[
  {
    "path": ".github/workflows/ci.yaml",
    "content": "name: Continuous Integration\n\non:\n  push:\n    branches:\n      - main\n  pull_request:\n    branches:\n      - main\n  workflow_dispatch:\n\njobs:\n  build:\n    name: \"build ${{ matrix.name-prefix }} (py ${{ matrix.python-version }} on ${{ matrix.os }})\"\n    runs-on: ${{ matrix.os }}\n    strategy:\n      matrix:\n        include:\n          - name-prefix: \"all tests\"\n            python-version: '3.12'\n            os: ubuntu-latest\n\n    steps:\n    - uses: actions/checkout@v6\n    - name: Set up uv\n      uses: astral-sh/setup-uv@v7\n      with:\n        enable-cache: true\n        cache-dependency-glob: \"uv.lock\"\n\n    - name: Set up Python ${{ matrix.python-version }}\n      run: uv python install ${{ matrix.python-version }}\n\n    - name: Install dependencies\n      run: sudo apt-get install -y hmmer\n\n    - name: Install Python dependencies\n      run: uv sync --frozen --all-groups\n\n    - name: Build data\n      run: uv run build_data\n\n    - name: Run CPU-only tests\n      run: uv run python run_alphafold_data_test.py\n"
  },
  {
    "path": "CMakeLists.txt",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\ncmake_minimum_required(VERSION 3.28)\n\n# This forces Git to use the 'files' backend for all FetchContent operations.\n# This fixes libcifpp and dssp incompatibility with newer git versions.\nset(ENV{GIT_CONFIG_PARAMETERS} \"'init.defaultRefFormat=files'\")\n\nproject(\n  \"${SKBUILD_PROJECT_NAME}\"\n  LANGUAGES CXX\n  VERSION \"${SKBUILD_PROJECT_VERSION}\")\n\ninclude(FetchContent)\nset(CMAKE_CXX_STANDARD 20)\nset(CMAKE_CXX_STANDARD_REQUIRED ON)\nset(CMAKE_POSITION_INDEPENDENT_CODE TRUE)\nset(ABSL_PROPAGATE_CXX_STD ON)\n\n# Remove support for scan deps, which is only useful when using C++ modules.\nunset(CMAKE_CXX_SCANDEP_SOURCE)\n\nFetchContent_Declare(\n  abseil-cpp\n  GIT_REPOSITORY https://github.com/abseil/abseil-cpp\n  GIT_TAG d7aaad83b488fd62bd51c81ecf16cd938532cc0a # 20240116.2\n  EXCLUDE_FROM_ALL)\n\nFetchContent_Declare(\n  pybind11\n  GIT_REPOSITORY https://github.com/pybind/pybind11\n  GIT_TAG 2e0815278cb899b20870a67ca8205996ef47e70f # v2.12.0\n  EXCLUDE_FROM_ALL)\n\nFetchContent_Declare(\n  pybind11_abseil\n  GIT_REPOSITORY https://github.com/pybind/pybind11_abseil\n  GIT_TAG bddf30141f9fec8e577f515313caec45f559d319 # HEAD @ 2024-08-07\n  EXCLUDE_FROM_ALL)\n\nFetchContent_Declare(\n  cifpp\n  GIT_REPOSITORY https://github.com/pdb-redo/libcifpp\n  GIT_TAG ac98531a2fc8daf21131faa0c3d73766efa46180 # v7.0.3\n  # Don't `EXCLUDE_FROM_ALL` as necessary for build_data.\n)\n\nFetchContent_Declare(\n  dssp\n  
GIT_REPOSITORY https://github.com/PDB-REDO/dssp\n  GIT_TAG 57560472b4260dc41f457706bc45fc6ef0bc0f10 # v4.4.7\n  EXCLUDE_FROM_ALL)\n\nFetchContent_MakeAvailable(pybind11 abseil-cpp pybind11_abseil cifpp dssp)\n\nfind_package(\n  Python3\n  COMPONENTS Interpreter Development NumPy\n  REQUIRED)\n\ninclude_directories(${PYTHON_INCLUDE_DIRS})\ninclude_directories(src/)\n\nfile(GLOB_RECURSE cpp_srcs src/alphafold3/*.cc)\nlist(FILTER cpp_srcs EXCLUDE REGEX \".*\\(_test\\|_main\\|_benchmark\\).cc$\")\n\nadd_compile_definitions(NPY_NO_DEPRECATED_API=NPY_1_7_API_VERSION)\n\npybind11_add_module(cpp ${cpp_srcs})\n\ntarget_link_libraries(\n  cpp\n  PRIVATE absl::check\n          absl::flat_hash_map\n          absl::node_hash_map\n          absl::strings\n          absl::status\n          absl::statusor\n          absl::log\n          pybind11_abseil::absl_casters\n          Python3::NumPy\n          dssp::dssp\n          cifpp::cifpp)\n\ntarget_compile_definitions(cpp PRIVATE VERSION_INFO=${PROJECT_VERSION})\ninstall(TARGETS cpp LIBRARY DESTINATION alphafold3)\ninstall(\n  FILES LICENSE\n        OUTPUT_TERMS_OF_USE.md\n        WEIGHTS_PROHIBITED_USE_POLICY.md\n        WEIGHTS_TERMS_OF_USE.md\n  DESTINATION alphafold3)\n"
  },
  {
    "path": "CONTRIBUTING.md",
    "content": "# How to Contribute\n\nWe welcome small patches related to bug fixes and documentation, but we do not\nplan to make any major changes to this repository.\n\n## AI Generated Code\n\nWe welcome the use of AI tools for the generation of code, documentation and/or\nPull Request (PR) description as long as:\n\n1.  It has been transparently labelled as such. Make sure to declare it in the\n    PR message.\n2.  You have manually reviewed the code before sending the PR.\n3.  The change has been manually tested. We might ask you to fold a certain\n    input to check correctness of the PR.\n\nPlease do not submit AI-generated PRs where test results have been hallucinated.\n\n## Contributor License Agreement\n\nContributions to this project must be accompanied by a Contributor License\nAgreement. You (or your employer) retain the copyright to your contribution;\nthis simply gives us permission to use and redistribute your contributions as\npart of the project. Head over to <https://cla.developers.google.com/> to see\nyour current agreements on file or to sign a new one.\n\nYou generally only need to submit a CLA once, so if you've already submitted one\n(even if it was for a different project), you probably don't need to do it\nagain.\n\n## Code reviews\n\nAll submissions, including submissions by project members, require review. We\nuse GitHub pull requests for this purpose. Consult\n[GitHub Help](https://help.github.com/articles/about-pull-requests/) for more\ninformation on using pull requests.\n"
  },
  {
    "path": "LICENSE",
    "content": "Attribution-NonCommercial-ShareAlike 4.0 International\n\n=======================================================================\n\nCreative Commons Corporation (\"Creative Commons\") is not a law firm and\ndoes not provide legal services or legal advice. Distribution of\nCreative Commons public licenses does not create a lawyer-client or\nother relationship. Creative Commons makes its licenses and related\ninformation available on an \"as-is\" basis. Creative Commons gives no\nwarranties regarding its licenses, any material licensed under their\nterms and conditions, or any related information. Creative Commons\ndisclaims all liability for damages resulting from their use to the\nfullest extent possible.\n\nUsing Creative Commons Public Licenses\n\nCreative Commons public licenses provide a standard set of terms and\nconditions that creators and other rights holders may use to share\noriginal works of authorship and other material subject to copyright\nand certain other rights specified in the public license below. The\nfollowing considerations are for informational purposes only, are not\nexhaustive, and do not form part of our licenses.\n\n     Considerations for licensors: Our public licenses are\n     intended for use by those authorized to give the public\n     permission to use material in ways otherwise restricted by\n     copyright and certain other rights. Our licenses are\n     irrevocable. Licensors should read and understand the terms\n     and conditions of the license they choose before applying it.\n     Licensors should also secure all rights necessary before\n     applying our licenses so that the public can reuse the\n     material as expected. Licensors should clearly mark any\n     material not subject to the license. This includes other CC-\n     licensed material, or material used under an exception or\n     limitation to copyright. 
More considerations for licensors:\n    wiki.creativecommons.org/Considerations_for_licensors\n\n     Considerations for the public: By using one of our public\n     licenses, a licensor grants the public permission to use the\n     licensed material under specified terms and conditions. If\n     the licensor's permission is not necessary for any reason--for\n     example, because of any applicable exception or limitation to\n     copyright--then that use is not regulated by the license. Our\n     licenses grant only permissions under copyright and certain\n     other rights that a licensor has authority to grant. Use of\n     the licensed material may still be restricted for other\n     reasons, including because others have copyright or other\n     rights in the material. A licensor may make special requests,\n     such as asking that all changes be marked or described.\n     Although not required by our licenses, you are encouraged to\n     respect those requests where reasonable. More considerations\n     for the public:\n    wiki.creativecommons.org/Considerations_for_licensees\n\n=======================================================================\n\nCreative Commons Attribution-NonCommercial-ShareAlike 4.0 International\nPublic License\n\nBy exercising the Licensed Rights (defined below), You accept and agree\nto be bound by the terms and conditions of this Creative Commons\nAttribution-NonCommercial-ShareAlike 4.0 International Public License\n(\"Public License\"). To the extent this Public License may be\ninterpreted as a contract, You are granted the Licensed Rights in\nconsideration of Your acceptance of these terms and conditions, and the\nLicensor grants You such rights in consideration of benefits the\nLicensor receives from making the Licensed Material available under\nthese terms and conditions.\n\n\nSection 1 -- Definitions.\n\n  a. 
Adapted Material means material subject to Copyright and Similar\n     Rights that is derived from or based upon the Licensed Material\n     and in which the Licensed Material is translated, altered,\n     arranged, transformed, or otherwise modified in a manner requiring\n     permission under the Copyright and Similar Rights held by the\n     Licensor. For purposes of this Public License, where the Licensed\n     Material is a musical work, performance, or sound recording,\n     Adapted Material is always produced where the Licensed Material is\n     synched in timed relation with a moving image.\n\n  b. Adapter's License means the license You apply to Your Copyright\n     and Similar Rights in Your contributions to Adapted Material in\n     accordance with the terms and conditions of this Public License.\n\n  c. BY-NC-SA Compatible License means a license listed at\n     creativecommons.org/compatiblelicenses, approved by Creative\n     Commons as essentially the equivalent of this Public License.\n\n  d. Copyright and Similar Rights means copyright and/or similar rights\n     closely related to copyright including, without limitation,\n     performance, broadcast, sound recording, and Sui Generis Database\n     Rights, without regard to how the rights are labeled or\n     categorized. For purposes of this Public License, the rights\n     specified in Section 2(b)(1)-(2) are not Copyright and Similar\n     Rights.\n\n  e. Effective Technological Measures means those measures that, in the\n     absence of proper authority, may not be circumvented under laws\n     fulfilling obligations under Article 11 of the WIPO Copyright\n     Treaty adopted on December 20, 1996, and/or similar international\n     agreements.\n\n  f. Exceptions and Limitations means fair use, fair dealing, and/or\n     any other exception or limitation to Copyright and Similar Rights\n     that applies to Your use of the Licensed Material.\n\n  g. 
License Elements means the license attributes listed in the name\n     of a Creative Commons Public License. The License Elements of this\n     Public License are Attribution, NonCommercial, and ShareAlike.\n\n  h. Licensed Material means the artistic or literary work, database,\n     or other material to which the Licensor applied this Public\n     License.\n\n  i. Licensed Rights means the rights granted to You subject to the\n     terms and conditions of this Public License, which are limited to\n     all Copyright and Similar Rights that apply to Your use of the\n     Licensed Material and that the Licensor has authority to license.\n\n  j. Licensor means the individual(s) or entity(ies) granting rights\n     under this Public License.\n\n  k. NonCommercial means not primarily intended for or directed towards\n     commercial advantage or monetary compensation. For purposes of\n     this Public License, the exchange of the Licensed Material for\n     other material subject to Copyright and Similar Rights by digital\n     file-sharing or similar means is NonCommercial provided there is\n     no payment of monetary compensation in connection with the\n     exchange.\n\n  l. Share means to provide material to the public by any means or\n     process that requires permission under the Licensed Rights, such\n     as reproduction, public display, public performance, distribution,\n     dissemination, communication, or importation, and to make material\n     available to the public including in ways that members of the\n     public may access the material from a place and at a time\n     individually chosen by them.\n\n  m. Sui Generis Database Rights means rights other than copyright\n     resulting from Directive 96/9/EC of the European Parliament and of\n     the Council of 11 March 1996 on the legal protection of databases,\n     as amended and/or succeeded, as well as other essentially\n     equivalent rights anywhere in the world.\n\n  n. 
You means the individual or entity exercising the Licensed Rights\n     under this Public License. Your has a corresponding meaning.\n\n\nSection 2 -- Scope.\n\n  a. License grant.\n\n       1. Subject to the terms and conditions of this Public License,\n          the Licensor hereby grants You a worldwide, royalty-free,\n          non-sublicensable, non-exclusive, irrevocable license to\n          exercise the Licensed Rights in the Licensed Material to:\n\n            a. reproduce and Share the Licensed Material, in whole or\n               in part, for NonCommercial purposes only; and\n\n            b. produce, reproduce, and Share Adapted Material for\n               NonCommercial purposes only.\n\n       2. Exceptions and Limitations. For the avoidance of doubt, where\n          Exceptions and Limitations apply to Your use, this Public\n          License does not apply, and You do not need to comply with\n          its terms and conditions.\n\n       3. Term. The term of this Public License is specified in Section\n          6(a).\n\n       4. Media and formats; technical modifications allowed. The\n          Licensor authorizes You to exercise the Licensed Rights in\n          all media and formats whether now known or hereafter created,\n          and to make technical modifications necessary to do so. The\n          Licensor waives and/or agrees not to assert any right or\n          authority to forbid You from making technical modifications\n          necessary to exercise the Licensed Rights, including\n          technical modifications necessary to circumvent Effective\n          Technological Measures. For purposes of this Public License,\n          simply making modifications authorized by this Section 2(a)\n          (4) never produces Adapted Material.\n\n       5. Downstream recipients.\n\n            a. Offer from the Licensor -- Licensed Material. 
Every\n               recipient of the Licensed Material automatically\n               receives an offer from the Licensor to exercise the\n               Licensed Rights under the terms and conditions of this\n               Public License.\n\n            b. Additional offer from the Licensor -- Adapted Material.\n               Every recipient of Adapted Material from You\n               automatically receives an offer from the Licensor to\n               exercise the Licensed Rights in the Adapted Material\n               under the conditions of the Adapter's License You apply.\n\n            c. No downstream restrictions. You may not offer or impose\n               any additional or different terms or conditions on, or\n               apply any Effective Technological Measures to, the\n               Licensed Material if doing so restricts exercise of the\n               Licensed Rights by any recipient of the Licensed\n               Material.\n\n       6. No endorsement. Nothing in this Public License constitutes or\n          may be construed as permission to assert or imply that You\n          are, or that Your use of the Licensed Material is, connected\n          with, or sponsored, endorsed, or granted official status by,\n          the Licensor or others designated to receive attribution as\n          provided in Section 3(a)(1)(A)(i).\n\n  b. Other rights.\n\n       1. Moral rights, such as the right of integrity, are not\n          licensed under this Public License, nor are publicity,\n          privacy, and/or other similar personality rights; however, to\n          the extent possible, the Licensor waives and/or agrees not to\n          assert any such rights held by the Licensor to the limited\n          extent necessary to allow You to exercise the Licensed\n          Rights, but not otherwise.\n\n       2. Patent and trademark rights are not licensed under this\n          Public License.\n\n       3. 
To the extent possible, the Licensor waives any right to\n          collect royalties from You for the exercise of the Licensed\n          Rights, whether directly or through a collecting society\n          under any voluntary or waivable statutory or compulsory\n          licensing scheme. In all other cases the Licensor expressly\n          reserves any right to collect such royalties, including when\n          the Licensed Material is used other than for NonCommercial\n          purposes.\n\n\nSection 3 -- License Conditions.\n\nYour exercise of the Licensed Rights is expressly made subject to the\nfollowing conditions.\n\n  a. Attribution.\n\n       1. If You Share the Licensed Material (including in modified\n          form), You must:\n\n            a. retain the following if it is supplied by the Licensor\n               with the Licensed Material:\n\n                 i. identification of the creator(s) of the Licensed\n                    Material and any others designated to receive\n                    attribution, in any reasonable manner requested by\n                    the Licensor (including by pseudonym if\n                    designated);\n\n                ii. a copyright notice;\n\n               iii. a notice that refers to this Public License;\n\n                iv. a notice that refers to the disclaimer of\n                    warranties;\n\n                 v. a URI or hyperlink to the Licensed Material to the\n                    extent reasonably practicable;\n\n            b. indicate if You modified the Licensed Material and\n               retain an indication of any previous modifications; and\n\n            c. indicate the Licensed Material is licensed under this\n               Public License, and include the text of, or the URI or\n               hyperlink to, this Public License.\n\n       2. 
You may satisfy the conditions in Section 3(a)(1) in any\n          reasonable manner based on the medium, means, and context in\n          which You Share the Licensed Material. For example, it may be\n          reasonable to satisfy the conditions by providing a URI or\n          hyperlink to a resource that includes the required\n          information.\n       3. If requested by the Licensor, You must remove any of the\n          information required by Section 3(a)(1)(A) to the extent\n          reasonably practicable.\n\n  b. ShareAlike.\n\n     In addition to the conditions in Section 3(a), if You Share\n     Adapted Material You produce, the following conditions also apply.\n\n       1. The Adapter's License You apply must be a Creative Commons\n          license with the same License Elements, this version or\n          later, or a BY-NC-SA Compatible License.\n\n       2. You must include the text of, or the URI or hyperlink to, the\n          Adapter's License You apply. You may satisfy this condition\n          in any reasonable manner based on the medium, means, and\n          context in which You Share Adapted Material.\n\n       3. You may not offer or impose any additional or different terms\n          or conditions on, or apply any Effective Technological\n          Measures to, Adapted Material that restrict exercise of the\n          rights granted under the Adapter's License You apply.\n\n\nSection 4 -- Sui Generis Database Rights.\n\nWhere the Licensed Rights include Sui Generis Database Rights that\napply to Your use of the Licensed Material:\n\n  a. for the avoidance of doubt, Section 2(a)(1) grants You the right\n     to extract, reuse, reproduce, and Share all or a substantial\n     portion of the contents of the database for NonCommercial purposes\n     only;\n\n  b. 
if You include all or a substantial portion of the database\n     contents in a database in which You have Sui Generis Database\n     Rights, then the database in which You have Sui Generis Database\n     Rights (but not its individual contents) is Adapted Material,\n     including for purposes of Section 3(b); and\n\n  c. You must comply with the conditions in Section 3(a) if You Share\n     all or a substantial portion of the contents of the database.\n\nFor the avoidance of doubt, this Section 4 supplements and does not\nreplace Your obligations under this Public License where the Licensed\nRights include other Copyright and Similar Rights.\n\n\nSection 5 -- Disclaimer of Warranties and Limitation of Liability.\n\n  a. UNLESS OTHERWISE SEPARATELY UNDERTAKEN BY THE LICENSOR, TO THE\n     EXTENT POSSIBLE, THE LICENSOR OFFERS THE LICENSED MATERIAL AS-IS\n     AND AS-AVAILABLE, AND MAKES NO REPRESENTATIONS OR WARRANTIES OF\n     ANY KIND CONCERNING THE LICENSED MATERIAL, WHETHER EXPRESS,\n     IMPLIED, STATUTORY, OR OTHER. THIS INCLUDES, WITHOUT LIMITATION,\n     WARRANTIES OF TITLE, MERCHANTABILITY, FITNESS FOR A PARTICULAR\n     PURPOSE, NON-INFRINGEMENT, ABSENCE OF LATENT OR OTHER DEFECTS,\n     ACCURACY, OR THE PRESENCE OR ABSENCE OF ERRORS, WHETHER OR NOT\n     KNOWN OR DISCOVERABLE. WHERE DISCLAIMERS OF WARRANTIES ARE NOT\n     ALLOWED IN FULL OR IN PART, THIS DISCLAIMER MAY NOT APPLY TO YOU.\n\n  b. TO THE EXTENT POSSIBLE, IN NO EVENT WILL THE LICENSOR BE LIABLE\n     TO YOU ON ANY LEGAL THEORY (INCLUDING, WITHOUT LIMITATION,\n     NEGLIGENCE) OR OTHERWISE FOR ANY DIRECT, SPECIAL, INDIRECT,\n     INCIDENTAL, CONSEQUENTIAL, PUNITIVE, EXEMPLARY, OR OTHER LOSSES,\n     COSTS, EXPENSES, OR DAMAGES ARISING OUT OF THIS PUBLIC LICENSE OR\n     USE OF THE LICENSED MATERIAL, EVEN IF THE LICENSOR HAS BEEN\n     ADVISED OF THE POSSIBILITY OF SUCH LOSSES, COSTS, EXPENSES, OR\n     DAMAGES. 
WHERE A LIMITATION OF LIABILITY IS NOT ALLOWED IN FULL OR\n     IN PART, THIS LIMITATION MAY NOT APPLY TO YOU.\n\n  c. The disclaimer of warranties and limitation of liability provided\n     above shall be interpreted in a manner that, to the extent\n     possible, most closely approximates an absolute disclaimer and\n     waiver of all liability.\n\n\nSection 6 -- Term and Termination.\n\n  a. This Public License applies for the term of the Copyright and\n     Similar Rights licensed here. However, if You fail to comply with\n     this Public License, then Your rights under this Public License\n     terminate automatically.\n\n  b. Where Your right to use the Licensed Material has terminated under\n     Section 6(a), it reinstates:\n\n       1. automatically as of the date the violation is cured, provided\n          it is cured within 30 days of Your discovery of the\n          violation; or\n\n       2. upon express reinstatement by the Licensor.\n\n     For the avoidance of doubt, this Section 6(b) does not affect any\n     right the Licensor may have to seek remedies for Your violations\n     of this Public License.\n\n  c. For the avoidance of doubt, the Licensor may also offer the\n     Licensed Material under separate terms or conditions or stop\n     distributing the Licensed Material at any time; however, doing so\n     will not terminate this Public License.\n\n  d. Sections 1, 5, 6, 7, and 8 survive termination of this Public\n     License.\n\n\nSection 7 -- Other Terms and Conditions.\n\n  a. The Licensor shall not be bound by any additional or different\n     terms or conditions communicated by You unless expressly agreed.\n\n  b. Any arrangements, understandings, or agreements regarding the\n     Licensed Material not stated herein are separate from and\n     independent of the terms and conditions of this Public License.\n\n\nSection 8 -- Interpretation.\n\n  a. 
For the avoidance of doubt, this Public License does not, and\n     shall not be interpreted to, reduce, limit, restrict, or impose\n     conditions on any use of the Licensed Material that could lawfully\n     be made without permission under this Public License.\n\n  b. To the extent possible, if any provision of this Public License is\n     deemed unenforceable, it shall be automatically reformed to the\n     minimum extent necessary to make it enforceable. If the provision\n     cannot be reformed, it shall be severed from this Public License\n     without affecting the enforceability of the remaining terms and\n     conditions.\n\n  c. No term or condition of this Public License will be waived and no\n     failure to comply consented to unless expressly agreed to by the\n     Licensor.\n\n  d. Nothing in this Public License constitutes or may be interpreted\n     as a limitation upon, or waiver of, any privileges and immunities\n     that apply to the Licensor or You, including from the legal\n     processes of any jurisdiction or authority.\n\n=======================================================================\n\nCreative Commons is not a party to its public\nlicenses. Notwithstanding, Creative Commons may elect to apply one of\nits public licenses to material it publishes and in those instances\nwill be considered the “Licensor.” The text of the Creative Commons\npublic licenses is dedicated to the public domain under the CC0 Public\nDomain Dedication. 
Except for the limited purpose of indicating that\nmaterial is shared under a Creative Commons public license or as\notherwise permitted by the Creative Commons policies published at\ncreativecommons.org/policies, Creative Commons does not authorize the\nuse of the trademark \"Creative Commons\" or any other trademark or logo\nof Creative Commons without its prior written consent including,\nwithout limitation, in connection with any unauthorized modifications\nto any of its public licenses or any other arrangements,\nunderstandings, or agreements concerning use of licensed material. For\nthe avoidance of doubt, this paragraph does not form part of the\npublic licenses.\n\nCreative Commons may be contacted at creativecommons.org.\n"
  },
  {
    "path": "OUTPUT_TERMS_OF_USE.md",
    "content": "# ALPHAFOLD 3 OUTPUT TERMS OF USE\n\nLast Modified: 2024-11-09\n\nBy using AlphaFold 3 Output (as defined below), without having agreed to\n[AlphaFold 3 Model Parameters Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md),\nyou agree to be bound by these AlphaFold 3 Output Terms of Use between you (or\nyour organization, as applicable) and Google LLC (these \"**Terms**\").\n\nIf you are using Output on behalf of an organization, you confirm you are\nauthorized either explicitly or implicitly to agree to, and are agreeing to,\nthese Terms as an employee on behalf of, or otherwise on behalf of, your\norganization.\n\nIf you have agreed to\n[AlphaFold 3 Model Parameters Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md),\nyour use of Output are governed by those terms. **If you have not agreed to\n[AlphaFold 3 Model Parameters Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md)\nand do not agree to these Terms, do not use Output or permit any third party to\ndo so on your behalf.**\n\nWhen we say \"**you**\", we mean the individual or organization using Output. 
When\nwe say \"**we**\", \"**us**\" or \"**Google**\", we mean the entities that belong to\nthe Google group of companies, which means Google LLC and its affiliates.\n\n## Key Definitions\n\nAs used in these Terms:\n\n\"**AlphaFold 3**\" means the AlphaFold 3 Code and Model Parameters.\n\n\"**AlphaFold 3 Code**\" means the AlphaFold 3 source code: (a) identified at\n[public GitHub repo](https://github.com/google-deepmind/alphafold3/), or such\nother location in which we may make it available from time to time, regardless\nof the source that it was obtained from; and (b) made available by Google to\norganizations for their use in accordance with the\n[AlphaFold 3 Model Parameters Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md)\n(not these Terms) together with (i) modifications to that code, (ii) works based\non that code, or (iii) other code or machine learning model which incorporates,\nin full or in part, that code.\n\n\"**Model Parameters**\" means the trained model weights and parameters made\navailable by Google to organizations (at its sole discretion) for their use in\naccordance with the\n[AlphaFold 3 Model Parameters Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md)\n(not these Terms), together with (a) modifications to those weights and\nparameters, (b) works based on those weights and parameters, or (c) other code\nor machine learning model which incorporates, in full or in part, those weights\nand parameters.\n\n\"**Output**\" means the structure predictions and all related information\nprovided by AlphaFold 3, together with any visual representations, computational\npredictions, descriptions, modifications, copies, or adaptations that are\nsubstantially derived from Output.\n\n## Use restrictions\n\n[AlphaFold 3](https://blog.google/technology/ai/google-deepmind-isomorphic-alphafold-3-ai-model/)\nbelongs to us. 
Output are made available free of charge, for non-commercial use\nonly, in accordance with the following use restrictions. You must not use nor\nallow others to use Output:\n\n1.  **On behalf of a commercial organization or in connection with any\n    commercial activities, including research on behalf of commercial\n    organizations.**\n\n    1.  This means that only non-commercial organizations (*i.e.*, universities,\n        non-profit organizations and research institutes, educational,\n        journalism and government bodies) may use Output for their\n        non-commercial activities. Output are not available for use by any other\n        types of organization, even if conducting non-commercial work.\n\n    2.  If you are a researcher affiliated with a non-commercial organization,\n        provided **you are not a commercial organisation or acting on behalf of\n        a commercial organisation**, you can use Output for your non-commercial\n        affiliated research.\n\n    3.  You must not share Output with any commercial organization. The only\n        exception is making Output publicly available (including, indirectly, to\n        commercial organizations) via a scientific publication or open source\n        release or using these to support journalism, each of which are\n        permitted.\n\n2.  **To misinform, misrepresent or mislead**, including:\n\n    1.  providing false or inaccurate information in relation to your access to\n        or use of Output;\n\n    2.  misrepresenting your relationship with Google - including by using\n        Google’s trademarks, trade names, logos or suggesting endorsement by\n        Google without Google’s permission to do so - nothing in these Terms\n        grants such permission;\n\n    3.  misrepresenting the origin of Output;\n\n    4.  
distributing misleading claims of expertise or capability, or engaging\n        in the unauthorized or unlicensed practice of any profession,\n        particularly in sensitive areas (*e.g.*, health); or\n\n    5.  making decisions in domains that affect material or individual rights or\n        well-being (*e.g.*, healthcare).\n\n3.  **To perform, promote or facilitate dangerous, illegal or malicious\n    activities**, including:\n\n    1.  promoting or facilitating the sale of, or providing instructions for\n        synthesizing or accessing, illegal substances, goods or services;\n\n    2.  abusing, harming, interfering, or disrupting any services, including\n        generating or distributing content for deceptive or fraudulent\n        activities or malware;\n\n    3.  generating or distributing any content that infringes, misappropriates,\n        or otherwise violates any individual’s or entity’s rights (including,\n        but not limited to rights in copyrighted content); or\n\n    4.  attempting to circumvent these Terms.\n\n4.  **To train or create machine learning models or related technology for\n    biomolecular structure prediction similar to AlphaFold 3 as made available\n    by Google (\"Derived Models\"),** including via distillation or other\n    methods**.** For the avoidance of doubt, the use restrictions set out in\n    these Terms would apply in full to any Derived Models created in breach of\n    these Terms.\n\n5.  **Without providing conspicuous notice that published or distributed Output\n    is provided under and subject to these Terms and of any modifications you\n    make to Output.**\n\n    1.  
This means if you remove, or cause to be removed (for example by using\n        third-party software), these Terms, or any notice of these Terms, from\n        Output, you must ensure further distribution or publication is\n        accompanied by a copy of the\n        [AlphaFold 3 Output Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n        and a \"*Legally Binding Terms of Use*\" text file that contains the\n        following notice:\n\n        \"*By using this information, you agree to AlphaFold 3 Output Terms of\n        Use found at\n        https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md.*\n\n        *To request access to the AlphaFold 3 model parameters, follow the\n        process set out at https://github.com/google-deepmind/alphafold3. You\n        may only use these if received directly from Google. Use is subject to\n        terms of use available at\n        https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md.*\"\n\n    2.  You must not include any additional or different terms that conflict\n        with the\n        [AlphaFold 3 Output Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\n6.  **Distribute Output, or disclose findings arising from using AlphaFold 3\n    without citing our paper:** [Abramson, J et al. Accurate structure\n    prediction of biomolecular interactions with AlphaFold 3. *Nature*\n    (2024)](https://www.nature.com/articles/s41586-024-07487-w). For the\n    avoidance of doubt, this is an additional requirement to the notice\n    requirements set out above.\n\nWe grant you a non-exclusive, royalty-free, revocable, non-transferable and\nnon-sublicensable (except as expressly permitted in these Terms) license to any\nintellectual property rights we have in Output to the extent necessary for these\npurposes. 
You agree that your right to use and share Output is subject to your\ncompliance with these Terms. If you breach these Terms, Google reserves the\nright to request that you delete and cease use or sharing of Output in your\npossession or control and prohibit you from using the AlphaFold 3 Assets\n(including as made available via\n[AlphaFold Server](https://alphafoldserver.com/about)). You agree to immediately\ncomply with any such request.\n\n## Disclaimers\n\nNothing in these Terms restricts any rights that cannot be restricted under\napplicable law or limits Google’s responsibilities except as allowed by\napplicable law.\n\n**Output are provided on an \"as is\" basis, without warranties or conditions of\nany kind, either express or implied, including any warranties or conditions of\ntitle, non-infringement, merchantability, or fitness for a particular purpose.\nYou are solely responsible for determining the appropriateness of using or\ndistributing any of the Output and assume any and all risks associated with your\nuse or distribution of any Output and your exercise of rights and obligations\nunder these Terms. You and anyone you share Output with are solely responsible\nfor these and their subsequent uses.**\n\n**Output are predictions with varying levels of confidence and should be\ninterpreted carefully. Use discretion before relying on, publishing, downloading\nor otherwise using Output.**\n\n**Output are for theoretical modeling only. These are not intended, validated,\nor approved for clinical use. You should not use these for clinical purposes or\nrely on them for medical or other professional advice. 
Any content regarding\nthose topics is provided for informational purposes only and is not a substitute\nfor advice from a qualified professional.**\n\n## Liabilities\n\nTo the extent allowed by applicable law, you will indemnify Google and its\ndirectors, officers, employees, and contractors for any third-party legal\nproceedings (including actions by government authorities) arising out of or\nrelating to your unlawful use of Output or violation of these Terms. This\nindemnity covers any liability or expense arising from claims, losses, damages,\njudgments, fines, litigation costs, and legal fees, except to the extent a\nliability or expense is caused by Google's breach, negligence, or willful\nmisconduct. If you are legally exempt from certain responsibilities, including\nindemnification, then those responsibilities don’t apply to you under these\nterms.\n\nIn no circumstances will Google be responsible for any indirect, special,\nincidental, exemplary, consequential, or punitive damages, or lost profits of\nany kind, even if Google has been advised of the possibility of such damages.\nGoogle’s total, aggregate liability for all claims arising out of or in\nconnection with these Terms or Output, including for its own negligence, is\nlimited to $500.\n\n## Governing law and disputes\n\nThese Terms will be governed by the laws of the State of California. The state\nor federal courts of Santa Clara County, California shall have exclusive\njurisdiction of any dispute arising out of these Terms.\n\nGiven the nature of scientific research, it may take some time for any breach of\nthese Terms to become apparent. To the extent allowed by applicable law, any\nlegal claims relating to these Terms or Output can be initiated until the later\nof (a) the cut-off date under applicable law for bringing the legal claim; or\n(b) two years from the date you or Google (as applicable) became aware, or\nshould reasonably have become aware, of the facts giving rise to that claim. 
You\nwill not argue limitation, time bar, delay, waiver or the like in an attempt to\nbar an action filed within that time period, and neither will we.\n\nAll rights not specifically and expressly granted to you by these Terms are\nreserved to Google. No delay, act or omission by Google in exercising any right\nor remedy will be deemed a waiver of any breach of these Terms and Google\nexpressly reserves any and all rights and remedies available under these Terms\nor at law or in equity or otherwise, including the remedy of injunctive relief\nagainst any threatened or actual breach of these Terms without the necessity of\nproving actual damages.\n\n## Miscellaneous\n\nGoogle may update these Terms (1) to reflect changes in how it does business,\n(2) for legal, regulatory or security reasons, or (3) to prevent abuse or harm.\nThe version of these Terms that was effective on the date the relevant Output\nwas generated will apply to your use of that Output.\n\nIf it turns out that a particular provision of these Terms is not valid or\nenforceable, this will not affect any other provisions.\n"
  },
  {
    "path": "README.md",
    "content": "![header](docs/header.jpg)\n\n# AlphaFold 3\n\nThis package provides an implementation of the inference pipeline of AlphaFold\n3. See below for how to access the model parameters. You may only use AlphaFold\n3 model parameters if received directly from Google. Use is subject to these\n[terms of use](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md).\n\nAny publication that discloses findings arising from using this source code, the\nmodel parameters or outputs produced by those should [cite](#citing-this-work)\nthe\n[Accurate structure prediction of biomolecular interactions with AlphaFold 3](https://doi.org/10.1038/s41586-024-07487-w)\npaper.\n\nPlease also refer to the Supplementary Information for a detailed description of\nthe method.\n\nAlphaFold 3 is also available at\n[alphafoldserver.com](https://alphafoldserver.com) for non-commercial use,\nthough with a more limited set of ligands and covalent modifications.\n\nIf you have any questions, please contact the AlphaFold team at\n[alphafold@google.com](mailto:alphafold@google.com).\n\n## Obtaining Model Parameters\n\nThis repository contains all necessary code for AlphaFold 3 inference. To\nrequest access to the AlphaFold 3 model parameters, please complete\n[this form](https://forms.gle/svvpY4u2jsHEwWYS6). Access will be granted at\nGoogle DeepMind’s sole discretion. We will aim to respond to requests within 2–3\nbusiness days. You may only use AlphaFold 3 model parameters if received\ndirectly from Google. Use is subject to these\n[terms of use](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md).\n\n## Installation and Running Your First Prediction\n\nSee the [installation documentation](docs/installation.md).\n\nOnce you have installed AlphaFold 3, you can test your setup using e.g. 
the\nfollowing input JSON file named `fold_input.json`:\n\n```json\n{\n  \"name\": \"2PV7\",\n  \"sequences\": [\n    {\n      \"protein\": {\n        \"id\": [\"A\", \"B\"],\n        \"sequence\": \"GMRESYANENQFGFKTINSDIHKIVIVGGYGKLGGLFARYLRASGYPISILDREDWAVAESILANADVVIVSVPINLTLETIERLKPYLTENMLLADLTSVKREPLAKMLEVHTGAVLGLHPMFGADIASMAKQVVVRCDGRFPERYEWLLEQIQIWGAKIYQTNATEHDHNMTYIQALRHFSTFANGLHLSKQPINLANLLALSSPIYRLELAMIGRLFAQDAELYADIIMDKSENLAVIETLKQTYDEALTFFENNDRQGFIDAFHKVRDWFGDYSEQFLKESRQLLQQANDLKQG\"\n      }\n    }\n  ],\n  \"modelSeeds\": [1],\n  \"dialect\": \"alphafold3\",\n  \"version\": 1\n}\n```\n\nYou can then run AlphaFold 3 using the following command:\n\n```\ndocker run -it \\\n    --volume $HOME/af_input:/root/af_input \\\n    --volume $HOME/af_output:/root/af_output \\\n    --volume <MODEL_PARAMETERS_DIR>:/root/models \\\n    --volume <DATABASES_DIR>:/root/public_databases \\\n    --gpus all \\\n    alphafold3 \\\n    python run_alphafold.py \\\n    --json_path=/root/af_input/fold_input.json \\\n    --model_dir=/root/models \\\n    --output_dir=/root/af_output\n```\n\nThere are various flags that you can pass to the `run_alphafold.py` command, to\nlist them all run `python run_alphafold.py --help`. Two fundamental flags that\ncontrol which parts AlphaFold 3 will run are:\n\n*   `--run_data_pipeline` (defaults to `true`): whether to run the data\n    pipeline, i.e. genetic and template search. This part is CPU-only, time\n    consuming and could be run on a machine without a GPU.\n*   `--run_inference` (defaults to `true`): whether to run the inference. 
This\n    part requires a GPU.\n\n## AlphaFold 3 Input\n\nSee the [input documentation](docs/input.md).\n\n## AlphaFold 3 Output\n\nSee the [output documentation](docs/output.md).\n\n## Performance\n\nSee the [performance documentation](docs/performance.md).\n\n## Known Issues\n\nKnown issues are documented in the\n[known issues documentation](docs/known_issues.md).\n\nPlease\n[create an issue](https://github.com/google-deepmind/alphafold3/issues/new/choose)\nif it is not already listed in [Known Issues](docs/known_issues.md) or in the\n[issues tracker](https://github.com/google-deepmind/alphafold3/issues).\n\n## Citing This Work\n\nAny publication that discloses findings arising from using this source code, the\nmodel parameters or outputs produced by those should cite:\n\n```bibtex\n@article{Abramson2024,\n  author  = {Abramson, Josh and Adler, Jonas and Dunger, Jack and Evans, Richard and Green, Tim and Pritzel, Alexander and Ronneberger, Olaf and Willmore, Lindsay and Ballard, Andrew J. and Bambrick, Joshua and Bodenstein, Sebastian W. and Evans, David A. and Hung, Chia-Chun and O’Neill, Michael and Reiman, David and Tunyasuvunakool, Kathryn and Wu, Zachary and Žemgulytė, Akvilė and Arvaniti, Eirini and Beattie, Charles and Bertolli, Ottavia and Bridgland, Alex and Cherepanov, Alexey and Congreve, Miles and Cowen-Rivers, Alexander I. and Cowie, Andrew and Figurnov, Michael and Fuchs, Fabian B. and Gladman, Hannah and Jain, Rishub and Khan, Yousuf A. and Low, Caroline M. R. and Perlin, Kuba and Potapenko, Anna and Savy, Pascal and Singh, Sukhdeep and Stecula, Adrian and Thillaisundaram, Ashok and Tong, Catherine and Yakneen, Sergei and Zhong, Ellen D. 
and Zielinski, Michal and Žídek, Augustin and Bapst, Victor and Kohli, Pushmeet and Jaderberg, Max and Hassabis, Demis and Jumper, John M.},\n  journal = {Nature},\n  title   = {Accurate structure prediction of biomolecular interactions with AlphaFold 3},\n  year    = {2024},\n  volume  = {630},\n  number  = {8016},\n  pages   = {493--500},\n  doi     = {10.1038/s41586-024-07487-w}\n}\n```\n\n## Acknowledgements\n\nAlphaFold 3's release was made possible by the invaluable contributions of the\nfollowing people:\n\nAndrew Cowie, Bella Hansen, Charlie Beattie, Chris Jones, Grace Margand,\nJacob Kelly, James Spencer, Josh Abramson, Kathryn Tunyasuvunakool, Kuba Perlin,\nLindsay Willmore, Max Bileschi, Molly Beck, Oleg Kovalevskiy,\nSebastian Bodenstein, Sukhdeep Singh, Tim Green, Toby Sargeant, Uchechi Okereke,\nYotam Doron, and Augustin Žídek (engineering lead).\n\nWe also extend our gratitude to our collaborators at Google and Isomorphic Labs.\n\nAlphaFold 3 uses the following separate libraries and packages:\n\n*   [abseil-cpp](https://github.com/abseil/abseil-cpp) and\n    [abseil-py](https://github.com/abseil/abseil-py)\n*   [Docker](https://www.docker.com)\n*   [DSSP](https://github.com/PDB-REDO/dssp)\n*   [HMMER Suite](https://github.com/EddyRivasLab/hmmer)\n*   [Haiku](https://github.com/deepmind/dm-haiku)\n*   [JAX](https://github.com/jax-ml/jax/)\n*   [libcifpp](https://github.com/pdb-redo/libcifpp)\n*   [NumPy](https://github.com/numpy/numpy)\n*   [pybind11](https://github.com/pybind/pybind11) and\n    [pybind11_abseil](https://github.com/pybind/pybind11_abseil)\n*   [RDKit](https://github.com/rdkit/rdkit)\n*   [Tokamax](https://github.com/openxla/tokamax)\n*   [tqdm](https://github.com/tqdm/tqdm)\n\nWe thank all their contributors and maintainers!\n\n## Get in Touch\n\nIf you have any questions not covered in this overview, please contact the\nAlphaFold team at alphafold@google.com.\n\nWe would love to hear your feedback and understand how AlphaFold 3 has 
been\nuseful in your research. Share your stories with us at\n[alphafold@google.com](mailto:alphafold@google.com).\n\n## Licence and Disclaimer\n\nThis is not an officially supported Google product.\n\nCopyright 2024 DeepMind Technologies Limited.\n\n### AlphaFold 3 Source Code and Model Parameters\n\nThe AlphaFold 3 source code is licensed under the Creative Commons\nAttribution-Non-Commercial ShareAlike International License, Version 4.0\n(CC-BY-NC-SA 4.0) (the \"License\"); you may not use this file except in\ncompliance with the License. You may obtain a copy of the License at\n[https://github.com/google-deepmind/alphafold3/blob/main/LICENSE](https://github.com/google-deepmind/alphafold3/blob/main/LICENSE).\n\nThe AlphaFold 3 model parameters are made available under the\n[AlphaFold 3 Model Parameters Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md)\n(the \"Terms\"); you may not use these except in compliance with the Terms. You\nmay obtain a copy of the Terms at\n[https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md).\n\nUnless required by applicable law, AlphaFold 3 and its output are distributed on\nan \"AS IS\" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express\nor implied. You are solely responsible for determining the appropriateness of\nusing AlphaFold 3, or using or distributing its source code or output, and\nassume any and all risks associated with such use or distribution and your\nexercise of rights and obligations under the relevant terms. Output are\npredictions with varying levels of confidence and should be interpreted\ncarefully. Use discretion before relying on, publishing, downloading or\notherwise using the AlphaFold 3 Assets.\n\nAlphaFold 3 and its output are for theoretical modeling only. They are not\nintended, validated, or approved for clinical use. 
You should not use\nAlphaFold 3 or its output for clinical purposes or rely on them for medical or\nother professional advice. Any content regarding those topics is provided for\ninformational purposes only and is not a substitute for advice from a qualified\nprofessional. See the relevant terms for the specific language governing\npermissions and limitations under the terms.\n\n### Third-party Software\n\nUse of the third-party software, libraries or code referred to in the\n[Acknowledgements](#acknowledgements) section above may be governed by separate\nterms and conditions or license provisions. Your use of the third-party\nsoftware, libraries or code is subject to any such terms and you should check\nthat you can comply with any applicable restrictions or terms and conditions\nbefore use.\n\n### Mirrored and Reference Databases\n\nThe following databases have been: (1) mirrored by Google DeepMind; and (2) in\npart, included with the inference code package for testing purposes, and are\navailable with reference to the following:\n\n*   [BFD](https://bfd.mmseqs.com/) (modified), by Steinegger M. and Söding J.,\n    modified by Google DeepMind, available under a\n    [Creative Commons Attribution 4.0 International License](https://creativecommons.org/licenses/by/4.0/deed.en).\n    See the Methods section of the\n    [AlphaFold proteome paper](https://www.nature.com/articles/s41586-021-03828-1)\n    for details.\n*   [PDB](https://wwpdb.org) (unmodified), by H.M. 
Berman et al., available free\n    of all copyright restrictions and made fully and freely available for both\n    non-commercial and commercial use under\n    [CC0 1.0 Universal (CC0 1.0) Public Domain Dedication](https://creativecommons.org/publicdomain/zero/1.0/).\n*   [MGnify: v2022\\_05](https://ftp.ebi.ac.uk/pub/databases/metagenomics/peptide_database/2022_05/README.txt)\n    (unmodified), by Mitchell AL et al., available free of all copyright\n    restrictions and made fully and freely available for both non-commercial and\n    commercial use under\n    [CC0 1.0 Universal (CC0 1.0) Public Domain Dedication](https://creativecommons.org/publicdomain/zero/1.0/).\n*   [UniProt: 2021\\_04](https://www.uniprot.org/) (unmodified), by The UniProt\n    Consortium, available under a\n    [Creative Commons Attribution 4.0 International License](https://creativecommons.org/licenses/by/4.0/deed.en).\n*   [UniRef90: 2022\\_05](https://www.uniprot.org/) (unmodified), by The UniProt\n    Consortium, available under a\n    [Creative Commons Attribution 4.0 International License](https://creativecommons.org/licenses/by/4.0/deed.en).\n*   [NT: 2023\\_02\\_23](https://www.ncbi.nlm.nih.gov/nucleotide/) (modified). See\n    the Supplementary Information of the\n    [AlphaFold 3 paper](https://nature.com/articles/s41586-024-07487-w) for\n    details.\n*   [RFam: 14\\_4](https://rfam.org/) (modified), by I. 
Kalvari et al., available\n    free of all copyright restrictions and made fully and freely available for\n    both non-commercial and commercial use under\n    [CC0 1.0 Universal (CC0 1.0) Public Domain Dedication](https://creativecommons.org/publicdomain/zero/1.0/).\n    See the Supplementary Information of the\n    [AlphaFold 3 paper](https://nature.com/articles/s41586-024-07487-w) for\n    details.\n*   [RNAcentral: 21\\_0](https://rnacentral.org/) (modified), by The RNAcentral\n    Consortium, available free of all copyright restrictions and made fully and\n    freely available for both non-commercial and commercial use under\n    [CC0 1.0 Universal (CC0 1.0) Public Domain Dedication](https://creativecommons.org/publicdomain/zero/1.0/).\n    See the Supplementary Information of the\n    [AlphaFold 3 paper](https://nature.com/articles/s41586-024-07487-w) for\n    details.\n"
  },
  {
    "path": "WEIGHTS_PROHIBITED_USE_POLICY.md",
    "content": "# ALPHAFOLD 3 MODEL PARAMETERS PROHIBITED USE POLICY\n\nLast Modified: 2024-11-09\n\nAlphaFold 3 can help you accelerate scientific research by predicting the 3D\nstructure of biological molecules. Google makes the AlphaFold Assets available\nfree of charge for certain non-commercial uses in accordance with the\nrestrictions set out below. This policy uses the same defined terms as the\n[AlphaFold 3 Model Parameters Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md).\n\n**You must not access or use nor allow others to access or use the AlphaFold 3\nAssets:**\n\n1.  **On behalf of a commercial organization or in connection with any\n    commercial activities, including research on behalf of commercial\n    organizations.**\n\n    1.  This means that only non-commercial organizations (*i.e.*, universities,\n        non-profit organizations and research institutes, educational,\n        journalism and government bodies) may use the AlphaFold 3 Assets for\n        their non-commercial activities. The AlphaFold 3 Assets are not\n        available for any other types of organization, even if conducting\n        non-commercial work.\n\n    2.  If you are a researcher affiliated with a non-commercial organization,\n        provided **you are not a commercial organisation or acting on behalf of\n        a commercial organisation,** you can use the AlphaFold 3 Assets for your\n        non-commercial affiliated research.\n\n    3.  You must not share the AlphaFold 3 Assets with any commercial\n        organization or use the AlphaFold 3 Assets in a manner that will grant a\n        commercial organization any rights in these. The only exception is\n        making Output publicly available (including indirectly to commercial\n        organizations) via a scientific publication or open source release or\n        using it to support journalism, each of which is permitted.\n\n2.  
**To misinform, misrepresent or mislead**, including:\n\n    1.  providing false or inaccurate information in relation to your access to\n        or use of AlphaFold 3 or Output, including accessing or using the Model\n        Parameters on behalf of an organization without telling us or submitting\n        a request to access the Model Parameters where Google has prohibited\n        your use of AlphaFold 3 in full or in part (including as made available\n        via [AlphaFold Server](https://alphafoldserver.com/about));\n\n    2.  misrepresenting your relationship with us, including by using Google’s\n        trademarks, trade names, logos or suggesting endorsement by Google\n        without Google’s permission to do so - nothing in the Terms grants such\n        permission;\n\n    3.  misrepresenting the origin of AlphaFold 3 in full or in part;\n\n    4.  distributing misleading claims of expertise or capability, or engaging\n        in the unauthorized or unlicensed practice of any profession,\n        particularly in sensitive areas (*e.g.*, health); or\n\n    5.  to make decisions in domains that affect material or individual rights\n        or well-being (*e.g.*, healthcare).\n\n3.  **To perform, promote or facilitate dangerous, illegal or malicious\n    activities**, including:\n\n    1.  promoting or facilitating the sale of, or providing instructions for\n        synthesizing or accessing, illegal substances, goods or services;\n\n    2.  abusing, harming, interfering, or disrupting any services, including\n        generating or distributing content for deceptive or fraudulent\n        activities or malware;\n\n    3.  generating or distributing any content, including Output, that\n        infringes, misappropriates, or otherwise violates any individual's or\n        entity's rights (including, but not limited to rights in copyrighted\n        content); or\n\n    4.  
attempting to circumvent, or intentionally causing (directly or\n        indirectly) AlphaFold 3 to act in a manner that contravenes the Terms.\n\n**You must not nor allow others to:**\n\n1.  **Use Output to train or create machine learning models or related\n    technology for biomolecular structure prediction similar to AlphaFold 3\n    (\"Derived Models\"),** including via distillation or other methods. For the\n    avoidance of doubt, the use restrictions set out in the Terms would apply in\n    full to any Derived Models created in breach of the Terms.\n\n2.  **Distribute Output without providing conspicuous notice that what you\n    Distribute is provided under and subject to the\n    [AlphaFold 3 Output Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n    and of any modifications you make.**\n\n    1.  This means if you remove, or cause to be removed (for example by using\n        third-party software), the notices and terms we provide when you\n        generate Output using AlphaFold 3, you must ensure any further\n        Distribution of Output is accompanied by a copy of the\n        [AlphaFold 3 Output Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n        and a \"Legally Binding Terms of Use\" text file that contains the\n        following notice:\n\n        \"*By using this information, you agree to AlphaFold 3 Output Terms of\n        Use found at\n        https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md.*\n\n        *To request access to the AlphaFold 3 model parameters, follow the\n        process set out at https://github.com/google-deepmind/alphafold3. You\n        may only use these if received directly from Google. Use is subject to\n        terms of use available at\n        https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md.*\"\n\n    2.  
You must not include any additional or different terms that conflict\n        with the\n        [AlphaFold 3 Output Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\n3.  **Distribute Output, or disclose findings arising from using AlphaFold 3\n    without citing our paper:** [Abramson, J et al. Accurate structure\n    prediction of biomolecular interactions with AlphaFold 3. *Nature*\n    (2024)](https://www.nature.com/articles/s41586-024-07487-w). For the\n    avoidance of doubt, this is an additional requirement to the notice\n    requirements set out above.\n\n4.  **Circumvent access restrictions relating to the Model Parameters, including\n    utilising, sharing or making available the Model Parameters when you have\n    not been expressly authorized to do so by Google.** Google will grant access\n    to the Model Parameters to either:\n\n    1.  you for your individual use on behalf of your organization, in which\n        case you cannot share your copy of Model Parameters with anyone else; or\n\n    2.  an authorized representative of your organization, with full legal\n        authority to bind that organization to these Terms in which case you may\n        share that organization’s copy of the Model Parameters with employees,\n        consultants, contractors and agents of the organization as authorized by\n        that representative.\n"
  },
  {
    "path": "WEIGHTS_TERMS_OF_USE.md",
    "content": "# ALPHAFOLD 3 MODEL PARAMETERS TERMS OF USE\n\nLast Modified: 2024-11-09\n\n[AlphaFold 3](https://blog.google/technology/ai/google-deepmind-isomorphic-alphafold-3-ai-model/)\nis an AI model developed by [Google DeepMind](https://deepmind.google/) and\n[Isomorphic Labs](https://www.isomorphiclabs.com/). It generates 3D structure\npredictions of biological molecules, providing model confidence for the\nstructure predictions. We make the trained model parameters and output generated\nusing those available free of charge for certain non-commercial uses, in\naccordance with these terms of use and the\n[AlphaFold 3 Model Parameters Prohibited Use Policy](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_PROHIBITED_USE_POLICY.md).\n\n**Key things to know when using the AlphaFold 3 model parameters and output**\n\n1.  The AlphaFold 3 model parameters and output are **only** available for\n    non-commercial use by, or on behalf of, non-commercial organizations\n    (*i.e.*, universities, non-profit organizations and research institutes,\n    educational, journalism and government bodies). If you are a researcher\n    affiliated with a non-commercial organization, provided **you are not a\n    commercial organisation or acting on behalf of a commercial organisation,**\n    this means you can use these for your non-commercial affiliated research.\n2.  You **must not** use nor allow others to use:\n    1.  AlphaFold 3 model parameters or output in connection with **any\n        commercial activities, including research** **on behalf of commercial\n        organizations;** or\n    2.  AlphaFold 3 output to **train machine learning models** or related\n        technology for **biomolecular structure prediction** similar to\n        AlphaFold 3.\n3.  You ***must not* publish or share AlphaFold 3 model parameters**, except\n    sharing these within your organization in accordance with these Terms.\n4.  
You ***can* publish, share and adapt AlphaFold 3 *output*** in accordance\n    with these Terms, including the requirements to provide clear notice of any\n    modifications you make and that ongoing use of AlphaFold 3 output and\n    derivatives are subject to the\n    [AlphaFold 3 Output Terms of Use](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\nBy using, reproducing, modifying, performing, distributing or displaying any\nportion or element of the Model Parameters (as defined below) or otherwise\naccepting the terms of this agreement, you agree to be bound by (1) these terms\nof use, and (2) the\n[AlphaFold 3 Model Parameters Prohibited Use Policy](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_PROHIBITED_USE_POLICY.md)\nwhich is incorporated herein by reference (together, the \"**Terms**\"), in each\ncase (a) as modified from time to time in accordance with the Terms, and (b)\nbetween you and (i) if you are from a country in the European Economic Area or\nSwitzerland, Google Ireland Limited, or (ii) otherwise, Google LLC.\n\nYou confirm you are authorized either explicitly or implicitly to enter, and are\nentering, into the Terms as an employee on behalf of, or otherwise on behalf of,\nyour organization.\n\nPlease read these Terms carefully. They establish what you can expect from us as\nyou access and use the AlphaFold 3 Assets (as defined below), and what Google\nexpects from you. When we say \"**you**\", we mean the individual or organization\nusing the AlphaFold 3 Assets. When we say \"**we**\", \"**us**\" or \"**Google**\", we\nmean the entities that belong to the Google group of companies, which means\nGoogle LLC and its affiliates.\n\n## 1. 
Key Definitions\n\nAs used in these Terms:\n\n\"**AlphaFold 3**\" means: (a) the AlphaFold 3 source code made available\n[here](https://github.com/google-deepmind/alphafold3/) and licensed under the\nterms of the Creative Commons Attribution-NonCommercial-Sharealike 4.0\nInternational (CC-BY-NC-SA 4.0) license and any derivative source code, and (b)\nModel Parameters.\n\n\"**AlphaFold 3 Assets**\" means the Model Parameters and Output.\n\n\"**Distribution**\" or \"**Distribute**\" means any transmission, publication, or\nother sharing of Output publicly or to any other person.\n\n\"**Model Parameters**\" means the trained model weights and parameters made\navailable by Google to organizations (at its sole discretion) for their use in\naccordance with these Terms, together with (a) modifications to those weights\nand parameters, (b) works based on those weights and parameters, or (c) other\ncode or machine learning models which incorporate, in full or in part, those\nweights and parameters.\n\n\"**Output**\" means the structure predictions and all ancillary and related\ninformation provided by AlphaFold 3 or using the Model Parameters, together with\nany visual representations, computational predictions, descriptions,\nmodifications, copies, or adaptations that are substantially derived from\nOutput.\n\n\"**Including**\" means \"**including without limitation**\".\n\n## 2. Accessing and using the AlphaFold 3 Assets\n\nSubject to your compliance with the Terms, including the\n[AlphaFold 3 Model Parameters Prohibited Use Policy](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_PROHIBITED_USE_POLICY.md),\nyou may access, use and modify the AlphaFold 3 Assets and Distribute the Output\nas set out in these Terms. 
We grant you a non-exclusive, royalty-free,\nrevocable, non-transferable and non-sublicensable (except as expressly permitted\nin these Terms) license to any intellectual property rights we have in the\nAlphaFold Assets to the extent necessary for these purposes. In order to verify\nyour access and use of AlphaFold 3, we may from time-to-time ask for additional\ninformation from you, including verification of your name, organization, and\nother identifying information.\n\nBy accessing, using, or modifying the AlphaFold 3 Assets, Distributing Output,\nor requesting to access the Model Parameters, you represent and warrant that (a)\nyou have full power and authority to enter into these Terms (including being of\nsufficient age of consent), (b) Google has never previously terminated your\naccess and right to use AlphaFold 3 (including as made available via\n[AlphaFold Server](https://alphafoldserver.com/about)) due to your breach of\napplicable terms of use, (c) entering into or performing your rights and\nobligations under these Terms will not violate any agreement you have with a\nthird party or any third-party rights, (d) any information provided by you to\nGoogle in relation to AlphaFold 3, including (where applicable) in order to\nrequest access to the Model Parameters, is correct and current, and (e) you are\nnot (i) resident of a embargoed country, (ii) ordinarily resident in a US\nembargoed country, or (iii) otherwise prohibited by applicable export controls\nand sanctions programs from accessing, using, or modifying the AlphaFold 3\nAssets.\n\nIf you choose to give Google feedback, such as suggestions to improve AlphaFold\n3, you undertake any such information is non-confidential and non-proprietary,\nand Google may act on your feedback without obligation to you.\n\n## 3. Use Restrictions\n\nYou must not use any of the AlphaFold 3 Assets:\n\n1.  
for the restricted uses set forth in the\n    [AlphaFold 3 Model Parameters Prohibited Use Policy](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_PROHIBITED_USE_POLICY.md);\n    or\n2.  in violation of applicable laws and regulations.\n\nTo the maximum extent permitted by law and without limiting any of our other\nrights, Google reserves the right to revoke your right to use, and (to the\nextent feasible) restrict usage of any of the AlphaFold 3 Assets that Google\nreasonably believes is in violation of these Terms.\n\n## 4. Generated Output\n\nAlthough you must comply with these Terms when using the AlphaFold 3 Assets, we\nwill not claim ownership in original Output you generate using AlphaFold 3.\nHowever, you acknowledge that AlphaFold 3 may generate the same or similar\nOutput for multiple users, including Google, and we reserve all our rights in\nthis respect.\n\n## 5. Changes to the AlphaFold 3 Assets or these Terms\n\nGoogle may add or remove functionalities or features of the AlphaFold 3 Assets\nat any time and may stop offering access to the AlphaFold 3 Assets altogether.\n\nGoogle may update these Terms and the access mechanism for the Model Parameters\nat any time. We'll post any modifications to the Terms\n[in the AlphaFold 3 GitHub repository](https://github.com/google-deepmind/alphafold3).\nChanges will generally become effective 14 days after they are posted. However,\nchanges addressing functionality or made for legal reasons will be effective\nimmediately.\n\nYou should review the Terms whenever we update them or you use the AlphaFold 3\nAssets. If you do not agree to any modifications to the Terms, you must stop\nusing the AlphaFold 3 Assets immediately.\n\n## 6. Suspending or terminating your right to use the AlphaFold 3 Assets\n\nGoogle may at any time suspend or terminate your right to use and, as applicable\naccess to, the AlphaFold 3 Assets because of, among other reasons, your failure\nto fully comply with the Terms. 
If Google suspends or terminates your right to\naccess or use the AlphaFold 3 Assets, you must immediately delete and cease use\nand Distribution of all copies of the AlphaFold 3 Assets in your possession or\ncontrol and are prohibited from using the AlphaFold 3 Assets, including by\nsubmitting an application to use the Model Parameters. Google will endeavour to\ngive you reasonable notice prior to any such suspension or termination, but no\nnotice or prior warning will be given if the suspension or termination is for\nyour failure to fully comply with the Terms or other serious grounds.\n\nOf course, you are always free to stop using the AlphaFold 3 Assets. If you do\nstop using these, we would appreciate knowing why (via\n[alphafold@google.com](mailto:alphafold@google.com)) so that we can continue to\nimprove our technologies.\n\n## 7. Confidentiality\n\nYou agree not to disclose or make available Google Confidential Information to\nanyone without our prior written consent. \"**Google Confidential Information**\"\nmeans (a) the AlphaFold 3 Model Parameters and all software, technology and\ndocumentation relating to AlphaFold 3, except for the AlphaFold 3 source code,\nand (b) any other information made available by Google that is marked\nconfidential or would normally be considered confidential under the\ncircumstances in which it is presented. Google Confidential Information does not\ninclude (a) information that you already knew prior to your access to, or use\nof, the AlphaFold 3 Assets (including via\n[AlphaFold Server](https://alphafoldserver.com/about)), (b) that becomes public\nthrough no fault of yours (for example, your breach of the Terms), (c) that was\nindependently developed by you without reference to Google Confidential\nInformation, or (d) that was lawfully given to you by a third party (without\nyour or their breach of the Terms).\n\n## 8. 
Disclaimers\n\nNothing in the Terms restricts any rights that cannot be restricted under\napplicable law or limits Google's responsibilities except as allowed by\napplicable law.\n\n**AlphaFold 3 and Output are provided on an \"as is\" basis, without warranties or\nconditions of any kind, either express or implied, including any warranties or\nconditions of title, non-infringement, merchantability, or fitness for a\nparticular purpose. You are solely responsible for determining the\nappropriateness of using AlphaFold 3, or using or distributing Output, and\nassume any and all risks associated with such use or distribution and your\nexercise of rights and obligations under these Terms. You and anyone you share\nOutput with are solely responsible for these and their subsequent uses.**\n\n**Output are predictions with varying levels of confidence and should be\ninterpreted carefully. Use discretion before relying on, publishing, downloading\nor otherwise using AlphaFold 3.**\n\n**AlphaFold 3 and Outputs are for theoretical modeling only. They are not\nintended, validated, or approved for clinical use. You should not use AlphaFold\n3 or Output for clinical purposes or rely on them for medical or other\nprofessional advice. Any content regarding those topics is provided for\ninformational purposes only and is not a substitute for advice from a qualified\nprofessional.**\n\n## 9. Liabilities\n\nTo the extent allowed by applicable law, you will indemnify Google and its\ndirectors, officers, employees, and contractors for any third-party legal\nproceedings (including actions by government authorities) arising out of or\nrelating to your unlawful use of the AlphaFold 3 Assets or violation of the\nTerms. This indemnity covers any liability or expense arising from claims,\nlosses, damages, judgments, fines, litigation costs, and legal fees, except to\nthe extent a liability or expense is caused by Google's breach, negligence, or\nwillful misconduct. 
If you are legally exempt from certain responsibilities,\nincluding indemnification, then those responsibilities do not apply to you under\nthe Terms.\n\nIn no circumstances will Google be responsible for any indirect, special,\nincidental, exemplary, consequential, or punitive damages, or lost profits of\nany kind in connection with the Terms or the AlphaFold 3 Assets, even if Google\nhas been advised of the possibility of such damages. Google's total aggregate\nliability for all claims arising out of or in connection with the Terms or the\nAlphaFold 3 Assets, including for its own negligence, is limited to $500.\n\n## 10. Miscellaneous\n\nBy law, you have certain rights that cannot be limited by a contract like the\nTerms. The Terms are in no way intended to restrict those rights.\n\nThe Terms are our entire agreement relating to your use of the AlphaFold 3\nAssets and supersede any prior or contemporaneous agreements on that subject.\n\nIf it turns out that a particular provision of the Terms is not enforceable, the\nbalance of the Terms will remain in full force and effect.\n\n## 11. Disputes\n\nCalifornia law will govern all disputes arising out of or relating to the Terms\nor in connection to the AlphaFold 3 Assets. These disputes will be resolved\nexclusively in the federal or state courts of Santa Clara County, California,\nUSA and you and Google consent to personal jurisdiction in those courts. To the\nextent that applicable local law prevents certain disputes from being resolved\nin a California court, you and Google can file those disputes in your local\ncourts. If applicable local law prevents your local court from applying\nCalifornia law to resolve these disputes, then these disputes will be governed\nby the applicable local laws of your country, state, or other place of\nresidence. 
If you are using the AlphaFold 3 Assets on behalf of a government\norganization other than US federal government organizations (where the foregoing\nprovisions shall apply to the extent permitted by federal law), these Terms will\nbe silent regarding governing law and courts.\n\nGiven the nature of scientific research, it may take some time for any breach of\nthe Terms to become apparent. To protect you, Google and the AlphaFold 3 Assets,\nto the extent allowed by applicable law you agree that:\n\n1.  any legal claims relating to the Terms or the AlphaFold 3 Assets can be\n    initiated until the later of:\n    1.  the cut-off date under applicable law for bringing the legal claim; or\n    2.  two years from the date you or Google (as applicable) became aware, or\n        should reasonably have become aware, of the facts giving rise to that\n        claim; and\n2.  you will not argue limitation, time bar, delay, waiver, or the like in an\n    attempt to bar an action filed within that time period, and neither will\n    Google.\n\nAll rights not specifically and expressly granted to you by the Terms are\nreserved to Google. No delay, act or omission by Google in exercising any right\nor remedy will be deemed a waiver of any breach of the Terms and Google\nexpressly reserves any and all rights and remedies available under the Terms or\nat law or in equity or otherwise, including the remedy of injunctive relief\nagainst any threatened or actual breach of the Terms without the necessity of\nproving actual damages.\n"
  },
  {
    "path": "docker/Dockerfile",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nFROM nvidia/cuda:12.6.3-base-ubuntu24.04\n\n# Some RUN statements are combined together to make Docker build run faster.\n# Get latest package listing, install python, git, wget, compilers and libs.\n# * git is required for pyproject.toml toolchain's use of CMakeLists.txt.\n# * gcc, g++, make are required for compiling HMMER and AlphaFold 3 libaries.\n# * zlib is a required dependency of AlphaFold 3.\nRUN DEBIAN_FRONTEND=noninteractive \\\napt-get update --quiet \\\n&& apt-get install --yes --quiet python3.12 python3.12-dev \\\n&& apt-get install --yes --quiet git wget gcc g++ make zlib1g-dev zstd\n\n# Install uv from the official repository. The version is pinned for\n# reproducibility.\nCOPY --from=ghcr.io/astral-sh/uv:0.9.24 /uv /uvx /bin/\n\n# UV_COMPILE_BYTECODE=1 speeds up future container starts.\n# UV_PROJECT_ENVIRONMENT explicitly sets the virtual environment location.\nENV UV_COMPILE_BYTECODE=1\nENV UV_PROJECT_ENVIRONMENT=/alphafold3_venv\nRUN uv venv $UV_PROJECT_ENVIRONMENT\n\nENV PATH=\"/hmmer/bin:/alphafold3_venv/bin:$PATH\"\n\n# Install HMMER. Do so before copying the source code, so that docker can cache\n# the image layer containing HMMER. Alternatively, you could also install it\n# using `apt-get install hmmer` instead of bulding it from source, but we want\n# to have control over the exact version of HMMER and also apply the sequence\n# limit patch. 
Also note that eddylab.org unfortunately doesn't support HTTPS\n# and the tar file published on GitHub is explicitly not recommended to be used\n# for building from source.\n\n# Download, check hash, and extract the HMMER source code.\nRUN mkdir /hmmer_build /hmmer ; \\\n    wget http://eddylab.org/software/hmmer/hmmer-3.4.tar.gz --directory-prefix /hmmer_build ; \\\n    (cd /hmmer_build && echo \"ca70d94fd0cf271bd7063423aabb116d42de533117343a9b27a65c17ff06fbf3 hmmer-3.4.tar.gz\" | sha256sum --check) && \\\n    (cd /hmmer_build && tar zxf hmmer-3.4.tar.gz && rm hmmer-3.4.tar.gz)\n\n# Apply the --seq_limit patch to HMMER.\nCOPY docker/jackhmmer_seq_limit.patch /hmmer_build/\nRUN (cd /hmmer_build && patch -p0 < jackhmmer_seq_limit.patch)\n\n# Build HMMER.\nRUN (cd /hmmer_build/hmmer-3.4 && ./configure --prefix /hmmer) ; \\\n    (cd /hmmer_build/hmmer-3.4 && make -j) ; \\\n    (cd /hmmer_build/hmmer-3.4 && make install) ; \\\n    (cd /hmmer_build/hmmer-3.4/easel && make install) ; \\\n    rm -R /hmmer_build\n\n# Copy the AlphaFold 3 source code from the local machine to the container and\n# set the working directory to there.\nCOPY . /app/alphafold\nWORKDIR /app/alphafold\n\n# Install the exact dependency tree using uv and cache the build artifacts.\n# --frozen: do not update the lockfile during build.\n# --all-groups: install development/test dependencies defined in pyproject.toml.\n# --no-editable: install as a static package.\n# If using this as a recipe for local installation, we recommend removing the\n# --frozen and --no-editable flags.\nRUN --mount=type=cache,target=/root/.cache/uv \\ \n    UV_LINK_MODE=copy uv sync --frozen --all-groups --no-editable\n\n# Build chemical components database (this binary was installed by uv sync).\nRUN uv run build_data\n\n# To work around a known XLA issue causing the compilation time to greatly\n# increase, the following environment variable setting XLA flags must be enabled\n# when running AlphaFold 3. 
Note that if using CUDA capability 7 GPUs, it is\n# necessary to set the following XLA_FLAGS value instead:\n# ENV XLA_FLAGS=\"--xla_disable_hlo_passes=custom-kernel-fusion-rewriter\"\n# (no need to disable gemm in that case as it is not supported for such GPU).\nENV XLA_FLAGS=\"--xla_gpu_enable_triton_gemm=false\"\n# Memory settings used for folding up to 5,120 tokens on A100 80 GB.\nENV XLA_PYTHON_CLIENT_PREALLOCATE=true\nENV XLA_CLIENT_MEM_FRACTION=0.95\n\nCMD [\"uv\", \"run\", \"python3\", \"run_alphafold.py\"]\n"
  },
  {
    "path": "docker/dockerignore",
    "content": "dockerignore\nDockerfile"
  },
  {
    "path": "docker/jackhmmer_seq_limit.patch",
    "content": "--- hmmer-3.4/src/jackhmmer.c\n+++ hmmer-3.4/src/jackhmmer.c\n@@ -73,6 +73,7 @@ static ESL_OPTIONS options[] = {\n   { \"--noali\",      eslARG_NONE,        FALSE, NULL, NULL,      NULL,    NULL,  NULL,            \"don't output alignments, so output is smaller\",                2 },\n   { \"--notextw\",    eslARG_NONE,         NULL, NULL, NULL,      NULL,    NULL, \"--textw\",        \"unlimit ASCII text output line width\",                         2 },\n   { \"--textw\",      eslARG_INT,         \"120\", NULL, \"n>=120\",  NULL,    NULL, \"--notextw\",      \"set max width of ASCII text output lines\",                     2 },\n+  { \"--seq_limit\",  eslARG_INT,          NULL, NULL, NULL,      NULL,    NULL, \"--seq_limit\",    \"if set, truncate all hits after this value is reached\",        2 },\n /* Control of scoring system */\n   { \"--popen\",      eslARG_REAL,       \"0.02\", NULL, \"0<=x<0.5\",NULL,    NULL,  NULL,            \"gap open probability\",                                         3 },\n   { \"--pextend\",    eslARG_REAL,        \"0.4\", NULL, \"0<=x<1\",  NULL,    NULL,  NULL,            \"gap extend probability\",                                       3 },\n@@ -298,6 +299,7 @@ output_header(FILE *ofp, ESL_GETOPTS *go\n   if (esl_opt_IsUsed(go, \"--noali\")      && fprintf(ofp, \"# show alignments in output:       no\\n\")                                                   < 0) ESL_EXCEPTION_SYS(eslEWRITE, \"write failed\");\n   if (esl_opt_IsUsed(go, \"--notextw\")    && fprintf(ofp, \"# max ASCII text line length:      unlimited\\n\")                                            < 0) ESL_EXCEPTION_SYS(eslEWRITE, \"write failed\");\n   if (esl_opt_IsUsed(go, \"--textw\")      && fprintf(ofp, \"# max ASCII text line length:      %d\\n\",             esl_opt_GetInteger(go, \"--textw\"))    < 0) ESL_EXCEPTION_SYS(eslEWRITE, \"write failed\");\n+  if (esl_opt_IsUsed(go, \"--seq_limit\")  && fprintf(ofp, \"# set max sequence hits to 
return: %d\\n\",             esl_opt_GetInteger(go, \"--seq_limit\")) < 0) ESL_EXCEPTION_SYS(eslEWRITE, \"write failed\");\n   if (esl_opt_IsUsed(go, \"--popen\")      && fprintf(ofp, \"# gap open probability:            %f\\n\",             esl_opt_GetReal   (go, \"--popen\"))    < 0) ESL_EXCEPTION_SYS(eslEWRITE, \"write failed\");\n   if (esl_opt_IsUsed(go, \"--pextend\")    && fprintf(ofp, \"# gap extend probability:          %f\\n\",             esl_opt_GetReal   (go, \"--pextend\"))  < 0) ESL_EXCEPTION_SYS(eslEWRITE, \"write failed\");\n   if (esl_opt_IsUsed(go, \"--mx\")         && fprintf(ofp, \"# subst score matrix (built-in):   %s\\n\",             esl_opt_GetString (go, \"--mx\"))       < 0) ESL_EXCEPTION_SYS(eslEWRITE, \"write failed\");\n@@ -674,6 +676,13 @@ serial_master(ESL_GETOPTS *go, struct cf\n \t  /* Print the results. */\n \t  p7_tophits_SortBySortkey(info->th);\n \t  p7_tophits_Threshold(info->th, info->pli);\n+\t  /* Limit the number of hits if specified. */\n+\t  if (esl_opt_IsOn(go, \"--seq_limit\"))\n+\t  {\n+\t    int seq_limit = esl_opt_GetInteger(go, \"--seq_limit\");\n+\t    info->th->N = ESL_MIN(info->th->N, seq_limit);\n+\t  }\n+\n \t  p7_tophits_CompareRanking(info->th, kh, &nnew_targets);\n \t  p7_tophits_Targets(ofp, info->th, info->pli, textw); if (fprintf(ofp, \"\\n\\n\") < 0) ESL_EXCEPTION_SYS(eslEWRITE, \"write failed\");\n \t  p7_tophits_Domains(ofp, info->th, info->pli, textw); if (fprintf(ofp, \"\\n\\n\") < 0) ESL_EXCEPTION_SYS(eslEWRITE, \"write failed\");\n"
  },
  {
    "path": "docs/community_tools.md",
    "content": "# Community Tools\n\n## JAAG: a JSON input file Assembler for AlphaFold 3 (with Glycan Integration)\n\nJAAG is a lightweight, web-based GUI tool that helps generate AlphaFold 3 input\nJSON files with integrated glycan support. It automates the creation of correct\nglycan syntax (including `bondedAtomPairs` + CCD), reducing manual errors when\npreparing glycoprotein or glycan–protein complexes.\n\n*   Web app: https://biofgreat.org/JAAG\n*   Source code: https://github.com/chinchc/JAAG\n*   Paper: https://doi.org/10.1093/glycob/cwaf083\n\nNote: JAAG is compatible with standalone AlphaFold 3, but not with the AlphaFold\n3 server.\n\n## Modeling glycans with AlphaFold 3: capabilities, caveats, and limitations\n\nPaper on modeling glycans (and other ligands) with AF3 that modeled and assessed\nmajor glycan classes and provides:\n\n*   Step-by-step tutorial for building ligand inputs (applicable beyond glycans)\n*   Ready-to-run scripts for each glycan class\n*   Comprehensive CCD table for all SNFG monosaccharides\n*   Discussion of caveats and limitations of AF3\n*   Full AF3 inputs/outputs archived on ModelArchive for reproducibility\n\nUseful resource if your AF3 ligand models appear stereochemically off.\n\n*   Paper: https://doi.org/10.1093/glycob/cwaf048\n*   ModelArchive: https://doi.org/10.5452/ma-af3glycan\n"
  },
  {
    "path": "docs/contributing.md",
    "content": "# How to Contribute\n\nWe welcome small patches related to bug fixes and documentation, but we do not\nplan to make any major changes to this repository.\n\n## Before You Begin\n\n### Sign Our Contributor License Agreement\n\nContributions to this project must be accompanied by a\n[Contributor License Agreement](https://cla.developers.google.com/about) (CLA).\nYou (or your employer) retain the copyright to your contribution; this simply\ngives us permission to use and redistribute your contributions as part of the\nproject.\n\nIf you or your current employer have already signed the Google CLA (even if it\nwas for a different project), you probably don't need to do it again.\n\nVisit <https://cla.developers.google.com/> to see your current agreements or to\nsign a new one.\n\n### Review Our Community Guidelines\n\nThis project follows\n[Google's Open Source Community Guidelines](https://opensource.google/conduct/).\n\n## Contribution Process\n\nWe won't accept pull requests directly, but if you send one, we will review it.\nIf we send a fix based on your pull request, we will make sure to credit you in\nthe release notes.\n"
  },
  {
    "path": "docs/input.md",
    "content": "# AlphaFold 3 Input\n\n## Specifying Input Files\n\nYou can provide inputs to `run_alphafold.py` in one of two ways:\n\n-   Single input file: Use the `--json_path` flag followed by the path to a\n    single JSON file.\n-   Multiple input files: Use the `--input_dir` flag followed by the path to a\n    directory of JSON files.\n\n## Input Format\n\nAlphaFold 3 uses a custom JSON input format differing from the\n[AlphaFold Server JSON input format](https://github.com/google-deepmind/alphafold/tree/main/server).\nSee [below](#alphafold-server-json-compatibility) for more information.\n\nThe custom AlphaFold 3 format allows:\n\n*   Specifying protein, RNA, and DNA chains, including modified residues.\n*   Specifying custom multiple sequence alignment (MSA) for protein and RNA\n    chains.\n*   Specifying custom structural templates for protein chains.\n*   Specifying ligands using\n    [Chemical Component Dictionary (CCD)](https://www.wwpdb.org/data/ccd) codes.\n*   Specifying ligands using SMILES.\n*   Specifying ligands by defining them using the CCD mmCIF format and supplying\n    them via the [user-provided CCD](#user-provided-ccd).\n*   Specifying covalent bonds between entities.\n*   Specifying multiple random seeds.\n\n## AlphaFold Server JSON Compatibility\n\nThe [AlphaFold Server](https://alphafoldserver.com/) uses a separate\n[JSON format](https://github.com/google-deepmind/alphafold/tree/main/server)\nfrom the one used here in the AlphaFold 3 codebase. In particular, the JSON\nformat used in the AlphaFold 3 codebase offers more flexibility and control in\ndefining custom ligands, branched glycans, and covalent bonds between entities.\n\nWe provide a converter in `run_alphafold.py` which automatically detects the\ninput JSON format, denoted `dialect` in the converter code. The converter\ndenotes the AlphaFoldServer JSON as `alphafoldserver`, and the JSON format\ndefined here in the AlphaFold 3 codebase as `alphafold3`. 
If the detected input\nJSON format is `alphafoldserver`, then the converter will translate that into\nthe JSON format `alphafold3`.\n\n### Multiple Inputs\n\nThe top-level of the `alphafoldserver` JSON format is a list, allowing\nspecification of multiple inputs in a single JSON. In contrast, the `alphafold3`\nJSON format requires exactly one input per JSON file. Specifying multiple inputs\nin a single `alphafoldserver` JSON is fully supported.\n\nNote that the converter distinguishes between `alphafoldserver` and `alphafold3`\nJSON formats by checking if the top-level of the JSON is a list or not. In\nparticular, if you pass in an `alphafoldserver`-style JSON without a top-level\nlist, then this is considered incorrect and `run_alphafold.py` will raise an\nerror.\n\n### Glycans\n\nIf the JSON in `alphafoldserver` format specifies glycans, the converter will\nraise an error. This is because translating glycans specified in the\n`alphafoldserver` format to the `alphafold3` format is not currently supported.\n\n### Random Seeds\n\nThe `alphafoldserver` JSON format allows users to specify `\"modelSeeds\": []`, in\nwhich case a seed is chosen randomly for the user. On the other hand, the\n`alphafold3` format requires users to specify a seed.\n\nThe converter will choose a seed randomly if `\"modelSeeds\": []` is set when\ntranslating from `alphafoldserver` JSON format to `alphafold3` JSON format. If\nseeds are specified in the `alphafoldserver` JSON format, then those will be\npreserved in the translation to the `alphafold3` JSON format.\n\n### Ions\n\nWhile AlphaFold Server treats ions and ligands as different entity types in the\nJSON format, AlphaFold 3 treats ions as ligands. Therefore, to specify e.g. a\nmagnesium ion, one would specify it as an entity of type `ligand` with\n`ccdCodes: [\"MG\"]`.\n\n### Sequence IDs\n\nThe `alphafold3` JSON format requires the user to specify a unique identifier\n(`id`) for each entity. 
On the other hand, the `alphafoldserver` does not allow\nspecification of an `id` for each entity. Thus, the converter automatically\nassigns one.\n\nThe converter iterates through the list provided in the `sequences` field of the\n`alphafoldserver` JSON format, assigning an `id` to each entity using the\nfollowing order (\"reverse spreadsheet style\"):\n\n```\nA, B, ..., Z, AA, BA, CA, ..., ZA, AB, BB, CB, ..., ZB, ...\n```\n\nFor any entity with `count > 1`, an `id` is assigned arbitrarily to each \"copy\"\nof the entity.\n\n## Top-level Structure\n\nThe top-level structure of the input JSON is:\n\n```json\n{\n  \"name\": \"Job name goes here\",\n  \"modelSeeds\": [1, 2],  # At least one seed required.\n  \"sequences\": [\n    {\"protein\": {...}},\n    {\"rna\": {...}},\n    {\"dna\": {...}},\n    {\"ligand\": {...}}\n  ],\n  \"bondedAtomPairs\": [...],  # Optional.\n  \"userCCD\": \"...\",  # Optional, mutually exclusive with userCCDPath.\n  \"userCCDPath\": \"...\",  # Optional, mutually exclusive with userCCD.\n  \"dialect\": \"alphafold3\",  # Required.\n  \"version\": 4  # Required.\n}\n```\n\nThe fields specify the following:\n\n*   `name: str`: The name of the job. A sanitised version of this name is used\n    for naming the output files.\n*   `modelSeeds: list[int]`: A list of integer random seeds. The pipeline and\n    the model will be invoked with each of the seeds in the list. I.e. if you\n    provide *n* random seeds, you will get *n* predicted structures, each with\n    the respective random seed. You must provide at least one random seed.\n*   `sequences: list[Protein | RNA | DNA | Ligand]`: A list of sequence\n    dictionaries, each defining a molecular entity, see below.\n*   `bondedAtomPairs: list[Bond]`: An optional list of covalently bonded atoms.\n    These can link atoms within an entity, or across two entities. See more\n    below.\n*   `userCCD: str`: An optional string with user-provided chemical components\n    dictionary. 
This is an expert mode for providing custom molecules when\n    SMILES is not sufficient. This should also be used when you have a custom\n    molecule that needs to be bonded with other entities - SMILES can't be used\n    in such cases since it doesn't give the possibility of uniquely naming all\n    atoms. It can also be used to provide a reference conformer for cases where\n    RDKit fails to generate a conformer. See more below.\n*   `userCCDPath: str`: An optional path to a file that contains the\n    user-provided chemical components dictionary instead of providing it inline\n    using the `userCCD` field. The path can be either absolute, or relative to\n    the input JSON path. The file must be in the\n    [CCD mmCIF format](https://www.wwpdb.org/data/ccd#mmcifFormat), and could be\n    either plain text, or compressed using gzip, xz, or zstd.\n*   `dialect: str`: The dialect of the input JSON. This must be set to\n    `alphafold3`. See\n    [AlphaFold Server JSON Compatibility](#alphafold-server-json-compatibility)\n    for more information.\n*   `version: int`: The version of the input JSON. This must be set to 1, 2, 3, or 4.\n    See\n    [AlphaFold Server JSON Compatibility](#alphafold-server-json-compatibility)\n    and [versions](#versions) below for more information.\n\n## Versions\n\nThe top-level `version` field (for the `alphafold3` dialect) can be either `1`,\n`2`, `3`, or `4`. 
The following features have been added in respective versions:\n\n*   `1`: the initial AlphaFold 3 input format.\n*   `2`: added the option of specifying external MSA and templates using newly\n    added fields `unpairedMsaPath`, `pairedMsaPath`, and `mmcifPath`.\n*   `3`: added the option of specifying external user-provided CCD using newly\n    added field `userCCDPath`.\n*   `4`: added the option of specifying textual `description` of protein chains,\n    RNA chains, DNA chains, or ligands.\n\n## Sequences\n\nThe `sequences` section specifies the protein chains, RNA chains, DNA chains,\nand ligands. Every entity in `sequences` must have a unique ID. IDs don't have\nto be sorted alphabetically.\n\n### Protein\n\nSpecifies a single protein chain.\n\n```json\n{\n  \"protein\": {\n    \"id\": \"A\",\n    \"sequence\": \"PVLSCGEWQL\",\n    \"modifications\": [\n      {\"ptmType\": \"HY3\", \"ptmPosition\": 1},\n      {\"ptmType\": \"P1L\", \"ptmPosition\": 5}\n    ],\n    \"description\": ...,  # Optional.\n    \"unpairedMsa\": ...,  # Mutually exclusive with unpairedMsaPath.\n    \"unpairedMsaPath\": ...,  # Mutually exclusive with unpairedMsa.\n    \"pairedMsa\": ...,  # Mutually exclusive with pairedMsaPath.\n    \"pairedMsaPath\": ...,  # Mutually exclusive with pairedMsa.\n    \"templates\": [...]\n  }\n}\n```\n\nThe fields specify the following:\n\n*   `id: str | list[str]`: An uppercase letter or multiple letters specifying\n    the unique IDs for each copy of this protein chain. The IDs are then also\n    used in the output mmCIF file. Specifying a list of IDs (e.g. `[\"A\", \"B\",\n    \"C\"]`) implies a homomeric chain with multiple copies.\n*   `sequence: str`: The amino-acid sequence, specified as a string that uses\n    the 1-letter standard amino acid codes.\n*   `modifications: list[ProteinModification]`: An optional list of\n    post-translational modifications. Each modification is specified using its\n    CCD code and 1-based residue position. 
In the example above, we see that the\n    first residue won't be a proline (`P`) but instead `HY3`.\n*   `description: str`: An optional textual description of this chain. This\n    field is only used in the JSON format and serves as a comment\n    describing this chain.\n*   `unpairedMsa: str`: An optional multiple sequence alignment for this chain.\n    This is specified using the A3M format (equivalent to the FASTA format, but\n    also allows gaps denoted by the hyphen `-` character). See more details\n    below.\n*   `unpairedMsaPath: str`: An optional path to a file that contains the\n    multiple sequence alignment for this chain instead of providing it inline\n    using the `unpairedMsa` field. The path can be either absolute, or relative\n    to the input JSON path. The file must be in the A3M format, and could be\n    either plain text, or compressed using gzip, xz, or zstd.\n*   `pairedMsa: str`: We recommend *not* using this optional field and using the\n    `unpairedMsa` for the purposes of pairing. See more details below.\n*   `pairedMsaPath: str`: An optional path to a file that contains the multiple\n    sequence alignment for this chain instead of providing it inline using the\n    `pairedMsa` field. The path can be either absolute, or relative to the input\n    JSON path. The file must be in the A3M format, and could be either plain\n    text, or compressed using gzip, xz, or zstd.\n*   `templates: list[Template]`: An optional list of structural templates. See\n    more details below.\n\n### RNA\n\nSpecifies a single RNA chain.\n\n```json\n{\n  \"rna\": {\n    \"id\": \"A\",\n    \"sequence\": \"AGCU\",\n    \"modifications\": [\n      {\"modificationType\": \"2MG\", \"basePosition\": 1},\n      {\"modificationType\": \"5MC\", \"basePosition\": 4}\n    ],\n    \"description\": ...,  # Optional.\n    \"unpairedMsa\": ...,  # Mutually exclusive with unpairedMsaPath.\n    \"unpairedMsaPath\": ...  
# Mutually exclusive with unpairedMsa.\n  }\n}\n```\n\nThe fields specify the following:\n\n*   `id: str | list[str]`: An uppercase letter or multiple letters specifying\n    the unique IDs for each copy of this RNA chain. The IDs are then also used\n    in the output mmCIF file. Specifying a list of IDs (e.g. `[\"A\", \"B\", \"C\"]`)\n    implies a homomeric chain with multiple copies.\n*   `sequence: str`: The RNA sequence, specified as a string using only the\n    letters `A`, `C`, `G`, `U`.\n*   `modifications: list[RnaModification]`: An optional list of modifications.\n    Each modification is specified using its CCD code and 1-based base position.\n*   `description: str`: An optional textual description of this chain. This\n    field is only used in the JSON format and serves as a comment\n    describing this chain.\n*   `unpairedMsa: str`: An optional multiple sequence alignment for this chain.\n    This is specified using the A3M format. See more details below.\n*   `unpairedMsaPath: str`: An optional path to a file that contains the\n    multiple sequence alignment for this chain instead of providing it inline\n    using the `unpairedMsa` field. The path can be either absolute, or relative\n    to the input JSON path. The file must be in the A3M format, and could be\n    either plain text, or compressed using gzip, xz, or zstd.\n\n### DNA\n\nSpecifies a single DNA chain.\n\n```json\n{\n  \"dna\": {\n    \"id\": \"A\",\n    \"sequence\": \"GACCTCT\",\n    \"modifications\": [\n      {\"modificationType\": \"6OG\", \"basePosition\": 1},\n      {\"modificationType\": \"6MA\", \"basePosition\": 2}\n    ],\n    \"description\": ...  # Optional.\n  }\n}\n```\n\nThe fields specify the following:\n\n*   `id: str | list[str]`: An uppercase letter or multiple letters specifying\n    the unique IDs for each copy of this DNA chain. The IDs are then also used\n    in the output mmCIF file. Specifying a list of IDs (e.g. 
`[\"A\", \"B\", \"C\"]`)\n    implies a homomeric chain with multiple copies.\n*   `sequence: str`: The DNA sequence, specified as a string using only the\n    letters `A`, `C`, `G`, `T`.\n*   `modifications: list[DnaModification]`: An optional list of modifications.\n    Each modification is specified using its CCD code and 1-based base position.\n*   `description: str`: An optional textual description of this chain. This\n    field is only used in the JSON format and serves as a comment\n    describing this chain.\n\n### Ligands\n\nSpecifies a single ligand. Ligands can be specified using 3 different formats:\n\n1.  [CCD code(s)](https://www.wwpdb.org/data/ccd). This is the easiest way to\n    specify ligands. Supports specifying covalent bonds to other entities. CCD\n    from 2022-09-28 is used. If multiple CCD codes are specified, you may want\n    to specify a bond between these and/or a bond to some other entity. See the\n    [bonds](#bonds) section below.\n2.  [SMILES string](https://en.wikipedia.org/wiki/Simplified_Molecular_Input_Line_Entry_System).\n    This enables specifying ligands that are not in CCD. If using SMILES, you\n    cannot specify covalent bonds to other entities as these rely on specific\n    atom names - see the next option for what to use for this case.\n3.  User-provided CCD + custom ligand codes. This enables specifying ligands not\n    in CCD, while also supporting specification of covalent bonds to other\n    entities and backup reference coordinates for when RDKit fails to generate a\n    conformer. This offers the most flexibility, but also requires careful\n    attention to get all of the details right.\n\n```json\n{\n  \"ligand\": {\n    \"id\": [\"G\", \"H\", \"I\"],\n    \"ccdCodes\": [\"ATP\"],\n    \"description\": ...  # Optional.\n  }\n},\n{\n  \"ligand\": {\n    \"id\": \"J\",\n    \"ccdCodes\": [\"LIG-1337\"],\n    \"description\": ...  
# Optional.\n  }\n},\n{\n  \"ligand\": {\n    \"id\": \"K\",\n    \"smiles\": \"CC(=O)OC1C[NH+]2CCC1CC2\",\n    \"description\": ...  # Optional.\n  }\n}\n```\n\nThe fields specify the following:\n\n*   `id: str | list[str]`: An uppercase letter (or multiple letters) specifying\n    the unique ID of this ligand. This ID is then also used in the output mmCIF\n    file. Specifying a list of IDs (e.g. `[\"A\", \"B\", \"C\"]`) implies a ligand\n    that has multiple copies.\n*   `ccdCodes: list[str]`: An optional list of CCD codes. These could be either\n    standard CCD codes, or custom codes pointing to the\n    [user-provided CCD](#user-provided-ccd).\n*   `smiles: str`: An optional string defining the ligand using a SMILES string.\n    The SMILES string must be correctly JSON-escaped.\n*   `description: str`: An optional textual description of this ligand. This\n    field is only used in the JSON format and serves as a comment\n    describing this ligand.\n\nEach ligand may be specified using CCD codes or SMILES but not both, i.e. for a\ngiven ligand, the `ccdCodes` and `smiles` fields are mutually exclusive.\n\n#### SMILES string JSON escaping\n\nThe SMILES string must be correctly JSON-escaped, in particular the backslash\ncharacter must be escaped as two backslashes, otherwise the JSON parser will\nfail with a `JSONDecodeError`. For instance, the following SMILES string\n`CCC[C@@H](O)CC\\C=C\\C=C\\C#CC#C\\C=C\\CO` has to be specified as:\n\n```json\n{\n  \"ligand\": {\n    \"id\": \"A\",\n    \"smiles\": \"CCC[C@@H](O)CC\\\\C=C\\\\C=C\\\\C#CC#C\\\\C=C\\\\CO\"\n  }\n}\n```\n\nYou can JSON-escape the SMILES string using the\n[`jq`](https://github.com/jqlang/jq) command-line tool which should be easily\ninstallable on most Linux systems:\n\n```bash\njq -R . 
<<< 'CCC[C@@H](O)CC\\C=C\\C=C\\C#CC#C\\C=C\\CO'  # Replace with your SMILES.\n```\n\nAlternatively, you can use this Python code:\n\n```python\nimport json\n\nsmiles = r'CCC[C@@H](O)CC\\C=C\\C=C\\C#CC#C\\C=C\\CO'  # Replace with your SMILES.\nprint(json.dumps(smiles))\n```\n\n#### Reference structure construction with SMILES\n\nFor some ligands and some random seeds, RDKit might fail to generate a\nconformer, indicated by the `Failed to construct RDKit reference structure`\nerror message. In this case, you can either provide a reference structure for\nthe ligand using the [user-provided CCD Format](#user-provided-ccd-format), or\ntry increasing the number of RDKit conformer iterations using the\n`--conformer_max_iterations=...` flag.\n\n### Ions\n\nIons are treated as ligands, e.g. a magnesium ion would simply be a ligand with\n`ccdCodes: [\"MG\"]`.\n\n## Multiple Sequence Alignment\n\nProtein and RNA chains allow setting a custom Multiple Sequence Alignment (MSA).\nIf not set, the data pipeline will automatically build MSAs for protein and RNA\nentities using Jackhmmer/Nhmmer search over genetic databases as described in\nthe paper.\n\n### RNA Multiple Sequence Alignment\n\nRNA `unpairedMsa` can be either:\n\n1.  Unset (or set explicitly to `null`). AlphaFold 3 will build MSA for this RNA\n    chain automatically. This is the recommended option.\n2.  Set to an empty string (`\"\"`). AlphaFold 3 won't build the MSA for this RNA\n    chain and the MSA input to the model will be just the RNA chain (equivalent\n    to running MSA-free for this RNA chain).\n3.  Set to a non-empty A3M string. AlphaFold 3 will use the provided MSA for\n    this RNA chain.\n\n### Protein Multiple Sequence Alignment\n\nFor protein chains, the situation is slightly more complicated due to paired and\nunpaired MSA (see [MSA Pairing](#msa-pairing) below for more details).\n\nThe following combinations are valid for a given protein chain:\n\n1.  
Both `unpairedMsa` and `pairedMsa` fields are unset (or set explicitly to\n    `null`), AlphaFold 3 will build both MSAs automatically. This is the\n    recommended option.\n2.  The `unpairedMsa` is set to a non-empty A3M string, `pairedMsa` set to an\n    empty string (`\"\"`). AlphaFold 3 won't build MSA, will use the `unpairedMsa`\n    as is and run `pairedMSA`-free.\n3.  The `pairedMsa` is set to a non-empty A3M string, `unpairedMsa` set to an\n    empty string (`\"\"`). AlphaFold 3 won't build MSA, will use the `pairedMsa`\n    and run `unpairedMSA`-free. **This option is not recommended**, see\n    [MSA Pairing](#msa-pairing) below.\n4.  Both `unpairedMsa` and `pairedMsa` fields are set to an empty string (`\"\"`).\n    AlphaFold 3 will not build the MSA and the MSA input to the model will be\n    just the query sequence (equivalent to running completely MSA-free).\n5.  Both `unpairedMsa` and `pairedMsa` fields are set to a custom non-empty A3M\n    string, AlphaFold 3 will use the provided MSA instead of building one as\n    part of the data pipeline. This is considered an expert option.\n\nNote that both `unpairedMsa` and `pairedMsa` have to either be *both* set (i.e.\nnon-`null`), or both unset (i.e. both `null`, explicitly or implicitly).\nTypically, when setting `unpairedMsa`, you will set the `pairedMsa` to an empty\nstring (`\"\"`). For example this will run the protein chain A with the given MSA,\nbut without any templates (template-free):\n\n```json\n{\n  \"protein\": {\n    \"id\": \"A\",\n    \"sequence\": ...,\n    \"unpairedMsa\": \"The A3M you want to run with\",\n    \"pairedMsa\": \"\",\n    \"templates\": []\n  }\n}\n```\n\nWhen setting your own MSA, you have to make sure that:\n\n1.  The MSA is in the A3M format. This means adhering to the FASTA format while\n    also allowing lowercase characters denoting inserted residues and hyphens\n    (`-`) denoting gaps in sequences.\n2.  
The first sequence is exactly equal to the query sequence.\n3.  If all insertions are removed from MSA hits (i.e. all lowercase letters are\n    removed), all sequences have exactly the same length as the query (they form\n    an exact rectangular matrix).\n\n### MSA Pairing\n\nMSA pairing matters only when folding multiple chains (multimers), since we need\nto find a way to concatenate MSAs for the individual chains along the sequence\ndimension. If done naively, by simply concatenating the individual MSA matrices\nalong the sequence dimension and padding so that all MSAs have the same depth,\none can end up with rows in the concatenated MSA that are formed by sequences\nfrom different organisms.\n\nIt may be desirable to ensure that across multiple chains, sequences in the MSA\nthat are from the same organism end up in the same MSA row. AlphaFold 3\ninternally achieves this by looking for the UniProt organism ID in the\n`pairedMsa` and pairing sequences based on this information.\n\nWe recommend users do the pairing manually or use the output of an appropriate\nsoftware and then provide the MSA using only the `unpairedMsa` field. This\nmethod gives exact control over the placement of each sequence in the MSA, as\nopposed to relying on name-matching post-processing heuristics used for\n`pairedMsa`.\n\nWhen setting `unpairedMsa` manually, the `pairedMsa` must be explicitly set to\nan empty string (`\"\"`).\n\nMake sure to run with `--resolve_msa_overlaps=false`. This prevents\ndeduplication of the unpaired MSA within each chain against the paired MSA\nsequences. 
Even if you set `pairedMsa` to an empty string, the query sequence(s)\nwill still be added in there and the deduplication procedure could destroy the\ncarefully crafted sequence positioning in the unpaired MSA.\n\nFor instance, if there are two chains `DEEP` and `MIND` which we want to be\npaired on organism A and C, we can achieve it as follows:\n\n```txt\n> query\nDEEP\n> match 1 (organism A)\nD--P\n> match 2 (organism B)\nDD-P\n> match 3 (organism C)\nDD-P\n```\n\n```txt\n> query\nMIND\n> match 1 (organism A)\nM--D\n> Empty hit to make sure pairing is achieved\n----\n> match 2 (organism C)\nMIN-\n```\n\nThe resulting MSA when chains are concatenated will then be:\n\n```txt\n> query\nDEEPMIND\n> match 1 + match 1\nD--PM--D\n> match 2 + padding\nDD-P----\n> match 3 + match 2\nDD-PMIN-\n```\n\n## Structural Templates\n\nStructural templates can be specified only for protein chains:\n\n```json\n\"templates\": [\n  {\n    \"mmcif\": ...,  # Mutually exclusive with mmcifPath.\n    \"mmcifPath\": ...,  # Mutually exclusive with mmcif.\n    \"queryIndices\": [0, 1, 2, 4, 5, 6],\n    \"templateIndices\": [0, 1, 2, 3, 4, 8]\n  }\n]\n```\n\nThe fields specify the following:\n\n*   `mmcif: str`: A string containing the single chain protein structural\n    template in the mmCIF format.\n*   `mmcifPath: str`: An optional path to a file that contains the mmCIF with\n    the structural template instead of providing it inline using the `mmcif`\n    field. The path can be either absolute, or relative to the input JSON path.\n    The file must be in the mmCIF format, and could be either plain text, or\n    compressed using gzip, xz, or zstd.\n*   `queryIndices: list[int]`: 0-based indices in the query sequence, defining\n    the mapping from query residues to template residues.\n*   `templateIndices: list[int]`: 0-based indices in the template sequence,\n    specifying the mapping from query residues to template residues defined in\n    the mmCIF file. 
Note that unresolved mmCIF residues must be taken into\n    account when specifying template indices.\n\nA template is specified as an mmCIF string containing a single chain with the\nstructural template together with a 0-based mapping that maps query residue\nindices to the template residue indices. The mapping is specified using two\nlists of the same length. E.g. to express a mapping `{0: 0, 1: 2, 2: 5, 3: 6}`,\nyou would specify the two indices lists as:\n\n```json\n\"queryIndices\":    [0, 1, 2, 3],\n\"templateIndices\": [0, 2, 5, 6]\n```\n\nNote that mmCIFs can have residues with missing atom coordinates (present in\nresidue tables but missing in the `_atom_site` table) – these must be taken into\naccount when specifying template indices. E.g. to align residues 4–7 in a\ntemplate with unresolved residues 1, 2, 3 and resolved residues 4, 5, 6, 7, you\nneed to set the template indices to 3, 4, 5, 6 (since 0-based indexing is used).\nAn example of a protein with unresolved residues 1–20 can be found here:\nhttps://www.rcsb.org/structure/8UXY.\n\nYou can provide multiple structural templates. Note that if an mmCIF containing\nmore than one chain is provided, you will get an error since it is not possible\nto determine which of the chains should be used as the template.\n\nYou can run template-free (but still run genetic search and build MSA) by\nsetting templates to `[]` and either explicitly setting both `unpairedMsa` and\n`pairedMsa` to `null`:\n\n```json\n\"protein\": {\n  \"id\": \"A\",\n  \"sequence\": ...,\n  \"pairedMsa\": null,\n  \"unpairedMsa\": null,\n  \"templates\": []\n}\n```\n\nOr you can simply fully omit them:\n\n```json\n\"protein\": {\n  \"id\": \"A\",\n  \"sequence\": ...,\n  \"templates\": []\n}\n```\n\nYou can also run with pre-computed MSA, but let AlphaFold 3 search for\ntemplates. This can be achieved by setting `unpairedMsa` and `pairedMsa`, but\nkeeping templates unset (or set to `null`). 
The profile given as an input to\nHmmsearch when searching for templates will be built from the provided\n`unpairedMsa`:\n\n```json\n\"protein\": {\n  \"id\": \"A\",\n  \"sequence\": ...,\n  \"unpairedMsa\": ...,\n  \"pairedMsa\": ...,\n  \"templates\": null\n}\n```\n\nOr you can simply fully omit the `templates` field thus setting it implicitly to\n`null`:\n\n```json\n\"protein\": {\n  \"id\": \"A\",\n  \"sequence\": ...,\n  \"unpairedMsa\": ...,\n  \"pairedMsa\": ...,\n}\n```\n\n## Bonds\n\nTo manually specify covalent bonds, use the `bondedAtomPairs` field. This is\nintended for modelling covalent ligands, and for defining multi-CCD ligands\n(e.g. glycans). Defining covalent bonds between or within polymer entities is\nnot currently supported.\n\nBonds are specified as pairs of (source atom, destination atom), with each atom\nbeing uniquely addressed using 3 fields:\n\n*   **Entity ID** (`str`): this corresponds to the `id` field for that entity.\n*   **Residue ID** (`int`): this is 1-based residue index *within* the chain.\n    For single-residue ligands, this is simply set to 1.\n*   **Atom name** (`str`): this is the unique atom name *within* the given\n    residue. The atom name for protein/RNA/DNA residues or CCD ligands can be\n    looked up in the CCD for the given chemical component. This also explains\n    why SMILES ligands don't support bonds: there is no atom name that could be\n    used to define the bond. This shortcoming can be addressed by using the\n    user-provided CCD format (see below).\n\nThe example below shows two bonds:\n\n```json\n\"bondedAtomPairs\": [\n  [[\"A\", 145, \"SG\"], [\"L\", 1, \"C04\"]],\n  [[\"J\", 1, \"O6\"], [\"J\", 2, \"C1\"]]\n]\n```\n\nThe first bond is between chain A, residue 145, atom SG and chain L, residue 1,\natom C04. This is a typical example for a covalent ligand. The second bond is\nbetween chain J, residue 1, atom O6 and chain J, residue 2, atom C1. 
This bond\nis within the same entity and is a typical example when defining a glycan.\n\nAll bonds are implicitly assumed to be covalent bonds. Other bond types are not\nsupported.\n\n### Defining Glycans\n\nGlycans are bound to a protein residue, and they are typically formed of\nmultiple chemical components. To define a glycan, define a new ligand with all\nof the chemical components of the glycan. Then define a bond that links the\nglycan to the protein residue, and all bonds that are within the glycan between\nits individual chemical components.\n\nFor example, to define the following glycan composed of 4 components (CMP1,\nCMP2, CMP3, CMP4) bound to an asparagine in a protein chain A:\n\n```\n ⋮\nALA            CMP4\n |              |\nASN ―― CMP1 ―― CMP2\n |              |\nALA            CMP3\n ⋮\n```\n\nYou will need to specify:\n\n1.  Protein chain A.\n2.  Ligand chain B with the 4 components.\n3.  Bonds ASN-CMP1, CMP1-CMP2, CMP2-CMP3, CMP2-CMP4.\n\n## User-provided CCD\n\nThere are two approaches to model a custom ligand not defined in the CCD:\n\n1.  If the ligand is not bonded to other entities, it can be defined using a\n    [SMILES string](https://en.wikipedia.org/wiki/Simplified_Molecular_Input_Line_Entry_System).\n2.  If it is bonded to other entities, or to be able to customise relevant\n    features (such as bond orders, atom names and ideal coordinates used when\n    conformer generation fails), it is necessary to define that particular\n    ligand using the\n    [CCD mmCIF format](https://www.wwpdb.org/data/ccd#mmcifFormat).\n\nNote that if a full CCD mmCIF is provided, any SMILES string input as part of\nthat mmCIF is ignored.\n\nOnce defined, this ligand needs to be assigned a name that doesn't clash with\nexisting CCD ligand names (e.g. `LIG-1`). 
Avoid underscores (`_`) in the name,\nas it could cause issues in the mmCIF format.\n\nThe newly defined ligand can then be used as a standard CCD ligand using its\ncustom name, and bonds can be linked to it using its named atom scheme.\n\n### Conformer Generation\n\nThe data pipeline attempts to generate a conformer for ligands using RDKit. The\n`Mol` used to generate the conformer is constructed either from the information\nprovided in the CCD mmCIF, or from the SMILES string if that is the only\ninformation provided.\n\nIf conformer generation fails, the model will fall back to using the ideal\ncoordinates in the CCD mmCIF if these are provided. If they are not provided,\nthe model will use the reference coordinates if the last modification date given\nin the CCD mmCIF is prior to the training cutoff date. If no coordinates can be\nfound in this way, all conformer coordinates are set to zero and the model will\noutput `NaN` (`null` in the output JSON) confidences for the ligand.\n\nNote that sometimes conformer generation failures can be resolved by\nincreasing the number of RDKit conformer iterations using the\n`--conformer_max_iterations=...` flag.\n\n### User-provided CCD Format\n\nThe user-provided CCD must be passed either:\n\n*   In the `userCCD` field (in the root of the input JSON) as a string. Note\n    that JSON doesn't allow newlines within strings, so newline characters\n    (`\\n`) must be used to delimit lines. Single rather than double quotes\n    should also be used around strings like the chemical formula.\n*   In the `userCCDPath` field, as a path to a file that contains the\n    user-provided chemical components dictionary. The path can be either\n    absolute, or relative to the input JSON path. 
The file must be in the\n    [CCD mmCIF format](https://www.wwpdb.org/data/ccd#mmcifFormat), and could be\n    either plain text, or compressed using gzip, xz, or zstd.\n\nThe main pieces of information used are the atom names and elements, bonds, and\nalso the ideal coordinates (`pdbx_model_Cartn_{x,y,z}_ideal`) which essentially\nserve as a structural template for the ligand if RDKit fails to generate\nconformers for that ligand.\n\nThe user-provided CCD can also be used to redefine standard chemical components\nin the CCD. This can be useful if you need to redefine the ideal coordinates.\n\nBelow is an example user-provided CCD redefining component X7F, which serves to\nillustrate the required sections. For readability purposes, newlines have not\nbeen replaced by `\\n`.\n\n```\ndata_MY-X7F\n#\n_chem_comp.id MY-X7F\n_chem_comp.name '5,8-bis(oxidanyl)naphthalene-1,4-dione'\n_chem_comp.type non-polymer\n_chem_comp.formula 'C10 H6 O4'\n_chem_comp.mon_nstd_parent_comp_id ?\n_chem_comp.pdbx_synonyms ?\n_chem_comp.formula_weight 190.152\n#\nloop_\n_chem_comp_atom.comp_id\n_chem_comp_atom.atom_id\n_chem_comp_atom.type_symbol\n_chem_comp_atom.charge\n_chem_comp_atom.pdbx_leaving_atom_flag\n_chem_comp_atom.pdbx_model_Cartn_x_ideal\n_chem_comp_atom.pdbx_model_Cartn_y_ideal\n_chem_comp_atom.pdbx_model_Cartn_z_ideal\nMY-X7F C02 C 0 N -1.418 -1.260 0.018\nMY-X7F C03 C 0 N -0.665 -2.503 -0.247\nMY-X7F C04 C 0 N 0.677 -2.501 -0.235\nMY-X7F C05 C 0 N 1.421 -1.257 0.043\nMY-X7F C06 C 0 N 0.706 0.032 0.008\nMY-X7F C07 C 0 N -0.706 0.030 -0.004\nMY-X7F C08 C 0 N -1.397 1.240 -0.037\nMY-X7F C10 C 0 N -0.685 2.443 -0.057\nMY-X7F C11 C 0 N 0.679 2.445 -0.045\nMY-X7F C12 C 0 N 1.394 1.243 -0.013\nMY-X7F O01 O 0 N -2.611 -1.301 0.247\nMY-X7F O09 O 0 N -2.752 1.249 -0.049\nMY-X7F O13 O 0 N 2.750 1.257 -0.001\nMY-X7F O14 O 0 N 2.609 -1.294 0.298\nMY-X7F H1 H 0 N -1.199 -3.419 -0.452\nMY-X7F H2 H 0 N 1.216 -3.416 -0.429\nMY-X7F H3 H 0 N -1.221 3.381 -0.082\nMY-X7F H4 H 0 N 1.212 3.384 
-0.062\nMY-X7F H5 H 0 N -3.154 1.271 0.830\nMY-X7F H6 H 0 N 3.151 1.241 -0.880\n#\nloop_\n_chem_comp_bond.atom_id_1\n_chem_comp_bond.atom_id_2\n_chem_comp_bond.value_order\n_chem_comp_bond.pdbx_aromatic_flag\nO01 C02 DOUB N\nO09 C08 SING N\nC02 C03 SING N\nC02 C07 SING N\nC03 C04 DOUB N\nC08 C07 DOUB Y\nC08 C10 SING Y\nC07 C06 SING Y\nC10 C11 DOUB Y\nC04 C05 SING N\nC06 C05 SING N\nC06 C12 DOUB Y\nC11 C12 SING Y\nC05 O14 DOUB N\nC12 O13 SING N\nC03 H1 SING N\nC04 H2 SING N\nC10 H3 SING N\nC11 H4 SING N\nO09 H5 SING N\nO13 H6 SING N\n#\n```\n\n### Mandatory fields\n\nParsing the user-provided CCD needs only a subset of the fields that CCD uses.\nThe mandatory fields are described below. Refer to\n[CCD documentation](https://www.wwpdb.org/data/ccd#mmcifFormat) for more\ndetailed explanation of each field. Note that not all of these fields are input\nto the model, but they are necessary for the data pipeline to run – see the\n[Model input fields](#model-input-fields) section below.\n\n**Singular fields (containing just a single value)**\n\n*   `_chem_comp.id`: The ID of the component. Must match the `data_` record and\n    must not contain special CIF characters (like `_` or `#`).\n*   `_chem_comp.name`: Optional full name of the component. If unknown, set to\n    `?`.\n*   `_chem_comp.type`: Type of the component, typically `non-polymer`.\n*   `_chem_comp.formula`: Optional component formula. If unknown, set to `?`.\n*   `_chem_comp.mon_nstd_parent_comp_id`: Optional parent component ID. If\n    unknown, set to `?`.\n*   `_chem_comp.pdbx_synonyms`: Optional synonym IDs. If unknown, set to `?`.\n*   `_chem_comp.formula_weight`: Optional weight of the component. 
If unknown,\n    set to `?`.\n\n**Per-atom fields (containing one record per atom)**\n\n*   `_chem_comp_atom.comp_id`: Component ID.\n*   `_chem_comp_atom.atom_id`: Atom ID.\n*   `_chem_comp_atom.type_symbol`: Atom element type.\n*   `_chem_comp_atom.charge`: Atom charge.\n*   `_chem_comp_atom.pdbx_leaving_atom_flag`: Optional flag determining whether\n    this is a leaving atom. If unset, assumed to be no (`N`) for all atoms.\n*   `_chem_comp_atom.pdbx_model_Cartn_x_ideal`: Ideal x coordinate.\n*   `_chem_comp_atom.pdbx_model_Cartn_y_ideal`: Ideal y coordinate.\n*   `_chem_comp_atom.pdbx_model_Cartn_z_ideal`: Ideal z coordinate.\n\n**Per-bond fields (containing one record per bond)**\n\n*   `_chem_comp_bond.atom_id_1`: The ID of the first of the two atoms that\n    define the bond.\n*   `_chem_comp_bond.atom_id_2`: The ID of the second of the two atoms that\n    define the bond.\n*   `_chem_comp_bond.value_order`: The bond order of the chemical bond\n    associated with the specified atoms.\n*   `_chem_comp_bond.pdbx_aromatic_flag`: Whether the bond is aromatic.\n\n### Model input fields\n\nThe following fields are used to generate input for the model:\n\n*   `_chem_comp_atom.atom_id`: Atom ID.\n*   `_chem_comp_atom.type_symbol`: Atom element type.\n*   `_chem_comp_atom.charge`: Atom charge.\n*   `_chem_comp_atom.pdbx_model_Cartn_x_ideal`: Ideal x coordinate. Only used if\n    conformer generation fails.\n*   `_chem_comp_atom.pdbx_model_Cartn_y_ideal`: Ideal y coordinate. Only used if\n    conformer generation fails.\n*   `_chem_comp_atom.pdbx_model_Cartn_z_ideal`: Ideal z coordinate. 
Only used if\n    conformer generation fails.\n*   `_chem_comp_bond.atom_id_1`: The ID of the first of the two atoms that\n    define the bond.\n*   `_chem_comp_bond.atom_id_2`: The ID of the second of the two atoms that\n    define the bond.\n\n## Full Example\n\nAn example illustrating all the aspects of the input format is provided below.\nNote that AlphaFold 3 won't run this input out of the box as it abbreviates\ncertain fields and the sequences are not biologically meaningful.\n\n```json\n{\n  \"name\": \"Hello fold\",\n  \"modelSeeds\": [10, 42],\n  \"sequences\": [\n    {\n      \"protein\": {\n        \"id\": \"A\",\n        \"sequence\": \"PVLSCGEWQL\",\n        \"modifications\": [\n          {\"ptmType\": \"HY3\", \"ptmPosition\": 1},\n          {\"ptmType\": \"P1L\", \"ptmPosition\": 5}\n        ],\n        \"description\": \"10-residue protein with 2 modifications\",\n        \"unpairedMsa\": ...,\n        \"pairedMsa\": \"\"\n      }\n    },\n    {\n      \"protein\": {\n        \"id\": \"B\",\n        \"sequence\": \"RPACQLW\",\n        \"templates\": [\n          {\n            \"mmcif\": ...,\n            \"queryIndices\": [0, 1, 2, 4, 5, 6],\n            \"templateIndices\": [0, 1, 2, 3, 4, 8]\n          }\n        ]\n      }\n    },\n    {\n      \"dna\": {\n        \"id\": \"C\",\n        \"sequence\": \"GACCTCT\",\n        \"modifications\": [\n          {\"modificationType\": \"6OG\", \"basePosition\": 1},\n          {\"modificationType\": \"6MA\", \"basePosition\": 2}\n        ]\n      }\n    },\n    {\n      \"rna\": {\n        \"id\": \"E\",\n        \"sequence\": \"AGCU\",\n        \"modifications\": [\n          {\"modificationType\": \"2MG\", \"basePosition\": 1},\n          {\"modificationType\": \"5MC\", \"basePosition\": 4}\n        ],\n        \"unpairedMsa\": ...\n      }\n    },\n    {\n      \"ligand\": {\n        \"id\": [\"F\", \"G\", \"H\"],\n        \"ccdCodes\": [\"ATP\"]\n      }\n    },\n    {\n      \"ligand\": {\n        
\"id\": \"I\",\n        \"ccdCodes\": [\"NAG\", \"FUC\"]\n      }\n    },\n    {\n      \"ligand\": {\n        \"id\": \"Z\",\n        \"smiles\": \"CC(=O)OC1C[NH+]2CCC1CC2\"\n      }\n    }\n  ],\n  \"bondedAtomPairs\": [\n    [[\"A\", 1, \"CA\"], [\"G\", 1, \"CHA\"]],\n    [[\"I\", 1, \"O6\"], [\"I\", 2, \"C1\"]]\n  ],\n  \"userCCD\": ...,\n  \"dialect\": \"alphafold3\",\n  \"version\": 4\n}\n```\n"
  },
  {
    "path": "docs/installation.md",
    "content": "# Installation and Running Your First Prediction\n\nYou will need a machine running Linux; AlphaFold 3 does not support other\noperating systems. Full installation requires up to 1 TB of disk space to keep\ngenetic databases (SSD storage is recommended) and an NVIDIA GPU with Compute\nCapability 8.0 or greater (GPUs with more memory can predict larger protein\nstructures). We have verified that inputs with up to 5,120 tokens can fit on a\nsingle NVIDIA A100 80 GB, or a single NVIDIA H100 80 GB. We have verified\nnumerical accuracy on both NVIDIA A100 and H100 GPUs.\n\nEspecially for long targets, the genetic search stage can consume a lot of RAM –\nwe recommend running with at least 64 GB of RAM.\n\nWe provide installation instructions for a machine with an NVIDIA A100 80 GB GPU\nand a clean Ubuntu 22.04 LTS installation, and expect that these instructions\nshould aid others with different setups. If you are installing locally outside\nof a Docker container, please ensure CUDA, cuDNN, and JAX are correctly\ninstalled; the\n[JAX installation documentation](https://jax.readthedocs.io/en/latest/installation.html#nvidia-gpu)\nis a useful reference for this case. Please note that the Docker container\nrequires that the host machine has CUDA 12.6 installed.\n\nThe instructions provided below describe how to:\n\n1.  Provision a machine on GCP.\n1.  Install Docker.\n1.  Install NVIDIA drivers for an A100.\n1.  Obtain genetic databases.\n1.  Obtain model parameters.\n1.  
Build the AlphaFold 3 Docker container or Singularity image.\n\n## Provisioning a Machine\n\nClean Ubuntu images are available on Google Cloud, AWS, Azure, and other major\nplatforms.\n\nUsing an existing Google Cloud project, we provisioned a new machine:\n\n*   We recommend using `--machine-type a2-ultragpu-1g` but feel free to use\n    `--machine-type a2-highgpu-1g` for smaller predictions.\n*   If desired, replace `--zone us-central1-a` with a zone that has quota for\n    the machine you have selected. See\n    [gpu-regions-zones](https://cloud.google.com/compute/docs/gpus/gpu-regions-zones).\n\n```sh\ngcloud compute instances create alphafold3 \\\n    --machine-type a2-ultragpu-1g \\\n    --zone us-central1-a \\\n    --image-family ubuntu-2204-lts \\\n    --image-project ubuntu-os-cloud \\\n    --maintenance-policy TERMINATE \\\n    --boot-disk-size 1000 \\\n    --boot-disk-type pd-balanced\n```\n\nThis provisions a bare Ubuntu 22.04 LTS image on an\n[A2 Ultra](https://cloud.google.com/compute/docs/accelerator-optimized-machines#a2-vms)\nmachine with 12 CPUs, 170 GB RAM, 1 TB disk and NVIDIA A100 80 GB GPU attached.\nWe verified the following installation steps from this point.\n\n## Installing Docker\n\nThese instructions are for rootless Docker.\n\n### Installing Docker on Host\n\nNote these instructions only apply to Ubuntu 22.04 LTS images, see above.\n\nAdd Docker's official GPG key. 
Official Docker instructions are\n[here](https://docs.docker.com/engine/install/ubuntu/#install-using-the-repository).\nThe commands we ran are:\n\n```sh\nsudo apt-get update\nsudo apt-get install ca-certificates curl\nsudo install -m 0755 -d /etc/apt/keyrings\nsudo curl -fsSL https://download.docker.com/linux/ubuntu/gpg -o /etc/apt/keyrings/docker.asc\nsudo chmod a+r /etc/apt/keyrings/docker.asc\n```\n\nAdd the repository to apt sources:\n\n```sh\necho \\\n  \"deb [arch=$(dpkg --print-architecture) signed-by=/etc/apt/keyrings/docker.asc] https://download.docker.com/linux/ubuntu \\\n  $(. /etc/os-release && echo \"$VERSION_CODENAME\") stable\" | \\\n  sudo tee /etc/apt/sources.list.d/docker.list > /dev/null\nsudo apt-get update\nsudo apt-get install -y docker-ce docker-ce-cli containerd.io docker-buildx-plugin docker-compose-plugin\nsudo docker run hello-world\n```\n\n### Enabling Rootless Docker\n\nOfficial Docker instructions are\n[here](https://docs.docker.com/engine/security/rootless/#distribution-specific-hint).\nThe commands we ran are:\n\n```sh\nsudo apt-get install -y uidmap systemd-container\n\nsudo machinectl shell $(whoami)@ /bin/bash -c 'dockerd-rootless-setuptool.sh install && sudo loginctl enable-linger $(whoami) && DOCKER_HOST=unix:///run/user/1001/docker.sock docker context use rootless'\n```\n\n## Installing GPU Support\n\n### Installing NVIDIA Drivers\n\nOfficial Ubuntu instructions are\n[here](https://documentation.ubuntu.com/server/how-to/graphics/install-nvidia-drivers/).\nThe commands we ran are:\n\n```sh\nsudo apt-get -y install alsa-utils ubuntu-drivers-common\nsudo ubuntu-drivers install\n\nsudo nvidia-smi --gpu-reset\n\nnvidia-smi  # Check that the drivers are installed.\n```\n\nAccept the \"Pending kernel upgrade\" dialog if it appears.\n\nYou will need to reboot the instance with `sudo reboot now` to reset the GPU if\nyou see the following warning:\n\n```text\nNVIDIA-SMI has failed because it couldn't communicate with the NVIDIA 
driver.\nMake sure that the latest NVIDIA driver is installed and running.\n```\n\nProceed only if `nvidia-smi` has a sensible output.\n\n### Installing NVIDIA Support for Docker\n\nOfficial NVIDIA instructions are\n[here](https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/install-guide.html).\nThe commands we ran are:\n\n```sh\ncurl -fsSL https://nvidia.github.io/libnvidia-container/gpgkey | sudo gpg --dearmor -o /usr/share/keyrings/nvidia-container-toolkit-keyring.gpg \\\n  && curl -s -L https://nvidia.github.io/libnvidia-container/stable/deb/nvidia-container-toolkit.list | \\\n    sed 's#deb https://#deb [signed-by=/usr/share/keyrings/nvidia-container-toolkit-keyring.gpg] https://#g' | \\\n    sudo tee /etc/apt/sources.list.d/nvidia-container-toolkit.list\nsudo apt-get update\nsudo apt-get install -y nvidia-container-toolkit\nnvidia-ctk runtime configure --runtime=docker --config=$HOME/.config/docker/daemon.json\nsystemctl --user restart docker\nsudo nvidia-ctk config --set nvidia-container-cli.no-cgroups --in-place\n```\n\nCheck that your container can see the GPU:\n\n```sh\ndocker run --rm --gpus all nvidia/cuda:12.6.0-base-ubuntu22.04 nvidia-smi\n```\n\nExample output:\n\n```text\nMon Nov  11 12:00:00 2024\n+-----------------------------------------------------------------------------------------+\n| NVIDIA-SMI 550.120                Driver Version: 550.120        CUDA Version: 12.6     |\n|-----------------------------------------+------------------------+----------------------+\n| GPU  Name                 Persistence-M | Bus-Id          Disp.A | Volatile Uncorr. ECC |\n| Fan  Temp   Perf          Pwr:Usage/Cap |           Memory-Usage | GPU-Util  Compute M. |\n|                                         |                        |               MIG M. 
|\n|=========================================+========================+======================|\n|   0  NVIDIA A100-SXM4-80GB          Off |   00000000:00:05.0 Off |                    0 |\n| N/A   34C    P0             51W /  400W |       1MiB /  81920MiB |      0%      Default |\n|                                         |                        |             Disabled |\n+-----------------------------------------+------------------------+----------------------+\n\n+-----------------------------------------------------------------------------------------+\n| Processes:                                                                              |\n|  GPU   GI   CI        PID   Type   Process name                              GPU Memory |\n|        ID   ID                                                               Usage      |\n|=========================================================================================|\n|  No running processes found                                                             |\n+-----------------------------------------------------------------------------------------+\n```\n\n## Obtaining AlphaFold 3 Source Code\n\nInstall `git` and download the AlphaFold 3 repository:\n\n```sh\ngit clone https://github.com/google-deepmind/alphafold3.git\n```\n\n## Obtaining Genetic Databases\n\nThis step requires `wget` and `zstd` to be installed on your machine. 
On\nDebian-based systems install them by running `sudo apt install wget zstd`.\n\nAlphaFold 3 needs multiple genetic (sequence) protein and RNA databases to run:\n\n*   [BFD small](https://bfd.mmseqs.com/)\n*   [MGnify](https://www.ebi.ac.uk/metagenomics/)\n*   [PDB](https://www.rcsb.org/) (structures in the mmCIF format)\n*   [PDB seqres](https://www.rcsb.org/)\n*   [UniProt](https://www.uniprot.org/uniprot/)\n*   [UniRef90](https://www.uniprot.org/help/uniref)\n*   [NT](https://www.ncbi.nlm.nih.gov/nucleotide/)\n*   [RFam](https://rfam.org/)\n*   [RNACentral](https://rnacentral.org/)\n\nWe provide a bash script `fetch_databases.sh` that can be used to download and\nset up all of these databases. This process takes around 45 minutes when not\ninstalling on local SSD. We recommend running the following in a `screen` or\n`tmux` session as downloading and decompressing the databases takes some time.\n\n```sh\ncd alphafold3  # Navigate to the directory with cloned AlphaFold 3 repository.\n./fetch_databases.sh [<DB_DIR>]\n```\n\nThis script downloads the databases from a mirror hosted on GCS, with all\nversions being the same as used in the AlphaFold 3 paper, to the directory\n`<DB_DIR>`. If not specified, the default `<DB_DIR>` is\n`$HOME/public_databases`.\n\n:ledger: **Note: The download directory `<DB_DIR>` should *not* be a\nsubdirectory in the AlphaFold 3 repository directory.** If it is, the Docker\nbuild will be slow as the large databases will be copied during the image\ncreation.\n\n:ledger: **Note: The total download size for the full databases is around 252 GB\nand the total size when unzipped is 630 GB. Please make sure you have sufficient\nhard drive space, bandwidth, and time to download. We recommend using an SSD for\nbetter genetic search performance.**\n\n:ledger: **Note: If the download directory and datasets don't have full read and\nwrite permissions, it can cause errors with the MSA tools, with opaque\n(external) error messages. 
Please ensure the required permissions are applied,\ne.g. with the `sudo chmod 755 --recursive <DB_DIR>` command.**\n\nOnce the script has finished, you should have the following directory structure:\n\n```sh\nmmcif_files/  # Directory containing ~200k PDB mmCIF files.\nbfd-first_non_consensus_sequences.fasta\nmgy_clusters_2022_05.fa\nnt_rna_2023_02_23_clust_seq_id_90_cov_80_rep_seq.fasta\npdb_seqres_2022_09_28.fasta\nrfam_14_9_clust_seq_id_90_cov_80_rep_seq.fasta\nrnacentral_active_seq_id_90_cov_80_linclust.fasta\nuniprot_all_2021_04.fa\nuniref90_2022_05.fa\n```\n\nOptionally, after the script finishes, you may want to copy databases to an SSD.\nYou can use these two scripts:\n\n*   `src/scripts/gcp_mount_ssd.sh [<SSD_MOUNT_PATH>]` Mounts and formats an\n    unmounted GCP SSD drive to the specified path. It will skip either step\n    if the disk is either already formatted or already mounted. The default\n    `<SSD_MOUNT_PATH>` is `/mnt/disks/ssd`.\n*   `src/scripts/copy_to_ssd.sh [<DB_DIR>] [<SSD_DB_DIR>]` this will copy as\n    many files as it can fit on to the SSD. The default `<DB_DIR>` is\n    `$HOME/public_databases`, and must match the path used in the\n    `fetch_databases.sh` command above, and the default `<SSD_DB_DIR>` is\n    `/mnt/disks/ssd/public_databases`.\n\n## Obtaining Model Parameters\n\nTo request access to the AlphaFold 3 model parameters, please complete\n[this form](https://forms.gle/svvpY4u2jsHEwWYS6). Access will be granted at\nGoogle DeepMind’s sole discretion. We will aim to respond to requests within 2–3\nbusiness days. You may only use AlphaFold 3 model parameters if received\ndirectly from Google. Use is subject to these\n[terms of use](https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md).\n\nOnce access has been granted, download the model parameters to a directory of\nyour choosing, referred to as `<MODEL_PARAMETERS_DIR>` in the following\ninstructions. 
As with the databases, this should *not* be a subdirectory in the\nAlphaFold 3 repository directory.\n\n## Building the Docker Container That Will Run AlphaFold 3\n\nThen, build the Docker container. This builds a container with all the right\npython dependencies:\n\n```sh\ndocker build -t alphafold3 -f docker/Dockerfile .\n```\n\nIf you hit `No file descriptors available (os error 24)` on systems like\nAlmaLinux/Rocky/RHEL, you need to manually expand the file descriptor limits\nduring the build by appending `--ulimit nofile=65535:65535`:\n\n```sh\ndocker build --ulimit nofile=65535:65535 -t alphafold3 -f docker/Dockerfile .\n```\n\nCreate an input JSON file, using either the example in the\n[README](https://github.com/google-deepmind/alphafold3?tab=readme-ov-file#installation-and-running-your-first-prediction)\nor a\n[custom input](https://github.com/google-deepmind/alphafold3/blob/main/docs/input.md),\nand place it in a directory, e.g. `$HOME/af_input`. You can now run AlphaFold 3!\n\n```sh\ndocker run -it \\\n    --volume $HOME/af_input:/root/af_input \\\n    --volume $HOME/af_output:/root/af_output \\\n    --volume <MODEL_PARAMETERS_DIR>:/root/models \\\n    --volume <DB_DIR>:/root/public_databases \\\n    --gpus all \\\n    alphafold3 \\\n    python run_alphafold.py \\\n    --json_path=/root/af_input/fold_input.json \\\n    --model_dir=/root/models \\\n    --output_dir=/root/af_output\n```\n\nwhere `$HOME/af_input` is the directory containing the input JSON file;\n`$HOME/af_output` is the directory where the output will be written to; and\n`<DB_DIR>` and `<MODEL_PARAMETERS_DIR>` are the directories containing the\ndatabases and model parameters. 
The values of these directories must match the\ndirectories used in previous steps for downloading databases and model weights,\nand for the input file.\n\n:ledger: Note: You may also need to create the output directory,\n`$HOME/af_output`, before running the `docker` command and make it and\nthe input directory writable from the docker container, e.g. by running `chmod\n755 $HOME/af_input $HOME/af_output`. In most cases `docker` and\n`run_alphafold.py` will create the output directory if it does not exist.\n\n:ledger: **Note: In the example above the databases have been placed on the\npersistent disk, which is slow.** If you want better genetic and template search\nperformance, make sure all databases are placed on a local SSD.\n\nIf you have some databases on an SSD in the `<SSD_DB_DIR>` directory and some\ndatabases on a slower disk in the `<DB_DIR>` directory, you can mount both\ndirectories and specify `db_dir` multiple times. This will enable fast\naccess to databases with a fallback to the larger, slower disk:\n\n```sh\ndocker run -it \\\n    --volume $HOME/af_input:/root/af_input \\\n    --volume $HOME/af_output:/root/af_output \\\n    --volume <MODEL_PARAMETERS_DIR>:/root/models \\\n    --volume <SSD_DB_DIR>:/root/public_databases \\\n    --volume <DB_DIR>:/root/public_databases_fallback \\\n    --gpus all \\\n    alphafold3 \\\n    python run_alphafold.py \\\n    --json_path=/root/af_input/fold_input.json \\\n    --model_dir=/root/models \\\n    --db_dir=/root/public_databases \\\n    --db_dir=/root/public_databases_fallback \\\n    --output_dir=/root/af_output\n```\n\nIf you get an error like the following, make sure the models and data are in the\npaths (flags named `--volume` above) in the correct locations.\n\n```\ndocker: Error response from daemon: error while creating mount source path '/srv/alphafold3_data/models': mkdir /srv/alphafold3_data/models: permission denied.\n```\n\n`run_alphafold.py` supports many flags for controlling 
performance, running on\nmultiple input files, specifying external binary paths, and more. See\n\n```sh\ndocker run alphafold3 python run_alphafold.py --help\n```\n\nfor more information.\n\n## Running Using Singularity Instead of Docker\n\nYou may prefer to run AlphaFold 3 within Singularity. You'll still need to\n*build* the Singularity image from the Docker container. Afterwards, you will\nnot have to depend on Docker (at structure prediction time).\n\n### Install Singularity\n\nOfficial Singularity instructions are\n[here](https://docs.sylabs.io/guides/3.3/user-guide/installation.html). The\ncommands we ran are:\n\n```sh\nwget https://github.com/sylabs/singularity/releases/download/v4.2.1/singularity-ce_4.2.1-jammy_amd64.deb\nsudo dpkg --install singularity-ce_4.2.1-jammy_amd64.deb\nsudo apt-get install -f\n```\n\n### Build the Singularity Container From the Docker Image\n\nAfter building the *Docker* container above with `docker build -t`, start a\nlocal Docker registry and upload your image `alphafold3` to it. 
Singularity's\ninstructions are [here](https://github.com/apptainer/singularity/issues/1537).\nThe commands we ran are:\n\n```sh\ndocker run -d -p 5000:5000 --restart=always --name registry registry:2\ndocker tag alphafold3 localhost:5000/alphafold3\ndocker push localhost:5000/alphafold3\n```\n\nThen build the Singularity container:\n\n```sh\nSINGULARITY_NOHTTPS=1 singularity build alphafold3.sif docker://localhost:5000/alphafold3:latest\n```\n\nYou can confirm your build by starting a shell and inspecting the environment.\nFor example, you may want to ensure the Singularity image can access your GPU.\nYou may want to restart your computer if you have issues with this.\n\n```sh\nsingularity exec --nv alphafold3.sif sh -c 'nvidia-smi'\n```\n\nYou can now run AlphaFold 3!\n\n```sh\nsingularity exec --nv alphafold3.sif <<args>>\n```\n\nFor example:\n\n```sh\nsingularity exec \\\n     --nv \\\n     --bind $HOME/af_input:/root/af_input \\\n     --bind $HOME/af_output:/root/af_output \\\n     --bind <MODEL_PARAMETERS_DIR>:/root/models \\\n     --bind <DB_DIR>:/root/public_databases \\\n     alphafold3.sif \\\n     python run_alphafold.py \\\n     --json_path=/root/af_input/fold_input.json \\\n     --model_dir=/root/models \\\n     --db_dir=/root/public_databases \\\n     --output_dir=/root/af_output\n```\n\nOr with some databases on SSD in location `<SSD_DB_DIR>`:\n\n```sh\nsingularity exec \\\n     --nv \\\n     --bind $HOME/af_input:/root/af_input \\\n     --bind $HOME/af_output:/root/af_output \\\n     --bind <MODEL_PARAMETERS_DIR>:/root/models \\\n     --bind <SSD_DB_DIR>:/root/public_databases \\\n     --bind <DB_DIR>:/root/public_databases_fallback \\\n     alphafold3.sif \\\n     python run_alphafold.py \\\n     --json_path=/root/af_input/fold_input.json \\\n     --model_dir=/root/models \\\n     --db_dir=/root/public_databases \\\n     --db_dir=/root/public_databases_fallback \\\n     --output_dir=/root/af_output\n```\n"
  },
  {
    "path": "docs/known_issues.md",
    "content": "# Known Issues\n\n## Numerical performance for CUDA Capability 7.x GPUs\n\nAll CUDA Capability 7.x GPUs (e.g. V100) produce obviously bad output, with lots\nof clashing residues (the clashes cause a ranking score of -99 or lower), unless\nthe environment variable `XLA_FLAGS` is set to include\n`--xla_disable_hlo_passes=custom-kernel-fusion-rewriter`.\n\n## Incorrect handling of two-letter atoms in SMILES ligands\n\nBetween commits https://github.com/google-deepmind/alphafold3/commit/f8df1c7 and\nhttps://github.com/google-deepmind/alphafold3/commit/4e4023c, AlphaFold 3\nincorrectly handled any two-letter atoms (e.g. Cl, Br) in ligands defined using\nSMILES strings.\n\n## MSA discrepancy between AlphaFold 3 and AlphaFold Server\n\n### The root cause of the problem\n\nThe released AlphaFold 3 and AlphaFold Server use the same model weights and\nequivalent featurisation and model code. However, the way they run genetic\nsearch is slightly different. The released AlphaFold 3 searches each database in\none go, while AlphaFold Server has a sharded version of each database (split\ninto multiple smaller FASTA files) and searches all of the shards in parallel.\nThe results of these parallel searches are then merged together at the end.\n\nThe discrepancy is caused by a different (deeper) MSA on AlphaFold Server in\nsome cases. We discovered that the issue is caused by running sharded Jackhmmer\nin AlphaFold Server without the `--domZ` flag (has to be set together with the\n`--Z` flag and set to the same value) which means that effectively the AlphaFold\nServer is running with a roughly 100× more permissive `--domE` filter. This\nmeans more sequences are sometimes included in the MSA.\n\nWe are keeping behaviour unchanged in both the released AlphaFold 3 and in the\nAlphaFold Server; however, we are giving users with local installs an option to\nreplicate AlphaFold Server behaviour locally. 
In our large scale tests the\ndifference did not matter, it is only very specific inputs that get better\naccuracy with the deeper MSA.\n\nSee https://github.com/google-deepmind/alphafold3/issues/492 for an example\ninput where a protein-DNA complex gets significantly higher ipTM and pTM with\nAlphaFold Server compared to a local run.\n\n### Replicating AlphaFold Server behaviour locally\n\nIf you want to replicate AlphaFold Server behaviour (i.e. better folding\naccuracy in some cases), you can increase the value of the Jackhmmer/Nhmmer\n`--domE` flag by 100× compared to its default value.\n\nAlternatively, you can run the sharded MSA search while not setting the `--domZ`\nvalue – you would have to modify the code to do it. We added support for\nsearching against sharded databases in AlphaFold 3 in\nhttps://github.com/google-deepmind/alphafold3/commit/805adc3863841d83d631ccd18136ad58ce3ecb34\nand the way to run AlphaFold 3 with sharded databases is documented in\nhttps://github.com/google-deepmind/alphafold3/blob/main/docs/performance.md#sharded-genetic-databases.\nIt can provide 10–30× speedup (potentially even more, depending on hardware) of\nthe genetic search.\n\nIn general, we recommend experimenting with MSA if you are seeing a prediction\nwith low predicted confidence. Typically adding more *relevant* sequences in the\nMSA will increase AlphaFold prediction accuracy and model confidence scores.\n"
  },
  {
    "path": "docs/metadata_antibody_antigen.csv",
    "content": "pdb_id,chain_id_1,chain_id_2,cluster_key_chain_1,cluster_key_chain_2,interface_cluster_key\n7fci,A,B,5581,5964,5581|5964\n7fci,A,C,5581,17640,17640|5581\n7mnl,A,C,8677,17640,17640|8677\n7n0a,A,B,33602,5964,33602|5964\n7n0a,A,C,33602,17640,17640|33602\n7ox1,A,G,17640,41184,17640|41184\n7ox1,B,G,5964,41184,41184|5964\n7ox2,A,C,17640,41184,17640|41184\n7ox2,B,C,5964,41184,41184|5964\n7ox3,A,C,5964,41184,41184|5964\n7ox3,B,C,17640,41184,17640|41184\n7ox4,A,C,17640,41184,17640|41184\n7ox4,B,C,5964,41184,41184|5964\n7q6c,A,B,15496,17640,15496|17640\n7q6c,A,D,15496,5964,15496|5964\n7r58,A,B,30790,17640,17640|30790\n7r58,A,C,30790,5964,30790|5964\n7ru6,A,B,7068,17640,17640|7068\n7sbd,A,C,17640,20692,17640|20692\n7sbd,B,C,5964,20692,20692|5964\n7sbg,A,C,17640,20692,17640|20692\n7sbg,B,C,5964,20692,20692|5964\n7sjo,A,F,7390,17640,17640|7390\n7sjo,A,I,7390,5964,5964|7390\n7sjo,B,G,7390,17640,17640|7390\n7sjo,B,H,7390,5964,5964|7390\n7sjo,C,D,7390,17640,17640|7390\n7sjo,C,E,7390,5964,5964|7390\n7sk3,A,C,45640,5964,45640|5964\n7sk3,A,D,45640,17640,17640|45640\n7sk3,A,E,45640,5964,45640|5964\n7sk3,A,F,45640,17640,17640|45640\n7sk4,A,C,45640,5964,45640|5964\n7sk4,A,D,45640,17640,17640|45640\n7sk4,A,E,45640,5964,45640|5964\n7sk4,A,F,45640,17640,17640|45640\n7sk5,A,B,45640,17640,17640|45640\n7sk5,A,D,45640,5964,45640|5964\n7sk6,A,C,45640,5964,45640|5964\n7sk6,A,D,45640,17640,17640|45640\n7sk7,A,C,45640,5964,45640|5964\n7sk7,A,D,45640,17640,17640|45640\n7sk8,A,C,45640,5964,45640|5964\n7sk8,A,D,45640,17640,17640|45640\n7sk8,A,E,45640,5964,45640|5964\n7sk8,A,F,45640,17640,17640|45640\n7sk9,A,B,45640,17640,17640|45640\n7sk9,A,C,45640,5964,45640|5964\n7st8,A,C,17640,41188,17640|41188\n7st8,B,C,5964,41188,41188|5964\n7t6x,E,H,5964,24273,24273|5964\n7t82,A,C,9703,5964,5964|9703\n7t82,A,D,9703,17640,17640|9703\n7t9m,A,C,17640,13210,13210|17640\n7t9m,B,C,5964,13210,13210|5964\n7t9n,A,D,5964,13210,13210|5964\n7t9n,B,D,17640,13210,13210|17640\n7tuf,A,B,22549,17640,17640|22549\n
7tuf,A,C,22549,5964,22549|5964\n7tuf,A,E,22549,17640,17640|22549\n7tuf,B,D,17640,22549,17640|22549\n7tuf,D,E,22549,17640,17640|22549\n7tuf,D,F,22549,5964,22549|5964\n7tug,A,B,22549,17640,17640|22549\n7tug,A,C,22549,5964,22549|5964\n7u8c,A,B,20081,17640,17640|20081\n7u8c,A,C,20081,5964,20081|5964\n7u8g,A,C,29632,17640,17640|29632\n7u8g,A,D,29632,5964,29632|5964\n7uih,A,B,11223,5964,11223|5964\n7uih,A,C,11223,17640,11223|17640\n7uih,A,D,11223,5964,11223|5964\n7uih,A,E,11223,17640,11223|17640\n7um3,A,E,17640,33649,17640|33649\n7um3,B,E,5964,33649,33649|5964\n7ura,A,B,44530,5964,44530|5964\n7ura,A,C,44530,17640,17640|44530\n7urc,A,B,44530,5964,44530|5964\n7urc,A,C,44530,17640,17640|44530\n7urd,A,C,44530,5964,44530|5964\n7urd,A,D,44530,17640,17640|44530\n7ure,A,B,44530,5964,44530|5964\n7ure,A,C,44530,17640,17640|44530\n7uvf,A,C,23558,17640,17640|23558\n7uvf,A,D,23558,5964,23558|5964\n7uvf,B,E,23558,5964,23558|5964\n7uvf,B,F,23558,17640,17640|23558\n7vad,A,B,5581,17640,17640|5581\n7vad,A,C,5581,5964,5581|5964\n7vae,A,B,5581,17640,17640|5581\n7vae,A,C,5581,5964,5581|5964\n7vaf,A,C,17640,5581,17640|5581\n7vaf,B,C,5964,5581,5581|5964\n7vag,A,B,5581,17640,17640|5581\n7vag,A,C,5581,5964,5581|5964\n7vgr,A,E,5964,33673,33673|5964\n7vgr,A,F,5964,33673,33673|5964\n7vgr,B,E,17640,33673,17640|33673\n7vgr,B,F,17640,33673,17640|33673\n7vgr,C,E,5964,33673,33673|5964\n7vgr,C,F,5964,33673,33673|5964\n7vgr,D,E,17640,33673,17640|33673\n7vgr,D,F,17640,33673,17640|33673\n7vgs,A,B,33673,5964,33673|5964\n7vgs,A,C,33673,17640,17640|33673\n7vgs,A,E,33673,5964,33673|5964\n7vgs,B,D,5964,33673,33673|5964\n7vgs,D,E,33673,5964,33673|5964\n7vgs,D,F,33673,17640,17640|33673\n7vn9,A,C,17640,20046,17640|20046\n7vn9,B,C,5964,20046,20046|5964\n7vng,A,B,20046,17640,17640|20046\n7vng,A,C,20046,5964,20046|5964\n7w71,A,E,24335,17640,17640|24335\n7w71,A,F,24335,5964,24335|5964\n7wsi,A,B,5581,17640,17640|5581\n7wsi,A,C,5581,5964,5581|5964\n7xq8,A,B,26372,5964,26372|5964\n7xq8,C,D,26372,5964,26372|5964\n7zlg,A,D,1
7640,29547,17640|29547\n7zlg,C,D,5964,29547,29547|5964\n7zlh,A,D,17640,29547,17640|29547\n7zlh,C,D,5964,29547,29547|5964\n7zli,A,D,17640,29547,17640|29547\n7zli,C,D,5964,29547,29547|5964\n7zlj,A,D,17640,29547,17640|29547\n7zlj,C,D,5964,29547,29547|5964\n7zwi,A,C,7003,5964,5964|7003\n7zxf,A,C,7003,5964,5964|7003\n7zxf,A,E,7003,5964,5964|7003\n7zxg,A,C,7003,5964,5964|7003\n7zxk,A,F,26707,5964,26707|5964\n7zxk,A,G,26707,17640,17640|26707\n7zyi,A,B,5581,17640,17640|5581\n7zyi,A,C,5581,5964,5581|5964\n8cz5,A,B,24059,17640,17640|24059\n8cz5,A,C,24059,5964,24059|5964\n8dcy,A,C,17640,23342,17640|23342\n8dcy,B,C,5964,23342,23342|5964\n8ddk,A,C,17640,23342,17640|23342\n8ddk,B,C,5964,23342,23342|5964\n8djk,A,E,15456,17640,15456|17640\n8djk,B,D,15455,5964,15455|5964\n8djk,B,E,15455,17640,15455|17640\n8djm,A,E,15456,17640,15456|17640\n8djm,B,D,15455,5964,15455|5964\n8djm,B,E,15455,17640,15455|17640\n8dke,A,B,13979,17640,13979|17640\n8dke,A,C,13979,5964,13979|5964\n8dki,A,B,13979,17640,13979|17640\n8dki,A,C,13979,5964,13979|5964\n8dkm,A,C,17640,13979,13979|17640\n8dkm,B,C,5964,13979,13979|5964\n8dkw,A,C,17640,13979,13979|17640\n8dkw,B,C,5964,13979,13979|5964\n8dkx,A,C,17640,13979,13979|17640\n8dkx,B,C,5964,13979,13979|5964\n8hii,A,B,21158,17640,17640|21158\n8hii,A,D,21158,5964,21158|5964\n8hij,A,B,21158,17640,17640|21158\n8hij,A,D,21158,5964,21158|5964\n8hik,A,B,21158,17640,17640|21158\n8hik,A,D,21158,5964,21158|5964\n7so7,A,F,3006,5964,3006|5964\n7xy8,A,C,2517,17640,17640|2517\n7xy8,A,E,2517,5964,2517|5964"
  },
  {
    "path": "docs/metadata_antibody_antigen.md",
    "content": "# Metadata for Antibody-Antigen pairs used to create figure 5a\n\nFigure 5a in the AlphaFold 3 paper was created using 71 antibody–antigen\ncomplexes, containing 166 antibody–antigen interfaces spanning 65 interface\nclusters. Scores were averaged within each interface cluster then across\nclusters. Note that the first bioassembly is used in all cases.\n\nWe provide metadata for these complexes and the associated clusters in this CSV\nfile:\n\nhttps://github.com/google-deepmind/alphafold3/blob/main/docs/metadata_antibody_antigen.csv\n"
  },
  {
    "path": "docs/model_parameters.md",
    "content": "# Model Parameters\n\nAlphaFold 3 layer names, shapes, and dtypes are documented in the table below.\nThis can be used for example to generate random parameters for AlphaFold 3\nperformance optimisation on new accelerators without having to obtain the\nofficial parameters. It is important to not generate zero-only parameters for\nperformance optimisations as accelerators often have shortcuts for zero-only\narguments (e.g. `0 * tensor` can be optimised to a no-op).\n\nProducing random parameters could be done similarly to the following snippet:\n\n```py\nfrom alphafold3.model import params\nimport numpy as np\nimport zstandard\n\nparameters = ...  # Data from the parameters schema.\n\nwith zstandard.open('random_weights.bin.zst', 'wb') as compressed:\n  for scope_name, shape, dtype in parameters:\n    if scope_name == '__meta__:__identifier__':\n      # The identifier can be all zeros.\n      arr = np.zeros(shape=shape, dtype=dtype)\n    else:\n      # Do not use all-zero params, instead sample uniformly between -1 and 1.\n      arr = np.random.uniform(low=-1, high=1, size=shape).astype(dtype)\n    scope_name = scope_name.split(':')\n    compressed.write(params.encode_record(*scope_name, arr))\n```\n\n## Parameters Schema\n\n```\nname=__meta__:__identifier__                                                                                                                                                             dtype=uint8     shape=(64,)\nname=diffuser/~/diffusion_head/diffusion_atom_features_layer_norm:scale                                                                                                                  dtype=float32   shape=(128,)\nname=diffuser/~/diffusion_head/diffusion_atom_features_to_position_update:weights                                                                                                        dtype=float32   shape=(128, 3)\nname=diffuser/~/diffusion_head/diffusion_atom_positions_to_features:weights              
                                                                                                dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderadaptive_zero_cond:bias                                 dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderadaptive_zero_cond:weights                              dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderffw_adaptive_zero_cond:bias                             dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderffw_adaptive_zero_cond:weights                          dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderffw_single_cond_bias:weights                            dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderffw_single_cond_layer_norm:scale                        dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderffw_single_cond_scale:bias                              dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderffw_single_cond_scale:weights                           dtype=float32   shape=(3, 128, 
128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderffw_transition1:weights                                 dtype=float32   shape=(3, 128, 512)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderffw_transition2:weights                                 dtype=float32   shape=(3, 256, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decodergating_query:weights                                    dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderk_projection:weights                                    dtype=float32   shape=(3, 128, 4, 32)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderksingle_cond_bias:weights                               dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderksingle_cond_layer_norm:scale                           dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderksingle_cond_scale:bias                                 dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderksingle_cond_scale:weights                              dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderq_projection:bias                                       dtype=float32   shape=(3, 4, 
32)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderq_projection:weights                                    dtype=float32   shape=(3, 128, 4, 32)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderqsingle_cond_bias:weights                               dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderqsingle_cond_layer_norm:scale                           dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderqsingle_cond_scale:bias                                 dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderqsingle_cond_scale:weights                              dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decodertransition2:weights                                     dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/__layer_stack_with_per_layer/diffusion_atom_transformer_decoderv_projection:weights                                    dtype=float32   shape=(3, 128, 4, 32)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/pair_input_layer_norm:scale                                                                                            dtype=float32   shape=(16,)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_decoder/pair_logits_projection:weights                                                                                         dtype=float32   shape=(16, 3, 
4)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderadaptive_zero_cond:bias                                 dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderadaptive_zero_cond:weights                              dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderffw_adaptive_zero_cond:bias                             dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderffw_adaptive_zero_cond:weights                          dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderffw_single_cond_bias:weights                            dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderffw_single_cond_layer_norm:scale                        dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderffw_single_cond_scale:bias                              dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderffw_single_cond_scale:weights                           dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderffw_transition1:weights                                 dtype=float32   shape=(3, 128, 
512)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderffw_transition2:weights                                 dtype=float32   shape=(3, 256, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encodergating_query:weights                                    dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderk_projection:weights                                    dtype=float32   shape=(3, 128, 4, 32)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderksingle_cond_bias:weights                               dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderksingle_cond_layer_norm:scale                           dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderksingle_cond_scale:bias                                 dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderksingle_cond_scale:weights                              dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderq_projection:bias                                       dtype=float32   shape=(3, 4, 32)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderq_projection:weights                                    dtype=float32   shape=(3, 128, 4, 
32)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderqsingle_cond_bias:weights                               dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderqsingle_cond_layer_norm:scale                           dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderqsingle_cond_scale:bias                                 dtype=float32   shape=(3, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderqsingle_cond_scale:weights                              dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encodertransition2:weights                                     dtype=float32   shape=(3, 128, 128)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/__layer_stack_with_per_layer/diffusion_atom_transformer_encoderv_projection:weights                                    dtype=float32   shape=(3, 128, 4, 32)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/pair_input_layer_norm:scale                                                                                            dtype=float32   shape=(16,)\nname=diffuser/~/diffusion_head/diffusion_atom_transformer_encoder/pair_logits_projection:weights                                                                                         dtype=float32   shape=(16, 3, 4)\nname=diffuser/~/diffusion_head/diffusion_embed_pair_distances_1:weights                                                                                                                  dtype=float32   shape=(1, 
16)\nname=diffuser/~/diffusion_head/diffusion_embed_pair_distances:weights                                                                                                                    dtype=float32   shape=(1, 16)\nname=diffuser/~/diffusion_head/diffusion_embed_pair_offsets_1:weights                                                                                                                    dtype=float32   shape=(3, 16)\nname=diffuser/~/diffusion_head/diffusion_embed_pair_offsets_valid:weights                                                                                                                dtype=float32   shape=(1, 16)\nname=diffuser/~/diffusion_head/diffusion_embed_pair_offsets:weights                                                                                                                      dtype=float32   shape=(3, 16)\nname=diffuser/~/diffusion_head/diffusion_embed_ref_atom_name:weights                                                                                                                     dtype=float32   shape=(256, 128)\nname=diffuser/~/diffusion_head/diffusion_embed_ref_charge:weights                                                                                                                        dtype=float32   shape=(1, 128)\nname=diffuser/~/diffusion_head/diffusion_embed_ref_element:weights                                                                                                                       dtype=float32   shape=(128, 128)\nname=diffuser/~/diffusion_head/diffusion_embed_ref_mask:weights                                                                                                                          dtype=float32   shape=(1, 128)\nname=diffuser/~/diffusion_head/diffusion_embed_ref_pos:weights                                                                                                                           dtype=float32   shape=(3, 
128)\nname=diffuser/~/diffusion_head/diffusion_embed_trunk_pair_cond:weights                                                                                                                   dtype=float32   shape=(128, 16)\nname=diffuser/~/diffusion_head/diffusion_embed_trunk_single_cond:weights                                                                                                                 dtype=float32   shape=(384, 128)\nname=diffuser/~/diffusion_head/diffusion_lnorm_trunk_pair_cond:scale                                                                                                                     dtype=float32   shape=(128,)\nname=diffuser/~/diffusion_head/diffusion_lnorm_trunk_single_cond:scale                                                                                                                   dtype=float32   shape=(384,)\nname=diffuser/~/diffusion_head/diffusion_pair_mlp_1:weights                                                                                                                              dtype=float32   shape=(16, 16)\nname=diffuser/~/diffusion_head/diffusion_pair_mlp_2:weights                                                                                                                              dtype=float32   shape=(16, 16)\nname=diffuser/~/diffusion_head/diffusion_pair_mlp_3:weights                                                                                                                              dtype=float32   shape=(16, 16)\nname=diffuser/~/diffusion_head/diffusion_project_atom_features_for_aggr:weights                                                                                                          dtype=float32   shape=(128, 768)\nname=diffuser/~/diffusion_head/diffusion_project_token_features_for_broadcast:weights                                                                                                    dtype=float32   shape=(768, 
128)\nname=diffuser/~/diffusion_head/diffusion_single_to_pair_cond_col_1:weights                                                                                                               dtype=float32   shape=(128, 16)\nname=diffuser/~/diffusion_head/diffusion_single_to_pair_cond_col:weights                                                                                                                 dtype=float32   shape=(128, 16)\nname=diffuser/~/diffusion_head/diffusion_single_to_pair_cond_row_1:weights                                                                                                               dtype=float32   shape=(128, 16)\nname=diffuser/~/diffusion_head/diffusion_single_to_pair_cond_row:weights                                                                                                                 dtype=float32   shape=(128, 16)\nname=diffuser/~/diffusion_head/noise_embedding_initial_norm:scale                                                                                                                        dtype=float32   shape=(256,)\nname=diffuser/~/diffusion_head/noise_embedding_initial_projection:weights                                                                                                                dtype=float32   shape=(256, 384)\nname=diffuser/~/diffusion_head/output_norm:scale                                                                                                                                         dtype=float32   shape=(768,)\nname=diffuser/~/diffusion_head/pair_cond_initial_norm:scale                                                                                                                              dtype=float32   shape=(267,)\nname=diffuser/~/diffusion_head/pair_cond_initial_projection:weights                                                                                                                      dtype=float32   shape=(267, 
128)\nname=diffuser/~/diffusion_head/pair_transition_0ffw_layer_norm:offset                                                                                                                    dtype=float32   shape=(128,)\nname=diffuser/~/diffusion_head/pair_transition_0ffw_layer_norm:scale                                                                                                                     dtype=float32   shape=(128,)\nname=diffuser/~/diffusion_head/pair_transition_0ffw_transition1:weights                                                                                                                  dtype=float32   shape=(128, 512)\nname=diffuser/~/diffusion_head/pair_transition_0ffw_transition2:weights                                                                                                                  dtype=float32   shape=(256, 128)\nname=diffuser/~/diffusion_head/pair_transition_1ffw_layer_norm:offset                                                                                                                    dtype=float32   shape=(128,)\nname=diffuser/~/diffusion_head/pair_transition_1ffw_layer_norm:scale                                                                                                                     dtype=float32   shape=(128,)\nname=diffuser/~/diffusion_head/pair_transition_1ffw_transition1:weights                                                                                                                  dtype=float32   shape=(128, 512)\nname=diffuser/~/diffusion_head/pair_transition_1ffw_transition2:weights                                                                                                                  dtype=float32   shape=(256, 128)\nname=diffuser/~/diffusion_head/single_cond_embedding_norm:scale                                                                                                                          dtype=float32   
shape=(384,)\nname=diffuser/~/diffusion_head/single_cond_embedding_projection:weights                                                                                                                  dtype=float32   shape=(384, 768)\nname=diffuser/~/diffusion_head/single_cond_initial_norm:scale                                                                                                                            dtype=float32   shape=(831,)\nname=diffuser/~/diffusion_head/single_cond_initial_projection:weights                                                                                                                    dtype=float32   shape=(831, 384)\nname=diffuser/~/diffusion_head/single_transition_0ffw_layer_norm:offset                                                                                                                  dtype=float32   shape=(384,)\nname=diffuser/~/diffusion_head/single_transition_0ffw_layer_norm:scale                                                                                                                   dtype=float32   shape=(384,)\nname=diffuser/~/diffusion_head/single_transition_0ffw_transition1:weights                                                                                                                dtype=float32   shape=(384, 1536)\nname=diffuser/~/diffusion_head/single_transition_0ffw_transition2:weights                                                                                                                dtype=float32   shape=(768, 384)\nname=diffuser/~/diffusion_head/single_transition_1ffw_layer_norm:offset                                                                                                                  dtype=float32   shape=(384,)\nname=diffuser/~/diffusion_head/single_transition_1ffw_layer_norm:scale                                                                                                                   dtype=float32   
shape=(384,)\nname=diffuser/~/diffusion_head/single_transition_1ffw_transition1:weights                                                                                                                dtype=float32   shape=(384, 1536)\nname=diffuser/~/diffusion_head/single_transition_1ffw_transition2:weights                                                                                                                dtype=float32   shape=(768, 384)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformeradaptive_zero_cond:bias                                                  dtype=float32   shape=(6, 4, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformeradaptive_zero_cond:weights                                               dtype=float32   shape=(6, 4, 384, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerffw_adaptive_zero_cond:bias                                              dtype=float32   shape=(6, 4, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerffw_adaptive_zero_cond:weights                                           dtype=float32   shape=(6, 4, 384, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerffw_single_cond_bias:weights                                             dtype=float32   shape=(6, 4, 384, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerffw_single_cond_layer_norm:scale                                         dtype=float32   shape=(6, 4, 384)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerffw_single_cond_scale:bias                                               dtype=float32   shape=(6, 
4, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerffw_single_cond_scale:weights                                            dtype=float32   shape=(6, 4, 384, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerffw_transition1:weights                                                  dtype=float32   shape=(6, 4, 768, 3072)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerffw_transition2:weights                                                  dtype=float32   shape=(6, 4, 1536, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformergating_query:weights                                                     dtype=float32   shape=(6, 4, 768, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerk_projection:weights                                                     dtype=float32   shape=(6, 4, 768, 16, 48)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerq_projection:bias                                                        dtype=float32   shape=(6, 4, 16, 48)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerq_projection:weights                                                     dtype=float32   shape=(6, 4, 768, 16, 48)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformersingle_cond_bias:weights                                                 dtype=float32   shape=(6, 4, 384, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformersingle_cond_layer_norm:scale                                             
dtype=float32   shape=(6, 4, 384)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformersingle_cond_scale:bias                                                   dtype=float32   shape=(6, 4, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformersingle_cond_scale:weights                                                dtype=float32   shape=(6, 4, 384, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformertransition2:weights                                                      dtype=float32   shape=(6, 4, 768, 768)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/__layer_stack_with_per_layer/transformerv_projection:weights                                                     dtype=float32   shape=(6, 4, 768, 16, 48)\nname=diffuser/~/diffusion_head/transformer/__layer_stack_with_per_layer/pair_logits_projection:weights                                                                                   dtype=float32   shape=(6, 128, 4, 16)\nname=diffuser/~/diffusion_head/transformer/pair_input_layer_norm:scale                                                                                                                   dtype=float32   shape=(128,)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention1/act_norm:offset                                                                           dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention1/act_norm:scale                                                                            dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention1/gating_query:weights                                                                      
dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention1/k_projection:weights                                                                      dtype=bfloat16  shape=(4, 4, 32, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention1/output_projection:weights                                                                 dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention1/pair_bias_projection:weights                                                              dtype=bfloat16  shape=(4, 128, 4)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention1/q_projection:weights                                                                      dtype=bfloat16  shape=(4, 4, 32, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention1/v_projection:weights                                                                      dtype=bfloat16  shape=(4, 128, 4, 32)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention2/act_norm:offset                                                                           dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention2/act_norm:scale                                                                            dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention2/gating_query:weights                                                                      dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention2/k_projection:weights                                                                      
dtype=bfloat16  shape=(4, 4, 32, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention2/output_projection:weights                                                                 dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention2/pair_bias_projection:weights                                                              dtype=bfloat16  shape=(4, 128, 4)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention2/q_projection:weights                                                                      dtype=bfloat16  shape=(4, 4, 32, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_attention2/v_projection:weights                                                                      dtype=bfloat16  shape=(4, 128, 4, 32)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_transition/input_layer_norm:offset                                                                   dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_transition/input_layer_norm:scale                                                                    dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_transition/transition1:weights                                                                       dtype=bfloat16  shape=(4, 128, 1024)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/pair_transition/transition2:weights                                                                       dtype=bfloat16  shape=(4, 512, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_attention_gating_query:weights                                                                     
dtype=bfloat16  shape=(4, 384, 384)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_attention_k_projection:weights                                                                     dtype=bfloat16  shape=(4, 384, 16, 24)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_attention_layer_norm:offset                                                                        dtype=float32   shape=(4, 384)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_attention_layer_norm:scale                                                                         dtype=float32   shape=(4, 384)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_attention_q_projection:bias                                                                        dtype=bfloat16  shape=(4, 16, 24)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_attention_q_projection:weights                                                                     dtype=bfloat16  shape=(4, 384, 16, 24)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_attention_transition2:weights                                                                      dtype=bfloat16  shape=(4, 384, 384)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_attention_v_projection:weights                                                                     dtype=bfloat16  shape=(4, 384, 16, 24)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_pair_logits_norm:offset                                                                            dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_pair_logits_norm:scale                                                                             
dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_pair_logits_projection:weights                                                                     dtype=bfloat16  shape=(4, 128, 16)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_transition/input_layer_norm:offset                                                                 dtype=float32   shape=(4, 384)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_transition/input_layer_norm:scale                                                                  dtype=float32   shape=(4, 384)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_transition/transition1:weights                                                                     dtype=bfloat16  shape=(4, 384, 3072)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/single_transition/transition2:weights                                                                     dtype=bfloat16  shape=(4, 1536, 384)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_incoming/center_norm:offset                                                       dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_incoming/center_norm:scale                                                        dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_incoming/gate:weights                                                             dtype=bfloat16  shape=(4, 128, 256)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_incoming/gating_linear:weights                                                    dtype=bfloat16  shape=(4, 
128, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_incoming/left_norm_input:offset                                                   dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_incoming/left_norm_input:scale                                                    dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_incoming/output_projection:weights                                                dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_incoming/projection:weights                                                       dtype=bfloat16  shape=(4, 128, 256)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_outgoing/center_norm:offset                                                       dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_outgoing/center_norm:scale                                                        dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_outgoing/gate:weights                                                             dtype=bfloat16  shape=(4, 128, 256)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_outgoing/gating_linear:weights                                                    dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_outgoing/left_norm_input:offset                                                   dtype=float32   shape=(4, 
128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_outgoing/left_norm_input:scale                                                    dtype=float32   shape=(4, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_outgoing/output_projection:weights                                                dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/confidence_head/__layer_stack_no_per_layer/confidence_pairformer/triangle_multiplication_outgoing/projection:weights                                                       dtype=bfloat16  shape=(4, 128, 256)\nname=diffuser/confidence_head/~_embed_features/distogram_feat_project:weights                                                                                                            dtype=bfloat16  shape=(39, 128)\nname=diffuser/confidence_head/~_embed_features/left_target_feat_project:weights                                                                                                          dtype=bfloat16  shape=(447, 128)\nname=diffuser/confidence_head/~_embed_features/right_target_feat_project:weights                                                                                                         dtype=bfloat16  shape=(447, 128)\nname=diffuser/confidence_head/experimentally_resolved_ln:offset                                                                                                                          dtype=float32   shape=(384,)\nname=diffuser/confidence_head/experimentally_resolved_ln:scale                                                                                                                           dtype=float32   shape=(384,)\nname=diffuser/confidence_head/experimentally_resolved_logits:weights                                                                                                                     dtype=float32   shape=(384, 24, 
2)\nname=diffuser/confidence_head/left_half_distance_logits:weights                                                                                                                          dtype=float32   shape=(128, 64)\nname=diffuser/confidence_head/logits_ln:offset                                                                                                                                           dtype=float32   shape=(128,)\nname=diffuser/confidence_head/logits_ln:scale                                                                                                                                            dtype=float32   shape=(128,)\nname=diffuser/confidence_head/pae_logits_ln:offset                                                                                                                                       dtype=float32   shape=(128,)\nname=diffuser/confidence_head/pae_logits_ln:scale                                                                                                                                        dtype=float32   shape=(128,)\nname=diffuser/confidence_head/pae_logits:weights                                                                                                                                         dtype=float32   shape=(128, 64)\nname=diffuser/confidence_head/plddt_logits_ln:offset                                                                                                                                     dtype=float32   shape=(384,)\nname=diffuser/confidence_head/plddt_logits_ln:scale                                                                                                                                      dtype=float32   shape=(384,)\nname=diffuser/confidence_head/plddt_logits:weights                                                                                                                                       dtype=float32   shape=(384, 24, 
50)\nname=diffuser/distogram_head/half_logits:weights                                                                                                                                         dtype=float32   shape=(128, 64)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderadaptive_zero_cond:bias                        dtype=float32   shape=(3, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderadaptive_zero_cond:weights                     dtype=float32   shape=(3, 128, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderffw_adaptive_zero_cond:bias                    dtype=float32   shape=(3, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderffw_adaptive_zero_cond:weights                 dtype=float32   shape=(3, 128, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderffw_single_cond_bias:weights                   dtype=float32   shape=(3, 128, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderffw_single_cond_layer_norm:scale               dtype=float32   shape=(3, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderffw_single_cond_scale:bias                     dtype=float32   shape=(3, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderffw_single_cond_scale:weights                  dtype=float32   shape=(3, 128, 
128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderffw_transition1:weights                        dtype=float32   shape=(3, 128, 512)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderffw_transition2:weights                        dtype=float32   shape=(3, 256, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encodergating_query:weights                           dtype=float32   shape=(3, 128, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderk_projection:weights                           dtype=float32   shape=(3, 128, 4, 32)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderksingle_cond_bias:weights                      dtype=float32   shape=(3, 128, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderksingle_cond_layer_norm:scale                  dtype=float32   shape=(3, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderksingle_cond_scale:bias                        dtype=float32   shape=(3, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderksingle_cond_scale:weights                     dtype=float32   shape=(3, 128, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderq_projection:bias                              dtype=float32   shape=(3, 4, 
32)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderq_projection:weights                           dtype=float32   shape=(3, 128, 4, 32)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderqsingle_cond_bias:weights                      dtype=float32   shape=(3, 128, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderqsingle_cond_layer_norm:scale                  dtype=float32   shape=(3, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderqsingle_cond_scale:bias                        dtype=float32   shape=(3, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderqsingle_cond_scale:weights                     dtype=float32   shape=(3, 128, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encodertransition2:weights                            dtype=float32   shape=(3, 128, 128)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/__layer_stack_with_per_layer/evoformer_conditioning_atom_transformer_encoderv_projection:weights                           dtype=float32   shape=(3, 128, 4, 32)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/pair_input_layer_norm:scale                                                                                                dtype=float32   shape=(16,)\nname=diffuser/evoformer_conditioning_atom_transformer_encoder/pair_logits_projection:weights                                                                                             dtype=float32   shape=(16, 3, 
4)\nname=diffuser/evoformer_conditioning_embed_pair_distances_1:weights                                                                                                                      dtype=float32   shape=(1, 16)\nname=diffuser/evoformer_conditioning_embed_pair_distances:weights                                                                                                                        dtype=float32   shape=(1, 16)\nname=diffuser/evoformer_conditioning_embed_pair_offsets_1:weights                                                                                                                        dtype=float32   shape=(3, 16)\nname=diffuser/evoformer_conditioning_embed_pair_offsets_valid:weights                                                                                                                    dtype=float32   shape=(1, 16)\nname=diffuser/evoformer_conditioning_embed_pair_offsets:weights                                                                                                                          dtype=float32   shape=(3, 16)\nname=diffuser/evoformer_conditioning_embed_ref_atom_name:weights                                                                                                                         dtype=float32   shape=(256, 128)\nname=diffuser/evoformer_conditioning_embed_ref_charge:weights                                                                                                                            dtype=float32   shape=(1, 128)\nname=diffuser/evoformer_conditioning_embed_ref_element:weights                                                                                                                           dtype=float32   shape=(128, 128)\nname=diffuser/evoformer_conditioning_embed_ref_mask:weights                                                                                                                              dtype=float32   shape=(1, 
128)\nname=diffuser/evoformer_conditioning_embed_ref_pos:weights                                                                                                                               dtype=float32   shape=(3, 128)\nname=diffuser/evoformer_conditioning_pair_mlp_1:weights                                                                                                                                  dtype=float32   shape=(16, 16)\nname=diffuser/evoformer_conditioning_pair_mlp_2:weights                                                                                                                                  dtype=float32   shape=(16, 16)\nname=diffuser/evoformer_conditioning_pair_mlp_3:weights                                                                                                                                  dtype=float32   shape=(16, 16)\nname=diffuser/evoformer_conditioning_project_atom_features_for_aggr:weights                                                                                                              dtype=float32   shape=(128, 384)\nname=diffuser/evoformer_conditioning_single_to_pair_cond_col_1:weights                                                                                                                   dtype=float32   shape=(128, 16)\nname=diffuser/evoformer_conditioning_single_to_pair_cond_col:weights                                                                                                                     dtype=float32   shape=(128, 16)\nname=diffuser/evoformer_conditioning_single_to_pair_cond_row_1:weights                                                                                                                   dtype=float32   shape=(128, 16)\nname=diffuser/evoformer_conditioning_single_to_pair_cond_row:weights                                                                                                                     dtype=float32   shape=(128, 
16)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention1/act_norm:offset                                                                                    dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention1/act_norm:scale                                                                                     dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention1/gating_query:weights                                                                               dtype=bfloat16  shape=(48, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention1/k_projection:weights                                                                               dtype=bfloat16  shape=(48, 4, 32, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention1/output_projection:weights                                                                          dtype=bfloat16  shape=(48, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention1/pair_bias_projection:weights                                                                       dtype=bfloat16  shape=(48, 128, 4)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention1/q_projection:weights                                                                               dtype=bfloat16  shape=(48, 4, 32, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention1/v_projection:weights                                                                               dtype=bfloat16  shape=(48, 128, 4, 32)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention2/act_norm:offset                                                                                    dtype=float32   shape=(48, 
128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention2/act_norm:scale                                                                                     dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention2/gating_query:weights                                                                               dtype=bfloat16  shape=(48, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention2/k_projection:weights                                                                               dtype=bfloat16  shape=(48, 4, 32, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention2/output_projection:weights                                                                          dtype=bfloat16  shape=(48, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention2/pair_bias_projection:weights                                                                       dtype=bfloat16  shape=(48, 128, 4)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention2/q_projection:weights                                                                               dtype=bfloat16  shape=(48, 4, 32, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_attention2/v_projection:weights                                                                               dtype=bfloat16  shape=(48, 128, 4, 32)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_transition/input_layer_norm:offset                                                                            dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_transition/input_layer_norm:scale                                                                             dtype=float32   shape=(48, 
128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_transition/transition1:weights                                                                                dtype=bfloat16  shape=(48, 128, 1024)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/pair_transition/transition2:weights                                                                                dtype=bfloat16  shape=(48, 512, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_attention_gating_query:weights                                                                              dtype=bfloat16  shape=(48, 384, 384)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_attention_k_projection:weights                                                                              dtype=bfloat16  shape=(48, 384, 16, 24)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_attention_layer_norm:offset                                                                                 dtype=float32   shape=(48, 384)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_attention_layer_norm:scale                                                                                  dtype=float32   shape=(48, 384)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_attention_q_projection:bias                                                                                 dtype=bfloat16  shape=(48, 16, 24)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_attention_q_projection:weights                                                                              dtype=bfloat16  shape=(48, 384, 16, 24)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_attention_transition2:weights                                                                               dtype=bfloat16  shape=(48, 
384, 384)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_attention_v_projection:weights                                                                              dtype=bfloat16  shape=(48, 384, 16, 24)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_pair_logits_norm:offset                                                                                     dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_pair_logits_norm:scale                                                                                      dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_pair_logits_projection:weights                                                                              dtype=bfloat16  shape=(48, 128, 16)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_transition/input_layer_norm:offset                                                                          dtype=float32   shape=(48, 384)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_transition/input_layer_norm:scale                                                                           dtype=float32   shape=(48, 384)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_transition/transition1:weights                                                                              dtype=bfloat16  shape=(48, 384, 3072)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/single_transition/transition2:weights                                                                              dtype=bfloat16  shape=(48, 1536, 384)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_incoming/center_norm:offset                                                                dtype=float32   shape=(48, 
128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_incoming/center_norm:scale                                                                 dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_incoming/gate:weights                                                                      dtype=bfloat16  shape=(48, 128, 256)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_incoming/gating_linear:weights                                                             dtype=bfloat16  shape=(48, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_incoming/left_norm_input:offset                                                            dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_incoming/left_norm_input:scale                                                             dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_incoming/output_projection:weights                                                         dtype=bfloat16  shape=(48, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_incoming/projection:weights                                                                dtype=bfloat16  shape=(48, 128, 256)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_outgoing/center_norm:offset                                                                dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_outgoing/center_norm:scale                                                                 dtype=float32   shape=(48, 
128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_outgoing/gate:weights                                                                      dtype=bfloat16  shape=(48, 128, 256)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_outgoing/gating_linear:weights                                                             dtype=bfloat16  shape=(48, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_outgoing/left_norm_input:offset                                                            dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_outgoing/left_norm_input:scale                                                             dtype=float32   shape=(48, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_outgoing/output_projection:weights                                                         dtype=bfloat16  shape=(48, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer_1/trunk_pairformer/triangle_multiplication_outgoing/projection:weights                                                                dtype=bfloat16  shape=(48, 128, 256)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_attention1/act_norm:offset                                                                                              dtype=float32   shape=(4, 64)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_attention1/act_norm:scale                                                                                               dtype=float32   shape=(4, 64)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_attention1/gating_query:weights                                                                                         dtype=bfloat16  shape=(4, 64, 
64)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_attention1/output_projection:weights                                                                                    dtype=bfloat16  shape=(4, 64, 64)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_attention1/pair_logits:weights                                                                                          dtype=bfloat16  shape=(4, 128, 8)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_attention1/pair_norm:offset                                                                                             dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_attention1/pair_norm:scale                                                                                              dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_attention1/v_projection:weights                                                                                         dtype=bfloat16  shape=(4, 64, 8, 8)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_transition/input_layer_norm:offset                                                                                      dtype=float32   shape=(4, 64)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_transition/input_layer_norm:scale                                                                                       dtype=float32   shape=(4, 64)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_transition/transition1:weights                                                                                          dtype=bfloat16  shape=(4, 64, 512)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/msa_transition/transition2:weights                                                                                          dtype=bfloat16  shape=(4, 256, 
64)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/outer_product_mean:output_b                                                                                                 dtype=bfloat16  shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/outer_product_mean:output_w                                                                                                 dtype=bfloat16  shape=(4, 32, 32, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/outer_product_mean/layer_norm_input:offset                                                                                  dtype=float32   shape=(4, 64)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/outer_product_mean/layer_norm_input:scale                                                                                   dtype=float32   shape=(4, 64)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/outer_product_mean/left_projection:weights                                                                                  dtype=bfloat16  shape=(4, 64, 32)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/outer_product_mean/right_projection:weights                                                                                 dtype=bfloat16  shape=(4, 64, 32)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention1/act_norm:offset                                                                                             dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention1/act_norm:scale                                                                                              dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention1/gating_query:weights                                                                                        dtype=bfloat16  shape=(4, 128, 
128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention1/k_projection:weights                                                                                        dtype=bfloat16  shape=(4, 4, 32, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention1/output_projection:weights                                                                                   dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention1/pair_bias_projection:weights                                                                                dtype=bfloat16  shape=(4, 128, 4)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention1/q_projection:weights                                                                                        dtype=bfloat16  shape=(4, 4, 32, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention1/v_projection:weights                                                                                        dtype=bfloat16  shape=(4, 128, 4, 32)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention2/act_norm:offset                                                                                             dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention2/act_norm:scale                                                                                              dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention2/gating_query:weights                                                                                        dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention2/k_projection:weights                                                                                        dtype=bfloat16  shape=(4, 4, 32, 
128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention2/output_projection:weights                                                                                   dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention2/pair_bias_projection:weights                                                                                dtype=bfloat16  shape=(4, 128, 4)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention2/q_projection:weights                                                                                        dtype=bfloat16  shape=(4, 4, 32, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_attention2/v_projection:weights                                                                                        dtype=bfloat16  shape=(4, 128, 4, 32)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_transition/input_layer_norm:offset                                                                                     dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_transition/input_layer_norm:scale                                                                                      dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_transition/transition1:weights                                                                                         dtype=bfloat16  shape=(4, 128, 1024)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/pair_transition/transition2:weights                                                                                         dtype=bfloat16  shape=(4, 512, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_incoming/center_norm:offset                                                                         dtype=float32   shape=(4, 
128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_incoming/center_norm:scale                                                                          dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_incoming/gate:weights                                                                               dtype=bfloat16  shape=(4, 128, 256)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_incoming/gating_linear:weights                                                                      dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_incoming/left_norm_input:offset                                                                     dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_incoming/left_norm_input:scale                                                                      dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_incoming/output_projection:weights                                                                  dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_incoming/projection:weights                                                                         dtype=bfloat16  shape=(4, 128, 256)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_outgoing/center_norm:offset                                                                         dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_outgoing/center_norm:scale                                                                          dtype=float32   shape=(4, 
128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_outgoing/gate:weights                                                                               dtype=bfloat16  shape=(4, 128, 256)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_outgoing/gating_linear:weights                                                                      dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_outgoing/left_norm_input:offset                                                                     dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_outgoing/left_norm_input:scale                                                                      dtype=float32   shape=(4, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_outgoing/output_projection:weights                                                                  dtype=bfloat16  shape=(4, 128, 128)\nname=diffuser/evoformer/__layer_stack_no_per_layer/msa_stack/triangle_multiplication_outgoing/projection:weights                                                                         dtype=bfloat16  shape=(4, 128, 256)\nname=diffuser/evoformer/~_relative_encoding/position_activations:weights                                                                                                                 dtype=bfloat16  shape=(139, 128)\nname=diffuser/evoformer/bond_embedding:weights                                                                                                                                           dtype=bfloat16  shape=(1, 128)\nname=diffuser/evoformer/extra_msa_target_feat:weights                                                                                                                                    dtype=bfloat16  shape=(447, 
64)\nname=diffuser/evoformer/left_single:weights                                                                                                                                              dtype=bfloat16  shape=(447, 128)\nname=diffuser/evoformer/msa_activations:weights                                                                                                                                          dtype=bfloat16  shape=(34, 64)\nname=diffuser/evoformer/prev_embedding_layer_norm:offset                                                                                                                                 dtype=float32   shape=(128,)\nname=diffuser/evoformer/prev_embedding_layer_norm:scale                                                                                                                                  dtype=float32   shape=(128,)\nname=diffuser/evoformer/prev_embedding:weights                                                                                                                                           dtype=bfloat16  shape=(128, 128)\nname=diffuser/evoformer/prev_single_embedding_layer_norm:offset                                                                                                                          dtype=float32   shape=(384,)\nname=diffuser/evoformer/prev_single_embedding_layer_norm:scale                                                                                                                           dtype=float32   shape=(384,)\nname=diffuser/evoformer/prev_single_embedding:weights                                                                                                                                    dtype=bfloat16  shape=(384, 384)\nname=diffuser/evoformer/right_single:weights                                                                                                                                             dtype=bfloat16  shape=(447, 
128)\nname=diffuser/evoformer/single_activations:weights                                                                                                                                       dtype=bfloat16  shape=(447, 384)\nname=diffuser/evoformer/template_embedding/output_linear:weights                                                                                                                         dtype=bfloat16  shape=(64, 128)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention1/act_norm:offset                             dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention1/act_norm:scale                              dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention1/gating_query:weights                        dtype=bfloat16  shape=(2, 64, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention1/k_projection:weights                        dtype=bfloat16  shape=(2, 4, 16, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention1/output_projection:weights                   dtype=bfloat16  shape=(2, 64, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention1/pair_bias_projection:weights                dtype=bfloat16  shape=(2, 64, 4)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention1/q_projection:weights                        dtype=bfloat16  shape=(2, 4, 16, 
64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention1/v_projection:weights                        dtype=bfloat16  shape=(2, 64, 4, 16)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention2/act_norm:offset                             dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention2/act_norm:scale                              dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention2/gating_query:weights                        dtype=bfloat16  shape=(2, 64, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention2/k_projection:weights                        dtype=bfloat16  shape=(2, 4, 16, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention2/output_projection:weights                   dtype=bfloat16  shape=(2, 64, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention2/pair_bias_projection:weights                dtype=bfloat16  shape=(2, 64, 4)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention2/q_projection:weights                        dtype=bfloat16  shape=(2, 4, 16, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_attention2/v_projection:weights                        dtype=bfloat16  shape=(2, 64, 4, 
16)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_transition/input_layer_norm:offset                     dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_transition/input_layer_norm:scale                      dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_transition/transition1:weights                         dtype=bfloat16  shape=(2, 64, 256)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/pair_transition/transition2:weights                         dtype=bfloat16  shape=(2, 128, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_incoming/center_norm:offset         dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_incoming/center_norm:scale          dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_incoming/gate:weights               dtype=bfloat16  shape=(2, 64, 128)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_incoming/gating_linear:weights      dtype=bfloat16  shape=(2, 64, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_incoming/left_norm_input:offset     dtype=float32   shape=(2, 
64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_incoming/left_norm_input:scale      dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_incoming/output_projection:weights  dtype=bfloat16  shape=(2, 64, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_incoming/projection:weights         dtype=bfloat16  shape=(2, 64, 128)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_outgoing/center_norm:offset         dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_outgoing/center_norm:scale          dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_outgoing/gate:weights               dtype=bfloat16  shape=(2, 64, 128)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_outgoing/gating_linear:weights      dtype=bfloat16  shape=(2, 64, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_outgoing/left_norm_input:offset     dtype=float32   shape=(2, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_outgoing/left_norm_input:scale      dtype=float32   shape=(2, 
64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_outgoing/output_projection:weights  dtype=bfloat16  shape=(2, 64, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/__layer_stack_no_per_layer/template_embedding_iteration/triangle_multiplication_outgoing/projection:weights         dtype=bfloat16  shape=(2, 64, 128)\nname=diffuser/evoformer/template_embedding/single_template_embedding/output_layer_norm:offset                                                                                            dtype=float32   shape=(64,)\nname=diffuser/evoformer/template_embedding/single_template_embedding/output_layer_norm:scale                                                                                             dtype=float32   shape=(64,)\nname=diffuser/evoformer/template_embedding/single_template_embedding/query_embedding_norm:offset                                                                                         dtype=float32   shape=(128,)\nname=diffuser/evoformer/template_embedding/single_template_embedding/query_embedding_norm:scale                                                                                          dtype=float32   shape=(128,)\nname=diffuser/evoformer/template_embedding/single_template_embedding/template_pair_embedding_0:weights                                                                                   dtype=bfloat16  shape=(39, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/template_pair_embedding_1:weights                                                                                   dtype=bfloat16  shape=(64,)\nname=diffuser/evoformer/template_embedding/single_template_embedding/template_pair_embedding_2:weights                                                                                   dtype=bfloat16  shape=(31, 
64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/template_pair_embedding_3:weights                                                                                   dtype=bfloat16  shape=(31, 64)\nname=diffuser/evoformer/template_embedding/single_template_embedding/template_pair_embedding_4:weights                                                                                   dtype=bfloat16  shape=(64,)\nname=diffuser/evoformer/template_embedding/single_template_embedding/template_pair_embedding_5:weights                                                                                   dtype=bfloat16  shape=(64,)\nname=diffuser/evoformer/template_embedding/single_template_embedding/template_pair_embedding_6:weights                                                                                   dtype=bfloat16  shape=(64,)\nname=diffuser/evoformer/template_embedding/single_template_embedding/template_pair_embedding_7:weights                                                                                   dtype=bfloat16  shape=(64,)\nname=diffuser/evoformer/template_embedding/single_template_embedding/template_pair_embedding_8:weights                                                                                   dtype=bfloat16  shape=(128, 64)\n```\n"
  },
  {
    "path": "docs/output.md",
    "content": "# AlphaFold 3 Output\n\n## Output Directory Structure\n\nFor every input job, AlphaFold 3 writes all its outputs in a directory called by\nthe sanitized version of the job name. E.g. for job name \"My first fold (TEST)\",\nAlphaFold 3 will write its outputs in a directory called `My_first_fold_TEST`\n(the case is respected). If such directory already exists, AlphaFold 3 will\nappend a timestamp to the directory name to avoid overwriting existing data\nunless `--force_output_dir` is passed.\n\nThe following structure is used within the output directory:\n\n*   Sub-directories with results for each sample and seed. There will be\n    *num\\_seeds* \\* *num\\_samples* such sub-directories. The naming pattern is\n    `seed-<seed value>_sample-<sample number>`. Each of these directories\n    contains a confidence JSON, summary confidence JSON, and the mmCIF with the\n    predicted structure.\n*   Distogram for each seed: `seed-<seed value>_distogram/distogram.npz`. The\n    Numpy zip file contains a single key: `distogram`. The distogram can be\n    large, its shape is `(num_tokens, num_tokens, 64)` and dtype `np.float16`\n    (almost 3 GiB for a 5,000-token input). Only saved if AlphaFold 3 is run\n    with `--save_distogram=true`.\n*   Embeddings for each seed: `seed-<seed value>_embeddings/embeddings.npz`. The\n    Numpy zip file contains 2 keys: `single_embeddings` and `pair_embeddings`.\n    The embeddings can be large, their shapes are `(num_tokens, 384)` for\n    `single_embeddings`, and `(num_tokens, num_tokens, 128)` for\n    `pair_embeddings`. Their dtype is `np.float16` (almost 6 GiB for a\n    5,000-token input). Only saved if AlphaFold 3 is run with\n    `--save_embeddings=true`.\n*   Top-ranking prediction mmCIF: `<job_name>_model.cif`. This file contains the\n    predicted coordinates and should be compatible with most structural biology\n    tools. 
We do not provide the output in the PDB format, the CIF file can be\n    easily converted into one if needed.\n*   Top-ranking prediction confidence JSON: `<job_name>_confidences.json`.\n*   Top-ranking prediction summary confidence JSON:\n    `<job_name>_summary_confidences.json`.\n*   Job input JSON file with the MSA and template data added by the data\n    pipeline: `<job_name>_data.json`.\n*   Ranking scores for all predictions: `ranking_scores.csv`. The prediction\n    with highest ranking is the one included in the root directory.\n*   Output terms of use: `TERMS_OF_USE.md`.\n\nBelow is an example AlphaFold 3 output directory listing for a job called \"Hello\nFold\", that has been run with 1 seed and 5 samples:\n\n```txt\nhello_fold/\n├── seed-1234_distogram                        # Only if --save_distogram=true.\n│   └── hello_fold_seed-1234_distogram.npz     # Only if --save_distogram=true.\n├── seed-1234_embeddings                       # Only if --save_embeddings=true.\n│   └── hello_fold_seed-1234_embeddings.npz    # Only if --save_embeddings=true.\n├── seed-1234_sample-0/\n│   ├── hello_fold_seed-1234_sample-0_confidences.json\n│   ├── hello_fold_seed-1234_sample-0_model.cif\n│   └── hello_fold_seed-1234_sample-0_summary_confidences.json\n├── seed-1234_sample-1/\n│   ├── hello_fold_seed-1234_sample-1_confidences.json\n│   ├── hello_fold_seed-1234_sample-1_model.cif\n│   └── hello_fold_seed-1234_sample-1_summary_confidences.json\n├── seed-1234_sample-2/\n│   ├── hello_fold_seed-1234_sample-2_confidences.json\n│   ├── hello_fold_seed-1234_sample-2_model.cif\n│   └── hello_fold_seed-1234_sample-2_summary_confidences.json\n├── seed-1234_sample-3/\n│   ├── hello_fold_seed-1234_sample-3_confidences.json\n│   ├── hello_fold_seed-1234_sample-3_model.cif\n│   └── hello_fold_seed-1234_sample-3_summary_confidences.json\n├── seed-1234_sample-4/\n│   ├── hello_fold_seed-1234_sample-4_confidences.json\n│   ├── hello_fold_seed-1234_sample-4_model.cif\n│   └── 
hello_fold_seed-1234_sample-4_summary_confidences.json\n├── TERMS_OF_USE.md\n├── hello_fold_confidences.json\n├── hello_fold_data.json\n├── hello_fold_model.cif\n├── hello_fold_ranking_scores.csv\n└── hello_fold_summary_confidences.json\n```\n\n## Confidence Metrics\n\nSimilar to AlphaFold 2 and AlphaFold-Multimer, AlphaFold 3 outputs include\nconfidence metrics. The main metrics are:\n\n*   **pLDDT:** a per-atom confidence estimate on a 0-100 scale where a higher\n    value indicates higher confidence. pLDDT aims to predict a modified LDDT\n    score that only considers distances to polymers. For proteins this is\n    similar to the\n    [lDDT-Cα metric](https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3799472/) but\n    with more granularity as it can vary per atom not just per residue. For\n    ligand atoms, the modified LDDT considers the errors only between the ligand\n    atom and polymers, not other ligand atoms. For DNA/RNA a wider radius of 30\n    Å is used for the modified LDDT instead of 15 Å.\n*   **PAE (predicted aligned error)**: an estimate of the error in the relative\n    position and orientation between two tokens in the predicted structure.\n    Higher values indicate higher predicted error and therefore lower\n    confidence. For proteins and nucleic acids, PAE score is essentially the\n    same as AlphaFold 2, where the error is measured relative to frames\n    constructed from the protein backbone. For small molecules and\n    post-translational modifications, a frame is constructed for each atom from\n    its closest neighbors from a reference conformer.\n*   **pTM and ipTM scores**: the predicted template modeling (pTM) score and the\n    interface predicted template modeling (ipTM) score are both derived from a\n    measure called the template modeling (TM) score. 
This measures the accuracy\n    of the entire structure\n    ([Zhang and Skolnick, 2004](https://doi.org/10.1002/prot.20264);\n    [Xu and Zhang, 2010](https://doi.org/10.1093/bioinformatics/btq066)). A pTM\n    score above 0.5 means the overall predicted fold for the complex might be\n    similar to the true structure. ipTM measures the accuracy of the predicted\n    relative positions of the subunits within the complex. Values higher than\n    0.8 represent confident high-quality predictions, while values below 0.6\n    suggest a failed prediction. ipTM values between 0.6 and 0.8 are a gray zone\n    where predictions could be correct or incorrect. The TM score is very strict\n    for small structures or short chains, so pTM assigns values less than 0.05\n    when fewer than 20 tokens are involved; for these cases PAE or pLDDT may be\n    more indicative of prediction quality.\n\nFor detailed description of these confidence metrics see the\n[AlphaFold 3 paper](https://www.nature.com/articles/s41586-024-07487-w). For\nprotein components, the\n[AlphaFold: A Practical guide](https://www.ebi.ac.uk/training/online/courses/alphafold/inputs-and-outputs/evaluating-alphafolds-predicted-structures-using-confidence-scores/)\ncourse for structures provides additional tutorials on the confidence metrics.\n\nIf you are interested in a specific entity or interaction, then there are\nconfidences available in the outputs which are specific to each chain or\nchain-pair, as opposed to the full complex. See below for more details on all\nthe confidence metrics that are returned.\n\n## Multi-Seed and Multi-Sample Results\n\nBy default, the model samples five predictions per seed. The top-ranked\nprediction across all samples and seeds is available at the top-level of the\noutput directory. All samples along with their associated confidences are\navailable in subdirectories of the output directory.\n\nFor ranking of the full complex use the `ranking_score` (higher is better). 
This\nscore uses overall structure confidences (pTM and ipTM), but also includes terms\nthat penalize clashes and encourage disordered regions not to have spurious\nhelices – these extra terms mean the score should only be used to rank\nstructures.\n\nIf you are interested in a specific entity or interaction, you may want to rank\nby a metric specific to that chain or chain-pair, as opposed to the full\ncomplex. In that case, use the per chain or per chain-pair confidence metrics\ndescribed below for ranking.\n\n## Metrics in Confidences JSON\n\nFor each predicted sample we provide two JSON files. One contains summary\nmetrics – summaries for either the whole structure, per chain or per chain-pair\n– and the other contains full 1D or 2D arrays.\n\nSummary outputs:\n\n*   `ptm`: A scalar in the range 0-1 indicating the predicted TM-score for the\n    full structure.\n*   `iptm`: A scalar in the range 0-1 indicating predicted interface TM-score\n    (confidence in the predicted interfaces) for all interfaces in the\n    structure.\n*   `fraction_disordered`: A scalar in the range 0-1 that indicates what\n    fraction of the prediction structure is disordered, as measured by\n    accessible surface area, see our\n    [paper](https://www.nature.com/articles/s41586-024-07487-w) for details.\n*   `has_clash`: A boolean indicating if the structure has a significant number\n    of clashing atoms (more than 50% of a chain, or a chain with more than 100\n    clashing atoms).\n*   `ranking_score`: A scalar in the range \\[-100, 1.5\\] that can be used for\n    ranking predictions, it incorporates `ptm`, `iptm`, `fraction_disordered`\n    and `has_clash` into a single number with the following equation: 0.8 × ipTM\n    \\+ 0.2 × pTM \\+ 0.5 × disorder − 100 × has_clash.\n*   `chain_pair_pae_min`: A \\[num_chains, num_chains\\] array. Element (i, j) of\n    the array contains the lowest PAE value across rows restricted to chain i\n    and columns restricted to chain j. 
This has been found to correlate with\n    whether two chains interact or not, and in some cases can be used to\n    distinguish binders from non-binders.\n*   `chain_pair_iptm`: A \\[num_chains, num_chains\\] array. Off-diagonal element\n    (i, j) of the array contains the ipTM restricted to tokens from chains i and\n    j. Diagonal element (i, i) contains the pTM restricted to chain i. Can be\n    used for ranking a specific interface between two chains, when you know that\n    they interact, e.g. for antibody-antigen interactions.\n*   `chain_ptm`: A \\[num_chains\\] array. Element i contains the pTM restricted\n    to chain i. Can be used for ranking individual chains when the structure of\n    that chain is most of interest, rather than the cross-chain interactions it\n    is involved with.\n*   `chain_iptm`: A \\[num_chains\\] array that gives the average confidence\n    (interface pTM) in the interface between each chain and all other chains.\n    Can be used for ranking a specific chain, when you care about where the\n    chain binds to the rest of the complex and you do not know which other\n    chains you expect it to interact with. This is often the case with ligands.\n\nFull array outputs:\n\n*   `pae`: A \\[num\\_tokens, num\\_tokens\\] array. Element (i, j) indicates the\n    predicted error in the position of token j, when the prediction is aligned\n    to the ground truth using the frame of token i.\n*   `atom_plddts`: A \\[num_atoms\\] array, element i indicates the predicted\n    local distance difference test (pLDDT) for atom i in the prediction.\n*   `contact_probs`: A \\[num_tokens, num_tokens\\] array. 
Element (i, j)\n    indicates the predicted probability that token i and token j are in contact\n    (8 Å between the representative atom for each token), see\n    [paper](https://www.nature.com/articles/s41586-024-07487-w) for details.\n*   `token_chain_ids`: A \\[num_tokens\\] array indicating the chain ids\n    corresponding to each token in the prediction.\n*   `atom_chain_ids`: A \\[num_atoms\\] array indicating the chain ids\n    corresponding to each atom in the prediction.\n\n## Embeddings\n\nAlphaFold 3 can be run with `--save_embeddings=true` to save the embeddings for\neach seed. The file is in the\n[compressed Numpy `.npz` format](https://numpy.org/doc/stable/reference/generated/numpy.savez_compressed.html)\nand can be loaded using `numpy.load` as a dictionary-like object with two\narrays:\n\n*   `single_embeddings`: A \\[num\\_tokens, 384\\] array containing the embeddings\n    for each token.\n*   `pair_embeddings`: A \\[num\\_tokens, num\\_tokens, 128\\] array containing the\n    pairwise embeddings between all tokens.\n\nYou can use for instance the following Python code to load the embeddings:\n\n```py\nimport numpy as np\n\nwith open('embeddings.npz', 'rb') as f:\n  embeddings = np.load(f)\n  single_embeddings = embeddings['single_embeddings']\n  pair_embeddings = embeddings['pair_embeddings']\n```\n\n## Chirality checks\n\nIn the AlphaFold 3 paper Posebusters results, a penalty was applied to the\nranking score if the ligand of interest contained chiral errors. By running\nmultiple seeds and using this chiral aware ranking, chiral error rates were\ngreatly reduced.\n\nWe provide the method `compare_chirality` in\n[`model/scoring/chirality.py`](https://github.com/google-deepmind/alphafold3/blob/main/src/alphafold3/model/scoring/chirality.py)\nto replicate these chiral checks. Chirality is checked against CCD structures if\navailable, otherwise users can supply custom RDKit Mol objects for comparison.\n"
  },
  {
    "path": "docs/performance.md",
    "content": "# Performance\n\n## Running the Pipeline in Stages\n\nThe `run_alphafold.py` script can be executed in stages to optimise resource\nutilisation. This can be useful for:\n\n1.  Splitting the CPU-only data pipeline from model inference (which requires a\n    GPU), to optimise cost and resource usage.\n1.  Generating the JSON output file from the data pipeline only run and then\n    using it for multiple different inference only runs across seeds or across\n    variations of other features (e.g. a ligand or a partner chain).\n1.  Generating the JSON output for multiple individual monomer chains (e.g. for\n    chains A, B, C, D), then running the inference on all possible chain pairs\n    (AB, AC, AD, BC, BD, CD) by creating dimer JSONs by merging the monomer\n    JSONs. By doing this, the MSA and template search need to be run just 4\n    times (once for each chain), instead of 12 times.\n\n### Data Pipeline Only\n\nLaunch `run_alphafold.py` with `--norun_inference` to generate Multiple Sequence\nAlignments (MSAs) and templates, without running featurisation and model\ninference. This stage can be quite costly in terms of runtime, CPU, and RAM use.\nThe output will be JSON files augmented with MSAs and templates that can then be\ndirectly used as input for running inference.\n\n### Pre-computing and reusing MSA and templates\n\nWhen folding multiple candidate chains with a set of fixed chains (i.e. chains\nthat are the same for all the runs), you can optimize the process by computing\nthe MSA and templates for the fixed chains only once. The computations for the\nchanging candidate chains will still be performed for each run:\n\n1.  Run the AlphaFold 3 data pipeline for the fixed chains using the\n    `--run_inference=false` flag. This step generates a JSON file containing the\n    MSA and template data for these chains.\n2.  
When constructing your multimer input JSONs, populate the entries for the\n    fixed chains using the data generated in the previous step.\n    *   For the fixed chains: Specifically, copy the `unpairedMsa`, `pairedMsa`,\n        and `templates` fields from the pre-computed JSON into the multimer\n        input JSON. This prevents these fields from being recomputed.\n    *   For the candidate chains: Leave these fields unset (or `null`) in the\n        multimer input JSON. This will signal the pipeline to compute them\n        dynamically for each run.\n\nThis technique can also be extended to efficiently process all combinations of\n*n* first chains and *m* second chains. Instead of performing *n* × *m* full\ncomputations, you can reduce this to *n* + *m* data pipeline runs.\n\nIn this scenario:\n\n1.  Run the data pipeline (step 1 above, with `--run_inference=false`) for all\n    *n* individual first chains and all *m* individual second chains.\n2.  Assemble the dimer input JSONs for each desired pair by combining their\n    respective pre-computed monomer JSONs.\n3.  Run only the inference step on these assembled JSONs using the\n    `--run_data_pipeline=false` flag.\n\nThis approach has been discussed in multiple GitHub issues, such as:\nhttps://github.com/google-deepmind/alphafold3/issues/171 (which links to other\nsimilar issues).\n\n### Featurisation and Model Inference Only\n\nLaunch `run_alphafold.py` with `--norun_data_pipeline` to skip the data pipeline\nand run only featurisation and model inference. This stage requires the input\nJSON file to contain pre-computed MSAs and templates (or they must be explicitly\nset to empty if you want to run MSA and template free).\n\n## Data Pipeline\n\nThe runtime of the data pipeline (i.e. 
genetic sequence search and template\nsearch) can vary significantly depending on the size of the input and the number\nof homologous sequences found, as well as the available hardware – the disk\nspeed can influence genetic search speed in particular.\n\nIf you would like to improve performance, it's recommended to increase the disk\nspeed (e.g. by leveraging a RAM-backed filesystem), or increase the available\nCPU cores and add more parallelisation. This can help because AlphaFold 3 runs\ngenetic search against 4 databases in parallel, so the optimal number of cores\nis the number of cores used for each Jackhmmer process times 4. Also note that\nfor sequences with deep MSAs, Jackhmmer or Nhmmer may need a substantial amount\nof RAM beyond the recommended 64 GB of RAM.\n\n### Sharded genetic databases\n\nThe run time of the genetic database search can be *significantly* sped up by\nsplitting the genetic databases if a machine with many CPU cores is used and the\ndatabases are on very fast SSD or in a RAM-backed filesystem. With this\ntechnique you can make Jackhmmer/Nhmmer genetic search fully utilize your\nhardware and take advantage of multi-core systems.\n\nEach genetic database with *n* sequences is split into *s* shards, each\ncontaining roughly *n* / *s* sequences. We recommend splitting the sequences\nbetween shards randomly to make sure each shard has similar sequence length\ndistribution. This could be achieved using standard tools:\n\n1.  Shuffle the sequences in the fasta. This can be done for example by running:\n    `seqkit shuffle --two-pass <db.fasta>`\n2.  Split the shuffled fasta in *s* shards. This can be done for example by\n    running: `seqkit split2 --by-part <s> <db.fasta>`\n\nMake sure the shards names follow this pattern:\n`prefix-<shard_index>-of-<total_shards>`, both `shard_index` and `total_shards`\nhaving always 5 digits, with leading zeros as needed. The `shard_index` goes\nfrom 0 to `total_shards - 1`. 
A file \"path\" (spec) for a sharded file is\n`prefix@<total_shards>`.\n\nE.g. for a file named `uniprot.fasta` split into 3 shards, the names of the\nshards should be:\n\n*   `uniprot.fasta-00000-of-00003`\n*   `uniprot.fasta-00001-of-00003`\n*   `uniprot.fasta-00002-of-00003`\n\nThe file spec for these files is `uniprot.fasta@3`.\n\nSave the total number of sequences in the protein databases, and the total\nnumber of nucleic bases in the RNA databases – these will be needed later as a\nflag to Jackhmmer/Nhmmer to correctly scale e-values across all shards.\n\nSave the sharded databases on a fast SSD or in a RAM-backed filesystem, then\nlaunch AlphaFold with the sharded paths instead of normal paths and set the\nZ-values.\n\nFor instance, with each database split into the number of shards given after\nthe `@` in its path:\n\n```bash\npython run_alphafold.py \\\n    --small_bfd_database_path=\"bfd-first_non_consensus_sequences.fasta@64\" \\\n    --small_bfd_z_value=65984053 \\\n    --mgnify_database_path=\"mgy_clusters_2022_05.fa@512\" \\\n    --mgnify_z_value=623796864 \\\n    --uniprot_cluster_annot_database_path=\"uniprot_cluster_annot_2021_04.fasta@256\" \\\n    --uniprot_cluster_annot_z_value=225619586 \\\n    --uniref90_database_path=\"uniref90_2022_05.fasta@128\" \\\n    --uniref90_z_value=153742194 \\\n    --ntrna_database_path=\"nt_rna_2023_02_23_clust_seq_id_90_cov_80_rep_seq.fasta@256\" \\\n    --ntrna_z_value=76752.808514 \\\n    --rfam_database_path=\"rfam_14_9_clust_seq_id_90_cov_80_rep_seq.fasta@16\" \\\n    --rfam_z_value=138.115553 \\\n    --rna_central_database_path=\"rnacentral_active_seq_id_90_cov_80_linclust.fasta@64\" \\\n    --rna_central_z_value=13271.415730 \\\n    --jackhmmer_n_cpu=2 \\\n    --jackhmmer_max_parallel_shards=16 \\\n    --nhmmer_n_cpu=2 \\\n    --nhmmer_max_parallel_shards=16\n```\n\nThis run will utilize (2 CPUs) × (16 max parallel shards) × (4 protein dbs\nsearched in parallel) = 128 cores for each protein chain, and (2 CPUs) × (16 max\nparallel shards) × (3 RNA dbs 
searched in parallel) = 96 cores for each RNA\nchain. Make sure to tune:\n\n*   the Jackhmmer/Nhmmer number of CPUs,\n*   the maximum number of shards searched in parallel,\n*   and the number of shards for each database\n\nso that the memory bandwidth and CPUs on your machine are optimally utilized.\nYou should aim for consistent shard sizes across all databases (so e.g. if\ndatabase A is split into 16 shards and is 3× smaller than database B, database B\nshould be split into 3 × 16 = 48 shards).\n\n## Model Inference\n\nTable 8 in the Supplementary Information of the\n[AlphaFold 3 paper](https://nature.com/articles/s41586-024-07487-w) provides\ncompile-free inference timings for AlphaFold 3 when configured to run on 16\nNVIDIA A100s, with 40 GB of memory per device. In contrast, this repository\nsupports running AlphaFold 3 on a single NVIDIA A100 with 80 GB of memory in a\nconfiguration optimised to maximise throughput.\n\nWe compare compile-free inference timings of these two setups in the table below\nusing GPU seconds (i.e. multiplying by 16 when using 16 A100s). 
The setup in\nthis repository is more efficient (by at least 2×) across all token sizes,\nindicating its suitability for high-throughput applications.\n\nNum Tokens | 1 A100 80 GB (GPU secs) | 16 A100 40 GB (GPU secs) | Improvement\n:--------- | ----------------------: | -----------------------: | ----------:\n1024       | 62                      | 352                      | 5.7×\n2048       | 275                     | 1136                     | 4.1×\n3072       | 703                     | 2016                     | 2.9×\n4096       | 1434                    | 3648                     | 2.5×\n5120       | 2547                    | 5552                     | 2.2×\n\n## Accelerator Hardware Requirements\n\nWe officially support the following configurations, and have extensively tested\nthem for numerical accuracy and throughput efficiency:\n\n-   1 NVIDIA A100 (80 GB)\n-   1 NVIDIA H100 (80 GB)\n\nWe compare compile-free inference timings of both configurations in the\nfollowing table:\n\nNum Tokens | 1 A100 80 GB (seconds) | 1 H100 80 GB (seconds)\n:--------- | ---------------------: | ---------------------:\n1024       | 62                     | 34\n2048       | 275                    | 144\n3072       | 703                    | 367\n4096       | 1434                   | 774\n5120       | 2547                   | 1416\n\n### Other Hardware Configurations\n\n#### NVIDIA A100 (40 GB)\n\nAlphaFold 3 can run on inputs of size up to 4,352 tokens on a single NVIDIA A100\n(40 GB) with the following configuration changes:\n\n1.  Enabling [unified memory](#unified-memory).\n1.  Adjusting `pair_transition_shard_spec` in `model_config.py`:\n\n    ```py\n      pair_transition_shard_spec: Sequence[_Shape2DType] = (\n          (2048, None),\n          (3072, 1024),\n          (None, 512),\n      )\n    ```\n\nThe format of entries in `pair_transition_shard_spec` is\n`(num_tokens_upper_bound, shard_size)`. 
Setting `num_tokens_upper_bound=None`\nmeans there is no upper bound on the number of tokens, while setting\n`shard_size=None` means the computation is not sharded.\n\nFor the example above:\n\n*   `(2048, None)`: for sequences up to 2,048 tokens, do not shard\n*   `(3072, 1024)`: for sequences up to 3,072 tokens, shard in chunks of 1,024\n*   `(None, 512)`: for all other sequences, shard in chunks of 512\n\nWhile numerically accurate, this configuration will have lower throughput\ncompared to the setup on the NVIDIA A100 (80 GB), due to less available memory.\n\n#### NVIDIA V100\n\nThere are known numerical issues with CUDA Capability 7.x devices. To work\naround the issue, set the environment variable `XLA_FLAGS` to include\n`--xla_disable_hlo_passes=custom-kernel-fusion-rewriter`.\n\nWith the above flag set, AlphaFold 3 can run on inputs of size up to 1,280\ntokens on a single NVIDIA V100 using [unified memory](#unified-memory).\n\n#### NVIDIA P100\n\nAlphaFold 3 can run on inputs of size up to 1,024 tokens on a single NVIDIA P100\nwith no configuration changes needed.\n\n#### Other devices\n\nLarge-scale numerical tests have not been performed on any other devices but\nthey are believed to be numerically accurate.\n\nThere are known numerical issues with CUDA Capability 7.x devices. To work\naround the issue, set the environment variable `XLA_FLAGS` to include\n`--xla_disable_hlo_passes=custom-kernel-fusion-rewriter`.\n\n## Compilation Buckets\n\nTo avoid excessive re-compilation of the model, AlphaFold 3 implements\ncompilation buckets: ranges of input sizes using a single compilation of the\nmodel.\n\nWhen featurising an input, AlphaFold 3 determines the smallest bucket the input\nfits into, then adds any necessary padding. This may avoid re-compiling the\nmodel when running inference on the input if it belongs to the same bucket as a\npreviously processed input.\n\nThe configuration of bucket sizes involves a trade-off: more buckets lead to\nmore re-compilations of the model, but less padding.\n\nBy default, the largest bucket size is 5,120 tokens. 
Processing inputs larger\nthan this maximum bucket size triggers the creation of a new bucket for exactly\nthat input size, and a re-compilation of the model. In this case, you may wish\nto redefine the compilation bucket sizes via the `--buckets` flag in\n`run_alphafold.py` to add additional larger bucket sizes. For example, suppose\nyou are running inference on inputs with token sizes: `5132, 5280, 5342`. Using\nthe default bucket sizes configured in `run_alphafold.py` will trigger three\nseparate model compilations, one for each unique token size. If instead you pass\nin the following flag to `run_alphafold.py`\n\n```\n--buckets 256,512,768,1024,1280,1536,2048,2560,3072,3584,4096,4608,5120,5376\n```\n\nwhen running inference on the above three input sizes, the model will be\ncompiled only once for the bucket size `5376`. **Note:** for this specific\nexample with input sizes `5132, 5280, 5342`, passing in `--buckets 5376` is\nsufficient to achieve the desired compilation behaviour. The provided example\nwith multiple buckets illustrates a more general solution suitable for diverse\ninput sizes.\n\n## Additional Flags\n\n### Compilation Time Workaround with XLA Flags\n\nTo work around a known XLA issue causing the compilation time to greatly\nincrease, the following environment variable must be set (it is set by default\nin the provided `Dockerfile`).\n\n```sh\nENV XLA_FLAGS=\"--xla_gpu_enable_triton_gemm=false\"\n```\n\n### CUDA Capability 7.x GPUs\n\nFor all CUDA Capability 7.x GPUs (e.g. V100) the environment variable\n`XLA_FLAGS` must be changed to include\n`--xla_disable_hlo_passes=custom-kernel-fusion-rewriter`. 
Disabling the Triton\nGEMM kernels is not necessary as they are not supported for such GPUs.\n\n```sh\nENV XLA_FLAGS=\"--xla_disable_hlo_passes=custom-kernel-fusion-rewriter\"\n```\n\n### GPU Memory\n\nThe following environment variables (set by default in the `Dockerfile`) enable\nfolding a single input of size up to 5,120 tokens on a single A100 (80 GB) or a\nsingle H100 (80 GB):\n\n```sh\nENV XLA_PYTHON_CLIENT_PREALLOCATE=true\nENV XLA_CLIENT_MEM_FRACTION=0.95\n```\n\n#### Unified Memory\n\nIf you would like to run AlphaFold 3 on inputs larger than 5,120 tokens, or on a\nGPU with less memory (an A100 with 40 GB of memory, for instance), we recommend\nenabling unified memory. Enabling unified memory allows the program to spill GPU\nmemory to host memory if there isn't enough space. This prevents an OOM, at the\ncost of making the program slower by accessing host memory instead of device\nmemory. To learn more, check out the\n[NVIDIA blog post](https://developer.nvidia.com/blog/unified-memory-cuda-beginners/).\n\nYou can enable unified memory by setting the following environment variables in\nyour `Dockerfile`:\n\n```sh\nENV XLA_PYTHON_CLIENT_PREALLOCATE=false\nENV TF_FORCE_UNIFIED_MEMORY=true\nENV XLA_CLIENT_MEM_FRACTION=3.2\n```\n\n### JAX Persistent Compilation Cache\n\nYou may also want to make use of the JAX persistent compilation cache, to avoid\nunnecessary recompilation of the model between runs. 
You can enable the\ncompilation cache with the `--jax_compilation_cache_dir <YOUR_DIRECTORY>` flag\nin `run_alphafold.py`.\n\nMore detailed instructions are available in the\n[JAX documentation](https://jax.readthedocs.io/en/latest/persistent_compilation_cache.html#persistent-compilation-cache),\nand more specifically the instructions for use on\n[Google Cloud](https://jax.readthedocs.io/en/latest/persistent_compilation_cache.html#google-cloud).\nIn particular, note that if you would like to make use of a non-local\nfilesystem, such as Google Cloud Storage, you will need to install\n[`etils`](https://github.com/google/etils) (this is not included by default in\nthe AlphaFold 3 Docker container).\n"
  },
  {
    "path": "fetch_databases.sh",
    "content": "#!/bin/bash\n# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nset -euo pipefail\n\nreadonly db_dir=${1:-$HOME/public_databases}\n\nfor cmd in wget tar zstd ; do\n  if ! command -v \"${cmd}\" > /dev/null 2>&1; then\n    echo \"${cmd} is not installed. Please install it.\"\n    exit 1\n  fi\ndone\n\necho \"Fetching databases to ${db_dir}\"\nmkdir -p \"${db_dir}\"\n\nreadonly SOURCE=https://storage.googleapis.com/alphafold-databases/v3.0\n\necho \"Start Fetching and Untarring 'pdb_2022_09_28_mmcif_files.tar'\"\nwget --quiet --output-document=- \\\n    \"${SOURCE}/pdb_2022_09_28_mmcif_files.tar.zst\" | \\\n    tar --no-same-owner --no-same-permissions \\\n    --use-compress-program=zstd -xf - --directory=\"${db_dir}\" &\n\nfor NAME in mgy_clusters_2022_05.fa \\\n            bfd-first_non_consensus_sequences.fasta \\\n            uniref90_2022_05.fa uniprot_all_2021_04.fa \\\n            pdb_seqres_2022_09_28.fasta \\\n            rnacentral_active_seq_id_90_cov_80_linclust.fasta \\\n            nt_rna_2023_02_23_clust_seq_id_90_cov_80_rep_seq.fasta \\\n            rfam_14_9_clust_seq_id_90_cov_80_rep_seq.fasta ; do\n  echo \"Start Fetching '${NAME}'\"\n  wget --quiet --output-document=- \"${SOURCE}/${NAME}.zst\" | \\\n      zstd --decompress > \"${db_dir}/${NAME}\" &\ndone\n\nwait\necho \"Complete\"\n"
  },
  {
    "path": "legal/WEIGHTS_PROHIBITED_USE_POLICY-Bahasa-Indonesia.md",
    "content": "# KEBIJAKAN PENGGUNAAN TERLARANG UNTUK PARAMETER MODEL ALPHAFOLD 3\n\nTerakhir diubah: 2024-11-09\n\nAlphaFold 3 dapat membantu Anda mempercepat riset ilmiah dengan memprediksi\nstruktur 3D molekul biologis. Google menyediakan Aset AlphaFold tanpa biaya\nuntuk penggunaan non-komersial tertentu, sesuai dengan pembatasan yang\nditetapkan di bawah. Kebijakan ini menggunakan persyaratan yang sama dengan\n[Persyaratan Penggunaan Parameter Model AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_TERMS_OF_USE-Bahasa-Indonesia.md).\n\n**Anda tidak boleh mengakses atau menggunakan, atau mengizinkan orang lain\nmengakses atau menggunakan Aset AlphaFold 3:**\n\n1.  **Atas nama organisasi komersial atau sehubungan dengan aktivitas komersial\n    apa pun, termasuk riset atas nama organisasi komersial.**\n\n    1.  Artinya, hanya organisasi non-komersial (*yaitu*, universitas,\n        organisasi non-profit dan institusi riset, serta lembaga pendidikan,\n        jurnalistik, dan pemerintah) yang dapat menggunakan Aset AlphaFold 3\n        untuk aktivitas non-komersial mereka. Aset AlphaFold 3 tidak tersedia\n        untuk jenis organisasi lainnya, meskipun organisasi tersebut melakukan\n        pekerjaan non-komersial.\n\n    2.  Jika Anda adalah peneliti yang berafiliasi dengan organisasi\n        non-komersial, Anda dapat menggunakan Aset AlphaFold 3 untuk riset\n        terafiliasi non-komersial Anda, dengan syarat Anda bukan organisasi\n        komersial atau bertindak atas nama organisasi komersial.\n\n    3.  Anda tidak boleh membagikan Aset AlphaFold 3 kepada organisasi komersial\n        mana pun atau menggunakan Aset AlphaFold 3 dengan cara yang akan memberi\n        organisasi komersial hak apa pun atas Aset ini. 
Satu-satunya\n        pengecualian adalah menyediakan Output secara publik (termasuk secara\n        tidak langsung kepada organisasi komersial) melalui publikasi ilmiah\n        atau rilis open source atau menggunakannya untuk mendukung jurnalisme,\n        yang masing-masing diizinkan.\n\n2.  **Untuk menyebarkan misinformasi, memberikan pernyataan tidak benar, atau\n    menyesatkan pengguna**, termasuk:\n\n    1.  menyediakan informasi palsu atau tidak akurat sehubungan dengan akses ke\n        atau penggunaan AlphaFold 3 atau Output oleh Anda, termasuk mengakses\n        atau menggunakan Parameter Model atas nama organisasi tanpa memberi tahu\n        kami atau mengirimkan permintaan untuk mengakses Parameter Model di mana\n        Google telah melarang penggunaan AlphaFold 3 oleh Anda secara\n        keseluruhan atau sebagian (termasuk yang disediakan melalui\n        [Server AlphaFold](https://alphafoldserver.com/about));\n\n    2.  memberikan pernyataan tidak benar tentang hubungan Anda dengan kami;\n        termasuk dengan menggunakan merek dagang, nama dagang, atau logo Google,\n        atau menyiratkan dukungan oleh Google tanpa seizin Google - Tidak ada di\n        dalam Persyaratan memberikan izin semacam itu;\n\n    3.  memberikan pernyataan tidak benar tentang asal AlphaFold 3 secara\n        keseluruhan atau sebagian;\n\n    4.  menyebarkan klaim menyesatkan tentang keahlian atau kemampuan, atau\n        terlibat dalam praktik profesional yang tidak sah atau tanpa lisensi,\n        khususnya di bidang yang sensitif (misalnya, kesehatan); atau\n\n    5.  membuat keputusan dalam ranah yang memengaruhi hak atau kesejahteraan\n        individu atau material (misalnya, layanan kesehatan).\n\n3.  **Untuk melakukan, mempromosikan, atau memfasilitasi aktivitas berbahaya,\n    ilegal, atau jahat, termasuk:**\n\n    1.  
mempromosikan atau memfasilitasi penjualan, ataupun memberikan petunjuk\n        untuk membuat atau mengakses, zat, barang, atau layanan ilegal;\n\n    2.  menyalahgunakan, merugikan, mengganggu, atau mengacaukan layanan apa\n        pun, termasuk membuat atau mendistribusikan konten untuk aktivitas\n        penipuan atau penyebaran malware;\n\n    3.  membuat atau mendistribusikan konten, termasuk Output, yang menyalahi,\n        menyalahgunakan, atau melanggar hak individu atau entitas apa pun\n        (termasuk, tetapi tidak terbatas pada hak atas konten yang dilindungi\n        hak cipta); atau\n\n    4.  mencoba mengakali, atau dengan sengaja menyebabkan (secara langsung atau\n        tidak langsung) AlphaFold 3 untuk bertindak dengan cara yang melanggar\n        Persyaratan.\n\n**Anda tidak boleh atau mengizinkan orang lain:**\n\n1.  **Menggunakan Output guna melatih atau membuat model machine learning atau\n    teknologi terkait untuk prediksi struktur biomolekuler yang mirip dengan\n    AlphaFold 3 (\"Model Turunan\"),** termasuk melalui distilasi atau metode\n    lainnya. Untuk menegaskan, pembatasan penggunaan yang ditetapkan dalam\n    Persyaratan akan berlaku sepenuhnya untuk semua Model Turunan yang dibuat\n    dengan melanggar Persyaratan.\n\n2.  **Mendistribusikan Output tanpa memberikan pemberitahuan yang jelas bahwa\n    apa yang Anda Distribusikan disediakan berdasarkan dan tunduk pada\n    [Persyaratan Penggunaan Output AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n    serta tentang modifikasi apa pun yang Anda buat.**\n\n    1.  
Artinya, jika Anda menghapus, atau menyebabkan penghapusan (misalnya\n        dengan menggunakan perangkat lunak pihak ketiga), pemberitahuan dan\n        syarat yang kami berikan saat Anda menghasilkan Output menggunakan\n        AlphaFold 3, Anda harus memastikan Distribusi Output berikutnya\n        menyertakan salinan\n        [Persyaratan Penggunaan Output AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n        dan file teks \"Persyaratan Penggunaan yang Mengikat secara Hukum\" yang\n        berisi pemberitahuan berikut:\n\n        \"*Dengan menggunakan informasi ini, Anda menyetujui Persyaratan\n        Penggunaan Output AlphaFold 3 yang terdapat di\n        https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md.*\n\n        *Untuk meminta akses ke parameter model AlphaFold 3, ikuti proses yang\n        ditetapkan di https://github.com/google-deepmind/alphafold3. Anda hanya\n        dapat menggunakan parameter model ini jika menerimanya langsung dari\n        Google. Penggunaannya tunduk pada persyaratan penggunaan yang tersedia\n        di\n        https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md.*\"\n\n    2.  Anda tidak boleh menyertakan persyaratan tambahan atau berbeda yang\n        bertentangan dengan\n        [Persyaratan Penggunaan Output AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\n3.  **Mendistribusikan Output, atau mengungkapkan temuan yang didapatkan dari\n    penggunaan AlphaFold 3 tanpa mengutip makalah kami**: [Abramson, J et al.\n    Accurate structure prediction of biomolecular interactions with AlphaFold\n    3.](https://www.nature.com/articles/s41586-024-07487-w). Untuk menegaskan,\n    hal ini merupakan persyaratan tambahan selain persyaratan pemberitahuan yang\n    ditetapkan di atas.\n\n4.  
**Mengakali pembatasan akses terkait Parameter Model, termasuk menggunakan,\n    membagikan, atau menyediakan Parameter Model ketika Google belum mengizinkan\n    Anda secara tegas untuk melakukan hal tersebut.** Google akan memberikan\n    akses ke Parameter Model kepada:\n\n    1.  Anda untuk penggunaan pribadi Anda atas nama organisasi Anda, di mana\n        Anda tidak dapat membagikan salinan Parameter Model Anda kepada siapa\n        pun; atau\n\n    2.  perwakilan resmi organisasi Anda, dengan kewenangan hukum penuh untuk\n        mengikat organisasi tersebut pada Persyaratan ini. Dalam hal ini, Anda\n        dapat membagikan salinan Parameter Model milik organisasi tersebut\n        kepada karyawan, konsultan, kontraktor, serta agen organisasi\n        sebagaimana diizinkan oleh perwakilan tersebut.\n"
  },
  {
    "path": "legal/WEIGHTS_PROHIBITED_USE_POLICY-Espanol-Latinoamerica.md",
    "content": "# POLÍTICA DE USO PROHIBIDO DE PARÁMETROS DEL MODELO ALPHAFOLD 3\n\nÚltima modificación: 9 de noviembre de 2024\n\nAlphaFold 3 puede ayudar a acelerar la investigación científica, ya que predice\nla estructura 3D de moléculas biológicas. Google pone a disposición los Recursos\nde AlphaFold sin costo para determinados usos no comerciales de conformidad con\nlas restricciones que se establecen a continuación. Esta política usa los mismos\ntérminos definidos que en las\n[Condiciones de Uso de los Parámetros del Modelo AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_TERMS_OF_USE-Espanol-Latinoamerica.md).\n\n**No debe acceder o utilizar ni permitir que otros accedan o utilicen los\nRecursos de AlphaFold 3 en los siguientes casos:**\n\n1.  **En nombre de una organización comercial o en conexión con cualquier\n    actividad comercial, incluida la investigación en nombre de organizaciones\n    comerciales.**\n\n    1.  Esto significa que solo las organizaciones no comerciales (*por\n        ejemplo*, universidades, institutos de investigación y organizaciones\n        sin fines de lucro, y organismos educativos, gubernamentales y\n        periodísticos) pueden usar los Recursos de AlphaFold 3 para sus\n        actividades no comerciales. Los Recursos de AlphaFold 3 no están\n        disponibles para ningún otro tipo de organización, aunque realicen\n        trabajos no comerciales.\n\n    2.  Si usted es un investigador afiliado de una organización no comercial,\n        dado que no pertenece a una organización comercial, puede usar los\n        Recursos de AlphaFold 3 para su investigación de afiliación no\n        comercial.\n\n    3.  No debe compartir los Recursos de AlphaFold 3 con ninguna organización\n        comercial ni usarlos de manera que otorgue a una organización comercial\n        algún derecho sobre estos. 
La única excepción es poner los Resultados a\n        disposición del público (lo que incluye indirectamente a las\n        organizaciones comerciales) a través de una publicación científica o una\n        publicación de código abierto, o utilizarlos para apoyar la actividad\n        periodística, opciones que están todas permitidas.\n\n2.  **Para desinformar, tergiversar o engañar, entre lo que se incluye lo\n    siguiente:**\n\n    1.  proporcionar información falsa o errónea en relación con su acceso o uso\n        de AlphaFold 3 o los Resultados, incluido el uso o acceso a los\n        Parámetros del Modelo en nombre de una organización sin informarnos o\n        enviarnos una solicitud para acceder a los Parámetros del Modelo cuando\n        Google le ha prohibido el uso de AlphaFold 3 de forma parcial o total\n        (incluido como se pone a disposición a través de\n        [AlphaFold Server](https://alphafoldserver.com/about)),\n\n    2.  tergiversar su relación con nosotros, incluido el uso de marcas\n        comerciales, nombres comerciales o logotipos de Google, o sugerir\n        recomendación por parte de Google sin el permiso de Google para hacerlo\n        (ningún punto de las Condiciones otorga ese permiso),\n\n    3.  tergiversar el origen de AlphaFold 3 de forma parcial o total,\n\n    4.  distribuir declaraciones engañosas sobre experiencia o capacidad, o\n        participar en la práctica de cualquier profesión sin autorización o\n        licencia, en particular si se trata de áreas sensibles (*p. ej.*, la de\n        la salud), o\n\n    5.  tomar decisiones en ámbitos que afectan el bienestar o los derechos\n        materiales o individuales (*p. ej.*, atención médica).\n\n3.  **Para realizar, promover o facilitar actividades peligrosas, ilegales o\n    maliciosas, entre lo que se incluye lo siguiente:**\n\n    1.  
promover o facilitar la venta de sustancias, bienes o servicios\n        ilegales, o bien proporcionar instrucciones para sintetizarlos o acceder\n        a ellos,\n\n    2.  abusar, interferir, dañar o interrumpir servicios, lo que incluye\n        generar o distribuir contenido para actividades engañosas o fraudulentas\n        o software malicioso,\n\n    3.  generar o distribuir contenido, incluidos los Resultados, que incumpla,\n        se apropie indebidamente o infrinja los derechos de un individuo o una\n        entidad (incluidos, sin limitaciones, los derechos de contenido\n        protegido por derechos de autor), o\n\n    4.  intentar eludir o causar de forma intencional (directa o indirectamente)\n        que AlphaFold 3 actúe de manera que incumpla las Condiciones.\n\n**No debe utilizar ni permitir que otros:**\n\n1.  **Utilicen los Resultados para entrenar o crear modelos de aprendizaje\n    automático o tecnología relacionada para la predicción de estructura\n    biomolecular similar a la de AlphaFold 3 (\"Modelos Derivados\"),** lo que\n    incluye métodos a través de destilación o de otro tipo. En aras de evitar\n    dudas, las restricciones de uso establecidas en las Condiciones se aplicarán\n    en su totalidad a cualquier Modelo Derivado que se cree incumpliendo las\n    Condiciones.\n\n2.  **Distribuir los Resultados sin brindar un aviso claro de que lo que usted\n    Distribuye se proporciona de acuerdo con las\n    [Condiciones de Uso de los Resultados de AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n    y cualquier modificación que usted haga.**\n\n    1.  
Esto quiere decir que si usted quita o hace que se quiten (por ejemplo,\n        con software de terceros) los avisos y las condiciones que\n        proporcionamos cuando genera Resultados usando AlphaFold 3, debe\n        asegurarse de que cualquier Distribución adicional de los Resultados\n        esté acompañada por una copia de las\n        [Condiciones de Uso de Resultados de AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n        y un archivo de texto llamado \"Condiciones de Uso Legalmente\n        Vinculantes\" que contenga el siguiente aviso:\n\n        \"*Si utiliza esta información, usted acepta las Condiciones de Uso de\n        Resultados de AlphaFold 3, que se encuentran en\n        https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md.*\n\n        *Para solicitar acceso a los parámetros del modelo AlphaFold 3, siga el\n        proceso que se establece en\n        https://github.com/google-deepmind/alphafold3. Solo puede usarlos si los\n        recibe directamente de Google. El uso está sujeto a las Condiciones de\n        Uso disponibles en\n        https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md.*\"\n\n    2.  No debe incluir ninguna condición adicional o diferente que entre en\n        conflicto con las\n        [Condiciones de Uso de Resultados de AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\n3.  **Distribuir Resultados, o divulgar descubrimientos que surjan del uso de\n    AlphaFold 3 sin citar nuestro artículo** [Abramson, J et al. Accurate\n    structure prediction of biomolecular interactions with AlphaFold 3\n    (Predicción precisa de la estructura de las interacciones biomoleculares con\n    AlphaFold 3). *Nature*\n    (2024)](https://www.nature.com/articles/s41586-024-07487-w). 
En aras de\n    evitar dudas, este es un requisito adicional a los requisitos de aviso que\n    se establecen más arriba.\n\n4.  **Eludir las restricciones de acceso relacionadas con los Parámetros del\n    Modelo, lo que incluye utilizar, compartir o poner a disponibilidad los\n    Parámetros del Modelo cuando no recibió autorización expresa por parte de\n    Google para hacerlo.** Google otorgará acceso a los Parámetros del Modelo a:\n\n    1.  Usted para su uso individual o para usarlos en nombre de su\n        organización, en cuyo caso no puede compartir su copia de los Parámetros\n        del Modelo con nadie más, o\n\n    2.  Un representante autorizado de su organización con autoridad legal total\n        para obligar a esa organización con estas Condiciones (en cuyo caso\n        usted podrá compartir la copia de los Parámetros del Modelo de esa\n        organización con empleados, consultores, contratistas y agentes de la\n        organización, según lo autorizado por ese representante)\n"
  },
  {
    "path": "legal/WEIGHTS_PROHIBITED_USE_POLICY-Francais-Canada.md",
    "content": "# POLITIQUE D'UTILISATION INTERDITE DES PARAMÈTRES DU MODÈLE ALPHAFOLD 3\n\nDernière modification: 2024-11-09\n\nAlphaFold 3 peut vous aider à accélérer la recherche scientifique en prévoyant\nla structure 3D des molécules biologiques. Pour certaines utilisations non\ncommerciales, Google met gratuitement à disposition les Éléments d'AlphaFold\ndans le respect des restrictions énoncées ci-dessous. Cette politique utilise\nles mêmes conditions d'utilisation telles que définies dans les\n[Conditions d'utilisation des paramètres du modèle AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_TERMS_OF_USE-Francais-Canada.md).\n\n**Vous ne devez pas accéder aux Éléments d'AlphaFold 3 ni les utiliser ou\npermettre à d'autres personnes de le faire:**\n\n1.  **Au nom d'une organisation commerciale ou en connexion avec des activités\n    commerciales, y compris la recherche au nom d'organisations commerciales.**\n\n    1.  Cela signifie que seules les organisations non commerciales (*c.-à-d.*\n        universités, organismes sans but lucratif, instituts de recherche et\n        organismes éducatifs, journalistiques et gouvernementaux) peuvent\n        utiliser les Éléments d'AlphaFold 3 dans le cadre de leurs activités non\n        commerciales. Les Éléments d'AlphaFold 3 ne sont pas offerts à d'autres\n        types d'organisations, même si elles effectuent des travaux non\n        commerciaux.\n\n    2.  Si vous êtes un chercheur affilié à une organisation non commerciale, à\n        la condition que **vous ne soyez pas une organisation commerciale ou que\n        vous n'agissiez pas au nom d'une organisation commerciale**, vous pouvez\n        utiliser les Éléments d'AlphaFold 3 pour vos recherches affiliées non\n        commerciales.\n\n    3.  
Vous ne devez pas partager les Éléments d'AlphaFold 3 avec une\n        organisation commerciale ni les utiliser d'une manière qui confère à une\n        organisation commerciale des droits sur ces éléments. La seule exception\n        est la mise à disposition publique des Résultats (y compris\n        indirectement à des organisations commerciales) par le biais d'une\n        publication scientifique ou d'une version open source, ou l'utilisation\n        de ces résultats pour soutenir le journalisme, qui sont toutes deux\n        autorisées.\n\n2.  **Pour désinformer ou déformer ou induire en erreur**, y compris:\n\n    1.  fournir des informations fausses ou inexactes concernant votre accès à\n        AlphaFold 3 ou à ses Résultats, ou à l'utilisation de ceux-ci, y compris\n        l'accès aux Paramètres du modèle ou l'utilisation de ceux-ci au nom\n        d'une organisation sans nous en informer ou sans soumettre une demande\n        d'accès aux Paramètres du modèle lorsque Google a interdit l'utilisation\n        d'AlphaFold 3 en totalité ou en partie (y compris tel que mis à\n        disposition par le biais du\n        [Serveur d'AlphaFold](https://alphafoldserver.com/about));\n\n    2.  présenter de manière inexacte votre relation avec nous, y compris en\n        utilisant les marques de commerce, les noms commerciaux et les logos de\n        Google ou en suggérant l'approbation de Google sans son autorisation.\n        Rien dans les présentes Conditions ne permet d'accorder une telle\n        autorisation;\n\n    3.  présenter de manière inexacte l'origine d'AlphaFold 3, en tout ou en\n        partie;\n\n    4.  distribuer des déclarations trompeuses quant au savoir-faire ou aux\n        capacités, ou exercer une activité professionnelle sans autorisation ou\n        sans licence, en particulier dans des domaines sensibles (*p. ex.* les\n        soins de santé); ou\n\n    5.  
prendre des décisions dans des domaines qui touchent les droits\n        matériels ou individuels ou le bien-être (*p. ex.* les soins de santé).\n\n3.  **Pour effectuer ou faciliter des activités dangereuses, illégales ou\n    malveillantes**, y compris:\n\n    1.  la promotion ou l'aide à la vente, ou la fourniture d'instructions pour\n        synthétiser ou accéder à des substances, des biens ou des services\n        illégaux, ou l'accès à ces derniers;\n\n    2.  abuser, nuire, interférer ou perturber tout service, y compris en\n        générant ou en distribuant du contenu pour des activités trompeuses ou\n        frauduleuses ou pour des logiciels malveillants;\n\n    3.  générer ou distribuer tout contenu, y compris des Résultats, qui\n        enfreigne, détourne ou viole de toute autre manière les droits d'un\n        individu ou d'une entité (y compris, mais sans s'y limiter, les droits\n        sur les contenus protégés par des droits d'auteur); ou\n\n    4.  tenter de contourner, ou causer intentionnellement (directement ou\n        indirectement) AlphaFold 3 à agir d'une manière qui contrevient aux\n        Conditions.\n\n**Vous ne devez pas, et vous ne devez pas permettre aux autres:**\n\n1.  **D'utiliser les Résultats pour entraîner ou créer des modèles\n    d'apprentissage automatique ou une technologie connexe pour la prédiction de\n    la structure biomoléculaire semblable à AlphaFold 3 (« Modèles dérivés »)**,\n    y compris par distillation ou d'autres méthodes. Pour éviter le doute, les\n    restrictions d'utilisation énoncées dans les présentes Conditions\n    s'appliquent intégralement à tout Modèle dérivé créé en violation des\n    présentes Conditions.\n\n2.  
**De Distribuer les Résultats sans indiquer clairement que ce que vous\n    Distribuez est fourni dans le cadre et sous réserve des\n    [Conditions d'utilisation des résultats d'AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n    et de toutes les modifications que vous y apportez.**\n\n    1.  Cela signifie que si vous retirez, ou faites retirer (par exemple en\n        utilisant un logiciel tiers), les avis et les conditions d'utilisation\n        que nous fournissons lorsque vous générez des Résultats à l'aide\n        d'AlphaFold 3, vous devez vous assurer que toute Distribution ultérieure\n        de Résultats est accompagnée d'une copie des\n        [Conditions d'utilisation des résultats d'AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n        et d'un fichier texte des « Conditions d'utilisation légalement\n        contraignantes » qui contient l'avis suivant:\n\n        « *En utilisant cette information, vous acceptez les Conditions\n        d'utilisation des résultats d'AlphaFold 3 qui se trouvent à l'adresse\n        https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md.*\n\n        *Pour demander l'accès aux paramètres du modèle AlphaFold 3, suivez le\n        processus décrit à l'adresse\n        https://github.com/google-deepmind/alphafold3. Vous ne pouvez les\n        utiliser que si vous les recevez directement de Google. L'utilisation\n        est soumise aux conditions d'utilisation disponibles à l'adresse\n        https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md.*\n        »\n\n    2.  Vous ne devez pas inclure de conditions d'utilisation supplémentaires ou\n        différentes qui seraient en contradiction avec les\n        [Conditions d'utilisation des résultats d'AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\n3.  
**De Distribuer les Résultats ou de divulguer les résultats découlant de\n    l'utilisation d'AlphaFold 3 sans citer notre article:** « [Abramson, J et\n    al. Accurate structure prediction of biomolecular interactions with\n    AlphaFold 3. *Nature*\n    (2024)](https://www.nature.com/articles/s41586-024-07487-w) ». Pour éviter\n    toute ambiguïté, il s'agit d'une exigence supplémentaire par rapport aux\n    exigences de notification énoncées ci-dessus.\n\n4.  **De contourner les restrictions d'accès relatives aux Paramètres du modèle,\n    y compris l'utilisation, le partage ou la mise à disposition des Paramètres\n    du modèle alors que vous n'y avez pas été expressément autorisé par\n    Google.** Google accordera l'accès aux Paramètres du modèle à soit:\n\n    1.  vous, pour votre utilisation individuelle au nom de votre organisation,\n        auquel cas vous ne pouvez pas partager votre copie des Paramètres du\n        modèle avec quelqu'un d'autre; ou\n\n    2.  un représentant autorisé de votre organisation, disposant de la pleine\n        autorité légale pour lier cette organisation aux présentes Conditions,\n        auquel cas vous pouvez partager la copie des Paramètres du modèle de\n        cette organisation avec les employés, les consultants, les entrepreneurs\n        et les agents de l'organisation, tel qu'autorisé par ce représentant.\n"
  },
  {
    "path": "legal/WEIGHTS_PROHIBITED_USE_POLICY-Portugues-Brazil.md",
    "content": "# POLÍTICA DE USO PROIBIDO DOS PARÂMETROS DO MODELO ALPHAFOLD 3\n\nÚltima modificação: 2024-11-09\n\nO AlphaFold 3 ajuda você a acelerar pesquisas científicas ao prever a estrutura\n3D de moléculas biológicas. O Google disponibiliza os Recursos do AlphaFold sem\ncusto financeiro para certos usos não comerciais, de acordo com as restrições\nabaixo. Esta política usa os mesmos termos definidos nos\n[Termos de Uso dos Parâmetros do Modelo AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_TERMS_OF_USE-Portugues-Brazil.md).\n\n**Você não deve acessar, usar nem permitir que outras pessoas acessem ou usem os\nRecursos do AlphaFold 3 nos seguintes casos:**\n\n1.  **Em nome de uma organização comercial ou em associação a atividades\n    comerciais, incluindo pesquisas em nome de organizações comerciais.**\n\n    1.  Isso significa que apenas organizações não comerciais (*ou seja*,\n        universidades, organizações sem fins lucrativos, institutos de pesquisa\n        e órgãos governamentais, educacionais e de notícias) podem usar os\n        Recursos do AlphaFold 3 para suas atividades não comerciais. Os Recursos\n        do AlphaFold 3 não estão disponíveis para qualquer outro tipo de\n        organização, mesmo as que conduzem trabalhos não comerciais.\n\n    2.  Se você for um pesquisador afiliado a uma organização não comercial,\n        você tem permissão para usar esses recursos em sua pesquisa afiliada a\n        organizações sem fins lucrativos, desde que você não seja uma\n        organização comercial nem esteja agindo em nome de uma.\n\n    3.  
É proibido compartilhar os Recursos do AlphaFold 3 com qualquer\n        organização comercial ou usar os Recursos do AlphaFold 3 de modo a\n        conceder a uma organização comercial qualquer direito em relação a eles.\n        A única exceção é a disponibilização da Saída para o público (incluindo\n        indiretamente para organizações comerciais) mediante uma publicação\n        científica, versão de código aberto ou em apoio ao jornalismo, o que é\n        permitido.\n\n2.  **Para gerar desinformação, deturpar ou enganar**, incluindo:\n\n    1.  fornecer informações falsas ou imprecisas em relação ao seu acesso ou\n        uso do AlphaFold 3 ou da Saída gerada, incluindo acessar ou usar os\n        Parâmetros do Modelo em nome de uma organização sem nos informar ou\n        solicitar o acesso aos Parâmetros do Modelo caso o Google tenha proibido\n        totalmente ou parcialmente seu uso do AlphaFold 3 (incluindo conforme\n        disponibilizado pelo\n        [Servidor do AlphaFold](https://alphafoldserver.com/about));\n\n    2.  deturpar sua relação conosco, incluindo ao usar marcas registradas,\n        nomes comerciais e logotipos do Google, ou sugerir o endosso do Google\n        sem a nossa permissão – nada nestes Termos concede tal permissão;\n\n    3.  deturpar a origem do AlphaFold 3 total ou parcialmente;\n\n    4.  distribuir declarações enganosas sobre conhecimento ou capacidade, ou\n        participar do exercício não autorizado ou não licenciado de qualquer\n        profissão, especialmente em áreas sensíveis (*por exemplo*, saúde); ou\n\n    5.  tomar decisões em áreas que afetam o bem-estar ou direitos materiais ou\n        individuais (*por exemplo*, saúde).\n\n3.  **Para realizar, promover ou facilitar atividades perigosas, ilegais ou\n    maliciosas**, incluindo:\n\n    1.  promover ou facilitar a venda ou fornecer instruções para sintetizar ou\n        ter acesso a substâncias, produtos ou serviços ilegais;\n\n    2.  
abusar, prejudicar, interferir ou interromper quaisquer serviços,\n        incluindo gerar ou distribuir conteúdo para atividades enganosas ou\n        fraudulentas ou malware;\n\n    3.  gerar ou distribuir qualquer conteúdo, incluindo a Saída, que infrinja,\n        se aproprie indevidamente ou viole de outra forma os direitos de\n        qualquer indivíduo ou entidade (incluindo, mas não se limitando a\n        direitos autorais do conteúdo); ou\n\n    4.  tentar burlar ou levar intencionalmente (direta ou indiretamente) o\n        AlphaFold 3 a agir de maneira que viole os Termos.\n\n**Não é permitido que você nem outras pessoas:**\n\n1.  **Usem os Resultados para treinar ou criar modelos de aprendizado de máquina\n    ou tecnologias relacionadas para previsão de estrutura biomolecular\n    semelhante ao AlphaFold 3 (\"Modelos Derivados\"),** incluindo pela destilação\n    ou outros métodos. Para evitar dúvidas, as restrições de uso definidas nos\n    Termos são totalmente válidas para quaisquer Modelos Derivados criados em\n    violação dos Termos.\n\n2.  **Distribuam a Saída sem apresentar aviso evidente de que o que você\n    Distribui é oferecido de acordo com e sujeito aos\n    [Termos de Uso dos Resultados do AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n    e quaisquer modificações realizadas.**\n\n    1.  
Isso significa que, se você remover ou causar a remoção (por exemplo,\n        usando um software de terceiros) dos avisos e termos que fornecemos\n        quando você gera Resultados usando o AlphaFold 3, você precisa garantir\n        que a Distribuição da Saída posterior esteja acompanhada de uma cópia\n        dos\n        [Termos de Uso dos Resultados do AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md)\n        e de um arquivo de texto \"Termos de Uso Juridicamente Vinculativos\" com\n        o seguinte aviso:\n\n        \"*Ao usar estas informações, você concorda com os Termos de Uso da Saída\n        do AlphaFold 3 disponíveis em\n        https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md.*\n\n        *Para solicitar acesso aos parâmetros do modelo AlphaFold 3, siga o\n        processo descrito em https://github.com/google-deepmind/alphafold3. Você\n        só pode usar os parâmetros se os receber diretamente do Google. O uso\n        está sujeito aos Termos de Uso disponíveis em\n        https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md.*\"\n\n    2.  É proibido incluir quaisquer termos adicionais ou diferentes que entrem\n        em conflito com os\n        [Termos de Uso da Saída do AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\n3.  **Distribuam a Saída ou divulguem descobertas provenientes do uso do\n    AlphaFold 3 sem citar nosso artigo:** [Abramson, J et al. Accurate structure\n    prediction of biomolecular interactions with AlphaFold 3. *Nature*\n    (2024)](https://www.nature.com/articles/s41586-024-07487-w). Para evitar\n    dúvidas, esse é um requisito adicional às exigências de aviso definidas\n    acima.\n\n4.  
**Burlem as restrições de acesso relacionadas aos Parâmetros do Modelo,\n    incluindo usar, compartilhar ou disponibilizar os Parâmetros do Modelo sem\n    autorização explícita do Google.** O Google concederá acesso aos Parâmetros\n    do Modelo a:\n\n    1.  você, para uso individual em nome da sua organização, sendo proibido\n        compartilhar sua cópia dos Parâmetros do Modelo com qualquer indivíduo;\n        ou\n\n    2.  um representante autorizado da sua organização, com autoridade legal\n        total para vincular tal organização a estes Termos, sendo permitido\n        compartilhar a cópia dos Parâmetros do Modelo pertencente a essa\n        organização com funcionários, consultores, prestadores de serviço e\n        agentes da organização, conforme autorizado por esse representante.\n"
  },
  {
    "path": "legal/WEIGHTS_TERMS_OF_USE-Bahasa-Indonesia.md",
    "content": "# PERSYARATAN PENGGUNAAN PARAMETER MODEL ALPHAFOLD 3\n\nTerakhir diubah: 09-11-2024\n\n[AlphaFold 3](https://blog.google/technology/ai/google-deepmind-isomorphic-alphafold-3-ai-model/)\nadalah model AI yang dikembangkan oleh\n[Google DeepMind](https://deepmind.google/) dan\n[Isomorphic Labs](https://www.isomorphiclabs.com/). Program ini membuat prediksi\nstruktur 3D molekul biologis, serta memberikan keyakinan model untuk prediksi\nstruktur tersebut. Kami membuat parameter model terlatih dan output yang\ndihasilkan menggunakan aset yang tersedia tanpa biaya untuk penggunaan\nnon-komersial tertentu, sehubungan dengan persyaratan penggunaan ini dan\n[Kebijakan Penggunaan Terlarang untuk Parameter Model AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Bahasa-Indonesia.md).\n\n**Hal penting yang perlu diketahui saat menggunakan parameter dan output model\nAlphaFold 3**\n\n1.  Parameter dan output model AlphaFold 3 hanya tersedia untuk penggunaan\n    non-komersial oleh, atau atas nama, organisasi non-komersial (*yaitu*\n    universitas, organisasi nonprofit dan institusi riset, serta lembaga\n    pendidikan, jurnalistik, dan pemerintah). Jika Anda adalah peneliti yang\n    berafiliasi dengan organisasi non-komersial, dengan syarat Anda bukan\n    organisasi komersial atau bertindak atas nama organisasi komersial, artinya\n    Anda dapat menggunakannya untuk riset terafiliasi non-komersial Anda.\n2.  Anda tidak boleh menggunakan atau mengizinkan orang lain menggunakan:\n    1.  Parameter atau Output model AlphaFold 3 sehubungan dengan aktivitas\n        komersial apa pun, termasuk riset atas nama organisasi komersial; atau\n    1.  Output AlphaFold 3 untuk melatih model machine learning atau teknologi\n        terkait untuk prediksi struktur biomolekuler yang mirip dengan AlphaFold\n        3\n3.  
Anda *tidak boleh* mempublikasikan atau membagikan parameter model AlphaFold\n    3, kecuali membagikannya dalam organisasi Anda sesuai dengan Persyaratan\n    ini.\n4.  Anda *dapat* mempublikasikan, membagikan, dan mengadaptasi *output*\n    AlphaFold 3 sesuai dengan Persyaratan ini, termasuk persyaratan untuk\n    memberikan pemberitahuan yang jelas atas setiap modifikasi yang Anda buat\n    dan bahwa penggunaan yang sedang berlangsung atas output AlphaFold 3 dan\n    turunannya tunduk pada\n    [Persyaratan Penggunaan Output AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\nDengan menggunakan, mereproduksi, memodifikasi, menjalankan, mendistribusikan,\natau menampilkan bagian atau elemen apa pun dari Parameter Model (sebagaimana\ndidefinisikan di bawah) atau menyetujui persyaratan perjanjian ini, Anda setuju\nuntuk terikat oleh (1) persyaratan penggunaan ini, dan (2)\n[Kebijakan Penggunaan Terlarang untuk Parameter Model AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Bahasa-Indonesia.md)\nyang disertakan di sini sebagai referensi (secara kolektif disebut\n\"**Persyaratan**\"), dalam setiap kasus (a) sebagaimana diubah dari waktu ke\nwaktu sesuai dengan Persyaratan, serta (b) antara Anda dan (i) Google Ireland\nLimited, jika Anda berasal dari negara di Wilayah Ekonomi Eropa atau Swiss, atau\n(ii) Google LLC, jika Anda berasal dari wilayah lain.\n\nAnda mengonfirmasi bahwa Anda berwenang baik secara eksplisit maupun implisit\nuntuk masuk, dan sedang memasuki, ke dalam Persyaratan ini sebagai karyawan yang\nmewakili, atau atas nama, organisasi Anda.\n\nHarap baca Persyaratan ini dengan cermat. 
Persyaratan ini menetapkan apa yang\ndapat Anda harapkan dari kami saat Anda mengakses dan menggunakan Aset AlphaFold\n3 (sebagaimana didefinisikan di bawah), dan apa yang Google harapkan dari Anda.\nPenyebutan \"**Anda**\" di sini mengacu pada individu atau organisasi yang\nmenggunakan Aset AlphaFold 3. Penyebutan \"**kami**\", \"**kita**\", atau\n\"**Google**\" di sini mengacu pada entitas milik grup perusahaan Google, yaitu\nGoogle LLC beserta afiliasinya.\n\n## 1. Definisi Penting\n\nSebagaimana digunakan dalam Persyaratan ini:\n\n\"**AlphaFold 3**\" adalah: (a) kode sumber AlphaFold 3 yang disediakan\n[di sini](https://github.com/google-deepmind/alphafold3/) dan yang dilisensikan\nberdasarkan persyaratan lisensi Creative Commons\nAttribution-NonCommercial-Sharealike 4.0 International (CC-BY-NC-SA 4.0) dan\nkode sumber turunan apa pun, serta (b) Parameter Model.\n\n\"**Aset AlphaFold 3**\" adalah Parameter dan output Model.\n\n\"**Distribusi**\" atau \"**Mendistribusikan**\" adalah mengirimkan,\nmempublikasikan, atau membagikan Output secara publik atau kepada orang lain.\n\n\"**Parameter Model**\" adalah bobot dan parameter model terlatih yang disediakan\noleh Google bagi organisasi (atas pertimbangannya sendiri) untuk digunakan\nsesuai dengan Persyaratan ini, bersama dengan (a) modifikasi pada bobot dan\nparameter tersebut, (b) pekerjaan yang didasarkan pada bobot dan parameter\ntersebut, atau (c) kode atau model machine learning lainnya yang menggabungkan,\nseluruh atau sebagian, bobot dan parameter tersebut.\n\n\"**Output**\" adalah prediksi struktur serta semua informasi tambahan dan\ninformasi terkait yang disediakan oleh AlphaFold 3 atau penggunaan Parameter\nModel, bersama dengan representasi visual, prediksi komputasional, deskripsi,\nmodifikasi, salinan, atau adaptasi apa pun yang secara substansial berasal dari\nOutput.\n\n\"**Termasuk**\" adalah \"**termasuk, tetapi tidak terbatas pada**\".\n\n## 2. 
Mengakses dan menggunakan Aset AlphaFold 3\n\nDengan tunduk pada kepatuhan Anda terhadap Persyaratan, termasuk\n[Kebijakan Penggunaan Terlarang untuk Parameter Model AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Bahasa-Indonesia.md),\nAnda dapat mengakses, menggunakan, dan memodifikasi Aset AlphaFold 3 serta\nMendistribusikan Output sebagaimana ditetapkan dalam Persyaratan ini. Kami\nmemberi Anda lisensi non-eksklusif, bebas royalti, dapat dibatalkan, tidak dapat\ndipindahtangankan, dan tidak dapat disublisensikan (kecuali secara tegas\ndiizinkan dalam Persyaratan ini) untuk hak atas kekayaan intelektual apa pun\nyang kami miliki dalam Aset AlphaFold sejauh diperlukan untuk tujuan ini. Untuk\nmemverifikasi akses dan penggunaan AlphaFold 3 oleh Anda, kami dapat meminta\nAnda memberikan informasi tambahan dari waktu ke waktu, termasuk verifikasi\nnama, organisasi, serta informasi identitas Anda lainnya.\n\nDengan mengakses, menggunakan, atau memodifikasi Aset AlphaFold 3,\nMendistribusikan Output, atau meminta akses ke Parameter Model, Anda menyatakan\ndan menjamin bahwa (a) Anda memiliki kuasa dan wewenang penuh untuk menyetujui\nPersyaratan ini (termasuk telah berusia dewasa), (b) Google sebelumnya tidak\npernah menghentikan akses dan hak Anda untuk menggunakan AlphaFold 3 (termasuk\nyang disediakan melalui [Server AlphaFold](https://alphafoldserver.com/about))\nkarena pelanggaran Anda terhadap persyaratan penggunaan yang berlaku, (c)\nmenyetujui atau menjalankan hak dan kewajiban Anda berdasarkan Persyaratan ini\ntidak akan melanggar hak pihak ketiga mana pun atau perjanjian yang Anda\nsepakati dengan pihak ketiga, (d) informasi apa pun yang Anda berikan ke Google\nsehubungan dengan AlphaFold 3, termasuk (jika berlaku) untuk meminta akses ke\nParameter Model, sudah benar dan aktual, serta (e) Anda bukan (i) berstatus\nwarga dari negara yang diembargo, (ii) berstatus menetap di negara yang\ndiembargo 
Amerika Serikat, atau (iii) dinyatakan dilarang oleh program sanksi\ndan kontrol ekspor yang berlaku untuk mengakses, menggunakan, atau memodifikasi\nAset AlphaFold 3.\n\nJika Anda memilih untuk memberikan masukan ke Google, seperti saran untuk\nmeningkatkan kualitas AlphaFold 3, Anda setuju bahwa informasi tersebut tidak\nbersifat rahasia dan eksklusif, serta Google dapat menindaklanjuti masukan Anda\ntanpa kewajiban kepada Anda.\n\n## 3. Pembatasan Penggunaan\n\nAnda tidak boleh menggunakan Aset AlphaFold 3 apa pun:\n\n1.  untuk penggunaan terbatas yang ditetapkan dalam\n    [Kebijakan Penggunaan Terlarang untuk Parameter Model AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Bahasa-Indonesia.md);\n    atau\n2.  dengan cara yang melanggar hukum dan peraturan yang berlaku.\n\nSelama diizinkan oleh hukum dan tanpa membatasi hak kami lainnya, Google berhak\nmencabut hak penggunaan Anda, dan (selama memungkinkan) membatasi penggunaan\nAset AlphaFold 3 apa pun yang menurut Google secara wajar melanggar Persyaratan\nini.\n\n## 4. Output yang Dihasilkan\n\nMeskipun Anda harus mematuhi Persyaratan ini saat menggunakan Aset AlphaFold 3,\nkami tidak akan mengklaim kepemilikan atas Output orisinal yang Anda hasilkan\nmenggunakan AlphaFold 3. Namun, Anda memahami bahwa AlphaFold 3 dapat\nmenghasilkan Output yang sama atau mirip untuk beberapa pengguna, termasuk\nGoogle, dan kami berhak mengklaim Output tersebut.\n\n## 5. Perubahan pada Aset AlphaFold 3 atau Persyaratan ini\n\nGoogle dapat menambahkan atau menghapus fungsi atau fitur Aset AlphaFold 3 kapan\nsaja dan dapat berhenti menawarkan akses ke Aset AlphaFold 3 sepenuhnya.\n\nGoogle dapat memperbarui Persyaratan ini dan mekanisme akses untuk Parameter\nModel kapan saja. Kami akan memposting setiap perubahan pada Persyaratan\n[di repositori GitHub AlphaFold 3](https://github.com/google-deepmind/alphafold3).\nPerubahan umumnya akan berlaku 14 hari setelah diposting. 
Namun, perubahan yang\nberkaitan dengan fungsi atau yang dibuat karena alasan hukum akan langsung\nberlaku.\n\nAnda harus meninjau Persyaratan ini setiap kali kami memperbaruinya atau saat\nAnda menggunakan Aset AlphaFold 3. Jika Anda tidak menyetujui perubahan pada\nPersyaratan, Anda harus segera menghentikan penggunaan Aset AlphaFold 3.\n\n## 6. Menangguhkan atau menghentikan hak Anda untuk menggunakan Aset AlphaFold 3\n\nGoogle dapat sewaktu-waktu menangguhkan atau menghentikan hak Anda untuk\nmenggunakan dan mengakses Aset AlphaFold 3 sebagaimana berlaku karena, antara\nlain, kegagalan Anda untuk sepenuhnya mematuhi Persyaratan. Jika Google\nmenangguhkan atau menghentikan hak Anda untuk mengakses atau menggunakan Aset\nAlphaFold 3, Anda harus segera menghapus dan menghentikan penggunaan serta\nDistribusi semua salinan Aset AlphaFold 3 yang Anda miliki atau kontrol, dan\nAnda dilarang menggunakan Aset AlphaFold 3, termasuk mengajukan permohonan untuk\nmenggunakan Parameter Model. Google akan berupaya memberikan pemberitahuan\nsewajarnya kepada Anda sebelum penangguhan atau penghentian tersebut. Namun,\nAnda tidak akan menerima pemberitahuan atau peringatan sebelumnya jika\npenangguhan atau penghentian tersebut terjadi karena Anda tidak sepenuhnya\nmematuhi Persyaratan atau karena alasan serius lainnya.\n\nAnda tentunya dapat menghentikan penggunaan Aset AlphaFold 3 kapan saja. Jika\nAnda berhenti menggunakannya, harap beri tahu kami alasannya (melalui\nalphafold@google.com) sehingga kami dapat terus meningkatkan kualitas teknologi\nkami.\n\n## 7. Kerahasiaan\n\nAnda setuju untuk tidak mengungkapkan atau menyediakan Informasi Rahasia Google\nkepada siapa pun tanpa izin tertulis dari kami sebelumnya. 
\"**Informasi Rahasia\nGoogle**\" berarti (a) Parameter Model AlphaFold 3 dan semua software, teknologi,\nserta dokumentasi yang terkait dengan AlphaFold 3, kecuali kode sumber AlphaFold\n3, dan (b) informasi lain apa pun yang disediakan oleh Google yang ditandai\nsebagai rahasia atau umumnya dianggap rahasia berdasarkan penyajian informasi\ntersebut. Informasi Rahasia Google tidak mencakup (a) informasi yang sudah Anda\nketahui sebelum Anda mengakses atau menggunakan Aset AlphaFold 3 (termasuk\nmelalui [Server AlphaFold](https://alphafoldserver.com/about)), (b) yang\nterungkap ke publik bukan karena kesalahan Anda (misalnya, pelanggaran Anda\nterhadap Persyaratan ini), (c) yang Anda kembangkan sendiri tanpa mengacu pada\nInformasi Rahasia Google, atau (d) yang diberikan kepada Anda oleh pihak ketiga\nsesuai hukum yang berlaku (tanpa Anda atau pihak ketiga tersebut melanggar\nPersyaratan).\n\n## 8. Pernyataan penyangkalan\n\nTidak ada ketentuan di dalam Persyaratan yang membatasi hak apa pun yang tidak\ndapat dibatasi berdasarkan hukum yang berlaku atau membatasi tanggung jawab\nGoogle kecuali sebagaimana diizinkan oleh hukum yang berlaku.\n\n**AlphaFold 3 dan Output disediakan \"apa adanya\", tanpa jaminan atau ketentuan\napa pun, baik tersurat maupun tersirat, termasuk jaminan atau ketentuan tentang\nkepemilikan, ketiadaan pelanggaran, kelayakan untuk diperdagangkan, atau\nkesesuaian untuk tujuan tertentu. Anda bertanggung jawab sepenuhnya untuk\nmenentukan kesesuaian penggunaan AlphaFold 3, atau penggunaan atau\npendistribusian Output, dan menanggung semua risiko yang terkait dengan\npenggunaan atau pendistribusian tersebut serta pelaksanaan hak dan kewajiban\noleh Anda berdasarkan Persyaratan ini. Anda dan siapa pun yang Anda beri Output\nbertanggung jawab sepenuhnya atas Output tersebut serta penggunaannya\nselanjutnya.**\n\n**Output merupakan prediksi dengan tingkat keyakinan yang berbeda-beda dan harus\nditafsirkan dengan cermat. 
Gunakan pertimbangan sebelum mengandalkan,\nmemublikasikan, mendownload, atau menggunakan AlphaFold 3.**\n\n**AlphaFold 3 dan Output hanya ditujukan untuk pemodelan teoretis. Aset tersebut\ntidak dimaksudkan, divalidasi, atau disetujui untuk penggunaan klinis. Anda\ntidak boleh menggunakan AlphaFold 3 atau Output untuk tujuan klinis atau\nmengandalkannya untuk saran medis atau profesional lainnya. Konten apa pun\nterkait topik tersebut hanya diberikan untuk tujuan informasi dan bukan\nmerupakan pengganti saran dari profesional yang berkualifikasi.**\n\n## 9. Kewajiban\n\nSelama diizinkan hukum yang berlaku, Anda akan melindungi Google serta direktur,\npetugas, karyawan, dan kontraktornya terhadap kerugian dari proses hukum pihak\nketiga (termasuk tindakan oleh otoritas pemerintah) yang timbul dari atau\nberkaitan dengan penggunaan Aset AlphaFold 3 oleh Anda yang melanggar hukum atau\npelanggaran Anda terhadap Persyaratan. Perlindungan terhadap kerugian ini\nmencakup kewajiban atau pengeluaran yang timbul dari klaim, kerugian, kerusakan,\nputusan pengadilan, denda, biaya proses pengadilan, dan biaya hukum, kecuali\njika kewajiban atau pengeluaran disebabkan oleh pelanggaran, kelalaian, atau\nperbuatan tidak pantas yang disengaja oleh Google. Jika Anda dikecualikan secara\nhukum dari tanggung jawab tertentu, termasuk perlindungan terhadap kerugian,\ntanggung jawab tersebut tidak berlaku bagi Anda berdasarkan Persyaratan.\n\nDalam keadaan apa pun, Google tidak akan bertanggung jawab atas ganti rugi tidak\nlangsung, ganti rugi khusus, ganti rugi insidental, ganti rugi sebagai\nperingatan, ganti rugi sebagai akibat, atau ganti rugi penghukuman, atau\nhilangnya keuntungan dalam bentuk apa pun sehubungan dengan Persyaratan atau\nAset AlphaFold 3, meskipun Google telah diberi tahu tentang kemungkinan adanya\nganti rugi tersebut. 
Total kewajiban kumulatif Google untuk semua klaim yang\ntimbul dari atau sehubungan dengan Persyaratan atau Aset AlphaFold 3, termasuk\nkarena kelalaiannya sendiri, dibatasi hingga $500.\n\n## 10. Ketentuan lainnya\n\nSecara hukum, Anda memiliki hak tertentu yang tidak dapat dibatasi oleh kontrak\nseperti Persyaratan. Persyaratan sama sekali tidak dimaksudkan untuk membatasi\nhak tersebut.\n\nPersyaratan merupakan keseluruhan perjanjian kami terkait penggunaan Aset\nAlphaFold 3 oleh Anda dan menggantikan perjanjian sebelumnya atau pada saat yang\nsama yang menyangkut penggunaan tersebut.\n\nJika ternyata ada ketentuan dalam Persyaratan yang tidak memiliki kekuatan\nhukum, ketentuan lainnya dalam Persyaratan akan tetap berlaku dan memiliki\nkekuatan hukum penuh.\n\n## 11. Sengketa\n\nHukum California akan mengatur semua sengketa yang timbul dari atau berkaitan\ndengan Persyaratan atau sehubungan dengan Aset AlphaFold 3. Sengketa ini akan\ndiselesaikan secara eksklusif di pengadilan federal atau negara bagian Santa\nClara County, California, Amerika Serikat dan Anda serta Google menyetujui\nwilayah hukum pribadi di pengadilan tersebut. Jika hukum setempat yang berlaku\nmencegah sengketa tertentu diselesaikan di pengadilan California, Anda dan\nGoogle dapat mengajukan sengketa tersebut di pengadilan setempat Anda. Jika\nhukum setempat yang berlaku mencegah pengadilan setempat Anda menerapkan hukum\nCalifornia untuk menyelesaikan sengketa ini, sengketa ini akan diatur oleh hukum\nsetempat yang berlaku dari negara, negara bagian, atau tempat tinggal Anda yang\nlain. 
Jika Anda menggunakan Aset AlphaFold 3 atas nama organisasi pemerintah\nselain organisasi pemerintah federal Amerika Serikat (dengan ketentuan yang\ndisebutkan sebelumnya akan berlaku selama diizinkan oleh hukum federal),\nPersyaratan ini tidak akan berlaku untuk pengadilan dan hukum yang mengatur.\n\nMengingat sifat riset ilmiah, mungkin perlu waktu beberapa saat hingga\npelanggaran terhadap Persyaratan terlihat jelas. Untuk melindungi Anda, Google,\ndan Aset AlphaFold 3, selama diizinkan hukum yang berlaku, Anda setuju bahwa:\n\n1.  klaim hukum apa pun terkait Persyaratan atau Aset AlphaFold 3 dapat diajukan\n    hingga:\n    1.  tanggal batas waktu berdasarkan hukum yang berlaku untuk mengajukan\n        klaim hukum; atau\n    2.  dua tahun sejak tanggal Anda atau Google (sebagaimana berlaku)\n        mengetahui, atau seharusnya secara wajar mengetahui, fakta yang\n        menimbulkan klaim tersebut; dan\n2.  Anda dan Google tidak akan memperdebatkan pembatasan, batas waktu,\n    penundaan, pelepasan hak, atau sejenisnya dalam upaya untuk menghalangi\n    gugatan yang diajukan dalam jangka waktu tersebut.\n\nSemua hak yang tidak secara khusus dan tegas diberikan kepada Anda oleh\nPersyaratan menjadi hak milik Google. Penundaan, tindakan, atau kelalaian oleh\nGoogle dalam melaksanakan hak atau upaya hukum apa pun tidak akan dianggap\nsebagai pelepasan hak atas pelanggaran terhadap Persyaratan, dan Google secara\ntegas memiliki semua hak dan upaya hukum yang tersedia berdasarkan Persyaratan,\nhukum, ekuitas, atau lainnya, termasuk upaya hukum yang menyangkut penyelesaian\ndengan perintah pengadilan atas setiap ancaman atau pelanggaran nyata terhadap\nPersyaratan tanpa perlu membuktikan kerugian yang sebenarnya.\n"
  },
  {
    "path": "legal/WEIGHTS_TERMS_OF_USE-Espanol-Latinoamerica.md",
    "content": "# CONDICIONES DE USO DE LOS PARÁMETROS DEL MODELO ALPHAFOLD 3\n\nÚltima modificación: 9 de noviembre de 2024\n\n[AlphaFold 3](https://blog.google/technology/ai/google-deepmind-isomorphic-alphafold-3-ai-model/)\nes un modelo de IA desarrollado por [Google DeepMind](https://deepmind.google/)\ny por [Isomorphic Labs](https://www.isomorphiclabs.com/). Genera predicciones de\nestructuras 3D de moléculas biológicas, lo que proporciona confianza del modelo\npara las predicciones de estructuras. Creamos los parámetros del modelo\nentrenado y los resultados generados y los ponemos a disposición sin costo para\ndeterminados usos no comerciales de conformidad con las condiciones de uso y la\n[Política de Uso Prohibido de los Parámetros del Modelo AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Espanol-Latinoamerica.md).\n\n**Puntos clave para tener en cuenta al usar los parámetros y los resultados del\nmodelo AlphaFold 3**\n\n1.  Los parámetros y los resultados del modelo AlphaFold 3 solo están\n    disponibles para usos no comerciales de organizaciones no comerciales (*es\n    decir*, universidades, organizaciones sin fines de lucro, instituciones de\n    investigación y organismos educativos, periodísticos y gubernamentales), o\n    bien en su nombre. Si usted es un investigador afiliado de una organización\n    no comercial, en la medida en que no pertenezca a una organización comercial\n    ni actúe en nombre de una, puede usar estos recursos para su investigación\n    de afiliación no comercial.\n2.  No debe utilizar ni permitir que otros utilicen AlphaFold 3 ni sus\n    parámetros o resultados en los siguientes casos:\n    1.  En conexión con cualquier actividad comercial, incluidas investigaciones\n        en nombre de organizaciones comerciales\n    2.  
Para entrenar modelos de aprendizaje automático, o bien tecnologías\n        relacionadas para la predicción de estructuras biomoleculares, similares a\n        AlphaFold 3\n3.  No *debe* publicar ni compartir los parámetros del modelo AlphaFold 3,\n    excepto dentro de su organización, de acuerdo con estas Condiciones.\n4.  Puede publicar, compartir y adaptar los *resultados* de AlphaFold 3 de\n    conformidad con estas Condiciones, que incluyen el requisito de brindar un\n    aviso claro de que cualquier modificación que haga y el uso continuo de los\n    resultados de AlphaFold 3 y sus derivaciones están sujetas a las\n    [Condiciones de Uso de los Resultados de AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\nAl usar, reproducir, modificar, realizar, distribuir o mostrar cualquier porción\no elemento de los Parámetros del Modelo (como se definen a continuación), o bien\nal aceptar las condiciones de este acuerdo, usted se compromete a cumplir con lo\nsiguiente: (1) estas Condiciones de Uso y (2) la\n[Política de Uso Prohibido de los Parámetros del Modelo AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Espanol-Latinoamerica.md),\nque se incorpora por referencia en este documento (en conjunto, las\n\"**Condiciones**\"), en cada caso, (a) según las modificaciones ocasionales que\nse hagan de acuerdo con las Condiciones y (b) entre usted y (i) si es de un país\ndel Espacio Económico Europeo o Suiza, Google Ireland Limited o (ii) en\ncualquier otro caso, Google LLC.\n\nConfirma que tiene la autorización explícita o implícita para celebrar, y está\ncelebrando, las Condiciones como empleado o de otra manera en nombre de su\norganización.\n\nLea cuidadosamente estas Condiciones. En ellas, se establece lo que usted puede\nesperar de nosotros cuando usa los Recursos de AlphaFold 3, como se describen a\ncontinuación, y lo que Google espera de usted. 
Cuando decimos \"**usted**\",\nhacemos referencia al individuo o la organización que usa los Recursos de\nAlphaFold 3. Cuando decimos \"**nosotros**\" o \"**Google**\", hacemos referencia a\nlas entidades que pertenecen al grupo de empresas de Google, que comprende a\nGoogle LLC y sus afiliadas.\n\n## 1. Definiciones clave\n\nSegún su uso en estas Condiciones:\n\n\"**AlphaFold 3**\" significa: (a) el código fuente de AlphaFold 3 disponible\n[aquí](https://github.com/google-deepmind/alphafold3/) y con licencia en virtud\nde las condiciones de la Atribución/Reconocimiento-NoComercial-CompartirIgual\n4.0 Internacional (CC-BY-NC-SA 4.0) de Creative Commons, y cualquier código\nfuente derivado, y (b) los Parámetros del Modelo.\n\n\"**Recursos de AlphaFold 3**\" hace referencia a los Resultados y los Parámetros\ndel Modelo.\n\n\"**Distribución\" o \"Distribuir**\" incluye cualquier transmisión, publicación y\notras instancias en las que se comparten los Resultados de manera pública o a\notra persona.\n\n\"**Parámetros del Modelo**\" hace referencia a las ponderaciones y los parámetros\ndel modelo entrenado, que Google pone a disposición para las organizaciones (a\nsu entera discreción) para su uso de acuerdo con estas Condiciones, junto con\n(a) las modificaciones a esas ponderaciones y parámetros, (b) los trabajos\nbasados en esas ponderaciones y parámetros, o bien (c) otros modelos de\naprendizaje automático y código que incorporan, en su totalidad o en parte,\nestos parámetros y ponderaciones.\n\n\"**Resultados**\" hace referencia a las predicciones de estructura y toda la\ninformación adicional y relacionada que brinda AlphaFold 3 o el uso de los\nParámetros del Modelo, además de toda representación visual, predicción\ncomputacional, descripción, modificación, copia o adaptación que esté\nsustancialmente derivada de los Resultados.\n\n\"**Lo que incluye**\" significa \"**incluido, sin limitarse a ello**\".\n\n## 2. 
Acceso y uso de los Recursos de AlphaFold 3\n\nSujeto al cumplimiento de estas Condiciones, lo que incluye la\n[Política de Uso Prohibido de los Parámetros del Modelo AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Espanol-Latinoamerica.md),\npuede acceder a los Recursos de AlphaFold 3, usarlos y modificarlos, y\nDistribuir los Resultados como se define en estas Condiciones. Le otorgamos una\nlicencia no exclusiva, libre de regalías, revocable, no transferible y no\nsusceptible de someterse a otras licencias (excepto como se indica expresamente\nen estas Condiciones) respecto de cualquier derecho de propiedad intelectual que\ntengamos sobre los Recursos de AlphaFold en la medida necesaria para estos\npropósitos. Para verificar su acceso a AlphaFold 3 y el uso correspondiente,\npodríamos solicitarle ocasionalmente información adicional sobre usted, ya sea\nque verifique su nombre, su organización o cualquier otra información\nidentificatoria.\n\nAl acceder a los Recursos de AlphaFold 3 y usarlos o modificarlos, así como al\nDistribuir Resultados o solicitar acceso a los Parámetros del Modelo, manifiesta\ny garantiza que (a) tiene plenas facultades y atribuciones para celebrar estas\nCondiciones (lo que incluye tener la edad de consentimiento), (b) Google nunca\nrescindió en el pasado su acceso a AlphaFold 3 ni su derecho de uso (lo que\nincluye su disponibilidad a través de\n[AlphaFold Server](https://alphafoldserver.com/about)) debido a su\nincumplimiento de las Condiciones de Uso correspondientes, (c) el cumplimiento\nde estas Condiciones o el ejercicio de sus derechos y obligaciones no infringirá\nningún acuerdo que tenga con un tercero ni ningún derecho de terceros, (d)\ncualquier información que usted proporcione a Google en relación con AlphaFold\n3, incluida la necesaria (cuando corresponda) para solicitar acceso a los\nParámetros del Modelo, es correcta y actual, y (e) usted no (i) es residente de\nun 
país bajo embargo, (ii) es residente de un país bajo el embargo de EE.UU. ni\n(iii) tiene prohibiciones a través de controles de exportación aplicables y\nprogramas de sanción el acceso a los Recursos de AlphaFold 3, así como su uso y\nmodificación.\n\nSi decide enviarle comentarios a Google, como sugerencias para mejorar AlphaFold\n3, asegura que esa información no es confidencial ni de su propiedad, y que\nGoogle puede actuar respecto de sus comentarios sin tener ninguna obligación con\nusted.\n\n## 3. Restricciones de uso\n\nNo debe usar ninguno de los Recursos de AlphaFold 3 en los siguientes casos:\n\n1.  Los usos restringidos establecidos en la\n    [Política de Uso Prohibido de los Parámetros del Modelo AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Espanol-Latinoamerica.md)\n\n2.  En incumplimiento de las leyes y reglamentaciones aplicables\n\nEn el sentido más amplio permitido por la ley y sin limitar ninguno de nuestros\notros derechos, Google se reserva el derecho de revocar su derecho de usar y (en\nla medida que sea viable) restringir el uso de cualquiera de los Recursos de\nAlphaFold 3 que Google razonablemente cree que infringe estas Condiciones.\n\n## 4. Resultados generados\n\nAunque debe cumplir con estas Condiciones cuando usa los Recursos de AlphaFold\n3, no reclamaremos la propiedad de los Resultados originales que genere usando\nAlphaFold 3. Sin embargo, usted reconoce que AlphaFold 3 puede generar los\nmismos Resultados, o bien otros similares, para varios usuarios, incluido\nGoogle, y nos reservamos todos nuestros derechos al respecto.\n\n## 5. 
Cambios en los Recursos de AlphaFold 3 o estas Condiciones\n\nGoogle podría agregar o quitar funciones de los Recursos de AlphaFold 3 en\ncualquier momento, y también podría quitar por completo el acceso a los Recursos\nde AlphaFold 3.\n\nGoogle podría actualizar estas Condiciones y el mecanismo de acceso a los\nParámetros del Modelo en cualquier momento. Publicaremos cualquier modificación\na las Condiciones\n[en el repositorio de GitHub de AlphaFold 3](https://github.com/google-deepmind/alphafold3).\nEn general, los cambios entrarán en vigencia 14 días después de su publicación.\nSin embargo, los cambios relacionados con funciones o realizados por motivos\nlegales entrarán en vigencia de inmediato.\n\nDebería revisar las Condiciones siempre que realicemos actualizaciones o que use\nlos Recursos de AlphaFold 3. Si no está de acuerdo con las modificaciones de las\nCondiciones, debe dejar de usar los Recursos de AlphaFold 3 de inmediato.\n\n## 6. Suspensión o rescisión de su derecho de uso de los Recursos de AlphaFold 3\n\nGoogle puede, en cualquier momento, suspender o rescindir su derecho de uso y,\nsegún corresponda, acceso a los Recursos de AlphaFold 3 debido a, entre otros\nmotivos, su incumplimiento de estas Condiciones. Si Google suspende o rescinde\nsu derecho de acceso o uso de los Recursos de AlphaFold 3, debe borrarlos y\ndejar de usar y Distribuir todas las copias correspondientes que tenga en su\nposesión o control, y se le prohibirá usar los Recursos de AlphaFold 3, lo que\nincluye el envío de solicitudes para usar los Parámetros del Modelo. Google\ntratará de darle un aviso con una antelación razonable antes de cualquier\nsuspensión o rescisión, pero no se le dará ningún aviso ni advertencia previos\nsi la suspensión o rescisión se deben a su incumplimiento de las Condiciones o\nalguna otra razón grave.\n\nTenga en cuenta que puede dejar de usar los Recursos de AlphaFold 3 cuando lo\ndesee. 
Si los deja de usar, le agradeceríamos saber el motivo (a través de\nalphafold@google.com) para que podamos continuar mejorando nuestras tecnologías.\n\n## 7. Confidencialidad\n\nUsted acepta no divulgar ni poner a disposición Información Confidencial de\nGoogle sin obtener nuestro previo consentimiento por escrito. \"Información\nConfidencial de Google\" hace referencia a (a) los Parámetros del Modelo\nAlphaFold 3 y todo el software, la tecnología y la documentación relacionada con\nAlphaFold 3, excepto el código fuente de AlphaFold 3, y (b) cualquier otra\ninformación que Google ponga a disposición y se marque como confidencial o que\nnormalmente se consideraría confidencial en las circunstancias en las que se\npresenta. La Información Confidencial de Google no incluye (a) información que\nusted ya conocía antes de acceder a los Recursos de AlphaFold 3 o de usarlos\n(que se incluye a través de\n[AlphaFold Server](https://alphafoldserver.com/about)), (b) información que se\ncomparte de manera pública por una razón que no lo responsabiliza (por ejemplo,\nsu incumplimiento de las Condiciones), (c) información que usted desarrolló de\nmanera independiente sin hacer referencia a la Información Confidencial de\nGoogle, o (d) información que recibió de manera legal de parte de un tercero\n(sin que usted o ese tercero hayan incumplido las Condiciones).\n\n## 8. Renuncias de responsabilidad\n\nNinguna disposición de las Condiciones restringe ningún derecho que no pueda\nrestringirse en función de la ley aplicable ni limita las responsabilidades de\nGoogle, excepto según lo que permite la ley aplicable.\n\n**AlphaFold 3 y los Resultados se brindan \"tal cual son\", sin garantías de\nningún tipo, ya sean explícitas o implícitas, lo que incluye garantías o\ncondiciones de titularidad, no incumplimiento, comerciabilidad o adecuación para\nun propósito particular. 
Usted es el único responsable de determinar la\nidoneidad del uso de AlphaFold 3, o bien del uso o la distribución de los\nResultados, y asume todos los riesgos asociados con ese uso o distribución y su\nejercicio de los derechos y las obligaciones según estas Condiciones. Usted y\ntodas las personas con quienes comparta los Resultados serán los únicos\nresponsables de estos usos y sus usos posteriores.**\n\n**Los Resultados son predicciones con diversos niveles de confianza y deberían\ninterpretarse con cuidado. Sea prudente antes de basarse en el contenido de\nAlphaFold 3, o bien publicarlo, descargarlo o usarlo de cualquier otro modo.**\n\n**AlphaFold 3 y los Resultados deben usarse únicamente para el modelado teórico.\nNo están pensados, validados ni aprobados para uso clínico. No debe usar\nAlphaFold 3 ni los Resultados con fines clínicos, ni basarse en ellos para dar\nconsejos médicos ni de índole profesional. Cualquier contenido relacionado con\nesos temas se proporciona solo con fines informativos y no sustituye el\nasesoramiento de un profesional calificado.**\n\n## 9. Responsabilidades\n\nEn la medida en que lo permita la legislación aplicable, usted indemnizará a\nGoogle y sus directores, funcionarios, empleados y contratistas por cualquier\nprocedimiento legal de terceros (incluidas las acciones de las autoridades\ngubernamentales) que surja de su uso ilegal de los Recursos de AlphaFold 3 o del\nincumplimiento de estas Condiciones. Esta indemnización cubrirá cualquier\nresponsabilidad o gasto que surja a partir de reclamos, pérdidas, daños,\njuicios, multas, costos de litigios y honorarios legales, excepto en la medida\nen que una responsabilidad o un gasto sean causados por un incumplimiento,\nnegligencia o conducta inapropiada voluntaria por parte de Google. 
Si en su caso\nse aplica una exención legal de ciertas responsabilidades, lo que incluye la\nindemnización, no deberá hacerse cargo de estas responsabilidades según estas\nCondiciones.\n\nEn ningún caso Google será responsable de daños indirectos, especiales,\nincidentales, ejemplares, resultantes ni punitivos, ni de la pérdida de\nganancias de ningún tipo en conexión con estas Condiciones o los Recursos de\nAlphaFold 3, incluso si se le advirtió sobre la posibilidad de dichos daños. La\nresponsabilidad conjunta de Google por todos los reclamos que surjan en conexión\ncon estas Condiciones o los Recursos de AlphaFold 3, lo que incluye los que\nsurjan de su propia negligencia, se limita a USD 500.\n\n## 10. Varios\n\nPor ley, tiene ciertos derechos que no pueden estar limitados por un contrato,\ncomo estas Condiciones. Las Condiciones no tienen la intención de restringir\nesos derechos.\n\nLas Condiciones son nuestro acuerdo completo relacionado con su uso de los\nRecursos de AlphaFold 3 y sustituyen cualquier acuerdo anterior o contemporáneo sobre la\nmateria.\n\nSi cualquier disposición de estas Condiciones resultase inejecutable, el resto\nseguirá plenamente en vigencia.\n\n## 11. Disputas\n\nLa ley de California regirá todas las disputas que surjan de las Condiciones o\nen conexión con los Recursos de AlphaFold 3. Estas disputas se resolverán\nexclusivamente en los tribunales federales o estatales del Condado de Santa\nClara, California, EE.UU., y usted y Google aceptan someterse a la jurisdicción\npersonal de dichos tribunales. En la medida en que la ley local aplicable impida\nque ciertas disputas se resuelvan en un tribunal de California, usted y Google\npueden presentarlas en los tribunales locales de su jurisdicción. Si la ley\nlocal aplicable impide que su tribunal local aplique la ley de California para\nresolver las disputas, estas se regirán por las leyes locales aplicables de su\npaís, estado o lugar de residencia. 
Si usará los Recursos de AlphaFold 3 en\nnombre de una organización gubernamental que no sea del gobierno federal de\nEstados Unidos (donde se aplican las disposiciones mencionadas anteriormente en\nla medida en que la ley federal lo permita), estas Condiciones no se aplicarán\nen relación con la ley aplicable y los tribunales.\n\nDada la naturaleza de la investigación científica, el incumplimiento de las\nCondiciones puede tardar algún tiempo en hacerse evidente. Para protegerlo a\nusted, y proteger a Google y a los Recursos de AlphaFold 3, en la medida en que\nlo permita la ley aplicable, usted acepta lo siguiente:\n\n1.  Cualquier demanda legal relacionada con las Condiciones o los Recursos de\n    AlphaFold 3 podrá iniciarse hasta la fecha posterior de lo siguiente:\n    1.  la fecha límite que establece la ley aplicable para interponer una\n        demanda legal; o\n    2.  dos años a partir de la fecha en que usted o Google (según corresponda)\n        tomaron conocimiento, o debieron haber tomado conocimiento\n        razonablemente, de los hechos que dieron lugar a dicha demanda, y\n2.  Ni usted ni Google alegarán prescripción, caducidad, demora, renuncia o\n    similares para intentar impedir una acción presentada dentro de ese período.\n\nTodos los derechos que no se le otorguen específica y expresamente en las\nCondiciones quedan reservados a Google. Ninguna demora, omisión o acto de Google\nen el ejercicio de cualquier derecho o recurso se considerará una renuncia de\ncualquier incumplimiento de las Condiciones y Google se reserva expresamente\ntodos los derechos y recursos disponibles según las Condiciones, la ley, por\nacuerdo implícito o de cualquier otro modo, lo que incluye el recurso de medida\ncautelar contra cualquier amenaza o hecho de infracción de las Condiciones sin\nla necesidad de mostrar daños reales.\n"
  },
  {
    "path": "legal/WEIGHTS_TERMS_OF_USE-Francais-Canada.md",
    "content": "# CONDITIONS D'UTILISATION DES PARAMÈTRES DU MODÈLE ALPHAFOLD 3\n\nDernière modification: 2024-11-09\n\n[AlphaFold 3](https://blog.google/technology/ai/google-deepmind-isomorphic-alphafold-3-ai-model/)\nest un modèle d'IA développé par [Google DeepMind](https://deepmind.google/) et\n[Isomorphic Labs](https://www.isomorphiclabs.com/). Il génère des prédictions de\nstructures 3D de molécules biologiques en fournissant la confiance du modèle\npour les prédictions de structures. Pour certaines utilisations non\ncommerciales, nous mettons gratuitement à disposition les paramètres du modèle\nentraîné et les résultats générés à l'aide de ces paramètres, conformément aux\nprésentes conditions d'utilisation et à la\n[Politique d'utilisation interdite des paramètres du modèle AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Francais-Canada.md).\n\n**Éléments clés à connaître lors de l'utilisation des paramètres du modèle\nAlphaFold 3 et les résultats**\n\n1.  Les paramètres du modèle AlphaFold 3 et les résultats sont **uniquement**\n    disponibles pour un usage non commercial par des organisations non\n    commerciales ou au nom de celles-ci (*c.-à-d.* universités, organismes sans\n    but lucratif, instituts de recherche et organismes éducatifs,\n    journalistiques et gouvernementaux). Si vous êtes un chercheur affilié à une\n    organisation non commerciale, **à la condition que vous ne soyez pas une\n    organisation commerciale ou que vous n'agissiez pas au nom d'une\n    organisation commerciale**, cela signifie que vous pouvez les utiliser pour\n    votre recherche affiliée non commerciale.\n2.  Vous **ne devez pas** utiliser ni permettre à d'autres personnes d'utiliser:\n    1.  les paramètres du modèle AlphaFold 3 ou les résultats dans le cadre de\n        **toute activité commerciale, y compris la recherche au nom\n        d'organisations commerciales**; ou\n    2.  
les résultats d'AlphaFold 3 pour **entraîner des modèles d'apprentissage\n        automatique** ou une technologie connexe de **prédiction de structures\n        biomoléculaires** semblable à AlphaFold 3.\n3.  Vous ***ne devez pas* publier ni partager les paramètres du modèle AlphaFold\n    3**, sauf si vous les partagez au sein de votre organisation conformément\n    aux présentes Conditions.\n4.  Vous ***pouvez* publier, partager ou adapter les *résultats* d'AlphaFold 3**\n    conformément aux présentes Conditions, y compris à l'exigence de fournir un\n    préavis clair de toute modification que vous apportez et à celle stipulant\n    que l'utilisation continue des résultats et des œuvres dérivées d'AlphaFold\n    3 est soumise aux\n    [Conditions d'utilisation des résultats d'AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\nEn utilisant, reproduisant, modifiant, exécutant, distribuant ou affichant toute\nportion ou tout élément des Paramètres du modèle (comme défini ci-dessous) ou en\nacceptant autrement les conditions de ce contrat, vous acceptez d'être lié par\n(1) ces conditions d'utilisation et (2) la\n[Politique d'utilisation interdite des paramètres du modèle AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Francais-Canada.md)\nqui est incorporée aux présentes par référence (collectivement, les « Conditions\n»), dans chaque cas (a) tel que modifié de temps à autre conformément aux\nConditions et (b) entre vous et (i) si vous êtes d'un pays de l'Espace\néconomique européen ou de la Suisse, Google Ireland Limited, ou (ii) autrement,\nGoogle LLC.\n\nVous confirmez que vous êtes autorisé, soit explicitement ou implicitement, à\naccepter les Conditions et que vous les acceptez, en tant qu'employé ou\nautrement, au nom de votre organisation.\n\nVeuillez lire ces Conditions attentivement. 
Elles établissent ce à quoi vous\npouvez vous attendre de nous lorsque vous accédez aux Éléments d'AlphaFold 3 et\nque vous les utilisez (comme défini ci-dessous), et ce à quoi Google s'attend de\nvous. Par « **vous** », nous entendons l’individu ou l'organisation qui utilise\nles Éléments d'AlphaFold 3. Par « **nous** », « **notre** » ou « **Google** »,\nnous entendons les entités qui appartiennent au groupe d'entreprises Google,\nc'est-à-dire Google LLC et ses filiales.\n\n## 1. Définitions clés\n\nTelle qu’utilisées dans ces Conditions: \\\n« **AlphaFold 3** » désigne: (a) le code source d'AlphaFold 3 rendu accessible\n[ici](https://github.com/google-deepmind/alphafold3/) et sous les conditions de\nla licence « Creative Commons Attribution-NonCommercial-Sharealike 4.0\nInternational (CC-BY-NC-SA 4.0) » ainsi que tout code source d'œuvres dérivées\net (b) les Paramètres du modèle.\n\n« **Éléments d'AlphaFold 3** » signifie les Paramètres du modèle et les\nRésultats.\n\n« **Distribution** » ou « **Distribuer** » signifient toute transmission,\npublication ou tout autre partage de Résultats effectués publiquement ou avec\nune autre personne.\n\n« **Paramètres du modèle** » désigne les poids du modèle entrainé et paramètres\nmis à disposition par Google pour les organisations (à sa seule discrétion) pour\nleur utilisation conformément à ces Conditions, ainsi que (a) les modifications\napportées à ces poids et paramètres (b) les travaux basés sur ces poids et\nparamètres ou (c) tout autre code ou tout autre modèle d'apprentissage\nautomatique qui intègre, en totalité ou en partie, ces poids et paramètres.\n\n« **Résultats** » désigne les prédictions de structures et toutes les\ninformations auxiliaires et connexes fournies par AlphaFold 3 ou utilisant les\nParamètres du modèle ainsi que toutes les représentations visuelles, les\nprédictions informatiques, les descriptions, les modifications, les copies ou\nles adaptations qui sont substantiellement dérivées des 
Résultats.\n\n« **Y compris** » signifie « **y compris, sans s'y limiter** ».\n\n## 2. Accéder aux Éléments d'AlphaFold 3 et les utiliser\n\nSous réserve de votre conformité aux Conditions, y compris la\n[Politique d'utilisation interdite des paramètres du modèle AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Francais-Canada.md),\nvous pouvez accéder aux Éléments d'AlphaFold 3, les utiliser et les modifier, et\nDistribuer les Résultats comme indiqué dans ces Conditions. Nous vous accordons\nune licence non exclusive, libre de redevances, révocable, non transférable et\nnon susceptible de faire l'objet d'une sous-licence (sauf si expressément permis\ndans ces Conditions) sur tout droit de propriété intellectuelle que nous\ndétenons sur les Éléments d'AlphaFold, dans la mesure nécessaire à ces fins.\nAfin de vérifier votre accès à AlphaFold 3 et votre utilisation de celui-ci,\nnous pouvons de temps à autre vous demander des informations supplémentaires, y\ncompris la validation de votre nom, de votre organisation et d'autres\ninformations d'identification.\n\nEn accédant aux Éléments d'AlphaFold 3, en les utilisant ou en les modifiant, en\nDistribuant des Résultats ou en demandant l'accès aux Paramètres du modèle, vous\ndéclarez et garantissez que (a) vous avez les pleins pouvoirs et l'autorité\nnécessaire pour accepter ces Conditions (y compris avoir l'âge de consentement\nrequis) (b) Google n'a jamais précédemment résilié votre accès à AlphaFold 3 ni\nvotre droit de l'utiliser (y compris au moyen du\n[Serveur AlphaFold](https://alphafoldserver.com/about)) en raison de votre\nviolation des conditions d'utilisation applicables (c) l'acceptation de ces\nConditions ou l'exécution de vos droits et obligations en vertu de ces\nConditions ne violera aucun contrat que vous avez avec un tiers ni aucun droit\nd'un tiers (d) toute information que vous fournissez à Google en relation avec\nAlphaFold 3, y compris (le cas 
échéant) pour demander l'accès aux Paramètres du\nmodèle, est correcte et à jour, et (e) vous n'êtes pas (i) résident d'un pays\nsoumis à un embargo (ii) habituellement résident d'un pays sous embargo\naméricain ni (iii) autrement soumis à une interdiction, par les contrôles\nd'exportation et les programmes de sanctions applicables, d'accéder aux Éléments\nd'AlphaFold 3, de les utiliser ou de les modifier.\n\nSi vous choisissez de donner des commentaires à Google, comme des suggestions\npour améliorer AlphaFold 3, vous vous engagez à ce que ces informations soient\nnon confidentielles et non propriétaires, et Google pourra agir en fonction de\nvos commentaires sans aucune obligation envers vous.\n\n## 3. Restrictions d'utilisation\n\nVous ne devez pas utiliser les Éléments d'AlphaFold 3:\n\n1.  pour les utilisations restreintes énoncées dans la\n    [Politique d'utilisation interdite des paramètres du modèle AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Francais-Canada.md);\n2.  en violation des lois et règlements applicables.\n\nDans toute la mesure permise par la loi et sans limiter aucun de nos autres\ndroits, Google se réserve le droit de révoquer votre droit d'utilisation et\n(dans la mesure du possible) de restreindre l'utilisation de tout Élément\nd'AlphaFold 3 que Google estime raisonnablement être en violation de ces\nConditions.\n\n## 4. Résultats générés\n\nBien que vous deviez respecter ces Conditions lors de l'utilisation des Éléments\nd'AlphaFold 3, nous ne revendiquerons pas la propriété des Résultats d'origine\nque vous générez en utilisant AlphaFold 3. Cependant, vous reconnaissez\nqu'AlphaFold 3 peut générer les mêmes Résultats ou des Résultats semblables pour\nplusieurs utilisateurs, y compris Google, et nous nous réservons tous nos droits\nà cet égard.\n\n## 5. 
Modifications aux Éléments d'AlphaFold 3 ou aux présentes Conditions\n\nGoogle peut ajouter ou retirer des fonctions ou fonctionnalités des Éléments\nd'AlphaFold 3 à tout moment et peut cesser d'offrir l'accès aux Éléments\nd'AlphaFold 3.\n\nGoogle peut mettre à jour ces Conditions et le mécanisme d'accès aux Paramètres\ndu modèle à tout moment. Nous allons publier toute modification apportée aux\nConditions\n[dans le référentiel GitHub d'AlphaFold 3](https://github.com/google-deepmind/alphafold3).\nLes modifications entreront généralement en vigueur 14 jours après leur\npublication. Cependant, les modifications concernant la fonctionnalité ou celles\napportées pour des raisons juridiques entreront en vigueur immédiatement.\n\nVous devriez revoir les Conditions chaque fois que nous les mettons à jour ou\nque vous utilisez les Éléments d'AlphaFold 3. Si vous n'acceptez pas les\nmodifications apportées aux Conditions, vous devez cesser d'utiliser les\nÉléments d'AlphaFold 3 immédiatement.\n\n## 6. Suspendre ou résilier votre droit d'utiliser les Éléments d'AlphaFold 3\n\nGoogle peut à tout moment suspendre ou résilier votre droit d'utiliser les\nÉléments d'AlphaFold 3 et, le cas échéant, d'y accéder pour différentes raisons,\nnotamment votre manquement à respecter entièrement les présentes Conditions. Si\nGoogle suspend ou résilie votre droit d'accéder aux Éléments d'AlphaFold 3 ou de\nles utiliser, vous devez immédiatement supprimer toutes les copies des Éléments\nd'AlphaFold 3 en votre possession ou sous votre contrôle et cesser de les\nutiliser et de les Distribuer, et il vous est interdit d'utiliser les Éléments\nd'AlphaFold 3, y compris en soumettant une demande pour utiliser les Paramètres\ndu modèle. 
Google s'efforcera de vous donner un préavis raisonnable avant toute\nsuspension ou résiliation, mais aucun avis ni avertissement préalable ne sera\ndonné si la suspension ou la résiliation est due à votre manquement à respecter\nentièrement les présentes Conditions ou à d'autres motifs sérieux.\n\nBien entendu, vous êtes toujours libre de cesser d'utiliser les Éléments\nd'AlphaFold 3. Si vous cessez de les utiliser, nous aimerions savoir pourquoi (à\nl'adresse alphafold@google.com) afin de pouvoir continuer à améliorer nos\ntechnologies.\n\n## 7. Confidentialité\n\nVous acceptez de ne pas divulguer ni rendre disponibles les renseignements\nconfidentiels de Google à quiconque sans notre consentement écrit préalable. «\n**Renseignements confidentiels de Google** » désigne (a) les Paramètres du\nmodèle AlphaFold 3 et tous les logiciels, la technologie et la documentation en\nlien avec AlphaFold 3, excepté le code source d'AlphaFold 3, et (b) toute autre\ninformation mise à disposition par Google qui est marquée comme confidentielle\nou qui serait normalement considérée comme confidentielle dans les circonstances\ndans lesquelles elle est présentée. Les Renseignements confidentiels de Google\nn'incluent pas (a) les informations que vous connaissiez déjà avant d'accéder\naux Éléments d'AlphaFold 3 ou de les utiliser (y compris au moyen du\n[Serveur AlphaFold](https://alphafoldserver.com/about)) (b) qui deviennent\npubliques sans que vous en soyez responsable (par exemple, par votre violation\ndes Conditions) (c) qui ont été développées indépendamment par vous sans\nréférence aux Renseignements confidentiels de Google ou (d) qui vous ont été\nlégalement fournies par un tiers (sans violation des Conditions par vous-même ou\npar le tiers).\n\n## 8. 
Clauses de non-responsabilité\n\nRien dans les Conditions ne restreint les droits qui ne peuvent pas être\nrestreints en vertu de la loi applicable ni ne limite les responsabilités de\nGoogle, sauf si cela est permis par la loi applicable.\n\nAlphaFold 3 et les Résultats sont fournis « tels quels », sans garantie ni\ncondition de quelque nature que ce soit, explicite ou implicite, y compris toute\ngarantie ou condition de titre, d'absence de violation, de qualité marchande ou\nd'adéquation avec un usage particulier. Vous êtes seul responsable de déterminer\nla légitimité de l'utilisation d'AlphaFold 3 ou celle de l'utilisation et de la\ndistribution des Résultats, et vous assumez tous les risques liés à une telle\nutilisation ou distribution ainsi qu'à l'exercice de vos droits et obligations\nen vertu de ces Conditions. Vous et toute personne avec qui vous partagez des\nRésultats êtes les seuls responsables de ces utilisations et de celles qui\ns’ensuivent.\n\nLes Résultats sont des prédictions avec des niveaux de confiance variables et\ndoivent être interprétés avec prudence. Faites preuve de discernement avant de\nvous fier à AlphaFold 3, de le publier, de le télécharger ou de l’utiliser d'une\nautre manière.\n\nAlphaFold 3 et les Résultats sont uniquement destinés à la modélisation\nthéorique. Ils ne sont pas prévus, validés, ni approuvés pour une utilisation\nclinique. Vous ne devez pas utiliser AlphaFold 3 ni les Résultats à des fins\ncliniques ni les considérer comme des conseils médicaux ou professionnels. Tout\ncontenu concernant ces sujets est fourni à titre informatif uniquement et ne\nremplace pas les conseils d'un professionnel qualifié.\n\n## 9. 
Responsabilités\n\nDans la mesure permise par la loi applicable, vous indemniserez Google et ses\nadministrateurs, dirigeants, employés et sous-traitants pour toutes poursuites\njudiciaires intentées par des tiers (y compris des actions menées par des\nautorités gouvernementales) découlant de ou en rapport avec votre utilisation\nillégale des Éléments d'AlphaFold 3 ou à votre violation des présentes\nConditions. Cette indemnité couvre toute responsabilité ou charge financière\nrésultant de réclamations, de pertes, de dommages, de jugements, d'amendes, de\ndébours et de frais juridiques, sauf dans la mesure où une responsabilité ou une\ncharge financière est causée par une violation, une négligence ou une inconduite\nintentionnelle de Google. Si vous êtes légalement exempté de certaines\nresponsabilités, y compris l'indemnisation, alors ces responsabilités ne\ns'appliquent pas à vous en vertu des présentes Conditions.\n\nGoogle n'est pas responsable, en aucun cas, des dommages-intérêts indirects,\nspéciaux, accessoires, exemplaires, consécutifs ou punitifs ni des pertes de\nprofits de quelque nature que ce soit en rapport avec les Conditions ou les\nÉléments d'AlphaFold 3, même si Google a été informée de la possibilité de tels\ndommages. L'obligation globale et totale de Google pour toutes les réclamations\ndécoulant des Conditions ou des Éléments d'AlphaFold 3 ou en lien avec ceux-ci,\ny compris pour sa propre négligence, est limitée à 500,00 USD.\n\n## 10. Divers\n\nSelon la loi, vous avez certains droits qui ne peuvent pas être limités par un\ncontrat tel que les Conditions. 
Les présentes Conditions ne visent aucunement à\nrestreindre ces droits.\n\nLes Conditions constituent l'intégralité de notre contrat concernant votre\nutilisation des Éléments d'AlphaFold 3 et remplacent tous les contrats\nantérieurs ou contemporains sur ce sujet.\n\nSi une disposition particulière des présentes Conditions s'avère inapplicable,\nle reste des conditions restera en vigueur.\n\n## 11. Contestations\n\nLes lois de la Californie régiront toutes les contestations découlant de ou en\nrapport avec ces Conditions ou en lien avec les Éléments d'AlphaFold 3. Ces\ncontestations seront résolues exclusivement par les tribunaux fédéraux ou\nétatiques du comté de Santa Clara, en Californie, aux États-Unis, et vous et\nGoogle consentez à la compétence territoriale de ces tribunaux. Dans la mesure\noù la loi locale applicable s'oppose à ce que certaines contestations soient\nrésolues devant un tribunal de la Californie, vous et Google pouvez les\nsoumettre à vos tribunaux locaux. Si la loi locale applicable s'oppose à ce que\nvotre tribunal local applique la loi californienne pour résoudre ces\ncontestations, elles seront régies par les lois locales applicables de votre\npays, de votre État ou de votre autre lieu de résidence. Si vous utilisez les\nÉléments d'AlphaFold 3 au nom d'une organisation gouvernementale autre que les\norganisations gouvernementales fédérales américaines (où les dispositions\nprécédentes s'appliquent dans la mesure permise par la loi fédérale), ces\nConditions seront silencieuses en ce qui concerne la loi applicable et les\ntribunaux.\n\nConsidérant la nature de la recherche scientifique, il peut s'écouler un certain\ntemps avant que toute violation des présentes Conditions devienne évidente. \\\nDans la mesure permise par la loi applicable, pour vous protéger, Google et les\nÉléments d'AlphaFold 3, vous acceptez que:\n\n1.  
toute réclamation légale liée aux présentes Conditions ou aux Éléments\n    d'AlphaFold 3 peut être intentée jusqu'à la date la plus tardive entre:\n    1.  la date limite prévue par la loi applicable pour intenter la réclamation\n        légale; ou\n    2.  deux années à partir de la date à laquelle vous ou Google (selon le cas)\n        avez pris connaissance ou auriez dû raisonnablement prendre connaissance\n        des faits à l'origine de cette réclamation; et\n2.  vous n'invoquerez pas la limitation, la prescription, le retard, la\n    renonciation ou des arguments semblables pour tenter de faire obstacle à une\n    action intentée dans ce délai et Google non plus.\n\nTous les droits qui ne vous sont pas précisément et expressément accordés par\nles présentes Conditions sont réservés à Google. Aucun retard, acte ni aucune\nomission de la part de Google dans l'exercice d'un droit ou d'un recours ne sera\nconsidéré comme une renonciation à une violation des Conditions, et Google se\nréserve expressément tous les droits et recours disponibles en vertu des\nConditions ou de la loi, en équité ou autrement, y compris le recours à une\ninjonction contre toute menace de violation ou violation réelle des Conditions\nsans qu'il soit nécessaire de prouver des dommages réels.\n"
  },
  {
    "path": "legal/WEIGHTS_TERMS_OF_USE-Portugues-Brazil.md",
    "content": "# TERMOS DE USO DOS PARÂMETROS DO MODELO ALPHAFOLD 3\n\nÚltima modificação: 2024-11-09\n\nO\n[AlphaFold 3](https://blog.google/technology/ai/google-deepmind-isomorphic-alphafold-3-ai-model/)\né um modelo de IA desenvolvido pelo [Google DeepMind](https://deepmind.google/)\ne pela [Isomorphic Labs](https://www.isomorphiclabs.com/). Ele gera previsões\nsobre a estrutura 3D de moléculas biológicas, apresentando a confiança do\nmodelo. Disponibilizamos os parâmetros do modelo treinado e as saídas geradas\npor ele sem custo financeiro para determinados usos não comerciais, de acordo\ncom estes Termos de Uso e com a\n[Política de uso proibido dos parâmetros do modelo AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Portugues-Brazil.md).\n\n**Observações importantes sobre o uso dos parâmetros e das saídas do modelo\nAlphaFold 3**\n\n1.  Os parâmetros e as saídas do modelo AlphaFold 3 só estão disponíveis para\n    uso não comercial por organizações não comerciais ou em nome delas (*por\n    exemplo*, universidades, organizações sem fins lucrativos, institutos de\n    pesquisa e órgãos governamentais, educacionais e de notícias). Se você for\n    um pesquisador afiliado a uma organização não comercial, você tem permissão\n    para usar esses recursos em sua pesquisa afiliada a organizações sem fins\n    lucrativos, desde que você não seja uma organização comercial nem esteja\n    agindo em nome de uma.\n2.  Não use nem permita que outras pessoas usem:\n    1.  os parâmetros ou as saídas do modelo AlphaFold 3 em relação a qualquer\n        atividade comercial, incluindo a pesquisa em nome de organizações\n        comerciais; ou\n    2.  a saída do AlphaFold 3 para treinar modelos de aprendizado de máquina ou\n        tecnologia relacionada na previsão de estrutura biomolecular semelhante\n        ao AlphaFold 3.\n3.  
Você *não tem permissão* para publicar ou compartilhar os parâmetros do\n    modelo AlphaFold 3, exceto compartilhar dentro da sua organização de acordo\n    com estes Termos.\n4.  Você *tem permissão* para publicar, compartilhar e adaptar as *saídas* do\n    AlphaFold 3 de acordo com estes Termos, incluindo os requisitos de oferecer\n    aviso claro de quaisquer modificações e de que o uso contínuo das saídas e\n    derivados do modelo estão sujeitos aos\n    [Termos de Uso das saídas do AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md).\n\nAo usar, reproduzir, modificar, realizar, distribuir ou exibir qualquer parte ou\nelemento dos Parâmetros do modelo (conforme definido abaixo) ou aceitar de outra\nforma os termos deste contrato, você concorda em se vincular (1) a estes Termos\nde Uso e (2) à\n[Política de uso proibido dos parâmetros do modelo AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Portugues-Brazil.md),\nincorporada aqui como referência (em conjunto, os \"**Termos**\"), em cada caso\n(a) conforme modificado periodicamente de acordo com os Termos e (b) entre você\ne (i), se você for de um país no Espaço Econômico Europeu ou da Suíça, a Google\nIreland Limited ou (ii), caso contrário, a Google LLC.\n\nVocê confirma que tem autorização explícita ou implícita para celebrar, e está\ncelebrando, estes Termos como funcionário ou de outro modo em nome da sua\norganização.\n\nLeia estes Termos com atenção. Eles definem o que você pode esperar de nós ao\nacessar e usar os Recursos do AlphaFold 3 (conforme definido abaixo) e o que o\nGoogle espera de você. \"**Você**\" significa o indivíduo ou a organização que\nestá usando os Recursos do AlphaFold 3. \"**Nós**\", \"**nos**\" ou \"**Google**\"\nsignificam as entidades que pertencem ao grupo de empresas do Google, ou seja, a\nGoogle LLC e suas afiliadas.\n\n## 1. 
Principais definições\n\nConforme usado nestes Termos:\n\n\"**AlphaFold 3**\" significa: (a) o código-fonte do AlphaFold 3 disponível\n[neste link](https://github.com/google-deepmind/alphafold3/) e licenciado nos\ntermos da licença Creative Commons Attribution-NonCommercial-Sharealike 4.0\nInternational (CC-BY-NC-SA 4.0), bem como qualquer código-fonte derivado, e (b)\nParâmetros do modelo.\n\n\"**Recursos do AlphaFold 3**\" significam as Saídas e os Parâmetros do modelo.\n\n\"**Distribuição**\" ou \"**Distribuir**\" significam qualquer transmissão,\npublicação ou outra forma de compartilhamento das Saídas publicamente ou com\nqualquer outra pessoa.\n\n\"**Parâmetros do modelo**\" significam os pesos e os parâmetros do modelo\ntreinado disponibilizados pelo Google às organizações (a critério próprio) para\nuso de acordo com estes Termos, com (a) modificações nesses pesos e parâmetros,\ncom (b) trabalhos baseados nesses pesos e parâmetros ou (c) com outros códigos\nou modelos de aprendizado de máquina que incorporam esses pesos e parâmetros na\níntegra ou em partes.\n\n\"**Saída**\" significa as previsões de estrutura e todas as informações\nadicionais e relacionadas que são fornecidas pelo AlphaFold 3 ou usam os\nParâmetros do modelo, com quaisquer representações visuais, previsões\ncomputacionais, descrições, modificações, cópias ou adaptações derivadas\nconsideravelmente da Saída.\n\n\"**Incluindo**\" significa \"**incluindo, sem limitação**\".\n\n## 2. Acesso e uso dos Recursos do AlphaFold 3\n\nSujeito à sua compliance com os Termos, incluindo a\n[Política de uso proibido do AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Portugues-Brazil.md),\nvocê pode acessar, usar e modificar os Recursos do AlphaFold 3 e Distribuir as\nSaídas conforme definido nestes Termos. 
Concedemos a você uma licença não\nexclusiva, livre de royalties, revogável, intransferível e não sublicenciável\n(exceto conforme expressamente permitido nestes Termos) para todos os nossos\ndireitos de propriedade intelectual dos Recursos do AlphaFold 3 na medida\nnecessária para esses fins. Para verificar seu acesso e uso do AlphaFold 3,\npodemos solicitar informações adicionais periodicamente, incluindo a verificação\ndo seu nome, organização e outras informações de identificação.\n\nAo acessar, usar ou modificar os Recursos do AlphaFold 3, Distribuir a Saída ou\nsolicitar acesso aos Parâmetros do modelo, você declara e garante que (a) tem\ntotal capacidade legal para celebrar estes Termos (incluindo a idade mínima de\nconsentimento), (b) o Google nunca rescindiu seu acesso e direito de usar o\nAlphaFold 3 (incluindo conforme disponibilizado pelo\n[Servidor do AlphaFold](https://alphafoldserver.com/about)) devido à sua\nviolação dos Termos de Uso relevantes, (c) celebrar ou exercer seus direitos e\nobrigações de acordo com estes Termos não violará nenhum contrato firmado entre\nvocê e um terceiro ou quaisquer direitos de terceiros, (d) quaisquer informações\nque você fornecer ao Google em relação ao AlphaFold 3, incluindo solicitar\nacesso aos Parâmetros do modelo (quando aplicável), são verdadeiras e atuais, e\n(e) você (i) não é residente de um país embargado, (ii) não é residente\nordinário de um país embargado pelos EUA ou (iii) não tem nenhuma outra\nproibição de acessar, usar ou modificar os Recursos do AlphaFold 3 pelos\nprogramas de sanções e controles de exportação aplicáveis.\n\nAo optar por dar feedback ao Google, como sugestões para melhorar o AlphaFold 3,\nvocê assume que essas informações não são confidenciais nem reservadas, e\npoderemos agir de acordo com seu feedback sem qualquer compromisso com você.\n\n## 3. Restrições de uso\n\nVocê não tem permissão para usar qualquer Recurso do AlphaFold 3:\n\n1.  
para os usos restritos estabelecidos na\n    [Política de uso proibido dos Parâmetros do modelo AlphaFold 3](https://github.com/google-deepmind/alphafold3/blob/main/legal/WEIGHTS_PROHIBITED_USE_POLICY-Portugues-Brazil.md);\n    ou\n2.  em violação das leis e regulamentações aplicáveis.\n\nAté o limite permitido pela legislação e sem limitação de quaisquer outros\ndireitos, o Google reserva o direito de revogar e (até onde possível) restringir\nseu uso de qualquer Recurso do AlphaFold 3 que acreditamos razoavelmente violar\nestes Termos.\n\n## 4. Saída gerada\n\nEmbora você precise cumprir com estes Termos ao usar os Recursos do AlphaFold 3,\nnão reivindicaremos propriedade da Saída original que você gerar usando o\nAlphaFold 3. No entanto, você reconhece que o AlphaFold 3 pode gerar uma Saída\nigual ou semelhante para vários usuários, incluindo o Google, e reservamos todos\nos direitos nesse sentido.\n\n## 5. Mudanças nos Recursos do AlphaFold 3 ou nestes Termos\n\nO Google pode adicionar ou remover funcionalidades ou funções dos Recursos do\nAlphaFold 3 a qualquer momento e parar de oferecer acesso a elas completamente.\n\nO Google pode atualizar estes Termos e o mecanismo de acesso aos Parâmetros do\nmodelo a qualquer momento. Quaisquer modificações nestes Termos serão postadas\n[no repositório GitHub do AlphaFold 3](https://github.com/google-deepmind/alphafold3).\nGeralmente, as alterações entrarão em vigor 14 dias após a postagem. No entanto,\nas alterações relacionadas à funcionalidade ou feitas por motivos jurídicos\nserão aplicadas imediatamente.\n\nConsulte os Termos sempre que forem atualizados ou você usar os Recursos do\nAlphaFold 3. Se você não concordar com quaisquer modificações nos Termos, pare\nde usar os Recursos do AlphaFold 3 imediatamente.\n\n## 6. 
Suspensão ou encerramento do seu direito de usar os Recursos do AlphaFold 3\n\nO Google pode suspender ou encerrar a qualquer momento seu direito de usar e,\nconforme aplicável, acessar os Recursos do AlphaFold 3 devido ao não cumprimento\ndos Termos, entre outros motivos. Se o Google suspender ou encerrar seu direito\nde acessar ou usar os Recursos do AlphaFold 3, você precisará excluir e parar de\nusar e Distribuir imediatamente todas as cópias dos Recursos do AlphaFold 3 em\nsua posse ou controle. Você não poderá usar os Recursos do AlphaFold 3,\nincluindo o envio de um aplicativo para usar os Parâmetros do modelo. O Google\nfará o possível para fornecer aviso prévio razoável antes de qualquer suspensão\nou encerramento, mas não daremos nenhum aviso ou alerta com antecedência se a\nsuspensão ou o encerramento for por não obedecer totalmente aos Termos ou outras\njustificativas graves.\n\nVocê pode parar de usar os Recursos do AlphaFold 3 a qualquer momento. Nesse\ncaso, queremos saber o motivo (via alphafold@google.com) para continuarmos\nmelhorando nossas tecnologias.\n\n## 7. Confidencialidade\n\nVocê concorda em não divulgar nem disponibilizar Informações confidenciais do\nGoogle a qualquer pessoa sem nosso consentimento prévio por escrito.\n\"**Informações confidenciais do Google**\" significam (a) os Parâmetros do modelo\ne todo software, tecnologia e documentação associados ao AlphaFold 3, exceto\npara o código-fonte do AlphaFold 3, e (b) quaisquer outras informações\ndisponibilizadas pelo Google que foram marcadas como confidenciais ou que seriam\nnormalmente consideradas assim nas circunstâncias em que são apresentadas. 
As\nInformações confidenciais do Google não incluem (a) informações que você já\nsabia antes do seu acesso ou uso dos Recursos do AlphaFold 3 (incluindo pelo\n[Servidor do AlphaFold](https://alphafoldserver.com/about)), (b) que se tornaram\npúblicas sem sua culpa (por exemplo, sua violação dos Termos), (c) que foram\ndesenvolvidas de maneira independente por você sem referência às Informações\nconfidenciais do Google ou (d) foram fornecidas legalmente a você por um\nterceiro (sem que você nem o terceiro violassem os Termos).\n\n## 8. Exoneração de responsabilidade\n\nOs Termos não restringem quaisquer direitos que não possam ser restritos de\nacordo com a legislação aplicável nem limitam as responsabilidades do Google,\nexceto conforme permitido pela legislação aplicável.\n\n**O AlphaFold 3 e as Saídas são fornecidos no estado em que se encontram, sem\ngarantias ou condições de qualquer tipo, sejam explícitas ou implícitas,\nincluindo quaisquer garantias ou condições de título, comercialidade, adequação\npara uma finalidade específica e não violação. Você é a única pessoa responsável\npor determinar se o uso do AlphaFold 3, ou uso/distribuição das Saídas, é\nadequado e assume qualquer e todo risco associado a esse uso ou distribuição e\nao exercício dos seus direitos e obrigações de acordo com estes Termos. Você e\nqualquer pessoa com quem compartilhar as Saídas são exclusivamente responsáveis\npor elas e pelos usos subsequentes delas.**\n\n**As Saídas são previsões com níveis variados de confiança e devem ser\ninterpretadas com cuidado. Tenha cautela antes de confiar, publicar, baixar ou\nusar de outra forma o AlphaFold 3.**\n\n**O AlphaFold 3 e as Saídas servem apenas para modelagem teórica. Eles não são\ndestinados, validados nem aprovados para uso clínico. Não os use para\nfinalidades clínicas nem conte com eles para aconselhamento médico ou de outra\nnatureza. 
Todo conteúdo sobre esses assuntos é fornecido somente para fins\ninformativos e não substitui a orientação de um profissional qualificado.**\n\n## 9. Responsabilidades\n\nNa medida permitida pela lei, você indenizará o Google e os diretores,\nexecutivos, funcionários e prestadores de serviço dele por qualquer processo\njudicial de terceiros (incluindo ações de órgãos do governo) decorrente ou\nrelacionado ao uso ilegal dos Recursos do AlphaFold 3 ou a violações dos Termos.\nEssa indenização cobre qualquer responsabilidade ou despesa decorrente de ações\njudiciais, perdas, danos, julgamentos, multas, custos de litígios e honorários\njurídicos, exceto se a responsabilidade ou despesa for causada por violação,\nnegligência ou má conduta intencional do Google. Se você for passível de isenção\nlegal de certas responsabilidades, incluindo indenização, essas\nresponsabilidades não se aplicarão a você de acordo com os Termos.\n\nEm hipótese alguma o Google será responsável por quaisquer danos indiretos,\nespeciais, incidentais, exemplares, emergentes ou punitivos ou por perdas de\nlucros de qualquer tipo em relação aos Termos ou aos Recursos do AlphaFold 3,\nmesmo se o Google tiver sido advertido da possibilidade de tais danos. A\nresponsabilidade agregada total do Google para todas as ações judiciais\ndecorrentes de ou relacionadas aos Termos ou aos Recursos do AlphaFold 3,\nincluindo pela nossa negligência, é limitada a US$ 500.\n\n## 10. Disposições gerais\n\nPor lei, você tem certos direitos que não podem ser limitados por um contrato\ncomo os Termos. Os Termos não têm, de forma alguma, o objetivo de restringir\nesses direitos.\n\nOs Termos constituem a integralidade do nosso contrato relacionado ao seu uso\ndos Recursos do AlphaFold 3 e substituem quaisquer contratos anteriores ou\ncontemporâneos sobre esse assunto.\n\nSe uma disposição específica dos Termos não for aplicável, o saldo dos Termos\npermanecerá vigente.\n\n## 11. 
Disputas\n\nAs leis da Califórnia vão reger todas as disputas que surgirem com relação aos\nTermos ou em relação aos Recursos do AlphaFold 3. Essas disputas serão\nresolvidas exclusivamente nos tribunais federais ou estaduais do condado de\nSanta Clara, Califórnia, EUA, e você e o Google concordam com a jurisdição\npessoal nesses tribunais. Se a legislação local aplicável impedir que alguma\ndisputa seja tratada em um tribunal na Califórnia, você e o Google podem entrar\ncom a petição no seu foro local. Da mesma forma, se a legislação local aplicável\nimpedir que o tribunal local aplique a lei da Califórnia para resolver essas\ndisputas, elas serão regidas pelas leis do seu país, estado ou outro local de\nresidência. Se você usar os Recursos do AlphaFold 3 em nome de uma organização\ngovernamental que não seja do governo federal dos EUA (onde as disposições acima\nse aplicam até onde permitido pela legislação federal), estes Termos não se\naplicarão quanto à legislação aplicável e aos tribunais.\n\nConsiderando a natureza das pesquisas científicas, pode levar algum tempo para\nqualquer violação dos Termos se tornar aparente. Para proteger você, o Google e\nos Recursos do AlphaFold 3, até onde permitido pela legislação aplicável, você\nconcorda que:\n\n1.  qualquer ação judicial relacionada aos Termos ou Recursos do AlphaFold 3\n    pode ser iniciada até o que ocorrer por último:\n    1.  a data-limite de acordo com a legislação aplicável para iniciar a ação\n        judicial; ou\n    2.  dois anos após a data em que você ou o Google (conforme aplicável) tomou\n        conhecimento, ou deve ter tomado conhecimento de forma razoável, dos\n        fatos que deram origem a essa ação; e\n2.  
você não alegará limitação, prazo de prescrição, atraso, renúncia ou\n    semelhantes para tentar impedir uma ação registrada nesse período, e o\n    Google também não.\n\nTodos os direitos que não forem concedidos a você de maneira específica e\nexplícita pelos Termos são reservados ao Google. Nenhum atraso, ação ou omissão\ndo Google em exercer qualquer direito ou correção será considerado uma renúncia\na qualquer violação dos Termos, e o Google reserva expressamente todos e\nquaisquer direitos e correções disponíveis de acordo com os Termos ou com base\nna lei, na equidade ou de outra forma, incluindo a correção da tutela de\nurgência contra qualquer violação real dos Termos ou ameaça disso sem precisar\ncomprovar danos reais.\n"
  },
  {
    "path": "pyproject.toml",
    "content": "[build-system]\nrequires = [\n    \"scikit_build_core\",\n    \"pybind11\",\n    \"cmake>=3.28\",\n    \"ninja\",\n    \"numpy\",\n]\nbuild-backend = \"scikit_build_core.build\"\n\n[project]\nname = \"alphafold3\"\nversion = \"3.0.1\"\nrequires-python = \">=3.12\"\nreadme = \"README.md\"\nlicense = {file = \"LICENSE\"}\ndependencies = [\n    \"absl-py>=2.3.1\",\n    \"dm-haiku==0.0.16\",\n    \"jax==0.9.1\",\n    \"jax[cuda12]==0.9.1\",\n    \"numpy\",\n    \"rdkit==2025.9.4\",\n    \"tokamax==0.0.11\",\n    \"tqdm\",\n    \"zstandard\",\n]\n\n[dependency-groups]\ndev = [\n    \"pytest>=6.0\",\n]\n\n[tool.uv]\npackage = true\nenvironments = [\n    \"sys_platform == 'linux' and platform_machine == 'x86_64'\",\n    \"sys_platform == 'linux' and platform_machine == 'aarch64'\",\n]\n\n[tool.scikit-build]\nwheel.exclude = [\n    \"**.pyx\",\n    \"**/CMakeLists.txt\",\n    \"**.cc\",\n    \"**.h\"\n]\nsdist.include = [\n    \"LICENSE\",\n    \"OUTPUT_TERMS_OF_USE.md\",\n    \"WEIGHTS_PROHIBITED_USE_POLICY.md\",\n    \"WEIGHTS_TERMS_OF_USE.md\",\n]\n\n[tool.cibuildwheel]\nbuild = \"cp3*-manylinux_x86_64\"\nmanylinux-x86_64-image = \"manylinux_2_28\"\n\n[project.scripts]\nbuild_data = \"alphafold3.build_data:build_data\"\n"
  },
  {
    "path": "run_alphafold.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"AlphaFold 3 structure prediction script.\n\nAlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\nthis license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n\nTo request access to the AlphaFold 3 model parameters, follow the process set\nout at https://github.com/google-deepmind/alphafold3. You may only use these\nif received directly from Google. Use is subject to terms of use available at\nhttps://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\"\"\"\n\nfrom collections.abc import Callable, Sequence\nimport csv\nimport dataclasses\nimport datetime\nimport functools\nimport os\nimport pathlib\nimport shutil\nimport string\nimport textwrap\nimport time\nimport typing\nfrom typing import overload\n\nfrom absl import app\nfrom absl import flags\nfrom alphafold3.common import folding_input\nfrom alphafold3.common import resources\nfrom alphafold3.constants import chemical_components\nimport alphafold3.cpp\nfrom alphafold3.data import featurisation\nfrom alphafold3.data import pipeline\nfrom alphafold3.data.tools import shards\nfrom alphafold3.model import features\nfrom alphafold3.model import model\nfrom alphafold3.model import params\nfrom alphafold3.model import post_processing\nfrom alphafold3.model.components import utils\nimport haiku as hk\nimport jax\nfrom jax import numpy as jnp\nimport numpy as np\nimport tokamax\n\n\n_HOME_DIR = 
pathlib.Path(os.environ.get('HOME'))\n_DEFAULT_MODEL_DIR = _HOME_DIR / 'models'\n_DEFAULT_DB_DIR = _HOME_DIR / 'public_databases'\n\n\n# Input and output paths.\n_JSON_PATH = flags.DEFINE_string(\n    'json_path',\n    None,\n    'Path to the input JSON file.',\n)\n_INPUT_DIR = flags.DEFINE_string(\n    'input_dir',\n    None,\n    'Path to the directory containing input JSON files.',\n)\n_OUTPUT_DIR = flags.DEFINE_string(\n    'output_dir',\n    None,\n    'Path to a directory where the results will be saved.',\n)\nMODEL_DIR = flags.DEFINE_string(\n    'model_dir',\n    _DEFAULT_MODEL_DIR.as_posix(),\n    'Path to the model to use for inference.',\n)\n\n# Control which stages to run.\n_RUN_DATA_PIPELINE = flags.DEFINE_bool(\n    'run_data_pipeline',\n    True,\n    'Whether to run the data pipeline on the fold inputs.',\n)\n_RUN_INFERENCE = flags.DEFINE_bool(\n    'run_inference',\n    True,\n    'Whether to run inference on the fold inputs.',\n)\n\n# Binary paths.\n_JACKHMMER_BINARY_PATH = flags.DEFINE_string(\n    'jackhmmer_binary_path',\n    shutil.which('jackhmmer'),\n    'Path to the Jackhmmer binary.',\n)\n_NHMMER_BINARY_PATH = flags.DEFINE_string(\n    'nhmmer_binary_path',\n    shutil.which('nhmmer'),\n    'Path to the Nhmmer binary.',\n)\n_HMMALIGN_BINARY_PATH = flags.DEFINE_string(\n    'hmmalign_binary_path',\n    shutil.which('hmmalign'),\n    'Path to the Hmmalign binary.',\n)\n_HMMSEARCH_BINARY_PATH = flags.DEFINE_string(\n    'hmmsearch_binary_path',\n    shutil.which('hmmsearch'),\n    'Path to the Hmmsearch binary.',\n)\n_HMMBUILD_BINARY_PATH = flags.DEFINE_string(\n    'hmmbuild_binary_path',\n    shutil.which('hmmbuild'),\n    'Path to the Hmmbuild binary.',\n)\n\n# Database paths.\nDB_DIR = flags.DEFINE_multi_string(\n    'db_dir',\n    (_DEFAULT_DB_DIR.as_posix(),),\n    'Path to the directory containing the databases. 
Can be specified multiple'\n    ' times to search multiple directories in order.',\n)\n\n_SMALL_BFD_DATABASE_PATH = flags.DEFINE_string(\n    'small_bfd_database_path',\n    '${DB_DIR}/bfd-first_non_consensus_sequences.fasta',\n    'Small BFD database path, used for protein MSA search.',\n)\n_SMALL_BFD_Z_VALUE = flags.DEFINE_integer(\n    'small_bfd_z_value',\n    None,\n    'The Z-value representing the database size in number of sequences for'\n    ' E-value calculation. Must be set for sharded databases.',\n    lower_bound=0,\n)\n_MGNIFY_DATABASE_PATH = flags.DEFINE_string(\n    'mgnify_database_path',\n    '${DB_DIR}/mgy_clusters_2022_05.fa',\n    'Mgnify database path, used for protein MSA search.',\n)\n_MGNIFY_Z_VALUE = flags.DEFINE_integer(\n    'mgnify_z_value',\n    None,\n    'The Z-value representing the database size in number of sequences for'\n    ' E-value calculation. Must be set for sharded databases.',\n    lower_bound=0,\n)\n_UNIPROT_CLUSTER_ANNOT_DATABASE_PATH = flags.DEFINE_string(\n    'uniprot_cluster_annot_database_path',\n    '${DB_DIR}/uniprot_all_2021_04.fa',\n    'UniProt database path, used for protein paired MSA search.',\n)\n_UNIPROT_CLUSTER_ANNOT_Z_VALUE = flags.DEFINE_integer(\n    'uniprot_cluster_annot_z_value',\n    None,\n    'The Z-value representing the database size in number of sequences for'\n    ' E-value calculation. Must be set for sharded databases.',\n    lower_bound=0,\n)\n_UNIREF90_DATABASE_PATH = flags.DEFINE_string(\n    'uniref90_database_path',\n    '${DB_DIR}/uniref90_2022_05.fa',\n    'UniRef90 database path, used for MSA search. The MSA obtained by '\n    'searching it is used to construct the profile for template search.',\n)\n_UNIREF90_Z_VALUE = flags.DEFINE_integer(\n    'uniref90_z_value',\n    None,\n    'The Z-value representing the database size in number of sequences for'\n    ' E-value calculation. 
Must be set for sharded databases.',\n    lower_bound=0,\n)\n_NTRNA_DATABASE_PATH = flags.DEFINE_string(\n    'ntrna_database_path',\n    '${DB_DIR}/nt_rna_2023_02_23_clust_seq_id_90_cov_80_rep_seq.fasta',\n    'NT-RNA database path, used for RNA MSA search.',\n)\n_NTRNA_Z_VALUE = flags.DEFINE_float(\n    'ntrna_z_value',\n    None,\n    'The Z-value representing the database size in megabases for E-value'\n    ' calculation. Must be set for sharded databases.',\n    lower_bound=0.0,\n)\n_RFAM_DATABASE_PATH = flags.DEFINE_string(\n    'rfam_database_path',\n    '${DB_DIR}/rfam_14_9_clust_seq_id_90_cov_80_rep_seq.fasta',\n    'Rfam database path, used for RNA MSA search.',\n)\n_RFAM_Z_VALUE = flags.DEFINE_float(\n    'rfam_z_value',\n    None,\n    'The Z-value representing the database size in megabases for E-value'\n    ' calculation. Must be set for sharded databases.',\n    lower_bound=0.0,\n)\n_RNA_CENTRAL_DATABASE_PATH = flags.DEFINE_string(\n    'rna_central_database_path',\n    '${DB_DIR}/rnacentral_active_seq_id_90_cov_80_linclust.fasta',\n    'RNAcentral database path, used for RNA MSA search.',\n)\n_RNA_CENTRAL_Z_VALUE = flags.DEFINE_float(\n    'rna_central_z_value',\n    None,\n    'The Z-value representing the database size in megabases for E-value'\n    ' calculation. 
Must be set for sharded databases.',\n    lower_bound=0.0,\n)\n_PDB_DATABASE_PATH = flags.DEFINE_string(\n    'pdb_database_path',\n    '${DB_DIR}/mmcif_files',\n    'PDB database directory with mmCIF files path, used for template search.',\n)\n_SEQRES_DATABASE_PATH = flags.DEFINE_string(\n    'seqres_database_path',\n    '${DB_DIR}/pdb_seqres_2022_09_28.fasta',\n    'PDB sequence database path, used for template search.',\n)\n\n# Number of CPUs to use for MSA tools.\n_JACKHMMER_N_CPU = flags.DEFINE_integer(\n    'jackhmmer_n_cpu',\n    # Unfortunately, os.process_cpu_count() is only available in Python 3.13+.\n    min(len(os.sched_getaffinity(0)), 8),\n    'Number of CPUs to use for Jackhmmer. Defaults to min(cpu_count, 8). Going'\n    ' above 8 CPUs provides very little additional speedup.',\n    lower_bound=0,\n)\n_JACKHMMER_MAX_PARALLEL_SHARDS = flags.DEFINE_integer(\n    'jackhmmer_max_parallel_shards',\n    None,\n    'Maximum number of shards to search against in parallel. If unset, one'\n    ' Jackhmmer instance will be run per shard. Only applicable if the'\n    ' database is sharded.',\n    lower_bound=1,\n)\n_NHMMER_N_CPU = flags.DEFINE_integer(\n    'nhmmer_n_cpu',\n    # Unfortunately, os.process_cpu_count() is only available in Python 3.13+.\n    min(len(os.sched_getaffinity(0)), 8),\n    'Number of CPUs to use for Nhmmer. Defaults to min(cpu_count, 8). Going'\n    ' above 8 CPUs provides very little additional speedup.',\n    lower_bound=0,\n)\n_NHMMER_MAX_PARALLEL_SHARDS = flags.DEFINE_integer(\n    'nhmmer_max_parallel_shards',\n    None,\n    'Maximum number of shards to search against in parallel. If unset, one'\n    ' Nhmmer instance will be run per shard. Only applicable if the'\n    ' database is sharded.',\n    lower_bound=1,\n)\n\n# Data pipeline configuration.\n_RESOLVE_MSA_OVERLAPS = flags.DEFINE_bool(\n    'resolve_msa_overlaps',\n    True,\n    'Whether to deduplicate unpaired MSA against paired MSA. 
The default'\n    ' behaviour matches the method described in the AlphaFold 3 paper. Set this'\n    ' to false if providing custom paired MSA using the unpaired MSA field to'\n    ' keep it exactly as is as deduplication against the paired MSA could break'\n    ' the manually crafted pairing between MSA sequences.',\n)\n_MAX_TEMPLATE_DATE = flags.DEFINE_string(\n    'max_template_date',\n    '2021-09-30',  # By default, use the date from the AlphaFold 3 paper.\n    'Maximum template release date to consider. Format: YYYY-MM-DD. All'\n    ' templates released after this date will be ignored. Controls also whether'\n    ' to allow use of model coordinates for a chemical component from the CCD'\n    ' if RDKit conformer generation fails and the component does not have ideal'\n    ' coordinates set. Only for components that have been released before this'\n    ' date the model coordinates can be used as a fallback.',\n)\n_CONFORMER_MAX_ITERATIONS = flags.DEFINE_integer(\n    'conformer_max_iterations',\n    None,  # Default to RDKit default parameters value.\n    'Optional override for maximum number of iterations to run for RDKit '\n    'conformer search.',\n    lower_bound=0,\n)\n\n# JAX inference performance tuning.\n_JAX_COMPILATION_CACHE_DIR = flags.DEFINE_string(\n    'jax_compilation_cache_dir',\n    None,\n    'Path to a directory for the JAX compilation cache.',\n)\n_GPU_DEVICE = flags.DEFINE_integer(\n    'gpu_device',\n    0,\n    'Optional override for the GPU device to use for inference, uses zero-based'\n    ' indexing. Defaults to the 0th GPU on the system. Useful on multi-GPU'\n    ' systems to pin each run to a specific GPU. Note that if GPUs are already'\n    ' pre-filtered by the environment (e.g. 
by using CUDA_VISIBLE_DEVICES),'\n    ' this flag refers to the GPU index after the filtering has been done.',\n)\n_BUCKETS = flags.DEFINE_list(\n    'buckets',\n    # pyformat: disable\n    ['256', '512', '768', '1024', '1280', '1536', '2048', '2560', '3072',\n     '3584', '4096', '4608', '5120'],\n    # pyformat: enable\n    'Strictly increasing order of token sizes for which to cache compilations.'\n    ' For any input with more tokens than the largest bucket size, a new bucket'\n    ' is created for exactly that number of tokens.',\n)\n_FLASH_ATTENTION_IMPLEMENTATION = flags.DEFINE_enum(\n    'flash_attention_implementation',\n    default='triton',\n    enum_values=['triton', 'cudnn', 'xla'],\n    help=(\n        \"Flash attention implementation to use. 'triton' and 'cudnn' uses a\"\n        ' Triton and cuDNN flash attention implementation, respectively. The'\n        ' Triton kernel is fastest and has been tested more thoroughly. The'\n        \" Triton and cuDNN kernels require Ampere GPUs or later. 'xla' uses an\"\n        ' XLA attention implementation (no flash attention) and is portable'\n        ' across GPU devices.'\n    ),\n)\n_NUM_RECYCLES = flags.DEFINE_integer(\n    'num_recycles',\n    10,\n    'Number of recycles to use during inference.',\n    lower_bound=1,\n)\n_NUM_DIFFUSION_SAMPLES = flags.DEFINE_integer(\n    'num_diffusion_samples',\n    5,\n    'Number of diffusion samples to generate.',\n    lower_bound=1,\n)\n_NUM_SEEDS = flags.DEFINE_integer(\n    'num_seeds',\n    None,\n    'Number of seeds to use for inference. If set, only a single seed must be'\n    ' provided in the input JSON. AlphaFold 3 will then generate random seeds'\n    ' in sequence, starting from the single seed specified in the input JSON.'\n    ' The full input JSON produced by AlphaFold 3 will include the generated'\n    ' random seeds. 
If not set, AlphaFold 3 will use the seeds as provided in'\n    ' the input JSON.',\n    lower_bound=1,\n)\n\n# Output controls.\n_SAVE_EMBEDDINGS = flags.DEFINE_bool(\n    'save_embeddings',\n    False,\n    'Whether to save the final trunk single and pair embeddings in the output.'\n    ' Note that the embeddings are large float16 arrays: num_tokens * 384'\n    ' + num_tokens * num_tokens * 128.',\n)\n_SAVE_DISTOGRAM = flags.DEFINE_bool(\n    'save_distogram',\n    False,\n    'Whether to save the final distogram in the output. Note that the distogram'\n    ' is a large float16 array: num_tokens * num_tokens * 64.',\n)\n_FORCE_OUTPUT_DIR = flags.DEFINE_bool(\n    'force_output_dir',\n    False,\n    'Whether to force the output directory to be used even if it already exists'\n    ' and is non-empty. Useful to set this to True to run the data pipeline and'\n    ' the inference separately, but use the same output directory.',\n)\n_COMPRESS_LARGE_OUTPUT_FILES = flags.DEFINE_bool(\n    'compress_large_output_files',\n    False,\n    'If True, compresses the output mmCIF and confidences JSON files (the two'\n    ' largest files) using zstandard. 
Note that embeddings and distogram, if'\n    ' saved, are already stored in a compressed format.',\n)\n\n\ndef make_model_config(\n    *,\n    flash_attention_implementation: tokamax.DotProductAttentionImplementation = 'triton',\n    num_diffusion_samples: int = 5,\n    num_recycles: int = 10,\n    return_embeddings: bool = False,\n    return_distogram: bool = False,\n) -> model.Model.Config:\n  \"\"\"Returns a model config with some defaults overridden.\"\"\"\n  config = model.Model.Config()\n  config.global_config.flash_attention_implementation = (\n      flash_attention_implementation\n  )\n  config.heads.diffusion.eval.num_samples = num_diffusion_samples\n  config.num_recycles = num_recycles\n  config.return_embeddings = return_embeddings\n  config.return_distogram = return_distogram\n  return config\n\n\nclass ModelRunner:\n  \"\"\"Helper class to run structure prediction stages.\"\"\"\n\n  def __init__(\n      self,\n      config: model.Model.Config,\n      device: jax.Device,\n      model_dir: pathlib.Path,\n  ):\n    self._model_config = config\n    self._device = device\n    self._model_dir = model_dir\n\n  @functools.cached_property\n  def model_params(self) -> hk.Params:\n    \"\"\"Loads model parameters from the model directory.\"\"\"\n    return params.get_model_haiku_params(model_dir=self._model_dir)\n\n  @functools.cached_property\n  def _model(\n      self,\n  ) -> Callable[[jnp.ndarray, features.BatchDict], model.ModelResult]:\n    \"\"\"Loads model parameters and returns a jitted model forward pass.\"\"\"\n\n    @hk.transform\n    def forward_fn(batch):\n      return model.Model(self._model_config)(batch)\n\n    return functools.partial(\n        jax.jit(forward_fn.apply, device=self._device), self.model_params\n    )\n\n  def run_inference(\n      self, featurised_example: features.BatchDict, rng_key: jnp.ndarray\n  ) -> model.ModelResult:\n    \"\"\"Computes a forward pass of the model on a featurised example.\"\"\"\n    featurised_example = 
jax.device_put(\n        jax.tree_util.tree_map(\n            jnp.asarray, utils.remove_invalidly_typed_feats(featurised_example)\n        ),\n        self._device,\n    )\n\n    result = self._model(rng_key, featurised_example)\n    result = jax.tree.map(np.asarray, result)\n    result = jax.tree.map(\n        lambda x: x.astype(jnp.float32) if x.dtype == jnp.bfloat16 else x,\n        result,\n    )\n    result = dict(result)\n    identifier = self.model_params['__meta__']['__identifier__'].tobytes()\n    result['__identifier__'] = identifier\n    return result\n\n  def extract_inference_results(\n      self,\n      batch: features.BatchDict,\n      result: model.ModelResult,\n      target_name: str,\n  ) -> list[model.InferenceResult]:\n    \"\"\"Extracts inference results from model outputs.\"\"\"\n    return list(\n        model.Model.get_inference_result(\n            batch=batch, result=result, target_name=target_name\n        )\n    )\n\n  def extract_embeddings(\n      self, result: model.ModelResult, num_tokens: int\n  ) -> dict[str, np.ndarray] | None:\n    \"\"\"Extracts embeddings from model outputs.\"\"\"\n    embeddings = {}\n    if 'single_embeddings' in result:\n      embeddings['single_embeddings'] = result['single_embeddings'][\n          :num_tokens\n      ].astype(np.float16)\n    if 'pair_embeddings' in result:\n      embeddings['pair_embeddings'] = result['pair_embeddings'][\n          :num_tokens, :num_tokens\n      ].astype(np.float16)\n    return embeddings or None\n\n  def extract_distogram(\n      self, result: model.ModelResult, num_tokens: int\n  ) -> np.ndarray | None:\n    \"\"\"Extracts distogram from model outputs.\"\"\"\n    if 'distogram' not in result['distogram']:\n      return None\n    distogram = result['distogram']['distogram'][:num_tokens, :num_tokens, :]\n    return distogram\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass ResultsForSeed:\n  \"\"\"Stores the inference results (diffusion samples) 
for a single seed.\n\n  Attributes:\n    seed: The seed used to generate the samples.\n    inference_results: The inference results, one per sample.\n    full_fold_input: The fold input that must also include the results of\n      running the data pipeline - MSA and templates.\n    embeddings: The final trunk single and pair embeddings, if requested.\n    distogram: The token distance histogram, if requested.\n  \"\"\"\n\n  seed: int\n  inference_results: Sequence[model.InferenceResult]\n  full_fold_input: folding_input.Input\n  embeddings: dict[str, np.ndarray] | None = None\n  distogram: np.ndarray | None = None\n\n\ndef predict_structure(\n    fold_input: folding_input.Input,\n    model_runner: ModelRunner,\n    buckets: Sequence[int] | None = None,\n    ref_max_modified_date: datetime.date | None = None,\n    conformer_max_iterations: int | None = None,\n    resolve_msa_overlaps: bool = True,\n) -> Sequence[ResultsForSeed]:\n  \"\"\"Runs the full inference pipeline to predict structures for each seed.\"\"\"\n\n  print(f'Featurising data with {len(fold_input.rng_seeds)} seed(s)...')\n  featurisation_start_time = time.time()\n  ccd = chemical_components.Ccd(user_ccd=fold_input.user_ccd)\n  featurised_examples = featurisation.featurise_input(\n      fold_input=fold_input,\n      buckets=buckets,\n      ccd=ccd,\n      verbose=True,\n      ref_max_modified_date=ref_max_modified_date,\n      conformer_max_iterations=conformer_max_iterations,\n      resolve_msa_overlaps=resolve_msa_overlaps,\n  )\n  print(\n      f'Featurising data with {len(fold_input.rng_seeds)} seed(s) took'\n      f' {time.time() - featurisation_start_time:.2f} seconds.'\n  )\n  print(\n      'Running model inference and extracting output structure samples with'\n      f' {len(fold_input.rng_seeds)} seed(s)...'\n  )\n  all_inference_start_time = time.time()\n  all_inference_results = []\n  for seed, example in zip(fold_input.rng_seeds, featurised_examples):\n    print(f'Running model inference 
with seed {seed}...')\n    inference_start_time = time.time()\n    rng_key = jax.random.PRNGKey(seed)\n    result = model_runner.run_inference(example, rng_key)\n    print(\n        f'Running model inference with seed {seed} took'\n        f' {time.time() - inference_start_time:.2f} seconds.'\n    )\n    print(f'Extracting inference results with seed {seed}...')\n    extract_structures = time.time()\n    inference_results = model_runner.extract_inference_results(\n        batch=example, result=result, target_name=fold_input.name\n    )\n    num_tokens = len(inference_results[0].metadata['token_chain_ids'])\n    embeddings = model_runner.extract_embeddings(\n        result=result, num_tokens=num_tokens\n    )\n    distogram = model_runner.extract_distogram(\n        result=result, num_tokens=num_tokens\n    )\n    print(\n        f'Extracting {len(inference_results)} inference samples with'\n        f' seed {seed} took {time.time() - extract_structures:.2f} seconds.'\n    )\n\n    all_inference_results.append(\n        ResultsForSeed(\n            seed=seed,\n            inference_results=inference_results,\n            full_fold_input=fold_input,\n            embeddings=embeddings,\n            distogram=distogram,\n        )\n    )\n  print(\n      'Running model inference and extracting output structures with'\n      f' {len(fold_input.rng_seeds)} seed(s) took'\n      f' {time.time() - all_inference_start_time:.2f} seconds.'\n  )\n  return all_inference_results\n\n\ndef write_fold_input_json(\n    fold_input: folding_input.Input,\n    output_dir: os.PathLike[str] | str,\n) -> None:\n  \"\"\"Writes the input JSON to the output directory.\"\"\"\n  os.makedirs(output_dir, exist_ok=True)\n  path = os.path.join(output_dir, f'{fold_input.sanitised_name()}_data.json')\n  print(f'Writing model input JSON to {path}')\n  with open(path, 'wt') as f:\n    f.write(fold_input.to_json())\n\n\ndef write_outputs(\n    all_inference_results: Sequence[ResultsForSeed],\n    
output_dir: os.PathLike[str] | str,\n    job_name: str,\n    compress_large_output_files: bool = False,\n) -> None:\n  \"\"\"Writes outputs to the specified output directory.\"\"\"\n  ranking_scores = []\n  max_ranking_score = None\n  max_ranking_result = None\n\n  output_terms = (\n      pathlib.Path(alphafold3.cpp.__file__).parent / 'OUTPUT_TERMS_OF_USE.md'\n  ).read_text()\n\n  os.makedirs(output_dir, exist_ok=True)\n  for results_for_seed in all_inference_results:\n    seed = results_for_seed.seed\n    for sample_idx, result in enumerate(results_for_seed.inference_results):\n      sample_dir = os.path.join(output_dir, f'seed-{seed}_sample-{sample_idx}')\n      os.makedirs(sample_dir, exist_ok=True)\n      post_processing.write_output(\n          inference_result=result,\n          output_dir=sample_dir,\n          name=f'{job_name}_seed-{seed}_sample-{sample_idx}',\n          compress=compress_large_output_files,\n      )\n      ranking_score = float(result.metadata['ranking_score'])\n      ranking_scores.append((seed, sample_idx, ranking_score))\n      if max_ranking_score is None or ranking_score > max_ranking_score:\n        max_ranking_score = ranking_score\n        max_ranking_result = result\n\n    if embeddings := results_for_seed.embeddings:\n      embeddings_dir = os.path.join(output_dir, f'seed-{seed}_embeddings')\n      os.makedirs(embeddings_dir, exist_ok=True)\n      post_processing.write_embeddings(\n          embeddings=embeddings,\n          output_dir=embeddings_dir,\n          name=f'{job_name}_seed-{seed}',\n      )\n\n    if (distogram := results_for_seed.distogram) is not None:\n      distogram_dir = os.path.join(output_dir, f'seed-{seed}_distogram')\n      os.makedirs(distogram_dir, exist_ok=True)\n      distogram_path = os.path.join(\n          distogram_dir, f'{job_name}_seed-{seed}_distogram.npz'\n      )\n      with open(distogram_path, 'wb') as f:\n        np.savez_compressed(f, distogram=distogram.astype(np.float16))\n\n  if 
max_ranking_result is not None:  # True iff ranking_scores non-empty.\n    post_processing.write_output(\n        inference_result=max_ranking_result,\n        output_dir=output_dir,\n        # The output terms of use are the same for all seeds/samples.\n        terms_of_use=output_terms,\n        name=job_name,\n        compress=compress_large_output_files,\n    )\n    # Save csv of ranking scores with seeds and sample indices, to allow easier\n    # comparison of ranking scores across different runs.\n    with open(\n        os.path.join(output_dir, f'{job_name}_ranking_scores.csv'), 'wt'\n    ) as f:\n      writer = csv.writer(f)\n      writer.writerow(['seed', 'sample', 'ranking_score'])\n      writer.writerows(ranking_scores)\n\n\ndef replace_db_dir(path_with_db_dir: str, db_dirs: Sequence[str]) -> str:\n  \"\"\"Replaces the DB_DIR placeholder in a path with the given DB_DIR.\"\"\"\n  template = string.Template(path_with_db_dir)\n  if 'DB_DIR' in template.get_identifiers():\n    for db_dir in db_dirs:\n      path = template.substitute(DB_DIR=db_dir)\n      if os.path.exists(path):\n        return path\n    raise FileNotFoundError(\n        f'{path_with_db_dir} with ${{DB_DIR}} not found in any of {db_dirs}.'\n    )\n  if (sharded_paths := shards.get_sharded_paths(path_with_db_dir)) is not None:\n    db_exists = all(os.path.exists(p) for p in sharded_paths)\n  else:\n    db_exists = os.path.exists(path_with_db_dir)\n  if not db_exists:\n    raise FileNotFoundError(f'{path_with_db_dir} does not exist.')\n  return path_with_db_dir\n\n\n@overload\ndef process_fold_input(\n    fold_input: folding_input.Input,\n    data_pipeline_config: pipeline.DataPipelineConfig | None,\n    *,\n    model_runner: None,\n    output_dir: os.PathLike[str] | str,\n    buckets: Sequence[int] | None = None,\n    ref_max_modified_date: datetime.date | None = None,\n    conformer_max_iterations: int | None = None,\n    resolve_msa_overlaps: bool = True,\n    force_output_dir: bool = 
False,\n    compress_large_output_files: bool = False,\n) -> folding_input.Input:\n  ...\n\n\n@overload\ndef process_fold_input(\n    fold_input: folding_input.Input,\n    data_pipeline_config: pipeline.DataPipelineConfig | None,\n    *,\n    model_runner: ModelRunner,\n    output_dir: os.PathLike[str] | str,\n    buckets: Sequence[int] | None = None,\n    ref_max_modified_date: datetime.date | None = None,\n    conformer_max_iterations: int | None = None,\n    resolve_msa_overlaps: bool = True,\n    force_output_dir: bool = False,\n    compress_large_output_files: bool = False,\n) -> Sequence[ResultsForSeed]:\n  ...\n\n\ndef process_fold_input(\n    fold_input: folding_input.Input,\n    data_pipeline_config: pipeline.DataPipelineConfig | None,\n    *,\n    model_runner: ModelRunner | None,\n    output_dir: os.PathLike[str] | str,\n    buckets: Sequence[int] | None = None,\n    ref_max_modified_date: datetime.date | None = None,\n    conformer_max_iterations: int | None = None,\n    resolve_msa_overlaps: bool = True,\n    force_output_dir: bool = False,\n    compress_large_output_files: bool = False,\n) -> folding_input.Input | Sequence[ResultsForSeed]:\n  \"\"\"Runs data pipeline and/or inference on a single fold input.\n\n  Args:\n    fold_input: Fold input to process.\n    data_pipeline_config: Data pipeline config to use. If None, skip the data\n      pipeline.\n    model_runner: Model runner to use. If None, skip inference.\n    output_dir: Output directory to write to.\n    buckets: Bucket sizes to pad the data to, to avoid excessive re-compilation\n      of the model. If None, calculate the appropriate bucket size from the\n      number of tokens. If not None, must be a sequence of at least one integer,\n      in strictly increasing order. 
Will raise an error if the number of tokens\n      is more than the largest bucket size.\n    ref_max_modified_date: Optional maximum date that controls whether to allow\n      use of model coordinates for a chemical component from the CCD if RDKit\n      conformer generation fails and the component does not have ideal\n      coordinates set. Only for components that have been released before this\n      date the model coordinates can be used as a fallback.\n    conformer_max_iterations: Optional override for maximum number of iterations\n      to run for RDKit conformer search.\n    resolve_msa_overlaps: Whether to deduplicate unpaired MSA against paired\n      MSA. The default behaviour matches the method described in the AlphaFold 3\n      paper. Set this to false if providing custom paired MSA using the unpaired\n      MSA field to keep it exactly as is as deduplication against the paired MSA\n      could break the manually crafted pairing between MSA sequences.\n    force_output_dir: If True, do not create a new output directory even if the\n      existing one is non-empty. Instead use the existing output directory and\n      potentially overwrite existing files. 
If False, create a new timestamped\n      output directory instead if the existing one is non-empty.\n    compress_large_output_files: If True, compress large output files (mmCIF and\n      confidences JSON) using zstandard.\n\n  Returns:\n    The processed fold input, or the inference results for each seed.\n\n  Raises:\n    ValueError: If the fold input has no chains.\n  \"\"\"\n  print(f'\\nRunning fold job {fold_input.name}...')\n\n  if not fold_input.chains:\n    raise ValueError('Fold input has no chains.')\n\n  if (\n      not force_output_dir\n      and os.path.exists(output_dir)\n      and os.listdir(output_dir)\n  ):\n    new_output_dir = (\n        f'{output_dir}_{datetime.datetime.now().strftime(\"%Y%m%d_%H%M%S\")}'\n    )\n    print(\n        f'Output will be written in {new_output_dir} since {output_dir} is'\n        ' non-empty.'\n    )\n    output_dir = new_output_dir\n  else:\n    print(f'Output will be written in {output_dir}')\n\n  if data_pipeline_config is None:\n    print('Skipping data pipeline...')\n  else:\n    print('Running data pipeline...')\n    fold_input = pipeline.DataPipeline(data_pipeline_config).process(fold_input)\n\n  write_fold_input_json(fold_input, output_dir)\n  if model_runner is None:\n    print('Skipping model inference...')\n    output = fold_input\n  else:\n    print(\n        f'Predicting 3D structure for {fold_input.name} with'\n        f' {len(fold_input.rng_seeds)} seed(s)...'\n    )\n    all_inference_results = predict_structure(\n        fold_input=fold_input,\n        model_runner=model_runner,\n        buckets=buckets,\n        ref_max_modified_date=ref_max_modified_date,\n        conformer_max_iterations=conformer_max_iterations,\n        resolve_msa_overlaps=resolve_msa_overlaps,\n    )\n    print(f'Writing outputs with {len(fold_input.rng_seeds)} seed(s)...')\n    write_outputs(\n        all_inference_results=all_inference_results,\n        output_dir=output_dir,\n        
job_name=fold_input.sanitised_name(),\n        compress_large_output_files=compress_large_output_files,\n    )\n    output = all_inference_results\n\n  print(f'Fold job {fold_input.name} done, output written to {output_dir}\\n')\n  return output\n\n\ndef main(_):\n  if _JAX_COMPILATION_CACHE_DIR.value is not None:\n    jax.config.update(\n        'jax_compilation_cache_dir', _JAX_COMPILATION_CACHE_DIR.value\n    )\n\n  if (_JSON_PATH.value is None) == (_INPUT_DIR.value is None):\n    raise ValueError(\n        'Exactly one of --json_path or --input_dir must be specified.'\n    )\n\n  if not _RUN_INFERENCE.value and not _RUN_DATA_PIPELINE.value:\n    raise ValueError(\n        'At least one of --run_inference or --run_data_pipeline must be'\n        ' set to true.'\n    )\n\n  if _INPUT_DIR.value is not None:\n    fold_inputs = folding_input.load_fold_inputs_from_dir(\n        pathlib.Path(_INPUT_DIR.value)\n    )\n  elif _JSON_PATH.value is not None:\n    fold_inputs = folding_input.load_fold_inputs_from_path(\n        pathlib.Path(_JSON_PATH.value)\n    )\n  else:\n    raise AssertionError(\n        'Exactly one of --json_path or --input_dir must be specified.'\n    )\n\n  # Make sure we can create the output directory before running anything.\n  try:\n    os.makedirs(_OUTPUT_DIR.value, exist_ok=True)\n  except OSError as e:\n    print(f'Failed to create output directory {_OUTPUT_DIR.value}: {e}')\n    raise\n\n  if _RUN_INFERENCE.value:\n    # Fail early on incompatible devices, but only if we're running inference.\n    gpu_devices = jax.local_devices(backend='gpu')\n    if gpu_devices:\n      compute_capability = float(\n          gpu_devices[_GPU_DEVICE.value].compute_capability\n      )\n      if compute_capability < 6.0:\n        raise ValueError(\n            'AlphaFold 3 requires at least GPU compute capability 6.0 (see'\n            ' https://developer.nvidia.com/cuda-gpus).'\n        )\n      elif 7.0 <= compute_capability < 8.0:\n        xla_flags = 
os.environ.get('XLA_FLAGS')\n        required_flag = '--xla_disable_hlo_passes=custom-kernel-fusion-rewriter'\n        if not xla_flags or required_flag not in xla_flags:\n          raise ValueError(\n              'For devices with GPU compute capability 7.x (see'\n              ' https://developer.nvidia.com/cuda-gpus) the ENV XLA_FLAGS must'\n              f' include \"{required_flag}\".'\n          )\n        if _FLASH_ATTENTION_IMPLEMENTATION.value != 'xla':\n          raise ValueError(\n              'For devices with GPU compute capability 7.x (see'\n              ' https://developer.nvidia.com/cuda-gpus) the'\n              ' --flash_attention_implementation must be set to \"xla\".'\n          )\n\n  notice = textwrap.wrap(\n      'Running AlphaFold 3. Please note that standard AlphaFold 3 model'\n      ' parameters are only available under terms of use provided at'\n      ' https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md.'\n      ' If you do not agree to these terms and are using AlphaFold 3 derived'\n      ' model parameters, cancel execution of AlphaFold 3 inference with'\n      ' CTRL-C, and do not use the model parameters.',\n      break_long_words=False,\n      break_on_hyphens=False,\n      width=80,\n  )\n  print('\\n' + '\\n'.join(notice) + '\\n')\n\n  max_template_date = datetime.date.fromisoformat(_MAX_TEMPLATE_DATE.value)\n  if _RUN_DATA_PIPELINE.value:\n    expand_path = lambda x: replace_db_dir(x, DB_DIR.value)\n    data_pipeline_config = pipeline.DataPipelineConfig(\n        jackhmmer_binary_path=_JACKHMMER_BINARY_PATH.value,\n        nhmmer_binary_path=_NHMMER_BINARY_PATH.value,\n        hmmalign_binary_path=_HMMALIGN_BINARY_PATH.value,\n        hmmsearch_binary_path=_HMMSEARCH_BINARY_PATH.value,\n        hmmbuild_binary_path=_HMMBUILD_BINARY_PATH.value,\n        small_bfd_database_path=expand_path(_SMALL_BFD_DATABASE_PATH.value),\n        small_bfd_z_value=_SMALL_BFD_Z_VALUE.value,\n        
mgnify_database_path=expand_path(_MGNIFY_DATABASE_PATH.value),\n        mgnify_z_value=_MGNIFY_Z_VALUE.value,\n        uniprot_cluster_annot_database_path=expand_path(\n            _UNIPROT_CLUSTER_ANNOT_DATABASE_PATH.value\n        ),\n        uniprot_cluster_annot_z_value=_UNIPROT_CLUSTER_ANNOT_Z_VALUE.value,\n        uniref90_database_path=expand_path(_UNIREF90_DATABASE_PATH.value),\n        uniref90_z_value=_UNIREF90_Z_VALUE.value,\n        ntrna_database_path=expand_path(_NTRNA_DATABASE_PATH.value),\n        ntrna_z_value=_NTRNA_Z_VALUE.value,\n        rfam_database_path=expand_path(_RFAM_DATABASE_PATH.value),\n        rfam_z_value=_RFAM_Z_VALUE.value,\n        rna_central_database_path=expand_path(_RNA_CENTRAL_DATABASE_PATH.value),\n        rna_central_z_value=_RNA_CENTRAL_Z_VALUE.value,\n        pdb_database_path=expand_path(_PDB_DATABASE_PATH.value),\n        seqres_database_path=expand_path(_SEQRES_DATABASE_PATH.value),\n        jackhmmer_n_cpu=_JACKHMMER_N_CPU.value,\n        jackhmmer_max_parallel_shards=_JACKHMMER_MAX_PARALLEL_SHARDS.value,\n        nhmmer_n_cpu=_NHMMER_N_CPU.value,\n        nhmmer_max_parallel_shards=_NHMMER_MAX_PARALLEL_SHARDS.value,\n        max_template_date=max_template_date,\n    )\n  else:\n    data_pipeline_config = None\n\n  if _RUN_INFERENCE.value:\n    devices = jax.local_devices(backend='gpu')\n    print(\n        f'Found local devices: {devices}, using device {_GPU_DEVICE.value}:'\n        f' {devices[_GPU_DEVICE.value]}'\n    )\n\n    print('Building model from scratch...')\n    model_runner = ModelRunner(\n        config=make_model_config(\n            flash_attention_implementation=typing.cast(\n                tokamax.DotProductAttentionImplementation,\n                _FLASH_ATTENTION_IMPLEMENTATION.value,\n            ),\n            num_diffusion_samples=_NUM_DIFFUSION_SAMPLES.value,\n            num_recycles=_NUM_RECYCLES.value,\n            return_embeddings=_SAVE_EMBEDDINGS.value,\n            
return_distogram=_SAVE_DISTOGRAM.value,\n        ),\n        device=devices[_GPU_DEVICE.value],\n        model_dir=pathlib.Path(MODEL_DIR.value),\n    )\n    # Check we can load the model parameters before launching anything.\n    print('Checking that model parameters can be loaded...')\n    _ = model_runner.model_params\n  else:\n    model_runner = None\n\n  num_fold_inputs = 0\n  for fold_input in fold_inputs:\n    if _NUM_SEEDS.value is not None:\n      print(f'Expanding fold job {fold_input.name} to {_NUM_SEEDS.value} seeds')\n      fold_input = fold_input.with_multiple_seeds(_NUM_SEEDS.value)\n    process_fold_input(\n        fold_input=fold_input,\n        data_pipeline_config=data_pipeline_config,\n        model_runner=model_runner,\n        output_dir=os.path.join(_OUTPUT_DIR.value, fold_input.sanitised_name()),\n        buckets=tuple(int(bucket) for bucket in _BUCKETS.value),\n        ref_max_modified_date=max_template_date,\n        conformer_max_iterations=_CONFORMER_MAX_ITERATIONS.value,\n        resolve_msa_overlaps=_RESOLVE_MSA_OVERLAPS.value,\n        force_output_dir=_FORCE_OUTPUT_DIR.value,\n        compress_large_output_files=_COMPRESS_LARGE_OUTPUT_FILES.value,\n    )\n    num_fold_inputs += 1\n\n  print(f'Done running {num_fold_inputs} fold jobs.')\n\n\nif __name__ == '__main__':\n  flags.mark_flags_as_required(['output_dir'])\n  app.run(main)\n"
  },
  {
    "path": "run_alphafold_data_test.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Tests the AlphaFold 3 data pipeline.\"\"\"\n\nimport contextlib\nimport datetime\nimport difflib\nimport functools\nimport hashlib\nimport json\nimport os\nimport pathlib\nimport pickle\nfrom typing import Any\n\nfrom absl.testing import absltest\nfrom absl.testing import parameterized\nfrom alphafold3 import structure\nfrom alphafold3.common import folding_input\nfrom alphafold3.common import resources\nfrom alphafold3.common.testing import data as testing_data\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.data import featurisation\nfrom alphafold3.data import pipeline\nfrom alphafold3.model.atom_layout import atom_layout\nimport jax\nimport numpy as np\n\nimport run_alphafold\nimport shutil\n\n\n_JACKHMMER_BINARY_PATH = shutil.which('jackhmmer')\n_NHMMER_BINARY_PATH = shutil.which('nhmmer')\n_HMMALIGN_BINARY_PATH = shutil.which('hmmalign')\n_HMMSEARCH_BINARY_PATH = shutil.which('hmmsearch')\n_HMMBUILD_BINARY_PATH = shutil.which('hmmbuild')\n\n\n@contextlib.contextmanager\ndef _output(name: str):\n  with open(result_path := f'{absltest.TEST_TMPDIR.value}/{name}', \"wb\") as f:\n    yield result_path, f\n\n\n@functools.singledispatch\ndef _hash_data(x: Any, /) -> str:\n  if x is None:\n    return '<<None>>'\n  return _hash_data(json.dumps(x).encode('utf-8'))\n\n\n@_hash_data.register\ndef _(x: bytes, /) -> str:\n  return hashlib.sha256(x).hexdigest()\n\n\n@_hash_data.register\ndef _(x: 
jax.Array) -> str:\n  return _hash_data(jax.device_get(x))\n\n\n@_hash_data.register\ndef _(x: np.ndarray) -> str:\n  if x.dtype == object:\n    return ';'.join(map(_hash_data, x.ravel().tolist()))\n  return _hash_data(x.tobytes())\n\n\n@_hash_data.register\ndef _(_: structure.Structure) -> str:\n  return '<<structure>>'\n\n\n@_hash_data.register\ndef _(_: atom_layout.AtomLayout) -> str:\n  return '<<atom-layout>>'\n\n\ndef _generate_diff(actual: str, expected: str) -> str:\n  return '\\n'.join(\n      difflib.unified_diff(\n          expected.split('\\n'),\n          actual.split('\\n'),\n          fromfile='expected',\n          tofile='actual',\n          lineterm='',\n      )\n  )\n\n\nclass DataPipelineTest(parameterized.TestCase):\n  \"\"\"Test the AlphaFold 3 data pipeline.\"\"\"\n\n  def setUp(self):\n    super().setUp()\n    small_bfd_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/bfd-first_non_consensus_sequences__subsampled_1000.fasta'\n    ).path()\n    mgnify_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/mgy_clusters__subsampled_1000.fa'\n    ).path()\n    uniprot_cluster_annot_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/uniprot_all__subsampled_1000.fasta'\n    ).path()\n    uniref90_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/uniref90__subsampled_1000.fasta'\n    ).path()\n    ntrna_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/nt_rna_2023_02_23_clust_seq_id_90_cov_80_rep_seq__subsampled_1000.fasta'\n    ).path()\n    rfam_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/rfam_14_4_clustered_rep_seq__subsampled_1000.fasta'\n    ).path()\n    rna_central_database_path = testing_data.Data(\n        resources.ROOT\n        / 
'test_data/miniature_databases/rnacentral_active_seq_id_90_cov_80_linclust__subsampled_1000.fasta'\n    ).path()\n    pdb_database_path = testing_data.Data(\n        resources.ROOT / 'test_data/miniature_databases/pdb_mmcif'\n    ).path()\n    seqres_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/pdb_seqres_2022_09_28__subsampled_1000.fasta'\n    ).path()\n\n    self._data_pipeline_config = pipeline.DataPipelineConfig(\n        jackhmmer_binary_path=_JACKHMMER_BINARY_PATH,\n        nhmmer_binary_path=_NHMMER_BINARY_PATH,\n        hmmalign_binary_path=_HMMALIGN_BINARY_PATH,\n        hmmsearch_binary_path=_HMMSEARCH_BINARY_PATH,\n        hmmbuild_binary_path=_HMMBUILD_BINARY_PATH,\n        small_bfd_database_path=small_bfd_database_path,\n        mgnify_database_path=mgnify_database_path,\n        uniprot_cluster_annot_database_path=uniprot_cluster_annot_database_path,\n        uniref90_database_path=uniref90_database_path,\n        ntrna_database_path=ntrna_database_path,\n        rfam_database_path=rfam_database_path,\n        rna_central_database_path=rna_central_database_path,\n        pdb_database_path=pdb_database_path,\n        seqres_database_path=seqres_database_path,\n        max_template_date=datetime.date(2021, 9, 30),\n    )\n    test_input = {\n        'name': '5tgy',\n        'modelSeeds': [1234],\n        'sequences': [\n            {\n                'protein': {\n                    'id': 'P',\n                    'sequence': (\n                        'SEFEKLRQTGDELVQAFQRLREIFDKGDDDSLEQVLEEIEELIQKHRQLFDNRQEAADTEAAKQGDQWVQLFQRFREAIDKGDKDSLEQLLEELEQALQKIRELAEKKN'\n                    ),\n                    'modifications': [],\n                    'unpairedMsa': None,\n                    'pairedMsa': None,\n                }\n            },\n            {'ligand': {'id': 'LL', 'ccdCodes': ['7BU']}},\n        ],\n        'dialect': folding_input.JSON_DIALECT,\n        'version': 
folding_input.JSON_VERSION,\n    }\n    self._test_input_json = json.dumps(test_input)\n\n  def compare_golden(self, result_path: str) -> None:\n    filename = os.path.split(result_path)[1]\n    golden_path = testing_data.Data(\n        resources.ROOT / f'test_data/{filename}'\n    ).path()\n    with open(golden_path, 'r') as golden_file:\n      golden_text = golden_file.read()\n    with open(result_path, 'r') as result_file:\n      result_text = result_file.read()\n\n    diff = _generate_diff(result_text, golden_text)\n\n    self.assertEqual(diff, \"\", f\"Result differs from golden:\\n{diff}\")\n\n  def test_config(self):\n    model_config = run_alphafold.make_model_config()\n    model_config_as_str = json.dumps(\n        model_config.as_dict(), sort_keys=True, indent=2\n    )\n    with _output('model_config.json') as (result_path, output):\n      output.write(model_config_as_str.encode('utf-8'))\n    self.compare_golden(result_path)\n\n  def test_featurisation(self):\n    \"\"\"Run featurisation and assert that the output is as expected.\"\"\"\n    fold_input = folding_input.Input.from_json(self._test_input_json)\n    data_pipeline = pipeline.DataPipeline(self._data_pipeline_config)\n    full_fold_input = data_pipeline.process(fold_input)\n    featurised_example = featurisation.featurise_input(\n        full_fold_input,\n        ccd=chemical_components.Ccd(),\n        buckets=None,\n    )\n    del featurised_example[0]['ref_pos']  # Depends on specific RDKit version.\n\n    with _output('featurised_example.pkl') as (_, output):\n      output.write(pickle.dumps(featurised_example))\n    featurised_example = jax.tree_util.tree_map(_hash_data, featurised_example)\n    with _output('featurised_example.json') as (result_path, output):\n      output.write(\n          json.dumps(featurised_example, sort_keys=True, indent=2).encode(\n              'utf-8'\n          )\n      )\n    self.compare_golden(result_path)\n\n  def test_write_input_json(self):\n    fold_input = 
folding_input.Input.from_json(self._test_input_json)\n    output_dir = self.create_tempdir().full_path\n    run_alphafold.write_fold_input_json(fold_input, output_dir)\n    with open(\n        os.path.join(output_dir, f'{fold_input.sanitised_name()}_data.json'),\n        'rt',\n    ) as f:\n      actual_fold_input = folding_input.Input.from_json(f.read())\n\n    self.assertEqual(actual_fold_input, fold_input)\n\n  def test_process_fold_input_runs_only_data_pipeline(self):\n    fold_input = folding_input.Input.from_json(self._test_input_json)\n    output_dir = self.create_tempdir().full_path\n    run_alphafold.process_fold_input(\n        fold_input=fold_input,\n        data_pipeline_config=self._data_pipeline_config,\n        model_runner=None,\n        output_dir=output_dir,\n    )\n    with open(\n        os.path.join(output_dir, f'{fold_input.sanitised_name()}_data.json'),\n        'rt',\n    ) as f:\n      actual_fold_input = folding_input.Input.from_json(f.read())\n\n    featurisation.validate_fold_input(actual_fold_input)\n\n  @parameterized.product(num_db_dirs=tuple(range(1, 3)))\n  def test_replace_db_dir(self, num_db_dirs: int) -> None:\n    \"\"\"Test that the db_dir is replaced correctly.\"\"\"\n    db_dirs = [pathlib.Path(self.create_tempdir()) for _ in range(num_db_dirs)]\n    db_dirs_posix = [db_dir.as_posix() for db_dir in db_dirs]\n\n    for i, db_dir in enumerate(db_dirs):\n      for j in range(i + 1):\n        (db_dir / f'filename{j}.txt').write_text(f'hello world {i}')\n\n    for i in range(num_db_dirs):\n      self.assertEqual(\n          pathlib.Path(\n              run_alphafold.replace_db_dir(\n                  f'${{DB_DIR}}/filename{i}.txt', db_dirs_posix\n              )\n          ).read_text(),\n          f'hello world {i}',\n      )\n    with self.assertRaises(FileNotFoundError):\n      run_alphafold.replace_db_dir(\n          f'${{DB_DIR}}/filename{num_db_dirs}.txt', db_dirs_posix\n      )\n\n\nif __name__ == '__main__':\n  
absltest.main()\n"
  },
  {
    "path": "run_alphafold_test.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Tests end-to-end running of AlphaFold 3.\"\"\"\n\nimport contextlib\nimport csv\nimport dataclasses\nimport datetime\nimport difflib\nimport json\nimport os\nimport pathlib\nimport pickle\n\nfrom absl import logging\nfrom absl.testing import absltest\nfrom absl.testing import parameterized\nfrom alphafold3.common import folding_input\nfrom alphafold3.common import resources\nfrom alphafold3.common.testing import data as testing_data\nfrom alphafold3.data import pipeline\nfrom alphafold3.model.scoring import alignment\nimport jax\nimport numpy as np\n\nimport run_alphafold\nimport shutil\n\n\n_JACKHMMER_BINARY_PATH = shutil.which('jackhmmer')\n_NHMMER_BINARY_PATH = shutil.which('nhmmer')\n_HMMALIGN_BINARY_PATH = shutil.which('hmmalign')\n_HMMSEARCH_BINARY_PATH = shutil.which('hmmsearch')\n_HMMBUILD_BINARY_PATH = shutil.which('hmmbuild')\n\n\n@contextlib.contextmanager\ndef _output(name: str):\n  with open(result_path := f'{absltest.TEST_TMPDIR.value}/{name}', \"wb\") as f:\n    yield result_path, f\n\n\njax.config.update('jax_enable_compilation_cache', False)\n\n\ndef _generate_diff(actual: str, expected: str) -> str:\n  return '\\n'.join(\n      difflib.unified_diff(\n          expected.split('\\n'),\n          actual.split('\\n'),\n          fromfile='expected',\n          tofile='actual',\n          lineterm='',\n      )\n  )\n\n\nclass InferenceTest(parameterized.TestCase):\n  \"\"\"Test AlphaFold 3 
inference.\"\"\"\n\n  def setUp(self):\n    super().setUp()\n    small_bfd_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/bfd-first_non_consensus_sequences__subsampled_1000.fasta'\n    ).path()\n    mgnify_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/mgy_clusters__subsampled_1000.fa'\n    ).path()\n    uniprot_cluster_annot_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/uniprot_all__subsampled_1000.fasta'\n    ).path()\n    uniref90_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/uniref90__subsampled_1000.fasta'\n    ).path()\n    ntrna_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/nt_rna_2023_02_23_clust_seq_id_90_cov_80_rep_seq__subsampled_1000.fasta'\n    ).path()\n    rfam_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/rfam_14_4_clustered_rep_seq__subsampled_1000.fasta'\n    ).path()\n    rna_central_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/rnacentral_active_seq_id_90_cov_80_linclust__subsampled_1000.fasta'\n    ).path()\n    pdb_database_path = testing_data.Data(\n        resources.ROOT / 'test_data/miniature_databases/pdb_mmcif'\n    ).path()\n    seqres_database_path = testing_data.Data(\n        resources.ROOT\n        / 'test_data/miniature_databases/pdb_seqres_2022_09_28__subsampled_1000.fasta'\n    ).path()\n\n    self._data_pipeline_config = pipeline.DataPipelineConfig(\n        jackhmmer_binary_path=_JACKHMMER_BINARY_PATH,\n        nhmmer_binary_path=_NHMMER_BINARY_PATH,\n        hmmalign_binary_path=_HMMALIGN_BINARY_PATH,\n        hmmsearch_binary_path=_HMMSEARCH_BINARY_PATH,\n        hmmbuild_binary_path=_HMMBUILD_BINARY_PATH,\n        
small_bfd_database_path=small_bfd_database_path,\n        mgnify_database_path=mgnify_database_path,\n        uniprot_cluster_annot_database_path=uniprot_cluster_annot_database_path,\n        uniref90_database_path=uniref90_database_path,\n        ntrna_database_path=ntrna_database_path,\n        rfam_database_path=rfam_database_path,\n        rna_central_database_path=rna_central_database_path,\n        pdb_database_path=pdb_database_path,\n        seqres_database_path=seqres_database_path,\n        max_template_date=datetime.date(2021, 9, 30),\n    )\n    test_input = {\n        'name': '5tgy',\n        'modelSeeds': [1234],\n        'sequences': [\n            {\n                'protein': {\n                    'id': 'P',\n                    'sequence': (\n                        'SEFEKLRQTGDELVQAFQRLREIFDKGDDDSLEQVLEEIEELIQKHRQLFDNRQEAADTEAAKQGDQWVQLFQRFREAIDKGDKDSLEQLLEELEQALQKIRELAEKKN'\n                    ),\n                    'modifications': [],\n                    'unpairedMsa': None,\n                    'pairedMsa': None,\n                }\n            },\n            {'ligand': {'id': 'LL', 'ccdCodes': ['7BU']}},\n        ],\n        'dialect': folding_input.JSON_DIALECT,\n        'version': folding_input.JSON_VERSION,\n    }\n    self._test_input_json = json.dumps(test_input)\n    self._model_config = run_alphafold.make_model_config(\n        flash_attention_implementation='triton',\n        return_embeddings=True,\n        return_distogram=True,\n    )\n    self._runner = run_alphafold.ModelRunner(\n        config=self._model_config,\n        device=jax.local_devices()[0],\n        model_dir=pathlib.Path(run_alphafold.MODEL_DIR.value),\n    )\n\n  def test_model_inference(self):\n    \"\"\"Run model inference and assert that output exists.\"\"\"\n    featurised_examples = pickle.loads(\n        (resources.ROOT / 'test_data' / 'featurised_example.pkl').read_bytes()\n    )\n\n    self.assertLen(featurised_examples, 1)\n    featurised_example = 
featurised_examples[0]\n    result = self._runner.run_inference(\n        featurised_example, jax.random.PRNGKey(0)\n    )\n    self.assertIsNotNone(result)\n    inference_results = self._runner.extract_inference_results(\n        batch=featurised_example, result=result, target_name='target'\n    )\n    embeddings = self._runner.extract_embeddings(\n        result=result,\n        num_tokens=len(inference_results[0].metadata['token_chain_ids']),\n    )\n    self.assertLen(embeddings, 2)\n\n  def test_process_fold_input_runs_only_inference(self):\n    with self.assertRaisesRegex(ValueError, 'missing unpaired MSA.'):\n      run_alphafold.process_fold_input(\n          fold_input=folding_input.Input.from_json(self._test_input_json),\n          # No data pipeline config, so featurisation will run first, and fail\n          # since the input is missing MSAs.\n          data_pipeline_config=None,\n          model_runner=self._runner,\n          output_dir=self.create_tempdir().full_path,\n      )\n\n  @parameterized.named_parameters(\n      {\n          'testcase_name': 'default_bucket',\n          'bucket': None,\n          'seed': 1,\n      },\n      {\n          'testcase_name': 'bucket_1024',\n          'bucket': 1024,\n          'seed': 42,\n      },\n  )\n  def test_inference(self, bucket, seed):\n    \"\"\"Run AlphaFold 3 inference.\"\"\"\n\n    ### Prepare inputs with modified seed.\n    fold_input = folding_input.Input.from_json(self._test_input_json)\n    fold_input = dataclasses.replace(fold_input, rng_seeds=[seed])\n\n    output_dir = self.create_tempdir().full_path\n    actual = run_alphafold.process_fold_input(\n        fold_input,\n        self._data_pipeline_config,\n        model_runner=run_alphafold.ModelRunner(\n            config=self._model_config,\n            device=jax.local_devices(backend='gpu')[0],\n            model_dir=pathlib.Path(run_alphafold.MODEL_DIR.value),\n        ),\n        output_dir=output_dir,\n        buckets=None if bucket is 
None else [bucket],\n    )\n    logging.info('finished get_inference_result')\n    expected_model_cif_filename = f'{fold_input.sanitised_name()}_model.cif'\n    expected_summary_confidences_filename = (\n        f'{fold_input.sanitised_name()}_summary_confidences.json'\n    )\n    expected_confidences_filename = (\n        f'{fold_input.sanitised_name()}_confidences.json'\n    )\n    expected_data_json_filename = f'{fold_input.sanitised_name()}_data.json'\n\n    prefix = f'seed-{seed}'\n    self.assertSameElements(\n        os.listdir(output_dir),\n        [\n            # Subdirectories, one for each sample and one for embeddings.\n            f'{prefix}_sample-0',\n            f'{prefix}_sample-1',\n            f'{prefix}_sample-2',\n            f'{prefix}_sample-3',\n            f'{prefix}_sample-4',\n            f'{prefix}_embeddings',\n            f'{prefix}_distogram',\n            # Top ranking result.\n            expected_confidences_filename,\n            expected_model_cif_filename,\n            expected_summary_confidences_filename,\n            # Ranking scores for all samples.\n            f'{fold_input.sanitised_name()}_ranking_scores.csv',\n            # The input JSON defining the job.\n            expected_data_json_filename,\n            # The output terms of use.\n            'TERMS_OF_USE.md',\n        ],\n    )\n\n    for sample_index in range(5):\n      sample_dir = os.path.join(output_dir, f'{prefix}_sample-{sample_index}')\n      sample_prefix = (\n          f'{fold_input.sanitised_name()}_seed-{seed}_sample-{sample_index}'\n      )\n      self.assertSameElements(\n          os.listdir(sample_dir),\n          [\n              f'{sample_prefix}_confidences.json',\n              f'{sample_prefix}_model.cif',\n              f'{sample_prefix}_summary_confidences.json',\n          ],\n      )\n\n    embeddings_dir = os.path.join(output_dir, f'{prefix}_embeddings')\n    embeddings_filename = (\n        
f'{fold_input.sanitised_name()}_{prefix}_embeddings.npz'\n    )\n    self.assertSameElements(os.listdir(embeddings_dir), [embeddings_filename])\n\n    with open(os.path.join(embeddings_dir, embeddings_filename), 'rb') as f:\n      embeddings = np.load(f)\n      self.assertSameElements(\n          embeddings.keys(), ['single_embeddings', 'pair_embeddings']\n      )\n      # Ligand 7BU has 41 tokens.\n      num_tokens = len(fold_input.protein_chains[0].sequence) + 41\n      self.assertEqual(embeddings['single_embeddings'].shape, (num_tokens, 384))\n      self.assertEqual(embeddings['single_embeddings'].dtype, np.float16)\n      self.assertEqual(\n          embeddings['pair_embeddings'].shape, (num_tokens, num_tokens, 128)\n      )\n      self.assertEqual(embeddings['pair_embeddings'].dtype, np.float16)\n\n    distogram_dir = os.path.join(output_dir, f'{prefix}_distogram')\n    distogram_filename = f'{fold_input.sanitised_name()}_{prefix}_distogram.npz'\n    self.assertSameElements(os.listdir(distogram_dir), [distogram_filename])\n\n    with open(os.path.join(distogram_dir, distogram_filename), 'rb') as f:\n      distogram = np.load(f)['distogram']\n      self.assertEqual(distogram.shape, (num_tokens, num_tokens, 64))\n      self.assertEqual(distogram.dtype, np.float16)\n\n    with open(os.path.join(output_dir, expected_data_json_filename), 'rt') as f:\n      actual_input_json = json.load(f)\n\n    self.assertEqual(\n        actual_input_json['sequences'][0]['protein']['sequence'],\n        fold_input.protein_chains[0].sequence,\n    )\n    self.assertSequenceEqual(\n        actual_input_json['sequences'][1]['ligand']['ccdCodes'],\n        fold_input.ligands[0].ccd_ids,\n    )\n    self.assertNotEmpty(\n        actual_input_json['sequences'][0]['protein']['unpairedMsa']\n    )\n    self.assertNotEmpty(\n        actual_input_json['sequences'][0]['protein']['pairedMsa']\n    )\n    self.assertIsNotNone(\n        
actual_input_json['sequences'][0]['protein']['templates']\n    )\n\n    ranking_scores_filename = (\n        f'{fold_input.sanitised_name()}_ranking_scores.csv'\n    )\n    with open(os.path.join(output_dir, ranking_scores_filename), 'rt') as f:\n      ranking_scores = list(csv.DictReader(f))\n\n    self.assertLen(ranking_scores, 5)\n    self.assertEqual([int(s['seed']) for s in ranking_scores], [seed] * 5)\n    self.assertEqual(\n        [int(s['sample']) for s in ranking_scores], [0, 1, 2, 3, 4]\n    )\n\n    # Ranking score should be in the expected range for all samples.\n    ranking_scores = [float(s['ranking_score']) for s in ranking_scores]\n    lower = 0.66\n    upper = 0.78\n    scores_ok = [lower <= score <= upper for score in ranking_scores]\n    if not all(scores_ok):\n      printable_scores = [f'{score:.2f}' for score in ranking_scores]\n      self.fail(\n          f'Ranking scores {printable_scores} not in expected range '\n          f'[{lower:.2f}, {upper:.2f}]'\n      )\n\n    with open(os.path.join(output_dir, 'TERMS_OF_USE.md'), 'rt') as f:\n      actual_terms_of_use = f.read()\n    self.assertStartsWith(\n        actual_terms_of_use, '# ALPHAFOLD 3 OUTPUT TERMS OF USE'\n    )\n\n    bucket_label = 'default' if bucket is None else bucket\n    output_filename = f'run_alphafold_test_output_bucket_{bucket_label}.pkl'\n\n    # Convert to dict to enable simple serialization.\n    actual_dict = [\n        dict(\n            seed=actual_inf.seed,\n            inference_results=actual_inf.inference_results,\n            full_fold_input=actual_inf.full_fold_input,\n        )\n        for actual_inf in actual\n    ]\n    with _output(output_filename) as (_, output):\n      output.write(pickle.dumps(actual_dict))\n\n    logging.info('Comparing inference results with expected values.')\n\n    ### Assert that output is as expected.\n    expected_dict = pickle.loads(\n        (\n            resources.ROOT\n            / 'test_data'\n            / 
'alphafold_run_outputs'\n            / output_filename\n        ).read_bytes()\n    )\n    expected = [\n        run_alphafold.ResultsForSeed(**expected_inf)\n        for expected_inf in expected_dict\n    ]\n\n    actual_rmsds = []\n    mask_proportions = []\n    actual_masked_rmsds = []\n    for actual_inf, expected_inf in zip(actual, expected, strict=True):\n      for actual_inf, expected_inf in zip(\n          actual_inf.inference_results,\n          expected_inf.inference_results,\n          strict=True,\n      ):\n        # Make sure the token chain IDs are the same as the input chain IDs.\n        self.assertEqual(\n            actual_inf.metadata['token_chain_ids'],\n            ['P'] * len(fold_input.protein_chains[0].sequence) + ['LL'] * 41,\n        )\n        # All atom occupancies should be 1.0.\n        np.testing.assert_array_equal(\n            actual_inf.predicted_structure.atom_occupancy,\n            [1.0] * actual_inf.predicted_structure.num_atoms,\n        )\n        actual_rmsds.append(\n            alignment.rmsd_from_coords(\n                decoy_coords=actual_inf.predicted_structure.coords,\n                gt_coords=expected_inf.predicted_structure.coords,\n            )\n        )\n        # Mask out atoms with b_factor < 80.0 (i.e. 
lower confidence regions).\n        mask = actual_inf.predicted_structure.atom_b_factor > 80.0\n        mask_proportions.append(\n            np.sum(mask) / actual_inf.predicted_structure.num_atoms\n        )\n        actual_masked_rmsds.append(\n            alignment.rmsd_from_coords(\n                decoy_coords=actual_inf.predicted_structure.coords,\n                gt_coords=expected_inf.predicted_structure.coords,\n                include_idxs=mask,\n            )\n        )\n    # 5tgy is stably predicted, samples should be all within 3.0 RMSD\n    # regardless of seed, bucket, device type, etc.\n    if any(rmsd > 3.0 for rmsd in actual_rmsds):\n      self.fail(f'Full RMSD too high: {actual_rmsds=}')\n    # Check proportion of atoms with b_factor > 80 is at least 70%.\n    if any(prop < 0.7 for prop in mask_proportions):\n      self.fail(f'Too many residues with low pLDDT: {mask_proportions=}')\n    # Check masked RMSD is within tolerance (lower than full RMSD due to masking\n    # of lower confidence regions).\n    if any(rmsd > 1.4 for rmsd in actual_masked_rmsds):\n      self.fail(f'Masked RMSD too high: {actual_masked_rmsds=}')\n\n\nif __name__ == '__main__':\n  absltest.main()\n"
  },
  {
    "path": "src/alphafold3/__init__.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"An implementation of the inference pipeline of AlphaFold 3.\"\"\"\n"
  },
  {
    "path": "src/alphafold3/build_data.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Script for building intermediate data.\"\"\"\n\nfrom importlib import resources\nimport os\nimport pathlib\nimport site\n\nimport alphafold3.constants.converters\nfrom alphafold3.constants.converters import ccd_pickle_gen\nfrom alphafold3.constants.converters import chemical_component_sets_gen\n\n\ndef build_data():\n  \"\"\"Builds intermediate data.\"\"\"\n  libcifpp_data_dir = os.environ.get('LIBCIFPP_DATA_DIR')\n  if libcifpp_data_dir:\n    cif_path = pathlib.Path(libcifpp_data_dir) / 'components.cif'\n  else:\n    for site_path in site.getsitepackages():\n      path = pathlib.Path(site_path) / 'share/libcifpp/components.cif'\n      if path.exists():\n        cif_path = path\n        break\n    else:\n      raise ValueError(\n          'Could not find components.cif. If libcifpp is installed in a'\n          ' non-standard location, please set the LIBCIFPP_DATA_DIR environment'\n          ' variable to the directory where libcifpp is installed.'\n      )\n\n  out_root = resources.files(alphafold3.constants.converters)\n  ccd_pickle_path = out_root.joinpath('ccd.pickle')\n  chemical_component_sets_pickle_path = out_root.joinpath(\n      'chemical_component_sets.pickle'\n  )\n  ccd_pickle_gen.main(['', str(cif_path), str(ccd_pickle_path)])\n  chemical_component_sets_gen.main(\n      ['', str(chemical_component_sets_pickle_path)]\n  )\n"
  },
  {
    "path": "src/alphafold3/common/base_config.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Config for the protein folding model and experiment.\"\"\"\n\nfrom collections.abc import Mapping\nimport copy\nimport dataclasses\nimport types\nimport typing\nfrom typing import Any, ClassVar, TypeVar\n\n\n_T = TypeVar('_T')\n_ConfigT = TypeVar('_ConfigT', bound='BaseConfig')\n\n\ndef _strip_optional(t: type[Any]) -> type[Any]:\n  \"\"\"Transforms type annotations of the form `T | None` to `T`.\"\"\"\n  if typing.get_origin(t) in (typing.Union, types.UnionType):\n    args = set(typing.get_args(t)) - {types.NoneType}\n    if len(args) == 1:\n      return args.pop()\n  return t\n\n\n_NO_UPDATE = object()\n\n\nclass _Autocreate:\n\n  def __init__(self, **defaults: Any):\n    self.defaults = defaults\n\n\ndef autocreate(**defaults: Any) -> Any:\n  \"\"\"Marks a field as having a default factory derived from its type.\"\"\"\n  return _Autocreate(**defaults)\n\n\ndef _clone_field(\n    field: dataclasses.Field[_T], new_default: _T\n) -> dataclasses.Field[_T]:\n  if new_default is _NO_UPDATE:\n    return copy.copy(field)\n  return dataclasses.field(\n      default=new_default,\n      init=True,\n      kw_only=True,\n      repr=field.repr,\n      hash=field.hash,\n      compare=field.compare,\n      metadata=field.metadata,\n  )\n\n\n@typing.dataclass_transform()\nclass ConfigMeta(type):\n  \"\"\"Metaclass that synthesizes a __post_init__ that coerces dicts to Config subclass instances.\"\"\"\n\n  def __new__(mcs, name, 
bases, classdict):\n    cls = super().__new__(mcs, name, bases, classdict)\n\n    def _coercable_fields(self) -> Mapping[str, tuple[ConfigMeta, Any]]:\n      type_hints = typing.get_type_hints(self.__class__)\n      fields = dataclasses.fields(self.__class__)\n      field_to_type_and_default = {\n          field.name: (_strip_optional(type_hints[field.name]), field.default)\n          for field in fields\n      }\n      coercable_fields = {\n          f: t\n          for f, t in field_to_type_and_default.items()\n          if issubclass(type(t[0]), ConfigMeta)\n      }\n      return coercable_fields\n\n    cls._coercable_fields = property(_coercable_fields)\n\n    old_post_init = getattr(cls, '__post_init__', None)\n\n    def _post_init(self) -> None:\n      # Use get_type_hints instead of Field.type to ensure that forward\n      # references are resolved.\n      for field_name, (\n          field_type,\n          field_default,\n      ) in self._coercable_fields.items():  # pylint: disable=protected-access\n        field_value = getattr(self, field_name)\n        if field_value is None:\n          continue\n        try:\n          match field_value:\n            case _Autocreate():\n              # Construct from field defaults.\n              setattr(self, field_name, field_type(**field_value.defaults))\n            case Mapping():\n              # Field value is not yet a `Config` instance; Assume we can create\n              # one by splatting keys and values.\n              args = {}\n              # Apply default args first, if present.\n              if isinstance(field_default, _Autocreate):\n                args.update(field_default.defaults)\n              args.update(field_value)\n              setattr(self, field_name, field_type(**args))\n            case _:\n              pass\n        except TypeError as e:\n          raise TypeError(\n              f'Failure while coercing field {field_name!r} of'\n              f' {self.__class__.__qualname__}'\n   
       ) from e\n      if old_post_init:\n        old_post_init(self)\n\n    cls.__post_init__ = _post_init\n\n    return dataclasses.dataclass(kw_only=True)(cls)\n\n\nclass BaseConfig(metaclass=ConfigMeta):\n  \"\"\"Config base class.\n\n  Subclassing BaseConfig automatically makes the subclass a kw_only dataclass\n  with a `__post_init__` that coerces BaseConfig-subclass field values from\n  mappings to instances of the right type.\n  \"\"\"\n  # Provided by the dataclasses.dataclass decorator applied in ConfigMeta\n  __dataclass_fields__: ClassVar[dict[str, dataclasses.Field[Any]]]\n\n  # Overridden by metaclass\n  @property\n  def _coercable_fields(self) -> Mapping[str, tuple[type['BaseConfig'], Any]]:\n    return {}\n\n  def as_dict(self) -> Mapping[str, Any]:\n    result = dataclasses.asdict(self)\n    for field_name in self._coercable_fields:\n      field_value = getattr(self, field_name, None)\n      if isinstance(field_value, BaseConfig):\n        result[field_name] = field_value.as_dict()\n    return result\n"
  },
  {
    "path": "src/alphafold3/common/folding_input.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Model input dataclass.\"\"\"\n\nfrom collections.abc import Collection, Iterator, Mapping, Sequence\nimport dataclasses\nimport gzip\nimport json\nimport logging\nimport lzma\nimport os\nimport pathlib\nimport random\nimport re\nimport string\nfrom typing import Any, Final, Self, TypeAlias, cast\n\nfrom alphafold3 import structure\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.constants import residue_names\nfrom alphafold3.cpp import cif_dict\nfrom alphafold3.structure import mmcif as mmcif_lib\nimport rdkit.Chem as rd_chem\nimport zstandard as zstd\n\n\nBondAtomId: TypeAlias = tuple[str, int, str]\n\nJSON_DIALECT: Final[str] = 'alphafold3'\nJSON_VERSIONS: Final[tuple[int, ...]] = (1, 2, 3, 4)\nJSON_VERSION: Final[int] = JSON_VERSIONS[-1]\n\nALPHAFOLDSERVER_JSON_DIALECT: Final[str] = 'alphafoldserver'\nALPHAFOLDSERVER_JSON_VERSION: Final[int] = 1\n\n\ndef _validate_keys(actual: Collection[str], expected: Collection[str]):\n  \"\"\"Validates that the JSON doesn't contain any extra unwanted keys.\"\"\"\n  if bad_keys := set(actual) - set(expected):\n    raise ValueError(f'Unexpected JSON keys in: {\", \".join(sorted(bad_keys))}')\n\n\ndef _read_file(path: pathlib.Path, json_path: pathlib.Path | None) -> str:\n  \"\"\"Reads a maybe compressed (gzip, xz, zstd) file from the given path.\n\n  Args:\n    path: The path to the file to read. 
This can be either absolute path, or a\n      path relative to the JSON file path.\n    json_path: The path to the JSON file. If None, the path must be absolute.\n\n  Returns:\n    The contents of the file.\n  \"\"\"\n  if not path.is_absolute():\n    if json_path is None:\n      raise ValueError('json_path must be specified if path is not absolute.')\n    path = (json_path.parent / path).resolve()\n\n  with open(path, 'rb') as f:\n    first_six_bytes = f.read(6)\n    f.seek(0)\n\n    # Detect the compression type using the magic number in the header.\n    if first_six_bytes[:2] == b'\\x1f\\x8b':\n      with gzip.open(f, 'rt') as gzip_f:\n        return cast(str, gzip_f.read())\n    elif first_six_bytes == b'\\xfd\\x37\\x7a\\x58\\x5a\\x00':\n      with lzma.open(f, 'rt') as xz_f:\n        return cast(str, xz_f.read())\n    elif first_six_bytes[:4] == b'\\x28\\xb5\\x2f\\xfd':\n      with zstd.open(f, 'rt') as zstd_f:\n        return cast(str, zstd_f.read())\n    else:\n      return f.read().decode('utf-8')\n\n\nclass Template:\n  \"\"\"Structural template input.\"\"\"\n\n  __slots__ = ('_mmcif', '_query_to_template')\n\n  def __init__(self, *, mmcif: str, query_to_template_map: Mapping[int, int]):\n    \"\"\"Initializes the template.\n\n    Args:\n      mmcif: The structural template in mmCIF format. 
The mmCIF should have only\n        one protein chain.\n      query_to_template_map: A mapping from query residue index to template\n        residue index.\n    \"\"\"\n    self._mmcif = mmcif\n    # Needed to make the Template class hashable.\n    self._query_to_template = tuple(query_to_template_map.items())\n\n  @property\n  def query_to_template_map(self) -> Mapping[int, int]:\n    return dict(self._query_to_template)\n\n  @property\n  def mmcif(self) -> str:\n    return self._mmcif\n\n  def __hash__(self) -> int:\n    return hash((self._mmcif, tuple(sorted(self._query_to_template))))\n\n  def __eq__(self, other: Self) -> bool:\n    mmcifs_equal = self._mmcif == other._mmcif\n    maps_equal = sorted(self._query_to_template) == sorted(\n        other._query_to_template\n    )\n    return mmcifs_equal and maps_equal\n\n\nclass ProteinChain:\n  \"\"\"Protein chain input.\"\"\"\n\n  __slots__ = (\n      '_id',\n      '_sequence',\n      '_ptms',\n      '_description',\n      '_paired_msa',\n      '_unpaired_msa',\n      '_templates',\n  )\n\n  def __init__(\n      self,\n      *,\n      id: str,  # pylint: disable=redefined-builtin\n      sequence: str,\n      ptms: Sequence[tuple[str, int]],\n      description: str | None = None,\n      paired_msa: str | None = None,\n      unpaired_msa: str | None = None,\n      templates: Sequence[Template] | None = None,\n  ):\n    \"\"\"Initializes a single protein chain input.\n\n    Args:\n      id: Unique protein chain identifier.\n      sequence: The amino acid sequence of the chain.\n      ptms: A list of tuples containing the post-translational modification type\n        and the (1-based) residue index where the modification is applied.\n      description: An optional textual description of the protein chain.\n      paired_msa: Paired A3M-formatted MSA for this chain. This MSA is not\n        deduplicated and will be used to compute paired features. 
If None, this\n        field is unset and must be filled in by the data pipeline before\n        featurisation. If set to an empty string, it will be treated as a custom\n        MSA with no sequences.\n      unpaired_msa: Unpaired A3M-formatted MSA for this chain. This will be\n        deduplicated and used to compute unpaired features. If None, this field\n        is unset and must be filled in by the data pipeline before\n        featurisation. If set to an empty string, it will be treated as a custom\n        MSA with no sequences.\n      templates: A list of structural templates for this chain. If None, this\n        field is unset and must be filled in by the data pipeline before\n        featurisation. The list can be empty or contain up to 20 templates.\n    \"\"\"\n    if not all(res.isalpha() for res in sequence):\n      raise ValueError(f'Protein must contain only letters, got \"{sequence}\"')\n    if any(not 0 < mod[1] <= len(sequence) for mod in ptms):\n      raise ValueError(f'Invalid protein modification index: {ptms}')\n    if any(mod[0].startswith('CCD_') for mod in ptms):\n      raise ValueError(\n          f'Protein ptms must not contain the \"CCD_\" prefix, got {ptms}'\n      )\n    # Use hashable containers for ptms and templates.\n    self._id = id\n    self._sequence = sequence\n    self._ptms = tuple(ptms)\n    self._description = description\n    self._paired_msa = paired_msa\n    self._unpaired_msa = unpaired_msa\n    self._templates = tuple(templates) if templates is not None else None\n\n  @property\n  def id(self) -> str:\n    return self._id\n\n  @property\n  def sequence(self) -> str:\n    \"\"\"Returns a single-letter sequence, taking modifications into account.\n\n    Uses 'X' for all unknown residues.\n    \"\"\"\n    return ''.join([\n        residue_names.letters_three_to_one(r, default='X')\n        for r in self.to_ccd_sequence()\n    ])\n\n  @property\n  def ptms(self) -> Sequence[tuple[str, int]]:\n    return self._ptms\n\n  
@property\n  def description(self) -> str | None:\n    return self._description\n\n  @property\n  def paired_msa(self) -> str | None:\n    return self._paired_msa\n\n  @property\n  def unpaired_msa(self) -> str | None:\n    return self._unpaired_msa\n\n  @property\n  def templates(self) -> Sequence[Template] | None:\n    return self._templates\n\n  def __len__(self) -> int:\n    return len(self._sequence)\n\n  def __eq__(self, other: Self) -> bool:\n    return (\n        self._id == other._id\n        and self._sequence == other._sequence\n        and self._ptms == other._ptms\n        and self._description == other._description\n        and self._paired_msa == other._paired_msa\n        and self._unpaired_msa == other._unpaired_msa\n        and self._templates == other._templates\n    )\n\n  def __hash__(self) -> int:\n    return hash((\n        self._id,\n        self._sequence,\n        self._ptms,\n        self._description,\n        self._paired_msa,\n        self._unpaired_msa,\n        self._templates,\n    ))\n\n  def hash_without_id(self) -> int:\n    \"\"\"Returns a hash ignoring the ID - useful for deduplication.\"\"\"\n    return hash((\n        self._sequence,\n        self._ptms,\n        self._description,\n        self._paired_msa,\n        self._unpaired_msa,\n        self._templates,\n    ))\n\n  @classmethod\n  def from_alphafoldserver_dict(\n      cls, json_dict: Mapping[str, Any], seq_id: str\n  ) -> Self:\n    \"\"\"Constructs ProteinChain from the AlphaFoldServer JSON dict.\"\"\"\n    _validate_keys(\n        json_dict.keys(),\n        {\n            'sequence',\n            'glycans',\n            'modifications',\n            'count',\n            'maxTemplateDate',\n            'useStructureTemplate',\n        },\n    )\n    sequence = json_dict['sequence']\n\n    if 'glycans' in json_dict:\n      raise ValueError(\n          f'Specifying glycans in the `{ALPHAFOLDSERVER_JSON_DIALECT}` format'\n          ' is not supported.'\n      )\n\n   
 if 'maxTemplateDate' in json_dict:\n      raise ValueError(\n          f'Specifying maxTemplateDate in the `{ALPHAFOLDSERVER_JSON_DIALECT}`'\n          ' format is not supported, use the --max_template_date flag instead.'\n      )\n\n    templates = None  # Search for templates unless explicitly disabled.\n    if not json_dict.get('useStructureTemplate', True):\n      templates = []  # Do not use any templates.\n\n    ptms = [\n        (mod['ptmType'].removeprefix('CCD_'), mod['ptmPosition'])\n        for mod in json_dict.get('modifications', [])\n    ]\n    return cls(id=seq_id, sequence=sequence, ptms=ptms, templates=templates)\n\n  @classmethod\n  def from_dict(\n      cls,\n      json_dict: Mapping[str, Any],\n      json_path: pathlib.Path | None = None,\n      seq_id: str | None = None,\n  ) -> Self:\n    \"\"\"Constructs ProteinChain from the AlphaFold JSON dict.\"\"\"\n    json_dict = json_dict['protein']\n    _validate_keys(\n        json_dict.keys(),\n        {\n            'id',\n            'sequence',\n            'modifications',\n            'description',\n            'unpairedMsa',\n            'unpairedMsaPath',\n            'pairedMsa',\n            'pairedMsaPath',\n            'templates',\n        },\n    )\n\n    sequence = json_dict['sequence']\n    ptms = [\n        (mod['ptmType'], mod['ptmPosition'])\n        for mod in json_dict.get('modifications', [])\n    ]\n\n    unpaired_msa = json_dict.get('unpairedMsa', None)\n    unpaired_msa_path = json_dict.get('unpairedMsaPath', None)\n    if unpaired_msa and unpaired_msa_path:\n      raise ValueError('Only one of unpairedMsa/unpairedMsaPath can be set.')\n    if (\n        unpaired_msa\n        and len(unpaired_msa) < 256\n        and os.path.exists(unpaired_msa)\n    ):\n      raise ValueError(\n          'Set the unpaired MSA path using the \"unpairedMsaPath\" field.'\n      )\n    elif unpaired_msa_path:\n      unpaired_msa = _read_file(pathlib.Path(unpaired_msa_path), json_path)\n\n    
paired_msa = json_dict.get('pairedMsa', None)\n    paired_msa_path = json_dict.get('pairedMsaPath', None)\n    if paired_msa and paired_msa_path:\n      raise ValueError('Only one of pairedMsa/pairedMsaPath can be set.')\n    if paired_msa and len(paired_msa) < 256 and os.path.exists(paired_msa):\n      raise ValueError(\n          'Set the paired MSA path using the \"pairedMsaPath\" field.'\n      )\n    elif paired_msa_path:\n      paired_msa = _read_file(pathlib.Path(paired_msa_path), json_path)\n\n    raw_templates = json_dict.get('templates', None)\n\n    if raw_templates is None:\n      templates = None\n    else:\n      templates = []\n      for raw_template in raw_templates:\n        _validate_keys(\n            raw_template.keys(),\n            {'mmcif', 'mmcifPath', 'queryIndices', 'templateIndices'},\n        )\n        mmcif = raw_template.get('mmcif', None)\n        mmcif_path = raw_template.get('mmcifPath', None)\n        if mmcif and mmcif_path:\n          raise ValueError('Only one of mmcif/mmcifPath can be set.')\n        if mmcif and len(mmcif) < 256 and os.path.exists(mmcif):\n          raise ValueError('Set the template path using the \"mmcifPath\" field.')\n        if mmcif_path:\n          mmcif = _read_file(pathlib.Path(mmcif_path), json_path)\n        query_to_template_map = dict(\n            zip(raw_template['queryIndices'], raw_template['templateIndices'])\n        )\n        templates.append(\n            Template(mmcif=mmcif, query_to_template_map=query_to_template_map)\n        )\n\n    return cls(\n        id=seq_id or json_dict['id'],\n        sequence=sequence,\n        ptms=ptms,\n        description=json_dict.get('description', None),\n        paired_msa=paired_msa,\n        unpaired_msa=unpaired_msa,\n        templates=templates,\n    )\n\n  def to_dict(\n      self, seq_id: str | Sequence[str] | None = None\n  ) -> Mapping[str, Mapping[str, Any]]:\n    \"\"\"Converts ProteinChain to an AlphaFold JSON dict.\"\"\"\n    if 
self._templates is None:\n      templates = None\n    else:\n      templates = [\n          {\n              'mmcif': template.mmcif,\n              'queryIndices': list(template.query_to_template_map.keys()),\n              'templateIndices': (\n                  list(template.query_to_template_map.values()) or None\n              ),\n          }\n          for template in self._templates\n      ]\n    contents = {\n        'id': seq_id or self._id,\n        'sequence': self._sequence,\n        'modifications': [\n            {'ptmType': ptm[0], 'ptmPosition': ptm[1]} for ptm in self._ptms\n        ],\n        'unpairedMsa': self._unpaired_msa,\n        'pairedMsa': self._paired_msa,\n        'templates': templates,\n    }\n    if self._description is not None:\n      contents['description'] = self._description\n    return {'protein': contents}\n\n  def to_ccd_sequence(self) -> Sequence[str]:\n    \"\"\"Converts to a sequence of CCD codes.\"\"\"\n    ccd_coded_seq = [\n        residue_names.PROTEIN_COMMON_ONE_TO_THREE.get(res, residue_names.UNK)\n        for res in self._sequence\n    ]\n    for ptm_code, ptm_index in self._ptms:\n      ccd_coded_seq[ptm_index - 1] = ptm_code\n    return ccd_coded_seq\n\n  def fill_missing_fields(self) -> Self:\n    \"\"\"Fill missing MSA and template fields with default values.\"\"\"\n    return ProteinChain(\n        id=self.id,\n        sequence=self._sequence,\n        ptms=self._ptms,\n        description=self._description,\n        unpaired_msa=self._unpaired_msa or '',\n        paired_msa=self._paired_msa or '',\n        templates=self._templates or [],\n    )\n\n\nclass RnaChain:\n  \"\"\"RNA chain input.\"\"\"\n\n  __slots__ = (\n      '_id',\n      '_sequence',\n      '_modifications',\n      '_description',\n      '_unpaired_msa',\n  )\n\n  def __init__(\n      self,\n      *,\n      id: str,  # pylint: disable=redefined-builtin\n      sequence: str,\n      modifications: Sequence[tuple[str, int]],\n      description: 
str | None = None,\n      unpaired_msa: str | None = None,\n  ):\n    \"\"\"Initializes a single strand RNA chain input.\n\n    Args:\n      id: Unique RNA chain identifier.\n      sequence: The RNA sequence of the chain.\n      modifications: A list of tuples containing the modification type and the\n        (1-based) residue index where the modification is applied.\n      description: An optional textual description of the RNA chain.\n      unpaired_msa: Unpaired A3M-formatted MSA for this chain. This will be\n        deduplicated and used to compute unpaired features. If None, this field\n        is unset and must be filled in by the data pipeline before\n        featurisation. If set to an empty string, it will be treated as a custom\n        MSA with no sequences.\n    \"\"\"\n    if not all(res.isalpha() for res in sequence):\n      raise ValueError(f'RNA must contain only letters, got \"{sequence}\"')\n    if any(not 0 < mod[1] <= len(sequence) for mod in modifications):\n      raise ValueError(f'Invalid RNA modification index: {modifications}')\n    if any(mod[0].startswith('CCD_') for mod in modifications):\n      raise ValueError(\n          'RNA modifications must not contain the \"CCD_\" prefix, got'\n          f' {modifications}'\n      )\n    self._id = id\n    self._sequence = sequence\n    # Use hashable container for modifications.\n    self._modifications = tuple(modifications)\n    self._description = description\n    self._unpaired_msa = unpaired_msa\n\n  @property\n  def id(self) -> str:\n    return self._id\n\n  @property\n  def sequence(self) -> str:\n    \"\"\"Returns a single-letter sequence, taking modifications into account.\n\n    Uses 'N' for all unknown residues.\n    \"\"\"\n    return ''.join([\n        residue_names.letters_three_to_one(r, default='N')\n        for r in self.to_ccd_sequence()\n    ])\n\n  @property\n  def modifications(self) -> Sequence[tuple[str, int]]:\n    return self._modifications\n\n  @property\n  def 
description(self) -> str | None:\n    return self._description\n\n  @property\n  def unpaired_msa(self) -> str | None:\n    return self._unpaired_msa\n\n  def __len__(self) -> int:\n    return len(self._sequence)\n\n  def __eq__(self, other: Self) -> bool:\n    return (\n        self._id == other._id\n        and self._sequence == other._sequence\n        and self._modifications == other._modifications\n        and self._description == other._description\n        and self._unpaired_msa == other._unpaired_msa\n    )\n\n  def __hash__(self) -> int:\n    return hash((\n        self._id,\n        self._sequence,\n        self._modifications,\n        self._description,\n        self._unpaired_msa,\n    ))\n\n  def hash_without_id(self) -> int:\n    \"\"\"Returns a hash ignoring the ID - useful for deduplication.\"\"\"\n    return hash((\n        self._sequence,\n        self._modifications,\n        self._description,\n        self._unpaired_msa,\n    ))\n\n  @classmethod\n  def from_alphafoldserver_dict(\n      cls, json_dict: Mapping[str, Any], seq_id: str\n  ) -> Self:\n    \"\"\"Constructs RnaChain from the AlphaFoldServer JSON dict.\"\"\"\n    _validate_keys(json_dict.keys(), {'sequence', 'modifications', 'count'})\n    sequence = json_dict['sequence']\n    modifications = [\n        (mod['modificationType'].removeprefix('CCD_'), mod['basePosition'])\n        for mod in json_dict.get('modifications', [])\n    ]\n    return cls(id=seq_id, sequence=sequence, modifications=modifications)\n\n  @classmethod\n  def from_dict(\n      cls,\n      json_dict: Mapping[str, Any],\n      json_path: pathlib.Path | None = None,\n      seq_id: str | None = None,\n  ) -> Self:\n    \"\"\"Constructs RnaChain from the AlphaFold JSON dict.\"\"\"\n    json_dict = json_dict['rna']\n    _validate_keys(\n        json_dict.keys(),\n        {\n            'id',\n            'sequence',\n            'modifications',\n            'description',\n            'unpairedMsa',\n            
'unpairedMsaPath',\n        },\n    )\n    sequence = json_dict['sequence']\n    modifications = [\n        (mod['modificationType'], mod['basePosition'])\n        for mod in json_dict.get('modifications', [])\n    ]\n\n    unpaired_msa = json_dict.get('unpairedMsa', None)\n    unpaired_msa_path = json_dict.get('unpairedMsaPath', None)\n    if unpaired_msa and unpaired_msa_path:\n      raise ValueError('Only one of unpairedMsa/unpairedMsaPath can be set.')\n    if (\n        unpaired_msa\n        and len(unpaired_msa) < 256\n        and os.path.exists(unpaired_msa)\n    ):\n      raise ValueError(\n          'Set the unpaired MSA path using the \"unpairedMsaPath\" field.'\n      )\n    elif unpaired_msa_path:\n      unpaired_msa = _read_file(pathlib.Path(unpaired_msa_path), json_path)\n\n    return cls(\n        id=seq_id or json_dict['id'],\n        sequence=sequence,\n        modifications=modifications,\n        description=json_dict.get('description', None),\n        unpaired_msa=unpaired_msa,\n    )\n\n  def to_dict(\n      self, seq_id: str | Sequence[str] | None = None\n  ) -> Mapping[str, Mapping[str, Any]]:\n    \"\"\"Converts RnaChain to an AlphaFold JSON dict.\"\"\"\n    contents = {\n        'id': seq_id or self._id,\n        'sequence': self._sequence,\n        'modifications': [\n            {'modificationType': mod[0], 'basePosition': mod[1]}\n            for mod in self._modifications\n        ],\n        'unpairedMsa': self._unpaired_msa,\n    }\n    if self._description is not None:\n      contents['description'] = self._description\n    return {'rna': contents}\n\n  def to_ccd_sequence(self) -> Sequence[str]:\n    \"\"\"Converts to a sequence of CCD codes.\"\"\"\n    mapping = {r: r for r in residue_names.RNA_TYPES}  # Same 1-letter and CCD.\n    ccd_coded_seq = [\n        mapping.get(res, residue_names.UNK_RNA) for res in self._sequence\n    ]\n    for ccd_code, modification_index in self._modifications:\n      ccd_coded_seq[modification_index - 
1] = ccd_code\n    return ccd_coded_seq\n\n  def fill_missing_fields(self) -> Self:\n    \"\"\"Fill missing MSA fields with default values.\"\"\"\n    return RnaChain(\n        id=self.id,\n        sequence=self.sequence,\n        modifications=self.modifications,\n        unpaired_msa=self._unpaired_msa or '',\n    )\n\n\nclass DnaChain:\n  \"\"\"Single strand DNA chain input.\"\"\"\n\n  __slots__ = ('_id', '_sequence', '_modifications', '_description')\n\n  def __init__(\n      self,\n      *,\n      id: str,  # pylint: disable=redefined-builtin\n      sequence: str,\n      modifications: Sequence[tuple[str, int]],\n      description: str | None = None,\n  ):\n    \"\"\"Initializes a single strand DNA chain input.\n\n    Args:\n      id: Unique DNA chain identifier.\n      sequence: The DNA sequence of the chain.\n      modifications: A list of tuples containing the modification type and the\n        (1-based) residue index where the modification is applied.\n      description: An optional textual description of the DNA chain.\n    \"\"\"\n    if not all(res.isalpha() for res in sequence):\n      raise ValueError(f'DNA must contain only letters, got \"{sequence}\"')\n    if any(not 0 < mod[1] <= len(sequence) for mod in modifications):\n      raise ValueError(f'Invalid DNA modification index: {modifications}')\n    if any(mod[0].startswith('CCD_') for mod in modifications):\n      raise ValueError(\n          'DNA modifications must not contain the \"CCD_\" prefix, got'\n          f' {modifications}'\n      )\n    self._id = id\n    self._sequence = sequence\n    # Use hashable container for modifications.\n    self._modifications = tuple(modifications)\n    self._description = description\n\n  @property\n  def id(self) -> str:\n    return self._id\n\n  @property\n  def sequence(self) -> str:\n    \"\"\"Returns a single-letter sequence, taking modifications into account.\n\n    Uses 'N' for all unknown residues.\n    \"\"\"\n    return ''.join([\n        
residue_names.letters_three_to_one(r, default='N')\n        for r in self.to_ccd_sequence()\n    ])\n\n  @property\n  def description(self) -> str | None:\n    return self._description\n\n  def __len__(self) -> int:\n    return len(self._sequence)\n\n  def __eq__(self, other: Self) -> bool:\n    return (\n        self._id == other._id\n        and self._sequence == other._sequence\n        and self._modifications == other._modifications\n        and self._description == other._description\n    )\n\n  def __hash__(self) -> int:\n    return hash(\n        (self._id, self._sequence, self._modifications, self._description)\n    )\n\n  def modifications(self) -> Sequence[tuple[str, int]]:\n    return self._modifications\n\n  def hash_without_id(self) -> int:\n    \"\"\"Returns a hash ignoring the ID - useful for deduplication.\"\"\"\n    return hash((self._sequence, self._modifications, self._description))\n\n  @classmethod\n  def from_alphafoldserver_dict(\n      cls, json_dict: Mapping[str, Any], seq_id: str\n  ) -> Self:\n    \"\"\"Constructs DnaChain from the AlphaFoldServer JSON dict.\"\"\"\n    _validate_keys(json_dict.keys(), {'sequence', 'modifications', 'count'})\n    sequence = json_dict['sequence']\n    modifications = [\n        (mod['modificationType'].removeprefix('CCD_'), mod['basePosition'])\n        for mod in json_dict.get('modifications', [])\n    ]\n    return cls(id=seq_id, sequence=sequence, modifications=modifications)\n\n  @classmethod\n  def from_dict(\n      cls, json_dict: Mapping[str, Any], seq_id: str | None = None\n  ) -> Self:\n    \"\"\"Constructs DnaChain from the AlphaFold JSON dict.\"\"\"\n    json_dict = json_dict['dna']\n    _validate_keys(\n        json_dict.keys(), {'id', 'sequence', 'modifications', 'description'}\n    )\n    sequence = json_dict['sequence']\n    modifications = [\n        (mod['modificationType'], mod['basePosition'])\n        for mod in json_dict.get('modifications', [])\n    ]\n    return cls(\n        
id=seq_id or json_dict['id'],\n        sequence=sequence,\n        modifications=modifications,\n        description=json_dict.get('description', None),\n    )\n\n  def to_dict(\n      self, seq_id: str | Sequence[str] | None = None\n  ) -> Mapping[str, Mapping[str, Any]]:\n    \"\"\"Converts DnaChain to an AlphaFold JSON dict.\"\"\"\n    contents = {\n        'id': seq_id or self._id,\n        'sequence': self._sequence,\n        'modifications': [\n            {'modificationType': mod[0], 'basePosition': mod[1]}\n            for mod in self._modifications\n        ],\n    }\n    if self._description is not None:\n      contents['description'] = self._description\n    return {'dna': contents}\n\n  def to_ccd_sequence(self) -> Sequence[str]:\n    \"\"\"Converts to a sequence of CCD codes.\"\"\"\n    ccd_coded_seq = [\n        residue_names.DNA_COMMON_ONE_TO_TWO.get(res, residue_names.UNK_DNA)\n        for res in self._sequence\n    ]\n    for ccd_code, modification_index in self._modifications:\n      ccd_coded_seq[modification_index - 1] = ccd_code\n    return ccd_coded_seq\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass Ligand:\n  \"\"\"Ligand input.\n\n  Attributes:\n    id: Unique ligand \"chain\" identifier.\n    ccd_ids: The Chemical Component Dictionary or user-defined CCD IDs of the\n      chemical components of the ligand. Typically, this is just a single ID,\n      but some ligands are composed of multiple components. 
If that is the case,\n      a bond linking these components should be added to the bonded_atom_pairs\n      Input field.\n    smiles: The SMILES representation of the ligand.\n    description: An optional textual description of the ligand.\n  \"\"\"\n\n  id: str\n  ccd_ids: Sequence[str] | None = None\n  smiles: str | None = None\n  description: str | None = None\n\n  def __post_init__(self):\n    if (self.ccd_ids is None) == (self.smiles is None):\n      raise ValueError('Ligand must have one of CCD ID or SMILES set.')\n\n    if self.smiles is not None:\n      mol = rd_chem.MolFromSmiles(self.smiles)\n      if not mol:\n        raise ValueError(f'Unable to make RDKit Mol from SMILES: {self.smiles}')\n\n    # Use hashable types for ccd_ids.\n    if self.ccd_ids is not None:\n      object.__setattr__(self, 'ccd_ids', tuple(self.ccd_ids))\n\n  def __len__(self) -> int:\n    if self.ccd_ids is not None:\n      return len(self.ccd_ids)\n    else:\n      return 1\n\n  def hash_without_id(self) -> int:\n    \"\"\"Returns a hash ignoring the ID - useful for deduplication.\"\"\"\n    return hash((self.ccd_ids, self.smiles, self.description))\n\n  @classmethod\n  def from_alphafoldserver_dict(\n      cls, json_dict: Mapping[str, Any], seq_id: str\n  ) -> Self:\n    \"\"\"Constructs Ligand from the AlphaFoldServer JSON dict.\"\"\"\n    # Ligand can be specified either as a ligand, or ion (special-case).\n    _validate_keys(json_dict.keys(), {'ligand', 'ion', 'count'})\n    if 'ligand' in json_dict:\n      return cls(id=seq_id, ccd_ids=[json_dict['ligand'].removeprefix('CCD_')])\n    elif 'ion' in json_dict:\n      return cls(id=seq_id, ccd_ids=[json_dict['ion']])\n    else:\n      raise ValueError(f'Unknown ligand type: {json_dict}')\n\n  @classmethod\n  def from_dict(\n      cls, json_dict: Mapping[str, Any], seq_id: str | None = None\n  ) -> Self:\n    \"\"\"Constructs Ligand from the AlphaFold JSON dict.\"\"\"\n    json_dict = json_dict['ligand']\n    _validate_keys(\n    
    json_dict.keys(), {'id', 'ccdCodes', 'smiles', 'description'}\n    )\n    if json_dict.get('ccdCodes') and json_dict.get('smiles'):\n      raise ValueError(\n          'Ligand cannot have both CCD code and SMILES set at the same time, '\n          f'got CCD: {json_dict[\"ccdCodes\"]} and SMILES: {json_dict[\"smiles\"]}'\n      )\n\n    if 'ccdCodes' in json_dict:\n      ccd_codes = json_dict['ccdCodes']\n      if not isinstance(ccd_codes, (list, tuple)):\n        raise ValueError(\n            'CCD codes must be a list of strings, got '\n            f'{type(ccd_codes).__name__} instead: {ccd_codes}'\n        )\n      return cls(\n          id=seq_id or json_dict['id'],\n          ccd_ids=ccd_codes,\n          description=json_dict.get('description', None),\n      )\n    elif 'smiles' in json_dict:\n      return cls(\n          id=seq_id or json_dict['id'],\n          smiles=json_dict['smiles'],\n          description=json_dict.get('description', None),\n      )\n    else:\n      raise ValueError(f'Unknown ligand type: {json_dict}')\n\n  def to_dict(\n      self, seq_id: str | Sequence[str] | None = None\n  ) -> Mapping[str, Mapping[str, Any]]:\n    \"\"\"Converts Ligand to an AlphaFold JSON dict.\"\"\"\n    contents = {'id': seq_id or self.id}\n    if self.ccd_ids is not None:\n      contents['ccdCodes'] = self.ccd_ids\n    if self.smiles is not None:\n      contents['smiles'] = self.smiles\n    if self.description is not None:\n      contents['description'] = self.description\n    return {'ligand': contents}\n\n\ndef _sample_rng_seed() -> int:\n  \"\"\"Sample a random seed for AlphaFoldServer job.\"\"\"\n  # See https://alphafoldserver.com/faq#what-are-seeds-and-how-are-they-set.\n  return random.randint(0, 2**32 - 1)\n\n\ndef _validate_user_ccd_keys(keys: Sequence[str], component_name: str) -> None:\n  \"\"\"Validates the keys of the user-defined CCD dictionary.\"\"\"\n  mandatory_keys = (\n      '_chem_comp.id',\n      '_chem_comp.name',\n      
'_chem_comp.type',\n      '_chem_comp.formula',\n      '_chem_comp.mon_nstd_parent_comp_id',\n      '_chem_comp.pdbx_synonyms',\n      '_chem_comp.formula_weight',\n      '_chem_comp_atom.comp_id',\n      '_chem_comp_atom.atom_id',\n      '_chem_comp_atom.type_symbol',\n      '_chem_comp_atom.charge',\n      '_chem_comp_atom.pdbx_model_Cartn_x_ideal',\n      '_chem_comp_atom.pdbx_model_Cartn_y_ideal',\n      '_chem_comp_atom.pdbx_model_Cartn_z_ideal',\n      '_chem_comp_bond.atom_id_1',\n      '_chem_comp_bond.atom_id_2',\n      '_chem_comp_bond.value_order',\n      '_chem_comp_bond.pdbx_aromatic_flag',\n  )\n  if missing_keys := set(mandatory_keys) - set(keys):\n    raise ValueError(\n        f'Component {component_name} in the user-defined CCD is missing these'\n        f' keys: {missing_keys}'\n    )\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass Input:\n  \"\"\"AlphaFold input.\n\n  Attributes:\n    name: The name of the target.\n    chains: Protein chains, RNA chains, DNA chains, or ligands.\n    protein_chains: Protein chains.\n    rna_chains: RNA chains.\n    dna_chains: Single strand DNA chains.\n    ligands: Ligand (including ion) inputs.\n    rng_seeds: Random number generator seeds, one for each model execution.\n    bonded_atom_pairs: A list of tuples of atoms that are bonded to each other.\n      Each atom is defined by a tuple of (chain_id, res_id, atom_name). Chain\n      IDs must be set if there are any bonded atoms. Residue IDs are 1-indexed.\n      Atoms in ligands defined by SMILES can't be bonded since SMILES doesn't\n      define unique atom names.\n    user_ccd: Optional user-defined chemical component dictionary in the CIF\n      format. This can be used to provide additional CCD entries that are not\n      present in the default CCD and thus define arbitrary new ligands. 
This is\n      more expressive than SMILES since it allows to name all atoms within the\n      ligand which in turn makes it possible to define bonds using those atoms.\n  \"\"\"\n\n  name: str\n  chains: Sequence[ProteinChain | RnaChain | DnaChain | Ligand]\n  rng_seeds: Sequence[int]\n  bonded_atom_pairs: Sequence[tuple[BondAtomId, BondAtomId]] | None = None\n  user_ccd: str | None = None\n\n  def __post_init__(self):\n    if not self.rng_seeds:\n      raise ValueError('Input must have at least one RNG seed.')\n\n    if not self.name.strip() or not self.sanitised_name():\n      raise ValueError(\n          'Input name must be non-empty and contain at least one valid'\n          ' character (letters, numbers, dots, dashes, underscores).'\n      )\n\n    chain_ids = [c.id for c in self.chains]\n    if any(not c.id.isalpha() or c.id.islower() for c in self.chains):\n      raise ValueError(f'IDs must be upper case letters, got: {chain_ids}')\n    if len(set(chain_ids)) != len(chain_ids):\n      raise ValueError('Input JSON contains sequences with duplicate IDs.')\n\n    # Use hashable types for chains, rng_seeds, and bonded_atom_pairs.\n    object.__setattr__(self, 'chains', tuple(self.chains))\n    object.__setattr__(self, 'rng_seeds', tuple(self.rng_seeds))\n    if self.bonded_atom_pairs is not None:\n      object.__setattr__(\n          self, 'bonded_atom_pairs', tuple(self.bonded_atom_pairs)\n      )\n\n    if self.user_ccd is not None:\n      for component_name, component_cif in cif_dict.parse_multi_data_cif(\n          self.user_ccd\n      ).items():\n        _validate_user_ccd_keys(component_cif.keys(), component_name)\n\n  @property\n  def protein_chains(self) -> Sequence[ProteinChain]:\n    return [chain for chain in self.chains if isinstance(chain, ProteinChain)]\n\n  @property\n  def rna_chains(self) -> Sequence[RnaChain]:\n    return [chain for chain in self.chains if isinstance(chain, RnaChain)]\n\n  @property\n  def dna_chains(self) -> 
Sequence[DnaChain]:\n    return [chain for chain in self.chains if isinstance(chain, DnaChain)]\n\n  @property\n  def ligands(self) -> Sequence[Ligand]:\n    return [chain for chain in self.chains if isinstance(chain, Ligand)]\n\n  def sanitised_name(self) -> str:\n    \"\"\"Returns sanitised version of the name that can be used as a filename.\"\"\"\n    spaceless_name = self.name.replace(' ', '_')\n    allowed_chars = set(string.ascii_letters + string.digits + '_-.')\n    return ''.join(l for l in spaceless_name if l in allowed_chars)\n\n  @classmethod\n  def from_alphafoldserver_fold_job(cls, fold_job: Mapping[str, Any]) -> Self:\n    \"\"\"Constructs Input from an AlphaFoldServer fold job.\"\"\"\n\n    # Validate the fold job has the correct format.\n    _validate_keys(\n        fold_job.keys(),\n        {'name', 'modelSeeds', 'sequences', 'dialect', 'version'},\n    )\n    if 'dialect' not in fold_job and 'version' not in fold_job:\n      dialect = ALPHAFOLDSERVER_JSON_DIALECT\n      version = ALPHAFOLDSERVER_JSON_VERSION\n    elif 'dialect' in fold_job and 'version' in fold_job:\n      dialect = fold_job['dialect']\n      version = fold_job['version']\n    else:\n      raise ValueError(\n          'AlphaFold Server input JSON must either contain both `dialect` and'\n          ' `version` fields, or neither. 
If neither is specified, it is'\n          f' assumed that `dialect=\"{ALPHAFOLDSERVER_JSON_DIALECT}\"` and'\n          f' `version=\"{ALPHAFOLDSERVER_JSON_VERSION}\"`.'\n      )\n\n    if dialect != ALPHAFOLDSERVER_JSON_DIALECT:\n      raise ValueError(\n          f'AlphaFold Server input JSON has unsupported dialect: {dialect}, '\n          f'expected {ALPHAFOLDSERVER_JSON_DIALECT}.'\n      )\n\n    # For now, there is only one AlphaFold Server JSON version.\n    if version != ALPHAFOLDSERVER_JSON_VERSION:\n      raise ValueError(\n          f'AlphaFold Server input JSON has unsupported version: {version}, '\n          f'expected {ALPHAFOLDSERVER_JSON_VERSION}.'\n      )\n\n    # Parse the chains.\n    chains = []\n    for sequence in fold_job['sequences']:\n      if 'proteinChain' in sequence:\n        for _ in range(sequence['proteinChain'].get('count', 1)):\n          chains.append(\n              ProteinChain.from_alphafoldserver_dict(\n                  sequence['proteinChain'],\n                  seq_id=mmcif_lib.int_id_to_str_id(len(chains) + 1),\n              )\n          )\n      elif 'rnaSequence' in sequence:\n        for _ in range(sequence['rnaSequence'].get('count', 1)):\n          chains.append(\n              RnaChain.from_alphafoldserver_dict(\n                  sequence['rnaSequence'],\n                  seq_id=mmcif_lib.int_id_to_str_id(len(chains) + 1),\n              )\n          )\n      elif 'dnaSequence' in sequence:\n        for _ in range(sequence['dnaSequence'].get('count', 1)):\n          chains.append(\n              DnaChain.from_alphafoldserver_dict(\n                  sequence['dnaSequence'],\n                  seq_id=mmcif_lib.int_id_to_str_id(len(chains) + 1),\n              )\n          )\n      elif 'ion' in sequence:\n        for _ in range(sequence['ion'].get('count', 1)):\n          chains.append(\n              Ligand.from_alphafoldserver_dict(\n                  sequence['ion'],\n                  
seq_id=mmcif_lib.int_id_to_str_id(len(chains) + 1),\n              )\n          )\n      elif 'ligand' in sequence:\n        for _ in range(sequence['ligand'].get('count', 1)):\n          chains.append(\n              Ligand.from_alphafoldserver_dict(\n                  sequence['ligand'],\n                  seq_id=mmcif_lib.int_id_to_str_id(len(chains) + 1),\n              )\n          )\n      else:\n        raise ValueError(f'Unknown sequence type: {sequence}')\n\n    if 'modelSeeds' in fold_job and fold_job['modelSeeds']:\n      rng_seeds = [int(seed) for seed in fold_job['modelSeeds']]\n    else:\n      rng_seeds = [_sample_rng_seed()]\n\n    return cls(name=fold_job['name'], chains=chains, rng_seeds=rng_seeds)\n\n  @classmethod\n  def from_json(\n      cls, json_str: str, json_path: pathlib.Path | None = None\n  ) -> Self:\n    \"\"\"Loads the input from the AlphaFold JSON string.\"\"\"\n    raw_json = json.loads(json_str)\n\n    _validate_keys(\n        raw_json.keys(),\n        {\n            'dialect',\n            'version',\n            'name',\n            'modelSeeds',\n            'sequences',\n            'bondedAtomPairs',\n            'userCCD',\n            'userCCDPath',\n        },\n    )\n\n    if 'dialect' not in raw_json or 'version' not in raw_json:\n      raise ValueError(\n          'AlphaFold 3 input JSON must contain `dialect` and `version` fields.'\n      )\n\n    if raw_json['dialect'] != JSON_DIALECT:\n      raise ValueError(\n          'AlphaFold 3 input JSON has unsupported dialect:'\n          f' {raw_json[\"dialect\"]}, expected {JSON_DIALECT}.'\n      )\n\n    if raw_json['version'] not in JSON_VERSIONS:\n      raise ValueError(\n          'AlphaFold 3 input JSON has unsupported version:'\n          f' {raw_json[\"version\"]}, expected one of {JSON_VERSIONS}.'\n      )\n\n    if 'sequences' not in raw_json:\n      raise ValueError('AlphaFold 3 input JSON does not contain any sequences.')\n\n    if 'modelSeeds' not in raw_json or 
not raw_json['modelSeeds']:\n      raise ValueError(\n          'AlphaFold 3 input JSON must specify at least one rng seed in'\n          ' `modelSeeds`.'\n      )\n\n    sequences = raw_json['sequences']\n\n    # Make sure sequence IDs are all set.\n    raw_sequence_ids = [next(iter(s.values())).get('id') for s in sequences]\n    if all(raw_sequence_ids):\n      sequence_ids = []\n      for sequence_id in raw_sequence_ids:\n        if isinstance(sequence_id, list):\n          sequence_ids.append(sequence_id)\n        else:\n          sequence_ids.append([sequence_id])\n    else:\n      raise ValueError(\n          'AlphaFold 3 input JSON contains sequences with unset IDs.'\n      )\n\n    flat_seq_ids = []\n    for seq_ids in sequence_ids:\n      flat_seq_ids.extend(seq_ids)\n\n    chains = []\n    for seq_ids, sequence in zip(sequence_ids, sequences, strict=True):\n      if len(sequence) != 1:\n        raise ValueError(f'Chain {seq_ids} has more than 1 sequence.')\n      for seq_id in seq_ids:\n        if 'protein' in sequence:\n          chains.append(ProteinChain.from_dict(sequence, json_path, seq_id))\n        elif 'rna' in sequence:\n          chains.append(RnaChain.from_dict(sequence, json_path, seq_id))\n        elif 'dna' in sequence:\n          chains.append(DnaChain.from_dict(sequence, seq_id=seq_id))\n        elif 'ligand' in sequence:\n          chains.append(Ligand.from_dict(sequence, seq_id=seq_id))\n        else:\n          raise ValueError(f'Unknown sequence type: {sequence}')\n\n    smiles_ligand_ids = set(\n        c.id for c in chains if isinstance(c, Ligand) and c.smiles is not None\n    )\n    chain_lengths = {chain.id: len(chain) for chain in chains}\n    bonded_atom_pairs = None\n    if bonds := raw_json.get('bondedAtomPairs'):\n      bonded_atom_pairs = []\n      for bond in bonds:\n        if len(bond) != 2:\n          raise ValueError(f'Bond {bond} must have 2 atoms, got {len(bond)}.')\n        bond_beg, bond_end = bond\n        if (\n    
        len(bond_beg) != 3\n            or not isinstance(bond_beg[0], str)\n            or not isinstance(bond_beg[1], int)\n            or not isinstance(bond_beg[2], str)\n        ):\n          raise ValueError(\n              f'Atom {bond_beg} in bond {bond} must have 3 components: '\n              '(chain_id: str, res_id: int, atom_name: str).'\n          )\n        if (\n            len(bond_end) != 3\n            or not isinstance(bond_end[0], str)\n            or not isinstance(bond_end[1], int)\n            or not isinstance(bond_end[2], str)\n        ):\n          raise ValueError(\n              f'Atom {bond_end} in bond {bond} must have 3 components: '\n              '(chain_id: str, res_id: int, atom_name: str).'\n          )\n        if bond_beg[0] not in flat_seq_ids or bond_end[0] not in flat_seq_ids:\n          raise ValueError(f'Invalid chain ID(s) in bond {bond}')\n        if (\n            not 0 < bond_beg[1] <= chain_lengths[bond_beg[0]]\n            or not 0 < bond_end[1] <= chain_lengths[bond_end[0]]\n        ):\n          raise ValueError(f'Invalid residue ID(s) in bond {bond}')\n        if bond_beg[0] in smiles_ligand_ids:\n          raise ValueError(\n              f'Bond {bond} involves an unsupported SMILES ligand {bond_beg[0]}'\n          )\n        if bond_end[0] in smiles_ligand_ids:\n          raise ValueError(\n              f'Bond {bond} involves an unsupported SMILES ligand {bond_end[0]}'\n          )\n        bonded_atom_pairs.append((tuple(bond_beg), tuple(bond_end)))\n\n      if len(bonded_atom_pairs) != len(set(bonded_atom_pairs)):\n        raise ValueError(f'Bonds are not unique: {bonded_atom_pairs}')\n\n    user_ccd = raw_json.get('userCCD')\n    user_ccd_path = raw_json.get('userCCDPath')\n    if user_ccd and user_ccd_path:\n      raise ValueError('Only one of userCCD/userCCDPath can be set.')\n    if user_ccd and len(user_ccd) < 256 and os.path.exists(user_ccd):\n      raise ValueError('Set the user CCD path using the 
\"userCCDPath\" field.')\n    elif user_ccd_path:\n      user_ccd = _read_file(pathlib.Path(user_ccd_path), json_path)\n\n    return cls(\n        name=raw_json['name'],\n        chains=chains,\n        rng_seeds=[int(seed) for seed in raw_json['modelSeeds']],\n        bonded_atom_pairs=bonded_atom_pairs,\n        user_ccd=user_ccd,\n    )\n\n  @classmethod\n  def from_mmcif(cls, mmcif_str: str, ccd: chemical_components.Ccd) -> Self:\n    \"\"\"Loads the input from an mmCIF string.\n\n    WARNING: Since rng seeds are not stored in mmCIFs, an rng seed is sampled\n    in the returned `Input`.\n\n    Args:\n      mmcif_str: The mmCIF string.\n      ccd: The chemical components dictionary.\n\n    Returns:\n      The input in an Input format.\n    \"\"\"\n\n    struc = structure.from_mmcif(\n        mmcif_str,\n        # Change MSE residues to MET residues.\n        fix_mse_residues=True,\n        # Fix arginine atom names. This is not needed since the input discards\n        # any atom-level data, but kept for consistency with the paper.\n        fix_arginines=True,\n        # Fix unknown DNA residues to the correct unknown DNA residue type.\n        fix_unknown_dna=True,\n        # Do not include water molecules.\n        include_water=False,\n        # Do not include things like DNA/RNA hybrids. 
This will be changed once\n        # we have a way of handling these in the AlphaFold 3 input format.\n        include_other=False,\n        # Include the specific bonds defined in the mmCIF bond table, e.g.\n        # covalent bonds for PTMs.\n        include_bonds=True,\n    )\n\n    # Create default bioassembly, expanding structures implied by stoichiometry.\n    struc = struc.generate_bioassembly(None)\n\n    sequences = struc.chain_single_letter_sequence(\n        include_missing_residues=True\n    )\n\n    chains = []\n    for chain_id, chain_type in zip(\n        struc.group_by_chain.chain_id, struc.group_by_chain.chain_type\n    ):\n      sequence = sequences[chain_id]\n\n      if chain_type in mmcif_names.NON_POLYMER_CHAIN_TYPES:\n        residues = list(struc.chain_res_name_sequence()[chain_id])\n        if all(ccd.get(res) is not None for res in residues):\n          chains.append(Ligand(id=chain_id, ccd_ids=residues))\n        elif len(residues) == 1:\n          comp_name = residues[0]\n          comps = struc.chemical_components_data\n          if comps is None:\n            raise ValueError(\n                'Missing mmCIF chemical components data - this is required for '\n                f'a non-CCD ligand {comp_name} defined using SMILES string.'\n            )\n          chains.append(\n              Ligand(id=chain_id, smiles=comps.chem_comp[comp_name].pdbx_smiles)\n          )\n        else:\n          raise ValueError(\n              'Multi-component ligand must be defined using CCD IDs, defining'\n              ' using SMILES is supported only for single-component ligands. 
'\n              f'Got {residues}'\n          )\n      else:\n        residues = struc.chain_res_name_sequence()[chain_id]\n        fixed = struc.chain_res_name_sequence(\n            fix_non_standard_polymer_res=True\n        )[chain_id]\n        modifications = [\n            (orig, i + 1)\n            for i, (orig, fixed) in enumerate(zip(residues, fixed, strict=True))\n            if orig != fixed\n        ]\n\n        if chain_type == mmcif_names.PROTEIN_CHAIN:\n          chains.append(\n              ProteinChain(id=chain_id, sequence=sequence, ptms=modifications)\n          )\n        elif chain_type == mmcif_names.RNA_CHAIN:\n          chains.append(\n              RnaChain(\n                  id=chain_id, sequence=sequence, modifications=modifications\n              )\n          )\n        elif chain_type == mmcif_names.DNA_CHAIN:\n          chains.append(\n              DnaChain(\n                  id=chain_id, sequence=sequence, modifications=modifications\n              )\n          )\n\n    bonded_atom_pairs = []\n    chain_ids = set(c.id for c in chains)\n    for atom_a, atom_b, _ in struc.iter_bonds():\n      if atom_a['chain_id'] in chain_ids and atom_b['chain_id'] in chain_ids:\n        beg = (atom_a['chain_id'], int(atom_a['res_id']), atom_a['atom_name'])\n        end = (atom_b['chain_id'], int(atom_b['res_id']), atom_b['atom_name'])\n        bonded_atom_pairs.append((beg, end))\n\n    return cls(\n        name=struc.name,\n        chains=chains,\n        # mmCIFs don't store rng seeds, so we need to sample one here.\n        rng_seeds=[_sample_rng_seed()],\n        bonded_atom_pairs=bonded_atom_pairs or None,\n    )\n\n  def to_structure(self, ccd: chemical_components.Ccd) -> structure.Structure:\n    \"\"\"Converts Input to a Structure.\n\n    WARNING: This method does not preserve the rng seeds.\n\n    Args:\n      ccd: The chemical components dictionary.\n\n    Returns:\n      The input in a structure.Structure format.\n    \"\"\"\n    ids: 
list[str] = []\n    sequences: list[str] = []\n    poly_types: list[str] = []\n    formats: list[structure.SequenceFormat] = []\n\n    for chain in self.chains:\n      ids.append(chain.id)\n      match chain:\n        case ProteinChain():\n          sequences.append('(' + ')('.join(chain.to_ccd_sequence()) + ')')\n          poly_types.append(mmcif_names.PROTEIN_CHAIN)\n          formats.append(structure.SequenceFormat.CCD_CODES)\n        case RnaChain():\n          sequences.append('(' + ')('.join(chain.to_ccd_sequence()) + ')')\n          poly_types.append(mmcif_names.RNA_CHAIN)\n          formats.append(structure.SequenceFormat.CCD_CODES)\n        case DnaChain():\n          sequences.append('(' + ')('.join(chain.to_ccd_sequence()) + ')')\n          poly_types.append(mmcif_names.DNA_CHAIN)\n          formats.append(structure.SequenceFormat.CCD_CODES)\n        case Ligand():\n          if chain.ccd_ids is not None:\n            sequences.append('(' + ')('.join(chain.ccd_ids) + ')')\n            if len(chain.ccd_ids) == 1:\n              poly_types.append(mmcif_names.NON_POLYMER_CHAIN)\n            else:\n              poly_types.append(mmcif_names.BRANCHED_CHAIN)\n            formats.append(structure.SequenceFormat.CCD_CODES)\n          elif chain.smiles is not None:\n            # Convert to `<unique ligand ID>:<smiles>` format that is expected\n            # by structure.from_sequences_and_bonds.\n            sequences.append(f'LIG_{chain.id}:{chain.smiles}')\n            poly_types.append(mmcif_names.NON_POLYMER_CHAIN)\n            formats.append(structure.SequenceFormat.LIGAND_SMILES)\n          else:\n            raise ValueError('Ligand must have one of CCD ID or SMILES set.')\n\n    # Remap bond chain IDs from chain IDs to chain indices and convert to\n    # 0-based residue indexing.\n    bonded_atom_pairs = []\n    chain_indices = {cid: i for i, cid in enumerate(ids)}\n    if self.bonded_atom_pairs is not None:\n      for bond_beg, bond_end in 
self.bonded_atom_pairs:\n        bonded_atom_pairs.append((\n            (chain_indices[bond_beg[0]], bond_beg[1] - 1, bond_beg[2]),\n            (chain_indices[bond_end[0]], bond_end[1] - 1, bond_end[2]),\n        ))\n\n    return structure.from_sequences_and_bonds(\n        sequences=sequences,\n        chain_types=poly_types,\n        sequence_formats=formats,\n        chain_ids=ids,\n        bonded_atom_pairs=bonded_atom_pairs,\n        ccd=ccd,\n        name=self.sanitised_name(),\n        bond_type=mmcif_names.COVALENT_BOND,\n        release_date=None,\n    )\n\n  def to_json(self) -> str:\n    \"\"\"Converts Input to an AlphaFold JSON.\"\"\"\n    deduped_chains = {}\n    deduped_chain_ids = {}\n    for chain in self.chains:\n      deduped_chains[chain.hash_without_id()] = chain\n      deduped_chain_ids.setdefault(chain.hash_without_id(), []).append(chain.id)\n\n    sequences = []\n    for chain_content_hash, ids in deduped_chain_ids.items():\n      chain = deduped_chains[chain_content_hash]\n      sequences.append(chain.to_dict(seq_id=ids if len(ids) > 1 else ids[0]))\n\n    alphafold_json = json.dumps(\n        {\n            'dialect': JSON_DIALECT,\n            'version': JSON_VERSION,\n            'name': self.name,\n            'sequences': sequences,\n            'modelSeeds': self.rng_seeds,\n            'bondedAtomPairs': self.bonded_atom_pairs,\n            'userCCD': self.user_ccd,\n        },\n        indent=2,\n    )\n    # Remove newlines from the query/template indices arrays. We match the\n    # queryIndices/templatesIndices with a non-capturing group. 
We then match\n    # the entire region between the square brackets by looking for lines\n    # containing only whitespace, number, or a comma.\n    return re.sub(\n        r'(\"(?:queryIndices|templateIndices)\": \\[)([\\s\\n\\d,]+)(\\],?)',\n        lambda mtch: mtch[1] + re.sub(r'\\n\\s+', ' ', mtch[2].strip()) + mtch[3],\n        alphafold_json,\n    )\n\n  def fill_missing_fields(self) -> Self:\n    \"\"\"Fill missing MSA and template fields with default values.\"\"\"\n    with_missing_fields = [\n        c.fill_missing_fields()\n        if isinstance(c, (ProteinChain, RnaChain))\n        else c\n        for c in self.chains\n    ]\n    return dataclasses.replace(self, chains=with_missing_fields)\n\n  def with_multiple_seeds(self, num_seeds: int) -> Self:\n    \"\"\"Returns a copy of the input with num_seeds rng seeds.\"\"\"\n    if num_seeds <= 1:\n      raise ValueError('Number of seeds must be greater than 1.')\n    if len(self.rng_seeds) != 1:\n      raise ValueError('Input must have one rng seed to set multiple seeds.')\n\n    return dataclasses.replace(\n        self,\n        rng_seeds=list(range(self.rng_seeds[0], self.rng_seeds[0] + num_seeds)),\n    )\n\n\ndef load_fold_inputs_from_path(json_path: pathlib.Path) -> Iterator[Input]:\n  \"\"\"Loads multiple fold inputs from a JSON string.\"\"\"\n  with open(json_path, 'r') as f:\n    json_str = f.read()\n\n  # Parse the JSON string, so we can detect its format.\n  raw_json = json.loads(json_str)\n\n  if isinstance(raw_json, list):\n    # AlphaFold Server JSON.\n    logging.info('Loading %d fold jobs from %s', len(raw_json), json_path)\n    for fold_job_idx, fold_job in enumerate(raw_json):\n      try:\n        yield Input.from_alphafoldserver_fold_job(fold_job)\n      except ValueError as e:\n        raise ValueError(\n            f'Failed to load fold job {fold_job_idx} from {json_path}'\n            f' (AlphaFold Server dialect): {e}'\n        ) from e\n  else:\n    # AlphaFold 3 JSON.\n    try:\n      
yield Input.from_json(json_str, json_path)\n    except ValueError as e:\n      raise ValueError(\n          f'Failed to load input from {json_path} (AlphaFold 3 dialect): {e}'\n      ) from e\n\n\ndef load_fold_inputs_from_dir(input_dir: pathlib.Path) -> Iterator[Input]:\n  \"\"\"Loads multiple fold inputs from all JSON files in a given input_dir.\n\n  Args:\n    input_dir: The directory containing the JSON files.\n\n  Yields:\n    The fold inputs from all JSON files in the input directory.\n  \"\"\"\n  for file_path in sorted(input_dir.glob('*.json')):\n    if not file_path.is_file():\n      continue\n\n    yield from load_fold_inputs_from_path(file_path)\n"
  },
  {
    "path": "src/alphafold3/common/resources.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Load external resources, such as external tools or data resources.\"\"\"\n\nfrom collections.abc import Iterator\nimport os\nimport pathlib\nimport typing\nfrom typing import BinaryIO, Final, Literal, TextIO\n\nfrom importlib import resources\nimport alphafold3.common\n\n\n_DATA_ROOT:  Final[pathlib.Path] = (\n    resources.files(alphafold3.common).joinpath('..').resolve()\n)\nROOT = _DATA_ROOT\n\n\ndef filename(name: str | os.PathLike[str]) -> str:\n  \"\"\"Returns the absolute path to an external resource.\n\n  Note that this calls resources.GetResourceFilename under the hood and hence\n  causes par file unpacking, which might be unfriendly on diskless machines.\n\n\n  Args:\n    name: the name of the resource corresponding to its path relative to the\n      root of the repository.\n  \"\"\"\n  return (_DATA_ROOT / name).as_posix()\n\n\n@typing.overload\ndef open_resource(\n    name: str | os.PathLike[str], mode: Literal['r', 'rt'] = 'rt'\n) -> TextIO:\n  ...\n\n\n@typing.overload\ndef open_resource(\n    name: str | os.PathLike[str], mode: Literal['rb']\n) -> BinaryIO:\n  ...\n\n\ndef open_resource(\n    name: str | os.PathLike[str], mode: str = 'rb'\n) -> TextIO | BinaryIO:\n  \"\"\"Returns an open file object for the named resource.\n\n  Args:\n    name: the name of the resource corresponding to its path relative to the\n      root of the repository.\n    mode: the mode to use when opening the file.\n  \"\"\"\n  
return (_DATA_ROOT / name).open(mode)\n\n\ndef get_resource_dir(path: str | os.PathLike[str]) -> os.PathLike[str]:\n  return _DATA_ROOT / path\n\n\ndef walk(path: str) -> Iterator[tuple[str, list[str], list[str]]]:\n  \"\"\"Walks the directory tree of resources similar to os.walk.\"\"\"\n  return os.walk((_DATA_ROOT / path).as_posix())\n"
  },
  {
    "path": "src/alphafold3/common/safe_pickle.py",
    "content": "# Copyright 2025 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Restricted-safe wrapper around pickle for loading trusted data.\n\nThis prevents arbitrary object instantiation during unpickling by only\nallowing a small allowlist of built-in, innocuous types.\n\nIntended for loading pickled constant data that ships with the repository.\nIf the pickle is tampered with, an UnpicklingError will be raised instead\nof silently executing attacker-controlled bytecode.\n\"\"\"\n\nfrom collections.abc import Collection\nimport pickle\nfrom typing import Any, BinaryIO, Final\n\n\n# Builtin types expected from AlphaFold 3 generated data.\n_ALLOWED_BUILTINS: Final[Collection[str]] = frozenset({\n    \"NoneType\",\n    \"bool\",\n    \"bytes\",\n    \"dict\",\n    \"float\",\n    \"frozenset\",\n    \"int\",\n    \"list\",\n    \"set\",\n    \"str\",\n    \"tuple\",\n})\n\n\nclass _RestrictedUnpickler(pickle.Unpickler):\n  \"\"\"A pickle `Unpickler` that forbids loading arbitrary global classes.\"\"\"\n\n  def find_class(self, module: str, name: str) -> Any:\n    \"\"\"Returns the class for `module` and `name` if allowed.\"\"\"\n    if module == \"builtins\" and name in _ALLOWED_BUILTINS:\n      return super().find_class(module, name)\n    raise pickle.UnpicklingError(f\"Can't unpickle disallowed '{module}.{name}'\")\n\n\ndef load(file_obj: BinaryIO) -> Any:\n  \"\"\"Safely loads pickle data from an already-opened binary file handle.\n\n  Only built-in container/primitive types listed in 
`_ALLOWED_BUILTINS` are\n  permitted. Any attempt to load other types raises `pickle.UnpicklingError`.\n\n  Args:\n    file_obj: A binary file-like object open for reading.\n\n  Returns:\n    The unpickled data.\n  \"\"\"\n\n  return _RestrictedUnpickler(file_obj).load()\n"
  },
  {
    "path": "src/alphafold3/common/testing/data.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Module that provides an abstraction for accessing test data.\"\"\"\n\nimport os\nimport pathlib\nfrom typing import Literal, overload\n\nfrom absl.testing import absltest\n\n\nclass Data:\n  \"\"\"Provides an abstraction for accessing test data.\"\"\"\n\n  def __init__(self, data_dir: os.PathLike[str] | str):\n    \"\"\"Initializes data wrapper, providing users with high level data access.\n\n    Args:\n      data_dir: Directory containing test data.\n    \"\"\"\n    self._data_dir = pathlib.Path(data_dir)\n\n  def path(self, data_name: str | os.PathLike[str] | None = None) -> str:\n    \"\"\"Returns the path to a given test data.\n\n    Args:\n      data_name: the name of the test data file relative to data_dir. 
If not\n        set, this will return the absolute path to the data directory.\n    \"\"\"\n    data_dir_path = (\n        pathlib.Path(absltest.get_default_test_srcdir()) / self._data_dir\n    )\n\n    if data_name:\n      return str(data_dir_path / data_name)\n\n    return str(data_dir_path)\n\n  @overload\n  def load(\n      self, data_name: str | os.PathLike[str], mode: Literal['rt'] = 'rt'\n  ) -> str:\n    ...\n\n  @overload\n  def load(\n      self, data_name: str | os.PathLike[str], mode: Literal['rb'] = 'rb'\n  ) -> bytes:\n    ...\n\n  def load(\n      self, data_name: str | os.PathLike[str], mode: str = 'rt'\n  ) -> str | bytes:\n    \"\"\"Returns the contents of a given test data.\n\n    Args:\n      data_name: the name of the test data file relative to data_dir.\n      mode: the mode in which to read the data file. Defaults to text ('rt').\n    \"\"\"\n    with open(self.path(data_name), mode=mode) as f:\n      return f.read()\n"
  },
  {
    "path": "src/alphafold3/constants/atom_types.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"List of atom types with reverse look-up.\"\"\"\n\nfrom collections.abc import Mapping, Sequence, Set\nimport itertools\nimport sys\nfrom typing import Final\nfrom alphafold3.constants import residue_names\n\n# Note:\n# `sys.intern` places the values in the Python internal db for fast lookup.\n\n# 37 common residue atoms.\nN = sys.intern('N')\nCA = sys.intern('CA')\nC = sys.intern('C')\nCB = sys.intern('CB')\nO = sys.intern('O')\nCG = sys.intern('CG')\nCG1 = sys.intern('CG1')\nCG2 = sys.intern('CG2')\nOG = sys.intern('OG')\nOG1 = sys.intern('OG1')\nSG = sys.intern('SG')\nCD = sys.intern('CD')\nCD1 = sys.intern('CD1')\nCD2 = sys.intern('CD2')\nND1 = sys.intern('ND1')\nND2 = sys.intern('ND2')\nOD1 = sys.intern('OD1')\nOD2 = sys.intern('OD2')\nSD = sys.intern('SD')\nCE = sys.intern('CE')\nCE1 = sys.intern('CE1')\nCE2 = sys.intern('CE2')\nCE3 = sys.intern('CE3')\nNE = sys.intern('NE')\nNE1 = sys.intern('NE1')\nNE2 = sys.intern('NE2')\nOE1 = sys.intern('OE1')\nOE2 = sys.intern('OE2')\nCH2 = sys.intern('CH2')\nNH1 = sys.intern('NH1')\nNH2 = sys.intern('NH2')\nOH = sys.intern('OH')\nCZ = sys.intern('CZ')\nCZ2 = sys.intern('CZ2')\nCZ3 = sys.intern('CZ3')\nNZ = sys.intern('NZ')\nOXT = sys.intern('OXT')\n\n# 29 common nucleic acid atoms.\nC1PRIME = sys.intern(\"C1'\")\nC2 = sys.intern('C2')\nC2PRIME = sys.intern(\"C2'\")\nC3PRIME = sys.intern(\"C3'\")\nC4 = sys.intern('C4')\nC4PRIME = sys.intern(\"C4'\")\nC5 = 
sys.intern('C5')\nC5PRIME = sys.intern(\"C5'\")\nC6 = sys.intern('C6')\nC7 = sys.intern('C7')\nC8 = sys.intern('C8')\nN1 = sys.intern('N1')\nN2 = sys.intern('N2')\nN3 = sys.intern('N3')\nN4 = sys.intern('N4')\nN6 = sys.intern('N6')\nN7 = sys.intern('N7')\nN9 = sys.intern('N9')\nO2 = sys.intern('O2')\nO2PRIME = sys.intern(\"O2'\")\nO3PRIME = sys.intern(\"O3'\")\nO4 = sys.intern('O4')\nO4PRIME = sys.intern(\"O4'\")\nO5PRIME = sys.intern(\"O5'\")\nO6 = sys.intern('O6')\nOP1 = sys.intern('OP1')\nOP2 = sys.intern('OP2')\nOP3 = sys.intern('OP3')\nP = sys.intern('P')\n\n# A list of atoms (excluding hydrogen) for each AA type. PDB naming convention.\nRESIDUE_ATOMS: Mapping[str, tuple[str, ...]] = {\n    residue_names.ALA: (C, CA, CB, N, O),\n    residue_names.ARG: (C, CA, CB, CG, CD, CZ, N, NE, O, NH1, NH2),\n    residue_names.ASN: (C, CA, CB, CG, N, ND2, O, OD1),\n    residue_names.ASP: (C, CA, CB, CG, N, O, OD1, OD2),\n    residue_names.CYS: (C, CA, CB, N, O, SG),\n    residue_names.GLN: (C, CA, CB, CG, CD, N, NE2, O, OE1),\n    residue_names.GLU: (C, CA, CB, CG, CD, N, O, OE1, OE2),\n    residue_names.GLY: (C, CA, N, O),\n    residue_names.HIS: (C, CA, CB, CG, CD2, CE1, N, ND1, NE2, O),\n    residue_names.ILE: (C, CA, CB, CG1, CG2, CD1, N, O),\n    residue_names.LEU: (C, CA, CB, CG, CD1, CD2, N, O),\n    residue_names.LYS: (C, CA, CB, CG, CD, CE, N, NZ, O),\n    residue_names.MET: (C, CA, CB, CG, CE, N, O, SD),\n    residue_names.PHE: (C, CA, CB, CG, CD1, CD2, CE1, CE2, CZ, N, O),\n    residue_names.PRO: (C, CA, CB, CG, CD, N, O),\n    residue_names.SER: (C, CA, CB, N, O, OG),\n    residue_names.THR: (C, CA, CB, CG2, N, O, OG1),\n    residue_names.TRP:\n        (C, CA, CB, CG, CD1, CD2, CE2, CE3, CZ2, CZ3, CH2, N, NE1, O),\n    residue_names.TYR: (C, CA, CB, CG, CD1, CD2, CE1, CE2, CZ, N, O, OH),\n    residue_names.VAL: (C, CA, CB, CG1, CG2, N, O),\n}  # pyformat: disable\n\n# Used to identify backbone for alignment and distance calculation for 
sterics.\nPROTEIN_BACKBONE_ATOMS: tuple[str, ...] = (N, CA, C)\n\n# Naming swaps for ambiguous atom names. Due to symmetries in the amino acids\n# the naming of atoms is ambiguous in 4 of the 20 amino acids. (The LDDT paper\n# lists 7 amino acids as ambiguous, but the naming ambiguities in LEU, VAL and\n# ARG can be resolved by using the 3D constellations of the 'ambiguous' atoms\n# and their neighbours)\nAMBIGUOUS_ATOM_NAMES: Mapping[str, Mapping[str, str]] = {\n    residue_names.ASP: {OD1: OD2},\n    residue_names.GLU: {OE1: OE2},\n    residue_names.PHE: {CD1: CD2, CE1: CE2},\n    residue_names.TYR: {CD1: CD2, CE1: CE2},\n}\n\n# Used when we need to store atom data in a format that requires fixed atom data\n# size for every protein residue (e.g. a numpy array).\nATOM37: tuple[str, ...] = (\n    N, CA, C, CB, O, CG, CG1, CG2, OG, OG1, SG, CD, CD1, CD2, ND1, ND2, OD1,\n    OD2, SD, CE, CE1, CE2, CE3, NE, NE1, NE2, OE1, OE2, CH2, NH1, NH2, OH, CZ,\n    CZ2, CZ3, NZ, OXT)  # pyformat: disable\nATOM37_ORDER: Mapping[str, int] = {name: i for i, name in enumerate(ATOM37)}\nATOM37_NUM: Final[int] = len(ATOM37)  # := 37.\n\n# Used when we need to store protein atom data in a format that requires fixed\n# atom data size for any residue but takes less space than ATOM37 by having 14\n# fields, which is sufficient for storing atoms of all protein residues (e.g. 
a\n# numpy array).\nATOM14: Mapping[str, tuple[str, ...]] = {\n    residue_names.ALA: (N, CA, C, O, CB),\n    residue_names.ARG: (N, CA, C, O, CB, CG, CD, NE, CZ, NH1, NH2),\n    residue_names.ASN: (N, CA, C, O, CB, CG, OD1, ND2),\n    residue_names.ASP: (N, CA, C, O, CB, CG, OD1, OD2),\n    residue_names.CYS: (N, CA, C, O, CB, SG),\n    residue_names.GLN: (N, CA, C, O, CB, CG, CD, OE1, NE2),\n    residue_names.GLU: (N, CA, C, O, CB, CG, CD, OE1, OE2),\n    residue_names.GLY: (N, CA, C, O),\n    residue_names.HIS: (N, CA, C, O, CB, CG, ND1, CD2, CE1, NE2),\n    residue_names.ILE: (N, CA, C, O, CB, CG1, CG2, CD1),\n    residue_names.LEU: (N, CA, C, O, CB, CG, CD1, CD2),\n    residue_names.LYS: (N, CA, C, O, CB, CG, CD, CE, NZ),\n    residue_names.MET: (N, CA, C, O, CB, CG, SD, CE),\n    residue_names.PHE: (N, CA, C, O, CB, CG, CD1, CD2, CE1, CE2, CZ),\n    residue_names.PRO: (N, CA, C, O, CB, CG, CD),\n    residue_names.SER: (N, CA, C, O, CB, OG),\n    residue_names.THR: (N, CA, C, O, CB, OG1, CG2),\n    residue_names.TRP:\n        (N, CA, C, O, CB, CG, CD1, CD2, NE1, CE2, CE3, CZ2, CZ3, CH2),\n    residue_names.TYR: (N, CA, C, O, CB, CG, CD1, CD2, CE1, CE2, CZ, OH),\n    residue_names.VAL: (N, CA, C, O, CB, CG1, CG2),\n    residue_names.UNK: (),\n}  # pyformat: disable\n\n# A compact atom encoding with 14 columns, padded with '' in empty slots.\nATOM14_PADDED: Mapping[str, Sequence[str]] = {\n    k: [v for _, v in itertools.zip_longest(range(14), values, fillvalue='')]\n    for k, values in ATOM14.items()\n}\n\nATOM14_ORDER: Mapping[str, Mapping[str, int]] = {\n    k: {name: i for i, name in enumerate(v)} for k, v in ATOM14.items()\n}\nATOM14_NUM: Final[int] = max(len(v) for v in ATOM14.values())\n\n# Used when we need to store protein and nucleic atom library.\nDENSE_ATOM: Mapping[str, tuple[str, ...]] = {\n    # Protein.\n    residue_names.ALA: (N, CA, C, O, CB),\n    residue_names.ARG: (N, CA, C, O, CB, CG, CD, NE, CZ, NH1, NH2),\n    residue_names.ASN: (N, CA, 
C, O, CB, CG, OD1, ND2),\n    residue_names.ASP: (N, CA, C, O, CB, CG, OD1, OD2),\n    residue_names.CYS: (N, CA, C, O, CB, SG),\n    residue_names.GLN: (N, CA, C, O, CB, CG, CD, OE1, NE2),\n    residue_names.GLU: (N, CA, C, O, CB, CG, CD, OE1, OE2),\n    residue_names.GLY: (N, CA, C, O),\n    residue_names.HIS: (N, CA, C, O, CB, CG, ND1, CD2, CE1, NE2),\n    residue_names.ILE: (N, CA, C, O, CB, CG1, CG2, CD1),\n    residue_names.LEU: (N, CA, C, O, CB, CG, CD1, CD2),\n    residue_names.LYS: (N, CA, C, O, CB, CG, CD, CE, NZ),\n    residue_names.MET: (N, CA, C, O, CB, CG, SD, CE),\n    residue_names.PHE: (N, CA, C, O, CB, CG, CD1, CD2, CE1, CE2, CZ),\n    residue_names.PRO: (N, CA, C, O, CB, CG, CD),\n    residue_names.SER: (N, CA, C, O, CB, OG),\n    residue_names.THR: (N, CA, C, O, CB, OG1, CG2),\n    residue_names.TRP:\n        (N, CA, C, O, CB, CG, CD1, CD2, NE1, CE2, CE3, CZ2, CZ3, CH2),\n    residue_names.TYR: (N, CA, C, O, CB, CG, CD1, CD2, CE1, CE2, CZ, OH),\n    residue_names.VAL: (N, CA, C, O, CB, CG1, CG2),\n    residue_names.UNK: (),\n    # RNA.\n    residue_names.A:\n        (OP3, P, OP1, OP2, O5PRIME, C5PRIME, C4PRIME, O4PRIME, C3PRIME, O3PRIME,\n         C2PRIME, O2PRIME, C1PRIME, N9, C8, N7, C5, C6, N6, N1, C2, N3, C4),\n    residue_names.C:\n        (OP3, P, OP1, OP2, O5PRIME, C5PRIME, C4PRIME, O4PRIME, C3PRIME, O3PRIME,\n         C2PRIME, O2PRIME, C1PRIME, N1, C2, O2, N3, C4, N4, C5, C6),\n    residue_names.G:\n        (OP3, P, OP1, OP2, O5PRIME, C5PRIME, C4PRIME, O4PRIME, C3PRIME, O3PRIME,\n         C2PRIME, O2PRIME, C1PRIME, N9, C8, N7, C5, C6, O6, N1, C2, N2, N3, C4),\n    residue_names.U:\n        (OP3, P, OP1, OP2, O5PRIME, C5PRIME, C4PRIME, O4PRIME, C3PRIME, O3PRIME,\n         C2PRIME, O2PRIME, C1PRIME, N1, C2, O2, N3, C4, O4, C5, C6),\n    residue_names.UNK_RNA: (),\n    # DNA.\n    residue_names.DA:\n        (OP3, P, OP1, OP2, O5PRIME, C5PRIME, C4PRIME, O4PRIME, C3PRIME, O3PRIME,\n         C2PRIME, C1PRIME, N9, C8, N7, C5, C6, N6, N1, C2, 
N3, C4),\n    residue_names.DC:\n        (OP3, P, OP1, OP2, O5PRIME, C5PRIME, C4PRIME, O4PRIME, C3PRIME, O3PRIME,\n         C2PRIME, C1PRIME, N1, C2, O2, N3, C4, N4, C5, C6),\n    residue_names.DG:\n        (OP3, P, OP1, OP2, O5PRIME, C5PRIME, C4PRIME, O4PRIME, C3PRIME, O3PRIME,\n         C2PRIME, C1PRIME, N9, C8, N7, C5, C6, O6, N1, C2, N2, N3, C4),\n    residue_names.DT:\n        (OP3, P, OP1, OP2, O5PRIME, C5PRIME, C4PRIME, O4PRIME, C3PRIME, O3PRIME,\n         C2PRIME, C1PRIME, N1, C2, O2, N3, C4, O4, C5, C7, C6),\n    # Unknown nucleic.\n    residue_names.UNK_DNA: (),\n}  # pyformat: disable\n\nDENSE_ATOM_ORDER: Mapping[str, Mapping[str, int]] = {\n    k: {name: i for i, name in enumerate(v)} for k, v in DENSE_ATOM.items()\n}\nDENSE_ATOM_NUM: Final[int] = max(len(v) for v in DENSE_ATOM.values())\n\n# Used when we need to store atom data in a format that requires fixed atom data\n# size for every nucleic molecule (e.g. a numpy array).\nATOM29: tuple[str, ...] = (\n    \"C1'\", 'C2', \"C2'\", \"C3'\", 'C4', \"C4'\", 'C5', \"C5'\", 'C6', 'C7', 'C8', 'N1',\n    'N2', 'N3', 'N4', 'N6', 'N7', 'N9', 'OP3', 'O2', \"O2'\", \"O3'\", 'O4', \"O4'\",\n    \"O5'\", 'O6', 'OP1', 'OP2', 'P')  # pyformat: disable\nATOM29_ORDER: Mapping[str, int] = {\n    atom_type: i for i, atom_type in enumerate(ATOM29)\n}\nATOM29_NUM: Final[int] = len(ATOM29)  # := 29\n\n# Hydrogens that exist depending on the protonation state of the residue.\n# Extracted from third_party/py/openmm/app/data/hydrogens.xml\nPROTONATION_HYDROGENS: Mapping[str, Set[str]] = {\n    'ASP': {'HD2'},\n    'CYS': {'HG'},\n    'GLU': {'HE2'},\n    'HIS': {'HD1', 'HE2'},\n    'LYS': {'HZ3'},\n}\n"
  },
  {
    "path": "src/alphafold3/constants/chemical_component_sets.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Sets of chemical components.\"\"\"\n\nfrom typing import Final\n\nfrom alphafold3.common import resources\nfrom alphafold3.common import safe_pickle\n\n_CCD_SETS_CCD_PICKLE_FILE = resources.filename(\n    resources.ROOT / 'constants/converters/chemical_component_sets.pickle'\n)\n\nwith open(_CCD_SETS_CCD_PICKLE_FILE, 'rb') as f:\n  _CCD_SET = safe_pickle.load(f)\n\n# Glycan (or 'Saccharide') ligands.\n# _chem_comp.type containing 'saccharide' and 'linking' (when lower-case).\nGLYCAN_LINKING_LIGANDS: Final[frozenset[str]] = _CCD_SET['glycans_linking']\n\n# _chem_comp.type containing 'saccharide' and not 'linking' (when lower-case).\nGLYCAN_OTHER_LIGANDS: Final[frozenset[str]] = _CCD_SET['glycans_other']\n\n# Each of these molecules appears in over 1k PDB structures, are used to\n# facilitate crystallization conditions, but do not have biological relevance.\nCOMMON_CRYSTALLIZATION_AIDS: Final[frozenset[str]] = frozenset({\n    'SO4', 'GOL', 'EDO', 'PO4', 'ACT', 'PEG', 'DMS', 'TRS', 'PGE', 'PG4', 'FMT',\n    'EPE', 'MPD', 'MES', 'CD', 'IOD',\n})  # pyformat: disable\n"
  },
  {
    "path": "src/alphafold3/constants/chemical_components.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Chemical Components found in PDB (CCD) constants.\"\"\"\n\nfrom collections.abc import ItemsView, Iterator, KeysView, Mapping, Sequence, ValuesView\nimport dataclasses\nimport functools\nimport os\n\nfrom alphafold3.common import resources\nfrom alphafold3.common import safe_pickle\nfrom alphafold3.cpp import cif_dict\n\n\n_CCD_PICKLE_FILE = resources.filename(\n    resources.ROOT / 'constants/converters/ccd.pickle'\n)\n\n\n@functools.cache\ndef _load_ccd_pickle_cached(\n    path: os.PathLike[str],\n) -> dict[str, Mapping[str, Sequence[str]]]:\n  \"\"\"Loads the CCD pickle file and caches it so that it is only loaded once.\"\"\"\n  with open(path, 'rb') as f:\n    return safe_pickle.load(f)\n\n\nclass Ccd(Mapping[str, Mapping[str, Sequence[str]]]):\n  \"\"\"Chemical Components found in PDB (CCD) constants.\n\n  See https://academic.oup.com/bioinformatics/article/31/8/1274/212200 for CCD\n  CIF format documentation.\n\n  Wraps the dict to prevent accidental mutation.\n  \"\"\"\n\n  __slots__ = ('_dict', '_ccd_pickle_path')\n\n  def __init__(\n      self,\n      ccd_pickle_path: os.PathLike[str] | None = None,\n      user_ccd: str | None = None,\n  ):\n    \"\"\"Initialises the chemical components dictionary.\n\n    Args:\n      ccd_pickle_path: Path to the CCD pickle file. If None, uses the default\n        CCD pickle file included in the source code.\n      user_ccd: A string containing the user-provided CCD. 
This has to conform\n        to the same format as the CCD, see https://www.wwpdb.org/data/ccd. If\n        provided, takes precedence over the CCD for the same key. This can\n        be used to override specific entries in the CCD if desired.\n    \"\"\"\n    self._ccd_pickle_path = ccd_pickle_path or _CCD_PICKLE_FILE\n    self._dict = _load_ccd_pickle_cached(self._ccd_pickle_path)\n\n    if user_ccd is not None:\n      if not user_ccd:\n        raise ValueError('User CCD cannot be an empty string.')\n      user_ccd_cifs = {\n          key: value.to_dict()\n          for key, value in cif_dict.parse_multi_data_cif(user_ccd).items()\n      }\n      self._dict.update(user_ccd_cifs)\n\n  def __getitem__(self, key: str) -> Mapping[str, Sequence[str]]:\n    return self._dict[key]\n\n  def __contains__(self, key: str) -> bool:\n    return key in self._dict\n\n  def __iter__(self) -> Iterator[str]:\n    return self._dict.__iter__()\n\n  def __len__(self) -> int:\n    return len(self._dict)\n\n  def __hash__(self) -> int:\n    return id(self)  # Ok since this is immutable.\n\n  def get(\n      self, key: str, default: None | Mapping[str, Sequence[str]] = None\n  ) -> Mapping[str, Sequence[str]] | None:\n    return self._dict.get(key, default)\n\n  def items(self) -> ItemsView[str, Mapping[str, Sequence[str]]]:\n    return self._dict.items()\n\n  def values(self) -> ValuesView[Mapping[str, Sequence[str]]]:\n    return self._dict.values()\n\n  def keys(self) -> KeysView[str]:\n    return self._dict.keys()\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass ComponentInfo:\n  name: str\n  type: str\n  pdbx_synonyms: str\n  formula: str\n  formula_weight: str\n  mon_nstd_parent_comp_id: str\n  mon_nstd_flag: str\n  pdbx_smiles: str\n\n\ndef mmcif_to_info(mmcif: Mapping[str, Sequence[str]]) -> ComponentInfo:\n  \"\"\"Converts CCD mmCIFs to component info. 
Missing fields are left empty.\"\"\"\n  names = mmcif['_chem_comp.name']\n  types = mmcif['_chem_comp.type']\n  mon_nstd_parent_comp_ids = mmcif['_chem_comp.mon_nstd_parent_comp_id']\n  pdbx_synonyms = mmcif['_chem_comp.pdbx_synonyms']\n  formulas = mmcif['_chem_comp.formula']\n  formula_weights = mmcif['_chem_comp.formula_weight']\n\n  def front_or_empty(values: Sequence[str]) -> str:\n    return values[0] if values else ''\n\n  type_ = front_or_empty(types)\n  mon_nstd_parent_comp_id = front_or_empty(mon_nstd_parent_comp_ids)\n  if type_.lower() == 'non-polymer':\n    # Unset for non-polymers, e.g. water or ions.\n    mon_nstd_flag = '.'\n  elif mon_nstd_parent_comp_id == '?':\n    # A standard component - it doesn't have a standard parent, e.g. MET.\n    mon_nstd_flag = 'y'\n  else:\n    # A non-standard component, e.g. MSE.\n    mon_nstd_flag = 'n'\n\n  # Default SMILES is the canonical SMILES, but we fall back to the SMILES if a\n  # canonical SMILES is not available. Of canonical SMILES, we prefer ones from\n  # the OpenEye OEToolkits program.\n  canonical_pdbx_smiles = ''\n  fallback_pdbx_smiles = ''\n  descriptor_types = mmcif.get('_pdbx_chem_comp_descriptor.type', [])\n  descriptors = mmcif.get('_pdbx_chem_comp_descriptor.descriptor', [])\n  programs = mmcif.get('_pdbx_chem_comp_descriptor.program', [])\n  for descriptor_type, descriptor, program in zip(\n      descriptor_types, descriptors, programs\n  ):\n    if descriptor_type == 'SMILES_CANONICAL':\n      if (not canonical_pdbx_smiles) or program == 'OpenEye OEToolkits':\n        canonical_pdbx_smiles = descriptor\n    if not fallback_pdbx_smiles and descriptor_type == 'SMILES':\n      fallback_pdbx_smiles = descriptor\n  pdbx_smiles = canonical_pdbx_smiles or fallback_pdbx_smiles\n\n  return ComponentInfo(\n      name=front_or_empty(names),\n      type=type_,\n      pdbx_synonyms=front_or_empty(pdbx_synonyms),\n      formula=front_or_empty(formulas),\n      
formula_weight=front_or_empty(formula_weights),\n      mon_nstd_parent_comp_id=mon_nstd_parent_comp_id,\n      mon_nstd_flag=mon_nstd_flag,\n      pdbx_smiles=pdbx_smiles,\n  )\n\n\n@functools.lru_cache(maxsize=128)\ndef component_name_to_info(ccd: Ccd, res_name: str) -> ComponentInfo | None:\n  component = ccd.get(res_name)\n  if component is None:\n    return None\n  return mmcif_to_info(component)\n\n\ndef type_symbol(ccd: Ccd, res_name: str, atom_name: str) -> str:\n  \"\"\"Returns the element type for the given component name and atom name.\n\n  Args:\n    ccd: The chemical components dictionary.\n    res_name: The component name, e.g. ARG.\n    atom_name: The atom name, e.g. CB, OXT, or NH1.\n\n  Returns:\n    Element type, e.g. C for (ARG, CB), O for (ARG, OXT), N for (ARG, NH1).\n  \"\"\"\n  res = ccd.get(res_name)\n  if res is None:\n    return '?'\n  try:\n    return res['_chem_comp_atom.type_symbol'][\n        res['_chem_comp_atom.atom_id'].index(atom_name)\n    ]\n  except (ValueError, IndexError, KeyError):\n    return '?'\n"
  },
  {
    "path": "src/alphafold3/constants/converters/ccd_pickle_gen.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Reads Chemical Components gz file and generates a CCD pickle file.\"\"\"\n\nfrom collections.abc import Sequence\nimport gzip\nimport pickle\nimport sys\n\nfrom alphafold3.cpp import cif_dict\nimport tqdm\n\n\ndef main(argv: Sequence[str]) -> None:\n  if len(argv) != 3:\n    raise ValueError('Must specify input_file components.cif and output_file')\n\n  _, input_file, output_file = argv\n\n  print(f'Parsing {input_file}', flush=True)\n  if input_file.endswith('.gz'):\n    opener = gzip.open\n  else:\n    opener = open\n\n  with opener(input_file, 'rb') as f:\n    whole_file = f.read()\n  result = {\n      key: value.to_dict()\n      for key, value in tqdm.tqdm(\n          cif_dict.parse_multi_data_cif(whole_file).items(), disable=None\n      )\n  }\n  assert len(result) == whole_file.count(b'data_')\n\n  print(f'Writing {output_file}', flush=True)\n  with open(output_file, 'wb') as f:\n    pickle.dump(result, f, protocol=pickle.HIGHEST_PROTOCOL)\n  print('Done', flush=True)\n\nif __name__ == '__main__':\n  main(sys.argv)\n"
  },
  {
    "path": "src/alphafold3/constants/converters/chemical_component_sets_gen.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Script for updating chemical_component_sets.py.\"\"\"\n\nfrom collections.abc import Mapping, Sequence\nimport pathlib\nimport pickle\nimport re\nimport sys\n\nfrom alphafold3.common import resources\nfrom alphafold3.common import safe_pickle\nimport tqdm\n\n\n_CCD_PICKLE_FILE = resources.filename(\n    'constants/converters/ccd.pickle'\n)\n\n\ndef find_ions_and_glycans_in_ccd(\n    ccd: Mapping[str, Mapping[str, Sequence[str]]],\n) -> dict[str, frozenset[str]]:\n  \"\"\"Finds glycans and ions in all version of CCD.\"\"\"\n  glycans_linking = []\n  glycans_other = []\n  ions = []\n  for name, comp in tqdm.tqdm(ccd.items(), disable=None):\n    if name == 'UNX':\n      continue  # Skip \"unknown atom or ion\".\n    comp_type = comp['_chem_comp.type'][0].lower()\n    # Glycans have the type 'saccharide'.\n    if re.findall(r'\\bsaccharide\\b', comp_type):\n      # Separate out linking glycans from others.\n      if 'linking' in comp_type:\n        glycans_linking.append(name)\n      else:\n        glycans_other.append(name)\n\n    # Ions have the word 'ion' in their name.\n    comp_name = comp['_chem_comp.name'][0].lower()\n    if re.findall(r'\\bion\\b', comp_name):\n      ions.append(name)\n  result = dict(\n      glycans_linking=frozenset(glycans_linking),\n      glycans_other=frozenset(glycans_other),\n      ions=frozenset(ions),\n  )\n\n  return result\n\n\ndef main(argv: Sequence[str]) -> None:\n  if len(argv) != 
2:\n    raise ValueError(\n        'Directory to write to must be specified as a command-line arguments.'\n    )\n\n  print(f'Loading {_CCD_PICKLE_FILE}', flush=True)\n  with open(_CCD_PICKLE_FILE, 'rb') as f:\n    ccd: Mapping[str, Mapping[str, Sequence[str]]] = safe_pickle.load(f)\n  output_path = pathlib.Path(argv[1])\n  output_path.parent.mkdir(exist_ok=True)\n  print('Finding ions and glycans', flush=True)\n  result = find_ions_and_glycans_in_ccd(ccd)\n  print(f'writing to {output_path}', flush=True)\n  with output_path.open('wb') as f:\n    pickle.dump(result, f)\n  print('Done', flush=True)\n\n\nif __name__ == '__main__':\n  main(sys.argv)\n"
  },
  {
    "path": "src/alphafold3/constants/mmcif_names.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Names of things in mmCIF format.\n\nSee https://www.iucr.org/__data/iucr/cifdic_html/2/cif_mm.dic/index.html\n\"\"\"\n\nfrom collections.abc import Mapping, Sequence, Set\nfrom typing import Final\n\nfrom alphafold3.constants import atom_types\nfrom alphafold3.constants import residue_names\n\n\n# The following are all possible values for the \"_entity.type\".\n# https://mmcif.wwpdb.org/dictionaries/mmcif_pdbx_v50.dic/Items/_entity.type.html\nBRANCHED_CHAIN: Final[str] = 'branched'\nMACROLIDE_CHAIN: Final[str] = 'macrolide'\nNON_POLYMER_CHAIN: Final[str] = 'non-polymer'\nPOLYMER_CHAIN: Final[str] = 'polymer'\nWATER: Final[str] = 'water'\n\nCYCLIC_PSEUDO_PEPTIDE_CHAIN: Final[str] = 'cyclic-pseudo-peptide'\nDNA_CHAIN: Final[str] = 'polydeoxyribonucleotide'\nDNA_RNA_HYBRID_CHAIN: Final[str] = (\n    'polydeoxyribonucleotide/polyribonucleotide hybrid'\n)\nOTHER_CHAIN: Final[str] = 'other'\nPEPTIDE_NUCLEIC_ACID_CHAIN: Final[str] = 'peptide nucleic acid'\nPOLYPEPTIDE_D_CHAIN: Final[str] = 'polypeptide(D)'\nPROTEIN_CHAIN: Final[str] = 'polypeptide(L)'\nRNA_CHAIN: Final[str] = 'polyribonucleotide'\n\n# Most common _entity_poly.types.\nSTANDARD_POLYMER_CHAIN_TYPES: Final[Set[str]] = {\n    PROTEIN_CHAIN,\n    DNA_CHAIN,\n    RNA_CHAIN,\n}\n\n# Possible values for _entity.type other than polymer and water.\nLIGAND_CHAIN_TYPES: Final[Set[str]] = {\n    BRANCHED_CHAIN,\n    MACROLIDE_CHAIN,\n    NON_POLYMER_CHAIN,\n}\n\n# Possible 
values for _entity.type other than polymer.\nNON_POLYMER_CHAIN_TYPES: Final[Set[str]] = {\n    *LIGAND_CHAIN_TYPES,\n    WATER,\n}\n\n# Peptide possible values for _entity_poly.type.\nPEPTIDE_CHAIN_TYPES: Final[Set[str]] = {\n    CYCLIC_PSEUDO_PEPTIDE_CHAIN,\n    POLYPEPTIDE_D_CHAIN,\n    PROTEIN_CHAIN,\n    PEPTIDE_NUCLEIC_ACID_CHAIN,\n}\n\n\n# Nucleic-acid possible values for _entity_poly.type.\nNUCLEIC_ACID_CHAIN_TYPES: Final[Set[str]] = {\n    RNA_CHAIN,\n    DNA_CHAIN,\n    DNA_RNA_HYBRID_CHAIN,\n}\n\n# All possible values for _entity_poly.type.\nPOLYMER_CHAIN_TYPES: Final[Set[str]] = {\n    *NUCLEIC_ACID_CHAIN_TYPES,\n    *PEPTIDE_CHAIN_TYPES,\n    OTHER_CHAIN,\n}\n\n\nTERMINAL_OXYGENS: Final[Mapping[str, str]] = {\n    PROTEIN_CHAIN: 'OXT',\n    DNA_CHAIN: 'OP3',\n    RNA_CHAIN: 'OP3',\n}\n\n\n# For each chain type, which atom should be used to represent each residue.\nRESIDUE_REPRESENTATIVE_ATOMS: Final[Mapping[str, str]] = {\n    PROTEIN_CHAIN: atom_types.CA,\n    DNA_CHAIN: atom_types.C1PRIME,\n    RNA_CHAIN: atom_types.C1PRIME,\n}\n\n# Methods involving crystallization. 
See the documentation at\n# mmcif.wwpdb.org/dictionaries/mmcif_pdbx_v50.dic/Items/_exptl.method.html\n# for the full list of experimental methods.\nCRYSTALLIZATION_METHODS: Final[Set[str]] = {\n    'X-RAY DIFFRACTION',\n    'NEUTRON DIFFRACTION',\n    'ELECTRON CRYSTALLOGRAPHY',\n    'POWDER CRYSTALLOGRAPHY',\n    'FIBER DIFFRACTION',\n}\n\n# Possible bond types.\nCOVALENT_BOND: Final[str] = 'covale'\nHYDROGEN_BOND: Final[str] = 'hydrog'\nMETAL_COORDINATION: Final[str] = 'metalc'\nDISULFIDE_BRIDGE: Final[str] = 'disulf'\n\n\ndef is_standard_polymer_type(chain_type: str) -> bool:\n  \"\"\"Returns if chain type is a protein, DNA or RNA chain type.\n\n  Args:\n     chain_type: The type of the chain.\n\n  Returns:\n    A bool for if the chain_type matches protein, DNA, or RNA.\n  \"\"\"\n  return chain_type in STANDARD_POLYMER_CHAIN_TYPES\n\n\ndef guess_polymer_type(chain_residues: Sequence[str]) -> str:\n  \"\"\"Guess the polymer type (protein/rna/dna/other) based on the residues.\n\n  The polymer type is guessed by first checking for any of the standard\n  protein residues. If one is present then the chain is considered to be a\n  polypeptide. Otherwise we decide by counting residue types and deciding by\n  majority voting (e.g. mostly DNA residues -> DNA). If there is a tie between\n  the counts, the ordering is rna > dna > other.\n\n  Note that we count MSE and UNK as protein residues.\n\n  Args:\n    chain_residues: A sequence of full residue name (1-letter for RNA, 2-letters\n      for DNA, 3 for protein). 
The _atom_site.label_comp_id column in mmCIF.\n\n  Returns:\n    The most probable chain type as set in the _entity_poly mmCIF table:\n    protein - polypeptide(L), rna - polyribonucleotide,\n    dna - polydeoxyribonucleotide or other.\n  \"\"\"\n  residue_types = {\n      **{r: RNA_CHAIN for r in residue_names.RNA_TYPES},\n      **{r: DNA_CHAIN for r in residue_names.DNA_TYPES},\n      **{r: PROTEIN_CHAIN for r in residue_names.PROTEIN_TYPES_WITH_UNKNOWN},\n      residue_names.MSE: PROTEIN_CHAIN,\n  }\n\n  counts = {PROTEIN_CHAIN: 0, RNA_CHAIN: 0, DNA_CHAIN: 0, OTHER_CHAIN: 0}\n  for residue in chain_residues:\n    residue_type = residue_types.get(residue, OTHER_CHAIN)\n    # If we ever see a protein residue we'll consider this a polypeptide(L).\n    if residue_type == PROTEIN_CHAIN:\n      return residue_type\n    counts[residue_type] += 1\n\n  # Make sure protein > rna > dna > other if there is a tie.\n  tie_braker = {PROTEIN_CHAIN: 3, RNA_CHAIN: 2, DNA_CHAIN: 1, OTHER_CHAIN: 0}\n\n  def order_fn(item):\n    name, count = item\n    return count, tie_braker[name]\n\n  most_probable_type = max(counts.items(), key=order_fn)[0]\n  return most_probable_type\n\n\ndef fix_non_standard_polymer_res(*, res_name: str, chain_type: str) -> str:\n  \"\"\"Returns the res_name of the closest standard protein/RNA/DNA residue.\n\n  Optimized for the case where a single residue needs to be converted.\n\n  If res_name is already a standard type, it is returned unaltered.\n  If a match cannot be found, returns 'UNK' for protein chains and 'N' for\n    RNA/DNA chains.\n\n  Args:\n     res_name: A residue_name (monomer code from the CCD).\n     chain_type: The type of the chain, must be PROTEIN_CHAIN, RNA_CHAIN or\n       DNA_CHAIN.\n\n  Returns:\n    An element from PROTEIN_TYPES_WITH_UNKNOWN | RNA_TYPES | DNA_TYPES | {'N'}.\n\n  Raises:\n    ValueError: If chain_type not in PEPTIDE_CHAIN_TYPES or\n      {OTHER_CHAIN, RNA_CHAIN, DNA_CHAIN, DNA_RNA_HYBRID_CHAIN}.\n  \"\"\"\n  # Map to 
one letter code, then back to common res_names.\n  one_letter_code = residue_names.letters_three_to_one(res_name, default='X')\n\n  if chain_type in PEPTIDE_CHAIN_TYPES or chain_type == OTHER_CHAIN:\n    return residue_names.PROTEIN_COMMON_ONE_TO_THREE.get(one_letter_code, 'UNK')\n  elif chain_type == RNA_CHAIN:\n    # RNA's CCD monomer code is single-letter.\n    return (\n        one_letter_code if one_letter_code in residue_names.RNA_TYPES else 'N'\n    )\n  elif chain_type == DNA_CHAIN:\n    return residue_names.DNA_COMMON_ONE_TO_TWO.get(one_letter_code, 'N')\n  elif chain_type == DNA_RNA_HYBRID_CHAIN:\n    return (\n        res_name\n        if res_name in residue_names.NUCLEIC_TYPES_WITH_UNKNOWN\n        else 'N'\n    )\n  else:\n    raise ValueError(f'Expected a protein/DNA/RNA chain but got {chain_type}')\n"
  },
  {
    "path": "src/alphafold3/constants/periodic_table.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Periodic table of elements.\"\"\"\n\nfrom collections.abc import Mapping, Sequence\nimport dataclasses\nfrom typing import Final\n\nimport numpy as np\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True)\nclass Element:\n  name: str\n  number: int\n  symbol: str\n  weight: float\n\n\n# Weights taken from rdkit/Code/GraphMol/atomic_data.cpp for compatibility.\n# pylint: disable=invalid-name\n\n# X is an unknown element that can be present in the CCD,\n# https://www.rcsb.org/ligand/UNX.\nX: Final[Element] = Element(name='Unknown', number=0, symbol='X', weight=0.0)\nH: Final[Element] = Element(name='Hydrogen', number=1, symbol='H', weight=1.008)\nHe: Final[Element] = Element(name='Helium', number=2, symbol='He', weight=4.003)\nLi: Final[Element] = Element(\n    name='Lithium', number=3, symbol='Li', weight=6.941\n)\nBe: Final[Element] = Element(\n    name='Beryllium', number=4, symbol='Be', weight=9.012\n)\nB: Final[Element] = Element(name='Boron', number=5, symbol='B', weight=10.812)\nC: Final[Element] = Element(name='Carbon', number=6, symbol='C', weight=12.011)\nN: Final[Element] = Element(\n    name='Nitrogen', number=7, symbol='N', weight=14.007\n)\nO: Final[Element] = Element(name='Oxygen', number=8, symbol='O', weight=15.999)\nF: Final[Element] = Element(\n    name='Fluorine', number=9, symbol='F', weight=18.998\n)\nNe: Final[Element] = Element(name='Neon', number=10, symbol='Ne', weight=20.18)\nNa: 
Final[Element] = Element(\n    name='Sodium', number=11, symbol='Na', weight=22.99\n)\nMg: Final[Element] = Element(\n    name='Magnesium', number=12, symbol='Mg', weight=24.305\n)\nAl: Final[Element] = Element(\n    name='Aluminium', number=13, symbol='Al', weight=26.982\n)\nSi: Final[Element] = Element(\n    name='Silicon', number=14, symbol='Si', weight=28.086\n)\nP: Final[Element] = Element(\n    name='Phosphorus', number=15, symbol='P', weight=30.974\n)\nS: Final[Element] = Element(name='Sulfur', number=16, symbol='S', weight=32.067)\nCl: Final[Element] = Element(\n    name='Chlorine', number=17, symbol='Cl', weight=35.453\n)\nAr: Final[Element] = Element(\n    name='Argon', number=18, symbol='Ar', weight=39.948\n)\nK: Final[Element] = Element(\n    name='Potassium', number=19, symbol='K', weight=39.098\n)\nCa: Final[Element] = Element(\n    name='Calcium', number=20, symbol='Ca', weight=40.078\n)\nSc: Final[Element] = Element(\n    name='Scandium', number=21, symbol='Sc', weight=44.956\n)\nTi: Final[Element] = Element(\n    name='Titanium', number=22, symbol='Ti', weight=47.867\n)\nV: Final[Element] = Element(\n    name='Vanadium', number=23, symbol='V', weight=50.942\n)\nCr: Final[Element] = Element(\n    name='Chromium', number=24, symbol='Cr', weight=51.996\n)\nMn: Final[Element] = Element(\n    name='Manganese', number=25, symbol='Mn', weight=54.938\n)\nFe: Final[Element] = Element(name='Iron', number=26, symbol='Fe', weight=55.845)\nCo: Final[Element] = Element(\n    name='Cobalt', number=27, symbol='Co', weight=58.933\n)\nNi: Final[Element] = Element(\n    name='Nickel', number=28, symbol='Ni', weight=58.693\n)\nCu: Final[Element] = Element(\n    name='Copper', number=29, symbol='Cu', weight=63.546\n)\nZn: Final[Element] = Element(name='Zinc', number=30, symbol='Zn', weight=65.39)\nGa: Final[Element] = Element(\n    name='Gallium', number=31, symbol='Ga', weight=69.723\n)\nGe: Final[Element] = Element(\n    name='Germanium', number=32, symbol='Ge', 
weight=72.61\n)\nAs: Final[Element] = Element(\n    name='Arsenic', number=33, symbol='As', weight=74.922\n)\nSe: Final[Element] = Element(\n    name='Selenium', number=34, symbol='Se', weight=78.96\n)\nBr: Final[Element] = Element(\n    name='Bromine', number=35, symbol='Br', weight=79.904\n)\nKr: Final[Element] = Element(\n    name='Krypton', number=36, symbol='Kr', weight=83.8\n)\nRb: Final[Element] = Element(\n    name='Rubidium', number=37, symbol='Rb', weight=85.468\n)\nSr: Final[Element] = Element(\n    name='Strontium', number=38, symbol='Sr', weight=87.62\n)\nY: Final[Element] = Element(\n    name='Yttrium', number=39, symbol='Y', weight=88.906\n)\nZr: Final[Element] = Element(\n    name='Zirconium', number=40, symbol='Zr', weight=91.224\n)\nNb: Final[Element] = Element(\n    name='Niobium', number=41, symbol='Nb', weight=92.906\n)\nMo: Final[Element] = Element(\n    name='Molybdenum', number=42, symbol='Mo', weight=95.94\n)\nTc: Final[Element] = Element(\n    name='Technetium', number=43, symbol='Tc', weight=98\n)\nRu: Final[Element] = Element(\n    name='Ruthenium', number=44, symbol='Ru', weight=101.07\n)\nRh: Final[Element] = Element(\n    name='Rhodium', number=45, symbol='Rh', weight=102.906\n)\nPd: Final[Element] = Element(\n    name='Palladium', number=46, symbol='Pd', weight=106.42\n)\nAg: Final[Element] = Element(\n    name='Silver', number=47, symbol='Ag', weight=107.868\n)\nCd: Final[Element] = Element(\n    name='Cadmium', number=48, symbol='Cd', weight=112.412\n)\nIn: Final[Element] = Element(\n    name='Indium', number=49, symbol='In', weight=114.818\n)\nSn: Final[Element] = Element(name='Tin', number=50, symbol='Sn', weight=118.711)\nSb: Final[Element] = Element(\n    name='Antimony', number=51, symbol='Sb', weight=121.76\n)\nTe: Final[Element] = Element(\n    name='Tellurium', number=52, symbol='Te', weight=127.6\n)\nI: Final[Element] = Element(\n    name='Iodine', number=53, symbol='I', weight=126.904\n)\nXe: Final[Element] = Element(\n    
name='Xenon', number=54, symbol='Xe', weight=131.29\n)\nCs: Final[Element] = Element(\n    name='Caesium', number=55, symbol='Cs', weight=132.905\n)\nBa: Final[Element] = Element(\n    name='Barium', number=56, symbol='Ba', weight=137.328\n)\nLa: Final[Element] = Element(\n    name='Lanthanum', number=57, symbol='La', weight=138.906\n)\nCe: Final[Element] = Element(\n    name='Cerium', number=58, symbol='Ce', weight=140.116\n)\nPr: Final[Element] = Element(\n    name='Praseodymium', number=59, symbol='Pr', weight=140.908\n)\nNd: Final[Element] = Element(\n    name='Neodymium', number=60, symbol='Nd', weight=144.24\n)\nPm: Final[Element] = Element(\n    name='Promethium', number=61, symbol='Pm', weight=145\n)\nSm: Final[Element] = Element(\n    name='Samarium', number=62, symbol='Sm', weight=150.36\n)\nEu: Final[Element] = Element(\n    name='Europium', number=63, symbol='Eu', weight=151.964\n)\nGd: Final[Element] = Element(\n    name='Gadolinium', number=64, symbol='Gd', weight=157.25\n)\nTb: Final[Element] = Element(\n    name='Terbium', number=65, symbol='Tb', weight=158.925\n)\nDy: Final[Element] = Element(\n    name='Dysprosium', number=66, symbol='Dy', weight=162.5\n)\nHo: Final[Element] = Element(\n    name='Holmium', number=67, symbol='Ho', weight=164.93\n)\nEr: Final[Element] = Element(\n    name='Erbium', number=68, symbol='Er', weight=167.26\n)\nTm: Final[Element] = Element(\n    name='Thulium', number=69, symbol='Tm', weight=168.934\n)\nYb: Final[Element] = Element(\n    name='Ytterbium', number=70, symbol='Yb', weight=173.04\n)\nLu: Final[Element] = Element(\n    name='Lutetium', number=71, symbol='Lu', weight=174.967\n)\nHf: Final[Element] = Element(\n    name='Hafnium', number=72, symbol='Hf', weight=178.49\n)\nTa: Final[Element] = Element(\n    name='Tantalum', number=73, symbol='Ta', weight=180.948\n)\nW: Final[Element] = Element(\n    name='Tungsten', number=74, symbol='W', weight=183.84\n)\nRe: Final[Element] = Element(\n    name='Rhenium', 
number=75, symbol='Re', weight=186.207\n)\nOs: Final[Element] = Element(\n    name='Osmium', number=76, symbol='Os', weight=190.23\n)\nIr: Final[Element] = Element(\n    name='Iridium', number=77, symbol='Ir', weight=192.217\n)\nPt: Final[Element] = Element(\n    name='Platinum', number=78, symbol='Pt', weight=195.078\n)\nAu: Final[Element] = Element(\n    name='Gold', number=79, symbol='Au', weight=196.967\n)\nHg: Final[Element] = Element(\n    name='Mercury', number=80, symbol='Hg', weight=200.59\n)\nTl: Final[Element] = Element(\n    name='Thallium', number=81, symbol='Tl', weight=204.383\n)\nPb: Final[Element] = Element(name='Lead', number=82, symbol='Pb', weight=207.2)\nBi: Final[Element] = Element(\n    name='Bismuth', number=83, symbol='Bi', weight=208.98\n)\nPo: Final[Element] = Element(\n    name='Polonium', number=84, symbol='Po', weight=209\n)\nAt: Final[Element] = Element(\n    name='Astatine', number=85, symbol='At', weight=210\n)\nRn: Final[Element] = Element(name='Radon', number=86, symbol='Rn', weight=222)\nFr: Final[Element] = Element(\n    name='Francium', number=87, symbol='Fr', weight=223\n)\nRa: Final[Element] = Element(name='Radium', number=88, symbol='Ra', weight=226)\nAc: Final[Element] = Element(\n    name='Actinium', number=89, symbol='Ac', weight=227\n)\nTh: Final[Element] = Element(\n    name='Thorium', number=90, symbol='Th', weight=232.038\n)\nPa: Final[Element] = Element(\n    name='Protactinium', number=91, symbol='Pa', weight=231.036\n)\nU: Final[Element] = Element(\n    name='Uranium', number=92, symbol='U', weight=238.029\n)\nNp: Final[Element] = Element(\n    name='Neptunium', number=93, symbol='Np', weight=237\n)\nPu: Final[Element] = Element(\n    name='Plutonium', number=94, symbol='Pu', weight=244\n)\nAm: Final[Element] = Element(\n    name='Americium', number=95, symbol='Am', weight=243\n)\nCm: Final[Element] = Element(name='Curium', number=96, symbol='Cm', weight=247)\nBk: Final[Element] = Element(\n    name='Berkelium', 
number=97, symbol='Bk', weight=247\n)\nCf: Final[Element] = Element(\n    name='Californium', number=98, symbol='Cf', weight=251\n)\nEs: Final[Element] = Element(\n    name='Einsteinium', number=99, symbol='Es', weight=252\n)\nFm: Final[Element] = Element(\n    name='Fermium', number=100, symbol='Fm', weight=257\n)\nMd: Final[Element] = Element(\n    name='Mendelevium', number=101, symbol='Md', weight=258\n)\nNo: Final[Element] = Element(\n    name='Nobelium', number=102, symbol='No', weight=259\n)\nLr: Final[Element] = Element(\n    name='Lawrencium', number=103, symbol='Lr', weight=262\n)\nRf: Final[Element] = Element(\n    name='Rutherfordium', number=104, symbol='Rf', weight=267\n)\nDb: Final[Element] = Element(\n    name='Dubnium', number=105, symbol='Db', weight=268\n)\nSg: Final[Element] = Element(\n    name='Seaborgium', number=106, symbol='Sg', weight=269\n)\nBh: Final[Element] = Element(\n    name='Bohrium', number=107, symbol='Bh', weight=270\n)\nHs: Final[Element] = Element(\n    name='Hassium', number=108, symbol='Hs', weight=269\n)\nMt: Final[Element] = Element(\n    name='Meitnerium', number=109, symbol='Mt', weight=278\n)\nDs: Final[Element] = Element(\n    name='Darmstadtium', number=110, symbol='Ds', weight=281\n)\nRg: Final[Element] = Element(\n    name='Roentgenium', number=111, symbol='Rg', weight=281\n)\nCn: Final[Element] = Element(\n    name='Copernicium', number=112, symbol='Cn', weight=285\n)\nNh: Final[Element] = Element(\n    name='Nihonium', number=113, symbol='Nh', weight=284\n)\nFl: Final[Element] = Element(\n    name='Flerovium', number=114, symbol='Fl', weight=289\n)\nMc: Final[Element] = Element(\n    name='Moscovium', number=115, symbol='Mc', weight=288\n)\nLv: Final[Element] = Element(\n    name='Livermorium', number=116, symbol='Lv', weight=293\n)\nTs: Final[Element] = Element(\n    name='Tennessine', number=117, symbol='Ts', weight=292\n)\nOg: Final[Element] = Element(\n    name='Oganesson', number=118, symbol='Og', 
weight=294\n)\n# pylint: enable=invalid-name\n\n# fmt: off\n# Lanthanides\n_L: Final[Sequence[Element]] = (\n    La, Ce, Pr, Nd, Pm, Sm, Eu, Gd, Tb, Dy, Ho, Er, Tm, Yb, Lu)\n# Actinides\n_A: Final[Sequence[Element]] = (\n    Ac, Th, Pa, U, Np, Pu, Am, Cm, Bk, Cf, Es, Fm, Md, No, Lr)\n\n# pylint: disable=bad-whitespace\nPERIODIC_TABLE: Final[Sequence[Element]] = (\n    X,  # Unknown\n    H,                                                                   He,\n    Li, Be,                                          B,  C,  N,  O,  F,  Ne,\n    Na, Mg,                                          Al, Si, P,  S,  Cl, Ar,\n    K,  Ca,  Sc, Ti, V,  Cr, Mn, Fe, Co, Ni, Cu, Zn, Ga, Ge, As, Se, Br, Kr,\n    Rb, Sr,  Y,  Zr, Nb, Mo, Tc, Ru, Rh, Pd, Ag, Cd, In, Sn, Sb, Te, I,  Xe,\n    Cs, Ba, *_L, Hf, Ta, W,  Re, Os, Ir, Pt, Au, Hg, Tl, Pb, Bi, Po, At, Rn,\n    Fr, Ra, *_A, Rf, Db, Sg, Bh, Hs, Mt, Ds, Rg, Cn, Nh, Fl, Mc, Lv, Ts, Og\n)\n# pylint: enable=bad-whitespace\n# fmt: on\nATOMIC_SYMBOL: Mapping[int, str] = {e.number: e.symbol for e in PERIODIC_TABLE}\nATOMIC_NUMBER = {e.symbol: e.number for e in PERIODIC_TABLE}\n# Add Deuterium as previous table contained it.\nATOMIC_NUMBER['D'] = 1\n\nATOMIC_NUMBER: Mapping[str, int] = ATOMIC_NUMBER\nATOMIC_WEIGHT: np.ndarray = np.zeros(len(PERIODIC_TABLE), dtype=np.float64)\n\nfor e in PERIODIC_TABLE:\n  ATOMIC_WEIGHT[e.number] = e.weight\nATOMIC_WEIGHT.setflags(write=False)\n"
  },
  {
    "path": "src/alphafold3/constants/residue_names.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Constants associated with residue names.\"\"\"\n\nfrom collections.abc import Mapping\nimport functools\nimport sys\n\n# pyformat: disable\n# common_typos_disable\nCCD_NAME_TO_ONE_LETTER: Mapping[str, str] = {\n    '00C': 'C', '01W': 'X', '02K': 'A', '03Y': 'C', '07O': 'C', '08P': 'C',\n    '0A0': 'D', '0A1': 'Y', '0A2': 'K', '0A8': 'C', '0AA': 'V', '0AB': 'V',\n    '0AC': 'G', '0AD': 'G', '0AF': 'W', '0AG': 'L', '0AH': 'S', '0AK': 'D',\n    '0AM': 'A', '0AP': 'C', '0AU': 'U', '0AV': 'A', '0AZ': 'P', '0BN': 'F',\n    '0C': 'C', '0CS': 'A', '0DC': 'C', '0DG': 'G', '0DT': 'T', '0FL': 'A',\n    '0G': 'G', '0NC': 'A', '0SP': 'A', '0U': 'U', '10C': 'C', '125': 'U',\n    '126': 'U', '127': 'U', '128': 'N', '12A': 'A', '143': 'C', '193': 'X',\n    '1AP': 'A', '1MA': 'A', '1MG': 'G', '1PA': 'F', '1PI': 'A', '1PR': 'N',\n    '1SC': 'C', '1TQ': 'W', '1TY': 'Y', '1X6': 'S', '200': 'F', '23F': 'F',\n    '23S': 'X', '26B': 'T', '2AD': 'X', '2AG': 'A', '2AO': 'X', '2AR': 'A',\n    '2AS': 'X', '2AT': 'T', '2AU': 'U', '2BD': 'I', '2BT': 'T', '2BU': 'A',\n    '2CO': 'C', '2DA': 'A', '2DF': 'N', '2DM': 'N', '2DO': 'X', '2DT': 'T',\n    '2EG': 'G', '2FE': 'N', '2FI': 'N', '2FM': 'M', '2GT': 'T', '2HF': 'H',\n    '2LU': 'L', '2MA': 'A', '2MG': 'G', '2ML': 'L', '2MR': 'R', '2MT': 'P',\n    '2MU': 'U', '2NT': 'T', '2OM': 'U', '2OT': 'T', '2PI': 'X', '2PR': 'G',\n    '2SA': 'N', '2SI': 'X', '2ST': 'T', '2TL': 'T', '2TY': 'Y', '2VA': 'V',\n   
 '2XA': 'C', '32S': 'X', '32T': 'X', '3AH': 'H', '3AR': 'X', '3CF': 'F',\n    '3DA': 'A', '3DR': 'N', '3GA': 'A', '3MD': 'D', '3ME': 'U', '3NF': 'Y',\n    '3QN': 'K', '3TY': 'X', '3XH': 'G', '4AC': 'N', '4BF': 'Y', '4CF': 'F',\n    '4CY': 'M', '4DP': 'W', '4FB': 'P', '4FW': 'W', '4HT': 'W', '4IN': 'W',\n    '4MF': 'N', '4MM': 'X', '4OC': 'C', '4PC': 'C', '4PD': 'C', '4PE': 'C',\n    '4PH': 'F', '4SC': 'C', '4SU': 'U', '4TA': 'N', '4U7': 'A', '56A': 'H',\n    '5AA': 'A', '5AB': 'A', '5AT': 'T', '5BU': 'U', '5CG': 'G', '5CM': 'C',\n    '5CS': 'C', '5FA': 'A', '5FC': 'C', '5FU': 'U', '5HP': 'E', '5HT': 'T',\n    '5HU': 'U', '5IC': 'C', '5IT': 'T', '5IU': 'U', '5MC': 'C', '5MD': 'N',\n    '5MU': 'U', '5NC': 'C', '5PC': 'C', '5PY': 'T', '5SE': 'U', '64T': 'T',\n    '6CL': 'K', '6CT': 'T', '6CW': 'W', '6HA': 'A', '6HC': 'C', '6HG': 'G',\n    '6HN': 'K', '6HT': 'T', '6IA': 'A', '6MA': 'A', '6MC': 'A', '6MI': 'N',\n    '6MT': 'A', '6MZ': 'N', '6OG': 'G', '70U': 'U', '7DA': 'A', '7GU': 'G',\n    '7JA': 'I', '7MG': 'G', '8AN': 'A', '8FG': 'G', '8MG': 'G', '8OG': 'G',\n    '9NE': 'E', '9NF': 'F', '9NR': 'R', '9NV': 'V', 'A': 'A', 'A1P': 'N',\n    'A23': 'A', 'A2L': 'A', 'A2M': 'A', 'A34': 'A', 'A35': 'A', 'A38': 'A',\n    'A39': 'A', 'A3A': 'A', 'A3P': 'A', 'A40': 'A', 'A43': 'A', 'A44': 'A',\n    'A47': 'A', 'A5L': 'A', 'A5M': 'C', 'A5N': 'N', 'A5O': 'A', 'A66': 'X',\n    'AA3': 'A', 'AA4': 'A', 'AAR': 'R', 'AB7': 'X', 'ABA': 'A', 'ABR': 'A',\n    'ABS': 'A', 'ABT': 'N', 'ACB': 'D', 'ACL': 'R', 'AD2': 'A', 'ADD': 'X',\n    'ADX': 'N', 'AEA': 'X', 'AEI': 'D', 'AET': 'A', 'AFA': 'N', 'AFF': 'N',\n    'AFG': 'G', 'AGM': 'R', 'AGT': 'C', 'AHB': 'N', 'AHH': 'X', 'AHO': 'A',\n    'AHP': 'A', 'AHS': 'X', 'AHT': 'X', 'AIB': 'A', 'AKL': 'D', 'AKZ': 'D',\n    'ALA': 'A', 'ALC': 'A', 'ALM': 'A', 'ALN': 'A', 'ALO': 'T', 'ALQ': 'X',\n    'ALS': 'A', 'ALT': 'A', 'ALV': 'A', 'ALY': 'K', 'AN8': 'A', 'AP7': 'A',\n    'APE': 'X', 'APH': 'A', 'API': 'K', 'APK': 'K', 'APM': 'X', 'APP': 'X',\n   
 'AR2': 'R', 'AR4': 'E', 'AR7': 'R', 'ARG': 'R', 'ARM': 'R', 'ARO': 'R',\n    'ARV': 'X', 'AS': 'A', 'AS2': 'D', 'AS9': 'X', 'ASA': 'D', 'ASB': 'D',\n    'ASI': 'D', 'ASK': 'D', 'ASL': 'D', 'ASM': 'X', 'ASN': 'N', 'ASP': 'D',\n    'ASQ': 'D', 'ASU': 'N', 'ASX': 'B', 'ATD': 'T', 'ATL': 'T', 'ATM': 'T',\n    'AVC': 'A', 'AVN': 'X', 'AYA': 'A', 'AZK': 'K', 'AZS': 'S', 'AZY': 'Y',\n    'B1F': 'F', 'B1P': 'N', 'B2A': 'A', 'B2F': 'F', 'B2I': 'I', 'B2V': 'V',\n    'B3A': 'A', 'B3D': 'D', 'B3E': 'E', 'B3K': 'K', 'B3L': 'X', 'B3M': 'X',\n    'B3Q': 'X', 'B3S': 'S', 'B3T': 'X', 'B3U': 'H', 'B3X': 'N', 'B3Y': 'Y',\n    'BB6': 'C', 'BB7': 'C', 'BB8': 'F', 'BB9': 'C', 'BBC': 'C', 'BCS': 'C',\n    'BE2': 'X', 'BFD': 'D', 'BG1': 'S', 'BGM': 'G', 'BH2': 'D', 'BHD': 'D',\n    'BIF': 'F', 'BIL': 'X', 'BIU': 'I', 'BJH': 'X', 'BLE': 'L', 'BLY': 'K',\n    'BMP': 'N', 'BMT': 'T', 'BNN': 'F', 'BNO': 'X', 'BOE': 'T', 'BOR': 'R',\n    'BPE': 'C', 'BRU': 'U', 'BSE': 'S', 'BT5': 'N', 'BTA': 'L', 'BTC': 'C',\n    'BTR': 'W', 'BUC': 'C', 'BUG': 'V', 'BVP': 'U', 'BZG': 'N', 'C': 'C',\n    'C1X': 'K', 'C25': 'C', 'C2L': 'C', 'C2S': 'C', 'C31': 'C', 'C32': 'C',\n    'C34': 'C', 'C36': 'C', 'C37': 'C', 'C38': 'C', 'C3Y': 'C', 'C42': 'C',\n    'C43': 'C', 'C45': 'C', 'C46': 'C', 'C49': 'C', 'C4R': 'C', 'C4S': 'C',\n    'C5C': 'C', 'C66': 'X', 'C6C': 'C', 'CAF': 'C', 'CAL': 'X', 'CAR': 'C',\n    'CAS': 'C', 'CAV': 'X', 'CAY': 'C', 'CB2': 'C', 'CBR': 'C', 'CBV': 'C',\n    'CCC': 'C', 'CCL': 'K', 'CCS': 'C', 'CDE': 'X', 'CDV': 'X', 'CDW': 'C',\n    'CEA': 'C', 'CFL': 'C', 'CG1': 'G', 'CGA': 'E', 'CGU': 'E', 'CH': 'C',\n    'CHF': 'X', 'CHG': 'X', 'CHP': 'G', 'CHS': 'X', 'CIR': 'R', 'CLE': 'L',\n    'CLG': 'K', 'CLH': 'K', 'CM0': 'N', 'CME': 'C', 'CMH': 'C', 'CML': 'C',\n    'CMR': 'C', 'CMT': 'C', 'CNU': 'U', 'CP1': 'C', 'CPC': 'X', 'CPI': 'X',\n    'CR5': 'G', 'CS0': 'C', 'CS1': 'C', 'CS3': 'C', 'CS4': 'C', 'CS8': 'N',\n    'CSA': 'C', 'CSB': 'C', 'CSD': 'C', 'CSE': 'C', 'CSF': 'C', 'CSI': 'G',\n    
'CSJ': 'C', 'CSL': 'C', 'CSO': 'C', 'CSP': 'C', 'CSR': 'C', 'CSS': 'C',\n    'CSU': 'C', 'CSW': 'C', 'CSX': 'C', 'CSZ': 'C', 'CTE': 'W', 'CTG': 'T',\n    'CTH': 'T', 'CUC': 'X', 'CWR': 'S', 'CXM': 'M', 'CY0': 'C', 'CY1': 'C',\n    'CY3': 'C', 'CY4': 'C', 'CYA': 'C', 'CYD': 'C', 'CYF': 'C', 'CYG': 'C',\n    'CYJ': 'X', 'CYM': 'C', 'CYQ': 'C', 'CYR': 'C', 'CYS': 'C', 'CZ2': 'C',\n    'CZZ': 'C', 'D11': 'T', 'D1P': 'N', 'D3': 'N', 'D33': 'N', 'D3P': 'G',\n    'D3T': 'T', 'D4M': 'T', 'D4P': 'X', 'DA': 'A', 'DA2': 'X', 'DAB': 'A',\n    'DAH': 'F', 'DAL': 'A', 'DAR': 'R', 'DAS': 'D', 'DBB': 'T', 'DBM': 'N',\n    'DBS': 'S', 'DBU': 'T', 'DBY': 'Y', 'DBZ': 'A', 'DC': 'C', 'DC2': 'C',\n    'DCG': 'G', 'DCI': 'X', 'DCL': 'X', 'DCT': 'C', 'DCY': 'C', 'DDE': 'H',\n    'DDG': 'G', 'DDN': 'U', 'DDX': 'N', 'DFC': 'C', 'DFG': 'G', 'DFI': 'X',\n    'DFO': 'X', 'DFT': 'N', 'DG': 'G', 'DGH': 'G', 'DGI': 'G', 'DGL': 'E',\n    'DGN': 'Q', 'DHA': 'S', 'DHI': 'H', 'DHL': 'X', 'DHN': 'V', 'DHP': 'X',\n    'DHU': 'U', 'DHV': 'V', 'DI': 'I', 'DIL': 'I', 'DIR': 'R', 'DIV': 'V',\n    'DLE': 'L', 'DLS': 'K', 'DLY': 'K', 'DM0': 'K', 'DMH': 'N', 'DMK': 'D',\n    'DMT': 'X', 'DN': 'N', 'DNE': 'L', 'DNG': 'L', 'DNL': 'K', 'DNM': 'L',\n    'DNP': 'A', 'DNR': 'C', 'DNS': 'K', 'DOA': 'X', 'DOC': 'C', 'DOH': 'D',\n    'DON': 'L', 'DPB': 'T', 'DPH': 'F', 'DPL': 'P', 'DPP': 'A', 'DPQ': 'Y',\n    'DPR': 'P', 'DPY': 'N', 'DRM': 'U', 'DRP': 'N', 'DRT': 'T', 'DRZ': 'N',\n    'DSE': 'S', 'DSG': 'N', 'DSN': 'S', 'DSP': 'D', 'DT': 'T', 'DTH': 'T',\n    'DTR': 'W', 'DTY': 'Y', 'DU': 'U', 'DVA': 'V', 'DXD': 'N', 'DXN': 'N',\n    'DYS': 'C', 'DZM': 'A', 'E': 'A', 'E1X': 'A', 'ECC': 'Q', 'EDA': 'A',\n    'EFC': 'C', 'EHP': 'F', 'EIT': 'T', 'ENP': 'N', 'ESB': 'Y', 'ESC': 'M',\n    'EXB': 'X', 'EXY': 'L', 'EY5': 'N', 'EYS': 'X', 'F2F': 'F', 'FA2': 'A',\n    'FA5': 'N', 'FAG': 'N', 'FAI': 'N', 'FB5': 'A', 'FB6': 'A', 'FCL': 'F',\n    'FFD': 'N', 'FGA': 'E', 'FGL': 'G', 'FGP': 'S', 'FHL': 'X', 'FHO': 'K',\n    'FHU': 
'U', 'FLA': 'A', 'FLE': 'L', 'FLT': 'Y', 'FME': 'M', 'FMG': 'G',\n    'FMU': 'N', 'FOE': 'C', 'FOX': 'G', 'FP9': 'P', 'FPA': 'F', 'FRD': 'X',\n    'FT6': 'W', 'FTR': 'W', 'FTY': 'Y', 'FVA': 'V', 'FZN': 'K', 'G': 'G',\n    'G25': 'G', 'G2L': 'G', 'G2S': 'G', 'G31': 'G', 'G32': 'G', 'G33': 'G',\n    'G36': 'G', 'G38': 'G', 'G42': 'G', 'G46': 'G', 'G47': 'G', 'G48': 'G',\n    'G49': 'G', 'G4P': 'N', 'G7M': 'G', 'GAO': 'G', 'GAU': 'E', 'GCK': 'C',\n    'GCM': 'X', 'GDP': 'G', 'GDR': 'G', 'GFL': 'G', 'GGL': 'E', 'GH3': 'G',\n    'GHG': 'Q', 'GHP': 'G', 'GL3': 'G', 'GLH': 'Q', 'GLJ': 'E', 'GLK': 'E',\n    'GLM': 'X', 'GLN': 'Q', 'GLQ': 'E', 'GLU': 'E', 'GLX': 'Z', 'GLY': 'G',\n    'GLZ': 'G', 'GMA': 'E', 'GMS': 'G', 'GMU': 'U', 'GN7': 'G', 'GND': 'X',\n    'GNE': 'N', 'GOM': 'G', 'GPL': 'K', 'GS': 'G', 'GSC': 'G', 'GSR': 'G',\n    'GSS': 'G', 'GSU': 'E', 'GT9': 'C', 'GTP': 'G', 'GVL': 'X', 'H2U': 'U',\n    'H5M': 'P', 'HAC': 'A', 'HAR': 'R', 'HBN': 'H', 'HCS': 'X', 'HDP': 'U',\n    'HEU': 'U', 'HFA': 'X', 'HGL': 'X', 'HHI': 'H', 'HIA': 'H', 'HIC': 'H',\n    'HIP': 'H', 'HIQ': 'H', 'HIS': 'H', 'HL2': 'L', 'HLU': 'L', 'HMR': 'R',\n    'HOL': 'N', 'HPC': 'F', 'HPE': 'F', 'HPH': 'F', 'HPQ': 'F', 'HQA': 'A',\n    'HRG': 'R', 'HRP': 'W', 'HS8': 'H', 'HS9': 'H', 'HSE': 'S', 'HSL': 'S',\n    'HSO': 'H', 'HTI': 'C', 'HTN': 'N', 'HTR': 'W', 'HV5': 'A', 'HVA': 'V',\n    'HY3': 'P', 'HYP': 'P', 'HZP': 'P', 'I': 'I', 'I2M': 'I', 'I58': 'K',\n    'I5C': 'C', 'IAM': 'A', 'IAR': 'R', 'IAS': 'D', 'IC': 'C', 'IEL': 'K',\n    'IG': 'G', 'IGL': 'G', 'IGU': 'G', 'IIL': 'I', 'ILE': 'I', 'ILG': 'E',\n    'ILX': 'I', 'IMC': 'C', 'IML': 'I', 'IOY': 'F', 'IPG': 'G', 'IPN': 'N',\n    'IRN': 'N', 'IT1': 'K', 'IU': 'U', 'IYR': 'Y', 'IYT': 'T', 'IZO': 'M',\n    'JJJ': 'C', 'JJK': 'C', 'JJL': 'C', 'JW5': 'N', 'K1R': 'C', 'KAG': 'G',\n    'KCX': 'K', 'KGC': 'K', 'KNB': 'A', 'KOR': 'M', 'KPI': 'K', 'KST': 'K',\n    'KYQ': 'K', 'L2A': 'X', 'LA2': 'K', 'LAA': 'D', 'LAL': 'A', 'LBY': 'K',\n    'LC': 'C', 
'LCA': 'A', 'LCC': 'N', 'LCG': 'G', 'LCH': 'N', 'LCK': 'K',\n    'LCX': 'K', 'LDH': 'K', 'LED': 'L', 'LEF': 'L', 'LEH': 'L', 'LEI': 'V',\n    'LEM': 'L', 'LEN': 'L', 'LET': 'X', 'LEU': 'L', 'LEX': 'L', 'LG': 'G',\n    'LGP': 'G', 'LHC': 'X', 'LHU': 'U', 'LKC': 'N', 'LLP': 'K', 'LLY': 'K',\n    'LME': 'E', 'LMF': 'K', 'LMQ': 'Q', 'LMS': 'N', 'LP6': 'K', 'LPD': 'P',\n    'LPG': 'G', 'LPL': 'X', 'LPS': 'S', 'LSO': 'X', 'LTA': 'X', 'LTR': 'W',\n    'LVG': 'G', 'LVN': 'V', 'LYF': 'K', 'LYK': 'K', 'LYM': 'K', 'LYN': 'K',\n    'LYR': 'K', 'LYS': 'K', 'LYX': 'K', 'LYZ': 'K', 'M0H': 'C', 'M1G': 'G',\n    'M2G': 'G', 'M2L': 'K', 'M2S': 'M', 'M30': 'G', 'M3L': 'K', 'M5M': 'C',\n    'MA': 'A', 'MA6': 'A', 'MA7': 'A', 'MAA': 'A', 'MAD': 'A', 'MAI': 'R',\n    'MBQ': 'Y', 'MBZ': 'N', 'MC1': 'S', 'MCG': 'X', 'MCL': 'K', 'MCS': 'C',\n    'MCY': 'C', 'MD3': 'C', 'MD6': 'G', 'MDH': 'X', 'MDR': 'N', 'MEA': 'F',\n    'MED': 'M', 'MEG': 'E', 'MEN': 'N', 'MEP': 'U', 'MEQ': 'Q', 'MET': 'M',\n    'MEU': 'G', 'MF3': 'X', 'MG1': 'G', 'MGG': 'R', 'MGN': 'Q', 'MGQ': 'A',\n    'MGV': 'G', 'MGY': 'G', 'MHL': 'L', 'MHO': 'M', 'MHS': 'H', 'MIA': 'A',\n    'MIS': 'S', 'MK8': 'L', 'ML3': 'K', 'MLE': 'L', 'MLL': 'L', 'MLY': 'K',\n    'MLZ': 'K', 'MME': 'M', 'MMO': 'R', 'MMT': 'T', 'MND': 'N', 'MNL': 'L',\n    'MNU': 'U', 'MNV': 'V', 'MOD': 'X', 'MP8': 'P', 'MPH': 'X', 'MPJ': 'X',\n    'MPQ': 'G', 'MRG': 'G', 'MSA': 'G', 'MSE': 'M', 'MSL': 'M', 'MSO': 'M',\n    'MSP': 'X', 'MT2': 'M', 'MTR': 'T', 'MTU': 'A', 'MTY': 'Y', 'MVA': 'V',\n    'N': 'N', 'N10': 'S', 'N2C': 'X', 'N5I': 'N', 'N5M': 'C', 'N6G': 'G',\n    'N7P': 'P', 'NA8': 'A', 'NAL': 'A', 'NAM': 'A', 'NB8': 'N', 'NBQ': 'Y',\n    'NC1': 'S', 'NCB': 'A', 'NCX': 'N', 'NCY': 'X', 'NDF': 'F', 'NDN': 'U',\n    'NEM': 'H', 'NEP': 'H', 'NF2': 'N', 'NFA': 'F', 'NHL': 'E', 'NIT': 'X',\n    'NIY': 'Y', 'NLE': 'L', 'NLN': 'L', 'NLO': 'L', 'NLP': 'L', 'NLQ': 'Q',\n    'NMC': 'G', 'NMM': 'R', 'NMS': 'T', 'NMT': 'T', 'NNH': 'R', 'NP3': 'N',\n    'NPH': 'C', 
'NPI': 'A', 'NSK': 'X', 'NTY': 'Y', 'NVA': 'V', 'NYM': 'N',\n    'NYS': 'C', 'NZH': 'H', 'O12': 'X', 'O2C': 'N', 'O2G': 'G', 'OAD': 'N',\n    'OAS': 'S', 'OBF': 'X', 'OBS': 'X', 'OCS': 'C', 'OCY': 'C', 'ODP': 'N',\n    'OHI': 'H', 'OHS': 'D', 'OIC': 'X', 'OIP': 'I', 'OLE': 'X', 'OLT': 'T',\n    'OLZ': 'S', 'OMC': 'C', 'OMG': 'G', 'OMT': 'M', 'OMU': 'U', 'ONE': 'U',\n    'ONH': 'A', 'ONL': 'X', 'OPR': 'R', 'ORN': 'A', 'ORQ': 'R', 'OSE': 'S',\n    'OTB': 'X', 'OTH': 'T', 'OTY': 'Y', 'OXX': 'D', 'P': 'G', 'P1L': 'C',\n    'P1P': 'N', 'P2T': 'T', 'P2U': 'U', 'P2Y': 'P', 'P5P': 'A', 'PAQ': 'Y',\n    'PAS': 'D', 'PAT': 'W', 'PAU': 'A', 'PBB': 'C', 'PBF': 'F', 'PBT': 'N',\n    'PCA': 'E', 'PCC': 'P', 'PCE': 'X', 'PCS': 'F', 'PDL': 'X', 'PDU': 'U',\n    'PEC': 'C', 'PF5': 'F', 'PFF': 'F', 'PFX': 'X', 'PG1': 'S', 'PG7': 'G',\n    'PG9': 'G', 'PGL': 'X', 'PGN': 'G', 'PGP': 'G', 'PGY': 'G', 'PHA': 'F',\n    'PHD': 'D', 'PHE': 'F', 'PHI': 'F', 'PHL': 'F', 'PHM': 'F', 'PIV': 'X',\n    'PLE': 'L', 'PM3': 'F', 'PMT': 'C', 'POM': 'P', 'PPN': 'F', 'PPU': 'A',\n    'PPW': 'G', 'PQ1': 'N', 'PR3': 'C', 'PR5': 'A', 'PR9': 'P', 'PRN': 'A',\n    'PRO': 'P', 'PRS': 'P', 'PSA': 'F', 'PSH': 'H', 'PST': 'T', 'PSU': 'U',\n    'PSW': 'C', 'PTA': 'X', 'PTH': 'Y', 'PTM': 'Y', 'PTR': 'Y', 'PU': 'A',\n    'PUY': 'N', 'PVH': 'H', 'PVL': 'X', 'PYA': 'A', 'PYO': 'U', 'PYX': 'C',\n    'PYY': 'N', 'QMM': 'Q', 'QPA': 'C', 'QPH': 'F', 'QUO': 'G', 'R': 'A',\n    'R1A': 'C', 'R4K': 'W', 'RE0': 'W', 'RE3': 'W', 'RIA': 'A', 'RMP': 'A',\n    'RON': 'X', 'RT': 'T', 'RTP': 'N', 'S1H': 'S', 'S2C': 'C', 'S2D': 'A',\n    'S2M': 'T', 'S2P': 'A', 'S4A': 'A', 'S4C': 'C', 'S4G': 'G', 'S4U': 'U',\n    'S6G': 'G', 'SAC': 'S', 'SAH': 'C', 'SAR': 'G', 'SBL': 'S', 'SC': 'C',\n    'SCH': 'C', 'SCS': 'C', 'SCY': 'C', 'SD2': 'X', 'SDG': 'G', 'SDP': 'S',\n    'SEB': 'S', 'SEC': 'A', 'SEG': 'A', 'SEL': 'S', 'SEM': 'S', 'SEN': 'S',\n    'SEP': 'S', 'SER': 'S', 'SET': 'S', 'SGB': 'S', 'SHC': 'C', 'SHP': 'G',\n    'SHR': 'K', 
'SIB': 'C', 'SLA': 'P', 'SLR': 'P', 'SLZ': 'K', 'SMC': 'C',\n    'SME': 'M', 'SMF': 'F', 'SMP': 'A', 'SMT': 'T', 'SNC': 'C', 'SNN': 'N',\n    'SOC': 'C', 'SOS': 'N', 'SOY': 'S', 'SPT': 'T', 'SRA': 'A', 'SSU': 'U',\n    'STY': 'Y', 'SUB': 'X', 'SUN': 'S', 'SUR': 'U', 'SVA': 'S', 'SVV': 'S',\n    'SVW': 'S', 'SVX': 'S', 'SVY': 'S', 'SVZ': 'X', 'SYS': 'C', 'T': 'T',\n    'T11': 'F', 'T23': 'T', 'T2S': 'T', 'T2T': 'N', 'T31': 'U', 'T32': 'T',\n    'T36': 'T', 'T37': 'T', 'T38': 'T', 'T39': 'T', 'T3P': 'T', 'T41': 'T',\n    'T48': 'T', 'T49': 'T', 'T4S': 'T', 'T5O': 'U', 'T5S': 'T', 'T66': 'X',\n    'T6A': 'A', 'TA3': 'T', 'TA4': 'X', 'TAF': 'T', 'TAL': 'N', 'TAV': 'D',\n    'TBG': 'V', 'TBM': 'T', 'TC1': 'C', 'TCP': 'T', 'TCQ': 'Y', 'TCR': 'W',\n    'TCY': 'A', 'TDD': 'L', 'TDY': 'T', 'TFE': 'T', 'TFO': 'A', 'TFQ': 'F',\n    'TFT': 'T', 'TGP': 'G', 'TH6': 'T', 'THC': 'T', 'THO': 'X', 'THR': 'T',\n    'THX': 'N', 'THZ': 'R', 'TIH': 'A', 'TLB': 'N', 'TLC': 'T', 'TLN': 'U',\n    'TMB': 'T', 'TMD': 'T', 'TNB': 'C', 'TNR': 'S', 'TOX': 'W', 'TP1': 'T',\n    'TPC': 'C', 'TPG': 'G', 'TPH': 'X', 'TPL': 'W', 'TPO': 'T', 'TPQ': 'Y',\n    'TQI': 'W', 'TQQ': 'W', 'TRF': 'W', 'TRG': 'K', 'TRN': 'W', 'TRO': 'W',\n    'TRP': 'W', 'TRQ': 'W', 'TRW': 'W', 'TRX': 'W', 'TS': 'N', 'TST': 'X',\n    'TT': 'N', 'TTD': 'T', 'TTI': 'U', 'TTM': 'T', 'TTQ': 'W', 'TTS': 'Y',\n    'TY1': 'Y', 'TY2': 'Y', 'TY3': 'Y', 'TY5': 'Y', 'TYB': 'Y', 'TYI': 'Y',\n    'TYJ': 'Y', 'TYN': 'Y', 'TYO': 'Y', 'TYQ': 'Y', 'TYR': 'Y', 'TYS': 'Y',\n    'TYT': 'Y', 'TYU': 'N', 'TYW': 'Y', 'TYX': 'X', 'TYY': 'Y', 'TZB': 'X',\n    'TZO': 'X', 'U': 'U', 'U25': 'U', 'U2L': 'U', 'U2N': 'U', 'U2P': 'U',\n    'U31': 'U', 'U33': 'U', 'U34': 'U', 'U36': 'U', 'U37': 'U', 'U8U': 'U',\n    'UAR': 'U', 'UCL': 'U', 'UD5': 'U', 'UDP': 'N', 'UFP': 'N', 'UFR': 'U',\n    'UFT': 'U', 'UMA': 'A', 'UMP': 'U', 'UMS': 'U', 'UN1': 'X', 'UN2': 'X',\n    'UNK': 'X', 'UR3': 'U', 'URD': 'U', 'US1': 'U', 'US2': 'U', 'US3': 'T',\n    'US5': 'U', 
'USM': 'U', 'VAD': 'V', 'VAF': 'V', 'VAL': 'V', 'VB1': 'K',\n    'VDL': 'X', 'VLL': 'X', 'VLM': 'X', 'VMS': 'X', 'VOL': 'X', 'X': 'G',\n    'X2W': 'E', 'X4A': 'N', 'XAD': 'A', 'XAE': 'N', 'XAL': 'A', 'XAR': 'N',\n    'XCL': 'C', 'XCN': 'C', 'XCP': 'X', 'XCR': 'C', 'XCS': 'N', 'XCT': 'C',\n    'XCY': 'C', 'XGA': 'N', 'XGL': 'G', 'XGR': 'G', 'XGU': 'G', 'XPR': 'P',\n    'XSN': 'N', 'XTH': 'T', 'XTL': 'T', 'XTR': 'T', 'XTS': 'G', 'XTY': 'N',\n    'XUA': 'A', 'XUG': 'G', 'XX1': 'K', 'Y': 'A', 'YCM': 'C', 'YG': 'G',\n    'YOF': 'Y', 'YRR': 'N', 'YYG': 'G', 'Z': 'C', 'Z01': 'A', 'ZAD': 'A',\n    'ZAL': 'A', 'ZBC': 'C', 'ZBU': 'U', 'ZCL': 'F', 'ZCY': 'C', 'ZDU': 'U',\n    'ZFB': 'X', 'ZGU': 'G', 'ZHP': 'N', 'ZTH': 'T', 'ZU0': 'T', 'ZZJ': 'A',\n}\n# common_typos_enable\n# pyformat: enable\n\n\n@functools.lru_cache(maxsize=64)\ndef letters_three_to_one(restype: str, *, default: str) -> str:\n  \"\"\"Returns single letter name if one exists otherwise returns default.\"\"\"\n  return CCD_NAME_TO_ONE_LETTER.get(restype, default)\n\n\nALA = sys.intern('ALA')\nARG = sys.intern('ARG')\nASN = sys.intern('ASN')\nASP = sys.intern('ASP')\nCYS = sys.intern('CYS')\nGLN = sys.intern('GLN')\nGLU = sys.intern('GLU')\nGLY = sys.intern('GLY')\nHIS = sys.intern('HIS')\nILE = sys.intern('ILE')\nLEU = sys.intern('LEU')\nLYS = sys.intern('LYS')\nMET = sys.intern('MET')\nPHE = sys.intern('PHE')\nPRO = sys.intern('PRO')\nSER = sys.intern('SER')\nTHR = sys.intern('THR')\nTRP = sys.intern('TRP')\nTYR = sys.intern('TYR')\nVAL = sys.intern('VAL')\nUNK = sys.intern('UNK')\nGAP = sys.intern('-')\n\n# Unknown ligand.\nUNL = sys.intern('UNL')\n\n# Non-standard version of MET (with Se instead of S), but often appears in PDB.\nMSE = sys.intern('MSE')\n\n# 20 standard protein amino acids (no unknown).\nPROTEIN_TYPES: tuple[str, ...] 
= (\n    ALA, ARG, ASN, ASP, CYS, GLN, GLU, GLY, HIS, ILE, LEU, LYS, MET, PHE, PRO,\n    SER, THR, TRP, TYR, VAL,\n)  # pyformat: disable\n\n# 20 standard protein amino acids plus the unknown (UNK) amino acid.\nPROTEIN_TYPES_WITH_UNKNOWN: tuple[str, ...] = PROTEIN_TYPES + (UNK,)\n\n# This is the standard residue order when coding AA type as a number.\n# Reproduce it by taking 3-letter AA codes and sorting them alphabetically.\n# For legacy reasons this only refers to protein residues.\n\nPROTEIN_TYPES_ONE_LETTER: tuple[str, ...] = (\n    'A', 'R', 'N', 'D', 'C', 'Q', 'E', 'G', 'H', 'I', 'L', 'K', 'M', 'F', 'P',\n    'S', 'T', 'W', 'Y', 'V',\n)  # pyformat: disable\n\nPROTEIN_TYPES_ONE_LETTER_WITH_UNKNOWN: tuple[str, ...] = (\n    PROTEIN_TYPES_ONE_LETTER + ('X',)\n)\nPROTEIN_TYPES_ONE_LETTER_WITH_UNKNOWN_AND_GAP: tuple[str, ...] = (\n    PROTEIN_TYPES_ONE_LETTER_WITH_UNKNOWN + (GAP,)\n)\n\nPROTEIN_TYPES_ONE_LETTER_TO_INT: Mapping[str, int] = {\n    r: i for i, r in enumerate(PROTEIN_TYPES_ONE_LETTER)\n}\nPROTEIN_TYPES_ONE_LETTER_WITH_UNKNOWN_TO_INT: Mapping[str, int] = {\n    r: i for i, r in enumerate(PROTEIN_TYPES_ONE_LETTER_WITH_UNKNOWN)\n}\n\nPROTEIN_TYPES_ONE_LETTER_WITH_UNKNOWN_AND_GAP_TO_INT: Mapping[str, int] = {\n    r: i for i, r in enumerate(PROTEIN_TYPES_ONE_LETTER_WITH_UNKNOWN_AND_GAP)\n}\n\n\nPROTEIN_COMMON_ONE_TO_THREE: Mapping[str, str] = {\n    'A': ALA,\n    'R': ARG,\n    'N': ASN,\n    'D': ASP,\n    'C': CYS,\n    'Q': GLN,\n    'E': GLU,\n    'G': GLY,\n    'H': HIS,\n    'I': ILE,\n    'L': LEU,\n    'K': LYS,\n    'M': MET,\n    'F': PHE,\n    'P': PRO,\n    'S': SER,\n    'T': THR,\n    'W': TRP,\n    'Y': TYR,\n    'V': VAL,\n}\n\nPROTEIN_COMMON_THREE_TO_ONE: Mapping[str, str] = {\n    v: k for k, v in PROTEIN_COMMON_ONE_TO_THREE.items()\n}\n\nA = sys.intern('A')\nG = sys.intern('G')\nC = sys.intern('C')\nU = sys.intern('U')\nT = sys.intern('T')\n\nDA = sys.intern('DA')\nDG = sys.intern('DG')\nDC = sys.intern('DC')\nDT = 
sys.intern('DT')\n\nUNK_NUCLEIC_ONE_LETTER = sys.intern('N')  # Unknown nucleic acid single letter.\nUNK_RNA = sys.intern('N')  # Unknown RNA.\nUNK_DNA = sys.intern('DN')  # Unknown DNA residue (differs from N).\n\nRNA_TYPES: tuple[str, ...] = (A, G, C, U)\nDNA_TYPES: tuple[str, ...] = (DA, DG, DC, DT)\n\nNUCLEIC_TYPES: tuple[str, ...] = RNA_TYPES + DNA_TYPES\n# Without UNK DNA.\nNUCLEIC_TYPES_WITH_UNKNOWN: tuple[str, ...] = NUCLEIC_TYPES + (\n    UNK_NUCLEIC_ONE_LETTER,\n)\nNUCLEIC_TYPES_WITH_2_UNKS: tuple[str, ...] = NUCLEIC_TYPES + (\n    UNK_RNA,\n    UNK_DNA,\n)\n\nRNA_TYPES_ONE_LETTER_WITH_UNKNOWN: tuple[str, ...] = RNA_TYPES + (UNK_RNA,)\nRNA_TYPES_ONE_LETTER_WITH_UNKNOWN_TO_INT: Mapping[str, int] = {\n    r: i for i, r in enumerate(RNA_TYPES_ONE_LETTER_WITH_UNKNOWN)\n}\n\nDNA_TYPES_WITH_UNKNOWN: tuple[str, ...] = DNA_TYPES + (UNK_DNA,)\nDNA_TYPES_ONE_LETTER: tuple[str, ...] = (A, G, C, T)\nDNA_TYPES_ONE_LETTER_WITH_UNKNOWN: tuple[str, ...] = DNA_TYPES_ONE_LETTER + (\n    UNK_NUCLEIC_ONE_LETTER,\n)\nDNA_TYPES_ONE_LETTER_WITH_UNKNOWN_TO_INT: Mapping[str, int] = {\n    r: i for i, r in enumerate(DNA_TYPES_ONE_LETTER_WITH_UNKNOWN)\n}\nDNA_COMMON_ONE_TO_TWO: Mapping[str, str] = {\n    'A': 'DA',\n    'G': 'DG',\n    'C': 'DC',\n    'T': 'DT',\n}\n\nSTANDARD_POLYMER_TYPES: tuple[str, ...] = PROTEIN_TYPES + NUCLEIC_TYPES\nPOLYMER_TYPES: tuple[str, ...] = PROTEIN_TYPES_WITH_UNKNOWN + NUCLEIC_TYPES\nPOLYMER_TYPES_WITH_UNKNOWN: tuple[str, ...] = (\n    PROTEIN_TYPES_WITH_UNKNOWN + NUCLEIC_TYPES_WITH_UNKNOWN\n)\nPOLYMER_TYPES_WITH_GAP: tuple[str, ...] = PROTEIN_TYPES + (GAP,) + NUCLEIC_TYPES\nPOLYMER_TYPES_WITH_UNKNOWN_AND_GAP: tuple[str, ...] = (\n    PROTEIN_TYPES_WITH_UNKNOWN + (GAP,) + NUCLEIC_TYPES_WITH_UNKNOWN\n)\nPOLYMER_TYPES_WITH_ALL_UNKS_AND_GAP: tuple[str, ...] 
= (\n    PROTEIN_TYPES_WITH_UNKNOWN + (GAP,) + NUCLEIC_TYPES_WITH_2_UNKS\n)\n\nPOLYMER_TYPES_ORDER = {restype: i for i, restype in enumerate(POLYMER_TYPES)}\n\nPOLYMER_TYPES_ORDER_WITH_UNKNOWN = {\n    restype: i for i, restype in enumerate(POLYMER_TYPES_WITH_UNKNOWN)\n}\n\nPOLYMER_TYPES_ORDER_WITH_UNKNOWN_AND_GAP = {\n    restype: i for i, restype in enumerate(POLYMER_TYPES_WITH_UNKNOWN_AND_GAP)\n}\n\nPOLYMER_TYPES_ORDER_WITH_ALL_UNKS_AND_GAP = {\n    restype: i for i, restype in enumerate(POLYMER_TYPES_WITH_ALL_UNKS_AND_GAP)\n}\n\nPOLYMER_TYPES_NUM = len(POLYMER_TYPES)  # := 29.\nPOLYMER_TYPES_NUM_WITH_UNKNOWN = len(POLYMER_TYPES_WITH_UNKNOWN)  # := 30.\nPOLYMER_TYPES_NUM_WITH_GAP = len(POLYMER_TYPES_WITH_GAP)  # := 29.\nPOLYMER_TYPES_NUM_WITH_UNKNOWN_AND_GAP = len(\n    POLYMER_TYPES_WITH_UNKNOWN_AND_GAP\n)  # := 31.\nPOLYMER_TYPES_NUM_ORDER_WITH_ALL_UNKS_AND_GAP = len(\n    POLYMER_TYPES_WITH_ALL_UNKS_AND_GAP\n)  # := 32.\n\nWATER_TYPES: tuple[str, ...] = ('HOH', 'DOD')\n\nUNKNOWN_TYPES: tuple[str, ...] = (UNK, UNK_RNA, UNK_DNA, UNL)\n"
  },
  {
    "path": "src/alphafold3/constants/side_chains.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Constants associated with side chains.\"\"\"\n\nfrom collections.abc import Mapping, Sequence\nimport itertools\n\n# Format: The list for each AA type contains chi1, chi2, chi3, chi4 in\n# this order (or a relevant subset from chi1 onwards). ALA and GLY don't have\n# chi angles so their chi angle lists are empty.\nCHI_ANGLES_ATOMS: Mapping[str, Sequence[tuple[str, ...]]] = {\n    'ALA': [],\n    # Chi5 in arginine is always 0 +- 5 degrees, so ignore it.\n    'ARG': [\n        ('N', 'CA', 'CB', 'CG'),\n        ('CA', 'CB', 'CG', 'CD'),\n        ('CB', 'CG', 'CD', 'NE'),\n        ('CG', 'CD', 'NE', 'CZ'),\n    ],\n    'ASN': [('N', 'CA', 'CB', 'CG'), ('CA', 'CB', 'CG', 'OD1')],\n    'ASP': [('N', 'CA', 'CB', 'CG'), ('CA', 'CB', 'CG', 'OD1')],\n    'CYS': [('N', 'CA', 'CB', 'SG')],\n    'GLN': [\n        ('N', 'CA', 'CB', 'CG'),\n        ('CA', 'CB', 'CG', 'CD'),\n        ('CB', 'CG', 'CD', 'OE1'),\n    ],\n    'GLU': [\n        ('N', 'CA', 'CB', 'CG'),\n        ('CA', 'CB', 'CG', 'CD'),\n        ('CB', 'CG', 'CD', 'OE1'),\n    ],\n    'GLY': [],\n    'HIS': [('N', 'CA', 'CB', 'CG'), ('CA', 'CB', 'CG', 'ND1')],\n    'ILE': [('N', 'CA', 'CB', 'CG1'), ('CA', 'CB', 'CG1', 'CD1')],\n    'LEU': [('N', 'CA', 'CB', 'CG'), ('CA', 'CB', 'CG', 'CD1')],\n    'LYS': [\n        ('N', 'CA', 'CB', 'CG'),\n        ('CA', 'CB', 'CG', 'CD'),\n        ('CB', 'CG', 'CD', 'CE'),\n        ('CG', 'CD', 'CE', 'NZ'),\n    ],\n    'MET': [\n       
 ('N', 'CA', 'CB', 'CG'),\n        ('CA', 'CB', 'CG', 'SD'),\n        ('CB', 'CG', 'SD', 'CE'),\n    ],\n    'PHE': [('N', 'CA', 'CB', 'CG'), ('CA', 'CB', 'CG', 'CD1')],\n    'PRO': [('N', 'CA', 'CB', 'CG'), ('CA', 'CB', 'CG', 'CD')],\n    'SER': [('N', 'CA', 'CB', 'OG')],\n    'THR': [('N', 'CA', 'CB', 'OG1')],\n    'TRP': [('N', 'CA', 'CB', 'CG'), ('CA', 'CB', 'CG', 'CD1')],\n    'TYR': [('N', 'CA', 'CB', 'CG'), ('CA', 'CB', 'CG', 'CD1')],\n    'VAL': [('N', 'CA', 'CB', 'CG1')],\n}\n\nCHI_GROUPS_FOR_ATOM = {}\nfor res_name, chi_angle_atoms_for_res in CHI_ANGLES_ATOMS.items():\n  for chi_group_i, chi_group in enumerate(chi_angle_atoms_for_res):\n    for atom_i, atom in enumerate(chi_group):\n      CHI_GROUPS_FOR_ATOM.setdefault((res_name, atom), []).append(\n          (chi_group_i, atom_i)\n      )\n\n# Mapping from (residue_name, atom_name) pairs to the atom's chi group index\n# and atom index within that group.\nCHI_GROUPS_FOR_ATOM: Mapping[tuple[str, str], Sequence[tuple[int, int]]] = (\n    CHI_GROUPS_FOR_ATOM\n)\n\nMAX_NUM_CHI_ANGLES: int = 4\nATOMS_PER_CHI_ANGLE: int = 4\n\n# A list of atoms for each AA type that are involved in chi angle calculations.\nCHI_ATOM_SETS: Mapping[str, set[str]] = {\n    residue_name: set(itertools.chain(*atoms))\n    for residue_name, atoms in CHI_ANGLES_ATOMS.items()\n}\n\n# If chi angles given in fixed-length array, this matrix determines how to mask\n# them for each AA type. 
The order is as per restype_order; each row below is\n# annotated with its residue name.\nCHI_ANGLES_MASK: Sequence[Sequence[float]] = (\n    (0.0, 0.0, 0.0, 0.0),  # ALA\n    (1.0, 1.0, 1.0, 1.0),  # ARG\n    (1.0, 1.0, 0.0, 0.0),  # ASN\n    (1.0, 1.0, 0.0, 0.0),  # ASP\n    (1.0, 0.0, 0.0, 0.0),  # CYS\n    (1.0, 1.0, 1.0, 0.0),  # GLN\n    (1.0, 1.0, 1.0, 0.0),  # GLU\n    (0.0, 0.0, 0.0, 0.0),  # GLY\n    (1.0, 1.0, 0.0, 0.0),  # HIS\n    (1.0, 1.0, 0.0, 0.0),  # ILE\n    (1.0, 1.0, 0.0, 0.0),  # LEU\n    (1.0, 1.0, 1.0, 1.0),  # LYS\n    (1.0, 1.0, 1.0, 0.0),  # MET\n    (1.0, 1.0, 0.0, 0.0),  # PHE\n    (1.0, 1.0, 0.0, 0.0),  # PRO\n    (1.0, 0.0, 0.0, 0.0),  # SER\n    (1.0, 0.0, 0.0, 0.0),  # THR\n    (1.0, 1.0, 0.0, 0.0),  # TRP\n    (1.0, 1.0, 0.0, 0.0),  # TYR\n    (1.0, 0.0, 0.0, 0.0),  # VAL\n)\n"
  },
  {
    "path": "src/alphafold3/cpp.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include \"alphafold3/data/cpp/msa_profile_pybind.h\"\n#include \"alphafold3/model/mkdssp_pybind.h\"\n#include \"alphafold3/parsers/cpp/cif_dict_pybind.h\"\n#include \"alphafold3/parsers/cpp/fasta_iterator_pybind.h\"\n#include \"alphafold3/parsers/cpp/msa_conversion_pybind.h\"\n#include \"alphafold3/structure/cpp/aggregation_pybind.h\"\n#include \"alphafold3/structure/cpp/membership_pybind.h\"\n#include \"alphafold3/structure/cpp/mmcif_atom_site_pybind.h\"\n#include \"alphafold3/structure/cpp/mmcif_layout_pybind.h\"\n#include \"alphafold3/structure/cpp/mmcif_struct_conn_pybind.h\"\n#include \"alphafold3/structure/cpp/mmcif_utils_pybind.h\"\n#include \"alphafold3/structure/cpp/string_array_pybind.h\"\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\nnamespace {\n\n// Include all modules as submodules to simplify building.\nPYBIND11_MODULE(cpp, m) {\n  RegisterModuleCifDict(m.def_submodule(\"cif_dict\"));\n  RegisterModuleFastaIterator(m.def_submodule(\"fasta_iterator\"));\n  RegisterModuleMsaConversion(m.def_submodule(\"msa_conversion\"));\n  RegisterModuleMmcifLayout(m.def_submodule(\"mmcif_layout\"));\n  RegisterModuleMmcifStructConn(m.def_submodule(\"mmcif_struct_conn\"));\n  RegisterModuleMembership(m.def_submodule(\"membership\"));\n  RegisterModuleMmcifUtils(m.def_submodule(\"mmcif_utils\"));\n  RegisterModuleAggregation(m.def_submodule(\"aggregation\"));\n  
RegisterModuleStringArray(m.def_submodule(\"string_array\"));\n  RegisterModuleMmcifAtomSite(m.def_submodule(\"mmcif_atom_site\"));\n  RegisterModuleMkdssp(m.def_submodule(\"mkdssp\"));\n  RegisterModuleMsaProfile(m.def_submodule(\"msa_profile\"));\n}\n\n}  // namespace\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/data/cpp/msa_profile_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <algorithm>\n\n#include \"absl/strings/str_cat.h\"\n#include \"pybind11/cast.h\"\n#include \"pybind11/numpy.h\"\n#include \"pybind11/pybind11.h\"\n\nnamespace {\n\nnamespace py = pybind11;\n\npy::array_t<double> ComputeMsaProfile(\n    const py::array_t<int, py::array::c_style>& msa, int num_residue_types) {\n  if (msa.size() == 0) {\n    throw py::value_error(\"The MSA must be non-empty.\");\n  }\n  if (msa.ndim() != 2) {\n    throw py::value_error(absl::StrCat(\"The MSA must be rectangular, got \",\n                                       msa.ndim(), \"-dimensional MSA array.\"));\n  }\n  const int msa_depth = msa.shape()[0];\n  const int sequence_length = msa.shape()[1];\n\n  py::array_t<double> profile({sequence_length, num_residue_types});\n  std::fill(profile.mutable_data(), profile.mutable_data() + profile.size(),\n            0.0f);\n  auto profile_unchecked = profile.mutable_unchecked<2>();\n\n  const double normalized_count = 1.0 / msa_depth;\n  const int* msa_it = msa.data();\n  for (int row_index = 0; row_index < msa_depth; ++row_index) {\n    for (int column_index = 0; column_index < sequence_length; ++column_index) {\n      const int residue_code = *(msa_it++);\n      if (residue_code < 0 || residue_code >= num_residue_types) {\n        throw py::value_error(\n            absl::StrCat(\"All residue codes must be positive and smaller than \"\n                         \"num_residue_types \",\n    
                     num_residue_types, \", got \", residue_code));\n      }\n      profile_unchecked(column_index, residue_code) += normalized_count;\n    }\n  }\n  return profile;\n}\n\nconstexpr char kComputeMsaProfileDoc[] = R\"(\nComputes MSA profile for the given encoded MSA.\n\nArgs:\n  msa: A Numpy array of shape (num_msa, num_res) with the integer coded MSA.\n  num_residue_types: Integer that determines the number of unique residue types.\n    This will determine the shape of the output profile.\n\nReturns:\n  A float Numpy array of shape (num_res, num_residue_types) with residue\n  frequency (residue type count normalized by MSA depth) for every column of the\n  MSA.\n)\";\n\n}  // namespace\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMsaProfile(pybind11::module m) {\n  m.def(\"compute_msa_profile\", &ComputeMsaProfile, py::arg(\"msa\"),\n        py::arg(\"num_residue_types\"), py::doc(kComputeMsaProfileDoc + 1));\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/data/cpp/msa_profile_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_DATA_PYTHON_MSA_PROFILE_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_DATA_PYTHON_MSA_PROFILE_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMsaProfile(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_DATA_PYTHON_MSA_PROFILE_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/data/featurisation.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"AlphaFold 3 featurisation pipeline.\"\"\"\n\nfrom collections.abc import Sequence\nimport datetime\nimport time\n\nfrom alphafold3.common import folding_input\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.model import features\nfrom alphafold3.model.pipeline import pipeline\nimport numpy as np\n\n\ndef validate_fold_input(fold_input: folding_input.Input):\n  \"\"\"Validates the fold input contains MSA and templates for featurisation.\"\"\"\n  for i, chain in enumerate(fold_input.protein_chains):\n    if chain.unpaired_msa is None:\n      raise ValueError(f'Protein chain {i + 1} is missing unpaired MSA.')\n    if chain.paired_msa is None:\n      raise ValueError(f'Protein chain {i + 1} is missing paired MSA.')\n    if chain.templates is None:\n      raise ValueError(f'Protein chain {i + 1} is missing Templates.')\n  for i, chain in enumerate(fold_input.rna_chains):\n    if chain.unpaired_msa is None:\n      raise ValueError(f'RNA chain {i + 1} is missing unpaired MSA.')\n\n\ndef featurise_input(\n    fold_input: folding_input.Input,\n    ccd: chemical_components.Ccd,\n    buckets: Sequence[int] | None,\n    ref_max_modified_date: datetime.date | None = None,\n    conformer_max_iterations: int | None = None,\n    resolve_msa_overlaps: bool = True,\n    verbose: bool = False,\n) -> Sequence[features.BatchDict]:\n  \"\"\"Featurise the folding input.\n\n  Args:\n    fold_input: The input to 
featurise.\n    ccd: The chemical components dictionary.\n    buckets: Bucket sizes to pad the data to, to avoid excessive re-compilation\n      of the model. If None, calculate the appropriate bucket size from the\n      number of tokens. If not None, must be a sequence of at least one integer,\n      in strictly increasing order. Will raise an error if the number of tokens\n      is more than the largest bucket size.\n    ref_max_modified_date: Optional maximum date that controls whether to allow\n      use of model coordinates for a chemical component from the CCD if RDKit\n      conformer generation fails and the component does not have ideal\n      coordinates set. Only for components that have been released before this\n      date the model coordinates can be used as a fallback.\n    conformer_max_iterations: Optional override for maximum number of iterations\n      to run for RDKit conformer search.\n    resolve_msa_overlaps: Whether to deduplicate unpaired MSA against paired\n      MSA. The default behaviour matches the method described in the AlphaFold 3\n      paper. 
Set this to false if providing custom paired MSA using the unpaired\n      MSA field to keep it exactly as is as deduplication against the paired MSA\n      could break the manually crafted pairing between MSA sequences.\n    verbose: Whether to print progress messages.\n\n  Returns:\n    A featurised batch for each rng_seed in the input.\n  \"\"\"\n  validate_fold_input(fold_input)\n\n  # Set up data pipeline for single use.\n  data_pipeline = pipeline.WholePdbPipeline(\n      config=pipeline.WholePdbPipeline.Config(\n          buckets=buckets,\n          ref_max_modified_date=ref_max_modified_date,\n          conformer_max_iterations=conformer_max_iterations,\n          resolve_msa_overlaps=resolve_msa_overlaps,\n      ),\n  )\n\n  batches = []\n  for rng_seed in fold_input.rng_seeds:\n    featurisation_start_time = time.time()\n    if verbose:\n      print(f'Featurising data with seed {rng_seed}.')\n    batch = data_pipeline.process_item(\n        fold_input=fold_input,\n        ccd=ccd,\n        random_state=np.random.RandomState(rng_seed),\n        random_seed=rng_seed,\n    )\n    if verbose:\n      print(\n          f'Featurising data with seed {rng_seed} took'\n          f' {time.time() - featurisation_start_time:.2f} seconds.'\n      )\n    batches.append(batch)\n\n  return batches\n"
  },
  {
    "path": "src/alphafold3/data/msa.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Functions for getting MSA and calculating alignment features.\"\"\"\n\nfrom collections.abc import MutableMapping, Sequence\nimport string\nfrom typing import Self\n\nfrom absl import logging\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.data import msa_config\nfrom alphafold3.data import msa_features\nfrom alphafold3.data import parsers\nfrom alphafold3.data.tools import jackhmmer\nfrom alphafold3.data.tools import msa_tool\nfrom alphafold3.data.tools import nhmmer\nimport numpy as np\n\n\nclass Error(Exception):\n  \"\"\"Error indicating a problem with MSA Search.\"\"\"\n\n\ndef _featurize(seq: str, chain_poly_type: str) -> str | list[int]:\n  if mmcif_names.is_standard_polymer_type(chain_poly_type):\n    featurized_seqs, _ = msa_features.extract_msa_features(\n        msa_sequences=[seq], chain_poly_type=chain_poly_type\n    )\n    return featurized_seqs[0].tolist()\n  # For anything else simply require an identical match.\n  return seq\n\n\ndef sequences_are_feature_equivalent(\n    sequence1: str,\n    sequence2: str,\n    chain_poly_type: str,\n) -> bool:\n  feat1 = _featurize(sequence1, chain_poly_type)\n  feat2 = _featurize(sequence2, chain_poly_type)\n  return feat1 == feat2\n\n\nclass Msa:\n  \"\"\"Multiple Sequence Alignment container with methods for manipulating it.\"\"\"\n\n  def __init__(\n      self,\n      query_sequence: str,\n      chain_poly_type: str,\n      sequences: 
Sequence[str],\n      descriptions: Sequence[str],\n      deduplicate: bool = True,\n  ):\n    \"\"\"Raw constructor, prefer using the from_{a3m,multiple_msas} class methods.\n\n    The first sequence must be equal (in featurised form) to the query sequence.\n    If sequences/descriptions are empty, they will be initialised to the query.\n\n    Args:\n      query_sequence: The sequence that was used to search for MSA.\n      chain_poly_type: Polymer type of the query sequence, see mmcif_names.\n      sequences: The sequences returned by the MSA search tool.\n      descriptions: Metadata for the sequences returned by the MSA search tool.\n      deduplicate: If True, the MSA sequences will be deduplicated in the input\n        order. Lowercase letters (insertions) are ignored when deduplicating.\n    \"\"\"\n    if len(sequences) != len(descriptions):\n      raise ValueError('The number of sequences and descriptions must match.')\n\n    self.query_sequence = query_sequence\n    self.chain_poly_type = chain_poly_type\n\n    if not deduplicate:\n      self.sequences = sequences\n      self.descriptions = descriptions\n    else:\n      self.sequences = []\n      self.descriptions = []\n      # A replacement table that removes all lowercase characters.\n      deletion_table = str.maketrans('', '', string.ascii_lowercase)\n      unique_sequences = set()\n      for seq, desc in zip(sequences, descriptions, strict=True):\n        # Using string.translate is faster than re.sub('[a-z]+', '').\n        sequence_no_deletions = seq.translate(deletion_table)\n        if sequence_no_deletions not in unique_sequences:\n          unique_sequences.add(sequence_no_deletions)\n          self.sequences.append(seq)\n          self.descriptions.append(desc)\n\n    # Make sure the MSA always has at least the query.\n    self.sequences = self.sequences or [query_sequence]\n    self.descriptions = self.descriptions or ['Original query']\n\n    # Check if the 1st MSA sequence matches the 
query sequence. Since it may be\n    # mutated by the search tool (jackhmmer) check using the featurized version.\n    if not sequences_are_feature_equivalent(\n        self.sequences[0], query_sequence, chain_poly_type\n    ):\n      raise ValueError(\n          f'First MSA sequence {self.sequences[0]} is not the {query_sequence=}'\n      )\n\n  @classmethod\n  def from_multiple_msas(\n      cls, msas: Sequence[Self], deduplicate: bool = True\n  ) -> Self:\n    \"\"\"Initializes the MSA from multiple MSAs.\n\n    Args:\n      msas: A sequence of Msa objects representing individual MSAs produced by\n        different tools/dbs.\n      deduplicate: If True, the MSA sequences will be deduplicated in the input\n        order. Lowercase letters (insertions) are ignored when deduplicating.\n\n    Returns:\n      An Msa object created by merging multiple MSAs.\n    \"\"\"\n    if not msas:\n      raise ValueError('At least one MSA must be provided.')\n\n    query_sequence = msas[0].query_sequence\n    chain_poly_type = msas[0].chain_poly_type\n    sequences = []\n    descriptions = []\n\n    for msa in msas:\n      if msa.query_sequence != query_sequence:\n        raise ValueError(\n            f'Query sequences must match: {[m.query_sequence for m in msas]}'\n        )\n      if msa.chain_poly_type != chain_poly_type:\n        raise ValueError(\n            f'Chain poly types must match: {[m.chain_poly_type for m in msas]}'\n        )\n      sequences.extend(msa.sequences)\n      descriptions.extend(msa.descriptions)\n\n    return cls(\n        query_sequence=query_sequence,\n        chain_poly_type=chain_poly_type,\n        sequences=sequences,\n        descriptions=descriptions,\n        deduplicate=deduplicate,\n    )\n\n  @classmethod\n  def from_multiple_a3ms(\n      cls, a3ms: Sequence[str], chain_poly_type: str, deduplicate: bool = True\n  ) -> Self:\n    \"\"\"Initializes the MSA from multiple A3M strings.\n\n    Args:\n      a3ms: A sequence of A3M strings 
representing individual MSAs produced by\n        different tools/dbs.\n      chain_poly_type: Polymer type of the query sequence, see mmcif_names.\n      deduplicate: If True, the MSA sequences will be deduplicated in the input\n        order. Lowercase letters (insertions) are ignored when deduplicating.\n\n    Returns:\n      An Msa object created by merging multiple A3Ms.\n    \"\"\"\n    if not a3ms:\n      raise ValueError('At least one A3M must be provided.')\n\n    query_sequence = None\n    all_sequences = []\n    all_descriptions = []\n\n    for a3m in a3ms:\n      sequences, descriptions = parsers.parse_fasta(a3m)\n      if query_sequence is None:\n        query_sequence = sequences[0]\n\n      if sequences[0] != query_sequence:\n        raise ValueError(\n            f'Query sequences must match: {sequences[0]=} != {query_sequence=}'\n        )\n      all_sequences.extend(sequences)\n      all_descriptions.extend(descriptions)\n\n    return cls(\n        query_sequence=query_sequence,\n        chain_poly_type=chain_poly_type,\n        sequences=all_sequences,\n        descriptions=all_descriptions,\n        deduplicate=deduplicate,\n    )\n\n  @classmethod\n  def from_a3m(\n      cls,\n      query_sequence: str,\n      chain_poly_type: str,\n      a3m: str,\n      max_depth: int | None = None,\n      deduplicate: bool = True,\n  ) -> Self:\n    \"\"\"Parses the single A3M and builds the Msa object.\"\"\"\n    sequences, descriptions = parsers.parse_fasta(a3m)\n\n    if max_depth is not None and 0 < max_depth < len(sequences):\n      logging.info(\n          'MSA cropped from depth of %d to %d for %s.',\n          len(sequences),\n          max_depth,\n          query_sequence,\n      )\n      sequences = sequences[:max_depth]\n      descriptions = descriptions[:max_depth]\n\n    return cls(\n        query_sequence=query_sequence,\n        chain_poly_type=chain_poly_type,\n        sequences=sequences,\n        descriptions=descriptions,\n        
deduplicate=deduplicate,\n    )\n\n  @classmethod\n  def from_empty(cls, query_sequence: str, chain_poly_type: str) -> Self:\n    \"\"\"Creates an empty Msa containing just the query sequence.\"\"\"\n    return cls(\n        query_sequence=query_sequence,\n        chain_poly_type=chain_poly_type,\n        sequences=[],\n        descriptions=[],\n        deduplicate=False,\n    )\n\n  @property\n  def depth(self) -> int:\n    return len(self.sequences)\n\n  def __repr__(self) -> str:\n    return f'Msa({self.depth} sequences, {self.chain_poly_type})'\n\n  def to_a3m(self) -> str:\n    \"\"\"Returns the MSA in the A3M format.\"\"\"\n    a3m_lines = []\n    for desc, seq in zip(self.descriptions, self.sequences, strict=True):\n      a3m_lines.append(f'>{desc}')\n      a3m_lines.append(seq)\n    return '\\n'.join(a3m_lines) + '\\n'\n\n  def featurize(self) -> MutableMapping[str, np.ndarray]:\n    \"\"\"Featurises the MSA and returns a map of feature names to features.\n\n    Returns:\n      A dictionary mapping feature names to values.\n\n    Raises:\n      msa.Error:\n        * If the sequences in the MSA don't have the same length after deletions\n          (lower case letters) are removed.\n        * If the MSA contains an unknown amino acid code.\n        * If there are no sequences after aligning.\n    \"\"\"\n    try:\n      msa, deletion_matrix = msa_features.extract_msa_features(\n          msa_sequences=self.sequences, chain_poly_type=self.chain_poly_type\n      )\n    except ValueError as e:\n      raise Error(f'Error extracting MSA or deletion features: {e}') from e\n\n    if msa.shape == (0, 0):\n      raise Error(f'Empty MSA feature for {self}')\n\n    species_ids = msa_features.extract_species_ids(self.descriptions)\n\n    return {\n        'msa_species_identifiers': np.array(species_ids, dtype=object),\n        'num_alignments': np.array(self.depth, dtype=np.int32),\n        'msa': msa,\n        'deletion_matrix': deletion_matrix,\n    }\n\n\ndef 
get_msa_tool(\n    msa_tool_config: msa_config.JackhmmerConfig | msa_config.NhmmerConfig,\n) -> msa_tool.MsaTool:\n  \"\"\"Returns the requested MSA tool.\"\"\"\n\n  match msa_tool_config:\n    case msa_config.JackhmmerConfig():\n      return jackhmmer.Jackhmmer(\n          binary_path=msa_tool_config.binary_path,\n          database_path=msa_tool_config.database_config.path,\n          n_cpu=msa_tool_config.n_cpu,\n          n_iter=msa_tool_config.n_iter,\n          e_value=msa_tool_config.e_value,\n          z_value=msa_tool_config.z_value,\n          max_sequences=msa_tool_config.max_sequences,\n      )\n    case msa_config.NhmmerConfig():\n      return nhmmer.Nhmmer(\n          binary_path=msa_tool_config.binary_path,\n          hmmalign_binary_path=msa_tool_config.hmmalign_binary_path,\n          hmmbuild_binary_path=msa_tool_config.hmmbuild_binary_path,\n          database_path=msa_tool_config.database_config.path,\n          n_cpu=msa_tool_config.n_cpu,\n          e_value=msa_tool_config.e_value,\n          max_sequences=msa_tool_config.max_sequences,\n          alphabet=msa_tool_config.alphabet,\n      )\n    case _:\n      raise ValueError(f'Unknown MSA tool: {msa_tool_config}.')\n\n\ndef get_msa(\n    target_sequence: str,\n    run_config: msa_config.RunConfig,\n    chain_poly_type: str,\n    deduplicate: bool = False,\n) -> Msa:\n  \"\"\"Computes the MSA for a given query sequence.\n\n  Args:\n    target_sequence: The target amino-acid sequence.\n    run_config: MSA run configuration.\n    chain_poly_type: The type of chain for which to get an MSA.\n    deduplicate: If True, the MSA sequences will be deduplicated in the input\n      order. 
Lowercase letters (insertions) are ignored when deduplicating.\n\n  Returns:\n    Aligned MSA sequences.\n  \"\"\"\n\n  return Msa.from_a3m(\n      query_sequence=target_sequence,\n      chain_poly_type=chain_poly_type,\n      a3m=get_msa_tool(run_config.config).query(target_sequence).a3m,\n      max_depth=run_config.crop_size,\n      deduplicate=deduplicate,\n  )\n"
  },
  {
    "path": "src/alphafold3/data/msa_config.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Genetic search config settings for data pipelines.\"\"\"\n\nimport dataclasses\nimport datetime\nfrom typing import Self\nfrom alphafold3.constants import mmcif_names\n\n\ndef _validate_chain_poly_type(chain_poly_type: str) -> None:\n  if chain_poly_type not in mmcif_names.STANDARD_POLYMER_CHAIN_TYPES:\n    raise ValueError(\n        'chain_poly_type must be one of'\n        f' {mmcif_names.STANDARD_POLYMER_CHAIN_TYPES}: {chain_poly_type}'\n    )\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True, slots=True)\nclass DatabaseConfig:\n  \"\"\"Configuration for a database.\"\"\"\n\n  name: str\n  path: str\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True, slots=True)\nclass JackhmmerConfig:\n  \"\"\"Configuration for a jackhmmer run.\n\n  Attributes:\n      binary_path: Path to the binary of the msa tool.\n      database_config: Database configuration.\n      n_cpu: An integer with the number of CPUs to use.\n      n_iter: An integer with the number of database search iterations.\n      e_value: e-value for the database lookup.\n      z_value: The Z-value representing the database size in number of sequences\n        for E-value and domain E-value calculation. Must be set for sharded\n        databases.\n      dom_z_value: The Z-value representing the database size in number of\n        sequences for domain E-value calculation. 
Must be set for sharded\n        databases.\n      max_sequences: Max sequences to return in MSA.\n      max_parallel_shards: If given, the maximum number of shards to search\n        against in parallel. If None, one Jackhmmer instance will be run per\n        shard. Only applicable if the database is sharded.\n  \"\"\"\n\n  binary_path: str\n  database_config: DatabaseConfig\n  n_cpu: int\n  n_iter: int\n  e_value: float\n  z_value: int | None\n  dom_z_value: int | None\n  max_sequences: int\n  max_parallel_shards: int | None = None\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True, slots=True)\nclass NhmmerConfig:\n  \"\"\"Configuration for a nhmmer run.\n\n  Attributes:\n      binary_path: Path to the binary of the msa tool.\n      hmmalign_binary_path: Path to the hmmalign binary.\n      hmmbuild_binary_path: Path to the hmmbuild binary.\n      database_config: Database configuration.\n      n_cpu: An integer with the number of CPUs to use.\n      e_value: e-value for the database lookup.\n      z_value: The Z-value representing the database size in megabases for\n        E-value calculation. Allows fractional values. Must be set for sharded\n        databases.\n      max_sequences: Max sequences to return in MSA.\n      alphabet: The alphabet when building a profile with hmmbuild.\n      max_parallel_shards: If given, the maximum number of shards to search\n        against in parallel. 
If None, one Nhmmer instance will be run per shard.\n        Only applicable if the database is sharded.\n  \"\"\"\n\n  binary_path: str\n  hmmalign_binary_path: str\n  hmmbuild_binary_path: str\n  database_config: DatabaseConfig\n  n_cpu: int\n  e_value: float\n  z_value: float | None\n  max_sequences: int\n  alphabet: str | None\n  max_parallel_shards: int | None = None\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True, slots=True)\nclass RunConfig:\n  \"\"\"Configuration for an MSA run.\n\n  Attributes:\n    config: MSA tool config.\n    chain_poly_type: The chain type for which the tools will be run.\n    crop_size: The maximum number of sequences to keep in the MSA. If None, all\n      sequences are kept. Note that the query is included in the MSA, so it\n      doesn't make sense to set this to less than 2.\n  \"\"\"\n\n  config: JackhmmerConfig | NhmmerConfig\n  chain_poly_type: str\n  crop_size: int | None\n\n  def __post_init__(self):\n    if self.crop_size is not None and self.crop_size < 2:\n      raise ValueError(f'crop_size must be None or >= 2: {self.crop_size}')\n\n    _validate_chain_poly_type(self.chain_poly_type)\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True, slots=True)\nclass HmmsearchConfig:\n  \"\"\"Configuration for a hmmsearch.\"\"\"\n\n  hmmsearch_binary_path: str\n  hmmbuild_binary_path: str\n\n  e_value: float\n  inc_e: float\n  dom_e: float\n  incdom_e: float\n  alphabet: str = 'amino'\n  filter_f1: float | None = None\n  filter_f2: float | None = None\n  filter_f3: float | None = None\n  filter_max: bool = False\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True, slots=True)\nclass TemplateToolConfig:\n  \"\"\"Configuration for a template tool.\"\"\"\n\n  database_path: str\n  chain_poly_type: str\n  hmmsearch_config: HmmsearchConfig\n  max_a3m_query_sequences: int | None = 300\n\n  def __post_init__(self):\n    _validate_chain_poly_type(self.chain_poly_type)\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True, 
slots=True)\nclass TemplateFilterConfig:\n  \"\"\"Configuration for a template filter.\"\"\"\n\n  max_subsequence_ratio: float | None\n  min_align_ratio: float | None\n  min_hit_length: int | None\n  deduplicate_sequences: bool\n  max_hits: int | None\n  max_template_date: datetime.date\n\n  @classmethod\n  def no_op_filter(cls) -> Self:\n    \"\"\"Returns a config for filter that keeps everything.\"\"\"\n    return cls(\n        max_subsequence_ratio=None,\n        min_align_ratio=None,\n        min_hit_length=None,\n        deduplicate_sequences=False,\n        max_hits=None,\n        max_template_date=datetime.date(3000, 1, 1),  # Very far in the future.\n    )\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True, slots=True)\nclass TemplatesConfig:\n  \"\"\"Configuration for the template search pipeline.\"\"\"\n\n  template_tool_config: TemplateToolConfig\n  filter_config: TemplateFilterConfig\n"
  },
  {
    "path": "src/alphafold3/data/msa_features.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Utilities for computing MSA features.\"\"\"\n\nfrom collections.abc import Sequence\nimport re\nfrom alphafold3.constants import mmcif_names\nimport numpy as np\n\n_PROTEIN_TO_ID = {\n    'A': 0,\n    'B': 3,  # Same as D.\n    'C': 4,\n    'D': 3,\n    'E': 6,\n    'F': 13,\n    'G': 7,\n    'H': 8,\n    'I': 9,\n    'J': 20,  # Same as unknown (X).\n    'K': 11,\n    'L': 10,\n    'M': 12,\n    'N': 2,\n    'O': 20,  # Same as unknown (X).\n    'P': 14,\n    'Q': 5,\n    'R': 1,\n    'S': 15,\n    'T': 16,\n    'U': 4,  # Same as C.\n    'V': 19,\n    'W': 17,\n    'X': 20,\n    'Y': 18,\n    'Z': 6,  # Same as E.\n    '-': 21,\n}\n\n_RNA_TO_ID = {\n    # Map non-standard residues to UNK_NUCLEIC (N) -> 30\n    **{chr(i): 30 for i in range(ord('A'), ord('Z') + 1)},\n    # Continue the RNA indices from where Protein indices left off.\n    '-': 21,\n    'A': 22,\n    'G': 23,\n    'C': 24,\n    'U': 25,\n}\n\n_DNA_TO_ID = {\n    # Map non-standard residues to UNK_NUCLEIC (N) -> 30\n    **{chr(i): 30 for i in range(ord('A'), ord('Z') + 1)},\n    # Continue the DNA indices from where RNA indices left off.\n    '-': 21,\n    'A': 26,\n    'G': 27,\n    'C': 28,\n    'T': 29,\n}\n\n\ndef extract_msa_features(\n    msa_sequences: Sequence[str], chain_poly_type: str\n) -> tuple[np.ndarray, np.ndarray]:\n  \"\"\"Extracts MSA features.\n\n  Example:\n  The input raw MSA is: `[[\"AAAAAA\"], [\"Ai-CiDiiiEFa\"]]`\n  The output MSA 
will be: `[[\"AAAAAA\"], [\"A-CDEF\"]]`\n  The deletions will be: `[[0, 0, 0, 0, 0, 0], [0, 1, 0, 1, 3, 0]]`\n\n  Args:\n    msa_sequences: A list of strings, each string with one MSA sequence. Each\n      string must have the same, constant number of non-lowercase (matching)\n      residues.\n    chain_poly_type: Either 'polypeptide(L)' (protein), 'polyribonucleotide'\n      (RNA), or 'polydeoxyribonucleotide' (DNA). Use the appropriate string\n      constant from mmcif_names.py.\n\n  Returns:\n    A tuple with:\n    * MSA array of shape (num_seq, num_res) that contains only the uppercase\n      characters or gaps (-) from the original MSA.\n    * Deletions array of shape (num_seq, num_res) that contains the number\n      of deletions (lowercase letters in the MSA) to the left from each\n      non-deleted residue (uppercase letters in the MSA).\n\n  Raises:\n    ValueError if any of the preconditions are not met.\n  \"\"\"\n\n  # Select the appropriate character map based on the chain type.\n  if chain_poly_type == mmcif_names.RNA_CHAIN:\n    char_map = _RNA_TO_ID\n  elif chain_poly_type == mmcif_names.DNA_CHAIN:\n    char_map = _DNA_TO_ID\n  elif chain_poly_type == mmcif_names.PROTEIN_CHAIN:\n    char_map = _PROTEIN_TO_ID\n  else:\n    raise ValueError(f'{chain_poly_type=} invalid.')\n\n  # Handle empty MSA.\n  if not msa_sequences:\n    empty_msa = np.array([], dtype=np.int32).reshape((0, 0))\n    empty_deletions = np.array([], dtype=np.int32).reshape((0, 0))\n    return empty_msa, empty_deletions\n\n  # Get the number of rows and columns in the MSA.\n  num_rows = len(msa_sequences)\n  num_cols = sum(1 for c in msa_sequences[0] if c in char_map)\n\n  # Initialize the output arrays.\n  msa_arr = np.zeros((num_rows, num_cols), dtype=np.int32)\n  deletions_arr = np.zeros((num_rows, num_cols), dtype=np.int32)\n\n  # Populate the output arrays.\n  for problem_row, msa_sequence in enumerate(msa_sequences):\n    deletion_count = 0\n    upper_count = 0\n    problem_col 
= 0\n    problems = []\n    for current in msa_sequence:\n      msa_id = char_map.get(current, -1)\n      if msa_id == -1:\n        if not current.islower():\n          problems.append(f'({problem_row}, {problem_col}):{current}')\n        deletion_count += 1\n      else:\n        # Check the access is safe before writing to the array.\n        # We don't need to check problem_row since it's guaranteed to be within\n        # the array bounds, while upper_count is incremented in the loop.\n        if upper_count < deletions_arr.shape[1]:\n          deletions_arr[problem_row, upper_count] = deletion_count\n          msa_arr[problem_row, upper_count] = msa_id\n        deletion_count = 0\n        upper_count += 1\n      problem_col += 1\n    if problems:\n      raise ValueError(\n          f\"Unknown residues in MSA: {', '.join(problems)}. \"\n          f'target_sequence: {msa_sequences[0]}'\n      )\n    if upper_count != num_cols:\n      raise ValueError(\n          'Invalid shape all strings must have the same number '\n          'of non-lowercase characters; First string has '\n          f\"{num_cols} non-lowercase characters but '{msa_sequence}' has \"\n          f'{upper_count}. target_sequence: {msa_sequences[0]}'\n      )\n\n  return msa_arr, deletions_arr\n\n\n# UniProtKB SwissProt/TrEMBL dbs have the following description format:\n# `db|UniqueIdentifier|EntryName`, e.g. `sp|P0C2L1|A3X1_LOXLA` or\n# `tr|A0A146SKV9|A0A146SKV9_FUNHE`.\n_UNIPROT_ENTRY_NAME_REGEX = re.compile(\n    # UniProtKB TrEMBL or SwissProt database.\n    r'(?:tr|sp)\\|'\n    # A primary accession number of the UniProtKB entry.\n    r'(?:[A-Z0-9]{6,10})'\n    # Occasionally there is an isoform suffix (e.g. 
_1 or _10) which we ignore.\n    r'(?:_\\d+)?\\|'\n    # TrEMBL: Same as AccessionId (6-10 characters).\n    # SwissProt: A mnemonic protein identification code (1-5 characters).\n    r'(?:[A-Z0-9]{1,10}_)'\n    # A mnemonic species identification code.\n    r'(?P<SpeciesId>[A-Z0-9]{1,5})'\n)\n\n\ndef extract_species_ids(msa_descriptions: Sequence[str]) -> Sequence[str]:\n  \"\"\"Extracts species ID from MSA UniProtKB sequence identifiers.\n\n  Args:\n    msa_descriptions: The descriptions (the FASTA/A3M comment line) for each of\n      the sequences.\n\n  Returns:\n    One species ID per description line, in input order: the UniProtKB species\n    ID if the description matches the regex, an empty string otherwise.\n  \"\"\"\n  species_ids = []\n  for msa_description in msa_descriptions:\n    msa_description = msa_description.strip()\n    match = _UNIPROT_ENTRY_NAME_REGEX.match(msa_description)\n    if match:\n      species_ids.append(match.group('SpeciesId'))\n    else:\n      # No UniProtKB entry name matched: record a blank species ID so that the\n      # output keeps one entry per description.\n      species_ids.append('')\n  return species_ids\n"
  },
  {
    "path": "src/alphafold3/data/msa_identifiers.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Utilities for extracting identifiers from MSA sequence descriptions.\"\"\"\n\nimport dataclasses\nimport re\n\n\n# Sequences coming from UniProtKB database come in the\n# `db|UniqueIdentifier|EntryName` format, e.g. `tr|A0A146SKV9|A0A146SKV9_FUNHE`\n# or `sp|P0C2L1|A3X1_LOXLA` (for TREMBL/Swiss-Prot respectively).\n_UNIPROT_PATTERN = re.compile(\n    r\"\"\"\n    ^\n    # UniProtKB/TrEMBL or UniProtKB/Swiss-Prot\n    (?:tr|sp)\n    \\|\n    # A primary accession number of the UniProtKB entry.\n    (?P<AccessionIdentifier>[A-Za-z0-9]{6,10})\n    # Occasionally there is a _0 or _1 isoform suffix, which we ignore.\n    (?:_\\d)?\n    \\|\n    # TREMBL repeats the accession ID here. 
Swiss-Prot has a mnemonic\n    # protein ID code.\n    (?:[A-Za-z0-9]+)\n    _\n    # A mnemonic species identification code.\n    (?P<SpeciesIdentifier>([A-Za-z0-9]){1,5})\n    # Small BFD uses a final value after an underscore, which we ignore.\n    (?:_\\d+)?\n    $\n    \"\"\",\n    re.VERBOSE,\n)\n\n\n@dataclasses.dataclass(frozen=True)\nclass Identifiers:\n  species_id: str = ''\n\n\ndef _parse_sequence_identifier(msa_sequence_identifier: str) -> Identifiers:\n  \"\"\"Gets species from an msa sequence identifier.\n\n  The sequence identifier has the format specified by _UNIPROT_PATTERN.\n  An example of a sequence identifier: `tr|A0A146SKV9|A0A146SKV9_FUNHE`\n\n  Args:\n    msa_sequence_identifier: a sequence identifier.\n\n  Returns:\n    An `Identifiers` instance with species_id. The species_id is empty in the\n    case where no identifier was found.\n  \"\"\"\n  matches = re.search(_UNIPROT_PATTERN, msa_sequence_identifier.strip())\n  if matches:\n    return Identifiers(species_id=matches.group('SpeciesIdentifier'))\n  return Identifiers()\n\n\ndef _extract_sequence_identifier(description: str) -> str | None:\n  \"\"\"Extracts sequence identifier from description. Returns None if no match.\"\"\"\n  split_description = description.split()\n  if split_description:\n    return split_description[0].partition('/')[0]\n  else:\n    return None\n\n\ndef get_identifiers(description: str) -> Identifiers:\n  \"\"\"Computes extra MSA features from the description.\"\"\"\n  sequence_identifier = _extract_sequence_identifier(description)\n  if sequence_identifier is None:\n    return Identifiers()\n  else:\n    return _parse_sequence_identifier(sequence_identifier)\n"
  },
  {
    "path": "src/alphafold3/data/parsers.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Functions for parsing various file formats.\"\"\"\n\nfrom collections.abc import Iterable, Sequence\nfrom typing import IO, TypeAlias\n\nfrom alphafold3.cpp import fasta_iterator\nfrom alphafold3.cpp import msa_conversion\n\n\nDeletionMatrix: TypeAlias = Sequence[Sequence[int]]\n\n\ndef lazy_parse_fasta_string(fasta_string: str) -> Iterable[tuple[str, str]]:\n  \"\"\"Lazily parses a FASTA/A3M string and yields (sequence, description) tuples.\n\n  This implementation is more memory friendly than `fasta_sequence` while\n  offering comparable performance. The underlying implementation is in C++ and\n  is therefore faster than a pure Python implementation.\n\n  Use this method when parsing FASTA files where you already have the FASTA\n  string, but need to control how far you iterate through its sequences.\n\n  Arguments:\n    fasta_string: A string with the contents of FASTA/A3M file.\n\n  Returns:\n    Iterator of (sequence, description). In the description, the leading \">\" is\n    stripped.\n\n  Raises:\n    ValueError if the FASTA/A3M file is invalid, e.g. 
empty.\n  \"\"\"\n\n  # The lifetime of the FastaStringIterator is tied to the lifetime of\n  # fasta_string - fasta_string must be kept while the iterator is in use.\n  return fasta_iterator.FastaStringIterator(fasta_string)\n\n\ndef parse_fasta(fasta_string: str) -> tuple[Sequence[str], Sequence[str]]:\n  \"\"\"Parses FASTA string and returns list of strings with amino-acid sequences.\n\n  Arguments:\n    fasta_string: The string contents of a FASTA file.\n\n  Returns:\n    A tuple of two lists:\n    * A list of sequences.\n    * A list of sequence descriptions taken from the comment lines. In the\n      same order as the sequences.\n  \"\"\"\n  return fasta_iterator.parse_fasta_include_descriptions(fasta_string)\n\n\ndef convert_a3m_to_stockholm(a3m: str, max_seqs: int | None = None) -> str:\n  \"\"\"Converts MSA in the A3M format to the Stockholm format.\"\"\"\n  sequences, descriptions = parse_fasta(a3m)\n  if max_seqs is not None:\n    sequences = sequences[:max_seqs]\n    descriptions = descriptions[:max_seqs]\n\n  stockholm = ['# STOCKHOLM 1.0', '']\n\n  # Add the Stockholm header with the sequence metadata.\n  names = []\n  for i, description in enumerate(descriptions):\n    name, _, rest = description.replace('\\t', ' ').partition(' ')\n    # Ensure that the names are unique - stockholm format requires that\n    # the sequence names are unique.\n    name = f'{name}_{i}'\n    names.append(name)\n    # Avoid zero-length description due to historic hmmbuild parsing bug.\n    desc = rest.strip() or '<EMPTY>'\n    stockholm.append(f'#=GS {name.strip()} DE {desc}')\n  stockholm.append('')\n\n  # Convert insertions in a sequence into gaps in all other sequences that don't\n  # have an insertion in that column as well.\n  sequences = msa_conversion.convert_a3m_to_stockholm(sequences)\n\n  # Add the MSA data.\n  max_name_width = max(len(name) for name in names)\n  for name, sequence in zip(names, sequences, strict=True):\n    # Align the names to the left and pad 
with spaces to the maximum length.\n    stockholm.append(f'{name:<{max_name_width}s} {sequence}')\n\n  # Add the reference annotation for the query (the first sequence).\n  ref_annotation = ''.join('.' if c == '-' else 'x' for c in sequences[0])\n  stockholm.append(f'{\"#=GC RF\":<{max_name_width}s} {ref_annotation}')\n  stockholm.append('//')\n\n  return '\\n'.join(stockholm)\n\n\ndef convert_stockholm_to_a3m(\n    stockholm: IO[str],\n    max_sequences: int | None = None,\n    remove_first_row_gaps: bool = True,\n    linewidth: int | None = None,\n) -> str:\n  \"\"\"Converts MSA in Stockholm format to the A3M format.\"\"\"\n  descriptions = {}\n  sequences = {}\n  reached_max_sequences = False\n\n  if linewidth is not None and linewidth <= 0:\n    raise ValueError('linewidth must be > 0 or None')\n\n  for line in stockholm:\n    reached_max_sequences = max_sequences and len(sequences) >= max_sequences\n    line = line.strip()\n    # Ignore blank lines, markup and end symbols - remainder are alignment\n    # sequence parts.\n    if not line or line.startswith(('#', '//')):\n      continue\n    seqname, aligned_seq = line.split(maxsplit=1)\n    if seqname not in sequences:\n      if reached_max_sequences:\n        continue\n      sequences[seqname] = ''\n    sequences[seqname] += aligned_seq\n\n  if not sequences:\n    return ''\n\n  stockholm.seek(0)\n  for line in stockholm:\n    line = line.strip()\n    if line[:4] == '#=GS':\n      # Description row - example format is:\n      # #=GS UniRef90_Q9H5Z4/4-78            DE [subseq from] cDNA: FLJ22755 ...\n      columns = line.split(maxsplit=3)\n      seqname, feature = columns[1:3]\n      value = columns[3] if len(columns) == 4 else ''\n      if feature != 'DE':\n        continue\n      if reached_max_sequences and seqname not in sequences:\n        continue\n      descriptions[seqname] = value\n      if len(descriptions) == len(sequences):\n        break\n\n  assert len(descriptions) <= len(sequences)\n\n  # 
Convert sto format to a3m line by line\n  a3m_sequences = {}\n  # query_sequence is assumed to be the first sequence\n  query_sequence = next(iter(sequences.values()))\n  for seqname, sto_sequence in sequences.items():\n    if remove_first_row_gaps:\n      a3m_sequences[seqname] = msa_conversion.align_sequence_to_gapless_query(\n          sequence=sto_sequence, query_sequence=query_sequence\n      ).replace('.', '')\n    else:\n      a3m_sequences[seqname] = sto_sequence.replace('.', '')\n\n  fasta_chunks = []\n\n  for seqname, seq in a3m_sequences.items():\n    fasta_chunks.append(f'>{seqname} {descriptions.get(seqname, \"\")}')\n\n    if linewidth:\n      fasta_chunks.extend(\n          seq[i : linewidth + i] for i in range(0, len(seq), linewidth)\n      )\n    else:\n      fasta_chunks.append(seq)\n\n  return '\\n'.join(fasta_chunks) + '\\n'  # Include terminating newline.\n"
  },
  {
    "path": "src/alphafold3/data/pipeline.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Functions for running the MSA and template tools for the AlphaFold model.\"\"\"\n\nfrom concurrent import futures\nimport dataclasses\nimport datetime\nimport functools\nimport logging\nimport time\n\nfrom alphafold3.common import folding_input\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.data import msa\nfrom alphafold3.data import msa_config\nfrom alphafold3.data import structure_stores\nfrom alphafold3.data import templates as templates_lib\n\n\n# Cache to avoid re-running template search for the same sequence in homomers.\n@functools.cache\ndef _get_protein_templates(\n    sequence: str,\n    input_msa_a3m: str,\n    run_template_search: bool,\n    templates_config: msa_config.TemplatesConfig,\n    pdb_database_path: str,\n) -> templates_lib.Templates:\n  \"\"\"Searches for templates for a single protein chain.\"\"\"\n  if run_template_search:\n    templates_start_time = time.time()\n    logging.info('Getting protein templates for sequence %s', sequence)\n    protein_templates = templates_lib.Templates.from_seq_and_a3m(\n        query_sequence=sequence,\n        msa_a3m=input_msa_a3m,\n        max_template_date=templates_config.filter_config.max_template_date,\n        database_path=templates_config.template_tool_config.database_path,\n        hmmsearch_config=templates_config.template_tool_config.hmmsearch_config,\n        max_a3m_query_sequences=None,\n        
chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n        structure_store=structure_stores.StructureStore(pdb_database_path),\n        filter_config=templates_config.filter_config,\n    )\n    logging.info(\n        'Getting %d protein templates took %.2f seconds for sequence %s',\n        protein_templates.num_hits,\n        time.time() - templates_start_time,\n        sequence,\n    )\n  else:\n    logging.info('Skipping template search for sequence %s', sequence)\n    protein_templates = templates_lib.Templates(\n        query_sequence=sequence,\n        hits=[],\n        max_template_date=templates_config.filter_config.max_template_date,\n        structure_store=structure_stores.StructureStore(pdb_database_path),\n    )\n  return protein_templates\n\n\n# Cache to avoid re-running the MSA tools for the same sequence in homomers.\n@functools.cache\ndef _get_protein_msa_and_templates(\n    sequence: str,\n    run_template_search: bool,\n    uniref90_msa_config: msa_config.RunConfig,\n    mgnify_msa_config: msa_config.RunConfig,\n    small_bfd_msa_config: msa_config.RunConfig,\n    uniprot_msa_config: msa_config.RunConfig,\n    templates_config: msa_config.TemplatesConfig,\n    pdb_database_path: str,\n) -> tuple[msa.Msa, msa.Msa, templates_lib.Templates]:\n  \"\"\"Processes a single protein chain.\"\"\"\n  logging.info('Getting protein MSAs for sequence %s', sequence)\n  msa_start_time = time.time()\n  # Run various MSA tools in parallel. 
Use a ThreadPoolExecutor because\n  # they're not blocked by the GIL, as they're sub-shelled out.\n  with futures.ThreadPoolExecutor(max_workers=4) as executor:\n    uniref90_msa_future = executor.submit(\n        msa.get_msa,\n        target_sequence=sequence,\n        run_config=uniref90_msa_config,\n        chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n    )\n    mgnify_msa_future = executor.submit(\n        msa.get_msa,\n        target_sequence=sequence,\n        run_config=mgnify_msa_config,\n        chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n    )\n    small_bfd_msa_future = executor.submit(\n        msa.get_msa,\n        target_sequence=sequence,\n        run_config=small_bfd_msa_config,\n        chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n    )\n    uniprot_msa_future = executor.submit(\n        msa.get_msa,\n        target_sequence=sequence,\n        run_config=uniprot_msa_config,\n        chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n    )\n  uniref90_msa = uniref90_msa_future.result()\n  mgnify_msa = mgnify_msa_future.result()\n  small_bfd_msa = small_bfd_msa_future.result()\n  uniprot_msa = uniprot_msa_future.result()\n  logging.info(\n      'Getting protein MSAs took %.2f seconds for sequence %s',\n      time.time() - msa_start_time,\n      sequence,\n  )\n\n  logging.info('Deduplicating MSAs for sequence %s', sequence)\n  msa_dedupe_start_time = time.time()\n  with futures.ThreadPoolExecutor() as executor:\n    unpaired_protein_msa_future = executor.submit(\n        msa.Msa.from_multiple_msas,\n        msas=[uniref90_msa, small_bfd_msa, mgnify_msa],\n        deduplicate=True,\n    )\n    paired_protein_msa_future = executor.submit(\n        msa.Msa.from_multiple_msas, msas=[uniprot_msa], deduplicate=False\n    )\n  unpaired_protein_msa = unpaired_protein_msa_future.result()\n  paired_protein_msa = paired_protein_msa_future.result()\n  logging.info(\n      'Deduplicating MSAs took %.2f seconds for sequence %s, found %d unpaired'\n      ' sequences, %d 
paired sequences',\n      time.time() - msa_dedupe_start_time,\n      sequence,\n      unpaired_protein_msa.depth,\n      paired_protein_msa.depth,\n  )\n\n  protein_templates = _get_protein_templates(\n      sequence=sequence,\n      input_msa_a3m=unpaired_protein_msa.to_a3m(),\n      run_template_search=run_template_search,\n      templates_config=templates_config,\n      pdb_database_path=pdb_database_path,\n  )\n\n  return unpaired_protein_msa, paired_protein_msa, protein_templates\n\n\n# Cache to avoid re-running the Nhmmer for the same sequence in homomers.\n@functools.cache\ndef _get_rna_msa(\n    sequence: str,\n    nt_rna_msa_config: msa_config.NhmmerConfig,\n    rfam_msa_config: msa_config.NhmmerConfig,\n    rnacentral_msa_config: msa_config.NhmmerConfig,\n) -> msa.Msa:\n  \"\"\"Processes a single RNA chain.\"\"\"\n  logging.info('Getting RNA MSAs for sequence %s', sequence)\n  rna_msa_start_time = time.time()\n  # Run various MSA tools in parallel. Use a ThreadPoolExecutor because\n  # they're not blocked by the GIL, as they're sub-shelled out.\n  with futures.ThreadPoolExecutor() as executor:\n    nt_rna_msa_future = executor.submit(\n        msa.get_msa,\n        target_sequence=sequence,\n        run_config=nt_rna_msa_config,\n        chain_poly_type=mmcif_names.RNA_CHAIN,\n    )\n    rfam_msa_future = executor.submit(\n        msa.get_msa,\n        target_sequence=sequence,\n        run_config=rfam_msa_config,\n        chain_poly_type=mmcif_names.RNA_CHAIN,\n    )\n    rnacentral_msa_future = executor.submit(\n        msa.get_msa,\n        target_sequence=sequence,\n        run_config=rnacentral_msa_config,\n        chain_poly_type=mmcif_names.RNA_CHAIN,\n    )\n  nt_rna_msa = nt_rna_msa_future.result()\n  rfam_msa = rfam_msa_future.result()\n  rnacentral_msa = rnacentral_msa_future.result()\n  rna_msa = msa.Msa.from_multiple_msas(\n      msas=[rfam_msa, rnacentral_msa, nt_rna_msa],\n      deduplicate=True,\n  )\n  logging.info(\n      'Getting RNA 
MSAs took %.2f seconds for sequence %s, found %d unpaired'\n      ' sequences',\n      time.time() - rna_msa_start_time,\n      sequence,\n      rna_msa.depth,\n  )\n  return rna_msa\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass DataPipelineConfig:\n  \"\"\"The configuration for the data pipeline.\n\n  Attributes:\n    jackhmmer_binary_path: Jackhmmer binary path, used for protein MSA search.\n    nhmmer_binary_path: Nhmmer binary path, used for RNA MSA search.\n    hmmalign_binary_path: Hmmalign binary path, used to align hits to the query\n      profile.\n    hmmsearch_binary_path: Hmmsearch binary path, used for template search.\n    hmmbuild_binary_path: Hmmbuild binary path, used to build HMM profile from\n      raw MSA in template search.\n    small_bfd_database_path: Small BFD database path, used for protein MSA\n      search.\n    small_bfd_z_value: The Z-value representing the database size in number of\n      sequences for E-value calculation. Must be set for sharded databases.\n    mgnify_database_path: Mgnify database path, used for protein MSA search.\n    mgnify_z_value: The Z-value representing the database size in number of\n      sequences for E-value calculation. Must be set for sharded databases.\n    uniprot_cluster_annot_database_path: Uniprot database path, used for protein\n      paired MSA search.\n    uniprot_cluster_annot_z_value: The Z-value representing the database size in\n      number of sequences for E-value calculation. Must be set for sharded\n      databases.\n    uniref90_database_path: UniRef90 database path, used for MSA search, and the\n      MSA obtained by searching it is used to construct the profile for template\n      search.\n    uniref90_z_value: The Z-value representing the database size in number of\n      sequences for E-value calculation. 
Must be set for sharded databases.\n    ntrna_database_path: NT-RNA database path, used for RNA MSA search.\n    ntrna_z_value: The Z-value representing the database size in megabases for\n      E-value calculation. Must be set for sharded databases.\n    rfam_database_path: Rfam database path, used for RNA MSA search.\n    rfam_z_value: The Z-value representing the database size in megabases for\n      E-value calculation. Must be set for sharded databases.\n    rna_central_database_path: RNAcentral database path, used for RNA MSA\n      search.\n    rna_central_z_value: The Z-value representing the database size in megabases\n      for E-value calculation. Must be set for sharded databases.\n    seqres_database_path: PDB sequence database path, used for template search.\n    pdb_database_path: PDB database directory with mmCIF files path, used for\n      template search.\n    jackhmmer_n_cpu: Number of CPUs to use for Jackhmmer.\n    jackhmmer_max_parallel_shards: Maximum number of shards to search against in\n      parallel. If None, one Jackhmmer instance will be run per shard. Only\n      applicable if the database is sharded.\n    nhmmer_n_cpu: Number of CPUs to use for Nhmmer.\n    nhmmer_max_parallel_shards: Maximum number of shards to search against in\n      parallel. If None, one Nhmmer instance will be run per shard. 
Only\n      applicable if the database is sharded.\n    max_template_date: The latest date of templates to use.\n  \"\"\"\n\n  # Binary paths.\n  jackhmmer_binary_path: str\n  nhmmer_binary_path: str\n  hmmalign_binary_path: str\n  hmmsearch_binary_path: str\n  hmmbuild_binary_path: str\n\n  # Jackhmmer databases.\n  small_bfd_database_path: str\n  small_bfd_z_value: int | None = None\n  mgnify_database_path: str\n  mgnify_z_value: int | None = None\n  uniprot_cluster_annot_database_path: str\n  uniprot_cluster_annot_z_value: int | None = None\n  uniref90_database_path: str\n  uniref90_z_value: int | None = None\n  # Nhmmer databases.\n  ntrna_database_path: str\n  ntrna_z_value: int | None = None\n  rfam_database_path: str\n  rfam_z_value: int | None = None\n  rna_central_database_path: str\n  rna_central_z_value: int | None = None\n  # Template search databases.\n  seqres_database_path: str\n  pdb_database_path: str\n\n  # Optional configuration for MSA tools.\n  jackhmmer_n_cpu: int = 8\n  jackhmmer_max_parallel_shards: int | None = None\n  nhmmer_n_cpu: int = 8\n  nhmmer_max_parallel_shards: int | None = None\n\n  max_template_date: datetime.date\n\n\nclass DataPipeline:\n  \"\"\"Runs the alignment tools and assembles the input features.\"\"\"\n\n  def __init__(self, data_pipeline_config: DataPipelineConfig):\n    \"\"\"Initializes the data pipeline with default configurations.\"\"\"\n    self._uniref90_msa_config = msa_config.RunConfig(\n        config=msa_config.JackhmmerConfig(\n            binary_path=data_pipeline_config.jackhmmer_binary_path,\n            database_config=msa_config.DatabaseConfig(\n                name='uniref90',\n                path=data_pipeline_config.uniref90_database_path,\n            ),\n            n_cpu=data_pipeline_config.jackhmmer_n_cpu,\n            n_iter=1,\n            e_value=1e-4,\n            z_value=data_pipeline_config.uniref90_z_value,\n            dom_z_value=data_pipeline_config.uniref90_z_value,\n            
max_sequences=10_000,\n            max_parallel_shards=data_pipeline_config.jackhmmer_max_parallel_shards,\n        ),\n        chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n        crop_size=None,\n    )\n    self._mgnify_msa_config = msa_config.RunConfig(\n        config=msa_config.JackhmmerConfig(\n            binary_path=data_pipeline_config.jackhmmer_binary_path,\n            database_config=msa_config.DatabaseConfig(\n                name='mgnify',\n                path=data_pipeline_config.mgnify_database_path,\n            ),\n            n_cpu=data_pipeline_config.jackhmmer_n_cpu,\n            n_iter=1,\n            e_value=1e-4,\n            z_value=data_pipeline_config.mgnify_z_value,\n            dom_z_value=data_pipeline_config.mgnify_z_value,\n            max_sequences=5_000,\n            max_parallel_shards=data_pipeline_config.jackhmmer_max_parallel_shards,\n        ),\n        chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n        crop_size=None,\n    )\n    self._small_bfd_msa_config = msa_config.RunConfig(\n        config=msa_config.JackhmmerConfig(\n            binary_path=data_pipeline_config.jackhmmer_binary_path,\n            database_config=msa_config.DatabaseConfig(\n                name='small_bfd',\n                path=data_pipeline_config.small_bfd_database_path,\n            ),\n            n_cpu=data_pipeline_config.jackhmmer_n_cpu,\n            n_iter=1,\n            e_value=1e-4,\n            # Set z_value=138_515_945 to match the z_value used in the paper.\n            # In practice, this has minimal impact on predicted structures.\n            z_value=data_pipeline_config.small_bfd_z_value,\n            dom_z_value=data_pipeline_config.small_bfd_z_value,\n            max_sequences=5_000,\n            max_parallel_shards=data_pipeline_config.jackhmmer_max_parallel_shards,\n        ),\n        chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n        crop_size=None,\n    )\n    self._uniprot_msa_config = msa_config.RunConfig(\n        
config=msa_config.JackhmmerConfig(\n            binary_path=data_pipeline_config.jackhmmer_binary_path,\n            database_config=msa_config.DatabaseConfig(\n                name='uniprot_cluster_annot',\n                path=data_pipeline_config.uniprot_cluster_annot_database_path,\n            ),\n            n_cpu=data_pipeline_config.jackhmmer_n_cpu,\n            n_iter=1,\n            e_value=1e-4,\n            z_value=data_pipeline_config.uniprot_cluster_annot_z_value,\n            dom_z_value=data_pipeline_config.uniprot_cluster_annot_z_value,\n            max_sequences=50_000,\n            max_parallel_shards=data_pipeline_config.jackhmmer_max_parallel_shards,\n        ),\n        chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n        crop_size=None,\n    )\n    self._nt_rna_msa_config = msa_config.RunConfig(\n        config=msa_config.NhmmerConfig(\n            binary_path=data_pipeline_config.nhmmer_binary_path,\n            hmmalign_binary_path=data_pipeline_config.hmmalign_binary_path,\n            hmmbuild_binary_path=data_pipeline_config.hmmbuild_binary_path,\n            database_config=msa_config.DatabaseConfig(\n                name='nt_rna',\n                path=data_pipeline_config.ntrna_database_path,\n            ),\n            n_cpu=data_pipeline_config.nhmmer_n_cpu,\n            e_value=1e-3,\n            alphabet='rna',\n            z_value=data_pipeline_config.ntrna_z_value,\n            max_sequences=10_000,\n            max_parallel_shards=data_pipeline_config.nhmmer_max_parallel_shards,\n        ),\n        chain_poly_type=mmcif_names.RNA_CHAIN,\n        crop_size=None,\n    )\n    self._rfam_msa_config = msa_config.RunConfig(\n        config=msa_config.NhmmerConfig(\n            binary_path=data_pipeline_config.nhmmer_binary_path,\n            hmmalign_binary_path=data_pipeline_config.hmmalign_binary_path,\n            hmmbuild_binary_path=data_pipeline_config.hmmbuild_binary_path,\n            
database_config=msa_config.DatabaseConfig(\n                name='rfam_rna',\n                path=data_pipeline_config.rfam_database_path,\n            ),\n            n_cpu=data_pipeline_config.nhmmer_n_cpu,\n            e_value=1e-3,\n            alphabet='rna',\n            z_value=data_pipeline_config.rfam_z_value,\n            max_sequences=10_000,\n            max_parallel_shards=data_pipeline_config.nhmmer_max_parallel_shards,\n        ),\n        chain_poly_type=mmcif_names.RNA_CHAIN,\n        crop_size=None,\n    )\n    self._rnacentral_msa_config = msa_config.RunConfig(\n        config=msa_config.NhmmerConfig(\n            binary_path=data_pipeline_config.nhmmer_binary_path,\n            hmmalign_binary_path=data_pipeline_config.hmmalign_binary_path,\n            hmmbuild_binary_path=data_pipeline_config.hmmbuild_binary_path,\n            database_config=msa_config.DatabaseConfig(\n                name='rna_central_rna',\n                path=data_pipeline_config.rna_central_database_path,\n            ),\n            n_cpu=data_pipeline_config.nhmmer_n_cpu,\n            e_value=1e-3,\n            alphabet='rna',\n            z_value=data_pipeline_config.rna_central_z_value,\n            max_sequences=10_000,\n            max_parallel_shards=data_pipeline_config.nhmmer_max_parallel_shards,\n        ),\n        chain_poly_type=mmcif_names.RNA_CHAIN,\n        crop_size=None,\n    )\n\n    self._templates_config = msa_config.TemplatesConfig(\n        template_tool_config=msa_config.TemplateToolConfig(\n            database_path=data_pipeline_config.seqres_database_path,\n            chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n            hmmsearch_config=msa_config.HmmsearchConfig(\n                hmmsearch_binary_path=data_pipeline_config.hmmsearch_binary_path,\n                hmmbuild_binary_path=data_pipeline_config.hmmbuild_binary_path,\n                filter_f1=0.1,\n                filter_f2=0.1,\n                filter_f3=0.1,\n                
e_value=100,\n                inc_e=100,\n                dom_e=100,\n                incdom_e=100,\n                alphabet='amino',\n            ),\n        ),\n        filter_config=msa_config.TemplateFilterConfig(\n            max_subsequence_ratio=0.95,\n            min_align_ratio=0.1,\n            min_hit_length=10,\n            deduplicate_sequences=True,\n            max_hits=4,\n            max_template_date=data_pipeline_config.max_template_date,\n        ),\n    )\n    self._pdb_database_path = data_pipeline_config.pdb_database_path\n\n  def process_protein_chain(\n      self, chain: folding_input.ProteinChain\n  ) -> folding_input.ProteinChain:\n    \"\"\"Processes a single protein chain.\"\"\"\n    has_unpaired_msa = chain.unpaired_msa is not None\n    has_paired_msa = chain.paired_msa is not None\n    has_templates = chain.templates is not None\n\n    if not has_unpaired_msa and not has_paired_msa and not chain.templates:\n      # MSA None - search. Templates either [] - don't search, or None - search.\n      unpaired_msa, paired_msa, template_hits = _get_protein_msa_and_templates(\n          sequence=chain.sequence,\n          run_template_search=not has_templates,  # Skip template search if [].\n          uniref90_msa_config=self._uniref90_msa_config,\n          mgnify_msa_config=self._mgnify_msa_config,\n          small_bfd_msa_config=self._small_bfd_msa_config,\n          uniprot_msa_config=self._uniprot_msa_config,\n          templates_config=self._templates_config,\n          pdb_database_path=self._pdb_database_path,\n      )\n      unpaired_msa = unpaired_msa.to_a3m()\n      paired_msa = paired_msa.to_a3m()\n      templates = [\n          folding_input.Template(\n              mmcif=struc.to_mmcif(),\n              query_to_template_map=hit.query_to_hit_mapping,\n          )\n          for hit, struc in template_hits.get_hits_with_structures()\n      ]\n    elif has_unpaired_msa and has_paired_msa and not has_templates:\n      # Has MSA, but 
doesn't have templates. Search for templates only.\n      empty_msa = msa.Msa.from_empty(\n          query_sequence=chain.sequence,\n          chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n      ).to_a3m()\n      unpaired_msa = chain.unpaired_msa or empty_msa\n      paired_msa = chain.paired_msa or empty_msa\n      template_hits = _get_protein_templates(\n          sequence=chain.sequence,\n          input_msa_a3m=unpaired_msa,\n          run_template_search=True,\n          templates_config=self._templates_config,\n          pdb_database_path=self._pdb_database_path,\n      )\n      templates = [\n          folding_input.Template(\n              mmcif=struc.to_mmcif(),\n              query_to_template_map=hit.query_to_hit_mapping,\n          )\n          for hit, struc in template_hits.get_hits_with_structures()\n      ]\n    else:\n      # Has MSA and templates, don't search for anything.\n      if not has_unpaired_msa or not has_paired_msa or not has_templates:\n        raise ValueError(\n            f'Protein chain {chain.id} has unpaired MSA, paired MSA, or'\n            ' templates set only partially. If you want to run the pipeline'\n            ' with custom MSA/templates, you need to set all of them. 
You can'\n            ' set MSA to empty string and templates to empty list to signify'\n            ' that they should not be used and searched for.'\n        )\n      logging.info(\n          'Skipping MSA and template search for protein chain %s because it '\n          'already has MSAs and templates.',\n          chain.id,\n      )\n      if not chain.unpaired_msa:\n        logging.info('Using empty unpaired MSA for protein chain %s', chain.id)\n      if not chain.paired_msa:\n        logging.info('Using empty paired MSA for protein chain %s', chain.id)\n      if not chain.templates:\n        logging.info('Using no templates for protein chain %s', chain.id)\n      empty_msa = msa.Msa.from_empty(\n          query_sequence=chain.sequence,\n          chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n      ).to_a3m()\n      unpaired_msa = chain.unpaired_msa or empty_msa\n      paired_msa = chain.paired_msa or empty_msa\n      templates = chain.templates\n\n    return folding_input.ProteinChain(\n        id=chain.id,\n        sequence=chain.sequence,\n        ptms=chain.ptms,\n        unpaired_msa=unpaired_msa,\n        paired_msa=paired_msa,\n        templates=templates,\n    )\n\n  def process_rna_chain(\n      self, chain: folding_input.RnaChain\n  ) -> folding_input.RnaChain:\n    \"\"\"Processes a single RNA chain.\"\"\"\n    if chain.unpaired_msa is not None:\n      # Don't run MSA tools if the chain already has an MSA.\n      logging.info(\n          'Skipping MSA search for RNA chain %s because it already has MSA.',\n          chain.id,\n      )\n      if not chain.unpaired_msa:\n        logging.info('Using empty unpaired MSA for RNA chain %s', chain.id)\n      empty_msa = msa.Msa.from_empty(\n          query_sequence=chain.sequence, chain_poly_type=mmcif_names.RNA_CHAIN\n      ).to_a3m()\n      unpaired_msa = chain.unpaired_msa or empty_msa\n    else:\n      unpaired_msa = _get_rna_msa(\n          sequence=chain.sequence,\n          
nt_rna_msa_config=self._nt_rna_msa_config,\n          rfam_msa_config=self._rfam_msa_config,\n          rnacentral_msa_config=self._rnacentral_msa_config,\n      ).to_a3m()\n    return folding_input.RnaChain(\n        id=chain.id,\n        sequence=chain.sequence,\n        modifications=chain.modifications,\n        unpaired_msa=unpaired_msa,\n    )\n\n  def process(self, fold_input: folding_input.Input) -> folding_input.Input:\n    \"\"\"Runs MSA and template tools and returns a new Input with the results.\"\"\"\n    processed_chains = []\n    for chain in fold_input.chains:\n      print(f'Running data pipeline for chain {chain.id}...')\n      process_chain_start_time = time.time()\n      match chain:\n        case folding_input.ProteinChain():\n          processed_chains.append(self.process_protein_chain(chain))\n        case folding_input.RnaChain():\n          processed_chains.append(self.process_rna_chain(chain))\n        case _:\n          processed_chains.append(chain)\n      print(\n          f'Running data pipeline for chain {chain.id} took'\n          f' {time.time() - process_chain_start_time:.2f} seconds',\n      )\n\n    return dataclasses.replace(fold_input, chains=processed_chains)\n"
  },
  {
    "path": "src/alphafold3/data/structure_stores.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Library for loading structure data from various sources.\"\"\"\n\nfrom collections.abc import Mapping, Sequence\nimport functools\nimport os\nimport pathlib\nimport tarfile\n\n\nclass NotFoundError(KeyError):\n  \"\"\"Raised when the structure store doesn't contain the requested target.\"\"\"\n\n\nclass StructureStore:\n  \"\"\"Handles the retrieval of mmCIF files from a filesystem.\"\"\"\n\n  def __init__(\n      self,\n      structures: str | os.PathLike[str] | Mapping[str, str],\n  ):\n    \"\"\"Initialises the instance.\n\n    Args:\n      structures: Path of the directory where the mmCIF files are or a Mapping\n        from target name to mmCIF string.\n    \"\"\"\n    if isinstance(structures, Mapping):\n      self._structure_mapping = structures\n      self._structure_path = None\n      self._structure_tar = None\n    else:\n      self._structure_mapping = None\n      path_str = os.fspath(structures)\n      if path_str.endswith('.tar'):\n        self._structure_tar = tarfile.open(path_str, 'r')\n        self._structure_path = None\n      else:\n        self._structure_path = pathlib.Path(structures)\n        self._structure_tar = None\n\n  @functools.cached_property\n  def _tar_members(self) -> Mapping[str, tarfile.TarInfo]:\n    assert self._structure_tar is not None\n    return {\n        path.stem: tarinfo\n        for tarinfo in self._structure_tar.getmembers()\n        if tarinfo.isfile()\n        and (path 
:= pathlib.Path(tarinfo.path.lower())).suffix == '.cif'\n    }\n\n  def get_mmcif_str(self, target_name: str) -> str:\n    \"\"\"Returns an mmCIF for a given `target_name`.\n\n    Args:\n      target_name: Name specifying the target mmCIF.\n\n    Raises:\n      NotFoundError: If the target is not found.\n    \"\"\"\n    if self._structure_mapping is not None:\n      try:\n        return self._structure_mapping[target_name]\n      except KeyError as e:\n        raise NotFoundError(f'{target_name=} not found') from e\n\n    if self._structure_tar is not None:\n      try:\n        member = self._tar_members[target_name]\n        if struct_file := self._structure_tar.extractfile(member):\n          return struct_file.read().decode()\n        else:\n          raise NotFoundError(f'{target_name=} not found')\n      except KeyError:\n        raise NotFoundError(f'{target_name=} not found') from None\n\n    filepath = self._structure_path / f'{target_name}.cif'\n    try:\n      return filepath.read_text()\n    except FileNotFoundError as e:\n      raise NotFoundError(f'{target_name=} not found at {filepath=}') from e\n\n  def target_names(self) -> Sequence[str]:\n    \"\"\"Returns all targets in the store.\"\"\"\n    if self._structure_mapping is not None:\n      return [*self._structure_mapping.keys()]\n    elif self._structure_tar is not None:\n      return sorted(self._tar_members.keys())\n    elif self._structure_path is not None:\n      return sorted([path.stem for path in self._structure_path.glob('*.cif')])\n    return ()\n"
  },
  {
    "path": "src/alphafold3/data/template_realign.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Realign sequences found in PDB seqres to the actual CIF sequences.\"\"\"\n\nfrom collections.abc import Mapping\n\n\nclass AlignmentError(Exception):\n  \"\"\"Failed alignment between the hit sequence and the actual mmCIF sequence.\"\"\"\n\n\ndef realign_hit_to_structure(\n    *,\n    hit_sequence: str,\n    hit_start_index: int,\n    hit_end_index: int,\n    full_length: int,\n    structure_sequence: str,\n    query_to_hit_mapping: Mapping[int, int],\n) -> Mapping[int, int]:\n  \"\"\"Realigns the hit sequence to the Structure sequence.\n\n  For example, for the given input:\n    query_sequence : ABCDEFGHIJKL\n    hit_sequence   : ---DEFGHIJK-\n    struc_sequence : XDEFGHKL\n  the mapping is {3: 0, 4: 1, 5: 2, 6: 3, 7: 4, 8: 5, 9: 6, 10: 7}. However, the\n  actual Structure sequence has an extra X at the start as well as no IJ. So the\n  alignment from the query to the Structure sequence will be:\n    hit_sequence   : ---DEFGHIJK-\n    struc_aligned  : --XDEFGH--KL\n  and the new mapping will therefore be: {3: 1, 4: 2, 5: 3, 6: 4, 7: 5, 10: 6}.\n\n  Args:\n    hit_sequence: The PDB seqres hit sequence obtained from Hmmsearch, but\n      without any gaps. 
This is not the full PDB seqres template sequence but\n      rather just its subsequence from hit_start_index to hit_end_index.\n    hit_start_index: The start index of the hit sequence in the full PDB seqres\n      template sequence (inclusive).\n    hit_end_index: The end index of the hit sequence in the full PDB seqres\n      template sequence (exclusive).\n    full_length: The length of the full PDB seqres template sequence.\n    structure_sequence: The actual sequence extracted from the Structure\n      corresponding to this template. In vast majority of cases this is the same\n      as the PDB seqres sequence, but this function handles the cases when not.\n    query_to_hit_mapping: The mapping from the query sequence to the\n      hit_sequence.\n\n  Raises:\n    AlignmentError: if the alignment between the sequence returned by Hmmsearch\n      differs from the actual sequence found in the mmCIF and can't be aligned\n      using the simple alignment algorithm.\n\n  Returns:\n    A mapping from the query sequence to the actual Structure sequence.\n  \"\"\"\n  max_num_gaps = full_length - len(structure_sequence)\n  if max_num_gaps < 0:\n    raise AlignmentError(\n        f'The Structure sequence ({len(structure_sequence)}) '\n        f'must be shorter than the PDB seqres sequence ({full_length}):\\n'\n        f'Structure sequence : {structure_sequence}\\n'\n        f'PDB seqres sequence: {hit_sequence}'\n    )\n\n  if len(hit_sequence) != hit_end_index - hit_start_index:\n    raise AlignmentError(\n        f'The difference of {hit_end_index=} and {hit_start_index=} does not '\n        f'equal to the length of the {hit_sequence}: {len(hit_sequence)}'\n    )\n\n  best_score = -1\n  best_start = 0\n  best_query_to_hit_mapping = query_to_hit_mapping\n  max_num_gaps_before_subseq = min(hit_start_index, max_num_gaps)\n  # It is possible the gaps needed to align the PDB seqres subsequence and\n  # the Structure subsequence need to be inserted before the match region.\n 
 # Try and pick the alignment with the best number of aligned residues.\n  for num_gaps_before_subseq in range(0, max_num_gaps_before_subseq + 1):\n    start = hit_start_index - num_gaps_before_subseq\n    end = hit_end_index - num_gaps_before_subseq\n    structure_subseq = structure_sequence[start:end]\n\n    new_query_to_hit_mapping, score = _remap_to_struc_seq(\n        hit_seq=hit_sequence,\n        struc_seq=structure_subseq,\n        max_num_gaps=max_num_gaps - num_gaps_before_subseq,\n        mapping=query_to_hit_mapping,\n    )\n    if score >= best_score:\n      # Use >= to prefer matches with larger number of gaps before.\n      best_score = score\n      best_start = start\n      best_query_to_hit_mapping = new_query_to_hit_mapping\n\n  return {q: h + best_start for q, h in best_query_to_hit_mapping.items()}\n\n\ndef _remap_to_struc_seq(\n    *,\n    hit_seq: str,\n    struc_seq: str,\n    max_num_gaps: int,\n    mapping: Mapping[int, int],\n) -> tuple[Mapping[int, int], int]:\n  \"\"\"Remaps the query -> hit mapping to match the actual Structure sequence.\n\n  Args:\n    hit_seq: The hit sequence - a subsequence of the PDB seqres sequence without\n      any Hmmsearch modifications like inserted gaps or lowercased residues.\n    struc_seq: The actual sequence obtained from the corresponding Structure.\n    max_num_gaps: The maximum number of gaps that can be inserted in the\n      Structure sequence. In practice, this is the length difference between the\n      PDB seqres sequence and the actual Structure sequence.\n    mapping: The mapping from the query residues to the hit residues. 
This will\n      be remapped to point to the actual Structure sequence using a simple\n      realignment algorithm.\n\n  Returns:\n    A tuple of (mapping, score):\n      * Mapping from the query to the actual Structure sequence.\n      * Score which is the number of matching aligned residues.\n\n  Raises:\n    ValueError if the structure sequence isn't shorter than the seqres sequence.\n    ValueError if the alignment fails.\n  \"\"\"\n  hit_seq_idx = 0\n  struc_seq_idx = 0\n  hit_to_struc_seq_mapping = {}\n  score = 0\n\n  # This while loop is guaranteed to terminate since we increase both\n  # struc_seq_idx and hit_seq_idx by at least 1 in each iteration.\n  remaining_num_gaps = max_num_gaps\n  while hit_seq_idx < len(hit_seq) and struc_seq_idx < len(struc_seq):\n    if hit_seq[hit_seq_idx] != struc_seq[struc_seq_idx]:\n      # Explore which alignment aligns the next residue (if present).\n      best_shift = 0\n      for shift in range(0, remaining_num_gaps + 1):\n        next_hit_res = hit_seq[hit_seq_idx + shift : hit_seq_idx + shift + 1]\n        next_struc_res = struc_seq[struc_seq_idx : struc_seq_idx + 1]\n        if next_hit_res == next_struc_res:\n          best_shift = shift\n          break\n      hit_seq_idx += best_shift\n      remaining_num_gaps -= best_shift\n\n    hit_to_struc_seq_mapping[hit_seq_idx] = struc_seq_idx\n    score += hit_seq[hit_seq_idx] == struc_seq[struc_seq_idx]\n    hit_seq_idx += 1\n    struc_seq_idx += 1\n\n  fixed_mapping = {}\n  for query_idx, original_hit_idx in mapping.items():\n    fixed_hit_idx = hit_to_struc_seq_mapping.get(original_hit_idx)\n    if fixed_hit_idx is not None:\n      fixed_mapping[query_idx] = fixed_hit_idx\n\n  return fixed_mapping, score\n"
  },
  {
    "path": "src/alphafold3/data/templates.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"API for retrieving and manipulating template search results.\"\"\"\n\nfrom collections.abc import Iterable, Iterator, Mapping, Sequence\nimport dataclasses\nimport datetime\nimport functools\nimport os\nimport re\nfrom typing import Any, Final, Self, TypeAlias\n\nfrom absl import logging\nfrom alphafold3 import structure\nfrom alphafold3.common import resources\nfrom alphafold3.constants import atom_types\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.constants import residue_names\nfrom alphafold3.data import msa_config\nfrom alphafold3.data import parsers\nfrom alphafold3.data import structure_stores\nfrom alphafold3.data import template_realign\nfrom alphafold3.data.tools import hmmsearch\nfrom alphafold3.structure import mmcif\nimport numpy as np\n\n\n_POLYMER_FEATURES: Final[Mapping[str, np.float64 | np.int32 | object]] = {\n    'template_aatype': np.int32,\n    'template_all_atom_masks': np.float64,\n    'template_all_atom_positions': np.float64,\n    'template_domain_names': object,\n    'template_release_date': object,\n    'template_sequence': object,\n}\n\n_LIGAND_FEATURES: Final[Mapping[str, Any]] = {\n    'ligand_features': Mapping[str, Any]\n}\n\n\nTemplateFeatures: TypeAlias = Mapping[\n    str, np.ndarray | bytes | Mapping[str, np.ndarray | bytes]\n]\n_REQUIRED_METADATA_COLUMNS: Final[Sequence[str]] = (\n    'seq_release_date',\n    'seq_unresolved_res_num',\n    'seq_author_chain_id',\n  
  'seq_sequence',\n)\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True, slots=True)\nclass _Polymer:\n  \"\"\"Container for alphabet specific (dna, rna, protein) atom information.\"\"\"\n\n  min_atoms: int\n  num_atom_types: int\n  atom_order: Mapping[str, int]\n\n\n_POLYMERS = {\n    mmcif_names.PROTEIN_CHAIN: _Polymer(\n        min_atoms=5,\n        num_atom_types=atom_types.ATOM37_NUM,\n        atom_order=atom_types.ATOM37_ORDER,\n    ),\n    mmcif_names.DNA_CHAIN: _Polymer(\n        min_atoms=21,\n        num_atom_types=atom_types.ATOM29_NUM,\n        atom_order=atom_types.ATOM29_ORDER,\n    ),\n    mmcif_names.RNA_CHAIN: _Polymer(\n        min_atoms=20,\n        num_atom_types=atom_types.ATOM29_NUM,\n        atom_order=atom_types.ATOM29_ORDER,\n    ),\n}\n\n\ndef _encode_restype(\n    chain_poly_type: str,\n    sequence: str,\n) -> Sequence[int]:\n  \"\"\"Encodes a sequence of residue names as a sequence of ints.\n\n  Args:\n    chain_poly_type: Polymer chain type to determine sequence encoding.\n    sequence: Polymer residues. Protein encoded by single letters. 
RNA and DNA\n      encoded by  multi-letter CCD codes.\n\n  Returns:\n    A sequence of integers encoding amino acid types for the given chain type.\n  \"\"\"\n  if chain_poly_type == mmcif_names.PROTEIN_CHAIN:\n    return [\n        residue_names.PROTEIN_TYPES_ONE_LETTER_WITH_UNKNOWN_AND_GAP_TO_INT[\n            _STANDARDIZED_AA.get(res, res)\n        ]\n        for res in sequence\n    ]\n\n  unk_nucleic = residue_names.UNK_NUCLEIC_ONE_LETTER\n  unk_nucleic_idx = residue_names.POLYMER_TYPES_ORDER_WITH_UNKNOWN_AND_GAP[\n      unk_nucleic\n  ]\n  if chain_poly_type == mmcif_names.RNA_CHAIN:\n    return [\n        residue_names.POLYMER_TYPES_ORDER_WITH_UNKNOWN_AND_GAP.get(\n            res, unk_nucleic_idx\n        )\n        for res in sequence\n    ]\n  elif chain_poly_type == mmcif_names.DNA_CHAIN:\n    # Map UNK DNA to the generic nucleic UNK (N), which happens to also be the\n    # same as the RNA UNK.\n    return [\n        residue_names.POLYMER_TYPES_ORDER_WITH_UNKNOWN_AND_GAP.get(\n            residue_names.DNA_COMMON_ONE_TO_TWO.get(res, unk_nucleic),\n            unk_nucleic_idx,\n        )\n        for res in sequence\n    ]\n\n  raise NotImplementedError(f'\"{chain_poly_type}\" unsupported.')\n\n\n_DAYS_BEFORE_QUERY_DATE: Final[int] = 60\n_HIT_DESCRIPTION_REGEX = re.compile(\n    r'(?P<pdb_id>[a-z0-9]{4,})_(?P<chain_id>\\w+)/(?P<start>\\d+)-(?P<end>\\d+) '\n    r'.* length:(?P<length>\\d+)\\b.*'\n)\n\n_STANDARDIZED_AA = {'B': 'D', 'J': 'X', 'O': 'X', 'U': 'C', 'Z': 'E'}\n\n\nclass Error(Exception):\n  \"\"\"Base class for exceptions.\"\"\"\n\n\nclass HitDateError(Error):\n  \"\"\"An error indicating that invalid release date was detected.\"\"\"\n\n\nclass InvalidTemplateError(Error):\n  \"\"\"An error indicating that template is invalid.\"\"\"\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True)\nclass Hit:\n  \"\"\"Template hit metrics derived from the MSA for filtering and featurising.\n\n  Attributes:\n    pdb_id: The PDB ID of the hit.\n    
auth_chain_id: The author chain ID of the hit.\n    hmmsearch_sequence: Hit sequence as given in hmmsearch a3m output.\n    structure_sequence: Hit sequence as given in PDB structure.\n    unresolved_res_indices: Indices of unresolved residues in the structure\n      sequence. 0-based.\n    query_sequence: The query nucleotide/amino acid sequence.\n    start_index: The start index of the sequence relative to the full PDB seqres\n      sequence. Inclusive and uses 0-based indexing.\n    end_index: The end index of the sequence relative to the full PDB seqres\n      sequence. Exclusive and uses 0-based indexing.\n    full_length: Length of the full PDB seqres sequence. This can be different\n      from the length from the actual sequence we get from the mmCIF and we use\n      this to detect whether we need to realign or not.\n    release_date: The release date of the PDB corresponding to this hit.\n    chain_poly_type: The polymer type of the selected hit structure.\n  \"\"\"\n\n  pdb_id: str\n  auth_chain_id: str\n  hmmsearch_sequence: str\n  structure_sequence: str\n  unresolved_res_indices: Sequence[int] | None\n  query_sequence: str\n  start_index: int\n  end_index: int\n  full_length: int\n  release_date: datetime.date\n  chain_poly_type: str\n\n  @functools.cached_property\n  def query_to_hit_mapping(self) -> Mapping[int, int]:\n    \"\"\"0-based query index to hit index mapping.\"\"\"\n    query_to_hit_mapping = {}\n    hit_index = 0\n    query_index = 0\n    for residue in self.hmmsearch_sequence:\n      # Gap inserted in the template\n      if residue == '-':\n        query_index += 1\n      # Deleted residue in the template (would be a gap in the query).\n      elif residue.islower():\n        hit_index += 1\n      # Normal aligned residue, in both query and template. 
Add to mapping.\n      elif residue.isupper():\n        query_to_hit_mapping[query_index] = hit_index\n        query_index += 1\n        hit_index += 1\n\n    structure_subseq = self.structure_sequence[\n        self.start_index : self.end_index\n    ]\n    if self.matching_sequence != structure_subseq:\n      # The seqres sequence doesn't match the structure sequence. Two cases:\n      # 1. The sequences have the same length. The sequences are different\n      #    because our 3->1 residue code mapping is different from the one PDB\n      #    uses. We don't do anything in this case as both sequences have the\n      #    same length, so the original query to hit mapping stays valid.\n      # 2. The sequences don't have the same length, the one in structure is\n      #    shorter. In this case we change the mapping to match the actual\n      #    structure sequence using a simple realignment algorithm.\n      # This procedure was validated on all PDB seqres (2023_01_12) sequences\n      # and handles all cases that can happen.\n      if self.full_length != len(self.structure_sequence):\n        return template_realign.realign_hit_to_structure(\n            hit_sequence=self.matching_sequence,\n            hit_start_index=self.start_index,\n            hit_end_index=self.end_index,\n            full_length=self.full_length,\n            structure_sequence=self.structure_sequence,\n            query_to_hit_mapping=query_to_hit_mapping,\n        )\n\n    # Hmmsearch returns a subsequence and so far indices have been relative to\n    # the subsequence. 
Add an offset to index relative to the full structure\n    # sequence.\n    return {q: h + self.start_index for q, h in query_to_hit_mapping.items()}\n\n  @property\n  def matching_sequence(self) -> str:\n    \"\"\"Returns the matching hit sequence including insertions.\n\n    Make deleted residues uppercase and remove gaps (\"-\").\n    \"\"\"\n    return self.hmmsearch_sequence.upper().replace('-', '')\n\n  @functools.cached_property\n  def output_templates_sequence(self) -> str:\n    \"\"\"Returns the final template sequence.\"\"\"\n    result_seq = ['-'] * len(self.query_sequence)\n    for query_index, template_index in self.query_to_hit_mapping.items():\n      result_seq[query_index] = self.structure_sequence[template_index]\n    return ''.join(result_seq)\n\n  @property\n  def length_ratio(self) -> float:\n    \"\"\"Ratio of the length of the hit sequence to the query.\"\"\"\n    return len(self.matching_sequence) / len(self.query_sequence)\n\n  @property\n  def align_ratio(self) -> float:\n    \"\"\"Ratio of the number of aligned residues to the query length.\"\"\"\n    return len(self.query_to_hit_mapping) / len(self.query_sequence)\n\n  @functools.cached_property\n  def is_valid(self) -> bool:\n    \"\"\"Whether hit can be used as a template.\"\"\"\n    if self.unresolved_res_indices is None:\n      return False\n\n    return bool(\n        set(self.query_to_hit_mapping.values())\n        - set(self.unresolved_res_indices)\n    )\n\n  @property\n  def full_name(self) -> str:\n    \"\"\"A full name of the hit.\"\"\"\n    return f'{self.pdb_id}_{self.auth_chain_id}'\n\n  def __post_init__(self):\n    if not self.pdb_id.islower() and not self.pdb_id.isdigit():\n      raise ValueError(f'pdb_id must be lowercase {self.pdb_id}')\n\n    if not (0 <= self.start_index <= self.end_index):\n      raise ValueError(\n          'Start must be non-negative and less than or equal to end index. 
'\n          f'Range: {self.start_index}-{self.end_index}'\n      )\n\n    if len(self.matching_sequence) != (self.end_index - self.start_index):\n      raise ValueError(\n          'Sequence length must be equal to end_index - start_index. '\n          f'{len(self.matching_sequence)} != {self.end_index} - '\n          f'{self.start_index}'\n      )\n\n    if self.full_length < 0:\n      raise ValueError(f'Full length must be non-negative: {self.full_length}')\n\n  def keep(\n      self,\n      *,\n      release_date_cutoff: datetime.date | None,\n      max_subsequence_ratio: float | None,\n      min_hit_length: int | None,\n      min_align_ratio: float | None,\n  ) -> bool:\n    \"\"\"Returns whether the hit should be kept.\n\n    In addition to filtering on all of the provided parameters, this method also\n    excludes hits with unresolved residues.\n\n    Args:\n      release_date_cutoff: Maximum release date of the template.\n      max_subsequence_ratio: If set, excludes hits which are an exact\n        subsequence of the query sequence, and longer than this ratio. 
Useful to\n        avoid ground truth leakage.\n      min_hit_length: If set, excludes hits which have fewer residues than this.\n      min_align_ratio: If set, excludes hits where the number of residues\n        aligned to the query is less than this proportion of the template\n        length.\n    \"\"\"\n    # Exclude hits which are too recent.\n    if (\n        release_date_cutoff is not None\n        and self.release_date > release_date_cutoff\n    ):\n      return False\n\n    # Exclude hits which are large duplicates of the query_sequence.\n    if (\n        max_subsequence_ratio is not None\n        and self.length_ratio > max_subsequence_ratio\n    ):\n      if self.matching_sequence in self.query_sequence:\n        return False\n\n    # Exclude hits which are too short.\n    if (\n        min_hit_length is not None\n        and len(self.matching_sequence) < min_hit_length\n    ):\n      return False\n\n    # Exclude hits with unresolved residues.\n    if not self.is_valid:\n      return False\n\n    # Exclude hits with too few alignments.\n    try:\n      if min_align_ratio is not None and self.align_ratio <= min_align_ratio:\n        return False\n    except template_realign.AlignmentError as e:\n      logging.warning('Failed to align %s: %s', self, str(e))\n      return False\n\n    return True\n\n\ndef _filter_hits(\n    hits: Iterable[Hit],\n    release_date_cutoff: datetime.date,\n    max_subsequence_ratio: float | None,\n    min_align_ratio: float | None,\n    min_hit_length: int | None,\n    deduplicate_sequences: bool,\n    max_hits: int | None,\n) -> Sequence[Hit]:\n  \"\"\"Filters hits based on the filter config.\"\"\"\n  filtered_hits = []\n  seen_before = set()\n  for hit in hits:\n    if not hit.keep(\n        max_subsequence_ratio=max_subsequence_ratio,\n        min_align_ratio=min_align_ratio,\n        min_hit_length=min_hit_length,\n        release_date_cutoff=release_date_cutoff,\n    ):\n      continue\n\n    # Remove duplicate 
templates, keeping the first.\n    if deduplicate_sequences:\n      if hit.output_templates_sequence in seen_before:\n        continue\n      seen_before.add(hit.output_templates_sequence)\n\n    filtered_hits.append(hit)\n    if max_hits and len(filtered_hits) == max_hits:\n      break\n\n  return filtered_hits\n\n\n@dataclasses.dataclass(init=False)\nclass Templates:\n  \"\"\"A container for templates that were found for the given query sequence.\n\n  The structure_store is constructed from the config by default. Callers can\n  optionally supply a structure_store to the constructor to avoid the cost of\n  construction and metadata loading.\n  \"\"\"\n\n  def __init__(\n      self,\n      *,\n      query_sequence: str,\n      hits: Sequence[Hit],\n      max_template_date: datetime.date,\n      structure_store: structure_stores.StructureStore,\n      query_release_date: datetime.date | None = None,\n  ):\n    self._query_sequence = query_sequence\n    self._hits = tuple(hits)\n    self._max_template_date = max_template_date\n    self._query_release_date = query_release_date\n    self._hit_structures = {}\n    self._structure_store = structure_store\n\n    if any(h.query_sequence != self._query_sequence for h in self.hits):\n      raise ValueError('All hits must match the query sequence.')\n\n    if self._hits:\n      chain_poly_type = self._hits[0].chain_poly_type\n      if any(h.chain_poly_type != chain_poly_type for h in self.hits):\n        raise ValueError('All hits must have the same chain_poly_type.')\n\n  @classmethod\n  def from_seq_and_a3m(\n      cls,\n      *,\n      query_sequence: str,\n      msa_a3m: str,\n      max_template_date: datetime.date,\n      database_path: os.PathLike[str] | str,\n      hmmsearch_config: msa_config.HmmsearchConfig,\n      max_a3m_query_sequences: int | None,\n      structure_store: structure_stores.StructureStore,\n      filter_config: msa_config.TemplateFilterConfig | None = None,\n      query_release_date: datetime.date | 
None = None,\n      chain_poly_type: str = mmcif_names.PROTEIN_CHAIN,\n  ) -> Self:\n    \"\"\"Creates templates from a run of hmmsearch tool against a custom a3m.\n\n    Args:\n      query_sequence: The polymer sequence of the target query.\n      msa_a3m: An a3m of related polymers aligned to the query sequence, this is\n        used to create an HMM for the hmmsearch run.\n      max_template_date: This is used to filter templates for training, ensuring\n        that they do not leak ground truth information used in testing sets.\n      database_path: A path to the sequence database to search for templates.\n      hmmsearch_config: Config with Hmmsearch settings.\n      max_a3m_query_sequences: The maximum number of input MSA sequences to use\n        to construct the profile which is then used to search for templates.\n      structure_store: Structure store to fetch template structures from.\n      filter_config: Optional config that controls which and how many hits to\n        keep. More performant than constructing and then filtering. 
If not\n        provided, no filtering is done.\n      query_release_date: The release_date of the template query, this is used\n        to filter templates for training, ensuring that they do not leak\n        structure information from the future.\n      chain_poly_type: The polymer type of the templates.\n\n    Returns:\n      Templates object containing a list of Hits initialised from the\n      structure_store metadata and a3m alignments.\n    \"\"\"\n    hmmsearch_a3m = run_hmmsearch_with_a3m(\n        database_path=database_path,\n        hmmsearch_config=hmmsearch_config,\n        max_a3m_query_sequences=max_a3m_query_sequences,\n        a3m=msa_a3m,\n    )\n    return cls.from_hmmsearch_a3m(\n        query_sequence=query_sequence,\n        a3m=hmmsearch_a3m,\n        max_template_date=max_template_date,\n        query_release_date=query_release_date,\n        chain_poly_type=chain_poly_type,\n        structure_store=structure_store,\n        filter_config=filter_config,\n    )\n\n  @classmethod\n  def from_hmmsearch_a3m(\n      cls,\n      *,\n      query_sequence: str,\n      a3m: str,\n      max_template_date: datetime.date,\n      structure_store: structure_stores.StructureStore,\n      filter_config: msa_config.TemplateFilterConfig | None = None,\n      query_release_date: datetime.date | None = None,\n      chain_poly_type: str = mmcif_names.PROTEIN_CHAIN,\n  ) -> Self:\n    \"\"\"Creates Templates from a Hmmsearch A3M.\n\n    Args:\n      query_sequence: The polymer sequence of the target query.\n      a3m: Results of Hmmsearch in A3M format. This provides a list of potential\n        template alignments and pdb codes.\n      max_template_date: This is used to filter templates for training, ensuring\n        that they do not leak ground truth information used in testing sets.\n      structure_store: Structure store to fetch template structures from.\n      filter_config: Optional config that controls which and how many hits to\n        keep. 
More performant than constructing and then filtering. If not\n        provided, no filtering is done.\n      query_release_date: The release_date of the template query, this is used\n        to filter templates for training, ensuring that they do not leak\n        structure information from the future.\n      chain_poly_type: The polymer type of the templates.\n\n    Returns:\n      Templates object containing a list of Hits initialised from the\n      structure_store metadata and a3m alignments.\n    \"\"\"\n\n    def hit_generator(a3m: str):\n      if not a3m:\n        return  # Hmmsearch could return an empty string if there are no hits.\n\n      for hit_seq, hit_desc in parsers.lazy_parse_fasta_string(a3m):\n        pdb_id, auth_chain_id, start, end, full_length = _parse_hit_description(\n            hit_desc\n        )\n\n        release_date, sequence, unresolved_res_ids = _parse_hit_metadata(\n            structure_store, pdb_id, auth_chain_id\n        )\n        if unresolved_res_ids is None:\n          continue\n\n        # seq_unresolved_res_num are 1-based, setting to 0-based indices.\n        unresolved_indices = [i - 1 for i in unresolved_res_ids]\n\n        yield Hit(\n            pdb_id=pdb_id,\n            auth_chain_id=auth_chain_id,\n            hmmsearch_sequence=hit_seq,\n            structure_sequence=sequence,\n            query_sequence=query_sequence,\n            unresolved_res_indices=unresolved_indices,\n            start_index=start - 1,  # Raw value is residue number, not index.\n            end_index=end,\n            full_length=full_length,\n            release_date=datetime.date.fromisoformat(release_date),\n            chain_poly_type=chain_poly_type,\n        )\n\n    if filter_config is None:\n      hits = tuple(hit_generator(a3m))\n    else:\n      hits = _filter_hits(\n          hit_generator(a3m),\n          release_date_cutoff=filter_config.max_template_date,\n          
max_subsequence_ratio=filter_config.max_subsequence_ratio,\n          min_align_ratio=filter_config.min_align_ratio,\n          min_hit_length=filter_config.min_hit_length,\n          deduplicate_sequences=filter_config.deduplicate_sequences,\n          max_hits=filter_config.max_hits,\n      )\n\n    return Templates(\n        query_sequence=query_sequence,\n        query_release_date=query_release_date,\n        hits=hits,\n        max_template_date=max_template_date,\n        structure_store=structure_store,\n    )\n\n  @property\n  def query_sequence(self) -> str:\n    return self._query_sequence\n\n  @property\n  def hits(self) -> tuple[Hit, ...]:\n    return self._hits\n\n  @property\n  def query_release_date(self) -> datetime.date | None:\n    return self._query_release_date\n\n  @property\n  def num_hits(self) -> int:\n    return len(self._hits)\n\n  @functools.cached_property\n  def release_date_cutoff(self) -> datetime.date:\n    if self.query_release_date is None:\n      return self._max_template_date\n    return min(\n        self._max_template_date,\n        self.query_release_date\n        - datetime.timedelta(days=_DAYS_BEFORE_QUERY_DATE),\n    )\n\n  def __repr__(self) -> str:\n    return f'Templates({self.num_hits} hits)'\n\n  def filter(\n      self,\n      *,\n      max_subsequence_ratio: float | None,\n      min_align_ratio: float | None,\n      min_hit_length: int | None,\n      deduplicate_sequences: bool,\n      max_hits: int | None,\n  ) -> Self:\n    \"\"\"Returns a new Templates object with only the hits that pass all filters.\n\n    This also filters on query_release_date and max_template_date.\n\n    Args:\n      max_subsequence_ratio: If set, excludes hits which are an exact\n        subsequence of the query sequence, and longer than this ratio. 
Useful to\n        avoid ground truth leakage.\n      min_align_ratio: If set, excludes hits where the number of residues\n        aligned to the query is less than this proportion of the template\n        length.\n      min_hit_length: If set, excludes hits which have fewer residues than this.\n      deduplicate_sequences: Whether to exclude duplicate template sequences,\n        keeping only the first. This can be useful in increasing the diversity\n        of hits especially in the case of homomer hits.\n      max_hits: If set, excludes any hits which exceed this count.\n    \"\"\"\n    filtered_hits = _filter_hits(\n        hits=self._hits,\n        release_date_cutoff=self.release_date_cutoff,\n        max_subsequence_ratio=max_subsequence_ratio,\n        min_align_ratio=min_align_ratio,\n        min_hit_length=min_hit_length,\n        deduplicate_sequences=deduplicate_sequences,\n        max_hits=max_hits,\n    )\n    return Templates(\n        query_sequence=self.query_sequence,\n        query_release_date=self.query_release_date,\n        hits=filtered_hits,\n        max_template_date=self._max_template_date,\n        structure_store=self._structure_store,\n    )\n\n  def get_hits_with_structures(\n      self,\n  ) -> Sequence[tuple[Hit, structure.Structure]]:\n    \"\"\"Returns hits + Structures, Structures filtered to the hit's chain.\"\"\"\n    results = []\n    structures = {struc.name.lower(): struc for struc in self.structures}\n    for hit in self.hits:\n      if not hit.is_valid:\n        raise InvalidTemplateError(\n            'Hits must be filtered before calling get_hits_with_structures.'\n        )\n      struc = structures[hit.pdb_id]\n      label_chain_id = struc.polymer_auth_asym_id_to_label_asym_id().get(\n          hit.auth_chain_id\n      )\n      results.append((hit, struc.filter(chain_id=label_chain_id)))\n    return results\n\n  def featurize(\n      self,\n      include_ligand_features: bool = True,\n  ) -> TemplateFeatures:\n    
\"\"\"Featurises the templates and returns a map of feature names to features.\n\n    NB: If you don't do any prefiltering, this method might be slow to run\n    as it has to fetch many CIFs and featurize them all.\n\n    Args:\n      include_ligand_features: Whether to compute ligand features.\n\n    Returns:\n      Template features: A mapping of template feature labels to features, which\n        may be numpy arrays, bytes objects, or for the special case of label\n        `ligand_features` (if `include_ligand_features` is True), a nested\n        feature map of labels to numpy arrays.\n\n    Raises:\n      InvalidTemplateError: If hits haven't been filtered before featurization.\n    \"\"\"\n    hits_by_pdb_id = {}\n    for idx, hit in enumerate(self.hits):\n      if not hit.is_valid:\n        raise InvalidTemplateError(\n            f'Hits must be filtered before featurizing, got unprocessed {hit=}'\n        )\n      hits_by_pdb_id.setdefault(hit.pdb_id, []).append((idx, hit))\n\n    unsorted_features = []\n    for struc in self.structures:\n      pdb_id = str(struc.name).lower()\n      for idx, hit in hits_by_pdb_id[pdb_id]:\n        try:\n          label_chain_id = struc.polymer_auth_asym_id_to_label_asym_id()[\n              hit.auth_chain_id\n          ]\n          hit_features = {\n              **get_polymer_features(\n                  chain=struc.filter(chain_id=label_chain_id),\n                  chain_poly_type=hit.chain_poly_type,\n                  query_sequence_length=len(hit.query_sequence),\n                  query_to_hit_mapping=hit.query_to_hit_mapping,\n              ),\n          }\n          if include_ligand_features:\n            hit_features['ligand_features'] = _get_ligand_features(struc)\n          unsorted_features.append((idx, hit_features))\n        except Error as e:\n          raise type(e)(f'Failed to featurise {hit=}') from e\n\n    sorted_features = sorted(unsorted_features, key=lambda x: x[0])\n    sorted_features = [feat for 
_, feat in sorted_features]\n    return package_template_features(\n        hit_features=sorted_features,\n        include_ligand_features=include_ligand_features,\n    )\n\n  @property\n  def structures(self) -> Iterator[structure.Structure]:\n    \"\"\"Yields template structures for each unique PDB ID among hits.\n\n    If there are multiple hits in the same Structure, the Structure will be\n    included only once by this method.\n\n    Yields:\n      A Structure object for each unique PDB ID among hits.\n\n    Raises:\n      HitDateError: If template's release date exceeds max cutoff date.\n    \"\"\"\n\n    for hit in self.hits:\n      if hit.release_date > self.release_date_cutoff:  # pylint: disable=comparison-with-callable\n        raise HitDateError(\n            f'Invalid release date for hit {hit.pdb_id=}, when release date '\n            f'cutoff is {self.release_date_cutoff}.'\n        )\n\n    # Get the set of pdbs to load. In particular, remove duplicate PDB IDs.\n    targets_to_load = tuple({hit.pdb_id for hit in self.hits})\n\n    for target_name in targets_to_load:\n      yield structure.from_mmcif(\n          mmcif_string=self._structure_store.get_mmcif_str(target_name),\n          fix_mse_residues=True,\n          fix_arginines=True,\n          include_water=False,\n          include_bonds=False,\n          include_other=True,  # For non-standard polymer chains.\n      )\n\n\ndef _parse_hit_description(description: str) -> tuple[str, str, int, int, int]:\n  \"\"\"Parses the hmmsearch A3M sequence description line.\"\"\"\n  # Example lines (protein, nucleic, no description):\n  # >4pqx_A/2-217 [subseq from] mol:protein length:217  Free text\n  # >4pqx_A/2-217 [subseq from] mol:na length:217  Free text\n  # >5g3r_A/1-55 [subseq from] mol:protein length:352\n  if match := re.fullmatch(_HIT_DESCRIPTION_REGEX, description):\n    return (\n        match['pdb_id'],\n        match['chain_id'],\n        int(match['start']),\n        int(match['end']),\n   
     int(match['length']),\n    )\n  else:\n    raise ValueError(f'Could not parse description \"{description}\"')\n\n\ndef _parse_hit_metadata(\n    structure_store: structure_stores.StructureStore,\n    pdb_id: str,\n    auth_chain_id: str,\n) -> tuple[Any, str | None, Sequence[int] | None]:\n  \"\"\"Parse hit metadata by parsing mmCIF from structure store.\"\"\"\n  try:\n    cif = mmcif.from_string(structure_store.get_mmcif_str(pdb_id))\n  except structure_stores.NotFoundError:\n    logging.warning(\n        'Failed to get mmCIF for %s (author chain %s).', pdb_id, auth_chain_id\n    )\n    return None, None, None\n  release_date = mmcif.get_release_date(cif)\n\n  try:\n    struc = structure.from_parsed_mmcif(\n        cif,\n        model_id=structure.ModelID.ALL,\n        include_water=True,\n        include_other=True,\n        include_bonds=False,\n    )\n  except ValueError:\n    struc = structure.from_parsed_mmcif(\n        cif,\n        model_id=structure.ModelID.FIRST,\n        include_water=True,\n        include_other=True,\n        include_bonds=False,\n    )\n\n  sequence = struc.polymer_author_chain_single_letter_sequence(\n      include_missing_residues=True,\n      protein=True,\n      dna=True,\n      rna=True,\n      other=True,\n  )[auth_chain_id]\n\n  unresolved_res_ids = struc.filter(\n      chain_auth_asym_id=auth_chain_id\n  ).unresolved_residues.id\n\n  return release_date, sequence, unresolved_res_ids\n\n\ndef get_polymer_features(\n    *,\n    chain: structure.Structure,\n    chain_poly_type: str,\n    query_sequence_length: int,\n    query_to_hit_mapping: Mapping[int, int],\n) -> Mapping[str, Any]:\n  \"\"\"Returns features for this polymer chain.\n\n  Args:\n    chain: Structure object representing the template. 
Must be already filtered\n      to a single chain.\n    chain_poly_type: The chain polymer type (protein, DNA, RNA).\n    query_sequence_length: The length of the query sequence.\n    query_to_hit_mapping: 0-based query index to hit index mapping.\n\n  Returns:\n    A dictionary with polymer features for template_chain_id in the struc.\n\n  Raises:\n    ValueError: If the input structure contains more than just a single chain.\n  \"\"\"\n  if chain.name is None:\n    raise ValueError('Template structure must have a name.')\n\n  if chain.release_date is None:\n    raise ValueError(\n        f'Template structure {chain.name} must have a release date. You can do'\n        ' this by setting \"_pdbx_audit_revision_history.revision_date\" in the'\n        ' template mmCIF to a date in the ISO-8601 format (e.g. 1989-11-17).'\n    )\n\n  num_polymer_chains = len(chain.polymer_auth_asym_id_to_label_asym_id())\n  if num_polymer_chains != 1:\n    raise ValueError(\n        f'Template structure {chain.name} must be filtered to a single polymer'\n        f' chain but got a structure with {num_polymer_chains} polymer chains.'\n    )\n\n  auth_chain_id, label_chain_id = next(\n      iter(chain.polymer_auth_asym_id_to_label_asym_id().items())\n  )\n  chain_sequence = chain.chain_single_letter_sequence()[label_chain_id]\n\n  polymer = _POLYMERS[chain_poly_type]\n  res_arrays = chain.to_res_arrays(\n      include_missing_residues=True, atom_order=polymer.atom_order\n  )\n  positions = res_arrays.atom_positions\n  positions_mask = res_arrays.atom_mask\n  template_all_atom_positions = np.zeros(\n      (query_sequence_length, polymer.num_atom_types, 3), dtype=np.float64\n  )\n  template_all_atom_masks = np.zeros(\n      (query_sequence_length, polymer.num_atom_types), dtype=np.int64\n  )\n\n  template_sequence = ['-'] * query_sequence_length\n  for query_index, template_index in query_to_hit_mapping.items():\n    template_all_atom_positions[query_index] = positions[template_index]\n    
template_all_atom_masks[query_index] = positions_mask[template_index]\n    template_sequence[query_index] = chain_sequence[template_index]\n\n  template_sequence = ''.join(template_sequence)\n  template_aatype = _encode_restype(chain_poly_type, template_sequence)\n  template_name = f'{chain.name.lower()}_{auth_chain_id}'\n  release_date = chain.release_date.strftime('%Y-%m-%d')\n  return {\n      'template_all_atom_positions': template_all_atom_positions,\n      'template_all_atom_masks': template_all_atom_masks,\n      'template_sequence': template_sequence.encode(),\n      'template_aatype': np.array(template_aatype, dtype=np.int32),\n      'template_domain_names': np.array(template_name.encode(), dtype=object),\n      'template_release_date': np.array(release_date.encode(), dtype=object),\n  }\n\n\ndef _get_ligand_features(\n    struc: structure.Structure,\n) -> Mapping[str, Mapping[str, np.ndarray | bytes]]:\n  \"\"\"Returns features for the ligands in this structure.\"\"\"\n  ligand_struc = struc.filter_to_entity_type(ligand=True)\n  assert ligand_struc.coords is not None\n  assert ligand_struc.atom_name is not None\n  assert ligand_struc.atom_occupancy is not None\n\n  ligand_features = {}\n  for ligand_chain_id in ligand_struc.chains:\n    idxs = np.where(ligand_struc.chain_id == ligand_chain_id)[0]\n    if idxs.shape[0]:\n      ligand_features[ligand_chain_id] = {\n          'ligand_atom_positions': (\n              ligand_struc.coords[idxs, :].astype(np.float32)\n          ),\n          'ligand_atom_names': ligand_struc.atom_name[idxs].astype(object),\n          'ligand_atom_occupancies': (\n              ligand_struc.atom_occupancy[idxs].astype(np.float32)\n          ),\n          'ccd_id': ligand_struc.res_name[idxs][0].encode(),\n      }\n  return ligand_features\n\n\ndef package_template_features(\n    *,\n    hit_features: Sequence[Mapping[str, Any]],\n    include_ligand_features: bool,\n) -> Mapping[str, Any]:\n  \"\"\"Stacks polymer features, adds 
empty and keeps ligand features unstacked.\"\"\"\n\n  features_to_include = set(_POLYMER_FEATURES)\n  if include_ligand_features:\n    features_to_include.update(_LIGAND_FEATURES)\n\n  features = {\n      feat: [single_hit_features[feat] for single_hit_features in hit_features]\n      for feat in features_to_include\n  }\n\n  stacked_features = {}\n  for k, v in features.items():\n    if k in _POLYMER_FEATURES:\n      v = np.stack(v, axis=0) if v else np.array([], dtype=_POLYMER_FEATURES[k])\n    stacked_features[k] = v\n\n  return stacked_features\n\n\ndef _resolve_path(path: os.PathLike[str] | str) -> str:\n  \"\"\"Resolves path for data dep paths, stringifies otherwise.\"\"\"\n  # Data dependency paths: db baked into the binary.\n  resolved_path = resources.filename(path)\n  if os.path.exists(resolved_path):\n    return resolved_path\n  else:\n    # Other paths, e.g. local.\n    return str(path)\n\n\ndef run_hmmsearch_with_a3m(\n    *,\n    database_path: os.PathLike[str] | str,\n    hmmsearch_config: msa_config.HmmsearchConfig,\n    max_a3m_query_sequences: int | None,\n    a3m: str | None,\n) -> str:\n  \"\"\"Runs Hmmsearch to get a3m string of hits.\"\"\"\n  searcher = hmmsearch.Hmmsearch(\n      binary_path=hmmsearch_config.hmmsearch_binary_path,\n      hmmbuild_binary_path=hmmsearch_config.hmmbuild_binary_path,\n      database_path=_resolve_path(database_path),\n      e_value=hmmsearch_config.e_value,\n      inc_e=hmmsearch_config.inc_e,\n      dom_e=hmmsearch_config.dom_e,\n      incdom_e=hmmsearch_config.incdom_e,\n      alphabet=hmmsearch_config.alphabet,\n      filter_f1=hmmsearch_config.filter_f1,\n      filter_f2=hmmsearch_config.filter_f2,\n      filter_f3=hmmsearch_config.filter_f3,\n      filter_max=hmmsearch_config.filter_max,\n  )\n  # STO enables us to annotate query non-gap columns as reference columns.\n  sto = parsers.convert_a3m_to_stockholm(a3m, max_a3m_query_sequences)\n  return searcher.query_with_sto(sto, model_construction='hand')\n"
  },
  {
    "path": "src/alphafold3/data/tools/hmmalign.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"A Python wrapper for hmmalign from the HMMER Suite.\"\"\"\n\nfrom collections.abc import Mapping, Sequence\nimport os\nimport tempfile\n\nfrom alphafold3.data import parsers\nfrom alphafold3.data.tools import subprocess_utils\n\n\ndef _to_a3m(sequences: Sequence[str], name_prefix: str = 'sequence') -> str:\n  a3m = ''\n  for i, sequence in enumerate(sequences, 1):\n    a3m += f'> {name_prefix} {i}\\n{sequence}\\n'\n  return a3m\n\n\nclass Hmmalign:\n  \"\"\"Python wrapper of the hmmalign binary.\"\"\"\n\n  def __init__(self, binary_path: str):\n    \"\"\"Initializes the Python hmmalign wrapper.\n\n    Args:\n      binary_path: Path to the hmmalign binary.\n\n    Raises:\n      RuntimeError: If hmmalign binary not found within the path.\n    \"\"\"\n    self._binary_path = binary_path\n\n    subprocess_utils.check_binary_exists(\n        path=self._binary_path, name='hmmalign'\n    )\n\n  def align_sequences(\n      self,\n      sequences: Sequence[str],\n      profile: str,\n      extra_flags: Mapping[str, str] | None = None,\n  ) -> str:\n    \"\"\"Aligns sequence list to the profile and returns the alignment in A3M.\"\"\"\n    return self.align(\n        a3m_str=_to_a3m(sequences, name_prefix='query'),\n        profile=profile,\n        extra_flags=extra_flags,\n    )\n\n  def align(\n      self,\n      a3m_str: str,\n      profile: str,\n      extra_flags: Mapping[str, str] | None = None,\n  ) -> str:\n    
\"\"\"Aligns sequences in A3M to the profile and returns the alignment in A3M.\n\n    Args:\n      a3m_str: The sequences to align, as an A3M string.\n      profile: A hmm file with the hmm profile to align the sequences to.\n      extra_flags: Dictionary with extra flags, flag_name: flag_value, that are\n        added to hmmalign.\n\n    Returns:\n      An A3M string with the aligned sequences.\n\n    Raises:\n      RuntimeError: If hmmalign fails.\n    \"\"\"\n    with tempfile.TemporaryDirectory() as query_tmp_dir:\n      input_profile = os.path.join(query_tmp_dir, 'profile.hmm')\n      input_sequences = os.path.join(query_tmp_dir, 'sequences.a3m')\n      output_a3m_path = os.path.join(query_tmp_dir, 'output.a3m')\n\n      with open(input_profile, 'w') as f:\n        f.write(profile)\n\n      with open(input_sequences, 'w') as f:\n        f.write(a3m_str)\n\n      cmd = [\n          self._binary_path,\n          *('-o', output_a3m_path),\n          *('--outformat', 'A2M'),  # A2M is A3M in the HMMER suite.\n      ]\n      if extra_flags:\n        for flag_name, flag_value in extra_flags.items():\n          cmd.extend([flag_name, flag_value])\n      cmd.extend([input_profile, input_sequences])\n\n      subprocess_utils.run(\n          cmd=cmd,\n          cmd_name='hmmalign',\n          log_stdout=False,\n          log_stderr=True,\n          log_on_process_error=True,\n      )\n\n      with open(output_a3m_path, encoding='utf-8') as f:\n        a3m = f.read()\n\n    return a3m\n\n  def align_sequences_to_profile(self, profile: str, sequences_a3m: str) -> str:\n    \"\"\"Aligns the sequences to profile and returns the alignment in A3M string.\n\n    Uses hmmalign to align the sequences to the profile, then outputs the\n    sequence concatenated at the beginning of the sequences in the A3M format.\n    As the sequences are represented by an alignment with possible gaps ('-')\n    and insertions (lowercase characters), the method first removes the gaps,\n    then uppercases the 
insertions to prepare the sequences for realignment.\n    Sequences with gaps cannot be aligned, as '-'s are not a valid symbol to\n    align; lowercase characters must be uppercased to preserve the original\n    sequences before realignment.\n\n    Args:\n      profile: The Hmmbuild profile to align the sequences to.\n      sequences_a3m: Sequences in A3M format to align to the profile.\n\n    Returns:\n      An A3M string with the aligned sequences.\n\n    Raises:\n      RuntimeError: If hmmalign fails.\n    \"\"\"\n    deletion_table = str.maketrans('', '', '-')\n    sequences_no_gaps_a3m = []\n    for seq, desc in parsers.lazy_parse_fasta_string(sequences_a3m):\n      sequences_no_gaps_a3m.append(f'>{desc}')\n      sequences_no_gaps_a3m.append(seq.translate(deletion_table))\n    sequences_no_gaps_a3m = '\\n'.join(sequences_no_gaps_a3m)\n\n    aligned_sequences = self.align(sequences_no_gaps_a3m, profile)\n\n    return aligned_sequences\n"
  },
  {
    "path": "src/alphafold3/data/tools/hmmbuild.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"A Python wrapper for hmmbuild - construct HMM profiles from MSA.\"\"\"\n\nimport os\nimport re\nimport tempfile\nfrom typing import Literal\n\nfrom alphafold3.data import parsers\nfrom alphafold3.data.tools import subprocess_utils\n\n\nclass Hmmbuild(object):\n  \"\"\"Python wrapper of the hmmbuild binary.\"\"\"\n\n  def __init__(\n      self,\n      *,\n      binary_path: str,\n      singlemx: bool = False,\n      alphabet: str | None = None,\n  ):\n    \"\"\"Initializes the Python hmmbuild wrapper.\n\n    Args:\n      binary_path: The path to the hmmbuild executable.\n      singlemx: Whether to use --singlemx flag. If True, it forces HMMBuild to\n        just use a common substitution score matrix.\n      alphabet: The alphabet to assert when building a profile. Useful when\n        hmmbuild cannot guess the alphabet. 
If None, no alphabet is asserted.\n\n    Raises:\n      RuntimeError: If hmmbuild binary not found within the path.\n    \"\"\"\n    self._binary_path = binary_path\n    self._singlemx = singlemx\n    self._alphabet = alphabet\n\n    subprocess_utils.check_binary_exists(\n        path=self._binary_path, name='hmmbuild'\n    )\n\n  def build_profile_from_sto(self, sto: str, model_construction='fast') -> str:\n    \"\"\"Builds a HMM for the aligned sequences given as a Stockholm string.\n\n    Args:\n      sto: A string with the aligned sequences in the Stockholm format.\n      model_construction: Whether to use reference annotation in the msa to\n        determine consensus columns ('hand') or default ('fast').\n\n    Returns:\n      A string with the profile in the HMM format.\n\n    Raises:\n      RuntimeError: If hmmbuild fails.\n    \"\"\"\n    return self._build_profile(\n        sto, informat='stockholm', model_construction=model_construction\n    )\n\n  def build_profile_from_a3m(self, a3m: str) -> str:\n    \"\"\"Builds a HMM for the aligned sequences given as an A3M string.\n\n    Args:\n      a3m: A string with the aligned sequences in the A3M format.\n\n    Returns:\n      A string with the profile in the HMM format.\n\n    Raises:\n      RuntimeError: If hmmbuild fails.\n    \"\"\"\n    lines = []\n    for sequence, description in parsers.lazy_parse_fasta_string(a3m):\n      sequence = re.sub('[a-z]+', '', sequence)  # Remove inserted residues.\n      lines.append(f'>{description}\\n{sequence}\\n')\n    msa = ''.join(lines)\n    return self._build_profile(msa, informat='afa')\n\n  def _build_profile(\n      self,\n      msa: str,\n      informat: Literal['afa', 'stockholm'],\n      model_construction: str = 'fast',\n  ) -> str:\n    \"\"\"Builds a HMM for the aligned sequences given as an MSA string.\n\n    Args:\n      msa: A string with the aligned sequences, in A3M or STO format.\n      informat: One of 'afa' (aligned FASTA) or 'stockholm' (Stockholm).\n      
model_construction: Whether to use reference annotation in the msa to\n        determine consensus columns ('hand') or default ('fast').\n\n    Returns:\n      A string with the profile in the HMM format.\n\n    Raises:\n      RuntimeError: If hmmbuild fails.\n      ValueError: If unspecified arguments are provided.\n    \"\"\"\n    if model_construction not in {'hand', 'fast'}:\n      raise ValueError(f'Bad {model_construction=}. Only hand or fast allowed.')\n\n    with tempfile.TemporaryDirectory() as query_tmp_dir:\n      input_msa_path = os.path.join(query_tmp_dir, 'query.msa')\n      output_hmm_path = os.path.join(query_tmp_dir, 'output.hmm')\n\n      with open(input_msa_path, 'w') as f:\n        f.write(msa)\n\n      # Specify the format as we don't specify the input file extension. See\n      # https://github.com/EddyRivasLab/hmmer/issues/321 for more details.\n      cmd_flags = ['--informat', informat]\n      # If adding flags, we have to do so before the output and input:\n      if model_construction == 'hand':\n        cmd_flags.append(f'--{model_construction}')\n      if self._singlemx:\n        cmd_flags.append('--singlemx')\n      if self._alphabet:\n        cmd_flags.append(f'--{self._alphabet}')\n\n      cmd_flags.extend([output_hmm_path, input_msa_path])\n\n      cmd = [self._binary_path, *cmd_flags]\n\n      subprocess_utils.run(\n          cmd=cmd,\n          cmd_name='Hmmbuild',\n          log_stdout=False,\n          log_stderr=True,\n          log_on_process_error=True,\n      )\n\n      with open(output_hmm_path) as f:\n        hmm = f.read()\n\n    return hmm\n"
  },
  {
    "path": "src/alphafold3/data/tools/hmmsearch.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"A Python wrapper for hmmsearch - search profile against a sequence db.\"\"\"\n\nimport os\nimport tempfile\n\nfrom absl import logging\nfrom alphafold3.data import parsers\nfrom alphafold3.data.tools import hmmbuild\nfrom alphafold3.data.tools import subprocess_utils\n\n\nclass Hmmsearch(object):\n  \"\"\"Python wrapper of the hmmsearch binary.\"\"\"\n\n  def __init__(\n      self,\n      *,\n      binary_path: str,\n      hmmbuild_binary_path: str,\n      database_path: str,\n      alphabet: str = 'amino',\n      filter_f1: float | None = None,\n      filter_f2: float | None = None,\n      filter_f3: float | None = None,\n      e_value: float | None = None,\n      inc_e: float | None = None,\n      dom_e: float | None = None,\n      incdom_e: float | None = None,\n      filter_max: bool = False,\n  ):\n    \"\"\"Initializes the Python hmmsearch wrapper.\n\n    Args:\n      binary_path: The path to the hmmsearch executable.\n      hmmbuild_binary_path: The path to the hmmbuild executable. Used to build\n        an hmm from an input a3m.\n      database_path: The path to the hmmsearch database (FASTA format).\n      alphabet: Chain type e.g. 
amino, rna, dna.\n      filter_f1: MSV and biased composition pre-filter, set to >1.0 to turn off.\n      filter_f2: Viterbi pre-filter, set to >1.0 to turn off.\n      filter_f3: Forward pre-filter, set to >1.0 to turn off.\n      e_value: E-value criteria for inclusion in tblout.\n      inc_e: E-value criteria for inclusion in MSA/next round.\n      dom_e: Domain e-value criteria for inclusion in tblout.\n      incdom_e: Domain e-value criteria for inclusion of domains in MSA/next\n        round.\n      filter_max: Remove all filters, will ignore all filter_f* settings.\n\n    Raises:\n      RuntimeError: If hmmsearch binary not found within the path.\n    \"\"\"\n    self._binary_path = binary_path\n    self._hmmbuild_runner = hmmbuild.Hmmbuild(\n        alphabet=alphabet, binary_path=hmmbuild_binary_path\n    )\n    self._database_path = database_path\n    flags = []\n    if filter_max:\n      flags.append('--max')\n    else:\n      if filter_f1 is not None:\n        flags.extend(('--F1', filter_f1))\n      if filter_f2 is not None:\n        flags.extend(('--F2', filter_f2))\n      if filter_f3 is not None:\n        flags.extend(('--F3', filter_f3))\n\n    if e_value is not None:\n      flags.extend(('-E', e_value))\n    if inc_e is not None:\n      flags.extend(('--incE', inc_e))\n    if dom_e is not None:\n      flags.extend(('--domE', dom_e))\n    if incdom_e is not None:\n      flags.extend(('--incdomE', incdom_e))\n\n    self._flags = tuple(map(str, flags))\n\n    subprocess_utils.check_binary_exists(\n        path=self._binary_path, name='hmmsearch'\n    )\n\n    if not os.path.exists(self._database_path):\n      logging.error('Could not find hmmsearch database %s', database_path)\n      raise ValueError(f'Could not find hmmsearch database {database_path}')\n\n  def query_with_hmm(self, hmm: str) -> str:\n    \"\"\"Queries the database using hmmsearch using a given hmm.\"\"\"\n    with tempfile.TemporaryDirectory() as query_tmp_dir:\n      hmm_input_path 
= os.path.join(query_tmp_dir, 'query.hmm')\n      sto_out_path = os.path.join(query_tmp_dir, 'output.sto')\n      with open(hmm_input_path, 'w') as f:\n        f.write(hmm)\n\n      cmd = [\n          self._binary_path,\n          '--noali',  # Don't include the alignment in stdout.\n          *('--cpu', '8'),\n      ]\n      # If adding flags, we have to do so before the output and input:\n      if self._flags:\n        cmd.extend(self._flags)\n      cmd.extend([\n          *('-A', sto_out_path),\n          hmm_input_path,\n          self._database_path,\n      ])\n\n      subprocess_utils.run(\n          cmd=cmd,\n          cmd_name=f'Hmmsearch ({os.path.basename(self._database_path)})',\n          log_stdout=False,\n          log_stderr=True,\n          log_on_process_error=True,\n      )\n\n      with open(sto_out_path) as f:\n        a3m_out = parsers.convert_stockholm_to_a3m(\n            f, remove_first_row_gaps=False, linewidth=60\n        )\n\n    return a3m_out\n\n  def query_with_a3m(self, a3m_in: str) -> str:\n    \"\"\"Query the database using hmmsearch using a given a3m.\"\"\"\n\n    # Only the \"fast\" model construction makes sense with A3M, as it doesn't\n    # have any way to annotate reference columns.\n    hmm = self._hmmbuild_runner.build_profile_from_a3m(a3m_in)\n    return self.query_with_hmm(hmm)\n\n  def query_with_sto(\n      self, msa_sto: str, model_construction: str = 'fast'\n  ) -> str:\n    \"\"\"Queries the database using hmmsearch using a given stockholm msa.\"\"\"\n    hmm = self._hmmbuild_runner.build_profile_from_sto(\n        msa_sto, model_construction=model_construction\n    )\n    return self.query_with_hmm(hmm)\n"
  },
  {
    "path": "src/alphafold3/data/tools/jackhmmer.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Library to run Jackhmmer from Python.\"\"\"\n\nfrom collections.abc import Iterable, Sequence\nfrom concurrent import futures\nimport heapq\nimport os\nimport pathlib\nimport shutil\nimport tempfile\nimport time\n\nfrom absl import logging\nfrom alphafold3.data import parsers\nfrom alphafold3.data.tools import msa_tool\nfrom alphafold3.data.tools import shards\nfrom alphafold3.data.tools import subprocess_utils\n\n\nclass Jackhmmer(msa_tool.MsaTool):\n  \"\"\"Python wrapper of the Jackhmmer binary.\"\"\"\n\n  def __init__(\n      self,\n      *,\n      binary_path: str,\n      database_path: str,\n      n_cpu: int = 8,\n      n_iter: int = 3,\n      e_value: float | None = 1e-3,\n      z_value: float | int | None = None,\n      dom_e: float | None = None,\n      dom_z_value: float | int | None = None,\n      max_sequences: int = 5000,\n      filter_f1: float = 5e-4,\n      filter_f2: float = 5e-5,\n      filter_f3: float = 5e-7,\n      max_threads: int | None = None,\n      **unused_kwargs,\n  ):\n    \"\"\"Initializes the Python Jackhmmer wrapper.\n\n    NOTE: The MSA obtained by running against sharded dbs won't be always\n    exactly the same as the MSA obtained by running against an unsharded db.\n    This is because of Jackhmmer deduplication logic, which won't spot duplicate\n    hits across multiple shards. 
Usually this means that the sharded search\n    finds more hits (likely bounded by the number of shards), but this should\n    not pose an issue given how the results are used downstream. The problem is\n    more pronounced with deep MSAs and lower in the hit list (higher e-values).\n\n    Make sure to set the Z and domZ values when searching against a sharded\n    database, otherwise the results won't match the normal unsharded search.\n\n    Args:\n      binary_path: The path to the jackhmmer executable.\n      database_path: The path to the jackhmmer database (FASTA format). Sharded\n        file specs, e.g. `<db_path>@<num_shards>`, are supported.\n      n_cpu: The number of CPUs to give Jackhmmer.\n      n_iter: The number of Jackhmmer iterations.\n      e_value: The E-value, see Jackhmmer docs for more details.\n      z_value: The Z-value representing the number of comparisons done (i.e\n        correct database size) for E-value calculation. Make sure to set this\n        when searching against a sharded database, otherwise the e-values will\n        be incorrectly scaled.\n      dom_e: Domain e-value criteria for inclusion in tblout.\n      dom_z_value: Domain z-value representing the number of comparisons done\n        (i.e correct database size) for domain E-value calculation. 
Make sure to\n        set this when searching against a sharded database, otherwise the domain\n        e-values will be incorrectly scaled.\n      max_sequences: Maximum number of sequences to return in the MSA.\n      filter_f1: MSV and biased composition pre-filter, set to >1.0 to turn off.\n      filter_f2: Viterbi pre-filter, set to >1.0 to turn off.\n      filter_f3: Forward pre-filter, set to >1.0 to turn off.\n      max_threads: If given, the maximum number of threads used when running\n        sharded databases.\n\n    Raises:\n      RuntimeError: If Jackhmmer binary not found within the path.\n      ValueError: If an invalid configuration is provided in the args.\n    \"\"\"\n    self._database_path = database_path\n\n    if shard_paths := shards.get_sharded_paths(self._database_path):\n      if n_iter != 1:\n        raise ValueError('For a sharded db, only n_iter=1 is supported.')\n      if z_value is None:\n        raise ValueError(\n            'The Z-value must be set when searching against a sharded database '\n            'to correctly scale e-values.'\n        )\n      if max_sequences <= 1:\n        raise ValueError(\n            'max_sequences must be greater than 1 when running in sharded '\n            'mode, because each shard would return only the query sequence.'\n        )\n\n      self._shard_paths = shard_paths\n      self._max_threads = len(self._shard_paths)\n      if max_threads is not None:\n        self._max_threads = min(max_threads, self._max_threads)\n      logging.info('Jackhmmer running with max_threads = %d', self._max_threads)\n    else:\n      self._shard_paths = None\n      self._max_threads = None\n\n    self._binary_path = binary_path\n    subprocess_utils.check_binary_exists(\n        path=self._binary_path, name='Jackhmmer'\n    )\n\n    self._n_cpu = n_cpu\n    self._n_iter = n_iter\n    self._e_value = e_value\n    self._z_value = z_value\n    self._dom_e = dom_e\n    self._dom_z_value = dom_z_value\n    
self._max_sequences = max_sequences\n    self._filter_f1 = filter_f1\n    self._filter_f2 = filter_f2\n    self._filter_f3 = filter_f3\n\n    # If Jackhmmer supports the --seq_limit flag (via our patch), use it to\n    # prevent writing out redundant sequences and increasing peak memory usage.\n    # If not, the Jackhmmer will be run without the --seq_limit flag.\n    self._supports_seq_limit = subprocess_utils.jackhmmer_seq_limit_supported(\n        self._binary_path\n    )\n\n  def query(self, target_sequence: str) -> msa_tool.MsaToolResult:\n    \"\"\"Query the database (sharded or unsharded) using Jackhmmer.\"\"\"\n    if self._shard_paths:\n      # Sharded case, run the query against each database shard in parallel.\n      logging.info(\n          'Query sequence (sharded db): %s',\n          target_sequence\n          if len(target_sequence) <= 16\n          else f'{target_sequence[:16]}... (len {len(target_sequence)})',\n      )\n\n      global_temp_dir = tempfile.mkdtemp()\n\n      def _query_shard_fn(\n          shard_path: str,\n      ) -> tuple[msa_tool.MsaToolResult, float]:\n        t_start = time.time()\n        result = self._query_db_shard(\n            target_sequence=target_sequence,\n            db_shard_path=shard_path,\n            get_tblout=True,  # Tblout contains e-values needed for merging.\n            global_temp_dir=global_temp_dir,\n        )\n        return result, time.time() - t_start\n\n      with futures.ThreadPoolExecutor(max_workers=self._max_threads) as ex:\n        tool_outputs, timings = zip(*ex.map(_query_shard_fn, self._shard_paths))\n\n      logging.info(\n          'Finished query for %d shards, shard timings (seconds): %s',\n          len(tool_outputs),\n          ', '.join(f'{t:.1f}' for t in timings),\n      )\n\n      shutil.rmtree(global_temp_dir, ignore_errors=True)\n      return _merge_jackhmmer_results(tool_outputs, self._max_sequences)\n\n    else:\n      # Non-sharded case, run the query against the whole 
database.\n      logging.info(\n          'Query sequence (non-sharded db): %s',\n          target_sequence\n          if len(target_sequence) <= 16\n          else f'{target_sequence[:16]}... (len {len(target_sequence)})',\n      )\n      return self._query_db_shard(\n          target_sequence=target_sequence,\n          db_shard_path=self._database_path,\n          get_tblout=False,\n      )\n\n  def _query_db_shard(\n      self,\n      *,\n      target_sequence: str,\n      db_shard_path: str,\n      get_tblout: bool,\n      global_temp_dir: str | None = None,\n  ) -> msa_tool.MsaToolResult:\n    \"\"\"Query the database shard using Jackhmmer.\"\"\"\n\n    with tempfile.TemporaryDirectory(dir=global_temp_dir) as query_tmp_dir:\n      input_fasta_path = os.path.join(query_tmp_dir, 'query.fasta')\n      subprocess_utils.create_query_fasta_file(\n          sequence=target_sequence, path=input_fasta_path\n      )\n      output_sto_path = os.path.join(query_tmp_dir, 'output.sto')\n      pathlib.Path(output_sto_path).touch()\n\n      # The F1/F2/F3 are the expected proportion to pass each of the filtering\n      # stages (which get progressively more expensive), reducing these\n      # speeds up the pipeline at the expense of sensitivity.  
They are\n      # currently set very low to make querying Mgnify run in a reasonable\n      # amount of time.\n      cmd_flags = [\n          *('-o', '/dev/null'),  # Don't pollute stdout with Jackhmmer output.\n          *('-A', output_sto_path),\n          '--noali',\n          *('--F1', str(self._filter_f1)),\n          *('--F2', str(self._filter_f2)),\n          *('--F3', str(self._filter_f3)),\n          *('--cpu', str(self._n_cpu)),\n          *('-N', str(self._n_iter)),\n      ]\n\n      if get_tblout:\n        output_tblout_path = pathlib.Path(query_tmp_dir, 'tblout.txt')\n        output_tblout_path.touch()\n        cmd_flags.extend(['--tblout', str(output_tblout_path)])\n      else:\n        output_tblout_path = None\n\n      # Report only sequences with E-values <= x in per-sequence output.\n      if self._e_value is not None:\n        cmd_flags.extend(['-E', str(self._e_value)])\n\n        # Use the same value as the reporting e-value (`-E` flag).\n        cmd_flags.extend(['--incE', str(self._e_value)])\n\n      if self._z_value is not None:\n        cmd_flags.extend(['-Z', str(self._z_value)])\n\n      if self._dom_z_value is not None:\n        cmd_flags.extend(['--domZ', str(self._dom_z_value)])\n\n      if self._dom_e is not None:\n        cmd_flags.extend(['--domE', str(self._dom_e)])\n\n      if self._max_sequences is not None and self._supports_seq_limit:\n        cmd_flags.extend(['--seq_limit', str(self._max_sequences)])\n\n      # The input FASTA and the input db are the last two arguments.\n      cmd = [self._binary_path] + cmd_flags + [input_fasta_path, db_shard_path]\n\n      subprocess_utils.run(\n          cmd=cmd,\n          cmd_name=f'Jackhmmer ({os.path.basename(db_shard_path)})',\n          log_stdout=False,\n          log_stderr=True,\n          log_on_process_error=True,\n      )\n\n      with open(output_sto_path) as f:\n        a3m = parsers.convert_stockholm_to_a3m(\n            f, max_sequences=self._max_sequences\n        )\n\n  
    # Get the tabular output which has e.g. e-value for each target.\n      tbl = '' if output_tblout_path is None else output_tblout_path.read_text()\n\n      return msa_tool.MsaToolResult(\n          target_sequence=target_sequence,\n          a3m=a3m,\n          e_value=self._e_value,\n          tblout=tbl,\n      )\n\n\ndef _merge_jackhmmer_results(\n    jh_results: Sequence[msa_tool.MsaToolResult], max_sequences: int\n) -> msa_tool.MsaToolResult:\n  \"\"\"Merges Jackhmmer result protos into a single one.\"\"\"\n  assert len(set(jh_res.target_sequence for jh_res in jh_results)) == 1\n  assert len(set(jh_res.e_value for jh_res in jh_results)) == 1\n\n  # Parse the TBL output, create a mapping from hit name to TBL line.\n  parsed_tbl = {}\n  for jh_result in jh_results:\n    assert jh_result.tblout is not None\n    for line in jh_result.tblout.splitlines():\n      if not line.startswith('#'):\n        parsed_tbl[line.partition(' ')[0]] = line\n\n  # Create an iterator and merge a3m info with tbl info.\n  def _merged_a3m_tbl_iter(a3m: str) -> Iterable[tuple[str, str, str, str]]:\n    # Don't parse the entire a3m, lazily parse only as many sequences as needed.\n    iterator = iter(parsers.lazy_parse_fasta_string(a3m))\n    next(iterator)  # Skip the query which isn't present in tblout.\n    for sequence, description in iterator:\n      name = description.partition(' ')[0].partition('/')[0]\n      if tbl_info := parsed_tbl.get(name):\n        # Skip sequences for which we don't have tbl information.\n        yield sequence, description, tbl_info, name\n\n  def sort_key(seq_data: tuple[str, str, str, str]) -> tuple[float, float, str]:\n    unused_seq, unused_description, tbl_info, name = seq_data\n    # Tblout lines have 19 whitespace delimited columns. \"-\" used if no value\n    # present. We want e-value (column 5) and bit score (column 6), so do only 6\n    # splits. E-value and bit score are equivalent, but bit score might have\n    # higher resolution. 
Use the name in case of a tie.\n    e_value, bit_score = tbl_info.split(maxsplit=6)[4:6]\n    return float(e_value), -float(bit_score), name\n\n  # A3M/TBL is sorted by e-value and name, hence we can merge them efficiently.\n  merged_a3m_and_tblout = heapq.merge(\n      *[_merged_a3m_tbl_iter(res.a3m) for res in jh_results],\n      key=sort_key,\n  )\n\n  # Truncate the a3m to max_sequences. Do not truncate the tblout.\n  merged_tblout = []\n  merged_a3m = [f'>query\\n{jh_results[0].target_sequence}']\n  for seq, description, tbl_info, _ in merged_a3m_and_tblout:\n    merged_tblout.append(tbl_info)\n    if len(merged_a3m) < max_sequences:\n      merged_a3m.append(f'>{description}\\n{seq}')\n\n  logging.info(\n      'Limiting merged MSA depth from %d to %d',\n      len(merged_tblout),\n      max_sequences,\n  )\n\n  return msa_tool.MsaToolResult(\n      target_sequence=jh_results[0].target_sequence,\n      a3m='\\n'.join(merged_a3m),\n      e_value=jh_results[0].e_value,\n      tblout=None,  # We no longer need the tblout.\n  )\n"
  },
  {
    "path": "src/alphafold3/data/tools/msa_tool.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Defines protocol for MSA tools.\"\"\"\n\nimport dataclasses\nfrom typing import Protocol\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass MsaToolResult:\n  \"\"\"The result of a MSA tool query.\n\n  Attributes:\n    target_sequence: The sequence that was used to query the MSA tool.\n    e_value: The e-value that was used to filter the MSA tool results.\n    a3m: The MSA output of the tool in the A3M format.\n    tblout: The optional tblout output of the MSA tool (needed for merging\n      results of queries against a sharded database).\n  \"\"\"\n\n  target_sequence: str\n  e_value: float\n  a3m: str\n  tblout: str | None = None\n\n\nclass MsaTool(Protocol):\n  \"\"\"Interface for MSA tools.\"\"\"\n\n  def query(self, target_sequence: str) -> MsaToolResult:\n    \"\"\"Runs the MSA tool on the target sequence.\"\"\"\n"
  },
  {
    "path": "src/alphafold3/data/tools/nhmmer.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Library to run Nhmmer from Python.\"\"\"\n\nfrom collections.abc import Iterable, Sequence\nfrom concurrent import futures\nimport heapq\nimport os\nimport pathlib\nimport shutil\nimport tempfile\nimport time\nfrom typing import Final\n\nfrom absl import logging\nfrom alphafold3.data import parsers\nfrom alphafold3.data.tools import hmmalign\nfrom alphafold3.data.tools import hmmbuild\nfrom alphafold3.data.tools import msa_tool\nfrom alphafold3.data.tools import shards\nfrom alphafold3.data.tools import subprocess_utils\n\n\n_SHORT_SEQUENCE_CUTOFF: Final[int] = 50\n\n\nclass Nhmmer(msa_tool.MsaTool):\n  \"\"\"Python wrapper of the Nhmmer binary.\"\"\"\n\n  def __init__(\n      self,\n      binary_path: str,\n      hmmalign_binary_path: str,\n      hmmbuild_binary_path: str,\n      database_path: str,\n      n_cpu: int = 8,\n      e_value: float = 1e-3,\n      z_value: float | int | None = None,\n      max_sequences: int = 5000,\n      filter_f3: float = 1e-5,\n      alphabet: str | None = None,\n      strand: str | None = None,\n      max_threads: int | None = None,\n  ):\n    \"\"\"Initializes the Python Nhmmer wrapper.\n\n    NOTE: The MSA obtained by running against sharded dbs won't be always\n    exactly the same as the MSA obtained by running against an unsharded db.\n    This is because of Jackhmmer deduplication logic, which won't spot duplicate\n    hits across multiple shards. 
Usually this means that the sharded search\n    finds more hits (likely bounded by the number of shards), but this should\n    not pose an issue given how the results are used downstream. The problem is\n    more pronounced with deep MSAs and lower in the hit list (higher e-values).\n\n    Make sure to set the Z value when searching against a sharded database,\n    otherwise the results won't match the normal unsharded search.\n\n    Args:\n      binary_path: Path to the Nhmmer binary.\n      hmmalign_binary_path: Path to the Hmmalign binary.\n      hmmbuild_binary_path: Path to the Hmmbuild binary.\n      database_path: MSA database path to search against. This can be either a\n        FASTA (slow) or HMMERDB produced from the FASTA using the makehmmerdb\n        binary. The HMMERDB is ~10x faster but experimental.  Sharded file\n        specs, e.g. <db_path>@<num_shards>, are supported.\n      n_cpu: The number of CPUs to give Nhmmer.\n      e_value: The E-value, see Nhmmer docs for more details. Will be\n        overwritten if bit_score is set.\n      z_value: The Z-value representing the number of comparisons done (i.e\n        correct database size) for E-value calculation. 
Make sure to set this\n        when searching against a sharded database, otherwise the e-values will\n        be incorrectly scaled.\n      max_sequences: Maximum number of sequences to return in the MSA.\n      filter_f3: Forward pre-filter, set to >1.0 to turn off.\n      alphabet: The alphabet to assert when building a profile with hmmbuild.\n        This must be 'rna', 'dna', or None.\n      strand: \"watson\" searches query sequence, \"crick\" searches\n        reverse-compliment and default is None which means searching for both.\n      max_threads: If given, the maximum number of threads used when running\n        sharded databases.\n\n    Raises:\n      RuntimeError: If Nhmmer binary not found within the path.\n      ValueError: If an invalid configuration is provided in the args.\n    \"\"\"\n    self._database_path = database_path\n\n    if shard_paths := shards.get_sharded_paths(self._database_path):\n      if z_value is None:\n        raise ValueError(\n            'The Z-value must be set when searching against a sharded database '\n            'to correctly scale e-values.'\n        )\n      if 'hmmerdb' in self._database_path:\n        raise ValueError('HMMERDB is not supported in sharded mode.')\n\n      if max_sequences <= 1:\n        raise ValueError(\n            'max_sequences must be greater than 1 when running in sharded '\n            'mode, because each shard would return only the query sequence.'\n        )\n\n      self._shard_paths = shard_paths\n      self._max_threads = len(self._shard_paths)\n      if max_threads is not None:\n        self._max_threads = min(max_threads, self._max_threads)\n      logging.info('Nhmmer running with max_threads = %d', self._max_threads)\n    else:\n      self._shard_paths = None\n      self._max_threads = None\n\n    self._binary_path = binary_path\n    self._hmmalign_binary_path = hmmalign_binary_path\n    self._hmmbuild_binary_path = hmmbuild_binary_path\n    
subprocess_utils.check_binary_exists(path=self._binary_path, name='Nhmmer')\n\n    if strand and strand not in {'watson', 'crick'}:\n      raise ValueError(f'Invalid {strand=}. only \"watson\" or \"crick\" supported')\n\n    if alphabet and alphabet not in {'rna', 'dna'}:\n      raise ValueError(f'Invalid {alphabet=}, only \"rna\" or \"dna\" supported')\n\n    self._e_value = e_value\n    self._n_cpu = n_cpu\n    self._z_value = z_value\n    self._max_sequences = max_sequences\n    self._filter_f3 = filter_f3\n    self._alphabet = alphabet\n    self._strand = strand\n\n  def query(self, target_sequence: str) -> msa_tool.MsaToolResult:\n    \"\"\"Query the database (sharded or unsharded) using Nhmmer.\"\"\"\n    if self._shard_paths:\n      # Sharded case, run the query against each database shard in parallel.\n      logging.info(\n          'Query sequence (sharded db): %s',\n          target_sequence\n          if len(target_sequence) <= 16\n          else f'{target_sequence[:16]}... (len {len(target_sequence)})',\n      )\n\n      global_temp_dir = tempfile.mkdtemp()\n\n      def _query_shard_fn(\n          shard_path: str,\n      ) -> tuple[msa_tool.MsaToolResult, float]:\n        t_start = time.time()\n        # Get tblout as it contains e-values we need for merging sequences.\n        result = self._query_db_shard(\n            target_sequence=target_sequence,\n            db_shard_path=shard_path,\n            get_tblout=True,  # Tblout contains e-values needed for merging.\n            global_temp_dir=global_temp_dir,\n        )\n        return result, time.time() - t_start\n\n      with futures.ThreadPoolExecutor(max_workers=self._max_threads) as ex:\n        tool_outputs, timings = zip(*ex.map(_query_shard_fn, self._shard_paths))\n\n      logging.info(\n          'Finished query for %d shards, shard timings (seconds): %s',\n          len(tool_outputs),\n          ', '.join(f'{t:.1f}' for t in timings),\n      )\n\n      shutil.rmtree(global_temp_dir, 
ignore_errors=True)\n      return _merge_nhmmer_results(tool_outputs, self._max_sequences)\n\n    else:\n      # Non-sharded case, run the query against the whole database.\n      logging.info(\n          'Query sequence (non-sharded db): %s',\n          target_sequence\n          if len(target_sequence) <= 16\n          else f'{target_sequence[:16]}... (len {len(target_sequence)})',\n      )\n      return self._query_db_shard(\n          target_sequence=target_sequence,\n          db_shard_path=self._database_path,\n          get_tblout=False,\n      )\n\n  def _query_db_shard(\n      self,\n      *,\n      target_sequence: str,\n      db_shard_path: str,\n      get_tblout: bool,\n      global_temp_dir: str | None = None,\n  ) -> msa_tool.MsaToolResult:\n    \"\"\"Query the database shard using Nhmmer.\"\"\"\n\n    with tempfile.TemporaryDirectory(dir=global_temp_dir) as query_tmp_dir:\n      input_a3m_path = os.path.join(query_tmp_dir, 'query.a3m')\n      output_sto_path = os.path.join(query_tmp_dir, 'output.sto')\n      pathlib.Path(output_sto_path).touch()\n      subprocess_utils.create_query_fasta_file(\n          sequence=target_sequence, path=input_a3m_path\n      )\n\n      cmd_flags = [\n          *('-o', '/dev/null'),  # Don't pollute stdout with nhmmer output.\n          '--noali',  # Don't include the alignment in stdout.\n          *('--cpu', str(self._n_cpu)),\n      ]\n\n      if get_tblout:\n        output_tblout_path = pathlib.Path(query_tmp_dir, 'tblout.txt')\n        output_tblout_path.touch()\n        cmd_flags.extend(['--tblout', str(output_tblout_path)])\n      else:\n        output_tblout_path = None\n\n      cmd_flags.extend(['-E', str(self._e_value)])\n\n      if self._z_value is not None:\n        cmd_flags.extend(['-Z', str(self._z_value)])\n\n      if self._alphabet:\n        cmd_flags.extend([f'--{self._alphabet}'])\n\n      if self._strand is not None:\n        cmd_flags.extend([f'--{self._strand}'])\n\n      cmd_flags.extend(['-A', 
output_sto_path])\n      # As recommended by RNAcentral for short sequences.\n      if (\n          self._alphabet == 'rna'\n          and len(target_sequence) < _SHORT_SEQUENCE_CUTOFF\n      ):\n        cmd_flags.extend(['--F3', str(0.02)])\n      else:\n        cmd_flags.extend(['--F3', str(self._filter_f3)])\n\n      # The input A3M and the db are the last two arguments.\n      cmd_flags.extend((input_a3m_path, db_shard_path))\n\n      cmd = [self._binary_path, *cmd_flags]\n      subprocess_utils.run(\n          cmd=cmd,\n          cmd_name=f'Nhmmer ({os.path.basename(db_shard_path)})',\n          log_stdout=False,\n          log_stderr=True,\n          log_on_process_error=True,\n      )\n\n      if os.path.getsize(output_sto_path) > 0:\n        with open(output_sto_path) as f:\n          a3m_out = parsers.convert_stockholm_to_a3m(\n              f, max_sequences=self._max_sequences - 1  # Query not included.\n          )\n        # Nhmmer hits are generally shorter than the query sequence. 
To get MSA\n        # of width equal to the query sequence, align hits to the query profile.\n        logging.info('Aligning output a3m of size %d bytes', len(a3m_out))\n\n        aligner = hmmalign.Hmmalign(self._hmmalign_binary_path)\n        target_sequence_fasta = f'>query\\n{target_sequence}\\n'\n        profile_builder = hmmbuild.Hmmbuild(\n            binary_path=self._hmmbuild_binary_path, alphabet=self._alphabet\n        )\n        profile = profile_builder.build_profile_from_a3m(target_sequence_fasta)\n        a3m_out = aligner.align_sequences_to_profile(\n            profile=profile, sequences_a3m=a3m_out\n        )\n        a3m_out = ''.join([target_sequence_fasta, a3m_out])\n\n        # Parse the output a3m to remove line breaks.\n        a3m = '\\n'.join(\n            [f'>{n}\\n{s}' for s, n in parsers.lazy_parse_fasta_string(a3m_out)]\n        )\n      else:\n        # Nhmmer returns an empty file if there are no hits.\n        # In this case return only the query sequence.\n        a3m = f'>query\\n{target_sequence}'\n\n      # Get the tabular output which has e.g. 
e-value for each target.\n      tbl = '' if output_tblout_path is None else output_tblout_path.read_text()\n\n    return msa_tool.MsaToolResult(\n        target_sequence=target_sequence,\n        e_value=self._e_value,\n        a3m=a3m,\n        tblout=tbl,\n    )\n\n\ndef _merge_nhmmer_results(\n    nhmmer_results: Sequence[msa_tool.MsaToolResult],\n    max_sequences: int,\n) -> msa_tool.MsaToolResult:\n  \"\"\"Merges nhmmer result protos into a single one.\"\"\"\n  assert len(set(nh_res.target_sequence for nh_res in nhmmer_results)) == 1\n  assert len(set(nh_res.e_value for nh_res in nhmmer_results)) == 1\n\n  # Parse the TBL output, create a mapping from unique hit ID to TBL line.\n  parsed_tbl = {}\n  for nhmmer_result in nhmmer_results:\n    assert nhmmer_result.tblout is not None\n    for line in nhmmer_result.tblout.splitlines():\n      if not line.startswith('#'):\n        line_fields = line.split(maxsplit=15)\n        accession = line_fields[0]\n        alignment_from = line_fields[6]\n        alignment_to = line_fields[7]\n        # This is the unique ID that is used in the output A3M.\n        unique_id = f'{accession}/{alignment_from}-{alignment_to}'\n        parsed_tbl[unique_id] = line\n\n  # Create an iterator and merge a3m info with tbl info.\n  def _merged_a3m_tbl_iter(a3m: str) -> Iterable[tuple[str, str, str, str]]:\n    # Don't parse the entire a3m, lazily parse only as many sequences as needed.\n    iterator = iter(parsers.lazy_parse_fasta_string(a3m))\n    next(iterator)  # Skip the query which isn't present in tblout.\n    for sequence, description in iterator:\n      name = description.partition(' ')[0]\n      if tbl_info := parsed_tbl.get(name):\n        # Skip sequences for which we don't have tbl information.\n        yield sequence, description, tbl_info, name\n\n  def sort_key(seq_data: tuple[str, str, str, str]) -> tuple[float, str]:\n    unused_seq, unused_description, tbl_info, name = seq_data\n    # Nucleic tblout has 16 space 
delimited columns. \"-\" used if no value\n    # present. We want e-value in column 12, so do only 13 splits. Use the name\n    # in case of an e-value tie.\n    return float(tbl_info.split(maxsplit=13)[12]), name\n\n  # A3M/TBL is sorted by e-value and name, hence we can merge them efficiently.\n  merged_a3m_and_tblout = heapq.merge(\n      *[_merged_a3m_tbl_iter(res.a3m) for res in nhmmer_results],\n      key=sort_key,\n  )\n\n  # Truncate the a3m to max_sequences. Do not truncate the tblout.\n  merged_tblout = []\n  merged_a3m = [f'>query\\n{nhmmer_results[0].target_sequence}']\n  for seq, description, tbl_info, _ in merged_a3m_and_tblout:\n    merged_tblout.append(tbl_info)\n    if len(merged_a3m) < max_sequences:\n      merged_a3m.append(f'>{description}\\n{seq}')\n\n  logging.info(\n      'Limiting merged MSA depth from %d to %d',\n      len(merged_tblout),\n      max_sequences,\n  )\n\n  return msa_tool.MsaToolResult(\n      target_sequence=nhmmer_results[0].target_sequence,\n      a3m='\\n'.join(merged_a3m),\n      e_value=nhmmer_results[0].e_value,\n      tblout=None,  # We no longer need the tblout.\n  )\n"
  },
  {
    "path": "src/alphafold3/data/tools/rdkit_utils.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Tools for calculating features for ligands.\"\"\"\n\nimport collections\nfrom collections.abc import Mapping, Sequence\n\nfrom absl import logging\nfrom alphafold3.cpp import cif_dict\nimport numpy as np\nimport rdkit.Chem as rd_chem\nfrom rdkit.Chem import AllChem as rd_all_chem\n\n\n_RDKIT_MMCIF_TO_BOND_TYPE: Mapping[str, rd_chem.BondType] = {\n    'SING': rd_chem.BondType.SINGLE,\n    'DOUB': rd_chem.BondType.DOUBLE,\n    'TRIP': rd_chem.BondType.TRIPLE,\n}\n\n_RDKIT_BOND_TYPE_TO_MMCIF: Mapping[rd_chem.BondType, str] = {\n    v: k for k, v in _RDKIT_MMCIF_TO_BOND_TYPE.items()\n}\n\n_RDKIT_BOND_STEREO_TO_MMCIF: Mapping[rd_chem.BondStereo, str] = {\n    rd_chem.BondStereo.STEREONONE: 'N',\n    rd_chem.BondStereo.STEREOE: 'E',\n    rd_chem.BondStereo.STEREOZ: 'Z',\n    rd_chem.BondStereo.STEREOCIS: 'Z',\n    rd_chem.BondStereo.STEREOTRANS: 'E',\n}\n\n\nclass MolFromMmcifError(Exception):\n  \"\"\"Raised when conversion from mmCIF to RDKit Mol fails.\"\"\"\n\n\nclass UnsupportedMolBondError(Exception):\n  \"\"\"Raised when we try to handle unsupported RDKit bonds.\"\"\"\n\n\ndef _populate_atoms_in_mol(\n    mol: rd_chem.Mol,\n    atom_names: Sequence[str],\n    atom_types: Sequence[str],\n    atom_charges: Sequence[int],\n    implicit_hydrogens: bool,\n    ligand_name: str,\n    atom_leaving_flags: Sequence[str],\n):\n  \"\"\"Populate the atoms of a Mol given atom features.\n\n  Args:\n    mol: Mol object.\n    
atom_names: Names of the atoms.\n    atom_types: Types of the atoms.\n    atom_charges: Charges of the atoms.\n    implicit_hydrogens: Whether to mark the atoms to allow implicit Hs.\n    ligand_name: Name of the ligand which the atoms are in.\n    atom_leaving_flags: Whether the atom is possibly a leaving atom. Values from\n      the CCD column `_chem_comp_atom.pdbx_leaving_atom_flag`. The expected\n      values are 'Y' (yes), 'N' (no), '?' (unknown/unset, interpreted as no).\n\n  Raises:\n    ValueError: If atom type is invalid.\n  \"\"\"\n  # Map atom names to the position they will take in the rdkit molecule.\n  atom_name_to_idx = {name: i for i, name in enumerate(atom_names)}\n\n  for atom_name, atom_type, atom_charge, atom_leaving_flag in zip(\n      atom_names, atom_types, atom_charges, atom_leaving_flags, strict=True\n  ):\n    try:\n      if atom_type == 'X':\n        atom_type = '*'\n      atom = rd_chem.Atom(atom_type)\n    except RuntimeError as e:\n      raise ValueError(f'Failed to use atom type: {str(e)}') from e\n\n    if not implicit_hydrogens:\n      atom.SetNoImplicit(True)\n\n    atom.SetProp('atom_name', atom_name)\n    atom.SetProp('atom_leaving_flag', atom_leaving_flag)\n    atom.SetFormalCharge(atom_charge)\n    residue_info = rd_chem.AtomPDBResidueInfo()\n    residue_info.SetName(_format_atom_name(atom_name, atom_type))\n    residue_info.SetIsHeteroAtom(True)\n    residue_info.SetResidueName(ligand_name)\n    residue_info.SetResidueNumber(1)\n    atom.SetPDBResidueInfo(residue_info)\n    atom_index = mol.AddAtom(atom)\n    assert atom_index == atom_name_to_idx[atom_name]\n\n\ndef _populate_bonds_in_mol(\n    mol: rd_chem.Mol,\n    atom_names: Sequence[str],\n    bond_begins: Sequence[str],\n    bond_ends: Sequence[str],\n    bond_orders: Sequence[str],\n    bond_is_aromatics: Sequence[bool],\n):\n  \"\"\"Populate the bonds of a Mol given bond features.\n\n  Args:\n    mol: Mol object.\n    atom_names: Names of atoms in the molecule.\n    
bond_begins: Names of atoms at the beginning of the bond.\n    bond_ends: Names of atoms at the end of the bond.\n    bond_orders: What order the bonds are.\n    bond_is_aromatics: Whether the bonds are aromatic.\n  \"\"\"\n  atom_name_to_idx = {name: i for i, name in enumerate(atom_names)}\n  for begin, end, bond_type, is_aromatic in zip(\n      bond_begins, bond_ends, bond_orders, bond_is_aromatics, strict=True\n  ):\n    begin_name, end_name = atom_name_to_idx[begin], atom_name_to_idx[end]\n    bond_idx = mol.AddBond(begin_name, end_name, bond_type)\n    mol.GetBondWithIdx(bond_idx - 1).SetIsAromatic(is_aromatic)\n\n\ndef sanitize_mol(mol, sort_alphabetically, remove_hydrogens) -> rd_chem.Mol:\n  # https://www.rdkit.org/docs/source/rdkit.Chem.rdmolops.html#rdkit.Chem.rdmolops.SanitizeMol\n  # Kekulize, check valencies, set aromaticity, conjugation and hybridization.\n  # This can repair e.g. incorrect aromatic flags.\n  rd_chem.SanitizeMol(mol)\n  if sort_alphabetically:\n    mol = sort_atoms_by_name(mol)\n  if remove_hydrogens:\n    mol = rd_chem.RemoveHs(mol)\n  return mol\n\n\ndef _add_conformer_to_mol(mol, conformer, force_parse) -> rd_chem.Mol:\n  # Create conformer and use it to assign stereochemistry.\n  if conformer is not None:\n    try:\n      mol.AddConformer(conformer)\n      rd_chem.AssignStereochemistryFrom3D(mol)\n    except ValueError as e:\n      logging.warning('Failed to parse conformer: %s', e)\n      if not force_parse:\n        raise\n\n\ndef mol_from_ccd_cif(\n    mol_cif: cif_dict.CifDict,\n    *,\n    force_parse: bool = False,\n    sort_alphabetically: bool = True,\n    remove_hydrogens: bool = True,\n    implicit_hydrogens: bool = False,\n) -> rd_chem.Mol:\n  \"\"\"Creates an rdkit Mol object from a CCD mmcif data block.\n\n  The atoms are renumbered so that their names are in alphabetical order and\n  these names are placed on the atoms under property 'atom_name'.\n  Only hydrogens which are not required to define the molecule are 
removed.\n  For example, hydrogens that define stereochemistry around a double bond are\n  retained.\n  See this link for more details.\n  https://www.rdkit.org/docs/source/rdkit.Chem.rdmolops.html#rdkit.Chem.rdmolops.RemoveHs\n\n  Args:\n     mol_cif: An mmcif object representing a molecule.\n     force_parse: If True, assumes missing aromatic flags are false, substitutes\n       deuterium for hydrogen, assumes missing charges are 0 and ignores missing\n       conformer / stereochemistry information.\n     sort_alphabetically: True: sort atom alphabetically; False: keep CCD order\n     remove_hydrogens: if True, remove non-important hydrogens\n     implicit_hydrogens: Sets a marker on the atom that allows implicit Hs.\n\n  Returns:\n     An rdkit molecule, with the atoms sorted by name.\n\n  Raises:\n    MolFromMmcifError: If conversion from mmcif to rdkit Mol fails. More\n      detailed error is available as this error's cause.\n  \"\"\"\n  # Read data fields.\n  try:\n    atom_names, atom_types, atom_charges, atom_leaving_flags = parse_atom_data(\n        mol_cif, force_parse\n    )\n    bond_begins, bond_ends, bond_orders, bond_is_aromatics = parse_bond_data(\n        mol_cif, force_parse\n    )\n    lig_name = mol_cif['_chem_comp.id'][0].rjust(3)\n  except (KeyError, ValueError) as e:\n    raise MolFromMmcifError from e\n\n  # Build Rdkit molecule.\n  mol = rd_chem.RWMol()\n\n  # Per atom features.\n  try:\n    _populate_atoms_in_mol(\n        mol=mol,\n        atom_names=atom_names,\n        atom_types=atom_types,\n        atom_charges=atom_charges,\n        implicit_hydrogens=implicit_hydrogens,\n        ligand_name=lig_name,\n        atom_leaving_flags=atom_leaving_flags,\n    )\n  except (ValueError, RuntimeError) as e:\n    raise MolFromMmcifError from e\n\n  _populate_bonds_in_mol(\n      mol, atom_names, bond_begins, bond_ends, bond_orders, bond_is_aromatics\n  )\n\n  try:\n    conformer = _parse_ideal_conformer(mol_cif)\n  except (KeyError, ValueError) 
as e:\n    logging.warning('Failed to parse ideal conformer: %s', e)\n    if not force_parse:\n      raise MolFromMmcifError from e\n    conformer = None\n\n  mol.UpdatePropertyCache(strict=False)\n\n  try:\n    _add_conformer_to_mol(mol, conformer, force_parse)\n    mol = sanitize_mol(mol, sort_alphabetically, remove_hydrogens)\n  except (\n      ValueError,\n      rd_chem.KekulizeException,\n      rd_chem.AtomValenceException,\n  ) as e:\n    raise MolFromMmcifError from e\n\n  return mol\n\n\ndef mol_to_ccd_cif(\n    mol: rd_chem.Mol,\n    component_id: str,\n    pdbx_smiles: str | None = None,\n    include_hydrogens: bool = True,\n) -> cif_dict.CifDict:\n  \"\"\"Creates a CCD-like mmcif data block from an rdkit Mol object.\n\n  Only a subset of associated mmcif fields is populated, but that is\n  sufficient for further usage, e.g. in featurization code.\n\n  Atom names can be specified via `atom_name` property. For atoms with\n  unspecified value of that property, the name is assigned based on element type\n  and the order in the Mol object.\n\n  If the Mol object has associated conformers, atom positions from the first of\n  them will be populated in the resulting mmcif file.\n\n  Args:\n     mol: An rdkit molecule.\n     component_id: Name of the molecule to use in the resulting mmcif. 
That is\n       equivalent to CCD code.\n     pdbx_smiles: If specified, the value will be used to populate\n       `_chem_comp.pdbx_smiles`.\n     include_hydrogens: Whether to include atom and bond data involving\n       hydrogens.\n\n  Returns:\n     An mmcif data block corresponding to the given rdkit molecule.\n\n  Raises:\n    UnsupportedMolBondError: When a molecule contains a bond that can't be\n      represented with mmcif.\n  \"\"\"\n  mol = rd_chem.Mol(mol)\n  if include_hydrogens:\n    mol = rd_chem.AddHs(mol)\n  rd_chem.Kekulize(mol)\n\n  if mol.GetNumConformers() > 0:\n    ideal_conformer = mol.GetConformer(0).GetPositions()\n    ideal_conformer = np.vectorize(lambda x: f'{x:.3f}')(ideal_conformer)\n  else:\n    # No data will be populated in the resulting mmcif if the molecule doesn't\n    # have any conformers attached to it.\n    ideal_conformer = None\n\n  mol_cif = collections.defaultdict(list)\n  mol_cif['data_'] = [component_id]\n  mol_cif['_chem_comp.id'] = [component_id]\n  if pdbx_smiles:\n    mol_cif['_chem_comp.pdbx_smiles'] = [pdbx_smiles]\n\n  mol = assign_atom_names_from_graph(mol, keep_existing_names=True)\n\n  for atom_idx, atom in enumerate(mol.GetAtoms()):\n    element = atom.GetSymbol()\n    if not include_hydrogens and element in ('H', 'D'):\n      continue\n\n    mol_cif['_chem_comp_atom.comp_id'].append(component_id)\n    mol_cif['_chem_comp_atom.atom_id'].append(atom.GetProp('atom_name'))\n    mol_cif['_chem_comp_atom.type_symbol'].append(atom.GetSymbol().upper())\n    mol_cif['_chem_comp_atom.charge'].append(str(atom.GetFormalCharge()))\n    if ideal_conformer is not None:\n      coords = ideal_conformer[atom_idx]\n      mol_cif['_chem_comp_atom.pdbx_model_Cartn_x_ideal'].append(coords[0])\n      mol_cif['_chem_comp_atom.pdbx_model_Cartn_y_ideal'].append(coords[1])\n      mol_cif['_chem_comp_atom.pdbx_model_Cartn_z_ideal'].append(coords[2])\n\n  for bond in mol.GetBonds():\n    atom1 = bond.GetBeginAtom()\n    atom2 = 
bond.GetEndAtom()\n    if not include_hydrogens and (\n        atom1.GetSymbol() in ('H', 'D') or atom2.GetSymbol() in ('H', 'D')\n    ):\n      continue\n    mol_cif['_chem_comp_bond.comp_id'].append(component_id)\n    mol_cif['_chem_comp_bond.atom_id_1'].append(\n        bond.GetBeginAtom().GetProp('atom_name')\n    )\n    mol_cif['_chem_comp_bond.atom_id_2'].append(\n        bond.GetEndAtom().GetProp('atom_name')\n    )\n    try:\n      bond_type = bond.GetBondType()\n      # Older versions of RDKit did not have a DATIVE bond type. Convert it to\n      # SINGLE to match the AF3 training setup.\n      if bond_type == rd_chem.BondType.DATIVE:\n        bond_type = rd_chem.BondType.SINGLE\n      mol_cif['_chem_comp_bond.value_order'].append(\n          _RDKIT_BOND_TYPE_TO_MMCIF[bond_type]\n      )\n      mol_cif['_chem_comp_bond.pdbx_stereo_config'].append(\n          _RDKIT_BOND_STEREO_TO_MMCIF[bond.GetStereo()]\n      )\n    except KeyError as e:\n      raise UnsupportedMolBondError from e\n    mol_cif['_chem_comp_bond.pdbx_aromatic_flag'].append(\n        'Y' if bond.GetIsAromatic() else 'N'\n    )\n\n  return cif_dict.CifDict(mol_cif)\n\n\ndef _format_atom_name(atom_name: str, atom_type: str) -> str:\n  \"\"\"Formats an atom name to fit in the four characters specified in PDB.\n\n  See for example the following note on atom name formatting in PDB files:\n  https://www.cgl.ucsf.edu/chimera/docs/UsersGuide/tutorials/pdbintro.html#note1\n\n  Args:\n    atom_name: The unformatted atom name.\n    atom_type: The atom element symbol.\n\n  Returns:\n    formatted_atom_name: The formatted 4-character atom name.\n  \"\"\"\n  atom_name = atom_name.strip()\n  atom_type = atom_type.strip().upper()\n  if len(atom_name) == 1:\n    return atom_name.rjust(2).ljust(4)\n  elif len(atom_name) == 2:\n    if atom_name == atom_type:\n      return atom_name.ljust(4)\n    return atom_name.center(4)\n  elif len(atom_name) == 3:\n    if atom_name[:2] == atom_type:\n      return 
atom_name.ljust(4)\n    return atom_name.rjust(4)\n  elif len(atom_name) == 4:\n    return atom_name\n  else:\n    raise ValueError(\n        f'Atom name `{atom_name}` has more than four characters '\n        'or is an empty string.'\n    )\n\n\ndef parse_atom_data(\n    mol_cif: cif_dict.CifDict | Mapping[str, Sequence[str]], force_parse: bool\n) -> tuple[Sequence[str], Sequence[str], Sequence[int], Sequence[str]]:\n  \"\"\"Parses atoms. If force_parse is True, fix deuterium and missing charge.\"\"\"\n  atom_types = [t.capitalize() for t in mol_cif['_chem_comp_atom.type_symbol']]\n  atom_names = mol_cif['_chem_comp_atom.atom_id']\n  atom_charges = mol_cif['_chem_comp_atom.charge']\n  atom_leaving_flags = ['?'] * len(atom_names)\n  if '_chem_comp_atom.pdbx_leaving_atom_flag' in mol_cif:\n    atom_leaving_flags = mol_cif['_chem_comp_atom.pdbx_leaving_atom_flag']\n\n  if force_parse:\n    # Replace missing charges with 0.\n    atom_charges = [charge if charge != '?' else '0' for charge in atom_charges]\n    # Deuterium for hydrogen.\n    atom_types = [type_ if type_ != 'D' else 'H' for type_ in atom_types]\n\n  atom_charges = [int(atom_charge) for atom_charge in atom_charges]\n  return atom_names, atom_types, atom_charges, atom_leaving_flags\n\n\ndef parse_bond_data(\n    mol_cif: cif_dict.CifDict | Mapping[str, Sequence[str]], force_parse: bool\n) -> tuple[\n    Sequence[str], Sequence[str], Sequence[rd_chem.BondType], Sequence[bool]\n]:\n  \"\"\"Parses bond data. If force_parse is True, ignore missing aromatic flags.\"\"\"\n  # The bond table isn't present if there are no bonds. 
Use [] in that case.\n  begin_atoms = mol_cif.get('_chem_comp_bond.atom_id_1', [])\n  end_atoms = mol_cif.get('_chem_comp_bond.atom_id_2', [])\n  orders = mol_cif.get('_chem_comp_bond.value_order', [])\n  bond_types = [_RDKIT_MMCIF_TO_BOND_TYPE[order] for order in orders]\n\n  try:\n    aromatic_flags = mol_cif.get('_chem_comp_bond.pdbx_aromatic_flag', [])\n    is_aromatic = [{'Y': True, 'N': False}[flag] for flag in aromatic_flags]\n  except KeyError:\n    if force_parse:\n      # Set them all to not aromatic.\n      is_aromatic = [False for _ in begin_atoms]\n    else:\n      raise\n\n  return begin_atoms, end_atoms, bond_types, is_aromatic\n\n\ndef _parse_ideal_conformer(mol_cif: cif_dict.CifDict) -> rd_chem.Conformer:\n  \"\"\"Builds a conformer containing the ideal coordinates from the CCD.\n\n  Args:\n     mol_cif: An mmcif object representing a molecule.\n\n  Returns:\n     An rdkit conformer filled with the ideal positions from the mmcif.\n\n  Raises:\n     ValueError: if the positions can't be interpreted.\n  \"\"\"\n  atom_x = [\n      float(x) for x in mol_cif['_chem_comp_atom.pdbx_model_Cartn_x_ideal']\n  ]\n  atom_y = [\n      float(y) for y in mol_cif['_chem_comp_atom.pdbx_model_Cartn_y_ideal']\n  ]\n  atom_z = [\n      float(z) for z in mol_cif['_chem_comp_atom.pdbx_model_Cartn_z_ideal']\n  ]\n  atom_positions = zip(atom_x, atom_y, atom_z, strict=True)\n\n  conformer = rd_chem.Conformer(len(atom_x))\n  for atom_index, atom_position in enumerate(atom_positions):\n    conformer.SetAtomPosition(atom_index, atom_position)\n\n  return conformer\n\n\ndef sort_atoms_by_name(mol: rd_chem.Mol) -> rd_chem.Mol:\n  \"\"\"Sorts the atoms in the molecule by their names.\"\"\"\n  atom_names = {\n      atom.GetProp('atom_name'): atom.GetIdx() for atom in mol.GetAtoms()\n  }\n\n  # Sort the name, int tuples by the names.\n  sorted_atom_names = sorted(atom_names.items())\n\n  # Zip these tuples back together to the sorted indices.\n  _, new_order = 
zip(*sorted_atom_names, strict=True)\n\n  # Reorder the molecule.\n  # new_order is effectively an argsort of the names.\n  return rd_chem.RenumberAtoms(mol, new_order)\n\n\ndef assign_atom_names_from_graph(\n    mol: rd_chem.Mol,\n    keep_existing_names: bool = False,\n) -> rd_chem.Mol:\n  \"\"\"Assigns atom names from the molecular graph.\n\n  The atom name is stored as an atom property 'atom_name', accessible\n  with atom.GetProp('atom_name'). If the property is already specified, and\n  keep_existing_names is True we keep the original name.\n\n  We traverse the graph in the order of the rdkit atom index and give each atom\n  a name equal to '{ELEMENT_TYPE}{INDEX}'. E.g. C5 is the name for the fifth\n  unnamed carbon encountered.\n\n  NOTE: A new mol is returned, the original is not changed in place.\n\n  Args:\n    mol: Mol object.\n    keep_existing_names: If True, atoms that already have the atom_name property\n      will keep their assigned names.\n\n  Returns:\n    A new mol, with potentially new 'atom_name' properties.\n  \"\"\"\n  mol = rd_chem.Mol(mol)\n\n  specified_atom_names = {\n      atom.GetProp('atom_name')\n      for atom in mol.GetAtoms()\n      if atom.HasProp('atom_name') and keep_existing_names\n  }\n\n  element_counts = collections.Counter()\n  for atom in mol.GetAtoms():\n    if not atom.HasProp('atom_name') or not keep_existing_names:\n      element = atom.GetSymbol()\n      while True:\n        element_counts[element] += 1\n        # Standardize names by using uppercase element type, as in CCD. Only\n        # affects elements with more than one letter, e.g. 
'Cl' becomes 'CL'.\n        new_name = f'{element.upper()}{element_counts[element]}'\n        if new_name not in specified_atom_names:\n          break\n      atom.SetProp('atom_name', new_name)\n\n  return mol\n\n\ndef get_random_conformer(\n    mol: rd_chem.Mol,\n    random_seed: int,\n    max_iterations: int | None,\n    logging_name: str,\n) -> rd_chem.Conformer | None:\n  \"\"\"Stochastic conformer search method using V3 ETK.\"\"\"\n  params = rd_all_chem.ETKDGv3()\n  params.randomSeed = random_seed\n  if max_iterations is not None:  # Override default value.\n    params.maxIterations = max_iterations\n  mol_copy = rd_chem.Mol(mol)\n  try:\n    conformer_id = rd_all_chem.EmbedMolecule(mol_copy, params)\n    conformer = mol_copy.GetConformer(conformer_id)\n  except ValueError:\n    logging.warning('Failed to generate conformer for: %s', logging_name)\n    conformer = None\n  return conformer\n"
  },
  {
    "path": "src/alphafold3/data/tools/shards.py",
    "content": "# Copyright 2025 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"A library to handle shards of the format file_path@NUM_SHARDS.\n\nFor instance, /path/to/file@20 will generate the following shards:\n\n- /path/to/file-00000-of-00020\n- /path/to/file-00001-of-00020\n- ...\n- /path/to/file-00019-of-00020\n\nThis also supports @* pattern, which will determine the number of shards based\non the filesystem content.\n\"\"\"\n\nfrom collections.abc import Sequence\nimport dataclasses\nimport pathlib\nimport re\n\n\n_MAX_NUM_SHARDS = 99_999\n_SHARD_RE = re.compile(\n    r\"\"\"\n    ^(?P<prefix>[^\\?\\],\\*]+)@\n     (?P<shards>(\\d{1,5})|\\*)\n     (?P<suffix>[\\._][^\\?\\]@\\*\\/]*)?\n    $\"\"\",\n    re.X,\n)\n\n\n@dataclasses.dataclass(frozen=True)\nclass ShardSpec:\n  prefix: str\n  num_shards: int\n  suffix: str\n\n\ndef parse_shard_spec(path: str) -> ShardSpec | None:\n  \"\"\"Returns the shard spec or None if the path is not a shard spec.\n\n  For instance, if the shard spec is '/path/to/file@20', the output will be\n  ('/path/to/file', 20).\n\n  Args:\n    path: the path to parse, e.g. 
/path/to/file@20 or /path/to/file@*.\n  \"\"\"\n  parsed = re.fullmatch(_SHARD_RE, path)\n  if not parsed:\n    return None\n  prefix = parsed.group('prefix')\n  shards = parsed.group('shards')\n  suffix = parsed.group('suffix') or ''\n\n  if shards != '*':\n    return ShardSpec(prefix=prefix, num_shards=int(shards), suffix=suffix)\n  shard_slice = slice(len(prefix) + 10, len(prefix) + 15)\n  shard_path = pathlib.Path(f'{prefix}-00000-of-?????{suffix}')\n  for shard in sorted(shard_path.parent.glob(shard_path.name), reverse=True):\n    try:\n      num_shards = int(str(shard)[shard_slice])\n      return ShardSpec(prefix=prefix, num_shards=num_shards, suffix=suffix)\n    except ValueError:\n      continue\n  return None\n\n\ndef get_sharded_paths(shard_spec: str) -> Sequence[str] | None:\n  \"\"\"Returns a list of file path or None if the input is not a shard spec.\n\n  Args:\n    shard_spec: the specifications of the shard, e.g. /path/to/file@20.\n  \"\"\"\n  parsed_spec = parse_shard_spec(shard_spec)\n  if not parsed_spec:\n    return None\n\n  prefix = parsed_spec.prefix\n  num_shards = parsed_spec.num_shards\n  suffix = parsed_spec.suffix\n  if num_shards > _MAX_NUM_SHARDS:\n    raise ValueError(f'Shard count for {shard_spec} exceeds {_MAX_NUM_SHARDS}')\n  return [\n      f'{prefix}-{i:05d}-of-{num_shards:05d}{suffix}' for i in range(num_shards)\n  ]\n"
  },
  {
    "path": "src/alphafold3/data/tools/subprocess_utils.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Helper functions for launching external tools.\"\"\"\n\nfrom collections.abc import Sequence\nimport os\nimport subprocess\nimport time\nfrom typing import Any\n\nfrom absl import logging\n\n\ndef create_query_fasta_file(sequence: str, path: str, linewidth: int = 80):\n  \"\"\"Creates a fasta file with the sequence with line width limit.\"\"\"\n  with open(path, 'w') as f:\n    f.write('>query\\n')\n\n    i = 0\n    while i < len(sequence):\n      f.write(f'{sequence[i:(i + linewidth)]}\\n')\n      i += linewidth\n\n\ndef check_binary_exists(path: str, name: str) -> None:\n  \"\"\"Checks if a binary exists on the given path and raises otherwise.\"\"\"\n  if not os.path.exists(path):\n    raise RuntimeError(f'{name} binary not found at {path}')\n\n\ndef jackhmmer_seq_limit_supported(jackhmmer_path: str) -> bool:\n  \"\"\"Checks if Jackhmmer supports the --seq-limit flag.\"\"\"\n  try:\n    subprocess.run(\n        [jackhmmer_path, '-h', '--seq_limit', '1'],\n        stdout=subprocess.DEVNULL,\n        stderr=subprocess.DEVNULL,\n        check=True,\n    )\n  except subprocess.CalledProcessError:\n    return False\n  return True\n\n\ndef run(\n    cmd: Sequence[str],\n    cmd_name: str,\n    log_on_process_error: bool = False,\n    log_stderr: bool = False,\n    log_stdout: bool = False,\n    max_out_streams_len: int | None = 500_000,\n    **run_kwargs,\n) -> subprocess.CompletedProcess[Any]:\n  \"\"\"Launches a 
subprocess, times it, and checks for errors.\n\n  Args:\n    cmd: Command to launch.\n    cmd_name: Human-readable command name to be used in logs.\n    log_on_process_error: Whether to use `logging.error` to log the process'\n      stderr on failure.\n    log_stderr: Whether to log the stderr of the command.\n    log_stdout: Whether to log the stdout of the command.\n    max_out_streams_len: Max length of prefix of stdout and stderr included in\n      the exception message. Set to `None` to disable truncation.\n    **run_kwargs: Any other kwargs for `subprocess.run`.\n\n  Returns:\n    The completed process object.\n\n  Raises:\n    RuntimeError: if the process completes with a non-zero return code.\n  \"\"\"\n\n  logging.info('Launching subprocess \"%s\"', ' '.join(cmd))\n\n  start_time = time.time()\n  try:\n    completed_process = subprocess.run(\n        cmd,\n        check=True,\n        stderr=subprocess.PIPE,\n        stdout=subprocess.PIPE,\n        text=True,\n        **run_kwargs,\n    )\n  except subprocess.CalledProcessError as e:\n    if log_on_process_error:\n      # Logs have a 15k character limit, so log the error line by line.\n      logging.error('%s failed. 
%s stderr begin:', cmd_name, cmd_name)\n      for error_line in e.stderr.splitlines():\n        if stripped_error_line := error_line.strip():\n          logging.error(stripped_error_line)\n      logging.error('%s stderr end.', cmd_name)\n\n    error_msg = (\n        f'{cmd_name} failed'\n        f'\\nstdout:\\n{e.stdout[:max_out_streams_len]}\\n'\n        f'\\nstderr:\\n{e.stderr[:max_out_streams_len]}'\n    )\n    raise RuntimeError(error_msg) from e\n  end_time = time.time()\n\n  logging.info('Finished %s in %.3f seconds', cmd_name, end_time - start_time)\n  stdout, stderr = completed_process.stdout, completed_process.stderr\n\n  if log_stdout and stdout:\n    logging.info('%s stdout:\\n%s', cmd_name, stdout)\n\n  if log_stderr and stderr:\n    logging.info('%s stderr:\\n%s', cmd_name, stderr)\n\n  return completed_process\n"
  },
  {
    "path": "src/alphafold3/jax/geometry/__init__.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Geometry Module.\"\"\"\n\nfrom alphafold3.jax.geometry import rigid_matrix_vector\nfrom alphafold3.jax.geometry import rotation_matrix\nfrom alphafold3.jax.geometry import struct_of_array\nfrom alphafold3.jax.geometry import vector\n\nRot3Array = rotation_matrix.Rot3Array\nRigid3Array = rigid_matrix_vector.Rigid3Array\n\nStructOfArray = struct_of_array.StructOfArray\n\nVec3Array = vector.Vec3Array\nsquare_euclidean_distance = vector.square_euclidean_distance\neuclidean_distance = vector.euclidean_distance\ndihedral_angle = vector.dihedral_angle\ndot = vector.dot\ncross = vector.cross\n"
  },
  {
    "path": "src/alphafold3/jax/geometry/rigid_matrix_vector.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Rigid3Array Transformations represented by a Matrix and a Vector.\"\"\"\n\nfrom typing import Any, Final, Self, TypeAlias\n\nfrom alphafold3.jax.geometry import rotation_matrix\nfrom alphafold3.jax.geometry import struct_of_array\nfrom alphafold3.jax.geometry import utils\nfrom alphafold3.jax.geometry import vector\nimport jax\nimport jax.numpy as jnp\n\n\nFloat: TypeAlias = float | jnp.ndarray\n\nVERSION: Final[str] = '0.1'\n\n\n# Disabling name in pylint, since the relevant variable in math are typically\n# referred to as X, Y in mathematical literature.\ndef _compute_covariance_matrix(\n    row_values: vector.Vec3Array,\n    col_values: vector.Vec3Array,\n    weights: jnp.ndarray,\n    epsilon=1e-6,\n) -> jnp.ndarray:\n  \"\"\"Compute covariance matrix.\n\n  The quantity computes is\n  cov_xy = weighted_avg_i(row_values[i, x] col_values[j, y]).\n  Here x and y run over the xyz coordinates.\n  This is used to construct frames when aligning points.\n\n  Args:\n    row_values: Values used for rows of covariance matrix, shape [..., n_point]\n    col_values: Values used for columns of covariance matrix, shape [...,\n      n_point]\n    weights: weights to weight points by, shape broacastable to [...]\n    epsilon: small value to add to denominator to avoid Nan's when all weights\n      are 0.\n\n  Returns:\n    Covariance Matrix as [..., 3, 3] array.\n  \"\"\"\n  weights = jnp.asarray(weights)\n  weights = 
jnp.broadcast_to(weights, row_values.shape)\n\n  out = []\n\n  normalized_weights = weights / (weights.sum(axis=-1, keepdims=True) + epsilon)\n\n  weighted_average = lambda x: jnp.sum(normalized_weights * x, axis=-1)\n\n  out.append(\n      jnp.stack(\n          (\n              weighted_average(row_values.x * col_values.x),\n              weighted_average(row_values.x * col_values.y),\n              weighted_average(row_values.x * col_values.z),\n          ),\n          axis=-1,\n      )\n  )\n\n  out.append(\n      jnp.stack(\n          (\n              weighted_average(row_values.y * col_values.x),\n              weighted_average(row_values.y * col_values.y),\n              weighted_average(row_values.y * col_values.z),\n          ),\n          axis=-1,\n      )\n  )\n\n  out.append(\n      jnp.stack(\n          (\n              weighted_average(row_values.z * col_values.x),\n              weighted_average(row_values.z * col_values.y),\n              weighted_average(row_values.z * col_values.z),\n          ),\n          axis=-1,\n      )\n  )\n\n  return jnp.stack(out, axis=-2)\n\n\n@struct_of_array.StructOfArray(same_dtype=True)\nclass Rigid3Array:\n  \"\"\"Rigid Transformation, i.e. 
element of special euclidean group.\"\"\"\n\n  rotation: rotation_matrix.Rot3Array\n  translation: vector.Vec3Array\n\n  def __matmul__(self, other: Self) -> Self:\n    new_rotation = self.rotation @ other.rotation\n    new_translation = self.apply_to_point(other.translation)\n    return Rigid3Array(new_rotation, new_translation)\n\n  def inverse(self) -> Self:\n    \"\"\"Return Rigid3Array corresponding to inverse transform.\"\"\"\n    inv_rotation = self.rotation.inverse()\n    inv_translation = inv_rotation.apply_to_point(-self.translation)\n    return Rigid3Array(inv_rotation, inv_translation)\n\n  def apply_to_point(self, point: vector.Vec3Array) -> vector.Vec3Array:\n    \"\"\"Apply Rigid3Array transform to point.\"\"\"\n    return self.rotation.apply_to_point(point) + self.translation\n\n  def apply_inverse_to_point(self, point: vector.Vec3Array) -> vector.Vec3Array:\n    \"\"\"Apply inverse Rigid3Array transform to point.\"\"\"\n    new_point = point - self.translation\n    return self.rotation.apply_inverse_to_point(new_point)\n\n  def compose_rotation(self, other_rotation: rotation_matrix.Rot3Array) -> Self:\n    rot = self.rotation @ other_rotation\n    trans = jax.tree.map(\n        lambda x: jnp.broadcast_to(x, rot.shape), self.translation\n    )\n    return Rigid3Array(rot, trans)\n\n  @classmethod\n  def identity(cls, shape: Any, dtype: jnp.dtype = jnp.float32) -> Self:\n    \"\"\"Return identity Rigid3Array of given shape.\"\"\"\n    return cls(\n        rotation_matrix.Rot3Array.identity(shape, dtype=dtype),\n        vector.Vec3Array.zeros(shape, dtype=dtype),\n    )  # pytype: disable=wrong-arg-count  # trace-all-classes\n\n  def scale_translation(self, factor: Float) -> Self:\n    \"\"\"Scale translation in Rigid3Array by 'factor'.\"\"\"\n    return Rigid3Array(self.rotation, self.translation * factor)\n\n  def to_array(self):\n    rot_array = self.rotation.to_array()\n    vec_array = self.translation.to_array()\n    return 
jnp.concatenate([rot_array, vec_array[..., None]], axis=-1)\n\n  @classmethod\n  def from_array(cls, array):\n    rot = rotation_matrix.Rot3Array.from_array(array[..., :3])\n    vec = vector.Vec3Array.from_array(array[..., -1])\n    return cls(rot, vec)  # pytype: disable=wrong-arg-count  # trace-all-classes\n\n  @classmethod\n  def from_array4x4(cls, array: jnp.ndarray) -> Self:\n    \"\"\"Construct Rigid3Array from homogeneous 4x4 array.\"\"\"\n    if array.shape[-2:] != (4, 4):\n      raise ValueError(f'array.shape({array.shape}) must be [..., 4, 4]')\n    rotation = rotation_matrix.Rot3Array(\n        *(array[..., 0, 0], array[..., 0, 1], array[..., 0, 2]),\n        *(array[..., 1, 0], array[..., 1, 1], array[..., 1, 2]),\n        *(array[..., 2, 0], array[..., 2, 1], array[..., 2, 2]),\n    )\n    translation = vector.Vec3Array(\n        array[..., 0, 3], array[..., 1, 3], array[..., 2, 3]\n    )\n    return cls(rotation, translation)  # pytype: disable=wrong-arg-count  # trace-all-classes\n\n  @classmethod\n  def from_point_alignment(\n      cls,\n      points_to: vector.Vec3Array,\n      points_from: vector.Vec3Array,\n      weights: Float | None = None,\n      epsilon: float = 1e-6,\n  ) -> Self:\n    \"\"\"Constructs Rigid3Array by finding transform aligning points.\n\n    This constructs the optimal Rigid Transform taking points_from to the\n    arrangement closest to points_to.\n\n    Args:\n      points_to: Points to align to.\n      points_from: Points to align from.\n      weights: weights for points.\n      epsilon: epsilon used to regularize covariance matrix.\n\n    Returns:\n      Rigid Transform.\n    \"\"\"\n    if weights is None:\n      weights = 1.0\n\n    def compute_center(value):\n      return utils.weighted_mean(value=value, weights=weights, axis=-1)\n\n    points_to_center = jax.tree.map(compute_center, points_to)\n    points_from_center = jax.tree.map(compute_center, points_from)\n    centered_points_to = points_to - 
points_to_center[..., None]\n    centered_points_from = points_from - points_from_center[..., None]\n    cov_mat = _compute_covariance_matrix(\n        centered_points_to,\n        centered_points_from,\n        weights=weights,\n        epsilon=epsilon,\n    )\n    rots = rotation_matrix.Rot3Array.from_svd(\n        jnp.reshape(cov_mat, cov_mat.shape[:-2] + (9,))\n    )\n\n    translations = points_to_center - rots.apply_to_point(points_from_center)\n\n    return cls(rots, translations)  # pytype: disable=wrong-arg-count  # trace-all-classes\n\n  def __getstate__(self):\n    return (VERSION, (self.rotation, self.translation))\n\n  def __setstate__(self, state):\n    version, (rot, trans) = state\n    del version\n    object.__setattr__(self, 'rotation', rot)\n    object.__setattr__(self, 'translation', trans)\n"
  },
  {
    "path": "src/alphafold3/jax/geometry/rotation_matrix.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Rot3Array Matrix Class.\"\"\"\n\nimport dataclasses\nfrom typing import Any, Final, Self\n\nfrom alphafold3.jax.geometry import struct_of_array\nfrom alphafold3.jax.geometry import utils\nfrom alphafold3.jax.geometry import vector\nimport jax\nimport jax.numpy as jnp\nimport numpy as np\n\n\nCOMPONENTS: Final[tuple[str, ...]] = (\n    *('xx', 'xy', 'xz'),\n    *('yx', 'yy', 'yz'),\n    *('zx', 'zy', 'zz'),\n)\nVERSION: Final[str] = '0.1'\n\n\ndef make_matrix_svd_factors() -> np.ndarray:\n  \"\"\"Generates factors for converting 3x3 matrix to symmetric 4x4 matrix.\"\"\"\n  factors = np.zeros((16, 9), dtype=np.float32)\n\n  factors[0, [0, 4, 8]] = 1.0\n\n  factors[[1, 4], 5] = 1.0\n  factors[[1, 4], 7] = -1.0\n\n  factors[[2, 8], 6] = 1.0\n  factors[[2, 8], 2] = -1.0\n\n  factors[[3, 12], 1] = 1.0\n  factors[[3, 12], 3] = -1.0\n\n  factors[5, 0] = 1.0\n  factors[5, [4, 8]] = -1.0\n\n  factors[[6, 9], 1] = 1.0\n  factors[[6, 9], 3] = 1.0\n\n  factors[[7, 13], 2] = 1.0\n  factors[[7, 13], 6] = 1.0\n\n  factors[10, 4] = 1.0\n  factors[10, [0, 8]] = -1.0\n\n  factors[[11, 14], 5] = 1.0\n  factors[[11, 14], 7] = 1.0\n\n  factors[15, 8] = 1.0\n  factors[15, [0, 4]] = -1.0\n\n  return factors\n\n\n@jax.custom_jvp\ndef largest_evec(m):\n  _, eigvecs = jnp.linalg.eigh(m)\n  return eigvecs[..., -1]\n\n\ndef largest_evec_jvp(primals, tangents):\n  \"\"\"jvp for largest eigenvector.\"\"\"\n  (m,) = primals\n  (t,) = tangents\n  
eigvals, eigvecs = jnp.linalg.eigh(m)\n  large_eigvec = eigvecs[..., -1]\n  large_eigval = eigvals[..., -1]\n  other_eigvals = eigvals[..., :-1]\n  other_eigvecs = eigvecs[..., :-1]\n  other_ev_times_tangent = jnp.einsum(\n      '...aj,...ab -> ...bj',\n      other_eigvecs,\n      t,\n      precision=jax.lax.Precision.HIGHEST,\n  )\n  nominator = jnp.einsum(\n      '...bj,...b -> ...j',\n      other_ev_times_tangent,\n      large_eigvec,\n      precision=jax.lax.Precision.HIGHEST,\n  )\n  prefactor = nominator / jnp.maximum(\n      large_eigval[..., None] - other_eigvals, 1e-6\n  )\n  grad = jnp.sum(prefactor[..., None, :] * other_eigvecs, axis=-1)\n  return large_eigvec, grad\n\n\nlargest_evec.defjvp(largest_evec_jvp)\n\n\nMATRIX_SVD_QUAT_FACTORS = make_matrix_svd_factors()\n\n\n@struct_of_array.StructOfArray(same_dtype=True)\nclass Rot3Array:\n  \"\"\"Rot3Array Matrix in 3 dimensional Space implemented as struct of arrays.\"\"\"\n\n  xx: jnp.ndarray = dataclasses.field(metadata={'dtype': jnp.float32})\n  xy: jnp.ndarray\n  xz: jnp.ndarray\n  yx: jnp.ndarray\n  yy: jnp.ndarray\n  yz: jnp.ndarray\n  zx: jnp.ndarray\n  zy: jnp.ndarray\n  zz: jnp.ndarray\n\n  __array_ufunc__ = None\n\n  def inverse(self) -> Self:\n    \"\"\"Returns inverse of Rot3Array.\"\"\"\n    return Rot3Array(\n        *(self.xx, self.yx, self.zx),\n        *(self.xy, self.yy, self.zy),\n        *(self.xz, self.yz, self.zz),\n    )\n\n  def apply_to_point(self, point: vector.Vec3Array) -> vector.Vec3Array:\n    \"\"\"Applies Rot3Array to point.\"\"\"\n    return vector.Vec3Array(\n        self.xx * point.x + self.xy * point.y + self.xz * point.z,\n        self.yx * point.x + self.yy * point.y + self.yz * point.z,\n        self.zx * point.x + self.zy * point.y + self.zz * point.z,\n    )\n\n  def apply_inverse_to_point(self, point: vector.Vec3Array) -> vector.Vec3Array:\n    \"\"\"Applies inverse Rot3Array to point.\"\"\"\n    return self.inverse().apply_to_point(point)\n\n  def __matmul__(self, 
other: Self) -> Self:\n    \"\"\"Composes two Rot3Arrays.\"\"\"\n    c0 = self.apply_to_point(vector.Vec3Array(other.xx, other.yx, other.zx))\n    c1 = self.apply_to_point(vector.Vec3Array(other.xy, other.yy, other.zy))\n    c2 = self.apply_to_point(vector.Vec3Array(other.xz, other.yz, other.zz))\n    return Rot3Array(c0.x, c1.x, c2.x, c0.y, c1.y, c2.y, c0.z, c1.z, c2.z)\n\n  @classmethod\n  def identity(cls, shape: Any, dtype: jnp.dtype = jnp.float32) -> Self:\n    \"\"\"Returns identity of given shape.\"\"\"\n    ones = jnp.ones(shape, dtype=dtype)\n    zeros = jnp.zeros(shape, dtype=dtype)\n    return cls(ones, zeros, zeros, zeros, ones, zeros, zeros, zeros, ones)  # pytype: disable=wrong-arg-count  # trace-all-classes\n\n  @classmethod\n  def from_two_vectors(cls, e0: vector.Vec3Array, e1: vector.Vec3Array) -> Self:\n    \"\"\"Construct Rot3Array from two Vectors.\n\n    Rot3Array is constructed such that in the corresponding frame 'e0' lies on\n    the positive x-Axis and 'e1' lies in the xy plane with positive sign of y.\n\n    Args:\n      e0: Vector\n      e1: Vector\n\n    Returns:\n      Rot3Array\n    \"\"\"\n    # Normalize the unit vector for the x-axis, e0.\n    e0 = e0.normalized()\n    # make e1 perpendicular to e0.\n    c = e1.dot(e0)\n    e1 = (e1 - c * e0).normalized()\n    # Compute e2 as cross product of e0 and e1.\n    e2 = e0.cross(e1)\n    return cls(e0.x, e1.x, e2.x, e0.y, e1.y, e2.y, e0.z, e1.z, e2.z)  # pytype: disable=wrong-arg-count  # trace-all-classes\n\n  @classmethod\n  def from_array(cls, array: jnp.ndarray) -> Self:\n    \"\"\"Construct Rot3Array Matrix from array of shape. 
[..., 3, 3].\"\"\"\n    unstacked = utils.unstack(array, axis=-2)\n    unstacked = sum([utils.unstack(x, axis=-1) for x in unstacked], [])\n    return cls(*unstacked)\n\n  def to_array(self) -> jnp.ndarray:\n    \"\"\"Convert Rot3Array to array of shape [..., 3, 3].\"\"\"\n    return jnp.stack(\n        [\n            jnp.stack([self.xx, self.xy, self.xz], axis=-1),\n            jnp.stack([self.yx, self.yy, self.yz], axis=-1),\n            jnp.stack([self.zx, self.zy, self.zz], axis=-1),\n        ],\n        axis=-2,\n    )\n\n  @classmethod\n  def from_quaternion(\n      cls,\n      w: jnp.ndarray,\n      x: jnp.ndarray,\n      y: jnp.ndarray,\n      z: jnp.ndarray,\n      normalize: bool = True,\n      epsilon: float = 1e-6,\n  ) -> Self:\n    \"\"\"Construct Rot3Array from components of quaternion.\"\"\"\n    if normalize:\n      inv_norm = jax.lax.rsqrt(jnp.maximum(epsilon, w**2 + x**2 + y**2 + z**2))\n      w *= inv_norm\n      x *= inv_norm\n      y *= inv_norm\n      z *= inv_norm\n    xx = 1 - 2 * (jnp.square(y) + jnp.square(z))\n    xy = 2 * (x * y - w * z)\n    xz = 2 * (x * z + w * y)\n    yx = 2 * (x * y + w * z)\n    yy = 1 - 2 * (jnp.square(x) + jnp.square(z))\n    yz = 2 * (y * z - w * x)\n    zx = 2 * (x * z - w * y)\n    zy = 2 * (y * z + w * x)\n    zz = 1 - 2 * (jnp.square(x) + jnp.square(y))\n    return cls(xx, xy, xz, yx, yy, yz, zx, zy, zz)  # pytype: disable=wrong-arg-count  # trace-all-classes\n\n  @classmethod\n  def from_svd(cls, mat: jnp.ndarray, use_quat_formula: bool = True) -> Self:\n    \"\"\"Constructs Rot3Array from arbitrary array of shape [3 * 3] using SVD.\n\n    The case when 'use_quat_formula' is True rephrases the problem of\n    projecting the matrix to a rotation matrix as a problem of finding the\n    largest eigenvector of a certain 4x4 matrix. 
This has the advantage of\n    having fewer numerical issues.\n    This approach follows:\n    https://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.65.971&rep=rep1&type=pdf\n    In the other case we construct it via svd following\n    https://arxiv.org/pdf/2006.14616.pdf\n    In that case [∂L/∂M] is large if the two smallest singular values are close\n    to each other, or if they are close to 0.\n\n    Args:\n      mat: Array of shape [..., 3 * 3]\n      use_quat_formula: Whether to construct matrix via 4x4 eigenvalue problem.\n\n    Returns:\n      Rot3Array of shape [...]\n    \"\"\"\n    assert mat.shape[-1] == 9\n    if use_quat_formula:\n      symmetric_4by4 = jnp.einsum(\n          'ji, ...i -> ...j',\n          MATRIX_SVD_QUAT_FACTORS,\n          mat,\n          precision=jax.lax.Precision.HIGHEST,\n      )\n      symmetric_4by4 = jnp.reshape(symmetric_4by4, mat.shape[:-1] + (4, 4))\n      largest_eigvec = largest_evec(symmetric_4by4)\n      return cls.from_quaternion(\n          *utils.unstack(largest_eigvec, axis=-1)\n      ).inverse()\n\n    else:\n      mat = jnp.reshape(mat, mat.shape[:-1] + (3, 3))\n      u, _, v_t = jnp.linalg.svd(mat, full_matrices=False)\n      det_uv_t = jnp.linalg.det(\n          jnp.matmul(u, v_t, precision=jax.lax.Precision.HIGHEST)\n      )\n      ones = jnp.ones_like(det_uv_t)\n      diag_array = jnp.stack([ones, ones, det_uv_t], axis=-1)\n      # This is equivalent to making diag_array into a diagonal array and matrix\n      # multiplying\n      diag_times_v_t = diag_array[..., None] * v_t\n      out = jnp.matmul(u, diag_times_v_t, precision=jax.lax.Precision.HIGHEST)\n      return cls.from_array(out)\n\n  @classmethod\n  def random_uniform(cls, key, shape, dtype=jnp.float32) -> Self:\n    \"\"\"Samples uniform random Rot3Array according to Haar Measure.\"\"\"\n    quat_array = jax.random.normal(key, tuple(shape) + (4,), dtype=dtype)\n    quats = utils.unstack(quat_array)\n    return cls.from_quaternion(*quats)\n\n  def 
__getstate__(self):\n    return (VERSION, [np.asarray(getattr(self, field)) for field in COMPONENTS])\n\n  def __setstate__(self, state):\n    version, state = state\n    del version\n    for i, field in enumerate(COMPONENTS):\n      object.__setattr__(self, field, state[i])\n"
  },
  {
    "path": "src/alphafold3/jax/geometry/struct_of_array.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Class decorator to represent (nested) struct of arrays.\"\"\"\n\nimport dataclasses\n\nimport jax\n\n\ndef get_item(instance, key):\n  sliced = {}\n  for field in get_array_fields(instance):\n    num_trailing_dims = field.metadata.get('num_trailing_dims', 0)\n    this_key = key\n    if isinstance(key, tuple) and Ellipsis in this_key:\n      this_key += (slice(None),) * num_trailing_dims\n    sliced[field.name] = jax.tree.map(\n        lambda x: x[this_key],  # pylint: disable=cell-var-from-loop\n        getattr(instance, field.name),\n    )\n  return dataclasses.replace(instance, **sliced)\n\n\n@property\ndef get_shape(instance):\n  \"\"\"Returns Shape for given instance of dataclass.\"\"\"\n  first_field = dataclasses.fields(instance)[0]\n  num_trailing_dims = first_field.metadata.get('num_trailing_dims', None)\n  value = getattr(instance, first_field.name)\n  if num_trailing_dims:\n    return value.shape[:-num_trailing_dims]\n  else:\n    return value.shape\n\n\ndef get_len(instance):\n  \"\"\"Returns length for given instance of dataclass.\"\"\"\n  shape = instance.shape\n  if shape:\n    return shape[0]\n  else:\n    raise TypeError('len() of unsized object')  # Match jax.numpy behavior.\n\n\n@property\ndef get_dtype(instance):\n  \"\"\"Returns Dtype for given instance of dataclass.\"\"\"\n  fields = dataclasses.fields(instance)\n  sets_dtype = [\n      field.name for field in fields if 
field.metadata.get('sets_dtype', False)\n  ]\n  if sets_dtype:\n    assert len(sets_dtype) == 1, 'at most field can set dtype'\n    field_value = getattr(instance, sets_dtype[0])\n  elif instance.same_dtype:\n    field_value = getattr(instance, fields[0].name)\n  else:\n    # Should this be Value Error?\n    raise AttributeError(\n        'Trying to access Dtype on Struct of Array without'\n        'either \"same_dtype\" or field setting dtype'\n    )\n\n  if hasattr(field_value, 'dtype'):\n    return field_value.dtype\n  else:\n    # Should this be Value Error?\n    raise AttributeError(f'field_value {field_value} does not have dtype')\n\n\ndef replace(instance, **kwargs):\n  return dataclasses.replace(instance, **kwargs)\n\n\ndef post_init(instance):\n  \"\"\"Validate instance has same shapes & dtypes.\"\"\"\n  array_fields = get_array_fields(instance)\n  arrays = list(get_array_fields(instance, return_values=True).values())\n  first_field = array_fields[0]\n  # These slightly weird constructions about checking whether the leaves are\n  # actual arrays is since e.g. 
vmap internally relies on being able to\n  # construct pytree's with object() as leaves, this would break the checking\n  # as such we are only validating the object when the entries in the dataclass\n  # Are arrays or other dataclasses of arrays.\n  try:\n    dtype = instance.dtype\n  except AttributeError:\n    dtype = None\n  if dtype is not None:\n    first_shape = instance.shape\n    for array, field in zip(arrays, array_fields, strict=True):\n      num_trailing_dims = field.metadata.get('num_trailing_dims', None)\n      if num_trailing_dims:\n        array_shape = array.shape\n        field_shape = array_shape[:-num_trailing_dims]\n        msg = (\n            f'field {field} should have number of trailing dims'\n            ' {num_trailing_dims}'\n        )\n        assert len(array_shape) == len(first_shape) + num_trailing_dims, msg\n      else:\n        field_shape = array.shape\n\n      shape_msg = (\n          f\"Stripped Shape {field_shape} of field {field} doesn't \"\n          f'match shape {first_shape} of field {first_field}'\n      )\n      assert field_shape == first_shape, shape_msg\n\n      field_dtype = array.dtype\n\n      allowed_metadata_dtypes = field.metadata.get('allowed_dtypes', [])\n      if allowed_metadata_dtypes:\n        msg = f'Dtype is {field_dtype} but must be in {allowed_metadata_dtypes}'\n        assert field_dtype in allowed_metadata_dtypes, msg\n\n      if 'dtype' in field.metadata:\n        target_dtype = field.metadata['dtype']\n      else:\n        target_dtype = dtype\n\n      msg = f'Dtype is {field_dtype} but must be {target_dtype}'\n      assert field_dtype == target_dtype, msg\n\n\ndef flatten(instance):\n  \"\"\"Flatten Struct of Array instance.\"\"\"\n  array_likes = get_array_fields(instance, return_values=True).values()\n  flat_array_likes = []\n  inner_treedefs = []\n  num_arrays = []\n  for array_like in array_likes:\n    flat_array_like, inner_treedef = jax.tree_util.tree_flatten(array_like)\n    
inner_treedefs.append(inner_treedef)\n    flat_array_likes += flat_array_like\n    num_arrays.append(len(flat_array_like))\n  metadata = get_metadata_fields(instance, return_values=True)\n  metadata = type(instance).metadata_cls(**metadata)\n  return flat_array_likes, (inner_treedefs, metadata, num_arrays)\n\n\ndef make_metadata_class(cls):\n  metadata_fields = get_fields(\n      cls, lambda x: x.metadata.get('is_metadata', False)\n  )\n  metadata_cls = dataclasses.make_dataclass(\n      cls_name='Meta' + cls.__name__,\n      fields=[(field.name, field.type, field) for field in metadata_fields],\n      frozen=True,\n      eq=True,\n  )\n  return metadata_cls\n\n\ndef get_fields(cls_or_instance, filterfn, return_values=False):\n  fields = dataclasses.fields(cls_or_instance)\n  fields = [field for field in fields if filterfn(field)]\n  if return_values:\n    return {\n        field.name: getattr(cls_or_instance, field.name) for field in fields\n    }\n  else:\n    return fields\n\n\ndef get_array_fields(cls, return_values=False):\n  return get_fields(\n      cls,\n      lambda x: not x.metadata.get('is_metadata', False),\n      return_values=return_values,\n  )\n\n\ndef get_metadata_fields(cls, return_values=False):\n  return get_fields(\n      cls,\n      lambda x: x.metadata.get('is_metadata', False),\n      return_values=return_values,\n  )\n\n\nclass StructOfArray:\n  \"\"\"Class Decorator for Struct Of Arrays.\"\"\"\n\n  def __init__(self, same_dtype=True):\n    self.same_dtype = same_dtype\n\n  def __call__(self, cls):\n    cls.__array_ufunc__ = None\n    cls.replace = replace\n    cls.same_dtype = self.same_dtype\n    cls.dtype = get_dtype\n    cls.shape = get_shape\n    cls.__len__ = get_len\n    cls.__getitem__ = get_item\n    cls.__post_init__ = post_init\n    new_cls = dataclasses.dataclass(cls, frozen=True, eq=False)  # pytype: disable=wrong-keyword-args\n    # pytree claims to require metadata to be hashable, not sure why,\n    # But making derived 
dataclass that can just hold metadata\n    new_cls.metadata_cls = make_metadata_class(new_cls)\n\n    def unflatten(aux, data):\n      inner_treedefs, metadata, num_arrays = aux\n      array_fields = [field.name for field in get_array_fields(new_cls)]\n      value_dict = {}\n      array_start = 0\n      for num_array, inner_treedef, array_field in zip(\n          num_arrays, inner_treedefs, array_fields, strict=True\n      ):\n        value_dict[array_field] = jax.tree_util.tree_unflatten(\n            inner_treedef, data[array_start : array_start + num_array]\n        )\n        array_start += num_array\n      metadata_fields = get_metadata_fields(new_cls)\n      for field in metadata_fields:\n        value_dict[field.name] = getattr(metadata, field.name)\n\n      return new_cls(**value_dict)\n\n    jax.tree_util.register_pytree_node(\n        nodetype=new_cls, flatten_func=flatten, unflatten_func=unflatten\n    )\n    return new_cls\n"
  },
  {
    "path": "src/alphafold3/jax/geometry/utils.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Utils for geometry library.\"\"\"\n\nfrom collections.abc import Iterable\nimport numbers\n\nimport jax.numpy as jnp\n\n\ndef unstack(value: jnp.ndarray, axis: int = -1) -> list[jnp.ndarray]:\n  return [\n      jnp.squeeze(v, axis=axis)\n      for v in jnp.split(value, value.shape[axis], axis=axis)\n  ]\n\n\ndef angdiff(alpha: jnp.ndarray, beta: jnp.ndarray) -> jnp.ndarray:\n  \"\"\"Compute the signed difference between two angles, wrapped to [-pi, pi).\"\"\"\n  d = alpha - beta\n  d = (d + jnp.pi) % (2 * jnp.pi) - jnp.pi\n  return d\n\n\ndef weighted_mean(\n    *,\n    weights: jnp.ndarray,\n    value: jnp.ndarray,\n    axis: int | Iterable[int] | None = None,\n    eps: float = 1e-10,\n) -> jnp.ndarray:\n  \"\"\"Computes weighted mean in a safe way that avoids NaNs.\n\n  This is equivalent to jnp.average for the case eps=0.0, but adds a small\n  constant to the denominator of the weighted average to avoid NaNs.\n  'weights' should be broadcastable to the shape of value.\n\n  Args:\n    weights: Weights to weight value by.\n    value: Values to average.\n    axis: Axes to average over.\n    eps: Epsilon to add to the denominator.\n\n  Returns:\n    Weighted average.\n  \"\"\"\n\n  weights = jnp.asarray(weights, dtype=value.dtype)\n  weights = jnp.broadcast_to(weights, value.shape)\n\n  weights_shape = weights.shape\n\n  if isinstance(axis, numbers.Integral):\n    axis = [axis]\n  elif axis is None:\n    axis = 
list(range(len(weights_shape)))\n\n  return jnp.sum(weights * value, axis=axis) / (\n      jnp.sum(weights, axis=axis) + eps\n  )\n"
  },
  {
    "path": "src/alphafold3/jax/geometry/vector.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Vec3Array Class.\"\"\"\n\nimport dataclasses\nfrom typing import Final, Self, TypeAlias\n\nfrom alphafold3.jax.geometry import struct_of_array\nfrom alphafold3.jax.geometry import utils\nimport jax\nimport jax.numpy as jnp\nimport numpy as np\n\n\nFloat: TypeAlias = float | jnp.ndarray\n\nVERSION: Final[str] = '0.1'\n\n\n@struct_of_array.StructOfArray(same_dtype=True)\nclass Vec3Array:\n  \"\"\"Vec3Array in 3 dimensional Space implemented as struct of arrays.\n\n  This is done in order to improve performance and precision.\n  On TPU small matrix multiplications are very suboptimal and will waste large\n  compute resources; furthermore any matrix multiplication on TPU happens in\n  mixed bfloat16/float32 precision, which is often undesirable when handling\n  physical coordinates.\n\n  In most cases this will also be faster on CPUs/GPUs since it allows for easier\n  use of vector instructions.\n  \"\"\"\n\n  x: jnp.ndarray = dataclasses.field(metadata={'dtype': jnp.float32})\n  y: jnp.ndarray\n  z: jnp.ndarray\n\n  def __post_init__(self):\n    if hasattr(self.x, 'dtype'):\n      if not self.x.dtype == self.y.dtype == self.z.dtype:\n        raise ValueError(\n            f'Type mismatch: {self.x.dtype}, {self.y.dtype}, {self.z.dtype}'\n        )\n      if not self.x.shape == self.y.shape == self.z.shape:\n        raise ValueError(\n            f'Shape mismatch: {self.x.shape}, {self.y.shape}, {self.z.shape}'\n        
)\n\n  def __add__(self, other: Self) -> Self:\n    return jax.tree.map(lambda x, y: x + y, self, other)\n\n  def __sub__(self, other: Self) -> Self:\n    return jax.tree.map(lambda x, y: x - y, self, other)\n\n  def __mul__(self, other: Float) -> Self:\n    return jax.tree.map(lambda x: x * other, self)\n\n  def __rmul__(self, other: Float) -> Self:\n    return self * other\n\n  def __truediv__(self, other: Float) -> Self:\n    return jax.tree.map(lambda x: x / other, self)\n\n  def __neg__(self) -> Self:\n    return jax.tree.map(lambda x: -x, self)\n\n  def __pos__(self) -> Self:\n    return jax.tree.map(lambda x: x, self)\n\n  def cross(self, other: Self) -> Self:\n    \"\"\"Compute cross product between 'self' and 'other'.\"\"\"\n    new_x = self.y * other.z - self.z * other.y\n    new_y = self.z * other.x - self.x * other.z\n    new_z = self.x * other.y - self.y * other.x\n    return Vec3Array(new_x, new_y, new_z)\n\n  def dot(self, other: Self) -> Float:\n    \"\"\"Compute dot product between 'self' and 'other'.\"\"\"\n    return self.x * other.x + self.y * other.y + self.z * other.z\n\n  def norm(self, epsilon: float = 1e-6) -> Float:\n    \"\"\"Compute Norm of Vec3Array, clipped to epsilon.\"\"\"\n    # To avoid NaN on the backward pass, we must use maximum before the sqrt\n    norm2 = self.dot(self)\n    if epsilon:\n      norm2 = jnp.maximum(norm2, epsilon**2)\n    return jnp.sqrt(norm2)\n\n  def norm2(self):\n    return self.dot(self)\n\n  def normalized(self, epsilon: float = 1e-6) -> Self:\n    \"\"\"Return unit vector with optional clipping.\"\"\"\n    return self / self.norm(epsilon)\n\n  @classmethod\n  def zeros(cls, shape, dtype=jnp.float32):\n    \"\"\"Return Vec3Array corresponding to zeros of given shape.\"\"\"\n    return cls(\n        jnp.zeros(shape, dtype),\n        jnp.zeros(shape, dtype),\n        jnp.zeros(shape, dtype),\n    )  # pytype: disable=wrong-arg-count  # trace-all-classes\n\n  def to_array(self) -> jnp.ndarray:\n    return 
jnp.stack([self.x, self.y, self.z], axis=-1)\n\n  @classmethod\n  def from_array(cls, array):\n    return cls(*utils.unstack(array))\n\n  def __getstate__(self):\n    return (\n        VERSION,\n        [np.asarray(self.x), np.asarray(self.y), np.asarray(self.z)],\n    )\n\n  def __setstate__(self, state):\n    version, state = state\n    del version\n    for i, letter in enumerate('xyz'):\n      object.__setattr__(self, letter, state[i])\n\n\ndef square_euclidean_distance(\n    vec1: Vec3Array, vec2: Vec3Array, epsilon: float = 1e-6\n) -> Float:\n  \"\"\"Computes square of euclidean distance between 'vec1' and 'vec2'.\n\n  Args:\n    vec1: Vec3Array to compute  distance to\n    vec2: Vec3Array to compute  distance from, should be broadcast compatible\n      with 'vec1'\n    epsilon: distance is clipped from below to be at least epsilon\n\n  Returns:\n    Array of square euclidean distances;\n    shape will be result of broadcasting 'vec1' and 'vec2'\n  \"\"\"\n  difference = vec1 - vec2\n  distance = difference.dot(difference)\n  if epsilon:\n    distance = jnp.maximum(distance, epsilon)\n  return distance\n\n\ndef dot(vector1: Vec3Array, vector2: Vec3Array) -> Float:\n  return vector1.dot(vector2)\n\n\ndef cross(vector1: Vec3Array, vector2: Vec3Array) -> Float:\n  return vector1.cross(vector2)\n\n\ndef norm(vector: Vec3Array, epsilon: float = 1e-6) -> Float:\n  return vector.norm(epsilon)\n\n\ndef normalized(vector: Vec3Array, epsilon: float = 1e-6) -> Vec3Array:\n  return vector.normalized(epsilon)\n\n\ndef euclidean_distance(\n    vec1: Vec3Array, vec2: Vec3Array, epsilon: float = 1e-6\n) -> Float:\n  \"\"\"Computes euclidean distance between 'vec1' and 'vec2'.\n\n  Args:\n    vec1: Vec3Array to compute euclidean distance to\n    vec2: Vec3Array to compute euclidean distance from, should be broadcast\n      compatible with 'vec1'\n    epsilon: distance is clipped from below to be at least epsilon\n\n  Returns:\n    Array of euclidean distances;\n    shape will 
be result of broadcasting 'vec1' and 'vec2'\n  \"\"\"\n  distance_sq = square_euclidean_distance(vec1, vec2, epsilon**2)\n  distance = jnp.sqrt(distance_sq)\n  return distance\n\n\ndef dihedral_angle(\n    a: Vec3Array, b: Vec3Array, c: Vec3Array, d: Vec3Array\n) -> Float:\n  \"\"\"Computes torsion angle for a quadruple of points.\n\n  For points (a, b, c, d), this is the angle between the planes defined by\n  points (a, b, c) and (b, c, d). It is also known as the dihedral angle.\n\n  Arguments:\n    a: A Vec3Array of coordinates.\n    b: A Vec3Array of coordinates.\n    c: A Vec3Array of coordinates.\n    d: A Vec3Array of coordinates.\n\n  Returns:\n    A tensor of angles in radians: [-pi, pi].\n  \"\"\"\n  v1 = a - b\n  v2 = b - c\n  v3 = d - c\n\n  c1 = v1.cross(v2)\n  c2 = v3.cross(v2)\n  c3 = c2.cross(c1)\n\n  v2_mag = v2.norm()\n  return jnp.arctan2(c3.dot(v2), v2_mag * c1.dot(c2))\n\n\ndef random_gaussian_vector(shape, key, dtype=jnp.float32) -> Vec3Array:\n  vec_array = jax.random.normal(key, shape + (3,), dtype)\n  return Vec3Array.from_array(vec_array)\n"
  },
  {
    "path": "src/alphafold3/model/atom_layout/atom_layout.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Helper functions for different atom layouts and conversion between them.\"\"\"\n\nimport collections\nfrom collections.abc import Mapping, Sequence\nimport dataclasses\nimport types\nfrom typing import Any, TypeAlias\n\nfrom alphafold3 import structure\nfrom alphafold3.constants import atom_types\nfrom alphafold3.constants import chemical_component_sets\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.constants import residue_names\nfrom alphafold3.data.tools import rdkit_utils\nfrom alphafold3.structure import chemical_components as struc_chem_comps\nimport jax.numpy as jnp\nimport numpy as np\nfrom rdkit import Chem\n\n\nxnp_ndarray: TypeAlias = np.ndarray | jnp.ndarray  # pylint: disable=invalid-name\nNumpyIndex: TypeAlias = Any\n\n\n@dataclasses.dataclass(frozen=True)\nclass AtomLayout:\n  \"\"\"Atom layout in a fixed shape (usually 1-dim or 2-dim).\n\n  Examples for atom layouts are atom37, atom14, and similar.\n  All members are np.ndarrays with the same shape, e.g.\n  - [num_atoms]\n  - [num_residues, max_atoms_per_residue]\n  - [num_fragments, max_fragments_per_residue]\n  All string arrays should have dtype=object to avoid pitfalls with Numpy's\n  fixed-size strings\n\n  Attributes:\n    atom_name: np.ndarray of str: atom names (e.g. 
'CA', 'NE2'), padding\n      elements have an empty string (''), None or any other value, that maps to\n      False for .astype(bool). mmCIF field: _atom_site.label_atom_id.\n    res_id: np.ndarray of int: residue index (usually starting from 1) padding\n      elements can have an arbitrary value. mmCIF field:\n      _atom_site.label_seq_id.\n    chain_id: np.ndarray of str: chain names (e.g. 'A', 'B') padding elements\n      can have an arbitrary value. mmCIF field: _atom_site.label_asym_id.\n    atom_element: np.ndarray of str: atom elements (e.g. 'C', 'N', 'O'), padding\n      elements have an empty string (''), None or any other value, that maps to\n      False for .astype(bool). mmCIF field: _atom_site.type_symbol.\n    res_name: np.ndarray of str: residue names (e.g. 'ARG', 'TRP') padding\n      elements can have an arbitrary value. mmCIF field:\n      _atom_site.label_comp_id.\n    chain_type: np.ndarray of str: chain types (e.g. 'polypeptide(L)'). padding\n      elements can have an arbitrary value. 
mmCIF field: _entity_poly.type OR\n      _entity.type (for non-polymers).\n    shape: shape of the layout (just returns atom_name.shape)\n  \"\"\"\n\n  atom_name: np.ndarray\n  res_id: np.ndarray\n  chain_id: np.ndarray\n  atom_element: np.ndarray | None = None\n  res_name: np.ndarray | None = None\n  chain_type: np.ndarray | None = None\n\n  def __post_init__(self):\n    \"\"\"Assert all arrays have the same shape.\"\"\"\n    attribute_names = (\n        'atom_name',\n        'atom_element',\n        'res_name',\n        'res_id',\n        'chain_id',\n        'chain_type',\n    )\n    _assert_all_arrays_have_same_shape(\n        obj=self,\n        expected_shape=self.atom_name.shape,\n        attribute_names=attribute_names,\n    )\n    # atom_name must have dtype object, such that we can convert it to bool to\n    # obtain the mask\n    if self.atom_name.dtype != object:\n      raise ValueError(\n          'atom_name must have dtype object, such that it can '\n          'be converted converted to bool to obtain the mask'\n      )\n\n  def __getitem__(self, key: NumpyIndex) -> 'AtomLayout':\n    return AtomLayout(\n        atom_name=self.atom_name[key],\n        res_id=self.res_id[key],\n        chain_id=self.chain_id[key],\n        atom_element=(\n            self.atom_element[key] if self.atom_element is not None else None\n        ),\n        res_name=(self.res_name[key] if self.res_name is not None else None),\n        chain_type=(\n            self.chain_type[key] if self.chain_type is not None else None\n        ),\n    )\n\n  def __eq__(self, other: 'AtomLayout') -> bool:\n    if not np.array_equal(self.atom_name, other.atom_name):\n      return False\n\n    mask = self.atom_name.astype(bool)\n    # Check essential fields.\n    for field in ('res_id', 'chain_id'):\n      my_arr = getattr(self, field)\n      other_arr = getattr(other, field)\n      if not np.array_equal(my_arr[mask], other_arr[mask]):\n        return False\n\n    # Check optional fields.\n  
  for field in ('atom_element', 'res_name', 'chain_type'):\n      my_arr = getattr(self, field)\n      other_arr = getattr(other, field)\n      if (\n          my_arr is not None\n          and other_arr is not None\n          and not np.array_equal(my_arr[mask], other_arr[mask])\n      ):\n        return False\n\n    return True\n\n  def copy_and_pad_to(self, shape: tuple[int, ...]) -> 'AtomLayout':\n    \"\"\"Copies and pads the layout to the requested shape.\n\n    Args:\n      shape: new shape for the atom layout\n\n    Returns:\n      a copy of the atom layout padded to the requested shape\n\n    Raises:\n      ValueError: incompatible shapes.\n    \"\"\"\n    if len(shape) != len(self.atom_name.shape):\n      raise ValueError(\n          f'Incompatible shape {shape}. Current layout has shape {self.shape}.'\n      )\n    if any(new < old for old, new in zip(self.atom_name.shape, shape)):\n      raise ValueError(\n          \"Can't pad to a smaller shape. Current layout has shape \"\n          f'{self.shape} and you requested shape {shape}.'\n      )\n    pad_width = [\n        (0, new - old) for old, new in zip(self.atom_name.shape, shape)\n    ]\n    pad_val = np.array('', dtype=object)\n    return AtomLayout(\n        atom_name=np.pad(self.atom_name, pad_width, constant_values=pad_val),\n        res_id=np.pad(self.res_id, pad_width, constant_values=0),\n        chain_id=np.pad(self.chain_id, pad_width, constant_values=pad_val),\n        atom_element=(\n            np.pad(self.atom_element, pad_width, constant_values=pad_val)\n            if self.atom_element is not None\n            else None\n        ),\n        res_name=(\n            np.pad(self.res_name, pad_width, constant_values=pad_val)\n            if self.res_name is not None\n            else None\n        ),\n        chain_type=(\n            np.pad(self.chain_type, pad_width, constant_values=pad_val)\n            if self.chain_type is not None\n            else None\n        ),\n    )\n\n  def 
to_array(self) -> np.ndarray:\n    \"\"\"Stacks the fields to a numpy array with shape (6, <layout_shape>).\n\n    Creates a pure numpy array of type `object` by stacking the 6 fields of the\n    AtomLayout, i.e. (atom_name, atom_element, res_name, res_id, chain_id,\n    chain_type). This method together with from_array() provides an easy way to\n    apply pure numpy methods like np.concatenate() to `AtomLayout`s.\n\n    Returns:\n      np.ndarray of object with shape (6, <layout_shape>), e.g.\n      array([['N', 'CA', 'C', ..., 'CB', 'CG', 'CD'],\n       ['N', 'C', 'C', ..., 'C', 'C', 'C'],\n       ['LEU', 'LEU', 'LEU', ..., 'PRO', 'PRO', 'PRO'],\n       [1, 1, 1, ..., 403, 403, 403],\n       ['A', 'A', 'A', ..., 'D', 'D', 'D'],\n       ['polypeptide(L)', 'polypeptide(L)', ..., 'polypeptide(L)']],\n      dtype=object)\n    \"\"\"\n    if (\n        self.atom_element is None\n        or self.res_name is None\n        or self.chain_type is None\n    ):\n      raise ValueError('All optional fields need to be present.')\n\n    return np.stack(dataclasses.astuple(self), axis=0)\n\n  @classmethod\n  def from_array(cls, arr: np.ndarray) -> 'AtomLayout':\n    \"\"\"Creates an AtomLayout object from a numpy array with shape (6, ...).\n\n    see also to_array()\n    Args:\n      arr: np.ndarray of object with shape (6, <layout_shape>)\n\n    Returns:\n      AtomLayout object with shape (<layout_shape>)\n    \"\"\"\n    if arr.shape[0] != 6:\n      raise ValueError(\n          'Given array must have shape (6, ...) to match the 6 fields of '\n          'AtomLayout (atom_name, atom_element, res_name, res_id, chain_id, '\n          f'chain_type). Your array has {arr.shape=}'\n      )\n    return cls(*arr)\n\n  @property\n  def shape(self) -> tuple[int, ...]:\n    return self.atom_name.shape\n\n\n@dataclasses.dataclass(frozen=True)\nclass Residues:\n  \"\"\"List of residues with meta data.\n\n  Attributes:\n    res_name: np.ndarray of str [num_res], e.g. 
'ARG', 'TRP'\n    res_id: np.ndarray of int [num_res]\n    chain_id: np.ndarray of str [num_res], e.g. 'A', 'B'\n    chain_type: np.ndarray of str [num_res], e.g. 'polypeptide(L)'\n    is_start_terminus: np.ndarray of bool [num_res]\n    is_end_terminus: np.ndarray of bool [num_res]\n    deprotonation: (optional) np.ndarray of set() [num_res], e.g. {'HD1', 'HE2'}\n    smiles_string: (optional) np.ndarray of str [num_res], e.g. 'Cc1ccccc1'\n    shape: shape of the layout (just returns res_name.shape)\n  \"\"\"\n\n  res_name: np.ndarray\n  res_id: np.ndarray\n  chain_id: np.ndarray\n  chain_type: np.ndarray\n  is_start_terminus: np.ndarray\n  is_end_terminus: np.ndarray\n  deprotonation: np.ndarray | None = None\n  smiles_string: np.ndarray | None = None\n\n  def __post_init__(self):\n    \"\"\"Assert all arrays are 1D have the same shape.\"\"\"\n    attribute_names = (\n        'res_name',\n        'res_id',\n        'chain_id',\n        'chain_type',\n        'is_start_terminus',\n        'is_end_terminus',\n        'deprotonation',\n        'smiles_string',\n    )\n    _assert_all_arrays_have_same_shape(\n        obj=self,\n        expected_shape=(self.res_name.shape[0],),\n        attribute_names=attribute_names,\n    )\n\n  def __getitem__(self, key: NumpyIndex) -> 'Residues':\n    return Residues(\n        res_name=self.res_name[key],\n        res_id=self.res_id[key],\n        chain_id=self.chain_id[key],\n        chain_type=self.chain_type[key],\n        is_start_terminus=self.is_start_terminus[key],\n        is_end_terminus=self.is_end_terminus[key],\n        deprotonation=(\n            self.deprotonation[key] if self.deprotonation is not None else None\n        ),\n        smiles_string=(\n            self.smiles_string[key] if self.smiles_string is not None else None\n        ),\n    )\n\n  def __eq__(self, other: 'Residues') -> bool:\n    return all(\n        np.array_equal(getattr(self, field.name), getattr(other, field.name))\n        for field in 
dataclasses.fields(self)\n    )\n\n  @property\n  def shape(self) -> tuple[int, ...]:\n    return self.res_name.shape\n\n\n@dataclasses.dataclass(frozen=True)\nclass GatherInfo:\n  \"\"\"Gather indices to translate from one atom layout to another.\n\n  All members are np or jnp ndarray (usually 1-dim or 2-dim) with the same\n  shape, e.g.\n  - [num_atoms]\n  - [num_residues, max_atoms_per_residue]\n  - [num_fragments, max_fragments_per_residue]\n\n  Attributes:\n    gather_idxs: np or jnp ndarray of int: gather indices into a flattened array\n    gather_mask: np or jnp ndarray of bool: mask for resulting array\n    input_shape: np or jnp ndarray of int: the shape of the unflattened input\n      array\n    shape: output shape. Just returns gather_idxs.shape\n  \"\"\"\n\n  gather_idxs: xnp_ndarray\n  gather_mask: xnp_ndarray\n  input_shape: xnp_ndarray\n\n  def __post_init__(self):\n    if self.gather_mask.shape != self.gather_idxs.shape:\n      raise ValueError(\n          'All arrays must have the same shape. 
Got\\n'\n          f'gather_idxs.shape = {self.gather_idxs.shape}\\n'\n          f'gather_mask.shape = {self.gather_mask.shape}\\n'\n      )\n\n  def __getitem__(self, key: NumpyIndex) -> 'GatherInfo':\n    return GatherInfo(\n        gather_idxs=self.gather_idxs[key],\n        gather_mask=self.gather_mask[key],\n        input_shape=self.input_shape,\n    )\n\n  @property\n  def shape(self) -> tuple[int, ...]:\n    return self.gather_idxs.shape\n\n  def as_np_or_jnp(self, xnp: types.ModuleType) -> 'GatherInfo':\n    return GatherInfo(\n        gather_idxs=xnp.array(self.gather_idxs),\n        gather_mask=xnp.array(self.gather_mask),\n        input_shape=xnp.array(self.input_shape),\n    )\n\n  def as_dict(\n      self,\n      key_prefix: str | None = None,\n  ) -> dict[str, xnp_ndarray]:\n    prefix = f'{key_prefix}:' if key_prefix else ''\n    return {\n        prefix + 'gather_idxs': self.gather_idxs,\n        prefix + 'gather_mask': self.gather_mask,\n        prefix + 'input_shape': self.input_shape,\n    }\n\n  @classmethod\n  def from_dict(\n      cls,\n      d: Mapping[str, xnp_ndarray],\n      key_prefix: str | None = None,\n  ) -> 'GatherInfo':\n    \"\"\"Creates GatherInfo from a given dictionary.\"\"\"\n    prefix = f'{key_prefix}:' if key_prefix else ''\n    return cls(\n        gather_idxs=d[prefix + 'gather_idxs'],\n        gather_mask=d[prefix + 'gather_mask'],\n        input_shape=d[prefix + 'input_shape'],\n    )\n\n\ndef fill_in_optional_fields(\n    minimal_atom_layout: AtomLayout,\n    reference_atoms: AtomLayout,\n) -> AtomLayout:\n  \"\"\"Fill in the optional fields (atom_element, res_name, chain_type).\n\n  Extracts the optional fields (atom_element, res_name, chain_type) from a\n  flat reference layout and fills them into the fields from this layout.\n\n  Args:\n    minimal_atom_layout: An AtomLayout that only contains the essential fields\n      (atom_name, res_id, chain_id).\n    reference_atoms: A flat layout that contains all fields for 
all atoms.\n\n  Returns:\n    An AtomLayout that contains all fields.\n\n  Raises:\n    ValueError: Reference atoms layout is not flat.\n    ValueError: Missing atoms in reference.\n  \"\"\"\n  if len(reference_atoms.shape) > 1:\n    raise ValueError('Only flat layouts are supported as reference.')\n  ref_to_self = compute_gather_idxs(\n      source_layout=reference_atoms, target_layout=minimal_atom_layout\n  )\n  atom_mask = minimal_atom_layout.atom_name.astype(bool)\n  missing_atoms_mask = atom_mask & ~ref_to_self.gather_mask\n  if np.any(missing_atoms_mask):\n    raise ValueError(\n        f'{np.sum(missing_atoms_mask)} missing atoms in reference: '\n        f'{minimal_atom_layout[missing_atoms_mask]}'\n    )\n\n  def _convert_str_array(gather: GatherInfo, arr: np.ndarray):\n    output = arr[gather.gather_idxs]\n    output[~gather.gather_mask] = ''\n    return output\n\n  return dataclasses.replace(\n      minimal_atom_layout,\n      atom_element=_convert_str_array(\n          ref_to_self, reference_atoms.atom_element\n      ),\n      res_name=_convert_str_array(ref_to_self, reference_atoms.res_name),\n      chain_type=_convert_str_array(ref_to_self, reference_atoms.chain_type),\n  )\n\n\ndef guess_deprotonation(residues: Residues) -> Residues:\n  \"\"\"Convenience function to create a plausible deprotonation field.\n\n  Assumes a pH of 7 and always prefers HE2 over HD1 for HIS.\n  Args:\n    residues: a Residues object without a depronotation field\n\n  Returns:\n    a Residues object with a depronotation field\n  \"\"\"\n  num_residues = residues.res_name.shape[0]\n  deprotonation = np.empty(num_residues, dtype=object)\n  deprotonation_at_ph7 = {\n      'ASP': 'HD2',\n      'GLU': 'HE2',\n      'HIS': 'HD1',\n  }\n  for idx, res_name in enumerate(residues.res_name):\n    deprotonation[idx] = set()\n    if res_name in deprotonation_at_ph7:\n      deprotonation[idx].add(deprotonation_at_ph7[res_name])\n    if residues.is_end_terminus[idx]:\n      
deprotonation[idx].add('HXT')\n\n  return dataclasses.replace(residues, deprotonation=deprotonation)\n\n\ndef atom_layout_from_structure(\n    struct: structure.Structure,\n    *,\n    fix_non_standard_polymer_res: bool = False,\n) -> AtomLayout:\n  \"\"\"Extract AtomLayout from a Structure.\"\"\"\n\n  if not fix_non_standard_polymer_res:\n    return AtomLayout(\n        atom_name=np.array(struct.atom_name, dtype=object),\n        atom_element=np.array(struct.atom_element, dtype=object),\n        res_name=np.array(struct.res_name, dtype=object),\n        res_id=np.array(struct.res_id, dtype=int),\n        chain_id=np.array(struct.chain_id, dtype=object),\n        chain_type=np.array(struct.chain_type, dtype=object),\n    )\n\n  # Target lists.\n  target_atom_names = []\n  target_atom_elements = []\n  target_res_ids = []\n  target_res_names = []\n  target_chain_ids = []\n  target_chain_types = []\n\n  for atom in struct.iter_atoms():\n    target_atom_names.append(atom['atom_name'])\n    target_atom_elements.append(atom['atom_element'])\n    target_res_ids.append(atom['res_id'])\n    target_chain_ids.append(atom['chain_id'])\n    target_chain_types.append(atom['chain_type'])\n    if mmcif_names.is_standard_polymer_type(atom['chain_type']):\n      fixed_res_name = mmcif_names.fix_non_standard_polymer_res(\n          res_name=atom['res_name'], chain_type=atom['chain_type']\n      )\n      target_res_names.append(fixed_res_name)\n    else:\n      target_res_names.append(atom['res_name'])\n\n  return AtomLayout(\n      atom_name=np.array(target_atom_names, dtype=object),\n      atom_element=np.array(target_atom_elements, dtype=object),\n      res_name=np.array(target_res_names, dtype=object),\n      res_id=np.array(target_res_ids, dtype=int),\n      chain_id=np.array(target_chain_ids, dtype=object),\n      chain_type=np.array(target_chain_types, dtype=object),\n  )\n\n\ndef residues_from_structure(\n    struct: structure.Structure,\n    *,\n    include_missing_residues: 
bool = True,\n    fix_non_standard_polymer_res: bool = False,\n) -> Residues:\n  \"\"\"Create a Residues object from a Structure object.\"\"\"\n\n  def _get_smiles(res_name):\n    \"\"\"Get SMILES string from chemical components.\"\"\"\n    smiles = None\n    if (\n        struct.chemical_components_data is not None\n        and struct.chemical_components_data.chem_comp is not None\n        and struct.chemical_components_data.chem_comp.get(res_name)\n    ):\n      smiles = struct.chemical_components_data.chem_comp[res_name].pdbx_smiles\n    return smiles\n\n  res_names_per_chain = struct.chain_res_name_sequence(\n      include_missing_residues=include_missing_residues,\n      fix_non_standard_polymer_res=fix_non_standard_polymer_res,\n  )\n  res_name = []\n  res_id = []\n  chain_id = []\n  chain_type = []\n  smiles = []\n  is_start_terminus = []\n  for c in struct.iter_chains():\n    if include_missing_residues:\n      this_res_ids = [id for (_, id) in struct.all_residues[c['chain_id']]]\n    else:\n      this_res_ids = [\n          r['res_id']\n          for r in struct.iter_residues()\n          if r['chain_id'] == c['chain_id']\n      ]\n    fixed_res_names = res_names_per_chain[c['chain_id']]\n    assert len(this_res_ids) == len(\n        fixed_res_names\n    ), f'{len(this_res_ids)} != {len(fixed_res_names)}'\n    this_start_res_id = min(min(this_res_ids), 1)\n    this_is_start_terminus = [r == this_start_res_id for r in this_res_ids]\n    smiles.extend([_get_smiles(res_name) for res_name in fixed_res_names])\n    num_res = len(fixed_res_names)\n    res_name.extend(fixed_res_names)\n    res_id.extend(this_res_ids)\n    chain_id.extend([c['chain_id']] * num_res)\n    chain_type.extend([c['chain_type']] * num_res)\n    is_start_terminus.extend(this_is_start_terminus)\n  res_name = np.array(res_name, dtype=object)\n  res_id = np.array(res_id, dtype=int)\n  chain_id = np.array(chain_id, dtype=object)\n  chain_type = np.array(chain_type, dtype=object)\n  smiles = 
np.array(smiles, dtype=object)\n  is_start_terminus = np.array(is_start_terminus, dtype=bool)\n\n  res_uid_to_idx = {\n      uid: idx for idx, uid in enumerate(zip(chain_id, res_id, strict=True))\n  }\n\n  # Start terminus indicates whether residue index is 1 and chain is polymer.\n  is_polymer = np.isin(chain_type, tuple(mmcif_names.POLYMER_CHAIN_TYPES))\n  is_start_terminus = is_start_terminus & is_polymer\n\n  # Start also indicates whether amino acid is attached to H2 or proline to H.\n  start_terminus_atom_index = np.nonzero(\n      (struct.chain_type == mmcif_names.PROTEIN_CHAIN)\n      & (\n          (struct.atom_name == 'H2')\n          | ((struct.atom_name == 'H') & (struct.res_name == 'PRO'))\n      )\n  )[0]\n\n  # Translate atom idx to residue idx to assign start terminus.\n  for atom_idx in start_terminus_atom_index:\n    res_uid = (struct.chain_id[atom_idx], struct.res_id[atom_idx])\n    res_idx = res_uid_to_idx[res_uid]\n    is_start_terminus[res_idx] = True\n\n  # Infer end terminus: Check for OXT, or in case of\n  # include_missing_residues==True for the last residue of the chain.\n  num_all_residues = res_name.shape[0]\n  is_end_terminus = np.zeros(num_all_residues, dtype=bool)\n  end_term_atom_idxs = np.nonzero(struct.atom_name == 'OXT')[0]\n  for atom_idx in end_term_atom_idxs:\n    res_uid = (struct.chain_id[atom_idx], struct.res_id[atom_idx])\n    res_idx = res_uid_to_idx[res_uid]\n    is_end_terminus[res_idx] = True\n\n  if include_missing_residues:\n    for idx in range(num_all_residues - 1):\n      if is_polymer[idx] and chain_id[idx] != chain_id[idx + 1]:\n        is_end_terminus[idx] = True\n    if (num_all_residues > 0) and is_polymer[-1]:\n      is_end_terminus[-1] = True\n\n  # Infer (de-)protonation: Only if hydrogens are given.\n  num_hydrogens = np.sum(\n      (struct.atom_element == 'H') & (struct.chain_type == 'polypeptide(L)')\n  )\n  if num_hydrogens > 0:\n    deprotonation = np.empty(num_all_residues, dtype=object)\n    
all_atom_uids = set(\n        zip(struct.chain_id, struct.res_id, struct.atom_name, strict=True)\n    )\n    for idx in range(num_all_residues):\n      deprotonation[idx] = set()\n      check_hydrogens = set()\n      if is_end_terminus[idx]:\n        check_hydrogens.add('HXT')\n      if res_name[idx] in atom_types.PROTONATION_HYDROGENS:\n        check_hydrogens.update(atom_types.PROTONATION_HYDROGENS[res_name[idx]])\n      for hydrogen in check_hydrogens:\n        if (chain_id[idx], res_id[idx], hydrogen) not in all_atom_uids:\n          deprotonation[idx].add(hydrogen)\n  else:\n    deprotonation = None\n\n  return Residues(\n      res_name=res_name,\n      res_id=res_id,\n      chain_id=chain_id,\n      chain_type=chain_type,\n      is_start_terminus=is_start_terminus.astype(bool),\n      is_end_terminus=is_end_terminus,\n      deprotonation=deprotonation,\n      smiles_string=smiles,\n  )\n\n\ndef get_link_drop_atoms(\n    res_name: str,\n    chain_type: str,\n    *,\n    is_start_terminus: bool,\n    is_end_terminus: bool,\n    bonded_atoms: set[str],\n    drop_ligand_leaving_atoms: bool = False,\n) -> set[str]:\n  \"\"\"Returns set of atoms that are dropped when this res_name gets linked.\n\n  Args:\n    res_name: residue name, e.g. 'ARG'\n    chain_type: chain_type, e.g. 
'polypeptide(L)'\n    is_start_terminus: whether the residue is the n-terminus\n    is_end_terminus: whether the residue is the c-terminus\n    bonded_atoms: Names of atoms coming off this residue.\n    drop_ligand_leaving_atoms: Flag to switch on/off leaving atoms for ligands.\n\n  Returns:\n    Set of atoms that are dropped when this amino acid gets linked.\n  \"\"\"\n  drop_atoms = set()\n  if chain_type == mmcif_names.PROTEIN_CHAIN:\n    if res_name == 'PRO':\n      if not is_start_terminus:\n        drop_atoms.update({'H', 'H2', 'H3'})\n      if not is_end_terminus:\n        drop_atoms.update({'OXT', 'HXT'})\n    else:\n      if not is_start_terminus:\n        drop_atoms.update({'H2', 'H3'})\n      if not is_end_terminus:\n        drop_atoms.update({'OXT', 'HXT'})\n  elif chain_type in mmcif_names.NUCLEIC_ACID_CHAIN_TYPES:\n    if not is_start_terminus:\n      drop_atoms.update({'OP3'})\n  elif (\n      drop_ligand_leaving_atoms and chain_type in mmcif_names.LIGAND_CHAIN_TYPES\n  ):\n    if res_name in {\n        *chemical_component_sets.GLYCAN_OTHER_LIGANDS,\n        *chemical_component_sets.GLYCAN_LINKING_LIGANDS,\n    }:\n      if 'O1' not in bonded_atoms:\n        drop_atoms.update({'O1'})\n  return drop_atoms\n\n\ndef get_bonded_atoms(\n    polymer_ligand_bonds: AtomLayout,\n    ligand_ligand_bonds: AtomLayout,\n    res_id: int,\n    chain_id: str,\n) -> set[str]:\n  \"\"\"Finds the res_name on the opposite end of the bond, if a bond exists.\n\n  Args:\n    polymer_ligand_bonds: Bond information for polymer-ligand pairs.\n    ligand_ligand_bonds: Bond information for ligand-ligand pairs.\n    res_id: residue id in question.\n    chain_id: chain id of residue in question.\n\n  Returns:\n    res_name of bonded atom.\n  \"\"\"\n  bonded_atoms = set()\n  if polymer_ligand_bonds:\n    # Filter before searching to speed this up.\n    bond_idx = np.logical_and(\n        polymer_ligand_bonds.res_id == res_id,\n        polymer_ligand_bonds.chain_id == chain_id,\n  
  ).any(axis=1)\n    relevant_polymer_bonds = polymer_ligand_bonds[bond_idx]\n    for atom_names, res_ids, chain_ids in zip(\n        relevant_polymer_bonds.atom_name,\n        relevant_polymer_bonds.res_id,\n        relevant_polymer_bonds.chain_id,\n    ):\n      if (res_ids[0], chain_ids[0]) == (res_id, chain_id):\n        bonded_atoms.add(atom_names[0])\n      elif (res_ids[1], chain_ids[1]) == (res_id, chain_id):\n        bonded_atoms.add(atom_names[1])\n  if ligand_ligand_bonds:\n    bond_idx = np.logical_and(\n        ligand_ligand_bonds.res_id == res_id,\n        ligand_ligand_bonds.chain_id == chain_id,\n    ).any(axis=1)\n    relevant_ligand_bonds = ligand_ligand_bonds[bond_idx]\n    for atom_names, res_ids, chain_ids in zip(\n        relevant_ligand_bonds.atom_name,\n        relevant_ligand_bonds.res_id,\n        relevant_ligand_bonds.chain_id,\n    ):\n      if (res_ids[0], chain_ids[0]) == (res_id, chain_id):\n        bonded_atoms.add(atom_names[0])\n      elif (res_ids[1], chain_ids[1]) == (res_id, chain_id):\n        bonded_atoms.add(atom_names[1])\n  return bonded_atoms\n\n\ndef make_flat_atom_layout(\n    residues: Residues,\n    ccd: chemical_components.Ccd,\n    polymer_ligand_bonds: AtomLayout | None = None,\n    ligand_ligand_bonds: AtomLayout | None = None,\n    *,\n    with_hydrogens: bool = False,\n    skip_unk_residues: bool = True,\n    drop_ligand_leaving_atoms: bool = False,\n) -> AtomLayout:\n  \"\"\"Make a flat atom layout for given residues.\n\n  Create a flat layout from a `Residues` object. The required atoms for each\n  amino acid type are taken from the CCD, hydrogens and oxygens are dropped to\n  make the linked residues. 
Terminal OXT's and protonation state for the\n  hydrogens come from the `Residues` object.\n\n  Args:\n    residues: a `Residues` object.\n    ccd: The chemical components dictionary.\n    polymer_ligand_bonds: Bond information for polymer-ligand pairs.\n    ligand_ligand_bonds: Bond information for ligand-ligand pairs.\n    with_hydrogens: whether to create hydrogens\n    skip_unk_residues: whether to skip 'UNK' resides -- default is True to be\n      compatible with the rest of AlphaFold that does not predict atoms for\n      unknown residues\n    drop_ligand_leaving_atoms: Flag to switch on/ off leaving atoms for ligands.\n\n  Returns:\n    an `AtomLayout` object\n  \"\"\"\n  num_res = residues.res_name.shape[0]\n\n  # Target lists.\n  target_atom_names = []\n  target_atom_elements = []\n  target_res_ids = []\n  target_res_names = []\n  target_chain_ids = []\n  target_chain_types = []\n\n  for idx in range(num_res):\n    # skip 'UNK' residues if requested\n    if (\n        skip_unk_residues\n        and residues.res_name[idx] in residue_names.UNKNOWN_TYPES\n    ):\n      continue\n\n    # Get the atoms for this residue type from CCD.\n    if ccd.get(residues.res_name[idx]):\n      res_atoms = struc_chem_comps.get_all_atoms_in_entry(\n          ccd=ccd, res_name=residues.res_name[idx]\n      )\n      atom_names_elements = list(\n          zip(\n              res_atoms['_chem_comp_atom.atom_id'],\n              res_atoms['_chem_comp_atom.type_symbol'],\n              strict=True,\n          )\n      )\n    elif residues.smiles_string[idx]:\n      # Get atoms from RDKit via SMILES.\n      mol = Chem.MolFromSmiles(residues.smiles_string[idx])\n      if mol is None:\n        raise ValueError(\n            f'Failed to construct RDKit Mol for {residues.res_name[idx]} from'\n            f' SMILES string: {residues.smiles_string[idx]} . This is likely'\n            ' due to an issue with the SMILES string. 
Note that the userCCD'\n            ' input format provides an alternative way to define custom'\n            ' molecules directly without RDKit or SMILES.'\n        )\n      mol = rdkit_utils.assign_atom_names_from_graph(mol)\n      atom_names_elements = [\n          (a.GetProp('atom_name'), a.GetSymbol()) for a in mol.GetAtoms()\n      ]\n    else:\n      raise ValueError(\n          f'{residues.res_name[idx]} not found in CCD and no SMILES string'\n      )\n\n    # Remove hydrogens if requested.\n    if not with_hydrogens:\n      atom_names_elements = [\n          (n, e) for n, e in atom_names_elements if (e != 'H' and e != 'D')\n      ]\n    bonded_atoms = get_bonded_atoms(\n        polymer_ligand_bonds,\n        ligand_ligand_bonds,\n        residues.res_id[idx],\n        residues.chain_id[idx],\n    )\n    # Connect the amino-acids, i.e. remove OXT, HXT and H2.\n    drop_atoms = get_link_drop_atoms(\n        res_name=residues.res_name[idx],\n        chain_type=residues.chain_type[idx],\n        is_start_terminus=residues.is_start_terminus[idx],\n        is_end_terminus=residues.is_end_terminus[idx],\n        bonded_atoms=bonded_atoms,\n        drop_ligand_leaving_atoms=drop_ligand_leaving_atoms,\n    )\n\n    # If deprotonation info is available, remove the specific atoms.\n    if residues.deprotonation is not None:\n      drop_atoms.update(residues.deprotonation[idx])\n\n    atom_names_elements = [\n        (n, e) for n, e in atom_names_elements if n not in drop_atoms\n    ]\n\n    # Append the found atoms to the target lists.\n    target_atom_names.extend([n for n, _ in atom_names_elements])\n    target_atom_elements.extend([e for _, e in atom_names_elements])\n    num_atoms = len(atom_names_elements)\n    target_res_names.extend([residues.res_name[idx]] * num_atoms)\n    target_res_ids.extend([residues.res_id[idx]] * num_atoms)\n    target_chain_ids.extend([residues.chain_id[idx]] * num_atoms)\n    target_chain_types.extend([residues.chain_type[idx]] * 
num_atoms)\n\n  return AtomLayout(\n      atom_name=np.array(target_atom_names, dtype=object),\n      atom_element=np.array(target_atom_elements, dtype=object),\n      res_name=np.array(target_res_names, dtype=object),\n      res_id=np.array(target_res_ids, dtype=int),\n      chain_id=np.array(target_chain_ids, dtype=object),\n      chain_type=np.array(target_chain_types, dtype=object),\n  )\n\n\ndef compute_gather_idxs(\n    *,\n    source_layout: AtomLayout,\n    target_layout: AtomLayout,\n    fill_value: int = 0,\n) -> GatherInfo:\n  \"\"\"Produce gather indices and mask to convert from source layout to target.\"\"\"\n  source_uid_to_idx = {\n      uid: idx\n      for idx, uid in enumerate(\n          zip(\n              source_layout.chain_id.ravel(),\n              source_layout.res_id.ravel(),\n              source_layout.atom_name.ravel(),\n              strict=True,\n          )\n      )\n  }\n  gather_idxs = []\n  gather_mask = []\n  for uid in zip(\n      target_layout.chain_id.ravel(),\n      target_layout.res_id.ravel(),\n      target_layout.atom_name.ravel(),\n      strict=True,\n  ):\n    if uid in source_uid_to_idx:\n      gather_idxs.append(source_uid_to_idx[uid])\n      gather_mask.append(True)\n    else:\n      gather_idxs.append(fill_value)\n      gather_mask.append(False)\n  target_shape = target_layout.atom_name.shape\n  return GatherInfo(\n      gather_idxs=np.array(gather_idxs, dtype=int).reshape(target_shape),\n      gather_mask=np.array(gather_mask, dtype=bool).reshape(target_shape),\n      input_shape=np.array(source_layout.atom_name.shape),\n  )\n\n\ndef convert(\n    gather_info: GatherInfo,\n    arr: xnp_ndarray,\n    *,\n    layout_axes: tuple[int, ...] 
= (0,),\n) -> xnp_ndarray:\n  \"\"\"Convert an array from one atom layout to another.\"\"\"\n  # Translate negative indices to the corresponding positives.\n  layout_axes = tuple(i if i >= 0 else i + arr.ndim for i in layout_axes)\n\n  # Ensure that layout_axes are continuous.\n  layout_axes_begin = layout_axes[0]\n  layout_axes_end = layout_axes[-1] + 1\n\n  if layout_axes != tuple(range(layout_axes_begin, layout_axes_end)):\n    raise ValueError(f'layout_axes must be continuous. Got {layout_axes}.')\n  layout_shape = arr.shape[layout_axes_begin:layout_axes_end]\n\n  # Ensure that the layout shape is compatible\n  # with the gather_info. I.e. the first axis size must be equal or greater\n  # than the gather_info.input_shape, and all subsequent axes sizes must match.\n  if (len(layout_shape) != gather_info.input_shape.size) or (\n      isinstance(gather_info.input_shape, np.ndarray)\n      and (\n          (layout_shape[0] < gather_info.input_shape[0])\n          or (np.any(layout_shape[1:] != gather_info.input_shape[1:]))\n      )\n  ):\n    raise ValueError(\n        'Input array layout axes are incompatible. You specified layout '\n        f'axes {layout_axes} with an input array of shape {arr.shape}, but '\n        f'the gather info expects shape {gather_info.input_shape}. 
'\n        'Your first axis size must be equal or greater than the '\n        'gather_info.input_shape, and all subsequent axes sizes must '\n        'match.'\n    )\n\n  # Compute the shape of the input array with flattened layout.\n  batch_shape = arr.shape[:layout_axes_begin]\n  features_shape = arr.shape[layout_axes_end:]\n  arr_flattened_shape = batch_shape + (np.prod(layout_shape),) + features_shape\n\n  # Flatten input array and perform the gather.\n  arr_flattened = arr.reshape(arr_flattened_shape)\n  if layout_axes_begin == 0:\n    out_arr = arr_flattened[gather_info.gather_idxs, ...]\n  elif layout_axes_begin == 1:\n    out_arr = arr_flattened[:, gather_info.gather_idxs, ...]\n  elif layout_axes_begin == 2:\n    out_arr = arr_flattened[:, :, gather_info.gather_idxs, ...]\n  elif layout_axes_begin == 3:\n    out_arr = arr_flattened[:, :, :, gather_info.gather_idxs, ...]\n  elif layout_axes_begin == 4:\n    out_arr = arr_flattened[:, :, :, :, gather_info.gather_idxs, ...]\n  else:\n    raise ValueError(\n        'Only 4 batch axes supported. If you need more, the code '\n        'is easy to extend.'\n    )\n\n  # Broadcast the mask and apply it.\n  broadcasted_mask_shape = (\n      (1,) * len(batch_shape)\n      + gather_info.gather_mask.shape\n      + (1,) * len(features_shape)\n  )\n  out_arr *= gather_info.gather_mask.reshape(broadcasted_mask_shape)\n  return out_arr\n\n\ndef make_structure(\n    flat_layout: AtomLayout,\n    atom_coords: np.ndarray,\n    name: str,\n    *,\n    atom_b_factors: np.ndarray | None = None,\n    all_physical_residues: Residues | None = None,\n) -> structure.Structure:\n  \"\"\"Returns a Structure from a flat layout and atom coordinates.\n\n  The provided flat_layout must be 1-dim and must not contain any padding\n  elements. 
The flat_layout.atom_name must conform to the OpenMM/CCD standard\n  and must not contain deuterium.\n\n  Args:\n    flat_layout: flat 1-dim AtomLayout without pading elements\n    atom_coords: np.ndarray of float, shape (num_atoms, 3)\n    name: str: the name (usually PDB id), e.g. '1uao'\n    atom_b_factors: np.ndarray of float, shape (num_atoms,) or None. If None,\n      they will be set to all zeros.\n    all_physical_residues: a Residues object that contains all physically\n      existing residues, i.e. also those residues that have no resolved atoms.\n      This is common in experimental structures, but also appears in predicted\n      structures for 'UNK' or other non-standard residue types, where the model\n      does not predict coordinates. This will be used to create the\n      `all_residues` field of the structure object.\n  \"\"\"\n\n  if flat_layout.atom_name.ndim != 1 or not np.all(\n      flat_layout.atom_name.astype(bool)\n  ):\n    raise ValueError(\n        'flat_layout must be 1-dim and must not contain anypadding element'\n    )\n  if (\n      flat_layout.atom_element is None\n      or flat_layout.res_name is None\n      or flat_layout.chain_type is None\n  ):\n    raise ValueError('All optional fields must be present.')\n\n  if atom_b_factors is None:\n    atom_b_factors = np.zeros(atom_coords.shape[:-1])\n\n  if all_physical_residues is not None:\n    # Create the all_residues field from a Residues object\n    # (unfortunately there is no central place to keep the chain_types in\n    # the structure class, so we drop it here)\n    all_residues = collections.defaultdict(list)\n    for chain_id, res_id, res_name in zip(\n        all_physical_residues.chain_id,\n        all_physical_residues.res_id,\n        all_physical_residues.res_name,\n        strict=True,\n    ):\n      all_residues[chain_id].append((res_name, res_id))\n  else:\n    # Create the all_residues field from the flat_layout\n    all_residues = collections.defaultdict(list)\n    
if flat_layout.chain_id.shape[0] > 0:\n      all_residues[flat_layout.chain_id[0]].append(\n          (flat_layout.res_name[0], flat_layout.res_id[0])\n      )\n      for i in range(1, flat_layout.shape[0]):\n        if (\n            flat_layout.chain_id[i] != flat_layout.chain_id[i - 1]\n            or flat_layout.res_name[i] != flat_layout.res_name[i - 1]\n            or flat_layout.res_id[i] != flat_layout.res_id[i - 1]\n        ):\n          all_residues[flat_layout.chain_id[i]].append(\n              (flat_layout.res_name[i], flat_layout.res_id[i])\n          )\n\n  return structure.from_atom_arrays(\n      name=name,\n      all_residues=dict(all_residues),\n      chain_id=flat_layout.chain_id,\n      chain_type=flat_layout.chain_type,\n      res_id=flat_layout.res_id.astype(np.int32),\n      res_name=flat_layout.res_name,\n      atom_name=flat_layout.atom_name,\n      atom_element=flat_layout.atom_element,\n      atom_x=atom_coords[..., 0],\n      atom_y=atom_coords[..., 1],\n      atom_z=atom_coords[..., 2],\n      atom_b_factor=atom_b_factors,\n  )\n\n\ndef _assert_all_arrays_have_same_shape(\n    *,\n    obj: AtomLayout | Residues | GatherInfo,\n    expected_shape: tuple[int, ...],\n    attribute_names: Sequence[str],\n) -> None:\n  \"\"\"Checks that given attributes of the object have the expected shape.\"\"\"\n  attribute_shapes_description = []\n  all_shapes_are_valid = True\n\n  for attribute_name in attribute_names:\n    attribute = getattr(obj, attribute_name)\n\n    if attribute is None:\n      attribute_shape = None\n    else:\n      attribute_shape = attribute.shape\n\n    if attribute_shape is not None and expected_shape != attribute_shape:\n      all_shapes_are_valid = False\n\n    attribute_shape_name = attribute_name + '.shape'\n    attribute_shapes_description.append(\n        f'{attribute_shape_name:25} = {attribute_shape}'\n    )\n\n  if not all_shapes_are_valid:\n    raise ValueError(\n        f'All arrays must have the same shape 
({expected_shape=}). Got\\n'\n        + '\\n'.join(attribute_shapes_description)\n    )\n"
  },
  {
    "path": "src/alphafold3/model/components/haiku_modules.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Common Haiku modules.\"\"\"\n\nfrom collections.abc import Sequence\nimport contextlib\nimport numbers\nfrom typing import TypeAlias\n\nimport haiku as hk\nimport jax\nimport jax.numpy as jnp\nimport numpy as np\n\n\nPRECISION: TypeAlias = (\n    None\n    | str\n    | jax.lax.Precision\n    | tuple[str, str]\n    | tuple[jax.lax.Precision, jax.lax.Precision]\n)\n\n# Useful for mocking in tests.\nDEFAULT_PRECISION = None\n\n# Constant from scipy.stats.truncnorm.std(a=-2, b=2, loc=0., scale=1.)\nTRUNCATED_NORMAL_STDDEV_FACTOR = np.asarray(\n    0.87962566103423978, dtype=np.float32\n)\n\n\nclass LayerNorm(hk.LayerNorm):\n  \"\"\"LayerNorm module.\n\n  Equivalent to hk.LayerNorm but with an extra 'upcast' option that casts\n  (b)float16 inputs to float32 before computing the layer norm, and then casts\n  the output back to the input type.\n\n  The learnable parameter shapes are also different from Haiku: they are always\n  vectors rather than possibly higher-rank tensors. 
This makes it easier\n  to change the layout whilst keeping the model weight-compatible.\n  \"\"\"\n\n  def __init__(\n      self,\n      *,\n      axis: int = -1,\n      create_scale: bool = True,\n      create_offset: bool = True,\n      eps: float = 1e-5,\n      scale_init: hk.initializers.Initializer | None = None,\n      offset_init: hk.initializers.Initializer | None = None,\n      use_fast_variance: bool = True,\n      name: str,\n      param_axis: int | None = None,\n      upcast: bool = True,\n  ):\n    super().__init__(\n        axis=axis,\n        create_scale=False,\n        create_offset=False,\n        eps=eps,\n        scale_init=None,\n        offset_init=None,\n        use_fast_variance=use_fast_variance,\n        name=name,\n        param_axis=param_axis,\n    )\n    self.upcast = upcast\n    self._temp_create_scale = create_scale\n    self._temp_create_offset = create_offset\n\n  def __call__(self, x: jnp.ndarray) -> jnp.ndarray:\n    dtype = x.dtype\n    is_16bit = x.dtype in [jnp.bfloat16, jnp.float16]\n    if self.upcast and is_16bit:\n      x = x.astype(jnp.float32)\n\n    param_axis = self.param_axis[0] if self.param_axis else -1\n    param_shape = (x.shape[param_axis],)\n\n    param_broadcast_shape = [1] * x.ndim\n    param_broadcast_shape[param_axis] = x.shape[param_axis]\n    scale = None\n    offset = None\n    if self._temp_create_scale:\n      scale = hk.get_parameter(\n          'scale', param_shape, x.dtype, init=self.scale_init\n      )\n      scale = scale.reshape(param_broadcast_shape)\n\n    if self._temp_create_offset:\n      offset = hk.get_parameter(\n          'offset', param_shape, x.dtype, init=self.offset_init\n      )\n      offset = offset.reshape(param_broadcast_shape)\n\n    out = super().__call__(x, scale=scale, offset=offset)\n\n    if self.upcast and is_16bit:\n      out = out.astype(dtype)\n\n    return out\n\n\ndef haiku_linear_get_params(\n    inputs: jax.Array | jax.ShapeDtypeStruct,\n    *,\n    num_output: int | 
Sequence[int],\n    use_bias: bool = False,\n    num_input_dims: int = 1,\n    initializer: str = 'linear',\n    bias_init: float = 0.0,\n    transpose_weights: bool = False,\n    name: str | None = None,\n) -> tuple[jax.Array, jax.Array | None]:\n  \"\"\"Get parameters for linear layer.\n\n  Parameters will be at least float32 or higher precision.\n\n  Arguments:\n    inputs: The input to the Linear layer. Can be either a JAX array or a\n      jax.ShapeDtypeStruct.\n    num_output: The number of output channels. Can be an integer or a sequence\n      of integers.\n    use_bias: Whether to create a bias array.\n    num_input_dims: The number of dimensions to consider as channel dims in the\n      input.\n    initializer: The name of the weight initializer to use.\n    bias_init: A float used to initialize the bias.\n    transpose_weights: If True, will create a transposed version of the weights.\n    name: The Haiku namespace to use for the weight and bias.\n\n  Returns:\n    A tuple[weight, bias] if use_bias otherwise tuple[weight, None].\n  \"\"\"\n\n  if isinstance(num_output, numbers.Integral):\n    output_shape = (num_output,)\n  else:\n    output_shape = tuple(num_output)\n\n  if num_input_dims > 0:\n    in_shape = inputs.shape[-num_input_dims:]\n  elif num_input_dims == 0:\n    in_shape = ()\n  else:\n    raise ValueError('num_input_dims must be >= 0.')\n\n  weight_init = _get_initializer_scale(initializer, in_shape)\n  with hk.name_scope(name) if name else contextlib.nullcontext():\n\n    if transpose_weights:\n      weight_shape = output_shape + in_shape\n\n      weights = hk.get_parameter(\n          'weights', shape=weight_shape, dtype=inputs.dtype, init=weight_init\n      )\n    else:\n      weight_shape = in_shape + output_shape\n      weights = hk.get_parameter(\n          name='weights',\n          shape=weight_shape,\n          dtype=inputs.dtype,\n          init=weight_init,\n      )\n\n    bias = None\n    if use_bias:\n      bias = 
hk.get_parameter(\n          name='bias',\n          shape=output_shape,\n          dtype=inputs.dtype,\n          init=hk.initializers.Constant(bias_init),\n      )\n  return weights, bias\n\n\nclass Linear(hk.Module):\n  \"\"\"Custom Linear Module.\n\n  This differs from the standard Linear in a few ways:\n    * It supports inputs of arbitrary rank\n    * It allows to use ntk parametrization\n    * Initializers are specified by strings\n    * It allows to explicitly specify which dimension of the input will map to\n      the tpu sublane/lane dimensions.\n  \"\"\"\n\n  def __init__(\n      self,\n      num_output: int | Sequence[int],\n      *,\n      initializer: str = 'linear',\n      num_input_dims: int = 1,\n      use_bias: bool = False,\n      bias_init: float = 0.0,\n      precision: PRECISION = None,\n      fast_scalar_mode: bool = True,\n      transpose_weights: bool = False,\n      name: str,\n  ):\n    \"\"\"Constructs Linear Module.\n\n    Args:\n      num_output: number of output channels. 
Can be tuple when outputting\n        multiple dimensions.\n      initializer: What initializer to use, should be one of {'linear', 'relu',\n        'zeros'}.\n      num_input_dims: Number of dimensions from the end to project.\n      use_bias: Whether to include trainable bias (False by default).\n      bias_init: Value used to initialize bias.\n      precision: What precision to use for matrix multiplication, defaults to\n        None.\n      fast_scalar_mode: Whether to use optimized path for num_input_dims = 0.\n      transpose_weights: decides whether weights have shape [input, output] or\n        [output, input], True means [output, input], this is helpful to avoid\n        padding on the tensors holding the weights.\n      name: name of module, used for name scopes.\n    \"\"\"\n    super().__init__(name=name)\n    if isinstance(num_output, numbers.Integral):\n      self.output_shape = (num_output,)\n    else:\n      self.output_shape = tuple(num_output)\n    self.initializer = initializer\n    self.use_bias = use_bias\n    self.bias_init = bias_init\n    self.num_input_dims = num_input_dims\n    self.num_output_dims = len(self.output_shape)\n    self.precision = precision if precision is not None else DEFAULT_PRECISION\n    self.fast_scalar_mode = fast_scalar_mode\n    self.transpose_weights = transpose_weights\n\n  def __call__(self, inputs: jnp.ndarray) -> jnp.ndarray:\n    \"\"\"Connects Module.\n\n    Args:\n      inputs: Tensor of shape [..., num_channel]\n\n    Returns:\n      output of shape [..., num_output]\n    \"\"\"\n\n    num_input_dims = self.num_input_dims\n\n    # Adds specialized path for scalar inputs in Linear layer,\n    # this means the linear Layer does not use the matmul units on the tpu,\n    # which is more efficient and gives compiler more flexibility over layout.\n    if num_input_dims == 0 and self.fast_scalar_mode:\n      weight_shape = self.output_shape\n      if self.initializer == 'zeros':\n        w_init = 
hk.initializers.Constant(0.0)\n      else:\n        distribution_stddev = jnp.array(1 / TRUNCATED_NORMAL_STDDEV_FACTOR)\n        w_init = hk.initializers.TruncatedNormal(\n            mean=0.0, stddev=distribution_stddev\n        )\n\n      weights = hk.get_parameter('weights', weight_shape, inputs.dtype, w_init)\n\n      inputs = jnp.expand_dims(\n          inputs, tuple(range(-1, -self.num_output_dims - 1, -1))\n      )\n      output = inputs * weights\n    else:\n      if self.num_input_dims > 0:\n        in_shape = inputs.shape[-self.num_input_dims :]\n      else:\n        in_shape = ()\n\n      weight_init = _get_initializer_scale(self.initializer, in_shape)\n\n      in_letters = 'abcde'[: self.num_input_dims]\n      out_letters = 'hijkl'[: self.num_output_dims]\n\n      if self.transpose_weights:\n        weight_shape = self.output_shape + in_shape\n        weights = hk.get_parameter(\n            'weights', weight_shape, inputs.dtype, weight_init\n        )\n        equation = (\n            f'...{in_letters}, {out_letters}{in_letters}->...{out_letters}'\n        )\n      else:\n        weight_shape = in_shape + self.output_shape\n        weights = hk.get_parameter(\n            'weights', weight_shape, inputs.dtype, weight_init\n        )\n\n        equation = (\n            f'...{in_letters}, {in_letters}{out_letters}->...{out_letters}'\n        )\n\n      output = jnp.einsum(equation, inputs, weights, precision=self.precision)\n\n    if self.use_bias:\n      bias = hk.get_parameter(\n          'bias',\n          self.output_shape,\n          inputs.dtype,\n          hk.initializers.Constant(self.bias_init),\n      )\n      output += bias\n\n    return output\n\n\ndef _get_initializer_scale(initializer_name, input_shape):\n  \"\"\"Get initializer for weights.\"\"\"\n\n  if initializer_name == 'zeros':\n    w_init = hk.initializers.Constant(0.0)\n  else:\n    # fan-in scaling\n    noise_scale = 1.0\n    for channel_dim in input_shape:\n      noise_scale /= 
channel_dim\n    if initializer_name == 'relu':\n      noise_scale *= 2\n\n    stddev = np.sqrt(noise_scale)\n    # Adjust stddev for truncation.\n    stddev = stddev / TRUNCATED_NORMAL_STDDEV_FACTOR\n    w_init = hk.initializers.TruncatedNormal(mean=0.0, stddev=stddev)\n\n  return w_init\n"
  },
  {
    "path": "src/alphafold3/model/components/mapping.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Specialized mapping functions.\"\"\"\n\nfrom collections.abc import Callable, Sequence\nimport functools\nfrom typing import Any, TypeVar\n\nimport haiku as hk\nimport jax\nimport jax.numpy as jnp\n\n\nPytree = Any\nPytreeJaxArray = Any\n\npartial = functools.partial\nPROXY = object()\n\nT = TypeVar(\"T\")\n\n\ndef _maybe_slice(array, i, slice_size, axis):\n  if axis is PROXY:\n    return array\n  else:\n    return jax.lax.dynamic_slice_in_dim(\n        array, i, slice_size=slice_size, axis=axis\n    )\n\n\ndef _maybe_get_size(array, axis):\n  if axis == PROXY:\n    return -1\n  else:\n    return array.shape[axis]\n\n\ndef _expand_axes(axes, values, name=\"sharded_apply\"):\n  values_tree_def = jax.tree_util.tree_structure(values)\n  flat_axes = jax.api_util.flatten_axes(name, values_tree_def, axes)\n  # Replace None's with PROXY.\n  flat_axes = [PROXY if x is None else x for x in flat_axes]\n  return jax.tree_util.tree_unflatten(values_tree_def, flat_axes)\n\n\ndef sharded_map(\n    fun: Callable[..., PytreeJaxArray],\n    shard_size: int | None = 1,\n    in_axes: int | Pytree = 0,\n    out_axes: int | Pytree = 0,\n) -> Callable[..., PytreeJaxArray]:\n  \"\"\"Sharded vmap.\n\n  Maps `fun` over axes, in a way similar to hk.vmap, but does so in shards of\n  `shard_size`. 
This allows a smooth trade-off between memory usage\n  (as in a plain map) vs higher throughput (as in a vmap).\n\n  Args:\n    fun: Function to apply smap transform to.\n    shard_size: Integer denoting shard size.\n    in_axes: Either integer or pytree describing which axis to map over for each\n      input to `fun`, None denotes broadcasting.\n    out_axes: Integer or pytree denoting to what axis in the output the mapped\n      over axis maps.\n\n  Returns:\n    Function with smap applied.\n  \"\"\"\n  if hk.running_init():\n    # Guarantees initialisation independent of shard_size. Doesn't incur a high\n    # memory cost, as long as large concrete tensors are not encountered.\n    return hk.vmap(fun, in_axes=in_axes, out_axes=out_axes, split_rng=False)\n  else:\n    vmapped_fun = hk.vmap(fun, in_axes, out_axes, split_rng=True)\n    return sharded_apply(vmapped_fun, shard_size, in_axes, out_axes)\n\n\ndef _set_docstring(docstr: str) -> Callable[[T], T]:\n  \"\"\"Decorator for setting the docstring of a function.\"\"\"\n\n  def wrapped(fun: T) -> T:\n    fun.__doc__ = docstr.format(fun=getattr(fun, \"__name__\", repr(fun)))\n    return fun\n\n  return wrapped\n\n\ndef sharded_apply(\n    fun: Callable[..., PytreeJaxArray],\n    shard_size: int | None = 1,\n    in_axes: int | Pytree = 0,\n    out_axes: int | Pytree = 0,\n    new_out_axes: bool = False,\n) -> Callable[..., PytreeJaxArray]:\n  \"\"\"Sharded apply.\n\n  Applies `fun` over shards to axes, in a way similar to vmap,\n  but does so in shards of `shard_size`. Shards are stacked after.\n  This allows a smooth trade-off between\n  memory usage (as in a plain map) vs higher throughput (as in a vmap).\n\n  Args:\n    fun: Function to apply smap transform to.\n    shard_size: Integer denoting shard size. 
None will return `fun` unchanged.\n    in_axes: Either integer or pytree describing which axis to map over for each\n      input to `fun`, None denotes broadcasting.\n    out_axes: Integer or pytree denoting to what axis in the output the mapped\n      over axis maps.\n    new_out_axes: Whether to stack outputs on new axes. This assumes that the\n      output sizes for each shard (including the possible remainder shard) are\n      the same.\n\n  Returns:\n    Function with smap applied.\n  \"\"\"\n  docstr = (\n      \"Mapped version of {fun}. Takes similar arguments to {fun} \"\n      \"but with additional array axes over which {fun} is mapped.\"\n  )\n  if new_out_axes:\n    raise NotImplementedError(\"New output axes not yet implemented.\")\n\n  if shard_size is None:\n    return fun\n\n  @_set_docstring(docstr)\n  @functools.wraps(fun)\n  def mapped_fn(*args, **kwargs):\n    # Expand in axes and determine loop range.\n    in_axes_ = _expand_axes(in_axes, args)\n\n    in_sizes = jax.tree.map(_maybe_get_size, args, in_axes_)\n    in_size = max(jax.tree_util.tree_leaves(in_sizes))\n\n    num_extra_shards = (in_size - 1) // shard_size\n\n    # Fix if necessary.\n    last_shard_size = in_size % shard_size\n    last_shard_size = shard_size if last_shard_size == 0 else last_shard_size\n\n    def apply_fun_to_slice(slice_start, slice_size):\n      input_slice = jax.tree.map(\n          lambda array, axis: _maybe_slice(\n              array, slice_start, slice_size, axis\n          ),\n          args,\n          in_axes_,\n      )\n      return fun(*input_slice, **kwargs)\n\n    remainder_shape_dtype = hk.eval_shape(\n        partial(apply_fun_to_slice, 0, last_shard_size)\n    )\n    out_dtypes = jax.tree.map(lambda x: x.dtype, remainder_shape_dtype)\n    out_shapes = jax.tree.map(lambda x: x.shape, remainder_shape_dtype)\n    out_axes_ = _expand_axes(out_axes, remainder_shape_dtype)\n\n    if num_extra_shards > 0:\n      regular_shard_shape_dtype = hk.eval_shape(\n    
      partial(apply_fun_to_slice, 0, shard_size)\n      )\n      shard_shapes = jax.tree.map(lambda x: x.shape, regular_shard_shape_dtype)\n\n      def make_output_shape(axis, shard_shape, remainder_shape):\n        return (\n            shard_shape[:axis]\n            + (shard_shape[axis] * num_extra_shards + remainder_shape[axis],)\n            + shard_shape[axis + 1 :]\n        )\n\n      out_shapes = jax.tree.map(\n          make_output_shape, out_axes_, shard_shapes, out_shapes\n      )\n\n    # Calls dynamic Update slice with different argument order.\n    # This is here since tree_map only works with positional arguments.\n    def dynamic_update_slice_in_dim(full_array, update, axis, i):\n      return jax.lax.dynamic_update_slice_in_dim(full_array, update, i, axis)\n\n    def compute_shard(outputs, slice_start, slice_size):\n      slice_out = apply_fun_to_slice(slice_start, slice_size)\n      update_slice = partial(dynamic_update_slice_in_dim, i=slice_start)\n      return jax.tree.map(update_slice, outputs, slice_out, out_axes_)\n\n    def scan_iteration(outputs, i):\n      new_outputs = compute_shard(outputs, i, shard_size)\n      return new_outputs, ()\n\n    slice_starts = jnp.arange(0, in_size - shard_size + 1, shard_size)\n\n    def allocate_buffer(dtype, shape):\n      return jnp.zeros(shape, dtype=dtype)\n\n    outputs = jax.tree.map(allocate_buffer, out_dtypes, out_shapes)\n\n    if slice_starts.shape[0] > 0:\n      outputs, _ = hk.scan(scan_iteration, outputs, slice_starts)\n\n    if last_shard_size != shard_size:\n      remainder_start = in_size - last_shard_size\n      outputs = compute_shard(outputs, remainder_start, last_shard_size)\n\n    return outputs\n\n  return mapped_fn\n\n\ndef inference_subbatch(\n    module: Callable[..., PytreeJaxArray],\n    subbatch_size: int,\n    batched_args: Sequence[PytreeJaxArray],\n    nonbatched_args: Sequence[PytreeJaxArray],\n    input_subbatch_dim: int = 0,\n    output_subbatch_dim: int | None = None,\n) 
-> PytreeJaxArray:\n  \"\"\"Run through subbatches (like batch apply but with split and concat).\"\"\"\n  assert len(batched_args) > 0  # pylint: disable=g-explicit-length-test\n\n  if hk.running_init():\n    args = list(batched_args) + list(nonbatched_args)\n    return module(*args)\n\n  if output_subbatch_dim is None:\n    output_subbatch_dim = input_subbatch_dim\n\n  def run_module(*batched_args):\n    args = list(batched_args) + list(nonbatched_args)\n    res = module(*args)\n    return res\n\n  sharded_module = sharded_apply(\n      run_module,\n      shard_size=subbatch_size,\n      in_axes=input_subbatch_dim,\n      out_axes=output_subbatch_dim,\n  )\n  output = sharded_module(*batched_args)\n\n  return output\n"
  },
  {
    "path": "src/alphafold3/model/components/utils.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Utility functions for training AlphaFold and similar models.\"\"\"\n\nfrom collections import abc\nimport contextlib\nimport numbers\n\nfrom alphafold3.model import features\nimport haiku as hk\nimport jax.numpy as jnp\nimport numpy as np\n\n\nVALID_DTYPES = [np.float32, np.float64, np.int8, np.int32, np.int64, bool]\n\n\ndef remove_invalidly_typed_feats(\n    batch: features.BatchDict,\n) -> features.BatchDict:\n  \"\"\"Remove features of types we don't want to send to the TPU e.g. 
strings.\"\"\"\n  return {\n      k: v\n      for k, v in batch.items()\n      if hasattr(v, 'dtype') and v.dtype in VALID_DTYPES\n  }\n\n\ndef bfloat16_getter(next_getter, value, context):\n  \"\"\"Ensures that a bfloat16 parameter is provided by casting if necessary.\"\"\"\n  if context.original_dtype == jnp.bfloat16:\n    if value.dtype != jnp.bfloat16:\n      value = value.astype(jnp.bfloat16)\n  return next_getter(value)\n\n\n@contextlib.contextmanager\ndef bfloat16_context():\n  with hk.custom_getter(bfloat16_getter):\n    yield\n\n\ndef mask_mean(mask, value, axis=None, keepdims=False, eps=1e-10):\n  \"\"\"Masked mean.\"\"\"\n\n  mask_shape = mask.shape\n  value_shape = value.shape\n\n  assert len(mask_shape) == len(\n      value_shape\n  ), 'Shapes are not compatible, shapes: {}, {}'.format(mask_shape, value_shape)\n\n  if isinstance(axis, numbers.Integral):\n    axis = [axis]\n  elif axis is None:\n    axis = list(range(len(mask_shape)))\n  assert isinstance(\n      axis, abc.Iterable\n  ), 'axis needs to be either an iterable, integer or \"None\"'\n\n  broadcast_factor = 1.0\n  for axis_ in axis:\n    value_size = value_shape[axis_]\n    mask_size = mask_shape[axis_]\n    if mask_size == 1:\n      broadcast_factor *= value_size\n    else:\n      error = f'Shapes are not compatible, shapes: {mask_shape}, {value_shape}'\n      assert mask_size == value_size, error\n\n  return jnp.sum(mask * value, keepdims=keepdims, axis=axis) / (\n      jnp.maximum(\n          jnp.sum(mask, keepdims=keepdims, axis=axis) * broadcast_factor, eps\n      )\n  )\n"
  },
  {
    "path": "src/alphafold3/model/confidence_types.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Confidence categories for predictions.\"\"\"\n\nimport dataclasses\nimport enum\nimport json\nfrom typing import Any, Self\n\nfrom absl import logging\nfrom alphafold3.model import model\nimport jax\nimport numpy as np\n\n\nclass StructureConfidenceFullEncoder(json.JSONEncoder):\n  \"\"\"JSON encoder for serializing confidence types.\"\"\"\n\n  def __init__(self, **kwargs):\n    super().__init__(**(kwargs | dict(separators=(',', ':'))))\n\n  def encode(self, o: 'StructureConfidenceFull'):\n    # Cast to np.float64 before rounding, since casting to Python float will\n    # cast to a 64 bit float, potentially undoing np.float32 rounding.\n    atom_plddts = np.round(\n        np.clip(np.asarray(o.atom_plddts, dtype=np.float64), 0.0, 99.99), 2\n    ).astype(float)\n    contact_probs = np.round(\n        np.clip(np.asarray(o.contact_probs, dtype=np.float64), 0.0, 1.0), 2\n    ).astype(float)\n    pae = np.round(\n        np.clip(np.asarray(o.pae, dtype=np.float64), 0.0, 99.9), 1\n    ).astype(float)\n    return \"\"\"\\\n{\n  \"atom_chain_ids\": %s,\n  \"atom_plddts\": %s,\n  \"contact_probs\": %s,\n  \"pae\": %s,\n  \"token_chain_ids\": %s,\n  \"token_res_ids\": %s\n}\"\"\" % (\n        super().encode(o.atom_chain_ids),\n        super().encode(list(atom_plddts)).replace('NaN', 'null'),\n        super().encode([list(x) for x in contact_probs]).replace('NaN', 'null'),\n        super().encode([list(x) for x in 
pae]).replace('NaN', 'null'),\n        super().encode(o.token_chain_ids),\n        super().encode(o.token_res_ids),\n    )\n\n\ndef _dump_json(data: Any, indent: int | None = None) -> str:\n  \"\"\"Dumps a json string with JSON compatible NaN representation.\"\"\"\n  json_str = json.dumps(\n      data,\n      sort_keys=True,\n      indent=indent,\n      separators=(',', ': '),\n  )\n  return json_str.replace('NaN', 'null')\n\n\n@enum.unique\nclass ConfidenceCategory(enum.Enum):\n  \"\"\"Confidence categories for AlphaFold predictions.\"\"\"\n\n  HIGH = 0\n  MEDIUM = 1\n  LOW = 2\n  DISORDERED = 3\n\n  @classmethod\n  def from_char(cls, char: str) -> Self:\n    match char:\n      case 'H':\n        return cls.HIGH\n      case 'M':\n        return cls.MEDIUM\n      case 'L':\n        return cls.LOW\n      case 'D':\n        return cls.DISORDERED\n      case _:\n        raise ValueError(\n            f'Unknown character. Expected one of H, M, L or D; got: {char}'\n        )\n\n  def to_char(self) -> str:\n    match self:\n      case self.HIGH:\n        return 'H'\n      case self.MEDIUM:\n        return 'M'\n      case self.LOW:\n        return 'L'\n      case self.DISORDERED:\n        return 'D'\n\n  @classmethod\n  def from_confidence_score(cls, confidence: float) -> Self:\n    if 90 <= confidence <= 100:\n      return cls.HIGH\n    if 70 <= confidence < 90:\n      return cls.MEDIUM\n    if 50 <= confidence < 70:\n      return cls.LOW\n    if 0 <= confidence < 50:\n      return cls.DISORDERED\n    raise ValueError(f'Confidence score out of range [0, 100]: {confidence}')\n\n\n@dataclasses.dataclass()\nclass AtomConfidence:\n  \"\"\"Dataclass for 1D per-atom confidences from AlphaFold.\"\"\"\n\n  chain_id: list[str]\n  atom_number: list[int]\n  confidence: list[float]\n  confidence_category: list[ConfidenceCategory]\n\n  def __post_init__(self):\n    num_res = len(self.atom_number)\n    if not all(\n        len(v) == num_res\n        for v in [self.chain_id, 
self.confidence, self.confidence_category]\n    ):\n      raise ValueError('All confidence fields must have the same length.')\n\n  @classmethod\n  def from_inference_result(\n      cls, inference_result: model.InferenceResult\n  ) -> Self:\n    \"\"\"Instantiates an AtomConfidence from a structure.\n\n    Args:\n      inference_result: Inference result from AlphaFold.\n\n    Returns:\n      Scores in AtomConfidence dataclass.\n    \"\"\"\n    struc = inference_result.predicted_structure\n    as_dict = {\n        'chain_id': [],\n        'atom_number': [],\n        'confidence': [],\n        'confidence_category': [],\n    }\n    for atom_number, atom in enumerate(struc.iter_atoms()):\n      this_confidence = float(struc.atom_b_factor[atom_number])\n      as_dict['chain_id'].append(atom['chain_id'])\n      as_dict['atom_number'].append(atom_number)\n      as_dict['confidence'].append(round(this_confidence, 2))\n      as_dict['confidence_category'].append(\n          ConfidenceCategory.from_confidence_score(this_confidence)\n      )\n    return cls(**as_dict)\n\n  @classmethod\n  def from_json(cls, json_string: str) -> Self:\n    \"\"\"Instantiates a AtomConfidence from a json string.\"\"\"\n    input_dict = json.loads(json_string)\n    input_dict['confidence_category'] = [\n        ConfidenceCategory.from_char(k)\n        for k in input_dict['confidence_category']\n    ]\n    return cls(**input_dict)\n\n  def to_json(self) -> str:\n    output = dataclasses.asdict(self)\n    output['confidence_category'] = [\n        k.to_char() for k in output['confidence_category']\n    ]\n    output['atom_number'] = [int(k) for k in output['atom_number']]\n    return _dump_json(output)\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass StructureConfidenceSummary:\n  \"\"\"Dataclass for the summary of structure scores from AlphaFold.\n\n  Attributes:\n   ptm: Predicted TM global score.\n   iptm: Interface predicted TM global score.\n   ranking_score: Ranking 
score extracted from CIF metadata.\n   fraction_disordered: Fraction disordered, measured with RASA.\n   has_clash: Has significant clashing.\n   chain_pair_pae_min: [num_chains, num_chains] Minimum cross chain PAE.\n   chain_pair_iptm: [num_chains, num_chains] Chain pair ipTM.\n   chain_ptm: [num_chains] Chain pTM.\n   chain_iptm: [num_chains] Mean cross chain ipTM for a chain.\n  \"\"\"\n\n  ptm: float\n  iptm: float\n  ranking_score: float\n  fraction_disordered: float\n  has_clash: float\n  chain_pair_pae_min: np.ndarray\n  chain_pair_iptm: np.ndarray\n  chain_ptm: np.ndarray\n  chain_iptm: np.ndarray\n\n  @classmethod\n  def from_inference_result(\n      cls, inference_result: model.InferenceResult\n  ) -> Self:\n    \"\"\"Returns a new instance based on a given inference result.\"\"\"\n    return cls(\n        ptm=float(inference_result.metadata['ptm']),\n        iptm=float(inference_result.metadata['iptm']),\n        ranking_score=float(inference_result.metadata['ranking_score']),\n        fraction_disordered=float(\n            inference_result.metadata['fraction_disordered']\n        ),\n        has_clash=float(inference_result.metadata['has_clash']),\n        chain_pair_pae_min=inference_result.metadata['chain_pair_pae_min'],\n        chain_pair_iptm=inference_result.metadata['chain_pair_iptm'],\n        chain_ptm=inference_result.metadata['iptm_ichain'],\n        chain_iptm=inference_result.metadata['iptm_xchain'],\n    )\n\n  @classmethod\n  def from_json(cls, json_string: str) -> Self:\n    \"\"\"Returns a new instance from a given json string.\"\"\"\n    return cls(**json.loads(json_string))\n\n  def to_json(self) -> str:\n    def convert(data):\n      if isinstance(data, np.ndarray):\n        # Cast to np.float64 before rounding, since casting to Python float will\n        # cast to a 64 bit float, potentially undoing np.float32 rounding.\n        rounded_data = np.round(data.astype(np.float64), decimals=2).tolist()\n      else:\n        rounded_data 
= np.round(data, decimals=2)\n      return rounded_data\n\n    return _dump_json(jax.tree.map(convert, dataclasses.asdict(self)), indent=1)\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass StructureConfidenceFull:\n  \"\"\"Dataclass for full structure data from AlphaFold.\"\"\"\n\n  pae: np.ndarray\n  token_chain_ids: list[str]\n  token_res_ids: list[int]\n  atom_plddts: list[float]\n  atom_chain_ids: list[str]\n  contact_probs: np.ndarray  # [num_tokens, num_tokens]\n\n  @classmethod\n  def from_inference_result(\n      cls, inference_result: model.InferenceResult\n  ) -> Self:\n    \"\"\"Returns a new instance based on a given inference result.\"\"\"\n\n    pae = inference_result.numerical_data['full_pae']\n    if not isinstance(pae, np.ndarray):\n      logging.info('%s', type(pae))\n      raise TypeError('pae should be a numpy array.')\n\n    contact_probs = inference_result.numerical_data['contact_probs']\n    if not isinstance(contact_probs, np.ndarray):\n      logging.info('%s', type(contact_probs))\n      raise TypeError('contact_probs should be a numpy array.')\n\n    struc = inference_result.predicted_structure\n    chain_ids = struc.chain_id.tolist()\n    atom_plddts = struc.atom_b_factor.tolist()\n    token_chain_ids = [\n        str(token_id)\n        for token_id in inference_result.metadata['token_chain_ids']\n    ]\n    token_res_ids = [\n        int(token_id) for token_id in inference_result.metadata['token_res_ids']\n    ]\n    return cls(\n        pae=pae,\n        token_chain_ids=token_chain_ids,\n        token_res_ids=token_res_ids,\n        atom_plddts=atom_plddts,\n        atom_chain_ids=chain_ids,\n        contact_probs=contact_probs,\n    )\n\n  @classmethod\n  def from_json(cls, json_string: str) -> Self:\n    \"\"\"Returns a new instance from a given json string.\"\"\"\n    return cls(**json.loads(json_string))\n\n  def to_json(self) -> str:\n    \"\"\"Converts StructureConfidenceFull to json string.\"\"\"\n    
return json.dumps(self, cls=StructureConfidenceFullEncoder)\n"
  },
  {
    "path": "src/alphafold3/model/confidences.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Functions for extracting and processing confidences from model outputs.\"\"\"\nimport warnings\n\nfrom absl import logging\nfrom alphafold3 import structure\nfrom alphafold3.constants import residue_names\nfrom alphafold3.cpp import mkdssp\nimport jax.numpy as jnp\nimport numpy as np\nfrom scipy import spatial\n\n\n# From Sander & Rost 1994 https://doi.org/10.1002/prot.340200303\nMAX_ACCESSIBLE_SURFACE_AREA = {\n    'ALA': 106.0,\n    'ARG': 248.0,\n    'ASN': 157.0,\n    'ASP': 163.0,\n    'CYS': 135.0,\n    'GLN': 198.0,\n    'GLU': 194.0,\n    'GLY': 84.0,\n    'HIS': 184.0,\n    'ILE': 169.0,\n    'LEU': 164.0,\n    'LYS': 205.0,\n    'MET': 188.0,\n    'PHE': 197.0,\n    'PRO': 136.0,\n    'SER': 130.0,\n    'THR': 142.0,\n    'TRP': 227.0,\n    'TYR': 222.0,\n    'VAL': 142.0,\n}\n\n# Weights for ranking confidence.\n_IPTM_WEIGHT = 0.8\n_FRACTION_DISORDERED_WEIGHT = 0.5\n_CLASH_PENALIZATION_WEIGHT = 100.0\n\n\ndef windowed_solvent_accessible_area(cif: str, window: int = 25) -> np.ndarray:\n  \"\"\"Implementation of AlphaFold-RSA.\n\n  AlphaFold-RSA defined in https://www.ncbi.nlm.nih.gov/pmc/articles/PMC9601767.\n\n  Args:\n    cif: Raw cif string.\n    window: The window over which to average accessible surface area\n\n  Returns:\n    An array of size num_res that predicts disorder by using windowed solvent\n    accessible surface area.\n  \"\"\"\n  result = mkdssp.get_dssp(cif, 
calculate_surface_accessibility=True)\n  parse_row = False\n  rasa = []\n  for row in result.splitlines():\n    if parse_row:\n      aa = row[13:14]\n      if aa == '!':\n        continue\n      aa3 = residue_names.PROTEIN_COMMON_ONE_TO_THREE.get(aa, 'ALA')\n      max_acc = MAX_ACCESSIBLE_SURFACE_AREA[aa3]\n      acc = int(row[34:38])\n      norm_acc = acc / max_acc\n      if norm_acc > 1.0:\n        norm_acc = 1.0\n      rasa.append(norm_acc)\n    if row.startswith('  #  RESIDUE'):\n      parse_row = True\n\n  half_w = (window - 1) // 2\n  pad_rasa = np.pad(rasa, (half_w, half_w), 'reflect')\n  rasa = np.convolve(pad_rasa, np.ones(window), 'valid') / window\n  return rasa\n\n\ndef fraction_disordered(\n    struc: structure.Structure, rasa_disorder_cutoff: float = 0.581\n) -> float:\n  \"\"\"Compute fraction of protein residues that are disordered.\n\n  Args:\n    struc: A structure to compute rASA metrics on.\n    rasa_disorder_cutoff: The threshold at which residues are considered\n      disordered. 
Default value taken from\n      https://www.ncbi.nlm.nih.gov/pmc/articles/PMC9601767.\n\n  Returns:\n    The fraction of protein residues that are disordered\n    (rasa > rasa_disorder_cutoff).\n  \"\"\"\n  struc = struc.filter_to_entity_type(protein=True)\n  rasa = []\n  seq_rasa = {}\n  for chain_id, chain_seq in struc.chain_single_letter_sequence().items():\n    if chain_seq in seq_rasa:\n      # We assume that identical sequences have approximately similar rasa\n      # values to speed up the computation.\n      rasa.extend(seq_rasa[chain_seq])\n      continue\n    chain_struc = struc.filter(chain_id=chain_id)\n    # Rename the chain to 'A' as MKDSSP supports only single letter chain IDs.\n    chain_struc = chain_struc.rename_chain_ids(new_id_by_old_id={chain_id: 'A'})\n    try:\n      rasa_per_residue = windowed_solvent_accessible_area(\n          chain_struc.to_mmcif()\n      )\n      seq_rasa[chain_seq] = rasa_per_residue\n      rasa.extend(rasa_per_residue)\n    except (ValueError, RuntimeError) as e:\n      logging.warning('%s: rasa calculation failed: %s', struc.name, e)\n\n  if not rasa:\n    return 0.0\n  return np.mean(np.array(rasa) > rasa_disorder_cutoff)\n\n\ndef has_clash(\n    struc: structure.Structure,\n    cutoff_radius: float = 1.1,\n    min_clashes_for_overlap: int = 100,\n    min_fraction_for_overlap: float = 0.5,\n) -> bool:\n  \"\"\"Determine whether the structure has at least one clashing chain.\n\n  A clashing chain is defined as having greater than 100 polymer atoms within\n  1.1A of another polymer atom, or having more than 50% of the chain with\n  clashing atoms.\n\n  Args:\n    struc: A structure to get clash metrics for.\n    cutoff_radius: atom distances under this threshold are considered a clash.\n    min_clashes_for_overlap: The minimum number of atom-atom clashes for a chain\n      to be considered overlapping.\n    min_fraction_for_overlap: The minimum fraction of atoms within a chain that\n      are clashing for the chain to 
be considered overlapping.\n\n  Returns:\n    True if the structure has at least one clashing chain.\n  \"\"\"\n  struc = struc.filter_to_entity_type(protein=True, rna=True, dna=True)\n  if not struc.chains:\n    return False\n  coords = struc.coords\n  coord_kdtree = spatial.cKDTree(coords)\n  clashes_per_atom = coord_kdtree.query_ball_point(\n      coords, p=2.0, r=cutoff_radius\n  )\n  per_atom_has_clash = np.zeros(len(coords), dtype=np.int32)\n  for atom_idx, clashing_indices in enumerate(clashes_per_atom):\n    for clashing_idx in clashing_indices:\n      if np.abs(struc.res_id[atom_idx] - struc.res_id[clashing_idx]) > 1 or (\n          struc.chain_id[atom_idx] != struc.chain_id[clashing_idx]\n      ):\n        per_atom_has_clash[atom_idx] = True\n        break\n  for chain_id in struc.chains:\n    mask = struc.chain_id == chain_id\n    num_atoms = np.sum(mask)\n    if num_atoms == 0:\n      continue\n    num_clashes = np.sum(per_atom_has_clash * mask)\n    frac_clashes = num_clashes / num_atoms\n    if (\n        num_clashes > min_clashes_for_overlap\n        or frac_clashes > min_fraction_for_overlap\n    ):\n      return True\n  return False\n\n\ndef get_ranking_score(\n    ptm: float, iptm: float, fraction_disordered_: float, has_clash_: bool\n) -> float:\n  # ipTM is NaN for single chain structures. 
Use pTM for such cases.\n  if np.isnan(iptm):\n    ptm_iptm_average = ptm\n  else:\n    ptm_iptm_average = _IPTM_WEIGHT * iptm + (1.0 - _IPTM_WEIGHT) * ptm\n  return (\n      ptm_iptm_average\n      + _FRACTION_DISORDERED_WEIGHT * fraction_disordered_\n      - _CLASH_PENALIZATION_WEIGHT * has_clash_\n  )\n\n\ndef rank_metric(\n    full_pde: jnp.ndarray | np.ndarray, contact_probs: jnp.ndarray | np.ndarray\n) -> jnp.ndarray | np.ndarray:\n  \"\"\"Compute the metric that will be used to rank predictions, higher is better.\n\n  Args:\n    full_pde: A [num_samples, num_tokens,num_tokens] matrix of predicted\n      distance errors between pairs of tokens.\n    contact_probs: A [num_tokens, num_tokens] matrix consisting of the\n      probability of contact (<8A) that is returned from the distogram head.\n\n  Returns:\n    A scalar that can be used to rank (higher is better).\n  \"\"\"\n  if not isinstance(full_pde, type(contact_probs)):\n    raise ValueError('full_pde and contact_probs must be of the same type.')\n\n  if isinstance(full_pde, np.ndarray):\n    sum_fn = np.sum\n  elif isinstance(full_pde, jnp.ndarray):\n    sum_fn = jnp.sum\n  else:\n    raise ValueError('full_pde must be a numpy array or a jax array.')\n  # It was found that taking the contact_map weighted average was better than\n  # just the predicted distance error on its own.\n  return -sum_fn(full_pde * contact_probs[None, :, :], axis=(-2, -1)) / (\n      sum_fn(contact_probs) + 1e-6\n  )\n\n\ndef weighted_mean(mask, value, axis):\n  return np.mean(mask * value, axis=axis) / (1e-8 + np.mean(mask, axis=axis))\n\n\ndef pde_single(\n    num_tokens: int,\n    asym_ids: np.ndarray,\n    full_pde: np.ndarray,\n    contact_probs: np.ndarray,\n) -> tuple[np.ndarray, np.ndarray, np.ndarray]:\n  \"\"\"Compute 1D PDE summaries.\n\n  Args:\n    num_tokens: The number of tokens (not including padding).\n    asym_ids: The asym_ids (array of shape num_tokens).\n    full_pde: A [num_samples, num_tokens, num_tokens] 
matrix of predicted\n      distance errors.\n    contact_probs: A [num_tokens, num_tokens] matrix consisting of the\n      probability of contact (<8A) that is returned from the distogram head.\n\n  Returns:\n    A tuple (ichain, xchain, full_chain) where:\n      `ichain` is a [num_samples, num_chains] matrix where the\n      value assigned to each chain is an average of the full PDE matrix over all\n      its within-chain interactions, weighted by `contact_probs`.\n      `xchain` is a [num_samples, num_chains] matrix where the\n      value assigned to each chain is an average of the full PDE matrix over all\n      its cross-chain interactions, weighted by `contact_probs`.\n      `full_chain` is a [num_samples, num_tokens] matrix where the\n      value assigned to each token is an average of it PDE against all tokens,\n      weighted by `contact_probs`.\n  \"\"\"\n\n  full_pde = full_pde[:, :num_tokens, :num_tokens]\n  contact_probs = contact_probs[:num_tokens, :num_tokens]\n  asym_ids = asym_ids[:num_tokens]\n  unique_asym_ids = np.unique(asym_ids)\n  num_chains = len(unique_asym_ids)\n  num_samples = full_pde.shape[0]\n\n  asym_ids = asym_ids[None]\n  contact_probs = contact_probs[None]\n\n  ichain = np.zeros((num_samples, num_chains))\n  xchain = np.zeros((num_samples, num_chains))\n\n  for idx, asym_id in enumerate(unique_asym_ids):\n    my_asym_id = asym_ids == asym_id\n    imask = my_asym_id[:, :, None] * my_asym_id[:, None, :]\n    xmask = my_asym_id[:, :, None] * ~my_asym_id[:, None, :]\n    imask = imask * contact_probs\n    xmask = xmask * contact_probs\n    ichain[:, idx] = weighted_mean(mask=imask, value=full_pde, axis=(-2, -1))\n    xchain[:, idx] = weighted_mean(mask=xmask, value=full_pde, axis=(-2, -1))\n\n  full_chain = weighted_mean(mask=contact_probs, value=full_pde, axis=(-1,))\n\n  return ichain, xchain, full_chain\n\n\ndef chain_pair_pde(\n    num_tokens: int, asym_ids: np.ndarray, full_pde: np.ndarray\n) -> tuple[np.ndarray, np.ndarray]:\n  
\"\"\"Compute predicted distance errors for all pairs of chains.\n\n  Args:\n    num_tokens: The number of tokens (not including padding).\n    asym_ids: The asym_ids (array of shape num_tokens).\n    full_pde: A [num_samples, num_tokens, num_tokens] matrix of predicted\n      distance errors.\n\n  Returns:\n    chain_pair_pred_err_mean - a [num_chains, num_chains] matrix with average\n      per chain-pair predicted distance error.\n    chain_pair_pred_err_min - a [num_chains, num_chains] matrix with min\n      per chain-pair predicted distance error.\n  \"\"\"\n  full_pde = full_pde[:, :num_tokens, :num_tokens]\n  asym_ids = asym_ids[:num_tokens]\n  unique_asym_ids = np.unique(asym_ids)\n  num_chains = len(unique_asym_ids)\n  num_samples = full_pde.shape[0]\n  chain_pair_pred_err_mean = np.zeros((num_samples, num_chains, num_chains))\n  chain_pair_pred_err_min = np.zeros((num_samples, num_chains, num_chains))\n\n  for idx1, asym_id_1 in enumerate(unique_asym_ids):\n    subset = full_pde[:, asym_ids == asym_id_1, :]\n    for idx2, asym_id_2 in enumerate(unique_asym_ids):\n      subsubset = subset[:, :, asym_ids == asym_id_2]\n      chain_pair_pred_err_mean[:, idx1, idx2] = np.mean(subsubset, axis=(1, 2))\n      chain_pair_pred_err_min[:, idx1, idx2] = np.min(subsubset, axis=(1, 2))\n  return chain_pair_pred_err_mean, chain_pair_pred_err_min\n\n\ndef weighted_nanmean(\n    value: np.ndarray, mask: np.ndarray, axis: int\n) -> np.ndarray:\n  \"\"\"Nan-mean with weighting -- empty slices return NaN.\"\"\"\n  assert mask.shape == value.shape\n  assert not np.isnan(mask).all()\n\n  nan_idxs = np.where(np.isnan(value))\n  # Need to NaN the mask to get the correct denominator weighting.\n  mask_with_nan = mask.copy()\n  mask_with_nan[nan_idxs] = np.nan\n  with warnings.catch_warnings():\n    # Mean of empty slice is ok and should return a NaN.\n    warnings.filterwarnings(action='ignore', message='Mean of empty slice')\n    warnings.filterwarnings(\n        
action='ignore', message='invalid value encountered in (scalar )?divide'\n    )\n    return np.nanmean(value * mask_with_nan, axis=axis) / np.nanmean(\n        mask_with_nan, axis=axis\n    )\n\n\ndef chain_pair_pae(\n    *,\n    num_tokens: int,\n    asym_ids: np.ndarray,\n    full_pae: np.ndarray,\n    mask: np.ndarray | None = None,\n    contact_probs: np.ndarray | None = None,\n) -> tuple[np.ndarray, np.ndarray, np.ndarray]:\n  \"\"\"Compute predicted errors for all pairs of chains.\n\n  Args:\n    num_tokens: The number of tokens (not including padding).\n    asym_ids: The asym_ids (array of shape num_tokens).\n    full_pae: A [num_samples, num_tokens, num_tokens] matrix of predicted\n      errors.\n    mask: A [num_tokens, num_tokens] mask matrix.\n    contact_probs: A [num_tokens, num_tokens] matrix consisting of the\n      probability of contact (<8A) that is returned from the distogram head.\n\n  Returns:\n    chain_pair_pred_err_mean - a [num_chains, num_chains] matrix with average\n      per chain-pair predicted error.\n  \"\"\"\n  if mask is None:\n    mask = np.ones(shape=full_pae.shape[1:], dtype=bool)\n  if contact_probs is None:\n    contact_probs = np.ones(shape=full_pae.shape[1:], dtype=float)\n  assert mask.shape == full_pae.shape[1:]\n\n  full_pae = full_pae[:, :num_tokens, :num_tokens]\n  mask = mask[:num_tokens, :num_tokens]\n  asym_ids = asym_ids[:num_tokens]\n  contact_probs = contact_probs[:num_tokens, :num_tokens]\n  unique_asym_ids = np.unique(asym_ids)\n  num_chains = len(unique_asym_ids)\n  num_samples = full_pae.shape[0]\n  chain_pair_pred_err_mean = np.zeros((num_samples, num_chains, num_chains))\n  chain_pair_pred_err_min = np.zeros((num_samples, num_chains, num_chains))\n\n  for idx1, asym_id_1 in enumerate(unique_asym_ids):\n    subset = full_pae[:, asym_ids == asym_id_1, :]\n    subset_mask = mask[asym_ids == asym_id_1, :]\n    subset_contact_probs = contact_probs[asym_ids == asym_id_1, :]\n    for idx2, asym_id_2 in 
enumerate(unique_asym_ids):\n      subsubset = subset[:, :, asym_ids == asym_id_2]\n      subsubset_mask = subset_mask[:, asym_ids == asym_id_2]\n      subsubset_contact_probs = subset_contact_probs[:, asym_ids == asym_id_2]\n      (flat_mask_idxs,) = np.where(subsubset_mask.flatten() > 0)\n      flat_subsubset = subsubset.reshape([num_samples, -1])\n      flat_contact_probs = subsubset_contact_probs.flatten()\n      # A ligand chain will have no valid frames if it contains fewer than\n      # three non-colinear atoms (e.g. a sodium ion).\n      if not flat_mask_idxs.size:\n        chain_pair_pred_err_mean[:, idx1, idx2] = np.nan\n        chain_pair_pred_err_min[:, idx1, idx2] = np.nan\n      else:\n        chain_pair_pred_err_min[:, idx1, idx2] = np.min(\n            flat_subsubset[:, flat_mask_idxs], axis=1\n        )\n        chain_pair_pred_err_mean[:, idx1, idx2] = weighted_mean(\n            mask=flat_contact_probs[flat_mask_idxs],\n            value=flat_subsubset[:, flat_mask_idxs],\n            axis=-1,\n        )\n  return chain_pair_pred_err_mean, chain_pair_pred_err_min, unique_asym_ids\n\n\ndef reduce_chain_pair(\n    *,\n    chain_pair_met: np.ndarray,\n    num_chain_tokens: np.ndarray,\n    agg_over_col: bool,\n    agg_type: str,\n    weight_method: str,\n) -> tuple[np.ndarray, np.ndarray]:\n  \"\"\"Compute 1D summaries from a chain-pair summary.\n\n  Args:\n    chain_pair_met: A [num_samples, num_chains, num_chains] aggregate matrix.\n    num_chain_tokens: A [num_chains] array of number of tokens for each chain.\n      Used for 'per_token' weighting.\n    agg_over_col: Whether to aggregate the PAE over rows (i.e. average error\n      when aligned to me) or columns (i.e. 
my average error when aligned to all\n      others.)\n    agg_type: The type of aggregation to use, 'mean' or 'min'.\n    weight_method: The method to use for weighting the PAE, 'per_token' or\n      'per_chain'.\n\n  Returns:\n    A tuple (ichain, xchain) where:\n      `ichain` is a [num_samples, num_chains] matrix where the\n      value assigned to each chain is an average of the full PAE matrix over all\n      its within-chain interactions, weighted by `contact_probs`.\n      `xchain` is a [num_samples, num_chains] matrix where the\n      value assigned to each chain is an average of the full PAE matrix over all\n      its cross-chain interactions, weighted by `contact_probs`.\n  \"\"\"\n  num_samples, num_chains, _ = chain_pair_met.shape\n\n  ichain = chain_pair_met.diagonal(axis1=-2, axis2=-1)\n\n  if weight_method == 'per_chain':\n    chain_weight = np.ones((num_chains,), dtype=float)\n  elif weight_method == 'per_token':\n    chain_weight = num_chain_tokens\n  else:\n    raise ValueError(f'Unknown weight method: {weight_method}')\n\n  if agg_over_col:\n    agg_axis = -1\n  else:\n    agg_axis = -2\n\n  if agg_type == 'mean':\n    weight = np.ones((num_samples, num_chains, num_chains), dtype=float)\n    weight -= np.eye(num_chains, dtype=float)\n    weight *= chain_weight[None] * chain_weight[:, None]\n    xchain = weighted_nanmean(chain_pair_met, mask=weight, axis=agg_axis)\n  elif agg_type == 'min':\n    is_self = np.eye(num_chains)\n    with warnings.catch_warnings():\n      # Min over empty slice is ok and should return a NaN.\n      warnings.filterwarnings('ignore', message='All-NaN slice encountered')\n      xchain = np.nanmin(chain_pair_met + 1e8 * is_self, axis=agg_axis)\n  else:\n    raise ValueError(f'Unknown aggregation method: {agg_type}')\n\n  return ichain, xchain\n\n\ndef pae_metrics(\n    num_tokens: int,\n    asym_ids: np.ndarray,\n    full_pae: np.ndarray,\n    mask: np.ndarray,\n    contact_probs: np.ndarray,\n    tm_adjusted_pae: 
np.ndarray,\n):\n  \"\"\"PAE aggregate metrics.\"\"\"\n  assert mask.shape == full_pae.shape[1:]\n  assert contact_probs.shape == full_pae.shape[1:]\n\n  chain_pair_contact_weighted, _, unique_asym_ids = chain_pair_pae(\n      num_tokens=num_tokens,\n      asym_ids=asym_ids,\n      full_pae=full_pae,\n      mask=mask,\n      contact_probs=contact_probs,\n  )\n\n  ret = {}\n  ret['chain_pair_pae_mean'], ret['chain_pair_pae_min'], _ = chain_pair_pae(\n      num_tokens=num_tokens,\n      asym_ids=asym_ids,\n      full_pae=full_pae,\n      mask=mask,\n  )\n  chain_pair_iptm = np.stack(\n      [\n          chain_pairwise_predicted_tm_scores(\n              tm_adjusted_pae=sample_tm_adjusted_pae[:num_tokens],\n              asym_id=asym_ids[:num_tokens],\n              pair_mask=mask[:num_tokens, :num_tokens],\n          )\n          for sample_tm_adjusted_pae in tm_adjusted_pae\n      ],\n      axis=0,\n  )\n\n  num_chain_tokens = np.array(\n      [sum(asym_ids == asym_id) for asym_id in unique_asym_ids]\n  )\n\n  def reduce_chain_pair_fn(chain_pair: np.ndarray):\n    def inner(agg_over_col):\n      ichain_pae, xchain_pae = reduce_chain_pair(\n          num_chain_tokens=num_chain_tokens,\n          chain_pair_met=chain_pair,\n          agg_over_col=agg_over_col,\n          agg_type='mean',\n          weight_method='per_chain',\n      )\n      return ichain_pae, xchain_pae\n\n    ichain, xchain_row_agg = inner(False)\n    _, xchain_col_agg = inner(True)\n    with warnings.catch_warnings():\n      # Mean of empty slice is ok and should return a NaN.\n      warnings.filterwarnings(action='ignore', message='Mean of empty slice')\n      xchain = np.nanmean(\n          np.stack([xchain_row_agg, xchain_col_agg], axis=0), axis=0\n      )\n    return ichain, xchain\n\n  pae_ichain, pae_xchain = reduce_chain_pair_fn(chain_pair_contact_weighted)\n  iptm_ichain, iptm_xchain = reduce_chain_pair_fn(chain_pair_iptm)\n\n  ret.update({\n      'chain_pair_iptm': chain_pair_iptm,\n      
'iptm_ichain': iptm_ichain,\n      'iptm_xchain': iptm_xchain,\n      'pae_ichain': pae_ichain,\n      'pae_xchain': pae_xchain,\n  })\n\n  return ret\n\n\ndef get_iptm_xchain(chain_pair_iptm: np.ndarray) -> np.ndarray:\n  \"\"\"Cross chain aggregate ipTM.\"\"\"\n  num_samples, num_chains, _ = chain_pair_iptm.shape\n  weight = np.ones((num_samples, num_chains, num_chains), dtype=float)\n  weight -= np.eye(num_chains, dtype=float)\n  xchain_row_agg = weighted_nanmean(chain_pair_iptm, mask=weight, axis=-2)\n  xchain_col_agg = weighted_nanmean(chain_pair_iptm, mask=weight, axis=-1)\n  with warnings.catch_warnings():\n    # Mean of empty slice is ok and should return a NaN.\n    warnings.filterwarnings(action='ignore', message='Mean of empty slice')\n    iptm_xchain = np.nanmean(\n        np.stack([xchain_row_agg, xchain_col_agg], axis=0), axis=0\n    )\n  return iptm_xchain\n\n\ndef predicted_tm_score(\n    tm_adjusted_pae: np.ndarray,\n    pair_mask: np.ndarray,\n    asym_id: np.ndarray,\n    interface: bool = False,\n) -> float:\n  \"\"\"Computes predicted TM alignment or predicted interface TM alignment score.\n\n  Args:\n    tm_adjusted_pae: [num_res, num_res] Relevant tensor for computing TMScore\n      values.\n    pair_mask: A [num_res, num_res] mask. The TM score will only aggregate over\n      masked-on entries.\n    asym_id: [num_res] asymmetric unit ID (the chain ID). Only needed for ipTM\n      calculation, i.e. when interface=True.\n    interface: If True, the interface predicted TM score is computed. 
If False,\n      the predicted TM score without any residue pair restrictions is computed.\n\n  Returns:\n   score: pTM or ipTM score.\n  \"\"\"\n  num_tokens, _ = tm_adjusted_pae.shape\n  if tm_adjusted_pae.shape != (num_tokens, num_tokens):\n    raise ValueError(\n        f'Bad tm_adjusted_pae shape, expected ({num_tokens, num_tokens}), got '\n        f'{tm_adjusted_pae.shape}.'\n    )\n\n  if pair_mask.shape != (num_tokens, num_tokens):\n    raise ValueError(\n        f'Bad pair_mask shape, expected ({num_tokens, num_tokens}), got '\n        f'{pair_mask.shape}.'\n    )\n  if pair_mask.dtype != bool:\n    raise TypeError(f'Bad pair mask type, expected bool, got {pair_mask.dtype}')\n  if asym_id.shape[0] != num_tokens:\n    raise ValueError(\n        f'Bad asym_id shape, expected ({num_tokens},), got {asym_id.shape}.'\n    )\n\n  # Create pair mask.\n  if interface:\n    pair_mask = pair_mask * (asym_id[:, None] != asym_id[None, :])\n\n  # Ions and other ligands with colinear atoms have ill-defined frames.\n  if pair_mask.sum() == 0:\n    return np.nan\n\n  normed_residue_mask = pair_mask / (\n      1e-8 + np.sum(pair_mask, axis=-1, keepdims=True)\n  )\n  per_alignment = np.sum(tm_adjusted_pae * normed_residue_mask, axis=-1)\n  return per_alignment.max()\n\n\ndef chain_pairwise_predicted_tm_scores(\n    tm_adjusted_pae: np.ndarray,\n    pair_mask: np.ndarray,\n    asym_id: np.ndarray,\n) -> np.ndarray:\n  \"\"\"Compute predicted TM (pTM) between each pair of chains independently.\n\n  Args:\n    tm_adjusted_pae: [num_res, num_res] Relevant tensor for computing TMScore\n      values.\n    pair_mask: A [num_res, num_res] mask specifying which frames are valid.\n      Invalid frames can be the result of chains with not enough atoms (e.g.\n      ions).\n    asym_id: [num_res] asymmetric unit ID (the chain ID).\n\n  Returns:\n    A [num_chains, num_chains] matrix, where row i, column j indicates the\n    predicted TM-score for the interface between chain i and chain 
j.\n  \"\"\"\n  unique_chains = list(np.unique(asym_id))\n  num_chains = len(unique_chains)\n  all_pairs_iptms = np.zeros((num_chains, num_chains))\n  for i, chain_i in enumerate(unique_chains):\n    chain_i_mask = asym_id == chain_i\n    for j, chain_j in enumerate(unique_chains[i:]):\n      chain_j_mask = asym_id == chain_j\n      mask = chain_i_mask | chain_j_mask\n      (indices,) = np.where(mask)\n      is_interface = chain_i != chain_j\n      indices = np.ix_(indices, indices)\n      iptm = predicted_tm_score(\n          tm_adjusted_pae=tm_adjusted_pae[indices],\n          pair_mask=pair_mask[indices],\n          asym_id=asym_id[mask],\n          interface=is_interface,\n      )\n      all_pairs_iptms[i, i + j] = iptm\n      all_pairs_iptms[i + j, i] = iptm\n  return all_pairs_iptms\n"
  },
  {
    "path": "src/alphafold3/model/data3.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Protein features that are computed from parsed mmCIF objects.\"\"\"\n\nfrom collections.abc import Mapping\nimport datetime\nfrom typing import TypeAlias\n\nfrom alphafold3.constants import residue_names\nfrom alphafold3.cpp import msa_profile\nfrom alphafold3.model import protein_data_processing\nimport numpy as np\n\n\nFeatureDict: TypeAlias = Mapping[str, np.ndarray]\n\n\ndef get_profile_features(\n    msa: np.ndarray, deletion_matrix: np.ndarray\n) -> FeatureDict:\n  \"\"\"Returns the MSA profile and deletion_mean features.\"\"\"\n  num_restypes = residue_names.POLYMER_TYPES_NUM_WITH_UNKNOWN_AND_GAP\n  profile = msa_profile.compute_msa_profile(\n      msa=msa, num_residue_types=num_restypes\n  )\n\n  return {\n      'profile': profile.astype(np.float32),\n      'deletion_mean': np.mean(deletion_matrix, axis=0),\n  }\n\n\ndef fix_template_features(\n    template_features: FeatureDict, num_res: int\n) -> FeatureDict:\n  \"\"\"Convert template features to AlphaFold 3 format.\n\n  Args:\n    template_features: Template features for the protein.\n    num_res: The length of the amino acid sequence of the protein.\n\n  Returns:\n    Updated template_features for the chain.\n  \"\"\"\n  if not template_features['template_aatype'].shape[0]:\n    template_features = empty_template_features(num_res)\n  else:\n    template_release_timestamp = [\n        _get_timestamp(x.decode('utf-8'))\n        for x in 
template_features['template_release_date']\n    ]\n\n    # Convert from atom37 to dense atom\n    dense_atom_indices = np.take(\n        protein_data_processing.PROTEIN_AATYPE_DENSE_ATOM_TO_ATOM37,\n        template_features['template_aatype'],\n        axis=0,\n    )\n\n    atom_mask = np.take_along_axis(\n        template_features['template_all_atom_masks'], dense_atom_indices, axis=2\n    )\n    atom_positions = np.take_along_axis(\n        template_features['template_all_atom_positions'],\n        dense_atom_indices[..., None],\n        axis=2,\n    )\n    atom_positions *= atom_mask[..., None]\n\n    template_features = {\n        'template_aatype': template_features['template_aatype'],\n        'template_atom_mask': atom_mask.astype(np.int32),\n        'template_atom_positions': atom_positions.astype(np.float32),\n        'template_domain_names': np.array(\n            template_features['template_domain_names'], dtype=object\n        ),\n        'template_release_timestamp': np.array(\n            template_release_timestamp, dtype=np.float32\n        ),\n    }\n  return template_features\n\n\ndef empty_template_features(num_res: int) -> FeatureDict:\n  \"\"\"Creates a fully masked out template features to allow padding to work.\n\n  Args:\n    num_res: The length of the target chain.\n\n  Returns:\n    Empty template features for the chain.\n  \"\"\"\n  template_features = {\n      'template_aatype': np.zeros(num_res, dtype=np.int32)[None, ...],\n      'template_atom_mask': np.zeros(\n          (num_res, protein_data_processing.NUM_DENSE), dtype=np.int32\n      )[None, ...],\n      'template_atom_positions': np.zeros(\n          (num_res, protein_data_processing.NUM_DENSE, 3), dtype=np.float32\n      )[None, ...],\n      'template_domain_names': np.array([b''], dtype=object),\n      'template_release_timestamp': np.array([0.0], dtype=np.float32),\n  }\n  return template_features\n\n\ndef _get_timestamp(date_str: str):\n  dt = 
datetime.datetime.fromisoformat(date_str)\n  dt = dt.replace(tzinfo=datetime.timezone.utc)\n  return dt.timestamp()\n"
  },
  {
    "path": "src/alphafold3/model/data_constants.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Constants shared across modules in the AlphaFold data pipeline.\"\"\"\n\nfrom alphafold3.constants import residue_names\n\nMSA_GAP_IDX = residue_names.PROTEIN_TYPES_ONE_LETTER_WITH_UNKNOWN_AND_GAP.index(\n    '-'\n)\n\n# Feature groups.\nNUM_SEQ_NUM_RES_MSA_FEATURES = ('msa', 'msa_mask', 'deletion_matrix')\nNUM_SEQ_MSA_FEATURES = ('msa_species_identifiers',)\nTEMPLATE_FEATURES = (\n    'template_aatype',\n    'template_atom_positions',\n    'template_atom_mask',\n)\nMSA_PAD_VALUES = {'msa': MSA_GAP_IDX, 'msa_mask': 1, 'deletion_matrix': 0}\n"
  },
  {
    "path": "src/alphafold3/model/feat_batch.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Batch dataclass.\"\"\"\nimport dataclasses\nfrom typing import Self\n\nfrom alphafold3.model import features\nimport jax\n\n\n@dataclasses.dataclass(frozen=True)\nclass Batch:\n  \"\"\"Dataclass containing batch.\"\"\"\n\n  msa: features.MSA\n  templates: features.Templates\n  token_features: features.TokenFeatures\n  ref_structure: features.RefStructure\n  predicted_structure_info: features.PredictedStructureInfo\n  polymer_ligand_bond_info: features.PolymerLigandBondInfo\n  ligand_ligand_bond_info: features.LigandLigandBondInfo\n  pseudo_beta_info: features.PseudoBetaInfo\n  atom_cross_att: features.AtomCrossAtt\n  convert_model_output: features.ConvertModelOutput\n  frames: features.Frames\n\n  @property\n  def num_res(self) -> int:\n    return self.token_features.aatype.shape[-1]\n\n  @classmethod\n  def from_data_dict(cls, batch: features.BatchDict) -> Self:\n    \"\"\"Construct batch object from dictionary.\"\"\"\n    return cls(\n        msa=features.MSA.from_data_dict(batch),\n        templates=features.Templates.from_data_dict(batch),\n        token_features=features.TokenFeatures.from_data_dict(batch),\n        ref_structure=features.RefStructure.from_data_dict(batch),\n        predicted_structure_info=features.PredictedStructureInfo.from_data_dict(\n            batch\n        ),\n        polymer_ligand_bond_info=features.PolymerLigandBondInfo.from_data_dict(\n            batch\n        ),\n        
ligand_ligand_bond_info=features.LigandLigandBondInfo.from_data_dict(\n            batch\n        ),\n        pseudo_beta_info=features.PseudoBetaInfo.from_data_dict(batch),\n        atom_cross_att=features.AtomCrossAtt.from_data_dict(batch),\n        convert_model_output=features.ConvertModelOutput.from_data_dict(batch),\n        frames=features.Frames.from_data_dict(batch),\n    )\n\n  def as_data_dict(self) -> features.BatchDict:\n    \"\"\"Converts batch object to dictionary.\"\"\"\n    output = {\n        **self.msa.as_data_dict(),\n        **self.templates.as_data_dict(),\n        **self.token_features.as_data_dict(),\n        **self.ref_structure.as_data_dict(),\n        **self.predicted_structure_info.as_data_dict(),\n        **self.polymer_ligand_bond_info.as_data_dict(),\n        **self.ligand_ligand_bond_info.as_data_dict(),\n        **self.pseudo_beta_info.as_data_dict(),\n        **self.atom_cross_att.as_data_dict(),\n        **self.convert_model_output.as_data_dict(),\n        **self.frames.as_data_dict(),\n    }\n    return output\n\n\njax.tree_util.register_dataclass(\n    Batch,\n    data_fields=[f.name for f in dataclasses.fields(Batch)],\n    meta_fields=[],\n)\n"
  },
  {
    "path": "src/alphafold3/model/features.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Data-side of the input features processing.\"\"\"\n\nimport dataclasses\nimport datetime\nimport itertools\nfrom typing import Any, Self, TypeAlias\n\nfrom absl import logging\nfrom alphafold3 import structure\nfrom alphafold3.common import folding_input\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.constants import periodic_table\nfrom alphafold3.constants import residue_names\nfrom alphafold3.cpp import cif_dict\nfrom alphafold3.data import msa as msa_module\nfrom alphafold3.data import templates\nfrom alphafold3.data.tools import rdkit_utils\nfrom alphafold3.model import data3\nfrom alphafold3.model import data_constants\nfrom alphafold3.model import merging_features\nfrom alphafold3.model import msa_pairing\nfrom alphafold3.model.atom_layout import atom_layout\nfrom alphafold3.structure import chemical_components as struc_chem_comps\nimport jax\nimport jax.numpy as jnp\nimport numpy as np\nfrom rdkit import Chem\n\n\nxnp_ndarray: TypeAlias = np.ndarray | jnp.ndarray  # pylint: disable=invalid-name\nBatchDict: TypeAlias = dict[str, xnp_ndarray]\n\n_STANDARD_RESIDUES = frozenset({\n    *residue_names.PROTEIN_TYPES_WITH_UNKNOWN,\n    *residue_names.NUCLEIC_TYPES_WITH_2_UNKS,\n})\n\n\n@dataclasses.dataclass(frozen=True)\nclass PaddingShapes:\n  num_tokens: int\n  msa_size: int\n  num_chains: int\n  num_templates: int\n  num_atoms: int\n\n\ndef 
_pad_to(\n    arr: np.ndarray, shape: tuple[int | None, ...], **kwargs\n) -> np.ndarray:\n  \"\"\"Pads an array to a given shape. Wrapper around np.pad().\n\n  Args:\n    arr: numpy array to pad\n    shape: target shape, use None for axes that should stay the same\n    **kwargs: additional args for np.pad, e.g. constant_values=-1\n\n  Returns:\n    the padded array\n\n  Raises:\n    ValueError if arr and shape have a different number of axes.\n  \"\"\"\n  if arr.ndim != len(shape):\n    raise ValueError(\n        f'arr and shape have different number of axes. {arr.shape=}, {shape=}'\n    )\n\n  num_pad = []\n  for axis, width in enumerate(shape):\n    if width is None:\n      num_pad.append((0, 0))\n    else:\n      if width >= arr.shape[axis]:\n        num_pad.append((0, width - arr.shape[axis]))\n      else:\n        raise ValueError(\n            f'Can not pad to a smaller shape. {arr.shape=}, {shape=}'\n        )\n  padded_arr = np.pad(arr, pad_width=num_pad, **kwargs)\n  return padded_arr\n\n\ndef _unwrap(obj):\n  \"\"\"Unwrap an object from a zero-dim np.ndarray.\"\"\"\n  if isinstance(obj, np.ndarray) and obj.ndim == 0:\n    return obj.item()\n  else:\n    return obj\n\n\n@dataclasses.dataclass(frozen=True)\nclass Chains:\n  chain_id: np.ndarray\n  asym_id: np.ndarray\n  entity_id: np.ndarray\n  sym_id: np.ndarray\n\n\njax.tree_util.register_dataclass(\n    Chains,\n    data_fields=[f.name for f in dataclasses.fields(Chains)],\n    meta_fields=[],\n)\n\n\ndef _compute_asym_entity_and_sym_id(\n    all_tokens: atom_layout.AtomLayout,\n) -> Chains:\n  \"\"\"Compute asym_id, entity_id and sym_id.\n\n  Args:\n    all_tokens: atom layout containing a representative atom for each token.\n\n  Returns:\n    A Chains object\n  \"\"\"\n\n  # Find identical sequences and assign entity_id and sym_id to every chain.\n  seq_to_entity_id_sym_id = {}\n  seen_chain_ids = set()\n  chain_ids = []\n  asym_ids = []\n  entity_ids = []\n  sym_ids = []\n  for chain_id in 
all_tokens.chain_id:\n    if chain_id not in seen_chain_ids:\n      asym_id = len(seen_chain_ids) + 1\n      seen_chain_ids.add(chain_id)\n      seq = ','.join(all_tokens.res_name[all_tokens.chain_id == chain_id])\n      if seq not in seq_to_entity_id_sym_id:\n        entity_id = len(seq_to_entity_id_sym_id) + 1\n        sym_id = 1\n      else:\n        entity_id, sym_id = seq_to_entity_id_sym_id[seq]\n        sym_id += 1\n      seq_to_entity_id_sym_id[seq] = (entity_id, sym_id)\n\n      chain_ids.append(chain_id)\n      asym_ids.append(asym_id)\n      entity_ids.append(entity_id)\n      sym_ids.append(sym_id)\n\n  return Chains(\n      chain_id=np.array(chain_ids),\n      asym_id=np.array(asym_ids),\n      entity_id=np.array(entity_ids),\n      sym_id=np.array(sym_ids),\n  )\n\n\ndef tokenizer(\n    flat_output_layout: atom_layout.AtomLayout,\n    ccd: chemical_components.Ccd,\n    max_atoms_per_token: int,\n    flatten_non_standard_residues: bool,\n    logging_name: str,\n) -> tuple[atom_layout.AtomLayout, atom_layout.AtomLayout, np.ndarray]:\n  \"\"\"Maps a flat atom layout to tokens for evoformer.\n\n  Creates the evoformer tokens as one token per polymer residue and one token\n  per ligand atom. The tokens are represented as AtomLayouts all_tokens\n  (1 representative atom per token) atoms per residue, and\n  all_token_atoms_layout (num_tokens, max_atoms_per_token). The atoms in a\n  residue token use the layout of the corresponding CCD entry\n\n  Args:\n    flat_output_layout: flat AtomLayout containing all atoms that the model\n      wants to predict.\n    ccd: The chemical components dictionary.\n    max_atoms_per_token: number of slots per token.\n    flatten_non_standard_residues: whether to flatten non-standard residues,\n      i.e. 
whether to use one token per atom for non-standard residues.\n    logging_name: logging name for debugging (usually the mmcif_id).\n\n  Returns:\n    A tuple (all_tokens, all_tokens_atoms_layout) with\n      all_tokens: AtomLayout shape (num_tokens,) containing one representative\n        atom per token.\n      all_token_atoms_layout: AtomLayout with shape\n        (num_tokens, max_atoms_per_token) containing all atoms per token.\n      standard_token_idxs: The token index that each token would have if not\n        flattening non standard resiudes.\n  \"\"\"\n  # Select  the representative atom for each token.\n  token_idxs = []\n  single_atom_token = []\n  standard_token_idxs = []\n  current_standard_token_id = 0\n  # Iterate over residues, and provide a group_iter over the atoms of each\n  # residue.\n  for key, group_iter in itertools.groupby(\n      zip(\n          flat_output_layout.chain_type,\n          flat_output_layout.chain_id,\n          flat_output_layout.res_id,\n          flat_output_layout.res_name,\n          flat_output_layout.atom_name,\n          np.arange(flat_output_layout.shape[0]),\n      ),\n      key=lambda x: x[:3],\n  ):\n\n    # Get chain type and chain id of this residue\n    chain_type, chain_id, _ = key\n\n    # Get names and global idxs for all atoms of this residue\n    _, _, _, res_names, atom_names, idxs = zip(*group_iter)\n\n    # As of March 2023, all OTHER CHAINs in pdb are artificial nucleics.\n    is_nucleic_backbone = (\n        chain_type in mmcif_names.NUCLEIC_ACID_CHAIN_TYPES\n        or chain_type == mmcif_names.OTHER_CHAIN\n    )\n    if chain_type in mmcif_names.PEPTIDE_CHAIN_TYPES:\n      res_name = res_names[0]\n      if (\n          flatten_non_standard_residues\n          and res_name not in residue_names.PROTEIN_TYPES_WITH_UNKNOWN\n          and res_name != residue_names.MSE\n      ):\n        # For non-standard protein residues take all atoms.\n        # NOTE: This may get very large if we include hydrogens.\n   
     token_idxs.extend(idxs)\n        single_atom_token += [True] * len(idxs)\n        standard_token_idxs.extend([current_standard_token_id] * len(idxs))\n      else:\n        # For standard protein residues take 'CA' if it exists, else first atom.\n        if 'CA' in atom_names:\n          token_idxs.append(idxs[atom_names.index('CA')])\n        else:\n          token_idxs.append(idxs[0])\n        single_atom_token += [False]\n        standard_token_idxs.append(current_standard_token_id)\n      current_standard_token_id += 1\n    elif is_nucleic_backbone:\n      res_name = res_names[0]\n      if (\n          flatten_non_standard_residues\n          and res_name not in residue_names.NUCLEIC_TYPES_WITH_2_UNKS\n      ):\n        # For non-standard nucleic residues take all atoms.\n        token_idxs.extend(idxs)\n        single_atom_token += [True] * len(idxs)\n        standard_token_idxs.extend([current_standard_token_id] * len(idxs))\n      else:\n        # For standard nucleic residues take C1' if it exists, else first atom.\n        if \"C1'\" in atom_names:\n          token_idxs.append(idxs[atom_names.index(\"C1'\")])\n        else:\n          token_idxs.append(idxs[0])\n        single_atom_token += [False]\n        standard_token_idxs.append(current_standard_token_id)\n      current_standard_token_id += 1\n    elif chain_type in mmcif_names.NON_POLYMER_CHAIN_TYPES:\n      # For non-polymers take all atoms\n      token_idxs.extend(idxs)\n      single_atom_token += [True] * len(idxs)\n      standard_token_idxs.extend([current_standard_token_id] * len(idxs))\n      current_standard_token_id += len(idxs)\n    else:\n      # Chain type that we don't handle yet.\n      logging.warning(\n          '%s: ignoring chain %s with chain type %s.',\n          logging_name,\n          chain_id,\n          chain_type,\n      )\n\n  assert len(token_idxs) == len(single_atom_token)\n  assert len(token_idxs) == len(standard_token_idxs)\n  standard_token_idxs = 
np.array(standard_token_idxs, dtype=np.int32)\n\n  # Create the list of all tokens, represented as a flat AtomLayout with 1\n  # representative atom per token.\n  all_tokens = flat_output_layout[token_idxs]\n\n  # Create the 2D atoms_per_token layout\n  num_tokens = all_tokens.shape[0]\n\n  # Target lists.\n  target_atom_names = []\n  target_atom_elements = []\n  target_res_ids = []\n  target_res_names = []\n  target_chain_ids = []\n  target_chain_types = []\n\n  # uids of all atoms in the flat layout, to check whether the dense atoms\n  # exist -- This is necessary for terminal atoms (e.g. 'OP3' or 'OXT')\n  all_atoms_uids = set(\n      zip(\n          flat_output_layout.chain_id,\n          flat_output_layout.res_id,\n          flat_output_layout.atom_name,\n      )\n  )\n\n  for idx, single_atom in enumerate(single_atom_token):\n    if not single_atom:\n      # Standard protein and nucleic residues have many atoms per token\n      chain_id = all_tokens.chain_id[idx]\n      res_id = all_tokens.res_id[idx]\n      res_name = all_tokens.res_name[idx]\n      atom_names = []\n      atom_elements = []\n\n      res_atoms = struc_chem_comps.get_all_atoms_in_entry(\n          ccd=ccd, res_name=res_name\n      )\n      atom_names_elements = list(\n          zip(\n              res_atoms['_chem_comp_atom.atom_id'],\n              res_atoms['_chem_comp_atom.type_symbol'],\n              strict=True,\n          )\n      )\n\n      for atom_name, atom_element in atom_names_elements:\n        # Remove hydrogens if they are not in flat layout.\n        if atom_element in ['H', 'D'] and (\n            (chain_id, res_id, atom_name) not in all_atoms_uids\n        ):\n          continue\n        elif (chain_id, res_id, atom_name) in all_atoms_uids:\n          atom_names.append(atom_name)\n          atom_elements.append(atom_element)\n        # Leave spaces for OXT etc.\n        else:\n          atom_names.append('')\n          atom_elements.append('')\n\n      if len(atom_names) > 
max_atoms_per_token:\n        logging.warning(\n            'Atom list for chain %s '\n            'residue %s %s is too long and will be truncated: '\n            '%s to the max atoms limit %s. Dropped atoms: %s',\n            chain_id,\n            res_id,\n            res_name,\n            len(atom_names),\n            max_atoms_per_token,\n            list(\n                zip(\n                    atom_names[max_atoms_per_token:],\n                    atom_elements[max_atoms_per_token:],\n                    strict=True,\n                )\n            ),\n        )\n        atom_names = atom_names[:max_atoms_per_token]\n        atom_elements = atom_elements[:max_atoms_per_token]\n\n      num_pad = max_atoms_per_token - len(atom_names)\n      atom_names.extend([''] * num_pad)\n      atom_elements.extend([''] * num_pad)\n\n    else:\n      # ligands have only 1 atom per token\n      padding = [''] * (max_atoms_per_token - 1)\n      atom_names = [all_tokens.atom_name[idx]] + padding\n      atom_elements = [all_tokens.atom_element[idx]] + padding\n\n    # Append the atoms to the target lists.\n    target_atom_names.append(atom_names)\n    target_atom_elements.append(atom_elements)\n    target_res_names.append([all_tokens.res_name[idx]] * max_atoms_per_token)\n    target_res_ids.append([all_tokens.res_id[idx]] * max_atoms_per_token)\n    target_chain_ids.append([all_tokens.chain_id[idx]] * max_atoms_per_token)\n    target_chain_types.append(\n        [all_tokens.chain_type[idx]] * max_atoms_per_token\n    )\n\n  # Make sure to get the right shape also for 0 tokens\n  trg_shape = (num_tokens, max_atoms_per_token)\n  all_token_atoms_layout = atom_layout.AtomLayout(\n      atom_name=np.array(target_atom_names, dtype=object).reshape(trg_shape),\n      atom_element=np.array(target_atom_elements, dtype=object).reshape(\n          trg_shape\n      ),\n      res_name=np.array(target_res_names, dtype=object).reshape(trg_shape),\n      res_id=np.array(target_res_ids, 
dtype=int).reshape(trg_shape),\n      chain_id=np.array(target_chain_ids, dtype=object).reshape(trg_shape),\n      chain_type=np.array(target_chain_types, dtype=object).reshape(trg_shape),\n  )\n\n  return all_tokens, all_token_atoms_layout, standard_token_idxs\n\n\n@dataclasses.dataclass(frozen=True)\nclass MSA:\n  \"\"\"Dataclass containing MSA.\"\"\"\n\n  rows: xnp_ndarray\n  mask: xnp_ndarray\n  deletion_matrix: xnp_ndarray\n  # Occurrence of each residue type along the sequence, averaged over MSA rows.\n  profile: xnp_ndarray\n  # Occurrence of deletions along the sequence, averaged over MSA rows.\n  deletion_mean: xnp_ndarray\n  # Number of MSA alignments.\n  num_alignments: xnp_ndarray\n\n  @classmethod\n  def compute_features(\n      cls,\n      *,\n      all_tokens: atom_layout.AtomLayout,\n      standard_token_idxs: np.ndarray,\n      padding_shapes: PaddingShapes,\n      fold_input: folding_input.Input,\n      logging_name: str,\n      max_paired_sequence_per_species: int,\n      resolve_msa_overlaps: bool = True,\n  ) -> Self:\n    \"\"\"Compute the msa features.\"\"\"\n    seen_entities = {}\n\n    substruct = atom_layout.make_structure(\n        flat_layout=all_tokens,\n        atom_coords=np.zeros(all_tokens.shape + (3,)),\n        name=logging_name,\n    )\n    prot = substruct.filter_to_entity_type(protein=True)\n    num_unique_chains = len(set(prot.chain_single_letter_sequence().values()))\n    need_msa_pairing = num_unique_chains > 1\n\n    np_chains_list = []\n    input_chains_by_id = {chain.id: chain for chain in fold_input.chains}\n    nonempty_chain_ids = set(all_tokens.chain_id)\n    for asym_id, chain_info in enumerate(substruct.iter_chains(), start=1):\n      b_chain_id = chain_info['chain_id']\n      chain_type = chain_info['chain_type']\n      chain = input_chains_by_id[b_chain_id]\n\n      # Generalised \"sequence\" for ligands (can't trust residue name)\n      chain_tokens = all_tokens[all_tokens.chain_id == b_chain_id]\n      assert 
chain_tokens.res_name is not None\n      three_letter_sequence = ','.join(chain_tokens.res_name.tolist())\n      chain_num_tokens = len(chain_tokens.atom_name)\n      if chain_type in mmcif_names.POLYMER_CHAIN_TYPES:\n        sequence = substruct.chain_single_letter_sequence()[b_chain_id]\n        if chain_type in mmcif_names.NUCLEIC_ACID_CHAIN_TYPES:\n          # Only allow nucleic residue types for nucleic chains (can have some\n          # protein residues in e.g. tRNA, but that causes MSA search failures).\n          # Replace non nucleic residue types by UNK_NUCLEIC.\n          nucleic_types_one_letter = (\n              residue_names.DNA_TYPES_ONE_LETTER\n              + residue_names.RNA_TYPES_ONE_LETTER_WITH_UNKNOWN\n          )\n          sequence = ''.join([\n              base\n              if base in nucleic_types_one_letter\n              else residue_names.UNK_NUCLEIC_ONE_LETTER\n              for base in sequence\n          ])\n      else:\n        sequence = 'X' * chain_num_tokens\n\n      skip_chain = (\n          chain_type not in mmcif_names.STANDARD_POLYMER_CHAIN_TYPES\n          or len(sequence) <= 4\n          or b_chain_id not in nonempty_chain_ids\n      )\n      if three_letter_sequence in seen_entities:\n        entity_id = seen_entities[three_letter_sequence]\n      else:\n        entity_id = len(seen_entities) + 1\n\n      if chain_type in mmcif_names.STANDARD_POLYMER_CHAIN_TYPES:\n        unpaired_a3m = ''\n        paired_a3m = ''\n        if not skip_chain:\n          if need_msa_pairing and isinstance(chain, folding_input.ProteinChain):\n            paired_a3m = chain.paired_msa\n          if isinstance(\n              chain, folding_input.RnaChain | folding_input.ProteinChain\n          ):\n            unpaired_a3m = chain.unpaired_msa\n        # If we generated the MSA ourselves, it is already deduplicated. 
If it\n        # is user-provided, keep it as is to prevent destroying desired pairing.\n        unpaired_msa = msa_module.Msa.from_a3m(\n            query_sequence=sequence,\n            chain_poly_type=chain_type,\n            a3m=unpaired_a3m,\n            deduplicate=False,\n        )\n\n        paired_msa = msa_module.Msa.from_a3m(\n            query_sequence=sequence,\n            chain_poly_type=chain_type,\n            a3m=paired_a3m,\n            deduplicate=False,\n        )\n      else:\n        unpaired_msa = msa_module.Msa.from_empty(\n            query_sequence='-' * len(sequence),\n            chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n        )\n        paired_msa = msa_module.Msa.from_empty(\n            query_sequence='-' * len(sequence),\n            chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n        )\n\n      msa_features = unpaired_msa.featurize()\n      all_seqs_msa_features = paired_msa.featurize()\n\n      msa_features = msa_features | {\n          f'{k}_all_seq': v for k, v in all_seqs_msa_features.items()\n      }\n      feats = msa_features\n      feats['chain_id'] = b_chain_id\n      feats['asym_id'] = np.full(chain_num_tokens, asym_id)\n      feats['entity_id'] = entity_id\n      np_chains_list.append(feats)\n\n    # Add profile features to each chain.\n    for chain in np_chains_list:\n      chain.update(\n          data3.get_profile_features(chain['msa'], chain['deletion_matrix'])\n      )\n\n    # Allow 50% of the MSA to come from MSA pairing.\n    max_paired_sequences = padding_shapes.msa_size // 2\n    if need_msa_pairing:\n      np_chains_list = list(map(dict, np_chains_list))\n      np_chains_list = msa_pairing.create_paired_features(\n          np_chains_list,\n          max_paired_sequences=max_paired_sequences,\n          nonempty_chain_ids=nonempty_chain_ids,\n          max_hits_per_species=max_paired_sequence_per_species,\n      )\n      if resolve_msa_overlaps:\n        np_chains_list = 
msa_pairing.deduplicate_unpaired_sequences(\n            np_chains_list\n        )\n\n    # Remove all gapped rows from all seqs.\n    nonempty_asym_ids = []\n    for chain in np_chains_list:\n      if chain['chain_id'] in nonempty_chain_ids:\n        nonempty_asym_ids.append(chain['asym_id'][0])\n    if 'msa_all_seq' in np_chains_list[0]:\n      np_chains_list = msa_pairing.remove_all_gapped_rows_from_all_seqs(\n          np_chains_list, asym_ids=nonempty_asym_ids\n      )\n\n    # Crop MSA rows.\n    cropped_chains_list = []\n    for chain in np_chains_list:\n      unpaired_msa_size, paired_msa_size = (\n          msa_pairing.choose_paired_unpaired_msa_crop_sizes(\n              unpaired_msa=chain['msa'],\n              paired_msa=chain.get('msa_all_seq'),\n              total_msa_crop_size=padding_shapes.msa_size,\n              max_paired_sequences=max_paired_sequences,\n          )\n      )\n      cropped_chain = {\n          'asym_id': chain['asym_id'],\n          'chain_id': chain['chain_id'],\n          'profile': chain['profile'],\n          'deletion_mean': chain['deletion_mean'],\n      }\n      for feat in data_constants.NUM_SEQ_NUM_RES_MSA_FEATURES:\n        if feat in chain:\n          cropped_chain[feat] = chain[feat][:unpaired_msa_size]\n        if feat + '_all_seq' in chain:\n          cropped_chain[feat + '_all_seq'] = chain[feat + '_all_seq'][\n              :paired_msa_size\n          ]\n      cropped_chains_list.append(cropped_chain)\n\n    # Merge Chains.\n    # Make sure the chain order is unaltered before slicing with tokens.\n    curr_chain_order = [chain['chain_id'] for chain in cropped_chains_list]\n    orig_chain_order = [chain['chain_id'] for chain in substruct.iter_chains()]\n    assert curr_chain_order == orig_chain_order\n    np_example = {\n        'asym_id': np.concatenate(\n            [c['asym_id'] for c in cropped_chains_list], axis=0\n        ),\n    }\n    for feature in data_constants.NUM_SEQ_NUM_RES_MSA_FEATURES:\n      for 
feat in [feature, feature + '_all_seq']:\n        if feat in cropped_chains_list[0]:\n          np_example[feat] = merging_features.merge_msa_features(\n              feat, cropped_chains_list\n          )\n    for feature in ['profile', 'deletion_mean']:\n      feature_list = [c[feature] for c in cropped_chains_list]\n      np_example[feature] = np.concatenate(feature_list, axis=0)\n\n    # Crop MSA rows to maximum size given by chains participating in the crop.\n    max_allowed_unpaired = max([\n        len(chain['msa'])\n        for chain in cropped_chains_list\n        if chain['asym_id'][0] in nonempty_asym_ids\n    ])\n    np_example['msa'] = np_example['msa'][:max_allowed_unpaired]\n    if 'msa_all_seq' in np_example:\n      max_allowed_paired = max([\n          len(chain['msa_all_seq'])\n          for chain in cropped_chains_list\n          if chain['asym_id'][0] in nonempty_asym_ids\n      ])\n      np_example['msa_all_seq'] = np_example['msa_all_seq'][:max_allowed_paired]\n\n    np_example = merging_features.merge_paired_and_unpaired_msa(np_example)\n\n    # Crop MSA residues. Need to use the standard token indices, since msa does\n    # not expand non-standard residues. 
This means that for expanded residues,\n    # we get repeated msa columns.\n    new_cropping_idxs = standard_token_idxs\n    for feature in data_constants.NUM_SEQ_NUM_RES_MSA_FEATURES:\n      if feature in np_example:\n        np_example[feature] = np_example[feature][:, new_cropping_idxs].copy()\n    for feature in ['profile', 'deletion_mean']:\n      np_example[feature] = np_example[feature][new_cropping_idxs]\n\n    # Make MSA mask.\n    np_example['msa_mask'] = np.ones_like(np_example['msa'], dtype=np.float32)\n\n    # Count MSA size before padding.\n    num_alignments = np_example['msa'].shape[0]\n\n    # Pad:\n    msa_size, num_tokens = padding_shapes.msa_size, padding_shapes.num_tokens\n\n    def safe_cast_int8(x):\n      return np.clip(x, np.iinfo(np.int8).min, np.iinfo(np.int8).max).astype(\n          np.int8\n      )\n\n    return MSA(\n        rows=_pad_to(safe_cast_int8(np_example['msa']), (msa_size, num_tokens)),\n        mask=_pad_to(\n            np_example['msa_mask'].astype(bool), (msa_size, num_tokens)\n        ),\n        # deletion_matrix may be out of int8 range, but we mostly care about\n        # small values since we arctan it in the model.\n        deletion_matrix=_pad_to(\n            safe_cast_int8(np_example['deletion_matrix']),\n            (msa_size, num_tokens),\n        ),\n        profile=_pad_to(np_example['profile'], (num_tokens, None)),\n        deletion_mean=_pad_to(np_example['deletion_mean'], (num_tokens,)),\n        num_alignments=np.array(num_alignments, dtype=np.int32),\n    )\n\n  def index_msa_rows(self, indices: xnp_ndarray) -> Self:\n    assert indices.ndim == 1\n\n    return MSA(\n        rows=self.rows[indices, :],\n        mask=self.mask[indices, :],\n        deletion_matrix=self.deletion_matrix[indices, :],\n        profile=self.profile,\n        deletion_mean=self.deletion_mean,\n        num_alignments=self.num_alignments,\n    )\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    output = 
cls(\n        rows=batch['msa'],\n        mask=batch['msa_mask'],\n        deletion_matrix=batch['deletion_matrix'],\n        profile=batch['profile'],\n        deletion_mean=batch['deletion_mean'],\n        num_alignments=batch['num_alignments'],\n    )\n    return output\n\n  def as_data_dict(self) -> BatchDict:\n    return {\n        'msa': self.rows,\n        'msa_mask': self.mask,\n        'deletion_matrix': self.deletion_matrix,\n        'profile': self.profile,\n        'deletion_mean': self.deletion_mean,\n        'num_alignments': self.num_alignments,\n    }\n\n\njax.tree_util.register_dataclass(\n    MSA,\n    data_fields=[f.name for f in dataclasses.fields(MSA)],\n    meta_fields=[],\n)\n\n\n@dataclasses.dataclass(frozen=True)\nclass Templates:\n  \"\"\"Dataclass containing templates.\"\"\"\n\n  # aatype of templates, int32 w shape [num_templates, num_res]\n  aatype: xnp_ndarray\n  # atom positions of templates, float32 w shape [num_templates, num_res, 24, 3]\n  atom_positions: xnp_ndarray\n  # atom mask of templates, bool w shape [num_templates, num_res, 24]\n  atom_mask: xnp_ndarray\n\n  @classmethod\n  def compute_features(\n      cls,\n      all_tokens: atom_layout.AtomLayout,\n      standard_token_idxs: np.ndarray,\n      padding_shapes: PaddingShapes,\n      fold_input: folding_input.Input,\n      max_templates: int,\n      logging_name: str,\n  ) -> Self:\n    \"\"\"Compute the template features.\"\"\"\n\n    seen_entities = {}\n    polymer_entity_features = {True: {}, False: {}}\n\n    substruct = atom_layout.make_structure(\n        flat_layout=all_tokens,\n        atom_coords=np.zeros(all_tokens.shape + (3,)),\n        name=logging_name,\n    )\n    np_chains_list = []\n\n    input_chains_by_id = {chain.id: chain for chain in fold_input.chains}\n\n    nonempty_chain_ids = set(all_tokens.chain_id)\n    for chain_info in substruct.iter_chains():\n      chain_id = chain_info['chain_id']\n      chain_type = chain_info['chain_type']\n      chain = 
input_chains_by_id[chain_id]\n\n      # Generalised \"sequence\" for ligands (can't trust residue name)\n      chain_tokens = all_tokens[all_tokens.chain_id == chain_id]\n      assert chain_tokens.res_name is not None\n      three_letter_sequence = ','.join(chain_tokens.res_name.tolist())\n      chain_num_tokens = len(chain_tokens.atom_name)\n\n      # Don't compute features for chains not included in the crop, or ligands.\n      skip_chain = (\n          chain_type != mmcif_names.PROTEIN_CHAIN\n          or chain_num_tokens <= 4  # not cache filled\n          or chain_id not in nonempty_chain_ids\n      )\n\n      if three_letter_sequence in seen_entities:\n        entity_id = seen_entities[three_letter_sequence]\n      else:\n        entity_id = len(seen_entities) + 1\n\n      if entity_id not in polymer_entity_features[skip_chain]:\n        if skip_chain:\n          template_features = data3.empty_template_features(chain_num_tokens)\n        else:\n          assert isinstance(chain, folding_input.ProteinChain)\n\n          sorted_features = []\n          for template in chain.templates:\n            struc = structure.from_mmcif(\n                template.mmcif,\n                fix_mse_residues=True,\n                fix_arginines=True,\n                include_bonds=False,\n                include_water=False,\n                include_other=True,  # For non-standard polymer chains.\n            )\n            hit_features = templates.get_polymer_features(\n                chain=struc,\n                chain_poly_type=mmcif_names.PROTEIN_CHAIN,\n                query_sequence_length=len(chain.sequence),\n                query_to_hit_mapping=dict(template.query_to_template_map),\n            )\n            sorted_features.append(hit_features)\n\n          template_features = templates.package_template_features(\n              hit_features=sorted_features,\n              include_ligand_features=False,\n          )\n\n          template_features = 
data3.fix_template_features(\n              template_features=template_features, num_res=len(chain.sequence)\n          )\n\n        template_features = _reduce_template_features(\n            template_features, max_templates\n        )\n        polymer_entity_features[skip_chain][entity_id] = template_features\n\n      seen_entities[three_letter_sequence] = entity_id\n      feats = polymer_entity_features[skip_chain][entity_id].copy()\n      feats['chain_id'] = chain_id\n      np_chains_list.append(feats)\n\n    # We pad the num_templates dimension before merging, so that different\n    # chains can be concatenated on the num_res dimension.  Masking will be\n    # applied so that each chain's templates can't see each other.\n    for chain in np_chains_list:\n      chain['template_aatype'] = _pad_to(\n          chain['template_aatype'], (max_templates, None)\n      )\n      chain['template_atom_positions'] = _pad_to(\n          chain['template_atom_positions'], (max_templates, None, None, None)\n      )\n      chain['template_atom_mask'] = _pad_to(\n          chain['template_atom_mask'], (max_templates, None, None)\n      )\n\n    # Merge on token dimension.\n    np_example = {\n        ft: np.concatenate([c[ft] for c in np_chains_list], axis=1)\n        for ft in np_chains_list[0]\n        if ft in data_constants.TEMPLATE_FEATURES\n    }\n\n    # Crop template data. Need to use the standard token indices, since msa does\n    # not expand non-standard residues. 
This means that for expanded residues,\n    # we get repeated template information.\n    for feature_name, v in np_example.items():\n      np_example[feature_name] = v[:max_templates, standard_token_idxs, ...]\n\n    # Pad along the token dimension.\n    templates_features = Templates(\n        aatype=_pad_to(\n            np_example['template_aatype'], (None, padding_shapes.num_tokens)\n        ),\n        atom_positions=_pad_to(\n            np_example['template_atom_positions'],\n            (None, padding_shapes.num_tokens, None, None),\n        ),\n        atom_mask=_pad_to(\n            np_example['template_atom_mask'].astype(bool),\n            (None, padding_shapes.num_tokens, None),\n        ),\n    )\n    return templates_features\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    \"\"\"Make Template from batch dictionary.\"\"\"\n    return cls(\n        aatype=batch['template_aatype'],\n        atom_positions=batch['template_atom_positions'],\n        atom_mask=batch['template_atom_mask'],\n    )\n\n  def as_data_dict(self) -> BatchDict:\n    return {\n        'template_aatype': self.aatype,\n        'template_atom_positions': self.atom_positions,\n        'template_atom_mask': self.atom_mask,\n    }\n\n\njax.tree_util.register_dataclass(\n    Templates,\n    data_fields=[f.name for f in dataclasses.fields(Templates)],\n    meta_fields=[],\n)\n\n\ndef _reduce_template_features(\n    template_features: data3.FeatureDict,\n    max_templates: int,\n) -> data3.FeatureDict:\n  \"\"\"Reduces template features to max num templates and defined feature set.\"\"\"\n  num_templates = template_features['template_aatype'].shape[0]\n  template_keep_mask = np.arange(num_templates) < max_templates\n  template_fields = data_constants.TEMPLATE_FEATURES + (\n      'template_release_timestamp',\n  )\n  template_features = {\n      k: v[template_keep_mask]\n      for k, v in template_features.items()\n      if k in template_fields\n  }\n  return 
template_features\n\n\n@dataclasses.dataclass(frozen=True)\nclass TokenFeatures:\n  \"\"\"Dataclass containing features for tokens.\"\"\"\n\n  residue_index: xnp_ndarray\n  token_index: xnp_ndarray\n  aatype: xnp_ndarray\n  mask: xnp_ndarray\n  seq_length: xnp_ndarray\n\n  # Chain symmetry identifiers\n  # for an A3B2 stoichiometry the meaning of these features is as follows:\n  # asym_id:    1 2 3 4 5\n  # entity_id:  1 1 1 2 2\n  # sym_id:     1 2 3 1 2\n  asym_id: xnp_ndarray\n  entity_id: xnp_ndarray\n  sym_id: xnp_ndarray\n\n  # token type features\n  is_protein: xnp_ndarray\n  is_rna: xnp_ndarray\n  is_dna: xnp_ndarray\n  is_ligand: xnp_ndarray\n  is_nonstandard_polymer_chain: xnp_ndarray\n  is_water: xnp_ndarray\n\n  @classmethod\n  def compute_features(\n      cls,\n      all_tokens: atom_layout.AtomLayout,\n      padding_shapes: PaddingShapes,\n  ) -> Self:\n    \"\"\"Compute the per-token features.\"\"\"\n\n    residue_index = all_tokens.res_id.astype(np.int32)\n\n    token_index = np.arange(1, len(all_tokens.atom_name) + 1).astype(np.int32)\n\n    aatype = []\n    for res_name, chain_type in zip(all_tokens.res_name, all_tokens.chain_type):\n      if chain_type in mmcif_names.POLYMER_CHAIN_TYPES:\n        res_name = mmcif_names.fix_non_standard_polymer_res(\n            res_name=res_name, chain_type=chain_type\n        )\n        if (\n            chain_type == mmcif_names.DNA_CHAIN\n            and res_name == residue_names.UNK_DNA\n        ):\n          res_name = residue_names.UNK_NUCLEIC_ONE_LETTER\n      elif chain_type in mmcif_names.NON_POLYMER_CHAIN_TYPES:\n        res_name = residue_names.UNK\n      else:\n        raise ValueError(f'Chain type {chain_type} not polymer or ligand.')\n      aa = residue_names.POLYMER_TYPES_ORDER_WITH_UNKNOWN_AND_GAP[res_name]\n      aatype.append(aa)\n    aatype = np.array(aatype, dtype=np.int32)\n\n    mask = np.ones(all_tokens.shape[0], dtype=bool)\n    chains = _compute_asym_entity_and_sym_id(all_tokens)\n    m = 
dict(zip(chains.chain_id, chains.asym_id))\n    asym_id = np.array([m[c] for c in all_tokens.chain_id], dtype=np.int32)\n\n    m = dict(zip(chains.chain_id, chains.entity_id))\n    entity_id = np.array([m[c] for c in all_tokens.chain_id], dtype=np.int32)\n\n    m = dict(zip(chains.chain_id, chains.sym_id))\n    sym_id = np.array([m[c] for c in all_tokens.chain_id], dtype=np.int32)\n\n    seq_length = np.array(all_tokens.shape[0], dtype=np.int32)\n\n    is_protein = all_tokens.chain_type == mmcif_names.PROTEIN_CHAIN\n    is_rna = all_tokens.chain_type == mmcif_names.RNA_CHAIN\n    is_dna = all_tokens.chain_type == mmcif_names.DNA_CHAIN\n    is_ligand = np.isin(\n        all_tokens.chain_type, list(mmcif_names.LIGAND_CHAIN_TYPES)\n    )\n    standard_polymer_chain = list(mmcif_names.NON_POLYMER_CHAIN_TYPES) + list(\n        mmcif_names.STANDARD_POLYMER_CHAIN_TYPES\n    )\n    is_nonstandard_polymer_chain = np.isin(\n        all_tokens.chain_type, standard_polymer_chain, invert=True\n    )\n    is_water = all_tokens.chain_type == mmcif_names.WATER\n\n    return TokenFeatures(\n        residue_index=_pad_to(residue_index, (padding_shapes.num_tokens,)),\n        token_index=_pad_to(token_index, (padding_shapes.num_tokens,)),\n        aatype=_pad_to(aatype, (padding_shapes.num_tokens,)),\n        mask=_pad_to(mask, (padding_shapes.num_tokens,)),\n        asym_id=_pad_to(asym_id, (padding_shapes.num_tokens,)),\n        entity_id=_pad_to(entity_id, (padding_shapes.num_tokens,)),\n        sym_id=_pad_to(sym_id, (padding_shapes.num_tokens,)),\n        seq_length=seq_length,\n        is_protein=_pad_to(is_protein, (padding_shapes.num_tokens,)),\n        is_rna=_pad_to(is_rna, (padding_shapes.num_tokens,)),\n        is_dna=_pad_to(is_dna, (padding_shapes.num_tokens,)),\n        is_ligand=_pad_to(is_ligand, (padding_shapes.num_tokens,)),\n        is_nonstandard_polymer_chain=_pad_to(\n            is_nonstandard_polymer_chain, (padding_shapes.num_tokens,)\n        ),\n        
is_water=_pad_to(is_water, (padding_shapes.num_tokens,)),\n    )\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    return cls(\n        residue_index=batch['residue_index'],\n        token_index=batch['token_index'],\n        aatype=batch['aatype'],\n        mask=batch['seq_mask'],\n        entity_id=batch['entity_id'],\n        asym_id=batch['asym_id'],\n        sym_id=batch['sym_id'],\n        seq_length=batch['seq_length'],\n        is_protein=batch['is_protein'],\n        is_rna=batch['is_rna'],\n        is_dna=batch['is_dna'],\n        is_ligand=batch['is_ligand'],\n        is_nonstandard_polymer_chain=batch['is_nonstandard_polymer_chain'],\n        is_water=batch['is_water'],\n    )\n\n  def as_data_dict(self) -> BatchDict:\n    return {\n        'residue_index': self.residue_index,\n        'token_index': self.token_index,\n        'aatype': self.aatype,\n        'seq_mask': self.mask,\n        'entity_id': self.entity_id,\n        'asym_id': self.asym_id,\n        'sym_id': self.sym_id,\n        'seq_length': self.seq_length,\n        'is_protein': self.is_protein,\n        'is_rna': self.is_rna,\n        'is_dna': self.is_dna,\n        'is_ligand': self.is_ligand,\n        'is_nonstandard_polymer_chain': self.is_nonstandard_polymer_chain,\n        'is_water': self.is_water,\n    }\n\n\njax.tree_util.register_dataclass(\n    TokenFeatures,\n    data_fields=[f.name for f in dataclasses.fields(TokenFeatures)],\n    meta_fields=[],\n)\n\n\n@dataclasses.dataclass(frozen=True)\nclass PredictedStructureInfo:\n  \"\"\"Contains information necessary to work with predicted structure.\"\"\"\n\n  atom_mask: xnp_ndarray\n  residue_center_index: xnp_ndarray\n\n  @classmethod\n  def compute_features(\n      cls,\n      all_tokens: atom_layout.AtomLayout,\n      all_token_atoms_layout: atom_layout.AtomLayout,\n      padding_shapes: PaddingShapes,\n  ) -> Self:\n    \"\"\"Compute the PredictedStructureInfo features.\n\n    Args:\n      
all_tokens: flat AtomLayout with 1 representative atom per token, shape\n        (num_tokens,)\n      all_token_atoms_layout: AtomLayout for all atoms per token, shape\n        (num_tokens, max_atoms_per_token)\n      padding_shapes: padding shapes.\n\n    Returns:\n      A PredictedStructureInfo object.\n    \"\"\"\n    atom_mask = _pad_to(\n        all_token_atoms_layout.atom_name.astype(bool),\n        (padding_shapes.num_tokens, None),\n    )\n    residue_center_index = np.zeros(padding_shapes.num_tokens, dtype=np.int32)\n    for idx in range(all_tokens.shape[0]):\n      repr_atom = all_tokens.atom_name[idx]\n      atoms = list(all_token_atoms_layout.atom_name[idx, :])\n      if repr_atom in atoms:\n        residue_center_index[idx] = atoms.index(repr_atom)\n      else:\n        # Representative atoms can be missing if cropping the number of atoms\n        # per residue.\n        logging.warning(\n            'The representative atom in all_tokens (%s) is not in '\n            'all_token_atoms_layout (%s)',\n            all_tokens[idx : idx + 1],\n            all_token_atoms_layout[idx, :],\n        )\n        residue_center_index[idx] = 0\n    return cls(atom_mask=atom_mask, residue_center_index=residue_center_index)\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    return cls(\n        atom_mask=batch['pred_dense_atom_mask'],\n        residue_center_index=batch['residue_center_index'],\n    )\n\n  def as_data_dict(self) -> BatchDict:\n    return {\n        'pred_dense_atom_mask': self.atom_mask,\n        'residue_center_index': self.residue_center_index,\n    }\n\n\njax.tree_util.register_dataclass(\n    PredictedStructureInfo,\n    data_fields=[f.name for f in dataclasses.fields(PredictedStructureInfo)],\n    meta_fields=[],\n)\n\n\n@dataclasses.dataclass(frozen=True)\nclass PolymerLigandBondInfo:\n  \"\"\"Contains information about polymer-ligand bonds.\"\"\"\n\n  tokens_to_polymer_ligand_bonds: atom_layout.GatherInfo\n  # Gather 
indices to convert from cropped dense atom layout to bonds layout\n  # (num_tokens, 2)\n  token_atoms_to_bonds: atom_layout.GatherInfo\n\n  @classmethod\n  def compute_features(\n      cls,\n      all_tokens: atom_layout.AtomLayout,\n      all_token_atoms_layout: atom_layout.AtomLayout,\n      bond_layout: atom_layout.AtomLayout | None,\n      padding_shapes: PaddingShapes,\n  ) -> Self:\n    \"\"\"Computes the PolymerLigandBondInfo features.\n\n    Args:\n      all_tokens: AtomLayout for tokens; shape (num_tokens,).\n      all_token_atoms_layout: Atom Layout for all atoms (num_tokens,\n        max_atoms_per_token)\n      bond_layout: Bond layout for polymer-ligand bonds.\n      padding_shapes: Padding shapes.\n\n    Returns:\n      A PolymerLigandBondInfo object.\n    \"\"\"\n\n    if bond_layout is not None:\n      # Must convert to list before calling np.isin, will not work raw.\n      peptide_types = list(mmcif_names.PEPTIDE_CHAIN_TYPES)\n      nucleic_types = list(mmcif_names.NUCLEIC_ACID_CHAIN_TYPES) + [\n          mmcif_names.OTHER_CHAIN\n      ]\n      # These atom renames are so that we can use the atom layout code with\n      # all_tokens, which only has a single atom per token.\n      atom_names = bond_layout.atom_name.copy()\n      atom_names[np.isin(bond_layout.chain_type, peptide_types)] = 'CA'\n      atom_names[np.isin(bond_layout.chain_type, nucleic_types)] = \"C1'\"\n      adjusted_bond_layout = atom_layout.AtomLayout(\n          atom_name=atom_names,\n          res_id=bond_layout.res_id,\n          chain_id=bond_layout.chain_id,\n          chain_type=bond_layout.chain_type,\n      )\n      # Remove bonds that are not in the crop.\n      cropped_tokens_to_bonds = atom_layout.compute_gather_idxs(\n          source_layout=all_tokens, target_layout=adjusted_bond_layout\n      )\n      bond_is_in_crop = np.all(\n          cropped_tokens_to_bonds.gather_mask, axis=1\n      ).astype(bool)\n      adjusted_bond_layout = adjusted_bond_layout[bond_is_in_crop, 
:]\n    else:\n      # Create layout with correct shape when bond_layout is None.\n      s = (0, 2)\n      adjusted_bond_layout = atom_layout.AtomLayout(\n          atom_name=np.array([], dtype=object).reshape(s),\n          res_id=np.array([], dtype=int).reshape(s),\n          chain_id=np.array([], dtype=object).reshape(s),\n      )\n    adjusted_bond_layout = adjusted_bond_layout.copy_and_pad_to(\n        (padding_shapes.num_tokens, 2)\n    )\n    tokens_to_polymer_ligand_bonds = atom_layout.compute_gather_idxs(\n        source_layout=all_tokens, target_layout=adjusted_bond_layout\n    )\n\n    # Stuff for computing the bond loss.\n    if bond_layout is not None:\n      # Pad to num_tokens (hoping that there are never more bonds than tokens).\n      padded_bond_layout = bond_layout.copy_and_pad_to(\n          (padding_shapes.num_tokens, 2)\n      )\n      token_atoms_to_bonds = atom_layout.compute_gather_idxs(\n          source_layout=all_token_atoms_layout, target_layout=padded_bond_layout\n      )\n    else:\n      token_atoms_to_bonds = atom_layout.GatherInfo(\n          gather_idxs=np.zeros((padding_shapes.num_tokens, 2), dtype=int),\n          gather_mask=np.zeros((padding_shapes.num_tokens, 2), dtype=bool),\n          input_shape=np.array((\n              padding_shapes.num_tokens,\n              all_token_atoms_layout.shape[1],\n          )),\n      )\n\n    return cls(\n        tokens_to_polymer_ligand_bonds=tokens_to_polymer_ligand_bonds,\n        token_atoms_to_bonds=token_atoms_to_bonds,\n    )\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    return cls(\n        tokens_to_polymer_ligand_bonds=atom_layout.GatherInfo.from_dict(\n            batch, key_prefix='tokens_to_polymer_ligand_bonds'\n        ),\n        token_atoms_to_bonds=atom_layout.GatherInfo.from_dict(\n            batch, key_prefix='token_atoms_to_polymer_ligand_bonds'\n        ),\n    )\n\n  def as_data_dict(self) -> BatchDict:\n    return {\n        
**self.tokens_to_polymer_ligand_bonds.as_dict(\n            key_prefix='tokens_to_polymer_ligand_bonds'\n        ),\n        **self.token_atoms_to_bonds.as_dict(\n            key_prefix='token_atoms_to_polymer_ligand_bonds'\n        ),\n    }\n\n\njax.tree_util.register_dataclass(\n    PolymerLigandBondInfo,\n    data_fields=[f.name for f in dataclasses.fields(PolymerLigandBondInfo)],\n    meta_fields=[],\n)\n\n\n@dataclasses.dataclass(frozen=True)\nclass LigandLigandBondInfo:\n  \"\"\"Contains information about the location of ligand-ligand bonds.\"\"\"\n\n  tokens_to_ligand_ligand_bonds: atom_layout.GatherInfo\n\n  @classmethod\n  def compute_features(\n      cls,\n      all_tokens: atom_layout.AtomLayout,\n      bond_layout: atom_layout.AtomLayout | None,\n      padding_shapes: PaddingShapes,\n  ) -> Self:\n    \"\"\"Computes the LigandLigandBondInfo features.\n\n    Args:\n      all_tokens: AtomLayout for tokens; shape (num_tokens,).\n      bond_layout: Bond layout for ligand-ligand bonds.\n      padding_shapes: Padding shapes.\n\n    Returns:\n      A LigandLigandBondInfo object.\n    \"\"\"\n\n    if bond_layout is not None:\n      # Discard any bonds that do not join to an existing atom.\n      keep_mask = []\n      all_atom_ids = {\n          uid\n          for uid in zip(\n              all_tokens.chain_id,\n              all_tokens.res_id,\n              all_tokens.atom_name,\n              strict=True,\n          )\n      }\n      for chain_id, res_id, atom_name in zip(\n          bond_layout.chain_id,\n          bond_layout.res_id,\n          bond_layout.atom_name,\n          strict=True,\n      ):\n        atom_a = (chain_id[0], res_id[0], atom_name[0])\n        atom_b = (chain_id[1], res_id[1], atom_name[1])\n        if atom_a in all_atom_ids and atom_b in all_atom_ids:\n          keep_mask.append(True)\n        else:\n          keep_mask.append(False)\n      keep_mask = np.array(keep_mask).astype(bool)\n      bond_layout = bond_layout[keep_mask]\n      
# Remove any bonds to Hydrogen atoms.\n      bond_layout = bond_layout[\n          ~np.char.startswith(bond_layout.atom_name.astype(str), 'H').any(\n              axis=1\n          )\n      ]\n      atom_names = bond_layout.atom_name\n      adjusted_bond_layout = atom_layout.AtomLayout(\n          atom_name=atom_names,\n          res_id=bond_layout.res_id,\n          chain_id=bond_layout.chain_id,\n          chain_type=bond_layout.chain_type,\n      )\n    else:\n      # Create layout with correct shape when bond_layout is None.\n      s = (0, 2)\n      adjusted_bond_layout = atom_layout.AtomLayout(\n          atom_name=np.array([], dtype=object).reshape(s),\n          res_id=np.array([], dtype=int).reshape(s),\n          chain_id=np.array([], dtype=object).reshape(s),\n      )\n    # 10 x num_tokens as max_inter_bonds_ratio + max_intra_bonds_ration = 2.061.\n    adjusted_bond_layout = adjusted_bond_layout.copy_and_pad_to(\n        (padding_shapes.num_tokens * 10, 2)\n    )\n    gather_idx = atom_layout.compute_gather_idxs(\n        source_layout=all_tokens, target_layout=adjusted_bond_layout\n    )\n    return cls(tokens_to_ligand_ligand_bonds=gather_idx)\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    return cls(\n        tokens_to_ligand_ligand_bonds=atom_layout.GatherInfo.from_dict(\n            batch, key_prefix='tokens_to_ligand_ligand_bonds'\n        )\n    )\n\n  def as_data_dict(self) -> BatchDict:\n    return {\n        **self.tokens_to_ligand_ligand_bonds.as_dict(\n            key_prefix='tokens_to_ligand_ligand_bonds'\n        )\n    }\n\n\njax.tree_util.register_dataclass(\n    LigandLigandBondInfo,\n    data_fields=[f.name for f in dataclasses.fields(LigandLigandBondInfo)],\n    meta_fields=[],\n)\n\n\n@dataclasses.dataclass(frozen=True)\nclass PseudoBetaInfo:\n  \"\"\"Contains information for extracting pseudo-beta and equivalent atoms.\"\"\"\n\n  token_atoms_to_pseudo_beta: atom_layout.GatherInfo\n\n  @classmethod\n  def 
compute_features(\n      cls,\n      all_token_atoms_layout: atom_layout.AtomLayout,\n      ccd: chemical_components.Ccd,\n      padding_shapes: PaddingShapes,\n      logging_name: str,\n  ) -> Self:\n    \"\"\"Compute the PseudoBetaInfo features.\n\n    Args:\n      all_token_atoms_layout:  AtomLayout for all atoms per token, shape\n        (num_tokens, max_atoms_per_token)\n      ccd: The chemical components dictionary.\n      padding_shapes: padding shapes.\n      logging_name: logging name for debugging (usually the mmcif_id)\n\n    Returns:\n      A PseudoBetaInfo object.\n    \"\"\"\n    token_idxs = []\n    atom_idxs = []\n    for token_idx in range(all_token_atoms_layout.shape[0]):\n      chain_type = all_token_atoms_layout.chain_type[token_idx, 0]\n      atom_names = list(all_token_atoms_layout.atom_name[token_idx, :])\n      atom_idx = None\n      is_nucleic_backbone = (\n          chain_type in mmcif_names.NUCLEIC_ACID_CHAIN_TYPES\n          or chain_type == mmcif_names.OTHER_CHAIN\n      )\n      if chain_type == mmcif_names.PROTEIN_CHAIN:\n        # Protein chains\n        if 'CB' in atom_names:\n          atom_idx = atom_names.index('CB')\n        elif 'CA' in atom_names:\n          atom_idx = atom_names.index('CA')\n      elif is_nucleic_backbone:\n        # RNA / DNA chains\n        res_name = all_token_atoms_layout.res_name[token_idx, 0]\n        cifdict = ccd.get(res_name)\n        if cifdict:\n          parent = cifdict['_chem_comp.mon_nstd_parent_comp_id'][0]\n          if parent != '?':\n            res_name = parent\n        if res_name in {'A', 'G', 'DA', 'DG'}:\n          if 'C4' in atom_names:\n            atom_idx = atom_names.index('C4')\n        else:\n          if 'C2' in atom_names:\n            atom_idx = atom_names.index('C2')\n      elif chain_type in mmcif_names.NON_POLYMER_CHAIN_TYPES:\n        # Ligands: there is only one atom per token\n        atom_idx = 0\n      else:\n        logging.warning(\n            '%s: Unknown chain 
type for token %i. (%s)',\n            logging_name,\n            token_idx,\n            all_token_atoms_layout[token_idx : token_idx + 1],\n        )\n        atom_idx = 0\n      if atom_idx is None:\n        (valid_atom_idxs,) = np.nonzero(\n            all_token_atoms_layout.atom_name[token_idx, :]\n        )\n        if valid_atom_idxs.shape[0] > 0:\n          atom_idx = valid_atom_idxs[0]\n        else:\n          atom_idx = 0\n        logging.warning(\n            '%s token %i (%s), does not contain a pseudo-beta atom.'\n            'Using first valid atom (%s) instead.',\n            logging_name,\n            token_idx,\n            all_token_atoms_layout[token_idx : token_idx + 1],\n            all_token_atoms_layout.atom_name[token_idx, atom_idx],\n        )\n\n      token_idxs.append(token_idx)\n      atom_idxs.append(atom_idx)\n\n    pseudo_beta_layout = all_token_atoms_layout[token_idxs, atom_idxs]\n    pseudo_beta_layout = pseudo_beta_layout.copy_and_pad_to((\n        padding_shapes.num_tokens,\n    ))\n    token_atoms_to_pseudo_beta = atom_layout.compute_gather_idxs(\n        source_layout=all_token_atoms_layout, target_layout=pseudo_beta_layout\n    )\n\n    return cls(\n        token_atoms_to_pseudo_beta=token_atoms_to_pseudo_beta,\n    )\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    return cls(\n        token_atoms_to_pseudo_beta=atom_layout.GatherInfo.from_dict(\n            batch, key_prefix='token_atoms_to_pseudo_beta'\n        ),\n    )\n\n  def as_data_dict(self) -> BatchDict:\n    return {\n        **self.token_atoms_to_pseudo_beta.as_dict(\n            key_prefix='token_atoms_to_pseudo_beta'\n        ),\n    }\n\n\njax.tree_util.register_dataclass(\n    PseudoBetaInfo,\n    data_fields=[f.name for f in dataclasses.fields(PseudoBetaInfo)],\n    meta_fields=[],\n)\n\n\n_DEFAULT_BLANK_REF = {\n    'positions': np.zeros(3),\n    'mask': 0,\n    'element': 0,\n    'charge': 0,\n    'atom_name_chars': 
np.zeros(4),\n}\n\n\ndef random_rotation(random_state: np.random.RandomState) -> np.ndarray:\n  # Create a random rotation (Gram-Schmidt orthogonalization of two\n  # random normal vectors)\n  v0, v1 = random_state.normal(size=(2, 3))\n  e0 = v0 / np.maximum(1e-10, np.linalg.norm(v0))\n  v1 = v1 - e0 * np.dot(v1, e0)\n  e1 = v1 / np.maximum(1e-10, np.linalg.norm(v1))\n  e2 = np.cross(e0, e1)\n  return np.stack([e0, e1, e2])\n\n\ndef random_augmentation(\n    positions: np.ndarray,\n    random_state: np.random.RandomState,\n) -> np.ndarray:\n  \"\"\"Center then apply random translation and rotation.\"\"\"\n\n  center = np.mean(positions, axis=0)\n  rot = random_rotation(random_state)\n  positions_target = np.einsum('ij,kj->ki', rot, positions - center)\n\n  translation = random_state.normal(size=(3,))\n  positions_target = positions_target + translation\n  return positions_target\n\n\ndef _get_reference_positions_from_ccd_cif(\n    ccd_cif: cif_dict.CifDict,\n    ref_max_modified_date: datetime.date,\n    logging_name: str,\n) -> np.ndarray:\n  \"\"\"Creates reference positions from a CCD mmcif data block.\"\"\"\n  num_atoms = len(ccd_cif['_chem_comp_atom.atom_id'])\n  if '_chem_comp_atom.pdbx_model_Cartn_x_ideal' in ccd_cif:\n    atom_x = ccd_cif['_chem_comp_atom.pdbx_model_Cartn_x_ideal']\n    atom_y = ccd_cif['_chem_comp_atom.pdbx_model_Cartn_y_ideal']\n    atom_z = ccd_cif['_chem_comp_atom.pdbx_model_Cartn_z_ideal']\n  else:\n    atom_x = np.array(['?'] * num_atoms)\n    atom_y = np.array(['?'] * num_atoms)\n    atom_z = np.array(['?'] * num_atoms)\n  pos = np.array([[x, y, z] for x, y, z in zip(atom_x, atom_y, atom_z)])\n  # Unknown reference coordinates are specified by '?' in chem comp dict.\n  # Replace unknown reference coords with 0.\n  if '?' 
in pos and '_chem_comp.pdbx_modified_date' in ccd_cif:\n    # Use reference coordinates if modified date is before cutoff.\n    modified_dates = [\n        datetime.date.fromisoformat(date)\n        for date in ccd_cif['_chem_comp.pdbx_modified_date']\n    ]\n    max_modified_date = max(modified_dates)\n    if max_modified_date < ref_max_modified_date:\n      atom_x = ccd_cif['_chem_comp_atom.model_Cartn_x']\n      atom_y = ccd_cif['_chem_comp_atom.model_Cartn_y']\n      atom_z = ccd_cif['_chem_comp_atom.model_Cartn_z']\n      pos = np.array([[x, y, z] for x, y, z in zip(atom_x, atom_y, atom_z)])\n  if '?' in pos:\n    if np.all(pos == '?'):\n      logging.warning('All ref positions unknown for: %s', logging_name)\n    else:\n      logging.warning('Some ref positions unknown for: %s', logging_name)\n    pos[pos == '?'] = 0\n  return np.array(pos, dtype=np.float32)\n\n\ndef get_reference(\n    res_name: str,\n    chemical_components_data: struc_chem_comps.ChemicalComponentsData,\n    ccd: chemical_components.Ccd,\n    random_state: np.random.RandomState,\n    ref_max_modified_date: datetime.date,\n    conformer_max_iterations: int | None,\n) -> tuple[dict[str, Any], Any, Any]:\n  \"\"\"Reference structure for residue from CCD or SMILES.\n\n  Uses CCD entry if available, otherwise uses SMILES from chemical components\n  data. 
Conformer generation is done using RDKit, with a fallback to CCD ideal\n  or reference coordinates if RDKit fails and those coordinates are supplied.\n\n  Args:\n    res_name: ccd code of the residue.\n    chemical_components_data: ChemicalComponentsData for making ref structure.\n    ccd: The chemical components dictionary.\n    random_state: Numpy RandomState\n    ref_max_modified_date: date beyond which reference structures must not be\n      modified to be allowed to use reference coordinates.\n    conformer_max_iterations: Optional override for maximum number of iterations\n      to run for RDKit conformer search.\n\n  Returns:\n    Mapping from atom names to features, from_atoms, dest_atoms.\n  \"\"\"\n\n  ccd_cif = ccd.get(res_name)\n\n  mol = None\n  if ccd_cif:\n    try:\n      mol = rdkit_utils.mol_from_ccd_cif(ccd_cif, remove_hydrogens=False)\n    except rdkit_utils.MolFromMmcifError:\n      logging.warning('Failed to construct mol from ccd_cif for: %s', res_name)\n  else:  # No CCD entry, use SMILES from chemical components data.\n    if not (\n        chemical_components_data.chem_comp\n        and res_name in chemical_components_data.chem_comp\n        and chemical_components_data.chem_comp[res_name].pdbx_smiles\n    ):\n      raise ValueError(f'No CCD entry or SMILES for {res_name}.')\n    smiles_string = chemical_components_data.chem_comp[res_name].pdbx_smiles\n    logging.info('Using SMILES for: %s - %s', res_name, smiles_string)\n\n    mol = Chem.MolFromSmiles(smiles_string)\n    if mol is None:\n      # In this case the model will not have any information about this molecule\n      # and will not be able to predict anything about it.\n      raise ValueError(\n          f'Failed to construct RDKit Mol for {res_name} from SMILES string: '\n          f'{smiles_string} . This is likely due to an issue with the SMILES '\n          'string. 
Note that the userCCD input format provides an alternative '\n          'way to define custom molecules directly without RDKit or SMILES.'\n      )\n    mol = Chem.AddHs(mol)\n    # No existing names, we assign them from the graph.\n    mol = rdkit_utils.assign_atom_names_from_graph(mol)\n    # Temporary CCD cif with just atom and bond information, no coordinates.\n    ccd_cif = rdkit_utils.mol_to_ccd_cif(mol, component_id='fake_cif')\n\n  conformer = None\n  atom_names = []\n  elements = []\n  charges = []\n  pos = []\n\n  # If mol is not None (must be True for SMILES case), then we try and generate\n  # an RDKit conformer.\n  if mol is not None:\n    conformer_random_seed = int(random_state.randint(1, 1 << 31))\n    conformer = rdkit_utils.get_random_conformer(\n        mol=mol,\n        random_seed=conformer_random_seed,\n        max_iterations=conformer_max_iterations,\n        logging_name=res_name,\n    )\n    if conformer:\n      for idx, atom in enumerate(mol.GetAtoms()):\n        atom_names.append(atom.GetProp('atom_name'))\n        elements.append(atom.GetAtomicNum())\n        charges.append(atom.GetFormalCharge())\n        coords = conformer.GetAtomPosition(idx)\n        pos.append([coords.x, coords.y, coords.z])\n      pos = np.array(pos, dtype=np.float32)\n\n  # If no mol could be generated (can only happen when using CCD), or no\n  # conformer could be generated from the mol (can happen in either case), then\n  # use CCD cif instead (which will have zero coordinates for SMILES case).\n  if conformer is None:\n    atom_names = ccd_cif['_chem_comp_atom.atom_id']\n    charges = ccd_cif['_chem_comp_atom.charge']\n    type_symbols = ccd_cif['_chem_comp_atom.type_symbol']\n    elements = [\n        periodic_table.ATOMIC_NUMBER.get(elem_type.capitalize(), 0)\n        for elem_type in type_symbols\n    ]\n    pos = _get_reference_positions_from_ccd_cif(\n        ccd_cif=ccd_cif,\n        ref_max_modified_date=ref_max_modified_date,\n        
logging_name=res_name,\n    )\n\n  # Augment reference positions.\n  pos = random_augmentation(pos, random_state)\n\n  # Extract atom and bond information from CCD cif.\n  from_atom = ccd_cif.get('_chem_comp_bond.atom_id_1', None)\n  dest_atom = ccd_cif.get('_chem_comp_bond.atom_id_2', None)\n\n  features = {}\n  for atom_name in atom_names:\n    features[atom_name] = {}\n    idx = atom_names.index(atom_name)\n    charge = 0 if charges[idx] == '?' else int(charges[idx])\n    atom_name_chars = np.array([ord(c) - 32 for c in atom_name], dtype=int)\n    atom_name_chars = _pad_to(atom_name_chars, (4,))\n    features[atom_name]['positions'] = pos[idx]\n    features[atom_name]['mask'] = 1\n    features[atom_name]['element'] = elements[idx]\n    features[atom_name]['charge'] = charge\n    features[atom_name]['atom_name_chars'] = atom_name_chars\n  return features, from_atom, dest_atom\n\n\n@dataclasses.dataclass(frozen=True)\nclass RefStructure:\n  \"\"\"Contains ref structure information.\"\"\"\n\n  # Array with positions, float32, shape [num_res, max_atoms_per_token, 3]\n  positions: xnp_ndarray\n  # Array with masks, bool, shape [num_res, max_atoms_per_token]\n  mask: xnp_ndarray\n  # Array with elements, int32, shape [num_res, max_atoms_per_token]\n  element: xnp_ndarray\n  # Array with charges, float32, shape [num_res, max_atoms_per_token]\n  charge: xnp_ndarray\n  # Array with atom name characters, int32, [num_res, max_atoms_per_token, 4]\n  atom_name_chars: xnp_ndarray\n  # Array with reference space uids, int32, [num_res, max_atoms_per_token]\n  ref_space_uid: xnp_ndarray\n\n  @classmethod\n  def compute_features(\n      cls,\n      all_token_atoms_layout: atom_layout.AtomLayout,\n      ccd: chemical_components.Ccd,\n      padding_shapes: PaddingShapes,\n      chemical_components_data: struc_chem_comps.ChemicalComponentsData,\n      random_state: np.random.RandomState,\n      ref_max_modified_date: datetime.date,\n      conformer_max_iterations: int | None,\n      
ligand_ligand_bonds: atom_layout.AtomLayout | None = None,\n  ) -> tuple[Self, Any]:\n    \"\"\"Reference structure information for each residue.\"\"\"\n\n    # Get features per atom\n    padded_shape = (padding_shapes.num_tokens, all_token_atoms_layout.shape[1])\n    result = {\n        'positions': np.zeros((*padded_shape, 3), 'float32'),\n        'mask': np.zeros(padded_shape, 'bool'),\n        'element': np.zeros(padded_shape, 'int32'),\n        'charge': np.zeros(padded_shape, 'float32'),\n        'atom_name_chars': np.zeros((*padded_shape, 4), 'int32'),\n        'ref_space_uid': np.zeros((*padded_shape,), 'int32'),\n    }\n\n    atom_names_all = []\n    chain_ids_all = []\n    res_ids_all = []\n\n    # Cache reference conformations for each residue.\n    conformations = {}\n    ref_space_uids = {}\n    for idx in np.ndindex(all_token_atoms_layout.shape):\n      chain_id = all_token_atoms_layout.chain_id[idx]\n      res_id = all_token_atoms_layout.res_id[idx]\n      res_name = all_token_atoms_layout.res_name[idx]\n      is_non_standard = res_name not in _STANDARD_RESIDUES\n      atom_name = all_token_atoms_layout.atom_name[idx]\n      if not atom_name:\n        ref = _DEFAULT_BLANK_REF\n      else:\n        if (chain_id, res_id) not in conformations:\n          conf, from_atom, dest_atom = get_reference(\n              res_name=res_name,\n              chemical_components_data=chemical_components_data,\n              ccd=ccd,\n              random_state=random_state,\n              ref_max_modified_date=ref_max_modified_date,\n              conformer_max_iterations=conformer_max_iterations,\n          )\n          conformations[(chain_id, res_id)] = conf\n\n          if (\n              is_non_standard\n              and (from_atom is not None)\n              and (dest_atom is not None)\n          ):\n            # Add intra-ligand bond graph\n            atom_names_ligand = np.stack(\n                [from_atom, dest_atom], axis=1, dtype=object\n            
)\n            atom_names_all.append(atom_names_ligand)\n            res_ids_all.append(\n                np.full_like(atom_names_ligand, res_id, dtype=int)\n            )\n            chain_ids_all.append(\n                np.full_like(atom_names_ligand, chain_id, dtype=object)\n            )\n\n        conformation = conformations.get(\n            (chain_id, res_id), {atom_name: _DEFAULT_BLANK_REF}\n        )\n        if atom_name not in conformation:\n          logging.warning(\n              'Missing atom \"%s\" for CCD \"%s\"',\n              atom_name,\n              all_token_atoms_layout.res_name[idx],\n          )\n        ref = conformation.get(atom_name, _DEFAULT_BLANK_REF)\n      for k in ref:\n        result[k][idx] = ref[k]\n\n      # Assign a unique reference space id to each component, to determine which\n      # reference positions live in the same reference space.\n      space_str_id = (\n          all_token_atoms_layout.chain_id[idx],\n          all_token_atoms_layout.res_id[idx],\n      )\n      if space_str_id not in ref_space_uids:\n        ref_space_uids[space_str_id] = len(ref_space_uids)\n      result['ref_space_uid'][idx] = ref_space_uids[space_str_id]\n\n    if atom_names_all:\n      atom_names_all = np.concatenate(atom_names_all, axis=0)\n      res_ids_all = np.concatenate(res_ids_all, axis=0)\n      chain_ids_all = np.concatenate(chain_ids_all, axis=0)\n      if ligand_ligand_bonds is not None:\n        adjusted_ligand_ligand_bonds = atom_layout.AtomLayout(\n            atom_name=np.concatenate(\n                [ligand_ligand_bonds.atom_name, atom_names_all], axis=0\n            ),\n            chain_id=np.concatenate(\n                [ligand_ligand_bonds.chain_id, chain_ids_all], axis=0\n            ),\n            res_id=np.concatenate(\n                [ligand_ligand_bonds.res_id, res_ids_all], axis=0\n            ),\n        )\n      else:\n        adjusted_ligand_ligand_bonds = atom_layout.AtomLayout(\n            
atom_name=atom_names_all,\n            chain_id=chain_ids_all,\n            res_id=res_ids_all,\n        )\n    else:\n      adjusted_ligand_ligand_bonds = ligand_ligand_bonds\n\n    return cls(**result), adjusted_ligand_ligand_bonds\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    return cls(\n        positions=batch['ref_pos'],\n        mask=batch['ref_mask'],\n        element=batch['ref_element'],\n        charge=batch['ref_charge'],\n        atom_name_chars=batch['ref_atom_name_chars'],\n        ref_space_uid=batch['ref_space_uid'],\n    )\n\n  def as_data_dict(self) -> BatchDict:\n    return {\n        'ref_pos': self.positions,\n        'ref_mask': self.mask,\n        'ref_element': self.element,\n        'ref_charge': self.charge,\n        'ref_atom_name_chars': self.atom_name_chars,\n        'ref_space_uid': self.ref_space_uid,\n    }\n\n\njax.tree_util.register_dataclass(\n    RefStructure,\n    data_fields=[f.name for f in dataclasses.fields(RefStructure)],\n    meta_fields=[],\n)\n\n\n@dataclasses.dataclass(frozen=True)\nclass ConvertModelOutput:\n  \"\"\"Contains atom layout info.\"\"\"\n\n  cleaned_struc: structure.Structure\n  token_atoms_layout: atom_layout.AtomLayout\n  flat_output_layout: atom_layout.AtomLayout\n  empty_output_struc: structure.Structure\n  polymer_ligand_bonds: atom_layout.AtomLayout\n  ligand_ligand_bonds: atom_layout.AtomLayout\n\n  @classmethod\n  def compute_features(\n      cls,\n      all_token_atoms_layout: atom_layout.AtomLayout,\n      padding_shapes: PaddingShapes,\n      cleaned_struc: structure.Structure,\n      flat_output_layout: atom_layout.AtomLayout,\n      empty_output_struc: structure.Structure,\n      polymer_ligand_bonds: atom_layout.AtomLayout,\n      ligand_ligand_bonds: atom_layout.AtomLayout,\n  ) -> Self:\n    \"\"\"Pads the all_token_atoms_layout and stores other data.\"\"\"\n    # Crop and pad the all_token_atoms_layout.\n    token_atoms_layout = 
all_token_atoms_layout.copy_and_pad_to(\n        (padding_shapes.num_tokens, all_token_atoms_layout.shape[1])\n    )\n\n    return cls(\n        cleaned_struc=cleaned_struc,\n        token_atoms_layout=token_atoms_layout,\n        flat_output_layout=flat_output_layout,\n        empty_output_struc=empty_output_struc,\n        polymer_ligand_bonds=polymer_ligand_bonds,\n        ligand_ligand_bonds=ligand_ligand_bonds,\n    )\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    \"\"\"Construct atom layout object from dictionary.\"\"\"\n\n    return cls(\n        cleaned_struc=_unwrap(batch.get('cleaned_struc', None)),\n        token_atoms_layout=_unwrap(batch.get('token_atoms_layout', None)),\n        flat_output_layout=_unwrap(batch.get('flat_output_layout', None)),\n        empty_output_struc=_unwrap(batch.get('empty_output_struc', None)),\n        polymer_ligand_bonds=_unwrap(batch.get('polymer_ligand_bonds', None)),\n        ligand_ligand_bonds=_unwrap(batch.get('ligand_ligand_bonds', None)),\n    )\n\n  def as_data_dict(self) -> BatchDict:\n    return {\n        'cleaned_struc': np.array(self.cleaned_struc, object),\n        'token_atoms_layout': np.array(self.token_atoms_layout, object),\n        'flat_output_layout': np.array(self.flat_output_layout, object),\n        'empty_output_struc': np.array(self.empty_output_struc, object),\n        'polymer_ligand_bonds': np.array(self.polymer_ligand_bonds, object),\n        'ligand_ligand_bonds': np.array(self.ligand_ligand_bonds, object),\n    }\n\n\njax.tree_util.register_dataclass(\n    ConvertModelOutput,\n    data_fields=[f.name for f in dataclasses.fields(ConvertModelOutput)],\n    meta_fields=[],\n)\n\n\n@dataclasses.dataclass(frozen=True)\nclass AtomCrossAtt:\n  \"\"\"Operate on flat atoms.\"\"\"\n\n  token_atoms_to_queries: atom_layout.GatherInfo\n  tokens_to_queries: atom_layout.GatherInfo\n  tokens_to_keys: atom_layout.GatherInfo\n  queries_to_keys: atom_layout.GatherInfo\n  
queries_to_token_atoms: atom_layout.GatherInfo\n\n  @classmethod\n  def compute_features(\n      cls,\n      all_token_atoms_layout: atom_layout.AtomLayout,  # (num_tokens, num_dense)\n      queries_subset_size: int,\n      keys_subset_size: int,\n      padding_shapes: PaddingShapes,\n  ) -> Self:\n    \"\"\"Computes gather indices and meta data to work with a flat atom list.\"\"\"\n\n    token_atoms_layout = all_token_atoms_layout.copy_and_pad_to(\n        (padding_shapes.num_tokens, all_token_atoms_layout.shape[1])\n    )\n    token_atoms_mask = token_atoms_layout.atom_name.astype(bool)\n    flat_layout = token_atoms_layout[token_atoms_mask]\n    num_atoms = flat_layout.shape[0]\n\n    padded_flat_layout = flat_layout.copy_and_pad_to((\n        padding_shapes.num_atoms,\n    ))\n\n    # Create the layout for queries\n    num_subsets = padding_shapes.num_atoms // queries_subset_size\n    lay_arr = padded_flat_layout.to_array()\n    queries_layout = atom_layout.AtomLayout.from_array(\n        lay_arr.reshape((6, num_subsets, queries_subset_size))\n    )\n\n    # Create the layout for the keys (the key subsets are centered around the\n    # query subsets)\n    # Create initial gather indices (contain out-of-bound indices)\n    subset_centers = np.arange(\n        queries_subset_size / 2, padding_shapes.num_atoms, queries_subset_size\n    )\n    flat_to_key_gathers = (\n        subset_centers[:, None]\n        + np.arange(-keys_subset_size / 2, keys_subset_size / 2)[None, :]\n    )\n    flat_to_key_gathers = flat_to_key_gathers.astype(int)\n    # Shift subsets with out-of-bound indices, such that they are fully within\n    # the bounds.\n    for row in range(flat_to_key_gathers.shape[0]):\n      if flat_to_key_gathers[row, 0] < 0:\n        flat_to_key_gathers[row, :] -= flat_to_key_gathers[row, 0]\n      elif flat_to_key_gathers[row, -1] > num_atoms - 1:\n        overflow = flat_to_key_gathers[row, -1] - (num_atoms - 1)\n        flat_to_key_gathers[row, :] -= 
overflow\n    # Create the keys layout.\n    keys_layout = padded_flat_layout[flat_to_key_gathers]\n\n    # Create gather indices for conversion between token atoms layout,\n    # queries layout and keys layout.\n    token_atoms_to_queries = atom_layout.compute_gather_idxs(\n        source_layout=token_atoms_layout, target_layout=queries_layout\n    )\n\n    token_atoms_to_keys = atom_layout.compute_gather_idxs(\n        source_layout=token_atoms_layout, target_layout=keys_layout\n    )\n\n    queries_to_keys = atom_layout.compute_gather_idxs(\n        source_layout=queries_layout, target_layout=keys_layout\n    )\n\n    queries_to_token_atoms = atom_layout.compute_gather_idxs(\n        source_layout=queries_layout, target_layout=token_atoms_layout\n    )\n\n    # Create gather indices for conversion of tokens layout to\n    # queries and keys layout\n    token_idxs = np.arange(padding_shapes.num_tokens).astype(np.int64)\n    token_idxs = np.broadcast_to(token_idxs[:, None], token_atoms_layout.shape)\n    tokens_to_queries = atom_layout.GatherInfo(\n        gather_idxs=atom_layout.convert(\n            token_atoms_to_queries, token_idxs, layout_axes=(0, 1)\n        ),\n        gather_mask=atom_layout.convert(\n            token_atoms_to_queries, token_atoms_mask, layout_axes=(0, 1)\n        ),\n        input_shape=np.array((padding_shapes.num_tokens,)),\n    )\n\n    tokens_to_keys = atom_layout.GatherInfo(\n        gather_idxs=atom_layout.convert(\n            token_atoms_to_keys, token_idxs, layout_axes=(0, 1)\n        ),\n        gather_mask=atom_layout.convert(\n            token_atoms_to_keys, token_atoms_mask, layout_axes=(0, 1)\n        ),\n        input_shape=np.array((padding_shapes.num_tokens,)),\n    )\n\n    return cls(\n        token_atoms_to_queries=token_atoms_to_queries,\n        tokens_to_queries=tokens_to_queries,\n        tokens_to_keys=tokens_to_keys,\n        queries_to_keys=queries_to_keys,\n        
queries_to_token_atoms=queries_to_token_atoms,\n    )\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    return cls(\n        token_atoms_to_queries=atom_layout.GatherInfo.from_dict(\n            batch, key_prefix='token_atoms_to_queries'\n        ),\n        tokens_to_queries=atom_layout.GatherInfo.from_dict(\n            batch, key_prefix='tokens_to_queries'\n        ),\n        tokens_to_keys=atom_layout.GatherInfo.from_dict(\n            batch, key_prefix='tokens_to_keys'\n        ),\n        queries_to_keys=atom_layout.GatherInfo.from_dict(\n            batch, key_prefix='queries_to_keys'\n        ),\n        queries_to_token_atoms=atom_layout.GatherInfo.from_dict(\n            batch, key_prefix='queries_to_token_atoms'\n        ),\n    )\n\n  def as_data_dict(self) -> BatchDict:\n    return {\n        **self.token_atoms_to_queries.as_dict(\n            key_prefix='token_atoms_to_queries'\n        ),\n        **self.tokens_to_queries.as_dict(key_prefix='tokens_to_queries'),\n        **self.tokens_to_keys.as_dict(key_prefix='tokens_to_keys'),\n        **self.queries_to_keys.as_dict(key_prefix='queries_to_keys'),\n        **self.queries_to_token_atoms.as_dict(\n            key_prefix='queries_to_token_atoms'\n        ),\n    }\n\n\njax.tree_util.register_dataclass(\n    AtomCrossAtt,\n    data_fields=[f.name for f in dataclasses.fields(AtomCrossAtt)],\n    meta_fields=[],\n)\n\n\n@dataclasses.dataclass(frozen=True)\nclass Frames:\n  \"\"\"Features for backbone frames.\"\"\"\n\n  mask: xnp_ndarray\n\n  @classmethod\n  def compute_features(\n      cls,\n      all_tokens: atom_layout.AtomLayout,\n      all_token_atoms_layout: atom_layout.AtomLayout,\n      ref_structure: RefStructure,\n      padding_shapes: PaddingShapes,\n  ) -> Self:\n    \"\"\"Computes features for backbone frames.\"\"\"\n    num_tokens = padding_shapes.num_tokens\n    all_token_atoms_layout = all_token_atoms_layout.copy_and_pad_to(\n        (num_tokens, 
all_token_atoms_layout.shape[1])\n    )\n\n    all_token_atoms_to_all_tokens = atom_layout.compute_gather_idxs(\n        source_layout=all_token_atoms_layout, target_layout=all_tokens\n    )\n    ref_coordinates = atom_layout.convert(\n        all_token_atoms_to_all_tokens,\n        ref_structure.positions.astype(np.float32),\n        layout_axes=(0, 1),\n    )\n    ref_mask = atom_layout.convert(\n        all_token_atoms_to_all_tokens,\n        ref_structure.mask.astype(bool),\n        layout_axes=(0, 1),\n    )\n    ref_mask = ref_mask & all_token_atoms_to_all_tokens.gather_mask.astype(bool)\n\n    all_frame_mask = []\n\n    # Iterate over tokens\n    for idx, args in enumerate(\n        zip(all_tokens.chain_type, all_tokens.chain_id, all_tokens.res_id)\n    ):\n\n      chain_type, chain_id, res_id = args\n\n      if chain_type in list(mmcif_names.PEPTIDE_CHAIN_TYPES):\n        frame_mask = True\n      elif chain_type in list(mmcif_names.NUCLEIC_ACID_CHAIN_TYPES):\n        frame_mask = True\n      elif chain_type in list(mmcif_names.NON_POLYMER_CHAIN_TYPES):\n        # For ligands, build frames from closest atoms from the same molecule.\n        (local_token_idxs,) = np.where(\n            (all_tokens.chain_type == chain_type)\n            & (all_tokens.chain_id == chain_id)\n            & (all_tokens.res_id == res_id)\n        )\n\n        if len(local_token_idxs) < 3:\n          frame_mask = False\n\n        else:\n          # [local_tokens]\n          local_dist = np.linalg.norm(\n              ref_coordinates[idx] - ref_coordinates[local_token_idxs], axis=-1\n          )\n          local_mask = ref_mask[local_token_idxs]\n          cost = local_dist + 1e8 * ~local_mask\n          cost = cost + 1e8 * (idx == local_token_idxs)\n          # [local_tokens]\n          closest_idxs = np.argsort(cost, axis=0)\n\n          # The closest indices index an array of local tokens. 
Convert this\n          # to indices of the full (num_tokens,) array.\n          global_closest_idxs = local_token_idxs[closest_idxs]\n\n          # Construct frame by placing the current token at the origin and two\n          # nearest atoms on either side.\n          global_frame_idxs = np.array(\n              (global_closest_idxs[0], idx, global_closest_idxs[1])\n          )\n\n          # Check that the frame atoms are not colinear.\n          a, b, c = ref_coordinates[global_frame_idxs]\n          vec1 = a - b\n          vec2 = c - b\n          # Reference coordinates can be all zeros, in which case we have\n          # to explicitly set colinearity.\n          if np.isclose(np.linalg.norm(vec1, axis=-1), 0) or np.isclose(\n              np.linalg.norm(vec2, axis=-1), 0\n          ):\n            is_colinear = True\n            logging.info('Found identical coordinates: Assigning as colinear.')\n          else:\n            vec1 = vec1 / np.linalg.norm(vec1, axis=-1)\n            vec2 = vec2 / np.linalg.norm(vec2, axis=-1)\n            cos_angle = np.einsum('...k,...k->...', vec1, vec2)\n            # <25 degree deviation is considered colinear.\n            is_colinear = 1 - np.abs(cos_angle) < 0.0937\n\n          frame_mask = not is_colinear\n      else:\n        # No frame for other chain types.\n        frame_mask = False\n\n      all_frame_mask.append(frame_mask)\n\n    all_frame_mask = np.array(all_frame_mask, dtype=bool)\n\n    mask = _pad_to(all_frame_mask, (padding_shapes.num_tokens,))\n\n    return cls(mask=mask)\n\n  @classmethod\n  def from_data_dict(cls, batch: BatchDict) -> Self:\n    return cls(mask=batch['frames_mask'])\n\n  def as_data_dict(self) -> BatchDict:\n    return {'frames_mask': self.mask}\n\n\njax.tree_util.register_dataclass(\n    Frames,\n    data_fields=[f.name for f in dataclasses.fields(Frames)],\n    meta_fields=[],\n)\n"
  },
  {
    "path": "src/alphafold3/model/merging_features.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Methods for merging existing features to create a new example.\n\nCovers:\n- Merging features across chains.\n- Merging the paired and unpaired parts of the MSA.\n\"\"\"\n\nfrom typing import TypeAlias\n\nfrom alphafold3.model import data_constants\nimport jax.numpy as jnp\nimport numpy as np\n\nNUM_SEQ_NUM_RES_MSA_FEATURES = data_constants.NUM_SEQ_NUM_RES_MSA_FEATURES\nNUM_SEQ_MSA_FEATURES = data_constants.NUM_SEQ_MSA_FEATURES\nMSA_PAD_VALUES = data_constants.MSA_PAD_VALUES\n\n\nxnp_ndarray: TypeAlias = np.ndarray | jnp.ndarray  # pylint: disable=invalid-name\nBatchDict: TypeAlias = dict[str, xnp_ndarray]\n\n\ndef _pad_features_to_max(feat_name: str, chains: list[BatchDict], axis: int):\n  \"\"\"Pad a set of features to the maximum size amongst all chains.\n\n  Args:\n    feat_name: The feature name to pad.\n    chains: A list of chains with associated features.\n    axis: Which axis to pad to the max.\n\n  Returns:\n    A list of features, all with the same size on the given axis.\n  \"\"\"\n  max_num_seq = np.max([chain[feat_name].shape[axis] for chain in chains])\n\n  padded_feats = []\n  for chain in chains:\n    feat = chain[feat_name]\n\n    padding = np.zeros_like(feat.shape)  # pytype: disable=attribute-error\n    padding[axis] = max_num_seq - feat.shape[axis]  # pytype: disable=attribute-error\n    padding = [(0, p) for p in padding]\n    padded_feats.append(\n        np.pad(\n            feat,\n            
padding,\n            mode='constant',\n            constant_values=MSA_PAD_VALUES[feat_name],\n        )\n    )\n  return padded_feats\n\n\ndef merge_msa_features(feat_name: str, chains: list[BatchDict]) -> np.ndarray:\n  \"\"\"Merges MSA features with shape (NUM_SEQ, NUM_RES) across chains.\"\"\"\n  expected_dtype = chains[0][feat_name].dtype\n  if '_all_seq' in feat_name:\n    return np.concatenate(\n        [c.get(feat_name, np.array([], expected_dtype)) for c in chains], axis=1\n    )\n  else:\n    # Since each MSA can be of different lengths, we first need to pad them\n    # all to the size of the largest MSA before concatenating.\n    padded_feats = _pad_features_to_max(feat_name, chains, axis=0)\n    return np.concatenate(padded_feats, axis=1)\n\n\ndef merge_paired_and_unpaired_msa(example: BatchDict) -> BatchDict:\n  \"\"\"Concatenates the paired (all_seq) MSA features with the unpaired ones.\"\"\"\n  new_example = dict(example)\n\n  for feature_name in NUM_SEQ_NUM_RES_MSA_FEATURES + NUM_SEQ_MSA_FEATURES:\n    if feature_name in example and feature_name + '_all_seq' in example:\n      feat = example[feature_name]\n      feat_all_seq = example[feature_name + '_all_seq']\n      merged_feat = np.concatenate([feat_all_seq, feat], axis=0)\n      new_example[feature_name] = merged_feat\n\n  new_example['num_alignments'] = np.array(\n      new_example['msa'].shape[0], dtype=np.int32\n  )\n  return new_example\n"
  },
  {
    "path": "src/alphafold3/model/mkdssp_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include \"alphafold3/model/mkdssp_pybind.h\"\n\n#include <filesystem>\n\n#include <cif++/file.hpp>\n#include <cif++/pdb.hpp>\n#include <dssp.hpp>\n#include <sstream>\n\n#include \"absl/strings/string_view.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11/pytypes.h\"\n\nnamespace alphafold3 {\nnamespace py = pybind11;\n\nvoid RegisterModuleMkdssp(pybind11::module m) {\n  if (!getenv(\"LIBCIFPP_DATA_DIR\")) {\n    py::module site = py::module::import(\"site\");\n    py::list paths = py::cast<py::list>(site.attr(\"getsitepackages\")());\n    // Find the first path that contains the libcifpp components.cif file.\n    bool found = false;\n    for (const auto& py_path : paths) {\n      auto path_str =\n          std::filesystem::path(py::cast<absl::string_view>(py_path)) /\n          \"share/libcifpp/components.cif\";\n      if (std::filesystem::exists(path_str)) {\n        setenv(\"LIBCIFPP_DATA_DIR\", path_str.parent_path().c_str(), 0);\n        found = true;\n        break;\n      }\n    }\n    if (!found) {\n      throw py::type_error(\n        \"Could not find the libcifpp components.cif file.\");\n    }\n  }\n  m.def(\n      \"get_dssp\",\n      [](absl::string_view mmcif, int model_no,\n         int min_poly_proline_stretch_length,\n         bool calculate_surface_accessibility) {\n        cif::file cif_file(mmcif.data(), mmcif.size());\n        dssp result(cif_file.front(), model_no, 
min_poly_proline_stretch_length,\n                    calculate_surface_accessibility);\n        std::stringstream sstream;\n        result.write_legacy_output(sstream);\n        return sstream.str();\n      },\n      py::arg(\"mmcif\"), py::arg(\"model_no\") = 1,\n      py::arg(\"min_poly_proline_stretch_length\") = 3,\n      py::arg(\"calculate_surface_accessibility\") = false,\n      py::doc(\"Gets secondary structure from an mmCIF file.\"));\n}\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/model/mkdssp_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_MODEL_MKDSSP_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_MODEL_MKDSSP_PYBIND_H_\n\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMkdssp(pybind11::module m);\n\n}\n\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_MODEL_MKDSSP_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/model/mmcif_metadata.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Adds mmCIF metadata (to be ModelCIF-conformant) and author and legal info.\"\"\"\n\nfrom typing import Final\n\nfrom alphafold3.structure import mmcif\nimport numpy as np\n\n_LICENSE_URL: Final[str] = (\n    'https://github.com/google-deepmind/alphafold3/blob/main/OUTPUT_TERMS_OF_USE.md'\n)\n\n_LICENSE: Final[str] = f\"\"\"\nNon-commercial use only, by using this file you agree to the terms of use found\nat {_LICENSE_URL}.\nTo request access to the AlphaFold 3 model parameters, follow the process set\nout at https://github.com/google-deepmind/alphafold3. You may only use these if\nreceived directly from Google. Use is subject to terms of use available at\nhttps://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md.\n\"\"\".strip()\n\n_DISCLAIMER: Final[str] = \"\"\"\\\nAlphaFold 3 and its output are not intended for, have not been validated for,\nand are not approved for clinical use. They are provided \"as-is\" without any\nwarranty of any kind, whether expressed or implied. 
No warranty is given that\nuse shall not infringe the rights of any third party.\n\"\"\".strip()\n\n_MMCIF_PAPER_AUTHORS: Final[tuple[str, ...]] = (\n    'Google DeepMind',\n    'Isomorphic Labs',\n)\n\n# Authors of the mmCIF - we set them to be equal to the authors of the paper.\n_MMCIF_AUTHORS: Final[tuple[str, ...]] = _MMCIF_PAPER_AUTHORS\n\n\ndef add_metadata_to_mmcif(\n    old_cif: mmcif.Mmcif, version: str, model_id: bytes\n) -> mmcif.Mmcif:\n  \"\"\"Adds metadata to a mmCIF to make it ModelCIF-conformant.\"\"\"\n  cif = {}\n\n  # ModelCIF conformation dictionary.\n  cif['_audit_conform.dict_name'] = ['mmcif_ma.dic']\n  cif['_audit_conform.dict_version'] = ['1.4.5']\n  cif['_audit_conform.dict_location'] = [\n      'https://raw.githubusercontent.com/ihmwg/ModelCIF/master/dist/mmcif_ma.dic'\n  ]\n\n  cif['_pdbx_data_usage.id'] = ['1', '2']\n  cif['_pdbx_data_usage.type'] = ['license', 'disclaimer']\n  cif['_pdbx_data_usage.details'] = [_LICENSE, _DISCLAIMER]\n  cif['_pdbx_data_usage.url'] = [_LICENSE_URL, '?']\n\n  # Structure author details.\n  cif['_audit_author.name'] = []\n  cif['_audit_author.pdbx_ordinal'] = []\n  for author_index, author_name in enumerate(_MMCIF_AUTHORS, start=1):\n    cif['_audit_author.name'].append(author_name)\n    cif['_audit_author.pdbx_ordinal'].append(str(author_index))\n\n  # Paper author details.\n  cif['_citation_author.citation_id'] = []\n  cif['_citation_author.name'] = []\n  cif['_citation_author.ordinal'] = []\n  for author_index, author_name in enumerate(_MMCIF_PAPER_AUTHORS, start=1):\n    cif['_citation_author.citation_id'].append('primary')\n    cif['_citation_author.name'].append(author_name)\n    cif['_citation_author.ordinal'].append(str(author_index))\n\n  # Paper citation details.\n  cif['_citation.id'] = ['primary']\n  cif['_citation.title'] = [\n      'Accurate structure prediction of biomolecular interactions with'\n      ' AlphaFold 3'\n  ]\n  cif['_citation.journal_full'] = ['Nature']\n  
cif['_citation.journal_volume'] = ['630']\n  cif['_citation.page_first'] = ['493']\n  cif['_citation.page_last'] = ['500']\n  cif['_citation.year'] = ['2024']\n  cif['_citation.journal_id_ASTM'] = ['NATUAS']\n  cif['_citation.country'] = ['UK']\n  cif['_citation.journal_id_ISSN'] = ['0028-0836']\n  cif['_citation.journal_id_CSD'] = ['0006']\n  cif['_citation.book_publisher'] = ['?']\n  cif['_citation.pdbx_database_id_PubMed'] = ['38718835']\n  cif['_citation.pdbx_database_id_DOI'] = ['10.1038/s41586-024-07487-w']\n\n  # Type of data in the dataset including data used in the model generation.\n  cif['_ma_data.id'] = ['1']\n  cif['_ma_data.name'] = ['Model']\n  cif['_ma_data.content_type'] = ['model coordinates']\n\n  # Description of number of instances for each entity.\n  cif['_ma_target_entity_instance.asym_id'] = old_cif['_struct_asym.id']\n  cif['_ma_target_entity_instance.entity_id'] = old_cif[\n      '_struct_asym.entity_id'\n  ]\n  cif['_ma_target_entity_instance.details'] = ['.'] * len(\n      cif['_ma_target_entity_instance.entity_id']\n  )\n\n  # Details about the target entities.\n  cif['_ma_target_entity.entity_id'] = cif[\n      '_ma_target_entity_instance.entity_id'\n  ]\n  cif['_ma_target_entity.data_id'] = ['1'] * len(\n      cif['_ma_target_entity.entity_id']\n  )\n  cif['_ma_target_entity.origin'] = ['.'] * len(\n      cif['_ma_target_entity.entity_id']\n  )\n\n  # Details of the models being deposited.\n  cif['_ma_model_list.ordinal_id'] = ['1']\n  cif['_ma_model_list.model_id'] = ['1']\n  cif['_ma_model_list.model_group_id'] = ['1']\n  cif['_ma_model_list.model_name'] = ['Top ranked model']\n\n  cif['_ma_model_list.model_group_name'] = [\n      f'AlphaFold-beta-20231127 ({version})'\n  ]\n  cif['_ma_model_list.data_id'] = ['1']\n  cif['_ma_model_list.model_type'] = ['Ab initio model']\n\n  # Software used.\n  cif['_software.pdbx_ordinal'] = ['1']\n  cif['_software.name'] = ['AlphaFold']\n  cif['_software.version'] = [\n      
f'AlphaFold-beta-20231127 ({model_id.decode(\"ascii\")})'\n  ]\n  cif['_software.type'] = ['package']\n  cif['_software.description'] = ['Structure prediction']\n  cif['_software.classification'] = ['other']\n  cif['_software.date'] = ['?']\n\n  # Collection of software into groups.\n  cif['_ma_software_group.ordinal_id'] = ['1']\n  cif['_ma_software_group.group_id'] = ['1']\n  cif['_ma_software_group.software_id'] = ['1']\n\n  # Method description to conform with ModelCIF.\n  cif['_ma_protocol_step.ordinal_id'] = ['1', '2', '3']\n  cif['_ma_protocol_step.protocol_id'] = ['1', '1', '1']\n  cif['_ma_protocol_step.step_id'] = ['1', '2', '3']\n  cif['_ma_protocol_step.method_type'] = [\n      'coevolution MSA',\n      'template search',\n      'modeling',\n  ]\n\n  # Details of the metrics use to assess model confidence.\n  cif['_ma_qa_metric.id'] = ['1', '2']\n  cif['_ma_qa_metric.name'] = ['pLDDT', 'pLDDT']\n  # Accepted values are distance, energy, normalised score, other, zscore.\n  cif['_ma_qa_metric.type'] = ['pLDDT', 'pLDDT']\n  cif['_ma_qa_metric.mode'] = ['global', 'local']\n  cif['_ma_qa_metric.software_group_id'] = ['1', '1']\n\n  # Global model confidence pLDDT value.\n  cif['_ma_qa_metric_global.ordinal_id'] = ['1']\n  cif['_ma_qa_metric_global.model_id'] = ['1']\n  cif['_ma_qa_metric_global.metric_id'] = ['1']\n  # Mean over all atoms, since AlphaFold 3 outputs pLDDT per-atom.\n  global_plddt = np.mean(\n      [float(v) for v in old_cif['_atom_site.B_iso_or_equiv']]\n  )\n  cif['_ma_qa_metric_global.metric_value'] = [f'{global_plddt:.2f}']\n\n  # Local (per residue) model confidence pLDDT value.\n  cif['_ma_qa_metric_local.ordinal_id'] = []\n  cif['_ma_qa_metric_local.model_id'] = []\n  cif['_ma_qa_metric_local.label_asym_id'] = []\n  cif['_ma_qa_metric_local.label_seq_id'] = []\n  cif['_ma_qa_metric_local.label_comp_id'] = []\n  cif['_ma_qa_metric_local.metric_id'] = []\n  cif['_ma_qa_metric_local.metric_value'] = []\n\n  plddt_grouped_by_res = {}\n  
for *res, atom_plddt in zip(\n      old_cif['_atom_site.label_asym_id'],\n      old_cif['_atom_site.label_seq_id'],\n      old_cif['_atom_site.label_comp_id'],\n      old_cif['_atom_site.B_iso_or_equiv'],\n  ):\n    plddt_grouped_by_res.setdefault(tuple(res), []).append(float(atom_plddt))\n\n  for ordinal_id, ((chain_id, res_id, res_name), res_plddts) in enumerate(\n      plddt_grouped_by_res.items(), start=1\n  ):\n    res_plddt = np.mean(res_plddts)\n    cif['_ma_qa_metric_local.ordinal_id'].append(str(ordinal_id))\n    cif['_ma_qa_metric_local.model_id'].append('1')\n    cif['_ma_qa_metric_local.label_asym_id'].append(chain_id)\n    cif['_ma_qa_metric_local.label_seq_id'].append(res_id)\n    cif['_ma_qa_metric_local.label_comp_id'].append(res_name)\n    cif['_ma_qa_metric_local.metric_id'].append('2')  # See _ma_qa_metric.id.\n    cif['_ma_qa_metric_local.metric_value'].append(f'{res_plddt:.2f}')\n\n  cif['_atom_type.symbol'] = sorted(set(old_cif['_atom_site.type_symbol']))\n\n  return old_cif.copy_and_update(cif)\n\n\ndef add_legal_comment(cif: str) -> str:\n  \"\"\"Adds legal comment at the top of the mmCIF.\"\"\"\n  # fmt: off\n  # pylint: disable=line-too-long\n  comment = (\n      '# By using this file you agree to the legally binding terms of use found at\\n'\n      f'# {_LICENSE_URL}.\\n'\n      '# To request access to the AlphaFold 3 model parameters, follow the process set\\n'\n      '# out at https://github.com/google-deepmind/alphafold3. You may only use these if\\n'\n      '# received directly from Google. Use is subject to terms of use available at\\n'\n      '# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md.'\n  )\n  # pylint: enable=line-too-long\n  # fmt: on\n  return f'{comment}\\n{cif}'\n"
  },
  {
    "path": "src/alphafold3/model/model.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"AlphaFold3 model.\"\"\"\n\nfrom collections.abc import Iterable, Mapping\nimport concurrent\nimport dataclasses\nimport functools\nfrom typing import Any, TypeAlias\n\nfrom absl import logging\nfrom alphafold3 import structure\nfrom alphafold3.common import base_config\nfrom alphafold3.model import confidences\nfrom alphafold3.model import feat_batch\nfrom alphafold3.model import features\nfrom alphafold3.model import model_config\nfrom alphafold3.model.atom_layout import atom_layout\nfrom alphafold3.model.components import mapping\nfrom alphafold3.model.components import utils\nfrom alphafold3.model.network import atom_cross_attention\nfrom alphafold3.model.network import confidence_head\nfrom alphafold3.model.network import diffusion_head\nfrom alphafold3.model.network import distogram_head\nfrom alphafold3.model.network import evoformer as evoformer_network\nfrom alphafold3.model.network import featurization\nimport haiku as hk\nimport jax\nimport jax.numpy as jnp\nimport numpy as np\n\n\nModelResult: TypeAlias = Mapping[str, Any]\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True)\nclass InferenceResult:\n  \"\"\"Postprocessed model result.\n\n  Attributes:\n    predicted_structure: Predicted protein structure.\n    numerical_data: Useful numerical data (scalars or arrays) to be saved at\n      inference time.\n    metadata: Smaller numerical data (usually scalar) to be saved as inference\n      metadata.\n    
debug_outputs: Additional dict for debugging, e.g. raw outputs of a model\n      forward pass.\n    model_id: Model identifier.\n  \"\"\"\n\n  predicted_structure: structure.Structure = dataclasses.field()\n  numerical_data: Mapping[str, float | int | np.ndarray] = dataclasses.field(\n      default_factory=dict\n  )\n  metadata: Mapping[str, float | int | np.ndarray] = dataclasses.field(\n      default_factory=dict\n  )\n  debug_outputs: Mapping[str, Any] = dataclasses.field(default_factory=dict)\n  model_id: bytes = b''\n\n\ndef get_predicted_structure(\n    result: ModelResult, batch: feat_batch.Batch\n) -> structure.Structure:\n  \"\"\"Creates the predicted structure and ion preditions.\n\n  Args:\n    result: model output in a model specific layout\n    batch: model input batch\n\n  Returns:\n    Predicted structure.\n  \"\"\"\n  model_output_coords = result['diffusion_samples']['atom_positions']\n\n  # Rearrange model output coordinates to the flat output layout.\n  model_output_to_flat = atom_layout.compute_gather_idxs(\n      source_layout=batch.convert_model_output.token_atoms_layout,\n      target_layout=batch.convert_model_output.flat_output_layout,\n  )\n  pred_flat_atom_coords = atom_layout.convert(\n      gather_info=model_output_to_flat,\n      arr=model_output_coords,\n      layout_axes=(-3, -2),\n  )\n\n  predicted_lddt = result.get('predicted_lddt')\n\n  if predicted_lddt is not None:\n    pred_flat_b_factors = atom_layout.convert(\n        gather_info=model_output_to_flat,\n        arr=predicted_lddt,\n        layout_axes=(-2, -1),\n    )\n  else:\n    # Handle models which don't have predicted_lddt outputs.\n    pred_flat_b_factors = np.zeros(pred_flat_atom_coords.shape[:-1])\n\n  (missing_atoms_indices,) = np.nonzero(model_output_to_flat.gather_mask == 0)\n  if missing_atoms_indices.shape[0] > 0:\n    missing_atoms_flat_layout = batch.convert_model_output.flat_output_layout[\n        missing_atoms_indices\n    ]\n    missing_atoms_uids = list(\n 
       zip(\n            missing_atoms_flat_layout.chain_id,\n            missing_atoms_flat_layout.res_id,\n            missing_atoms_flat_layout.res_name,\n            missing_atoms_flat_layout.atom_name,\n        )\n    )\n    logging.warning(\n        'Target %s: warning: %s atoms were not predicted by the '\n        'model, setting their coordinates to (0, 0, 0). '\n        'Missing atoms: %s',\n        batch.convert_model_output.empty_output_struc.name,\n        missing_atoms_indices.shape[0],\n        missing_atoms_uids,\n    )\n\n  # Put them into a structure\n  pred_struc = batch.convert_model_output.empty_output_struc\n  pred_struc = pred_struc.copy_and_update_atoms(\n      atom_x=pred_flat_atom_coords[..., 0],\n      atom_y=pred_flat_atom_coords[..., 1],\n      atom_z=pred_flat_atom_coords[..., 2],\n      atom_b_factor=pred_flat_b_factors,\n      atom_occupancy=np.ones(pred_flat_atom_coords.shape[:-1]),  # Always 1.0.\n  )\n  # Set manually/differently when adding metadata.\n  pred_struc = pred_struc.copy_and_update_globals(release_date=None)\n  return pred_struc\n\n\ndef create_target_feat_embedding(\n    batch: feat_batch.Batch,\n    config: evoformer_network.Evoformer.Config,\n    global_config: model_config.GlobalConfig,\n) -> jnp.ndarray:\n  \"\"\"Create target feature embedding.\"\"\"\n\n  dtype = jnp.bfloat16 if global_config.bfloat16 == 'all' else jnp.float32\n\n  with utils.bfloat16_context():\n    target_feat = featurization.create_target_feat(\n        batch,\n        append_per_atom_features=False,\n    ).astype(dtype)\n\n    enc = atom_cross_attention.atom_cross_att_encoder(\n        token_atoms_act=None,\n        trunk_single_cond=None,\n        trunk_pair_cond=None,\n        config=config.per_atom_conditioning,\n        global_config=global_config,\n        batch=batch,\n        name='evoformer_conditioning',\n    )\n    target_feat = jnp.concatenate([target_feat, enc.token_act], axis=-1).astype(\n        dtype\n    )\n\n  return 
target_feat\n\n\ndef _compute_ptm(\n    result: ModelResult,\n    num_tokens: int,\n    asym_id: np.ndarray,\n    pae_single_mask: np.ndarray,\n    interface: bool,\n) -> np.ndarray:\n  \"\"\"Computes the pTM metrics from PAE.\"\"\"\n  return np.stack(\n      [\n          confidences.predicted_tm_score(\n              tm_adjusted_pae=tm_adjusted_pae[:num_tokens, :num_tokens],\n              asym_id=asym_id,\n              pair_mask=pae_single_mask[:num_tokens, :num_tokens],\n              interface=interface,\n          )\n          for tm_adjusted_pae in result['tmscore_adjusted_pae_global']\n      ],\n      axis=0,\n  )\n\n\ndef _compute_chain_pair_iptm(\n    num_tokens: int,\n    asym_ids: np.ndarray,\n    mask: np.ndarray,\n    tm_adjusted_pae: np.ndarray,\n) -> np.ndarray:\n  \"\"\"Computes the chain pair ipTM metrics from PAE.\"\"\"\n  return np.stack(\n      [\n          confidences.chain_pairwise_predicted_tm_scores(\n              tm_adjusted_pae=sample_tm_adjusted_pae[:num_tokens],\n              asym_id=asym_ids[:num_tokens],\n              pair_mask=mask[:num_tokens, :num_tokens],\n          )\n          for sample_tm_adjusted_pae in tm_adjusted_pae\n      ],\n      axis=0,\n  )\n\n\nclass Model(hk.Module):\n  \"\"\"Full model. 
Takes in data batch and returns model outputs.\"\"\"\n\n  class HeadsConfig(base_config.BaseConfig):\n    diffusion: diffusion_head.DiffusionHead.Config = base_config.autocreate()\n    confidence: confidence_head.ConfidenceHead.Config = base_config.autocreate()\n    distogram: distogram_head.DistogramHead.Config = base_config.autocreate()\n\n  class Config(base_config.BaseConfig):\n    evoformer: evoformer_network.Evoformer.Config = base_config.autocreate()\n    global_config: model_config.GlobalConfig = base_config.autocreate()\n    heads: 'Model.HeadsConfig' = base_config.autocreate()\n    num_recycles: int = 10\n    return_embeddings: bool = False\n    return_distogram: bool = False\n\n  def __init__(self, config: Config, name: str = 'diffuser'):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = config.global_config\n    self.diffusion_module = diffusion_head.DiffusionHead(\n        self.config.heads.diffusion, self.global_config\n    )\n\n  @hk.transparent\n  def _sample_diffusion(\n      self,\n      batch: feat_batch.Batch,\n      embeddings: dict[str, jnp.ndarray],\n      *,\n      sample_config: diffusion_head.SampleConfig,\n  ) -> dict[str, jnp.ndarray]:\n    denoising_step = functools.partial(\n        self.diffusion_module,\n        batch=batch,\n        embeddings=embeddings,\n        use_conditioning=True,\n    )\n\n    sample = diffusion_head.sample(\n        denoising_step=denoising_step,\n        batch=batch,\n        key=hk.next_rng_key(),\n        config=sample_config,\n    )\n    return sample\n\n  def __call__(\n      self, batch: features.BatchDict, key: jax.Array | None = None\n  ) -> ModelResult:\n    if key is None:\n      key = hk.next_rng_key()\n\n    batch = feat_batch.Batch.from_data_dict(batch)\n\n    embedding_module = evoformer_network.Evoformer(\n        self.config.evoformer, self.global_config\n    )\n    target_feat = create_target_feat_embedding(\n        batch=batch,\n        
config=embedding_module.config,\n        global_config=self.global_config,\n    )\n\n    def recycle_body(_, args):\n      prev, key = args\n      key, subkey = jax.random.split(key)\n      embeddings = embedding_module(\n          batch=batch,\n          prev=prev,\n          target_feat=target_feat,\n          key=subkey,\n      )\n      embeddings['pair'] = embeddings['pair'].astype(jnp.float32)\n      embeddings['single'] = embeddings['single'].astype(jnp.float32)\n      return embeddings, key\n\n    num_res = batch.num_res\n\n    embeddings = {\n        'pair': jnp.zeros(\n            [num_res, num_res, self.config.evoformer.pair_channel],\n            dtype=jnp.float32,\n        ),\n        'single': jnp.zeros(\n            [num_res, self.config.evoformer.seq_channel], dtype=jnp.float32\n        ),\n        'target_feat': target_feat,\n    }\n    if hk.running_init():\n      embeddings, _ = recycle_body(None, (embeddings, key))\n    else:\n      # Number of recycles is number of additional forward trunk passes.\n      num_iter = self.config.num_recycles + 1\n      embeddings, _ = hk.fori_loop(0, num_iter, recycle_body, (embeddings, key))\n\n    samples = self._sample_diffusion(\n        batch,\n        embeddings,\n        sample_config=self.config.heads.diffusion.eval,\n    )\n\n    # Compute dist_error_fn over all samples for distance error logging.\n    confidence_output = mapping.sharded_map(\n        lambda dense_atom_positions: confidence_head.ConfidenceHead(\n            self.config.heads.confidence, self.global_config\n        )(\n            dense_atom_positions=dense_atom_positions,\n            embeddings=embeddings,\n            seq_mask=batch.token_features.mask,\n            token_atoms_to_pseudo_beta=batch.pseudo_beta_info.token_atoms_to_pseudo_beta,\n            asym_id=batch.token_features.asym_id,\n        ),\n        in_axes=0,\n    )(samples['atom_positions'])\n\n    distogram = distogram_head.DistogramHead(\n        
self.config.heads.distogram, self.global_config\n    )(batch, embeddings, return_distogram=self.config.return_distogram)\n\n    output = {\n        'diffusion_samples': samples,\n        'distogram': distogram,\n        **confidence_output,\n    }\n    if self.config.return_embeddings:\n      output['single_embeddings'] = embeddings['single']\n      output['pair_embeddings'] = embeddings['pair']\n    return output\n\n  @classmethod\n  def get_inference_result(\n      cls,\n      batch: features.BatchDict,\n      result: ModelResult,\n      target_name: str = '',\n  ) -> Iterable[InferenceResult]:\n    \"\"\"Get the predicted structure, scalars, and arrays for inference.\n\n    This function also computes any inference-time quantities, which are not a\n    part of the forward-pass, e.g. additional confidence scores. Note that this\n    function is not serialized, so it should be slim if possible.\n\n    Args:\n      batch: data batch used for model inference, incl. TPU invalid types.\n      result: output dict from the model's forward pass.\n      target_name: target name to be saved within structure.\n\n    Yields:\n      inference_result: dataclass object that contains a predicted structure,\n      important inference-time scalars and arrays, as well as a slightly trimmed\n      dictionary of raw model result from the forward pass (for debugging).\n    \"\"\"\n    del target_name\n    batch = feat_batch.Batch.from_data_dict(batch)\n\n    # Retrieve structure and construct a predicted structure.\n    pred_structure = get_predicted_structure(result=result, batch=batch)\n\n    num_tokens = batch.token_features.seq_length.item()\n\n    pae_single_mask = np.tile(\n        batch.frames.mask[:, None],\n        [1, batch.frames.mask.shape[0]],\n    )\n    ptm = _compute_ptm(\n        result=result,\n        num_tokens=num_tokens,\n        asym_id=batch.token_features.asym_id[:num_tokens],\n        pae_single_mask=pae_single_mask,\n        interface=False,\n    )\n    iptm 
= _compute_ptm(\n        result=result,\n        num_tokens=num_tokens,\n        asym_id=batch.token_features.asym_id[:num_tokens],\n        pae_single_mask=pae_single_mask,\n        interface=True,\n    )\n    ptm_iptm_average = 0.8 * iptm + 0.2 * ptm\n\n    asym_ids = batch.token_features.asym_id[:num_tokens]\n    # Map asym IDs back to chain IDs. Asym IDs are constructed from chain IDs by\n    # iterating over the chain IDs, and for each unique chain ID incrementing\n    # the asym ID by 1 and mapping it to the particular chain ID. Asym IDs are\n    # 1-indexed, so subtract 1 to get back to the chain ID.\n    chain_ids = [pred_structure.chains[asym_id - 1] for asym_id in asym_ids]\n    res_ids = batch.token_features.residue_index[:num_tokens]\n\n    if len(np.unique(asym_ids[:num_tokens])) > 1:\n      # There is more than one chain, hence interface pTM (i.e. ipTM) defined,\n      # so use it.\n      ranking_confidence = ptm_iptm_average\n    else:\n      # There is only one chain, hence ipTM=NaN, so use just pTM.\n      ranking_confidence = ptm\n\n    contact_probs = result['distogram']['contact_probs']\n    # Compute PAE related summaries.\n    _, chain_pair_pae_min, _ = confidences.chain_pair_pae(\n        num_tokens=num_tokens,\n        asym_ids=batch.token_features.asym_id,\n        full_pae=result['full_pae'],\n        mask=pae_single_mask,\n    )\n    chain_pair_pde_mean, chain_pair_pde_min = confidences.chain_pair_pde(\n        num_tokens=num_tokens,\n        asym_ids=batch.token_features.asym_id,\n        full_pde=result['full_pde'],\n    )\n    intra_chain_single_pde, cross_chain_single_pde, _ = confidences.pde_single(\n        num_tokens,\n        batch.token_features.asym_id,\n        result['full_pde'],\n        contact_probs,\n    )\n    pae_metrics = confidences.pae_metrics(\n        num_tokens=num_tokens,\n        asym_ids=batch.token_features.asym_id,\n        full_pae=result['full_pae'],\n        mask=pae_single_mask,\n        
contact_probs=contact_probs,\n        tm_adjusted_pae=result['tmscore_adjusted_pae_interface'],\n    )\n    ranking_confidence_pae = confidences.rank_metric(\n        result['full_pae'],\n        contact_probs * batch.frames.mask[:, None].astype(float),\n    )\n    chain_pair_iptm = _compute_chain_pair_iptm(\n        num_tokens=num_tokens,\n        asym_ids=batch.token_features.asym_id,\n        mask=pae_single_mask,\n        tm_adjusted_pae=result['tmscore_adjusted_pae_interface'],\n    )\n    # iptm_ichain is a vector of per-chain ptm values. iptm_ichain[0],\n    # for example, is just the zeroth diagonal entry of the chain pair iptm\n    # matrix:\n    # [[x, , ],\n    #  [ , , ],\n    #  [ , , ]]]\n    iptm_ichain = chain_pair_iptm.diagonal(axis1=-2, axis2=-1)\n    # iptm_xchain is a vector of cross-chain interactions for each chain.\n    # iptm_xchain[0], for example, is an average of chain 0's interactions with\n    # other chains:\n    # [[ ,x,x],\n    #  [x, , ],\n    #  [x, , ]]]\n    iptm_xchain = confidences.get_iptm_xchain(chain_pair_iptm)\n\n    predicted_distance_errors = result['average_pde']\n\n    # Computing solvent accessible area with dssp can be slow for large\n    # structures with lots of chains, so we parallelize the call.\n    pred_structures = pred_structure.unstack()\n    with concurrent.futures.ThreadPoolExecutor(\n        max_workers=min(len(pred_structures), 32)\n    ) as executor:\n      has_clash = list(executor.map(confidences.has_clash, pred_structures))\n      fraction_disordered = list(\n          executor.map(confidences.fraction_disordered, pred_structures)\n      )\n\n    for idx, pred_structure in enumerate(pred_structures):\n      ranking_score = confidences.get_ranking_score(\n          ptm=ptm[idx],\n          iptm=iptm[idx],\n          fraction_disordered_=fraction_disordered[idx],\n          has_clash_=has_clash[idx],\n      )\n      yield InferenceResult(\n          predicted_structure=pred_structure,\n          
numerical_data={\n              'full_pde': result['full_pde'][idx, :num_tokens, :num_tokens],\n              'full_pae': result['full_pae'][idx, :num_tokens, :num_tokens],\n              'contact_probs': contact_probs[:num_tokens, :num_tokens],\n          },\n          metadata={\n              'predicted_distance_error': predicted_distance_errors[idx],\n              'ranking_score': ranking_score,\n              'fraction_disordered': fraction_disordered[idx],\n              'has_clash': has_clash[idx],\n              'predicted_tm_score': ptm[idx],\n              'interface_predicted_tm_score': iptm[idx],\n              'chain_pair_pde_mean': chain_pair_pde_mean[idx],\n              'chain_pair_pde_min': chain_pair_pde_min[idx],\n              'chain_pair_pae_min': chain_pair_pae_min[idx],\n              'ptm': ptm[idx],\n              'iptm': iptm[idx],\n              'ptm_iptm_average': ptm_iptm_average[idx],\n              'intra_chain_single_pde': intra_chain_single_pde[idx],\n              'cross_chain_single_pde': cross_chain_single_pde[idx],\n              'pae_ichain': pae_metrics['pae_ichain'][idx],\n              'pae_xchain': pae_metrics['pae_xchain'][idx],\n              'ranking_confidence': ranking_confidence[idx],\n              'ranking_confidence_pae': ranking_confidence_pae[idx],\n              'chain_pair_iptm': chain_pair_iptm[idx],\n              'iptm_ichain': iptm_ichain[idx],\n              'iptm_xchain': iptm_xchain[idx],\n              'token_chain_ids': chain_ids,\n              'token_res_ids': res_ids,\n          },\n          model_id=result['__identifier__'],\n          debug_outputs={},\n      )\n"
  },
  {
    "path": "src/alphafold3/model/model_config.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Global config for the model.\"\"\"\n\nfrom collections.abc import Sequence\nfrom typing import Literal, TypeAlias\n\nfrom alphafold3.common import base_config\nimport tokamax\n\n_Shape2DType: TypeAlias = tuple[int | None, int | None]\n\n\nclass GlobalConfig(base_config.BaseConfig):\n  \"\"\"Global configuration for the AlphaFold3 model.\"\"\"\n\n  bfloat16: Literal['all', 'none', 'intermediate'] = 'all'\n  final_init: Literal['zeros', 'linear'] = 'zeros'\n  pair_attention_chunk_size: Sequence[_Shape2DType] = ((1536, 128), (None, 32))\n  pair_transition_shard_spec: Sequence[_Shape2DType] = (\n      (2048, None),\n      (None, 1024),\n  )\n  # Note: flash_attention_implementation = 'xla' means no flash attention.\n  flash_attention_implementation: tokamax.DotProductAttentionImplementation = (\n      'triton'\n  )\n"
  },
  {
    "path": "src/alphafold3/model/msa_pairing.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Functions for producing \"paired\" and \"unpaired\" MSA features for each chain.\n\nThe paired MSA:\n- Is made from the result of the all_seqs MSA query.\n- Is ordered such that you can concatenate features across chains and related\n  sequences will end up on the same row. Related here means \"from the same\n  species\". Gaps are added to facilitate this whenever a sequence has no\n  suitable pair.\n\nThe unpaired MSA:\n- Is made from the results of the remaining MSA queries.\n- Has no special ordering properties.\n- Is deduplicated such that it doesn't contain any sequences in the paired MSA.\n\"\"\"\n\nfrom typing import Mapping, MutableMapping, Sequence\nfrom alphafold3.model import data_constants\nimport numpy as np\n\n\ndef _align_species(\n    all_species: Sequence[bytes],\n    chains_species_to_rows: Sequence[Mapping[bytes, np.ndarray]],\n    min_hits_per_species: Mapping[bytes, int],\n) -> np.ndarray:\n  \"\"\"Aligns MSA row indices based on species.\n\n  Within a species, MSAs are aligned based on their original order (the first\n  sequence for a species in the first chain's MSA is aligned to the first\n  sequence for the same species in the second chain's MSA).\n\n  Args:\n    all_species: A list of all unique species identifiers.\n    chains_species_to_rows: A dictionary for each chain, that maps species to\n      the set of MSA row indices from that species in that chain.\n    min_hits_per_species: A 
mapping from species id, to the minimum MSA size\n      across chains for that species (ignoring chains with zero hits).\n\n  Returns:\n    A matrix of size [num_msa_rows, num_chains], where the i,j element is an\n    index into the jth chains MSA.  Each row consists of sequences from each\n    chain for the same species (or -1 if that chain has no sequences for that\n    species).\n  \"\"\"\n  # Each species block is of size [num_seqs x num_chains] and consists of\n  # indices into the respective MSAs that have been aligned and are all for the\n  # same species.\n  species_blocks = []\n  for species in all_species:\n    chain_row_indices = []\n    for species_to_rows in chains_species_to_rows:\n      min_msa_size = min_hits_per_species[species]\n      if species not in species_to_rows:\n        # If a given chain has no hits for a species then we pad it with -1's,\n        # later on these values are used to make sure each feature is padded\n        # with its appropriate pad value.\n        row_indices = np.full(min_msa_size, fill_value=-1, dtype=np.int32)\n      else:\n        # We crop down to the smallest MSA for a given species across chains.\n        row_indices = species_to_rows[species][:min_msa_size]\n      chain_row_indices.append(row_indices)\n    species_block = np.stack(chain_row_indices, axis=1)\n    species_blocks.append(species_block)\n  aligned_matrix = np.concatenate(species_blocks, axis=0)\n  return aligned_matrix\n\n\ndef create_paired_features(\n    chains: Sequence[MutableMapping[str, np.ndarray]],\n    max_paired_sequences: int,\n    nonempty_chain_ids: set[str],\n    max_hits_per_species: int,\n) -> Sequence[MutableMapping[str, np.ndarray]]:\n  \"\"\"Creates per-chain MSA features where the MSAs have been aligned.\n\n  Args:\n    chains: A list of feature dicts, one for each chain.\n    max_paired_sequences: No more than this many paired sequences will be\n      returned from this function.\n    nonempty_chain_ids: A set of chain ids (str) 
that are included in the crop\n      there is no reason to process chains not in this list.\n    max_hits_per_species: No more than this number of sequences will be returned\n      for a given species.\n\n  Returns:\n    An updated feature dictionary for each chain, where the {}_all_seq features\n    have been aligned so that the nth row in chain 1 is aligned to the nth row\n    in chain 2's features.\n  \"\"\"\n  # The number of chains that the given species appears in - we rank hits\n  # across more chains higher.\n  species_num_chains = {}\n\n  # For each chain we keep a mapping from species to the row indices in the\n  # original MSA for that chain.\n  chains_species_to_rows = []\n\n  # Keep track of the minimum number of hits across chains for a given species.\n  min_hits_per_species = {}\n\n  for chain in chains:\n    species_ids = chain['msa_species_identifiers_all_seq']\n\n    # The query gets an empty species_id, so no pairing happens for this row.\n    if (\n        species_ids.size == 0\n        or (species_ids.size == 1 and not species_ids[0])\n        or chain['chain_id'] not in nonempty_chain_ids\n    ):\n      chains_species_to_rows.append({})\n      continue\n\n    # For each species keep track of which row indices in the original MSA are\n    # from this species.\n    row_indices = np.arange(len(species_ids))\n    # The grouping np.split code requires that the input is already clustered\n    # by species id.\n    sort_idxs = species_ids.argsort()\n    species_ids = species_ids[sort_idxs]\n    row_indices = row_indices[sort_idxs]\n\n    species, unique_row_indices = np.unique(species_ids, return_index=True)\n    grouped_row_indices = np.split(row_indices, unique_row_indices[1:])\n    species_to_rows = dict(zip(species, grouped_row_indices, strict=True))\n    chains_species_to_rows.append(species_to_rows)\n\n    for s in species:\n      species_num_chains[s] = species_num_chains.get(s, 0) + 1\n\n    for species, row_indices in 
species_to_rows.items():\n      min_hits_per_species[species] = min(\n          min_hits_per_species.get(species, max_hits_per_species),\n          len(row_indices),\n      )\n\n  # Construct a mapping from the number of chains a species appears in to\n  # the list of species with that count.\n  num_chains_to_species = {}\n  for species, num_chains in species_num_chains.items():\n    if not species or num_chains <= 1:\n      continue\n    if num_chains not in num_chains_to_species:\n      num_chains_to_species[num_chains] = []\n    num_chains_to_species[num_chains].append(species)\n\n  num_rows_seen = 0\n  # We always keep the first row as it is the query sequence.\n  all_rows = [np.array([[0] * len(chains)], dtype=np.int32)]\n\n  # We prioritize species that have hits across more chains.\n  for num_chains in sorted(num_chains_to_species, reverse=True):\n    all_species = num_chains_to_species[num_chains]\n\n    # Align all the per-chain row indices by species, so every paired row is\n    # for a single species.\n    rows = _align_species(\n        all_species, chains_species_to_rows, min_hits_per_species\n    )\n    # Sort rows by the product of the original indices in the respective chain\n    # MSAS, so as to rank hits that appear higher in the original MSAs higher.\n    rank_metric = np.abs(np.prod(rows.astype(np.float32), axis=1))\n    sorted_rows = rows[np.argsort(rank_metric), :]\n    all_rows.append(sorted_rows)\n    num_rows_seen += rows.shape[0]\n    if num_rows_seen >= max_paired_sequences:\n      break\n\n  all_rows = np.concatenate(all_rows, axis=0)\n  all_rows = all_rows[:max_paired_sequences, :]\n\n  # Now we just have to select the relevant rows from the original msa and\n  # deletion matrix features\n  paired_chains = []\n  for chain_idx, chain in enumerate(chains):\n    out_chain = {k: v for k, v in chain.items() if 'all_seq' not in k}\n    selected_row_indices = all_rows[:, chain_idx]\n    for feat_name in {'msa', 'deletion_matrix'}:\n      
all_seq_name = f'{feat_name}_all_seq'\n      feat_value = chain[all_seq_name]\n\n      # The selected row indices are padded to be the same shape for each chain,\n      # they are padded with -1's, so we add a single row onto the feature with\n      # the appropriate pad value.  This has the effect that we correctly pad\n      # each feature since all padded indices will select this padding row.\n      pad_value = data_constants.MSA_PAD_VALUES[feat_name]\n      feat_value = np.concatenate([\n          feat_value,\n          np.full((1, feat_value.shape[1]), pad_value, feat_value.dtype),\n      ])\n\n      feat_value = feat_value[selected_row_indices, :]\n      out_chain[all_seq_name] = feat_value\n    out_chain['num_alignments_all_seq'] = np.array(\n        out_chain['msa_all_seq'].shape[0]\n    )\n    paired_chains.append(out_chain)\n  return paired_chains\n\n\ndef deduplicate_unpaired_sequences(\n    np_chains: Sequence[MutableMapping[str, np.ndarray]],\n) -> Sequence[MutableMapping[str, np.ndarray]]:\n  \"\"\"Deduplicates unpaired sequences based on paired sequences.\"\"\"\n\n  feature_names = np_chains[0].keys()\n  msa_features = (\n      data_constants.NUM_SEQ_MSA_FEATURES\n      + data_constants.NUM_SEQ_NUM_RES_MSA_FEATURES\n  )\n\n  for chain in np_chains:\n    sequence_set = set(\n        hash(s.data.tobytes()) for s in chain['msa_all_seq'].astype(np.int8)\n    )\n    keep_rows = []\n    # Go through unpaired MSA seqs and remove any rows that correspond to the\n    # sequences that are already present in the paired MSA.\n    for row_num, seq in enumerate(chain['msa'].astype(np.int8)):\n      if hash(seq.data.tobytes()) not in sequence_set:\n        keep_rows.append(row_num)\n    for feature_name in feature_names:\n      if feature_name in msa_features:\n        chain[feature_name] = chain[feature_name][keep_rows]\n    chain['num_alignments'] = np.array(chain['msa'].shape[0], dtype=np.int32)\n  return np_chains\n\n\ndef 
choose_paired_unpaired_msa_crop_sizes(\n    unpaired_msa: np.ndarray,\n    paired_msa: np.ndarray | None,\n    total_msa_crop_size: int,\n    max_paired_sequences: int,\n) -> tuple[int, int | None]:\n  \"\"\"Returns the sizes of the MSA crop and MSA_all_seq crop.\n\n  NOTE: Unpaired + paired MSA sizes can exceed total_msa_size when\n    there are lots of gapped rows. Through the pairing logic another chain(s)\n    will have fewer than total_msa_size.\n\n  Args:\n     unpaired_msa: The unpaired MSA array (not all_seq).\n     paired_msa: The paired MSA array (all_seq).\n     total_msa_crop_size: The maximum total number of sequences to crop to.\n     max_paired_sequences: The maximum number of sequences that can come from\n       MSA pairing.\n\n  Returns:\n    A tuple of:\n      The size of the reduced MSA crop (not all_seq features).\n      The size of the unreduced MSA crop (for all_seq features) or None, if\n        paired_msa is None.\n  \"\"\"\n  if paired_msa is not None:\n    paired_crop_size = np.minimum(paired_msa.shape[0], max_paired_sequences)\n\n    # We reduce the number of un-paired sequences, by the number of times a\n    # sequence from this chains MSA is included in the paired MSA.  
This keeps\n    # the MSA size for each chain roughly constant.\n    cropped_all_seq_msa = paired_msa[:max_paired_sequences]\n    num_non_gapped_pairs = cropped_all_seq_msa.shape[0]\n\n    assert num_non_gapped_pairs <= max_paired_sequences\n    unpaired_crop_size = np.minimum(\n        unpaired_msa.shape[0], total_msa_crop_size - num_non_gapped_pairs\n    )\n    assert unpaired_crop_size >= 0\n  else:\n    unpaired_crop_size = np.minimum(unpaired_msa.shape[0], total_msa_crop_size)\n    paired_crop_size = None\n  return unpaired_crop_size, paired_crop_size\n\n\ndef remove_all_gapped_rows_from_all_seqs(\n    chains_list: Sequence[dict[str, np.ndarray]], asym_ids: Sequence[float]\n) -> Sequence[dict[str, np.ndarray]]:\n  \"\"\"Removes all gapped rows from all_seq feat based on selected asym_ids.\"\"\"\n\n  merged_msa_all_seq = np.concatenate(\n      [\n          chain['msa_all_seq']\n          for chain in chains_list\n          if chain['asym_id'][0] in asym_ids\n      ],\n      axis=1,\n  )\n\n  non_gapped_keep_rows = np.any(\n      merged_msa_all_seq != data_constants.MSA_GAP_IDX, axis=1\n  )\n  for chain in chains_list:\n    for feat_name in list(chains_list)[0]:\n      if '_all_seq' in feat_name:\n        feat_name_split = feat_name.split('_all_seq')[0]\n        if feat_name_split in (\n            data_constants.NUM_SEQ_NUM_RES_MSA_FEATURES\n            + data_constants.NUM_SEQ_MSA_FEATURES\n        ):\n          # For consistency we do this for all chains even though the\n          # gapped rows are based on a selected set asym_ids.\n          chain[feat_name] = chain[feat_name][non_gapped_keep_rows]\n    chain['num_alignments_all_seq'] = np.sum(non_gapped_keep_rows)\n  return chains_list\n"
  },
  {
    "path": "src/alphafold3/model/network/atom_cross_attention.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Per-atom cross attention.\"\"\"\nimport dataclasses\n\nfrom alphafold3.common import base_config\nfrom alphafold3.model import feat_batch\nfrom alphafold3.model import model_config\nfrom alphafold3.model.atom_layout import atom_layout\nfrom alphafold3.model.components import haiku_modules as hm\nfrom alphafold3.model.components import utils\nfrom alphafold3.model.network import diffusion_transformer\nimport jax\nimport jax.numpy as jnp\n\n\nclass AtomCrossAttEncoderConfig(base_config.BaseConfig):\n  per_token_channels: int = 768\n  per_atom_channels: int = 128\n  atom_transformer: diffusion_transformer.CrossAttTransformer.Config = (\n      base_config.autocreate(num_intermediate_factor=2, num_blocks=3)\n  )\n  per_atom_pair_channels: int = 16\n\n\ndef _per_atom_conditioning(\n    config: AtomCrossAttEncoderConfig, batch: feat_batch.Batch, name: str\n) -> tuple[jnp.ndarray, jnp.ndarray]:\n  \"\"\"computes single and pair conditioning for all atoms in each token.\"\"\"\n\n  c = config\n  # Compute per-atom single conditioning\n  # Shape (num_tokens, num_dense, channels)\n  act = hm.Linear(\n      c.per_atom_channels, precision='highest', name=f'{name}_embed_ref_pos'\n  )(batch.ref_structure.positions)\n  act += hm.Linear(c.per_atom_channels, name=f'{name}_embed_ref_mask')(\n      batch.ref_structure.mask.astype(jnp.float32)[:, :, None]\n  )\n  # Element is encoded as atomic number if the periodic table, so\n  # 128 
should be fine.\n  act += hm.Linear(c.per_atom_channels, name=f'{name}_embed_ref_element')(\n      jax.nn.one_hot(batch.ref_structure.element, 128)\n  )\n  act += hm.Linear(c.per_atom_channels, name=f'{name}_embed_ref_charge')(\n      jnp.arcsinh(batch.ref_structure.charge)[:, :, None]\n  )\n  # Characters are encoded as ASCII code minus 32, so we need 64 classes,\n  # to encode all standard ASCII characters between 32 and 96.\n  atom_name_chars_1hot = jax.nn.one_hot(batch.ref_structure.atom_name_chars, 64)\n  num_token, num_dense, _ = act.shape\n  act += hm.Linear(c.per_atom_channels, name=f'{name}_embed_ref_atom_name')(\n      atom_name_chars_1hot.reshape(num_token, num_dense, -1)\n  )\n  act *= batch.ref_structure.mask.astype(jnp.float32)[:, :, None]\n\n  # Compute pair conditioning\n  # shape (num_tokens, num_dense, num_dense, channels)\n  # Embed single features\n  row_act = hm.Linear(\n      c.per_atom_pair_channels, name=f'{name}_single_to_pair_cond_row'\n  )(jax.nn.relu(act))\n  col_act = hm.Linear(\n      c.per_atom_pair_channels, name=f'{name}_single_to_pair_cond_col'\n  )(jax.nn.relu(act))\n  pair_act = row_act[:, :, None, :] + col_act[:, None, :, :]\n  # Embed pairwise offsets\n  pair_act += hm.Linear(\n      c.per_atom_pair_channels,\n      precision='highest',\n      name=f'{name}_embed_pair_offsets',\n  )(\n      batch.ref_structure.positions[:, :, None, :]\n      - batch.ref_structure.positions[:, None, :, :]\n  )\n  # Embed pairwise inverse squared distances\n  sq_dists = jnp.sum(\n      jnp.square(\n          batch.ref_structure.positions[:, :, None, :]\n          - batch.ref_structure.positions[:, None, :, :]\n      ),\n      axis=-1,\n  )\n  pair_act += hm.Linear(\n      c.per_atom_pair_channels, name=f'{name}_embed_pair_distances'\n  )(1.0 / (1 + sq_dists[:, :, :, None]))\n\n  return act, pair_act\n\n\n@dataclasses.dataclass(frozen=True)\nclass AtomCrossAttEncoderOutput:\n  token_act: jnp.ndarray  # (num_tokens, ch)\n  skip_connection: 
jnp.ndarray  # (num_subsets, num_queries, ch)\n  queries_mask: jnp.ndarray  # (num_subsets, num_queries)\n  queries_single_cond: jnp.ndarray  # (num_subsets, num_queries, ch)\n  keys_mask: jnp.ndarray  # (num_subsets, num_keys)\n  keys_single_cond: jnp.ndarray  # (num_subsets, num_keys, ch)\n  pair_cond: jnp.ndarray  # (num_subsets, num_queries, num_keys, ch)\n\n\njax.tree_util.register_dataclass(\n    AtomCrossAttEncoderOutput,\n    data_fields=[f.name for f in dataclasses.fields(AtomCrossAttEncoderOutput)],\n    meta_fields=[],\n)\n\n\ndef atom_cross_att_encoder(\n    token_atoms_act: jnp.ndarray | None,  # (num_tokens, max_atoms_per_token, 3)\n    trunk_single_cond: jnp.ndarray | None,  # (num_tokens, ch)\n    trunk_pair_cond: jnp.ndarray | None,  # (num_tokens, num_tokens, ch)\n    config: AtomCrossAttEncoderConfig,\n    global_config: model_config.GlobalConfig,\n    batch: feat_batch.Batch,\n    name: str,\n) -> AtomCrossAttEncoderOutput:\n  \"\"\"Cross-attention on flat atom subsets and mapping to per-token features.\"\"\"\n  c = config\n\n  # Compute single conditioning from atom meta data and convert to queries\n  # layout.\n  # (num_subsets, num_queries, channels)\n  token_atoms_single_cond, _ = _per_atom_conditioning(config, batch, name)\n  token_atoms_mask = batch.predicted_structure_info.atom_mask\n  queries_single_cond = atom_layout.convert(\n      batch.atom_cross_att.token_atoms_to_queries,\n      token_atoms_single_cond,\n      layout_axes=(-3, -2),\n  )\n  queries_mask = atom_layout.convert(\n      batch.atom_cross_att.token_atoms_to_queries,\n      token_atoms_mask,\n      layout_axes=(-2, -1),\n  )\n\n  # If provided, broadcast single conditioning from trunk to all queries\n  if trunk_single_cond is not None:\n    trunk_single_cond = hm.Linear(\n        c.per_atom_channels,\n        precision='highest',\n        initializer=global_config.final_init,\n        name=f'{name}_embed_trunk_single_cond',\n    )(\n        hm.LayerNorm(\n            
use_fast_variance=False,\n            create_offset=False,\n            name=f'{name}_lnorm_trunk_single_cond',\n        )(trunk_single_cond)\n    )\n    queries_single_cond += atom_layout.convert(\n        batch.atom_cross_att.tokens_to_queries,\n        trunk_single_cond,\n        layout_axes=(-2,),\n    )\n\n  if token_atoms_act is None:\n    # if no token_atoms_act is given (e.g. begin of evoformer), we use the\n    # static conditioning only\n    queries_act = queries_single_cond\n  else:\n    # Convert token_atoms_act to queries layout and map to per_atom_channels\n    # (num_subsets, num_queries, channels)\n    queries_act = atom_layout.convert(\n        batch.atom_cross_att.token_atoms_to_queries,\n        token_atoms_act,\n        layout_axes=(-3, -2),\n    )\n    queries_act = hm.Linear(\n        c.per_atom_channels,\n        precision='highest',\n        name=f'{name}_atom_positions_to_features',\n    )(queries_act)\n    queries_act *= queries_mask[..., None]\n    queries_act += queries_single_cond\n\n  # Gather the keys from the queries.\n  keys_single_cond = atom_layout.convert(\n      batch.atom_cross_att.queries_to_keys,\n      queries_single_cond,\n      layout_axes=(-3, -2),\n  )\n  keys_mask = atom_layout.convert(\n      batch.atom_cross_att.queries_to_keys, queries_mask, layout_axes=(-2, -1)\n  )\n\n  # Embed single features into the pair conditioning.\n  # shape (num_subsets, num_queries, num_keys, ch)\n  row_act = hm.Linear(\n      c.per_atom_pair_channels, name=f'{name}_single_to_pair_cond_row'\n  )(jax.nn.relu(queries_single_cond))\n  pair_cond_keys_input = atom_layout.convert(\n      batch.atom_cross_att.queries_to_keys,\n      queries_single_cond,\n      layout_axes=(-3, -2),\n  )\n  col_act = hm.Linear(\n      c.per_atom_pair_channels, name=f'{name}_single_to_pair_cond_col'\n  )(jax.nn.relu(pair_cond_keys_input))\n  pair_act = row_act[:, :, None, :] + col_act[:, None, :, :]\n\n  if trunk_pair_cond is not None:\n    # If provided, broadcast 
the pair conditioning for the trunk (evoformer\n    # pairs) to the atom pair activations. This should boost ligands, but also\n    # help for cross attention within proteins, because we always have atoms\n    # from multiple residues in a subset.\n    # Map trunk pair conditioning to per_atom_pair_channels\n    # (num_tokens, num_tokens, per_atom_pair_channels)\n    trunk_pair_cond = hm.Linear(\n        c.per_atom_pair_channels,\n        precision='highest',\n        initializer=global_config.final_init,\n        name=f'{name}_embed_trunk_pair_cond',\n    )(\n        hm.LayerNorm(\n            use_fast_variance=False,\n            create_offset=False,\n            name=f'{name}_lnorm_trunk_pair_cond',\n        )(trunk_pair_cond)\n    )\n\n    # Create the GatherInfo into a flattened trunk_pair_cond from the\n    # queries and keys gather infos.\n    num_tokens = trunk_pair_cond.shape[0]\n    # (num_subsets, num_queries)\n    tokens_to_queries = batch.atom_cross_att.tokens_to_queries\n    # (num_subsets, num_keys)\n    tokens_to_keys = batch.atom_cross_att.tokens_to_keys\n    # (num_subsets, num_queries, num_keys)\n    trunk_pair_to_atom_pair = atom_layout.GatherInfo(\n        gather_idxs=(\n            num_tokens * tokens_to_queries.gather_idxs[:, :, None]\n            + tokens_to_keys.gather_idxs[:, None, :]\n        ),\n        gather_mask=(\n            tokens_to_queries.gather_mask[:, :, None]\n            & tokens_to_keys.gather_mask[:, None, :]\n        ),\n        input_shape=jnp.array((num_tokens, num_tokens)),\n    )\n    # Gather the conditioning and add it to the atom-pair activations.\n    pair_act += atom_layout.convert(\n        trunk_pair_to_atom_pair, trunk_pair_cond, layout_axes=(-3, -2)\n    )\n\n  # Embed pairwise offsets\n  queries_ref_pos = atom_layout.convert(\n      batch.atom_cross_att.token_atoms_to_queries,\n      batch.ref_structure.positions,\n      layout_axes=(-3, -2),\n  )\n  queries_ref_space_uid = atom_layout.convert(\n      
batch.atom_cross_att.token_atoms_to_queries,\n      batch.ref_structure.ref_space_uid,\n      layout_axes=(-2, -1),\n  )\n  keys_ref_pos = atom_layout.convert(\n      batch.atom_cross_att.queries_to_keys,\n      queries_ref_pos,\n      layout_axes=(-3, -2),\n  )\n  keys_ref_space_uid = atom_layout.convert(\n      batch.atom_cross_att.queries_to_keys,\n      batch.ref_structure.ref_space_uid,\n      layout_axes=(-2, -1),\n  )\n\n  offsets_valid = (\n      queries_ref_space_uid[:, :, None] == keys_ref_space_uid[:, None, :]\n  )\n  offsets = queries_ref_pos[:, :, None, :] - keys_ref_pos[:, None, :, :]\n  pair_act += (\n      hm.Linear(\n          c.per_atom_pair_channels,\n          precision='highest',\n          name=f'{name}_embed_pair_offsets',\n      )(offsets)\n      * offsets_valid[:, :, :, None]\n  )\n\n  # Embed pairwise inverse squared distances\n  sq_dists = jnp.sum(jnp.square(offsets), axis=-1)\n  pair_act += (\n      hm.Linear(c.per_atom_pair_channels, name=f'{name}_embed_pair_distances')(\n          1.0 / (1 + sq_dists[:, :, :, None])\n      )\n      * offsets_valid[:, :, :, None]\n  )\n  # Embed offsets valid mask\n  pair_act += hm.Linear(\n      c.per_atom_pair_channels, name=f'{name}_embed_pair_offsets_valid'\n  )(offsets_valid[:, :, :, None].astype(jnp.float32))\n\n  # Run a small MLP on the pair acitvations\n  pair_act2 = hm.Linear(\n      c.per_atom_pair_channels, initializer='relu', name=f'{name}_pair_mlp_1'\n  )(jax.nn.relu(pair_act))\n  pair_act2 = hm.Linear(\n      c.per_atom_pair_channels, initializer='relu', name=f'{name}_pair_mlp_2'\n  )(jax.nn.relu(pair_act2))\n  pair_act += hm.Linear(\n      c.per_atom_pair_channels,\n      initializer=global_config.final_init,\n      name=f'{name}_pair_mlp_3',\n  )(jax.nn.relu(pair_act2))\n\n  # Run the atom cross attention transformer.\n  queries_act = diffusion_transformer.CrossAttTransformer(\n      c.atom_transformer, global_config, name=f'{name}_atom_transformer_encoder'\n  )(\n      
queries_act=queries_act,\n      queries_mask=queries_mask,\n      queries_to_keys=batch.atom_cross_att.queries_to_keys,\n      keys_mask=keys_mask,\n      queries_single_cond=queries_single_cond,\n      keys_single_cond=keys_single_cond,\n      pair_cond=pair_act,\n  )\n  queries_act *= queries_mask[..., None]\n  skip_connection = queries_act\n\n  # Convert back to token-atom layout and aggregate to tokens\n  queries_act = hm.Linear(\n      c.per_token_channels, name=f'{name}_project_atom_features_for_aggr'\n  )(queries_act)\n  token_atoms_act = atom_layout.convert(\n      batch.atom_cross_att.queries_to_token_atoms,\n      queries_act,\n      layout_axes=(-3, -2),\n  )\n  token_act = utils.mask_mean(\n      token_atoms_mask[..., None], jax.nn.relu(token_atoms_act), axis=-2\n  )\n\n  return AtomCrossAttEncoderOutput(\n      token_act=token_act,\n      skip_connection=skip_connection,\n      queries_mask=queries_mask,\n      queries_single_cond=queries_single_cond,\n      keys_mask=keys_mask,\n      keys_single_cond=keys_single_cond,\n      pair_cond=pair_act,\n  )\n\n\nclass AtomCrossAttDecoderConfig(base_config.BaseConfig):\n  per_atom_channels: int = 128\n  atom_transformer: diffusion_transformer.CrossAttTransformer.Config = (\n      base_config.autocreate(num_intermediate_factor=2, num_blocks=3)\n  )\n\n\ndef atom_cross_att_decoder(\n    token_act: jnp.ndarray,  # (num_tokens, ch)\n    enc: AtomCrossAttEncoderOutput,\n    config: AtomCrossAttDecoderConfig,\n    global_config: model_config.GlobalConfig,\n    batch: feat_batch.Batch,\n    name: str,\n):  # (num_tokens, max_atoms_per_token, 3)\n  \"\"\"Mapping to per-atom features and self-attention on subsets.\"\"\"\n  c = config\n  # map per-token act down to per_atom channels\n  token_act = hm.Linear(\n      c.per_atom_channels, name=f'{name}_project_token_features_for_broadcast'\n  )(token_act)\n  # Broadcast to token-atoms layout and convert to queries layout.\n  num_token, max_atoms_per_token = (\n      
batch.atom_cross_att.queries_to_token_atoms.shape\n  )\n  token_atom_act = jnp.broadcast_to(\n      token_act[:, None, :],\n      (num_token, max_atoms_per_token, c.per_atom_channels),\n  )\n  queries_act = atom_layout.convert(\n      batch.atom_cross_att.token_atoms_to_queries,\n      token_atom_act,\n      layout_axes=(-3, -2),\n  )\n  queries_act += enc.skip_connection\n  queries_act *= enc.queries_mask[..., None]\n\n  # Run the atom cross attention transformer.\n  queries_act = diffusion_transformer.CrossAttTransformer(\n      c.atom_transformer, global_config, name=f'{name}_atom_transformer_decoder'\n  )(\n      queries_act=queries_act,\n      queries_mask=enc.queries_mask,\n      queries_to_keys=batch.atom_cross_att.queries_to_keys,\n      keys_mask=enc.keys_mask,\n      queries_single_cond=enc.queries_single_cond,\n      keys_single_cond=enc.keys_single_cond,\n      pair_cond=enc.pair_cond,\n  )\n  queries_act *= enc.queries_mask[..., None]\n  queries_act = hm.LayerNorm(\n      use_fast_variance=False,\n      create_offset=False,\n      name=f'{name}_atom_features_layer_norm',\n  )(queries_act)\n  queries_position_update = hm.Linear(\n      3,\n      initializer=global_config.final_init,\n      precision='highest',\n      name=f'{name}_atom_features_to_position_update',\n  )(queries_act)\n  position_update = atom_layout.convert(\n      batch.atom_cross_att.queries_to_token_atoms,\n      queries_position_update,\n      layout_axes=(-3, -2),\n  )\n  return position_update\n"
  },
  {
    "path": "src/alphafold3/model/network/confidence_head.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Confidence Head.\"\"\"\n\nfrom alphafold3.common import base_config\nfrom alphafold3.model import model_config\nfrom alphafold3.model.atom_layout import atom_layout\nfrom alphafold3.model.components import haiku_modules as hm\nfrom alphafold3.model.components import utils\nfrom alphafold3.model.network import modules\nfrom alphafold3.model.network import template_modules\nimport haiku as hk\nimport jax\nimport jax.numpy as jnp\n\n\ndef _safe_norm(x, keepdims, axis, eps=1e-8):\n  return jnp.sqrt(eps + jnp.sum(jnp.square(x), axis=axis, keepdims=keepdims))\n\n\nclass ConfidenceHead(hk.Module):\n  \"\"\"Head to predict the distance errors in a prediction.\"\"\"\n\n  class PAEConfig(base_config.BaseConfig):\n    max_error_bin: float = 31.0\n    num_bins: int = 64\n\n  class Config(base_config.BaseConfig):\n    \"\"\"Configuration for ConfidenceHead.\"\"\"\n\n    pairformer: modules.PairFormerIteration.Config = base_config.autocreate(\n        single_attention=base_config.autocreate(),\n        single_transition=base_config.autocreate(),\n        num_layer=4,\n    )\n    max_error_bin: float = 31.0\n    num_plddt_bins: int = 50\n    num_bins: int = 64\n    no_embedding_prob: float = 0.2\n    pae: 'ConfidenceHead.PAEConfig' = base_config.autocreate()\n    dgram_features: template_modules.DistogramFeaturesConfig = (\n        base_config.autocreate()\n    )\n\n  def __init__(\n      self,\n      config: Config,\n      
global_config: model_config.GlobalConfig,\n      name='confidence_head',\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def _embed_features(\n      self,\n      dense_atom_positions,\n      token_atoms_to_pseudo_beta,\n      pair_mask,\n      pair_act,\n      target_feat,\n  ):\n    out = hm.Linear(pair_act.shape[-1], name='left_target_feat_project')(\n        target_feat\n    ).astype(pair_act.dtype)\n    out += hm.Linear(pair_act.shape[-1], name='right_target_feat_project')(\n        target_feat\n    ).astype(pair_act.dtype)[:, None]\n    positions = atom_layout.convert(\n        token_atoms_to_pseudo_beta,\n        dense_atom_positions,\n        layout_axes=(-3, -2),\n    )\n    dgram = template_modules.dgram_from_positions(\n        positions, self.config.dgram_features\n    )\n    dgram *= pair_mask[..., None]\n\n    out += hm.Linear(pair_act.shape[-1], name='distogram_feat_project')(\n        dgram.astype(pair_act.dtype)\n    )\n    return out\n\n  def __call__(\n      self,\n      dense_atom_positions: jnp.ndarray,\n      embeddings: dict[str, jnp.ndarray],\n      seq_mask: jnp.ndarray,\n      token_atoms_to_pseudo_beta: atom_layout.GatherInfo,\n      asym_id: jnp.ndarray,\n  ) -> dict[str, jnp.ndarray]:\n    \"\"\"Builds ConfidenceHead module.\n\n    Arguments:\n      dense_atom_positions: [N_res, N_atom, 3] array of positions.\n      embeddings: Dictionary of representations.\n      seq_mask: Sequence mask.\n      token_atoms_to_pseudo_beta: Pseudo beta info for atom tokens.\n      asym_id: Asym ID token features.\n\n    Returns:\n      Dictionary of results.\n    \"\"\"\n    dtype = (\n        jnp.bfloat16 if self.global_config.bfloat16 == 'all' else jnp.float32\n    )\n    with utils.bfloat16_context():\n      seq_mask_cast = seq_mask.astype(dtype)\n      pair_mask = seq_mask_cast[:, None] * seq_mask_cast[None, :]\n      pair_mask = pair_mask.astype(dtype)\n\n      pair_act = 
embeddings['pair'].astype(dtype)\n      single_act = embeddings['single'].astype(dtype)\n      target_feat = embeddings['target_feat'].astype(dtype)\n\n      num_residues = seq_mask.shape[0]\n      num_pair_channels = pair_act.shape[2]\n\n      pair_act += self._embed_features(\n          dense_atom_positions,\n          token_atoms_to_pseudo_beta,\n          pair_mask,\n          pair_act,\n          target_feat,\n      )\n\n      def pairformer_fn(act):\n        pair_act, single_act = act\n        return modules.PairFormerIteration(\n            self.config.pairformer,\n            self.global_config,\n            with_single=True,\n            name='confidence_pairformer',\n        )(\n            act=pair_act,\n            single_act=single_act,\n            pair_mask=pair_mask,\n            seq_mask=seq_mask,\n        )\n\n      pairformer_stack = hk.experimental.layer_stack(\n          self.config.pairformer.num_layer\n      )(pairformer_fn)\n\n      pair_act, single_act = pairformer_stack((pair_act, single_act))\n      pair_act = pair_act.astype(jnp.float32)\n      assert pair_act.shape == (num_residues, num_residues, num_pair_channels)\n\n      # Produce logits to predict a distogram of pairwise distance errors\n      # between the input prediction and the ground truth.\n\n      # Shape (num_res, num_res, num_bins)\n      left_distance_logits = hm.Linear(\n          self.config.num_bins,\n          initializer=self.global_config.final_init,\n          name='left_half_distance_logits',\n      )(hm.LayerNorm(name='logits_ln')(pair_act))\n      right_distance_logits = left_distance_logits\n      distance_logits = left_distance_logits + jnp.swapaxes(  # Symmetrize.\n          right_distance_logits, -2, -3\n      )\n      # Shape (num_bins,)\n      distance_breaks = jnp.linspace(\n          0.0, self.config.max_error_bin, self.config.num_bins - 1\n      )\n\n      step = distance_breaks[1] - distance_breaks[0]\n\n      # Add half-step to get the center\n      
bin_centers = distance_breaks + step / 2\n      # Add a catch-all bin at the end.\n      bin_centers = jnp.concatenate(\n          [bin_centers, bin_centers[-1:] + step], axis=0\n      )\n\n      distance_probs = jax.nn.softmax(distance_logits, axis=-1)\n\n      pred_distance_error = (\n          jnp.sum(distance_probs * bin_centers, axis=-1) * pair_mask\n      )\n      average_pred_distance_error = jnp.sum(\n          pred_distance_error, axis=[-2, -1]\n      ) / jnp.sum(pair_mask, axis=[-2, -1])\n\n      # Predicted aligned error\n      pae_outputs = {}\n      # Shape (num_res, num_res, num_bins)\n      pae_logits = hm.Linear(\n          self.config.pae.num_bins,\n          initializer=self.global_config.final_init,\n          name='pae_logits',\n      )(hm.LayerNorm(name='pae_logits_ln')(pair_act))\n      # Shape (num_bins,)\n      pae_breaks = jnp.linspace(\n          0.0, self.config.pae.max_error_bin, self.config.pae.num_bins - 1\n      )\n      step = pae_breaks[1] - pae_breaks[0]\n      # Add half-step to get the center\n      bin_centers = pae_breaks + step / 2\n      # Add a catch-all bin at the end.\n      bin_centers = jnp.concatenate(\n          [bin_centers, bin_centers[-1:] + step], axis=0\n      )\n      pae_probs = jax.nn.softmax(pae_logits, axis=-1)\n\n      seq_mask_bool = seq_mask.astype(bool)\n      pair_mask_bool = seq_mask_bool[:, None] * seq_mask_bool[None, :]\n      pae = jnp.sum(pae_probs * bin_centers, axis=-1) * pair_mask_bool\n      pae_outputs.update({\n          'full_pae': pae,\n      })\n\n    # The pTM is computed outside of bfloat16 context.\n    tmscore_adjusted_pae_global, tmscore_adjusted_pae_interface = (\n        self._get_tmscore_adjusted_pae(\n            asym_id=asym_id,\n            seq_mask=seq_mask,\n            pair_mask=pair_mask_bool,\n            bin_centers=bin_centers,\n            pae_probs=pae_probs,\n        )\n    )\n    pae_outputs.update({\n        'tmscore_adjusted_pae_global': 
tmscore_adjusted_pae_global,\n        'tmscore_adjusted_pae_interface': tmscore_adjusted_pae_interface,\n    })\n    single_act = single_act.astype('float32')\n\n    # pLDDT\n    # Shape (num_res, num_atom, num_bins)\n    plddt_logits = hm.Linear(\n        (dense_atom_positions.shape[-2], self.config.num_plddt_bins),\n        initializer=self.global_config.final_init,\n        name='plddt_logits',\n    )(hm.LayerNorm(name='plddt_logits_ln')(single_act))\n\n    bin_width = 1.0 / self.config.num_plddt_bins\n    bin_centers = jnp.arange(0.5 * bin_width, 1.0, bin_width)\n    predicted_lddt = jnp.sum(\n        jax.nn.softmax(plddt_logits, axis=-1) * bin_centers, axis=-1\n    )\n    predicted_lddt = predicted_lddt * 100.0\n\n    # Experimentally resolved\n    # Shape (num_res, num_atom, 2)\n    experimentally_resolved_logits = hm.Linear(\n        (dense_atom_positions.shape[-2], 2),\n        initializer=self.global_config.final_init,\n        name='experimentally_resolved_logits',\n    )(hm.LayerNorm(name='experimentally_resolved_ln')(single_act))\n\n    predicted_experimentally_resolved = jax.nn.softmax(\n        experimentally_resolved_logits, axis=-1\n    )[..., 1]\n\n    return {\n        'predicted_lddt': predicted_lddt,\n        'predicted_experimentally_resolved': predicted_experimentally_resolved,\n        'full_pde': pred_distance_error,\n        'average_pde': average_pred_distance_error,\n        **pae_outputs,\n    }\n\n  def _get_tmscore_adjusted_pae(\n      self,\n      asym_id: jnp.ndarray,\n      seq_mask: jnp.ndarray,\n      pair_mask: jnp.ndarray,\n      bin_centers: jnp.ndarray,\n      pae_probs: jnp.ndarray,\n  ):\n    def get_tmscore_adjusted_pae(num_interface_tokens, bin_centers, pae_probs):\n      # Clip to avoid negative/undefined d0.\n      clipped_num_res = jnp.maximum(num_interface_tokens, 19)\n\n      # Compute d_0(num_res) as defined by TM-score, eqn. 
(5) in\n      # http://zhanglab.ccmb.med.umich.edu/papers/2004_3.pdf\n      # Yang & Skolnick \"Scoring function for automated\n      # assessment of protein structure template quality\" 2004.\n      d0 = 1.24 * (clipped_num_res - 15) ** (1.0 / 3) - 1.8\n\n      # Make compatible with [num_tokens, num_tokens, num_bins]\n      d0 = d0[:, :, None]\n      bin_centers = bin_centers[None, None, :]\n\n      # TM-Score term for every bin.\n      tm_per_bin = 1.0 / (1 + jnp.square(bin_centers) / jnp.square(d0))\n      # E_distances tm(distance).\n      predicted_tm_term = jnp.sum(pae_probs * tm_per_bin, axis=-1)\n      return predicted_tm_term\n\n    # Interface version\n    x = asym_id[None, :] == asym_id[:, None]\n    num_chain_tokens = jnp.sum(x * pair_mask, axis=-1)\n    num_interface_tokens = num_chain_tokens[None, :] + num_chain_tokens[:, None]\n    # Don't double-count within a single chain\n    num_interface_tokens -= x * (num_interface_tokens // 2)\n    num_interface_tokens = num_interface_tokens * pair_mask\n\n    num_global_tokens = jnp.full(\n        shape=pair_mask.shape, fill_value=seq_mask.sum()\n    )\n\n    assert num_global_tokens.dtype == 'int32'\n    assert num_interface_tokens.dtype == 'int32'\n    global_apae = get_tmscore_adjusted_pae(\n        num_global_tokens, bin_centers, pae_probs\n    )\n    interface_apae = get_tmscore_adjusted_pae(\n        num_interface_tokens, bin_centers, pae_probs\n    )\n    return global_apae, interface_apae\n"
  },
  {
    "path": "src/alphafold3/model/network/diffusion_head.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Diffusion Head.\"\"\"\n\nfrom collections.abc import Callable\n\nfrom alphafold3.common import base_config\nfrom alphafold3.model import feat_batch\nfrom alphafold3.model import model_config\nfrom alphafold3.model.components import haiku_modules as hm\nfrom alphafold3.model.components import utils\nfrom alphafold3.model.network import atom_cross_attention\nfrom alphafold3.model.network import diffusion_transformer\nfrom alphafold3.model.network import featurization\nfrom alphafold3.model.network import noise_level_embeddings\nimport haiku as hk\nimport jax\nimport jax.numpy as jnp\n\n\n# Carefully measured by averaging multimer training set.\nSIGMA_DATA = 16.0\n\n\ndef random_rotation(key):\n  # Create a random rotation (Gram-Schmidt orthogonalization of two\n  # random normal vectors)\n  v0, v1 = jax.random.normal(key, shape=(2, 3))\n  e0 = v0 / jnp.maximum(1e-10, jnp.linalg.norm(v0))\n  v1 = v1 - e0 * jnp.dot(v1, e0, precision=jax.lax.Precision.HIGHEST)\n  e1 = v1 / jnp.maximum(1e-10, jnp.linalg.norm(v1))\n  e2 = jnp.cross(e0, e1)\n  return jnp.stack([e0, e1, e2])\n\n\ndef random_augmentation(\n    rng_key: jnp.ndarray,\n    positions: jnp.ndarray,\n    mask: jnp.ndarray,\n) -> jnp.ndarray:\n  \"\"\"Apply random rigid augmentation.\n\n  Args:\n    rng_key: random key\n    positions: atom positions of shape (<common_axes>, 3)\n    mask: per-atom mask of shape (<common_axes>,)\n\n  Returns:\n    Transformed positions 
with the same shape as input positions.\n  \"\"\"\n  rotation_key, translation_key = jax.random.split(rng_key)\n\n  center = utils.mask_mean(\n      mask[..., None], positions, axis=(-2, -3), keepdims=True, eps=1e-6\n  )\n  rot = random_rotation(rotation_key)\n  translation = jax.random.normal(translation_key, shape=(3,))\n\n  augmented_positions = (\n      jnp.einsum(\n          '...i,ij->...j',\n          positions - center,\n          rot,\n          precision=jax.lax.Precision.HIGHEST,\n      )\n      + translation\n  )\n  return augmented_positions * mask[..., None]\n\n\ndef noise_schedule(t, smin=0.0004, smax=160.0, p=7):\n  return (\n      SIGMA_DATA\n      * (smax ** (1 / p) + t * (smin ** (1 / p) - smax ** (1 / p))) ** p\n  )\n\n\nclass ConditioningConfig(base_config.BaseConfig):\n  pair_channel: int\n  seq_channel: int\n  prob: float\n\n\nclass SampleConfig(base_config.BaseConfig):\n  steps: int\n  gamma_0: float = 0.8\n  gamma_min: float = 1.0\n  noise_scale: float = 1.003\n  step_scale: float = 1.5\n  num_samples: int = 1\n\n\nclass DiffusionHead(hk.Module):\n  \"\"\"Denoising Diffusion Head.\"\"\"\n\n  class Config(\n      atom_cross_attention.AtomCrossAttEncoderConfig,\n      atom_cross_attention.AtomCrossAttDecoderConfig,\n  ):\n    \"\"\"Configuration for DiffusionHead.\"\"\"\n\n    eval_batch_size: int = 5\n    eval_batch_dim_shard_size: int = 5\n    conditioning: ConditioningConfig = base_config.autocreate(\n        prob=0.8, pair_channel=128, seq_channel=384\n    )\n    eval: SampleConfig = base_config.autocreate(\n        num_samples=5,\n        steps=200,\n    )\n    transformer: diffusion_transformer.Transformer.Config = (\n        base_config.autocreate()\n    )\n\n  def __init__(\n      self,\n      config: Config,\n      global_config: model_config.GlobalConfig,\n      name='diffusion_head',\n  ):\n    self.config = config\n    self.global_config = global_config\n    super().__init__(name=name)\n\n  @hk.transparent\n  def _conditioning(\n   
   self,\n      batch: feat_batch.Batch,\n      embeddings: dict[str, jnp.ndarray],\n      noise_level: jnp.ndarray,\n      use_conditioning: bool,\n  ) -> tuple[jnp.ndarray, jnp.ndarray]:\n    single_embedding = use_conditioning * embeddings['single']\n    pair_embedding = use_conditioning * embeddings['pair']\n\n    rel_features = featurization.create_relative_encoding(\n        seq_features=batch.token_features,\n        max_relative_idx=32,\n        max_relative_chain=2,\n    ).astype(pair_embedding.dtype)\n    features_2d = jnp.concatenate([pair_embedding, rel_features], axis=-1)\n    pair_cond = hm.Linear(\n        self.config.conditioning.pair_channel,\n        precision='highest',\n        name='pair_cond_initial_projection',\n    )(\n        hm.LayerNorm(\n            use_fast_variance=False,\n            create_offset=False,\n            name='pair_cond_initial_norm',\n        )(features_2d)\n    )\n\n    for idx in range(2):\n      pair_cond += diffusion_transformer.transition_block(\n          pair_cond, 2, self.global_config, name=f'pair_transition_{idx}'\n      )\n\n    target_feat = embeddings['target_feat']\n    features_1d = jnp.concatenate([single_embedding, target_feat], axis=-1)\n    single_cond = hm.LayerNorm(\n        use_fast_variance=False,\n        create_offset=False,\n        name='single_cond_initial_norm',\n    )(features_1d)\n    single_cond = hm.Linear(\n        self.config.conditioning.seq_channel,\n        precision='highest',\n        name='single_cond_initial_projection',\n    )(single_cond)\n\n    noise_embedding = noise_level_embeddings.noise_embeddings(\n        sigma_scaled_noise_level=noise_level / SIGMA_DATA\n    )\n    single_cond += hm.Linear(\n        self.config.conditioning.seq_channel,\n        precision='highest',\n        name='noise_embedding_initial_projection',\n    )(\n        hm.LayerNorm(\n            use_fast_variance=False,\n            create_offset=False,\n            name='noise_embedding_initial_norm',\n  
      )(noise_embedding)\n    )\n\n    for idx in range(2):\n      single_cond += diffusion_transformer.transition_block(\n          single_cond, 2, self.global_config, name=f'single_transition_{idx}'\n      )\n\n    return single_cond, pair_cond\n\n  def __call__(\n      self,\n      # positions_noisy.shape: (num_token, max_atoms_per_token, 3)\n      positions_noisy: jnp.ndarray,\n      noise_level: jnp.ndarray,\n      batch: feat_batch.Batch,\n      embeddings: dict[str, jnp.ndarray],\n      use_conditioning: bool,\n  ) -> jnp.ndarray:\n\n    with utils.bfloat16_context():\n      # Get conditioning\n      trunk_single_cond, trunk_pair_cond = self._conditioning(\n          batch=batch,\n          embeddings=embeddings,\n          noise_level=noise_level,\n          use_conditioning=use_conditioning,\n      )\n\n      # Extract features\n      sequence_mask = batch.token_features.mask\n      atom_mask = batch.predicted_structure_info.atom_mask\n\n      # Position features\n      act = positions_noisy * atom_mask[..., None]\n      act = act / jnp.sqrt(noise_level**2 + SIGMA_DATA**2)\n\n      enc = atom_cross_attention.atom_cross_att_encoder(\n          token_atoms_act=act,\n          trunk_single_cond=embeddings['single'],\n          trunk_pair_cond=trunk_pair_cond,\n          config=self.config,\n          global_config=self.global_config,\n          batch=batch,\n          name='diffusion',\n      )\n      act = enc.token_act\n\n      # Token-token attention\n      act = jnp.asarray(act, dtype=jnp.float32)\n\n      act += hm.Linear(\n          act.shape[-1],\n          precision='highest',\n          initializer=self.global_config.final_init,\n          name='single_cond_embedding_projection',\n      )(\n          hm.LayerNorm(\n              use_fast_variance=False,\n              create_offset=False,\n              name='single_cond_embedding_norm',\n          )(trunk_single_cond)\n      )\n\n      act = jnp.asarray(act, dtype=jnp.float32)\n      
trunk_single_cond = jnp.asarray(trunk_single_cond, dtype=jnp.float32)\n      trunk_pair_cond = jnp.asarray(trunk_pair_cond, dtype=jnp.float32)\n      sequence_mask = jnp.asarray(sequence_mask, dtype=jnp.float32)\n\n      transformer = diffusion_transformer.Transformer(\n          self.config.transformer, self.global_config\n      )\n      act = transformer(\n          act=act,\n          single_cond=trunk_single_cond,\n          mask=sequence_mask,\n          pair_cond=trunk_pair_cond,\n      )\n      act = hm.LayerNorm(\n          use_fast_variance=False, create_offset=False, name='output_norm'\n      )(act)\n      # (n_tokens, per_token_channels)\n\n      # (Possibly) atom-granularity decoder\n      assert isinstance(enc, atom_cross_attention.AtomCrossAttEncoderOutput)\n      position_update = atom_cross_attention.atom_cross_att_decoder(\n          token_act=act,\n          enc=enc,\n          config=self.config,\n          global_config=self.global_config,\n          batch=batch,\n          name='diffusion',\n      )\n\n      skip_scaling = SIGMA_DATA**2 / (noise_level**2 + SIGMA_DATA**2)\n      out_scaling = (\n          noise_level * SIGMA_DATA / jnp.sqrt(noise_level**2 + SIGMA_DATA**2)\n      )\n    # End `with utils.bfloat16_context()`.\n\n    return (\n        skip_scaling * positions_noisy + out_scaling * position_update\n    ) * atom_mask[..., None]\n\n\ndef sample(\n    denoising_step: Callable[[jnp.ndarray, jnp.ndarray], jnp.ndarray],\n    batch: feat_batch.Batch,\n    key: jnp.ndarray,\n    config: SampleConfig,\n) -> dict[str, jnp.ndarray]:\n  \"\"\"Sample using denoiser on batch.\n\n  Args:\n    denoising_step: the denoising function.\n    batch: the batch\n    key: random key\n    config: config for the sampling process (e.g. number of denoising steps,\n      etc.)\n\n  Returns:\n    a dict\n      {\n         'atom_positions': jnp.array(...)       # shape (<common_axes>, 3)\n         'mask': jnp.array(...)                 
# shape (<common_axes>,)\n      }\n    where the <common_axes> are\n    (num_samples, num_tokens, max_atoms_per_token)\n  \"\"\"\n\n  mask = batch.predicted_structure_info.atom_mask\n\n  def apply_denoising_step(carry, noise_level):\n    key, positions, noise_level_prev = carry\n    key, key_noise, key_aug = jax.random.split(key, 3)\n\n    positions = random_augmentation(\n        rng_key=key_aug, positions=positions, mask=mask\n    )\n\n    gamma = config.gamma_0 * (noise_level > config.gamma_min)\n    t_hat = noise_level_prev * (1 + gamma)\n\n    noise_scale = config.noise_scale * jnp.sqrt(t_hat**2 - noise_level_prev**2)\n    noise = noise_scale * jax.random.normal(key_noise, positions.shape)\n    positions_noisy = positions + noise\n\n    positions_denoised = denoising_step(positions_noisy, t_hat)\n    grad = (positions_noisy - positions_denoised) / t_hat\n\n    d_t = noise_level - t_hat\n    positions_out = positions_noisy + config.step_scale * d_t * grad\n\n    return (key, positions_out, noise_level), positions_out\n\n  num_samples = config.num_samples\n\n  noise_levels = noise_schedule(jnp.linspace(0, 1, config.steps + 1))\n\n  key, noise_key = jax.random.split(key)\n  positions = jax.random.normal(noise_key, (num_samples,) + mask.shape + (3,))\n  positions *= noise_levels[0]\n\n  init = (\n      jax.random.split(key, num_samples),\n      positions,\n      jnp.tile(noise_levels[None, 0], (num_samples,)),\n  )\n\n  apply_denoising_step = hk.vmap(\n      apply_denoising_step, in_axes=(0, None), split_rng=(not hk.running_init())\n  )\n  result, _ = hk.scan(apply_denoising_step, init, noise_levels[1:], unroll=4)\n  _, positions_out, _ = result\n\n  final_dense_atom_mask = jnp.tile(mask[None], (num_samples, 1, 1))\n\n  return {'atom_positions': positions_out, 'mask': final_dense_atom_mask}\n"
  },
  {
    "path": "src/alphafold3/model/network/diffusion_transformer.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Diffusion transformer model.\"\"\"\n\nfrom alphafold3.common import base_config\nfrom alphafold3.model import model_config\nfrom alphafold3.model.atom_layout import atom_layout\nfrom alphafold3.model.components import haiku_modules as hm\nimport haiku as hk\nimport jax\nfrom jax import numpy as jnp\nimport tokamax\n\n\ndef adaptive_layernorm(x, single_cond, name):\n  \"\"\"Adaptive LayerNorm.\"\"\"\n  # Adopted from Scalable Diffusion Models with Transformers\n  # https://arxiv.org/abs/2212.09748\n  if single_cond is None:\n    x = hm.LayerNorm(name=f'{name}layer_norm', use_fast_variance=False)(x)\n  else:\n    x = hm.LayerNorm(\n        name=f'{name}layer_norm',\n        use_fast_variance=False,\n        create_scale=False,\n        create_offset=False,\n    )(x)\n    single_cond = hm.LayerNorm(\n        name=f'{name}single_cond_layer_norm',\n        use_fast_variance=False,\n        create_offset=False,\n    )(single_cond)\n    single_scale = hm.Linear(\n        x.shape[-1],\n        initializer='zeros',\n        use_bias=True,\n        name=f'{name}single_cond_scale',\n    )(single_cond)\n    single_bias = hm.Linear(\n        x.shape[-1], initializer='zeros', name=f'{name}single_cond_bias'\n    )(single_cond)\n    x = jax.nn.sigmoid(single_scale) * x + single_bias\n  return x\n\n\ndef adaptive_zero_init(\n    x, num_channels, single_cond, global_config: model_config.GlobalConfig, name\n):\n  \"\"\"Adaptive zero 
init, from AdaLN-zero.\"\"\"\n  if single_cond is None:\n    output = hm.Linear(\n        num_channels,\n        initializer=global_config.final_init,\n        name=f'{name}transition2',\n    )(x)\n  else:\n    output = hm.Linear(num_channels, name=f'{name}transition2')(x)\n    # Init to a small gain, sigmoid(-2) ~ 0.1\n    cond = hm.Linear(\n        output.shape[-1],\n        initializer='zeros',\n        use_bias=True,\n        bias_init=-2.0,\n        name=f'{name}adaptive_zero_cond',\n    )(single_cond)\n    output = jax.nn.sigmoid(cond) * output\n  return output\n\n\ndef transition_block(\n    x: jnp.ndarray,\n    num_intermediate_factor: int,\n    global_config: model_config.GlobalConfig,\n    single_cond: jnp.ndarray | None = None,\n    use_glu_kernel: bool = True,\n    name: str = '',\n) -> jnp.ndarray:\n  \"\"\"Transition Block.\"\"\"\n  num_channels = x.shape[-1]\n  num_intermediates = num_intermediate_factor * num_channels\n\n  x = adaptive_layernorm(x, single_cond, name=f'{name}ffw_')\n\n  if use_glu_kernel:\n    weights, _ = hm.haiku_linear_get_params(\n        x,\n        num_output=num_intermediates * 2,\n        initializer='relu',\n        name=f'{name}ffw_transition1',\n    )\n    weights = jnp.reshape(weights, (len(weights), 2, num_intermediates))\n    c = tokamax.gated_linear_unit(x=x, weights=weights, activation=jax.nn.swish)\n  else:\n    x = hm.Linear(\n        num_intermediates * 2, initializer='relu', name=f'{name}ffw_transition1'\n    )(x)\n    a, b = jnp.split(x, 2, axis=-1)\n    c = jax.nn.swish(a) * b\n\n  output = adaptive_zero_init(\n      c, num_channels, single_cond, global_config, f'{name}ffw_'\n  )\n  return output\n\n\nclass SelfAttentionConfig(base_config.BaseConfig):\n  num_head: int = 16\n  key_dim: int | None = None\n  value_dim: int | None = None\n\n\ndef self_attention(\n    x: jnp.ndarray,  # (num_tokens, ch)\n    mask: jnp.ndarray,  # (num_tokens,)\n    pair_logits: jnp.ndarray | None,  # (num_heads, num_tokens, 
num_tokens)\n    config: SelfAttentionConfig,\n    global_config: model_config.GlobalConfig,\n    single_cond: jnp.ndarray | None = None,  # (num_tokens, ch)\n    name: str = '',\n) -> jnp.ndarray:\n  \"\"\"Multihead self-attention.\"\"\"\n  assert len(mask.shape) == len(x.shape) - 1, f'{mask.shape}, {x.shape}'\n  # bias: ... x heads (1) x query (1) x key\n  bias = (1e9 * (mask - 1.0))[..., None, None, :]\n\n  x = adaptive_layernorm(x, single_cond, name=name)\n\n  num_channels = x.shape[-1]\n  # Sensible default for when the config keys are missing\n  key_dim = config.key_dim if config.key_dim is not None else num_channels\n  value_dim = config.value_dim if config.value_dim is not None else num_channels\n  num_head = config.num_head\n  assert key_dim % num_head == 0, f'{key_dim=} % {num_head=} != 0'\n  assert value_dim % num_head == 0, f'{value_dim=} % {num_head=} != 0'\n  key_dim = key_dim // num_head\n  value_dim = value_dim // num_head\n\n  qk_shape = (num_head, key_dim)\n  q = hm.Linear(qk_shape, use_bias=True, name=f'{name}q_projection')(x)\n  k = hm.Linear(qk_shape, use_bias=False, name=f'{name}k_projection')(x)\n\n  # In some situations the gradient norms can blow up without running this\n  # einsum in float32.\n  q = q.astype(jnp.float32)\n  k = k.astype(jnp.float32)\n  bias = bias.astype(jnp.float32)\n  logits = jnp.einsum('...qhc,...khc->...hqk', q * key_dim ** (-0.5), k) + bias\n  if pair_logits is not None:\n    logits += pair_logits  # (num_heads, seq_len, seq_len)\n  weights = jax.nn.softmax(logits, axis=-1)\n  weights = jnp.asarray(weights, dtype=x.dtype)\n\n  v_shape = (num_head, value_dim)\n  v = hm.Linear(v_shape, use_bias=False, name=f'{name}v_projection')(x)\n  weighted_avg = jnp.einsum('...hqk,...khc->...qhc', weights, v)\n  weighted_avg = jnp.reshape(weighted_avg, weighted_avg.shape[:-2] + (-1,))\n\n  gate_logits = hm.Linear(\n      num_head * value_dim,\n      bias_init=1.0,\n      initializer='zeros',\n      name=f'{name}gating_query',\n  
)(x)\n  weighted_avg *= jax.nn.sigmoid(gate_logits)\n\n  output = adaptive_zero_init(\n      weighted_avg, num_channels, single_cond, global_config, name\n  )\n  return output\n\n\nclass Transformer(hk.Module):\n  \"\"\"Simple transformer stack.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    attention: SelfAttentionConfig = base_config.autocreate()\n    num_blocks: int = 24\n    block_remat: bool = False\n    super_block_size: int = 4\n    num_intermediate_factor: int = 2\n\n  def __init__(\n      self,\n      config: Config,\n      global_config: model_config.GlobalConfig,\n      name: str = 'transformer',\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def __call__(\n      self,\n      act: jnp.ndarray,\n      mask: jnp.ndarray,\n      single_cond: jnp.ndarray,\n      pair_cond: jnp.ndarray | None,\n  ) -> jnp.ndarray:\n    def block(act, pair_logits):\n      act += self_attention(\n          act,\n          mask,\n          pair_logits,\n          self.config.attention,\n          self.global_config,\n          single_cond,\n          name=self.name,\n      )\n      act += transition_block(\n          act,\n          self.config.num_intermediate_factor,\n          self.global_config,\n          single_cond,\n          name=self.name,\n      )\n      return act, None\n\n    # Precompute pair logits for performance\n    if pair_cond is None:\n      pair_act = None\n    else:\n      pair_act = hm.LayerNorm(\n          name='pair_input_layer_norm',\n          use_fast_variance=False,\n          create_offset=False,\n      )(pair_cond)\n\n    assert self.config.num_blocks % self.config.super_block_size == 0\n    num_super_blocks = self.config.num_blocks // self.config.super_block_size\n\n    def super_block(act):\n      if pair_act is None:\n        pair_logits = None\n      else:\n        pair_logits = hm.Linear(\n            (self.config.super_block_size, self.config.attention.num_head),\n         
   name='pair_logits_projection',\n        )(pair_act)\n        pair_logits = jnp.transpose(pair_logits, [2, 3, 0, 1])\n      return hk.experimental.layer_stack(\n          self.config.super_block_size, with_per_layer_inputs=True\n      )(block)(act, pair_logits)\n\n    return hk.experimental.layer_stack(\n        num_super_blocks, with_per_layer_inputs=True\n    )(super_block)(act)[0]\n\n\nclass CrossAttentionConfig(base_config.BaseConfig):\n  num_head: int = 4\n  key_dim: int = 128\n  value_dim: int = 128\n\n\ndef cross_attention(\n    x_q: jnp.ndarray,  # (..., Q, C)\n    x_k: jnp.ndarray,  # (..., K, C)\n    mask_q: jnp.ndarray,  # (..., Q)\n    mask_k: jnp.ndarray,  # (..., K)\n    config: CrossAttentionConfig,\n    global_config: model_config.GlobalConfig,\n    pair_logits: jnp.ndarray | None = None,  # (..., Q, K)\n    single_cond_q: jnp.ndarray | None = None,  # (..., Q, C)\n    single_cond_k: jnp.ndarray | None = None,  # (..., K, C)\n    name: str = '',\n) -> jnp.ndarray:\n  \"\"\"Multihead cross-attention.\"\"\"\n  assert len(mask_q.shape) == len(x_q.shape) - 1, f'{mask_q.shape}, {x_q.shape}'\n  assert len(mask_k.shape) == len(x_k.shape) - 1, f'{mask_k.shape}, {x_k.shape}'\n  # bias: ... 
x heads (1) x query x key\n  bias = (\n      1e9\n      * (mask_q - 1.0)[..., None, :, None]\n      * (mask_k - 1.0)[..., None, None, :]\n  )\n\n  x_q = adaptive_layernorm(x_q, single_cond_q, name=f'{name}q')\n  x_k = adaptive_layernorm(x_k, single_cond_k, name=f'{name}k')\n\n  assert config.key_dim % config.num_head == 0\n  assert config.value_dim % config.num_head == 0\n  key_dim = config.key_dim // config.num_head\n  value_dim = config.value_dim // config.num_head\n\n  q = hm.Linear(\n      (config.num_head, key_dim), use_bias=True, name=f'{name}q_projection'\n  )(x_q)\n  k = hm.Linear(\n      (config.num_head, key_dim), use_bias=False, name=f'{name}k_projection'\n  )(x_k)\n\n  # In some situations the gradient norms can blow up without running this\n  # einsum in float32.\n  q = q.astype(jnp.float32)\n  k = k.astype(jnp.float32)\n  bias = bias.astype(jnp.float32)\n  logits = jnp.einsum('...qhc,...khc->...hqk', q * key_dim ** (-0.5), k) + bias\n  if pair_logits is not None:\n    logits += pair_logits\n  weights = jax.nn.softmax(logits, axis=-1)\n  weights = jnp.asarray(weights, dtype=x_q.dtype)\n\n  v = hm.Linear(\n      (config.num_head, value_dim), use_bias=False, name=f'{name}v_projection'\n  )(x_k)\n  weighted_avg = jnp.einsum('...hqk,...khc->...qhc', weights, v)\n  weighted_avg = jnp.reshape(weighted_avg, weighted_avg.shape[:-2] + (-1,))\n\n  gate_logits = hm.Linear(\n      config.num_head * value_dim,\n      bias_init=1.0,\n      initializer='zeros',\n      name=f'{name}gating_query',\n  )(x_q)\n  weighted_avg *= jax.nn.sigmoid(gate_logits)\n\n  output = adaptive_zero_init(\n      weighted_avg, x_q.shape[-1], single_cond_q, global_config, name\n  )\n  return output\n\n\nclass CrossAttTransformer(hk.Module):\n  \"\"\"Transformer that applies cross attention between two sets of subsets.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    num_intermediate_factor: int\n    num_blocks: int\n    attention: CrossAttentionConfig = base_config.autocreate()\n\n  
def __init__(\n      self,\n      config: Config,\n      global_config: model_config.GlobalConfig,\n      name: str = 'transformer',\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def __call__(\n      self,\n      queries_act: jnp.ndarray,  # (num_subsets, num_queries, ch)\n      queries_mask: jnp.ndarray,  # (num_subsets, num_queries)\n      queries_to_keys: atom_layout.GatherInfo,  # (num_subsets, num_keys)\n      keys_mask: jnp.ndarray,  # (num_subsets, num_keys)\n      queries_single_cond: jnp.ndarray,  # (num_subsets, num_queries, ch)\n      keys_single_cond: jnp.ndarray,  # (num_subsets, num_keys, ch)\n      pair_cond: jnp.ndarray,  # (num_subsets, num_queries, num_keys, ch)\n  ) -> jnp.ndarray:\n    def block(queries_act, pair_logits):\n      # copy the queries activations to the keys layout\n      keys_act = atom_layout.convert(\n          queries_to_keys, queries_act, layout_axes=(-3, -2)\n      )\n      # cross attention\n      queries_act += cross_attention(\n          x_q=queries_act,\n          x_k=keys_act,\n          mask_q=queries_mask,\n          mask_k=keys_mask,\n          config=self.config.attention,\n          global_config=self.global_config,\n          pair_logits=pair_logits,\n          single_cond_q=queries_single_cond,\n          single_cond_k=keys_single_cond,\n          name=self.name,\n      )\n      queries_act += transition_block(\n          queries_act,\n          self.config.num_intermediate_factor,\n          self.global_config,\n          queries_single_cond,\n          name=self.name,\n      )\n      return queries_act, None\n\n    # Precompute pair logits for performance\n    pair_act = hm.LayerNorm(\n        name='pair_input_layer_norm',\n        use_fast_variance=False,\n        create_offset=False,\n    )(pair_cond)\n    # (num_subsets, num_queries, num_keys, num_blocks, num_heads)\n    pair_logits = hm.Linear(\n        (self.config.num_blocks, 
self.config.attention.num_head),\n        name='pair_logits_projection',\n    )(pair_act)\n    # (num_block, num_subsets, num_heads, num_queries, num_keys)\n    pair_logits = jnp.transpose(pair_logits, [3, 0, 4, 1, 2])\n\n    return hk.experimental.layer_stack(\n        self.config.num_blocks, with_per_layer_inputs=True\n    )(block)(queries_act, pair_logits)[0]\n"
  },
  {
    "path": "src/alphafold3/model/network/distogram_head.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Distogram head.\"\"\"\n\nfrom typing import Final\n\nfrom alphafold3.common import base_config\nfrom alphafold3.model import feat_batch\nfrom alphafold3.model import model_config\nfrom alphafold3.model.components import haiku_modules as hm\nimport haiku as hk\nimport jax\nimport jax.numpy as jnp\n\n\n_CONTACT_THRESHOLD: Final[float] = 8.0\n_CONTACT_EPSILON: Final[float] = 1e-3\n\n\nclass DistogramHead(hk.Module):\n  \"\"\"Distogram head.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    first_break: float = 2.3125\n    last_break: float = 21.6875\n    num_bins: int = 64\n\n  def __init__(\n      self,\n      config: Config,\n      global_config: model_config.GlobalConfig,\n      name='distogram_head',\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def __call__(\n      self,\n      batch: feat_batch.Batch,\n      embeddings: dict[str, jnp.ndarray],\n      return_distogram: bool = False,\n  ) -> dict[str, jnp.ndarray]:\n    pair_act = embeddings['pair']\n    seq_mask = batch.token_features.mask.astype(bool)\n    pair_mask = seq_mask[:, None] * seq_mask[None, :]\n\n    left_half_logits = hm.Linear(\n        self.config.num_bins,\n        initializer=self.global_config.final_init,\n        name='half_logits',\n    )(pair_act)\n\n    right_half_logits = left_half_logits\n    logits = left_half_logits + jnp.swapaxes(right_half_logits, -2, -3)\n    probs = 
jax.nn.softmax(logits, axis=-1)\n    breaks = jnp.linspace(\n        self.config.first_break,\n        self.config.last_break,\n        self.config.num_bins - 1,\n    )\n\n    bin_tops = jnp.append(breaks, breaks[-1] + (breaks[-1] - breaks[-2]))\n    threshold = _CONTACT_THRESHOLD + _CONTACT_EPSILON\n    is_contact_bin = 1.0 * (bin_tops <= threshold)\n    contact_probs = jnp.einsum(\n        'ijk,k->ij', probs, is_contact_bin, precision=jax.lax.Precision.HIGHEST\n    )\n    contact_probs = pair_mask * contact_probs\n\n    return_dict = {'bin_edges': breaks, 'contact_probs': contact_probs}\n    if return_distogram:\n      return_dict['distogram'] = logits\n\n    return return_dict\n"
  },
  {
    "path": "src/alphafold3/model/network/evoformer.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Evoformer network.\"\"\"\n\nimport functools\n\nfrom alphafold3.common import base_config\nfrom alphafold3.model import feat_batch\nfrom alphafold3.model import features\nfrom alphafold3.model import model_config\nfrom alphafold3.model.components import haiku_modules as hm\nfrom alphafold3.model.components import utils\nfrom alphafold3.model.network import atom_cross_attention\nfrom alphafold3.model.network import featurization\nfrom alphafold3.model.network import modules\nfrom alphafold3.model.network import template_modules\nimport haiku as hk\nimport jax\nimport jax.numpy as jnp\n\n\nclass Evoformer(hk.Module):\n  \"\"\"Creates 'single' and 'pair' embeddings.\"\"\"\n\n  class PairformerConfig(modules.PairFormerIteration.Config):  # pytype: disable=invalid-function-definition\n    block_remat: bool = False\n    remat_block_size: int = 8\n\n  class Config(base_config.BaseConfig):\n    \"\"\"Configuration for Evoformer.\"\"\"\n\n    max_relative_chain: int = 2\n    msa_channel: int = 64\n    seq_channel: int = 384\n    max_relative_idx: int = 32\n    num_msa: int = 1024\n    pair_channel: int = 128\n    pairformer: 'Evoformer.PairformerConfig' = base_config.autocreate(\n        single_transition=base_config.autocreate(),\n        single_attention=base_config.autocreate(),\n        num_layer=48,\n    )\n    per_atom_conditioning: atom_cross_attention.AtomCrossAttEncoderConfig = (\n        base_config.autocreate(\n      
      per_token_channels=384,\n            per_atom_channels=128,\n            atom_transformer=base_config.autocreate(\n                num_intermediate_factor=2,\n                num_blocks=3,\n            ),\n            per_atom_pair_channels=16,\n        )\n    )\n    template: template_modules.TemplateEmbedding.Config = (\n        base_config.autocreate()\n    )\n    msa_stack: modules.EvoformerIteration.Config = base_config.autocreate()\n\n  def __init__(\n      self,\n      config: Config,\n      global_config: model_config.GlobalConfig,\n      name='evoformer',\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def _relative_encoding(\n      self, batch: feat_batch.Batch, pair_activations: jnp.ndarray\n  ) -> jnp.ndarray:\n    \"\"\"Add relative position encodings.\"\"\"\n    rel_feat = featurization.create_relative_encoding(\n        seq_features=batch.token_features,\n        max_relative_idx=self.config.max_relative_idx,\n        max_relative_chain=self.config.max_relative_chain,\n    )\n    rel_feat = rel_feat.astype(pair_activations.dtype)\n\n    pair_activations += hm.Linear(\n        self.config.pair_channel, name='position_activations'\n    )(rel_feat)\n    return pair_activations\n\n  @hk.transparent\n  def _seq_pair_embedding(\n      self,\n      token_features: features.TokenFeatures,\n      target_feat: jnp.ndarray,\n  ) -> tuple[jnp.ndarray, jnp.ndarray]:\n    \"\"\"Generated Pair embedding from sequence.\"\"\"\n    left_single = hm.Linear(self.config.pair_channel, name='left_single')(\n        target_feat\n    )[:, None]\n    right_single = hm.Linear(self.config.pair_channel, name='right_single')(\n        target_feat\n    )[None]\n    dtype = left_single.dtype\n    pair_activations = left_single + right_single\n    num_residues = pair_activations.shape[0]\n    assert pair_activations.shape == (\n        num_residues,\n        num_residues,\n        self.config.pair_channel,\n    )\n  
  mask = token_features.mask\n    pair_mask = (mask[:, None] * mask[None, :]).astype(dtype)\n    assert pair_mask.shape == (num_residues, num_residues)\n    return pair_activations, pair_mask  # pytype: disable=bad-return-type  # jax-ndarray\n\n  @hk.transparent\n  def _embed_bonds(\n      self,\n      batch: feat_batch.Batch,\n      pair_activations: jnp.ndarray,\n  ) -> jnp.ndarray:\n    \"\"\"Embeds bond features and merges into pair activations.\"\"\"\n    # Construct contact matrix.\n    num_tokens = batch.token_features.token_index.shape[0]\n    contact_matrix = jnp.zeros((num_tokens, num_tokens))\n\n    tokens_to_polymer_ligand_bonds = (\n        batch.polymer_ligand_bond_info.tokens_to_polymer_ligand_bonds\n    )\n    gather_idxs_polymer_ligand = tokens_to_polymer_ligand_bonds.gather_idxs\n    gather_mask_polymer_ligand = (\n        tokens_to_polymer_ligand_bonds.gather_mask.prod(axis=1).astype(\n            gather_idxs_polymer_ligand.dtype\n        )[:, None]\n    )\n    # If valid mask then it will be all 1's, so idxs should be unchanged.\n    gather_idxs_polymer_ligand = (\n        gather_idxs_polymer_ligand * gather_mask_polymer_ligand\n    )\n\n    tokens_to_ligand_ligand_bonds = (\n        batch.ligand_ligand_bond_info.tokens_to_ligand_ligand_bonds\n    )\n    gather_idxs_ligand_ligand = tokens_to_ligand_ligand_bonds.gather_idxs\n    gather_mask_ligand_ligand = tokens_to_ligand_ligand_bonds.gather_mask.prod(\n        axis=1\n    ).astype(gather_idxs_ligand_ligand.dtype)[:, None]\n    gather_idxs_ligand_ligand = (\n        gather_idxs_ligand_ligand * gather_mask_ligand_ligand\n    )\n\n    gather_idxs = jnp.concatenate(\n        [gather_idxs_polymer_ligand, gather_idxs_ligand_ligand]\n    )\n    contact_matrix = contact_matrix.at[\n        gather_idxs[:, 0], gather_idxs[:, 1]\n    ].set(1.0)\n\n    # Because all the padded index's are 0's.\n    contact_matrix = contact_matrix.at[0, 0].set(0.0)\n\n    bonds_act = hm.Linear(self.config.pair_channel, 
name='bond_embedding')(\n        contact_matrix[:, :, None].astype(pair_activations.dtype)\n    )\n    return pair_activations + bonds_act\n\n  @hk.transparent\n  def _embed_template_pair(\n      self,\n      batch: feat_batch.Batch,\n      pair_activations: jnp.ndarray,\n      pair_mask: jnp.ndarray,\n      key: jnp.ndarray,\n  ) -> tuple[jnp.ndarray, jnp.ndarray]:\n    \"\"\"Embeds Templates and merges into pair activations.\"\"\"\n    dtype = pair_activations.dtype\n    key, subkey = jax.random.split(key)\n    template_module = template_modules.TemplateEmbedding(\n        self.config.template, self.global_config\n    )\n    templates = batch.templates\n    asym_id = batch.token_features.asym_id\n    # Construct a mask such that only intra-chain template features are\n    # computed, since all templates are for each chain individually.\n    multichain_mask = (asym_id[:, None] == asym_id[None, :]).astype(dtype)\n\n    template_fn = functools.partial(template_module, key=subkey)\n    template_act = template_fn(\n        query_embedding=pair_activations,\n        templates=templates,\n        multichain_mask_2d=multichain_mask,\n        padding_mask_2d=pair_mask,\n    )\n    return pair_activations + template_act, key\n\n  @hk.transparent\n  def _embed_process_msa(\n      self,\n      msa_batch: features.MSA,\n      pair_activations: jnp.ndarray,\n      pair_mask: jnp.ndarray,\n      key: jnp.ndarray,\n      target_feat: jnp.ndarray,\n  ) -> tuple[jnp.ndarray, jnp.ndarray]:\n    \"\"\"Processes MSA and returns updated pair activations.\"\"\"\n    dtype = pair_activations.dtype\n    msa_batch, key = featurization.shuffle_msa(key, msa_batch)\n    msa_batch = featurization.truncate_msa_batch(msa_batch, self.config.num_msa)\n    msa_feat = featurization.create_msa_feat(msa_batch).astype(dtype)\n\n    msa_activations = hm.Linear(\n        self.config.msa_channel, name='msa_activations'\n    )(msa_feat)\n\n    msa_activations += hm.Linear(\n        
self.config.msa_channel, name='extra_msa_target_feat'\n    )(target_feat)[None]\n    msa_mask = msa_batch.mask.astype(dtype)\n\n    # Evoformer MSA stack.\n    evoformer_input = {'msa': msa_activations, 'pair': pair_activations}\n    masks = {'msa': msa_mask, 'pair': pair_mask}\n\n    def evoformer_fn(x):\n      return modules.EvoformerIteration(\n          self.config.msa_stack, self.global_config, name='msa_stack'\n      )(\n          activations=x,\n          masks=masks,\n      )\n\n    evoformer_stack = hk.experimental.layer_stack(\n        self.config.msa_stack.num_layer\n    )(evoformer_fn)\n\n    evoformer_output = evoformer_stack(evoformer_input)\n\n    return evoformer_output['pair'], key\n\n  def __call__(\n      self,\n      batch: feat_batch.Batch,\n      prev: dict[str, jnp.ndarray],\n      target_feat: jnp.ndarray,\n      key: jnp.ndarray,\n  ) -> dict[str, jnp.ndarray]:\n\n    assert self.global_config.bfloat16 in {'all', 'none'}\n\n    num_residues = target_feat.shape[0]\n    assert batch.token_features.aatype.shape == (num_residues,)\n\n    dtype = (\n        jnp.bfloat16 if self.global_config.bfloat16 == 'all' else jnp.float32\n    )\n\n    with utils.bfloat16_context():\n      pair_activations, pair_mask = self._seq_pair_embedding(\n          batch.token_features, target_feat\n      )\n\n      pair_activations += hm.Linear(\n          pair_activations.shape[-1],\n          name='prev_embedding',\n          initializer=self.global_config.final_init,\n      )(\n          hm.LayerNorm(name='prev_embedding_layer_norm')(\n              prev['pair'].astype(pair_activations.dtype)\n          )\n      )\n\n      pair_activations = self._relative_encoding(batch, pair_activations)\n\n      pair_activations = self._embed_bonds(\n          batch=batch, pair_activations=pair_activations\n      )\n\n      pair_activations, key = self._embed_template_pair(\n          batch=batch,\n          pair_activations=pair_activations,\n          pair_mask=pair_mask,\n   
       key=key,\n      )\n      pair_activations, key = self._embed_process_msa(\n          msa_batch=batch.msa,\n          pair_activations=pair_activations,\n          pair_mask=pair_mask,\n          key=key,\n          target_feat=target_feat,\n      )\n      del key  # Unused after this point.\n\n      single_activations = hm.Linear(\n          self.config.seq_channel, name='single_activations'\n      )(target_feat)\n\n      single_activations += hm.Linear(\n          single_activations.shape[-1],\n          name='prev_single_embedding',\n          initializer=self.global_config.final_init,\n      )(\n          hm.LayerNorm(name='prev_single_embedding_layer_norm')(\n              prev['single'].astype(single_activations.dtype)\n          )\n      )\n\n      def pairformer_fn(x):\n        pairformer_iteration = modules.PairFormerIteration(\n            self.config.pairformer,\n            self.global_config,\n            with_single=True,\n            name='trunk_pairformer',\n        )\n        pair_act, single_act = x\n        return pairformer_iteration(\n            act=pair_act,\n            single_act=single_act,\n            pair_mask=pair_mask,\n            seq_mask=batch.token_features.mask.astype(dtype),\n        )\n\n      pairformer_stack = hk.experimental.layer_stack(\n          self.config.pairformer.num_layer\n      )(pairformer_fn)\n\n      pair_activations, single_activations = pairformer_stack(\n          (pair_activations, single_activations)\n      )\n\n      assert pair_activations.shape == (\n          num_residues,\n          num_residues,\n          self.config.pair_channel,\n      )\n      assert single_activations.shape == (num_residues, self.config.seq_channel)\n      assert len(target_feat.shape) == 2\n      assert target_feat.shape[0] == num_residues\n      output = {\n          'single': single_activations,\n          'pair': pair_activations,\n          'target_feat': target_feat,\n      }\n\n    return output\n"
  },
  {
    "path": "src/alphafold3/model/network/featurization.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Model-side of the input features processing.\"\"\"\n\nimport functools\n\nfrom alphafold3.constants import residue_names\nfrom alphafold3.model import feat_batch\nfrom alphafold3.model import features\nfrom alphafold3.model.components import utils\nimport jax\nimport jax.numpy as jnp\n\n\ndef _grid_keys(key, shape):\n  \"\"\"Generate a grid of rng keys that is consistent with different padding.\n\n  Generate random keys such that the keys will be identical, regardless of\n  how much padding is added to any dimension.\n\n  Args:\n    key: A PRNG key.\n    shape: The shape of the output array of keys that will be generated.\n\n  Returns:\n    An array of shape `shape` consisting of random keys.\n  \"\"\"\n  if not shape:\n    return key\n  new_keys = jax.vmap(functools.partial(jax.random.fold_in, key))(\n      jnp.arange(shape[0])\n  )\n  return jax.vmap(functools.partial(_grid_keys, shape=shape[1:]))(new_keys)\n\n\ndef _padding_consistent_rng(f):\n  \"\"\"Modify any element-wise random function to be consistent with padding.\n\n  Normally if you take a function like jax.random.normal and generate an array,\n  say of size (10,10), you will get a different set of random numbers to if you\n  add padding and take the first (10,10) sub-array.\n\n  This function makes a random function that is consistent regardless of the\n  amount of padding added.\n\n  Note: The padding-consistent function is likely to be slower to compile 
and\n  run than the function it is wrapping, but these slowdowns are likely to be\n  negligible in a large network.\n\n  Args:\n    f: Any element-wise function that takes (PRNG key, shape) as the first 2\n      arguments.\n\n  Returns:\n    An equivalent function to f, that is now consistent for different amounts of\n    padding.\n  \"\"\"\n\n  def inner(key, shape, **kwargs):\n    keys = _grid_keys(key, shape)\n    signature = (\n        '()->()'\n        if jax.dtypes.issubdtype(keys.dtype, jax.dtypes.prng_key)\n        else '(2)->()'\n    )\n    return jnp.vectorize(\n        functools.partial(f, shape=(), **kwargs), signature=signature\n    )(keys)\n\n  return inner\n\n\ndef gumbel_argsort_sample_idx(\n    key: jnp.ndarray, logits: jnp.ndarray\n) -> jnp.ndarray:\n  \"\"\"Samples without replacement from a distribution given by 'logits'.\n\n  This uses the Gumbel trick to implement the sampling in an efficient manner.\n  For a distribution over k items this samples k times without replacement, so\n  this is effectively sampling a random permutation with probabilities over the\n  permutations derived from the logprobs.\n\n  Args:\n    key: prng key\n    logits: logarithm of probabilities to sample from, probabilities can be\n      unnormalized.\n\n  Returns:\n    The sampled permutation as an array of integer indices.\n  \"\"\"\n  gumbel = _padding_consistent_rng(jax.random.gumbel)\n  z = gumbel(key, logits.shape)\n  # This construction is equivalent to jnp.argsort, but using a non-stable sort,\n  # since stable sorts aren't supported by jax2tf\n  axis = len(logits.shape) - 1\n  iota = jax.lax.broadcasted_iota(jnp.int64, logits.shape, axis)\n  _, perm = jax.lax.sort_key_val(\n      logits + z, iota, dimension=-1, is_stable=False\n  )\n  return perm[::-1]\n\n\ndef create_msa_feat(msa: features.MSA) -> jax.Array:\n  \"\"\"Create and concatenate MSA features.\"\"\"\n  msa_1hot = jax.nn.one_hot(\n      msa.rows, residue_names.POLYMER_TYPES_NUM_WITH_UNKNOWN_AND_GAP + 1\n  )\n  deletion_matrix 
= msa.deletion_matrix\n  has_deletion = jnp.clip(deletion_matrix, 0.0, 1.0)[..., None]\n  deletion_value = (jnp.arctan(deletion_matrix / 3.0) * (2.0 / jnp.pi))[\n      ..., None\n  ]\n\n  msa_feat = [\n      msa_1hot,\n      has_deletion,\n      deletion_value,\n  ]\n\n  return jnp.concatenate(msa_feat, axis=-1)\n\n\ndef truncate_msa_batch(msa: features.MSA, num_msa: int) -> features.MSA:\n  indices = jnp.arange(num_msa)\n  return msa.index_msa_rows(indices)\n\n\ndef create_target_feat(\n    batch: feat_batch.Batch,\n    append_per_atom_features: bool,\n) -> jax.Array:\n  \"\"\"Make target feat.\"\"\"\n  token_features = batch.token_features\n  target_features = []\n  target_features.append(\n      jax.nn.one_hot(\n          token_features.aatype,\n          residue_names.POLYMER_TYPES_NUM_WITH_UNKNOWN_AND_GAP,\n      )\n  )\n  target_features.append(batch.msa.profile)\n  target_features.append(batch.msa.deletion_mean[..., None])\n\n  # Reference structure features\n  if append_per_atom_features:\n    ref_mask = batch.ref_structure.mask\n    element_feat = jax.nn.one_hot(batch.ref_structure.element, 128)\n    element_feat = utils.mask_mean(\n        mask=ref_mask[..., None], value=element_feat, axis=-2, eps=1e-6\n    )\n    target_features.append(element_feat)\n    pos_feat = batch.ref_structure.positions\n    pos_feat = pos_feat.reshape([pos_feat.shape[0], -1])\n    target_features.append(pos_feat)\n    target_features.append(ref_mask)\n\n  return jnp.concatenate(target_features, axis=-1)\n\n\ndef create_relative_encoding(\n    seq_features: features.TokenFeatures,\n    max_relative_idx: int,\n    max_relative_chain: int,\n) -> jax.Array:\n  \"\"\"Add relative position encodings.\"\"\"\n  rel_feats = []\n  token_index = seq_features.token_index\n  residue_index = seq_features.residue_index\n  asym_id = seq_features.asym_id\n  entity_id = seq_features.entity_id\n  sym_id = seq_features.sym_id\n\n  left_asym_id = asym_id[:, None]\n  right_asym_id = asym_id[None, 
:]\n\n  left_residue_index = residue_index[:, None]\n  right_residue_index = residue_index[None, :]\n\n  left_token_index = token_index[:, None]\n  right_token_index = token_index[None, :]\n\n  left_entity_id = entity_id[:, None]\n  right_entity_id = entity_id[None, :]\n\n  left_sym_id = sym_id[:, None]\n  right_sym_id = sym_id[None, :]\n\n  # Embed relative positions using a one-hot embedding of distance along chain\n  offset = left_residue_index - right_residue_index\n  clipped_offset = jnp.clip(\n      offset + max_relative_idx, min=0, max=2 * max_relative_idx\n  )\n  asym_id_same = left_asym_id == right_asym_id\n  final_offset = jnp.where(\n      asym_id_same,\n      clipped_offset,\n      (2 * max_relative_idx + 1) * jnp.ones_like(clipped_offset),\n  )\n  rel_pos = jax.nn.one_hot(final_offset, 2 * max_relative_idx + 2)\n  rel_feats.append(rel_pos)\n\n  # Embed relative token index as a one-hot embedding of distance along residue\n  token_offset = left_token_index - right_token_index\n  clipped_token_offset = jnp.clip(\n      token_offset + max_relative_idx, min=0, max=2 * max_relative_idx\n  )\n  residue_same = (left_asym_id == right_asym_id) & (\n      left_residue_index == right_residue_index\n  )\n  final_token_offset = jnp.where(\n      residue_same,\n      clipped_token_offset,\n      (2 * max_relative_idx + 1) * jnp.ones_like(clipped_token_offset),\n  )\n  rel_token = jax.nn.one_hot(final_token_offset, 2 * max_relative_idx + 2)\n  rel_feats.append(rel_token)\n\n  # Embed same entity ID\n  entity_id_same = left_entity_id == right_entity_id\n  rel_feats.append(entity_id_same.astype(rel_pos.dtype)[..., None])\n\n  # Embed relative chain ID inside each symmetry class\n  rel_sym_id = left_sym_id - right_sym_id\n\n  max_rel_chain = max_relative_chain\n\n  clipped_rel_chain = jnp.clip(\n      rel_sym_id + max_rel_chain, min=0, max=2 * max_rel_chain\n  )\n\n  final_rel_chain = jnp.where(\n      entity_id_same,\n      clipped_rel_chain,\n      (2 * max_rel_chain 
+ 1) * jnp.ones_like(clipped_rel_chain),\n  )\n  rel_chain = jax.nn.one_hot(final_rel_chain, 2 * max_relative_chain + 2)\n\n  rel_feats.append(rel_chain)\n\n  return jnp.concatenate(rel_feats, axis=-1)\n\n\ndef shuffle_msa(\n    key: jax.Array, msa: features.MSA\n) -> tuple[features.MSA, jax.Array]:\n  \"\"\"Shuffle MSA randomly, return batch with shuffled MSA.\n\n  Args:\n    key: rng key for random number generation.\n    msa: MSA object to sample msa from.\n\n  Returns:\n    A tuple of the MSA with its rows reordered by the sampled index order and\n    the new rng key produced by splitting the input key.\n  \"\"\"\n  key, sample_key = jax.random.split(key)\n  # Sample uniformly among sequences with at least one non-masked position.\n  logits = (jnp.clip(jnp.sum(msa.mask, axis=-1), 0.0, 1.0) - 1.0) * 1e6\n  index_order = gumbel_argsort_sample_idx(sample_key, logits)\n\n  return msa.index_msa_rows(index_order), key\n"
  },
  {
    "path": "src/alphafold3/model/network/modules.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Haiku modules for the Diffuser model.\"\"\"\n\nfrom collections.abc import Sequence\nfrom typing import Literal\n\nfrom alphafold3.common import base_config\nfrom alphafold3.model import model_config\nfrom alphafold3.model.components import haiku_modules as hm\nfrom alphafold3.model.components import mapping\nfrom alphafold3.model.network import diffusion_transformer\nimport haiku as hk\nimport jax\nimport jax.numpy as jnp\nimport tokamax\n\n\ndef get_shard_size(\n    num_residues: int, shard_spec: Sequence[tuple[int | None, int | None]]\n) -> int | None:\n  shard_size = shard_spec[0][-1]\n  for num_residues_upper_bound, num_residues_shard_size in shard_spec:\n    shard_size = num_residues_shard_size\n    if (\n        num_residues_upper_bound is None\n        or num_residues <= num_residues_upper_bound\n    ):\n      break\n  return shard_size\n\n\nclass TransitionBlock(hk.Module):\n  \"\"\"Transition block for transformer.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    num_intermediate_factor: int = 4\n    use_glu_kernel: bool = True\n\n  def __init__(\n      self, config: Config, global_config: model_config.GlobalConfig, *, name\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def __call__(self, act, broadcast_dim=0):\n    num_channels = act.shape[-1]\n\n    num_intermediate = int(num_channels * self.config.num_intermediate_factor)\n\n    act = 
hm.LayerNorm(name='input_layer_norm')(act)\n\n    if self.config.use_glu_kernel:\n      weights, _ = hm.haiku_linear_get_params(\n          act,\n          num_output=num_intermediate * 2,\n          initializer='relu',\n          name='transition1',\n      )\n      weights = jnp.reshape(weights, (len(weights), 2, num_intermediate))\n      c = tokamax.gated_linear_unit(\n          x=act, weights=weights, activation=jax.nn.swish\n      )\n    else:\n      act = hm.Linear(\n          num_intermediate * 2, initializer='relu', name='transition1'\n      )(act)\n      a, b = jnp.split(act, 2, axis=-1)\n      c = jax.nn.swish(a) * b\n\n    return hm.Linear(\n        num_channels,\n        initializer=self.global_config.final_init,\n        name='transition2',\n    )(c)\n\n\nclass MSAAttention(hk.Module):\n  \"\"\"MSA Attention.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    num_head: int = 8\n\n  def __init__(\n      self, config: Config, global_config: model_config.GlobalConfig, *, name\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def __call__(self, act, mask, pair_act):\n    act = hm.LayerNorm(name='act_norm')(act)\n    pair_act = hm.LayerNorm(name='pair_norm')(pair_act)\n    logits = hm.Linear(\n        self.config.num_head, use_bias=False, name='pair_logits'\n    )(pair_act)\n    logits = jnp.transpose(logits, [2, 0, 1])\n    logits += 1e9 * (jnp.max(mask, axis=0) - 1.0)\n    weights = jax.nn.softmax(logits, axis=-1)\n    num_channels = act.shape[-1]\n    value_dim = num_channels // self.config.num_head\n    v = hm.Linear(\n        [self.config.num_head, value_dim], use_bias=False, name='v_projection'\n    )(act)\n    v_avg = jnp.einsum('hqk, bkhc -> bqhc', weights, v)\n    v_avg = jnp.reshape(v_avg, v_avg.shape[:-2] + (-1,))\n    gate_values = hm.Linear(\n        self.config.num_head * value_dim,\n        bias_init=1.0,\n        initializer='zeros',\n        name='gating_query',\n    )(act)\n    
v_avg *= jax.nn.sigmoid(gate_values)\n\n    return hm.Linear(\n        num_channels,\n        initializer=self.global_config.final_init,\n        name='output_projection',\n    )(v_avg)\n\n\nclass GridSelfAttention(hk.Module):\n  \"\"\"Self attention that is either per-sequence or per-residue.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    num_head: int = 4\n\n  def __init__(\n      self,\n      config: Config,\n      global_config: model_config.GlobalConfig,\n      transpose: bool,\n      *,\n      name: str,\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n    self.transpose = transpose\n\n  @hk.transparent\n  def _attention(\n      self,\n      act,\n      mask,\n      bias,\n  ):\n    num_channels = act.shape[-1]\n    assert num_channels % self.config.num_head == 0\n    # Triton requires a minimum dimension of 16 for doing matmul.\n    qkv_dim = max(num_channels // self.config.num_head, 16)\n\n    qkv_shape = (self.config.num_head, qkv_dim)\n    q = hm.Linear(\n        qkv_shape, use_bias=False, name='q_projection', transpose_weights=True\n    )(act)\n    k = hm.Linear(\n        qkv_shape, use_bias=False, name='k_projection', transpose_weights=True\n    )(act)\n    v = hm.Linear(qkv_shape, use_bias=False, name='v_projection')(act)\n\n    # Dot product attention requires the bias term to have a batch dimension.\n    bias = jnp.expand_dims(bias, 0)\n\n    weighted_avg = tokamax.dot_product_attention(\n        q,\n        k,\n        v,\n        mask=mask,\n        bias=bias,\n        implementation=self.global_config.flash_attention_implementation,\n    )\n    weighted_avg = jnp.reshape(weighted_avg, weighted_avg.shape[:-2] + (-1,))\n\n    gate_values = hm.Linear(\n        self.config.num_head * qkv_dim,\n        bias_init=1.0,\n        initializer='zeros',\n        transpose_weights=True,\n        name='gating_query',\n    )(act)\n    weighted_avg *= jax.nn.sigmoid(gate_values)\n\n    return 
hm.Linear(\n        num_channels,\n        initializer=self.global_config.final_init,\n        name='output_projection',\n    )(weighted_avg)\n\n  def __call__(self, act, pair_mask):\n    \"\"\"Builds a module.\n\n    Arguments:\n      act: [num_seq, num_res, channels] activations tensor\n      pair_mask: [num_seq, num_res] mask of non-padded regions in the tensor.\n        Only used in inducing points attention currently.\n\n    Returns:\n      Result of the self-attention operation.\n    \"\"\"\n    assert len(act.shape) == 3\n    assert len(pair_mask.shape) == 2\n\n    pair_mask = jnp.swapaxes(pair_mask, -1, -2)\n    act = hm.LayerNorm(name='act_norm')(act)\n\n    nonbatched_bias = hm.Linear(\n        self.config.num_head, use_bias=False, name='pair_bias_projection'\n    )(act)\n    nonbatched_bias = jnp.transpose(nonbatched_bias, [2, 0, 1])\n\n    num_residues = act.shape[0]\n\n    chunk_size = get_shard_size(\n        num_residues, self.global_config.pair_attention_chunk_size\n    )\n\n    if self.transpose:\n      act = jnp.swapaxes(act, -2, -3)\n\n    pair_mask = pair_mask[:, None, None, :].astype(jnp.bool_)\n\n    act = mapping.inference_subbatch(\n        self._attention,\n        chunk_size,\n        batched_args=[act, pair_mask],\n        nonbatched_args=[nonbatched_bias],\n    )\n\n    if self.transpose:\n      act = jnp.swapaxes(act, -2, -3)\n\n    return act\n\n\nclass TriangleMultiplication(hk.Module):\n  \"\"\"Triangle Multiplication.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    equation: Literal['ikc,jkc->ijc', 'kjc,kic->ijc']\n    use_glu_kernel: bool = True\n\n  def __init__(\n      self, config: Config, global_config: model_config.GlobalConfig, *, name\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def __call__(self, act, mask):\n    \"\"\"Applies Module.\n\n    Args:\n      act: The activation.\n      mask: The mask.\n\n    Returns:\n      Outputs, should have same 
shape/type as output_act\n    \"\"\"\n    mask = mask[None, ...]\n    num_channels = act.shape[-1]\n    equation = {\n        'ikc,jkc->ijc': 'cik,cjk->cij',\n        'kjc,kic->ijc': 'ckj,cki->cij',\n    }[self.config.equation]\n\n    act = hm.LayerNorm(name='left_norm_input')(act)\n    input_act = act\n\n    if self.config.use_glu_kernel:\n      weights_projection, _ = hm.haiku_linear_get_params(\n          act, num_output=num_channels * 2, name='projection'\n      )\n      weights_gate, _ = hm.haiku_linear_get_params(\n          act,\n          num_output=num_channels * 2,\n          initializer=self.global_config.final_init,\n          name='gate',\n      )\n      weights_glu = jnp.stack([weights_gate, weights_projection], axis=1)\n\n      projection = tokamax.gated_linear_unit(\n          act, weights_glu, activation=jax.nn.sigmoid\n      )\n      projection = jnp.transpose(projection, (2, 0, 1))\n      projection *= mask\n    else:\n      projection = hm.Linear(num_channels * 2, name='projection')(act)\n      projection = jnp.transpose(projection, (2, 0, 1))\n      projection *= mask\n\n      gate = hm.Linear(\n          num_channels * 2,\n          name='gate',\n          bias_init=1.0,\n          initializer=self.global_config.final_init,\n      )(act)\n      gate = jnp.transpose(gate, (2, 0, 1))\n      projection *= jax.nn.sigmoid(gate)\n\n    projection = projection.reshape(num_channels, 2, *projection.shape[1:])\n    a, b = jnp.split(projection, 2, axis=1)\n    a, b = jnp.squeeze(a, axis=1), jnp.squeeze(b, axis=1)\n    act = jnp.einsum(equation, a, b)\n    act = hm.LayerNorm(name='center_norm', axis=0, param_axis=0)(act)\n\n    act = jnp.transpose(act, (1, 2, 0))\n    act = hm.Linear(\n        num_channels,\n        initializer=self.global_config.final_init,\n        name='output_projection',\n    )(act)\n\n    gate_out = hm.Linear(\n        num_channels,\n        name='gating_linear',\n        bias_init=1.0,\n        
initializer=self.global_config.final_init,\n    )(input_act)\n    act *= jax.nn.sigmoid(gate_out)\n\n    return act\n\n\nclass OuterProductMean(hk.Module):\n  \"\"\"Computed mean outer product.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    chunk_size: int = 128\n    num_outer_channel: int = 32\n\n  def __init__(\n      self,\n      config: Config,\n      global_config: model_config.GlobalConfig,\n      num_output_channel,\n      *,\n      name,\n  ):\n    super().__init__(name=name)\n    self.global_config = global_config\n    self.config = config\n    self.num_output_channel = num_output_channel\n\n  def __call__(self, act, mask):\n    mask = mask[..., None]\n    act = hm.LayerNorm(name='layer_norm_input')(act)\n\n    left_act = mask * hm.Linear(\n        self.config.num_outer_channel,\n        initializer='linear',\n        name='left_projection',\n    )(act)\n\n    right_act = mask * hm.Linear(\n        self.config.num_outer_channel,\n        initializer='linear',\n        name='right_projection',\n    )(act)\n\n    if self.global_config.final_init == 'zeros':\n      w_init = hk.initializers.Constant(0.0)\n    else:\n      w_init = hk.initializers.VarianceScaling(scale=2.0, mode='fan_in')\n\n    output_w = hk.get_parameter(\n        'output_w',\n        shape=(\n            self.config.num_outer_channel,\n            self.config.num_outer_channel,\n            self.num_output_channel,\n        ),\n        dtype=act.dtype,\n        init=w_init,\n    )\n    output_b = hk.get_parameter(\n        'output_b',\n        shape=(self.num_output_channel,),\n        dtype=act.dtype,\n        init=hk.initializers.Constant(0.0),\n    )\n\n    def compute_chunk(left_act):\n      # Make sure that the 'b' dimension is the most minor batch like dimension\n      # so it will be treated as the real batch by XLA (both during the forward\n      # and the backward pass)\n      left_act = jnp.transpose(left_act, [0, 2, 1])\n      act = jnp.einsum('acb,ade->dceb', left_act, 
right_act)\n      act = jnp.einsum('dceb,cef->dbf', act, output_w) + output_b\n      return jnp.transpose(act, [1, 0, 2])\n\n    act = mapping.inference_subbatch(\n        compute_chunk,\n        self.config.chunk_size,\n        batched_args=[left_act],\n        nonbatched_args=[],\n        input_subbatch_dim=1,\n        output_subbatch_dim=0,\n    )\n\n    epsilon = 1e-3\n    norm = jnp.einsum('abc,adc->bdc', mask, mask)\n    return act / (epsilon + norm)\n\n\nclass PairFormerIteration(hk.Module):\n  \"\"\"Single Iteration of Pair Former.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    \"\"\"Config for PairFormerIteration.\"\"\"\n\n    num_layer: int\n    pair_attention: GridSelfAttention.Config = base_config.autocreate()\n    pair_transition: TransitionBlock.Config = base_config.autocreate()\n    single_attention: diffusion_transformer.SelfAttentionConfig | None = None\n    single_transition: TransitionBlock.Config | None = None\n    triangle_multiplication_incoming: TriangleMultiplication.Config = (\n        base_config.autocreate(equation='kjc,kic->ijc')\n    )\n    triangle_multiplication_outgoing: TriangleMultiplication.Config = (\n        base_config.autocreate(equation='ikc,jkc->ijc')\n    )\n    shard_transition_blocks: bool = True\n\n  def __init__(\n      self,\n      config: Config,\n      global_config: model_config.GlobalConfig,\n      with_single=False,\n      *,\n      name,\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n    self.with_single = with_single\n\n  def __call__(\n      self,\n      act,\n      pair_mask,\n      single_act=None,\n      seq_mask=None,\n  ):\n    \"\"\"Build a single iteration of the pair former.\n\n    Args:\n      act: [num_res, num_res, num_channel] Input pairwise activations.\n      pair_mask: [num_res, num_res] padding mask.\n      single_act: [num_res, single_channel] Single Input activations, optional\n      seq_mask: [num_res] Sequence Mask, 
optional.\n\n    Returns:\n      [num_res, num_res, num_channel] tensor of activations.\n    \"\"\"\n\n    num_residues = act.shape[0]\n\n    act += TriangleMultiplication(\n        self.config.triangle_multiplication_outgoing,\n        self.global_config,\n        name='triangle_multiplication_outgoing',\n    )(act, pair_mask)\n\n    act += TriangleMultiplication(\n        self.config.triangle_multiplication_incoming,\n        self.global_config,\n        name='triangle_multiplication_incoming',\n    )(act, pair_mask)\n\n    act += GridSelfAttention(\n        self.config.pair_attention,\n        self.global_config,\n        name='pair_attention1',\n        transpose=False,\n    )(act, pair_mask)\n\n    act += GridSelfAttention(\n        self.config.pair_attention,\n        self.global_config,\n        name='pair_attention2',\n        transpose=True,\n    )(act, pair_mask)\n\n    transition_block = TransitionBlock(\n        self.config.pair_transition, self.global_config, name='pair_transition'\n    )\n    if self.config.shard_transition_blocks:\n      transition_block = mapping.sharded_apply(\n          transition_block,\n          get_shard_size(\n              num_residues, self.global_config.pair_transition_shard_spec\n          ),\n      )\n    act += transition_block(act)\n\n    if self.with_single:\n      assert self.config.single_attention is not None\n      pair_logits = hm.Linear(\n          self.config.single_attention.num_head,\n          name='single_pair_logits_projection',\n      )(hm.LayerNorm(name='single_pair_logits_norm')(act))\n\n      pair_logits = jnp.transpose(pair_logits, [2, 0, 1])\n\n      single_act += diffusion_transformer.self_attention(\n          single_act,\n          seq_mask,\n          pair_logits=pair_logits,\n          config=self.config.single_attention,\n          global_config=self.global_config,\n          name='single_attention_',\n      )\n\n      single_act += TransitionBlock(\n          self.config.single_transition,\n   
       self.global_config,\n          name='single_transition',\n      )(single_act, broadcast_dim=None)\n\n      return act, single_act\n    else:\n      return act\n\n\nclass EvoformerIteration(hk.Module):\n  \"\"\"Single Iteration of Evoformer Main Stack.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    \"\"\"Configuration for EvoformerIteration.\"\"\"\n\n    num_layer: int = 4\n    msa_attention: MSAAttention.Config = base_config.autocreate()\n    outer_product_mean: OuterProductMean.Config = base_config.autocreate()\n    msa_transition: TransitionBlock.Config = base_config.autocreate()\n    pair_attention: GridSelfAttention.Config = base_config.autocreate()\n    pair_transition: TransitionBlock.Config = base_config.autocreate()\n    triangle_multiplication_incoming: TriangleMultiplication.Config = (\n        base_config.autocreate(equation='kjc,kic->ijc')\n    )\n    triangle_multiplication_outgoing: TriangleMultiplication.Config = (\n        base_config.autocreate(equation='ikc,jkc->ijc')\n    )\n    shard_transition_blocks: bool = True\n\n  def __init__(\n      self,\n      config: Config,\n      global_config: model_config.GlobalConfig,\n      name='evoformer_iteration',\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def __call__(self, activations, masks):\n\n    msa_act, pair_act = activations['msa'], activations['pair']\n\n    num_residues = pair_act.shape[0]\n\n    msa_mask, pair_mask = masks['msa'], masks['pair']\n\n    pair_act += OuterProductMean(\n        config=self.config.outer_product_mean,\n        global_config=self.global_config,\n        num_output_channel=int(pair_act.shape[-1]),\n        name='outer_product_mean',\n    )(msa_act, msa_mask)\n\n    msa_act += MSAAttention(\n        self.config.msa_attention, self.global_config, name='msa_attention1'\n    )(msa_act, msa_mask, pair_act=pair_act)\n\n    msa_act += TransitionBlock(\n        self.config.msa_transition, 
self.global_config, name='msa_transition'\n    )(msa_act)\n\n    pair_act += TriangleMultiplication(\n        self.config.triangle_multiplication_outgoing,\n        self.global_config,\n        name='triangle_multiplication_outgoing',\n    )(pair_act, pair_mask)\n\n    pair_act += TriangleMultiplication(\n        self.config.triangle_multiplication_incoming,\n        self.global_config,\n        name='triangle_multiplication_incoming',\n    )(pair_act, pair_mask)\n\n    pair_act += GridSelfAttention(\n        self.config.pair_attention,\n        self.global_config,\n        name='pair_attention1',\n        transpose=False,\n    )(pair_act, pair_mask)\n\n    pair_act += GridSelfAttention(\n        self.config.pair_attention,\n        self.global_config,\n        name='pair_attention2',\n        transpose=True,\n    )(pair_act, pair_mask)\n\n    transition_block = TransitionBlock(\n        self.config.pair_transition, self.global_config, name='pair_transition'\n    )\n    if self.config.shard_transition_blocks:\n      transition_block = mapping.sharded_apply(\n          transition_block,\n          get_shard_size(\n              num_residues, self.global_config.pair_transition_shard_spec\n          ),\n      )\n    pair_act += transition_block(pair_act)\n\n    return {'msa': msa_act, 'pair': pair_act}\n"
  },
  {
    "path": "src/alphafold3/model/network/noise_level_embeddings.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Fourier embeddings for given noise levels.\n\nWe supply fixed weights and biases for the Fourier embeddings. These were\ninitially generated by the following code, but we make them into constants\nto future proof against changes in jax rng generation:\n\n```\ndim = 256\nw_key, b_key = jax.random.split(jax.random.PRNGKey(42))\nweight = jax.random.normal(w_key, shape=[dim])\nbias = jax.random.uniform(b_key, shape=[dim])\n```\n\"\"\"\n\nimport jax.numpy as jnp\n\n# pyformat: disable\n# pylint: disable=bad-whitespace\n# pylint: disable=bad-continuation\n_WEIGHT = [\n     0.45873642,  0.06516238, -0.07278306, -0.26992258,  0.64292115,\n    -0.40763968,  3.60116863,  0.54461384, -0.32644904,  2.10888267,\n     1.30805349,  1.19838560, -1.37745857,  1.99475312, -1.64120293,\n     1.07823789, -0.02288206,  0.88305283,  0.48099944,  0.17655374,\n     0.30281949,  0.80646873,  0.62605333, -0.23965347, -1.02609432,\n     0.75006109, -0.19913037,  0.07466396,  0.66431236, -0.60990530,\n    -0.69709194, -0.44453633, -1.77656078,  0.02299878,  0.04095552,\n     0.35485864, -0.47602659, -0.98820388, -0.24106771, -1.07254291,\n    -0.99741757,  0.22697604,  1.41390419,  1.54984057, -0.12237291,\n     0.20156337,  0.61767143,  0.23959029,  0.92454034,  1.84082258,\n     0.89030224,  0.39598912, -1.52224910,  0.29669049,  1.52356744,\n    -0.33968377,  0.24155144, -0.52308381, -0.23622665,  0.92825454,\n    -0.63864607, -0.62169307,  
0.78623551, -0.80352145, -0.45496067,\n     1.30877995, -0.06686528,  1.00248849, -0.63593471,  0.16372502,\n    -1.46133232,  1.10562658, -0.01693927,  0.28684548, -0.72843230,\n     0.66133535, -1.92225552,  0.70241231, -0.96868867, -0.47309339,\n    -1.66894221,  0.46018723, -0.56806105,  0.32694784, -0.46529883,\n     1.02299964,  0.84688205,  1.19581807, -1.82454145,  0.05999713,\n    -0.59530073,  1.44862521, -0.34933713, -0.46564487, -0.55005538,\n    -1.61170268,  0.17502306,  0.38670063, -1.12133658, -0.29343036,\n    -0.52527446, -1.26285112,  1.07982683,  0.51215219,  1.48963666,\n     1.09847653, -0.01563358,  0.32574457,  1.94779706, -1.29198587,\n     1.06249654, -0.86965990,  0.22975266, -0.27182648, -0.21130897,\n    -0.41773933, -0.02329035,  1.31049252,  0.05579265, -1.23127055,\n    -0.99691105,  0.27058721, -0.72509319, -0.14421797, -1.48605061,\n     1.35041201,  1.29619241, -1.01022530, -0.79787987, -0.16166858,\n     0.87210685,  1.69248152,  1.42469788, -0.72325104, -1.24823737,\n     0.07051118,  0.71332991, -0.07360429, -0.91955227, -2.68856549,\n    -0.44033936,  0.35482934, -0.57933813,  0.97468042, -0.31050494,\n    -0.88454425, -2.08785224,  0.47322822, -0.02400172,  0.26644820,\n    -0.19147627, -2.10538960, -1.27962470, -1.35999286,  2.09867334,\n     0.65099514,  0.21604492, -0.45951018,  0.15994427, -0.31420693,\n    -0.65202618, -0.61077976, -1.06100249, -1.47254968,  1.18165290,\n    -0.78656220,  1.28182006,  1.80323684,  1.09196901,  0.26118696,\n    -0.30168581,  0.39749333,  0.26812574, -1.51995814, -0.46909946,\n     0.03874255, -1.36774313,  2.30143976,  2.06959820, -0.41647521,\n     1.85624206,  0.49019700, -0.06726539,  0.00457313,  0.23915423,\n    -1.84971249, -0.20482327, -0.34097880, -0.57933033, -1.10541213,\n    -0.30269983, -0.16430426, -0.82371718,  0.10345812,  1.78753936,\n     0.04786763,  1.86778629, -0.65214992,  0.81544143, -0.28214937,\n     0.31187257,  0.57661986,  1.21938801, -1.56046617,  0.38046429,\n 
   -0.18235965,  0.81794524, -0.40474343,  0.46538028, -1.15558851,\n     0.59625793, -1.07801270,  0.07310858,  0.61526084,  0.55518496,\n    -0.49787554,  0.92703879, -1.27780271, -0.83373469, -0.43015575,\n     0.41877759, -1.03987372, -1.46055734,  0.61282396,  0.15590595,\n    -0.34269521,  0.56509072, -1.17904210,  0.11374855, -1.83310866,\n     0.38734794, -0.58623004,  0.77931106,  1.53930688, -0.70299625,\n    -0.11389336, -1.14818096, -0.44400632,  1.21887410,  0.64066756,\n    -0.70249403, -0.27244881,  0.38586098, -1.07925785,  0.12448707,\n    -1.28286278,  0.37827531,  0.68812364,  1.65695465,  0.12440517,\n    -0.03689830,  1.10224664, -0.28323629, -0.47939169,  0.70120829,\n    -0.67204583\n]\n\n_BIAS = [\n    0.00465965, 0.21738243, 0.22277749, 0.68463874, 0.84596848, 0.17337036,\n    0.39573753, 0.78153563, 0.86311185, 0.21782327, 0.24377882, 0.42310703,\n    0.19887352, 0.10486019, 0.48707581, 0.22205460, 0.97263455, 0.29714966,\n    0.11244559, 0.53020525, 0.36796236, 0.37294638, 0.80261672, 0.04669094,\n    0.86319661, 0.75907171, 0.77297020, 0.01114798, 0.55850804, 0.91799915,\n    0.23032320, 0.12154722, 0.26701927, 0.42934716, 0.47951782, 0.96782577,\n    0.86785042, 0.61985648, 0.05743814, 0.41800117, 0.68881893, 0.60575199,\n    0.21058667, 0.64412105, 0.63958526, 0.89390790, 0.69755554, 0.89345169,\n    0.53330755, 0.56985939, 0.30724049, 0.00984561, 0.91407037, 0.92118979,\n    0.94153070, 0.81097460, 0.70537627, 0.32810748, 0.47227263, 0.11821401,\n    0.44983089, 0.30767226, 0.31756389, 0.62969446, 0.69892538, 0.16949117,\n    0.06207097, 0.46717727, 0.95348179, 0.62363589, 0.49018729, 0.06920040,\n    0.39333904, 0.41299903, 0.52514863, 0.61197245, 0.56871891, 0.65053988,\n    0.22203422, 0.46748531, 0.86931503, 0.87050021, 0.40208721, 0.32084906,\n    0.55084610, 0.94584596, 0.76279902, 0.36250532, 0.74272907, 0.66682065,\n    0.96452832, 0.64768302, 0.88070846, 0.56995463, 0.06395614, 0.69499350,\n    0.44494808, 0.39775658, 
0.20280898, 0.33363521, 0.05999005, 0.44414878,\n    0.65227020, 0.01199079, 0.71995056, 0.19045687, 0.48342144, 0.25127733,\n    0.66515994, 0.22465158, 0.22313106, 0.06302810, 0.55783665, 0.93625581,\n    0.58800840, 0.72525370, 0.52879298, 0.77195418, 0.15548682, 0.01028740,\n    0.39325142, 0.45401239, 0.71494079, 0.33011997, 0.05050695, 0.26381660,\n    0.63064706, 0.47604024, 0.08593416, 0.00383425, 0.06352687, 0.05510247,\n    0.03552997, 0.35810637, 0.56094289, 0.60922170, 0.88599777, 0.45419788,\n    0.40486634, 0.71297824, 0.34976673, 0.97825217, 0.12915993, 0.09566259,\n    0.64318919, 0.16717327, 0.82308614, 0.32672071, 0.81688786, 0.84857118,\n    0.99922776, 0.07551706, 0.18766022, 0.13051236, 0.39136350, 0.08768725,\n    0.92048228, 0.87185788, 0.39158428, 0.79224777, 0.17492688, 0.68902445,\n    0.81980729, 0.70458186, 0.59489477, 0.93324888, 0.49986637, 0.40705478,\n    0.89202917, 0.20673239, 0.39339757, 0.20996964, 0.02923799, 0.53992438,\n    0.40119815, 0.10366607, 0.08044600, 0.95551598, 0.20518017, 0.68826210,\n    0.90159297, 0.69008791, 0.86880815, 0.16246438, 0.89628279, 0.11481643,\n    0.61353648, 0.41545081, 0.92478311, 0.78212476, 0.48292696, 0.79621077,\n    0.11947489, 0.01747024, 0.22928023, 0.87387264, 0.86349785, 0.89526737,\n    0.58904779, 0.13896775, 0.68194926, 0.55824125, 0.44428205, 0.55422378,\n    0.28189969, 0.27923775, 0.09979951, 0.66994715, 0.45943546, 0.71207762,\n    0.17300689, 0.83434916, 0.02573085, 0.45858085, 0.55934799, 0.30676675,\n    0.52219367, 0.34544575, 0.19280875, 0.26937950, 0.07147646, 0.06295013,\n    0.76382887, 0.38737607, 0.58825982, 0.17423475, 0.05509448, 0.97228825,\n    0.94380617, 0.91664016, 0.18800116, 0.41771865, 0.59420645, 0.77371931,\n    0.64687788, 0.27284670, 0.22310913, 0.15663862, 0.45573199, 0.50386798,\n    0.66712272, 0.71649647, 0.28475654, 0.83415413, 0.75261366, 0.61517799,\n    0.93544555, 0.76141870, 0.85474241, 0.74766934, 0.33459592, 0.78477907,\n    0.07250881, 
0.10174239, 0.95332730, 0.80793905\n]\n# pyformat: enable\n# pylint: enable=bad-whitespace\n# pylint: enable=bad-continuation\n\n\ndef noise_embeddings(sigma_scaled_noise_level: jnp.ndarray) -> jnp.ndarray:\n  \"\"\"Returns Fourier noise level embeddings for diffusion model.\"\"\"\n  transformed_noise_level = (1 / 4) * jnp.log(sigma_scaled_noise_level)\n  weight = jnp.array(_WEIGHT, dtype=jnp.float32)\n  bias = jnp.array(_BIAS, dtype=jnp.float32)\n  embeddings = transformed_noise_level[..., None] * weight + bias\n  return jnp.cos(2 * jnp.pi * embeddings)\n"
  },
  {
    "path": "src/alphafold3/model/network/template_modules.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Modules for embedding templates.\"\"\"\n\nfrom alphafold3.common import base_config\nfrom alphafold3.constants import residue_names\nfrom alphafold3.jax import geometry\nfrom alphafold3.model import features\nfrom alphafold3.model import model_config\nfrom alphafold3.model import protein_data_processing\nfrom alphafold3.model.components import haiku_modules as hm\nfrom alphafold3.model.network import modules\nfrom alphafold3.model.scoring import scoring\nimport haiku as hk\nimport jax\nimport jax.numpy as jnp\n\n\nclass DistogramFeaturesConfig(base_config.BaseConfig):\n  # The left edge of the first bin.\n  min_bin: float = 3.25\n  # The left edge of the final bin. 
The final bin catches everything larger than\n  # `max_bin`.\n  max_bin: float = 50.75\n  # The number of bins in the distogram.\n  num_bins: int = 39\n\n\ndef dgram_from_positions(positions, config: DistogramFeaturesConfig):\n  \"\"\"Compute distogram from amino acid positions.\n\n  Args:\n    positions: (num_res, 3) Position coordinates.\n    config: Distogram bin configuration.\n\n  Returns:\n    Distogram with the specified number of bins.\n  \"\"\"\n  lower_breaks = jnp.linspace(config.min_bin, config.max_bin, config.num_bins)\n  lower_breaks = jnp.square(lower_breaks)\n  upper_breaks = jnp.concatenate(\n      [lower_breaks[1:], jnp.array([1e8], dtype=jnp.float32)], axis=-1\n  )\n  dist2 = jnp.sum(\n      jnp.square(\n          jnp.expand_dims(positions, axis=-2)\n          - jnp.expand_dims(positions, axis=-3)\n      ),\n      axis=-1,\n      keepdims=True,\n  )\n\n  dgram = (dist2 > lower_breaks).astype(jnp.float32) * (\n      dist2 < upper_breaks\n  ).astype(jnp.float32)\n  return dgram\n\n\ndef make_backbone_rigid(\n    positions: geometry.Vec3Array,\n    mask: jnp.ndarray,\n    group_indices: jnp.ndarray,\n) -> tuple[geometry.Rigid3Array, jnp.ndarray]:\n  \"\"\"Make backbone Rigid3Array and mask.\n\n  Args:\n    positions: (num_res, num_atoms) of atom positions as Vec3Array.\n    mask: (num_res, num_atoms) for atom mask.\n    group_indices: (num_res, num_group, 3) for atom indices forming groups.\n\n  Returns:\n    tuple of backbone Rigid3Array and mask (num_res,).\n  \"\"\"\n  backbone_indices = group_indices[:, 0]\n\n  # main backbone frames differ in sidechain frame convention.\n  # for sidechain it's (C, CA, N), for backbone it's (N, CA, C)\n  # Hence using c, b, a, each of shape (num_res,).\n  c, b, a = [backbone_indices[..., i] for i in range(3)]\n\n  slice_index = jax.vmap(lambda x, i: x[i])\n  rigid_mask = (\n      slice_index(mask, a) * slice_index(mask, b) * slice_index(mask, c)\n  ).astype(jnp.float32)\n\n  frame_positions = []\n  for indices 
in [a, b, c]:\n    frame_positions.append(\n        jax.tree.map(lambda x, idx=indices: slice_index(x, idx), positions)\n    )\n\n  rotation = geometry.Rot3Array.from_two_vectors(\n      frame_positions[2] - frame_positions[1],\n      frame_positions[0] - frame_positions[1],\n  )\n  rigid = geometry.Rigid3Array(rotation, frame_positions[1])\n\n  return rigid, rigid_mask\n\n\nclass TemplateEmbedding(hk.Module):\n  \"\"\"Embed a set of templates.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    num_channels: int = 64\n    template_stack: modules.PairFormerIteration.Config = base_config.autocreate(\n        num_layer=2,\n        pair_transition=base_config.autocreate(num_intermediate_factor=2),\n    )\n    dgram_features: DistogramFeaturesConfig = base_config.autocreate()\n\n  def __init__(\n      self,\n      config: Config,\n      global_config: model_config.GlobalConfig,\n      name='template_embedding',\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def __call__(\n      self,\n      query_embedding: jnp.ndarray,\n      templates: features.Templates,\n      padding_mask_2d: jnp.ndarray,\n      multichain_mask_2d: jnp.ndarray,\n      key: jnp.ndarray,\n  ) -> jnp.ndarray:\n    \"\"\"Generate an embedding for a set of templates.\n\n    Args:\n      query_embedding: [num_res, num_res, num_channel] a query tensor that will\n        be used to attend over the templates to remove the num_templates\n        dimension.\n      templates: A 'Templates' object.\n      padding_mask_2d: [num_res, num_res] Pair mask for attention operations.\n      multichain_mask_2d: [num_res, num_res] Pair mask for multichain.\n      key: random key generator.\n\n    Returns:\n      An embedding of size [num_res, num_res, num_channels]\n    \"\"\"\n    c = self.config\n    num_residues = query_embedding.shape[0]\n    num_templates = templates.aatype.shape[0]\n    query_num_channels = query_embedding.shape[2]\n    num_atoms = 
24\n    assert query_embedding.shape == (\n        num_residues,\n        num_residues,\n        query_num_channels,\n    )\n    assert templates.aatype.shape == (num_templates, num_residues)\n    assert templates.atom_positions.shape == (\n        num_templates,\n        num_residues,\n        num_atoms,\n        3,\n    )\n    assert templates.atom_mask.shape == (num_templates, num_residues, num_atoms)\n    assert padding_mask_2d.shape == (num_residues, num_residues)\n\n    num_templates = templates.aatype.shape[0]\n    num_res, _, query_num_channels = query_embedding.shape\n\n    # Embed each template separately.\n    template_embedder = SingleTemplateEmbedding(self.config, self.global_config)\n\n    subkeys = jnp.array(jax.random.split(key, num_templates))\n\n    def scan_fn(carry, x):\n      templates, key = x\n      embedding = template_embedder(\n          query_embedding,\n          templates,\n          padding_mask_2d,\n          multichain_mask_2d,\n          key,\n      )\n      return carry + embedding, None\n\n    scan_init = jnp.zeros(\n        (num_res, num_res, c.num_channels), dtype=query_embedding.dtype\n    )\n    summed_template_embeddings, _ = hk.scan(\n        scan_fn, scan_init, (templates, subkeys)\n    )\n\n    embedding = summed_template_embeddings / (1e-7 + num_templates)\n    embedding = jax.nn.relu(embedding)\n    embedding = hm.Linear(\n        query_num_channels, initializer='relu', name='output_linear'\n    )(embedding)\n\n    assert embedding.shape == (num_residues, num_residues, query_num_channels)\n    return embedding\n\n\nclass SingleTemplateEmbedding(hk.Module):\n  \"\"\"Embed a single template.\"\"\"\n\n  def __init__(\n      self,\n      config: TemplateEmbedding.Config,\n      global_config: model_config.GlobalConfig,\n      name='single_template_embedding',\n  ):\n    super().__init__(name=name)\n    self.config = config\n    self.global_config = global_config\n\n  def __call__(\n      self,\n      query_embedding: 
jnp.ndarray,\n      templates: features.Templates,\n      padding_mask_2d: jnp.ndarray,\n      multichain_mask_2d: jnp.ndarray,\n      key: jnp.ndarray,\n  ) -> jnp.ndarray:\n    \"\"\"Build the single template embedding graph.\n\n    Args:\n      query_embedding: (num_res, num_res, num_channels) - embedding of the query\n        sequence/msa.\n      templates: 'Templates' object containing single Template.\n      padding_mask_2d: Padding mask (Note: this doesn't care if a template\n        exists, unlike the template_pseudo_beta_mask).\n      multichain_mask_2d: A mask indicating intra-chain residue pairs, used to\n        mask out between chain distances/features when templates are for single\n        chains.\n      key: Random key generator.\n\n    Returns:\n      A template embedding (num_res, num_res, num_channels).\n    \"\"\"\n    gc = self.global_config\n    c = self.config\n    assert padding_mask_2d.dtype == query_embedding.dtype\n    dtype = query_embedding.dtype\n    num_channels = self.config.num_channels\n\n    def construct_input(\n        query_embedding, templates: features.Templates, multichain_mask_2d\n    ):\n\n      # Compute distogram feature for the template.\n      aatype = templates.aatype\n      dense_atom_mask = templates.atom_mask\n\n      dense_atom_positions = templates.atom_positions\n      dense_atom_positions *= dense_atom_mask[..., None]\n\n      pseudo_beta_positions, pseudo_beta_mask = scoring.pseudo_beta_fn(\n          templates.aatype, dense_atom_positions, dense_atom_mask\n      )\n      pseudo_beta_mask_2d = (\n          pseudo_beta_mask[:, None] * pseudo_beta_mask[None, :]\n      )\n      pseudo_beta_mask_2d *= multichain_mask_2d\n      dgram = dgram_from_positions(\n          pseudo_beta_positions, self.config.dgram_features\n      )\n      dgram *= pseudo_beta_mask_2d[..., None]\n      dgram = dgram.astype(dtype)\n      pseudo_beta_mask_2d = pseudo_beta_mask_2d.astype(dtype)\n      to_concat = [(dgram, 1), 
(pseudo_beta_mask_2d, 0)]\n\n      aatype = jax.nn.one_hot(\n          aatype,\n          residue_names.POLYMER_TYPES_NUM_WITH_UNKNOWN_AND_GAP,\n          axis=-1,\n          dtype=dtype,\n      )\n      to_concat.append((aatype[None, :, :], 1))\n      to_concat.append((aatype[:, None, :], 1))\n\n      # Compute a feature representing the normalized vector between each\n      # backbone affine - i.e. in each residues local frame, what direction are\n      # each of the other residues.\n\n      template_group_indices = jnp.take(\n          protein_data_processing.RESTYPE_RIGIDGROUP_DENSE_ATOM_IDX,\n          templates.aatype,\n          axis=0,\n      )\n      rigid, backbone_mask = make_backbone_rigid(\n          geometry.Vec3Array.from_array(dense_atom_positions),\n          dense_atom_mask,\n          template_group_indices.astype(jnp.int32),\n      )\n      points = rigid.translation\n      rigid_vec = rigid[:, None].inverse().apply_to_point(points)\n      unit_vector = rigid_vec.normalized()\n      unit_vector = [unit_vector.x, unit_vector.y, unit_vector.z]\n\n      unit_vector = [x.astype(dtype) for x in unit_vector]\n      backbone_mask = backbone_mask.astype(dtype)\n\n      backbone_mask_2d = backbone_mask[:, None] * backbone_mask[None, :]\n      backbone_mask_2d *= multichain_mask_2d\n      unit_vector = [x * backbone_mask_2d for x in unit_vector]\n\n      # Note that the backbone_mask takes into account C, CA and N (unlike\n      # pseudo beta mask which just needs CB) so we add both masks as features.\n      to_concat.extend([(x, 0) for x in unit_vector])\n      to_concat.append((backbone_mask_2d, 0))\n\n      query_embedding = hm.LayerNorm(name='query_embedding_norm')(\n          query_embedding\n      )\n      # Allow the template embedder to see the query embedding.  
Note this\n      # contains the position relative feature, so this is how the network knows\n      # which residues are next to each other.\n      to_concat.append((query_embedding, 1))\n\n      act = 0\n\n      for i, (x, n_input_dims) in enumerate(to_concat):\n        act += hm.Linear(\n            num_channels,\n            num_input_dims=n_input_dims,\n            initializer='relu',\n            name=f'template_pair_embedding_{i}',\n        )(x)\n      return act\n\n    act = construct_input(query_embedding, templates, multichain_mask_2d)\n\n    if c.template_stack.num_layer:\n\n      def template_iteration_fn(x):\n        return modules.PairFormerIteration(\n            c.template_stack, gc, name='template_embedding_iteration'\n        )(act=x, pair_mask=padding_mask_2d)\n\n      template_stack = hk.experimental.layer_stack(c.template_stack.num_layer)(\n          template_iteration_fn\n      )\n      act = template_stack(act)\n\n    act = hm.LayerNorm(name='output_layer_norm')(act)\n    return act\n"
  },
  {
    "path": "src/alphafold3/model/params.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Model param loading.\"\"\"\n\nimport bisect\nimport collections\nfrom collections.abc import Iterator\nimport contextlib\nimport io\nimport os\nimport pathlib\nimport re\nimport struct\nimport sys\nfrom typing import IO\n\nimport haiku as hk\nimport jax.numpy as jnp\nimport numpy as np\nimport zstandard\n\n\nclass RecordError(Exception):\n  \"\"\"Error reading a record.\"\"\"\n\n\ndef encode_record(scope: str, name: str, arr: np.ndarray) -> bytes:\n  \"\"\"Encodes a single haiku param as bytes, preserving non-numpy dtypes.\"\"\"\n  scope = scope.encode('utf-8')\n  name = name.encode('utf-8')\n  shape = arr.shape\n  dtype = str(arr.dtype).encode('utf-8')\n  arr = np.ascontiguousarray(arr)\n  if sys.byteorder == 'big':\n    arr = arr.byteswap()\n  arr_buffer = arr.tobytes('C')\n  header = struct.pack(\n      '<5i', len(scope), len(name), len(dtype), len(shape), len(arr_buffer)\n  )\n  return header + b''.join(\n      (scope, name, dtype, struct.pack(f'{len(shape)}i', *shape), arr_buffer)\n  )\n\n\ndef _read_record(stream: IO[bytes]) -> tuple[str, str, np.ndarray] | None:\n  \"\"\"Reads a record encoded by `_encode_record` from a byte stream.\"\"\"\n  header_size = struct.calcsize('<5i')\n  header = stream.read(header_size)\n  if not header:\n    return None\n  if len(header) < header_size:\n    raise RecordError(f'Incomplete header: {len(header)=} < {header_size=}')\n  (scope_len, name_len, dtype_len, shape_len, 
arr_buffer_len) = struct.unpack(\n      '<5i', header\n  )\n  fmt = f'<{scope_len}s{name_len}s{dtype_len}s{shape_len}i'\n  payload_size = struct.calcsize(fmt) + arr_buffer_len\n  payload = stream.read(payload_size)\n  if len(payload) < payload_size:\n    raise RecordError(f'Incomplete payload: {len(payload)=} < {payload_size=}')\n  scope, name, dtype, *shape = struct.unpack_from(fmt, payload)\n  scope = scope.decode('utf-8')\n  name = name.decode('utf-8')\n  dtype = dtype.decode('utf-8')\n  arr = np.frombuffer(payload[-arr_buffer_len:], dtype=dtype)\n  arr = np.reshape(arr, shape)\n  if sys.byteorder == 'big':\n    arr = arr.byteswap()\n  return scope, name, arr\n\n\ndef read_records(stream: IO[bytes]) -> Iterator[tuple[str, str, np.ndarray]]:\n  \"\"\"Fully reads the contents of a byte stream.\"\"\"\n  while record := _read_record(stream):\n    yield record\n\n\nclass _MultiFileIO(io.RawIOBase):\n  \"\"\"A file-like object that presents a concatenated view of multiple files.\"\"\"\n\n  def __init__(self, files: list[pathlib.Path]):\n    self._files = files\n    self._stack = contextlib.ExitStack()\n    self._handles = [\n        self._stack.enter_context(file.open('rb')) for file in files\n    ]\n    self._sizes = []\n    for handle in self._handles:\n      handle.seek(0, os.SEEK_END)\n      self._sizes.append(handle.tell())\n    self._length = sum(self._sizes)\n    self._offsets = [0]\n    for s in self._sizes[:-1]:\n      self._offsets.append(self._offsets[-1] + s)\n    self._abspos = 0\n    self._relpos = (0, 0)\n\n  def _abs_to_rel(self, pos: int) -> tuple[int, int]:\n    idx = bisect.bisect_right(self._offsets, pos) - 1\n    return idx, pos - self._offsets[idx]\n\n  def close(self):\n    self._stack.close()\n\n  def closed(self) -> bool:\n    return all(handle.closed for handle in self._handles)\n\n  def fileno(self) -> int:\n    return -1\n\n  def readable(self) -> bool:\n    return True\n\n  def tell(self) -> int:\n    return self._abspos\n\n  def 
seek(self, pos: int, whence: int = os.SEEK_SET, /):\n    match whence:\n      case os.SEEK_SET:\n        pass\n      case os.SEEK_CUR:\n        pos += self._abspos\n      case os.SEEK_END:\n        pos = self._length - pos\n      case _:\n        raise ValueError(f'Invalid whence: {whence}')\n    self._abspos = pos\n    self._relpos = self._abs_to_rel(pos)\n\n  def readinto(self, b: bytearray | memoryview) -> int:\n    result = 0\n    mem = memoryview(b)\n    while mem:\n      self._handles[self._relpos[0]].seek(self._relpos[1])\n      count = self._handles[self._relpos[0]].readinto(mem)\n      result += count\n      self._abspos += count\n      self._relpos = self._abs_to_rel(self._abspos)\n      mem = mem[count:]\n      if self._abspos == self._length:\n        break\n    return result\n\n\n@contextlib.contextmanager\ndef open_for_reading(model_files: list[pathlib.Path], is_compressed: bool):\n  with contextlib.closing(_MultiFileIO(model_files)) as f:\n    if is_compressed:\n      yield zstandard.ZstdDecompressor().stream_reader(f)\n    else:\n      yield f\n\n\ndef _match_model(\n    paths: list[pathlib.Path], pattern: re.Pattern[str]\n) -> dict[str, list[pathlib.Path]]:\n  \"\"\"Match files in a directory with a pattern, and group by model name.\"\"\"\n  models = collections.defaultdict(list)\n  for path in paths:\n    match = pattern.fullmatch(path.name)\n    if match:\n      models[match.group('model_name')].append(path)\n  return {k: sorted(v) for k, v in models.items()}\n\n\ndef select_model_files(\n    model_dir: pathlib.Path, model_name: str | None = None\n) -> tuple[list[pathlib.Path], bool]:\n  \"\"\"Select the model files from a model directory.\"\"\"\n  files = [file for file in model_dir.iterdir() if file.is_file()]\n\n  for pattern, is_compressed in (\n      (r'(?P<model_name>.*)\\.[0-9]+\\.bin\\.zst$', True),\n      (r'(?P<model_name>.*)\\.bin\\.zst\\.[0-9]+$', True),\n      (r'(?P<model_name>.*)\\.[0-9]+\\.bin$', False),\n      
(r'(?P<model_name>.*)\\.bin\\.[0-9]+$', False),\n      (r'(?P<model_name>.*)\\.bin\\.zst$', True),\n      (r'(?P<model_name>.*)\\.bin$', False),\n  ):\n    models = _match_model(files, re.compile(pattern))\n    if model_name is not None:\n      if model_name in models:\n        return models[model_name], is_compressed\n    else:\n      if models:\n        if len(models) > 1:\n          raise RuntimeError(f'Multiple models matched in {model_dir}')\n        _, model_files = models.popitem()\n        return model_files, is_compressed\n  raise FileNotFoundError(f'No models matched in {model_dir}')\n\n\ndef get_model_haiku_params(model_dir: pathlib.Path) -> hk.Params:\n  \"\"\"Get the Haiku parameters from a model directory.\"\"\"\n  params: dict[str, dict[str, jnp.Array]] = {}\n  model_files, is_compressed = select_model_files(model_dir)\n  with open_for_reading(model_files, is_compressed) as stream:\n    for scope, name, arr in read_records(stream):\n      params.setdefault(scope, {})[name] = jnp.array(arr)\n  if not params:\n    raise FileNotFoundError(f'Model missing from \"{model_dir}\"')\n  return params\n"
  },
  {
    "path": "src/alphafold3/model/pipeline/inter_chain_bonds.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Functions for handling inter-chain bonds.\"\"\"\n\nfrom collections.abc import Collection\nimport functools\nfrom typing import Final, NamedTuple\nfrom alphafold3 import structure\nfrom alphafold3.constants import chemical_component_sets\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.model.atom_layout import atom_layout\nimport numpy as np\n\n\nBOND_THRESHOLD_GLYCANS_ANGSTROM: Final[float] = 1.7\n# See https://pubs.acs.org/doi/10.1021/ja010331r for P-P atom bond distances.\nBOND_THRESHOLD_ALL_ANGSTROM: Final[float] = 2.4\n\n\nclass BondAtomArrays(NamedTuple):\n  chain_id: np.ndarray\n  chain_type: np.ndarray\n  res_id: np.ndarray\n  res_name: np.ndarray\n  atom_name: np.ndarray\n  coords: np.ndarray\n\n\ndef _get_bond_atom_arrays(\n    struc: structure.Structure, bond_atom_indices: np.ndarray\n) -> BondAtomArrays:\n  return BondAtomArrays(\n      chain_id=struc.chain_id[bond_atom_indices],\n      chain_type=struc.chain_type[bond_atom_indices],\n      res_id=struc.res_id[bond_atom_indices],\n      res_name=struc.res_name[bond_atom_indices],\n      atom_name=struc.atom_name[bond_atom_indices],\n      coords=struc.coords[..., bond_atom_indices, :],\n  )\n\n\n@functools.lru_cache(maxsize=1)\ndef get_polymer_ligand_and_ligand_ligand_bonds(\n    struct: structure.Structure,\n    only_glycan_ligands: bool,\n    allow_multiple_bonds_per_atom: bool,\n) -> tuple[atom_layout.AtomLayout, atom_layout.AtomLayout]:\n  
\"\"\"Return polymer-ligand & ligand-ligand inter-residue bonds.\n\n  Args:\n    struct: Structure object to extract bonds from.\n    only_glycan_ligands: Whether to only include glycans in ligand category.\n    allow_multiple_bonds_per_atom: If not allowed, we greedily choose the first\n      bond seen per atom and discard the remaining on each atom..\n\n  Returns:\n    polymer_ligand, ligand_ligand_bonds: Each object is an AtomLayout object\n    [num_bonds, 2] for the bond-defining atoms.\n  \"\"\"\n  if only_glycan_ligands:\n    allowed_res_names = list({\n        *chemical_component_sets.GLYCAN_OTHER_LIGANDS,\n        *chemical_component_sets.GLYCAN_LINKING_LIGANDS,\n    })\n  else:\n    allowed_res_names = None\n  all_bonds = get_bond_layout(\n      bond_threshold=BOND_THRESHOLD_GLYCANS_ANGSTROM\n      if only_glycan_ligands\n      else BOND_THRESHOLD_ALL_ANGSTROM,\n      struct=struct,\n      allowed_chain_types1=list({\n          *mmcif_names.LIGAND_CHAIN_TYPES,\n          *mmcif_names.POLYMER_CHAIN_TYPES,\n      }),\n      allowed_chain_types2=list(mmcif_names.LIGAND_CHAIN_TYPES),\n      allowed_res_names=allowed_res_names,\n      allow_multiple_bonds_per_atom=allow_multiple_bonds_per_atom,\n  )\n  ligand_ligand_bonds_mask = np.isin(\n      all_bonds.chain_type, list(mmcif_names.LIGAND_CHAIN_TYPES)\n  )\n  polymer_ligand_bonds_mask = np.isin(\n      all_bonds.chain_type, list(mmcif_names.POLYMER_CHAIN_TYPES)\n  )\n  polymer_ligand_bonds_mask = np.logical_and(\n      ligand_ligand_bonds_mask.any(axis=1),\n      polymer_ligand_bonds_mask.any(axis=1),\n  )\n  ligand_ligand_bonds = all_bonds[ligand_ligand_bonds_mask.all(axis=1)]\n  polymer_ligand_bonds = all_bonds[polymer_ligand_bonds_mask]\n  return polymer_ligand_bonds, ligand_ligand_bonds\n\n\ndef _remove_multi_bonds(\n    bond_layout: atom_layout.AtomLayout,\n) -> atom_layout.AtomLayout:\n  \"\"\"Remove instances greedily.\"\"\"\n  uids = {}\n  keep_indx = []\n  for chain_id, res_id, atom_name in zip(\n     
 bond_layout.chain_id,\n      bond_layout.res_id,\n      bond_layout.atom_name,\n      strict=True,\n  ):\n    key1 = (chain_id[0], res_id[0], atom_name[0])\n    key2 = (chain_id[1], res_id[1], atom_name[1])\n    keep_indx.append(bool(key1 not in uids) and bool(key2 not in uids))\n    if key1 not in uids:\n      uids[key1] = None\n    if key2 not in uids:\n      uids[key2] = None\n  return bond_layout[np.array(keep_indx, dtype=bool)]\n\n\n@functools.lru_cache(maxsize=1)\ndef get_ligand_ligand_bonds(\n    struct: structure.Structure,\n    only_glycan_ligands: bool,\n    allow_multiple_bonds_per_atom: bool = False,\n) -> atom_layout.AtomLayout:\n  \"\"\"Return ligand-ligand inter-residue bonds.\n\n  Args:\n    struct: Structure object to extract bonds from.\n    only_glycan_ligands: Whether to only include glycans in ligand category.\n    allow_multiple_bonds_per_atom: If not allowed, we greedily choose the first\n      bond seen per atom and discard the remaining on each atom.\n\n  Returns:\n    bond_layout: AtomLayout object [num_bonds, 2] for the bond-defining atoms.\n  \"\"\"\n  if only_glycan_ligands:\n    allowed_res_names = list({\n        *chemical_component_sets.GLYCAN_OTHER_LIGANDS,\n        *chemical_component_sets.GLYCAN_LINKING_LIGANDS,\n    })\n  else:\n    allowed_res_names = None\n  return get_bond_layout(\n      bond_threshold=BOND_THRESHOLD_GLYCANS_ANGSTROM\n      if only_glycan_ligands\n      else BOND_THRESHOLD_ALL_ANGSTROM,\n      struct=struct,\n      allowed_chain_types1=list(mmcif_names.LIGAND_CHAIN_TYPES),\n      allowed_chain_types2=list(mmcif_names.LIGAND_CHAIN_TYPES),\n      allowed_res_names=allowed_res_names,\n      allow_multiple_bonds_per_atom=allow_multiple_bonds_per_atom,\n  )\n\n\n@functools.lru_cache(maxsize=1)\ndef get_polymer_ligand_bonds(\n    struct: structure.Structure,\n    only_glycan_ligands: bool,\n    allow_multiple_bonds_per_atom: bool = False,\n    bond_threshold: float | None = None,\n) -> atom_layout.AtomLayout:\n  
\"\"\"Return polymer-ligand interchain bonds.\n\n  Args:\n    struct: Structure object to extract bonds from.\n    only_glycan_ligands: Whether to only include glycans in ligand category.\n    allow_multiple_bonds_per_atom: If not allowed, we greedily choose the first\n      bond seen per atom and discard the remaining on each atom.\n    bond_threshold: Euclidean distance of max allowed bond.\n\n  Returns:\n    bond_layout: AtomLayout object [num_bonds, 2] for the bond-defining atoms.\n  \"\"\"\n  if only_glycan_ligands:\n    allowed_res_names = list({\n        *chemical_component_sets.GLYCAN_OTHER_LIGANDS,\n        *chemical_component_sets.GLYCAN_LINKING_LIGANDS,\n    })\n  else:\n    allowed_res_names = None\n  if bond_threshold is None:\n    if only_glycan_ligands:\n      bond_threshold = BOND_THRESHOLD_GLYCANS_ANGSTROM\n    else:\n      bond_threshold = BOND_THRESHOLD_ALL_ANGSTROM\n  return get_bond_layout(\n      bond_threshold=bond_threshold,\n      struct=struct,\n      allowed_chain_types1=list(mmcif_names.POLYMER_CHAIN_TYPES),\n      allowed_chain_types2=list(mmcif_names.LIGAND_CHAIN_TYPES),\n      allowed_res_names=allowed_res_names,\n      allow_multiple_bonds_per_atom=allow_multiple_bonds_per_atom,\n  )\n\n\ndef get_bond_layout(\n    bond_threshold: float = BOND_THRESHOLD_ALL_ANGSTROM,\n    *,\n    struct: structure.Structure,\n    allowed_chain_types1: Collection[str],\n    allowed_chain_types2: Collection[str],\n    include_bond_types: Collection[str] = ('covale',),\n    allowed_res_names: Collection[str] | None = None,\n    allow_multiple_bonds_per_atom: bool,\n) -> atom_layout.AtomLayout:\n  \"\"\"Get bond_layout for all bonds between two sets of chain types.\n\n  There is a mask (all_mask) that runs through this script, and each bond pair\n  needs to maintain a True across all conditions in order to be preserved at the\n  end, otherwise the bond pair has invalidated a condition with a False and is\n  removed entirely. 
Note, we remove oxygen atom bonds as they are an edge case\n  that causes issues with scoring, due to multiple waters bonding with single\n  residues.\n\n  Args:\n    bond_threshold: Maximum bond distance in Angstrom.\n    struct: Structure object to extract bonds from.\n    allowed_chain_types1: One end of the bonds must be an atom with one of these\n      chain types.\n    allowed_chain_types2: The other end of the bond must be an atom with one of\n      these chain types.\n    include_bond_types: Only include bonds with specified type e.g. hydrog,\n      metalc, covale, disulf.\n    allowed_res_names: Further restricts from chain_types. Either end of the\n      bonds must be an atom part of these res_names. If none all will be\n      accepted after chain and bond type filtering.\n    allow_multiple_bonds_per_atom: If not allowed, we greedily choose the first\n      bond seen per atom and discard the remaining on each atom.\n\n  Returns:\n    bond_layout: AtomLayout object [num_bonds, 2] for the bond-defining atoms.\n  \"\"\"\n  if not struct.bonds:\n    return atom_layout.AtomLayout(\n        atom_name=np.empty((0, 2), dtype=object),\n        res_id=np.empty((0, 2), dtype=int),\n        res_name=np.empty((0, 2), dtype=object),\n        chain_id=np.empty((0, 2), dtype=object),\n        chain_type=np.empty((0, 2), dtype=object),\n        atom_element=np.empty((0, 2), dtype=object),\n    )\n  from_atom_idxs, dest_atom_idxs = struct.bonds.get_atom_indices(\n      struct.atom_key\n  )\n  from_atoms = _get_bond_atom_arrays(struct, from_atom_idxs)\n  dest_atoms = _get_bond_atom_arrays(struct, dest_atom_idxs)\n  # Chain type\n  chain_mask = np.logical_or(\n      np.logical_and(\n          np.isin(\n              from_atoms.chain_type,\n              allowed_chain_types1,\n          ),\n          np.isin(\n              dest_atoms.chain_type,\n              allowed_chain_types2,\n          ),\n      ),\n      np.logical_and(\n          np.isin(\n              
from_atoms.chain_type,\n              allowed_chain_types2,\n          ),\n          np.isin(\n              dest_atoms.chain_type,\n              allowed_chain_types1,\n          ),\n      ),\n  )\n  if allowed_res_names:\n    # Res type\n    res_mask = np.logical_or(\n        np.isin(from_atoms.res_name, allowed_res_names),\n        np.isin(dest_atoms.res_name, allowed_res_names),\n    )\n    # All mask\n    all_mask = np.logical_and(chain_mask, res_mask)\n  else:\n    all_mask = chain_mask\n  # Bond type mask\n  type_mask = np.isin(struct.bonds.type, list(include_bond_types))\n  np.logical_and(all_mask, type_mask, out=all_mask)\n  # Bond length check. Work in square length to avoid taking many square roots.\n  bond_length_squared = np.square(from_atoms.coords - dest_atoms.coords).sum(\n      axis=1\n  )\n  bond_threshold_squared = bond_threshold * bond_threshold\n  np.logical_and(\n      all_mask, bond_length_squared < bond_threshold_squared, out=all_mask\n  )\n  # Inter-chain and inter-residue bonds for ligands\n  ligand_types = list(mmcif_names.LIGAND_CHAIN_TYPES)\n  is_ligand = np.logical_or(\n      np.isin(\n          from_atoms.chain_type,\n          ligand_types,\n      ),\n      np.isin(\n          dest_atoms.chain_type,\n          ligand_types,\n      ),\n  )\n  res_id_differs = from_atoms.res_id != dest_atoms.res_id\n  chain_id_differs = from_atoms.chain_id != dest_atoms.chain_id\n  is_inter_res = np.logical_or(res_id_differs, chain_id_differs)\n  is_inter_ligand_res = np.logical_and(is_inter_res, is_ligand)\n  is_inter_chain_not_ligand = np.logical_and(chain_id_differs, ~is_ligand)\n  # If ligand then inter-res & inter-chain bonds, otherwise inter-chain only.\n  combined_allowed_bonds = np.logical_or(\n      is_inter_chain_not_ligand, is_inter_ligand_res\n  )\n  np.logical_and(all_mask, combined_allowed_bonds, out=all_mask)\n  bond_layout = atom_layout.AtomLayout(\n      atom_name=np.stack(\n          [\n              from_atoms.atom_name[all_mask],\n  
            dest_atoms.atom_name[all_mask],\n          ],\n          axis=1,\n          dtype=object,\n      ),\n      res_id=np.stack(\n          [from_atoms.res_id[all_mask], dest_atoms.res_id[all_mask]],\n          axis=1,\n          dtype=int,\n      ),\n      chain_id=np.stack(\n          [\n              from_atoms.chain_id[all_mask],\n              dest_atoms.chain_id[all_mask],\n          ],\n          axis=1,\n          dtype=object,\n      ),\n  )\n  if not allow_multiple_bonds_per_atom:\n    bond_layout = _remove_multi_bonds(bond_layout)\n  return atom_layout.fill_in_optional_fields(\n      bond_layout,\n      reference_atoms=atom_layout.atom_layout_from_structure(struct),\n  )\n"
  },
  {
    "path": "src/alphafold3/model/pipeline/pipeline.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"The main featurizer.\"\"\"\n\nimport bisect\nfrom collections.abc import Sequence\nimport datetime\nimport itertools\n\nfrom absl import logging\nfrom alphafold3.common import base_config\nfrom alphafold3.common import folding_input\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.model import feat_batch\nfrom alphafold3.model import features\nfrom alphafold3.model.pipeline import inter_chain_bonds\nfrom alphafold3.model.pipeline import structure_cleaning\nfrom alphafold3.structure import chemical_components as struc_chem_comps\nimport numpy as np\n\n\n_DETERMINISTIC_FRAMES_RANDOM_SEED = 12312837\n\n\ndef calculate_bucket_size(\n    num_tokens: int, buckets: Sequence[int] | None\n) -> int:\n  \"\"\"Calculates the bucket size to pad the data to.\"\"\"\n  if buckets is None:\n    return num_tokens\n\n  if not buckets:\n    raise ValueError('Buckets must be non-empty.')\n\n  if not all(prev < curr for prev, curr in itertools.pairwise(buckets)):\n    raise ValueError(\n        f'Buckets must be in strictly increasing order. Got {buckets=}.'\n    )\n\n  bucket_idx = bisect.bisect_left(buckets, num_tokens)\n\n  if bucket_idx == len(buckets):\n    logging.warning(\n        'Creating a new bucket of size %d since the input has more tokens than'\n        ' the largest bucket size %d. This may trigger a re-compilation of the'\n        ' model. 
Consider additional large bucket sizes to avoid excessive'\n        ' re-compilation.',\n        num_tokens,\n        buckets[-1],\n    )\n    return num_tokens\n\n  return buckets[bucket_idx]\n\n\nclass NanDataError(Exception):\n  \"\"\"Raised if the data pipeline produces data containing nans.\"\"\"\n\n\nclass TotalNumResOutOfRangeError(Exception):\n  \"\"\"Raised if total number of residues for all chains outside allowed range.\"\"\"\n\n\nclass MmcifNumChainsError(Exception):\n  \"\"\"Raised if the mmcif file contains too many / too few chains.\"\"\"\n\n\nclass WholePdbPipeline:\n  \"\"\"Processes an entire mmcif entity and merges the content.\"\"\"\n\n  class Config(base_config.BaseConfig):\n    \"\"\"Configuration object for `WholePdbPipeline`.\n\n    Properties:\n      max_atoms_per_token: number of atom slots in one token (was called\n        num_dense, and semi-hardcoded to 24 before)\n      pad_num_chains: Size to pad NUM_CHAINS feature dimensions to, only for\n        protein chains.\n      buckets: Bucket sizes to pad the data to, to avoid excessive\n        re-compilation of the model. If None, calculate the appropriate bucket\n        size from the number of tokens. If not None, must be a sequence of at\n        least one integer, in strictly increasing order. 
If the number\n        of tokens is more than the largest bucket size, a warning is logged and\n        the number of tokens itself is used as the bucket size.\n      max_total_residues: Any mmCIF with more total residues will be rejected.\n        If none, then no limit is applied.\n      min_total_residues: Any mmCIF with less total residues will be rejected.\n      msa_crop_size: Maximum size of MSA to take across all chains.\n      max_template_date: Optional max template date to prevent data leakage in\n        validation.\n      ref_max_modified_date: Optional maximum date that controls whether to\n        allow use of model coordinates for a chemical component from the CCD if\n        RDKit conformer generation fails and the component does not have ideal\n        coordinates set. Only for components that have been released before this\n        date the model coordinates can be used as a fallback.\n      max_templates: The maximum number of templates to send through the network\n        set to 0 to switch off templates.\n      filter_clashes: If true then will remove clashing chains.\n      filter_crystal_aids: If true ligands in the crystal aid list are removed.\n      max_paired_sequence_per_species: The maximum number of sequences per\n        species that will be used for MSA pairing.\n      drop_ligand_leaving_atoms: Flag for handling leaving atoms for ligands.\n      average_num_atoms_per_token: Target average number of atoms per token to\n        compute the padding size for flat atoms.\n      atom_cross_att_queries_subset_size: queries subset size in atom cross\n        attention\n      atom_cross_att_keys_subset_size: keys subset size in atom cross attention\n      flatten_non_standard_residues: Whether to expand non-standard polymer\n        residues into flat-atom format.\n      remove_nonsymmetric_bonds: Whether to remove nonsymmetric bonds from\n        symmetric polymer chains.\n      deterministic_frames: Whether to use fixed-seed reference positions to\n        construct deterministic frames.\n      
resolve_msa_overlaps: Whether to deduplicate unpaired MSA against paired\n        MSA. The default behaviour matches the method described in the AlphaFold\n        3 paper. Set this to false if providing custom paired MSA using the\n        unpaired MSA field to keep it exactly as is, as deduplication against\n        the paired MSA could break the manually crafted pairing between MSA\n        sequences.\n    \"\"\"\n\n    max_atoms_per_token: int = 24\n    pad_num_chains: int = 1000\n    buckets: list[int] | None = None\n    max_total_residues: int | None = None\n    min_total_residues: int | None = None\n    msa_crop_size: int = 16384\n    max_template_date: datetime.date | None = None\n    ref_max_modified_date: datetime.date | None = None\n    max_templates: int = 4\n    filter_clashes: bool = False\n    filter_crystal_aids: bool = False\n    max_paired_sequence_per_species: int = 600\n    drop_ligand_leaving_atoms: bool = True\n    average_num_atoms_per_token: int = 24\n    atom_cross_att_queries_subset_size: int = 32\n    atom_cross_att_keys_subset_size: int = 128\n    flatten_non_standard_residues: bool = True\n    remove_nonsymmetric_bonds: bool = False\n    deterministic_frames: bool = True\n    conformer_max_iterations: int | None = None\n    resolve_msa_overlaps: bool = True\n\n  def __init__(self, *, config: Config):\n    \"\"\"Initializes WholePdb data pipeline.\n\n    Args:\n      config: Pipeline configuration.\n    \"\"\"\n    self._config = config\n\n  def process_item(\n      self,\n      fold_input: folding_input.Input,\n      random_state: np.random.RandomState,\n      ccd: chemical_components.Ccd,\n      random_seed: int | None = None,\n  ) -> features.BatchDict:\n    \"\"\"Featurises a single fold input and returns the resulting batch dict.\"\"\"\n    if random_seed is None:\n      random_seed = random_state.randint(2**31)\n\n    random_state = np.random.RandomState(seed=random_seed)\n\n    logging_name = f'{fold_input.name}, 
random_seed={random_seed}'\n    logging.info('processing %s', logging_name)\n    struct = fold_input.to_structure(ccd=ccd)\n\n    # Clean structure.\n    cleaned_struc, cleaning_metadata = structure_cleaning.clean_structure(\n        struct,\n        ccd=ccd,\n        drop_non_standard_atoms=True,\n        drop_missing_sequence=True,\n        filter_clashes=self._config.filter_clashes,\n        filter_crystal_aids=self._config.filter_crystal_aids,\n        filter_waters=True,\n        filter_hydrogens=True,\n        filter_leaving_atoms=self._config.drop_ligand_leaving_atoms,\n        only_glycan_ligands_for_leaving_atoms=True,\n        covalent_bonds_only=True,\n        remove_polymer_polymer_bonds=True,\n        remove_bad_bonds=True,\n        remove_nonsymmetric_bonds=self._config.remove_nonsymmetric_bonds,\n    )\n\n    num_clashing_chains_removed = cleaning_metadata[\n        'num_clashing_chains_removed'\n    ]\n\n    if num_clashing_chains_removed:\n      logging.info(\n          'Removed %d clashing chains from %s',\n          num_clashing_chains_removed,\n          logging_name,\n      )\n\n    # No chains after fixes\n    if cleaned_struc.num_chains == 0:\n      raise MmcifNumChainsError(f'{logging_name}: No chains in structure!')\n\n    polymer_ligand_bonds, ligand_ligand_bonds = (\n        inter_chain_bonds.get_polymer_ligand_and_ligand_ligand_bonds(\n            cleaned_struc,\n            only_glycan_ligands=False,\n            allow_multiple_bonds_per_atom=True,\n        )\n    )\n\n    # If empty replace with None as this causes errors downstream.\n    if ligand_ligand_bonds and not ligand_ligand_bonds.atom_name.size:\n      ligand_ligand_bonds = None\n    if polymer_ligand_bonds and not polymer_ligand_bonds.atom_name.size:\n      polymer_ligand_bonds = None\n\n    # Create the flat output AtomLayout\n    empty_output_struc, flat_output_layout = (\n        structure_cleaning.create_empty_output_struc_and_layout(\n            struc=cleaned_struc,\n   
         ccd=ccd,\n            polymer_ligand_bonds=polymer_ligand_bonds,\n            ligand_ligand_bonds=ligand_ligand_bonds,\n            drop_ligand_leaving_atoms=self._config.drop_ligand_leaving_atoms,\n        )\n    )\n\n    # Select the tokens for Evoformer.\n    # Each token (e.g. a residue) is encoded as one representative atom. This\n    # is flexible enough to allow the 1-token-per-atom ligand representation\n    # in the future.\n    all_tokens, all_token_atoms_layout, standard_token_idxs = (\n        features.tokenizer(\n            flat_output_layout,\n            ccd=ccd,\n            max_atoms_per_token=self._config.max_atoms_per_token,\n            flatten_non_standard_residues=self._config.flatten_non_standard_residues,\n            logging_name=logging_name,\n        )\n    )\n    total_tokens = len(all_tokens.atom_name)\n    if (\n        self._config.max_total_residues\n        and total_tokens > self._config.max_total_residues\n    ):\n      raise TotalNumResOutOfRangeError(\n          'Total Number of Residues > max_total_residues: '\n          f'({total_tokens} > {self._config.max_total_residues})'\n      )\n\n    if (\n        self._config.min_total_residues\n        and total_tokens < self._config.min_total_residues\n    ):\n      raise TotalNumResOutOfRangeError(\n          'Total Number of Residues < min_total_residues: '\n          f'({total_tokens} < {self._config.min_total_residues})'\n      )\n\n    logging.info(\n        'Calculating bucket size for input with %d tokens.', total_tokens\n    )\n    padded_token_length = calculate_bucket_size(\n        total_tokens, self._config.buckets\n    )\n    logging.info(\n        'Got bucket size %d for input with %d tokens, resulting in %d padded'\n        ' tokens.',\n        padded_token_length,\n        total_tokens,\n        padded_token_length - total_tokens,\n    )\n\n    # Padding shapes for all features.\n    num_atoms = padded_token_length * 
self._config.average_num_atoms_per_token\n    # Round up to next multiple of subset size.\n    num_atoms = int(\n        np.ceil(num_atoms / self._config.atom_cross_att_queries_subset_size)\n        * self._config.atom_cross_att_queries_subset_size\n    )\n    padding_shapes = features.PaddingShapes(\n        num_tokens=padded_token_length,\n        msa_size=self._config.msa_crop_size,\n        num_chains=self._config.pad_num_chains,\n        num_templates=self._config.max_templates,\n        num_atoms=num_atoms,\n    )\n\n    # Create the atom layouts for flat atom cross attention\n    batch_atom_cross_att = features.AtomCrossAtt.compute_features(\n        all_token_atoms_layout=all_token_atoms_layout,\n        queries_subset_size=self._config.atom_cross_att_queries_subset_size,\n        keys_subset_size=self._config.atom_cross_att_keys_subset_size,\n        padding_shapes=padding_shapes,\n    )\n\n    # Extract per-token features\n    batch_token_features = features.TokenFeatures.compute_features(\n        all_tokens=all_tokens,\n        padding_shapes=padding_shapes,\n    )\n\n    # Create reference structure features\n    chemical_components_data = struc_chem_comps.populate_missing_ccd_data(\n        ccd=ccd,\n        chemical_components_data=cleaned_struc.chemical_components_data,\n        populate_pdbx_smiles=True,\n    )\n\n    # Add smiles info to empty_output_struc.\n    empty_output_struc = empty_output_struc.copy_and_update_globals(\n        chemical_components_data=chemical_components_data\n    )\n    # Create layouts and store structures for model output conversion.\n    batch_convert_model_output = features.ConvertModelOutput.compute_features(\n        all_token_atoms_layout=all_token_atoms_layout,\n        padding_shapes=padding_shapes,\n        cleaned_struc=cleaned_struc,\n        flat_output_layout=flat_output_layout,\n        empty_output_struc=empty_output_struc,\n        polymer_ligand_bonds=polymer_ligand_bonds,\n        
ligand_ligand_bonds=ligand_ligand_bonds,\n    )\n\n    # Create the PredictedStructureInfo\n    batch_predicted_structure_info = (\n        features.PredictedStructureInfo.compute_features(\n            all_tokens=all_tokens,\n            all_token_atoms_layout=all_token_atoms_layout,\n            padding_shapes=padding_shapes,\n        )\n    )\n\n    # Create MSA features\n    batch_msa = features.MSA.compute_features(\n        all_tokens=all_tokens,\n        standard_token_idxs=standard_token_idxs,\n        padding_shapes=padding_shapes,\n        fold_input=fold_input,\n        logging_name=logging_name,\n        max_paired_sequence_per_species=self._config.max_paired_sequence_per_species,\n        resolve_msa_overlaps=self._config.resolve_msa_overlaps,\n    )\n\n    # Create template features\n    batch_templates = features.Templates.compute_features(\n        all_tokens=all_tokens,\n        standard_token_idxs=standard_token_idxs,\n        padding_shapes=padding_shapes,\n        fold_input=fold_input,\n        max_templates=self._config.max_templates,\n        logging_name=logging_name,\n    )\n\n    ref_max_modified_date = self._config.ref_max_modified_date\n    conformer_max_iterations = self._config.conformer_max_iterations\n    batch_ref_structure, ligand_ligand_bonds = (\n        features.RefStructure.compute_features(\n            all_token_atoms_layout=all_token_atoms_layout,\n            ccd=ccd,\n            padding_shapes=padding_shapes,\n            chemical_components_data=chemical_components_data,\n            random_state=random_state,\n            ref_max_modified_date=ref_max_modified_date,\n            conformer_max_iterations=conformer_max_iterations,\n            ligand_ligand_bonds=ligand_ligand_bonds,\n        )\n    )\n    deterministic_ref_structure = None\n    if self._config.deterministic_frames:\n      deterministic_ref_structure, _ = features.RefStructure.compute_features(\n          all_token_atoms_layout=all_token_atoms_layout,\n   
       ccd=ccd,\n          padding_shapes=padding_shapes,\n          chemical_components_data=chemical_components_data,\n          random_state=(\n              np.random.RandomState(_DETERMINISTIC_FRAMES_RANDOM_SEED)\n          ),\n          ref_max_modified_date=ref_max_modified_date,\n          conformer_max_iterations=None,\n          ligand_ligand_bonds=ligand_ligand_bonds,\n      )\n\n    # Create ligand-polymer bond features.\n    polymer_ligand_bond_info = features.PolymerLigandBondInfo.compute_features(\n        all_tokens=all_tokens,\n        all_token_atoms_layout=all_token_atoms_layout,\n        bond_layout=polymer_ligand_bonds,\n        padding_shapes=padding_shapes,\n    )\n    # Create ligand-ligand bond features.\n    ligand_ligand_bond_info = features.LigandLigandBondInfo.compute_features(\n        all_tokens,\n        ligand_ligand_bonds,\n        padding_shapes,\n    )\n\n    # Create the Pseudo-beta layout for distogram head and distance error head.\n    batch_pseudo_beta_info = features.PseudoBetaInfo.compute_features(\n        all_token_atoms_layout=all_token_atoms_layout,\n        ccd=ccd,\n        padding_shapes=padding_shapes,\n        logging_name=logging_name,\n    )\n\n    # Frame construction.\n    batch_frames = features.Frames.compute_features(\n        all_tokens=all_tokens,\n        all_token_atoms_layout=all_token_atoms_layout,\n        ref_structure=(\n            deterministic_ref_structure\n            if self._config.deterministic_frames\n            else batch_ref_structure\n        ),\n        padding_shapes=padding_shapes,\n    )\n\n    # Assemble the Batch object.\n    batch = feat_batch.Batch(\n        msa=batch_msa,\n        templates=batch_templates,\n        token_features=batch_token_features,\n        ref_structure=batch_ref_structure,\n        predicted_structure_info=batch_predicted_structure_info,\n        polymer_ligand_bond_info=polymer_ligand_bond_info,\n        ligand_ligand_bond_info=ligand_ligand_bond_info,\n 
       pseudo_beta_info=batch_pseudo_beta_info,\n        atom_cross_att=batch_atom_cross_att,\n        convert_model_output=batch_convert_model_output,\n        frames=batch_frames,\n    )\n\n    np_example = batch.as_data_dict()\n    if 'num_iter_recycling' in np_example:\n      del np_example['num_iter_recycling']  # that does not belong here\n\n    for name, value in np_example.items():\n      if (\n          value.dtype.kind not in {'U', 'S'}\n          and value.dtype.name != 'object'\n          and np.isnan(np.sum(value))\n      ):\n        raise NanDataError(\n            f'Data pipeline output for {logging_name=} contains NaNs. NaN'\n            f' feature: {name}'\n        )\n\n    return np_example\n"
  },
  {
    "path": "src/alphafold3/model/pipeline/structure_cleaning.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Prepare PDB structure for training or inference.\"\"\"\n\nfrom typing import Any\n\nfrom absl import logging\nfrom alphafold3 import structure\nfrom alphafold3.constants import chemical_component_sets\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.model.atom_layout import atom_layout\nfrom alphafold3.model.pipeline import inter_chain_bonds\nfrom alphafold3.model.scoring import covalent_bond_cleaning\nfrom alphafold3.structure import sterics\nimport numpy as np\n\n\ndef _get_leaving_atom_mask(\n    struc: structure.Structure,\n    polymer_ligand_bonds: atom_layout.AtomLayout | None,\n    ligand_ligand_bonds: atom_layout.AtomLayout | None,\n    chain_id: str,\n    chain_type: str,\n    res_id: int,\n    res_name: str,\n) -> np.ndarray:\n  \"\"\"Updates a drop_leaving_atoms mask with new leaving atom locations.\"\"\"\n  bonded_atoms = atom_layout.get_bonded_atoms(\n      polymer_ligand_bonds,\n      ligand_ligand_bonds,\n      res_id,\n      chain_id,\n  )\n  # Connect the amino-acids, i.e. 
remove OXT, HXT and H2.\n  drop_atoms = atom_layout.get_link_drop_atoms(\n      res_name=res_name,\n      chain_type=chain_type,\n      is_start_terminus=False,\n      is_end_terminus=False,\n      bonded_atoms=bonded_atoms,\n      drop_ligand_leaving_atoms=True,\n  )\n  # Default mask where everything is false, which equates to being kept.\n  drop_atom_filter_atoms = struc.chain_id != struc.chain_id\n  for drop_atom in drop_atoms:\n    drop_atom_filter_atom = np.logical_and(\n        np.logical_and(\n            struc.atom_name == drop_atom,\n            struc.chain_id == chain_id,\n        ),\n        struc.res_id == res_id,\n    )\n    drop_atom_filter_atoms = np.logical_or(\n        drop_atom_filter_atoms, drop_atom_filter_atom\n    )\n  return drop_atom_filter_atoms\n\n\ndef clean_structure(\n    struc: structure.Structure,\n    ccd: chemical_components.Ccd,\n    *,\n    drop_missing_sequence: bool,\n    filter_clashes: bool,\n    drop_non_standard_atoms: bool,\n    filter_crystal_aids: bool,\n    filter_waters: bool,\n    filter_hydrogens: bool,\n    filter_leaving_atoms: bool,\n    only_glycan_ligands_for_leaving_atoms: bool,\n    covalent_bonds_only: bool,\n    remove_polymer_polymer_bonds: bool,\n    remove_bad_bonds: bool,\n    remove_nonsymmetric_bonds: bool,\n) -> tuple[structure.Structure, dict[str, Any]]:\n  \"\"\"Cleans structure.\n\n  Args:\n    struc: Structure to clean.\n    ccd: The chemical components dictionary.\n    drop_missing_sequence: Whether to drop chains without specified sequences.\n    filter_clashes: Whether to drop clashing chains.\n    drop_non_standard_atoms: Whether to drop non CCD standard atoms.\n    filter_crystal_aids: Whether to drop ligands in the crystal aid set.\n    filter_waters: Whether to drop water chains.\n    filter_hydrogens: Whether to drop hydrogen atoms.\n    filter_leaving_atoms: Whether to drop leaving atoms based on heuristics.\n    only_glycan_ligands_for_leaving_atoms: Whether to only include glycan\n      
ligands when filtering leaving atoms.\n    covalent_bonds_only: Only include covalent bonds.\n    remove_polymer_polymer_bonds: Remove polymer-polymer bonds.\n    remove_bad_bonds: Whether to remove badly bonded ligands.\n    remove_nonsymmetric_bonds: Whether to remove nonsymmetric polymer-ligand\n      bonds from symmetric polymer chains.\n\n  Returns:\n    Tuple of structure and metadata dict. The metadata dict has\n    information about what was cleaned from the original.\n  \"\"\"\n\n  metadata = {}\n  # Crop crystallization aids.\n  if (\n      filter_crystal_aids\n      and struc.structure_method in mmcif_names.CRYSTALLIZATION_METHODS\n  ):\n    struc = struc.filter_out(\n        res_name=chemical_component_sets.COMMON_CRYSTALLIZATION_AIDS\n    )\n\n  # Drop chains without specified sequences.\n  if drop_missing_sequence:\n    chains_with_unk_sequence = struc.find_chains_with_unknown_sequence()\n    num_with_unk_sequence = len(chains_with_unk_sequence)\n    if chains_with_unk_sequence:\n      struc = struc.filter_out(chain_id=chains_with_unk_sequence)\n  else:\n    num_with_unk_sequence = 0\n  metadata['num_with_unk_sequence'] = num_with_unk_sequence\n\n  # Remove intersecting chains.\n  if filter_clashes and struc.num_chains > 1:\n    clashing_chains = sterics.find_clashing_chains(struc)\n    if clashing_chains:\n      struc = struc.filter_out(chain_id=clashing_chains)\n  else:\n    clashing_chains = []\n  metadata['num_clashing_chains_removed'] = len(clashing_chains)\n  metadata['chains_removed'] = clashing_chains\n\n  # Drop non-standard atoms\n  if drop_non_standard_atoms:\n    struc = struc.drop_non_standard_atoms(\n        ccd=ccd, drop_unk=False, drop_non_ccd=False\n    )\n\n  # Sort chains in \"reverse-spreadsheet\" order.\n  struc = struc.with_sorted_chains\n\n  if filter_hydrogens:\n    struc = struc.without_hydrogen()\n\n  if filter_waters:\n    struc = struc.filter_out(chain_type=mmcif_names.WATER)\n\n  if filter_leaving_atoms:\n    
drop_leaving_atoms_all = struc.chain_id != struc.chain_id\n    polymer_ligand_bonds = inter_chain_bonds.get_polymer_ligand_bonds(\n        struc,\n        only_glycan_ligands=only_glycan_ligands_for_leaving_atoms,\n    )\n    ligand_ligand_bonds = inter_chain_bonds.get_ligand_ligand_bonds(\n        struc,\n        only_glycan_ligands=only_glycan_ligands_for_leaving_atoms,\n    )\n    all_glycans = {\n        *chemical_component_sets.GLYCAN_OTHER_LIGANDS,\n        *chemical_component_sets.GLYCAN_LINKING_LIGANDS,\n    }\n    # If only glycan ligands and no O1 atoms, we can do parallel drop.\n    if (\n        only_glycan_ligands_for_leaving_atoms\n        and (not (ligand_ligand_bonds.atom_name == 'O1').any())\n        and (not (polymer_ligand_bonds.atom_name == 'O1').any())\n    ):\n      drop_leaving_atoms_all = np.logical_and(\n          np.isin(struc.atom_name, 'O1'),\n          np.isin(struc.res_name, list(all_glycans)),\n      )\n    else:\n      substruct = struc.group_by_residue\n      glycan_mask = np.isin(substruct.res_name, list(all_glycans))\n      substruct = substruct.filter(glycan_mask)\n      # We need to iterate over all glycan residues for this.\n      for res in substruct.iter_residues():\n        # Only need to do drop leaving atoms for glycans depending on bonds.\n        if (res_name := res['res_name']) in all_glycans:\n          drop_atom_filter = _get_leaving_atom_mask(\n              struc=struc,\n              polymer_ligand_bonds=polymer_ligand_bonds,\n              ligand_ligand_bonds=ligand_ligand_bonds,\n              chain_id=res['chain_id'],\n              chain_type=res['chain_type'],\n              res_id=res['res_id'],\n              res_name=res_name,\n          )\n          drop_leaving_atoms_all = np.logical_or(\n              drop_leaving_atoms_all, drop_atom_filter\n          )\n\n    num_atoms_before = struc.num_atoms\n    struc = struc.filter_out(drop_leaving_atoms_all)\n    num_atoms_after = struc.num_atoms\n\n    if 
num_atoms_before > num_atoms_after:\n      logging.error(\n          'Dropped %s atoms from GT struc: chain_id %s res_id %s res_name %s',\n          num_atoms_before - num_atoms_after,\n          struc.chain_id,\n          struc.res_id,\n          struc.res_name,\n      )\n\n  # Can filter by bond type without having to iterate over bonds.\n  if struc.bonds and covalent_bonds_only:\n    is_covalent = np.isin(struc.bonds.type, ['covale'])\n    if sum(is_covalent) > 0:\n      new_bonds = struc.bonds[is_covalent]\n    else:\n      new_bonds = structure.Bonds.make_empty()\n    struc = struc.copy_and_update(bonds=new_bonds)\n\n  # Other bond filters require iterating over individual bonds.\n  if struc.bonds and (remove_bad_bonds or remove_polymer_polymer_bonds):\n    include_bond = []\n    num_pp_bonds = 0\n    num_bad_bonds = 0\n    for bond in struc.iter_bonds():\n      dest_atom = bond.dest_atom\n      from_atom = bond.from_atom\n      if remove_polymer_polymer_bonds:\n        if (\n            from_atom['chain_type'] in mmcif_names.POLYMER_CHAIN_TYPES\n            and dest_atom['chain_type'] in mmcif_names.POLYMER_CHAIN_TYPES\n        ):\n          num_pp_bonds += 1\n          include_bond.append(False)\n          continue\n      if remove_bad_bonds:\n        dest_coords = np.array(\n            [dest_atom['atom_x'], dest_atom['atom_y'], dest_atom['atom_z']]\n        )\n        from_coords = np.array(\n            [from_atom['atom_x'], from_atom['atom_y'], from_atom['atom_z']]\n        )\n        squared_dist = np.sum(np.square(dest_coords - from_coords))\n        squared_threshold = 2.4 * 2.4\n        if squared_dist > squared_threshold:\n          num_bad_bonds += 1\n          include_bond.append(False)\n          continue\n      include_bond.append(True)\n    if sum(include_bond) < len(struc.bonds):\n      logging.info(\n          'Reducing number of bonds for %s from %s to %s, of which %s are'\n          ' polymer-polymer bonds and %s are bad bonds.',\n          
struc.name,\n          len(struc.bonds),\n          sum(include_bond),\n          num_pp_bonds,\n          num_bad_bonds,\n      )\n      if sum(include_bond) > 0:\n        # Need to index bonds with bond keys or arrays of bools with same length\n        # as num bonds. In this case, we use array of bools (as elsewhere in the\n        # cleaning code).\n        new_bonds = struc.bonds[np.array(include_bond, dtype=bool)]\n      else:\n        new_bonds = structure.Bonds.make_empty()\n      struc = struc.copy_and_update(bonds=new_bonds)\n\n  if struc.bonds and remove_nonsymmetric_bonds:\n    # Check for asymmetric polymer-ligand bonds and remove if these exist.\n    polymer_ligand_bonds = inter_chain_bonds.get_polymer_ligand_bonds(\n        struc,\n        only_glycan_ligands=False,\n    )\n    if polymer_ligand_bonds:\n      if covalent_bond_cleaning.has_nonsymmetric_bonds_on_symmetric_polymer_chains(\n          struc, polymer_ligand_bonds\n      ):\n        from_atom_idxs, dest_atom_idxs = struc.bonds.get_atom_indices(\n            struc.atom_key\n        )\n        poly_chain_types = list(mmcif_names.POLYMER_CHAIN_TYPES)\n        is_polymer_bond = np.logical_or(\n            np.isin(struc.chain_type[from_atom_idxs], poly_chain_types),\n            np.isin(struc.chain_type[dest_atom_idxs], poly_chain_types),\n        )\n        struc = struc.copy_and_update(bonds=struc.bonds[~is_polymer_bond])\n\n  return struc, metadata\n\n\ndef create_empty_output_struc_and_layout(\n    struc: structure.Structure,\n    ccd: chemical_components.Ccd,\n    *,\n    with_hydrogens: bool = False,\n    skip_unk: bool = False,\n    polymer_ligand_bonds: atom_layout.AtomLayout | None = None,\n    ligand_ligand_bonds: atom_layout.AtomLayout | None = None,\n    drop_ligand_leaving_atoms: bool = False,\n) -> tuple[structure.Structure, atom_layout.AtomLayout]:\n  \"\"\"Make zero-coordinate structure from all physical residues.\n\n  Args:\n    struc: Structure object.\n    ccd: The chemical 
components dictionary.\n    with_hydrogens: Whether to keep hydrogen atoms in structure.\n    skip_unk: Whether to remove unknown residues from structure.\n    polymer_ligand_bonds: Bond information for polymer-ligand pairs.\n    ligand_ligand_bonds: Bond information for ligand-ligand pairs.\n    drop_ligand_leaving_atoms: Flag for handling leaving atoms for ligands.\n\n  Returns:\n    Tuple of structure with all bonds, physical residues and coordinates set to\n    0 and a flat atom layout of empty structure.\n  \"\"\"\n  bonded_atom_pairs = []\n  if polymer_ligand_bonds:\n    for chain_ids, res_ids, atom_names in zip(\n        polymer_ligand_bonds.chain_id,\n        polymer_ligand_bonds.res_id,\n        polymer_ligand_bonds.atom_name,\n        strict=True,\n    ):\n      bonded_atom_pairs.append((\n          (chain_ids[0], res_ids[0], atom_names[0]),\n          (chain_ids[1], res_ids[1], atom_names[1]),\n      ))\n  if ligand_ligand_bonds:\n    for chain_ids, res_ids, atom_names in zip(\n        ligand_ligand_bonds.chain_id,\n        ligand_ligand_bonds.res_id,\n        ligand_ligand_bonds.atom_name,\n        strict=True,\n    ):\n      bonded_atom_pairs.append((\n          (chain_ids[0], res_ids[0], atom_names[0]),\n          (chain_ids[1], res_ids[1], atom_names[1]),\n      ))\n  residues = atom_layout.residues_from_structure(\n      struc, include_missing_residues=True\n  )\n\n  flat_output_layout = atom_layout.make_flat_atom_layout(\n      residues,\n      ccd=ccd,\n      with_hydrogens=with_hydrogens,\n      skip_unk_residues=skip_unk,\n      polymer_ligand_bonds=polymer_ligand_bonds,\n      ligand_ligand_bonds=ligand_ligand_bonds,\n      drop_ligand_leaving_atoms=drop_ligand_leaving_atoms,\n  )\n\n  empty_output_struc = atom_layout.make_structure(\n      flat_layout=flat_output_layout,\n      atom_coords=np.zeros((flat_output_layout.shape[0], 3)),\n      name=struc.name,\n      atom_b_factors=None,\n      all_physical_residues=residues,\n  )\n  if 
bonded_atom_pairs:\n    empty_output_struc = empty_output_struc.add_bonds(\n        bonded_atom_pairs, bond_type=mmcif_names.COVALENT_BOND\n    )\n\n  return empty_output_struc, flat_output_layout\n"
  },
  {
    "path": "src/alphafold3/model/post_processing.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Post-processing utilities for AlphaFold inference results.\"\"\"\n\nimport dataclasses\nimport datetime\nimport os\n\nfrom alphafold3 import version\nfrom alphafold3.model import confidence_types\nfrom alphafold3.model import mmcif_metadata\nfrom alphafold3.model import model\nimport numpy as np\nimport zstandard\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass ProcessedInferenceResult:\n  \"\"\"Stores attributes of a processed inference result.\n\n  Attributes:\n    cif: CIF file containing an inference result.\n    mean_confidence_1d: Mean 1D confidence calculated from confidence_1d.\n    ranking_score: Ranking score extracted from CIF metadata.\n    structure_confidence_summary_json: Content of JSON file with structure\n      confidences summary calculated from CIF file.\n    structure_full_data_json: Content of JSON file with structure full\n      confidences calculated from CIF file.\n    model_id: Identifier of the model that produced the inference result.\n  \"\"\"\n\n  cif: bytes\n  mean_confidence_1d: float\n  ranking_score: float\n  structure_confidence_summary_json: bytes\n  structure_full_data_json: bytes\n  model_id: bytes\n\n\ndef post_process_inference_result(\n    inference_result: model.InferenceResult,\n) -> ProcessedInferenceResult:\n  \"\"\"Returns cif, confidence_1d_json, confidence_2d_json, mean_confidence_1d, and ranking confidence.\"\"\"\n\n  # Add mmCIF metadata 
fields.\n  timestamp = datetime.datetime.now().isoformat(sep=' ', timespec='seconds')\n  cif_with_metadata = mmcif_metadata.add_metadata_to_mmcif(\n      old_cif=inference_result.predicted_structure.to_mmcif_dict(),\n      version=f'{version.__version__} @ {timestamp}',\n      model_id=inference_result.model_id,\n  )\n  cif = mmcif_metadata.add_legal_comment(cif_with_metadata.to_string())\n  cif = cif.encode('utf-8')\n  confidence_1d = confidence_types.AtomConfidence.from_inference_result(\n      inference_result\n  )\n  mean_confidence_1d = np.mean(confidence_1d.confidence)\n  structure_confidence_summary_json = (\n      confidence_types.StructureConfidenceSummary.from_inference_result(\n          inference_result\n      )\n      .to_json()\n      .encode('utf-8')\n  )\n  structure_full_data_json = (\n      confidence_types.StructureConfidenceFull.from_inference_result(\n          inference_result\n      )\n      .to_json()\n      .encode('utf-8')\n  )\n  return ProcessedInferenceResult(\n      cif=cif,\n      mean_confidence_1d=mean_confidence_1d,\n      ranking_score=float(inference_result.metadata['ranking_score']),\n      structure_confidence_summary_json=structure_confidence_summary_json,\n      structure_full_data_json=structure_full_data_json,\n      model_id=inference_result.model_id,\n  )\n\n\ndef write_output(\n    inference_result: model.InferenceResult,\n    output_dir: os.PathLike[str] | str,\n    terms_of_use: str | None = None,\n    name: str | None = None,\n    compress: bool = False,\n) -> None:\n  \"\"\"Writes processed inference result to a directory.\"\"\"\n  processed_result = post_process_inference_result(inference_result)\n\n  prefix = f'{name}_' if name is not None else ''\n\n  if compress:\n    opener = zstandard.open\n    path_transform = lambda path: f'{path}.zst'\n  else:\n    opener = open\n    path_transform = lambda path: path\n\n  mmcif_path = os.path.join(output_dir, f'{prefix}model.cif')\n  with opener(path_transform(mmcif_path), 
'wb') as f:\n    f.write(processed_result.cif)\n\n  full_confidences_path = os.path.join(output_dir, f'{prefix}confidences.json')\n  with opener(path_transform(full_confidences_path), 'wb') as f:\n    f.write(processed_result.structure_full_data_json)\n\n  summary_confidences_path = os.path.join(\n      output_dir, f'{prefix}summary_confidences.json'\n  )\n  with open(summary_confidences_path, 'wb') as f:\n    f.write(processed_result.structure_confidence_summary_json)\n\n  if terms_of_use is not None:\n    with open(os.path.join(output_dir, 'TERMS_OF_USE.md'), 'wt') as f:\n      f.write(terms_of_use)\n\n\ndef write_embeddings(\n    embeddings: dict[str, np.ndarray],\n    output_dir: os.PathLike[str] | str,\n    name: str | None = None,\n) -> None:\n  \"\"\"Writes embeddings to a directory.\"\"\"\n  prefix = f'{name}_' if name is not None else ''\n\n  with open(os.path.join(output_dir, f'{prefix}embeddings.npz'), 'wb') as f:\n    np.savez_compressed(f, **embeddings)\n"
  },
  {
    "path": "src/alphafold3/model/protein_data_processing.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Process Structure Data.\"\"\"\n\nfrom alphafold3.constants import atom_types\nfrom alphafold3.constants import residue_names\nfrom alphafold3.constants import side_chains\nimport numpy as np\n\n\nNUM_DENSE = atom_types.DENSE_ATOM_NUM\nNUM_AA = len(residue_names.PROTEIN_TYPES)\nNUM_AA_WITH_UNK_AND_GAP = len(\n    residue_names.PROTEIN_TYPES_ONE_LETTER_WITH_UNKNOWN_AND_GAP\n)\nNUM_RESTYPES_WITH_UNK_AND_GAP = (\n    residue_names.POLYMER_TYPES_NUM_WITH_UNKNOWN_AND_GAP\n)\n\n\ndef _make_restype_rigidgroup_dense_atom_idx():\n  \"\"\"Create Mapping from rigid_groups to dense_atom indices.\"\"\"\n  # Create an array with the atom names.\n  # shape (num_restypes, num_rigidgroups, 3_atoms):\n  # (31, 8, 3)\n  base_atom_indices = np.zeros(\n      (NUM_RESTYPES_WITH_UNK_AND_GAP, 8, 3), dtype=np.int32\n  )\n\n  # 4,5,6,7: 'chi1,2,3,4-group'\n  for restype, restype_letter in enumerate(\n      residue_names.PROTEIN_TYPES_ONE_LETTER\n  ):\n    resname = residue_names.PROTEIN_COMMON_ONE_TO_THREE[restype_letter]\n\n    dense_atom_names = atom_types.ATOM14[resname]\n    # 0: backbone frame\n    base_atom_indices[restype, 0, :] = [\n        dense_atom_names.index(atom) for atom in ['C', 'CA', 'N']\n    ]\n\n    # 3: 'psi-group'\n    base_atom_indices[restype, 3, :] = [\n        dense_atom_names.index(atom) for atom in ['CA', 'C', 'O']\n    ]\n    for chi_idx in range(4):\n      if side_chains.CHI_ANGLES_MASK[restype][chi_idx]:\n        
atom_names = side_chains.CHI_ANGLES_ATOMS[resname][chi_idx]\n        base_atom_indices[restype, chi_idx + 4, :] = [\n            dense_atom_names.index(atom) for atom in atom_names[1:]\n        ]\n  dense_atom_names = atom_types.DENSE_ATOM['A']\n  nucleic_rigid_atoms = [\n      dense_atom_names.index(atom) for atom in [\"C1'\", \"C3'\", \"C4'\"]\n  ]\n  for nanum, _ in enumerate(residue_names.NUCLEIC_TYPES):\n    # 0: backbone frame only.\n    # we have aa + unk + gap, so we want to start after those\n    resnum = nanum + NUM_AA_WITH_UNK_AND_GAP\n    base_atom_indices[resnum, 0, :] = nucleic_rigid_atoms\n\n  return base_atom_indices\n\n\nRESTYPE_RIGIDGROUP_DENSE_ATOM_IDX = _make_restype_rigidgroup_dense_atom_idx()\n\n\ndef _make_restype_pseudobeta_idx():\n  \"\"\"Returns indices of residue's pseudo-beta.\"\"\"\n  restype_pseudobeta_index = np.zeros(\n      (NUM_RESTYPES_WITH_UNK_AND_GAP,), dtype=np.int32\n  )\n  for restype, restype_letter in enumerate(\n      residue_names.PROTEIN_TYPES_ONE_LETTER\n  ):\n    restype_name = residue_names.PROTEIN_COMMON_ONE_TO_THREE[restype_letter]\n    atom_names = list(atom_types.ATOM14[restype_name])\n    if restype_name in {'GLY'}:\n      restype_pseudobeta_index[restype] = atom_names.index('CA')\n    else:\n      restype_pseudobeta_index[restype] = atom_names.index('CB')\n  for nanum, resname in enumerate(residue_names.NUCLEIC_TYPES):\n    atom_names = list(atom_types.DENSE_ATOM[resname])\n    # 0: backbone frame only.\n    # we have aa + unk , so we want to start after those\n    restype = nanum + NUM_AA_WITH_UNK_AND_GAP\n    if resname in {'A', 'G', 'DA', 'DG'}:\n      restype_pseudobeta_index[restype] = atom_names.index('C4')\n    else:\n      restype_pseudobeta_index[restype] = atom_names.index('C2')\n  return restype_pseudobeta_index\n\n\nRESTYPE_PSEUDOBETA_INDEX = _make_restype_pseudobeta_idx()\n\n\ndef _make_aatype_dense_atom_to_atom37():\n  \"\"\"Map from dense_atom to atom37 per residue type.\"\"\"\n  
restype_dense_atom_to_atom37 = []  # mapping (restype, dense_atom) --> atom37\n  for rt in residue_names.PROTEIN_TYPES_ONE_LETTER:\n    atom_names = list(\n        atom_types.ATOM14_PADDED[residue_names.PROTEIN_COMMON_ONE_TO_THREE[rt]]\n    )\n    atom_names.extend([''] * (NUM_DENSE - len(atom_names)))\n    restype_dense_atom_to_atom37.append(\n        [(atom_types.ATOM37_ORDER[name] if name else 0) for name in atom_names]\n    )\n  # Add dummy mapping for restype 'UNK', '-' (gap), and nucleics [but not DN].\n  for _ in range(2 + len(residue_names.NUCLEIC_TYPES_WITH_UNKNOWN)):\n    restype_dense_atom_to_atom37.append([0] * NUM_DENSE)\n\n  restype_dense_atom_to_atom37 = np.array(\n      restype_dense_atom_to_atom37, dtype=np.int32\n  )\n  return restype_dense_atom_to_atom37\n\n\nPROTEIN_AATYPE_DENSE_ATOM_TO_ATOM37 = _make_aatype_dense_atom_to_atom37()\n"
  },
  {
    "path": "src/alphafold3/model/scoring/alignment.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Alignment based metrics.\"\"\"\n\nimport numpy as np\n\n\ndef transform_ls(\n    x: np.ndarray,\n    b: np.ndarray,\n    *,\n    allow_reflection: bool = False,\n) -> np.ndarray:\n  \"\"\"Find the least squares best fit rotation between two sets of N points.\n\n  Solve Ax = b for A. Where A is the transform rotating x^T into b^T.\n\n  Args:\n    x: NxD numpy array of coordinates. Usually dimension D is 3.\n    b: NxD numpy array of coordinates. Usually dimension D is 3.\n    allow_reflection: Whether the returned transformation can reflect as well as\n      rotate.\n\n  Returns:\n    Matrix A transforming x into b, i.e. s.t. 
Ax^T = b^T.\n  \"\"\"\n  assert x.shape[1] >= b.shape[1]\n  assert b.shape[0] == x.shape[0], '%d, %d' % (b.shape[0], x.shape[0])\n  # First postmultiply by x:\n  # Axx^t = b x^t\n  bxt = np.dot(b.transpose(), x) / b.shape[0]\n\n  u, _, v = np.linalg.svd(bxt)\n\n  r = np.dot(u, v)\n  if not allow_reflection:\n    flip = np.ones((v.shape[1], 1))\n    flip[v.shape[1] - 1, 0] = np.sign(np.linalg.det(r))\n    r = np.dot(u, v * flip)\n\n  return r\n\n\ndef align(\n    *,\n    x: np.ndarray,\n    y: np.ndarray,\n    x_indices: np.ndarray,\n    y_indices: np.ndarray,\n) -> np.ndarray:\n  \"\"\"Align x to y considering only the points in x_indices and y_indices.\n\n  Args:\n    x: NxD np array of coordinates.\n    y: NxD np array of coordinates.\n    x_indices: An np array of indices for `x` that will be used in the\n      alignment. Must be of the same length as `y_indices`.\n    y_indices: An np array of indices for `y` that will be used in the\n      alignment. Must be of the same length as `x_indices`.\n\n  Returns:\n    NxD np array of points obtained by applying a rigid transformation to x.\n    These points are aligned to y and the alignment is the optimal alignment\n    over the points selected by x_indices and y_indices.\n\n  Raises:\n    ValueError: If the number of included indices is not the same for both\n    input arrays.\n  \"\"\"\n  if len(x_indices) != len(y_indices):\n    raise ValueError(\n        'Number of included indices must be the same for both input arrays,'\n        f' but got for x: {len(x_indices)}, and for y: {len(y_indices)}.'\n    )\n\n  x_mean = np.mean(x[x_indices, :], axis=0)\n  y_mean = np.mean(y[y_indices, :], axis=0)\n\n  centered_x = x - x_mean\n  centered_y = y - y_mean\n\n  t = transform_ls(centered_x[x_indices, :], centered_y[y_indices, :])\n  transformed_x = np.dot(centered_x, t.transpose()) + y_mean\n\n  return transformed_x\n\n\ndef deviations_from_coords(\n    decoy_coords: np.ndarray,\n    gt_coords: np.ndarray,\n    align_idxs: np.ndarray | None = None,\n  
  include_idxs: np.ndarray | None = None,\n) -> np.ndarray:\n  \"\"\"Returns the raw per-atom deviations used in RMSD computation.\"\"\"\n  if decoy_coords.shape != gt_coords.shape:\n    raise ValueError(\n        'decoy_coords.shape and gt_coords.shape must match.Found: %s and %s.'\n        % (decoy_coords.shape, gt_coords.shape)\n    )\n  # Include and align all residues unless specified otherwise.\n  if include_idxs is None:\n    include_idxs = np.arange(decoy_coords.shape[0])\n  if align_idxs is None:\n    align_idxs = include_idxs\n  aligned_decoy_coords = align(\n      x=decoy_coords,\n      y=gt_coords,\n      x_indices=align_idxs,\n      y_indices=align_idxs,\n  )\n  deviations = np.linalg.norm(\n      aligned_decoy_coords[include_idxs] - gt_coords[include_idxs], axis=1\n  )\n  return deviations\n\n\ndef rmsd_from_coords(\n    decoy_coords: np.ndarray,\n    gt_coords: np.ndarray,\n    align_idxs: np.ndarray | None = None,\n    include_idxs: np.ndarray | None = None,\n) -> float:\n  \"\"\"Computes the *aligned* RMSD of two Mx3 np arrays of coordinates.\n\n  Args:\n    decoy_coords: [M, 3] np array of decoy atom coordinates.\n    gt_coords: [M, 3] np array of gt atom coordinates.\n    align_idxs: [M] np array of indices specifying coordinates to align on.\n      Defaults to None, in which case all the include_idx (see after) are used.\n    include_idxs: [M] np array of indices specifying coordinates to score.\n      Defaults to None, in which case all indices are used for scoring.\n\n  Returns:\n    rmsd value of the aligned decoy and gt coordinates.\n  \"\"\"\n  deviations = deviations_from_coords(\n      decoy_coords, gt_coords, align_idxs, include_idxs\n  )\n  return np.sqrt(np.mean(np.square(deviations)))\n"
  },
  {
    "path": "src/alphafold3/model/scoring/chirality.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Chirality detection and comparison.\"\"\"\n\nfrom collections.abc import Mapping\n\nfrom absl import logging\nfrom alphafold3 import structure\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.data.tools import rdkit_utils\nimport rdkit.Chem as rd_chem\n\n_CHIRAL_ELEMENTS = frozenset({'C', 'S'})\n\n\ndef _find_chiral_centres(mol: rd_chem.Mol) -> dict[str, str]:\n  \"\"\"Find chiral centres and detect their chirality.\n\n  Only elements listed in _CHIRAL_ELEMENTS are considered as centres.\n\n  Args:\n    mol: The molecule for which to detect chirality.\n\n  Returns:\n    Map from chiral centre atom names to identified chirality.\n  \"\"\"\n  chiral_centres = rd_chem.FindMolChiralCenters(\n      mol, force=True, includeUnassigned=False, useLegacyImplementation=True\n  )\n  atom_name_by_idx = {\n      atom.GetIdx(): atom.GetProp('atom_name') for atom in mol.GetAtoms()\n  }\n  atom_chirality_by_name = {atom_name_by_idx[k]: v for k, v in chiral_centres}\n  return {\n      k: v\n      for k, v in atom_chirality_by_name.items()\n      if any(k[: len(el)].upper() == el for el in _CHIRAL_ELEMENTS)\n  }\n\n\ndef _chiral_match(mol1: rd_chem.Mol, mol2: rd_chem.Mol) -> bool:\n  \"\"\"Compares chirality of two Mols. 
Mol1 can match a subset of mol2.\"\"\"\n\n  mol1_atom_names = {a.GetProp('atom_name') for a in mol1.GetAtoms()}\n  mol2_atom_names = {a.GetProp('atom_name') for a in mol2.GetAtoms()}\n  if mol1_atom_names != mol2_atom_names:\n    if not mol1_atom_names.issubset(mol2_atom_names):\n      raise ValueError('Mol1 atoms are not a subset of mol2 atoms.')\n\n  mol1_chiral_centres = _find_chiral_centres(mol1)\n  mol2_chiral_centres = _find_chiral_centres(mol2)\n  if set(mol1_chiral_centres) != set(mol2_chiral_centres):\n    if not set(mol1_chiral_centres).issubset(mol2_chiral_centres):\n      return False\n  chirality_matches = {\n      centre_atom: chirality1 == mol2_chiral_centres[centre_atom]\n      for centre_atom, chirality1 in mol1_chiral_centres.items()\n      if '?' != mol2_chiral_centres[centre_atom]\n  }\n  return all(chirality_matches.values())\n\n\ndef _mol_from_ligand_struc(\n    ligand_struc: structure.Structure,\n    ref_mol: rd_chem.Mol,\n) -> rd_chem.Mol | None:\n  \"\"\"Creates a Mol object from a ligand structure and reference mol.\"\"\"\n\n  if ligand_struc.num_residues(count_unresolved=True) > 1:\n    raise ValueError('ligand_struc %s has more than one residue.')\n  coords_by_atom_name = dict(zip(ligand_struc.atom_name, ligand_struc.coords))\n\n  ref_mol = rdkit_utils.sanitize_mol(\n      ref_mol,\n      sort_alphabetically=False,\n      remove_hydrogens=True,\n  )\n\n  mol = rd_chem.Mol(ref_mol)\n  mol.RemoveAllConformers()\n\n  atom_indices_to_remove = [\n      a.GetIdx()\n      for a in mol.GetAtoms()\n      if a.GetProp('atom_name') not in coords_by_atom_name\n  ]\n  editable_mol = rd_chem.EditableMol(mol)\n  # Remove indices from the largest to smallest, to avoid invalidating.\n  for atom_idx in atom_indices_to_remove[::-1]:\n    editable_mol.RemoveAtom(atom_idx)\n  mol = editable_mol.GetMol()\n\n  conformer = rd_chem.Conformer(mol.GetNumAtoms())\n  for atom_idx, atom in enumerate(mol.GetAtoms()):\n    atom_name = atom.GetProp('atom_name')\n    
coords = coords_by_atom_name[atom_name]\n    conformer.SetAtomPosition(atom_idx, coords.tolist())\n  mol.AddConformer(conformer)\n  try:\n    rd_chem.AssignStereochemistryFrom3D(mol)\n  except RuntimeError as e:\n    # Catch only this specific rdkit error.\n    if 'Cannot normalize a zero length vector' in str(e):\n      return None\n    else:\n      raise\n  return mol\n\n\ndef _maybe_mol_from_ccd(res_name: str) -> rd_chem.Mol | None:\n  \"\"\"Creates a Mol object from CCD information if res_name is in the CCD.\"\"\"\n  ccd = chemical_components.Ccd()\n  ccd_cif = ccd.get(res_name)\n  if not ccd_cif:\n    logging.warning('No ccd information for residue %s.', res_name)\n    return None\n  try:\n    mol = rdkit_utils.mol_from_ccd_cif(ccd_cif, force_parse=False)\n  except rdkit_utils.MolFromMmcifError as e:\n    logging.warning('Failed to create mol from ccd for %s: %s', res_name, e)\n    return None\n  if mol is None:\n    raise ValueError('Failed to create mol from ccd for %s.' % res_name)\n  mol = rdkit_utils.sanitize_mol(\n      mol,\n      sort_alphabetically=False,\n      remove_hydrogens=True,\n  )\n  return mol\n\n\ndef compare_chirality(\n    test_struc: structure.Structure,\n    ref_mol_by_chain: Mapping[str, rd_chem.Mol] | None = None,\n) -> dict[str, bool]:\n  \"\"\"Compares chirality of ligands in a structure with reference molecules.\n\n  We do not enforce that ligand atoms exactly match, only that the ligand atoms\n  and chiral centres are a subset of those in ref mol.\n\n  Args:\n    test_struc: The structure for whose ligands to match chirality.\n    ref_mol_by_chain: Optional dictionary mapping chain IDs to mol objects with\n      conformers to compare against. 
If this is not provided, the comparison is\n      to the corresponding ligands in the CCD if the ligand residue name is in\n      the CCD.\n\n  Returns:\n    Dictionary mapping chain id to whether chirality matches the ref mol.\n    Only single residue ligands where reference molecules are available are\n    compared.\n  \"\"\"\n  ref_mol_by_chain = ref_mol_by_chain or {}\n  test_struc = test_struc.filter_to_entity_type(ligand=True)\n  name = test_struc.name\n  chiral_match_by_chain_id = {}\n  for chain_id in test_struc.chains:\n    chain_struc = test_struc.filter(chain_id=chain_id)\n    # Only compare single-residue ligands.\n    if chain_struc.num_residues(count_unresolved=True) > 1:\n      logging.warning('%s: Chain %s has >1 residues. Skipping.', name, chain_id)\n      continue\n    if chain_id not in ref_mol_by_chain:\n      ref_mol = _maybe_mol_from_ccd(chain_struc.res_name[0])\n    else:\n      ref_mol = ref_mol_by_chain[chain_id]\n    if ref_mol is None:\n      logging.warning(\n          '%s: Ref mol is None for chain %s. Skipping.', name, chain_id\n      )\n      continue\n    mol = _mol_from_ligand_struc(\n        ligand_struc=chain_struc,\n        ref_mol=ref_mol,\n    )\n    if mol is None:\n      logging.warning(\n          '%s: Failed to create mol for chain %s. Skipping.', name, chain_id\n      )\n      continue\n    chiral_match_by_chain_id[chain_id] = _chiral_match(mol, ref_mol)\n  return chiral_match_by_chain_id\n"
  },
  {
    "path": "src/alphafold3/model/scoring/covalent_bond_cleaning.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Some methods to compute metrics for PTMs.\"\"\"\n\nimport collections\nfrom collections.abc import Mapping\nimport dataclasses\n\nfrom alphafold3 import structure\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.model.atom_layout import atom_layout\nimport numpy as np\n\n\n@dataclasses.dataclass(frozen=True)\nclass ResIdMapping:\n  old_res_ids: np.ndarray\n  new_res_ids: np.ndarray\n\n\ndef _count_symmetric_chains(struc: structure.Structure) -> Mapping[str, int]:\n  \"\"\"Returns a dict with each chain ID and count.\"\"\"\n  chain_res_name_sequence_from_chain_id = struc.chain_res_name_sequence(\n      include_missing_residues=True, fix_non_standard_polymer_res=False\n  )\n  counts_for_chain_res_name_sequence = collections.Counter(\n      chain_res_name_sequence_from_chain_id.values()\n  )\n  chain_symmetric_count = {}\n  for chain_id, chain_res_name in chain_res_name_sequence_from_chain_id.items():\n    chain_symmetric_count[chain_id] = counts_for_chain_res_name_sequence[\n        chain_res_name\n    ]\n  return chain_symmetric_count\n\n\ndef has_nonsymmetric_bonds_on_symmetric_polymer_chains(\n    struc: structure.Structure, polymer_ligand_bonds: atom_layout.AtomLayout\n) -> bool:\n  \"\"\"Returns true if nonsymmetric bonds found on polymer chains.\"\"\"\n  try:\n    _get_polymer_dim(polymer_ligand_bonds)\n  except ValueError:\n    return True\n  if 
_has_non_polymer_ligand_ptm_bonds(polymer_ligand_bonds):\n    return True\n  if _has_multiple_polymers_bonded_to_one_ligand(polymer_ligand_bonds):\n    return True\n  combined_struc, _ = _combine_polymer_ligand_ptm_chains(\n      struc, polymer_ligand_bonds\n  )\n  struc = struc.filter(chain_type=mmcif_names.POLYMER_CHAIN_TYPES)\n  combined_struc = combined_struc.filter(\n      chain_type=mmcif_names.POLYMER_CHAIN_TYPES\n  )\n  return _count_symmetric_chains(struc) != _count_symmetric_chains(\n      combined_struc\n  )\n\n\ndef _has_non_polymer_ligand_ptm_bonds(\n    polymer_ligand_bonds: atom_layout.AtomLayout,\n):\n  \"\"\"Checks if all bonds are between a polymer chain and a ligand chain type.\"\"\"\n  for start_chain_type, end_chain_type in polymer_ligand_bonds.chain_type:\n    if (\n        start_chain_type in mmcif_names.POLYMER_CHAIN_TYPES\n        and end_chain_type in mmcif_names.LIGAND_CHAIN_TYPES\n    ):\n      continue\n    elif (\n        start_chain_type in mmcif_names.LIGAND_CHAIN_TYPES\n        and end_chain_type in mmcif_names.POLYMER_CHAIN_TYPES\n    ):\n      continue\n    else:\n      return True\n  return False\n\n\ndef _combine_polymer_ligand_ptm_chains(\n    struc: structure.Structure,\n    polymer_ligand_bonds: atom_layout.AtomLayout,\n) -> tuple[structure.Structure, dict[tuple[str, str], ResIdMapping]]:\n  \"\"\"Combines the ptm polymer-ligand chains together.\n\n  This will prevent them from being permuted away from each other when chains\n  are matched to the ground truth. 
This function also returns the res_id mapping\n  from the separate ligand res_ids to their res_ids in the combined\n  polymer-ligand chain; this information is needed to later separate the\n  combined polymer-ligand chain.\n\n  Args:\n    struc: Structure to be modified.\n    polymer_ligand_bonds: AtomLayout with polymer-ligand bond info.\n\n  Returns:\n    A tuple of a Structure with each ptm polymer-ligand chain relabelled as one\n    chain and a dict from bond chain pair to the res_id mapping.\n  \"\"\"\n  if not _has_only_single_bond_from_each_chain(polymer_ligand_bonds):\n    if _has_multiple_ligands_bonded_to_one_polymer(polymer_ligand_bonds):\n      # For structures where a polymer chain is connected to multiple ligands,\n      # we need to sort the multiple bonds from the same chain by res_id to\n      # ensure that the combined polymer-ligand chain will always be the same\n      # when you have repeated symmetric polymer-ligand chains.\n      polymer_ligand_bonds = (\n          _sort_polymer_ligand_bonds_by_polymer_chain_and_res_id(\n              polymer_ligand_bonds\n          )\n      )\n    else:\n      raise ValueError(\n          'Code cannot handle multiple bonds from one chain unless'\n          ' its several ligands bonded to a polymer.'\n      )\n  res_id_mappings_for_bond_chain_pair = dict()\n  for (start_chain_id, end_chain_id), (start_chain_type, end_chain_type) in zip(\n      polymer_ligand_bonds.chain_id, polymer_ligand_bonds.chain_type\n  ):\n    poly_info, ligand_info = _get_polymer_and_ligand_chain_ids_and_types(\n        start_chain_id, end_chain_id, start_chain_type, end_chain_type\n    )\n    polymer_chain_id, polymer_chain_type = poly_info\n    ligand_chain_id, _ = ligand_info\n\n    # Join the ligand chain to the polymer chain.\n    ligand_res_ids = struc.filter(chain_id=ligand_chain_id).res_id\n    new_res_ids = ligand_res_ids + len(struc.all_residues[polymer_chain_id])\n    res_id_mappings_for_bond_chain_pair[(polymer_chain_id, 
ligand_chain_id)] = (\n        ResIdMapping(old_res_ids=ligand_res_ids, new_res_ids=new_res_ids)\n    )\n    chain_groups = []\n    chain_group_ids = []\n    chain_group_types = []\n    for chain_id, chain_type in zip(\n        struc.chains_table.id, struc.chains_table.type\n    ):\n      if chain_id == ligand_chain_id:\n        continue\n      elif chain_id == polymer_chain_id:\n        chain_groups.append([polymer_chain_id, ligand_chain_id])\n        chain_group_ids.append(polymer_chain_id)\n        chain_group_types.append(polymer_chain_type)\n      else:\n        chain_groups.append([chain_id])\n        chain_group_ids.append(chain_id)\n        chain_group_types.append(chain_type)\n\n    struc = struc.merge_chains(\n        chain_groups=chain_groups,\n        chain_group_ids=chain_group_ids,\n        chain_group_types=chain_group_types,\n    )\n\n  return struc, res_id_mappings_for_bond_chain_pair\n\n\ndef _has_only_single_bond_from_each_chain(\n    polymer_ligand_bonds: atom_layout.AtomLayout,\n) -> bool:\n  \"\"\"Checks that there is at most one bond from each chain.\"\"\"\n  chain_ids = []\n  for chains in polymer_ligand_bonds.chain_id:\n    chain_ids.extend(chains)\n  if len(chain_ids) != len(set(chain_ids)):\n    return False\n  return True\n\n\ndef _get_polymer_and_ligand_chain_ids_and_types(\n    start_chain_id: str,\n    end_chain_id: str,\n    start_chain_type: str,\n    end_chain_type: str,\n) -> tuple[tuple[str, str], tuple[str, str]]:\n  \"\"\"Finds polymer and ligand chain ids from chain types.\"\"\"\n  if (\n      start_chain_type in mmcif_names.POLYMER_CHAIN_TYPES\n      and end_chain_type in mmcif_names.LIGAND_CHAIN_TYPES\n  ):\n    return (start_chain_id, start_chain_type), (end_chain_id, end_chain_type)\n  elif (\n      start_chain_type in mmcif_names.LIGAND_CHAIN_TYPES\n      and end_chain_type in mmcif_names.POLYMER_CHAIN_TYPES\n  ):\n    return (end_chain_id, end_chain_type), (start_chain_id, start_chain_type)\n  else:\n    raise 
ValueError(\n        'This code only handles PTM-bonds from polymer chain to ligands.'\n    )\n\n\ndef _get_polymer_dim(polymer_ligand_bonds: atom_layout.AtomLayout) -> int:\n  \"\"\"Gets polymer dimension from the polymer-ligand bond layout.\"\"\"\n  start_chain_types = []\n  end_chain_types = []\n  for start_chain_type, end_chain_type in polymer_ligand_bonds.chain_type:\n    start_chain_types.append(start_chain_type)\n    end_chain_types.append(end_chain_type)\n  if set(start_chain_types).issubset(\n      set(mmcif_names.POLYMER_CHAIN_TYPES)\n  ) and set(end_chain_types).issubset(set(mmcif_names.LIGAND_CHAIN_TYPES)):\n    return 0\n  elif set(start_chain_types).issubset(mmcif_names.LIGAND_CHAIN_TYPES) and set(\n      end_chain_types\n  ).issubset(set(mmcif_names.POLYMER_CHAIN_TYPES)):\n    return 1\n  else:\n    raise ValueError(\n        'Polymer and ligand dimensions are not consistent within the structure.'\n    )\n\n\ndef _has_multiple_ligands_bonded_to_one_polymer(polymer_ligand_bonds):\n  \"\"\"Checks if there are multiple ligands bonded to one polymer.\"\"\"\n  polymer_dim = _get_polymer_dim(polymer_ligand_bonds)\n  polymer_chain_ids = [\n      chains[polymer_dim] for chains in polymer_ligand_bonds.chain_id\n  ]\n  if len(polymer_chain_ids) != len(set(polymer_chain_ids)):\n    return True\n  return False\n\n\ndef _has_multiple_polymers_bonded_to_one_ligand(polymer_ligand_bonds):\n  \"\"\"Checks if there are multiple polymer chains bonded to one ligand.\"\"\"\n  polymer_dim = _get_polymer_dim(polymer_ligand_bonds)\n  ligand_dim = 1 - polymer_dim\n  ligand_chain_ids = [\n      chains[ligand_dim] for chains in polymer_ligand_bonds.chain_id\n  ]\n  if len(ligand_chain_ids) != len(set(ligand_chain_ids)):\n    return True\n  return False\n\n\ndef _sort_polymer_ligand_bonds_by_polymer_chain_and_res_id(\n    polymer_ligand_bonds,\n):\n  \"\"\"Sorts bonds by res_id (for when a polymer chain has multiple bonded ligands).\"\"\"\n\n  polymer_dim = 
_get_polymer_dim(polymer_ligand_bonds)\n\n  polymer_chain_ids = [\n      chains[polymer_dim] for chains in polymer_ligand_bonds.chain_id\n  ]\n  polymer_res_ids = [res[polymer_dim] for res in polymer_ligand_bonds.res_id]\n\n  polymer_chain_and_res_id = zip(polymer_chain_ids, polymer_res_ids)\n  sorted_indices = [\n      idx\n      for idx, _ in sorted(\n          enumerate(polymer_chain_and_res_id), key=lambda x: x[1]\n      )\n  ]\n  return polymer_ligand_bonds[sorted_indices]\n"
  },
  {
    "path": "src/alphafold3/model/scoring/scoring.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Library of scoring methods of the model outputs.\"\"\"\n\nfrom alphafold3.model import protein_data_processing\nimport jax.numpy as jnp\nimport numpy as np\n\n\nArray = jnp.ndarray | np.ndarray\n\n\ndef pseudo_beta_fn(\n    aatype: Array,\n    dense_atom_positions: Array,\n    dense_atom_masks: Array,\n    is_ligand: Array | None = None,\n    use_jax: bool | None = True,\n) -> tuple[Array, Array] | Array:\n  \"\"\"Create pseudo beta atom positions and optionally mask.\n\n  Args:\n    aatype: [num_res] amino acid types.\n    dense_atom_positions: [num_res, NUM_DENSE, 3] vector of all atom positions.\n    dense_atom_masks: [num_res, NUM_DENSE] mask.\n    is_ligand: [num_res] flag if something is a ligand.\n    use_jax: whether to use jax for the computations.\n\n  Returns:\n    Pseudo beta dense atom positions and the corresponding mask.\n  \"\"\"\n  if use_jax:\n    xnp = jnp\n  else:\n    xnp = np\n\n  if is_ligand is None:\n    is_ligand = xnp.zeros_like(aatype)\n\n  pseudobeta_index_polymer = xnp.take(\n      protein_data_processing.RESTYPE_PSEUDOBETA_INDEX, aatype, axis=0\n  ).astype(xnp.int32)\n\n  pseudobeta_index = xnp.where(\n      is_ligand,\n      xnp.zeros_like(pseudobeta_index_polymer),\n      pseudobeta_index_polymer,\n  )\n\n  pseudo_beta = xnp.take_along_axis(\n      dense_atom_positions, pseudobeta_index[..., None, None], axis=-2\n  )\n  pseudo_beta = xnp.squeeze(pseudo_beta, axis=-2)\n\n  
pseudo_beta_mask = xnp.take_along_axis(\n      dense_atom_masks, pseudobeta_index[..., None], axis=-1\n  ).astype(xnp.float32)\n  pseudo_beta_mask = xnp.squeeze(pseudo_beta_mask, axis=-1)\n\n  return pseudo_beta, pseudo_beta_mask\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/cif_dict.pyi",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nfrom typing import Any, ClassVar, Iterable, Iterator, TypeVar, overload\n\nimport numpy as np\n\n_T = TypeVar('_T')\n\nclass CifDict:\n  class ItemView:\n    def __iter__(self) -> Iterator[tuple[str, list[str]]]: ...\n    def __len__(self) -> int: ...\n\n  class KeyView:\n    @overload\n    def __contains__(self, key: str) -> bool: ...\n    @overload\n    def __contains__(self, key: object) -> bool: ...\n    def __iter__(self) -> Iterator[str]: ...\n    def __len__(self) -> int: ...\n\n  class ValueView:\n    def __iter__(self) -> Iterator[list[str]]: ...\n    def __len__(self) -> int: ...\n\n  def __init__(self, d: dict[str, Iterable[str]]) -> None: ...\n  def copy_and_update(self, d: dict[str, Iterable[str]]) -> CifDict: ...\n  def extract_loop_as_dict(self, prefix: str, index: str) -> dict:\n    \"\"\"Extracts loop associated with a prefix from mmCIF data as a dict.\n\n    For instance for an mmCIF with these fields:\n    '_a.ix': ['1', '2', '3']\n    '_a.1': ['a.1.1', 'a.1.2', 'a.1.3']\n    '_a.2': ['a.2.1', 'a.2.2', 'a.2.3']\n\n    this function called with prefix='_a.', index='_a.ix' extracts:\n    {'1': {'a.ix': '1', 'a.1': 'a.1.1', 'a.2': 'a.2.1'}\n     '2': {'a.ix': '2', 'a.1': 'a.1.2', 'a.2': 'a.2.2'}\n     '3': {'a.ix': '3', 'a.1': 'a.1.3', 'a.2': 'a.2.3'}}\n\n    Args:\n      prefix: Prefix shared by each of the data items in the loop. 
The prefix\n        should include the trailing period.\n      index: Which item of loop data should serve as the key.\n\n    Returns:\n      Dict of dicts; each dict represents 1 entry from an mmCIF loop,\n      indexed by the index column.\n    \"\"\"\n\n  def extract_loop_as_list(self, prefix: str) -> list:\n    \"\"\"Extracts loop associated with a prefix from mmCIF data as a list.\n\n    Reference for loop_ in mmCIF:\n    http://mmcif.wwpdb.org/docs/tutorials/mechanics/pdbx-mmcif-syntax.html\n\n    For instance for an mmCIF with these fields:\n    '_a.1': ['a.1.1', 'a.1.2', 'a.1.3']\n    '_a.2': ['a.2.1', 'a.2.2', 'a.2.3']\n\n    this function called with prefix='_a.' extracts:\n    [{'_a.1': 'a.1.1', '_a.2': 'a.2.1'}\n     {'_a.1': 'a.1.2', '_a.2': 'a.2.2'}\n     {'_a.1': 'a.1.3', '_a.2': 'a.2.3'}]\n\n    Args:\n      prefix: Prefix shared by each of the data items in the loop. The prefix\n        should include the trailing period.\n\n    Returns:\n      A list of dicts; each dict represents 1 entry from an mmCIF loop.\n    \"\"\"\n\n  def get(self, key: str, default_value: _T = ...) -> list[str] | _T: ...\n  def get_array(\n      self, key: str, dtype: object = ..., gather: object = ...\n  ) -> np.ndarray:\n    \"\"\"Returns values looked up in dict converted to a NumPy array.\n\n    Args:\n      key: Key in dictionary.\n      dtype: Optional (default `object`) Specifies output dtype of array. One of\n        [object, np.{int,uint}{8,16,32,64} np.float{32,64}]. As with NumPy use\n        `object` to return a NumPy array of strings.\n      gather: Optional one of [slice, np.{int,uint}{32,64}] non-intermediate\n        version of get_array(key, dtype)[gather].\n\n    Returns:\n      A NumPy array of given dtype. An optimised equivalent to\n      np.array(cif[key]).astype(dtype).  With support of '.' 
being treated\n      as np.nan if dtype is one of np.float{32,64}.\n      Identical strings will all reference the same object to save space.\n\n    Raises:\n      KeyError - if key is not found.\n      TypeError - if dtype is not valid or supported.\n      ValueError - if string cannot convert to dtype.\n    \"\"\"\n\n  def get_data_name(self) -> str: ...\n  def items(self) -> CifDict.ItemView: ...\n  def keys(self) -> CifDict.KeyView: ...\n  def to_string(self) -> str: ...\n  def to_dict(self) -> dict[str, list[str]]: ...\n  def value_length(self, key: str) -> int: ...\n  def values(self) -> CifDict.ValueView: ...\n  def __bool__(self) -> bool: ...\n  def __contains__(self, key: str) -> bool: ...\n  def __getitem__(self, key: str) -> list[str]: ...\n  def __getstate__(self) -> tuple: ...\n  def __iter__(self) -> Iterator[str]: ...\n  def __len__(self) -> int: ...\n  def __setstate__(self, state: tuple) -> None: ...\n\ndef tokenize(cif_string: str) -> list[str]: ...\ndef split_line(line: str) -> list[str]: ...\ndef from_string(mmcif_string: str | bytes) -> CifDict: ...\ndef parse_multi_data_cif(cif_string: str | bytes) -> dict[str, CifDict]: ...\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/cif_dict_lib.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include \"alphafold3/parsers/cpp/cif_dict_lib.h\"\n\n#include <algorithm>\n#include <array>\n#include <cstddef>\n#include <iterator>\n#include <memory>\n#include <string>\n#include <tuple>\n#include <utility>\n#include <vector>\n\n#include \"absl/algorithm/container.h\"\n#include \"absl/container/btree_map.h\"\n#include \"absl/container/flat_hash_map.h\"\n#include \"absl/container/flat_hash_set.h\"\n#include \"absl/container/node_hash_map.h\"\n#include \"absl/log/check.h\"\n#include \"absl/status/status.h\"\n#include \"absl/status/statusor.h\"\n#include \"absl/strings/ascii.h\"\n#include \"absl/strings/match.h\"\n#include \"absl/strings/str_cat.h\"\n#include \"absl/strings/str_format.h\"\n#include \"absl/strings/str_join.h\"\n#include \"absl/strings/str_split.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/strings/strip.h\"\n\nnamespace alphafold3 {\nnamespace {\n\nbool IsQuote(const char symbol) { return symbol == '\\'' || symbol == '\"'; }\nbool IsWhitespace(const char symbol) { return symbol == ' ' || symbol == '\\t'; }\n\n// Splits line into tokens, returns whether successful.\nbool SplitLineInline(absl::string_view line,\n                     std::vector<absl::string_view>* tokens) {\n  // See https://www.iucr.org/resources/cif/spec/version1.1/cifsyntax\n  for (int i = 0, line_length = line.length(); i < line_length;) {\n    // Skip whitespace (spaces or tabs).\n    while (IsWhitespace(line[i])) 
{\n      if (++i == line_length) {\n        break;\n      }\n    }\n    if (i == line_length) {\n      break;\n    }\n\n    // Skip comments (from # until the end of the line). If # is a non-comment\n    // character, it must be inside a quoted token.\n    if (line[i] == '#') {\n      break;\n    }\n\n    int start_index;\n    int end_index;\n    if (IsQuote(line[i])) {\n      // Token in single or double quotes. CIF v1.1 specification considers a\n      // quote to be an opening quote only if it is at the beginning of a token.\n      // So e.g. A' B has tokens A' and B. Also, \"\"A\" is a token \"A.\n      const char quote_char = line[i++];\n      start_index = i;\n\n      // Find matching quote. The double loop is not strictly necessary, but\n      // optimises a bit better.\n      while (true) {\n        while (i < line_length && line[i] != quote_char) {\n          ++i;\n        }\n        if (i == line_length) {\n          // Reached the end of the line while still being inside a token.\n          return false;\n        }\n        if (i + 1 == line_length || IsWhitespace(line[i + 1])) {\n          break;\n        }\n        ++i;\n      }\n      end_index = i++;\n    } else {\n      // Non-quoted token. 
Read until reaching whitespace.\n      start_index = i++;\n      while (i < line_length && !IsWhitespace(line[i])) {\n        ++i;\n      }\n      end_index = i;\n    }\n\n    tokens->push_back(line.substr(start_index, end_index - start_index));\n  }\n\n  return true;\n}\n\nusing HeapStrings = std::vector<std::unique_ptr<std::string>>;\n\n// The majority of strings can be viewed on original cif_string.\n// heap_strings store multi-line tokens that have internal white-space stripped.\nabsl::StatusOr<std::vector<absl::string_view>> TokenizeInternal(\n    absl::string_view cif_string, HeapStrings* heap_strings) {\n  const std::vector<absl::string_view> lines = absl::StrSplit(cif_string, '\\n');\n  std::vector<absl::string_view> tokens;\n  // Heuristic: Most lines in an mmCIF are _atom_site lines with 21 tokens.\n  tokens.reserve(lines.size() * 21);\n  int line_num = 0;\n  while (line_num < lines.size()) {\n    auto line = absl::StripSuffix(lines[line_num], \"\\r\");\n    line_num++;\n\n    if (line.empty() || line[0] == '#') {\n      // Skip empty lines or lines that contain only comments.\n      continue;\n    } else if (line[0] == ';') {\n      // Leading whitespace on each line must be preserved while trailing\n      // whitespace may be stripped.\n      std::vector<absl::string_view> multiline_tokens;\n      // Strip the leading \";\".\n      multiline_tokens.push_back(\n          absl::StripTrailingAsciiWhitespace(line.substr(1)));\n      while (line_num < lines.size()) {\n        auto multiline = absl::StripTrailingAsciiWhitespace(lines[line_num]);\n        line_num++;\n        if (!multiline.empty() && multiline[0] == ';') {\n          break;\n        } else if (line_num == lines.size()) {\n          return absl::InvalidArgumentError(\n              \"Last multiline token is not terminated by a semicolon.\");\n        }\n        multiline_tokens.push_back(multiline);\n      }\n      heap_strings->push_back(\n          
std::make_unique<std::string>(absl::StrJoin(multiline_tokens, \"\\n\")));\n      tokens.emplace_back(*heap_strings->back());\n    } else {\n      if (!SplitLineInline(line, &tokens)) {\n        return absl::InvalidArgumentError(\n            absl::StrCat(\"Line ended with quote open: \", line));\n      }\n    }\n  }\n  return tokens;\n}\n\n// Returns whether the token doesn't need any quoting. This is true if the token\n// isn't empty and contains only safe characters [A-Za-z0-9.?-].\nbool IsTrivialToken(const absl::string_view value) {\n  if (value.empty()) {\n    return false;\n  }\n\n  return std::all_of(value.begin(), value.end(), [](char c) {\n    return absl::ascii_isalnum(c) || c == '.' || c == '?' || c == '-';\n  });\n}\n\n// Returns whether the token needs to be a multiline token. This happens if it\n// has a newline or both single and double quotes.\nbool IsMultiLineToken(const absl::string_view value) {\n  bool has_single_quotes = false;\n  bool has_double_quotes = false;\n  for (const char c : value) {\n    if (c == '\\n') {\n      return true;\n    } else if (c == '\\'') {\n      has_single_quotes = true;\n    } else if (c == '\"') {\n      has_double_quotes = true;\n    }\n  }\n  return has_single_quotes && has_double_quotes;\n}\n\nabsl::string_view GetEscapeQuote(const absl::string_view value) {\n  // Empty values should not happen, but if so, they should be quoted.\n  if (value.empty()) {\n    return \"\\\"\";\n  }\n\n  // The value must not start with one of these CIF keywords.\n  if (absl::StartsWithIgnoreCase(value, \"data_\") ||\n      absl::StartsWithIgnoreCase(value, \"loop_\") ||\n      absl::StartsWithIgnoreCase(value, \"save_\") ||\n      absl::StartsWithIgnoreCase(value, \"stop_\") ||\n      absl::StartsWithIgnoreCase(value, \"global_\")) {\n    return \"\\\"\";\n  }\n\n  // The first character must not be a special character.\n  const char first = value.front();\n  if (first == '_' || first == '#' || first == '$' || first == '[' ||\n      
first == ']' || first == ';') {\n    return \"\\\"\";\n  }\n\n  // No quotes or whitespace allowed inside. Rare case when both double and\n  // single quotes are present is handled by IsMultiLineToken.\n  bool use_double_quote = true;\n  bool use_single_quote = true;\n  bool needs_quote = false;\n  for (const char c : value) {\n    if (c == ' ' || c == '\\t') {\n      needs_quote = true;\n    } else if (c == '\"') {\n      needs_quote = true;\n      use_double_quote = false;\n    } else if (c == '\\'') {\n      needs_quote = true;\n      use_single_quote = false;\n    }\n  }\n  if (needs_quote && use_double_quote) {\n    return \"\\\"\";\n  } else if (needs_quote && use_single_quote) {\n    return \"'\";\n  }\n  return \"\";\n}\n\nint RecordIndex(absl::string_view record) {\n  if (record == \"_entry\") {\n    return 0;  // _entry is always first.\n  }\n  if (record == \"_atom_site\") {\n    return 2;  // _atom_site is always last.\n  }\n  return 1;  // other records are between _entry and _atom_site.\n}\n\nstruct RecordOrder {\n  using is_transparent = void;  // Enable heterogeneous lookup.\n  bool operator()(absl::string_view lhs, absl::string_view rhs) const {\n    std::size_t lhs_index = RecordIndex(lhs);\n    std::size_t rhs_index = RecordIndex(rhs);\n    return std::tie(lhs_index, lhs) < std::tie(rhs_index, rhs);\n  }\n};\n\n// Make sure the _atom_site loop columns are sorted in the PDB-standard way.\nconstexpr absl::string_view kAtomSiteSortOrder[] = {\n    \"_atom_site.group_PDB\",\n    \"_atom_site.id\",\n    \"_atom_site.type_symbol\",\n    \"_atom_site.label_atom_id\",\n    \"_atom_site.label_alt_id\",\n    \"_atom_site.label_comp_id\",\n    \"_atom_site.label_asym_id\",\n    \"_atom_site.label_entity_id\",\n    \"_atom_site.label_seq_id\",\n    \"_atom_site.pdbx_PDB_ins_code\",\n    \"_atom_site.Cartn_x\",\n    \"_atom_site.Cartn_y\",\n    \"_atom_site.Cartn_z\",\n    \"_atom_site.occupancy\",\n    \"_atom_site.B_iso_or_equiv\",\n    
\"_atom_site.pdbx_formal_charge\",\n    \"_atom_site.auth_seq_id\",\n    \"_atom_site.auth_comp_id\",\n    \"_atom_site.auth_asym_id\",\n    \"_atom_site.auth_atom_id\",\n    \"_atom_site.pdbx_PDB_model_num\",\n};\n\nsize_t AtomSiteIndex(absl::string_view atom_site) {\n  return std::distance(std::begin(kAtomSiteSortOrder),\n                       absl::c_find(kAtomSiteSortOrder, atom_site));\n}\n\nstruct AtomSiteOrder {\n  bool operator()(absl::string_view lhs, absl::string_view rhs) const {\n    auto lhs_index = AtomSiteIndex(lhs);\n    auto rhs_index = AtomSiteIndex(rhs);\n    return std::tie(lhs_index, lhs) < std::tie(rhs_index, rhs);\n  }\n};\n\nclass Column {\n public:\n  Column(absl::string_view key, const std::vector<std::string>* values)\n      : key_(key), values_(values) {\n    int max_value_length = 0;\n    for (size_t i = 0; i < values->size(); ++i) {\n      absl::string_view value = (*values)[i];\n      if (IsTrivialToken(value)) {\n        // Shortcut for the most common cases where no quoting/multiline needed.\n        max_value_length = std::max<int>(max_value_length, value.size());\n        continue;\n      } else if (IsMultiLineToken(value)) {\n        values_with_newlines_.insert(i);\n      } else {\n        absl::string_view quote = GetEscapeQuote(value);\n        if (!quote.empty()) {\n          values_with_quotes_[i] = quote;\n        }\n        max_value_length =\n            std::max<int>(max_value_length, value.size() + quote.size() * 2);\n      }\n    }\n    max_value_length_ = max_value_length;\n  }\n\n  absl::string_view key() const { return key_; }\n\n  const std::vector<std::string>* values() const { return values_; }\n\n  int max_value_length() const { return max_value_length_; }\n\n  bool has_newlines(size_t index) const {\n    return values_with_newlines_.contains(index);\n  }\n\n  absl::string_view quote(size_t index) const {\n    if (auto it = values_with_quotes_.find(index);\n        it != values_with_quotes_.end()) {\n      
return it->second;\n    }\n    return \"\";\n  }\n\n private:\n  absl::string_view key_;\n  const std::vector<std::string>* values_;\n  int max_value_length_;\n  // Values with newlines or quotes are very rare in a typical CIF file.\n  absl::flat_hash_set<size_t> values_with_newlines_;\n  absl::flat_hash_map<size_t, absl::string_view> values_with_quotes_;\n};\n\nstruct GroupedKeys {\n  std::vector<Column> grouped_columns;\n  int max_key_length;\n  int value_size;\n};\n\nabsl::Status CheckLoopColumnSizes(int num_loop_keys, int num_loop_values) {\n  if ((num_loop_keys > 0) && (num_loop_values % num_loop_keys != 0)) {\n    return absl::InvalidArgumentError(absl::StrFormat(\n        \"The number of values (%d) in a loop is not a multiple of the \"\n        \"number of the loop's columns (%d)\",\n        num_loop_values, num_loop_keys));\n  }\n  return absl::OkStatus();\n}\n\n}  // namespace\n\nabsl::StatusOr<CifDict> CifDict::FromString(absl::string_view cif_string) {\n  CifDict::Dict cif;\n\n  bool loop_flag = false;\n  absl::string_view key;\n\n  HeapStrings heap_strings;\n  auto tokens = TokenizeInternal(cif_string, &heap_strings);\n  if (!tokens.ok()) {\n    return tokens.status();\n  }\n\n  if (tokens->empty()) {\n    return absl::InvalidArgumentError(\"The CIF file must not be empty.\");\n  }\n\n  // The first token should be data_XXX. Split into key = data, value = XXX.\n  absl::string_view first_token = tokens->front();\n  if (!absl::ConsumePrefix(&first_token, \"data_\")) {\n    return absl::InvalidArgumentError(\n        \"The CIF file does not start with the data_ field.\");\n  }\n  if (first_token.empty()) {\n    return absl::InvalidArgumentError(\n        \"The CIF file does not contain a data block name.\");\n  }\n  cif[\"data_\"].emplace_back(first_token);\n\n  // Counters for CIF loop_ regions.\n  int loop_token_index = 0;\n  int num_loop_keys = 0;\n  // Loops have usually O(10) columns but could have up to O(10^6) rows. 
It is\n  // therefore wasteful to look up the cif vector where to add a loop value\n  // since that means doing `columns * rows` map lookups. If we save pointers to\n  // these loop column fields instead, we need only 1 cif lookup per column.\n  std::vector<std::vector<std::string>*> loop_column_values;\n\n  // Skip the first element since we already processed it above.\n  for (auto token_itr = tokens->begin() + 1; token_itr != tokens->end();\n       ++token_itr) {\n    auto token = *token_itr;\n    if (absl::EqualsIgnoreCase(token, \"loop_\")) {\n      // A new loop started, check the previous loop and get rid of its data.\n      absl::Status loop_status =\n          CheckLoopColumnSizes(num_loop_keys, loop_token_index);\n      if (!loop_status.ok()) {\n        return loop_status;\n      }\n      loop_flag = true;\n      loop_column_values.clear();\n      loop_token_index = 0;\n      num_loop_keys = 0;\n      continue;\n    } else if (loop_flag) {\n      // The second condition checks we are in the first column. Some mmCIF\n      // files (e.g. 4q9r) have values in later columns starting with an\n      // underscore and we don't want to read these as keys.\n      int token_column_index =\n          num_loop_keys == 0 ? 0 : loop_token_index % num_loop_keys;\n      if (token_column_index == 0 && !token.empty() && token[0] == '_') {\n        if (loop_token_index > 0) {\n          // We are out of the loop.\n          loop_flag = false;\n        } else {\n          // We are in the keys (column names) section of the loop.\n          auto [it, inserted] = cif.try_emplace(token);\n          if (!inserted) {\n            return absl::InvalidArgumentError(\n                absl::StrCat(\"Duplicate loop key: '\", token, \"'\"));\n          }\n          auto& columns = it->second;\n          columns.clear();\n\n          // Heuristic: _atom_site is typically the largest table in an mmCIF\n          // with ~16 columns. 
Make sure we reserve enough space for its values.\n          if (absl::StartsWith(token, \"_atom_site.\")) {\n            columns.reserve(tokens->size() / 20);\n          }\n\n          // Save the pointer to the loop column values.\n          loop_column_values.push_back(&columns);\n          num_loop_keys += 1;\n          continue;\n        }\n      } else {\n        // We are in the values section of the loop. We have a pointer to the\n        // loops' values, add the new token in there.\n        if (token_column_index >= loop_column_values.size()) {\n          return absl::InvalidArgumentError(\n              absl::StrCat(\"Too many columns at: '\", token,\n                           \"' at column index: \", token_column_index,\n                           \" expected at most: \", loop_column_values.size()));\n        }\n        loop_column_values[token_column_index]->emplace_back(token);\n        loop_token_index++;\n        continue;\n      }\n    }\n    if (key.empty()) {\n      key = token;\n      if (!absl::StartsWith(key, \"_\")) {\n        return absl::InvalidArgumentError(\n            absl::StrCat(\"Key '\", key, \"' does not start with an underscore.\"));\n      }\n    } else {\n      auto [it, inserted] = cif.try_emplace(key);\n      if (!inserted) {\n        return absl::InvalidArgumentError(\n            absl::StrCat(\"Duplicate key: '\", key, \"'\"));\n      }\n      (it->second).emplace_back(token);\n      key = \"\";\n    }\n  }\n  absl::Status loop_status =\n      CheckLoopColumnSizes(num_loop_keys, loop_token_index);\n  if (!loop_status.ok()) {\n    return loop_status;\n  }\n  return CifDict(std::move(cif));\n}\n\nabsl::StatusOr<std::string> CifDict::ToString() const {\n  std::string output;\n\n  absl::string_view data_name;\n  // Check that the data_ field exists.\n  if (auto name_it = (*dict_).find(\"data_\");\n      name_it == (*dict_).end() || name_it->second.empty()) {\n    return absl::InvalidArgumentError(\n        \"The CIF must 
contain a valid name for this data block in the special \"\n        \"data_ field.\");\n  } else {\n    data_name = name_it->second.front();\n  }\n\n  if (absl::c_any_of(data_name,\n                     [](char i) { return absl::ascii_isspace(i); })) {\n    return absl::InvalidArgumentError(absl::StrFormat(\n        \"The CIF data block name must not contain any whitespace characters, \"\n        \"got '%s'.\",\n        data_name));\n  }\n  absl::StrAppend(&output, \"data_\", data_name, \"\\n#\\n\");\n\n  // Group keys by their prefix. Use btree_map to iterate in alphabetical order,\n  // but with some keys being placed at the end (e.g. _atom_site).\n  absl::btree_map<std::string, GroupedKeys, RecordOrder> grouped_keys;\n  for (const auto& [key, values] : *dict_) {\n    if (key == \"data_\") {\n      continue;  // Skip the special data_ key, we are already done with it.\n    }\n    const std::pair<absl::string_view, absl::string_view> key_parts =\n        absl::StrSplit(key, absl::MaxSplits('.', 1));\n    const absl::string_view key_prefix = key_parts.first;\n    auto [it, inserted] = grouped_keys.emplace(key_prefix, GroupedKeys{});\n    GroupedKeys& grouped_key = it->second;\n    grouped_key.grouped_columns.push_back(Column(key, &values));\n    if (inserted) {\n      grouped_key.max_key_length = key.length();\n      grouped_key.value_size = values.size();\n    } else {\n      grouped_key.max_key_length =\n          std::max<int>(key.length(), grouped_key.max_key_length);\n      if (grouped_key.value_size != values.size()) {\n        return absl::InvalidArgumentError(\n            absl::StrFormat(\"Values for key %s have different length (%d) than \"\n                            \"the other values with the same key prefix (%d).\",\n                            key, values.size(), grouped_key.value_size));\n      }\n    }\n  }\n\n  for (auto& [key_prefix, group_info] : grouped_keys) {\n    if (key_prefix == \"_atom_site\") {\n      // Make sure we sort the _atom_site 
loop in the standard way.\n      absl::c_sort(group_info.grouped_columns,\n                   [](const Column& lhs, const Column& rhs) {\n                     return AtomSiteOrder{}(lhs.key(), rhs.key());\n                   });\n    } else {\n      // Make the key ordering within a key group deterministic.\n      absl::c_sort(group_info.grouped_columns,\n                   [](const Column& lhs, const Column& rhs) {\n                     return lhs.key() < rhs.key();\n                   });\n    }\n\n    // Force `_atom_site` field to always be a loop. This resolves issues with\n    // third party mmCIF parsers such as OpenBabel which always expect a loop\n    // even when there is only a single atom present.\n    if (group_info.value_size == 1 && key_prefix != \"_atom_site\") {\n      // Plain key-value pairs, output them as they are.\n      for (const Column& grouped_column : group_info.grouped_columns) {\n        int width = group_info.max_key_length + 1;\n        size_t start_pos = output.size();\n        output.append(width, ' ');\n        auto out_it = output.begin() + start_pos;\n        absl::c_copy(grouped_column.key(), out_it);\n        // Append the value, handle multi-line/quoting.\n        absl::string_view value = grouped_column.values()->front();\n        if (grouped_column.has_newlines(0)) {\n          absl::StrAppend(&output, \"\\n;\", value, \"\\n;\\n\");  // Multi-line value.\n        } else {\n          const absl::string_view quote_char = grouped_column.quote(0);\n          absl::StrAppend(&output, quote_char, value, quote_char, \"\\n\");\n        }\n      }\n    } else {\n      // CIF loop. Output the column names, then the rows with data.\n      absl::StrAppend(&output, \"loop_\\n\");\n      for (Column& grouped_column : group_info.grouped_columns) {\n        absl::StrAppend(&output, grouped_column.key(), \"\\n\");\n      }\n      // Write the loop values, line by line. 
This is the most expensive part\n      // since this path is taken to write the entire atom site table which has\n      // about 20 columns, but thousands of rows.\n      for (int i = 0; i < group_info.value_size; i++) {\n        for (int column_index = 0;\n             column_index < group_info.grouped_columns.size(); ++column_index) {\n          const Column& grouped_column =\n              group_info.grouped_columns[column_index];\n          const absl::string_view value = (*grouped_column.values())[i];\n          if (grouped_column.has_newlines(i)) {\n            // Multi-line. This is a very rarely taken path.\n            if (column_index == 0) {\n              // No extra newline before leading ;, already inserted.\n              absl::StrAppend(&output, \";\", value, \"\\n;\\n\");\n            } else if (column_index == group_info.grouped_columns.size() - 1) {\n              // No extra newline after trailing ;, will be inserted.\n              absl::StrAppend(&output, \"\\n;\", value, \"\\n;\");\n            } else {\n              absl::StrAppend(&output, \"\\n;\", value, \"\\n;\\n\");\n            }\n          } else {\n            size_t start_pos = output.size();\n            output.append(grouped_column.max_value_length() + 1, ' ');\n            auto out_it = output.begin() + start_pos;\n            absl::string_view quote = grouped_column.quote(i);\n            if (!quote.empty()) {\n              out_it = absl::c_copy(quote, out_it);\n              out_it = absl::c_copy(value, out_it);\n              absl::c_copy(quote, out_it);\n            } else {\n              absl::c_copy(value, out_it);\n            }\n          }\n        }\n        absl::StrAppend(&output, \"\\n\");\n      }\n    }\n    absl::StrAppend(&output, \"#\\n\");  // Comment token after every key group.\n  }\n  return output;\n}\n\nabsl::StatusOr<\n    std::vector<absl::flat_hash_map<absl::string_view, absl::string_view>>>\nCifDict::ExtractLoopAsList(absl::string_view prefix) const 
{\n  std::vector<absl::string_view> column_names;\n  std::vector<std::vector<absl::string_view>> column_data;\n\n  for (const auto& element : *dict_) {\n    if (absl::StartsWith(element.first, prefix)) {\n      column_names.emplace_back(element.first);\n      auto& cells = column_data.emplace_back();\n      cells.insert(cells.begin(), element.second.begin(), element.second.end());\n    }\n  }\n  // Make sure all columns have the same number of rows.\n  const std::size_t num_rows = column_data.empty() ? 0 : column_data[0].size();\n  for (const auto& column : column_data) {\n    if (column.size() != num_rows) {\n      return absl::InvalidArgumentError(absl::StrCat(\n          GetDataName(),\n          \": Columns do not have the same number of rows for prefix: '\", prefix,\n          \"'. One possible reason could be not including the trailing dot, \"\n          \"e.g. '_atom_site.'.\"));\n    }\n  }\n\n  std::vector<absl::flat_hash_map<absl::string_view, absl::string_view>> result;\n  result.reserve(num_rows);\n  CHECK_EQ(column_names.size(), column_data.size());\n  for (std::size_t row_index = 0; row_index < num_rows; ++row_index) {\n    auto& row_dict = result.emplace_back();\n    row_dict.reserve(column_names.size());\n    for (int col_index = 0; col_index < column_names.size(); ++col_index) {\n      row_dict[column_names[col_index]] = column_data[col_index][row_index];\n    }\n  }\n  return result;\n}\n\nabsl::StatusOr<absl::flat_hash_map<\n    absl::string_view,\n    absl::flat_hash_map<absl::string_view, absl::string_view>>>\nCifDict::ExtractLoopAsDict(absl::string_view prefix,\n                           absl::string_view index) const {\n  if (!absl::StartsWith(index, prefix)) {\n    return absl::InvalidArgumentError(\n        absl::StrCat(GetDataName(), \": The loop index '\", index,\n                     \"' must start with the loop prefix '\", prefix, \"'.\"));\n  }\n  absl::flat_hash_map<absl::string_view,\n                      
absl::flat_hash_map<absl::string_view, absl::string_view>>\n      result;\n  auto loop_as_list = ExtractLoopAsList(prefix);\n  if (!loop_as_list.ok()) {\n    return loop_as_list.status();\n  }\n  result.reserve(loop_as_list->size());\n  for (auto& entry : *loop_as_list) {\n    if (const auto it = entry.find(index); it != entry.end()) {\n      result[it->second] = entry;\n    } else {\n      return absl::InvalidArgumentError(absl::StrCat(\n          GetDataName(), \": The index column '\", index,\n          \"' could not be found in the loop with prefix '\", prefix, \"'.\"));\n    }\n  }\n  return result;\n}\n\nabsl::StatusOr<std::vector<std::string>> Tokenize(\n    absl::string_view cif_string) {\n  HeapStrings heap_strings;\n  auto tokens = TokenizeInternal(cif_string, &heap_strings);\n  if (!tokens.ok()) {\n    return tokens.status();\n  }\n  return std::vector<std::string>(tokens->begin(), tokens->end());\n}\n\nabsl::StatusOr<std::vector<absl::string_view>> SplitLine(\n    absl::string_view line) {\n  std::vector<absl::string_view> tokens;\n  if (!SplitLineInline(line, &tokens)) {\n    return absl::InvalidArgumentError(\n        absl::StrCat(\"Line ended with quote open: \", line));\n  }\n  return tokens;\n}\n\nabsl::StatusOr<absl::flat_hash_map<std::string, CifDict>> ParseMultiDataCifDict(\n    absl::string_view cif_string) {\n  absl::flat_hash_map<std::string, CifDict> mapping;\n  constexpr absl::string_view delimitor = \"data_\";\n  // Check cif_string starts with correct offset.\n  if (!cif_string.empty() && !absl::StartsWith(cif_string, delimitor)) {\n    return absl::InvalidArgumentError(\n        \"Invalid format. 
MultiDataCifDict must start with 'data_'\");\n  }\n  for (absl::string_view data_block :\n       absl::StrSplit(cif_string, delimitor, absl::SkipEmpty())) {\n    absl::string_view block_with_delimitor(\n        data_block.data() - delimitor.size(),\n        data_block.size() + delimitor.size());\n    absl::StatusOr<CifDict> parsed_block =\n        CifDict::FromString(block_with_delimitor);\n    if (!parsed_block.ok()) {\n      return parsed_block.status();\n    }\n    absl::string_view data_name = parsed_block->GetDataName();\n    mapping[data_name] = *std::move(parsed_block);\n  }\n\n  return mapping;\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/cif_dict_lib.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n// A C++ implementation of a CIF parser. For the format specification see\n// https://www.iucr.org/resources/cif/spec/version1.1/cifsyntax\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_CIF_DICT_LIB_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_CIF_DICT_LIB_H_\n\n#include <cstddef>\n#include <memory>\n#include <string>\n#include <utility>\n#include <vector>\n\n#include \"absl/container/flat_hash_map.h\"\n#include \"absl/container/node_hash_map.h\"\n#include \"absl/status/statusor.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/types/span.h\"\n\nnamespace alphafold3 {\n\nclass CifDict {\n public:\n  // Use absl::node_hash_map since it guarantees pointer stability.\n  using Dict = absl::node_hash_map<std::string, std::vector<std::string>>;\n\n  CifDict() = default;\n\n  explicit CifDict(Dict dict)\n      : dict_(std::make_shared<const Dict>(std::move(dict))) {}\n\n  // Converts a CIF string into a dictionary mapping each CIF field to a list of\n  // values that field contains.\n  static absl::StatusOr<CifDict> FromString(absl::string_view cif_string);\n\n  // Converts the CIF into a string that is a valid CIF file.\n  absl::StatusOr<std::string> ToString() const;\n\n  // Extracts loop associated with a prefix from mmCIF data as a list.\n  // Reference for loop_ in mmCIF:\n  // http://mmcif.wwpdb.org/docs/tutorials/mechanics/pdbx-mmcif-syntax.html\n  // Args:\n  // prefix: Prefix shared by 
each of the data items in the loop.\n  //   e.g. '_entity_poly_seq.', where the data items are _entity_poly_seq.num,\n  //   _entity_poly_seq.mon_id. Should include the trailing period.\n  //\n  // Returns a list of dicts; each dict represents 1 entry from an mmCIF loop.\n  // Lifetime of string_views tied to this.\n  absl::StatusOr<\n      std::vector<absl::flat_hash_map<absl::string_view, absl::string_view>>>\n  ExtractLoopAsList(absl::string_view prefix) const;\n\n  // Extracts loop associated with a prefix from mmCIF data as a dictionary.\n  // Args:\n  // prefix: Prefix shared by each of the data items in the loop.\n  //   e.g. '_entity_poly_seq.', where the data items are _entity_poly_seq.num,\n  //   _entity_poly_seq.mon_id. Should include the trailing period.\n  // index: Which item of loop data should serve as the key.\n  //\n  // Returns a dict of dicts; each dict represents 1 entry from an mmCIF loop,\n  // indexed by the index column.\n  // Lifetime of string_views tied to this.\n  absl::StatusOr<absl::flat_hash_map<\n      absl::string_view,\n      absl::flat_hash_map<absl::string_view, absl::string_view>>>\n  ExtractLoopAsDict(absl::string_view prefix, absl::string_view index) const;\n\n  // Returns value at key if present or an empty list.\n  absl::Span<const std::string> operator[](absl::string_view key) const {\n    auto it = dict_->find(key);\n    if (it != dict_->end()) {\n      return it->second;\n    }\n    return {};\n  }\n\n  // Returns boolean of whether dict contains key.\n  bool Contains(absl::string_view key) const { return dict_->contains(key); }\n\n  // Returns number of values for the given key if present, 0 otherwise.\n  size_t ValueLength(absl::string_view key) const {\n    return (*this)[key].size();\n  }\n\n  // Returns the size of the underlying dictionary.\n  std::size_t Length() { return dict_->size(); }\n\n  // Creates a copy of this CifDict object that will contain the original values\n  // but only if not updated by the given 
dictionary.\n  // E.g. if the CifDict = {a: [a1, a2], b: [b1]} and other = {a: [x], c: [z]},\n  // you will get {a: [x], b: [b1], c: [z]}.\n  CifDict CopyAndUpdate(Dict other) const {\n    other.insert(dict_->begin(), dict_->end());\n    return CifDict(std::move(other));\n  }\n\n  // Returns the value of the special CIF data_ field.\n  absl::string_view GetDataName() const {\n    // The data_ element has to be present by construction.\n    if (auto it = dict_->find(\"data_\");\n        it != dict_->end() && !it->second.empty()) {\n      return it->second.front();\n    } else {\n      return \"\";\n    }\n  }\n\n  const std::shared_ptr<const Dict>& dict() const { return dict_; }\n\n private:\n  std::shared_ptr<const Dict> dict_;\n};\n\n// Tokenizes a CIF string into a list of string tokens. This is more involved\n// than just a simple split on whitespace as CIF allows comments and quoting.\nabsl::StatusOr<std::vector<std::string>> Tokenize(absl::string_view cif_string);\n\n// Tokenizes a single line of a CIF string.\nabsl::StatusOr<std::vector<absl::string_view>> SplitLine(\n    absl::string_view line);\n\n// Parses a CIF string with multiple data records and returns a mapping from\n// record names to CifDict objects. For instance, the following CIF string:\n//\n// data_001\n// _foo bar\n//\n// data_002\n// _foo baz\n//\n// will be parsed as:\n// {'001': CifDict({'_foo': ['bar']}),\n//  '002': CifDict({'_foo': ['baz']})}\nabsl::StatusOr<absl::flat_hash_map<std::string, CifDict>> ParseMultiDataCifDict(\n    absl::string_view cif_string);\n\n}  // namespace alphafold3\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_CIF_DICT_LIB_H_\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/cif_dict_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <Python.h>\n\n#include <cstddef>\n#include <cstdint>\n#include <cstring>\n#include <limits>\n#include <memory>\n#include <string>\n#include <type_traits>\n#include <utility>\n#include <vector>\n\n#include \"numpy/ndarrayobject.h\"\n#include \"numpy/ndarraytypes.h\"\n#include \"numpy/npy_common.h\"\n#include \"absl/base/no_destructor.h\"\n#include \"absl/container/flat_hash_map.h\"\n#include \"absl/status/status.h\"\n#include \"absl/status/statusor.h\"\n#include \"absl/strings/numbers.h\"\n#include \"absl/strings/str_cat.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/types/span.h\"\n#include \"alphafold3/parsers/cpp/cif_dict_lib.h\"\n#include \"pybind11/attr.h\"\n#include \"pybind11/cast.h\"\n#include \"pybind11/gil.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11/pytypes.h\"\n#include \"pybind11/stl.h\"\n\nnamespace alphafold3 {\nnamespace {\nnamespace py = pybind11;\n\ntemplate <typename Item, typename ForEach>\nbool GatherArray(size_t num_dims, npy_intp* shape_array, npy_intp* stride_array,\n                 const char* data, absl::Span<const std::string> values,\n                 ForEach&& for_each_cb) {\n  if (num_dims == 1) {\n    const npy_intp shape = shape_array[0];\n    const npy_intp stride = stride_array[0];\n    for (size_t i = 0; i < shape; ++i) {\n      Item index;\n      std::memcpy(&index, data + stride * i, sizeof(Item));\n      if (index < 0 || index >= 
values.size()) {\n        PyErr_SetString(PyExc_IndexError,\n                        absl::StrCat(\"index \", index,\n                                     \" is out of bounds for column with size \",\n                                     values.size())\n                            .c_str());\n        return false;\n      }\n      if (!for_each_cb(values[index])) {\n        return false;\n      }\n    }\n  } else if (num_dims == 0) {\n    Item index;\n    std::memcpy(&index, data, sizeof(Item));\n    if (index < 0 || index >= values.size()) {\n      PyErr_SetString(\n          PyExc_IndexError,\n          absl::StrCat(\"index \", index,\n                       \" is out of bounds for column with size \", values.size())\n              .c_str());\n      return false;\n    }\n    if (!for_each_cb(values[index])) {\n      return false;\n    }\n  } else {\n    const npy_intp shape = shape_array[0];\n    const npy_intp stride = stride_array[0];\n    for (size_t i = 0; i < shape; ++i) {\n      if (!GatherArray<Item>(num_dims - 1, shape_array + 1, stride_array + 1,\n                             data + stride * i, values, for_each_cb)) {\n        return false;\n      }\n    }\n  }\n  return true;\n}\n\ntemplate <typename Size, typename ForEach>\nbool Gather(PyObject* gather, absl::Span<const std::string> values,\n            Size&& size_cb, ForEach&& for_each_cb) {\n  if (gather == Py_None) {\n    npy_intp dim = static_cast<npy_intp>(values.size());\n    if (!size_cb(absl::MakeSpan(&dim, 1))) {\n      return false;\n    }\n    for (const std::string& v : values) {\n      if (!for_each_cb(v)) {\n        return false;\n      }\n    }\n    return true;\n  }\n  if (PySlice_Check(gather)) {\n    Py_ssize_t start, stop, step, slice_length;\n    if (PySlice_GetIndicesEx(gather, values.size(), &start, &stop, &step,\n                             &slice_length) != 0) {\n      return false;\n    }\n    npy_intp dim = static_cast<npy_intp>(slice_length);\n    if 
(!size_cb(absl::MakeSpan(&dim, 1))) {\n      return false;\n    }\n    for (size_t i = 0; i < slice_length; ++i) {\n      if (!for_each_cb(values[start + i * step])) {\n        return false;\n      }\n    }\n    return true;\n  }\n  if (PyArray_Check(gather)) {\n    PyArrayObject* gather_array = reinterpret_cast<PyArrayObject*>(gather);\n    auto shape =\n        absl::MakeSpan(PyArray_DIMS(gather_array), PyArray_NDIM(gather_array));\n    switch (PyArray_TYPE(gather_array)) {\n      case NPY_INT16:\n        if (!size_cb(shape)) {\n          return false;\n        }\n        return GatherArray<std::int16_t>(shape.size(), shape.data(),\n                                         PyArray_STRIDES(gather_array),\n                                         PyArray_BYTES(gather_array), values,\n                                         std::forward<ForEach>(for_each_cb));\n      case NPY_UINT16:\n        if (!size_cb(shape)) {\n          return false;\n        }\n        return GatherArray<std::uint16_t>(shape.size(), shape.data(),\n                                          PyArray_STRIDES(gather_array),\n                                          PyArray_BYTES(gather_array), values,\n                                          std::forward<ForEach>(for_each_cb));\n      case NPY_INT32:\n        if (!size_cb(shape)) {\n          return false;\n        }\n        return GatherArray<std::int32_t>(shape.size(), shape.data(),\n                                         PyArray_STRIDES(gather_array),\n                                         PyArray_BYTES(gather_array), values,\n                                         std::forward<ForEach>(for_each_cb));\n      case NPY_UINT32:\n        if (!size_cb(shape)) {\n          return false;\n        }\n        return GatherArray<std::uint32_t>(shape.size(), shape.data(),\n                                          PyArray_STRIDES(gather_array),\n                                          PyArray_BYTES(gather_array), values,\n                    
                      std::forward<ForEach>(for_each_cb));\n      case NPY_INT64:\n        if (!size_cb(shape)) {\n          return false;\n        }\n        return GatherArray<std::int64_t>(shape.size(), shape.data(),\n                                         PyArray_STRIDES(gather_array),\n                                         PyArray_BYTES(gather_array), values,\n                                         std::forward<ForEach>(for_each_cb));\n      case NPY_UINT64:\n        if (!size_cb(shape)) {\n          return false;\n        }\n        return GatherArray<std::uint64_t>(shape.size(), shape.data(),\n                                          PyArray_STRIDES(gather_array),\n                                          PyArray_BYTES(gather_array), values,\n                                          std::forward<ForEach>(for_each_cb));\n      default:\n        PyErr_SetString(PyExc_TypeError, \"Unsupported NumPy array type.\");\n        return false;\n    }\n  }\n\n  PyErr_Format(PyExc_TypeError, \"Invalid gather %R\", gather);\n  return false;\n}\n\n// Creates a NumPy array of objects of given strings. 
Reusing duplicates where\n// possible.\nPyObject* ConvertStrings(PyObject* gather, PyArray_Descr* type,\n                         absl::Span<const std::string> values) {\n  absl::flat_hash_map<absl::string_view, PyObject*> existing;\n\n  PyObject* ret = nullptr;\n  PyObject** dst;\n  if (Gather(\n          gather, values,\n          [&dst, &ret, type](absl::Span<const npy_intp> size) {\n            ret = PyArray_NewFromDescr(\n                /*subtype=*/&PyArray_Type,\n                /*type=*/type,\n                /*nd=*/size.size(),\n                /*dims=*/size.data(),\n                /*strides=*/nullptr,\n                /*data=*/nullptr,\n                /*flags=*/0,\n                /*obj=*/nullptr);\n            dst = static_cast<PyObject**>(\n                PyArray_DATA(reinterpret_cast<PyArrayObject*>(ret)));\n            return true;\n          },\n          [&dst, &existing](absl::string_view value) {\n            auto [it, inserted] = existing.emplace(value, nullptr);\n            if (inserted) {\n              it->second =\n                  PyUnicode_FromStringAndSize(value.data(), value.size());\n              PyUnicode_InternInPlace(&it->second);\n            } else {\n              Py_INCREF(it->second);\n            }\n            *dst++ = it->second;\n            return true;\n          })) {\n    return ret;\n  } else {\n    Py_XDECREF(ret);\n    return nullptr;\n  }\n}\n\n// Creates NumPy array with given dtype given specified converter.\n// `converter` shall have the following signature:\n// bool converter(const std::string& value, T* result);\n// It must return whether conversion is successful and store conversion in\n// result.\ntemplate <typename T, typename C>\ninline PyObject* Convert(PyObject* gather, PyArray_Descr* type,\n                         absl::Span<const std::string> values, C&& converter) {\n  py::object ret;\n  T* dst;\n  if (Gather(\n          gather, values,\n          [&dst, &ret, type](absl::Span<const npy_intp> 
size) {\n            // Construct uninitialised NumPy array of type T.\n            ret = py::reinterpret_steal<py::object>(PyArray_NewFromDescr(\n                /*subtype=*/&PyArray_Type,\n                /*type=*/type,\n                /*nd=*/size.size(),\n                /*dims=*/size.data(),\n                /*strides=*/nullptr,\n                /*data=*/nullptr,\n                /*flags=*/0,\n                /*obj=*/nullptr));\n\n            dst = static_cast<T*>(\n                PyArray_DATA(reinterpret_cast<PyArrayObject*>(ret.ptr())));\n            return true;\n          },\n          [&dst, &converter](const std::string& value) {\n            if (!converter(value, dst++)) {\n              PyErr_SetString(PyExc_ValueError, value.c_str());\n              return false;\n            }\n            return true;\n          })) {\n    return ret.release().ptr();\n  }\n  return nullptr;\n}\n\nPyObject* CifDictGetArray(const CifDict& self, absl::string_view key,\n                          PyObject* dtype, PyObject* gather) {\n  import_array();\n  PyArray_Descr* type = nullptr;\n  if (dtype == Py_None) {\n    type = PyArray_DescrFromType(NPY_OBJECT);\n  } else if (PyArray_DescrConverter(dtype, &type) == NPY_FAIL || !type) {\n    PyErr_Format(PyExc_TypeError, \"Invalid dtype %R\", dtype);\n    Py_XDECREF(type);\n    return nullptr;\n  }\n  auto entry = self.dict()->find(key);\n  if (entry == self.dict()->end()) {\n    Py_DECREF(type);\n    PyErr_SetObject(PyExc_KeyError,\n                    PyUnicode_FromStringAndSize(key.data(), key.size()));\n    return nullptr;\n  }\n\n  auto int_convert = [](absl::string_view str, auto* value) {\n    return absl::SimpleAtoi(str, value);\n  };\n\n  auto int_convert_bounded = [](absl::string_view str, auto* value) {\n    int64_t v;\n    if (absl::SimpleAtoi(str, &v)) {\n      using limits =\n          std::numeric_limits<std::remove_reference_t<decltype(*value)>>;\n      if (limits::min() <= v && v <= limits::max()) {\n        
*value = v;\n        return true;\n      }\n    }\n    return false;\n  };\n\n  absl::Span<const std::string> values = entry->second;\n\n  switch (type->type_num) {\n    case NPY_DOUBLE:\n      return Convert<double>(\n          gather, type, values, [](absl::string_view str, double* value) {\n            if (str == \".\") {\n              *value = std::numeric_limits<double>::quiet_NaN();\n              return true;\n            }\n            return absl::SimpleAtod(str, value);\n          });\n    case NPY_FLOAT:\n      return Convert<float>(\n          gather, type, values, [](absl::string_view str, float* value) {\n            if (str == \".\") {\n              *value = std::numeric_limits<float>::quiet_NaN();\n              return true;\n            }\n            return absl::SimpleAtof(str, value);\n          });\n    case NPY_INT8:\n      return Convert<int8_t>(gather, type, values, int_convert_bounded);\n    case NPY_INT16:\n      return Convert<int16_t>(gather, type, values, int_convert_bounded);\n    case NPY_INT32:\n      return Convert<int32_t>(gather, type, values, int_convert);\n    case NPY_INT64:\n      return Convert<int64_t>(gather, type, values, int_convert);\n    case NPY_UINT8:\n      return Convert<uint8_t>(gather, type, values, int_convert_bounded);\n    case NPY_UINT16:\n      return Convert<uint16_t>(gather, type, values, int_convert_bounded);\n    case NPY_UINT32:\n      return Convert<uint32_t>(gather, type, values, int_convert);\n    case NPY_UINT64:\n      return Convert<uint64_t>(gather, type, values, int_convert);\n    case NPY_BOOL:\n      return Convert<bool>(gather, type, values,\n                           [](absl::string_view str, bool* value) {\n                             if (str == \"n\" || str == \"no\") {\n                               *value = false;\n                               return true;\n                             }\n                             if (str == \"y\" || str == \"yes\") {\n                           
    *value = true;\n                               return true;\n                             }\n                             return false;\n                           });\n    case NPY_OBJECT:\n      return ConvertStrings(gather, type, values);\n    default: {\n      PyErr_Format(PyExc_TypeError, \"Unsupported dtype %R\", dtype);\n      Py_XDECREF(type);\n      return nullptr;\n    }\n  }\n}\n\n}  // namespace\n\nvoid RegisterModuleCifDict(pybind11::module m) {\n  using Value = std::vector<std::string>;\n  static absl::NoDestructor<std::vector<std::string>> empty_values;\n\n  m.def(\n      \"from_string\",\n      [](absl::string_view s) {\n        absl::StatusOr<CifDict> dict = CifDict::FromString(s);\n        if (!dict.ok()) {\n          throw py::value_error(dict.status().ToString());\n        }\n        return *dict;\n      },\n      py::call_guard<py::gil_scoped_release>());\n\n  m.def(\n      \"tokenize\",\n      [](absl::string_view cif_string) {\n        absl::StatusOr<std::vector<std::string>> tokens = Tokenize(cif_string);\n        if (!tokens.ok()) {\n          throw py::value_error(tokens.status().ToString());\n        }\n        return *std::move(tokens);\n      },\n      py::arg(\"cif_string\"));\n\n  m.def(\"split_line\", [](absl::string_view line) {\n    absl::StatusOr<std::vector<absl::string_view>> tokens = SplitLine(line);\n    if (!tokens.ok()) {\n      throw py::value_error(tokens.status().ToString());\n    }\n    return *std::move(tokens);\n  });\n\n  m.def(\n      \"parse_multi_data_cif\",\n      [](absl::string_view cif_string) {\n        auto result = ParseMultiDataCifDict(cif_string);\n        if (!result.ok()) {\n          throw py::value_error(result.status().ToString());\n        }\n        py::dict dict;\n        for (auto& [key, value] : *result) {\n          dict[py::cast(key)] = py::cast(value);\n        }\n        return dict;\n      },\n      py::arg(\"cif_string\"));\n\n  auto cif_dict =\n      py::class_<CifDict>(m, 
\"CifDict\")\n          .def(py::init<>([](py::dict dict) {\n                 CifDict::Dict result;\n                 for (const auto& [key, value] : dict) {\n                   result.emplace(py::cast<absl::string_view>(key),\n                                  py::cast<std::vector<std::string>>(value));\n                 }\n                 return CifDict(std::move(result));\n               }),\n               \"Initialise with a map\")\n          .def(\"copy_and_update\",\n               [](const CifDict& self, py::dict dict) {\n                 CifDict::Dict result;\n                 for (const auto& [key, value] : dict) {\n                   result.emplace(py::cast<absl::string_view>(key),\n                                  py::cast<std::vector<std::string>>(value));\n                 }\n                 {\n                   py::gil_scoped_release gil_release;\n                   return self.CopyAndUpdate(std::move(result));\n                 }\n               })\n          .def(\n              \"__str__\",\n              [](const CifDict& self) {\n                absl::StatusOr<std::string> result = self.ToString();\n                if (!result.ok()) {\n                  throw py::value_error(result.status().ToString());\n                }\n                return *result;\n              },\n              \"Serialize to a string\", py::call_guard<py::gil_scoped_release>())\n          .def(\n              \"to_string\",\n              [](const CifDict& self) {\n                absl::StatusOr<std::string> result = self.ToString();\n                if (!result.ok()) {\n                  throw py::value_error(result.status().ToString());\n                }\n                return *result;\n              },\n              \"Serialize to a string\", py::call_guard<py::gil_scoped_release>())\n          .def(\n              \"to_dict\",\n              [](const CifDict& self) {\n                py::dict result;\n                for (const auto& [key, value] : 
*self.dict()) {\n                  result[py::cast(key)] = py::cast(value);\n                }\n                return result;\n              },\n              \"Returns the CIF data as a Python dict[str, list[str]].\")\n          .def(\"value_length\", &CifDict::ValueLength, py::arg(\"key\"),\n               \"Num elements in value\")\n          .def(\"__len__\",\n               [](const CifDict& self) { return self.dict()->size(); })\n          .def(\n              \"__bool__\",\n              [](const CifDict& self) { return !self.dict()->empty(); },\n              \"Check whether the map is nonempty\")\n          .def(\n              \"__contains__\",\n              [](const CifDict& self, absl::string_view k) {\n                return self.dict()->find(k) != self.dict()->end();\n              },\n              py::arg(\"key\"), py::call_guard<py::gil_scoped_release>())\n          .def(\"get_data_name\", &CifDict::GetDataName)\n          .def(\n              \"get\",\n              [](const CifDict& self, absl::string_view k,\n                 py::object default_value) -> py::object {\n                auto it = self.dict()->find(k);\n                if (it == self.dict()->end()) return default_value;\n                py::list result(it->second.size());\n                size_t index = 0;\n                for (const std::string& v : it->second) {\n                  result[index++] = py::cast(v);\n                }\n                return result;\n              },\n              py::arg(\"key\"), py::arg(\"default_value\") = py::none())\n          .def(\n              \"get_array\",\n              [](const CifDict& self, absl::string_view key, py::handle dtype,\n                 py::handle gather) -> py::object {\n                PyObject* obj =\n                    CifDictGetArray(self, key, dtype.ptr(), gather.ptr());\n                if (obj == nullptr) {\n                  throw py::error_already_set();\n                }\n                return 
py::reinterpret_steal<py::object>(obj);\n              },\n              py::arg(\"key\"), py::arg(\"dtype\") = py::none(),\n              py::arg(\"gather\") = py::none())\n          .def(\n              \"__getitem__\",\n              [](const CifDict& self, absl::string_view k) -> const Value& {\n                auto it = self.dict()->find(k);\n                if (it == self.dict()->end()) {\n                  throw py::key_error(std::string(k).c_str());\n                }\n                return it->second;\n              },\n              py::arg(\"key\"), py::call_guard<py::gil_scoped_release>())\n          .def(\n              \"extract_loop_as_dict\",\n              [](const CifDict& self, absl::string_view prefix,\n                 absl::string_view index) {\n                absl::StatusOr<absl::flat_hash_map<\n                    absl::string_view,\n                    absl::flat_hash_map<absl::string_view, absl::string_view>>>\n                    dict;\n                {\n                  py::gil_scoped_release gil_release;\n                  dict = self.ExtractLoopAsDict(prefix, index);\n                  if (!dict.ok()) {\n                    throw py::value_error(dict.status().ToString());\n                  }\n                }\n                py::dict key_value_dict;\n                for (const auto& [key, value] : *dict) {\n                  py::dict value_dict;\n                  for (const auto& [key2, value2] : value) {\n                    value_dict[py::cast(key2)] = py::cast(value2);\n                  }\n                  key_value_dict[py::cast(key)] = std::move(value_dict);\n                }\n                return key_value_dict;\n              },\n              py::arg(\"prefix\"), py::arg(\"index\"))\n          .def(\n              \"extract_loop_as_list\",\n              [](const CifDict& self, absl::string_view prefix) {\n                absl::StatusOr<std::vector<\n                    absl::flat_hash_map<absl::string_view, 
absl::string_view>>>\n                    list_dict;\n                {\n                  py::gil_scoped_release gil_release;\n                  list_dict = self.ExtractLoopAsList(prefix);\n                  if (!list_dict.ok()) {\n                    throw py::value_error(list_dict.status().ToString());\n                  }\n                }\n                py::list list_obj(list_dict->size());\n                size_t index = 0;\n                for (const auto& value : *list_dict) {\n                  py::dict value_dict;\n                  for (const auto& [key, value] : value) {\n                    value_dict[py::cast(key)] = py::cast(value);\n                  }\n                  list_obj[index++] = std::move(value_dict);\n                }\n                return list_obj;\n              },\n              py::arg(\"prefix\"))\n          .def(py::pickle(\n              [](const CifDict& self) {  // __getstate__.\n                py::tuple result_tuple(1);\n                py::dict result;\n                for (const auto& [key, value] : *self.dict()) {\n                  result[py::cast(key)] = py::cast(value);\n                }\n                result_tuple[0] = std::move(result);\n                return result_tuple;\n              },\n              [](py::tuple t) {  // __setstate__.\n                py::dict dict = t[0].cast<py::dict>();\n                CifDict::Dict result;\n                for (const auto& [key, value] : dict) {\n                  result.emplace(py::cast<absl::string_view>(key),\n                                 py::cast<std::vector<std::string>>(value));\n                }\n                return CifDict(std::move(result));\n              }));\n\n  // Item, value, and key views\n  struct KeyView {\n    CifDict map;\n  };\n\n  struct ValueView {\n    CifDict map;\n  };\n  struct ItemView {\n    CifDict map;\n  };\n\n  py::class_<ItemView>(cif_dict, \"ItemView\")\n      .def(\"__len__\", [](const ItemView& v) { return 
v.map.dict()->size(); })\n      .def(\n          \"__iter__\",\n          [](const ItemView& v) {\n            return py::make_iterator(v.map.dict()->begin(),\n                                     v.map.dict()->end());\n          },\n          py::keep_alive<0, 1>());\n\n  py::class_<KeyView>(cif_dict, \"KeyView\")\n      .def(\n          \"__contains__\",\n          [](const KeyView& v, absl::string_view k) {\n            return v.map.dict()->find(k) != v.map.dict()->end();\n          },\n          py::call_guard<py::gil_scoped_release>())\n      .def(\"__contains__\", [](const KeyView&, py::handle) { return false; })\n      .def(\"__len__\", [](const KeyView& v) { return v.map.dict()->size(); })\n      .def(\n          \"__iter__\",\n          [](const KeyView& v) {\n            return py::make_key_iterator(v.map.dict()->begin(),\n                                         v.map.dict()->end());\n          },\n          py::keep_alive<0, 1>());\n\n  py::class_<ValueView>(cif_dict, \"ValueView\")\n      .def(\"__len__\", [](const ValueView& v) { return v.map.dict()->size(); })\n      .def(\n          \"__iter__\",\n          [](const ValueView& v) {\n            return py::make_value_iterator(v.map.dict()->begin(),\n                                           v.map.dict()->end());\n          },\n          py::keep_alive<0, 1>());\n\n  cif_dict\n      .def(\n          \"__iter__\",\n          [](const CifDict& self) {\n            return py::make_key_iterator(self.dict()->begin(),\n                                         self.dict()->end());\n          },\n          py::keep_alive<0, 1>())\n      .def(\n          \"keys\", [](const CifDict& self) { return KeyView{self}; },\n          \"Returns an iterable view of the map's keys.\")\n      .def(\n          \"values\", [](const CifDict& self) { return ValueView{self}; },\n          \"Returns an iterable view of the map's values.\")\n      .def(\n          \"items\", [](const CifDict& self) { return ItemView{self}; },\n  
        \"Returns an iterable view of the map's items.\");\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/cif_dict_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_CIF_DICT_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_CIF_DICT_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleCifDict(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_CIF_DICT_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/fasta_iterator.pyi",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nclass FastaFileIterator:\n    def __init__(self, fasta_path: str) -> None: ...\n    def __iter__(self) -> FastaFileIterator: ...\n    def __next__(self) -> tuple[str,str]: ...\n\nclass FastaStringIterator:\n    def __init__(self, fasta_string: str | bytes) -> None: ...\n    def __iter__(self) -> FastaStringIterator: ...\n    def __next__(self) -> tuple[str,str]: ...\n\ndef parse_fasta(fasta_string: str | bytes) -> list[str]: ...\ndef parse_fasta_include_descriptions(fasta_string: str | bytes) -> tuple[list[str],list[str]]: ...\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/fasta_iterator_lib.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include \"alphafold3/parsers/cpp/fasta_iterator_lib.h\"\n\n#include <cstddef>\n#include <optional>\n#include <string>\n#include <utility>\n#include <vector>\n\n#include \"absl/status/status.h\"\n#include \"absl/status/statusor.h\"\n#include \"absl/strings/ascii.h\"\n#include \"absl/strings/str_cat.h\"\n#include \"absl/strings/str_split.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/strings/strip.h\"\n\nnamespace alphafold3 {\n\n// Parse FASTA string and return list of strings with amino acid sequences.\n// Returns a list of amino acid sequences only.\nstd::vector<std::string> ParseFasta(absl::string_view fasta_string) {\n  std::vector<std::string> sequences;\n  std::string* sequence = nullptr;\n  for (absl::string_view line_raw : absl::StrSplit(fasta_string, '\\n')) {\n    absl::string_view line = absl::StripAsciiWhitespace(line_raw);\n    if (absl::ConsumePrefix(&line, \">\")) {\n      sequence = &sequences.emplace_back();\n    } else if (!line.empty() && sequence != nullptr) {\n      absl::StrAppend(sequence, line);\n    }\n  }\n  return sequences;\n}\n\n// Parse FASTA string and return list of strings with amino acid sequences.\n// Returns two lists: The first one with amino acid sequences, the second with\n// the descriptions associated with each sequence.\nstd::pair<std::vector<std::string>, std::vector<std::string>>\nParseFastaIncludeDescriptions(absl::string_view fasta_string) {\n  
std::pair<std::vector<std::string>, std::vector<std::string>> result;\n  auto& [sequences, descriptions] = result;\n  std::string* sequence = nullptr;\n  for (absl::string_view line_raw : absl::StrSplit(fasta_string, '\\n')) {\n    absl::string_view line = absl::StripAsciiWhitespace(line_raw);\n    if (absl::ConsumePrefix(&line, \">\")) {\n      descriptions.emplace_back(line);\n      sequence = &sequences.emplace_back();\n    } else if (!line.empty() && sequence != nullptr) {\n      absl::StrAppend(sequence, line);\n    }\n  }\n  return result;\n}\n\nabsl::StatusOr<std::pair<std::string, std::string>> FastaFileIterator::Next() {\n  std::string line_str;\n  while (std::getline(reader_, line_str)) {\n    absl::string_view line = line_str;\n    line = absl::StripAsciiWhitespace(line);\n    if (absl::ConsumePrefix(&line, \">\")) {\n      if (!description_.has_value()) {\n        description_ = line;\n      } else {\n        std::pair<std::string, std::string> output(sequence_, *description_);\n        description_ = line;\n        sequence_ = \"\";\n        return output;\n      }\n    } else if (description_.has_value()) {\n      absl::StrAppend(&sequence_, line);\n    }\n  }\n  has_next_ = false;\n  reader_.close();\n  if (description_.has_value()) {\n    return std::pair(sequence_, *description_);\n  } else {\n    return absl::InvalidArgumentError(\n        absl::StrCat(\"Invalid FASTA file: \", filename_));\n  }\n}\n\nabsl::StatusOr<std::pair<std::string, std::string>>\nFastaStringIterator::Next() {\n  size_t consumed = 0;\n  for (absl::string_view line_raw : absl::StrSplit(fasta_string_, '\\n')) {\n    consumed += line_raw.size() + 1;  // +1 for the newline character.\n    absl::string_view line = absl::StripAsciiWhitespace(line_raw);\n    if (absl::ConsumePrefix(&line, \">\")) {\n      if (!description_.has_value()) {\n        description_ = line;\n      } else {\n        std::pair<std::string, std::string> output(sequence_, *description_);\n        description_ 
= line;\n        sequence_ = \"\";\n        fasta_string_.remove_prefix(consumed);\n        return output;\n      }\n    } else if (description_.has_value()) {\n      absl::StrAppend(&sequence_, line);\n    }\n  }\n  has_next_ = false;\n  if (description_.has_value()) {\n    return std::pair(sequence_, *description_);\n  } else {\n    return absl::InvalidArgumentError(\"Invalid FASTA string\");\n  }\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/fasta_iterator_lib.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n// A C++ implementation of a FASTA parser.\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_FASTA_ITERATOR_LIB_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_FASTA_ITERATOR_LIB_H_\n\n#include <fstream>\n#include <ios>\n#include <optional>\n#include <string>\n#include <utility>\n#include <vector>\n\n#include \"absl/status/statusor.h\"\n#include \"absl/strings/string_view.h\"\n\nnamespace alphafold3 {\n\n// Parse FASTA string and return list of strings with amino acid sequences.\n// Returns a list of amino acid sequences only.\nstd::vector<std::string> ParseFasta(absl::string_view fasta_string);\n\n// Parse FASTA string and return list of strings with amino acid sequences.\n// Returns two lists: The first one with amino acid sequences, the second with\n// the descriptions associated with each sequence.\nstd::pair<std::vector<std::string>, std::vector<std::string>>\nParseFastaIncludeDescriptions(absl::string_view fasta_string);\n\n// Lazy FASTA parser for memory efficient FASTA parsing from a path.\nclass FastaFileIterator {\n public:\n  // Initialise FastaFileIterator with filename of fasta. If you initialize\n  // reader_ with an invalid path or empty file, it won't fail, only\n  // riegeli::ReadLine within the Next method will then return false. 
That will\n  // then trigger the \"Invalid FASTA file\" error.\n  explicit FastaFileIterator(absl::string_view fasta_path)\n      : filename_(fasta_path),\n        reader_(filename_, std::ios::in),\n        has_next_(true) {}\n\n  // Returns whether there are more sequences. Returns true before first call to\n  // next even if the file is empty.\n  bool HasNext() const { return has_next_; }\n\n  // Fetches the next (sequence, description) from the file.\n  absl::StatusOr<std::pair<std::string, std::string>> Next();\n\n private:\n  // filename_ is kept for error messages; reader_ is a std::fstream that Next\n  // reads line by line with std::getline.\n  std::string filename_;\n  std::fstream reader_;\n  std::optional<std::string> description_;\n  std::string sequence_;\n  bool has_next_;\n};\n\n// Lazy FASTA parser for memory efficient FASTA parsing from a string.\nclass FastaStringIterator {\n public:\n  // Initialise FastaStringIterator with a string_view of a FASTA. If you\n  // initialize it with an invalid FASTA string, it won't fail; the Next method\n  // will instead return the \"Invalid FASTA string\" error status.\n  // WARNING: The object backing the fasta_string string_view must not be\n  // deleted while this Iterator is alive.\n  explicit FastaStringIterator(absl::string_view fasta_string)\n      : fasta_string_(fasta_string), has_next_(true) {}\n\n  // Returns whether there are more sequences. Returns true before first call to\n  // next even if the string is empty.\n  bool HasNext() const { return has_next_; }\n\n  // Fetches the next (sequence, description) from the string.\n  absl::StatusOr<std::pair<std::string, std::string>> Next();\n\n private:\n  absl::string_view fasta_string_;\n  bool has_next_;\n  std::optional<std::string> description_;\n  std::string sequence_;\n};\n\n}  // namespace alphafold3\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_FASTA_ITERATOR_LIB_H_\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/fasta_iterator_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <utility>\n\n#include \"absl/status/statusor.h\"\n#include \"absl/strings/string_view.h\"\n#include \"alphafold3/parsers/cpp/fasta_iterator_lib.h\"\n#include \"pybind11/attr.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11/pytypes.h\"\n#include \"pybind11/stl.h\"\n\nnamespace alphafold3 {\nnamespace {\n\nnamespace py = pybind11;\n\ntemplate <typename T>\nT ValueOrThrowValueError(absl::StatusOr<T> value) {\n  if (!value.ok()) throw py::value_error(value.status().ToString());\n  return *std::move(value);\n}\n\nconstexpr char kFastaFileIteratorDoc[] = R\"(\nLazy FASTA parser for memory efficient FASTA parsing from a path.)\";\n\nconstexpr char kFastaStringIteratorDoc[] = R\"(\nLazy FASTA parser for memory efficient FASTA parsing from a string.\n\nWARNING: The object backing the fasta_string string_view must not be\ndeleted while the FastaStringIterator is alive. E.g. this will break:\n\n```\n# Make sure the fasta_string is not interned.\nfasta_string = '\\n'.join(['>d\\nS' for _ in range(10)])\niterator = fasta_iterator.FastaStringIterator(fasta_string)\ndel fasta_string\niterator.next()  # Heap use-after-free.\n```\n)\";\n\nconstexpr char kParseFastaDoc[] = R\"(\nParses a FASTA string and returns a list of amino-acid sequences.\n\nArgs:\n  fasta_string: The contents of a FASTA file.\n\nReturns:\n  List of sequences in the FASTA file. 
Descriptions are ignored.\n)\";\n\nconstexpr char kParseFastaIncludeDescriptionsDoc[] = R\"(\nParses a FASTA string, returns amino-acid sequences with descriptions.\n\nArgs:\n  fasta_string: The contents of a FASTA file.\n\nReturns:\n  A tuple with two lists (sequences, descriptions):\n  * A list of sequences.\n  * A list of sequence descriptions taken from the comment lines. In the\n    same order as the sequences.\n)\";\n\nclass PythonFastaStringIterator : public FastaStringIterator {\n public:\n  explicit PythonFastaStringIterator(py::object fasta_string)\n      : FastaStringIterator(py::cast<absl::string_view>(fasta_string)),\n        fasta_string_(std::move(fasta_string)) {}\n\n private:\n  py::object fasta_string_;\n};\n\n}  // namespace\n\nvoid RegisterModuleFastaIterator(pybind11::module m) {\n  py::class_<FastaFileIterator>(m, \"FastaFileIterator\", kFastaFileIteratorDoc)\n      .def(py::init<absl::string_view>(), py::arg(\"fasta_path\"))\n      .def(\"__iter__\",\n           [](FastaFileIterator& iterator) -> FastaFileIterator& {\n             return iterator;\n           })\n      .def(\n          \"__next__\",\n          [](FastaFileIterator& iterator) {\n            if (iterator.HasNext()) {\n              return ValueOrThrowValueError(iterator.Next());\n            } else {\n              throw py::stop_iteration();\n            }\n          },\n          py::call_guard<py::gil_scoped_release>());\n\n  py::class_<PythonFastaStringIterator>(m, \"FastaStringIterator\",\n                                        kFastaStringIteratorDoc)\n      .def(py::init<py::object>(), py::arg(\"fasta_string\"))\n      .def(\"__iter__\",\n           [](PythonFastaStringIterator& iterator)\n               -> PythonFastaStringIterator& { return iterator; })\n      .def(\n          \"__next__\",\n          [](PythonFastaStringIterator& iterator) {\n            if (iterator.HasNext()) {\n              return ValueOrThrowValueError(iterator.Next());\n            } else {\n   
           throw py::stop_iteration();\n            }\n          },\n          py::call_guard<py::gil_scoped_release>());\n\n  m.def(\"parse_fasta\", &ParseFasta, py::arg(\"fasta_string\"),\n        py::call_guard<py::gil_scoped_release>(), py::doc(kParseFastaDoc + 1));\n  m.def(\"parse_fasta_include_descriptions\", &ParseFastaIncludeDescriptions,\n        py::arg(\"fasta_string\"), py::call_guard<py::gil_scoped_release>(),\n        py::doc(kParseFastaIncludeDescriptionsDoc + 1));\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/fasta_iterator_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_FASTA_ITERATOR_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_FASTA_ITERATOR_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleFastaIterator(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_FASTA_ITERATOR_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/msa_conversion.pyi",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Type annotations for Python bindings for `msa_conversion`.\n\nThe type annotations in this file were modified from the automatically generated\nstubgen output.\n\"\"\"\n\nfrom collections.abc import Iterable\n\n\ndef align_sequence_to_gapless_query(\n    sequence: str | bytes,\n    query_sequence: str | bytes,\n) -> str: ...\n\n\ndef convert_a3m_to_stockholm(a3m_sequences: Iterable[str]) -> list[str]: ...\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/msa_conversion_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <algorithm>\n#include <cstddef>\n#include <stdexcept>\n#include <string>\n#include <vector>\n\n#include \"absl/strings/ascii.h\"\n#include \"absl/strings/str_format.h\"\n#include \"absl/strings/string_view.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11/stl.h\"\n\nnamespace {\n\nnamespace py = pybind11;\n\nstd::vector<std::string> ConvertA3MToStockholm(\n    std::vector<absl::string_view> a3m_sequences) {\n  std::vector<std::string> stockholm_sequences(a3m_sequences.size());\n  auto max_length_element =\n      std::max_element(a3m_sequences.begin(), a3m_sequences.end(),\n                       [](absl::string_view lhs, absl::string_view rhs) {\n                         return lhs.size() < rhs.size();\n                       });\n\n  for (auto& out : stockholm_sequences) {\n    out.reserve(max_length_element->size());\n  }\n\n  // While any sequence has remaining columns.\n  while (std::any_of(a3m_sequences.begin(), a3m_sequences.end(),\n                     [](absl::string_view in) { return !in.empty(); })) {\n    if (std::any_of(a3m_sequences.begin(), a3m_sequences.end(),\n                    [](absl::string_view in) {\n                      return !in.empty() && absl::ascii_islower(in.front());\n                    })) {\n      // Insertion(s) found at column.\n      for (std::size_t i = 0; i < a3m_sequences.size(); ++i) {\n        absl::string_view& in = a3m_sequences[i];\n        std::string& 
out = stockholm_sequences[i];\n        if (!in.empty() && absl::ascii_islower(in.front())) {\n          // Consume insertion.\n          out.push_back(absl::ascii_toupper(in.front()));\n          in.remove_prefix(1);\n        } else {\n          // Row requires padding.\n          out.push_back('-');\n        }\n      }\n    } else {\n      // No insertions found.\n      for (std::size_t i = 0; i < a3m_sequences.size(); ++i) {\n        absl::string_view& in = a3m_sequences[i];\n        std::string& out = stockholm_sequences[i];\n        if (!in.empty()) {\n          // Consume entire column.\n          out.push_back(in.front());\n          in.remove_prefix(1);\n        } else {\n          // One alignment is shorter than the others. Should not happen with\n          // valid A3M input.\n          throw std::invalid_argument(absl::StrFormat(\n              \"a3m rows have inconsistent lengths; row %d has no columns left \"\n              \"but not all rows are exhausted\",\n              i));\n        }\n      }\n    }\n  }\n  return stockholm_sequences;\n}\n\nstd::string AlignSequenceToGaplessQuery(absl::string_view sequence,\n                                        absl::string_view query_sequence) {\n  if (sequence.size() != query_sequence.size()) {\n    throw py::value_error(\n        absl::StrFormat(\"The sequence (%d) and the query sequence (%d) don't \"\n                        \"have the same length.\",\n                        sequence.size(), query_sequence.size()));\n  }\n  std::string output;\n  for (std::size_t residue_index = 0, sequence_length = sequence.size();\n       residue_index < sequence_length; ++residue_index) {\n    const char query_residue = query_sequence[residue_index];\n    const char residue = sequence[residue_index];\n    if (query_residue != '-') {\n      // No gap in the query, so the residue is aligned.\n      output += residue;\n    } else if (residue == '-') {\n      // Gap in both sequence and query, simply skip.\n      
continue;\n    } else {\n      // Gap only in the query, so this must be an inserted residue.\n      output += absl::ascii_tolower(residue);\n    }\n  }\n  return output;\n}\n\nconstexpr char kConvertA3mToStockholm[] = R\"(\nConverts a list of sequences in a3m format to stockholm format sequences.\n\nAs an example if the input is:\nabCD\nCgD\nfCDa\n\nThen the output will be:\nABC-D-\n--CGD-\nF-C-DA\n\nArgs:\n  a3m_sequences: A list of strings in a3m format.\n\nReturns:\n  A list of strings converted to stockholm format.\n)\";\n\nconstexpr char kAlignSequenceToGaplessQuery[] = R\"(\nAligns a sequence to a gapless query sequence.\n\nThis is useful when converting Stockholm MSA to A3M MSA. Example:\nSeq  : AB--E\nQuery: A--DE\nOutput: Ab-E\n\nArgs:\n  sequence: A string containing the sequence to be aligned.\n  query_sequence: A string containing the reference sequence to align to.\n\nReturns:\n  The input sequence with gaps dropped where both the `sequence` and\n  `query_sequence` have gaps, and sequence elements non-capitalized where the\n  `query_sequence` has a gap, but the `sequence` does not.\n)\";\n\n}  // namespace\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMsaConversion(pybind11::module m) {\n  m.def(\"convert_a3m_to_stockholm\", &ConvertA3MToStockholm,\n        py::arg(\"a3m_sequences\"), py::call_guard<py::gil_scoped_release>(),\n        py::doc(kConvertA3mToStockholm + 1));\n  m.def(\"align_sequence_to_gapless_query\", &AlignSequenceToGaplessQuery,\n        py::arg(\"sequence\"), py::arg(\"query_sequence\"),\n        py::call_guard<py::gil_scoped_release>(),\n        py::doc(kAlignSequenceToGaplessQuery + 1));\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/parsers/cpp/msa_conversion_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_MSA_CONVERSION_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_MSA_CONVERSION_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMsaConversion(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_PARSERS_PYTHON_MSA_CONVERSION_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/scripts/copy_to_ssd.sh",
    "content": "#!/bin/bash\n# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nset -euo pipefail\n\nreadonly SOURCE_DIR=${1:-$HOME/public_databases}\nreadonly TARGET_DIR=${2:-/mnt/disks/ssd/public_databases}\n\nmkdir -p \"${TARGET_DIR}\"\n\nFILES=(pdb_seqres_2022_09_28.fasta \\\n      uniprot_all_2021_04.fa \\\n      mgy_clusters_2022_05.fa \\\n      uniref90_2022_05.fa \\\n      bfd-first_non_consensus_sequences.fasta \\\n      rfam_14_9_clust_seq_id_90_cov_80_rep_seq.fasta \\\n      nt_rna_2023_02_23_clust_seq_id_90_cov_80_rep_seq.fasta \\\n      rnacentral_active_seq_id_90_cov_80_linclust.fasta)\n\nNOT_COPIED_FILES=()\n\nwhile (( ${#FILES[@]} )); do\n  # Get total size of files to copy in bytes\n  SOURCE_FILES=( \"${FILES[@]/#/${SOURCE_DIR}/}\" )\n  TOTAL_SIZE=$(du -sbc \"${SOURCE_FILES[@]}\" | awk 'END{print $1}')\n\n  # Get available space on target drive in bytes\n  AVAILABLE_SPACE=$(df --portability --block-size=1 \"$TARGET_DIR\" | awk 'END{print $4}')\n\n  # Compare sizes and copy if enough space\n  if (( TOTAL_SIZE <= AVAILABLE_SPACE )); then\n    printf 'Copying files... %s\\n' \"${FILES[@]}\"\n    echo \"From ${SOURCE_DIR} -> ${TARGET_DIR}\"\n\n    for file in \"${FILES[@]}\"; do\n      cp -r \"${SOURCE_DIR}/${file}\" \"${TARGET_DIR}/\" &\n    done\n    break\n  else\n    NOT_COPIED_FILES+=(\"${FILES[-1]}\")\n    unset 'FILES[-1]'\n  fi\ndone\n\nprintf 'No room left on ssd for: %s\\n' \"${NOT_COPIED_FILES[@]}\"\nwait\n"
  },
  {
    "path": "src/alphafold3/scripts/gcp_mount_ssd.sh",
    "content": "#!/bin/bash\n# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n# Formats (if needed) and mounts the first not-yet-mounted google-local disk at\n# MOUNT_DIR. Does nothing if MOUNT_DIR already exists.\n#\n# Usage: gcp_mount_ssd.sh [MOUNT_DIR]\n\nset -euo pipefail\n\nreadonly MOUNT_DIR=\"${1:-/mnt/disks/ssd}\"\n\nif [[ -d \"${MOUNT_DIR}\" ]]; then\n  echo \"Mount directory ${MOUNT_DIR} already exists, skipping\"\n  exit 0\nfi\n\n# Resolve every google-local disk symlink to its device node. realpath runs via\n# -exec so each disk is passed as a separate argument; handing it the whole\n# find output as one quoted string fails when more than one disk is attached.\nfor SSD_DISK in $(find /dev/disk/by-id/ -name '*google-local*' -exec realpath {} +)\ndo\n  # Check if the disk is already formatted\n  if ! blkid -o value -s TYPE \"${SSD_DISK}\" > /dev/null 2>&1; then\n    echo \"Disk ${SSD_DISK} is not formatted, format it.\"\n    mkfs.ext4 -m 0 -E lazy_itable_init=0,lazy_journal_init=0,discard \"${SSD_DISK}\" || continue\n  fi\n\n  # Check if this particular disk (not a fixed device name) is already mounted\n  if grep -qs \"^${SSD_DISK} \" /proc/mounts; then\n    grep -s \"^${SSD_DISK} \" /proc/mounts\n    echo \"Disk ${SSD_DISK} is already mounted, skip it.\"\n    continue\n  fi\n\n  # Disk is not mounted, mount it\n  echo \"Mounting ${SSD_DISK} to ${MOUNT_DIR}\"\n  mkdir -p \"${MOUNT_DIR}\"\n  # NOTE(review): this chmod runs before the mount, so it applies to the mount\n  # point directory rather than the root of the mounted filesystem - confirm\n  # that this is the intended behaviour.\n  chmod -R 777 \"${MOUNT_DIR}\"\n  mount \"${SSD_DISK}\" \"${MOUNT_DIR}\"\n  break\ndone\n\n# MOUNT_DIR is only created once a usable disk was found in the loop above.\nif [[ ! -d \"${MOUNT_DIR}\" ]]; then\n  echo \"No unmounted SSD disks found\"\n  exit 1\nfi\n"
  },
  {
    "path": "src/alphafold3/structure/__init__.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Structure module initialization.\"\"\"\n\n# pylint: disable=g-importing-member\nfrom alphafold3.structure.bioassemblies import BioassemblyData\nfrom alphafold3.structure.bonds import Bonds\nfrom alphafold3.structure.chemical_components import ChemCompEntry\nfrom alphafold3.structure.chemical_components import ChemicalComponentsData\nfrom alphafold3.structure.chemical_components import get_data_for_ccd_components\nfrom alphafold3.structure.chemical_components import populate_missing_ccd_data\nfrom alphafold3.structure.mmcif import BondParsingError\nfrom alphafold3.structure.parsing import BondAtomId\nfrom alphafold3.structure.parsing import from_atom_arrays\nfrom alphafold3.structure.parsing import from_mmcif\nfrom alphafold3.structure.parsing import from_parsed_mmcif\nfrom alphafold3.structure.parsing import from_res_arrays\nfrom alphafold3.structure.parsing import from_sequences_and_bonds\nfrom alphafold3.structure.parsing import ModelID\nfrom alphafold3.structure.parsing import NoAtomsError\nfrom alphafold3.structure.parsing import SequenceFormat\nfrom alphafold3.structure.structure import ARRAY_FIELDS\nfrom alphafold3.structure.structure import AuthorNamingScheme\nfrom alphafold3.structure.structure import Bond\nfrom alphafold3.structure.structure import CascadeDelete\nfrom alphafold3.structure.structure import concat\nfrom alphafold3.structure.structure import enumerate_residues\nfrom alphafold3.structure.structure 
import fix_non_standard_polymer_residues\nfrom alphafold3.structure.structure import GLOBAL_FIELDS\nfrom alphafold3.structure.structure import make_empty_structure\nfrom alphafold3.structure.structure import MissingAtomError\nfrom alphafold3.structure.structure import MissingAuthorResidueIdError\nfrom alphafold3.structure.structure import multichain_residue_index\nfrom alphafold3.structure.structure import stack\nfrom alphafold3.structure.structure import Structure\nfrom alphafold3.structure.structure_tables import Atoms\nfrom alphafold3.structure.structure_tables import Chains\nfrom alphafold3.structure.structure_tables import Residues\n"
  },
  {
    "path": "src/alphafold3/structure/bioassemblies.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Utilities for parsing and manipulating bioassembly data.\"\"\"\n\nfrom collections.abc import Mapping, Sequence\nimport copy\nimport dataclasses\nfrom typing import Self\n\nfrom alphafold3.structure import mmcif\nimport numpy as np\n\n\n@dataclasses.dataclass(frozen=True)\nclass Operation:\n  \"\"\"A rigid transformation operation.\"\"\"\n\n  trans: np.ndarray  # shape: (3,)\n  rot: np.ndarray  # shape: (3, 3)\n\n  def apply_to_coords(self, coords: np.ndarray) -> np.ndarray:\n    \"\"\"Applies the rotation followed by the translation to `coords`.\"\"\"\n    return np.dot(coords, self.rot.T) + self.trans[np.newaxis, :]\n\n\n@dataclasses.dataclass(frozen=True)\nclass Transform:\n  \"\"\"A rigid transformation composed of a sequence of `Operation`s.\"\"\"\n\n  # The sequence of operations that form the transform. These will be applied\n  # right-to-left (last-to-first).\n  operations: Sequence[Operation]\n\n  # The chain IDs that this transform should be applied to. 
These are\n  # label_asym_ids in the mmCIF spec.\n  chain_ids: Sequence[str]\n\n  # A mapping from chain IDs (of chains that participate in this transform)\n  # to their new values in the bioassembly.\n  chain_id_rename_map: Mapping[str, str]\n\n  def apply_to_coords(self, coords: np.ndarray) -> np.ndarray:\n    \"\"\"Applies the `operations` in right-to-left order.\"\"\"\n    for operation in reversed(self.operations):\n      coords = operation.apply_to_coords(coords)\n    return coords\n\n\ndef _get_operation(oper_data: Mapping[str, str]) -> Operation:\n  \"\"\"Parses an `Operation` from a mmCIF _pdbx_struct_oper_list row.\"\"\"\n  trans = np.zeros((3,), dtype=np.float32)\n  rot = np.zeros((3, 3), dtype=np.float32)\n  for i in range(3):\n    trans[i] = float(oper_data[f'_pdbx_struct_oper_list.vector[{i + 1}]'])\n  for i in range(3):\n    for j in range(3):\n      rot[i][j] = float(\n          oper_data[f'_pdbx_struct_oper_list.matrix[{i + 1}][{j + 1}]']\n      )\n  return Operation(trans=trans, rot=rot)\n\n\nclass MissingBioassemblyDataError(Exception):\n  \"\"\"Raised when bioassembly data is missing from an mmCIF.\"\"\"\n\n\nclass BioassemblyData:\n  \"\"\"Stores and processes bioassembly data from mmCIF tables.\"\"\"\n\n  # Not all of these columns are required for internal operations, but all\n  # should be present whenever bioassemblies are defined in an mmCIF to stay\n  # consistent with external mmCIFs.\n  _REQUIRED_COLUMNS = (\n      '_pdbx_struct_assembly.id',\n      '_pdbx_struct_assembly.details',\n      '_pdbx_struct_assembly.method_details',\n      '_pdbx_struct_assembly.oligomeric_details',\n      '_pdbx_struct_assembly.oligomeric_count',\n      '_pdbx_struct_assembly_gen.assembly_id',\n      '_pdbx_struct_assembly_gen.oper_expression',\n      '_pdbx_struct_assembly_gen.asym_id_list',\n      '_pdbx_struct_oper_list.id',\n      '_pdbx_struct_oper_list.type',\n      '_pdbx_struct_oper_list.name',\n      '_pdbx_struct_oper_list.symmetry_operation',\n   
   '_pdbx_struct_oper_list.matrix[1][1]',\n      '_pdbx_struct_oper_list.matrix[1][2]',\n      '_pdbx_struct_oper_list.matrix[1][3]',\n      '_pdbx_struct_oper_list.vector[1]',\n      '_pdbx_struct_oper_list.matrix[2][1]',\n      '_pdbx_struct_oper_list.matrix[2][2]',\n      '_pdbx_struct_oper_list.matrix[2][3]',\n      '_pdbx_struct_oper_list.vector[2]',\n      '_pdbx_struct_oper_list.matrix[3][1]',\n      '_pdbx_struct_oper_list.matrix[3][2]',\n      '_pdbx_struct_oper_list.matrix[3][3]',\n      '_pdbx_struct_oper_list.vector[3]',\n  )\n\n  def __init__(\n      self,\n      *,\n      pdbx_struct_assembly: Mapping[str, Mapping[str, str]],\n      pdbx_struct_assembly_gen: Mapping[str, Sequence[Mapping[str, str]]],\n      pdbx_struct_oper_list: Mapping[str, Mapping[str, str]],\n      assembly_ids: Sequence[str],\n      oper_ids: Sequence[str],\n  ):\n    for assembly_id in assembly_ids:\n      for table, table_name in (\n          (pdbx_struct_assembly, '_pdbx_struct_assembly'),\n          (pdbx_struct_assembly_gen, '_pdbx_struct_assembly_gen'),\n      ):\n        if assembly_id not in table:\n          raise ValueError(\n              f'Assembly ID \"{assembly_id}\" missing from {table_name} '\n              f'with keys: {table.keys()}'\n          )\n    for oper_id in oper_ids:\n      if oper_id not in pdbx_struct_oper_list:\n        raise ValueError(\n            f'Oper ID \"{oper_id}\" missing from _pdbx_struct_oper_list '\n            f'with keys: {pdbx_struct_oper_list.keys()}'\n        )\n\n    self._pdbx_struct_assembly = pdbx_struct_assembly\n    self._pdbx_struct_assembly_gen = pdbx_struct_assembly_gen\n    self._pdbx_struct_oper_list = pdbx_struct_oper_list\n    self._operations = {\n        oper_id: _get_operation(oper_data)\n        for oper_id, oper_data in self._pdbx_struct_oper_list.items()\n    }\n    self._assembly_ids = assembly_ids\n    self._oper_ids = oper_ids\n\n  @classmethod\n  def from_mmcif(cls, cif: mmcif.Mmcif) -> Self:\n    
\"\"\"Constructs an instance of `BioassemblyData` from an `Mmcif` object.\"\"\"\n    for col in cls._REQUIRED_COLUMNS:\n      if col not in cif:\n        raise MissingBioassemblyDataError(col)\n\n    pdbx_struct_assembly = cif.extract_loop_as_dict(\n        prefix='_pdbx_struct_assembly.', index='_pdbx_struct_assembly.id'\n    )\n    pdbx_struct_oper_list = cif.extract_loop_as_dict(\n        prefix='_pdbx_struct_oper_list.', index='_pdbx_struct_oper_list.id'\n    )\n\n    # _pdbx_struct_assembly_gen is unlike the other two tables because it can\n    # have multiple rows share the same assembly ID. This can happen when an\n    # assembly is constructed by applying different sets of transforms to\n    # different sets of chain IDs. Each of these would have its own row.\n    # Here we group rows by their assembly_id.\n    pdbx_struct_assembly_gen = {}\n    for assembly_id, oper_expression, asym_id_list in zip(\n        cif['_pdbx_struct_assembly_gen.assembly_id'],\n        cif['_pdbx_struct_assembly_gen.oper_expression'],\n        cif['_pdbx_struct_assembly_gen.asym_id_list'],\n    ):\n      pdbx_struct_assembly_gen.setdefault(assembly_id, []).append({\n          '_pdbx_struct_assembly_gen.assembly_id': assembly_id,\n          '_pdbx_struct_assembly_gen.oper_expression': oper_expression,\n          '_pdbx_struct_assembly_gen.asym_id_list': asym_id_list,\n      })\n\n    # We provide these separately to keep track of the original order that they\n    # appear in the mmCIF.\n    assembly_ids = cif['_pdbx_struct_assembly.id']\n    oper_ids = cif['_pdbx_struct_oper_list.id']\n    return cls(\n        pdbx_struct_assembly=pdbx_struct_assembly,\n        pdbx_struct_assembly_gen=pdbx_struct_assembly_gen,\n        pdbx_struct_oper_list=pdbx_struct_oper_list,\n        assembly_ids=assembly_ids,\n        oper_ids=oper_ids,\n    )\n\n  @property\n  def assembly_ids(self) -> Sequence[str]:\n    return self._assembly_ids\n\n  def asym_id_by_assembly_chain_id(self, assembly_id: 
str) -> Mapping[str, str]:\n    asym_id_by_assembly_chain_id = {}\n    for transform in self.get_transforms(assembly_id):\n      for asym_id, assembly_chain_id in transform.chain_id_rename_map.items():\n        asym_id_by_assembly_chain_id[assembly_chain_id] = asym_id\n    return asym_id_by_assembly_chain_id\n\n  def assembly_chain_ids_by_asym_id(\n      self, assembly_id: str\n  ) -> Mapping[str, set[str]]:\n    assembly_chain_ids_by_asym_id = {}\n    for transform in self.get_transforms(assembly_id):\n      for asym_id, assembly_chain_id in transform.chain_id_rename_map.items():\n        assembly_chain_ids_by_asym_id.setdefault(asym_id, set()).add(\n            assembly_chain_id\n        )\n    return assembly_chain_ids_by_asym_id\n\n  def get_default_assembly_id(self) -> str:\n    \"\"\"Gets a default assembly ID.\"\"\"\n    # The first assembly is usually (though not always) the best choice.\n    # If we find a better heuristic for picking bioassemblies then this\n    # method should be updated.\n    return min(self._assembly_ids)\n\n  def get_assembly_info(self, assembly_id: str) -> Mapping[str, str]:\n    return {\n        k.replace('_pdbx_struct_assembly.', ''): v\n        for k, v in self._pdbx_struct_assembly[assembly_id].items()\n    }\n\n  def get_transforms(self, assembly_id: str) -> Sequence[Transform]:\n    \"\"\"Returns the transforms required to generate the given assembly.\"\"\"\n    partial_transforms = []\n    all_chain_ids = set()\n    for row in self._pdbx_struct_assembly_gen[assembly_id]:\n      oper_expression = row['_pdbx_struct_assembly_gen.oper_expression']\n      parsed_oper_id_seqs = mmcif.parse_oper_expr(oper_expression)\n      label_asym_ids = row['_pdbx_struct_assembly_gen.asym_id_list'].split(',')\n      all_chain_ids |= set(label_asym_ids)\n      for parsed_oper_id_seq in parsed_oper_id_seqs:\n        partial_transforms.append((parsed_oper_id_seq, label_asym_ids))\n\n    # We start assigning new chain IDs by finding the largest 
chain ID in\n    # the original structure that is involved in this bioassembly, and then\n    # starting from the next one.\n    max_int_chain_id = max(mmcif.str_id_to_int_id(c) for c in all_chain_ids)\n    next_int_chain_id = max_int_chain_id + 1\n\n    transforms = []\n    has_been_renamed = set()\n    for parsed_oper_id_seq, label_asym_ids in partial_transforms:\n      chain_id_rename_map = {}\n      for label_asym_id in label_asym_ids:\n        if label_asym_id not in has_been_renamed:\n          # The first time we see a label_asym_id we don't need to rename it.\n          # This isn't strictly necessary since we don't provide any\n          # guarantees about chain naming after bioassembly extraction but\n          # can make it a bit easier to inspect and compare structures\n          # pre and post bioassembly extraction.\n          chain_id_rename_map[label_asym_id] = label_asym_id\n          has_been_renamed.add(label_asym_id)\n        else:\n          chain_id_rename_map[label_asym_id] = mmcif.int_id_to_str_id(\n              next_int_chain_id\n          )\n          next_int_chain_id += 1\n      transforms.append(\n          Transform(\n              operations=[\n                  self._operations[oper_id] for oper_id in parsed_oper_id_seq\n              ],\n              chain_ids=label_asym_ids,\n              chain_id_rename_map=chain_id_rename_map,\n          )\n      )\n    return transforms\n\n  def to_mmcif_dict(self) -> Mapping[str, Sequence[str]]:\n    \"\"\"Returns the bioassembly data as a dict suitable for `mmcif.Mmcif`.\"\"\"\n    mmcif_dict = {}\n    for assembly_id in self._assembly_ids:\n      for column, val in self._pdbx_struct_assembly[assembly_id].items():\n        mmcif_dict.setdefault(column, []).append(val)\n      for row in self._pdbx_struct_assembly_gen[assembly_id]:\n        for column, val in row.items():\n          mmcif_dict.setdefault(column, []).append(val)\n    for oper_id in self._oper_ids:\n      for column, val in 
self._pdbx_struct_oper_list[oper_id].items():\n        mmcif_dict.setdefault(column, []).append(val)\n    return mmcif_dict\n\n  def rename_label_asym_ids(\n      self,\n      mapping: Mapping[str, str],\n      present_chains: set[str],\n  ) -> Self:\n    \"\"\"Returns a new BioassemblyData with renamed label_asym_ids.\n\n    Args:\n      mapping: A mapping from original label_asym_ids to their new values. Any\n        label_asym_ids in this BioassemblyData that are not in this mapping will\n        remain unchanged.\n      present_chains: A set of label_asym_ids that are actually present in the\n        atom site list. All label_asym_ids that are in the BioassemblyData but\n        not in present_chains won't be included in the output BioassemblyData.\n\n    Returns:\n      A new BioassemblyData with renamed label_asym_ids.\n\n    Raises:\n      ValueError: If any two previously distinct chains do not have unique names\n          anymore after the rename.\n    \"\"\"\n    new_pdbx_struct_assembly_gen = copy.deepcopy(self._pdbx_struct_assembly_gen)\n    for rows in new_pdbx_struct_assembly_gen.values():\n      for row in rows:\n        old_asym_ids = row['_pdbx_struct_assembly_gen.asym_id_list'].split(',')\n        new_asym_ids = [\n            mapping.get(label_asym_id, label_asym_id)\n            for label_asym_id in old_asym_ids\n            if label_asym_id in present_chains\n        ]\n        if len(set(old_asym_ids) & present_chains) != len(set(new_asym_ids)):\n          raise ValueError(\n              'Can not rename chains, the new names are not unique: '\n              f'{sorted(new_asym_ids)}.'\n          )\n        row['_pdbx_struct_assembly_gen.asym_id_list'] = ','.join(new_asym_ids)  # pytype: disable=unsupported-operands\n\n    return BioassemblyData(\n        pdbx_struct_assembly=copy.deepcopy(self._pdbx_struct_assembly),\n        pdbx_struct_assembly_gen=new_pdbx_struct_assembly_gen,\n        
pdbx_struct_oper_list=copy.deepcopy(self._pdbx_struct_oper_list),\n        assembly_ids=copy.deepcopy(self._assembly_ids),\n        oper_ids=copy.deepcopy(self._oper_ids),\n    )\n"
  },
  {
    "path": "src/alphafold3/structure/bonds.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Bond representation for structure module.\"\"\"\n\nimport collections\nfrom collections.abc import Mapping, Sequence\nimport dataclasses\nimport typing\nfrom typing import Self\n\nfrom alphafold3.structure import table\nimport numpy as np\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True)\nclass Bonds(table.Table):\n  \"\"\"Table of atomic bonds.\"\"\"\n\n  # mmCIF column: _struct_conn.conn_type_id\n  # mmCIF desc: This data item is a pointer to _struct_conn_type.id in the\n  #             STRUCT_CONN_TYPE category.\n  # E.g.: \"covale\", \"disulf\", \"hydrog\", \"metalc\".\n  type: np.ndarray\n\n  # mmCIF column: _struct_conn.pdbx_role\n  # mmCIF desc: The chemical or structural role of the interaction.\n  # E.g.: \"N-Glycosylation\", \"O-Glycosylation\".\n  role: np.ndarray\n\n  # mmCIF columns: _struct_conn.ptnr1_*\n  from_atom_key: np.ndarray\n\n  # mmCIF columns: _struct_conn.ptnr2_*\n  dest_atom_key: np.ndarray\n\n  @classmethod\n  def make_empty(cls) -> Self:\n    return cls(\n        key=np.empty((0,), dtype=np.int64),\n        from_atom_key=np.empty((0,), dtype=np.int64),\n        dest_atom_key=np.empty((0,), dtype=np.int64),\n        type=np.empty((0,), dtype=object),\n        role=np.empty((0,), dtype=object),\n    )\n\n  def get_atom_indices(\n      self,\n      atom_key: np.ndarray,\n  ) -> tuple[np.ndarray, np.ndarray]:\n    \"\"\"Returns the indices of the from/dest atoms in the atom_key 
array.\"\"\"\n    from_atom_missing = ~np.isin(self.from_atom_key, atom_key)\n    dest_atom_missing = ~np.isin(self.dest_atom_key, atom_key)\n    if np.any(from_atom_missing):\n      raise ValueError(\n          f'No atoms for from_atom_key {self.from_atom_key[from_atom_missing]}'\n      )\n    if np.any(dest_atom_missing):\n      raise ValueError(\n          f'No atoms for dest_atom_key {self.dest_atom_key[dest_atom_missing]}'\n      )\n    sort_indices = np.argsort(atom_key)\n    from_indices_sorted = np.searchsorted(\n        atom_key, self.from_atom_key, sorter=sort_indices\n    )\n    dest_indices_sorted = np.searchsorted(\n        atom_key, self.dest_atom_key, sorter=sort_indices\n    )\n    from_indices = sort_indices[from_indices_sorted]\n    dest_indices = sort_indices[dest_indices_sorted]\n    return from_indices, dest_indices\n\n  def restrict_to_atoms(self, atom_key: np.ndarray) -> Self:\n    if not self.size:  # Early-out for empty table.\n      return self\n    from_atom_mask = np.isin(self.from_atom_key, atom_key)\n    dest_atom_mask = np.isin(self.dest_atom_key, atom_key)\n    mask = np.logical_and(from_atom_mask, dest_atom_mask)\n    return typing.cast(Bonds, self.filter(mask=mask))\n\n  def to_mmcif_dict_from_atom_arrays(\n      self,\n      atom_key: np.ndarray,\n      chain_id: np.ndarray,\n      res_id: np.ndarray,\n      res_name: np.ndarray,\n      atom_name: np.ndarray,\n      auth_asym_id: np.ndarray,\n      auth_seq_id: np.ndarray,\n      insertion_code: np.ndarray,\n  ) -> Mapping[str, Sequence[str] | np.ndarray]:\n    \"\"\"Returns a dict suitable for building a CifDict, representing bonds.\n\n    Args:\n      atom_key: A (num_atom,) integer array of atom_keys.\n      chain_id: A (num_atom,) array of label_asym_id strings.\n      res_id: A (num_atom,) array of label_seq_id strings.\n      res_name: A (num_atom,) array of label_comp_id strings.\n      atom_name: A (num_atom,) array of label_atom_id strings.\n      auth_asym_id: A 
(num_atom,) array of auth_asym_id strings.\n      auth_seq_id: A (num_atom,) array of auth_seq_id strings.\n      insertion_code: A (num_atom,) array of insertion code strings.\n    \"\"\"\n    mmcif_dict = collections.defaultdict(list)\n    ptnr1_indices, ptnr2_indices = self.get_atom_indices(atom_key)\n\n    mmcif_dict['_struct_conn.ptnr1_label_asym_id'] = chain_id[ptnr1_indices]\n    mmcif_dict['_struct_conn.ptnr2_label_asym_id'] = chain_id[ptnr2_indices]\n    mmcif_dict['_struct_conn.ptnr1_label_comp_id'] = res_name[ptnr1_indices]\n    mmcif_dict['_struct_conn.ptnr2_label_comp_id'] = res_name[ptnr2_indices]\n    mmcif_dict['_struct_conn.ptnr1_label_seq_id'] = res_id[ptnr1_indices]\n    mmcif_dict['_struct_conn.ptnr2_label_seq_id'] = res_id[ptnr2_indices]\n    mmcif_dict['_struct_conn.ptnr1_label_atom_id'] = atom_name[ptnr1_indices]\n    mmcif_dict['_struct_conn.ptnr2_label_atom_id'] = atom_name[ptnr2_indices]\n\n    mmcif_dict['_struct_conn.ptnr1_auth_asym_id'] = auth_asym_id[ptnr1_indices]\n    mmcif_dict['_struct_conn.ptnr2_auth_asym_id'] = auth_asym_id[ptnr2_indices]\n    mmcif_dict['_struct_conn.ptnr1_auth_seq_id'] = auth_seq_id[ptnr1_indices]\n    mmcif_dict['_struct_conn.ptnr2_auth_seq_id'] = auth_seq_id[ptnr2_indices]\n    mmcif_dict['_struct_conn.pdbx_ptnr1_PDB_ins_code'] = insertion_code[\n        ptnr1_indices\n    ]\n    mmcif_dict['_struct_conn.pdbx_ptnr2_PDB_ins_code'] = insertion_code[\n        ptnr2_indices\n    ]\n\n    label_alt_id = ['?'] * self.size\n    mmcif_dict['_struct_conn.pdbx_ptnr1_label_alt_id'] = label_alt_id\n    mmcif_dict['_struct_conn.pdbx_ptnr2_label_alt_id'] = label_alt_id\n\n    # We need to set this to make visualisation work in NGL/PyMOL.\n    mmcif_dict['_struct_conn.pdbx_value_order'] = ['?'] * self.size\n\n    # We use a symmetry of 1_555 which is the no-op transformation. 
Other\n    # values are used when bonds involve atoms that only exist after expanding\n    # the bioassembly, but we don't support this kind of bond at the moment.\n    symmetry = ['1_555'] * self.size\n    mmcif_dict['_struct_conn.ptnr1_symmetry'] = symmetry\n    mmcif_dict['_struct_conn.ptnr2_symmetry'] = symmetry\n    bond_type_counter = collections.Counter()\n    for bond_row in self.iterrows():\n      bond_type = bond_row['type']\n      bond_type_counter[bond_type] += 1\n      mmcif_dict['_struct_conn.id'].append(\n          f'{bond_type}{bond_type_counter[bond_type]}'\n      )\n      mmcif_dict['_struct_conn.pdbx_role'].append(bond_row['role'])\n      mmcif_dict['_struct_conn.conn_type_id'].append(bond_type)\n\n    bond_types = np.unique(self.type)\n    mmcif_dict['_struct_conn_type.id'] = bond_types\n    unknown = ['?'] * len(bond_types)\n    mmcif_dict['_struct_conn_type.criteria'] = unknown\n    mmcif_dict['_struct_conn_type.reference'] = unknown\n\n    return dict(mmcif_dict)\n\n\ndef concat_with_atom_keys(\n    bonds_tables: Sequence[Bonds | None],\n    atom_key_arrays: Sequence[np.ndarray],\n) -> tuple[Bonds | None, np.ndarray]:\n  \"\"\"Concatenates bonds tables and atom keys simultaneously.\n\n  Args:\n    bonds_tables: A sequence of `Bonds` instances to concatenate. If any are\n      None then these are skipped.\n    atom_key_arrays: A sequence of integer `atom_key` arrays, where the n-th\n      bonds_table refers to the atoms in the n-th atom_key array. 
These must\n      all be non-None.\n\n  Returns:\n    A pair of (bonds, atom_key) where atom_key is a unique atom_key array with\n    length equal to the sum of the input atom array sizes, and the bonds table\n    contains all the bonds from the individual bonds table inputs.\n  \"\"\"\n  if not bonds_tables or not atom_key_arrays:\n    if bonds_tables or atom_key_arrays:\n      raise ValueError(\n          'bonds_tables and atom_keys must have same length but got'\n          f' {len(bonds_tables)=} and {len(atom_key_arrays)=}'\n      )\n    return None, np.array([], dtype=np.int64)\n  max_key = -1\n  atom_keys_to_concat = []\n  types_to_concat = []\n  roles_to_concat = []\n  from_atom_keys_to_concat = []\n  dest_atom_keys_to_concat = []\n  for bonds, atom_key in zip(bonds_tables, atom_key_arrays, strict=True):\n    if not atom_key.size:\n      assert bonds is None or bonds.size == 0\n      continue\n    assert np.min(atom_key, initial=0) >= 0  # Should always be non-negative!\n    offset = max_key + 1\n    offset_atom_key = atom_key + offset\n    atom_keys_to_concat.append(offset_atom_key)\n    max_key = np.max(offset_atom_key)\n    if bonds is not None:\n      types_to_concat.append(bonds.type)\n      roles_to_concat.append(bonds.role)\n      from_atom_keys_to_concat.append(bonds.from_atom_key + offset)\n      dest_atom_keys_to_concat.append(bonds.dest_atom_key + offset)\n\n  if atom_keys_to_concat:\n    concatted_atom_keys = np.concatenate(atom_keys_to_concat, axis=0)\n  else:\n    concatted_atom_keys = np.array([], dtype=np.int64)\n\n  if types_to_concat:\n    assert (\n        len(types_to_concat)\n        == len(roles_to_concat)\n        == len(from_atom_keys_to_concat)\n        == len(dest_atom_keys_to_concat)\n    )\n    num_bonds = sum(b.size for b in bonds_tables if b is not None)\n    concatted_bonds = Bonds(\n        key=np.arange(num_bonds, dtype=np.int64),\n        type=np.concatenate(types_to_concat, axis=0),\n        
role=np.concatenate(roles_to_concat, axis=0),\n        from_atom_key=np.concatenate(from_atom_keys_to_concat, axis=0),\n        dest_atom_key=np.concatenate(dest_atom_keys_to_concat, axis=0),\n    )\n  else:\n    concatted_bonds = None\n\n  return concatted_bonds, concatted_atom_keys\n"
  },
  {
    "path": "src/alphafold3/structure/chemical_components.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Utilities for manipulating chemical components data.\"\"\"\n\nfrom collections.abc import Iterable, Mapping, Sequence\nimport dataclasses\nimport functools\nfrom typing import Self\n\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.constants import residue_names\nfrom alphafold3.structure import mmcif\nimport rdkit.Chem as rd_chem\n\n\n@dataclasses.dataclass(frozen=True)\nclass ChemCompEntry:\n  \"\"\"Items of _chem_comp category.\n\n  For the full list of items and their semantics see\n  http://mmcif.rcsb.org/dictionaries/mmcif_pdbx_v50.dic/Categories/chem_comp.html\n  \"\"\"\n\n  type: str\n  name: str = '?'\n  pdbx_synonyms: str = '?'\n  formula: str = '?'\n  formula_weight: str = '?'\n  mon_nstd_flag: str = '?'\n  pdbx_smiles: str | None = None\n\n  def __post_init__(self):\n    for field, value in vars(self).items():\n      if not value and value is not None:\n        raise ValueError(f\"{field} value can't be an empty string.\")\n\n  def extends(self, other: Self) -> bool:\n    \"\"\"Checks whether this ChemCompEntry extends another one.\"\"\"\n    for field, value in vars(self).items():\n      other_value = getattr(other, field)\n      if _value_is_missing(other_value):\n        continue\n      if value != other_value:\n        return False\n    return True\n\n  @property\n  def rdkit_mol(self) -> rd_chem.Mol:\n    \"\"\"Returns an RDKit Mol, created via RDKit from entry SMILES 
string.\"\"\"\n    if not self.pdbx_smiles:\n      raise ValueError('Cannot construct RDKit Mol with empty pdbx_smiles')\n    return rd_chem.MolFromSmiles(self.pdbx_smiles)\n\n\n_REQUIRED_MMCIF_COLUMNS = ('_chem_comp.id', '_chem_comp.type')\n\n\nclass MissingChemicalComponentsDataError(Exception):\n  \"\"\"Raised when chemical components data is missing from an mmCIF.\"\"\"\n\n\n@dataclasses.dataclass(frozen=True)\nclass ChemicalComponentsData:\n  \"\"\"Extra information for chemical components occurring in mmCIF.\n\n  Fields:\n    chem_comp: A mapping from _chem_comp.id to associated items in the\n      chem_comp category.\n  \"\"\"\n\n  chem_comp: Mapping[str, ChemCompEntry]\n\n  @classmethod\n  def from_mmcif(\n      cls, cif: mmcif.Mmcif, fix_mse: bool, fix_unknown_dna: bool\n  ) -> Self:\n    \"\"\"Constructs an instance of ChemicalComponentsData from an Mmcif object.\"\"\"\n    for col in _REQUIRED_MMCIF_COLUMNS:\n      if col not in cif:\n        raise MissingChemicalComponentsDataError(col)\n\n    id_ = cif['_chem_comp.id']  # Guaranteed to be present.\n    type_ = cif['_chem_comp.type']  # Guaranteed to be present.\n    name = cif.get('_chem_comp.name', ['?'] * len(id_))\n    synonyms = cif.get('_chem_comp.pdbx_synonyms', ['?'] * len(id_))\n    formula = cif.get('_chem_comp.formula', ['?'] * len(id_))\n    weight = cif.get('_chem_comp.formula_weight', ['?'] * len(id_))\n    mon_nstd_flag = cif.get('_chem_comp.mon_nstd_flag', ['?'] * len(id_))\n    smiles = cif.get('_chem_comp.pdbx_smiles', ['?'] * len(id_))\n    smiles = [None if s == '?' 
else s for s in smiles]\n\n    chem_comp = {\n        component_name: ChemCompEntry(*entry)\n        for component_name, *entry in zip(\n            id_, type_, name, synonyms, formula, weight, mon_nstd_flag, smiles\n        )\n    }\n\n    if fix_mse and 'MSE' in chem_comp:\n      if 'MET' not in chem_comp:\n        chem_comp['MET'] = ChemCompEntry(\n            type='L-PEPTIDE LINKING',\n            name='METHIONINE',\n            pdbx_synonyms='?',\n            formula='C5 H11 N O2 S',\n            formula_weight='149.211',\n            mon_nstd_flag='y',\n            pdbx_smiles=None,\n        )\n\n    if fix_unknown_dna and 'N' in chem_comp:\n      # Do not delete 'N' as it may be needed for RNA in the system.\n      if 'DN' not in chem_comp:\n        chem_comp['DN'] = ChemCompEntry(\n            type='DNA LINKING',\n            name=\"UNKNOWN 2'-DEOXYNUCLEOTIDE\",\n            pdbx_synonyms='?',\n            formula='C5 H11 O6 P',\n            formula_weight='198.111',\n            mon_nstd_flag='y',\n            pdbx_smiles=None,\n        )\n\n    return ChemicalComponentsData(chem_comp)\n\n  def to_mmcif_dict(self) -> Mapping[str, Sequence[str]]:\n    \"\"\"Returns chemical components data as a dict suitable for `mmcif.Mmcif`.\"\"\"\n    mmcif_dict = {}\n\n    mmcif_fields = set()\n    for entry in self.chem_comp.values():\n      for field, value in vars(entry).items():\n        if value:\n          mmcif_fields.add(field)\n    chem_comp_ids = []\n    for component_id in sorted(self.chem_comp):\n      entry = self.chem_comp[component_id]\n      chem_comp_ids.append(component_id)\n      for field in mmcif_fields:\n        mmcif_dict.setdefault(f'_chem_comp.{field}', []).append(\n            getattr(entry, field) or '?'\n        )\n    if chem_comp_ids:\n      mmcif_dict['_chem_comp.id'] = chem_comp_ids\n    return mmcif_dict\n\n\ndef _value_is_missing(value: str) -> bool:\n  return not value or value in ('.', '?')\n\n\ndef get_data_for_ccd_components(\n    
ccd: chemical_components.Ccd,\n    chemical_component_ids: Iterable[str],\n    populate_pdbx_smiles: bool = False,\n) -> ChemicalComponentsData:\n  \"\"\"Returns `ChemicalComponentsData` for chemical components known by PDB.\"\"\"\n  chem_comp = {}\n  for chemical_component_id in chemical_component_ids:\n    chem_data = chemical_components.component_name_to_info(\n        ccd=ccd, res_name=chemical_component_id\n    )\n    if not chem_data:\n      continue\n    chem_comp[chemical_component_id] = ChemCompEntry(\n        type=chem_data.type,\n        name=chem_data.name,\n        pdbx_synonyms=chem_data.pdbx_synonyms,\n        formula=chem_data.formula,\n        formula_weight=chem_data.formula_weight,\n        mon_nstd_flag=chem_data.mon_nstd_flag,\n        pdbx_smiles=(\n            chem_data.pdbx_smiles or None if populate_pdbx_smiles else None\n        ),\n    )\n  return ChemicalComponentsData(chem_comp=chem_comp)\n\n\ndef populate_missing_ccd_data(\n    ccd: chemical_components.Ccd,\n    chemical_components_data: ChemicalComponentsData,\n    chemical_component_ids: Iterable[str] | None = None,\n    populate_pdbx_smiles: bool = False,\n) -> ChemicalComponentsData:\n  \"\"\"Populates missing data for the chemical components from CCD.\n\n  Args:\n    ccd: The chemical components database.\n    chemical_components_data: ChemicalComponentsData to populate missing values\n      for. This function doesn't modify the object, extended version is provided\n      as a return value.\n    chemical_component_ids: chemical components to populate missing values for.\n      If not specified, the function will consider all chemical components which\n      are already present in `chemical_components_data`.\n    populate_pdbx_smiles: whether to populate `pdbx_smiles` field using SMILES\n      descriptors from _pdbx_chem_comp_descriptor CCD table. 
If CCD provides\n      multiple SMILES strings, any of them could be used.\n\n  Returns:\n    New instance of ChemicalComponentsData without missing values for CCD\n    entries.\n  \"\"\"\n  if chemical_component_ids is None:\n    chemical_component_ids = chemical_components_data.chem_comp.keys()\n\n  ccd_data = get_data_for_ccd_components(\n      ccd, chemical_component_ids, populate_pdbx_smiles\n  )\n  chem_comp = dict(chemical_components_data.chem_comp)\n  for component_id, ccd_entry in ccd_data.chem_comp.items():\n    if component_id not in chem_comp:\n      chem_comp[component_id] = ccd_entry\n    else:\n      already_specified_fields = {\n          field: value\n          for field, value in vars(chem_comp[component_id]).items()\n          if not _value_is_missing(value)\n      }\n      chem_comp[component_id] = ChemCompEntry(\n          **{**vars(ccd_entry), **already_specified_fields}\n      )\n  return ChemicalComponentsData(chem_comp=chem_comp)\n\n\ndef get_all_atoms_in_entry(\n    ccd: chemical_components.Ccd, res_name: str\n) -> Mapping[str, Sequence[str]]:\n  \"\"\"Get all possible atoms and bonds for this residue in a standard order.\n\n  Args:\n    ccd: The chemical components dictionary.\n    res_name: Full CCD name.\n\n  Returns:\n    A dictionary table of the atoms and bonds for this residue in this residue\n    type.\n  \"\"\"\n  # The CCD version of 'UNK' is weird. It has a CB and a CG atom. 
We just want\n  # the minimal amino-acid here which is GLY.\n  if res_name == 'UNK':\n    res_name = 'GLY'\n  ccd_data = ccd.get(res_name)\n  if not ccd_data:\n    raise ValueError(f'Unknown residue type {res_name}')\n\n  keys = (\n      '_chem_comp_atom.atom_id',\n      '_chem_comp_atom.type_symbol',\n      '_chem_comp_bond.atom_id_1',\n      '_chem_comp_bond.atom_id_2',\n  )\n\n  # Add terminal hydrogens for protonation of the N-terminal\n  if res_name == 'PRO':\n    res_atoms = {key: [*ccd_data.get(key, [])] for key in keys}\n    res_atoms['_chem_comp_atom.atom_id'].extend(['H2', 'H3'])\n    res_atoms['_chem_comp_atom.type_symbol'].extend(['H', 'H'])\n    res_atoms['_chem_comp_bond.atom_id_1'].extend(['N', 'N'])\n    res_atoms['_chem_comp_bond.atom_id_2'].extend(['H2', 'H3'])\n  elif res_name in residue_names.PROTEIN_TYPES_WITH_UNKNOWN:\n    res_atoms = {key: [*ccd_data.get(key, [])] for key in keys}\n    res_atoms['_chem_comp_atom.atom_id'].append('H3')\n    res_atoms['_chem_comp_atom.type_symbol'].append('H')\n    res_atoms['_chem_comp_bond.atom_id_1'].append('N')\n    res_atoms['_chem_comp_bond.atom_id_2'].append('H3')\n  else:\n    res_atoms = {key: ccd_data.get(key, []) for key in keys}\n\n  return res_atoms\n\n\n@functools.lru_cache(maxsize=128)\ndef get_res_atom_names(ccd: chemical_components.Ccd, res_name: str) -> set[str]:\n  \"\"\"Gets the names of the atoms in a given CCD residue.\"\"\"\n  atoms = get_all_atoms_in_entry(ccd, res_name)['_chem_comp_atom.atom_id']\n  return set(atoms)\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/aggregation.pyi",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nfrom collections.abc import Sequence\n\ndef indices_grouped_by_value(values: Sequence[int]) -> dict[int, list[int]]: ...\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/aggregation_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <cstdint>\n#include <vector>\n\n#include \"absl/container/flat_hash_map.h\"\n#include \"absl/types/span.h\"\n#include \"pybind11/cast.h\"\n#include \"pybind11/numpy.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11_abseil/absl_casters.h\"\n\nnamespace {\n\nnamespace py = pybind11;\n\nabsl::flat_hash_map<int64_t, std::vector<int64_t>> IndicesGroupedByValue(\n    absl::Span<const int64_t> values) {\n  absl::flat_hash_map<int64_t, std::vector<int64_t>> group_indices;\n  for (int64_t i = 0, e = values.size(); i < e; ++i) {\n    group_indices[values[i]].push_back(i);\n  }\n  return group_indices;\n}\n\nconstexpr char kIndicesGroupedByValue[] = R\"(\nReturns a map from value to a list of indices this value occupies.\n\nE.g. indices_grouped_by_value([1, 1, 2, 3, 3, 1, 1]) returns:\n{1: [0, 1, 5, 6], 2: [2], 3: [3, 4]}\n\nArgs:\n  values: a list of values to group.\n)\";\n\n}  // namespace\n\nnamespace alphafold3 {\n\nvoid RegisterModuleAggregation(py::module m) {\n  m.def(\"indices_grouped_by_value\", &IndicesGroupedByValue, py::arg(\"values\"),\n        py::doc(kIndicesGroupedByValue + 1),\n        py::call_guard<py::gil_scoped_release>());\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/aggregation_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_AGGREGATION_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_AGGREGATION_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleAggregation(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_AGGREGATION_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/membership.pyi",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nimport numpy\n\n\ndef isin(\n    array: numpy.ndarray[numpy.int64],\n    test_elements: set[int],\n    invert: bool = ...,\n) -> numpy.ndarray[bool]: ...\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/membership_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <algorithm>\n#include <cstddef>\n#include <cstdint>\n#include <vector>\n\n#include \"absl/container/flat_hash_set.h\"\n#include \"pybind11/cast.h\"\n#include \"pybind11/numpy.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11_abseil/absl_casters.h\"\n\nnamespace {\n\nnamespace py = pybind11;\n\npy::array_t<bool> IsIn(const py::array_t<int64_t, py::array::c_style>& array,\n                       const absl::flat_hash_set<int64_t>& test_elements,\n                       bool invert) {\n  const size_t num_elements = array.size();\n\n  py::array_t<bool> output(num_elements);\n  std::fill(output.mutable_data(), output.mutable_data() + output.size(),\n            invert);\n\n  // Shortcut: The output will be trivially always false if test_elements empty.\n  if (test_elements.empty()) {\n    return output;\n  }\n\n  for (size_t i = 0; i < num_elements; ++i) {\n    if (test_elements.contains(array.data()[i])) {\n      output.mutable_data()[i] = !invert;\n    }\n  }\n  if (array.ndim() > 1) {\n    auto shape =\n        std::vector<ptrdiff_t>(array.shape(), array.shape() + array.ndim());\n    return output.reshape(shape);\n  }\n  return output;\n}\n\nconstexpr char kIsInDoc[] = R\"(\nComputes whether each element is in test_elements.\n\nSame use as np.isin, but much faster. 
If len(array) = n, len(test_elements) = m:\n* This function has complexity O(n).\n* np.isin with kind='sort' has complexity O(m*log(m) + n * log(m)).\n\nArgs:\n  array: Input NumPy array with dtype=np.int64.\n  test_elements: The values against which to test each value of array.\n  invert: If True, the values in the returned array are inverted, as if\n    calculating `element not in test_elements`. Default is False.\n    `isin(a, b, invert=True)` is equivalent to but faster than `~isin(a, b)`.\n\nReturns\n  A boolean array of the same shape as the input array. Each value `val` is:\n  * `val in test_elements` if `invert=False`,\n  * `val not in test_elements` if `invert=True`.\n)\";\n\n}  // namespace\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMembership(pybind11::module m) {\n  m.def(\"isin\", &IsIn, py::arg(\"array\"), py::arg(\"test_elements\"),\n        py::kw_only(), py::arg(\"invert\") = false, py::doc(kIsInDoc + 1));\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/membership_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MEMBERSHIP_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MEMBERSHIP_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMembership(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MEMBERSHIP_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_altlocs.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include \"alphafold3/structure/cpp/mmcif_altlocs.h\"\n\n#include <cstddef>\n#include <cstdint>\n#include <functional>\n#include <iterator>\n#include <limits>\n#include <string>\n#include <utility>\n#include <vector>\n\n#include \"absl/algorithm/container.h\"\n#include \"absl/log/log.h\"\n#include \"absl/strings/numbers.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/types/span.h\"\n#include \"alphafold3/structure/cpp/mmcif_layout.h\"\n\nnamespace alphafold3 {\nnamespace {\n\nfloat OccupancyToFloat(absl::string_view occupancy) {\n  float result = 0.0f;\n  LOG_IF(ERROR, !absl::SimpleAtof(occupancy, &result))\n      << \"Invalid Occupancy: \" << occupancy;\n  return result;\n}\n\n// Deuterium is the same atom as Hydrogen so keep equivalent for grouping.\nbool AtomEquiv(absl::string_view lhs, absl::string_view rhs) {\n  if (lhs == rhs) return true;\n  if (lhs.empty() != rhs.empty()) return false;\n  // Both lhs and rhs are guaranteed to be non-empty after this.\n  char first_lhs = lhs.front();\n  char second_rhs = rhs.front();\n  if ((first_lhs == 'H' && second_rhs == 'D') ||\n      (first_lhs == 'D' && second_rhs == 'H')) {\n    lhs.remove_prefix(1);\n    rhs.remove_prefix(1);\n    return lhs == rhs;\n  }\n  return false;\n}\n\n// Calls group_callback with that start index and count for each group of\n// equivalent values in `values`, starting at `start` and ending at `count`.\n// Example:\n// 
GroupBy({\"B\", \"B\", \"B\", \"C\", \"C\"}, 0, 5, [](size_t start, size_t count) {\n//   absl::Printf(\"start=%d, count=%d\\n\", start, count);\n// });\n// Would print:\n// start=0, count=3\n// start=3, count=2\ntemplate <typename GroupCallback,\n          typename IsEqual = std::equal_to<absl::string_view>>\nvoid GroupBy(absl::Span<const std::string> values, std::size_t start,\n             std::size_t count, GroupCallback&& group_callback,\n             IsEqual&& is_equal = std::equal_to<absl::string_view>{}) {\n  std::size_t span_start = start;\n  if (count > 0) {\n    for (std::size_t i = start + 1; i < start + count; ++i) {\n      if (!is_equal(values[i], values[span_start])) {\n        group_callback(span_start, i - span_start);\n        span_start = i;\n      }\n    }\n    group_callback(span_start, start + count - span_start);\n  }\n}\n\nvoid ProcessAltLocGroupsWhole(std::size_t alt_loc_start,\n                              std::size_t alt_loc_count,\n                              absl::Span<const std::string> comp_ids,\n                              absl::Span<const std::string> atom_ids,\n                              absl::Span<const std::string> alt_ids,\n                              absl::Span<const std::string> occupancies,\n                              std::vector<std::uint64_t>& in_out_keep_indices) {\n  std::pair<std::size_t, std::size_t> best_split = {alt_loc_start,\n                                                    alt_loc_count};\n  std::vector<char> alt_loc_groups;\n  float best_occupancy = -std::numeric_limits<float>::infinity();\n  char best_group = alt_ids[alt_loc_start].front();\n  std::vector<std::pair<std::size_t, float>> occupancy_stats;\n\n  // Group by residue type.\n  GroupBy(comp_ids, alt_loc_start, alt_loc_count,\n          [&](std::size_t start, std::size_t count) {\n            // This callback selects the best residue group and the best\n            // Alt-loc char within that group.\n            alt_loc_groups.clear();\n    
        occupancy_stats.clear();\n            // Calculate total occupancy for residue type.\n            for (std::size_t i = 0; i < count; ++i) {\n              char alt_loc_id = alt_ids[start + i].front();\n              float occupancy = OccupancyToFloat(occupancies[start + i]);\n              if (auto loc = absl::c_find(alt_loc_groups, alt_loc_id);\n                  loc == alt_loc_groups.end()) {\n                occupancy_stats.emplace_back(1, occupancy);\n                alt_loc_groups.push_back(alt_loc_id);\n              } else {\n                auto& stat =\n                    occupancy_stats[std::distance(alt_loc_groups.begin(), loc)];\n                ++stat.first;\n                stat.second += occupancy;\n              }\n            }\n            float total_occupancy = 0.0;\n            for (auto& stat : occupancy_stats) {\n              total_occupancy += stat.second / stat.first;\n            }\n            char group = *absl::c_min_element(alt_loc_groups);\n            // Compares occupancy of residue to best seen so far.\n            // Tie breaks alphabetic.\n            if (total_occupancy > best_occupancy ||\n                (total_occupancy == best_occupancy && group < best_group)) {\n              // Selects the best sub group.\n              best_group = alt_loc_groups.front();\n              float best_amount = occupancy_stats.front().second /\n                                  occupancy_stats.front().first;\n              for (std::size_t i = 1; i < occupancy_stats.size(); ++i) {\n                float amount =\n                    occupancy_stats[i].second / occupancy_stats[i].first;\n                char group = alt_loc_groups[i];\n                if (amount > best_amount ||\n                    (amount == best_amount && group < best_group)) {\n                  best_amount = amount;\n                  best_group = group;\n                }\n              }\n              best_occupancy = total_occupancy;\n              best_split 
= {start, count};\n            }\n          });\n\n  // Now that the best residue type and the best alt-loc within it have been\n  // selected, add the indices of the atoms to keep to the keep list.\n  auto [split_start, split_count] = best_split;\n  GroupBy(\n      atom_ids, split_start, split_count,\n      [&in_out_keep_indices, &alt_ids, best_group](std::size_t start,\n                                                   std::size_t count) {\n        // This makes sure we select an atom for each atom id even if it does\n        // not have our selected alt-loc char.\n        std::size_t best_index = start;\n        for (std::size_t i = 1; i < count; ++i) {\n          if (alt_ids[start + i].front() == best_group) {\n            best_index = start + i;\n            break;\n          }\n        }\n        in_out_keep_indices.push_back(best_index);\n      },\n      AtomEquiv);\n}\n\n// Finds the alt-loc group with the highest score and pushes the indices on to\n// the back of in_out_keep_indices.\nvoid ProcessAltLocGroupPartial(\n    std::size_t alt_loc_start, std::size_t alt_loc_count,\n    absl::Span<const std::string> atom_ids,\n    absl::Span<const std::string> alt_ids,\n    absl::Span<const std::string> occupancies,\n    std::vector<std::uint64_t>& in_out_keep_indices) {\n  GroupBy(\n      atom_ids, alt_loc_start, alt_loc_count,\n      [&](std::size_t start, std::size_t count) {\n        if (count == 1) {\n          in_out_keep_indices.push_back(start);\n        } else {\n          float best_occ = OccupancyToFloat(occupancies[start]);\n          std::size_t best_index = start;\n          char best_group = alt_ids[start].front();\n          for (std::size_t i = 0; i < count; ++i) {\n            float occ = OccupancyToFloat(occupancies[start + i]);\n            char group = alt_ids[start + i].front();\n            if (occ > best_occ || (occ == best_occ && group < best_group)) {\n              best_group = group;\n              best_index = start 
+ i;\n              best_occ = occ;\n            }\n          }\n          in_out_keep_indices.push_back(best_index);\n        }\n      },\n      AtomEquiv);\n}\n\n}  // namespace\n\n// Resolves alt-locs returning the atom indices that will be left.\nstd::vector<std::uint64_t> ResolveMmcifAltLocs(\n    const MmcifLayout& layout, absl::Span<const std::string> comp_ids,\n    absl::Span<const std::string> atom_ids,\n    absl::Span<const std::string> alt_ids,\n    absl::Span<const std::string> occupancies,\n    absl::Span<const std::size_t> chain_indices) {\n  std::vector<std::uint64_t> keep_indices;\n  keep_indices.reserve(layout.num_atoms());\n  std::size_t alt_loc_start = 0;\n  for (std::size_t chain_index : chain_indices) {\n    auto [residues_start, residues_end] = layout.residue_range(chain_index);\n    for (std::size_t residue = residues_start; residue < residues_end;\n         ++residue) {\n      std::size_t alt_loc_count = 0;\n      auto [atom_start, atom_end] = layout.atom_range(residue);\n      for (std::size_t i = atom_start; i < atom_end; ++i) {\n        char alt_loc_id = alt_ids[i].front();\n        if (alt_loc_id == '.' 
|| alt_loc_id == '?') {\n          if (alt_loc_count > 0) {\n            ProcessAltLocGroupPartial(alt_loc_start, alt_loc_count, atom_ids,\n                                      alt_ids, occupancies, keep_indices);\n            alt_loc_count = 0;\n          }\n          keep_indices.push_back(i);\n        } else {\n          if (alt_loc_count == 0) {\n            alt_loc_start = i;\n          }\n          ++alt_loc_count;\n        }\n      }\n      if (alt_loc_count > 0) {\n        if (atom_end - atom_start == alt_loc_count) {\n          ProcessAltLocGroupsWhole(alt_loc_start, alt_loc_count, comp_ids,\n                                   atom_ids, alt_ids, occupancies,\n                                   keep_indices);\n        } else {\n          ProcessAltLocGroupPartial(alt_loc_start, alt_loc_count, atom_ids,\n                                    alt_ids, occupancies, keep_indices);\n        }\n      }\n    }\n  }\n\n  return keep_indices;\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_altlocs.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_ALTLOCS_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_ALTLOCS_H_\n\n#include <cstddef>\n#include <cstdint>\n#include <string>\n#include <vector>\n\n#include \"absl/types/span.h\"\n#include \"alphafold3/structure/cpp/mmcif_layout.h\"\n\nnamespace alphafold3 {\n\n// Returns the list of indices that should be kept after resolving alt-locs.\n// 1) Partial Residue. Each cycle of alt-locs are resolved separately with the\n//    highest occupancy alt-loc. Tie-breaks are resolved alphabetically. See\n//    tests for examples.\n// 2) Whole Residue. These are resolved in two passes.\n//    a) The residue with the highest occupancy is chosen.\n//    b) The locations for a given residue are resolved.\n//    All tie-breaks are resolved alphabetically. 
See tests for examples.\n//\n// Preconditions: layout, comp_ids, atom_ids, alt_ids and occupancies are all\n// from the same mmCIF file, and chain_indices are monotonically increasing and\n// less than layout.num_chains().\n//\n// comp_ids from '_atom_site.label_comp_id'.\n// alt_ids from '_atom_site.label_alt_id'.\n// occupancies from '_atom_site.occupancy'.\nstd::vector<std::uint64_t> ResolveMmcifAltLocs(\n    const MmcifLayout& layout, absl::Span<const std::string> comp_ids,\n    absl::Span<const std::string> atom_ids,\n    absl::Span<const std::string> alt_ids,\n    absl::Span<const std::string> occupancies,\n    absl::Span<const std::size_t> chain_indices);\n\n}  // namespace alphafold3\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_ALTLOCS_H_\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_atom_site.pyi",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nfrom collections.abc import Callable\nfrom alphafold3.cpp import cif_dict\n\n\ndef get_internal_to_author_chain_id_map(\n    mmcif: cif_dict.CifDict\n) -> dict[str,str]: ...\n\n\ndef get_or_infer_type_symbol(\n    mmcif: cif_dict.CifDict,\n    atom_id_to_type_symbol: Callable[[str, str], str],\n) -> list[str]: ...\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_atom_site_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <cstddef>\n\n#include \"absl/container/flat_hash_map.h\"\n#include \"absl/log/check.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/types/span.h\"\n#include \"alphafold3/parsers/cpp/cif_dict_lib.h\"\n#include \"pybind11/gil.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11/pytypes.h\"\n#include \"pybind11/stl.h\"\n#include \"pybind11_abseil/absl_casters.h\"\n\nnamespace alphafold3 {\nnamespace {\nnamespace py = pybind11;\n\n// If present, returns the _atom_site.type_symbol. 
If not, infers it using\n// _atom_site.label_comp_id (residue name), _atom_site.label_atom_id (atom name)\n// and the CCD.\npy::list GetOrInferTypeSymbol(const CifDict& mmcif,\n                              const py::object& atom_id_to_type_symbol) {\n  const auto& type_symbol = mmcif[\"_atom_site.type_symbol\"];\n  const int num_atom = mmcif[\"_atom_site.id\"].size();\n  py::list patched_type_symbol(num_atom);\n  if (type_symbol.empty()) {\n    const auto& label_comp_id = mmcif[\"_atom_site.label_comp_id\"];\n    const auto& label_atom_id = mmcif[\"_atom_site.label_atom_id\"];\n    CHECK_EQ(label_comp_id.size(), num_atom);\n    CHECK_EQ(label_atom_id.size(), num_atom);\n    for (int i = 0; i < num_atom; i++) {\n      patched_type_symbol[i] =\n          atom_id_to_type_symbol(label_comp_id[i], label_atom_id[i]);\n    }\n  } else {\n    for (int i = 0; i < num_atom; i++) {\n      patched_type_symbol[i] = type_symbol[i];\n    }\n  }\n  return patched_type_symbol;\n}\n\nabsl::flat_hash_map<absl::string_view, absl::string_view>\nGetInternalToAuthorChainIdMap(const CifDict& mmcif) {\n  const auto& label_asym_ids = mmcif[\"_atom_site.label_asym_id\"];\n  const auto& auth_asym_ids = mmcif[\"_atom_site.auth_asym_id\"];\n  CHECK_EQ(label_asym_ids.size(), auth_asym_ids.size());\n\n  absl::flat_hash_map<absl::string_view, absl::string_view> mapping;\n  for (size_t i = 0, num_rows = label_asym_ids.size(); i < num_rows; ++i) {\n    // Use only the first internal_chain_id occurrence to generate the mapping.\n    // It should not matter as there should not be a case where a single\n    // internal chain ID would map to more than one author chain IDs (i.e. the\n    // mapping should be injective). 
Since we need this method to be fast, we\n    // choose not to check it.\n    mapping.emplace(label_asym_ids[i], auth_asym_ids[i]);\n  }\n  return mapping;\n}\n\n}  // namespace\n\nnamespace py = pybind11;\n\nvoid RegisterModuleMmcifAtomSite(pybind11::module m) {\n  m.def(\"get_or_infer_type_symbol\", &GetOrInferTypeSymbol, py::arg(\"mmcif\"),\n        py::arg(\"atom_id_to_type_symbol\"));\n\n  m.def(\"get_internal_to_author_chain_id_map\", &GetInternalToAuthorChainIdMap,\n        py::arg(\"mmcif\"), py::call_guard<py::gil_scoped_release>());\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_atom_site_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_ATOM_SITE_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_ATOM_SITE_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMmcifAtomSite(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_ATOM_SITE_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_layout.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_LAYOUT_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_LAYOUT_H_\n\n#include <cstddef>\n#include <cstdint>\n#include <string>\n#include <utility>\n#include <vector>\n\n#include \"absl/status/statusor.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/types/span.h\"\n#include \"alphafold3/parsers/cpp/cif_dict_lib.h\"\n\nnamespace alphafold3 {\n\n// Holds the layout of a parsed mmCIF file.\nclass MmcifLayout {\n public:\n  MmcifLayout(std::vector<std::size_t> chain_ends,\n              std::vector<std::size_t> residues, std::size_t model_offset,\n              std::size_t num_models)\n      : chain_ends_(std::move(chain_ends)),\n        residue_ends_(std::move(residues)),\n        model_offset_(model_offset),\n        num_models_(num_models) {}\n\n  // Reads a layout from a valid parsed mmCIF. If a valid model_id is provided\n  // the offsets will select that model from the mmCIF.\n  // If no model_id is specified, we calculate the layout of the first model\n  // only. Therefore it is a requirement that each model has identical atom\n  // layouts. 
An error is returned if the atom counts differ between models.\n  static absl::StatusOr<MmcifLayout> Create(const CifDict& mmcif,\n                                            absl::string_view model_id = \"\");\n\n  std::string ToDebugString() const;\n\n  // Returns the start index and one past the last residue index of a given\n  // chain. A chain_index of n refers to the n-th chain in the mmCIF. The\n  // returned residue indices are 0-based enumerations of residues in the\n  // _atom_site records, and therefore do not include missing residues.\n  std::pair<std::size_t, std::size_t> residue_range(\n      std::size_t chain_index) const {\n    if (chain_index > 0) {\n      return {chain_ends_[chain_index - 1], chain_ends_[chain_index]};\n    } else {\n      return {0, chain_ends_[0]};\n    }\n  }\n\n  // Returns the start index and one past the last index of a given residue.\n  // A residue_index of n refers to the n-th residue in the mmCIF, not\n  // including residues that are unresolved (i.e. only using _atom_site).\n  std::pair<std::size_t, std::size_t> atom_range(\n      std::size_t residue_index) const {\n    if (residue_index > 0) {\n      return {residue_ends_[residue_index - 1], residue_ends_[residue_index]};\n    } else {\n      return {model_offset_, residue_ends_[residue_index]};\n    }\n  }\n\n  // If model_id was provided during construction then this is 1, otherwise\n  // it is the number of models present in the mmCIF.\n  std::size_t num_models() const { return num_models_; }\n  // The number of atoms in the chosen model.\n  std::size_t num_atoms() const {\n    return residue_ends_.empty() ? 
0 : residue_ends_.back() - model_offset_;\n  }\n  // The number of chains in the chosen model.\n  std::size_t num_chains() const { return chain_ends_.size(); }\n  // The number of residues in the chosen model, not counting unresolved\n  // residues.\n  std::size_t num_residues() const { return residue_ends_.size(); }\n\n  // Returns the first atom index that is part of the specified chain.\n  // The chain is specified using chain_index, which is a 0-based\n  // enumeration of the chains in the _atom_site table.\n  std::size_t atom_site_from_chain_index(std::size_t chain_index) const {\n    if (chain_index == 0) {\n      return model_offset_;\n    }\n    return atom_site_from_residue_index(chain_ends_[chain_index - 1]);\n  }\n\n  // Returns the first atom index that is part of the specified residue.\n  // The residue is specified using residue_index, which is a 0-based\n  // enumeration of the residues in the _atom_site table.\n  std::size_t atom_site_from_residue_index(std::size_t residues_index) const {\n    if (residues_index == 0) {\n      return model_offset_;\n    }\n    return residue_ends_[residues_index - 1];\n  }\n\n  // One past last residue index of each chain. The residue index does not\n  // include unresolved residues and is a simple 0-based enumeration of the\n  // residues in _atom_site table.\n  const std::vector<std::size_t>& chains() const { return chain_ends_; }\n\n  // Indices of the first atom of each chain. 
Note that this returns atom\n  // indices (like residue_starts()), not residue indices (like chains()).\n  std::vector<std::size_t> chain_starts() const;\n\n  // One past last atom index of each residue.\n  const std::vector<std::size_t>& residues() const { return residue_ends_; }\n\n  // Indices of the first atom of each residue.\n  std::vector<std::size_t> residue_starts() const {\n    std::vector<std::size_t> residue_starts;\n    if (!residue_ends_.empty()) {\n      residue_starts.reserve(residue_ends_.size());\n      residue_starts.push_back(model_offset_);\n      residue_starts.insert(residue_starts.end(), residue_ends_.begin(),\n                            residue_ends_.end() - 1);\n    }\n    return residue_starts;\n  }\n\n  // The first atom index that is part of the specified model.\n  std::size_t model_offset() const { return model_offset_; }\n\n  void Filter(absl::Span<const std::uint64_t> keep_indices);\n\n private:\n  std::vector<std::size_t> chain_ends_;\n  std::vector<std::size_t> residue_ends_;\n  std::size_t model_offset_;\n  std::size_t num_models_;\n};\n\n}  // namespace alphafold3\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_LAYOUT_H_\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_layout.pyi",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nfrom alphafold3.cpp import cif_dict\n\nclass MmcifLayout:\n  def atom_range(self, residue_index: int) -> tuple[int, int]: ...\n  def chain_starts(self) -> list[int]: ...\n  def chains(self) -> list[int]: ...\n  def model_offset(self) -> int: ...\n  def num_atoms(self) -> int: ...\n  def num_chains(self) -> int: ...\n  def num_models(self) -> int: ...\n  def num_residues(self) -> int: ...\n  def residue_range(self, chain_index: int) -> tuple[int, int]: ...\n  def residue_starts(self) -> list[int]: ...\n  def residues(self) -> list[int]: ...\n\ndef from_mmcif(mmcif: cif_dict.CifDict, model_id: str = ...) -> MmcifLayout: ...\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_layout_lib.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <algorithm>\n#include <cstddef>\n#include <cstdint>\n#include <functional>\n#include <iterator>\n#include <string>\n#include <utility>\n#include <vector>\n\n#include \"absl/algorithm/container.h\"\n#include \"absl/status/status.h\"\n#include \"absl/status/statusor.h\"\n#include \"absl/strings/str_cat.h\"\n#include \"absl/strings/str_format.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/types/span.h\"\n#include \"alphafold3/parsers/cpp/cif_dict_lib.h\"\n#include \"alphafold3/structure/cpp/mmcif_layout.h\"\n\nnamespace alphafold3 {\n\nstd::string MmcifLayout::ToDebugString() const {\n  return absl::StrFormat(\n      \"MmcifLayout(models=%d, chains=%d, num_residues=%d, atoms=%d)\",\n      num_models(), num_chains(), num_residues(), num_atoms());\n}\n\n// Changes layout to match keep_indices removing empty chains/residues.\nvoid MmcifLayout::Filter(absl::Span<const std::uint64_t> keep_indices) {\n  if (num_chains() == 0) {\n    return;\n  }\n  // Update residue indices.\n  auto keep_it = absl::c_lower_bound(keep_indices, residue_ends_.front());\n  for (auto& residue : residue_ends_) {\n    while (keep_it != keep_indices.end() && *keep_it < residue) {\n      ++keep_it;\n    }\n    residue = std::distance(keep_indices.begin(), keep_it);\n  }\n  // Unique residue_ends_ with updating chains.\n  auto first = residue_ends_.begin();\n  auto tail = first;\n  std::size_t num_skipped = 0;\n  std::size_t 
current = 0;\n  for (std::size_t& chain_end : chain_ends_) {\n    for (auto e = residue_ends_.begin() + chain_end; first != e; ++first) {\n      std::size_t next = *first;\n      *tail = next;\n      if (current != next) {\n        current = next;\n        ++tail;\n      } else {\n        ++num_skipped;\n      }\n    }\n    chain_end -= num_skipped;\n  }\n  residue_ends_.erase(tail, residue_ends_.end());\n\n  current = 0;\n  chain_ends_.erase(std::remove_if(chain_ends_.begin(), chain_ends_.end(),\n                                   [&current](std::size_t next) {\n                                     bool result = current == next;\n                                     current = next;\n                                     return result;\n                                   }),\n                    chain_ends_.end());\n  model_offset_ = 0;\n}\n\nabsl::StatusOr<MmcifLayout> MmcifLayout::Create(const CifDict& mmcif,\n                                                absl::string_view model_id) {\n  auto model_ids = mmcif[\"_atom_site.pdbx_PDB_model_num\"];\n  auto chain_ids = mmcif[\"_atom_site.label_asym_id\"];     // chain ID.\n  auto label_seq_ids = mmcif[\"_atom_site.label_seq_id\"];  // residue ID.\n  auto auth_seq_ids = mmcif[\"_atom_site.auth_seq_id\"];    // author residue ID.\n  auto insertion_codes = mmcif[\"_atom_site.pdbx_PDB_ins_code\"];\n\n  if (model_ids.size() != chain_ids.size() ||\n      model_ids.size() != label_seq_ids.size() ||\n      (model_ids.size() != auth_seq_ids.size() && !auth_seq_ids.empty()) ||\n      (model_ids.size() != insertion_codes.size() &&\n       !insertion_codes.empty())) {\n    return absl::InvalidArgumentError(absl::StrCat(\n        \"Invalid _atom_site table.\",  //\n        \" len(_atom_site.pdbx_PDB_model_num): \", model_ids.size(),\n        \" len(_atom_site.label_asym_id): \", chain_ids.size(),\n        \" len(_atom_site.label_seq_id): \", label_seq_ids.size(),\n        \" len(_atom_site.auth_seq_id): \", 
auth_seq_ids.size(),\n        \" len(_atom_site.pdbx_PDB_ins_code): \", insertion_codes.size()));\n  }\n  std::size_t num_atoms = model_ids.size();\n  if (num_atoms == 0) {\n    return MmcifLayout({}, {}, 0, 0);\n  }\n  std::size_t model_offset = 0;\n  std::size_t num_models;\n  std::size_t num_atoms_per_model;\n  if (model_id.empty()) {\n    absl::string_view first_model_id = model_ids.front();\n\n    // Binary search for where the first model ends.\n    num_atoms_per_model = std::distance(\n        model_ids.begin(),\n        absl::c_upper_bound(model_ids, first_model_id, std::not_equal_to<>{}));\n    if (num_atoms % num_atoms_per_model != 0) {\n      return absl::InvalidArgumentError(absl::StrCat(\n          \"Each model must have the same number of atoms: (\", num_atoms, \" % \",\n          num_atoms_per_model, \" == \", num_atoms % num_atoms_per_model, \").\"));\n    }\n    num_models = num_atoms / num_atoms_per_model;\n    // Test boundary conditions for each model hold.\n    for (std::size_t i = 1; i < num_models; ++i) {\n      if ((model_ids[i * num_atoms_per_model] !=\n           model_ids[(i + 1) * num_atoms_per_model - 1]) ||\n          (model_ids[i * num_atoms_per_model - 1] ==\n           model_ids[i * num_atoms_per_model])) {\n        return absl::InvalidArgumentError(\n            absl::StrCat(\"Each model must have the same number of atoms: (\",\n                         num_atoms, \" % \", num_atoms_per_model,\n                         \" == \", num_atoms % num_atoms_per_model, \").\"));\n      }\n    }\n  } else {\n    num_models = 1;\n    model_offset =\n        std::distance(model_ids.begin(), absl::c_find(model_ids, model_id));\n    if (model_offset == model_ids.size()) {\n      return absl::InvalidArgumentError(\n          absl::StrCat(\"Unknown model_id: \", model_id));\n    }\n    model_ids.remove_prefix(model_offset);\n    chain_ids.remove_prefix(model_offset);\n    label_seq_ids.remove_prefix(model_offset);\n    if (!auth_seq_ids.empty()) 
auth_seq_ids.remove_prefix(model_offset);\n    if (!insertion_codes.empty()) insertion_codes.remove_prefix(model_offset);\n\n    num_atoms_per_model = std::distance(\n        model_ids.begin(), std::upper_bound(model_ids.begin(), model_ids.end(),\n                                            model_id, std::not_equal_to<>{}));\n    num_atoms = num_atoms_per_model;\n  }\n  std::vector<std::size_t> residues;\n  std::vector<std::size_t> chains;\n  absl::string_view chain_id = chain_ids.front();\n  if (!auth_seq_ids.empty() && !insertion_codes.empty()) {\n    // If author residue IDs are present then these are preferred to\n    // label residue IDs because they work for multi-residue ligands (which\n    // are given constant \".\" label residue IDs).\n    // NB: Author residue IDs require both the auth_seq_id and the insertion\n    // code to be unique.\n    absl::string_view auth_seq_id = auth_seq_ids.front();\n    absl::string_view insertion_code = insertion_codes.front();\n    for (std::size_t i = 1; i < num_atoms_per_model; ++i) {\n      if (absl::string_view current_chain_id = chain_ids[i];\n          current_chain_id != chain_id) {\n        residues.push_back(i + model_offset);\n        chains.push_back(residues.size());\n        chain_id = current_chain_id;\n        auth_seq_id = auth_seq_ids[i];\n        insertion_code = insertion_codes[i];\n      } else if (absl::string_view current_seq_id = auth_seq_ids[i],\n                 current_insertion_code = insertion_codes[i];\n                 insertion_code != current_insertion_code ||\n                 auth_seq_id != current_seq_id) {\n        residues.push_back(i + model_offset);\n        auth_seq_id = current_seq_id;\n        insertion_code = current_insertion_code;\n      }\n    }\n  } else {\n    absl::string_view label_seq_id = label_seq_ids.front();\n    for (std::size_t i = 1; i < num_atoms_per_model; ++i) {\n      if (absl::string_view current_chain_id = chain_ids[i];\n          current_chain_id != chain_id) 
{\n        residues.push_back(i + model_offset);\n        chains.push_back(residues.size());\n        chain_id = current_chain_id;\n        label_seq_id = label_seq_ids[i];\n      } else if (absl::string_view current_seq_id = label_seq_ids[i];\n                 label_seq_id != current_seq_id) {\n        residues.push_back(i + model_offset);\n        label_seq_id = current_seq_id;\n      }\n    }\n  }\n  residues.push_back(num_atoms_per_model + model_offset);\n  chains.push_back(residues.size());\n  return MmcifLayout(std::move(chains), std::move(residues), model_offset,\n                     num_models);\n}\n\nstd::vector<std::size_t> MmcifLayout::chain_starts() const {\n  std::vector<std::size_t> chain_starts;\n  chain_starts.reserve(chain_ends_.size());\n  for (std::size_t index = 0; index < chain_ends_.size(); ++index) {\n    chain_starts.push_back(atom_site_from_chain_index(index));\n  }\n  return chain_starts;\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_layout_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include \"alphafold3/structure/cpp/mmcif_layout.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11/pytypes.h\"\n#include \"pybind11/stl.h\"\n\nnamespace alphafold3 {\n\nnamespace py = pybind11;\n\nvoid RegisterModuleMmcifLayout(pybind11::module m) {\n  py::class_<MmcifLayout>(m, \"MmcifLayout\")\n      .def(\"__str__\", &MmcifLayout::ToDebugString)\n      .def(\"num_models\", &MmcifLayout::num_models)\n      .def(\"num_chains\", &MmcifLayout::num_chains)\n      .def(\"num_residues\", &MmcifLayout::num_residues)\n      .def(\"num_atoms\", &MmcifLayout::num_atoms)\n      .def(\"residue_range\", &MmcifLayout::residue_range, py::arg(\"chain_index\"))\n      .def(\"atom_range\", &MmcifLayout::atom_range, py::arg(\"residue_index\"))\n      .def(\"chains\", &MmcifLayout::chains,\n           py::doc(\"Returns a list of indices one past the last residue of \"\n                   \"each chain.\"))\n      .def(\n          \"chain_starts\", &MmcifLayout::chain_starts,\n          py::doc(\"Returns a list of indices of the first atom of each chain.\"))\n      .def(\"residues\", &MmcifLayout::residues,\n           py::doc(\"Returns a list of indices one past the last atom of each \"\n                   \"residue.\"))\n      .def(\"residue_starts\", &MmcifLayout::residue_starts,\n           py::doc(\n               \"Returns a list of indices of the first atom of each residue.\"))\n      .def(\"model_offset\", 
&MmcifLayout::model_offset,\n           py::doc(\"Returns the first atom index that is part of the specified \"\n                   \"model.\"));\n\n  m.def(\"from_mmcif\", &MmcifLayout::Create, py::arg(\"mmcif\"),\n        py::arg(\"model_id\") = \"\");\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_layout_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_LAYOUT_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_LAYOUT_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMmcifLayout(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_LAYOUT_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_struct_conn.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_STRUCT_CONN_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_STRUCT_CONN_H_\n\n#include <utility>\n#include <vector>\n\n#include \"absl/status/statusor.h\"\n#include \"absl/strings/string_view.h\"\n#include \"alphafold3/parsers/cpp/cif_dict_lib.h\"\n\nnamespace alphafold3 {\n\n// Returns a pair of atom indices for each row in the bonds table (aka\n// _struct_conn). The indices are simple 0-based indexes into the columns of\n// the _atom_site table in the input mmCIF, and do not necessarily correspond\n// to the values in _atom_site.id, or any other column.\nabsl::StatusOr<std::pair<std::vector<std::size_t>, std::vector<std::size_t>>>\nGetBondAtomIndices(const CifDict& mmcif, absl::string_view model_id);\n\n}  // namespace alphafold3\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_STRUCT_CONN_H_\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_struct_conn.pyi",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nfrom alphafold3.cpp import cif_dict\n\ndef get_bond_atom_indices(mmcif_dict: cif_dict.CifDict, model_id: str) -> tuple[list[int],list[int]]: ...\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_struct_conn_lib.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <cstddef>\n#include <iterator>\n#include <optional>\n#include <string>\n#include <utility>\n#include <vector>\n\n#include \"absl/algorithm/container.h\"\n#include \"absl/container/flat_hash_map.h\"\n#include \"absl/container/flat_hash_set.h\"\n#include \"absl/status/status.h\"\n#include \"absl/status/statusor.h\"\n#include \"absl/strings/str_cat.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/types/span.h\"\n#include \"alphafold3/parsers/cpp/cif_dict_lib.h\"\n#include \"alphafold3/structure/cpp/mmcif_struct_conn.h\"\n\nnamespace alphafold3 {\n\nnamespace {\n\nstruct AtomId {\n  absl::string_view chain_id;\n  absl::string_view res_id_1;\n  absl::string_view res_id_2;\n  absl::string_view atom_name;\n  absl::string_view alt_id;\n\n  friend bool operator==(const AtomId&, const AtomId&) = default;\n  template <typename H>\n  friend H AbslHashValue(H h, const AtomId& m) {\n    return H::combine(std::move(h), m.chain_id, m.res_id_1, m.res_id_2,\n                      m.atom_name, m.alt_id);\n  }\n};\n\nusing StringArrayRef = absl::Span<const std::string>;\nusing BondIndexByAtom = absl::flat_hash_map<AtomId, std::vector<std::size_t>>;\nusing BondAtomIndices = std::vector<std::size_t>;\n\n// Returns whether each container is the same size.\ntemplate <typename C, typename... Cs>\nbool AreSameSize(const C& c, const Cs&... 
cs) {\n  return ((c.size() == cs.size()) && ...);\n}\n\nstruct ColumnSpec {\n  absl::string_view chain_id_col;\n  absl::string_view res_id_1_col;\n  absl::string_view res_id_2_col;\n  absl::string_view atom_name_col;\n  std::optional<absl::string_view> alt_id_col;  // Not used by OpenMM.\n};\n\nclass AtomColumns {\n public:\n  static absl::StatusOr<AtomColumns> Create(const CifDict& mmcif,\n                                            const ColumnSpec& column_spec) {\n    StringArrayRef chain_id = mmcif[column_spec.chain_id_col];\n    StringArrayRef res_id_1 = mmcif[column_spec.res_id_1_col];\n    StringArrayRef res_id_2 = mmcif[column_spec.res_id_2_col];\n    StringArrayRef atom_name = mmcif[column_spec.atom_name_col];\n    if (!AreSameSize(chain_id, res_id_1, res_id_2, atom_name)) {\n      return absl::InvalidArgumentError(absl::StrCat(\n          \"Atom columns are not the same size. \",                       //\n          \"len(\", column_spec.chain_id_col, \")=\", chain_id.size(),      //\n          \", len(\", column_spec.res_id_1_col, \")=\", res_id_1.size(),    //\n          \", len(\", column_spec.res_id_2_col, \")=\", res_id_2.size(),    //\n          \", len(\", column_spec.atom_name_col, \")=\", atom_name.size(),  //\n          \".\"));\n    }\n    if (column_spec.alt_id_col.has_value()) {\n      StringArrayRef alt_id = mmcif[*column_spec.alt_id_col];\n      if (!AreSameSize(alt_id, chain_id)) {\n        return absl::InvalidArgumentError(absl::StrCat(\n            \"Atom columns are not the same size. 
\",                   //\n            \"len(\", column_spec.chain_id_col, \")=\", chain_id.size(),  //\n            \", len(\", *column_spec.alt_id_col, \")=\", alt_id.size(),   //\n            \".\"));\n      }\n      return AtomColumns(chain_id, res_id_1, res_id_2, atom_name, alt_id,\n                         column_spec);\n    } else {\n      return AtomColumns(chain_id, res_id_1, res_id_2, atom_name, std::nullopt,\n                         column_spec);\n    }\n  }\n\n  inline std::size_t size() const { return size_; }\n\n  absl::string_view GetNormalizedAltId(const std::size_t index) const {\n    constexpr absl::string_view kFullStop = \".\";\n    if (alt_id_.has_value()) {\n      absl::string_view alt_id = (*alt_id_)[index];\n      return alt_id == \"?\" ? kFullStop : alt_id;\n    } else {\n      return kFullStop;\n    }\n  }\n\n  AtomId GetAtom(const std::size_t index) const {\n    return {.chain_id = chain_id_[index],\n            .res_id_1 = res_id_1_[index],\n            .res_id_2 = res_id_2_[index],\n            .atom_name = atom_name_[index],\n            .alt_id = GetNormalizedAltId(index)};\n  }\n\n  std::string GetAtomString(const std::size_t index) const {\n    std::string alt_id_col;\n    if (column_spec_.alt_id_col.has_value()) {\n      alt_id_col = *column_spec_.alt_id_col;\n    } else {\n      alt_id_col = \"default label_alt_id\";\n    }\n    return absl::StrCat(\n        column_spec_.chain_id_col, \"=\", chain_id_[index], \", \",    //\n        column_spec_.res_id_1_col, \"=\", res_id_1_[index], \", \",    //\n        column_spec_.res_id_2_col, \"=\", res_id_2_[index], \", \",    //\n        column_spec_.atom_name_col, \"=\", atom_name_[index], \", \",  //\n        alt_id_col, \"=\", GetNormalizedAltId(index));               //\n  }\n\n private:\n  AtomColumns(StringArrayRef chain_id, StringArrayRef res_id_1,\n              StringArrayRef res_id_2, StringArrayRef atom_name,\n              std::optional<StringArrayRef> alt_id,\n              
const ColumnSpec& column_spec)\n      : chain_id_(chain_id),\n        res_id_1_(res_id_1),\n        res_id_2_(res_id_2),\n        atom_name_(atom_name),\n        alt_id_(alt_id),\n        column_spec_(column_spec),\n        size_(chain_id.size()) {}\n  StringArrayRef chain_id_;\n  StringArrayRef res_id_1_;\n  StringArrayRef res_id_2_;\n  StringArrayRef atom_name_;\n  std::optional<StringArrayRef> alt_id_;\n  ColumnSpec column_spec_;\n  std::size_t size_;\n};\n\n// Adds the atom index to any rows in the bond table involving that atom.\nabsl::Status FillInBondsForAtom(const BondIndexByAtom& bond_index_by_atom,\n                                const AtomId& atom,\n                                const std::size_t atom_index,\n                                BondAtomIndices& bond_atom_indices) {\n  if (auto bond_index_it = bond_index_by_atom.find(atom);\n      bond_index_it != bond_index_by_atom.end()) {\n    for (std::size_t bond_index : bond_index_it->second) {\n      if (bond_index < 0 || bond_index >= bond_atom_indices.size()) {\n        return absl::OutOfRangeError(\n            absl::StrCat(\"Bond index out of range: \", bond_index));\n      }\n      bond_atom_indices[bond_index] = atom_index;\n    }\n  }\n  return absl::OkStatus();\n}\n\n// Checks that the CifDict has all of the columns in the column spec.\nbool HasAllColumns(const CifDict& mmcif, const ColumnSpec& columns) {\n  return mmcif.Contains(columns.chain_id_col) &&\n         mmcif.Contains(columns.res_id_1_col) &&\n         mmcif.Contains(columns.res_id_2_col) &&\n         mmcif.Contains(columns.atom_name_col) &&\n         (!columns.alt_id_col.has_value() ||\n          mmcif.Contains(*columns.alt_id_col));\n}\n\n// Fully specified ptnr1 atom.\nconstexpr ColumnSpec kStructConnPtnr1ColumnsFull{\n    .chain_id_col = \"_struct_conn.ptnr1_label_asym_id\",\n    .res_id_1_col = \"_struct_conn.ptnr1_auth_seq_id\",\n    .res_id_2_col = \"_struct_conn.pdbx_ptnr1_PDB_ins_code\",\n    .atom_name_col = 
\"_struct_conn.ptnr1_label_atom_id\",\n    .alt_id_col = \"_struct_conn.pdbx_ptnr1_label_alt_id\",\n};\n\n// Fully specified ptnr2 atom.\nconstexpr ColumnSpec kStructConnPtnr2ColumnsFull{\n    .chain_id_col = \"_struct_conn.ptnr2_label_asym_id\",\n    .res_id_1_col = \"_struct_conn.ptnr2_auth_seq_id\",\n    .res_id_2_col = \"_struct_conn.pdbx_ptnr2_PDB_ins_code\",\n    .atom_name_col = \"_struct_conn.ptnr2_label_atom_id\",\n    .alt_id_col = \"_struct_conn.pdbx_ptnr2_label_alt_id\",\n};\n\n// Columns used by OpenMM for ptnr1 atoms.\nconstexpr ColumnSpec kStructConnPtnr1OpenMM{\n    .chain_id_col = \"_struct_conn.ptnr1_label_asym_id\",\n    .res_id_1_col = \"_struct_conn.ptnr1_label_seq_id\",\n    .res_id_2_col = \"_struct_conn.ptnr1_label_comp_id\",\n    .atom_name_col = \"_struct_conn.ptnr1_label_atom_id\",\n    .alt_id_col = std::nullopt,\n};\n\n// Columns used by OpenMM for ptnr2 atoms.\nconstexpr ColumnSpec kStructConnPtnr2OpenMM{\n    .chain_id_col = \"_struct_conn.ptnr2_label_asym_id\",\n    .res_id_1_col = \"_struct_conn.ptnr2_label_seq_id\",\n    .res_id_2_col = \"_struct_conn.ptnr2_label_comp_id\",\n    .atom_name_col = \"_struct_conn.ptnr2_label_atom_id\",\n    .alt_id_col = std::nullopt,\n};\n\n// Fully specified atom sites.\nconstexpr ColumnSpec kAtomSiteColumnsFull{\n    .chain_id_col = \"_atom_site.label_asym_id\",\n    .res_id_1_col = \"_atom_site.auth_seq_id\",\n    .res_id_2_col = \"_atom_site.pdbx_PDB_ins_code\",\n    .atom_name_col = \"_atom_site.label_atom_id\",\n    .alt_id_col = \"_atom_site.label_alt_id\",\n};\n\n// Atom site columns used to match OpenMM _struct_conn tables.\nconstexpr ColumnSpec kAtomSiteColumnsOpenMM{\n    .chain_id_col = \"_atom_site.label_asym_id\",\n    .res_id_1_col = \"_atom_site.label_seq_id\",\n    .res_id_2_col = \"_atom_site.label_comp_id\",\n    .atom_name_col = \"_atom_site.label_atom_id\",\n    .alt_id_col = \"_atom_site.label_alt_id\",\n};\n\n}  // namespace\n\nabsl::StatusOr<std::pair<BondAtomIndices, 
BondAtomIndices>> GetBondAtomIndices(\n    const CifDict& mmcif, absl::string_view model_id) {\n  ColumnSpec ptnr1_columns, ptnr2_columns, atom_site_columns;\n\n  if (HasAllColumns(mmcif, kStructConnPtnr1ColumnsFull) &&\n      HasAllColumns(mmcif, kStructConnPtnr2ColumnsFull)) {\n    ptnr1_columns = kStructConnPtnr1ColumnsFull;\n    ptnr2_columns = kStructConnPtnr2ColumnsFull;\n    atom_site_columns = kAtomSiteColumnsFull;\n  } else {\n    ptnr1_columns = kStructConnPtnr1OpenMM;\n    ptnr2_columns = kStructConnPtnr2OpenMM;\n    atom_site_columns = kAtomSiteColumnsOpenMM;\n  }\n\n  absl::StatusOr<AtomColumns> ptnr1_atoms =\n      AtomColumns::Create(mmcif, ptnr1_columns);\n  if (!ptnr1_atoms.ok()) {\n    return ptnr1_atoms.status();\n  }\n  absl::StatusOr<AtomColumns> ptnr2_atoms =\n      AtomColumns::Create(mmcif, ptnr2_columns);\n  if (!ptnr2_atoms.ok()) {\n    return ptnr2_atoms.status();\n  }\n  StringArrayRef struct_conn_id = mmcif[\"_struct_conn.id\"];\n  if (!AreSameSize(struct_conn_id, *ptnr1_atoms, *ptnr2_atoms)) {\n    return absl::InvalidArgumentError(absl::StrCat(\n        \"Invalid '_struct_conn.' loop. \",                  //\n        \"len(id) = \", struct_conn_id.size(), \", \",         //\n        \"len(ptnr1_atoms) = \", ptnr1_atoms->size(), \", \",  //\n        \"len(ptnr2_atoms) = \", ptnr2_atoms->size(), \".\"    //\n        ));\n  }\n\n  absl::StatusOr<AtomColumns> atoms =\n      AtomColumns::Create(mmcif, atom_site_columns);\n  if (!atoms.ok()) {\n    return atoms.status();\n  }\n  StringArrayRef atom_site_id = mmcif[\"_atom_site.id\"];\n  StringArrayRef atom_site_model_id = mmcif[\"_atom_site.pdbx_PDB_model_num\"];\n  if (!AreSameSize(atom_site_id, atom_site_model_id, *atoms)) {\n    return absl::InvalidArgumentError(absl::StrCat(\n        \"Invalid '_atom_site.' loop. 
\",                                //\n        \"len(id)= \", atom_site_id.size(), \", \",                        //\n        \"len(pdbx_PDB_model_num)= \", atom_site_model_id.size(), \", \",  //\n        \"len(atoms)= \", atoms->size(), \".\"));                          //\n  }\n\n  // Build maps from atom ID tuples to the rows in _struct_conn where that\n  // atom appears (NB could be multiple).\n  const std::size_t struct_conn_size = struct_conn_id.size();\n  BondIndexByAtom ptnr1_rows_by_atom(struct_conn_size);\n  BondIndexByAtom ptnr2_rows_by_atom(struct_conn_size);\n  for (std::size_t i = 0; i < struct_conn_size; ++i) {\n    ptnr1_rows_by_atom[ptnr1_atoms->GetAtom(i)].push_back(i);\n    ptnr2_rows_by_atom[ptnr2_atoms->GetAtom(i)].push_back(i);\n  }\n\n  // Allocate two output arrays with one element per row in struct_conn, where\n  // each element will be the index of that atom in the atom_site table.\n  // Fill the arrays with atom_site_size, which is an invalid value, so that\n  // we can check at the end that each atom has been found.\n  const std::size_t atom_site_size = atom_site_id.size();\n  BondAtomIndices ptnr1_atom_indices(struct_conn_size, atom_site_size);\n  BondAtomIndices ptnr2_atom_indices(struct_conn_size, atom_site_size);\n\n  bool model_id_ecountered = false;\n  absl::flat_hash_set<absl::string_view> seen_alt_ids;\n  for (std::size_t atom_i = 0; atom_i < atom_site_size; ++atom_i) {\n    if (atom_site_model_id[atom_i] != model_id) {\n      if (!model_id_ecountered) {\n        continue;\n      } else {\n        // Models are contiguous so once we see a different model ID after\n        // encountering our model ID then we can exit early.\n        break;\n      }\n    } else {\n      model_id_ecountered = true;\n    }\n    AtomId atom = atoms->GetAtom(atom_i);\n    seen_alt_ids.insert(atom.alt_id);\n\n    if (auto fill_in_bonds_status1 = FillInBondsForAtom(\n            ptnr1_rows_by_atom, atom, atom_i, ptnr1_atom_indices);\n        
!fill_in_bonds_status1.ok()) {\n      return fill_in_bonds_status1;\n    }\n    if (auto fill_in_bonds_status2 = FillInBondsForAtom(\n            ptnr2_rows_by_atom, atom, atom_i, ptnr2_atom_indices);\n        !fill_in_bonds_status2.ok()) {\n      return fill_in_bonds_status2;\n    }\n  }\n  // The seen_alt_ids check is a workaround for a known PDB issue: some mmCIFs\n  // (2evw, 2g0v, 2g0x, 2g0z, 2g10, 2g11, 2g12, 2g14, 2grz, 2ntw as of 2024)\n  // have multiple models and they set different whole-chain altloc in each\n  // model. The bond table however doesn't distinguish between models, so there\n  // are bonds that are valid only for some models. E.g. 2grz has model 1 with\n  // chain A with altloc A, and model 2 with chain A with altloc B. The bonds\n  // table lists a bond for each of these.\n\n  // Check that a ptnr1 atom was found for every bond.\n  if (auto row_it = absl::c_find(ptnr1_atom_indices, atom_site_size);\n      row_it != ptnr1_atom_indices.end()) {\n    if (seen_alt_ids.size() > 1 || seen_alt_ids.contains(\".\") ||\n        seen_alt_ids.contains(\"?\")) {\n      std::size_t i = std::distance(ptnr1_atom_indices.begin(), row_it);\n      return absl::InvalidArgumentError(\n          absl::StrCat(\"Error parsing \\\"\", mmcif.GetDataName(), \"\\\". \",\n                       \"Cannot find atom for bond ID \", struct_conn_id[i], \": \",\n                       ptnr1_atoms->GetAtomString(i)));\n    }\n  }\n\n  // Check that a ptnr2 atom was found for every bond.\n  if (auto row_it = absl::c_find(ptnr2_atom_indices, atom_site_size);\n      row_it != ptnr2_atom_indices.end()) {\n    if (seen_alt_ids.size() > 1 || seen_alt_ids.contains(\".\") ||\n        seen_alt_ids.contains(\"?\")) {\n      std::size_t i = std::distance(ptnr2_atom_indices.begin(), row_it);\n      return absl::InvalidArgumentError(\n          absl::StrCat(\"Error parsing \\\"\", mmcif.GetDataName(), \"\\\". 
\",\n                       \"Cannot find atom for bond ID \", struct_conn_id[i], \": \",\n                       ptnr2_atoms->GetAtomString(i)));\n    }\n  }\n\n  if (!model_id_ecountered) {\n    return absl::InvalidArgumentError(absl::StrCat(\n        \"Error parsing \\\"\", mmcif.GetDataName(), \"\\\". model_id \\\"\", model_id,\n        \"\\\" not found in _atom_site.pdbx_PDB_model_num.\"));\n  }\n\n  return std::make_pair(std::move(ptnr1_atom_indices),\n                        std::move(ptnr2_atom_indices));\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_struct_conn_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <string>\n\n#include \"absl/strings/string_view.h\"\n#include \"alphafold3/parsers/cpp/cif_dict_lib.h\"\n#include \"alphafold3/structure/cpp/mmcif_struct_conn.h\"\n#include \"pybind11/gil.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11/pytypes.h\"\n#include \"pybind11/stl.h\"\n\nnamespace alphafold3 {\n\nnamespace py = pybind11;\n\nconstexpr char kGetBondAtomIndices[] = R\"(\nExtracts the indices of the atoms that participate in bonds.\n\nThis function has a workaround for a known PDB issue: some mmCIFs\n(2evw, 2g0v, 2g0x, 2g0z, 2g10, 2g11, 2g12, 2g14, 2grz, 2ntw as of 2024) have\nmultiple models and they set different whole-chain altloc in each model.\nThe bond table however doesn't distinguish between models, so there are\nbonds that are valid only for some models. E.g. 2grz has model 1 with\nchain A with altloc A, and model 2 with chain A with altloc B. The bonds\ntable lists a bond for each of these. This case is rather rare (10 cases\nin PDB as of 2024). For the offending bonds, the returned atom index is\nset to the size of the atom_site table, i.e. it is an invalid index.\n\nArgs:\n  mmcif_dict: The mmCIF object to process.\n  model_id: The ID of the model that the returned atoms will belong to. This\n    should be a value in the mmCIF's _atom_site.pdbx_PDB_model_num column.\n\nReturns:\n  Two lists of atom indices, `from_atoms` and `to_atoms`, each one having\n  length num_bonds (as defined by _struct_conn, the bonds table). The bond\n  i, defined by the i'th row in _struct_conn, is a bond from atom at index\n  from_atoms[i], to the atom at index to_atoms[i]. The indices are simple\n  0-based indexes into the columns of the _atom_site table in the input\n  mmCIF, and do not necessarily correspond to the values in _atom_site.id,\n  or any other column.\n)\";\n\nvoid RegisterModuleMmcifStructConn(pybind11::module m) {\n  m.def(\n      \"get_bond_atom_indices\",\n      [](const CifDict& mmcif, absl::string_view model_id) {\n        auto result = GetBondAtomIndices(mmcif, model_id);\n        if (result.ok()) {\n          return *result;\n        }\n        throw py::value_error(std::string(result.status().message()));\n      },\n      py::arg(\"mmcif_dict\"), py::arg(\"model_id\"),\n      py::doc(kGetBondAtomIndices + 1),\n      py::call_guard<py::gil_scoped_release>());\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_struct_conn_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_STRUCT_CONN_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_STRUCT_CONN_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMmcifStructConn(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_STRUCT_CONN_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_utils.pyi",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nfrom collections.abc import Sequence\n\nimport numpy as np\n\nfrom alphafold3.cpp import cif_dict\nfrom alphafold3.structure.python import mmcif_layout\n\n\ndef filter(\n    mmcif: cif_dict.CifDict,\n    include_nucleotides: bool,\n    include_ligands: bool = ...,\n    include_water: bool = ...,\n    include_other: bool = ...,\n    model_id: str = ...,\n) -> tuple[np.ndarray[int], set[str], mmcif_layout.MmcifLayout]: ...\n\n\ndef fix_residues(\n    layout: mmcif_layout.MmcifLayout,\n    comp_id: Sequence[str],\n    atom_id: Sequence[str],\n    atom_x: Sequence[float],\n    atom_y: Sequence[float],\n    atom_z: Sequence[float],\n    fix_arg: bool = ...,\n) -> None: ...\n\n\ndef read_layout(\n    mmcif: cif_dict.CifDict, model_id: str = ...\n) -> mmcif_layout.MmcifLayout: ...\n\n\ndef selected_ligand_residue_mask(\n    layout: mmcif_layout.MmcifLayout,\n    atom_site_label_asym_ids: list[str],\n    atom_site_label_seq_ids: list[str],\n    atom_site_auth_seq_ids: list[str],\n    atom_site_label_comp_ids: list[str],\n    atom_site_pdbx_pdb_ins_codes: list[str],\n    nonpoly_asym_ids: list[str],\n    nonpoly_auth_seq_ids: list[str],\n    nonpoly_pdb_ins_codes: list[str],\n    nonpoly_mon_ids: list[str],\n    branch_asym_ids: list[str],\n    branch_auth_seq_ids: list[str],\n    branch_pdb_ins_codes: list[str],\n    branch_mon_ids: list[str],\n) -> tuple[list[bool], list[bool]]: ...\n\n\ndef selected_polymer_residue_mask(\n    
layout: mmcif_layout.MmcifLayout,\n    atom_site_label_asym_ids: list[str],\n    atom_site_label_seq_ids: list[str],\n    atom_site_label_comp_ids: list[str],\n    poly_seq_asym_ids: list[str],\n    poly_seq_seq_ids: list[str],\n    poly_seq_mon_ids: list[str],\n) -> list[bool]: ...\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_utils_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <Python.h>\n\n#include <algorithm>\n#include <cstddef>\n#include <cstdint>\n#include <iterator>\n#include <memory>\n#include <new>\n#include <optional>\n#include <string>\n#include <tuple>\n#include <utility>\n#include <vector>\n\n#include \"numpy/ndarrayobject.h\"\n#include \"numpy/ndarraytypes.h\"\n#include \"numpy/npy_common.h\"\n#include \"absl/container/flat_hash_map.h\"\n#include \"absl/container/flat_hash_set.h\"\n#include \"absl/memory/memory.h\"\n#include \"absl/strings/str_cat.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/types/span.h\"\n#include \"alphafold3/parsers/cpp/cif_dict_lib.h\"\n#include \"alphafold3/structure/cpp/mmcif_altlocs.h\"\n#include \"alphafold3/structure/cpp/mmcif_layout.h\"\n#include \"pybind11/cast.h\"\n#include \"pybind11/gil.h\"\n#include \"pybind11/numpy.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11/pytypes.h\"\n#include \"pybind11/stl.h\"\n#include \"pybind11_abseil/absl_casters.h\"\n\nnamespace alphafold3 {\nnamespace {\nnamespace py = pybind11;\n\nstruct PyObjectDeleter {\n  inline void operator()(PyObject* obj) const { Py_CLEAR(obj); }\n};\n\nusing ScopedPyObject = std::unique_ptr<PyObject, PyObjectDeleter>;\n\nusing StringArrayRef = absl::Span<const std::string>;\nusing Indexer = absl::flat_hash_map<absl::string_view, std::size_t>;\n\n// Returns the reverse look-up map of name to index.\nIndexer MakeIndex(StringArrayRef col) {\n  Indexer 
index;\n  index.reserve(col.size());\n  for (std::size_t i = 0; i < col.size(); ++i) {\n    index[col[i]] = i;\n  }\n  return index;\n}\n\n// Returns whether each container is the same size.\ntemplate <typename C, typename... Cs>\nbool AreSameSize(C c, const Cs&... cs) {\n  return ((c.size() == cs.size()) && ...);\n}\n\n// Stores references to columns in `_atom_site` ensuring they all exist and\n// are the same size.\nstruct AtomSiteLoop {\n  explicit AtomSiteLoop(const CifDict& cif_dict)\n      : id(cif_dict[\"_atom_site.id\"]),\n        model_id(cif_dict[\"_atom_site.pdbx_PDB_model_num\"]),\n        chain_id(cif_dict[\"_atom_site.label_asym_id\"]),\n        seq_id(cif_dict[\"_atom_site.label_seq_id\"]),\n\n        comp_id(cif_dict[\"_atom_site.label_comp_id\"]),\n        atom_id(cif_dict[\"_atom_site.label_atom_id\"]),\n\n        alt_id(cif_dict[\"_atom_site.label_alt_id\"]),\n        occupancy(cif_dict[\"_atom_site.occupancy\"])\n\n  {\n    if (!AreSameSize(id, model_id, chain_id, seq_id, comp_id, atom_id, alt_id,\n                     occupancy)) {\n      throw py::value_error(\n          absl::StrCat(\"Invalid '_atom_site.' loop. 
\",                     //\n                       \"len(id)=\", id.size(), \", \",                        //\n                       \"len(pdbx_PDB_model_num)=\", model_id.size(), \", \",  //\n                       \"len(label_asym_id)=\", chain_id.size(), \", \",       //\n                       \"len(label_seq_id)=\", seq_id.size(), \", \",          //\n                       \"len(label_comp_id)=\", comp_id.size(), \", \",        //\n                       \"len(atom_id)=\", atom_id.size(), \", \",              //\n                       \"len(label_alt_id)=\", alt_id.size(), \", \",          //\n                       \"len(occupancy)=\", occupancy.size()));\n    }\n  }\n  StringArrayRef id;\n  StringArrayRef model_id;\n  StringArrayRef chain_id;\n  StringArrayRef seq_id;\n  StringArrayRef comp_id;\n  StringArrayRef atom_id;\n  StringArrayRef alt_id;\n  StringArrayRef occupancy;\n};\n\n// Stores references to columns in `_entity` ensuring they all exist and are the\n// same size.\nstruct EntityLoop {\n  explicit EntityLoop(const CifDict& cif_dict)\n      : id(cif_dict[\"_entity.id\"]), type(cif_dict[\"_entity.type\"]) {\n    if (!AreSameSize(id, type)) {\n      throw py::value_error(absl::StrCat(\"Invalid '_entity.' loop. \",  //\n                                         \"len(id)=\", id.size(), \", \",  //\n                                         \"len(type)=\", type.size()));\n    }\n  }\n  StringArrayRef id;\n  StringArrayRef type;\n};\n\n// Stores references to columns in `_entity_poly` ensuring they all exist and\n// are the same size.\nstruct EntityPolyLoop {\n  explicit EntityPolyLoop(const CifDict& cif_dict)\n      : entity_id(cif_dict[\"_entity_poly.entity_id\"]),\n        type(cif_dict[\"_entity_poly.type\"]) {\n    if (!AreSameSize(entity_id, type)) {\n      throw py::value_error(absl::StrCat(\"Invalid '_entity_poly.' loop. 
\",  //\n                                         \"len(entity_id)=\", entity_id.size(),\n                                         \", \",  //\n                                         \"len(type)=\", type.size()));\n    }\n  }\n  StringArrayRef entity_id;\n  StringArrayRef type;\n};\n\n// Returns a set of entity names removing ones not included by the flags\n// specified.\nabsl::flat_hash_set<absl::string_view> SelectChains(const CifDict& mmcif,\n                                                    bool include_nucleotides,\n                                                    bool include_ligands,\n                                                    bool include_water,\n                                                    bool include_other) {\n  EntityLoop entity_loop(mmcif);\n  EntityPolyLoop entity_poly(mmcif);\n  absl::flat_hash_set<absl::string_view> permitted_polymers{\"polypeptide(L)\"};\n  absl::flat_hash_set<absl::string_view> forbidden_polymers;\n  for (absl::string_view type :\n       {\"polydeoxyribonucleotide\", \"polyribonucleotide\",\n        \"polydeoxyribonucleotide/polyribonucleotide hybrid\"}) {\n    if (include_nucleotides) {\n      permitted_polymers.emplace(type);\n    } else {\n      forbidden_polymers.emplace(type);\n    }\n  }\n\n  absl::flat_hash_set<absl::string_view> permitted_nonpoly_entity_types;\n  absl::flat_hash_set<absl::string_view> forbidden_nonpoly_entity_types;\n  for (absl::string_view type : {\"non-polymer\", \"branched\"}) {\n    if (include_ligands) {\n      permitted_nonpoly_entity_types.emplace(type);\n    } else {\n      forbidden_nonpoly_entity_types.emplace(type);\n    }\n  }\n  absl::string_view water_type = \"water\";\n  if (include_water) {\n    permitted_nonpoly_entity_types.emplace(water_type);\n  } else {\n    forbidden_nonpoly_entity_types.emplace(water_type);\n  }\n\n  StringArrayRef chain_ids = mmcif[\"_struct_asym.id\"];\n  StringArrayRef entity_ids = mmcif[\"_struct_asym.entity_id\"];\n  Indexer chain_index = 
MakeIndex(chain_ids);\n  Indexer entity_poly_index = MakeIndex(entity_poly.entity_id);\n  Indexer entity_id_to_index = MakeIndex(entity_loop.id);\n\n  absl::flat_hash_set<absl::string_view> keep_chain_id;\n  for (std::size_t i = 0; i < chain_ids.size(); ++i) {\n    absl::string_view chain_id = chain_ids[i];\n    absl::string_view entity_id = entity_ids[i];\n    if (entity_id_to_index.empty() ||\n        entity_loop.type[entity_id_to_index[entity_id]] == \"polymer\") {\n      if (auto it = entity_poly_index.find(entity_id);\n          it != entity_poly_index.end()) {\n        absl::string_view poly_type = entity_poly.type[it->second];\n        if (include_other) {\n          if (!forbidden_polymers.contains(poly_type)) {\n            keep_chain_id.insert(chain_id);\n          }\n        } else {\n          if (permitted_polymers.contains(poly_type)) {\n            keep_chain_id.insert(chain_id);\n          }\n        }\n      }\n    } else {\n      absl::string_view entity_type =\n          entity_loop.type[entity_id_to_index[entity_id]];\n      if (include_other) {\n        if (!forbidden_nonpoly_entity_types.contains(entity_type)) {\n          keep_chain_id.insert(chain_id);\n          continue;\n        }\n      } else {\n        if (permitted_nonpoly_entity_types.contains(entity_type)) {\n          keep_chain_id.insert(chain_id);\n          continue;\n        }\n      }\n    }\n  }\n  return keep_chain_id;\n}\n\nclass ProcessResidue {\n public:\n  explicit ProcessResidue(const char* residue)\n      : residue_(PyUnicode_InternFromString(residue)) {}\n  bool IsResidue(PyObject* residue) {\n    return ArePyObjectsEqual(residue_.get(), residue);\n  }\n\n  static bool ArePyObjectsEqual(PyObject* lhs, PyObject* rhs) {\n    switch (PyObject_RichCompareBool(lhs, rhs, Py_EQ)) {\n      case -1:\n        PyErr_Clear();\n        return false;\n      case 0:\n        return false;\n      default:\n        return true;\n    }\n  }\n\n private:\n  ScopedPyObject 
residue_;\n};\n\nstruct Position3 {\n  float x;\n  float y;\n  float z;\n};\n\nfloat DistanceSquared(Position3 v1, Position3 v2) {\n  float dx = v1.x - v2.x;\n  float dy = v1.y - v2.y;\n  float dz = v1.z - v2.z;\n  return dx * dx + dy * dy + dz * dz;\n}\n\nclass FixArginine : public ProcessResidue {\n public:\n  FixArginine()\n      : ProcessResidue(\"ARG\"),\n        cd_(PyUnicode_InternFromString(\"CD\")),\n        nh1_(PyUnicode_InternFromString(\"NH1\")),\n        nh2_(PyUnicode_InternFromString(\"NH2\")),\n        hh11_(PyUnicode_InternFromString(\"HH11\")),\n        hh21_(PyUnicode_InternFromString(\"HH21\")),\n        hh12_(PyUnicode_InternFromString(\"HH12\")),\n        hh22_(PyUnicode_InternFromString(\"HH22\")) {}\n  void Fix(absl::Span<PyObject*> atom_ids, absl::Span<const float> atom_x,\n           absl::Span<const float> atom_y, absl::Span<const float> atom_z) {\n    std::ptrdiff_t cd_index = -1;\n    std::ptrdiff_t nh1_index = -1;\n    std::ptrdiff_t nh2_index = -1;\n    std::ptrdiff_t hh11_index = -1;\n    std::ptrdiff_t hh21_index = -1;\n    std::ptrdiff_t hh12_index = -1;\n    std::ptrdiff_t hh22_index = -1;\n    for (std::ptrdiff_t index = 0; index < atom_ids.size(); ++index) {\n      PyObject* atom_id = atom_ids[index];\n      if (cd_index == -1 && ArePyObjectsEqual(atom_id, cd_.get())) {\n        cd_index = index;\n      } else if (nh1_index == -1 && ArePyObjectsEqual(atom_id, nh1_.get())) {\n        nh1_index = index;\n      } else if (nh2_index == -1 && ArePyObjectsEqual(atom_id, nh2_.get())) {\n        nh2_index = index;\n      } else if (hh11_index == -1 && ArePyObjectsEqual(atom_id, hh11_.get())) {\n        hh11_index = index;\n      } else if (hh21_index == -1 && ArePyObjectsEqual(atom_id, hh21_.get())) {\n        hh21_index = index;\n      } else if (hh12_index == -1 && ArePyObjectsEqual(atom_id, hh12_.get())) {\n        hh12_index = index;\n      } else if (hh22_index == -1 && ArePyObjectsEqual(atom_id, hh22_.get())) {\n        
hh22_index = index;\n      }\n    }\n    if (cd_index < 0 || nh1_index < 0 || nh2_index < 0) {\n      return;\n    }\n    Position3 cd_pos(atom_x[cd_index], atom_y[cd_index], atom_z[cd_index]);\n    Position3 nh1_pos(atom_x[nh1_index], atom_y[nh1_index], atom_z[nh1_index]);\n    Position3 nh2_pos(atom_x[nh2_index], atom_y[nh2_index], atom_z[nh2_index]);\n    if (DistanceSquared(nh1_pos, cd_pos) <= DistanceSquared(nh2_pos, cd_pos)) {\n      return;\n    }\n    std::swap(atom_ids[nh1_index], atom_ids[nh2_index]);\n    if (hh11_index >= 0 && hh21_index >= 0) {\n      std::swap(atom_ids[hh11_index], atom_ids[hh21_index]);\n    } else if (hh11_index >= 0) {\n      Py_DECREF(atom_ids[hh11_index]);\n      Py_INCREF(hh21_.get());\n      atom_ids[hh11_index] = hh21_.get();\n    } else if (hh21_index >= 0) {\n      Py_DECREF(atom_ids[hh21_index]);\n      Py_INCREF(hh11_.get());\n      atom_ids[hh21_index] = hh11_.get();\n    }\n    if (hh12_index >= 0 && hh22_index >= 0) {\n      std::swap(atom_ids[hh12_index], atom_ids[hh22_index]);\n    } else if (hh12_index >= 0) {\n      Py_DECREF(atom_ids[hh12_index]);\n      Py_INCREF(hh22_.get());\n      atom_ids[hh12_index] = hh22_.get();\n    } else if (hh22_index >= 0) {\n      Py_DECREF(atom_ids[hh22_index]);\n      Py_INCREF(hh21_.get());\n      atom_ids[hh22_index] = hh21_.get();\n    }\n  }\n\n private:\n  ScopedPyObject cd_;\n  ScopedPyObject nh1_;\n  ScopedPyObject nh2_;\n  ScopedPyObject hh11_;\n  ScopedPyObject hh21_;\n  ScopedPyObject hh12_;\n  ScopedPyObject hh22_;\n};\n\n// Returns the layout of the mmCIF `_atom_site` table.\ninline MmcifLayout ReadMmcifLayout(const CifDict& mmcif,\n                                   absl::string_view model_id = \"\") {\n  py::gil_scoped_release release;\n  auto mmcif_layout = MmcifLayout::Create(mmcif, model_id);\n  if (mmcif_layout.ok()) {\n    return *mmcif_layout;\n  }\n\n  throw py::value_error(std::string(mmcif_layout.status().message()));\n}\n\npy::tuple MmcifFilter(         //\n  
  const CifDict& mmcif,      //\n    bool include_nucleotides,  //\n    bool include_ligands,      //\n    bool include_water,        //\n    bool include_other,        //\n    absl::string_view model_id) {\n  if (_import_array() < 0) {\n    throw py::import_error(\"Failed to import NumPy.\");\n  }\n  auto layout = ReadMmcifLayout(mmcif, model_id);\n  std::unique_ptr<std::vector<std::uint64_t>> keep_indices;\n  size_t new_num_atoms;\n  absl::flat_hash_set<absl::string_view> keep_chain_ids;\n\n  {\n    py::gil_scoped_release release;\n\n    AtomSiteLoop atom_site(mmcif);\n\n    keep_chain_ids = SelectChains(mmcif, include_nucleotides, include_ligands,\n                                  include_water, include_other);\n\n    std::vector<std::size_t> chain_indices;\n    chain_indices.reserve(keep_chain_ids.size());\n    for (std::size_t i = 0; i < layout.num_chains(); ++i) {\n      if (keep_chain_ids.contains(\n              atom_site.chain_id[layout.atom_site_from_chain_index(i)])) {\n        chain_indices.push_back(i);\n      }\n    }\n\n    keep_indices =\n        absl::WrapUnique(new std::vector<std::uint64_t>(ResolveMmcifAltLocs(\n            layout, atom_site.comp_id, atom_site.atom_id, atom_site.alt_id,\n            atom_site.occupancy, chain_indices)));\n    new_num_atoms = keep_indices->size();\n\n    if (layout.num_models() > 1) {\n      keep_indices->reserve(layout.num_models() * new_num_atoms);\n      std::uint64_t* start = &(*keep_indices->begin());\n      std::size_t num_atom = keep_indices->size();\n      // Copy first model indices into all model indices offsetting each copy.\n      for (std::size_t i = 1; i < layout.num_models(); ++i) {\n        std::size_t offset = i * layout.num_atoms();\n        std::transform(start, start + num_atom,\n                       std::back_inserter(*keep_indices),\n                       [offset](std::size_t v) { return v + offset; });\n      }\n    }\n  }\n\n  layout.Filter(*keep_indices);\n\n  npy_intp shape[] = 
{static_cast<npy_intp>(layout.num_models()),\n                      static_cast<npy_intp>(new_num_atoms)};\n  PyObject* arr =\n      PyArray_SimpleNewFromData(2, shape, NPY_INT64, keep_indices->data());\n  // Create a capsule to hold the memory of the buffer so NumPy knows how to\n  // delete it when done with it.\n  PyObject* capsule = PyCapsule_New(\n      keep_indices.release(), nullptr, +[](PyObject* capsule_cleanup) {\n        void* memory = PyCapsule_GetPointer(capsule_cleanup, nullptr);\n        delete static_cast<std::vector<std::size_t>*>(memory);\n      });\n  PyArray_SetBaseObject(reinterpret_cast<PyArrayObject*>(arr), capsule);\n\n  return py::make_tuple(py::reinterpret_steal<py::object>(arr), keep_chain_ids,\n                        std::move(layout));\n}\n\nvoid MmcifFixResidues(               //\n    const MmcifLayout& layout,       //\n    absl::Span<PyObject*> comp_id,   //\n    absl::Span<PyObject*> atom_id,   //\n    absl::Span<const float> atom_x,  //\n    absl::Span<const float> atom_y,  //\n    absl::Span<const float> atom_z,  //\n    bool fix_arginine                //\n) {\n  std::optional<FixArginine> arginine;\n  std::size_t num_atoms = layout.num_atoms();\n  if (comp_id.size() != num_atoms || atom_id.size() != num_atoms ||\n      atom_x.size() != num_atoms || atom_y.size() != num_atoms ||\n      atom_z.size() != num_atoms) {\n    throw py::value_error(\n        absl::StrCat(\"Sizes must match. 
\",                   //\n                     \"num_atoms=\", num_atoms, \", \",          //\n                     \"len(comp_id)=\", comp_id.size(), \", \",  //\n                     \"len(atom_id)=\", atom_id.size(), \", \",  //\n                     \"len(atom_x)=\", atom_x.size(), \", \",    //\n                     \"len(atom_y)=\", atom_y.size(), \", \",    //\n                     \"len(atom_z)=\", atom_z.size()));\n  }\n\n  if (fix_arginine) {\n    arginine.emplace();\n  }\n  if (!arginine.has_value()) {\n    return;\n  }\n\n  for (std::size_t res_index = 0; res_index < layout.num_residues();\n       ++res_index) {\n    auto [atom_start, atom_end] = layout.atom_range(res_index);\n    std::size_t atom_count = atom_end - atom_start;\n    PyObject* resname = comp_id[atom_start];\n    if (arginine.has_value() && arginine->IsResidue(resname)) {\n      arginine->Fix(atom_id.subspan(atom_start, atom_count),\n                    atom_x.subspan(atom_start, atom_count),\n                    atom_y.subspan(atom_start, atom_count),\n                    atom_z.subspan(atom_start, atom_count));\n    }\n  }\n}\n\nstd::vector<bool> SelectedPolymerResidueMask(\n    const MmcifLayout& layout,\n    const std::vector<absl::string_view>& atom_site_label_asym_ids,  //\n    const std::vector<absl::string_view>& atom_site_label_seq_ids,   //\n    const std::vector<absl::string_view>& atom_site_label_comp_ids,  //\n    const std::vector<absl::string_view>& poly_seq_asym_ids,         //\n    const std::vector<absl::string_view>& poly_seq_seq_ids,          //\n    const std::vector<absl::string_view>& poly_seq_mon_ids           //\n) {\n  absl::flat_hash_map<std::pair<absl::string_view, absl::string_view>,\n                      absl::string_view>\n      selected;\n  selected.reserve(layout.num_residues());\n  // layout.residues() is O(1) while layout.residue_starts() is O(num_res).\n  const std::vector<std::size_t>& residue_starts = layout.residue_starts();\n  for (int i = 0; i < 
layout.residues().size(); ++i) {\n    std::size_t res_start = residue_starts[i];\n    std::size_t res_end = layout.residues()[i];\n    if (res_start == res_end) {\n      continue;  // Skip empty residues (containing no atoms).\n    }\n\n    absl::string_view label_seq_id = atom_site_label_seq_ids[i];\n    if (label_seq_id == \".\") {\n      continue;  // Skip non-polymers.\n    }\n\n    absl::string_view label_asym_id = atom_site_label_asym_ids[i];\n    absl::string_view label_comp_id = atom_site_label_comp_ids[i];\n    selected[std::make_pair(label_asym_id, label_seq_id)] = label_comp_id;\n  }\n\n  std::vector<bool> mask;\n  mask.reserve(poly_seq_mon_ids.size());\n  for (int i = 0; i < poly_seq_mon_ids.size(); ++i) {\n    absl::string_view poly_seq_asym_id = poly_seq_asym_ids[i];\n    absl::string_view poly_seq_seq_id = poly_seq_seq_ids[i];\n    absl::string_view poly_seq_mon_id = poly_seq_mon_ids[i];\n\n    auto it = selected.find(std::make_pair(poly_seq_asym_id, poly_seq_seq_id));\n    if (it != selected.end()) {\n      mask.push_back(it->second == poly_seq_mon_id);\n    } else {\n      mask.push_back(true);  // Missing residues are not heterogeneous.\n    }\n  }\n  return mask;\n}\n\nstd::pair<std::vector<bool>, std::vector<bool>> SelectedLigandResidueMask(\n    const MmcifLayout& layout,                                           //\n    const std::vector<absl::string_view>& atom_site_label_asym_ids,      //\n    const std::vector<absl::string_view>& atom_site_label_seq_ids,       //\n    const std::vector<absl::string_view>& atom_site_auth_seq_ids,        //\n    const std::vector<absl::string_view>& atom_site_label_comp_ids,      //\n    const std::vector<absl::string_view>& atom_site_pdbx_pdb_ins_codes,  //\n    const std::vector<absl::string_view>& nonpoly_asym_ids,              //\n    const std::vector<absl::string_view>& nonpoly_auth_seq_ids,          //\n    const std::vector<absl::string_view>& nonpoly_pdb_ins_codes,         //\n    const 
std::vector<absl::string_view>& nonpoly_mon_ids,               //\n    const std::vector<absl::string_view>& branch_asym_ids,               //\n    const std::vector<absl::string_view>& branch_auth_seq_ids,           //\n    const std::vector<absl::string_view>& branch_pdb_ins_codes,          //\n    const std::vector<absl::string_view>& branch_mon_ids) {\n  absl::flat_hash_map<\n      std::tuple<absl::string_view, absl::string_view, absl::string_view>,\n      absl::string_view>\n      selected;\n  selected.reserve(layout.num_residues());\n  // layout.residues() is O(1) while layout.residue_starts() is O(num_res).\n  const std::vector<std::size_t>& residue_starts = layout.residue_starts();\n  for (int i = 0; i < layout.residues().size(); ++i) {\n    std::size_t res_start = residue_starts[i];\n    std::size_t res_end = layout.residues()[i];\n    if (res_start == res_end) {\n      continue;  // Skip empty residues (containing no atoms).\n    }\n\n    absl::string_view label_seq_id = atom_site_label_seq_ids[i];\n    if (label_seq_id != \".\") {\n      continue;  // Skip polymers.\n    }\n\n    absl::string_view label_asym_id = atom_site_label_asym_ids[i];\n    absl::string_view auth_seq_id = atom_site_auth_seq_ids[i];\n    absl::string_view ins_code = atom_site_pdbx_pdb_ins_codes[i];\n    ins_code = ins_code == \"?\" ? \".\" : ins_code;  // Remap unknown to unset.\n    absl::string_view label_comp_id = atom_site_label_comp_ids[i];\n    selected[std::make_tuple(label_asym_id, auth_seq_id, ins_code)] =\n        label_comp_id;\n  }\n\n  std::vector<bool> nonpoly_mask;\n  nonpoly_mask.reserve(nonpoly_asym_ids.size());\n  for (int i = 0; i < nonpoly_asym_ids.size(); ++i) {\n    absl::string_view nonpoly_asym_id = nonpoly_asym_ids[i];\n    absl::string_view nonpoly_auth_seq_id = nonpoly_auth_seq_ids[i];\n    absl::string_view nonpoly_ins_code = nonpoly_pdb_ins_codes[i];\n    // Remap unknown to unset.\n    nonpoly_ins_code = nonpoly_ins_code == \"?\" ? 
\".\" : nonpoly_ins_code;\n    absl::string_view nonpoly_mon_id = nonpoly_mon_ids[i];\n\n    auto it = selected.find(std::make_tuple(\n        nonpoly_asym_id, nonpoly_auth_seq_id, nonpoly_ins_code));\n    if (it != selected.end()) {\n      nonpoly_mask.push_back(it->second == nonpoly_mon_id);\n    } else {\n      nonpoly_mask.push_back(true);  // Missing residues are not heterogeneous.\n    }\n  }\n\n  std::vector<bool> branch_mask;\n  branch_mask.reserve(branch_asym_ids.size());\n  for (int i = 0; i < branch_asym_ids.size(); ++i) {\n    absl::string_view branch_asym_id = branch_asym_ids[i];\n    absl::string_view branch_auth_seq_id = branch_auth_seq_ids[i];\n\n    // Insertion codes in _pdbx_branch_scheme are not required and can be\n    // missing. Default to unset ('.') in such case.\n    absl::string_view branch_ins_code;\n    if (i < branch_pdb_ins_codes.size()) {\n      branch_ins_code = branch_pdb_ins_codes[i];\n      // Remap unknown to unset.\n      branch_ins_code = branch_ins_code == \"?\" ? 
\".\" : branch_ins_code;\n    } else {\n      branch_ins_code = \".\";\n    }\n\n    absl::string_view branch_mon_id = branch_mon_ids[i];\n\n    auto it = selected.find(\n        std::make_tuple(branch_asym_id, branch_auth_seq_id, branch_ins_code));\n    if (it != selected.end()) {\n      branch_mask.push_back(it->second == branch_mon_id);\n    } else {\n      branch_mask.push_back(true);  // Missing residues are not heterogeneous.\n    }\n  }\n\n  return std::make_pair(nonpoly_mask, branch_mask);\n}\n\nconstexpr char kReadMmcifLayout[] = R\"(\nReturns the layout of the cif_dict.\n\nArgs:\n  mmcif: mmCIF to calculate the layout for.\n  model_id: If non-empty the layout of the given model is returned\n    otherwise the layout of all models are returned.\nRaises:\n  ValueError: if the mmCIF is malformed or the number of atoms in each\n    model are inconsistent.\n)\";\n\nconstexpr char kMmcifFilter[] = R\"(\nReturns NumpyArray of selected rows in `_atom_site` and new layout.\n\nArgs:\n  mmcif: mmCIF to filter.\n  include_nucleotides: Whether to include polymer entities of type:\n    \"polypeptide(L)\\\", \"polydeoxyribonucleotide\", \"polyribonucleotide\".\n    Otherwise only \"polypeptide(L)\\\". 
(\"polypeptide(D)\\\" is never included.)\n  include_ligands: Whether to include non-polymer entities of type:\n    \"non-polymer\", \"branched\".\n  include_water: Whether to include entities of type water.\n  include_other: Whether to include other (non-standard) entity types\n    that are not covered by any of the above parameters.\n  model_id: If non-empty the model with given name is selected otherwise\n    all models are selected.\n\nReturns:\n  A tuple containing a numpy array with a shape (num_models, num_atoms)\n  with the atom_site indices selected, the IDs of the chains that were kept\n  and the new layout.\n\nRaises:\n  ValueError: if mmCIF dict does not have all required fields.\n)\";\n\nconstexpr char kMmcifFixResidues[] = R\"(\nFixes residue columns in-place.\n\nArgs:\n  layout: layout from filter command.\n  comp_id: '_atom_site.label_comp_id' of first model.\n  atom_id: '_atom_site.label_atom_id' of first model.\n  atom_x: '_atom_site.Cartn_x' of first model.\n  atom_y: '_atom_site.Cartn_y' of first model.\n  atom_z: '_atom_site.Cartn_z' of first model.\n  fix_arg: Whether to ensure the atoms in ARG are in the correct order.\n\nRaises:\n  ValueError: If shapes are invalid.\n)\";\n\nconstexpr char kSelectedPolymerResidueMask[] = R\"(\nReturns a _pdbx_poly_seq_scheme mask for selected hetero residues.\n\nShould be called after filtering the layout using mmcif_utils.filter.\n\nArgs:\n  layout: Layout defining the _atom_site residue selection.\n  atom_site_label_asym_ids: Internal (label) chain ID, per selected residue.\n  atom_site_label_seq_ids: Internal (label) residue ID, per selected residue.\n  atom_site_label_comp_ids: Residue name, per selected residue.\n  poly_seq_asym_ids: Internal (label) chain ID, 
per residue.\n  poly_seq_seq_ids: Internal (label) residue ID, per residue.\n  poly_seq_mon_ids: Residue name, per residue.\n\nReturns:\n  A mask for the _pdbx_poly_seq_scheme table. If residues are selected\n  using this mask, they will have consistent heterogeneous residue\n  selection with the _atom_site table.\n)\";\n\nconstexpr char kSelectedLigandResidueMask[] = R\"(\nReturns masks for selected ligand hetero residues.\n\nShould be called after filtering the layout using mmcif_utils.filter.\n\nArgs:\n  layout: Layout defining the _atom_site residue selection.\n  atom_site_label_asym_ids: Internal (label) chain ID, per selected residue.\n  atom_site_label_seq_ids: Internal (label) residue ID, per selected residue.\n  atom_site_auth_seq_ids: External (author) residue ID, per selected residue.\n  atom_site_label_comp_ids: Residue name, per selected residue.\n  atom_site_pdbx_pdb_ins_codes: Insertion code, per selected residue.\n  nonpoly_asym_ids: Internal (label) chain ID, per residue from\n   _pdbx_nonpoly_scheme.\n  nonpoly_auth_seq_ids: External (author) residue ID, per residue from\n   _pdbx_nonpoly_scheme.\n  nonpoly_pdb_ins_codes: Insertion code, per residue from\n   _pdbx_nonpoly_scheme.\n  nonpoly_mon_ids: Residue name, per residue from _pdbx_nonpoly_scheme.\n  branch_asym_ids: Internal (label) chain ID, per residue from\n   _pdbx_branch_scheme.\n  branch_auth_seq_ids: External (author) residue ID, per residue from\n   _pdbx_branch_scheme.\n  branch_pdb_ins_codes: Insertion code, per residue from _pdbx_branch_scheme.\n  branch_mon_ids: Residue name, per residue from _pdbx_branch_scheme.\n\nReturns:\n  A tuple with masks for _pdbx_nonpoly_scheme and _pdbx_branch_scheme. 
If\n  residues are selected using these masks, they will have consistent\n  heterogeneous residue selection with the _atom_site table.\n)\";\n\n}  // namespace\n\nvoid RegisterModuleMmcifUtils(pybind11::module m) {\n  m.def(\"read_layout\", ReadMmcifLayout,\n        py::arg(\"mmcif\"),              //\n        py::arg(\"model_id\") = \"\",      //\n        py::doc(kReadMmcifLayout + 1)  //\n  );\n\n  m.def(\"filter\", MmcifFilter,               //\n        py::arg(\"mmcif\"),                    //\n        py::arg(\"include_nucleotides\"),      //\n        py::arg(\"include_ligands\") = false,  //\n        py::arg(\"include_water\") = false,    //\n        py::arg(\"include_other\") = false,    //\n        py::arg(\"model_id\") = \"\",            //\n        py::doc(kMmcifFilter + 1)            //\n  );\n\n  m.def(\"fix_residues\", MmcifFixResidues,\n        py::arg(\"layout\"),              //\n        py::arg(\"comp_id\"),             //\n        py::arg(\"atom_id\"),             //\n        py::arg(\"atom_x\"),              //\n        py::arg(\"atom_y\"),              //\n        py::arg(\"atom_z\"),              //\n        py::arg(\"fix_arg\") = false,     //\n        py::doc(kMmcifFixResidues + 1)  //\n  );\n\n  m.def(\"selected_polymer_residue_mask\", SelectedPolymerResidueMask,\n        py::arg(\"layout\"),                         //\n        py::arg(\"atom_site_label_asym_ids\"),       //\n        py::arg(\"atom_site_label_seq_ids\"),        //\n        py::arg(\"atom_site_label_comp_ids\"),       //\n        py::arg(\"poly_seq_asym_ids\"),              //\n        py::arg(\"poly_seq_seq_ids\"),               //\n        py::arg(\"poly_seq_mon_ids\"),               //\n        py::call_guard<py::gil_scoped_release>(),  //\n        py::doc(kSelectedPolymerResidueMask + 1)   //\n  );\n\n  m.def(\"selected_ligand_residue_mask\", SelectedLigandResidueMask,\n        py::arg(\"layout\"),                         //\n        py::arg(\"atom_site_label_asym_ids\"), 
      //\n        py::arg(\"atom_site_label_seq_ids\"),        //\n        py::arg(\"atom_site_auth_seq_ids\"),         //\n        py::arg(\"atom_site_label_comp_ids\"),       //\n        py::arg(\"atom_site_pdbx_pdb_ins_codes\"),   //\n        py::arg(\"nonpoly_asym_ids\"),               //\n        py::arg(\"nonpoly_auth_seq_ids\"),           //\n        py::arg(\"nonpoly_pdb_ins_codes\"),          //\n        py::arg(\"nonpoly_mon_ids\"),                //\n        py::arg(\"branch_asym_ids\"),                //\n        py::arg(\"branch_auth_seq_ids\"),            //\n        py::arg(\"branch_pdb_ins_codes\"),           //\n        py::arg(\"branch_mon_ids\"),                 //\n        py::call_guard<py::gil_scoped_release>(),  //\n        py::doc(kSelectedLigandResidueMask + 1)    //\n  );\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/mmcif_utils_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_UTILS_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_UTILS_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleMmcifUtils(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_MMCIF_UTILS_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/string_array.pyi",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\nfrom collections.abc import Sequence\nfrom typing import Any, overload\n\nimport numpy as np\n\n\ndef format_float_array(\n    values: Sequence[float], num_decimal_places: int\n) -> list[str]: ...\n\n\ndef isin(\n    array: np.ndarray[object],\n    test_elements: set[str | bytes],\n    *,\n    invert: bool = ...,\n) -> np.ndarray[bool]: ...\n\n\n@overload\ndef remap(\n    array: np.ndarray[object],\n    mapping: dict[str, str],\n    default_value: str,\n    inplace: bool = ...,\n) -> np.ndarray[object]: ...\n\n\n@overload\ndef remap(\n    array: np.ndarray[object],\n    mapping: dict[str, str],\n    inplace: bool = ...,\n) -> np.ndarray[object]: ...\n\n\ndef remap_multiple(\n    arrays: Sequence[np.ndarray[object]],\n    mapping: dict[tuple[Any], int],\n) -> np.ndarray[int]: ...\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/string_array_pybind.cc",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#include <Python.h>\n\n#include <algorithm>\n#include <cstddef>\n#include <cstdint>\n#include <cstring>\n#include <iterator>\n#include <limits>\n#include <string>\n#include <vector>\n\n#include \"numpy/arrayobject.h\"\n#include \"numpy/ndarrayobject.h\"\n#include \"numpy/ndarraytypes.h\"\n#include \"numpy/npy_common.h\"\n#include \"absl/algorithm/container.h\"\n#include \"absl/container/flat_hash_set.h\"\n#include \"absl/strings/str_format.h\"\n#include \"absl/strings/string_view.h\"\n#include \"absl/types/span.h\"\n#include \"pybind11/cast.h\"\n#include \"pybind11/numpy.h\"\n#include \"pybind11/pybind11.h\"\n#include \"pybind11/pytypes.h\"\n#include \"pybind11_abseil/absl_casters.h\"\n\nnamespace {\n\nnamespace py = pybind11;\n\nPyObject* RemapNumpyArrayObjects(PyObject* array, PyObject* mapping,\n                                 bool inplace, PyObject* default_value) {\n  import_array();\n  if (!PyArray_Check(array)) {\n    PyErr_SetString(PyExc_TypeError, \"'array' must be a np.ndarray.\");\n    return nullptr;\n  }\n  if (!PyDict_Check(mapping)) {\n    PyErr_SetString(PyExc_TypeError, \"'mapping' must be a Python dict.\");\n    return nullptr;\n  }\n\n  PyArrayObject* array_obj = reinterpret_cast<PyArrayObject*>(array);\n  if (PyArray_TYPE(array_obj) != NPY_OBJECT) {\n    PyErr_SetString(PyExc_TypeError, \"`array` must be an array of objects.\");\n    return nullptr;\n  }\n\n  if (inplace) {\n    // We are 
returning original array so we need to increase the ref count.\n    Py_INCREF(array);\n  } else {\n    // We are returning a fresh copy.\n    array = PyArray_NewCopy(array_obj, NPY_CORDER);\n    if (array == nullptr) {\n      PyErr_SetString(PyExc_MemoryError, \"Out of memory!\");\n      return nullptr;\n    }\n    array_obj = reinterpret_cast<PyArrayObject*>(array);\n  }\n\n  if (PyArray_SIZE(array_obj) == 0) {\n    return array;\n  }\n\n  if (default_value == nullptr && PyDict_Size(mapping) == 0) {\n    return array;\n  }\n\n  NpyIter* iter = NpyIter_New(\n      array_obj, NPY_ITER_READWRITE | NPY_ITER_EXTERNAL_LOOP | NPY_ITER_REFS_OK,\n      NPY_KEEPORDER, NPY_NO_CASTING, nullptr);\n  if (iter == nullptr) {\n    PyErr_SetString(PyExc_MemoryError, \"Out of memory!\");\n    Py_XDECREF(array);\n    return nullptr;\n  }\n\n  NpyIter_IterNextFunc* iter_next = NpyIter_GetIterNext(iter, nullptr);\n  if (iter_next == nullptr) {\n    NpyIter_Deallocate(iter);\n    Py_XDECREF(array);\n    PyErr_SetString(PyExc_MemoryError, \"Out of memory!\");\n    return nullptr;\n  }\n\n  // Iterating arrays taken from:\n  // https://numpy.org/doc/stable/reference/c-api/iterator.html\n  char** data_pointer = NpyIter_GetDataPtrArray(iter);\n  npy_intp* stride_pointer = NpyIter_GetInnerStrideArray(iter);\n  npy_intp* inner_size_pointer = NpyIter_GetInnerLoopSizePtr(iter);\n  do {\n    char* data = *data_pointer;\n    npy_intp stride = *stride_pointer;\n    npy_intp count = *inner_size_pointer;\n    for (size_t i = 0; i < count; ++i) {\n      PyObject* entry;\n      std::memcpy(&entry, data, sizeof(PyObject*));\n      PyObject* result = PyDict_GetItem(mapping, entry);\n      if (result != nullptr) {\n        // Replace entry.\n        Py_INCREF(result);\n        Py_XDECREF(entry);\n        std::memcpy(data, &result, sizeof(PyObject*));\n      } else if (default_value != nullptr) {\n        // Replace entry with a default value.\n        Py_INCREF(default_value);\n        
Py_XDECREF(entry);\n        std::memcpy(data, &default_value, sizeof(PyObject*));\n      }\n      data += stride;\n    }\n  } while (iter_next(iter));\n\n  NpyIter_Deallocate(iter);\n  return array;\n}\n\n// Convert 1D Numpy float array to a list of strings where each string has fixed\n// number of decimal points. This is faster than Python list comprehension.\nstd::vector<std::string> FormatFloatArray(absl::Span<const float> values,\n                                          int num_decimal_places) {\n  std::vector<std::string> output;\n  output.reserve(values.size());\n\n  absl::c_transform(values, std::back_inserter(output),\n                    [num_decimal_places](float value) {\n                      return absl::StrFormat(\"%.*f\", num_decimal_places, value);\n                    });\n  return output;\n}\n\npy::array_t<bool> IsIn(\n    const py::array_t<PyObject*, py::array::c_style>& array,\n    const absl::flat_hash_set<absl::string_view>& test_elements, bool invert) {\n  const size_t num_elements = array.size();\n  py::array_t<bool> output(num_elements);\n  std::fill(output.mutable_data(), output.mutable_data() + output.size(),\n            invert);\n\n  // Shortcut: The output will be trivially always false if test_elements empty.\n  if (test_elements.empty()) {\n    return output;\n  }\n\n  for (size_t i = 0; i < num_elements; ++i) {\n    // Compare the string values instead of comparing just object pointers.\n    py::handle handle = array.data()[i];\n    if (!PyUnicode_Check(handle.ptr()) && !PyBytes_Check(handle.ptr())) {\n      continue;\n    }\n    if (test_elements.contains(py::cast<absl::string_view>(handle))) {\n      output.mutable_data()[i] = !invert;\n    }\n  }\n  if (array.ndim() > 1) {\n    auto shape =\n        std::vector<ptrdiff_t>(array.shape(), array.shape() + array.ndim());\n    return output.reshape(shape);\n  }\n  return output;\n}\n\npy::array RemapMultipleArrays(\n    const std::vector<py::array_t<PyObject*, py::array::c_style>>& 
arrays,\n    const py::dict& mapping) {\n  size_t array_size = arrays[0].size();\n  for (const auto& array : arrays) {\n    if (array.size() != array_size) {\n      throw py::value_error(\"All arrays must have the same length.\");\n    }\n  }\n\n  // Create a result buffer.\n  auto result = py::array_t<int64_t>(array_size);\n  absl::Span<int64_t> result_buffer(result.mutable_data(), array_size);\n  PyObject* entry = PyTuple_New(arrays.size());\n  if (entry == nullptr) {\n    throw py::error_already_set();\n  }\n  std::vector<absl::Span<PyObject* const>> array_spans;\n  array_spans.reserve(arrays.size());\n  for (const auto& array : arrays) {\n    array_spans.emplace_back(array.data(), array.size());\n  }\n\n  // Iterate over arrays and look up elements in the `py_dict`.\n  bool fail = false;\n  for (size_t i = 0; i < array_size; ++i) {\n    for (size_t j = 0; j < array_spans.size(); ++j) {\n      PyTuple_SET_ITEM(entry, j, array_spans[j][i]);\n    }\n    PyObject* result = PyDict_GetItem(mapping.ptr(), entry);\n    if (result != nullptr) {\n      int64_t result_value = PyLong_AsLongLong(result);\n      if (result_value == -1 && PyErr_Occurred()) {\n        fail = true;\n        break;\n      }\n      if (result_value > std::numeric_limits<int64_t>::max() ||\n          result_value < std::numeric_limits<int64_t>::lowest()) {\n        PyErr_SetString(PyExc_OverflowError, \"Result value too large.\");\n        fail = true;\n        break;\n      }\n      result_buffer[i] = result_value;\n    } else {\n      PyErr_Format(PyExc_KeyError, \"%R\", entry);\n      fail = true;\n      break;\n    }\n  }\n\n  for (size_t j = 0; j < array_spans.size(); ++j) {\n    PyTuple_SET_ITEM(entry, j, nullptr);\n  }\n  Py_XDECREF(entry);\n  if (fail) {\n    throw py::error_already_set();\n  }\n  return result;\n}\n\nconstexpr char kRemapNumpyArrayObjects[] = R\"(\nReplace objects in NumPy array of objects using mapping.\n\nArgs:\n  array: NumPy array with dtype=object.\n  mapping: Dict 
mapping old values to new values.\n  inplace: Bool (default False) whether to replace values inplace or to\n    create a new array.\n  default_value: If given, what value to map to if the mapping is missing\n    for that particular item. If not given, such items are left unchanged.\n\nReturns:\n  NumPy array of dtype object with values replaced according to mapping.\n  If inplace is True the original array is modified inplace otherwise a\n  new array is returned.\n)\";\n\nconstexpr char kFormatFloatArrayDoc[] = R\"(\nConverts float -> string array with given number of decimal places.\n)\";\n\nconstexpr char kIsInDoc[] = R\"(\nComputes whether each element is in test_elements.\n\nSame use as np.isin, but much faster. If len(array) = n, len(test_elements) = m:\n* This function has complexity O(n).\n* np.isin with arrays of objects has complexity O(m*log(m) + n * log(m)).\n\nArgs:\n  array: Input NumPy array with dtype=object.\n  test_elements: The values against which to test each value of array.\n  invert: If True, the values in the returned array are inverted, as if\n    calculating `element not in test_elements`. Default is False.\n    `isin(a, b, invert=True)` is equivalent to but faster than `~isin(a, b)`.\n\nReturns:\n  A boolean array of the same shape as the input array. Each value `val` is:\n  * `val in test_elements` if `invert=False`,\n  * `val not in test_elements` if `invert=True`.\n)\";\n\nconstexpr char kRemapMultipleDoc[] = R\"(\nMaps keys from multiple aligned arrays to a single array.\n\nArgs:\n  arrays: NumPy arrays of the same length. 
The tuple of aligned entries is used\n    as key for the mapping.\n  mapping: Dict mapping from tuples to integer values.\n\nReturns\n  NumPy array of dtype `int` with values looked up in mapping according to the\n  tuple of aligned array entries as keys.\n)\";\n\n}  // namespace\n\nnamespace alphafold3 {\n\nvoid RegisterModuleStringArray(pybind11::module m) {\n  m.def(\n      \"remap\",\n      [](py::object array, py::object mapping, bool inplace,\n         py::object default_value) -> py::object {\n        PyObject* result = RemapNumpyArrayObjects(array.ptr(), mapping.ptr(),\n                                                  inplace, default_value.ptr());\n        if (result == nullptr) {\n          throw py::error_already_set();\n        }\n        return py::reinterpret_steal<py::object>(result);\n      },\n      py::return_value_policy::take_ownership, py::arg(\"array\"),\n      py::arg(\"mapping\"), py::arg(\"inplace\") = false, py::arg(\"default_value\"),\n      py::doc(kRemapNumpyArrayObjects + 1));\n  m.def(\n      \"remap\",\n      [](py::object array, py::object mapping, bool inplace) -> py::object {\n        PyObject* result = RemapNumpyArrayObjects(array.ptr(), mapping.ptr(),\n                                                  inplace, nullptr);\n        if (result == nullptr) {\n          throw py::error_already_set();\n        }\n        return py::reinterpret_steal<py::object>(result);\n      },\n      py::return_value_policy::take_ownership, py::arg(\"array\"),\n      py::arg(\"mapping\"), py::arg(\"inplace\") = false,\n      py::doc(kRemapNumpyArrayObjects + 1));\n  m.def(\"format_float_array\", &FormatFloatArray, py::arg(\"values\"),\n        py::arg(\"num_decimal_places\"), py::doc(kFormatFloatArrayDoc + 1),\n        py::call_guard<py::gil_scoped_release>());\n  m.def(\"isin\", &IsIn, py::arg(\"array\"), py::arg(\"test_elements\"),\n        py::kw_only(), py::arg(\"invert\") = false, py::doc(kIsInDoc + 1));\n  m.def(\"remap_multiple\", 
&RemapMultipleArrays, py::arg(\"arrays\"),\n        py::arg(\"mapping\"), py::doc(kRemapMultipleDoc + 1));\n}\n\n}  // namespace alphafold3\n"
  },
  {
    "path": "src/alphafold3/structure/cpp/string_array_pybind.h",
    "content": "// Copyright 2024 DeepMind Technologies Limited\n//\n// AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n// this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n//\n// To request access to the AlphaFold 3 model parameters, follow the process set\n// out at https://github.com/google-deepmind/alphafold3. You may only use these\n// if received directly from Google. Use is subject to terms of use available at\n// https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n#ifndef ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_STRING_ARRAY_PYBIND_H_\n#define ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_STRING_ARRAY_PYBIND_H_\n\n#include \"pybind11/pybind11.h\"\n\nnamespace alphafold3 {\n\nvoid RegisterModuleStringArray(pybind11::module m);\n\n}\n\n#endif  // ALPHAFOLD3_SRC_ALPHAFOLD3_STRUCTURE_PYTHON_STRING_ARRAY_PYBIND_H_\n"
  },
  {
    "path": "src/alphafold3/structure/mmcif.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Low level mmCIF parsing operations and wrappers for nicer C++/Py errors.\n\nNote that the cif_dict.CifDict class has many useful methods to help with data\nextraction which are not shown in this file. You can find them in cif_dict.clif\ntogether with docstrings. The cif_dict.CifDict class behaves like an immutable\nPython dictionary (some methods are not implemented though).\n\"\"\"\nfrom collections.abc import Callable, Mapping, Sequence\nimport functools\nimport itertools\nimport re\nfrom typing import ParamSpec, TypeAlias, TypeVar\n\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.cpp import cif_dict\nfrom alphafold3.cpp import mmcif_atom_site\nfrom alphafold3.cpp import mmcif_struct_conn\nfrom alphafold3.cpp import string_array\nimport numpy as np\n\nMmcif = cif_dict.CifDict\n\n\n_P = ParamSpec('_P')\n_T = TypeVar('_T')\n_WappedFn: TypeAlias = Callable[_P, _T]\n\n\n@functools.lru_cache(maxsize=256)\ndef int_id_to_str_id(num: int) -> str:\n  \"\"\"Encodes a number as a string, using reverse spreadsheet style naming.\n\n  Args:\n    num: A positive integer.\n\n  Returns:\n    A string that encodes the positive integer using reverse spreadsheet style,\n    naming e.g. 1 = A, 2 = B, ..., 27 = AA, 28 = BA, 29 = CA, ... 
This is the\n    usual way to encode chain IDs in mmCIF files.\n  \"\"\"\n  if num <= 0:\n    raise ValueError(f'Only positive integers allowed, got {num}.')\n\n  num = num - 1  # 1-based indexing.\n  output = []\n  while num >= 0:\n    output.append(chr(num % 26 + ord('A')))\n    num = num // 26 - 1\n  return ''.join(output)\n\n\n@functools.lru_cache(maxsize=256)\ndef str_id_to_int_id(str_id: str) -> int:\n  \"\"\"Encodes an mmCIF-style string chain ID as an integer.\n\n  The integer IDs are one based so this function is the inverse of\n  int_id_to_str_id.\n\n  Args:\n    str_id: A string chain ID consisting only of upper case letters A-Z.\n\n  Returns:\n    An integer that can be used to order mmCIF chain IDs in the standard\n    (reverse spreadsheet style) ordering.\n  \"\"\"\n  if not re.match('^[A-Z]+$', str_id):\n    raise ValueError(f'String ID must be upper case letters, got {str_id}.')\n\n  offset = ord('A') - 1\n  output = 0\n  for i, c in enumerate(str_id):\n    output += (ord(c) - offset) * int(26**i)\n  return output\n\n\ndef from_string(mmcif_string: str | bytes) -> Mmcif:\n  return cif_dict.from_string(mmcif_string)\n\n\ndef parse_multi_data_cif(cif_string: str) -> dict[str, Mmcif]:\n  \"\"\"Parses a CIF string with multiple data records.\n\n  For instance, the CIF string:\n\n  ```\n  data_001\n  _foo bar\n  #\n  data_002\n  _foo baz\n  ```\n\n  is parsed as:\n\n  ```\n  {'001': Mmcif({'_foo': ['bar']}), '002': Mmcif({'_foo': ['baz']})}\n  ```\n\n  Args:\n    cif_string: The multi-data CIF string to be parsed.\n\n  Returns:\n    A dictionary mapping record names to Mmcif objects with data.\n  \"\"\"\n  return cif_dict.parse_multi_data_cif(cif_string)\n\n\nclass BondParsingError(Exception):\n  \"\"\"Exception raised by errors when getting bond atom indices.\"\"\"\n\n\ndef get_bond_atom_indices(\n    mmcif: Mmcif,\n    model_id: str = '1',\n) -> tuple[Sequence[int], Sequence[int]]:\n  \"\"\"Extracts the indices of the atoms that participate in 
bonds.\n\n  Args:\n    mmcif: The mmCIF object to process.\n    model_id: The ID of the model that the returned atoms will belong to. This\n      should be a value in the mmCIF's _atom_site.pdbx_PDB_model_num column.\n\n  Returns:\n    Two lists of atom indices, `from_atoms` and `to_atoms`, each one having\n    length num_bonds (as defined by _struct_conn, the bonds table). The bond\n    i, defined by the i'th row in _struct_conn, is a bond from atom at index\n    from_atoms[i], to the atom at index to_atoms[i]. The indices are simple\n    0-based indexes into the columns of the _atom_site table in the input\n    mmCIF, and do not necessarily correspond to the values in _atom_site.id,\n    or any other column.\n\n  Raises:\n    BondParsingError: If any of the required tables or columns are not present\n    in\n      the mmCIF, or if the _struct_conn table refers to atoms that cannot\n      be found in the _atom_site table.\n  \"\"\"\n  try:\n    return mmcif_struct_conn.get_bond_atom_indices(mmcif, model_id)\n  except ValueError as e:\n    raise BondParsingError(str(e)) from e\n\n\ndef get_or_infer_type_symbol(\n    mmcif: Mmcif, ccd: chemical_components.Ccd | None = None\n) -> Sequence[str]:\n  \"\"\"Returns the type symbol (element) for all of the atoms.\n\n  Args:\n    mmcif: A parsed mmCIF file in the Mmcif format.\n    ccd: The chemical component dictionary. If not provided, defaults to the\n      cached CCD.\n\n  If present, returns the _atom_site.type_symbol. 
If not, infers it using\n  _atom_site.label_comp_id (residue name), _atom_site.label_atom_id (atom name)\n  and the CCD.\n  \"\"\"\n  ccd = ccd or chemical_components.Ccd()\n  type_symbol_fn = lambda res_name, atom_name: chemical_components.type_symbol(\n      ccd, res_name, atom_name\n  )\n  return mmcif_atom_site.get_or_infer_type_symbol(mmcif, type_symbol_fn)\n\n\ndef get_chain_type_by_entity_id(mmcif: Mmcif) -> Mapping[str, str]:\n  \"\"\"Returns mapping from entity ID to its type or polymer type if available.\n\n  If the entity is in the _entity_poly table, returns its polymer chain type.\n  If not, returns the type as specified in the _entity table.\n\n  Args:\n    mmcif: CifDict holding the mmCIF.\n  \"\"\"\n  poly_entity_id = mmcif.get('_entity_poly.entity_id', [])\n  poly_type = mmcif.get('_entity_poly.type', [])\n  poly_type_by_entity_id = dict(zip(poly_entity_id, poly_type, strict=True))\n\n  chain_type_by_entity_id = {}\n  for entity_id, entity_type in zip(\n      mmcif.get('_entity.id', []), mmcif.get('_entity.type', []), strict=True\n  ):\n    chain_type = poly_type_by_entity_id.get(entity_id) or entity_type\n    chain_type_by_entity_id[entity_id] = chain_type\n\n  return chain_type_by_entity_id\n\n\ndef get_internal_to_author_chain_id_map(mmcif: Mmcif) -> Mapping[str, str]:\n  \"\"\"Returns a mapping from internal chain ID to the author chain ID.\n\n  Note that this is not a bijection. One author chain ID can map to multiple\n  internal chain IDs. 
For example, a protein chain and a ligand bound to it will\n  share the same author chain ID, but they will each have a unique internal\n  chain ID).\n\n  Args:\n    mmcif: CifDict holding the mmCIF.\n  \"\"\"\n  return mmcif_atom_site.get_internal_to_author_chain_id_map(mmcif)\n\n\ndef get_experimental_method(mmcif: Mmcif) -> str | None:\n  field = '_exptl.method'\n  return ','.join(mmcif[field]).lower() if field in mmcif else None\n\n\ndef get_release_date(mmcif: Mmcif) -> str | None:\n  \"\"\"Returns the oldest revision date.\"\"\"\n  if '_pdbx_audit_revision_history.revision_date' not in mmcif:\n    return None\n\n  # Release dates are ISO-8601, hence sort well.\n  return min(mmcif['_pdbx_audit_revision_history.revision_date'])\n\n\ndef get_resolution(mmcif: Mmcif) -> float | None:\n  \"\"\"Returns the resolution of the structure.\n\n  More than one resolution can be reported in an mmCIF. This function returns\n  the first one (in the order _refine.ls_d_res_high,\n  _em_3d_reconstruction.resolution, _reflns.d_resolution_high) that appears\n  in the mmCIF as is parseable as a float.\n\n  Args:\n    mmcif: An `Mmcif` object.\n\n  Returns:\n    The resolution as reported in the mmCIF.\n  \"\"\"\n  for res_key in ('_refine.ls_d_res_high',\n                  '_em_3d_reconstruction.resolution',\n                  '_reflns.d_resolution_high'):\n    if res_key in mmcif:\n      try:\n        raw_resolution = mmcif[res_key][0]\n        return float(raw_resolution)\n      except ValueError:\n        continue\n  return None\n\n\ndef parse_oper_expr(oper_expression: str) -> list[tuple[str, ...]]:\n  \"\"\"Determines which transforms to apply based on an MMCIF oper_expression str.\n\n  Args:\n    oper_expression: the field oper_expression from MMCIF format data.\n      Transform ids may be either numbers or single letters. Hyphens are used to\n      denote a numeric range of transforms to apply, and commas are used to\n      delimit a sequence of transforms. 
Where two sets of parentheses are\n      adjacent without a comma, the two sets of transforms should be combined as\n      a cartesian product, i.e. all possible pairs.\n      example 1,2,3 -> generate 3 copies of each chain by applying 1, 2 or 3.\n      example (1-3) -> generate 3 copies of each chain by applying 1, 2 or 3.\n      example (1-3)(4-6) -> generate 9 copies of each chain by applying one of\n        [(1,4), (1,5), (1,6),\n         (2,4), (2,5), (2,6),\n         (3,4), (3,5), (3,6)]\n      example (P) -> apply transform with id P.\n\n  Raises:\n    ValueError: Failure to parse oper_expression.\n\n  Returns:\n    A list with one element for each chain copy that should be generated.\n    Each element is a list of transform ids to apply.\n  \"\"\"\n  # Expand ranges, e.g. 1-4 -> 1,2,3,4.\n  def range_expander(match):\n    return ','.join(\n        [str(i) for i in range(int(match.group(1)),\n                               int(match.group(2)) + 1)])\n\n  ranges_expanded = re.sub(r'\\b(\\d+)-(\\d+)', range_expander, oper_expression)\n\n  if re.fullmatch(r'(\\w+,)*\\w+', ranges_expanded):\n    # No brackets, just a single range, e.g. \"1,2,3\".\n    return [(t,) for t in ranges_expanded.split(',')]\n  elif re.fullmatch(r'\\((\\w+,)*\\w+\\)', ranges_expanded):\n    # Single range in brackets, e.g. \"(1,2,3)\".\n    return [(t,) for t in ranges_expanded[1:-1].split(',')]\n  elif re.fullmatch(r'\\((\\w+,)*\\w+\\)\\((\\w+,)*\\w+\\)', ranges_expanded):\n    # Cartesian product of two ranges, e.g. 
\"(1,2,3)(4,5)\".\n    part1, part2 = ranges_expanded[1:-1].split(')(')\n    return list(itertools.product(part1.split(','), part2.split(',')))\n  else:\n    raise ValueError(f'Unsupported oper_expression format: {oper_expression}')\n\n\ndef format_float_array(\n    values: np.ndarray, num_decimal_places: int) -> Sequence[str]:\n  \"\"\"Converts 1D array to a list of strings with the given number of decimals.\n\n  This function is faster than converting via Python list comprehension, e.g.:\n  atoms_x = ['%.3f' % x for x in atoms_x]\n\n  Args:\n    values: A numpy array with values to convert. This array is casted to\n      float32 before doing the conversion.\n    num_decimal_places: The number of decimal points to keep, including trailing\n      zeros. E.g. for 1.07 and num_decimal_places=1: 1.1,\n      num_decimal_places=2: 1.07, num_decimal_places=3: 1.070.\n\n  Returns:\n    A list of formatted strings.\n  \"\"\"\n  if values.ndim != 1:\n    raise ValueError(f'The given array must be 1D, got {values.ndim}D')\n\n  return string_array.format_float_array(\n      values=values.astype(np.float32), num_decimal_places=num_decimal_places\n  )\n"
  },
  {
    "path": "src/alphafold3/structure/parsing.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Module for parsing various data sources and producing Structures.\"\"\"\n\nfrom collections.abc import Collection, Mapping, MutableMapping, Sequence\nimport dataclasses\nimport datetime\nimport enum\nimport functools\nimport itertools\nfrom typing import TypeAlias\n\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.constants import residue_names\nfrom alphafold3.cpp import mmcif_utils\nfrom alphafold3.cpp import string_array\nfrom alphafold3.structure import bioassemblies\nfrom alphafold3.structure import bonds\nfrom alphafold3.structure import chemical_components as struc_chem_comps\nfrom alphafold3.structure import mmcif\nfrom alphafold3.structure import structure\nfrom alphafold3.structure import structure_tables\nimport numpy as np\n\n\nChainIndex: TypeAlias = int\nResIndex: TypeAlias = int\nAtomName: TypeAlias = str\nBondAtomId: TypeAlias = tuple[ChainIndex, ResIndex, AtomName]\n\n_INSERTION_CODE_REMAP: Mapping[str, str] = {'.': '?'}\n\n\nclass NoAtomsError(Exception):\n  \"\"\"Raise when the mmCIF does not have any atoms.\"\"\"\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass BondIndices:\n  from_indices: list[int]\n  dest_indices: list[int]\n\n\n@enum.unique\nclass ModelID(enum.Enum):\n  \"\"\"Values for specifying model IDs when parsing.\"\"\"\n\n  FIRST = 1  # The first model in the file.\n  ALL = 2  # All models in the 
file.\n\n\n@enum.unique\nclass SequenceFormat(enum.Enum):\n  \"\"\"The possible formats for an input sequence.\"\"\"\n\n  FASTA = 'fasta'  # One-letter code used in FASTA.\n  CCD_CODES = 'ccd_codes'  # Multiple-letter chemical components dictionary ids.\n  LIGAND_SMILES = 'ligand_smiles'  # SMILES string defining a molecule.\n\n\ndef _create_bond_lookup(\n    bonded_atom_pairs: Sequence[tuple[BondAtomId, BondAtomId]],\n) -> Mapping[tuple[ChainIndex, ResIndex], Mapping[AtomName, BondIndices]]:\n  \"\"\"Creates maps to help find bonds during a loop over residues.\"\"\"\n  bond_lookup = {}\n  for bond_i, (from_atom_id, dest_atom_id) in enumerate(bonded_atom_pairs):\n    from_chain_i, from_res_i, from_atom_name = from_atom_id\n    dest_chain_i, dest_res_i, dest_atom_name = dest_atom_id\n    bonds_by_from_atom_name = bond_lookup.setdefault(\n        (from_chain_i, from_res_i), {}\n    )\n    bonds_by_dest_atom_name = bond_lookup.setdefault(\n        (dest_chain_i, dest_res_i), {}\n    )\n    bonds_by_from_atom_name.setdefault(\n        from_atom_name, BondIndices(from_indices=[], dest_indices=[])\n    ).from_indices.append(bond_i)\n    bonds_by_dest_atom_name.setdefault(\n        dest_atom_name, BondIndices(from_indices=[], dest_indices=[])\n    ).dest_indices.append(bond_i)\n  return bond_lookup\n\n\ndef _get_atom_element(\n    ccd: chemical_components.Ccd, res_name: str, atom_name: str\n) -> str:\n  type_symbol = chemical_components.type_symbol(\n      ccd, res_name=res_name, atom_name=atom_name\n  )\n  return type_symbol or '?'\n\n\ndef _get_representative_atom(\n    ccd: chemical_components.Ccd,\n    res_name: str,\n    chain_type: str,\n    sequence_format: SequenceFormat,\n) -> tuple[str, str]:\n  match sequence_format:\n    case SequenceFormat.CCD_CODES:\n      atom_name = _get_first_non_leaving_atom(ccd=ccd, res_name=res_name)\n      atom_element = _get_atom_element(\n          ccd=ccd, res_name=res_name, atom_name=atom_name\n      )\n      return atom_name, 
atom_element\n    case SequenceFormat.LIGAND_SMILES:\n      return '', '?'\n    case SequenceFormat.FASTA:\n      if chain_type in mmcif_names.PEPTIDE_CHAIN_TYPES:\n        return 'CA', 'C'\n      if chain_type in mmcif_names.NUCLEIC_ACID_CHAIN_TYPES:\n        return \"C1'\", 'C'\n      else:\n        raise ValueError(chain_type)\n    case _:\n      raise ValueError(sequence_format)\n\n\n@functools.lru_cache(maxsize=128)\ndef _get_first_non_leaving_atom(\n    ccd: chemical_components.Ccd, res_name: str\n) -> str:\n  \"\"\"Returns first definitely non-leaving atom if exists, as a stand-in.\"\"\"\n  all_atoms = struc_chem_comps.get_all_atoms_in_entry(ccd, res_name=res_name)[\n      '_chem_comp_atom.atom_id'\n  ]\n  representative_atom = all_atoms[0]\n  if representative_atom == 'O1' and len(all_atoms) > 1:\n    representative_atom = all_atoms[1]\n  return representative_atom\n\n\ndef _add_ligand_to_chem_comp(\n    chem_comp: MutableMapping[str, struc_chem_comps.ChemCompEntry],\n    ligand_id: str,\n    ligand_smiles: str,\n):\n  \"\"\"Adds a ligand to chemical components. 
Raises ValueError on mismatch.\"\"\"\n  new_entry = struc_chem_comps.ChemCompEntry(\n      type='non-polymer', pdbx_smiles=ligand_smiles\n  )\n\n  existing_entry = chem_comp.get(ligand_id)\n  if existing_entry is None:\n    chem_comp[ligand_id] = new_entry\n  elif existing_entry != new_entry:\n    raise ValueError(\n        f'Mismatching data for ligand {ligand_id}: '\n        f'{new_entry} != {existing_entry}'\n    )\n\n\ndef _get_first_model_id(cif: mmcif.Mmcif) -> str:\n  \"\"\"Returns cheaply the first model ID from the mmCIF.\"\"\"\n  return cif.get_array(\n      '_atom_site.pdbx_PDB_model_num', dtype=object, gather=slice(1)\n  )[0]\n\n\ndef _get_str_model_id(\n    cif: mmcif.Mmcif,\n    model_id: ModelID | int,\n) -> str:\n  \"\"\"Converts a user-specified model_id argument into a string.\"\"\"\n  match model_id:\n    case int():\n      str_model_id = str(model_id)\n    case enum.Enum():\n      # We compare the enum's value attribute since regular enum comparison\n      # breaks when adhoc importing.\n      match model_id.value:\n        case ModelID.FIRST.value:\n          try:\n            str_model_id = _get_first_model_id(cif)\n          except IndexError as e:\n            raise NoAtomsError(\n                'The mmCIF does not have any atoms or'\n                ' _atom_site.pdbx_PDB_model_num is missing.'\n            ) from e\n        case ModelID.ALL.value:\n          str_model_id = ''\n        case _:\n          raise ValueError(\n              f'Model ID {model_id} with value {model_id.value} not recognized.'\n          )\n    case _:\n      raise ValueError(\n          f'Model ID {model_id} with type {type(model_id)} not recognized.'\n      )\n  return str_model_id\n\n\ndef _parse_bonds(\n    cif: mmcif.Mmcif,\n    atom_key: np.ndarray,\n    model_id: str,\n) -> bonds.Bonds:\n  \"\"\"Returns the bonds table extracted from the mmCIF.\n\n  Args:\n    cif: The raw mmCIF to extract the bond information from.\n    atom_key: A numpy array defining atom 
key for each atom in _atom_site. Note\n      that the atom key must be computed before resolving alt-locs since this\n      function operates on the raw mmCIF!\n    model_id: The ID of the model to get bonds for.\n  \"\"\"\n  if '_struct_conn.id' not in cif:\n    # This is the category key item for the _struct_conn table, therefore\n    # we use it to determine whether to parse bond info.\n    return bonds.Bonds.make_empty()\n  from_atom, dest_atom = mmcif.get_bond_atom_indices(cif, model_id)\n  from_atom = np.array(from_atom, dtype=np.int64)\n  dest_atom = np.array(dest_atom, dtype=np.int64)\n  num_bonds = from_atom.shape[0]\n  bond_key = np.arange(num_bonds, dtype=np.int64)\n  bond_type = cif.get_array('_struct_conn.conn_type_id', dtype=object)\n  if '_struct_conn.pdbx_role' in cif:  # This column isn't always present.\n    bond_role = cif.get_array('_struct_conn.pdbx_role', dtype=object)\n  else:\n    bond_role = np.full((num_bonds,), '?', dtype=object)\n\n  bonds_mask = np.ones((num_bonds,), dtype=bool)\n  # Symmetries other than 1_555 imply the atom is not part of the asymmetric\n  # unit, and therefore this is a bond that only exists in the expanded\n  # bioassembly.\n  # We do not currently support parsing these types of bonds.\n  if '_struct_conn.ptnr1_symmetry' in cif:\n    ptnr1_symmetry = cif.get_array('_struct_conn.ptnr1_symmetry', dtype=object)\n    np.logical_and(bonds_mask, ptnr1_symmetry == '1_555', out=bonds_mask)\n  if '_struct_conn.ptnr2_symmetry' in cif:\n    ptnr2_symmetry = cif.get_array('_struct_conn.ptnr2_symmetry', dtype=object)\n    np.logical_and(bonds_mask, ptnr2_symmetry == '1_555', out=bonds_mask)\n  # Remove bonds that involve atoms that are not part of the structure,\n  # e.g. waters if include_water=False. 
In a rare case this also removes invalid\n  # bonds that are indicated by a key that is set to _atom_site size.\n  np.logical_and(bonds_mask, np.isin(from_atom, atom_key), out=bonds_mask)\n  np.logical_and(bonds_mask, np.isin(dest_atom, atom_key), out=bonds_mask)\n  return bonds.Bonds(\n      key=bond_key[bonds_mask],\n      type=bond_type[bonds_mask],\n      role=bond_role[bonds_mask],\n      from_atom_key=from_atom[bonds_mask],\n      dest_atom_key=dest_atom[bonds_mask],\n  )\n\n\n@dataclasses.dataclass(frozen=True, slots=True)\nclass _MmcifHeader:\n  name: str\n  resolution: float | None\n  release_date: datetime.date | None\n  structure_method: str | None\n  bioassembly_data: bioassemblies.BioassemblyData | None\n  chemical_components_data: struc_chem_comps.ChemicalComponentsData | None\n\n\ndef _get_mmcif_header(\n    cif: mmcif.Mmcif,\n    fix_mse: bool,\n    fix_unknown_dna: bool,\n) -> _MmcifHeader:\n  \"\"\"Extract header fields from an mmCIF object.\"\"\"\n  entry_id = cif.get('_entry.id')\n  name = entry_id[0] if entry_id else cif.get_data_name()\n  resolution = mmcif.get_resolution(cif)\n\n  release_date = mmcif.get_release_date(cif)\n  if release_date is not None:\n    release_date = datetime.date.fromisoformat(release_date)\n\n  experiments = cif.get('_exptl.method')\n  structure_method = ','.join(experiments) if experiments else None\n\n  try:\n    bioassembly_data = bioassemblies.BioassemblyData.from_mmcif(cif)\n  except bioassemblies.MissingBioassemblyDataError:\n    bioassembly_data = None\n\n  try:\n    chemical_components_data = (\n        struc_chem_comps.ChemicalComponentsData.from_mmcif(\n            cif, fix_mse=fix_mse, fix_unknown_dna=fix_unknown_dna\n        )\n    )\n  except struc_chem_comps.MissingChemicalComponentsDataError:\n    chemical_components_data = None\n\n  return _MmcifHeader(\n      name=name,\n      resolution=resolution,\n      release_date=release_date,\n      structure_method=structure_method,\n      
bioassembly_data=bioassembly_data,\n      chemical_components_data=chemical_components_data,\n  )\n\n\ndef from_parsed_mmcif(\n    mmcif_object: mmcif.Mmcif,\n    *,\n    name: str | None = None,\n    fix_mse_residues: bool = False,\n    fix_arginines: bool = False,\n    fix_unknown_dna: bool = False,\n    include_water: bool = False,\n    include_other: bool = False,\n    include_bonds: bool = False,\n    model_id: int | ModelID = ModelID.FIRST,\n) -> structure.Structure:\n  \"\"\"Construct a Structure from a parsed mmCIF object.\n\n  This function is called by `from_mmcif` but can be useful when an mmCIF has\n  already been parsed e.g. to extract extra information from the header before\n  then converting to Structure for further manipulation.\n\n  Args:\n    mmcif_object: A parsed mmcif.Mmcif object.\n    name: Optional name for the structure. If not provided, the name will be\n      taken from the mmCIF data_ field.\n    fix_mse_residues: If True, selenium atom sites (SE) in selenomethionine\n      (MSE) residues will be changed to sulphur atom sites (SD). This is because\n      methionine (MET) residues are often replaced with MSE to aid X-Ray\n      crystallography. If False, the SE MSE atom sites won't be modified.\n    fix_arginines: If True, NH1 and NH2 in arginine will be swapped if needed so\n      that NH1 is always closer to CD than NH2. If False, no atom sites in\n      arginine will be touched. Note that HH11, HH12, HH21, HH22 are fixed too.\n    fix_unknown_dna: If True, residues with name N in DNA chains will have their\n      res_name replaced with DN. Atoms are not changed.\n    include_water: If True, water (HOH) molecules will be parsed. Water\n      molecules may be grouped into chains, where number of residues > 1. 
Water\n      molecules are usually grouped into chains but do not necessarily all share\n      the same chain ID.\n    include_other: If True, all other atoms that are not included by any of the\n      above parameters will be included. This covers e.g. \"polypeptide(D)\" and\n      \"macrolide\" entities, as well as all other non-standard types.\n    include_bonds: If True, bond information will be parsed from the mmCIF and\n      stored in the Structure.\n    model_id: Either the integer model ID to parse, or one of ModelID.FIRST to\n      parse the first model, or ModelID.ALL to parse all models.\n\n  Returns:\n    A Structure representation of the mmCIF object.\n  \"\"\"\n  str_model_id = _get_str_model_id(cif=mmcif_object, model_id=model_id)\n  header = _get_mmcif_header(\n      mmcif_object, fix_mse=fix_mse_residues, fix_unknown_dna=fix_unknown_dna\n  )\n\n  chains, residues, atoms = get_tables(\n      cif=mmcif_object,\n      fix_mse_residues=fix_mse_residues,\n      fix_arginines=fix_arginines,\n      fix_unknown_dna=fix_unknown_dna,\n      include_water=include_water,\n      include_other=include_other,\n      model_id=str_model_id,\n  )\n\n  if include_bonds and atoms.size > 0:\n    # NB: parsing the atom table before the bonds table allows for a more\n    # informative error message when dealing with bad multi-model mmCIFs.\n    # Also always use a specific model ID, even when parsing all models.\n    if str_model_id == '':  # pylint: disable=g-explicit-bool-comparison\n      bonds_model_id = _get_first_model_id(mmcif_object)\n    else:\n      bonds_model_id = str_model_id\n\n    bonds_table = _parse_bonds(\n        mmcif_object,\n        atom_key=atoms.key,\n        model_id=bonds_model_id,\n    )\n  else:\n    bonds_table = bonds.Bonds.make_empty()\n\n  return structure.Structure(\n      name=name if name is not None else header.name,\n      resolution=header.resolution,\n      release_date=header.release_date,\n      
structure_method=header.structure_method,\n      bioassembly_data=header.bioassembly_data,\n      chemical_components_data=header.chemical_components_data,\n      bonds=bonds_table,\n      chains=chains,\n      residues=residues,\n      atoms=atoms,\n  )\n\n\ndef from_mmcif(\n    mmcif_string: str | bytes,\n    *,\n    name: str | None = None,\n    fix_mse_residues: bool = False,\n    fix_arginines: bool = False,\n    fix_unknown_dna: bool = False,\n    include_water: bool = False,\n    include_other: bool = False,\n    include_bonds: bool = False,\n    model_id: int | ModelID = ModelID.FIRST,\n) -> structure.Structure:\n  \"\"\"Construct a Structure from a mmCIF string.\n\n  Args:\n    mmcif_string: The string contents of an mmCIF file.\n    name: Optional name for the structure. If not provided, the name will be\n      taken from the mmCIF data_ field.\n    fix_mse_residues: If True, selenium atom sites (SE) in selenomethionine\n      (MSE) residues will be changed to sulphur atom sites (SD). This is because\n      methionine (MET) residues are often replaced with MSE to aid X-Ray\n      crystallography. If False, the SE MSE atom sites won't be modified.\n    fix_arginines: If True, NH1 and NH2 in arginine will be swapped if needed so\n      that NH1 is always closer to CD than NH2. If False, no atom sites in\n      arginine will be touched. Note that HH11, HH12, HH21, HH22 are fixed too.\n    fix_unknown_dna: If True, residues with name N in DNA chains will have their\n      res_name replaced with DN. Atoms are not changed.\n    include_water: If True, water (HOH) molecules will be parsed. Water\n      molecules may be grouped into chains, where number of residues > 1. Water\n      molecules are usually grouped into chains but do not necessarily all share\n      the same chain ID.\n    include_other: If True, all other atoms that are not included by any of the\n      above parameters will be included. This covers e.g. 
\"polypeptide(D)\" and\n      \"macrolide\" entities, as well as all other non-standard types.\n    include_bonds: If True, bond information will be parsed from the mmCIF and\n      stored in the Structure.\n    model_id: Either the integer model ID to parse, or one of ModelID.FIRST to\n      parse the first model, or ModelID.ALL to parse all models.\n\n  Returns:\n    A Structure representation of the mmCIF string.\n  \"\"\"\n  mmcif_object = mmcif.from_string(mmcif_string)\n\n  return from_parsed_mmcif(\n      mmcif_object,\n      name=name,\n      fix_mse_residues=fix_mse_residues,\n      fix_arginines=fix_arginines,\n      fix_unknown_dna=fix_unknown_dna,\n      include_water=include_water,\n      include_other=include_other,\n      include_bonds=include_bonds,\n      model_id=model_id,\n  )\n\n\ndef from_res_arrays(atom_mask: np.ndarray, **kwargs) -> structure.Structure:\n  \"\"\"Returns Structure created from from arrays with a residue dimension.\n\n  All unset fields are filled with defaults (e.g. 1.0 for occupancy) or\n  unset/unknown values (e.g. UNK for residue type, or '.' for atom element).\n\n  Args:\n    atom_mask: A array with shape (num_res, num_atom). This is used to decide\n      which atoms in the atom dimension are present in a given residue. Present\n      atoms should have a nonzero value, e.g. 1.0 or True.\n    **kwargs: A mapping from field name to values. For all array-valued fields\n      these arrays must have a dimension of length num_res. Chain and residue\n      fields should have this as their only dimension and atom fields should be\n      shaped (num_res, num_atom). 
Coordinate fields may also have arbitrary\n      leading dimensions (they must be the same across all coordinate fields).\n      See structure.{CHAIN,RESIDUE,ATOM}_FIELDS for a list of allowed fields.\n  \"\"\"\n  num_res, num_atom = atom_mask.shape\n  included_indices = np.flatnonzero(atom_mask)\n\n  array_fields = (\n      structure.CHAIN_FIELDS.keys()\n      | structure.RESIDUE_FIELDS.keys()\n      | structure.ATOM_FIELDS.keys()\n  )\n  initializer_kwargs = {}\n  fields = {}\n  for k, val in kwargs.items():\n    if k not in array_fields:\n      # The kwarg key isn't an array field name. Such kwargs are forwarded as-is\n      # to the constructor. They are expected to be global fields (e.g. name).\n      # Other values will raise an error when the constructor is called.\n      if k in structure.TABLE_FIELDS:\n        raise ValueError(f'Table fields must not be set. Got {k}.')\n      initializer_kwargs[k] = val\n      continue\n    elif val is None:\n      raise ValueError(f'{k} must be non-None.')\n\n    if not isinstance(val, np.ndarray):\n      raise TypeError(f'Value for {k} must be a NumPy array. Got {type(val)}.')\n    if k in structure.CHAIN_FIELDS or k in structure.RESIDUE_FIELDS:\n      if val.shape != (num_res,):\n        raise ValueError(\n            f'{k} must have shape ({num_res=},). Got {val.shape=}.'\n        )\n      # Do not reshape the chain/residue arrays, they have the shape we need.\n      fields[k] = val\n    else:\n      assert k in structure.ATOM_FIELDS\n      if val.shape[-2:] != (num_res, num_atom):\n        raise ValueError(\n            f'{k} must have final two dimensions of length '\n            f'{(num_res, num_atom)=}. 
Got {val.shape=}.'\n        )\n      leading_dims = val.shape[:-2]\n      flat_val = val.reshape(leading_dims + (-1,), order='C')\n      masked_val = flat_val[..., included_indices]\n      fields[k] = masked_val\n\n  # Get chain IDs or assume this is a single-chain structure.\n  chain_id = kwargs.get('chain_id', np.array(['A'] * num_res, dtype=object))\n  # Find chain starts in res-sized arrays, use these to make chain-sized arrays.\n  chain_start = np.concatenate(\n      ([0], np.where(chain_id[1:] != chain_id[:-1])[0] + 1)\n  )\n  if len(set(chain_id)) != len(chain_start):\n    raise ValueError(f'Chain IDs must be contiguous, but got {chain_id}')\n\n  chain_lengths = np.diff(chain_start, append=len(chain_id))\n  chain_key = np.repeat(np.arange(len(chain_start)), chain_lengths)\n\n  chain_entity_id = fields.get('chain_entity_id')\n  if chain_entity_id is not None:\n    entity_id = chain_entity_id[chain_start]\n  else:\n    entity_id = np.array(\n        [str(mmcif.str_id_to_int_id(cid)) for cid in chain_id[chain_start]],\n        dtype=object,\n    )\n  chain_str_empty = np.full((num_res,), '.', dtype=object)\n  chains_table = structure_tables.Chains(\n      key=chain_key[chain_start],\n      id=chain_id[chain_start],\n      type=fields.get('chain_type', chain_str_empty)[chain_start],\n      auth_asym_id=fields.get('chain_auth_asym_id', chain_id)[chain_start],\n      entity_id=entity_id,\n      entity_desc=fields.get('chain_entity_desc', chain_str_empty)[chain_start],\n  )\n\n  # Since all arrays are residue-shaped, we can use them directly.\n  res_key = np.arange(num_res, dtype=np.int64)\n  res_id = fields.get('res_id', res_key + 1).astype(np.int32)\n  residues_table = structure_tables.Residues(\n      key=res_key,\n      chain_key=chain_key,\n      id=res_id,\n      name=fields.get('res_name', np.full(num_res, 'UNK', dtype=object)),\n      auth_seq_id=fields.get(\n          'res_auth_seq_id', np.char.mod('%d', res_id).astype(object)\n      ),\n      
insertion_code=fields.get(\n          'res_insertion_code', np.full(num_res, '?', dtype=object)\n      ),\n  )\n\n  # The atom-sized arrays have already been masked and reshaped.\n  num_atoms_per_res = np.sum(atom_mask, axis=1, dtype=np.int32)\n  num_atoms_total = np.sum(num_atoms_per_res, dtype=np.int32)\n  # Structure is immutable, so use the same array multiple times to save RAM.\n  atom_str_empty = np.full(num_atoms_total, '.', dtype=object)\n  atom_float32_zeros = np.zeros(num_atoms_total, dtype=np.float32)\n  atom_float32_ones = np.ones(num_atoms_total, dtype=np.float32)\n  atoms_table = structure_tables.Atoms(\n      key=np.arange(num_atoms_total, dtype=np.int64),\n      chain_key=np.repeat(chain_key, num_atoms_per_res),\n      res_key=np.repeat(res_key, num_atoms_per_res),\n      name=fields.get('atom_name', atom_str_empty),\n      element=fields.get('atom_element', atom_str_empty),\n      x=fields.get('atom_x', atom_float32_zeros),\n      y=fields.get('atom_y', atom_float32_zeros),\n      z=fields.get('atom_z', atom_float32_zeros),\n      b_factor=fields.get('atom_b_factor', atom_float32_zeros),\n      occupancy=fields.get('atom_occupancy', atom_float32_ones),\n  )\n\n  return structure.Structure(\n      chains=chains_table,\n      residues=residues_table,\n      atoms=atoms_table,\n      bonds=structure_tables.Bonds.make_empty(),  # Currently not set.\n      **initializer_kwargs,\n  )\n\n\ndef expand_sequence(\n    sequence: str, chain_type: str, sequence_format: SequenceFormat\n) -> Sequence[str]:\n  \"\"\"Returns full residue names based on a sequence string.\n\n  Args:\n    sequence: A string representing the sequence.\n    chain_type: The chain type of the sequence.\n    sequence_format: The format of the sequence argument.\n  \"\"\"\n  match sequence_format:\n    case SequenceFormat.FASTA:\n      if not all(c.isalpha() for c in sequence):\n        raise ValueError(f'Sequence \"{sequence}\" has non-alphabetic characters')\n      match chain_type:\n    
    case mmcif_names.PROTEIN_CHAIN:\n          res_name_map = residue_names.PROTEIN_COMMON_ONE_TO_THREE\n          default_res_name = residue_names.UNK\n        case mmcif_names.RNA_CHAIN:\n          res_name_map = {r: r for r in residue_names.RNA_TYPES}\n          default_res_name = residue_names.UNK_RNA\n        case mmcif_names.DNA_CHAIN:\n          res_name_map = residue_names.DNA_COMMON_ONE_TO_TWO\n          default_res_name = residue_names.UNK_DNA\n        case _:\n          raise ValueError(f'{chain_type=} not supported for FASTA format.')\n      return [\n          res_name_map.get(one_letter_res, default_res_name)\n          for one_letter_res in sequence\n      ]\n    case SequenceFormat.CCD_CODES:\n      return sequence.strip('()').split(')(')\n    case SequenceFormat.LIGAND_SMILES:\n      ligand_id, _ = sequence.split(':', maxsplit=1)\n      return [ligand_id]\n\n\ndef from_sequences_and_bonds(\n    *,\n    sequences: Sequence[str],\n    chain_types: Sequence[str],\n    sequence_formats: Sequence[SequenceFormat],\n    bonded_atom_pairs: Sequence[tuple[BondAtomId, BondAtomId]] | None,\n    ccd: chemical_components.Ccd,\n    chain_ids: Sequence[str] | None = None,\n    name: str = 'from_sequences_and_bonds',\n    bond_type: str | None = None,\n    **constructor_args,\n) -> structure.Structure:\n  \"\"\"Returns a minimal structure for the input sequences and bonds.\n\n  The returned structure will have at least one atom per residue. If the\n  residue has any bonded atoms, according to `bonded_atom_pairs`, then\n  all (and only) those atoms will be present for that residue. If the residue\n  is not involved in any bond then an arbitrary atom will be created.\n\n  Args:\n    sequences: A sequence of strings, each one representing a single chain.\n    chain_types: The types of each chain, e.g. polypeptide(L). The n-th element\n      describes the n-th sequence in `sequences`.\n    sequence_formats: The format of each sequence. 
The n-th element describes\n      the n-th sequence in `sequences`.\n    bonded_atom_pairs: A sequence of bonded atom pairs. Each atom is described\n      as a tuple of (chain_index, res_index, atom_name), where the first two\n      values are 0-based indices. The chain_index is the index of the chain in\n      the `sequences` argument, and the res_index is the index of the residue in\n      that sequence. The atom_name is the name of the atom in the residue, e.g.\n      CA. If the atom is not found in the standard atoms for that residue\n      (according to the CCD) then an error is raised.\n    ccd: The chemical components dictionary.\n    chain_ids: A sequence of chain IDs, one for each chain in `sequences`. If\n      not provided, then the chain IDs will be generated automatically based on\n      sequence indices.\n    name: A name for the returned structure.\n    bond_type: This type will be used for all bonds in the structure, where type\n      follows PDB scheme, e.g. unknown (?), hydrog, metalc, covale, disulf.\n    **constructor_args: These arguments are passed directly to the\n      structure.Structure constructor.\n  \"\"\"\n  chain_id = []\n  chain_type = []\n  chain_res_count = []\n  res_id = []\n  res_name = []\n  res_atom_count = []\n  atom_name = []\n  atom_element = []\n  chem_comp = {}\n\n  num_bonds = len(bonded_atom_pairs or ())\n  from_atom_key = np.full((num_bonds,), -1, dtype=np.int64)\n  dest_atom_key = np.full((num_bonds,), -1, dtype=np.int64)\n\n  # Create map (chain_i, res_i) -> {atom_name -> (from_idxs dest_idxs)}.\n  # This allows quick lookup of whether a residue has any bonded atoms, and\n  # which bonds those atoms participate in.\n  bond_lookup = _create_bond_lookup(bonded_atom_pairs or ())\n\n  current_atom_key = 0\n  for chain_i, (sequence, curr_chain_type, sequence_format) in enumerate(\n      zip(sequences, chain_types, sequence_formats, strict=True)\n  ):\n    if chain_ids is not None:\n      current_chain_id = 
chain_ids[chain_i]\n    else:\n      current_chain_id = mmcif.int_id_to_str_id(chain_i + 1)\n    num_chain_residues = 0\n    for res_i, full_res_name in enumerate(\n        expand_sequence(sequence, curr_chain_type, sequence_format)\n    ):\n      current_res_id = res_i + 1\n      num_res_atoms = 0\n\n      # Look for bonded atoms in the bond lookup and if any are found, add\n      # their atom keys to the bond atom_key columns.\n      if bond_indices_by_atom_name := bond_lookup.get((chain_i, res_i)):\n        comp_atoms = None\n        if sequence_format != SequenceFormat.LIGAND_SMILES:\n          comp_atoms = set(ccd.get(full_res_name)['_chem_comp_atom.atom_id'])\n        for bond_atom_name, bond_indices in bond_indices_by_atom_name.items():\n          if comp_atoms is not None and bond_atom_name not in comp_atoms:\n            raise ValueError(\n                f'Bonded atom \"{bond_atom_name}\" was not found in the list of'\n                f' atoms of the chemical component {full_res_name}. 
Valid atom'\n                f' names for {full_res_name} are: {sorted(comp_atoms)}.'\n                ' This is likely caused by an invalid atom name in the bonded'\n                f' atom (chain_id={current_chain_id}, res_id={current_res_id},'\n                f' atom_name={bond_atom_name}) specified in `bondedAtomPairs`'\n                ' in the input JSON.'\n            )\n          atom_name.append(bond_atom_name)\n          atom_element.append(\n              _get_atom_element(\n                  ccd=ccd, res_name=full_res_name, atom_name=bond_atom_name\n              )\n          )\n          for from_bond_i in bond_indices.from_indices:\n            from_atom_key[from_bond_i] = current_atom_key\n          for dest_bond_i in bond_indices.dest_indices:\n            dest_atom_key[dest_bond_i] = current_atom_key\n          current_atom_key += 1\n          num_res_atoms += 1\n      else:\n        # If this residue has no bonded atoms then we need to add one atom\n        # like in from_sequences.\n        assert num_res_atoms == 0\n        rep_atom_name, rep_atom_element = _get_representative_atom(\n            ccd=ccd,\n            res_name=full_res_name,\n            chain_type=curr_chain_type,\n            sequence_format=sequence_format,\n        )\n        atom_name.append(rep_atom_name)\n        atom_element.append(rep_atom_element)\n        num_res_atoms += 1\n        current_atom_key += 1\n\n      if sequence_format == SequenceFormat.LIGAND_SMILES:\n        # Sequence is expected to be in the format <ligand_id>:<ligand_smiles>,\n        # which always corresponds to a single-residue chain.\n        ligand_id, ligand_smiles = sequence.split(':', maxsplit=1)\n        if ccd.get(ligand_id) is not None:\n          raise ValueError(\n              f'Ligand name {ligand_id} is in CCD - it is not supported to give'\n              ' ligands created from SMILES the same name as CCD components.'\n          )\n        # We need to provide additional chemical 
components metadata for\n        # ligands specified via SMILES strings since they might not be in CCD.\n        _add_ligand_to_chem_comp(chem_comp, ligand_id, ligand_smiles)\n\n      assert num_res_atoms >= 1\n      res_atom_count.append(num_res_atoms)\n      num_chain_residues += 1\n      res_id.append(current_res_id)\n      res_name.append(full_res_name)\n\n    chain_id.append(current_chain_id)\n    chain_type.append(curr_chain_type)\n    chain_res_count.append(num_chain_residues)\n\n  chem_comp_data = struc_chem_comps.ChemicalComponentsData(chem_comp)\n  chem_comp_data = struc_chem_comps.populate_missing_ccd_data(\n      ccd=ccd,\n      chemical_components_data=chem_comp_data,\n      chemical_component_ids=set(res_name),\n  )\n\n  if bonded_atom_pairs is not None:\n    unknown_bond_col = np.full((num_bonds,), '?', dtype=object)\n    if bond_type is None:\n      bond_type_col = unknown_bond_col\n    else:\n      bond_type_col = np.full((num_bonds,), bond_type, dtype=object)\n    bonds_table = bonds.Bonds(\n        key=np.arange(num_bonds, dtype=np.int64),\n        type=bond_type_col,\n        role=unknown_bond_col,\n        from_atom_key=from_atom_key,\n        dest_atom_key=dest_atom_key,\n    )\n  else:\n    bonds_table = structure_tables.Bonds.make_empty()\n\n  chain_key = np.arange(len(sequences), dtype=np.int64)  # 1 chain per sequence.\n  chain_id = np.array(chain_id, dtype=object)\n  chains_table = structure_tables.Chains(\n      key=chain_key,\n      id=chain_id,\n      type=np.array(chain_type, dtype=object),\n      auth_asym_id=chain_id,\n      entity_id=np.char.mod('%d', chain_key + 1).astype(object),\n      entity_desc=np.array(['.'] * len(chain_key), dtype=object),\n  )\n\n  res_key = np.arange(len(res_name), dtype=np.int64)\n  res_chain_key = np.repeat(chain_key, chain_res_count)\n  residues_table = structure_tables.Residues(\n      key=res_key,\n      chain_key=res_chain_key,\n      id=np.array(res_id, dtype=np.int32),\n      
name=np.array(res_name, dtype=object),\n      auth_seq_id=np.char.mod('%d', res_id).astype(object),\n      insertion_code=np.full(len(res_name), '?', dtype=object),\n  )\n\n  num_atoms = current_atom_key\n  atom_float32_zeros = np.zeros(num_atoms, dtype=np.float32)\n  atoms_table = structure_tables.Atoms(\n      key=np.arange(num_atoms, dtype=np.int64),\n      chain_key=np.repeat(res_chain_key, res_atom_count),\n      res_key=np.repeat(res_key, res_atom_count),\n      name=np.array(atom_name, dtype=object),\n      element=np.array(atom_element, dtype=object),\n      x=atom_float32_zeros,\n      y=atom_float32_zeros,\n      z=atom_float32_zeros,\n      b_factor=atom_float32_zeros,\n      occupancy=np.ones(num_atoms, np.float32),\n  )\n\n  return structure.Structure(\n      name=name,\n      atoms=atoms_table,\n      residues=residues_table,\n      chains=chains_table,\n      bonds=bonds_table,\n      chemical_components_data=chem_comp_data,\n      **constructor_args,\n  )\n\n\nclass _ChainResBuilder:\n  \"\"\"Class for incrementally building chain and residue tables.\"\"\"\n\n  def __init__(\n      self,\n      *,\n      chain_key_by_chain_id: Mapping[str, int],\n      entity_id_by_chain_id: Mapping[str, str],\n      chain_type_by_entity_id: Mapping[str, str],\n      entity_desc_by_entity_id: Mapping[str, str],\n      fix_mse_residues: bool,\n      fix_unknown_dna: bool,\n  ):\n    # Len: num_chains.\n    self.chain_key = []\n    self.chain_id = []\n    self.chain_type = []\n    self.chain_auth_asym_id = []\n    self.chain_entity_id = []\n    self.chain_entity_desc = []\n\n    # Len: num_residues.\n    self.res_key = []\n    self.res_chain_key = []\n    self.res_id = []\n    self.res_name = []\n    self.res_auth_seq_id = []\n    self.res_insertion_code = []\n\n    self.chain_key_by_chain_id = chain_key_by_chain_id\n    self.entity_id_by_chain_id = entity_id_by_chain_id\n    self.chain_type_by_entity_id = chain_type_by_entity_id\n    self.entity_desc_by_entity_id = 
entity_desc_by_entity_id\n    self.key_for_res: dict[tuple[str, str, str, str], int] = {}\n\n    self._fix_mse_residues = fix_mse_residues\n    self._fix_unknown_dna = fix_unknown_dna\n\n  def add_residues(\n      self,\n      *,\n      chain_ids: np.ndarray,\n      chain_auth_asym_ids: np.ndarray,\n      res_ids: np.ndarray,\n      res_names: np.ndarray,\n      res_auth_seq_ids: np.ndarray,\n      res_ins_codes: np.ndarray,\n  ):\n    \"\"\"Adds a residue (and its chain) to the tables.\"\"\"\n    # Create chain table data.\n    if chain_ids.size == 0:\n      return\n\n    chain_ids_with_prev = np.concatenate(\n        (([self.chain_id[-1] if self.chain_id else None], chain_ids))\n    )\n    chain_change_mask = chain_ids_with_prev[:-1] != chain_ids_with_prev[1:]\n    chain_change_ids = chain_ids[chain_change_mask]\n    chain_keys = string_array.remap(\n        chain_change_ids, self.chain_key_by_chain_id, inplace=False\n    )\n    self.chain_key.extend(chain_keys)\n    self.chain_id.extend(chain_change_ids)\n    self.chain_auth_asym_id.extend(chain_auth_asym_ids[chain_change_mask])\n    chain_entity_id = string_array.remap(\n        chain_change_ids, self.entity_id_by_chain_id, inplace=False\n    )\n    self.chain_entity_id.extend(chain_entity_id)\n    chain_type = string_array.remap(\n        chain_entity_id, self.chain_type_by_entity_id, inplace=False\n    )\n    self.chain_type.extend(chain_type)\n    chain_entity_desc = string_array.remap(\n        chain_entity_id, self.entity_desc_by_entity_id, inplace=False\n    )\n    self.chain_entity_desc.extend(chain_entity_desc)\n\n    # Create residue table data.\n    num_prev_res = len(self.res_id)\n    res_keys = np.arange(num_prev_res, num_prev_res + len(res_ids))\n    res_iter = zip(\n        chain_ids,\n        res_auth_seq_ids,\n        res_names,\n        res_ins_codes,\n        strict=True,\n    )\n    key_for_res_update = {\n        res_unique_id: res_key\n        for res_key, res_unique_id in 
enumerate(res_iter, num_prev_res)\n    }\n    self.key_for_res.update(key_for_res_update)\n    self.res_key.extend(res_keys)\n    self.res_chain_key.extend(\n        string_array.remap(chain_ids, self.chain_key_by_chain_id, inplace=False)\n    )\n    self.res_id.extend(res_ids)\n    self.res_name.extend(res_names)\n    self.res_auth_seq_id.extend(res_auth_seq_ids)\n    self.res_insertion_code.extend(res_ins_codes)\n\n  def make_chains_table(self) -> structure_tables.Chains:\n    \"\"\"Returns the Structure chains table.\"\"\"\n    chain_key = np.array(self.chain_key, dtype=np.int64)\n    if not np.all(chain_key[:-1] <= chain_key[1:]):\n      # If the order is inconsistent with the atoms table, sort so that it is.\n      order = np.argsort(self.chain_key, kind='stable')\n      return structure_tables.Chains(\n          key=chain_key[order],\n          id=np.array(self.chain_id, dtype=object)[order],\n          type=np.array(self.chain_type, dtype=object)[order],\n          auth_asym_id=np.array(self.chain_auth_asym_id, dtype=object)[order],\n          entity_id=np.array(self.chain_entity_id, dtype=object)[order],\n          entity_desc=np.array(self.chain_entity_desc, dtype=object)[order],\n      )\n    return structure_tables.Chains(\n        key=chain_key,\n        id=np.array(self.chain_id, dtype=object),\n        type=np.array(self.chain_type, dtype=object),\n        auth_asym_id=np.array(self.chain_auth_asym_id, dtype=object),\n        entity_id=np.array(self.chain_entity_id, dtype=object),\n        entity_desc=np.array(self.chain_entity_desc, dtype=object),\n    )\n\n  def make_residues_table(self) -> structure_tables.Residues:\n    \"\"\"Returns the Structure residues table.\"\"\"\n    res_name = np.array(self.res_name, dtype=object)\n    res_chain_key = np.array(self.res_chain_key, dtype=np.int64)\n\n    if self._fix_mse_residues:\n      string_array.remap(res_name, mapping={'MSE': 'MET'}, inplace=True)\n\n    if self._fix_unknown_dna:\n      # Remap 
residues from N -> DN in DNA chains only.\n      dna_chain_mask = (\n          np.array(self.chain_type, dtype=object) == mmcif_names.DNA_CHAIN\n      )\n      dna_chain_key = np.array(self.chain_key, dtype=object)[dna_chain_mask]\n      res_name[(res_name == 'N') & np.isin(res_chain_key, dna_chain_key)] = 'DN'\n\n    if not np.all(res_chain_key[:-1] <= res_chain_key[1:]):\n      # If the order is inconsistent with the atoms table, sort so that it is.\n      order = np.argsort(res_chain_key, kind='stable')\n      return structure_tables.Residues(\n          key=np.array(self.res_key, dtype=np.int64)[order],\n          chain_key=res_chain_key[order],\n          id=np.array(self.res_id, dtype=np.int32)[order],\n          name=res_name[order],\n          auth_seq_id=np.array(self.res_auth_seq_id, dtype=object)[order],\n          insertion_code=np.array(self.res_insertion_code, dtype=object)[order],\n      )\n    return structure_tables.Residues(\n        key=np.array(self.res_key, dtype=np.int64),\n        chain_key=res_chain_key,\n        id=np.array(self.res_id, dtype=np.int32),\n        name=res_name,\n        auth_seq_id=np.array(self.res_auth_seq_id, dtype=object),\n        insertion_code=np.array(self.res_insertion_code, dtype=object),\n    )\n\n\ndef _get_string_array_default(cif: mmcif.Mmcif, key: str, default: list[str]):\n  try:\n    return cif.get_array(key, dtype=object)\n  except KeyError:\n    return default\n\n\ndef _generate_required_tables_if_missing(\n    cif: mmcif.Mmcif,\n) -> Mapping[str, Sequence[str]]:\n  \"\"\"Generates all required tables and columns if missing.\"\"\"\n  update = {}\n\n  atom_site_entities = _get_string_array_default(\n      cif, '_atom_site.label_entity_id', []\n  )\n\n  # OpenMM produces files that don't have any of the tables and also have\n  # _atom_site.label_entity_id set to '?' for all atoms. We infer the entities\n  # based on the _atom_site.label_asym_id column. 
We start with cheaper O(1)\n  # checks to prevent running the expensive O(n) check on most files.\n  if (\n      len(atom_site_entities) > 0  # pylint: disable=g-explicit-length-test\n      and '_entity.id' not in cif  # Ignore if the _entity table exists.\n      and atom_site_entities[0] == '?'  # Cheap check.\n      and set(atom_site_entities) == {'?'}  # Expensive check.\n  ):\n    label_asym_ids = cif.get_array('_atom_site.label_asym_id', dtype=object)\n    atom_site_entities = [\n        str(mmcif.str_id_to_int_id(cid)) for cid in label_asym_ids\n    ]\n    # Update _atom_site.label_entity_id to be consistent with the new tables.\n    update['_atom_site.label_entity_id'] = atom_site_entities\n\n  # Check table existence by checking the presence of its primary key.\n  if '_struct_asym.id' not in cif:\n    # Infer the _struct_asym table using the _atom_site table.\n    asym_ids = _get_string_array_default(cif, '_atom_site.label_asym_id', [])\n\n    if len(atom_site_entities) == 0 or len(asym_ids) == 0:  # pylint: disable=g-explicit-length-test\n      raise ValueError(\n          'Could not parse an mmCIF with no _struct_asym table and also no '\n          '_atom_site.label_entity_id or _atom_site.label_asym_id columns.'\n      )\n\n    # Deduplicate, but keep the order intact - dict.fromkeys maintains order.\n    entity_id_chain_id_pairs = list(\n        dict.fromkeys(zip(atom_site_entities, asym_ids, strict=True))\n    )\n    update['_struct_asym.entity_id'] = [e for e, _ in entity_id_chain_id_pairs]\n    update['_struct_asym.id'] = [c for _, c in entity_id_chain_id_pairs]\n\n  if '_entity.id' not in cif:\n    # Infer the _entity_poly and _entity tables using the _atom_site table.\n    residues = _get_string_array_default(cif, '_atom_site.label_comp_id', [])\n    group_pdb = _get_string_array_default(cif, '_atom_site.group_PDB', [])\n    if '_atom_site.label_entity_id' in cif:\n      entities = atom_site_entities\n    else:\n      # If 
_atom_site.label_entity_id not set, use the asym_id -> entity_id map.\n      asym_to_entity = dict(\n          zip(\n              cif['_struct_asym.id'], cif['_struct_asym.entity_id'], strict=True\n          )\n      )\n      entities = string_array.remap(\n          cif.get_array('_atom_site.label_asym_id', dtype=object),\n          mapping=asym_to_entity,\n      )\n\n    entity_ids = []\n    entity_types = []\n    entity_poly_entity_ids = []\n    entity_poly_types = []\n    entity_poly_table_missing = '_entity_poly.entity_id' not in cif\n    for entity_id, group in itertools.groupby(\n        zip(entities, residues, group_pdb, strict=True), key=lambda e: e[0]\n    ):\n      _, entity_residues, entity_group_pdb = zip(*group, strict=True)\n      entity_type = _guess_entity_type(\n          chain_residues=entity_residues, atom_types=entity_group_pdb\n      )\n      entity_ids.append(entity_id)\n      entity_types.append(entity_type)\n\n      if entity_poly_table_missing and entity_type == mmcif_names.POLYMER_CHAIN:\n        polymer_type = mmcif_names.guess_polymer_type(entity_residues)\n        entity_poly_entity_ids.append(entity_id)\n        entity_poly_types.append(polymer_type)\n\n    update['_entity.id'] = entity_ids\n    update['_entity.type'] = entity_types\n    if entity_poly_table_missing:\n      update['_entity_poly.entity_id'] = entity_poly_entity_ids\n      update['_entity_poly.type'] = entity_poly_types\n\n  if '_atom_site.type_symbol' not in cif:\n    update['_atom_site.type_symbol'] = mmcif.get_or_infer_type_symbol(cif)\n\n  return update\n\n\ndef _maybe_add_missing_scheme_tables(\n    cif: mmcif.Mmcif,\n    res_starts: Sequence[int],\n    label_asym_ids: np.ndarray,\n    label_seq_ids: np.ndarray,\n    label_comp_ids: np.ndarray,\n    auth_seq_ids: np.ndarray,\n    pdb_ins_codes: np.ndarray,\n) -> Mapping[str, Sequence[str]]:\n  \"\"\"If missing, infers the scheme tables from the _atom_site table.\"\"\"\n  update = {}\n\n  
required_poly_seq_scheme_cols = (\n      '_pdbx_poly_seq_scheme.asym_id',\n      '_pdbx_poly_seq_scheme.pdb_seq_num',\n      '_pdbx_poly_seq_scheme.pdb_ins_code',\n      '_pdbx_poly_seq_scheme.seq_id',\n      '_pdbx_poly_seq_scheme.mon_id',\n      '_pdbx_poly_seq_scheme.pdb_strand_id',\n  )\n  if not all(col in cif for col in required_poly_seq_scheme_cols):\n    # Create a mask for atoms where each polymer residue starts.\n    entity_id_by_chain_id = dict(\n        zip(cif['_struct_asym.id'], cif['_struct_asym.entity_id'], strict=True)\n    )\n    chain_type_by_entity_id = dict(\n        zip(cif['_entity.id'], cif['_entity.type'], strict=True)\n    )\n    # Remap asym ID -> entity ID.\n    label_entity_id = string_array.remap(\n        label_asym_ids, mapping=entity_id_by_chain_id, inplace=False\n    )\n    # Remap entity ID -> chain type.\n    chain_type = string_array.remap(\n        label_entity_id, mapping=chain_type_by_entity_id, inplace=False\n    )\n    res_mask = np.zeros_like(label_seq_ids, dtype=bool)\n    res_mask[res_starts] = True\n    res_mask &= chain_type == mmcif_names.POLYMER_CHAIN\n\n    entity_poly_seq_cols = (\n        '_entity_poly_seq.entity_id',\n        '_entity_poly_seq.num',\n        '_entity_poly_seq.mon_id',\n    )\n    if all(col in cif for col in entity_poly_seq_cols):\n      # Use _entity_poly_seq if available.\n      poly_seq_num = cif.get_array('_entity_poly_seq.num', dtype=object)\n      poly_seq_mon_id = cif.get_array('_entity_poly_seq.mon_id', dtype=object)\n      poly_seq_entity_id = cif.get_array(\n          '_entity_poly_seq.entity_id', dtype=object\n      )\n      # We have to add the entity ID to the residue ID because multiple residues\n      # can share the same ID. 
This also allows using string_array.remap.\n      label_seq_id_to_auth_seq_id = dict(\n          zip(\n              np.char.add(label_entity_id[res_mask], label_seq_ids[res_mask]),\n              auth_seq_ids[res_mask],\n              strict=True,\n          )\n      )\n      scheme_pdb_seq_num = string_array.remap(\n          np.char.add(poly_seq_entity_id, poly_seq_num),\n          mapping=label_seq_id_to_auth_seq_id,\n          default_value='.',\n      )\n      label_seq_id_to_ins_code = dict(\n          zip(label_seq_ids[res_mask], pdb_ins_codes[res_mask], strict=True)\n      )\n      scheme_pdb_ins_code = string_array.remap(\n          poly_seq_num, mapping=label_seq_id_to_ins_code, default_value='.'\n      )\n\n      # The _entity_poly_seq table is entity-based, while _pdbx_poly_seq_scheme\n      # is chain-based. A single entity could mean multiple chains (asym_ids),\n      # we therefore need to replicate each entity for all of the chains.\n      scheme_asym_id = []\n      select = []\n      indices = np.arange(len(poly_seq_entity_id), dtype=np.int32)\n      for asym_id, entity_id in zip(\n          cif['_struct_asym.id'], cif['_struct_asym.entity_id'], strict=True\n      ):\n        entity_mask = poly_seq_entity_id == entity_id\n        select.extend(indices[entity_mask])\n        scheme_asym_id.extend([asym_id] * sum(entity_mask))\n\n      scheme_pdb_strand_id = string_array.remap(\n          np.array(scheme_asym_id, dtype=object),\n          mapping=mmcif.get_internal_to_author_chain_id_map(cif),\n          inplace=False,\n      )\n\n      update['_pdbx_poly_seq_scheme.asym_id'] = scheme_asym_id\n      update['_pdbx_poly_seq_scheme.pdb_strand_id'] = scheme_pdb_strand_id\n      update['_pdbx_poly_seq_scheme.pdb_seq_num'] = scheme_pdb_seq_num[select]\n      update['_pdbx_poly_seq_scheme.pdb_ins_code'] = scheme_pdb_ins_code[select]\n      update['_pdbx_poly_seq_scheme.seq_id'] = poly_seq_num[select]\n      update['_pdbx_poly_seq_scheme.mon_id'] = 
poly_seq_mon_id[select]\n    else:\n      # _entity_poly_seq not available, fallback to _atom_site.\n      res_asym_ids = label_asym_ids[res_mask]\n      res_strand_ids = string_array.remap(\n          array=res_asym_ids,\n          mapping=mmcif.get_internal_to_author_chain_id_map(cif),\n          inplace=False,\n      )\n      update['_pdbx_poly_seq_scheme.asym_id'] = res_asym_ids\n      update['_pdbx_poly_seq_scheme.pdb_strand_id'] = res_strand_ids\n      update['_pdbx_poly_seq_scheme.pdb_seq_num'] = auth_seq_ids[res_mask]\n      update['_pdbx_poly_seq_scheme.pdb_ins_code'] = pdb_ins_codes[res_mask]\n      update['_pdbx_poly_seq_scheme.seq_id'] = label_seq_ids[res_mask]\n      update['_pdbx_poly_seq_scheme.mon_id'] = label_comp_ids[res_mask]\n\n  required_nonpoly_scheme_cols = (\n      '_pdbx_nonpoly_scheme.mon_id',\n      '_pdbx_nonpoly_scheme.asym_id',\n      '_pdbx_nonpoly_scheme.pdb_seq_num',\n      '_pdbx_nonpoly_scheme.pdb_ins_code',\n  )\n  required_branch_scheme_cols = (\n      '_pdbx_branch_scheme.mon_id',\n      '_pdbx_branch_scheme.asym_id',\n      '_pdbx_branch_scheme.pdb_seq_num',\n  )\n\n  # Generate _pdbx_nonpoly_scheme only if both tables are missing.\n  if not (\n      all(col in cif for col in required_nonpoly_scheme_cols)\n      or all(col in cif for col in required_branch_scheme_cols)\n  ):\n    # To be strictly semantically correct, multi-residue ligands should be\n    # written in _pdbx_branch_scheme. 
However, Structure parsing handles\n    # correctly multi-residue ligands in _pdbx_nonpoly_scheme and the tables\n    # constructed here live only while parsing, hence this is unnecessary.\n    entity_id_by_chain_id = dict(\n        zip(cif['_struct_asym.id'], cif['_struct_asym.entity_id'], strict=True)\n    )\n    chain_type_by_entity_id = dict(\n        zip(cif['_entity.id'], cif['_entity.type'], strict=True)\n    )\n    # Remap asym ID -> entity ID.\n    chain_type = string_array.remap(\n        label_asym_ids, mapping=entity_id_by_chain_id, inplace=False\n    )\n    # Remap entity ID -> chain type.\n    string_array.remap(\n        chain_type, mapping=chain_type_by_entity_id, inplace=True\n    )\n    res_mask = np.zeros_like(label_seq_ids, dtype=bool)\n    res_mask[res_starts] = True\n    res_mask &= chain_type != mmcif_names.POLYMER_CHAIN\n\n    if not np.any(res_mask):\n      return update  # Shortcut: no non-polymer residues.\n\n    ins_codes = string_array.remap(\n        pdb_ins_codes[res_mask], mapping={'?': '.'}, inplace=False\n    )\n\n    update['_pdbx_nonpoly_scheme.asym_id'] = label_asym_ids[res_mask]\n    update['_pdbx_nonpoly_scheme.pdb_seq_num'] = auth_seq_ids[res_mask]\n    update['_pdbx_nonpoly_scheme.pdb_ins_code'] = ins_codes\n    update['_pdbx_nonpoly_scheme.mon_id'] = label_comp_ids[res_mask]\n\n  return update\n\n\ndef _get_chain_key_by_chain_id(\n    resolved_chain_ids: np.ndarray, struct_asym_chain_ids: np.ndarray\n) -> Mapping[str, int]:\n  \"\"\"Returns chain key for each chain ID respecting resolved chain ordering.\"\"\"\n  # Check that all chain IDs found in the (potentially filtered) _atom_site\n  # table are present in the _struct_asym table.\n  unique_resolved_chain_ids = set(resolved_chain_ids)\n  if not unique_resolved_chain_ids.issubset(set(struct_asym_chain_ids)):\n    unique_resolved_chain_ids = sorted(unique_resolved_chain_ids)\n    unique_struct_asym_chain_ids = sorted(set(struct_asym_chain_ids))\n    raise ValueError(\n     
   'Bad mmCIF: chain IDs in _atom_site.label_asym_id '\n        f'{unique_resolved_chain_ids} is not a subset of chain IDs in '\n        f'_struct_asym.id {unique_struct_asym_chain_ids}.'\n    )\n\n  resolved_mask = string_array.isin(\n      struct_asym_chain_ids, unique_resolved_chain_ids\n  )\n  # For all resolved chains, use the _atom_site order they appear in. E.g.\n  # resolved_chain_ids     = [B A   E D F]\n  # struct_asym_chain_ids  = [A B C D E F]\n  # consistent_chain_order = [B A C E D F]\n  # chain_keys             = [0 1 2 3 4 5]\n  consistent_chain_order = struct_asym_chain_ids.copy()\n  consistent_chain_order[resolved_mask] = resolved_chain_ids\n  return dict(zip(consistent_chain_order, range(len(struct_asym_chain_ids))))\n\n\ndef get_tables(\n    cif: mmcif.Mmcif,\n    fix_mse_residues: bool,\n    fix_arginines: bool,\n    fix_unknown_dna: bool,\n    include_water: bool,\n    include_other: bool,\n    model_id: str,\n) -> tuple[\n    structure_tables.Chains, structure_tables.Residues, structure_tables.Atoms\n]:\n  \"\"\"Returns chain, residue, and atom tables from a parsed mmcif.\n\n  Args:\n    cif: A parsed mmcif.Mmcif.\n    fix_mse_residues: See from_mmcif.\n    fix_arginines: See from_mmcif.\n    fix_unknown_dna: See from_mmcif.\n    include_water: See from_mmcif.\n    include_other: See from_mmcif.\n    model_id: A string defining which model ID to use. If set, only coordinates,\n      b-factors and occupancies for the given model are returned. If empty,\n      coordinates, b-factors and occupancies for all models are returned with a\n      leading dimension of num_models. 
Note that the model_id argument in\n      from_mmcif is an integer and has slightly different use (see from_mmcif).\n  \"\"\"\n  # Add any missing tables and columns we require for parsing.\n  if cif_update := _generate_required_tables_if_missing(cif):\n    cif = cif.copy_and_update(cif_update)\n\n  # The wanted_chain_ids include chain IDs that are not necessarily present in\n  # the _atom_site table, because we want to be able to read Structures with\n  # chains consisting of only unresolved residues.\n  atom_site_all_models, wanted_chain_ids, layout = mmcif_utils.filter(\n      cif,\n      include_nucleotides=True,\n      include_ligands=True,\n      include_water=include_water,\n      include_other=include_other,\n      model_id=model_id,\n  )\n  atom_site_first_model = atom_site_all_models[0]\n\n  # Get atom information from the _atom_site table.\n  def _first_model_string_array(col: str) -> np.ndarray:\n    return cif.get_array(col, dtype=object, gather=atom_site_first_model)\n\n  def _requested_models_float_array(col: str) -> np.ndarray:\n    if not model_id:\n      # Return data for all models with a leading dimension of num_models.\n      return cif.get_array(col, dtype=np.float32, gather=atom_site_all_models)\n    else:\n      # Return data only for the single requested model.\n      return cif.get_array(col, dtype=np.float32, gather=atom_site_first_model)\n\n  # These columns are the same for all models, fetch them just for the 1st one.\n  label_comp_ids = _first_model_string_array('_atom_site.label_comp_id')\n  label_asym_ids = _first_model_string_array('_atom_site.label_asym_id')\n  label_seq_ids = _first_model_string_array('_atom_site.label_seq_id')\n  label_atom_ids = _first_model_string_array('_atom_site.label_atom_id')\n  if '_atom_site.auth_seq_id' in cif:\n    auth_seq_ids = _first_model_string_array('_atom_site.auth_seq_id')\n  else:\n    auth_seq_ids = label_seq_ids  # auth_seq_id unset, fallback to label_seq_id.\n  type_symbols = 
_first_model_string_array('_atom_site.type_symbol')\n  pdbx_pdb_ins_codes = _first_model_string_array('_atom_site.pdbx_PDB_ins_code')\n\n  # These columns are different for all models, fetch them as requested.\n  atom_x = _requested_models_float_array('_atom_site.Cartn_x')\n  atom_y = _requested_models_float_array('_atom_site.Cartn_y')\n  atom_z = _requested_models_float_array('_atom_site.Cartn_z')\n  atom_b_factor = _requested_models_float_array('_atom_site.B_iso_or_equiv')\n  atom_occupancy = _requested_models_float_array('_atom_site.occupancy')\n\n  # Make sure the scheme (residue) tables exist in case they are not present.\n  if cif_update := _maybe_add_missing_scheme_tables(\n      cif,\n      res_starts=layout.residue_starts(),\n      label_asym_ids=label_asym_ids,\n      label_seq_ids=label_seq_ids,\n      label_comp_ids=label_comp_ids,\n      auth_seq_ids=auth_seq_ids,\n      pdb_ins_codes=pdbx_pdb_ins_codes,\n  ):\n    cif = cif.copy_and_update(cif_update)\n\n  # Fix common issues found in mmCIF files, like swapped arginine NH atoms.\n  mmcif_utils.fix_residues(\n      layout,\n      comp_id=label_comp_ids,\n      atom_id=label_atom_ids,\n      atom_x=atom_x[0] if not model_id else atom_x,\n      atom_y=atom_y[0] if not model_id else atom_y,\n      atom_z=atom_z[0] if not model_id else atom_z,\n      fix_arg=fix_arginines,\n  )\n\n  # Get keys for chains in the order they appear in _atom_site while also\n  # dealing with empty chains.\n  resolved_chain_ids = label_asym_ids[layout.chain_starts()]\n  struct_asym_chain_ids = cif.get_array('_struct_asym.id', dtype=object)\n\n  chain_key_by_chain_id = _get_chain_key_by_chain_id(\n      resolved_chain_ids=resolved_chain_ids,\n      struct_asym_chain_ids=struct_asym_chain_ids,\n  )\n  entity_id_by_chain_id = dict(\n      zip(struct_asym_chain_ids, cif['_struct_asym.entity_id'], strict=True)\n  )\n  entity_description = cif.get(\n      '_entity.pdbx_description', ['?'] * len(cif['_entity.id'])\n  )\n  
entity_desc_by_entity_id = dict(\n      zip(cif['_entity.id'], entity_description, strict=True)\n  )\n  chain_type_by_entity_id = mmcif.get_chain_type_by_entity_id(cif)\n  auth_asym_id_by_chain_id = mmcif.get_internal_to_author_chain_id_map(cif)\n\n  chain_res_builder = _ChainResBuilder(\n      chain_key_by_chain_id=chain_key_by_chain_id,\n      entity_id_by_chain_id=entity_id_by_chain_id,\n      chain_type_by_entity_id=chain_type_by_entity_id,\n      entity_desc_by_entity_id=entity_desc_by_entity_id,\n      fix_mse_residues=fix_mse_residues,\n      fix_unknown_dna=fix_unknown_dna,\n  )\n\n  # Collect data for polymer chain and residue tables. _pdbx_poly_seq_scheme is\n  # guaranteed to be present thanks to _maybe_add_missing_scheme_tables.\n  def _get_poly_seq_scheme_col(col: str) -> np.ndarray:\n    return cif.get_array(key=f'_pdbx_poly_seq_scheme.{col}', dtype=object)\n\n  poly_seq_asym_ids = _get_poly_seq_scheme_col('asym_id')\n  poly_seq_pdb_seq_nums = _get_poly_seq_scheme_col('pdb_seq_num')\n  poly_seq_seq_ids = _get_poly_seq_scheme_col('seq_id')\n  poly_seq_mon_ids = _get_poly_seq_scheme_col('mon_id')\n  poly_seq_pdb_strand_ids = _get_poly_seq_scheme_col('pdb_strand_id')\n  poly_seq_pdb_ins_codes = _get_poly_seq_scheme_col('pdb_ins_code')\n  string_array.remap(\n      poly_seq_pdb_ins_codes, mapping=_INSERTION_CODE_REMAP, inplace=True\n  )\n\n  # We resolved alt-locs earlier for the atoms table. In cases of heterogeneous\n  # residues (a residue with an alt-loc that is of different residue type), we\n  # need to also do the same resolution in the residues table. 
Compute a mask\n  # for the residues that were selected in the atoms table.\n  poly_seq_mask = mmcif_utils.selected_polymer_residue_mask(\n      layout=layout,\n      atom_site_label_asym_ids=label_asym_ids[layout.residue_starts()],\n      atom_site_label_seq_ids=label_seq_ids[layout.residue_starts()],\n      atom_site_label_comp_ids=label_comp_ids[layout.residue_starts()],\n      poly_seq_asym_ids=poly_seq_asym_ids,\n      poly_seq_seq_ids=poly_seq_seq_ids,\n      poly_seq_mon_ids=poly_seq_mon_ids,\n  )\n\n  if not include_other and poly_seq_mask:\n    # Mask filtered-out residues so that they are not treated as missing.\n    # Instead, we don't want them included in the chains/residues tables at all.\n    keep_mask = string_array.isin(poly_seq_asym_ids, wanted_chain_ids)\n    poly_seq_mask &= keep_mask\n\n  chain_res_builder.add_residues(\n      chain_ids=poly_seq_asym_ids[poly_seq_mask],\n      chain_auth_asym_ids=poly_seq_pdb_strand_ids[poly_seq_mask],\n      res_ids=poly_seq_seq_ids[poly_seq_mask].astype(np.int32),\n      res_names=poly_seq_mon_ids[poly_seq_mask],\n      res_auth_seq_ids=poly_seq_pdb_seq_nums[poly_seq_mask],\n      res_ins_codes=poly_seq_pdb_ins_codes[poly_seq_mask],\n  )\n\n  # Collect data for ligand chain and residue tables. 
_pdbx_nonpoly_scheme\n  # could be empty/unset if there are only branched ligands.\n  def _get_nonpoly_scheme_col(col: str) -> np.ndarray:\n    key = f'_pdbx_nonpoly_scheme.{col}'\n    if f'_pdbx_nonpoly_scheme.{col}' in cif:\n      return cif.get_array(key=key, dtype=object)\n    else:\n      return np.array([], dtype=object)\n\n  nonpoly_asym_ids = _get_nonpoly_scheme_col('asym_id')\n  nonpoly_auth_seq_ids = _get_nonpoly_scheme_col('pdb_seq_num')\n  nonpoly_pdb_ins_codes = _get_nonpoly_scheme_col('pdb_ins_code')\n  nonpoly_mon_ids = _get_nonpoly_scheme_col('mon_id')\n  nonpoly_auth_asym_id = string_array.remap(\n      nonpoly_asym_ids, mapping=auth_asym_id_by_chain_id, inplace=False\n  )\n\n  def _get_branch_scheme_col(col: str) -> np.ndarray:\n    key = f'_pdbx_branch_scheme.{col}'\n    if f'_pdbx_branch_scheme.{col}' in cif:\n      return cif.get_array(key=key, dtype=object)\n    else:\n      return np.array([], dtype=object)\n\n  branch_asym_ids = _get_branch_scheme_col('asym_id')\n  branch_auth_seq_ids = _get_branch_scheme_col('pdb_seq_num')\n  branch_pdb_ins_codes = _get_branch_scheme_col('pdb_ins_code')\n  branch_mon_ids = _get_branch_scheme_col('mon_id')\n  branch_auth_asym_id = string_array.remap(\n      branch_asym_ids, mapping=auth_asym_id_by_chain_id, inplace=False\n  )\n\n  if branch_asym_ids.size > 0 and branch_pdb_ins_codes.size == 0:\n    branch_pdb_ins_codes = np.array(['.'] * branch_asym_ids.size, dtype=object)\n\n  # Compute the heterogeneous residue masks as above, this time for ligands.\n  nonpoly_mask, branch_mask = mmcif_utils.selected_ligand_residue_mask(\n      layout=layout,\n      atom_site_label_asym_ids=label_asym_ids[layout.residue_starts()],\n      atom_site_label_seq_ids=label_seq_ids[layout.residue_starts()],\n      atom_site_auth_seq_ids=auth_seq_ids[layout.residue_starts()],\n      atom_site_label_comp_ids=label_comp_ids[layout.residue_starts()],\n      atom_site_pdbx_pdb_ins_codes=pdbx_pdb_ins_codes[layout.residue_starts()],\n   
   nonpoly_asym_ids=nonpoly_asym_ids,\n      nonpoly_auth_seq_ids=nonpoly_auth_seq_ids,\n      nonpoly_pdb_ins_codes=nonpoly_pdb_ins_codes,\n      nonpoly_mon_ids=nonpoly_mon_ids,\n      branch_asym_ids=branch_asym_ids,\n      branch_auth_seq_ids=branch_auth_seq_ids,\n      branch_pdb_ins_codes=branch_pdb_ins_codes,\n      branch_mon_ids=branch_mon_ids,\n  )\n\n  if not include_water:\n    if nonpoly_mask:\n      nonpoly_mask &= (nonpoly_mon_ids != 'HOH') & (nonpoly_mon_ids != 'DOD')\n    if branch_mask:\n      # Fix for bad mmCIFs that have water in the branch scheme table.\n      branch_mask &= (branch_mon_ids != 'HOH') & (branch_mon_ids != 'DOD')\n\n  string_array.remap(\n      pdbx_pdb_ins_codes, mapping=_INSERTION_CODE_REMAP, inplace=True\n  )\n  string_array.remap(\n      nonpoly_pdb_ins_codes, mapping=_INSERTION_CODE_REMAP, inplace=True\n  )\n  string_array.remap(\n      branch_pdb_ins_codes, mapping=_INSERTION_CODE_REMAP, inplace=True\n  )\n\n  def _ligand_residue_ids(chain_ids: np.ndarray) -> np.ndarray:\n    \"\"\"Computes internal residue ID for ligand residues that don't have it.\"\"\"\n\n    # E.g. 
chain_ids=[A, A, A, B, C, C, D, D, D] -> [1, 2, 3, 1, 1, 2, 1, 2, 3].\n    indices = np.arange(chain_ids.size, dtype=np.int32)\n    return (indices + 1) - np.maximum.accumulate(\n        indices * (chain_ids != np.roll(chain_ids, 1))\n    )\n\n  branch_residue_ids = _ligand_residue_ids(branch_asym_ids[branch_mask])\n  nonpoly_residue_ids = _ligand_residue_ids(nonpoly_asym_ids[nonpoly_mask])\n\n  chain_res_builder.add_residues(\n      chain_ids=branch_asym_ids[branch_mask],\n      chain_auth_asym_ids=branch_auth_asym_id[branch_mask],\n      res_ids=branch_residue_ids,\n      res_names=branch_mon_ids[branch_mask],\n      res_auth_seq_ids=branch_auth_seq_ids[branch_mask],\n      res_ins_codes=branch_pdb_ins_codes[branch_mask],\n  )\n\n  chain_res_builder.add_residues(\n      chain_ids=nonpoly_asym_ids[nonpoly_mask],\n      chain_auth_asym_ids=nonpoly_auth_asym_id[nonpoly_mask],\n      res_ids=nonpoly_residue_ids,\n      res_names=nonpoly_mon_ids[nonpoly_mask],\n      res_auth_seq_ids=nonpoly_auth_seq_ids[nonpoly_mask],\n      res_ins_codes=nonpoly_pdb_ins_codes[nonpoly_mask],\n  )\n\n  chains = chain_res_builder.make_chains_table()\n  residues = chain_res_builder.make_residues_table()\n\n  # Construct foreign residue keys for the atoms table.\n  res_ends = np.array(layout.residues(), dtype=np.int32)\n  res_starts = np.array(layout.residue_starts(), dtype=np.int32)\n  res_lengths = res_ends - res_starts\n\n  # Check just for HOH, DOD can be part e.g. 
of hydroxycysteine.\n  if include_water:\n    res_chain_types = chains.apply_array_to_column(\n        column_name='type', arr=residues.chain_key\n    )\n    water_mask = res_chain_types != mmcif_names.WATER\n    if 'HOH' in set(residues.name[water_mask]):\n      raise ValueError('Bad mmCIF file: non-water entity has water molecules.')\n  else:\n    # Include resolved and unresolved residues.\n    if 'HOH' in set(residues.name) | set(label_comp_ids[res_starts]):\n      raise ValueError('Bad mmCIF file: non-water entity has water molecules.')\n\n  atom_chain_key = string_array.remap(\n      label_asym_ids, mapping=chain_res_builder.chain_key_by_chain_id\n  ).astype(int)\n\n  # If any of the residue lookups failed, the mmCIF is corrupted.\n  try:\n    atom_res_key_per_res = string_array.remap_multiple(\n        (\n            label_asym_ids[res_starts],\n            auth_seq_ids[res_starts],\n            label_comp_ids[res_starts],\n            pdbx_pdb_ins_codes[res_starts],\n        ),\n        mapping=chain_res_builder.key_for_res,\n    )\n  except KeyError as e:\n    raise ValueError(\n        'Lookup for the following atom from the _atom_site table failed: '\n        f'(label_asym_id, auth_seq_id, res_name, ins_code)={e}. This typically '\n        'indicates that the _pdbx_poly_seq_scheme, _pdbx_nonpoly_scheme, or '\n        '_pdbx_branch_scheme tables do not have data for all residues present '\n        'in the _atom_site table. 
It could also be due to a known issue with '\n        'a small number of multi-model mmCIFs.'\n    ) from e\n\n  # The residue ID will be shared for all atoms within that residue.\n  atom_res_key = np.repeat(atom_res_key_per_res, repeats=res_lengths)\n\n  if fix_mse_residues:\n    met_residues_mask = (residues.name == 'MET')[atom_res_key]\n    unfixed_mse_selenium_mask = met_residues_mask & (label_atom_ids == 'SE')\n    label_atom_ids[unfixed_mse_selenium_mask] = 'SD'\n    type_symbols[unfixed_mse_selenium_mask] = 'S'\n\n  atoms = structure_tables.Atoms(\n      key=atom_site_first_model,\n      chain_key=atom_chain_key,\n      res_key=atom_res_key,\n      name=label_atom_ids,\n      element=type_symbols,\n      x=atom_x,\n      y=atom_y,\n      z=atom_z,\n      b_factor=atom_b_factor,\n      occupancy=atom_occupancy,\n  )\n\n  return chains, residues, atoms\n\n\ndef from_atom_arrays(\n    *,\n    res_id: np.ndarray,\n    name: str = 'unset',\n    release_date: datetime.date | None = None,\n    resolution: float | None = None,\n    structure_method: str | None = None,\n    all_residues: Mapping[str, Sequence[tuple[str, int]]] | None = None,\n    bioassembly_data: bioassemblies.BioassemblyData | None = None,\n    chemical_components_data: (\n        struc_chem_comps.ChemicalComponentsData | None\n    ) = None,\n    bond_table: structure_tables.Bonds | None = None,\n    chain_id: np.ndarray | None = None,\n    chain_type: np.ndarray | None = None,\n    res_name: np.ndarray | None = None,\n    atom_key: np.ndarray | None = None,\n    atom_name: np.ndarray | None = None,\n    atom_element: np.ndarray | None = None,\n    atom_x: np.ndarray | None = None,\n    atom_y: np.ndarray | None = None,\n    atom_z: np.ndarray | None = None,\n    atom_b_factor: np.ndarray | None = None,\n    atom_occupancy: np.ndarray | None = None,\n) -> structure.Structure:\n  \"\"\"Returns a Structure constructed from atom array level data.\n\n  All fields except res_id are optional, 
all array fields consist of a\n  value for each atom in the structure - so residue and chain values should hold\n  the same value for each atom in the chain or residue. Fields which are not\n  defined are filled with default values.\n\n  Validation is performed by the Structure constructor where possible - but\n  author_naming scheme and all_residues must be checked in this function.\n\n  It is not possible to construct structures with chains that do not contain\n  any resolved residues using this function. If this is necessary, use the\n  structure.Structure constructor directly.\n\n  Args:\n    res_id: Integer array of shape [num_atom]. The unique residue identifier for\n      each residue. mmCIF field - _atom_site.label_seq_id.\n    name: The name of the structure. E.g. a PDB ID.\n    release_date: The release date of the structure as a `datetime.date`.\n    resolution: The resolution of the structure in Angstroms.\n    structure_method: The method used to solve this structure's coordinates.\n    all_residues: An optional mapping from each chain ID (i.e. label_asym_id) to\n      a sequence of (label_comp_id, label_seq_id) tuples, one per residue. This\n      can contain residues that aren't present in the atom arrays. This is\n      common in experimental data where some residues are not resolved but are\n      known to be present.\n    bioassembly_data: An optional instance of bioassembly.BioassemblyData. If\n      present then a new Structure representing a specific bioassembly can be\n      extracted using `Structure.generate_bioassembly(assembly_id)`.\n    chemical_components_data: An optional instance of ChemicalComponentsData.\n      Its content will be used for providing metadata about chemical components\n      in this Structure instance. 
If not specified information will be retrieved\n      from the standard chemical component dictionary (CCD, for more details see\n      https://www.wwpdb.org/data/ccd).\n    bond_table: A table representing manually-specified bonds. This corresponds\n      to the _struct_conn table in an mmCIF. Atoms are identified by their key,\n      as specified by the atom_key column. If this table is provided then the\n      atom_key column must also be defined.\n    chain_id: String array of shape [num_atom] of unique chain identifiers.\n      mmCIF field - _atom_site.label_asym_id.\n    chain_type: String array of shape [num_atom]. The molecular type of the\n      current chain (e.g. polyribonucleotide). mmCIF field - _entity_poly.type\n      OR _entity.type (for non-polymers).\n    res_name: String array of shape [num_atom]. The name of each residue,\n      typically a 3 letter string for polypeptides or 1-2 letter strings for\n      polynucleotides. mmCIF field - _atom_site.label_comp_id.\n    atom_key: A unique sorted integer array, used only by the bonds table to\n      identify the atoms participating in each bond. If the bonds table is\n      specified then this column must be non-None.\n    atom_name: String array of shape [num_atom]. The name of each atom (e.g. CA,\n      O2', etc.). mmCIF field - _atom_site.label_atom_id.\n    atom_element: String array of shape [num_atom]. The element type of each\n      atom (e.g. C, O, N, etc.). mmCIF field - _atom_site.type_symbol.\n    atom_x: Float array of shape [..., num_atom] of atom x coordinates. May have\n      arbitrary leading dimensions, provided that these are consistent across\n      all coordinate fields.\n    atom_y: Float array of shape [..., num_atom] of atom y coordinates. May have\n      arbitrary leading dimensions, provided that these are consistent across\n      all coordinate fields.\n    atom_z: Float array of shape [..., num_atom] of atom z coordinates. 
May have\n      arbitrary leading dimensions, provided that these are consistent across\n      all coordinate fields.\n    atom_b_factor: Float array of shape [..., num_atom] or [num_atom] of atom\n      b-factors or equivalent. If there are no extra leading dimensions then\n      these values are assumed to apply to all coordinates for a given atom. If\n      there are leading dimensions then these must match those used by the\n      coordinate fields.\n    atom_occupancy: Float array of shape [..., num_atom] or [num_atom] of atom\n      occupancies or equivalent. If there are no extra leading dimensions then\n      these values are assumed to apply to all coordinates for a given atom. If\n      there are leading dimensions then these must match those used by the\n      coordinate fields.\n  \"\"\"\n\n  atoms, residues, chains = structure_tables.tables_from_atom_arrays(\n      res_id=res_id,\n      all_residues=all_residues,\n      chain_id=chain_id,\n      chain_type=chain_type,\n      res_name=res_name,\n      atom_key=atom_key,\n      atom_name=atom_name,\n      atom_element=atom_element,\n      atom_x=atom_x,\n      atom_y=atom_y,\n      atom_z=atom_z,\n      atom_b_factor=atom_b_factor,\n      atom_occupancy=atom_occupancy,\n  )\n\n  return structure.Structure(\n      name=name,\n      release_date=release_date,\n      resolution=resolution,\n      structure_method=structure_method,\n      bioassembly_data=bioassembly_data,\n      chemical_components_data=chemical_components_data,\n      atoms=atoms,\n      chains=chains,\n      residues=residues,\n      bonds=bond_table or structure_tables.Bonds.make_empty(),\n  )\n\n\ndef _guess_entity_type(\n    chain_residues: Collection[str], atom_types: Collection[str]\n) -> str:\n  \"\"\"Guess the entity type (polymer/non-polymer/water) based on residues/atoms.\n\n  We treat both arguments as unordered collections since we care only whether\n  all elements satisfy some conditions. 
The chain_residues can be either\n  grouped by residue (length num_res), or it can be raw (length num_atoms).\n  Atom type is unique for each atom in a residue, so don't group atom_types.\n\n  Args:\n    chain_residues: A sequence of full residue name (1-letter for DNA, 2-letters\n      for RNA, 3 for protein). The _atom_site.label_comp_id column in mmCIF.\n    atom_types: Atom type: ATOM or HETATM. The _atom_site.group_PDB column in\n      mmCIF.\n\n  Returns:\n    One of polymer/non-polymer/water based on the following criteria:\n    * If all atoms are HETATMs and all residues are water -> water.\n    * If all atoms are HETATMs and not all residues are water -> non-polymer.\n    * Otherwise -> polymer.\n  \"\"\"\n  if not chain_residues or not atom_types:\n    raise ValueError(\n        f'chain_residues (len {len(chain_residues)}) and atom_types (len '\n        f'{len(atom_types)}) must be both non-empty. Got: {chain_residues=} '\n        f'and {atom_types=}'\n    )\n\n  if all(a == 'HETATM' for a in atom_types):\n    if all(c in residue_names.WATER_TYPES for c in chain_residues):\n      return mmcif_names.WATER\n    return mmcif_names.NON_POLYMER_CHAIN\n  return mmcif_names.POLYMER_CHAIN\n"
  },
  {
    "path": "src/alphafold3/structure/sterics.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Functions relating to spatial locations of atoms within a structure.\"\"\"\n\nfrom collections.abc import Collection, Sequence\n\nfrom alphafold3 import structure\nfrom alphafold3.structure import mmcif\nimport numpy as np\nimport scipy\n\n\ndef _make_atom_has_clash_mask(\n    kd_query_result: np.ndarray,\n    struc: structure.Structure,\n    ignore_chains: Collection[str],\n) -> np.ndarray:\n  \"\"\"Returns a boolean NumPy array representing whether each atom has a clash.\n\n  Args:\n    kd_query_result: NumPy array containing N-atoms arrays, each array\n      containing indices to atoms that clash with the N'th atom.\n    struc: Structure over which clashes were detected.\n    ignore_chains: Collection of chains that should not be considered clashing.\n      A boolean NumPy array of length N atoms.\n  \"\"\"\n  atom_is_clashing = np.zeros((struc.num_atoms,), dtype=bool)\n  for atom_index, clashes in enumerate(kd_query_result):\n    chain_i = struc.chain_id[atom_index]\n    if chain_i in ignore_chains:\n      continue\n    islig_i = struc.is_ligand_mask[atom_index]\n    for clashing_atom_index in clashes:\n      chain_c = struc.chain_id[clashing_atom_index]\n      if chain_c in ignore_chains:\n        continue\n      islig_c = struc.is_ligand_mask[clashing_atom_index]\n      if (\n          clashing_atom_index == atom_index\n          or chain_i == chain_c\n          or islig_i != islig_c\n      ):\n        # Ignore 
clashes within chain or between ligand and polymer.\n        continue\n      atom_is_clashing[atom_index] = True\n  return atom_is_clashing\n\n\ndef find_clashing_chains(\n    struc: structure.Structure,\n    clash_thresh_angstrom: float = 1.7,\n    clash_thresh_fraction: float = 0.3,\n) -> Sequence[str]:\n  \"\"\"Finds chains that clash with others.\n\n  Clashes are defined by polymer backbone atoms and all ligand atoms.\n  Ligand-polymer clashes are not dropped.\n\n  Will not find clashes if all coordinates are 0. Coordinates are all 0s if\n  the structure is generated from sequences only, as done for inference in\n  dendro for example.\n\n  Args:\n    struc: The structure defining the chains and atom positions.\n    clash_thresh_angstrom: Below this distance, atoms are considered clashing.\n    clash_thresh_fraction: Chains with more than this fraction of their atoms\n      considered clashing will be dropped. This value should be in the range (0,\n      1].\n\n  Returns:\n    A sequence of chain ids for chains that clash.\n\n  Raises:\n    ValueError: If `clash_thresh_fraction` is not in range (0,1].\n  \"\"\"\n  if not 0 < clash_thresh_fraction <= 1:\n    raise ValueError('clash_thresh_fraction must be in range (0,1]')\n\n  struc_backbone = struc.filter_polymers_to_single_atom_per_res()\n  if struc_backbone.num_chains == 0:\n    return []\n\n  # If the coordinates are all 0, do not search for clashes.\n  if not np.any(struc_backbone.coords):\n    return []\n\n  coord_kdtree = scipy.spatial.cKDTree(struc_backbone.coords)\n\n  # For each atom coordinate, find all atoms within the clash thresh radius.\n  clashing_per_atom = coord_kdtree.query_ball_point(\n      struc_backbone.coords, r=clash_thresh_angstrom\n  )\n  chain_ids = struc_backbone.chains\n  if struc_backbone.atom_occupancy is not None:\n    chain_occupancy = np.array([\n        np.mean(struc_backbone.atom_occupancy[start:end])\n        for start, end in struc_backbone.iter_chain_ranges()\n    ])\n  
else:\n    chain_occupancy = None\n\n  # Remove chains until no more significant clashing.\n  chains_to_remove = set()\n  for _ in range(len(chain_ids)):\n    # Calculate maximally clashing.\n    atom_has_clash = _make_atom_has_clash_mask(\n        clashing_per_atom, struc_backbone, chains_to_remove\n    )\n    clashes_per_chain = np.array([\n        atom_has_clash[start:end].mean()\n        for start, end in struc_backbone.iter_chain_ranges()\n    ])\n    max_clash = np.max(clashes_per_chain)\n    if max_clash <= clash_thresh_fraction:\n      # None of the remaining chains exceed the clash fraction threshold, so\n      # we can exit.\n      break\n\n    # Greedily remove worst with the lowest occupancy.\n    most_clashes = np.nonzero(clashes_per_chain == max_clash)[0]\n    if chain_occupancy is not None:\n      occupancy_clashing = chain_occupancy[most_clashes]\n      last_lowest_occupancy = (\n          len(occupancy_clashing) - np.argmin(occupancy_clashing[::-1]) - 1\n      )\n      worst_and_last = most_clashes[last_lowest_occupancy]\n    else:\n      worst_and_last = most_clashes[-1]\n\n    chains_to_remove.add(chain_ids[worst_and_last])\n\n  return sorted(chains_to_remove, key=mmcif.str_id_to_int_id)\n"
  },
  {
    "path": "src/alphafold3/structure/structure.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Structure class for representing and processing molecular structures.\"\"\"\n\nimport collections\nfrom collections.abc import Callable, Collection, Iterable, Iterator, Mapping, Sequence, Set\nimport dataclasses\nimport datetime\nimport enum\nimport functools\nimport itertools\nimport typing\nfrom typing import Any, ClassVar, Final, Literal, NamedTuple, Self, TypeAlias, TypeVar\n\nfrom alphafold3.constants import atom_types\nfrom alphafold3.constants import chemical_components\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.constants import residue_names\nfrom alphafold3.cpp import membership\nfrom alphafold3.cpp import string_array\nfrom alphafold3.structure import bioassemblies\nfrom alphafold3.structure import chemical_components as struc_chem_comps\nfrom alphafold3.structure import mmcif\nfrom alphafold3.structure import structure_tables\nfrom alphafold3.structure import table\nimport numpy as np\n\n# Controls the default number of decimal places for coordinates when writing to\n# mmCIF.\n_COORDS_DECIMAL_PLACES: Final[int] = 3\n\n\n@enum.unique\nclass CascadeDelete(enum.Enum):\n  NONE = 0\n  FULL = 1\n  CHAINS = 2\n\n\n# See www.python.org/dev/peps/pep-0484/#support-for-singleton-types-in-unions\nclass _UnsetSentinel(enum.Enum):\n  UNSET = object()\n\n\n_UNSET = _UnsetSentinel.UNSET\n\n\nclass Bond(NamedTuple):\n  \"\"\"Describes a bond between two atoms.\"\"\"\n\n  from_atom: Mapping[str, str | int 
| float | np.ndarray]\n  dest_atom: Mapping[str, str | int | float | np.ndarray]\n  bond_info: Mapping[str, str | int]\n\n\nclass MissingAtomError(Exception):\n  \"\"\"Error raised when an atom is missing during alignment.\"\"\"\n\n\nclass MissingAuthorResidueIdError(Exception):\n  \"\"\"Raised when author naming data is missing for a residue.\n\n  This can occur in certain edge cases where missing residue data is provided\n  without also providing author IDs for those missing residues.\n  \"\"\"\n\n\n# AllResidues is a mapping from label_asym_id to a sequence of (label_comp_id,\n# label_seq_id) pairs. These represent the full sequence including residues\n# that might be missing (e.g. unresolved residues in X-ray data).\nAllResidues: TypeAlias = Mapping[str, Sequence[tuple[str, int]]]\nAuthorNamingScheme: TypeAlias = structure_tables.AuthorNamingScheme\n\n\n# External residue ID given to missing residues that don't have an ID\n# already provided. In mmCIFs this data is found in _pdbx_poly_seq_scheme.\nMISSING_AUTH_SEQ_ID: Final[str] = '.'\n\n\n# Maps from structure fields to column names in the relevant table.\nCHAIN_FIELDS: Final[Mapping[str, str]] = {\n    'chain_id': 'id',\n    'chain_type': 'type',\n    'chain_auth_asym_id': 'auth_asym_id',\n    'chain_entity_id': 'entity_id',\n    'chain_entity_desc': 'entity_desc',\n}\n\n\nRESIDUE_FIELDS: Final[Mapping[str, str]] = {\n    'res_id': 'id',\n    'res_name': 'name',\n    'res_auth_seq_id': 'auth_seq_id',\n    'res_insertion_code': 'insertion_code',\n}\n\nATOM_FIELDS: Final[Mapping[str, str]] = {\n    'atom_name': 'name',\n    'atom_element': 'element',\n    'atom_x': 'x',\n    'atom_y': 'y',\n    'atom_z': 'z',\n    'atom_b_factor': 'b_factor',\n    'atom_occupancy': 'occupancy',\n    'atom_key': 'key',\n}\n\n# Fields in structure.\nARRAY_FIELDS = frozenset({\n    'atom_b_factor',\n    'atom_element',\n    'atom_key',\n    'atom_name',\n    'atom_occupancy',\n    'atom_x',\n    'atom_y',\n    'atom_z',\n    
'chain_id',\n    'chain_type',\n    'res_id',\n    'res_name',\n})\n\nGLOBAL_FIELDS = frozenset({\n    'name',\n    'release_date',\n    'resolution',\n    'structure_method',\n    'bioassembly_data',\n    'chemical_components_data',\n})\n\n# Fields which can be updated in copy_and_update.\n_UPDATEABLE_FIELDS: Final[Set[str]] = frozenset({\n    'all_residues',\n    'atom_b_factor',\n    'atom_element',\n    'atom_key',\n    'atom_name',\n    'atom_occupancy',\n    'atom_x',\n    'atom_y',\n    'atom_z',\n    'bioassembly_data',\n    'bonds',\n    'chain_id',\n    'chain_type',\n    'chemical_components_data',\n    'name',\n    'release_date',\n    'res_id',\n    'res_name',\n    'resolution',\n    'structure_method',\n})\n\n\ndef fix_non_standard_polymer_residues(\n    res_names: np.ndarray, chain_type: str\n) -> np.ndarray:\n  \"\"\"Remaps residue names to the closest standard protein/RNA/DNA residue.\n\n  If residue name is already a standard type, it is not altered.\n  If a match cannot be found, returns 'UNK' for protein chain residues and 'N'\n    for RNA/DNA chain residues.\n\n  Args:\n     res_names: A numpy array of string residue names (CCD monomer codes). 
E.g.\n       'ARG' (protein), 'DT' (DNA), 'N' (RNA).\n     chain_type: The type of the chain, must be PROTEIN_CHAIN, RNA_CHAIN or\n       DNA_CHAIN.\n\n  Returns:\n    An array remapped so that its elements are all from\n    PROTEIN_TYPES_WITH_UNKNOWN | RNA_TYPES | DNA_TYPES | {'N'}.\n\n  Raises:\n    ValueError: If chain_type not in PEPTIDE_CHAIN_TYPES or\n      {OTHER_CHAIN, RNA_CHAIN, DNA_CHAIN, DNA_RNA_HYBRID_CHAIN}.\n  \"\"\"\n  # Map to one letter code, then back to common res_names.\n  one_letter_codes = string_array.remap(\n      res_names, mapping=residue_names.CCD_NAME_TO_ONE_LETTER, default_value='X'\n  )\n\n  if (\n      chain_type in mmcif_names.PEPTIDE_CHAIN_TYPES\n      or chain_type == mmcif_names.OTHER_CHAIN\n  ):\n    mapping = residue_names.PROTEIN_COMMON_ONE_TO_THREE\n    default_value = 'UNK'\n  elif chain_type == mmcif_names.RNA_CHAIN:\n    # RNA has single-letter CCD monomer codes.\n    mapping = {r: r for r in residue_names.RNA_TYPES}\n    default_value = 'N'\n  elif chain_type == mmcif_names.DNA_CHAIN:\n    mapping = residue_names.DNA_COMMON_ONE_TO_TWO\n    default_value = 'N'\n  elif chain_type == mmcif_names.DNA_RNA_HYBRID_CHAIN:\n    mapping = {r: r for r in residue_names.NUCLEIC_TYPES_WITH_UNKNOWN}\n    default_value = 'N'\n  else:\n    raise ValueError(f'Expected a protein/DNA/RNA chain but got {chain_type}')\n\n  return string_array.remap(\n      one_letter_codes, mapping=mapping, default_value=default_value\n  )\n\n\ndef _get_change_indices(arr: np.ndarray) -> np.ndarray:\n  if arr.size == 0:\n    return np.array([], dtype=np.int32)\n  else:\n    changing_idxs = np.where(arr[1:] != arr[:-1])[0] + 1\n    return np.concatenate(([0], changing_idxs), axis=0)\n\n\ndef _unpack_filter_predicates(\n    predicate_by_field_name: Mapping[str, table.FilterPredicate],\n) -> tuple[\n    Mapping[str, table.FilterPredicate],\n    Mapping[str, table.FilterPredicate],\n    Mapping[str, table.FilterPredicate],\n]:\n  \"\"\"Unpacks filter kwargs into 
predicates for each table.\"\"\"\n  chain_predicates = {}\n  res_predicates = {}\n  atom_predicates = {}\n  for k, pred in predicate_by_field_name.items():\n    if col := CHAIN_FIELDS.get(k):\n      chain_predicates[col] = pred\n    elif col := RESIDUE_FIELDS.get(k):\n      res_predicates[col] = pred\n    elif col := ATOM_FIELDS.get(k):\n      atom_predicates[col] = pred\n    else:\n      raise ValueError(k)\n  return chain_predicates, res_predicates, atom_predicates\n\n\n_T = TypeVar('_T')\n\n\nSCALAR_FIELDS: Final[Collection[str]] = frozenset({\n    'name',\n    'release_date',\n    'resolution',\n    'structure_method',\n    'bioassembly_data',\n    'chemical_components_data',\n})\n\n\nTABLE_FIELDS: Final[Collection[str]] = frozenset(\n    {'chains', 'residues', 'atoms', 'bonds'}\n)\n\n\nV2_FIELDS: Final[Collection[str]] = frozenset({*SCALAR_FIELDS, *TABLE_FIELDS})\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass StructureTables:\n  chains: structure_tables.Chains\n  residues: structure_tables.Residues\n  atoms: structure_tables.Atoms\n  bonds: structure_tables.Bonds\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass ResArrays:\n  \"\"\"Atom-level data arrays with a residue dimension.\n\n  Attributes:\n    atom_positions: float32 of shape [num_res, num_atom_type, 3] coordinates.\n    atom_mask: float32 of shape [num_res, num_atom_type] indicating if an atom\n      is present.\n    atom_b_factor: float32 of shape [num_res, num_atom_type] b_factors.\n    atom_occupancy: float32 of shape [num_res, num_atom_type] occupancies.\n  \"\"\"\n\n  atom_positions: np.ndarray\n  atom_mask: np.ndarray\n  atom_b_factor: np.ndarray\n  atom_occupancy: np.ndarray\n\n\nclass Structure(table.Database):\n  \"\"\"Structure class for representing and processing molecular structures.\"\"\"\n\n  tables: ClassVar[Collection[str]] = TABLE_FIELDS\n\n  foreign_keys: ClassVar[Mapping[str, Collection[tuple[str, str]]]] = {\n      'residues': 
(('chain_key', 'chains'),),\n      'atoms': (('chain_key', 'chains'), ('res_key', 'residues')),\n      'bonds': (('from_atom_key', 'atoms'), ('dest_atom_key', 'atoms')),\n  }\n\n  def __init__(\n      self,\n      *,\n      name: str = 'unset',\n      release_date: datetime.date | None = None,\n      resolution: float | None = None,\n      structure_method: str | None = None,\n      bioassembly_data: bioassemblies.BioassemblyData | None = None,\n      chemical_components_data: (\n          struc_chem_comps.ChemicalComponentsData | None\n      ) = None,\n      chains: structure_tables.Chains,\n      residues: structure_tables.Residues,\n      atoms: structure_tables.Atoms,\n      bonds: structure_tables.Bonds,\n      skip_validation: bool = False,\n  ):\n    # Version number is written to mmCIF and should be incremented when changes\n    # are made to mmCIF writing or internals that affect this.\n    # b/345221494 Rename this variable when structure_v1 compatibility code\n    # is removed.\n    self._VERSION = '2.0.0'  # pylint: disable=invalid-name\n    self._name = name or 'unset'\n    self._release_date = release_date\n    self._resolution = resolution\n    self._structure_method = structure_method\n    self._bioassembly_data = bioassembly_data\n    self._chemical_components_data = chemical_components_data\n\n    self._chains = chains\n    self._residues = residues\n    self._atoms = atoms\n    self._bonds = bonds\n\n    if not skip_validation:\n      self._validate_table_foreign_keys()\n      self._validate_consistent_table_ordering()\n\n  def _validate_table_foreign_keys(self):\n    \"\"\"Validates that all foreign keys are present in the referred tables.\"\"\"\n    residue_keys = set(self._residues.key)\n    chain_keys = set(self._chains.key)\n    if np.any(membership.isin(self._atoms.res_key, residue_keys, invert=True)):\n      raise ValueError(\n          'Atom residue keys not in the residues table: '\n          
f'{set(self._atoms.res_key).difference(self._residues.key)}'\n      )\n    if np.any(membership.isin(self._atoms.chain_key, chain_keys, invert=True)):\n      raise ValueError(\n          'Atom chain keys not in the chains table: '\n          f'{set(self._atoms.chain_key).difference(self._chains.key)}'\n      )\n    if np.any(\n        membership.isin(self._residues.chain_key, chain_keys, invert=True)\n    ):\n      raise ValueError(\n          'Residue chain keys not in the chains table: '\n          f'{set(self._residues.chain_key).difference(self._chains.key)}'\n      )\n\n  def _validate_consistent_table_ordering(self):\n    \"\"\"Validates that all tables have the same ordering.\"\"\"\n    atom_chain_keys = self._atoms.chain_key[self.chain_boundaries]\n    atom_res_keys = self._atoms.res_key[self.res_boundaries]\n\n    if not np.array_equal(self.present_chains.key, atom_chain_keys):\n      raise ValueError(\n          f'Atom table chain order\\n{atom_chain_keys}\\ndoes not match the '\n          f'chain table order\\n{self._chains.key}'\n      )\n    if not np.array_equal(self.present_residues.key, atom_res_keys):\n      raise ValueError(\n          f'Atom table residue order\\n{atom_res_keys}\\ndoes not match the '\n          f'present residue table order\\n{self.present_residues.key}'\n      )\n\n  def get_table(self, table_name: str) -> table.Table:\n    match table_name:\n      case 'chains':\n        return self.chains_table\n      case 'residues':\n        return self.residues_table\n      case 'atoms':\n        return self.atoms_table\n      case 'bonds':\n        return self.bonds_table\n      case _:\n        raise ValueError(table_name)\n\n  @property\n  def chains_table(self) -> structure_tables.Chains:\n    \"\"\"Chains table.\"\"\"\n    return self._chains\n\n  @property\n  def residues_table(self) -> structure_tables.Residues:\n    \"\"\"Residues table.\"\"\"\n    return self._residues\n\n  @property\n  def atoms_table(self) -> 
structure_tables.Atoms:\n    \"\"\"Atoms table.\"\"\"\n    return self._atoms\n\n  @property\n  def bonds_table(self) -> structure_tables.Bonds:\n    \"\"\"Bonds table.\"\"\"\n    return self._bonds\n\n  @property\n  def name(self) -> str:\n    return self._name\n\n  @property\n  def release_date(self) -> datetime.date | None:\n    return self._release_date\n\n  @property\n  def resolution(self) -> float | None:\n    return self._resolution\n\n  @property\n  def structure_method(self) -> str | None:\n    return self._structure_method\n\n  @property\n  def bioassembly_data(self) -> bioassemblies.BioassemblyData | None:\n    return self._bioassembly_data\n\n  @property\n  def chemical_components_data(\n      self,\n  ) -> struc_chem_comps.ChemicalComponentsData | None:\n    return self._chemical_components_data\n\n  @property\n  def bonds(self) -> structure_tables.Bonds:\n    return self._bonds\n\n  @functools.cached_property\n  def author_naming_scheme(self) -> AuthorNamingScheme:\n    auth_asym_id = {}\n    entity_id = {}\n    entity_desc = {}\n    auth_seq_id = collections.defaultdict(dict)\n    insertion_code = collections.defaultdict(dict)\n\n    for chain_i in range(self._chains.size):\n      chain_id = self._chains.id[chain_i]\n      auth_asym_id[chain_id] = self._chains.auth_asym_id[chain_i]\n      chain_entity_id = self._chains.entity_id[chain_i]\n      entity_id[chain_id] = chain_entity_id\n      entity_desc[chain_entity_id] = self._chains.entity_desc[chain_i]\n\n    chain_index_by_key = self._chains.index_by_key\n    for res_i in range(self._residues.size):\n      chain_key = self._residues.chain_key[res_i]\n      chain_id = self._chains.id[chain_index_by_key[chain_key]]\n      res_id = self._residues.id[res_i]\n      res_auth_seq_id = self._residues.auth_seq_id[res_i]\n      if res_auth_seq_id == MISSING_AUTH_SEQ_ID:\n        continue\n      auth_seq_id[chain_id][res_id] = res_auth_seq_id\n      ins_code = self._residues.insertion_code[res_i]\n      # 
Compatibility with Structure v1 which used None to represent . or ?.\n      insertion_code[chain_id][res_id] = (\n          ins_code if ins_code not in {'.', '?'} else None\n      )\n\n    return AuthorNamingScheme(\n        auth_asym_id=auth_asym_id,\n        entity_id=entity_id,\n        entity_desc=entity_desc,\n        auth_seq_id=dict(auth_seq_id),\n        insertion_code=dict(insertion_code),\n    )\n\n  @functools.cached_property\n  def all_residues(self) -> AllResidues:\n    chain_id_by_key = dict(zip(self._chains.key, self._chains.id))\n    residue_chain_boundaries = _get_change_indices(self._residues.chain_key)\n    boundaries = self._iter_residue_ranges(\n        residue_chain_boundaries, count_unresolved=True\n    )\n    return {\n        chain_id_by_key[self._residues.chain_key[start]]: list(\n            zip(self._residues.name[start:end], self._residues.id[start:end])\n        )\n        for start, end in boundaries\n    }\n\n  @functools.cached_property\n  def label_asym_id_to_entity_id(self) -> Mapping[str, str]:\n    return dict(zip(self._chains.id, self._chains.entity_id))\n\n  @functools.cached_property\n  def chain_entity_id(self) -> np.ndarray:\n    \"\"\"Returns the entity ID for each atom in the structure.\"\"\"\n    return self.chains_table.apply_array_to_column(\n        'entity_id', self._atoms.chain_key\n    )\n\n  @functools.cached_property\n  def chain_entity_desc(self) -> np.ndarray:\n    \"\"\"Returns the entity description for each atom in the structure.\"\"\"\n    return self.chains_table.apply_array_to_column(\n        'entity_desc', self._atoms.chain_key\n    )\n\n  @functools.cached_property\n  def chain_auth_asym_id(self) -> np.ndarray:\n    \"\"\"Returns the chain auth asym ID for each atom in the structure.\"\"\"\n    return self.chains_table.apply_array_to_column(\n        'auth_asym_id', self._atoms.chain_key\n    )\n\n  @functools.cached_property\n  def chain_id(self) -> np.ndarray:\n    chain_index_by_key = 
self._chains.index_by_key\n    return self._chains.id[chain_index_by_key[self._atoms.chain_key]]\n\n  @functools.cached_property\n  def chain_type(self) -> np.ndarray:\n    chain_index_by_key = self._chains.index_by_key\n    return self._chains.type[chain_index_by_key[self._atoms.chain_key]]\n\n  @functools.cached_property\n  def res_id(self) -> np.ndarray:\n    return self._residues['id', self._atoms.res_key]\n\n  @functools.cached_property\n  def res_name(self) -> np.ndarray:\n    return self._residues['name', self._atoms.res_key]\n\n  @functools.cached_property\n  def res_auth_seq_id(self) -> np.ndarray:\n    \"\"\"Returns the residue auth seq ID for each atom in the structure.\"\"\"\n    return self.residues_table.apply_array_to_column(\n        'auth_seq_id', self._atoms.res_key\n    )\n\n  @functools.cached_property\n  def res_insertion_code(self) -> np.ndarray:\n    \"\"\"Returns the residue insertion code for each atom in the structure.\"\"\"\n    return self.residues_table.apply_array_to_column(\n        'insertion_code', self._atoms.res_key\n    )\n\n  @property\n  def atom_key(self) -> np.ndarray:\n    return self._atoms.key\n\n  @property\n  def atom_name(self) -> np.ndarray:\n    return self._atoms.name\n\n  @property\n  def atom_element(self) -> np.ndarray:\n    return self._atoms.element\n\n  @property\n  def atom_x(self) -> np.ndarray:\n    return self._atoms.x\n\n  @property\n  def atom_y(self) -> np.ndarray:\n    return self._atoms.y\n\n  @property\n  def atom_z(self) -> np.ndarray:\n    return self._atoms.z\n\n  @property\n  def atom_b_factor(self) -> np.ndarray:\n    return self._atoms.b_factor\n\n  @property\n  def atom_occupancy(self) -> np.ndarray:\n    return self._atoms.occupancy\n\n  @functools.cached_property\n  def chain_boundaries(self) -> np.ndarray:\n    \"\"\"The indices in the atom fields where each present chain begins.\"\"\"\n    return _get_change_indices(self._atoms.chain_key)\n\n  @functools.cached_property\n  def 
res_boundaries(self) -> np.ndarray:\n    \"\"\"The indices in the atom fields where each present residue begins.\"\"\"\n    return _get_change_indices(self._atoms.res_key)\n\n  @functools.cached_property\n  def present_chains(self) -> structure_tables.Chains:\n    \"\"\"Returns table of chains which have at least 1 resolved atom.\"\"\"\n    is_present_mask = np.isin(self._chains.key, self._atoms.chain_key)\n    return typing.cast(structure_tables.Chains, self._chains[is_present_mask])\n\n  @functools.cached_property\n  def present_residues(self) -> structure_tables.Residues:\n    \"\"\"Returns table of residues which have at least 1 resolved atom.\"\"\"\n    is_present_mask = np.isin(self._residues.key, self._atoms.res_key)\n    return typing.cast(\n        structure_tables.Residues, self._residues[is_present_mask]\n    )\n\n  @functools.cached_property\n  def unresolved_residues(self) -> structure_tables.Residues:\n    \"\"\"Returns table of residues which have no resolved atoms.\"\"\"\n    is_unresolved_mask = np.isin(\n        self._residues.key, self._atoms.res_key, invert=True\n    )\n    return typing.cast(\n        structure_tables.Residues, self._residues[is_unresolved_mask]\n    )\n\n  def __getitem__(self, field: str) -> Any:\n    \"\"\"Gets raw field data using field name as a string.\"\"\"\n    if field in TABLE_FIELDS:\n      return self.get_table(field)\n    else:\n      return getattr(self, field)\n\n  def __getstate__(self) -> dict[str, Any]:\n    \"\"\"Pickle calls this on dump.\n\n    Returns:\n      Members with cached properties removed.\n    \"\"\"\n    cached_props = {\n        k\n        for k, v in self.__class__.__dict__.items()\n        if isinstance(v, functools.cached_property)\n    }\n    return {k: v for k, v in self.__dict__.items() if k not in cached_props}\n\n  def __repr__(self):\n    return (\n        f'Structure({self._name}: {self.num_chains} chains, '\n        f'{self.num_residues(count_unresolved=False)} residues, '\n   
     f'{self.num_atoms} atoms)'\n    )\n\n  @property\n  def num_atoms(self) -> int:\n    return self._atoms.size\n\n  def num_residues(self, *, count_unresolved: bool) -> int:\n    \"\"\"Returns the number of residues in this Structure.\n\n    Args:\n      count_unresolved: Whether to include unresolved (empty) residues.\n\n    Returns:\n      Number of residues in the Structure.\n    \"\"\"\n    if count_unresolved:\n      return self._residues.size\n    else:\n      return self.present_residues.size\n\n  @property\n  def num_chains(self) -> int:\n    return self._chains.size\n\n  @property\n  def num_models(self) -> int:\n    \"\"\"The number of models of this Structure.\"\"\"\n    return self._atoms.num_models\n\n  def _atom_mask(self, entities: Set[str]) -> np.ndarray:\n    \"\"\"Boolean label indicating if each atom is from entities or not.\"\"\"\n    mask = np.zeros(self.num_atoms, dtype=bool)\n    chain_index_by_key = self._chains.index_by_key\n    for start, end in self.iter_chain_ranges():\n      chain_index = chain_index_by_key[self._atoms.chain_key[start]]\n      chain_type = self._chains.type[chain_index]\n      mask[start:end] = chain_type in entities\n    return mask\n\n  @functools.cached_property\n  def is_protein_mask(self) -> np.ndarray:\n    \"\"\"Boolean label indicating if each atom is from protein or not.\"\"\"\n    return self._atom_mask(entities={mmcif_names.PROTEIN_CHAIN})\n\n  @functools.cached_property\n  def is_dna_mask(self) -> np.ndarray:\n    \"\"\"Boolean label indicating if each atom is from DNA or not.\"\"\"\n    return self._atom_mask(entities={mmcif_names.DNA_CHAIN})\n\n  @functools.cached_property\n  def is_rna_mask(self) -> np.ndarray:\n    \"\"\"Boolean label indicating if each atom is from RNA or not.\"\"\"\n    return self._atom_mask(entities={mmcif_names.RNA_CHAIN})\n\n  @functools.cached_property\n  def is_nucleic_mask(self) -> np.ndarray:\n    \"\"\"Boolean label indicating if each atom is a nucleic acid or not.\"\"\"\n  
  return self._atom_mask(entities=mmcif_names.NUCLEIC_ACID_CHAIN_TYPES)\n\n  @functools.cached_property\n  def is_ligand_mask(self) -> np.ndarray:\n    \"\"\"Boolean label indicating if each atom is a ligand or not.\"\"\"\n    return self._atom_mask(entities=mmcif_names.LIGAND_CHAIN_TYPES)\n\n  @functools.cached_property\n  def is_water_mask(self) -> np.ndarray:\n    \"\"\"Boolean label indicating if each atom is from water or not.\"\"\"\n    return self._atom_mask(entities={mmcif_names.WATER})\n\n  def iter_atoms(self) -> Iterator[Mapping[str, Any]]:\n    \"\"\"Iterates over the atoms in the structure.\"\"\"\n    if self._atoms.size == 0:\n      return\n\n    current_chain = self._chains.get_row_by_key(\n        column_name_map=CHAIN_FIELDS, key=self._atoms.chain_key[0]\n    )\n    current_chain_key = self._atoms.chain_key[0]\n    current_res = self._residues.get_row_by_key(\n        column_name_map=RESIDUE_FIELDS, key=self._atoms.res_key[0]\n    )\n    current_res_key = self._atoms.res_key[0]\n    for atom_i in range(self._atoms.size):\n      atom_chain_key = self._atoms.chain_key[atom_i]\n      atom_res_key = self._atoms.res_key[atom_i]\n\n      if atom_chain_key != current_chain_key:\n        chain_index = self._chains.index_by_key[atom_chain_key]\n        current_chain = {\n            'chain_id': self._chains.id[chain_index],\n            'chain_type': self._chains.type[chain_index],\n            'chain_auth_asym_id': self._chains.auth_asym_id[chain_index],\n            'chain_entity_id': self._chains.entity_id[chain_index],\n            'chain_entity_desc': self._chains.entity_desc[chain_index],\n        }\n        current_chain_key = atom_chain_key\n      if atom_res_key != current_res_key:\n        res_index = self._residues.index_by_key[atom_res_key]\n        current_res = {\n            'res_id': self._residues.id[res_index],\n            'res_name': self._residues.name[res_index],\n            'res_auth_seq_id': self._residues.auth_seq_id[res_index],\n  
          'res_insertion_code': self._residues.insertion_code[res_index],\n        }\n        current_res_key = atom_res_key\n\n      yield {\n          'atom_name': self._atoms.name[atom_i],\n          'atom_element': self._atoms.element[atom_i],\n          'atom_x': self._atoms.x[..., atom_i],\n          'atom_y': self._atoms.y[..., atom_i],\n          'atom_z': self._atoms.z[..., atom_i],\n          'atom_b_factor': self._atoms.b_factor[..., atom_i],\n          'atom_occupancy': self._atoms.occupancy[..., atom_i],\n          'atom_key': self._atoms.key[atom_i],\n          **current_res,\n          **current_chain,\n      }\n\n  def iter_residues(\n      self,\n      include_unresolved: bool = False,\n  ) -> Iterator[Mapping[str, Any]]:\n    \"\"\"Iterates over the residues in the structure.\"\"\"\n    res_table = self._residues if include_unresolved else self.present_residues\n    if res_table.size == 0:\n      return\n\n    current_chain = self._chains.get_row_by_key(\n        column_name_map=CHAIN_FIELDS, key=res_table.chain_key[0]\n    )\n    current_chain_key = res_table.chain_key[0]\n    for res_i in range(res_table.size):\n      res_chain_key = res_table.chain_key[res_i]\n\n      if res_chain_key != current_chain_key:\n        current_chain = self._chains.get_row_by_key(\n            column_name_map=CHAIN_FIELDS, key=res_table.chain_key[res_i]\n        )\n        current_chain_key = res_chain_key\n\n      row = {\n          'res_id': res_table.id[res_i],\n          'res_name': res_table.name[res_i],\n          'res_auth_seq_id': res_table.auth_seq_id[res_i],\n          'res_insertion_code': res_table.insertion_code[res_i],\n      }\n      yield row | current_chain\n\n  def _iter_atom_ranges(\n      self, boundaries: Sequence[int]\n  ) -> Iterator[tuple[int, int]]:\n    \"\"\"Iterator for (start, end) pairs from an array of start indices.\"\"\"\n    yield from itertools.pairwise(boundaries)\n    # Use explicit length test as boundaries can be a NumPy 
array.\n    if len(boundaries) > 0:  # pylint: disable=g-explicit-length-test\n      yield boundaries[-1], self.num_atoms\n\n  def _iter_residue_ranges(\n      self,\n      boundaries: Sequence[int],\n      *,\n      count_unresolved: bool,\n  ) -> Iterator[tuple[int, int]]:\n    \"\"\"Iterator for (start, end) pairs from an array of start indices.\"\"\"\n    yield from itertools.pairwise(boundaries)\n    # Use explicit length test as boundaries can be a NumPy array.\n    if len(boundaries) > 0:  # pylint: disable=g-explicit-length-test\n      yield boundaries[-1], self.num_residues(count_unresolved=count_unresolved)\n\n  def iter_chain_ranges(self) -> Iterator[tuple[int, int]]:\n    \"\"\"Iterates pairs of (chain_start, chain_end) indices.\n\n    Yields:\n      Pairs of (start, end) indices for each chain, where end is not inclusive.\n      i.e. struc.chain_id[start:end] would be a constant array with length\n      equal to the number of atoms in the chain.\n    \"\"\"\n    yield from self._iter_atom_ranges(self.chain_boundaries)\n\n  def iter_residue_ranges(self) -> Iterator[tuple[int, int]]:\n    \"\"\"Iterates pairs of (residue_start, residue_end) indices.\n\n    Yields:\n      Pairs of (start, end) indices for each residue, where end is not\n      inclusive. i.e. 
struc.res_id[start:end] would be a constant array with\n      length equal to the number of atoms in the residue.\n    \"\"\"\n    yield from self._iter_atom_ranges(self.res_boundaries)\n\n  def iter_chains(self) -> Iterator[Mapping[str, Any]]:\n    \"\"\"Iterates over the chains in the structure.\"\"\"\n    for chain_i in range(self.present_chains.size):\n      yield {\n          'chain_id': self.present_chains.id[chain_i],\n          'chain_type': self.present_chains.type[chain_i],\n          'chain_auth_asym_id': self.present_chains.auth_asym_id[chain_i],\n          'chain_entity_id': self.present_chains.entity_id[chain_i],\n          'chain_entity_desc': self.present_chains.entity_desc[chain_i],\n      }\n\n  def iter_bonds(self) -> Iterator[Bond]:\n    \"\"\"Iterates over the atoms and bond information.\n\n    Example usage:\n\n    ```\n    for from_atom, dest_atom, bond_info in struc.iter_bonds():\n      print(\n          f'From atom: name={from_atom[\"atom_name\"]}, '\n          f'chain={from_atom[\"chain_id\"]}, ...'\n      )\n      # Same for dest_atom\n      print(f'Bond info: type={bond_info[\"type\"]}, role={bond_info[\"role\"]}')\n    ```\n\n    Yields:\n      A `Bond` NamedTuple for each bond in the bonds table.\n      These have fields `from_atom`, `dest_atom`, `bond_info` where each\n      is a dictionary. The first two have the same keys as the atom dicts\n      returned by self.iter_atoms() -- i.e. one key per non-None field.\n      The final dict has the same keys as self.bonds.iterrows() -- i.e. 
one\n      key per column in the bonds table.\n    \"\"\"\n    from_atom_iter = self._atoms.iterrows(\n        row_keys=self._bonds.from_atom_key,\n        column_name_map=ATOM_FIELDS,\n        chain_key=self._chains.with_column_names(CHAIN_FIELDS),\n        res_key=self._residues.with_column_names(RESIDUE_FIELDS),\n    )\n    dest_atom_iter = self._atoms.iterrows(\n        row_keys=self._bonds.dest_atom_key,\n        column_name_map=ATOM_FIELDS,\n        chain_key=self._chains.with_column_names(CHAIN_FIELDS),\n        res_key=self._residues.with_column_names(RESIDUE_FIELDS),\n    )\n\n    for from_atom, dest_atom, bond_info in zip(\n        from_atom_iter, dest_atom_iter, self._bonds.iterrows(), strict=True\n    ):\n      yield Bond(from_atom=from_atom, dest_atom=dest_atom, bond_info=bond_info)\n\n  def _apply_atom_index_array(\n      self,\n      index_arr: np.ndarray,\n      chain_boundaries: np.ndarray | None = None,\n      res_boundaries: np.ndarray | None = None,\n      skip_validation: bool = False,\n  ) -> Self:\n    \"\"\"Applies index_arr to the atom table using NumPy-style array indexing.\n\n    Args:\n      index_arr: A 1D NumPy array that will be used to index into the atoms\n        table. This can either be a boolean array to act as a mask, or an\n        integer array to perform a gather operation.\n      chain_boundaries: Unused in structure v2.\n      res_boundaries: Unused in structure v2.\n      skip_validation: Whether to skip the validation step that checks internal\n        consistency after applying atom index array. Do not set to True unless\n        you are certain the transform is safe, e.g. 
when the order of atoms is\n        guaranteed to not change.\n\n    Returns:\n      A new Structure with an updated atoms table.\n    \"\"\"\n    del chain_boundaries, res_boundaries\n\n    if index_arr.ndim != 1:\n      raise ValueError(\n          f'index_arr must be a 1D NumPy array, but has shape {index_arr.shape}'\n      )\n\n    if index_arr.dtype == bool and np.all(index_arr):\n      return self  # Shortcut: The operation is a no-op, so just return itself.\n\n    atoms = structure_tables.Atoms(\n        **{col: self._atoms[col][..., index_arr] for col in self._atoms.columns}\n    )\n    updated_tables = self._cascade_delete(atoms=atoms)\n    return self.copy_and_update(\n        atoms=updated_tables.atoms,\n        bonds=updated_tables.bonds,\n        skip_validation=skip_validation,\n    )\n\n  @property\n  def group_by_residue(self) -> Self:\n    \"\"\"Returns a Structure with one atom per residue.\n\n    e.g. restypes = struc.group_by_residue['res_id']\n\n    Returns:\n      A new Structure with one atom per residue such that per-atom arrays\n      such as res_name (i.e. Structure v1 fields) have one element per residue.\n    \"\"\"\n    # This use of _apply_atom_index_array is safe because the chain/residue/atom\n    # ordering won't change (essentially applying a residue start mask).\n    return self._apply_atom_index_array(\n        self.res_boundaries, skip_validation=True\n    )\n\n  @property\n  def group_by_chain(self) -> Self:\n    \"\"\"Returns a Structure where all fields are per-chain.\n\n    e.g. chains = struc.group_by_chain['chain_id']\n\n    Returns:\n      A new Structure with one atom per chain such that per-atom arrays\n      such as res_name (i.e. 
Structure v1 fields) have one element per chain.\n    \"\"\"\n    # This use of _apply_atom_index_array is safe because the chain/residue/atom\n    # ordering won't change (essentially applying a chain start mask).\n    return self._apply_atom_index_array(\n        self.chain_boundaries, skip_validation=True\n    )\n\n  @property\n  def with_sorted_chains(self) -> Self:\n    \"\"\"Returns a new structure with chains sorted in reverse spreadsheet style.\n\n    This is the usual order to write chains in an mmCIF:\n    (A < B < ... < AA < BA < CA < ... < AB < BB < CB ...)\n\n    NB: this method will fail if chains do not conform to this mmCIF naming\n    convention.\n\n    Only to be used for third party metrics that rely on the chain order.\n    Elsewhere chains should be identified by name and code should be agnostic to\n    the order.\n    \"\"\"\n    sorted_chains = sorted(self.chains, key=mmcif.str_id_to_int_id)\n    return self.reorder_chains(new_order=sorted_chains)\n\n  @functools.cached_property\n  def atom_ids(self) -> Sequence[tuple[str, str, None, str]]:\n    \"\"\"Gets a list of atom ID tuples from Structure class arrays.\n\n    Returns:\n      A list of tuples of (chain_id, res_id, insertion_code, atom_name) where\n      insertion code is always None. 
There is one element per atom, and the\n      list is ordered according to the order of atoms in the input arrays.\n    \"\"\"\n    # Convert to Numpy strings, then to Python strings (dtype=object).\n    res_ids = self.residues_table.id.astype(str).astype(object)\n    res_ids = res_ids[\n        self.residues_table.index_by_key[self.atoms_table.res_key]\n    ]\n    ins_codes = [None] * self.num_atoms\n    return list(\n        zip(self.chain_id, res_ids, ins_codes, self.atom_name, strict=True)\n    )\n\n  def order_and_drop_atoms_to_match(\n      self,\n      other: 'Structure',\n      *,\n      allow_missing_atoms: bool = False,\n  ) -> Self:\n    \"\"\"Returns a new structure with atoms ordered & dropped to match another's.\n\n    This performs two operations simultaneously:\n      * Ordering the atoms in this structure to match the order in the other.\n      * Dropping atoms in this structure that do not appear in the other.\n\n    Example:\n    Consider a prediction and ground truth with the following atoms, described\n    using tuples of `(chain_id, res_id, atom_name)`:\n      * `prediction:   [(A, 1, CA), (A, 1, N), (A, 2, CA), (B, 1, CA)]`\n      * `ground_truth: [(B, 1, CA), (A, 1, N), (A, 1, CA)]`\n    Note how the ground truth is missing the `(A, 2, CA)` atom and also\n    has the atoms in a different order. This method returns a modified\n    prediction that has reordered atoms and without any atoms not in the ground\n    truth so that its atom list looks the same as the ground truth atom list.\n    This means `prediction.coords` and `ground_truth.coords` now have the\n    same shape and can be compared across the atom dimension.\n\n    Note that matching residues with no atoms and matching chains with no\n    residues will also be kept. E.g. in the example above, if prediction and\n    ground truth both had an unresolved residue (A, 3), the output structure\n    will also have an unresolved residue (A, 3).\n\n    Args:\n      other: Another `Structure`. 
This provides the reference ordering that is\n        used to sort this structure's atom arrays.\n      allow_missing_atoms: Whether to skip atoms present in `other` but not this\n        structure and return a structure containing a subset of the atoms in the\n        other structure.\n\n    Returns:\n      A new `Structure`, based on this structure, which, if\n      `allow_missing_atoms` is False, contains exactly the same atoms as in\n      the `other` structure and which matches the `other` structure in terms\n      of the order of the atoms in the field arrays. Otherwise, if missing\n      atoms are allowed then the resulting structure contains a subset of\n      those atoms in the other structure.\n\n    Raises:\n      MissingAtomError: If there are atoms present in the other structure that\n        cannot be found in this structure.\n    \"\"\"\n    atom_index_map = {atom_id: i for i, atom_id in enumerate(self.atom_ids)}\n    try:\n      if allow_missing_atoms:\n        # Only include atoms that were found in the other structure.\n        atom_indices = [\n            atom_index\n            for atom_id in other.atom_ids\n            if (atom_index := atom_index_map.get(atom_id)) is not None\n        ]\n      else:\n        atom_indices = [\n            atom_index_map[atom_id]  # Hard fail on missing.\n            for atom_id in other.atom_ids\n        ]\n    except KeyError as e:\n      if len(e.args[0]) == 4:\n        chain_id, res_id, ins_code, atom_name = e.args[0]\n        raise MissingAtomError(\n            f'No atom in this structure (name: {self._name}) matches atom in '\n            f'other structure (name: {other.name}) with internal (label) chain '\n            f'ID {chain_id}, residue ID {res_id}, insertion code {ins_code} '\n            f'and atom name {atom_name}.'\n        ) from e\n      else:\n        raise\n\n    def _iter_residues(struc: Self) -> Iterable[tuple[str, str]]:\n      yield from zip(\n          struc.chains_table['id', 
struc.residues_table.chain_key],\n          struc.residues_table.id,\n          strict=True,\n      )\n\n    chain_index_map = {\n        chain_id: i for i, chain_id in enumerate(self._chains.id)\n    }\n    chain_indices = [\n        chain_index\n        for chain_id in other.chains_table.id\n        if (chain_index := chain_index_map.get(chain_id)) is not None\n    ]\n    residue_index_map = {\n        res_id: i for i, res_id in enumerate(_iter_residues(self))\n    }\n    res_indices = [\n        residue_index\n        for res_id in _iter_residues(other)\n        if (residue_index := residue_index_map.get(res_id)) is not None\n    ]\n\n    # Reorder all tables.\n    chains = self._chains.apply_index(np.array(chain_indices, dtype=np.int64))\n    residues = self._residues.apply_index(np.array(res_indices, dtype=np.int64))\n    atoms = self._atoms.apply_index(np.array(atom_indices, dtype=np.int64))\n\n    # Get chain keys in the order they appear in the atoms table.\n    new_chain_boundaries = _get_change_indices(atoms.chain_key)\n    new_chain_key_order = atoms.chain_key[new_chain_boundaries]\n    if len(new_chain_key_order) != len(set(new_chain_key_order)):\n      raise ValueError(\n          f'Chain keys not contiguous after reordering: {new_chain_key_order}'\n      )\n\n    # Get residue keys in the order they appear in the atoms table.\n    new_res_boundaries = _get_change_indices(atoms.res_key)\n    new_res_key_order = atoms.res_key[new_res_boundaries]\n    if len(new_res_key_order) != len(set(new_res_key_order)):\n      raise ValueError(\n          f'Residue keys not contiguous after reordering: {new_res_key_order}'\n      )\n\n    # If any atoms were deleted, propagate that into the bonds table.\n    updated_tables = self._cascade_delete(\n        chains=chains,\n        residues=residues,\n        atoms=atoms,\n    )\n    return self.copy_and_update(\n        chains=chains,\n        residues=residues,\n        atoms=updated_tables.atoms,\n        
bonds=updated_tables.bonds,\n    )\n\n  def copy_and_update(\n      self,\n      *,\n      name: str | Literal[_UNSET] = _UNSET,\n      release_date: datetime.date | None | Literal[_UNSET] = _UNSET,\n      resolution: float | None | Literal[_UNSET] = _UNSET,\n      structure_method: str | None | Literal[_UNSET] = _UNSET,\n      bioassembly_data: (\n          bioassemblies.BioassemblyData | None | Literal[_UNSET]\n      ) = _UNSET,\n      chemical_components_data: (\n          struc_chem_comps.ChemicalComponentsData | None | Literal[_UNSET]\n      ) = _UNSET,\n      chains: structure_tables.Chains | None | Literal[_UNSET] = _UNSET,\n      residues: structure_tables.Residues | None | Literal[_UNSET] = _UNSET,\n      atoms: structure_tables.Atoms | None | Literal[_UNSET] = _UNSET,\n      bonds: structure_tables.Bonds | None | Literal[_UNSET] = _UNSET,\n      skip_validation: bool = False,\n  ) -> Self:\n    \"\"\"Performs a shallow copy but with specified fields updated.\"\"\"\n\n    def all_unset(fields):\n      return all(field == _UNSET for field in fields)\n\n    if all_unset((chains, residues, atoms, bonds)):\n      if all_unset((\n          name,\n          release_date,\n          resolution,\n          structure_method,\n          bioassembly_data,\n          chemical_components_data,\n      )):\n        raise ValueError(\n            'Unnecessary call to copy_and_update with no changes. As Structure'\n            ' and its component tables are immutable, there is no need to copy'\n            ' it. 
Any subsequent operation that modifies structure will return'\n            ' a new object.'\n        )\n      else:\n        raise ValueError(\n            'When only changing global fields, prefer to use the specialised '\n            'copy_and_update_globals.'\n        )\n\n    def select(field, default):\n      return field if field != _UNSET else default\n\n    return Structure(\n        name=select(name, self.name),\n        release_date=select(release_date, self.release_date),\n        resolution=select(resolution, self.resolution),\n        structure_method=select(structure_method, self.structure_method),\n        bioassembly_data=select(bioassembly_data, self.bioassembly_data),\n        chemical_components_data=select(\n            chemical_components_data, self.chemical_components_data\n        ),\n        chains=select(chains, self._chains),\n        residues=select(residues, self._residues),\n        atoms=select(atoms, self._atoms),\n        bonds=select(bonds, self._bonds),\n        skip_validation=skip_validation,\n    )\n\n  def _copy_and_update(\n      self, skip_validation: bool = False, **changes: Any\n  ) -> Self:\n    \"\"\"Performs a shallow copy but with specified fields updated.\"\"\"\n    if not changes:\n      raise ValueError(\n          'Unnecessary call to copy_and_update with no changes. As Structure '\n          'and its component tables are immutable, there is no need to copy '\n          'it. Any subsequent operation that modifies structure will return a '\n          'new object.'\n      )\n\n    if 'author_naming_scheme' in changes:\n      raise ValueError(\n          'Updating using author_naming_scheme is not supported. 
Update '\n          'auth_asym_id, entity_id, entity_desc fields directly in the chains '\n          'table and auth_seq_id, insertion_code in the residues table.'\n      )\n\n    if all(k in GLOBAL_FIELDS for k in changes):\n      raise ValueError(\n          'When only changing global fields, prefer to use the specialised '\n          'copy_and_update_globals.'\n      )\n\n    if all(k in V2_FIELDS for k in changes):\n      constructor_kwargs = {field: self[field] for field in V2_FIELDS}\n      constructor_kwargs.update(changes)\n    elif any(k in ('atoms', 'residues', 'chains') for k in changes):\n      raise ValueError(\n          'Cannot specify atoms/chains/residues table changes with non-v2'\n          f' constructor params: {changes.keys()}'\n      )\n    elif all(k in ATOM_FIELDS for k in changes):\n      if 'atom_key' not in changes:\n        raise ValueError(\n            'When only changing atom fields, prefer to use the specialised '\n            'copy_and_update_atoms.'\n        )\n      # Only atom fields are being updated, do that directly on the atoms table.\n      updated_atoms = self._atoms.copy_and_update(\n          **{ATOM_FIELDS[k]: v for k, v in changes.items()}\n      )\n      constructor_kwargs = {\n          field: self[field] for field in V2_FIELDS if field != 'atoms'\n      }\n      constructor_kwargs['atoms'] = updated_atoms\n    else:\n      constructor_kwargs = {field: self[field] for field in _UPDATEABLE_FIELDS}\n      constructor_kwargs.update(changes)\n    return Structure(skip_validation=skip_validation, **constructor_kwargs)\n\n  def copy_and_update_coords(self, coords: np.ndarray) -> Self:\n    \"\"\"Performs a shallow copy but with coordinates updated.\"\"\"\n    if coords.shape[-2:] != (self.num_atoms, 3):\n      raise ValueError(\n          f'{coords.shape=} does not have last dimensions ({self.num_atoms}, 3)'\n      )\n    updated_atoms = self._atoms.copy_and_update_coords(coords)\n    return 
self.copy_and_update(atoms=updated_atoms, skip_validation=True)\n\n  def copy_and_update_from_res_arrays(\n      self,\n      *,\n      include_unresolved: bool = False,\n      **changes: np.ndarray,\n  ) -> Self:\n    \"\"\"Like copy_and_update but changes are arrays of length num_residues.\n\n    These changes are first scattered into arrays of length num_atoms such\n    that each value is repeated across the residue at that index, then they\n    are used as the new values of these fields.\n\n    E.g.\n    * This structure's res_id: 1, 1, 1, 2, 3, 3 (3 res, 6 atoms)\n    * new atom_b_factor: 7, 8, 9\n    * Returned structure's atom_b_factor: 7, 7, 7, 8, 9, 9\n\n    Args:\n      include_unresolved: Whether the provided list of new values per residue\n        includes values for all residues, or only those that are resolved.\n      **changes: kwargs corresponding to atom array fields, e.g. atom_x or\n        atom_b_factor, but with length num_residues rather than num_atoms. Note\n        that changing atom_key this way is not supported.\n\n    Returns:\n      A new `Structure` with all fields other than those specified as kwargs\n      shallow copied from this structure. 
The values of the kwargs are\n      scattered across the atom arrays and then used to overwrite these\n      fields for the returned structure.\n    \"\"\"\n    if not all(c in set(ATOM_FIELDS) - {'atom_key'} for c in changes):\n      raise ValueError(\n          'Changes must only be to atom fields, got changes to'\n          f' {changes.keys()}'\n      )\n\n    num_residues = self.num_residues(count_unresolved=include_unresolved)\n\n    for field_name, new_values in changes.items():\n      if len(new_values) != num_residues:\n        raise ValueError(\n            f'{field_name} array of length {len(new_values)} does not match '\n            f'{num_residues=} - is include_unresolved set correctly?'\n        )\n\n    # We cannot assume that atom_table.res_keys are the relevant indices of the\n    # residue table.\n\n    # Therefore we need to construct a map from res_key to the new values and\n    # update the atoms_table with that.\n    if include_unresolved:\n      target_keys = self.residues_table.key\n    else:\n      target_keys = self.present_residues.key\n\n    new_atom_columns = {}\n    for field_name, new_values in changes.items():\n      value_by_key = dict(zip(target_keys, new_values, strict=True))\n      # pylint: disable=cell-var-from-loop\n      new_atom_columns[field_name] = np.vectorize(lambda x: value_by_key[x])(\n          self.atoms_table.res_key\n      )\n      # pylint: enable=cell-var-from-loop\n\n    return self.copy_and_update_atoms(**new_atom_columns)\n\n  def copy_and_update_globals(\n      self,\n      *,\n      name: str | Literal[_UNSET] = _UNSET,\n      release_date: datetime.date | Literal[_UNSET] | None = _UNSET,\n      resolution: float | Literal[_UNSET] | None = _UNSET,\n      structure_method: str | Literal[_UNSET] | None = _UNSET,\n      bioassembly_data: (\n          bioassemblies.BioassemblyData | Literal[_UNSET] | None\n      ) = _UNSET,\n      chemical_components_data: (\n          struc_chem_comps.ChemicalComponentsData | 
Literal[_UNSET] | None\n      ) = _UNSET,\n  ) -> Self:\n    \"\"\"Returns a shallow copy with the global columns updated.\"\"\"\n\n    def select(field, default):\n      return field if field != _UNSET else default\n\n    name = select(name, self.name)\n    release_date = select(release_date, self.release_date)\n    resolution = select(resolution, self.resolution)\n    structure_method = select(structure_method, self.structure_method)\n    bioassembly_data = select(bioassembly_data, self.bioassembly_data)\n    chem_data = select(chemical_components_data, self.chemical_components_data)\n\n    return Structure(\n        name=name,\n        release_date=release_date,\n        resolution=resolution,\n        structure_method=structure_method,\n        bioassembly_data=bioassembly_data,\n        chemical_components_data=chem_data,\n        atoms=self._atoms,\n        residues=self._residues,\n        chains=self._chains,\n        bonds=self._bonds,\n    )\n\n  def copy_and_update_atoms(\n      self,\n      *,\n      atom_name: np.ndarray | None = None,\n      atom_element: np.ndarray | None = None,\n      atom_x: np.ndarray | None = None,\n      atom_y: np.ndarray | None = None,\n      atom_z: np.ndarray | None = None,\n      atom_b_factor: np.ndarray | None = None,\n      atom_occupancy: np.ndarray | None = None,\n  ) -> Self:\n    \"\"\"Returns a shallow copy with the atoms table updated.\"\"\"\n    new_atoms = structure_tables.Atoms(\n        key=self._atoms.key,\n        res_key=self._atoms.res_key,\n        chain_key=self._atoms.chain_key,\n        name=atom_name if atom_name is not None else self.atom_name,\n        element=atom_element if atom_element is not None else self.atom_element,\n        x=atom_x if atom_x is not None else self.atom_x,\n        y=atom_y if atom_y is not None else self.atom_y,\n        z=atom_z if atom_z is not None else self.atom_z,\n        b_factor=(\n            atom_b_factor if atom_b_factor is not None else self.atom_b_factor\n      
  ),\n        occupancy=(\n            atom_occupancy\n            if atom_occupancy is not None\n            else self.atom_occupancy\n        ),\n    )\n    return self.copy_and_update(atoms=new_atoms)\n\n  def copy_and_update_residues(\n      self,\n      *,\n      res_id: np.ndarray | None = None,\n      res_name: np.ndarray | None = None,\n      res_auth_seq_id: np.ndarray | None = None,\n      res_insertion_code: np.ndarray | None = None,\n  ) -> Self:\n    \"\"\"Returns a shallow copy with the residues table updated.\"\"\"\n    new_residues = structure_tables.Residues(\n        key=self._residues.key,\n        chain_key=self._residues.chain_key,\n        id=res_id if res_id is not None else self._residues.id,\n        name=res_name if res_name is not None else self._residues.name,\n        auth_seq_id=res_auth_seq_id\n        if res_auth_seq_id is not None\n        else self._residues.auth_seq_id,\n        insertion_code=res_insertion_code\n        if res_insertion_code is not None\n        else self._residues.insertion_code,\n    )\n    return self.copy_and_update(residues=new_residues)\n\n  def _cascade_delete(\n      self,\n      *,\n      chains: structure_tables.Chains | None = None,\n      residues: structure_tables.Residues | None = None,\n      atoms: structure_tables.Atoms | None = None,\n      bonds: structure_tables.Bonds | None = None,\n  ) -> StructureTables:\n    \"\"\"Performs a cascade delete operation on the structure's tables.\n\n    Cascade delete ensures all the tables are consistent after any table fields\n    are being updated by cascading any deletions down the hierarchy of tables:\n    chains > residues > atoms > bonds.\n\n    E.g.: if a row from residues table is removed then all the atoms in that\n    residue will also be removed from the atoms table. In turn this cascades\n    also to the bond table, by removing any bond row which involves any of those\n    removed atoms. 
However the chains table will not be modified, even if\n    that was the only residue in its chain, because the chains table is above\n    the residues table in the hierarchy.\n\n    Args:\n      chains: An optional new chains table.\n      residues: An optional new residues table.\n      atoms: An optional new atoms table.\n      bonds: An optional new bonds table.\n\n    Returns:\n      A StructureTables object with the updated tables.\n    \"\"\"\n    if chains_unchanged := chains is None:\n      chains = self._chains\n    if residues_unchanged := residues is None:\n      residues = self._residues\n    if atoms_unchanged := atoms is None:\n      atoms = self._atoms\n    if bonds is None:\n      bonds = self._bonds\n\n    if not chains_unchanged:\n      residues_mask = membership.isin(residues.chain_key, set(chains.key))  # pylint:disable=attribute-error\n      if not np.all(residues_mask):  # Only apply if this is not a no-op.\n        residues = residues[residues_mask]\n        residues_unchanged = False\n    if not residues_unchanged:\n      atoms_mask = membership.isin(atoms.res_key, set(residues.key))  # pylint:disable=attribute-error\n      if not np.all(atoms_mask):  # Only apply if this is not a no-op.\n        atoms = atoms[atoms_mask]\n        atoms_unchanged = False\n    if not atoms_unchanged:\n      bonds = bonds.restrict_to_atoms(atoms.key)\n    return StructureTables(\n        chains=chains, residues=residues, atoms=atoms, bonds=bonds\n    )\n\n  def filter(\n      self,\n      mask: np.ndarray | None = None,\n      *,\n      apply_per_element: bool = False,\n      invert: bool = False,\n      cascade_delete: CascadeDelete = CascadeDelete.CHAINS,\n      **predicate_by_field_name: table.FilterPredicate,\n  ) -> Self:\n    \"\"\"Filters the structure by field values and returns a new structure.\n\n    Predicates are specified as keyword arguments, with names following the\n    pattern: <table_name>_<col_name>, where table_name := (chain|res|atom).\n  
  For instance the auth_seq_id column in the residues table can be filtered\n    by passing `res_auth_seq_id=pred_value`. The full list of valid options\n    are defined in the `col_by_field_name` fields on the different Table\n    dataclasses.\n\n    Predicate values can be either:\n      1. A constant value, e.g. 'CA'. In this case then only rows that match\n        this value for the given field are retained.\n      2. A (non-string) iterable e.g. ('A', 'B'). In this\n        case then rows are retained if they match any of the provided values for\n        the given field.\n      3. A boolean function e.g. lambda b_fac: b_fac < 100.0.\n        In this case then only rows that evaluate to True are retained. By\n        default this function's parameter is expected to be an array, unless\n        apply_per_element=True.\n\n    Example usage:\n      # Filter to backbone atoms in residues up to 100 in chain B.\n      filtered_struc = struc.filter(\n          chain_id='B',\n          atom_name=('N', 'CA', 'C'),\n          res_id=lambda res_id: res_id < 100)\n\n    Example usage where predicate must be applied per-element:\n      # Filter to residues with IDs in either [1, 100) or [300, 400).\n      ranges = ((1, 100), (300, 400))\n      filtered_struc = struc.filter(\n          res_id=lambda i: np.any([start <= i < end for start, end in ranges]),\n          apply_per_element=True)\n\n    Example usage of providing a raw mask:\n      filtered_struc = struc.filter(struc.atom_b_factor < 10.0)\n\n    Args:\n      mask: An optional boolean NumPy array with length equal to num_atoms. 
If\n        provided then this will be combined with the other predicates so that an\n        atom is included if it is masked-in *and* matches all the predicates.\n      apply_per_element: Whether to apply predicates to each element\n        individually, or to pass the whole column array to the predicate.\n      invert: Whether to remove, rather than retain, the entities which match\n        the specified predicates.\n      cascade_delete: Whether to remove residues and chains which are left\n        unresolved in a cascade. filter operates on the atoms table, keeping\n        only atoms which match the predicates (or, if invert is set, only\n        those which do not). If all atoms in a residue are removed, the\n        residue is \"unresolved\". The value of this argument then determines\n        whether such residues and their parent chains should be deleted. FULL\n        implies that all unresolved residues should be deleted, and any chains\n        which are left with no resolved residues should be deleted. CHAINS is\n        the default behaviour - only chains with no resolved residues, and their\n        child residues are deleted. Unresolved residues in partially resolved\n        chains remain. NONE implies that no unresolved residues or chains should\n        be deleted.\n      **predicate_by_field_name: A mapping from field name to a predicate.\n        Filtered columns must be 1D arrays. If multiple fields are provided as\n        keyword arguments then each predicate is applied and the results are\n        combined using a boolean AND operation, so an atom is only retained if\n        it passes all predicates.\n\n    Returns:\n      A new structure representing a filtered version of the current structure.\n\n    Raises:\n      ValueError: If mask is provided and is not a bool array with shape\n        (num_atoms,).\n    \"\"\"\n    chain_predicates, res_predicates, atom_predicates = (\n        _unpack_filter_predicates(predicate_by_field_name)\n    )\n    # Get boolean masks for each table. 
These are None if none of the filter\n    # parameters affect the table in question.\n    chain_mask = self._chains.make_filter_mask(\n        **chain_predicates, apply_per_element=apply_per_element\n    )\n    res_mask = self._residues.make_filter_mask(\n        **res_predicates, apply_per_element=apply_per_element\n    )\n    atom_mask = self._atoms.make_filter_mask(\n        mask, **atom_predicates, apply_per_element=apply_per_element\n    )\n    if atom_mask is None:\n      atom_mask = np.ones((self._atoms.size,), dtype=bool)\n\n    # Remove atoms that belong to filtered out chains.\n    if chain_mask is not None:\n      atom_chain_mask = membership.isin(\n          self._atoms.chain_key, set(self._chains.key[chain_mask])\n      )\n      np.logical_and(atom_mask, atom_chain_mask, out=atom_mask)\n\n    # Remove atoms that belong to filtered out residues.\n    if res_mask is not None:\n      atom_res_mask = membership.isin(\n          self._atoms.res_key, set(self._residues.key[res_mask])\n      )\n      np.logical_and(atom_mask, atom_res_mask, out=atom_mask)\n\n    final_atom_mask = ~atom_mask if invert else atom_mask\n\n    if cascade_delete == CascadeDelete.NONE and np.all(final_atom_mask):\n      return self  # Shortcut: The filter is a no-op, so just return itself.\n\n    filtered_atoms = typing.cast(\n        structure_tables.Atoms, self._atoms[final_atom_mask]\n    )\n\n    match cascade_delete:\n      case CascadeDelete.FULL:\n        nonempty_residues_mask = np.isin(\n            self._residues.key, filtered_atoms.res_key\n        )\n        filtered_residues = self._residues[nonempty_residues_mask]\n        nonempty_chain_mask = np.isin(\n            self._chains.key, filtered_atoms.chain_key\n        )\n        filtered_chains = self._chains[nonempty_chain_mask]\n        updated_tables = self._cascade_delete(\n            chains=filtered_chains,\n            residues=filtered_residues,\n            atoms=filtered_atoms,\n        )\n      case 
CascadeDelete.CHAINS:\n        # To match v1 behavior we remove chains that have no atoms remaining,\n        # and we remove residues in those chains.\n        # NB we do not remove empty residues.\n        nonempty_chain_mask = membership.isin(\n            self._chains.key, set(filtered_atoms.chain_key)\n        )\n        filtered_chains = self._chains[nonempty_chain_mask]\n        updated_tables = self._cascade_delete(\n            chains=filtered_chains, atoms=filtered_atoms\n        )\n      case CascadeDelete.NONE:\n        updated_tables = self._cascade_delete(atoms=filtered_atoms)\n      case _:\n        raise ValueError(f'Unknown cascade_delete behaviour: {cascade_delete}')\n    return self.copy_and_update(\n        chains=updated_tables.chains,\n        residues=updated_tables.residues,\n        atoms=updated_tables.atoms,\n        bonds=updated_tables.bonds,\n        skip_validation=True,\n    )\n\n  def filter_out(self, *args, **kwargs) -> Self:\n    \"\"\"Returns a new structure with the specified elements removed.\"\"\"\n    return self.filter(*args, invert=True, **kwargs)\n\n  def filter_to_entity_type(\n      self,\n      *,\n      protein: bool = False,\n      rna: bool = False,\n      dna: bool = False,\n      dna_rna_hybrid: bool = False,\n      ligand: bool = False,\n      water: bool = False,\n  ) -> Self:\n    \"\"\"Filters the structure to only include the selected entity types.\n\n    This convenience method abstracts away the specifics of mmCIF entity\n    type names which, especially for ligands, are non-trivial.\n\n    Args:\n      protein: Whether to include protein (polypeptide(L)) chains.\n      rna: Whether to include RNA chains.\n      dna: Whether to include DNA chains.\n      dna_rna_hybrid: Whether to include DNA RNA hybrid chains.\n      ligand: Whether to include ligand (i.e. 
not polymer) chains.\n      water: Whether to include water chains.\n\n    Returns:\n      The filtered structure.\n    \"\"\"\n    include_types = []\n    if protein:\n      include_types.append(mmcif_names.PROTEIN_CHAIN)\n    if rna:\n      include_types.append(mmcif_names.RNA_CHAIN)\n    if dna:\n      include_types.append(mmcif_names.DNA_CHAIN)\n    if dna_rna_hybrid:\n      include_types.append(mmcif_names.DNA_RNA_HYBRID_CHAIN)\n    if ligand:\n      include_types.extend(mmcif_names.LIGAND_CHAIN_TYPES)\n    if water:\n      include_types.append(mmcif_names.WATER)\n    return self.filter(chain_type=include_types)\n\n  def get_stoichiometry(\n      self, *, fix_non_standard_polymer_res: bool = False\n  ) -> Sequence[int]:\n    \"\"\"Returns the structure's stoichiometry using chain_res_name_sequence.\n\n    Note that everything is considered (protein, RNA, DNA, ligands) except for\n    water molecules. If you are interested only in a certain type of entities,\n    filter them out before calling this method.\n\n    Args:\n      fix_non_standard_polymer_res: If True, maps non standard residues in\n        protein / RNA / DNA chains to standard residues (e.g. MSE -> MET) or UNK\n        / N if a match is not found.\n\n    Returns:\n      A list of integers, one for each unique chain in the structure,\n      determining the number of that chain appearing in the structure. The\n      numbers are sorted highest to lowest. E.g. 
for an A3B2 protein this method\n      will return [3, 2].\n    \"\"\"\n    filtered = self.filter_to_entity_type(\n        protein=True,\n        rna=True,\n        dna=True,\n        dna_rna_hybrid=True,\n        ligand=True,\n        water=False,\n    )\n    seqs = filtered.chain_res_name_sequence(\n        include_missing_residues=True,\n        fix_non_standard_polymer_res=fix_non_standard_polymer_res,\n    )\n\n    unique_seq_counts = collections.Counter(seqs.values())\n    return sorted(unique_seq_counts.values(), reverse=True)\n\n  def without_hydrogen(self) -> Self:\n    \"\"\"Returns the structure without hydrogen atoms.\"\"\"\n    return self.filter(\n        np.logical_and(self._atoms.element != 'H', self._atoms.element != 'D')\n    )\n\n  def without_terminal_oxygens(self) -> Self:\n    \"\"\"Returns the structure without terminal oxygen atoms.\"\"\"\n    terminal_oxygen_filter = np.zeros(self.num_atoms, dtype=bool)\n    for chain_type, atom_name in mmcif_names.TERMINAL_OXYGENS.items():\n      chain_keys = self._chains.key[self._chains.type == chain_type]\n      chain_atom_filter = np.logical_and(\n          self._atoms.name == atom_name,\n          np.isin(self._atoms.chain_key, chain_keys),\n      )\n      np.logical_or(\n          terminal_oxygen_filter, chain_atom_filter, out=terminal_oxygen_filter\n      )\n    return self.filter_out(terminal_oxygen_filter)\n\n  def reset_author_naming_scheme(self) -> Self:\n    \"\"\"Remove author chain/residue ids, entity info and use internal ids.\"\"\"\n    new_chains = structure_tables.Chains(\n        key=self._chains.key,\n        id=self._chains.id,\n        type=self._chains.type,\n        auth_asym_id=self._chains.id,\n        entity_id=np.arange(1, self.num_chains + 1).astype(str).astype(object),\n        entity_desc=np.full(self.num_chains, '.', dtype=object),\n    )\n    new_residues = structure_tables.Residues(\n        key=self._residues.key,\n        chain_key=self._residues.chain_key,\n        
id=self._residues.id,\n        name=self._residues.name,\n        auth_seq_id=self._residues.id.astype(str).astype(object),\n        insertion_code=np.full(\n            self.num_residues(count_unresolved=True), '?', dtype=object\n        ),\n    )\n    return self.copy_and_update(\n        chains=new_chains, residues=new_residues, skip_validation=True\n    )\n\n  def filter_residues(self, res_mask: np.ndarray) -> Self:\n    \"\"\"Filter resolved residues using a boolean mask.\"\"\"\n    required_shape = (self.num_residues(count_unresolved=False),)\n    if res_mask.shape != required_shape:\n      raise ValueError(\n          f'res_mask must have shape {required_shape}. Got: {res_mask.shape}.'\n      )\n    if res_mask.dtype != bool:\n      raise ValueError(f'res_mask must have dtype bool. Got: {res_mask.dtype}.')\n\n    filtered_residues = self.present_residues.filter(res_mask)\n    atom_mask = np.isin(self._atoms.res_key, filtered_residues.key)\n    return self.filter(atom_mask)\n\n  def filter_coords(\n      self, coord_predicate: Callable[[np.ndarray], bool]\n  ) -> Self:\n    \"\"\"Filter a structure's atoms by a function of their coordinates.\n\n    Args:\n      coord_predicate: A boolean function of coordinate vectors (shape (3,)).\n\n    Returns:\n      A Structure filtered so that only atoms with coords passing the predicate\n      function are present.\n\n    Raises:\n      ValueError: If the coords are not shaped (num_atom, 3).\n    \"\"\"\n    coords = self.coords\n    if coords.ndim != 2 or coords.shape[-1] != 3:\n      raise ValueError(\n          f'coords should have shape (num_atom, 3). 
Got {coords.shape}.'\n      )\n    mask = np.vectorize(coord_predicate, signature='(n)->()')(coords)\n    # This use of _apply_atom_index_array is safe because a boolean mask is\n    # used, which means the chain/residue/atom ordering will stay unchanged.\n    return self._apply_atom_index_array(mask, skip_validation=True)\n\n  def filter_polymers_to_single_atom_per_res(\n      self,\n      representative_atom_by_chain_type: Mapping[\n          str, str\n      ] = mmcif_names.RESIDUE_REPRESENTATIVE_ATOMS,\n  ) -> Self:\n    \"\"\"Filter to one representative atom per polymer residue, ligands unchanged.\n\n    Args:\n      representative_atom_by_chain_type: Chain type str to atom name, only atoms\n        with this name will be kept for this chain type. Chain types from the\n        structure not found in this mapping will keep all their atoms.\n\n    Returns:\n      A Structure filtered so that per chain type, only specified atoms are\n      present.\n    \"\"\"\n    polymer_chain_keys = self._chains.key[\n        string_array.isin(\n            self._chains.type, set(representative_atom_by_chain_type)\n        )\n    ]\n    polymer_atoms_mask = np.isin(self._atoms.chain_key, polymer_chain_keys)\n\n    wanted_atom_by_chain_key = {\n        chain_key: representative_atom_by_chain_type.get(chain_type, None)\n        for chain_key, chain_type in zip(self._chains.key, self._chains.type)\n    }\n    wanted_atoms = string_array.remap(\n        self._atoms.chain_key.astype(object), mapping=wanted_atom_by_chain_key\n    )\n\n    representative_polymer_atoms_mask = polymer_atoms_mask & (\n        wanted_atoms == self._atoms.name\n    )\n\n    return self.filter(representative_polymer_atoms_mask | ~polymer_atoms_mask)\n\n  def drop_non_standard_protein_atoms(self, *, drop_oxt: bool = True) -> Self:\n    \"\"\"Drops non-standard atom names from protein chains.\n\n    Args:\n      drop_oxt: If True, also drop terminal oxygens (OXT).\n\n    Returns:\n      A new Structure 
object where the protein chains have been filtered to\n        only contain atoms with names listed in `atom_types`\n        (including OXT unless `drop_oxt` is `True`). Non-protein chains are\n        unaltered.\n    \"\"\"\n    allowed_names = set(atom_types.ATOM37)\n    if drop_oxt:\n      allowed_names = {n for n in allowed_names if n != atom_types.OXT}\n\n    return self.filter_out(\n        chain_type=mmcif_names.PROTEIN_CHAIN,\n        atom_name=lambda n: string_array.isin(n, allowed_names, invert=True),\n    )\n\n  def drop_non_standard_atoms(\n      self,\n      *,\n      ccd: chemical_components.Ccd,\n      drop_unk: bool,\n      drop_non_ccd: bool,\n      drop_terminal_oxygens: bool = False,\n  ) -> Self:\n    \"\"\"Drops atoms that are not in the CCD for the given residue type.\"\"\"\n\n    # We don't remove any atoms in UNL, as it has no standard atoms.\n    def _keep(atom_index: int) -> bool:\n      atom_name = self._atoms.name[atom_index]\n      res_name = self._residues.name[\n          self._residues.index_by_key[self._atoms.res_key[atom_index]]\n      ]\n      if drop_unk and res_name in residue_names.UNKNOWN_TYPES:\n        return False\n      else:\n        return (\n            (not drop_non_ccd and not ccd.get(res_name))\n            or atom_name in struc_chem_comps.get_res_atom_names(ccd, res_name)\n            or res_name == residue_names.UNL\n        )\n\n    standard_atom_mask = np.array(\n        [_keep(atom_i) for atom_i in range(self.num_atoms)], dtype=bool\n    )\n    standard_atoms = self.filter(mask=standard_atom_mask)\n    if drop_terminal_oxygens:\n      standard_atoms = standard_atoms.without_terminal_oxygens()\n    return standard_atoms\n\n  def find_chains_with_unknown_sequence(self) -> Sequence[str]:\n    \"\"\"Returns a sequence of chain IDs that contain only unknown residues.\"\"\"\n    unknown_sequences = []\n    for start, end in self.iter_chain_ranges():\n      try:\n        unknown_id = 
residue_names.UNKNOWN_TYPES.index(self.res_name[start])\n        if start + 1 == end or np.all(\n            self.res_name[start + 1 : end]\n            == residue_names.UNKNOWN_TYPES[unknown_id]\n        ):\n          unknown_sequences.append(self.chain_id[start])\n      except ValueError:\n        pass\n    return unknown_sequences\n\n  def add_bonds(\n      self,\n      bonded_atom_pairs: Sequence[\n          tuple[tuple[str, int, str], tuple[str, int, str]],\n      ],\n      bond_type: str | None = None,\n  ) -> Self:\n    \"\"\"Returns a structure with new bonds added.\n\n    Args:\n      bonded_atom_pairs: A sequence of pairs of atoms, with one pair per bond.\n        Each element of the pair is a tuple of (chain_id, res_id, atom_name),\n        matching values from the respective fields of this structure. The first\n        element is the start atom, and the second atom is the end atom of the\n        bond.\n      bond_type: This type will be used for all bonds in the structure, where\n        type follows PDB scheme, e.g. unknown (?), hydrog, metalc, covale,\n        disulf.\n\n    Returns:\n      A copy of this structure with the new bonds added. If this structure has\n      bonds already then the new bonds are concatenated onto the end of the\n      old bonds. NB: bonds are not deduplicated.\n    \"\"\"\n    atom_key_lookup: dict[tuple[str, str, None, str], int] = dict(\n        zip(self.atom_ids, self._atoms.key, strict=True)\n    )\n\n    # iter_atoms returns a 4-tuple (chain_id, res_id, ins_code, atom_name) but\n    # the insertion code is always None. 
It also uses string residue IDs.\n    def _to_internal_res_id(\n        bonded_atom_id: tuple[str, int, str],\n    ) -> tuple[str, str, None, str]:\n      return bonded_atom_id[0], str(bonded_atom_id[1]), None, bonded_atom_id[2]\n\n    from_atom_key = []\n    dest_atom_key = []\n    for from_atom, dest_atom in bonded_atom_pairs:\n      from_atom_key.append(atom_key_lookup[_to_internal_res_id(from_atom)])\n      dest_atom_key.append(atom_key_lookup[_to_internal_res_id(dest_atom)])\n    num_bonds = len(bonded_atom_pairs)\n    bonds_key = np.arange(num_bonds, dtype=np.int64)\n    from_atom_key = np.array(from_atom_key, dtype=np.int64)\n    dest_atom_key = np.array(dest_atom_key, dtype=np.int64)\n    all_unk_col = np.array(['?'] * num_bonds, dtype=object)\n    if bond_type is None:\n      bond_type_col = all_unk_col\n    else:\n      bond_type_col = np.full((num_bonds,), bond_type, dtype=object)\n\n    max_key = -1 if not self._bonds.size else np.max(self._bonds.key)\n    new_bonds = structure_tables.Bonds(\n        key=np.concatenate([self._bonds.key, bonds_key + max_key + 1]),\n        from_atom_key=np.concatenate(\n            [self._bonds.from_atom_key, from_atom_key]\n        ),\n        dest_atom_key=np.concatenate(\n            [self._bonds.dest_atom_key, dest_atom_key]\n        ),\n        type=np.concatenate([self._bonds.type, bond_type_col]),\n        role=np.concatenate([self._bonds.role, all_unk_col]),\n    )\n    return self.copy_and_update(bonds=new_bonds)\n\n  @property\n  def coords(self) -> np.ndarray:\n    \"\"\"A [..., num_atom, 3] shaped array of atom coordinates.\"\"\"\n    return np.stack([self._atoms.x, self._atoms.y, self._atoms.z], axis=-1)\n\n  def chain_single_letter_sequence(\n      self, include_missing_residues: bool = True\n  ) -> Mapping[str, str]:\n    \"\"\"Returns a mapping from chain ID to a single letter residue sequence.\n\n    Args:\n      include_missing_residues: Whether to include residues that have no atoms.\n    \"\"\"\n    
res_table = (\n        self._residues if include_missing_residues else self.present_residues\n    )\n    residue_chain_boundaries = _get_change_indices(res_table.chain_key)\n    boundaries = self._iter_residue_ranges(\n        residue_chain_boundaries,\n        count_unresolved=include_missing_residues,\n    )\n    chain_keys = res_table.chain_key[residue_chain_boundaries]\n    chain_ids = self._chains.apply_array_to_column('id', chain_keys)\n    chain_types = self._chains.apply_array_to_column('type', chain_keys)\n    chain_seqs = {}\n    for idx, (start, end) in enumerate(boundaries):\n      chain_id = chain_ids[idx]\n      chain_type = chain_types[idx]\n      chain_res = res_table.name[start:end]\n      if chain_type in mmcif_names.PEPTIDE_CHAIN_TYPES:\n        unknown_default = 'X'\n      elif chain_type in mmcif_names.NUCLEIC_ACID_CHAIN_TYPES:\n        unknown_default = 'N'\n      else:\n        chain_seqs[chain_id] = 'X' * chain_res.size\n        continue\n\n      chain_res = string_array.remap(\n          chain_res,\n          mapping=residue_names.CCD_NAME_TO_ONE_LETTER,\n          inplace=False,\n          default_value=unknown_default,\n      )\n      chain_seqs[chain_id] = ''.join(chain_res.tolist())\n\n    return chain_seqs\n\n  def polymer_auth_asym_id_to_label_asym_id(\n      self,\n      *,\n      protein: bool = True,\n      rna: bool = True,\n      dna: bool = True,\n      other: bool = True,\n  ) -> Mapping[str, str]:\n    \"\"\"Mapping from author chain ID to internal chain ID, polymers only.\n\n    This mapping is well defined only for polymers (protein, DNA, RNA), but not\n    for ligands or water.\n\n    E.g. 
if a structure had the following internal chain IDs (label_asym_id):\n      A (protein), B (DNA), C (ligand bound to A), D (ligand bound to A),\n      E (ligand bound to B).\n\n    Such structure would have this internal chain ID (label_asym_id) -> author\n    chain ID (auth_asym_id) mapping:\n      A -> A, B -> B, C -> A, D -> A, E -> B\n\n    This is a bijection only for polymers (A, B), but not for ligands.\n\n    Args:\n      protein: Whether to include protein (polypeptide(L)) chains.\n      rna: Whether to include RNA chains.\n      dna: Whether to include DNA chains.\n      other: Whether to include other polymer chains, e.g. RNA/DNA hybrid or\n        polypeptide(D). Note that include_other=True must be set in from_mmcif.\n\n    Returns:\n      A mapping from author chain ID to the internal (label) chain ID for the\n      given polymer types in the Structure, ligands/water are ignored.\n\n    Raises:\n      ValueError: If the mapping from internal chain IDs to author chain IDs is\n        not a bijection for polymer chains.\n    \"\"\"\n    allowed_types = set()\n    if protein:\n      allowed_types.add(mmcif_names.PROTEIN_CHAIN)\n    if rna:\n      allowed_types.add(mmcif_names.RNA_CHAIN)\n    if dna:\n      allowed_types.add(mmcif_names.DNA_CHAIN)\n    if other:\n      non_standard_chain_types = (\n          mmcif_names.POLYMER_CHAIN_TYPES\n          - mmcif_names.STANDARD_POLYMER_CHAIN_TYPES\n      )\n      allowed_types |= non_standard_chain_types\n\n    auth_asym_id_to_label_asym_id = {}\n    for chain in self.iter_chains():\n      if chain['chain_type'] not in allowed_types:\n        continue\n      label_asym_id = chain['chain_id']\n      auth_asym_id = chain['chain_auth_asym_id']\n      # The mapping from author chain id to label chain id is only one-to-one if\n      # we restrict our attention to polymers. 
But check nevertheless.\n      if auth_asym_id in auth_asym_id_to_label_asym_id:\n        raise ValueError(\n            f'Author chain ID \"{auth_asym_id}\" does not have a unique mapping '\n            f'to internal chain ID \"{label_asym_id}\", it is already mapped to '\n            f'\"{auth_asym_id_to_label_asym_id[auth_asym_id]}\".'\n        )\n      auth_asym_id_to_label_asym_id[auth_asym_id] = label_asym_id\n\n    return auth_asym_id_to_label_asym_id\n\n  def polymer_author_chain_single_letter_sequence(\n      self,\n      *,\n      include_missing_residues: bool = True,\n      protein: bool = True,\n      rna: bool = True,\n      dna: bool = True,\n      other: bool = True,\n  ) -> Mapping[str, str]:\n    \"\"\"Mapping from author chain ID to single letter aa sequence, polymers only.\n\n    This mapping is well defined only for polymers (protein, DNA, RNA), but not\n    for ligands or water.\n\n    Args:\n      include_missing_residues: If True then all residues will be returned for\n        each polymer chain present in the structure. This uses the all_residues\n        field and will include residues missing due to filtering operations as\n        well as e.g. unresolved residues specified in an mmCIF header.\n      protein: Whether to include protein (polypeptide(L)) chains.\n      rna: Whether to include RNA chains.\n      dna: Whether to include DNA chains.\n      other: Whether to include other polymer chains, e.g. RNA/DNA hybrid or\n        polypeptide(D). 
Note that include_other=True must be set in from_mmcif.\n\n    Returns:\n      A mapping from (author) chain IDs to their single-letter sequences for all\n      polymers in the Structure, ligands/water are ignored.\n\n    Raises:\n      ValueError: If the mapping from internal chain IDs to author chain IDs is\n        not a bijection for polymer chains.\n    \"\"\"\n    label_chain_id_to_seq = self.chain_single_letter_sequence(\n        include_missing_residues=include_missing_residues\n    )\n    auth_to_label = self.polymer_auth_asym_id_to_label_asym_id(\n        protein=protein, rna=rna, dna=dna, other=other\n    )\n    return {\n        auth: label_chain_id_to_seq[label]\n        for auth, label in auth_to_label.items()\n    }\n\n  def chain_res_name_sequence(\n      self,\n      *,\n      include_missing_residues: bool = True,\n      fix_non_standard_polymer_res: bool = False,\n  ) -> Mapping[str, Sequence[str]]:\n    \"\"\"A mapping from internal chain ID to a sequence of residue names.\n\n    The residue names are the full residue names rather than single letter\n    codes. For instance, for proteins these are the 3 letter CCD codes.\n\n    Args:\n      include_missing_residues: Whether to include residues with no atoms in the\n        returned sequences.\n      fix_non_standard_polymer_res: Whether to map non standard residues in\n        protein / RNA / DNA chains to standard residues (e.g. 
MSE -> MET) or UNK\n        / N if a match is not found.\n\n    Returns:\n      A mapping from (internal) chain IDs to a sequence of residue names.\n    \"\"\"\n    res_table = (\n        self._residues if include_missing_residues else self.present_residues\n    )\n    residue_chain_boundaries = _get_change_indices(res_table.chain_key)\n    boundaries = self._iter_residue_ranges(\n        residue_chain_boundaries, count_unresolved=include_missing_residues\n    )\n    chain_keys = res_table.chain_key[residue_chain_boundaries]\n    chain_ids = self._chains.apply_array_to_column('id', chain_keys)\n    chain_types = self._chains.apply_array_to_column('type', chain_keys)\n    chain_seqs = {}\n    for idx, (start, end) in enumerate(boundaries):\n      chain_id = chain_ids[idx]\n      chain_type = chain_types[idx]\n      chain_res = res_table.name[start:end]\n      if (\n          fix_non_standard_polymer_res\n          and chain_type in mmcif_names.POLYMER_CHAIN_TYPES\n      ):\n        chain_seqs[chain_id] = tuple(\n            fix_non_standard_polymer_residues(\n                res_names=chain_res, chain_type=chain_type\n            )\n        )\n      else:\n        chain_seqs[chain_id] = tuple(chain_res)\n\n    return chain_seqs\n\n  def fix_non_standard_polymer_res(\n      self,\n      res_mapper: Callable[\n          [np.ndarray, str], np.ndarray\n      ] = fix_non_standard_polymer_residues,\n  ) -> Self:\n    \"\"\"Replaces non-standard polymer residues with standard alternatives or UNK.\n\n    e.g. maps 'ACE' -> 'UNK', 'MSE' -> 'MET'.\n\n    NB: Only fixes the residue names, but does not fix the atom names.\n    E.g., 'MSE' will be renamed to 'MET' but its 'SE' atom will not be renamed\n    to 'S'. Fixing MSE should be done during conversion from mmcif with the\n    `fix_mse_residues` flag.\n\n    Args:\n      res_mapper: An optional function that accepts a numpy array of residue\n        names and chain_type, and returns an array with fixed res_names. 
This\n        defaults to fix_non_standard_polymer_residues.\n\n    Returns:\n      A Structure containing only standard residue types (or 'UNK') in its\n      polymer chains.\n    \"\"\"\n    fixed_res_name = self._residues.name.copy()\n    chain_change_indices = _get_change_indices(self._residues.chain_key)\n    for start, end in self._iter_atom_ranges(chain_change_indices):\n      chain_key = self._residues.chain_key[start]\n      chain_type = self._chains.type[self._chains.index_by_key[chain_key]]\n      if chain_type not in mmcif_names.POLYMER_CHAIN_TYPES:\n        continue  # We don't need to change anything for non-polymers.\n      fixed_res_name[start:end] = res_mapper(\n          fixed_res_name[start:end], chain_type\n      )\n    fixed_residues = self._residues.copy_and_update(name=fixed_res_name)\n    return self.copy_and_update(residues=fixed_residues, skip_validation=True)\n\n  @property\n  def slice_leading_dims(self) -> '_LeadingDimSlice':\n    \"\"\"Used to create a new Structure by slicing into the leading dimensions.\n\n    Example usage 1:\n\n    ```\n    final_state = multi_state_struc.slice_leading_dims[-1]\n    ```\n\n    Example usage 2:\n\n    ```\n    # Structure has leading batch and time dimensions.\n    # Get final 3 time frames from first two batch elements.\n    sliced_strucs = batched_trajectories.slice_leading_dims[:2, -3:]\n    ```\n    \"\"\"\n    return _LeadingDimSlice(self)\n\n  def unstack(self, axis: int = 0) -> Sequence[Self]:\n    \"\"\"Unstacks a multi-model structure into a list of Structures.\n\n    This method is the inverse of `stack`.\n\n    Example usage:\n    ```\n    strucs = multi_dim_struc.unstack(axis=0)\n    ```\n\n    Args:\n      axis: The axis to unstack over. 
The structures in the returned list won't\n        have this axis in their coordinate or b-factor fields.\n\n    Returns:\n      A list of `Structure`s with length equal to the size of the specified\n      axis in the coordinate field arrays.\n\n    Raises:\n      IndexError: If axis does not refer to one of the leading dimensions of\n        `self.atoms_table.size`.\n    \"\"\"\n    ndim = self._atoms.ndim\n    if not (-ndim <= axis < ndim):\n      raise IndexError(\n          f'{axis=} is out of range for atom coordinate fields with {ndim=}.'\n      )\n    elif axis < 0:\n      axis += ndim\n    if axis == ndim - 1:\n      raise IndexError(\n          'axis must refer to one of the leading dimensions, not the final '\n          f'dimension. The atom fields have {ndim=} and {axis=} was specified.'\n      )\n    unstacked = []\n    leading_dim_slice = self.slice_leading_dims  # Compute once here.\n    for i in range(self._atoms.shape[axis]):\n      slice_i = (slice(None),) * axis + (i,)\n      unstacked.append(leading_dim_slice[slice_i])\n    return unstacked\n\n  def split_by_chain(self) -> Sequence[Self]:\n    \"\"\"Splits a Structure into single-chain Structures, one for each chain.\n\n    The obtained structures can be merged back together into the original\n    structure using the `concat` function.\n\n    Returns:\n      A list of `Structure`s, one for each chain. The order is the same as the\n      chain order in the original Structure.\n    \"\"\"\n    return [self.filter(chain_id=chain_id) for chain_id in self.chains]\n\n  def transform_states_to_chains(self) -> Self:\n    \"\"\"Transforms states to chains.\n\n    A multi-state protein structure will be transformed to a multi-chain\n    single-state protein structure. Useful for visualising multiple states to\n    examine diversity. 
This structure's coordinate fields must have shape\n    `(num_states, num_atoms)`.\n\n    Returns:\n      A new `Structure`, based on this structure, but with the multiple states\n      now represented as `num_states * num_chains` chains in a\n      single-state protein.\n\n    Raises:\n      ValueError: If this structure's array fields don't have shape\n        `(num_states, num_atoms)`.\n    \"\"\"\n    if self._atoms.ndim != 2:\n      raise ValueError(\n          'Coordinate field tensor must have 2 dimensions: '\n          f'(num_states, num_atoms), got {self._atoms.ndim}.'\n      )\n    return concat(self.unstack(axis=0))\n\n  def merge_chains(\n      self,\n      *,\n      chain_groups: Sequence[Sequence[str]],\n      chain_group_ids: Sequence[str] | None = None,\n      chain_group_types: Sequence[str] | None = None,\n      chain_group_entity_ids: Sequence[str] | None = None,\n  ) -> Self:\n    \"\"\"Merges chains in each group into a single chain.\n\n    If a Structure has chains A, B, C, D, E, and\n    `merge_chains([[A, C], [B, D], [E]])` is called, the new Structure will have\n    3 chains A, B, C, the first being concatenation of A+C, the second B+D, the\n    third just the original chain E.\n\n    Args:\n      chain_groups: Each group defines what chains should be merged into a\n        single chain. The output structure will therefore have len(chain_groups)\n        chains. Residue IDs (label and author) are renumbered to preserve\n        uniqueness within new chains. Order of chain groups and within each\n        group matters.\n      chain_group_ids: Optional sequence of new chain IDs for each group. If not\n        given, the new internal chain IDs (label_asym_id) are assigned in the\n        standard mmCIF order (i.e. A, B, ..., Z, AA, BA, CA, ...). Author chain\n        names (auth_asym_id) are set to be equal to the new internal chain IDs.\n      chain_group_types: Optional sequence of new chain types for each group. 
If\n        not given, only chains with the same type can be merged.\n      chain_group_entity_ids: Optional sequence of new entity IDs for each\n        group. If not given, the new internal entity IDs (entity_id) are\n        assigned in the standard mmCIF order (i.e. 1, 2, 3, ...). Entity\n        descriptions (entity_desc) are set to '.' for each chain.\n\n    Returns:\n      A new `Structure` with chains merged together into a single chain within\n      each chain group.\n\n    Raises:\n      ValueError: If chain_group_ids or chain_group_types are given but don't\n        match the length of chain_groups.\n      ValueError: If the chain IDs in the flattened chain_groups don't match the\n        chain IDs in the Structure.\n      ValueError: If chains in any of the groups don't have the same chain type.\n    \"\"\"\n    if chain_group_ids and len(chain_group_ids) != len(chain_groups):\n      raise ValueError(\n          'chain_group_ids must the same length as chain_groups: '\n          f'{len(chain_group_ids)=} != {len(chain_groups)=}'\n      )\n    if chain_group_types and len(chain_group_types) != len(chain_groups):\n      raise ValueError(\n          'chain_group_types must the same length as chain_groups: '\n          f'{len(chain_group_types)=} != {len(chain_groups)=}'\n      )\n    if chain_group_entity_ids and len(chain_group_entity_ids) != len(\n        chain_groups\n    ):\n      raise ValueError(\n          'chain_group_entity_ids must the same length as chain_groups: '\n          f'{len(chain_group_entity_ids)=} != {len(chain_groups)=}'\n      )\n\n    flattened = sorted(itertools.chain.from_iterable(chain_groups))\n    if flattened != sorted(self.chains):\n      raise ValueError(\n          'IDs in chain groups do not match Structure chain IDs: '\n          f'{chain_groups=}, chains={self.chains}'\n      )\n\n    new_chain_key_by_chain_id = {}\n    for new_chain_key, group_chain_ids in enumerate(chain_groups):\n      for chain_id in 
group_chain_ids:\n        new_chain_key_by_chain_id[chain_id] = new_chain_key\n\n    chain_key_remap = {}\n    new_chain_type_by_chain_key = {}\n    for old_chain_key, old_chain_id, old_chain_type in zip(\n        self._chains.key, self._chains.id, self._chains.type\n    ):\n      new_chain_key = new_chain_key_by_chain_id[old_chain_id]\n      chain_key_remap[old_chain_key] = new_chain_key\n\n      if new_chain_key not in new_chain_type_by_chain_key:\n        new_chain_type_by_chain_key[new_chain_key] = old_chain_type\n      elif not chain_group_types:\n        if new_chain_type_by_chain_key[new_chain_key] != old_chain_type:\n          bad_types = [\n              f'{cid}: {self._chains.type[np.where(self._chains.id == cid)][0]}'\n              for cid in chain_groups[new_chain_key]\n          ]\n          raise ValueError(\n              'Inconsistent chain types within group:\\n' + '\\n'.join(bad_types)\n          )\n\n    new_chain_key = np.arange(len(chain_groups), dtype=np.int64)\n    if chain_group_ids:\n      new_chain_id = np.array(chain_group_ids, dtype=object)\n    else:\n      new_chain_id = np.array(\n          [mmcif.int_id_to_str_id(k) for k in new_chain_key + 1], dtype=object\n      )\n    if chain_group_types:\n      new_chain_type = np.array(chain_group_types, dtype=object)\n    else:\n      new_chain_type = np.array(\n          [new_chain_type_by_chain_key[k] for k in new_chain_key], dtype=object\n      )\n    if chain_group_entity_ids:\n      new_chain_entity_id = np.array(chain_group_entity_ids, dtype=object)\n    else:\n      new_chain_entity_id = np.char.mod('%d', new_chain_key + 1).astype(object)\n    new_chains = structure_tables.Chains(\n        key=new_chain_key,\n        id=new_chain_id,\n        type=new_chain_type,\n        auth_asym_id=new_chain_id,\n        entity_id=new_chain_entity_id,\n        entity_desc=np.full(len(chain_groups), fill_value='.', dtype=object),\n    )\n\n    # Remap chain keys and sort residues to match the chain 
table order.\n    new_residues = self._residues.copy_and_remap(chain_key=chain_key_remap)\n    new_residues = new_residues.apply_index(\n        np.argsort(new_residues.chain_key, kind='stable')\n    )\n    # Renumber uniquely residues in each chain.\n    indices = np.arange(new_residues.chain_key.size, dtype=np.int32)\n    new_res_ids = (indices + 1) - np.maximum.accumulate(\n        indices * (new_residues.chain_key != np.roll(new_residues.chain_key, 1))\n    )\n    new_residues = new_residues.copy_and_update(\n        id=new_res_ids,\n        auth_seq_id=np.char.mod('%d', new_res_ids).astype(object),\n    )\n\n    # Remap chain keys and sort atoms to match the chain table order.\n    new_atoms = self._atoms.copy_and_remap(chain_key=chain_key_remap)\n    new_atoms = new_atoms.apply_index(\n        np.argsort(new_atoms.chain_key, kind='stable')\n    )\n\n    return self.copy_and_update(\n        chains=new_chains,\n        residues=new_residues,\n        atoms=new_atoms,\n        bonds=self._bonds,\n    )\n\n  def to_res_arrays(\n      self,\n      *,\n      include_missing_residues: bool,\n      atom_order: Mapping[str, int] = atom_types.ATOM37_ORDER,\n  ) -> ResArrays:\n    \"\"\"Returns atom-level information in arrays containing a num_res dimension.\n\n    NB: All residues in the structure will appear in the residue dimension but\n    atoms will only have a True (1.0) mask value if the residue + atom\n    combination is defined in `atom_order`. E.g. for the standard ATOM37_ORDER,\n    atoms are guaranteed to be present only for standard protein residues.\n\n    Args:\n      include_missing_residues: If True then the res arrays will include rows\n        for missing residues where all atoms will be masked out. Otherwise these\n        will simply be skipped.\n      atom_order: Atom order mapping atom names to their index in the atom\n        dimension of the returned arrays. 
Default is atom_order for proteins,\n        choose atom_types.ATOM29_ORDER for nucleics.\n\n    Returns:\n      A ResArrays object.\n    \"\"\"\n    num_res = self.num_residues(count_unresolved=include_missing_residues)\n    atom_type_num = len(atom_order)\n    atom_positions = np.zeros((num_res, atom_type_num, 3), dtype=np.float32)\n    atom_mask = np.zeros((num_res, atom_type_num), dtype=np.float32)\n    atom_b_factor = np.zeros((num_res, atom_type_num), dtype=np.float32)\n    atom_occupancy = np.zeros((num_res, atom_type_num), dtype=np.float32)\n\n    all_residues = None if not include_missing_residues else self.all_residues\n    for i, atom in enumerate_residues(self.iter_atoms(), all_residues):\n      atom_idx = atom_order.get(atom['atom_name'])\n      if atom_idx is not None:\n        atom_positions[i, atom_idx, 0] = atom['atom_x']\n        atom_positions[i, atom_idx, 1] = atom['atom_y']\n        atom_positions[i, atom_idx, 2] = atom['atom_z']\n        atom_mask[i, atom_idx] = 1.0\n        atom_b_factor[i, atom_idx] = atom['atom_b_factor']\n        atom_occupancy[i, atom_idx] = atom['atom_occupancy']\n\n    return ResArrays(\n        atom_positions=atom_positions,\n        atom_mask=atom_mask,\n        atom_b_factor=atom_b_factor,\n        atom_occupancy=atom_occupancy,\n    )\n\n  def to_res_atom_lists(\n      self, *, include_missing_residues: bool\n  ) -> Sequence[Sequence[Mapping[str, Any]]]:\n    \"\"\"Returns list of atom dictionaries grouped by residue.\n\n    If this is a multi-model structure, each atom will store its fields\n    atom_x, atom_y, atom_z, and atom_b_factor as Numpy arrays of shape of the\n    leading dimension(s). If this is a single-mode structure, these fields will\n    just be scalars.\n\n    Args:\n      include_missing_residues: If True, then the output list will contain an\n        empty list of atoms for missing residues. 
Otherwise missing residues\n        will simply be skipped.\n\n    Returns:\n      A list of size `num_res`. Each element in the list represents atoms of one\n      residue. If a residue is present, the list will contain an atom\n      dictionary for every atom present in that residue. If a residue is missing\n      and `include_missing_residues=True`, the list for that missing residue\n      will be empty.\n    \"\"\"\n    num_res = self.num_residues(count_unresolved=include_missing_residues)\n    residue_atoms = [[] for _ in range(num_res)]\n    all_residues = None if not include_missing_residues else self.all_residues\n\n    # We could yield directly in this loop but the code would be more complex.\n    # Let's optimise if memory usage is an issue.\n    for res_index, atom in enumerate_residues(self.iter_atoms(), all_residues):\n      residue_atoms[res_index].append(atom)\n\n    return residue_atoms\n\n  def reorder_chains(self, new_order: Sequence[str]) -> Self:\n    \"\"\"Reorders tables so that the label_asym_ids are in the given order.\n\n    This method changes the order of the chains, residues, and atoms tables so\n    that they are all consistent with each other. 
Moreover, it remaps chain keys\n    so that they stay monotonically increasing in chains/residues/atoms tables.\n\n    Args:\n      new_order: The order in which the chain IDs (label_asym_id) should be.\n        This must be a permutation of the current chain IDs.\n\n    Returns:\n      A structure with chains reordered.\n    \"\"\"\n    if len(new_order) != len(self.chains):\n      raise ValueError(\n          f'The new number of chains ({len(new_order)}) does not match the '\n          f'current number of chains ({len(self.chains)}).'\n      )\n    new_chain_set = set(new_order)\n    if len(new_chain_set) != len(new_order):\n      raise ValueError(f'The new order {new_order} contains non-unique IDs.')\n    if new_chain_set.symmetric_difference(set(self.chains)):\n      raise ValueError(\n          f'New chain IDs {new_order} do not match the old {set(self.chains)}'\n      )\n\n    if self.chains == tuple(new_order):\n      return self  # Shortcut: the new order is the same as the current one.\n\n    desired_chain_id_pos = {chain_id: i for i, chain_id in enumerate(new_order)}\n\n    current_chain_index_order = np.empty(self.num_chains, dtype=np.int64)\n    for index, old_chain_id in enumerate(self._chains.id):\n      current_chain_index_order[index] = desired_chain_id_pos[old_chain_id]\n    chain_reorder = np.argsort(current_chain_index_order, kind='stable')\n    chain_key_map = dict(\n        zip(self._chains.key[chain_reorder], range(self.num_chains))\n    )\n    chains = self._chains.apply_index(chain_reorder)\n    chains = chains.copy_and_remap(key=chain_key_map)\n\n    # The stable sort keeps the original residue ordering within each chain.\n    residues = self._residues.copy_and_remap(chain_key=chain_key_map)\n    residue_reorder = np.argsort(residues.chain_key, kind='stable')\n    residues = residues.apply_index(residue_reorder)\n\n    # The stable sort keeps the original atom ordering within each chain.\n    atoms = 
self._atoms.copy_and_remap(chain_key=chain_key_map)\n    atoms_reorder = np.argsort(atoms.chain_key, kind='stable')\n    atoms = atoms.apply_index(atoms_reorder)\n\n    # Bonds unchanged - each references 2 atom keys, hence ordering not defined.\n    return self.copy_and_update(chains=chains, residues=residues, atoms=atoms)\n\n  def rename_auth_asym_ids(self, new_id_by_old_id: Mapping[str, str]) -> Self:\n    \"\"\"Returns a new structure with renamed author chain IDs (auth_asym_ids).\n\n    Args:\n      new_id_by_old_id: A mapping from original auth_asym_ids to their new\n        values. Any auth_asym_ids in this structure that are not in the mapping\n        will remain unchanged.\n\n    Raises:\n      ValueError: If any two previously distinct polymer chains do not have\n        unique names anymore after the rename.\n    \"\"\"\n    mapped_chains = self._chains.copy_and_remap(auth_asym_id=new_id_by_old_id)\n    mapped_polymer_ids = mapped_chains.filter(\n        type=mmcif_names.POLYMER_CHAIN_TYPES\n    ).auth_asym_id\n    if len(mapped_polymer_ids) != len(set(mapped_polymer_ids)):\n      raise ValueError(\n          'The new polymer auth_asym_ids are not unique:'\n          f' {sorted(mapped_polymer_ids)}.'\n      )\n    return self.copy_and_update(chains=mapped_chains, skip_validation=True)\n\n  def rename_chain_ids(self, new_id_by_old_id: Mapping[str, str]) -> Self:\n    \"\"\"Returns a new structure with renamed chain IDs (label_asym_ids).\n\n    The chains' auth_asym_ids will be updated to be identical to the chain ID\n    since there isn't one unambiguous way to maintain the auth_asym_ids after\n    renaming the chain IDs (depending on whether you view the auth_asym_id as\n    more strongly associated with a given physical chain, or with a given\n    chain ID).\n\n    The residues' auth_seq_id will be updated to be identical to the residue ID\n    since they are strongly tied to the original author chain naming and keeping\n    them would be 
misleading.\n\n    Args:\n      new_id_by_old_id: A mapping from original chain ID to their new values.\n        Any chain IDs in this structure that are not in this mapping will remain\n        unchanged.\n\n    Returns:\n      A new structure with renamed chains (and bioassembly data if it is\n      present).\n\n    Raises:\n      ValueError: If any two previously distinct chains do not have unique names\n        anymore after the rename.\n    \"\"\"\n    new_chain_id = string_array.remap(self._chains.id, new_id_by_old_id)\n    if len(new_chain_id) != len(set(new_chain_id)):\n      raise ValueError(f\"New chain names aren't unique: {sorted(new_chain_id)}\")\n\n    # Map label_asym_ids in the bioassembly data.\n    if self._bioassembly_data is None:\n      new_bioassembly_data = None\n    else:\n      new_bioassembly_data = self._bioassembly_data.rename_label_asym_ids(\n          new_id_by_old_id, present_chains=set(self.present_chains.id)\n      )\n\n    # Set author residue IDs to be the string version of internal residue IDs.\n    new_residues = self._residues.copy_and_update(\n        auth_seq_id=self._residues.id.astype(str).astype(object)\n    )\n\n    new_chains = self._chains.copy_and_update(\n        id=new_chain_id, auth_asym_id=new_chain_id\n    )\n\n    return self.copy_and_update(\n        bioassembly_data=new_bioassembly_data,\n        chains=new_chains,\n        residues=new_residues,\n        skip_validation=True,\n    )\n\n  @functools.cached_property\n  def chains(self) -> tuple[str, ...]:\n    \"\"\"Ordered internal chain IDs (label_asym_id) present in the Structure.\"\"\"\n    return tuple(self._chains.id)\n\n  def rename_res_name(\n      self,\n      res_name_map: Mapping[str, str],\n      fail_if_not_found: bool = True,\n  ) -> Self:\n    \"\"\"Returns a copy of this structure with residues renamed.\n\n    Residue names in chemical components data will also be renamed.\n\n    Args:\n      res_name_map: A mapping from old residue names to new 
residue names. Any\n        residues that are not in this mapping will be left unchanged.\n      fail_if_not_found: Whether to fail if keys in the res_name_map mapping are\n        not found in this structure's residues' `name` column.\n\n    Raises:\n      ValueError: If `fail_if_not_found=True` and a residue name isn't found in\n        the residues table's `name` field.\n    \"\"\"\n    res_name_set = set(self._residues.name)\n    if fail_if_not_found:\n      for res_name in res_name_map:\n        if res_name not in res_name_set:\n          raise ValueError(f'\"{res_name}\" not found in this structure.')\n    new_residues = self._residues.copy_and_remap(name=res_name_map)\n\n    if self._chemical_components_data is not None:\n      chem_comp = {\n          res_name_map.get(res_name, res_name): data\n          for res_name, data in self._chemical_components_data.chem_comp.items()\n      }\n      new_chem_comp = struc_chem_comps.ChemicalComponentsData(chem_comp)\n    else:\n      new_chem_comp = None\n\n    return self.copy_and_update(\n        residues=new_residues,\n        chemical_components_data=new_chem_comp,\n        skip_validation=True,\n    )\n\n  def remap_res_id(self, res_id_map: Mapping[str, Mapping[int, int]]) -> Self:\n    \"\"\"Returns a copy of this structure with residue IDs remapped.\n\n    Example structure with 2 chains:\n    Chain A: residues 1, 2, 3; chain B: residues 6, 7, 8\n    res_id_map: {'A': {1: 1, 2: 5, 3: 6}, 'B': {6: 1, 7: 2, 8: 8}}\n    Will result in:\n    Chain A: residues 1, 5, 6; chain B: residues 1, 2, 8\n\n    Args:\n      res_id_map: A mapping from internal chain ID to a mapping from old residue\n        ID to new residue ID. 
A mapping must be provided for each residue in\n        each chain.\n\n    Raises:\n      KeyError: If residue ID in a given chain is not found in the mapping for\n        that chain.\n      ValueError: If residue IDs are not unique in each chain after remapping.\n    \"\"\"\n    chain_ids = self._chains.apply_array_to_column(\n        column_name='id', arr=self._residues.chain_key\n    )\n    flat_res_id_map = {}\n    for chain_id, chain_res_id_map in res_id_map.items():\n      flat_res_id_map.update({\n          (chain_id, old_res_id): new_res_id\n          for old_res_id, new_res_id in chain_res_id_map.items()\n      })\n\n    try:\n      new_res_id = string_array.remap_multiple(\n          (chain_ids, self._residues.id), flat_res_id_map\n      )\n    except KeyError as e:\n      raise KeyError(\n          f'Could not find new residue ID for residue {e} in {res_id_map=}'\n      ) from e\n\n    residue_chain_boundaries = _get_change_indices(self._residues.chain_key)\n    res_boundaries = self._iter_residue_ranges(\n        residue_chain_boundaries, count_unresolved=True\n    )\n    for idx, (start, end) in enumerate(res_boundaries):\n      chain_id = chain_ids[idx]\n      chain_res_ids = new_res_id[start:end]\n      if len(chain_res_ids) != len(set(chain_res_ids)):\n        raise ValueError(\n            f'New residue IDs not unique in chain {chain_id}: {chain_res_ids}'\n        )\n\n    return self.copy_and_update(\n        residues=self._residues.copy_and_update(id=new_res_id.astype(np.int32)),\n        skip_validation=True,\n    )\n\n  def rename_chains_to_match(\n      self,\n      other: 'Structure',\n      *,\n      fuzzy_match_non_standard_res: bool = True,\n  ) -> Self:\n    \"\"\"Returns a new structure with renamed chains to match another's.\n\n    Example:\n    This structure has chains: {'A': 'DEEP', 'B': 'MIND', 'C': 'MIND'}\n    Other structure has chains: {'X': 'DEEP', 'Z': 'MIND', 'Y': 'MIND'}\n\n    After calling this method, you will get a 
structure that has chains named:\n    {'X': 'DEEP', 'Z': 'MIND', 'Y': 'MIND'}\n\n    Args:\n      other: Another `Structure`. This provides the reference chain names that\n        are used to rename this structure's chains.\n      fuzzy_match_non_standard_res: If True, protein/RNA/DNA chains with the\n        same one letter sequence will be matched. e.g. \"MET-MET-UNK1\" will match\n        \"MET-MSE-UNK2\", since both will be mapped to \"MMX\". If False, we require\n        the full res_names to match.\n\n    Returns:\n      A new `Structure`, based on this structure, which has chains renamed to\n      match the other structure.\n    \"\"\"\n    sequences = self.chain_res_name_sequence(\n        include_missing_residues=True,\n        fix_non_standard_polymer_res=fuzzy_match_non_standard_res,\n    )\n\n    other_sequences = other.chain_res_name_sequence(\n        include_missing_residues=True,\n        fix_non_standard_polymer_res=fuzzy_match_non_standard_res,\n    )\n\n    # Check that the sequences are the same.\n    sequence_counts = collections.Counter(sequences.values())\n    other_sequence_counts = collections.Counter(other_sequences.values())\n    if other_sequence_counts != sequence_counts:\n      raise ValueError(\n          'The other structure does not have the same sequences\\n'\n          f' other: {other_sequence_counts}\\n self: {sequence_counts}'\n      )\n\n    new_decoy_id_by_old_id = {}\n    used_chain_ids = set()\n    # Sort self keys and take min over other to make matching deterministic.\n    # The matching is arbitrary but this helps debugging.\n    for self_chain_id, self_seq in sorted(sequences.items()):\n      # Find corresponding chains in the other structure.\n      other_chain_id = min(\n          k\n          for k, v in other_sequences.items()\n          if v == self_seq and k not in used_chain_ids\n      )\n\n      new_decoy_id_by_old_id[self_chain_id] = other_chain_id\n      used_chain_ids.add(other_chain_id)\n\n    return 
self.rename_chain_ids(new_decoy_id_by_old_id)\n\n  def _apply_bioassembly_transform(\n      self, transform: bioassemblies.Transform\n  ) -> Self:\n    \"\"\"Applies a bioassembly transform to this structure.\"\"\"\n    base_struc = self.filter(chain_id=transform.chain_ids)\n    transformed_atoms = base_struc.atoms_table.copy_and_update_coords(\n        transform.apply_to_coords(base_struc.coords)\n    )\n    transformed_chains = base_struc.chains_table.copy_and_remap(\n        id=transform.chain_id_rename_map\n    )\n    # Set the transformed author chain ID to match the label chain ID.\n    transformed_chains = transformed_chains.copy_and_update(\n        auth_asym_id=transformed_chains.id\n    )\n    return base_struc.copy_and_update(\n        chains=transformed_chains,\n        atoms=transformed_atoms,\n        skip_validation=True,\n    )\n\n  def generate_bioassembly(self, assembly_id: str | None = None) -> Self:\n    \"\"\"Generates a biological assembly as a new `Structure`.\n\n    When no assembly ID is provided this method produces a default assembly.\n    If this structure has no `bioassembly_data` then this returns itself\n    unchanged. Otherwise a default assembly ID is picked with\n    `BioassemblyData.get_default_assembly_id()`.\n\n    Args:\n      assembly_id: The assembly ID to generate, or None to generate a default\n        bioassembly.\n\n    Returns:\n      A new `Structure`, based on this one, representing the specified\n      bioassembly. 
Note that if the bioassembly contains copies of chains\n      in the original structure then they will be given new unique chain IDs.\n\n    Raises:\n      ValueError: If this structure's `bioassembly_data` is `None` and\n      `assembly_id` is not `None`.\n    \"\"\"\n    if self._bioassembly_data is None:\n      if assembly_id is None:\n        return self\n      else:\n        raise ValueError(\n            f'Unset bioassembly_data, cannot generate assembly {assembly_id}'\n        )\n\n    if assembly_id is None:\n      assembly_id = self._bioassembly_data.get_default_assembly_id()\n\n    transformed_strucs = [\n        self._apply_bioassembly_transform(transform)\n        for transform in self._bioassembly_data.get_transforms(assembly_id)\n    ]\n\n    # We don't need to assign unique chain IDs because the bioassembly\n    # transform takes care of remapping chain IDs to be unique.\n    concatenated = concat(\n        transformed_strucs,\n        assign_unique_chain_ids=False,\n        assign_unique_entity_ids=False,\n    )\n\n    # Copy over all scalar fields (e.g. name, release date, etc.) 
other than\n    # bioassembly_data because it relates only to the pre-transformed structure.\n    return concatenated.copy_and_update_globals(\n        name=self.name,\n        release_date=self.release_date,\n        resolution=self.resolution,\n        structure_method=self.structure_method,\n        bioassembly_data=None,\n        chemical_components_data=self.chemical_components_data,\n    )\n\n  def _to_mmcif_header(self) -> Mapping[str, Sequence[str]]:\n    raw_mmcif = collections.defaultdict(list)\n    raw_mmcif['data_'] = [self._name.replace(' ', '-')]\n    raw_mmcif['_entry.id'] = [self._name]\n\n    if self._release_date is not None:\n      date = [datetime.datetime.strftime(self._release_date, '%Y-%m-%d')]\n      raw_mmcif['_pdbx_audit_revision_history.revision_date'] = date\n      raw_mmcif['_pdbx_database_status.recvd_initial_deposition_date'] = date\n\n    if self._resolution is not None:\n      raw_mmcif['_refine.ls_d_res_high'] = ['%.2f' % self._resolution]\n\n    if self._structure_method is not None:\n      for method in self._structure_method.split(','):\n        raw_mmcif['_exptl.method'].append(method)\n\n    if self._bioassembly_data is not None:\n      raw_mmcif.update(self._bioassembly_data.to_mmcif_dict())\n\n    # Populate chemical components data for all residues of this Structure.\n    if self._chemical_components_data:\n      raw_mmcif.update(self._chemical_components_data.to_mmcif_dict())\n\n    # Add _software table to store version number used to generate mmCIF.\n    # Only required data items are used (+ _software.version).\n    raw_mmcif['_software.pdbx_ordinal'] = ['1']\n    raw_mmcif['_software.name'] = ['DeepMind Structure Class']\n    raw_mmcif['_software.version'] = [self._VERSION]\n    raw_mmcif['_software.classification'] = ['other']  # Required.\n\n    return raw_mmcif\n\n  def to_mmcif_dict(\n      self,\n      *,\n      coords_decimal_places: int = _COORDS_DECIMAL_PLACES,\n  ) -> mmcif.Mmcif:\n    \"\"\"Returns an Mmcif 
representing the structure.\"\"\"\n    header = self._to_mmcif_header()\n    sequence_tables = structure_tables.to_mmcif_sequence_and_entity_tables(\n        self._chains, self._residues, self._atoms.res_key\n    )\n    atom_and_bond_tables = structure_tables.to_mmcif_atom_site_and_bonds_table(\n        chains=self._chains,\n        residues=self._residues,\n        atoms=self._atoms,\n        bonds=self._bonds,\n        coords_decimal_places=coords_decimal_places,\n    )\n    return mmcif.Mmcif({**header, **sequence_tables, **atom_and_bond_tables})\n\n  def to_mmcif(\n      self, *, coords_decimal_places: int = _COORDS_DECIMAL_PLACES\n  ) -> str:\n    \"\"\"Returns an mmCIF string representing the structure.\n\n    Args:\n      coords_decimal_places: The number of decimal places to keep for atom\n        coordinates, including trailing zeros.\n    \"\"\"\n    return self.to_mmcif_dict(\n        coords_decimal_places=coords_decimal_places\n    ).to_string()\n\n\nclass _LeadingDimSlice:\n  \"\"\"Helper class for slicing the leading dimensions of a `Structure`.\n\n  Wraps a `Structure` instance and applies a slice operation to the coordinate\n  fields and other fields that may have leading dimensions (e.g. 
b_factor).\n\n  Example usage:\n    t0_struc = multi_state_struc.slice_leading_dims[0]\n  \"\"\"\n\n  def __init__(self, struc: Structure):\n    self._struc = struc\n\n  def __getitem__(self, *args, **kwargs) -> Structure:\n    sliced_atom_cols = {}\n    for col_name in structure_tables.Atoms.multimodel_cols:\n      if (col := self._struc.atoms_table.get_column(col_name)).ndim > 1:\n        sliced_col = col.__getitem__(*args, **kwargs)\n        if (\n            not sliced_col.shape\n            or sliced_col.shape[-1] != self._struc.num_atoms\n        ):\n          raise ValueError(\n              'Coordinate slice cannot change final (atom) dimension.'\n          )\n        sliced_atom_cols[col_name] = sliced_col\n    sliced_atoms = self._struc.atoms_table.copy_and_update(**sliced_atom_cols)\n    return self._struc.copy_and_update(atoms=sliced_atoms, skip_validation=True)\n\n\ndef stack(strucs: Sequence[Structure], axis: int = 0) -> Structure:\n  \"\"\"Stacks multiple structures into a single multi-model Structure.\n\n  This function is the inverse of `Structure.unstack()`.\n\n  NB: this function assumes that every structure in `strucs` is identical\n  other than the coordinates and b-factors. Under this assumption we can safely\n  copy all these identical fields from the first element of strucs w.l.o.g.\n  However this is not checked in full detail as full comparison is expensive.\n  Instead this only checks that the `atom_name` field is identical, and that\n  the coordinates have the same shape.\n\n  Usage example:\n  ```\n  multi_model_struc = structure.stack(strucs, axis=0)\n  ```\n\n  Args:\n    strucs: A sequence of structures, each with the same atoms, but they may\n      have different coordinates and b-factors. If any b-factors are not None\n      then they must have the same shape as each of the coordinate fields.\n    axis: The axis in the returned structure that represents the different\n      structures in `strucs` and will have size `len(strucs)`. 
This cannot be\n      the final dimension as this is reserved for `num_atoms`.\n\n  Returns:\n    A `Structure` with the same atoms as the structures in `strucs` but with\n    all of their coordinates stacked into a new leading axis.\n\n  Raises:\n    ValueError: If `strucs` is empty.\n    ValueError: If `strucs` do not all have the same `atom_name` field.\n  \"\"\"\n  if not strucs:\n    raise ValueError('Need at least one Structure to stack.')\n  struc_0, *other_strucs = strucs\n  for i, struc in enumerate(other_strucs, start=1):\n    # Check that every structure has the same atom name column.\n    # This check is intended to catch cases where the input structures might\n    # contain the same atoms, but in different orders. This won't catch every\n    # such case, e.g. if these are carbon-alpha-only structures, but should\n    # catch most cases.\n    if np.any(struc.atoms_table.name != struc_0.atoms_table.name):\n      raise ValueError(\n          f'strucs[0] and strucs[{i}] have mismatching atom name columns.'\n      )\n\n  stacked_atoms = struc_0.atoms_table.copy_and_update(\n      x=np.stack([s.atoms_table.x for s in strucs], axis=axis),\n      y=np.stack([s.atoms_table.y for s in strucs], axis=axis),\n      z=np.stack([s.atoms_table.z for s in strucs], axis=axis),\n      b_factor=np.stack([s.atoms_table.b_factor for s in strucs], axis=axis),\n      occupancy=np.stack([s.atoms_table.occupancy for s in strucs], axis=axis),\n  )\n  return struc_0.copy_and_update(atoms=stacked_atoms, skip_validation=True)\n\n\ndef _assign_unique_chain_ids(\n    strucs: Iterable[Structure],\n) -> Sequence[Structure]:\n  \"\"\"Creates a sequence of `Structure` objects with unique chain IDs.\n\n  Let e.g. 
[A, B] denote a structure of two chains A and B, then this function\n  performs the following kind of renaming operation:\n\n  e.g.: [Z], [C], [B, C] -> [A], [B], [C, D]\n\n  NB: This function uses Structure.rename_chain_ids which will define each\n  structure's chains.auth_asym_id to be identical to its chains.id columns.\n\n  Args:\n    strucs: Structures whose chains ids are to be uniquified.\n\n  Returns:\n    A sequence with the same number of elements as `strucs` but where each\n    element has had its chains renamed so that they aren't shared with any\n    other `Structure` in the sequence.\n  \"\"\"\n  # Start counting at 1 because mmcif.int_id_to_str_id expects integers >= 1.\n  chain_counter = 1\n  strucs_with_new_chain_ids = []\n  for struc in strucs:\n    rename_map = {}\n    for chain_id in struc.chains:\n      rename_map[chain_id] = mmcif.int_id_to_str_id(chain_counter)\n      chain_counter += 1\n    renamed = struc.rename_chain_ids(rename_map)\n    strucs_with_new_chain_ids.append(renamed)\n  return strucs_with_new_chain_ids\n\n\ndef concat(\n    strucs: Sequence[Structure],\n    *,\n    name: str | None = None,\n    assign_unique_chain_ids: bool = True,\n    assign_unique_entity_ids: bool = True,\n) -> Structure:\n  \"\"\"Concatenates structures along the atom dimension.\n\n  NB: By default this function will first assign unique chain IDs to all chains\n  in `strucs` so that the resulting structure does not contain duplicate chain\n  IDs. This will also fix entity IDs and author chain IDs. If this is disabled\n  via `assign_unique_chain_ids=False` the user must ensure that there are no\n  duplicate chains (label_asym_id). However, duplicate entity IDs and author\n  chain IDs are allowed as that might be the desired behavior.\n\n  If `assign_unique_chain_ids=True`, note also that the chain_ids may be\n  overwritten even if they are already unique.\n\n  Let e.g. 
[A, B] denote a structure of two chains A and B, then this function\n  performs the following kind of concatenation operation:\n\n  assign_unique_chain_ids=True:\n    label chain IDS : [Z], [C], [B, C] -> [A, B, C, D]\n    author chain IDS: [U], [V], [V, C] -> [A, B, C, D]\n    entity IDs      : [1], [1], [3, 3] -> [1, 2, 3, 4]\n  assign_unique_chain_ids=False:\n    label chain IDS : [D], [B], [C, A] -> [D, B, C, A]  (inputs must be unique)\n    author chain IDS: [U], [V], [V, A] -> [U, V, V, A]\n    entity IDs      : [1], [1], [3, 3] -> [1, 1, 3, 3]\n\n  NB: This operation loses some information from the elements of `strucs`,\n  namely the `name`, `resolution`, `release_date` and `bioassembly_data` fields.\n\n  Args:\n    strucs: The `Structure` instances to concatenate. These should all have the\n      same number and shape of leading dimensions (i.e. if any are multi-model\n      structures then they should all have the same number of models).\n    name: Optional name to give to the concatenated structure. If None, the name\n      will be concatenation of names of all concatenated structures.\n    assign_unique_chain_ids: If True, this function first assigns new unique\n      chain IDs, entity IDs and author chain IDs to every chain in `strucs`. If\n      False, you must ensure chain IDs are already unique, otherwise an\n      exception is raised. See `_assign_unique_chain_ids` for more information\n      on how this is performed.\n    assign_unique_entity_ids: If True, this function first assigns new unique\n      entity IDs to every chain in `strucs`. If False, you must ensure entity\n      IDs are already set in a way so that same entity ID implies for two chains\n      in `strucs` that they have the same residues. This option applies only if\n      `assign_unique_chain_ids == False`, otherwise it must be set to True.\n\n  Returns:\n    A new concatenated `Structure` with all of the chains in `strucs` combined\n    into one new structure. 
The new structure will be named by joining the\n    names of `strucs` with underscores.\n\n  Raises:\n    ValueError: If `strucs` is empty.\n    ValueError: If `assign_unique_chain_ids=False` and not all chains in\n      `strucs` have unique chain IDs.\n  \"\"\"\n  if not strucs:\n    raise ValueError('Need at least one Structure to concatenate.')\n\n  if assign_unique_chain_ids and not assign_unique_entity_ids:\n    raise ValueError(\n        'If assign_unique_chain_ids is True, assign_unique_entity_ids must be '\n        'True as well.'\n    )\n\n  if assign_unique_chain_ids:\n    strucs = _assign_unique_chain_ids(strucs)\n\n  chemical_components_data = {}\n  seen_label_chain_ids = set()\n  for i, struc in enumerate(strucs):\n    if not assign_unique_chain_ids:\n      if seen_cid := seen_label_chain_ids.intersection(struc.chains):\n        raise ValueError(\n            f'Chain IDs {seen_cid} from strucs[{i}] also exist in other'\n            ' members of strucs. All given structures must have unique chain'\n            ' IDs. 
Consider setting assign_unique_chain_ids=True.'\n        )\n      seen_label_chain_ids.update(struc.chains)\n\n    if struc.chemical_components_data is not None:\n      chemical_components_data.update(struc.chemical_components_data.chem_comp)  # pytype: disable=attribute-error  # always-use-property-annotation\n\n  concatted_struc = table.concat_databases(strucs)\n  name = name if name is not None else '_'.join(s.name for s in strucs)\n  # Chain IDs (label and author) are fixed at this point, fix also entity IDs.\n  if assign_unique_chain_ids or assign_unique_entity_ids:\n    numeric_ids = np.arange(1, concatted_struc.num_chains + 1)\n    entity_id = np.char.mod('%d', numeric_ids).astype(object)\n    chains = concatted_struc.chains_table.copy_and_update(entity_id=entity_id)\n  else:\n    chains = concatted_struc.chains_table\n\n  return concatted_struc.copy_and_update(\n      name=name,\n      release_date=None,\n      resolution=None,\n      structure_method=None,\n      bioassembly_data=None,\n      chemical_components_data=(\n          struc_chem_comps.ChemicalComponentsData(chemical_components_data)\n          if chemical_components_data\n          else None\n      ),\n      chains=chains,\n      skip_validation=True,  # Already validated by table.concat_databases.\n  )\n\n\ndef multichain_residue_index(\n    struc: Structure, chain_offset: int = 9000, between_chain_buffer: int = 1000\n) -> np.ndarray:\n  \"\"\"Compute a residue index array that is monotonic across all chains.\n\n  Lots of metrics (lddt, l1_long, etc) require computing a\n  distance-along-chain between two residues.  For multimers we want to ensure\n  that any residues on different chains have a high along-chain distance\n  (i.e. they should always count as long-range contacts for example).  
To\n  do this we add 10000 to the residue indices of each chain, and enforce that\n  the residue index is monotonically increasing across the whole complex.\n\n  Note: This returns the same as struc.res_id for monomers.\n\n  Args:\n    struc: The structure to make a multichain residue index for.\n    chain_offset: The start of each chain is offset by at least this amount.\n      This must be larger than the absolute range of standard residue IDs.\n    between_chain_buffer: The final residue in one chain will have at least this\n      much of a buffer before the first residue in the next chain.\n\n  Returns:\n    A monotonically increasing residue index, with at least\n    `between_chain_buffer` residues in between each chain.\n  \"\"\"\n  if struc.num_atoms:\n    res_id_range = np.max(struc.res_id) - np.min(struc.res_id)\n    assert res_id_range < chain_offset\n  chain_id_int = struc.chain_id\n  monotonic_chain_id_int = np.concatenate(\n      ([0], np.cumsum(chain_id_int[1:] != chain_id_int[:-1]))\n  )\n  return struc.res_id + monotonic_chain_id_int * (\n      chain_offset + between_chain_buffer\n  )\n\n\ndef make_empty_structure() -> Structure:\n  \"\"\"Returns a new structure consisting of empty array fields.\"\"\"\n  return Structure(\n      chains=structure_tables.Chains.make_empty(),\n      residues=structure_tables.Residues.make_empty(),\n      atoms=structure_tables.Atoms.make_empty(),\n      bonds=structure_tables.Bonds.make_empty(),\n  )\n\n\ndef enumerate_residues(\n    atom_iter: Iterable[Mapping[str, Any]],\n    all_residues: AllResidues | None = None,\n) -> Iterator[tuple[int, Mapping[str, Any]]]:\n  \"\"\"Provides a zero-indexed enumeration of residues in an atom iterable.\n\n  Args:\n    atom_iter: An iterable of atom dicts as returned by Structure.iter_atoms().\n    all_residues: (Optional) A structure's all_residues field. 
If present then\n      this will be used to count missing residues by adding appropriate gaps in\n      the residue enumeration.\n\n  Yields:\n    (res_i, atom) pairs where atom is the unmodified atom dict and res_i is a\n    zero-based index for the residue that the atom belongs to.\n  \"\"\"\n  if all_residues is None:\n    prev_res = None\n    res_i = -1\n    for atom in atom_iter:\n      res = (atom['chain_id'], atom['res_id'])\n      if res != prev_res:\n        prev_res = res\n        res_i += 1\n      yield res_i, atom\n  else:\n    all_res_seq = []  # Sequence of (chain_id, res_id) for all chains.\n    prev_chain = None\n    res_i = 0\n    for atom in atom_iter:\n      chain_id = atom['chain_id']\n      if chain_id not in all_residues:\n        raise ValueError(\n            f'Atom {atom} does not belong to any residue in all_residues.'\n        )\n      if chain_id != prev_chain:\n        prev_chain = chain_id\n        all_res_seq.extend(\n            (chain_id, res_id) for (_, res_id) in all_residues[chain_id]\n        )\n      res = (chain_id, atom['res_id'])\n      while res_i < len(all_res_seq) and res != all_res_seq[res_i]:\n        res_i += 1\n      if res_i == len(all_res_seq):\n        raise ValueError(\n            f'Atom {atom} does not belong to a residue in all_residues.'\n        )\n      yield res_i, atom\n"
  },
  {
    "path": "src/alphafold3/structure/structure_tables.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Table implementations for the Structure class.\"\"\"\n\nimport collections\nfrom collections.abc import Mapping, Sequence\nimport dataclasses\nimport functools\nimport itertools\nimport typing\nfrom typing import Any, ClassVar, Self\n\nfrom alphafold3.constants import mmcif_names\nfrom alphafold3.constants import residue_names\nfrom alphafold3.cpp import aggregation\nfrom alphafold3.cpp import string_array\nfrom alphafold3.structure import bonds as bonds_module\nfrom alphafold3.structure import mmcif\nfrom alphafold3.structure import table\nimport numpy as np\n\n\nBonds = bonds_module.Bonds\n\n\ndef _residue_name_to_record_name(\n    residue_name: np.ndarray,\n    polymer_mask: np.ndarray,\n) -> np.ndarray:\n  \"\"\"Returns record names (ATOM/HETATM) given residue names and polymer mask.\"\"\"\n  record_name = np.array(['HETATM'] * len(residue_name), dtype=object)\n  record_name[polymer_mask] = string_array.remap(\n      residue_name[polymer_mask],\n      mapping={r: 'ATOM' for r in residue_names.STANDARD_POLYMER_TYPES},\n      default_value='HETATM',\n  )\n  return record_name\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass AuthorNamingScheme:\n  \"\"\"A mapping from internal values to author values in a mmCIF.\n\n  Fields:\n    auth_asym_id: A mapping from label_asym_id to auth_asym_id.\n    auth_seq_id: A mapping from label_asym_id to a mapping from\n      label_seq_id to auth_seq_id.\n    
insertion_code: A mapping from label_asym_id to a mapping from\n      label_seq_id to insertion codes.\n    entity_id: A mapping from label_asym_id to _entity.id.\n    entity_desc: A mapping from _entity.id to _entity.pdbx_description.\n  \"\"\"\n\n  auth_asym_id: Mapping[str, str]\n  auth_seq_id: Mapping[str, Mapping[int, str]]\n  insertion_code: Mapping[str, Mapping[int, str | None]]\n  entity_id: Mapping[str, str]\n  entity_desc: Mapping[str, str]\n\n\ndef _default(\n    candidate_value: np.ndarray | None, default_value: Sequence[Any], dtype: Any\n) -> np.ndarray:\n  if candidate_value is None:\n    return np.array(default_value, dtype=dtype)\n  return np.array(candidate_value, dtype=dtype)\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass Atoms(table.Table):\n  \"\"\"Table of atoms in a Structure.\"\"\"\n\n  chain_key: np.ndarray\n  res_key: np.ndarray\n  name: np.ndarray\n  element: np.ndarray\n  x: np.ndarray\n  y: np.ndarray\n  z: np.ndarray\n  b_factor: np.ndarray\n  occupancy: np.ndarray\n  multimodel_cols: ClassVar[tuple[str, ...]] = (\n      'x',\n      'y',\n      'z',\n      'b_factor',\n      'occupancy',\n  )\n\n  def __post_init__(self):\n    # Validates that the atom coordinates, b-factors and occupancies are finite.\n    for column_name in ('x', 'y', 'z', 'b_factor', 'occupancy'):\n      column = self.get_column(column_name)\n      if not np.isfinite(column).all():\n        raise ValueError(\n            f'Column {column_name} must not contain NaN/inf values.'\n        )\n    # super().__post_init__() can't be used as that causes the following error:\n    # TypeError: super(type, obj): obj must be an instance or subtype of type\n    super(Atoms, self).__post_init__()\n\n  @classmethod\n  def make_empty(cls) -> Self:\n    return cls(\n        key=np.array([], dtype=np.int64),\n        chain_key=np.array([], dtype=np.int64),\n        res_key=np.array([], dtype=np.int64),\n        name=np.array([], dtype=object),\n        
element=np.array([], dtype=object),\n        x=np.array([], dtype=np.float32),\n        y=np.array([], dtype=np.float32),\n        z=np.array([], dtype=np.float32),\n        b_factor=np.array([], dtype=np.float32),\n        occupancy=np.array([], dtype=np.float32),\n    )\n\n  @classmethod\n  def from_defaults(\n      cls,\n      *,\n      chain_key: np.ndarray,\n      res_key: np.ndarray,\n      key: np.ndarray | None = None,\n      name: np.ndarray | None = None,\n      element: np.ndarray | None = None,\n      x: np.ndarray | None = None,\n      y: np.ndarray | None = None,\n      z: np.ndarray | None = None,\n      b_factor: np.ndarray | None = None,\n      occupancy: np.ndarray | None = None,\n  ) -> Self:\n    \"\"\"Create an Atoms table with minimal user inputs.\"\"\"\n    num_atoms = len(chain_key)\n    if not num_atoms:\n      return cls.make_empty()\n    return Atoms(\n        chain_key=chain_key,\n        res_key=res_key,\n        key=_default(key, np.arange(num_atoms), np.int64),\n        name=_default(name, ['?'] * num_atoms, object),\n        element=_default(element, ['?'] * num_atoms, object),\n        x=_default(x, [0.0] * num_atoms, np.float32),\n        y=_default(y, [0.0] * num_atoms, np.float32),\n        z=_default(z, [0.0] * num_atoms, np.float32),\n        b_factor=_default(b_factor, [0.0] * num_atoms, np.float32),\n        occupancy=_default(occupancy, [1.0] * num_atoms, np.float32),\n    )\n\n  def get_value_by_index(\n      self, column_name: str, index: int\n  ) -> table.TableEntry | np.ndarray:\n    if column_name in self.multimodel_cols:\n      return self.get_column(column_name)[..., index]\n    else:\n      return self.get_column(column_name)[index]\n\n  def copy_and_update_coords(self, coords: np.ndarray) -> Self:\n    \"\"\"Returns a copy with the x, y and z columns updated.\"\"\"\n    if coords.shape[-1] != 3:\n      raise ValueError(\n          f'Expecting 3-dimensional coordinates, got {coords.shape}'\n      )\n    return 
typing.cast(\n        Atoms,\n        self.copy_and_update(\n            x=coords[..., 0], y=coords[..., 1], z=coords[..., 2]\n        ),\n    )\n\n  @property\n  def shape(self) -> tuple[int, ...]:\n    return self.x.shape\n\n  @property\n  def ndim(self) -> int:\n    return len(self.shape)\n\n  @functools.cached_property\n  def num_models(self) -> int:\n    \"\"\"The number of models of this Structure.\"\"\"\n    leading_dims = self.shape[:-1]\n    match leading_dims:\n      case ():\n        return 1\n      case (single_leading_dim_size,):\n        return single_leading_dim_size\n      case _:\n        raise ValueError(\n            'num_models not defined for atom tables with more than one '\n            'leading dimension.'\n        )\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass Residues(table.Table):\n  \"\"\"Table of residues in a Structure.\"\"\"\n\n  chain_key: np.ndarray\n  id: np.ndarray\n  name: np.ndarray\n  auth_seq_id: np.ndarray\n  insertion_code: np.ndarray\n\n  @classmethod\n  def make_empty(cls) -> Self:\n    return cls(\n        key=np.array([], dtype=np.int64),\n        chain_key=np.array([], dtype=np.int64),\n        id=np.array([], dtype=np.int32),\n        name=np.array([], dtype=object),\n        auth_seq_id=np.array([], dtype=object),\n        insertion_code=np.array([], dtype=object),\n    )\n\n  @classmethod\n  def from_defaults(\n      cls,\n      *,\n      id: np.ndarray,  # pylint:disable=redefined-builtin\n      chain_key: np.ndarray,\n      key: np.ndarray | None = None,\n      name: np.ndarray | None = None,\n      auth_seq_id: np.ndarray | None = None,\n      insertion_code: np.ndarray | None = None,\n  ) -> Self:\n    \"\"\"Create a Residues table with minimal user inputs.\"\"\"\n    num_res = len(id)\n    if not num_res:\n      return cls.make_empty()\n    return Residues(\n        key=_default(key, np.arange(num_res), np.int64),\n        id=id,\n        chain_key=chain_key,\n        
name=_default(name, ['UNK'] * num_res, object),\n        auth_seq_id=_default(auth_seq_id, id.astype(str), object),\n        insertion_code=_default(insertion_code, ['?'] * num_res, object),\n    )\n\n\n@dataclasses.dataclass(frozen=True, slots=True, kw_only=True)\nclass Chains(table.Table):\n  \"\"\"Table of chains in a Structure.\"\"\"\n\n  id: np.ndarray\n  type: np.ndarray\n  auth_asym_id: np.ndarray\n  entity_id: np.ndarray\n  entity_desc: np.ndarray\n\n  @classmethod\n  def make_empty(cls) -> Self:\n    return cls(\n        key=np.array([], dtype=np.int64),\n        id=np.array([], dtype=object),\n        type=np.array([], dtype=object),\n        auth_asym_id=np.array([], dtype=object),\n        entity_id=np.array([], dtype=object),\n        entity_desc=np.array([], dtype=object),\n    )\n\n  @classmethod\n  def from_defaults(\n      cls,\n      *,\n      id: np.ndarray,  # pylint:disable=redefined-builtin\n      key: np.ndarray | None = None,\n      type: np.ndarray | None = None,  # pylint:disable=redefined-builtin\n      auth_asym_id: np.ndarray | None = None,\n      entity_id: np.ndarray | None = None,\n      entity_desc: np.ndarray | None = None,\n  ) -> Self:\n    \"\"\"Create a Chains table with minimal user inputs.\"\"\"\n    num_chains = len(id)\n    if not num_chains:\n      return cls.make_empty()\n\n    return Chains(\n        key=_default(key, np.arange(num_chains), np.int64),\n        id=id,\n        type=_default(type, [mmcif_names.PROTEIN_CHAIN] * num_chains, object),\n        auth_asym_id=_default(auth_asym_id, id, object),\n        entity_id=_default(\n            entity_id, np.arange(1, num_chains + 1).astype(str), object\n        ),\n        entity_desc=_default(entity_desc, ['.'] * num_chains, object),\n    )\n\n\ndef to_mmcif_sequence_and_entity_tables(\n    chains: Chains,\n    residues: Residues,\n    atom_res_key: np.ndarray,\n) -> Mapping[str, Sequence[str]]:\n  \"\"\"Returns raw sequence and entity mmCIF tables.\"\"\"\n  raw_mmcif = 
collections.defaultdict(list)\n  chains_by_entity_id = {}\n  written_entity_poly_seq_ids = set()\n  present_res_keys = set(atom_res_key)\n\n  # Performance optimisation: Find residue indices for each chain in advance, so\n  # that we don't have to do redundant masking work for each chain.\n  res_indices_for_chain = aggregation.indices_grouped_by_value(\n      residues.chain_key\n  )\n\n  for chain in chains.iterrows():\n    # Add all chain information to the _struct_asym table.\n    chain_id = chain['id']  # Saves multiple dict lookups.\n    auth_asym_id = chain['auth_asym_id']\n    entity_id = chain['entity_id']\n    chains_by_entity_id.setdefault(entity_id, []).append(chain)\n    raw_mmcif['_struct_asym.id'].append(chain_id)\n    raw_mmcif['_struct_asym.entity_id'].append(entity_id)\n\n    res_chain_indices = res_indices_for_chain[chain['key']]\n    chain_type = chain['type']\n    is_polymer = chain_type in mmcif_names.POLYMER_CHAIN_TYPES\n    is_water = chain_type == mmcif_names.WATER\n    is_branched = len(res_chain_indices) > 1 and not is_polymer and not is_water\n    write_entity_poly_seq = entity_id not in written_entity_poly_seq_ids\n\n    # Iterate over the individual masked residue table columns, as that doesn't\n    # create a copy (only a view), while residues[res_chain_indices] does.\n    for res_key, res_name, res_id, pdb_seq_num, res_ins_code in zip(\n        residues.key[res_chain_indices],\n        residues.name[res_chain_indices],\n        residues.id[res_chain_indices],\n        residues.auth_seq_id[res_chain_indices],\n        residues.insertion_code[res_chain_indices],\n        strict=True,\n    ):\n      is_missing = res_key not in present_res_keys\n      str_res_id = str(res_id)\n      # While atom_site uses \"?\" for insertion codes, scheme tables use \".\".\n      ins_code = (res_ins_code or '.').replace('?', '.')\n      auth_seq_num = '?' 
if is_missing else pdb_seq_num\n\n      if is_polymer:\n        raw_mmcif['_pdbx_poly_seq_scheme.asym_id'].append(chain_id)\n        raw_mmcif['_pdbx_poly_seq_scheme.entity_id'].append(entity_id)\n        raw_mmcif['_pdbx_poly_seq_scheme.seq_id'].append(str_res_id)\n        raw_mmcif['_pdbx_poly_seq_scheme.mon_id'].append(res_name)\n        raw_mmcif['_pdbx_poly_seq_scheme.pdb_seq_num'].append(pdb_seq_num)\n        raw_mmcif['_pdbx_poly_seq_scheme.auth_seq_num'].append(auth_seq_num)\n        raw_mmcif['_pdbx_poly_seq_scheme.pdb_strand_id'].append(auth_asym_id)\n        raw_mmcif['_pdbx_poly_seq_scheme.pdb_ins_code'].append(ins_code)\n        # Structure doesn't support heterogeneous sequences.\n        raw_mmcif['_pdbx_poly_seq_scheme.hetero'].append('n')\n        if write_entity_poly_seq:\n          raw_mmcif['_entity_poly_seq.entity_id'].append(entity_id)\n          raw_mmcif['_entity_poly_seq.num'].append(str_res_id)\n          raw_mmcif['_entity_poly_seq.mon_id'].append(res_name)\n          # Structure doesn't support heterogeneous sequences.\n          raw_mmcif['_entity_poly_seq.hetero'].append('n')\n          written_entity_poly_seq_ids.add(entity_id)\n      elif is_branched:\n        raw_mmcif['_pdbx_branch_scheme.asym_id'].append(chain_id)\n        raw_mmcif['_pdbx_branch_scheme.entity_id'].append(entity_id)\n        raw_mmcif['_pdbx_branch_scheme.mon_id'].append(res_name)\n        raw_mmcif['_pdbx_branch_scheme.num'].append(str_res_id)\n        raw_mmcif['_pdbx_branch_scheme.pdb_asym_id'].append(auth_asym_id)\n        raw_mmcif['_pdbx_branch_scheme.pdb_seq_num'].append(pdb_seq_num)\n        raw_mmcif['_pdbx_branch_scheme.auth_asym_id'].append(auth_asym_id)\n        raw_mmcif['_pdbx_branch_scheme.auth_seq_num'].append(auth_seq_num)\n        raw_mmcif['_pdbx_branch_scheme.pdb_ins_code'].append(ins_code)\n        # Structure doesn't support heterogeneous sequences.\n        raw_mmcif['_pdbx_branch_scheme.hetero'].append('n')\n      else:\n        
raw_mmcif['_pdbx_nonpoly_scheme.asym_id'].append(chain_id)\n        raw_mmcif['_pdbx_nonpoly_scheme.entity_id'].append(entity_id)\n        raw_mmcif['_pdbx_nonpoly_scheme.mon_id'].append(res_name)\n        raw_mmcif['_pdbx_nonpoly_scheme.pdb_seq_num'].append(pdb_seq_num)\n        raw_mmcif['_pdbx_nonpoly_scheme.auth_seq_num'].append(auth_seq_num)\n        raw_mmcif['_pdbx_nonpoly_scheme.pdb_strand_id'].append(auth_asym_id)\n        raw_mmcif['_pdbx_nonpoly_scheme.pdb_ins_code'].append(ins_code)\n\n  # Add _entity and _entity_poly tables.\n  for entity_id, chains in chains_by_entity_id.items():\n    # chains should always be a non-empty list because of how we constructed\n    # chains_by_entity_id.\n    assert chains\n    # All chains for a given entity should have the same type and sequence\n    # so we can pick the first one without losing information.\n    key_chain = chains[0]\n    raw_mmcif['_entity.id'].append(entity_id)\n    raw_mmcif['_entity.pdbx_description'].append(key_chain['entity_desc'])\n    entity_type = key_chain['type']\n    if entity_type not in mmcif_names.POLYMER_CHAIN_TYPES:\n      raw_mmcif['_entity.type'].append(entity_type)\n    else:\n      raw_mmcif['_entity.type'].append('polymer')\n      raw_mmcif['_entity_poly.entity_id'].append(entity_id)\n      raw_mmcif['_entity_poly.type'].append(entity_type)\n\n      # _entity_poly.pdbx_strand_id is a comma-separated list of\n      # auth_asym_ids that are part of the entity.\n      raw_mmcif['_entity_poly.pdbx_strand_id'].append(\n          ','.join(chain['auth_asym_id'] for chain in chains)\n      )\n  return raw_mmcif\n\n\ndef to_mmcif_atom_site_and_bonds_table(\n    *,\n    chains: Chains,\n    residues: Residues,\n    atoms: Atoms,\n    bonds: Bonds,\n    coords_decimal_places: int,\n) -> Mapping[str, Sequence[str]]:\n  \"\"\"Returns raw _atom_site and _struct_conn mmCIF tables.\"\"\"\n  raw_mmcif = collections.defaultdict(list)\n  # Use [value] * num wherever possible since it is about 10x 
faster than list\n  # comprehension in such cases. Also use f-strings instead of str() - faster.\n  total_atoms = atoms.size * atoms.num_models\n  raw_mmcif['_atom_site.id'] = [f'{i}' for i in range(1, total_atoms + 1)]\n  raw_mmcif['_atom_site.label_alt_id'] = ['.'] * total_atoms\n  # Use format_float_array instead of list comprehension for performance.\n  raw_mmcif['_atom_site.Cartn_x'] = mmcif.format_float_array(\n      values=atoms.x.ravel(), num_decimal_places=coords_decimal_places\n  )\n  raw_mmcif['_atom_site.Cartn_y'] = mmcif.format_float_array(\n      values=atoms.y.ravel(), num_decimal_places=coords_decimal_places\n  )\n  raw_mmcif['_atom_site.Cartn_z'] = mmcif.format_float_array(\n      values=atoms.z.ravel(), num_decimal_places=coords_decimal_places\n  )\n\n  # atoms.b_factor or atoms.occupancy can be flat even when the coordinates have\n  # leading dimensions. In this case we tile it to match.\n  if atoms.b_factor.ndim == 1:\n    atom_b_factor = np.tile(atoms.b_factor, atoms.num_models)\n  else:\n    atom_b_factor = atoms.b_factor.ravel()\n  raw_mmcif['_atom_site.B_iso_or_equiv'] = mmcif.format_float_array(\n      values=atom_b_factor, num_decimal_places=2\n  )\n\n  if atoms.occupancy.ndim == 1:\n    atom_occupancy = np.tile(atoms.occupancy, atoms.num_models)\n  else:\n    atom_occupancy = atoms.occupancy.ravel()\n  raw_mmcif['_atom_site.occupancy'] = mmcif.format_float_array(\n      values=atom_occupancy.ravel(), num_decimal_places=2\n  )\n\n  label_atom_id = atoms.name\n  type_symbol = atoms.element\n  label_comp_id = residues.apply_array_to_column('name', atoms.res_key)\n  label_asym_id = chains.apply_array_to_column('id', atoms.chain_key)\n  label_entity_id = chains.apply_array_to_column('entity_id', atoms.chain_key)\n  # Performance optimisation: Do the int->str conversion on num_residue-sized,\n  # array, then select instead of selecting and then converting.\n  label_seq_id = residues.id.astype('str').astype(object)[\n      ..., 
residues.index_by_key[atoms.res_key]\n  ]\n\n  # _atom_site.label_seq_id is '.' for non-polymers.\n  non_polymer_chain_mask = string_array.isin(\n      chains.type, mmcif_names.POLYMER_CHAIN_TYPES, invert=True\n  )\n  non_polymer_chain_keys = chains.key[non_polymer_chain_mask]\n  non_polymer_atom_mask = np.isin(atoms.chain_key, non_polymer_chain_keys)\n  label_seq_id[non_polymer_atom_mask] = '.'\n\n  auth_asym_id = chains.apply_array_to_column('auth_asym_id', atoms.chain_key)\n  auth_seq_id = residues.apply_array_to_column('auth_seq_id', atoms.res_key)\n  pdbx_pdb_ins_code = residues.apply_array_to_column(\n      'insertion_code', atoms.res_key\n  )\n  string_array.remap(pdbx_pdb_ins_code, mapping={None: '?'}, inplace=True)\n\n  group_pdb = _residue_name_to_record_name(\n      residue_name=label_comp_id, polymer_mask=~non_polymer_atom_mask\n  )\n\n  def tile_for_models(arr: np.ndarray) -> list[str]:\n    if atoms.num_models == 1:\n      return arr.tolist()  # Memory optimisation: np.tile(arr, 1) does a copy.\n    return np.tile(arr, atoms.num_models).tolist()\n\n  raw_mmcif['_atom_site.group_PDB'] = tile_for_models(group_pdb)\n  raw_mmcif['_atom_site.label_atom_id'] = tile_for_models(label_atom_id)\n  raw_mmcif['_atom_site.type_symbol'] = tile_for_models(type_symbol)\n  raw_mmcif['_atom_site.label_comp_id'] = tile_for_models(label_comp_id)\n  raw_mmcif['_atom_site.label_asym_id'] = tile_for_models(label_asym_id)\n  raw_mmcif['_atom_site.label_entity_id'] = tile_for_models(label_entity_id)\n  raw_mmcif['_atom_site.label_seq_id'] = tile_for_models(label_seq_id)\n  raw_mmcif['_atom_site.auth_asym_id'] = tile_for_models(auth_asym_id)\n  raw_mmcif['_atom_site.auth_seq_id'] = tile_for_models(auth_seq_id)\n  raw_mmcif['_atom_site.pdbx_PDB_ins_code'] = tile_for_models(pdbx_pdb_ins_code)\n  model_id = np.array(\n      [str(i + 1) for i in range(atoms.num_models)], dtype=object\n  )\n  raw_mmcif['_atom_site.pdbx_PDB_model_num'] = np.repeat(\n      model_id, [atoms.size] * 
atoms.num_models\n  ).tolist()\n\n  if bonds.key.size > 0:\n    raw_mmcif.update(\n        bonds.to_mmcif_dict_from_atom_arrays(\n            atom_key=atoms.key,\n            chain_id=label_asym_id,\n            res_id=label_seq_id,\n            res_name=label_comp_id,\n            atom_name=label_atom_id,\n            auth_asym_id=auth_asym_id,\n            auth_seq_id=auth_seq_id,\n            insertion_code=np.array(pdbx_pdb_ins_code),\n        )\n    )\n  return raw_mmcif\n\n\ndef _flatten_author_naming_scheme_table(\n    res_table: Mapping[str, Mapping[int, str]],\n    chain_ids: np.ndarray,\n    res_chain_ids: np.ndarray,\n    res_ids: np.ndarray,\n    default_if_missing: str,\n    table_name: str,\n) -> np.ndarray:\n  \"\"\"Flattens an author naming scheme table consistently with res_ids.\"\"\"\n  if not set(chain_ids).issubset(res_table):\n    raise ValueError(\n        f'Chain IDs in the chain_id array must be a subset of {table_name} in '\n        'author naming scheme:\\n'\n        f'chain_ids: {sorted(chain_ids)}\\n'\n        f'{table_name} keys: {sorted(res_table.keys())}'\n    )\n\n  chain_change_mask = res_chain_ids[1:] != res_chain_ids[:-1]\n  res_chain_boundaries = np.concatenate(\n      ([0], np.where(chain_change_mask)[0] + 1, [len(res_chain_ids)])\n  )\n\n  flat_vals = np.empty(len(res_ids), dtype=object)\n  for chain_start, chain_end in itertools.pairwise(res_chain_boundaries):\n    chain_id = res_chain_ids[chain_start]\n    chain_res_ids = res_ids[chain_start:chain_end]\n    chain_mapping = res_table[chain_id]\n    flat_vals[chain_start:chain_end] = [\n        chain_mapping.get(r, default_if_missing) for r in chain_res_ids\n    ]\n\n  return flat_vals\n\n\ndef tables_from_atom_arrays(\n    *,\n    res_id: np.ndarray,\n    author_naming_scheme: AuthorNamingScheme | None = None,\n    all_residues: Mapping[str, Sequence[tuple[str, int]]] | None = None,\n    chain_id: np.ndarray | None = None,\n    chain_type: np.ndarray | None = None,\n    
res_name: np.ndarray | None = None,\n    atom_key: np.ndarray | None = None,\n    atom_name: np.ndarray | None = None,\n    atom_element: np.ndarray | None = None,\n    atom_x: np.ndarray | None = None,\n    atom_y: np.ndarray | None = None,\n    atom_z: np.ndarray | None = None,\n    atom_b_factor: np.ndarray | None = None,\n    atom_occupancy: np.ndarray | None = None,\n) -> tuple[Atoms, Residues, Chains]:\n  \"\"\"Returns Structure tables constructed from atom array level data.\n\n  All fields except res_id are optional, all array fields consist of a\n  value for each atom in the structure - so residue and chain values should hold\n  the same value for each atom in the chain or residue. Fields which are not\n  defined are filled with default values.\n\n  Validation is performed by the Structure constructor where possible - but\n  author_naming scheme and all_residues must be checked in this function.\n\n  It is not possible to construct structures with chains that do not contain\n  any resolved residues using this function. If this is necessary, use the\n  structure.Structure constructor directly.\n\n  Args:\n    res_id: Integer array of shape [num_atom]. The unique residue identifier for\n      each residue. mmCIF field - _atom_site.label_seq_id.\n    author_naming_scheme: An optional instance of AuthorNamingScheme to use when\n      converting this structure to mmCIF.\n    all_residues: An optional mapping from each chain ID (i.e. label_asym_id) to\n      a sequence of (label_comp_id, label_seq_id) tuples, one per residue. This\n      can contain residues that aren't present in the atom arrays. This is\n      common in experimental data where some residues are not resolved but are\n      known to be present.\n    chain_id: String array of shape [num_atom] of unique chain identifiers.\n      mmCIF field - _atom_site.label_asym_id.\n    chain_type: String array of shape [num_atom]. The molecular type of the\n      current chain (e.g. 
polyribonucleotide). mmCIF field - _entity_poly.type\n      OR _entity.type (for non-polymers).\n    res_name: String array of shape [num_atom]. The name of each residue,\n      typically a 3 letter string for polypeptides or 1-2 letter strings for\n      polynucleotides. mmCIF field - _atom_site.label_comp_id.\n    atom_key: A unique sorted integer array, used only by the bonds table to\n      identify the atoms participating in each bond. If the bonds table is\n      specified then this column must be non-None.\n    atom_name: String array of shape [num_atom]. The name of each atom (e.g. CA,\n      O2', etc.). mmCIF field - _atom_site.label_atom_id.\n    atom_element: String array of shape [num_atom]. The element type of each\n      atom (e.g. C, O, N, etc.). mmCIF field - _atom_site.type_symbol.\n    atom_x: Float array of shape [..., num_atom] of atom x coordinates. May have\n      arbitrary leading dimensions, provided that these are consistent across\n      all coordinate fields.\n    atom_y: Float array of shape [..., num_atom] of atom y coordinates. May have\n      arbitrary leading dimensions, provided that these are consistent across\n      all coordinate fields.\n    atom_z: Float array of shape [..., num_atom] of atom z coordinates. May have\n      arbitrary leading dimensions, provided that these are consistent across\n      all coordinate fields.\n    atom_b_factor: Float array of shape [..., num_atom] or [num_atom] of atom\n      b-factors or equivalent. If there are no extra leading dimensions then\n      these values are assumed to apply to all coordinates for a given atom. If\n      there are leading dimensions then these must match those used by the\n      coordinate fields.\n    atom_occupancy: Float array of shape [..., num_atom] or [num_atom] of atom\n      occupancies or equivalent. If there are no extra leading dimensions then\n      these values are assumed to apply to all coordinates for a given atom. 
If\n      there are leading dimensions then these must match those used by the\n      coordinate fields.\n  \"\"\"\n  num_atoms = len(res_id)\n\n  for arr_name, array, dtype in (\n      ('chain_id', chain_id, object),\n      ('chain_type', chain_type, object),\n      ('res_id', res_id, np.int32),\n      ('res_name', res_name, object),\n      ('atom_key', atom_key, np.int64),\n      ('atom_name', atom_name, object),\n      ('atom_element', atom_element, object),\n  ):\n    if array is not None and array.shape != (num_atoms,):\n      raise ValueError(f'{arr_name} shape {array.shape} != ({num_atoms},)')\n    if array is not None and array.dtype != dtype:\n      raise ValueError(f'{arr_name} dtype {array.dtype} != {dtype}')\n\n  for arr_name, array in (\n      ('atom_x', atom_x),\n      ('atom_y', atom_y),\n      ('atom_z', atom_z),\n      ('atom_b_factor', atom_b_factor),\n      ('atom_occupancy', atom_occupancy),\n  ):\n    if array is not None and array.shape[-1] != num_atoms:\n      raise ValueError(f'{arr_name} last dim {array.shape[-1]} != {num_atoms=}')\n    if (\n        array is not None\n        and array.dtype != np.float32\n        and array.dtype != np.float64\n    ):\n      raise ValueError(\n          f'{arr_name} must be np.float32 or np.float64, got {array.dtype=}'\n      )\n\n  if all_residues is not None and (res_name is None or res_id is None):\n    raise ValueError(\n        'If all_residues != None, res_name and res_id must not be None either.'\n    )\n\n  if num_atoms == 0:\n    return Atoms.make_empty(), Residues.make_empty(), Chains.make_empty()\n\n  if chain_id is None:\n    chain_id = np.full(shape=num_atoms, fill_value='A', dtype=object)\n  if res_name is None:\n    res_name = np.full(shape=num_atoms, fill_value='UNK', dtype=object)\n\n  chain_change_mask = chain_id[1:] != chain_id[:-1]\n  chain_start = np.concatenate(([0], np.where(chain_change_mask)[0] + 1))\n  res_start = np.concatenate(\n      ([0], np.where((res_id[1:] != res_id[:-1]) | 
chain_change_mask)[0] + 1)\n  )\n\n  if len(set(chain_id)) != len(chain_start):\n    raise ValueError(f'Chain IDs must be contiguous, but got {chain_id}')\n\n  # We do not support chains with unresolved residues-only in this function.\n  chain_ids = chain_id[chain_start]\n  if all_residues and set(all_residues.keys()) != set(chain_ids):\n    raise ValueError(\n        'all_residues must contain the same set of chain IDs as the chain_id '\n        f'array:\\nall_residues keys: {sorted(all_residues.keys())}\\n'\n        f'chain_ids: {sorted(chain_ids)}.'\n    )\n  # Make sure all_residue ordering is consistent with chain_id.\n  if all_residues and np.any(list(all_residues.keys()) != chain_ids):\n    all_residues = {cid: all_residues[cid] for cid in chain_ids}\n\n  # Create the chains table.\n  num_chains = len(chain_ids)\n  chain_keys = np.arange(num_chains, dtype=np.int64)\n  chain_key_by_chain_id = dict(zip(chain_ids, chain_keys, strict=True))\n\n  if chain_type is not None:\n    chain_types = chain_type[chain_start]\n  else:\n    chain_types = np.full(num_chains, mmcif_names.PROTEIN_CHAIN, dtype=object)\n\n  if author_naming_scheme is not None:\n    auth_asym_id = string_array.remap(\n        chain_ids, author_naming_scheme.auth_asym_id\n    )\n    entity_id = string_array.remap(\n        chain_ids, author_naming_scheme.entity_id, default_value='.'\n    )\n    entity_desc = string_array.remap(\n        entity_id, author_naming_scheme.entity_desc, default_value='.'\n    )\n  else:\n    auth_asym_id = chain_ids\n    entity_id = (chain_keys + 1).astype(str).astype(object)\n    entity_desc = np.full(num_chains, '.', dtype=object)\n\n  chains = Chains(\n      key=chain_keys,\n      id=chain_ids,\n      type=chain_types,\n      auth_asym_id=auth_asym_id,\n      entity_id=entity_id,\n      entity_desc=entity_desc,\n  )\n\n  # Create the residues table.\n  if all_residues is not None:\n    residue_order = []\n    for cid, residues in all_residues.items():\n      
residue_order.extend((cid, rname, int(rid)) for (rname, rid) in residues)\n    res_chain_ids, res_names, res_ids = zip(*residue_order)\n    res_chain_ids = np.array(res_chain_ids, dtype=object)\n    res_ids = np.array(res_ids, dtype=np.int32)\n    res_names = np.array(res_names, dtype=object)\n  else:\n    res_chain_ids = chain_id[res_start]\n    res_ids = res_id[res_start]\n    res_names = res_name[res_start]\n    residue_order = list(zip(res_chain_ids, res_names, res_ids))\n\n  if author_naming_scheme is not None and author_naming_scheme.auth_seq_id:\n    auth_seq_id = _flatten_author_naming_scheme_table(\n        author_naming_scheme.auth_seq_id,\n        chain_ids=chain_ids,\n        res_chain_ids=res_chain_ids,\n        res_ids=res_ids,\n        default_if_missing='.',\n        table_name='auth_seq_id',\n    )\n  else:\n    auth_seq_id = res_ids.astype(str).astype(object)\n\n  if author_naming_scheme is not None and author_naming_scheme.insertion_code:\n    insertion_code = _flatten_author_naming_scheme_table(\n        author_naming_scheme.insertion_code,\n        chain_ids=chain_ids,\n        res_chain_ids=res_chain_ids,\n        res_ids=res_ids,\n        default_if_missing='?',\n        table_name='insertion_code',\n    )\n    # Make sure insertion code of None is mapped to '?'.\n    insertion_code = string_array.remap(insertion_code, {None: '?'})\n  else:\n    insertion_code = np.full(shape=len(res_ids), fill_value='?', dtype=object)\n\n  res_key_by_res = {res: i for i, res in enumerate(residue_order)}\n  res_keys = np.arange(len(residue_order), dtype=np.int64)\n  res_chain_keys = string_array.remap(\n      res_chain_ids, chain_key_by_chain_id\n  ).astype(np.int64)\n  residues = Residues(\n      chain_key=res_chain_keys,\n      key=res_keys,\n      id=res_ids,\n      name=res_names,\n      auth_seq_id=auth_seq_id,\n      insertion_code=insertion_code,\n  )\n\n  if atom_key is None:\n    atom_key = np.arange(num_atoms, dtype=np.int64)\n\n  atom_chain_keys = 
string_array.remap(chain_id, chain_key_by_chain_id).astype(\n      np.int64\n  )\n\n  try:\n    atom_res_keys = [res_key_by_res[r] for r in zip(chain_id, res_name, res_id)]\n  except KeyError as e:\n    missing_chain_id, missing_res_name, missing_res_id = e.args[0]\n    raise ValueError(\n        'Inconsistent res_name, res_id and all_residues. Could not find '\n        f'residue with chain_id={missing_chain_id}, '\n        f'res_name={missing_res_name}, res_id={missing_res_id} in all_residues.'\n    ) from e\n\n  atoms = Atoms(\n      key=atom_key,\n      chain_key=atom_chain_keys,\n      res_key=np.array(atom_res_keys, dtype=np.int64),\n      name=_default(atom_name, ['?'] * num_atoms, object),\n      element=_default(atom_element, ['?'] * num_atoms, object),\n      x=_default(atom_x, [0.0] * num_atoms, np.float32),\n      y=_default(atom_y, [0.0] * num_atoms, np.float32),\n      z=_default(atom_z, [0.0] * num_atoms, np.float32),\n      b_factor=_default(atom_b_factor, [0.0] * num_atoms, np.float32),\n      occupancy=_default(atom_occupancy, [1.0] * num_atoms, np.float32),\n  )\n  return atoms, residues, chains\n"
  },
  {
    "path": "src/alphafold3/structure/table.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Table module for atom/residue/chain tables in Structure.\n\nTables are intended to be lightweight collections of columns, loosely based\non a pandas dataframe, for use in the Structure class.\n\"\"\"\n\nimport abc\nfrom collections.abc import Callable, Collection, Iterable, Iterator, Mapping, Sequence\nimport dataclasses\nimport functools\nimport graphlib\nimport typing\nfrom typing import Any, Protocol, Self, TypeAlias, TypeVar, overload\n\nfrom alphafold3.cpp import string_array\nimport numpy as np\n\n\nTableEntry: TypeAlias = str | int | float | None\nFilterPredicate: TypeAlias = (\n    TableEntry\n    | Iterable[Any]  # Workaround for b/326384670. Tighten once fixed.\n    | Callable[[Any], bool]  # Workaround for b/326384670. Tighten once fixed.\n    | Callable[[np.ndarray], bool]\n)\n\n\nclass RowLookup(Protocol):\n\n  def get_row_by_key(\n      self,\n      key: int,\n      column_name_map: Mapping[str, str] | None = None,\n  ) -> Mapping[str, Any]:\n    ...\n\n\n@dataclasses.dataclass(frozen=True, kw_only=True)\nclass Table:\n  \"\"\"Parent class for structure tables.\n\n  A table is a collection of columns of equal length, where one column is the\n  key. The key uniquely identifies each row in the table.\n\n  A table can refer to other tables by including a foreign key column, whose\n  values are key values from the other table's key column. 
These columns can have\n  arbitrary names and are treated like any other integer-valued column.\n\n  See the `Database` class in this module for utilities for handling sets of\n  tables that are related via foreign keys.\n\n  NB: This does not correspond to an mmCIF table.\n  \"\"\"\n\n  key: np.ndarray\n\n  def __post_init__(self):\n    for col_name in self.columns:\n      if (col_len := self.get_column(col_name).shape[-1]) != self.size:\n        raise ValueError(\n            f'All columns should have length {self.size} but got \"{col_name}\"'\n            f' with length {col_len}.'\n        )\n      self.get_column(col_name).flags.writeable = False  # Make col immutable.\n    if self.key.size and self.key.min() < 0:\n      raise ValueError(\n          'Key values must be non-negative. Got negative values:'\n          f' {set(self.key[self.key < 0])}'\n      )\n    self.key.flags.writeable = False  # Make key immutable.\n\n  def __getstate__(self) -> dict[str, Any]:\n    \"\"\"Returns members with cached properties removed for pickling.\"\"\"\n    cached_props = {\n        k\n        for k, v in self.__class__.__dict__.items()\n        if isinstance(v, functools.cached_property)\n    }\n    return {k: v for k, v in self.__dict__.items() if k not in cached_props}\n\n  @functools.cached_property\n  def index_by_key(self) -> np.ndarray:\n    \"\"\"Mapping from key values to their index in the column arrays.\n\n    i.e.: self.key[index_by_key[k]] == k\n    \"\"\"\n    if not self.key.size:\n      return np.array([], dtype=np.int64)\n    else:\n      index_by_key = np.zeros(np.max(self.key) + 1, dtype=np.int64)\n      index_by_key[self.key] = np.arange(self.size)\n      return index_by_key\n\n  @functools.cached_property\n  def columns(self) -> tuple[str, ...]:\n    \"\"\"The names of the columns in the table, including the key column.\"\"\"\n    return tuple(field.name for field in dataclasses.fields(self))\n\n  @functools.cached_property\n  def items(self) -> 
Mapping[str, np.ndarray]:\n    \"\"\"Returns the mapping from column names to column values.\"\"\"\n    return {col: getattr(self, col) for col in self.columns}\n\n  @functools.cached_property\n  def size(self) -> int:\n    \"\"\"The number of rows in the table.\"\"\"\n    return self.key.shape[-1]\n\n  def __len__(self) -> int:\n    return self.size\n\n  def get_column(self, column_name: str) -> np.ndarray:\n    \"\"\"Gets a column by name.\"\"\"\n    # Performance optimisation: use the cached columns, instead of getattr.\n    return self.items[column_name]\n\n  def apply_array(self, arr: np.ndarray) -> Self:\n    \"\"\"Returns a sliced table using a key (!= index) array or a boolean mask.\"\"\"\n    if arr.dtype == bool and np.all(arr):\n      return self  # Shortcut: No-op, so just return.\n\n    return self.copy_and_update(**{\n        column_name: self.apply_array_to_column(column_name, arr)\n        for column_name in self.columns\n    })\n\n  def apply_index(self, index_arr: np.ndarray) -> Self:\n    \"\"\"Returns a sliced table using an index (!= key) array.\"\"\"\n    if index_arr.dtype == bool:\n      raise ValueError('The index array must not be a boolean mask.')\n\n    return self.copy_and_update(\n        **{col: self.get_column(col)[..., index_arr] for col in self.columns}\n    )\n\n  def apply_array_to_column(\n      self,\n      column_name: str,\n      arr: np.ndarray,\n  ) -> np.ndarray:\n    \"\"\"Returns a sliced column array using a key array or a boolean mask.\"\"\"\n    if arr.dtype == bool:\n      return self.get_column(column_name)[..., arr]\n    else:\n      return self.get_column(column_name)[..., self.index_by_key[arr]]\n\n  def get_value_by_index(self, column_name: str, index: int) -> Any:\n    return self.get_column(column_name)[index]\n\n  def get_value_by_key(\n      self,\n      column_name: str,\n      key: int | np.integer,\n  ) -> TableEntry:\n    \"\"\"Gets the value of a column at the row with specified key value.\"\"\"\n    
return self.get_value_by_index(column_name, self.index_by_key[key])\n\n  @overload\n  def __getitem__(self, key: str) -> np.ndarray:\n    ...\n\n  @overload\n  def __getitem__(self, key: np.ndarray) -> 'Table':\n    ...\n\n  @overload\n  def __getitem__(self, key: tuple[str, int | np.integer]) -> TableEntry:\n    ...\n\n  @overload\n  def __getitem__(self, key: tuple[str, np.ndarray]) -> np.ndarray:\n    ...\n\n  def __getitem__(self, key):\n    match key:\n      case str():\n        return self.get_column(key)\n      case np.ndarray() as key_arr_or_mask:\n        return self.apply_array(key_arr_or_mask)\n      case str() as col, int() | np.integer() as key_val:\n        return self.get_value_by_key(col, key_val)\n      case str() as col, np.ndarray() as key_arr_or_mask:\n        return self.apply_array_to_column(col, key_arr_or_mask)\n      case _:\n        if isinstance(key, tuple):\n          err_msg = f'{key}, type: tuple({[type(v) for v in key]})'\n        else:\n          err_msg = f'{key}, type: {type(key)}'\n        raise KeyError(err_msg)\n\n  def get_row_by_key(\n      self,\n      key: int,\n      column_name_map: Mapping[str, str] | None = None,\n  ) -> dict[str, Any]:\n    \"\"\"Gets the row with specified key value.\"\"\"\n    return self.get_row_by_index(\n        self.index_by_key[key], column_name_map=column_name_map\n    )\n\n  def get_row_by_index(\n      self,\n      index: int,\n      column_name_map: Mapping[str, str] | None = None,\n  ) -> dict[str, Any]:\n    \"\"\"Gets the row at the specified index.\"\"\"\n    if column_name_map is not None:\n      return {\n          renamed_col: self.get_value_by_index(col, index)\n          for renamed_col, col in column_name_map.items()\n      }\n    else:\n      return {col: self.get_value_by_index(col, index) for col in self.columns}\n\n  def iterrows(\n      self,\n      *,\n      row_keys: np.ndarray | None = None,\n      column_name_map: Mapping[str, str] | None = None,\n      
**table_by_foreign_key_col: RowLookup,\n  ) -> Iterator[Mapping[str, Any]]:\n    \"\"\"Yields rows from the table.\n\n    This can be used to easily convert a table to a Pandas dataframe:\n\n    ```py\n    df = pd.DataFrame(table.iterrows())\n    ```\n\n    Args:\n      row_keys: An optional array of keys of rows to yield. If None, all rows\n        will be yielded.\n      column_name_map: An optional mapping from desired keys in the row dicts to\n        the names of the columns they correspond to.\n      **table_by_foreign_key_col: An optional mapping from column names in this\n        table, which are expected to be columns of foreign keys, to the table\n        that the foreign keys point into. If provided, then the yielded rows\n        will include data from the foreign tables at the appropriate key.\n    \"\"\"\n    if row_keys is not None:\n      row_indices = self.index_by_key[row_keys]\n    else:\n      row_indices = range(self.size)\n    for i in row_indices:\n      row = self.get_row_by_index(i, column_name_map=column_name_map)\n      for key_col, table in table_by_foreign_key_col.items():\n        foreign_key = self[key_col][i]\n        foreign_row = table.get_row_by_key(foreign_key)\n        row.update(foreign_row)\n      yield row\n\n  def with_column_names(\n      self, column_name_map: Mapping[str, str]\n  ) -> 'RenamedTableView':\n    \"\"\"Returns a view of this table with mapped column names.\"\"\"\n    return RenamedTableView(self, column_name_map=column_name_map)\n\n  def make_filter_mask(\n      self,\n      mask: np.ndarray | None = None,\n      *,\n      apply_per_element: bool = False,\n      **predicate_by_col: FilterPredicate,\n  ) -> np.ndarray | None:\n    \"\"\"Returns a boolean array of rows to keep, or None if all can be kept.\n\n    Args:\n      mask: See `Table.filter`.\n      apply_per_element: See `Table.filter`.\n      **predicate_by_col: See `Table.filter`.\n\n    Returns:\n      Either a boolean NumPy array of length 
`(self.size,)` denoting which rows\n      should be kept according to the input mask and predicates, or None. None\n      implies there is no filtering required, and is used where possible\n      instead of an all-True array to save time and space.\n    \"\"\"\n    if mask is None:\n      if not predicate_by_col:\n        return None\n      else:\n        mask = np.ones((self.size,), dtype=bool)\n    else:\n      if mask.shape != (self.size,):\n        raise ValueError(\n            f'mask must have shape ({self.size},). Got: {mask.shape}.'\n        )\n      if mask.dtype != bool:\n        raise ValueError(f'mask must have dtype bool. Got: {mask.dtype}.')\n\n    for col, predicate in predicate_by_col.items():\n      if self[col].ndim > 1:\n        raise ValueError(\n            f'Cannot filter by column {col} with more than 1 dimension.'\n        )\n\n      callable_predicates = []\n      if not callable(predicate):\n        if isinstance(predicate, Iterable) and not isinstance(predicate, str):\n          target_vals = predicate\n        else:\n          target_vals = [predicate]\n        for target_val in target_vals:\n          callable_predicates.append(lambda x, target=target_val: x == target)\n      else:\n        callable_predicates.append(predicate)\n\n      field_mask = np.zeros_like(mask)\n      for callable_predicate in callable_predicates:\n        if not apply_per_element:\n          callable_predicate = typing.cast(\n              Callable[[np.ndarray], bool], callable_predicate\n          )\n          predicate_result = callable_predicate(self.get_column(col))\n        else:\n          predicate_result = np.array(\n              [callable_predicate(elem) for elem in self.get_column(col)]\n          )\n        np.logical_or(field_mask, predicate_result, out=field_mask)\n      np.logical_and(mask, field_mask, out=mask)  # Update in-place.\n    return mask\n\n  def filter(\n      self,\n      mask: np.ndarray | None = None,\n      *,\n      
apply_per_element: bool = False,\n      invert: bool = False,\n      **predicate_by_col: FilterPredicate,\n  ) -> Self:\n    \"\"\"Filters the table using mask and/or predicates and returns a new table.\n\n    Predicates can be either:\n      1. A constant value, e.g. `'CA'`. In this case then only rows that match\n        this value for the given column are retained.\n      2. A (non-string) iterable e.g. `('A', 'B')`. In this\n        case then rows are retained if they match any of the provided values for\n        the given column.\n      3. A boolean function e.g. `lambda b_fac: b_fac < 100.0`.\n        In this case then only rows that evaluate to `True` are retained. By\n        default this function's parameter is expected to be an array, unless\n        `apply_per_element=True`.\n\n    Args:\n      mask: An optional boolean NumPy array with length equal to the table size.\n        If provided then this will be combined with the other predicates so that\n        a row is included if it is masked-in *and* matches all the predicates.\n      apply_per_element: Whether to apply predicates to each element in the column\n        individually, or to pass the whole column array to the predicate.\n      invert: If True then the returned table will contain exactly those rows\n        that would be removed if this was `False`.\n      **predicate_by_col: A mapping from column name to a predicate. Filtered\n        columns must be 1D arrays. 
If multiple columns are provided as keyword\n        arguments then each predicate is applied and the results are combined\n        using a boolean AND operation, so a row is only retained if it passes\n        all predicates.\n\n    Returns:\n      A new table with the desired rows retained (or filtered out if\n      `invert=True`).\n\n    Raises:\n      ValueError: If mask is provided and is not a bool array with shape\n        `(self.size,)`.\n    \"\"\"\n    filter_mask = self.make_filter_mask(\n        mask, apply_per_element=apply_per_element, **predicate_by_col\n    )\n    if filter_mask is None:\n      # No mask or predicate was specified, so we can return early.\n      if not invert:\n        return self\n      else:\n        return self[np.array((), dtype=np.int64)]\n    else:\n      return self[~filter_mask if invert else filter_mask]\n\n  def _validate_keys_are_column_names(self, keys: Collection[str]) -> None:\n    \"\"\"Raises an error if any of the keys are not column names.\"\"\"\n    if mismatches := set(keys) - set(self.columns):\n      raise ValueError(f'Invalid column names: {sorted(mismatches)}.')\n\n  def copy_and_update(self, **new_column_by_column_name: np.ndarray) -> Self:\n    \"\"\"Returns a copy of this table with the specified changes applied.\n\n    Args:\n      **new_column_by_column_name: New values for the specified columns.\n\n    Raises:\n      ValueError: If a specified column name is not a column in this table.\n    \"\"\"\n    self._validate_keys_are_column_names(new_column_by_column_name)\n    return dataclasses.replace(self, **new_column_by_column_name)\n\n  def copy_and_remap(\n      self, **mapping_by_col: Mapping[TableEntry, TableEntry]\n  ) -> Self:\n    \"\"\"Returns a copy of the table with the specified columns remapped.\n\n    Args:\n      **mapping_by_col: Each kwarg key should be the name of one of this table's\n        columns, and each value should be a mapping. 
The values in the column\n        will be looked up in the mapping and replaced with the result if one is\n        found.\n\n    Raises:\n      ValueError: If a specified column name is not a column in this table.\n    \"\"\"\n    self._validate_keys_are_column_names(mapping_by_col)\n    if not self.size:\n      return self\n    remapped_cols = {}\n    for column_name, mapping in mapping_by_col.items():\n      col_arr = self.get_column(column_name)\n      if col_arr.dtype == object:\n        remapped = string_array.remap(col_arr, mapping)\n      else:\n        remapped = np.vectorize(lambda x: mapping.get(x, x))(col_arr)  # pylint: disable=cell-var-from-loop\n      remapped_cols[column_name] = remapped\n    return self.copy_and_update(**remapped_cols)\n\n\nclass RenamedTableView:\n  \"\"\"View of a table with renamed column names.\"\"\"\n\n  def __init__(self, table: Table, column_name_map: Mapping[str, str]):\n    self._table = table\n    self._column_name_map = column_name_map\n\n  def get_row_by_key(\n      self,\n      key: int,\n      column_name_map: Mapping[str, str] | None = None,\n  ) -> Mapping[str, Any]:\n    del column_name_map\n    return self._table.get_row_by_key(\n        key, column_name_map=self._column_name_map\n    )\n\n\n_DatabaseT = TypeVar('_DatabaseT', bound='Database')\n\n\nclass Database(abc.ABC):\n  \"\"\"Relational database base class.\"\"\"\n\n  @property\n  @abc.abstractmethod\n  def tables(self) -> Collection[str]:\n    \"\"\"The names of the tables in this database.\"\"\"\n\n  @abc.abstractmethod\n  def get_table(self, table_name: str) -> Table:\n    \"\"\"Gets the table with the given name.\"\"\"\n\n  @property\n  @abc.abstractmethod\n  def foreign_keys(self) -> Mapping[str, Collection[tuple[str, str]]]:\n    \"\"\"Describes the relationship between keys in the database.\n\n    Returns:\n      A map from table names to pairs of `(column_name, foreign_table_name)`\n      where `column_name` is a column containing foreign keys in the 
table named\n      by the key, and the `foreign_table_name` is the name of the table that\n      those foreign keys refer to.\n    \"\"\"\n\n  @abc.abstractmethod\n  def copy_and_update(\n      self: _DatabaseT,\n      **new_field_by_field_name: ...,\n  ) -> _DatabaseT:\n    \"\"\"Returns a copy of this database with the specified changes applied.\"\"\"\n\n\ndef table_dependency_order(db: Database) -> Iterable[str]:\n  \"\"\"Yields the names of the tables in the database in dependency order.\n\n  This order guarantees that a table appears after all other tables that\n  it refers to using foreign keys. Specifically A < B implies that A contains\n  no column that refers to B.key as a foreign key.\n\n  Args:\n    db: The database that defines the table names and foreign keys.\n  \"\"\"\n  connections: dict[str, set[str]] = {}\n  for table_name in db.tables:\n    connection_set = set()\n    for _, foreign_table in db.foreign_keys.get(table_name, ()):\n      connection_set.add(foreign_table)\n    connections[table_name] = connection_set\n  yield from graphlib.TopologicalSorter(connections).static_order()\n\n\ndef concat_databases(dbs: Sequence[_DatabaseT]) -> _DatabaseT:\n  \"\"\"Concatenates the tables across a sequence of databases.\n\n  Args:\n    dbs: A non-empty sequence of database instances of the same type.\n\n  Returns:\n    A new database containing the concatenated tables from the input databases.\n\n  Raises:\n    ValueError: If `dbs` is empty or `dbs` contains different Database\n      types.\n  \"\"\"\n  if not dbs:\n    raise ValueError('Need at least one value to concatenate.')\n  distinct_db_types = {type(db) for db in dbs}\n  if len(distinct_db_types) > 1:\n    raise ValueError(\n        f'All `dbs` must be of the same type, got: {distinct_db_types}'\n    )\n\n  first_db, *other_dbs = dbs\n  concatted_tables: dict[str, Table] = {}\n  key_offsets: dict[str, list[int]] = {}\n  for table_name in table_dependency_order(first_db):\n    first_table = 
first_db.get_table(table_name)\n    columns: dict[str, list[np.ndarray]] = {\n        column_name: [first_table.get_column(column_name)]\n        for column_name in first_table.columns\n    }\n    key_offsets[table_name] = [\n        first_table.key.max() + 1 if first_table.size else 0\n    ]\n\n    for prev_index, db in enumerate(other_dbs):\n      table = db.get_table(table_name)\n      for col_name in table.columns:\n        columns[col_name].append(table.get_column(col_name))\n      key_offset = key_offsets[table_name][prev_index]\n      offset_key = table.key + key_offset\n      columns['key'][-1] = offset_key\n      if table.size:\n        key_offsets[table_name].append(offset_key.max() + 1)\n      else:\n        key_offsets[table_name].append(key_offsets[table_name][prev_index])\n      for fkey_col_name, foreign_table_name in first_db.foreign_keys.get(\n          table_name, []\n      ):\n        fkey_columns = columns[fkey_col_name]\n        fkey_columns[-1] = (\n            fkey_columns[-1] + key_offsets[foreign_table_name][prev_index]\n        )\n\n    concatted_columns = {\n        column_name: np.concatenate(values, axis=-1)\n        for column_name, values in columns.items()\n    }\n    concatted_tables[table_name] = (type(first_table))(**concatted_columns)\n  return first_db.copy_and_update(**concatted_tables)\n"
  },
  {
    "path": "src/alphafold3/structure/test_utils.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Utilities for structure module testing.\"\"\"\n\nimport dataclasses\n\nfrom absl.testing import parameterized\nfrom alphafold3 import structure\nfrom alphafold3.common.testing import data\nimport numpy as np\nimport tree\n\n\nclass StructureTestCase(parameterized.TestCase):\n  \"\"\"Testing utilities for working with structure.Structure.\"\"\"\n\n  def assertAuthorNamingSchemeEqual(self, ans1, ans2):  # pylint: disable=invalid-name\n    \"\"\"Walks naming scheme, making sure all elements are equal.\"\"\"\n    if ans1 is None or ans2 is None:\n      self.assertIsNone(ans1)\n      self.assertIsNone(ans2)\n      return\n    flat_ans1 = dict(tree.flatten_with_path(dataclasses.asdict(ans1)))\n    flat_ans2 = dict(tree.flatten_with_path(dataclasses.asdict(ans2)))\n    for k, v in flat_ans1.items():\n      self.assertEqual(v, flat_ans2[k], msg=str(k))\n    for k, v in flat_ans2.items():\n      self.assertEqual(v, flat_ans1[k], msg=str(k))\n\n  def assertAllResiduesEqual(self, all_res1, all_res2):  # pylint: disable=invalid-name\n    \"\"\"Walks all residues, making sure alll elements are equal.\"\"\"\n    if all_res1 is None or all_res2 is None:\n      self.assertIsNone(all_res1)\n      self.assertIsNone(all_res2)\n      return\n    self.assertSameElements(all_res1.keys(), all_res2.keys())\n    for chain_id, chain_res in all_res1.items():\n      self.assertSequenceEqual(chain_res, all_res2[chain_id], msg=chain_id)\n\n  def 
assertBioassemblyDataEqual(self, data1, data2):  # pylint: disable=invalid-name\n    if data1 is None or data2 is None:\n      self.assertIsNone(data1)\n      self.assertIsNone(data2)\n      return\n    self.assertDictEqual(data1.to_mmcif_dict(), data2.to_mmcif_dict())\n\n  def assertChemicalComponentsDataEqual(  # pylint: disable=invalid-name\n      self,\n      data1,\n      data2,\n      allow_chem_comp_data_extension,\n  ):\n    \"\"\"Checks whether two ChemicalComponentData objects are considered equal.\"\"\"\n    if data1 is None or data2 is None:\n      self.assertIsNone(data1)\n      self.assertIsNone(data2)\n      return\n    if (not allow_chem_comp_data_extension) or (\n        data1.chem_comp.keys() ^ data2.chem_comp.keys()\n    ):\n      self.assertDictEqual(data1.chem_comp, data2.chem_comp)\n    else:\n      mismatching_values = []\n      for component_id in data1.chem_comp:\n        found = data1.chem_comp[component_id]\n        expected = data2.chem_comp[component_id]\n        if not found.extends(expected):\n          mismatching_values.append((component_id, expected, found))\n\n      if mismatching_values:\n        mismatch_err_msgs = '\\n'.join(\n            f'{component_id}: {expected} or its extension expected,'\n            f' but {found} found.'\n            for component_id, expected, found in mismatching_values\n        )\n        self.fail(\n            f'Mismatching values for `_chem_comp` table: {mismatch_err_msgs}',\n        )\n\n  def assertBondsEqual(self, bonds1, bonds2, atom_key1, atom_key2):  # pylint: disable=invalid-name\n    \"\"\"Checks whether two Bonds objects are considered equal.\"\"\"\n    # A None bonds table is functionally equivalent to an empty bonds table.\n    # NB: this can only ever be None in structure v1.\n    if bonds1 is None or not bonds1.size or bonds2 is None or not bonds2.size:\n      self.assertTrue(bonds1 is None or not bonds1.size, msg=f'{bonds1=}')\n      self.assertTrue(bonds2 is None or not 
bonds2.size, msg=f'{bonds2=}')\n      return\n\n    ptnr1_indices1, ptnr2_indices1 = bonds1.get_atom_indices(atom_key1)\n    ptnr1_indices2, ptnr2_indices2 = bonds2.get_atom_indices(atom_key2)\n    np.testing.assert_array_equal(ptnr1_indices1, ptnr1_indices2)\n    np.testing.assert_array_equal(ptnr2_indices1, ptnr2_indices2)\n    np.testing.assert_array_equal(bonds1.type, bonds2.type)\n    np.testing.assert_array_equal(bonds1.role, bonds2.role)\n\n  def assertStructuresEqual(  # pylint: disable=invalid-name\n      self,\n      struc1,\n      struc2,\n      *,\n      ignore_fields=None,\n      allow_chem_comp_data_extension=False,\n      atol=0,\n  ):\n    \"\"\"Checks whether two Structure objects could be considered equal.\n\n    Args:\n      struc1: First Structure object.\n      struc2: Second Structure object.\n      ignore_fields: Fields not taken into account during comparison.\n      allow_chem_comp_data_extension: Whether to allow data of `_chem_comp`\n        table to differ if `struc2` is missing some fields, but `struc1` has\n        specific values for them.\n      atol: Absolute tolerance for floating point comparisons (in\n        np.testing.assert_allclose).\n    \"\"\"\n    for field in sorted(structure.GLOBAL_FIELDS):\n      if ignore_fields and field in ignore_fields:\n        continue\n      if field == 'author_naming_scheme':\n        self.assertAuthorNamingSchemeEqual(struc1[field], struc2[field])\n      elif field == 'all_residues':\n        self.assertAllResiduesEqual(struc1[field], struc2[field])\n      elif field == 'bioassembly_data':\n        self.assertBioassemblyDataEqual(struc1[field], struc2[field])\n      elif field == 'chemical_components_data':\n        self.assertChemicalComponentsDataEqual(\n            struc1[field], struc2[field], allow_chem_comp_data_extension\n        )\n      elif field == 'bonds':\n        self.assertBondsEqual(\n            struc1.bonds, struc2.bonds, struc1.atom_key, struc2.atom_key\n        )\n      
else:\n        self.assertEqual(struc1[field], struc2[field], msg=field)\n\n    # The chain order within a structure is arbitrary so in order to\n    # directly compare arrays we first align struc1 to struc2 and check that\n    # the number of atoms doesn't change.\n    num_atoms = struc1.num_atoms\n    self.assertEqual(struc2.num_atoms, num_atoms)\n    struc1 = struc1.order_and_drop_atoms_to_match(struc2)\n    self.assertEqual(struc1.num_atoms, num_atoms)\n\n    for field in sorted(structure.ARRAY_FIELDS):\n      if field == 'atom_key':\n        # atom_key has no external meaning, so it doesn't matter whether it\n        # differs between two structures.\n        continue\n      if ignore_fields and field in ignore_fields:\n        continue\n      self.assertEqual(struc1[field] is None, struc2[field] is None, msg=field)\n\n      if np.issubdtype(struc1[field].dtype, np.inexact):\n        np.testing.assert_allclose(\n            struc1[field], struc2[field], err_msg=field, atol=atol\n        )\n      else:\n        np.testing.assert_array_equal(\n            struc1[field], struc2[field], err_msg=field\n        )\n"
  },
  {
    "path": "src/alphafold3/test_data/featurised_example.json",
    "content": "[\n  {\n    \"aatype\": \"46551530df4e79371352989100ae6af82ccd939009517b788173bdbb323ae40a\",\n    \"asym_id\": \"42c714885d17f6c0fcfebebd171b5ed7d7e77a56cf9c4983d9ff9ff90995bd1c\",\n    \"cleaned_struc\": \"<<structure>>\",\n    \"deletion_matrix\": \"54f980b5b3be8ce80cb6490c527e38d681deade50f239f2cb7d23cf9d0108c37\",\n    \"deletion_mean\": \"655a3ef0465a9f30fddf25f4dde0c19a05c6f9069b83961800c1944165955273\",\n    \"empty_output_struc\": \"<<structure>>\",\n    \"entity_id\": \"42c714885d17f6c0fcfebebd171b5ed7d7e77a56cf9c4983d9ff9ff90995bd1c\",\n    \"flat_output_layout\": \"<<atom-layout>>\",\n    \"frames_mask\": \"e8a48532fba32c318f7d809fae3ea0999baa01376b29d94ef3c27d82f12f6a90\",\n    \"is_dna\": \"1d83518b897b14e2943990eff655838246cc0207a7c95a5f3dfccc2e395f8bbf\",\n    \"is_ligand\": \"cfa4e080dc2885de94224db5075c2feb0805567d31e8898abdebaebc6646ce12\",\n    \"is_nonstandard_polymer_chain\": \"1d83518b897b14e2943990eff655838246cc0207a7c95a5f3dfccc2e395f8bbf\",\n    \"is_protein\": \"569b0e93b5f77c1a9d430b643f29e600c7db6f44ded72b96ab1dd25351d26075\",\n    \"is_rna\": \"1d83518b897b14e2943990eff655838246cc0207a7c95a5f3dfccc2e395f8bbf\",\n    \"is_water\": \"1d83518b897b14e2943990eff655838246cc0207a7c95a5f3dfccc2e395f8bbf\",\n    \"ligand_ligand_bonds\": \"<<None>>\",\n    \"msa\": \"871c93669d8a7dd046f8ba6a1ea7b9fc52e1a2e040c8d9bdc4ae73a77f95d3f7\",\n    \"msa_mask\": \"13a46a8a2c5305d2a07bb9587ad092d97749d2b2a2d10ad5d64474a4f0f4c803\",\n    \"num_alignments\": \"26b25d457597a7b0463f9620f666dd10aa2c4373a505967c7c8d70922a2d6ece\",\n    \"polymer_ligand_bonds\": \"<<None>>\",\n    \"pred_dense_atom_mask\": \"1e388e40167a4d31291903d74c98544868d0dc574706cdfd259ddd65f56d2993\",\n    \"profile\": \"6ec7da33d5f9801357ca6c82725416ef59025c7a8810bfd67fed2262845b480b\",\n    \"queries_to_keys:gather_idxs\": \"e0a2fd867fbae573b5613a98ee037eeb575cc5aa3285db2fe5158cda0e8c49cd\",\n    \"queries_to_keys:gather_mask\": 
\"7ddcbfda2904f013d9ab73c55517ac933ecb3dbfbfab9bb351ee43b5fd66e54e\",\n    \"queries_to_keys:input_shape\": \"cf801b14d3da833c486e3d73e355c3c2068523012b42c2b17decc45dbd8b9972\",\n    \"queries_to_token_atoms:gather_idxs\": \"3c2d0028564167c93b2f33e877974d45756c1e2e8934270c024fc5f1e85fcf14\",\n    \"queries_to_token_atoms:gather_mask\": \"1e388e40167a4d31291903d74c98544868d0dc574706cdfd259ddd65f56d2993\",\n    \"queries_to_token_atoms:input_shape\": \"cf801b14d3da833c486e3d73e355c3c2068523012b42c2b17decc45dbd8b9972\",\n    \"ref_atom_name_chars\": \"043f3242ff4dff04fd36699ccefdff718c57c325f72c71f33f4c4774e75a64dc\",\n    \"ref_charge\": \"27898ee238963105942db19f27a980c1fe4f7aeb396c1e5ea4e82da3876deef4\",\n    \"ref_element\": \"cc437747adeea094daf8a0e551be02f406c7e7d9b0a9328a84a59d907c5492b5\",\n    \"ref_mask\": \"1e388e40167a4d31291903d74c98544868d0dc574706cdfd259ddd65f56d2993\",\n    \"ref_space_uid\": \"97afd7d9d3ba835731457ef090ba4939d707bb2a270d48fde56369bde8e58e9f\",\n    \"residue_center_index\": \"dfef3704f73a7ee9a3be86b74e25ecd43e056c76574bc9bb65b6b446eeed87a7\",\n    \"residue_index\": \"6bf4ea803d0fcd31446e07f6ba9e012f794ced1fe5ad60b7181f66bb92601638\",\n    \"seq_length\": \"5a667734987b65ef5c4d07bf176148504bcf8378a5a1a0e23a7fa2c1121cc143\",\n    \"seq_mask\": \"a795c048f28bc4307f8599dc5140fe6e971bce6a34a0349b6c18d6cbb197f75f\",\n    \"sym_id\": \"5f170600b904a3464c72817993120957c1ce2eec8c2421af02d4912b5e8d8372\",\n    \"template_aatype\": \"6c5c3e7a5e23f064f1e8791f61bde8fb59ccf837095144b29e6c8e1607081398\",\n    \"template_atom_mask\": \"8a282b7476e13f6de5afbb52c14ea7baa3434281ed77b542bb790287e8c92e82\",\n    \"template_atom_positions\": \"b032ac0c813748a81b8d50ce94487c66510a177ad25e84581c7ea5f4b524987f\",\n    \"token_atoms_layout\": \"<<atom-layout>>\",\n    \"token_atoms_to_polymer_ligand_bonds:gather_idxs\": \"a0ee989ed2a0a2e3626520afa4032e06144865c8c8f6357293c9f4cd2069eaf2\",\n    \"token_atoms_to_polymer_ligand_bonds:gather_mask\": 
\"d13d4a8b3b8add19b5970157f09d00c12cbda4fed4d74d8493156523f7069b66\",\n    \"token_atoms_to_polymer_ligand_bonds:input_shape\": \"6ed5c8b9711af5b9c7c3d98ba048bed4dfe5974be758f1a632abd746b8278ed2\",\n    \"token_atoms_to_pseudo_beta:gather_idxs\": \"3fd8de4dd02450c6e249f33de9c6573694f7991e6a36528d6f32b6c6334a4d4f\",\n    \"token_atoms_to_pseudo_beta:gather_mask\": \"a795c048f28bc4307f8599dc5140fe6e971bce6a34a0349b6c18d6cbb197f75f\",\n    \"token_atoms_to_pseudo_beta:input_shape\": \"6ed5c8b9711af5b9c7c3d98ba048bed4dfe5974be758f1a632abd746b8278ed2\",\n    \"token_atoms_to_queries:gather_idxs\": \"50a1708678bb3d848be6fb49816196b13fcac36891817dac585f4a7556a8310e\",\n    \"token_atoms_to_queries:gather_mask\": \"3f4ac4f311cea0c7f6b8464e225815b791a767c9a8d15f9c7fb488c49f674fa9\",\n    \"token_atoms_to_queries:input_shape\": \"6ed5c8b9711af5b9c7c3d98ba048bed4dfe5974be758f1a632abd746b8278ed2\",\n    \"token_index\": \"77627a5d3856b90a27ae1f5bf5aa14754743c03c00a97bab68f4e7961a405454\",\n    \"tokens_to_keys:gather_idxs\": \"bc16a2a2b81bdbb3fb3ff180d984704b201866a7cdc373fb345a9be417aa246e\",\n    \"tokens_to_keys:gather_mask\": \"7ddcbfda2904f013d9ab73c55517ac933ecb3dbfbfab9bb351ee43b5fd66e54e\",\n    \"tokens_to_keys:input_shape\": \"5545412ee9a21a04712910d53fc1447c73ff94a29ddd1268131b4ed30d1dbe07\",\n    \"tokens_to_ligand_ligand_bonds:gather_idxs\": \"bac3003591bd8ef44d85b82cd4d23191d48496c1992e61d3fca2a37e6ddd34ea\",\n    \"tokens_to_ligand_ligand_bonds:gather_mask\": \"4d33ec9784aaf54079b4445118c1be26b4a5555e1d6034ccc4182defd86f2068\",\n    \"tokens_to_ligand_ligand_bonds:input_shape\": \"5545412ee9a21a04712910d53fc1447c73ff94a29ddd1268131b4ed30d1dbe07\",\n    \"tokens_to_polymer_ligand_bonds:gather_idxs\": \"a0ee989ed2a0a2e3626520afa4032e06144865c8c8f6357293c9f4cd2069eaf2\",\n    \"tokens_to_polymer_ligand_bonds:gather_mask\": \"d13d4a8b3b8add19b5970157f09d00c12cbda4fed4d74d8493156523f7069b66\",\n    \"tokens_to_polymer_ligand_bonds:input_shape\": 
\"5545412ee9a21a04712910d53fc1447c73ff94a29ddd1268131b4ed30d1dbe07\",\n    \"tokens_to_queries:gather_idxs\": \"f82b61cc7f007a744fc9186107647ff333b598642a681b046d61aef4994931e1\",\n    \"tokens_to_queries:gather_mask\": \"3f4ac4f311cea0c7f6b8464e225815b791a767c9a8d15f9c7fb488c49f674fa9\",\n    \"tokens_to_queries:input_shape\": \"5545412ee9a21a04712910d53fc1447c73ff94a29ddd1268131b4ed30d1dbe07\"\n  }\n]"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/bfd-first_non_consensus_sequences__subsampled_1000.fasta",
    "content": ">SRR5689334_7619591\nTFRYLCRQMERRLDGRPTLVVIDEAWTKIRKQPEWLEESLRTLRKKNCAVVLATQSLSEVVESPIASVVFESCQTRLLLPNPEARTPAIRALYTQRLGLTEPQVDALASVAPKRWYMYVGGGRTRLFTLDLGPVALAFVGASGRVDVAQIDALHRR\n>SRR5262249_54877602\nWRLEHPAVREAEVVKRLVNGREAVTAVVVSDSGVSPAELCAHLGRTLPAWMIPRQFEFVGELPRTTSGKVDYPRLRSSPSHLVGEGGSRSESGEGYFMAGTPEAILAEIWSAVLGRPADPDAGFFDQGGDSLGVLQVVAGAHARGVTVPPELVAEGRSLRDIAAVLPTVDHSVAPGALTGSELEYDTAAVLDGWPSPSARRRPAGPAX\n>SRR3546814_5789022\nIVCLFYVSSCCFLFVYVFFFKQKTAYEMRISDWSSDVCSSDLTPAQIDRSFHRNTAHQVTRPAATHRRNTLAANPELLAGLRALGDFQLHATVEGRDLKLTAQGLINETDRHFAEQMLEIGRAHVX\n>B9TJ46_RICCO\nRGDRGDGDRLLLGDRARAAGRGDRAHLHCPADRARPCRDLPEGEDRRALDPRLAARAGRSRHHPGRPAGRAAPARFGARHGGGARLGGVLRSQPRHRAPPGAAGRADRDRLLPELVHPRPVRAAGALAAGDSGGGAMAAGRARRRAGDHVAAAAFLGLCAGGSAGAAHGRIYRLCLGSDHGLAVLPRAAYAGYHRRHLADRRGMLDGGAQSARHRRARSGARTVMIAIRTATPDDVPLILDLVRELAVYEREPDAVVATEAMLHDALFARRVAESLIAELDGRPVGFALFFHNFSTWTGKPGIYLEDLYVTPGARGAGAGKALLRHLAGIALDRDCGRFEWAVLDWNTPAIDFYRAMGAQAMAEWTVQRVTGDALVALAGR\n>SRR3954452_1678131\nPEAARARAAARAPAPRPPRWSLRRPGSTRRRILAGSRRVPELRELEAESLRRRLVACGVGESELDPVGAARQRPLLDAQKRQDVLALLHLQRRLAGAAEGAPAWRTAEDCRLQRAGLRRSELEDQRPTAGVTLDLAGEARCGGVGGSRRRRGDRFRRWRGCRRGGARPCAGAGAGAG\n>SRR5450756_2573138\nLHRVDRRQRQMCIRDRAYTAGLLLVCVSLIRLSSVRSEYSPGLEDAPVWNSDSPVGSKPGPAKFQPPRSRICQVVVASSPMIAENDRGTRLMSMPACAASAWYAATSCWKNVTPVTX\n>SRR6266446_6012191\nVSDLPLDSYRALKLPRCRGVGVGRGVGVGLGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGLGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGLGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGVGLGVGVGRGVGVGRGVGVGRGVGVGRGVGVGRGVGRGVGRGVGVGRGVGRGVGRGRGVGSGGLIEARIAPLFFASLSNQTSPLASCRMIACFNLX\n>ERR1712048_306589\nVARMTISRVALAFGCVLTCAHAADPTSPAGNVEAVCEYVSNGLENYGERLLRFPLPPSCQKYQGIGEEVLFKFGLQSQSCYQALSGPLCALQFSEYEASSTCKSTLDLFTTLIETCSNKNVMAATYSDCVSYDPNTRTISNPEAFCKSSFLRVDKGESPEGTSAGFEKKTFGQSEIMDCKRIAENFNACQIVGVGLLGYSNRFCMGKGFPAYCQKYPTVVRDGTFTRICKNLVIPYLLESNRRLGTKREINHCDGIYENYLMFLKSRKDAYSQKAEAAKESLESMKNSSEMFSSFKRVAQALSQDNDSLERDSTEVLNQFHQMSSQNMAFDAQILTEFQNLGASLAAAEQAATVIEYP
EMTENAEENIKIFAKESPSIESLDQAITKSSVSVKNLEALIAQGGHVSYSQAYGFYPIELASIEELRTRIKKMSESLKPFTTTYSEEVLALEEPPQPGVDASFLNAAQTFGKLNDIYGEQMALLTKLQRYGSQTGNVFTAASRSFKX\n>SRR5580765_3802522\nGLGLDDAGRIADRRRSGRHRLQHHRVRADPGVVADGEAAQHLRVGADDDAAAERRMALGAAGERGAAERHPLVDGAVVTDLRGFAHDHAHAVIDEDAAADLRPRMDLDAGDETGQVRDPARHPVEAVTAPPGRLAVQDDRMQAGVTRQHLPRRPGGRIAFTDADDVFAQALEHTIFARVTRSASLSGSLFHCSGDAAQDLDLLHGERGPIGQPVQPRHQFPGRGRVEKADRCQRLLPVCDQAAHRDRIGQDAGVGPRLDRIAAQRLAPVIGEELHRLSEVERAVARIGRDREAGVAGVEVVVRQAEALRAEHERDRAAAGRQFAEDRARGEGRRAEVTRRHRRRPDPGHAVERVAESRDDAGALQHVGPSRRHQHELGKAHHLDRPRCRADVAGVAGADEDEAGRIGGHLSRPLKLRLSILQPRPGGPPPARARLQTILPMSQALHPMLNIAVKAARAAGAIINRASLDLDRLQVSAKSTNDFVTEVDHAAEAAVIDVLLGAYPGHGILAEESGSTRGAKDSDYLWIIDPLDGTTNFIHGLPTYAVSIGLSFRGQMQQAVVYDPARNDLFYATKGRGAFLNDKRLRVSKRTRMAEALIGTGFPFRQGDDLTHYLKVLEMVMKSCAGVRRPGAAALDLCYVAAGWYDGFFETGLSPWDVAAGSLIVTEAGGLVGNFTGEADFLYRREVVAGCPKVYGQLVQVLSPYSTLSGSAX\n>SRR3989441_2692536\nAASRDALLATQRTRKRVAVEHARRSSFLAPRVAGVDIDRLDDPDKWGKIPPLTKDELRALGTDEFYSGFCIQPPSAAVEFWRSGGATGRPLFYPRSAEDLPYCLLGFRRIWECIGVGAGDVVHDSFPLGIHPIGQMVARSAQEIGAGVVWAGAGTPPPSALQLELIATLRPTVWAGMSSYALHPANVAEAQGVDRAASGGGPVVCPAEQLPGARRAKLERAWGARVYDTFGMTEGSMMAAERDGVDGMRLWADLFLVEVVDEVTGKPVAEGQPGALVMTPLWSHTATPFLRWLSGDIVTLRWPEPDADPFSVFPVLKHAHRTSGFFKIRGVNVNHTELEDFMFRQPGVLDFRAELVTHHDREVLRLLIEVVRGADPAGLYFALLTKKADPAHEVTVLERTRADATFGFGVVFSDATLDNFIEADRPTGEAITRAFAHWDDIDIHYQGQVLTSTGHGFSGMSRQVLLDILHTRCAALGVTLRFQTDVTDLEPYRSADLVLAADGVNSLVRSQYAAHFQPHVDARGNRFVWLGTTFPFRAFTFIFKDSPHGLWRVPAYRYDARYSTFIVETTEATWRRAGLDQASEDDTVAFTERFFARELEGHRLLKNRSLWRSFPTIRNAHWHWDNVVLVGDAAHTAHFSIGSGTKLAMEDAIALAAALQRHRDVPSALDAYEEERRPQVESIQRAAQVSLEWFEQTERYHGRLEPLQFAFSLLTRSLRVTHDNLKVRDAKFVETVDRWFAAKAADQSKVPVAAQPMPPPMFTPLRLRELVLANRVVVSPMCQYSADDGTPNDWHVVNLGSRAVGGAGLVIAEMTDVSREARISPGCTGMYKPEHVTAWKRVVDFVHAHSPARIALQLAHAGRKGSTRRLWEGIDEPLAEGNWPLISASAIPYFPHSQIPKAMDRADMERVQADFVKAASMAEAAGFDMLELHMAHGYLLASFVSPLTNTRTDAYGGTLDNRLCYPLAVFDAVRAVWPAAPPISGKISATHSADGGVTPEESVEFARRLKAHGCDLVTVSTGQTVAHQHPAYGRLYQTPFSDRIRHEAGIATMTVGAVASYADVNSILAAGRADLCALARGHLYDPYWTRHAAW
EQGFEVAWPDQYVSVKGFTPRLRX\n>ERR1700679_3575755\nARRESGSRGRWRPEHQSATCQHRIRPRCAGAHVRRSAREAPHKVSMVSWDFLNWLEIYGSELLVKYDIGLESSGVLHRRFHPECRFELQLSWMSGSERSRQPKIMPRQIGEHWPTFQDLLSKX\n>ERR1700756_3832034\nKLVQLLKASSYLSSILSSSSVVSFSGSNRARRPESMDWNPIPLTSGYKASFPSPPRVHWATLFAAIAGSEGLVLWLVPQPYRDFFVNLAIAAWAIYLCLWIRKIDIRSLSLYWALASFATGFLFSWLLWIVVIFEIREELLEHYNRREPIGLRLNLVMTLLFSFVYFQYHLNKIAKEKNQQRSIELVGAGRAFLQX\n>SRR6267378_1761704\nLARPGAGRLGARDVRARGGTAARRASARRHRGVARRAARARPAPGGRRRRRGAPARKPAARAPARPADACALPFGPPGRRAQDLPRGSPAAGRRARHRAGPRAAAALRPDPPAGADPRDDGRRRAAGHRRRLGGGLGRHPRRAPRAGARHRRHVERRQRRAPAGARPAGGVPRADVRRPARTCGRPREGRAVHRRHPRGRPALRRAAHDLQPRLRAAAGAPLPRGPAPAPAHGGRAATADRDDALRPRARARLRRGGRAVRRRLLHLARSRARKVPTSLRGGRRARDPAPERVRRRAARAAACDPEDPRRGRPRARAGVRELRRQRGRPHRVPRGDGPRRRPSRHARRAPAAKPLPLPRLRAPRLEPACVPAPAVVGRAGRLSLVGGAAGGGPRGAGVLEEARRGAELARPRRVRVAAADTARGRVARGSRAVTTVTEAVRTPYKGLSPFDDTELDALLFFGRERETKIVVANALASRLTVLYGPSGVGKSSLLRAGVVHSMRKLTELDPIAVGYYSSWAGDPLVGIEEAARGALTETFGGDPGEAAGDLADRLDAWTAALGCE\n>GraSoiStandDraft_16_1057320.scaffolds.fasta_scaffold7416948_1\nMSNKYGDGGMKRDNTSLTMIDPTMIDPIGTQQMGVDTGSFQLNLAGDTPAYTPGKGVSWMKRAGMNIGEAFGGVGSKLSNMSAGSKMGIMSGVGGILQGIIGGGARRARQRDAKTEYTKQRKAYAALDARNLSENIKNPYENMENVYEDMTVNQQQAQFEAQQGAQSRANIMQNLQGAAGSSGIGALAQAMANQSQLATQRAGASIGMQESRNQALAARGADTVQQLERRGAFEAELHKVRGAEKARDLEWQKQEMALGMAMQEKAEADRARQQATNALVGGIGTIAGSVLTGGASSVLGGLVKGDNX\n>SRR5450631_843885\nPRQRARDRPAGPPSDRRQPRGAPHANRVRAVASPGDEPGPRADPRLSAANRPRLGLRGRAGQSADLYRSAPPQARARTKPSTLDRHRARRGLPLSSRRLARKDDIVLLQARALMKRPVVPVVLSPPRRSLIDW\n>SRR5690349_11316732\nDHRRADAWRRGLCRELWRYRLRAGRRHGARLARKRFDARRVDGEQGLRGAGRGAASTREQMNELLARLAALRRNKTAVNAATATVIALAMALLAMLAVDRISFFTSADRFVRDWEVAYQSTPEDQDPNILILAVNEQTMQNFPYRSPLDRGFLANLLT\n>SRR4029077_5045757\nXKTKDITGGLPRVAELFESRKPKEHAVIAEIDGTVSFGKDTKGKRKVLVTPDRGDAKEYLISKGKHLAVREGDKIRAGEPLMDGAANPHDILKVLGEKALAKYLVDEVQEVYRLQGVKINDKHIETIVRQMLRRIRVIDVGDTGFLVDEHVEKYLFEEENERVMGKGAKPAQGEPLLLGITKASLSTESFISASSFQETTKVLTEAAVQGKVDYLRGLKENVIMGRLIPAGTGLGAYKRLSVHVEDGGAQDLPAPPMAPAAAAAAPRTCLQLRWPLRPPRRRRFPWRSSA
HGTPSACNGANVGSLRARRX\n>SRR6266404_2839436\nXMDRRSRAPWAHRQELRAAHTDSRAARPGPHPPPATARTHRARFAGERHEAFGVAVVATEAREAPGPDATAQELAELIGNSSGLSGRAGCHNVQSRTLVCKPQMKMSGFSKVEMSALPPGGRDRGDGDVDHGGTGALGGADAACRAAPDTTAGRRTAGAECTPGPAARSALCRRRRRGTRVAP\n>SRR5262245_52145018\nESYGIFHALSGASSGGIADFMYESALLNPALDDCGAVSCDEVTVRRRVALLLKGFRGYFDFLKNDSEEAAIFEVVRRFYEEIKNRKIEALLDVGKDLKALKAVRKILKNEDIRSLINTEILELFELENVPSLPKNLRRLVNAVKEGAALGKTNI\n>SRR5688500_19911985\nPTPHLLTLALIARSPTALSTLPLHDALPISARVVEPDQRHTNPERQVHQLDDLFGVRRAERAAKYRKILRKDADGAAVDARMARDRKSTRLNSSHLVISYAVFCLKKKNKTSE\n>SRR6266576_2342774\nXMQRKNARVDPDGKLPKEFPLTSHPNGQYSKKHAQKPFYFGRIADGWRAALERFNHDWPYILADQVPPPMGTDPTTVEYVARMFLARSLKRLERGQLSGGSFVDMRVAVGIAATSLRQAKKVRHLKPSDFAELREDLSFRWEKQGEGETARWAKREQRIGVAALKRR\n>SRR5438552_10607511\nFLSLMCLRLLLFFSFILLPPPRSTLFPYTTLFRSVDLPDAGLPHDPRGVPLVDPPDGHHGDSTGRLRHHRRDDRHARLRRRGDRSEEHTSELQSPDHLVCRLLLEKKNRNIQKGKHE\n>SRR3954454_14771217\nRRGAARGHRPRARHHASDHAPHLRALLHLRRRRAGRRAGPGDRVGARGPHERPPDRPLPDRHDDLHLGAAGMTGPARRTLVAAAACAALAAGCGGGKDTHVVHTTTTRVEVLKGIGSAKGAFDPRAIYAKEAPGVVTIISLFAGGSITDLLGGGGGSGGQTGLGSSIVLDGKGDILTNAHVVTT\n>SRR6185503_6756615\nXMVFIDPIQAKHERLTLSQGNIKTNPNPFLIRGKARRHKHVRQCCRNRVANLSVDRAVVVIDRMTASHSSTPRKESTILLRKAACLQFPAAGNLAAYFFGLQPGFLQNLPIIERFCPGRREWNRELRE\n>SRR5581483_2541413\nAGPAHRRALQADAALRGLRARRSEQGRLAGSRRAGDDADEDRLRLVGGDREALDARDDRCGRRRRPAALARGRILRAARRRQARRRLRRLGHDEAPAVDPSRRDALRHQREPRPRPHRHPLPRGPLNLNAVAAARRTSNVELLWDLVFVFAVTQISSLMTGDLTWPGLGRALLVMALVWWAWSAFVWTANADDPNSGIVRAVLLLATVLIFITALALPHAFAAGAVLFAISYAIVRLLHLALYMDLWRRHLATFSAIAGFAVTVLAGMGLLVAGAFAGGLWLIGLWAVAAAIDYAGPGLLTRRRLVALQAVAVEHFAERYSLFVIICLGESVVAVGVGAAARGLDATVIAGATLMLLITIALWWAYFDRLAAAAEDGLRASTAPVLAASDAYSYIHLVLVAGIIVFAAGARIAVGRIDAPLPLAASLAFGGGIALYLLGVVAFRLRITQRLGVATVAGAAVAAVVAIAGVNAPAWVEAVVLLVVLAAVQLLERRSAWRX\n>SRR5688572_11341527\nAAEASVGEVTCAVREARDAAARFVGIPLTLSTRTAAIEMLQRLMARDAGRARWVCFLNSHSFNIATLDGQCREALNGAYAVFPDGCAMQVAARLCGIRIPENLPGTDLVPALLESCSGRCFLIGDRPEWIERAVCELERRFPTWSVVGFAPGYFDSEEGARRVVDRVNGAKPDLLLIGMGSPLQE\n>SRR6476661_7197889\nSDIRTCSKAAANSPG
GASLATRLAVAGGGGGGGGLGTDAKSPGTILGGAGGSGGGPGGPGGPDAHADLGGQPGQQGNQASGGAAGANSAESPATAGQLGDGGYGGTAPSGGGGGGGGGLFGGGGGGAGTTTIVDPQKLIIATAGGGGGGGGSSGVPPGASG\n>SRR5690606_8821431\nXIGEDTAEMATTTKEAVVATHIFSHYTARPDERSEAEPLQRLMHYPAMRLIPILILCALSGCSLFGADFDDLDPGTFRMKADGKEMSGQATYYPERDLASQEPLVFLESDEGDFMFIRSEAFLNAISGQSVTPRASYRPLTGGVFTRRSGRVEX\n>ERR1035437_2281458\nIDEEYGTGPGGLSGNEDAGQMSAWLVLSMMGFYPVCPGKPEYVIGTPAFDEVQIKTGIKAKPFIIKAIHNSSKIQEFKSVTLNGLPLEGSIIQQIGRASCRERVXX\n>SRR6266478_5987559\nGGETAPGWSQFKFCRSSRTVIGWDHTGPRGAAARWGWTDPGAKGPPSTPKPPVYYVGCSSLNSAPQIGGAVSYRGGPIDRRRVLFRYFAMIAGLNVPTKLSNGGSRHGRRCLAEQGGRILGEGTCDQRSTTCSASSRAGAQLSQVCX\n>JI10StandDraft_1071094.scaffolds.fasta_scaffold2749928_1\nMILVSGLPATGKTTFSEWLSSEICIPLLSRDRVLEKYVEIAKVHCEYEEQRGNVADNIPAVFLGHSIPALLFWFFCEEIMKSSSALIIETVFTNQMKETIGNLIEKYKYQTVNVHLDASVEIKRHRINERSPNKKISLENLKKAHESEKIKDAKNFRYGNCIIYVDTTDFSMVSYKDISEQIRQFILRNVX\n>SRR3989344_2742104\nRSTFGPRFNIATKQDEREQGGRRFPERMIDVEKEKADRTIEISRRSAENHQNIHVGHANTKGGESVTIEWPSNNKLNRGGQHPVNIVQIQTPNFMHMFQIKHVNEHIINNDRGRNDEGKENAATSLFDLLHLFLLFFLKCPAFLLRPDQIVTQLIDELINFLKRDHRFVKLESHLLGAITSARLNHPRLLPHQLINQDRAGGAMHALNFKYEFGHCVX\n>ERR1700722_7849674\nSTRAALTHWAQCLAFLSPPSVYQVSSNSAGRSSSNPCSMARPWSSLSRWQALRSEGAVSCDRFARSTIRVRKRIAGGHNGVFARSPRSAAIGPSPKCRTPRLRSRTARQQLIGRIRMSRFYMIGGGLLASAAIAGLHAGVAQAADDEFMKMAKDYIAQASAPVTTWDGPTTGPKAQGKKVVIYVSADQKNGGASGVGDGVPEAAKAIGWDFRILDGQGSVPARSSALTQAIALKPDGIILGTIDAAEQAPIVEQAIAAGIKVVGWHAGPGPGKIEAVPGVFTNITTDPNEVAKASGLYAVVDSGGTAGVILFTDSIYAIATAKTNAEKAAVEGCTGCKVLSIEDTPIGDLSNRMGQLTTSLLAKYGKAWTYSIGVNDLYFDFAAPSLQSAGVDPATGYPRNIAAGDGSVPAFQRIREKQYQIATVAEPLHLHGWQCIDEMNRALAGQPPSGYVAHVHLFIKANIDKDGGAQNIFDPDNDYKGHYKKIWGGMX\n>GraSoiStandDraft_35_1057300.scaffolds.fasta_scaffold1321871_1\nITAQTGSFAGIVHVATEAGGLETGQKISIGREVSASHDGIWINRFNYWFTTADFRVGDATNYIQVTGSGGNFGNDTRIKMDTFTLEAGNLDINSTDETIRLGSVTDFAKDGSAKGILMGKESSGNYDFFVGKEDGNYIHWDDSDNSLKVVGTIEIGSAGSFTPDTATQNQLAALNATTGSLSSETGSLQNATASLYTSASAQYLTGSILRQDSGSMATQVTLANDGMTLNQADGTNLASYGSTIRIGKSGEGRVEITDTALDMYDGAGSPVSRVNLNSSGQLTLGKSSDNRVQITDTSFKLYEG
SNERINITSTGVQILEDGNNFTEVSASGLSIHAGGQPKAYFTDKWTTLSNDARSQKENSVQIWNGGGIGIYRDANNYASMSADGMKLYQGGSHVATFGQDVYLGEVGSSKRNIFIDADAGIKIRNNTTTIAEFGEDAIIGEVGSNKRNILIDADDGISIRDNTTVKAKFDTDVILGEVGSSKRNILIDADDGISIRDNTTVKAKFDTDIVLGEVGSSKRNILIDA\n>SRR5271165_1503329\nAPRSPGTTSSWTGCLATPPGRCSSASFARYPGRVGIEPATSPEGEEQATLAEPAASSRKLERSSGRLSDLPSGESTGSRITSVITPRETLHLQEINRTRIFTVMVVALSAFVLATLTVIGGDPMAKRVFAFALLAIASSCGWLRWELRRDEGYTVERATSVAYISIFCAFTGIWFFGVFSPAPMILPFGIAFFSVGQSQRAVFGTYITCAILQAGLMLAVLGGVLPDQGLIRSSGLAPLEQ\n>SRR5258708_2540147\nLQVPGHALPHAGVGAQPVEQKQRRPPVGLGRPPLQPLQTHARAFDPTLSHERIVWEAGRRNAPQWPATTGSPAPWAGAGARCRRLMARQLAAPIASATTGTSSVGRIASMNALANTSCAIRAICSATWGGRPARWPAAELLDAPTSRPLLPALLKPSMKRWRAAAGTVLGSWAAYWMAWLWRVTPSWFCSPPPVIAPPIPPP\n>A0A0R1K2P3_9LACO\nMLRERFDKGEKKMSLRVLLVCGTGASSSFMAVSMRKAVQQLGLDYKIQARSESELENYLDEVDVIMVGPHLSFMEEEIKKSIGGRKIKVILMNPAYYAVLDGKKALDHLQSELDYKEEDSNK\n>A0A2A4RMB9_9BACT\nMNPDLKVYDTQIMIDGKTENIRTGMSCKATILIEDHEDTLFVPLQAVVGKAGETVVYVVNGKTSEARVVETGLDNNAMVHIISGINAGDKVLLTPPLGDDLFSASSKPKDAQAKGKPKGERQGKPQRGSSSQGMPKGKRP\n>ERR1719320_184571\nQSCLTSLHTNHSYTPGITNSWIMEEALLRKKAKKLRLFTFWVENHAESSSPWLRRALARADSGGKRLLADLERFLEEVEKTGGRRDGTVLCNSEMTGGNDISLIYPWLHISSSLVTINTWVRREESRDIEAAGGSLSSYPCYGSLERHEYLRSSSLRKRKVVQGTYSIVESVVPSQEVLPAGEELCILLGFRTTDDNCVDTVEAETERSGEARTWREWTGIGTLYQNMTQEDSVEVIKVEFMESHIPDHAAVFHYLVLMFLQVTSHRGKLGVLDAVARFRVRNMSGYVTVYSNLSDVTVDDRADDCLGDNLKTLQHSKQEAKKMFFKQEIIQVEQSGRKMEEX\n>SRR5215204_6862387\nGIFFFFFIFFVVEKKWNFFFFFFSSRRRHTRSLCDWSSDVCSSDLRHPNSRRRRGKGGPDQSRTRSRAGCRFRALPRCHGLPHRAGSVGRRRAHGLRRCWRPTPSRLRFLLLHQASGEAAKRGMLALLEICTEVPRSSVLRSWAREERVGASFGVSPPPTKGARWTIRKGKX\n>ERR1719195_1908659\nRRRTRMLIGEVQIQEWRLAVPSLPTCRLVVVPQSPLADQPVPLPLAARPKRSPRRRPPNQSLTPTLTWAWDFSTKQLKKPLKLFHPNFSTPLLVCLLGSGLQNCILDDSWVEIDLFLHSLKKK\n>ERR1719313_113703\nRRAGVRFQRRRALPQQALLLCTLAVVAVVAPYMWESAQRGAASLEYSNAQVSSGGRSLLSAITPHEDSAPCCSTACCKASDGRTDRDSFCAKRLESNGALNLTGTCMKRSTVLKDDQWGPSVALGLRATNASSGMLYCYSHLDCPVGHECKTAVTIQTNVNCSTNSDCSADRVACLTNTLNCTEPKCEGGTLSESGVRTTCRVQSPDSWGVCRVFDVDTEPTCDVSKGGINPRDLFSCTQKRQGALILHLIGIY
WMFNALAIVCDDYFVAALEELVERWGISEDVAGATFMAAGGSAPELFTSIVGVFLAQNDVGFGTIVGSAVFNVLLVIGACSVAAGKVLELTWFPLFR\n>ERR1719245_442272\nFSLTLRAHLPSTIAAEHTAVSPSSLRVPDSPGSPPGSNKESPSKARKASLQGAGITSKLPLKQLADFAVTLSSPDEKSGGKSFGNIAKPPTPKASSPSESTPFLPAPAPADPSMPLSPTDQLKLRRKRLVHYKSNAARNNNRSDPDSPHNQLLDLESGGGAGVGGFHQRRGSGHSLPGRLLKRTNQMKRRESQALLEQIRKRGSR\n>ERR1712194_41197\nHGDAPEHMAIREAVMRTNMDTVHGEMKGSDGDHVLFSPKALLESLGEMGQGISAYVVDAHKKLLVPYVVLEFVSGIPLEIAPLSLGGSLPDEIWPKLGHVCALDILLNNMDRLPLPIFPTLGNLNNIMVQDSGRRAVAIDQQVNTITDDIGLMVYLEKVRTFVRDVARLAGEDSAETDDILGHMRDSLKTRAQTELTESNARLVLQGMWETLKHIAKAWESGDLKAAIDASVLAAGESLVSGVIEKEWSFLEDGVLAPPASCDHGPYQGVVEASAAQLRVVACEISTSVRSAGAFQLGASANGSTLQGTSSARQLADLTSSFVKX\n>SRR4051812_43875519\nAHKKGSFDEARQLYKQSEQSARAALDLARSYPPAHFELCRVLHRQALLPGPDVDALFEGAIGACRQATTVDPDDESIVAKAGTALMSAAERDLARGREPSTIDEAQLDVEHAIALNPKRSNSYRNLCDVLLVRAESLSARGRDAGPAFAA\n>A0A1V2Q3A6_9PSEU\nMQTISRGSVHIEQCENCKGVFLDGGELEQIIAAERAHYAQPYRPEGFPVPPPAPTMAVPVNVGVPVDAAVPVDVGVPVDTGVPVDVGVPVDAPVPADGAVPVEGAVPVDGEQPPPATPAPAPAPTTGPPPPYQPPPGTPMPGTPAAAPPPYQPPPGTVTGPPPPVYPPGYYQPYPHRKRSFLEELLD\n>ERR1043166_9773265\nVFFFNGTATTEIYTLSPTRRSSDLKAVSASATSAFRLRNRQRFRAGPDSRRSEEHTSELQSRFGISYADFWLKKKQHENIFDSWWRSGDRVLNHRGSTKFSQPRSEERRVGKECRSRWSPYHX\n>SRR4029434_590066\nPLSHSHTHTHTHTLTLTHTHTTHTHSNTHTHTHTHIHTHTHTHSTHTHTHTHTHTHTHTYTHTHTLPTHTHSYTHTHNYPRDGLEPVSQAWFSLLRDICFADSSGWQTGKSSDSHKTHSDEREGLDMRV\n>SRR5690554_368104\nXMELKKKVPEVRFKGFSGEWEEKELGKLFDITSASRVHKNEWTESGIPFFRSSDVVADYKGQENIKAFISYELYKELSSKTGCVQKNDILVTGGGSIGIPYLVKNDEPLYFKDADLLWLKNGNIINGNFLYTFFSTLGFRRYVNSITHIGTISHYTVEQAKLTPFKVPVRAEQDKIGDYLLKLDQLISLHQKKYNKLTNIKKAMLEKMFPKNGADVPEIRFEGFEGKWEEKKLNQVSEIIGGGTPSTIIPEFWDGDIDWYSPTEIGDKVYAEGSVKKITALGLENSSAKILPANNTVLFTSRAGIGDMAILRKDGATNQGFQSFVIKEDNDPYFVYSKGHLIKDYALKHASGSTFLEVSGKQLGNMNFSIPIALEQSRIGTWFQHLDQLITLHQKKYNKLTNIKKAMLEKMFPKNGSDVPEIRFEGFEGKWEEKKLGDFTNFRRGSFPQPYGNKEWYDGKGAMPFVQVVDVSDNLLLVNDTKQKISKLAQIRSVFVEKGKVIVTLQGSIGRVAITQYNAYVDRTILIFEGYENKTDSRFWAYTIQKIFEIEKMKAPGGTIKTITKEALSVFIVKLPVFEEQRSIGTYFQKLDHLISLQQTQIDKLKNIKKACLEKMFVX\n>ERR1700
679_1367360\nKLLSYILLTHLFSIWMNEAQTAINVKPGRGTQAGKNPAVRILFYRLCRLLTLPIIPVFVFDGPDCPKMKRGVNVKTGKSHWLSSPFKKFIEVFGFSWYMVSFTSCDLGFPFKYL\n>SRR3954454_14908726\nYRLRRTPEYPAPARRAARLQLSERPARGGGRARSRCVPDLIVAGLARGERRKGTAVRLEVDQGRAVETIEATHEHTLAFDPHQPDKLRPDRIGPHGCAQRKGPTRDAVIAGALPDEVAARQVQPVEHLQALVFRDPIERCDPGLEHLDPAGRTIRTALAWARQTIDPGRVDPADEHEPGVGRRWRLYRHLAGADLVLPDHAARLYWSTATITSEVFTTAX\n>SRR5436190_15766111\nXMPPATRTELNARKLFRTRCAKNTSTPPATRPINVRPVSLIRPLPMAYCMSNPMPITSTAIPILLIRFSPMNFSRSGWRSKNEGRGGGGGVRSGGGCATNGGGVLAAVTGARTTVGAGCGGTSRTGSWIASFSAVGGLKTGGVTAGGEGTGGGAALDAPSAMDDGPDRNRSASFSMLWRVLVSSRDTLPSRANRTIINTMIAIGTSASRTKYSSIQPGFWKQSTHEAAHRSGRMQDRRLAPSIFQGYLPSICTGCRIRVRQDSRGGGGPFLPPX\n>SRR6266540_2703125\nGRDAPERRAAARLAHARAGPQADRRAQGRAREGEDRGEAPVPARRAAVEALQARGGAEGRREDPRGARDGGGGAGGRRGGGEDRREARRRRGEARRVRRGDRKARGGAGQGRRGARGARGGGRGGRAEALLGGPALLGRGRRWARRRGGGPPRRVAPVGPPLPRAARHARLRLGRVGRAALGRRARGLGADRAAPARRGRMGEEGRGALRARLSRDPRGREGARRLEAGGAEGGGRPRRRRGCGRGRVAEPARRMGARARCAGRARREGEGGGRAAGRRDAPRLRGRRVRARRPLDRFGAPAARGGRGGPRGAGRPRRRAPGAGASTARGRSAPDAARARRGRTRREPHGRGPRRGAEGVPGALRPLVPAAAGGAGGRPRQRAGPDRRPTRPGDDPRARGPRSRLHRAQALVRRAGPRRREGDRDRGGRVRRPLGGGAALRGAAPQADREAGATPPRDDRSVVPGGGGPRRLIVAEGPRDGGRRARGREAEALAAAFLEERGYRILARNHALRRGEVDLVCETGGLLCFVEVRSRTGDAHGGPEETVDRRKARRVVLAATDWAERNGGSGRNIRFDVVAVTFGESAPRVVHFPA\n>SRR3984957_4909703\nTNAAIRRRRVKPRFLKVGNAVFAWGLDRRRMGRLINSYFRAAGQLDGCFDSPSFLLRRRTLYAFSLQRFYERGQVVAHEVEVRSRQLVSAVKLTSLAVGRVDRGLGRWQRKEQPTSAGVDSAKIENITKESTVGLRVVAVEEDVSASDSGNHDDSENTILKTPRIVRPGRRRAFEEFPSGGRLSNAGVFVIRRSVLELLPFTSIYRFRGIDRLIVDLFIDDFSGFVDQESCTPRRFHRNSLNVELLGQSITACYWAPPVPENRGGHSILLGKCEVREGAVHAHTQHLGVGAFQLGQILLESLHFAGSTTGESKDKKCQGDIFLSPIVLQX\n>SRR5579862_538352\nXMVVSYPKLTPKARNAGDLGVPYARVKGLSRQARAGIAGPVLARWRAPPWPLRLRFRLRSVVYRIWYTRWVTRMAMNAKKNRGRVDHGGSSFDSFLEQEGIREEVEVEAVAVKRVLARQLQRAMQKQQKTKQAMAKQLRTSRSQLDRLLDPGNASVTLDTIARAARALGKRLIIRVADAKAEKRAX\n>SRR5262249_1788368\nALGQWPGETAQHQALTLAQLRRRRAPPPPWRRFERGDPLFQDAGIRAAVDDRPRLGDGCGGPITIAQRLQHLGLLEQAERANRRLAESAERLETAVDVVSSRGHVPAHQLGDRSGKMDLAVDALDTALAS
ELHRLLREQGLVLPPPLLAGDE\n>SRR5438270_12444290\nRNEGLSPHDSQLLCTRKLRTQPLSILFFRFISRVIIAEFAFDPYICLCYKYRSATREYSRSRTLLSSSMAEHSAVNRRVVGSSPTSGAKFINDFQHLPPITSPNCLQILRFRREPPDIAPLQTQPLNHRSPAIEYRVGVRVDRAHDARLDHLHVDIACRRDAGVAX\n>SRR6476620_8373323\nGPLPVSSSVAADSTLPTTRFTRWWLSSSIGPFGGTPTCQNPTRPGASWTVVNGPAVSTSKADVSGEPSSTGGTGRRRPGSGATSVIGSGHLGRVVAEDDHAHRRRIEAVARVVDLRAVRDEDDHVALGPDVEVQAGRRDAVDDAERAIGADG\n>G7IQB2_MEDTR\nMEGEEGGGVRLSKRFNDDKGGGEVDYKTKSGTAWSHNFLNQKPWHPLSYPNQRRKWIAEQTHAQRERRTEEVAREYAQEQEFYRTTSLISKKDKEKVELMQAVSFMYVRPPGYNPESAKAAELNDEKKKEDTVNNEPTQTNPDGPSSLPPHGEKKKPRPKDVFGRALPTEEEFEVLKNAPRHETGVAARAKPFGVEIRNVKCLRCGNYGHQSGDRECPLKDAIMPNEENRLKRDDPLNAILAHTDLTEPLKWELKQKPGISPPRGGFKPDDPNQQIVAEEEDIFDEYGGFLNMGDIPDLLTNLSKKPKKSKNKKHKKQKLLHSEREASLDDGESRSKKKRVKESKKKRDYKESSSSGSFASEKVHGKSRNKHSDDFDSDRNDPSRKTKPERSLSLKDYDHPRHGRSKHGKRRHSFSSEESGPDCYNGNYKNRDRRSYSSEDPDSDRDDRGRKNIQKHKRKHGRKRHYNSDEKDSGPADYHLKQKGRDEHSYKSDDCNHQRQPEDKISSHKYSSIIHCDSQRHHVSFSHDRYRGSQKSRSEHSCSSNDSDVEKNDQSRRIKEERGSQKRREEHLYSSDDSDVVKNDRSRRICSSNDSDVEKNDQSRRIKEERGSQKRRAEHLYSSDDVVKNNRSRRIKEKHGNQKRRTEHSYSSDDSDEKNDRSRRIKEKYGSVKRRAEHSYSSDDSDVEKDNRSRRIKEKDGSVKRRAEHSYSSDDSDVEKDCRSRRIKEKHRSQKSRAERSYSSVDSDVEKDGRSRRIKEKHCGTPDGSEHAEIDVRQQNREKPSYHRSEKSYIHREKHKLRKRSKNLPHHESVVYLLYDSSAFSQAQSLQSVLEKVDVKATIFNQQDSGCRDLHGSRLALDCQDRFCLRHRPWQSGHFLLAYIRGLLEVGMLTNLPIADLHVGGLAWSVKWIE\n>SRR2546423_6060734\nSPVWATSCPMAACAGDPLTATDVAARAEMSMVLRRRGFISISLLAARGRAKAICPCARGAQRPGERNTSGARRLRAPVRTLLAVPSVRKPVMVRTFGELVRRWALGGAVVGAAALLGGPAAPAPAAVDRSLAR\n>SRR6187399_628079\nTYSVLQHQFADTLRAQKLAALTAEQPDVIATANVGCQLHLRDGAAVPVRHWLELLGYRAPQRSASMQDFPHHYRVGTRLTAAEDGVVLAADGLPDLDTAPPMEFGGKGDRWSPETLLVAAVCDCFVLGFKAIAAASRLTWTDLDVRVDGTLDRIDRKMRFTHFVVSARLTVPAGQETRAPRILEKAEEACLITNSLSAEVQLSSEVIVGX\n>ERR1719375_252775\nALSMGLLGTGLRVGEDRRLRGRPSWDPENRGASAAGSTPGRPACTRRPWRGQRPRRRVRGPEPRRRPCPWTSSEASPAFALDRKRLASRASRASQASLATAAAVAPRGLLGAYQAPCPTWPLEYTGPGRPVQRPASHQFMPHPSAAAALSNYELAQRTPRGWMSTRQAAPSAPKLPGLNNGALGAACRVDIHPR\n>SRR5579859_4059679\nAIRTATATLLPLGQTGTIINRIHHSCPDSPWVARGTDLAHCCFDGNRISGRRMT
DVITLIRVKRDNKRPLTDQEITWLFAAYAGGEVADEQMAALLMAIYLNGLDAAELRAWTGAMIDSGERLKLGGDTRAGGRPTVDKHSTGGVGDKVSLVLAPLVASCGAI\n>SRR2546428_4694028\nGTLGFIYGMSEPMPDLLAEHSRWAATRAQELGAQSLNATNFGETFSAGAFRDPVTGRVYNAVGSRLPGGGLQGGATARPGEFVIRGYFGHAEYQLLQWAAEKGLVPVSIGASRPHCWVCADLTLHMGGTNASPLKGVS\n>ERR1719343_138255\nPGGAFIFGTFCASSVRDRFSSGPKLLLYRSEGAVLSRGVFLLLGAAPRPHAASTRGVVRPRMPREFRTYSIMAMVRMPHQRGVSSGRECQGNSGHIRSWPWSACRINEGCRQAENAKGIQDIFDHGHGPHAASTRGVVRPRMPREFRTYSIMA\n>ERR1039458_2685568\nFFLMIRRPPRSTLFPYTTLFQSISDTNILPAVSISLFLLTACRSDIALVLRKNGAPMTYKYLFASACEELKLSVWAKGESALGYNPIFYRRDIFGAWMQYNAHGDTLTHFGWEIGYITPVEQGGTNELSNLQPVQWRNNRNRTAPQPX\n>SRR5712672_4201355\nHSEKSGAGGRRLFSPDARGTVRQASGRGRRRPRQGSRGLSQIARSDAADAEQPKLSRRRRAELCRLHRVRRVSVGARRQPVQAARRRRSGLCGARALARCVRGHGAKVAELSRVRISAALNLTAAVSTARFWTSRPPSFANNPDTGSRRRPTASAGGTIHRNTSTAPTGCRRTPRHNRSRRAAARVGFLTDLSSKGPLFRPAFNSGFIRDGVMIRRKSYLDDGPREARWPAIRKPPWSRSIDSDLVHAAGPRAISSTRRPIRAVLSRPS\n>SRR4051812_7757704\nTRPRTSPRTATRCGSACGWPIPAGCARSCWAPPDRSRSCRRTGSPRASATKLCGRLRPTPRSRVPDVTWVPIAAWGAAAFIALAVLGFCAYEIMWKARRLERDLGRLQTMTGELADLQSRLALAQQRVVAARQRX\n>ERR1711998_154733\nGELSIIIAISGARPRMDMSLTNCEPWLTQESRNRRELTYPFGSSVSRTGSAYFARDAVNTTTSNISATFSRKTSTPGRFATKTSWWIPSISTLIWKSKNAVGWKEECTNVSSRSSTRHFLFLNFGSGGGRRGCLLEVLX\n>ERR1719424_536034\nRSHHTASLHESMNGMHGPMVQTEEDEALPPIISLDDLVAQQELKEEPPSTVQYIHCGSTPEERRTCIRLMQRCLQCPVLPAPRPTLSARRALLQLVCDESGQPAADDPATLRLPEPKAAAAAALADLTAQLEQCHGDDLEDQSDRDAARRAEAVRSSSSAMATTWRIR\n>SRR5947207_3404454\nIPPTFKDFVGRIEGAFLHPGSRIGGIVADLSDLTTFLPLDAQYDQITVGSWVVVENLDSTGTAIRTFHQVTDVKTITLTPLDFLSRGVFVGIEGIELQQISAILTIATTITLLTLDPAWLPRERGKDRNDLFTVLRTTTIYAQSECLPLAEVPSSESTDNQSASGEPTSQSASSGATSQCIIENDTIELDRLYPDLKSGQRLIISGERADVPGVRVSELVMLAGVKQDVGQVIVEVNGVKQSIPLSNDKLHTFLQLAVPLAFRYKCGTVTIYGNVVRATHGETRSETLGSGDGTK\n>SRR4051812_28246904\nDYVRLHQWVARRFHVHRTVLVSVSMGAIAGLQLAAHHDVPRLAGWVGVSPVLDLTSAAASGPLSDDIHLSAAQVHGLDPTRLAPGRLRGLPMAVAISREDRVVSVPAAESFARRTGARLIACAGGHATGDCYRPGVVEKMLRX\n>SRR2546428_178850\nPRDSRAGPRAVRSGHRRRAREACARRIRARLLRPAARSRGLAPTPRRGAPSPARPCSPQHLWAPSMRLWAFSAGLL
SLGSPPNFAQSGQFFVYYGTATGTPPDPWHSVIAGYRVSARDPNRADPSSGRILLQVKRQKGPQHFGGGFCFGSDGMLYIGNGDSA\n>SRR5215472_1953996\nRLCSPACRPINASFIKGPSLLVLFGIESGRGGIRTHEGLAPLAVFKTAALNHSATLPRSQRQLLTHWPSQTKVDIAAESRRRPPFAGPLFGPDLSQTSRVHHGESGRRSGVDRLSGAGPALALPDQIEARRTRPQKRKPRGSAGLVPGSAYVRTARGLGESER\n>A0A2H1WYH1_SPOFR\nMKLTKHLFATIINKNLQLLPRITMGCGFALIKTSIIFGAGLYTGVYVAQNYKIDKVEDPKVLFERAQTFVKDKLAEVGDKKDK\n>SRR5580765_5835986\nLGRGPVPHLAPAALGRGQAGLDQRLQVLDDGLAGDGEVHRQVAGRLRPVVDEPLQETPPGRVGQRVEEGVDGVDQTLASAQTESQSDSTRKSHDVAAAMAVSTEAAAVSVMTRRLPRSAGSMANTTVEAACSSSSGHQRKLTYSPSTTPS\n>SRR3990170_974992\nGGRHARAGPRAGASGGCAGIGDGQPDLGREFDRAGRYRSRLELVFLHGCRQREIPLVQALDFLFEMFAIAIVVDHVIRLLQTLRATHLGGHDFTDLRFGQSAARGRALNLRAFRGVHHQNTIHEIDEPGLDQQRHHEDAVGRVKYIQFFADYFADARMQDRLKPLTFAGILEYAFAQSVPVNPAMGVENILPEGADDFVEYRLPGFGQAMRDFVGIDDRYATRGKERRHRGFSAANATGKANPQHGAGAQTAIRANCRX\n>SRR4030095_11228013\nGTRDQRGTRQGACPSDRRLSRLPGGGVPGGRNRPQPWQVQTGRGFPPAQEGGQSRRAKLQAQSAIGSEARRRFIVPGEGIVRAAAILISVGALELTGCATARMHTEADLNSAATAFGLALGQLAQDDEEKRLLFVMEANPSAPKQVCVKNWARRNHLKAVFIDALDWVGPWGGGFAALLPLPRG\n>SRR6266567_941993\nISAASGIIVRPAAAASRTADAVRSASRPAMATAAPAWASAVANAFPSPRFPPVTSAFRPCSANWSRTFMNRSLRPRTSRCASMVRMTETDLGALYGMVRVRLSGLAAEVSEPAGVPVPACPAWSVHDVVAHVVAVAEDVLSGRLTSPPTDDWTAAQVTARKDRSVADLVAEWGELAPRIEALISKGGMWAGFLDVLSHEHDIRGAIAAPAGRDAPELLLAAEFLVSRWRPDVAVTVRMGEREFSVGPADESAIGLVTSPF\n>ERR1712020_113728\nEPVGAGVHGSQWWKVKLGAVSSHELGSCPGSLSLLATLATILATTLIITASLKIAMNGLKEEGWPTPGAATRPTADGSGGRTLQYLSGGQADGQDLALPVSDGRGLGRGLRARHRVDDLLERNEWTRVWSSPEPQRISFFVPSPHTTLLHYCVSMFVVCYRVVVFVKTFVICVX\n>SRR5262245_7284194\nESGLSLLLDVLDGARQRGISGDGFCCSRRSSTEPAVVAIPPSQAKFEIEAVAQFEMRVQALLEDDPVLGMHQFEENIAPRREAAAVVSQQLAKARREPGVSRRDVEFPDSVLCAADRTIEPQPCFVLLGDIL\n>SRR5216683_8145363\nREEPRLLRALVAVDVKRKVQAGPDHATSTQLTRHDHAVRSRSQHRLGPAPHPRRGRHLPRAATVPSWSEAREVAAVCDRRALRAESPVAIHPEAGRSRDWKRLACTGAAGQGRSARLEDHAPARLDVTVQQFERPGIVVRAAAIDHHLVELSQVLGSVVVNVPTSLDRYGSGSVEVAERKVAKDQLVVLGPAN\n>ERR1719282_30391\nKMHLGTAVEDVRCDVVRWRSVRQHHVYRCRCCPKSQEGCQAQGPSCPSSIRCHDQGCCQGSCLCCCRWKEGSRILQACCQGTQGKEACCQET
KGQEASCQETKEGCQEASSX\n>SRR3984957_655891\nKPPARSAAHFDRAAVTLINQAIRDSDVFRLAAAEAEDRPSRAERAVSHGRKLTASEERAGVVLRHDVAVRHIHVNATDEMKPVVVVIDAVVNVDAVEMDVPALDGPDAVIGAGVEKNIPDDQILATIKQQQMRPMIAADSRRRRDAASRAAKRVALAVDGARPFDADIPGKDGVDQPNISVAERGIPAQWDGVSRPILLSVRAPQEFSAGGDVEGDIALEFDCSDDKTAGRHHDGSALIGSAGIDSSLNGRRIECLSIARGAKIADVVDARP\n>SRR4029077_904125\nKAARQGRRQRLRHNKMHSEAQQLYEHTVWNEEFGGNLIARFARKIPAAFRSTAIPDYQMIASALAMGDLETKGGAHNWPQRRVWERFAHHFQNSKKRPDVFAAIDAHTKRFQQDMVFCQAHAALHCRKADPPDLLWDDKLLPREIAPHL\n>SRR2546429_6251402\nGCGAARWRGVLAECVWRMRNSGSRSTSYCFFFFLMIRRPPRSTLFPYTTLFRSSAHRRKHEPGRNVGRHVLHAVHRKIDGRADRSEEHTSELQSRLHLVCRLLLEKKNELRLTRSCHRGTDHPHADALRPLPPRHS\n>SRR5438046_2863571\nSTFLTSFLAQQESPAALAFSAQQADFALSQVLASPACKAGMKAKAASVKQTTSFFIMVLFRTAVNIVNTPFIPNQTVLSMDHSKRIPAVLDFVGLPRGGMLSIFVCLQQRSRFTIDIAPLRGWGAAVSLPLFRARVAAGHTDADPSDGSVKA\n>ERR1719491_2917382\nKWLLVTWHLLLSISISWWHLTRRHLTWRHLTWRVHAWLHLHLRILTRWELAWRSVLAWWELAWWELAWWILWICSSIMMHGFLLVVYLDDLVNATRGVTARIMRTNVLAMTRANQNANNDANTAEKDADADEAAAMTATTEVTAVS\n>ERR1700736_6027844\nITESGREGRIDPVKKLLLLPVVLTTLLLAFAFIMPATAANVLRSLAPATHLNLPSVISAGSGNEVAARPAASAANPGSAAFPGGSSAPGGSSPTHQDSTSRPLITVQDRGHAVTTSGGVISGCFGVGCYGVKHHELCPNWLYPLPAVHYAPPALLAGNDAAA\n>SRR6476661_8427451\nEAPNGTFVSLGSNAHGPWGPLVGSQVGCHRIRSETGQTRRETGTQSQGSSRRQSTRPPGYQAPHRQALLKGTSMVQPERTALDEPRQERQVRQAGPMAPTRGWSLDFTGSRRASVVLSLVLLLTALGTSGASAAGYDPA\n>SRR6266540_5744156\nXMSAEPLAKAELPYTLTRGGHKPRSVRVPRSRCSLSSEGLCPSARLHNATAMSAEPLAKAELPYTLSRGPQAPLRSRASLAVLAIIRGALPLGTPPQCYGDVRRTLGEGGTPLHAHSRAPSTAPFACLARGARYHPRGFAPRHACTMLRRCRPKPWRRRNSPTRSLAGPKHRSVRVPRSRCSLSSEGLRPTARLHNATAMSAEALAKTELPCTLTRGGP\n>ERR1719259_1225225\nGFHLIRIDARWFKTAKNWDVNTRLLANLFACLLTQLAHLLALHCLLHLRATLRSFIRSPTNFTHSQACENVGILMSHNQAVLNHGAATLNSVHADIPSSERVHNCVTDAVGVVLVAFALSVILPRKCETRRQHEQFLX\n>SRR5579871_1117583\nXMPGITTLRQPARKGKSQPAKKSSSGKNTRRSPASNVRKKIKHAGQSRQPATLKQTDQPSTGGVSMKFRLNDNNPKEKAIIDALAACGEREMSRFIKRAAYQLATGRDYDTGLPLYATIPSAHERNESEIPVSSGGDIQRRMSILADLDSGLDDWDSLSAX\n>JI8StandDraft_2_1071088.scaffolds.fasta_scaffold684990_1\nMALTLRLVKGTELTFDE
LDENFTYLNANKYEANDDAQFGTLTFGTLTDGVLDVIAFTNDVTLSSQTPEQVVPTEFAITSYIAAYHAANPYSTSDLTDVSASGTYTGVLVYDGLGEYIPTVPTMSFLQDVDVSSVSDGQILAYDADSEMWTTVTTGALSNIYLAGLTDVDLTTTPPITNDLLSFNGSEWVPATPILNLDGLQDVDLTTNPPVDGESLIYDAGTWVAGTPSTVGKMEVYAAAGETISAGRAVTIGLQDTSKTVAFPIQYADPEFGQSISLGAAVGSQSHSIWCTAQEKYIIAYINDTTGDGEFRVGELDDQGIEITLDPTIHYFGENIGGEFSVSYDIATTRTVFAWRDSITNIGYARVITLAGFSVTMSEFPIDFSLSSPIGTHSVSCDTASGNVVFHYADQESLGTGVGRLAELDGLDLLFQPPIPFTTKEVYQIHTVYNSIGNRHVSVFIDELGTGWSFVTIVSGLFLTFRTPRGIWDNMTTPFVTLMKGGSECWVAYRRTNTVPAQGWITRFTNSNNGTTNTNYTGAQYTHYPFENGQDSVETPYKMSNIDPAIIGSQDTRGATIVWGREDQLGNVSLHSTLLTFSEFGGYPIVDTDDAIKASDDSNVEFLITDQLWPVLLTNKEESRMLIPLTQPGGIKAITFGTNPITNIRDWFGIADESFSSPINPQSGFPEWNTGQITILGGTSEATSFAGGIGGVLVPGTKIYIDNSRIYRGALRTSDVGSGAIGIAVAGNKVLVTGDIEPNPDVSGVPKSLNELEDVDTKSVAPQSQQFLQWNTNKQNWVPAYAEVQGEINNLSDVDTFTNYNTGIPNSHLFAWDDFNTEWVPKLINDIIAEIGVSINELNDVNILIPQDRHVLTYSSEAGQWLSQSLELTSKLEDLLDVDMDDQSYPRSTGHFLQWQGQKWVPNAPSIPPISALPDTVIGASPITGQALVWNGTTQKWVNSFISIAGNLNSLSDVDTTATAPINGQALVWNSEAAKWVPGTVSGGGSGGGNNEGSPVGPLPGGGSSEGTVETEDGDTIVIPPLEEGDSIDDAILTGQGIVDQTYSNSTIIGFTDVISGNVHPGDIVDNVALLPKPFPIILSIAEDRLSVTVSRSVSIPQGAVCAFGTPPVIQNVAGTEGIVVSPTMSPGEYDTILTQPALPEGVVPGVAVYVSSITEYPVITGISADRLSLTVSYPIQVIPGEVITFNIVIPVKTTGGEGTLVLDDQDAGPIGPMTIASFSAGGVTINFTEDRLPLVDSGMNIIAYDELGEVEYVYIYGVDGGSTDSVNITNPTRAAELLSVGQEVYFENQASKGQTNGTLIRVQSEIDDEVKIGDYVISPRLIDAPKVTSIDINLLYVTVNKNIDVLEHGDFVTFGESVDKAIEVNIRLDELKDTAIEPGLLRDGELLVWDAELEKWTTKDLQLATSLDSLTDVRIDNRDTGQILRYVDNVEFGIRMENITPSWTADDLQDFDYSTVAENSVLAGNNGQWIQKDIVETIKSVNTLELTDLSNVSVLSATSGQGLVYNGSAWTAQNFPDEIGDLLNVNAASPSTLDALIWSGSSWNSAEIPRALEDLNALNVFELDQFPVGGFTDVPIGTANTSRFVKWTGSGFITTRFNNDDGYGIGLKLENLDDVNLENPYTADFISWDPETQMWITRSVEGAVIDIGLTVLSDVDLQTVLPQSRNTLEYDEPTGQWRPTERQGLAHYVPHEDLVLGDLVALRSDGKVEKVGEVSSSESVLFTTTATPSSASDYYGKSVYVSDNYYIVGAPGFENSTTGGKIEIYDTSTNSLLQVITNPTPGLATKFGESVSISDNFFVVGAPGYNSNAGRIYIYDLPGFTLSETIENPNLSTSTLDDQFGNRVQITNDYIVVSAITEEPINLSDNNTGVVYIFNPATGNLLHSIQSPTPSITGWGQSVAVGASGYIAIGHPLNNEVRVYQAATAGLLYTLTSPNNFEGNFGNSMGISTSGRLVVGAPNSEGGKIFVYNLVTGDFNYTITNPDRNISGGADKFGNT
VAISNDYIIASATDERTIGTSWGTVYIFDVNTGRFLNEFKNPTDTNINWGYSLAVTNDYTIIGAPRLTIAGVGEIHTFSSSSFLTSNADNWVGIVEEDRLVADNKDVLVTTVGSVNKFVSGLETNKNYYLDGRGFLTLTETDYGVLGKATAETELLITGNVVSAETGVSYLNDIRDVDTVSKPPANNQGLVWDSANNRWSPKTIGYSNITTFGGLSDTSVASPTPGQSIQWTGTHWALANYIPQGSFVLNELSDVNTAGLEHGDSLVYSFILDKWIPQQTGTSNVFILDDLTDVDLQEITPVSNDVLVYNLEEDKWIPGAVSRVASLDDLTDVDLQTQAPTEADVIAYNSITSKWEPQLIANITVTSLSGLDEVDITSLGNNPLEGETLVWNAIDSVFRPGSPSLDTISLGSLGDVDTTTGGNVPEAGESLFWDGSNWVPGPTGDAVAAFIGDLVDVNVISYPPKELQVLTWDSSINRWYPRNGHSGGIEDFIAEGDILQGEVVSINLNGSVSRTGQSPFQPAWYKENPTPFGTASNDFFAYSLAASTDKLLVSADREDETGEIDSGKVYVYDALGFLEATINNNNINASPANDRFGFSLAIHGNLFAISAPFEDSGLNYQTGAVYLYNRTTNAITSQIVHPGLATFGSVQSYSPNNSQFGHSISLGGERLAVGAPFDSGNIAINSGVVYIVNPSPAVGEAQFPHIITNPNETGGSYNDQFGTKVALNSTGQYLAVASKNEGPSSTKGGVYIFDISNEEIDPVQVAYIANPGLGGGFSYNFASALKWDQVYPNLLAIGSYDSDTDYPEGYDQGRVFIWDLNTLDFRTVITNPNSYNNPTTGDRFGWSVDMKEGKLLAGATYEEQGYVGGKYTNAGKAYLLDATSGQLEAIFSNPNIYGDSTNEQFGYSVAIGGQGFNDLYHVGTPYVRNTISSDFNSGAVVTFDSQITTNADAWIGIAFEDIADGEVGNVTLFGGVAKNLFGLEAGSNYYLQVDGGYTLTLSPYGIIGKALSPNTLLITGDVESNTADQVNVLNDLNDVTSVTPQVGDGLVWNGSGWVTGAVSGGVSNIGELDDVFLPVPNLLQSGQVLTWNGVAQSWVNAATGSSNVAIINDLTDVDLDTIPPLEDQVLQFDGATWRPTDLPEGQRITGVASENITEGSIVLYGNTGQFKNVEISIGAFLASIPASVPSNYALFGSVITHQGDYYAVSAPGASAQGVGSYFGVVTVYDAVTDAPVRTFYPPREGYQVIANVSNQYFGESISIYGDYLAVGAPKGTINGAVQTGIVYVFRISTGSLVYIIPCPFNQNANDNFGASVSIDDTAILIGSPGYDSPTSFNTGRAYLYDFNDLDGYSYDVEEEEWPIIPPSKIFENSNDEGTPAGDAFGSVVSITPSSVIISAPSEDTGGTLSTGRIYIRNRVTTASIATLVNPNIDSEGFGTVLAYWPEKIIVGAPGYNANQGIVYIFSATTGALLHTIQSPEAIGDRFGVSVAIGEYQIVIGSETGKEGYPDSGKIHVYSNAAPPVYYGGFDNPGYNVSPSGERMGTAVAITPAGKAIAGAPYSDLSAGSQQNPAIDRGAVHLFDVSESAISSDAGEWIGIAAGTMTQGETGEVVILGGLTPFVYSGLVPATYYYANFDGTLTTNTTDYGLVGIATNSQQLLILGSISGVATMPDLSDVDFSSGLTPSHALTWNGQFWEGKFVSTITSITELDDVSLIDTPPEDTQALVFESLSGKWKATDIGYSNVFAFNDLNDVSISNVAVGQSLSWNGSQWVPETFSQVSTLDELTDVNTNVFKTDRDILEWDGEALEWTVARNVFGNFINIEAEGSIAAGEPVYITNNSKVAQIRGTEEITGTAVFENDFFQDISLSGYGRSIDIYEDLIVAGNPEFDLPGITNTGKAFVYSASSGELLQVLYPPTSYTYQQFGNTVATNGDLVAIIAAENPYANGKGKVHIYKGTTGEYLRSIEHPDPSRTTSNGFGYHQKSIDFQGNFLLVGDKNY
RDPISNASLGRAFLFNAYTGNLVHTFEHPNSSAVNSRSFGTQVAMLDDGSKILIYDVLQDGLNSATAYIYDYAYDLVSTIEVPHYNADTIAINSNYLIVASTYSGYLYIHSLLDGTLLYTSGSAYLDYGQKSLSANEKTLVVTYGSNKGFRVFDIASRILLASETTSSVGSCASLFKTRLVYSTGYQAITYNLNDISISSKAADWVGISEGAYLAGDTTTIITGSGFVSALSGLIPGANYYVAVDGTLFPGATGFGKIGRAVSETELLVSSNTSNIDLDSDSTASLIAGIGDLTDVDTFTLFPTDGQYLQYNSVTSTWSPGDVSLPSLTDISLADIENNDLLLYSEGIWSNGTLATTNLSDIDTTVAPTASQTLIWNENTSKWEAGIPERALDSLSNMGSSVSTPTTGQILVYNTIGDQWSAVDNEFSLDGLTDVNLEGVTDNQFLQYNSTSSEWEPGTVATAVSELTDVDLTGVTEGQYLVYNDQDKWVPTTIEFAAALTDLTDVNAVGATQGQGLIYDTGTNKFELAIVGTSNVDTLEDLSNVSIPTTPNNGDVLKYNGNTDTWEATPTPSPAVVYATRNSFPAIGNLGDLSFAQDTGVLYVWEGTIWYNLKRTNAFYLVRAGQFTGPLTGTQLFQPQQTITLHEIRAQVDQPSGASLIFSVMRSGAEVQQFVIPPAAPFIEAAFTAGVVVGPADEITVDIISGPGTNLSIKFIYSX\n>EndMetStandDraft_2_1072991.scaffolds.fasta_scaffold3645261_1\nTIQMSVTFNQPVRIYKYNNSSNNGVIAPDNTGVASATQQSYILNPISAANSGTVTFQTADVGQTTATPFVLPAGAQISNIRLYQTTAAANLAGGVITVSIIQTNPTTSANTTTAIGTITPTAAGGVITWVPTATAATATILNNIGTLDATLTFAAAXVTALTXGSLXGTFDVSYTPRNYDGSIINVGQGYTNSX\n>ERR1712185_45118\nLGKGCCRAGGSVLLRDCTLEGRAVAKIRLTVVEGLNQRVVLGMDVLGREGIVLDCERGAVAFRPDVSGPGLIDSPNGLTVLDDDEDAAEYEFFYVTAKDILQAGGLDDNEEDLPNQQAVSAGDSATGQPVITDARMQQIIDDHSRVFQKRESLPGRRGLYDFAIDLYDDARPERRTLYRLSTAETKALRAEVMGLLDRGWIARSHSAWSSPVLFAKNQKKDGSLRPVYDYRSINSRTVPFNGPLPRWTEILPKLRGAAVFSVFDLAKGFQQIRVRAGDEPKTAFATPWGLYHHLVMTMGSANAAAHMQSVGNAMIEGDAEALPEFPVGHPLHDLAEENLARYSLERGAARRQQRRRDGRDEIARIALDSLGSFIILYVDDIIVYSADREAHYGHVEALLERLELFDLRLNEFSRFGESSGEFLGFTISRNEVRVKESRVQSILDWPVPTSAAAVRTFLGLVNFYRDHHLSYATWAAQITPLTGKGVPWRWTAQHDRAFAQIKEGIAARIALRLPDPDRPFVLATDASLHAVGGVLLQADPDAAIPDRLEIVACFSKQCSPAEGRYSQHSLEMLALVRCITHWRWLLDGATDLVIYTDSQALVTGKLFSESQPSWASHRMARWIARIASTRADLRHHPASARLAVAVDALTRRPDYVNGTAKDMDGWIRELSELHAARKQRAQQTQSMQVMSGIAATPQGAKCMYTLVVAESPLARIKAGTLGSDDRRMQRLGCEWRDGIWTRFGRIVVPLDAALRADLIREVHDVGHPGRLATCQVLRRRYWWPRMIDDVAEFIKQCATCSHVKSGRRHGRGSHPLPLATEVWSEVQLDFIVSLPPSGPRGFTRICTVSCRRSKEVILIPCWDAMTAADFADLFLDYVWKTKGMPRVVRTDHDPLFISQLWRRFAARLGFAATQSAPYRHQQMGGVERVNQHVEQLLRTWVASQEARWSEYLPMVQFALNYTPASTLGISPFEVVQGWLPRRGFDASDDVPLATTSLDPGQ
RAAEVIQWVNERLMDSEIHNTRSGSTWRPGVGDRVYLSSEHLSAKTVGVASDSRLRDRWVGPYVVVGLDDNTEAVHVELPLRWQVQQPISLDRLKPCFLAGLPPVQVEVDPDTGTKYVVAEVERIVGHTCSGRGRNRVVATLTVRFAGYEADFDRVYSIDGDDAIAGLLDTSAGVVQDYLEQHGLRLPPDLQKCLTAECAFLELDPMDVPWMFSVEAV\n>SRR3954468_8813130\nLSQGGSGPAYGDFPPGRPLTGSVTTRAGRRLAGRLVYDLDESETTETLDAPSQGVDYTIPFGLIASIVPPGRGARRARVTLHNGEELQLERIGDLGEGNAGMLIVVDGRQRAEYVPWTDVEQVDFDRPPAMSPPAVGGVYPATGAASTLCSTASSSWRLTGLVRWARKPASRLCRMSSSMPKPVRQMPLTSSPQRARIWRMRSSPLPSGRPRSLMIRSKQGSKGGVSRWARAAATEAAVSTEXX\n>A0A1Q6RLF7_9FIRM\nMEGLEKAIEQIKENIPKLDLRENEPMRNHCSFKVGGAVRAFAVPGDLFEMSKVMFYLHMNGVSPLTLGKCTNVIFPEEGLDIMVISTENLRKLRLGETENTIYAEAGVSLAKLAQFARDNGLSGLEFASGIPGSVGGGVLMNAGAYGGEMKDVIESVVVYYVPTQALTEVRGSDCGFEYRRSGFEKINCAIMGAVFKLTPDDPEAIGARMKEMNEKRTASQPLDMPSAGSAFKRPVGGYAVALIDQCGLKGYTVGGAQISRKHAGFAVNTGSATYDDVVELLDHVRREVYAQTQVTLEPEIRIYPKGMLLVDDWRERKQTIIDGMLEQAKQNAADSAAESSDVRPS\n>SRR5689334_5448804\nSGTSAALSGTRRTIFVVDRTGNARARAALEAFKDRWNSESFGRTSLPLVGIVAGRPADGCALPAAGSETDTGDVILCLDDTLTSAGVGGPLRVDAHKHTELALVKLKSATLRWTECSLRTAVAHEMGHVMGLAHNDKGGALQPSIMMSAAGPYKYGCAVWFNA\n>U2SVQ8_9FUSO\nMVVISGIIEFRNVSYSKNNNMILENISFSLKKNKYNVIIGKNGSGKSTILKLIVGLEKISGGQIFIDNEELVYKRDELYKIRKKTGIVFQESNEHIIGETVAESLIFGMENNRIPLEKMKENMTKYVKLFQLENIIDKKTVNLSGGEKQKVALAGAVITEPEIILLDEVTEMWDKVTKDKMNGIIEEFLKDGKTVVSVTHNLEEIKRSDNIVFITEEGKIVTGKSEEVNKIIEKKENTEINHEVISEYSADLTKMSLKEEEIKVKIKDISYYYEKERKIIDSFSVNIPKDSITAITGKSGTGKTTLIEIISGLAFLGENFSGEIGYNFRNENKEKEDEKLLLYKNISERELYEIRKRMGIVFQNTGEQFFSGTVLEELEYNITKKYKIKNRKSKELNDKIKEIAELFGYDEKFLMKSPFVLSGGEKKMLGLALAVCLEPEILILDEPTGALDYNMTIKFMQIVEKTKKNGTTVILVTHDENIVKQYSDYILKM\n>SRR5439155_21550961\nGVPGTQASRLHTLHNALEDECFSAGFPREARPFHPHLTSARLRSAKGSRGLAQRHKELSFEPERFNVSEVGVFRSDLLSEGPKHTAISRHNVRRANRKSQVDAYXX\n>SRR4051794_8769673\nCDGARRRRLRAGRRHGRTRHGGARARGGRRAARRAARRRRRELGRPAVGQRAQPLRRRLALLVRASDRRAAATAARARAGDGGGRRGSVRDLVVGPAADRRARHLERPATGRERADEGALARARPPRHPRERGGAGPDRHRSRAVQRRRPRRAHRPPGRGREGRVGARGAARSLRGARGDGPRGRVPALRRRVVRERRGRTGGRRAGDRAAMSDFLRVAAAQLENVVGDLDGNADRILDAMRWAEEQDADVIVFPELALTGYPLADLVLRDEFVDASLDCLRRIAARSGRTAAVIGTVD
RVPPRRAWDTRPRDVAISAALACDGELRGSYHKTLLPNYEVFNEARNFAPGNDPAVLWRIGTAIAGVAICEDSWSGDGPPEDQAAAGARILLIPNASPFNLEKPAGRLELVSSVARRNAAPVVYVNFVGGQDELVFDGGSLVVDADGELLYRARQFEPERFCLDVPLGRDRPLARDPRTVHARPPAPRRRMPQPEPAVQLSDDEQVWRAIVLGTRDFV\n>SRR6478735_3307528\nSSPVGRRSEGCVASATPNSGRYRKSGDCRTASITAARPDVKVSPLVTLFSSASSASASPAASGRRYALGTQLSTNVRAQLSWLVEVVALAAQGASLASGVACTARLAISPATSLYPETRSAETVCWAASLLKPFPSTSGGRLMAGEVVSPSNSATVLLNSLRVRRRIGAELGSNVWLVQAETCVSPALALAPPRPCVAPPFAPAKPELFGPAPEPFPAVDPRLGAPGASRFALQATPSNRHKRTVTSAGAPIAGGDLLVIGGX\n>ERR1039458_4032371\nPPRSTLFPYTTALPIYALFVERCTGKIAAECANEPARPAKLFVITTEFYLRPHERSLSFDHFDGHAGQVIGQPVRPGKSKGSFADGFDQRFRLEIAIDPAARRQGVTTKRPACRIACFRDPIRVKDHNVSRLERQGYLVVDFSFTDSERQIISVYQVAQARLAVKVNYPRMQAINENEIALIQVQSDITESHETFEIDQMRRQFRMGQRDDLFRLRQLAMLGQEIGRAP\n>SRR2546423_9850065\nIQHKRNCLIASEPRFPPCGIGNTTGKDPAIRNIAKSNPDRFRISATSVINSGECLFQRNTFAESRLAGQDEAFFGQELIKMFRYLMVSIPFTIWIVEKSIAMHAARDVRAKRDPESFPGNYHCLIX\n>SRR6185437_1912756\nGDRAGARKRRRSLAAHRRKAGRNAAGSLGNAPFLEEDAVLKPASCQIPSAASLRGLGAFAPAPILEQTLAARGIARLERVRRGDPVGAEMAKALPQLTPGHDDALLVEKANPERPDGALGPCALRVVINEREFAFGADRGADLREVGRGRAFGFX\n>SRR5678815_2292360\nSTTTARVRAASSRPADVTVWTRAGASDFLPGRRRLNPSMPETIDLFVPLAELDEPLAPRVEQALGWRRGQVGELRVLRRSLDARKGRPLGQRLRVLVGREGEALGPAAARGSQRAGHDRRTGQARAAAPPRSRAADARRADAELELLFRRGRGR\n>ERR550532_1119739\nAAGVASQVLGVRCNLAGHCNCLEGNLLSSFGAAVMDVEDVEEDNVPEVFVLLTQEVPYQLEVDPQEEEDLHPNFLHKALVAVGPDSRMECYSDARIHHNCCYLGVHSHQDHPFACRNAHLGAVVLLGDLHNKDVGLGQEDLEGHLYYYTSYVAGVPX\n>SRR5690349_19480509\nKAPFPICSSSTAARASCTRRSPQRTTSACRRSRCRATRARRSSRWSASRRAASSTTGRRGWCRGGAPGALRSSPRPFAASEAESKGAALADAAEATSRGFVGELERTPERVFLPGRKDPVVLRQNSAELFLLTRLRDEAHRFAITFHRKLRRSRNFQSVLEEIPGIGAGRRKALLRTLGSLKRIKEARVEEIAAVEGFGPKAAQAVWDFFHGSAAAGDADAARAPGGLADQVDAGSGAGTGTAEALGDVTEADIDAALAEDDDAGDATAVRX\n>ERR1740129_664351\nVLLSSFSFGAAGRMCLLKRLVFIWHYSTLIEGVFLRGGLVEDPRQTLVTTPIESYIVASRSFSEDYNAVVVDYYMKSFGIYSSLHPSVVLRRDKLGVESGGGTEVINFDKTYGFGTKITFESDHFGRPRLACVDGYLPCLARNCLRTRVVRVLSHLSTVLKTCCGNLTNGWTTPGMLTVPAAFMTLHAEAERVYNPWAFQGVTNCSEAIEALNMASHKFRRSSELAGAAVHAALLHYHSDAAG
HTPGATAPIPRKVVFHRYIGSHRSTILLSLLEGMSKLMESPQESLNAVEIGVYTAYTSAFILENLWQLRVWSVDPYRVERPKNRGIGSWQNVYDVDIFGQVRQLLSRYGHRSTLWRLTSKEAAQRFNDTLDLVFIDGDHSYEAVREDINLWEPFVRLGGIVAGHDYHTDSVIQAVHGHLDGTNTVLHIAPDFMWWYIVGSSGSCEVGSERPARDHTQPLRFPSX\n>SRR6202011_3201054\nXVRVVGGFGNDGCLLALAQYLDRELRPESCELRLDVADREALADAMSIITRCCASNYTAVSIEKRLVAERIGVRDAMYFERDEPVRHAGSQLLLELCLADEVALVHAHEAVETGLERRVVRRHVATPHX\n>ERR1700756_1693894\nHQTSGPREFTRLIDRRYLVSECKHRKPLRLAVEKWIGAYDEDAGFQLGKTSERSLDLGFRTCPQNMKLKSARERRRLHIFHDDVGTGVGRVDKQRNEGCGRHHFMSQLQ\n>SRR3712207_7425182\nLKERHTGGKEKREVTIVFFSSRRRHTRYWRDWSSDVCSSDLQELLGRGRLVGREAHARGELEVERRGHRDQDGAGAVGRLHLAGSEERRVGKEGRSRWSPYHLKKYIDTLAHAVTHSTISTTIS\n>ERR1719174_1663456\nPDLLFRSAGRVSSVEPIDLAGNAAAVEAVARARSYRGELIVLAATASHWPYAINAVSELALLGMEHYVFIAPSRTDCDVLRARRPGLACVFSTLVSNTTMAQEKSFTVWTTRKRYVGRWAALGLGVLQADLDVIWYANPYPALKGALRNVSLVHLQEGKCNEGRANGGMLYAQSACDGSMAHWVLREVYERVRRNEDDPRILETHYPGLFSD\n>SRR6185312_1149132\nXMNWNSPRADEVLAAAFGLKLDSIFAVASRYSKLAPVVDAACLIEPAILARTGSTPAAIVAFDVSTAMSLVPCPSRTSRGRSGAGNQRPYAAETAAIIVNDRLRAPPLRLGFVIAGDLVDLFRGHLAGDVAHLLADVVAAGAGRERLQLRLDVDSRLTAKPGTTGLVVDVAMAGAARCDVAHRRPRRDDRRCRHRRIELVRWHARQIG\n>A0A1V9EVA1_9BACT\nMATIEFLDQLLSDNKAREAKKLALIMDPAKKPFHILSFIGINEVYFIYKAFVEGDFKAARQHLYNMGMTNAWYYEKINGEIFDVLATFTYPLLSDSSFLIERYLTYTRMDSPGSFAACFGKAIQNVLKNDIDGLSLNIEGLKKRSGQGWEKNYNGVIPVFEGFIDNDKAKIEEGLMSLLAKHNKQNQPPVLKDFMNLEATALAKLAWRKGISVDVKSHLIPIVLLPVQEPDQYSGYEFFNEVS\n>SRR6478735_9024146\nTARPPRTCRRASGRRPAPARPTGRRASPRGSASSGAPPTRTRPPGPSRPGARSRRHGPSPPSPHGTRRVPRPRPVRCWACSPSSVGRGGALGVGDRGAAIGDRPLLPASGPPLGLEDAHVDLIPPSAVAPDRLPRAALVDEADPLVGPDGALVEGEHGQGDAMEAERAQGVVHHQRGRLAAVAPAPGVALADG\n>ERR1017187_5434680\nXMLVFKTTSTANQPVGATSAYHILFRILIISGSRAKSQPFPVPNGSCSGQSRKWVQGRGLLRKKRFSRGLTHGLRSSYVRLLLSKFWPRCSFDDTPFQRKRSEVQERIDAREILFEGDRGCGRGIVLVAIGCAKLQPLRHEILGANPALPNIVYAAYSGVLIMLVGATSIDQELLPVNLLVDLKICAGRGDGGX\n>SRR2546423_1398384\nDGITEVARRSLQCWLYRTIALERACPQFWNSVVSWFFSVTYNADRSITYTPGFLTALRQLLRQPRPEVVTASSLPNARLSDFAEVMSWLGTAFPFPAGAAAVAHAGFEDAGFEAALAMTRSALAGMRQAPYVPPTTYTAAPPPGATGTLLPPAPL\n>S
RR5699024_12166037\nSLLPSDTVTLYLHSFPTRRSSDLRIIKRHSTFHLLFQILPGIVLRLQLLPATAWFSCFLHFTHAAPAAVHPGRGRKSSSCRCNQDRKSTRLNSSHVSISYAVFCLKX\n>SRR6266536_896491\nGTMSHDERACEHEWRRWVDKDGIAHRECWRCATYYAWPVNGEPRAGVAKGTVYYNFASKAALFEEVHTQSDYIQRYRLTKLAIVGSRHLTTQQADLVHVIIDAVLDDYPDDAVICSGGAPGVDTMAITRAHQAGRTTRLFLPHHQRWEPDGYKARNMLIASWCDDLVAIMATDSKTFGSGWTANYAESLGKNVRRLYVX\n>SRR4051794_24080993\nLARLARRTRWSSTASCAASGCALRPPARRSSSPSTRSPARNAACPIGAFGVLTQDEARREARAILGAAAKGGDPYIDRKQKAAAGCQAKAEAEFTFSRMVEAWAAAREGDRRASYLREAVSCLRRNLPGWW\n>ERR1719310_114900\nSARYVGRSQAAWQAASQRMGGLDAPPRKTAWSSSPDGLKSPRLDSRNASMQPPSGDIRGRRPSHLGLAHEVKERRPLFDALDTEKIKQQARESLQGRPAYNVFEFYHETGVFQFVAKHPLFENITLGVISLNAVYMAIDTDYNKSDTLLQAHPFFIACENMFCLYFFGEWFIRFMAFKNKCNG\n>ERR1719193_2294297\nLYCCLLRRGLLLFGPFLYFLVPGVLLRIHVLLVVLLRTGLGALLPIRVGRRGRGDVRRGGAAGPAARGDAADDPPHPRLEVPLDQGTEIDLVCEVIARDEPDVQRRVPLKLAPIFLHVYACAPFVAVPAQLLAVHLVVQVILPLARRLLRARRLPGRRLLLFGEQAVLPAVLDEGGAELPPSVAR\n>ERR1719433_1424020\nASAICILATGRASFLNFLRQNPRKSLTSLIHRNFYEFEMAEKTIQFKAKKEIFDKAAARLACSDCKVVPRDVPIFQTGQGDVLCSICKPNSKLTGIFRSSVLEDLLMSLPISCKFQKNECPVVLQDRENLSYHEEDCEHRDVLCPYGFCKERIPAIQFKNHFLEKHEIDLEEYMKAVTKMTENGMYKVK\n>ERR1700730_4647339\nXMISACRQWVRLSPRIPLFQQNPLWFESEDFARFSFAPLPRASPDHFAGAPRGLDRLAKIGQKALLPLFVVSHPPASRALHPCRLPCASALPVSAPLEPRLLRCSAGRPRRCDAGPAGNSRLPEFRPAKGRSSGGSI\n>SRR5947209_14544591\nVGNKVRPRSSDAQVVRLAQADVIDRNDGDGMCRQLPAARPGRDDVLRETNPLREVARECKLRLSRAVDAPVTSVANRDEIPNVSRLGLIEPDGNDVVGVKAAAGFAAPDAREPVLLVNDGCMFRRPAADVLPVGAEATTPEV\n>SRR6267378_108524\nXMPPSLTSALRRASSGPMPDRRLSSMCNWRWLSISCASSRSRRSLPNIPANRNNQPRSVLIGTPAETSSSRLLVAQRHHRIHTHCATRRDVASRERNECEQDCDTRECRGVRRFHLEKQTGHKASQRKRSCNPGGDAEERDSRSISHNEPQHVALLRTQCCPYADLMRSLVHGISHRAERSEEPEKQHVEAFLRKRHSDELVH\n>A0A1E5NXB1_9ACTN\nMAERVILVDDLDGKSTEGVERVEFSWQGKDYEVDLSSAHIERYSDLLDPLLKAARLRQVTGRKTGRTAAGKSKADAAETKRIRDWGKTSGLDVPDRGPVPKEVRDAYAAAQASGEAAVPSQAQPGAPVSASQG\n>ERR1719507_515787\nFFLRFVCNVFIPLSLASHIRNFWQRKKGKKAIKKGPNLWGRFQVLVVEVEAESLGVVILDDLGEEVDVACELAYVVRVRLNEVLLEEVRDRRIVARLEAGLGRNNVLVHRVLVEADRLLGRLLHHVQRRAQGVQLSKLLGDLSIF
NLEAVSYRSAPLDNVLHERQPIIPHLVRVPAEVSVDAHAVDLVGVEDASHEEEAEAISEVMAHQLVQVVRVSLEVAVDGVAGTAVVLPLGPDFVITTVLDVVGAGVLPVAVGRGSRSRQYEGGGX\n>ERR1740120_427324\nRTTISLKRPRAWCRCRRRRRRLIRLCIVDRCHDPGVRLLGSGEDIAHWRSEGSAPGGRRAHFEADAQSADFVGVIHGGARCRVEHLGCSPLGVCDTIDLPHGGLHERADLTVLSSARIVCCGVGISRNDQLSEGMDVNVHSARCLIQSAMREVDGITYTEGAAAQVLYTASGTTMDYADKIGALGICFEMRPASSGGGAFAPPVSDILPGSLESYAGVMAAIDYAKNPPPPTPAPPPSANCPWFCSIICMSPDCDGCP\n>SRR5512145_1624320\nPGGGARGGSIGSVLVSPRSAGRQPRSPAPPGPRGRGAAELRAARRARVGGRSGSGSRAAKAGGERRLRQRPNKALQLASASGACSDTPPVRLTPPGGLGRLAAHFGGVSYRSAALAAERLV\n>A0A0H4L3H5_9RHOB\nMTAIIATPAALTTDLTEELAALIDAALEIRDLTAPLSFVDFFDGDEGDEENEGNEGDEDDEDNEGDEFDEGDENDEGDEDNEGNEGDEQNEPDGGDEADEGNEGNEGDEGNEDNEGNEADEGNEGDEGEEGNEDDEGNEGDEGNEADEGDEGNEGDEGNEDDEGNEGNEPDGNNEGNEGDEGNEGDEGNEDDEGNETSASGDEGDEADEDNEGNEADEGNEGNEGNEGNEGNEGDEDDEGNEGDEANEGNEGDEGNEGNEGDEGNEDNEGNEGDEGNESEGDEGDEGNEQDERDEGDEADEGDEGDEADEDDEGNEDNEGNEGDEDFNEGDESNEGDEGDEADEDNEGNEGNEGNEGDEGDEGDEPGVDPQDEGDEENEGDEGDEDDEGDEGDGTDTFDDEGDEGNEDDEDDEADEANEGNEHGTNPDDDDNEGNEGDEGNENVPGQEDNEGDEGDESNEDNEDDEGNEDDEADENDEGDEGDENDEGDEANEDDENDEGDEGDENDEFNEGNEDNENDENDENDEGDEGNEGDEDDENNEGNEALPDTGNENDENDEGDEGNEGDELDEHDEDDEGDENDEDDENDEGDEGQEGDEGDEGDEDNEFDENDENDEGDEANEGDEYDEGDEGDEANEGDEGDEGDEPVAGTGDEGDEGNEGDEIDPDIDNSGDEADEGDEGDEADEGDEADEHDENDEGDEEDEGDEGNEDDESDEDDEGDEDNEGDEADEDDEGDEHDEENEGDEADENNEGDEGNEGDESDENDEADEGDENNEGDENDESDEGDEGGINNEGDEGDEDNENDENDENDEDDEANEDDEGDEFDEGDEENEGDENDEEDENNEGDEGNEDFEGDEGDEGQEGNEGDEDDEDNEGDEDDENNEGDEGNEGDEGDEGDEADEADEENEGDEGDENDELNEEDSDDEGDEANEGNENDEGDEGDEGNEADSQADNNEGDEGDENNEGNEGDENDEDDEGNEHDEDDEGDEGDEGNEPV\n>SRR3954447_5641343\nVHVERLQVGLLPVGVARRRRAHAVALEQVLVALRVAEALVDLLELDGVLAPVGRPGNRAVRVHVRAGPVVVADVPDLRALVGRAEVLDVEREDAVLPALHQVGLDEAVLALAGARVAGALEADARRVAAGHPQPVQEPALVGLRIGDGRIRLRVDQLGDVVVVVLRARVLDPLALLRVEVTVVAGAGATEGEGRALEDARAVRRDAEDAGAAVRLVRLPPAVHRVRARLPGGDRARVRDRRARARQVDRAARVAAAGTELVAVPRVHLRERAAEVRGARRS\n>ERR1700712_4604191\nDVSIIAHGNQGEIELGSTIVTEATLNANAAALRTIGHALAPGADILLYGCDTGEGSAGQQFVDTLAAATGATVAAASHLVGDVAAGDGWNLDVTSPGAAVAAPQVLS
AAALNSYDHPLVINSPPTGLPISVTTFTGNTSFVETGTAVTTTSSGYLQLTNTSTNQAGIAVYSQAFPSTAAVSVQFTYYSGGGTGADGLSFFLLNADTIT\n>ERR1719161_2539103\nLVQTDPRVACSVFGPTLVQRGLGAKRPALPRLEARMRFGFLCIAWVLEFRLQGSSALDHQGVLRSWSPSTANRNMALSAERVQLRAEESCPPGVPCSCNCHCNPGRYPPPPPPPMPYPPPPPTPPGGWPGVPYPPPPPQENPEPPPPLPLPWDAPPPPKMPPLFGIGSYKGAPKIVALRNNAGPIKAPPGFGVPPKPPWETPAPPPPPLIMPRAMTDAPPYSKPPPFTTTLPPTTTTVDAWWLRTTFPWWHYTTKEYEWTTTTEAPTTTTTAAPTTTTTPAPTTPPPTTTTTPAPTTTTAAPTTTTMPTTTTPAPTTTTPAPTTTTPVPTTTTPAPTTTTPAPTATTPAPTTTPAPTTTTSAPTTTGPAVVLAQAGMKWNAQKGKLQLHAGPDDLNPNKGGWGGGQSGDEYKLGDAYHARAAEYLGYGSRKAPNPAEEYAIPQFQEEQSAECKSICPPCEAX\n>SRR4029453_7064880\nXGGALSTQTSPPAARRRVRGWRRSNRRNGVSFGPPTLRTDQPGNLAPALTMGRFGRSLLPMKRHLFGIAAGVPLACAMAGLVSVSSSAQAPAAAPDVTFTKHIAPILQRSCQRCHRPDGGAPMPLITYEQVRPWARSIKTRTGLGPHAGVMPPWFVEKNIGIQGFKQDPSLSEAEIAMVAKWVDSGAPRGNAADMPKPLDFENADKWQLGEPDLIVRSPDVVVPASGPDRWGSLGMVPTGLKEDRYVSSVEVREVNDIPVGGAKGTVGGRYV\n>ERR1719342_652718\nTRQRYAHTLRNIILHSTPTLYPILHLDASSAWYDLKELNAISGEPIFQVMMIQVKKIQILKRRPLPLLLTMLVMMLSTTPRTRLWRKVQVTMKIMRRRIQSIRRRKSSRSIFDRLCPASQRYPFQRLNDVLLHLNSKHSGRGGGLSNVVFPGNKNDLTGLGLATCKHCGFIVYGLGQTLYKHHEKKHSGVGCMKFNVFCRLCQISSKSMVTPFEDVRALQVHISEAHTNIFDLLPEKX\n>SRR5450756_449411\nTNYSVPWTVTQAVGTYTLWVRYCSSAGKVIRSDASDAALGITPFPTPSPPNLPAGPFNVMDYGAKADGVTDDSPFIQAAVNACYSAGGGTVYMPAGTYRLNYADSSWAPPGIHGSRNNDCSCLLYTSDAADDLLCVDLGGRRIIKNKK\n>SRR5258708_35312273\nGEEGPGRIELKADPESGAEGDDEEAQRGRGREEVEGSVSDGPDHSRSGQRHDDAEADDPEPLTGDFGDDLLPLMSSDARVEEGQDAADDSGERDEGSGDQEAPATKVFSFDPLIDGQADHGREGRLDRHEGVVTFVRRELNEKAPEERPATQEAPGRAVGGIAEPARQPHNPRHEWQHGTPLPEPITITHL\n>SRR3984957_2613687\nPRVVSRIESLAFPAKLEQPLGDSPLISRIQVDGPPPLRGPAYDLDWEGLGIVHETTIAFETGLGGNFDRRFVRPPHPGRGYIGEFPLTHVHVVRSCDEISELCRAEGRLVSRFPARAQDRVSRSGRPRRRQACGRSSRQX\n>SRR6266536_1781336\nDAGDVLVTQRRESRRSSSGAEVPSHGTKDPCRVRMAAEEAGGTARVTTRHPWEAAMSPTVSDHPSIRGALDRAEALAARRRAYAPEVVALLANAEFAGRVADLAGSLGRPAAEVRGEVAGYLREMGETRTRRATSDWARFS\n>SoimicMinimDraft_7_1059735.scaffolds.fasta_scaffold44147_1\nLPKHAHMQLFGFFLSQKATKVRCRFIQLMHSAAEEAERIYRFEMGLLSKEFFPVTISKLGRYKARLFVCTFICIAYTKYTTKHK
IKKDDNDSYEMLQISSEIAYTPFSMPATEDFIDKKQKEEAAGLMYKIISSINIELSNRPSPIVGESTKGLENLFTIYEGIFVESIGQKNYNSEIKERLKVRIFSHIWSGFNTMIKISQSRSISQVLFKNELGLPRLSSPX\n>SRR3954453_3871201\nLGVPLWLDRRGKYRGEEAVGQVLAGVLAGDAHRVEQAAVAAIGGELDRLDPALNSRQALEAVVPLGVDVDDRARALQEGLPGEELQGDRLAGPEAAGEQAGWWTGALAGLGEVEEDRRTAAAEGVPYIWTDLRSGVTDRVRDHRPDLVGQQVLGVLGQREPGGGKGGEEEAVLLAAGTMQLGAPVGL\n>J3L6R9_ORYBR\nMQRLLVKKNAARIAETPRVVWVNRFSCLRSSMASRAPIAIQDENLPIFRGIGGKKAGAAAAARAVGRQERKALGDLSKARKAPPASAGGGPPAAAAAAASGSKNLVKPSYLSDEEWMKCCEWAKDGIEAASFTGNDMQKLLSDKREERIRKKVEKAMRTMKLSMDNLYDIDVHSEACMVDPEDKTKLDLDTEFLPPKPYLSSRLGEHEANYVLSDMEFEHETFANCNLDLKLKDEYGT\n>SRR3990172_7523137\nXMQFVAIDMETANADMASICQIGLVKCENGILSHEWKTYVDPENYFDVINVSIHGIDEKVVEGAPTFPELADTLHSYLDGTVVVCHTHFDRVAMHQAARRYGVSTPECTWLDSARVARRTWKEFAWRGYGLSSVCQRLGYEFKHHDALEDAKAAAQILLAASNETGLDLDGWLRRVRQPIDPTAGSSDSAIRRKGNPEGPFYGEVLVFTGALEIPRRKAADLAAAIGCQVASGVTKNTTMLVVGDQDIKRLAGHEKSSKHRKAEELIEKGTPIRIVKESDFEELARVSNELQANARWTTLRSRSVLAAAGTSLHTGVWMEKKGLLQYYGLDTWWQSVLTPAERERVESLFHPLCSPHAQPLTDGVVGQIIGATSTPVSFLSELVGWLHSTPEDLAIRRKIRDKMTELVSTEPNVISRHFSLQVLLSEYYRDRDVDPSALAAAINACRQQIAIAPAVAIVMRTDFPGGLPGHVGYQQLAIILEKEKSYTDAIGVCEEAKGAGWGGEWDKRIARCTACRDKATAS\n>SRR5260370_27521811\nALVDFEVDDLRGLMPDVQPRDEARLLVEEELLDLVLRLAQERCHLYREVTAECVLEREVVVVRHLRTDGMSRRRRETERPETNQTGDVVRLEEIVLLEGGVWRLGVPAVARPHNRARIQAVRQSDARLPFGIGEDLTRHIEDRGRRVYCVERIIEKRPSSRVCRIGADELVIVESHAEVDVEAIGRLPDVRDRAGPELRPPRLX\n>ERR1719507_1551978\nATKGELHMCRKGCIACFIPQGDTDSCQNSRVLMQPEFSGALRIGEPQMSMQFFQDESCPNWFDKLDSKIAQQDVFVGDCFKARELVKNQKYAFIKEASEGKPMTLWACAAADCRTNSCEETTVAVESCATSHYVGIPDNAWYKKLRFMRYQPTEAMHVWDDPYCRERVGLIRQTMGLVQQAVDRVAAFKHLEPSCSFGTAVQDEIVEKKFAEFRGHVTDLRPQYPKRGVLWX\n>SRR5690349_24626955\nRPTLFPYTTLFRSLAGKKTVDLARRDVQRAKQNGHRRGEVFAVPRASDEKKIRQRIRTRLATEVQRVAVAAAQKTFHGGRFVVRSASACGDLRGQVRNARVERIGKLEILSAHLVGIIGRGSAQLGD\n>SRR5687768_17364510\nDKAVSTYDYFASYYTNVAMTFDQRYTLSLSGRLDQSNLFGAKTNRKIIPLYSAGIKWDISEEPFYNKAWPFITARVTYGLSGNLNKSTTAYTTSIATLVNDNTILSVITPANPYLQWERSAMWNYSIGLTDQGGHFQLNFEYYHRRSTLLTGPGDQDATLGMTSLWGNNAALKSR\n>SRR5262245_62
041426\nIANLARVGILAVTQIDVLHLIAMRVDHPLQLPAEDALMIVYTGVVRLAKEIADAIGRLPLPAAALAPFEAHEAALILKAVAAIVERHELFPTAIDKGILRIHIRRQTILGPPLDKWYAQLPAHSPGAVAIAAVIVKRNLRLKLX\n>SRR5690554_5011345\nLKVSTMDCVAPRLPSGETVTVGGVLPPPPPPPPPPPPPPPPPPPPPPPPPPPPELPPQAASEMANITATRMRMAPPENGFEIFNIVRLHGESYETKPVEMTVNTPSTAGNPRKHLPWFARCSVIRKPYNGPCKKTLKGCESEVVKTRGITRCCNRETKRLSDVDVEHDEFLEVQTAFAQGAHEILFICHTAEIYRGDLDEQRLGDLEQSRAAFAERLREEDAPLGLQQCADVSKRFLGFGKQHEARGKVHCIIRSADMIVDGFQRERDVVMQACLGDAFAGALHVFIIDVYAADVKLLVTDQRRVVRERTGGADTDIEQVRAVGEARQHLRIPARRQWAEQRVVNQASDHGRRFPVGGKVFVWTMRDRIKAERKGTQCVPGQFIVSTGSADRSAPFSRR\n>SRR6185295_1157811\nXSRVGRVEPRREHLLAAAAVWLWAIAAPAAAGASGAAGNDVQRYIQAAAKLYESLDYDQALEQLAHAKALAVRADDGVEISLYEGIIYADMSGHRDQSQAAFRAALLLRPDARLPVKVSPKVEKEFEQLRKQVTQEQAKEQKEQAKRKVASKPPSPAASDRPVAGAPPTPPSLVPLEPSGRGPAPSSGFSAFGVRVPLX\n>SRR6266480_734243\nDPGFELEAARLDKLGPETDRLFFGASRPITDGGDLQVRRRGKAAAGDVRRTIARRQAGGRVQLVDRRRILEVDLVYARDPEVAAAVIAAGGGRRLVGAEESRPRDRDGRSDRFFARAQRQHPALGAEEIALRSEQLRAARRTKGHVLQAVVGRVEQIRLGNRGYRADVRRIDIGELAVLEHVIAVGDGRIERVLPVAX\n>SRR4051794_34720228\nSIERKSEGCTLPVAGWNNLQPSTCNPQRTVQFYFFLAGAAALAAGAAEVLAPAAGAAALAPAAPFAPAAGAAAAPAAGAAPGAPGTAPSAVSSFSAFASAILRCATFGRPSGLLLSSHFSSSLSLSKRSPRVSTLRX\n>SRR5258706_1188100\nFALFAGNSFAVKNVVLFQFNIVSPRLIEIRKFVRRKLALDLRRRTYDKRIRRYLRSRRQQAPGCDERIASDANAVHQDRPNADQASALDMTSVQRDAVADGDVFLKDGGMRLGADMDDSRVLDISPCADPYKIHIAANDRAKPDARVLADLNIAYDDRVVRYKRCVVNFRFDX\n>ERR1043166_2789281\nPGRKICSERKSGRNYLGADNALGQPEELTADLHRFNPVNPAFLSELSVFICGRSSFDHIQYRIGFWLRLGFWMFGMTKFAESKEHVALIRRVGQSVLLGHDTTANHLFDLTVESLHAFGLTLLHRVEQRLTFGLAAFDVFARSGRCFQNLNRCEATVAVGARX\n>A0A1X2JM77_PARBF\nMSLLKLILQNELCSINFNKNVACATNIYYNNFKISTLVYGGVEMKKYEPLGDLIYFISKELKSRMDESLKDRNLGQGQLLTLMTLFKLKNYDEITQEDLAKVMGINKANTSRNLAKLKESGFIVINQSKDDQRKKNIELTNKAFEEFLYLEKIMREIHNEMIFGLDSPSLDCTLSTLIKMKENLLNK\n>SRR5260370_10911006\nGTAGFSMDTDVMPISSCDGPSLERPASTKLRVPDLSAWLQARAEQLDLDRDLATDTLPQLGRAGPLRVGVPTDMGGSGGTILHAIEAVAAVAEDSLAAAFVFWGQRAFIECLLQSDNAVLRASLLPSLLSGDLAGAVGLSNAMKFLANMERLQVSAASLPSPGDAQRWTLTGNHPLVSNLRPEGFVAAIAADHGDGRPPSIFVVSDEVP
GVIRSDDLDLVGLRASNTAAVRLNDAIADEHFQLASSAPDFLARVRPNFLGLQCGLSIGLARRSLRALDSMGPTARATIGEDGRKLEAELPLCFLSLLDGISTGEFVTRPTQLFRLRLLLATLVEDAIILEVHATGGRGYIRGQADVARRRREAAFIPIVTPSVVQLRSLLQEX\n>SRR5512139_1340698\nXMAVAQRTPEWIAARQMGIGSSDIPVLAGESPYRSPYSLWAEKTGQIMPEPDEAQAELFEIGHLMEPVLLTIYERRTGRHPRRARMMRTHPDLPWAHASLDAVAPVRRVVEAKWTTSQRWGDEGVPDDVLLQVQWQLFVVGWQVADVVALAGRRARVVEVPRDDGLIDRLVALATDFWQGVEHRVPPPVDGSEATRQTLVALHPAATAPALSPTPELVSLVDRYVEAKAVTRAAADDESTIGNALRAVIGEADGIAGLVTYRQSADVTRVNWPAVAAAYRQLLEGSGADLDALEAIHSVTSQGPRSLRLSKGVTSX\n>SRR5882757_368707\nVIPECPLRDVGWDRDVRARLLDPVRDLVRRHAGWRLRVPACAGPARGRLHGGGPHDQARLVADHRRRLGRALSVPAARQHLHPVDGGPGRGARLHRGRAAETERGPARQPVVTGSLASGLRWQGFGGGPPITLVAPGLGATPGEARIPASGLSGTRVVVTFPSHGEAADAPAGYWTYPTISTDLERVADEVGATRAVGVSMGAGGLTALLTRRPDYFERIALLLPAALDKPRATPAMWAFEQLADAVEAGDVDGLRELVAAEVPAGVGVGEHISSRADALLRLGGALRTLPEQTPTNDAALLQRVSAAALVIGAVGDPMHPEQVARDVAAALPNSRLELVDSPAPLLTHRREVRSLLVDFFVGXX\n>ERR1712082_453316\nYLKEHLDTIGPHLFVNKNSWNILGRKLGKNCKVRFLLIKRSILVRFSKFLKCYLQNYQTKLTICVIFLCDLYGPHNGPSKMNDPEKKGKKLESSFFANKTLNFGPIFKIFKMLFAELSDKTHYMCNFFVRLIRPAQWSVKDERPRKKGKFRRVX\n>SRR5271166_3589085\nQGRIAGVTTGDRSVHFEYDASGGWVIHDKDAAGERILRYDASGSLTARTDEKGRTTQYAYDGQHRLASVSDPDGSVLRYQYDDAGRVASVTGNADGSPASIAFSYDASGRPLSVTHEDGTREQYAYDAAGRVAQTTNRFGQTLSYTRDDAGRVLSIAGPSGTLANKYDGQGRLIEHDDPVEGTTRFEYAPGHIALVDAADDRTQFAFDAK\n>SRR5262249_39470886\nGSKMTVLVRFNDDILLGTRLESQPDWEGYVAPVEILLLLERQLDFSAFLEQLGRKHRFERQGERLRSLWGDTTRRKLVDERLAGDQLDGLVDRFGRRRLGNGRDVLGIDRSNLKLAFQNDRLTVAIGQLVSGDAGIIPVLIEPALGDDEVDX\n>ERR1719421_1404448\nHYVAGRGRREYEELPDVLDAVLEVSEGREALALQDAEARTALVVAVAGDSELELKDLYEELDDEETVVERSAGSPWFVRAVLACAEGRALLPQTWPAEVMTLLHLAAHADTVAAILEHAEGRKLLEARLPGQLRPVVGQHVRLRDSAQKTDGVLAEGATGIVADDDWTDQPFCVRPLENPDEDYDWYY\n>SRR5437773_2629605\nGGGCVCRCASSWSPVRWRADPLRVRLWLTAVVPPPEHSTRAATPRVVFPSRSHVLAGARDRRPVSRHCIHRLRPRLGKGVGVPGRSCRTHYPRLPPTDALSVVRRRHRGLATRSDRFWLLACRLEVRLRVSSDCCSLGAGQLAKARPX\n>SRR2546425_291204\nDSAVSAYPFCLSFRLPGAASLSPQRSRLTQVLLCRSVVRRPPRRPLIILRPSFRTVRVAFMCPVPPRTEYTAWLQMVRSVWSRVPQQKGFSGDSGLATSAELKYPVGVAVD
GSGNLFIADPGNSRIRKVTPAGVISTVAGDGTSGFSGDGGPAASAQLNASSGVVADRSGNLFIADAGNSRIRKVTP\n>GraSoiStandDraft_43_1057313.scaffolds.fasta_scaffold3636311_1\nRFFYDEDDNLNLDFYSEYIKAIKKITNEEFLSTFFEKRKKNINKINSAIYSDYFLVDNNSYLKYGPGLYYFNQEDLLFRAEILKKKIKQKLNKISAIETNDQITIENKDIPGNISLTVDGLICEKLQNNWRKNFTYKIISAEYLKNKVEIKKDSPYLSNSRCIYVKFKDKFDNEVFLKKINYSLPVLFNEKEIKEKYLNYFYKKNNILFLKNKETEINEDIIIPENFTVRIKSGENIKILNNAFIISNSQWEVGDKNGRVLITGAKDNFGGGLVIKRVKQISKFYNTDFKYLSGVENRFLNNKKSEKTSFILTKYFENKKNSYIYSQVTSNDYNYGFSDKFSYTGAVNLYETKAQFQNCRFIRIDSEDALNIISSQFLIEDSIFEENSSDSIDIDFGEGIIKNSKFTSVDNDAIDLSGSKVYLENLYFLDVDDKLISSGENTKVNIKKIEGKNSYVGIASKDGSETIAEDINFINVKIPFASYQKKKSFKHGILKINDPINLENYVVKNIKDRNSYIYINKKQIRNSNKQALNIVYKKKLSLINEHX\n>SRR5690606_2703104\nNREPLVTNRFADGRERIERPACGRTNLEIVELAGREAAIAGIRDHGGVVRAELRARIHHAHVHAAAELAELGAQLAVRADAACDDERRKRRLLERALALGDERLDDGILKLASNVGARRVIELESSRRDDDRRFQAAETEVEPGPIEHRPRKTKAARFPGIRQLRERGAAGVRQPEQLCGLVERFAGRVIDRRAYDVVLPEPANFREQGMPARDEQREKRKFGRLALEHRREQMAFEMMYAX\n>ERR1043165_1439568\nXMIVQTKIEDSMTLKLVSERAEAELRLINSRELEQELANRDNHFNVRDIVAAALWKTDLMEAVIIRKIYEAIIKIDMKDLTKVENWAEEINRASQNPLAIESMKSKKKQAMPREEIITPEMYIEKVRQETDSVDVVMNEKESRQDTSPEEKERQKRRKGKEVTDIEVINTKMEMTTLDEIEEVKTKATEAGFQQQNYKDIITAIRNENDTREIEEMQDTVHQKKENSFAEAPLEQSIWSPSNRSCNSKATYAAKIPAYNVPGSSQEERTKFVRRLLAFNDHVKEVKEVFERGNAWVRAVFDYKYSREEAINKIQKKHNDWFRMIPDTDEREEDKIREHERPKQKENLVKEEEERREEGLLALTIWDLPQEISEQEVRYLVKRIGKVISCKVKRSAYRTIDRKR\n>SRR4051812_11463556\nRHAYRDRPAEPKPNIGNYLEKTSRFGTPRVLEGDRIAHNGIRQRERTNMGATATWAGTGAGRRRMEAVIETLASVHEHGESVSELAHDARTMVTALSLYCDLLDEPGVLASSHRHYASELRLVAEASRRLVEKLAQLEGGDEETSCPGRTSALQACLFPEIAQPHGGAFQGALNGMPGMEPVSGGLIHDLREELLSSRGLLAAIAGPSVTVNTATEGGAQPVRMSGENLIRALVNLVKNSAESIDGAGTIDLRLIEQWEPGKVHTLVLTLEDTGCGIPPEFLEKIFDPGFSTHPARQPGGSWTSGHRGLGLAITRSIFTAAGGRIHAENRTARGARFVIEMPVRN\n>SRR5688572_23826730\nGVLALEALGLIALSLLLGNALTLFTLGRIIGMVLRVFSFAAATVDIAIGRLGSDGRLLVGDTVVWLIVLEWLAQSILAFAVGAFVLWVSSDTIGLAGAVLSGFVRTIRRIGIHAHNGRVGLTVVLAAFAAALAGAINS\n>SRR3972149_4567815\nPPRSTLFPYTTLFRSDGLAYPFGRWSAFIVLTLAALNAFWLLKRFLGQLRLGGKVPAFFRGHLIEN
TMLLVSLAVFRGALGRADFPHISYNVFFTYLLALYLVVKHGLAGFVERVGGERAASRVAM\n>ERR1700722_15463975\nGITVAQELRDREREPLAAEYVVLAGPDHEPDAPLTQGVEDRQQPRASLGQAVQGRGDRRRSFFPADQPGSFQLADAVGEKVRRDSRQSVFEVGVPQSVADQQFTDDQQAPTVAHDIQSFGDRAVLSVAPHDLSLSVLQLNFKSKRLTSSSLRVTLASMRTGCRRX\n>ERR1719253_2112\nCSHETALPMILRGPHSLTSDLMSALISSVASSSIPTVLCITAQGPRYIGTLLSCLSFASLALIHRLHDWCVVLRLMDDDVVWQRHLGTHLALRVMRKHDLDLNAKHPLTHGHVADSLANVVLLRLTSGNE\n>A0A1Y4JJG6_9BACE\nMHATKEFSSISELKHIREQKSRLSEREAELVSPILTNLECIPYIYELFKNIVRTMNIPLREEIIQRKEFLFIVLFLFVPSVLAGGRIPNGVRKALEHVFPKVKPCTISNNIADVFFLYQQYKYFRSDIEIIYKEMLKRLENDDVSNGLKRFIIK\n>SRR5471032_1837456\nMLLVDVDGLSSLVVAVIPLHEIGLDLRDTQAGQLAGASGPKERTAEHSRKRDSLQCAAQVGGLAFAGFGQRQVGAARMLAGQSPGGFPMANEVNLRCHRARIAIRSSLPMDETRSSPGELPGAIVGSSTRTIGPKFEHMRPTLRVL\n>ERR1019366_9306790\nAMPITPSSANLRFSDRAVTNVPRSSANTRFFAHQQASPAARVPFAQQQRAVGQAATGAPNRATAAAPGASQAGPAQNAVRPQTPQAGAASGWRRFGEPGGSQQAPRSQTAPQNNRGWTGFGTPGSSSSAPRQQYSQPQPGYRGNSGSSAPQSLRIAPPVVQQRSGGGSYSAPRSYSGGSNGSRPSGGGGASHSSGGGSSRRGSRREKLGSREISVSSPRPRPASAGSRP\n>A0A098LH02_9BACT\nMAVLSWAQTPLSMNGRLSVTDGKLVNECGTAVQLRGLSTHGVMFHQECYTESSVKAIAQDWKADLLRLALYTENSDGATKGFAQSTNKEFYYQWIDKMVSLTEKYGIYVIIDWHILKDGNPSKYQNEAKAFFTLMSSKYKDKKHVIYEICNEPNGGTQWNQIKTYAEDIIPAIRNNDPNAVILVGTPEWSSRIDQARSNPLSGNNAKNVMYTLHFYAGSGAHNQYKNYLRDAVSAKFPVFVSEWGTTEASGAGNIDSGNSRDWLSLLEQNKISWANWQFSDKNESSSLLKEGSCIRESWIDFRTDNSGNSGKLIYDELRKTKNYTACGSVTIPVTPKPPVCPNATGSNLNIYGCPVTNTFNTNYCQGYNTKQAYVRTDFSKDTVPYFTYWKKPSEGSTVYSAVIQNEKLVITSVNADPNYSTFGFDFGKLNATTHVPIDLRANAVLKFDVSFQKTNYSANDIALYIELVDANEKSINATALGSYNRFILPVNGTTKTIVADFTNGVKRTPPATPGTNGDPKEDTYDRTTFDFSKVTKITIWVNPNVSGVYSRPPFTGTWTIDNFSLGYDETKAVSCEEYVDVDLCPEDPNKTKPGKCGCGVPEDGCDCNGVAGGTAFIDLCGVCVGGNTGKIECDGNAYSGTPYPIPGTIEAENFDKGGQGVGYYDITEGQPASSYRPGDKVFTELAGGSTNNWNVGYTSTGEWLNYTVDVKYPGTYHVSFRAASERATGKWHLEVNGQKIPNSDFSLASTGGWQTYTTLKTTQPIALSQGKQVIRLVFDGPDANIDNMTFEAFEVITSIPAKAERKVTVYPMPANGLINIRQEEMSYNKAVMMDMTGNVIKTKTLSGLTEELPLQNVARGIYMLELTGAKGTEHVRVVVE\n>DeetaT_19_FD_contig_21_9884499_length_257_multi_3_in_0_out_0_1\nMKDYIGLVDTLNMKGMVVLERGGGALLSRTYPSNKI
DVKDCAFKFPLYTTEYKMGKETPELVRTQSWNGAIQVHTSKAFTAEYGYDLFMNIPPWIYYNHTNLKSQTKKQIKTASETKIMLQIKIPSIKSLFLSNAFKDWLSSGTTKENNNQPDKLLWDYILHHHDFRVYGIKPWGKSNYLHYRDLPITQMDLHIDIRGIETKDVLGLTSVAGYYARKNMAIWHNTDATENEKVVIYQSPNGIEFRKGKKSSEIYKFYDKKLQQQQQYYDAIYTPQSFASDRYKKAMKPFFEKLTDAERTTLRYEVSLRKVPSQRNAVNKVYAKYSDGIEKDIHLDDIIGNTTIYSRVASKVLQVGLYNIFGSEITKEISNLESGDNAMNDTDILQKYKSKGLKYLGIKYLMKNEGLNNEQVWKYLTNAIAGNSSYEVVRRLRNEFRDEGLALDLLDTHQQTLDRLKDVYKNALSX\n>SRR5580698_6036952\nPHHKIFDSVNFLLRTWLHWTLRVRKISESHPVPAIVSQIAGFRCCTTETSAPPQSSSPALSRSMQVREYKESDLAQLKAIHASQGFDYAFPDLSNPLFVTKLVLIDANANAATSENRQSIDSTATANGKILAAAFLRLTAETYLLLDPNAG\n>SRR5690348_4651858\nLTPGEVMQLDPEEEIILAAGQPPIRAHKLRYYADAALRARVLAPPEVTCPDRPSQMSSPWEDEGPKALAPGSRRAPRGMADTEDTEEEGHVIERGVDEDDAGPGEEEAIEEEGYVLX\n>A0A085GHN3_9GAMM\nMINNICISLYGSIEDICKQQLVNAGFRVPKETTNGYLPLLLNMNKRLIEPRKRNVHFHSTLIVPEKNRNGFALLINKMQCGSNINGYQSHHLERTNFNDDFLNDFGLHHFHLGETTQKTGKHKRYIERTGNTIFAKVDQNDIYLLGVFGHNSEEKQFIYSDEQLLKSLYDEWPHLLEQCRVRGVTGQTLSPEERNALRSNGTNVITALSDDIAIMSPGGGFMANKMSAYVSIEMIHLYRTISLLKKSLFKIQEQHYPFDADFKVITFGHDELSLFCDKNCFFTKIQILDGNHKTMSLAPGYGPVYTHGFVRGQTTKLYVALIEALNTTASRNYLHPFPSLYIRHL\n>SRR5205085_12251670\nXMNDCGALCAPFVCQGGTWEKSRKCRCFPGMRQERRKLWLEASQGAILVAALLGAVLSSRASDWHPASLVLLLLALVVATDQFAIATKRMRISGGHVSFVLAMALX\n>ERR1700748_1727377\nDSAGDPRAIYNRLAEETDESNLFLDVEAIGAGENWRTRIDNMLQKVNAVVVVIGPRWLDLLNARAAAGAFDSVRGEIAASLKRSDVQVIPVLVNGARLPAQSTLPDEIKGLTDLNAIEVRGSAWTSDVERLVKALRKSGALPTSRTRWMIRAAALAAVPVVVLAVVIAFFELRREVPNLPKNISYRFARELVSNAGLKVVGHKIEPRNGTIDVVSAQRRAPGSHLFTWQSVEVDLVAVEPYRLVCREGQNFAYGSDDDGFRFEQYKGQASIDMTEGSCAWIDRPMRQEEANVLKPLGFERNLAKHFHSAPGGLLAFCAISDYDKHNKSPRLLALSLEWYARKEGSGQLVPIIGDYMCVDRLEX\n>SRR6478672_9921535\nKLYVSHKVTVARSAVDNSETCRAYGDSVAQRRRRGLGRAPLYVARLQGDVLRTRRRELLGAGVQRLLGFVSPSHEREQRIDGELRGRRASLRGALNESHASGGGMAGGQTDLHVPELGFFTGVDLDGLCALERECRDLDLGLGLAGILCGCRRGALPLDDRVRLARLVVPETSQRHSFEFDCTGEAPGVLVEEARGNREISGEAETGSRIGAEEVX\n>G7DWE7_MIXOS\nMVNQDAKGKLKKLEPVEAAKRLAAYAAVDAHIKPHHRVIGIGSGSTVPYVVERILEQGSEINEDRWFIPTGFQSKQLIVQAGLNLGDVDQFPSIDVTIDGADEVDDDLNAIKGGGACHL
REKVLAEAAADFILVADSRKDSRVLGTTWTQGIPVEVAPFAWAKVYQNLALLGCEEPILRMGKAKAGPIVTDNGNFVIDAPFSAVYMRDPADLLHRIKMLTGVLEVGLFAGMAKAAYFGQNDGSVIVRYVDASPPNSARGPPSPSLAVLQSFSFTFQNGPPEHRARIMPSTSLFSQRSVMSMFTESHIRSIKSLDDLDNAPGGRSAKPKYPYVITLRAALLGSPNGQLTLQEIYAEIANRFPYYKHAGKGWKNSVRHNLSINRCFKRIKSADPSKGSLWSVDEDEEVTTTRIRNKKRYATSSRSNYRYRARAAKSRRSFADDDEDEEEEDDRSSVSESASAAFIARSPIRTRRAVLAVDTQTKSSASSHPSATMPSSPTTSELSDANSVNSTFSPLSPAHKPIQHIQREPAPIDSFGRAGTRPTPITALNAGQSVAPRASESPRSAAFPHTESHMRSFAGHVQSPSYRFSAVQGHQMDDHYPTVWPSLGTYTPRQTTFAGAASSTVAGTGPSYPDARHSLGNYALKSDNNHEHVPSTSGAENAQPYYDYPPETEETPTSSYYRDYATVTQSDPHWWQQVYQHSSAAQQHSPTQATHPAPPPYYHHQVHQPPVTMSPLHAGHPLSSGYGTWYPAPNLPPIGHAPNGDVTSPHYPTLLPISQQKRMLQAAQ\n>SRR5437870_1888551\nARCCFLIRELQFWVLGPSRSASWSGFSRIMPLRSSPKLRRRYSVRRVVTVRRSPQNRLARRLEPTEAVLRWMSGVSEPPFVWVTPTRVRRLQSSRAPAGIGEKARGLLWLPAAWVPPFFVLSPEFHQTLSECPAARRNALIDSWATVFERAIVAAGLGRAEKLYLRSNAVDETIEARGRYKSEVCERKHWKPVLRNL\n>SRR3972149_5390364\nRLLRGGLLLGLFACLRLLCGGLLLDRLLLGGPLPRPLACPPPLPPTPLPPPGPLPPQSPPRQPPPQPYRPAAPRSRSPACERFASASPPPRGRRGPGSDDGGRPACAPARCRCPPGASPRCRGRSRSRTTCPVRQRAPRX\n>ERR1719354_373981\nNLVKLSNTTDLLIVPRKSRRTKDSLLSSRELEQMSSVLAQVLVCWLVSTKCKQHTSTTSSAQKTKTYIRKHNQFLLKPPSLKSKFAIPTTNSPSRKHTTNYEHLFIEVKPTRKHKRKKELSLFQRDGASGFDHEFLNMTNNLLERSSTHTPKEGVIFWKCLSKVDSFLPRPLQRFFLLYILTSASRGVNSLSX\n>SRR3954463_10117746\nLSFFFFLMIRRPPRSTLFPYTTLFRSVGEVAALGQGQALGQGVGAATELQDRKSTRLNSSHTIISYAVFCLKNKRIKRHEAREVACLVVVFAENPSPRLRYVIGRDAHLQIFFFLITRRPRNYTLFPNAALFD\n>ERR1700722_4865254\nVQQQFVPSLATRVDCGKMGEAQNAKGTTCDHQHFLERVFLLFLELYHSMRYTFIPRTLLLLISLSRGSLSSPGSFVSTRFPPVLQDGISCPIEQGDSHMQPLLHNHDLGTKTKLWAKVARLQGDNASVSANALX\n>ERR1035441_2809112\nGLSGREITWSPVNFRADGNGIPAPSTEDPQVTVERCNAHLNVTPTGKSDQPLRIVIPHLVVTTILIEELHHSIPLEVKQATGDRLPHGISPRQLCFSHVETVAEAISGALSGLHQHDYSIDRSVRTLPVGRLRRNRRPACLLRSEWWSTTVVAASPDR\n>SRR5215472_7227805\nGTPIVIGEASEGATLGVVAADATNILFQRYDSAGTAQGTPITVAPSPPAPRPTFIGSGGGSSLVVWGQGGGLHGSVVSSSGAGAPFDFAPGSWARTLYLSIADAGNGTFAIAWTGDTATGVTVSGFALAGAGGITGGPSIITAGSVEFRVIKLVHTPAGFGLLIAGLPGNDTVYVVPLDSAGNVTGSAHRFLGADVAWDMGAQGGGLGI\n>SRR
5580700_8890822\nVLAGYSRRPVPGRSHRPLAWSRVRPGKARTRLWARRCHGANAPSMPGRRRPANRHEQPSLAIVFLSPVFVPSASCEGFPHFEIRTMKGEPHETSSSQLPCELFAAVARSRNRPRTCPRSSGLRTARQFPLGERGQRAHDRVYQHHRARTVARCNRRVRTHFRFWGRGIQKGPRRRAVRRGNGDRCGELSGLALSGGVRAEYEHMAETRRINKVHRSLSRPLTILGAERKLFFFAMCMGAATFNLLGSLLGGLLMFLLLYAMARSATQTDPQILRFLLSAARLRRQYDPMKFSPIVIRREGDAX\n>SRR6266545_3341769\nRNGSDRVLLLKREPGRKRPKPCSDTLKRLAALRLRCVTPGTCDEFSRAPADRAFPVLQESCPGIDTALANERIGVLRRGKMFGIDNEKRGAPTGTGGLFHRSRGGRVAGPVAVETKRHGVDPERCEPFKQTRAHTRSTKGGDVVDAASAELVEVEDSLDEDELLPV\n>SRR5438128_2375330\nXMRSMASGGSFHCAYRHATQQAFLEAHELAFAYFGGVFRLLRYDNLTSAVKKILRGYQREETTRFVAFRSHWGYEAQFCNAAKGNEKGGVEGDVGYSRRNYLVPIPQARDLVELNAHLLARSQEDEGRKIGDRAQSVGAGMVIETEHLLPVASEGFELGEVSFLVVDGKGCVKARTNWYSTPLRAGAKARVNVLPAWLEVWHEGRCVARHERNYGRGRQVFNLEHYLDVLERKPGALAGSTPLQQWREQGRWPDSYDRLWKNLIQRNGKLSGTREMVELLLLGRHPDFIRGYAIMVRGGSQMFPSHANLIDGFGADYKRRIKRNHPAWVIVYARGEPLQTFGNHVDIDKNVVDAWGIPVLWIHYERTENEQKMAKDAFQNLQELMHTAGAEVLSADDTLSTPGAISHEMGTTRMGNDPKSSVLNGFCQSHDLRNLFVIDGGCWPSATCQNPTETMLAVAWRASDYLAEQLRRGELX\n>SRR5262249_4210377\nFPDEGNEDREIDEPPYRLHGWIRTVSHDGALDDQDPLRNSISRSESLPGRALWSAFDLQAGQPPAKEWFRAGSLTFRTGVWSDLPESYDDSRPYRRRAGSHGSRVQIRSDLLTDLLRSVQMDLIVSVHIERSIESEYGRSYDTSTKKRKEFERIFIFRSDGX\n>SRR5258706_5404908\nDAPPLLTPPETPANVLNPQWRRIGAQAAPDAEQLRRRGFRQGVIVAAGVVLAAVALTLFLLPVRRPAASPGAASALAPGVNAAPGANATPGANAASAAADAVDLQQLAQQKSSAESWYTRVAPRVRMLADSGAAEWDAAGMSSASAALATVDALLAGRDYIAAQRQLQALDVTLRQLEAGRAAALKAALQHGADALHQHDAAAAATAYAAALRIDVSNRDAMHGARRAASLDSVLAAVARAREAEQAGRLADASAGYRKALSLDPLTSEAQAGLARTSAQVASDQFGRAMARGYAALQARPPP\n>H1UR20_ACEPA\nMRILNQCVTKCFALDLAGTAKGINLNRKGWENVTFQAARQQNSYPMPYPKDKDMETARNLMVDDQLRPSEITNLSLLSVMRELPRECCVMPDQHSVAYADITLPLGQGRVLPQPLLTARLVQAVMPAEKARVLVVGAATGYTAALFAALGANVTALESNTRLAEQGQLFCQQEALSVSWVIAPLNEGAAGNAPYDVIYFDGAILRFPAFCAAQLAASGTMAGVMASPNKLAKAFIAMREPKSASSFIVTNLFETQLPLLPDLAAPITFEF\n>SRR5687768_16770258\nISAAPARRPPSRIGAFPPERTGFRVARMGRGMHRLPLRCQMARASVGRDASSVHRIDLPCEQTGFLCPPPFDVHLKFLPNLPPLQGWTLLAHAAAGRPDALARWLAGHRGVTDVRVEPGLAPKILRAKVAVLPELWAAASPYVRVHHLDLSTEGHASWFIEGSKKDVLAF
\n>ERR550537_1009424\nGKPWPPRTTSDPTSQRAGHVYLIHAAVSNVNGFLDLGVGDKFGEAASAVDPGSAAVKQRVAAVTLDHALDHESVIHVLKSDTQGFEVNVMSGGKQIHRKARLVIYELWPKGLAFAEASVKDFFTELADAGFVICYDLYQQRPANALE\n>ERR1719378_273336\nQVHFKTRLEFLKLDLQQIMKEEEIPLFPTKGLFHRTEDIAIMVQHFVSELLILPNLCSAREIYRDDFLKLLQQKSNTLFSYIEAKSLRGVDPFTHADIRQMKIDLSLNSEADFRIVLAEAEKLHPGLVSFLFQDPGSGTPYQAIRTAFVX\n>SRR5260370_18266583\nDRTGPVRPDRFAQPRNSGANVGRQTSRFLIGSKYWDVDYTRTQTASNADTDAIMRRNRKVLVGVFAPIRVVFATPGRALLGATEGNGRVGSIWHGTRFQVPKREFGSLVCSSSKYLILHDRNNLSVRS\n>A7T0A9_NEMVE\nMKSSPTFRFWNAILHYQMLVLLVVRAQRQRNFVLYVEALEELVPLFFVLDHVNYAKWTSIHIRDMKSLPQSITEKFQDEGQFVLSRTDNDFSAMPFDQAHEQENKIVKSAGGAVGLTENPTAFRRWMLPGPETTRLLQQFEGQYLDDTDSETGDRANHETGLSSQKTFKIQVNNLIDVIRKMGNPFLDNFPELVTLDSRDCMDNEEAETIVNLDALGKSQYSSFLKDVTKDRTVAIGKPLMQNKLPLFRKQASRNKPKQSKTTPLLQNNAALFAQLYIAMQSRDAEFFSHEVQPSPPSLSEFGSLRLPTAKSDLLKCLSQPPQPEPPTEVDCKVCDGAVIVHCLPVTGVMTFDDYAENVFLPYIRNLRSRRVDIVWDSYIPNCLKEATREKRGTGLRRKVEGRTKIPPKWMEFLRDPRNKQELFQFLSVKVAEFPWFTVRKEVYITRRWMLSGPETTRLLQQFEGQYLDDTDSETGDRTNHETGLSSQKTFKIQVNNLIDVIRKMGNPFLDNFPELVTLDSRDCMDNEVAETIVNLDALESNVASSGEADSFLRVTYLKDQKLKSEAFSHSGDQLTTAEWEQTMKSSPTFRFWNAILHYQMLVLLVVRAQRQRNFVLYVEALEKLVPLFFVLDHVNYARWTPIHIRDMKSLPQSITEKFQDEGQFVLSRTGYDFSAMPFDQAHEQENKIVKSAGGAVGLTENPTAFRRWMLSGPETTRLLQQFEGQYLDDTDSETGDRTNHETGLSSQKTFKIQVNNLIDVIRKMGNPFLDNFPELVTLDSRDCMDNEVAETIVNLDALGKSQYSSFLKDVIKDRTVTIGKSLKHNKLPLFRKQASRNKSKQSKTISLLQNNVALFAQLYRSSMVTVEIKKLLNIQFLVSLCGFALFIKEL\n>SRR5262249_55098951\nTLLAGDVGLYSDFRYDQTGTDILWMGSYPPASTAGIYEWHRSDGSIVQLSPTGDVVGSFAHNADWSIIAYTAKRDSGFVYDQRVLNRAVPGKALQLSNPAGTAGVLLYTGSYFFTKX\n>SRR5215218_3154104\nSPDVAAATSVPATSGAAPRTRSRGSMDAAVRVADEAVMPGTSGCWGPPLGGTMAAESPMLRPVTFRLPVPALPEGCTRDRLHPERREPPRPRRRPSLRRGGDPPVHPRVGREGRGPPRGLREDGGARVPGSSDPGTVRRIRDGLRLVRAPVRGAGARGHRVPRRAERPRRPELAHAPPVGDGGAEAALAGAPGEGREARDVRADGARRGDRRGVAGVHGTTRRRLVRAQRAQDLDLARGPRRPLP\n>SRR5699024_12259917\nSCALIILLSFPTRRSSDLKVVCAADDAAAGHLGAGLRVLRIVESLVVLGPDIDAAPADALAVRVLFLDQIEHAADDEGAGDLGTEEVLFLESDAGEFGGEGMGIRIGREIDIVGQPVQWDAHIKPSFRIGSRSAHRLRPCRAYRX\n>SRR6185437_1327178
1\nSVKNRVSARRCAAHAADYVGGFIAAHAALDVRLQVNGQFDGVKAGLAGLCNFVVNTAEAGGGEELLRHIVLDPGGGAQSGIGVALQIALLNGLRVFHHIPAVAGKVRSVNDKHADGAQTRGFLVLVCPAAVVGERFALEEAVVIRWRFVDDDEGYFSFHIDAGVVVPVVLGRIDAVAGEDDRRINVGALLPCLVLGNDVGAVVEIDGCAARGCEGEARLVFHGVDGNERDFLEIGAVIACRLEAGHRELRADVFGGELVAACAGAAAFEQIERKKADVRANLLRINGVCGSARGGRHAGNVGNGGLLRAEQRKRGEREYESKMHVPKLHSGGSFGLHRYAAMVIAGTAQFKAQTLRALCGALQASRADGRGX\n>ERR1700731_1967141\nWPAQLKISEISTGPVQPAFRWQRTTIPLLHDCDRAKSYRSIAPRHWRELMDSPTRSPSRPEFRTRPATPAGRQVESFFRCADNEPDAQNCSRVLLPTPRVSDRLPLKMPFRRETEPLHALKSRAGIRLCHLTGSLILEFVCCEIRFDLRASLREPTASPRTAXX\n>ERR1711974_545716\nCLRYELVPLFKSACCPPFFAKQTVSSKRTISIGSDRATSELSLELGWPIASAWGVCTEMATTGGHPPKGCLLRQATTCMGGHFVACLVRMLLNDVALKSIVLPARX\n>ERR1719506_2640246\nSAQLAGGMGGYSQHRVAETGSSKAMLGSLGVFRYVNLKFPSLAHAKRRALMLFLATWSSSHRRAVPLLTKPALQDLAVCEETLCLWDVYGLNWPHGDRTATFQLNKRYGSTVSEMISMCGHGPWSSIPSREDKGDANRLQPVGVRVASPVDEQEISRASAGNHQGKITGRGRLPQIASAASGGSTLAKASILSARTFTSSGGIVSPLKTNRKHVSSEELSSPRHRKMTLRCITGSSFSIG\n>SRR5574344_946438\nPRSLRADTLKRRSRRMVEKMTKYSFVLLSGETEGFLKWLQGLGIVDVTRSTKPVDEKSSQMLDKVSRVTKTLSILEKLDYSADPDFELIRQAADKTCIEGCKAVNTLGATARLEELKAELAAARKTMNDVA\n>ERR1712128_216805\nTAAAVFLLQLVMARSSSLVVRMVGSVWSSPSRPTAKPKEVICTKTRGHARIDIASAASQVLQPLSHQHLHQLNLQSWHHAQSHSNVEAPSASLFMKIKMIFLIGMKLEFDVWPWERELTWQNLMTWLTLX\n>SRR6266568_2358632\nPSTASSAYALVTVPRAMPRSAASTRVDGIRVPAASRPSRIAFRIASASPWPRPAAQSRCRSRPALDHSIAMPLDHTDGPVSAYRGRYERQAQSEPQGGGRIGVSRGLRTATGSAQAGRGRGDSGRSGSETGRVDQDPGVAAQRLRVLPRHAQPRRAQDRRGRAAAVRAVGLARDRLLHRTGTGRAGTDRGHDGSPPAPGRAERDLRPGRRGFQLPPVDRRGLARQRNQHVQPLRCHRPGTATVPGMNNIELAATLKSLHVPGRPLVLANVWDAASAKLVAAAGFPAVATSSVAVAETLGYPDGHGAPVAEMLGAAARIARVVDVPVTVDAEGGYGLPADEFVDRLLATGAVGCNLEDTDHAASGGLIDIDRQAKYLADVRAAADRAGVPLVLNARIDVVLATGRPADQAPLVAPIVERAQAYLAAGADCVYPIALRDPEAIRQVVAAVAPAPVNTNCPPDKAGIAAAAKLGSGRLSMGGGLWAVVRTGLAARLA\n>SRR5882762_5772273\nSRPLFAVYHQTFPRTCFGRVYRRGSRMKLSVGRYFTQASLGCGECCIFIEIGELIDWVVFSLNKENIPSRAYIAFKNEEQLATFSQGYDGHLFRDKAGAFVFVVRHSCPSSNWHCFGGLIMSLVPGNESIAVVEFAPYQKIPTEKKKADARGGTIEKDEDYLSFLESLSNKNKPTGENGEPPNLESLSVYLLSSRIPSFPHT
LPLHPLLQHLYDYSLTHAFICSCRNATRPPTKNHPTSX\n>SRR5262245_8502620\nXMSWLRIEKFFLVAVATVLAHQALGAELIHPGARRVAFTRAVVNLEYLSGRLGHDEPPSIRRSAPLGESVWFGEIPRQLVGEELDSRRHYVPFAVMLDGNTVVRAWCDANMNGDLADDPSPALSAYPGSMTTRSFRVMLRWRARVGDRTLPIERLVRVVVEGPDTVGAVPTYRLQDVYGMLGTIEVEGVQRAALLYDANHDGIYTRGRSDGVFIDLDGDRHFTIDPMAPDFGPFAIPFTILHASYAVDSVALDGSSIVWRRLSPAYAAPAELGRPAPDFAFQDMQGRSVRLSGLRGKTAVLYFWATWCGICRRQAEDLRSLYAQSSRTDWELVGVCYDTDRDAAQRFQSEHSFTWPASFSGGLPAEDPVGRLYREAGAGVFYVIDHDGTLARKVFDVTELEAVLDSLRTAPTESSLTGHHYPKX\n>SRR5262249_12765844\nRAIWAAWRRFCCHERVGIIRPPKMSYPAYFFNSGCVDHTAAHGSLQDSRVRRTQQAHFQDLGAAAAIGRCAGARTRTPDAAAGRSRAARFSSPTAARAVAPATPTVAAADAGAPRTIYQGPYSAAPCSRELVNGRSMLPX\n>SRR5438132_851461\nXMADLDTTQDHRTRTLVDTAAYQPGAIAPDDATGYRDHAAVIGQTSAGPTRPVPADRRIREGEGAAGIFNAAAVAAGGVAADGAVGQRGRAAKAGQAAAETEGCAAGGVAADGGVGQRRTAAAADHSAACQAGGVAAAGAVGKRGGPDQVVHATAEDCRVAAHGGVGHHKIAVVEDAAAAGKAAKAVVFASRGVAAHGAVVQRKRAGIEHTATGVGGVAADAA\n>SRR5262249_12382799\nRPDRPTASSTNRSSALGRRADDRAVISAFLQMAAAVLAIAPLGICMNTQRGLCPPSHLMQECAMSVRDDTPAVRDLNGRAALVTGGASGIGAACARELAARGATVTVADVDEAGAKDLAQGIGGRAWAVDLLDVSSLENLRIEADILVNNAGVQSINSIVDFAPX\n>ERR1740117_695841\nLRIKYLNETQQKNPKHFQDPETGAQLEIKDQQTLSDWLLMYYGKFGIKIELVTDQSSESFQFVKGFGGIGGFLRYKLELDDIIGDAAGQYDDQPVPITVIPISNSRESTFTTTKPPVEDTFQEPSSWISNQEPWTPSELDHSDNSSDQTTSSSDKLVPVTTGLKDITPRVPSSSTPSSTSLEKKLKVAIAFKVSKSPTLSVEELDPVWEPSLSPRSERNTQTEX\n>SRR5258706_2253991\nTVEDVAILRCVAAAPHDHAQPDLALVSVAVGELVFPAPIGPIVREVPLVTIAVVPCVGAFAVLETFAEFAFVLECLRDVLALAVKALAAHGAAVDRSVGERELAYARRDFASGSRVRLRRGRRGGRRWREWRLGGNRRPWCHLRRSRGNGDRCGGYDRLFRDLVPRALGRRAVRGCDLLGRFRGGFGRSRGGLHASLRR\n>SRR6476619_4763585\nPKAQPRLHREHELRLLHVAVLRTRLSHHLCRVARPGPTRPLARRARDPHHVRTASANLSRSRRMYPRLLAAALLSPAQPPKADPNDVGVLPLGADGKPLNLDFETGDLKDWTATGDAFKGQPIKGDTVAPRRGDNRSRHQGQ\n>SRR4029079_7780467\nPEPDSGTGAVGGGVPDVSAERQADYRELVEEGPVALTALDPRGTDAVAAYCLLPTAYCLLPTAYCLLLVFPVHVVIHELLEARRQLVVGSAQRRDVLAVDEDGAVGRLARAGQADADVCGLRFAGAVDDAAHDGEGEGLDAVVLLLPRWHLLSDVALDALGQLLERRARRAAAAGTRRHARRERAEAERLEDX\n>SRR5215204_4095657\nVHGLAGLRGGQGAVARDRAVGRVARRSSALRAGSVALAEAVAVAA
GVRVAAAVAVAAAVAVAARVAAAVDRVAGHGIAGVGAALAGVSAALAGVVPTALTGVPTAALAGVAAALLVVGRLGRGRADRHLRVAHAGAALGPRSRGRRGDDERDQAQQTQKSGDPAHIGPVAMRSRRLEX\n>SRR5512147_2844591\nRAYFNAERPPWFLDPAMSGGGMFGNVGLHRLALSRSCLPGLRPAAVTASVSTLPEHPVEACTAAIVTYAGGGAVLYEEVGYFPKPSWLNTGTHYIFENGIVSWDEKLW\n>SRR5579859_1021161\nDAGTVAGAGRQPRADCRDTDAESAAAAAKTRLDLGRGRRRRRGGGDQHRPRRRSGSRQGSFAVDRRRHVGQVMRAVWLCLLLAGCRTGPCKSGTLLVSVHFTGAAATADSVDVTVTVDGMNGHTTLLPLRSSSGTIEIDFAPNYPVGHTANLTVVARREGNLVGTGQLDVK\n>SRR4029079_5257423\nVRLDVSAGSDVPKEVDLVHDRPVVTACDRGCIVDDQPAGGELSEMDTAEVCRLDLANRHLCLAEPDVELLGQTAICDRPEARYGRRHLQVETRGIDDVELESSGYIPAHQPIVPTTRPARSAVAPAREACDQLPGRVRRDVTGLTTRPSRGASILENGRRSSRSSSSAGDPLDEPDVVAAPTHRARQTCGQRRVVX\n>SRR5215218_4007277\nXMKQSVLVLASVALAVLLAATGVVWAEPLAAEDQEGSGQSAASVTEASQPAGRVWSWGFNRDGQLGDGTTANRSTPVRVEGLSGVVDVSSGRQHSLALKTDGTVWAWGGNDAGQLGDGTTANRITPIRVIGLINVVEVEAGWNHSLALKDNGTVWAWGNNFQGQLGDGTTTNRRSPVKVDGLGDVVDVSAGGGGGGIGLYNHSLAVKDDGTVWAWGRTLGEFGDVVNSSKTPTKVSGLNNVADVEAGWHHSLALKDNGVVRAWGYNGGGQLRVDGLRAVKDVSGGGGHSLAAMRDRTVQASGARSFGQLGVRSLRFVVDV\n>SRR5688572_11278665\nICRAPSCTSGTARCSISTTSLRRCCSARGWCCRRTNTRSSARTCSTCSTPAAASASRSGPRTSCASVSLRSRWRRRGWARTTGTRAAARPRERRIMDRELLIEIGVEELPAAWMPDLTVQLAKRLEARLKEYRIAPGAPVESFTTPRRLTARVAGIAERQDDLDETITGPPVSAAYGADGQPTPAALGFAKKQGVPFEQLTRVKTPKGEYLACQKRHRGRSAV\n>SRR5947208_11212059\nAFALSNPPFRESVVDVGNRILMIHETRIQREGQKPAELMSFRHLANRVSIAICFLWPTITAIPALAVEPYIPLSLAIRRNSYQRKASAALATTRCCIKKNAFICVAIILYFVKRRNPLRRFAPQLCARFARTTDALPPYPAVSRLYLLX\n>SRR5439155_26842666\nXLQDDATDQGALRHARHRVRRCRQPPAPGRASSGVNGALTPMPSALIVSVGGTPDPVAFTLREHRPDFVCFLASQRSVDLVGQIKSAASLPIQDEKVLVDDADDLLACYRAALDCVGX\n>SRR6266480_5487073\nVLAEANVLPETDMDYFGDDGDRMHMMFNFQVNQNLFYALAAADTRPLIKALKATNRGRRRHSGGSFCEITTNLTSVVCKRSSGKPCLRHLDRTNRCSFTIVGSDAGLPQCSGAISAGLSWPTVX\n>ERR1719433_450597\nTGCATPKEVLTAAAAAAATAAAAEVAIAGIAAACSVQQFLSPKQEKQLGSPWNLPRGLLSRGNATVPGVRSCREGLAPAGTTPARRYAAAAREPTWSSRVWASAGPGQAGPVPPHSGGSWSVGARFRMQLGTSPGATRVHFRLIR\n>SRR6218665_3920812\nXMARAVTRIREENGVSATRRFVVPIAIVMLLVGAAMVAVILYSARKMDENIVSSQTELIDNSLNARLTRSLSEVRSVAWWD
EAVTKSRGTIDTGWLDLEVGAFMTESFHHDRIMILDEQNRPVYGYNGEGRNVSPPITDSSYTEGATEGTTERRYGRSAAAVVRIGDHGELASAMAITPSVDMSLQSARPRILVSFIKLDQAYWAAAGRDMLLPDLGFGRPSGERRGDYQLKTDTGQALGTLTWTPRRPGQLLMKNVLPLVLAGLAISLLVIGAFARRLFSASRAIEAREAKAQHLANHDSLTGLPNRRKLEAEFARFTDAAKAEGHTLAIACVDVDRFKDINDTLGHHTRDQLIPSLADRLRRAMREGDFIARLGGDEFAVMRNCRDAEDGEGLLADLRDCFRTPFRVVGHLVEANSSVGVAFAEPGRSFDDLMREADIALYEAKASGRGCDVRFEAEMGQKIEKRRMLEAALKPAIAKGELSVLYQPIVEASTGQIASVEALCRWNSPRHGFVPPDVFIPIAEEAGLMADLGRVVMESAGQDSLRWAQARTPINVSAAQLRAVSILEYLISPTEKYGVNPERITI\n>SRR3989338_8474758\nXMKHGEMARRSRKPASSCKSRDCLIGSTEDFYHVEQLRDLLDNKLPLPLTVFGHLCEGKRVGRQTIERAVRDLQAIAVQFKTGPTKAERRGNMTTVGSQYRGTQEFLRVYRQLITAAEHRGLVTYTQVAHILGIHSLGHHMARQVGQILGEISEDEHRANRPMLSVVAVGSGGMPGEGFFGLARRLKKFSGSDPSSKRRFWATEQERVYKVWQPEXX\n>SRR5215472_2857866\nAERGADSKVRCRDEYDYASQKVAVCASVLVVGGLLVERGAIRADDLAVALQEQESGDRRRLGEILVALGWCRQEEVSAAQQILDSRSRATVVFETVRVAVDVLDTLTVLQCSITSVITHVNDISGTIASAAEDQSATTRETTRNVSEAAKASDEITSNIAGVADAAHGTANNAHESQKSAEDLAQMFSQLRSLVEQFKIDRNMSSARTRTAHSRERQPGWX\n>SRR5215216_7579447\nEGYLQHGNTHSDRWASVRWQACTPSLPPSWLPFRWRRARFASLFLSLGVATPSALDWQPLAPSSILYNILQLYHQKGAGVATLGLGLRVLSGPQQETNVFGLQSLAHPTHQVLVQPVQVGLLAQPRRRTRSRSLLRQHFLHYFSEDVSRGQRGIRTSMRRHICQRRRGGPLRSRALRLRVLRAMLPSALLMSQLSSDPVHRMRSFFSDYX\n>ERR1719150_3364345\nSSSSSSSDKILWFPFQPPINTGCGGVEVEVTKSTGTMLHSAAPQPFNMFPFGHPAQHPQTSHPGDMFSHPPAHHHNPQPAAQQPEAAPKPRFLFKMPRVVPNQKEKFESDEFLKRHSREGEVRYTGYRDRPIHERQNKFLNAARDGSTEIAFVATGFNLIMNFDTSSHFNPAHRQCDFDREVGKLHLKAPMILNGVCIRWRGWLDLERLDGVGCLEFDEENAMVEDAKLREQVESYNRRLREFEEQSKARSRHLAGLVSSQHSQFPSHHHLQSDILRRLDLDILQGLFPPSTANSLHTIICSQTFSLRLGRSRSNLQQRPSSPSDAGSGARLHQVHQAPEKQLPPVEASSLTATTTPSPTFDLLPLLGLPHPPDFAQHPPPALWVEVTEQQASLAAPLPAGQARLKQTNTSQSFGRRGTFRPGTCLEKINASKLGGDLLRPKKKLDPWTFVRASQLSAQMLQYHNRX\n>SRR6185312_8718178\nQPVGHAALSRFVSPPRSKGIGWAIAGYFRLTTACLLRIVSPQSRLACVGGQLPTHISISRQSRLQFAQRDVLQRFLDEPSSYSVAEVKLGLSKLQPEIARRIKGPPSPETHSFVATAVRSLGRIKGSSNCELRIQCLFDCAIYSYNNGDTAGFVTSIQLLDELGKYSNSPSWTRRIQMFGGVCHADIGNVAEAVMRYAQALEISRRANDIPGQVATLCNLGGALNYGGLHREAIPALRLAIRLAQX\n>SRR5438132_4135
51\nQGQANALGNLAIAYHETGKLDDALNAYQDALGIYRQIQNRLGEAATLNNIGIFERERGKLDVALSNVRESLAINRQIDDKDGIAEALNNLGNIYRDQGKFDLAISSTREALDMYREIQKPMGEAICQTTMGEIYTAQGKLSDALIALQRALELDEQAKYVPGIANVSGDMGIVFAKQKDEGKALEQLKKAIDLYVKNGIRGPELKLYQEWVTRLEGGTRTMSRX\n>ERR1719318_1879121\nKVIMVRADMLVHHATIEKAITEYDDDDKVIICSGSEKTIVSKRILILFSPIIRTLIASLPCCTPATIMIPEFSSSAVQHLTRILETGFTLGVPIESFKQVYEIIDLAKSLNIEMSDLRREVKAKVLEDEKDVKTEETHLVNNEVVNATNEETEELQSDKILILKDKQKTISKDILSFISQFRNGVEKLTCSECSETVTRANVVDHFKEHIMDLNQKIDELSKGNQSSTDKEEKITKKPEIATPAEAFKTESELDNVDIVTDMKVEENYVNEIKER\n>SRR5689334_23174827\nGRGHRGREKQISHLQARVSRQLAQQRRSLVMGLGIDLAVKDLRPVTCLRRDRDAVVDNLRISRNLLRYGQDPREVDAEVHAASLGAVSAGVSGRPGYRSSPTSASKASVYAARNDEAPAMKAARDWFTSASIRS\n>SRR5271157_4508164\nRLKHGFVARSTSIGHHVGKWRAASGGTIERCAPRLTRRVERRTRRRVGTRKLARQGGSMPEELAYARKASGLVRGLSFWDVLGIGLAFLTPIYAIWYVIGFSLSVFPRAQLLIAIGISVLTVVWASPIVWGILGGTMPRSGGEYVYNSRIITPAVALGASFAAIVAQFYWNLFNASLLGVPSLCTLGQSLGWK\n>ERR1719433_1034072\nPSYRVFVGLFTLKKRLCWFVYIEKMAVNDHPFILTSIYVAYLFLMNLGTMVGNACFGCKWWLDVILLKGDQAKNHSCTDAALFNHTQHSYTYTLGFVVFVCGLAHSWVDGDMETDAIYGPPAQDVATALGVWFLLLAVVNFYTMLGCSAGCGDIKCSEDFEFFNILVNLCFDLLLAIWLLLYSNASWSDEGEPPLYDWRVTKVVVWVGYVILVLCIIGDWIVQSVRKNIMGCGACGMKCCDDESQEVVGVGVNQEEVMPMSPNAQGMQGGMQGGGQGQVMVSGNNFDTQMVDMQQPQYGHVNYNQQYGGQPVTYGHQQYGPSGQSLMX\n>SRR6516225_9276130\nSAPRGTRRFGFESQAMIVNFPRKNIRHDIKTTALGLLPAIKTTRDIVEEIREVLKQVLAAIHNEQRRRRLRFQVFPRLMTKAQAANYCGVCVESFAVNCPVEPIRIRSGEKSVRWDTHDLNEWIESKKQDLIGSNGVDWLKRVGX\n>SRR5215831_4168361\nTDRRRGDRGFDRRAGGQVDPVPRRRAWQGPVPAAGYRRRVRAVQAAGRGRRTGAAAPAPRLVCGAGGAAGGLRARPGSMAHRPGRRSREPSRRLGVLPVGPAGGGRGGEDGVRPVAVLGNPRASHRGPPHPDRAAGQAGPGRRGAAPGPVGRRLPGAVSRRHPAARALLEAGLSAARTAGDIGAEAWASSFLGWDLYYFGDTKAGDALAQTALKLHRESGDQVGVVYALAQIGFTRLCAGEALAAADAWGECARVCESSGNVWFHAYAQWGLGVAALLRADYDSAAGLECAALRTMRHMDDPMGVV\n>SRR2546428_4767028\nGRTVRAIGAGGEQKVEPLGDRGWMGDPRPQPARAEEVPQRDFAAHPVAVGVDVRREGDAPARLQDARDRLRGPGALGGNADAICGHDNNISAAGAASRLASSAQACQLPLQHAVLAAVAEVNPEPDYQPYEQPDPRVHGEKTNITKTGGLPQQRPHGDD\n>ERR1740121_3388036\nPEPPQMAPPRDSKPTGTAWPQGNSLQSLAGVLAQIDRAVWDFDISQD
ELQAKFYEALEARKRCTEIVVEGELPEEEWDWRPGEDDGAVLALPPPPLAPPAKRARPSLPDLNLPVQEYGNVQEVPKHEKGPRLELILEEVVRMLKEAGGRMKLQDLGTRRLMELRKGACGNLAKFLYTQPETVFVDDSTNV\n>SRR5579859_1509829\nSCQPEVEVREHSTRNSLPLRARLSLQARVFLFALRARAGITCCVFYPGETIRLLHALPDSGLPQFAEGRVLSLRRDEHNQIIDVEVDFHRDSHTLKAELPLGDVELVISDSSLAQTAVFWGLDEPPRKVIEAAMHSLLDSGFLMRDGLNLVQLHYDRENRWWKWGEKLMDPTGALVATAAAAWDGFVVAFSGQQRFHLEFRQQRLREAVRMLHERHEVYLEQARTTHPAMSLMRVLLNLSNAAGARYCAFPVATPWIYDQDFASVLRPPLYPDFLLVPEKELPRSISTPFRLIRLTGQRSILTVLPVKSSPTETGFERSERELQVDRLRKCKALGEKYYDQMYEARFGTSGLYADAKDAFRDAIAAANELGLKEEAAELEKRLDHIKAVYRSQFSX\n>SRR5256885_8719643\nRKKEKGPAPWGARASPSPELLRGCGSGAAFFVRVFRGIAGGLAVGLTLRLVGFQLVFVRLDGVFVAGLAIGFDLVLVLLDLLLVGLHGVLRGGLRERGPAERQESGKDESRQQFHTSSCGVGLPASFNARTLNPDDTQTGPAFPRTIDDAMTRQSAIAAAQKYFDAGGFHADLARRVAIPTESQNPERQAELERYLETEMAESLAKLGLQSRIFPNPRGKGGPFLVAELLEDPKRPTVLLYGHGDVIRGQENEWRPGLGPWTLRQEGDRIYGRGTADNKGQHTINLAAIETVLRTRGRLGFNLKVLIETGEGMGSPGLKEFCEQNKALLRADVLISSDGPRLQPQRPTIYLGTRGALNFHLTVELRKGAHHSGNWGGLLANPGIVLAHAIASITDARGAIRAPEWRRGRRX\n>SRR5258706_15926144\nGFGAGGRAGLGAGGPPARRFGAGGGGAGGAGGRGGAGAERNDRRERGAQVLEPPRQVVENREDRTSHSASSMPSGRHHCHTAQRDNGSPFIVGLIVVHCGEHGGELEQLPFKTPPRX\n>SRR3972149_2856803\nTVYNAVRQGAMPRMTDERVKQLQDEILKMPQAEGSVRHIFMPGIYMRELTIPAGVVSVGHNHRYNHISMLTKGRITVLNNDGSLTELVAPFTMISSPGKKCAYSHDEVVWVNIHAAPCTDVETMEQLLYDWSDAPDRIKELPDNTSSDDYQQMLIEWGLTEDDVQAETQVDNVAPMPYGIHKCKVSDSKLHGKGVFATANISDGELIAPVFMDGLRTPIGRYMNHSGNPNAVVIKAPNGDNYLMATRNIQGCMGGNDGEEITTNYRETLRLLGGAGWSGRRDPSRAARASREACRSCPRPISPVP\n>ERR1719162_375500\nLMAGALSQPSHVDPLPGWDFICNGYVPGNLPGREGLGTTSPQWLGEVGCMRACENQGRCDFVTYDTFNGNCWMEIIPDRPTECDSNTGGWAYWRNSQPAPAPSPAPVPSHVDPLPGWDFICNGYLAGNIPGRQGLGAASTQWLGEVGCMRACENQGRCDFVTYDNLNGNCWMEIIPDRPNECDSNTGGWAYWRNSQDEVRRRSTTQQNDVRRRSTTQQNDVRRRSTTQ\n>SRR6266849_10918975\nVQMLGPQAASQALAVLEAGREEPLGLVDHLFSPIRTKAASIVPSALSRCSSMGLSGWHPGAPSPARCGARRAAPGASARGSYAERTTPSAHPDRLPVVQSPPLEEVAGIRGRPALRDQTGGPGFQGEDAPHPLVLRGLDMDVRDRDEDLVQDARPLKRREDHCPALTVQVAHVELVEESLVRADEPARLDPLLAGEEERDALSLTPFRAKTARAGVRRDDDR\n>ERR1711972_1082418\nRSKGRAMPCCYMEDGA
HQHHRKRCLGRQDLAPNRAKLTTLAPLASWPSWPLPFLFRISGRPLSKLGSFWAAPEQALGGSAFDLAWEPSESAPRSPLRQRPAQLIMLGTLKPNLSRHVPPGADAPNTLMPTKASAHSPQPIVTAASTLILGTLFGKSASLQLSGCARKSSQHGMDTTRTFWRISLAASTQRCTSEPVATRMSSGSSHSTTAX\n>SRR5512136_1229453\nDTPEAEKAKNRVTRPHYTAHGYARSFFCQSTHMYLQTLSLENFRNYKKGIIEFSPYGAFFEGENGSGKTNLIESIHLLCTGRSQRNAQKKEMVNFNASYASVRGVFVSRD\n>SRR5712692_9023375\nTLGIERIECNAQDARRRDACGKCKVWLCEAAQLAMLTKLGKYEIQGELGRGAMGIVYRAEDPRLGRPVALKTTTAEVAGNPNLLKRFHREAQAAAKLTHPNIVTIYEIDEANGVPFIAMEFLEGESLQKIIADRANIPILRKVHILIDTCKGLDYAHQHGIVHRDVKPGNIVVLNNGQVKIVDFGIARVGVSSMTRTGVVLGTVMYMSPEQVQGQTVDARSDVFSLGVVLYELLTYQAPFRGDDVPSIFFKIINEPPEAITKYIPQCPALLEQIVQRALATDREERYQSAEDMGFDLQRIGDSLKRDTIDVFLQQGQRSLRQGDFTIAKESLQKVLEIDSSHQLAKSLLAQVREQIQSRQRAQKVDHNLGQAKEALQAEQYEDALSLFEEVLRLDPGNEEAKQCKQLAVERRDRSEKVRRHLERAEKLAAEADFQRAKAELEAVLTIEPGNAAALEMIDWVVKELTEQERLRQVRQYLEGARAHLAGKNFVKALETLERAREIDPINIEVEALTRLVRSSQEKEERRKVLVTRVAEIEEALSKGKLDLALACVEQALREFTDDAQVLRLHEQVLRRTEVDKKRRYVEEQLQAARDFVQKNQYSSALAVLERAIQAVPDDPRLGPFLKTVQESQEQSVLEASRRDAVREANEQIRAQNFLAAIETLEKSLVRAGQSPELIDLLQFARERYAEQQQQERVRQALARAHSHLRDEQHEEAIRVLARAQDELKSSEIDALLAAAREQQEAFERRREEVIASALKLLQSGEAARAVALFETAPKVYFTQEEFQRVYSQCRQSLDRANFVHSAVEQAEKSLAEEDIGSAHSVLEQALKPYPGEPALLALQKRLREEEFRLRREERVKLLEEAQVAVGRMEYGRAAELLTSVTWESRDLPELAVQAELLLEEAQRRERERQVLSRAQGYLRNEQYVEAEQFLLGIRNELKTGEIDALLATVRKEREAFERRREEIIAIALQFLQSGEAAKAVAIFEGAPKVFFKNENFQRVYSQCRQNLDRANFVHAAAEQIKKCLAEEDISAAESLLEQALKPYPSEPALLALQKQLREEEFRLRREERTKLLEEAQVAVGRMEYGRAAELLTSVTWESRDLPELAVQAKLLLEEAQRRERERQVLSRAQGYLRNEQYVEAEQFLLGIRNELKTGEIDALLATVRKGREAFERRREEIMAIALQFLQSGEAAKAVAIFEGAPKVFFKNENFQRVYSQCRQNLDRANFVHAAAEQIKKCLAEEDISAAESLLEQALKPYPSEPALLALQKQLREEEFRLRREERTKLLEEAQVAVGRMEYGRAAELLTSVTWESRDLPELAVQAKLLLEEAQRRERERQVLSRAQGYLRNEQYVEAEQFLLGIRNELKTGEIDALLATVRKGREAFERRREEIMAIALQFLQSGEAAKAVAI\n>ERR1719240_1252999\nIRDTTRGVSDFDYCLCGEAGAKFLVWLHDCTNKLINFEDRDHFDYEHEVWFRPPNATCASPKVKLCAESARCTLCVDPVADDHTFLVQLFGISQLIKCVGPREYAPRLPVVYEAEQNERRSLX\n>SRR6266511_3081427\nSAPMTVTPTRIFLRYGLIVSVCCGRCLYSLSPRVASETSGADHQVVRITSLAVAVAFMLIGPLLS
SAAQEDVLATLRKGHPRLLVLDDDIARIKKQIETDPTARKYFEHLKIAAEKVIQQPVTERVLVGPRMLGASRAVLARVTLCAGLYRLT\n>SRR6185312_7578494\nSSDLCVHGHEAGSGDRAGGGRGSRQALLRTARLAPGRGDLPPDARDIPGPRPGSGATKLRLVRHLQGPGRQRLVGPRGPAALAGTVKGPTTMGATSTEPTSAELIRDLLEQAAAAHGMHEREIGRPDPDWPRWYAEHMARALRAGGYEVHPSHGDGGTTLPVGSRRPELAGQTVVVIGGSSGIGLETARRARAEGAELIIAGRNPERLRTAAQEIGAQGSRAFDATHPASLDRFFQELPAHIDHLMLTGGGPSYGRLVDMDLADLRRGLDEHILLILQVARRAATKLRPGGTLLFMAGTGARRPHLGLGIVPTVTAALPALAASLAIELAPVRVNSIAAGFVDTPLSASLLGEDLERRRDQLRATLPIHH\n>ERR671919_521420\nXMRGRGPGEASRRAAPRPFFPLPPRAAGRRGEGSCLSLCFEHSGGERILGRFARPQHELEGLIIALASLERSPKQRLALAGMGVGAGEQEPVAIEQKPVLAPQIEMAKPELLVDQRHQLIDFREPPLRDLEIESASEMQRLQIVAPVQRDVIVAPGARDGQREFVRGGALEAPGMNGGDVLDHIHWVGEMVVDRQCRSHTSPLWPRQSFAFPSCPSANHFVNQLYIGESRSTNAGRDPKTGFAKDSCGLRARPKPLEARATPQANDARTVKTFGASRSPGPAQESLRLLGEALDDGGLERRDPLLQGLVFLARFLRHRLDGLELLAL\n>SRR3990172_7588517\nRRCGNARSPARRVVVRGSVKPERPAMSIVRSSFLAALTLVSLTACSGTTAPTGEAARQGVVVEVTPESVSVSSGVAAAFDASVTGAADTSVRWSVLEGSPSGGSVSAAGLYTAPGTPGTYHVVATSSADATKSATATVRVAAGYGGGAGAGGEGGGEGACRDEKLRAAG\n>SRR5439155_1739346\nQASVPVESARTGLVSSSLKCSDNVAGSKRARRTARAHRCGTVAGRVPTAWLSQSARSTSREPAHLHPQTARASASGDRRDRPGQCRGRQVVRRGGGLRALLPRRTRRPRHRAPCLGAPALGLCARCPGGDGPRSGTDGLCRLPKPRSARPDADDQLGEGDHSVGEIAPARTDRELAKLRGSARTERELSLLRGAIDADVTELRTRISRDVDPRRLARRQPVAFFGTLGSVIAVLGFAVASRVKSFRRSRTETELDQVIQRLGGRLDRLKGRTRKRFRESLRKEIGEVESGPRAKQMFWETATAALVSAATLLARSIASRTVGIAPATAAPTTNAKRLMSTSGRAPGAATSNSGNEITTVAVMSAPADSSRAPRRRAMRGPTSAEGENARIVTAGSSTX\n>SRR6185312_8989730\nQIDAVAGFHRGIDNQNPYSADENVPYVYYNYERSLYDFADLEGTSQIAKCQDGGPNDPYPMIRNCPVTAYGEQGLGYLERDTKDRTSLVASITQRVKAAGYHVIKAGVDAEFETFDINKNYTGGVVWRHDAPSVATGANGRWNQREFLKVVRNLTPAEIADPTSVQLDMGQLLCAGDRAICAVASSITANTTDSNYGAYLQDSWQLRPNFTINAGLRYEDQIGYAASQLAGQETPVGEKVPSQVFNLNDLWAPRLGFIYD\n>SRR5258707_393308\nGLNSGQPSLDAQNVGATAARAVHAIADRAEVVAEHEPRIARRKGVNVAEHPRFPLAEDPQVTGITGGHPQPGRHVHAMLSAGAHYGVELNHVEAVPDPAAPVELKDADQQLDQFLTWHGLTGRALPAARGNDQSAVRTEIDAAVLLLHPRGELQDKHRRPDQDRLDALLPIEEPLDQLIGEEPSVPYVEFRRVDEVDDAEHIGEPEVGGLNGVGPEDIEAGRPLRVKVEDLQGGGDAAEKPLERPAVAVDHAP
AALGPAARAAPELAVERPGHQVASLEDRG\n>SRR5213594_1844093\nNPGSVCSRIHRHVMMACFNSRLLLHESQKRSPTPRVSRSPRYSTTQQLATDHFRATGHSIPYQRPFLAQNRSCRPASQPGLGLRQDQSTIQYTFAIQQPRPQHLPRGLAQRIFSQPPRLSTSRLPLPHGSPRRSAKNALLSVTSPQSAKPRKWPPDTCGIAFEKLILKAKHADPIPYCQLGKMDVVKASNKNKALTDFRSEPQWPVRTPTPPLRLGVCRGRRRYKRPDSHPIRGRVDRRPASDRYRPVAIDWRACVAX\n>SRR5947209_20053041\nNACENYSIICCYSDGYSVAGQLISTRSLPVCCFFFFNDTATTEIYTLSLHDALPICQRTIRLVSWPQVNHFALPPLFRGSEKGRSEEHTSELQSRQYLVCRLLLEKKKKDDAKRKKIHHVVILDSKERSTEWX\n>SRR5436190_7157327\nPSLNPAPESLPSSRIVDLMLSVHKDLVPVSETGKQRFRSQFYSGRDLDDVLERVQRAGVFKREARIAGGLIRPTLADAARLNEERRAAIATALERTSEGLGAILDEAASVFRLPGRIDLRIVIVPGDGPCRFFVGAESLALSAPPGPGDAILLRAAIAIAVGCQNDMIGPMPRGIVATPCDSFLLAAIALQLAARGWVTSYGADVLESAAQRETFATEDDDAALQLCRLAVAVRPMFDDVYVRKTSFADALVAARHVWRGLYAIQYVHGAPGEIPEGW\n>ERR1700739_2321498\nXMRAVMDRTAPKRFAHSNRPARTVAGPPRHRKAVAGGRGSRIRTCDLQYPKLPRYQAAPYPAGSRHWIAFSPAPSKRRGQSMRFAENRAADTVACLDTEAAGDAGIDFEDRADREYGRDEVIGHRLGIFGDAYDPPVA\n>SRR5579862_6422017\nTRLYREAAAGCRPARREFLSSPCQRSEYGPAPSVALPPAKPGGRSEAQPSVQSQCISCLFLLNPLHHYVFTLFTWAMQRIGWGNCLAARWTRSFFASQGVPSLPGSSAAQFPLRPDRRLGKSITGQL\n>SRR5258706_10244772\nEDAVARVVGALEEDFADDALPALLEAVGDLDLVFLAVEAQFGFEELPRGRPQRRVRDVPALSVVLPQRPFVGVLRRALVALAGREPADLQELRLREEEIDGLLDRFLVRAGRIGLRLEGSDGEFGNPVRLALVDDDVDHHVAAIRRELQRVELDDGVEEALVAVDLAHREDVGLERVLDEPLALPVEEPWAVELDAGELPQSPLPEPGPGLGKRVIPADLH\n>ERR1719491_1280783\nVRDVLGRPSSLLLDCGHGPLLTAACAVRPFAPVQTVEGAGACTGARCEDPSHCRSKWGWCNAGGSYCNKDSTWTSACDGSATTTEAATTTQEHDATTSTFLPRGACTGARCEDRSHCRLKWGWCNAGGNHCNKDSIWTSACDGSATTTQAATTTKQSDATTTMRAATTATTTRVATTTATKPMLADLAPCTYSKTFTHAGWPVQQDSTDVAQMVDRCQGQHFVNNVDAATCVINSNADGYDYDKWTPQTACPYPLGQSPDVSQAQCQAEFTRWKSMGVRMVSLAGGVEAMTGIGHGVFNGVRGECALMEFQGRYAVIMQVDIRSWSMEFTEQTLNHLTNNVNPGGHCFVPNVKVIDCATVRAX\n>SRR4029453_3979317\nAVGLDPETTVQEFLDEMKQSENEAARVASTPSEVTPEDRAFLERQKRAIRLLQIAGVLVVVAAGTGAALAYMKWKKSAPADAPAAAVAPPSSPSPPTNSPAPPPGPPRPPGAGVSAPAPKSSTTTPASPPPAAGTSQSPPVTVVPPEAPAPVPVPPAPAEPLTIEFEGTSACFV\n>SRR5437868_9650668\nPNSHYSTHIIDILSLLPLYLYMQLLYFLSFFFNAPPTPDISTLSLHDALPISHLRSPETRRHRWRGRCLS
PRLAGQLGKGSDHADRKSTRLNSSHVSISYAVFCLKKKKTLNHRKYLAYDYPSLINLSRIIRTLL\n>SRR3989339_1542112\nWHFLFFMDLFLIHCKSIFLKNKIERYLRVPYDFMHTGLFLCYTITMTNELGTLYVVATPIGNMEDITLRALRVLKEVDVILCEDTRTTKNLLNKYDIHTKTLSYNAHSSDNKHSNIIEMLREGKNLAMVSDAGTPCISDPGVLLVAYVREEFGKEAKVVPIPGASALVSALSASGISSAEFIFIGFLPHKKGRETLFKEMATTNRTIVFYESTHRILKTLASLDTFCKNHRVMIAREITKQFEEFVKGTPAEVLEYFTVNTDKQRGEFVVIVDPKX\n>SRR5438552_9638688\nLFRLVPVAFAVGAVPLGPPPPAGMAGRDFRLDGLQMELAWIPPGTFVMGNAEGDEDERVTTRVTISRGFWLGKDEVTQGQWDQVTGDDPSGYRDAGPTVPVENVTWYEAMAFCHRLTESEGVAGGRLPPGYEFRLPTEAEWEYACRAGGPGARSTATALDEIAWYGGNSHGRTHPVGQKK\n>SRR5580693_6454278\nRTLTKLCYILFVWNVDSALFSQKLLLSGQCLNRADQSPGNRNGQKATKVFGQTENMKTLKARVLSVLSFQPFRRGNKSDGQSKDTIIKFWRMRCSYPGPETPYECELREPLENFASKKYTVGLNGFVEFELLSKPNVAAGDSIQIDAYEPEEKILEGGNGEHNPRAGAIDDC\n>A0A1H1AGA9_9GAMM\nMATSKPHRLSSCIALALHCARAGIIGGLGCAAAFSAYAGCDSTAPVSGQTVTCDANVPNPQTTGVQAVAGSTGVTVNIVDGATLQIAAGPGVQVRDQSQVNNDGSINLSAADTFDAIFAEGSGNTVVNTGAIATAGGASDGIQSNGSNNTLTNGVGGSIVTTGANANGMLSLNGSGNALANNGTITVSGAGSSGIRIDGAAGGTNTVVNDGSIASQAGIGVLFNGSAGSTLINRGTISGATGGVTSGTGNDRLEMLGGSISGAVAQGAGDDTLIISAGQLSAVNQGDGADRFEISGTGSVTGTVQQGSGIDTFLMSGGQLGALLQGDNLDTFTMSGGRIVGAFEDGDRATMTGGRIGRVDMKLDDNVFDMSGGTIDGNLVTGFGNDTIRLSNGYIGGNISVSGGNDSITVTGGTVRGEVRVSAGDDTFEWAGGGVIYGAIDLGEGTDTATLRNLNQSHLGATPSLSGGNGVDSLSFANVTSGGVARFGNWETINAGNDTELTFDGNLVLGDAASGTGVLNVDASSTLFAGNGASASLMAFGAGQLATVNNAGRIDLTNGAASATDTFTIVGNYVGNNAALFLQTQLGDDSSPSDRLVISGGVASGTTGLEIINLNGSGGSTLLDGIMVIQAINGASSSNSAFALMGPVAAGAFEYFLFKGGVSGGTSENWYLRSTLVAPPASPPPTPAPAPDPLEPTPPPVPPTPPEPPAPPPPTLPPPPPPEVPDNPDPEVPPAPPPAPPTAPPPAEPPAPPPPLPPVPEDPAPLPTPSPEPPPVLPTPPTPGATPATGTVIPLYRVETPTYAVVPPIVHQLGLATLGTFHERQGEQALLDSEGALRSAWGRVIGQNTEQSWTGTVAPTFDGSLWGVQAGVELFAREGDDGRRDHFGLFVGRTRADGDVRGFALGWNNLTVGQTRLDDTHLGLSWTRIGTSGAYLDAVIVASRYDGEATSSRGIGIDLEGDGVTVSLEVGYPTRWGEDSRWSLEPQAQLVWQHVSLDRQQDDFASVDFDSDDALTGRIGLRLSADYSTSAGLLQPYLKLNYLRGFSGEDRLHFNTDIVETDQQFDAVELGAGLVVQFNANISAYVVLDYTTDADDADRERKTVEGNVGLRITW\n>SRR6266849_3749832\nXMGRGKSYLEESHELQEGTVWTSVQGNGRSGCEDGHDGGRGAGVADCGRRRSGDCYAKLARIREAGETNGDNTRQILLQH
QGADAGGAGASQAIERKTDGGAEADRGVGERVRIPVWPGGRIAGGIGGLGGGGEQVLPVFX\n>NGEPerStandDraft_8_1074529.scaffolds.fasta_scaffold152358_1\nMAGSTAMARRLSPCPALPATARTAAGPGPGGGSGRCAGPGRHLGVPAPELGELVLRAQIHELRGEVDHAQGGDVRHAERLSGDEAGGRELVVQTAVESPGRTLPLLLRRGNLLAVRQQPGHHRAVDPRLAHGAEQLELELPVGHVHQADRHRVGAEQGRFRVERLEITADGHGFGDAGAVVELQHRHLAAGIAAQKLRRAVLAAPHVHLDGGHLDPLLGEEHPHPPRVGRRGHVVELQIRLPGCRX\n>ERR1711990_8348\nFQLVSPGTNDVNRVCIDIDPQVVIVPHHYHVHPEGHPRDTGGPPSLPSRQESPCPVRVAAEAVVQEVQVSLSSHHQEVSSAPLHGDGDVCTVALPPAPHIHHPGLHVQFPLESQQYKYGGRVLQLFIFLCNQFDL\n>SRR6185503_5987732\nGQPRAVRAHAQRAEREELAPAGERVAVEQHLLAVEGSAVRGYRRRGLVRADGTPALDAVLLALLGAGVVPVALLAHRQREVGLLGARLDLGEERLAQGGQVPRGGVGVRVLGLEVLGRRRVFLVPEPGVLVDHGVDVDRPFGRDGLGYLRLLSRHVDDVTIRSSWNTRSRDCENPEGLRKYLSGHCQ\n>ERR1700694_3206782\nKRQRAMENLFTGADQPRKLRRQPLSGLRKWTRNYIPYLEVLEDRNLLSAGTKGFGAQIRDPGFEMPAAGTGNILYDPPTSPWTFNGSAGLAGINSGFTAGNPAAPQGPQVAFLQGVGSLGQTTTFAAGTYNVSLSAAQRGNGLASSQTFQMLVDGTVV\n>Q19Z88_9CAUD\nMTLDALASLPGVAVIQLPEPTEAVTMQDCAGSGKPFKPGTLSRDGEVAKCSACRTNRYVRDDGSMWAPSGARCCGCGYRGESMILSHVRTELERSRNHRFYDRPVNKNVQAMYVWWEYMDEIDLVNGENDTMRITLTEEEVHPPPGDLFHEKPKVIRAIQTWTKISLEYQINGAYVDLRTLSAAESIRDDRWIPLEQYQIQRYCIQGRIRPGGNGYEPYRIVILAGEVSPPGVWYPWPGQPEGVPNEVLDGTYHGMFMADK\n>SRR5690554_76201\nXMRAYLSRFVLFGGFIMEIIQNIAVAIDNLRISKGLTVSELCLDICDESSYRRYKSGNRDIPIAKIKQFCDKLGIGLDEFLYNVSVKNSYEYKKIHKMFLDLQSKKYDEIRKSLPLIKVDDIGIDRNKVLFKFILYTYQYETKKITSSNYYELLLKLLPEQSGFYTFNDLIIFEKLALLEVNQNESPSLKILLDILLNTEKLYVTNTNQYVLATTYANVANYLTKRKEYEEALKICNKGLEYSKSFYVTKNIHYLYYLKAYCLFHTEDKEGATFNLSIVISWVFAIQDEYMSNYFINLIMKEFNMTKSMIYQMHQKVLANYLX\n>SRR6185369_2141686\nSSDLRAGVEVRQRRQRRLRDAREVRRQALAVRRDAALLLLRRFPLLDGGVERRLGAGRDLRLLDLRRLLDLVLLLLGFLDLLRRRRLGRVLVLRRGRLVLIALGDGLARRRAAAHRRRSEQQRQPISVELLHYFISSCWTGVLSMTMS\n>SRR5262249_26280313\nMGRLQTPFQSKEDCMDDAEAKVIELIFGSWRSQLLYGGVQLGVFDALRRGPVSADQVARELQVDARLLYRLMRALGSLELVHEDPHQHFTLTPLGEVLCRDHPQTLRGLTLLEAGPEHSAAWMQLPELITTGQQDAFGREVGQPVYAYADQDPSYAAVLDEGLNTYALLDNPLVLEALAAYDFAGIAHLCDVGGGHGLTLCSLLVQHPHLRGTVLERPHVLAQPDAFWADKLGVSDRCTYVVGDMFHAVPPADAYLLKRMLRHWND
VEGGQLLATLARAAPAQGRVFIIEQIVPGPDTPHFAKLFDLHMLILLTGRERTLEEYTRLLAGAGWTYRQTWYPASKQLGVVEAVKASDFNVLGSEQSEINGFEHHRLFHRLRNPCLIIHRASYFRSCFAEREEILVDLILVRRAHAVRRALVDRALGQFIRLHGKAVAQRGMPHANRSSIFTGSSRTRMPVACX\n>SRR5882757_3079952\nDAVEDGVAGHFQGAFQADVAEALVLEVLEDLVADGHRRGAGVLAVDVVPGVDRRGGGHHLEGGARGGDAAHPLVGVVGGGAGHRDDLAGVVVHHHGRAGVGLVVLVGDRVVGLAGVLHGRVELLFGDRLDLGVDAGDQVVAGGGRGVALLADHPAQVVDLVVGDAGLAAQLGVVRALQAGAADLVRAQQRVVAALRGGQLGVGDRGEVAEHLRGVGVVRRRVAAYGGGLGGDAREVLAALHDLQRLLGGGLVGDRDRLVGRAVPAGLRGLRVAQPHLVQHVLRLHAEHVGQLRQYGLAVVALLEQVGPVGGDHQPGLVVGERHPAVVQYRAAHRGRDDLLDLVARGFLVVLLAVADLQVPQPAAEGEQQGQGEDLQDDQPDGDPRGPAGLRDVTHLATRSPGRRIDLSHLACAPEQAALGGQAGSGGTHAGAVQASGPGTRAGAAAGAAQTAEAATEAAEAPAETAGRVLGQRVVV\n>SRR3972149_160959\nLVNCWPVFPSFFFWWWSLRLYGSSGDKIRMRCEALLAAILLLAAIPIPTATALQNTALYAPTGDVQAADSFAVNGCTYAARHTCVDEIPPGPNDGDTTRLQSNVTQDESQIDLTAYWQLDPEDSVVGMRIHFFVKTLTGSWPIGTTLMIFIQENIGGGRICYFETFSPPTSTGSYRRFSYPAGYDETCINSDVNTWEILVVLDCDTPPNCSNWLRITSIYLEILYFDRFGFPSSPENFAWIIYAILIGSGCLIAAWRIKKWRETIX\n>SRR5262249_38322783\nGLRGRGDGRMSAAVRRVLCTVLLSGLFVTVTAAQDAKMPVPAERKKALLEGTHVFRRILYDNDCTSLKNFKELVDEPSKSILIVFGDLDRIADVPGGLANFVKDGGAVLLASDRPLVDRDARAQLLAVAGVSINVETVFMNPAGGQLYRGWPYCPFPDPAAGASPALFSGDSREGGGTLSVATNVPTHLVVHGRPRGINVLARLPANCQYDVTEAERQRGFWVGRFPHDRTFLVGGDVGDGRILVAADHSVFINEMMLPDDTNNVEFSINCIRYLRGGEQRSRV\n>ERR1700745_413936\nKTENVRIPKTLLLFVYYRTRPLPHLSGVRFAMAKLCTPCRRVDVALLDALDGSLHLDLITFSCNHYRPCPPHFPGPSHRVKSAGCLRLLLWRGLSPCIPVRRSRARSGSFFLARYDRLSRYALFGSPLSSERDNEYAFCPGDVVLRPRRGMAIATLPTWNRCRVGLTGLSRAGLSSSPAV\n>SRR3954463_761953\nGPALLDEQELAARMAVPGRARTGFETPAARDGARCVERRSLPGKPRRFRVGGGLLGAHPRGRSAKQHEERAGNLYSLHGSDTTPAKLVRLKPEATNRDRSRTLRQMNRRTFLKSSGMAMVSGLAQRGAAPMERTIQTPVLSIGFEESGSPSGFPIVLLHGFPDDVR\n>SRR6266566_9387372\nAPAVSCGQEKFLAAPAQPEGLVVQPLNNCIVFRAVIKPSGVEVNDMVSRDPCHLLENGIDKEYVITIVSNHNAFVQRLQNALHLFQPVRLYNIHDVFHFVHSATCVSCQNGHLAASLSDPARHKCVRRDRGSVPTCTSSSSLSRETRRX\n>SRR6516225_4656599\nRAVRADLSQRACHENATHVCPTCSNRRAARVPKAPCGMGYGNGRTPSCPLQRRSRKPRCPSRRARRARSSGRGLLSGRLDGGLPPCNLPAGDEAIGDGKNVVKYIDAFNHFFPRRFFAGVLETPA
ARKDMGKRIRGIPALWDLEVRLGIVDSFPDYSQILSLAMPAIDRLWDAEHAPEWARIGNDELARARCQVSAAFSGLCGIASDERAAGRDSGSGTGPAQRRQCDPA\n>SRR3954451_7163765\nRQCFDQLLFLAGVADGAPSGIDARRQSGVRDDATIPDASDEVVLTDDTFPVPDQIVQKVEYLRGDSNRVGSLPQLPPFRIQHEIRKGVKQMHPPVVRSQCKQTVRRMEGACKALLMTLAHPRARLSSMNCLRIPRHEGEYHEADGCTDVGCHCSEALDLGRMRSRLCEPRSRSMLAAX\n>SRR5262249_15769881\nVVDANFNPVAGGDDGDKVTITTSLSSKVLLSPIAPGLSLTTVLSNQSGMRLLGFPDVIFGYAQAPFADVLLNAYDQVFRDWPIDVKDKRTVGTSSMCTEASFTVTATVRATPAPGLSSHDSVLSAAGTLGAQAPPCP\n>ERR1719265_1088395\nSVLPTSHVRFGDRRNIRPLQGAKIVYRAFDPVAGWSPLLVNNHHSVLVHGGANAVPQSWPRVLPHPYHDGPEDLGIARGSGAHNDHHVAGGNAVPPTHASLDADLPDDIQLPHPRGVGTGNLEILRRRRREVHECDESRNGAHHQRKPFARTIASASLLHLATPRARQLPDLEATQPWLVDDGLSAGX\n>SRR5680860_510741\nGSGAAGGARPRYGAGRPRCRGGRRGGPARAGRPGRCAAAGGDPVVTPVKVWPYVVGAAACALLQVAVTLGFAATVTMSGDISSASPSEPAPPLPLPGLPTPGPPPSEPSEPPSGAYAEPRDDRPVVRLRFDVADDLTTVAGSETVVFTPDLRVCELVFRLWPNKPETALAGNELSVTSASVDGASVTPVVEAAGAPSGTTGTLVELPVEGCAEPGEQVTAELEFALVLGEDTPERVGWSAEESMAWFATAFPLLAWEHGVGWMRNPAVGLAGETVASETFRLESLEVVALEGLEVMGTGASRGETDVGSSGRVAHVFSADAVRDVAVVVGELEVSTTEVDGTAVHVAVPVAGSVAGVDLWESASVESLGLVSGYLGPYPYTDLWVTVVPDFPTGVEFPGAIFYGDVDPAVFVQLVPHETAHMWLYGLVGNHQGRDPWLDEGITSFVEAHVLGVSEFLVDQPVPPPADGYLGASMPFWAELDPSGDLYGAGVYGAGASVLASARAVADPAAFDASLRAYVSAQAYQIATPEDVREAFGSVPEALAVLEDAGAFAGDAGDPX\n>SRR6266849_1400336\nVRTCSTNSGVSDGSNRSLQAPNDLDSEMRIVNDRDLRVVIEHHLQQSCARPGTADDKQIGVSNRTVFAPAFVPDHDFSEPYSLRVYARFTCASNRTCPANLFRLSRATDPAEEKPPTSRPLAEGDSAGAIPQRNQVAGTPHRPQSRAARHLFGRGIVSFGIVDASPARFADHGHGAPNEDX\n>SRR6185503_8510077\nLVEAMRGSIAVDSTPGRGTTFSVDLDLSIDASAERPLQSARTVIGYAGTRVSIVIADDDAVSRGLVADFLAGLGFEVRRAPDGAAALEQLRNAATDLLITDLVMPRVDGIELIRAVRSGLSARAPRILAVSASASDYTSHEALDAGCDAFLPKPLHLGDLLDRMTELLHIDWQYQDTPAAVGQRSAASSTFALQRELADELYHLAMQGDIAGLVERANARLSDDPSACGFCDELRALASEYDTGGIRRMLSAHSPA\n>SRR4029434_6363074\nSRCAAVGSNTARFGGRESPGNGAIVNGTAFGVSGWALDAEDATLTVQLLVDGAVVSSSPTRSARPDVCAAFPSVSHCGSSQPGVTFAWNTTAVADGPRTIAPRATGPAGLPATSATRTEMRRAHA\n>SRR4051812_49403107\nHVVRHGGIAKAAAAGCGDLSSLSKLMKGLEEELCTELFKRNPFRLLSHGRIYFAALERAREVRDAAMDQIWTETRPTLQLISAEV
VTLCYFPGITRELERKHPNLQCSTESGGEEQIQRMLRDGDVNLAIAPEHEGWRGFQRAPLLELRPVLICPEKMPFRSAKEIWALPEP\n>B4ND15_DROWI\nMAKKGAVQQLQADLQNDEDFARFLERPGLLVLDVYSDWCGPCLGMVGSLRRVKLEYGGDNLQLAICKSDTITDLKRFNKRSEPTWLFVTGGKAVNIMYGTDAPKLLAVVIKELEKTLQKLPRSHVYDIAELQPIEVEQLRVKTEALEKLERIERDAKNKKQNDYLNQVTDAIMENMPDIGVTVFGPQVNRDMFKKLTEPAEPLKMQCKDRKVVQVTAEQFDIVNYACRNPMPPDVLEQLDGKELLMCFWKIDETVGTVPNVLAAYAHELTKERSAPPNEQFFEEHAIPPIISPMKIKFEVELKEGEVWVEDVSSEEEQKPVKGKKQPKLKSPTHQEDATPVPVDEEVGEQDGEEEGSEEDGPEYGADGLPSLPSMPFDIDLDLDLGDDMGEEEEEVKEEEPPKPLTRTKTVKMPAVWVPNNRRTHAALIYMFFRGQTTGFLAPDPKPEPPHIIMAFDATKRREIMHVVERHREEVPLYGYFTNDDPDGTELIANSTDKYDYYPEQLLSDKIVLKVNKVQSNMMLSLVSYGPSYVSPNVTAGHDEALKFFPDDYRQQEEPPADVKQKKVKKGKKGEEIPEKAREKAASLEPQRTTLPADAGAAVSADVQQPGEDIEKETSQTAVQGAEGEAAVPPTTEGEGAPAPEGESVVAEVTHESAPTEAAAEEAPQPGEAVAETSAPPESAPPEVAPEPPKEETPPVEAPPTEAPPPEPTPPEPTPPEAAPTEAPPAEEPPTEAPPPEAPPPDAE\n>SRR5690606_34130643\nXGLQHTPTGHRRSNRRRDRTDPLRLGVVERLIDRLARRCAPPDRLPARPERRPFDRHNPRPSQRHHEPLAQRHVITRRLQPSRPQPAIAVATVAAIALTRCALAYSNVLLTASTGVAPPSIASKIARSVAPLIASARDRADALTNPSVSASSX\n>ERR1719410_660988\nGSNLVKGVMPIWCGGSSRSRSRGNRQPHRRRSSSRRFSPPRGRGYSPPQRKDPPWRRSISRCRRRSSSRQSSLPRRSDGSRERSCSRKHSPRRPNRARSVSGGRNYSPRRVGGTKPDVPVPVDGEPAEFGKARVLKNPSTGRDETWKAEIDIETGEVNHVGRRRVMSIRGPSRTTKERAEEDARRLEAAVPQGPQAVRAVGNQLQKTKRGALGVLAELPGVHVLATYTDLPPLPALRSSGTCRRPIPCMLPDVKTIMDLRLRMGEVYMKDEAVLLRVATLRVTLGLAPEAAPC\n>SRR6266487_7083492\nWREDFARGTEVGVEVGIDRAVSQDRGGRLGAGRVDQRRSGMAIIRYHMVAVIGRDCEAQELIRRWLVADQGPGNLDLNEAAWQLAVGRADQLRSAAVATRRSGGAAVESRWVKITARRRGESCLNHIFPAGSAGYVGADAVRQRVDSAGGVIGIDRDHHLRRWIVRDSTDAIYLDQKIEVVAVAGDAERIQIGLAGDVYGTGDDSLVVEGVIEDELALIGGVEI\n>SRR5574344_1391919\nKLKPQHGALIFYVLFAAGAGLELLEEVIALVIHEDECREVFYGNLPDSFHTEFGILNALDALDGALRENSSNTADGAEIESSVLLASLSDTVATVTLGNHHERSAVCLELIHVGIHTVGSGRTHRTARIAFGSLGRSCIENRVILEVVGHTLTGIQASLELGMCDVASHDDSALEVDAGADGILRQFGTHGVDTLVEIDFDPLGTFARIAHFGRDKLCGVVVHLLKPYTVLVDLCLDVAVGRAAYTHTDGTACSVARQTDDTDVVGEILTAKLCSKSNLVSLFEQLLLKVDVAEGTTCLVACGGQX\n>ERR1700722_5898992\nVDLGAREHQVGGIERKTGQDAQRLEIGRRGNASQDGEEHQRNGAAKEPHIAAVTPRG
AEGARTVVTAPERGPAWIAHGRCKAQCAYPLRGPAECGRESSARGYLNAAPPPNKSPCNYGCDTAVPSLRTCSGMGKNVLTGPAREVEAGPIGQEAETGGGKLGAPLARQHEVKLVLEGVQKQHIGGRIGDLSIGQLGRTPIGXX\n>ETNmetMinimDraft_35_1059890.scaffolds.fasta_scaffold1061826_1\nMRSLRIDAGMRGFCGVLALSVLLAGCGGVSDLAGSINPFSREKKLSGERQPVFDGADPATVATARPASVGPASGGQEWPSAGGGLANDPGNQAISVTGARVWRSNIGATGGGLTTDALRASARPVSAGGRIFIYKPNGDVVALSTNGGRQWVKNLRPEGERDVAPGGGVAVSGGRVYAATAYRQVAALDAGSGQVLWTADLSTPARGAPAVGQGHLVVVTQSNEVIALKLEDGSQAWSYQGIEEIGGILSAADPAIAGNQVVVPFSSGEIMSLDIKSGEPQWADGVTRGFRTQALSGLADVSASPVISGDTVYATGVAGRTVAASLKTGTRIWGTDLGSVHTPVVSGNALFMVDLEDRMVALDRKTGETLWSTVLPRPEKKKRRRNWAGPILASGALVAFSSDGRFAAVDAASGQIILTKDVNTKVYVTPIVAGGRVIVLDGDRAVAAFNX\n>SRR2546427_1622280\nPAFSRCHEIMVPPIFVTDSPETSAGARKEPASLGAQSRASPTPSPSASVEHASPMPSPFASACVGLGQVGQLSSTSAKPSPSVSRRTREQGDPLGREAPLDWLPRPDSPQRFLDETRX\n>SRR4051812_6966754\nSLRPRRPTKEGCSMSLRRRAVTTAFAALAVAGLTAGCASTGSQAADSGGGDVHATPDAAYPKDLGWEPMDNSLTNLACTDNSYANAVKKGIKLGIYSAAPYEYMDNGKPAGLDWDVNMAVLKYLGIKKYTTVTLQWDAMIPALKSNRID\n>SRR5262249_18224374\nTLAPLAVLIVASRSPALRLWQRRQVMELTGKQIAVTGATGFLGRYIVDALLKRGARVIGVVRNPDRVPALAQRGVEFRKADLTQRDQLVKGFAGADAVVSNAALFSVRKMFALGSSVWDEHERTNIAGTRNVFEAVTAAGVKRVVHVSSVAVYG\n>ERR1719430_1578260\nGWSSPPGGTRGGWSCPPRSSPWSPWWPAGLKWFPGHFVISECLPEILSSSPSVLSYYRSPWDFHRKRRVAIQHLIQDHTQGPPVAPGVVPTLGEHLGGDVVRGTHSGVSQLASSSLPTLSLPLGLRWVGCQVERLSLRIVFVEFCSMSFLESSAKTKVGQLDVSAGIKKDIVRLNIPVYEAKLVYX\n>ERR1712156_240685\nLNLMKQAAGKFTFQIFLFKPQSRILKRSLVSLERSNRSPFQKFTVLEGQRGLLLFVLLLKNKEKLPLKDSMVLLLKEESLEFELTKDVLSVLNKTLLIVVVAVADHKNKDLNSQNQLKDVPRFTSGIFRGSLMKRSWNNYFRSLVQSRTHEL\n>SRR5581483_5340204\nVRVFVVKQRVAARRVARGLPGVGEARLDVGEFLAMLGRVAAVAVTATQVERLLVVRVVLVLVTREAAGALHGRRLRVLAQQVEDRLADDDRFLAPAWRDPRPAAAQHQANDDRRGHPEQDGKAREKLRLDRHEGRQGTLRAGFGAAHPWRSRCFVAGRVFSVNGKPRPPRRRADRAELACFPRLPNLPSGHYPSCRIPWASCPCTQGETPMFPHLARARSRRRPFSWKPRLEVLEDRRTPSGIAKVQDLGTKADTTMAQSVSINVPAQGVAKGDTILVTVATTEADPTQGVSVTDGAGNLYHRDADVLKSNERLLVFSAPVYHALSGGGSITFTQSGMAGSPTALSATEFSGLLLHDKSAKATGIGTTASSGPTPITSEANELLFGAIAANAFNVNNPPPSTMITAGQAYTGLPQKTVVDSVERTDLKPEFAVVAATGAYT
ADGTIAANREFLAALTTYRQVPPLSAVAVTATVGPHTKDNRILVLAGNTDPSGGTLSVQSVSHPAHGTASX\n>ERR1719323_1321519\nGKCGNLEGVRVLLVLVHGFGVNGLGLLWPRGNRRGRRLRLVILGRRQRRHGGRGGGRAGSPDRGDGRQRGSVVRLLLQLLLLERVVVMVVGRGCLLLRVDVLLLLGVRGRRRRRRRPRPAAHGRGERRGQRRGRDRVGWSRRRVCRGGLRHK\n>SRR5690606_29123364\nLEGVPARATIRAEYTKMKQERYTFLTAELAQQVRDLIAFKHRERNLACRNSKDGTYYIAKLKPKVRPNDLLFAIYRRDETAKMAPKVQSLYNMYNVKLNALLDTMGLDAKEDDARRRRITEYSLRRYVKSAISNAX\n>SRR6516165_751239\nXMRFSTIIVLLLFASMGWGQAQVNEKLETAFIYVDVNTGSDSNPGTASQPLKTIGAATSKALSNNHQGVGSRVIINPGTYRESISMGKNVRSTSLPMTFEAATSGTVFVSGADVWTGWTPYSGNPSIYTQSWPFQWGLCQTVTGSPNNLEDIVLRREMIIVNGTSLTEVLALTAMRPGTFFPDEANATVYLWPPSGTDMSTATVEVATRPVLFSDQGQSGVVLRGLTFQYANSCREKVAVGFNSASNVLIDKDNFFWNNADGLGMFYSQNFTVQSSVGNHNGEHGLDTAFVKYGVWQSDRASYNNWRGAQGAFYLWDTGKFLYNHNNTFNDHRALFNQGPGVWFDTDAADTTLTGLIAVGNMMNGIFVEKSEGPVTLSNSYVCGNNPQGWAPYGGVGLRNSSSVSLIGNTVFGNGFSQISIVGEAGGILVTNWETGQVYNLQTENLALSQDIVVGGPTAQVFSDGTLGGEDWNVFASTLSSDYNSWWAGPNTQAFTVPSPSFENLDLSGWQNMTAQDTNSSWTSSTSPAACNVQSQGRDYWLVADLIVPVTVSPAGVAAYNLTTMPLGGMTGTVNLSLDGLSGIPGVTASFAPSSVSTSGASVLTLTTSPSTPAGTYPFTVIGTSGSITRTVTIPLVVPTTSVRLSTTSLSFATQTLGTTSSAQAVTLTNTGTLPLAMSGISVNGSFAETDTCGASVAAGASCAISVTFSPQWLGTATGTLTLNDADPTSPQLVSLTGTGQGALVTWAPTSLTFAGQAVNTTSPAQALTLSNTGNAAMTITSIATNGDFAESNNCGSRLAAGASCSVRITFTPQRVGTRNGSVTIVTNATLNPGVGLTGTGLGPLVTWSPTSLTFAGQTVKTTSPARPVTLSNTGNTAMTIASITANGDFAQSNNCGSRLAAGASCSVQITFTPQWAGTRNGNVTIVTNATSNPGVGLTGTGLGPLVTWTPTSLTFAGQAVKTTSPAKPLTLSNTGNATMTITSITANGDFAQSNNCGSSLAAGASCSVQITFTPQWVGTRNGNVTIVTNATLNPGVG\n>SRR4028118_1117479\nFNDPATTEIYTLSLHDALPISHVASTKGSIQSRPVAIACPSLVLKLSASEDRKSGSAGMPRPISYAAFCLHKTTHLRAHRLHHAPSNLAQALTCARPRLSADASSRALRPGHDRWLCVVFFLMMRRPPRSTLFPYTTLFRSDRGRASRRRSGRWGRRSAGRRGAX\n>SRR5690348_14199435\nAIVSRLVERGNTDRFAIDLCRRPDLVRPADIAWLGSKAQRASEPARALWLDLLDWVFYPLMASSARALLDAAAVNPIVHERFADWLDPVEFGSAREVTHRDRYENATRSEAPERPLGPSPRTIVRRFLRRFESGDVDAYWHLQRALQAEAATGRSHLSEMDLC\n>SRR5215217_5590548\nQADTFPPRITLTESPPANATLTSNPTIRGVVVDNPPPGVQLTVKVDGAAPVNVPLDATGQFQFTSNFTTDGGHTLEFQARDPAANLSAPKIVTFTLQTGALTVDLAAASDTGVQGNRTTTLNSVTLTGKGPANQTI
TLVPTGTTTTADANGNYS\n>SRR5262249_54389218\nPALGARQRDHGAVPDTERKWDDDRSGDAFGGERVLWVADYPAARWLGGRRLARQTIVICRTSKRRQFPESPVAVAHWPADTTEESPQEPALAPRVLIADDQPDVLEALRLLLKGEGYQIDSAGSPAAILDAVDAEEFDVALVDLNYTRDTTSGQEGLDLL\n>SRR5262245_362740\nAVGLPAIGMLKQALESGDPEIARQSELILKKVEKVPSEALAAAVARMLGRTKPDGALDTILAQLPVADDEQVADALRGALAQLAAKDGKPEPKLIAALSDREPARRGAAAEALIKSKLTAVEADVRKLLKDSDPGVRLRVALGLVRVWRAKDAVPTLIELLATGPANRVWLADEVLRHLAGEDAPAVSPFGTAAERARAREAWTTWWKTNGERVDLARLDKEPPHLGYTLVLKMNRNTGLGEAVELAPDGKTVRWRISGLQYPTDAQVLPNLNHVLVAEHESGAVNERDLNGKVVRTWPVSMPIACQRLPDGNTLVAHRGGLIEFNAKDEKIFAYDRNSHDIVAARKDRDGTYVFLTRNGLCERIDAKGKSVKAFNGGRTYSYASLELLPNNRVLVSQLTGVAEYDLATGKLEWSATAKRNVTSATRLPNGNTLMSSITSNSILELDRDGKVVKETRMDDGS\n>ERR1719242_22332\nSHSHFSTEHTAFNQYNQAPSSPTQNYSTHSSLPCPLSATIHVIVQYKKTKCHTLSTVTPILKEGFAEQNGGTKFIVVPLGDPHWSKRLQRRQQRSSNPGDIVPLQWRIHFDLGLGLTHFVLQFRHQSASKVLGVGGPSREHNLFIQIPSQIQIALIDAVKDTVLNAAIFRTDNGGIEQDLRCSIPGTSNTQFRTVRQLIFRCISQSTTNATRCTIPQIEVVHNIRVIRIVFGIVISTRCCTTSTTAGCSQGTDTRGSTTSHDLX\n>ERR1719359_2831734\nAQHKNLGKGVGVRNDPVFKVSNQDMLKQMDSHDFSGEGSRTQAATGIVDLMKIIKEDLQSDMKKADKIEGDAQAEYDQYKKESDKMLDDLKDKIDDYQSQKADRNTDIDDTEDAKQDEESDLADYNQAMNVLMGKGADDIPFPCEFMLREFHNRRHRREAEVEGLHE\n>SRR5437773_2584272\nPESDAKPFQHAGLSGCRGGSFLFDSRRTEGFEVDVLFRNAPLRQAVSDPAHHRPRATQEIVIVTRRQHLLENINGEPAGVLIISPQDIGFLGPAIADVHVNVVMLSRHLLNVGLLNMVGSTSRSEEHTSELQSHHDIVCRLTPRLTLFPYTTLFRSQEIVIVTRRQHLLENINGEPAGVLIISPQDIGFLGPAIADVHVNVVMLSRHLLNVGLLNMVGSTSRAVEEPYFPPX\n>SRR4029453_10054290\nTFDKDTGHPQHGTSPITRTTGELSLATNVVIQGPGASALTITRDGSGATFRIFHNQANVTSTISGVTVTGGNVPASGAFYGGEGGGILNDEGTLTLQSVVVTGNFAAHDGSGVLNGTVNGGAHATMTILDSTISGNGSVFTNAGGAIFNHPARGNIGVTATDTTISGNTAFGHGGGIQNRNDDEGTGHTAQVTLTNCTITANQANAGGGGINNLDTVSLRNTIVAGNTTGG\n>SRR5579859_1338868\nEVILAGLNDSGVLAGWYMNDVTAAAIFELVNGRFQTVSLPVPDVISASVSGLNNEGQLVGSYETSTSGHGFILSGRHLRTLDLPPNWGGTGLTPGRINDEGVVIGTYEIESDFVTVHSVVWTDGVFRKIDFPGAAATIASYLNNRGEIVGTYSTSPAGGIANTHPFLLKDGVYSDLSSLFPGTFAIVGINNRGQ\n>SRR3990172_9676722\nLLFIDEGTEMFQFPWFASRPYGFRPGWPDTTPAGFPHSGIPGSTPVCGFPGLIAAYHALHRLLVPRHPPYALSSLTPLPSGRCGQRPEP
PLAPSRRGQCPGSPPTLFTCQRTRGISPPEPSCPHSPGSPGGDERSRTADPLLAKQVLSRLSYIPTESPAGTAVPFWDRPPPAGGGPFW\n>SRR5580692_1321847\nDLGLAWSYYDLAQKMTQKSLSANVSLLYFSESQKINAALERIPKSYAQGHIEERNGHKSFVDSSGTVVGQERWPGTLMSEKVRRKQAEYNTWLETRAKETSLSNIRLVPQYPRQFLVVGANGALSADHAEIAEIRVPRHIELTGVLDLDTLAIGYYKSAIEWAELCKAAGANNQGLTRPTKEEDFKE\n>SRR5262249_47273405\nXVQIHVLLAVDGNHPGAGVFVLGDDANPPPDVVRPGRAGSVGGDQAVPAHTVRVALEQRERHGATGAGAPGPVGAGLAARGSAAVGAGTAERIRAACGSVVDEPVAVLVLPVANLDPLGRVVGHAPEVRPGGSAVLVSGRSHRIGAGCCIGGSRQRNTHPIAVLDASTSIGQLAGLSSLGPVAVRRAATVTGDRAAASVGEGAPGSGTRATGRRVAAPETAVQVAGLRTRGAAGSEAPAVAGRIQLALAPDGGGVAHAGAGALVQQRATCTAX\n>SRR5438093_5564102\nSHIPDAVKILCDTRIVDHARTGEVNITNVRLAYHKRIGARAWVKDYTIECELAGDGNVSDVRNIKGRDICVFVRHRFGCPVSGCVPIIVGRIQLPSRAPSVSGGERQQTGYEETEGSFHTTVISTANAA\n>SRR5919201_5360144\nFRWFAASAETVVQPSSPTYWRSSAQIGQTRGGGPGGPAWFPQVRQTGASAVASSATAAEPFAKRRQVVVEIGRGLVAVVGLLGERLQDGVLELRIELPPHSRRRSRLSPDMLGEERKGTLLLGRLERRLAAEDLVAQDPCAVDVGAAVDGPVHNLLRRHVLRGSDHRATTVARRGRALVRGARDPEVGHFDVPGVGDHDVLRLDVAVDNALAVRTVERREHTVHPSER\n>SRR4029077_8001983\nRDSSQVQEVSRRNPGTSACTALRAARKLRATRPWMPRTLLERSGGGSGTQRDKTRRHAESWCRSFPLHDGFFLESTLGAGVSLQHAAELPVWPAAGHAPTKLEASRTTLALGIGVGLQLALQRGVLIHEFVELQLHFCQLEHQVRDQLLELRVPAPLTDDSQAGCEGYGTRNPRKQIAHTDSIGRVAGSPRLFAVSLRRASHRVRKFGGPTHIRARGGSRPPPPHR\n>SRR6266508_4076808\nWLAFAVIAVTLLVQGLTLSKVVRALKVPRDDPTQDLLAEASVQSQASQAALTRLAAEGDGAPPDVVQRLREHAEKRTNHAWERLGSQVRETPAHAYRRLRRSMLEAERDVFRQARDAGRIPEEIMAQAQRALDLEESILTRECPSMSLPVGCEDLAAAPADIEPTSKRCVDCEAIGRVGWVHLRQCLAGGRV\n>SRR6266404_7425182\nGIVRRHEVILGSPCPVPRGLEQKRQLRSYRPALFPVTTEQRLRYRRAQLSPSRWPERSVQRVLIKHVDEPITQRQHMSGKLPFTDEPNQRIDSLQRLEALFNIRRIQLESFRHDSRIELISLHARSNQQAPIFVAQLRDLALNHPAQ\n>A0A1G9LFL1_9RHOB\nMRSECVECHDGPVHCTAIKKTIEYRGNDALMRNILNAAILASFGGILLATTALADWTYSGPPYPNATIQTNDMSLEVQCDRIRFAPAGYEDSQDIVRKNGLSFRFLVNGSQEVASFQMGRENSFVQIVDNYPVEIQLSDEADYAFVLDQIAANATLNLSMVDQDVSYGIFDLKGSGAAIQSLRAECRALDQTSAPLEAPEGVVYCGGGGIKRQIEFEILDDASDEWDARVTVNGETQRAMTAYSYFGNSEPVKDFVVALLAEDRSEFLIFRNRMENWLEFGDYRYDQCN\n>SRR6218665_3367076\nXMKLSMCSKCPPLTCTHAFRRLVKSFTALLIGSC
GMSSHINCKEAFSPVIVFGFGCSYDTFPAWPPHVIVKGVEIWGIWWPTVLHNDLRTVCVQLLLRDTCRVCWSAILLENEPGWHQLFAVLDKLNFHSLYGYARTIAFAPHPCSRSVCIRILSACDTFPILTALTKYWLLTAILPKHRVLYLHIRLSDEFAWLQLGCKVIKRGILSVQIAX\n>SRR5258705_1672816\nXMFGWEVDGQRSLMRRFFHIWSFVFHKFISVVTMYRCAKGVRRRTSCLADPGDAGRRVVGEAAGEALAGARAAAGAAAARRNKQVMPEVLGKWVENRMGVAEGVHGAGQVMVKALDGFSDRVSGFLGGVTSPPRIVFLVLVNRLQFALDLGLDRPELGFVVEDGFQLLLLAPERPGGP\n>SRR6266850_6431312\nCAWTCRAWGAARSRSCSIATTARRAPMRATRLWRPRWWCAARAGPGPTTRAATAPPGTGTLHRRSRAARLRLGTLRAVALAFALALALIPTAPARWCAADGRPEALSRGEIAFLDTLEQRTFRWFWELSDPRTGLTPDRAPTRSFSSVSAIGFALTAYPIGVDRTWVTRGEARERVGRTLEFLWAARQDTSRAGATGLRGFYYHFLDPASGTRFENVELSTMDTALLLAGVLFCQSYFDRRNPGETHIRALAESLYARVDWTWAQVRPPTISHGWTPEQGFLPYDWRGYNEAMVLYVMALGSTTHPVGADAWNAWTGGYRWGAFHGEPHVGFAPMFGHQYTQVWLDLRGIRDAWMRARGIDYFENSRRATLAQRAYAIANPDGWRGYGPALWGLSACDGPLDGTVSIAGRARSRRIRPTPTRTTRSATPIRRGATIATRWRCSSARCRWNATRTSSG\n>SRR6266545_636481\nEWAEGAGGVGLVGPGSGDGLGQVEFGGGGGDAAVVGLGGGQADGGDFGLGEHDPGDAGVVGAVGFAEDGVGDDPGLVLGDMGEQGVAGDEVTDPRLFPVQQPGAALDDGDLGAHAGQKLAQLDADRAAADHHHPAWDVAQGGGFPVGPHRHLVQAVDRRTYRVGAGCNDDVGCGELLPGDLYPPRATAGQPGGAFDHGGALFLVAGDLVGVVEVADHVVAVVAQPRPVQVRGGQAGGVAGLGARLDRAQQGLGRDARPVGAFPADQLPLDQRHPQPAGKQPGGGDLAAGTGANHDRVEVGAHRFYLRLLVGWGWGRRWRSAHAASVTAATASPX\n>SRR4051794_24386335\nMLSSSACEVRCWSTRATGLARGAAGGPEPYATLPASMPETRVSGAPRLDLSPYPLASHLGRIFAGRGFPLHLVGGSVRSLLLGLPAGDLDFTTPARPADITQLIRQAGGHPVPIGERFGTMAGVFAGHVTVEITTYR\n>ERR1719330_1029551\nLLQALIVTTWPDADGPRIPAAGSEPKRNRLHSILPSPSSGIQPRLHEPPCEHRSIAGANHTRRAGTRCRPWLPSALCLVQSCLTRALATQPRYLPYWNSSLPEHWNPMFASLLNLSSAVRSLLEHPSLLWLLLSSPFPGPCSTSRASQSHLSSPRIWSRMRPMLQGVPPEQLCAHETRSLPALQFLFLQYLRGQQWRRVRPGCPNSYRLDLPQKVLPSAEPCTTSDYRICSACFWQMQALLWPLCQMPSRPCTRRSDPCAEPSLQSSDLLPKRCNGLFGLRDGSFLACYTALKRLLVLIVVLFGFQNSHHVVNHLNDLVEASPGDILLTGQCQHQQFQPRFVLHGCSLHG\n>SRR6188472_3631345\nRRLLREKQFLGRRFRDSRGLARRLRGKLGGRRLPSRSDRDRAGRLVERSRRARVSPAPAIEAAVLGKKLVDALATRNPDKAVAPRLLPSAELSLSQERPNRLRRCSKRPRGFGHSEVVGHFGKMLAQPAWPSETFX\n>SRR5262249_43660061\nXEIIDAVVGSDVRDWRVVEGDHALGSEADDGEGGRSYHSLAVYRAEPAVSLVWGLTENPNFREIEWA
NNFADPSAKSAWFDIRYNGVPVLRELLVVVDGGRCYLPMPSRHGETRSVPSAYSRVVRLMQKLKGRHEYDDYFARAGLIETGDEWPTT\n>R8G6Q3_BACCE\nMLPEDILIVDNFYSNPDAVRKLALEINYQEFGEMQNFPGFESEKSFSSTSIKERFQKLIKNEIIISPREYIFGKFRYSTENDYAHTEVHLDHDVDWTGIVYLTKDEDCQGGLSIYHHKKLGLDSAPVQSELQDFNCKNIAEFDSKYIYPYTKLAENWNLLYYIPIKFNRLILFRGSKYFHGITEQFGNSIYNSRLTQNFFFKEKVKKGVGL\n>SRR4029079_2700613\nCQARAAAPTMYRPGQVRTTRSECGQAASSLSLDVITAQALAQERAHARVRRLAGGRIGADMDALPRMHAVGDIEPLHDGSRRRIERLITARIRRHEELAPAARHRRAERDAGGSRRPVVELADMNAPR\n>SRR5579875_498642\nXMGGGPGSGSVLQAHGGDDRRDRGDAAADGPSAGRDWQAHAAPSCSRARRAGSCRAAWRAARVIAAGLNVKTRKNPVNTRCERVREVCPPGYCRVMGRGEPVRGSGRPSGRRGGAGDRGGAGSARKGDRMRGMALAAALAGAALLGVAGCGAAPAPQGSRPAVSPSPAGHRAGPPSCVTPGTAGRARTFTITEKDNGRSYCVTSGTRLLVFLHGTLARKWGPIQASSPALRRRPSPVMMLAIGVTGGYFVAASLGTATLTSVRGSCPPGASHCRDRQVFRVSVLVRGTMX\n>SRR5215472_4865484\nSANGRSVAPLIPLPEAAQARIKAREAQAAAELEILYRACESDLSNARRNPAGYGTRHGRLDLVTEQVRQTMREAQSVGAQYIFNVHAVEYRAVTPDPVELKAVLEQLRETIIIHYGEHCRTVVQVMETREFEEAWKQKPAVDSAAPIERRGEAVGSSDYPHPLRRGDGSNHQAIPAVRRSPASRGRQVKSESGHRRLDPVVQRIKAKVREYKKANLTFKEMCERLGNSERPPRATWTHLPWPKAYEKHTSAVSKWLSEA\n>ERR1700722_18781964\nXMSWSSDIRCLYCDGKLPLYRKLTSGQFCSAGHRKLYWQEQERLGVERLHETHDSLRAFRPKEAVEALLGYPPSYPMPEPARAHGVPIQAELPPVAANPIEATPVADSYPGSYLNDADLSPQTPLWAPQEISEPDHGVEPPAPMGGFIVVHAMMPQPRWPLDRLVIPEPNPLATTGPVWIPLRTMAALIRDVLGAGAAAMPMAPRPYEGTRRLEPVHPAMLPCLDVSHSATPAGNALAAEEDAPRAEKLLALAAFAAHEPAPDGTRRDPWPAAPFSKVHKAHLPPATMERNVRLTIAAPPQAGLRSLAIDQVPLVHGTWIDSLRALKSEGELPRYELSTPAMRPRLRLATGSRYPVATRDQNPGVATVEPQNLQPSATAVAIPERAMAAAASCSAQNVPDAAGLIPLLAAVKPNEPAAQLAPSTQSLNLPQPLLTEPMRPASHLEPLDAKPVMDFMAPTPQIPSQIIKMAADEPKKDSPAMENAAALPPSESGDVTPWTVVAGFWQHAPRDLKLLVFGIPILLALALHPSLKKIPYAAPLKAGGIERNLEHNFQSKLKDQWVTVKQTMVDRGAIALA\n>SRR5947209_11779987\nPPRRPAPASPPRSRPRSGRRSGGRPRPPARPSPGPARTPRRPAAAPPARPRPPRWPARPWTRPGAGPPTWAAPSRPPPRTRSTGPPGWPPAAPPASGRRRPAAAGRRAGSARTGSAGSGSRPARPPAPRPGSRPASAASAGTSPTGRSPGRPGWSRRTPFFPPRQGGLDRLGRDRQHPVAGLELGSPEQFGVALGGQHIGQAAQVGLTGRRQRGEDAVGLGALLGGQFRSAHGSAPANEFRRPTHTPRPAAKNPPTSETHTPPGIATWELIAPPLRRGYNG\n>SRR4051812_12632978\nGRRSTARAG
RSPAGTARRGTGWGPAGGSGRGSARSCRSPAAARRRPRPAGRHCGRPWRTLPRPSPRDGSRTAGESPCRLLPPASSTRGSGRPACTPATTPPLAGTVDRGREPGQTHVAGGCSGVPASYRARSGPSAVVRVTLDRPPRPATAGLGRLVAVGYPERASGASGGIGRRARFRSVCPKGRGGSTPPSRTRRRAPDPGTPRAGASSSARTAGQEAVSTVRPPRRPRAPSADDPGARDGVAGHASIYYSAGPDGCHAARHRDSRLAGPLCHKRTQIRTWRPSTGGGPPRPVTSAGSTESATPKPGVRPSRQESAPFERESAPTQRVLYRGTMDVGPCSPLRSDPRGPGRQTYQRASRTRCVTTATSHATETSPARATGPAISLRGLVKRFDDVRAVDGVDLDIARGEFFSMLGPSGSGKTTVLRLIGGFERPTSGTVELDGSDVTALAPFERNLTTVFQDYALFPHMNVLDNVAYGLRVRGVGRTERHDRAAEALATVALHGMEKRRPAQLSGGQRQRVALAPPGRPAAGGAPPRGLGRRPGRAAARRAARSARPEAARAHAGRAQADPARRRDHLRLRHPRPGGGADHERPGRGLRPRPDPAGGDPREIYERPASRFVAGFVGTSNLLSAQAAQELLGRAGTFTVRPEKVRMAAADALGDDRHVVAEGTVAEVVYAGPVTRYLVDLDVGERLTAVLQN\n>SRR5207247_1084271\nDDSKCSLAQQKGEHCVSMPPAWSEWIVQVLPISDGRSTAFSNPTQGVGGSFILSLQRDSRARPKSHQRSWWIVHTQPTKRLARPSRIPPTALVGLSGLPDGRPLGLFQQPARAQAKVRSW\n>ERR1719350_1727719\nGKPPSRRQRLFDMVVSPAFQGFFAVLIATDSVVLGVETEYVSRHRDDDRNPGFFAIRQIFAFLFFVELALKAVALRVRFFADPALRNWNVFDTLLVTNSIVELFIDGALGGDQVSELRLLRIIRTVRIFRVFRFVRMFPALKLLVNSILATLQSLLWTIFLLLVFLYLFGIVFTQVATNHFEKVGEVDE\n>SRR3954447_23639997\nYRDVVGLWVAVGTCQYDGGGNAEVEHGDDRDGRADRARNVPAGVGELPDEVRDGLPPGEREEQDDDTSADRGDAMRGERGQALQRHEWCGGGDREDQRRGHPAGESELNATADTQAEKVRADGRGEDRGGYRVGAPGPDLQRLGDVVAASERDD\n>SRR5688500_19711690\nRPLSPPSPLSLHDALPISLGGAEQRDLPAPDQRQRGQCRAHGREDATQPGHGAVTAPRCRTVAAWHAERVVGRRTVLTGAALLRSEEHTSELQSPCNLVCS\n>SRR5512143_883754\nLERIFFHDVLGAANAVQGLARLVAGDDAERAKSAAQSLVRATDQLLEEIQAQRDLMLAERGALTIREDETAVSDILEAVRQQYQWSPLAEGRELVVETAVANKRLRVDRTQLIRSLGNLVRNALEATADGQRVTVSTQPLAEGVLFQVTNPGAIAAPLQR\n>SRR5579863_223257\nALDWEGVVLVVIGESESELVHQRGSDRVVIRGHHAASLFVRAVAGQKVARRRYRPRVVELGIERILEAVAHVNLLLGIEVVVDSNIEAVRVRWDGRERLVVIGRVCYTQVRVRHWIVLQQCGRYGIDAGRARSGWNGVVRERRTGKWVEQGSGSNRLHQVIQVAGSFGCRGHQKFFGIGLCFAVALVVGEDEGLVAPVIEPWDCDRASYASTEGVKGAGRLYVEVEHGGVESAVLEVFERTALPSIGPALCDEGYVADLRELRIVIECGDLHFIDALKRWIRICEX\n>SRR6266404_1434125\nXMRVLVSHEAVSVSPLISSSLFVSLIVFATSDLVLACPASCWFPLTRLRARGVFLQDRKSTGIEVVDNPAYHLWWECTRLIDSLSRCQKFPASRHRVVLRYCHRAITFIHKSAHLQX\n>SRR4051794_2068
2467\nVGRGGLPRAAVVGKRTLTLDMPAATRWHVRHERAHLPVAPRRPVLGRPDRAGRRRRPAVLRGRPRLDVRRRRAGVRRLRDRAGGRGSGGRHRPAAAGDCDRLDALLRQRRRRGDREAVTDSGGTLLLPRGDVGPLGRLCVAADPTGAVFGVWQAGQHIGAGHVNAPGGLTWEDLRSPDPATAQAFYTAVFGHVVDPMPEAAPDYGLFHLPHEQAPLGGMGPIFGRDDASAHWLVYFGVADTAGAVEAAQNAGGSVTNPLFESPYGRMAGLADPAGGRFWVVETDGSCQPDRSDX\n>SRR4051794_34313143\nPVADFAHVAPSSEPVAQPEERVAVLLGDRLAELDAVLLLDLLEPVLVTELQEKTVGEVDAHARAEEPARARLPGDRAVGERAVQHREVSALGVKDAVVKLELRAQARVRLRVALLVVLEKGPDAPPRTEVIEVRLGEQRR\n>SRR5450759_4329672\nCVEETGRDVQLRALLPCYEVAVAIFDHAFHGDRFTTDREIELRAEGGRAERHTEGDVRLEVVARGVLARRPVWRGDVGVRGNLRRHLARDGLRQRPRTVGELTIETGQHDGAKLRWLDGAGHRVYGHVHGLSGGHDTVVGQGIETRAARDDERLLELALLLGETKIDFGPDRRRHRRDVAAGFARAATNPDGKMHIRARRHTQQA\n>SRR6185295_8040175\nRFSPGSGRSRPSSLSLPVLDDSVKSTPTPSGQPEHESSSIKAAVVSTAPSKRGFLVGGLGLVALALAVVIAVRPGGAPASPGPAVRAAEAVGMVSITSEPPEAMLSWNGRVLGKTPLKADLPPGTQSMVVSRPGFFDETLVITVPPAGTVERSVTLRRREDPAPLTAX\n>ERR1719401_1546905\nKLLPLLAARQTATGTGDELRFALLQAKSRTHPRTRRAQITALKRPGTRPPAKLTSSPSTHVLVSLASLHSRPDLHVVASVLPSQVAPLSAVPVLFVAAPVTKNRQDRTSAIIFSIFSMANELERQCAGLVVRX\n>SRR5207248_7680326\nGPIPRAQPRCPAYPAGRHCREPSTVCLLECSAGPRDLHSFPTRRSSDLPGTYFGTAGSALIRAAALWDDLEAAGVPGIKGVWKIDRKSTRLNSSHRTSSYAVLCFIKKRVPDNACLVEARLPGRQNVAGHT\n>ERR1039458_7977961\nVLISGPTGVSQADLSSPLLPWILPCGPVFFFNDPATTEIYTLSLHDALSISNKLFVESPATRRFLSPSNCSRTDRKSTRLNSSHLGISYAVFCLKKKPTVLLVALGYGLASLYYLDHFDKLSVLIKRQFSCIRVSIVVSVLTLSNFFFNDTATTEIYTLSLHDALPIWKRRACRCLRHLSCFWCSPCGPRDRKSTRLNSSHLGISYAVFCLKKKX\n>ERR1700760_2163761\nSPHPTAPIGDVVPSTPPANALGKPRTSAVWKTATTAGGAGARTARSRRWWYVSRRGLLSPAKFERRPSVGRFVLGDDVRGNPAALIHLVAVRPRPLADSGTLLAAGAVALTAAANLSATRFACVIHVLSKLGAELARVAGTQIDLIGQAIETKADGLSCLTAVDVIDQX\n>SRR6185437_11610463\nQDRRVWQRLQLLLHGQDHWAGSRAPVLRSAPRHRGPSAMRPTPRPISATRRRSQRVRRIARLLAAGLALAALVAGAATAEATSTGQLQQKISSGRAHISSLSGAVSAANRKVRQLDASVTATSNRLDAVQRDLDAKRAQLLSLRAQLNAAQARLKRLQATEAADEQVLATQLVGSYEGQRPDIVTVVLEARGFNDLLERLDFAQRIGHHNAQIVGAVKSARRAVAAEAIRLGVLSARQQRLTEEVLTERDNVASLRISLLSQRLGAARARDTTAGRLSSAKAQVASLTTQLNRLQAAQRAAAQRAANAGSSPAASTGSRRSSSSSGPPPSAPPSRGFPFPMPTGAVSPPD\n>
SRR5260221_13052907\nSLQPTRARATRTCWACSTSCSATASGRSACSPVRREARDWRAPCHPFAHADIARTGPSVVQKSERPRAPRQVTGKWLALILALLVQAAFVAVLVVSVRWQNRTPEPVTAELYAPAPRNPVAEAPPAPAPEPAPPPAPPPAPPKPVVATPSPKVDQPDTRAADIALRA\n>SRR5437868_12203378\nLVRRGVLGPGPTDAGIHYVVSLRFGLDPMLRVAPGFVVHFFFLMSRRPPSSTLFPYTTLFRSPHQSVYCFTGSLFYRVPCSRSRSEEHTSELQSRFDLVCRLLLEKKKQWRTMCPVGVRVRSGACVLILSVCASAPACGVVRTAL\n>ERR1740130_985408\nVVTKNHAAVLKMSTRHMQGTSDSRSDRKRKNAEVAREELQRQKQRLDFHRHKTRDLKARLKDIEKGTCKEYLAQCKTLDSTTQKEIRTIALLREAHMTSTSQLYSFDTMAARHGNRDSKDALKLQLRNTVIEELKEIDDLVKSESSFRRVSKRNLRSKSKTDDVPNGTNHAGTSCLDSFRLHFPLTMREVDEDLRIIADDWHKAALEFKKSQDMIPVTVTHGKLKYDDLVIERGANILVQSELTQTQTEGHVLSIRRNEIRIKCKNGKKWQVQVEHLRTGRVHLFPAGSAEX\n>_1\nFPEDIAHTAVRNLGVPFYMIEIADDPRYRAVVGIENTTASQWLAPPDLVSVPSNGEIPIDFCLDSTFPYTTNMTYTHLMWRFVEPTRQQDDFGPTEWITVPWEMSGFVDAGNSCELLDGSNGTVLQAQIPLPDSSVGKIHYKAMLGTTNGAFPFSYPTVEEGPNYYELSIPYRASFGSSVLALLMFSLIATMVWGGLGYTLKEMFNDERDVLGLPLKCVIWRKLKWKLRMKQAQMSLVEDX\n>SRR5262245_59441811\nSGIRVLERERLRQSTAAAWRHRISGGRSAHTHSDETPCGCHRGVLSAAGPVEGCRSVQGRASSADERRIRCHVEPERPEPYAGRVVGADADHRSAKMVCPTVREEVERLVRDPRVDVYAAVVRRSGVPLAVVIRIVICGEPEVRRLMWIVHVTECVAGDAWC\n>SRR5689334_15183997\nRLGDVVLDALLQRRERFVDDAEGVIAVGHRIDEHADREEVIDLLVRPLAGLHLFVDRPQMLRSTRDFEVLDAGARQRSFERLTHLANELFSLATLGRDLLGERFVPVALEVLEREILKLPPQLRHTKAMRERRVEIARLLGNATPLFGRQPLERPHVMEAVRELDDDDAGVFGDREQQLAVALDLPLFLRATGRQLGDLRETVDDRGNVFSELPLDVGDGNLGVFDDVVDQPAGDGNRVQLEVGQNLGDIHAMRDVRVARVAHLPAMGSLAEAIGAHEQVPVELVVERSLLLPPTRYDLANRRCRRHPFSNVFSGIPSAIPTGRWGFGTLPSACSARLPSWDKQGPTTTDGPRSSTANIRGS\n>SRR5437773_4994510\nTIKIGNGTGCAVTFLRKEDGMPLRRTLELTDSQRQDLVHYRDHDPRPYVRERCAALLKIADGQSPHAVARHGLLKRRDPDTLYDWLNWYERLVSAVSGCFSTAGNIGSVFDRSDELVERLQHAPGEQARQELAPTADGPPPSRWTLRGVREIGRAHVX\n>SRR5512137_1013993\nLWHTLSAATVRMTALATRVLYQRGGGSWRERLLDQLAWPREAARSRFSGSVSSRRIVEGVGFDMEEVRRIRKWVSGATTNDVFMATVGGALRSYLQLCGDPLPPGLAAAVPVGHHDTLPGGEPGNKLNQHRVSLHIDCESGLARLRALRQASEDA\n>SRR6267143_4187927\nLGEALRADARRLAAVDLAYGRDHPVGCPVDVLGEDAARVIELRGNLSAVVWSSGRATSRSKDGRRVLRADDRVRVTKIDERDRTRIRLDVVKRVHQSDLVGARGLQRLVLPVPLLNRDEGDVIARVV
RVPEGERRRVREAFGQGGRLHILQPSEVSK\n>SRR5215211_5171990\nPPWRRALPSRSPSRLLGWRNSPSLGRAPSPADGHSSSRPKLLLVLLAPMLPHRGYGPFIAEQTLGPGAGRLAAEQPHGEVSARNEQLVEGLAHVPVGNDELSPLLRGEERCPAQQLLDKGSAHASGAGYYGVEVFEFEVEALAVERDQAPPAARVGERYLRGLVYAAGSRGERRLEQVWTVGSEHEDDVCVLGEAIHLVQX\n>ERR1043166_75354\nYRLLLGSDPAEPLLNEAHGFRFEADTEIKGQPVYVLRWQQDARSFLNAMGLTNTPTSGRSFPVKAWVNTTNHLVLQLQSDLSNWAKEIMGKRPEFPVTGLLITESHSAIETAAIAASVRVFSTQLQEGVRTVERIELPPPNFAILAAPRRHFSKLIPARLSMASSNQIDLTDYYNGALIQAWHPGPPGNNLSALPNGLLQLGGVVFDVRGVVQLAGVDLLRAGGRFPQQISGIRIAQVCHELHFLQAAGWRSRDGTRIGTYLIHYADGRTQAIPVIYGEDVRDWNAAADPGPQLKRAVIAWGGINSEGRPVRLFKTTWDNPWPDTEIVSMDYVSAMAASAPFLVAITVE\n>SRR5689334_14209035\nIANNGIIATVSLIISTFIGAILYNISPGLPHTAMGVVHLVGFLLAFRLVEPKIKDAAKEKFTFKAYRQQLSNGFRHLMTPALWGFLPMMFGLLGITELMRASLVQPALAFNMGFGPEAQSGIFALQLFVAMFAANAMPFLRRRIGDWIGLVAMTLLLMVG\n>ERR1719265_2530241\nPTNTDPRCAGRVHAVRQPTLVVRVGSLDKEVVRLVQLFPQHVLVQVASVVIQETTVKIPVHVNGLATWSVIANVLAEILVSANRVACDVVVAAVVPTAETVVSRARRVQTTLSVALVFLDVHHHAGKRNLYLVQIHVA\n>SRR6266545_7407710\nASRRRHAAAVRAGDRDPAAGGEGAHVQADRRAVGDLDSYGAEPRPEHAGEAAAAQPYRAGPVRHRNRPRPGRLTSGVPMTVLAAPGATWGITGPQFLALYGGLILVSFARRGHQRPARCRQPRRPAGRAGRRPVAGAPLPDGFDPRTVRAAAAALLRKRASGSPPT\n>SRR6202166_3668028\nKDGPAAVAPAPAPPKPDMAGLDLPLPDPVRERPASNPGANASGLNLNKPGEKIPAGKAVPGPAAPRETFRRLVPDFAPLEEQRRPARAFMSENMMPDVRATFPVRKKVLGTAFLQALLRQWWPLLVAILLVVGALWLLLPHPARREAPSARVLPETPSTDAGTPARPLGLYVDSSGPVWRVSWNPGATAFRGARGVALFVRDGDDQNRIDLSPQDLQSGTYQYAAKNQEVTFRLEVTDDRGRLSAESFRLVKSVPVPPEKPTGESVRRTAEPPRPASTAKNLVHPRATHKVPPVVPAGIRPRIKSPIPVDILVHVDSHGRVTDAAPAVKQHAGLESYLAERAVTAAKQWRFDPARENGRAVPGTETIHFVFERXX\n>SRR5215217_2643638\nDDASPAVRGKVGPDVPAMQLDDLPADIEPQAESLGGIIRSSLEEALEDPVTCVGRDPDATITDRELDRAGRRQGESHDDRCSTGTVLEGVIEENGEYLLESQRIDPRFERCRHLQHDRVPVAPGSRAGDYLFQQRRQISWPPAAMSSGRPPAVRHPG\n>ERR1035438_2618940\nSSDLTDLSRQPHGTNAEVDLAFLEAKSWFVKTNQAKAERMLLSLLDAHPDDLILLNRAKGLFAAFASYTNALRITDRQLQHEPDNLQLLQEKGFLCLKAGQFSNAIPTFTRILSVTNSYPVLMSRALAYLQPRRWGEATKDYDRARQASPDSSEPYYGLSDVARHRGDPNTASQYYQQGVSNGLRVIEER\n>SRR5437762_5397717\nRAATGEKAPDARQLVAVDVQGDAHASGE
QAFAQHTLPYHPRSAEQKHLHNASTIARQTASIKEARYGVRLQATRWLGGGAGDRVARGVCRVFRVQRGRRARRRRRSADLGRRSGRRGPAGGPAGVLVRIWIWMASAVGIRVLPVLLYSVLAVRPAGAVLGRRVAPAPMLWLWRLLRSSADLRRLAPARPRAHDEGAGSIANRGATNRX\n>SRR5882762_3560359\nRAPGQIFFRLHDDCIYLGGDVAQIGSLHRTEDIERRRGVVVGHDRGRDTAVNVRHAREDLRRSARSVQRRVAEIIEILQAKLRRLRRDLVLSSALGIDPERGRRLETARQRYQHVGGNRLLGQTQQLRLAAIDIHVELRIVARLVDVQIDGARNGAEFLQQLVGKFTVAVHVEAGYLHVDGGGQPEVQYLADHIGGQERERGRRIGGGEFR\n>SRR4030081_1498409\nRRSLPATLSDLGVLERDEGNIDAARRHLEDAGAHERALVQADPAPHHRRSLPATLSDLGVLERDEGNIDAARRHLEDAGAHERALVQADPAPHHRRSLPATLSDLGVLERDEGNIDAARRHLEDAGAHERALVQADPAPHHRRSLPATLSDLGVLERDEGNIDAARRHLEDAGAHERALVQADPAPHHRRSLPATLSDLGVLERDEGNIDAARRHLEDAGAHERALVQADPAPHHRRSLPATLSDLGVLERDEGNIDAARRHLEDAGAHERALVQADPAPHHRRSLPATLSDLGVLERDEGNIDAARRHLEDAGAHERALVQADPAPHHRRSLPATLSDLGVLERDEGNIDAARRHLEDAGAHERALVQADPAPHHRRSLPATLSDLGVLERDEGNIDAARRHLEDAGAHERALVQADPAPHHRRSLPATLSDLGVLERDEGNIDAARRHLEDAGAHERALVQADPAPHHRRSLAITLSDLGVLERDEGNIDAARRHLEAARAHERALVQADPTPNHRRRLAITLSDLGVRERDEGNIDAARRHLEAALEHNQALVQAD\n>I1BUC6_RHIO9\nMLYSRLSPAKDRIFLQKILPACNTTSKLFLNQNKLFVIRLASTRSTLYNNQSKPDNVSLNGDAKKPKRRFVKVDSEFSKANKFTYVMPQDPYVASDRVTSILKNGSVDDAIEYIKALPLDLQSVVVWNHLIGYCAQQGKAKFAEQSYVQMRRRGIAPNDRTFTHMISVYSKSTTPNAVENAEEWLKKMKNFDIKPSIIHINNLLKVYNHAQQPSKTIKLLHEMPSRRIHPDAFTYSIALKACSELSEPGQAAKEIKQIWQNIVYRLEGEDHGDSLKIENLNLKIDDGLVISLLTAISRTLSKESDMIPGLEAIHRLYSLYPPRAAAVIEKHQLFNVNQQYGFGMQPSIKALDTILRFCGKTKQYALAIKSILDGCMTLSHKYIHDQKDQHKSKYNVWNQSGRGSTYATATKSRNDTTRGPIIAAAATNLTIAVSIIASANFRC\n>SRR3984893_10676208\nQLRRAYPKWRKAGRPAGAGSDPVRAGDKPQDCEGDRPRSAADAARACRRGDRITAAVRESVPGTKRRKPRRRVYVSFWGSSGSAWTDGLGCLRRKCRVGPGELHPEPLTDPDLTLSRHPARATARRLPPSVENWRLLLLPVGSLPTAMTCLLRSTSITPASSLLQGSPPLSGASVLSASRLEPLAPFPLPSPARFSRSVPEPDX\n>SRR6185369_3836006\nIGELLSSLRLQIVRIDIELAVAVRAKVDRVSHPHRVYVVGAALGLGKLLGGVVAKTIKPYRRVEAAAIMLPLGKRLRQRVVSQSRSVGRIGRLECVWQLERLFDAAFDRNGEQLGVASGEDSARRSEQHRRSIGCESLNYVRTRMPRQPRRHSAGNRHYIDVGVSFILGGKRDERSVRREPRAGLLAFVAG\n>ERR1719376_375132\nFYPGMVNTDKMKKTSLTYTITPEQMKAEDRIFEQQIEKERRHTLMLRQARKRKKRANKNRGSVPGTLVPIRAYNSYKTRE
RGTRIDELRNVDQQVAQRIPEQQPKAPVIINWNDDDDGSVTDPGHHLHQTFIEAITTNIKGLDPPKENEGPSKHNIRAGAGTPWQHGMKEIPSSFVDQISIVGVKKSSFFQLMVTGNLFWLRMFLKGKEQMLLPDKLGGKSLDLDTLKVSTPALSGLSDNNYFNNCSQIIELGKTLMSKDFPHLKVYRCHNKESKKNCNLVSKFRHWTVSEDLKYLDLNGNEAFESAAHNTPDILIADTVKKYLEDVNQHDSMIEVMTMIVKILCNHLHVPLRVLKRERSFKEIIKCLVEYCMNKSITFDGTKQLQYSINKLMSKASKWIGGKRMYRKLLQSYLNELFIRRWIEYDSDKSITDLINDFSGRTMVDISDMSSITKSSFCSDVSENVRGGGGGGERYNSSSPISSKRSGLYSFRCNEMSDLLLLIVRMRSTKNLGGKIESSSEKMILDEYLLDWFFNKIKEMNLIESQVSNTNLNEGSAKITALENFMLTLALPNTDNEVTDTTTTSDASVATAIHYKWNYIEEDKYGSLESFNGTNHSDMMKHLILDNVDIDKEERKEEKLSDYIKTVDESIQNSLTNLLNNEKCWGPIRVIWGTTSYIRLLLHKYSNVLDLYSESCHVIEEIPSFKVILLRGRRX\n>ERR1719191_268510\nRNLLVLGARNAAGIIRVFHRLARLPVGAYIRIALATWRARRFVFLLRAATHGNVEKSRSARLLEQDGFCRSCCRVLFCDRRKRDLLLMLLLVFPKNSSSTTVLCFRSTGKRSETSQDTEYPKMNMNTTRTRNSIVSKPRSNSADSTALITILRKCCKEMGGCKSQRQTARSLRRTNTSYVASVRG\n>ERR1740124_282413\nRDDRRPCCEEMYVLVRESPRAAGTELRFASKPCAGEKAAMDQWRDAYNTSRSSAQLKREGKVVSVALTEQLAHEYRRFRSDHPSWLSLEPPAAVRAVAMVEADEPEAAAAAGGGDSGGGGGGGGGGGGG\n>SRR5271168_1700852\nLALLPHISHGRGIVTLFVAHCRWISGPDNYYGPTIDLESIGVRDGLVEDLVVGVVNVGPVCRVADVKGGGGIIVGIGPLGLPGRRVVIEGTYLYLVGKAGVVQGRQYGGHACGTPAGDRTCSAKVGAKKVQPGLTRLANPG\n>SRR5712692_205962\nKLFERSSKMNTMIRCLGAAFVLSLLTLCICPDASGQGWTSTATKAYLVQNLSNATLIGPLDSSTTLHVVVGLQGQNANQIQPTLRRMLTPGDPLYGTSLTVPQFITQFGPADRKSTRLNSSHSSISYAVFCLKKKKQNKKTSCYEKKKIKKTKQETTIQKQ\n>SRR5271156_1441549\nCVGAATQVLLVLIPPVLIDALGLFWTRWASLLINSIGPFDQQHLLILVDLLQLHFDDFALGGRNVAPDKRRLNRKLAMPAVDQHQQLDSLGTPMIKQGVERSTDGSPGVQHVVDQDDIASVHIKADSAGADHGANIVGREVVAVKADVQHAVVDWGLFNRADDLRQPLGQRYAAAFDADQPYIFAPVVLLNDLVGQPDQRA\n>ERR1719300_424020\nSGDQLFRSFTKFICSFFRFLTLSFATRFTLALHGFGRFLGCFSSWLLLLSSYSRTRSGCWCSTLFRSGKDLIVIRDIIIIRVFLWFRCWTFFTLGRFFLFSLFFLFLFFFFIIRSPQLLRRRIVWIHKPVGARKSLSTDLLKPTFGX\n>SRR6267378_6278353\nRLSVPKRIIHGEGIWGSDKLARVEPVWARPEYANLIPLALANGVFEINPKKIWSSVYSYNRPEITVEKVEEILAAFVKAALLFIWDDPATGKQWGFWIGIDKAGRLPAASRLKKGHDSVGPTPPLDSLQQYMKQPMASHGSANGLVGSGSGSGSGSGKDVRADSSSPHESVTPQTPKPPDEKLLVVERVWAYYVQKLGKNPKQLSFTAGRKQKGLARLRECLEKEGGDLGHAEGLMRLAVDALA
ESPFHRGENNRKKRYDSWEKNLFKDQDQAENWLDSTGGSKRGPVPVPLLDRRGELNDAGRTVYDKAGVSMSX\n>SRR6185503_10073111\nSSSLASRLDQQRQFARENYNWEKRAEEWERWLSGFGNATSRLPAAVADTALSAKTAGNFLRFVGEPEAAIAMYRRSLEIEPDYLPALYNLGMMLHQTDRFEEAEESFRRVIAIDP\n>SRR5438552_10382664\nSYCYSSLLYSCRHLFISLLLWFMVYFFFFLLIRRPPRSTLFPYTTLFRSTRQFLTESLVDGERSQSKSFSSCARIGRILRPFADRKSGSAGMPRPISYAVFCLKKKKNILKEALALEHTTGERWYAPELYRLKCK\n>SRR5947209_3319617\nCRAMRVLMRFYQKIGFRIIVGAVLLVSAVAGLLAWRIQGLSKEVLRTHEYADVFDETNLRFREVSSDIQTLRDELLGLFNDPVVRQLQWSEHYKEGWLPIAPPGLEDKAAFSKHARKQATEVFVQLLRRHVRYFRIEYYLDRTRT\n>W8CC99_CERCA\nMKFLLTLCFAACFIATLQAAAVDSTTAQPKAAEAADASTTVAPTEASDVVEECHQPKETGRCFGLFYRYAYNVENRQCEEFVYGGCNGNKNNFESKEDCEAKCLAAKKDEAPKEAEEGEESSTLAKEGDEDAPVVPVVEAKPVAED\n>SRR4030042_5098232\nKGDAFLLIESQRGVRRSNYCQIGKASLENLVDCDTLQAAEVLSHALPWLAGTAVECFGDDCRFSLPGREVGRERWAEKSHDRSRRCGRDVHRAAVRADKQGGATDDLPELDHVELSGQX\n>SRR5688572_19060020\nKIFRIYIQANSYFTILPACFTFTQLKILIMKTIISALFIMAAMFTACNSKSGSADAQSTPEGAANMIFDAAKSGDYSKLKGLCDASLDTDVDSKKICEVSDGNEELKKMFKDYFSKGKVVGTPTIEGDDAKVAIMFGPEGTNDETMNFKKKDGKWY\n>SRR5438552_950382\nAYRYVPATPAPDLFLADESIRLGVTAPGTSVTRDLRLANQGTAPLEICDIATDDARFAVRPASLRLAPGAHATVQVTWSASDGNPALGTLTLGSDDPGSPRRTVQLVAGAGRVAVGQPAPEVVATLLDGTTFRLSAERGHVVVVAFFATFCPACSF\n>SRR5208337_2690271\nXMAFALLVRLAEQPPMEVNIFEDAECWIKIAAKALGHVGNPANLGVPVYLAGHIAAKHMDLALLNDSDACGEPEQRRLAGAVRPDQSDHPAGGNIDGNVIQRDRLAVTMGNALDLGHDVIRHWEASRQVFPARQRRDWCGRTPFREFRSSREYDI\n>SRR5262245_35595640\nGRRHVRAVGGAQAPDRRAGRRDGRARGQPADRRRARAARRPGDRPAREDALGHRAGRLAVLPRQLRHQPLRGAGHTDGALDTADGAAHRARPHQGRARARAEPRVPDPGRGRVRLREVPRADAEARLPGPHQPRDLAHGPAPTGLRRGRGDGADLPRGRGRLRAERRATRAADDLIRAALLLGVLLAALVPGGARAQSLPDVSDDGGVLFRSELRRLGGVQTVGYPLTGRFVWEGFTVQAFQRAIFQWRPESRAVAFVNVFDRLYELGHDDWLLVHRQTPRHDPSLGDASARLALLEARPAIRAAYFGVVGDPVQANGLPTSRVQDMGNHYALRAQRVVFQEWKEDVPWARRGQVTVALGGSIARELGVLPSVA\n>ERR1719499_2701023\nLKQFCKKTCCKKAEMAVADPCYWTDDCDEKAVGSSSDESSEDSAEKAVANNRFDWSDQKGWCQGERARFNGAKKYPGKRYTSREQCLADCEKENYSGWAPKGCEYSARYGTCNVFFGKSVSGTNRGSSYRCNINRSKAADYERAYGDFILQSNANAAKDEKAVGSSSDESSEDNAEKAVANERFDWSDQKGWCQGERARF
NGAKKYP\n>A0A2E9IMM2_9BACT\nMTRRLYTMALMVLGLSMLLSSTGCHEPTSRDPRVLRVGVIVSLKGPARYWGVVTMRSAQVVADYYNERGGFEVAGERVKIELVVLDDEFDATEANRVAHQLVSEGIHYTIGPLGDATVDAARRVLEGANVFYLHYGFDPALQGSGGLAVLGMPRPEQTLSIMFRHLRQEHHVSRAVVMAYGTEAGIRQKRVAEQLALDAGMELVRIARYDVSKETFDVSLDPQGIQRRVAGVVAAAPDLVVLAGCPPEAFVVIVDRLRSAGYRGFVGTQTTQDPRALAKLGEASDGIYYVGGEPADALRSEYFRTLKERYLDLAGEWDAEANKKFYALELIVSCIRAAGLEALDETSLIYPVLSELNIEDPFYQEPRALRLIGGQEEGLPRQLEIPIYITKMSGGRAVLVEESPRVLP\n>SRR5262249_35545196\nGDFGSAQGGDWHSSRKEEHLAANADAEQQTREERVDPVEHSGQAMDDPQELFDLINEDDVVVGRVRRGEAHRNPALLHRSVQVLVLDSSGQLLLQRRSQQKDLFPGYYCASASGHVMAGERYAETAARELAEELGIAPPLTYLGTTLVRSAFETEMTQVFLARSDGPFRFHPTETEGGLFLTRRALQRAQSAGSLPLTPAVLAALDILDRQLPDADARTGE\n>SRR6266550_8732594\nAAIGQRRVTRPGERDRDRVLPPVVGGSRLVVLGRAVGGRSRSIRSRLVDVDASDGGQRSIARLVEHRARERLTLTLVRESVVRLTCVYTGEIVVAGELSRNSRVVPTVRVRPRRSGAGDGWRRGIEAEALRSASTVAGVVHATARDSRRISVRDAVARRWIAALDSAQIVKLVCDRIAERVVVPVIVVGSPRERHVERWRRLVELEAL\n>SRR5438874_2142771\nLRRRKGTDMKRRDRRNGGRWGRSVLASLLVVGGLGGLGLPVVAATCVLEPQLRAITANQGIGSYATVARGKETLVRLYLSLPSCAASGSSIKVTGASLTADNGSGVKKTVSPFSPTPTSTPEIVAAGMAPAFDSDGDPKFVLPGTYLAPSYTTARFDVTFTATVNYQATANSTSSPVVSSKTFDKLSDSTPLKVTVERKTNALRLLVVPMGDGHQTYSSQFGNLDKITTQNGLTTLARLLPVPDGTGDLTSTARGGVRYRIAPTLLDLSSLMTAGKFCGKSTTWGALQSLLLGFLSSWNAANTANPAATADRVLGVVSENISVGGSGDCVDGYATFGEKQAWVRAIADTAFAPSKTGALMAMEIGHTLGAVPPDRDDDFNVRHSPNVAAVPSTALAPNRGYNVDKRAFVPNDRSAMKVSPSGAWNNTNVLFEAADWAWIQCQLSNTASTACPSPGKVGSAVGVGANPTLTITGRTDGTRSGTDVVESGFAPGGFAPGGLLTEPDPTSVYRLVQRDGATILRDDGVEVSFEESQHDGGAVFLDNPFGVFSVAFPFDTGANSIELWNGTPDGPTSVLLYARDRTAPPTLTSVNAQPPSTGTAATERASVSSAEAQTTSGSTGAQPSISADGRFVAFPSTATSLSVEADTNAQSDIFVRDRQSGTTERVSVSDSEAQATGGPSTDPVISGDGRYVAFVSSATHLVPGDTNGQPDIFLRDRQAGATVRVSVATAGTQANNRSIHPSISDDGNLVAFTSLASNLVTADTNSTDDVFVHNLTTAVTERASVSTSGTATITSTTGAVVGVAAPVSVRPNAAVSDDDIIAFDEQPGDAPSARAPAGGLNVDVTNGTADRTHALSPSTIPAGTTVKTHLLHADRPNNPVDFKSFTGTATFGADILGVIVRQSRLEATDGLSSVGTTYPVANDPQLQGLRGLDF\n>SRR3954447_7250895\nXMEAGWEMPAMSSIALAVLVSVVAFVCVWCQRAQDRADKRAELLLQQHLTTEQLAHLNRTGSLQVPSKSFESRVYTVPIRGFVSVHDEGRLVMRLCVRPGTFLPGREA
ILAHKMYIEAAEDEYVESATVVWRAMSLKTSATAVX\n>SRR6185437_774131\nRLHGRGDETSRYSAKSVRDLGNGAVVSLKVPSRCNLMTRKKITGLDQALGASAKLEATASAAYSRKRSITEVIPPDVTRAKAGAWLDLISPLSEWAGLKGDALRAKREQLRLQREDVLGEIARRARARITAQGLSVTPVPNKFLVPFLEQASLEDPDSSLVEIWRNLLVSAASDFSSHHTHFVSVIARLSPKQGDIFRAIIKAESLDELEYARDEIGMWFEAHSVRQGIAREYGKIPKRTRADLSDDDFAEFIHGYMKTAGISIVHGSFENEQTKS\n>ERR1719456_362451\nAMTATTLSAPILTTMTATIALVRLTTRPATDLTTTGMLLAMTLIRMTTTTLPLTLRTAMTAATLSAPILTAMTATIALVRLTTRPVTDLTTTGMLLAMTLIRMTTTTLPLTLPTATTPTTPFAPTMKAMTVTIALIISTTKLTTDWTMTLMDSVIRVTLTTTMILIPTP\n>SRR5690348_12433932\nLENVTSFDPKTGKALWSKKVFPNAPATVLSVSPDGKRVAVGGWAEICVLDARTGKEEARVPGKDLSIKLIKWLPDGKTALVVRKNPDRQGIPEDRTITLYDTATWKKV\n>SRR5438093_595488\nYNIGTYPTKSMIWVFLPSLEGLFYAVITASYLGLNKTLPRFLDKSLAWLGSLSYSFYLNHLFVIDVSYKICTALGWKVARFADALIFALLIVFPPLIVTSAATYYLIELPFLSLRRRYFRDEHDGVYSSRQPSNHESPHLPFERDDAKNVQLSSX\n>SRR6267378_3168319\nGLRRELSTMNSQTYRLQLCSSDLKVFQRTNRFCTGQRCTKLHLFQSGWTVSMTNVKMQISGKDRTHAPATTVFASIGFASLLTIIIAAPAAWDSRRTEDERVAPLSAKSAAGRPRGLWYIRSGQWQAHARTLVAAIRYILQNDSETNSGKSDGSCPALHLAMP\n>SRR5919106_1596169\nLSRSFLRCGHASAAVRSRCTDELFALRSALDLNRQDRADALRVVLALDDVGLERVDLLGHEHFVVRTDRHGDRLGKAEHLGLVLGLAGVVLLPVRVADLWLGRHDDARLGTIHPGLPRTLGADDLAVLVLGALFTEIPDGAVGVLGEPVVRVLDDLAVEGDGVAYDDARHAHHLARLVCDLHNGALKAVLGATLVHPLSTRLQWEIGVVHRGGERCRIDGRCVRDLGFVRAARSFVILVAHSRGEDDGSDRRNDGCGPDRDEGGARDRHRQSSPSSASPASSSAPTTLNDSSSWTSTWRPLSRVTSTSYMLSSSPTSVPVTSPPPVCSRAASAARSYASPEMGRSFSASSPPAATAVPTPAPTTVTPAAAAAASLDLRFIADSSRRGWTLTSCGQPAESRLKARAYPAPASYPGSRTVNRAPPSVLSAIETSPPCAVTNSATMASPSPAPPASRARASSSLTNRSKTRTLSSAPMPGPSSSTSRTTQPSRSASRSRTRERACRAALSARFRTTRRAATASASTRPADTAVVSMWRRVFARSRRASSKTRSSRSSGLACRWRACSSAAARSIRSSTRPWSLRHSALTVAPRSAGGVAFGX\n>ERR1700674_3395430\nXMALRPARPRLAGRWLEPRGDPRPRGMAAGPTGFARMGPQNPAYRPSPTAFYVPVGFVIVPPAYSWHNLGMAVLAKIGKPNTAPALFRLLEDSALSRAALGCCGIPLAMLDANAKSSPVTYVNSAFEAFFGYREGEALGRSLAAVLLRNDEPLLQRLLAESPKRWEISAWGKDGEARHVEAALAALRDASGKLTHWVVAFSDRAELERLRSEVESLKSLAAASLGIGIEAGGKPARGSQKARIEVPAADELHPDRQS\n>SRR6478672_5938487\nSVRRLSKETILAAPEKIFTALLREINASPDPKIKRACGNSWIAPHNWEGFFLNFG
DMIVKNGEFEAAKEIYSTAKLSPSYNEWVYEPALEKRLLEMKENNIAFNKKQDVFALNGNDQIMINSSMSCTGCHQMSNSEFIKAGYKEP\n>SRR5262245_38459693\nKSVAAGQQECAERLTPHKRGKAFPRDERRKSGTVWRLGLTFAPAGVCEVYKFTTLIGCILAQTLGAARTGIAAGPDRPTERTGSPGPVRPFYGRGAIGGVCGFGAMPVVEPPPGAVVVRAGGLWYWKSGAFLSCSFVHVTCSFTLVGSSLPMAAPAPVVLPVLAGTTLNEFMSMATLFSPMPRKPPTPTISARILPCLSNRMSLTSPTWALSGPSTSVPLNFENTHX\n>SRR5215831_1038994\nTPDGTSESNWTNFFNIEKNLLSSNVIFPAIGNHEADGVLFAKYFALPQNGASGLSPAERTYWFKYGNSMFIALDANNPSGGSQVQWLQQELAAARADSSVQNIFVFYHQCAYSNGTGHGDTSTVDSAWVPSLEGNGGVTLVFQGHDHIYSRITHGPNTYIVAGGGGAPLYGTGASTAGTVVKTEASHHYIRVQVNGTYIQATVFRPDGTQIEAFTVGQPGGSGGSGGGGAGGGAGGSGGNPGSGGSGGTTGSGGSGNGTTDSGGCQM\n>SRR5215212_9325299\nNKCDHLSTLRLAVIVVAFGRIAGVDPILFSTCVVRHVCISHIRQFTGGHFGCRSGRFRAIDNYLGVLIGQNGGCEFRDLIGRQIERTRKVFVMVSSITECLYEHEVFSSIDLPFQIFSGNCIHSIFLLFRGHNSHDAVVVLCCGAPAVAIRGGKINESVRTFLHFTYAAVCAFEKILLTHDVSTVEYHADDPGASKAAKKVISLKLRKCQAGVKHPACGCASRRVFKKGRFHSLLCLPVMDDRPAVILAPLDEIKLIASISKPFKATWAVLSFENKIRAWLPVDPLRISDSIGPDLGTRSLLIDEWIVRGN\n>SRR3990167_6373537\nCALPICREEARDLKNEDRKATRITRAKLRGQNIIERATIRIDKLEKLNIKATDLARKMQEKEIDITLATASLQAATEKIALARASISEAKTMLDQLENAEDPLAVAKNFKSKMTEVYKTLVDARQSIKEVFAKNADTSYMRTFIEPMKNKNAVIGIVIIIIIIALLVAVRKQKYAIAPIDEQPATTAPTTPPPSITPDTTTSINDESALRELDIELNAEDDTVLPDELNIETELXX\n>A0A0J8TGQ0_COCIT\nMASMRLAFCGTEVPGIRGTVICPLLLVDESFWLGEKVRPWVLAGLNLLEFDHCTYSRLAKSV\n>SRR5262245_63831105\nLSRLLVKSFMGTFLCAVVFLVVSNSIIVYEVISYERSQLDAYRSQWGRASAWVSGLGRLFFFSSRRRHKICLSDWSSDVCSSDLCSAFGRTGRNYPRRREVGYAPLASSARFSAQQGLASLSHKCLLAPSLPGFPRTVQPVRQTRSEERRVGKECRSRCALKTIDKK\n>SRR5262249_16412955\nEVVLQARKGLRRVFRFQLRIGHRDDSRVVVHGDRATEVAVIGAEDGLTERELAAELLREVVLDAAAQEPVVVFAMPLGKRAVVVLIEQALDGAGRKTRCNHVARGTDIGDPRRRLRLLVTQTQIEPSVADARLTFDVRGIDLFLYALVVVELALX\n>SRR5579875_1120949\nTIGVDDLPIAKGTLIDQQVATNEDANGGDHAGDIVADVELVHGDLAGIASSRFVRLNDHTGADPQQADGRSDQAEGAENQWKENPADIACNLEKGHTEDHGADVLSGGGLEEVGPTSGAVAHVVAHEVGDDGGVTRVIFWNAGLDLAHEVGSHISRFSIDTTAELGEERDETGTKAETHDQRWSGSRQRGTGQAAVGRENDGDAQERKRDDQEARDRAAAQRNHQCFTKTAPCRAGGTNVRTYRDQHADVAGDTGAESPDQKCQCRVPGQANLDGLAALTEYGQYNGDHDSRDDCQCGNG
SILSVEESYRSX\n>ERR1719436_269911\nIIHKFSCMPEGPFSPPSKGQYQRMMGSSSLSFLCQQALPFTSLFLINKNIPSTRLRAESGAPPKSKAIGLSFGFVEAASVEELALAKLLGWKVRVIGIFACFIVFRISPCFFCFTFSSFFQIILFLDRTDIRISSGGVHNNTKTKRFFLPCNRVLFVRVRTWFYSHFLQNQSSGDKLSX\n>A0A137STU4_9FIRM\nMKILIVGAGRLAQRVVRMLSLENHKLTVVDANAEKLGKLRRFKNHTYIEADPLGLDFYKSVNLGDFDVVVCLTRSDKTNIIIGSAAKRLGAKKTIALFKEVSPIEDLDDLKSSIGIDEVVSLNRESAQAIADLVFDDFSGKSDFFAKGKMQVLSFRANNSPDLINKTIEKVGALMPFLIVALARDNKVFIPNGNTIIEKDDLIYIAGLTKDIQKFRHIYFPAKTQVESKNIMIVGGGEVCEYAAELMSKKSCNIKLIAKDEKNVKRLRRNLSDALVVRGDFEDFRVLEGEDIEKQDVFIAATDSDELNIVTGLMSKKYKVGMAISKVEGLSYSLLLDELSIDQFVNPIGICANRIVEIIRGNKGLNTFVSFSGRAEMWEVKLRQKLPIVDKKIKDLNLADGIIIAGIEREDGLILVPRGETVIRQNDKLIVFCKNESLKNLCKVVNPESTPTFFGEIFR\n>SRR3990167_1971404\nVASAEQADAVFLLDQRNVQAIEAGTGHHAEVEGHGLALIVEGEHGGLFFVHLCHQRFAQLHKAGFLAAGDRVSHGQLLTQWVNVYAVNLELIVQVRPGGQAGGADITDDLTLLDVAAAADALGKAIHVGIQGAVALAVLNDYRIAIATVAAGQGNAAITGGLDRRAAWGSVIHTFVRTNLVQHRMAAPGAETRTDAGEIDRGADKGFAHAFASGAVVAAIALLVGVTHGGVGLAAVGEARREDIASADLLAVDHFLFVDQLELVAFTNIHGEVDVVAKYVGQIHGQTVRQAGAFGREKQRAVDHAVAIGGLDFRFDQFALETEALLALRQGNAFQVAELAVQAFQLAVGIQVELKRLAYFQACQLLGFLTAIKHVMQSGCAQAHLGKYRGQRVAVFHANRVLQWVDFFLRFFSLCGLQLIASWLLCSCCIGERXX\n>ERR1719397_1477701\nQRSRGSQRWMGTRRTLMERFSTTHSSCLLLEMEEVVSRTEEWRWKAMEEQKLDRSKKRSNLCNISKLSNGGNGGTNALWDFFFAKIQTQCLISKQKLCNISQHSYGGTGEQMLDRSKKLANVQTQCLISKQSFISKQNLCNISQYSNGEEWGEQMLDRKELAKMVISQHSNSX\n>SRR5690606_35020854\nALVRAPARRVATPPAAATAGDGDRRLRAGLVFIARHRLLRTLTLVTALMNVWWAAWTAVLVVHAVSPGPVGVSEGGYGLLLTAMAAGGVAGAALAEPARRRFGARTVLALDVVGTAAMVGVPALTTDPWLIGAAIVAGGAGSAVWRVIGASVRQLVVPDRLLGRVYSASRVVSWGVLPLGAALRGALGEALGVRSVFAVGGIAGLALLQVFAIAVRPGDLAAVGLGAQRTSRGRSVRWATSRPASTRASVPPHTGSSCSTDSTPSKPPSYRASTSRTQSTX\n>SRR6266498_1588512\nICRSWERSTLEVNSTSSRGPGMDPALGWSQGLAVEVGGAGTVASAEIVLPRLLADRVGLTTGLSGALARAGFIPLRDRGRALTDAACALAAGASCLSDIEAMTAQVEIFGPGGGASDTTMLRVLNELAARLGSDGLPGRKLAKTMAGARAKAWAQIVARHGQLPAVKVAGTGHTRPGVDQDQDAGAPRPVLFVRLDATLIEADSTKTGAAGNYKGGFGFHPLTAWCSNVGDNLAVMLRPGNAGSFTASDHIVVLDAAIAQIPAAWRTDVLVTIDGAGASHDVINHLTALNSAAAHGRRGRRIEYSIGWPVDERTLTGIGELRESD
WTDALSADGKPDPNASVADLTGILRHGPGGDTMSGWPPDQRIIARRVPRPVGEQAKLGRPPRLALRRVRDQHRHRTDPMAGRPPPHPGPRRGQDEGTKDLWRRQPALSRLGPQQRLATAGGAGLLAERLAAPPRPRRRTRQSRTQNAALPAPGRPSPPRHPRPPQDPEDPTRLAMGRRSGHRLRTTPRPPRLNKRPVPTNSTTPADQWTRRPPEHIGPTNLDPDHHPAHDNRKSHYHEPRTPPRIIQVHAVRRADDSAAR\n>SRR6266481_5783698\nERDQYLRARPHVGRSRERQCPDLGSVGAPDVRQPQRERPEPRGLRRHSADVLLVRPRERCASRDPGRQAPRWVRPERLGDGLMALLSILTSVLSVLTPPAKPLVPKPDPVVSTPTPGGADVQTGRALPVSSGPSRGLASWYPMRPATCDGISVPTWVKAWTASLTLPCGSLVRLSGPTGSITVPVWDRGPEGWTGRLFDLNPAAFIAVAGNLWSGVVPVSWQPAX\n>SRR5918996_3897299\nASRWFARVRFDHVAMVTPRQAPALALLGVAAVLTSCGADEDDPEPPPPPTAVASCGEAFLGSGDPNWRRDATTSGPFGLFGAGRHFQRPVMRELDNGQLLTKLPVIVDGTRPVVLSVPEDELGRVGLDYGDLRTERAIED\n>SRR4051794_24721663\nSGDGSVRRQQGSPRRRPVPGSAAQVCDLQRGGPAGVRQPRLDLLPGCEATRCDGCQPAGPRRRRPPQGAGRACRGGRRPMTGGHANARRDMSTRSLISTDDLSDAELRALVERGATLAAGARPNDALAGQVVGIYFPLTSRRTRTAFSSGALRLGGQIIAYGPNDLQTNTGGSTEDTGAVLSRMLDLLVARTGGTDAELRGWAANGRMSVVNAMSAQEHPTQALADLSRITRHFG\n>SRR6185437_8036068\nRGAGRFRFAGAESTLRLWAAGRPPTGLAMRCRSPRLPVRFSRTTDSWRSSAKRADKDENLRNDEPTGVCCLRRLFQLADLAQLVVQGLEAHAELLGRLGLVAAMAVEGLLDGLQLDLAQTERAEGLEVRAAQPAVGELAGQMGRGDRPAVAQNCGVLDDVGQLAHIAGPYVLFERGDRIGGEQLVAGLRVRAKARQQVPSERGHVVDPVAQRRQMNX\n>SRR5215471_7291055\nAPGLPQPTSEQPTKPKTPLSPPPWFVRGFFARRLNVCRAPDMEGRSLGHHLEFDMQAARQVRWTKTLHLGVLALLERVLHAARALLPRSIKRHLARFARVAEFALTPSVQLRFDARSTALVDWQALLPADTFADGPIVHANNGLAPGGVERQIVNTLVGLQRRQRAAGLLCLRLHDDA\n>ERR1719233_1599910\nFAYAGSFLKDPAQSTLGSSFFLSWACNHHQSHLSLVLYHLQNLNYHSERLWLPWKFLQSFLLLLEIVFWILFWVRLPLFPQLLGQLSYPSLKGLCYQQFQTLPX\n>ERR1700722_19934493\nQLPWRNSQFSDAPGIEVSLTIETVLSNLNSLSRKSQCHDVAGVRNRPESLRSNAAVKNPPVPSLRWRADPSPPGPRVRAPRGGKSGKMTRRRRRKVTTTRSLDARLTSAGPKRILALDCGGVRGVISLAYLERLEAILRGRFGPATVLADYFDLIGGTSTGAIIATGLALGLTVERLIEIYLDLAHKGFRRSAFSAFLGPKFRAASLLEQIQIQVGDETLGSARLRTGLAIVAKRIDTGSVWVFHNNPRGPWFDPAGLDPAAVANKDLKLTRLLRASTAAPTYFAPEHLEIAAGVTGTFVDGGVSPHNNPGLLLFLLATLEGYGFRWPAGAEQLMLVSVGTGHHPMTQARLPGKGSPSALLAVLALRSVLDDCSWLGQTMLQFLGT\n>GraSoiStandDraft_51_1057287.scaffolds.fasta_scaffold520000_1\nVSRNPHGSGSGFATPQVKRGRPASTPP
GVDTRALANPTTMHTMSPDTSCKEERPKLRKIDLGEPITVDFTGASRVATSTSMAGSLGQDADATAKVNELRQQCIAAHTEGQVNFERLDGRALHLEAEVTKMALVVAEVQRVVVDIHAQQERLKVETTRVGDELHGQQAAIVEMGDRLVGTTTSFTQHLEDMKAKLEETAGETLKKHEDNFTDVQGFAKLVDNKVVQVEATFAVMQKTMEDIHVRLQATESMAKRAEHQPPPGPPAGVRAGRWMGSAMGNAFSIGKATASCSPGCTDDHTASQSSAGKSSAMAEMTNIINEAMTMVSSQFEMV\n>ERR550519_1962169\nELSASKSQGQMALEMILDEATGVFCHDERQNLSGLFESENCKINNHENVDIITGNDENESLGEHELEVMKGLEVEQLSTSKLTTKKRKAKESDEVMKENRGLDGNILSTVLKSQSGNKKLKVTGLDGSFLSSVKKTYPRDRKLGTKITCSKCDYTTTRKDNLNRHCDRVHLKILYNCNQCDYKTSCGQSLKRHIEAVHEKIPQTKLACSKCDFTTKRKDNLNRHFDSVHKKILYNCNQCDFKITWKRALTRHIEAVHEKKLETKLACSKCDYTTQRKDTLNSHFNRMHKKILYNCNQCDYTTMWRENLIKHNEAVHENNSYSCDKCDFMSTSKLIVKKHVERVHQEINFHYNCSKCEFTTTHKQNLKNHIDVVHLKISQNCDQCDFTTKYKRALKKHIQVAHQKLGFNCTQCEFKTMWKNSLKYHIKGMHAGVSHTNYQHNAINVHKPSLSSRKSVDGEVTTNCRTRAQNVSRDVTGAVNPIRKVSENPSSISDNTEQKRVQKKSETKGGTRFTMKKRKQDEKTSRLEX\n>SRR5687768_17643082\nLLYTGLYHSLLLLFFLFQHPSTTQTYPLSLHDALPICRRVLDQAAARRCRRHHAVQLPGDGPDVDVRQRTRLREHVRAQAERERSEEHTSELQSRLHIVCRLLLEKKKENINNTRLTEYR\n>SRR4029434_9585403\nVIFFSLSVSLFLSLSLPFSLSLSLSLCLSLSLPLSLSLCLPLPFGCQATQLGCAPWWLCCVGIREPIPSHSHGNRVPECLCVFVCVCACVRVCMCVCVCLSVCVCVCVCVCVCVCVRADRERTRLHYTHSCISYSVLFHKNRTSAAVDHIAS\n>SRR5271168_4498088\nRAGGVGRRVEVVLRCRRRWRRRLRADRTGARQQERGDGAHEQAGRSGGLNHRTASPTGAPLRCPRRAAPGAPRCFCIPRRRPRSKATKGCPTMPRLAFALALLATGSTSPAGATWLYCTATGTDGTGAIEFQTTAADVGAVPPARVAYFKQRLVQHATQADADARGMQANCFSFDDQTAAMSDYS\n>SRR5713101_1804337\nHARIQARLNAARDRAEPGEGRPLAYSHRHRRAQDRNRMRLRAHRCTPARVDEYLSAVRLQSDTSIVWCCSNRRIAVLLVLYSSSMSPATPESGKAAGSTHERILRVSKSLFANRGYEHTSTSAIARQAGTSESQLMKHFGNKAGLLEAIFVEGWTQITDAARVAIQDVTSPLLKLQTISGCVLRSLERDPELKLLLLLEGRRIRKEGQMVSLTQGFLGFVQLVDGVLYEMRDLKILRPNISAQAVRSALMGMLEGMLRDRFLAERLGFPADFNHEQIREMLATAMAAFVRAX\n>SRR3954470_16959927\nVSTGLVLVGAAIPLAWLTGVVGLGWPPNASARPASAIGLDRFGAALHLTNDPLGVLRAEIALQLTGFAALVVVHRAHGLDACGESGGSSDTVIARRLRHVVADVPTTSRRPAATTSASRGLGIVLGAPTARPDRPSARDTAAAARRLRARTSWRSIVLKEHGARRRPRGP\n>SRR3954468_5071070\nNGALIGSNTGGAALGGEQVVTVTGGGIDLKGGGIGVNNRASITAVNANQTINATGTITVIGGDSGGVANSSNSSNGAFIVDNTTVG
PVRTQTINAGSIELKGGAGGTENFAAIGAAKQVITSVGDVKLTGGNSDGVFTGTRIGGQGGAAPTATDLTLTTLTGDVILTGGSQANAGARLGSSGLTATTPATPVAVANKVTVNAGGNVILNEGTAVGALIGYSSAALPSAGDISVTAGKSIQMNGTTFGTAIRTTGNVELHADQPAATITQSSASRVLASGLTTTSDGSTSLNGQNQVSTYNGKSTSAGITLNNSGPLTVTGLQAATSSSITNNGAMVINGALNTGAGSLNLTTLGATSGLSLSSGAALRAVGSTVQLTAGGAITEASDAVIQSGSLITSSGGATTLVGANQVSSFNGTTTGGDLTLINSGTLDVTGLGVAGNVSVTNNGDLTISGVASSTGSQSYGAATISEASNAFILANGLTTTSAGNTTLTGPNEVSSFNGTSASGDVSLRNIGGLNLTGLNAAGSATLAAESLNGAGNVSTGTGFTVTVASDSLLSGVISGAGGLNKKGGGTLTVSGNNSYAGDTNVLVGTLALGGSDRTNSGVVNISSGATYRGSAGSFTNAGIIGGNGTLDVAATSFTNTGTLRPGGAGAIGTLTVAGNATLAATSIVDIEAQSATSHDVLAVTGAAALGGNLNVTPINGYAPANGDTLTPLTYASRSGTVFVPGTWLPTYNPSNLQLGFDSTINRWVGTTGNWNVAANWRPGHTPLASETVLIDVMGTQLVTLSDGSRFGGKLVSFENFLLSGGSLSLGGPSAFNGALSLTGGTLQGAGNVTASGAFNWTGGTLAGAGQFITGPGSLV\n>SRR6185312_6080286\nRAEEVEELLARHPAAPPHHRLFHERDVRRRSAERGEAEPQEEQRDLDERALHAGVKRARSAIPSVSSSRATASTIFSKPPCGSAFSLSSKRSCSLASSFSPTSSRNAGKSTVSSRAACGSYMRMNLASASASGLRPASLFMPAAVASLSTSAVTRR\n>SRR5215213_10844578\nXMPKTCTRCNSEPVLSARSAAVRAARSASLEPSVAKRTLVGKMLIWCPPRWTLALRLHDASRTYPVRTSENYPSTHFTWVNRGRKGILRTSASVLALVASGTSETASFGKEDTKMYWYNPTTHSSENVAAPSNDSQAIQMLAGTQDSAEFVKEYCQLRRSGTPIEQVLVLVGHEFRLRQPEYQLVLRX\n>SRR6266496_2280139\nELTMQYVLRLFENDVEVSTSSVAITPDAQSYSSVGQTIDDTWRVTDVISQARTEQLRKEQSPPRFYNYDGSVDPINVSGKEHSAQGPFMNLHCLITVVNTTQAPIKVNPVRLVVDGQERTLENAFFRLKDGSRERLKKISLRGNDKEDYELHFMFPDDQCPTSKDGELWVSSDNRPEPITLKVKFRX\n>SRR5439155_630595\nRTAAAIVVPPSVASASASGPSDSEPTRSTLSERAGGSAKTGPKSGCVPGLANPLMRTSNASRSGRSKIPTSVATTAVPPAETNFFTFWASAGVIASVAPRMNSTDAVDASGANRSHARGADEQLAIGERRVPADRLARDERGEREKVERVDRLARPTGGERVVRGAEVAGRIGTLRADRLTQRHLGAHALAEAAAERRDDEEDDRRAEDPEKRPHQTEIDARTLEPREEPLDRARDGVEERRRGSRVVNGAQRVAQRRVRTRSLDRRX\n>ERR1719277_1000244\nPDRASKAAGLRCAAEVELWEEMVVAGVRQVLQHHFGEVLARAPTTFVAWVALRTVRGDNPVQWVPQEDRLRPVLALHGIHAELASLLEPRVHHVAHAGRKEIGRGASTICPFLDAVQGVDHPGELRAGVLRDEAEEQPEPGHRENVLGDWLGQAVYPSSSPLLGVALIPAQVEVGSERPAQ\n>SRR5947207_102588\nDRREGQIPAVLAPRRHVLTCLSNNASQGVLAMSRIPGLRALFVCSALSFMAVAATAQTKVAVLNLQRAVLESDEIQKASAAMEAKFKPRQQEIEKLQRDLQGIQQ
QLQAGAGKLTQQAEADLTAQGQRKQRDLQRMTDDLQADVTADRNDVLGKSSQKMSEVVKKLAEKRTEEFLALLRKGDYKGAYRLWGCTDEKPCRDYAFKNFMDDWGPQSVRADNPPTITKSRACGSGVIVTVNSSKGDATLWVQQGD\n>SRR5207247_709107\nDVLAAHPRLQLSGEHNASLLRDREVHVPGRPPEPERGRPYAVTECAVRAVRAAVRVGAGDERAGENELLLGEVEVEDPVARRRAVAASGQVTSGGRRTDSGNSRRPTLIIPPERRISSSCGDSAAGSYVLPRVSLLSFLVFGSNENASPSCASSTASRLWTTVSPRFSALRRKMSPIAAPHTMNISRPASSATPLRPAGLISRELPMAQRSPATTNVSPRCTRSRKLGLRX\n>ERR1700688_3359193\nRRRRRTLERRRLSAARARDARRDGTIGVHRTGRRLRPRSALRRDHSRRVACDDRGRAGLARCARRFRPAQRTPRRALRRARSRHDHLERHPHPRPDPSPRFRGVRKIQGDRQRSQRPARRRLRRDADRATARNRRSDRRRDLERPWRPARRGASLEEPRRRRLRRPGGAPRDPRALQPRRALHSVRPPCERRLHRSREPGERRTCPRDGDRCRARCALVRRRRLPLTARALRRARWRRRGGVFRRAPFRRVRRRRHRVPWRFWGTCSGRRRLSRGRALSREPGARKSRRRRGHSAPHRRRSAARRVAAASAANACPLHRRGSGRGSRIPPTSRASARRLRDCARCPARRRRARGRGRCGAHRSLGNVAGAGSYGRTRRGRADSALRARYLPRRMSELEAIRTEIPGPRSRELTAVLARTETRGVTYVAHNFPMVWDSAQRATVTDVDGTRYLDLTSAFGVAVTGHANPAVARAIAEQAARLPHAMGDVHPSDVKIALLAKLASLTPLDEPRTFLCSSGAESIEFALKTAFLATDKPDLLSFEGAYHGLSYGALEVGGIEKFRAPWRRQLLDRTVFARFPDRRIPSTAARALAEIEAAPPRRSSIGAVVVEPIQGRAGVVIPPDGFFHALQTLCRDRDVFLIVDEIYTGFGRTGTLFACERESVRPDMLCVGKALGGGFPLSATILARRVADAWTPSRGEALHTSTYLGNPMGCAAALANVGEIERLDLPARGRAGEAKIAARLEPLRERPDVVDVRGRGMLWAIEFRDGAAAAATVVRALQNGVITLQSGVRGESLAVTPPLVIDDAQLERALALLCDAVAEKVMTX\n>SRR5262249_19266331\nXTLAARQLASRFGGDRGSCDWRHFGRLAVFTNQKKERRLQSGFQPFVRLRSSEGYVYSAANEFLREVEALKREHLSCRQRRESPRLPRETDTPVRAITSFHADLRYGGDLHRADLAWAVHAAARGLSLKKQDSRAPHRLRDRQVLNRVVWRACAVTX\n>SRR5512143_347789\nGFTGCRRVRGVECCESILQLRGETVLGSVRQVKATDQRNEIVDLSRHRTRELEREGVDVEGPRARNGIDNSPDAVAHADVAERLVNAWRVGDLVEIPCADVVDKNVVTCSRLRLEGDQVSGDSDVALLAGNGDLRLCAASDGLVIDVGLAAAGRRINRDLAVGVRETVLARCAGECSNGEYAWRGLGRRVDVTARDIRLALLPNDGVAIRTDGGVHVVQAIVGQPGHGSSAQVIDTDFALL\n>ERR1739838_676663\nEIVSHFESDTNSSLGQISDNIGFSLGEGGVSCNGGGDQSVVHFLVFSAASSVFRSVFSVTGQTKTSVLGGEIPAILVESSVASVGLVDTVQVLLLRKALPLSRDYCVVGLDGTDSSESPARSTASLVLDSGSFTLRSPVLGCGDISYKGAGEGPVSVGGGVVSEISCLLFDRQVSELVEALPPX\n>SRR5918995_363747\nHQPSSFGSSSPAAASPSSASKSTPKRSKVSPCSASTPSPTTRPSSNKPASPSTSTKRRRDGPTASIRRSANSSAPATR
ATARWASAPPPALSEAMLTVAVRPYPAECTSLPDDPTDLPWSVPHVVELLHPAPARRARRQLSGQLLDNSTSHRASVLDTLLMLPIGMDALDARLIRAMWETARAGVMELTRQLGVRRATVRTRLDKLQQRGIICGFEPDLDLRAMGYEVLAFVSLEIAPGRLQAVAKHLREIPEVLEIHSVTGPADLHCRVVARTNDHLQHIIGCILEAQGINRTTTQIALTEQLRHRVLPLVDLVIDHGEQATTEDPWRGGPPNPPAPTAVRSPGRSA\n>SRR3954452_4728668\nDRDDRPHRRVAASDLLDDQAVARVVERADAVLLRDRSAEIAQVPKSPGEVDVEPLRPIAVAGARDDLAVGEVASGLGDQPLLIAELEVHLNPPRRQTLQLSSSSRARTPANASAASRVRGPGASSSTSSIAATGWTSRTVEARNASLAASRSPRANVPSSTWSSRISAARVIDSRMPTSIAGVLRTPSPTQKIEEVGGSRTTPSGRTRTASSAPAARAIRLACMLAPX\n>SRR5215813_7369292\nCIDTTSMGVSSAVARVGASVRVLHPQDTPSQGSRFVAQSSSHRIRRHRLFFLWNVTQIELPRCILGERSMGGRPVDTPEDEILIDRMRQGRTDALGVLFDRYARLVFTVARRILRNDAEAEDLTQEVFIEIYKKAGLYDSGKGSVK\n>SRR5260221_1576336\nQITLLAVDRTAARNPRHGDELSSSLKLGCARPIRLPHASQHWHAAQGGPGVEHPGLGRRHGDAQDLRGFFHGKFPKLVHLHYFSTAWPKAPDGRTDNLPALTVAVIFFRIRRPVRELPLRPCLFRGARLVHRNFPDSAFLSELSQRGVDGNASQPGGKTRAPIETCEVYKCAQEGVLHCVLRVLAIACDSKRHAENHFRMPFAKYPERGAMPASCGGYQFAFAPSLDAARRVCFVKFGLTCTHQASVHRLLLTPVSTQQLCPAVLRVSFSNPLPDVGGTIFQMHSCCFTACQELLNLPVHQPYILQIQDNQSRAALKAEKGLQFPDMLSLQTTDX\n>ERR550514_625570\nETFKIISVTCTNEWTLPNPFLGAAWVTSPLVGAPNGVRPSDYVFNWDYQQKEYPLISIDTTVNNAIVPNAQYQFEVFINGNLNNPKQVISEKKGSGTFQYQPDVAGTYTFRVYVSDQCKTQIYDMPTAFTVGCGFTPEPQITGSENVAFGVTFDNFEYRVRYDNRKAGFYRVRLSCKESKMTGLPVSFKWRDVCKWNFENSNNLPTNTTKDGEITLQPIQKSGTDG\n>SRR5262249_32914110\nXAGVLTMSIAGSVAWQVREGSEISELRGADLELEVNSAYRSGGDRKHESNIVAVRITEMVIHNNLKLLGGADIRVDTLVVHGKRPGGKSDLYQPGTLRFPDVRDEQHLPFGEKGVLIYLGEPRYFLDIFINVSRDNKDAPDLHKLLTGESARNFASX\n>SRR5581483_4550651\nTVPSFIAAVAVPEITIPTCSTSQNATPACGPTCSDHLHPGSYVAQPMVIPPTLTISNFPFANKRTSSGFSNRFKITSSMLFPRFAFLLLSFYFCLPHSGHHLQPSSVHLQGRTDAVTRPRRTEEHKEVGQFLRRSEPPDRSFLPGDPVKILSPVGPGPGHSLSCRFLPGSRQDQAGVDAVDTDVVPDQFIGQALX\n>SRR6478609_4614806\nSHAMEGERPAYARIAGSDFAALSIEEQELVMKIRHVFGALTVTAITCGMTAGVSIVRAQDHHDPFLSGTSPEAVQQSSPEAVHQSSPEAVEPVVVEQTSPQVETVQKDTPRDPYILKTSPKAPKVKKVKHEKEAYSGLPKGHITIVGCFYRDVDGDGDHAHYMLADAKMGPATAVADQNCTPSGAGQLIRLKDADDVGLTQVASNRWVELYGEMGSPKDADDARKFEVKSFREVPLAQRPRIAILIPPAPAPQAAVETPPAQEVGVTESPKPMATTGETPYER
KLPKTASELPLIALLGLFALAGGLVLGLVDRQKVLGRGX\n>A0A1W9U6M8_9DELT\nMEIKINRDVLLKGVSRVQGILEKRSHMPILSTILLTTKQDNIEISATDLEIGFQNSYPAEIIKPGSITISGKKLLDITRETNSKNIYILEKENNWIYISDNKAHYNLSCLPADEFPILTEPEGIIMIEINSKILTEMINKTIYSITMEDTAFKLSGVFMEIVNKNKEDFLRMVATDGHRLSLIDKKIPKLQEIDIQQGVMIPKKGLIELNKLCLENGNILFGIKQNNLVGKKEEALIVIRLLDTEFPDYKDVILPKKEDKRNIITVNRKLLLESMRRMIIIGGDQYQGVKITIGTDYLEMVSVNPDLGDVEEKIEIKYDGEPIDKKKYTASNIKVLKDLLAVRKRPAMYIGNTSTEGLHHLLYEVVDNSVDEALAGYCDQIDIKILGDNSVIVKDNGRGIPVDIHKTEKLPALEVVMTKLHAGGKFDNKTYKVSGGLHGVGVSVVNALSEYLEVEVYLNGSVYYQTTDFSFDIIRQRMRELAFLNTGLKINIYDDRTHKEKKLFYKGGIVS\n>SRR4030081_3248946\nWPPAAKRAPPTSVLSTLSWRFSLASHRRADRRPLWVRGCVKTLEPPRAQCIFGHVGSISHDFVGLNRALANLHGMLFAFSHSLGRERSFERQVGIRSAFGAARPEQAVWRGSALGPCR\n>SRR5262245_55954626\nPRAPIRPTRTASTTCRATSGNGCPIGTARITMGGERCAIRRARRSGRCGSCAAGRGSTRTSRCCGAPIVTRSRPTPTRTASDSGSYAADSGSLARADLRRRGAGAGAAAAERRRDGRRGDDPARTGSRVRHRRRRDAREEPARGAAPQRRSDERRAAASRAGAPRVRHPAHDRLRSAAGVRLRAGQTRAARVRCPQRHRSPPRRHRPNRGNPRRGGAVGRDVGERHPLRSEGSRRRRARSAAPGGRRCARPSRCRGLWRRPGRRARAARRRRPRTVDQPAAADGPDDDRRGVGGADAGRTGDDRNPRARDPDCFAAMTDADYQKARRWLIRRDPILADAIKRIGPCRMAERQRKDHLTALIGAIVSQQLSTKAAATIFGRFAALFPDNQITTAAAIDAFDDATLRGVGLSGQKVSYLRDLAARIADGRLNLDELDALPDEQVIERLTAVKGFGRWTAEMFLMFRLHRPDVLPAGDLGIVNAIQRLYRLRKRPDPKRILKMGELWRPYRSVASWYLWQTLRNEPLSTAPRSRPRSPAKSHARX\n>S3BF76_9BURK\nMNALGVWGQFFSMAILGLVLWAAVSDLLFRRIPNAAVVSIVLVEAAALAAAALGGNGGAALGLLQSGSVWAVGVLIAGFLLYLTGRMGAGDVKLAAVLSFWAGSEALLFLILLSLVGGLMVLGLPILRMIETKTGFWAERLAEAFGRPLECTPIGLLGGEAQKGLPYGLAIAAGFAAVQFGVFSHIF\n>SRR6266545_3847418\nSWRLPGRQGRPPPPSTWARSASTSVTRMGPTARCGSAAASPAACPCPRTRVPPATTTAPTPCGSARRTPTATCTSKAPTAWNAGHARPTRSTAPERRQGRLVADPLWMEHQIKFLCPTRLLGRSIPRSAAAVAQALVIPLVIQTIRRVPSGSVWIDEAPNLSGADPSGPTTSTWSTRLRIWRLGLRIPRGVDADRHGPGWRLPRGRGPLPVAAMHHLLERAPVGPLNRREGAVGGDAERDQQRTEPVLGKAQQAPRQLLVMHARMGAADAEIGGGQHDAHRRLAQVELDQVAQAGVVGLRGHQRDRRRRAGDVPGGAPHPGQLSELLPVSADHEIPRLLVAGRRCAPRGLQDPVQVLGRDRSLVVGPHVAPGPDRIPRLHLDLPQTRPERRARRPRPQX\n>Q4DQ35_TRYCC\nMVIFLAYWRNETTQTGKHANRRKCVQMIIKRWFSRVHERICVFRLCSFLFPFFFLYYFYTCKCNSIATYVMHIYIYIYI
YIYIYIYLPFPLFFYLFCISIELVKKRSQMVKANYIRAGRLVRIIRGPRQDRVGVVVDIIDGNRVLVENPADKKMWRHVQNLKNVEPLKFSVELSRNCSTRTLKNVLAEKKILEKYAATKSARRIAAKRAFARSTDFERYQLRVAKRSRAFWTRKVFDENDKKKPVSWHKVALKKLQKNAKKVDSKPAAKKRIEKARAARKAKAAAGKK\n>U2C1V5_CLOSY\nMGADSMFEILLNSLGDTAVYVVRKDDYRILYFNDIVGEMVPGIRKGDFCRELWTGYKEACIFSGIGSKKPYSAVGFDETFGATVMLTASEIEWGEKKTPAFAITVKPYAMSGTEENGKEEKELLLCAMRLFGEVFLLDINTGRYLVYKSDGLPDTMFEEADFCDFNRLYGENLIHPHDRQVFYDSFTLENIRNRARERQQMISAEVRRKDRSGEYRYCELIGIFYKDREGISEKMMLTYRDTDELAKARIRERQANRRFVRAVNESYDEIYEGELYTDYLRQWKGEKSTPYFRSSPSFSEQIKWAADTIVHPEEKEVFLSRLSPDRLKEDFENGKSEVTISYRRLTPSGSYRWHSLYVRLSEMTTDCIRVMLYLKDIDDVKKEEERKQRELQNALAMAEKANEAKTDFLSRMSHDIRTPMNVIVGMASVARFVLQSEAKETANLQCDEKTGNYAKLLNCLEKIEMSSAFLLSLINDILDMSKIESGKMKIANREMNLKDTIRNIKVMIEAQAEERRQTFLVSVAPEVGEFYYCDSLRLNQILLNLLGNALKYTPEQGEIRLCVTAGKVEAGEQLIWFIISDTGIGMSEEFMARMFDPFEQQDFGGSRIFEGTGLGLSISRKLVELLNGTISAESEPGKGTVFTVKIPMKISDKKQKVRKLGETQHRETDREDSLRNKRVLLVEDNEINREIAVMLLEQTGIRCETAVNGAEGVSSFEKTVPGWYDAILMDIRMPVLNGIESAKKIREMERRDAKTIPIIAMTANAFSEEREEALEAGINDYLTKPIDAEVMYACLRNYMRR\n>SRR4029078_11775012\nIAEGAVNLPIGDTAAMRVSGRWNQSGEGWQESLLTGKDHGKKDLWSDRALLLADIGESTELLVNVHGSADNSETPLGRGIGLYDASTGGFCAAVLAGHQDDANCAMEATFYDPQFRYPSVQGDSGRKTLSDPINQFDNDGHGASIRLTSEFDAATLTSITAYERFNYGLVFDYDGSDGEFAHQHAKSQIEAWSQELRLASTTNGPLSPLPGVALATGALRA\n>SRR5260370_25801032\nTHRLCLARRQIRVHRSNPSQKSGPMRCSEAPAMHPAPPAAFPGSLEAGTERHKLNQVTGFEIKVFFVLQLAVINSDYRREITGTLRPGVIVIVTGGYYVDAFQVGEIDPRFVAMDVFSYAATKAAIQNFVAVIQRQINSLTDYIDAIGVVLVQNPETSDLGF\n>SRR3990172_1850163\nVGRRGAAGHIPAVVDGDAVEPGREARVLPEGGERQVGLEEDLLHHILGLLPALAQQPPGQPPDPARVPEDQGLEGVRVPPLAAGDPGRVVLRLGRRTHQPHPPGCGSVRLRGPPLYQEGSKGARLAESSRCLVRRPRVPPPGGGGYIMAGNQGFGADSGVKPREAGGEGGRGWPFGRRWRGRRGRWAAGSFTWWPPRATWPS\n>SRR5580700_5373870\nXMPRSQSRLLDGLTPTERWQPQPGLVLSAQLGSLAATGCIVWLLAVRSRPHVHSLPGAVTQSVVVGLVAFVCSGMFMTAFQLATARSLGFDALRTSLPTARTAVWLAPTAILLTRSSPFAVGAALALVIGTTKMLYFQWAEFESVGGPLPGRSNRWLRTSAYGVALAGQTTIVCLWMGSPLLAAALLCVSAAGLTLMCLVADAYRAREPSTLPDSLLRILFTLILGVGLTVGGRIGGFGSSSETSGEPDDRARPELIT\n>SRR3954452_18840074\nIARDALRRGYSR
NPAHFLLWSEILPFWPKTLDGWFRDAVRRSAVLLASLIAHGRGPHAGGEPAGASRLPLRVELPWGRRGAPRPPRGGCRQAGRLLPRRADLVVPLAQGDPARARRRLPLHRPRLRRLRPLRQAHRPRLVHLRPPRRADGGAAGGIGPARRNRRRPRLGRADRAPLG\n>SRR6185437_12615591\nXVHPRAGLSQAPGQVVLSFPLHVLLQAGNPRWPRRPAVLPLHLIVRAVHLPETGRTPSTGEGSEAGEGRAMTTPAEQPVAQPAAPADRLVPSARSISPWTTRQKIARVLWMFVRATLFRWSFHNWYAWRVMLLRLFGAKLGHAVRIRPTVSIEIPWNLEIGADTGIGDHAILYSLX\n>SRR5689334_22958838\nLSDPERRADYDEQRFAGIRGAADLPPAAQRAAPPMRAPAIATAVLAFVLSFGVWMSQQPAVPAAKSAVVRPAAHVSPVPMVELEPESERLARLHAQSGVVATAPAPPDPQLEAVADVPAPSPVLPTSRVPDRRLAPAVRVSAHVPPPAPSTA\n>SRR5215469_4716775\nPCLSITHDDVYRMPKHLADLERRARPYQACYVRWLASNIATIGGCVAFAAENFPQFAEMRNSARTPVGKRIIAGSSTMGNPMADDEITLETLLTFQLGDMEGGIALVLGYATSAEKLSKREMDTFAIGMTREKAAELGRALVEITDKAPVTRGPRRREHX\n>ERR1711865_1142824\nIHPFFACLSHRAIRHFPGLLSSFITPDTRISVAFLGEVQTYIHLLPPGVHLVPDTPCRGFTQPRLVPQVTRAEQYRPVRLPFTLSFLSYLRLVRCTYPIAVHHNSFIPFHPSSPAPATACTPRLYLRPYRPCPAICYPHLLSCLQPLLLFNRYDYPLFVDPKHHFFYLLWLPCALLPLFSTIFILYSGTACQPLHQCRX\n>SRR5688572_31128903\nFLVVTFIILFFFFFQAEDGIRDLTVTGVQTCAFRSGCSRQAPPSRSGPVFATRCSTLGLVSPLQWLRRQFRAACMARQRCCLTRSEERRVGKECRSRWSPDHLKKKKKKDMKIKEX\n>SRR5436305_2025442\nIRARVEWFVQKCRCDRQGAEERAAERTGPLGQFGNIVEIARAPALLRMESVKRSEQAPAALIGVVVVSMFRGGNQKRASDGVTNLNFEPVIAARQCSDRDLMTASRSRIDDCQMARSSVFEMKNAFDVSGGKRAIEPDFGRPLPPDHAHRLKHSSIASFFDPCDCILYVSIFX\n>ERR1700722_19574956\nLQLADQRTGKVVSTSYQDHDIAGYKRPAPALQRHAAASLPRDPTRQRLGKDWRGGGKPLVLFGHHPWFWFGGLGRLGQRPQLHAASLSGPVSVVGQHVTFPHHPGSRQRVGEYAVDQIEHGARGPEGYIEPRFAPWFAGRLDPLAQQLVRMIERFDIRALKRI\n>SRR5512141_2661244\nXMGGPTWELFSCAIGNPNDFSALYPSERLAPSLNDSLPGIQITPFERGSEMKRILAAVMAVAFVISVAGFAVAAEKAAAPAAEKAAASAEKAATSAEKAATSAEKSAASAKKSAKAAKSYLLTGTIETLDPAAGTFSVKGRKGNVELKAGEKVKLGDFKVGDKVIVKHADGTASSVKAVKAAKVAKKAAAKAEKSAVAAEKSATAAEKSADAAKKAAPAAAPAMPAEKKX\n>B3ZYH5_BACCE\nMNIKSVYKCIATTVLLSQIMSPSILHAQEVSDKAESGVVTQPENKRTGLMGYYYNDSNFSELVMMTPEKNGELKIIKEDHGELLPEGKRNIQSIRWIGYIKPSEDGEYIFSTSSDQNIVMQIDGKTVINQSPMENKIELDKDKLYEIRLEYRQDENGKHQNLSDLKLFWSRTNSDKIVIPEENLVLPNFAPGENKTKLIPETHSFDDNSIPDTADLCLDTDDDSIPDYWETNGFTIKGNKFVEWTDDLAKKGYIKYVSNPM
TAYTTGDPYTDFEKSAGQMPAAVAKEAHNPLVAAFPAVGVKMEKMIISENKDYTNAEEHAMSSNQSSGTTVGTEVHVGVSENYGITGGVSASFSHSNTTENTISKSNGNTIHLNEADAAFTNLNVRYYNSGTAPIYRVAPTTSFVLGGETIGSFTAQANQIGNDLNPGDTYPNKELHALSLNTMDQFNAQPIKMNRQQLERLRAGAPVKLETPQVAGKYAKVLSNGDISVAGDWAPKLGQIENKTADIILNTGDTVKEEKVAAREYNNPEDKTPELTLADALKLAFGAKEENGKLTFNGHNISEHSVELFYDENTKKEMKKQLEKMSNKNMYDIKLTPKMKIVIKTPTILESGTDSNIDWETTNTNQPGLDDVGYSTANIGYGILKSKLEPNTSYVLSAYFKGTKHEKEIEFGIGSGKGDYAVNQKFELSQGGNWKKVELKFTTGDDVSKFNTVRVKNDRNDETRQVYFDNIAITKLGKAEKKFDGVSEDYIKEAHTFKSVHSDKKNGTNYINSINLNVNKPIKWKYKVKMNGKEVGDLKNISEPDANGVIKINFLDLNNGSGFLSTDHIEVYAVKEGLRPVKIAENHKYNMEAILKFKNAGESGMIEPYGDIRFINNGEVFEIWKDAIENSSREYTQDQPYKKDITFRTFTPITEESNIRFIANVKEEDYLANQDDILAYGENDPKDSKGLNGNIYFTGDVADDSVNIEYKITK\n>ERR1719506_2373094\nANGQAAHAAANYDSYTEAEPPIMASGAGSATYGTGAAYGTGAATYQRANEYTGGAGSLPIEAGAGAGQSWQYTYSSGGASTKYHDSAVSGSPGSTHVVTGSSWTNDRTHRINIDEGSRVIVTVNGRDVEGGAQPVRQAVPNNFPKPPPAQFAAFGGDSIATMRARAERHAKEEAEQILRAEQGRERTEEVRKAEQILRAEAKQNPALIIEEAQRIEAKRHRGRPAAAAQPVEEEEDCPAPPELLTLPGKGCPGNVVTHCLNENKAYATLDEAWQACHTTSGCAYIEKNDLDKMYVLRRESDPDNAGPHVTMMRFM\n>SRR5919107_2884606\nSRPTTSLRRFLTVGCKSPETVVSTRSRWEMPLPSPNIKSDGCRYYVCSQHRKRGPCESVRCILGDHLCILSAGQLSQHSPLLRCPYPSCRKLRVLPLPLRSHEKAPQLLGRNPRRTRSAKRVEDQVPFPAGGHDGSPYQAQGLLGGMVAVQLLFLGHRRDRPDGGDLCRGVSAVNEVVVEGVVGPSLASPEQRLVGVGPRKSGQRRDRASTRWSDQTTSPMYSKWSSRDAEERTNALHSLRRNGX\n>SRR3990172_5150764\nLRLVNSVSYQGDALRRFSSRCGGLGGGFLVANACDLRPLAAIPLDAISALRRDTPLSLDDNIRSVPPLIGTPRCAWASGVTHEYVAVFMKRSTYASGNAPLRLAGFGRILPRPADRWNNRVSGYRMDDHAVTMDIVAQRAEVFGPADLRGPGPVPPGGEREDGRFHHHPHLRLDQRHSGDGGRELRVPPDPQSGAPEQPVPHVSRRRRVPRRRPEVRPLRVDRDRPLVPAGDRHGATERGGPPRAGPRRVRAVLRGGVRSALMDLWLVRHGEAVPEREDPARPLSPEGARAIRALVESHAGEAGPFDLVAASGKKRAIQTAAIWAEAAGYPAVKIAETAALAPNATPEAFLAFLEDRGEEGRILCVGPLPSIAAIASFFLSDGDPVRLAFSPGTVCRIRVEATRRGAGELLLFVX\n>SRR2546426_2734100\nGRASTAPDRARGRRRWKRRRPRRSAGSIAWSARRRYEIRKEANLTDANAIIERLGAVFVESFHVEVPSSDTDLLETGILDSFQFVELLFELEQRFGFRIKIESIDLDDLRTLSRIARLVAANGEAAQPVAARSSSDTAAYIVRLAGRSSIAKNQSCHGHAAYLCRGRYARR\n>ERR1700722_10537092\nLQPAAGKRRAQITRSPVLDKRHL
ALGHAARSVAVDIEYSHALAAQRKCDRQRQPDVTASPNHAQVKAHRKLLDLKSIRTLLPSLRRPLSNHEHLFAQKPLRRPHAKVQAYHPTGGRKSRLEAVGKELRNQQLDFEPVLHQSFTQAQMGEGCYVIVKVPVACAEIPDVRLEHQQSSAGTKPLPGLRE\n>SRR6266511_848920\nFGAEPAALVRDALGARRQAPLPTPAAPSPRLALAVMAELTAERATFTRREVVQAVARCLDAADAATIRERAKELADAVLADLEVVCLHAPERVEVPAALRRRDGWSVWDAPQAIRYTTREMLALEGRILHTAEMGRAPIAPAGVVELQTLERAVADEARPLGTDQHDALRAVTSRGRRIEVVVGPAGAGKTAMVRVAARAWHATGCEVIGLAHTAVAADVLRTEADVGAETVAKFLDWHARGEVPAGWRLTPRTVLVVDEAGMLSTRDLDRLRELVARRVGTKLVLVGDDRQLGAVRGPGGMFAALAHELGAVELRDTHRYQHSWEAHALGELRRGEGSWLEDFAAHGRVHGGTDTSARNECFARWWRAHQARRDAVMLAQDHATAGELAAKAHATRVLAGDAQPGGLRVRTETGTQTVGVEDLVETRRNDRRLTYGPAPDQWVRNHDRWHVRAIDQHRGTLEVEHARHHARLRLP\n>SRR5207249_3827138\nKMVVLNSIVSVLSAILALAKSGRPSPLRSTATTDPGWWPTAGEKARAKPPLPLLVSTERVFASGFALTKSILPSPLTSAAATHQGKLVPLGKEENIKPPLPLLVRTTSPNDAQTKSCFPSPLTSATAIETVVLLSNCEAKTKPPLPPLVNTETVGLSS\n>SRR3546814_18573071\nILSLHDTLPFLGSSKVAVVWPAWGAKAGTQGWLENARVRRYDEEQHALQAASAGHGLGLASNVLVAEAVGRGELVEYRPEVRLAGARYTVVCVPGRERQAAVRVFSEWLLGRSIAEAEDRKSTRLNSSHX\n>SRR5436190_12017692\nPTGVQDILQRVLDDGADCQAETQVAKTLEAVAAKPFGLDSTRHGKREWQIEDDEQQERRQGKIAGRIREDGKAADQKNSGEQEYGRKIEARLPLDKQPGGQTIDRHQAEAHGKIRQHLYPEH\n>SRR5438309_4153540\nCWTRRMQSFPHVRKSFSKTFIPPRGNDAQLRRQRGRRQFKTNLIIPLSSCPVRDGIRRLRARDLDYSLRNQGTGDAGPEKILSFVSRARLKYGKNKITSEFFAQISMMHFIVPAGRAFSSRPSSSSSCPIIGAEGDNLCVVVVPKPAKNYRSAEPAGIRENNLHLRTRRRQSPKLISTSRAVCTISPVGGTSRKRLTASAIGTWR\n>SRR5678815_2528847\nTRHLCACRPSSRMDDMTTCPRTRCGTASSMRSLTPRSTSSNEAVTRRSSSSRSDLSRWSVDGWRVPAHLGDNEPPASSESPLSASSPERLAEWISASPEARSRALAKCLETITLKDPRIHAWVQINPQSATETGPLSGIPFGAKDIIDTRGLVTEYGSAIYRGRVGVDDADIIAELKDRGAILIGKTQTTAFAYMTPGPTRNPRNVEHTPGGSSSGSAAAVAAGMVPLALGTQTKGSVLRLSLIH\n>SRR4051794_18478678\nRRDERRADPDFGRVHRRRPLVRLEGRRICVGAGRLRPADRSEPGRAVPDRAGARGDRGRRPDALQGGLAVRAGPAVRRGGEHGEAPRLRGVVGGGERVPRHARRLRLRRGVRRRAQVPRDTALLGRARLEQPDPRVPRPARARHAALVLMRYTRVFTETDGETRFEELETPGETIQAVESDLVGTVSVTLAVKGIYFREVVEESSPVPHTAPYPLFIIGLRGTFSIEISSGETREFPPGSVVLVEDTTGKGHTTRRVGDEPRATLMAPLAX\n>SRR5512138_1963781\nGAPTRDAVTRTTSYCVRCPPSRGACSHSAISLCGICTRRRDAMA
KRRDNKEDLPEQVAGNGLLHRRVFLQSGAAMAGAAAALGAGAAQAQSIGAGSPPSMLKPGAPFSAYGVPSHWRNNITRIVTQNPPPGREGAGSSRTPLQMLEGTITPAGLHYERHHNGVPDIDPDKHELMIHGMVRQPLVFNLNSLLRYPMETRVHFVECAGNSGGIAGAAEPQQANAGVLHGLLSCSEWTGVKLSV\n>SRR4051812_18625933\nGTPEAVVLALQGGTEVLAFRTGQEPLLATARIHPGEPLAFAYRNGGRWPWLMVFARDPRGAVSWFHPQWTDAAQDPKAVPLEVEPGLHELTTAVAHPFAPGPLALCAMVLPAPLSVRQVEAALATGSEAPAGGAAALRDPGGVPLGPPRFRRRFCWWARPGPP\n>SRR5215216_1715194\nILYEAATSRKPFAGDSVIDSLHKIVYMQAPPIRESNPNAPAELQRIVRKCLAKDPADRYQSIRDVAIDLRDLLREYDSQQSISASFPPAPPSGSYTRDPSTGSHSQPHMTDSHSQIAPTMMHPQSTITGPEEALSSGPVSGATSAPQRESNRR\n>ERR1711871_72301\nNSVQSLRSPCASIDDNKSIALDPLRVSSFKPRRSIIDMVTFEESDEDDEIAGGPADEAPIWGDDRPPSVQPRRLSVRERFRNSVSTPLIGYWRRNAVTFAVKLVRHPRFDHFVLLLIVTSSVCLALESPRTANDAGLMNALRVLDVIFTMLFTLEVILKSIAMGFVTGLKPYLSNNWNRLDFFVVLTSWINLIFTWSGMGGEFGYVRALRMLRCLRPLRMISRYPGMKKVVGALLLSFWPMINVIMVLMLVWLIFAIVGVQLFGGTMYHCLPSVESCILNGTHCVTSRTQCLSRGGAWTRHDSNFDDVLNSIMVLFTVSSLEGWPEIMWNAIDGTGSDYASLYFIFFILLGVFFFLNLFVLTIFRNFMYLKQTMDGVGFLTPEQQNWVDSQKRIMASNAVRRLKPPRSVWRLTAWRVVRYRWFEPFILSMIAINVMLMATVGVKVDDWEEILDDLNTFFVVVYTLEMLLKIVALHFSQYISDRWNQLDFALVVLSLADLAIGSIDGGAVLTVRILRLTRLIRVLRMVKRAEGLRRIFLTIYLALPSLVNVGSLLLLLFFIFAVLGVNLFGEVQFDVFVNDHANFRDVLVSALTLFRCTTGEGWQDIMYELRRTGPSPYTATAFFVVFLTLASYMLINLFVMVLIDTFDGVTTRASGMRDEHMSDFKECWGVLDPNASEMVHAYQVEALLRMLLPPLGVGPHEPLHTVLEVVDQLQLIAYDGKIEYHKTFLAILNVSFGDVMEAKTKNHAMVKADNDGLKRRATHNFIHGDKSGGIGSKLRVMTRRLSSEFGLLKGGMMNELALLKARPTSVKDEVAAFRLQTWARAITGNRKWLSLVQQAKANSPKRMPSTNLAAVFLAPVPDTVLLPPVQQSSPISDKLHSPHKLPPMRTKRIESEPSVQPVTGSTRQQPLRKPARAGSLPTSPSATDVVIDLDAVLHDFQKQGINLSTGGSTQSEESPVDIEHAMAMARLTGGSVX\n>SRR6266567_3171955\nTQPLLIGALSLSSTFRLGLRDLADLQKVAVRIAEEAADLTTPVDRRRQEDGPTGFERLIRCLAVWHTQRQLMADGIRIGRRGKRDGRLVPGGPTTSHQQQPVPLKREDAGRAPIVTVDRGSQHVSIELPRAVKFTDHQQVGEGNPFRGEASVRHASAPSVVRAALATKRHAASLWMISQVCYPSNVYGKDRRLKRSSFLHRTVYPTTNHILESSAFYPADDSKEKERHDKMSMKERTITEDQPGEKMADHEDVLAQAQPFGRMGRPEAIALLLHALSPRMKLASX\n>SRR5580704_9526292\nXMASHTGISSANRRIESDFPSVFGWECCKRAKPATDRMQAATLSAWVRMRFAFPLRLAMNLALLLGAALHCFGQRELFHEYGSSDGLANLNVKCLFQDRVGFLWVGTDNG
LFRYDGSTFRGYGHADGLTNTEILSLAESPNGTLWVGTNSGVAQASGERFVSVDGSEEGATR\n>SRR5215469_13096766\nTGFSALLSNGTFDFLYGRNPSVPIAQIDTGDSATSQLVIDPSSNVRGIVEVSSSAANPFLLDNYTDYDAYGNPISGSGGSVNAGGLTVDGKSGDADSASSYGFGGGYEDATSLVYLINRYLEPAIGAFASLDPALRTTGAPFAYATDSPPNRVDPHGLNTGGVCVGASAVDSITLGLLQFSTVFGQACLAETVNTPKTNNDVGFLLVSGVGKKGWGF\n>ERR1719424_287230\nWLKKAALSGAAIYIVAMAILGRWQGAVVAVAAFVLPLSAHSNAAAATAAEARLHLRGGEGVMAAGEAQGPMDVTLKSSTKPPPPPVPNPLGYGDLRAGGLGVLPTPTPMPPPPPPDPPIPPLGLPNMEEIGMDKLWEMDMPKGPVMVTGPSTTRAIGSTGVRPRRKRKRMTQPSTSLLVHMQKCLRRMKLLRRTGENDCVRPSCRSELISLHRLGRPGHERLLC\n>SRR3954454_10920512\nVSMIAMRPTWACAAVAGLVLPLLLAACSSDAAAAAAKEGCELVMSGNGIDESQLDALSTRAQNVTQAAGMLADAAAENPDYAELSGTAAAAAADLAAQLQFAEVNGFDPQGWSAEVLADYQREFPATRDDPYARLTSACAAQVTGX\n>SRR5947199_9062679\nRKKPVTWAFAASGCSRSAPNVVTMAPTSLCERDWSHRAENDKPAAHAVGVHPAAVLPGPSRRPGGDRRAARRRAVLRAVPAVLRPRHRPAVDPHRDLPADDVPEVPLPARLRTAVPGGGRLHRLAALLPCA\n>SRR3989338_3014829\nRRFGQAEGSSMILPPGQCIKSAIDFATLDFFVLLQELTKKSFTGYLTMMIRGVGGLEEGTLVYDGGKIVACTYEYLKYDNLLLGSDAFLRIVNASTAKKGIVDLYQLSSDQIKLVIAFNEKMVFVPNEKDLRNIKVTEFSPFLEDQIKEKVKTDRTEILKKLKMGEVANSGDGGKPDANADQPAETDSDM\n>RhiMetStandDraft_4_1073278.scaffolds.fasta_scaffold4497251_1\nMKIPLTFAFLIIPCFSCSAEITGYWNFNGSLKATIGENLEWAWEQGDATFGTTETFEIPGIQGNSANVLKIPDSDEFSDFSGIEVWIGDGLDEDSWLHNEYSIIVDILYPETSSAEIRAIVSNAPVEQASIIINGEGKIGGTSFHGEILANTWYRVGIVVSHASKKIMYYLDGQKVGHESIGGLVDGEGEHSLWDFFYLFTTSGLSKGGYISSLQFHNEALSDTVINDLGGTTKLDEPEDITLPGDEVMPTSDNSPGGERAPNAIDDNPSTKYLNFDKVDTGLTITTGGGVVTGLGLTSANDAPDRDPANFILSGSNDDGATFTEIASGEIPEFLERFERQTVSFDNDVAYTTYKLIFPEVVNPDGANSMQIAEIELLAGAPEAGGDEPDDNQEHHIDDMVLAPFGFRFGFSINTEEGESYTVEATGDLLQWNKIETINGTGSSVQFTDTRNEVFQYQYYRVRMAEX\n>SRR4051812_32645189\nTFNGSSTPQTFTITPTATGTITLTPTNSGGLTNPSPRTYLVTLQTATAYTVTGPTTGIVNTASTAFTVTPNGLFTGSITITPTPGFGLTPIVLNWNNTNAAESFTITPTAVGTVTLTPTNSDSLANPTAPTYVVTLPAATSYSLTGP\n>SRR5690625_3194486\nXMTMPQIVPTTSKNAMALIAGGGISMTSQEIAELVEKRHDNVKRTIETLAYQGVISRPQIEDGIKSANGVVPRHYRFTGEQGKRDSIIVVAQLSPEFTARLVDRWQELERIHSGPALPNFSNPAEAARAWAEQYEARIAAERTKAEIGSRREATAMATASAATRKAKRLEAELDQSMQYASVKRMEML
YHGQKFNWRHLKSTGTEMGIPSIDIFDANYGTVKAYHADVWREAYALDINQTEVAX\n>SRR6267142_3947303\nTQGKLEKPASEERSLHVITADRDYTEQEIAGNQSHESGYDQERDRTNLLKHPEQHREYEVQLDEQAEIPPCSIQIVENGFGRVKTIAGQAEQEAVVDRFTGPRKWRDEIYDVRSPVHRIQPQQPIPVPSGPSRWRINEVRERVGQAESAEQQKYADGMIPTLDCEYVDALEPALQHRENAVRX\n>ERR1700761_8280655\nRYVRTAACQSRSCASARRSKSEASLRRRDEQFLCIVRRSQTIRAAGEIAPGQIGRRDVPCVGDPSVASERHDLGWCEVTEERRAAGTRSLLRHLKPGADLGVRQLQREQERHGERRSGGKRGDFAERACVRLLAEVHAHAGGVYDGWLAVIKAGSHELVAP\n>SRR4029078_20332\nSAPRGWCCACSCWLWSWSWSSVMSAPGEGLAERVGFEPTDLSVSGFQDRRNRPLCHLSAGDSTAGGSESRCRCRRRARLPEQALEVEDRGVARRDEHDLDLVAQLLDVLVLEDLVRQRRRARLVGRGLGGRERDVRVGLALSLGDDLLGLDLPLGQDLLL\n>SRR2546423_8221276\nLRFNGVLKALYAPAAADCKAAAGGDSVRVFVHLSVIDLDIEKLSTDRSWWARLLPGDRFAKWVVNHVLSFAGAYIERHDARALSVWEKGGEKGLPLVPIGFPLCWGKTTDCGYVAKKSAPPGFKTATVALGKLGSITFASAGTAAPYLSASSRRFLC\n>GraSoiStandDraft_11_1057310.scaffolds.fasta_scaffold1002834_1\nMSSLDDELAEIESQTAYGVSAADYAQVTSNKRASPISTYRLASSSPTATNSPTSLNGGGGAGTATTSSGVAKVKASQLKSKSRGRRGSGFKPDDPAGEGGGAGSGAAGTNGAGGGDSAPVTKLPMSAYINPNMTPQQQAALQAMLERNPGLAKYAPPGAFSPLPGATPATQTTGGRGPPTSHRMGDMAPPPSIRMGGAAMPPSMKMGEPISRGADLTAGGQGQRGADLLVGWGQDLGEEEESDEDVYKPPVSKKMGQSAPPPTTRPGGAVSPRDAIGGQPLNPPELHESTQESLKNPTKPGADKEDDEEGGITYRPTVDAMARGGEAERIMRKQNEMYDLQMPAHRTYVGGFAAAAYETAREYHYIQKAEKAAEDNMVNKARIRDKRPPPSIX\n>ERR1039458_81816\nFAQVLVGGGNDAQVELDIFEAAETAEALIFEHAQELGLEHERDLADFVQEKGAFVGQFEDAALLLAGIREGAFFVAEQFAFEQGFRDGGAVDGDERFGLADALVVEGFGDEVLAGAVFAFEQDGGGFAGGHAAHEVERFAHCGRDGFDFEFLRGGLFGDVLGGGHRAFQAAFVIEHLGGAHDDQALHAVIGVQADGRMRRGGRLIETDEDAATGFADTAAKDVLAVAADHVLGGHTEEVFSSAVNSGYGEIRRIQDQRPDAADHHHDGEGRSEAGLGDDGHAGPSPEHCRLHLDRQFGHRRSRVHGPKEWAAAAPGGREPVGGGPPGGLTLGSFEAHPSLVNVRVTNRQLPSTFTRVSAYLPEWVT\n>ERR1719162_2616429\nGRELEQARQRCCDPHCGEGGHCPCAKDSPNPSAQPSAGDTDGSARADPGSCQERSTRSANSGASADSGACSSANLRQARWSMQFEVIDLTGAYCGPARGFEVVCVLPFCPKTKCKA\n>SRR6266571_5669770\nPTSSTAPRPTSATPTSRAPASTPSTTSTGRGSGSSSTRPPRFPDYDWGARSRNGPPIRLERSEWLDDAGYPPLHRPAAAADHGDRAHRLLDRLHRHPPAARERLPQRAQPQPLGGAGPGPPLRPRPALARPVPELADGRAARGPRRVAGQPRRQDHATVAARS\n>ERR1700722_2864867\
nVLERVARALEPLDAPLEQRDRRARIADRAVGASEALRELGLLDGVEPAGLDRLAEQRDRLRVVAFPEREAAEACERLGACGPGLLVRRERPFVEAPCGLGIVEAQRDVGVDERGVVLRAEEPGGEEVGADREPRSQLTQQLDRRDALAELEPGDVGGRACLAGELALAQPGALAGLPQALSDRGRVVDMLCLLFRHALY\n>SRR5437879_7003822\nSKREWPGGSVERLISAGEDLSHEMAPAAQKDVCHLLLGLDNRAQDSRQCWVQRDDLLELVEHDDHATLALHRELLRDREQLLDCQVLILWQRQRTELDSWSAVLANGELGLEWKGPKQVKGLRPCTGHRTAQPTVERGAELVDKALLAGRAEQVCVGDEHLPVLELLACVQRDRCLAVAPRX\n>SRR5918993_323855\nAPASSRPCGYWDANAACSAPGRRQEDAAPSCLERLTKAHGSTVLTKRRLSGKLFQLQAARPHRLEAKDIALSRRKPGFESRWGHSRKPASPGESLLTRGDRIGLVWWSGGAAKTISVQRSTSDVAKSDPQRWSIPTKKPIAQNSHPIRCSGRREAIRGPTVEKATVIAVACAQYWX\n>ETNmetMinimDraft_11_1059920.scaffolds.fasta_scaffold246889_1\nMSIKTINGTKPNINPDYIAPATDNFWDKLNAAAAFTVGGSVINNIAPNDYQIQNVDYVLSNLPDREQDENFFDDRWNRKKRGLIADIIPSINEYRKQNDLEELNYKAYRYLTDSDTVSEFEKRYNELDKLAFANRTMARNPASVLGLTVGLSMVEPWNLFAGPYALVGQATAGKAALRAGAATAAIAATEEAILYRNDPHRTPGMSLLNIGAAGVIGSTIGGIVGARKSNQKALIKDISARMKSIDDEQHVVLDVDNFYTGSSPDTINLNLASFEDILEATKSIPGVGKKTAQLIVKLRNSKPNKVFDSYADLLDDPDLTKAQKKQLEIALGHCTSPCRFHVNGMPYGGDEATIIGSYGLDKVAAITSPLARLLQSEFPEIRREAVSLLNTPFMLSDNLQGVATKKSLEEIIDGNRIHYTRLIDSLENNYFNYLNIKTAPNGSVRKHIAKTRAGRILRTPSNVVRNGLRGNFSKMGTPAGKMSFEEFKLAAVKHRTGAVVSLDKNVIAASKSIDNLFDSNADAVKKLMKSIYRGKEFTWIDSEPYTHRLWNKAVISSNKEGFISFLHEQLIKKYGSKEAVEEAIGDGMQHIDASIRRSVDKIVMSPEERIDLSNIFEPLKRGATHNRFWNFVDDSDLYNTDWAVHDIEAIANSYIMGPLADVSFYNTYKTLNPETVTLRIRKAAIDNARMRYRQEGIQLDDDVVLFEKHMESLDNSLSLLESMLKRVRGSYVDVWSPVPGGTIQGVLDNIKRYNNIRLGGAFGLRSAADVGRTVMFLGLKKAYGPLFESYIKRNRKAMMMYDQASAELAAINVGNEINSMSLVSAITNTNFNTPYSDKFTQLMSKANSSMFVFNGLVLWNQSMKRNAGIGVMNEIITSAKAATLGKLDSKKASNLAKLGLEREDLYEIAKEFKAHGASYRGVHLMNFENWNADSTIADKLARAVKKEVDTIIVTPGIGDTPLLMENSFVSMMMQYRSFPMAAMLRQTIPLAQNMNRNALSGLLISVVTGMAARQYINFANDKDGPDDLDELLYQGLEDTGTLSTIGEFANYGQMIYNRNPFFLGPTVTGAGDMYKVGSSLISGEEMNQYEINAASRLVPYDGLKKLVTAIVPEIGEX\n>ERR1711988_1839548\nKSAEKQKIAARVKRRVDEKVAEAKESFQKKADKEIAKDRADEAEEVSELKEKAKAGNVGKKVKDVNDHLEAKASDKDKIDAALKSKTAANVTQVYVKANSTLHQQEEQQKTDVSQIDSQIKDLEAKKGKSQDPVEQHKIDSQIKELHAKGGNMPADYFHKTGPASK\n>SRR6266542_965261\nNNRI
FLPYKPKNGLFHSDFSVHSITSTKEISIALAKKAQDDIVSYKNMEEDLKWIVHTKCKTHGSSCGGSLSQKITSGIFTINEKKVEKFAENYFSYLDEEPREILKSSLISLFDTEGYSWTHKYIDISCEESDVNKSITGDFFFMYAEEGSGEKHKVFIGLAQLTKRPATNYYFLKDYYKGNEDRVEQALKHMLYKDVKSKGLITNX\n>SRR4051812_43011536\nLNEFKSARDSVYHQMVTPERPLPERAAAMGASLDEYFSYRGLALSCGFSLAGLEKLDRMESWRTGARLTGGHQPQILRDIFGNPFRPVSFDTAWRTPSVLAVAQVIYEERRFGELPILADALEEAGAVDEQLLAHFRQQGQVHVRGCWALDLVLERRX\n>ERR1719272_2699062\nRRHAGGCWVVWIYAARMLHEVVKERVHLLLDGGRLVNGHVALGIFGERDAPRPRHTIFFAEVPKNGALYRHSPPRLNHARRGAGERLEHIHEVIAAERVRLDGGERHRLRVVDQVHVLHNHVLAPNLAGAKEAPHLDHEAAAQDVQLAHGQPLLGNEAAHHELLCELCDEVRAALDLLDVPEEPDVVKPLLVGHHRDGALEX\n>SRR4051812_6490251\nEGGIDLSDTGWGTPNQLAGAAPNTLSGGGGDASTDAAPGDPLGVPPPTEADSNAEPQPPTAPARAAKKRLNWRSGFVQLAVIGAIAGGALVFRDRLTGNATDLRVGDCFDEPAGVVTEVKDVQHHPCIEPHDGEVFFVGKHPDSGSFPGRPALEAWAGEQCVPAFATYVGQAYDVNRELDFAGFVPVQDGWNSGDHEVVCYIVRVDHAKLTKSVKAAGX\n>SRR5690242_7610662\nLNHWNYPDTEFTAQYTQQTRHRIGPYTEQPFHYCFLLGPTNSCGVLLDEPRQNKKIADFVFLATATDALDKLHGELVDQEIPLTGLDGVGCPTHYLSFGLNTIEFPLLAVQHVLSMHMARRILESWTAEQDYQRLGLPREAEEMFRVAEVGAR\n>SRR5207248_4090244\nFSCLCILYLFHNPPPPDIYTLSLHDALPISFRTIYRPSENISHTVGVIADIVTLCDASDDFVSDAMVSEFTPIRNSRHSVGQRRDVAVGNEKSADVLLNCLRESTNRCCNDRHTSDDGLESDESKRLCPERWRNECPGX\n>SRR5260370_35461453\nGGAGWEERRGQLGGGGAEVGGPVTRVREQQRRRGPTPYLDAGLAAFRQDSTAHARAGQRTMAQPLLNPLSERERDVLQLLARGDSNPEIAEVLVLSVDTVKRHVYNIFSKLGVKNRVQAVTRARALGLLSEETCFLFGLVVSTASFLTNGSVMRNNGTLAAAWARAQALPIEGSFTITFFYAIASTKYCDWIKMALX\n>SRR5438128_2108134\nRRYPVPAAQRAIPAIRRPLSAIRRSQYATLSFQSCGAGPQVRKEFHRTFATVPFVQPTVFRTRIEQVWGAWEKLADNDLRQRVAALREERRRLKDKQTDLETRGQTLNAADQRRLDESNFELDVSDFEAELRDYERQPWLNVQDPVLRNRQQLAHYYRVVGQFV\n>SRR5450755_1345668\nGTRCLGGRLEQHDSFGHLTAQITLAACQLALEFVAPAGEGVGPRLDRVLPAPGPVELDLGLPAHPVEVGVDWPQLGLAPLPLPGSAVADNRADDLVPVPEHVGGNRDGVPDAPLGRKSPTVDGRGGVLDHDPLRRPARAAVLRGSPSGELRADGACGHHCESIQNRRSGKHPGVKTFPRSSGIQLHITSLPGARLGPEAYRFLDWLASAGQSWWQVLPLGPPDRHRSPYKSSSAFAAWRGLLAQPRARVSASEIAEFRERQRFWIGDWERFSGAGAVADQVRFEREWTALRRYGAERGVRLMGDVAIYVSPGSADHVAHPELFQRGFVAGAPPDAYAVEGQLWGNPLYYWPALRRSRYRWWVERLRRTLECFDLARID
HFRGFTAYWAIPDGAANAIGGSWRRGPGRAPFDAAVRELGRSLPLVAEDLGVITPAVHRLRDSLHLPGMAVLQFGLDPEERRSPHRLENQVERQVVYMGTHDQDTARGWYESLAPARRAAVDSQLQRHGVAERQPWWALTRLALSSPARLAIAQAQDVLGLGSAARMNDPSRAGGNWRWQMEPGALTPALARRLRELTGAADRRDGRSPGQAWSERTSTELPAPVGIGRVVAQTSPPRRLELDQRRWSRRRGQAVALERRQRSLRDRDLAQRRRMHAISHHQVARAQLAQIHDQPTELVRDALDRITQLVHLGPGAGTAELQRRREGQQPVAALAQKSRGGAEARLESGYVPLGRPNVVDSDVQASKLVTCARVGGAPLERGDLGPHDIAYVCAVDRVSGKRQSERARHPQCPRLKRHAPLQLAPAVGDRIAEREQAEAASVVGIFVGGHGRRAX\n>SRR4030095_10399445\nSALSAPVTTQHRGSNSAARVSCLVTRHHDVCGRRSCVHNPRAALISVIRHSQSLRSRARHRNGGVRTSLSLTRSGQVVEDGSELRFGPLAGFLCGFKGGTTFHRIGNRFDLQALSDAFEVGNAGAFHGKRLPARRHWTVVTHKPVRALFQGVVCKITLPFDDRCAFLHLRRWSSEQGFFNLGRILRLSEGTERKCHHNNQGHESHGMTSTRSSIRFNPPIPRLISCFEISAVVNSPEMRNVLLILLLLLLASIAALPQTAGDPTTEERLRPPRAGDWLSYRRTDDVFGFSPLTQINRANVKNLRAVWSYPVQDDSRWVPTPIVANGIMYVAEGKGRVLAFDVPTGEIKWIHTRSYPEDIRASQAYLRARGVAVYDDKLYWGTAESYLVALDARTGKQVWQVKTADYKKGVGHAHPPMIVDGKVI\n>SRR5256885_12855722\nRSSSSNSLILYIYSTASLFFFFFLMIRRPPRSTLFPYTTLFRSLGLRRGGDQDRGDLAGGRALVGYERRGIAAHRDDPQEHRWRSEEHTSELQSPCNLVCRLLLEKKKKNNTMLDGHTSRTTVCCH\n>SRR5262245_11139375\nECIRLLNYPAVECSRQAVSTGKHIERTQRFQLASKVRELSICFLDRYANCPAKASVEFVEARLPVTHLVERRTECAPFDNCFKPLLGHFDSPRHPLAHSTLAIAKERQQLGTIGGQISHRMAWRQGPVVGDHVGDRKVGLVADSADYRNARGKNGVGDDLLVERPEVFEAPAAAANDHGVEPKSRSQLQPIQAMNGVGNFRSRAFALHSYWDDQDAGDGPASAQX\n>ERR1711871_676384\nVHGGFSEIAKVPHHPEHTATTSAVPLVTETQLPLPQTIFVVDPVVVRRAEEDKSTEEEKDVFLSDADQKEAADAIRKWMKMLRKNRRAGRHKRLRELERMRRMRLQRLKAARLQMKRKMQADFGGYDPGLEKRSSQEKDEAMTP\n>SRR6266852_8977469\nKRSQVKFKDHKEKLHIIFFFSSRRRHTRCYRDWSSDVCSSDLGAWLRRRRRHHRRAGVAKRLLQKDQGVRVRSEERRVGKECRSRWSPHQSKKKEAVSGTLRVQSVHESCYRYGSASRCLL\n>SRR5262249_17805584\nTGPGTPRATGAALPGAGPPHPDAARGPGRGGPGLERLPAPCACVPGAADNAGHGGGAHGPWLDEARPAVVAGAAISFGTTEAAWASFTGAAASDCTVVRTVTTVHCGATHCFFNTAFPDLTSQRPRCDIYGPAHDVKGVSRRGTRVRTDAVIYPTSQ\n>SRR5262249_30216735\nLRNGSTRNIALLTLLIAEAGAFAASGATGCSSGETTSSAEPDASPSVPPPPPLENGQTAAPHTPTAHSPRTPTHDPATDAGVTPGKANVVFVLADDFSMNLLDYMPHVQDMMKNGLTFSHYYVTDSLCCPSRTSIFTGKFPHESHVYTNGGDAGGFATF\n>SRR6266540_3007965\nA
SDGIHRNIRRMRGAGANTSLKTHCMRHPGSRPPAYLLLYSLKYRLFKRTGFRELFTNTKQMLIGADEDSSVGNRGRGQATFIQQVFLQQSELSPGFQHKGFPGFVQKEDFPITPNGGCGKNTSNPFLPDHFARIGIRANYNAVFSSHVNELSVTKKRRDIRSTGGDAPCYVGLGDVSLPSRSNRHVGTTAISSACVEHSVDINRHGNRHWAE\n>ERR1712159_79709\nPVTKRPTANYSQTCFTPQMSSATWEINYEPIQGANCMWMIMCTCLTGFVIGHWVMTYVKGGLNDFRNQLLCGFPISFVNTALLDDPESVPKWPVVTWKKALEKFYLFVVVIIVIFGEAALPTHQVFPEWLYVDIWCTGGAQIFWVILPRSAFLGFMEHMHHACEITLPYTHGAVWFTVFLTVLGAGIASTINTSFSGEYNRDLEYW\n>SRR5215468_965392\nNDPLILAALRQHYQRYARFLTGLIQGAQRAGQVRKDVMAAGMAWQLIHSAIGFAFIKPLQIPGHATPAAVEQAIGLLLEQLSSLKPALPTNGRVAVRRARPPRRTIHHKPARRSKX\n>GraSoiStandDraft_49_1057285.scaffolds.fasta_scaffold1147020_1\nMTKKWKLSLLRILLLASPVYAASVAGGATLDIDTGDPLSCPPSNSFWWSNERGSAFYSYCTDPRDEGACDGKGQNGETTGNASTGCCGASAEKGKEECDTCRDPEAGGGSGTNGEDPADSSTEAGRKIDKDQSCQDCPEAGMPLWSVEEPLLSVRLVDVPMWYKPAFGPKMALKLHYKSLEGSFGHADTRQANVFGFGPGWSTPWRSYIRAKAGSSPAEVWVFDGVGNVRSYFVGSPGGNAPYYHKKTGAFVETDTVGYVLTHNNGAKDFYAEEVENNSNGAGNGEKIYFLSRREDAVGRGLTFNYSTTTSGGFDQMRLANIVDAAGLSTTFTYTNVGPMNSLIHKVTNPHGFAAMMLYDANGRLETIVDTISLTSKFVYDGTDRITSVKTPYGTNRFEYVSLSDTNCLAVRVIEKEVRKHLFVFGDLPVDPWPNVADVITSLNNYMDMATNVLATTDFFYKLLDDLKGRNPAAFTNHPSARCSAYWGPLQYQNLTNTIDSSLNNSTFAINSVTTNSYNLAHVTRWRAAWGGFISNIKSFERLPGAAINGSEVGPFVFYAYDMGATHEAGTKEGFDNLPAQIFRETMLTDPTDSNLRVWDATQIEYYGLGTVRPGYVKKKMVLERNDFPEPALGIPQFCFRIHRPIRPLTGCSGSGCNRYASGVIQDENEFTCMGVSSYSTNWLASLSGTDGRYIEIIAFPWDPSTGAGIGGPGGAPIHYEYHGTNKELTKVTYEGIVEKIRAFNAAGQLQSEMFQQTTGGVTVTLWTNSWTYLNGFVRTNINPRGLAISYDTDPMGRVTKIGFPDSTYVSNRYDRLDLVETIDRNGFSTRYVYDAFRKLLYTTNAMTNVVSSSYCNCGSLSSVTDGNGQVTSYTYDNRGRKTQVTFPGGSWVATKFDAWSHPTNLTTSGGIEQGILYNLKGQVREKWLKSG\n>ERR1044072_1391978\nRNWCCSALAVPKHSQHPKEAAELAAWLTAPEQQIKAFQKTGNFPSQVEALSSPELLGTTNDYFGDVKTGELFAAQAQKVGQAQYKGPGDGQIQENATSPALQAVEQGKSPEDGWQQAVEARWCGARAPPRAAEAGERTPAGPGAGAGGAGRRAARRAPPPPRKPRL\n>SRR4051794_8328619\nXMSHPPIPPILASVIACIAAAVPARGRATFLDLLLGAAATKSGHVTDAILASGLSRGWSTYYWFLEQGRWSWLRVWAALLEVLTMLFRPAVWYAVIDDSVVERVSTEAPGALTHHNHNAKPNRPKFLRGQGWLCLAAVIERNDFAVGAVPLLLRLVRRGTNRGKLRSAGLLLHLLGQRLGHVRLLLDAWFMRAWLIHRALAAGHIVIGCVRRD
LALFDVPKPPRKRRQGRPLKYGPRLTPGCGIAGAPQRPDPLRQAGSRALSHLPGCCAVPARAGGAGGVGGTGASRPARQTVPAAIADLHRPGAVRTAGDQRICQEMGGGVAVQEPQARLWPEGCLAAVASGADALGHRTGGRICDPADAGLHRPGAPGRPGPARPLACARHPHRRANPGRHRPHFTRGRAGGLHRGDLGKNRRRGIKHKRIVSAARRQSRVSHPTPPSSFRSCGANPAPRRRNVAWKLQICKTTSGSENRRDRPQGRNAPRIRPELQFNEPADLGQAETPEFPRFRPSCCRAAITGWRADTAADDTRRRDVDRGRPDLDDALYAGIDPARPSLRDDRGRDPHDDHRLFVRVRAGAAPLRPAVGPLRPAPGRARLPRALCR\n>SRR6184192_2552679\nLQAAVPEYWYRRRQSDLRSRDLLWEWTAIETTPDCTSQNYWAVDFAFRVTGNTRPTAILSIPCRKHLGDFYQTTLTKEDYVAGGRASVARVKRYRHRVVAIRGEWAHIETRSRIAKSQLENKANESIPLGFGYCPTRAVX\n>SRR5512141_912622\nXMIGSRPGCGATPILMVGQPPRAVAAGSQRPNVYRRIELINHYGRGFHEADNEQRDYKQGLMGSSPEPVVAAWIYKLRGCGRSLPRNSRFYFTEKGWREIGRMVVSACRKSGQEYRVIAIKETDAQVVWRDKHTGYEVAVQPARRRAX\n>APWor3302396189_1045246.scaffolds.fasta_scaffold344749_1\nADPTTISLPTLTWDINVNMPANETLTIRFRGITTAAPGGSSVNDSTATGTLGTLTYSASDKATVDISGLQITKTSNATGPLNPGDDIHYTIDVTNIGSIGQNNIIIRDPQPAGTHYLDDTTLVTGYTLVSGDYLDEFGAASYSNDDGSETWSTPWTEGGLESGNDPNNGRIVIIGGRLRFHDTTATGADYWLQRNVDLTGVTTATLTLSYEEAGTLEASDRVRVQVSGDNGASWTNALDINNDFGGPTNLSWDVPIPSVGNTNTVIRILVNNYQEAGVEYLYIDDVRIALTKPGAAIKDNAAGGNPDLLNGDPEQLVLAGDGFMLAPGATMRVEYDVSVNNPLLTPGLTDITNVAYASSVEEPVEISATREDPLNFIDVSLDKQINDDTPLVNDTVTFTLRVSNAMGSQTATNLTVTDIVPVGYTYVVGSILGGDTNNGDDPTGTGLTWTINSLSAGNFVDLTYQATVNLTGPYENYAEITAYAQYDLDSIPGNGQQTPDEDDDDTVTVVPEATPDLTLDKVYVDYTDNDTSGDITAGDDLNYTVTMTNTGNTTLTNVVVSDPELIPTSQTCASVAPLGTCVLTGSYTVIQSDVDAGEFENTATVTDDNICTTTPGPECEDTETVPIPQA\n>SRR5262249_48298838\nMDVKSERSSARDRQQSEPCESGTEVTRSRTGRPEASSDRAASSSHRRSERGIDPAKPRTDDRDVARDRSVRRIPDQRTGPAIASRVPAMLTPEEVALLLRTSKKAVYAMVERGQLPGIVRLGRRVLVREEALVDWLRQKSLTPSSERX\n>ERR1700737_2044360\nHRGPGVSQKCGHFAGKHVIPAGEMVQKINAAVDARHDGDLQIVARTDARAIEGLEAAIARAHAYVEAGADVTFVEAPLNFAEMQRIAREIAVPQIANMVFGGLTPPLRQTELATLGFGGVLYANAALQAALKAVSDVMQALRRDGSLDAVAEQLAGFEERQRMVGKAHYDELELRYQSAGPRRSRSAPRLSPFGRSCPLGSQPRAGAVSRQAWVCKRAVT\n>SRR5580704_900937\nPRDRHLFGAYVRKNITSTGTAVNQGARLDKQFPLVSMTRPPSDPLERDKIGKQVWTGIGLLFVMSLSDRDRSLWANPPTRPEESPEHLRLLHAFDDFLLCQFAEWGWRLLMSAEVLHRISEWEKHDPVLLERLGKELGLRSKVLRGEKC
APLGKNIHKFADPTIKELKILLRRQQLDFGSKRKAVSCEKIALRIRSEVAAHPTKFPLLSANLEQLCGFIHNLPKNHQRAAQKFERGDLRENSFFYLWYASCSNRSVKDVRNQISRSRGAHRSSX\n>SRR5947207_3184146\nNDKKEPRSGGAEVKAFRLTLSCSSAPLPLCPLLLSLVTCHFRIGASSHREWSSVIGAICFPNLNRPGEDLMSHLPFRSLAATHCLRKLWRCARTAATLATVCALLLAAAPRTAAQTFRGTILGTVTDPQGAVVAGATVTAKNLDTGVERSTVTDDAGNYSLPELPIGRYEVKVQATGFQVYLITNVRVEVAGERRVDPELSLGGSDTVTITANAVQVETTANTLGGTISGSAVVDLPINGRQFTKFQ\n>SRR3954471_2680322\nLAHHRRGVVQPDVHPTGPGHHRVEVVEGTAARANFEVVGVEDAASRTARPGDAQGGGLARLRQGRVHRVGAALGDRLDVRWREHAELLEVPAVVVVDPGGAHDVEGVAVLDRLAAVADGHGGAAGGTGQAVGVVEAEVVPHLVRRDLHGEGAVDPGVRAGHVAHPTPVAV\n>SRR5580698_10972885\nSGRPSPSTRTTWSITPTGTRATSSGPAGSCRAARTRWSRNTEVTAQQSLGRSAPARCRCRCRCRPATTGAGGQRRGSPSRRAGRAAPARPPCTRRTLLAACSPQYPGRAGLGEADCLVVGHAAAALVGVVEGILAELFPGGRADTGRVEAAVVDRAADRVG\n>ERR1700674_1031357\nVWRGWWVSVAGAPRRRVAGGRLDDERQGGSACREVDAEPLHGAGAQVVGGEVRDAVLLGPCRAPLGQVVLRRGLGGIACHLDGRTLPPVLGQPRAALERQARVGEGVALDRRGPDDGVAGPGAELALETPHGLPERRLDLPDLLAEDVGQRREVAPPRPGQRGVDPFPAVPHALPLLVVLAGKQQGEAGGTFGGGPEAGARHLPTPPPAAR\n>ERR1712151_647775\nPLPSRCRGSLQQIARERAGLTSLHLRVFFARSRERLRSLALSFLARVGLPPRAFTFAVSAPWLLLRRLFWTSFSLSRLSSLSFTLRFRFTFSFDRSSLVRSSSRFFLSLSFSFARSFPFSFSFSLR\n>SRR5258706_534337\nWGSRAPAHRHGKRARLVPTRTFGSVRAEVAVTPARGSQHSPFSLEGVSMSMDASETLERSVLESKDREQLLAIASALGAKAGSRTKKADIIDKILEQTGSGAPASNGKTPEARASDGPRTSDGPRTSGGPRTSDGPPGDAAPAAGGARAGGGTPGGAPPGGGGENVRASPAGAPGGPGSRRPRRPRPRGDDAFVGGKKPRQYGLRRGDHVTGACRPAGRN\n>SRR5215471_3001876\nXMVPENASPTRVRSNVVPGGAFMLNIGPAATSTQLAGTSAALAIPKLNTAASRLPVTRRIASSSENSRAKKLVLWAASGNGRRRVAIFRRGRDAADQQDAGNDSRGDDREGGRGREGQPLVGGVSVGQDREGIEIERPQHQRRRKLLHHIDEDKKRRGKHARTDQRQIDSHQRIPGTARQQFRSAANRRRHPLET\n>SRR6266702_5134999\nXMSCCSNPFTLFPLNTMVIRKTIGEVSSLLFQFTCKCDILNTDDAYYQPHPAETALARVFLHAILIDTGNSASSEAPPYPYNRGLIETIMHEKSLITLEYPKILEKVAKEAAFSASKELILNLEPTPNLEEARRRLAYTTEAYQLIEQYADTGIRGARDIRPILTRAAREGILSPGELLEVLATAQSAMYVAKLLERPDPENFPLLHKWVTDIPRRPQIIRRIEETISAEGEVLETASPTLHRLRANIRAANQRLQERLRRLVNEFGPSLQEPIVTIRNDRYVIPVRRSEERRVGKECRSR\n>SRR6266480_5337023\nYGFEELGALVVRRHGIGGLPQDAILVRVGKSRVREQRV
EVLPLRVIGVHQVRLVQHGVRSALLEQQRHTGLGKPCGAPFDGEQRVREPAIPIDVEGRVAIETPAIVQCAVDVSDANLAAVIAGALFYFHKVVDAFEAAEVGPGREVTTRVDSELTVTITQANGGGSRLCITVDV\n>SRR5580658_3392266\nDRVALPSRRTVQAPHWARPQPNFGPLKPTTSRRTYSSGVSGAAVTSCLRPLRCRVVLVLTGRMIRPECAEGNRVKRTLLLATLGALALGAAALAAPAITTLPTGWKILGSDGPVATVGTLPEGLALARDGSRVFELEGGHRKPTLRVLDAATLHELRTVALNGAYGVPLRDPDGDGVWVNVAGTFQEQLAHVDTESGTVDRDVSLPLPFFPVALARSPDGNLLAVAGDLGGRLAFVDPRAERVVAIERVGLHPAAVAFSADGTAVFVAERGERYVDVVPVPGSGPATPADPDAPRPFSVAMRIPVGLHPDALVL\n>SRR5437879_9218440\nPRGSKAYSLKNVMRATSSPGAQTPKSPQASFGPSLSPGLNPSPPTFTDRISGHGRGRTATPAFWRIPRMGPAHPPVGGPARSVSPGIFWLRQGDFGSGLLLVVTRICDPVRAMARGSFEPPVRIPPAVDPRSLGRHGLARLRAERALVVRYADEYRRLEPRLGHIGAISTLVRRHTKEYGRMVTASAAGAPEQPGFVRRRLSA\n>SRR5438105_2884871\nAATRRTTTCGPRPWAGSSRPRGEMPSRNTRSPRRKDHSMSDKQQYAVPQHYHALDTSELAALRTALAKAERTAAGTGPWVDRTRAEQDVKIIQRQLHSAETAARSELELQRLNAPRPSETPAGNQAAGQQYVVPEPYFAEQQDYDQPSSS\n>SRR4029453_17137562\nPPPRRPVLARRRPGVRPRVGCRGRQRLARRPPGHLGLRQWLVRGALGRRAGDDRRDLAAPAPGLGGGGAVDRGPRRLPGRPRPRSPPATGPAARPAARGHADAAVRPRAPPGLGSARGADHRRNGHRVVGVRPPGRRPGRHRGHGAEPRVALGRAGHPAGGRRDRRLCRRLHLRQADPQRPAGGLRLAPELRVGPLVDDDRGSVARRRRRRRPGPAAGAEGGPVRRAAVILGVLVVMLVLAEVGARALAPYLPEPSLWTDDTTEGKVEQLDALAPGPGCVDVVFAGNSMTRDGLVPDTFTEADPEGRTTYNAALDAATPALLERWVLQEVDDRVDPDGVVLGLSSFDLNDEAKIGQSALDAYDDAPLX\n>ERR1700733_14753379\nNGLLELTPYNTPSISMSNIIEEKDNRIHTEEESQADYTPELRPTIRTDNQTIDLEISKHSTVLRPLHNLSHRLIHNRLKGPTGVELPAIIVEDSDIWKRTVGGNWDCVX\n>SRR3972149_5498235\nEPRGREHVGQHDVVFVEDGGRVIVEILDAADLRRQVEADVHPLQRPLGLAPLAQVSLEELHRRVRLQIGVALGEVVNDPDLMSPLQQPAHHGAADEPGASGYQYHAPPPLPKTRSSTLAARARSSSQTPQQSTRIGRGPEVFSRSRNDRSRKARWLVASTTTSASRTAVFRSGVSWKGSLTATRAPSAFSSSARRTAGDCRVSSISALNPIPSTATLAPTRLWERSSRRRS\n>ERR1700722_8398492\nHAPIGRGSHNRSALNGSRAVSGGAVVMERACPRVSPDECGSGNLCDRLHDLRADARSKSHLAHFVVSPIERHPQQRITPFVGVRRIQVHEVLPVGKMLRSHIHTWTDSVPMLNCSFFPGRAPVARSFPHGHSSEGSNWTFAGSGATQKSSSAYYFFRNLMVEISLKIGDAIAHRARSHKEIQPFLEDQHTGPSAGDLVGQVLAQRSLGRDWIVGFADTREK\n>ERR1719253_1353614\nRSLLRKSALSHKLHNHMLGTRIFQDQSLHWDHAPLGLSLVSFLPCGWCRALAESVLETARHSLQVLHAARAWSTTTLWLGSP
LVGSDLSCRVAATCASLLLVVEGPLAATEAKPVSLGVPLSHAWSTVTHGCRCAENCQMLPANEMEP\n>SRR5206468_5774351\nGCSGYDGEILTEPFPAAVVLTDVPNTPRMHLSRVIVTFAVGFVPVASPSQYRKTQPLAEVAVIVTTELLRYGPDGGAIVKVPPPAASRESEYVGTKRAVTCSFRSIVTLTVRFVPVASPAHPSNTQPAAGLALSVTTVLLE\n>SRR5690625_4794838\nXMESVHAPIRSCTHQANGTSAQVGHIGSRTDQYTAVSHLLGHYLRGPLTIISATYSRRSVRYFRRSVTRSPPSVDCLPAFGGAAEAQHARSVAGRPHIDLFADTPLEFADMADDADESPSGAQRAELVHNRIQALGIQGAKSLIDEERAQAYSAARAGDHIGQSQCQAQRGVKSFAAGQCARLTLTPGDVIEYPKSQTGAPAAAGLDFFAADQAQPAGRHFREPRVSRLDNVFEASQQHIX\n>ERR1719284_851324\nRTVAYPVLSERCTASIHSWDSKKGLTSKDLLENSLLSTTQVRLMGKSPNKVKQQEKAAHAKNKVISVLSNKLRGACKMGGKLETNPKKNYNLAKVIAEVEKAGMN\n>SRR5579875_2658053\nWDAVLRKPRPHPGRASADDPRTRPQRQADRSRSRRARPLEDPHPARLQECQVGESNRGGEHVLAPLFRKGRILGRQRLQLVRRDLIRRLLFPAFFIGAVIGIASAAEPAHFSYIPPPPGKMVESRLVALSGAGTQGRWRAVLSRKVVGREGDQRFYQWYLTIYAPNAAGDYVQKYRAPGNGTSSLLTVVEKARGANLWFPVQTVKIVGSAELMQPGVQQLVVAVHESGADCGAATVTILRYDQASGKIAPAVSVRNGCRLDAGIVRTSSGDALRLKARITALRPLCAVRPSPRPARSSGTVPAGGSRARRIMKCRSGRTRSAGNAGYIRNTPKLVREGGAHEATSRPMPRTX\n>SRR5215469_13482869\nLGGHRVLAGPGAWRADGSIGVWDSSGCGCAYSAILHLRLSYVDSKFGTDVYGPRLDEFDALGARLLGWRDNGDAVVDRDQPGGHFAPAAATYPLDGQAELVALSPGGGAQRLVSLPGGTNRVEVAARLLDRFGGASPSIGYRLADWLRTHLDDLVGLVALTAVVVAIVLLRRRFRRRPVTX\n>SRR3954453_2381136\nRRHDHHEPDRPDPDHPAAPRGLRRRDLRGRPGRRAGGHRQLPGGLHGLPAVPAVLHHPVVGDQPGRLLLGAQGALRGGRPVRPERQLRPVQQGRLRRLRRRHPHPDPLHEQHPVRRPDRQLAGWRGAGLAARPDRGRRPLLPLLRRGAPQRPGGCLGARRTRRPRHGPGAAPDRQGAGVKYDPAVEKSPLPYSPFKSCTVPRPIGWLSSVSPDGVENLAPYSQWQTLTFDPPMVMFSANQYPDGRRKDTVLNAEQTGWFVWNMATWDLREAVNISAMALPFAESEFDRAGISKRYADLSATPMVRESPVHFECRYLSTHRLAGHSAVGTIDVVYAAVERI\n>SRR5436853_886914\nGSSPRISLWEHGSDPEEMEELPLQSPHLGPSPRISLWKRGSGLREMKALRLSQAAGASVVDVDAFLRCVYALQEETDPPRPVGSHGRELQWPLGLVQGHRPRPNDWGRKGRADPPWLHTCGLX\n>SRR2546423_1658942\nAAWDADVVVKVAPTSEEEVGRLTGDSVLIGFLSHLTNAAGVRALAAGGATAFALEAVPRISRAQSMDALSSQSNVAGYRAALMGATLLGRYYPLLVTPAGTIRPAQALVLGAGVPGRRGGRQLRALRAGRDRGQARRDDRGAAEPGQRHGRGRLPDVRAQHPVAARAHDRRGRRAEARLRRRDHRRRLRHARRRDRARGRQAGRGSGRLMLVTNLAILVLAGFVGFVVISKVPNTLHTPLMSGTNAIHGIVILGGLLVLGLSGSGTLN
KVLLVIAITFGTINVVGGFLVTDRMLEMFKGRKPARQEEIEEAQDEEEKKAAX\n>SRR6185295_6827403\nXSGTYVVQDYDLAMKFIVSARGLTSGWTAHTTFTDGNATAQGTVVSAAAGNPPISGATVQCIAGCNNISITTTNGTGSYSLTFQFGGNGPTSITLQASAPGFTSQSITLTNVTKGQTRTNVNFVLTPTFRNTSTTVSCTPNPTVVGGGVSCTSTVS\n>ERR1719499_497600\nMWSSLPTELTDTVDGLASDLTAFGFNDLESLTDYDSMLETTWQNVQDNSGIDVSDIEGQMNSLIGDFEDYLTGGTDMTLDTIIADIDDAMTAVSAELEENVDNEQLVELYQNLEIVDWGVTTWNQFASETELLTDFTGNLDIVLQSIQFTSEFGDVLTYDWLDNFMTSLNDILRVDGNQYSVCDEEYIKDQVWNLYDAEYDWYTARSEYMTNCYTTNFADTWTNSLASLMSGDLSGAFTPDCSCWEDLWNDQDLVSTMNCVMDAGDSITVEGQIAECNGVIMDTVDEVSLITGALETFEELANDLTSLETD\n>SRR5574343_384457\nYLKTSKSSIYYYIKSILFYFILFYLHIKNLFIILYLYLEINLIGDNMESLTIKDLKHGKAFASDMLRENFNNYNDTDIIINFAYTDYGGTFFDNVCIEYFVQNYPNNIVQENTSWNGKNAILFGNNLVQNFIEQFENYPLGFEVLEDFYYEKESELLESDFIEFIKNNFSTDEYSYNEIDLLNFIIDNCSYNLTSNSVDYNENGLIEYIIQHYKRLNKIX\n>SRR6185503_2167616\nRVESATGCGTAWLMASRLDSYERDEVAEPAIGEQPAEARIRREPVAQRRGKRIGVYRPQRIGGQSPDLPSEGAELPAERCDTHAIDAVMTPVVIALPLLAEHLMAEASRIRRVDEQHGARPGDGAQRVDHLEGLVKMFEHGPHDDGAK\n>SRR6266567_1659920\nLYRCGASACSEHTFHPAIYKNYAHSIERELTILCYERVDRKLQSDLSTVHPPLQCCSRLFTHCNEKSPTKLEIPSSSCTPAPGSSPIATPVLLPPHGKPLRLALCERRFNPMKKERPFSWIHTIRAALFQSPGEIYQWPLATIINQRLNDT\n>SRR6187431_3469506\nCFILYLLSDFELRAVCVRPLLFFFFFLMIRRPPRSTQQSTPFPYTTLFRSPPPSAPVARHARPLVFCAARARSSSARGDRKSTRLNSSHGLLSRMPSSAXX\n>SRR5574338_764212\nDTGEPPADIRRETSRDTTGVVWYASTSPVKVQTASKKEDSDLDDNHKITISGLSSGTKYYFIIVGKDNDGDTATSTERSFTTDQVNDTTAPTISNISITVGTTTANISWKTNESSTGF\n>SRR5690606_34928301\nVDLTRFYGADANTLQTVYPVEVSEQIGQTVIIQIVPITARMNTCQHNFLIACSDELPRLLQHAFRITASGQPSRPRNNTKCTKIVTSFLNFQKGTCPFGKIGHVKLLEFPRLHNVAHSIDRLTLALQISDVIEQFVPX\n>ERR1719424_1028065\nRFAALSSPTNTALPRRRRRRRVEAIMWRTRARAAVRMPGVLRSSRRPLSNEISATSYAAALATRKDATMGRELISTEDTSIKNFTLNFGPQHPAAHGVLRLVLELQGELVARADPHIGLLHRGTEKLIEYKNYQQALPYFDRLDYVSMMAQEHTYSMAVEKLVNCDVPRRAQVIRTLFLEITRILNHLLAVSCHALDVGATTPFFTGFEEREKLMEFYERVSGARMHAAYIRPGGVHVDMPVGMAEDIYTFCEQFPSRLDEMEELLTGSRIWKGRLVDIGTVTAQEALDWGFTGVMLRGSGVPWDLRRAQPYEIYPEVEFDVPVGTSGDCYDRYLIRVEEMRQSIRIMVQCLNLLEPGCIKADDRKLCPPSRAEMKDDMESLIHHFKLYSEVRPPASTA
PRPHLGRTSAAPRLHLGCTSAAPRLHLGRTSAAPRPHLNCISPRLHLGCTSATPPRSGCGRRMARRSTGGRLVACSTRWCAACLPFGATRSRTSTRRSSTRSQSTPAX\n>ERR1712137_1537553\nPPARPAPVKRTFRPAAYSLADKPVEASFDTSEGIYQLQRTHRMPPYPIPLKEAFDTIHNHPTRCSLTPCPAPAFLSSRIHEARSEKRILLSEDTGMPTDDDGFLLVYNKKDSLFLDRYFHQPLQPYQVLELPPAPKEGAPFKALTVTQWPHQIRCKRFPSCHLVAHRVTASPPREALLIVFGFSTGELIVYEPWREANCPRVSEPLHLFRTAITCMIWVPLQEGRLLLVGLLDGTVALINLEHKQISTSTAPSAETMQEYLPQDRTGRFVMWKNPHSRTHNPVMKWKFSSHPIYDIKYAPDAVQVALACGDGYIRVLPLLESKSNDLHPLETDQPGAAGFHMEVGQVAVAFQSYFGSVCCLDWSFDGEYLLAGGEDDLVALWSMRKLAVVVRGKGHRSWVSSVAFDSWRCKDGTYRFGSVGQDGRLPLWEYSKETVHRPRSLSAMAIRRRNGRHHASDQGAREGTKPMEPKELARLGHGMIVPAAGSTEVPMLEPIVEHQAHLVPSHSICFTPQAIVTAGNEPCVRVWARPGHYVAPPPKKEPVVPEVEKIPLSVLDAATPLSKSEPADPSIKDTSGNSEITDSKEEQTTVEETETTSTASLSESEEDTHLVTMKDGTSTTSPRVNGKEYDSVHDEAGAPESREIQIPHSMANEKEEKAALPVAEESFLPEQPSDPLIVQX\n>SRR5437868_9687141\nRRADRPSVEKLIGHAPAAHAGNGGAALFDGPEIAVGGAAIQPAAVLRAPRIRIGLGRYGGDAAEDQYRSCRESNAHHDLLWMAAFNAARISRLNPHRCCLVVSPVSPRYGLYRVPPGIAAVSIRGAPPSLTANVLAERRFLSHQH\n>ERR687886_608271\nESVISDVDAIALFSLSEVTAVLFVTGEVSTTETDGFSIAGARSSELAEVTSVSVLAGSDVAAAVVTTAVSDFDTSEAIASELLFVTTAESGFFGGLVDAGWPELVDVGSVSVLAGSDVAAAVVTTAVSDFDTSEAIAAELLFVTTAESGFLGVSDTIATASPVTLAEDSVVTNGCSDDTGAVDPESSGAIGTFSVEVMETSGVLDX\n>SRR5262245_18501370\nCALHSRSASASSKAFNVSSTVPRTTRSRWLLIRSSSIVMTLFSRLGVSSDMAAPSCWPGCVWPPPVQPDSGPPALPNCAKDSVRHPIESNSGRRNAVLAAAEIYFGAYWENKFVKQSLQDIINAVGWASRRRDDIAHGIIWGNIVVDHVSYGAFLFPPEYNTGRTLAFMADTPDPLRFMRTKYRYTAANIAKWGSKFTKLRDAIIDYFKAIKREDGRFPVLEARLEPLMDRAEKKRX\n>SRR4051812_41527219\nVTGAIEPTLERAEVDRVRSRPARNQDAYDFYLRALPLRLQTTRVSSEEALALLRRALELDPGFAPAQAHMLTCIIERVAQGWSAPEEQEEGTQLARKAYTDHGDDPLVLTSVADALGFLAYDPEGSLEAASRAVTLNPNSSWAQSAAGWAN\n>SRR6478672_26151\nARRAAGGHPGPGRAPARGAAAPAGRPRGPRRSVGAQRRPGPDPGPAGPRPGRPHQPAHPVQAAAGRRPGSGTPPHRTRPARRRPADPGRRHPRPAGRRHPGSAAGRPRGGARPTARSARRGPHRARRHRHRTRPGGAPGGRPGRGARAGGRRGTSNRDVGRPHRRRAARPARGRRDRGVLLLQRGPAERRQVRPSRSDRGCGPGEHRGGGVRRDRRRRRIRSGRRAGPGRRPARPGRPGIAGRRRHRGRHGSGPRDPAARRDPPRRPGRGPLRRPGSGPTRRPGRHRAHRPGRRRARTVGRRWVVTGRGVAARPLLLGAARFVIALAVYAGAAALW
WSASGDPDRMPGWVAVLATGVVAVAFGMLRRPLDALADRLLLGGRNTGYATVRALLARMATTLPVDEVIPALAETAGRTVHADRAEVRVLLSDGADLSRVWAAPAVPPARTADTVTVGVRHHGTAVGEIEVEVTDQAQADHDRRLLRDLAGPAGVAVSTVRLTVELRRRAADLELLAGELAESNRRIGDARRSQLAAVHAEMTERVLPLVDRARAGLDSASGAGARGAPDITGTADAVAGALDALRTLARGVYPPRLTEAGLAVSIEGWQHRTGRVLRLRIVGDQAVLRRDEDLESLVYFGVVGMVDGLRAGGAEPPAVTLDVERAQVRLTVTGESDGPALDRAVDALRDRVEAFGGTLERTSTAAGDDARVRIVTRLPYGEGSDDMAARHRGAEA\n>ERR1719505_362534\nSTSSIILSQASFAASIGYIAHIVLTAFSMNSILALTVFTSNVMNRTTALQTVHPMGPPKFLRPSHGSRRPNPPNPGLSKSPKSSPRPPNRPRPRPPHNPRFGDNPFRPHWPRHRHGGRHGGRHGGRGLW\n>SRR6266536_3216943\nRPVGWCAATVLGPRGATRPARRGRSSPSTGGLPEHRVAGLVALPAGGGYAVRAGAAERVAHLRPARASVLTPTVRRVGLNNAVVYPPEGGCGGGDEQGDVVVQRGDAPPAAFQAGFDELVGVAPVHLRAGWAARGAAVAAGRVDDPVGHVRGGVGGDALAVAVVDVDRAFQADRVSAAGRGSHVVQPLVVVAGGGAGDDGRGFGHTTGPCRDGGGCGGLRPRPVPVIGGGRVEERRLAVGARTRGEGVLLPGYEGPRRDAHRSAPTGVPLWTLVFEVVEMVPRAARICSAVLVLMPSRTASX\n>SRR5713226_9196200\nKLYGWKLYGLEVIWMEAVWVGSYMDGSCMGWKLYGWKLYGLEVICMAVVWFGSHMDGSCMGWKLYEWKLYGLEVIWMEVVWVGSYMDGSCMGWKLYGWKLYGLEVIWMEVVWVGSYMYGSCMVWKSYGWKLYGLEVIX\n>SRR5829696_2428463\nSRPVRIADAIPSIGSPACSQASARRTFCTSLARNGAGPGRATRMPSSTSRPTSASVVPARSASPDAESPVMPPSSYERGNLRGECRSVPDRHLASVAPARPTTASRQALDCASWLFSPGLGRNAGLTCAYDPARTYEPDHLACRPYKHGSIGCLQDQPGVDLNAGGWVLTGRPVADEGQRPGWRQAPQPVSRAPATLASTGPVVVEERRVGLVGLEGPGPAPRVGADRLAVGEAELQPEVAEEMAVGPVWIVAGLLELVWVRSGGEGERQAGGVGAQVGDQDGMGVGAGRHELNRDDAGNHGLGWSRPGRDPVARGRLPGRHREEAHGGLGSGHRVWARAAAASTSPASSAACEGGICSAGQWQAKVSGPGGGRPHSHTWPPSGPLTLWYSRGGSGGWSPVGRGQRRGSLSARRPSAKRTSSRRSSPQRCSGWRGWLGRRRTARSKSNPVGYTSRPSTRTAW\n>ERR1719375_709491\nAFIALKEVLDGAASRLDRDGGAFAHEPRLGFLTSCPSNLGTALQASMLLRLPLLVQQEEAWPWRDWCREQRVQVQAAFSEEYKPVPDTFLLSNMDRIGTSDVHLVNLLVEAASLLVQMELCLETAGAGGTVDLRDLMVDIKVPGDGEAEEFPGFPAEECPDALPDLSGHCSFLADVLQKDPACYANLRNVRTPLGVSFGRCIKAALDNRGHPLVKFPGLVAGDEQCFEVFREVFDPVIKLCNVGFGEGAGGQGTGLLSTPIDPS\n>SRR3546814_8950902\nXMRISGWSSDVCSSDLVDIEQHALRALEQDALAPRPRIIQRQPDGPRELKHELGDLAQVRLQPCAIDGTLAEAGAEGIVMSAEPVDMRAELAQMGKIADPDRAAADLVFIGRTDAAPGGADLALFARLLPTRIEVAMEGEDERAIIGYLQGFRGDRKSTRLNSSHX\n>SRR5
205814_2128888\nNLGVTTAGQPIANEKVTIALAASTPADYSGVAVKSASVNSSFARTTVNGATINLKSAGVFDMIQKASLQVAIPDINKTMNVAQAFSPPSTQPAATQPSAPLQIGGGAVVNVDLQREGQTTHITIPELAASKVSLVRGKRRFAFDKAIAVKLAADLAAGEKIDKIDV\n>SRR5262245_33090118\nHWALGQNHVALFLQPVAKVGPEWRGLLLTQANAQRVSAVAVQVFRLDAFLGFLLQGVELTIPGQGSMAADRIAVLRLIERAPRMRVAGHLDNGAARGQVDAVVTTERVRLQIALEAGQKALRPIAGPSRRVVEHVVRMTAIAGIDPEPALAGRVTRFVLHRQ\n>ERR1700744_713940\nQPIVEKQGIKAACHFFILSMRKLLRPAFDFLLFSNVFMSLCAVAQGLLTFYLISSKPIYPVLGLLFTSTLGIYNFSILISKPKHPEKSPYRRISWFFSHYRLMVTFTIVSLLSFIPLFFFISTPSKILMIFLAVLSFGYGLPLFTIGEQKFGLRNIPGLKLIMITLVWTMSCVLLPILESQAAHLATISMRDTTILIAKRFLFICALAIPFDIRDLFEDKQLGLKTIPVAWGEKNAYLFCQVLLAGYVALLFLFRNNGFSTDFWALTLSVVLTGWLIFRSKWEKNEYYYFFYLDGVLILQYVFVLTFNYVSRYLX\n>D4D873_TRIVH\nMLRKGAINPDIDSLAPKNTSFFLFFLCTYSFFSPTSISSCINHPFSKVHLVQVLNYTAHQTFPSASRNTNRFTHLGAMAEMRYISPDGPPLGGMPPQDFAFLQAFHMPHFMAYPSIIQNPPPGPPPASTPAPAPAAGAPAATPAPQVSTFPLTIYVVQHGLTDQVILHQTFTTNVPPPAPAPMAPASSPPRAPNPNPTAAQAPSPASPPSAAPAQGRRLPSGAYPPDSERAMVLPTGQGYIFPKKHTTLHIIEAFTAPWDNPGSTFQWRSYRVPSSMSISELIDQLCPTKAPDGRDATSRGVIECLEIGDGTWLKGSEFWIGGRRGGDDNMKRRVSQSLTAVGWTEQRGTIAQPVWITLSIAV\n>SRR5690554_8049497\nYPLLILSFFFFLMIRRPPRSTLFPYTTLFRSGKNQGVGPQFDFNGVGPASTHTLGIPNFGAHGLAFVVTRTRKIGVPAVCSQCEGPVFIIAVTFLIQEQDRILPVAPGILNHAVDARKALAGNAVLMALLFAGSAHGGKEX\n>ERR1719239_204793\nGKVAVKVSLPTRNNSCKRSSVDQESTPASTFQGHSLKYKLCSLHGCHDVDVHTSPPTSHIAVDSSIIAEDVHLGVEMFLATIIKGNQIIFFGHIAPDKSNFVLPKLLPQLDQGFFAHLTVDVRQANLGSSGQESDCKSFAEPLSRTRDDX\n>SRR5271157_3087616\nXMKLLLKILFAGILIYMVGMTTWVSLHKSILLSPDEFSWAQHPWAVATLFDAYFGFVTFYAWVFYKETSWLARMGWFAAIMGLGNIAMSGYVLIQLFRLRPEQAGIGHPVAESRVTRGFFHRRVVRPIVDLLTQGITPEKIALSIAFGLVLGVFPALGWTTLLCLLVAVWLKLNVPAMQLVNYLAYPLQLALLVPFIRAGEVLFRAPKLVISLAQILAMVRADLWHAIAALWVATLHAIVAWTLIAPVAVYLIYKILLPILTRLAQVTGLAKQEGSAASVAEVCX\n>SRR3546814_2889336\nXMLRHGKYVLVPASAHIDDDDTVFRHRRRDLGKGSDGVTGLKRRDDTFGSAKKLERLERFGVGHGGIVDPPDFLEPCVLGADARIIETCADRIAFDDLPVRSEEHTSELQSLMRISYAVFCLQKKTNRQKSA\n>SRR5262245_5483048\nDTMKQLVNAFGDYARPPKLELRPLDLNRVLGEVLDLYEDEQRLDVTRALAPDLPPLRADPVRIRQLLHNLIRNTLEAMPEGTRPRLEVATRCG
SGNGVAMELEVGDNGPGLPPDFDASWFEPYTTTKPKGGGLGLAIVKKIAEEHGATVSARNRDQGGAEFLVRFPAX\n>SRR6266699_1496226\nAGIGPVPRAAEPSDPGSTPWGRLRGRLRDSLRPTVSLYVIRSCQGRSTMAGQFAGRAVTGGRGRGPRGRLTTLSSGVRHCPISGCGDQIDPSRLMCRRHWYMVPKETRDEVWATWRSGHGAYSRGHRNAVRRAVAAVLEAAGHADGHRTGHADGHADGRTTGNADGHASGHASGHASGMATVGDSAGX\n>SRR6218665_631217\nXMMLQTTYTVELHPETWYVLKVTATSSAGSTECILKFGTKSYFGATIEPLRLVHRFETPFYENIYIMVPLAVVTISCLIVIVAVALFCYRRRLRKRHKASSALRMHQEAKTALSLLRDIEKPVAAVGTEKSRDTQTYVAVPGLSTNVLKLVPQVSMDAKDNEDDEAIFRERTLSTGGLDIGLPNRVRVTAETGSQDESGTVCKDVLYGYPQKSSLF\n>SRR3972149_6447067\nRERAARALVHKGIALGHLGRPDHAIAVFDEVVGRFGEAAEPALREPVATAVFSKGVALGGRGWRPTTRSSGASARRPSRRYWNRWRWHWSTGPSRSASWSGRRMNSRP\n>SRR5678815_2305109\nXMCIRDRQPGGTWVDADRGIQVEFPTFVGSAPDAACRVNIQYAAAGAKPDPMFLTVGAGTVDLWMDNMQNGTGVYPSTQPLDGDGVPTGPGDPFAPGKVNLLNFRVRNLGAAPTPSLAVRLIAEQPPHVTCGVNPPRILDKIRLVDPIAPGGVALDGVNLEIPDNRLVRVRAEILSVPGETTTSNNKGERTFTTGANSAVLDQQYAGPVTINATFINGCPGDQLATAVPMTMPVKTGPPIPDPIFDRWRVTDPGLTLVGPGEQAQLAFTFLPPSPVTPGSGVTIPISFRAGGGLAAAGGMFGESRPQIDSMEVTIPVVEQAT\n>ERR1039458_8973043\nPPSLNRKKWGRAEPPREQKIIWQHGPPAVSPHQFSRSDTACSRKTCSADAGFPARRRPPATLPRCRNGFSPPGFSTAADNPAPSAKAAAASAHPPPPLDRIAEIVEVLDLVFGRHRLGLRLAETGTARVRQIAEREHVHRMAVRADLAVDLETALQLRLVVFSERAGERPFQPRWGHLLGQLRGPRGPDGGQRTGEDKGEDGALYVHDHPHALAPRTDSEIEFGSGFVFSKMPSSGRTIRKKAKX\n>SRR2546421_543181\nGCFRREAGAAGRDTHGMFRVHQFEKVEMFVWAPPEESWEEHERLLAIEEELVQELGLPYRVLNIAAGDLSASAAKRYDIEAWFPSQERYREITSCSNTTDYQARRLGTRFRRDGKAEAPHTLNGTGCERVPAQEVELSGVAGVFHVGVRSSFHQLVVESCDDVLPWLVEDDDAVVAVRAVFGENTHGVVDDLVSSSGVHPAVVAAEAVRRVGFLLELARQRVGFFLAGRALGVRSLLRTDRRLGAEDDPRGEQEVEDARREVEVGX\n>SRR5262249_31764099\nDDPHTLVIQGDTKTFNCNFSQDAIDRLIKDDPESAKAEIEGEFRTDLSAFLEDAVIDAAIVNDRPKEIEPRKGVYYTAFVDAAAGGCDAYCIAIGHSEGSGDSGVVEIDVLRGRRATDPYQITAEYVELCRKYGIKKVMGDKFGKSWVEMA\n>SRR5574337_5095\nNLKSGSVIPPAPFFFLKTVLAIWGRLCFHMNCEIFCSSSVKNATGNLIGIALNLQIAFGSIFAILSLPTQEHGISLHLSISSSIFFTSVLEFLSIVLSSPKVSLFLDIYFFVAMVNGIYSLIALFDFSLLVYRNVGDFCVLILYPATLLNSLISSSNFLILSLGFSMYSIISSANSESFTSFRIWIPFISFSSLIAVASTSRTMLNNSGX\n>SRR3989338_7824970\nRWNCDWSSDVCSSDLS
LFCLFCISEIHAVFLFNFLGSSRIFRVVFFACFTCDPCTFLFLVLRSLGGGGCIFFFFSFFLFLTLAPDALEGFLIDGEESFEGETDTSLVDIDINDLCVNTLADREDLCRVVDVVMCEFGEMNETVDIFLESYECAVVRETHNRPCYFLANWVAFRHFLPWVICQLFHTEGKLVTIDANHFHGHSVACFCMLGRILHVAPCDLX\n>SRR5688572_19622849\nTDDEMQNPGSWTQDGRLLFSQGIRGVDGDIRILTLDSPPRVDTLLGGPAIEVLPAMSPDGRLLAYMLVEPVGQIFVRPYPNINDARIPVSNGPGMGPEWSQDGRDLYFMVRQTELFAARLESTNPIAFGKPRLVRSLREPTGDPIRVTLPPVNGRLLRQVRPQVSLSNPTEYRVVLNWTEELKARVGTKX\n>SRR5687767_14888222\nVIDAHTGKQLQVVDRLELEHGEGAGARYRAGRLDLVDGTPEQRPGAVTVVEVYRRVAPGNVVRQPLRVDAGDGSDLLTQAKTEVAATLDHEHVGIGVDRALGEGHDILADGKAGGPTQIVRDSCLGACLNAEETGVQLGITAGGRIAAVRX\n>SRR5216684_2934442\nYASRKTLPSDAKPQQHHSQGLETWLREKSKRVYARASVLLRAPVSSPHKESLGRLPINRAGFLFTLFIASFNCLRTDLLIDLLISNALVVKPDGLLRDVQSWVKPFAVSIQVSDPLVSIFAKDANFLVERVVVQSQVLQKVPLESIRICDDSFPRVVPISFAEELAPVEHAHIKEITVYGIPEVSTVRVRFEQVSELHRPSSAVVGHVAPKRPAQSLNVSEDLASRX\n>SRR5215469_11197210\nSLQVQPVRSKRLWPAIASVLLVALVGVSAIHFREHPPDSPKPIRFQLAPANVIIGSSARPSFSPDGTKLAYYATGSDGVARLWIRSMDTLESRSLSATELNANVPIFWSYDSRFVLFPSAGRLKKIDISGGPAQPLCDVAAQVVGGSWNREGVIVFGTNNTAIQRVPSEGGNATPVTALDSTLGESAHLGPVFLPDGRHFLYLRRGRPESTGIYIGSLDLKPDQQSLKRLFASDYIPEFVPFQDGRSGEILFLREGTLLAQPFDLRRLELTGDAIPLAERVGSYLGDPLFSSSRTGALVYRSGGAGEFSTLTWFDRQGKMLSNLADAFYGPFTLAVSPDGSRAVAERLETTGVNLWLVDLARGGRTRFTYTRSGIDRYAAWSPDGAKIAFSSNRGGHEDLYLHAANGAGEDELLLKSDSDKSVTDWSRDGRFLLFNQLSGKAIRELWVLPMDAAGGQKPIPFLRSDFDSRSGRFSPNGRWVAYGSNESGGNYEIYVRPFPPSAGGGKWMVSQGNGAYPRWRRDGKELFYLRPDGELMVADVGADGAVFQAGVPRPLFKATYVQGWDMSADGTKFLFPMAGGETTQFPFTVVL\n>SRR5215471_2447632\nSWRRSSGSPSRRRASTWGSSPAWPCWRASGAGRGRCTGSGRNSSAAYSSRRRTGSCGPSRSDLPNGDQRMQLVPAVLIVEDPVARRLDAGADSWDHEVVVVALTGRHGVSLGDVPLADRLEHEVTVLLLDVLRVGARLSIAALSDVELEADVVVAIGLRPLVLDQPLQRGRLAAVQQPEPARMIDMSGRRRAVGGAERNGTGRRIELGRRT\n>SRR4029077_541644\nSPASLRPAKANSAHTGPAFSSPSVPIPSAASPNFHSSICTAQIARTPTPHVFPLAPAPDPKSSVSSFPNTARSHNRHTSTHQTPFPNNQSPAQCESARIAPSEIHPARLLQQAPEKPASRPAPDSLSPPFRSSGTSLSASQIAGRAASRPPN\n>SRR3989344_1047100\nAYFEIIEKRQAPSETSAKVRVPAVFLANSRSIPIKAPNRTANANWPNISKFSPPKNPILVHQKYLVAFSDALADFNPDFFAFWRHGNLLVIILHGFNHLIKIRRRPAET
KFRARFNRFFKFYDRDFNVSVEMSNYSDGLALSLPNGLFHLHRRLCFRHRFLGGFLRCFFNYFSHGHIFRNXX\n>SRR5215510_3565519\nWPRALLHRTCRRGRWRLQTGELGHGLQVQTMTVGCMRVVTFSQLPSSMPTALIQINDGVKPCSPLIKARPRPATGRPRPRSGAAVEGQADPASDISSMPRPVGLVASRHLGIAKSLRWFAELPIGDVLSRTGTRARHRHNRDRYSRRPX\n>SRR3974390_2059552\nARVIHTCLNKDAEERFQSAHDLKLQLEVLVSFAEQPAKAAPPVATKPWTARAQWVAIAVLVFVVGVTAFAWWQLRNELKPVVRSYLTAPDKSNFNTESVALSPDGRFLAFSAVSATGGKMLWVRPLSSLI\n>SRR6266566_5267620\nPLPRPPLPRRTGRSDGRAGGAACRGLPRDDGNRRRPVLRIRGGGEPARGARGELAGGGVGSGRRAGGAGAGSRGVRGGRAALAARRARSPARLRRRFRDRGDDGELPRARRRPPGRPAARARGAWVHVDGAFGLWAAAAPAREHLVAGIAAADSWALDAHKWLNVPYDSGVALCRDGAALRAAMATQAAYLLQ\n>SRR6476620_1160279\nLSNNKGTIITLAVAKKKEPTSPSSSSSHHKRTMTSNTNTANTIHPSPKPNHLHRGKNQDLHSAIPKTTTTTTSPSLSPSTLSLSPSSERPSDVPAPSPEEQQATVQKLYAASAVAASDPTNFNSPMDQQTQQQQQSCSYSDSIDKFILPFKEARFTHIRPCVTMTGTVISGLKVNADGDISFNIAVDPAYEGMLGPGNLDPSHATSSGEHGIHIEVICQEPVNSSAPMDVGACNGYNGPDFHSLLPTDHEHVMVTGRFQIEWNEAPGGLTEIHPVYDIKTIPKTX\n>SRR5580700_450720\nDMPIGDDVIVLVEHHPPCLRMMLEDDGPLLGRSLVARILAAQSQPLETTIHALAQPVQRIARHGIDGRHLVDVQLDEVFEEIHPIPTPAHDVVMAADPIRRQQPAYAVDDFADVAVVGDFKIFQLADGDEVVGQSVGRNYGAVDQDRQDLESVLLAQIQSGFELATDEIMAAVETVLGVPLRTDERDHHLARLQLAHDLGDDLVARLRDVDVEENLFLRKGRFQRLVEPTRNRPGIVAPIADEDTLRHGSPSAFLGLPGNDLALELRQQCRSDEAKEADHHDADEHGIDLEQLPGIPDHVADADLGGNEFGGDQHDEGHRDRDAQPSEDHRQRAEEHDTREHHPKARAIIARDIPVDFLDISRTRIGVDDHREEHADGDQRDLRGIAEAEGEQHERHQRHFRDREQHGNQRIEEDAHRTEHRHEEADRNRRHDADDEAGDDT\n>SRR5580658_247251\nRAKLLRALPAALFFRRRLTRRTQRAHNVLAGAVDRKKNPPGESLGLPCCRRLERTALPAEPRLHHAVAAHALIHAAGDRLHLGQLRHSKILTDYLRSAFICGRPIISGQRWCDQAPQQSCSPRSSQSSTRPEGLPHTRAYSGSFLKYRRPAWCPVCRRSTSPAPLSHKSAPCG\n>SRR4051812_49755575\nXMAIFVTRWIRRLSWSSWRVFRLSRQNSGVLWFGNSLLCLGEGRTSRVSFFERSSPHPRSDALLLLADGIRVDRCRGELGMAEPLLHHIEGDAPADSLHPEAMAQALGVGVGAVRDARRRDNLLHPPVGRHAAPRPQPHFCWAAPGCSAAGPCPPACARLPDAPGPCARSAX\n>ERR1719445_2651091\nNIYVVLLFFYVGVAFVAGEQYWWKFVHADCGYDDVSPQPACGRSHKGDVEALKACCLNTTGCGGFNTNGIIKKTDCLSNKKFESACDLYVLEDRPQPPPGTKFPPIWPLPKKYSNGTSYASVSTAFKFTSGKTTTTLTDAFTRYTNLIFLHDIKSSTVNAAVNATALSGLDVSCDSYDESHPQLETDESY\n>SRR5215
211_4540433\nAAGGLQRGGAGVGGEVMLGREPANVADLAQEPGRQHRPHPEQPQQAGVGPGDRGLDSRLDRGDLLLHLAGVGDEFCGQLPTGDRRRTGRGHFTEQGGGPLGGEVTPGAAGDQVHQQPMQPVDGLGPRGHRSWRRLVNKCRTTAWSSTPTWRGAGILNAATTTETASSGSLLRPCPTDSTRTRAASLAGTSRTCSPSPTSRWASARPMPWAPSTAQQALWPALGPSPQGLVALKGGSDALLAEQLAVFVKRGAGVGGLVRGRRRSSPACGRLLEGRREQPGGQADIGALAILCXX\n>SRR5215471_16031673\nANGSNVQNEQPGSRRHDNETGKHNSRRAPAFAVRTAFRLHGSGRKDRGLEREKIARPPTCTAPLAPYRSERGVRWINWQAYSLEQRAGWSRDRFASETSVRAARMAALFRKGSESRQPLEHHFVAADWRSPQDSMGVDTLHPX\n>SRR3984893_4885850\nCCRRAATGSSRCPRRRSCVPRLSTSTAPDRPRTALPVPGQVVDHLDDLAAAVPLLPGELQQVSDLGQDGTAFGGARHRDAASAAELQQPFLAQDVQRAQDRVLFHAEDGRQVLGQRQAFARAGLAVGDGAADLRGDLVVQRSRAGSVDVDINHGPSHSSPMLDEWHGPVSAVLAPPGPSAPSEAEALFAEARRRRRPRRLAVRVACLLLAGSAAAGLMTAWPSHGAGTQYGHPGRAAVPHTPDFTLPRVRVAWVDYGGQLHIGDLATGTSRSWRRSMPRQPTP\n>SRR6266568_5935642\nYSAIRLNSLKALAALAAQKADTNVSTAKATSNPPTTTTARPSGARGRRPKPTPTRIAHHSTIPTIARAVRPEPPFSYAMQKTRIATTPAIHHVSKATRGLRRGVGSTDRTAWVRGATDMGGARLAL\n>A0A061IJV5_CRIGR\nMLCFEGLVSLVSGASCFPFFRADYWKSQPKKFCDYCKCWIADNRPSVEFHERGKNHKENVARRISEIKQKSLDKAKEEEKASKEFAAMEAAALKAYQEDLKRLGLESDIPEPSISPVTSTVQPTSTSDQPKEKKKKKEKKKKDPSKGRWVEGVTADGHCYYYDLITGASQWEKPEGFQGNLKKTAAKAVWVEGLSEDGYTYYYNTETGESKWEKPDDFIPHTGDVPSSKDKEKSPESLEESKSSDSHSDSDGEQKKPGEASAETKKLVIKFKEKNKSTEKRTDPEIQKEKSTPKQNPSTTNEEKSKPLKKLTNPYGEWQEIKQEAESQEEVDLELPSTESEYLSAPEAAAGEIKVVFKEKTVSSLGVAADGVAPXFKKRKIENGRSRNLRQRAAEMSHHLCIHLFRNPSYTRRHVFLYCQRFRQISLDTRLWDFKQNKSHVLHQVLNKSWSRSYCHQDPKMLWKHKALQKYMEGLNEEYQTLDGCLQDISGNEDSRRALCRRHAKLAPLAAIYQEIQEAEQAIEELESMCKTLHKQDEKQLQELVSEERQIIDQKINTLYSELLEQLVPKEKYDKSDVILEVTSGRTTGGDICQQFTREIFDMYQNYSYYKHWKFELLNYTPADYGGLHHAAARISGDSVYKHLKYEGGIHRVQRIPDVGLSSRMQRIHTGTMSVIVLLQPDEVDVKVDPRDLRIDTFRSRGPGGQHVNTTDSAVRLVHIPTGLVVECQQERSQLKNKEIALRVLRARLYQQILEKDKCQQQSARKLQVGTRAQSERIRTYNFTQDRVTDHRIAFEVRDIKEFLRGEKCLDQLIQRLLQSADEEAIAEFLDESLKSVK\n>SRR4051794_32399155\nADVGRASAGSCMVRRSFRTLPGDGGGATTVLSLETQTLATSSWRAELPFALSRPRISPRVALALEAGAVLAILLLAAIVRADSYMVVPRLTDETLEVMLGLRLARQGGLPLVGYAPHIGSLFTYLTAGAFLLLGPKIEAGRLLVLTTGVLTVLPTYLLGRDLGQLLVARGEGRGARDNTRRAEAERLT
RGRIVGLIAALLLALSAPHVATSSRIAYSNSLTPLFIMTGLWLVSRAIGRRSDRALIGSGVAFGLALQSHVSAVTVLPGVAAAILLPLLASWKRGELARVTPGGQ\n>SRR3954453_11447405\nAENDRKNQDYDPENFRLLAGRRVERCWSDAGINECDDLDDEQRQADDQEDAVQRPEDEHRSSTVARWRRDVIECRKIFRRRFPGTGGDIRADLFWLRRSSDDRRNRRLSGEATDSDVEQAATTLGGVLLEFLTDVEDTFGERLGSGGKSSPLRRWLSAPVLAGQQSACEREIGQDAEPEALARRSHLRLDVAFEQAVVVLHADEPVETPDAHRPVRVRDLPALEVGAAEVANLATFHQLVX\n>ERR1719182_1343932\nLLKAKYVEVNALRVNGKSLADYIVMTAKKSNLCKCGGGGPTKKPTKKPKCPVAMIKCKCGHTYTMVKGCKMAKCKPCGDKTLSGGNNGGAKNLKACTGECDSEAQCAKGLKCFQRSKGEKIPGCKGNGGGKDWDYCYNPVHGGIKELGGPNDSKAKNLQRCVGECDADSQCAYGLKCFQRSKGEKIPGCKDGKKKMPGHYDYCYDPKTEVKKPDPCKKNNGGCDKARKCMNSNGKAKCGNCPKGYTNSGATKCQKNRPRGKEPERRQQRWCQEPEGVHWRMRCGFAMREGPEVLPALQGREDSRMQGQWRRQRLGLLLQSVARRRQDAERRKQRQCQEFATLHWRVRRRLAMRVRSEVLPAFQGRADSRLQGSWRRQRLGLLLRPQDRSEEARACNEVRSRQCIQLQSYQDQHPQVLRRELHPQVDWWX\n>SRR5574341_165588\nXMGGYLSSKLFRIIESGDRTMNPEQPQIFGLIGNPVTHSLSPLIFEYLFKKHRIKGSYHLFPLQPEQLKSALEGMKILGMSGLNVTAPYKEQVLPHLYNLDESATKIGAANVICNHKGKLKGYNTDVIGVRRTLKEIMYIQAKIGAVALIGAGGAARACLQVLKELKPEKIVLFNRTAEKAKQLAQQFNSSIPLQHRNLGELENCRSERDFNLVINATSGRNPAIKKAMLKGLSLGSHLFDLNYNRDYGINHRFHKRFCDGLYMLSCQAAESFRIWFGKRTEAEEIHRYLKKRLKX\n>ERR687887_1747641\nAGEAAQAQGDGAQRRVAGLDAAAGVEGAEAVDVDERQRRGPAVALGTAQLVGGGAAEGVVDEEARPGVAVAPFVELGLQRAQARLRVSQLAAQRLLLAGSEHGGSSAERRRSHSRWTRFGARSPELGTAHRRYPARPASAAARX\n>SRR5215218_6855622\nPSVRRAVMPYWSVLLGGFARIPSGENRHDDMPVRLSAFVSLLAGVWAVLAVLSVWGAGSAAAAAGTRLVISGAFHATSARTVARDEACAYRPNHTLIYQSDALRLGRSPKAVVRVQFFIRRYRGLARYPAAGSAPYRRTAVQVVTARNAATGVATAFYIATSGSVAISQAKGVARAGHRASLSGSVHAKLREQDGSRRLRLDGTWHCRIEPDANGGRPRTSRRVQERSPSMTDVGSSRHCSGEAAAGLEPTNRRPGRASAGRARGRARX\n>SRR6476619_648836\nLFFTTYIGWQPVLVTRDRHGELHCLLNTCRHSGTIVCPFQDGNAKLHVCRYHGWSYDAAGINRAITGEQDGQYPVAFKNANHNLINVARFGNYRGLLFASLCVDVPSLEEYLGDARIFLDIVLDQSENGFEFVPGPVIYTYDGNWKLQFENGLDFYHFNLLSPKSGAAADKIAALGPRLAHWNVIGASNVRNVASSRCYLRHHRNSMPFSVLARLSTYWCIAANDAMCRX\n>SRR3954447_23271464\nNWRRLWRRYRFVATLEGRLERLGLLCPPDMMQGWNKGPAIWFPPPGRARCTAETAAQCAGPNAHRQYGQRPVAPSNEIIMSARMPARGGLGVECQEAKRHGRSRKSGALEKVRGFRPRCAQGAFRR
PWARTAFGLX\n>SRR5437588_9293553\nASAAEMAAAAGLSLAGASALAAGADPATAKLATEPVGPSALMDGRTAVLGGDEVAQPPVSPPGPPAGGDQGAGRLRPVALLAVVLVALAAIGIALALRGNSGSTPTTTTTSVPATTAVTRPPTTRPPVTTTSAPTTTTTSPTTTSSSSTTTSSTTSTTSGVLGRVGGRDHKNADAANIGGGX\n>ERR1719421_986179\nGSSSEDFGDQSSIQRCATLDDAYAKLQRESAVAGQFEAFAAATLDNALAERAALYRLDGAESYVDACEREASGAIMGLLDSLPGDDAPGALRALVGRALPQALRERLWSRRLTDIKVQREFRESRGDWSVRSPHEADVTAFCVRVLSDTDGDKLCCARSAFSFLDQKARESGGPLPSDVYWLAKPLLEVLALDDAVLASAVRCVLERGLEPATKPEGTLAFGDESTDNQSVLEGGAGAAALALRLGVQRKNTQRWWVPRDWLRRCRTLLVELCPSLAKALKCEEDTDDSENVIARAIGRSMRRGLSDILSTEVLLFVWDQCVLTSFDLVIPYAAACVLALLDEPLQFFLRDNEDPQVHEALMRLGKDLPLIDVEACFRRVVPKIAPDARELTDAISARPPPGLLVEASLPGAAALGGLADVVVDSLADGAGFTMHGTLHCFLRNLDCRLEWCEVFPAKDSLPNVVDRLLALPANRKCILKARQQWGDQGGFDASLREACAVAACRALPGLAALYAGSYPATIQDALKDIMKECVRFSLPVRADDDDRDGDGVKDEVEYEPTTGALLGEHVPQVDVLLRKNSKPQDPGLGPGSALLQAAGIFAIRAAPGSLWPHYSPGLMHLVYLAYNMLREQHHLAGIEESKQKEIAAAEKAIDNCRRAEAKKKELAQKERDSMNAQEQAKLDEQYRKEAREQQRKRIEAADAADEKVKDAFLACVNAAKECGDTYKKCREAFEAKERWRKQLIFRWSRGSKRP\n>SRR6266571_3544720\nERFPERGPVPTVPDSLVKSSPSNPSGNSPHSHSSPKQHLLRILEALSLSTDKALLRNMSILENNLRGNRASVTQLVDMLTRLRRPCVNEECRGPFRRLGEEEVEVAVAAICGEHLRTIHHPLSTLETGGGLKIACVGARARLGQRKAGELLAAYHLRKILLLLTRITELANALATGTVNGERKSGAGASLPAHLHSCDVNRPGKLQSTKVFWKAHAGESLLEEFPNVLARKLCLQVGLASCRLDLLLEEIAQRLKEEQIIFRSXX\n>SRR5918994_7596206\nTQERPRRNRPGGDPAAGDARRGRGGDPGKGADDVPRVRAAQGPREPGGPQPGVGNDDGGPGPPAGVRGRGQVRAGRDEQCDPVAGGDPVVGEPDGQLVHAPDEQVPGDRADIRFDDGGGGVAGAGVERGPQRGVRALRVTARWTSGPFVRTYPTNGP\n>ERR1039457_7143814\nXMLSIIGSVLVLGSVLGSFLMEGGSLLLLWHPSEFIIILGAALGAFITSNPLKVVKGSFVAIFGLLKGPRYGRADYLDLLKLLYDILVKIRKFGMLAIEADIESPGKSKMFTEYPRILADHHMIEFITDCLRLIVGGNLDPQELESLLEYELETHHKEAAEPGHAVQKVADALPGFGIVAAVLGIVNTMAAIEGADTATIGKKVGAALVVTFLGILVAYGFVGPIASAIENRAHEEGKAFEVVKMALVASVRGYAPAVAVEFARKLLWSDVRPIIVKKVKKSAAGHHGGAWKVAYADFVTAMMAFFMVMWLIAAVTKEQRAAIFEYFKNPSMEQGKSVRASLGQMGPGGASTSVINMGGGLDARRSASALSTGIGTPHNAEPTADKEKAQDKERAASSEEQARKLTEAADHKKLESLMQELRKAIDMSQALRPFKDQLLLDITPEGLRIQIVDAQNRPMFDLGSAKLKDYTATILHELAPYLNTVPNHISLSGHTDTTPYLAQNGATNWDLSADRANA
ARRALESGGLATEKIARVVGLSSSVLFDQDNPRNPINRRISIIVMTKQAEESALAPDAAPQAKVSELPATLAPQAPAVPSVAHX\n>SRR6185436_12656879\nPHKNFLAPLARCFRHLDRGDKKMNSAKQRGISLTVLLALSVAVVALNAAPAAAQTSTYMKVDGITGSATDPRHIGWINIASLGQSASMPVQASSLGGTSAGHVVGACDVEVLKGLDAAGPLLWAALFAGKHI\n>A0A2D6A177_9PROT\nMGQIFLATANLLALLISISASAQSNQDQFYRYFTKRIELTANGQEMALEVHAPASELPAEAGLFAEVDGLLQPFGQSQRISMNRSKGAWVMTMAFRKVPNEGRVYLVTRSSTGTKTYRFTERPWESPREGELESTRPRAIAAKPLPEMKDSDVFRPVDSYYFPAMTARFGGVTLETETNVQRTVQAITTVCPQEPLNYDPLRHKRFVVEYFPAQDDADKVEAALQAPPLSTQSLRTTPQGCLALSIEVSHLWYQCQRYFLLPIRFTDPTTGISETLTLGVNPWDEGWVFARDARDLQPHQLEQVQCRPPQIHLNSYSLDGAGMNYSIDHNLSLVVEKNYYLKLSPRVQRADSITRGRFGGAALRDGFYLLNIGLFYRAEEGEITPKDYVSSWEQIVEVKSSEIVAPLKFDLKDMTLMGARNQILMQLQPIDESKVVLKPATASGNREIDQDATLRAENLVLENTGLHSPVYQGPIIPLSAGQGPILRPSHINLEQSIKLGQLQLAELAGDFQRRYRMTHFDRMFRLKSMLHSEPEARLWLQQTFGKYILAGPLFDFSVSPDINRSYLDKQRLQASLCDGWAGRFLRQQIQLDDQTTAAQRTMQIHYFEQFLRDFRQACIRETLDDRQTFSLSPSMMIRDIDPERTKYIGGTSFNYNINESFSLGRSENWGTSQSTSSSLSFSASLKAEIGVTSLGASRTETLSSSENYGRNLNESNSISYGRGTYLVVQHSQVEFVPTEYQACQVIRPKSEFIMDLLDKEVIERRTERPRSRMVHLWDRIVDFFKVDTDDVSVDTMTYRDVFGRDLSLDLMETGLRLCEDGTRTNDDSVIEDYYYVTQHFTAGDMQDTFDNRNRPWLMMIRSTRDFNVFLSNLQGQSRLEHRGVENIAPVEILADAYDDFAGTLPAWPGIYNPTERTRSDQTRCDNQVSAPDLLVSAIRQVIAGPFVQPDGNHIFSDRDFRRIWHCGEE\n>ERR1712176_1124453\nKMKANNNMAAATANSAHADVVNASNKTERDRLAEKMKANKNMAAATANSAHAEVAKDTRRHTKALRKRTFATSNYKRFYGGAKAPVFYHQLLNNVYTVLELYTARINPTLEKDMLTEGLNDFMSLLQNDAFKNNKTLQTVDAVAEYLWTSCKRHAIVQDMEL\n>ERR1719473_1570082\nRGGDLHKKCSSGKARGTKSAQSPEEGRPTKMITRTCRTERHLVFPNNAITMKKKHFSVIVPQEPSAQQDPRDIHLLSVTQTSRALDSDFGIRRLTAWQVPHSSRLAAFEQKKERRQLCNRAIMCCVTLYEFIPLTGLKRPEILFYLSRATDSQVPHASRLPLFWPTLSQADKX\n>ERR1719473_2414288\nAGYDFNSCVPVPQATTATAGTMSMAEGEPTTLPECTCEGENGEMFCPGDSYTAPDGCNSCTCTETGVGACTLMACPEEPTTLPECTCEGENGEMFCPGDSYTAPDGCN\n>ERR1719473_87410\nISKMMRAVVLMCGFLALASSTNLRGASEDQKKKKDGPWPKLPLEHLGLKDFLDWEEPEDPIPPERPARPEGGLAAVDWDYNDAERARMEIEHSRNNEWVNGHAPTGQIDPVEPPMTEPERTLLYQLFGKATNLLEFGTGGSTIAALNFENIKKVTSIDSAERWKKLIEHRDDAKAAIEAGKLNLIYSDIGKVGTWGHPKKPNTKPIYKKTASSPGFHEDGSENGPHRSSPFGGLKMI
DRIAMKRRAHEAVAQFAQYSGETPAAAGVADLILVDGRFRVASLLKALQRTPADKRSETVFAMHDYGYVSTKYNAVEQFVDKVQQADSLAVFKAKPNIDESALAQVIKTFEKNPKX\n>SRR5437660_4872881\nPLARCRRASRVTARAHPRADSASSTRLSKRGLHPGIGGNIAQAGLPELYADLRHAGIKQAVRVPIAHGVAARLTASQVSFFASDPRVDRIIYDAPVQLSDTPFDPGALASLYPQVVDAAASWSNRPSPLTGNGIGIAVIDSGIAAHPDLAGRVVVRKGFSPDVKEASDTYGHGPAVAGIIAGDGTASGGAYVGVAPRASLIHIRVNDGTGAAPTSAILNALLWATVNRKTYNIRVINLSLQASVQESYQTSPLDAAVEYAWLKGILVVVAAGNKGPNSELYAPANDPYIGVIRGRVQLAVRTLVAGGNDHQDALEPGILHRRVQRAGLIRLLDGCLQRQVDDADVVGLAVDGCPEQGVQDGGRGRRPGAVVNPDVDQAGPRRDADIRASTGRSVARDDAGHGGAMPIGVTRVVDIRVEVLAGDDPTGQVGVGRNSAIDHSDPDSIAGQRRRAIAPAGRRVHDLRIQARQRTWIEWSVGELHRGVINDPVDPGVAREEADLRRRKPGCNPVGDRNPDRLLDAGVSQVGIELGQACLGNQDHIDGGANARRAAGFTVEPFVSPRRGERWSRRQGSERQADPEAGRESCPEQGGHPVTGRX\n>SRR5674476_1677054\nGRPVAMDVSAQAVVVGATEVIDSSLPAAPVRVGASSRRAVSCSHPNPSTINRTIWFASRAGEGSQVGGCPASPLPPANPDNRAGTRVARQPPSSTGRSGTADPSEREDAAITSDGTP\n>SRR5258708_27400449\nSRRVCSALLTDGSAMFLLRHLACSVFFFFNDPAPAEISPLPLHDALPISRGRPRAALDDAPERRAVAHRRGGRRGPGDHPDGARDLKSTRLNSSHQIISYAVFSLKKKNGGLADQPPDFPPRAHLHRGAGQD\n>SRR5260221_9098150\nLVPDATPASPHRDAKVSAPRHPQPNNACRCPAPARARKDAPEAVATAPARSTRLGNTSFLPSRETSHQVAACARTLRSRAAQKACAETLRHLGTATRKGLRAAEVAWPQARIALCSCPTSRCRTPRQSPRSKKTKPHMAGQLRIVPMSRLPPRVRGDFGPAPLEQLPPIAPPCIV\n>A0A151A617_STASA\nMFDMLKTLKLYLAKDATINQYCKNRIRAYTIPETADRTDTNILIIPLIAPTPSTYASDKNLTTDYLFQIDVRSKSYEETKLVSEAIRLVMKGIGFGQQDGTDEYDSELKAYFETRRYRGNPYTIDELRHIDKDIEPTLNT\n>SRR5882724_11345676\nRQRLSRPARASMRPVACAITASGSRRWRSSIARTAKSPRTPRSTTCWPTSTSSTTGRSKGWPPRRVRSARTRRCAGTATWSTRRSSRWPTTRATIARRRSCVGSGRRRPPSSRKPRATTPAPRCASERRRCSKVQVGRGRHLGRRPARRQAFSTDRKVTSHTIGHAGNIWSVRLRSRSMRMLRGLPRGEPSRPATIETAVHPDGGLVSLLEEQVLELRGALEDAAEAICRTDASGRLISVNRAFTEMLGYAAPEILGRSWQTVIAAHDRALVSADLEAGIRAKIERQAVGLRRDGTSFAMHLVLVPLFSRRDHHDAVQGHYFYIRDLTERRRT\n>SRR5882762_10441494\nXMCSTEAIDGNVDDAAKEQRAALAFELKIQIGAPVLPLITDGKFVRQWSKLSEQDRKFSLLQEPAFVISWYRQHEALFEPIVCLGYDFSGELLGVMALARCREDGAITHAGDFHAEYSGWVALSTIDERFVEESLIAIKRTLGLKRWAWKWLAPGTPVGFLSSSRLAQNGIFATFRTERSPVWNLEDPERLNQLLKTKSIKNQINRFTKKGGFFLERVRDKERTRQL
LKHLRLQCDFRQEAIQGVRPFADNPCKEPFFVERQEYPESNHFTVLWSNDRPVSFHFGACNRDTLLLGLTAYDPTESRNSPGKVHLIELARMLREEGIRRIDLTPGGDQYKEFVANESQELVVPTFYFSRAAKLWADLVEAARRTTKAALTLARISPNALRALPTRLRRATLGRLLKRIRRIFYENVVYLQYTTECKPSEAARDPEIFVQRYEDLLLYDDDNPWLGRRQLLSAALKRFGSGETLYSASRGGKLLHYGWMTPGGQTHLLQGVNATFHSPSDSVVLYDFFTHPEYRGQSWYQRTLRQMLQDLSAAGVRRAFIGVLQGNESSQRAIENVGFSPYRSFGRRRILWFEKKDERAMKPQNMTX\n>ERR1711974_149456\nNAEYMGGTSLKCYSLVSGTSDDMGTETTCPSIANKFCQKTYDSNSGIVIKNCQLTGTNGCTSVGTLPLASRHRSVQWVGNYRDQTNDCHHYCPVDNLLRKNVLGWVEENPSNFSKSLSCHX\n>SRR5919202_1515199\nGQLDHLEDPDPDPRRRRAARTTGRAQLGRPADGLADGHQRPQPEAAGRGGVCRARAAGPRRLKRIATNTPSRGDTPMNTFQKYLLVTLAVGLPATALSLPLWPPQPGADPSPLQIALFFGIFAAEGLLFGFGVAFVLFGGPLVRAATGAAGVRSWPVFVSLAWTLLSWWPHDGFHRASPLGDLDATLRIDYAFHLTLIIAAVVMARFFLATLRAT\n>SRR5947207_7774739\nSGGPRAAGCEANRPTESGTTACPVASRPANGGSPLLLRSPVPARLQTRSRRPSVRFPATHATPGRDRQDRAPARTPPPPRPAGRETAWARTTESNGAPTPPALLHRVTPTVSRRRGTRAGARAWACGRHLQIDERLWIPX\n>SRR6516225_11363389\nNVCARRVSTGANSAEGTVDPLTTRNAATLQEAKEELLDLEIPEHRGRSLHHFGDVLARQRTRIPLAERNVRDNLGLAHLHGLGYGLLLGRVGLARKVIAQFLDLRVTGPAKHSLVAGRIHEASEDWIADVSRHPSGYEGMPAARIRRVLLRTTRNQGLPVHRLHVDLEAGFLQQRLGHWRKVGKRGQIRRLHENDRGAVVP\n>ERR550534_489957\nPHPPASSGAAPRAAGRAPRQMSAADLWAQLQGALELLSNVPLTHLTQQACVPYWVFGAVFLTHLTLLTITWIFWRRIRNVYSQLEQSSEDAATLSELFSSELGRLRVQLSQSQEDSESLDEMLGSILKGGLPGHLELTSKDYWCVKTMQVVYTDQDGKRQEWRQSGYRVNCFVPGGARDIEVTFGVVGGAECKQVDRSKPKFPYVYDESGRTKLERFSYERCPANVRYEIRGPSIAAFISHVTEVHGAAQPSGGDAAKETSPDAKRERSLSDHFSVAESRVCSX\n>SRR5262245_51303680\nSRDAVRALLPRNENVVRRQHSKVVEDVVDGKPCPGYELQVCIHSCAFDGVPTCVPTSHAALAVDEHKILALRCDEMGDPPDETVSHPKCVLELPGEQSLPPRVDFPPTHGELFGDVLFVGVPYYFSLLKARHECSVTRPPGRITWCGSNPASPIRS\n>SRR5690625_3526233\nRECFFFSSRRRHTRWPRDWSSDVCSSDLYDYDYQNVGGRWVHGFGVTSPADEPFSQPGDSGGGVYQGDTAVGVISGGGNLGGESFTWVADLDHSLEQSGTDFNLEKPGDEAPENPDAPKAKDQTIEPGEEVTGKAEAGAEVEVTWKPAEEGEEEGTDNHAGEEGSETVKADEDGNFSVEGPEAEGAYTYTATATVDGEESETTEFEVTVEKDESETPAPDEREISVDPKEIAASDFVKEDEGVTITVKGFDEGEKVTLEVASGPENVKGITLEETANENGAAAFAIYGTSASDPSAYLGKYDVEVTGANDTEDEDALTGSFEVVANEDGNGGGTGGEDLKSTRLNSSHVAISYAVF
CLI\n>ERR1051325_2865591\nWLEAAAGRHGGLGTKEFSRSGLLFGRDRGGSQPLHFVNATAGNRPLDLPSLPAFRFGGYSGASKVDGPSNAHDRRWLRLLLSIDSVFERQVFFRMGVGFGGGYTGRFTAELCAVAGGWQAGIGGRRHLSGALPGISHYRRVCGLAPRNGPALPGSRDLGCADQFAKSRPK\n>SRR4051794_2477398\nVSDRRWFGISVCARRSNAPRQECWRPPDQIAEAIYLMCNAMFGIMCIVTVSAATPTITILLFCAAGVSWWASEICLVFFLPATLQDLLGVLRHQRVGVPGQFRHSLHPHLLSDVETVPLEAPQNHLRVARIQQPRHCFLA\n>SRR2546422_7969508\nSATSRLLMFCFPSIHASPFYFFFFFLMIRRPPRSTLFPYTTLFRSKKQTRSVRPDSPLRPGGETHAYDEQPPVRCSSFSSRTQRDRKSTRLNSSHGYISYAVFCLKKKKKRNIKRVEAKVCARPPNAQ\n>ERR1719506_1077933\nEKADENIEEYFAHLENKSGTCRQVGTVRIGKIYNDVWSYNLACDRQYDTPCNSEGWRLLDRGSLYGGCIIVNQIEVCQFPQERYGHMATVHLNKLWVYGGFAMFCEDYCIDMWTFELPDYRGYEQNVYVPGIGVVPGQTPLPWGYDVDLYGIDPIDGHMKKLRDHQTIGHEQTKTGDFPRWNE\n>ERR1719159_229085\nPMQASMETLPCLISVCRRLAKSSALPSAVKPRGSQKPTGGCTPSSFSKALSGDASYNAQSPYAEPVSPSWKNIPMIAIIASLPFAISAASFFSFSAGSLDVSTLNPKSPFAAGVPGDWSCESSQKAPYAKICPQPATGTLEIAPKPFGMSANFKVPVAGWGQILAYGAFCELSQDQSPGTPAAKGDFGFKVLTSSDPAEKEKKLAAEIANGRLAMMAIIGMFFQDGLTGSAWGDWALYEASPLRAFEDELGVQAPVGFWDPLGYTAEGNAEDFARRRQTEIKHGRVSMLACMGYITPELTGKLPVYLSPSMGLKFADIPNGLGAISKVPLAGWGQILAYGAFCELSQDQSPGTPGAKGDFGFKVLTSSDPEEKTKKLAAEIANGRLAMMAIIGMFFQDGLTGSAWGDWSLYTASPLRAFENEL\n>ERR1700751_3884456\nLASSIYGGEQGLGDPSTVLVASQWAKWTKDYLPTDFGLLSGFPYPFPINGGLNSRTVLPPPAVQRLVEKKVYVRGYMIPLEMDAKGVSQFILVGDLNTCCYGLTGDPNTWVVVYMKKTTAFTRYDPLTVFGTLHATEIAHGNGYETIE\n>SRR3569833_572735\nLPIIPRRDAPAQIGRDTQSPALSVRLRHMGLDRVARGEIPKFDQGVLAGGEQESLGRNVKDHRLSRLFVFQALRPRLDEMEPGNLVFVSAKFELASLRHQVPYDDIRVLGTAREPHARAVKSQDGHGRAVAIEVDYSGCDLAIPEPDAAIFVSNSKHILVRLALRDSRNLGLALIVSTSTQYKTSSLAATSACPTPVPERSLDVHTMVEVLEVTRPNDLVYSYFLYD\n>ERR1719329_115142\nSGIPKGTEADTFERTVESIHTALNHGDTIHHTFSVDAVGNQHDLQTSSPGGQGGCCKLHLINSNGISKPGGGSRPGGTSNPGGKRNNASASTSESLSARVELSSCRDLLAEGQSSSSSSLSSAKYTAVSTACEQTX\n>SRR5690606_4275788\nYIGVIFNKEVAFELVEPAKPSSIHGRVLVLNQSYEPLTVCSVQRAFVLVYLQKAEIVSSLNGKRLHSVNASYAFPSIVRLSKYRRVPFKEIILSRKNIIRRDGNRCQYCGTTRPPITVDHIIPKSR\n>SRR3990172_6323865\nVVDMVDGAGVAEPCREGKETGVERPAACRDATMLPAMYFLATLFNGEIPPRAVPNRFQIFCAPAQDLSQKDGWQHDTHSVAKALGRGVW
VREVPVASDEDVYIARQQGQGNGHVLLAAHQVALLANEVGGRHRELFVVRAGQEGIEHVRLSGRLEMPPRLYDDLFRQDQVEIVRQRRPHDLVRPARQPDTGDEHVGVQSDTEPTLRHS\n>ERR1719186_79813\nLILLDSLLQEIFAKSLNRKLNVKRMGDDMEYLTLKVVGTDSNEFHFKLKWVTQLGKLKQSYSERMGVPVSSVRFLFDGQRIGDDDTPKSLKMENNDEIEVFYGKGGPIDRAKTALQDAVQKDNTNVIKFLLKFGANVNAKFDGETPLDLALAAGKIANCKILIEHGAEFGLGCWFGEDYEYLLRYQQSYKKAVKQVTNNEELISENRYTELTCEEIQWLKELKAKKVKEVDSQMISMDHKLDEVTTVNKNKIKVIQNQVDEVKENCDEKITALENEITIARKKLNDLEFEKNAETLNMKTRIKTLEQQEKEIRDSTDKIEFERLVTVATKSKLNKEFKMIDFELKRKGFSESTKRTVTGKTPSKTDGLEFVEHLKQQISSMEQELECPVCLEVSEVPIYTCPSQHHICAKCWSDVKSQDYESGRYPCRRPCPVCREYIQDPPSKHRSLEKMAQQLKQARAKLDKIL\n>ERR1719186_361628\nTEETLLARRHQSRGKMSKLTDPAALKSSPQVWTLYLVPQDLLTRSLACQVLGRSLPHKTAPAHCPLTLHLVTVQSSPSTSGGGEGDPRGREGRHAGGQTRTGTAGRTRTTTRPTTLPRSWRWTEPASSPRTVWQLX\n>SRR5215208_4256899\nLCHTVSLHPKTKSLLWQICVRCAIWFCVLSRSDMLVCRRQVSPSTAVSCNRSHELVTDASGLTFGTDVVKRHGSLAHDASCSPMIHRANSGHTASSLDLKAHRGCFAINNRLDPCLLALLLGEPKGADERHRRTAGGVGAADSTCPDPGDHGLPVGSLRVEMADPLLGLVAHPVTVVTHVFGQSPCPAPALGVAYALARLRVYRRLSGELRWDLDQGLGDEDGDGVEVGAVGFEAKALGFEGDRTSPAEGVX\n>UPI0003AA342E\nMFNSGAETVSGAYIELRVDGELVNSWNVTLAEGGLRELEYDYIWAEHNPTVMGYADPGKVIDELDESNNYKSIWVAIAAPRHDVQLGAISHSGGQWVELTVELQNLLGEVPHYRLSLFVDNATAPEYQDPNQVQELYYVEGFNLAYNESRVVSIWWYNTVGFGWHNLSVEVEVVDHSYPDLNLSDNRNSTSFYLKQIFYQLSLEIEPLPEKIRLNETVRVIVHAFNFGPEILSEGAEVVITGNGTQCEPGLQRTRELDRATGEDTLEFFCTPNSTGPYVIEARIDPDNIHDEPNEDDNFATGVVNVTNEEFTPVTPPVISDDSFITQPIVWVPLATLAIIGAGMFAYYRLRGDDDFLPGTRGRQSGGSAPEQASGSATFRYDAESGITYDANTGEVIGEKKKDX\n>ERR1712099_209071\nILLCAGEEHISSGNRSISMERKRKGGSGEHTHTTEEGNYYANTSAVFNFFLFLSFFTVGARKERESISLHYHVSFRLSLNLYLLRSSEIRYGHLLIFIYTYPPGQPEFERHSIKYHQKYKKNKKKKKKKKKKKKKKKKKKKSKTKKKKKKKKKKKKKKKKETH\n>SRR5437762_3435613\nGQRTGVRDVDEPGRWRSGEVWELGQRAGRRVELVDQRVQAGQRRGQLSTQISALRKLIVDRLDREQKLGLLSEAEVLAREGEAVPVAVRDAGVGVGRAAARLRRGKAAADGEVAARVAKTSIQGRLGDRRGAHGERGVGEGLEVLR\n>SRR5579883_1301911\nPDLPRYGEFHAAVGRAVMLAAAYAGGWIMSAAIAESYMEEGVVGLEPRIVRIESNVANLNEKVGRVETRVDTLDAKVDRLDESVRSIDRGVAVLEANTENIKENVATLQIDMREMDAKLDRRFDSIDRKFESLDRKFDSMDRKFDSIDGRFDSIHQELRGVT
RTLMGIVITFFTTLIGFGAAILGVLAKG\n>SRR5438034_829519\nRPDWQSGQPGRITNPSYTIGTSAPVLENTAVPKQGEIDYVSRLTPDELRFALDKPFSDAECGRYLMELGALMYLLPAPPARLLDLGCGTGWTSCFFARRGYDVVGQDIAPAMVSQAQLNKERYGVPNANFVDCDYEGLPFRDEFDCALFYDSLHHAVSEEQALRGVYRALKPGAVCVTSEPGVGHARRQSSLDAMRKFNVTERDMPPTRIIRVARRIGFRRFRLYPHMKPFGMLLYGKSESGILAKLRWLPYWVRSLALMFYASFYKRFNGLVVLEKX\n>ERR1719411_249020\nKSTVYIKPTISNSFEHEPNHHPHSPSASYSFSETNNSSTNPDFPLIEPQYGHFAHLKQRHNRPQSTPQKLVQFKAFKFDENAYDVTANSQSIHSPQFIQANTPNTITPIQTPSNQQQQQQTQNERFQQLIPNDSTTVMTPTPSPAPSINIPPVINLDLIDLGSVNKSTARDNGGHKF\n>SRR5262245_60002328\nTRLFQGFLSTLLERSDGWQAHGSAWEEALLSFGNRSQPSGRRRCHWRKEPSRYRPARSTQRLVFEDKKSCWEKPICSIQPALRLPPRGRLPRITSEPACIAQSPAAFAQRKPNCKRPASTQSPAPKPNVSSSALRMPLRGLRRLRH\n>SRR5438132_1115162\nSRNLYRAEASRGTGFPPYASDFAEAPSLARVYAQERGRVMGGELAELAARVRVGDRHGAVFRHRVEATAIRAARNAGDGPAGGDDRQIEDAERAPRVEVKHVDEGPAVGVVVEAEVPLPIAARDRRLVDAVHDAVDARLGVVAICLRGELHVDDQRLRELRGWDVVDPDAIGVGGVHADQRLRGLRSDPLDQIQGGSVVADRVIGEGTRDVDVGGDLEETRVHDGESASLAGRSDEHKPPAVRRESGGSRTVLVGERESAWKLNARDRPPGLRLDQLQCGRGCAVERVVPGSVWSRDGAAKGAQEITLRVADLDVTGGSDDELVAGRRRGRGLARPSARGEEQAGRGX\n>SRR3990172_10122028\nAPRPSRARGDPRSLAPGPRGGVARAGGCAPRAGDRGGARAGHPARPPDALGECHPPADAVVLLAADPRSAGGARDRRHPRAGAPAGLRPRAALLGPRRRPSPRPRRLAALAANPLARAPRRDGRGGCRDGADVADGRGLTPAPVTGCWWGVAE\n>SRR5262245_24698148\nADLVVPLLQPGIEHVARQPGHIRGLEHLDGHLDAAARSEEQQTQEELEESPEDYTAKPRGRVGLSVSERAAPQTAGSHQDDTGFGDSLEDVGSSAGWSESLDAVALDVPRRPQNECASLLEAILDRVNRCLDLRA\n>SRR5579863_8325721\nALPADSPRIARQRLEQLVHRGKPLFRTRAETAEQDLAQPPRYLRVLRHRLDPSADHGVADLEKAIALEGTFPVERLVQRHAKTELIRALVGLKTAVLLGRHVVRGAEDGASL\n>SRR5216684_4526886\nLSRGDIGDATGAAAAALRAAIGGARLRERRPEILGRRDGLIDVFLLRGVEAHQSFDRLDQSLGIANEIAIDLLRRHVLGNAGEEASEMQDLAVRPAHGGEAVALSQDFGELWIDIALVVALVRNYLLLNHPVCLGDQRGRALGGGVVERIDERSPPGPAAASRRSPPTWPGSKAPCRRRCFRSRSAVPVARSX\n>SRR5262245_20684417\nIALPEPLPGLIRRVRAPAPVLGALGLDEEGDDLGVTGLDSPLEPRGDLLDVARGQLVGKIHVEGGDDLTRPQVHAEHRGRGLDAGLLARDAGHGRHGLRRRALADEEGLALAGEEQRHPTQQEADRDGGEAVQNRQVQPGGGDGAGERDEQTEHRRGVLEEHDESRRILALSNGLVVPLCALGRAELSKGDPPGAALEEHRETDHRVVHHGTGHRARAEHV
HEALVERDAGSQGEDQQRDDEAREIELTAVAEWVSRIRRPGGAAKTVEEQRLVGRVDERVHPFADHDRAAREAARGELRGGHEQIAEQGRVDHLPRCAARHGARPARHRPRAYQRGASDRAAFRYTAGVTKLGVLALLALLAVSPLVALLPYDTGSIRLLGVSLGWWYAVAVAPVVAVLVAALSAPRRSPSPPAX\n>SRR6218665_887351\nRHNRHNRHNRHNRHNRHNRHNRHNRHNRHNRHNRHNRHNRHNRHNTNSSYRQNAHDPETSAWISRCNSVGPHIRLLDGSALNPDRTTWGPSLGGGPQSGLVNLHRCSAPASPGQSSTLAGQPTPIQDKVRNTYPAGRGCRWISGCQRHGQQHLPRRTIYPNTTHNPPSTPPLTPPNNLRRHETESTLQRAEDPRPLGVLGQSVGERGVGRRLSFWVVSHVIYREAFFWSTVTX\n>SRR6266516_6846987\nLAGWPPGRPGLAATATWASAAFEFGGQSRNSAGVAAAEQPGSWRDWLVVRPFQVDVRLSEPLGDLDGMRSLPVRRDQVQAWHQSLARVVHFEQRDSPALAGLDAVQTMSEQALTDAARVYAEASRQLGDGDARGKDGRVLGGGSRQRVVGSQIACGKVGEVHASLFEECDLGLRQLRSRVGGGALRQDVLNGLHDQLLKVGQGQVETRTPK\n>SRR5450432_930278\nVVRKSLVACLGALLVLQACGSSSNSGSAGSMAGSPATGGASGAAGASAAAAGGSSGSPAASGSGGLAASGSGGLAASGSGGSAGSGGSAGSGGSEPAPPWDSSLRARATAGMVPLATWYSADTGLWNKTDWWTSANQLETVIDYTREVGDPKYNDEIDNTFVKNSGNDFDQFGFYDDDGWWALAWIKAYDLSHQQKYLDMAKVIFQRMTGGWDDKCGGGIYWASAKAGSNGLMNKNAIPNSLFMQVAAKLHQRTPGDTGPGSFLDWAQREWTWFKGTGMLTAKHQVVDGLDGLTTCKAGGPIFTYNNGVLVGALVDLGVGTGDATLIDEASAIASATMTLMNDGKGTLKEAPCGGDICTQFKGVFMRNLAALYRARPAADLQAYAGHQSDQLWTANRNAQDQFGYEWYVPFDKADASRQSSALDALVAAVMTANLNLALVGSTATGSAPCSAAGAASNAIDGSSRWDSKWCAGGMGGQTLVVDLGATRKIVGFRVRHAGAGGESSGWNTRDFELETSADGQTWTRVVSVTGNTADVTTHGIPPVMARDVRFHVTAAQTATDNLAARIYELEIFGTGLX\n>SRR5512147_282644\nGGEISHMLRETVVSAVVSSGLRQATFAFCPYLLPDCGAVIVFGRHLRQQAIAKPKRRVGEAAQSESIDQFLIDRRPCDNNLRTARSQTFHQTTLSKVAFREFCIHLGQGLSRDKALASGAIHIFRKRRQRCRCSRCRDHPLRSALSHALFKLAYLFPDELPHPLEFLRFGRIALDEVLGETNRSKGK\n>SRR3972149_3229708\nPQNLDALYPPRRFAEPFTGTPCTPLKHGDGARRRMDRRGTNAAGDGNRRVHTPSVQIRVYGVGHVARRRKEASNVVAYTARSYYGHAPSHIDAPRQHVEIGDGGRMIDAGDVRGSREGPGGYHYGIVPVTQHLLGTHSRVETDIDTMQFELCSVITQHFAKLRLSRDAQRKIDLSADLAACFVKRDAMPPQSGIDCHRQSGRSRAHDSNATRDPPRSKRKSRFPAGAGIHEATGRFISENVVETGLIAGNAGIDLRCATRRAF\n>SRR3954451_16501819\nWCGAGRSADRRSPPATNPPGPGRRGTPVRRPRALARLESAGRSARLRRVGGVAVGGRVDRGCVGRLVRLSWRRRPGATFRREAGGRAPGRLGPAGQLGQPGLQHLGHGQPVAVRGLVVQQGLDAARVQGPYPLAQRGDRKVVVVRQGELVVAGHAGSLPRPATAEPFPRDSSGRCRGVTDRNRLVLAATASEAPRRC
RMTSPTGSPRWYWVTPSTAWSSSTASSSTAARLRSSPTATRVAPTVPX\n>SRR3989442_4700027\nSVCRRQGRGLTSHASKDTAANENPLVVEYCHLGGALDAGLVRGTPLLNLRNEKAAPDGQVQRRSQIFCNRISGNAEPGAQYPAVADKVIHNAPDRARGNGETYADVSPADGEYRSVDPDHFTGAVEQRSPRISGIDGRVRLNDVIDQFPALSLNRSPX\n>SRR5215472_13468930\nCEKGMQWTFFGQEKTLSLSGLFRNLIPENECRFLSDKRPAHAFYEFKTPATIAAVEESMNKLRRLPFLILLAPVRSSICLGAKALCRNELQNKRSLRPALIHGHNTTKNCVNPRSMVKARSDCAPVAAARSFDSEKNRGSK\n>ERR1719158_407498\nDDLSNHPLSSSRVSKYFIKFFSIKYKFYTSVCVCANYSTIRSNAPAVTCPNKTLNARTIATTSGDAVFIWIRTADIRTAEIRTSDIRTLEIRTAEITTAEIRTAEIRTAITPVSSEEYRPAVTRRGWIYGSTVATMPGRFTVX\n>SRR5262245_10967354\nDATTSSIGSLAGSNGAATVSGTGSKWTVAGGFTAGDSGNASLTIQNGGLLTATSSIVGNLLGSSGTATVSGTGALWSTSGALTVGNLGTGSLSIQNGGIVSAVSSTIGNAAVSNSTATVTGAGSQWSITGALVAGNQGVANLTIQNGGLVSTASSTMGSVAGSSGTATVTGVGSKWSTTGDFTVGDSGSATLSILNQWTFSVGNTLLIGNQGTVNLDGGTLRLGFAFGLIHLNYTSGTIQLAGNSTTGNTDVVGQIFGLSPVIPANKTLAVEGNLTVQNFSPLTIMNQGSVNVGGSLTLLGNSTVNLYGGTLRFSSYAKDPTATFNYLAGTIQLASDRSIGTDAAIQSLFGSSPTIPAGKGLTVEGTATLLTPVALNGGTLTVGDIINPGLLNFQSGMFRLTTANLQVSGGQFGSTLNVASGQNYLIDHTTNLSIDALLSISSGASFASAQTNNSGEIA\n>SRR6266481_4594428\nDFQHALGTAAIGGTVSRAAVDPARLRLWSVGAASRPAGSADDFQHALGTAAIGGTVSRAAVDPARLRLWSVGAASRPAGSADDFQHALGTAAIGGTVSRAAVDPARLRLWSVGAASRPAGSADDFQHALGTAAIGGTVSRAAVDPARLRLWSVGAASRTAGSADDFQHALGTASRAAAGTTGAVWQHSWRHRSAARRRHWWCLGAASAGATAGRPRRAVQPPAAVCSRATVDPARLRLRSVGAA\n>SRR6185312_13763440\nHFYEKKGLITSRRTSGNQRRYRRDTLRRVALVRIGQRVGIPLAEIAEVLATLPEGRTPNRRDWQELSARWQERLDDRIRDLQHLRDDFDDCIGAGCSPRPADRHPTARRSAQSAPVTAPPSGSADSARRTTPVTAGSVGSAEWVTRAPGHSACSWTWTVPANRAATSGGVTVSSSAVHTANQGSASPTRSRASSVISALPGASCRQAAGQASGATTDAVAARDVPARGAPRVTTRRALAAPSSRATH\n>SRR4029453_7084716\nXRESAPCPTGSRPRTTLEMLAPLVGVLEQRRVDRHGKWPCAHPSSFSLSLLASRSWGVVGAMAERRPASPAREPGRVAARPGTTATRTPADGGQPVSKATAARVRHPSWRDGRDQPPHPATSVQPPVSVPPASAGGTFLRVLNGWPRVDGVQGRGPAIAGTAGP\n>SRR6266850_5569252\nRRGQAAEKSGALQYCLCGQSHDGIPPAKHCEQCTSCVVLLTEPHSECAHDALDGEVAVNTQSVKESIMSITKVFRTNAIGVAWVILASGPMTWLANAAQAGESLPHKVVSFKDLNLSSTEGAGVAYRRIKSAADEVCGKRDRFELSQSHAIQTCINQAVSRAVAQVNSPMLTSLYNAKTGKADKQTTTLAQTHX\n>ERR1700690_11
51612\nHHLVIHKTEGELPAFLKDLVQKLIALLDGPLHALMLDREHDRGLDGHVQGASEPQPLRLELFAIQHGKNALSARGNGALDKYGSACALRQRDHSYPASGSNLGNSAVRAKNSGSPGNPAEWNGGRRSATAWPSPTAFPQASFAAKAPASRPKYGSSAGPHAGRGRTSGMPWAGPSPRSVRLRTWFPELFPPWSCPSSPPCASX\n>SRR2546430_15524557\nIYTLSPHDALPISVERLHGARHAVTVWKIEPPASKLPNRSGVPAEATGGSSIAPPAERSPGRYVKSPIPTPLATVEPFASFRGSARPVGRPPWLFAAARCPWVTFPVVFTRCLNGSGPDRSSAMX\n>SRR5687767_7487181\nEPGPDLALEQRLRTASPYIEWSLEQTWDYWQLDIQSSRPGSDPAQRTNYIAQLNTQLRSAQVIRAVHAQNQLQEVMTWFWMNHFNVNLPDDIVRFTIHDYERQLRRHALGKFKDLLSASAHHPAMMVYLDNNLSTVSRYDNRGRLLSGLNENYGRELMELHTL\n>SRR3546814_18830037\nFLFVYIMVLHYLCFFFLVVGRIPGSPRTDTLFPDTTLFRSWGLRRGYPRRPFQRLGRRSAPVRRRRANGDGSAVPTAMRPPDRNCLRCLAGGSGRSSHRASGRIAGLATPDRSRRRPEPSQATPKAAPRRTPPPCGGYRHRTRRDRKSTRLNSSHX\n>SRR6185312_7772205\nRRTSMPLSLPDYDTLWQQIVAFFRNRFTGKDDHAESFIGKLARSVGMAIYGLLQAVAAVDADSPPSESTSSQGLRDWAFVFGVPADTDGDYGPKGPSLATGGQGDCTGTLGTVFADGLLLTAPDGQTSIKLSGAVSIPGTPPGAGSVLGSFVAVTPGSSGNLAAGTVLAWESPPSGADSTVTLKAPLRGALDAESDPSLLGRTRQRMQTPPKGGTAADFRFWAESVPGVFRAYVYPLRGGMDSVHTVVTTAGSGLARVPSDAVRSAVDVEVAADRSVTVEGYKTLVPRMVAPGMALRLRVAPYPKFGFHWSSAGASYTVTAYAPPGSAVATLX\n>ERR550525_1171417\nEKSSLFVHQCSQCSQNGFCRKCWIQFVRLQKDDDDEKSHPVSQQKTGNSKQNAVDLTSVSDEEIDDGNDESSPTFPRRKRKRPMNGQDTQERNAKKAKRTVNVDCNTQSNGDGNNSGATPIMPLVHTERGIDKSNGLNETEHSNDRK\n>SRR5690242_17665658\nRLLRHARGNLAAGSPGAQARRPRPVALSGAMARMSFANVVVWIGALAACGDNLGPVEETVDAGVTLERAFRGEDLPGCTLASPVLVDVAGDLRIVAATSEGRIAAYGRDGSARWSFDLPRAEGERAEVASTPVVVGTRVVVVWQAFAADGARIS\n>ERR1700687_127959\nRIAPPDEEQAFRLQPCGAMQQRGFERLAGHFAAGDYVLGGFAHGGIGALDGRCRLIFFASVFFATVEHHYDEAIGFQLRRDGGREVCIHDGVSSVSTVEGGTRNSAADVCRAKSLSPGRRLDAGTTGSCRAALGLGGEGARPHTSRVQQRWIHSTLVFFPGRWPPALPCRRCDGARSRACPIAVCPSPARVRLX\n>SRR5256885_2151122\nNSILKKEQIGIHICDRTPMDPIAFNEDSEVSAKAKFITERLSPGKSRRKAQQGQVILLTGAPEELETRVVGRHKQSPAALIGDLQKRLQRIFAGAIRPSVVDTFGLSIPQVIKRVARIVLLEEYCPSDLATRLKELEKVGFFPPETPTX\n>SRR5205085_4486535\nCRTRTRSLAEGGRGWRCGYAVGLYLDRSCGRRSCRDVRCILASAEPGQAKTPSWTKRAASHAGKRHRGARSWLSLKNVGMCLTCPRVPVASGAVRSRSYDPANPRAGEEAPNRDGEARGRGAIADRRGRRVVRVPRGDPRAARRSVSGGRALGVGPPPAAH
ARDQGATREASPGGRLVAAWRADGLEPANGSFAERTRSRIRNSPFHRPPRYWNEIEQLARERPHAEAGAEGGRDLRQPLARVDLEAVRLLEPQDEPKLVQREHRQVDARQEHRGTDDPVLARERRDEPLADRAA\n>SRR6266545_2846328\nWRSRARAPACAGRRARRTRAAGRQRGAEADRKGGPGDSIDRPGSRAAHRRRSVLAARRRPPAPGRTDRRAPRPAGTGGRSRGHDPSRGPGPPHGWQGAGDRASRHRVARRGEGSPGRLRGGLRPAQRDPGAQVLVARRPDRARPRAPGPGRRRRQRRVRFDRPDRHAGGEPRRSPRGSARLRRAAGSRHRRAPPEEDPRPMRPWRRAGPVLALAAALLALARAAGWAGPPPGAAAADLLVEAGAALGAGEHERAAALAGRVAHDPRPIARQDRAEAWRILGLAEYALGRRDRAESSFYAYLKLDPDAHLDPALVAPEVLSVFEDVRARHAAELAALRPRPQRRRSFWLNFVPLAGQWQNGEHRKMWVMGSAGALLLGANITSYALLRSWCGNSGASATCDDPDGTNSRAESARTMQVVNIASGVGFIAL\n>SRR3990172_1023493\nDLDDLGRTSGRCEMSARGAAACAFLLASTVALAQSPRVLRLEGGAAQIRQKERTARAAGVFGGLWRVEGPRLASLASAAFTWAGDSATAAQGIVAAAWRPTVESAWHTEGGVTASAFGVYALGRGGNRSAYARERVVLDDGGFWAGGAAGHTTRDGRSWHSTVVDVGAFLRSGGLETSVAFARLRTNDWPLMQASGIFLETDAAAHDLDDVTLAMRYARGALALDASHTWRGGARKTLARQTAFLWSAAYELSPRYAVIVGGGRQLADAVRGVPDAMVASAVLRVVLFPWRADAAERATARSSARVEQTAEGAVLVVRVAVNDSARVEVAGSFSGWEPVPLQRTSEGWEARVPLGPGTHRVAVRLGGGPWRAPRNLGKVRDEYGGEAGIVVVPX\n>SRR5438132_1110025\nVRGHDVTRVSAGAVLGANIRALRAQQGLSLSELARQSGIAKGTLSQLENGQGNPTIETVFSLSNALNVPVSSLLAEVPEPSVMVVRSAGLDVLSGTAVDLRLLRRMDVTDTVLELYDQRVRPGQVQQSAGQPGVERGRAAGHRAGPRRARLRHHRGRRGQCAALGQGARAGARPGHGVAAALAGADRRARAGSGVGAQGRAGRVHCGPRAAARVRR\n>SRR5581483_1731585\nVRAPADGTVAVAIDHLDDNAVGESDFYNLAGNQVVIDTGSNRFVLLAHLQKGSVLVTTGEVVHAGQPVARCGNSGKTTGPHLFLQVQDQPRFGASGVKTFPIRFRDVTCLRSGHPRTDAPFFVRRNDRIVMDPPAPVKSDTIGQTWFPNGDTIELLSVERNDDQIVARGRYHLASHDHATLGLYITSTNISRVHEGREQTMVIGRGDGSFQLIHPHPVPGMPHVTMYADGKGIATVYFGTEDEAARSKKMHLQPLASTETWTPAFATGETPDMSKILEQAQKL\n>SRR6266496_2749558\nELGGLLGLRPSCPPPYRRGTDASPHRSRWRCPEAVDLWQVSGLPMPGPDGCPTDRERSGIGVANAGPLVDAKRDALDQAHRAPRPPGHPPLVVVSERLRMLLHSDEIPVIAQPLDDLPGGRDVAAVRRYVASQAERRDESMSASVGRVLTDLLAKDEARDLNVKVX\n>ERR1017187_5553991\nRRRNSGPARACPAMCCGARLGTGWRSVGRVEAVDVIQVLDALDEAGVRHWAGGGWGVAALAGRQTRPHRDLDLAVDARDLGSCLTALGRLGYAAETDWLPARIELRSPGDRWVDVHPVAFGEGGHGRQADLDGGSFDYPPDAFSHGLIAGRSVPCLSAGQQRRFRAGYEHRPQDVHDLAQLDALRESATHGPDSWPLTNLRSYPLRISECPVCTGSSGSGPGPATVQFVPARVPAAGVTR
RRWSIKGLRCGSRSEEHTS\n>A0A2G9SB67_LITCT\nSNKVPVVQPSHAVHPLTPLITYSDEHFAPGAHPSHIPSDVCSKQGMNCNSKYEKTLSCILLGEDALHYVDALQNTKHSVTKQEERKSEQKTRSALTDLLYFFILLRYSHHMVPGPPGPHTTGIPHPAIVNPQVKQEHHHNDNDLMHVKPHHEQRKEQEPKRPHIKKPLNAFMLYMKEMRANVVAECTLKESAAINQILGRRIFASQSGTIILHRNLAFYIAGSAPVHCDARREQSLAQRGFGQRTEPSDRGTLQDPGDKWHALSREEQAKYYELARKERQLHMQLYPGWSARDNYRHAASIPGKFEAHVDVESLFSQGKKKKRKREKLQESTSVASRSVQWNRSNRSDASRSDLEERFLYYFGGDLHRLLYRSRLASRHGSRVQVTSVRRPASRAASNVNRR\n>ERR1739844_819532\nMGEEYMEDHRGNIDLELLQEEITAQICLRILERSCNTNEAIDRMCLEDEDGDGELLPESGGKMMTKRRRKQRNAERDLTRIKVKLDRDIEELLGTNKHLINNVGLGVWDILSQMTIPTLSSQANVRALDLRGGAYDSS\n>SRR4029434_248713\nSRSCEERMMGWEGREEKVRGGEVWGGQGERGGERRRGVGVCSEGNLSGQRRCEKTGSQWCSVMFTPHIHTHTRTHAHRHTCTRTRIRNTHTHTCTLRSPLQSRQTVTRATNKSAANTEVELSVTYQHTPTHSTGQTICCHT\n>SRR5207248_268926\nISLDAGAHVEVAIVKQRPAAVRALQAAKINADLALKLGIDGLGEIVPHQHIFTRYRGIGFQLEYPMAVGLLPLEKGTGGALNVLFEGGNAAIVHRSRDHFVYEGRLSPRAVVPAERRSLRKQAWAREPGPIP\n>SRR2546428_1292487\nGRVHAGRFQLAANSLDSQRMTPKPRAFPLLLSLVLAMFAPQQTRAGEPHRLQVKPEQQILTAQEYFAAVLKLPDSHGTPLRNRVKPAGARDEFGELSDYEEVIVFKQLAAGYRAGIPVERVQRWISAYDAGRSHDNIFRRLASLATRPGLIDCLHNIEGRKDSLGRNVSPHMAFRYCAAGAQPDEITAQSLEGRALVILSYSDFNGALEVQQFARLLDNVRLSYRLSFALARTPADVHAAVAKHRNGPRIIAGHPVRGGIELMRESPDGILSSVAAQTLVEHLGGEALVVYSCRGGERFAPALAAGGARGRGRPRGRSAPHAGGHAERAPYTERRTPLPRRKG\n>SRR3954454_11295577\nLAMLTPVVFGFLSKQQESMDLNADGLANLLVGQKDNIKAAMPAGLEAALSSALPGGGQVLGGNGPTEPELAQVEGKSAASANRTADWHSRAVYSKPHRDAGKRLSVPVLLVLGALAVGILWARHQHNRQNDPPSVGAPAASPSETVTGSSSSVVPNMTRLINQASGTLAGIKDPASAEAATLRLRQINQQISGLRSSWSRLPESARSAASTALEPQIVKLKE\n>SRR5207245_10474605\nFFPAGCGPAPYADERMPGDSLHNAEQGRWAVYAAVLLEPRAKVRDPERVAVGQRDDRHENVGVWQVLLGRREMFRSRGSGNREAPAVGVQDAAEHRRAIGPWQTHPVNGPRVADQR\n>SRR6266480_972767\nDVVARQDHEELRPGGAQDVEILVNRIGRAAVPGRLVEPLLRRQQIEKFVHLGAQKRPAHLQMPQQAVRFVLGEDSDATDVRIEAIRQRKIYDAELAAEKHGGLGAAVRQLFEPTAAAARQHQRERTPRQPFLDPRRGQHGGVPPTTRLTQSGPRGEPIRKGKANEAKNWAYKMNRDRSAFLASSPTRSRTX\n>SRR4051812_21032643\nXMKKVMVTSCSHSHGWRSVRVTTSQMTVTVNPEMAMPHSTISASSSGSSARHFRWRWVCWTSEGMAPALLDVAHHVQDLDGVGTEVLGELVL
DGFAHGLEAGLVDRGDDLDADLLQARARVTLHLEGLGRLHLVHVVGGL\n>SRR5579875_2506212\nPNPLVPRGSRVSEPASTPVVVHSRRPSPLFPGRTRAATQTNWAPRAATSASWPSTKSRLAWSSPCLPDQRAENTPGMPCSASTHRPESSATAGSPVYDAIARALSSALSANVRPVSGTSGAPGNESRPATPSANPAADRIRESSAILLRFRVASTRRGPAGSAIEGFGLPPGQLRTPGCRQVEQRRQHRPAERLAFGRALDLHKVPGPGADHVHVGLRHRVLLIAQVAPGLAVHDPDAHRRHRSDQRGPLAPPAGLQPCDGIRQRHIPAGHRGGAGAAVGLQHVAVDDDRILAERLVVHAGTQRAADEAGYLLSPPAEPPLDRLPLAPRVRRAGQHRVLGGHPAEPAPPPPPRHLLGDTRRAQHPRGAELDEHRSLGVVKPPPGKAHRTQRVRRPSIWSCHIAFLIGLIGAGSFPRAGSVYPTGIAPGCGPGTGYGPGTGCGSGAQEPGREPGQAPGAETGARAPGAGPGPARRCCSFMPTAGGCLGCSRARFERIAX\n>ERR1719468_912648\nAFDEFLIVSVNFIEKFTVKLFFNRENVTEFRSMAAHIFAIFVFFRSSFSIFSLPDFSQQGGFEGWNSRDRLFWVGNALETANLGNICNHWRAEVPPVCRLGTSFLQNLICRAGEDPLGSGSFESIALIRSFIANAGEIAVDLLTNLFNGIFRGSASDSSESFAKRTKTVFTRNRLFGRDRFASSWIFLQKQIGCFAVLDNRANGEFIRESVNWSFWPNX\n>ERR1017187_631561\nLRPRPDRRQEAADQHGSGIEGASKPRRQHQTRRGQEVLPPRYALAWQKRLQGRSDELQLRALVRTQCGRDQPKARRGPGGAGQARWTGDKVAMTAASQGPDDVGPSVSSSSPGNGFTSTKIGARLGRYEIVGTLGHGAMATVFRARDTQLGRDVAIKVMSMVHAARGGAGERFRREAHAVAALKHPAIVEIYDFVSATENEPSYIVVELIPGPTLRTMLEERGGRFLPEIAALIALPLAEALAAAHDHGVIHRDVKTDNVMIQTSGQSSRVVLTDFGVAHITGMETMTATGALVGSPAYMSPEQSRGHEVTAAADLWTFGAMLYELVTGVVPFSGKDPFTMIAAIVRGTFRRPSQVVATVGPDFEAMIMRCLKASPAERYPSASALATDLREFTRTAGLVPEAKGLRGFLDEPDAMLADLRPRVADMAVERARQFARRGQLARALAEIGHATASVPSHTGADKLLRRLSASRIAIKIAVVAAGLLAALGIVLAAKPLLTPHVPAPVAPIASPVASPIASPAGTTPAPVRKVQAVAPPT\n>SRR5699024_12213394\nXHYSAASALSPLSLHDALPILPHFAGAFVLRAPNVYGDSLRFGRGGERTADFELYTAAGDRRVRSDERKLVYIQHGIRRGGNGGEDRKSTRLNSSHVSISYAVFX\n>SRR6266508_47967\nRGSDPGAFDIELGPVAEREVEHVPRTADVISAVEQRAQSVQGDPAADLQRRGTAGDPGTADEPASPFEARRPSYRTGLVAGHRRTPDDVLGTVAERLAQDVRARGVAAGQLGAEGAGVRRLGDRVLRTDVPAGDAQLGTLVGQVRPDRERQQVAAVGELDGTAVPVRPPRYVQRRTVQPHLTVVAAGQRTQEGQIALVQLGADPARGAIEVDRRGQPVLAGQLVGDIRGRRVVESTGTPGQPQVLQPVLGEDQHLRLLGGRVVGLDRADPSLEDPPAAVLRAERDGERGTEVEDVAAEVEIAGGVVAEPVVVQPRLAPAHPDRRLLHGQGKEVARRLGVGCAGDGEDGSGYERGHSHGVLNQRSGAVGVRRSRVAAGAVARGWVRYGRGPQEYRTPAVARAVPAPRSRX\n>SRR5215831_1420303\nRMRVSVRRVKARPGIRCCAGEESVRIGGPVAHGGRTGARPRLEQSLAN
SGGPIEIHTFREVGQFQVVIAVFYGDGIGIRPIGVAAVSHSIKSVAPNVDGFGRLMRPDNFPRRAVHDIWPALARDQVSLTSPHLVDARIARGIRVTVPRGRGPAKRGTAIAPAVWGGRLRISDVVGSHRIFMNELHKSRNGVAPPQTCARFQLHNESEIIVAGPGAVRKRVVVNLHGSAAAMDVRSQPVGLQPGVSSDVIVAEHKARSGNAIERPAVSRKSVVFGKHEVVSPKIRAVCPRRIAVAIGVALAVPTRRGKLYKEQISSLVEKIVVNYAVEPALSLESVRTVSSD\n>SRR5690606_9332282\nRQMADSSSSLVPATKQKSFNRWEERRVGKECKAMFTVYALYSEKYNKIYIVVTSNIQQRMLSHNHLGKKGWTVRFRPWVIVYTEEFQDKQLALKREKQLKTAKGREFIREIIAAGSYPPDGGQQFESGPRYX\n>SRR5688572_13872492\nPAGGRANGQVRLRDGVPPMVAAVLRTATARRPADRYPDGAAFGAALDRAVGRRPVSPAGARRVARFRRVAALVAVPSAVVWASAASTSAGGRARGVPGSVTDRSGQFTVALPDGWQAWRARLTDTPRLAERSPAAMLITPSLGGWQSDPAVPGAFVLFTRG\n>SRR5581483_4009571\nRVREEVARAYVRRELVVPELDGGDRRAPDRLASRELAASLREVDAEAGPLGDDHVDLAVAVHVAEELLPADLVVGGAPEERLAGYDLLRRDLEVGLAGRALGRVERVGPDAVVADEDDLLRLPGREDVAHVHDHGARVDLEAEVGLLPERARGALEEDPHLAAEEEDQVLQSVAVQVLEQDLX\n>SRR4051794_2395804\nRHGSDRELQERECRRVVPCSPHRDRPYLRLCRSSGRASRRSPEAEALLHRPSDRRLEDGRHIQSTCRTWRFARSQSCHRICLCLNNQSRGISLSFSSLSRVWRDAQFFSGAGMKKISRTSMGKRHALTPLRAHAITSSTSAHSSIHKPPTCSLVSRYGPSVTSNSPLGCGRSVFVGPRPPANFLTPAAIISRLSAWISSIIASSWVDGSKLSGRX\n>GraSoiStandDraft_16_1057320.scaffolds.fasta_scaffold8539811_1\nRQRHPRLRARQHLEPQRRGEVGLDGVQPEPIAQPHRRPVHKPLTGLRDLALERALGLAAGAQGQRRQEAAHLQAARAEHAQLGQAQVHRADVAQGDLHGERPLRHQPLAARRARQPPHELQVAPPQERRARRELQVAAKEQRRRAQARGGQRPAAAAHPDDQKDQAQREQVAAAHGQGRLFAAPGRQALASFIRLDRLARPRPLARADGDLGERLGDDAGGAHAFHLGLGDEQQAVGDDVRGERLDIVGQHEVAPLQQRPRPPRVQERQRGARRGPERDPPVPPGEVDELHHIVEDLLVDVHARRHAAQLEDRLRRQHRLQLRPRLRVGAQHLLLGPELGIRHVQLHEEAVKLRLGQRVGALVLDGVLGRQDHERLWQRPRLALERDLALLHRLEQRRLRLGRGAVDLVAEDDLGEDRPLAQDKVPRRLIEDVGAGDVRRQQVGRELDAAELAADHQRERLGQGGLGDPRHPFQEHVAAAEQADEQPLHQTRVTDKYLADLLDHRLAEVLGLHQALRVX\n>A0A0C3LW61_9HOMO\nMKYSIAYFDGYKRHVLPKGKSETMWLGRPGIPKGLQAGLFHLKEGQSGTWTCNAEDGFERDIDLVDHGKQFKIPAKTQLDFEVDLESVIVGAASN\n>A0A1I2KW36_9BACI\nMKRHLTGKRLKYKSMTFIDRFSAVQLDVLKEVGNIGAGHAATALSYLLERKIGMFVPSVQLADFDEVVELSGSAEEVVVSVFLKIEGDAPGGMFFILSPPQAESFVRIMTGDASFTIHNPKSMGIGVSALKELGNILAGSYLTALSDLTQLTLYPSVPSLNIDMAGAILSFGLLELSLVSDQGIVIETCLTDPSNETKESV
EGHFFLFPDPDSYDTLFKALGVSAYD\n>GraSoiStandDraft_57_1057295.scaffolds.fasta_scaffold1415339_1\nMKTYRRTELDRTGLTRIAGCGVGRAAAAMAVITACLAAVGCSTDVNARRTIGAERELPTLAGADATHGINAERATRLDRGDWEPVDFRLPVDGTVHNALLKSEPSFGDEQPRAHGLYPTAESALDLGSDRGAEAWRGVVEPVRSFVDLAIMPVRAFTDPAWGKRQSASNFKRWRSGAWYAGPVPEADSGADEDGG\n>SRR5690625_3860754\nEVFSHARGNAAFEAASFDGQYKGSLDLFTGSDTERADDALRRIISKVRVGEVDVPEMRIGHSILFRPEMVLPACVIASILDTHSFGGLRNFAIAGSAGGAIRRVVRQVKLHHAAPDGLDPLAAGGNLQALCYGSGTGGWRPASPRDLHQAKPAGAECLHHVVCTKLGNFNSSQACRAHDRGAFRHADLFSIDRELDELVRFCSGGAVVGFFHERHLFSPAPGX\n>SRR5689334_12383051\nELQRERHPRHRDVCRRGSRFPASRRQRCHNCVLDRFRQSPEDLESRPVLRGLHIYQLPDGSGLCRYRDLHQRVRRRRIELCIVQRLDPPLHVPHPGSLGNPGIRKPQLLGHPDVHLDRPVEIHSKNESPMHTLDHVQRRRKLTFLGALLAALLAAGTASAQVGLGLIPMREELALGPGAAHSGVLTLNNDSPARVRVVAELLDFFIDSTGTPQFGRQWTQEADYSCRSWLSVNPMEMELEGNSQISVRYTVRTPPAAPARGYHCAVGFSTQPTAGQARGTGLRTAVQIVAAIYVVVGKPAAQGSLKDLTLEYVADARQPGWRAVVVLANPGVMHYRPSGDLDVFDQSGKVVESVKFVPMPVLPGRDQRFLFPLKLASGPGKYTLRARVDLGDSEIQEATALVVAAKDSRX\n>ERR1719375_951704\nENAPDGGAHATWSGFSYWWDLLRPDVELHAELRVRVGVRDLPLRTRREGGLPLRPCQLRQDPPRRPPDRLRRLLHRPSCLLLLQSLFFGVTLRVLRGLQLARLFGCGPQVPLEGRRVHLPKQRRVPLVRGRWGRHNPRPFFPLREGDVERPTGPGRGGRPPEAALWSRPGGQPKEGARGHQPASQRQGLVEGEERRAFPDGAPEFGGWRAGCPLGPKVPEEVRERQNGCDLLLIPLPLGIPAELEE\n>SRR5690606_30224247\nKPLALQWCVDSWGALKERRDLITDAWHKCCVSLFNVMDPAKRIEAVAAVARQELEHTHVPAEIEEQHDSSESDSDDAGGTDGDTEDDDELDVSQPKEFGSRKSQRQRTQATAFGFQLDSSAIALTEDSEHXX\n>SRR3954447_19024062\nLGAVARQQALEPPRGVEPAEAAAGDDDAPSHASASPIEGRSKLFRKPAPHAPGAAREGVIRNCGEADLVAAEREQQVGDAIGRRQLLVGGRDAEAVDTTLPVEEQDPAGFADQPGPEPAPFQDDAGLALELTRVMTEQVAEKALRDGLRVLAARPFSAQDAGAAECVQLRNDPGMRDARDRHRCGEWLD\n>SRR5205085_4690665\nRRVGWRERHEEERGDCRPISQGHGHVHGRQGRADVRSERRRPEVQLQGSLTLRARRRSSRLPRASSMFLYGRFAWSSGDDVAADSTRWSAGAGWAALAVALCWCNCADAETEVYLVRGWFGVFSTGMDSIAQKLRAKGIRAEAIMHLSSKSTAAKIIGEREAGRTSRLVLVGHSQGX\n>SRR5712692_4144902\nRNRKEETGGVQLMDPYRLRPHLDIQRGHKERRTRKVQAWLQSLPSLQKPTDTEHIIRLDPIALFLIFFAVTSFVLVIVLTNTPINIAGPATDLGGIAVNYLLITAPIAGFAPLLVGSYFYDPRQLGPILRPVTFGKKVRRESFPDVAILGIVAALAVVTVIDYAGTYGGFTPT
LSFWNTTTNRIVYADGGIFEEF\n>SRR5262249_38079830\nFADGMFEGVVRAFVPEAQTWADVRENRSYADALAAGVASDEGLMLCAGLFADELAELVGVEATPDQRESAIAVLKGTFQLPLRIYNALMYRILKDGVNVRRPEIANTIWDMQLALTIPISSQMVRTPLWLISGDSAFADAGRAAGVPHVVHRLDDYIALX\n>SRR5581483_8213852\nITITYTAMNGHQYSVRKSAPLLITYGFHQQRPWPIIVVLVTRRVLQGMPHHSRQRSVTAFKHQRVAVPPGHGRPRRHLRGSRAHRAGAAAVLLMAAGCALIGCAGSVQGLGSSSHRVDLTGGGNPPRAGNSLPLPEATARRLPAGVFYLLAGPNPLSCNVWEVSRSGKETELTHNRPNFGISSFGASRAGIVMADASTGADELVRLTAHGIVPLPGQHLGSPAINRRGEIAAVRPPGGTGTKAYFYLVVKKSFSAQPHRTYRQHPALGGLAWGPHSS\n>SRR5579863_3949436\nSDLRDRRPGRGRLAGVDGIHCARADSRLDHLAFLLRRGAQSSTICVSGDAGGVLLLVALAAGRGPSRRGTCGRRRKRDDFHDAPAIGCAMSAHPFRLNSEKLSVALRVSLFVLIAWSGLILFPWLISGVTGDFTGSALSTFAAAAVANAILVRIYEHGQLSAVGLVWQETSTRELFTGMAAAAAGAVAIVAAALILQMAMFESAPRVENAWANLAFLGLVLLFGAAGEEMLFHGYAFQLLVRALGQFATILPVAVLFGLMHLNNRNVTALAVANTMAWGVLLGYAYVRTGALWLSIGLHFGWNAASPLLGVNLSGFTIGVAGYELHWRAGILWSGGGYGLEGSLFTTVIAIALFFVVYRVIPDRDRQVIPERGTX\n>SRR5438876_2751381\nYRREHHVEDPRRRGGRHLPRAEQHGRRSRVRPAAGTGCAAVRRCGAEGGGGEEAQPSEGVTRMLDIKLIREDPEPFRTALARRGLAERVDELLAADERRRQLTGRVEELRAEQNRASKAIGRASGDEKRTLIGEVAKVSAELKEFEPELAEAETALTL\n>SRR5215831_6834791\nRFQHGCLAVSIHLFASALNSSTFAGPSFHDGSNPPGCPTLGAAHDLARFGRKAQFPKSSNPTRRSPAVGAFQHPTLTGALLPRSGRPAMRLRALIGRQRRVKKLLLRLSNREIHGAITDLTIPQVLSHRLKKGTASIWLERRTTAHDGIELTVAQFDRRHVAEFRGGQRGYVVGRX\n>SRR4051794_29872810\nEQVLLQLKLMMETELGITGGISEREVEVLELRRQGKGPAASGYQRTAVQLSPGAPVYLRHVDAAYLADLLNTPGNLPFVMDATGLLVSFDLELGKLPATLAEWNAALKGSGLCLVRGRRELPVFVLRENGGRQLTGSHQSPANS\n>ERR1719217_1201603\nGRACRWRSWAAWRGVAWRGVAWPSLPLAFLGSVAYIGARVRSMTSSALWSAFTSSRWRSSIVMGESSPEALWLRNPFGSPDAHGTIRHEITLAIMKVVRLDEPVRAAQPMAIARGDVMQGLEQLAPGRTYLLREITLAKGR\n>SRR5579884_3263431\nXMSKGLILGHTDGKASKLRSFKALFDRSLDDKVACQRFLQAFQRKSAKHLLRLTPAIHTAVFAPSGAGKNVSVVEPFLFTSEESAFVTDIKGENAELTGRFREEVFGHKIMRLDPWHLTTDKPARWNVLDLIKTDDPEALDKARALAEAIVEKNPNDQQPHWPKKAQDFIAGAIAAVTHFCPPELRSLQQVAEILADKTLLAQVIEKMKQSTAHGGLLARKGYEMSASADKELDGILSTANQSLAFLSTPAVMESTKCTSDFDLSALYEGKGATIYTIIPLQYLKSHAALMRLWVTAFTKYVVSRGIKNARPVHVILDECAAVMAGHGDTLDEMLTVGRGFNMKVTAIFQSMAQLKKLFPP
GQEGVLLANASLLFFAVNEVEDAKYVASRLGEETIIVQDWGTSDSESEQPSGQGGRSKSYSRSRSLNFRQVGRQLLKPEEVIGLHPRVALTFTPGRPPIWTWLTRYYEKDFGAPTGLSPAKMIFDTACLFLSSAMLAALWTAGLFHHWFQX\n>A0A1Q9BUH2_SYMMI\nMCAEWEPRWTAQLQAPGQAWQSVLQRAGVQPTPPGDFANVSVEEMRTAISEGAGGAGFDGWTAKELRGXCTSCAWLVDDLVSLFNETLQHQSPEVLQACRDSVFAWRVVGIPKRTEAATRPIAVASSLVRAFNRAILKRCPEPPEGQQCGVSGQSAVTATLQWLAVRAQRGAELDLRRAFDTIDHRLAGCAASTYGVHPVVIRYLQQLVWCAPRSCVVGGEPPPRSIQATCGLPQGDPVSPLFLSFVLGPWFKIVCALPAISAFLYMDDRSLLDSGDRNSLEPALRLTEWHDHTLGLQEHLGKRQQWAIDGSYAARAVEHLGLTATPGVDVLPSTRAGPDDLKALASQLQYLPGAMEMKERLLAAFILPKISWAAPLIPAVEFSIVRSCFRAIRGHVTWWCQGRVWADCINLHPLFAACGCKCGQGLKSPQGYHLQAYGRRXTPKESTTSTSKLKVQLALAPVVIFKDIAYSSAAIPDFDLALPVPLLGSVGSCPGCCPRGSIGER\n>ERR1700730_765710\nHRLWCDSLHSAVAARGFNRDTTTPDKKTCSALSRSMSQRNGACGRAQLRRNCAYAGRLCRTRSGAWTDHGITDTGGPAIRAPSGMPGPVALSTQARARRSGSGCLEPGAGSALRERNLLFRHLLCNFPAQPARFRVPTQRRHVEPLVGRHEIDGNIASHRIHHAELIEGLGRRRRTPEGCAVDAVHLETSHVSVSQFPAARRCGLRGCTPSPPAETWRISGENLKGGLSKSMNRIX\n>SRR6476620_3825097\nTERCRSGSARSRGARREHRRRRGGPGCGRHFRRTRRYRAGLHEVDARALPRARGRDAAAPSARRRLDSPFRRRGGGAVSAYPHLFSPLRIGNITVRNRIMQTAHVKLFAYNAVDSQRNVAYQAARAKGGAGLLITGNRVVHPTSTTGFPRVAWAYLSEALDADQKLTDAVHEHGAA\n>SRR5438132_6851853\nAPPSRFFSIRSTMRIWSLLRRGCLETLDDALQQLNLLLLDVQQLDPFLYPQVVDAAVQLFDQHLGLQVGVQVELGLQTVFGRLAILAHHDDGRGVRGLEAQGQVEQDERVWVPRASKNFVDVQHDPGCKQKRLDDDEPPAAHGGRDTV\n>SRR4051794_37294934\nXMRSCRASSCCVIPRSSRNRRTSNASHSSSEALGSSSSARDIATPRGRVYPCLSDRGFASHGSDAGPCWVAIHPKKEDRRMDATRNVDYSVYLHAHHGATPCARDVLAGKLTEWHMPELIEDGSIIVAELVTNAARLGEVFRMTLRNPGDGMLRIEVEDRSRAIPVRKDPLADLGNDDYDANGGRGLVLVDALADDWGYELLPDGKVVWAVLSKX\n>RhiMetStandDraft_4_1073278.scaffolds.fasta_scaffold432969_1\nMYRSRFEVFFEDEFEHPFMIMIIMIMIIMIIIIMIIIIIIYRYNNIIHTMWIEDELQKDQTGIQESIQRLTRDYQSQLSRNIRSHLSENREKTTDFLKHFYHKLRNAEYILYHQHAGTGTGTGTGADCENDAYCRLTFNITEIKNSAHDLPHPRILSELQRKYEHNRGIAQPNDNGDNGDTYIPYKVYTYIREKSEFCIQFQATIYGRVITLYFITFPESHISVCNRSSSGSGGSRCAAETAVYQTYAYKAFIWLSIVTSMADKECSEKSLNVYFYMTPFKKQRPKQSASGETDTVLSAIHVNTGLTRNCETHGEIVVYRTEEWFKVFIHESMHNFNMDFIDLDLRAANEQLRRTFCIPHDDILLFETYTEAWARIINTIFNVYFVSAATS
ATSATSQAHFIRNVREKLTTNALFYAHQAVKVLNIMGLTYGNITIQSPENTEVSRKRYAENTNVYAYYILGGILSVYSLPFISWCCENNRSRVSAIRFSQHPSNLTKFVDFISSAARDPVMLSMVAFIEKAATTTATAATAATAVVTKTMRMTMDX\n>SRR5215217_9088951\nRRGSDRPVFPPPRRRRRNRRGRWRGCRAPCAAKGEGTRKPSTAPPEGWLKASGNHGRKERRSWAAGLFELGRREGPMGLHDVFRLGVQLLGKRDQQRLVGYDIVEDPGEETRGRGGRADGVGAQAGDRQEPTQALLVARKERKSAECDIFGLLAGNSFX\n>SRR5260221_1043445\nLHDSTTNRATRLAQTPDDLRGLIKSRLDQWDTLTPGLRREFLDNERTLRYFTHVDATNNPAERHHGPSDDEQARWNSLSENERQKITAQFNQFFELTPDEKQKTLKTLSDAERAQMEKTLQSFDKLPLPQRRECIHAFAKFADMSTQDRAEFLKNAERWSQMLPAERKIWRDLVTNIPQWPPLPTSLIMPPMPPMPIIPNNIRPLVATN\n>SRR5215204_1812972\nPFALRELVGDTVKSLALRAHAKGLELACRVAPDVPDWVVGDDDRLRQVLVNLLGNAIKFTDRGEVVLSVSRELGNSGDRELGNSGDRELGRSEDRARHQAAGKQPSSVCPEFPNSRT\n>A0A0B2WMB5_9HYPO\nMDQQLDFSTLNKSLVIKAATLFLMIVGLLACITRISMKWFTVRSLGLDDQLAVGATCLAVAQSIVVVEATSNGLGKHVGGLQAGQIDHVLKSEYAAHVIFIASLTLAKLSAITTLWALAPLYHRRTVVITSSLVVAWTLSSILPALLQCQMPRPWDYISGQCFQRAAFWMYVSVGNIVTDVAIVVIMTTIFVNLQLPLSKKLLVGGIFGSRILVTPAIIGHISTWHEAITNPGDATFRMVMPTILAELVQCLSILTACLPYLKPFLDSFQSGAMVVVDATSQNARSKGSKAGTATSAAYGGNSKNDTSTSNNNNNHINHNNMNNMNNINQHHHSQSHSQSRSHGHSYSNSSGHGRAASGVTTPRGHPDEFELADMPSSKTATTVTANQGMMDAAMEAWDGQSHTSQTVLVQQSWQVDIEHNLPARGNGRRV\n>SRR4029453_5233173\nDPRPSRTRDRSSLSRSSSHPTGLAGALRSDPWTGRPAMLAKLQLPVVAGRLPGRAGRAAIASTVSAMEPAAVVGQIGVTTIVATRDRTPPGGGSATGWPGPAARLERAAGDLAGGPRSVVAGDQAGLVPGSSVRTVLHGRATERSVIDRLLEGVRAGRGGALVIRGEVGIGKTTLLDYAAVAAGTAGTRNATVGGTAPPGRVAVRVLRGAGIQSEAEPPFAGLHP\n>SRR5690606_9372909\nYLTKSSFTMPHVAEGCIIEFSYKIISPFFFSIDDFSFQSGIPIKKLEAKFEAPSYFQFKPTYKGYLPVNPKHETKNSPQLGDVIKRTSYSLIDVPALKSEVYVDNINNYRSGISYELSAIDIPGGMYKSYTQSWDDITKNIYAYSSFGAELEKTGYFEEDLDILIKGVTDPSEKINLIFNHVKSTMNWNKYMGYGCNEGVRKAYKEKTGN\n>SRR6266436_1748777\nIEFLRRLTDVEVAAQHAQKLLDPKLLRRARTSENRALRTLVAMAKPIWQSLTGRKPSVNKVAGKRKSDFVTFVQELAKIAGGPEPTFKQVQNAFRARTLPILLTAKEVGARLKVSLSWLAKARMRSDGPPYIRIGRSIRYTEATTMTRPVAHRAAFEAQTPTEVRAKTRAGAPCIMRVVPGKRRCRFHGGLSTGPKTKAGRVVSPHAMLKLTSSPANTPHHCSPSFGKV\n>ERR1700722_19782650\nXMAHCEASAIAERFVRLRGSVVGENENCGSIKAHDCAPPFDVMAGLLPALHAGALAVNFLIHGLPAGMAGPPPAMTREGWA
TGLTELDTPAPRSRGEPLAEHRQAADRLRRGRLVLKNVPMLGEPAVFEAHDVGGDPRRGTTVAGKTAVGDHIIPSGEDDVIFIAQRIRQGANEIEQAIAARRNMGAVLDVSVRPEALCGGVVAFVEQRVEGFENKRLVLRSE\n>SRR6185295_4310521\nTAEEVREYVVRSSEVGKAVGARVVISSAAGMVAIKAAGRPLGARSIDLAAIEASALLGVTHQIVGRRHLLELLLGLLVAGVEVGVELLGQRAIGLLDVLLGGILGDTQNLIGIGAQGFLPSATRHLTTSAVAGHDGAWRRQRGRGAAADRGSCSRLPTPAGLCRTSPPDRRAPSPPRAAPGRKPHPRPRSFARRSARRRPPACARWLRPLRETPHHRFRARRRPRPSX\n>SRR2546428_4765453\nFNCTPVTLPDAARVCPAGREKLVSVLAIVARFDIHDRGRRFGAATLTRQQQGECTMTPRNFVVRSLLMAGLFASALPGWADCQSNFVNRITQLRPIKLGTSGSNLRDRVIFRNLECCGGTLGALLTDTNGNYYVLGNNHAMGRLNKGKKGESITQPGLIDADC\n>ERR1700722_5782801\nPTNFSCPQIEPDHDGTMLDFECEDTRYCRYREDCRRAELHDTVVTNYAHWVTMLRSPTGSRIGGFSTLILDEAHLVPDLVTDYLRVRLSRAYVQARLGLDMPEPDQSLRIWRSWATGARREAEQRAERAPERSKEGRRVSGLADTLARIADIQDGEEWLVDQTPRGAELTPVWCARYLERYLYAGIEQVVLSSATLLPAITRYMGVGAGQSVTHEIDSTFPIERRPFIYVWPQTRLQETRVQYNMSNTVRRAWAAKMDRFIGDRLDRKGLIHTRSYDRGGEIPGLSQWSSAMIVADRRNGRAATDLFKRAEAPSILLSPVVEEGVDFPDGAARWGFIAKLPSVDRRG\n>SRR3712207_4962885\nIVLIIKHVVLFFFFFQAEDGIRDIGVTGVQTCALPILRVSFNSIGADYLRTAGLPLLRGRGFTTAEATQAGGPAVALIDDALAKKLWPNGDAIGQQLQLAGERITNTSGDVTPGEAIEVVGIVPVVRSSILEKAPAGAIYLPFARGFQNNAFFYVRFKAGAQANSAATGELLRSTVRSVDPALPVLSLKTAAQHLDD\n>SRR3954447_3399888\nAQLTAWNLATVRRLNSWIIRATTSLPDPVGPRISTEISDFAAVRIHSKTISIFSSRPIISRNRCTDGDWSSVLTAARRSRNVSRSSTVASLAGRSARYRGGLLPATTAATPKSTSSLIQFSTSRRSRPNVCINDSTSKLSSGRALMYRSNPARSGDCTRLRNRVSRSAGSAVLVALAALARRALKIRSSMDRLSLSAGYRRADRGGPLAAIILGLVALDQRFHRHRVAFTVSVADDRRAATAGFDENVRQQHACINFDGGDMRHVDCFFLPPDPPWLVLHDAGRRNQDLRREKVIAGTEAAGAEHI\n>SRR5688572_24783379\nATVICGMNRPIVWRTPIASMRMSAAQTSTVRVDFISSCCRVARGLPNDHRASRACARLMAIQGMTNRNTRQVPGNALGPRVAQNAPIPKSRSTRSMNPRHLALATFLACAMPAAADCKWEWLCNGDGACKQMPVCGSVYDRPPPRPTESTPPATPPLAMRHNTFAGRGANRGPPLTCEHIMRKDHTGRWYWSEACFCTDAARAKDPTPPFANIVRCENGTKX\n>A0A1E5AL09_ALIFS\nMIVNSNNILSLTSTSRVMSINWALMNNCNYKCKYCHSDLNSGSIKSPEYNIVVVFVKKIIKQCQQLNLTPYFEFGGGEVTLLRYFSELIELIHKNDGLISIISNGSKSLDWWKANTPYLGGVSLSYHVNDIKDNNHFIDVAKILEQSKNTRLHINVMMDPERFSDCLFFAKQLKKEIRCSIALQPLYEGFGHGGITKKYTYTQEQEKEMQTFRGRADNKNLPEPRAYLDVIYLDG
SKKTLSTFDLLITDNVNFIGWDCYAGIESMVITFSGEIYRAWCMQDGPIGSIYDEIITLPTTPIRCRTKICQCGADISAKKVNTTLLKHYQNSIETKYIE\n>SRR5262245_57968688\nXMICLQILVPFRFSIVSARTHWASDAKQYNKSHARPPPAPGNCPRAAVDHWAMARQFRWCLRGASRMAVLILGNDRDEHAECMRAYLSTKGAVVEFLDSQRFPAELQIAHDPAAGSGTIRLPSGSTWEFAEIESVYWRSYGGATAAELPDAEQAFIAANDARSLLESLLLCLPARWVNGLAGYRWHQTKPAALARVAALGVAVPATVVTNDPQAVLAFADRHGRCIFKPVQGGAHTQRVTREHLTEQNLASLAVAPVTIQEEVPGVDVRVFVAGPRVLACEIRTEVLDFRKDPRADIVAIDLPGGVAETCR\n>SRR2546425_387409\nPKSGWTLAAAGLLLYASASHVQAAGAFVRAGASYTVDKWDAADFVGFDSAALPPNEIIAMTQNRDGYLWLGTLNGLVRFDGVHFKVFDEENISGLSGSPVIRLFEDSQGNLWVGTEIGAIALMKDGQITTPLETGLGGRERRLMSVCEDSSGAVWLYTANGDLWRCRNGECRAFPENPRAQSVYRGVIAEPSGTVWVGSDHRQFAIGPVPGSASFELPVARQLPVAKLDFLLASQHGGHWRLADGRIQKRRGDQIEDLGAYPWGLASVSAACEDRDGNLVVGTRGAGVFWFEQDGKVASLSTTNRLSHNYIL\n>ERR1700751_958828\nLDGETGLQPGVATHVQALGAELGHAPGDHILHLPGLDPGPLDHRAIGRAQQLVGMSVLVVALLQVPAPNRGARGLDDHYLTASCRHQLSLSGTGPAPEPALRVYKHQLTVTVPRRAGPAGPRSHPSRPAPRRGRDAEPPG\n>SRR6185437_9543277\nLWSMRGSLRFGLGCRSVRALTVDVPSPCFVRGFHASARSALPRCALPSPRVTRRRRMECGCFHCIQTFEATAVIDWIDDGETPLCPYCGMDSVMLEVTDLTTLWRMRARRFGMEGLAALGEGPFSVAGPLDD\n>SRR3954464_8629952\nPLEHAIARVHGRVISFDPATSTLTARVPASALRRLSGRRDVASVAAVPVRRRLALSDFVATTGAPNFWAAGYTGGQGTNDSVPATLWIDEDLDTAHPDFHGVNWENIPGAAPGPLCGSPSNDAGGSCEHGTQVASLAIGQGVDAAHCPSGITCTASDAQQKGVAYGIAHAISTQGGGAAAPPGGYWDIFGFALGIYQTGGSSCSSPLPGATWPAQVTNESYGSGAGTVTAANLRDDSIFSAYGVLPVPGAGNDGPTASSVASPCIGYDTLCVGSYETNASVSDPADDSISDWSSRGPGPA\n>SRR5450759_3105029\nSGWSEEGEMFVQSADSATRPQFSASYSHLITCSRSSPSPSHPLSSPSHLQSPSRLKSPTLLALPLNHMVKATIFIHMKTTLNIDDALLADARRLSRIEEKTALVHAGLEALIARESALRLAALGVTERRRRPVRRRRPARTATRX\n>SRR5580765_3100358\nLPAPGDAPRALSTKNTEHQEHWAPRARRAATARIATKLTSHPIVTRIPMLAEFSAVLETVANSGPGIGAGLAAGLGAVGAGLGIGQIGSAAGEGIARQPEAADVIKGNALVLSALVEGVALFAAVIGLLLVGKGX\n>SRR5690242_3907823\nRAHPDRPPRRPRLPPFAVARERRRALDRGDAPRAGAARRGRARDVPVAEARRARAPARLLARGARAARRGRRLGAPSGGIRRGRSPSPRPPSGDSPMSKPEVLRQHAEELFSEELAELSRADDKQKPPNWKLSPWAVRTYLCGGKLPNGFEVSVKYI\n>SRR4051812_6319949\nPRPAEVMRDDRRHAADGAIGAERAATIEVSRREMIRVGAAARNHPGFESRARRRVMLPVGEY
VDGRLGFGLPAHRAAQGDGLLAIERRAIGDVVDHAVVLVPREGEPAEQDVGGEGQVDVSGRAALVVIAEAGGERAGGLVLRLVLDEGNRADFRAAAKKRALGSFQHFHALEIEELDNTAPRTADRYA\n>SRR5580658_5004565\nYLKARQRTRTKRGHERNVGGIAPARHQNTADARLVMAGIECVPAFSQIGLKPGAKIHWGRIRWYADVTEIARAVAHRDVHAAAQGDGEMSKVPTYPALFGMDIPCCFGRTRVFITKFNAIVDVVADRLNKAPSSGNICELRPCDLDEAIRLAISAAEEEDERVDGEVLQCMLLRPQVHRVRFALVLHKEVRRHCELACGSMNDMAEIAENVVIGIGKNRRIELQAIPGQQVGCPGWMNTQLQDHVRGLRAIIRDLVARMNLHRYPLRTSQPRACRSLAKIIAPQKFHCDAARNKQHKSSALGSIRSLCRX\n>SRR5919197_97304\nQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSTERSAGGATQAAPAQSPKRSRERSAGGGTPAAPAQSPKRSRERSAGGATQGAPAQSPKRSTERSAGGATQAAPAQSPKRS\n>SRR5215470_420408\nEIQPGKFETLSNASKRALVAAMNKSRSSRGNARNGAELGSINLRSTAVKVDLAEPCSPARHKTGYGPLAQRRKDKGHAENEIPVLIFGSIFILWHAHVQELAKLIDRSTTGRLRQWQHSAGAAKRDGCLINDAPAVGIDFNRAPTRISEVEIQAAIECADPNVHRALPTVEMCTRLDDVERRLDRVGVRSARR\n>ERR1719223_2153901\nQAQTVSAPANFASKTVWGQNVINIRPFSIESHKTFEFVGSYKNNGQIPIFPSPEIAFLGRSNVGKSSLLNQLTALNKNIAVVGKTPGRTQSINLFKCSERQ\n>SRR2546430_7123832\nTRRRTQTRWAAPPRSTGAAPLSAPAHPPTRNLRCSPRTGEMGVAAQPCVRSPIGLQPQRCINVGKRLPAPRTNDGRRLGPRGPATSRHHLARETPSAPPDRERVRRRARARAKQRGSASGRARAPGREPRVRPGHRCRSNPPSPHPRSEEHTSELQSQSNLVCRLLLEKKTGAHAHDMRLTGTGSATIFRDGLRQEATWSRANNTDPFIFKNASGERILLDQGQTSVHVIPNDWETPSQX\n>SRR5207245_1019995\nXMYPARGPAAERKRSNWLSASSGSGLFHSVSSSAGYSRSIASRRAPAYGTSGRPSRISLRFWRARSGSAKPVARSASRLGSRSRRRGGAARSLKKSVNARWTAVVTARCRARKTPAAGAQLDVAARRPAAPAQRAVDLALHRADRGQDALVHAGPVDDGARPVHEARADARIAGGHPGLEQRLALPQLGALVVIRAEGVERQRHRAHAALRAQAQVHAEDVALLGDRLDDRDDVAADAREVLAVGQPPLGPAGGVAVGAVGEHQVECGRVIQLLAAQLAHADHRQARLVAVDVPRRADAGAEVGGGHAPGLAEADVGQPRQLLRRDAEVX\n>A0A1H8BLI9_9MICO\nMTDHISRSYRRPLTLTPTHHNGASQRGPAAHRLEPPRPDLNRPDLPGAVRLERKRARFTATTRTPALVAAATLAVLIPLAGLAAPAQAAIAGIARAATAGAGTTGVPAGTTLKVHNGDLNITRAGTVISGLDIRGLVKINAINVTIKNSIIRGRSVSAPAALINNLGGRSDLKVIDSELYPSKPSPDINGINGYNFTLTRVDIHGVIDAAHITGSNV
TIANSWLHGNLHYVSDPNQGGKPSHDDSIQIQKGSNIKVYGSTLSGSHNAGVQITQDTGDVSNFSFTNNFADGGACTINVAQKSYGPIHGTVIQDNKFGRNTRLLNCAVISPTTTKISTARNYYTPDSKTVAVRTG\n>SRR5262245_45043355\nTGSMLLIGVFGGPGFAQQPATNDTLKQNKNEAVPPAPSATAPGKTVFEKVEPAKPPEKSQEAKPPVVKPDGTPAKVDEVPKPVVVKETQPAGAPVPPPDGKPELSAPVPPATVIPPVRYFVMIFGSESVPKRARFSHTWYTIVKATPKQNLPPGYDPDGNLVKYYDLTAHTISWLPSSLHIRVLKLRPDCGHNFSLH\n>SRR5512132_3388807\nTDLEILAAARAHFPTEERLAIIQASAQRALLRHAEAEAGLRAHLAANPGAHGCLMTLGQALLDQKRSAAARELAESTLRAEPRGEVAVGAHFLLATAYQQEGEREKARPHLEAMLALEPGNTRIELLLASLDREAGRLEESLARLDRLVEREPRPGNHDWDRMVTATLLGRWDAVRASAARIGMNLKGAGPIEEAWGLCRIELREPDGEIGIHHALRTGPVTARILDVARPRAPQHYGDEIVFEAAPRNAGPRPGEADHSYLYPALATRKPGGYEAFLLDGVHPGAEALDTLRRELAALGCVLAVQSDTTYVVTEAATGEARPGLFAYLAAPAGCSRRELHDLLVQHGGSPARPLVWPGLAQALEQASELEDELARQAAIIERLGLX\n>SRR5215472_956881\nRSWSPPGGCTRCRPLGVVIRPVDLAEDLIRRATAWHAGSRGAGRSGGAGRARIALWSSRARGTSWTCRPSRAGCALLGQILPRRARWRRGHVARQGDPARAVVEDRVVLQVRGRRGLPVAAPVDARQARRSSRARGALWTLRARGASRARRPGRAGGTRRASLRQHAPVGRVLGWWHVVGGVVERDVARALITDAVVFGVGRGRRPRAAPLHRDAPAAGHRWTVGALAIVVVAADRVEQAVGHPPRLRQPPLQVRLDIVAPRVLQKADHVRLERHTADX\n>SRR5258707_121040\nGRDEMCEASASNRKRTREGCSPIRFSSIVITAVRPGGELSLMPLSVALAILMCPAMRLRDLRMHRYHWAMLEARRRIHERRIRMNPPRVRLRVPVAVATIVAVVRRAVAIGRVILIMLIALILLIAALDFAAAIIRFAIAVVPIPATIINIAIAIISIVIAISGRPVLMRPVALFAEHQPIWMGLELX\n>ERR1039457_2916573\nFFFNDTATTEIYTLSLHDALPIWDAEARRDLQAGRLAGQAQAQVVGGLEGLLIEPHGAVHHAFGGSAVDLERHQVRGNQGEGAGGTEVFDDRHTQRAALLRVGGGAQFVQKHQRCGRHIERHLADIRNVGREGTEILLDGLIVADIGQDLLEEGEFGFGGGHRQRGLRHQAEEADGLESHGLAARIGAADEQRAALLREFERDRDGGFAAAAQDVFEQRMARVAQHQALPKTRDHAIELGAEAGLGEDQLQLGHGDEGLADGIAVAAQTVGDFEQDAADLALLLFGEADQLIIQVDGFERLDEQGVAAGAGAMDDAIELAALAGDHRHHETLVADGDELLLEDAILAVGAQEALERFLDRLFLTFHIAAPAGARAI\n>SRR5918993_1097003\nGCAPDITPGGRAMRNRTMALVGPFAAATVLLLAPTAAADPPPPEFGRSNMGLCSSFLGPREAARQRSSRARVPPTALDAVAAAHPVPSYRPGGPLMNRLLGMLATCAVLLGLSAFLAPAAGGQEPVPTFTYTTPEGGATPAQACANSDDAVIGQFRLDGEVVEEFPLSGPGDLTRGGCVTTITMQELSTPAYVANCKILEPEFAAANESGRPYPYAFYGNPDYTANNRADCVSFLRGFHTGTLIPGPX\n>ERR1700722_7859116\nXMKYRVYKPFLLAVVLLCVVAPHARAQAF
QNLNFEAANIPPGTQPASMISASAAIPGWTTSQNTWYDAFSGGGALVSVNDSLTPIMNFSPLQGRYSAILFGGAFVPSTSISQMGLVPANAHSIQMDISLLIPSAPFTVSLGGQLITMVPLQVFPNYTVYGGDVSPFAGMIENLTITQFAPAPPNVPPAALELDDIIFSPQIVPE\n>SRR5437773_11503562\nSRWRVKARRFTRATAQRVTNPALNLQTRWLLSPRLGLIRSGCIRGRKMPRPRQTGASRNWASIVHQWRRPRIHTDTSRLHWMESGSARLTLHNGSVPTLHDLLNPPNERPQTFHRGYDVFDPVKIGFKEPPPQPTGPNGTLTQPYFFAIPEKKETAIKVTPTAPSYPARTKRNCWNIX\n>ERR1712178_671869\nSVKTIRVEIRVNENKCLLNLRSIMLQRKVLIIKLSTPDRFTTGSVTSCEITTLNHKIFNNSMKLTAFITKTFSTGGEFAKVFYGFWDSFSKETNFDCTSGFPSDSDVKEHFVSNNW\n>SRR5258708_11690673\nGVPRRPQRDVDVLGSRIGVGEESLDGLIGCAEQRPARDSRVPFRAPLFLQRRLDARGVGGVTREVEADVDGAPDGRRLPTLDLAPVVQHAAEAPELIWSDVRNVPAIGVTGDEEEGASFAHPTKPDRKAVLHGTWQARRVLRGEVLAAEGGALLGEQAADDLRGLVEHVEPYADLRKRVPERAGLGF\n>ERR1017187_4658610\nLFRSDVPAVHKGATQPGKWIARPTKKRPLRLGGPLLPGRQAENFQLPAIAVAIPVPVTVVITITVAISVAIEISAPVVPIEIAAHKAVPIAVADKVPAARNPIAAVHVSGAPGVTRSRGRWNVGKRCVHVNSKLGSLSRDACQPRCASQYRCSQHPVLHTSHNASVPAGPWFKISVTIDRPGSVPVX\n>SRR5690554_4605005\nALSLTMKNGFNFGSHQAEVQGGSWGRRVVTVESGGNDGTWGYYLNATGFEEDGWRDLSDSDALNVYGSLSWRAGDTSALNLNLQHGDSELRGNGASPVGLLATRRAAIFTAPDITENDMRMVSLDGSHFITPSIQLAGSAF\n>SRR6201996_3122915\nPFDWERSVASGCKFSRGPICSKIAPIEPYSLSQSVSRRVLLLDPPLLRFSHCVLCLLPDLLELLQPAGYLGHRAVRCFPISAGVSSHQKIKRGLPCCGVLPIVMREFCQWEVLRPIVLLIVYEKPEIGFEPLIGPFRLSVRSRVVGRRNVLPYLQEATQLRCKFX\n>SRR5438477_5602888\nRCGPDCRRGDPHPRQRGRTPGLPPAGHGRDPDRDPRPAAPGPARDRARRGGRVPVRHHAPEGHDQKEERQGEEREERHDAQERRARARSRKRARGHRRGGDRAGHARPGRHAVHGGRQGPRGLGGAARTGRMAAATARSAAANVRGRGPAARRGRPAQADHRRRRPAPDQPAAARRQRCRSDALGRSGRRGDGLGRAPDGSAGPARGHVHRPERPPARAGVLSVGSPHLRGPAHGAWPGRDRSLRSGRDRRRRAAPSGRNDPARPPGTLAVGQADGGRLGVGGGSAREAPGGVGVVHVAHRSARDRAGRVAARAARRRHRLLPARFPDRDGARQGRGVGLLDAHGVAAPRQLPGRVRGCGRRRGARGPGGRRRHRRPRGPDVRAGLDLAERGLVDGDGAAALAGRAGRPRAPAQKPRRRLPRRARALSDARAGRGDRAQAGPALLDLPADAVSGRPLPRSRLDALVPSLLTGQALVSLVPATGDHVWAAGAAWDVARAAATTDRRVALVDLWLERPTLHEVVGLSPAEGIVDAFEYDVSLTKAAHEIDRVFFIAAGTVTAHAGDLFANPRWRKLHGGFRSEDALLLLYLSAGALARLSTVPDGLIVLSADGYEPESSIGQGITAAMERGIPLLGVVRERWTPLATPAPDPRAMAPPPGRISAAVRPGLRGGGVSHRRTRPVVIAATLVA
GTAGGWALLARGAEHRAPNAAVRAAPTPTATSAPAPAAPAPSQPRVDSLAWTVQLAAYARLDRALALADRLTADGITPFVTPVTLGPRRGGTVWYRVLAGGYRTRDSAVSVRATLWNRRLAQRGQGDVLRAPYSYAVSGTTTPDELRARGIPALARDGAGRLLVGALETPEQGGVLEARLKRAGVRAKLVTRMGATPX\n>ERR1719231_1158533\nHLVPYAARLNPTMVICFFPNIFMNSKNEPGGELNQDSSFFSSPSSEAVASCTSSAPLDMPKRAQMFSSTHGASASAMPIRNGTANRASVRKPRDHADTLPASSTFDMSGTCPLVARNANAASGTDTTQKSSSNSPYEMPPAMPYFLICAVISLTLSIASSPFSASSAIISSGAERGAGAGSPGSTTLRATKRCGATVDGTKAAAGMMSSSARASIV\n>SRR3954468_1616850\nAGSAVLHVGRDARASAGHETRRARARAVLAGGAGAAGLTAGSAILTVGLNVDAGAVALVLIATALRVHRPATAFGAAGEQDQRREKSRGQRRQGRLAFVHDRLLRGKLPRLKKERAAASAPAGGLEGRRHAYHNSRLGALLETYGVIARNGVPRX\n>SRR6516225_4192873\nTSASVTSTSWPLGVTPPSGIDAVLAGALSATVADNTGSGSGLIVFTFGAGDALDFLAAGEKLTITYDVTVTDNNGASSTQLVTITVIGTNDAPVITSSAQTGAVTEHTNVDNSGNLNAAGAITFSDLDLTDTHTVSFTPDGNNYLGTFKPTLTQDATGGSTGVVGWTFSVSEKTVEFLAAGQTLTQTYTVQVADNNGGFTTQDVTITITGTNEAPVITSGVQSGLVTEIADGAPGENTAPHSLNGAVTFTDVNLSDIEASSISNTQVVATLANGYTLSAAQRSALVNAFTIDAATHSTTDGTGSIGWHYNINDSALDFLGKNDQVVLTFTVQVADGNGGFASQDVKITVLGAEDAPVITSGVQSGLVTEIADGAPGENTAPHSLSGAVTFTDVDLSDIEASSISNTQVVATLANGYTLTAAQRSALVNAFTIDAATHSTTDGTGSIGWHYNINDSALDFLGKNDQVVLTFTVQVADGNGGFASQDVTITVHGAEDAPVITSGVQSGSVAHGTTTTHSLSGAVTFTDVDLSDIETSAISNTQVVATLANGATLSAAQQSALVNAFTIDAATHSTTDGTGSIGWHYNINDSALAFLGQNDQVVLTFTVQVADGNGGLTTQDVTITIGGSNEAPVITSGPQSGSVTEIADGAPGENTAPHSLNGAVTFTDVNLSDIETSSITNTQVVATLANGYTLSAAQRSALVNAFTIDAATHSTTDGTGSIGWHYNINDSALDFLGKNDQVVLTFTVQVADGNGGFASQDVKITVHGAEDAPTITAGSTTATGSFSESTGVTGSTALDSASGNIVFADVDLSDAHTVSQAAPTFSWSGGTLSASQIAALTSASTLTLTRTADSTGTGSGSVAWSYSAQDQTFDFLAAGQLLTITYQVTINDGNGGAAVQNVAVTVTGTDDAPVLSVAGTALYTQNGPPVTLLSAATVSDVDNQTMQSAIVSISSGFLTGDMLAFTNTSSTTYGNIVANYNAATGVLTLASAGATATLAQWQAALDAVQYSSTSSDPTNFGNDPGRTISWVVNDGTLASAPLQTTTLNIKASTLTIPAGSTTTLNGGTLQASVIDVEGTVIGFGTIIANVLTNNGTITSKSAHTLTIEITSGIQGTGLLEITNNTTLALDGPVGSGQTVQFDIGNGPAPILILNDPSDFQGKITGFQGSDQIDFVNIDPARIHYLNGILTITGTTNAITFVGSPNLKFASDNHGGTLIIDPPLSTTTAAVTTTAAATTTADAAVTPVAKTSTLTATKTTSSQTKATSATETASSRTNATLAAVDEASVVALSTAVAVAVALDTAVADPGKMSSLTISGDGTAVDITGTGSGLDSSTVNSSAALGFSSISHEMAGAPADKAVEV
SNGKPQTADTVSETGAFKIDAAATPQLDGSDAVDALVITAGTNADAINVPGDHATKTAWHVSDDGRGGKTVHESPVSATSEEASAQSTSADHHVIVGGPLTETLSGNGDHSASPFKPNADHDATVDPGINLDSIPKNHLLQHPADNLIHIPAQPDHGADPAHPHVDGNQSANVKFADDGSAPSGALPSDPSALTALPSDPSEAHGPAARALAPGDDTPVQPTPADNGHHWGTDPEMKFASIPQNNPPEHPADNSLHAPAQQDAPAATDGTHPLRGQVDASESASPNFAANGSPQSAHATGEDTSVPVALLDNGHHGDADPKNNDIAKDPPPQHPADNSSHMQHDDGTIAATDGAHPGLGQVDGSESASPNFADNGSPQSAHATGEDTSVPAALADNGHHGDADPKNNDIAKDLPPQHPADNSSHMQHDDDGSSAASDGTHPGRGQVDGSESASPNFADNGSPQSAHATGESLSVPSTPADNGHRPITDPDINLASIAPNQPPEHPADHLPPTPAQPDDGPHPADPSVDVNEVSSFKFADNGSDHGTGPDGAHPADPQVDRNQLKLADDGSDHGTGPDGAHPAHPQVDGNQSDSFKFADSADHPGTVTNDPTAVTAPSSDSTGTHGPAAPTLAKTDVPDAGLSAAPDQFVFVDNTGHGPVTDHKTDVVEIDHTVPADIQHLLDTAHETNAVSALDPNHATASQDMTKVPPHHQGDFHFAX\n>SRR5271156_26155\nRCLPVGNFRSNRGVEHTMSSPYTFVPIWSIWRELPSPLKLFCLVLVIVCIRTLISALTTLVGLRAFPTSRKAADESRVHPCLATLCLRVENMRQLLSATVYLFVFIFCWILPWVMVTLDNSKTPGGILVMRHFFIDIAFAANVFLAFLVLHSVQWFVSSRVNTINLSAKTSPAG\n>SRR5580698_4360037\nDHLHHLTACRLSLNLTFGLGHGARLVGPATSLAQLLQPCERGCLGRRRRRGWRARLRFGDSPIGLLLIPGGVALSLRDQAGLIGPAARARELGRSLSSGVCPLLSRRDTRRRRGRGARLCVRARGPAERYARDNHTYFGNSVHRKHGVLSSSSSPFVAGFVLTVRCWS\n>SRR5947208_1864857\nSSWSQFGPRLASLGATRANAAPGMARATPPAAPMRNCRRLGSDGVFWGGVGGMCGVPDMSLATPSRPAIELTVVDSGRRERGASPGSQPTPTSGGAGATVAERRPLRNHRGRGGAVFYINSEYLSNRGPGSDGRX\n>SRR3989344_4462318\nXMDFRTRRTENIYNRIHCMKNTLTISIATLVGVLLSDTRHIVAQSVTPVPNMIWINSGTFVMGSPLNEEGHTIYEEQQTRVTLTYGFYMNKFEATQQEYLDLTCLNPSTTTNLDAPVTKTSWNGAVNYCFLLTERERSAGRIPSNWEYRLPTDAEWEYCCRAGTTTRYSFGDDPTYTLINQYEWYIGNTGTNGLFPRSVGIKLPNRWGLYDMQGNVSEYALDWFIDNPFRGSLPGGSLVDSHGPTTGDWRVFRGGSFFEGVSSCRAAVRGGISPTSTSGLIGFRVVLAPATPEWRQVIETQLERPKYSSGPVKEVGKSKLVLVTHGWIPSWDIPQLSTAWVDEMTNSIDRYLTDKGLDGWQVVGYKWIEGAHPLDLLSIAFPTRAAQTALENAKREGRKLGEYLAGQGWSEIHFIAHSAGSGLIQAATEAIKDISPSTIVHVTFLDPFVGLDYSGVSSYGNRADWAENYYSRDLDTGGENWPFTQGLFDYCYNIEVTWVDDNKILGPVYISTPLGTQRCTQTVSSHGWPIQFYQNTIPPNTQLGSAGFGFPLSRAGGNWDYAISNYMVSSNALWVLGTPDDPQCNQLYTSTPPMIGERVDFSNSPIEKSSTGEVKIHGIDSFSLITGSPVWLAAVINPTNSVNLVSFDAKFVNANGSEGLLSLYWDTNSIGSVDEPAIQLGFKRYAFMFPRAASNTLHILGFRLDAFTNVPSSV
LVTNVSLVSMGVSEPFTLSFAGVYTNMLPIFALTGPTGVVYTIETSSNLVDWTTSVVLVNNSGKVRFSDLASTNALQRFYRAVAPX\n>SRR5262245_14032018\nXMSEDIDTAPPAALPPRNCTTCGKPATVAYTWEWGESGMACPEHAATLQQNAGNLNRTVTVVPLPAQGPTPLTRDERIKYNATILALEAEIEDLKSRGLELVRSNEDLAKQAQLFSMREREKTAYLEDAQAEVKQLSARLEEVETELADAVTEVERLRSIVKFTPGAQPPQQPPAGPTVVDGPRX\n>SRR5260370_42043382\nRSGGFPELTIHQTGHGLGLGVHAAPRVLIGNEQRCANPSVIILDEPSRGVDIGARRRIHDFVVEAAAGGAAVLLISSELEEVMGLSHRSYLMSEGRILGEIDPRKTSVADVLFPLFNVVGARAVAASLSRAAAPASX\n>SRR5690242_10536872\nSVAPSPMSPLPVDPQTGGLRSMDTALVTSTQPLATGPSLAGSTVFHDASGRIGYISDSAFPTLKSAWTYDIRGRLATTKLLQPQSSLASLTPITDHHMPTAFRDLRDTGSLSVTDVGHLGVPAALATEPAKWIVNDGPAHEITSKTLFLDGHVVTPTMQLGVVPPPNQIPATFNFTFEGGRRTSDGVWNTSFDEFGRLMRLENADRVIDYVYDPRGRLIGRTASQKTSSGNVLETRSEVLNRDGLPAETTFVWDPVVDRLVAMYEAGKSTQPNATA\n>ERR1719203_2165260\nDRTIDKFDQSIRVSNIALSASNAQIRIVSLVPITLQKATAMMASTAIRCPSRSPSQSSSASECKGSLLSLCRLLGRLGLLLGALPSVANVPAAPLEVLLHQLPLVFLGAPHVVVGHLRHAHQLALLGFVQVRHRRLGEVAVARHLALGLLLRHQVGDHLLPVVAVFAPAPCP\n>SRR5690349_23072571\nYFFFFFFSSRRRHTRSLRDWSSDVCSSDLLGIPTLPTGGISVALLIAFVWIVAFALPVCLWMLAFWCRPAHTFVLVIAVAALLRSEERRVGKECRSRWAPDDVRTKGVALLD\n>SRR5262252_5786708\nIRTAARDQQEHMPTGVQIIATRRKSPAHDLSSIVNIVGFYKLQTRIRRNHSVQVDDGPIVPEDYSKGIGVAIERITDDLMLRINRSREAGAISGRIQIRDTPVLPQCGVKLPIAGIGATDRLPIVVKPERHG\n>A0A0N1ILD7_LEPSE\nMSKYFEPDTTFGKDAECAVCCCLWTNPVEVNNCQHIFCRECVANLDLCPVCCGPVDHLNTPGKFILRLLDLTRGKCSACAWRGTYKDFISKHAKCLKEGEVMRSREDTNATAPEAEPMHEYYLEEGWPAAHSLARLAAASPTLTSTNSATQNAPQPAPAIAADNPEKRDLSHVSNAAREVSAEPTHAQRARWQQTLTSTARDFGMPEGEFKELVRRFPDFASLVTDRSSRLELRWRDACRLLRFMNYPSHPDDVKNLFEMAERSPKTDSISFNTLCLWLMMNRRSPAQWYQMSDAPYRQILQVAQLLDVEATGLFTVEQCRILAEQYFERDVEDSEWSQITPLLRSKDAGIRQSFIPSNRCHPDPLEDFTQSAVKLPLHDALCSFARHVNELKSLKLQSPVQQRQADFVHRIKKIVGYYEPDALPQLETTLQKFNGEEESLLMTLTAMYGPEPM\n>ERR1700733_3340046\nVVGANTSTGGSNPPLSASKPFRIPANASNPRHDRYLRLQNEGPRAFSYYVCARVSAPAIASTARFSYSCEWAMLRSDMEFRVIWEIDIHADSPKQAVEAAREVQLSTDMPATVFEVWDHARQKMHRIDLATVTGRLENGEVASLRAAFRQLQCAPDLGAGVRDFLSVMLIFLDADGGYWRRRX\n>SRR5262245_2448521\nXMNSRSRANSARRVAFLIIRLILLTTVLVRFPVQAQTDAAARFAQRLQEARQVD
AAAQDDVGVMYAEADGVKRNYSKAVFWLKRSAAQGNVLGACNLALHYARGEGVRKNPILAMKWTFVSHSLDGLKCFPDDLLQFFKPRRSAVRKAWSLANAFLRSHPDLKNEFGERPWLKSGTQPNKSLDRSPDVSGFARLECLVRX\n>ERR1711873_241630\nPELTDSEGEEDSEDETEDDMLVEYRPSGNIASGISRSPKPDGYHLSERLLTSKTTIKNKSTSNTDADSSDEDTEKPQMNKEINKNRLHRKRLTYPCHPPGRYSPMIEDQQHTETSKEIGSITVKEEEVSNTDLSSSLTWGKDQEVSWLSGTSIRLELT\n>ERR1039458_8309614\nRKTSRPDRPLQQTLDYVEPQTWVPQVSPLRPGTAANQSKVRAAIAKPESMYPEATMLNSTRPAGSGESSVLSTGHSNSGFALAAISNGHLYNLRNSRRYRERRLNYTKTRPTTVSISERRKPDPRGQPGYLRIDTDQGDSPTAKGVYHINAVDEVTQWQLPPHGRRPVRGDPGAX\n>SRR4030042_4963036\nYTPSDCSTPGVIPFPSPLYVVLPVLLLAGFQLLKPKLRSSLSFVLLLCLFFFFNMSSSLRLVEASRDRHLRIVGLTSAMEETGRRYWLGEYWRCWLLTAVSKEKLIVDSYTTESSLPYSLAYWNQAESDNYVFVSPSDRERPAYYARFGRWLETIGVRSEKKEGGTFRLVYDLEPRVFQRVLFMDPPGQIPRLDLEMIEPRQGYLPLLFPNPAPGKSDLGFWLTVEIPGFSGRKELFSLNQPEVRVKIPHPSEASFSIRYFIDYIGVRIPASERKVHGSLPPDAVLVRSDPVVLLRGIPPEAPLRKAGRMICEKESWLELNRMSPGASRLRLILNSPFKFRSWLWYGKYVQQVDIAVNGTSLGKRTLDDGRNVLDVQVAKDILKPGPNLVCLRFRYHGWFPTRSPWPFSAFLERVKL\n>SRR3954469_24847718\nVACSAQAPEWTSVLGSRPQEALKRFGRALLGAVAGLRAALGLGVMVGQEGARSVAPRAADRGRRAAQVGDQRPRPPAHGAGHGVVDVGCLLVGAPGDGERSGTGPAATSPTGPVRRPGASLASRPCSMSPPPPLPPPPRPARRRX\n>SRR6478609_5279812\nRVGGRRGPRARRHRDQHHRRGAQREPVHQRGAHGRVAGRVRRDHRRARDREGRLRRGLPADVAESVTTARVRLNAALEALRKVDDSLGADVATRKARVTNAVTALVTDIDAFVSPRVDDVMWVDELAGEHRLQVAPLDVGLTLDRLLWDPPDRGGLEIAAAGPADPEDDPRYGLPTSVVLTSATIP\n>ERR1700736_2808299\nHTIRGAVTRARGLLAPNKLFRSRDKGKGRGFCPRPGFPRMADGTAGATRRDTRCQQTQCFMQILVQPGISGQSFATPEVGCQASEYRRIHFQETLDSARGTKHCGKETSGIVLLAGRRQPALKEPAGNLPKQLMLGWDPRFREXX\n>SRR5580700_6228722\nSRGSVNADARLAEDNVHRRVPAIAEGERTELNEMFARPSLPSRAGALHPDVHEALAGRLDAAAADGKVQSSRRGVVHSFVVVRQVRDGVVNGRVLSHADVLAAGGLELGQDGDAGAARVLQEHPPACKERLGVGLTGDHVYE\n>ERR1051326_2460312\nVLEFVFRRLFACAAFRGLWFLTRCASRGNSLGLGGFEAGEPPLCGAWRAKADDGQVGVFRLSKEQRIFSAAPFIELERPHEQGIAAEEGAAPGFAVAIPEFRVPGGAPDRSPDRTPQNERQGVIQPDEGISALPDHLADHIAIDDPAIPADCPSDTLAQDIRWRGCPVWPPMEGVHLYMGEH\n>SRR6185437_12123836\nPHSPTDRARRGKSNAAATARRPSGYAAPASRACTAPPSPLPRQIAQKVVVAPSRCLGSESRAKFLRSPPPVPSCAPSRVVSPPARRRCFRHRELHD
ALTQRTEIESHRRRGLRQQAQWCHPRQCVRLETEKFTAVRHTEVDARVAVKLERAECSQRQPLNFRRLACRELGRELLARHARRVFALVIVDLVTRENFAHRQRLVAEHAHRQFSSRNKSLDHYLIIVLQRLGHRRREISSSTNQRKTNSRPLLRRLHDHRPAQLLLDLLGLWTRTGRLANEQPVRRGHAGRPKQHLXX\n>A0A1F8KNI6_9CHLR\nMLTNVLGDYLDSISERNFDFPFMALLRAQGFYDIHFTHGQVEFGKDFIAKQSLNGNIFQYSFQLKAGNINQATWRNDIQGQMLEAVISRLSHPCFDHTVPHQNVLVITGRLIGNASLGMEDLNRTIVDKYRSRRIQLWDREKLIDMLVSAGLEEFYSTTSSGHMGYGDFHILYGKSLKGYISEKDIENHSKNWLDDLVISKNRVLGAILESEIITQNCRRNGFFYESIHSQLSALRVILFEINNVQDPSDDIFLNKILSSAVINLARDCFEYTTHVQKSWEESGHDLVKIIPGTGKIFTYLVNCARILEIAGLAFFLVQSPDEKQVLCKFISNFILSEQGCSHIPSDRYAVSIVFPVLALKKCERNEVALEFLHRLTIWLCDRYEQGNGIAGIGKSPLEEISILLGAPFSFIATMKRNDNYLATVLSDLAAFFEDDIFYSKVINDIRAVKIFPTYWQISDNNDLFIIEGRSIISYPNIEYLDHLKRFNDYDFAQHIIHEERTYGLSQKVSPVSIMTLMLLLRDRYFPTLWNLLIE\n>SRR4051794_33743283\nARSGWPGLADLRERRSRRRRASCRDAARAVKRRCRLVDREGSAGGGGKPLARGVACVVDAAVQVRADRDVRQRTCRGDRRRRGARRERERRDRGQESNYDHGERPSVAFERATELFHLPRQSPPNRERLRVSGIAAPACREPQGHQLVRRKPRQKSSPKRASRPSKGGLPRRRSRSNGPKCEGAARDTRPPSSFQGPAGPLQLSPCLAPTYAVCCEVTQPYVMCVGPCRVRPWSVQTSAALPPLSIAIEIESARSRLPSFTVQKIPFVQIPPTCMTELDADVWLNFGTASYPSVVCANVVYHGDCSGSLGVX\n>A0A1T5DHB0_9SPHN\nMARPYRNGINRSAGANGASAALRVRGTMAAAVIIIIIALTFSAAMLTGVMLIAWRSFGRPRHALLWAAAFAVATVEWIANLAFRIAHAQDNAAIYAAIAGLSCLSNALIAAGFVQRSRPQTGPGPFLIAAAGAALLIAGAAIVVPHDGVRDATGLLFGGAMMAISAAHVGRGFRSASLPERSVTLMLMLFAMLDGAMAVIALRQGIAGQGEAFALFRTILVLLYPPAFIGVGLFSVFLVAADLAETMRTLATSDVLTGVYNRRGFEDAAERAIRNAHRQRQPLSVVVADIDGFKAINDRYGHGVGDRALRHFASRVERLVRRGDLIGRIGGEEFALLLVNTRPQDAVEVVERIRRDIAAMPVSGPDRIVMTASFGVTGLRPGDISLASLLTRADRALYRSKLDGRDRVTSAEELEEA\n>ERR1017187_5107048\nMMRRPPRSTLFPYTTLFRSVGVGGKHHRRGGARVRQGIGGARRVEIRQGRRPARCRYGGGGGAEIEIRGQAVVIADGSLVKRDAIAGGIGAAIEQAEQSPGGTVVGEVGSGGRAEHGGREGSSAAIEVVGRRRAYSNELVRGKGEVDAAANAGAGQIDDIGAGILYLDELEVLVLIRAVRGRRRGVIVDLRDAQRGKGGDIKGFGRSAPCIGVEGAGDDSGIIGQRDCAAI\n>SRR5450756_1904656\nIVTPNGPGRLSSGGDGGLGGGGGKAYRAWLDAEQPAGQRLRGTLGLGEPDACRGDVEVGEAGAAEGAACRLGHGDRKHRVLLAARGEPAKHAAAPHRDPDVAVRVHGQPIGDALDPGQVDEDPSLEGVAGRRIIVEPVSYTHL\n>SRR6267143_246127\nPPSTSTRCRRAACPSRCYSAGPSSKRASK
EPCRFRRSPGASRPASRCRWRPGKRSSTCISRTRATSRCSARCWTGSTATRSGAGCPPGSGRWNRCSRARRRKHEPRRDRPDRPGRALRGLPPVPVPGLGGEEPAAVQFRDAPPGILGGRASGAQLPPGRGPRPWRGAARGRSGALPPPRRAAVPLRTLAAGTRTGGRDPLPSRPGAVLLRPRGRWTGAAGRVHRALLGRARARFAPRLRAAAQPRRARSLCLPRGGAPPRAGLGAPAPGSARRRVRLAPGASGRGGRGRCGLPQPRVLAGPGGRAGNPRHHARLAHHPLRLPGGRPREPRRPLRRGRDRRDPVAPDPHPDRRREGGGPRDRSPRAGLARSDGSALPGRSDEAPRSAARAARGAPPGSARAHPTPAGRGRLRPGARGEGGHRGGRRARRPGPAAPGGHRRRRSGPRPRRLRPPLLLPRRRGGAAAMKRILVAGVGNIFLGDDGFGVEVSRRLAGRPLPDGVRVVDFGIRGLDLTYTLLDGWDAAILVDAAPRGGRPGTLYVLEPRLDPDAPAALEPHAMDPAKVLALVREMGGTPPLMRVVGCEPEAAGDFEVGLSPAVQAAVDSAVALVERIVAQLGAADAX\n>SRR3954471_23318179\nXMSTPPCRRAAPDALNAIRPAVGGCICGGARPAAISAAATTPWRVTLLRTGGSPAIPSFARSNRARTGSGTSRPTSITTVQNSLRPNAVPRTRPFPVRGAGCPATGPTSCVAASERSLRGYSVAVNKEKPDTADSDSGPSGADDDVVSDPAKSDGASGDWSDEGGAPPSGPADTGDHTQX\n>SRR2546422_8761933\nRCSLFVMRRHSLRGLARLCLLCFLCTHTALSYFFFFFFFNDTATTEIYPLSLHDALPIYLARHDGHASGDERLARHPGGGVLGEDRKSTRLNSSHGYISYAVFCLKKKKKTKKLTERIEHNTTDSPPAHADSCHTQHSPDX\n>SRR5258705_435907\nYTSYGKVRDLNELLPETAKAIAKVENPTLRDALAMELFGRGGVKMIQALTTIGNDMEGTGKKAKDLGVLLSTDVINAGKQTSIAFQRLSLAVQGLLLAIGTPLLSRITKMTEALVTWLAAHQHIIALRVHEVFEHINNSLNAFLAIAKYIVNNSGLV\n>ERR1719362_736321\nLKPYLANIAFFFSSGSCIWSHSLFGFTGVDLGSVFSIDLVVVFSLKYEGMLCCLLTVLLLCRFCISGTIWACFMGSMITLGFFTFGFNESSDIVLDMPEPFVVSKNFLIIDVLSSEPGTSVVFFSVMEGLLSKNEDASTLPMFFFVSAIVPGLLNSSRNFDFFESSLKGDVISGSVFVLTSVDFSSIKSRNALIPSLNATSLVFSQGLLEKSCKSSMKPFIALSLSLMLLASCSDF\n>SRR5262245_8711603\nCPPTEKRVGSSAAVRNDRPFGTSIGFVRRLLPALHNPPGRAGGPARLTRNRMTSRALITLLSWLTLLALSGLGSTHVGAQSGKPATAPAAAPAVPNRSGYLRFPDLNGSQVVFCAGGDLWITSDRGGASRRLTTHVGNEVYPKFSPDGRQV\n>SRR6478752_7265712\nFVSLVLLCFRPCSSLLWLDCCFLHCLFFFFLMIRRPPRSTLFPYTTLFRSHPVGELLADRPEVHARHSSIWVLATPASTCFITLPDAVRGRASSVSSTTVGTLYAANCAAQNSRSSSASTSAPGRTTTTALTSWPYTALSTP\n>ERR1740124_914837\nAAAKTRATEDARGRAREMSSMNVIMLEDGWAKLKTGGVKKIEDILEDMKDGVYKDKITTDEYSALYTTVYTMCTQKPPNNWSEHLYNNYCEAVKDYLSSRILPRIKEKHDEYMLRELVRRWENHKLMIRFLSHVFKYLDRFYVKRLSLPELAEVGSQAFHEIVFNAVKREVRTAILALIQREREGEMIDTKLVKDVVAIFVEMGGNRTSLEVYVVDFGEMLLSSTADFYSRCSSKWAEEDS
FPDYMCKAEDRIKQEADRVRSYLHSSTEDKLLRVCDEQLLQTPETQLLEKENSGCEALLRDNKPDDPQEPQPNSDPPKRRRSPPPLPTVAGGSGQIDVISRLLKDRILLLGTDVNDEVANVLVAQLLYLAQDDPDADITLYINSPGGSVSAGLAIYDTMKFIPCDVQTVCFGMAASMGAFLLGAGTPGKRKSLPNARIMIHQPLGGAQGQAADIEIQAKEILFIREVRCVD\n>SRR6478735_628956\nQRRSERPWNAATWLTASWCRSDRRVLSDVGSEPLVAVSAANPLRCRSPQPSLHTEPDMDLGLTDDQRAIEQMFSSFFANEAPPAVARAAEPLGFDRSLWQRLLETGAPGMGAPESAGGGGARLSDLVVVAEAFGRSIAPAPLLEHIVASRVVYDADVLSGDAIATVALRPADADVVWRIVPA\n>SRR5256885_2358642\nFGGKTCYETENSSLLVMRFKLKASGYDVDGTDQTSLGQFSGRVQQTYKHSVPRFFVPEHGTMFTLALVRFPPTATTEIQYLNAKGTLTYTDIAVFFSSRRQHTRLQGDWSSDVCSSDLDPEATAVFPRLLASERLAGDSEPAGPDLASVTRPAERSSDDELPTAIQAPPAAGAPEPTQIGRASCRERVX\n>SRR5258705_12133918\nYVIIIKSASMNCMTDRPPGITALDERIPFLLSQLGAHIAGEFQRRMSATGVAPRTYAVLMALATEDGQSQRQLSARLGIHRNTMVSVVDALEADGLVKRTAHPDDRRAFVITLTDQARSLLPDLDNAGHALENAVTAPLSAVERNTLREMLQRIATGAGLIPGVHPDLAHSVAAIAKQRLSSDETSRRKRVDQPWPNRDPMS\n>ERR1043165_342850\nGTTAGTNFLGTTDNQALDIRANNLVRLRLNTNNSIQRDNAGNARGQNAIDLQASRANTTMVASGNYSVLSGGMDNKVLGTYAVIAGGEDNIANGDDNAIGGGASNWTNGGAATVAGGGGNDASGNYSTVGGGGNNTAQNTYSTVSGGHYNNAAGIYSSISGGLENHVLGLSSTILGGQNNYIDGNFSTIAGGAHLAITSGY\n>SRR6516162_8751238\nRFVFNGGPMRRLLLGSAIAMLGMFFAAPAMANPTPATGYLELCKYSDQTAPVTGPFTFTVTDGSYSSTQTVTTGTCTSPFQVPVGTATVKEQSVPYASVTAISALPSGNLVPGSVHLGQGGSAQFTITGGDESTTTTAEFTNKEVTGYIEICKQAVPGSGLTGSFQFAISGAMGYKQNVTVPVGACSDSIQVPAGSVIAQENPGSSTYVVSITSTAGFTTLPMGWTSNPDLLNARASVPVAAGDTSAETILTFTNSPSVLKLCKAVTNSSMLGVNYPFTVNGSPISVPAALAPNATCEIVPGIFTAGTTVNIAEGVVPGTQVQSIAVTPSGREVSGSNNPAARTDSVILGSGETVVTYTNEPAPPGTLKICKIAGFGVAPGSMWSFTVAGVPGTI\n>SRR5262245_26240924\nKANPKPEGVKTPPEKEAITVPSKAKAEPAKPKPTYVTVVGQLLDDATGQPIEKAGWEWGQADPKKPEQIAWGHSRQGDGNYPGGKFAGRVNIGADGHHHTWRVYSAGYETAIVVDDLAKPYPERIERVVRLKRGRNITGVLRDHAGKPVANGWVFFIPKGHRANIVEGVPGTDAHELPGRARDDAVAEVRTNADGTFAFSTGADGALAASTDLVDLWPFPLPEDGHAVLKMPTPSYLVIDLTYWYLDELAKKGKRELSPNSEDPNQCWLAVD\n>SRR3990172_2002343\nYTLSLHDALPICRRGIQDIFYAKSFDGGLTWTDPNLRVDDDTGSAWQAFPSVAVGPPGNVFIAWGDQRNGDADIYVARLAPAPPFVEAPTVDGFAPGSAEIDHLIGNVPAFGFTYRDLDLDRLTAYNVTVLDGALAPLWTCNRTLSAPLPDGFPIFVNYNVWPCPTS
GPALADGSDYAVDLTVQDATGRWSVPERVGFHLNEVLGPTAPVQPAPGAVVPCSRSHTLSWTAPPADVEGELPVSFSYQVASDPAFTAIVASGNSTFNVTDPFTTCPGGPYHWRVRATDGWEASTWVSWNFSTFTPPNAPPSALNPAVEGYGEGSPGILRIGPDRPTFLWNYTDAEGDPQVEARVTVGTANGSNDIWDSGNLTLSGSALVYGGGTALVDGAEYWYGVRVHDGKDWSPWASVRFRVNTPPRAPLAGGGGRGGRPPHLSGLDQHHARVRVPLGLRAGLGPLRHGHGGGLHDVLLAGPGPRPARRRPEQLDVPVHHVPGPRQRDGPCHLRRAGPLRRSGDRRGVHPHVSWRRLVQPRCERHDGERRAGGLPPRPQDVPRARRDRHAPRGGPLGEPYRFLTEYLPPHP\n>SRR5262245_7034097\nYVLVTEGTTSFDTADVQVSTNNFATFTTVASRSTNLPNSSTWRSVAPVSLASFAGQTVQIRWVFDTRDGIANNFEGWYVDDVQITAPGTWNDYYSFTLGAGETATVALKNLTGSGTSLTLEDGTGATVATGLAGPTNFDRVISNFTGAPGAYFLHVSGAVAATYSAVVTRNAAFDTEANDTFLTAQPIAGGQAALGAVATSASTASTVIPNANTNVEGDFSNGFPFHISAFSLPSMRYQQIYASSQFTGGGVIDQIRFRKDVSAGTNFSTSNIDVKINLSYSATSPTAPSNIFANNVGAGVVTVFDGLLSLSSTGTGTPNPFDIVIDVANSFNYDPTQGNLLVDVFMRNSPVTTFFDAVGNSPGVTSRIFSNNTVNDTSGSSFQSGLVTRFDFVTTGAAQEDWYTVNVTNAASALRLETATPADGPNQFVNTLTPRIALFDPTGVQVASGTPLADGRNEFVQYQPLATGAYRVRLSAEAGTSGEYFLTKNFKPAVTSLSVTSPINENDVATLTGTFTDADPLDTHTVLIDWGPGEGTTTLTLAAGVTSFNSTHTYLDDNPTGTSSDNYPVSVTVTDSPGVSGSASTSVTVNNVAPSHVVLNSGNINENGTFTLTGSFADPGIQDAHTVVIAWGPGEGSSTLTLPAGVLNFTASHLYLDDNPTATDADTYPVSVTVADDDGGSGTGNTSVTVSNVAPSNVVLNSGSINENGTFTLNGSFTDPGTQDTHTVVITWGPGEGSTTLNLAAGVLSFSAAHQYLDDNPTGTASDTYPVSVTVTDDDTGVGTGTTSVTVNNAAPSNVVLNSGTINENDTFNLNGSFTDPGTQDTHTVVITWGPGEGTTTLSLAAGVLTFSAAHQYLDDNPTGTASDVYPVNVTVTDDDTGVGTGTASVTVNKLAPSAVTLSTGTINQHVTFTLTGSFADAGTLDTHHVVITWGPGEGSTTLDLPAGVLTFTASHQYLDDNPTGTPSDVIDIGVTVTDDDGGSATASTSVTVNNLAPVVTPIVAPTDPVAAGSPSPVAVSSSFTDVGTVDTHTAVWDWGDGTNTPATVTEAGGSGTVAGTHTYLAAGVYTVTLTVTDDDAGAVSVSSGYIVVYDPSAGFVTGGGWIDSPAGAYAADPGLTGRASFGFVSQYHVGTSVPDGNTQFKLHAAGFDFRSTSYDWMVIAGPKAQYKGTGTVNGIGTYKFLLTATDGQRPGGGGVDKFRIKVWDPVTGMVVYDNQMGASDTSNPVTALAGGSIQIHDNSHX\n>SRR5690349_22883871\nLYPLMSSLYSFLFVFFRLFSFTIFFFSMIRRPPMSTLFPYTTLFRSDARSAGSRSRHRPSRRRSRRSARASTPPARRRTRRRPRSEEHTSELQSRREIVCRLLLEKKKRPHLVCLLLLEKKKNTAQNTQ\n>ERR1700731_2171409\nLQDPTGAVASRGCGKVDLGVVDTVEDVGEDGGRESQADLDQLRVAIARSLDRGEILVADGATGLCELADEADQRVALGAAGGLTLADLPEHFRLRPGELGEMVVGGDAIVAAAGGADDELDHFLIALGQRARSENRTGGE
DRLEGGRAVGCNGSECFRDAADGLLIPDDQQLLRTFNSPWRKNRATLVRAIKVSGAAICRGRTCARCAPNITRRIAARVLVQRAFTTQFEYSDRCFRPTRAFQSLKPCLSANSTMRRARWEPQVSASKLACRSCRRRSRTRSTMRLANAYGRSADRTGKAPTKAVLAQRYRPFICPRRFLFPF\n>SRR5688572_8862321\nERKLRWDNQQRRLPAGETGQPLAHADGHGKVLSVERVELGLVVEQFQMRRPAGLEEVDDALGLGREVGRLERSGRGRRAAGSRENGWVDQRGHRQRAQAQARARQQLTAGNEASLFQEFVHMLSRYFVITSSRFSSMLATVVYAASSVASSFSSRGDSPIERSFAAVSGFALYAANRRSKVSRSTFSSSADGACAVARRNANVIRSSAAVPPSCIIRSAS\n>SRR3546814_633682\nIDHDILYFLFFKQKTAYEMRISDWSSDVCSSDLIGKFGGEPIVDRENDGARGGSERAHRAVLAARRPHDITAAMNVEDGTPRPVRNIKQPAYRAAFAEGYGARLDAIRMAQGNFAAGHQTAEMRQIVEGKIVEIGNRRQGADQLRIDRRQCAGSRFIHLLSLPIAGLSAKQARRSVGPCGNKIGRAX\n>SRR6185369_2348986\nLVGITPPALPTLPQTSAHTTASVEPPDGTSQSARATLVGIADSATPSGPAPIGQRPTPTLNPVIEQARGTLLYFALQNNSYDLYTLNLNTRAEQQLTFNVGGDSYGIYSPDGKQIAFESDRDGDFDIYVMDADGQNLRRLTQNVVTDRLPSWSPDGQWIVFSSDVRGDTNYDLYEIHPDGTGIQLVFSDGERSSHASWSPDGRSLIFTHGNNLDGSTW\n>SRR5262245_26026989\nEPDLWPGKNDGSDFAGSAQYTIAIAIRTTPRMIAAAARRRLLLTRKKSRGPLGGGRVRGVRELAEFARDQVGRLLADVDRAVADPLDRACDDHHPQPPLAKAGLGHDVDEALDEPAVRPVDELVEIDEALGTMPLAPAERVERNADHLLRAVTHLRQDVDERRVRLGAGDELRELRNRDAPVCRPLEQQIDVEDREEEPQVACDRSLQRQXX\n>SRR5687767_9486488\nDEVSRMRVSTCLGFAVTLFVTGCDKAVGNASVTRTLDSLTTIVDSLNTRLGALEWDKLISGVEGVAVLRPSDAGYDRLATDFGSITVSLEDVVPYANGSRITLKFGNVTSATINDAAANIQWGSVDSA\n>SRR3954452_6150108\nPGHVPRQQEMRAEDLENPCKQVDFCRTAELPERAEEQREVRAVLVVAAVRDRPGVEVCGGLVVVTARRVVRQTQHPEQERADQCDRQPDGEPVAPPAGEQRGIERKRAPGTQPGAHPQPTARAAAAAASATCSTSASVSSGYMGSETTVRASSSAPASDRP\n>SRR3954453_16503950\nDRRRHVPAARRQTAVGVCVNWSRRWASRWRSTTWTVVTAVTLAQAAAWRGLAGQLVGGCASGLDARFDRTTVFTVDRVGRSAVDAGRDLTIDAPAVNQRGRRIERIHRFDRGRWRQRRQWLDHRRGQRLDGRRW\n>SRR3546814_3464296\nMSFLQYVVLLVISFFFFLRNRRPPRSTRTDTLVPYTTLFLSDRRRPGGCACRGRPHAPAGARPARPGQGAAAGVHARRHLLRRLPVAPEGPRRHRDSQWRGQPRRQQRRSEEHTSELQSLMRISYAVFCLKKKQHKKIDKSTSKTPNTQQK\n>ERR1017187_7010674\nPYTTLFRSSELRNSGRSFWDVRRATGGIHLFPCHFRLAGLDKSYQNSAATMLGGPVLPLMISVESTMAILFPSQPLGATASSFLIWLGSVRNSPAIRVPKQVIPAAVTTICSVFGSLSRRTIAX\n>SRR6266545_5506238\nRLSAALPPAACAGPRCRGGRAAGRGRSTRPGAACRSSRSAEDRDPVHGVRR
AAHARVVAERRRPRDHRPRRSRHHPPVPAALPARDRRGAAAFVRHALSLHRHAAVERRGLNVRSLSRVVAATLAGVVIGLVVGYIPSLLAYGLVAGATQNTISRTGGWAEAGAVGGVVWLASAGLIVGFLQQRVLPPTARSIWWVVALAAVWAAAHVINMALRGLAGDVDLAAILPALVVISLVAGVAALRLATRVTRXX\n>ERR1041385_9034566\nRSDLGFLTDRRDDVRRDVPAEISRRDAQERDGALGAFLANPFLRRSTDRLQGREVGCIHEQDASVAPTVNYHLVQQGKIRRQYILLEAVAVDALLLIHVTIPARQEDRDSRFFGRGQSWSNRLCVSPLRDDEVVLLTDRANDPIS\n>ERR1719323_877409\nFTSTREWLVIMQNPNEDTEWNDVLRKKGIIPEKPKEAEVNEEDLVRMLEETIREKSGVKRTEDMDLDELDELEDEEEEKILLQMRNRRMAEIKARMEKSKYGGHGPGRAGRARGRGGGEDLAPDEEPEDGRDQGQNGKIKIWRRKRDYCSRLCSGSEQGRRRCVCDPALVQAGRAPLRPGQRVHEQAGAQVPHHQVHQGHLDHMHPQLPRQELAHDLRLPRGRLEVPDHRTRADARNELDRERVX\n>ERR550517_2316039\nSEASLEGTAMEEETTTVTDAVVAGGEGGDGRMEEVDEAMEEEAVDEAMVEETATVVEAVEAKTANPSQNSLAPRSTNSGAQAKLQVSAQKGSPSTMLQRPKTAVQICPQTELSVGAKAAMPKCASTAVX\n>SRR5689334_23514466\nHLRPCTVLIMRVPCFYLFFFKDAATTEIYTLSLHDALPICADHVDADVRGTPVGRVGRILFRTDERGRVPGVAGPPFLDDPSDADRKSTRLNSSHSSISYAVFCLKKKRTRPEDRTEPSLRAF\n>SRR6266436_2860317\nSPRCSKRGVMLIESSFMILFKALWLDNPKSKRSPGTLLSVKRIANNWRRNCNRVFHPQNLPVQLSSELLAVGVAFAQVIEMHRRLNGALAAQVDEMRHERHVLPVTNLLAHIAVAEFVSEKTRRQRMSLPRGGFXX\n>SRR5271166_360653\nCDARDVEFQIAERRDRDVADGEGKIERPEVVGVADIDVGDSIGKSDVNVPFDGDLYRDRDVHVLQQGMRRVEGEADVAERETAHRDRPDAQLTDRNRLQACLLYRELRDLELHDPCPPLGNELIAMSTELQNARAARPRASFLPVRRKYSLETDQRQLRREPIALSRRANGASAARSMVEEPLPPRLTRSAFAIAPLPARGX\n>SRR5438128_8400954\nIAGARSDWSRSGVAVRRGRRAARRVDGVGFPAPAQRRKRGPTGSPSDRGARSPGSVAVQSLAGTFQVFNSENRHPVRFGRGVARRGALAHPTLLRRRPMLPAVISVRAGKPASASRPSRASARVGLGIVLVALLTLSTASIVSAHAFLASTTPRAGERLLGSPSEVVLQFSEPVSVESGGVVVHTAQGAAIPLGPSESNGRSQLRIPLPPLAPAVYSVSWSVVASDGHQSAGEFAFGVGTEAIEASTAVTSDAPIAWPAAAAGAMLLVGFALGAGGLLSELAV\n>SRR5262249_6274811\nLFALAAQPDWPMAQVWREPLKSTLRRRSWGGDLDGPQESVQHVNGRVPFAGTSDDLRGRIAFRFDRRGDRLCALRGACNQKPARGLRVGQEMALPVRASRWKLDAILVAFPIAMRSAGDEALLRQLRSLVEQRDVPQIDCQPQSGAARHLQCMAEQAKARHVGX\n>ERR1700710_2726627\nCVTTRSRRTRRSGRDFPATSAGVPATRASSTRCTAPLRPQKRGKSGVLGCVPQCALGLQVFVEPVLAPLATVSAALVAAERGVEVERVVDRHLAGADPARQSTRSVQIGGX\n>SRR5438105_150411\nAADRSHGERRGRHEAHVVPALLVRRHAHPRRPATQ
VERGAHAAAPDLGLALLAGKAQARRAAARFVEAVHVHVLVGDPHRGPDAQAPEAEIVAPHELGRCVRAAGLRGGGARYLPQAERAADIVEVEVRVRHYAGAIEPAPLHGAEERPGVLAGAEASRFPTEAGVELAAPIGDAQGRALRYAHREAHGGGGDVAADAGIAGA\n>SRR5919112_1724051\nRGARRAALRDQGPHRARARHTALLQQDHHLPGSTELGRPRGSLPLARAREVLPYAFERAFQGADPRAQAATPDHGHPHHEQPGQPQRPFLRVQAGRGDGGSGVRDRPCLHGGARDLLYALPVGCYRGPGQYVRGEGADQDDARRPQTRRACDPLAAPLPPRAAPRRGDDLALLRGCCRTLRAHPWDPARRRPRSGGERGPPPYRGERTTGRGGAGREPRPAVLRTGRFRRGQLHGRVPRDDSGLILHPRRQAQAPLAATPYPGSPPRQSLAHARALGPARRHLQPAGRPRRRDTKRYSGRQTRQRTHRGMGRSQQGARRPHPAGSRRHKLERYLRPLHPLGRAAGDPKPHHDAGGPARGGGCAKWLKPRCELSDISYLFLLMADSAIWGGSMTLPKSLERLSVGGGALYVLAGAAGYFPGLLVAHVADAFGGDADYEAPGWELAGLGDDGAGGDDGTRADLRAVEDGCAHADETVVLDLAPVHDGVVADDASFADDRRVAWVRVQDAAVLDVGSGPDADRLCVTAQHGPVPNARFFVQVDVPDDVGSRRDPGGLCDPGEGVAVGKHVALFVQIQRGALTLYSRYTSPNFRSRX\n>SRR5258708_1650640\nPMKSRAPVMHDRCCDGARRARRSAMKRGASSGGSGGGVATLLAVVVGAAIVAGAGAARADVVLEGLPTVSVGYTDNAALAPTPVVAPGLPPRSDEFGIVAGIARARLRKAHAEHSLGYRLAETFYFHGRGPSSLAQELAWLSDLSLSAPTQLRLGASVAYGRTSNPTGVDASGAGPGAQLAISSNIISLGATEELVHIVGRRSRILQNLRFAGVHYLNAPGAFDGTFVVGAFVRGEHEVGQSLFSLELDVADNIVPGAVGVSDQVLLLQSLAGWRRDLGLAWWVELKAGALGVLDFHGTEILEPAALASLNYRQIYWFATLSGSQTATANLFIGAATISDQAMLRLALPLARSERYLLAGYGGHTYARLIDDTGPHRGYTLPPAAPPF\n>SRR5205823_11678186\nFGTMALSRFVIIRKGAIKRILSRREFYRNVIAPISRIWIVQAAVVLGQSLSHELTRFGTGLLGAGFSPIQKTVVTIWLFHGKRCPGSIGFRANCPGVNAIELTSTTRSSADFWDFLLNLVLAGSVFEAVPCAX\n>SRR5690348_5794318\nGGRGGASGSGGGAVRGDANKNRRGGGRGGASAPAPSDPTSLQPFDFEKANSLFDKDKLREEDGPLVPSAEAEAAVDDEPPAYSKDSFFDSISCEALEKQDRANYNAGRVTMDEQRRRDMETFGAVSVNDRNRYRGRGGRRYHNHNNRGGGYQRNYRVCL\n>SRR5208337_1056505\nSSSPLSSANGPTAPADDPSSSSPSSAHSSASSSSSSPTSSSPSTPASPSSSSISPASSTASPAATSPSPPPTSQISPPPRTAPKAWGSSAPPSASASSSVPSSVASSENTSAFTGFPSPPPSSPPPHSPSPSSPSPNPTTPATPTPKVSAATTPPPSSTSSHAPSSACX\n>ERR1700722_2816766\nLNRITNCGLVSKSCRIWFPFQCSGVESGEEDEDDKNAKEETAAVGDGVDNRVFVELAARALEPETHDPEEKNGDEKPETPRVLVELCRVQVRDVEGQDNDRGKAACGAEGAELLDVGDVVAAASSGDAAAFAQAFELGEALNQGEGEEEEDAEASEPGGDLDSSGGGAGDDTDGVETRQDDNVDQDGALQTQGVSEGGEEIDAKPQKEIIRFDQGQRVRX\n>SRR5262245_51317312\nCRVFSAL
ITTKQSMMAMMAPTSISAIASPFLADAAAAAARARRRVSGCELVKRPGTPTSSLASVEAALPNDSLDPGRDESVDGTSGRESFPDRRGRHVESRDRKVFDLPSRSGWFGMLAGALDDDKRRERTGVLEPLPRRHVGDRVGPGDQEELVAVAAERLERVGGDGRLVALDLDRATIQAVDAVDRGLDERESITRRGNHEPALLPRVAGYDEEHAVERKGRARVHRGDDVPDVHRIERATEHADALRVPAHHGSVRAPVF\n>SRR5439155_7586424\nXWDAESVVDLVGHLVPVGELTARRVSRCEDGLQVGECGLSSDSSKDRVGEVIRRQLAVLVRRPARSPAVAVARPADLVRGELILTAAAFGCKARRDDDRILELARQECGGDGGAEVVVGVAARAVNHDHRAGDLLVLLVHSIRAIDQRAAGPAADRDPFRAFLLRDRARRGVSRHRRREADENTGGKDQRAFHVADDTTLTSTAWRLAPTCPCALYSIQPQDMVESX\n>SRR5262249_42789402\nGVLAVAQLDHARDAHEIDARAEIERADDRRARQDQHRELLEAVDERVRDRAAAAQVPQPERVVAVDHDATVVAALPHGDALPPAGAVFYNVPKMVTLLMFSGGLDSTAALYKLLTQDSGALRVHHVHLINREARARAERDACAAIIDWC\n>SRR5437667_1021999\nLETICLKCLEKEPGRRYATARELAEDIARFLNHEPIRARRANPVRRVWSWFIRHPWIVTGAASLVVLLTVGFAYRMWERVDALEWQHAHPKESPPFNSEYFLPVWFNFLLLFEFLFLQGVPVLSFLTLRARQQRANWFHWVFAMMGAVQLLFGLEILRRAVATQAWQPQFILGPILASIAALTNVWFGSALAWKALREARLDLPGVDLSEEPIEHPLEFTNQK\n>ERR1740121_1965673\nASWLAQERPAAAAGLAFRRARHGRTPACAEDCELRSREAVERIRQYAWQLVLQSRENISMAGKSAEWRLNNTLYERSREEQRNLQHASKQHREQALVQEREWLAAQTAHNESLRSAAEYELLSSAFSAMMKEFSKDRGLWQQLSQNATRLRQEFGDAVQDWSSAVGESSLASQTGEVLLRNSTATLYEDMRWLKEAHREVGVRLVRVGLQARPRGRVPGAAGGEPGAARAAGHADQCREAGQAGGDDYRGRGPGAGGGPLRSAQARVPSSGRARKRLFPAVSX\n>ERR1740122_63733\nTSAEPTAEADNDEPDEERQDPIFEALAILSLDGDVRGLLVAACCGARYVRRQLCRHPDADGAGFVLDAAQVHTTLELEEASVAPRVAPRVLRYPILHLTSGSLRLDTEPHEHDHVPTDDLTVVTTMLLEVHCFGVVLPEREQIDAHAEVHSQRSVGRQLCSHHVGGATSQCGLLQRQLVEGHDFDVAVGHAALLLSVCAPGPLRTRACSARIELVLNVAPSALVGHLVLPDCCCDQRVVSVGGCAAVAAPPAARDGAPHDVLNAEMSLAEHVGAIAAVIALAVLHASALPGHRGDGKRPAAAAGTLGAWLQLEAVGPLRAGVERRRHVVRNVR\n>SRR4029453_18409069\nMTMRRSDPRRLHAGRMPPLRAGLAVGETVGPRARPSGGPGSRQAPRREAHGPGVGEPAMAPRSSEVAGRLPRARRGAMAVGYTPGAGLDVQPKTGTAWRVTPAPRGPQAAGILERTAWGTITADRRALADWRAATGVTPVAMASPAASGRPVDPLREGPVAVWLVHAAHVQQGPGHQTDQAEARWWAPH\n>SRR6185503_13583503\nRLDFVARAEGWETCAVTVPRPDDVWLVSRRATAVRGRVTDAAGRPLADAQVWRVEPPNEATMTPTDSSGAFESFFTAPGAGQFRVSHPAFLEKTVAVAAPSTDVVVALEHGREVSGRVAFPDGRPLPGVPMYGENERVATTDADGRYVVTGLTEGRVDIRCGLGNDIERRFVESGTT
GVDFVVDRPVARIRFVDADGRPFRFVTPRMRVCKDGKDLW\n>SRR5579875_218622\nPSSGRFCRLPRGRLIPAEVSAEALARERRMHSIVQAQDSFHNQLILLHRFGGAGADAIGERQQHQIGQRQPVDGRYERGSDAGGHRSQIGKPAQDLEETDHGSENAEGWRKSAGDFERARAAFQLALAQADAAEQRVLQFGSLRHIQREGERFSEERTAHAFEHRLNRQQAAGARVFHQRHDLVDQFGVIQLRRNKELARPPEGLNQRGAGGGHEKGPQGSAGDDQRSGGLKEIDEPYAAGRDAGQQCGGRDGDAGQHPNIQARRRRRARHFFQGGGGGQRATPARCEAIRLPRAGGRKQRRARRRRFVTGTSLKPSCLEMTRREAIVIAFGQPLAASDTRPFWEGKKPEDWTEEERRELLSRSPWTREAEVKFNGGPGPLGGPDGWLMAQPGVILNEPNGSTTRTPKKFAATVRWESALPIRLAGGNKSGKEPANYVLSVTGDLPMLGGAGEETDEEHQSRLENLKQYTRIEKRGGPLYLADFADQRGKGTEAGTRFFFDRSDPITLHDGSVTFVTRLGPIDLKCKFALKEMVYHGRLELX\n>SRR5277367_2534031\nQITSFCEEHHIDLLSTPRSRRIRTLPSRFKDAFITISVGQRVNMNNEDQYRANLYYPLINSVLIELNDRFSFENMQMLNGISALCPDSDNFLQSEVLKPFEVQMKADLSSLFNEIQVLKSMLKDTKLKSIV\n>SRR6266568_6098953\nGVTITVSAPSSAPAGLKGVHPAWSPMQPANVKSPAALMVKWLTVLPRVEVAYSCLPSAVTATPCAQSSAPAGEVGVHPARSPMQPANVGLPVASIVKWLTAPAWSPNLVVVX\n>SRR5207244_11792182\nGARGEPLGLWWARRVAGPAGARLGGALRQGAGASLPPRHALPPLAARQGSGCLHLGERPPPAGAERPDGRRAARRRSLTCSPARHRTIVGVGVRTRSALAAPAVAALVLAASAAAGPPGQWTPISKGSPLSSDEVGVARTPDGVLHVX\n>SRR6266852_3314374\nRTTSACRRCRSRVPRQRHSYDVSDQRECGPGRDNGDIRVASRSLLVGTDRPERGALRMNHNHWDDLARENAEYYICPSETDYSTPEGRRHFFAEGQLQVNRLLEDIGQDIHSHRRALEIGCGVGRLAIPMSQHFDRLSAVDVAPRMLKALAKN\n>SRR5688572_20022461\nMIRGSLGRLSSVPEAALRQRYWWSCRSSRRNQKVATAGIRMRRWKPARSPRRGTDPATRADRTPPPCSRRGACRWSGAPGGPALCTCRAALDAFPGAAGVGGELGRFILGVSDDFIDGRHAVADQPPAILAQALHALLDGRLADVMRWSALQDQRADLIAEEHHLEDAATTMVAAPLALSAAGAPVENRRH\n>SRR5579859_288497\nLSCRKSAGDNEREERKNGAAQTTHLDGTARRTLRAGGPFGAGRRHFLRDGGGNDRAEVSLDYVFAGGLRTVERRAGATGRRGSRKRGIDPPGPTNSGEGQGEEPEYRGGDAREQAIRKRYFDGFRGEPGDGRIAWEPLRQYQPGDHRCAIERRSGSSRDRRKSHEGSGRTERGSARQSPGVVGKRPGSDHRCEAGQRLAGKDSDRX\n>SRR5688572_26030911\nSRRGDRLRAHPSPARPRHGRHHRRNRVRDALRRRGPTQASCARGRSVLGAGLRSYLRRRLPMGAPYVVREPVGGSAGHRVSDYAVVHRSWLRWTVRGWPGSEPPEMALAAQRPHRLHLLDHRRGARAGRRPRRVGALRAGRVLGDPHRPAGARRVWSTAGRRDHRLDRPPGRDQPRCGHRASSHHRRPAALRVVRGVVAGGVLGSRRRARLRGARPGKLTAAKSEAFRVDRLGRSIVIAAGGTGGHIFPGLALADALRLRAPETPVSFIGTPHGLEQAIIPKRGYPLHLIDM
KPFVRRIGPGPLIAIGSLILATGQATRLLRTHGAAAVVGMGGYASLPVLAAARRLHLPSLLHESGAIPGLSNRVAARMTRHVALAFDEAARSFPRSVRPRTVGMPLDASITDLERGSLRSDARSALDLPPDARVLLVLGGSLGAMRLNRVGVDLASRWRHRGDLRILLKTGAEHIEAVQAELHRREVSHLVRCFAFFERMDLAYAAADVALCRAGAGTVAELAASALPAILVPYPHAPRDHQTRNAAPLARAGGAVIVPDAEANGARIGAIAEELFGDEER\n>SRR5437867_1173916\nSAWADVALLHAALFGATIVSSRPIDDVEAEGVVLIKQHLKVGCARSPKVSRAPLTNEDAVGGGTGNRGENAAAAGESRAVGLCIGAQVVLICDNGLDDRLIRQGTVCAQIICIARKLQVAIGTDVCTGKTRTVKAYRKRKRNGGCAIIAMVAYVRVPGHDCVRRSRRGIVAASAGGSARERLLNGNHIWLDHWFGDALLGDPATAGLRQRKWDRADCDEQKX\n>A0A0T9YTR4_MYCTX\nMRSFCPGRSPQITVVRARSGRASVVISTRPGTSTSCSIPAAIISALARVRCMRSAPRSVRSCSTACSGLSRMADTRGSAEVSGTSSLVTSSDCTVTRTNSSIASTTYSIAATLRWASDTSRVDVTLTCLPAGERQCARRVSVPARRSRIRSWEINSPYRTSNGSSPTNRRKILPLVTSTTVWPASGYP\n>SRR5882724_3941186\nSLPSEGHAEGDEDTARGSGRERAVRDQRRLRLAVEVRRVAVFAEAILRVEEIGRDDAKLKRYPGRGGGCVDREDVVARLAVREWTWSDVRDAGAERPAQGPSEDEPWEVVKEGSVGAQDRAWHVRDGGARVVVCRADERQVRGFVEERSRTPQRAEPPRSSRADADDVAPLRLIEDEILVDNRLEDDRAGDERGVTQVAREGGAGLVSRDAGERGADVGDDVAGIDRADALAPAQRERKAAQWPRDQRSARQERSSRGRSDLVGLARAAEVLLCEAALVDGRVAGRRMRDGLRGAVVMHVIREQLGAAAPAEREPATEAQVGVAVEAD\n>SRR5258708_38243777\nHDVDRVVVGGQAADQLQPLAVRRGRELLVGDRVLAVALVAAAGDRLAGRARGIRTDVVVERNRTETTAAGTARSQSGCGEGGAGENRHALPDTVGPSPHLASNAELRLEWLPDRREDRRLWPAGRPALPRCTTSIARASSPATPTATSRTLALPNGVHR\n>SRR5262245_54597287\nGAVIASVGCAFTTVDAIDAPHVLAAKLSIESPLKETYHQYVPAAADEMPALGLQRPSPVGDAVPSVVPPEVPVEGAVAPVKYLNVSVPLVWPELLASVARIDVGRIAVPVPAVSGDVSERVGDHLPLRTCVTGMLAPQALLAAAFVPSVGIDA\n>ERR1700689_1111789\nAGCMRRHGENIDEALRRYEETRRPATAAIVQANRGFGPELPMQLVEERAPDGFANVADVITPEEIAEVTERYRTTAGVSLAALQRRTSLFEDPYPLSEHRGQGARKGIRDGGESPGTRATVWGKMRQWFHPIGMPQTEV\n>SRR5439155_12922379\nFFRRLMRLTGMGAETGSQKSVSRDALPVREQTPSLPVLPQRLDRSFTPARPLALETGAATKAMLALALANGDDFAGSLADAGSALDWRWMAAALALGVDRWAEPPARRSKQTNFSPKRK\n>ERR1711871_374509\nVQQHRDSNTESHTRAHSNITTQEQAIIDHANEQLRNNGLPNFQLSSDELNPYSQSTVSIVNGSGRQDVDVCSNNEGFQPIYDGPNLACPDGLLQFSHEIPGQNDWYCCMLPDDPMNISTDENGHKSSKFASMVASNLERLQSAPRAFKIGLGVTIIGITLSSKFRSLVSKIAT\n>ERR1711871_1877964\nKDYSVASEVTAVLSLILERAKYDDLGVSSSL
LSEVYATLALLAQACQDNLAIGETPMSFVDDNLRMTVAMTDSIDMRNKSFAVPVSTYESYAGETSASLGMSDMADSENAAGSVGLMVLQYLSNPNAVPTNSTSLLLEATKYDSSSRRRTKRRLTSITDRRFNSGLRGRSSRQKRLARNQD\n>SRR5579859_5275108\nRPVLPAELAYAAADRVQPGRGKAREKVVLDMPIQSAQDRPPTPPDDEVLARLDLKAAPGIGTFLAEIRIVVRRDLVADAAPHLKARENEISDHGRDQPCREHLFPAVAGHRREKHILISDEDRKSVVX\n>A0A257SWG7_9GAMM\nMSAGTDSRRAPRGGALFVWCGLALVLLLIPSLAPRAAGRCGADRVDAQVRVTYVYDGDTVRLADGRHLRLIGIDTPELHPDHGGPQPLAEAARDQLRALLQRHRYQLRLRFDQDRQDRYHRLLAHAFLNDGSSVERRLLDAGLGTALVVPPNLWHLTCYHDAQAVAQHARRGLWALPAYQPVAAARLPRDADGFHLLTGRVTAVRGGRRGIWLQLDGPVVLRIPRGDLIYFVGHDLPALKGQRVLAQGWLHRSFGDRSGWFMAVRHPEALEVLR\n>SRR6266542_84348\nRDRHCRNLLRFQVLRAGPHEVYGYGPRGQEISRQTRRAVSGGAHTKGVHVKIRFARGRGGSLVAGGALLALTLAVLVQSASPSGEEGATTRFAPVDISMSGDRPSSFTPAALAGSSRTLMLQLGPAPLAAHDAAAARQGRKLSQNERAAIRAEIKSKQEPLLGRIRQGGADVVGQLQSAYDGIMVRGGDLARLAALPGVVAVRPLEKFQASNERGVPFVGTPPVWASSLTGAGVKVAIIDSGIDYTHANFGGPGTRAAYLDAFAHGTEAPPPTLVGAGAPK\n>SRR6266511_5884634\nWTSAALGTLPPHATTAAVAEGVGVGVGVGVAAGFFLGLFRMRAYAAKPRPPTATAMATDAARMRWRRRRTRSRRRRSANFANCRSRVFLLLWGMVRTDEPTGWWLLRPCDRRCRRACRSQRSGP\n>SRR4051794_24959122\nXMFSSAGSAIIGSSDEAGGGPPIPRVHHVQGQPIMEAKLRLATLVAISLMPSARSLAHAARPDVVLADFEGDDYDGWTTTGDAFGRGPAHATLPGQMPVSGFHGKGWVSSFAGGDRTTGTLTSPAFAVERNFVVFLIGGGGWEGTTCVNLLVDGRVARTARGPNTQ\n>SRR5437762_3811764\nFRPRDRVKASRVNAFQLPQDGRRPRLRWRRALILGKIPAHRDFSGVAGRQHGTIEGRLALGDDIVKRDLLDRLCQQLADAIRQRAVVDEIRRLAGDPLVVQRRPLLQVGGNVIGDRKVLSEHVSPAGGKSSRRVARYGKWFPNIAPRSGTYFRCRLPKAAAMPSGLPMRSISMSMRSPPQNNSPLNTMVGTPNTPSVSASSMMRSCSARAG\n>A0A2E6AYA7_9BACT\nMNFTAIECSTNVCSIASYKSNKLLNVIDISDSYNHSTNLPIIFKSIDDDLKKIDTKVNYYAISIGPGSFTSLRISLSFLKGIVFSKNIPILPVQTHAALNVGTEKIGKHYIIIDSSKDRCFIQKFNNHTQIGTPYIEKILNLKNLDYPIYGYSKNIEKNNYIKPSSLLIGAYVTKNYKRLIKKPAKDISPIYLSENVYKKIDDT\n>SRR5258707_10299995\nFAQDDRNGVVWWEADDGIVVIGVIVVQWFVFFFQAEDGIRDIGVTGVQTCALPISYNRTAMSRTPPPSQPDSPELLSEADYEERSEERRVGKECRSRWSPYHX\n>SRR5882757_10583142\nRINDAERRVERPAAREGQAVRPRMAGDAIPRDGEVAAPFHERGIRNPSPCAVGDSGIRCVREVGYDETGYDEAGYDETGAQAGGAIELHRGDGHGMTACQNMAPTPVPIFGGMPRARFSSTGSAVAESPRPRLPPARAVS\n>SRR3954468_7
113634\nLDGHPEAPTGERSACELNVDGCTWDAIAGELNRQEIRRPTASSWSLVNTSKIARRAALVLDIYSRRIVGFALGQHHDTALAYAAFAMAECVRGGAVDGVVLHTDGGSNTPHGPSRLTAPDLGQPVDGPARAGARQTPRSSPGTPPX\n>SRR4029077_1358176\nSRSRKVPRQRCLRRSPSTGKTRGWTCAVPSPTLQGMGMDTYERPAGAGMEATQGPPQVGAVDSLLAGVLRLSHLADSTGEPREIFHALASELFAELGVEEVHVHHHAEQEDMVVVYMFGGDGRLSYLAPLGERPHGVAWVAESGKHIVPHGTRELAAAVPRLAVGGRVGAALLLPLAVRGEVEAVVILARADGRGAIGVGGSTRAAGGAAQA\n>SRR5271154_6067984\nTMRVLKPGDRILVSTSLKRANCRSLGRQDILALMYFNNYLSRDIASAEQSARKGKSIKFGNSMPTQAISSSWLSWRICKLMGHLIPSSMVSLFINVSDRRRRWDLSCCESLSFQASRQRKRFTSPGDKRDDKYPEFRTEGTVCQAHRYYFNDGNYITYRKRSMAWKSVX\n>SRR5437763_77052\nAAFHAGWHVPQLVHDQRPVSRRYRAVFDSVVVIIAGHADHFPPHAGKILAYALADRLLRIMPQIARKFLRKDDVIPLGVSIRPRVIAPGDDPVSHRLEVARRDEFIPPQGRQLAFGGRLVLGEDRIVALPPVHRDGTGRGHLGDARNRGDLVQDFVVHLYDAIVALDCRVRNRYPQRLYVLRILEPGIDAP\n>A0A1J6JVT2_NICAT\nMGSLMDESKMERMGDESKEAILYVNGRALLVYDVSKRHTFERLSSWLEDILQQRDTTVIVVGNKYDAGEIIRTVSAEGGEEFAKSNGCLFMEASVKTAVNVVAAFDKTTERICEKMGYGDVEEVDEALEINMWNWKGFRIGKNTGVK\n>ERR1700728_2000873\nGTAPLFSASQAIGRLLPCEQAHGASAHPAEPFAPDEERTPGIRCSCGQFEVANHPRALAHQRCVGSGTGAAPAMTAQRESTVTDLLLLQLIRLKGLVDAAGLASSTDAPVEAIRSTCAAWAREGLVLETPRGVRLTATGRERLADLLEQERAGLDLRALQAVYDRFGEHNGKLKAAITAWQVRDATTPNDHS\n>SRR5262245_41074620\nGRDLVREDGRRGRGHAQLGRGARRGPVDSIRALAGARAHGVREPPVAVADRRALPPAELRPDGRLLGADRPGGRQPQESIHPLRRAAQSVPAARRGGWECFAMNDVNVAVPVLIEQSGLEHQGNGRAGAERLGKVAAPPNKESTSEFFHFWVEKGKLCERTQIVTTSSQLGGRTVEFVGLVEEVYRQSRQRDMGEEVDRFDADSAVTPPFASAGFTYAKVTILRTDPVTHAPPTEESTVYLGGEREAEKGYGVDRMGKPMRVGLLRNGGTPFAGPATIDLDYLLGENGGHLNVNGIAGLGAKTSFLLHVNALLLHEAERQITALGISHSGRLQVVPVIFNVKNYDLFFIDHWGKQWQKEKLTALPEWRDYLGINTPTPFRDVQFFAPEDEGGNPAKVGRTDEKVRGYSWSLSDIIEHRLFKFLFSEEDIYDANFGGLVGELEEELTDESSGAPRLNTQGGDTATFAKLLQWFRANRDTFTDSAPGTRGKLLRRLKYIVQEG\n>SRR5262249_55421997\nXDQCANIEIIENFLRSGYDILRHDCTVTGSNLCHKMTAVRCANNGASERHDPSRVLPIQNHVIARREQSLEPIAESNALPTELVGSEHDTAQHRIQSRAIATAGQNTNPWPHVIKTRSERLGRIDESTPSRPLIVQLPPFIHQSRALSESVSA\n>ERR1719460_1257335\nAMGLGYTKKNWDNQSGKEKYPASAMKYWSELTSCGCKNQQAAATKFGYTQLTWDNKSGKEQQPHSAYKETWSLLTDDEKAAAMVLGYSQTIWDDSSKQT
YPASAGKYWSQLITCAPPATAAGDAAGDANIVEDQQDQIGEDFIIGGVIALAIVLVVALVVTIAIVAAQSNKADEYSEESHNANVLDKKTDDDL\n>SRR5258705_15912\nPPFWRTWWFLISVIGAGIGIVLGVVWFLLSRQKNLFKQHALQAEQEILRLQNENLEKDICSKQAQLNASVLQSAHKNQFLEDLKANIQKIDSAETKSKSKELHRLTRSIDTELTQKNYWEQFQLTFNQVHQDFVHKLHQRHPHISATDSRLCCFIRMGF\n>SRR5665213_2795117\nQSRSSAASDVYKRQCPKPPAMFVSVLLVVAGLSSHAQQPVYPVTCILSNGDRLSGDLISISKFRLRLQHVTLGRLVLKRSSVAVCETTDSTTRVKLGDLALDTLPENSRTTVGVLPDVMPLPPGSVAPVVSLEHLMHPPKPTPLASRALPTYVSHVGWKRAIGMNYMLTRGNANVSNLGFTGSVARRADRSQVALSAKREFGSQDGNATENYFSATLRYDLALGPNDSAAKSRPSFFSEAVVEHDPFAQIGSRAVENTGVSVPLTRNKQNDIALEIGTGITHEAPTGVPSYTRFGGLLRLAARQIFGKAKSDQQLAIFPDLSGPHGHYRSNGDFNLSAPLISGVALKLGVADRYDTRPQARVRKNDVTVQSGIGIEFX\n>ERR1719443_2623778\nVHDFKRKRTMDKYVSDDSDRKPTPPLEAPRAEKGEVAAPQANAPASDTVAGVSVRGGFAGQRQLRDLKASQEKEGGGGTSKPRGEPLEEWTYSDYQNGEVLNPVNFDQQRDCGAWTAIALHAFQADISKKPIRVRENNQPQAVQKAKFSINGGPNDVINRDQDECMARNPFVSMYSDVRPNRVLRTRPPRTTLAVKKMGSVPAYTHRDAVTAKAIERSNARRTASKATYNEAAKTIQQIWRHYSDYLSSTKEWFLQCKMAAMQIQWTWRQYHVWRRQVDKLMTRVQAVARGFLVRRHIRKHFHIVRAQKICVGAHQRSKLKNMARCVRVIQRWGRGHLVRVKLRVFKGFLVQTVRVIQSYWRMRKANQEVALLQEEKQAQALLVKSAIHMQRLFRGWKGRQRVLVRQQEHAQAQLKAMMAVKCQGQMRGASCRSKVAKLRQAKLTRMNNAATYLRKMWLGYVQRKRHAEWKNFRVDQIPYIVTMQRIARGFLVRNRMWRAVEKEEREFYAVHKISRLWRGNRGREKWQRLKHSQLEREIAAACIQPVVRGWLARLSIRRGTDRTRYAHFELLKRRHLAALKILKQWKVMLPRIKISITLRKKQKAACTIIALCKGVRTRAMNALRLRQMCAILIQAHFRGALARARAEARFPRVREIRLAAVASQEICFPNRLKRKAFLIMCSGLSAPAWSTDLEVSKSKPAKTPEAKEAQLMLLEAVQRARAAGMGLIM\n>SRR3569832_936138\nAMTIRSSAARCGRTLAVMIALHVVPVLAAPADQAFRQGLSAYRSGDYGKAMKIWLPLAQKEDAAAQAGIGFMYHRGQGVALDDSKAAYWLRKAAEHGQPEGQLMLGSLYFYGTGVEKSYVKAYAWCDLAQDGGNADAQMCRDAALQSFKSEDDVKAAFRLSLELHQRFRRSRRAARYSCLFFLFFSVGFSVLPVI\n>SRR6185312_8416935\nTMWLLVRASHDERLRDSSLGWAVLTAGLAIGTKFSNGLVMLIFVPLVPWLYRRSIFSKGRLAIPWTLYGFPLTVFLPTILSWPWIWQDSGAHLGETFGHWNNYVVNELFLGRTAPAPIYYFLVAFCFTMPIGIAPLFVSGISQMFRPRAEALLRPLPPGSAFSARGWWVFLTIWLAVPFVWTFAGMRQDGIRYVYSAYGPFAILCGAGIVALGRGVAALWKNPRARYATAALTAVTACYLAVADVRTYPFX\n>SRR5919199_676836\nRKWRFNAEEVGKMRRIALEQAQLATTLFALFSIIRFSTGVGHPRQHLGIKSRLQLKTED
EGRELQEMSVIAICGEGRIAVSALRYTHHLLLASIPNIRLVACPNYSDRGYDTWYPSLSKAARAMGVDVVELDSLAAEQDLLLLSLEYRRIVKVDRFASKRLFNLHFSRLPKYRGVYMATWPILNGETEAGVTLHLMDEGIDSGPIVDQRSFALPSHITARGLYETYMDEAFELFKENFLRLIYGDYRLIEQDHSKATYYAKDSIDFAQHTKLDLSQPASRVERTVRGFYFPEYQLPTLENRPVRACHIIHGRSSEQPPGTEVCNTSIGAIYVAGDNSLVELVWAXX\n>SRR6185312_187726\nPRDVFPEHRSRRVAGYPEGVVVDTMRREEQPILMHAVMFEIFAVPLADIEEAVEAPQDAREDDRLGQADEHAAPCHELRVAAYEDGHPGAPARVRRLEIGPQTPARHDEGIEAAVGDLARDPGRIAAAKVLGRRPGCDVLEELAV\n>SRR6266851_1047964\nNCGLQVISSGGIASSTTVLSGGQEQVKTLGHALGTVLSSGGVQVVSAGGVANGTIVSNGGSVIASSGGTAGGTIVSNGGSVVASASGTASGALISSGGQEIILAGGIAKSAVLLSAGQELVSGGVASAATVSSGATLNVAAGGLVSGTQLSGGVTNISTGAVASRTTLFSGGVENVSSGGKTVSATISSGGVVNVLSGSHVGSSVIFNGGIENVLLGGVTGKARISSGGVQNMFGSTNNAIVFSGGLQNVFSGATVTATTVSLGGSTVVSSGGTVINTTIASGGTLELQGGALVSGTTTRVAGSIERIVSGYGLNNFTVQSGVTLQVGAAGAASGTIVSSGGAENVL\n>SRR6185312_1756791\nXMRAKPLCFSPASINGTSCCLSPEKLRATKVAPSVIASSTGSIGGWKLVSPFFALVPMSAEAENCPFVNPYTPLFSMMYSMFRLRRMAWQNCPSPIDRVSPSPETPMKLRLRFAALAPMAIDGMRPWTELNPWPPLTKYAVVFEEQPMPESFTTFCGSSDSSQAASTIAAVIESWPHPAHRVDSAPSYCRRVNPSAFLGREGWATLGFARNVMWTPAQRYAPAPWAVLGSALSSLRGRISWSTPSTMNEEEM\n>SRR3954471_24146024\nTGARRRRKPGPGGHRAVGVPAARAAAGLANRSDASTQGSPGMIQAQELLRRLADPGHDMVITPILDARQQIGAASVDLRLGPDIIVSRRATGTTAFDASDPQGFSRALQERQAYVRRRLGDTFHIQPGEFVIARTLEFVRLPPDLSAQALGRSSWGRLGLII\n>SRR5690606_23903138\nLEPSVITVESPEHKFLNKLMGVIEARMAESDFGVEELVMEMNMSRTVLYKKVQSITGFSVGDLVKNMRLKKAAMLFSQTSMNVSEVAYQVGFNDRKHFSREFRKFHELSPSEYIKKVKDESLNGSDL\n>SRR3569623_980461\nLVDLEVRRHKKKNTGQHHRMAAVVQGLRMPVEALHPLQFGLEFGALDRIAVRRIEAGHDHAFHRGFQVAALLVLWIAGQAAAAFDRFRSFRQDRHAVPRSLAVPETVVALRLDGRDGELLVRRLQFLQAGDVRRLALQPFEQVGEAGAYAVAVERGDAQGPGAFPGGFLYRGHRQCFFVAGLDSAGFSAGFAAGFAAGAAASLRRDSSSGRQAISRSWLGAISAPSAASGARVARAAAATPRISSGPLFTPTSGFDSVPRTCSGERSESRRRRLACGCTVRSSFSVPRSMLPSTVISASSVSMLNSRGVSTPSFATRSAAAQWMR\n>SRR5262249_45364707\nTVEVEQPALSDHLRAELAVGERGVGEFHVHPEVACRTVGEANNGNGAEIRDPMVAVARDARVDAVGLAADEPAEKIEVVDALTHEQAGLRVAVPRAGPDDRLRPRRGKEGPDPHLAGAADAPLVEEALGLLVDAAEALALDDHQLHPSGGTVS\n>SRR3990172_9952057\nRRGKEKRRRNARLIHAG
ILGICTSTASTIPRYSQSRAGKKRRCLPSGRGGWGTMSSEGVQTVMPVDASPIHLNPQAGKFESIKQTTPVCFHDPQTELGQLLLGLVRVRYRLPLKPELPCTAAAEALDQETLARGIFLPVHHPDRVEAMVSAVAGKILAAGLGSRLFLGLIAGLFRQLHGSGRSWIDNTVAVEVDIGPGDEETQWKGTGYPETTRVEHPPWHGGCGDIRGLQTLFSEIEEXX\n>SRR6185369_2406511\nFWASTNGGVDWTRYPAPDGSGQQFYPPYMDPYDPKHMLIAGHGSDLLAETTNGGMTWTKVTQAAGMAGGATAEVAFIDNGDPAATRKTWLWLATGTGGKIGTWRTTDGGVTWKHVESNEHVAGSTQVYQPDTKGVVFMAGVYSTQGAGVLRSTDYGQTWTHVGRNSPETIVFGTARSLYALYGVGLPADVGLEVSPVPGTGTWTTPGTPAAMKLGPAQAAILNDGQTSIILLAN\n>SRR5258706_8531874\nAMGFDLRSRNSQDRAGATNGNECDQGEPHAHATIETVQCRPPSNGRNVVSAQTQGAGPSLLRRGTRVLWRFISLHPLPFSAAVTGSVVYAITSVIGAGVLGRVTDRVITPSFSSHGHVRASTVWFYAFLIVLVALLRGCGVVSRR\n>SRR6266481_2504579\nTLRRGNDQNSRARQGRHPRRRYRQGLRAGPDLSRQPDAHHRLSLQRSDLSVLRGHDLRCSQDFSRAASESEIVLESLANQIQESMMQSSPLNLRRAIIWIGRLVLGGIFVYAGLSKLLMPNTHLWPMFVLRFSISMNISSFAQQVESYKLISPDASQVVAHTLPFVEIVLGLLLLIGWRLRIWATAITAIMVGFLAVVTRAYLLHMDINCGCFGTPEKLNGMTVVRDGAFTALALAMTIFAFIEAREPHPWSAPEKACAGLAAMKTLAEYLDLAAVAHGHLCAGQVLGVRLAMLGLRELGIDDPVSERKRIVTYVEIDRCVTDAVALVANCRLGKRALKFRDWGKVAATFVDLQTGRAVRVAAKESSKQAAREMFPELGKDAGQQKAYAQLSDEILFDKQRVKVEVQPEDLPGFKGPRVVCAQCGEGINFKREVVVKGRALCRSCAGEKYYETLSX\n>SRR6185312_10010982\nLLTGGSLNQDHIDILQNSMKPFGSNKDEDPPPDSTSLISSSNASHTELKSVSTIISAFKTLPKCVSLYAQHYISIDPANTDRLEPKFTNYGEYYKGTLDYIFYLGKSNNNNRDNIERETNEEIEMQVVKLLKMPREMDI\n>SRR5437899_3944324\nSDVCSSDLNISCGRDLRCCRPSGLSRIRFLYDGLALFWSCRRRGNIRRTGEIMRQQAHNRPERIAGHGSLQTLNPSKRNQRCPLGDPSQANLEFRFLRGPREDGRATKARGRKSVGGTPTWPAVGSRLPPRSVTRHVSLLAAQTTQWRRSDGX\n>ERR1712112_183966\nLMFDGIKDHPLNFGTLNYWVLREWASHCLGQDTREVGICPLGEKFAFVQALDPEGEHSLPSVHVCHRHTEQYPGYVGEVYMDGEVMDWETYQKRTGTLYPVQWSGYSFYLDDVGGSLQRVMVDHTVQYPTPSAYGMFASRALISGSGGDFSLGGVFPTVHVPTRPLDTSRDMGKVVYKKSPFSGDAAVLQELTENGYGFLVDKEEGFIYYSNSVAVAKGYPPVASALGWHKVPLRPLPSDWMVQLDQGQMAIGIAX\n>SRR5437660_607594\nRLGPPLPDSRRRRRSLLAPTGEGLDARLQPVRARLAPQAELDPRLLAPAEGLRPGRGAARGQVARALQPRGPPVVGRADVRARADPPAVPQAAGLSRQLGPGSLPDALPAVARNACLAPADAGVVPADRGARRALGARTPVVAAPGGGATARRGGRGRARSGGKERGARGVPGAATIAPGTGRSAHAHRLPVPDAVLRPPLGPARARPVALAHARASGPQAPPPTHAHALGGV
LALARRSPPGDRDDPGRGGNGHPPGRGLRPLGPGGPRRRFGVRAHPPRSRGAWRRQTALAPSLLAAPFGRRVADTALAHGALGCGRARGRGSGRRRARCPRRDRCRAFAARVLRSDR\n>SRR5581483_1442169\nRARAQPHPHAGRLCGDLCRAGHAARLPRPSRHLHGAHRAHRCHPARPQPGAHGHHAGLPQRGLQRHQRRRRALVAAVGPDRLVLRAGGGVGAPAETDGVDARQGAGLAARRAPPRARAATARCDRPLGLCRLRAGPGLRRGLAHHQAAPHRLRRVPRHRGHGARPPRPLSPGPAAPLRAASPRVASGILGIADLGHPRALPRFRHARAMARARQLLAVNKPATVAHPPGRRVAVPRTRKTLGWRVGSTPPAADVAADGERPPERGLDLMQQDATKAELAPMTGAARVRHLRQILLWPVQLLPIEGDLQYWEHLAKGTDPSPWREVDDEFGDPTEFQERHYNEFVTFLPPVQRFLYGQGVGKAVRRIYGESPIKTMRRTDVATARVTLSRGDKPVELRIVHTDLYFFFDIDIAILAMEIAADDLPLPVAQEAVFRFGRAYPAYX\n>ERR1712159_470442\nNGAPEQDRLLPDETDLLSKPLHIELAKVGAVEGDGPLVRIIKSFHQLNRSRFTTPTRTHERHGSTCLHLEAVSVADFGVGAAWVTEMHILKHDPALDAGQSFALVTMGIDHRLSVDHFENSLGSFTCLSHRCEPWGNATKTLCSNLQAKHRDQDVAAREVTCRCGETATVLTRAVSGVLKLLRVFDGTVEEAECAHDVPGGKHET\n>SRR3546814_65869\nYCVFFHSFLLLFSLRSLLMCSLVCWIYTFSLLLFFFFFKQKTAYEMRISDWSSDVCSSDLFAGFVVSTQSVSAPGVQFTGVVCDHCADDSDGTCDACQSLCLELPRAVRVRHAGVLIAAGVRDFFAAKPAARTVTVVHPAAGRIHGPRAGIRDRRRARAALAQRAQGVWRGGCAGRGRRCRDCDPPSVVAVIAPRPRSRLRPGAGVHAX\n>SRR4051794_20208749\nPGQYGVVGLARNVDSMHPKSGGAKGLNAKIRNTLLCASAILVLTTVARAQPADPIGDLLAQAQTTPAMPPSLRQTVAHPISSADQALFAQAMSAAKRGDVSGARNAIANLSDPIAKKTATWWLVDQNAESLSFWEVDAA\n>SRR6266852_3879948\nXMGRLNANQPRELALTVSKNLASYADGGPELGVRFHLFLSFLQRSRHVNENRYRSVFMSIRDRSIRRSGLLVRTAVRRPSSCTKARRVLPNSLAQNEFPIALDQGRTWX\n>SRR5215204_675534\nGEIAGFEEAAAAAPAALAAAPGAGDDMRLGVREGAEALHDDGRWGVLGEVGHGARSFWCGAGARNPPGAPGRVRLRCQRARVLFRPPGEGRWDAGGPAGLGLNAGHDRRPTRFLPGFPVPGPGFHDRLDPTSRALRPRRIGENSAPSGQRGRPVVAGEWCSWG\n>F2U329_SALR5\nMMMGVAPVIACCLVLSLLALGAVAQDVDVTVYPGRLFRADLSLQFGAAASVEAIATLTGNPAPPAWLRVNLLPIIYGQVPDDIAGDRFSAAILLRINDQPVTRTLNLMVDRTQGLPRVAFEVHATNANETQLVGDRYDDLETAVGITRARLSADTGQVGSGVLFVRSVAPFETDRRNINPMTSNPPLPVNNAYINGTAWLTLGSKLSDSQLTCAELEATAGSLFAAQGLQLDFDLCTPFPISTNATIDRSRVLATVEMRTWARTKDDFNETIIPASVIAAFIFFPFALIFIIHYFARSSDEAIEQQMHRLVKNMLRRNRAHTLRVISDDNTIAAAWLANSEEEEVVPPRLSTVSKPSNTSLPTSEHSRNLRYRTHTRPPTYRPPPQHDF\n>SRR5919199_6745454\nRVPKTTDGESHKEEETHSSLDFPSRLCYPGNIITCRMGQNLLNYTTEIPVE
KTITEIQQVLVKAHATSILTEYDNGAIKAIMFKIRGKNGQELPFRLPAKVDEAYQVMYGNRQQWEVRRYGEKWQQHARRTAWRILLTWVKAQLALIELELAKPEEVFLPYLLVKGNKTLFEDVQDKQFLLGSGTEEX\n>ERR1700761_7736419\nGQRFDSAQLHQPSLAMRAKAAAAQPAQQAKTGCRQVRKPARSALQHPRFSALGALPMLFPVIDSLLYVFNTVLGIYEFVVILAILVTWLIPAGVISMRNDVVRSIVNALDALTDPVLRRIRRVIPPIGGVDLSAIALLIALEVIKRLVNGYAPLLYTVX\n>ERR1719296_360158\nTHRTGPLADCVAWPSREGQPQALLRRAAARQPTALRAGTRSRACSLAEAESFSTGATCEAAARVAATEGAGAIVLLCRRRRRRRRRRCGPRGGEHAADVDGNLGCLLLVAPKLGNVLVAEDVQRTFLELAPIVLFKCD\n>SRR5262245_40312332\nAGRRDRTFCSGERPAAARLRLPAAGRGAQFLYGQAGGGKMPFNVWGRVKNMTRETKLGLVVSCSFLCLLGVVLGLKMTEPPEEDQGAEVAATEPAEGPPAPPTGAQPDTQPRPAKAADKSAPPAKADTAPPPLPPNVNNAIELTAGTAGQKKAAPG\n>SRR5579871_2118101\nESTQDPGMSDLELPPEVTLRAAPLLGDRRKVEQDRPLEEVRPARELVDAVQEHGALRVEDRLGVVRVELPRREASSGGQPAERIGDPRLEPAQVVEGKTPRVLRGDREIPLLPRQATERGGRGVHTRPEETRRRALGAALLADQDYDLVRTTRSKGRNEPANEEDEVVVAGDVDEPTKLLNGTTASRAGERTHSSGPTEPYERHSHDPPPLLRHLHAGPRVVSEVEVDRSFVLGEADVDLALRTAERGFALEHSRRVHDGLTPGRLLRPVEVKLREEPPELLRAEGPRLAMTAASDRGVTDAVGVVEEFDTSLASELDELRRNGPAVLLLVVVGGTRAAPRRLDPLGSLLPRAELRGEELEERLLEAARPLGRAP\n>SRR5256886_992629\nMFAQLSYAQAPNGTIPATFFGMTFSGGNAPSEYAAQPAAITSSMGTMGKESAAEWSYIEQNAPTGSGCPGTTNCTHTYNWTVLDGYVNTAFNHGLPFMFFFTEAPPWATNSVGCRSIAPGQACRGPIVSGHTADQQAFVTALVTRYGSKIGSYELGNEEDYQGTWAQYAAQSDLYVKAIKAVSPSALIVGMGWDHPDGHYAQGGDFDQFWSAWGAIPNNSRHLDVVSFHGYPHTFCAPSCVVPEIVISNNGLGTQGSGDCATTGFAKCAQNAIARNGVTTFTGGTPLLRDTEGSWGTTNYTIPAPAFISRMLLLNWAAGVSEHQWSYPDGGSVYGQLDGITANISAYQQTYNWMAGSTMTSPCAIQSGTVWTCGLTESSGKSALAVWNTAGASSYTITAGAYPDYKGLSGNTTTIASGVTSINIGAQPILLERNGSHAPRAP\n>SRR5688500_8464034\nAVELDPGSRVLLMAVDRWVQLGAKDKARRTLLNAPSSTWENVPRTQGAEALLNMGESKAAAALLRGAPDSEQEPAAKLALARVLTANGEFKSARELYLIALTKSPYVALETRIEYFEFERLHGSARDALAAYDKLRGEGFAADSLARHRLSLFVSRPGLAWAWRDALGVLTLLGVTLAFCIMPLLIIVPVHYRGLALRASGRAPAREGTSWTLLDAWYASGVFLLVGFVCSYVFALPYLE\n>SRR5215218_300340\nSPATSPRDSGAARWQQRSSSAAAFPLAPRNSTTGSPKNVRPTGAWVRSFDQLAAYQPFFGNCTRLLRGFGQRYLCFRSQGTNRFCTIRNLGLAAAFSKWGRAAGSREAFMPAYRLRDVAVLVGAVVVGAAAGFNGGWFAAVPPKVVTVDAPNKLATGTADTRTPATAPAPAPQAPPPIQGTAAPVTPAPPAAPA
EATPQSDARNVRVIRPVEQANEISATARQ\n>SRR4051794_31039054\nPGCAGSPRPVHRRDDPSAVAAGPEEAEGVSRVRPVGRGARAPRGGWRKERRRLTLGATGVHAMVHQVRYSVWVALGWIGVYMMLWVALAMVPVLGLFLEKKSPWGWAALGVFLVCWVAHSRQYWRRLFDRTPQIEL\n>SRR5688572_28435885\nGALLPIYFFYDSAPSFLTLLLDTNGAMLGSILIFIGLRKLAKLLDIQTHFASPAVLASTLLVFLLLGLLFPENGSVSKNAVVQFIAQVGPIVDALRYGFSASLVWVIRKNANRTYSWALGWFFVALLSNALNTALIALDPLLMMTGLPVELLSMPFILNTFIFAIAGAAFYKMAHAAPKPTQDAGVLEVVMFTASLTSKPSDVDPILDPVRKITARHQAGDFTPQEIATLSGVYTKLEDYLVTQEPLRRVTREHLQAMIKERFDWSPSAAX\n>SRR5450759_1044538\nSCATATTTEWPVASRNVTRPAMKSAETTLPNPSGVRATPWMWLITVSWLGSSTSVVGIPSRLRELGATDPATPAPKYDRTSSSPRHASRPYHGEKWRPRFAVQMRVEGRMDESFRANQRKPLVVNVAAVQAGVGAGSLKTIKPSVYPRPVGYDEX\n>ERR1043165_7129941\nRRPAGGIVPWLARAGDQTAFAGGALGTETHIFRPGKVLHRLEGVSTSSFDASPEQLRAAAQKAHAALDPSRPRFLYVHVMWMHRPLWNHPAYHEALPELDVALGALHAEIGPEALWIVTADHGEEYGEHGGSFHANTLFDE\n>SRR5258708_5362479\nGRAKLRRAQGHALCPLAAQRRQPAHAALVALPAGGDSFARPQRLALAQLVEPRRGGALRNQNSLRPFVEAGIALVVLAQRAAVEPQGAARQPRQERAVVADQQQPGAVRCQPLFQPFDGGDVEVVGRLVEQQDVGIAGQRTGEADPPSLAAGQRRQRLAGTDPDLVQRRFDQMPVDKPPAHIFGGREIRIERRQLRRVGDPRAWLPEHRPGLQLDLAGQRLEQGRLAGAVAPDQAYPVAEPERYRDAGEDRPPVELNAGIAQSNKRRRGHDDAAAGSTRVGESPAGSTTYNSIASCPRRCPSVLGKFRTQLTAHAALPLTLWRDWSWXX\n>SRR5665811_2613661\nRSTRVRSSAASDVYKRQPICRSAARVRRSSDFCHLLTRAIRTKSVGSSMKVQAMAPPVTWSVSGEACQLYIGCLLYTSDAADDLTRVDLGGRRIIKKKKKKKKINKYL\n>SRR5256885_2171212\nVRGRRRNGAGVTGGTRTGAKARALEPLGAKVAASPGEAAAGAERVHMTLPDDVVVDRIVDDVRRHLGKDAIVVDHSTTSPRGAAARIPRLNAAGVRFLHAPVFMSPQMARDGVGIILVSGPRAVFDDVKPALETMTGDVWYIGEEPDRAAAYKIFGNSMLFVIAAGVADVFAMAKGLGIAPADALAVFSKFQPGGVIAGRPPNPSAPANFVSRRARVIALAHARVIDGTGAPPREDQTLVIRDGRIADLGDAAAVAPPPGAAIVDLAGKSVVPGLVMMHEHLYYTTGPGVYGQLGVSFSRLYLAGGVTTMRTAGNLNGIMDINIARRIAAGEMRSEEHTSELQSPCNLVCR\n>SRR5437016_5746367\nCLSPAYHPVRSTAFRMAIRGKAQLDTRVSVEDNPPRLSSRTICLTQVSNLLGKSSSSAARKKEVGMRRALVCILPFCVIAFSAFAQDAVKVDPQHYKVEFENDQVRVLRIHYGPHEKSIMHAHPNAVAVFLTANRSKFTLPDGKSEERSWKVGDARWTPAETPARKPDGSAARSSFGRAKKVAGFKNTHARSREX\n>SRR6266481_1587377\nRRKPRRPIGRSASGQAAEVRDIRPSVDMPVSGAKAASGNLLFSPSVTSLARLAIESGCELHRNRSIGGNLSHQVYL
TRAVVAGDAAGVDLRRQATGLRRWQAAWTQGPQYCHRSRRWKTSQGSX\n>SRR6185369_7209777\nIVLGDTACPSSSCGRVNAQRGRTTMDLPSKTVFEVLLNNGVDTLHHANSVITSCQFLRQKSLLSRGSAERSGLKQTSQSSDATDLRYSLWYDVFMDSVDIHRRARKQNHYGPVLFLLDVEKLAATRTGRIWVTKLNPTKWAGVPVEDRWFRSKKELVTGFRRGTFDQMIVFRHSGGALPLADCLDEIILDDPDLKVDGYDLCSTAHGALTLAMSDFGLQVPITKRRCAPTCTCGHYYGSTNADIKDGVVKMFFPYQ\n>ERR1719183_2396889\nLVVGTGPRRPASRRKAGRMSALARHDDGAGRETAHSLAKDGGCPPAAPYSATTHEGGTAVDVVQYGADAPPGLTRPIGDPRPVSVSSGSAQQRSGPSLQSRAGTGASSLDSRSSRSSSSSSSTASGWSSVSSSSSGSWPDDEYPPPPPPPPR\n>SRR5438045_3528744\nPGAVAHEVAVAAANVGQAEREDPVQHPEGPLAVQSIEVDDDLGIARGVKLQSRGAALFAQPAIVVDLAVEDDAGAAVDVPKRLRAGGAEIDDAQPAVAEDGVASSCDAVAVRAAMREGRVHRIDPRANVAARLEHAMDAAHSVESDPLGDLVXX\n>ERR1700691_2800241\nHAIVVGIGDIVERAVGIESFDLAVGFLEDECTAGLLGEDAVVAGLGEVVAASAIGLEDTLFTVGHVNRDGPVGRDREEILPVVGPAVSQRSERVAGADRVKKRPREVQRYAARYS\n>SRR3989338_1552555\nGWDERGDDYKTFFFVRIAKQSEQRKIFIKEQKVFLTMEEYMLSNSTAQGKQELLAPLLHQNSDDTLFIRAFEERVARTIKTFGLLDGKKNIVVAASGGKDSTAVLYILSKLGYPVTALSIDTHIGCYTEQNKRNVITFCKTHNIPLLLKDFNTEFG\n>SRR5215470_13194424\nTHVRCGEPLHLATEQSRGAAGEQAAGLTPCPARGWMGEACGGTPSFRRPGPRADEHACKVMGLSLVHQGEVPTRITLGTAPGKITCWYSGGTLAGRTDPGRRERGCPALATNFGQLMTPRPFRSVCKSGLA\n>SRR6267378_3904149\nVLRLLNRLHELKLSDEELAKVGAAVGSDVPFFVYGGTALVEGRGERVRPLSVVAETWLVVIAPSIDVPGKTARAYGSLTVEDFADGDHTKQMVACVDKRKNVPAAFLYNSFDSTKLGISLATRVYAGL\n>Dee2metaT_26_FD_contig_111_7158_length_345_multi_4_in_0_out_0_2\nMDTSKLKSNLNINMRLINLDNIGEISRKNIRKFISTIYGFKATTKDLKKIAIDMGLDIGKRKDTQKTRTYKFFGEMYNDDIEKKKNISQQLDKQIKILEKKRGKTYTALDLNKDLLTKRPFKNMFKSSKSKRKPFSVNLISRVVSNVKLSTNFNNYWQFRNWLENEEKWNGMEMNSGETIIKIGNEEAEVWDLFNMTINFIEGGKTWGENKKTITRNIKFLNYECKVLDPATSHVGDNNCGIRVLSKLLDIKLNPKSIRKEINSPAGTLINTEQLNYIYKKNNGRKNLIIIDENYEGEFNLKDTDYVLYKDNHYTAIIEAKRQNHKETGKKKQKGKLAFDIETRHTEEIIMVGETKSKVLKSTILSMVYKCVRGKKMKKTFTTDNNKNCCVKFLDWLGHEANNGRYYNCVAHNGSRFDFYLLMSYFTEEDLLDSKTQLRGTSIIGLQYKSHTFKDSCCFLTDNLNNLCNGYLITPEEKAFSKLTNIKIGDKTITNHQLCFYKPELNFNEFMELETKEPEFWTEYVKYCEYDCESLFLVWEKFKFQIDTIIGKMGEWLKKSVSLNTCNTIGSLSKKLIDANNGVKSKKQPTKEMQIIRNKYKNGNKWKYGVCKADYNEEVKKLKESGNELY
EVGGITGKPNFRKYCEFMSNDEEKYEFIKNFKRGGISHSNQKGYHKEGVCGFDIKSQYPTALMNMKIPVGKSRWVENYEPTAYGFYLINNIKWCSNVKLFKPVANKKDDGILDWATNKFNELYCDSYMIKYLKENCGLVNFNVIKGLVSNEEMISNKLFGTYVDTLYKEKAHQDYLKDSNQEYNKPYREAIKLLMNSLTGKLVEDPSRYFKLEFKSNDEKTQSINNVKINKTDANKGINYWVVAGVMVYSYSKRLLWEYINCLPNKADDVIHIETDGIYFGLPNKDAFIKNLKEKNDPIIRIGRELGNVEQEICTKEESFFIGKKDYMIGEPILNNDKSINYNKSKIRNKGIPKTTINDEGNKIDLLNKQFYIDRYNGKTCYKTFKTIGKALYDTKHHSGITLTGYDMVRKSTPHDFKNFKMYEEKDGKVIIKDWKKY\n>GraSoiStandDraft_4_1057263.scaffolds.fasta_scaffold10840448_1\nDNNEAFTLTATPAGGQAATGTGTIKDDGTGDIYKADGTTDTSAVKNDDRVVAVTSPTVNEASPYAVFTVTGTAGQTVSLGLTAGTATGGGTDFGSATATTNLQYSIDGGANWLDYSTTGAFALPAGGSVLVRTPINNDATPDNNEAFTLTATPAGGQAATGTGTIKDDGTGDIYKADGTKDTSAVKDDDRGLTVTSPTVNEASPYAVFTVTGVSGQKLTLALGNTSTVSDKDAQLGTDTGNAGTGVPLQVYDPSAAAGAGAWVDYTPASLATIPSGGVLLVRTRIANDSILEGAETFTLVATNTGGTSAEGICTIRDDGQGSIYPDNKTGADDPAAVKDDDREPIAVDDTYTVAEGGTITGNINANDTDPDGKTLVGSSVAVVNGSTFTSLTDSAHPIYTAADGYKQLTLATGTLYVKSSGQFAYVHNGGETPADSFTYKVSDGSELSVAAAKVSLAVTAVNDPPVPGKLPGGANDPAYNASAGRYEISTPEDTPISGRASASDVDGGPLTYALTNQPAKGTVVVNPDGSYTYTPAPDFNGTDSFAITVSDGKGGTAVITVFVTVTPVNDPPVPGKLPDGAADPNFNPAAGRYQTTTPENTPVSGRVRAYDVDGDPLTFAKASDPQNGTVTVNPDGTYTYTPKPGFNGNDSFTVTVSDGKGGTATITVAVTVTPVNDAPQGGKLPSGAADPNFNPTAGRYEISTGQDKPVSGRVSAFDPDGDRLTYTAKTAPANGSVVVNPDGSYTYTPAPGFNGEDRFVVLASDGNGGVVEILVVVRVSAAPVNTVPNGPMKFRGEPARVVGPDGSVFRVADADSSELTVELSCGHGLLSLPVRTGLQIVKGTGSNDTVVAFRGTKESINAALAQLVYQPITGYFGLDTITITSVDERGNSDRDQIDPPFTVELVTLGGNDANASVASLAAQGKTVVGSAVTSFDSTLIKGAQVVGDGPVGRLAIGTPLRQDGSVQETTVKVELAYADGSKETFDVRVTIYNPKLELITQLRLNPQTSLYEQRVQVTNTTPFVIDSFRVIVPTLPAGVSLYSRSTTTSDGRAAIEDQRPLQANEARVFIVEYFAPNVQRFTEPVLALEINTSGGVSTPIGTNSPVDRVVVGANNRTYVEFATQSGRTYFVQYRDGANGAWQTSPVAVNGTGTTIHWLDEGMPKTLTPPTAAREYRLLVTSGIATPLLITTQPQSTQVASGGATTLRVAMGAGGPYTYQWFRDGVAVSAATGASLAISDATLASEGDYHVVVSDGRSSIQSQTATVSLASNNPGRIVNLSVRAQLEASGTPLITGFVMEGAGSRPILVRAVGDTLANFGVQTAVRDTALKLYRGQSVLSENDDWTRDSEAAQTRSASANVGAFALAETAKDAALVRRLLAEPYTIHVDNRTTQEGIVLVEMYDALGAYDSGNRIANVSARARVSSGDGVLIAGLVVGGNTTCRLLARVVGPTLSSLGVTGTLADPTLELYAAGGSTPIATNDDWGTVQGAVLGERL
FRRVGAFDLPLGSRDSVIVTRIQPGAYTLVAQGKGGAQGQALIEIYLIDX\n>SRR5450759_2854005\nHSVTNDLPEKRYILDERGAVIDQSAQSLSLPPPILTRSAPLLDSGSVVGRFVTSRSLVPLLQDTALVALFGLVLALAVYFSLSVLPLRALKRTLGALVQERERLRAIVDNAVEGIITFDPQGKLQSSNPAAGRMFDYSAAELVGRSAGDLLPEIDMANTDPAGRQAHLGTQETVGRRKDGTRFPIELAISQAIL\n>SRR5919197_598751\nAANPGLHGILFDTAEGVGDARDVLPERAEIVTGDFFEHVPGGDAHMIKSVIHDWDDEHSITILRRVREAMQPHGKLFLVEPVLPDDHEGLARSKVTLMSDLNMLIMLGGRERTEGEFRALLTAAGLRLGDVTPAPPGSFSVLTAGAGITKGRAGGLRRGPPRPVLPAALRRRARLARGLAGRPGRLX\n>SRR3712207_1410375\nXMNCKKILISSLLISFISCNLSTDFEPITQEEKSNYLGTRSQQSLVIFEDDFEQTGRIPDTTKWSLCPRIEPAWGKHLSESYDQAFVENGNLVLLAEKKEGEYKAGGIQTLGKFDFQYGKVEVCARFTKTAQGGWPAIWMMPSIHRYAGSSWPACGEIDIMEQLNHQSIVHQTIHSHYKNTLHFYLPVPAMISSYKRDEYNVYGLEWTPDYLIFSINGQSKLKYPNMHFASEPSKKQWPFNAPFYLILNYALGGPDTWPGEIKDADLPAKMEIDWVRIYSHTLSEHHITSGDTYNILTALNAKSAVDVAGAGTTDGTSVILWHGNSAVNQKWIVTELDNGYYRLSPVYVPDQALSAPLDSSATNQQLEIRTYKGELSQQWKIKSVGNGFFTLSPASSPEMSMDVIGEETEDGTSIALWKTTEKINQRFMFKKTRXX\n>SRR6056297_976187\nDDVGKIGIPDAILLKPGRLDDDEFDTMREHVDVGVRLLAQGQSELMVLAEKVALTHHERWDGSGYPRGLSGDEIPLVGQIVAIADVFDTLINARPYKPAWKLETAIAEIRRKSGRWFSPRIVEAFMTVLADQPELLARLERESWEDAQNGRLLGTVVAERRKRRHLAVLEAELPQARPRGGRDLGRRQDAADRRPRRLAHPPHVAVELMDGVVAGSAPLELDDHQTPLAVASVQIDPAHADGKLDLEQDEAVLDQLGTPGQRPLHLGLAAVQEQAALVAWSQRQSERGVEERHANQLGGRGSLRDQHGPSRLLDQLHRVDPRLPVQRLDAARRVHLQAAVRLEQQQVVAGVGGAGRPPVVDDLHLAADLEPAARLRELLAQEREQLAGAWLEQLRCDHGPDGTTGPGRHPRPVPCRHGTAWSARIGIRRRREGGGASRRPPLRRLPDLRQEPQPLVRAAEVRGGRRDVPRAAWYRRSTGGGARGLPDQPREPQAGGGPEVARGRSEEHTSELQSLRRISYAVFCLKKKKKKKKKQKKKIKIKQKKTHQQKKRK\n>C1N8J1_MICPC\nMHAVASTPCAAAAAARGRGRRRRPEDAARGGGGGGGCENASSWSSSCRRWEVAPSPRRLLATPRRATPRLRALRGDEWKAIAPPGFTPSALNLSYDEHEADALFERVTEVMDEVDVDAQSAPGGGVKLTASQKRALDAFWLSCGVASASHRASLVREGGKRGLFRDPRRVVERVTELEDSLWRAVGISEIDVGLCVGRFPKVLFFEPDFLIERLRLLRDLLPNVNLRKVIERNPQVLGMDMTCTLPAKMRELSVLLPHVDVIHLIETHPKILSTNVSGNVAGNLRQLKRLMSEVGVEDIGVEMMVTRAPRLLTSDVDGTVRERMRAIERASPGTFRRYADKPASAARMLCASEKVIDRIAFLHETVEEGERGSEIAAVNAPAGTFSKKHPGFEAWQRERSKARERERSADTGAL\n>SRR6202050_3633006\nFFYGYGDHQELHSFPTRRSSDLGRRQHSHHGYRPAI
KGQRSSHNVRVRPEKRKSTRLNSSHGSISYAGFCLKKKNHHSHSGVLVQSDLLARDTCHAPNACSFSMPKENGPSVVCARSMSQSSGGPRHRHGSPRPRSSFFPDG\n>SRR5882724_974133\nICIGFGLNIDDSGPATPNTNTLTVQLDGVTIISNGTNVSSGTATVTRIGASTAISYSQSALLASLSSHTVHVTFSGTGFSGTIDETRNFTVAFYPTLPVSVRTPVGSGSQPGFRVKVWQINNAFSFVNGWLNRIVFDEQQLAGLISTNTADLTSFTNNGSFYESSTINYSLTLASGFIQPDAALPGVPGSLTVNDDVVYEMLSFVEFPTNGLYTMGVASDDGFKITVGDRTGPDVGLKVLAPASVAGRYFGVPTASDYGDAFGAALPKTPLVARAVLCDLPWPPSLPNNAAALSNNIALLHRDPSGGVAVHGIWAKQAGAVAVVLVDQDDQGATVDQRGAGRLPGNWGGSIAGFTIPVVMMDYALGTNIFALATSNTSSPVIMSIGDDSSYELAEFNGGRGDGTPTVFNVNVPQAGVYPLRLVYENGGGGAAVELWTVSGGTTISSMIRVVWLRRIERAPSRLDQP\n>SRR5882757_10675725\nXMTISDMSSRQAACAFSVPVSERDQLLGKRTPLKATIDFHPTIVREEQQLTSRLCSDQRVPIRLKGKLYNFGQLVSLVRLELMSRRVIQSAILAICGSPPSVEAPSLIRRGAFIPAVAADAEQEMQVCLGKNDAGADGEVVWSCLDADVESVEARPARPGAGE\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/mgy_clusters__subsampled_1000.fa",
    "content": ">MGYP001379502932 FL=0\nKNNVKKNNANKNNVKKNNVENIIKQEDDSESNEKLMFKISDDISNDISEIYSYNVDKSKKVYKTYNFYILILVLFILFFIYINEDSSILPFSYTPTPSPEFLNSSTEF\n>MGYP001093304395 FL=0\nMGVPVGVGVSVEVGVPVGVGVPVEVGVSVEVGVPVEVGVPVEVGVEVGMEVEVGMEVEVGMGVEVEVEVEVGVEVEVGVEVEVGVEVEVGVGVEVEVGVGVEVEV\n>MGYP000080920170 FL=0\nMPVLSGLKPESVFSYFEKLCAVPHGSGNTQIISDLCVSFARELGLKCRQEDCGNVVIWKDGSTGYENAAPIILQGHIDMVCAKTDDCTKDMTREGSGRLAGRKWSGQSNPRRTPPFVRRAARSPYAYRRRRTR\n>MGYP003331872083 FL=0\nLDYEYVATVFDLNASKWNAVLMEEYLQWIIDIFSDTHPDVPNFLFFFAIFLRDIHIDPIKSEHELILNQIEALQQQFPNKVTTIKRLKPIPIPILEDWIRDLGEQNQAVIEDTIKEIVASLPKEKREQYQNENQNLMLYIGSFEFVRNFS\n>MGYP001589871100 FL=0\nREVKRAVYEALKVLSGSGSPEELLNSVIKGTKSVVGLKVNVYFGEPNNATHPAVAYALAELINKIGVNRNNIIIWDRAEDELNKANYQTNKSAKDVRCLATLTHRNPRFAKPFIGYEDSPITIGKAQVRLSKLVNMSNVIINMPVLRTYKFKDNTGISNAITNMYHVVDIAEADMPFFYDNECNPGAAEIYNIPAIKTRTGLTVCDAIYPLYNGGPGDDQRYHWRANAVIASLDPVALDTVAQNIIQKYRDKVMPGEQPLKSAYLETCAKAPYLLGASDIKQIDVIEREI\n>MGYP000312263992 FL=0\nFSPFFNKNKKLQSLCDLLLKYAPDFDHKQLSRPVLHQKIFKTKTYKVTQINNLISDLLKMLYAYLAFVNYEAKPALGKDLLLEELLHKDIHQDVERVSRAFEKIQQHTPFENYDFHLNEYQRYDKLDRFFFTKGIRTYDENLQLKNDHLDLYYFINKFRIACDMASRNIVTNAQYQCNFLKDLLKHFESKHELLDQIPALQIYYKILRMIQEHEVEAHYQEI\n>MGYP001087948731 FL=0\nMSRAADPLLFGTAGVPDTTPQTSTLAAVKRVRELGLDCLEIEFVRGVRIMPDSAAKIRERAAALGVALSAHAPYYVNLNSPEPGKRMQSQDHLLRSARMAAACGARTVVFHAGYYGADSPEKAMSAIRAELSQVISILRSERNPVRMRIETMGKPSQFGTLDEVFEAITLIQTRKMPPIPIVLFGRDYWEKAINFQ\n>MGYP000560073095 FL=0\nRRSKGGSDFFQCLAQGPTQGQAKPRSDLGFRSRQSSVVMVTVAAVGVADNLATWLQGSDAAVPQGVDGATQTTRLGRADGRIGAQTSYELALRMWRAYQPWPGVWVEIPGVADRLILSGVSAVEGGALVAPGVLELRDDTLLLGLAGGTVRLDRVTPAGGKSMTGGEFARGRQGELAARGRIAE\n>MGYP000244154749 FL=0\nSIVFNVGSKSTFMQRDYKLDVSWLWNVYVLVICPILGHPLFPLISNRISKSILFLQNAISSALIALHSCVFAIANIFTCATPYKVTPLHIKKSSLKC\n>MGYP001210306911 
FL=0\nDFRPTYNEEDEEPVVLPVRFPNFLVNGSEGIAVGMATSTPPHSLSEVIDALLALLDDADISNEALMRILPGPDFPTGGIIVNRDDLPAIYETGQGRIRIRGKVETEKGRNGHINLVITEIPYTMVGAGIGKFLSDVAALAENKVTNDIIDITNQSSKEGIRIVIELRKDTDVENFKNLLYKKTRLEDTFGVNMLALVEGEPRLLPLKRALQIFIDHRVVVITRRTRFELEKAKHRAHILEGLLIALNNLDEVIKTIRSSADADIAKTNLIHRFKLTEIQAQAILDMQLRRLAQLEREKIENEYKELMDRIAYLEDLLAHPKKILGLIQE\n>MGYP001762835755 FL=0\nQRRAGRGEEGGGAARGREPIGETQAEVAMRNQLRTAVDRAEHDAGVVDLYGQRPAANQKARKDMNLLDVGRYTLAGNRLW\n>MGYP001516588361 FL=0\nQMCIRDRINSTQEFAIFAESRNLNRNQNENGIDE\n>MGYP001111298869 FL=1\nMITELRIADLGVINDANFVPGVFPQAR\n>MGYP000402828031 FL=0\nEHILEYQNQFYYVGGKVPEKECVDKTENENYYLLTLAALAQEMRFRGLTDASVKMGAALPPRRFQQQKESFKKYLLKTKELHFRYEGGTLSCVVGKCVCFYAGACGDPYAFRSGSPVIAF\n>MGYP001006094493 FL=0\nAVIPATDLTKSPEEAAKPEAGNDINTPADKAVVKDPAKLTDAEKKAIEDKVKAVNPGATVAVDDKGNATVTTPEGKTAVIPATDLVKSPEEATKPNAGNDIVKPADKTVAANPEKLTDAEKKAIEDKVKEVNPGATVVVDDKGNATVTTPEGKTAVIPASDLTKSEKDVNDGKAKDNAVTPAAKTKVANPEKLTDAEKKAIADKVKAANPGAEVVVDDKGNATVVKDGNVSVIPSTDLVKVQDDATKPNGGNDANTPAAKTVVKDPANLTDEEKAKVKKAVEAV\n>MGYP003389908322 FL=0\nVSTDISSRYDAFLFIDETHALHPLHMQTIKDEDLPETFPTGL\n>MGYP000520683910 FL=1\nMVGRNGGMRSGDSLAIVERKKMSASQRNKGQRGERELFGILSDLLGTCVRRNVDQARNGGADGLDVPGWAIECKRVESGFREAWWVQAVNQSVDTDRKPALVYRASRQPWRVRMFLHDCNPGMYCSHAWVEMNLETFAFVVRESLETETT\n>MGYP000427244613 FL=0\nVDIFKISNVLNIGDIIHGDLDTKTITLPSLIVNDGINVIVPSNGVNKNIIGSDASGLTNLSFDKVEKKKLSFEDYGFVIDPANRLGIIEETVNTGNDNRQVTYLGNSAVDTGSIWGVAKTSNDGALWESVIAATQAGNIGIDKNNPESKLDVNGDIRFQTVNPITRLANGSSPTHVTLLRNLLTNEIEHYENTEWFTYRNVDIINGASANSVQSRIVNGRVQLRIFNLSNFTANQRFLILGPTFRPSNPMHAGALFPNNPADTSSFVNIQVRNNGSLFIDKDSAGLVYGGIITYDLW\n>MGYP003153183859 FL=1\nMKHPIKVSPVSRKPVLRKKVKVGDIVTCKWGSPFGVVVKVLAADQWRIVEACRVRWIDDPHGLGEEFSADLKVISRG\n>MGYP001561007815 FL=0\nIEKNTITVSKKINKDELPNGKIEITLKNINWINRKPNIGESLEARSRYRQTLEKIKIKDEKTIIFEKPQYTLSSGQSLVIYDGDICLGGGIIS\n>MGYP001231096471 FL=0\nLKILLLGGDTGESEGGAVAKEDFGKVSGDDCPVSCPDDSLWGVFAGTAAPEIHSGNENGRPFVLGLVDRVIPGFSIGGITDIPEEMLAETVKGDAPHVAGGDDAVRVDIVPHHGDGSARHLLDGNQRHFRQRPGGRR\n>MGYP001181966303 
FL=1\nNTLTNYNSFYADEMNTTNRVENAFVQNAGSSSETSNNGLSSFHGGATDLPDMKFNKERNYDGGGTFLPTYDNGGMTTEHGMAMLQKGETVIPKTQNMLSGGGGITLNIGGDIVTNDAEDFAQRIADVLPEALRRQDDMGGI\n>MGYP001558603255 FL=0\nMLCDNCKERDAVINLTQVEHDSKVTLHLCEQCAQQKGVETGETVLKSPLGGFLTALGKGGGGAALLPTPTDGLRCAACGATLRDFRDSGRLGCDQCYVTFDFHLRDLLRRLHGSSQHVGERYELPGVDDADPKGRLLELRAQL\n>MGYP000721412648 FL=0\nVSMGSDGAVLLDENGYSYKINALNTKDAINTVGAGDSMIAGFIAGYKLSSKYEEALDMGIAAATATTASMFLGKKEKIYNIYNDIKDARLSKKGECIDW\n>MGYP001793408712 FL=0\nMQEKDIQEKDIQNYIKKIILDEKTLDKKPEILVSYPEKTDEKGHITVICGKNHSGKSYVLKKISEALTKTEERKKYNKDEGILQCAETNLKVEFSSLGDDLPEVGKILSIGDSTSTKRIYEQINSITFKELRDNKIFTCALYFNDDKNSFLKILTSTNLKENFRFSSIHPPVLYSNKFFDTLLKNRCQQYLEQYFQQYFQQYLKHYLKRYLQQNFRQDFKQYLKQYLKQYLKQNFQQDFKQYFQQYLKQDLKQYFQQYFQQYLKQNFQQDFKQYFQQYLKQDLKQY\n>MGYP001036737385 FL=0\nMAGKLAIQGGEPAITIKDPE\n>MGYP000214490624 FL=0\nRSLALYDTLLDEMHDDAISHTEVAAELAQKTIGNGESDDDDTGAGIASDSPAEASKVKAEESEDDLRLGPDDAESWSDDPVRMYLTQMGEIPLLTRKEEIALAERIETTRAAFRRKLLECDFVIRASAKVLNRVFQGELPFDRTVQVSVTDQLEKEQILGRMPHNLRTLDILLQRNREDYEIATNKRQRVAHRRAAWRRLGRRRHRAVQLVEELGLRTQRIEPMIKVVEDFSRRIDELKATLTSMKKTRRSLTERKPLMLEYRSILRCTQETPTSLRNRINYLKAVYCEYQTAKRGLSEGNLRLVVSIAKKYRNRGLSFLDLIQEGNAGLMRAVDKFEYRRGFKFCTYATWWI\n>MGYP001362031269 FL=0\nGGPGGGPAAGPRRPFEGVGVGGKDTRIEQKKQRCLLGGEEGGDDDGE\n>MGYP001241401404 FL=0\nKDIFLKIILLFPLLLNSQIQRVDPPNWWIDFKNNSFQLLFKGESISNLSPTIKYQGLKINNITRSNSSDNYLFVDFAMDSTIKPGKFTIYFNGNPQIKYKYELKERSFDKLRFNGFDSSDVIYLITPDRFANGDYANDVIHKLRENKINRSDDYARHGGDIKGIIDNIDYLSRMGFTALWTNPFLINDMEKHSYHGYAITDHYKIDPRLGSLNDVINLSEKLNSKGIKLIMDQIVNHCGLEHWWMKDLPFDDWLNFQQEFQSKPISIDKMRISNEYNQDSINKYLIKTNHRRTINQDKYSSQFDEIKMLNGWFVSSMPDLNHNNQFMSRYLIQNSIWWIETLGLGGIRQDTYPYSDKKFMSKWASEIMYEYPNITIVGEEWSYNPLSINYWHKDSNNSDGYVSNINSVMDFPLQKSIIEGINEKESWNTGFIKIYESLSNDFYYSNPFELMIFIDNHDINRAYTQFNKNIENFKMAFGYILSIPRIPQILYGSEILLHNSDRIGSHGKIRSDFPGGWKDDKKNGFNDIGITNNQKDAKLFFKKILNFRKSSRAIQKGETIHFAPFENIYVLFRIFQEELLMIVLNKNLESYKLNLNRFREIDILDKTYLDIIRNDSIKVKNSIIIPEKGFYIFSIR\n>MGYP001468330683 
FL=0\nKKLTPIMTFGKMPIANGFIDKKDLKKEFFFDMSIGFSEDLSLLQLLDHPKPEAMFNNNYPFFTSSSRFMVDHFKSFSNWLKKNYSNHIKNIIEIGSNDGTFLLNFKGEDMNLIGFEPSSNVSDLAKKKGINSVNDFFNTSSIKNYSNYINQTDIICAANVICHIPNLPDLFETINMCLNKNGLFIFEEPYLGSMFSKVSYDQIYDEHIYIFSATSISKICSLYELELIDAIPQTTHGGSLRYVCGRKNHHKQSINVKKILDQEKKMNLDNIESCLQFKKNCKNSKKKLREKLIKFKMQNKKISGYAATSKSTTILNYCDIGPDVIDYICDTTKEKIGKLSPGKHIPIKPMEYFYNNQPDVAFLFAWNHKKEIFEKEKEFSKKGEWMAHVEL\n>MGYP003628530332 FL=1\nMILLDSAQSMIRNEPITLSAVILVLTGTISYLYRERDKDRKAERERFLDQIDRLEEEINDLRNRKEKRKTL\n>MGYP002780399917 FL=0\nTGQIERRRETGNVVSSISADDVEPAAVSDIADMLTARAPGVIVQNNSGTTGTSQRIRIRGSNSISLSNQPLLIIDGVRVNNNALGLNTVEARAVWVGGQETS\n>MGYP001284371659 FL=0\nHGVGETQVRGSSSSASSSSSLKRNAKEHRNPLARTKGENDAASLGGKYERSKSKLGDVLVPPKAPARGVAEEGKLGSTTIESLSRDGDEERARDDRETDETMKKLDGYFNFDDNASNNKASEEKKSSASSLSSNDDAETAEEAKTKVEFSARKNEEDGSKTITSGTKIDESISDKDALDAYFSAKSSSSQAASVASSSSGSSSGGGDLSSAVKTALDARADEDPSLEDLKSSLKSGKTVNGEELEGKVETKPIASTPKASSLTSSVNMEVEAEKLLKEASEETEKSLSSTTKTAATGSIDSTSSTAAASEKSKYVPITTSHSMRSLSPIAQKYLRPRATSAYASTSSTSSASAAAAAAPSLHSDLASSARSLYSRDASTSGKSASSNKNAIAAKYANMFSLRSSDASSSSGKPSTGYA\n>MGYP003656136555 FL=1\nMLINLNVKNKYTNCVMKKGRRYIEPELGKGDKKGKNIKPKKTKGFAWDGKSRPVDDAYRENWKVIFGKQEKTTAEKENEEYLEEIKNKL\n>MGYP001595159463 FL=1\nMKQLNDMMRVGLGVRKMLSVCPHNPQPTTHSGNCLFQSCRAQSILEFTFSTIVFLAMVSGMVLIFRWAMMDLAERRFDHDRNLTVNSLTPEQQLAPDFHRVRAMDTFLFKKP\n>MGYP001794431668 FL=1\nMYVQVAGLQCNNAVNCSTVTLIWTDVNSVTVIAGSQENFPVVSDSTMTVLLTDLIVVQHSC\n>MGYP000352505163 FL=0\nVVISAPVFSKQLINTEIVTGGNSSTQVVAGEILTYSIVITLPEGTIPNLLLSDTLGSTSGALAYVNCVSITASANVTRTGGSGGTTGNWPSFALMAPPTELPTDTVSLTDWAMFETRLEPMQSRAHSFSVLLPISGPGSDIATLQRDMDLVRRVVSLEKPAHTRFDIQPYWTLFRLGQVRLGLDTLLGDGSRDPQLAPAMVLGQGHIGSSRTASRRDVPPDRILLEC\n>MGYP003280527331 FL=0\nMSDGTAVQFKTEKRRFLCFFY\n>MGYP003443885239 FL=0\nGVTSIGNDAFRGCSSLSSLVIPDYVVNIKGNPFSGWNGELKCLSPYFIYDNKVLFNKDKSKIIAFRDKNTTSYVIPDSVTSIGSGAFRGCWSLSSLVIPDGVTSIGDYAFVGCGSLRSLVIPNSVTSIGGGAFSDCESLGNLVFPNSITSIGDCAFDECFSLRSVVIPDSVTSIGDYAFDSCRSLTDIVIPDGVTSIGDCAFRGCRSLSSLVIPDSVTSI\n>MGYP001559223103 
FL=0\nMLAFRRDVQTTQRLGGRSLRFDGRRPVRGLGSAVVVGSGGGMTVHGVELQNCNSLPFGAQYSCSLA\n>MGYP001074122584 FL=1\nGIAVGMATNIPPHNLREVAEAVLWALDHPEATDEELLNALLARIQGPDFPTGGLIVGRQGLEEAYRTGRGSIRMRAVVEVDEDARGRTQLVVTELPYQVNPDNLALSIAELVKEGRIGGIADVRDEGSLRTGQRLVIVLKRDAVAKVVLNNLYKHTQLQFTFGANMLAIVDGVPRTLRLDEFVRYYVAHQVEVIVRRTRYRLRKAEERAHILRALGKALDALDAVIALIRGAESADAAREGLMQLLDIDEIQAVAILDMQLRRLAALERQRILDELAEREAEIADLTAILADGARQRRIVGEEMTEIVDKYGDERRT\n>MGYP001605154428 FL=0\nRLIKSLRAGFLADSFGRSKRQWRGGSHWIICNHXHRYNTHHRGHHDSRTIISSNSWRGRRIEHSWTGLLYMYVRFKVX\n>MGYP000199882868 FL=0\nMGKAKKFFMYLILTVASILSVFPLYYMFCASTNRSIDVIAGKLIPGTYLIDNFKALIAQQNLRLALCNSFRNATVLTILCLLVCSIAGYGFEIYHDKGKDILMSILLLAMMLPFVAIMIPLFKMFTSWKLVNTWIALALPSISTPFMIMLFRQAARSFPHDIIEAARPERNTDFLPDVHSGDEIYLWSGDDGYIYECVEQLSVADDHFTGQQGDHHADVSSQSEEWIQCGLWYADAGSIDLYTSYSDHLPVFTEELCKWNYGSSEIMQQKMPKQETMTQAHIRKAQGAFLLAHRMGLIEDPSMEGLKARRKKHNEELRRMEQEGQRFYGPHYFSAPAYLQYELTRFKMDFAEPCEK\n>MGYP000548054597 FL=0\nMLRKILVPVRGDGKGDNVLAHAAALARGFNAHIEITHCRAKPENLLPFGVPIPAALRAQLVESTSQVFDIEDYNLPYFIMFSDYRVATNKKYPEIENDIAESLCFFLLPFVYDNETYDEYLSFYNSYEEDEEFNLYSYKTKSGKYI\n>MGYP001129376977 FL=0\nMNDFSETNPYTPLVFNSLEVNEQNFCSNLLNRLIVFTQASFHYSSIESLHLFREIVNSSRSSQGSLFSPFFFFKTKKTNLKFQISNQKDKDKEKEKEKEKDKEKEKDKEKEKEKEKDRPKMFKTDAQLLFYCYLIAPSFRLAKANVKLSQDVIFFFLSK\n>MGYP003295116401 FL=0\nLREAYDYLLLDLPPVAEVTDAMAVAPKVDGMLLVVRQNYCDRIVLSETVQQFAFINAKILGVVFNCTSEHGGKYYGKGYYKGYYRRYYKRYKGYGYNQENQNA\n>MGYP000887695439 FL=0\nKGEYYLEAMVFDLNSKGQYLPEWYDNAKDMTEATPVILDCADAATADFYLEKMPEPVYHKVSGTVKDAETGDPIQWAIVEFYGNDPNGYGYSSYASTDEDGYYEAQILEGVSYIAYANSGYRGKKDYDTIPYQDIYLPQYWDGKSDPSEADPIVAYEDVENINFNLEKYVFHENLITGIVVGEDEKELSDIMVFAYLIDGENVDESNYKYHGFMGYTDHNGKFYLNNLVPGTYVLFAVPARPMKYAPGFYMEDDLAILTWEDATQIEITEDGEFGPYTITLPLFENIFGEGIVKGKVSSEIGKVKVDEEVQGNEDGLQGAFVHVTDYLGARIKTSETNSKGNFELKGLANGTYTVTVDKVGFKSTSFQITITDDNKVIEHGVTLVKDDNTTDVNDDVLSPLSITVYPNPSVESFNVQFNSISGKSDLQIFDNMGRVVYQQTVNSTNGANYININSDNFTNGTYYIRLSNGNSTVLTPVVIAK\n>MGYP001202805109 FL=0\nGVDGEGGAVRTWLGLGSGLRVGVGSGIGLGIGLGIGIGLGLGLGLPGI\n>MGYP000917578306 
FL=1\nMNKKFTSLLLLSSVILITTADKTRTKADTTDSSIEQQENIINEAQSAKDKSLSDISLLQSKIDGIRVEKNKTEQKISEIKKQAQNLNNKIEELSKNIEKRTDVLESQARSAQVNSNATNYVDTIVNSKSLSDIIQRLSAMATISSANKSMLSLQIKEQKDLNNKSDEVKKNYIEYDNLVKNQALQEKDLTSQEKQLKVASLNYQSTIETAQDKKENLLKQKSTAEKEAKIAQAEKEKVASAQKSAKEAYTSSSVTNTPSSSVEKSSSPKKENTKTSSNTGTTVEQGTGTSSNNDTNNSTSGTGNPNYNPYAGGGCTDFVWQYFAAKGIYIANIVNGNGGYWGTNGVSQGVLRRTNLAPGVIASGFTFHFTGYGTSTTARTSPYGHVAVVTGVNPDGTFNVQEAGYGGTFPWGNVRTNISPENVVFLLPN\n>MGYP000491110560 FL=1\nGTAIYGETRAIPLNLVDFTLRDFATRQSDDSQTISYLETDYSNSYQFNLDSNNILRLVYDLAPTARGFSRSFDGSTSATNFTVAVIPISARAPVIVSDGGGPTASLSIAENGAAVTTVVTRSNFRHLAEIVRLATRMMTGAGLAVVLIAMTAAVLVIFAVRSGLAIHRETIEVLHLIG\n>MGYP001489963689 FL=0\nSERNKYSRSIQVSLKNIIILMFFGISLFGLAVIGTLRIINKEPLTRELNDLRADRLLLKQIVSDLHASGIIDSTKAYEHFVYEFYNSHKMSFPDLAPVMGYVTRGVHMGNNHLGIDIAAKYKDDIYAPADGRIIFSGVGDDLGNTIIMSHDGGFITVYGHNATNLVNTGDSIHKGQVISQVGDTGKSKGPHLHFEIWKNNQVLDPREIIKKYKEKDVSIRETRK\n>MGYP003582534822 FL=1\nMLFFAQKGTVTDGHQYIPAVIEAGAAAIVCKDLPEVLQPEVCYIQVDEVAPVIGLMASAFYDHPTRKLQVVGVTGTNGKTSVATLLYKLFNQLGEDSGLVSTVENRIMDNVIPSTHTTPDPVSLQALFRQMVDASCTYAFMEVSSHAVHQHRIAGITFRGGIFTNITHDHLDYHQTFDEYIRVKKQFFDHLPKGTFALTNIDDKRGMVMLQNTKAAKKAYGLRVPCDFKGKVFENNLTGLLMNIDGQDVHFRMSGLFNAYNLLAVYGAAVLCGKDKIDILTALSNMQGAAGRFETYHSENEKILGIIDYAHTPDALQNVLSTIKQFGQQANIITVIGCGGDRDKLKRPEMAQVACELSTKVILTSDNPRSEDPEAILDDMEAGLTPGMMRKALRISDRKAAIKTAVSMAHADDVILVAGKGHETYQEIKGVRHHFDDREVLLEMFKLLEK\n>MGYP001208310892 FL=1\nMKKKKAYVVGTNVSKSLSPLIFNYWFKKYKINGSYNYKEIKEKKFDLEIKKILQEEGVRGINVTIPFKEKIIKHLNQQNKHAKLIGAVNCVSIVKEKTKGINTDWTGFKDCTKHIKKRNVAIVLGYGGSAKAVIYALKQMGFKKIRVFNRTFNKIKRLKNIKPHKLEEIPDYFYTADIIVNTIPKNFISKLLKAKQKPTNKTNKTGYGFDLVYNHPTLFLDSISKTKRIYGVEMLAHQAAPCFYKWFGKKPKVDKKLIKKLINS\n>MGYP000076073552 FL=0\nDLVLGVFGWVVRSDKLGKGTLDHTLKIQVESELQYWRSVLNRVVAVIKFLSSRGLAFRGEN\n>MGYP001544161807 FL=0\nMGLQQRLDSLALNDFFTLYHFIWTHSKESICNTTHCGTFYIPPRQIVPKVYNIITRTFPSVARIQGRDKDCTEICFAVAFCNSGEHVTGSSGDGFQLRRCCFALISPRTCLRPDCNDASVHRSVXERASLAVRTTHGEGNAGXTKLLRRRCXLX\n>MGYP000196507220 
FL=0\nRFMAEKRELQMKEITEQLEQGVKELFTSEMYTEYLRTMSQFHNYSFNNTLLIAMQKPDATLVAGYQAWQKKFKRQVRRGEKAIQIIAPAPIREKQEVEKIDPETQEPVLRFDGQPETEEVEIVIPRFRVASVFDISQTDGEPLPELETPELMGSVENFKVFMKAVQEVSPVPVRFDEISSGAKGYYSNTEKEIVIQNGMSESQTMKTGIHEVTHAMLHDRDFMEEQGEKKNQMTKEVEAESVAYTVCQYFGLDTSDYSFPYIAGWSSSMDMKELRTSMDTIRKTAGSFIDSMTEVIQRLMWEQPELSLSAMKQAEILIDRVEQERTLFSGEERNLLVNYAYKFDNAEETEKLIRKLAEAKAIPDLRSATEICRDIQKEIEFLPDGMVGMTELHRYGYQNEGCFRLKGRGHMNCFRKVLRYSPCIRMIRRQCWMMKENLIRMTVFSG\n>MGYP000592636036 FL=1\nMTDRPLWQMTATETANAIRDGQITAQQATEAALSRMQEVNPHLNAVVEDLSREALEQALGMESGYVLDFSDRTFNDFFYETIAIDPEDQSQLFNGRGTSKAKRLRSFIERAQPALVAKILREMWEYRDAMVFAPSAHNEEKLKESYFTTVARIEGRADVIDTSAIETFEPNETLEELVASIRRDLDANKPQAALDRLHTYCMKRFASLVRKHGGGECGKDDALHARVAKYVKILGAQKNLNPISERIVKSSISVFEAMNPVRNDQSFAHDNPDLVQMEEARFVFDSVTAFLRFSKAIDGRFFED\n>MGYP000923000473 FL=0\nGISVENTSMFEITNFDIVIEVIISGTISIHFIYNTDVFENETIKRLSGHFRNVINVIVNNLEIEVSRVELLTEYEKKQIKYGFNNSKTLFPDNLAVHEVFEEKVKNTPENKALSFNGFELTYKELDEKANQLAWFIRSKGIIQNSIVAIIFKRSIEMIVSILAILKAGGAYLPIDPMYPIERIDSIIEDSGAKLVLTQKNIFDQANISENGMFHRNNIELVFLNDVEYLLSQYEKNYIQNINVPGDVAYVLYTSGSTGKPKGTLITHYNICSKIVNANF\n>MGYP000510006770 FL=0\nRVGKRTWWYENGQIRQESNFKDGKIDGKLTEWNENGQIRLESNFKDGKRVGKRTWWYENGQIEREENYKDGKKNGKWTWWYENGQMEREENWKDKIPDGNWVSWFENGLQSSEGNFKDGTGVFLQLHENNQKSYEVIYKDGLGKMTEWYENGQIAGERNYKDGELHGKHTYWHENGQIFEEANLKDGKWDGKYTRWYENGQID\n>MGYP000191306956 FL=0\nLRTQTSGVQIRTMEAEKPPLRIISPGRVYRNDYDQTHTPMFHQVEGLMVDKNVSFTDLKGILHDFLHHFFEESLEIRFRPSYFPFTEPSAEVDVMGKNGQWLEVLGCGMVHPNVLKAVGIDPEEYTGFAFGMGVERLTMLRYGVNDLRAFFENDLRFLKQFN\n>MGYP002707266309 FL=1\nMNKFGLDNVVTEKANVELTDLDNGVKVSFSGDIDVQNPEPIFVPFFEQIHNKIIENGIKYVELDFSKLTFLNSSGIKTLIKWITKVTPLPADKKYNFKVIANSQITWQETSLKMLSMLAPGLIEIQIQ\n>MGYP000629646757 FL=0\nMPFVTTPDGTEIFYKDWGPRGGQPIVFHHGWPLSADDWDNQLLFFRDKGFRVLVAQRGAGHHAVALEKLDVPVVVDGNPRQRRLWFPLRSGRDAQDLVGRVVVDVAVLDLAQVDAGLH\n>MGYP003443031209 FL=0\nPSVMVSVTTVSTVYVPIMVSVVVSVAVKIPVVVIMSAIDVTPVMIPVVHCCTGRAVACTIMMVAIVSAVPSVTHTEMTGGVMVDIVVTTTMVPTSSSYDMPGMSTTIRGVEDRATIVEIVTMRIACIDGEVPETVTPVEWTIEVGGCTESA\n>MGYP004007491671 
FL=0\nTTQSVHDTLFELDAAGKLAPGLVEAWEWKDSLTIVLTTRSGVKFHDDTEFNAEAVRYNLERIRNPDTGSIRGGEISALDTVEVLDAKTVRLRLKQPFAAFLYPLVDVAGCVVSPTAAERWGKEYGLHPAGTGPFKLVEYLKDAHSILERNGDYWIPGKPHLDRLVLRPIPVDSTRLAELRSGGVQFAESLPWQDIQRLRAGNEVVVSEKVGFRWEWFGFNVREEYPGHSK\n>MGYP002477604874 FL=1\nMESMHFLHLLTAVAALLLGALLGGRIASLLHIPRVTGYLLTGLLAGPSFTQLVGLPSLLTTDALQELAVLSKVALALILLNIGGQFRTEQLRRFRHRILLFSASESLGTALLVSGGTVAVNQFYLQQVVPGLSLLGTSLAFGLLLGLVAIATAPAATLMVIREYEAEGPVTGTLLTLVGLNNILAILSFSVAAHLMFHGDSGMGQLAIKMFGPLLVGGSLGFFLSIWGQRLELDTEFKLLLLGGAVATAALCSALGLDVLLASMALGIVLANSSPRWHRMQEALRQVDYPLYVAFFVLAGAQLHLETLSHIGLLGVVYVVARTLGKLGGAWFGAKLGHFGERERKWIGITLLAQAGVAIGLAEQIAQLWPVGGHLIETVVLGSVVIFELIGPLAVRHGLVSAGEVPILSLLQKRAPQNAIEGFHSVLSHFRSSIGLPAGHRMRDPGDILIRHVMRQNVETIRNDTPFNELLRHISHSRYDRFPVVDESGHFLGMINYTEIRELLFEPALAKLVVASDLVSTSHLAVNPDQPLREALQLLQKHRDISYFPVVDPEDQNLLLGILRQNDVLAAFRRLDLQ\n>MGYP001551819414 FL=0\nTLDASLGDVAVLYRTRDQGEVIANALGKLGLPVKMTGKATLEQSENIDRVLGALEFIAGRKTPPVDFEGVLETSSALADLSAREVIHKVSETLFEEDGSASADIAPLVRIAKKVDEHWAKKVTKKVSFVKPGRPIDDFLDRIALQGKADLHESKVDSITLTTLHASKGLE\n>MGYP000703270391 FL=0\nMPKSEKLRDVLIGFDSAWTDSLRNPGAISACILDGGQHVTFYRPRLATFEEALHFTRQVGGDADYVLIAIDQPTVDPNRDG\n>MGYP001030102971 FL=0\nGRYRSEPPPRAGGDRSSRADGTLVIPVEGAGLSVRVAFASPIQERGYAPLVEACGMLVGLARAPSAEASASLRPVPPPPEPATVAPAVRHLYADALRVAQGDVSVLIRGESGTGKEILARYIHAASRRAAAPFVPLNCAALPRDLLEAELFGVEKGTATGVDARPGKFELADGGTLFLDEIADMAPDT\n>MGYP000938480968 FL=0\nFEAKLKELSDDAQVNGFRHGKAPRRLIENRYKKEISEQLKNELLYQSLEQMSEDKKLNPISPPNIDPNRIEIPMEGDFVYEFEVEVRPEFNMPEYKGLKLNKPVHHYTPEEIVREERRILATYGTPLPKEEAVALEDMVILSGPVKYGEQQIGMIKSHPFRVDGQLAFKDGVAPKFAEQ\n>MGYP001617072387 FL=0\nMNRDEFADKTVESYKAACLEHLRQFLRSMRLRDKVSSNPTRLGNLSVECIWHEGQNHYIENYHKQQWAWGFTLFCPQGHEIARRLVISQEQVGAFLAHQERPCYACKEAKP\n>MGYP003654168572 FL=1\nMEELVDNFERLDGPQKRKKLEELLRIDRRLGEIDDLPFGVPPNRLEACYYDVLRWLRSGEDVRAPEVGDLVDVLAGTYHTGFGRMRDTPAYHGAIVLKLDSHGRIVARLPDSAGPFAAEDRAMHLGWNVKPTRKLYLSFDEYKLKRKE\n>MGYP002623322284 
FL=0\nPPEETHRLLPCLQTGIIDDRGAAAWQWRNRGRASPGGPLTMDMAANRTIRHKGGFPPATPGRAQEWRKPMFKKTAAAMALSLGLVLGAGAIAPEAAAQTRVTLKSAKAGTSYYVMMVQLGEMMKAQSGGKIQATVEESQGSVQNVKESARRPGNFLFTTPPSLLVSAREGKKPFEGETGYDRVRALFVVPFVTIHFAVQQDSGITDVMQLEGKKFIAGGKG\n>MGYP001568520366 FL=0\nHQLRVWLTVGDVLAVRQQPQALIVMLIVSLFRHLFVSYMVNRFSSPIS\n>MGYP000925408016 FL=0\nMVEHIGYHTLKEGKTLLAIFNALEGFANNLTGLAGKNIEISTDIPSSAKAPVKQT\n>MGYP003579269052 FL=0\nMNSDVPGPDDGAAPDALDFASLDVVYIDDALAVVDKPAGLMVHDSALARGETDFAADRLREQFGRPIFLVHRLDRATSGCLLLAFDREVASALGKTLMARDVEKDYVAVCRGWPAEERFTIEHPLDGGPGKPVQKPATTPVG\n>MGYP003309607925 FL=0\nMSVKRIFLIVLDSVGVGELPDAAKYGDEGSNTLKACV\n>MGYP000957236481 FL=0\nMVEGALDARHLPGLAPFLSRETLDRLALKIGEGQIDAGCLTSLAPFLSQEALSRLVDQAAEGTFDAVHLTGLAPFLSRETLDRLALKIGEGQIDAAHLPALAPFLSQEALTRLLGLAGAGKLGAETIVALAPFLDSAVLGELIKNSARQK\n>MGYP000599625106 FL=1\nMIENNQKLGSLSSGKNFDRTQSWVERSDQISNSNTGIFIQISLPAKISGFYGLKEFNFMNCEMSGMFGPNLAKCISFYNTDWVKNEKYFSMPTNGIQKVTIPTSAVYKITAFGAGWQNYGAMAKSNVKLENGTQIYVGIGQRGKHISDGCGGTFVTFRKNGKFVPLIIAGGAGGGDYENEYGNGSTDEFGKKSDSIEESNRNIGKGGKSGYSNCYNGGNGFEGEINENWEKT\n>MGYP001217081736 FL=0\nSFADKFLEVLIFRTALFLFLLTIILQIIMPFCIYFLAPGFLDNSLVLDQITTLTRITIIFMPLISIVALLGVATNVSGKFWILSFTPIILNFCLIISCFFISDNWTVKSLPLALATVLGGVLQLIFTLIMIKKFGILKLSFKSKTIKEYDQIKLYLKQTWKKFLPAAFGGGILQVNLLVDTVLASLLGFGSVSYLYFADRIAQLPLGIIGIALGTALLTSLSKSSAIKDTKQFSKELIISLKIGLFFSIPASFVFINFSELFIKVLFERGEFSSLETNQTAQALIAYAFGIPAFIIIKSCQPAFLADGNTKTPMYIGFILLLLNVFLSYTLMHYLKHSGIALATSLVSWTGSIMYIVLLIKKGKISKFKFTFKYDQFNLFAVLIYALKIIFTSCLMVLVMKSIFYFLNIYKINEISILLFIVLFGMLTYFSTTYFLKYIPQELLKINVFKFRKVN\n>MGYP002526846326 FL=1\nMIRRSSDKISVTKPSPFNGIGEITVRSLLNGPEEMENKGRVFGHTTVYPGSKIGLHMHKGDSETYYILSGHGKYNDNGTIIDVQPGDVYYCADGESHSIEAIDEPIEMIALILYTT\n>MGYP003577118151 FL=0\nMIPSQINDTSLKIFRDGMAAYVVFEDTEWEILKNYIELKVLQKKDHFAVSGKICDHIGFIVNGSVRYYHIKDGTEITGYFSFENDFVSSYKSYVTRTPGTGYIQALEQTEFAIISYNNLEQMLNHPL\n>MGYP000225436725 FL=1\nMRNTFHLKTLAVAIAAFSVASVTNAAGLDRSGQDVTAFLQDGIYAEAVYTYIDADVSGYDNGRVATDDAGYVQGNKTGDIAEYYDFFRYGVKADVNDTFSVGILYDEPFGAAAAYTGDSNFT\n>MGYP003337284868 
FL=0\nMKEGYGEENSDIRRYSGDYLNDVPHGYGTIIYGKNIYTGNMKNGKKDGIGTIRNFTGKFEYHYYYQGKKYRGPLYRFPIYEEKKAFWKEDKFIVDFYIKKGELMIQNYLNSMNEKDIKYCKSNNIRNYIYKNFH\n>MGYP003906308351 FL=0\nAYGFVRDCDGAERHQGPLVEAALAAKRPGDAGELANELARVCLESGNADKAENWYRKGHDAGIAQPDFTPATKDLWEFRTAHALAALVGDQGRQRRDRVDARAHERVGVAEAEPIVPVASAPATAAFSRGCVAAKITGLPRDVLYAHALTMKPEEPARS\n>MGYP001106728357 FL=0\nMINAIIFSKDRAPQLRLLIYSIQKNAPHAFNLNVIYKYSNDKFKEGYEKVKGEFSSICNFVEQ\n>MGYP000556042202 FL=0\nMRLKLLVALVAALLLSACNDPHTGTFIFTAIPDQDESQLEKRFGTIALYLEDQLGVPVKYVPVKSYAAAVTAFRNCLLYTSPSPR\n>MGYP003339182432 FL=0\nMISRRNFLGLSLSTVALQRLSIFDAFAANADISHGLRTKKEVALTFHGAGDLKIARDLLAIASDAKTPISVMAVGSWLSANPEIGKEILAGGHDLGNHTYNHKAMLHLNLNEAKSEIAKGKAAIIKSVGSAQKYFRPSGTPKSNATIRKAAIASGYSNCITYDVDTLDYRSEEHTSELQSLRHPRMPS\n>MGYP000070210673 FL=0\nMRSKYISKLILLCAIIIISNINVFSQDEDSIKTIEMKEVMVSANKTEKPFVELTVPAKIISKKEIENSGHSRLDEIISEQVGIITVPGFGGSEGIQLQGIDPEYTLILIDGLPVIGRVAGILDLSRISLASVERIEIVKKALFYDLKLNKKKVVVISFSSLTTELCKKYKSNIILRGLRAVSDFEYEFQLAGMNRKLNKNIETLFLMSDVENQIISSRFVKEIVNLKGDIKKFTTKSTIKLLKRKYE\n>MGYP000373531853 FL=0\nTYWFLIHFIFERNKWRYAKINESPGILTIREPNGTDRVELERLEVEEARETLGVFIAMDGNQDAQTQALKDKAATWADKIRTGSFSHAEAWFSLQYCLMKSLEYPLMATCLTKKQCEDIMTPVRKAVLPALGINRKLSLVVSQAPKKYQGLGVLDLWTVQGSLKTWLAINHGDASTITGHQLRASMELHTLEIGLPGQLTQHDFEIYGAITTTSWIKNLWKFCQHSKIQLNTTTPQLQLACTNDSLLMGTFAEYGYREPQLSLLKLCRLHCHAVRVSDISTGDGRRI\n>MGYP000570708825 FL=0\nLERYDVDPANVLGAGDGGNDVGWLSGIGFPVAMGNARPEVHEIARAVAPSNADDGAAHLLERLAAAHGGA\n>MGYP000034617079 FL=0\nRVRNGAGRAVVVQRLGQDRNVGTGRVWPYQDREVFDTADGARFDLDSAPGGLPNEGYFGTRSTSRA\n>MGYP003372218023 FL=0\nMTNYSVYIDESGDLGINKGTHWFVISAVVV\n>MGYP000394300602 FL=1\nAKERMKLVDLDPAFGARSVNEGFSGGEKKRNEVFQMAVLEPRLAILDEIDSGLDIDALRIVAGGVNALRRADRAILLVTHYKRLLEYVEPDHVHVMAGGRIVRSGGPELADELERTGYAWVAGAAPETAAAGA\n>MGYP003610839716 FL=0\nMIEMKLLVTGGLGFIGSNFIRLMLHEREDCRIVNVDAMHYGSNPDN\n>MGYP000586146873 
FL=1\nMQDELKVYEEKMEKSIEAMMSEFASIRAGRANPHVLDKIKVDYYGTPTPIQQVGNISVPEARMILIQPWEKSLIKPIEKAIQTSDLGINPNNDGSCIRLVFPELTEDRRKELAKDIKKKGEAAKVAVRNIRRDANDAFKKMEKNNEISEDDLKDAETGIQKITDKAIEKIDKAVDNKTKEVMTV\n>MGYP003291547436 FL=1\nMLSFFVGALSSCAAQLLKLMIHGIHHLVEHYLIEQHHWWYLITPMIGITLAGLFVKYVVKDDISHGITKILYAISQRKSIIKLHNTWSSLVGSAITIGFGGSVGAEAPIVMTGAAIGSNLAKLFRLDQKTMMLMIGCGAAGAVGGIFQAPIAGLVFTLEVLMMDLTMTRMAPLLISSVTATAISFLANGQEAMFPLTNSEPFFVERLPWYILLGVMCGLVSLYFTRGMNHLEQFFKHHVQNIWLKFVVGGSVLGLLLFLFPPLYGEGYDVIKQLINGDSVSAIVNSPFEQLGKSNWVLVGYFVAILLFKIFASVATNGGGGVGGIFAPSLFMGAITGFICARLMNMIGISVPEANFALAGMSGLMAGVMHAPLTGIFLIAELTGGYHLFMPLMAVAVISFLTIKIFEPHSLYAMRLAQKGELLTHNKDRSVLTLMKMENVLETDLRTLHPEMTLGELVKVIAESSRNIFPVIDEEGRLLGILLLDEVRNIMFQPRLYDRFIVKQLMNSPQAILTNTMPMGKVMEVFEDTGAWNLPVVDEQKKYLGFVSKSKIFNSYRHVLVHFSEE\n>MGYP000629932273 FL=0\nKSDVSIARTIWQENEIRRLERAVTGYFDYIEDLIERENTFNMEQFAASVNEFLTFRKYQILPDKGRISAAQARQRQKANTIFLIKTNGLILTLTKKLGGCWVKSNKMK\n>MGYP002789926533 FL=0\nREALDALDASERAAQEALLKAREAADAASAAAGEKARDKRGVVLEPGDAVEVATLGGKTGKLIERRGSDAVVMVGALKLTVPFAALRRVSQRHLKDQAPAIAIIDVPEVMAKTEVDLRGLRVHEVDDAIVQAIDAAHRADLRALRIIHGKGTGALRERVNQLLKGDKRVKSFRLGAWNEGGAGVTVAELS\n>MGYP000243790712 FL=1\nMKTGFRKSQKGAVAIEFALVFIIFFAVFYGLVSYSLPLVMMQSFNQATSEAVRRSVAVDPNTPNYSTVVLNTANATLTQQLSWIPPVFNLVVGVDTSSQYSASGLLTVRVDYPVSKLNQVMPFLVLPVVGTVPNLPTYLTAKSSLQF\n>MGYP003301794412 FL=1\nMNKTKLLILLFFIALATNVNAQFGIGLKGGLDFNSVTRSNSGRIDETYHAKNGADYGIILSYQINEWFALRANVEMLSRSHTMKRNLNAVKGLYTDYKNQYLTVPVMADFTFGGARVRGQFMMGGYVSYWMMANVSGNTFDLYNKIRPFNEKMEFNEYHNRFVAGLVAGPGLSVALTEKISLELDALLYYDLVSYMKVSKVSPDPRYNNTASLTLGVIYKL\n>MGYP003383111361 FL=0\nMYKTSKLRKLVFQRLTTPEGTRAQQSLSSGTGQSLHDLVVQAMINVKLVKW\n>MGYP003686761737 FL=0\nTPHAPIHARDTRQEAPVFFQAEDGIRDRSPSRGLGDVYKRQVQLNEKFSDGKYIVKSQYGNSKSTVNTSSFLIATSNISSMESTSSEIPTWIKNNAGWWADGSIDDDSFVQGIQFLVQEGFMKITN\n>MGYP001302444474 FL=1\nRSNSDSNWANEGNLENEVVLEAEFDLGS\n>MGYP002051420820 
FL=0\nGRQDRQGGQRAWTPNQTTSTITSKKIILLAYTYTYVISNYFSPTGSLLYYVSCNPEIQDKIFDEILDTIGSDEITHDNISKLDYLEACIMETLRTCPPVIEHDRVCTNDCVVQGIPVKKGVKICMPNYPAHYDADFFPEPEMFKPERFLKENADQIIPYTWRPFGSGNRVCIGQRFALMEIKIFISKLLYKFKVERTPRTELKYSPGGFFIISYPEIRVALHPRNWTNKILQKKVFMRSGILRKINFRACKEKPSYKKLCQKMVDK\n>MGYP000789720163 FL=0\nSSSSPMVLVDGMEYSLNELNPGDIETISVLKDASASIYGSKAANGVILINTKNGRNSEKMNVSVRLENTFSMPTMVQQVADGVTYMQLYNEAVFNTAKETGTLHAYQPFYSADKINGTKAGLNKYLYPNNDWYDLMFKDFSVNQNLNLNIRGGGRKVSYFLNAAVSNEN\n>MGYP003304858611 FL=0\nMVTERTRELDESNHLLEQKQLLIEQRNKDLEQALQEKDRLLSVIAHDLKNPMFAIVGALDSVLKNHSSLESTWKTLKDIYLSALNLQSAMVKLLEWARGKQTDVVCHVEDASVRKMVQEVVSLLNGLFKEKKIKVSTSFNVSHCALMDSRMIGTALRNVLSNAVKFTPEEGSVEIEVLEESGYITMKVTDTGVGMTEEQLVSIRNNENVISTMGTKMEKGTGLGFKMAKDFVEKSGGVLLVDSKKNEGTVITIKLPVALTDD\n>MGYP000358995731 FL=0\nPSGYHEERVMSKCENIYDTLLQVFEISSEKDIPTFEAANHMVEERLETIAHIKSIKS\n>MGYP001565574238 FL=0\nMKALTLPFPPSANRYWRHTAGRVYVSEEAKDYKYYAVMEALRQGILAPLVGKLSLVARFYFPFPVKGDLENRLKVLDDAMNKILWDDDSQLWRIVLERHYDRANPRVELEV\n>MGYP000188450185 FL=0\nQITASLGGVSTGFPREAGFDITVASEVMAILCLAKDLSDLQKRLGDMIVAYTRERKPIYARDIKADGAMTVLLKDAMQPNLVQTLENNPAFVHGGPFANIAHGCNSVIATTTALKLADYVVTEAGFGADLGAEKFLNIKCRKAGLAPSCVVVVATVRAMKMNGGVAKADLGAENVEAVQKGCPNLGRHIANVKSFGVPVVVAINRFPTDSDAEVELARKAAEAAGAEAAVMSNHWEEGGKGAVELAEAVVAACEQPADFKLLYPDDMTIKQKIETIAKEIYNADGGTFE\n>MGYP000733041054 FL=0\nSPCSFYTIGTQQIFANTSDWSSEFFARGEEVGLIPSSLSQSKKSYITRKNFSEIAINFYSLYTGNPAVSINISPFMDEKSPKIVKAYELGIVNGYIEEMMEGQKVVKVFTHEEESIADFNRLNDQLFHSADNANKFGNILMPVNAQIGNISYVLCAIVGGILALGGYGGFTLGKLASFLTYNKSFGQPINQLSMQLNNIVMALAGSERIFALLDEQPEVDDGYVTLVRAKWENGQIVESKERTGMWAWKHTHQADGSVDYIELKGDVVFDDVDFGYVPEKTVLHNVDLYATPGQKIAFVGSTGAGKTTITNLINRFYDIQDGKIRYDGININKIKKDDLRHSLGIVLQDTHLFTATVMENIRYGKLDATDEEVMAAARLANADTFIQQLPNGYDTLLTGDGANLSQGQRQLLAIARAAIADPPVLILDEATSSIDTRTEKIVQDGMDKLMAGRTTFVIAHRLSTVRNSDCIIVLEQGRVIERGSHDQLIEKHGKYYQLYTGNLAEG\n>MGYP003499035801 
FL=0\nMTNSSFSVLIVDDEPNIRSGLAKGLISEADSIETAKDADEALLAFGKHDYQLVLADVRLNCSMNGIDLMRKMLLARPQTAVIVITAHGTMETAVEAMRAGAFDFIAKPLDLNLVRQQVRKAREHYQLQLENRNLRNQLANAGEISNIIGNCTAMQEVFHQIRQVANTDATVMIHGESGTGKELIARALHELSDRSGGPFLAVN\n>MGYP002865127206 FL=0\nMERNELKKKAKEALRSTDLDEKVGAAANEMKEKVQDVLDKTDLDEKIKAGADRLREKADANVDALKAQVHANAEQLKDKVQDALDKTDVDERVK\n>MGYP000383000818 FL=0\nMTLLVAGPEVEEQCRQLGLPLAAPLAEGWALPTKPRCLHLEKGPQGFGFLLREEKGLDGRPGEWEPWGRWGKVGLGVGTQAYIHLSVHRRGVPV\n>MGYP000367940092 FL=1\nLMSGESVLLEPILSFVIEVDSGDLGRVLFDIQRMQGEAEPPQAAGERMEVRGRAPAACMADYPQTLISATRGTGRISLRFEGYAPCHNAQEVIEAKGYDPERDVENTPDSVFCSHGAGYPVKWDQVPNHIHCK\n>MGYP001277400934 FL=0\nCARSVLKPRPPPVPPAPPKPLVCAAEPARQLTPRELPRVPPAVVQAEIHEHLADVSTGPDENMMRMLFEAEPDPALVFLKAVRPSPLPRTGPRAVLASSCPAER\n>MGYP000821197694 FL=1\nMIMQNLSLIHISEPTRLLSIS\n>MGYP000868773532 FL=0\nMLSINERDGVRLDALALPHRPQFFSGLGLHVDLPGLDAQGPGNGVAHGLAVRRHAGCLGHNGAIDIADLPPLLAHPPDGLGKQAQRVGAPENRVGIGEMRADVAQRGRPQQRVGDGVQQHVGIGVAEQAHGMRDGDPADDQRAARHQGVDVPALADTEIDGCVHAARLFRMASARAKSSG\n>MGYP003609178968 FL=1\nMLRKPVYRSWAYTADADAKSKSNAEYFEELSHLRSKEHMSFTTSPQYAHTTFSGELLSEEALALTADEILLLMDHGNLCFGGRCSKSGNKFSGSYNTD\n>MGYP003113185133 FL=0\nKKKKKIRIGIIDAKADQILTGIGTVADNPELGNIIDIVVGMGITQTLVGKTSIGAGSTSSLSGYLKGMVTEVGEGQVSVKKKKKVEGSTETPRDYQEGGAFPFDDLGSLGIHTAGISTAAATVPYAGRQDWFSQQTVAISTSTVGGSTITTTQPWNTVADKPGTSQYAADRGTRFDEVHVVVIDGAGKVSGNAGTILEKHLGLSKAKDAEFSAGAPSYWRSYLKTNSAFVFGGDEPSGTIDVGFDVGGFSPAGGSWDKTAEGTIFKSIGKFNGVMGGGKNYDGNTDITGDNALAVDLSKLVTGYSLFENADNFKVDFLLMGSADYSKEIAQALANKLIAVADTRKDALAFISPYRKAFLTDTVAGSVTVNNDETITENVLEFFSPVTSSSYAIFDSGYKYMYDRFANTFRYVPLNGDIAGLCARNDIDNFPWFSPAGTTRGAILNAVKLTYNPSQTQRDRLYSARINPVIVSPGGGIILFGDKTGLAKASAFDRINV\n>MGYP000828330599 FL=0\nMRKLNYSLKELVLADLYRYEGKTDTKSFLHAYATYEGFKFSVWLRMCSVARKKKLTKIFILPICRMIYRHYKYKYGYDIPYACLLYTSPSPRDKRQSR\n>MGYP001429112534 FL=0\nESGGITQHIGAYEVIVEGDKKITFLDTPGHAAFTAMRARGAQVTDIAIIIIAADDDVKPQTIEAIDHAKAASVPMIFAINKSDLPEADIDRVKKSLSGINILVEDWGGKYQSQTISAKTGDGIKELLEKVLLEADVMDLKASREVSAQGVVVESRLDKGLGPVATVLVNKGTLK\n>MGYP001154957988 
FL=1\nDVCFCKANKGCAVGESSTDGSFTNDSIIWRTIDGGKTWKQTYAGEGEGGLGAVTFTSKKKGWAVGRGGTILKTKTGGRKWKKVTVPAGAEHYDLTDVSFPDKMHGWAIGGLSQGATDYNIFLRTRDGGHSWDLTTFNMTEPLSILWKISFPTDTEGWAVGDEGRIYHTSDGGTTWSEQESPHTDTFIQATDVHFTDADTGYVVTSDGYLLTTINGGADWEIAHHENSGFYGIAFGDLLNGWAFGADGMAVTTLDGGETWQRTTEGATEVLLGCSFADLSAGWAVGAFGTALGTSDGGHTWRDLQTGTVEHLRAVKFIDRDHGWAVGDSGAILHTYDGGESWAPQESGTGQALAGVDFVDSLHGWAVGGDTTLLRTVDGGETWTASSADAAIDLYTVDFVDTMHGWAAGKGPGHVLRTEDGGETWDAVEVVFIQGQTVAGYFSVRFRDAYEGWLCGAVQVGLDDATVIGHTTDGGWTWDSQHLSRSTDHILQAMAVTEDGRGWA\n>MGYP004345682747 FL=0\nALMISIKNFPNPSLKVYNVSALICFQSTQNPNKTAPDSPATQHRTGFKDGLATSPIDRHFP\n>MGYP003480708303 FL=0\nMYHSGYKKSFKITGFALVELLVSISILVMVTGAVMANHGAFNSAVLLRGQAYEVAFQARDTQLFAVSIMSDAGQYRNIYGLHFDKNNNTGYKIFRDSNRNSYFGTSEEFGRQGSLDSRFVIGDVRWVHSNGSETSINNVSVLFERPNFDAKFFEAAAPGGELSNAMAVEIDIRTKGTSGNTNGEVRTVEITRTGQI\n>MGYP001578248368 FL=1\nMKEEIKRLPQTLSELRKQEDEDDYSPRPRGGKPYKRKFLISFKKNEGK\n>MGYP001074384480 FL=0\nRHHRGPGDHGQRGQLSGRGVHHEGRLAWGPASQDPALHPAPQREGGEVQPADGR\n>MGYP003184699802 FL=1\nMYKKKQITCSPCFSDNPSESLDFNPFVDKVAVARPMSYYLNGGVDLDGISTRKPLPDAFDDAESIASGDVNVFTDLTVGKLDLMDMASTMASESQARALKDGARETNFD\n>MGYP003330398148 FL=0\nLLPSFAIIVLGTIGSIPGAIVGSIIVGFVRALSSPVLIGVGLPLGRSNYSALDGVMPYIFLVAILMIMPEGIGDAYEKWKIDRLRKKREASVRDDKLQSTTYKCFMERSYYVYLLASRRMGTLYCGVTNELMRRVYEHKLGQADGFTRKYGVSRLVWFERHELVNNAITREKRIKRWRRDWKIELIEKDNP\n>MGYP001273406180 FL=1\nMAIIYMLFKHISQLFSYKITLLFVFIVLFSIVYMFLDDKHFSGVNFIKDAIKEEVIKKKIEKKVDKTLENFTGDVFSFKPITANDEEDVDTKIDRVAEVTEQEVKEQDLSAEKIETSYPQKLFDRFYFSINTTTLLGYGDIYPVTNVCKSLAMTQSLLTIFLIVV\n>MGYP003308729374 FL=0\nMIAKIEKCTLSGTAYAPTSKSIAHRLLICAALSEGVSIIKKVTFSEDIYATLECLKTLGANYTVDGDTVIINGIENIQQSEEKIFNCRESGSTLRFIIPLLLLSDVKQILTGKGRLIERPQDVYEDICNEQNLLFEKNDKITVRGRITAGNYYVKGNISSQFITGLLFALST\n>MGYP000219845609 FL=0\nTTTTTANITEPTAVVISGAPVTDANCTGANNGSITINANGGTGTLQYSIDNGITYQIGNTFSSLSPGSYIIVVQDANGCTATTTAIALPAGQLILSGFGSGSLKSKIIKAKSIFRANECDEHSGEQLYILYTSAMMEKILGDTTLTSADFMAGKMIQEGGVGGKWMGFNWIPYEKLSQGAAVGELRTVAYCGSAIHFGEADITGFDITTRSDK\n>MGYP000496951928 
FL=0\nMSIEAMKQALETFKMLNLTQVIEVQWTINALRQAIEEAEKQFNPDWDQQAVLVKRIRELEAQQALDKKADNARELGLDYEPTHTDHPMRHWDRTCPACVEQAEKQEPSRAQTKQIVEGLKHCHHPDSQHEFLRVWIKDWTAHKSAQPRKEWQAVNGKLEVEPIKGTLLPQAQGQEPVANEKEGSPCPEFWDWLPKAYNFAGNGVFTKYNMEVAFLAGKQFSSTAPSRTSIEHAVIAGVLFDFMGWLTS\n>MGYP001105606284 FL=0\nYGMIPCYKWPRNSSRLESFLQKQGTLHPKGYTYSEVKKMTKSFAHKLGQGGYGAVYRGNMPDGREIAVKMLKGIEGDGEEFMNEVASISRTSHVNIVTLVGYCLQGSKRALLYEYMANGSLERYTFGNNSTQGEDTLSWDKLFNIVIGIARGLEYLHTGCNTPIVHFDIKPQNILLDQDFCPKISDFGLA\n>MGYP001562148884 FL=1\nMILIGLVTGLGAMIALSYWLTGSVGSNPAAADVCAEVATPVLDGPVADVTLGTVCGDIDLRLDEPISGTDGFEGDFRYSGPPSDPDRPRPGYLVWESDGCSAPVLGRGPFDFTLACNRHDFGWRNLKHIDGDDVPTWQVENKDRVDAGFLHDMRKRCAAVPAIVRIGCDTTARVYYTAVRLNPSGVKGIPGSG\n>MGYP000254919864 FL=0\nRYHKIIIMTDADVDGSHIRTLLLTFFFRQMPELVERGHIYIAQPPLYKLKKGKQEQYIKDNDALETYLISNAIDELELHVSADAPAIRGEALAKVIADYQTSQKSLSRLTLRYPASLLDGLLELDAFKIDQAVSSYQTAKVKPKVIGSP\n>MGYP003314355870 FL=0\nKESSAASDVYKRQVQESVLRKEETPLVSHVRTIVGHIILMENYWQQRA\n>MGYP003594184147 FL=0\nNDKFRGQSMMSIDQMELFFQLLISQNSDRKVVEVFPSYYNKETTFGQCEILKETYGVNSKHDYAETISLSSERLIVRFRNIFVVGILFKRDFITWKEGKPIENEFVPFYKHLLNFVSFEDKV\n>MGYP000202344024 FL=1\nMETATKASDQQATNAALAALAATGNSYALGQLWELNKGLLRSMFWKWYPAHKAQADAHGLTADDFEQEGIFCCPARRPDLRPGTGSLYHLADCRHAAPDPAHPYQRPRPQRDRR\n>MGYP000205932652 FL=0\nHQARMAPLRHQVDAGRVVQIDLHIPETSHMQHAPFLDEQPPLALRPVRPHAADGHAQPDHPGDGERRAKQHAQPVEREIGQSDDPQRRDRRGQRHRRLEPPFQQGRRLGADHRETLA\n>MGYP000157303393 FL=0\nMKAKLLSTLKYLFFLGIGIAILIVVFKDKDLDKMVEDLRNAEYKWLIFSMIFGYAAYLFRGLRWLLLLETMNYKSSANHATQAI\n>MGYP001265825478 FL=0\nMLRFILLTLLALIVWVVAFVGGTIAGLWREPIAPRGDTAAFVKAATARIDREHKGNVAFTLVEHGRKVA\n>MGYP000910426799 FL=0\nMNMNAVTRAERGCVEAPTVSFTLNGRQISALASETLIEIATRESIDIPQLCYRPGLEAVGNCRACMVEVKGERVLATSCCRFPLPGMDVTTDSERARKAQQMVLELLQSDLPKTALTRNNEVDEWAARLEVCSPRFAPRPAVAADLSHPAIAVNMDACIQCTRCL\n>MGYP001021135751 FL=0\nFKARFFALWAQNDKKHTQNDKKHTQNDKIFSEWQYILRMTKHT\n>MGYP001288254412 
FL=0\nMAGHNASKRLPLATQGRDRGVPHEKPRELLPNQRAARTLRKVPAHDQAQASPAAAQVPRLWKRDRVEHYRSQRGEAVRTWDIQQGDCLDLLRALPDNCIDAIVTDPPYGLSPDGRCRTWDDIESGRKGGGFMGKQWDAAVPGVTWARECLRVCKPGAHIVAFGGQRTIHRLICGLEDAGWEIRDLGAWQQWQGFPKSLAVGKAIDAHHGAEREVVGHADRKTGPGRHLAALAGNPGESATPSITAPATEDARRWEGYGTALKPCLEPWTLARKPLDGTVAANVLRWGTGAINVDGCRYGYGDPAWPGPQGDPGGRHNSADRSGSPTVHLPPVSLDSHDLGRWPANVYACPKASRAEREAGCGHLKGRAGFEAVERTEGSAGLDNPRAGAGRTAGEVRNHHPTVKPTALMAWLCRLVGGQPGSLILDPFCGSGTTGIAALREGFRFLGFELDPEYIQIAEARIAGDAPLLNRRESVLG\n>MGYP001416122492 FL=0\nSEKEHHPDYERNTNHIKWRFVMDNANFCSDHKQVEFCAHELDFTCDYDAAITKKTGKHHKHTKNKTKRQYSGRDSEDNGSDMDLFEYTLNSDSESDTSQRGSGRKTSKKPKKRSNTGDGVKDSFLRDSMQFHPYNKSEHDTLNSTEMRWSGRKSYRDNRRNIGLNNNKSRARVVTVVS\n>MGYP000266266674 FL=0\nMGMEDFWEQLPTGKEDKPLLFEMGPLEYDFHDIDGLYFMLDRRLSGCLLMMLSLIHISEPTRRV\n>MGYP001810632152 FL=0\nALENMPLEELQGQVQARQQDLEGLFRFVNSQEEELTLQRQDIEELQVKLSRSSEGERPGLEAELADQQEQYNMLNETLVGQRRNLREREEILSKHQEVLWRRLGNPPGLGRSKRLDVGSALQKAEAWRQNFGAAVQNLTGSVESLQQSLGELRETVTQKAAAMEGKQQELKEKESALATRQQEVLELAGRVSLYQEMLQPERDRLHSLHEKLEELGAAIAHLDETKDYQQQAITQIRDALMPIISPSA\n>MGYP000787850220 FL=1\nMCKAKAWVLALTAGLLLLLIPAQARADVTRLLILNDEQTSETSAAATDVLRRFALYSSWTCTFVSSEDVPDTCLLYTSPSPRD\n>MGYP003299208211 FL=0\nENRCQNGPVQGQFSGRNRDVADEGAEGTKYEHGCHKHPGGASGVLHGNHFLSKMVLIVPEDGAVCKMYLIRQEPKNFFKMRIIPIDK\n>MGYP003980343243 FL=0\nMMKSKIDPTVLYPSRRSMYKQDALAIERNEELPLFDATLLDTDVIIVVGKRQKVKDVAAYPFYLVKENNTVNSLVTTVEIQLGIYEVSVNKEEEYLDDTGTIDISLIGKPLLHTFVTKTLLESILSPTPTVNNHNNNNHNNNNHNNNNYNNGFNANNENPEENNNNNNNNTLQPSETERKRKSNSKTALEAEAENYIDIMTPTKT\n>MGYP001799802231 FL=0\nYVIYINTFSKVLVPGLRIGYLVVSGPVRQLLLQQKLNHDRTTSDLMQRALEAYMTVGKYQVHVRRVCRAYRQRQVAMHQALKRHMPQGVTWQRPNGGLFFWVKLPDGVTAVSLFQQALRQGVVVSPGTSYTTPIDNESPYLRLNFTVHDTAVLEEGIARLGQIVRERLD\n>MGYP003466254295 FL=1\nMSLSKIIGYASAALAVYFYKQSSDLENEIKSEKKAHEAYVRELLAANSALENKIDPNLGSYQSPIIFSATMRSGGQMLEQNEITLNCTNPTDSIIEISDFQARIWVAGYMADLCVPANILSIKIPAKKTVSFRLYARYGKMFRNYVEVKRALNLLYDGKNTSTMRAGTFIPLDKEPVLMNMQYLWVGKGFEDKCYVYDVPGSFRWKYAGWTVGAYVGYNAGNENQQKANPSYWTDTQEIDSIDE\n>MGYP001158205152 
FL=0\nMHANQYNFISSVSSNIIQVNIDITPKYNDYEMAQIIQNHAINQNGYIKNHGLMIYQKKDVYLVYAMDYVGFEFAWKYMIDAHSGKIVDQIPLIYDSGPTIGSGINLLNESITDLKVYEGSSFETMGGDLITPNLICEQFCWDYGDCDGQNYSDCIVVAEQYNCDDGYIVDCDGICFNEWYMQFPGVGNGFCNDPWIEYEEANI\n>MGYP003680783999 FL=0\nQATIFGILAGALVIIFSKNLQAIFHTQSHWMFVLFGIGIPLYFFMSVNRGTFQGHQDFKNLSITYQTEMWSRLFLIPWEPSFLVALGIGLSFLFGLIPSNLKDISFKSKAKLLPENSKRVTQFMLLTACYEFTQIIINNSDILLVKHYFNALDAGLYASLALIGRVVYFVAWMFVMLLLPTVVQKQKD\n>MGYP001343183673 FL=1\nMSNTYERLQKVIAQSGVTSRRKAEKLIEEGKVKVNNKVVTELGTKVSPDDKIEVNGIQLEKEVPVHYLFYKPRGVISSVKDEKGRKVVTDFFPEIEERIYPVGRLDYDTSGILLLTNDGEFANLVMHPKHGVEKVYVAKIKGIPSKLELGRLRKGVKDNGELLKAIKYRVISSDKKKNTMILELTLQEGKNRHVRRMMEQLGYPVIKLKRERYGMLTLDGMRVGEYRKLTPKEVKQMINLATQIVED\n>MGYP001231558494 FL=0\nKNSDLILINGDKDIDFEKKLFSYNAKVKIYYSVYKPINADKFKNKKILALAGIGNPENFFNLLKNSNLSVSEKNFFPDHYEFSKSELSKIILKAKRNNFCIVTTEKDYFRVKDYNLAEIEYLKTELVIENKKQFLKDIMKIYD\n>MGYP000160763201 FL=0\nMINKSIKYIGVILLAYTLNACNEQRMSSSSETTTPVWLAEVGKRDVLELTTTTGTAKAAKTVEVKSETNGKYELMINPKTKRPYKLGDIVEEGAVIIKLNNKEHENTVSLPTKKMQVDIAKKEWDGQKAVFEKGGATEKDVLNAESSYIQAQTALETAYTELAKLTIKAPFKGAIVSLPYFTPNVEIASGETMVGLMDYSHMRSEERRVGKECRSRWS\n>MGYP003702127599 FL=1\nMSAMKRASSVVKMKPLSSRSKPLPVNDVIAATDLPTPSPASPRGGRASGSAMIRCEFFARDVCENFFLAIFPFMHKFQDDPMITNLKVSEVKNLRKFSSNIWTAIKYMGRNLYSHL\n>MGYP001407002453 FL=0\nGFAVLGGLKPALNLLGNVPLSVLTDYNLAVIPMFILMGAFASHSGMSRELFGAGRAWLGHRRGGLAYASIAACAGFAAINGSSVATAATMTQVALPEMRKSGYDAGFSAGLIAAGGTLGIMIPPSVIFVLYGIMTETDISKLFAAGVMPGLLAVLLYFAVVQFLGWRYPASMPLGEPHSWPERWTSLRALWAVLLLFLFVLGGIYGGWFTVQEAAGIGAAGTLGIGMMRGRLRWQQIRAALIDALRVSSAIMLIVVGAYLFGYFLTITQFTQKAVAFLTTLPIGAYGVLALVMLGYLILGAVMDELAMILLTVPIVFPAMMQLGFDPVWFGVIIVMAVTFGMICPPVGMNVFVINSIARDITLARIYRGTLPFATELWDPVLR\n>MGYP000300748531 FL=0\nMTVEFTFQAIFGFLSNFVEYLCTIQKRIYGIKRLHHSDRCLLLDDIGPPIETLRSIPLLVSRYELLAHCLYAVTSYQFSFNLVCLDKVTIHITISTIHKMQNILVSKNNKITSTS\n>MGYP003495590882 
FL=0\nMPTGHWPAEAAHTDEYLQVAPGICYMNIPARDKYVPGGEMWVTESGDAGGGGDTWASTYLDVLRTLNELGSFCTLTNGVIFHNTLASSDYGFLQHGSFDPRPNYFAALLWNRLMGSECYKVEDAPQTEGAHVYCHSSKDGRGNYCYLIINNSLAEETLVSVPKHSY\n>MGYP001249907410 FL=1\nMWARIEQTMAKQIRHVRPIARDHADPTTQRIAAQIERDFGAFVPPFALHAPAPAVLAACWMMLRESLVPAHVDRRTKEAVASAVSRLNACTYCVDAHTAALHALGETATAAAIADAAPALDASGALGPFIAWAAATRSPDNRLLRQPPLSAAQGPEVIGIALCFHYINRLVSIFLAPSPLPFKSARLKAIARRLLSPILTGLLQRPLEPGESLAWLPEAPSPPDFAWAAGNPTIAAAFARAAASFESAGAAVLPATVRALVRDRLHAWHGEEMGLGRRWLEDAVDLVDAELRPAARLTLLTAFAPFQVDDVLLREVRRTLPDDAALIAATAWASFAATRRIGTWLTVDQFTSGSRK\n>MGYP003567298226 FL=1\nMFSAEVFRLSGFRHDIQAGDPPLPLWWKIEQNKNMNLSRKPRPQLSLGPAAPDLALGRMHEATGPSAVIFAALAAGRLTGPILWARPAWEGGVLNPEGLAPLFDPTRLVVASCPRPLDILWTAEEALRSGAVQMVVAETAEPPALTPLRRLQLAAEAGGANTKRPPLGLILPPRAGTAGAVESRWRCRPSPAWASGQPARWRFERSYGKSGPPLVWETGVSDTIQRRAA\n>MGYP003550943715 FL=0\nMLLCPPRLIAERQAAQYEIIFSHGDSLARSIMIRGVVDAVLTLPLVLPPTVTRYFLLRLLGSRRVIGAWLMTY\n>MGYP003599591953 FL=1\nMKLIEDWKQAWKLKSVQVGAMSAFFYALILFSEQFVNIWNVIPQDLKNYIPAQWQEYMGMFVGVAIVLARLKKQPELHAPELSGINSLLSMPTQTNDLAWMIEAKKHIGLKEVSGKAHNPTILNWLKSLGAWWSEDETAWCGTFIAHCLKVAGAKYPKHWYRALDYVNYGSKLTKPAYGCVAIKTRQGGGHVCFVFGRDEKTRKLVCIGGNQSNMVCYALYAESEFQEFRWYGMTDRPADKRYNLPIMTGVTATKVSEA\n>MGYP001120090256 FL=0\nVRLLLRLLLLLLLRRTRFDLDSRSSLLLPPLLLALLLSS\n>MGYP000141974819 FL=0\nMSVIERVLKTGDTMQVSDYELTPLTEVVKIQLPGKHAGLIWNHPKAVIVRTTDGRESHLPVRDVTRIVMWATLAGGLLGAIMVARIYRKN\n>MGYP002637710184 FL=0\nTQRKKEDGTLDPIKDLFRSPDIKTIGIHLDVPKGLVLKKSDGAVAEVGIQSGDEVTAINGIPVFTFGDLQYYYDQVGRKSTSITL\n>MGYP001617737781 FL=1\nMGEILLIWMVGGWKMYKKRSYDGKNTPRLIHVLMAIIPILVLGGLLVYFAYIKVPEYQQSDTTYSSRQPAYDEYSQQWQSVQSREKQQRENVTAAYKQMSQYTQDQLQQLRTERELQKTQQKVIYPFK\n>MGYP000263732607 FL=1\nMPLFIFIRLFHHRKMSAAELDAKLVELKKNLFMLRMQHATNQLDNPLQIAVVKKDIARIKTIIRENETK\n>MGYP001213662979 
FL=1\nMAFNNFLEGVATQLINTGLRKVAGNLPGLNISVNSSNSSPVADVTRNSRSTKFFRFPLDVEADPGIGNQGHYMMFEINEQDHARLKFGGKGSPMRRVKAVSPVLSNLDQPPPARLDPIQQMNRYGSIQNYEKAVSDYKTKSVGTKRASTTEISAHIAMYMPESVTTGYSAQYTDTEIGYITSAAIDAYEKFAQGNMRGGLEEIGRRDKDLAAALNAMMLNTAGALPGLSGLKAAAEMRSGVVLSDRMELAFKGIDKRTFQYEFKMVPKSEDEAKEIKEIVNMFKLNMLPEFAGNDVHGRSLIVPNTFNIRYMYAGAENEFLHKISECVLESMNVTYGGERYKTHSATDGGAPPIQTTMSLTFKELDLITREQVMMGM\n>MGYP003703380869 FL=0\nMVPLLNSPGASWKVLAPYILSTANSPGANWRVMVPLILSACTLP\n>MGYP000959007105 FL=0\nMSGTQTETVACDVLCIGGGGAAVMAAISAKKAGADVVIASKGKIGNSGDTIMIGGSYSMDGESAKKKYGFKKANASVTKDVLFEQIVKQGFLPFRTEPCGAVRGGRPGGGLSVLAVGGARK\n>MGYP003576775111 FL=0\nMASAPSISDAFRTTLDLFQTGCDLMRQNLRRRYPDAHEHEIDRLLQTWLLERPGAERATAPAGRSTSSPDLRDGTRSGAQNDCGTRISPRTRARDRVRRTVAPAASLX\n>MGYP003283773441 FL=1\nMEQGGTLAARQRTRQVDVGGVTLGGGAPVRVQSMLTAPTADAGGALAQTRALAQAGCEIVRAAIPNEAALAGFEALCAASPIPVVADVHFDHRLAVEAARRGAAGLRINPGNIGSWEKVDLVIDAAARAGIPIRIGVNAGSIGRDLAERDDLSVADKMVRSAVSFVEHFEGRGFTDVVLSAKAHDVPTTVETYRRLSRDLPLVPLHLGVTEAGTALQGTVKSAVGLGILLEEGIGDTLRVSLTADPVDELPVAWGILGALGLRRRGAELVSCPTCARCQVDLIPIAREVECRLAALELPITVAVMGCEVNGPGEARGADIGVACGRGSGAVFYGGKIVARAPEDRIVDVLFGEIASRFGC\n>MGYP000469828058 FL=0\nSYRRDLVKLQSGRLVCGYIYASAGEGESSTDLVFAAHNLIAENGTILAQSKRFENEIVTADLDIHRIRAERRRMTTYPTTQEEYEWTEFELKTEETKLERTFARTPFVPQNKNDRERRCEEILSIQALGLKKRLVHTNCKSLVVGISGGLDSTLALLVAARACDMAGIGRDHILSVTMPCFGTTDRTYQNACELTRRLGATLKEVDIRKSVTCHFEDIGQDINCHDVTYENGQARERTQVLMDLANKSGGMVIGTGDMSELALGWATYNGDHMSMYGVNVGVPKTLVRHLVAYCANTCSESEKVLQEVLLDVLDTPVSPELLPPEDGKISQKTEDLVGPYELHDFFLYQLLRCGFGPAKIYRLACRAFEGIYSKETIGKWLKTFCRRFFAQQFKRSCLPDGPKVGSVAVSPRGDLRMPSDASSA\n>MGYP001221173772 FL=0\nMTIPSALASLLLSQAAAEQQTLIMESLDLISQNSSEDLIASSGSSTQSSSLPSSFGEI\n>MGYP001563734490 FL=0\nMSGRAMGWVTVALLFAGCAGVNYRDKYERYLEEGHKLPPSTAEEVKLQRQAYVDAVGRDSPFKEVLWDVAINGHRIARVTLRGDHVYVETRDYWLYAIEAKTGITKWALDVTRPIQYPPTVVHGLDDAMAAQRALLANIQE\n>MGYP000046061924 FL=0\nKLDAFFNDNVNYIKRFTNPEHLGIAADVEVPDLVMSSIITGAEIYLPLADLLNVEEELARLEKELAKWQKELDMSVRSSLTNAS\n>MGYP003435272778 
FL=0\nFIFCLVAFNYTMRELKRGRILNKVTFLEKVIKQIKL\n>MGYP000462850367 FL=0\nYIYKRYGTSWRIDKKVVANDPAEDDQYGISVAIDGDYVAVGAPYKNANAADQGTIYVIEHNASANAGSAQVYNYDGTSWIQIGQTLYGKTELSHFGVSVSLDYDGDIVAIGAPDVNNGVVGVYKFGTDGSWAQLGSDIVGEADGDYFGISVSIDSDGSHVAIGGAGNNAAGDDAGHARVYEYNGTRWREVGYDIDGDGDGDYFGNAVSIDS\n>MGYP000891392761 FL=0\nYNFFPFCYISRFFVQFICQIPFFFVFMRPSVFLREKRWDASTRKFWIYFNNVELPYLNNLNFS\n>MGYP000314751283 FL=0\nYQEAVKWYRLAAEQGIAKAQYNLGVMYRDGKGVLQDYQEAVRLFRLSAEQGHAKAQYNLGVMYANGQGVPQDYKEAAKWYRLAAEQGVAEAQSNLGVMYEKGHGVPQDYKEAVKWYRFAAEQGTAEAQYNLGGKYYFGKGIPQDYQEAFKWYRLAAEQGIAEAQYNLGTMYN\n>MGYP001575587140 FL=0\nFLEHMCFKGTFKRPRAIDITSELDSLGAQYNAFTGHEYTGYYAKVEARHLDKALDVVADLYQNPIFNEREIEKEKGVVIEEINMYEDLPQKKVQDLITKLLYGDQPAGWSIAGNKETIKILTKADFLKDRNQHHVASATTVVVAGKFDDKNIFKKIETKFAVFSDLRKKGYIVKTALKFGAEFRVYEKGVKPGEDHAKWILYTV\n>MGYP000040707706 FL=1\nMGMLNTSCFYSFGKEMFRKIFYKSCKRHSFCINDTKGLACGSFISLIEYEIASRKTRLPTLPFLSILFMSLFR\n>MGYP001557050405 FL=1\nMLEQYKKTAFHESGHIAMTYFAEYACQEVEVLISGDGKTTMEYGNDLLLISAITNCKEYPEMFNDLPHATKLNSPGVAFKASLILLAGSIEESIYMNNGIVDGDMEVELSGPDLLRVQNIDYLLSSIAKNHPSNFIQSNIENIMMTFSIPEIWTSITALAESIYSKDGMKLTKDEIEQNLTSTGYFDHIKKYL\n>MGYP002626139264 FL=0\nNNDTAALLAPIAISVAASMGVAARPLVMTVAVAASASFLTPVGYQTNTMIYGAGHYRFGDFVRLGGPLSLLTGIVATLLIPWLWPL\n>MGYP001591609445 FL=0\nLTESGSCPTFPIFYGTYSGVAKEFKADITEEYSLMKNQDWFDFFNNKLFTIEKNKLDSINKSKNSFELNLEFDNNLGEDINLETHDLEENNEDITKEENSEDIKLETHDLEENSDSDGKWSDITSEEEYKDVIRVAEKIDIPYFSVNFVEEYRENVFKNFVQEYRDGFTPNPDILCNREIKFKVFFQKAMELGADYFATGHYCQHEYIDGKSILTKGIDAGKDQTYFLYTMQEEILNKVLFPIGHLEKKIVRKVALDFELATATKKDSTGICFIGERNFKNFLSQYIKEQKGEFVRLDDGKTVGPHDGYCYYTIGQRKGLGLGGPGGPWFVAGKEVDTNIVYVVEGEN\n>MGYP000075518654 FL=0\nAQIGKGVHLSAGVQIGGVLEPLQASPVIVEDHAFIGAGSIVVEGVLVRRSAVLAPGVVLSGSTPIVELNEKHEKVAEYKGEVPENAIVIPGIRMKGNSGYGYQTPLIIGYKSEGTSAKVALNTLLRDF\n>MGYP001377906329 FL=1\nMETDQIMSAIFLIAVLALILPGFLSTNNRAKQFMKNLSIWTIIVLIIIVIIYLIKQ\n>MGYP003341019630 
FL=0\nMLFRSIGAFWALTLAAKPADRTHHYGHFKAEYFSSGLESVLIVVAALAIIHTAIARLQQPQPLEQLGLGLAISLVATALNGLVAWALLRAARRFDSITLRADAQHLLSDVWTSCGVVLGIGLVKLTGLTILDPLIAIAVALNIVVTGWMLLRETASGLLDRSLPDHEQQLVERSEEHTSELQSHSDLVCRL\n>MGYP001601917572 FL=0\nLKALATSRAINLIEVEENKLKLRQKNNYLQVGGRFPRLGGRQAGDRFDEIREWIAKLAVARAAE\n>MGYP000576050399 FL=0\nMADSKKNDKTEAPKNNIEDSKEQIKEKFRNKDNMVDLDSDPTKLIEIVEI\n>MGYP000088332676 FL=0\nMSSWGRPERVVVLLVGEGAVGDTSAVRERIVHQQSTYAWEFVLVDVKRGRRRAAFNHGKLARALQQATGKEFDDDRLPLEQLRFSPDRTACWFRVAGKGWTCVLKTCVLE\n>MGYP000901407724 FL=0\nMDSAGERFEAIRAALADRNNILTVKDLCELAGVSRSGYYNWVRSEKNRELREAKDRAAFEQILEAYRFRGYAKGVRGIHMRLLHMGIRMNVKKIRRLMRKYKLTCPIRKPNPYRRLQRSIRMGSAAENLVNREFESHGPRAILLTDITYIPLCGRFCYLSTILDACTKQVLAYAMSESLEVDFVLETVQLLVKHHGISLSKETVIHSDQGTHYTSLKFIQLVENSALRRSMSRRGNCWDNAPQESFFGHMKDELASEIPGWTSFEAAKASIDRWMDYYNNDRCQWDLAKLSPNEYYHYITTGEYPAGTMRRCREELSKLFKRLYEDNVLGRVTDEQYRMLAGDYTGEQKALEEQIPEKEARLEKLKAASANVNTFVEKAKQYTAIDELTPELLRLFIQRIEVGERTEKYSRSSHQSIRIVYRDIGTVDSAMEQGEAQPHIAPPLSEVFELPA\n>MGYP001844006787 FL=0\nFGNFVKITXPNLAKRHIYRPRAFIXSQHEISRPLRSRDIARTNKKSIFVGFFLAILSRSRDQIGQNGQKAHLQAESFHLSPTXNLXASPFSRXWPHKQKSIFGVFCQFRQDHVIKFGQNGQKAHLQAENFYLRPTSNL\n>MGYP000461460321 FL=0\nMERKSFASLDCSIAQCLEVVGEWWSLLIVRDAFLGVHRFDDYQRRLGISRNVLRQRLTHLVEAGILEKVPYSTRPPRSEYHLTDKGTDLWPVLTAMRQWGDRHAAPNGPPALFVHRSCGATTDTLLVCESCREPVRAGDMKLVPGPGRTLASLVSTSRTDK\n>MGYP001244209094 FL=0\nMARNWCSAHAPVGNSESPAHSLESPRLHSSAKRRGDRFTGQIVVGRVGLEPTTTRESVRTSTCQRAIDPLKVTRKKYRLREDGHDPSSSYSASATSGLMPSDGCSARLVTGRDGFLWFPLLFLFVFLFVCLALWVFLKCSGICLVCHSGEEQPMCCVVVDHRVQALLVSELVPS\n>MGYP002522304077 FL=1\nMLNNTSTDMDTHPPTQAGIGIATPVCYSEIGAKANQEDALFPLAGEATARQRVFLVCDGMGGHEHGEVASQCVAHTVGTLTAAQPPCDTATMRTTFEQALATAYDRLDEIDTPPSEGRTMGTTLTFLALCTDGILIAHIGDSRVYQLRPGEDVVMRTRDHSLVSDLIAAGELTEDEARTFPQRNVITRAIQPHQERRDRATYNVVRDVREGDVFLLCCDGVVEQLDDASLCALLLAPGSLTDRLAALRDECLRRHTRDNNSAYLIGITAVDSPARPQAAMPTSPVTQPRGRHNWVYVAIALLIALACFLLAQVFMGSKDGARAGKTDPPATETTADSAPLRTIQHR\n>MGYP002571109560 
FL=1\nMKNILFVIGSGIYPHVVGGMEIFNYYLIKKLSSFFKIHYLSYKRYDYDEGKQLKCFKIKPTKFFAPLQLAYYLLIKPQIQTVVFSYSAAHWILWHLYQKVTRLFNRNYIVVIHYGHTPPVEKKQAYQKFFQQAKAVIAVSNDIKKNYDAYFNINCEVIYPLVPFEHSNLNKKELRENYNLPIKSNIISMIGSLKPMKNPETIIHALCLFTQEEIAKYNPHIVYAGKGESMVKLQELAKQYNLTERISFLGFIPKEKVNDIMKLSNIYLIASDFEGTSVSLLEAMYNELPILASRAPGITNTLNENKDCLMFETKNAQQLKMQLLRLLSNESLSKQLAINAYRNYCNKFSYESIVNSYQKIL\n>MGYP000323132695 FL=0\nMIERLLRIDNPPAHRRRAGAVLFDKPRGKTVGVVVQHVCDIALLPKLDLLGLVPCDFFVTHARKKIAQFLRVGRRKFNKFKAVGASGVLWRDLRFRRAVGERTHGNASLVVRG\n>MGYP001035366785 FL=1\nMSPRRSFHTISCPLQKAAGLQDDDRPAFIAKPCAQYYKLRAPSSVLGPSRGQQVPEPELVRQDLDAAGLGARAPAAALHGPHRLLAQPRRQLQAHPIHERVHVLGEVQQVPVQELGHRQPPRRRHAHGRLQVLPLRRLQLLLHARRRVHPHLKSEETTASPPGQAHIVTRTIASADCCYCRRPAAAGRNLINYRGGGPAPAGEREGDEGLRPLQPERAALRRHVVAGAGAALAPFRIHLPGHESSIRSAHSATATRGVAPLYRARR\n>MGYP000942704436 FL=0\nMAAISKGTVAFSFGVDETYTGGTVTSLSVNESWGNIGEVRNETGTMISKRYDDIRKEGTITVLLEDATVPSSALGSTFTYDAVVYYIDGISEARSNEGYAEYTFNIKEYENMSSVTIV\n>MGYP000205166280 FL=0\nEINIERAFPDADHVVLEKAGTAMARILEAINTI\n>MGYP003568659006 FL=0\nFYAAYTRSPYFLLQNYRNENDVDRVTGNFTITYKPMEWLDIVERVGADVYADRRRLKYPKFTYYPVDETTGNYTRANVQSATGEYRETQFNVSEIVHDLMITARKKMGSITGSLMLGHNVRQRTSTILEASTNESAGLIVPGWYNLDNSNGPVSNYNNFSRRRLTGLYAQLTLGFNEMLFLDLTARNDWSSTLPKSNNSFFYPSASASFAFSELMKNGNLSDVLS\n>MGYP000466899968 FL=0\nARYGTRKLKKGYRSHKLKPYREVAKAEKAAFKANVNFQYHKALQENPQLTSNPFSRFMQKQKIKRQYAKTVKKGGAATAKAAAGASQTAAKEAAAFAGRHPAGVIIAIAALLLFIMVSVGLSSCGAMFSGTLNGVLGTSYTSEDSDLVEVENSYAGLENELQSRIDNIERDNPGYDEYRYDLANIGHNPHELASYLTAKYQSYTCAEVQSELQRIFNQQYKLTLTEEVEIRYREEERTDTWTDEDGNEHTDTYTVQVPYEYYILNVKLTNKPISELAEKLLTPEQLEMYRVYLETSGNKPLIFGGGSPDGSPSEDLSGVEFVNGTRPGNQ\n>MGYP003111832576 FL=1\nMSIATSLGKRLRDWQLVYVADNAFFPYGDQAESLVIDRCATLISSVMAETPIDMVVVGCNTASTVVLPALRAILSCPVVGVVPAIKPAAALSRNRRIGLLATPATIQRPYLDQLIAEFASDCTVTRIGSSELVRLAERWMGTGEIALGDCQRILRPFAEAEVDTVVLGCTHFPLIRYLLEPVLGPGVGWVDSGEAIARRLEALWQQSAAGGLGRAEQEDPVEFSFYFTGLEPPRIRSYLAATGWPTARIHPEYVPSAPGSAPGLARGVKGAG\n>MGYP004300484681 
FL=0\nPPPHSTQAARWPDARTSSSGSWHACKYAADTVRRLLRTELADALQHGAEAPAEGAPELTRLGEAIVALLLQKEGAIDVRDLFNAAFAAHWHGIDHLAAHFRVGAHHRRPHRRHEAGVDRVDPDIVTCELHGSGFCRKAPLAALAPRAVPLHSLPGAGVPYSQSARSMIMPRSTSGPGSVPNSCVTWSARSHAP\n>MGYP001071452416 FL=0\nPFIKSLKLWVNAVSKSPALKPLVQPLVIVLLSAIRAKESHLIFLPYVSIILGMVNDLSLSCETFVPIISSCLSALNMCSNKLASKSLTAEGREPNISDVVRVSDRQLKDKRVVRTLTLMILKELTRHLCFLARTGAFPEVAWPVAQTLRKLAKSNSTLKPEVASLIDSIDKTIVDIKEKRAAEIGTSLFQFSFEETPMGKEYEKVLTKMEKSWEYKDEEGDEEEEDDEDDDEEDEENTKKSMSKEERSKRSIKRQRQNEKKRALKQTVPEDALVA\n>MGYP003153901614 FL=0\nDTARAVVDGLAAKGIACPAVTGAGTGTFELEAASGVFTELQAGSYAFMDADYGRILDADGNRIDAGEWENAFFILTSVMSHAKADKAIVDAGLKAQSVDSGLPVIYGRDDVEYVKCSDEHGVVADPKGVLKVNDKLKLIPGHCDPTANVHDWYVGVRNGKVETLWPVSARGKAY\n>MGYP003386720413 FL=0\nMGQKVNPVGIRLGITRDWTSKWFASTKNFPSYVHSDWLVRDYLKRRLAEASVSRIQIERAAKKANIMIHTARPGVVIGKKGEDIEKLRVDVARLMKMAVSDVRVNIAEIRKPELDAQLVAEGVAQ\n>MGYP001336422905 FL=1\nMKILKKSQERTEEDRRELSRLVQDIIDNVRANKDEALKEYGRKFDACEREQIRVSKDEIEEAYAQLSEEEKELAEQYADLE\n>MGYP000344590912 FL=0\nKGDVDFAQKLARLGNVWVNDAFGTAHRAHASTAVIGQFFTDKVSGYVMQAELDNAQKILEYSERPFTAIMGGSKISDKILIIERLLDKVDNLIIGGGMTYTFSLAEGGKIGKSICEPDKVELAKQLIEKAKAKGVNLIMPLDNVCADDFNNNANRQIVERGCIPDGWEGMDAGPKSLELFDAVVNQCKTILWNGPMGVFEKEKFSLGTEAICKSLREAKSNGVNVIVGGGDSIAALKKLGNKDWVTYISTGGGALLESLEGKALPGVKALSNDY\n>MGYP001550816469 FL=0\nMVLNYTRFFGVFTGAIERVAVTGREGNIGPSPTDSNLMPTPLVFAHNAQDDIALLPAMSNRHGLITGATGTGKTVSLQVMAERFSSIGVPVFMADVKGDLAGMSQPGAGSPKLTER\n>MGYP003138151264 FL=1\nMAKAAATARPRRRERKNIAAGIAHVNSTFNNTIITITDAQGNSIAWSSAGAQGFKGSRKSTPYAAQVAGEVVGRAAMEHGMKTLEVEVKGPGSGRESALRALQSVGFTITAIRDVTPIPHNGCRPRKRRRV\n>MGYP003443083341 FL=0\nMGDTLLVRIDPRLIDPLMEQAEACGAAFADELCLVLLGLSTGARDSALERILGRLAHNMTLTLHGPAEFI\n>MGYP001435087364 FL=0\nIIESDIVKTFNGDMQASEPKYFDIEEILMKTYLPVWA\n>MGYP001431098935 FL=0\nMSHYNLILKNYKIDKTQNNNIKYSFNNIDQDSNSVSETFILSEGSNFLKNEIKGYKGSVEKINSQGDPVKKHAR\n>MGYP003304349197 FL=0\nGIRDPLWSRGLGDVYKRQVKYKAPNSWKWVKLN\n>MGYP001141817981 
FL=1\nITTIHGFAQRCLRRPALEAGMAPDLSLDTDPATLIAQVVHDYWQQQVLALPPDWLAALQRAALNPALLETLLGTLDGDPALALDPPPPELPPELPLPVGLPVLWQRLWDSFADAWRRDGRALQDELCEQAAEWRGLGVEDTGEYRPTFRKTNDRAAAIDGFVAAAGEQPPGYEAVLAIKPLTTYFHPGPFTKEARKAEGEDRPIRLPRPDLMEAVAALVDGPLEAVLAHACSWGRAELRRRRQRAGTLSYADLLAGLDPGAAATGPTPLLQAVGERYRVALIDEFQDTDPVQWRVLRLAFGGPDHLLVMVGDPKQAIYRFRGGD\n>MGYP000931218709 FL=0\nMRTVLAVAALGVALGTVSLGLRSALDGGVLPRLLGVLEGLGGAQLLAGAPGGASVTGDLRRGGEDGRGRRCGAVRLSRRRLQGLLGGGLGLFDGALMPAGHTAHRCDGLGLRRLCGDRRR\n>MGYP002812137160 FL=0\nVRNLPFSAVRPFVRGLPLLRSSERFGQFGYFNVRLQSRIDGSEIKSADLKIHQCNESLFPEFALHARQNPLWGLNVTLAAN\n>MGYP000364897687 FL=1\nMNSPFRIFLLARAVPALVAAAVITFSANHAVIVGQIVFIAYGFVLAPLFVWAAFSNSFTTIVRRSFLAIGLTSLAAAAAAALTIGQGLIAFTLTIGIWAAISGLLELFAGWSSTNKDQTREMLLLGALTAVLGLVEAVVPLNDVYAVGLFGAYAAIVAVFSAIAGFSGSSATPAPSSSAPSPRLPSGRPT\n>MGYP003364664002 FL=1\nMSIFNFFKKSSKNEPTTAPTAQTCESSVEMQSVAVPKASSDEQPVQPKIDTTGAKRVHNLIIVDESGSMSSIYQPALTGLNETLQTIREAQKEHENQEHIVWLVTFDTSHFKQIYANTPAEKAEDITREQYRPCGGTPLYDAMGKSINQLRQMATADDVVLVTVITDGYENASREYNGKAIKALVEEMKGKGWVFTYIGANQDVEAVAASMSIDNHLAFEEDAEGAKEMFARECRSRKKFFGKLNDNMPMCDISKDYFEEE\n>MGYP000037013818 FL=1\nMAHRIDERVVLVLRRDVGEARALQEALDGGVRRADARPLLLLAQVRLARGQSRDVQGEAKKMGRP\n>MGYP001133519274 FL=0\nMKTRYVVQRKPLIVGLAGLTMLAALAAPNAAWSPLATAAAQDSHGSSHSSGTHGSQNKGGQGQGKGKSSSGDASGSSSHGNSGSKSVESKVLHGSGDASAAADESSDRRGPKYGGGKASTGKPTGAGTKKGDLLGDLNVILRDANGIPILDQYGHVQPLDASGNLIPLTPEGDIVAGSEDLVVPVEFSRLSVSRSPSKVTDKAYDEAIAALNAATAITTDSSGRLVTTVDGVAKTIDSPLENLALYEALMNNGYLPGFVPKDGVSLGSLSFLVDKSATNSDMLQAASFLAAASDKAGSINEDMVVYTDSILGVTGATPLVGADGKDYVDFSNVTYDRSATYTGTVTYLKSNGDGTYSTVTAPIIDAVFGGTTYTGTQLDAFTQAADDARAVIEYVHDNPLPAQ\n>MGYP001272594557 FL=1\nMKFGRKKDTNYFELLNSMAECTSRAAEQLDEMLHNYTDVAAKAEAVHGTEHECDNYLHRLVRELNRAFITPIDREDLLQIGSMIDTITDAIEDVANSFEMLSIRKVEKPALDMSELIKAVCTALSKAVKEFEHFRSSKKLSEYVIEVNHLEEQADVLYRSTIKALYNNTHMTVLDVIKWKEIYDYMERIFDACEDVANLLEGTAIKNR\n>MGYP003517379434 
FL=0\nTLPLYLVRNYESGVNLSGSNATTTTTTTTTPAVCSGRCKWIWDLTNEIWELDSSNCSTATTTTTSTTTTAGSTTTTIALDCECVSGTTTTTNTSTSTTTTTTTASPCSCSYPAYCGTEDGECTYTNCVAGYVTTTLECTTTTSCDCNTTTTTPDCSSCANYICTPTGWVLVDDNCTGNCTAEEPSSDCNFGTSGSCSGLGGISVAGYGCSGECIYIYYDALDDWYFAYGNC\n>MGYP003652714744 FL=1\nMSVATSAGYDNLSGGKWNPSIYSQKVLKFFRRSSVAEAITNTDYSGEIENFGDTVKIIKEPTITVSSYTRGAVVNTQDLTDSEITLTVDQGNYFAFKVDDIEERQSHVNWESLSTSSGAFSLKKAFDYNVLKEINDSAVQGTAGTDTGAAGAAISCNTGNKAANVLARYSQQLDANDVPQENRWFVANSGFYELLKQADAKLMDASVTGESMSALMNGAVTSRQVHGFTLYQTNVIQTASVGSAAAFTFGPSATSGETTCLAGHISAVATASHIAKTEVIRDPDSFADIVRGLHVFGRKVLRGSGDGYKGVLQGVVDLNS\n>MGYP002630153343 FL=0\nHLTPVSSPLHSLPLQAWTMASLTDLLNEMLELVFLQLEDWQDLISLGSSSTALRQVFIQPRMWRELLEKTRIVQRGVGFEEVTESQVKKIMTFLKTVVGHEPLLEVLNDSICDQHQSIMWRRTIMKLGALRKMGAMRKMGAMRKLRAMRKIGATKKIGAMQWGEFGPQLWEELGQAAAR\n>MGYP002515195457 FL=1\nMGSLFLSVFCVFSTLHLISSWKNDRTRRAKTKPFLISSLALAYLVSAEVPSALLLAALVTSWLGDVLLIPRGNRWVILGGISFLGSHFLLMVLFLHHIHFAAIPWFRLLPVAAVYALLSVISIRSIWDNTPTLMLLSFGLYLLTNSCMNLLALMQLLTSRHPGAAVAYAGAVLFFLSDCILLLVRYHRNPDLVPKKHFPVMLCYLSGEFLITLGIFMMA\n>MGYP000652960749 FL=1\nMLNSFKNLSTVLKLRKQPASLKAARQFHDCGNFQMLYIASGITVTILLEHPQA\n>MGYP001560261255 FL=1\nMTPAPPTLLAGQGAQPGDIINAIAVQRNQLMDALAMAEANFAAFRRAHQGGGCGLDEVVPGERKVPDDAPA\n>MGYP001590704470 FL=0\nREAAAGFIPEGGTITLKALEVDSSLSGLRETWPASMPPVTLGLKLDDLSFRLKGFDEPFSGVGGTVSLKGDNITVENVSARYGKSVLKSADATLRGITGNTAYGISAEGTLDAGAGLSLARDITGGNTLPGQRGFPGPRPPAL\n>MGYP001590172643 FL=0\nAKSQREIASDSVKLNVLSCFDYSLQTEKTLLSVCDHTTTIVPITLVNSGSLSNIYDLSLKGPSWVGLDNNNILVNSGNQGKVNLIVSPDYGINGNFDLIVESKSKNGEIVKSSDIKVNVKGCNSVNVNIADDKIKMCGSLTNQYNVLVKNTGEVTNRFNLRTSGVDWVSLDKSLVELRGGEETNVILTIKPDKDVISGVYDVRIEAVNIEGNVKSDDTIKIEVVNMEKCYEPNLNISKKSVEIVIGDSVTIPILIENKGSNTADYNVGISGDAVNFVQVNPASITLEAGKSEIVYLYLAPSIQNRQGPYSLTVSVRYDSTTIIDSDTIEINVVEKQGVKITSEEKKEEKKEKGVFSLIWSYKWYILIALILLFVIVKVISTKGEEEYLDEIEELNKEKKIEKKEVKEKKLIEKPKEKKKEEKREEIIKEDVEERNYGFVKYIVGLVVLAALAYVIYRYNSYLGVYKWYILSAIALLIIVILIIRGFGGLIKFFEEDEEFEEVKEEKKIEKKEVKEKKLIEK\n>MGYP003651019918 
FL=0\nMEFMEFYFYISDITLPQQEYLRDRIERMNVHFNEEEGYVAYGRGMMEGIDRSLSHPLTRTPLSRDTTYLPGAPALPFTVRTIFNGSYTYDPESEWARNSSTILHAFNRDRFSLSLSLSLSLSLSLSLIC\n>MGYP003348846132 FL=0\nASTVTVEANATVDASATQNGNGGYISIWSAVKTAVAGILNATGGQFGGNGGVIETSSKGSLQLPNSLAVNTTAPNGKTGTWTLDPTAIIVDSADVAVVPVVCVTID\n>MGYP000962646007 FL=0\nGGCGGPAPGAAKDLRRVVRRDGNRRCHGGRGALEEPKGAVAIASLQEISDTSFERGLVCHRPGSGGVGGGRNQLVPQDPERAEVLDLLDGGDQVVQERRGHHGLQ\n>MGYP003955760495 FL=0\nMWAQERVLVTGGRGFLGRHIVDFLRQAGA\n>MGYP001189459322 FL=0\nMNKILLIIKREYLSRVRKKSFIIMTILGPVLMAGLILAPILLMDSSDEEKKEIWVCDENNLFEPQFEDINGTDYQFFKNDIIEVKERFNTSDGYALVHIPKFKNESIDVLESSVKVYVRKPMSFSNQNQISNNIESVIESIKLKEEGLTRDIIDRTRSNVNLNTIILGESGSEKTGSTEVSMGISMFGGFLIYIFIFLYGAMVMRGVMEEKTSRIVEIIISSV\n>MGYP000827854766 FL=0\nMDNNNLVNDLSGILDGLDSSQEQLEKDAFDVINSSDTSLNLVKESISSVEEILKMIDELNEVAEESATRIKELEKLSKDIEQFAGVISSISNRTNILSLNASIEAARAGEHGRGFAVVASEVRNLAAQSAKSSKEITDTITMVQQSVGKTVDSMKNIYENSNQQKEKADEIGNVLNKVVEAAYTCLLYTSDAADDMQC\n>MGYP003969404433 FL=1\nMPLPSKSTNMDNNNNQALRIHQSDNVYVALADLVPGKDILANGNKIHVSEPIPAKQKFSISGLKKGEVVRMYGVTVGEVIRNIPAGGLLSRSNIKHKSDGFVSTDSRYHWDEPDVSPWQGRTFKGFYRSNGSVGTANTWIFVPMVFCENKNIHVLRDSLNKSLGYEKTTIYQDYAKKLAEMVRNGASEEELADFEISKLKSSTPHVNRAFPNVDGIKFLTHNIGCGGTRQDSNSLCGLLAGYITHPNVAGATVLSLGCENAEVSILKDEVIKRDPEFDKPLLIYEQQKFGSEMDMITSAIRETIINLSVANECERKPAPLNKLLIGLECGASDGFSGISANPAIGACTDRLIALGGGAILSEFPELCGAEQSLVNRCITKEIGDRFIKLMRDYAARAEAVGSGFDMNPSPGNIRDGLITDAIKSTGAARKGGTSPIVDVLDYPEKVINTKGLNLLCTPGNDLESTTAMAGSGANLILFSTGLGTPTGNPVTPVIKVSTNDKLSNTLSEIIDFNTGSIITGNKTVDELGSELLNLCIDTASGDYITCTNKMSQDDFLPWKRGVSL\n>MGYP001828137919 FL=1\nMLPDKADIVVIGGGVIGASIAYHLSKQKVKVVLLEKSDPAGGSSGACGGTIFLQTKSPGIHLEMALASARRFVHLEEELGDGFEYQRNGGMIVIEHEEELQAVKRHVENQKKFGLDVSLLDRKQAREFEPSLSETILGATFSPMDAQVNPMLLTFAFIKAAKKNGAKFFSHTRVTGFRKTFNRINIVKTDQGEIETQMVVNAAGVHAAEIGALVDLEIPITPRRGQLVVTEAAESVIGRCMLSAQYIAAKFNPDQAQKSGGVSIEPTANRNFVIGSTREFVGFNKGITLEGIHHIAKHVFRIVPCLKKLQFIRVFSGLRPYTPDGLPILGKVTGLPGFIMAAGHEGDGIALAPITGRIIADLIVDNQTTFPLKEYNLERFSS\n>MGYP003643276008 
FL=0\nRGFKKIAKSPLGKMALMYFGGNLLQGNALFGNPLSGNLTNKLGSMFTGGGGGGGGGGFKGITEGFKNIAKSAFKPENAFATISGISGLSGLYTSYMNNKREDESMADYQRRLEEERGNFAPIPTDFVQFAANGGRMGFADGGDDDDDDESFRSKALGALYSMKRPQFSMGGGAGMPPVTMMSEGQDTQSFGDDESTGMVNATPTMPNQTPMRSPM\n>MGYP000011570578 FL=0\nNRFDAEIIIIVDKIFQSEVVDYALQLGITNAFIQEGDVAKESFIPDFDTTGV\n>MGYP002350897487 FL=0\nMQIDAIDRRILYRLQENGHLSNQ\n>MGYP001584058516 FL=0\nVLYSNKLTALPESLGQLAQLQSLNFSNNQLTALPSFIKQLVNLTVLNIGDNPFDKSIEIIGSLHQLKELYCFKINVPLPKTIGELKNLERLSIMQNKLELLPEFVCELSNLNWLWLFDNQLTELTSSISQLKNLKEISLHKNKLTDIPSSLVYLEHLEKLSLDDNPLNPALQSAYKQGLVALKAY\n>MGYP003693669217 FL=1\nMASPTVAANAYAALSRIMESGGAEKGGQSAGGPSFGALLKDAVGSVLDAGKKSDAQTMAMSSGKANVMDVVTAVAETDVAVSTLVSVRDRVIQSYEDIMKMPI\n>MGYP000343390212 FL=0\nMNIAIIAHDAKKELMVQFCIAYCRVLSQHSLVATGTTGKLVAEATGLP\n>MGYP001158220473 FL=0\nEMSELVQIKDHDQTSNHENEWAEKAKGKEVLMIMSELNYEVLEQLELMQKCLSEYDLYNNTDGKFCTIFMLNKDIGNESQLVSVGMAVGAEVEKVWETYSENNNPPEWVKSFAESYNRNMELLEKWNNLNAKLKKAYGY\n>MGYP000395984138 FL=0\nMKKEIAVTERPEIFTEQYLAAFGNMSWYDFVTAMPSLVFVVTGWKSNGKENACLHSWSSFAGSGADNFICILGKVNKDGHMYQSLKETKACVLNFPSNDIYDRCIKTIGNNQFETDEITASGLTAEAALKVNAPRIKECFL\n>MGYP001462322588 FL=0\nQATISSDARFGILSKSGADAKKMFTDKVVPISVNYPFFFKPIQDGMDRPKTELAYRVPASKLTRRKLESNEQLRELDGLDTTIDWKNTGDNSYDGEKLKLLAHDESGKWERPDNILNNWRVTKTTLRLGSRVVGKCMMGSTSNALNKGGDEFKKLYQDSDVTKRNGNGQTKSGLYSLFIPMEWNMEGFIDIYGMPVFTNPEKPVLGIDGEMIHQGAVDYWVAVIKPGAVLFEINGLEEERAYKVLKLASYKLPIKTKIISR\n>MGYP001101270620 FL=1\nMDRIIFHIDVNSAYLSWSALEKLHNGSCVDLRTIPAIIGGDMAKRHGVVLAKSIPAKAYGIVTGEPIVNARRKCPNLTLEPPDHKLYSRRSRELMTLLSDFSPDLEQVSVDECYMDFTPIRRQYPSPETAAHLIKERIETELGFTVNVGISDRKVLAKMASDFRKPNLVHTLYSYEIQEKMWPLPLSSLFMCGHSSVETLRNLEILTIGDLARTDRAIVESHLKSHGTLLWEYANGIDASEVATVQADAKGIGNSTTLTKDAEDKETAHLVLLSLAESVSRRLRSSGQSAGMVSTEIKYNNFRKVSHQTTLLSPTGQTDAIHQTACALFDEIWDGTPVRLLGIRSSKLVSNEDPVQLSLFDLQTADAGTAADDSFAPAYTRSPRRQPSTKKKEQLDAALDSIRKRYGADAVVRGSLLSDSKKPKYD\n>MGYP001545760421 FL=0\nMKRRVAALYGLAIRNAALSQNPMLSTAARPLPHSALQRVQRSGSWQIGLDFDKTALSKAAAESRVLHIELDVVTRVA\n>MGYP000446957473 
FL=0\nEIQCVTGVQTCALPISGGDGIYLVGVGVGDTGYNDELMDTVTDAGKGASVFIHEPAEAWKVFNQNFVNTMAIAARDVQVQLDMPPGFDIVKFSGEEYSGDPTEVEPQHIAPNDAMVFHQVIETCAPESVDGSAEITVTARYRDAWTFLPKEVSHTYTFDELSAQTTPLMYKGAAILAFAEMIDAWDQLST\n>MGYP000532152884 FL=0\nLDVMDGHFVDNISFGPAFVEATAAVATRPIDVHLMIERPDHYVPRFLKSATNITVHVEAKHNVNKTLRAIREAGKSCGLALNPATPVEAAVPYLDLIDLLLVMTVVPGFGGQPFMPETMEKVRHAHAARQIKACAISCQRFMIAAAHMIGAQARPKRQCAQSQPTAKPRFGANEISERRYFSICASRL\n>MGYP001076569615 FL=1\nMDDRLTGKLIQMIGELTGKEMKRFEDFVDSPFYNKKEKLQKLSRFIAKYHPNFQHRNFTKQA\n>MGYP001614764691 FL=1\nMRGLRAGVYTNGPWGRLRGMSSAMGQMTDVKDRDELFLEG\n>MGYP000090456593 FL=0\nMCDDFSSPFQQISSYTLTIEPYLNTYSKQYENIIVIDKMPLGPLSQLVSHFNAPRLSPFAKQTNSCCKYAIRRHYNNTLRRENCFLTADDVPSLLSYLSANGYTINSEITKIVQKTNYNKKNFVCVFYYTV\n>MGYP002742331534 FL=0\nYFVCDMYPLLELVCTDTYFIGLTVFVNGGTICIVVFTLLLISYGVILNSLKTYSQEGRHKALSTCSSHVTVVILFFASCIFIYVRPVSNFPTEHFMFNP\n>MGYP002712581081 FL=1\nMATLASAARPDDAARVLSEAIARIARFWSLSNAQAGAILGLSAPTVSRLRAGNWRLEPGSKPFELAQHLLRLFRSLDSWLGQDDAAARSWLATPNLDLGAAPIALIASVRGLLRTADYVDALRART\n>MGYP000897634123 FL=0\nMDDVGPEAQLGSGRPVAVSGEEEIGIDGDRRGDHQGVGKFHRPVGGTDERSGPRDVVVDGVHPNGEPLEPSVDRSDAPWPAL\n>MGYP003681647399 FL=0\nMYPLDTIHFKKPETVLALAKSLELTGNAFTFARLRLETNIETNRVMRSSITWDSMSEAPSQGKASAP\n>MGYP003287676207 FL=0\nMLAGLAKFAYDVVLDNLSESAVLAAHHFGRANSIFEMLSDRYRAARAKFLLGRAYSAAQPERAAEHEPAADGPADGSEAIRWTSPDWPTSPTKPKPSCGCGVCDPAETLMNIGSFICS\n>MGYP001816890121 FL=1\nMSDGRPPFHLAFPVNDLEQARHFYAEVLGCPVGRESDRWIDFDFFGHQITAHLSEPGDAGSANLVDGDAVPVRHFGAVLPWARWRDLADRLAGQDLEFLIEPKIRFKGQAGEQGTFFVRDPAGNALEFKSFRDPARLFARA\n>MGYP003627722903 FL=0\nMDIFKTLILDTPDTLSNISGILPVSNGGTGADNAPDARVNLLPSYTGNANKVLSLNGGATDVEWTSNGAGDVVGPASATDNAVVRYDGTTGKLVQNSGVAIDDSGNVNLADNSSLNWSTAPGRPYIVGNKASDLIKLGTPTGGDLLNLVGSNVGIGSTAPAKNLAISSNANSQTTA\n>MGYP001002779910 
FL=1\nMTAPSAPPHPGNTVPDAPYDARPASASTNRLKLGIDFGTTNSVVVLAHPDGKTETLRFRFPEHAESDTCRTLLCFWQDEVGSRIIQQEAIGAAAIDAYLEDPAESRMIMSMKSYLAQKSFRETQVFSRRLTLEMLIARFLSNLMQAVAIDPASVDVTVGRPVEFAGDFPDDALGAQRLRDSFTAAGFPSVELAWEPEAAGWRFAQRLENPTTILVGDFGGGTSDFSVLRFDPARPGHAEPLGHSGVGIAGDQFDYRILNTVIAPLLGRDCTYRVMGGEPLPVPIEWYASLGRWHRLALMRTPQTLRAMEDVARTVSEPQKLRALIDLVQDQQGQALYRAVGAAKNALSSADSTVLRFQHRSFKVEQTITRAEFESWIAPDLAQFDSAVDQALTHAGLTAADVDRVFLTGGTSFVPAVRNLFIRRFGTERVDTGGEFVSVAEGLALMSGKAAHAA\n>MGYP000271019841 FL=1\nGTAADARSPVHRATLGDPRGGDRIRRPDSRGHRRASSLAPHGRLGRIPLRPDDVRGVAGRGRLRGADARGTRRGRRLADRAGAVRLSGRDAEDLGVPARWNPRRVRRASTEHESGDLLGSTSGRDRRTRPRRGSTRHREACASDVLRDRLPKTPRRAPAKARLRLVRSPPALGRSTPAGPIHGLRRRPAAARRRGRRRERQLLIGTREAAAQTRSRGSSRGINALRAARRVAPSARPEVHRLAQERRQAVRGGHAVEPAEPPCAVRLVTERGEDAHG\n>MGYP000735556993 FL=0\nMKKNILYVLLIFIFIACDLTKEDKKNTVRGDIVSIPITEMETDYGKLSDFAEDIKMIPLEFKDECILGEIRKVVMSDSYIFIMERNNPKGVYVFDHMGKYLYKIGNRGQEPEEFVDLSDFSLNEEERVVYLYDLMRTKVLTFSYEGDFIKDIPMNYYADN\n>MGYP003340149605 FL=1\nMGPNIANAIIIYLSGRVIDELINESNTKVEQGDFKLLDILHHFTSGMKSISTDMMYRGTDELRSSCGGAGFHVASGLVTGFTDHAPLATFEGVNTLMTQQSSRYLIKQVKKAKSGKTCKDYFEYINHLSKLVSSKSEAKTLEDC\n>MGYP003571959109 FL=0\nGADSRVAFTENNSQTIGDYGTESHGSIDQKDGQPGCLLQAKSEETLGRKATGPFSMKKG\n>MGYP003329312794 FL=0\nRRGAETSGDIDIIINDQPTFDQFIKDLVDKNIIVEMLTDGKTKKLTVAQLPGKTPRRIDFLYSPPDEYAFAILYFTGSKEFNTSVRERSLKLGFSINEHGFSKMEGKKKGDKLNQEFKSEKDTIDFLKIKYREPSQRNSDNLEEIIEISQPKSDNSPKKTTRKKRDSNKKNKILEKIEELLL\n>MGYP003570303464 FL=0\nFLICQTFHFXLXKKHTTAXSTLCQIFTTQEKPRALLELFLKMLSKFLIFKVKKKLDAAALTLFKNIQIRLFQQEPVQYILEQAD\n>MGYP003863973903 FL=0\nMRLCLSPRRPYRHRRQARVDGLHSVIVKAEPIDIYRMLRLHNPSPYMYLFQFSDGISVVGSSPEALVKVNQKEVMVHPIAGTRKRSASPEIDKKLAEELLADPKERAEHLMLVDLGRNDLGRICTAGTVEVVDFMHIERYSHVMHIVSTVIGELNDGVSVVQALSAVFPAGTLSGAPKPRAMEIIEELEPTRRGLYGGIVGYI\n>MGYP000597221545 FL=1\nDQVADARLDHHRRVHAGKLRERQLAAHHLGILLVAARCAGRGDIVLAVDRRQTVGVLRNADHEARIGTEGFANDTGGGRQGLAQRLGPAILDFVPGDDRHRALGFKDRRAGLGARGCALGNIAFHRRGRIALPRDDDLVQFRRCGLLGDSSGMKGKETGSGEKGYPGVHGPSNKTKEIHD\n>MGYP001178354147 
FL=0\nMEIMQDDLHKVEYRVWFSDSHRTLYLDTYMVWERKSKRHGWVVKASYHRLYDRYSTLTLAEVPFGDDIREMVKKEFMDSVTVKVWEDRK\n>MGYP003521894557 FL=0\nDYHPVTEVLMALRQRPFDKAPAFDLDDIWKKYRWQLATVGVLITLVLLLAASLDRYNRRLRQLKVRAEEGDNRRTIRMSATPCSSCTKQRPKP\n>MGYP000829874590 FL=1\nMFEMKIHTVRKYGLTINDEDVYFSSKGKAIEAGKISIKLNPNTKLFEEYKLCLLYTSDA\n>MGYP002763718406 FL=0\nMFTADAHYKRCGYPFFCKYLCPQGVLEGAIPLSAVDSGIRAALGTLFSWKLGILIAVIVLSVLFYRPFCKWLCPLGAFYALLNKVS\n>MGYP003059114969 FL=0\nMPDRIPVAEKDFMFSAITEEFGLIFSIALLLVCLNNLILMMNIASRCKTLFYRLVAVVAFAQITPHFGNGPVLANLND\n>MGYP000926614758 FL=0\nPNWVPSIWGVLETDPATLAQPRAAALRTKARTMVVASEASGKLVELDTMLSDLRHKADAMSLSLSDGSLRQQRSRLNSLRDQAAVQEAAVFDTSGHVIAFTSDEKDALAPVLPSSEVLRDIRMQRSSSRIRVAVIEPRFSPRSPARCSKCALAGAACARRSQARWALPARLASTRR\n>MGYP000302371285 FL=1\nMAKMAPGNAVHGDAYKYDLMGEYQMLADVAFKLSVNNLTDKHYADMLYRGHYIAGKPRTLQLTATAKF\n>MGYP001304573571 FL=0\nLLNEIPFPKNLKNVPTIASNHHEKLDGSGYPFGKQEKDLSIQSRILGFSDIFEALTAPDRPYKRANTLRESLDIMYDMCNKGKIDKEIFKVFLNKKLYKKYAKKHIHKNQIDGIDINQYSFS\n>MGYP001161862952 FL=0\nMKERGISSSLWKQSSMLIETFTENHTIECAVDNIAYCSCHNCTDSQNQSSGCFFTDKGRKEPSYTENCYNSEDTKNEFPGFAPHFHPEGHPVIFYEMQNTPVTKQVNFLPDLHMGFDPYLQNLIRQ\n>MGYP001557844164 FL=0\nKTNLFVFFNRIGLKDEGSYYLAELEDLGKDLKIRHN\n>MGYP000311311414 FL=0\nLVMFFIFSLSLSFSFYCVFSLIH\n>MGYP003155641669 FL=0\nMIWSNRFQEILADLDRPYAPMFRLQIGTTAITYHMSETERISGHKVLEILSHPGTASYPDLSAPNPQLEGQGNFSNGYTSGPYKYVVGLTSRISMGAQSVSPRSFKYTGASLQVDVSRKAFSLATKIYVGAMAVLQVCLDDPDDPT\n>MGYP000405580788 FL=0\nAAQANLQAAKQDANRLQAERSAAVQQRQNTRLIAPADAVVISRDAESGSTVVAGQAVLRLANPLSLWVKLRVDQARSAGLATGLPAQIVLRSRPQQLLSGKVERVELQADAVTEERIAQVAFEQIPAALSIGEMAEVTLKLQPADQDLDADFGGGDRIGDALGRAVARKGRRQRLARRQKHLPEPT\n>MGYP000037092074 FL=1\nMINLKLIATNILSNENKLVYEIIYDAAGTRYSYLDGELDGGDGPAVEKTNGDKEWYINGELNREDGPAIEHANGDKYWYVNDKLHREDGPAVEYANGRDVWYLDGHKIKHDSKTWSQLVKDSEMEREIGRVMDA\n>MGYP001501362630 
FL=0\nQAFIQHGNTAGESGFSSVDTTSVAAGVGGEIAFHGKYNTGAQDYAYYGHIRGIKENATNGNTACALTFHTRPNATAPIERLRIDSSGRLIVGGGTHAGGSALVVKGGNQNNYSTIGMFSNHTNPANNTLLTQIRFGANASAVGADIRVYADADWGTNDYPTRMEFHTTPDGSNSKQVRLKIEKDGRVNVLGPKLKLPTGTSNPGSSVAGDSYYNTSDGTFKIYDGSIWGSVVVAAKGTQQNPAANSTELAATGALAQYYFKPNTGDTAFQQYACGGLSNLGTIPSGGPSWVNSHSSLIIIEKGQVGATSTMKMSQANYGKFIKESITRNSGTTPYVYWAVFDGGTLWGIWRIRWTGATYSTWFSNHNYSEGVNTAPSGTPSSDVWKTGSGTTGNALATGTYTISNNTSLNRAVLPEQDYNSAGSWGIHYKRLGSGEHYPWRNSAGNYTSNGYFEPSTSYSMGTDTRYIHYVYLADN\n>MGYP001058876537 FL=0\nKSISTSRISSAKEKEKLEEESLKSTSQLLPVIDDIIIKEDPRKFLKNIVQFDKGSTCTIYTAEYNGEEIIVKEMIIDKDNEQPLLEETRLMASMDSQYIVKFIAAYRVDDHLWILMEYMDGGSLTNIATLCDCQEEHIAYFAREILHALDYMHKQHKIHRDIKTDNVLLKKNGEVKLADFGFTAQLDKKRPVRKSIVGTPYWMA\n>MGYP000564650396 FL=0\nLTVSSTKLDALKKDFDNWAHVSESADFPQQ\n>MGYP000266732317 FL=1\nMAQILFYTLTVLIWGSTWLAITFQLGRVDPETVGISPERLEFLTRTFQDYVDNGQLPGAVVLVARGSQVAYLALLLPLPDGQPHGSRLRQRLDYQHPGHYRFLREVPLEERLVVGDVLDALEGVPLLGDEGVDHEERVTVRKYGACLLYTSDAADE\n>MGYP000394770065 FL=0\nPWLKELAGIRHEFEARMAQLLPDSADALAAFLAEYDLGPATAFEGILQGIENTNYRLETPAGRFVLTLFERRAAAHDLPYFVALMAHLAGAGFPAPKPIPRRDGATIGEIAGKPAAIVEKLSNYALVALEFSSFAPDSASAMMARLALGVAGQKVVDLEAVLVTMLKQAAGEHIGHPEVLGDILRKATRKR\n>MGYP003657985056 FL=0\nGVVIASYRPTLAAEEATGGNTIATLGNYTVHTFTSSGTFTIPADKRVPIQYLVIAGGGAGADGGGGGGAGGYRNSTIGELTGGGGSAEATLASAAGSYTVTVGAGGAGTSSDGNNGANSAFGSITATGGGGGGGGGRVGLAGGSGGGGGYFTKSGGSASSPTQGFNGGTGGGAGGGCAASPHNGGGGGGASAVGTNTAGSTDGSGGDGLSSSITGTSVQRAGGG\n>MGYP000700515465 FL=0\nSSDVCSSDLGFADQGADRASLVAKGQHGPAYHEADHRHTQGGHTQKTQKRTECFADGNGQRMNDGAEAPDHDRPGISFFGTEFIDDTSGEQHADGITELEYRCDIGIIAVRPPEFFSKVGLQQAQYLPVEVIDRGGKKQQGADRPAVFADCFPIHMKHFIFCRPG\n>MGYP001095249562 FL=0\nKSLLDITKCEEGASLQFKQTDLRDFIRNIIEESAICVLGKQLNLIENVQDIPNFIPIDETALKRAIMNIMMNAIEYSPTKGDLMFSVEMISEKLQFIVEDSGRGFTEEEMHSATEQFYRGDKSRNSKDHHGMGLYIAKSFAKQHGGNLYLSNSEKLHGAKVVLEISA\n>MGYP000020363101 FL=0\nLLKQLKPTSVQQLAATLAIIRPAKRHLANQSWEKILKEVWVKPTNNEYFFKKAHAFAYAMSVIVHINLLCEKIKS\n>MGYP000387930855 
FL=0\nMTIDEKLQHFYEVSVEEAKEDAAKAIQEHRESLSQMLEDHKAARRQSAEAEVKAEAEHVRREINKALAAEQITLKRGWSRKQEELKETLFVEVQEKLADYMATQEYQQLLISQIREILKFAGNEEVTIYIDPADQSCLSGLTAAVNHPLTVSEYSFSGGTRAVIPGRHILIDNSFA\n>MGYP003117850129 FL=1\nMADTNGFWTTAGARDPKRGFRFRVSFAGGTNSVLNGIAWYAKKATKPSVSFSEASHQYLNHTYYWPARTEWNEVDITFVDPVEPDLCDGLTSLIESVGYVVPAGGAFAPADFSTVSKSRSVAALGNVQVEQIDEDGAPLETWTLNNGWVKELTFGDLDYGSDDLTEVTMKIRYDWASVQIRNAVTKKFSLRT\n>MGYP001108639497 FL=1\nMKRFALIGAAGYIAPRHLKAIKEVGGELVAAYDPSDSVGHMDAYFPKAAFFTEFERFDRHLNKLQEAGTPVEYISICSPNYLHDSHIRYALRNGAHCICEKPLTLRPWNIQGLTNTAQATGNKVFTILQLRLHEQVIALKERVEQKWLKEPDHVFEVDLTYITSRGNWYYASWKGDEEKSGGIATNIGVHFFDMLQWIFGPLTSQKVYLRTHDRASGMLSFERANIKWFLSINESTLPETATNEGKRTFRTLSFDDWSFDFTEGFTELHTQSYQHILDQGGFDEKAAENAISIVHQMRETALTPLDDQAHPFAHLPLEEHPFYPKR\n>MGYP001328585271 FL=1\nMRHVIDARESGSQDYKCWFFISVVNRLTVRMSYPYVTHNNNVTKEQSGFAQNRIQVVRHKVDLMFDRRRQRPSTVPLL\n>MGYP001616298175 FL=0\nMAKQFKTNVVVLGAGPGGYTAAFRAADLGLNV\n>MGYP000014566423 FL=0\nDKSFPKVSIIIPVKNEEETITELLDSIFELDYPKDKMEVIIVDGKSTDKTVEKASKYPVKILFEEGKSPNNARRIGIQHASGDIYIFTDGDCVVPKDWIRRIIDDINEEEIGCVGGSVFVEKSLQDNLLAAYSDHSIMRVMPLVEEKEEISEVRVFKHLAFCNMAIKKRALERTGGLDPTLKTFEDVDVVTSICKIGYKVLRDPKVYVWHKHRHTIREIIRQTYNYGRGGPKFRRKHPDTPIARFYTFGLTIFTAYFFILILSSLSGIILSNIRPI\n>MGYP003409085276 FL=0\nMAIESTLYGDRKVFTVAAFNSGVATWLRRLPELWVEGEVTELRRNEAWANVFFTLKDPASGSCLAATMPRRRFDALE\n>MGYP001804777217 FL=0\nMLVLHPSCEINLLISLIQVLSSTVNAVFHPIVTTSRELLVNIMLCWFLLESYISGAVKRH\n>MGYP000216902384 FL=0\nVPADQAGMVVDGDAAAADGDAIPSDFIQGTFKPSETTVQAQDSYEYPFLGLTMKLPEELLKQIKEQTIAMITNEGWNDNADAIKYAYISWSEMTEEQKEAEVDKLGTAYDDWYNSSVEEILYEDPDGIGDMIQAVCKLIHSCVDAGEYKEAFRTGRRLFMQEILTDDEYMTGPLEVEDFICCNELDIDLKKIALDTLYACYQVKKEAERADIMYEIWSNSGIHDLKLEDVMQHGD\n>MGYP003292492700 
FL=1\nMNKKISLVTLGLSLSSILILTGAMIISQPKYTLKNIVGKQSSLGDVVVYSQSKRGIYSNDSVILSKDKYQFNKNVNQNPDLYKYSKNFNKNRDIFPGYIHDTGSIYSDENSIGYIEYIDEQYGETDITLSTTIKDKNLDTGEFTQFKIEIPNSLKSENNNNHKGLVTKYNGEVYIALLGEQENNPDIKMGEKDELENFVEISKVNFNSKEAKSVNNINLKIDDKSKYRIVYHNPFVIDNKIYFYLENQDKLENSYYLAYYDMENNKFDYIDNKINLEFPLESYQQDIEGEKLNLLADIDNKNKVDLRISTIDLTTGKVITNNEEYSIKKLNKEMGIDGFRIIDNKIYILASALKSYYDVRDYTENIIVLDKTSKSTLYIGEYKQGNEFKANSYILKKDEL\n>MGYP001325456118 FL=1\nMNVAVFSDKFSGTLTAKEALSIIKDVFQASSINAEFFSVTDGGEDSSKIFKEYGFKQFEAFRSYNCDGTEVEVESLNINGLKYFETAQLIGINSIKDSLEINSASLFKVLQKVNILGTGGSKTVDFGVGLLSKLGIDFLSNGERINNPTPKDFPLINSVSTKEFDPDINLKVLADTTIPLLGQNSAYDVFGPQKGLKQEFIKQHQIETERLIELLAKELSLELNPYEQLSGAAGGLSFCLHQILGCEISSGSKYFMETTNLAEKVKEYEIGVFCEGKFDESSFEGKIIGELLKNFNGNSYFLGGQYKAESKKLFTNIFECGEAGLNDPKGTLKIATNNLIKELT\n>MGYP000616556949 FL=1\nKPTEEAIFYAACKKAKLLMYMKKMKIINTQNLLRLCYVLQELKHQKQEFIR\n>MGYP000530409509 FL=1\nSPPVNSEAQEDAAGISKDATIEALQKTADSNVLIQEYSNTTQEKTTETVDVLKEILELMKKMSADNQSGTAGGDGGDGGGMDIDLPDRRRGPRRSRGRLRARARMASRGIRGRVGGLARGLVSGARTVGSAILSGGARTLGMLGLGTAGATGAAGLGTAGATGLAATGATGAAAGGGCGHAAGPQQHRP\n>MGYP000350425517 FL=0\nHRPEDFLAVDPHGGRHVVEQARADEVALLVTGHLEAATVDDELRAFRDAQSWRRLEVGAAWIEAQEEWRGARFYPDANSTLRVTYGTVRGYRPTPDAPNGGRRLATDRARPGRSRPG\n>MGYP003641307857 FL=0\nGGTWQXSGHAHSAYPLQDXSLSPVDKALSFAGLLWKKLIMSSAKRTRSRSIWMLRWLPCMSRVSHGESFGQTCTRETGAAIWYPAKPALSPFDRLTAASYLRAHPFAFKRDALLLRQHNSVQSANGHGSSLTDRNDRETDISLFSQLLGRRCATVFSLHSAIFFVNY\n>MGYP002623368859 FL=0\nIKFPKVTIPVKPGRNIAMIVEVAAKNMRQKRLGYNAAEELNKRVLKSIEERKASKTLG\n>MGYP001326310147 
FL=0\nSQADLGKTQYGSAPSPNKLMDAYHSMYQDQKEQTLDEEGRNIFGSTPQLDKVEKIKKYKENADRVLRNKKPESGNDNTKNLNNSVDLLAAYRAVYEHHKKDEDGNTIPHEDDVKEGKIPAGLQAYLDKKKGKKKDDDDNGNDEKESKKKAKKDVKEGYDLVYNHFISEGFSEEETYERMSNLTEEQLDEFLKALAQAGMRGAESIGKKTQGLAARAAQQGAMTDPKFRKLEKVQGPRPNRADQVLDDLRTRRKQQSDNLRGRLDTAVTQLRSKEGLKFGGSQSSTLKSTPTPTSSTSKSTATQTSSGNTTIKPQQKKNNNLLSTDNLVKAQVVGSMLSGGGNQQKKKTGQVSSVQGPSQAGALSSIRRSRGQVMQDSFDLISNELIKEGYSEKETYKIMSNLTEDQIEELNEAIVSGTLATLGVLGKLLGGGVAKAAAVGKGLATAAKGGAMAVKGAAKGAMSAAKTTMTGTKDLANKALTKVQSIAKPPSKGPKITSSGGDIVQGSDQAKNKILSTDNMMKAQMASSMLSGGGGQKKEKTATVSASADLFDIVKGQLLDEGLSEEEIKDIMLTLTPEEILNEMGAKFPAGKGAKYRETPKPNPQKRLGDRTDGTAGSYVEKPQKPQK\n>MGYP001574869672 FL=0\nMNTPTESAAQESELLKGIVTEAMRRARHFRAVVGSDYDFAYKELETFLYGILRGAPQPPITKDAKPTNGHAADNENAIPPGAYRDGYAAG\n>MGYP001569408988 FL=1\nMTRKKEEFKSIVKGKVGMYTCGPTVYWYQHIGNLRTYLFSDFLKRVLLYNTYKVNQIINITDVGHLTSDADEGEDKMEKAALKEGKRAQDIAKHYFDVFHVDLHKLNILEPLNWTKATDHIPEQVTLIEQLEKKGFTYKTDDGIYFDTSKLEDYGILAGIQKDQIKAGKRVDIGGKKHTTDFALWKFSGEVGKRQQEWDSPWGVGFPGWHIECSAMSMKYLGKTFDIHVGGEDHRQIHHPNEIAQSEAATGKKFVHYWLHGAFLLDKEGKKVSKSTGGLYTLSELEEQGYAPMHYRYFCLQTHYRKPLQFSFENLDSAKNAFERLKRKVFELKATEHTGRDKTKEYEKEFHSAINNDLNIPEALQVFLKMLDDSAFDTCKRIALLEKFDTVLGLGVVEFKEEKFTVPQDIQELIDAREVLRKEKKWAESDILRQRILEKGFRVIDMPQGSKAEKI\n>MGYP000341628933 FL=0\nQRGPKIASAKINDTGKKKSYRKSTIHQAEKKEKEPSKFKRNIRESNTSIKTKNTNLHIAGRTGALAAGAVTEQVEGGQEVSQAAYLAYEVSRPVTGTASRGASLFRRKAAAEAKRRIKKVETGKKLAKKMGKKAASDTAKKVAGDTTKTAAKETAKNTAKETAKNTAKETAKNTAKETAKTTAKAATTAAGTAVAPGAGIAVGMAAGYAT\n>MGYP001115643208 FL=1\nMCSRKKWPNSSGSFVLSLFFPMDGKWWLTFHIVGLGTASFEIHDQHGLQKIIYEEVCWKWCFSLLLEANRLVYIGYRLAS\n>MGYP001336892370 FL=0\nSKLGIKALFKILFAENDVVVSYPGDRMIIPSKSTWAETQILRVLPIPEVFCPVGSRILPPDKFINSKLTYFKENFDKEDEILSESICEYAFSFPFEGETQFELVLQKDSLLGEILPTAKSILTLALEDDDRTITMETTLGFPSSGVVYIENEAIFYTSKSLNQLFDCKRGYNGVAVNHPNGSRVF\n>MGYP003760760195 
FL=0\nARIPAELVVLEVGLGGRLDATNIIDRPAACAIASISLDHREMLGDTLAAIAFEKAGIIKPGIPVATGAQPAEALEVIAARAAALGAPLLARGADWHVAPTATGFTWRDASAKLDLPRPSLPGIHQLDNAGIAIAAIRASGLAVADAAIAQGIARAQWPARMQRLTGHLAALL\n>MGYP001290313395 FL=1\nFRSALARFKDAEAFILLNRWSIKYFHSDGPIMPYVLFQVWSFIAPGLYEKEKKLAMPLFISSVLLFYLGIAFCYYIVFPLVFGFFTSVAPVGISVTPDINSYLNFILKLFFAFGLAFEIPVATVILVRTGITSHSALAKKRPYIIVCCFIFGMLLTPPDVISQSLLAIPTWLLFEFGLILSRFISVKS\n>MGYP001572697057 FL=0\nADEVNFPSLPGGIGQKLILRTAFSPPVTINLAATSPEGQRGGDSQGGAATAVMNALKPSIEEPATGLRIEPWGSPGDWRIPLGILLALAAFGVYALARG\n>MGYP000217052795 FL=0\nTLFRSFFNDPCDLLLSLSLAPIMSFDEDYLVVSLNELSYEDESLPNNTLKISDVAELIPLTEIAFSGYDRKFSTGMIWTHPSKYQFDDTFLDFSKLQIRKDAEKNFNFLNEVYNFNEVERHINEDIKKEIIEASICKRLLKKSDLNIKGNEFPHVYCSLMIYEQGSHLSRESAMGFLMHAVGVYILHKGYGSQLTSKIELNNST\n>MGYP000907485586 FL=0\nMLRWQFVLVGVVALTLSACKKNEQPTAMPAE\n>MGYP000122865995 FL=0\nMEGVGRGMGFITSLESYSILTRLNQHHKSELFLTSLNHMSESFPISLIQHKFASSTPIWNDALANLKRLRIAYLRLIYPVLSLAGQFV\n>MGYP001557166919 FL=0\nTPLEHTIPADSLLPVELCWRVLAEVEKDYSIMVQVIGPENSLISNRRTFPGLGRYPTSTWQPGAAWCDLIHLLVADKGIPKTLVYKIEVGMLYPELDDRISIYGTAGDQIETFAADVLITQDADESVSLLDTDEIMTLLDYQVEPVWRPGQANQFVLTWAVSSPISEDYQLYVHLRDT\n>MGYP000281517610 FL=0\nMREHRRLGAASLAVGATLLLSGCIGAGPSVVVGSEVNIGSTVSFTSMNPQSQSGRTDTNIAVAAATGARFFNFDETAAVVFDPSFGSVTKLSGDPLVVRYTVADGVRWSDGVAVDGADLLLNWAALSGVLNDPRLSRADVFEENTDGDGEEFRADLPTDAVYFDTGVNPARPRGIQLARAIPQLSDDRKSITMTYSAPFADWAIAMPSAGLPAHVVAGEGLDVEGSNQAKDAVIAAVLEGDTAALGPLSRFWNTGFNVADTAIDGTSSLLVSNGPYLISDIVAEQFVTLSPNPNYVGAHRPEFETVTFRYFSDPLAAIQGLSIGAIQVATPPLTASVVSALGALQLDTQAGYSARWEHLDLRVTESKSGVFDNPLVREAFLKIVPRQLIAGMLTEDADAPAGPRDSFLFQPGQDGYTSASRANGDYLLASPGGATAAVALLAEAGVTAPEVCILYPSDDPLRAREFLAIQGAAAPAGFVVTDCSSADWQDRLGAAGEYDAALFSWELATPGISDLEQIFATEGFENLTGYSNPELDALFSEITASTSVPERRALRLKADALIFSDHYGLPLFNYPRVTLFDEDEVSGILPSPTASGPYWNIWAWKPVLPG\n>MGYP000572280030 FL=1\nMKDKDLLKLLLKNGWKDVPVGLLNAILKRTGLK\n>MGYP000287529352 FL=1\nTMEKALKIEKYREIREKKERTSQDLEGSPKVP\n>MGYP000977872181 FL=0\nMMTKNPGQDEIHMIATNRRARHDYTIENSLEAGLVLQGTEVKSLRE\n>MGYP003566039669 
FL=0\nERQLAEAVMKLKPTTSIQEKLWSRITADVDLMSDYRLIRLDNALAEPPVYVFVIIIGFILTMSCFGVYQPQAPLVGLVVLYTVFIGLVRFLLLTLSDPFHGIGVQPTSFELKYALP\n>MGYP003578873141 FL=0\nEGHLRAQLRRAAEFEEDVEVTSEMTHAKENVFALRVKGTSMIDALVNEYRTCRPDLVLTHSTDDPYNPDHPTAHQISLQARVYAQAEGYPASGRPIGAPPVFMFEPHQPERCGFMPDVLLDITAVWEQKRKAMESMEAQRHLVDYYSDLGRRRGTQAVRNSGRKGITVLTGEVGTGKTTLLRAALEPMKSTAVRYAHLSNPTLTRSEFYEFL\n>MGYP003526032744 FL=0\nMRLSLRWQEALLLVSGYTLLALQPSWMPNVGLFALHGLLVLLLGWMAGQRLFGSGYTAFERFGGGVLTWASSLSLVHTAAYYASIPLTTLNTTLLEAVIAAVVFAIPPLPETSPTNAPVAPVALHQRFLGLLAGAVGIGSAAFLFRAALLHPATVSIRTPWPLLPNGVFLFFALCFASGLVAAHVTRSVQTTWLAAVSWFTISALPALLYPLGYGFDGFIHRASQELLLRTGTLTPKPLYYIGQYVWTVWLSRWTELPLTIIDTWLVPASIGVVIFAFVGLLRRSSPSLRWAPWPLLLLLPLGAFVTTTPQTWSYLLGFSALLIALWPGLQGRAWIFPLLISLWAGLVHPLGGLPFASIVWALGIGALPIFKRYAVPVRIIGFIGALLLIPLAFWAQSRLGNTPIRWSWDWLRWEVLRTSFADLLLAPRQTLTLWLDGAEWARTAVSLGGILVGAWLCLRPK\n>MGYP001228241971 FL=0\nINLSLKETGSMKIELIIDAIAVLFLAIGGSLYFSYSKSRIKGLQIWTPISKRLILNFLVPLATGGLFIIILYVQNQWQLIVPSMLIFYGLAIINAGKFTYSEVFYLGLAEILTGLISAISPEHAIFFWSFGFGLLHIAYGLFMYRKYEV\n>MGYP003467506258 FL=0\nEHVFDDEHALRPAEPAERGLRRLVRLRDPSLRHEIRDPVGVVDVAERTPHDRLREVEAPTAVGGERRREREDVADSAVRIGRKIIELLGARDENGYVFRVDMRLRPSPEVTPIAIPVEAAISYYESSALAWEQAAFIRARAAAGDKALGDYFLKSIQPFVWRRSLDFGQLANIRKMSGQIRDHYHKGQVLGPGYDLKRGRGGIRECEFFAQAHQLIHGGRDPGLRMADTRTALAALA\n>MGYP000492251796 FL=0\nDMTGSASVALPQITAGAITSTGLNSTTGTVQYTDGGSAFDSSDADGYPRFTVTNGSAQLGLFRAGSSVGGSYIGADDSKLLRVYNTSFASKFDIDTSGNVTALGTISSGALATTGNSTHGGYSSWTAGNGTSGIFQHYNSSNSYRGYFDWRTLQLGNNGANNILAGNSSTGGYFKFWVNATGISQTGGTSGINALTISAAGNSTFSGSIDSGAISSTDRVTVTTAGADGLVLAPDTGSTNNSARLFLNGSVGNWAIFNNSNILKFNSSATAGSTSGNLAASLTTAGLLTVVSLTESSSIRYKENLKPITNGLEVIKKLEPVTYDRTDNDSKDEPGFIAEEVLKFLPN\n>MGYP000299415252 FL=0\nLQKEGKDRSAYRVSEADKRELLAAYQRRGYCEGYYHQHNGRDMISLKRPKNAKDGNTEEKPWQDIKVQEKINGILTFSVGKRAKLTVSYGNITVECTGQEVQEAQKQPLDPKRIEKQMRKTGNTEFVFERLKIHTEGNVFLPMQALNELRREGIEELTEQIQMQYRREKAGCGMKTATAGFDSDADGVTETAGKKE\n>MGYP000035781564 
FL=0\nFDRLLSIYNRFPLKELIIHPRVLKDFYKYTPRMEAFRNAFANSAAPVCYNGDIVDRESYERLTAAYPALDAVMIGRGLLADPFLIETLSGQAGTERRRTQIERLSAFHQQILEGYCQTMSGDKNVLFKMKELWFYMGHLFEENKKQMKKIKKSQKLSDYMEAVDSLFEEGEFHAWGTFE\n>MGYP000547744649 FL=1\nLLFGFETQEEYKELLELLIQLRTPKLSSLFNSI\n>MGYP001288746208 FL=0\nFFDCKRCFFFDLKFGIKRPHGTPLVLNNKIIQQVKKEFDFFREKKKPHPEIIKLKRGFIPSNHENLLKWKNSFNGVFFVDKKTNLKFHGTIDDLWFDNQTNSHISVIFKSTSRKDQLNQSEIWDGYWKQLSFYSFLLSKNSIEMSQSGLILYINVLNEDNFEKEIKLDFNLFEQILDFSWIENTIENIHELLNKDAIPDQNRKCKFCNYFNNIKKIHE\n>MGYP000877297596 FL=1\nMLFRSADAVEAVIRGLKRAGVSVATYLPDSLLKELYPALDADPDIRTIPVTNEGEGAAIAGGVFLSGKRAVLVMENSGLRAATEHLARMGLGAGIPVVMIMSYRGEMGENNWWAIPHGITMEPLLQALRTPYTIVRDVDQLETAIVRAYDTAYASYYHAAIVLGGDLVR\n>MGYP000780934939 FL=1\nMTLKEAYETGRDLDVYVDSEMADQDSHSFDDLWQSIYDICLLYTSPSPRDS\n>MGYP003414964913 FL=0\nFMKKNEEINMFTVYILYSPSMSKYYVGSTSMDISERLARHLHDHQGFTSRAKDWEVIYTEKYDDKTEALSKEKAIKKRGAKRYLEQLGHL\n>MGYP000195956432 FL=0\nMIGYLEGKLLKKDSDRILLLANQVGYEVLLPAVVMETFGAQKIGDQISLYIYYQQTERQPKPVLIGFNLEAEREFFQLFISVEDIGPLKAVRALNIPIRDIARAIEARDVQKLNQLKGVGKRTAQKIIATLAGKMDKFA\n>MGYP000654245701 FL=0\nMSETRYSKDHEYIRVEGDVGIVGISDYAQSQLGDVVFVELPATGKALSKGAEAAVVESVKAASEVYAPVSG\n>MGYP001494102332 FL=1\nMADYKPIEAGFTKIRMLRKYDVFDLLSISLFNAVVFGCGLGVGWLVWCY\n>MGYP003981121435 FL=0\nGTLCHFDSXYYXQSDSDCISSGFXNDSPFLKCLAFYYQSIGEEGKTRKELQNHVLQVEETFISNFS\n>MGYP000559679233 FL=0\nDILEDIRAFFERNVHMKMPENNVQQAELPEGCTVFDNPVGTAPGCAFEADGVHVLMLPGPPFEMLTMLKGHVVPYLRGFSSEVIVSHDIMTFGMGESSVDQLLHEKMSHMENPTLATYAKPAEVRLRATAKAETAEAAEAMLAPVVKDVTDFLGDYVYGVDVSSLEETCFRLLKEKGMTLATAESCTGGRVAERMTALPGVSAVYRGGVVSYWTSVKAAVLGRQTFLRPAQHNRLDGSPVAAPAPTVEGDHNPRRSHPPRHSPHCAAHWRGVQAAIAPQ\n>MGYP003443514059 FL=0\nMASLIDYIHLYGGVSFSKKRFNDVDNVILSLVAYIDMSNTAAATSDGIRLADALENFIRSHTQKEISRYGLAIKDAYLVAKELIGAPRFADVRVSDYVYLADGDTQFGAMVFHLTKYLDYICFEGTDHTIGGWREDCLLACYHPVSSHILGADYLKKHIKLSGPTVILGGHSKGGNTALVSALMTTPMRRKKIRMIYSNDGPGLRRRELLSKEYKSIRSKYKHIVPQNSIVGML\n>MGYP000585668832 
FL=0\nTRSSHALALNLGNITDARMKSMPESLKTAASLHIPVMLDLVGTACSNLRYEFANRLMNIHMPELLKGNMSELLAMSGQTAHAIGIDAGDEDTVTDINRLHLQELFQEKAAQWNTTLLITGKEDMIVSANKCSFIKRGTPAMSQITGTGCQLSGLMTLIWQRIRTTCWSRGRSCLRHGTGG\n>MGYP000681108114 FL=0\nMKDQDLIQAIEQLVTDHNPPVSDLPGHVDFIKETNRSLVTKIKELFFKSVPVGSTKATIQVHAVMSFWYAQRNIERWSLIDKVFGEEDEGVVNHLKDLFMKAKYCINDFMIDLDEEKRMKLIQYVMDQYNGFTLESAKRYVDQLEK\n>MGYP000336411506 FL=1\nMDIINIVAVISFFLIEIHTLPLVESLIVLLVEFFLHVNQRFAIDVGFDEKAEVF\n>MGYP001129885005 FL=0\nQLLRDLVSRLRLPDSPTATAVAEIRPFDFVAADDYELPAAYDQRRPPSPSAATVAKALSGEKPPPYWAGQAAPEADATHLTRLELASVEPELCVALRAEGKRRGVSLHAILFTACAAALRAAFDVPPALGIKAATPISARRFCEPPVDADEVGNFIGGVETWLPLVSAADPSDDAGEFWASCAAYSRHLSANLREGAALPGLLAHVGEWPAAWER\n>MGYP000989466621 FL=1\nMNQSIKNQNIFSSVLLAALGYFVDIYDLILFS\n>MGYP003369514027 FL=1\nMNNSEIITCVNGALSHDQKSVERLYQYTYPNASALARHLCSNPNDVDDILQESYITAFTQLNPLREKASFPFWLRKIVINTWRAFAKNKSNYYEILVQDIPGEELVDESLQLSVQDEVELSENQREINDLVEALPESHRLCVRLFYYEEISVEEIAEILDIPVGTVMSRLYYGRKRLKEQIEQRGLHTFHASPTAASAADPLLLSQILSALQAASGGVSAGGIALKLCLGLASLLTIGGLIGIPVLMKDDSKPAQPSITAHSTTATTAAATSSTSSMTSATASSTTVTTTATTIAATTPRSYISFEFEDYDGGIMLTSYTGTEPDVTIPDSIDGKPVTAVGSGAFKKNRILRSVKIPPSVRRIDSNAFRDCRALQSVAFGSGVSYIGDMAFLGCSSLRKINIPSNVDEIPESVKVEKRRS\n>MGYP003580237746 FL=0\nMEMTITEKPARTLPVQDARIYPRGGLDVLSRAEVARLRDASGGGMHELLRRCALAVLTSGSASDDPRAARDLYPDFDIQVAQQDRGVRID\n>MGYP002553410909 FL=0\nMGDFGGVEQDANRCLYPSLATGENAGLSARLFWEQGKARSNKKINCRGLNNLYQSGIDKAIVSALPFGPQYSNQQLCCFNNYIKQQVALFPHRLKGFCTINPLEQDALSYLEQLIGSEGFKGLKLHNNMQQFYPDDTKLYPIYQKMQEYQLPILFHCGGIGLPPTRDSYGQPIRFDAIACDFPDLPIILGHAGRTWYDETAMMLRKHKNIYADISTNIGRLKSHAGKPMADLLEKVKVWAGHTNTLFLGSDYPFYGQAETVEIL\n>MGYP001481087062 FL=0\nFIEDKALDFFKNQTLKSAIVQSVEIMESKGDFEQIKRLVDDALNAGSERNIGHDKKPARMKAGFQVVIYPVSKGLKDSN\n>MGYP001410066015 FL=1\nMNITGIKKLAKEGKSPYFFSPDTMRFFSSKVYKDVRAVKEGHLFITSEVFGDDSRHYSLRLIDSKGSIETLITKDNLKIIKQLMRAY\n>MGYP000418322004 
FL=1\nATANKKAQQRESNSRPQHSNPKRGREAGFTPTHEKRPNPHANYGVHFDMYSASDEERQNSLGRYGKQAPWAQPKQSHTPRTPEQEASLKRKIRALEGKLEDAKRDQASGRNDFPQVMLVDGTSSSLSVHVRKSMETELRAWNFDVPPRVSKDLVTIRFLLDYGEFIQELNCPVDMAYLNLRLMSQKWKEARLTPLRTAVS\n>MGYP001323574780 FL=1\nMYSLELFVIAIYCLIEDALYPHFCHQHGQPRRAGFPPALSDSECLTLEVVGHYLGYGTQKQLYEQLCDRFGTWFPGLRIGWPLPGSRPTCGRSKPGSTSTL\n>MGYP003297312165 FL=1\nMDNASNTLLGKVKKLIGVEPGTKLQPMVAYNSAVFFTGGGPYILGCYLLPFLTKVEGLDAVPESVSAEVDVLQIAENWSLFMSNDLPFSTVAKDLIPSSYQYEVATKYANGIDITFTSIHTLLDPAFVDEKVTNFVWITDNLFSVDISFVKRMLLSSGTTIEDSMNDRFYFVKYDDTNDYSDNPTWKLLSMKEIVGNAE\n>MGYP001502702574 FL=0\nMINPINLAILGLICGGLMKFFWQMGLENKVDIASFLAVDALFIFLFTVITFLYLKQPFVLSGRMSIAAALAGIFGGIAMTAVAYAIKLGGAGSVIFPIISLETLLVVILAFV\n>MGYP000531888355 FL=0\nRKRNIHRSIHVESDDYPFVAIFKERINIMREKYESLSLGALKEIAKARGMRGISTLKKSELVERMVQEDDKERQMKESSAPQESEQESRNGSRAGKAEERQESRASGRQEERQETRASGRQEERQETRTSGRQEDRQESRTYVRKEEKQESRTERPPMEQSDLDSGMSVSGILEVLPDGYGFIRSENYLPGENDVYVSPSQIRRFNLKTGDILRGNTRVKSQNEKFSALLYVTSINGIKPNEMRRLNFEDMTPIFPNERLHLERPGGSLAMRIVDLVSPIGKGQRGMIVSPPKAGKTTLLKDAAKSILKNNPEMHLIILLIDERPEEVTDIREAIQGPNVEIIYSTFDELPEHHKRVSEMTIERAKRLVEHKKDVTIFIDSITRLARAYNLTVPPSGRTLSGGLDPAALHMPKRFFGAARNMREGGSLTILATALVDTGSKMDDVVYEEFKGTGNMELVLDRRLQEKRVFPAIDISKSGTRREDLLLTKEEHEAVDIMRKALNGMKADDALENILNMFAHTRNNNEFVQTVKKQRFL\n>MGYP001261365442 FL=1\nMTFDITKPFAPSTRSPNSTPIASWSSWAEERRCRETLASAQQLKQVALSKRHRITFYMERTTVADFVVDDLVSPADVVRIGPCLVVDDHAQHPVVGAQIHHPLRSDDVGIGQDGNAVFGRTSRHDRVVGEASRLRKVPSARLSVPTGVDRALGSRIISTGGGREWIG\n>MGYP001159235774 FL=0\nDGDVYYVAGGGDWHTSGNNGYYSDPNYIRLATTQENATGYYWDDDSDSDTPDVWHAPVVLNLVHHDTSPYTDVTHTLRAVNDQPMSGLVNGQAYFVVNRTATSFQLSNTPNGSPIAFSNGGLTGGHHTFAVEGIDLTSAGSGSQDLVLDIDNGATGSFSGMGGARGASGAPSGDLQFTVSTTGSTGGAVTVGYAKADGTASIDTDLTINSAKIFGADVNIETKSFMNVSAVSDSGAFGGVAIGESNTSALGTNDSDITINSGAVIESTTDLKVSATIDS\n>MGYP001146147798 
FL=1\nMRSKSQKLQLKLTIEFALFFIVVSVFIFIHFTKKFEDQINDKYVYKADVFVNFFKQSPNAFTGEKLADKEAVSNLLDLNGAVYLVIEKPTGEILDAINLDIAENNLYVLSKTNREGISKDEKVYRIALPVEGDNISGKIYVGFESRDDAQKILKNRMLTALFSLSILLAGIVFTYFLSSISFRPLAKIFKALDSANIYADIKGKKNVNKSELRVLEDRVNILLGELDRSSGEVESLNRKLHDVFKDKIAELNFEINQRKKAEILLQKSEEQFRLVFQNAPIGIVIISTEGKIISVNRSFCNTVGFERDEIIGIPIKYLFEKNDLEGFENDSLVYDGKPIADISTERTLLKKEGKEINVIVKLVSVLDEKNKVKHYVMQLLDITEIKRVQQELVAALKKAEESDRLKSAFLAQMSHEIRTPLNVILTSIPLLADEISSKDEELKIILDSVKSAGRRLQRTIDMILNMSSVQSGNYKPVFEKFDLLTDLKKLMNEFKSLSDDKGLELKFKQSADESFIVADRYTVNQIFQNLINNAIKYTLKGYVEVFVRNENDNKVRVEIRDSGIGMSDEYLKKIFTPFSQEDVGYKREFEGNGLGLALVKKYVELNKAEIEVESEKSIGSVFSVTFDLSVNFEDESQVKKYSNYQ\n>MGYP000699489815 FL=0\nMQINITIEPEYSGTVWCKETMDGINEKVSSLRYSVNFCSDVSEAKDAMDWAGR\n>MGYP003287736390 FL=0\nGLLHGLWFIGQGEEGGVLFIGDDWAEAHHDIEIEDEAGRLLVRKRLPEGLAGVTLLHELVAEHLDPSGEPDQVLVGIETDRGPWVQALLATGYLVYAINPLQVARYRERHSTSGAKSDQGDAHLLAEIVRLDRAHHRPVAGDSEIAEHIKVAARAHQTMIWSRVRQVNTLRSMLREYYPAALAAFGADLAGREALAVLAAAPSPDPGRRLAQARLESLLRKAGRQRNVAATAAKIRATLATEQLTARPGVVPAYAPARRR\n>MGYP003686838251 FL=1\nMQDIPYAHEVLSAETQTLALEAIKKAGPYEPQTAAAKLERTETAIIELIEQQAAGIANKVHDEMTELAPNESCLIEVYPSRFGNLYLLQKVPCLQTIVENINRISGLDISAMLATEEQDIGDRNPLYVTVAGILIQKGKSLHRGQHLLRTRS\n>MGYP000072504175 FL=0\nRIGPHLVGVARDQPEAPARLGTKMDLGVRFAQLHVAPQRGHMAVGAPLDGIVGAELDLIAQKRLERAAELGREFVVKVEGVVRERSSKNMKIPTGEIEIQVINMTILNESKVPPFTIEDESDGGDELRMKYRYLDIRRRPVKENLIFRSRVTMEVRKYLSDKGFIEVETPYLIKSTPEGARDFVVPSRMNEGEFYALPQSPQTFKQLLMVGGMDKYFQIVKCFRDEDLRADRQPEFTQIDCEMAFVEQEDILQAFGGLTLHLLETICGVRLDSIPRMTYDEAMRRYGSDKPDIRFGMEFGDLNEVARHRDFKVFNEAELVVGFAVPGGNAYSRKEIDALTEWVKRPQVGAKGLVYVRCNEDGSFKSSVDKFFGQEDLAAWAERTGAQQGDLILVLSGEADSTRTQLSALRMELAERLGLRNPGEFAPLWVVDFPLLEFDEETGRYHAMHHPFTAPKPGQLELLDSDPAAVRANAYDLVLNGNEIGGGSIRIHDRETQEVMFGHLGFSPEEARQQFGFLMDAFQYGAPPHGGIAFGLDRLVAILGGQESIRDFIAFPKNNAGRDMMIDTPSTISGEQLDELKLRVIKD\n>MGYP001564172474 
FL=0\nIVVASLNFFDTYLAVIRFVDYKLITRLIRGYLVAAVVLYGIARYLDSAAWSERMLLMFVILGPAIALQVRLLAQWFLRPYLRKDQREPVLIYGAGHAGTQLAAALVTSARYKVKGFVDDRPSLQGREMLALPVHAPARLRALKEEDVFRQIIVAIPSITKSRRRAILESLEDLSVKVQVVPGLDEVASGQRKFEDVREVQVEDLLGRDPVEPIAGLVEAQVRGQCVLVTGAGGSIGSELCRQIAMLGASK\n>MGYP000465940127 FL=0\nYAAKRTRRQAQPKVCVLVENMEYANIGQFGYEIVAGFRLAAAARGWAVDVLPTTPEAQARTKYGSLLLEGGYGGAFILGLTPQDAYMRALAGTGTPTVLLDNCVPNASVGYVGTDSWEGVELGDILSSGFEAASFDAALSECAFFLTGDPEGALREAARLLRPGGALLYSDICPGGEARLRRAAEAAGFAVEALTDVTEDWKRYYIAALWRGEAECPPDGARNCRYLCAVFRKEAR\n>MGYP000176012788 FL=0\nNIAKITLKNLSEKVLTIHPLGKAVVRCFKNDHSATIPEASDFKMIPGRGVSANVEGYHVLAGNMAMLNENNITVSQPIMAKTEEYINRGCTITYVALDNEFAGYVILSDTIRALIADEKSPA\n>MGYP001150477923 FL=0\nMMMEVQDEANEVDSDLMENKTHLDANEGELLILRRVLHTQDSPYD\n>MGYP000662722262 FL=0\nMTYVVTDNCIKCKYTDCVSVCPVDCFYEGENTLVIDPDECIDCGVCVPECPAEAIFPESPDLANWVEINRKYAKQWPVITKKKDALPEAKDFDGMKNKYEKFFDPRGFQGQTRK\n>MGYP003721390011 FL=0\nXXSLKSSXVSPPAXFLHTXLLPXEVYSKSASLLXQVDRLIESLLLPISQQQIRKLESERTMLVDRNVGIQAELDQLKQQSRDRIAAVAATQQN\n>MGYP001010919623 FL=1\nMYPVLFHIGDNPVHSYYLLWTLALTLAVVFSRRRMTFFYGIDDDDARSVIIWAFIGMLLGARAGSVYDSWSIYSADPLKILRIWEGGLSAVPAFLGAGAVSFVYSKRRKIPYWMIVDAGALPAALTVAIGRWGCFLNGCCTGIETTVPWGVRFPSDALGLLRHPTQLYYSFGALFIAALLQWTESSWLGYHNDRRIRGAVLCPLFAILYSLLRLAADPFRSDFSRIGMQTNRSVLFVVLGISMLWLGYSVFYEKKCIRS\n>MGYP000546373282 FL=1\nMSHQRVKRLTQFIAATAIASLITLPAAADGLSLGSRPDQAPRTSQSGNSISVEAWAGGTTATTNTADTTATEFDSTAWTRWAPVSYTHLTLP\n>MGYP001816006016 FL=0\nMSRKCIVVIGAAGRVGSQIVAELLRRHHRVVMVDALPGDALTRRAGRLLNDARLAVSPCSGSLRAYGGIDALNCAAMTDILIRENPDLVINYAIPITWDAAKRLPNYKAISAAGLGAFTPIQVLTPLKVAQAIHDSGVESRYMVGNLPDITIPIINGIAQGGTLQPALCGAGNVGLNQIAMRHQAALELAASFDDVDVALVSHHLHWVAPREPGYSNEGPFLATVSLAGEDVSASFKDLRALMNEGVRRHYEADASFSSTTGILASQVAMALLDDTDTTHHLHTPAPNGLPGGYPVEIQHGAINVNLPKQWSLDDAVAAMAICHTLDGVASIIADGTVTFTDLARDILRDELSFDLPSQMLPHDIETVAREQIDCMRCLLYTADAAD\n>MGYP001138444575 FL=0\nMPTIEVEGSKVELDDEGYLVHPEDWNEKIACILAEREGIIKKCPMTKEKVGILKFMREYYKNFEAFPIPRGICVNIHQPRNCTYEEFPDPSIAWKIAGLPQPSRHVVAQLKGLGGVS\n>MGYP000402310384 
FL=0\nMTRDPLDEVTVTFQPRRPNSIFRQKVLVQYSEQFNTFGFGMVVKKHGIYREYRMNVKRKTLWISDLIFNVEESRHSMNNPVSFCFDRKIICGKRPRSMYQTSVNRPMPFPQCKFDAVWMRPGAIF\n>MGYP000123267625 FL=1\nMFKDKLAVEQEQGCKVPITLLESLTTFLGKNSTKRLDQVKGALTLWMSGILIKTLPATSDPACGKGIFFFFTTHLFA\n>MGYP000748431043 FL=0\nLRALGTSSTAESHVPAISFQSDQGDGVTARASISADRDGGATKGSLIFSTRISDNITEAMKIDSSGRVGIANDTPGDFDADGDDLVIGNSTGNRGLTVRSSASGFGSMYFAMGTSTTAQKVDGFLVYDHGTSFSGTSGLHIGTGASTRIGIDESGKIGINETAPTATLDVRGSSSQPICNFGDDNIRDSDALDIFGSDSFRYQFQNGQQARPAIIEGGGDVAANESAVYFTGFSSSQTDGHRNLGGMIVYRKNTGGADSGQYGSQIQFRSKADGTATPAQNMVLSENGSLGIGVGAPSATRLQLVRADGVTDSTEFTQTIQNLDTTEGQGSGLFIQAGNGSTDKILQCQTRGGTFVLDLNGAGRFNTTANVAND\n>MGYP001244487380 FL=1\nMQYHVKAMQSLDMVVELNVDCVEADDARRQVERLGYEGVTLRSKRAGLAAYLKRRTTFPLTLFSQELIALLGAGLSLVEALETLREKERHPDLKQVLEQILTKLREGLTFSSSVEQLPSSFPALYVATIRASERTGDLREALSRYIAYQVQLELVRKKLVSASIYPVVLLVVGGLVMLFLMMYVVPKFSRIYEDAGKDLPVLSQLLLEWGKVMEAHGLLVMGCLACVGIASAYGLTVPAVKARILSQLRSIPAIGSRLQVFDLARFYRTLGMLVKGGIPIVSAIEMVSGILPLSLRGPLHAAVRDLREGKPVSQAMESHGLTTPVAHRMLRVGERTGQMGEMMERIAVFYDEDIARALDWVTKLIEPALMAAIGLVIGTIVLLMYFPMFELAGSIQ\n>MGYP001368835617 FL=0\nFTWKSLQISSFILNNLSVRKRSLFAKKKLRGSFFRKLLFYYLSEKSKTTQTSIYLKNNLIITIFLL\n>MGYP003476759632 FL=0\nAGQAFEQTGLKLTPWQQYEKDLAEYNEYIKQNPNAATQSTAASAANVAKGNGTGNVPMNTDTISLKDQFPETTTTGGGASWQGIGDTDRFGDVEPPLKDQFPDTPQGTGASFLGTPEAPPDDPIPPDIITTPPPDVAPPPGGPCPQPTTYSQCTSYHPESTIPGKMSQAATVRSITAYINSKGFRHDPDGIPWLAPSAWKTWDGVTTINPCTSTTAQIMAFVFPPPGSVNTMRGLRERFYQVNPFADNQNPTVAEIENWNVEVIRHFRRLLGFNQTTHPVYNDKCTYLKAAWAEERARTNYWSASYPGVQDSASGPCTQPSSSNAHCGASFLPSPADQAPYLCPATMPACTTTAGAEGISNQNKDIPWGIKMSRIIGNYLSADGITGHTG\n>MGYP001453318140 FL=1\nMREFGAELGELRLHRRTHGEGILLAAVGHNATVDLEELCVRRQGDVGPVGALANGRPLLLAQVADHEHRAVH\n>MGYP000100214384 
FL=1\nMNIEKFYDDDLSGQIKAKNFQGKIFEILCLLAILLGISILLILLIDVTLDGIPWLRPQLFNSFPSRFPDQSGLRSALQGTLWMAILTAIIAFPIGVSAAIYLEEYASDNRFSRFIEINIANLAGVPSIIYGLLGLGLFVRGLGLNRSVLAGSLTMTLLILPTIIVTSREAIRAVPRSLRMASLALGATQWETIRYHVLPYAMPGILTGLILGMSRAIGETAPLITIGALTYIAFDLRGPMDIFTVLPIQIFNWISLPQKDFHDLAAAGILILLAILLSLNSIAIYLRNRLQHRW\n>MGYP000373900305 FL=1\nMKDYAKKFYLSQAWRKTRDAYAKSQNGLCERCKQAGDIVHHKQYITPKNISNPLITLDWANLELLCQDCHNKEHTKKQNSRYAIDEFGNILPPGCVKNKRPREPVKGS\n>MGYP000933484466 FL=1\nMKIGNLNLDNRVFLSPMAGVTDLPFRLICKEQDCGMLYTEMVNAKALCYDDQNTKKMLKIEEEEHPVAIQIFGSDPEYMGGAAKIFNSYPNEILDINMGCPAPKVVKNGDGSALLKNPELAAKVLKAVVGNSEKPVTLKIRKGWDDTCINAVEIAKIAEDCGISAIAIHGRTREQYYSGKADWDIIRQVKENVSIPVIGNGDVFEVEDAINMLNQTNCDAIMIGRGAQGNPWIFKRINHYMQTGEILPEPTLEEKINTAKKHLKLAVEEHGEYVAVREMRKHIAWYLKGLRNSARVRDEINKIESYEEVVNKLESYMQDCLTLE\n>MGYP003298397327 FL=1\nMKKIYENIEIAIILMPTMDIVTLSINQKDDVADDIFAPNN\n>MGYP001558061087 FL=1\nMNILQRLKLRLGLQVCLGERTREGWSGALPFYAFKCPVHGLVENYPSGWAEILRCPLCIEAEKLRHGESRPP\n>MGYP000481936423 FL=0\nRTQIGKASLNVGWPRDYAKLPVIRRYSFAPHVSPRDGTMPVELIGPVNSPGGNGPSNGMYALQKALRKRIDEGLDWLSIKPLPASKGSLPWFWHWDDRRYAAWWDSEGQPFVQGPNMLFTYSGKPRSDTEECALLDAVNCRAMFCHSEWYRDLIAKHRGPANQSPIVLWPYPIDPWPGEPLPDEYDLLLSLIHISE\n>MGYP003150238574 FL=0\nIGPYFKSETGTGNTGKTPIQAYVPAGPAPATSTIQSSYWTNLGHRVYGYGTVYGCGVFRDPLSVEHLLVATSDGVYATKEANPSVLLSGITSITNDVTFVQCFNVVVMFRGEGEEPYVMERIDEGFKAISQVASDTDLDENDSDGTESIPNASTGLFFANRLLIPHSDDQVAVSDFLNYTRYQPIMSNFRINQGSEDELVGLRRINNSTLACFKTNSVYIVSNIYGNLTDIVLDEVTREYSAVSDKSIVQVGSDVLFLSSKRGVCSLTVATNGKVSAVDQPVSEAIQPLVDRINWNHSSKAVAAYHNNRYYLAVPLDGSTYNNAILIYDTFNKAWAGYDDGDAVKVKDFVETKHQGKRRLFFLSTDGFVNLYDDDITECGFVDEIPSSTTITDSDFGQVTVKDIKDELVTRGYTAGDVSPKKWRSAEVHLSTNDPWFQVKTQYDGPEEDDQELTAAATIDANGYITAGGKTFSRSAYDRPFDKTAFVESMTNNDFFTQHRQDYSVDPDTEIVLGSNGFDPDIHQKSVNRYR\n>MGYP001768574441 FL=0\nFPDPSTQDLAGYISTDPETKDELKYY\n>MGYP001452703586 
FL=0\nSVLIFLIAAGIVLFAVTSSMMSWDFVMSIDSHWFSTMFGWYTFAGIWVSGLTMIGLMTVYLKRKNLMAAVTSHHVHDIGKFMFAFSVFWTYLWVAQYMLIWYSNLPEEIVYFRTRLDHYRWTFWIAFFLNFIIPFLVLMTRDAKRQFNILFFGGIVILCGHWLDSFNMIIPGTLTAHGNHWQLSWMEVGTTIGFLGGFLYVTFRSLAKAPLLRTKHPLMMESVQHAI\n>MGYP000024922526 FL=0\nMEDIYKLIDDINLQKIDNIDSRVNDALTSPNDDALFILGETLYNFGLMPQGLEVFRTLYHKYPDESELLIYFIEGLMAENQTDEALEYLSHVETSTEKLMLEADLYQQINMLEVAIDKLIEARDLEPNDPIIHFALAEILYYDGQYLRATHEYQTVLDTGEYEINGINLFARMADCSLQSGNYSDAIRLFDEISDEEMTSDDYFKKAIAYEKNDLSLEAIKIMTTLLTKNPDFLQGYYYLQQLYEHEKNYADAIEIGKEGLRLSQFYKELMVSTGSIEIEHGDANEGVALLKQALEVDNAYHEPLLLLADLFRSEEDYEALINLLQYVDEEDLDPVFTWHLAFAFGQEERDKEAQHFFELAYPTLKTQSAFLSDYYYYLLEIGDKNHAQQILNQLLELDPSNEIWHEETARLEN\n>MGYP000184957940 FL=1\nMLSDSLADGKAIHPRHIDIQQNQVWLFTRLLDGLPAAVGGEDLVLGGEVGFHGIDNAGLIVHYQQGRFQGDAPFHGVFFILP\n>MGYP000054682017 FL=0\nMHIHILGICGTFMGGLAALAREAGHRVTGCDAGVYPPMSDQLRALGIEALSRGAGHVTFVDTSPRALAAVRDPGVIDDKIELVGAHRRVAAGAVDDQIDATETDHQTAQRFAQARCVEHIDRQRQTARMRLLEGEQFSLHRGALRDARWIGLLEDPHRGDRVALADGRVLRDARRLEPDLAGLDAIAPV\n>MGYP001618312234 FL=0\nMMLHRIHPVVNPWHAQNCSRSTPSKRVSSPSQPWALCMAWAWPQAHSGPGAGQGRDLRRVSLYVTMSLLSLSLFGLGWTSDL\n>MGYP003315070702 FL=1\nMGDDIMGSSTFIPRWVKIDDNASIYNRKVSYLSGNNKIIERSFECKTQKNNQKLVVEIWDIEFVVTKFDENSIQIGDSAESIPCKARSPVLYLFVKFSNFNINYSFLKSQAHIKSLA\n>MGYP001373614446 FL=0\nRQVRVETTLPEIKTQDFSAASVAAIADPKLRRALDRVASGFEVARLARVADATPEVWDAWRQEARDIKAHTIEHLDYYLDLLHTNVTAAGGHLHFAKDAGQANEIVAQIARTRNVKVATKSKSMVSEELGLNPILEAVGVEVWETDLGEYIIQLAEETPSHLVAPALHKSKEDVAELFSEKLGIPYDEDIFHMAATAREVLRDKFMEADLGISGANFVIAETGTLVIITNEGNGRLCTSAPRIHIGITGMEKVIPSLQDLSIFLRLLPQSATGQRITSYVSMTTGPRRSDDEDGPEEFHLVLVDNGRSRMLADPALREALYCIRCGACLNICPVYARVGGHAYGWVYPGPIGAVVSPMLVGLKKAKELPQASSLCGACREVCPIKIDIPKMFLHLRNQTAESPDPNLRSAPIVERTMAKMYARLMSSPRLLGLFRKFGRALQLAEGMIPFSPLTKDGEWIRMAPLPPLSKWTRSRDLPTLPKQSFHEIWKKGLSRDDS\n>MGYP000395248815 FL=0\nNKSYTMYFTEINFTEIDFTEIYFTKIFLNYLVCILPPTIVQKGKSQK\n>MGYP001502370584 
FL=0\nAAGSTEYTTGVETNGTPGNSGAYTRITVAADAPTLYYYCTNHSGMGSFVTIGANVQFNNDADPPNITITPKTDFTVGQRYALSYPSGVFTQTGAGGSFVGTGYTFTARNYSYQLWTWGDNEFGNLGLNAPETSRKSSPTQIPGLTWENSLSSSSQSKHSAVAKNDGTLWTWGRNDWGQLGQNSEVNYSSPVQIPGTTWAGPTATDSEGTTYATKSDGTMWAWGRNTMGNLGQNSTNTGYSSPVQVGSDTTWPTDLGSDDGVIKLATGSDNVFAIKTDNTLWSWGTNLTGQLGLNNTVKYSSPVQVPGSWKSIGDDGYTKFGVKTDGTAYYWGQSNDGYSGINLFEPKRSSPTQLHGGGTTWNHIAFGGTIALAVKTDGTMWGWGENTYGQAAIGNPDTFPQGTPGKSAPIQIGNQTNWKFVQSSASGGASPQFAGLKTDGTLWIWGLAPFGTAGNNTVTPGSAGYSSPVQIPGTDWKTVALSYGKVAATKQI\n>MGYP001024040911 FL=0\nLDIRLTPARNDAGRVVAIRDMGKAQFLQIQDQSGRVQVYAGNKTLGEDDYFVLRNLDLGDIIGIKGRPFRTKTGEASIHADELKILSKNLAPLPVVKEKDGETYDGISDIELRYRQRYIDLAVNAEARATFTLRSAILREIRDFLHRKGFMEVETPMMQAIASGAAARPFTTHHNALDIDLYMRIAPELYLKRLIVGGYEKVFEMNRNFR\n>MGYP003311824185 FL=0\nRLRIGEQEHLLELRRFTPWILLEFRAGFTMKIRGICRFYLLEKAPHMRLYMSPVNIDPENPALPISYPATYSMYLAKTQGRFSTLGLAEDTWALNERVLDEDAFLEQAYLVHEEREKMFLDAIEKTEQGLAVCVFDITDRVQHMFWRYLEKDHPSNVDKDVTRHKNAIFDLYERMDGLVGKVMKNISDDTVMLVMSDHGFKSFQRGVNLNSWLHQEGYLAVHSGPSGAEWFAEVDWERTRAYAVGLGGIYLNVRGREAQGIVD\n>MGYP000397936239 FL=0\nGVFAENHSLALGVFGNFGQRVANNTIGQADTILNVMRTWWKAVCLVTSTCLAASMNLT\n>MGYP003982510387 FL=0\nIKDAPNIQKWTNPISWPGLHLKNDDDIYAIPGNTIVRADGMMIRKDWLDAVGLDLPADNEVTLDEYTEILKRFTENDPDGNGEDDTYGMGVAASGGNMYLVFGWPFGVGRRATEDWWQKVDGEEFDYMPMKYAKNHENMIDALEYHQMLWDKSYVDKNWPSNNGTMRNDRVWSGVSGGRESFGGHVYGNWLPNIQKNFPEAE\n>MGYP001965651419 FL=0\nTHARTHARTHARAHTHTHTQEGALLQVLCADMVERFQMFIFLLLVTVQNWAKDGRVSSHSFAWLQEWVQAILLVFASELGVLRASC\n>MGYP001756801604 FL=0\nYIFTGLRIGIGLSWLVIVAAEMLTGGVGIGFFIWDAWNSSRISDIILALVYVGVIGFLLDRLVAWAGRLITRGTTAAQRMRRVDRWLTDVHGPLLRRTPRPLAVDLGFGAEPVTAVEMAQRLRVQNPALELVGLEIDPARVARARERAGGLPGVTWAVGGFELPVPRPPTVVRAFNVLRQYREEDVPAIWSLLCAGLADDGVLVEGTCSEDGRRAAWVDLRRDGPASLTVALRLGSFARPSDVAARLPKVLIHRHVPGEPVHRLLAEADAAWAAHAPLAAYGTRQGGRARRVGRE\n>MGYP001019934495 
FL=1\nMFLPVKRRGLLFILSSPSGAGKTTITRSLLERDDQLSISVSATTRAPRVGETDGKDYHFVSKEAFDQMVERHELLEHAKVFNNYYGTPLVPVEQALANSQDIIFDIDWQGTQQLKQKLVNDLVTIFILPPSKDELERRLRSRQQDDEDVIRERMKKASDEISHYSEYDYIIINHDLEKSILQARAILEAERCKRRRLTELPDFVRTLMQESI\n>MGYP000405630647 FL=1\nGYPSQVSPVVKTPSQRCKVNLSRTQQIPSRKLAQATKKEVTSFVFVTVLGSSVVTLI\n>MGYP003603128023 FL=0\nMSLNIAFIGLGAMGWHMASHLPKLGHPVWVWNRRAERASSRAKTVVAWAYEM\n>MGYP001304718576 FL=1\nMHCSRCGSREYFKNGKMNGKQRYRCKGCGYNFTNLHGRGYPPALRLYALKLYTENVGIRSIARLLGIDPSTIVHWVRDEGKKVMEQLKASIPDSLPEMDIIEIDEMWHYTQKNSANYGYGLLCLDSPDKSLPSKWDLVVQSHSKNSGNV\n>MGYP001796365966 FL=0\nMSQGRLKRRGTGFTAVPNSFLRDDSLSGDARMLFMLLSSHSENWVFRVPQIQKNLRYGKDRLRNAKNGLIKRGFLTLWQPKDENGSVIPGPWSWEICIDPALPISAGRKTAQADARPAETRIALKEQDQEDQVQEDYVDSAREPNLLDRLDAGLKTAT\n>MGYP000859918013 FL=0\nKGWTLDGNAVNGTNNSYSFTVTKAAEVKVSFESDSTPLPQYAVNFSVEGGNGTLKAKADGVAETATSPISVQKGKTVIFTAFPAAGYEVKEWQIFGTGAVFEAGTGTPANNTAQVNLKEGLTDLVVKVSFQVQTLTPKHKVTMSAGANGSISAEPALPAGGMVNENTTIVFTASPNSASYTVDAWTITGGQVLSGGSPGSSTAMVKITEPVTVAVSFKLKPPTTYTVSFGVAGTPPNGTISATYKTDGAAFTSGTAVAENTALVFTASPAAGYKVEKWTVNGTAVPGNTSNTYEHTVTQPADIRVTFVSSVTIPDTFTLPNGAEYKVTDKAQKLVIMTKRENNASGTVYTVNVKPEYSGITYTLTGFSESV\n>MGYP003019047097 FL=0\nEKYQSPVYKVLSVPIEKIVANSYNPNIVAPPEMKLLEVSIWEDGYTMPVYVIISPVSYTHLRAHETRSN\n>MGYP001083449663 FL=1\nMDDSAPIRDFEKLLRETIGLSMETVGASVIRHALKRRMTACAISDLHAYWAFVTSSPAERQELVDAVIVPETWFFRDREAFGAMVRHLRENRASCRPLKLLSLPCSTGEEPYSIAMALLDAGFPDGSFQIDAIDVSSRNLVHAERAIYGKNSFRGADIAFRDRYFEACNGGFRPHDIVRRHVRFRIGNVLSAAAQTGNEAYAVAFCRNLLIYFDRETQGAALNQLRQMLADDGLLLVGPAESGLPPLHGFNSTRVPRAFAFIKAEAAPVKPPEPPAARRPRPAPAKAAPLPRAQTAKASSAPRPFAQKTASAQPSAPSPDRVAASLAEIERAADAGHLAEVSAAAERHIAEFGPSPDAFYWLGLAHDAADAVEDAMRNYRKALYLAPDHQRALAQLRLLQQRQGDHGAAKALADRLDRLAKRSGT\n>MGYP000234632724 FL=1\nRDVERSRGLGDVYKRQIAGIATPTEASAIGAMGALIITFVNGKFSIDFIKEASEKTAIVSTMIFTILIGASIFSLIFRGVGGDELIDLIFGSLPGGPYMALIFVLLLVFLLGFILDFIEICYVIVPLVAPPLLMMGFDPVWLAILLAINLQTSFLTPPFGFSLFYLRGVADESIKTSDIYKGVIPFIFIQLLILALVLIFPFIVL\n>MGYP001050647894 
FL=0\nMATTKNKKEGLARKRQSPMVLISPSFPWNFRVLPGDVAHLAVQKHREPAADGVSGAF\n>MGYP001636256112 FL=0\nMIFRPQGLEAKGLSAGTGRV\n>MGYP001782636417 FL=1\nMFVQGNAFRYGSDVDTDVIIPARYLNTSSAEELASHCMEDIDPDFVKRVKKGDVIVAEDNFGCGSSREHAPLAIKTSGVSLVIANSFARIFYRNAINIGLPILECPDAVKAIKAGDVVSCDLSTGVITDVTTGETFRAEPFPPFIQNIIDAGGLIASLASKED\n>MGYP003367769974 FL=1\nMDQSLNMVKIAYDALDDKLAEDIKIIDIRSISVLADYFIIADGNNKNQVQAMYRKNFLKLDMR\n>MGYP003688882127 FL=0\nEREREREREIEKNREREKEKEEKESEKEKEIERQRDIDSCDFDVFSDF\n>MGYP003700002783 FL=1\nMLPAFVLRAIEEGVSLQEILKEHNIYLAFAKLSGRVHGLTYADSSGYYLIIINENLSITAQYKTLLHELKHIIYDLPKMKYIVGKDMNSNIEKEADKIAEEWFKEIVKKLRKG\n>MGYP000043255058 FL=0\nMEFNYTVTDKVAIISWNMTTSPMNVLNDVSIPEFEQNVDKALADESLKGIIITSDKNEFIAGADVKMILKNADKDPKEIHKLSMDLNRLATRLERCGKPVVAAINGTALGGGYEICLGCHH\n>MGYP001157010399 FL=0\nMKSLRKQGIILFTILALVLVACGGDAAEEEVVEAKEDEPAAEEAPAEEESPAEEEVVEAK\n>MGYP000411183089 FL=0\nMSLTLREASKDTLQAENKTWHYYSLPLAARTLGDISRLPKSLKVLLENLLRWQDDDSVTAEDIQALAGWLKNALALIQISWPHESMGKRVIRLLVSKKDRRV\n>MGYP000600471748 FL=1\nMTTTRRLSLAYLALTAGVAVLFALNLFWGSVSLTPGAVAAALLGRGEDALAVGIVLQLRLPRAVMVVLLGAALSAAGYLLQTFFANPIAGPFVMGVSSGAKLAVALTMVVFLQQGLLTGSATLIIAAFAGSMAAMAFVLVVARRVPRMSILVICGIMIGYICSAVTDIVVTFAQDSNIVNLHNWSMGSFSGMTWENVLTAALIVLPCLALSFMLSKPMAAYQMGEAYAQSVGVSVRPFSVTLVLLSSLLAACVTAFAGPISFVGIAVPHLVKRTLRSAKPLHVLPGCVLGGAAFCLLCDLIARSIFAPTELSVSSVTAIFGAPVVILLLVRKQRREAAA\n>MGYP000149143676 FL=1\nMQFVEDYIVLTAVLSLWQRVNVYVTNSTQETFVIQVKKLCLLLNTLTFNTTMLTISSHTLSIIYYNDNTLDAVFD\n>MGYP001584307752 FL=0\nIREGRHDPVLYSVGPVPPGKDRNSHGVVVSWEGRSLRTVFSRMVSDSPVTILEERLLSEDGREMTVRNVSDRDGSETVQLYXXXXRQLSVEHGYQGRGINTSETVTDVYLRQAR\n>MGYP001913057525 FL=0\nYRCRDHGFEWPGQAYRIHSMGEPGSAEGMNAENPKHLILKAPHPSPLSAFRGFFGSRPFSKTNAFLEEHGIEPIDWQID\n>MGYP003393519970 
FL=0\nENALKALAKNIKGDRYDDAILSAPLPDNANAWKELVDVKALKKSLADQKAEQARLKELLGAIENREQLATERAQVQEECDRRLSSLSLWERLQKEKIEEPRLKKRLSELTKEKAQAEHTRVDARAKLDELSVKLFEQRTALNKEDERFNRLLRLMEQCVPPPSMEAQPSGPMAVPADAEDAIALYTKLTLSYKDMSREMDQLRSKIENVLKSDIIGATENETVRLMKEQIEGLPTFEEALRKDWDNYLHLLRANFANVLSGLSDIRNAAEKLNKRFGSVRVSNLESLRMDVLDQSDLVEPLKELAETDHTGLFDSSTKLDAAYQSFRNKLSERITLNYGDLFTLRFSVVIKGKTHSYDNLQVESHGTAITIKVLFNLLVLRSMLKEDPKTRAPLSNVPFFLDEIHSLDAANRGAVLRMARDLGFMAITAAPEPVSEVDALYFLRPINGRLVVRNELRVGVKYDAVEA\n>MGYP000523383570 FL=0\nMQIENNYGNDVYNGDIGFVAGIDLDEQELSVSFDGRTVRYAFGELNELVLCYATTIHKSQGSEYPAVVIPLSTQHYIMLKRNLVYTGITRGKRLVVLVDQKRALAIALKGEQLERRWSKLEERLREPGSIRYRPESLRHLDCPRSGRVHQALESGQVVAHPAEHPEIVSARLPLLVLRLPSYLRRSGVGFISLAHCYNITA\n>MGYP002653935032 FL=0\nNDALLREVGSDVKRGDPLASVGNSGGQGRPALYFELRRNGQPVNPASWLSAAR\n>MGYP003551677296 FL=0\nQDGMGIRFTGQYAEVLPGFRLDFSGRAGISDAGNFAANIDFQSSEPDASIKIDLGKFSPQLTDLSFEGNIGMSGSCQVTGSTVTSNAVLSTHNAKIEIPGRKMTLEGIDLNLNLQDLYQFHSAPDQVLKFKRFAWGDIEMNEGEVLFQIESLSSFFLQKSSFSWCGGHVYTHGLQITSGKREIDIICYCDRLKLATLLQQ\n>MGYP000229859498 FL=0\nMEKEVSFVYCNNNNNVVLFYVAELRPHGLLY\n>MGYP001544784897 FL=0\nMPVVEAARYQVHRLQRISPVSQAQLKAERATPLHTLDTLTVATKKGRLFREEAPVLRRLSAAQARPVLAALSPAQAEEFLAGYRTRIRAAYPAAPYGTVLPFRRVFVVARVKA\n>MGYP001256815242 FL=0\nMVPETQLRAFRPPLRTPASLYQRDAGWDLSHAQVRGLARHPDTHDLDKIKPIALSHSDKTYLIDNCCNDKV\n>MGYP000824429490 FL=0\nRMKGQKNVKDVGRQKGKHSKDQKKQKIKDVRNVIRHQL\n>MGYP001586178734 FL=0\nEQLAKGQARTKAYLASEQSCAAEELRADLVDASDVRVVLREAEGESFLLVADGEDELVEDLDAVLRGLDPLFQGHDRVELGVDDREQLAAEVIDQRYVEGAEELVAGEPSFDRGERGELESECARERAVRVRGVAGESVEDAGLVAGQGELVVRRENNRRLRFLAFENNLRG\n>MGYP000104835098 FL=0\nSLLIYIIHENIILMSLVERILPYERNLFLWLNDQHTSYWDVFMWIYSGKLVWLPLAIVAIGVFVYKIKWKEALLLLLCAVLVGVLCDYVSSSLIKPFFERLRPTHHPDFQNYVDTVRNYRGGKYGFISNHAANGFGIVAFISLLFRYKYYTITVLLWACITGYSRIYLGVHFVSDVVGGAIWGALVGISMYYVYLTSRRYILKVPKDELKIPVYTKVRAQILMCTIWVLVISIAIYS\n>MGYP001657250507 FL=0\nMQTKQTLLKTKRINNKQTKKLEDQLXRLFIHLSLSQSYXVSLLAQLQRMKQSKKILFLNQXKVLMEXKMLHIMX\n>MGYP003575916264 
FL=0\nVLLVIAGMFLTWRFMIGGLWLGLAGNSRVLAFSAAPYVILPLFVLPAILIMEQPIMDWIAENSRRLLPPLVWIAAAGVVIKFWLAAFSWRKIEPRYVRRYLPVWLGGAVCLTVLAFMLGVLLSLFLPEDTYRL\n>MGYP002282927298 FL=0\nMEWTSGVSAVAFKSSLRSVPGSSAANGTSFSVFGHDDSSRGSMDRGAGSGPGSRADSPVEFRFHDHFDFQRQIGRSPTSEAWLVRSKQSNKPYCVKKVTAKFRTPAERSRYIHEVEAVCFLPPHANVVKYYRAWQEHRHFYAQM\n>MGYP001843998727 FL=0\nMLLTMSLDSTWRDGKKVRWFAVQATNKTQRNKFTQDCYYSHAQGSQEKWARDXMXSRKSRMCVWQTSNKIIAGDRSCHLRHQRPQPADGEISHSAQLKATDQPIIVKRTVLX\n>MGYP000291769357 FL=1\nSAGGADRCAESGVNMSNDRTIGFIGAGNMAEAMIRGLLRGGDFAIAQIAASGPREERMRELRDTYGIYATTDNKVPAASEIVVLSVKPQILSRVLDDVLEYGGDYSIDRFEVGKTPLDPSYARLTVTADTEEDLARLVMRLQTHGVNLTDPGELTVREVEQDGVFPDDFYSTTNLETVVRTGGHWVPVENPEMDCGILVEGDDEHPRARTIAVSDVKRGDRIVCGASGVKVVPLPAIDRSVGGFEFMNSEVSSEKPQALLVRQIAQQMREIKAEGRKVLWVGGPAVVHTGAAPAMVALVEAGYVDVLFAGNALATHDIEAALFGT\n>MGYP001585133350 FL=0\nMFSCSFIDKLPIRILSDVKESFLNLGMMCKXKXFKRSYXLHKTTSIWNXIFQSSNRILX\n>MGYP003587374593 FL=0\nLNDLSFSELAHKRISLIHQSAIRLLNLINKILDFRKAETRNMLLKISQGYLSKLIREIGLKYKELNRNENITLQIVLESDEQPIRVDEEKVYIIVDNLLSNAFKYTQKGEIVLTLRTIYKQKTAWAEIEVRDTGNGIPVSRQAAVFEAFSQADDSTTRRYGGTGLGLTICTHLVQMMGGRVWLESVEGEGSCFYFTARFGVDSSSSAISSVLQFGDLRVLLIESNPAVAAQLSAFLAQLGVQVTHMAASEAAVDAIEKSRSLGFPFDCVLADIKMAPPGGMDLAESWHGYDHSEKLIMVMDSEEQRRHMSKLRGLGVD\n>MGYP003618342538 FL=0\nMEHLFDHAASSTPLDDLLKQLHLTDPSSAIPQDDAFSSLLSDANMVAPPHDADWNAPTFDAAQHESPFDPTNWQDPAHLSSEDMLTSAFET\n>MGYP003539180734 FL=0\nLLACVFSLSLVFAVACEEEETEEVVFAPTYTYTDYTQDTDALITNGDFTKGLAEKTEKDFPVSSIGSWNVGADTNSDASVVTNGVISVSDNGWKELMGTFHGVSNFKSWAEKTFNGNNKIDTKEAFQDFMVGQNGLKNPGKASGTTLNDDKVLMLANFTNSTTVDGRGTAMKASSTSTISIAKGKMA\n>MGYP000164259871 FL=0\nQIPKGYESRLRYEKFPKKSVDTHATNRKADEAP\n>MGYP001127871448 FL=1\nMQAPTKYALVINLKTAKALGLAVPPSLLGRADKLIE\n>MGYP001811598644 FL=0\nMTWMCAGLEPLLEDIQQPPLLSGRPVQHTNLWMCSRCVLQAVAGAAGVGLCXAAPCKSXKVX\n>MGYP003351460088 
FL=0\nMTDLGTGAGRLAWPPPASLLPWRQPVKFPGVAAPEFRRGRRGDPANPRLHQPRDFRVFGRELAYRPVGSEQHLVLRDRLRVLHDQRVDVVRGVAAQVHPHVGLVDDHCESVLVPREGRVREDDLQVGEVRGDVVEIFPAYEEERAIRVEFFGDEIESISEIDPLRGVRIQKIPRITIYPGSHYVTTVENRKRAVDSIRIELQQRLQERALALISIAHPKYRADLLKRSEEHTSELQSRVDIS\n>MGYP002526488509 FL=0\nMAGNVDNRVVQLTFENRQFERNIAKSKKSLDELKASMNFDETSKGLNKFAEGMDKLSFSHLEDNIQKLTDKFTGLGTATELVVSQIRRKIEEAARSMSGFVESMTTQQIGVGKDKYDMLNKSVRTIMNATGKEEKEVLAVMERLNNRRSE\n>MGYP001359237027 FL=0\nNSVNNQFTPLFQDEIKPGCRIISNTTFENLNNFRINLDIHDSKKWNKNIIYGELRNGYRIAERYKTQQYATFEIINKNDGSICTLQAKVRISGDAADHINLEKFQASIDVELIDENIFGYTDFKLFLPETRNNENEIFVTTLLRHLNYLAPNTFFIDIFVNDQKVKYLFQEKINK\n>MGYP000346659406 FL=0\nMGTRIGSIHANVTAKDLSWSDTMRRVREETKRTADLLQGISDRGGGLGSLGSIMPTIDIGNVINRSIGLVTDAYRQLSEAREKAEIKADKADVLGLSMADLQGLSVGAALANTDIETVTGATDKRGTEVHFWADEAIFSHVEFHYDILAKRIRELSFLNNGVHIKL\n>MGYP002611241135 FL=0\nSPATPLGSKRRFIRVPSNNFVWHILGGSNAVMGFISSTSAWMEVPFMLLCGFLLTKYSCASLLRISSFFYILKPSILLLASSIPMVALGQYMQGPSYAIFTIASVYYMNHMVDIKDNAKAQALLGICTKGLSGIVANLVSGIMLDRFGINGMLGFCMACTICGFCVIQVMTLQKEKGR\n>MGYP001764798971 FL=1\nMSATPVLPRHAANAAGLIARPAWKGRLDWRGLLGWLRDDRLISAEDEQRVTQRFGAGASSQHALVRLGGAGLKRAGTQQPLDTEALTEWLAARCRLPYLRIDPLKADVGRVADVMSVHYAESRCALPLQLNNTEVVIATSEPFDAGWVGEIEAHTRRSVKLVLANPQDVRKYTTEFYALAKSVRAAQKTGEVSPAASFEQLVELGKTAKQLDANDQGVVQVVDWLWQYAFDQRASDIHLEPRREMGAIRFRIDGVLHTVYQVPLGVMNAMVSRIKLLGRMDVVEKRRPLDGRIKTKRPDTADKIGAEVEMRLSTLPTAFGEKLVMRIFDPETAVKSIEALGFGAHDTARWQELIARPHGIILVTGPTGSGKTTTLYSTLKTLATDEVNVCTIEDPIEMIEPAFNQTQVHAAIDMGFAEGLRALMRQDPDIIMVGEIRDLATAEMAIQAALTGHLVFSTLHTNDAASAITRLADLGVPSYLISATVIGVLAQRLTRMLCPACKQRDEDTTRETLDELAKPWRLSGGVRPYKPVGCLECRHTGYRGRVGLYELLVMTDGARAAVHPALDATALRRQAVKDGMRALRLAGAMKVAEGLTTVEEVLRSTPSLDVRA\n>MGYP000601219188 FL=0\nGGGLFYMYYVETRSHYVAWAGLELLASSDPPTSASQNAGIIGLSHQAGPGYSKYIIILRSIHHLDHSLTIYFYFPVIVLISWVRHSSLDI\n>MGYP000591043049 FL=1\nLARGVARALWLPGLSLSPLRIPFCEFSQIYIYSNALYKQVIYGQRPDHNTGNYVPYSLR\n>MGYP003318478948 
FL=1\nMIYLFLANGFEECEALCPLDLMRRAKIEVTTVGVGGKYIEGAHGITVCADITDAELCDDAPDGVILPGGMPGTLNLDACAAVHKALDAPEKRGALICAICAAPSVLGKRGYLRGKQAVCFPSFEEYLDGAILQPKGIKVVTDGKIITAVGMGAAVEFGLALVRVLKGDEAANALCSAILAD\n>MGYP004071202169 FL=1\nMIVLSAINEPKRYAPLSPKKIFALGKLNNKIDNKIIIWAINIKEISVFALIRLIYTKTKLIIIRLITSKPLKPSIKFAPLTMNKKHRRTKITENISLFVKEIKKGISIFVILIGKKNIMELKKKIINNSLLKGLILNLRSSRNPIKNIE\n>MGYP003151139587 FL=0\nMDVEQTEEAVAEAPPAEIVDQAQINEWLDDKLGPAEPEVTEEPEATEEPEPEPAAAEPETPEPETPRVSKAFSKVAKKEREVQQQKQELNKEKEKLKPLQEAQAAADRGDMLGALEKVGWTYEAATNSVLQDGKLQTPKAEPAALTPEVEGRLAKLETMERQKQIDNYVNRMKTKVEGDERFELVKDNWDNAWPTILEMQKIVAQETGTIKQDEEILQEVENFYEQQAQKLAKSGKFKNLLQPDAGPPEKP\n>MGYP004197989809 FL=0\nFHVKSEKIEISQKNHLKHDLN\n>MGYP001807843292 FL=0\nMCVKEHKEHNTRRTVYARCVCVCVCVCVCVCVCVC\n>MGYP000196272724 FL=1\nMALRICSQLTVGGFVPTIMVLGSATEVDRIKPIQPLGTFIFIVFIYLFIYFLRRSLTLSPRLECNGTISAHHNLHLPSSSN\n>MGYP000647749030 FL=0\nMEVGAEGDPITFAERRTMSVAGRKIIAGS\n>MGYP000363977344 FL=1\nVQHDRNCSRNVSPNRMCLCVFPKGTQMVRMGPDSIGICRGSVKIDVSTMRNPGDALPNIAPKSNVSDNRNENRSKQHIYSTYLNSTRGQNIKSGTGGTLFFSGNFAPGVDFGRPDAHNHQGMISRDTSLQNRPWEPTQGRKPTLFIQIISTSFLF\n>MGYP001764752421 FL=0\nMFENLSERLEKSFKLLKGQGRITEINIAETLKEVRRALLDADVNFKIAKQFTDNVKQKAIGQEVLKSVNPSQMMVKIVHDELVELMGGD\n>MGYP003108819162 FL=1\nMACFHPLEDFDFINRILPKISFFGGLDDEQLAYIFSRLESAEFSQGEIIGRPGTVPSHIHVIQEGAVDLLISHDQRLVRKRQFTVGDCFGEAALLSLINDTATFTAAGPTSVASLSRLQLLRLHSEKPDIFLQLVLNMARDLARKLQYSDELLLRR\n>MGYP001799047598 FL=1\nMYSLYIPVVDSFYVYCIQEAEAAQASTEDDSYEQEIEEATSQEIETDDQVFH\n>MGYP000061367530 FL=1\nMGSTYTRQSSTEIVDGEVIAASDFNNEFAQLVSAFASSTGHTHDGTTAEGGPITKLLGTAITIGDGSSGTDIAVTFDGETSDGVLTWMEDEDYFKFSDDVLIVDDEKDLREIIRYNLEQEGINSIQASNGDKAIESLSQNPSLI\n>MGYP003345690776 FL=1\nMRNFLKSHFWVLAGCFLFYSVHADQHGTTERILFDGQSLDNWEKTDYAGGGEVRLDGKGGVVLEFGIALTGIHWIGEKVPRCNYEISWSAKKVSGTDFFGSLTFPYLNEHATLVLGGWGGALVGISCLDGFDASENQTATAHLFNTNQWYRCVLRVTEAHFKFWVDQEKLIDCDIQGRTISMRTGEIELSKPLGFSTFDTTGLIKDVRLSSLVP\n>MGYP000806452421 
FL=1\nMEEKVDIVALGELLIDFTEAGHSQGGRKLFEQNPGGAPANLLTVASHFGYRTSFIGKVGNDMHGKFLKRTLQTEGINTDAIVEDPDYFTTLAFVEIGENGERNFSFARKPGADTRMEKEEIDVDILDKTHIFHVGSLSVSYTHLTLPTILRV\n>MGYP001393538896 FL=1\nMKCKDCRKQFSVTGNKRIIYELRGDMACVHVICDVRRDLRALLLRRLVEAPRSPGP\n>MGYP003366091699 FL=0\nLRMSRGLGDVYKRQPLASGAKAADQAEIDIIIAELSALAAQYTE\n>MGYP001054490991 FL=0\nRRLGHGELKLGGGNGGRGDGAPALMCSPRFKRLR\n>MGYP004024396583 FL=0\nMITLILHYXSNRFKIFLFLKYLFHQIXFVMXTRLVXTRLGLIXQCHCFCLVLSGIYMRKMGTSILYGTNRHLRCRLWPKKKKIVTCMTVGLVSCGYFGTIALQADMFI\n>MGYP001796939300 FL=0\nFDTVTIKDIAKALNFSTSTVSRALRGSYEISAETKKLVLEYAEKINYRPNPVALSLKERRSRAIGVVVSEIANNFFSQAIDGIESIAYNRGYHVIITQSHESEAREKVNVQHQASISVDGLLISLSSETVDLSYLKELHDKGFPIVFFDRITDEIETHKVTANNYLGALQATEH\n>MGYP000574954487 FL=0\nMKKFSLITLLLITVGFSSCTQEDSTFLEEPTAQVLLKSFTLNKSTSGDYSLDYQLNNGAASDNVLDAKTNTSNIYLYSSENVSKSIKNEGIALKDGELRISFNDTEKHKKHSITVLDEEIKASRSEDDTDLGYLNSYSVTTNNDGTFTLDFKVNEWVVVDYIFDLCDGYQYSDSRTSGKANTHATPRKTKGR\n>MGYP001104094517 FL=0\nTVFGEEYKNVISSLTDWKMYGFFKINGTIGLKYFDNKVVTLDYKNKKIAVSNNALDYSRLQNEKYTVLPLIKSNLSNEQDLLFFEGDVNGEKSTIYLDTGSSRSFYNLDGTREEIEVKLGEKAYTFNSNKFRHDEIGFKDTFKYPLKLAINSDLLKANHFIIVVDKQKKVVFFRFI\n>MGYP004251094059 FL=0\nMNQLIIRTKIICTFTCNPIKRFRYAQVIITKIFKNINAKSKK\n>MGYP001561011533 FL=0\nLTLLRFANDDIKMRELGNSIIDEIVNDANVPHEQHLIIEQDREDIMNLTKKAHS\n>MGYP003626153934 FL=1\nMPAVHAPRLLMIGAGGHARVCLDVMVDNDDVAIVGAVSAEGVVSEPLGVPLLGTDAQLRELTQSYAVTTFCVSIGSNPIRQAFGELLTQSGRHVTRIISRSAVISRSAKLGDGVQIMPAAVITAATVLGDGTIVNTNASVDHNCRVGRFVHIGPGAVIGGDVTIGSRAFIGLGSRILPGVTIGADAIVGAGAVVLSDVPAGATVVGVPARIIKSKSAQQ\n>MGYP003586072608 FL=0\nPLFTIAQIVAAHIGSTPGVLRVLASSFILISLSSIFFGLFCVXXRSPGLCQKNLXNTWCTASVCGSSGEVRARKRLQICPKTIAKVCNRFWADFLCXLFPFAVSHRVKEVRKRLFSCAWALFSEKPFFESDRIRSGXKNMX\n>MGYP003337571193 
FL=1\nMSKITDLIVPNIGDFKNVEIIEILTKPEQNINKNDGLITLESDKSSVEVPSQFSGKIKNIKVKIGDRVSQGDIIGQIELTADEKIEERIIKNRSNHDLTTEVFSKKKELQTIAISPNKDENNFVKSASPKIKKYARELGVDLQLVNGSARKGRIVEEDVKQFIKNTLNTKIIKEEVIKNIETKEEKLPFEHEEFGEIDIQKIPRIKRLSGPHLVKAWNEIPHVTQFDEVDVTDMEYFRKNLIDLNTKEKITITPLAFIMKALVNAMKKYPNFNCSLETINENIIYKKYFHIGIAVDTPHGLMVPKIRNVDQKNLLTLSNELRRISKLSKELKIDKKEFFGGSMTISSLGGIGGSFFTPIINSPEVAIIGIGKTETKQIFIDGKFISRAMMPISLSYDHRIIDGAEAARFCQDLKTSLGKNFAFKIGRAHV\n>MGYP002417791626 FL=1\nMLKMEESKININRIHFLYEALAKRHASPEETYHAILNEGLKAFNLSLGIISQIEGERYSLLAVSPTRGDISAGMVFELKDTYCQRVVSENRIISVEHAGEHPGFNNHPVYIGMRLESYISAPIWVRENLWGTLNFSSTQVRAISFSEDDYEFISLMAEGIGSLIEMNLLISENENVISALRKNNDILESIFENSTIGMALVAPSGQWMKVNSSLTRMLGYTEDHLLSINFQNITHPDDLTTDLKQLEALSQGNIPFYQLEKRYLTASGHYIWILLSVSLVREDNGDVKYYIAQIQSIDERKKMEMELKNQKEALHKVNIILERMATEDSLTEIANRRKFMLWFESEITRMARHPVPVSLAIADIDFFKSYNDDYGHQEGDFALQNIARALSHPLRSQDKIARFGGEEFIMLFPETDEKGCLLACERLRKRVENLTSLRRTVTISIGAVTCHPKEGELVHFDDLLKVADSKLYEAKRSGRNQVKVTSLEDHQE\n>MGYP003123586391 FL=0\nVWGRWLRRRLRKDRGEQLLSIVRSLDYAMNNTSLILLFEVGDTKLLFPGDAQYENWMYALGQDWVKKLLEGVDVYKVGHHGSLNASPRSMLDLFEKKRSRTDDPEKVMHSLLSTMHGVHGSVSSRTEVPRKTLVKTLEDETQLTATSDFGGEISHTVTLPL\n>MGYP003322783177 FL=0\nMLSNVNDIDEEKLKTISNNQYAIVKTEDLNNIKDENRIIFAIGDLHNKINNPDLKIIILGNVFVETEDFTSTEGIQSISGSLYIQSKGGLETPNLESVYGNIYIDDSLFTQIYVKEIYGEINIKNSIKTYILADNAYGKIKCNKSVDTQLD\n>MGYP000483552797 FL=0\nGRPVAVPDLPGLPEAVSEAMTITLNPIGVIRSPHLAAPGTPIQPAFAQQYEGHVLVNNEFEAALADIEGFERLWLIYLFDRAGRYKPRVVPYRDTREHGLFATRSPCRPNPIGLSVVRLLGREHNMLRIAGVDILDGSPLLDIKPYVPSFDAHPSSMAGWLDERREDRTEADSRFHGENGPETAHDGAARHGKTTVKP\n>MGYP002514261527 FL=0\nSRVTRDLPANEVAVGTTCRVLRKIGEKDREYYFRDKKIKL\n>MGYP003501294569 FL=0\nNEEAYELTVKTGKMTYFSRSRNEIWVKGLTSGHFQYLMSMEIDCDNDTLLAKVRQVGAACHTGERSCFYRNLMSREYANTNPLKVFSDVMATILDRKENPKEGSYTNYLFEKGIDKILKKVGEEATEIIIAAKNPDKEEIKYEVADFLYHVMVLMAVKDVTWDEIITELARR\n>MGYP001567805989 
FL=1\nMNATITTIIISFAVLPILVLSYQLGTPSIGESAVGEYLKQPALTTFALAKKQESKEVLPRRRPEIADLVVDSSEALAWDSKQNVTLFSKNSEVTRPIASLTKLITAAVVLDYTQPRETVAVSLKAIRTEGNSGNLKEGEVLTVYDLIAAALLESSNDAAYALAEYTGNKIISNQETPPDPVKTFVRSMNQKFNDLGLVHTNFTDPSGLADKTSFSTAEDFSRFIKYLRDNQRYLPIWEILKMNTYTTESQNGVSAHEFRNTNPFLAELSGVIGGKTGYTPAALGNMALVMSGPNGTEIIYLVLGSADRFGDIRKMVGWVSEAWVWPAPM\n>MGYP003352111790 FL=1\nMREWNLEEIKMNKAQSKENIFLLKGWKGVVVLYTVMIATAAITIGIAQFGGGVLSP\n>MGYP002236981273 FL=0\nDNNRKEINEARRDFENSFFNMLNLLQVKIKDMRVVNKITKEVHAEDVGYSFISLSHSEVKYCKEITLEYLKRIINESWTEWPKQSANNICNIFIAAHRIYLIIIDFCLIHLSLLMSLKLVMLIKKRYANILGRKISNYELLMLFYNCLSEDGRKFQYYFEKYEILDNLPIIKMAYKNHVLLVNKKCWGDNKQALELINGE\n>MGYP001471266083 FL=0\nMNVFCALRSLPHIMSIGILSQKTLFLIMLTSSTNLNFMIKDHPIFLESIRYIRSNLEANDFNYLEKKVLERLVHSSGDFSIQNLVNFSEGACEKGLQALKNGAPILTDTDMAAAAIKSMAENTTRNKVFTASMWFGE\n>MGYP000742235348 FL=0\nMAQATESRSSSSSQPNIQDVFLNYARRERLPVTLHLL\n>MGYP001188259027 FL=0\nEQYGLDHDNFIGSTVQKNNLELDASIVWHATDYLDITLEAANLLNEALVLRQPKAGNIVHSVDEFGTRYFVGASIRF\n>MGYP004019405559 FL=0\nMKLQNYFPYFSLFKFSIYFLISSIYLLDMSVYISVSIIEKIIIDSPKATPYVMELFAISLANSFGLKPIKRIKEK\n>MGYP000810644476 FL=0\nMTVAEDGSVTVADETLTTLRVPQGVAWMAQPVLRSVNGGDAAENRYPMEPNGTVALVPDTVGPTGGLYLYGVPGADLESKTYQWNGSKVTLCAVYTDVNGKKVDASVFTYKKGNTLFFYFPVTIGGEAKEIEITDLDVPTHGQPLDRTATASVGTVTKVRYEMLRKEINEVSKGDNISVGVQVKIPKGFTFADGSYAVWNGQTSEYRIRTSSMGSDEYLYVF\n>MGYP000110014348 FL=0\nLLRKNELSSCIPLAKSIISLGTSGFIMQLTNSLVSICCNHVLSVTGGDVYVSVMTIVSSVRQMVETPIYAINEGTSPILSYNYGAQRPKKVKKAICVLTCMILIYTAITWSVIIFEPEFLIGIFSTDRELLADCVGALKLYFAAFIFMDLQYIGQTVFKSLNKKKQ\n>MGYP000289551974 FL=0\nKRNCAKAGIQQEIRKREHYEKPSVRRKKKAEAARRKNAKK\n>MGYP000993698250 FL=0\nLTVHVDKRPDLESHTMTNLLVEDEKLENLVQETGVPNLFVVPSDTSLAGVEQVLANRIGRETILREALEVFPAGKEFDFVLFDCPPSLGVLSANALVAADFVVIPMQAEYLSLQGMAKLLEVIQLVQKRLNPQLQIACVLPCMLDARTNLSTEVLREIDAHFGSLLAKTRIRNNVKLAEAPSFGRTIFEHAPDSNGARDYEAFGAEFLAMILVLVYVGAVAVLFLFVVMMLDVDFVELRQGMLNYLPVG\n>MGYP002735085997 
FL=0\nEDAFGFVNAECRYPENGANWTEEVFQNYGGTLKWISYNSGVGIPEPEPDITGKCGDNVTWGFVERSGKLTLSGTGATWDYGSYGPEEFKSFRDRVRVIEVKPGVTDLGTSLFVFCENAEKVILHEGLKTIDMFTFQRCDSLTELIVPESVTYIESAAFRDCPSLVSVRLPSHFTRIPDVLL\n>MGYP001200674681 FL=0\nNGWIITIVLINLLGCLWLLWWTRKRPEDTIKEGESLGHSFDGIEELNNPLPHWWLNLFYFTIAFAFIYLTLYPGWGDAKGILGWTSVGQWETEVEKAENRYDRLFEEYAQVPVEQLAGNEEVVKTGQRLFGNNCAICHGSDARGNVGYPNLADDDWLYGGQPENIKTSIVQGRNGIMNPWGDVIGEEGVVASANYVLKLSGRDHDAGQAAE\n>MGYP003380670323 FL=0\nMKKRYXQSAXYGCASRXAHKNYXLIREMVIQYRPSGXWRKGKMVQPHFEXLHQPARFHARETERXXGYRKDPMDRQSLXQFLLLXSIHGKIPXRRXYXISILSDSPTNIMXELLGIRKRXIYLPTGKVNVFCCSWNVPIXKQPYGXTDKRQECRIVFVFPINMIXPIMSVPENVLSLSGWIIVSKKSMSDRIRTAXPTRPKETGTALXDASVCKRLRKHISMIFKYIRNRNKTGTCQSRHQRYRHCKSKIISRELQYGXKHIVPAIQQEIKLNKGVTETEMVLPMGNDMLLWDEFHPALYKLKAEVTNGKKLRXKKYNSVCADLKSKVNGFMXTGAKPSFAEQLKTVTSRXPVTPRWMXKVGNGYSVSVAVMDXITCVSIHSVLPKPLLWLPTGXDSICNPKVRAGPIMVPNXVWDNLLTNIXWTKPSHXPKNMATMLLIACWHAETNLADAGXNGXPSSXNIGKRRIPDMYIPEHRXATDGNGNLATNIMXRLGHVAXPGPRNNRPPKTTIVSKIILTPXDSPTYPMKQVNGALSPISMKYVNIQASIKPRTSRFSKTFWLTTTXATKPIYLXWPAESCKPFVTNMKXKRHSARPIMPVSNYWHXTIIRVRELHWXVFSMFSLKKKDISTLQNGDVSAHLQFHXCVQINLYIITRKFXRRILKSLILVPRHXNKQKLYIRXKTNMAKYMRKAHWQHKTFLSEIXIAQVALSFRLLISKRLKAESGNTHYGNRSCKXLEFLGLSRPSDNSRRKSIHYRHLGFESPGNSSEWWKCAYYSCGQSELWXRSGPAIHSCILEHLLVQNASSSYHRYLSEPQTPVIPSVSDRISQQSAMVGTAESCSSDAIHPLSTRFPTYGSKHRHLVYKPQDRYVIRSQCIKWESAHDKHGHYLPARETHCSPSDAXSHFGLYEFGPVPSAIYCNASTNQXVVHKTAGDIX\n>MGYP001753171793 FL=0\nEMTSSLVGSEMCIRDSDRLLSLLGLARRAGRLSLGNDPVLSSMEEGKAKLVLVCPDLSQRTLKGIESRAEAFGVPLVTIEQTMDQVSMSLGKRCGVLALNDEGFARKALTLTKTNGEDLII\n>MGYP001606986961 FL=0\nMKSQEKNCIIIHGCPSDAEKAMNPETRTYDKHWIPWLKRNLVAARIKTDFPFYMQIVNRWVKIEPAVWNLFYRNNGAKVNFSGQIFQAVQYGLNPETEQIDYDQVATLAQEHRPKVIVAGA\n>MGYP001452258850 FL=0\nMHDKKIVNERLISSTVEITKEAGEAITEIYNSDFDYQLKKDLSPITAADNLSHNIIVERLESLTPEIPILSEENCDIPYKIRTQWTKYWLVDPLDGTKEFIKKNGEFTVNIALIEKDTPVFGVVYAPAIDLLFWGSMQLGAWRKNAQESEKRISISTQTSKKIKIAGSRSHPSEKMKSFLSQFVDYELQPMGSSLKICLVADGTVHLYPRLGPTMEWDTAAAHAILQSAGG\n>MGYP000432580839 
FL=0\nGYAFFGSHRIGESYRTGLDGVYYLTAAGVLAKYRSSTEMLRRLVLSAMKELAARSPLGRIETIMSEKDPKLRRIFESLGFETTARYRSFIKRP\n>MGYP001553361461 FL=0\nGPRHRRRRISEGPQGPHPVIDGRRMTAFCSNDYLGLASHPQLVTALKRGAERYGVGSGAAHLVTGHSGAHHALEQELADFLGRPRALLFSTGYMANLGVISALAGRGDLVLEDRLNHASLLDGATLSRARLIRYAHGDAAALAAALEGDAGGECLVATDGVFSMDGDLAPLPDLARAARERGAWLMVDDAHGLG\n>MGYP000983384177 FL=0\nMKGKILGVNGDGSGGVILGDDNKRYNFTQEEMKNSSNPEVNQSVDFNADGRDAKDVYTVASGLFDVSQLKIPSFSIGDNFQVVILSLLVLFFAFTYYKNSKIEEAFVEFIATQEEYKITFEDYDCSGLFSTDCTLENIEFTTGGVLDFEAESLEISNIYELGTFDQSYRKSKIPFSVEIEGIKFAERIQETYFKSFVNNGGFISAREKELSEEVYNYLIDSLDSDTITLDGKLEVANKKLNRLEIIELSYDNDILPISIDMKVDNLGEEKRIVRNVTLRLSSENLL\n>MGYP003554407810 FL=0\nILCFVTRLLMGLCVGLVYGAMAKACKNATANCFVASLSAPLLNTLFFMGYIVLAFYNCDYVQNLVSVKGAANPLMFVVLLVGVQGVAEFLVSGILGGIVARAVHKFLK\n>MGYP003431497335 FL=1\nMHQQVSLELLEILEIGCSKSNPASAGHLKLKHED\n>MGYP002928876319 FL=0\nALHVMDEANRCLQCKVPQCQKGCPINTNIPMAIRLLKENKLNEAGKMLFENNPLTTGAVSSAIMRTSVKVTVYLDCLLYTSDAADDKA\n>MGYP003442291329 FL=0\nRDNTMNTINAYYEYSIDMQPNMSIGQNYITDIRTSKQTFPNGSTTGARWIQFKIPVAQPENTIGNISDFRSIRFMRMFMTGFSDAVTVRFGALDLVRGDWRRYTNTLDPNDTNPTDDKTHCDESTPPDYGVPEYTAATRPAPVRLEAAH\n>MGYP000852449644 FL=0\nAINFKFSLSPLLDSTKSQVTVFINGIYAGTTKLKTVPGRKMNFKVKIPPQARDRQLLEVAVRYYLDTEQQVNLDCGRRDYDKAWFIIHGDSWLDYKHRDKNVFYLSDLPGPYLLRKKVNLPLFVMPDQPTAADLTALERLSMSMGQLMPKNENWFSVKKASQITKEDLKTNHLIVIGLAERQ\n>MGYP000542208118 FL=0\nHTTAAALPMMRKAGWGRVVNIASAHGLTASPFKGAYVAAKHGIVGMTKVVALETAREPITCNAICPGYVLTPLVEAQIPDTAKEYNMTEEEVVEQVILQRQPSKEFATVEQIGGTAVFLCSDAAAQITGTTISVDGGWTAL\n>MGYP001017409220 FL=0\nACRTTRAITRRSNPRTSRASNKMTSSSMAVFGQVNLMVLVARRSFRQHLLDDELGNIGAVGLLMVHRADRPVAHIANRPAMRFRRAVAAVLGGAGFAAIQPAVQLGQGAGGDHGMHHVLQVGGLLDGERLRVRDRLFAVDQIGRQGLGGADRGGLGRQRHRGYQHLALTDGVGCHGDRVVGRRHGTVEGVEAGVEIHAHAQACGRCGQLTGCEIPGLVHEGGVAGLLEGGAQRDLADELGRIAVVVAEYPAVDLGGL\n>MGYP001607760096 FL=0\nMSDTGTEAPGGATHFTVSKGNLDLFDYTRACEEDRKSPNCK\n>MGYP003410680479 
FL=0\nMKNNLLKYGLFTFSLAFAISCGTPKANLTAIQKDPIAQRVDSVLKLMTLEEKVGQMNQYNGFYDVTGPAPSEGEASKKYENIKKGLVGSMLNIRGAKEVRAMQKIAVEETRLGIPMLFGFDVVHGYKTVSPIPLAEAASWDLEAMKKSAEIAAAEAAAAGLNWTFAPMVDITRD\n>MGYP000424193527 FL=0\nCDSVVISSFVRTGYTTRRTRLIKHVIPPGLLGLVGCQIENVEPVISTFL\n>MGYP001346217960 FL=1\nMGDAFKALADPTRRRILELLAQGDLTAGEIAAHFDMTKPSVSHHLNILRSAALITDERGGQNIVYSVNLTVFQELMKWFYDCGLVKGDDSNEKE\n>MGYP003339884708 FL=0\nMSVSKFRFVSPGVQVAEIDNSQLPRLPSAMGPVIIGRSL\n>MGYP003507622094 FL=0\nVELSADDGDPTEPDHALVWMSASEALSKMRHEAHAWAILHWLRGRRGV\n>MGYP003457963375 FL=0\nRSSETRAALASSGVPRGVYAGKKPEKLLLDPGFVITQANLAEKQEEMWGFTVWKKQNG\n>MGYP002508125824 FL=1\nMRAGCNPGGGIGVPRDNSVSTGSVRVLSRSESSWIWAEKSLSAFTAGSFWSSVSTDTGAGIPEEEREQIFKPFTRVRNLAEGDGLGLPICAFINALGESSVA\n>MGYP003488338009 FL=1\nMDHVWLRNPPRPSGPDRGPPRTLNELHYDQLMLRLKFVEKIEKELGHKGLAAKGSIEEIMSADFNQEFEVEREHVPGKIASCWEVCYWVRTNYGNRHMEVLLTGELLRFSDDVVKLKEKFAKQDSAFAYSGR\n>MGYP003140940673 FL=0\nMSASGPAGQDGGGSKESNKKARKDLEVSAYEREIEKQNKLKSQKQLTT\n>MGYP003132782948 FL=1\nMASAPPTGFVLKAYLTEANARADSNALQVTTNTAYLINKEQDANYNFFTHIEYYFRIEANDPVIEFYIDWDDGENNDPKGKANFSLIKLDTPNNIAITSHIFTRDKLHFPKIRVKSVDGFLSKFYQAAGDDTFEGIDVLAVGDALIDEGRNDRYRLENDKTNAERIPILAPTPRPPVGILKADKKRVFAGITNKYLAGVGGTYDGVTCRLIGSHALMDTTRDNVKVKVTYYAGGADQNDLGNTGSGELIETEMSITTTPTISNVLSVVKMELVDLRENTSENQADIADGTASSFNTSRLFAGEKMILVVDGSSAYQNDTPSVIGEVSMGNPILVLDDPKFSVSLDATESFCRSPEQTIDEYKIWDGDYVTNHGFDENTALFSASSTDTSDIFGAGAGRDTLRAASGIKTTSYAFHPSMTFTDEYHRWLPKQLLAIAQVKSSESAAKAATGTVNDTRATYDHSFVEHWVDESQSNNYGEDRAGIEEYNWPSDMTSSAFFAFKGPSDSDNWHDLNPFNRLTGLDMEHTLFHQTDRASVTGGTRRYANTSTNDLDQVNAQGAYMICARDSKWTKQHFVTKAYSRDTNRTASVGENGPYRAAPITVNGVANKTTANEWSGVSHAAVRVEIFYTARQDGSTNIIWKPLKRIDKTKHPYLSDSTFYSSGAMEWMEPEDWVECDPGDIPDRFWPGGDFESSLEPDTERDSFAYDSDATGNYFDVSNRWNATNKKYGLMWVLTSDGGVDSQHDTFGWGPDVHYSFPASNKNSVLIDIVDPMHVSLNTHAIAQSVSYNHKGKYQIIEDRMGKSEIRKIGATGGTLTFGGVDLKDKDGTFTRDKFYEYQKRAIPVFFDIEHKSRNISRFFGVITDMSEDHPVGKQHGKFGITMQCSHMIYFAGSGSSLGDGSILSDGYVSLGGDMIDEFDYI\n>MGYP000711591066 
FL=1\nMKTNTIITIGRQYGSAGREIGSKVAEAFGIKLYDKEMLARAAKESGICEEIFETHDEKPTNSFLYSLVMDTYSFGYSSAAFADMPINHKIFLAQFDTIRKIASEGPCILVGRCADYALEDNPYAVSVFIKASLDERVQRIKRIYELNDSKAA\n>MGYP003326832321 FL=0\nTIEQVLYRRVYDASDDEVQLRACAPKGYVKSFTVPGFHGPKPLQIRHQILLDYHNSRAGGHPGRAATVDAISKDWWWPGLYEDVKQWIQRCPFCSKEKGISGVSAWTRTELHSRPFRMLQFDTVSAIGGGDSGYKHILTARCPFSRYYWLIPLVGETAEEIAEALVTHVLLGLANFPTILQSDNGLLNQVMTCLMKTFEIEHITSSSYHPQSQGKVERMHGHLNELIKGLVRSEPSNWVKMLPYAQC\n>MGYP001544677532 FL=0\nLLDRDLSLHFRLLLALTGTLGRAVAARPTQRYDYFTTDDTDETGCWRPDAGWNGGRPGS\n>MGYP001464162734 FL=0\nIMFLLRKPSVKILAIDNFSNSKPNFVNNIKKKYKNKFFFKKIDIRDEEKLTNFFFKNSIDVVIHLAGKIDAIDSFKNKDEYRSVNLDSTKKLINISASNNVKRFIFASSAAVYGEVTQGNCSEKKKTNPINPYGKYKLQAEKYIINKKKELNFVILRLFNIAGIDKIFYS\n>MGYP003602224053 FL=0\nYSFLLTKNILMILRRQYGKSQLIFPEAFLFPYALIINRTKHKINLFVRFLVYFFVFVE\n>MGYP000042883827 FL=0\nWKVQIQVLQIVLARAFENQARRALSHHALEPETHLLAPTQIGAGQGIGLAQILGRAVEHDAPALRAGKNEAEPHPFPATMHPVIEAHRAQLLALARRHGMRSIKVFGSMARGAAGPDSDVDLLVEPEPGQSEPVRMFALGALLMDAEELLGRHVDVVTVALLHPLLRGRVLSEARALGVIAAA\n>MGYP001545084500 FL=0\nRMAPAIQDLWMLLSGDRADQIAQLSEVVEGYNEFYDFHPRELNLIEALRALRILYHTAWIARRWDDPAFPRAFSWFNTERFWGEHILELREQCVVLREPPLSLT\n>MGYP000472409418 FL=0\nSGDAMDLIKNFKLHVLALVIVIIAEMIGVLRFGLIMFLPLFYALVIGGIISYPSFKIMKLPEMERASRILTVGMLVLVTKILGIGPNLEMLSHSSLALLVQEFGHFFGTLVFGLPVAFLVGMKREAIGACYSIDREPNIAIIAERYGLDSAEGRGVMGMYICGTVFGALWVSILAGVIAQLGIFHPHSLAMGAGIGSASMMAAEWEMQGGTSVPVSGPYGSRLMETPISSTASIVATHPEWAETVQAYAAAANLLTSVLGIYFALFVSLPVTIKVYDWLDRFRSKKKAA\n>MGYP000294864057 FL=1\nMKHRMKRAAAPLAGIGAVVLVWYMVSRLGLLSAYVLPPPPKVWSSFIKMLVTGELWKDIYISYVRVMKGFSIAFVLAFLLGMVRSLLPASGRYYEFIVQFFRNVPPLSMIPLLILWCGIGEMTKTVIIVLASFFPMYLNIVKGFTGCDRKLMEVGEMFGYSKGRRFLRIVLPYALADILVGMRIGLGYSWRAIIGAEMVAASTGLGHMILFAQQMSRTDKVIVGILVIGIVGYVTDRVFALAISKLLKGSGDNGWD\n>MGYP003498844063 FL=1\nMSNDTTSTRPALTTLSDDEAAFRDAVAAFAEGEVRPRVQAMEREEGAARDLVRSLLERGRGEVLFQVETLTDHVTQNLPRVEIVEQVGQIDIEHVSQNSGRVCRDMVAGFIRWVTFDRKIENFTE\n>MGYP003578506829 
FL=0\nMLMVTPKTLVATTAELIAYAKARPGKLNFPTGLGGAPHLAGLSFAQRAGIDWVYVPTKGGANSVAAMMAGEGDAMFLGMLQSLPHVNAGGLKLIGISAG\n>MGYP002788440824 FL=1\nMSRISLAKNYDYNCELIIIGDSTVGKSSILSIYNNNTNPLKQISTIGIDYIIKDEKINDKLVKVKIWDTSGQERFKSLADNVLKTSHGVILVFDLNNKETYDNLKTWIQFITIKISENIPLLLIGNKSDLEANILYGESIKFADKFNMKYFETSVKNNTNILESINWLVTQTIEKGIIKLIDKNINK\n>MGYP001490688083 FL=0\nVVIRRRVIPAAVAVVRQRAGTTADGEITDRQRVAFNVRRVRQQRRARDRVRPAVLGNGGQRHPTRYRGVVDRGDVHRRGTGDGTIVRNTVRRAVVGDRVAEAHIAVVVIRRRVIPAAVAVVRQRTQTIGNDQVTDRQRVAFNIQRVDQQRRARDRVRPAVFGNGGQRHRRTRRGVVDRGDVHRRGTRDRTVVWSAVRRPIVGDRVAEADIAVVVIRR\n>MGYP001613389359 FL=0\nLEFLLSQVDKMCVGGKIANVFLAAQGILKSELYPADEIAVAKHLLESYSNKIIVPSDIVIGNDDGSYVQTIDAGNIPESVGGVWDIGPKSVAQIQAACEGAKTIIWNGPVGRVEVPAYEQGTKSLVDFLASHSAYRVVGGGDTVNVLEKMKKIDAFNHVSVGGGAMLEFLEGKRMPGLEPLKI\n>MGYP001822186784 FL=0\nAKSEVPGPPKAIPVEKLAPAQTELGLRLVGTVVAYDSRLSRAFIGNRQTRRQKIYSEGDTIDDVLIKKILRNKVIIATKAGDRLLTVRSAASGNSNETYSAAPQVSRASMPQSQSPGRPSNSARVRHISLDRQEVEDSLANVDQVLQELTLTPYMRFQKPAGFRISNLSRNSIFNKMGLSSRDVIMGINDQKITSPDQAAEFLQTLAEGDEVTIKARRRLRTRRIILSIQ\n>MGYP001418701337 FL=0\nVKPLMSSSGKGQSLIKNDSDIQKSWDYAMEGSRGDLMEIIIEEFIDFDYEITLLTLTQKNHNTLFCPPIGHRQERGDYQESWQPIDMREEHLKMAQEMALQVTESLGGNGIWGVEFFIKENKVYFSELSPRPHDTGMVTLAGTQNFSEFELHARAVLGLPIPEIKLMKNGASAVVLANNISVEQPKFSGLEEAMNVTDSDLRIFGKPTTRPFRRMAVTLTYGKEDVDSLVERAKELAA\n>MGYP001258882498 FL=1\nMADAFFVCVVFCSAGAGAPHDWPGHQARRAGPRALLQNGGDARRHRGRQREAPRRGHQLRGEVLRGQAQAGGHGKLILFKSSRMCALRWRPASRCLERESNNSEQQ\n>MGYP002553949049 FL=0\nTESTKCVIALIDEIPDRITLDESVIAKVEAARKAYDAITDLTQKSLTRNFGKLTGAETNIERLRAGQQSSSSDSSSSAQSKSAPVALFIVLGVLLVSCAAAAVVFVLRKKKNK\n>MGYP000347212883 FL=0\nNRIVLRNYGSSPPTLQIWLLLSHLASHCPIHTHTHTHTHNTYMHVTMYMYVSMSMSMSMSMSMSMSMYMNVYMHMYMYVSVSVSVYVCVYVYVYVYECVYAYVYVCVCVCACACGCACLCLCLCLCLCLSRVCVYVYHICICVCVCVCVCGSIFLCLSLSTAFPACV\n>MGYP003507787529 FL=1\nMSEQSTHDAYEAKAKSTFSAERKEDYFVLAVAAITVALVLSGVIGPNFFKSLFF\n>MGYP000959777104 
FL=0\nKEAKDARRLERAVFRSRPVERDEAEWVEADDPEDALAPLFTWVGPDLPEHIGPDCDPEEDMLCAVGSNLLVIANYKVGKTTQVFGMCYRLAGAPTPWLGVFATPQPLTVAYFDFELLASQHKRWRRRASDALGVRHDEDVQSRFRSLPLRSASAPNPATKAGRKALVRVWLAYQPDVAVLEPATAWVEGDGNSAEVVIAWTRGLDLAKGKYDRARMRAWEEAGAVGVPPPPLTCVISLHTPKSVKPGEETAIGSGRWMGWADE\n>MGYP000823295119 FL=0\nKIADFLAGMYPETIDRSLLLTGTLLHDMAKAQEFVFSQLGLATDYSIKGQLLGHLVMGAQDAAETAARLGVPEEKSVLLQHLILSHHGEPEFGAAVRPLCAEAELLSYIDLIDSRMEIYAETLPAVPAGSFSARIFALEKKIYHHN\n>MGYP000922530624 FL=0\nMSPTTVRRPIRPAALLRSVLR\n>MGYP000535681885 FL=0\nVWLKDYELPGVGDFLGRPPGYLMGSDLDRAYAHCRRIAKKHAKNFYYAFRTLPREKRRAIYAAYAFCRHCDDIADEELSHEEKMRLFADTRRRLSQAQNGSAQDPVFMALGHAAKAFGIPSEYFEQIIEGVEMDLTKARFQDFDELRTYCYHVASVVGLVCIEVFEYE\n>MGYP003610816290 FL=0\nCCSMSPSVHSIWSPPCILAPRFLAPARLGALVGXDFPLGMPLDDVFFDLVTVWAP\n>MGYP001477694372 FL=0\nMPRGGTAGKAQESNRRLGSVRGATRAKTPPPCAYAQTSQITIKVEGKFVSRGSREQA\n>MGYP000729372693 FL=0\nLLGTLCGDPRATSGRIVFDDKDITDWQTAKIMREAVAIVPEGRRVFSRMTVEENLAMGGFFAERDQFQERIKWVYELFPRLHERRVQRAGTMSGGEQQMLAIGRALMSNPRLLLLDEPSLGLAPIIIQQIFDTIEQLREQGMTIFLVEQNANQALKLADRGYVLENGHVVLSDTALDKLESIPGFDIFPDDNRFREIIKDVGVAIIGQTSSLAPADKRFYATRDITATVDSIPLITASILAKKLAEGLDALVMDVKVGSGAFMPTYELSEALAEAIVGVANGAGVRTTALLTDMNQVLASSAGNAVEVREA\n>MGYP003294174267 FL=0\nPQIDQRFVNFGVVAAEDAGVGRGLVKTDKNNIAPRLGIAWRLTDSSVLRGGYGIYYPTSAAQGMRDAFAANAFNQRITKSSTTATPLGGLPGGVNPRGVTPFSGGSVVVQGVAINAIRFDLQSPRIEQFNVTFEQEVKWNTGVRVSFVGSRQHNLIAGIDLNMLAPNDTPFGVHNADGDLCTPGDDCEESAADSARRPFPAL\n>MGYP002514170153 FL=0\nLKSARIYREEQMKNLEIKNPERHTERLMNAMQRELRLDRQPRHIECFDNSNLQGTNPVASCVVFRDGKPSRKEYRHFNVKTVVGPDDFASMREIVYRRYSRLLEEKAELPDLIIVDGGKGQLSSAYEVLCALGIENQVPIVGLAKRLEEVYYPNDPMPYYLSRTGEPLKVICHLRDEAHRFGITFHRQKRSKNFIVSELESIEGVGPKSIEALLRRFRSVSKIRAASVEELAEVVGPKRAELIEQWRSKS\n>MGYP000515275479 
FL=0\nMASRVKINNIKELEKRKNSTHPSLVNIRKILSLLKNPQKNLGITIGITGTNGKGSVAKTLSTILNDSNLKTGLYTSPHLYSINERISIGKKNIPTKELNQILTEIFETEIKANIKLSFFELITVVAIIFLSKKKNIFNIFEVGLGGRFDATNVIDSDISIITNIGKDHKEYLGNTLLKIAKEKIGIIKKDSFFITGMKPYPFYRVKDYILKKTKKIYIFKKDFQIENNKEFYKYENLTFKPSLKGSHQIENMALVLKTCSIIKNNLGFNLKNQNIVDSLESVKWEGRFSILSSSPYKIVDVAHNYEAIKVLVQNVKKITSKKFIVILGMLNDKDPIKCINELLNIANKIILFKVNNQRTFIPEKIAKKINNKKVVLGKSEELGALIEKDINTLYCGSIYFIGDLLKKYKNLRSC\n>MGYP000931687007 FL=0\nMKNYLNEKYNDLDSVAKLHCKSYITADPYPHIVFDNFFNDVMLNEILNEFPSELDKVGSKYNTNQERKSFSNNPDQLSPKINNFLNFTNSHKFINFINILSGIERSLIPDPYLFGGGLHELKDGGFLNIHCDFNKHPQMNLDRRINALIYLNHDWQEKYGGALELWDKNMKNCVQKIQPIFNRMVIFNTTNFSFHGNPEKVTLADKSKSRKSIALYYYSNGRPANEVSSKDHSTLWQNRPNTSDT\n>MGYP001385379217 FL=0\nINLILIYQIFIYLLKNKYWTFIENDATNYHYLHLLYRNSVLEVAKHIIEGCKAEDQKCCKQLYSMFKDKMYGVCLRYAESEHDANDIFQEGFIKVFRDISSFRGEGSFEGWMRRLFVNTSLHFLKQKRKSGFVFEDDFSQYDNADELDDSIEISENRQNLLIDLMQKLPSGYRTVLNLYIMEDYSHVDIANQLGISVSTSKTQLMRAKKMMKLMVESALIKN\n>MGYP001196022355 FL=0\nMLHAPVLHREAVIPNLATQRGFRRRVAVVDFPWSDRERVRGDAHALLVRISGKALRVVRAGPDRHALALRALLVLVVDRLVVEEVADLHLAAVPRAPAIFVVAVVVPTRSLGDGSPLFCIRFALQVAVRLLPRVVPGPGKTERPAYHVRVGVRVLVDPVAPGVDRVRRQARAQLKRGLGVGGLGAFYLVLCALRFEPEALFKA\n>MGYP003389695985 FL=0\nDEIQYRVWEMTPHLELPGSDHRSPGPRTPNPNRRQVRVPPATQSSHGQHAPGGQMGXIPPAHPRLLPARFQWCQKYSTGTALNRRLVGVX\n>MGYP000014734933 FL=1\nLGRYGVRTIGELSKCSEEMLETLMGKMGSQLYRYANGLDDSPVRGAADREPIKSVGNSTTFRRDLTRWDEVQSGISLLSDSVAMRLRRYGLYCGGVQAGIKNSRFQVFSRQTTLDHSTHLMREINDTALRLTKDLWKQSQARALCVFQHSGCYRHRSLQVPGCASQVGGHNFGGRGHGPFFISILFIQHRVSGSVHHHGTLSAGGRQRPHRHQQKQT\n>MGYP000109000080 FL=0\nNVFYQDMGFSKTDIANAVKLVGVIMVIAGGFLGGILAQKLRMMQAMMVGAILACVTNLLFVLLTYHPGSLPHMYVAVIFDNLAAGLASAVFIAFLSALTSIRFSAVQYAIFSSLMTLLPKVMGGYSGAIVDNMGYPFFFIFTFAIGMPILILIYLVDKHIVIGDNDDIYGDNDKLTKANPNLTDTSEPPRASE\n>MGYP003723858749 FL=0\nARGESQRTGQRSREEIQQEAGQGLRCEDHSACAGTRQGQGSCAANLRQRQGPLQSVFRCHVVKEAA\n>MGYP001454151373 FL=1\nVSEDDGVDKIDRVVSNGEANTVVITVVVSST\n>MGYP003345151193 FL=0\nDLRVRCLVACCSWRGDECESAVWRVAVIATPFQSLGDHVVE\n>MGYP004046731215 
FL=0\nMSADPFXIXSGTLLLAAXSIGSQAFRLRLRFIMPKRTSKTSGRATRKTSPIPASPGPLFPSTPERRSSPKRSRSKSSPRSPPRREVRRRVTFADGTEGEGDASHSTSDESVVNNSD\n>MGYP003232878591 FL=0\nMSTLFCVARAPHCSASVPHEARIAPPRLLEESIEGAHGALINIAGPSDLKLQEAAAATQLVGKAIHPEAQIIWGLSLDDAYGDEVRVTVIAAGFDANSKKAAQAEAQKQAEPAESTVPLSALSAAPRA\n>MGYP002780757469 FL=1\nMRESSFIRQNFDKWKYIETRLELKKGENPDELASLYIQLTDDLSYAKTFYPKSKVTDYLNDLTGLAYANLYKNKREKSNRFITFWKSELPLLYFKYQKTLALAFFVLIISFVFGYLSAAFNEDFVRGILGDRYVNMTIENIESGDPMGVYGKSEPFEMFITITGNNIYVSFLTFIWGGVNFGFPVFIFLSGGSIFSLLYNGIVLGAFMRFFYDYSLTTTASSALWIHGVFELTAITIAAAAGIIMGNGILLPGTRTRIESFAIAAKDGLKILLGLIPFFIVAGFLEGFVTRHYKNELVAWFIIILSLVFVIWYFVIYPINVKKNYGSTE\n>MGYP003421169975 FL=0\nASNLALLVRSLYKHWSSIKSSIWFDLFSRLVNDIYDQKIGIKKAWEYIQNIKNAIPSKYPLDETSNNSDSNKAGYAKVLDDYNWSIRSNINIDNFGWTIEKIVNDMSYWTLPYQYIIPQLFKNDIYVSYKINKINNEYTNDFKIYDGKTKTFNIINIFNGTVVDWLDLAVKEIKDVWAKNQVPIVVGGTGMYIDNLING\n>MGYP002515247338 FL=0\nLSRIVVELSPATPADRMPQMWDELRRKVQNVQNELPEGASAISVGDDFGDLYGIYYGLKGDDGIDNEELREWAQEIKRRVVTVDGVQKVVLYGEQQPVVNVYVSMARLSNFSIRPESIIAAMSGQNRVVDSGEKLAGEMQIRILESGTYRTLDDIANQLLTSSDGKQFRLGDVARIEREVIEPPTSIMRIDGDRAIGIGIATDPSRDVVRSGRAVAEQLRQLSSQMPLGMEIVTLYPEDEIAREANNQFIINLLESVAIVVAVIMLVMGLRQGVVIGSSLLLAIGGTMLIMLVVGEGLNRTSLAGFIIAMGMLVDNAIVVTDNAQRGVAQGVDLQTSFISGANRPMWGLLGATLIAMISFLPLYLAPSSVAESIKPLFVVISLSLLLSWVLSLTQVP\n>MGYP000642399635 FL=0\nDAPLAEEIAEELGAELVPVEPSAGAQRVPVPLFYPVLFDRLSIRRRDK\n>MGYP001211563207 FL=0\nMSSSSIVNKKIPVTVLTGFLGSGKTTLLNHI\n>MGYP001099929414 FL=1\nPVDPNKSANKTVLLLIKGLLTINSTNRFFFRRKYIFQPTDLRLFFYMLIGTIIYIST\n>MGYP003481454472 FL=0\nVVLNSQTKRAELTVEGADMVGFVFFAPSPRHLSLETARELGRQAKGRAAKVALSVDADDATLENIVETLQPDLLQLHGKETIARVRDIKAKFGLPVMKVIAVETSADLAVLPGYASVADRILFDARAPKGATRPGGLGAVFDWNALAKLELDLPYLVSGGLTADNLAEAVRVTRAGGIDVSSGVESAPGIKDPEMIRNFIRAARASE\n>MGYP003404440343 FL=0\nPGLTAHEEEPTASIDRIVEPGRQLPQLALPPDKHITGTAGSDVILALVHGPIVPTCAPARIPR\n>MGYP003306851604 
FL=0\nIKIPANRGAGCCLGGNSYLTVTGCRNLLISGISTTVNGAVLISVPTNLGTGCCLSFNRYLVMACCRDLHIGSISTLGAVLIGIPADFGTACGLCLYNSQAMAGCGDCFIRGVITAGTSNILLPAIFGTGCCLTLMGLVIMTQLCLFDIGGVITVCTVLIGFPADFGTGGSLCLY\n>MGYP001507408964 FL=0\nPELCIAGVKEGDSGLYWCEAAPEGGQGQKTSPPRELCGRGWGAEGWKQSLQSPPRKEATGLTALPTLTPKQ\n>MGYP000892867995 FL=0\nGSAPRMRRLHELGFAVLGIDYRGFGRSEGSALPSEAMAYEDARAAWDWLKRDAEKTGAPEAGAVRRFVFGHSLGGAIAVDLAAQVEDDASGLIVEGSFTSLRELLATFKWGWLPVGPLLTQRFEAAARIAQVRAPVLVVHGSDDHLVPPTLGRALYERAPGRKRFLLVEGGSHHDSSARGLDEYRVAVRELFGVAAVE\n>MGYP001570592810 FL=0\nKLEMITTENAPTIAPHINPNVTITDGNVLTIKQNAVPLPHTEGWSAASGAISPYLIDMCFDKNGNMYFVCRFSWASMGNLDGTQDGDMAGIHKMAPDGTITYKWWYYSDPSIEPTKGEAGIWSGTSWDNAFNLSTAIWCEGNDIYLGCGDHGTANCLKISISDTSDILSTKVLRLNRAAAAGSVDGPYSAPVKGVSVEGDSATTCPPIAKIRSFSNGDICMVIGARN\n>MGYP000867335061 FL=0\nMDPVRRDVLAMGAAATAVAATSPAAFAQDGAAASFFEKDGVRIRYGIVRQLGSFNLLWAVFHEWIGIARDVWRAPWRAKLPYMFAPPGWSHDGSRDTSDSIRARWQERQEAVPAE\n>MGYP000426411893 FL=1\nMQSSVFYFPHCRNETEVESKLIVDFLLPRLGYTPHTWHQEVAFGHIRLDFLVFAVNRAPLRLADNQPVSLVIEAKSPQHGLDRFEGKLREYLTKLRIGHGVLTNGKDFRVYGRDKDSVRLLFRCPGEAIEQSLPQIRELIGREALITLSSSEPVLLDPVQEVDDLPSLRVVPIPASTEGIPETQGLSNVSSLEYSVIREDSSMIIIAIYHNKGGVGKTTTTVNLSATLSKMGYRVLLVDLDSQANSTFAVGLMKFPDEIDDDIKKSYVYHVILEKNQFSIPEVARKSSFCNPEFDVIPSHIDLMTHEFELKEGGSGITKYRLLKKLEEVQNSYDVVLIDTPPSLNLFAEIALITADYLLIPSDLKPFANEGLNNVRRFIDDINEDREDRGKTTLEVLGILPSKIATHARFVEHTLPKMEKTVEERYGYKLLNSRIYERRDASAAIEKTIVVGDLDIPDPQSVLDFKPDSASALEFKRLAEEIISLTGL\n>MGYP000549342313 FL=1\nMLKNIIWRDIEVVITLSLIHIS\n>MGYP001554259151 FL=0\nPFWSKVRQVSIDSDQESQRELFLFEDMSSQNEMFEKVQRLSQAVEQSSNSVVITDIDGIIEYVNRTFIKTTGYSSNEVIGRNLSFLSPDQAASSVYEEMWTAVRAGKEWAGELINKKKNSELYEENVVVSPIRNEQNEITHIITTKENITDLKKARQQADSANKAKSQFLANMSHEIRTPMNAII\n>MGYP001144722731 FL=1\nMCYWNCPLASRLFRKSKASWRVAPAWSRWQLQLPWPIFIASQPTRAVPWLVV\n>MGYP001076062122 FL=0\nMSKRLILFVAVAVMLLSSAGIVTFLSAQEGEIPAGAPQDSPGNAPAGGEPLETQYAPDRIYRTGSPDVWRVSTGDGILLSRDSGRTWENRGTGLPARAVWPFDKPRPPIVTGLSVDPAHTDRVGLTTLDPLYLSEDAGGTWEKVELKDPLKANDQLTCIALSPLQPASLLIGTSFHGFFETR\n>MGYP001119048589 
FL=1\nMKQNIITKKDFDINKDRDVKNFLLNFGPQHPAAHGVLRLVLELNGEVVLKADPHIGLLHRGTEKLLEYKTYSQGLPYVDRLDYVSMMAQEHAFAYVVESFFNKKVPKRASYIRVIFLEITRILNHLLALTTHALDVGAMTPFLWAFEEREKLMEFYERVSGARMHANYIRPGGVAQDIPVGLLDDIFKFIKQFGSRIDELEELLTGNRIWKQRLVDVGIVSAEEALAWGFTGVMLRGSGIPWDLRKKESYEIYDELSFEIPIGSKGDCYDRYLIRIEEMRQSLKILEQCLDKIPETGNYKIFDFKLVSPPRALIKFDMHALIHHFKFFSEGYSLPKGESYVGVEAPKGEFGLFLVSVGSNKPYRFRIRAPGFFHLQSLNQMSYKHMIADVVTIVGTQDIVFGEIDR\n>MGYP000170037481 FL=1\nSGPLFVFHGIEKTFAEDEVLRKVDLSLYPTKCILLTGKNGSGKTTLLKIVAGLEKPEKAEIEISGKLHCWKKVMPIIRKEIIYLHQQAFLFSGTVESNVAYGLRFTSLTREKRRESLKKALEWSGLTDMAKQEANTLSGGVQQRVAFTRAQIMKPKVLLLDEPMANMDHESREQTYQLLVRMKLAGMSLVITSHFMQYFEGIVDQHFQLKNGALELKSKS\n>MGYP001203790631 FL=0\nMIKNFKQLILFHRLKPFMNFEESIAEVHAISMSIKWCRPGALLGLFASPIRSYLLAAKPYIE\n>MGYP001549860555 FL=0\nLSLEGKSGPAAQSARAFARNFAKRSDIPIALVDERFSTAAVTRTLLEADSSRKRRAEVVDKMAAAYILQGALDLVRGLKLELANLKEADIVACPPFTALSEVSKATLDSNIRLGAQNMSEHNVGAYTGEIAAVMLKEFSVRYVILGHSERRQYQKESNELIAKKAPEVHVDALRPIVCVGESMAEREQ\n>MGYP002065815634 FL=0\nVAYRQPLYLLRTAVEWDVVQDRVMAYSLPMVEATMHMPFRVAEYTDFYASRHHATNVGTMFRGPENALPPNWLHIPIGYNGRASSVVVSGTDIRRPWGQLKGAEYDAPIFAPSRHRRTVQNASIPSRSSRSSVLRVPLSRNHAVR\n>MGYP001354736308 FL=0\nQKKKKMGIRNVSPIYTPAAARTKPPHRLAPLNDSSSSTGAFNGLKPLGKISIDSPWDAFGKPKSITAVEKKK\n>MGYP003506483410 FL=0\nXSPLLPKXATSNGHNHDNKQWFYQFATELDGSVGTKVRAEHQAKSHGNAQLVVNVT\n>MGYP001354348586 FL=0\nDTGTGIHAAAGAAAGWGGEARINWALLQLQNNLWRYAFGNVLAARVRAMAMNWVQFQEGLSMAEFMARYGSEAKCRRALCRARWPKGFRCPACGDRRHSTFQRGGQTYYQCRACGHQTTLLSGTLLQATKLPLTTWFLAMHLLTSTKTNMAALELKRHLGVCYRTAWRLKHKIMQAMATREETRRLDGFVQIDGAYLGGERNGGKAGRGSEDKQAFVVAVETDETLEHPRYAVIEPVSTFSNATITAWAQRRLA\n>MGYP003378432903 FL=0\nMGSRKKKNGKFLSENNNNCDYEGFTKVLSKRRIIVTIYFYLEVQ\n>MGYP001118074481 FL=1\nVNCPLCSPSRASLLTGQYAVTHGYTVNAAVNAVPDERLPIYQHTLRGAGYRTGHVGKWHKDSYVEPRPGFDYWVTYHGQGVHTDPQLRVKQYDAPVRTVNETGFTTNVLTEYALDFLDDYGTGGDRTEPFALTLSFKAVHGPHGDQYTQSGGAYAGQTIDRPPNAR\n>MGYP001597331187 FL=0\nMWLSLAGLVETLRGGCGACSLGCGILLLPYGPHILRQCLELLNFISIHVSDVVRLWARELALSSLRHPMQMEVGEIGIERGGFCSQ\n>MGYP001567613541 
FL=1\nMDNNNKWYISSTGSGLSLTIKGVLVGIVPLIAGLARTYGYDLTEGELFNFIEAGFQAVSLSMVVFGLARKLFFKFKPL\n>MGYP000114959871 FL=0\nMRPVLASARALSQNPHESSFPSTNGNCGFVGQYFDRKDLTDLRLSRLDSRIAFDWGNGSPDRRIEPDTFSVRWTGRIVPRYTEVYTLSTVSDDGVRLWVDGALVIDNWTDHAQTENSASVELAAGRHPIRLDFYEKTGGASIRLEWEGPGIGRQIVPRTVLAPSNADEKAEGLLGTYYQGGPGESIFAWTDENDDGRVQPPEVRTGTITFEGAPWRQVAATWQTRMNDRFEIAFSDGEYGRAGIAFFNVRGFNRRGYPLYELPKSFVPIPGLAHASDAVMRDRAGNAISLDEYVVSVSPDGRILWRYKNRWPGLHAGHYTTAAGDEPGVLIATTRFLGSAVVNETLGEVIAILSNLGATYLFTADGLYIDRVFQDCRQGLSWSFNAPPSDELLKRVSLGDEHFGGTFQKVKTADGSFRCRYVVSPGSPHNSVVELHGLENVIRLEGGSFEVTAEHLSRAEHLRQRRTLAATEPRRLIVR\n>MGYP002866891791 FL=0\nTSIDTMITRHHQKGDAASVAVYTACESYRYLLTRTWDASGPRALFVMLNPSTATEVQNDPTVERCERRSRALGFGAFRVTNIFAFRATDPKVMRAQTDPTGPANDDTIVGSAIDWIRGGDDRVICAWGTHGAHLDRGPAVEALLRQTDRPLWHLGLSKAGHPKHPLYIAYDQQPQLWRTT\n>MGYP000706738672 FL=0\nMSSKFYTKATTLALLTGGGTSAAALAWFPLRQNSKDTDDNVDSPFSDEGLEAGMLLLEHAQDVPGLLPIAFLVSAIVKSSEHSGHSDATRFARLIETLEILLLQASSLPLPFLAQLTTVLEQAEV\n>MGYP000526671817 FL=0\nMTKQKSIMTNGIIMKFKNNNTMRNIFYSLIFIFVIWVLMQPRPTNDIVTYHNDYRIDSNYLTPIEPLTESVNTMSVIPKQKENAVDLYIKRYSKTAIEEMRLYGIPASIT\n>MGYP001798615877 FL=0\nMNQDRTVSFKNGHSGYTNCDFTILDIYDCDFTILDMYDCDFTFLDMYDCDFTI\n>MGYP003125760673 FL=0\nMKQRKLKVRKGHWAYTLKSQPYSGNRITPFLLLKGTWLEQAGFNIDTPVSVSVEDGRLSIIRDHTRXEPRPGHRPGHSVLXQIRGMX\n>MGYP001490802382 FL=0\nMPLHLNVQQSNSSAAVKKLWFVPEVLMFIMQIVYISDTFSLLISNFYYFWAVLCT\n>MGYP003141655914 FL=0\nVDGVKNEGLLQPDNVTEPKKINIPRSVAGTHTDGNIHTYLINSALDIGPPDGLGFPVFYNNQIPIREEHITVIKKGPKNILNLDLDTGRDSDISTYINQQKTIKVAIRSDLNGNQDFNLLGWESYKGKTVVLKEFENDTAPSIPIADYRIKGIITDWHNFQNPELISDTGLQDISYPDGDSTGIIEIEILPTAVQGLPPLAPSGETLNYAIDLFDEEEKLFEFKFPRFSYRYKYEDGE\n>MGYP000069741418 
FL=0\nREAPPAEAPPAPETPAPRREKAATAREVAVQTAAVAAEIEEKMATGEDAYRFPPVTLLHENREENHVEAGAELRNNSRRLAETLTSFGVDASPGDVVHGPAVTRYEFVLDQGVKLSKITNLADDIALALGATGVRIAPIPDKISVVGIEVPNKQVTPVLIRDVIESRDFTEHKSHVAFALGRDIGGRNVIGNIEKLPHVLIAGTTGSGKSVCTNSLIISLLYKSTPDEVRFIMVDPKMVELAPYNGIPHLLIPVVTDPKKAAGALQWAVFEMMKRYKTFSEHGVKKLEEFNRLARATEGMETLPAVVVVIDELADLMLVAAKEVEESICRVAQMGRAAGVHLVIATQRPSADVITGLMKANIPSRIAFAVASSLESRIILDTTGAEKLVGKGDMLYAPLGAGKPTRVQGCFISPEEIEDVVACVKQSGEAQYSDEVIAKIEESIQEKEKGGKGASAASADPGEDEGDELLPAAVDVVLETGQASVSMLQRRLKLGYSRAARLVDQMEERGIVGPFEGSKPRQLLITRAQWQEQQMGGAPDAGEPPFPVEGDEGL\n>MGYP000844791533 FL=0\nPRRTFIDFSENDKVASRRDSPLDRALSESESEVTTIRARSIIAAPKGDSAEPMSNFSREAPRKVVTKPAPSPAATPAPPVLVATPAAPYEAVRPVRPFEDFKEFSSPPLVVPKTVVRPIPVETVVVPEPTPAPAPEIATSVANIETTTVKSEPREGFIKSIAPATLTFVRTGYYSAKYRKFDDRMKNEASMLGLGAARGIETSWGSFEARAAVDIYHAMDQSMTIDNIRMMSVRTEVAYWLSHSRVKPGLSLGLGWADYSIRSYRSISGANEDIVTLRTHAKGKAFSIIPATSLRIEVADSDTSQLVVDVQTEFVALLGGESPDAAQGLG\n>MGYP000545153660 FL=1\nMSADPHVVYVTVPEMLDAARIAREVVSARLAACANIMPNIQSVYHWDGEVCLSDEVVIVFKTTGDRVVELTHMVVDEHPDEVPCVTSWPITDGNPEYLKWVRDEATGQPQG\n>MGYP000168519987 FL=0\nMASITIPYAVADFIEMRERGFYYVDKTQYIAKLEDYKAPVFLRPRRFGKSLLVSTLACYYDRTKAHRFEELFGDTWIGNHPTKEHNRYMIIRYDFSAMVMSDHIQGLAQNFNDLNCGPVEVMVAHNRDLFGDFEFSNRGDASKMLEEVLTYARSHELPKVYILIDEYDNFTNTILSTYGTEFYRKATHGEGFIRGFFNVIKSATTGTGAALERLFITGVSPVTMDDVTSGFNIGTNITNDSWFNDLVGFSEKELREMLTYYKEQGVLQESIDEIVAMMKPNYDNYCFSRSRLVDCMFNSDMVLYFMKSFVLHGEKPEEIVDPNIRTDFNKLAYLIKLDHGLGENFSVIKEIAEQGEITTDIVTHFSALE\n>MGYP000057883855 FL=0\nKNLLKPGDHGTTYGGNPFCSVLQLIRCFEMIGARPHHRPCERNHTISWKKNYDELVASYDFLTARRGLWTDAGLWYPKSRSDRSLQMALEEGLIVITAGSERTPFCTTAHHRETTCG\n>MGYP003384944733 FL=0\nMPVYRYYVPHAIVFLTQTVANRAPIFREPRWVDLLRATLHRVQERHPFRMRGYVFSPDHFHLLIQPTPPETHSSVMHSLKRAFTLAYKQATGIPGSLQFWQRSFYDHLIRDERDFEQHLHYIHFNPVKHGLVARPEDWPDSSLAAWKARGAYPEMWRWSLEERAAA\n>MGYP002790362313 FL=0\nGKWQSVWRLDLNTEGLLLFTNSGELANQLMHPRFGVEREYAVRVLGTLEPDARKKLLEGVKIDGQPASFKSIEDGG\n>MGYP001259587854 
FL=1\nMLTNRIAKLLSVLLLLTLASACGGGGGGGNDDSSSPPETINLGQFYDGDLSSKNSETWSFSAAANTFISVELYGARLDQTSWNTPLNAPIVKLLNSNGSTILAHNITDSAGDLTSYWYFGYRDTEIPLYYLTDAGDYSIEVSKKTTNSGAPYKIRVNNENKSILAQFGSAQEETEPRGLGTNNILASAETILRDGPGTDEIIFGLFEDDDPDTYAIDIAADTTTPAVISCFEIISQRLGILTPQTGQSYPDLELTLYDTTDTKVNFVDDFYFTDPKVCRKITNTDTANDTYKIQVTETTGASNPTTDAYYFLKYTEEKILN\n>MGYP000577366278 FL=0\nMPWEIGDIVRQVKKQVKIPLGIHAHNDSGCAV\n>MGYP002519074643 FL=1\nMQTAVFTRETSVAMPSDMFAARNSGILSAAAVIAAETGVPVFELDMIMHGSSYFDSMYRNIDTLKGALG\n>MGYP002064227981 FL=0\nLLRRAAISRPEIGDADRRAGCRLRQRRHRIHQHVRCLVDDVLGAQLDAVGKSHLADGHDPPIADRHVANQRFRARTVVDRAALKQQILKAVPSIPDLVRPAWASASTFRGSDKRGGANGARIRLEPQASWDVNVRSGVGEVVAKLDAADLVARRRMRPVRRLRRWSPTSITGDDAGLMALPVAAAAVSSDCSPLPPAIAPDRRSVTIGRAPWIAGVSGLASQATTRPAAHTANSATSSGSRCRSGSMSTSAAKELADLGYTNVVELDGGMRAWSA\n>MGYP000874961551 FL=1\nMISKISNDFPVFDFKKDARYLGFFDFSCPEGPIFSWSGCSIQTNFNGTGIYAKIIDKNMTGNSWISVIIDYKESDPINIKPDKDMYVIAKGLKNEAHNLEIHKRTEALLGQLQFCGFELSSGGRFLTPPSEKARKIEIIGDSITCGAGNEGVYSGDDAEFLGKEENNYMSYGPIAARILDADIAMVSISGSGCYQNYGGAKENTIGDLYLKTNLSTSYDEWNLKKWTPDVVVVNLGTNDFSAEIDTDKFKEKYKRLIKHIRNKYSKAAIFCSIGPMNLQPGKYIDSVVNELKIEGDSSIFYCEFDPIDLKDEGLGWGTHPTIKTHEKMAKKLANEIKLRLCW\n>MGYP000873909662 FL=0\nIYYLETGANQRGSTVVYDRAASSVALAAAEEYDFRSALGGVARVHVTGITPAISENGFLATRALLRLASQQGAKVSCDLNFRKKLWRWRKGVPPGELARQCMTELLPMVDLVIGNEADAEDVLGIKAEGTEVERGRVSAEAYVEVARGIAERFPNVSRVAITLRESVSASHNNWGAMLFDARSASAHFAPLDGQGRYRPYEIRNIVDRVGAGDSFAAGLLYALDSEKYAAPADAVRLINKGALVIDVRDPAAFATGHIVNAKNVPLAEIESGTEVAKKKNKVLVTVCDRG\n>MGYP001229117954 FL=0\nNREAKLPPRQELFECNLAVAADIELGHDQVLLLRLQLVPHVPAQQLQLVGVERDHVHAVGAVRLVGVALAEGADVDPPQAPRPLDRARAFPGREFGPPLEDLEAAWVVAVADFLRPARDSLGIGEALNGRDRERDRRQRAPAALRKEVVTPSADLLDSEVLVAWSAELPDLTLLRA\n>MGYP003486854474 FL=0\nALGLSGERAGRIDANLAEHRLRDRTLAEEAVQDAFLRVVRHRQRFDPARRFAPWFYTMLFNLCADHWRKAARYAARLKAFVPEIDTVQFAHNFRCHGTHPWLAHKMAETDRISAVX\n>MGYP000004611563 FL=0\nSDSPASASQVAGTTVAHHHAWLSFVFLVEMRFHHVGQAGLELLTSCDPPTSTSHSAGITGVSHCA\n>MGYP000261681696 
FL=1\nMDFEQFYQDKYPAGVPRNVDLDKYTSMVDVFDQAVKKFAERPAFSAVGATLTYKDLDTQSRNFAAWIQNRTDLKPGDRIAVQMPNVSQYPVIVFGAMRAGLIVVNTNPLYTTREMEHQFNDSGAKAIVVLANMANNVEKVLPHTGIEHVIVTEIADMHSPLKRTVMNAAVKHLKKMVPAYNLPQAHKLPAVLSAGSKEKFSPVECKKDDIAVLQYTGGTTGTETECTRFRPYDRGYHFNALLLIDNIFHSAKDFLHLLG\n>MGYP000082023964 FL=0\nPFVPRRMPDGSGYELMMLEPELAPPLEDAETTARWIERCLAGSEPVPASLKIQMACCLVATGESASLAEGLARVEQSF\n>MGYP000378578682 FL=0\nMEKMRFSISSSPHIRQSQTVQSIMRDVVIALIPTAIYGVIQFGYQAALVMLSGVAGAVLTEFVGNKLTGRPVTVTDFSAIITGLLLAMCCPAYVPLWVPFIGSVFAIAIGKLPFGGLGQNFLNPALVGRAFLLASWPALMTHWAPADAVSAATPLAAYKATGAMASYGDLFFGNIPGCIGEVSKLCILIGAAYLLLRHVITLATPIGYLGGLALMIFAFGGQDGLFTGDALFAILSGGAMFGAFFMCTDYVTSPVTQKGQFIMGLGAGILTALIRTFGGYAEGVTYAILFMNVVTPLIDRFVHPKLYGEADRKSVV\n>MGYP002628574471 FL=1\nMKINFHHPAPEKTPRIWRSLRELENDPEFEKHLHTEFPRGADVYQDSGLSKRDFIKLMGASIALAGVGLTGCRRPESYLVPFTKGVEFTIPGKFLYYATSMPARFGAIPLVATTSDGRPTKLEGNPLHPFSNGGTDTFAQAETLNLYDPHRSKQITENGKPSSREAFDAYVASVAQSDGSNLAILTEPSSSPTRARLRAALQTKFPKLVWAEYDPLAPTAANAANEASFGSSVRLVPQFSRADVILAIDSDFLNPIETGIGYAQGFSARRNPEQKGASMNRLYAVENHYTVTGGMADHRLRCKISETGEFARQLGLALAAATNNAALAEVANAFPASQTSIDPAWIKECAADLAKNAGSSIVLAGPMTPAPVQVLVNAINNALGNIGSTLLPVKADLVPAASIEDLAAAIDKGNVKTLFLMGVNPVYNAPANLGFKELLSKVPDTVHLGFFEDETGTASRWHVPAAHFLESWGDCRTFDGTYTSVQPMILPLWNGVSEIEVLNILSGATAPEGPSLVRETFNAIAPQATAESWNAFLRDGFLPESAFQQIQPTFNAATASGLAKKGAPAKADALELVFLQSSSVDDGRYANNSWLLETPDFVTKVTWDNVLMVSPATAVRLGIKTNNFGLLGDVAEKMGNDVNYDLIGDIVELSDGKSTIEAAAIVAPGHADDSLSIALGYGRKGVSALMDGVGFDAYPLRSSNSMRFLDGVTIKVTDRNYPIAQTQEHRSMEGRDLVREGSLERYAKDNAFAQTMGMDSHIPPNISLYTHPELNAKDQWGMTVDLNTCTGCNACVVACQAENNVPVVGKDQVRKNRDMAWIRLDRYFAGDSSDPEMLSHAIMCQHCENAPCETVCPVNATVHSEDGLNLMAYNRCIGTRYCANNCPWKVRRFNYFDYNQRPIDELYWGPLAKKGMADSLKMSKNPNVTVRMRGVMEKCTFCIQRIEEAKISRLVEAGPTPASDTPIAPFKVACQQACPNDSIVFGNIADPKSQVSRMRKDPRGYVMFKYLNVSPRVTYLARIRNPNPKMPGADLVGMANGSGHHGDAHGEHADQGHVDSHSDHHTEPAAH\n>MGYP000967004213 FL=0\nSSEGALPGNGRFFAVTRPALVDALDAQGGEHPT\n>MGYP003580660516 FL=0\nMPIINRNIESPINILIIFLFITVSFYSNHKKSRHSGGNDGLRSNSIDSEFXDQSPSSIPGSFTALX\n>MGYP003382547724 
FL=0\nMRWVRFRENEDRVIRKSMLCEAVIRRKKRRMMPPFSTIFDQNAVTGITSRPRQRSGMVNLPCGRKSVTIAILLLVSWLNSLAGDAFADDVQSRRQGSFAAGGTDGKILQQHEASFQASDDGQENGSWQKAEFKAETKVTSLPQQPASFRSLLSGTPDFLNYDAP\n>MGYP000595587323 FL=0\nNVTATDPATGAVVSSATQVVDAERVLGNVAVVSHPGTKGPRLEPALYAFDDWTITGEGVAHHPGQTFGPIACAQHTLSRGVLKMTAQFLPMDDNAPSGVDLQVNQGGQWVTVDTAELDTLSWTAGFRVPDWDDTVDQDCSGADLTDVDGDQYDAEAAGGGDCDDDDPEVHPGAIDIEGDGVDSDCDGVDGRGGGDDTGGGDDTGGGDD\n>MGYP000311212580 FL=1\nMLTGVDQAKAVRALLPELPAENFIIEPLRRDTAAAMALAAGSIARRNPHATAVVLPADHHIPSTIDFQKTLHCAVQAAETSGSIVTVAIKPDWPCPGFGYLELGDPVERESGAVYPVVRFHEKPSAETASEYLAQGNFRWNAGMFVWSVPVLCEALQKTAPALFDFYTGLKQASDAVEFLNANFESVPKVSFDYAVMEKLSGVLAVEAGFAWDDLGGWAAAGKYFPSDQHGNSGNTAIQSIDARNNIVFSKEPNQHVALLGVENLIVVNTGDALLVCPRGQAERLKELVAGLPSDLQ\n>MGYP000202157561 FL=0\nAQVRTLGCVGDCVAQASELIDQSALQRLIAAPYASLTDLIDLFRGLVAIGGDLGDEILVAGVDHRLQDFTDARIEELHAKHIFCVLNRRRQALAYLGGELGHQALAVGLGALPGSLRGQLGGQQRRADENADEAEGDDAAEDAEHDQQQRQAAAAADQVGLDEVVDAADHQQAPGGHEDGPAHRTLGQQPQRGPTPHQRRPHRHHGQQEGGRGQGWRAGYAGHQEADQGHQGLGQRRAEDAVHHAGDGAGDGGQQLVGQAAGQLVQDGARGQDQLVTVAVEEEGDEGRESELQQAAAQGLAA\n>MGYP000361399541 FL=0\nMGAPPALCGRAADRPALRPSTFGLPLRRVPGLAPAAQRSPSRLSPALHTQRAARCLRVAVPVTGLAAARRRSAALHAPVHDPDAVRDAQRLLGEVHAQKLRELSVERADLLRCQHGADALAGPDAPAPAAVRVRHRVIVREGLDVADAAFRQIADEGGVEARGHGEADVRLELRRVVALDQRLGPLDDVAAERDPVEGRDHDVPTGAQLRADLTQRRRPIEPVPALTRADHVEALGAKRDLLGAPEHIIDPQPRLRIEAARRREQRLRDVQADDPAAVAGEAARHDPGPGPQVQDRLAAGADSLVGEAAEQGVWEPDPVLPVVLCGAIKVDLHVCLPVQCPALFNALPCSAPCLRGTAYQRGAVSVRGQRLLQGDVRLDAAQRLRLARHAARQLRRHAREDAAAAQKLDGADDAQELGHRGLVQHLGAGEVEDDPQRPQLDDLLEQPRRHVAGALGVEPTDDREGERALPDLDHRRRQEQQLLLFRGQRLQLPIEPLFIRDAVVGRAGHAGGVAEHHDVGRAEGVRLRAGEPVGADAADIAQDRDEEARADAQAAAGAALRAPFGVGLDVRDVQELRVAHHPAGVS\n>MGYP003362107572 
FL=0\nMSLFSKKTTQQPIPEEQRVEQAYLAGMTTLRDLIAPSSLEIFSNYFRLGTKFGRTLYVYGYPRQVHTGWLSPLINIDEILDISMFIYPVDTQIVLNNLRKKVTQLEATMNINTEKGRVRDPGLETALQDAEELRDQLQIGAEKFFRYGLYITIYADSMDELNFVQHKIETIFGQQLVFSKVASSQQEQGLNSTIPQLTDELQIRRNMNTGAISTSFPFTSADLTDGKGVLYGINMHNNGLVIFDRFSLENANMVVFAKSGAGKSFTVKLEALRSMMTGSDIVIIDPENEYQKLCEAVGGSYIRLSLNSDTRINPFDLPRVIDTEEADDALRANLVTLHGLLR\n>MGYP001412591253 FL=1\nMTRISLPFAPQVRSGIPKSPCHSNVVYECVCEKKITVSLICAGGKEGFASPAAEPQSPVPLSHTPRPVASTLTCFPPLPLGPAHGRKDRL\n>MGYP001520358773 FL=0\nIFANEYPNEFIGEAGTINGPNNIRKRKNKVPGALYIAITSLYLK\n>MGYP002525796693 FL=0\nMNKKLITLLVALLSGSAAFPQVHKMERKDSSAVDRTYNLNPVVVTGSGHHQRLKSTATPVHVLSNQEISEQGISTFDGALTRMMPQISMSPNSMGTFLRLNGLGNKYILILINGQKLSGDISNNVDLNRINMSRVKRIEVLDGAASSLYGSDAIAGVINIITDQPTQNLISVTSDTRVSGHGQLTENVTLDIYKNGFGSYTSFSHDRADSYRHNDLEYVKGSDTETQQTIAPFFTGYRSNVIGQKFTYAPIEQLALNAGLDYSYKITDRPETRQDITGGTDYEMRYKGFRWNVGGIYKFTAKNSLQANFTVDRFRYGKQYDVKTKDYAVGDYVQSKKQMMMDGELKAILGLTKNSTTIFGADWRKDYLTATSGNIEENVYSLAAYAQHEHKLFKDFTATLGLRLTHHE\n>MGYP001301746093 FL=0\nMTQEVQITRDQVLEQLREVYDPEIPVNVVDLGLIYDVQVSGKNEGFVQMTLTAAGCGMGPYIAQQAEWSISELEGVEE\n>MGYP004005692463 FL=0\nGVAAHGPSRVVRDPEQASGVERALVVRLGGVHDILVAELFEHRLAAQYHQDLTLARRRPEHRFAVLFLDLDHFKVVNDSLGHHVGDRLLVEVARRLRTCVRPGDTIARLGGDEFIILLTDLAESADVDRVTARVQEVFEAPFNVASHEVQTSASVGVAAGELSYTRAEELLRDADTAMYRAKALGRSRTEQFEASMRVKALARLGTEIGIRQGLDDDQFVVHYQPIVSLGTRKILSFEALVRWEHPEAGLVGPDQFIQVAEETG\n>MGYP001224191517 FL=0\nLNYVGHLRGYHDITESTNIDLGASYSYGHNPAGVINDIDIGRFTTKLFGVDATLRWRPLTRAIYHQFVGRSAVIWSHRQQFGGPQDRLGYYVPGDYQFARRWFAGGRFDHSDRVDDSAIVETGGSAVLTYWPSEFSQVRGQYRRTSYAEGVVANEFLFQFLFSIGAHGAHTF\n>MGYP001086061371 FL=0\nAAYGAVFTIRALQQNTEDEPQPGHAFSFVTALKFALVLAAILLASAALREWFGETGVILAAAVAGFVDAHSAAISIAALVASGKMDAADAVMPILAGFTTNTISKMVFAGTSGGYGFALRVIPGLILVAVAAWAGAGTTRIGR\n>MGYP000610080798 FL=0\nMSIGGLTKDKLSNFDKLSQPRD\n>MGYP001730562506 FL=0\nLNVLHHSSVKYFISFPSIQDFEIIILKSVKKSTIILTISGKNRFSFCAFHPDILIEK\n>MGYP000961376923 
FL=1\nMKHHVENQCDEPRVSVVILNWNGRKLLEQFLPLVLEHTLGDEFRVVVADNGSTDDSVEFLQTLFPEVPLILLDENHGFAEGYNRALEQVRSEYVVLLNSDVETTPNWLQPLVDFMDNHPEVAAVQPKLLSYHQRDHFEYAGAAGGFIDRYGYPFCRGRILEEVEEDRGQYDTVIPLFWATGACLMIRKSDFVENGGLDGRFFAHMEEIDLCWRLNARGRKVMCVPSSTVYHVGGASLDKENPKKMYLNFRNNLLMLYKNVPRTRYFTTFAVRYFMDLLAFVHLVMKGNFKNARAVVKAYVDYWKMRPSYKQVRRENLAKTLIEIPTQYPKSILMRFYTGKKTYQSLYSK\n>MGYP003987264985 FL=1\nMEDIKKAIIKAKGEGNKHLVQRLQQELDALQEISNNLDWPRYEKVIRKLEDKPDMEDFPDGPKKNNS\n>MGYP001575371671 FL=0\nEESALDTLPGLAALCNALSPKLVSGAVELGAEGTA\n>MGYP002783228703 FL=1\nMSDEIGRLDIMVEAEANRANRALGGMEKRLNRIADSLEKVTALTAGINGFDKFDLKGLESFRKELDSVFKSSSKKSVKVDDSDLKYAKKSMDELQRQYKNAKLEVNISTIGEEELKKFINQTERRYRKLKQTLADTIELNGSDMVGGKAWYKANMQLMQYENALDDATEALGRMKSMRDRIPEITIDRGETYNNDTDIPEYPKIVEIGNCEQYDASEIEEYINNFAGARKEANTFEAQIKSLKSELSDLASQGFSQYDPEYDSVARELAEVTIAQKQYNKELRESARESLGISNSERSAEAMKKASKQAGVFKRTIDGIKSSAKNINALKRNFDNVSKSIRSAIKLSKSALHPIRSLKQVISGDGGNRKGMSWGRMIGSSVLFSFVFQGINAIQKAIKEGSDNLVKYSAEYNYSISSMLSSLLYLKNAFAAAFSPIVNVVSPYISQFIDMMASAANAVGQFMAALTGKGFAVQAKKAWKDYAAGLDTTKDSAGDAAKAIKDLQNYTLRIDELNVLQPNDNSSSGSGSGGSGSGGADISPSDMFETVEVSNSMSKLAEMFKEAIANSDFTEIGRMISNKLSDELESIDWQSIYKKADNFGKDLATFLNGLITPRLFYNLGKTIANSINTAFHSANAFAINFDWSNLGDSLASSVKGFFENWDAKLTGETFSNFVKGVLESITSFVNSLNSNDTFEDIGQKFVDLLCGVDWAGLTWDMGKFFKALSDAMTDFPKDFSKGVAESILEHMFDSEFSDGMKQKFNDSIQPLNDIWDYLFSSLNPAINAFKIMDFVRETVSSKGQNILDFLSDCWESIKIIFSPVVKWFKDTFSGAYEAIKSPFEFIASWFGEKWTAIKGVFDKDKVRNFFKSAFKAALDAVKNIWDGIGDYFKKIANHIISPIGKAVNGIIKGINWVLDKVGSKKPPLDLWEIPKFARGAAGLPEDTIGIVNDQKGSVYKELIVPPDGKPFIPEGRNVMLPLQKGTKIMPADETKALMSAFPHFAGGIGDFFGNAWAKFKDFTGNVLDYITHPNKIVQIALDKFVDISNMAEPISSIAKGTVDTVFDGIVDYIKGIFDSETTVKYNPTAGVEQWRSLATKALQMTGQFTESNLSRMLMQMQTESGGNPNAINNWDINAKNGTPSKGLMQVIDPTFRAYAYPGYNANIYDPLSNMLAAIRYTVSRYGSLAKGWKGHGYASGIGKINFADFLPQLAGGGAVKSGQMFIAREKGPELVANYGNKSFVMNNDQIVQSVSNGVEAAFERQNARTNALLQQIAECQKMLIHKDTSVNIDGKKADKQLSKARKNSGYSFSPA\n>MGYP000278592768 FL=0\nRPPRSTLFPYTTLFRSRKVMAYNDQVMMCEITFEKGAKGNFHTHPHIQTTYIVKGSFAFTIDGETQVVNAGDSILMPSNSLHGCECLEAGVLCDVFTPMREDFIKK\n>MGYP000014633898 
FL=1\nMSDGKKILITGGAGYLGSVMTPLFLHAGHSVTVLDNFMWRQSSLAAVCHHPRFELINGDARTESTMKPLVNEADIAIPLAALVGAPLCDKDPIAATSTNLDAVRMMLDMLSKDQWVLLPNTNSGYGVGEGCCVGKLGVPSREPAPSVGTCGGRGRRARKMKPVPTSRATMKLMKAIW\n>MGYP001266816030 FL=0\nMEHYGKKLKFRPLNYVFILL\n>MGYP000960759586 FL=1\nMRVDPVTQTTMARMMDHAVLNPAMTENDIRRAAAMCRARGVGNLCVRPTDAALAASLLKGSATTVAVVVGFPHGASRSEVKALEARLAIGDGASELDMVMNIGKFLSGDYEYVKRDIEAVVAVAKPQGVLVKVIQESCLLTLDQVAKACELTIAAGADFVKTSTGFNGDGATVEQVEVMLKTCAGRTKVKPSGGIRDWERAAMFVRMGVDRLGVSSTDKILDGAPTEDGC\n>MGYP001420375246 FL=0\nPEQLAGVLSIVARQSAAAKGQPYDEEADTAIRAAVEQQIEAESLPVFLSGRLYDDGVIDPRDTRTVLGLCLSAVHSAPVEGVHGGFGVFRM\n>MGYP003296810821 FL=0\nCQGYFTEERGDCYGGNFNIVKVIIESPIAPTSCEGLFQGLTACKVIEGIEKLDTSRATSMEDMFASCFKLYNPDVSGFDTSNVTDMSGMFTSCHAITKLDLSNFDTSKVTDMSKMFVACHGLATELNLSSFIFCYF\n>MGYP002731676114 FL=0\nNTKALRQKILDLAIHGKLVPQDPNDEPASVLLERIRAEIVEGVTTEATNALGEKVQMDFAANRTSLPMDLRAAEVQENAIQENQNPKKFVVHSGANENRKTLDSKKNL\n>MGYP000800539561 FL=0\nMKNICIGLFEGETLPESLAAFKDVKLDLEFGKVTTIYTLHQLDCEKVVVVGLGDGKKNIKEAFSKVEADDYLAYVTENTAYAAGFGLVYAVSYTHLRAHETDS\n>MGYP000365574991 FL=1\nMNEATYISELGEAIYPHLNKPDVKFNENGEYKVILKVSQGRATKMVAQFEKAMQDSISKAESELKGKTVKVAPSPYSEEGGFVNFKFKMKATGVNRKTKEPFSQRPALFDAKKNPLNPTSCNIWGGSKIKVAYQLRPYHTPLIGAGVTAILKAVQVIDLVEGKQMNLFSKEDGYENTTSPEEMNNVPETEVQTSTDF\n>MGYP001556904936 FL=0\nSLTEILITVFLGFIGFVAFIGFVAFIGFDRLLGVFRPLLSATLQPSYHPCITLGL\n>MGYP004044994415 FL=0\nFSGSGFLGENKKFKIIKPILRLKATKKKIIIDKYSFKKSASILYVYLYSTFFYTYRREIDAK\n>MGYP000469735265 FL=1\nMFHVNLICKRCAKTVSYTHLRAHETG\n>MGYP000883239672 FL=1\nNPEAIKKHKGIIANPNCATIIGLVAVNPLHKAAGIRRITGQAIADI\n>MGYP003386468952 FL=0\nKLLSTNALDGIELPPKGEQIPKALYSVEEIEKF\n>MGYP001795370918 FL=0\nMIGIVLYLELKLISEANKSSNIVFELLMSASQISIWAYMLQGTYPTATNIIHLSQLVMVDRGKGSQ\n>MGYP000051665382 FL=0\nMTDPAALAREYYRTIDADEYDALADLLAPEFVHARPDRTLSGRDRFVAFTRDERPMTETTHVVETVYDVGPGDSGSVAVRGRLLDADGAELFAFVDVFTVRDCHLTRVETYVSAGTETG\n>MGYP001510798038 
FL=0\nMVKFKYSKAWWGKTSYKIIGLHEQLDQELLNFITTIQNQESSTVTALENSVDLLISSLNSCIAKVGLNQGTIANYESNSFYTDKDVYALANISELFYQQHEDNKDVYDAICEAEQNLKAVSYTHLRAHETV\n>MGYP003638701188 FL=1\nMAKRLPEFLPHKYQEDVIQEMEDAGVLALLLDPGLGKTSIVLEYFRRQMDCMAATRMLVVAPLRTCWGVWPQEVQKWKGFKHLKVHVAHGKTGKDAALCNDADIVVINPEGLTWLEGEMKAKRIERFDVLAVDESTLFKSGSSLRTKTLFRIAHKHQGGIPNRFILTGTPAPNGVEDLFGQFAILDPDVLGKTLTAFRTNFRFSASKRPWGMVWAPSVHTAQLVQDAIRTHSVRLEATDHLDLPDLIQVQREVVLPKGVMDLYKELQAEMLVNLDGNTSVVAVNPAVLSAKCRQVANGAVYVDDNGEAGDSSARRIEYLHQAKVKELAQLFDELGQKPLLVAYEFRHDLKQIRNHMKASYKLDVPFIGGGSSGEETAQAIDDWNAGNLPMLLVNPASAAHGLNLQSGGSHLCWYAMTWNLEHYQQLNARLWRQGQREAVIVHHLLAKDTVDLVVWEAVQRKDATQRDLLLGLKRSKS\n>MGYP001045944336 FL=0\nLVWRSYRPYAVGQSRRDATPPCPSSKNHDELLPSSTRNPKRDELLHPSSRNPMVCA\n>MGYP003142759631 FL=1\nMKKARNIKNKKHNQIVNDYDKIKSRHLEKLANKILKDEERRDNLRSKDIKGDFLKNF\n>MGYP001277206801 FL=0\nVAAGLAGGLLDEHIAYVTSDESFRTPFARGYVVVEQLPYREKALKAALRERGVGRLAIKKRGVDVIPDQLRKRLDLRGDAEATIVLTRARGHGIALLVQPF\n>MGYP000667709688 FL=0\nACTDITGFGLIGHGLEMAVASQVGLVIQSGAVPVFPEALDYAKIGLVPGGAHSNRQFFSCKVEVHPGVPDLLLDIFYDPQTSGGLFISLPRDGAETLVQRLKDRGHVNTAIIGEVVPEPKGKIRIF\n>MGYP001758919174 FL=0\nRDSVASRGLGDVYKRQEVVKDE\n>MGYP003402598952 FL=1\nMRHGNKNNALGRKKAHRDALLSNLAISLIDHKRIETTLAKAKALRLYVEPLITKSKDDTTHSRRVIFSELQNKEATAALFRDVAPKVASRPGGYTRIIKLGNRLGDAAEMAMIELVDFNTTYTKEKSAGAAKKTRRTRRATAKPTTAKTDGGDEAKSE\n>MGYP002859056165 FL=1\nMANKIMKFFHEEFGNVRGRYIGGECRFAGKDVAQALGYKDTKSALADHVFDDYKQVFNAKTIRQMASQSKGGETPPLETTSPRGMIYIKEPGLYQLIFSSKMPKAIKFQRWVFEEILPKMRREALREEARAEGKRVRRELTDVIKSFIEYLTARGELDRAEVAWYSAFSNLVNKMTATNDKRDNLLMLPLLRLSDCEDILTDAIEEGMAEGKGHHDIWLACQGKLDAWRQLTK\n>MGYP003351460330 FL=0\nMAGQMDTMPGERAGRREQNKAENRAALLKAARSVFAEIGYNAAGVRDIVRRTDLASGTFYNYLDRKSTRLNSSHVSESRM\n>MGYP001464310971 FL=0\nQALDVLLLRAGEDGAGGDGHFQERAGLVRVDVLEGLHGDLAGFGALGHDVHNLAAHQALGSHALAHVHDDPQGAFGGHGLGSLAADVLERVAEQRVAREDGHLLTIYLVVGGLASAEVVVVHGRKVVVDEGHGVNHLERARGGHGDIHSPAHEFAGGDAEAGADALA\n>MGYP001323269287 
FL=0\nVGDRGGGTSSPSPSAPPPMAISPRSTARGDPGEEPGTVSHRLTPGTAAPLISPRTDPAPRRGRGRSAAGAGGVGEPEEYGYPCGGAGGVGEPAKCMGIPLEGNAGAERMINPPAKVLARRRTGLCRTPPVGIYLNPVQKVHYYWLQIISCNG\n>MGYP003154234093 FL=0\nDDPIEGSYEALEQISKKYTIIIFTTKAKSDRGLVNGKTGTELVWDWLKKHDMAQFVSKVTAEKPRAVAYIDDKAVRFENWKDALENVL\n>MGYP001373085551 FL=1\nFCIHTTGSAFDDLRKLIESGGGYTPAWKGRIRGKETAIVPVTMYTYFIIGLAEKPLFMGQVELAKRLGMENDFILANLIKAQDQWIIDIKGNSSLYGSFINNSSRNEKDILIQWLEKT\n>MGYP001489405527 FL=0\nVTASSAVPVVFDPVVVENYAACSAGLPSWLEAARSRQSMDANLRMVVADDAAYADKTGHRYAHFVDGGITDNLGLRALLETVEVIGGAQEYVAQLGMQPPRRIAVISVNAAADPRQGIDASRQQPTIGQTLDAVTNIQLQRYNTDTLQEMQQSLQRWSKALSTPQWQVQNYFIRLSFEGVPDLPLRRFL\n>MGYP002718885158 FL=1\nMSLILPNSKGKSTLVNMIDTPGHVNFVDEVASVARLVDGVVVVVDVVEGVMHGTEAVIRHAMQEKLKIVLVVNKMDRLILELRLPPSEAFFKIKHTIEEVNSFIA\n>MGYP003566853254 FL=1\nMKYIGVKRKKNRGNRYKFVVDIHVNGVRYFFGNYDDPKEAAKAYDLLVIRKGLDRPTNFFKKKLV\n>MGYP001092313238 FL=0\nTYYKVMNNLASRTDEELVVLYSKGNNEAFDILLNRYKNRIYSYIYYIVKDRELTEDIFQETFVKVITTIKQGRYVETGKFPSWISRIAHNLIIDYYRQEKSENHLSNDEMNPDVFNRKELSEGTIEDSLVQTQIQADIRKLVAALPDNQKEVLIMRYYKNMSFKEIADATNVSINTALGRMRYAILNMRKMAEDHHIELSL\n>MGYP001474034502 FL=0\nAKAALELVQAKDFKGLVALARKHADSIAEKALDASQSFEAQVLAQKERLQTLARAAEAPAIPPRAMIPTDAKEPADESIRLAGKFDELGAVVPRGVLRVVSAERVAIPSDHSGRLELADWIIDPQAGAGRLTARVLVNRLWHHSFGRGIVRTVDNFGRTGEAPSHPEL\n>MGYP000079457881 FL=0\nMSSTSRDASAVVAGPALEAVAAELEAQGPLAVLSWAFETFGPGVAIATGFGVEGAALIDMAARVNPRPFVFFVDTGFHFEETLALRTRIERRYRIEIRAVEPDLTPDEQADAYGVRLWHYDPDFCCSLRKVEPLERFLAGRDAWVTAIRRDQTAARATARTVEWDA\n>MGYP001330772963 FL=1\nMQVPEDIGVNEINIFLLLPSPIMLIGLTGRNASGKSTLVEWFSEKGMNSYSCSDSIRAWLREQDKEITRDTLIEGGRELRRQGGGGILAEMLIEILDGEDAVIDSIRTPAEVSVLRSRGDFFLIEVKASEEVRWSRLQERARPGDPTEKNIFLEQENKEIKAKDSAGQDLDATAKMSDFQIFNDGSVENLYTKLDDLWEKLHNSKN\n>MGYP002627366002 FL=0\nMTNQVRPESMKRITTTELAQAFIDEQIIELKKQVGNGKVLLALSGGVDSSVAAVLLNKAIGKNLTCVFVDH\n>MGYP003117035852 
FL=1\nMSLLRNSVIVGGATFLVGSAFMEIGKADSKSDIGKWPYVATFLSGALGFYLLKQNVIPVPKALELNADYTDSDLSHFGKPLEDDEKFTTMQVRIGSPSGSTTSWTTAFNLQCVGDDDNLTYFTGLLEDSVRDRVRKWNGDELGDFIPMQIVIGSPSGSTTSWYRAFTVQPVDVDEENLYYLSGEIQDLLVDKAKWWNGHEVIYDAEIEYDGAKSYARSLDSKFDGANDEGYFPVDEDDFSEMVVDEIGEHTTLDAESFDADSLKGRWEEGTTRIVHGVSVTKSRYGEYEKPQYRASYNGYSCRIFYEGVAFYLPCWMYHGYGGVGRGGCFKNPMEAILDFKRRAEGGFQQISHRKDFDADTSLLQSFAAEVFMADRKIRRRTRWTWTRGNEKGFEIENDDLSELPYNIDYTAYTGRGYYRNSQPMYSIDEAYYISDLPEGYHLHLYKPSVRSGEWRAFSKSPTSEDWNEYRNYKKSNLTGDLLNWYNQDIAQPEEKTLSPIEKLMISKGMKSGTVQIERVVIPKTNYTPEKVQYFALGGPTNMSPTKFCEIEGGVIALENLRYEDEPNLFAFGQGLKFMTEKAGTLRSVNRFNKNPEAWVKSYPAWFQNAVKNKLTDIDVQFKFYQEHDGGIRINNIRVLKFLNGVDRLSWRPINESERKMMDTPYGEMPQFEIYELDMSDPAPITPRPSTMRKIYGKSFKQNLNGEWKFDKDMFMMAVVDKYKFENGGSERVHKSMVDEPLYSIDIIPYMTPMAELMARRYKKKE\n>MGYP002788159078 FL=0\nTQTLIRDTARGFAERVLAPQATKLDREGGFPVESLAQAAELGLLGIAVPEELGGVEAGQQLAFLDLHAF\n>MGYP001798696378 FL=0\nMLTGGEMAVSVITIQTKDIKAETKETHPNHYQKTNLXCHWSXKWRHAVKKTSCCMX\n>MGYP001406754757 FL=0\nMRPLGSMCAIEYPAIPLPVFFLLEMMIPSSFDWSFTNRIILKFFWLRFGPIGARPPALVLRSLLAAPGDDVDRVGSPNVSSSPCP\n>MGYP000997370353 FL=0\nFECGICKYLEHVDYRDLFLFRFGLVYRLWWFSQVESLVTDLHDVFGLDPGSLALAQSLRRAERLLSGTVLWAIGEGLQFASVVALIVSFGLGLSATIHFLNRLRLENTPDTTAEAAVEKATVLVGPALILTTVVLACGLVVTVFSDLPSLRLFGWLSAFSMVAALVADLFILRPTSMWLIGMAQKIRGRGADGKAI\n>MGYP002214501719 FL=0\nIIIHVIFDKNSRANDVYKKQISSTTITTTATKKKKILVTTGIDSTSLFYNQGKGGNSGTSGYIAILAAIDAL\n>MGYP000390568609 FL=0\nPISCFLPCVCFLCVFFFGGGVGGGSSILLAKKLISLKFAII\n>MGYP000957035233 FL=0\nMSPLAAASPARPAIEPRGVVIAVRGSVVDARFPRHLPALRQQLHAGRDRSVVIEVSDHLAADTVRGIALTPTQGLARGDPVQDCGGSLTVPVGPELLGRMINVFGQTIDEGPALADGERRSIHQPPIPLAQRRVGLEMFETGIKVIDLLCPLERGGKAGLFGGAGVGKTVVITELIHNMVGRYQGVSLFCGIGERCREAEELYREMREAGVLLSTDGPFDNVLKIKPPLAFGKPEADMLLAALADAAPVEAELLRG\n>MGYP003548451047 FL=0\nVARAMGGAVFLLMIAAGSAFDLVTQNAALSIGLGVTRETLFRVALGCGLAGLVLLTYAFVRSRLRNQSNDAQLAELEDEYADLLDRKNSSSEND\n>MGYP001276729923 FL=0\nAFAALSLQSPPQRQTLESIPESMNECVHESMDDSVNE\n>MGYP002536854477 
FL=0\nMADKIRVLLSEDEVNKRISEVAAQISRDYQGKEIHLICILKGASFFTCELAKRITVPVEVEFMSVSSYGSGTESSGIVKIVQDLSTSIEGKNVIVVEDIIDTGRTLSYLLENLKTRSPKSVRLCTLLDKPERRVVDVKVDYVGFEIPDEFVV\n>MGYP000601791154 FL=0\nMPALRHMSQTYALCANTSLHRRSWLVRSNTAGLLKRTAPERKKSNGAVPPKRSTSSKNTLLTRVLLGRFPMRPVPQSASSCGLASWTGQYFPSCSPRVCLGASCPRFSVTFIIEHFYLSMACQIDRVKNRRPFPARETRKTLLDRTSASVLWSS\n>MGYP000636477196 FL=0\nMNTLNVKLSHSISQLYETLCQVGKSTFAELQRATNLKTRSPVWLYARSCTTTKYIRHVSAIPFITLLNNVLHRKFDLTKPDHRIKQANQRVRDKSCGRITAGTILPFPNRDARIVPSNKGTSGVSHWLPFHKAILAIDVSVKTPSRMIKISSASPF\n>MGYP000562867999 FL=0\nNSFFYGWAFGFGYFFSNLYWISISLTFDSNFKFLIPFSLFLIPAFLALFYGFISFLFFKINLRSTLTSFFLLTLLFSIFEFLRGHILTGFPWNLIAFSFSNYPKFLSIISLIGTYGFNTICISLFLIPGLLYLRNSYINRFVCGIFFLILIFFNVYGNYYSNIFLNLKKIKLDYQIRAIASNFEIKKFYNNFSTEEIIKELIDISNPSTTTKKTLFLWPESIIPGVTKEQFQNQNVGSSINYFLLMLNIYALSV\n>MGYP003365983449 FL=0\nMLVAVAPLARMLFIALLEPASIAWLTSTALGGQLGVLCWG\n>MGYP001155155630 FL=0\nMLMVNHALSLVAECRAEARAVFMVFSFCFLELYVVCVRACASRGWLLSSPLGIGNE\n>MGYP001568236931 FL=0\nMISSQAGQQSSPVEWVSAPELGESMFYMVQRTPDAELLLTPNEAFFPKLGLNAGGEGEFPLEKPELNQNKNFKWISGWDPGDAAEWGLWVEKPGSLKVSVAMDGAEGSYLLSLSGEEKKLSGKVVSFNVRKPGMHVLRITCRADADAEKLHALKLSGSAVENAGLLRKRWRPSAAHARFSSSANPKDVRLVIIEMDAKPGTLGFYAPITTPFGYYGPTWKADGLVNTGFNFSLWSYGRGKEEPPVERLSHLIAIGDPTAEFSGFGHEGTGVKIRGW\n>MGYP001201323188 FL=1\nMYTTFTQITPAINLRRRRTLSAAGTVMVRLGQKVSADDVIAEAVIPTRHELVDVVRLLGLSKRKTADTLIQRKIGDTLAEQDIIAETGGLFSRVIRTPAPGKIISIRDGQVLIETETRKVQVLAIYSGVIDEIIANRGAVINTTGSIIQGAWGNGKIAVGPLLCKAETSSSNLTQADLEITARGSIIASASCSEEKLFDLAAQLPIAGLILGSMPAALIEKALAQPYAVMLIEGFGKSGMNSAAFKYLSMYNNHEITLNAGVDNETTEHQIEALISAAVEGEIGRGQSRVTSGQTVRIHTAPFLGQSGTIEKVLPGLTLLPNGLRVCAASVIMDNKDRKTIPVNNLDGIGFTQSNLG\n>MGYP000016403168 FL=0\nLQTVEQIALMLPLCSDLKYRFHYIGNSFIALDCFCAFY\n>MGYP001020068561 
FL=0\nDFVKVCRHAGIAAEAGVQLFFQELAHIQIHIAARRRGLPPQDPAPRRAHQFAGSFMAEPHPTSAEEDLELLRASAVTAGIIAAGYFRRDLKSWTKEFGSPVSEADIVLDKFLHSALTTARPDYGWLSEESVDNADRLGRNRVFIVDPIDGTRGFIRGEDSWTVSLAVVENGIAVAGVVYAPARDQMYEAFAGGGARLNGASLQRQQEPGRRAPLIPAPGAVHQELQAAGLDYTRGPAYPSLAYRLVQVASGTLDAAVARRGAQDWDIAGAAVILAEAGIAFEDVCAGAM\n>MGYP001126300050 FL=0\nWMVWKEKMMLNWFEKSNRQIYYGILITVSFHIFVVAFQ\n>MGYP001386794033 FL=0\nPLGGNAAVALLDAAMERQAALIVEWMRVGFIHGVMNTDNMTLSGETIDYGPCAFLDAYDPAATFSSIDRQRRYAFANQPPIAQWNLARLAESLLPLIDEDENKAVEIASERIGRFKPLHEERWKAMMRGKLGLAGEEEGDATLALELLEWMRASRADYTNTFLALAGRVVEGGNAPLPVGTDAWNLQRRARIERPEGGGGAAHAPGGRHNQR\n>MGYP002527839631 FL=0\nKAFERTHQMYNLGIEGLPYELIINSNPSIAYLMKQNPLHLQILIMAHCVGHSDFFKNNRMFKDTRPDSSVSRSRNARKRIQGYSEDPLIGRKKVEKFLDVLHTIRFQTERNGRKRNTRNDIKKGLIEEYNRNRSSGKNIPVPDLDRKLLHQDDDLLSFFIEYGNHFSD\n>MGYP001804104866 FL=0\nMLTFPHANTLLFLGIPTYYVSFVPCAWHVCDMHMAFVHFRDWVXKRQNRTHXQKRRLLYSLVSTSINLQXHGRGXWTLTIDSSERLLXDRVLLNKAEQGRXVQCXKSYFFX\n>MGYP000506167729 FL=0\nSKETMDKCPNLKAIAVLATGYNVVDYEYAKAKGIPVMNVPVYGTDNVSQFAVSLLLEVCSHIGHHNESVHKGEWASNADWCYWHYPMIEVSGKTAGIIGLGRIGRDTASLCTGIGMKVAGYDPFLTKEQIEGMGYEYYANYEDLLKDCDVISIHVPLTKETENMVSAKQLKEMKNTAIIINCSRGGIINEADLIEALDSGEIAGAGLDVF\n>MGYP000552990992 FL=0\nGGMHEKFLNLRTKIQMLGGGFGNVQGGNLSFYGGDSNLGNGGDLLLAGGPTVSGDGGSIAFEGGIGEEGVGGSINFSSGQGVDLPSEGEINFNTNYKPVFFNTAGNKYKLLTTTQRDALPTTESLLLWNTSTKNFNWYNGTSFASPITDLDNAAGDVTGLFSNLQLGANVVTNIEVADNAIGSAEIINSSITNADLAPNSVTSGA\n>MGYP001062954301 
FL=0\nIYNECHIDKLDSYQGYTVFVDDYDGYVTLYDELKDKRIGIHLFFDSIFDINELKKINVIIKMIIIAMSFILIIVQVWLELKMPDYMSEITKLVQTKGALMSDILIQGGYMLLCAFGSLVSAIIVGYLISNIAASFSMRTRKSLFEKVENLSMEEVKNFQASSLITRTTNDITQIQMFIAMGLQLLIKSPITAVWAVTKILGKNLTWSMITAIAVVILLVTILVLMIIVMPRFKIVQNLIDKINGVTRENLTGIRVVRAFNAEKYQEDKFEKVNNDLTKNQLFNQKAFSVMQPVMYLVMYFLTLSIYFIGAGLIESANMTDKISLFGDMVVFSSYAMQVIMSFLMLAMIFMMLPRANVSAKRVNEVLDTVISVKDGKGAKAKEVGTVEFKNVSFKYPDAEEYLLEDISFKAKKGETIAFIGSTGSGKSTLINLIPRFYDATKGEVLVDGVNVKEYKLKDLYNKLGYIPQRAVMFNGSVSSNIAYGENGKGEITKEKIKDAVKVAQAEEFVSKMENAYDAHIAQGGTNVSGGQKQRLSIARAIARDPEIYIFDDSFSALDYKTDSVLRKELKKYTKDATILIVAQRIGTIMNADKIIVLDNGKCAGIGTHKELLKTCDVYKEIALSQLSKEELENE\n>MGYP000237869789 FL=0\nGGGREKNTERSGRVGPNGPRVQLRFRVTSSGVTRIKGLTFNDGAREIFSRNSLRPRLPPPIFVSPSVSGA\n>MGYP003956841209 FL=0\nSDISSIELLERARAVIPGGVNSPVRAFKSVGGSPVFVREASGPW\n>MGYP000266856341 FL=0\nMSDCNLDKRITRRQFLTFAGGLTDAGFGALPRWVREASAQAKQGRKVLIVLFQRGAADGLNIVPPFNDEVYRKARPSIKIEAPIAGSRTIDLDGKFGLHPKLASLMPLWKDNRFAIVQAAGSPEETRSHFDAQDYMESGTPGVKVTEDGWLNRALVSGKIPQDPMAAISVTARL\n>MGYP000179581380 FL=0\nMYFHFTVILDIIKELWADFFRKHHVRPIAVGLQPVKQGAKIGAPSVNVQRKYGILPRCFISLPALICSMFRI\n>MGYP000648191730 FL=0\nIGIEKTNSGSIFKGKEDITKADPSKRGMGIVFQNYCLFPNMTVLQNVMYALNIKIKNKDEARKLSLEMLELVKMEEHKNKYPHELSGGQQQRVAIARTLVLKPDIILFDEPMSALDADNRLTLRKELKNIQSKFKTTMIYITHDQEEAFSLSDRVMVMKDGNIVDNLCATIKLVLPSINFRIRCQ\n>MGYP001537497899 FL=0\nAASDVYKRQICKQAKNLFLEITIPEQKAYHVQTMLETSGNFQHSWQKFPA\n>MGYP000667005491 
FL=0\nQGQEHPADTAPRQAEQTGAEPDVRFYAVELDRGSQIAYGVWDDQNDRIYVDDEGVSEEFTSRWQAEEYARQLNQVNPLARYYGEGETILIRQYPNGQYYVQYCYDDQDNTVYATAGGFDTFEQAEAALYTHRPKAKKDPIAAQDLAYRQAAEYWSGDEHLVIFREPNGTFCNQYGFISGRVTPTTGSFAKLEEAEKQLYADRPLAQKVQAREKPPAHAPADRDEAERRYQVVVYHHLENGMDEKLEYATPEEAEQAARGYLEGTMEPDGFAYEGTAVYDLLEKKWLRVIGDFPTPEPPAAKEEQPLPSREDTETAASDRDLLGKEITLEGRRFRVEKIDEDGRASLRDLTFEGAVGFPIERVEHISVIRRLMGPAEKTAGPGKGVESLADGHDQGGTEPPLAPQRRARVSPFVLHPEVPNADRHEYHITDDAIGTGTPGERFSNNVRVIRLLKRLEAEDRLATPEEQEVLAQYVGWGGLADCFDERHSKYAELKALLTEEEYAAARESTLTAFYTPPVVIRSIYQALTNMGFQTGNLLEPSCGIGNFIGMRPEALADSKIYGVELDGISGRIAQQLYQQSSIAVQGFEKTDLPDSFFDAAIGNVPFGSFKVIDKRYDRYNFLIHDYFFARTLDKVRPGGVIAFVTSKGTMDKDTPTVRKYLAQRADLLGAIRLPNNTFKDAAGTDVTSDILFLQKRDALSSEEPDWVHLNTDANGLKMNQYFIDHPEMVMGEMREISGPYGPETACLPIEGRDLGEQLAAAIQNIQGSITEYVMDDPEIEGEDKSIPADPEVRNFSYTIVDGKVYYRENSRMNPVEVSVTAANRIKGLIGIRDCVRTLIEYQTEDWPDQDIQAQQRKLNALYDAFVDKYGRINSRANSSVFSMDSAYFLLTSLEVLDDERNFVRKADMFTKRTIKQRVTITHVDTASEALAVSLAEKAKVDMDYMAELTGKTEQEVYADLTGVIFLNPMHGYGGGSEEKYLTADEYLSGNVREKLEWAKRSAELYPEDYTAHVQALERVQPVDLTASEIAVRLGATWLPTEVIDQFIYELFGTSPRSQRMIRSHYSQHTGAWNIESKFADRGNVKAENTYGTTRVNGYKIIEETLNLRDLRIFDYVEDEHGNRVPILNKKETAIAQGKQQLIKQSFQDWIWKDPQRRERLTRLYNDKFNSIRPREYDGSHLNFVGINPEITLRPHQVNAIAHILYGGNTLLAHVVGAGKTFEMVAAAQESKRLGLCQKSLFVVPNHLTEQWASEYLQLYPSANILVATRKDFETKNRKRFCGRIATGDYDAIIIGHSQFEKIPVSVERQRYLLEQQRSEVLNGIAELKANHGERFSIKQMERTKKSIDAKLAKLNDQSRKDDVVTFEELGIDRLFVDEAHYYKNLAAFSKMRNVGGISQTEAQKSSDLYMKCRYLDELTGGRGVVFATGTPISNTMVEMYTMQKYLQYHTLEEHGLLNFDAWASTFGETVTAIELAPEGTGYRAKTRFSRFYNLPELMSMFKEVADIQTADMLKLPVPKANSHNIVLKPSEQQKEMVAALGERAEKVRNRMVDSTEDNMLLITNDGRKLALDQRLLNPLLPDSDTSKINACADNVFEIWQRTADQRSAQMVFCDRVAIRCYK\n>MGYP003718977623 FL=0\nSKQHVNSAGTNTRGDLSPLSFPPPAPQPFPLVAPHHQLNCQTPYNQGSLLESGDLQKKSHTVGLHLR\n>MGYP001491601391 FL=0\nEDSFQKSSSLLKHGFLDAIIERDALNEKIGNLCSILLKKNEIETSDAQPQQDREFIKKTAASS\n>MGYP002264516364 
FL=0\nIRYNDVPADLRTADEDLIGGVQTHDHADGDDHLELAVLVVGILAADLGKQVGPAPAEQGNEGKPEPHVFFFLLYYVCVIFVFWIIFSLKGYKIKIKGKRFFHALFFIPSMLPIALMATVFGSMLEYKNGIVNQILRGVGLGALAQRWLADPKLAMGAVCSVSIFMIGIPIMYYTADLTTISRSILEAATIDGAGMKDQLLLIIFPVLKNTHKTIILSMLLGGFREMERVYLMTDGGPGGSTEIIGTYIYRATRSAGSNIGLVCAAAIIVLIVAFIISFIQLKMTSKNG\n>MGYP001571232008 FL=0\nPLCEYEYGVHWFWPSAECAREMIDSDSEDDWNHSGVSQCEKDASVLSVFYQESMHLLKLDISIAEFVIKHSKGRSXXXXKFKRHQRACGSRFAASAQIIRTEWKCSPLLVAILRELQPCCQRRSEDFIETVLGRSSQLRFGKIDG\n>MGYP001478861697 FL=0\nMEKNPSLILVVAAAMLGHDGRVLMQRRRHDAQHGGLWEFPGGKVEPAETLQSALVREIAEELGVVVQQAGLVPLTFAAAESASDGRQIVILLYTCREWVGEPVCVDAEELGWFHPRELPGLAMPPLDYPLANALILSN\n>MGYP003588991860 FL=1\nMKKMGSRCLAALAMVLCSSAFAADKVDLARAEEIVSGRCFLCHGLEGESASPVFPLPVGA\n>MGYP000788765185 FL=0\nMDMTNIMYELVNTKTSLTIADRTIETLQKQNRRLNRRCLRQSLMIAGLTLSLIHISEPTRRSYIS\n>MGYP001606674547 FL=0\nASRDHIRRVIPLTNEVLAQSGQALEAIDMVAFTRGPGLAGALLVGAGMACALGAALGKPVLGVHHLEGHLLSPFLSADPPSFPFIALLVSGGHTQLMRVDGVGRYQLLGETIDDAAGEAFDKTAKLLGLPYPGGALLSQLAEQGDPRRFTLPRPMLRSGDFEMSFSGLKTAVLTLVRQQEALSPTGQLDDRTRADICRAFQEAIVEVLVTKSLAALKHTG\n>MGYP000296153156 FL=0\nMETPTKSKKRFLPAGRRIFLLQAATSVKKKREGKGEHVKSKKGAEAKEIELT\n>MGYP001120318111 FL=0\nSIATCESEAETTCAFIIDIAGDQDHIANCVGSVY\n>MGYP002231636691 FL=0\nVGIIGFGRMGRFYWEAMTKSDGWNIAYICDTDPASRQLAKKLSPNSIIVEDNQKIFEDEKLCRLVGLFTLADSLEWKQIEKAIRYGKHIISEKPVADTMENEWKVVEMAEVQMSFLR\n>MGYP001205799662 FL=0\nNMVSHTVDKLVGTDATNGATRTVYSLTESPTNPDAVSVYLNGVYQRSGSGGANNYDVSGSTLTFTSSLATTDQIDVHHHTFRSTLTKVADNSVGDAQLASGTLTTKGALTVTGNVIIANAGNIGSVGDTDAIAIASGGDVTMTQNLVVNGNMTVSGTTTTVDTTLTLSDAMVINNAGSDVGLLINSTSTGNIIQLQDGGVNKFVIADGGALTYTGAATI\n>MGYP000237547906 FL=0\nIREQAWSQLLPGLGFMRWPIFRGAVVLAESLHNGYSALKFSTEHGLPPDDDGKPHDAEPHANHRRDHVRVPLGERVKVQEGPRVRRGLPAARRPAGEGDVEAEAFQHLQRGDGGARGELVDEAGREERDAHCRDGAIGQRTDGLLIMGHKQQRRPVAAQMLHPLEAALLEQGIAHRQRFVDDQDLRLDAHLHRKGQPHQHPARIGLAGLVDELADIRKSLDVGDPGFHLLPREPEHGAVHEDVFPPGELWVESRPELQQGGDPATGFNAPRGRVQGAADELQEGGLP\n>MGYP003113969438 
FL=1\nMAHLPPLYHLRPAWLRQAFFLIALTCAVCAGQASACVGSADPVISRLEIEVGRNPLAALDSITQEIADTDPLDKRRLAELYIVQAKALNMGGLDSAPALKKARSAASKLSERAPANILLQMNAYYDLPDEAAKRRAMSSLLRGYRSLPDGSSAKTCRAVDLAFNYSFQEKPREAFTFASQAYLNSADDKSSPARAEAASALAYLVSNSHDFDYAKQLHSEALAIQLKLGMSDLAANELLVRGYTKLKDGEWTDAVADFRESAKQARSYGNQYAVDYALLGVCQAASEGGKIADAAPECERAYQGLGKPDEAMALPATALMAKLFVERGNPGRALAILDPMIAKGKQENASDDWVMALETRAQALFALGRNAQAYEQMREANEAAKTFHNADMQSGAAALQARFQTRELQNLLAEEERASSTRLRLAIAVIAGSTTTLLLLGTLIFFLLRHRRRFRRLAMTDPLTGLANRRATLERVGAALPGPDAPHPRASFALLDIDHFKSCNDTFGHDAGDQVLSQFARVVERCVRPTDIVGRWGGEEFLVILPATGLKDALDIIERVRSEAALEEFDFAPGYRLRFSAGIAMPSETGGVTDACIKLADRRLYAAKHNGRNRTCIDAGIAWAGPPAPTPPPSSGVSGTGSGSAQAA\n>MGYP000344450175 FL=0\nSTQGVSSAASDVYKRQNKAYIVGEEGPEIMISKSSGKVLSNDDSQIFAMLLAANPQLQKVSKARAEKIMRSRFPEYFE\n>MGYP001069234379 FL=0\nMVSLSERTDLLGAAIEAARLGGVVLREFFGQKKEIAFKGAIDPVTNADVASERAIVEFISRRFPGHDIVTEETRPDLSGSSYRWVIDPLDGTVNYAHDHPMVAVSVGVEVDGVV\n>MGYP001488139253 FL=0\nMDNLIGKKLDGLYEVKELIGSGGMANVYKAVMLGRNGPVPAGTVVAVKVLRQEYTHDPELVRRFKNESKAISLLNHPNIVKVYDVSVNDQLQYIVMEYVDGMTLREYLNERGGKLTSRETVHFISQILKALEHAHANGVVHRDIKPQNIMLLDNGQLRMMDFGIARISRAENQLLSGKTMGSVHYISPEQAKGDETDCTSDIYSVGVMMYEMLSGQLPFDAEDAVEVAIKQISDQPKSLHEIAPQVPAALVEITEKAMAKLPQNRYASAREMLDALDTYVQNPSVMFEYQYITEDAPEKVVKRTMNQNKAARQNHPNESAAPRGKNAKRKRRTIFLPVLFGITIAFALACLALCWLILNDSSNLMNNKADITLNDYIGMTQEEAQATEQVASGQISVTWEQEYNSNYAAGYIYKQSPVSGRTVREGQGVTLTVSLGTQYVTVPDLTNYVQADAEQQLKSLGVSVLVTQAVDTSVASGAVI\n>MGYP000855914706 FL=0\nVSSDKMEKTITVSVETVKQHPLYKKTIRTSKKYTAHDENNEAKTGDVVKIMETRPLSKNKRWRLVEIVRQQETMLQVGDNTGAKKVLCIKIPGGSSRRYATVGDVIVASVKEAAPGGVVKKGEIVKAVVVRTKKEIRRPDGSYIAFSENAAVIIDDNNNPRGTRIFGPVARELREKNFMKIVSLAPEVL\n>MGYP000079949637 FL=0\nEQEALYPFGYGLSYTEFSLSEPEITVYEGDKVSETGIIRKGTGMTVRTVIRNIGKMAGGETVQVYVKSCCDGTPNPQEVVLTLKPEAFELFDIDGAAQILSGEYCVYTGTSQPDKRSKTLTGKGGFVNTFAAEV\n>MGYP003113302263 
FL=0\nKKKKKSSKLTVDVVFDSLYSSLSRNEINGFRSKRINFTGLIGDAVYEVEVPLEDDKDYEGFETGIFSLQNLSTGRFGDFISHTVMVSDNELPEIKIEIVENLNKKVLVLHNLESRELDLRNWELVKGDIKIVFPKNTRLKVGESIVILAGEDQGLFANSLLLDNEKAELLNSNGTIHLKNYEGTKVAEVSISKKEESSNSLVASGQVSSN\n>MGYP001378584181 FL=0\nITIVVTNVLDLAGNPIDLYNNSGTDVGIGVSPTVIISSTATNPTNSSPIPIIVTFSEPVTGFDLTDVTVGNGTADNFASSSATTYTFDITPSADGLVTVDIPAGVATDLAGNGNEEATQFSITYTSITYDETPPQVISVDVTDPFTVDVTFSEAMGDGVTTADNYAISGDGQGTLADHPDSVVHKSDNTYTLTWNTGEMRNGASITIVVTNVLDLAGNPIDLLHNFGTDVGIGVSPTVVISSTATNPTNSSPIPITVTFSEDVTGFDLTDVTV\n>MGYP000737688134 FL=0\nMYRIAVLTNSRAQEAFLTEQILQFCAEHCLFPQMDCYHDQESFFETARSEPLTNAVIALPGVDGLNAVEHLRALCPQTRVIWCSDLDFSLHAFRLRVDYFLLEPITEEAFQQGLSTWLDGKKTSALFRADHNKHNNEEDY\n>MGYP000609830271 FL=1\nMDFNDTTEEAKFRKEVGDWLSANATLKEDEESGSYPGMGEDDALSLAKKWAAKLYDSGWACLHWPKEYGGRGSTPIERVIWGQEASKYRIPGGFFEIGQGMAGPVLMMYATEEQKKRYLPPMAKGEEIWCQLFSEPGAGSDLAGLKTKSVLEGDTWTINGQKIWTSGAHYSDYGILVTRSDPSAQKHKGLTYFFLDMKSPGVEVRPIKQISGGANFNEVYFTDVKIPDEQRLGSVGDGWKVALTTLMNERLAVGDASGPDFQEAFNLACGHDLNGDLAIKDGSVRDKLADWYCQASGLKYTKYRNISALSRGETPGPQASITKIVSGNKLQEIANFGMDIMDAAGIVRPESADAEQNMYQMGFFGAAGIRIAGGTDEILRNIISEQVLGLPQDMRADKGIPFNEIPSSNK\n>MGYP001094161847 FL=0\nMNPRYILVLFSGIVVCTLEYYIHILRPQLESAPPMKKPVLQVGNRAKHSTEIVNEMQVTFAYLEGTFLKSAMGMDELTTEMHNYTLLAGIVSASGGPYYFKDSGSAATMIEHKKMFKSFIYSIDVL\n>MGYP002524929742 FL=0\nMKAVDNDEDFALVTPRDTGDGPVNEVVATVKAKDLWDDIAESAWKTGDPGVVFVDRVWETAPNPQMGKIKTSNPCGEEFLENYSNCCLGSINLDLHINGTDFNWELLEDTTRTAVRFLNDVIEVKDRKSTRLNSSHSWISYA\n>MGYP003440339087 FL=0\nIIHRINMDTHVVIMAGGIGSRFWPMSTPQMPKQFVDVMGVGKTMIQMTVDRLASLCPMKNFWVVTSERYVDIVRKQLPEIPVDHILAEPAARNTAPCIAYACWKIRKHHPEANVVVTPSDALVLNIEEYRRVISSALEFTRSGERIVTVGICPTRPETGYGYIKTGEYVESEICTVSSFREKPSLEVAEEYLADGGYLWNAGIFVWNINTITEALRRHSPGLASIMDEMSISFYTTEEKAVVEKLFPTCEKISSDYAVMEKADNIYTLPAEFGWSDLGTWGSLWTLKERDENGNAVVGDDVRLFDCKNCIIHTPDLKRVVIQGLEDCIVSKHGDRLLISRKDHEQQITDYSKD\n>MGYP001086002945 FL=0\nAEQSTRYSMWTEITRPKYERKGLGYSSDLGDAEWAMIEPRLPQRHRLGRPPKTEMRRVVNALLYMVRTGCQWRQLPREFPPYTTVQHYFYAWRDDGVLQRINFELLLEARETAGRAARDHRRNSRTTTVAAHVMRSD\n>MGYP003329493463 
FL=0\nSCKLHEDGSTRRTYQNEIASVWSKEIPIEIPSSEWSNDDVEPETIASLIQRNQKLKALIYEDAESLNLVKEKISKLPV\n>MGYP001213017408 FL=0\nGPGSGPGQGDARQDTGLGTPGPPLLQVCSLTQRYGNKIVLQDVDLEVRSGEIVGVMGDNGSGKTTLLLSIMGILRPVSGRVMLEGEDITNVPVSARARRIGMVFQNPNHQLFTDQVWREVVAGPLSRAVRRRRAVPRPRRFSTGLTSSRFARATR\n>MGYP003197570824 FL=0\nKDSEGWLKHTDFIILDMICLQLAYVLAYAISGYGFNPYETIIYRNMAVFLELADLVMIFAYGTMKSVLKRGFCSYVKSCDYGRCLSGFIFIPAS\n>MGYP001590617569 FL=0\nYNTLFIHFRQSIHTLLRSRPVGKRFSKFLAITGEAFWASLGSFGGVQYWYGAVVNEWIVADAWASSCVPHAILYRMDSGTHVEVDQAFERAYEHSLFLCAVFCDCTFWSAPREVEWVFVFFALGTPFKRKNTILISNVKCTDELACLIPHHQIQRGFRFTDPVLQYVTRHWISLMVYLILCASQCRT\n>MGYP000882899174 FL=0\nMLLNVTLIVLCAGNSTRFEHKTKKQWIRIENEPLWLNVSKRLASFSQFDKIIIASHEDELNYMKNFTDNFIFVKGGETRQKSIINALELVTTKYVMMSDVARACVPQSAIKNLL\n>MGYP001793805036 FL=0\nMRGNSKYMRREILFDSTRPILCNTLTSGVCDGILLLARCIRFDISPYDPPSPPI\n>MGYP001580518470 FL=1\nMSWIGGIDKVSRERRGIKDLVNGWDKGVGFGIYLLNI\n>MGYP000055909560 FL=0\nEALLVWTAHRCITSLELVLTAMSEHAPLDDRPFWALVGDAGYNKDPITAFGISDAFRDAQLLSEAIDDGMSGRAGLEEALGEYERRRNESAMPLYETTLRAAEYDQHHPRSLELRAALRGNQPDTDLFMGVLTGSVPKEEFFNSQNIRRILSQAKDGGSAA\n>MGYP000181573229 FL=0\nMGSKKILLVEDDPNFGTVLKDYLALHDYNVTHAKDGIEGLIEFKNGEFDLCILDVMMPRKDGFSLAADIRSTNKEIPIIFLTAKTMKEDVLRGYQVGADDYLNKPFDSEVLLFKIKAILQRKESDVNKESELLQEIRQFCIAAGRNPNLDSIITYNYDDLLESCLANIEVDIPFKSIHASGMKHKPHELPIYHVHGFLPQKSKLTNKNRVVLSEDGYHQQYTDVYGWSNLSQINKSVSYTHLRAHETVLDL\n>MGYP002759741552 FL=1\nMSNPVPASPFSPVAIGPLTLKNRFIKAATNEGMSAGGVPSKQLAQLHGNLAAGGVALTTVAYCAVSRDGRTLPNQLILEPASLPHFKALTDAVHGNGGLASAQITHGGCFTFIRERSTRRPLSASGGFNKIGVMSGMFFKQAMSEADMAQVVADFAQGARLAREAGFDAVEIHMGHGYLLSQFISPIYNKRRDQYGGSLENRLRFPRRVLRAVLDAVGQDLAVICKYSITEGTRAGNSADDGARIARMLEAEGAHLLVLSAGMNAESITTMFGSSFPKENRVQQKNPLIALAMAIQRRTEPEVKFRELYLLEHARKVRAAVKMPLAYLGGAQGLAGIEQVIGEGFELVAMGRALIAEPGYVNKLASGEERNNRCTACNRCVAMMYTPGGTSCVLGEPGDAALNRVPAGSA\n>MGYP003289090808 
FL=1\nMKKSILLWLMVLCVGIVSAQTIEINTVEDLSALATNNESQNGYVGQTIDLKADLTITKVWRPIGTRDYPFRGTFKGNGHIISGLGAIAGTDGVGLFGYVGEEGVIEEVGIGTGHIKTMKNDECQYVGALVGRNNGTIRRCWNMATLEVNAIHVGGLVGQNSGTTEDCYNAGPILKAIDYIGGLVGTNTNTGAIRYCYNIGYAANGYGVVAQNTGTINDCYYDRQLYIQNPDAGHQDPTGVTAMEKSADMYTIFSARSAWQQMGDNYPILKVFQNQDAAIVSAASIDLTNKGDALADNHMNLLTSDFIVNSKNGVHWEVTSPLMEQWVYPDAANANQWRVAFPCRPTDVIMQVSKNGNVREVYAFPKPVPDFIPGKFAADSFVVCLSETLNFKDIEFKEKGYEAPSGGAGNYQVKLMLNYLDEKGEVDHNEILISAPSWGDYIALYNSGSWTPSEPGHYTLQRYAADEQCHPELMEAEGVVPIFVPANLTAGDIAGDAILCGIDQTITIHSVEPAICEGTEVYYFWTKNGIEITGEDNASLENYPMNTSGTFVFKRYAYNNACVSKDHPLEAEHSVTITVYEEFVWGAIVEPSDTIIGCTVQDVLNQLSVISEQETVRGGKKPYSYQWMMKIDDGAAQPITGADQHDLNLRDAGLEDAHDYVIYRTVKDSHCQTEWIKSDGQVKIQIYSKITGGKIETKTIQADCIMPEEKGAIPVQIQSRQPAQGRGDIDYKWYMVVNDETFNPIDLKQHTESLDYKLDYGSVQNNATYTFFRTATNKSCGGEEVRSEGETTLQVVIATNVDSTLLICESMFENGQYTFYYPNAENPRQTNIFYKDDLQIWEFNDKLESGCEPRVTIRPVLTLAPKIHADNVSTICQDGDAGTLTIYFEMLEGKADTYNIELSESLRPFFDGKQYISGTIPTVTAGNSGAITVQCQRIGISGGDKIMNLQVAQQIDGQELCYSAMSEIVLNVTQGGYVLDKYGKVLFIDNNPKHPTDPKFIAYQWYKNGQPVEGATGQYYHEDGASLNGSYFADLFYFNGGREMILRTCPIEMENGTKREQENATDSVSKRLENSQIIIQRGDAEYTILGSEL\n>MGYP000988737932 FL=1\nMRLILVFLTLLLAAASAMPQDAHPHEESLPAWFAETFLDLREDVAEAAKAKKRLLVYFGQDGCPYCRELLQTNFSQKRIVDKTQRHFTAVAINIWGDREVTTMDGRTQTEKEFARALGVQFTPSVLFLDEKGQVVARMNGYYPPHRFEAVLDYVAGHMERKRSITAHLRTAAREAASPDLHAEPFLIPPPHDLRRRPGGKPLAVLFETRHCAGCDELHRDGFRRPEMRNLLNGFDIVRFPLFGTEKITAPDGRATTAGDWARRLKIAYSPSIVFFAPDGREVFRIEAYLRPFHLAGSFEYVATGAYASEPEFQRFLQGRAGRLRERGEAVELWK\n>MGYP003328125236 FL=1\nMNIKTNISLKSYNTFGIDVNAKYFFEFSSVDDLQYLLSDKSLKNEEKLVLGGGSNILFTRDVDALVLKNEIGGIELINEDDTHFYIKAGAGVVWHEFVLYCINHGYAGIENLALIPGNVGASPMQNIGAYGVEIKDVFHSLEAIDIIENKKVVFTNSECEFGYRESVFKNIYKNQFVITSVVYQLNKTPKYNIEYGAIREELDNMKIDHLSINSIAQAVMNIRRSKLPDPKIIGNAGSFFKNPEISSAEFENLKTEFPKLVGYKNENNSVKVAAGWLIENCGWKGYRIGDAGCHEKQALVLVNFCNASGDEIYDLSEKIIESVKNKFGIQLQREVNII\n>MGYP000122910653 
FL=1\nMLDLATAEYSLVGCVLIDARCLPAAREILPTAEAFASEPCRKAYAAACRLEDEDKGIDPVIVGRAAGLSNDFLMQCMDLAPTCTRAAEYAKAVLDGYQRRQLQALGEKLQTEALCAGSTADQLLTEARSTLDDLASTPGRCSVKSARDSLLDFMTFRAEVQQGKRQAIRTGFPSLDRILGGFAQGGFYVMAARPGVGKSALGIALADMMARDRRVLYVSLEMTEAELNARRVAAVSDITCTFGKLLFGKTTEEQDAAIANACGKLYAHKLQISAVSTLTVPELELQARNVGAEVVIVDYLGLLSAEDKRLSEYDRVTRISGDLKRLAKRLGCVVLALCQLNRESVSAPGQDTRPRLSQLRSSGAIEQDSDGVLLLHRPEYGRTETPREASAPQQFFVDVAKNRHGRTGTAELAWYAPVNRFEDYGGKWTVKSWM\n>MGYP001552508999 FL=0\nLAGAGISTLDPLEDNERGVIISTASVAAYEGQIGQAAYAASKGGVVSLTLPAAREFAQFGVRMNAIAPGIFLTPMLQGLPEDVQQCLAASVPFPKVLGNPAQYAALVLHIDHHHRADRARQVVX\n>MGYP003447821379 FL=0\nSCTKNRFLINNNIQLLKQQTIMDLNEFVAHFAEQFEDTDASVFTPETKYHDLEEWSSLIGLSVIAMVDDEYDVTLKGNDVKNSVTIEDLFNIVKERA\n>MGYP001289232407 FL=0\nELTVSENRLVYDSLVRAGEAPPVVWDTVKAGNYGRVYIYTDDERAENLKISNLQSASRRILLSDKTINGQHYTTQVYLDKTLFLSTDGPKGPITIQVKSVSEDYFTYLKGYEQFEASSDFNALSQPVRVNGNVQNGLGVVGGAYVQEFQYLYDRW\n>MGYP000237473348 FL=0\nMTPVGLWALGWQNTATGRWSRAAASWSGGNIVARQAGNVNMLCYVVWASLFSIPPLFALSLWLEGWSAMVHGVRSADALTWVAVLWQAVGNTMLDRKSVV\n>MGYP002446805835 FL=1\nMLRVQLICTGKLKESFYAAACEEYNKRLQRYCSPEIIELPETGDIKARRRGDARAHRLWRPRRRHVH\n>MGYP001329416472 FL=0\nETIQSKNGCLIKGNISSSGDRIYHVQEGQYYNETKISMSLNSARKCSECNGIGAKNASDVKTCTKCDGSGVFVQIQQIGPGMISQSTQTCGICQGKGKMLDPSKLCKRCNGKKVEKKRVKLDLQLNRSHKDGDKVVFSEMADFDPEATTQGDLIIILKEKNNQQFLRIDDDLVYTKTITLLDALCGMDLTITHMDNRKLFIKTSEVIQPDSIYRISGEGMNKNSNLFVKFKVVFPSKLSEERKKYLRKLIQTKVTENVQDKEENTKDREIKFLDDLNENEVVYINEKINILNLKGKTSSDNQPEYEYSGEEEGIPACAQQ\n>MGYP000295350481 FL=0\nMVRNRPKVRKKFVVIRPKNHRKKAAGCPIEQPAAYLFT\n>MGYP003428885701 FL=0\nNMITGAAQMDGAILVVSAADGPMPQTREHILLARQVGVPYVVVFLNKCDMVDDAELLELVEMEVRELLSKYEFPGDDTPIVHGSALKALEGDQSDIGVPAIVKLVAEMDRYIPLPERAIDGAFLMPVEDVFSISGRGTVVTGRIERGIVKINDEVEIVGIKDTVKTTCTGVEMFRKLLDQGQAGDNVGVLLRGTKREDVERGQVLCKPGSIKPHTKFEAEVYVLTKEEGGR\n>MGYP001619181529 
FL=1\nMKRTVLWSAIGIALALTAPPVQAEPARSADLPTLIDQAMRKSPGLQAKKRAYEAARGRVVSAWLPDDPMVGVDVEGQPDLFNFGGRTNNEYMVSQTIPFPTTLILRGQVALRDAQMAFQQYKEKERDVVWHLEQPYYEFYLAKKTRAALEEVRALLEKLAETARRRYEANQASLQDVLKAQIERSKVDIELYQTAQEEHIAQAHLSHILNLPLNTPYELPEERHSPPLSWTHEELEHLAVRMRPELRAAELGIKRAKASRMLALTRWLPDVTGRIEARQFKADGRANERDTFIGVTVPVWSLLKGAGGEWKSAGKDVEETEAAYQELKNEVLLSVHEAYAKAKTAEHALGVYEQFTLPQAKQQVELALSAYEAGRAGFXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXSPSATCTTARNSTRASRAR\n>MGYP001234761162 FL=0\nSGYKCGIDLVFIFIVVFKLILNLHYDLRLNPIDICKTVSTNFKTEIFDVRDRHEGTHI\n>MGYP000998860503 FL=0\nMKRMLSYVVWVLSAALLWGCSKRAMGRMESGAKLPVHFSCEGFSKTGGAATRVTGENFEPGDVVGMFSYPSDGPMFGSGDFTKGNVPYVYMQEGELLVREGEVPLYFPDDPSVPLTFKGYYPYSEQMTADGLLTLDLADQRAGEKNAVLYSDNAQRIVRTANYVGLEFGYAMAQVIIRIQYDPDEMPDGDLAAVSAVTLEGEGIYSACDFHMADGSVTAAAGVPARGTIGMRPGSAETTATVAPATARDLTVSVTTPAHTYVARPKDITYERGRQYTYNVTLKGGGEAQIGEASIVDWEPGNDGIPPIIGVPEYEQR\n>MGYP003398871467 FL=0\nYALIDLPEFFDWLEANAEKLRAGDKAALAEAVRVSCASKARIVAIDPATYADAVTWSEQFGADVDEVIEALSSSTEESIPVIAIEGEPVPEVGSFGLGRTYPYRVVATVRGFPTAGNRSVSVLASADAINEYAARGGDEDAPAVTESFRRTAVSQAGADVLTSLAQAQRIRRTPGTAAERDKARVDWLTQYNRSSAKDNAK\n>MGYP002477722919 FL=0\nCICVHQAEEEGASLGGWDERAESAWHATWVASLSRCIAYASKASAVAFVQKQVRVATLVVEIMIDHACVSLDLSLADQAANNNSDLVIMEDHKFTNPYEEQKDHINEYTAQEIATLQSRLDKQLGPEYISTRPGNGGGKVHYLAAEKVINLANEVFGFNGWSSAIRDVQIDFVSFSDSPRSLVMLTTTVRRESNNRKDQLRTVYHCARLFERWHIPRGKLSSALIYPLELTGVDIGYGHIENCKGKAAAFEKAKKEATTDALKRALRNFGNVLGNCLYDKDYLQRVTKVRIAPSKWDAENLHRHPDYAPIKKEAIAGPSAPTTIASNPPARMPSAQSNTSEFEDEFGGNLFDEVDFSHPDEVRLDNSITEVSVETPVRPPANSVSAQAMNRQQPNRVASMPNVRQFSGGPQQNGQQNGQQARPQVPSQTFKNTNGMNNQPPNRMMGPPHQASNQNGFRSNPSSASESTTTNGRQITPPESVITPSQVPSHVPSGFVSGAAASALVQPPESGAVPPIKLFDPHHESPSIRRTQGVDLRKSAPIKRSEVGAPTVPIPNPKPMMNGGAPANRSNFVNPAMDAGRRIGMPGMQQSPLANRSAYKPPAMKRPLPAEAPVGRPPLADMSNVQQTDGASDPKKLKMDAVQEPPNPASGETGAAA\n>MGYP003292343469 
FL=1\nMPVLYISHDETLIEKTANMVIHLEQLKRKTEPKFTVAKMPYRQYVEERLHNFDRQEQQALNERREKRKRDERFAEIYQKVQTQLAGCSRQAPSVAKNLKDKMHSVKAMGKRFEREDENMTEMPEQEEAIFFKLGNKEDSIPAGKVVLEYELDEVFRYNSKTKKIMSDYWVKVKIAKNKVAPPFKTAEFDIIYGKGISREGDILDLAADVDIVNKSGAWYAYEGNKIGQGRENAKLFLQNNPEICNLLDAKIREYYSLGGAISGEKSE\n>MGYP002583638056 FL=1\nMGLFDFFKSLTNSKTEITSTDNDVTHLTNITKSGLSIHPDLVDLIWIGDGKYQNYSNQPHPTMTYPYRGFVVKVAAFGAEEPSLLYLKYPIEQVQPSEQIERPPYYPFYGELTPKQKYLYWKFLNDPYNPHNDIGYVFIFYYGLERHLLYGDFEKAFNVILKLRDVYNNRSFQHYSAGALILSTLIHKRADYTQKFINSLDKDYEFQMPGELYFLCKLSLGIPITAFDIMKFHKFFNFTNTRYIKNNSDMFLKNLRQNICYQNNGRESLDASLYCTESNFSHLPTISLPIFANVSIREKEVTIPNLSCDSHFMGCIFLLLDKAHQDTKQELANLRKGKSANSTTEEQSTESHTPYAGSYFDDKKFMSLQQIYYDNSQKIESQWSILYNLKTYTGSNADRYMELCRLNIQQYTKMNDRGKHYTDYESPLGVPAYRRLAMLYEKQGNYEASFEVCIEAIKSGILYDGNKSGFKGRAARMIKKGNIQPDEEIITLLME\n>MGYP001139541149 FL=0\nMDIQEILEHLPHRYPFLLVDRVLECEPGKR\n>MGYP003566972480 FL=1\nMRLSIRNNGRYLVEFDRLDVQGRNAISGCGLVFSLKGSSPGSEKNVNIFGIQIGLYHSEDSKFIVPSISCADSLRQVSQYSNNNENFHFEAVLTSEQINAIEEIRQDGDLKLTLTLKALLSSSSGLANSYERSEVVVPRELWLKALRSSGFCRTVLYEIPLPASDIDIEGLITKARGFIETGHYKDAVMQCRHIIESLEELRGDKRQAQAANRMAHSDSRKDMTSIERLLSLREQLKNVCQLGGHGREAFTRSQALSVLGMTMALVSEPTVGALVNAVSEGTERGEA\n>MGYP001095359691 FL=0\nMNSRRSWSRNRCRFDARTDAAGEPVLLADQDRTRWDRTLVMHGLAALDRATTLGRPLGPYTLQAAIAACHSRAPRFADTDGEAVVALNDSRPQLAPSSVV\n>MGYP000548248604 FL=0\nMDEQKRPRAWVYARIPGDYDGTMNSYKVCSMQALHDGCDIVGGSIDERGGWLLRPGYRDNPFGGDRPSQT\n>MGYP000364143963 FL=0\nGDGTFQPAASYTAGIPYWDPAHAVAVGDFNGDGRADLAVANLGTVSILLGNGNGTFQSEVKYGTAGGSTIQPIAVGDFNGDGKTDLAVASLGGTNVAILLAKSDGTFQPAANYAVGHQPYGVVVGDFNGDGWADLAFASNVDKNVTILLGIGATSTPDLIISKTHVGSFVQGQTGATYTITVSNRGGSTTSQVTVTDSLPVGLTATALSGTGWTCSLGDRKSTRLNSSHLVIS\n>MGYP000838638459 FL=0\nYTRLFVGSSDVYKRQAAGQLLYEKGFFFVTFVWGAALAAALIKRWRDGGSLSTVKK\n>MGYP000110898291 FL=0\nCKIICQKLAEMGFFDSAMNDADQQFGVLLRNNDPDAYTGYLRWAKPVVELLEGKGSATFRKVVFFWVRDEQRRQQMQSNIVAHYLDVIARPWAEEMAYRMQAQGYDKSNPAGRFIMNIGLPMCRVISKFGKKTELPMWLKTALIWGTTTVLLVAVSAISGTDKVLNKLRKHLYRDWE\n>MGYP001080633953 
FL=1\nMSPGQAASLQLSTARLRILPLDSENLRLSLEAPEQMEMNLGLQVTGNRPQGEVRDAVESMLAHVQQDPENWLWHTHWQIVLKRDKLIVGGCCFKGPANVRGEVEIGYGIEPEHRRQGYMEEALSETVRWARQQPGIRSVTAET\n>MGYP003432707236 FL=0\nMAGGSQIIISSDGIIIKTPGEFKVFAGQHIFNEASVASLKATHLQHLLPPCDVIPKAKITPDVHFPVMGILARIERLDGEKINSTDKLLINGSPLKEVWIAENAYEPAYGARPLKR\n>MGYP000920430015 FL=0\nRELAEVWDELREYGEQVIIELKSQPSVYRIKDKLVKWDYGYDLFNDKLVAIKGSLTLNAFH\n>MGYP000639132496 FL=0\nMGAYILRRLLLVIPTLFGVMVINFALTQFVPGGPVEQVIARLEGGGDSIQNLGGSENAGVQEEEAVGEGGDNGYVGARGLPPEFIAKLEVQFGFARITCDEGFTGTPSVTAPECRKEKIPAVERFFIMMGNYLTFDFGQSYFRSISVVDLVIEKMPVSITLGLWSTLIAYLVSIPLGIRKAVRDGSGFDTWTSGVIIAAYAIPGFLFAILLMVVFAGGSYFQWFPLRGLTSDNWEELSLWGKIVDYLWHITLPVTAQLISSFAVLTLLTKNSFLDEIKKQYVLTARAKGLSESRVLYGHVFRNAMLIVIAGFPGLFLAVFFGSSLLIEVIFSLDGLGQLGFRSAVERDYPVIFGTLFAFGLIGLVVGILSDLMYVFVDPRIDFERRG\n>MGYP001328790198 FL=1\nMSELYEKTAVELGKVLSSGEASSEEVARSFADRTAKVDDKVHAFLNRDDEDFIRQAKESDERRSKGAALGPLDGVPVALKDVISHKGQPLTAASRILENYVSPYDATTTRKLKEAGALVWGRLNLDEFAMGSSTENSAFGATRNPWDVDCVPGGSSGGSAAAVAAREAPLTLGSDTGGSIRQPASLCGVVGMKPTYGMVSRYGLAAFASSLDQIGPFSQTVEDTALALGVIAGHDPLDSTSFPTEVPNYLETITKPCPKMKLGLPKEFFGEGIDEEVRKLVDEAISFYRKEGHELVEISLPTTDLAVPVYYLIATAEASSNLARYDGIRYSHRSERAENAVDVYAKSRGEGFGEEVKRRCILGAYALSSGYYDAYYLRAQKTRTLIRRDFEQAFQEVDAILTPTSPTPAFKQGERAEDPIAMYLSDVFTISVNLAGLPAISVPCGHTSSGLPVGLQVIGQAFGETEMLAVANAYDSVHGFGRKCPEL\n>MGYP003694182255 FL=1\nMKLNCAAIPTGLLESELFGHEKGAFTGAMAQRIGRFELANGGTVFLDEVSEIPLDLQTKLLRVLQEREFERLGSGRTLRTDARLIAATNRELGALVDEQKFRADLFYRLNVFPIHVPSLRERPEDIRCSSGISSSTMRAG\n>MGYP000441261351 FL=1\nMRLNIRKSIITGISLATLLPAFSLLQSCDDSEAEKWVDLRYRVEDSYLVEAKNPEPVSFQVKSTDPWEVFGKYDWYTISPSTGEAGETYTVTVTCKENTELDDRIDTLNIKSDYWTGKRFVLTQKGTAYLNVEGVDMIDQEGNSETFSVLSNQKWTAKVTDGDVWLLHPIRSIGRNERRNYCHRFTEYRRTTYRYCNHL\n>MGYP002925163669 FL=0\nFAARKAFVRECIDANLVLETPDPVIDTQFRYAKLRAAESIVATRGGYMHAPGGESYYAAIWANDQAEYVNPFFPFLGYGVGNASALNSFRHFARFMNPAYEPLPSSVIAEGDDIWITDPKGREHRLAMLRNQTRGQDNLSLADFIAPKGDWIGCFAVTAGIGLKELCEKFRAGGDDYNAITVSYTHLTLPTNSR\n>MGYP000555143592 
FL=0\nFTTTGLKNNITRYMIASANWNLGGTSSKTLYANQLYTSERGTAVYSGHTTMWQGKVALPYASDYAYAAAFGNGSSLLCSSNINSYSSTNCKNNNWLYTQFKSGSAWLITPYSGNQYDPWLVDTTGIGNYGSVAYNANAIYPTVYLNPDIVISKGTGTSDEPYQLSADTVTSSQVGEYFNGYTSYKNLDFAYYDFGSSVSVIAKFKIDDYPIKFADIVANWETGGFGLVIDTDKKLKFGIRTTTGSDYVYAASSGAVSLSEWHTAVGTYDGTTIKVYLDGSLVGSTTISGSIKSTSAQIAVGADPYTGGSASGEYFPGYVSEVSVIDQAIGASTIATYFSKSTPSTTTYTNTKTLVKAKSTSLNSPTLVKDSIYRGKYFDGTIESGSYVARAELTGDTYFSLGTQWNDITKAYGLSDKEMFNLFNTRALDDAVRQGKSIRFSQNPLEWKGTALGDEWLYLQSKHGYTRLKKIGDYWYAK\n>MGYP001202979195 FL=0\nLCLIRNEYLWYPTPKQSPLLGVAGLGGGIASRLGGKAPNPYRGLVGNGSLRSGFTNLQMAFPFTDSKNGLDLSGNNRNLSNWSTNTPVEYAVTGVDKNGDPPPYTTSYGKTQSGPDYGWKNLSSDFNFQGSKTYTMECWFQVNSPDTGILMISMRSNESEGQVLTASTSYGIKSLAWSGSEDYTLSGGTIVVGQWHHGAYTRDSSTSPDTHTLFLDGTQVAQITSDTYGDAYDYNQYGFATFGGGGVAYYPNSFMQDLRVFDTVKYTSDFDIAEYLPTLDA\n>MGYP003457825976 FL=0\nLEAACRRDEPAALIVEPLVLGAGGMLMYAPQVLADMARICAEHGVLFIADDSGAYDVYDIPASGGPVRRLTRLAAGALDPLELDGNLYFAGYRAAGWDLARASPFEYTAICLSNASGAVISSIFSARSNRVTMSSTESDCSA\n>MGYP000975471581 FL=0\nMSNYVINHLRELESEAIFVIREIAAQFENPVLLFSGGKDSILLTHLAKKAFYPAKIPFPLIHVDTGHNFPETIAFRDMLVKELGVQLIVGSVQESIDKGRAKEETGADASRNALQIVSLLDTLEENKVDAAMGGARRDEEKARAKERFFSHRDEFGQ\n>MGYP002779293856 FL=0\nYHWLTETIKRNSMKYKRVLLKLSGEALMGNQGYGIDTTVLTTYAQEIKNVVDKGVEVAVVIGGGNIYRGIEATATGIDRVQGDYM\n>MGYP001768057102 FL=0\nISEHDALLATHVATILSGGDRSPGVASEQDFLDLEREAFLSLLGTQKTKERIQHMLKSGRPLRN\n>MGYP000742296790 FL=0\nMKTRNDTNFTSTKKFLPLFVAIIITAIFLSNCVPIEQPKPEAPMAVTEPAPEPR\n>MGYP003387108590 FL=0\nQLAKAEGLRVIADSSTEDKELVTELGADVVVPRGDNISEQIRNIMPEGVDGLADGSVQNELSVGAIREGGSFASVRYWEGTGERDIKFHRTSVSDYFQRSDLLDQLSKQVDDGILTLRVAETFSAEQATEAHKKLEAGGTRGRCVILL\n>MGYP001556444362 FL=0\nMKLKIQQIKNPLLFIGLLLGLVFMVTSCQKETNEPDQAFHKAKKGPQKEEIVVVANRLDGSISFIDAISDQVQNTLSIAGSEPMYVVYVPDNDRLYVGDRAQDKVHVIDPATRQVESSIDVGNGVFHMWAGGNGDQLWVNNDQDETTSVIDLSTNTVIQTISIVLK\n>MGYP002617661281 
FL=0\nGRGGVAGHDDHLASLRDEAGDGLVGEDVTENLKTIRSIPMTLEGAPARLIVRGEVFMPRASFARLNEAREAAGKSLFANPRNAAAGSIRQLDTSVTASRPLRFLAYGFGDVRFGGVQPWSTYEEVMGRLRDFGFETPPGGRLCRGSEEVEAYYASLSEKRESLAYEIDGVVMKLNDLEAQEALGYTARAPRFAVAWKFPAQQATTLLLDITVQVGRTGVLTPVAELEPVNVGGVLVSRATLHNEDEIRNRDVRIGDRVVVQRAGDVIPEVVRAVLSERAPDSQ\n>MGYP000022545691 FL=0\nIAQKGGIIMDGRDIGTVVLPQANLKIFLVASVDERAERRYKENLSKGIPTDLERLKVEIAERDRKDSTRVVSPLKQAEDAILLDSTGKTIKEIVQFIEEKAKKLMENEFFYIFLYYKSFASFCRNYQTLI\n>MGYP000539356882 FL=0\nPPAWAVYIPIETPNTRSGETATAANADDAGYIDANKKCHWYSQENTGNAVANVKGAWFTYIVFFNGVHITNNTDPAIWNTGAAGTGTNGTSGRAVLTLKLIHQDPREYVLQLNGVDLKATDNYSVMRMTYVQPNFNNMPSSPYTIGSSSYEEFRHHNESQAAFTLPAAGYWISADEVSYSFWEEISGDATLDATITQHLQDDLITGFRNNYIGLNQPITYMSYDEVTAFCSGQLSAKIGTTARLPNEAEWEFACRAGKDSTYSNMKGYTLDGISSNPFDAGNNDPVDDNNIKDYYEKVEVYVNGSNTMPCPVPTILSNENQWINGAWESKAFSVFYTIESEIKAIKQMI\n>MGYP001030690318 FL=0\nMHVLLDELAEFVRSHRLENEKFHEGAPGAANILLIWRIDVICKNLTFKQVLPSLLILAKVFDQW\n>MGYP001004560480 FL=1\nMARKVGFVIGLILLVCLTPMFATGAAETPVTGAGPKVINLWSFTDEVPKMLEKYKELHPEFDYEIKTTIIATTDGAYQPALDQALIAGGADAPDIYCAESAFVLKYTQGDAAQYAATYKDLGIDVDTLLKQADIAQYTIDIGSNERGLVGLGYQATGGAFIYRRSIAKAVWGTDDPAVIKTKVGPGWDKFFEAAAALKAKGYGILSGDGDLWHAVEGASEKGWVVDGKLYLDPDREAFIDMSMELMQKGYHNDTRDWTDAWFADMKDANPKQVFGFFGPAWLINYVMAGNSGGTKPGEGTYGDWAVCEPPVGFFWGGTWLLANKDSKVKDAVADIIEWITLDSSDTGLQYFWANGTLAGPGGTKDTVASGTVMKKSDGSLPFLGGQNMFDVFVPAGQFATGKNKHQYDETINTYWRDQVREYTGGKKSRAQTIADFKQMVADNLAIPVK\n>MGYP000510584249 FL=0\nMEVLVENLTFLTWQQVLMWIIGGTLIYFAIVKEMEPSLLLPMGFGAILVNLPNSGAAGVIAHLFQLGIAGHELFPLLLFIGIGAMIDFQPLLANPKLMIFGAAAQFGIFFTLGLASLLGFELNDAASIAIIGAADGPTSIFVANVLKSHYTAAIIVAAYSYMALVPIVQPFCIRLITTKKERMIRMEYTPGKITKTTR\n>MGYP001059407761 FL=0\nNGTQAKDEGALPLTAAQSATLKQGLKLVTGPNGTAASAFANLGYNDFLGKSGTAEDSGEQSHVDFVAAAPAETPTVLCTVFLDHGTSGSTQAGPIARDIVLAALAEGL\n>MGYP002518956829 
FL=0\nMVSWNNLDTLASYKELSEVARVNLAEAMTGENGAERVKKYSVPMAAGMAFNYAAKQVDDNVLAVLAKLADEMQLVEKFQALYNGEVINTGEKRMVLHHMTRGQLGEAVTADGGDKRAFYLNEQKKIAEFANKVHNGEITNVQFGLYADADMIADDGKVIPKGALLETAYCDKDGNIIKSGKCDPWIIKELYPTENGYMTKVVGSNVALDLIILPSLKNSLPLCQTEVTPTVDTSTACPLVKSII\n>MGYP001810087265 FL=0\nIMRRCSQTADLLNAALSGSHGXCPGREFLCTLHRCGFKWXDVQTDAVCRHTCFRRLWVGCVCMLCVCVXGXGXVSXEGVVIGVWLAGTGALCVCLXRCGFLLX\n>MGYP000952481259 FL=0\nFELESHFVAQAGQQTDSVSKNKTKQNKNKKQN\n>MGYP000924557708 FL=0\nWRTDHQSFAENGVNRWLRTWPGNELTKTNIAFYWFRGLHLSMDYVPDVAIRQPDHAERIHQALMQSPHEAPMPEAVQAQFAQLAADNRAREPWIARLWVPLVHLQTMLMQASAYPEVARLLDRVAPGLGQIVLALLRAGILVGLLLLVLHWRRLRLWDQQVRLARGFINALAGDCEVIRVQFNSRPVTAHALASDKG\n>MGYP003568761090 FL=1\nMSRLDSMLRRFTAQRDGLNWAASFIEGMEGDALDMGLGNGRTYDHMREIMPDRRLWVMDRILQCHPSCVPPEEDFLQGEAEDGLAGLKEMGAKIVISHYDFGFGVKEKDVEEAARFSPLIAEVMAPNGVIVSGQPLIGFEAVKGPDHIAPDRYYFYRT\n>MGYP000894995155 FL=0\nTLPLFGGCTGQDGDKGQSNAKTAGKDSPLVTIRWFQEARGQDPNKDRILQEIQNKLNIKLEFVAAPAGQESEKLNLMVSTGEQLELVTAFDIDRAAIQWAKDDFIYAYDEFMESGDYPRIKAILDSDVYKDLKVNGKSYFKPQPLWPGLRGYVIRKDWLDNLGLEIPTTIDEYYNVLRAFRYDDPDNNGKEDT\n>MGYP001069368337 FL=0\nPALGGGEQALEDRPIVDALDKAEIPATIVIAFEIVVIELRADAPDRPAIADRQPIGDLGMIEIRIGFRIEMVAPLKHQRRDPMGVIGVDVERDSDEAVYTGTVADLLDAEISHRQRHRSLRRAQSTAL\n>MGYP001036930292 FL=1\nMRCIFLFVFLISHLVMPFLFFLLYFCFLTLCYDSNSK\n>MGYP000703538265 FL=0\nMLSYPVNVAGLEKLDIGFAAYTRYVAPLLEEALKGLIIVALLRSHRIGFLVDAAIFGFAVGAGFAIFENLFYLQALPQTQMGTWIVRGFGTAIMHGGATAIFAIVSHTLIEQERSFALLPGFAGDVIKTVQAMPGVARPTATDPGAVVVRGSGNYDTRFFVDGIDLLVVVLANEITALSGGQPHPGTAHDTQGRRRKPVDLYALAQAALGNGLFAVLLWLLLDPKLWYTDGVSPDPVATTESPEDPAVAAPSGDAADKSAKAESVRPHDVLRSAGRLLAALILVATALGYVRLANFVFHRGVLLAAFLISVWSVRVLAAWGLSRLPAAKPPGAHA\n>MGYP001563729933 FL=0\nMVERNLLREGFVVNTRTPLGTISGTQVVTPQEIDRLADSDIATTALIASGTKLLSLDADLGARFKISRLELYTAE\n>MGYP000417054785 FL=1\nMTTAEASGKNFGSLKITFKYPCDFYISGHHVVITIVFEYHGDIEELLSHNPNYD\n>MGYP003967751787 FL=1\nMIYEKYNNMIQQLVMFNCTSVIIINELTQSNTDYYIGLCIKILTIFLIILYKI\n>MGYP000178255560 
FL=0\nMIKKTIKYVDFNGVERTEDHYFNLTKAEITEMQLGVKGGLDKYIEEKVYENDTE\n>MGYP000422954699 FL=0\nMSARGLWIKSLEAILLVVLCFVIFAPMLGLLLWSIAIRWYWPHVLPQQVGLDYWKQALGFERSLAIGAVSITDAFNTSVLIALIVVAIVMVIATPVGYVLAR\n>MGYP000957065041 FL=0\nMKNDVNKSLERRFSTVQLYSQSEDFELSISGEEGTYYKFRSEDLLYVTKK\n>MGYP001611453920 FL=1\nMMLFHISGVLAEANPDSNPESVPAATTGARRINQSPTSQNDFMSSLANASEPSG\n>MGYP003568452137 FL=0\nMDDGFRRCQAATFKMSCFEFSHSNTDEKEIHIFIWTEKRKSYN\n>MGYP001429666462 FL=0\nFTQRAFRVTIRLVTDTPGMRAWVKLSGDDLVTGGNIGRPMADALLDEHDRRVEAGTLYGFQPFVTLVAERV\n>MGYP001129982810 FL=0\nLYDKENRREVFKSGQKGTLMRMYEDKPIYYDNWDVDLFHMLKHEEAAADGAPELIAEGALRVTLRFHYTYRHSTFEQDVIFHAGSRRIDFETRADWHETHRLLKAAFPLDIRTTKATYDIQYGHVERPTHFNTSWDYARFEVVAHKWADMSEEGYGVSVLNNCKYGHSAHDNVLRITLLKSGKYPDTEADMGRHEFTDALLPHAGSVVEGDTIEESVKLNLPLHKAEGMLWAAAPLVETGSRSVIVDAVKKAEDDGCLVVRIHECRG\n>MGYP000615634015 FL=1\nVKLEANTSDGYKDESYSVDGNILEVVNGSVLSISNNGYNGYNYGKPSEIGKDTALGRKDRLADFHNALVLFFGEDIGKELYQEVKNSSAYAICRVNQTAISEEEKFDVYCQTVFAYSDPKMDCPEDFSSFLYKANTKRKNLNSLRAALQGHYGKDKGMKYYSLFKSHIKIMNRM\n>MGYP001275058744 FL=1\nMSEMTPREIVEELDKHIIGQAQAKRAVAIALRNRWRRRQVPDEFLRSEITPKNILMIGPTGVGKTEIARRLARLARAPFIKVEATKFTEVGYVGREVDSIVRDLVDMAIKMTREEALERVRPRAEDAAEERLLDLLLPPARGSSAPDQETAPTNEEGAGRQRLRKLLREGTLDEKEVEVEVASPTVGVEIMGPPGMEQMTDQLQGMFQNLGGQRKITRKVRVREALRLLTEEEASTLVNDDDLKHEALERVEQDGIVFLDEIDKIVGHSERQGGDVSREGVQRDLLPLIEGCTVSTRSGMVKTDHILFIASGAFQLNKPSDLIPELQGRLPIRVELDALGTTDFVRILTEPDASLTEQYAGLMNTEGVTLEFDPAGIDRIAQVAWQVNEQTENIGARRLHTVMERLLEGVSFEAADRSGQHVVVDQDYVDGQLVGLAEDEDLSRYIL\n>MGYP000812623567 
FL=1\nMKRKVTLRKKQVLAIAVAVIAVIGAIAAWQTWGATTRIAFLNFQVTELGQISKANDNSMIELCEISADDIADLDSYDMVMVTAMGLKLTEEQRAMLKEKAEKVAVYTRMATNPDNYICSVDSVDADFISQYLDNGGRTNYRSMLAYIRKFIDGKKLNAPEPELVKERPDCLLTHYDPSDVDGEELGFNSVAEYNAFLAKHGLYSEGSPQVMLTGFMGATDDMTRALEKKGMTVYRVNKPQLFIGGKHADSIHVAAVVNMAHGRMGDYMVEFLKMKNVPLFSPVNVNRLVDEWLDDKQGMSGGFMSQSIVTPEIDGAIRPFVVFGHRTNDDGLRETYGIPGRMDDFVETVSRYITLQKKSNAQKRIAVYYFKGPGQNSLTASGMEVIPSLYNFLCQLRSEGYNVSGLPATVKEFESMIMAQGAVFGTYAEGAYANFIKTQHPALVTAAQYSEWTGKALSTQQIKEMNEINGEFPGKYMATADGRLAVARLQFGNVMLLPQVIAGAGDDSFKIIHGTNVAPPHTYIASYLYARYAFNADALIHFGTHGSLEYTPRKQAALDSNDWPDRLIGTLPHYYVYTIGNVGEAMIAKRRTYAQIQSYLTPPFRESELRNTYRQLNDAIDSYNKAPNAAAAQKVKQLTDKMEIAAELGLSKKAAYTADDIQRVESFAEELANEKITGQLYTMGEAYSQADIRTSVFAMTTDPIAFGLLGIDKLKGRADGNAEKHKQTFNRQYVEKAKAIVTRLMAAGGNMTDEEICRTAGITAAELKMAREVEAMQAAPDPIMMMMQMAEKMGAKSGKPQMQASQKKLTVSELRKMRLPRHGKIPQLSKAVFDKMEQSGRFPEKMMTAIRNEQKWYKESLKKGAKKPAAKKANAPRFSRSEIRLAQAITAVEHALKNVKAYSDALAESPRMEMASMINALNGGYTAPTPGGDPIVNPNALPTGRNLYSINVENTPTEDAWDKAKELCDNTIKMYRERHNGEYPRKVSYTLWSSEFIETGGATIAQVLYMLGVEPVRDAFGRVADIRLIPSSQLGRPRIDVVVQTSGQLRDLAASRLFLVNRAIAMAANANDDKYDNLVKAGVTESERLLVEKGMSPKEAREVSMFRVFGGVNGNYGTGIQSMVTAGDRWDKESQIAEVYLNNMGAYYGDDKNWESVRKDAFEAALTRTDVVVQPRQSNTWGALSLDHVYEFMGGVNLAVRNVTGKDPDAYLADYRNHQNMRMQEVKEAIGVESRTTIFNPAYIREKMKGGASSAGTFAEIVTNTYGWNVMKPKAIDQHIWNEIYNVYVKDKHNLGTKEFFEKQSPAALEEMTAVMMETIRKGMWKATPQQTADIARLHVEMVNKHKPSCSGFVCDNAKLRQFIASKTDAASAREYQANVENIRQEQLADGKKSTVMKKETLNDDSNKTKAVVSGVLVAAIAIVAVIAIVVLIRRRRKNLN\n>MGYP001306074617 FL=0\nDIMRTKELQNGVLWNPETGQKVEQIEKGLHVVVLARRRRDRPARLPRIVETSIHV\n>MGYP001598923031 FL=1\nMVNAITQVGNVMGIMSVAVLVESRVVLDTLVAIGF\n>MGYP000619228673 FL=1\nMYMHFLHSWIFVCYRAMFVCIFLHLDCLSFFHSFQSIFKNLTISSPLC\n>MGYP003648209433 FL=0\nGFQIVGIPLIDGGFGFELHWHQRSVDLFLGLPFNIASYAALGLILEKITGYKCIAVQGDLKNVYLYENSYSSAAEIMKRGVEVIS\n>MGYP002561378225 
FL=1\nMMDSPKHEAYENGGTIVNRYARIAIAVLASVGLLTSASACGTSQDGAGSAHGAIPVVSSINQWGTLAEQLGGSGVQVTSIINSTNVDAHDYEPTTSDIAKLQKARIVIVNGAGYDSWAVKAAQSAKSQVINAAEIGGVKDGGNPHVWFSAAVRKAVAQAITRAYEGTRPDGKADFDKLNQQWRSKEDEVARKITETKRKADGEAYAATESVAEYLAGDLGLKDATPTGYMRATANESEPTPTDIKQFTDMLEAGKVGLLVVNIQEETELTGKIVTVAKSSNIPIVELTEQMPEQYDSLTDWMAALVDAFSQAI\n>MGYP000499357948 FL=0\nMRLFSDFFQPSIYIFLLLNKNALNGCPKIPNFYEKIAEYYDRHSAAKKNIFTTFHLLNQFYYQKNILERILAD\n>MGYP001675491746 FL=1\nMTHEYTIFEIKARGVGRNKTTCYSIFMSEKRSDNIKKQRQRTKPKRLSVKQYMFIAVVLVLLITTVGIFGIIRYSDTRRLDVAYYGVPESIATAINAVLENPDNATVQKKYSRLRIVQLAESDIRNTKRIAKKYDLLFMWNGANAANAAEKAVVLPESVYNLFPASVRHTGKVNNVPKMLPLLLDHYELACYRTYRNNAGLALPETFNELESYLHTIKGYADYPLICAGKTDATLTAFISAFTESLAGSEGYATLVKAAAGADCLSDVLDVSLGKNISLASILGIIKQWQHEGLIHPQWYNVTEKDIESYMEEHRLGAIFMPLSEHRVKPLILIKYYDTVQFPKGDVANHALIAPVLVGMAFRNDASQLAVLEHFAHTDLQMLLSQHSKLAPASARAEAHDVQADDVRFWAASCTDGPVPELGKAAFASPVKTAAFAEEIRAYMAFTQE\n>MGYP000328593210 FL=0\nMVPVIALVGRPNVGKSTLFNRLTKSRDAIVAEYAGLTRDRQYGEARWQGRTYIVIDTGGISGDEEGIDAKMAEQSLQAIEEADAVLFLVDSRAGMTAADQMIAEHLRKRNKRSFLIANKVDTIDPDLARAEFSPLGLGDALPIAAAHGRGINHMLQEALGIFPKDNAEEEGEGEPASEEVAEGEEPTRIPGPSEKDGIKIAIIGRPNVGKSTLVNRMLGEERVIVYDQAGTTRDSIYIPFERNEEKYTLIDTAGVRRRGKIFEAVEKFSVVKTLQAIQDANVVIFVMDAREGVVEHDLNLLGFVLETGRALVIALNKWDGMEAAERDYVKTELERRLLFVDFADIHFISALHGTGVGHLYKSVQESFRSAVTRWPTSRLTSILEDAVQVHQPPMVNGRRIKLRYAHLGGANPPLIVIHGNQVDAVPKAYTRYLEKTYRRVLKLVGTPIRIEYKGGENPYEGKKNSLTARQVNKKRRLMSHHKKAEKKKKKDKRR\n>MGYP000632763877 FL=1\nMASEDGCGGGNRRVVEPEARISRFAEPVVEVEFVDVGDLVEAHAHDPDEDEDPDGGHDHAEAETEIGYSERVSLFIPTGDW\n>MGYP003625842865 FL=1\nMKSLFDFIIQPLGGKYDNEITIGDKKLILNNKIESFKSVNNLAIVIETPKAYKTPIKKGDIIVIHHNVFRTFYDMKGKKKKSRGFFHDNLYFCQIDQIYLYKKNQQWKSFGDRCFIMPLKNDNYLTADKERKLIGIVKISNSSLEAAGINTGDLVGYTPNGEWEFIIDDQRLYCMKSNDIVIKYEYEGNEVEYNPSWAHSVCLYII\n>MGYP003126176265 
FL=0\nMATIITADRVSGSFTSTGSLGQLSLGGTSTSGSIQPSSSLHIQGNNAEGGIHMFRDAFPGAYGMRMYLVDSGADGQYLRFDSQRNLNWTEVLRIGNGGNTSNQTLQLVTGNLSGSVESTASFGALRVESEEDGTTITTDRFGLTIDGQAGYYPLTVQSPYETAARFISTDGTANIEIGDNSSTTNYNRIQVVGDTRLQIIQNNVDKVRFNQNTTIFNENSNDINFRVESNNDQHMLFIDAGKDKISIGSDIFGDDKMLVAGNVGITGSLHVSGNISTSGSIIAKEFRTEFVNQIIATSSGSTEFGDSIDDTHDFTGSIEVSGTLNIPTGSITVEGGIGGANIARFSRNQGTT\n>MGYP001636533327 FL=0\nAAAAVLVLLAAGLLAAVVVPEDPGAGKAGGLAGLAFQGQAMDTVL\n>MGYP000052352460 FL=0\nIDKQFRLLELILFYYETAGEALRKGAPMQPVFDIPARTDWVLLNANYYVREFFALGKTLLFD\n>MGYP001423369931 FL=1\nSMIAKLIVTADDRPRAVARLSRALSEFVVEGIRTNLPFHRRVVEHPDYLSGNLDTHFVERLLGPQAT\n>MGYP000606642193 FL=1\nMDPILLAIIVVTVIGLIGAVILVAASIFMYVPVDERVEQITAVLAGANCGACGCAGCADYAKSIVEDGNAVNKCTPGGAACAAKVAAIMGVEAGSSTPMKAVVACSGTCGKTGKKYEFQGIQSCQAVKGLYGGDGLCKFGCLGYGDCTRACAFDAIHIVDGIAKVDRSKCTGCGACAAVCPNAVISIVPEHKRKPVVLCQNKDKGADTRKACTAGCIGCMKCAKACPKEAITVENFLAKIDQDKCVGCQLCVKECPMGVIHVPASE\n>MGYP001134501289 FL=1\nMFFAVLAVQIYLLKTTTTRDHQNITEFTFMIHHVCMNKPMVTCTLDELDVDFLLYPLSIPNSAKKFEDFGGATCPLIWLSSELLPVLAAGAFSTYSNREVQDLLLVIVLSVTDGRTGAGSSGFCS\n>MGYP002743407678 FL=0\nMAKIFDDLGYNWKFKVLNSKEYGIPQNRERVFVVGFRNDLNINDFNFPNKLELNKTMQDFLLDSVSGKYYLAKKGVEFVTSKKNIDKRYTQIDGEIQLCQKKNQQFNWHGDFIFQAAREFEFDDFIFDVNSVEEKYYLSEKIKNYVLAGGTKNFKTSTETDLPVARPLLQTMHKMHRAGVDNYVTHNRGRIRKLTPRECLRLMGFRDDFKILVSDTQMYRQAGNSIVVD\n>MGYP000205383798 FL=1\nIHAIEAHHGVAEDAHAGDWHRQVSLLAWESIEKARARGLELGGLDVSLESWKEVLEAMARLPE\n>MGYP000432900193 FL=1\nLIPMDIIEEMAELGVFGLTIPEEYGGLGLGALELCVVAEELGRAAAPVPFSSSVYLGTEAIVKYGTNSQKEKWLPKLSSGELISTFALPETNSEPTEKNIKTTFSNGKINGKKLPVADGSYADISIVVVKNTDNDDIALAIAELTSENVKRKQISTLDPSRDHAEIIFENSEAEIMDIGDEGWGAVDSILNSAAVLMAFEQIGGAEASLNMAKEYALDRYAFGRQIGSYQAIKHKLADMYIAVELARSNCYYGAWALSCLLYTSPSPRDS\n>MGYP000580577341 FL=0\nMKIVPLTLESMWPSAALLSANKEASRENFLKFLEGGFKATQLKFKNMGPSFKNLKMWMDHLRTGVQDQAGQHGETPPLLKIQELARCGGR\n>MGYP001331097511 
FL=1\nLNLNSARQLSFQGDVAGAQKEILNQVRQMGDFNKMNVFQQEALAKATGYSAVELTKMLKNEEKLAQLSDKEKASYEKALEAMKEQNEETGKDLLMKTQMQSAMAQLNNTYEAFKQILADILTPVVNVAVKLLIPALKLALLVFNLILIPVKVLANALYKLFEPLEPVVQSISDAFDGINSKIEEAVQF\n>MGYP000153268017 FL=0\nMIVSCLYCGYVAPIHRVMKRQARALACLALAATVVGFMLRGAALTGGIDGMVDPEMLGLLWQTSVGDVLVYRLIGAVMILVGLSPALGTFLAGVVLANSEFRHELESDIAPFKGLLLGLFFITVGAGINFAVFFRDPFELLGFTLLLMGGKGMVLYLLALIFRMKGRDKWLFTLGLAQAGEFGFVLISFSLQQNVLGAALGERLLLVVALSMLLTPLFFIAYERFQHRMSGDTSDAPEADQIDEKQKIIIAGIGRFGQVVNRLLMLAGFRAVVLDHNLEAI\n>MGYP000930301694 FL=1\nMADDVIPDVIGGAIPVTVIGGYLGSGKTTLLNALLRGGHGRRLAVLVNDFGSINIDADLITAHGGDTISLANGCICCSLQDNLGTTLHSLAARSDPPDQIVIEASGVANPSRIGHYAMSLPGLHLDAVIVVADAEGIRRQARDKYVGDVVLQQLAAADLLVLTKTDLVAPQVVQEVRQWLETQVPCVPCVERGNDQVPPALILGLRSELAGPDHGLGCDHEPYEHVHGEEPHDHRFAQVTFTTEEPLDRGALVAAIDALPPGVVRAKGIFYLADALGEQVILQMAGRRREWQTGEPWGDERPYSRLVLIGPRALVDEESLHARLSVLLTPTIE\n>MGYP001478987189 FL=0\nMRMRRGVIFAALAFFLSAGAFAQDKRPDPKFFIYLCFGQR\n>MGYP001414076324 FL=1\nMLDDFFTRAVIGGIGVALVAGPIGCFIIWRRLAYFGDTLSHSALLGIALALLLEVNITLTVFLISVMISFLLLLLQRRAVLSSDALLGLLAHSTLAIGLVVLAFMTWVRVDLMGFLFGDILAITSYDLVIIWGGGVIVLIVLSFIWQPLFAATVSYDLATAEGVRPEIINMIFMVILAGVIAVSMKLVGVLLITALLIMPAATARRFSTSPEWMAVIAAAVGAGSVLIGLNGSLKWDTPAGPSIVVAALVCFLFSLLPFPNFLGKKHK\n>MGYP000072544056 FL=0\nMAIPMTTGNIFSSCTDDFEKLNTSNIQVDPADLPFAAQCTEPMTYCYPPQQNMFQFWTNLTIDLYGGYFMTPNGNFTNGDMGENRGHSGGMYENYYLHIFNNTRRIIAQCDASGERGLSGVMRIVQAYGTLMTTDAYGPIPYSSILSGENEVYFEFDSQKDLYKAMLEDLSTAITDISAMGADEIAKLKSFDCWCNGDKDLWVKIANTMKLRMALRLSKRETEAGNAGMNLKAIATEAAQNTLATVNKDILIDKSLENEMWLMFNWGDCGFNANLVTIMSGTKDQRQPLYMTPVS\n>MGYP002856813101 FL=1\nMSLNLMYITNKPAVAKIAEEVGVDWIFLDMEFIGKDSRQGGLDTVQNHHTVEDIKNIRKAITKAKLLVRVNPIHEALTDYPSSKDEIDAAIQAGADILMLPFFKTVKEEGQFIRFVGGRAKTLLLLETVEAANLIDDILKVPGIDMIHLGLNDLHLEMGMKFMFQLLADGTVDKLGDKIKAKGIPFGFGGLATLDGGALPGSMVLKEHYRTGSSMVIVSRSFCNTDIVTDLDEVRHIFETGIAAIRDLESKVQHESKEYFEKNHREVVAAVNQIVKNIEAKEHGNQ\n>MGYP003291001117 FL=0\nRSRRPATSNARTGAPMRTIWALCAAAACVVALAATQTTEFPLLIVLMAVLTMVVSWL\n>MGYP002777180191 
FL=0\nVRVIVVGTALPTWAAGADVVLPITTMAEEEGTFTNLRGRVQRYLQAKPAPGLARPSWFAAGDLLAAAGEGQGFFTASEAFDAMAAQHPKFAGLSYARLGLRGLPVIEAEPAGELAGVGA\n>MGYP003430828053 FL=0\nWLNDLLYTHSENPPLEFIENVKGDLAQDALYVFTPKNELIRLPAGSTPVDFSYAIHTNLGNRTVAAKVDGQFVPLASPLTHGQTISIVTNPNATPNPAWLSFIKTPRARQAIRDQLKTLREDEARKLGKRVLTLAMSSVGLSSQRIKKSQLAKTLNQWGEPSLDSLYTSIGLGQKLAPVVARQLLPQDDAHSDRETLPLVLDGSETQVVEYAKCCKPLPGDPIVGHMSAGRGLVIHRKQCTQIGQKRHKNMPPPQKQDGNWLSVTWGGQV\n>MGYP003343356212 FL=1\nMKVSIDKSVGGLQQGLTFLASTGATAPFIGLFCTVWGIYHALISISTSGSAQIDQVAGPIGEALIMTALGLAVAIPAVLGFNAINRANKLLVADLNRFGNDLLAYFVTGARVHSGE\n>MGYP002238360443 FL=1\nMSQQELASMVGVSYRTIRSWEVEGRFPKQNVLYQKLADALQCDVSYLMSENEAFITEASEQFGNRGARQAQQILEQAAAMFAGGSLTDEDKIAFMDEIQSLILGFPKDVQRKFTP\n>MGYP003335923377 FL=0\nDSCCRGCFSFVSALFNLVASGCLSGRFSLVSSCFARPSRFFRMSFWGNGDHSLVARGXSTQFPGGYILHDKGTPLQTRTVRRVLQILGRSPEMELCLCLREKRESSCHTSDAQKCEVHAXRRGWRERQLHLWSTPXAEPMDTACAPGRTQQDSMLHSAGGLLLRPRAKPACTRPAESAADPTVLPSVFPWRPWTDIPLTX\n>MGYP003595024705 FL=0\nHPWFVATQYHPEFKSQPLAPHPLFSAFVAAALRHAGERP\n>MGYP001183065379 FL=1\nMNDHQNITGIYPGTFDPVTFGHLDIVERACNIVDKLIQNHKIAWICGAFVAAMNNYLCSKYLLFDD\n>MGYP001772517118 FL=1\nMSTYIRAVVAAMAIEEKYGIPLGDLVDTFADIPAADVVEVVHGRWVFGKDLADSFGSINKNKYHLYCSECRNQAFNKTVDNDPDFDVDTPFCPWCGAKMDKEVIL\n>MGYP000932959631 FL=0\nMAELLKVEKLWAGYGEAVVLEDIAFSLQEGDSLALLGRNGVGKTPLLSTLMGAARHRSGTIQFAGRDQDRIAVGIFE\n>MGYP001710201224 FL=0\nMEKELDLLIATEMSGDGDSVAEELRSVFAKRGVTVHRIEFRSGKDSVIRSVRANPQIHAVVLSQYQDQEKLSPRDIDQICSTAEGDLQVFVVVSEMRGSDYMKEIESLGIYTAVYQEDASFEKIADCEAIRPDIAGIMGAFGAALIAREHYEDGYVTTMLDYQKICELQFETSMAKCKGCTNNCRLTINKFSGGRQFISGNRCERGIGGQKNAHNVPNLYEYKLHRLFSYESLDADKAPRGVVGIPRVLNMYEDYPFWFTFFTELGYRVVLSPSSNRKIYELGIESIPSESECYPAKLAHGHVTWLIRQGIKFIFYPALFYERNEFEDANNHYNCPIVTSYSENIKNNVEEIAGGEITFRNPFMSFRDLGTVTDALTKEFTEIPAGEIAAACEKGWQELANARHDMEKKGEETLEYLRQTGKRGIVLAGRPYHVDPEINHGIPELITSYDMAVLTEDSISHLAKPERPLIVSDQWMYHSRLYAAASYVKT\n>MGYP002084656506 
FL=0\nLLGFVDVVGGEDDGHARVAQRAHHAPHVLAQLDVDARRRLVEKQDARLVRQRLGDQEAALHAARQSEDLAVLLVPQREVFQHLLDVGRVRALAEQAERIDLAVVSANFFEVFGARAAQGRLFSSADEQAGHAPVVVLSHAFWERRLGADNAARVAELVGANASFELCETLKDLANLPRVVQAKRN\n>MGYP003719918597 FL=0\nLGLTVSGPLEPEPGPALDKIVTFVPVGPSIAAVHTALSDAGAGAIGNYSHCSFATAGTGQFLPLDGAAPVIGSVGRLERVAETRLEMVLPRSRRRDVVAALRAAHPYEEPAFDLLEMAPLPSSLGLGRVGELAALGQQRHAVQQLDGAALVLPRGAGVAQPGDQRMRRVX\n>MGYP003357866643 FL=0\nFVLQMIWKNKSQQSFSRLFYHSTGLLAPGGWNGAFRSIYPTLLCITISGAATLYGSIQKFVPTTWVEFYFHPTINPFSLEPAHLGSFYNQRLVYLYYLVHGSYRFVASWTVSTSSYSFYRTCLHLCDSLSNLYHHCSKLCRLSSPLDLLDLCYFAVSQSTLYNTVLWQLRSRNTSARNLPILWRNQQIVAHSR\n>MGYP001703284989 FL=0\nSNLETACCQIVSCSLXNXXXFYIHLGXGNKKQFIKIRIFRNSFWXFFFYIYKRFNFKIXRYNPNRQNRVYKXVDVLX\n>MGYP000305843427 FL=1\nMAQIIVLGAGTGGVPAAYELKSALGSDHQVTLVNASSRFQFVPSNPWVAVGWRKPDDTSLDLT\n>MGYP003518858476 FL=1\nMILAGITLFNPDVARLEENISSIYGQVDRVICVDNGSDNIKSIEDCVLKNWKNITIINIERLKSGQF\n>MGYP000766296581 FL=1\nMVCSIEKVSLRHERRVSRLAEDYVIEMLHITKEFPGIKANDDITLQLRKGEVHALLGENGAGKSTLMSVLFGPVSYTHLTLPTILR\n>MGYP000585817851 FL=0\nAVLVAFDTAEEFEAYQEGIEDAFLIALNGLFETSESVCNRDFRFVESVQAKLGVDVNQDYFDRRLQEDSLTTSNPSERPLNEPISFQATVEPANQEPTTNPSISLGPSTSHQPTFEPTYAFSSSLNAILFVSGICNGCENSIIWTNQINGRARHLGGEDDQPQNWSPRRSLEEEQAESSCFCPISAIVQDVALVASDVEQQFQSQLSRSS\n>MGYP000583006313 FL=0\nMTGQRFSNKQVRDMERLAHLTSALLVAV\n>MGYP001048952483 FL=1\nMKRNRILIVEDEQKLARTMGDFLRFQGYETCRAANGREALAIFYRERKTLDLILLDVMMPDISGYEGLKEIRKTSNIPVIMLTARSSVEDQMSGFEKGADDYITKPYTLELVKLHIEAVLKRSGKLAKVLEYQDISINVEAQKVYWKGNYIETTRKEYELLVYFIENSGIVLARNKILDAVWGYDYVGDIRTVDTLVKQLRKKLTEECTYIKSVYGVGYLFGEGGYEE\n>MGYP000370032573 FL=0\nTATTEIYTLSLHDALPISARFWYAAASMKSHLSGGKALTAQKY\n>MGYP003323358317 FL=1\nMASIRSRNGRYQVQVRRADLGSRSRTFVLKQDAERWARKMEAQFDQGELQQLRTKDVVLHDLIDRYRREIAPAKKSRDTEGVRLARLMRDPIASLSVGKLTAHELALFRDRRIKDGIRTCQYDLVLIRHILEIARKEWNLGLAVNPVDQIRKPNGLRPRNRRLEPHEETLLLDGCSKSSVTHLKPIITLALETAMRRGEILAIQWGDINESLRILSIPVTKNGRLGHPTIKYGPDDSPGDSKGHF\n>MGYP003316122480 
FL=0\nPKVTRLTHPHRRHLAAARLDVHHRGELRVGLGGERRGDAHALDAGLGGGHGRAVIVLARWRCWRRIAQAVRAARGVTIFAREVRQLGELKGNSAQLPADA\n>MGYP004316249655 FL=0\nMIRNDTLRLYNQRLTSGDKMSTNPDEWKDNLIRQLAEMFKGMNMPFDENMIRQMMEQFSEQFEEMGIDPEKLGSVDMKVDMKNFAKAFSGGADMTEIFSNFGFNVEVNSPPVEVEVDGTPNSSKNEIMKLPEADWYLDGWNMCLTVDCNNSLSSDDEKVNLSIVNNGGLLEISLENAPQPFARIELPHPCESVEEIEINNGIVDVILKLMPQGSALDDEDD\n>MGYP002631629027 FL=0\nKPEITLNMTDGSNNRFAKIYYLDNATTSFDNGYDGETFGGIANTTDVFTHLVANSEGKKYQVQSLPNSDFENMIVPVGIKAAAGKEITFSAEAINLPDGIKVYLEDRTANSVTLLSEANATYKVTLGESLDGIGRFYLHTKASGVLSTSEVALDNISIYSPAKSTLRIAGLTQGKASVKIYSVLGKQVFANTYNTTGVIDMNLPTLATGLYVVQLATEKGTLNKKITLE\n>MGYP001549131463 FL=0\nQLARRFCTVTITRMPDHKGRKTMKFILIAPVLANLLFFASIASAEKTILAGGCFWCMEADFEKLEGVSDVISGFTGGTLIDPTYNGNHEGHVEAVQITYDPDTISYQDLLKHYWVNIDPFDARGQFCDKGPSYLSAIFVSNETERGIAEQLKKDVEEQFPDKTVVTPILDASTFYPIKGSEGYHQDYYKKSPFRYKTYRWNCGRDKRLKEIWGDKAVDT\n>MGYP001793035123 FL=0\nMRTLWVSAAAGAPLQSNPTTPGTQARGVEDGHRATTAAAGKCHR\n>MGYP000255802630 FL=0\nMEEKNISRHPDQSLKQGRKCVTYMYENRPNIWLQIQRDFNMIRAQTPAKVEMDPEEIYILG\n>MGYP004001795269 FL=0\nGETIGFWDGDALITWTSNIQGWMSHSGFEFSNKMQTIEIYKSNYDSNGNFSGINHEAIFYDPEALLEPVRIVRDLNKLSSFREGDPIVFTECIQTIFPQNGRGEPVAPGTVIEYKVPDMYGQPWRQIWEEYFEQDMDIPKEDDIFSF\n>MGYP000644120371 FL=1\nMKKRTPWKLIPLKSVPIFILLLLSLGGTQAFSFSPTVVLGGRLDQVFSPQSAALWGDMYGFGSWRTTLGSEAYAVFNADSSFSLPLDQQAASVDQHSLSAQVGLSLPRGSLLLSSETFFSIKDPLYGLTMLPDWRGRYGIALDQKSTKKAYVGYSGSYLYQEKGTEDRLSQSTAIGFIYEPSFTRSYRFELNGSLDDLRQRETSSGQQRRDYGTAGEFEVSGLAGYFMDWSLQILAGARLSNDPTYEASIADLEAQISWGPTRNLNLSALLYGEGLSYWERTTEDGSDELTRIDIGGQVELDWTFNNSLYYTVRLTGAHILSNEPSLASWDISLGLGIEWGF\n>MGYP002638041597 FL=0\nKAYRENMPFDQFTIEQLAGDMLPDATEQQRLATAFNRNHRQNGEGGALAAEYFVENVIDRVETTSTVWLGLTTGCARCHDHKYDPISQKEFFQLYGYFNNIGEKGIGNGTKANPLMSIGSPLERAPADHAEKVAALDAAVATAEKDLPARFNKWVTGAHAAAIDPEAVWFSADSVMSNTVAGKKGSLKLLPDSSFRYSGKTTTGVDYNLKLAPG\n>MGYP000692869867 FL=0\nMESRTVAQAGVQWRDLRSLQAPPPGFTPFFCLSLPSGWGYRHPPPLPANFFVFLVETGFHHVSQDGLE\n>MGYP000986204494 
FL=0\nMKRLILVPLALILLKVLAACSSDEEAEPEINQVAYSAMDNYFVGPQYLPAGMTKLTLTNDGQELHHQQLIAIPEGMTADRLLVGMAEGGDAPPPPGVEAAGGASALNPGLAGLVTQNLAAG\n>MGYP003576055532 FL=1\nMFRTALMAGVAVLAGVAVGFGAIEASAPVSAAEAIPNFAPDRNTGWVLDRGNHDDLLPDGSRPGPVTFDKAHPYIPNAQAKGRQPTYRVADLSNPILQPWAKEQMKKANDQVLAGKMPFRARELCWPIGVPGFAVFSAVEPTYIFQKRDEVIMINQGGPEIRRIRLNAQHSANPKPSWYGESIGRYENGDTLVIDTIGVTTRTFVDNFRTPHTDKLHTVERYKLVDGGKAIEISIEVDDPGAFTTKWYARQRWNRVQEPLTEIHCNENNEDLFNLYPMPSPKAEKPDF\n>MGYP001236546810 FL=0\nMKQAIRVAEAQEIVLQSVQPLGIEKVDLLQALHRLTAEEVIAQRYIPLEDNSAMDGYAVQHHDIATATTERPALLTVLETLPAGKTPHYQVAPGTAIKIMTGAPLPAGAE\n>MGYP001162411550 FL=0\nMLSRIVTLKVLLKELLGHTTPIIPLMISWMIFKFSTNFYDGSTDSSKEKLKSLDINVISHPHNLGYGAALKTGIKNAKFDTIVISDIDGSYPPKHIPELIKIYEDSFDLGNGLDMVVGARKGKEYDGSFAKFIFRKLLKFLVEWTTGRTIVDINSGMRVFSKKTVSNFLQQLCNTFSFTTSLTLAYMLNAKFVKYESIEYDARQGNSHVRIFRDSLRTLQYIVEAIIYYNPLKLFLLFFIFFIFISLIFLILSIYIKSILFMMIMASSVIVAFISLFFGFLLDLIRQNSKQK\n>MGYP001489463811 FL=1\nMFAGACCRVEKADSVLCGDDQFVSVGHDVAYNIRGQCGRVARFHPVNGKAVGVQVEFVQSSQVCADPHNLLCPVVIDCLELLCEILFLPSSWRYQR\n>MGYP001439564737 FL=1\nMSFIIRAARMDDVQALYEMAKRTGGGFTNLPPDRKSLTAKLERASAAFARTGDGIADDLFVFVLENLDSGEVRGTCQIFAQVGQKWPFYSYRIGTLTQHSVELDKTFRAEMLTLTTDLEGSTEVGGLFLHPGERAGGLGMLIARSRYLFIRNHRARFGDRTIAELRGVIDEAGGSPFWDGVAGRFFGMNFQQADEFNAVHGNQFIADLMPKHPVYTAMLPESARSVIGIPHPSGRAAMRMLENEGFAWENYVDIFDGGPTMTARTDQIKSLREAIDSRIVAIDPSLSERSSGETASPAHGQLPPPRAAYDLLDRREDGIAIDPDAARLLAVEPGNEVSHVSRA\n>MGYP000479884579 FL=0\nMRLKNPELFRQQCFVAGEWIDAKSGKTFEVYNPATGGSVGHVPVMGRDETRAAIAAAEAAWPAWRQLTARRRSRIVRRWYELIMENQEDLAVIMTVEQGKPLVESRAEIANGANFVEWFAEEAKRVYGDTIPMAQAGKRIVVIKQPIGVCGAITPWNFPSAMITRKAAPALAVGCPVVVKPASRTPFSALALARLAEEAGMPAGVFNVLTGPAVEIGAELTGNPVVRKLSFTGSTEVGKKLMRACASTVKKISLELGGHAPFIVFDDADLDEAVAGAVASKYRNSGQTCVCANRFLVQEGIYQTFADKLIRAVSAGLTVGNGFTEGVNQGPLISLDAVQKVERQIEDALSRGARIGCGGKRIEGNGFFFEPTILLDVTPDALISREETFGPVAPLFSFATEEEAIVMANDTPYGLASYFYSRDVGRIWRVAEELEYGMVSINTGIMSTEAAPFGGVKESGIGREGSKYGIEEYLEIKYLCLGGLDKT\n>MGYP001249954087 
FL=1\nMRPGFAPDFAEANQDKLMIFGLLRKNNVNAVIVERQYGILTTAARRPEFYLEANVPDTVMGRFEMLSAVLILYFRRTRQSGEAVKTIAQEIVDAFFEDLDHSMRELGIGDNGVPKRMKKLASMFYGRVDSYGTALDANDSQALAAALKRNFHPENSDETLTMERLALYMTEAARALDSVPESVLERGELELPPFNGGAADAAHV\n>MGYP001276526933 FL=1\nPQHSDTKGFTTTSVALPDGTAGVQVSMTIVSAGSSILEFAAQADNRTEKMINGAVRKRVS\n>MGYP003150834777 FL=0\nMALISRSQHEAFECFENDVLMMAESDEMSGSSDDKTPVERLQVA\n>MGYP000526089798 FL=0\nPYAEWIAGYGDPAYAGTVDRAMGIGSEIAETLKTEERLAMTAAFLRSNRLEWMFWDAAWRLEAWPPIHRDAGVPPRQ\n>MGYP003495424184 FL=0\nMEQIVANLALMKKNLKQIGYQGEILLESLDYHEGGAYERVTEPDFIREVVEKSGVKLLVDFGHLLMAATNNSLYKPDQ\n>MGYP000214496963 FL=0\nQHPNVPEAHYELIPKRAANPMKTDWLHPVRTWRRRRATSVPFPREWDEILARNFPLDARLPERDRKELRKRIQIFIAEKHFEGLGGLKLTDEVRVTVAAQACLLLLHCGEKDYPRLSSILVYPTAYKAREVSRSADGLVTEGEEVRLGEAWNLGAVVLSWHDVQFGAGDYHDGSNLVLHEFAHQLDMENNVANGAPLLPRRSMYVAWARVLGREYEHLRQEVAKHHRTILDRYGATNPAEFFAVATETFFEKPAQLHDRHPELYELLREFYRQDPRSYFTRPPGAGSPGSETAG\n>MGYP000694618993 FL=1\nMVSLAFISVHLSAVIGPVGRLHGLAHDLAIRVLGQLLHKLDMARALETAQAIGAEAVDGLVDARVTGCLPLLEHDVGSHGFAPFVVGAGDDGGLEHVGVAVEDVLDLDRGDVLD\n>MGYP000858948085 FL=0\nWTRRVPHPVLIGHAASLTSVLLSPLRGAARAGGRTAQARRGPAAQVRGAPGARRPAPPTRDAPRLRPDIGRASGPRRGALTCGVLAEGYHGLGSRTRRLQCPHRHPRCGEVVGEPRRGARRVAAGRRRRRPKWTRSVQLVREGGGGGGGGGEGAGGGGRTLRVGSSPAVHSRQHNQYVFQAA\n>MGYP001041972360 FL=0\nHGGDYNPDQWIRTPEIWDEDMRLMKLAGCNAMSTGIFSWSSLEPEEGRFEFGWLDTIMDKLAANDAYAVLATPSGARPAWMSEKYPEVNRVNEAGVRALHRGRHNHCSSSPVYRDKCNIMNSKLAERYRDHPALLVWHLSNEYNAGACHCDYCYAAFEKWLRAKYNDDLDELNHQYWSGFWSHSYSKWNEVRPVDGSVHALMIDWRRFLSDQLIDFCKAEIAPLKKFTPDVPVTTNFMGF\n>MGYP000630167433 FL=0\nNFTRKYPTLESGSKVKIFRKKKNFEKERTSTWQNEIHEVISIGTSHGQTFFKLDSLPKEYLHNELLKVS\n>MGYP003587511970 
FL=1\nMGKILLVDGSSILFRAFFALPHFTTTSNIPTSAVYGFLRMLIRIIKDEKPDYLAVAFDKKAPTFRHIEFKEYKAQRPKMPDELSLQFDIAREILQSFGINYFEIDGFEADDIIATFVERLKGENIKISILSSDFDLSQLIDDNVELISPKKGVTKIEKIDKEKFIQEYGFEPTSVPDYKALTGDPSDNIEGIKGIGEKTATKIIQEFKNVENLLKNEETCKKYGIIGNEEKILQNKSLCVLVRNVPIAFELESLKLRDFKTENVKAILEKYEFKSIVKELGLDKVDFNEESIFNSLPKEIGKEEYRVNLESENTAVVYLISSEKRIDKAILFYNERFYDFDFSSNLFLNPSELDVLKKVLEDETVIKYTNSYKSLLKLGNFLYTFVNNVKLDSTLASYLIDPDQSEFSLKNLAFLLGKDETFNSFSDEVVFLKKNGDYILDFLKKEKLFELYETLEMPLSRVLFEMERKGITVDVKVFKSLKEEVEAELSKLENEIYKLAGLSFNILSPKQLSSVLFDVLGLEAPPDSKGSTGSSTLLEIVNKHPIIPLILKYRHLTKLLNSYIEPIPRLVSKETNKLHTIYHQIGTATGRLRSTNPNLQNLPVKDEWGERIQSGFVVSSPDSVLLSADYSQIELRVLAHLSSDENLIDSFLNNYDIHERTAMEVFNLKKQEVTKDKRNLAKAINFGIIYGISPYGLSKQIGTSKEEAADYIDKYFKKYPKVYEYINVAVEEAKKTGETRTILGRRRLIRGLDDRSAAVRDAARRVAINSPIQGSASDIIKLAMVKIFNDVSDVDILLQIHDELVFELKEALVSEKGEQIRNIMESIVNLKVPLKVDVSFGKNLGTARK\n>MGYP001804161484 FL=0\nYWMIGTNSSNLRPPTGEQSREGIMLYFTMKTICTKISCLXQSQMALVHRTXSCNQPLNAMFTFMLLWDFAKKTQPTXSLFFGSIVIFSLAHIGSQIWVEKNFMKNHWPD\n>MGYP001421152768 FL=1\nMLVGGAAGDAGPPVRPVPPRPGRPAGVDPWSPRGAALSAARTGLSPGAPGLGASGDTTRAARRAPRASDAQKTLRPPRPGDVAARRGPARVRPRAR\n>MGYP000446294339 FL=0\nLIVAYPITKNGAPATAADIDGTNNHGDLNDGDRITFTFETTVTGTVDQWVEAEGRLDWEDDTITSPYHNESKGRVQIQDDEQTYTPKDTDDMSIQSVPVYFNHGTNPIMSTAQTYHLHSMNYQSNTKVVTDGFYTRIKDDRAISTGWKLTAKLSDFKDSSNAPMPNGTGTSLKLENMSIERVTDRDTPQETIDPSPTGTDVPSSVQSTETIVAGQPTAKTLVTAQPNQGQDTWQLRMPFDKISLNLPANAGKKGTVYKAKLTWSLDDTP\n>MGYP001472249376 FL=0\nMDYSVSEGINFFDTAEIYSVPPTAESYGKTEEMIGNWFEKRKNREKIILASKVAGPGCDWIRGGGNSFDEKKIGEAIDGSLKRLKTDYIDLYQLHWPERSTNFFSKLGYRHNKNEGSWTAFEDILATAQKFVDQGKIRYLGLSNETPYGLSKYLHLASTHKFPRVVSVQNPYSLINRTYEVGMAEMSVREKVGLLAYSPLAFGMLTGKYLNGQMPEGSRLKLYSKNFPRYQGTRSQLAVEEYYKIAQKYEMSLTQMSLAFVNMQPFVDSNIIGATNMKQLEENINSIHIDLSDEIIKDINAIHENNPSPAP\n>MGYP001245916141 FL=0\nVDTMQSTPVESGTTTFTAEEEEMAQFVSVVLKDTETIWGEIFKQAGSTYRQPSLVLFSGQVQSACGYASAASGPFYCPGDEKVYIDLSFCDELKTKFGAYGDFAVAYVLAHEIGHHVQNLMGILDQVNAQRSRLSETKANQLLVRLELQADFLSGMWAHYEQQMDYLETGDIEEAMNAAAS\n>MGYP003647845281 
FL=0\nDYVTMPDSDVFDWGTGDFSISWSIYFTTIHTTTAAYVNNMFGSSLSGVGLVIAYKNGANLFLLMNNTTVIDQSYSLSTGQWYQMEITRSGTSINWFIDGVSRATATSSANADKAAPLAIGASNEGGYRASDRDIAGYMDEIQIIKGRALNTSNFTAPSAAYSDPQAPANNFTNNNTVTTTTHTPTNLNCLLSPLDKNSATVLSNGNRTQSDLGASW\n>MGYP000974398092 FL=0\nMVRRQEADRYGLAAVDHRAPAAVVFRRVEVAQRLRNVVVVNLGVVLGDDAVERRQRTVVDGVGIPVARHLPVGHAQREVGVGVEGPLAVPFAQTFNIGGVEFVENFAVEVAQRLGSQHPRDMVEHAFGLLAQSGGRLHGHAVGAFPDGLEKGVGMGFRRFVAGYAFGEGGYAVDLRATAVFAECLAPERPLGGLAPCETLLGAFFGGIGCRQRRQRFAGDLVSEIGIHDTAVFGAQAHHFGVFGVLHGPESELRLVIEFCCDGPAAVDAQRFALPFFPGVGDRGVFGGIVDAQRGVGLLRFGDDVEAPRADSDLGRIGTFGDVGHGVGKDILLRVARESVDHREIALFDPFRRYREMFFRTIRNVPGRVGRRAVVFRSIDAEHREVARVAGPDPVVGVAAELADRRGRRGHEAHVVELLVDEQELLVAVVHLLDRGPETLAFGLGPADDLLGRLPGLQAVGHLLHAHEEADVEPFVGQLFGPRHGPESVREVVVLDGRVALDGVVAAVVVGQQQPFGRDQLARAAAVEEHYGVLHRGLVDRIDVFGREAESFRAHVVDALRDEARKPHALVGQSRQDSEGREQ\n>MGYP000161612758 FL=0\nMAKQSKNLAKVQSMLDGTYGGKTQVGYGDQDSKHRSVGDTWTDSEGYEWEQKEGFRVKNSVMPAVGMFNHQCKDCKKNCSPKTAKPWDRDCFKADGRCYYCQLDYEVELKTKPIRWFAYRRLKDLQNMESLEKDMIQWVDEMTKQREKNPFDMKVANAMANGEVEMSIKKNTQ\n>MGYP003493975136 FL=0\nCIQPXRXMXGFLIVKLRPIHQLPLPQVQHGHPGAIQLGQDIRVRYXHETSESPNHALQIIVYPKSKDLVSQSMCNHSIKDTNMPSITWILKLVSKRYSR\n>MGYP000200203148 FL=1\nIWGVLPVFGGILIFVSMASLGLPGLNGFPGEFAITRSAWGIYTWQVAISMVGLLMTGAYVLKGIGETLHGPVKPEWRNLPKMTITEHAVVWPLMILILSLGIWPQWLQAVINDTATMILGG\n>MGYP000071017550 FL=0\nMKKFLSLMLAGLMSASLFVVGAAAEEPKKETVVGKDGGVLDADFTKNETSNDNNINVKVEAVTHKYAVDLTFNFTDLTIGGLVWNVETLRYDFAEGKALTDSEQTITVTNRSDKPVYAWGTVTDGDANDYVTVGMKTGETGSGTNDRLEVAKATAGQTANGTATNGKLTVSISSANWANVANYYGKKVAETEDPSTVNFKAATVTVTISKNATK\n>MGYP003685103309 FL=0\nMKKNIISNIVKQVRTNEPIEPDTVLLGLILVSLGPLNIFPTT\n>MGYP000129413943 FL=0\nNLKSIQYGGSLQFPACTHRKDKYDGIREEIELWLDDMMVKVNDFTVEKRYGEALNYYVHDIFPTALKLIVKIERWMAREKRREMEKRLARSMLGNINTHMVDPEELTNKRLRGLDTYFYGMMNEQIVVLIEHLKKCRMEGKNGWDPSFLRRDLIMRLAELYRGEFRSKNYKKKPEYVGEKYRYLITR\n>MGYP004202648141 FL=0\nFQTQFFEFCNEIEPFLYELAQILLRGEKRENDVRRLSQNTYKRLGM\n>MGYP003594687530 
FL=0\nMYPQLTTQPGAIASAAAIARGELSPLEAVDAAIARIEALDGPLNAVVVRDFDRAREAAKALDGKQPGADQPLFGLPMTIKESFDIAGLPTSWGIAEHKGHIAQGDAVVVRRLKRAGALFLGKTNVPPFLADWQCDNPNYGRTSNVHDHARSPGGSSGGSATALASGMVAAEYGSDIGGSIRIPAHFSGVWGHKTTWGAVSGDGQNFPETDGHEIALGVVGPLARNGEDLALLLDLTLDLPLPKADKPIGQSRFLYIDRHPLCEVDDAVRGP\n>MGYP001596028094 FL=0\nSERAGGSAIPRERDSGGVRRSDSEIRGSDNRRFGKRKPHHEKSDRKNEKKLLHKC\n>MGYP001229890441 FL=0\nTGRIPVWWGFVHIVSKAVVSASIAGIPCAHDLASIDATLANDRIDDPHVAMELAEFIRDCFMKSKSKLYQLDNTATLTEAENKSTAWIGSKYFLQKSGYYDSNYSESGRKDWSFNPTRDAGFESSKTPGGKGGHPICSEWWLDRNVGLRKKLIGSIDNNYFTNLMTIIGSPKYFNPVGNATDRENILLRKYLALQTNNSGYSGSGLNQSFGNSYAERWTLDRSQGSDIQASISYGLGNVAIDGLVVASAAVGGLLKGPGALVEGVMIREGVTLFQGFLLMVFVIILPFL\n>MGYP003333085768 FL=0\nMDGLKFDLAQFCKEIRTLLQVAAEGHVAFGMRNETYCFDFAYRKFVTAEASRRKEEVNWETTMSEIQEITADSGDLLGEVDTHVVSVALSHAVFGRADWAIMLSCFACLWHEVKTKYVDKEKWSLTILLDLLRSGRLSSIVAEYKQKHGYAPHPCTLLELYEKEHPDELDLHPPTPRMKKKRGAPTQLLDAKADPDQRTASNGEDAFMLAATLRTAH\n>MGYP001563487917 FL=0\nYNSQSPSYTQSNSILANVHANARSVYYNVLMSLVRGAQCDPADPYIQQPYMQQPFVYQPLMSPQFRAFVNSRYKGVGIGIKQADSLHIVKATTLPPFYLYVLAQSEVASHYVKGVPAAGGEAAPVNVLTYTLVPNVLFDADAGLVRIVNDDAEQSPIIIASTKDDQLNYNLGAASSLVLVGDQLHDTN\n>MGYP001435143440 FL=0\nMKEVIELRLSCIVYARIRVILPPNLDQTKRKRFSKRADIWGTQDPGPQRPDI\n>MGYP001552004220 FL=0\nNQAIFQLAQLEYLANMPGNEGLRPLVEAQRQVIMGGMPPSGAGATPSVTTGATPRVVPAGGAPGATPSVVQPADQYLADQAILLDSETGGVNADGTPFEPPAPVVTPSEPLPEAAPTPDVAAPTETPAPQSTILDDLQQEIDQNNALIAQRREELEAAIEQYGRAETGAGMGLPTSPGGAELIVEQIQSDINNLTNRNETLEQRIFEQRQVERETQAAAEQEAAEQAETESRMQPLIDDA\n>MGYP003921459353 FL=1\nMENLKKQGRLIMPQKKPKGNQKLLLIKKNNGTYLEEEFFDVKFVPLLNKDIK\n>MGYP000745101651 FL=0\nRSEKRLRTLAWQYEGKHIVVANATIFIEEKPAMPNRRIRRNRTENASKRGTKETLREICNRNFNVVTLINLLVMTAYPLIFTFVYSFTDYNLLRSLKKGSHFIALQNYTKLLSDPYFQQSILNTVKFTILAVIFEMFIGLVMALFVNSLKRGQKTMRTLLLLPYLLPTVTVALSWRMMLSPNYGIVNQVLQALHLPVYNWFSDIHTAFGMLVLIDVWQSAPFVFLLLYAALQSVPQSQYEAARIDGANRFKILFYVTLPNIKNSLALCALLRTIDSFRLFDKVNLLTGGGPANSTSTITQYLYNYGIKSLDFGFGSAGAIVMTVLVLLLSSVYIKRAIS\n>MGYP000475249838 FL=1\nDALPICFNLDFTYQRGFIKTWECNTSNVLIRLGVAF\n>MGYP000373718212 
FL=0\nAAEMWYSMHSKVLGDSFTVKNPLIIYNDHPGFQQTNAIQGAISVGTGGVTEGLRNRVIFPVAPTNQQTNHVLGHELVHAFQYHMIINGDSTNIRNLGNIPLWMIEGLAEYLSIGRIDPHTALWMRDAVLNDEVPRIKDLDNGKFFPYRWGQAFWAYVTGIYGDEVIAPLFENTAKYGLKMSVPMTLGVKVDSLSENWRSALKSHYGRWAIKGKKEDLPGKTLLDDANAGEMNISPVLSPNGKYVIFLSEKNLFTTDLFLADAKTGKLMRKVASTASDGNVDHFNFLESAGTWSPDSKRFAFDVYENGRSVLVIKGIFKGAKSEKIRIPDVPAFSNPTWSPDGKTIVVSGLVRGQTDLYEYNLKSKKVRRLTNDLYSEILPTWSADGLTLAFSTDALSVQRGRTNGAWAMNLAVMDIAFGKTENLDVFPGADNMNPQFDKNGNLFFLSNRDGRRNLYRYDMLTKKVFQLTDLMTGITGITPYSPAITVADDRDRILYTHYNKGRYTIHQAKDADFSPKEIDPMSVDQVPATLPPFSTKQRDMVNTSLRLMDTAKDSVSMTSKKFKPKFKLDYLGGSTGVGVNTGNSSFGTQTGLAGGIDALFSDILGNNQLYAGAVLNGDIQDAGGQVSYINQKNRIGWGLNASHIAYQTGGYSYLAYTPVETSPGQTDTVLASVFGLERVFQQRLGASAFYPFSVTKRVEVGAAAEFYSSRVTEYSDYYDPVFQNYLGSDQKKQPKGPSLNLNNINAAFVGDNSYFGLTAPLQGWRYRFGAEQYFGDYQFTALLADARKYLYLKPITLAVRGLSYARTGGNSTAFSLQYPLFAANSNFVRGYDRKVFAATDDPDFIYRTVGSKMIVGNVEIRLPFTGPRRLSVIKSN\n>MGYP000608946936 FL=1\nMLSLAKRALASDYVKSAELAKKADDKQAEIDALYSQWEQAQQALDELCEESSKQG\n>MGYP001546073984 FL=0\nLIAAREERQRRKEEERRAAAEAIERAKREAEEARVRAEEEARAEAGRKKEEELQKMMQLLAEQKAARDARYAARKERLKKGRR\n>MGYP003398203515 FL=0\nLLPPWEQGYKNVFVNKAKEILAMLLFNEESLEGQLKVRTSGTPDGAETHATTQVYPLPTFHPDCQVVSPSDFSMKPVPCGYDLTRLLPTPDIARTHIKLANSVSTSSMLVIDPDNVIKHKIVPPPILDKIYIYQAINPYNGLVYGHGAPKIFPVDGLRKLDLSKFPIDGDFTLWAAREIGCGVEVLNETVAVHEFGTSQTSGAITAYREAYKLQRTLVGAAPYDSLFVPRIDSPRMGAPRTANTDAKNSTMDSVFNVTDALLEAERRTVLKRLETWISVNCYPSTFKYMA\n>MGYP001150268012 FL=0\nMQLESTGESGEDMGAVSDDMFTEFFTQVLNPELGCVDMVIFLLCSFC\n>MGYP001140916756 FL=1\nMISLIFLVMEVGICYNKWEKIFYTNGGCIIMSEENFNTENGTNEQTCSQPQQAYSQPQQTYSQPQQTYSQPQQAYEQPQQNYDQQAYNQNQQYAQQNYGYDQSQQGYGTYQQPQQQAYGSFDQTQYGYNQPASSGKGMAIASMVLGIISIPAICFWIVGLPCAIVGLILGILYNKKNEHSPMATAGIVCSIITIALLVLVLILCIVGAVSLSSLEYSYYY\n>MGYP001587054973 FL=0\nMQPKPVTNRRSTAQEIFAGCADSARQPYMNTPLQLRPVHTLLCPWPXFPGRSSRPNGAFSPVRTESSPANRAGSRAGSHAESAPTFVLRGRVCGAXXLX\n>MGYP000208465860 FL=0\nSSDLQLVEYPVISAELIMMPQNMTEISDEETAGKVLKLIDVLEDHDDVQNVFANFSIDDELLEKINF\n>MGYP003351738706 
FL=0\nMKQSGGFIWVYSELGRGTTFKIYFPRVGQTVEPRTVETPRIILPADTGATILLVEDEDSLRRSIQQMLTKAGYPNGFSTELVTYVLPQWAASVQGYLKAVGIDAKISQLQVQALVQRCQGRGECPMDMGSWGSYSINDVSAVMPVFLGGGV\n>MGYP000525123928 FL=0\nMFDLFIKEVDKKLADKSLNNEITSKEYYAEKQKLKYLKPAKEYTNNLKYAKIEDMILDFKTKLEQLKFDTKLTTFEQKEFNIKDLEKNKKNNQTELEYQKEDIQKEKYDYEYHKIYQERDELSEEKLKEKIKELEDKEIEPPTEKEVDDMYNDLGYKYLGKEMSDRENYKLAETWKNLEKQDINEEHESMYMNYDELDNKITRYTFDNDLDNNEIKTYIGKRLGEDYGKNLDREKKELASKFAELEVSGRYRDIDINNPKLLLQLEKVDGLNIETLEETIGLDTKDLKKEIYIATYEEYLDENKGIMSPAKEYYTKDEKGEYIKIGESDKEETTITVDGFDFKLKNDEILKGEELEKVTQKEMVEELIKNEVEKSLGDGKRVTGISKVLDVNFLKELEKQCGYDKKDETLWDRVSLVSTINEKGEEDFQILEKYYDEDGNITYKDLEGISTLENSNRDIAIETEEIIYGKYKKVESTKTLKEYQTESGDRYAITRDEDGNLGFSEIYSEIHREDYHILEAKEIDTYSFETKWLTEGYDEFDINQSDIENAKEIFDRSKDEMEKTQENTKEDKGREL\n>MGYP001623022299 FL=1\nMEVDLEHLRKPCTCGRAHEISVRGIWIESGASGRLYEMLTEGELREFTAPVIVWDDNTSEAAEKILGDVSEICQEICLSAGNLRADSRSVEILEETLPEETDLILAVGGGTIHDLSRYVAAQRRIPFLSVPTAASMDGFLSTTADLSQDGMKKRVPARAPLYVFADTDIFSKAPYRLTAAGISDLLGKYICLADWRIAHAVTGEYICEEICSLEYKAVKDVVKRLDDIREGDAEACERLMYALLLSGLAMQMAGGPRPAFCAEHHLSCLWEMEVINESTDALHGEQVGVGLLLAEKYYRRIQKAIENGRCEIRRHEGLEKELLQTTFGSHGLYEAVMDENTPDPLDEVDPERLRRAFLEIAEILDDIPSRERLMDMMEEGGCRVSLSEIGLPESLEEESLALAPYVGRQMSLLRLGKLLVI\n>MGYP003326090123 FL=0\nVYKRQIVKTVEESFSNDFNVDKCLLKFYKNKDIEKIEKETGLSLHKGAIHCGSFSSEKADILFGDNKIESMVIAVIILEKEIGLLKLGSLDRAKYLGDEDTTFIQAHDYVDLDWYGNYDTWADFPDGNTTYRQILMHYDMRCSSSGCSGWDYTTKIIILKPNGEYNADGDPTFINAQTLANVVTPYGTYMQEGNSQGSGFSPNWVQRYTYDVTDFAHLLVDSVKMRAFYGGWSTGFNVTLNFEFIEGTPPRDVLDVQQLWSGSTS\n>MGYP001037461204 FL=0\nMTRMLAKRIIPCLDVTAGRVVKGVNFVELKDAGDPVEIGRASCRERVSDTV\n>MGYP001119331046 FL=0\nLEERIKAIMKRKHISITALVAVLVVMCVTTTVFASAAPEDREDPHQNAPETGYVYDHLGIVEDNGVSIMSKGGENGEKLYSADDGKTWMTEERYHAEYGSCYKGKLSAFESGGSPFPVGL\n>MGYP001570668198 FL=1\nMSLNKRLSWTLLTLFFIFDNFVSYYAVTYHGGREANLAIAWLVEKYPLLYFVCIPGQIVIIYFIVKWLTRFASEKVILTALVIYWPIANSSMNLTFILGHRQPAKNWLMFTAVGVLLAVVYALRNWKNKNHRKF\n>MGYP000837251816 FL=0\nGLGDVYKRQHFKAKREMEASHQLEKVGEGIRAMYSWNGDDKYAEK\n>MGYP003705394679 
FL=0\nTDLNKVVTLAENGNREAQIGIAHVFEQRGQSRENIMRAIAWFHLAHNTDEDHFSSGRERGSRITDEFKRIRVESELFTEGLRSELTGTNVGVAMAGRNCSAEQRA\n>MGYP000950492884 FL=0\nMSEMHATVEAVTARIVERSKRGRQAYLDLIAKQRDAGVNRPVLSCGNLAHGFAASGEDKASIRDGKAMNIGIISAYNDMLSAHQPYGRYPEQMKIFAREVGATAQVAGSTPAMCDGVTQGQQRDVLDAASQLNRMLDERVDDPEIANKVNEELRLQYRYLDLRRPEMIRNLRLRS\n>MGYP000774599694 FL=0\nMALEKISDKQKEILEFIKSEILNRGYPPSVRDICEGVHLKSTSSVHAHLETLERKGYIRRDPAKNRAIEIIDDSFGLQRREMVNVPLVGRVACLLYTSDAADDL\n>MGYP000900149593 FL=1\nMKIKINRFKNIHDGTIGKLTITDDGKKLFECFTLEPAGADTIERGKDRRIPAGLYNVEWYNSPSQRRICPLLWNELVPKSRYILIHTGNFPKDTAGCVLVGDGHNAAGVTNSLKTYNTLFKLAQKHGLQSVEIINGAGV\n>MGYP003625506155 FL=0\nMKEVKVKLTLDDKGAVVAAKNIQDSIKDIGDEAEKTGGKVGEVGKSASKSKKGFATMAKGLKSVGVALKAAGIGLVVALVAGLTEAFSRNKRIMDGVSIVLGTIQEVFTQVADALIATYDAVAQSSDNFDALGKVMGGILTLFINPFKISFFAIQLALQAAQLAWEDSFFGGGDEEKMAQLRLDIEDTKTSISEVADEMVEAGSTIVDNFAEAVTEVGKITDIASENLSKVSIKAANETAKAHKAATDAAIIAQAMAAKNIALFDRQAEQQRQIRDDANKSIKERQEANIKLGEILEKQEEALLKQAAAVEAGARAEFAKNNSIDNRAALIAAEAATAQVLADIEGKRSEQKSNTNTLL\n>MGYP003576697368 FL=0\nITTKLDLNALHAGIFTEGEVTENSAFYLSARGSIQQYLFGDKAKEDLEKEDGIRVQQVPQDSDYQFKYQYNLDDANSITLSANGATDLAEAEFLDLSTDVLEDPDMAGDARIKNNFQNAFISWRSQPDDSSQLNVQLGQYINKGDTFWGDKKYFFNIKTTDSYVTAQYEFLLAKDHSLTLGAEAHSTDY\n>MGYP000113647356 FL=0\nVTLWIVAEGRYEPQNFQWYAIRNDDLEWDWAVGASNYKDIRAERSAVQPGKMWEIESSVDILRQQVETPLRNGFFGASGGPGGGSVTAARSSASRRSLSARSASSLAWRSAASRCLRSASSLASRTSVSAVRWALTSVLRNVSSKSGMGAGGAPGGMGVCEGLRASISRASADQRAGRAGRTQPGIAVRLWRAEQNAALPAFTPPEI\n>MGYP003702691201 FL=1\nMLSRFGYKRFIKSYKYIIGKEAVILLQFYNKDIGHYSLLINTRSSLSDPFPSIFSDFPVVSEVGGGPTLIH\n>MGYP001051415245 FL=0\nEALAVYKELVDKGADFFKSQAMFDQARVLAKKGDTAGAKDLYKKILEKQATGPLHDEVQARLGAIGG\n>MGYP000892997868 FL=0\nLSYSLAQGDGINDAHNSLVEIIDNLGVVAQDADINFEADPVLRIFLEVSDGDLSYQQSFAIDVLNLDEIAPAITSGATATAIDENSGAAQVVYTATSDDSSDVSGGVSYSIKPGSGDGEAFSIDSSTGVVSLIGNPDFESKPSYAFTVVATDAAGNSTEQTVALSINNLDEIAPLITS\n>MGYP003509546382 
FL=0\nNTAEDARRAVAAVKFGPGNHRGLAAGTRPDNYGLAKSMEEFVERSNAETLVCVQLEHAAAISNVDEILAVDGVDVLFVGPSDLSQSMGFPGNPTAEPVRAAIEETLRKIAAAGRISGMPASTDSVVSVLKTGAKYIYTHLPRLIGAGAAQFRNAAASSK\n>MGYP002781630755 FL=0\nAYIRRGDGGFEEVMRIRVADVIKTVRVKATVIGSGSRARVLGVDLDITDQLLAQEKIEETAENLQAVLDGSP\n>MGYP000437988234 FL=0\nTTVASASSATGAGATGVALLEIYEVP\n>MGYP001158237079 FL=0\nMNRNLFTSESVTEGHPDKVCDQISDAILDDILTHDPNGRVACETLTTTGLVVISGEITSSYNPNYEQIIRDTIKKIGYDDPKSNFCSKTLKVLLYIDRQSSEIAQGVNENNNQEQGAGDQGLMFGYACLETPEFMPLPIQLSHRLTQRLSDVRKNKKLPWLRPDGKSQVTIEYDGYKPVSVSKVVIATQHEDLIEKFSSEEKEHSYIKEEVIKEVVLPVL\n>MGYP001046820937 FL=0\nMPEVLDGLRAAGVNDVPVIVGGIIPEADAARLLGWGVAAVFTPKAFSITDLRGDVVRLIRPAPRLAAAVCVWGLALLALSQPVADQVHLG\n>MGYP000228404273 FL=1\nMSLTMADLLFIWQLFILFEIVLFASYTFIMYIYSRKEEEFPINNNLPNVTLIIPMYNEEKVIREKIENTAHLDYPKDKLEVI\n>MGYP003201765208 FL=1\nMLTSGLGVDKNGVENTLYELLLGEADVKKTIVKDVVENLDLIPSNINLSGAEIELINMDDKEYILRKITEKLRRKYDYIIMDCPPSLNMLTINALTAATSVLVPIQCEYYALEGLSQLIHTIDLVKDRLNKKLVMEGVVFTMYDARTNLSLQVVENVKDNLEQNIYKTIIPRNVRLAEAPSYGQPINLYDSRSAGAEAYRLLAEEVINREDK\n>MGYP000603741297 FL=0\nMVPFQETPIEEPQQLALPRPQDVEQAPQEPGVEYGGILEALRDTGRQALASFPTLVAMANKPGIYDPGIYQDKEEYIEKVNDFRAEMLTDALKILEGKENEKQAYHDLFDLIKNGEWDKLDNWAGTFLGQTVPQLAMSYLTKGISGFVLESASSYQESVRKISEKKGISVEDVIREGHDKPALDFLIGTINASLELMGAKSVIKPGATGVRSIFRRIFQSAGTESGTEALQGNITKLG\n>MGYP004409704841 FL=0\nLKQVSKDFAQPARNTLCDVQWLMRNNVSLHGLLKQGSPSPALVTKLAKASPGCLMQRDGDGLLPLQFAAAYKSRFGDALVSTIREVTVRAVPGSVWPARSDEARGLRKGLRPVRTRVSGVIVAA\n>MGYP000111574240 FL=0\nHGMAEEHEPAVPALLRDWIPEVQDYRMLVFGAFLAAMMVVRPGESKPERLREIIDDINSQPKGPASAFSNMAQQLARDNIRVNSVAPGSILFEGNNLYAKDIDPVEVRYRIGMVFQKPNPFPKSIYENIAWGARIHGYTGNMDELVEQSLRGSALWDEVKDVLKKSAYEVSGGQQQRVALARALITQPKLILLDEPFAALDERSRFRMQDLLLDLKQGRHAPVHTLIDLTFVHEMAALEVRGDDLYIGAAVPVNRVALDPLVGTHAQALVEACNLIAGPQVRNTATLGGNVAHALPAA\n>MGYP001611773216 FL=0\nDDITKSLEAGAFWDAHLKEAFDQTPADGWAIDLGANIGFFSLYFAERFERVVAVEAHPDTARLLYQNVMVNGQGGKVLVITAAAYDRHTTLELATSKVHGWLEDERSFLDTDSVLHSAGFSFVEDPSQQHHLHEIRVPTVVLDEIIPESAPIRLLKVDVQGAALRALHGCDRILARC\n>MGYP000527795113 
FL=0\nMKTTQYKDQSAIKTIQYKDQSAIKTTQYKDQSAIKTTQYKDQSAIKTTLYKDQSAVKTTQYKVQSAIKTTCFWSLTSLFQCN\n>MGYP000852577756 FL=0\nMARNRAEEEVEQLHFLRVGEVFEPFVPWRRNEQGKQVYIKLTRAEEVSFLYVGSQLSVRAELQQALMRLVNDGWSVEGEVVVQFDGRSEPGTDPYVYREPLVIELGKGLLPLIDPQNGAPLISKFEQIREEVAREVGLVIPPARVVDNLQLDNQYLLRVKDSPIAMGEVFLDRLLALGSLELLGQVEGWTCQDPVHRMPAKWITEEH\n>MGYP001572973866 FL=0\nGLKKLGFNTGMSETPITPVIVGDAALAHQFSRDLFAEGVFAMSVGFPTVPVGKARIRTIVTATHSEEELSQALEILGSVGKKLGII\n>MGYP000527111928 FL=0\nGLKSIWIPWLWPVFNQIFLMVFLSIWLRRSKVTTGAEWITTRFGRTRDSNLSHGVVVVFALIMCLGYLAYGFIGLGKFVMIFIPWEIVQPYIPVHIPLEYVPHVYGIAFTLFAVFYAVLGGMSSIVWADVLQYIIMTISAILIGILAMKALAVETLNVPETWKSPFFGWNLDKLDWRGIIDEVNTKIASETKT\n>MGYP000292924687 FL=0\nMKKILYMTIGIVSVILGLIGVFVPGLPTTPFLLLSSWLFYKSSKSLHDRLHRSRLGKYIRHYEAREGVSWLSKLISIVCMWNMIRIFSNREFTCTDLIIGAGMYWNWKCVVYSAYSKEVKDELSKNILDSFLLFLDHYVYNFSGNNDHFADFFAFKPFCSFRGRFYCSFNFGIGGS\n>MGYP000084281174 FL=0\nEALGGPGDRHPDDGVADGHDGGTDVGREPRDALAPARVLGQPEEAHPLSILNDPGGRELAQEEGRLRRGDRGRAHAFRPDEPGDQREEGFDVSPANERLYGRVVRNYYRFVDGVIADYLAEVGENS\n>MGYP003569383907 FL=1\nMPTYTFRNEETNEEFTTLMSLNEREIFLKENPHIKQCLSTPAFGDAVRMGMHKIDRGFNDVLQKAKSAHLHSTIDTL\n>MGYP000625040987 FL=1\nMSKRHLHLGQTLTFTADPFVEGPGAARHDTQGALVVEDGVITQVGEAGALRQGEFASVTDHGQALLLPGFIDAHAHYPQTAMIASWGKRLIDWLNTYTFPEEMRFGDPDYAAEIAGRYLDLLLAQGTTTVCSYCTIHPTSVTAFFEAAEARGMRVLAGKTCMDRNAPEGLRDTAQSAYDDSKALLGRWHGQGRASYVITPRFSPTSTPDQLSALGALWAEHPDCLMQTHLSEQTDEIAWVKSLYPQARDYLDTYEAHGLLGANGLYGHAIHLEPREKDRLREVGAALIHCPTSNTFIGSGLFDMDGLTRAGHRVGLATDTGGGSSFSMLRSMAAAYEIAQLRGRALHPAELIWLATTGSARALRLDDRIGSLAPGMEADFIALDLASTTAIAQRSARANDLWEALFPTIMMGDDRAIASTYVAGRRVA\n>MGYP003399258141 FL=0\nAGSADILTAGIAIIAASDIIIAILFIVLSIKFL\n>MGYP000308143635 FL=0\nMKRIAWVDAARGFAIILVVFGHVLGGVMSRRRLDGEGLYRAIYNYIYLFHMPLFFMISGLFCIEAMRKSPINAFISRTESIASPYIFWDFFVRTAALPLIGAFMSNPPSDIGWHARLEQALTGEVSWFLWTLYVMQILLIPFARMPIWVLFLVSLAVILYLPNSHLGTINSVVDHLPFLLFG\n>MGYP000676410644 
FL=0\nMDGNISLENRLELCNSKLSEKEKMKKITAALCDMPLFKGLSEPQIQQALESFHAYTRCYDKGTYLLSCGQPPQFGLVIAGEVHIIKEDFWGHRSLLAQLGPGALFGESFSLSATPSLPVSVLAGTQVEALFFRAELFFQPSVVSACSISLVTNLLGILAEKNQLL\n>MGYP000176506859 FL=0\nMVVNKLLITSTILIATTLITYSCTEDTKSKDRLSLEQKTSVKSDAKKVCELVSNIKIAISEVSNAINEGANSSYVEALNAKAKALDVRIKEIQKRNAGNEEFMKLQQSCYEVMNK\n>MGYP001197552457 FL=1\nMSNFVQLGRYRHYKGKEYQVLGCARHTETEEEFVVYQALYGERRLWIRPKSMFLEHVQIGTKLIPRFILIERA\n>MGYP003478946207 FL=0\nMSPQSVNTRQATRQVRDVVFVDGVRTPFGKAGDKGIYHGTRADDLVVKCIRDLMRRNPSLPAERIDEVAIAATTQTGDQGLTIGRTAAMLAGLPQSVPGFAIDRMCAGAMTAVTTTAGSIAFGAYDVVIAGGVEHMGNHPMGAGADPNPRFLSERIVDPAALNMGNTAENLHDRF\n>MGYP001199610918 FL=1\nMQSIGTYLKQRRESLSLKQKDVANSVGVSSAYLNKVEKGDSIPAPAFLEKIARTLELDFIDLYLRSLEDRPLPDTLMHAMREYRSLRPLLAPGMPVERFRSFIRSMSPEQTHRILLMIESVVLMIHEAEDRGAGARAIREPVPGDGTGADRIPPE\n>MGYP003348169323 FL=0\nHQPLLHAKEKLASIINTTSGRGGKIIAPAFAVGRTQQLVLMIHELIHEGKIKEIPVFVDSPLAVNVTDAFRAQRHARKTGGHAKEKTGPALPAGEHGAHLGARQAGEVDHGVGGLAVVPGMNGRAHLERIGGIDRAHRIGEARRLHRIERRLRPVERQQPHIRPRPSRRRHRQHARLARADE\n>MGYP001430805213 FL=1\nMRIESREDLKTWASFKNISVYLDQKKILSNININIKHGENILILGPNGSGKSTFLKLLNRSIYPITKKDSSLKLFNKENINIWDVRKRIGFLFKEMEGRVNHGVKLYDLITSGFSGTFNSRYSKLLSEIEKVKVDNLINEWELNNIVNNEFLSLSDGEKRRALLARALVYEPDILILDEPFCNLDIKSSFILNQNLNRLIEQSINILYVTHNLESILPKTNRVILIKEGKIIKEGNPNEIINSKIISDLFKISINVVKQDGYWRSYPVSI\n>MGYP001428761037 FL=0\nMRIDGIQGVYVPSKKPPINPLKKAVGRIRDVIATPKKYTHKDRLREQWSNSGSSLSYREYATTHDHTIKTPASELVKRFK\n>MGYP001559191903 FL=0\nMLILMAYIYKKTIHGKQYYYLRVSKRVKGKIVVKDIAYLGNDASKLDYAMQKLPLLYKKDIRKAYRNIRKFVQEESFSVANKSPATIACAGAINPPETKEKIQYLKKSFKGMPYGAAF\n>MGYP003492916345 FL=0\nTMGKNAKFFPENIWKFELKKHELLIIMP\n>MGYP001589567138 FL=0\nVQDVEQIVARALAEFAAAPDPAALENSKARYLGKSGELTALLKSLGTLAPEARRSAGAAINTAKARLEQALEQRRAELANERMQARLAQEALDVTLPGRGRGRGGVHPISRTWARIEAIFGSIGFEVADGPEIETDWYNFTALNNPENHPARSMQDTFYVDLRDSGGLPLVLRTHTSPMQVRYARTHRPPIKVIAPGRTYRVDSDATHSPMFHQVEGLWIDEDVSFADLKGVFADFMRRFFESDDIEVRFRPSYFPFTEPSAEIDMKFDSGPLKGRWLEISGAGQVHPEVVRNFGLDPERCIGFAFGAGLERLTMLRYGIDDLRLFFDGDLRFLRQFA\n>MGYP001206066660 
FL=0\nMIVTLNKKVLIVIRVVKIFMTFLTSKAFNFN\n>MGYP001314004753 FL=0\nFHTPNYKYEVFGSFINSKNSVKETFGLANPTEFDQLSGRAKTYAGTANFYDASNLFIDRTWSITQFFRPGKRTIQLNDTTIVPDTNTSNIKSQWFHELRYRRHINRFTDSDTNTDLFPVRYVSLETHDSMFHAVLSNRIGKVIKSKSQLIKLWGLHEAIQVKQQYFHSSNLSHLRFGAEMSKTLLSVKHDFYAHISALGYYQGDIKALYGFNPELEKVDVRAEASITRRRPDYNDQFFGSNNYYWNQDLNQTQTSKLLLTIDNKKATQGIELAYFNINQFVYYDTSGFAQQFNESINHLRATAKLQLQLGSWFWQHRLTYQSTSSNVLALPDLSVKTRLYKEGYLFNKNMWARMGVDLQYFTPFTGTVYNPIVRQMTLSNTEIGGFP\n>MGYP001770970470 FL=1\nMIRSIKYGLLLLLPGMLFTAQAADRQDVKCHLITSKGEQIAFYRWDLDKQQLFMARLSGKSLKDARGKRYFIREARECVLLKEAFSSEKARKLDEMALR\n>MGYP000978871530 FL=1\nRAEPAELDAELARLILLSEQRRLAILAPLLTGLTLLVACFGVLANARGTLPNGFGWILCIASVACAYEWLAGLFVARLAQKGRQPARFRFYLNALVELGALAVMTLVLARTNNPVHAISGPASYSYFLFIILATLRLDFRICVFTGTVAAAAYTLTGLLHWNALEASFSE\n>MGYP003540537710 FL=0\nTPTAVTPAAPVITPTIVPNAPSVTGQAIVAASTTVTPPAAPKTVAEAYPTLISNDRGVTSLDKAFSLRKIASRFLGSVSPIETLVNALSSTKAMINFVGSTTTKHTLTPLAQVFYRETLPEIAGKLINTLNTRLSAALDGTNGKSALGDLFSNPTMSKKGELNIPQDMVRGRVFNITEMDA\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/nt_rna_2023_02_23_clust_seq_id_90_cov_80_rep_seq__subsampled_1000.fasta",
    "content": ">XM_032924760.2 PREDICTED: Daphnia magna juvenile hormone acid O-methyltransferase (LOC116918952), mRNA \nCAACAGTGTCTCAAAGAGTCCGTGACGACCGAGTGACCGATGCTTCAAGCAGAGCGGAGAGATGGAACTGCCTGAACTCTACGCTGGCGCGAGTCCGTTCCAAAAACGTGACGCTGTGCACGTACTTACGCAGTACCTTCCTCAGTTCGATTGGGCGGAGGGCGACTCCGTTTTGGACTTCGGTTGTGGTGATGGTGACCTGACTGAGTATTTGGCCCGTTGCATCCCCAGGTGTGCGTCGTTGACGGGCATAGATATTTCAAAGAAAATGATAGACTACGCCAGGTGCCATCACCAAGAGCATGATTTGCGCCTTGGATTTCAGCAAGTCGACATCATGAAATCTATTGACGCCAGAGATGTATTTCCAGATGGATTCGATAAGATATTTTCTTTCTATTGTCTCCACTGGATCAAAGACCATCAACGGCTAATGGAGCATATGTACGACATCCTCAAGCCAGGCGGGGATATCTTGTTGGTATTTTTGGCATCCAATCCTATTTTTACCATGTACGAACGCATGGCAGAACGGACGGAGTGGGCCGAATACATGAAGGATGTTGCTGATTATGTTCCTCATTACCAGTACGCTGCTCGACCAGCTGAAATGTTTTCTTCTATTTGTCGCTCAGTTGGTTTGCAGGTGGTCGAATGCACGGCCCAGGAAAGGAGCTTTTCGTTTCAGAATATCAATATTGTTAAGAATGCGGTGGCTGCTGTCAACCCGTTCCTTCGTCGGGTCCCTGTTCGACTGCGCGAGAGCTACCTTCTGGATTGTTTGATGGAATTGCAGAAATTAAAGGCACCATCTGCAGATGAAACAACTGTTGCAAGTTACCGTTTGATGATTGCGCACGTTCGCAAACCATAAGCGCAGGATGGCTGTTGAGACTTGTGGAGGGGGCAAAACCCGGAAGGCTCCCATAAGACAAGTGCTAAAATAGCAAAAAACAAAACAAAAAAAACAAAAAACAAAAAAACAAAAAAAAATTAGTTATCTCATAATCCGCATCAAGGTGAGGTAAGATGATGACGAATCTAATGGCAAACCGGTGCTGTTACTGTAAATAAGGTTTGGGTGGTTATGGGATGGTTACAGCCAATGGCTGCAGTGAGTGATTCCAGTGACAAAGAGAGCTTTAAAACATTAAAGAATAAAAAACAAAAACAAAAAAACATTGCGGTACAGTACGTGTTCGAAATGGAAATAATGATCTCGTTTTCGGGGTCCGAACGGTATGGATGGATTTTTCTAGATTTGCATAAAGGGCGGTCGATGCGGATTTGTAGTCACGCAGTAGTAAAAACCTCAATACTCCCGGTTCACTGAAATCAGCAAAAAACAAAAAGATTAGATGTACAATACGTACTCCGTGTAGTACGTAACATTTGGAATTTCAGATTAATACAAGTATGATCCACA\n>XM_052522147.1 PREDICTED: Oncorhynchus keta serine/threonine-protein kinase DCLK1-like (LOC118377397), transcript variant X16, mRNA 
\nTGAGAGAGGAGGGAGCATTCGCGAGGTGAGATGCTTGGTGCTTCCCTCGGAAGGCCTGCATGTCAATGAGGGACGGCCATCTGGAAATCACTGCTTAAGACACAGAAACCAGCTGCAGCTCTTGCAGCGCACACTTGCTCAATCACAGGGCAACAAAGGGACGGATGCTTTTTCTATCGCTCGGGCCATTATACTACACATATATGCACTGACACAGTCTGTTGGAGAGCTGCTATATGCAATTGCTAAAGAATTGACGCGGTTGACTGCATCAGACTTCAATTAAAGTTATGGAGCTGGAGCACTTTGACGAGCGGGAGAAAGCCCAGAGAAACACCCGCCGAGGCTCCAGGAACAACGGGCTGCCGAGCCCCACTCACAGTGCCCACTGTAGTCTGTACAGGACCCGGACACTGCAGTCCCTGGCCTCGGAGAAGAAAGCCAAGAAGGTCCGCTTTTACCGCAACGGAGACCGCTACTTCAAAGGGATTGTCTATGCCATTTCCCAGGACAGGTTTCGGTCTATAGACGCCCTGTTAGCCGATCTGACCCGCTCCCTGTCAGATAATGTGAACTTGCCCCAGGGGGTCCGGACCATCTACTCTATTGACGGGACCAAGAAGATATTGGGCATGGAGCAGCTGGAGGAAGGAGAGAGCTATGTGTGTGGCTCCATAGAGCCATACAGGAAGCTGGACTACACTAAGAATGTCAACCCCAACTGGTCAGTTGGGGTGAAGACAGCTGCCTCGGCACGTGGCCCATCCTCCCTGGGCAGTGCCAAGGCTGGGGCCCCAGAGACCAGGGAGAGTAAGGACTTCATCCGGCCCAAACTGGTCACCATCATCCGGAGCGGGGTGAAGCCTCGAAAGGCCGTCCGCATCCTCCTCAACAAAAAGACGGCCCACTCCTTCGAACAGGTCCTCTCTGACATCACAGATGCCATCAAGATGGACTCTGGGGTCGTCAAGAGACTATACACCGTGGATGGGAAGCTGGTGACATGCCTTCAGGACTTCTTTGGTGACGATGACATCTTTATGGCCTGTGGTCCAGAGAAGTTTCGCTACCAAGATGACTTCCTCTTAGATGAGAGTGAGTGTAGGGTGGTGAAGTCGACGTCATACGGTCGGATCTCCTCTCTGCTGGGACGCTACTCACCCAGAGGAGGAGGCTCACGCCGAAGCTCAGGTTCAGCCAATGGGACGGCAGGCAGTCAGCTGTCGACTCCTCGCTCAGGGAAGTCCCCCAGCCCCTCTCCCACCAGTCCTGCTAGTCTCCAACGACGCAGGGGGTCCCAACACAGTGGCTCGTCCCTGTCTCTAGCCTCCACCAAGGTGTGTAGCTCCATGGATGAGGGAGACGGAGCAGGTAGTGAAGCGGAGCTGAACCTGCTGAGTGATGAATGTCCCTCCATCCCTCCGTCCATCGCTGAGAGGTACAAGGTGGGGAGGACTTTAGGTGACGGTACCTTTGCTGTGGTTAAAGAATGTGTGGAGAGATGTACCGGCAGAGAATACGCCCTGAAGATCATCAACAAAGGCAAATGTAGGGGAAAGGAACACATGATCCAGAACGAGGTGTCCATCCTCCGTCGTGTCAAACACCCCAACATCGTTCTGCTGATCGAGGAAATGGACACCTACAGCGAGCTTTACCTGGTCATGGAGCTGGTCAAGGGGGGTGACCTGTTTGATGCCATCACTTCCTCTAGTAAATACACAGAGAGAGATGCTAGTGGGATGCTGTATAACCTGGCCAGTGCCATCAAGTACCTGCACAGCCTCAACATCGTGCACAGAGACATCAAACCTGAGAACCTGCTGGTGTATGAACATCAGGATGGTAGTAAGTCTCTGAAGCTGGGAGACTTTGGCTTGGCTAGCCTGGTGGATGGACTCCTCTACCTGGTCTGTGGCACCCCCACCTATGTAGCACCTGAGATCATCGCTGAGACAGGGTACGGGCTGAAGGTCGATATCTGGGCAGCTGGAGTAA
TCACATACATCCTGCTGTGTGGCTTCCCTCCCTTCAGTGGGAACAGTGAGGACCAGGAGATTTTGCTGGACCAGATTCTAACGGGACAACTAGACTTCCCTTCCCCGTCCTGGGACAACGTGTCTGTCACTGCTAAGGAGCTGATTACTGGGATGCTGCAGGTGAAGGTGGAACAGAGATACACAGCTCTGCAGGTTCTGGATCACCCCTGGGTCAATGATGATGGGCGATTAGTGAACGACCAGCAGCTCTCTGTGGCTGGGAAGATTAAGAAACACTTCAACACGGGTCCTAAAGCCTGCAGCACCACTGCTGGAGTGTCTGTTATCACAACCACCCCTCTTGATAAGGAGCGGCAGGATTTCAGACTAAGACACCAGCAGGATGTGAGATTGAAGCCCCGCCCCTGCCCCCAACCAACCGGCTTCCCCACCAGTGCCAGCCAAAGCTCAGCCCACAGCTCCAATAACCCTGCCCTCTCTCCCGCTGACTTTACCTCAGAGTCAGAAGATTACTCCCCCAGCCCCTCCCCCACCTCTCCTAGCTCCGCTGATACCGTCCGCTCCCCCACCTCCCCCTTCTAGACCCCGAAGGAAGAGAGAGGGGAGAGGAGGAAGGATAGGGGGTGCGTGTCCCTGTACTAACACTAGCCCATGTCCCTGTATTCACGACGACACTGTCAAGATGCCTGCCAATTACTTAAACATTGATTTTCCATTCCGGCTACAGTGTCAGTTTACCAAAAGATACACTGGGGTCAGAGCCATGCATAGGGGTCAGTTAGGGTGGGGTTAGGGTTAAAGGTTAGAGGTTAGGGTCAAGGATAAAGGTGTATTCTGGATGGGTTCTGCTCTGGCCCTGAGAGGTTACTAAGGCTGAGAATCTGTATCTGCTTATCTTTTTAAGACACCACACAGACATACAAGAGTTAAGCCTTATTTCAGCAAATACTGAATAATGATCCACTGAGGTCCCCTGGTGTTGGGAGGTGAGTACTGCAGGCCAACCAACCTGCTAACAGGACAGCTTAAACTGCAACACAACTAACCTACAGATCAAAATCTTCCATTTAACTTGACGGGACCTCATACGCCCTAAATAGGGCATCTTAAGTATTTATGTGATTATACATACATTTTGAAAATAATAATGATGATAATAATAATGACGTTGGGTCCTTGAAAAGTGCTGTATAAACAAAATGCCGCGTATTATTATTCATTTTGACAATGTATGTATCAAGTCAGGTATCTATTTGTGTGAAGTTATATTGCACCCAATTCATTACAACTTGTACAGTTCATTCTGTAGAAAAACACTTTCATGTCAATAAGACATGCTGTATGATGTAACGTGAAGATATAATCTACGTGTGTCTGGAAGGACACGTGGCTACGGTCATGTCCACTCCAGTCCACTTTCATTTATCCAACTGTCTAGTGTTCAGCTATTCTCCAGTTCTTGGTGCTGTTGTAGACATAATATACTACACACTTTACAGAGGACCAGAGAGGGGCGCTGGAAGATCTCCAGGCATTCTGCGATACCATATCTATTGGTTGATTGATTGTGTTTTTGTCCATGACTGTTATGCCACTGTGCCAGTTCATGTACAGTCGTCATTTAATGGACTACGAAAAAGGTTGTGTATTTGGTAGAGTATTAACAGACATTTTCATGGCTTTTTACTTTTGTACAAAATTGGCCTTGTTTCAGTTAATATGTTAATATGTTGATAGTGAAATAATGACCTATTTAAAGTACGATTATTGGCCTGAACACAATGGACCAAGTGCAATTAGGTTCTGGATCTCTTACCAATATTAGACAGCACAGACTTTTTCAAGCTATTGTTAACTATAAACAATCCATACATTGTGAATGTATGTCAGAACAGAGGTGCTATGGCAGCGTCTTTCAGTGCTGCCTGAGTTTTCCGCTTGCTGTGTGTGAGCCAGGGGTTGGAACCGGTTCAGTGAACAGAACTGAAAACTGGAAAA
TCATGTAGTTCAAAACAAGATGCCCAGCACTTCAAGCCTCCTCCTCCACCCTCTCTTCCCACCCACAACATTTTAGTCACATCTCACTCCCTACAATTGTCTGTCCAATGCATGTAAACAACTACAGCTTGCCCACTCCATAGCAAGCTACTATATCCGCACTGATTGGTAAAGTAATTTAATGTTGAGTTCAATGTTTTTTAGAAACTATGATTGCAGAGGTTTAAAAAGGAACAGAAAGGAACAATATAAACTGCTACTAATTTGGGGAATCAATCCGGTTCAGAACTTTATTTTGCTGGTCAGAACAATGGAACTGAACAAAAAAAATGGTTTTGTTAAAAACGATGCGATTGGAAAATACTTTTGCTTCCAACCCCTGGTGTAAGCACAGTGAGTTGGCAGGTCTAGAGAGAGAAGCACAGTGAGTTGGCAGGTCTAGAGAGAGAAGCACAGTGAGTTGGCAGGTCTAGAGAGAGAGAGAAGCACAGTGAGTTGGCAGGTCTAGAGAGAGAGAGAAGAACAGTGAGTTGACAGGTCTAGGGAGAGAAGAACAGTAATTCAGACAGGTCTAGAGAGAGAAACACAGTAATTCAGACAGGTCTAGAGAGAGAAACACAGTAATTCAGACAGGTCTAGGGAGAGAAGAACAGTAATTCAGACAGGTCTAGAGAGAGAAACACAGTAATTCAGACAGGTCTAGGGAGAGAAGAACAGTAATTCAGACAGGTCTAGAGAGAGAAACACAGTAATTCAGACAGGTCTAGGGAGAGAAGAACAGTAATTCAGACAGGTCTAGAGAGAGAAACACAGTAATTCAGACAGGTCTAGAGAGAGAAACACAGTAATTCAGACAGGTCTAGGGAGAGAAGAACAGTAATTCAGACAGGTCTAGAGAGAGAAACACAGTAATTCAGACAGGTCTAGGGAGAGAAGAACAGTAATTCAGACAGGTCTAGAGAGAGAAACACAGTAATTCAGACAGGTCTAGGGAGAGAAGAACAGTAATTCAGACAGGTCTAGAGAGAGAAGCAAAAAGCACAAGAGAAGCATGAGATGATTGATGTGTGGAACACTTGTTTGTCCTCTAGGACAGACAAACAACTATGTTAGTACTGAATTTTAATCATAGAAACAGAGGAAGTGAAGTGTATCTATCTGCTGAATGTAATTGTCCAAATTTCTGTTGTGAGAGAATGAAAAAGTACAGATTGAAATTATGTTGCTATGCAAAATATGTATTGATACCCAATGATATGTAAGAATTAGTGACTACATGTGAAGCCAATTTGATCGGGATTCATCACCAGTAGCACATCTTTTTTCCTGATGATGGTAGTGAATGGTCATTGTTCCTGTATAGCAACCCTTTAACAGTGGTCATCACCAAGCCAAACCTGTGAATAAACCACTTCCTCAATCTGAGAGCCTGGTCATTGTACTGCGTCCGTCCAGGGGGACTACAGTCGGACAATCTGGGATTTACAAACAGCAGCCACAGACGCAGCAATAACATCATCCAGCCAGTAGATGGCAGTATAGGATAATCTGTACCAGATCTAGAAGGTAGTAAGTAATAAGACAACAAACACATGCATTTTGAGTTTCCACTATTGAGATACCTTTTAAGTGCATGGGGTTATATTCCATTTTTTGTTGTTTAAGATATGAGTAATATACATATAGATATTCTATTGGGGCGGCAGGTAGCCCAGTGGTTAGCGCGTTGGACTAGTAACCGGAAGGTTGCAAGCTCGAATCCTTGAGCTGACAAGGTTGTTCTGCCCCTGAACAAGGCAGTTAACCCACTGTTCCTAACTGACTTGCCTGGTTATAATTCTATATGTCAGAATATTCGAAAAACAAACTACTAGTTTTGTTCAAACTGCAATTAACATTTGAGAATTCAGTCGCATAAGAGCTTGCTTTATTTATTGTTATTATAAACACAACAAAAAGGAAAACAATAAAAAATGTTACTGTTCATCAATCTTTATATA
TTGTCATAAGTTAATGTATAACAGCTCCAAACAAACACAGGGTAAATGCCTCAGACATTGCAATCTACACAAAAAAACAACATGTAAATACAAATAACTTGTGAAATCATGATATACTTAAATCTATACTTAAATCAACAAAAATACAGATCAACTAAATATTTTACAAAAAAATCTAAATTTGTTTTTTAAAGCAACAATGTCAACACAAATAAAATGCATTTATTTAGCAAAATCCTCCAAAATCCTCCTTACACAAAGATTTAAGTCAAATATTCAAAATAAACCCAGTATGTCAAATTCATATTGATGGGTATTATGAACCAAAGCAGTAAAGTCA\n>XM_051681377.1 PREDICTED: Myxocyprinus asiaticus CDC-like kinase 4b (LOC127431112), transcript variant X2, mRNA \nGCCAAATGGAGCAGGTCAAAGAGACCGAGAGGGAGAAGAATGGTTACCACTACAGCAAGTCATCCGGACGCAGTGGGAGGAGTCGGCACAGCAGTAGAGAACGCCAGCGATCACGCCATCACAGCCCCTGCTCAGACTCGATGAGATTGTAGGCACCCTGGGCGAAGGAGCCTTTGGAAAAGTGGTGGAGTGCCTTGACCGTTCAAAAGGTGGTGCAAGAGTGGCCCTGAAGATCATCAAAAATATTGAGCGCTATCGGGAGGCAGCCATGACAGAAGTAGATGTGCTTGAGCGGATAAACTCGCTTGATGGCGATAAGAAATTTGCCTGTGTTCGGATGCTGGATTGGTTTGATCACCATGGTCACATCTGCATAGTATTTGAGCTGCTGGGACTGAGCACATATGACTTTCTTAAAGAGAATGGATTCATGCCCTTCTCAGTGGACCAGATCAGATGCATGGCAGATCAGATCTTTAAAGCTATACGCTTTCTGCATCAAAATAAACTGACGCACACTGACCTTAAGCCTGAAAATATTCTCTTTGTGGACTCCACGTATGACATGGATTATAACTCCAAGATGAAACGAGATGAGAGGACCTTGAAGAGGTTGGATGTCAAAGTGGTAGACTTTGGTAATGCTACATATGACCACGAGCATCACACCTCTGTGGTGTCAACTCGCCACTACAGAGCCCCCGAAGTTATTTTAGAACTGGGCTGGAACCAGTCATGTGATGTGTGGAGTTTGGGCTGTATTCTGATTGAGTTCTATCTAGGATTAACATTGTTTCAGACTCATGACAGTAAGGAGCATCTTGCCATGATGGAGAGGGTTCTAGGCCCCATTCCTACTCACTTACTCCAGAAAACCAGGAAGCGACGCTATGTGCATCATGATAAACTGGACTGGGATGAACTCAGCTCGGCTGGGAGATACGTGAGGAAACACTGTAAACCTCTAAGGCAATACATGTCCTCTAAAACCCCAGAGCACGAGCTGTTGTTTGACCTGCTTCAGAAGATGATGGAGTATGACTCATCGAAACGGATCACCCTGGAACAAGCCATCGGACATCCTTTCTTCAACCCATTACGAAAAGTTAGGAGAAATTGACTTTGAAGGGGACACTTGAACATTAATGCTCCCGGGGAGACCTGCTGCTGACTGTATCAGTCAGCTTAAAGACTGCCTACTTTACATCCTCTGTCTGTTTTTATTGTCTGTTTGAATATATGGGCCAAATTCCTGTGTATTTTCGGCAAAATAAACTTGAATGCTTTGTATGCA\n>XM_039837429.1 PREDICTED: Pteropus giganteus SEC22 homolog C, vesicle trafficking protein (SEC22C), transcript variant X2, mRNA 
\nCCTCGGCTTGTCAGTCCTGTCCGCTACCCTGGCAGGAATCGAGCTTACACCGCGAAGCCTCCTCGCATCTCCAGACGTGGGAATTACAGGCCTGGACCTCAAACCCAAGCGTGTGTCCTCATGACTTCTCTTGCGGACCATGTCCATGATCCTCTTTGCCTGTGTGGTAAGGGTGAGGGACGGACTGCCCTTCTCGGCCTCCACTGACTTTTACCACACCCAAGATTTTCTGGAATGCAGGAGACGGCTCAAGACTTTAGCCTCGCGACTGGCCCAGTATCCAGGTCGCGGTTCTGCACAAGGATGTGACTTCAGTATACATTTTTCTTCTTCGGGGGATGTGGCCTGCATGGCTATCTGCTCCCGCCAGTGTCCAGCAGCCATGGCCTTCTGCTTCCTGGAGACCTTGTGGTGGGAATTCACAGCTTCCTATGACACCACCTGCATTGGCCTCGCCTCCAGGCCGTATGCCTTCCTTGAATTTGACAGCATCATTCAGAAAGTGAAGTGGCATTTTAACTATGTAAGTTCCACTCAGATGAAGAGCAGCTTAGAAAAAATTCAGGAGGAGCTCAAGTTCCAGCCTCCCACTGTTCTCACTCTGGAGGACACAGATGTGGCAAACGGGGTGATGAATGGTCACACGCAGATGCTCCTGGAGCCTGCTCCTACCTTCCGAATGGAACCAGTGACAGCCCTGGGTGTCCTGTCCCTTATTCTCAACATCATGTGTGCTGCTCTGAATCTCATTCGTGGAATTCACCTTGCAGAACATTCTTTACAGGTTGCCCATGAGGAAATCGGAAATATTCTGGCTTTTCTTATTCCTTTTGTAGCCTGCATTTTCCAGTGTTATTTGTACCTGTTCTACAGTCCAGCCAGGACTACGAAGGTGGTGCTGATGCTGCTCTTCATTTGCCTGGGCAACGTGTACCTGCACGGGCTGCGGAACCTCTGGCAGATCCTTTTCCACATCGGAGTGGCTTTCCTGTCTTCACATCAGATACTGACGAGGCAGCTTCAGGAGAAGCAGTCCGACTGTGGAGTGTGAGGGTGACAGTGTGCGAGGAATGGATCCTTTGATTTTCTTAGAGGGTCAGCCGTGTGTCCCTTTCGGCTTCTCGACTTCACCTCAAGTTTCCATTCTTGAAGTTCATCTTGACCAAACCCGACTGATACCGAGACTTGGGGACTTTGAACGGGTGCAGTTGAGGGTACGAGGTCGCTTGACACCCAGCCCCGGTTTTGTGCTGAGTATAAATTCCTGTGAGACCTCCAGTTCGGCACGTTTACTTAGGACAGCAGACGCTGGGGGCTCATTCAGAGAGAGCATTATTACAAGATCAGAATGGAATTATTTTGGTCTTTCAAATTGAATGATGTAATAAACCACTAGGCTCAGTAATACTAGTTTATGTTATTGGCAGTTGTCTCCAGGGAGCTACCTTAAAATCCATATCAGCTTTTCAGTATAAGTGTGACTTGGTTAGCTTTTATAGTGGGTCAGTACAGGTGCATTAAAAACTTAAAAACATGGTTCATAAATGTAAGCAAGGTAAATTCTGTTTACATATTTGATAACAGGTTCAATACAATACCTTTAGAATATTTAAATATATTTTGGATATAAATTGAACTTGGTTTAGGGTAAGGACAGACAAAGAAAATGGTTTAAAAGCTGAGTTTAATTTGTACATAACCTTTTGTGGTGGGACTGTGTGGGCACAGAAATATTTTGTATTTATTTGCAGGGTATATCTGAATATTTTAAAAGTTGAATAACCAGTGCTACTGGATCGTAAGCTTTTAAGCATGAACAGAAATGAGACTATCAGGATTCTTTGCGGTGGGCCACAAACTGGAGTAGGTGAGTCACGTGGATTCACACAGCGGCACTTTTCAGACGTAGGTGGGAGCGGCCGCCGTCATCAGCCTTGTACAAGGTAGTCGAGTGCCTGCCATTTTAATGATGGTGAATGCTTGACCCGTGTACCTGTT
CCCAGAACACCTCCCAAATTAATTACTCCTCTACACCATTCTCAATCCTCTTAATTAGATCAAGGGCTTCATTTTTTATGAATAAGAGTTAAGTAGATATTAACTTTTTAAAAGCTTTATGAAGATATAATTAGCCCTCTGAAAAGTTCCTTTTGTTTTTTCTCAACTATGATTGATCATAGTTTTCCAAAACGTAGACCCGAATCAGGTCCCTTAGCTCTCTGGACATTGCAGCCTGGGCTGTCCGGCACCACTTAGGAGGCCTTTTTGGGAGCCTGCCCTTAGGTTGTTCCTGGTATAAGTCTGGAATATGAATGGCTCAACCACAATTGCATGGAATACTTGGGGTTGAATTATGTAGTCTTGAAAATTCAACACATCCTATTTCGATAGTTCTTCAAAGTTGAAAACCATTGATTGCAAGAGTTACTGAGCACATGAGGGAAGCAAGGAGGTTTTTCAGGGAATTCCGTTAGACGTGGTTGTTACCAGTGGTGTATCGTTGCTGAGCTACCTTGATATCGTTTTAAGAAAAACAAGTTTACGTAACTGGAAACCGTTGGGGGAAATGTTGCCAAAGTCATTTTATTTTCTTATAATAGAATTTTCTATTTTTCATCAAATAAAATATCTGGGTATGAAAGTTCTGTTGGCAACACCGTCAGATGGAAACTTCAGAGCTGTTTCTCTGTCGACTACGTCTACATGATTTTCTGCATACCCAGCAGGTGAATGTTCAGGCTTTCCGGGAGATAATTTTGAAGAGACAGTAAAATGGAACGGGAAGACAAGGAGGAGAAAAAAATTCCTTTTTTGTGATAGAAGCACAAAAAGCTTGAAAAGTTGGTAAGAACAGCTTACCAATGAATTGTTTTCTTTTTGAGCCCCTGTGCCATTGGTGTTGCCATGTAGCCCTGTACCCCAGAAGCTCTGGGGGTCTGGGCCTGTGACCCACATTCAGCAAGCAGTACAGAACAATCCTTGAGGAGGACTCCCTCCTAGTGAAGGCTTTCTACCCTAGCAGAGATGTTATCCTCACTGGGTTGAATGTGGTCTTAATCCGTTAACATCTGCTTGGAGGTTGAGATTAATTTTGCAAACAGGAAGGAAAAGATGCACTGGGTGAGCAGCACCAAATAATGGCCACGAAAACATAGTGTGACTAAAACCCAGCTAAAACTCAGCTCACTGTGGGGAGAAACTAGTGATGGGAAAGAATTTCTGAAGATTTTGTCCAAAGGAAGTCCCAGGCTCAGGGTTGGCTTGGTCCAGGCCTGGAGTTTCGTGGCCCCCGTGTCATCCTGGGTGCCAGAAAGCGGGCTCCACATCGCAGTGGTTATCCTCACCCCACCATGACTCAGTGCCGCTCCAGCACCTTTTGTTTTCCCAGTGGTTAAATGCCGCCTGCCTGGCCCACCTCACAGGGCTAGATCTGGGAATAGATGAAATCACGTTGAACACAAAACCTTAAAAGTGCCTTCTGGTACCAGATGCTGCAAGGTCTGGAGCATCAGAGTGTGTTACATCTCGACTACTATATTGGGGTGGGAGTGTGGCTCTGTTCGCAGGCTTTGCCCCTTTCTCAAGCATAACTAGTGAAGGACAGCTGTAGACTTTGGTTTTCTTCTCCCCGGGCTAGCCTAACTGTGATAGGACCATTTCTGGGTTTCTGTTTCCTGTGTGGGGACAGTCAGGGCATATTTGGGGTGGTATCTGCCTCGGTGCTAGGAGCCCCCACTGCCCGCAGCAAGAGGAGTACGACCACAGCCTCCCGGCGTTGCTTTCCAGCCTCGCACCCCTGTTACCTGTGAGCTCTGTTGATGGACAGTGTGAATCGAGGCCCAACATTTTAAAGTTCTTTAAGAGGTGGGAAAAGGGCGTCGGGACGAGTGCTGAAATGAAAATGTGTAATCATCGTTTCTACCCACCTCACTTTGAGCTCCCTGTTCTTTTCCTAGGTGCCCCTGTTCTCCAGGTCCCCCCGCCCCCACTGCTTCCCA
CCTCTGCCCCCCACACTCCAGCCCTGGGGACAGAGGCTGGAACCGGAGTCTCTGAAAGGGAGGGAAAGCCACCTTTAATTGTATCAGTAGGGTGGGTGCAGGAGCTTCCGAGGAGAGCAGAAGGTGCACTGTGCACCCTGGGGAGCTCAGCACATACTGGGAGTTGGGTCTCGGAGGGAAGTAGCACTGCTTAGAGTCAAAGACAATAGCCAGCAAGGTGGGCTGTTTGGGGTGCTGGAAGCAGGGGGGTAGGTGGGAAGCAGAGCTGGAAGACAGCAGCCTCCCCTTGGTGTGTGGGAGCTGCCGCTTGCTGTTCCTCCAAAGAGTCAGCCACTCATTGTAACAATCAGGACAGGTGGCCCTCAGAGAATCTGCTGCTTGCACTGTGTAACACAGGTGAGGGCCAGTGGATGGGAGTGTTCACGGGGACCGGATGTGGGCCCCTGCCCTGACCGGATGTGGGCCCCTGCCCTGATGCTCCCGGTCCGATAGTTCCTACGGGGAATCCTGCCTGAGGACAGGGAGGCGCCACCTGAGTGCTGTGAATGTTCACGGTGGTGGAAGAAGAGAGAGCAGACGTGCCCTTGAGAGAGGAGGCTGGGGAAGGAGTGTACTGGTCAGCTGGCTGGAAGCCTGGCTTGGCTCTGACATTCGGTCTTGCACCACAGTGGCCAAGTCACTGCCCTTCGGCCCCAGTGTTCCCATCTGGGAAATGGTGATAACATCCGCCTGTCCCCTGCTGTCACGAGGATAAAAGCCTAGTGGAGGGGAATACTGGGTGAACCCATTGTGTGTGTGCAGGCGGGAGGCTTTGAGTTCACCTGCCACACGGAGGTGTCTTCTGGCCTTTACACAGAAAAAGACACCGCAGTGTAAATGGCTGTATTCTTTCCCTCCAGAAAGGAAGCGGACTCTTCCCCTTCCCCTGACCCTGCCTCCTTCCTCCAGGCACAGAGCCCCTTGGTACCGCTGGCTGGGGTCCTCCAGGGTCCAAGGAGGCCAGTTCTGCTGGTTGTGTTTGAGGCTTGTCCTGGGGAACCAGGGGCTGAACCTCAAGGTTTGTCCCTGACCCAGATGAGGAAAGCTCTGCTTCTCCCATCGGGGAGCAGTGATGTCAAACGTCTGTTGCTGGGGAAATGTCATTGGCAGGGGACCTGTGGAAAGGGCTTGTTGGTAAAATCTGGGAATGGCCGGATATGGAAACATCTGGCTGTGTGTACCGATGGCAGAGCCGTTGCCCACAAGCGCCCTTTATTTAGGGTGAAATTATCAAGTCCATTCTGTTCCTCTAATCTGTACTTGGTACATATGACCTTCTCGAACGCTTATCCGTGTATGGTTCTGGGGTTGCTTCAGAAGTAGTATTTAATGAGTTGTTTATATGACCCCAAGATTCTATTTTGTTTAATGAACTTTTCTACTGAGAGCGTAAAAGACTGAGTCTGATTTAGCCAGGGCAAAACCATTCATTTCATATATTCATTTTGAATGCTTGCTGTCCGTGTTATACAAGCTTCTTAACTGTTTTCATGTAATAACAAAGATCTATTTTGAATAAACGATGGGTACGTTTTAACAAACTTCCACACAGTAGTAAAGCCTAACCTTGTGTTAACGTATGTGCAGAATGTTGCATAGCCATTTATATACTGTGTATATGTAAATTAAATGGGGTGGCTTCAGAAGTGAGAAGAGAATAAATCTAAGGTGCTTCTTAACGA\n>XM_028554974.1 PREDICTED: Dendronephthya gigantea vegetative cell wall protein gp1-like (LOC114533457), mRNA 
\nTTACTGAATACAGTACAATGATTTTTAGTTTAAATTACAAAGTCAGAGGGGCTGAAGCACCATGTTACGCCTATGCTCTGTTCTTTCGATATTTTCCATCATCTTATCAAATTGTGGAGAAGTACACACAAAAAAAGAAGCAGACAAACTTACTTTGTTAATGAAAACAAAATGCAAGCAATGTACTCATATTTTCATATGTCCTATGATATGCGGTAAAAATAGCACTAAGCCAACCATTAAACCCCCACCCACCAAGCTACCTCCAACCTCTACACCGATCTTTCCACCAACGCCACGTCCGCCGACACTACCACCCCTTCCTCCAGTAACCCCTGCTCCACCGATCATACCGCCATCTCCATCCCCTCCAACCAAACCTTCCCCACTGCCGCCAGCAACCCCTGCTCCACCGATCATACCGCCATCTCCACCCCCTCCAACCAAACCTTCCCCACTGCCGCCAGCAACCCCTGCACCACCGATCATACCATCTCCACCCCCTCCAACCAAACCTTCCCCACCACAGCCAGCAACCCCTGCACCACCCATCATACCATCTCCAGCCCCTCCAACCAAACCTTCCCCACTACCGCCAGCAACCCCTGCACCACCGATCATACCATCCTCACCGCCACCCACAACCCCTACTAGTCCTTCTGGTGGTCAAGAAAAAATCCGACCACCCTCACCAGTGACCCAAGCCCCACCAGTTATTGTTCCCACATCTGCCCCAGTCCCACCACCATCGCCATCCATTCCTGGAGAATTATCATGTCTAGTACGTCTTGAGAAGAAAGGATGTTTTAAAGACGATCAAATTCCTCCACGTCCTCTTCCAAACTACATCTTAACTGATCGCGACAATACTTTATCGATTTACAGTGGCAAAGGAATTGACTGGGGAAATTGGGTGAACTATCTTCCTGATTTCGTGTGCCGTTGTGCCCAACTTACTAAGTCTAAAAATTTTAAATACTTCGGAATACAATATTATGGTGAATGTTGGTCAGGTCCTTCAGGAGACGAAAATTCTTTCAAAGAAGATGGAGTTTCAACAGAATGCGTCAACACGAACTGGAAGACATGTTCTGATCAATCAAAATTAGCTTGTGCTGGAAAGGAGAAAAATAACTATGTTTACGCAATTGTTTAATGTATTTTGTAGTAGTTTGAAATGATCTGTAACCTAGTCTGGGAGGAATATAAATAGGAAATAGCCTAAAGTGTTATTGCATGCATTCACCGCTAGATCATAATGTTATTGTTAGATCATAATGTTACTGTTAGATCATAATGTTACTGTTAGATCATAATGTTACTGTTAGATCATAATGTTACTGTTAGATCATAATGTTACTGTTAGGTCATAATGTTACTGTTAGATCATAATGTTACTGTTAGATCATAATGTTACTGTTAGATTATAATGTTACTGTTAGATCATAATGTTACTGTCAGCGTTAACCTATAGTTAACATGGCTCCAGTTTCGGCTGACCGTTGATAAATAGAAACGAAAATGTCAGCAAAAAGGAAATGAAATTTATTATAAAAATTATTAAAATTTCTCCTGCTGCATGGGCATATATATGCTTCACTAAAGTTTTACATTACCCCATGCTGAACTTCGACATAATTTAATTTGTTCGAAATGCCTTTTTCAAACAAATCTATCCCCTTTCATGAAAAAGTTCCAATTCCATCTCAAAACATTTACATATCCGGGGGCATAAAATATTCCTTACCGCTACATGGCTGGTTTGGGGTTGGTTTATTACTGTTTCCTTGGCACAGTTTATAGACAAACAGTCGGACTGCAGTGTGGAGAGTACTACTTAGCTATATACGGTGCCGTTTATAAGTAACACGTATCAGGCCGAACGAAAATTTTACAAAATATACTGATAACAGTGAGTCAAATCCAACGGGGGTGGAAGTCAATTTGATACCTCCTCACCTCGTCCTTTCATATCTATAAACTGTGCCAGGGAAACAG
GAATAAACCAGCCGTAAACTAGATAAAATGAAAATATTTGTTCCGTTGCACGAATAAAAACATTCAATACAGCAAATACACAAAAATAGAGCTAATGCGTTTACCGTAAACGTCGAATTCGTACTATTAATGTA\n>XM_039788533.1 PREDICTED: Perca fluviatilis E3 ubiquitin-protein ligase MARCHF7-like (LOC120551252), mRNA \nGCAACAGGGCGCTGAAAACCTCATTAGGCGCTGAATACAGATCAAAAGTGGTAGATACAGAAGTGAAACGACAGATTCCAGGCATGCAGGCTTTTTCGACACTGTTGCAGCGCATGTCTGCAAGGAAGGCCTCAAAGCAGCCGTCCCCCTGCAGCGCTGGGAAAAGTGCTTTGTCTGAACCAGAGAGCCAATTGAATAAAGATTCGGAGTCCTGCCTTCAGGCTATCTCCAGTGGAACCCGGAGCATGTCTGCAGAGCTGGCAATGACTTCAAAGATTCCCCACAGAGAAAAGGCGCCCCTGGCATCCAGATTACTCCCCGCAAAGGATCACAACGATCACAGGTCTGAGCGTGTGAAACACAAAGGATTAAAAGGATCCACCCAAGCGAGCAAGCAAACACAAAGCCGGGACGTCCTGAAGAGCAACAGCAAGATGAAACACCTTTTCAACAAAACAAACGTTGAGGATGTCATACACCCCAAAGCTGAGACTACGTTTGCCTTCCCAGCAAGTACTGACACTGTCCCGCATGTTCCCACACGTGATACAGGCTCACTGTACAGTGAATCTGAAGAAGAGGAGGAGGCAGATAATGACCCATCAAGCTCACTGTACAGTGAATCTGAAGAAGAGGAGGAGGCAGATAATGACCCATCAAGCTCACTGTACAGTGAATCTGAAGAAGAGGAGAAGGCAGATAATGACCCATCAAGCTCACTGTACAGTGAATCTGAAGAAGAGGAAGAGGCAGATAATGACCCATCAGGCTCCTGTCAGGGCACATTTAGAGAGGCCACCTATCCATGGCAAGTTTCTCGGTCAAGCTCAGCCTTCCGTTGCTTCTCTCACAGTTCACACCTAAGTACATCAACAGTTTCACCTGTTGGTCGTCATGGATACGGTCCTGGTCCTTTCCTGGAGCGAACAAGGCGACCTCATGCAGCATCGCTGTTATCTACCACTGACAAACTCAATAGGGGTTTTGTAGGCTGTGTGAGTAGCACTCAGCAGACACACCAACATCTCCATAAGTTTCAAAGCAGCTGGCCAAGCACAGCCTCTTCACACAGGACTGTCGGCTTCTGTTCTGCTGGGTTTGCTGAGAAGCAAAGCTACCGTACCACTGACTACAAATCGAGGTCTTCTAATGAGTCCTGGCGTCTAAGTGCCTCTGGACAGGTAGATAATCTGAATGTGGATGATATGACGACGTGTAGTGATATCAAAGAGCGAGTACCCAGTCAAGAATGTCAAGAAGCCCGGGAAGGAGCTACTGCTGCCCAAAACGCTCAGTCTCTAAAGGATCGCAGCAAAGAGACTGTTTGCAGACCCAAACAAAGGTTATTAGATGAGTCATCTGATGAGGAAGAAGGGGAGCAATGTCGAATCTGCCACAGTGGCGAGAGTTCACCAACCAACCCACTGATATCACCGTGCCTGTGTTCAGGCAGTATGCAGTTCGTTCACCTCGACTGCCTGAAGAAATGGATTAGGACAAAAATCGAGTCAGGGTCAGGGCCCTATACTGTCAAAAGATGTGAACTTTGTATGGGGAGGCTGACTCTGGACCCGGATACACTTCACTTGGACGTTTACTACAGAGAACAACAGCAACAGATGTTGGGCAACCCTGACCTGTATGATCTCAATGATGTGTTTGGAATGCTAAGGCGGCCAAGACTTGTGCACGTTCCGATATGGTCATTGCTTTCCAACCTAAGGAGAAGACTCCTCAGAGGGAGGAGGAACCCCT
CACCACAAGAGACATCGGACACTTGATCCTCAGCCAAACTCCTTTTTTTTCCACATCTTTGCTGATGTGGAACTAAACACACATGTTTTACAATAAACCACCATGCATCTAA\n>XR_006693933.1 PREDICTED: Macaca fascicularis uncharacterized LOC102122981 (LOC102122981), ncRNA \nTAGAAACAGGGGTTTCACAGTGTTGACCAGGATGGTCTCGAACTCCTGGACTCAAGTGATCCTCCCACCTCAGCCTCCCAAAATCCTGGGTTTACAGATATGAGCCACTACGCCCAGCGTGACAGAGCATGACTTCTGAGGGTAGGTCATAAAAGACATTGTGACTTCCGGTTTGTTCTTTGAACACTTGTCTAAAGGAAGTCAGCTGCCATGTCTCAATGACACTCAAGTGGCCCTATGGAGGGGCCTAAAACAGCATCCTCCCGCCAACAGCCATCAAGGAACTGAGGAACTGAGGCCCTTTGCTAACAGCCATGAGGGCACGATCATGGAAGTAGATCTCCCGCCCCTGTCAAGCCTTCAGATAACTGCAGCCCCAGCTGACTGCTCAACTGCAACCTCGTGAGAAACCCTCAGTTAGGACAACCCAGCTAAGCTATTCTCAAATTCCACAGAAACTGTGAAATAATACATGCTTTTGTTTTAAGCAACTAAGCTTTGGTTAATTTGTTACACAGTAATAGACAACGAATACAGCTGGCTTATCAGCCTCTCCTCTTTTTGCAGGCTGCAGGACTGCCGAGCTTCGAGGGAGCTGAGAGGAATGCTGTATTCAGGCCCTCTTACCTGACTTGACCTTGAGACCAATGGGTGTGTTGGAAAGAGGCTGGCAAGGTCTGAGGGTACAGCCTGTGGCGGAGGTGGGGCCAGGCAGGCCCAGCCCCTCAAGCCAGGCCGTGGGCCCCAGGGCCCTGCCGGATGGCCGCTCTCTGGGAGCTGCATGCAGAGGTGCCTGGCACCCCCAACCGCGCCCCACGGGGCACCTGACCTCCAGAGGAAGGAAATGAGTCTGGAGATGCCGTAGACGAAAGAGTTGCCGCTTCCTCCGCCTGGGATCACTCACAGATGCCTCAGGGAGGCGGCCGGCCCTGAGTCACGCTGAGCGCTGAGCCGGCTGTGACTCAGCGGGACCGCGGTCCCTTGGTTGCGCCTGGGTTGATTTGCGCCCCGCTTGTTTTCTGCAGAAGACAAGGCCGTCTCGGATTAGACTGCCCCTCCTAAACAACCAGCAACTGTTTTTCTTCCTCAAAGTGCAGTTTCCCTCTGGCACAACCAAAAATAAACACAAACCAGGCTCCTGCCCAAGGAGGAGGGGGGGAGGAAGACAGTCCCCGGGGCGCCCACCGAACGCATGTGAGAGCTCGCAGGTCACCTGCTTGCATGAATCTGTGAAGCAAGCAGCCATGAAGGCAGAGAAACCTCTCCCATCGCAGGCTGCCAGCACAGAGGCTCTGATTGTTGAGTTGGCGCTCTGTTTATTTCCCCAACTGCCTCCTCTCAGGTTCCGTCCTAACTGCTGGACTCACTGCCGCGTGGGCCTGAGCACATTTCCTTGGCAAATTGTCCTCAGTGGAAGTTTTTTCTTCTCGATGTGGTGAGTCAGAGCTGGCTCACACACAAACACCAAGCAGCAGCCTCAGGGACTAAAGTGCTTTAAGGACACGAGGACCTATCCTCCCTCCCCCTATCTCAGTGGGGTGGGCCCACAGTTCCTGAAAGCTGGCCCAGTGCAGTTCATTTGACAGGCAGAGGCTGAAAATGCAAATCACCCCAGCATAGGTGAGTGCACAGCAGAGACCACGCCCGGGCTGCAGCTTATCCTGAAATCCTGAAGGCAGGAAACACCGTGCCCACAGGAAGAGCTGGGAAGCCTGAACCATGCTAAGATGTCCCAGGGTGAACCGGAGCCACTGGTTAGTCACACTGACTTCACATTTCCTTCGTG
AGAAGGAACTGAAGACAGATTCCAGACTTGCTGTGCATAGAATGTATAGTTCATTGCATGTGAGAACACAGCAACAAGGCACCATCTTGGAAGCAGACAGCAACCCTCA\n>XM_043685587.1 PREDICTED: Chiloscyllium plagiosum uncharacterized LOC122546987 (LOC122546987), mRNA \nATGGGAAATCAGACTTCTAGACTTACTAAGGAGAAGTCAGGGAAGACTGCAAATGGGAAAGAAATACCCCCCGATAGTCCACTAGTTCGGAAGGTAACTCTATGGACGGACAGTCGTAGAACGAAGGACTTAAAGAAAGACACCATGATAAAATATTGTTGTTTTATATGGACCAAAGAATCTATCCGCGCCCCCTCGGTAGTTTGGCCCGAGTATGGTTCTGATGAAGACTGGGTGTGTCTAATCCTAAATGTATATGTTAACAGAAAACAACCGTTTGACCCAGAAGAGAGCAAATACGCCGCCGCCTGGTTGGCGGGCGACGGCGAGAGTCCCACGCGTCTCTATCCTCTGATTCCCCAAACAGACCCGAGGAAGCCCCAGAAGTCTTGGGACATCCTCACTGACGGTGCCGTTGGGAACGAACGGACCGGGTTCGTAGTACAACCTTTAAATTCTGGGGATATCCGGCAACTCCGTAACGAACTACCCCATCTACTGGACGACCCCATCAGTGTGGGAATACAACTGGACCAATTTCTGGGGCCCAGTATATACACATGGGCTGAACTGCAGGCCATGATGAGAATACTATTTAATTACGATGAAATTGTTATGATCCGGAATAGTGCAATGGCCATTTGGGATAGGGAGCATCAGGACGGCCCTCAGCGTGGAGAGCAGAAGTACCCCTTAGAGGACCCCCGGTGGGATCATAAAGACGCGGGGGGATGGGCCAATATGACAGATCTCAGAAGCCTTATAATCAGGGGGATCCAAACCTGCGTGCCCAAACAGCGGAATTTAGCGAAAGCATTCGAAGTTGGACAGAAAAAGGATGAATCCCCGAGTGAGTTTTTAGACCGTTTGCGGGAGTCCATGCGAAAGTATTCAGGTTTAAACCCCGATGGGGAAATAGGCAAGGGCATGCTTAAGGTGCACTTTGTGACTAAGTCATGGCCTGACATTCAGAAGAAATTACAGAAAGTGGAGGATTGGGCTGAAAAAGATGTTGCAGAATTATTACGGGGAACACAGAAGGTGTACGTTCAGAGGGATGTAATAAGGGAGAAACAAAAGACAAAAATGATGGTGGCAGCCGTACGGGAAGCTTGTAAGTCCACCGGAATGGGGGAGGGAGGTTATGGGGTGGAAAGAGGAACGTCGAAGAAAAGTTGGAGAGGGAGAGAAGAGAGACGGGGCAGAAGTGAGAGAGGAGGATCTTATGGAATTGAGCGGCCTCAGGTGGCCGGATGTTATCATTGCGGGAAACTGGGACACTTCAAAAGGGATTGTCCCGAGTTTAAAAGGGAAAGAGAAGGGATGTATGAAATGGAGCGTGAACAAATGGATTAGGGAAGTCAGGGGAGGATCGGACAAACGTGCGAATTGTACGCCTTGCACC\n>BT024918.1 Arabidopsis thaliana At5g50110 mRNA, complete cds 
\nATGAACCTTACAGCAACTAAAGAAGCTGATGAAGTAATGGAGAGGCATATCGAAGATTCTCTTGCGATATTGCCTCCTATAAAGACTTGTTACAACTTACATTCCAGTGATTTGTTTGATCACATCAATTTAATCGATGTTGGAAGCGGGGCTGGTCTTCCTGGGTTGGTTCTAGCCATTGCATGCCCAGATTGGAGAGTTACTCTACTGGAGTCTATAAATAAGCGATGTGTTTTCTTGGAGCACGTTGTGAATGTTACCGGGCTTACAAATGTTACAATCGTTAGGGGCAGAGCAGAGAGTTGTGGGCACGATGTTATGTACAGAGAGAAGTTTGATGTGGCTATTGCAAGAGCTGTCGCGGAGATGAGAGTCTTAGCTGAATATTGTCTTCCTCTGGTTCGGATTGGTGGATTGTTTGTAGCTGCTAAGGGTCATGACCCAAAGGAGGAAGTTCAAAATGCAGAAAATGCTGTTCGCTTGTTGGGTGGTTCAATACTACAAATTAGTCCAGTGGATTCACATAGCCCATACGGACAGCGGACAACGGTTGTTTGTCGTAAAGATCATTCCACCCCACAAAAATATCCACGTGAAGCAGGTACTCCTGCTAAATTACCGTTGTAA\n>XM_041034442.1 PREDICTED: Toxotes jaculatrix potassium channel subfamily K member 15-like (LOC121179542), mRNA \nATGAAGACGCAGAACATCAGGACCCTGTCTCTCATCCTCTCCATTATTTTCTACCTGCTCATAGGAGCCGCCGTCTTCGACGCACTGGAGTCCGAAAGTGAAACTTCGAGGAAAAAGACGCTGGAGCAGAGGCTGAACGAGCTGAAGAAAAAGTACGGCTTCACCGAGGATGACTACAGGGAGATTGAGAGAGTGGTCCTTCTGTCGGAGCCGCACCGAGCCGGCAGGCAGTGGAAGTTCACCGGCTCGTTTTATTTTGCCATCACTGTGATCACCACGATTGGTTATGGCCACGTTGCTCCTCGAACTGATGCTGGCAAGGCCTTCTGTATGTTTTACGCAGTCTTGGGGATTCCTTTGACGCTGGTCATGTTCCAGAGCCTGGGCGAGAGGATCAACACTTCTGTCCGCTACCTGCTGCGAAGAGCCAAGCAGGGCCTGGGCTTTCAGAAGACGGAGGTGTCCATGGGGAATATGGTCCTGGTGGGTCTGCTGTCTTGCATGAGCACTCTGTGCATCGGAGCTGCAGCCTTCTCCCATTTTGAGGACTGGACCTTCTTCAACGCCTACTACTACTGCTTCATCACACTCACCACCATCGGCTTTGGGGATTTTGTAGCCCTGCAGAAGAAAGATGCTCTCCAGAAGCGACCCCCCTATGTGGCCTTCAGCTTTATGTACATTTTGGTCGGGCTGACAGTGATTGGGGCTTTTCTTAACCTGGTGGTCCTGAGGTTCCTCACTGTAAGCTCAGATGAGCCCGACGTGAGGCTTGAGGATGGGGAGGTGTCACACGCTGAAGCAGAAGCTGCTGAAGTGGCATATAAAGACAGAGAAGATGGACACAGCAGCCAGTGCAACCTGAGCCTGCCCATGGAGGGGGGCACTAGCTGTACGAACCTCCTCCCTTCACCTGCAGAGGATCGCAGGCTTATTATATCCGAACAGAGAGAGCACTCTAAGCTCCCTGAACCCAGCAGACTCAGAGCCTTGTTCTCCTGCATCTGCTGTGGCCTGGACATTTACGACAGCCACCCTCCATCTCACCATGAGCAGGAGCGCGGCCACAGCAACCCCGTCTTCTACAACTCCATCTCCTACAGGGTGGACCAGGCCTCATGCAGCTCCTGCACCGTGTCGTCACAGGACTCCCCCACCAGCATAGCACTCTGCCTGGGCAAGAACAATCCTCACAGCAGGAGGAAGTCACTCTGA\n>XM_015424951.1 PREDICTED: Gekko 
japonicus serum amyloid P-component-like (LOC107121936), mRNA \nATGGCTGTGGAGCATTTGCACGGCGGGCCGACAGACCTCAAACAGAAGACCTTGGTTTTCCCAGAAGCGTCCAACACGGCTCATGTGGTTTTGAGGCCTGCGCGCCAGCAACCTTTGACCAGCTTCACTGTCTGCCTGAGATCCTACACAGACCTGAGCCGTGCCCACAGCCTTTTCTCGTACGCCACCAGGACGGTCGACAACGAGTTGCTGGTCTTCAAACCCAAACCCAACCAATACAGTTTGTATGTGGGGGGGTCAGTTGTGACCTTCAGCGTTGCAGACAATCCGGTCCCCAAACCGCTGTGGGAGCACATTTGTGTGAGCTGGGAGTCCGTCACAGGAATAGCAGAGCTTTGGCTGAACGGGGTTAGCTTGCCCCGCAAGGGAATGAAGAGAGGTTACACCATCGGTCCGGAAGCTTCTATCGTCCTTGGGCAGGAGCAGGATTCCTTTGGAGGAGGCTTCGACACCAACCAGTCCTTCATAGGGGAGCTCATGGATGTGTCTATGTGGGATCGGGTGCTTTCCTCAGATGAGCTGGTCGTCATTCAGAACAGCGGCCGCCTTTCCAACTATTTGATTGACTGGCAGTCCCTAAATTACGAAATCAAAGGCTATGTGGTGGTGAAGCCCTCCTGGGGGTGAAGCCCTCCTTTGTAAGCCCCCCTGTAGGCTTCGCAAAACAAAGCAGAGAGCTGGAAACAAATCGATAGTCTTCCCCATAATTAATGTTTCTGTTAGTAGTAAGGCAGCATTCCTACAAACGATTTCCTGGACGTAAACTCCTTGGAGTAGCATGGGACTTCCTTCTGAAAAAGACCTGCAGAGACTTGTTCTCGTAGTCCTCAATCTGTTTGTGCAAACGCATTCATGAAGCTTGTAGATCTGTATTCTCCAATGAAAGATTTCAACCCCCCCCCCCCAAGTATTTTGCATTCCCTGACACC\n>XR_005453858.1 PREDICTED: Tachyglossus aculeatus small nucleolar RNA SNORA7 (LOC119936833), ncRNA \nCCCCTCTTAGGGTCACACCTGGAGAGTTTCTAGTACTCTACCAGTCTCAGTTATGGGAGGGAGAGTCAAGTAGAGGCATACCCATTCCATTCCTAGCTTGGCCAGTGACTAGCGAGTGGAAGACAATCTGCTACAAGT\n>XR_008035993.1 PREDICTED: Dreissena polymorpha uncharacterized LOC127851864 (LOC127851864), ncRNA 
\nTTGGCAAGCGTGGTTAAATGTTATCCTGTCACATAACGTGTTACATAGTTACTTTTGTTTACTGGAGACATAACCTTGCGAAACAAACTTCAAGTTGATTTTAATTAGACTCCGTTAAGGTTGACATTACGTGTTGAGACTTTGGACAAATGCTAGATTGGTGTGTTTTGTTTTGTTTAATAATCAATTAGCTTTAATACCTAAGTTATTTGAGTTAAATCAAATATATTGAGATCAAAAGCTTCAGGGTTGAACAAAATGGCGACCTTTTCACAGTCCACCATCGAAAAAGGATCTGACATCGTCCAAGACTTCTTGTGTTCGGCGTGCGAAGACAAGAAACTGGAAATCTCAGCTGATAATATTTGCGGATCTTGCGTGAAGTTTTACTGCCAATCATGTATTCATTTGCATCGCCAGTTGTTTACAAACCATTCTACTCATGGAAGGGGAAATATGAAGAAATGGCCAGTTGCGAAGACGGTGGAAGATTTTCTTCTTAAATGTGATGTTCACAAAGAAGAAAACTTGGCAATGTTTTGCAAAGACCACTGCAAGCTGTGTTGCAATAATTGTGCATTCCTTAATCACAGGCAATGCCAAACAGTGATGATCTTATCAGACTTAGTAAAACATACCTCCACAGACCTCAAAAAAGTATCAGCTACTATCCAAACTACTCTGGCAGAACTTAAAAAACTTCAAGACAACCAGGAGGCAAGCGTACGGTCTGTGCAAAGTTCCTTCGATGAGCAATTAAAAGAGATACAGGAAACTCGCAAAAAATAATTGAAGCCTTAAACATGCTTGAAAAGAAGACACTGAACGATATGAAAGATGCGCTGGGAAATCTGCAAGCCTCTCTAAAAGCAAATGTTGACAAATGTGCCACTCTTCGTGATCAATTAAAGCAACTTGGAGATGCAATACATGACTTAAGTGATAAAAGCAAGCAATAACTATCTCTTATAGCCAGATTTAAATGCCAGGACAAAATACAGCAGTTTGAAAATGAGAAGAAGAACTTTGTTCAAGTAAGATCTTCAATCACTTTCCAACCTAATAGAAAAATTGTGAAGTACCTTTCTAAGTTGTCAGGTCTTGGGAGGGTTGAAACCAGTACCCAGATATTGACAATGCCGGGAAATCCAGACAAAGTAATAAGGCTGAAAGAGAAGTATGAGTATGACGTGCGCACGCGAGGTGATTCATATGAAGAGTATGCAGTATGCAGTATCAGAGACATTTGTGTTCTCCCTAGGGGACAGGTCTTGGTTGCAGACGCGATGAATAATAATGTCAAGCTGTTGAACCAGCAGTACAAGGTGTTGAGTCACTGTGTTAAACTTGATACGCCATCGGGCATTTTTCAGATCACACCCAGTGAGGTTGGCGTCACTTCTGGTTCAGTAGTCCAGTTTATCAAAGTCAACTAAAGCCGACTGGTGACAGACAGAAAGCTAACATTACAACGTGAATGTAAAGTAGATGTATGTGCAGTGAGCCCGACAGGTGACAAATTGTACATCACCAGCCACTACCAGCACAGGATACTCACCCTTGCCAGAGATGGATCAGTCCTTGCCACATTCAGGGACCAAGAATTACAATGGCCAACTGGTGTACACGTTACATCTGCAGGCCAGGTGCTGGTATGTGGATATGATTCAAAGACAATCATTCAGGTTAACCGTAATGGCAGTAAAAAGCTGGCAACTCTGGCTACAGAGAGGGATGGGCTTCAGGGAGGCACATGGTCCGTCTGCTACAACAGCAACAATGATTCCATTATCGTGGGGCAGTTGAACAACAGGATACTGGTGTACAAATTACAATAGCTTATCATTCTTGTATTTTATATGAGTAACAATAAGTGATATACATTAAAATAGCTATTACATTGAGTGCTTTGTTACTTTGCAAAAATATTTTAAACATATAATATGTTTGTAGGAATAATGTATGTAAATAACAATAGTTGTTTATGTAATAGTGCTG
TGTAACCATGCAAACAAACTTCAAATGTGCATACCAATAGTTTTGTAAAAAATAATCTAATATTTTTTTTGTTTTTAAAATCTAGCGTGTTTCTTAATTGATGAGTCTTAAGTGGCAAATATGAATGTTTACTTTTGTTCTTAGAACTCAATATCTTAACATATTATTTATGATACAATATGTTTGTAAAATAGTTTATAAGACATTTTTTACTATAAAGAACTCGTACAGAACAATCATGCTAGTGTTAGACCGTCATGTATAAGATGCATAGCAATTAGGTTATTAATTTATTTCTATTTAAGTAGCAATCATAAATCTATCTTTAACTCACTGGTCTATAAAAATAGCTGATATAATGTCAGTAGCATTTATTAAAACACCTTTTAAATG\n>XM_028615390.1 Sodiomyces alkalinus F11 IKI3 family protein (SODALDRAFT_45849), mRNA \nATTTGATGCGCAAGAGTTACATCTGCGGAACCCCCACCAAAGTACCAACGTAGTCCCTTTTCATACCTCGAAGATTTTCATCGCAACCACAACGGCAGCAGCACAAAGCGTCCATCGTGACCACCTCAGTCAATAACTCGAAGACGACCTCCACCTCCCTCTCCCTCCCAAGCCCAAACGCCGGGACAGGGAACACTTATTATGACCAGTGATTAGTGACTTCATCACCAACCCGAGAATGCGGAATTTGCGCAACATCCGCTTCGATGCCTGGCGCCTCGCCGACATCACTTCCACCTGCTGGGACCCCGCCAAGGATGAACTCCTTTGCACTCTAGGTCCGACCGAGACGAGACGCTCCATCGAGCTTGTCCGGATTGCAGATACATTTGAGCTACAATCTCACACTATTGCTTCGTGGGACGTCCCGAGTCCCCATCCCGATGTCCCAGCCGACTCAGTAGTGAGCCTTCACCACTTCAGCGACACGTCTACCACGTGTGTTATTCTTGCCGGCGGCGATATCGTCACTATCAAGGAACCCGATGCCTTCTCTTCCCAGGATGACGTCCACATTGAGATTATCGGCTCCATCGATGCCGGAATTACGGCGGCCCGCTGGTCTCCCGACGACGAGCTACTCCTCGTAACCACCAAAGATGGCAAGGCCGTCTTCATGGGCCGCACCTTCGATGCCATCGCCGACGTGTCCATGACCTCGGAGGACCTCAAAGCATCCAAGCACGTCTCCGTCGGCTGGGGGAAGAAGGAGACCCAATTCGAGGGGCGGGGCGCGAAGGCCCTCAGAGACCCCACCATCCCCGAGAAGGTGGACGAGGGCGTTCTCAGCCCGAAGGACGACGGCTCGTCGTCCATCAGCTGGCGCGGGGACGGCGCCTACGTTGCCGTCAACTCCGTCGAGGGCGGCTTTCGGAGAGTCGTGAGGGTGTACTCGCGAGAAGGCGTCCTGGACAGCGCGAGCGAGCCTGTTGATGGACTGGAGGGAACTCTGAGCTGGCGGCCGGCGGGGAATCTCATCGCCGCCATCCAGCGTCGGTCGGACAGGATCGATGTCGTGTTCTTTGAAAGGAACGGTCTGAGGCATGGCGACTTTACCTTGCGCTCGCCTGGTGGAGATATCCTGTCACACGATGGGATCAGGCTGGAGTGGAACAACGACTCGACTGTTCTTGCCGTCATCTTGTCGGATACGATCCAGCTCTGGACCATGGGGAACTACCATTACTACCTCAAACAAGAGGTGCCCATCACGTCCCCGTACGTCCACTTGGCCTGGCATCCTGAAAAGGCCTTGCGCTTTGCCGCGGCGACGTCCAGTCTCCTCACCTCCGCCGAGTACATTTTCACTGTGGCAAGGGGTTCTCAGAGGCCACCCCACGATCATGGCGCCGTTGCGGTCATCGACGGCCACACGGCGAAAATTACCCCCTTCCGGACGGCAAACATGCCTCCTCCCATGACCATGTTCGACTTGGAGGAGGCATCGAGTGTTGTTG
ACGTCGTCTTTGATTCTGCCAATTCCTCCATGGCCGTCCTGCATCGTACCGGAATAGACGTCTATGCATGGCAAACTAAAGGAAGCCGCTCCCTTCACCCCAAGAGGGTGAGCCGAACAACTTTCTTTGAATCATCATCAACGGACGACTCGCCTCGGGTTCCACTTCAAGCATGCTTTTCCTCGTCTGAAGAAATCTCTGTCCTCGTTCACGACGGAGGGGACCTAAAAGTTGAAGTATACAGCTTTGGGCCTGGGGATAGTAACCTCCAGGATGTCGTGGAAATCGATCGATCGGAGCCGATTTCTTCCATTTCGAGCTACTGCGGTCTACCCGATATAGGGGCCTACGCCCAAGATCGCTCTGGAAAGTTATACAACTTATCCGGACAACAGGGCCTTATGCCTCTCGGACTTCGACTGCCCGTCCAACTGCCATGGTGTCAGCTGGTTGCCGTCGGAGACAATACGGTGGCGGTGGGAATGGCTCGCAACGGACGCCTCTACGCTGACAGTAGGCTGATAGCCAAGAACTGCACTTCCTTTGTGGTTACTGATGCCCATATCATCTTCACAACAACCAACCACTTCCTCAAGTTCGTCCATCTGGTGGATCCTCAAGAAATGGAAGTCCCGGAAGACGACCCTGAGGTGGATGAAAGGTGTCGCAGCATCGAGCGAGGTGCTCGGCTCGTCACGGCCATGCCTACCAACATGAGCCTCGTGTTGCAGATGCCCAGGGGTAACCTTGAGACTATATACCCTAGAGCCATGGTGGTCGCGGGTATCAGGCAACTCGTCGAGGAGAAGAACTACGGTCGTGCTTTTTCATATTGTCGTACACAACGGGTGGACATGAACATTCTCTATGATCACCGCCCGAACCAGTTCCTAGCCAACGTTGGCCTCTTTCTCGACCAGATTCAGGACGTGGCATATATCGATCTCTTCCTCTCGTCTCTCAGAGAGGAGGACGTCGCCCAAACGATGTACAAAGATACCAAGCGGACAACAGCTCGCGACCCGGACATTATCGCCGAGGAAGCGGCCGCAGATTCACTGGCTCCGCAGAACTCGGGGAACAAGTCCAAAGTCAACAAGATCTGCAATGCTGTTCTCAAGGCTCTGCAGCATAAGAAAGAAACCCACCTCCAAAACATCATCACCGCCCACGTCTGCAAGGTGCCTCCCGCCTTGGATGACGGCTTGACTCTGGTTGCCGAGTTGGTGCAAGAAGACGAGAAGCTTGCAGAGAAGGCCGTAGAGCATATCTGCTTCCTCGTAGATGTCAACCTTCTCTATGACCATGCTTTGGGGCTTTACAACCTCGACCTTGCCTTGCTCGTTGCCCAGCAATCACAGCGAGACCCGCGGGAATATCTGCCCTTCATCCAAAACCTCCACAAACTCCCCGAGCTTCGCAGACGGTTTGAGATTGACGACCACCTTAACCGGCGATCCAAGGCCCTAGCACATCTGAAGGCGTTAGATGCGTTTGACGAACTACAGGCATATACTACCAAGCACGCTCTGTACCAAGACGCACTCGGCCTCTGCAGGTACGAGAGGCAAAGACACCGTACTCTCATCAACCTCTTTGCCGAATATCTCGAATCCAAATCCAAGTTCCGGGAGGCTGGTCTAGCCTTCGAGTCTCTCGGGAACTACGAAAAGGCCATGGTCTGCTACCGCAGCGACGGCGCCACGAGCTGGCGCGAGTGCCTCTTCGCCGCCCAGCAGGTACAACCGCCTCTCTCCAAAGAAGCGCTCACCGACCAAGCCACCACCCTCGCCGAGGCGCTCACAGAAGCCAAAGACCACGCCTCAGCGGCGACCCTGCACCTGGACTACCTCGACTCCCTCGAAGGCGCCGTCCGCTCGCTCTGCAAGGGGAACCACTTCGCCGAAGCGCTCCGCCTCCTCGCCCACCGCAGCCGGGCCGACCTCGTCCCCTCCGTCTTCGACCCCGCCCTCGTCGACACCCTCAGCACCACCACCGAG
TTCCTGGCCGACTGCAAATCCCAGCTCCGCGCCCAGGTGCCCCGCATCCTCGAGCTCCGTCGCCGCGCGGCCGAGGATCCCCTGGCCTTCTACGAAGGCGAGCGCGCCGGCGGCGCCGACGGGATCCCGGACGACGTGTCGGTGGCGGCCAGCTCGCGGCTCAGCACCGGCGGCGCGAGCTTGCTCACGCGGTACACGGGCAAAGGCGGCGGCGGCGGGGCGAGGACGACGAGCACGGGCACGGTGGGGACGGGGGTCAGTCGGGCTACGAGCAAGAATCGGCGGCGCGAGGAGAAGAAGCGCGCGCGGGGCCGCAAGGGTACCGTTTACGAGGAGGAGTACCTCGTGAACAGCGTGAGGCGGCTCGTGGACCGCGTCGGTGCCGTGCGCGGGGAGGTTGGGGCGCTTGTTTTCGCGTTGGTGAGGCGGGATATGGCTGAGCGGGCTCGGGCGGTGGAGACGCTGGTGGATGAAGTTGTGGAGGGATGCAGGACGGCTGTGGCGGAGGTGTTTGGATCCCCCGAAGAAACCGAGCAACAGGATGGGGAGGACCCGAACGAGGGTCTGGCTGGTGGTGGTGGTGGTGGTGGTGGTGGTGTTGGTGGAGACATGGGATATGTGGCTACAGGAGGTGCGGGTGTCTTCCATGAATACTTGGAGGCGAGGAACAGGAGGCAGGAAGTTCCCCTTGTCCAGGCGGTCCAAAAGCTATCCTTGCTCGGAGGATAGCGTAGTCCTAGATTATGGCAATCCACATAGATGATGTACATAGAAACGATTTTTCCAAGGTGGGAAAATTCCGGAACCATTCACACGACTAAAGATGATCATGATAGCTGCAGTGCTATCTGCTGATAAAAGTACACTATTGCACAAGTGAAGATCGCCT\n>XM_002560539.1 Penicillium chrysogenum Wisconsin 54-1255 hypothetical protein (Pc16g02130) mRNA, complete cds 
\nATGGACGCCTACCCCGAAGACTACGTCAATCACAATCTGCCTTTAGTCCTACTCTCAGGGCTGGAGGCAGACACTGAAAATGAGCCAGGAACACCATCGGATTATCCTCTGCTATCAGAGAAGGGGACGCATATCTTCTCAGACTTCCCACCTCTGAGCGGGGCTGTTGCGGAGGAGCTCCGGAGCTTGCTTCTAGAGGAAGATAGCTCTCAATCGCCATGGAAGTCTAGAGTTACTGTAAGCGGGAATACTACGATTGCGAATATTGGTTACCGCATCAAAAGTTCTGGCCGCTCATGCAGACTCCCTCCACAAAAAGCTGACCCCCCTATCCCCTCACCACCAACTACTCCCAGTGATGACCATGATAATGAACACTCCGAGCCTAGCGCACACTATGTCCTCCACTCCCCGATATCGCCTCTGTCACCGGGTTCCCCAACTTTCCCAGATGGCTTGCTCACACCTCTATGGGTAACTAAACACCAGGACCTGGTTCCAGCAGCAGTGATAAATTTCTTCCCGTTTTCGCTGGACCCAAATATGAACTCGCTGCGAGACAATCAACTCAAGATCGAGATCAATAGCTTGAAAAAAGAATGGCAATCCTCCGGGTACAAGACGCGGTTCGTGGTCGTTCTGTTATCAGAAGACGGAGAAGAAGGCGGCTATGAGGGCGAGATTGATGACCGAATTGCGGGGATTCGGCGGGCAACAAACCTTGACCCCAGGTCAATATTTGTGATTCCACCAGACGCGACTTCATCGGAACTGCAAGACTTTGTGAAATCACTCTTCTCTTTACTGCAACCGTCGGTTGTTGAATACTATCGGGATCTGTCAAAGCATGCCAGGCGTAAACGGAACAGGGGGAATATCCCCCCTCCGACCGCACCACCAACGACCGGAACTTCTCAGACCCTATCGTCCCAAGGCTGGAACGTACGGTATGAATTCAAGCTTGGAATTTTTGCCGAGTTTCGCCAAGAAATGGATGCAGCCTGCCGGAACTATGAGAGTGCGTACGAAACCCTGTTTGGGCATGAAGTCTTCGAAAATATTGCAGGCTGGAATCCTCGATTCAACGATGCGCGCCTTTTGGCCGACGCCCTGGCCATTCGGATTATACGCTGCCTGCTATGGACGGGCCAGACGACCACTGCAGCTCGGCTTTGGGTTGACCACAGAGTCCGTGTAAAGGATATTGTCGATCGCAGAGGAAAGGGCAGTAAACACTACGGGTGGGAGGCCTGGGAGGCGCGTTGGTCGATGGTAATGGCACAGCTTATCCGCCGAGCGGAAATTCCGCCTATCTCCAGCGAAATCTCTTCTGAGCAGCCCAGAAAGCTCTATGCTCTACCTGAGAAATCGATTCCAACCGGGGAAAGAGTCAGGCCCTGGGAACATCTCCATCACGAGGGTTACTGGCTACACCGTTCAGCGAAACATACGATGTTGCGACGTGCCCTTGCCCAGGAAATCCCCTTGGAAGATCGCAAGCCCCCCGGGCAATCACCCGCCTCACAACTCGCAAATAAATCCTACTTGTACGACACGTACCTTGTTCCCGACGCTCACGCCGAAGCACCCCAAGAAGGACGAACTGGCTTCGACCATTCTGGTCTAATATTAAGCACGCTGAAGGCTGCTATCGAGGAATTCGCAAAACGCGACCAAACAAGGAAAGTCGAGAGCTTGAGTCTTGAGGCGGCCGAGGAGTATATGCGTATTGGCTCATGGTCCGAAGCGCATGGCCTTCTTCGGCCGCTGTGGTCTACTCTTAGCTGGCGCCGCTCAGGGTGGTGGCATCTGATGGCCAATTTCGGGCGGGCGCTCAGAGAATGTGCCCTCAGGATGCAGGACAGCGAGACAATCTTGCGAGTGGACTGGGAGCTGTTGAATAAGAATCTCAAACCTAGATCTGCGTGGCATTATGACATCCACAAGAGTCTTGAAAGTTTACCCTCAGAAAAGCCTAAACCTTCTCTTATCCTTCGC
GCAGAGGATGTTATAACAAGTCTGACCGCGTCGCTGGTGTTCGAGAAATCTGATGGCAACGTTGGCGAACCTCTACATGCACAGCTTGCCATCACATCCTGTGCTCATAAATTCTCGGCGCCTATTCGGCTTTCGGAGGTCAAACTGGTTTTCGAAGGATGTCTTCGACCGGTAAAGGTTCAATCTGACCAGAACCAGGATGCTGACACCACAACCTCATGTTGTATCGCAACTCTTCCACTCCGGGAACCGAGCAACGCTGATACTGCGGTTCAATCCCCAGCCGGTGGACTGACCGCATTGACCAAGGTGTTTGACCTCACCTGTGTTCCTCGCGAAGCTGGTGAAGCCAGGGTTGCTTCAATCACCATGCTGATTGAAGAAGAACAATTCGATTTGGGTTATGCGGTCACTGAACCAGAACAGCGTGAATCGTTCTGGTGGGAGCAGACCCAGAAGGGCGTGACCCGTAGGAGAGTGGGCAAGGATAGGGATACTGGCAGGTGCAAGGTTATGCCTAAGCCTCCCAAGATCCGCCTCACAACTCCCAACCTGAAGCGGACCTACTACACCAATGAACGAGTGATGCTTCAGATTGGTATACACAATGAAGAAGACGAAGCTGCCGATATATCTGCTGAGATCAGACTATTCGGCACCGAGTCCGCAGCTCAAATCCAGTGGCTCGACGGCGACAGCAACCCCGAACTCCTCGAATCAGGCGCCAGCACTCCGATTGAGGGGCCGTCTCATTACTTGAAACGATCTGTGGGTGTTCTGGAGCGCTCCTCCCAGAAAACTCTTACAATTGTGTTGGTCGATACCCAGGAGGCTACGGATTTCACCTTGGAAGTTTCGACTGTGTACCATTTGGTGTCTGATACCCAGACCCCGATTATGAAGAATACTACCGTGGATCTATCATTTATTCGGCCGTTTGAAGCAAACTATGAATTCTTGCCGGCAATTCACCCTCAGCCATGGCCCAATTTCTTCGCAGTTAGCGACAACTTACTCGAGGATGGCTCTGCGCCAAGTCCTGGAGGCCTGTTCCAGAAATGGTACCTCAATTCCAAGGTAGTTTCCTTTGCACTGGAGCCATTGGTAATTGACAAGATGTCCCTGGTTCTTCTCGAAGCCAACGGGGGAGTCGTTTGCGATGTTCACTCAGAGGAGCTTGTGACTCCCGGAACACCACATCTCGCACCGGAAGAACTGCGAGAATCCAACTTCTGCCTCGATGTCCAGAAGCTCCTTCTCGGAGACCGCCGGCCAACTGCGCTCACCTGCACATTGGAGATCAATTGGCGCCGGCAGTCATCTGAATCTGTAGCTTCCTCGGACGCAGAGAACTCAGTCACAACCACCGTCCTTGATATTCCCCGATTTGTGGTCCCAATGGGCGAACCTCGAGTCCTTGCATCAGCCACCCCATCCAGCAGTATGGCGGGGTTGATTCATATGGGCTATGTACTGGAGAACCCCTCCACCCATTTCCTCACCTTCAACCTGGTCATGGAAGCTAGCGAGCACTTTGCCTTTAGCGGACCGAAGACCACCGTTGTGCAGCTTGTGCCGCTGAGTCGCCACACAGTGAACTTCAATTTGTTTGCAGCGAAGCGTGGCTTATGGATTCAGCCACAACTGGTAGTTATTGATACCTACTTCAACAAAACGCTCCGCGTCCTTCCAACGGGGGATATGAGGTCGGACAAGAAGGGGGTTCTGGTATGGGTTGATGCCGACGATTGA\n>XM_011327141.1 Fusarium graminearum PH-1 hypothetical protein partial mRNA 
\nATGACATCCTCCATCGTGGAGGCATTGGCGAATGTTCAACCACCAGAAACACCAGACAGCGAAGATCATGACATCGAAAACGAGACCCAAGAATCACCACAACCTACAAACGAACCTTCCCTAGACGACCCCCAAATCGGAAAGCCCATATCTCATGGCCAAATTGTCGACCTTTGGAAGCGCTCCAAAGCACAAGACGATGCAAACTACACTCTAGAACAACTCCTTCGCGGCGCATCCGTCTACATCCCTCCTCCACCACCTAAACCCGAACCTCTAACCAAGTGCAGTCTCCCGAATACAAAGCCCTCATGGCCCGTCTTCGCCGCCAAGAAGAAGCCCGCTCCTACGAACGAATGA\n>XM_039262098.1 PREDICTED: Dioscorea cayenensis subsp. rotundata uncharacterized LOC120253894 (LOC120253894), mRNA \nATGGCCACAGTTCAAGGACCAATAGTTCTGGTTCCTGAACTAGAACCGAACTGGCTAGGTTCCAGTTTTAGGACAATTACGGTTCTGCCGGTTCCAGCCCGAAGAAAGAGTAACTACTTATTGGCCCACTTCATCTCTCTTCTACTCAGCCCTAATTCCTCTTCTTCTCTGTTTCATCACCACGCTCCTCCACCATCGAACCCGTTGCCGATCACCCGCCCGTCACCACGGTCCTCATCTTCGCACCATCGTCGGACCCGTCGCCGGTCACCCACCCGATCACCACGATCCTCATCTTCACCATATCATCGAAACTCGTCACCAGTCACCTACCCGTCACCCGCTCGTCACCCACAAGCCTGCAGACCTTCTTTTTCTTCGAAGAAGGAAACGATCTTCATCTTCTTCTTTGATGATTCTAGGGTGGGTGGTGGTGATCTTCCTGATGACACTGTGTTGACTTGTTCTCACGGCTTAGAAAGGTGGGCTTATTACATTCTTTGTCTGGCTTCCTATCCGTCATTAGGTCCTCACATTATGTTTGTGATGCATTTGCATCAACATTAAAGGGCTCTCCAAACAGTGTTACAGTTGCGAGAACCCGAATTGAAGGAGGTGCAAAGGCTGTTTGGACTAGTGGAAGCCTGGTGCTTCAAAGTATACGAGCCATCTATGCTCGCTAAAGCATCTTCTTCTGGTTCGAAGTTGGGGAAATGATTGTTGCCTAATGATAGCCCTTGTGTATGTAATGTTGTACTTTGAGTTCCTCATCATCTGATTTGTATGTCATTTAAGCATTAGTGCTTTTCCAATTGAATCAACTTCGACAAACGAATATATTTGCTTGT\n>XM_040352829.1 PREDICTED: Rana temporaria histone deacetylase 9 (HDAC9), transcript variant X3, mRNA 
\nTCCCTCTATTGAGATGCTATTTTTAGCAAATCCTACTCGTGTCGCCACGGGCTGTGATCACATCTTTCTCTCCCCGTTTCTGCCTCCCTCCCATCCTCAGCCATCCCTTTCCCTCTCTGTCTGCAGATTTGAAAACATCACTGGCAGCGCTCCCCGGCGACTCAGCACTCATGTAACCTGCACGGGCAGCGAGCACGGCGTCAACTTTCTTCTGCTTTGTGTTGTACGCTTCCTGGCAGCCTCCTTTCTGAGGATGGATGGTCTGGATGAGCGGCCAACTTCTCCGAGCAGCTACTGAATGAGCAGCAAGATCCTGCTTTTCAGTTACAAACCACTGAAATACATTCCTATCAGATCTGGGATCTCTATCAAACAGCTGGTCGGCATGTCTTCTCCAACCATGAGCACCACAACACAGTCAGATGGGGTATCTGGACGGGAGAAGCTCCTGGCACAGCACAGAATGCACAGCATGATCAGTCCAGATGTGAAGACTGAAGTCCCAGTAGGTTTGGACCCCATCACACCACTGGACCTACGGACAGATCTAAGGACAGTCATGCCTATGTTAGATCCTAGCTTACGAGAGAAGCAGCTGCAGCAAGAGCTTTTACTGATTCAGCAGCAACAGCAGATTCAGAAACAGCTGCTCATTGCCGAGTTTCAGAAGCAGCATGAAAACCTCACAAGACAACACCAAGCCCAGCTGCAGGAGCACCTCAAGCAAGAACTTCTAGCAATGAAACAAAAACAAGAGATCTTAGAACGGGAGAAAGAGCACAAAATGGAACAACAGAGACAGGAACAAGAAGCAGAAAGGCATCGCCGCGAGCAACAGCTGTCTCACCCTCGCAGCAAGGACAGAGCAAAAGAGCGAGCCGTTGCCAGCACTGAAGTCAAGCTGAAACTACAGGAATTCCTTCTGAGTAAATCTGCCACAAAAGATTCCTATACAAACGGAAACAGTCATTCCATAGGCCGCCACCCAAAGCTTTGGTACACGGCAGCACATCATACTTCATTGGATCAAAGCTCTCCTCCATTAAGTGGGACCTCTCCATCATATAAATGTCCTCTTCCTGGAGCACATGATTGCAAAAACGACTTTCCTTTGAGAAAAACCGCTTCAGAGCCCAATTTGAAAGTTCGCTCTCGATTAAAACAGAAGGTAGCAGAGAGGAGAAGTAGCCCTTTACTAAGAAGAAAAGATGGCAGTGTTACCAGTTCATATAAAAAGAGAATATTTGAAGTGGCAGAGTCTTCAGTTAGTAGCAGCTCTCCAGTATCTGGACCCAGCTCTCCAAATAACGGCCCAGTTAACATGGGTGTGGAGAATGAAAACTCAGCATCACCATCCAGCTCACATGTCGAGCACTTGGTTTCCCAACAACATATAGTTCATCATGAAAAGTCGATGAATCTGCTAAGTCTTTACACATCTCCATCATTACCCAACATTACTCTAGGACTTCCAGCAGTAGCTCCCCAACTCAGTGCCTCATCTTCATTAAAAGAGAAACAAAAGTACGAGCCTCAGGCACCCAGGCAGGGGGTGTCACTGCCTGGATCGTATGGAGGAGCCCTGCCTGTTTCTTCAGCTCATGCATCCCTGGAGAGCAAGACCAACAGCAGCCACCAGGCCTTACTGCAGCACTTACTGCTAAAAGAACAGTTGCGACAACAAAAGATTTTAGCTACAGGTAGTGCTGCAATTCTTCACCAATCTCCACTTACAGCAAAAGAGCGGGTTTCTCCGGCGGGCAGGGTGGCGCACAAACTTCCTCGGCACCGGCCACTGCACAGAACACAGTCGGCTCCGCTGCCTCACAGCACTTTGGCCCAGCTTGTCATTCAGCAGCAGCACCAGCAGTTTTTGGAGAAGCAGAAACAATATCAGCAACAAATCCAAATGAACAAAATGCTTTCAAAATCAATCGAACAACTCCGCCAGCCTGGAAGCCATCTAGAGGAATCGGAGGAAGAACAGCATAGTGATTA
TCTGATGCAAGAAGAGAAGGTGTCCTCCTCGGCTTACATACGAAGTTACAGCAGTACTGACATCAGAACTGACCACCTCAGACCTGTGAAGGTGAAGGAGGAGCCACCGGACAGTGATGACGAAAGCCAAATGCCACATGAATCTATTCACAAAATGGCTTTTGTGCAACAGGTAATAGGCCAAGAAATAGCTCCAGGATTTGTTATTAAAGTTGTCCTTTGAACTTTAGGACTGACTAAGAAAAAGTAAGACCCCTACATTATGTAAATAGACATTTTTATTTGAATATGTTAATACAGGTTCTTTTCTTTTTTTAATCTTAGTAAAGCTGGTCATATACTAGATTTTTGAATAACAGTCCTTATAAATATCTGTGCAAACATTTGCAATGAAATTCTCAGTACATCAGATGACTGGACAAATGTCATTCGATTTTGGAGTGAATGGAATTTCCTAAACAAAAACTACATACACTATTGAGAAAAAAAATCCATCCTGCACCTTCAAGCTTTCTCATTACTATGGTTTAAAAAAAAAAGTTATTTTTATCCCACTAACAATTAGAAAGTCAAATGAATGTCAACAAAAATCCTATAATGCCGTGTACGGAAATTCCGTGGATTTTTTTTTCCGACGGAATGTTGACTACTTGTGTTGCATACACACGGTCACACAAAACA\n>XM_039196864.1 PREDICTED: Hibiscus syriacus probable prolyl 4-hydroxylase 3 (LOC120194605), transcript variant X1, mRNA \nAAATTCTCTGATACTTTTCATCCGAGTTTTACCCAGAATCAGGGGTGATTTTCTTCCACCGATCCCTGGGTTTTGAGCTGATTTCTCTCGTGTCATCTCCGTAAATTCAAGAATGCCGAAATTGAGACATTCTCGGTTGCAGGCGAAGAAGCTGCCGACAGCGACGCTTGTATTATTCATGTTGTTTATGTTAACGGTAGTTTTATTGATGCTTTTAGGACTAGGGATTTTCTCTCTTCCGATAAACAGTGATGATTCTCCGCCCACTGATCTTACTTCTTATAGACGCATGGCCTCTGAAAGAGGAAAAGGCTTGGGGAAAAGAGGGCAGCAGTGGACTGAAATCCTTTCTTGGGAGCCTAGAGCTTTCATTTATCATAAATTCTTGTCCAAGGAAGAATGTGAATACCTAATCAGTCTTGCTAAACCTCACATGGCAAAGTCCACTGTTGTTGATAGCAAAACAGGGAAAAGTACAGATAGCAGGGTGCGTACAAGTTCTGGTATGTTTCTGAGAAGAGGGCAAGATAAAATCATTAGAAACATAGAAAAAAGGATAGCTGATTATACTTTCATTCCTGCAGAGCATGGAGAAGGCCTTCAAGTTCTCCACTATGAGGTTGGACAGAAATATGATGCACACTTCGATTACTTCCTTGATGAATTCAACACTAAAAATGGAGGCCAGCGGATGGCTACTGTGCTTATGTATTTGTCAGATGTTGAAGAAGGAGGTGAGACAATATTTCCAGCGGCCAAGGGAAATGTTAGTGCTGTGCCTTGGTGGAATGAATTGTCTGAATGTGGTAAACAGGGTCTAGCTGTGAAGCCAAAGATGGGAGATGCATTGCTGTTCTGGAGCATGAGGCCTGATGCCACACTAGATCCTTCAAGTTTGCATGGTGGGTGCCCTGTGATTTCGGGGAACAAATGGTCCTCAACAAAGTGGATTCATGTTGAAGAATACAAGGCTTAAGCTGCTGTATAGAGGGTGCAGTTCTGAGGAAGTGTGATTGAAGCAACCCCCTTTAGACTCGGGTCCATCAATCTCTTTTTGACGGGGCACGGTGTCTCTAGACCTAATCCTTAGGTTGAGAAGTAATTGTTCTCGTGTATTCTGCTGGAAACTATCGGGTTAAGAGAATGCGGTTCATACGTGTTAGGTCCTATAAAATCCGATTGTAAAGTAGCTAA
ATAATAATGAATAGAAGTATCTTGGAGCTATTGTGAGTCTGGTGGTTTTAAAATCAAAAGTACGTACTAAAGTTACCGGCTATTTTGTTGTTAACACACTGATGTGGCCCATAGTTCATAAAAACAGAAACAAGCTGGATAGACAAAA\n>XM_045620325.1 PREDICTED: Harmonia axyridis 26S proteasome non-ATPase regulatory subunit 14 (LOC123681941), transcript variant X2, mRNA \nTATAAACCAGCTGTCAATCTGTCAGTGGAAGTCAAATATCGTCAAATAACAAACGGTGATTTGCAAAATTAACACTCCTTGTTTTTTCACTTTATAAATAAGAATATTAATTCATTTAATAGTACTTTTATATTATAGCCATGGATCGACTACTCAGGCTTGGTGGTGGAATGCCCGGATTGTCTCAGGCAGCCCCTGCTTCTGATGCTCCTGTTGTAGATACTGCAGAACAAGTTTATATTTCTTCATTGGCCTTATTAAAGATGTTAAAGCATGGAAGAGCAGGTGTACCCATGGAAGTGATGGGGCTCATGCTGGGTGAATTTGTTGATGACTACACCGTTAGAGTAATCGATGTATTTGCTATGCCCCAAACTGGTACTGGTGTAAGTGTCGAAGCTGTGGATCCTGTATTTCAAGCAAAAATGTTGGATATGCTTCGACAAACAGGCAGACCTGAAATGGTTGTTGGCTGGTATCATTCCCATCCTGGTTTTGGATGCTGGCTTTCTGGAGTGGATATAAATACGCAACAATCATTTGAAGCATTGTCAGAAAGAGCTGTTGCAGTTGTTGTTGATCCTATCCAGTCTGTAAAAGGCAAGGTTGTTATTGATGCATTCAGACTGATAAATCCTAATATGATGGTACTAGGTCAGGAACCCAGACAAACCACATCAAATTTGGGACACCTTCAAAAACCTTCCGTCCAGGCTCTCATTCATGGTCTAAACCGTCATTATTATTCAATCAGTATAAACTACAGGAAAAATGAACTTGAACAAAAAATGTTGCTTAATTTACACAAAAAATCTTGGATGGATGGCCTCACTTTGGCAGATTATTCAGAAAATTGTAGTGTGAATGAAAAAACCGTATCAGAAATGCTGGAACTGGCTAAAAATTATAACAAAGCCTTAGAGGATGAGGAGAAAATGACACCTGAACAGTTAGCAATTAAAAATGTTGGAAAACAGGACCCTAAAAGACATTTGGAAGAGAAAGTTGATGTACTTATGACGAATAATATTGTTCAGTGCTTAGGTTCAATGTTGGACACTGTAGTGTTCAATTAATTTATTATTTTTACAATAAATTATCAACATATTCAACTTCATCATTTTGATTCAATAGTTTTTCATTTCACTTATCGTTTGCTGCAAGTTAAACACTACAGTAGGCAAAAATTACTCCAATCTTCTATTGGAACTCATAATATTAATTCATTAATTCTCAAATGAACTAAAGTTTATTTTCAATGAGTATGAAAATATTAAGATAAATAAGGATTTTATAAGAATAAAATTTCAATGATCTGTAATAAAAAAACCAAATGTCAA\n>XM_018196263.1 PREDICTED: Atta colombica NADP-dependent malic enzyme-like (LOC108689497), transcript variant X2, mRNA 
\nCAATAATGGAGAAGCCAACGTACCTCGTCCGCCGATTTAATTACAAGTGAACGAACCGCAACCGGTTCGTCGTGCCGCGCGTTTGCTTCGGGAGTGCCGTTAAAGTTATCGGACTCAAGTTATGGTCCGCGCGCGATTATAGTGCACTATTCGCGAGTGTTTTACGGGAGTGGATGTCAATCCAATTCTGAGAGGAGGAGAAGGGAGAGACATCGGGCACCGGCGGAGCATTTACCTTGCAAATTATCGACGTTGCAGATAACTCCACTGTTGCGCATCGGGATGATAACGATGTTCAGAACAGACAGCTGAGAGACATGCCGCTATCGATGAATGGCTGTCAGAAAAAATTTGCTCGCATTCTAGAAGACTCGAGCGAGGAATTGTCTTCTCAGTCGCATGAAGCCATCCCTCTCTGCGCACGACACACAAAGTTACGCACGCATGACCCAGAGCAGTACACAACCTAACTGTAGCAAGAATAAAAGCATGTCGAGCTTGGAACGCGATCAGCTGGGCCAACGAGGAAGCGGCGACACGGTCTCCGCTGGTCTTCTGCGTGGCCTCGATCACATTAGAGATCCGCACTTGAACAAGGGTATGGCGTTCAGTATTGAGGAAAGGCAGATACTGGGTATACATGGTCTTCTACCGGCAGCCGTAAAAACCCAAGAAGAACAGTTAGAGCTTTGTCGTCTTAATCTGGAACACTACACGGATGATCTCTCAAAATACATATATCTCATAGGCCTACTGGATAGAAACGAGAAACTCTTCTACCGTTTGTTGGCAGAAGATGTAGATAAAATAATGCCATTGGTATATACGCCGACCGTGGGTTTAGCATGTCAGAAATTCGGTCTGGTTTACCGTAGGCCGCGTGGCCTTTTCATAAGCATTCACGATAAAGGCTATGTCTATGACGTTTTGAAAAATTGGCCCGAACACGACGTACGAGCAATCGTTGTCACGGACGGTGAGAGAATATTGGGATTGGGTGACCTAGGTGCTCACGGCATGGGCATTCCCGTAGGTAAATTGTCATTGTATACCGCATTAGCTGGTATCAAACCCCATCATTGTTTGCCTATCACTTTGGACGTCGGCACTAATACCCAGTCTTTGTTGAATGATCCCCTATATATCGGTCACAGACACAAACGTGTTACTGGACAAGAGTATGACGACTTCGTGGACGAATTTATGAAGGCTGTTGTGAAGCGATTTGGTCCGAATACGTTAATTCAATTCGAAGACTTCGGAAATGTTAATGCGTTCAGATTGCTTCAAAAATATCACAAGGAATATTGCACCTTTAATGATGATATTCAGGGTACCGCCTCTGTCGCTGTTGCCGGGTTATTGGCATCACTTCGTGTTACGCAGACAAAGCTCTCAGAGAATACAATCGTATTTCAGGGTGCTGGAGAGGCGTCATTAGGTATCGCGGCATTGTGCGTGATGACAATGCTAAAAGAAGGAATAACTAAGGAAGAAGCTAAGAGCAAAATTTGGATGGTAGACTCGAAAGGATTGATAGTGAAAGATCGTCCAAAAGGCGGACTGACGGAGCATAAATTGCACTTTGCTCGTGAGGATAAGCCAATCGACACTCTGTTCAATGTTGTTAAGACCGCCAAACCTTCGGTTATTATTGGCGCAGCTGCTATCAGGGGTGCCTTCACAACAGAAATATTGAGGGAAATGGCGCGTATCAATGAGAGACCCATTATTTTCGCTCTGAGTAATCCAACGAGCAAAGCAGAGTGCACCGCGGAAGAAGCATATATTGCTACAGAGGGAAGATGCTTATTCGCAAGCGGCTCGCCTTTTCCACCAGTCACATATAACAATAAAACTTACTATCCTGGTCAAGGTAATAATAGTTACATATTCCCTGGAATCGCGCTGGCCGTAATATGCGCTGGTATGCGCACCATTCCCGAGGAAACTTTCCTTATTGCTGCGACGGCTCTCTCCGACTTGGTAACGCAAGCC
GATTTGGACAGCGGTAATCTTTACCCACCATTGGCCGATATACAGAAATGTTCGTTGTGTATAGCATGTGCAATCATGAAATATGCTTATGAAAAATCTCTAGCAACTGTCTATCCGGAGCCTTCAGATTACGAGAGTTTTATCAAGGCACAATTATACGATCCAAGCTATAAATCGGCAATTCCTCCAGTTTATTCATGGCCAACAATAGAATTCTTTGGGAATCTTCCTCGCTTTTTTAAAGTCTGTTGACCGGGCTTATTTCTAACAAGTATGTGCAAACGTGATCAATATTTAATTATTAAAATTCGCAAGAATGAATTTGTGTTTAA\n>XM_051723159.1 PREDICTED: Myxocyprinus asiaticus protein EFR3 homolog B-like (LOC127455345), transcript variant X3, mRNA \nTGCATGCATGCACATGTGTGTGTTTGAGTGTGTATTTGTGTGCATGTGTATATATGTGTGTGTGTGTGTGTGTGTGTGCACCTGTGTGTTAAACCAGCATTGTTCCTGATAGAGGGAAAGCTGTGCCGCACTGTTTGGAAAATCCAAGGTCATTGAAGCCCGGTCACATGCACCATATGTGAGCGTGCATGTGTGATTTAGTGTCTGAGTGAGTGAGTGTGTATGTCTCTCTTCCTCTCTCTCTCTGGCTGGAAAGAGGCTTCAGGCAAAGAATAGTGAATTTCATCAGGTTTTCCATCAATGTACGGTGTGTGTGGATGCTGTGGGGCCTTGAGACCTCGTTATAAGAGGCTGGTGGATAACATCTTTCCTGAAGACCCTGAGGTATGTTTGTATTGCTATGGAGGCTTTGGACCAGCTGCTGATGGCCTGTCACTGTCAGAGTATAAACCTTTTTGTTGAGAGTTTTCTCACTATGGTGCGCAAGCTTTTGGAGGCAGACAAACCCAACTTGCAGATCCTGGGCACTAACTCATTTGTGAAGTTTGCAAACATCGAGGAAGACACACCATCATACCATCGCAGCTACGATTTCTTTGTCTCACGCTTCAGTGAGATGTGCCATTCCAGTTATGAAGATCCAGACATTCGCACCAAGATTCGTATGGCAGGTATCAGAGGTCTGCAGGGTGTGGTGAGGAAGACTGTCAATGATGAACTGCAGGCAAATATTTGGGACCCTCAACACATGGACAAAATAGTGCCATCCCTTCTGTTCAACCTCCAGCAGGAAGAAGGCATAGAGAGATCTCCCTCCCCAGAGACAGAGAAGGAAAGTCCAGTGGAGCTGACCGAGAGGTGTTTCAGAGAGCTGCTAGGACGAGCAGCTTATGGTAACATAAAGAATGCCGTCAAACCCGTGCTCATGCACCTTGATAACCATTCACTCTGGGAGGGCAAAACATTTGCTGTGCGCTGTTTTAAAATCGTTATGTACTCCATCCAGTCCCAACATTCACATTTGGTGATTCAGCAGCTGTTGGGTCACTTGGATGCTAACAGTAAGAACTCAGCCAGAGTGCGTGCTGGGATTGTGGAGGTGATCTCAGAGGCAGCGGTCATAGAGGCCAGTGGCTCAATAGGGCCGACAGTACTGGAGGTGTTTAATACTCTGCTGAAGCAGCTGAGACTCAGTGTGGACTACGAGCTCACCGGATCATACGACTCTTTTGGAAACATGGGAACCAAAGTCATTAAAGTGCACGAGGAGAGACAACTCCAAGAATCTGTCATCAAAACTATTGGCTCATTTGCGAACACGCTGCCCACCTACCAGCGCTCAGAAGTCATGCTGTTCATCATTGGTAAAATTCCTGTGCCAGGGATGTATCCGGCTCTGGGGTCAGCCAACACAGGGGTTGAGGGCAGTAGGATGATACAGATTATGCTGCTAAAATCTTTGCTGCAGGTAACAGCAGGATTCCAGTCTACGAACATTCTGACAACTCTTCCCACCTCATTCCTGGACCCTCTCTTGTCCTT
TACTCTGATGGAGGAGGCAGAGATCCGGCTACTTGTTCTGGACATCCTCATCAGCATCATTGATCGCCATGACAACCGTCACAAATTCTCCCCTGTCAGAATTGTGTCAGATATCGCTGTACTGAAACTGAAAGTAGACAAGTGCTCAAGGCAGGATAATCTCTTCATGAAGAAACACAGCCAGAGGCTCTACCGCCACATTTACCTGGCCTGCAAAGAGGAGAGCAGTGTCCAGTGGCACTTTGAGTCTCTTTATACGCTGCTGGGGTTGATCAGTGTTGAGCTGGCCAATGAGGAAGTGGTGGTGGACCTGATTCGACTGGCTTTGGCCTTACAGGACCTGGCCTTGACTGAAGAGGCACTTCCTGTGTATAACCGCTGTGCCATCCATGCTCTATCATCTGCATACCTGAACCTCATTAGCCAGCTGACCACTGTGCCCACCTTCTGCCAACACGTCCATGAGGTGATTGAATCAAGAAAGAAACTGGTCCCCTGTCTGCTGCCTGAGGATGTGCTTGTTGAGACCTCAAAGATCCCAGAGAAACTGGAGAAGGTGGAAGGTGAGGTTCTGTTCATGCAGGCTAAGATAGCGGAGATGCTGGGCGGCAGTGGATACAATACAGAGAGACTGGCCACTCCATACATCCCACAGATCACAGATGAAGACAGACTATCTAAGAGGAAGAGTATTGGTGACACCATTTCCCTGCAGTTAGAGATGGAGTCCAGAGACAGTCCAGAAAAAGAGCAGAGATCCAAAGCTGAGCAGATAACATTTGAAACCCTTAAACAAGCCATTGTAGACAGTGTGAGTGTGGAGGAGCTGGAGAGAGAACGCAGGAGGCAGGTGGTGGAAAGGTTTCAGACGGCTCCATTTGAGGAGATCGCAGCACACTGTGGGGCCAGGGCTTCCTTGTTGCAGAGTAAACTCAACCAAATCTTCGAAATCACAATCAGGCCTCCTCCGAGTCCGTCTGGCTCTGTCGGGAATGGCCGAAATCGTTCTGTACCAGTCTATGAAATGACGTTTCCAGACCTTTGTGTGTACTGAGAAAACCTGGAGCCACAGTCACCAGATACAGACCTATTTCAATCCCTACAATATTGTCACTCCTTCTCAATGTCCAGTTGAAACTATGCGTCTTCTAAACTGTGTCCTTTAGTTTAATATCTTTAGATAAAGATCAAAACTTGACTTGATCCCGAGGTGTTCACCAAAAAAGACAACCAAACCAAGAGAATATACATTGGTTATATATGCACTGTATCACTAAAAATGACAAAACAATGTTCACACAGCTTAATCTAAATGCAAATAGATTGAATGTATTTAGAAACATTTGTGCCATTGTCTGATACTAGCATACATAGCAGAACAAGGTTTTCATGTTTAATCAAATGTCCAGTGAATAGGCCAGGTTACTGTGTAAGTCTATTGTTCAGAGCAAGTGGATGATATTCTTGTACAAATAAAAAGTACAGCTGCCTTACATTTTGTATCTTAAGTTAAGACTTAAAGAATTGTTAAAGAATGTTCTCGGCATGTTTTCTGTAACTATGTTTTTCAATCTATTGATTATTAAAGTGACGGTGCACTTAAAGGTAGATAAATATAAGGTTGTTTGCCTGGTATATACTGTATTTCTTTGTGCATGTTTAAACCTTCTCTACATTCTGCAATAATATTTGTATTTAAAGCAATAATTAATGAATTTAATAATGCAGATTCTTCTGAGATAAAAGCTGAAGAAAAAATGCAACACATTTTGTTTGCGAACACTGGATGATGCAGTATTACAATCAGAACTAACAGCTTATTGACACGCTGTGTGCAAGAAAGTAAATTCAGTAGAGCCTCTGGTGTATTTGCATAGTAACGTCATGTTAATTATGTTCTAATTGAGTTCTGTACATCTGTACCTCATTACCACAAGAAATATGTCATATATTTCAAAGAATATGTCAGTGAAGGGTAGGAGTTTTCATTTGCTTAATAG
TCTAACAATGATTGTGTACATTTCCCAAATGACCATTTTCCTTTTTTGAACCAGAGTGAAGTGGTAACACTTCTCATAGTCCCCTACATTTGGGGTCTAAAGGGGCCAATTAGCTCTCTATTTGTTTTTGTTTTTTAAATTAGCTATGATATATGTTTGTTCCTTTTGTCACTTGTATAACTTTTCTCTCTTCATAAATCCTGTAATTTCAGGTTTACGTCAAGATTTGGTTCTCTCTTGTATTTTATTGCAGCACTTTAAAGATCATTGTGTAAATGTGGTGTATGCTAAAAAATATATGTTCTGTGATTTTCCACCTTGACATGTGAATGTGTTCTTGAGTGTCATTTTAAAGTGAATTATCTTTTATCGTCTCATATTTTCCTATTCCACATGAAAGTTTGCCTGTTTTTCTGCTATAATTCCATGAAGTCCTTTTAACTTTTTTTTTTCTTTTTAAAGTTATTTAATCAAGTCATTGTGTTTTTTGTGATGACTTGAATTTATTTACTGTTTCTACATACTGGTTTTAAAAGCAAAGCATCCAAAAAGAACTTGACTTTTGCCATCTTTAATATGGGTATAATGTCCAACTGATAGAACATTCTAGACTTCTTACATGTGAGGTGTTTGACGATGTACTGCATGTATGAAATATCAAAGTTTAGTCTTTCCTCTCAAAAAACTGTGTCCTTGACAGTTGCCGCATGCACTGGGAGTTTTGTCTGTGCTTTTACTATTTTTGTTGTTGTTTAATTTTTTGGGTTGAATCCTTATTAAGAAAATTAAAACATTGTGGATTGTAATTAGTAATTATTACATGTCAGCTTAGTCCCTGTTATGTGTTTGGTACCGTCAATGCAAACTGATGACTTCAGAACTGTGTTCTGTGAATGTTTGCCTAAATGAAACAATTCCTAAGTAATGTACAGAAGTGGTGTGAATAATAAGAATATCAATTAAAGACTAATTTTATGAA\n>XM_039521359.1 PREDICTED: Mauremys reevesii poly(rC)-binding protein 3-like (LOC120396454), transcript variant X13, mRNA 
\nGAGGGAGGGGGGGGAAAGAAAAAAAGAAAAAAAAAAAAAAAAAAGCAAAGCTTTGCCTCATTCCAGTAGGGCTCAGGGCTCCCGGCCATCTGTCCACCCTTGGAATCAGAAGACAAATAGAGGGACCACACTCACTATAACTGTGCAGAAGGAAATTGTTCGGAAAGTCTGGCTGAGCTTTGCATTTGAAGTGCGGGCTTTGAGAGCAGCTCAGCAGGTTGACGAAGTGAAAAAACTAAGAAACTGCTTTCAAGCATTGAAGATACCAGGCCAGGATGAACACGAAGGACACAAAAGTGACAGAAGGAGGTCTCAATGTCACACTTACCATACGTCTTCTCATGCACGGCAAGAAATATTCACTTACTGTGGTGTTGTTTTTTCCTGTTCCAGGAGGTTGGGAGCATTATTGGAAAGAAAGGGGAGACAGTTAAGAAGATGAGGGAGGAGAGTGGTGCACGAATCAATATTTCAGAAGGTTCCTGTCCAGAAAGAATTGTGACAATAACAGGCCCAACAGATGCGATTTTTAAGGCTTTTTCTATGATTGCATTAAAATTTGAAGAGGACATAAATGCTTCAATGACAAACAGCACAGTGACAAGCAAACCACCTGTGACATTGAGACTTGTAGTCCCTGCAAGTCAGTGTGGATCCCTTATAGGAAAAGGTGGCTCCAAAATCAAAGAAATCAGGGAGTCCACAGGGGCCCAGGTACAAGTAGCAGGGGATATGTTGCCAAATTCAACAGAACGTGCTGTAACTATATCAGGCACTCCGGATGCCATTATTCAGTGTGTAAAACAAATCTGTGTGGTCATGCTAGAGTCCCCACCCAAAGGTGCCACCATTCCCTACCGTCCCAAACCTGCCTCTGCACCTATCATTTTTGCAGGTGGCCAGGTAAGAGCAGACACCATTTTGGCTTCAGCTGGAAACCACACCGTCTTGGCCCAACCTCAGCCAGCGCCTGCATTTACAATTCAGGGGCAGTATGCCATCCCTCATCCAGATTTGACCAAGCTTCACCAGTTGGCTATGCAGCATCCCCCCTTTACTCCCCTTGGGCAGACCACCCCTGGTTTCCCTGGATTGGATGCCACTACTCCAACCAGTTCCCATGAGCTTACTATTCCAAATGATTTAATAGGCTGCATTATTGGCAGACAAGGCAGTAAGATAAATGAAATCAGGCAGATGTCAGGAGCGCAGATCAAGATTGCTAATGCCACAGAAGGCTCGGCAGAGCGACAAGTTACAATCACAGGCTCCCCGGCAAACATCAGCTTAGCACAGTACCTCATTAATGCAAGCTTAGAGATGGCTAAAGTCAGCACCCAGACTGCTTCCGTCACGACCCCTGTTGACCTCAACATGAACCTCTCTCAGTCTGCCACCCCTACCTCCACCCCCACCTCTATGGCTGTCTTGGCGGCAGCAGCAGCTGCCTCCGCGGTTAACGTCAGTACCCCTCCCCCTTTACCAACTTTACCAACCACCCACTATGCCGTTCCTGTCTCCAGTCTGCTTGGCATGAAAACTGTCCCACTCCTGGCACTAAATGCCGCGGCCGCTGCGGGGGCCACGGGGAGTTTATCTGCTTACACTGCCAAAATTCCATCGACGAGTGGGGTTAAGAAATCTGACCGCCAGAAGTTTGCTCCATATTGAAGGGATGAGAAACAAATGCAAGGTTTTTCGAGCTCTACCAAGATTCTGTGGTAGATAATAGCTATCAAGGAAACAATATGGCATATTTTTATTTTCTGTTAAATTGCTAGTGTTAACTGTTGCCACCTCAAATTGTCTTCCACTTTCCATAACTATTAACACGTGTGCACGCACACACCCACCCAAAATGTAGCAACTAGTTCCAACAGCCTCCCTGAGTCTTTTAAACTCTAGTTGGTAACCATACTTAGCTAAAGTTTGTCATGTAACGGGTATGGTTCCCACATAATCTAGCGTGTTTAGCTTAATACAGCTATTAATAAAGGG
TCCAACACTAGGCTTAGAATGGAGACAGATTTTCATTCTGAGGCATCACTGCTCTGACAACAATAATAGAGAGCTGCAGGCTCAAGTGTTGACACAAACAAATGCTGCCTGGTCTAGCCAGCGTATAGGAAAAGACTCCTTCCCAGGGCTAAGTTCTGTCCTCATTTATGCTTGATGCATTTCAGTAGGGTTGCATGGGGGACAGCAAGGACAGAATTGGGACCTTCAAAAAGGGGGGGGAAAAATGATACCTAAGACAAACGTCTTTGGCATTAGAAATAGTTATTAATTACTGCCTAGCGCATCAGTATTTATATCTATTTGAAGTGATCCCTTCAGCTGTGAGACTACTTCTCAGTTGATGTATCCTTCAAATTTGACATTTGTCTTCATGAACATTTTGATAGGCCTATAGCTAGAAAGCACCATGCGTCTCTGAAAGGAAATGCCCATGCATGCCTGACCTCCAGCGGTCATTCTACTAAAGTTCACAAAGCACTGAGACTTGTATTAATCTGCTTGGCATTTACATCTTACTAGATAATGAAGCTAAAAAGAACACCAAATATTCTTCTAATACATACATGCATATAGTCATGGATCGCCCATGTGTATGAATCTTGCTGCACTGAGAAACTCTTAACAGAATGGAAAGAGAGAGAAAAAACATTAAAGGAAGAGAAATATTAAGTGGTAACATGAGGTAATTTTAACAAGCTTTTAAATCTTCTATGTGCCATCCTTATAGCCATACTAATGTATCAGCCAAGCCTCAGTACTCACTTAACCAATCTGTTTCTATAGGATATTTACAGAGCACAATGGTTCATCTTAATTTAGGATACTAGTGAAGGATAATGTACTTTAAGGAGGCCATTTTCAGGAGGGCAGGCTCCCTTTTGGATGCACAATTTGCCCCTATATATTTTGCTCCTGCTTATGACCTGGAGGTGCAACTCCAAATACATGCATCTCGAAGTATTGAATTATGGGTACAAATCAGAGGAGCAAGTATTCAGATTTGTGCCCACAGTTTGTTTTGCAGGCCCAAGATACACTCCCACAGCCAGGCATCAGACTGGCTGAAACTAGACCCCATGTAATTTAGGGCCCAGATCATCCTCCCGCTGAAGTCAATAATAAAACACCCATTGACTTTTTCATGGGAGCAGGGTCACATGGCCTTCTTGGCCAACATGCATTGGCTAAGGTTTACTAAGGTTACTGTACAAATCCTAAATACATTCCAGTTTAAAAGCTTGGCAACTCATTTCACAGTGTAAGTTATGGTTAGAAAACAGGCATTTAAAAATGAACTACACGTACAAGCTATTTCATATCAAATGTTATTTGAAGGTTGTCACGTTGATTGGATGCCAGCCAGCAAACATAATTACACACAAGTTTACTATGAAAGGAAAAATAATTGCAAGCAAACTGAAAGTAGCTGGGAGATGTACGAGCTGGTTGCTAGCTGTTGGAACTAGTTTTTAATTGCATTTTCTGTTTGTCCATTCACCTTATTTTTAGTTTACGTTGCATAGCACTGGCTCAGTAATGCAATATTGTTTTCCTCACAACTTCAAAATTCAGAATCCCATTAGCCTGCCATGTTCATCCACTTTGCACTCCTTGGACACAAAGCTTTAACGAATTGAACTGTATTCGGTGCATTTTAATATAAACTAAAAACACAGAATGCAAATGCAATACTTTTTAAACCATGGTATTTAAAAGTGTGTTGTTATTGTATAGGGCTAAGTACTATTTCAGTATTCTTTGTCATTTCTGTATTTTATAGGCTTTTCTCCACCTTCGTACCTTTGCGCTAAGTTTTGTCACTGTAACCATTTGTAGAACTGTCGTTGTTACAATTTTCACTTAACAAAATGGGGAGGCGGGGCTGTTTGTATATAATGAAGGAAAAACTGGAACAAATGTCATGGTACCTCAGATATTTGACAGCTCTAGAAAACTGCTGTAAAATTGTTCTGGACTAT
TGTAACTGTTTTAATAACTGAAGTAAAAAAATGTGAGAAAACTTGCCTGCATTGAAATGCTGTTCTATGCTAGTTGTACTCAAGTGTAATTTTTTTAATGGTGCGAAGATTTTTTTTTCTTTTTTTTTTCTTTTTCTCCTCATTTTTGTTCCTACA\n>XM_039832640.1 PREDICTED: Medicago truncatula lichenase-like (LOC25491909), mRNA \nATGATTATTTTGTTTCTTATTGTTCTTATTGGGTTGAAGACTTCAGGAATAGGAGCACAATCTATTGGAATATGCTATGGGAGAGTGGCAAACAACTTACCTCCTGCAAAGGAAGTAATAGATCTTTACAAATCAAATGCTCTTGAGAAAGTTGGAGGTGCTAATTTGGAAGTAGTCATATCAGAAAGTGGATGGCCTTCTCATGGTGATGTTGCTGCATCAGTTGAAAATGCACAAATCTACTATGAGAATTTAATTAAGCATGTTTCTAATGGGACTATTAGTAGACCTAATCAAGCATTAGAAACTTATTTATTTGCCATGTTCGATGAAAATAAAAAAGGACCTGCTGAAATAGAGAGACATTACGATGTCTCGTCACTGCAGTCAGAGTTTGTTGTGCTCGAAAGAGCCGTAATGCTTGTTGTGCTTTGTTGTTGCAGGGATAGTTGGTCCGTGGATCTGTCCGTGTTGGCGGTCAGTTCATATACCATGTCTGAAAAGATGGGTTTGGTTTTGTTCAGATCCGTCTCTGGTTTGATTATGATGCTCGCGAATGTATTGCTCCTCCAAGATCATGATGTGCTTCGTAACATGTCTTCTAGGCTAGAAATAGTCATGTACATGTTGTCCATTGTTGTTGCGAATGGAGGGTACGGGTGTTACCGTGTTGGCGGTGCTCAGACTCGTTGA\n>XR_005989539.1 PREDICTED: Vulpes lagopus uncharacterized LOC121497833 (LOC121497833), transcript variant X2, ncRNA 
\nGGTTCTGCGTGATTGGCCCGGGCTGCGGCCGACCTAGACTTAAAGGGACGGCGCCCTCCAGGGGCAGGAGGGAGGGAGGTGACCTGGGGAGTTCGTAGCGGGGTTGGACCACGAAGTTCCAGGGTTCTTTCTGGCGCTGGAAGGAATTTAGAAATCGCCTGGCCTGGTCCTGGTCACCTGTTCTTTCCAGAAGCCCAGAGAGACCGTGCTGCTCGTTCAGCTCCACACGGCGCTCCTCCCGCTTTCAGTGTGGCGGAAAGGCGGAGTGAGGAGTGAGATTCCCAATGTACAGAAGAGGAAACCGGGACCTACACACGGTTGCTTCCCCAAGCAGAGGACTGCAGAGGTGAATGGTGCTGGGCCACCCCCTCATCAGGTCTACTCCTCTTTGGGCTCAGGGCCCATGATTCTAGGCCTGTGTGCAGATGGAGGAGTAGTGCCTGCAAGCAGCCCTCAGTAGGCCTCCCGCATAAATACCTTGTCTCCGTGTCTACTTCAAGGATCCTGAACCCAGATGAGGTGGCCCCCGAGACAGCCATCCAGCCATGGGACCTCCTACGTACCAGGCCTGCACTAAATGAGGAGACGGGCCATAGCACATACATGACACACATAATACGAGGCGGTGCTCTGGAAGAAAGCGAAGGACAAAGGGTAGAAGGAGGGAAGATGCCATCTGTTCTGAGAGCTGTATGAGGTGAGAAGAAGCCACAGAAAAGTCTGGGTGTGGAACATTCCAGACAGGGGGAACAGCAAGTGCAAGGGGCCCTGAGGCCAAAGAATTTGAGGGACAAGGAAGCCAGTAGACCCAGAATGGAAAGAACAAGGGCCAGAGCGACAGGCGACAAGGCAGCAGAGGTGAGAGGACGCTGGTCACGCGGGGCTTGTGAGGCCGAGGAAAGAGTTTGGATTTTATTCCAAGTGGGAAGCTGATGGGAGGCTCAAGGGTGGCGGTTAGGAGGCTGTCGGCACTGCCTGGCTAGTGGAGAACTTTCTGCAGAAGGGAAGCCGGAGGCCTCGTTCTCAGGAGAGGGCAGCTGTCCTGAGCAGGGATGGTGCTGGCCCGGCGGGGCCGGGCGACGGGGGTGGACACGGGATGGAGCAGGCGGAGAGCTGACGGACGCCCCTGTGGGTTGCCTGACATGACGGAGATATCACAGGATGACACCTGCGCTTTGAACCCCTGGTTTTTATGTGACTACTTGGTTACTTTCTATCTTTTTCGTCCAAGAGAGCAGGGACTTTGTCTGCTCTGTTTTGCTCACTGCACTTAGCCTAGACTCCAGTACACTGTAGATGCTTCGTGAGTGTTTGTTGAATGACTGAATGATGGAGATATGGCATTTGCTAGGACTTGAACCCTGATCTTTTGGCTCCAGGCCCCAGTGCCTTTTCTCTCCCACCAGGGTTTTGATGAGGATCAAAGAGATAGGAGTTGTGCAAGGGGGTTGCAGGTGGCAAAACAGCCCACAAGCTGGTGGCTCTGGGGCCATTTACCAAACAGTAGCTCAACAGACTCGCCTCAGAGCCCAGCACAGGCTACAGCCTGTGCTGCCTGCAGGGTGGGCACCCCCCTAAGCCAGCCTGGCCAGCCTCCCCTGGGGAGCAATCCTGCCCCTACTCACAGCCCCTGGAGCCCACGCTCGGAGCAGCTCTGCCCAAAGAGTACACAGGTGCCCAGGCTGATGCCCAGGGGAGGGGACGGTATACTCTGCTCTTCGGACCCCAGGGGCCTAAGCCAGCCCCCCACCCCCTTCAGGAGATGTGGAGCAGATGTGAAGGGAATGTAGGCCTACCCACAGGCTCGCTCCCCCAGGCCTCGCCCCAGGGAGGCTCCTCTGGGAGACCTCTCCTTCCCCTGGGCCAGCTTGGGCCCCCCTGTTCCTTCACCCTACCTCATTGGTGCCCTGGGGCAGCTGCCTGCCCTGTCCTGAGATTTGGGGTCTCCACCGAGGCCCTGGGAGTAAGAGTCATCCTTGGCCACTGCTGGGCGGCTTT
GTGGAGACCGAATCCTTTGTGATTCTCCTGACCCCTGTATTGTTCTCCCCAAGCCCTTAATCCACTTGCTACCTAGACATTCATTTGTGTGATGAACTACCTGGTGTCAGCTCTCTGGGTGCCAGGAAGCGCCTTCACCAGGAGATACCCAGCCCCCAGCCTGGGCTGGTTTTCACAGGAGGCACCCAGTAAATGTTGAATGAATGGCTGAAAGCGCTTAGCAAGCTAGGGAGCAGGAGTGATGGGAAAGTTTGGGTCATGAGGGTGGAACAGTAACTGTTCTGTCCACAGGCCGTGGGGGCAACACAGCAGGAGGCCACCAGCCCATGGCTGTGGCTGGGGTGGGGGTCGGTGTAAGCTGAGCGGCCTCCCCGCCCCACTTCTACACCCCAGCACTTAAATAACAGTAATAACAGCCTTTCCATCCATCCCTGAGTCTGTGCAACAAAATTACGAGGTGAGGACTACCGTTAATCCCATTGTGAAGATTTGGAAACCGAGGCTCAGGGAGTTTAAGGAATTTATCCAAGGTAAATAAATGGTGGGGCTGGGATTCAAATCCAGGTCTGTCTGAGGTCGGGTCCACCAGAGGGTTAGCCATGGCATCCTTCTGCTCCTCTCCTCACCTTTAAACTTCTCAGCCTCCCCCATCCACATCTGGCCTCCTCCAGACTCTGCTCTGTCCTCAGGCGCCTCTCAGAGCCTCTGTTTATCCATCTGTAAAATGGACACACTAACCCCTGCCTGTTTTGTAGTGAAGGTCCGTGAGGATGGGGATGCTTTCTGTCAGACAAGGGCTGGGCGAGCTGGCACCGAGGGAGTGGAAGCCACTGCAGGGTCCCGTCCGAGGCCACCAAGAGGGGCCGATGAGCAGGGCCCTCTCCCAGCTCTGTGGCTGCGCACGGCGGGCGAGGATTTGTTTGCAGTGGCTCCCTGGATGAATTCCCGGCAGACCTCTCCTCTTCCCTTGACATTCCTGCTGGAGGCTGAGTCTGCGGTGAAGGCCATGCAGCTTCTCCCATCCCGGACCTTGCTCCTGAGGTGGCCTCCACATTTTCCCCTTCCTGCCCTTATAGGTCTCATCTCTGCGTGGTTGCTTTAGGGCCTCAGGGCAGGGCAAGGTTAGGAGCCTCCTCTGCGATCTGGAAACTCTGTGCTTCCCTTTGGGAAAGCCTTGAGGGAAGGCAGATGTGTGTGAGGGAAGTGGTTTAGGAACCACATCTGCCCTTTATCAATCTGCCTTCCTCACTAGACTTTTGGTGCCTTGAGAGTGGGGGCTAGTTTGTGGGTTTTCTTTTGTTTTACTTTAGGGTTTTTTTTTAAGATTATTTATTTATTCATGGGAGTCTCAGAGCCCAAGTCATAAGCAGAGGGAGAAGCAGGCTCCCTCCGGGGAGCCTGATGCGAGACTCGATCCCAGGACCAGGGATAGCAACCTGAGCCAAAGGCAGACACCCAACCAGACGCTCAATGCCTGAATCACCTAGGTGTCCTGGTTTTTTTTTTTTTTTTTTTTTTTTTTAAATAAATCTTGTATTCATTCACTGATTTGTTAGGTTGTTCACAAAGGTTTATGGAGCACCTATTCTGTGTTCTGAGATCAATTCTGAGCTCTGGAGATGCAGCAGCTAAGAGAACAGACTATAGGTCCCTGCTCTCAGGAAGCCCACAGTCTAGGTGGGAGCTGGACGCTCAAGAAGGAAATCAGGCCCTATAAGCAGTGAAGAATGCCCTGGAAGGGATTAACGGGGACTGAGAGGATTACTGGAGATCCTGGCGCCCAGTGTAGGGTCTGGCAGAGAATTGGCACCAAAAACATTTGAATTCGAACTAAAGGGCCTCAAATCAACTTGTTAAGCGGCAGGATCAAGGGCCTCACCACCCCTCTCCTGTGTAGAGAGGAGCTCTTCTGGCCCACCTCCTTAGCTGCACAGCCTTAGGAAAACTCCTTCACTTCTCTGTGCTTCAGTTTCTTCATCTATATAATGGTACTAAGTGTT
CCCTGCCTTTTAAGATTGTTCCAAGAACTAAATGTGCTACAGGCTTGAAAAGGGCTGAACACTCAGCCTGGAATATCTTCAGTGCTCAATAAATGAAAGGGTGAAGATGAGGATGAAGAGGATGGAAGCCAGGAAAATGGGAGGAGTGTTGGCCTGGCTCCCCTTGCTCTTGGAAGTCGGGGCTCTACTCCGCCTGGATAGGCAGTTTCAGGAATGGCCACGAGATGGTGCCCAAACACCAGTTATTCAGGAATCTTGATTTCTCCGCAGATGAAGCTGTTTAGGGAAGTAGGGGCCAGAGAAGCAGGTGCATTCTGTGTTGTAAGATGGGCTGGGGTGGGGATTTTCAGCTACTTGAAATCCAGCCCCTTCCCACCATTCTCTTCCTTCAGTTTTCTTCTTGGGGTTCCTGTCCGTGTTTGGGGGTCCAGCCCTCCCTTGCCCCTCAGGCCCCCAGCACTGGAGTCCAAGGCTTCTGTTGAGTAGGTCCTGGTTCTTGTCTACCCAATGAGGGCACCCTGGGTCCTCAAGCCATCACTTCTTCCCCTTCTCATTCACGAACCAGGCAGGGGTACTTAACTGAACACTTCCTTGGGGGCCTTGAAGGATGGAGAGCCAGAGGAAATGACCCTGTTTCTGTTCATCATATCCTGGGGGGGTGGGAGTGGGGGGAGGGGGCAGTAGAAACCGAAAGAGGGAAAAGGAAAACATGCAACAGTTACCAAAGACCTCCTTCTCATCAGCACGTAGGAAACAGCCTCATTTCACACACGCAGGAACCGAGGCTCAGAAGCACTAGGCCACACGAATGCGTTGCCCTTTCCAAGCACCAGGGGCTCCTTCGCCAGCAGCGAGGTGTGGCCCAAAGTGAGTATATTCCTAAATTCATTCCACAGCATCTACTGAGCTCTGCAGATCCAGCGAGAATCAGACCTGGCCCCTGCCCTTGGGAGCTGGGAGTCTGGAGGGAGATGCTGGCAGAGAAGCACACAAGGGCAGCTTGTCCCCGAAGTCTGTGCTGCACCGCGGTGACCCAGAGGCTGCTGTTGCTGGTGCCACCTGAACAGATGGGGGGGGGGGCAGGAGGGATGGAAGGTGTGAGAGACTTTGTAGATTCCATGGGGACCGAGGGTCTGTGGAAATATCATTTTCAAGAAGGTGAAATCATGACCCTCATACAATAAAAACAAGTGAATGCACGTCCAAGATTTCCTTTAGCTCATTAATTGACAAGGAACCAGCAAAATGTTAACACAGCTCAGATGAGGATTCCACTTCAGGCATTTACATTCTCTACTGGACAAAACTTCTTTGTGTTATGAACAGGACTCATTTGCTTGCTCTTGGGCAGGAATCATTTCCATGATTATCTGTTTTCTACAAATCGCCTCTATCCCTACAGAGTTATAAAATCAATCAAATAATCAATAGCACACAACCCTAAAGAATCAGATGATCATCCAGAGGACACGTAGCTGACACCCAGACCTCCTCTGAAAGGACACCCAGGAATCGCTCAGGCCTTTTTCCAAGGCTTTGATATGTTTTCTTGACTGACCCCAGAAGGATCGGGATAAATTAGGTAGCAGGTGTTCCAGAGGAGGCAGGTCATCTGGGTTGTCTAGTCTCAGCCTTCTGGGGTTCCCTTTCGGCTCCCAGGAGACAGACTTCCCAGTCCGGGGGGAGCTGGCCCCGCTCAGTGCCCACCAGCAGGTGGCGCCGAGGCAAATTCGCAGCAGGAACCTAGTGGGTTCTGGGGCTGGGAACAGGGGGGCAGCTCCCAATTTTCCGCCATTCCTGGTCTCCAGCAGTCAGGTTTCACGATTTCAGAATTTCAGAGGGCCCTTCCCACCTAGAGTTGTTGGTTTAGTCATTCACTGATTCAGTTTTGTTTTTTTTTTTCATTTGACAAACGTGCCCAGGCCCACAAGTCAGGTTCCCGAGTTTCTCCTTCTCCAGACAGAAACTCACAAGTATCAAAGAATCAGTCCTTGTCTTTG
CTTGTCTGGCTTTGCTGCCAGGATTTGGAGCCACCTGAAATTCTGAAATCTCACTCCACCCCACTCCTGCCCTGCCTACCAGGGTGT\n>JQ061302.1 Uncultured Pneumocystis clone CS13 large subunit ribosomal RNA gene, partial sequence; mitochondrial \nTGTGAAATACAAATCGGACTAGGATATAGCTGGTTTTCTGCGAAATTTGTTTTAGCAAAGAGTTTATAATAACATTATTAGTGGGTATAGCACTGAGTATTTTTAAGAAGGAGTACTAGTAATACTTATTTCGAATACTTAATCTCAAAATAACTAATAAGTAATTAAAATAAGCTTTCAAACTATATGCGATAAGGTATATAGTCTAAAGGGAAACAGCCCAAAACAGTAATTAAAGCTCCCCAATTATTATTAAGTGAAATAAAGGAAGTTATTCTTTTGAGACAGTCAAGAAGGGGGCT\n>MF242562.1 Uncultured bacterium clone denovo36630_N25_23851 16S ribosomal RNA gene, partial sequence \nACCAGACTCCTACGGGAGGCAGCAGTGGGGGATATTGCACAATGGGGGGAACCCTGATGCAGCGACGCCGCGTGGGTGAAGAAGCGCCTCGGCGCGTAAAGCCCTGTCAGCAGGGAAGAAAATGACGGTACCTGAAGAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGGGCGCAGACGGCGATGCAGGCCAGGAGTGAAAGCCCGGGGCCCAACCCCGGGACTGCTCTTGGAACTGCGTGGCTGGAGTGCAGGAGGGGCAGGCGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCGGTGGCGAAGGCGGCCTGCTGGACTGCAACTGACGTTGAGGCCCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCGGGTACC\n>XM_044441890.1 PREDICTED: Varanus komodoensis zinc finger SWIM-type containing 5 (ZSWIM5), mRNA 
\nAGATTAGGTTTTCTTTCCCTTTGTGTGTGGCAACACCTGCCCAGGGAGTCTGTGTGTATCAAAAGAGCAACAAAAAGTGGGTTTAATTGCATGCATCTTCAGTGGAGGCTTTCTGGCACTTACAGCACAAAAGGCCATTACTGAGCTGTTTTCAATGGAGACTAGGAGTGCAGGACTGAGAAGAACTCTCCACTATTCTCACAGGCAAGCAAATCACTTTACAGGAGCATTGTCATGTGGAAATGAGTTCATGAGCCCATCTTCTTCCAACTGCAAGGTCAGGGAGAGAGCAATTGTCAGTTTCAGCTGGCTGGAGCAATTGATCTGTTTGCTTGAAAATGTTTGCTTACCTCCCTTCCCTGCTGTGCTAGTATATAGATATCTCTCTGTGTGTGTCTGTGCACAGGCATGTGTACACTCCACCATATGCTGAATGACTGAAGTTCATAACTATATGTTAGCAGTTGCTTACCATATGACCATTAGTGTGTCATAGGGATGTACAGTTTTTGTTAAATCCATTCCATCTGCATTTCACAGATTGTGAGGTACTTTTCAATCTCTCCTCCATTCTCATTGACAGTGTGTGTGTGTGTGGGGGGGGAATTGTTACAAGTTCCTGAACTTCTTGCATACATGTGCTTTTTTGCAAATCTCCACTGTTAAAAATGCACAACCTCCTCCAGAATGTGCATTTGCATGCTTTAGTATGCGGGGAAATGTGCTTCTTTTCTTTTTCTTTTCAACAGGAATGTTTGTGCAAAATTCTGAAAAGTAAAGTAGTGGTTCACAAGTCCACAGAATCCATGTGATTCAGAAAGGGCTGGTAGACTGCAGAATCTGGGGAATCCTAGAAATCTGAACTCATTTAAAACCCATGGCAGGTTCTCCAATATCCCTAGAGTGTTATAAATAACTAATAGTACAGCAACCTTAATTTAATGCTAGTTAAAGCTCTTTTTGAAGAGGGAAAATCATCAAGGTCCCCCACACACATCCCCAGTCAGGCTTTCAAATATGTTTTTGGATCATGGTCAATACTGTCAGTTCCTGTGTTAGGTGTGTGTTCTTTCCCCACATATTTGCATCTCTGAAGAATTATGGCTTCTCATCTTAAGATGAAAGGCTCAAACAGTGATGCAGCTTTGGCTGGACTCTGGGGCCAAAGTCCAGGGCCCTGCATTCCAGGAAGGCCTGAATAACCACCCAGAAAATGTCAGGTGATGAAAGTCAAAGAAGCAAGTTCCATGTTATTCCTGTAGTCACGATAATACAAGGATTTCAATATATTTTAAATGCAAAACTGCACATGCTCTGTATTTTATTACTATTTTTATTATGGAGGGCAAATAGCTTTTTCATTGTTCTAACACAGCAGGTGTGCAGAAGCAGTTGTAAAGCGTGGAATAGTGGTGGTGAAGGAGGAGAGAGTCGCATGCTTCACAACTTGAAGTAATACAGCCATTTAAAAGGGGGACATAATAAGAACTGCTCTCACTCTTTGGCCTCACAGGGCATCCTGAATTGTGCTGCTGGTCAAGACTTTTGTTCTAAGATGAAAAGCTATATTCTTCAGATATTCAAATATGCGGAAAAAGAACAAACAAACAAGAATCTAAAATGACTAAGCTGCACCCCTGTCTCAAACCCAGGCAAACCATTCTCCAGATAGCTCATGATGTCCCATGATTGACCTTCACTCTGGTCTGGAAGAGTGATGTGTTTAGGGAAGGGGAAATGCTGTTCATTTGTCCAACAGAAAAGAAGAAGCTGGTAAAGTCAGAAAGAACCATGTGATCTTAGCCATTCATCACTACCACATTTTCTTGGTGTCAGGCAGCTTTATAATCGGACAGCAAGCTGTTATGCAGCAGACAGTTGAAATTGGGTTAGTCTGATTAGATGTGGGTGTTTTGGAGCTGGAGGCTGAACATGCTCAGTAAGATGATATGCTACCTCAGGGTGACAGAGAAAGGCAGAAAGCCTCTTTGTTATGGA
GCGGCAGCACCTTGCTGGAAGCATGCTAGAAAGTATCAGCAATGCCTGCTAGAAACAAAATATATGGGGCACAGCTTTCTGCAATATTTTTTTAAAAAAAATTCAGATTCTGTAACAAAAAGAAACAAATACTGAGCAGCATGTAGCTTGCTGCTTCTAGAATTTATACTGCTACTACTTAAACAGCCCCACAATTTGGATAGCTTTAAAGGGGATGGGACAAATTTATGAAGGCAAAGCTATCTGTGGCTACTAGTCCTGGTGGTTGTTTGTTACCTGCAGTATCAGAGGCAGTGTGCCTATGCACAGCTACTGTTTGCTTCTGTTCTTTAACCAGTTACTGATCCATGAGAGGACCATGATGCTAAGTTTGTTCAGGAACCTTTGGTGAAGGACTTCGTGAAAAGTGCTAGAATACACTGCCTGATGAATTGTGATGTATCATTCAACAATTTGAATATGTCAGTTCTTGATTTAGGATACAGCCTGCCTCCTACTGACAGCTCAGGGCAGACATCCATATTCATCTGTAAACATAAAAACAGAAATTTAGATAAAATGAATAGAGCCTAGCAAATCTTAGAACACTACCTTATATATCAGGTGCTTTTAGGCATCCAAGGAAATAAACTTGTACCAGATTGGGGAAGCGAGATAGAAGAGAAGCACTTCATTCCCCAAAGCCAAGAAATTATATTATTTATGAGTGAACATAATGTCTTACAGAATAGCACCAACAGAAAACTGGTATCTTTCTCGAAGTGCTTAAAATCTAAATTAAGGCCACAGCTTTTGCAGGTGGGCAAAGAGAGAAAACAGAATGAAGGCAATGAGAACAATGGTGTGAACCCTCTACCTTTTTCCAAAAGTTCAAAGTAAGTTGTTGCCAACTTAATTTGCACATATGTTATAAGAATCATGAGAACAATTGGGATAAAAACTGTTTGGCATTCTGAATTGTTTCCTTCTCTTATATTTCGTATTTGAAAGTGTCCAAATTTGGCCAAATGCACATATTTCTAATTATGTAGTATTTTCTAAGCCCCATAATTCAGGATACTCCATTATTCAGCCCCATAATTCAGGATACTTGCTCATTTTCCAGACATTCACACACCACTCACCACTCACCAGGAGACCATTCTTTTCCTACATTCCATGTTGTATATTTGGGAAACAAACAGGCTCAAAGTATTATCGTGGCATTTTAATTCCATTCTTCTTTGGCATATATGCTTCCCTCTTTTATACTCACAACACCCTGAGCTAAGTTAGGCCAACCAGTCTAGATTTTACTGAAGAGAAAGGTATTTAAAAATAAAATTACTAAAATAAAAGACAATAGTAACAGGCTCAAGCTTACAGTAAGTTTCACAACTGAGTGAAGAATTGAACACAGGTTCCCATGGTTAAAGTTCAGCGTGTTATCTGTTACAGCACACTAGCTCTTACTACTGCTTTGACAGCTGCATCTGTAAGTGTTTACTGAATGAACCTGCATTGTTTCACTTTCAATGAACTTTTCTTTCCTGTACCAGATTCACATTTCTGGGGCTTGAAGTACCTGACAGCCCAGTTTTCTTTGTGGGAAGTATGGTTGGGGCAGTAACCTTTCGTAAAACATGTATTCCTATATTGGCTTTGCTAGTGATTATTCAAAAGTATGACTACTGAGGCAGCCAGTTGAACAAAAGCATCCCATGTACTCATGTAAATACTTCAGATAAAATAAATATCCTGATGAACTTTTTTCCAGAGCAGTGTTTAATCTTTGGCTAAACATTTGATAAATATTTTACATTTTTTCCTAGTTGATATTAAATATATGTGCTGTCATGAAAGCTAGAAATTAAACTAATGCTTGATTTAAAGCCTAAACATCAGATAAACTTGGCAGACTCCAGAGATACTTGCGCAAGACGTGAGTTGTGTCCCTTTCCCCTTAGACTGTTTTCCAGCTGTCATCAACACCAGACCAAGATATTTTAAGGTAATTTAAT
ATGCCTAAAAGCCAGTGTTTAAAATGGAGCAGCTACTCAGTTGGTTCCTGGTCTATTTTTCTGATTTGCCTGCAGACACAGATCACAGAACAAGGTTTATACTTGGTTTGGATACTGGTTGGAGAATGAGAAATAAGCTGTGGGCTTACACACTTTGCTTTCCCTTTGCAAGTAGATTTCTTTCCTTGCCCCCTGGCTTCTACCGCATCTTCTTCATTCTCTAACAATCAGCCCTTCTCCCATCCACCTATGAACCAAACAAATGCATACAATATTTTACTTTGAATGTAATATATGCAGGTATTGATGAATGGGAGGCAATTAAAGAGGAACTGATTGAATTTTGCAGCAGAATCTGGATAGGAATTGGGAAATTAATTGAGGTGATATCCTGACCCATCCTTGGCTGGCTTTGTAATTTTCAATAAATAAATACATAAATTTTAGGGATGTGTGTAAGAGGACTTATTTGGAAAAGTTTCCCAAACATTGTTTCTTGTTTGTTTTTTCACTTCTGTTCACAGCCATTGCAAAGTAATTTAAAATAGTTGATGCACAATTTAGCTAATTAAAAATTATATGGTTTTATAGTTGATTAACCAACTGATAAATTGCAGCCCTTGTATTTGTACAAGCAGACAGTGTGACTATGGCCAAGATAACTATAGTATCAACTGAGGTATTGTCAACTTGGTAAATGTCTGTAAGTTTCTATCCCTGATCAGATGTAGTCTGTAGGCTACCCAGTATAGCCTTAAGGGACAAGAGCCTCCACGACTCTGGCTGCTCATTTGCATGAAATATTTCTTTATAGGTGGTAAGGATTTCAGTTCAATTGCCAGTATTAAAATATGAGTGGAAAGAAATCTAGTAATGTGGCTAAAGATTATTTTTCAAAGAACAGGTAAAATATAAATGCCTTTGAATTTTTGCCTTTTTGAGTGTTATCCTTTAACAAAAATTCTAATAGAGACTCTAGAATGAAATTGCTAAATTAGAAATTATCAAAGGTTGGATTATGTTGGGTTAGACCTGATCTGAGATATTGGTGGGGTTTACATGATCATGAGGAGAAGAAACCACAGTGGCATCTTTTCCCTGCCACTGTGCAAGGCAGCCATTCCTACGCAATTATGGTGTGTGGGTTGCTCTGTTGTCCAAGCCCAGTGGGGCAGCTTTCAGAGCATGGCTTGTTGTAGGTTTCTGGGGTCGTGGTGAAGCCACGTCCTCCTGTGCACCTTGCTTGATTTGGGCAACACAGCAATGGATGTGCTGTGAGGGTAGTTAGGTAAACTGTGCAGCGCACAGCTGTGTCTTATTTTTCCTATGATCTTGCCACAATAAAAAATCTACTAGTCTTTAATGTGCTACAAGTCTGCTGCTTTTGCTCAGCAGACCTTTTTTAGGATTTGTATGATGAACACCTCACAGGAAGAATGGAGCTCTTGGCTAAGATTTTCTTGTATAAAATGCATACCTTTGTTCCTATCTGCTCATGAAGAATCATACAATGGGATATCAAGAGAGGAAAAGAGAGGAGAGTGAGGCTGTTGATGATAATGTTACGGAGTCCTTTATACTGAGCTGTCTTTACCCTCAGCATGCAGTATCATTATGTAGGGGTAAAGAAAGGAAGTTGCTCCTGCTGTTGCAAAGGAATAATTGTACAGAACTGGGAGTTACCATGCATATTGGTTAGAATGAATTAAATGAAGAACATGGATATGTTGATTGGACAGGTTTTGAATGGAGGTGGTTTTTTGGGTATATTCCTGGTTTTTAGATCAGTCTAAGGAGTCTATGATTTGTTTAGAAGGCCTTTAGAAAAATCTAGTTCCTAAAGCGAAAAAGAAAACCCCTCTTAGTACTTAATCAGATCTTGATGTGGGTTTTGGCATCACTTTAAAGAAGATGGTTTTGATACTGTTGATTAAAAACTTCTGGTAGAATTTGACTCAGAATGGTTGTGCTGTTTGGCAAGCACACAAGGGCTATATGCA
GTTAATGTAGTTAAATAAATTTTCTCTTTTGCTGTCTGTAAGCCTTTCAGATTCCTCTGGTATGAGTTAACATTTGGAATCATAAAAAATTTCTAGCAGTATAGTCAATAGTCATCTGAGAGGAAAATTACAATGTGGTTGAACTTGTGCGGTGGGAATCTGGACTCACAGATAACTTTTTTTCCAATCATATTTTAAATTTAGGGAAGTCATCTGATATTTCACCTTACTGTTTTCATATTTAACTAACTGGAATATTAGATGATGACTATTCTGTATCCACACATTTTGGGAACTATTTTCCTTACATTTTGTTGGTTGGAAGCTGGTGTGTTGAAATATTAGTGAATTTTCTGCTATGAATTGTGTGAATTTTCTGTTGACCACTTTGGAATGTCTTGGCTGTCAGTCTTTCCCTCCTTCTTTAGGACAGCCAAGACCTGCATGCCACATTAACAAACATTCCTTTGCAGTTACCAGAACTGAAAGCATCTCATTTAGTTCCTTTGAGAGCCTAGTGGGTTGAAGAGCTCTTCTCAAGGACTGTCTTGATTGCATAAGATGATGATCAAGTGTTGGTACCCCCTTTTTTCTGGATCACCATTTATTTTGACTGCTGTCTCTCTAAGCATGTGGATCTGTGCTGTGGAGTAATGCTCCAGGATAGCGTCTATGTACCTTATACAATACTGGTACAAAGGTGAATGCCATTTTGGTCTGTATGTATCCATGATCATGGTCTCTAGTTCTAGCCTCCTGTAGTAAAGATCCAGGAGAGAGTAACAGCATAGATTTTTCCTATTACTTTTGTCCTGGTAAAATAGCAGTTGAAAACTGGGTTTTCAGAGTTGGGGTAGGAAAAGAAACCACAGTTGGACCTTATTTCCCCACCTGGGCCAATTGCATACTGCTTCACTTCCATAATTATCCATGCCAAATGTGGGTTGCTGTGTCATCCAAACCTGATTGGGGGGGGAGGGGGGAATGTTCTAAAGCACTTGAGAACCCTAGAATAAGCAAGGTGGTTTGGAAGTCATCTCTGTGGGTCTGGTCAAGCCAAGGCACCTCCCTTCAGATTCAAGCATGCTCAGAATGGAACAAAACCACTTGTCAAGAAATGATATACAGTTTATGAATACAATGGTGAAATACGGATGCAAAACATAAACTAGCAAACAAAAGATTATAGTCCCCTTATTTGTGGCCATTTGTTGTTGTTCCCTAAGTAGGTCAGGGATGCTCCATGGGCTTCCAGAATTGCCTGAGTGAATGACTCATTAATTCTTCTCTTCAAGCCAAGAACAAAAGATAATGCCTTTTGGCACAGATTTTATAAAGTTCTTTTCTCACCTTGTTTTGTAGGCTTTCAGTACAAACAGCTTTTAATTTCATTCCTGGGAGACAAGAAAGGACAAAGCTGCTACAATAAAGCAACAGTTTTTGTTCTTACAGTAAGAGCAGGGCTTATCTATTTATGTTTGCTGTTATAACCTTGCATTTCTTATACAGATGGTTGTTAAATTTCCTTGGAGTTGTTTCAGTGCTTCCTTTATCTTAAAGTTTCTACATGGCTTTAATATTTATATATTACTTTCCTCAAGAGTATATAGGCATTTATGTTACCTCAGTAATATATAGAAATCTGTATGGTAGGATTGAATTATTATTCCTAAATTGCAGATGTGATAACTGAGATTGAGAACAATTTGCTTAAGGGCTAATGTAGACATCTTGGCTGCAAGCCCATCTGTTACAGTGTGGATCGTGCAGCTTTCTCATAAATCAGGGGGGGAATTAAGCACAATTTGACATGGGTGGATAAGATGTATGCTCAACTTTCCTGCTACTCTTTCTCTGCTGCCATTTATTATTTAAAATATTTATATGCCATCCTGTCACGAAAGCCTCAGGACAGCTTACATATATGAAATAACATAAAATATAACATAAATATTTATTTATTCCCCTTCTTGTGGCTGCAGTGTGGAAAGTAGCCATCA
CTGGGAGGAAACATCTGAGAAGAAGCATTTTTGTGTGGAAGTGTACTTTATGGAAAATTGATATGATCTACATTGTAGATCACTTACTTCATTGTCCACGTTCTTAGATGGAAATACACAGAGAATTGTGTTTTTCACCTGGAATAATGAAGGAAAGAAGACATTATCTACAATTTTACTTAAATTGATTGAGGTCTTGAAGGGAAGGGCTGCATAAATATTTTAATGCAGTGTGGTTTTGCTTTCGTATTTGCTAAAATGCATTGGTGCTCTTTCTCACTCAGTTTGTGTCCATTACACCATCACAAAATAAAGGGTGAATATTTTTGTTTCTTTGCTTTGAACTGTACCATTTTCTGACACAAAATAATTTTCTGTTAAGTTTCTGAGCCATTCTAGATGTGTCTTAAGATTGGGTCTGCTCAGCTGCAGCATTTATATGTCATGGGAATGAATATAGACTATTTTACCATAGCAAGTTTATATATAATTTTCCCTAGATTTGTGTTGTCTTTGTTAGTGAGGCATTGTACTTTTTGTTCTTTTTCCCTAAGAGCACAATCTTATGCAATTTTATAAAGAAAGTATAGACTGCTGGGTGGGGCATGCTGGATGCTATAGGCCTTTTTCTGGCTAAACTTGCATAGGCTTGTGTCTTAAAGCAATGAAATATGAATTGATATGTTGCAATGTTGTTCAACGGCAATTAATGACCTTTTAAATCAGATTTGGTGGTGTGTTATATTTTGCATGGATATCTGGCAGTTGACTGATTTTTGCAAAGCCTACCTTTCCCAAAAATACTAAACCATATTTTCTGGCAGAGAAAATGTCCAAGATGCAGCATGATATTAAACCCCTTTTGCCATCAGATGAAGTATCTCTCAGTTGCAGCCAATCCTTGCTTATTTGGCAATAAAGGACTGGAAGGAATGCAGTTACGTTACAGGGACATGAGACTGAAAAGGGAGCAACCACTCTTTTCTCCAAAAGTTTAATGAATTTGCCCATGGGTTTGATAGTAGCTGAAAAGTCTGAGACAATTTTGGAGTGGGTCTTATGCTAGTCCAACTGATTTGAAAGCAAATTGAATATTTTACATTCCGTTGAGTACTACAGTTCATTCAGCTTGGAATCATTCTAAGCTGGCTAAAGAATGCAGAATGTGACTGTTCAACTGGAAGCAGCCTTCATGCTGGGTAGATAATTTTCTTGAGCCCTGAATATATTTTGGTTTTGGAGAGAGGGTACTGCTGCCAGTGGCTATGACCTGTCTTTTGTGCTCAACAGTTTCAAGGAGGGTAATGTGTGCATTCTTGTAAGCATTATTGAAGCCTGAGCTTAGTGGTGTTCTATTAAGATGAAGTTTCCTTGCAAAGCTAAATATCCTTCTCCCTGTTTTATTCTCCTTCTCACAGGATTCCACCTGAGTGGCACAGTTACAGAGCCTGCTACTTCAGCAGAGCCAGAAATGACCTATAAAGTGGCCATCAGCTTCGACCGATGCAAAATAACTTCCGTGACGTGTGGTTGTGGGAACAAGGACATTTTTTACTGTGCTCATGTTGTGGCACTCTCGCTGTACAGGATACGAAAACCTGATCAGGTCAAACTCCGTCTTCCTATCTCAGAGACCCTTTTCCAAATGAACAGGGACCAGCTCCAAAAGTTTGTTCAGTATTTGATCACAGCCCACCACACTGAAGTGCTCCCAACAGCTCAAAAACTGGCTGATGAAATTTTGTCCTCCAACTCTGAAATCAATCAAGTTCATGGTGCACCAGACCCCACTGCAGGGGCCAGCATTGATGATGAGAATTGCTGGCATTTGGATGAGGAACAGGTGCGGGAGCAAGTGAAGCTGTTCCTCTCCCAAGGAGGGTACTATGGCTCTGGGAAGCAACTCAATTCCATGTTTGCTAAGGTCCGTGAAATGCTGCGCATGAGAGATTCCAATGGGGCCAGGATGTTGACACTAATAACAGAGCAGTTTATGGCAG
ACCCACGTCTTGCTCTTTGGAGACAGCAGGGAACAGGCATGACAGACAAATGCCGACAGCTCTGGGATGAGCTGGGGGCGCTGTGGGTGTGCATTGTGTTAAACCCACACTGCACGCTGGAAGAGAAGGCATGCTGGCTGCGACAGCTCCGGAAGTGGGGAGATATGGATGTTTGCCCGCTGGAGGATGGGAATTATGGCAATGAACTTCCCAACATCACTAGTGCACTTACTCAGAGCTCCAGTCACAGGCAAAGCTCTTTAGCAAGGCCGAGACGCACAGTGTTCACTCGTGCCATCGAAGGTTGTGATCTGCACTGGCAGGATAGTCACCTTCAGCGGATAATCAGCAGTGACTTCTATATTTCTCCCTCTTACCAAAGGGATGGAGAGGGCCTTCTCTTCAACTCGCAGGGGCAGCCATTGTGGCTGGAGCATGTCCCTACAGCCTGTGCCCGTGTTGATGCCCTTCGTTCACATGGATACCCCAAGGAAGCACTCCGTCTCACTGTAGCTATAATCAACACCCTGCGATTGCAACAGCAGAGGCAGCTGGAGATATACAAGCATCAGAAGAAAGAACTGCTGCAGAGAGGAGCGACCACTATCACAAATCTGGAAAGTTGGGTAGGGCATCCGCTCAATCCCATTGGCTGCTTATTTCTCACATTGACCGAAGCATGCCGAGTAGAAGACGAGAACTGCCTTGAAATTTCAGATGCTGGTGACCCGAAGCCTCCAGTGTATCAACACGTGCCAGTGGCCAATGGCACTCCTGAGAATGGGGAATCCTACCTCTCCCTAGCTCTGGAAGTAGCACTGATGGGAATGGGGCAGCAGCGGGTGATGCCCGAGGGCCTTTATGCTCAAGACAAAGTGTGGCGGAATGAGGAGCAGATTATTGCCTGCCTGCAGGAGCTGGAGCTGGATGCCGTGCTGGTGCAGACACTACGCAAGCAGTGCATCCTGCTCCTGGAAGGTGGCCCCTTCAGTGGCCTTGGCGAGGTGATCCACCGAGAAAGCGTGCCCATGCACACCTTTGCCAAGTTCCTGTTCTCTGCCTTGCTGCCCCACGATGCTGACCTAGCCTACAAACTGGCACTGCGTTCCATGAGACTTCCTGTTCTGGAAACAACTCCTTCAAGTGATGTCACACATTCTCACCATCTGGTTTCAGTGGTGCCTAGTAGGTACCCACGTTGGTTTACTCTGGGACACTTGGAATCACAGCAGTGTGAGCTGGCTTCCACCATGCTGACAGCAGCCAAAGGTGACATGCTGCGTCTACGGACGGTCCTGGAAGCAATTCAGAAAAACATCCACTCTTCCTCCCTGATCTTCAAACTGGCACAGGATGCCTTCAAGATTGCAACTCCTGCTGACAACAGCTCTGACACAACCCTGCTCAATGTGGCACTGGAGCTTGGGTTGCAGGTGATGCGCATGACCCTATCAACCTTGAACTGGAGACGGAGGGAAATGGTGCGATGGCTGGTGACCTGTGCGACAGAAGTGGGTGTTCGGGCCTTGGTCAGCATACTGCAGAGTTGGTATACCCTCTTCACCCCCACTGAAGCCACCAGCATAGTAGCAGCGACAGTGATGTCTCATAACACCATCTTGCGCCTCAGCCTGGACTATCCGCAGCGAGAGGAGCTGGCCAGCTGTGCCCGTACACTGGCCCTCCAGTGTGCCATGAAGGACCCGCAGAACTGTGCGCTCTCAGCCCTGACTCTGTGTGAGAAAGACCACATCGCCTTTGAGACAGCCTACCAAATTGTCATAGATGCTGCTTCCACGGGCATGACTTACTCGCAGCTTTTCACCATTGCACGGTACATGGAGCACCGAGGGTACCCACTGCGGGCCTTCAAGCTAGCCTCGCTTGCCATGACGCACCTCAACCTTGCCTATAATCAGGACACACACCCTGCCATCAATGATGTGCTTTGGGCATGTGCACTCAGCCACTCCCTGGGCAAGAATGAGCTGGCAGCCATT
ATCCCGCTGGTGGTGAAGAGCGTTCACTGTGCCACTGTTCTGTCTGACATCCTACGGCGCTGCACCATGACAGCACCTGGTCTGGCAGGCATTCCTGGCCGCAGGAACTCTGGGAAACTGATGTCAACGGACAAAGCACCTTTGCGCCAACTGCTGGATGCTACAATAAGCGCTTACATCAACACCACACACTCCCGGCTCACCCACATCAGCCCTCGGCATTACGGAGAATTCATAGAGTTTCTTAGCAAAGCTCGGGAAACTTTCCTGCTGGCTCAGGATGGCCACATCCAGTTTGCGCAGTTCATAGACAACCTCAAGCAGATCTACAAGGGCAAGAAGAAACTCATGTTGCTAGTGAGAGAACGGTTTGGATGAGCTGCTGCACGAGGAAACCCTGATCCCTGTTGGTGGAATTACGCTTACCAGGCAAGACTGATGGAGTTTTCCATTCAGAGAAGATTGGACTGTAAACCAAAAGCAGCATGGCAGGAAGGGTTTGCGTCCTACCTACCATTCATTTGCAAACACCTCGGCAATACCAAAAGCTAACTAGGAAACTGAATACCTCTTTCCCAAAGGGCATGGCAAATGGAGGCTGGAAAGCAAACCCCCACC\n>XM_031777163.1 PREDICTED: Contarinia nasturtii U1 small nuclear ribonucleoprotein 70 kDa (LOC116346891), mRNA \nGTCCGACGACCAACGAAGACACTTCACAGCAGATATTCATTGCGAACGATACATTGTAAAAATGTATCGGTAAAAAAGTAAATTTGGAAATTAACCAACTCGTTCTCAAAAGTTACAAAGAAAAAAAAAAAGAGTGAAAAATCTGTCATTTTATGCAATATCAACGAAAAAGTGCACTTTTAAAGTGAAAATTATAAAATATTAGTGAATTGCGTTGTTTGATACATCGACATAAACATTAGCACAAGAAAAGAAACATTCAGATCTTGTGTCATTTGAAATTGTTTTTCATACGCATACTGCGAATAGTTTTGAAATAAAGACGACGAAAGGTTTATTCAGAAATGACACAATATTTGCCACCAAATTTATTGGCACTATTTGCTCCACGCGATCCATTACCATTTCTACCACCACCCGATAAATTGCCACATGAAAAGAAAACAAAAGGTTATTTAGGCGTTGGACAGTTTTTGTCGAATTTTGAGGATCCTAGTGAAACTCCGCCACCAACCCGTGTTGAAACACGTGAGGAACGTTTAGAGCGACGTCGAAAAGAAAAGGCTGAACAAGTTGCTTATAAATTAGAGCGTGAGATCGCCATTTGGGATCCAAATCAACTTCAAGATGCCACAGAAGATCCCTTCAAAACATTATTCATCGCTCGTATCAACTACGATACCTCGGAATCGAAACTGCGTCGTGAGTTTGAAGTGTATGGGGCAATTAAAAAAATTGTCCTAGTTCACAATGTTGACACAGGAAAGCCTCGTGGCTATGCTTTTATCGAGTACGAACATGAACGTGATATGCATTCTGCGTACAAACATGCTGATGGTAAGAAAATTGATGGTAAGAGAGTATTGGTCGACGTTGAGCGCTCAAGAACGGTCAAAGGATGGCTTCCTCGTCGTTTAGGTGGTGGTTTGGGTGGAACAAGACGTGGCGGTCCTGATGTAAATATTAAACATTCTGGACGAGAAGACAATGACAGAGAACGAGAAAGATATCGCATGGAAAGAGAGCGTGATGATTATAGACGCGACTTTCGAGACAGAGAACGACGTGATCGTCGATCACGGTCTCCGAAAGTTCGTGACCGTGTTAGAAGTAGAAGTCGAGATCGCAAAGAACGGAAACGACGACGATCAGAGGAAATTGAATACGAGAGAAGAGACTCACGTCGTGATCGTGAAAGAGAAAAGGAACGTAAACGTAGTAAGCGATCGAGATCCCGAGAAAGAAAGCGAGATAAACGTGATAAATC
ACGTGACAAACGCGATAAAGAGCGTAAAGAACGAAAACCAGAATATGGTGAAATTAAAATCAAAGAAGAACCAGTTGATGATGATTATCCTGACTATAATTCACGTATCTACAGTTCATACGGAGCCGAAGTCAAGTATGAAGATGGCGAAGAACAGAAATATCGACCGCAGGAAAACAATGGCCAGTACGGACATAATGACGATGATGACTATGATGACAGAGGATACTAAGTTTTATAAGTTTTTAGCGTGTAGCAGCGGAGCTCATACAAATGCGTTACTGTCAATTTATACGGTATTGAAGTAACGCAATATTGAACTCTCCACAATTAATATTAATCAAGCAAAAATGATTCGATTAATTATTAATTTTTATTTTTATTTTTGAATCTAAGAAAAACAAGTTAAATGCTCCGTAAAATATTTCATTTGCGCTACTTTTATCTCGCTTTCGTTCTCCAAAATATACAAAAATCGTTTTTTTGGTAGGTATACACAAGTTAATTACAATTTTCCTATAAACAAACAACAACAAAATTAATAACTTTGACAGGCGCTATGATTTGTAAATTTTATTAATCAAATGTTATTTTGCAAACGGAATAAAGTGAACGAAAACGGCTTTTGCAGTGGCAAACACAATAAAAATTACAAACATATTTTCA\n>XM_047789246.1 PREDICTED: Phacochoerus africanus adenine DNA glycosylase-like (LOC125132267), transcript variant X10, mRNA \nGCGGGGAGGGAAGGGGAAGGCGTGTCCTCGGCAGCCGTCAGGCCAAGTCCTCTGTCGCTCGTGAGATGTGGCAGAGGTCACAGCCTTCCGGAAGAGCCTGCTGAGCTGGTATGACCGAGAGAAGCGGGACCTGCCCTGGAGGAGGCTGGCGGAGAGTGAGGTGGACCCCGACAGGCGGGCATACGCTGTGTGGGTGTCAGAGGTCATGCTGCAGCAGACCCAGGTGGCCACGGTGATCAACTACTACACCCGGTGGATGCAGACGTGGCCGACCCTGCGGGACCTGGCCAGCGCTTCCCTGGAGGAGGTCAACCAGCTCTGGGCTGGCCTGGGCTATTACTCTCGAGGCCGCTGGCTACAGACAGGCGCCCGGAAGGTGGTCGAGGAGCTAGGAGGCCACATGCCACGAACAGCAGAGACCCTGCAGCGGCTCCTGCCTGGCGTGGGGCGGTACACAGCCGGGGCCATTGCTTCCATTGCCTTTGGCCAGGCAGCTGGTGTGGTGGACGGGAATGTAGTTCGGGTGCTGTGCCGCGTCCGAGCCATAGGTGCTGACCCCCGCAGCCCCCTCGTCTCCCAGCAGCTCTGGAGCCTAGCCCAGCAGCTGGTGGACCCAGCCCGGCCAGGGGACTTTAACCAGGCAGCCATGGAGCTAGGGGCCACGGTGTGCACCCCCCAGCGCCCACTCTGCAGCCAGTGCCCTGTGCAGAGCCTGTGCCGGGCGCACCAGAGGGTGGAGCGGGAGCAGCTTTCAGCCCCCCAGAGCTTACCGGGCACTTGTGACATAGAGGCGTGTGCTCCCGACACCGGACAGTGCCAGCTCTGCGCACCTCCCACAGAGCCCTGGGACAAGACCCTGGGAGTGGCCAACTTTCCCAGAAAGGCCAATCGCAGGCCCCCCAGGGAAGAGAGCTCTGCCGTCTGTGTTTTGGAGCAGCCCAGGGCCTTTGGAGGTGCCCGACTTCTGCTGGTACAGAGGCCCAACTCAGGTCTGCTGGCAGGACTGTGGGAGTTCCCGTCTGTGGCCGCAGAGCCCTCAGAGCAGCTCCAGTGCACGGCTCTGCTGCAGGAACTGCAGAATTGGGTCGGACCCCTCCCAGCCACCCGCCTCCAGCACCTGGGGGAGGTGGTCCACAGCTTCTCTCACATCAAGCTGACTTACCACGTGTACGGGCTGGCCCTGGAAGGACAGACCCCGGTGACGGT
CCTGCCCGCTGACGCTCGCTGGCTCACCCGGGAGGAGTTTCACGCCGCAGCTGTCTCCACAGCCATGAAAAAGGTGTTCCGTGTGTATGAGGGCCAACGGCCAGGGACCTGCAAGGCTTCCAAAAAATCCCAGGTGTCTACCCTGTCCAGACGGAAAAAGCCCAGCCCAGGCCAGCAAGTCCTGGATAATTTCTTGCGACCCCACATCCCCGCTGATGCACCCAGCCTCGACAGTACAGCCCAGTGATGCCTCTGGAAGTTCTCATCCCCTGAGAATCTTGTTTAATAAAGTGCTTATTTTTGTAATCA\n>XM_007261321.1 Fomitiporia mediterranea MF3/22 uncharacterized protein (FOMMEDRAFT_143842), mRNA \nCGAGTGGTTACAATATTATGCGCGATGACATCGCACTGCTCGAGGTGCATGAGAAGCACCCTCCGTCTTTCTCAGCAAATCTCTATCCTGACTACTGGACTCTCAATCACGGACCCAAGTTCTCATATAATAATTCTGTTTCGTCAATTCTGGAAGATATACGGGCCTTCAGGATACCTACTGACTTCATTAAAGTTTTCGACGAGGCAGGTATACAGTATTATAATGGGTGCTTAATTGTTGAACTCTTGGATTTCCGACCTGCAAGGGCGAAGGAACCAGTACTGGAGAAGCCAGATAAGCAGCGCGTAGTACTGCGACCTAACGCTGAAACAATATGGGCAGACATTTGCAACATGAACGAGAAGACGGGGTCGAAATGGTCAGATATGGATGCTCTACTAGTCGAATCAAAGATTCTGTTGTGTACTTCGGCTCCGTTATGTCTGGATCCGGATCCGTCTTTGACACGAGTTGTTAATAGTATTCTCCGTGTCTCCACGCCAAACGTTCCGAATTCACTAAAACGCAAGGCAACTGCTATGGTTGACATCGAAGAAGACGAAACCGAGAAGGCCAAACGTGCGAAGATTATGCAGTTCATGAATCCGCAATTTAGCAATACGCATAAGCCATTTCATCCTAGTTATAAAATTCTCTCAGTTATGGAACAGAAGCGTGCAGCGGCAGCCTCTCAGCAGACCTCACAGCCTGCGACGACTACATCAGTTCCAAACAACATATCTTCTGGTACTATGGCTCCGCAGAACCTGACTCGCCAACAAGCACCTGAAAAACCTTCAGCGCCTGTCGCGCCTATCGCACCCACACTTACCACGTCGTACTCACAAACAAATACGAACACGATTCCACAACCCGCACCCACCACAGTCCCCCAGACGCAGGCGCCACCTGCTATTGATCCTGCCCATAGGCAGTCGCCTTCAAAACAACAGCAATCCGCAAGTCAGCCTCTCCCACAACGCCCACCGTCGCAAACTGCCGCTCCGCCGCAGGCGAGCGCGGTTAGCCAACCGCCTCAAGCTCAAGTTCCTCAGCCAACTCGACCTCAACCGACTCAGTTCAACCCCCCATTACCTCCGGCCAATTTCCTCAACCCTGCTCTTCCCCCTGGTCGGCGCCGACCTTCGACAGTTGTTAAACCTAGCACTCCTGCTGTTGCGACCTCTTCGCTGCCGACTCAACAACCGGTAAATCAGAGTCAACCGCAGACTCAAACACAAATACCGACGCAGACTCCGGTTCAATCTCAACCGCAAACACAACCGCAGCCAGCATCGCAACCACAACCGCAGCAGCCCGCACCACAGCCAATTGCACATCCAACGCAGGTACAGGCACAGGCTCAACCGCGTCTCGCACAGATTCCTGCAAATATGGCACAATTCTACCAGACCGGTAGACCAACAATGGCCATGACACAGGCTGCAGCTGCGACCATTGCAGCGCAGAGACAGGCACAGAGTGGTCGAAACACGCCTATTACTGTGAACAACCCAAGTTCCTCGCCCGCACCACCTCCGTCGGCGCTAGCACGGAGCCCTATGGTACCGCCGGCTGTAGCTGCA
GCGATGATGTCAAGGCAGAGCACACCGGTAGCAACAAGCAACCAAGTCATGCGTGGTAGTCCGCTAGTTGGAAGTCACCCAGTTGTCGCACGGCCAGTTGCAGGACAGACACCAGCTCCAGTCCAACAGCAACCCCAGCAACCTCAGCAGCCGATCCCGGGCAGCCAGGCGATGATGATGCAACCAGGTGCGAGCGCGAATCCCCAGGCAGTCCTCCAGTACCAGCAGCAACGTATGGCCATGTATAGGTCGCTACAAGCGCAGGCGGCCCACGCACAGGCAATGCATCAAGCGCAGATGCAACAGCAAGGTCATGTGTCACCGGCGCCGCAGCAACAGCAGAATCCACAAGGTGGCAATACCCAAACAATCCAGCAGACCGCGCACGATCAAGCTCCCAGAACACAGCAAAACTTCGCCGGCGTCCAGATGCCTCTCAATTATATGCATATGGGCCAAATGGGCCAGATGGGTCAGATGGGTCAGATGGGTCAGTTGACTCTACAGCAGCAACAGCAATTCCTTTGGGCCCAGGCCCAGGCCCAGACTCAGCGAAGCATGGGTCGAGGAATGCCCCAAGTCGGACCAAACGGGCAGCAACAGATGCCAACTATGCCTGCAAACATGACACTCCAGCAATATCAGCAAATGCAGGGGTTGGGACGTGGTGGAGCCCCACCGAATCGATGAATGTTATTCTTTCCACTTTTTCTTTTCCAATTTGCCATGTATTTCAATCTGTGTTTCCTCGTCATGCTTGCGTCCGGACAGGTGTTAACGTAGATGTACCTCAGTGTATCTTTATCTCAGCTTCTTCGTAACGAACAACGCCATGAAATGCTCCCG\n>XM_045941201.1 PREDICTED: Trifolium pratense germin-like protein subfamily 1 member 17 (LOC123891348), mRNA \nATAATTCACACGAGCAATATATAACTTTTACATAAGAAGAATAAATAATTAAAGAGTATTAGCTAGTGAGTTTGAAAATGAAGGTTCTCTACTTCCTAGTTAGCATCTTGGCTTTGGCATCATCAGTTACCTTTGCTTATGACCCCAGTCCTCTCCAAGACTTTTGTGTTGCAATCAAAGACCCCAAAGATGGTGTATTTGTGAACGGAAAATTCTGTAAAGACCCTGCTCTTGTTAAAGCTGAAGATTTTTTCAAACATATTGAAGCTGGGAATACATCAAATCCATTAGGCTCTCAAGTAACTCCAGTTACTGTAGACCAACTGTTTGGACTTAACACACTCGGTATATCTTTTGCACGCATTGATTTTGCACCTAAGGGTTTAAACCCACCCCACACTCACCCCCGAGGCACAGAGATCCTTATAGTCCTCGAAGGAACTCTTTATGTTGGATTTGTCACGTCCAATCAAGGCAATACTAATCGCCTTTTCACCAAAGTCCTCAATAAGGGTGATGTATTTGTGTTCCCAATAGGCCTAATTCATTTTCAACTAAACGTGGGATATGGCAATGCGGTTGCTATTGCTGGGCTTAGCAGTCAAAATGCAGGAGTTATCACAATTGCAAATGCTTTGTTTAAATCTAATCCAGCCATTTCTGATGAGGTTCTTACCAAAGCTTTCCAGGTGGATAAAAGCATAATTGATTATCTTCAAGGACAATCTTGGTATGACAACAACTAGTTCGAGAACATGATTAATCGTTTTATTATTATTAATAGATGATTCATCTCATCTTTAGTGTTACAATCACCTAGTGGAATCGACCTTCTCTACTTACTTATTTTTATTGTAATAAATAAAATAAATGTTGTTTTATTTAAACACATGGTTGTTTTAATTTTAGTTTAATTTGGTTCAATAATAGATTGTTGTTGCTGATATGTTCACCAATAAATAAAAAGATTGTTGTTGAGGTTTTTGTAATATAATAATTTTCTATCCCA\n>KX055998.1 Phytophthora 
gonapodyides isolate H18 internal transcribed spacer 1, partial sequence; 5.8S ribosomal RNA gene, complete sequence; and internal transcribed spacer 2, partial sequence \nACGTGAACCGTATCAACCCCTATAATTTGGGGGCTTGCTCGGCGGCGTGCGTGCTGGCCTGTAATGGGTCGGCGTGCTGCTGCTGGGCGGGCTCTATCATGGGCGAGCGTTTGGGCTTCGGCTCGAGCTAGTAGCTATCAATTTTAAACCCTTTCTTAAATACTGAACATACTGTGGGGACGAAAGTCTCTGCTTTTAACTAGATAGCAACTTTCAGCAGTGGATGTCTAGGCTCGCACATCGATGAAGAACGCTGCGAACTGCGATACGTAATGCGAATTGCAGGATTCAGTGAGTCATCGAAATTTTGAACGCATATTGCACTTCCGGGTTAGTCCTGGGAGTATGCCTGTATCAGTGTCCGTACATCAACCTTGGTTTTCTTCCTTCCGTGTAGTCGGTGGAGGATATGCCAGACGTGAAGTGTCTTGCTGGCGGTCTTTCGAGTCTGCCGGTGAGTCCTTTGAAATGTACTGAACTGTACTCTCTCTTTGCGCGAAAAGCGTGGCGTTGCTGGTTGTGGAGGCTGCCTGTGTGGCCAGTCGGCGACCGGTTTGTTAGCTGTGACGTTTAATGGAGGAGTGTTCGATTCGCGGTATGGTTGGCTTCGGCTGAACAATCTGCTTATTGGGTGCTTTTCCTGTCATTGGCGGTACGAACTGGTGAACCGTAGCTGTGTGGTGCTTGGCTTTTGAACCGGCTTTGCTTTGCGAAGTAGTGTGACGGCTTCGGCTGTCGAGGGGTCGATCCATTTTGGGAAACTTTTGTGTGTGCGGCTTCGTGCTGCGCGC\n>XM_008173413.3 PREDICTED: Chrysemys picta bellii NECAP endocytosis associated 1 (NECAP1), transcript variant X1, mRNA 
\nCCCTTAACAAAAATGGCGGTCGGAAGCATCCCCGGTTACTAGGACCCCCCGCCCCTCCCGCTGGGGTCTCAGATCCGAGATGGCGGCGGCCGAGGCGGAGTACGAGTCCATCCTGTGTGTGAAGCCCGATGTCAGCGTCTACCGCATCCCGCCGCGGGCCTCCAACCGGGGATACAGGGCATCTGACTGGAAACTGGACCAGCCGGACTGGACAGGGCGTCTCCGTGTCACGTCAAAAGGCAAAATTGCATATATAAAGCTAGAGGATAAAGTTTCAGGAGAGCTCTTTGCTCAGGCTCCCATAGACCAGTTCCCTGGCCTTGCAGTGGAGACTGTGACAGATTCCAGCCGGTACTTTGTCCTCCGAATTCAGGATGGGAATGGGCGAAGCGCTTTCATTGGCATCGGCTTTTCAGATCGGGGTGACGCCTTTGACTTCAATGTCTCCCTGCAGGATCACTTCAAGTGGGTGAAACAGGAGACCGAAATCTCCAAGGAGTCACAGGAAACTGACACACGCCCCAAACTGGACCTAGGGTTCAAGGAAGGACAGACCATCAAACTAAACATTGGGAACATGCCAACAAAGAAAGGAGGGGCACCCAAACCCCGTGCAGCTGGATTGGGGGGGCTGAACCTGCTCCCACCCCCTCCAGGTGGCAAAATCACAGCCCCTCCAATCCCTCCCCCATCTTCAACAGCCATTTCCAACCATGTGACGCCGCCACCAGTGCTGAAATCCAGCAACATGGGCAATGCTGATATCCTGTTGGATTTGGACTCTCCTGCATCCATCTCTAAGGCACCAGCACTTGCTGCTGTTCCAGCCACCACAGACCTCTGGGGAGACTTCAGCACTGCATCCAGATGTGCTCCAGCCTGGAATAGACAGGAGGTGGTGGATCTCTTGGGCCTGTGGAGAGAAGTGGCTGTGCAGGAACAGCTCTGAACCAGCCATAGAAAT\n>XM_029877336.1 PREDICTED: Aedes albopictus nuclear inhibitor of protein phosphatase 1 (LOC109424494), mRNA 
\nCTTTTGCTCAGGTCAAGGAACACAAATCGCCCATTATGTGGTTAGTGCGTGAATTTCGTTCCAATTTACTTATTTTCCACCGTAAAAACTTCTAAAACTATCGTAATTAGTGTATTAAGTTGAGGATTCGTGTTTTCCTGATCTGGGACAACAACTCATTCTGAGCGTAATGTCCAACCACTACGACATACCCTCTTGGGCTGGTAAGCCGCCCACGGGGCTACATCTGGACGTGATGAAGGAAGACAAACTGGTTCAAAAGTTGATGATTGACGAAAAGAAATGTTATCTCTTCGGTCGGAATCCCCAGATGAACGACTTCTGCATCGATCATGCGTCCTGTTCCCGCGTACACGCCGCATTCGTTTATCACAAACACTTGAACATTGCCTACCTGGTGGATTTGGGCTCCACTCACGGGACGTACATCGGCTCGGTCCGGCTGGAAGCTCACAAACCCACCCAGTTGCAAATTAACTCGACGTTCCATTTCGGCGCTTCGACCAGGCACTATATGCTCCGGGAGAGACCCAATGTCCGATCCAACATTATGGAAGACATCCCGATGATGGACACCAGCGATGGAACCTATCTAGGCCTTCCCGAGAGCCAAACGGAACTTGATAACTTGACTGAATACAATACCGCTCATAACCGGAGGATTTCCATGCTTGGAATATCGGACGAAACCAGCACTTTCAAGAAGAATATGAAGAACAAAAGGAAAAGGAAAGGCGTCCAGTTCAATGAGGATGAAATCGTTATAAATCCCGAAGATATCGATCCAAGCATAGGACGCTTCCGTAATCTCGTATCGTCCACAGTTGTTCCAGTACAGGCGAAACGTGCAAAACTAGAAGTTCACTCAATGGGTCTCTCTACGTCGCCCTCATCCAGCAAAATCCTTCATCATCCGCACAGCTTGGTACCAAATTTGTATCATGGAATCGACGACCAAGCGCATGATCCACGAGGTCCGCCCGGCAATGGTTCCGGATTCGGGTTCGGCATGGACACCACACCCAGTGGACTCACCACTAAGCTGGGTATAATTTTGCCGAATCCAGCACCGGATGTGAATCCGGCCAGTTCCAGCACTGCTCTAATGCCTCCTCCTATCTACAGCAGCATGGCTCCCAAAAGTGTTAAAATTGTCGACAAACCGGACCTATCGGACGAACCCAAAAAGAAGAAATACGCCAAGGAACAGTGGCCCGGAAGGAAACCTCTGGGATTGGGAGGTTTCTAAGCGGTTACAATACAAATGTAACGTTACATTTATCTTATATTGGTGTGACTATTTGGTAAGTGAATAAGGTTTACCGAATTTAATCTAACATCATAATAATCGAAAGTTAA\n>XM_053193968.1 Colletotrichum fioriniae uncharacterized protein (COL516b_007061), partial mRNA 
\nATGGGAAAGTCAAGACGAAACAGAGGCGGCCCAAGCCATCGCAAGGACCCCATCGCCAAAACCGTCAAGCCCCCCTCCGACCCAGAGCTCGCCGCCCTCAGGGAAAAGTCCATCCTGCCCGTCATCAAGGACCTGCAGAGCGCTGACCCCAAGTCGCGCACCGCCGCCGCCGAGGCCGTCTCCAACCTCGTCTCCAACGAAAAGTGCCGGAAGCTGTTGTTGCGTGAGCAGATTGTCCACATCGTCCTGAACGAGACCCTCACCGACGCCAGCCTCGACAGCCGCGCCGCTGGTTGGGACATCTTGCGCGTTCTCGCCGAGGAGGAGGAGGCCGACTTTTGCATTCACCTGTACCGTCAAGATGTTTTGAGCGCCATTGGTTTTGCTTCTCAGACTATTCTCCAAAACCTTGCAAAGGGCTCATCTCTGAGCAAGGGCGAGACAAAGGTCACCTGGACCATCACCGAGTCTGTCATTGGCCTTTTGTCTGCTCTTGCCGAAGCCCAGGATGAGGTTCTCGAGGCCATTGTGGGTATCGAGGGCATCAAGCACTTGCTCTTTACTGTCATCGCTCACCCCGACACACCATCAAGCATCTGCCTCGACGCCCTCTCAGCCCTCCTGACCCTGTCCGAAGACAACCAGCGCCTGGCGCAGGATGTCGTCGCCGACGAGAGCCCCAAGCCGCTCACGTCGTTGACCAAGCTGCAAGAGGTCGCTGGCGCAAAGGGCGTCCTAGCCTGTGGTATTCTGCATAACATATTCACCACCTTGCATTGGTTCGACAGCACGCCGGGCCCCAAGGACCTCTCTGACGCCTCTCTCATCCCAACTCTGTCATCGGCACTCAAGAACACCACGCCGGAAACTGATTTGCCACCCAGAAGCCAATGGTCTAACCCGACCGAGGTTCTTCAGCTTGCCCTGGAAATCCTCGCCGATGTTGGAACGACGCTGCAGCAGTCTCTCCAGGGAGGCGACAGCAAGAAGGCCAAGAAGGAGGAATGGAACGGAATCGAAGACGACGACACCGCCATGGACGAGGACGTCAAGGAGGACAACGGCTCCGGCGACGAGGACATTGGCGAGGGCGACGAGGAGGACGACAATGACGACGACTCCATGGACGAAGACGAGATGCAGGCCGACATGGACCTCGTCACCGGCGCCGACGACGACGTCGACGAGGAGGCGAGCATGGACGACCTGCCCACCCTGCGCGAGCTGGTCCAGCAGGCCATCCCGCAGCTCATCACCCTCGCGACGCCGTCATCACAAGCAGAGGGCGACAACGTCCGGGTACAAGCGCACGCCCTGGCCGCCCTCAGCAACATCGCCTGGTCCATCTCCGTCTTTGACTTCTCCGACGATCACAACGCCGGCATCCTCAAGGCCTGGGCCCCGTCCGGCAAGGCCGTCTGGGCCCAAGTCATCGCCCCTATCTTGGCCGCCAACACCGCCGACGTCGAGCTCGCCACAAAAGTCACCAGCCTCGCGTGGGCCGTGTCCCGCAGCTTGCCCCGCCGCCTACCCCTCAGCGGCGACGAGCACACCAAATTCATGGCGCTGTACCACGCGACCAAAAACCTTCCCTCAAAACAGGCGGCCGAGACGGCGGCCAACGGAGACAAGGCAAAGGACGAGGATCCCGAAGATCCTTTCCAGGGTCTCGGCGTAAAGTGCATCGGCGTCCTGGGCCAGCTGGCGCGGGACCCGGCACCCCTTGCGCTCAACAGGGAGATTGGTGTGTTCCTTATCGCGGTGGTGACTGCATTGCCAGAGACCCCGGCGGCGGATGCCGTCGAGGCCCTGAACCAGCTTTTTGACATTTACGGAGACGAAGACATGCCATGCGACAAGGAGGTCTTCTGGAAGGACAACTTCATCCAGCACCTCGAGGCGGTTCAGCCCAAGGTCAAGGCCTTGGTCAAGACGATTGATAAGCGAACTCTCCCCGAGTTGCGCACTCGTACTGAGGAGGCTGTGTTGAACCTTGGA
CGGTTCATTCAGTACAAGAAAAAGAACAAGGCATAA\n>XM_046724795.1 PREDICTED: Haliotis rubra E3 ubiquitin-protein ligase parkin-like (LOC124288282), mRNA \nAACAACAAATCGAGTGTCAAGCACGTGTTTCTTGTCATTATAGGAGGGGATTTTTTTGTTTGTCGTTATCGGATGTGGACTACACAAAACTGACGACACCAAAACAACCCAGGGTGCACGTTTCTCTGTCTTTAAGCAGATGACAAGTGTGCCAGGTTGTGCTTTCGATCGCATACCTGTGCTAACTACGATGCAGGAAGTTGTTTGACAGCCACACTTAGCCTTCAGGGAACATACGGCGCATTATATGCAGCGAATGAACATGGTGTAATCTTATCTACATAACTTGCATCATGATTACCGTGAATGTGAAATTTCACAGCAATTGTGCAGTTCTTGTTGAAATTAACCCCGACAGCAGCTTGCATGAAATCAAAAGAGAAATATCAAAGAAGGTCAATTTGCCACTGGAAGAAGTCAAGATTATATTTGGGGGGAAAATTGCTGACGGACGATTGTGTGTTTCAAGATTTGGATTTTGGTGATCAAAGCACTCTCCATATCTTCAGACAGATATCAGGGAGTGAAAAAACTCTGACATCAGAAGCAAGCGAGGAAAGAGAGCTCAAGAACCAGTACTATGTGTACTGTAAGGAATGTAGATCAATACAGCCAGGCAAGCTTAGGGTCAAATGTGCTACATGCCAGGATGGGGCCTTTGTTCTCAGCAGGGACCCCGAGGGCTGGAGCGATGTGTTGCAGTCAAGGAGCATGGGTGGGGAGTGTCGGAATGATGGCTGTGAAGGGACAACTGCGGAGTTTGTGTTCAAATGTGGCAAGTCCCACGCTGATGGCATATCAGCTGTCGTTCTACGACATGTCCGACCAAACAGACGGGAGGTTGAGTGCATTACCTGTGCAGATGTGAGATCTCCTGTGCTGGTGTTCCCCTGTGAGTCAGGACACGTGATGTGCATCGAATGCTTCAAAATATATGGAATCACCCAGTTGAGTGAACGCAGGTTCATTAAGCACCCAGAGCATGGGTACACCCTGCCTTGCCCAGCTGGCTGTCCCAGCTCGGAGATCCAGGAGAGCCACCATTTCCACCTACTGGGAGATGAGCAGTATGAACGGTTCAACACGTTCGCTACAGAAGAGTATGTACTACAAGATGGTGGCGTGCTGTGTCCAGGACCAGGATGTGGGATGGGCTTCGTCCTTGACACAGCGGGGAGGAAAGTCACCTGTGTTGCCAAGGACTGCATGATGACATTTTGTCGTGACTGCAAGAATGAGTACCATGACGGGCCTTGTGATGTCAACCCTCTCCTCACACTCTCACCTCTGGACTACTTGGTGGACCCACTCCAGGCTGACGGTCTCTGGGAGGACCAGTCTCGAACGCTGATAGACCGCACCACCAAGCCCTGTCCAAAGTGTGGCTCCAGGACTGAGAGAAACGGTGGTTGTATGCACATGCTGTGTCCACGGTGCGGGGAAGACTGGTGCTGGGTGTGCAACAAGGTGTGGGATCGGGACTGCCAAGGCCAGCACTGGTTTGGATAGTGTGCATATCCTTCCAGATAGTGATTACAATAATAATATACAGGATATACAATTCGGGAAGAAACCTCCTATATTTTCATACACTCTGAACCTCCACCATTCATATGTATAAATGATATTGATGTCATGTTGATATATGTGTGAAATATTCCAGAGACCTGCTGAAATGGTATTTGATGGCTATGTTGTATGTGATGTCAAGAGTGAGATGCTATGCTGTTGCCATTGGAAACTCACAAAACATGATATTCACGGCTAGATTTAAGCATTTAGAACTTGCACTGGTGCAGCCTGAAACTGCAAAATGCAACCTCATACTTATACCGGTACCAACTGGCACCCACTGCA
TGTTTTTATTTTTGCTGCTCAAAGAACACAGACTTCAGTTTGAAAACAGAATGGCAAGGAAATGACTTGGAGCAGTGACTCTGATGGCTGCATGGACAGTAAGACCATGACCGTTAGTGTTCATATGATGGAATTTTATTAAGTTAGATAAAGTGACCTCATCAGACTCTTACTAATTTTGTCTCAGCACCAGATGCAAACTGTTTTTGTCTGGTGCTACAAGGTTAATACCAGTTGGAAGTAGGTTTCCTGTTTTTAAATCAAGCCCTGATATCTGTTTCAGTTTCTACTATCAGCATGGTGATCTCACTCTGTACACAAAAATAGACAGTATTCTTCAGGAAGTTAACATGGGAAAGTATTTTTAGATGTCTTTTACATATAGAAATATATGGTAAGTGATGCTCAGGTTTATTCATGGGCCATGTTTCACAAAGCAATATTGGAGTTACGACCATCATAAGCAAATGTT\n>KC455192.1 Uncultured eukaryote clone T2S303B03 18S ribosomal RNA gene, partial sequence \nAAAGATTAAGCCATGTTTGTCTAATTATAAGCTTTTATACAGTGAAACTGCGAATGGCTCACTAAATCAGTTATGATCTACTTGACAAATTTACTACTGGATATCCGGGGTAATTCTAAAGCTAATCCAGTGCATTCAACCCCGGATGTTTTGATGGGAGCACTAGTTAGATCCATAGACCAAACCCCCAGGGCAACCTGGTATTGCTTAGTCATAACTATTAACCTTACCACCCGCAAGGCCGACGGTTCAATCAAATTTCTGCCCAATCATTGCCCTGTTGGTAGGAAAAAGGCCTACCATGGCTGCAACGGGTAACGGGGAATAAGGGTTCTTTTCCGGAAAGGGCCCCTGAAAAATGGCGACCCCATCCAAGGAAGGCAGCCGGGGCGCAAATTACCCAATCCCCACCCGGGGAGGTAGTGACAATAAAAAACAAAGCAGGGCCCTTTTGGGTCTTGTAATTGGAATGAGCTCAATTTAAACCCCTTAACAAGGAA\n>XM_047242661.1 PREDICTED: Schistocerca piceifrons protein O-mannosyl-transferase TMTC2-like (LOC124712366), mRNA 
\nCGGCGCCGCGAACGTCGGAGGCAGCAACGACGCGTCGCGACGCTTTCGACGCACGACACGTGGACACATCCTGCAAAAGCTGCTTCTGGTCGCCGCGGAACTGTCAGCGAGCTTCTCTTGTACAGTCGTCCGCCCCTGTGAGCGCGCCTGTCGCCCCGCTGCCCCTGGCGGGGTGTCTGCAGCCAACAAGTGTGGGAGCGAGAGGCAACAGGTAGTCTGCTGGTGTGACGCGGCCGCCCTTATCTGGATGGACGGCACGGCCGTGGCGTGCGCGCTGCTCGCCGCCGCCGCCTACTACAACACGCTGGACGCCGGCTTCGTCTACGACGACAGGCGGGCCATCCTCGGCAACCCGGACGTGACGGGCAACGAGACGTCGCTGTGGCGGCTGGCGACGTCGGACTTCTGGGGCACGCCGCTGCGGCTGGCCGGCTCGCACGGCTCGTGGCGGCCGCTGGCGGTGCTCAGCTTCCGCGCCAACCACCTGCTGGGCGGCGGCTGGCACGCCGCCAACGCCGCGCTGCACGCCCTCTGCGCCGCGCTGCTGGTGCGCGTCGCGCGCCGCCTCCGGGCCGCCCCCGGCGTCGCGGGGGCGGCGTTCGCGCTGCACCCGGCGCACTGCGAGGCCGTGGCCGGGCTGGTGGGCCGCGCCGACGTCGCCGCCGCCGCCTGCTCGCTGCTGGCGCTGCTCTGCTACGCGCGCCACGCCGACCTGCGCGACGCCGCCGACGCCCGCCGGCGGCGCTGCCGCGGCTGCGGGGGCCCCGTGCACCGCCAGCAGGGCTGCGCCCTCCGGAGGGCTCTCGCCGCCGCCAAGGGCCTCCTCGGCGCCGCTCTCTGCTCGGCGAGCGACCGCCTCTCTTGCCAAACCCGCAACTCCTCTCACCCCCCTGCCACCGGCACAGTCACGACGAACGGTACTGCTTATAAATCCGGCGCCTGGCTGGGACAAACTTCTAAGTCACCTCGAGCTGACATCGTCACTGAGTCCAATGACGCCAACAACAACACCAGTACGAACGCACTCGCGTGTCAACAGGCTCCGTCGAAAACATCCGTCGACTTCGATACACCGCCATCAATCTCGAAAGCGATCACGGCAGAAATCACTCGCATTAACGCCTCTCACACCACATGTTGCAAACAACCTCGCACTTCAACGCAACATTACAATGGAACTGTTCCTCTCGCCTCTTGGCCGTCGACCGAACGGACGGAAAATGAGGACGTTGCCGAAGGCAGTGATGCGACACGAGACGCTAATCACAACACTGAGTTCGTCAGTTCGTCGCAATTGTTTTCAATTAGCCAGTGGCGATACCAGAACGCTTTCGACCATCATCTTGAAGAAAAGGTTGTGAGACGCAGCCTCTTCAGAGCCAAAAGGGAGGCGTCCAGCAGGCTCGGAAGTAATGTGTTGAGGAGGAGGTGGAAGAAGTGTTTCAAGGACAAAAATTTAATCACAGACAGCGGTGAAGATCAGAAACGGCTTCTGAAGACAGCAGAGAGGAGCACCTGTTGCGCCGCGGAGGGCTGCAACAAGGAAGAGTCGCGCTCGTGTCGGAACAGCGCCAGCGGCGGGCCGCTGCTGCAGCTGGTGGCGTGCGTTCTTCTGAGCGCATGCGCGCTGCTCTTCAAGGAGACGGGCATCGCGGCGCTCGCAATCTGCGTCGCCTACGACGTGGCGCTGCTCGCAGAGAGGGGCGTCGCCGGGCCGCGGCAGCTGCTCGCCACTCGAGCGATCGAACGCCGCCGGCTGGCGCAACAGGTGTCGCCTGTGGAGAGCCAGAGGCGGCCTGCGGCCTGCCCCTCCAACCGAGCCAAGGGCAACCGCTGCTGCCTGCTCGGCGGATGCGCCGAAACGCACGCGTGCGCCGACAACAGCGTCAGTGGCCCCTGTGGCAGAGGTGCGCTGCTGGTGAGCCTGTCGCTGCTGGTGGTGCCGTTCCTGCCGGCCAGCAACGTGGCGCGCTACGTGGGCTTCGCGGCAGCGGAGCG
CGTGCTCTACCTGCCCAGCGCCGGGCACTGCCTGCTGCTCGGCCTGGGCTGGCAGCGCCTCAACCGGAGGTCCCACCACCACCAGCACCAGCACCACCACCACCACCACCACTGGGCGTGGCTGTCAGGGTTTGCACTGGCTGCCACACTGGCCAGTCTTGGAGCACGGACCGTACTCCGCAACAGGGACTGGTACGACGAGGAGAGCCTCTTTCGCTCTGCGCTTCACATCAACCCACCCAAAGCGTACGGCAACCTGGGCTGCGTGCTGAGCTCTGCGGGCCGCCTGGAGGAGGCGGAGTGGGCGCTGAGGCAGGCGCTCAAGCACAGGCCCAACATGGCGGACGTCCACTACAACCTGGGCAACCTACTGCAGGCTAGAGGCCGCCCGGAGGAGGCAGAGCGCAGCTACCGGCTCGCCATCCACTACCGGCCCTCTCTCGCAGCGGCGTACGTGTCACTGGGGCAGCTGCTGGAGGCACGGGGTCGGCTGCGGGAGGCGTCGCAGGTGTACGAGGACGGCACACAGCTGGACGGCGAGCGGCTGCGGGACCCGGCGGCGCACCTGCAGGCCACCCTCAGGGCGCTGCTGAGACTGGCCCGGCTGCGGGCCCAGCAGGGCGACTGGCAGGCGGCGGCCGACAGCTGCAGGCAGGTGCTGCTCAGGCACCGCACTGCCCAGCTGCAGGGGCTGTTGACACAGGTAATGGCGCAGCAGGGTGCTGACCACTTAGTAAACAAGTGCTGTTCAGGCACCGTGCTGCCCAGCTGCAGGGACTGTTGA\n>XM_020923618.1 PREDICTED: Boleophthalmus pectinirostris sodium bicarbonate transporter-like protein 11 (LOC110159053), mRNA \nATGAACAGCAAGAAGAACGCAGAAGAAACACCCACGGTCATCGTCACCAGATTCACTGAGGAACTCAAGGATGGGGAGAAGGAAGAAACAAACATTTATGAAATCCCAGTTAGTACTACAGCCACTGAAGGGCCCGGATTTGGACTTTTAAATACAACCAGAAAGTATGTGAAGCCAATGAACTTCCAGGAGGAGGTACGAGCTCATAGAGACCTGGACAGCTTTCTGGCCCAGGCTAGCATCGTCTTGGATGAGAAGGCTGCCACTCTGGACGAGGTGCTGAGGAGAATGTTGACGAATCTGGTTCAAGAGGGACATGGGAGCTGTGACACTGAAGAGGTCATGAACACACTGTTCACAGACGCAGGGGGACAGGACTGTGATGTGCACCTTCTAACAGAGACCATTCAAGGAGTAACGGCTAATTCTACTGGGGTTCACTATCAGCAATCATGGCTTTGTATACTCTCTACAGTGAGGACTCTGCAGCGGCGCCATGTCTGTGTCACTCGTTTAGAGCGACCTCAGAACTGGGGAGTGAACTGCTGCGAGGCGCGATATGTCATACTAATCCTCGCTCCTCCCAGAACGAAAAGCACCAAGACAGCCATTGAGCTCGGTAGAACGTTCGCGACAATGTTCTCGGACATCTCCTTCAGACAGAAGCTTTTGGAGGCCAGAACACAGGACGAGTTCAAACAGGAGCTGGTCCTCCAACGACAGCAACTCTCCATGGTGACAGAGAAGCCAGTGATCGAGGAAGTGGTGGACTCGGACCCCCGCAGGGCCAAAGATCTACAGTGCATGGACTTCTTCAAAGCCGGCAAAGGTGTTTATGAAGATCTCCGCCGCAGACTCCCACTCTACCCGTCAGACTTCACAGATGGAATTACTGGAAATGACCGCTCACTACTCAAGTACACCACCACAGCTATTTTCCTCTACATTGCTATTCTGCTCCCAAACATCGCATTTGGCTCTTTGAATGATGAAAGTACAAGAGGTGAAATTGATGTTCAGAAGACAATAGTTGGCCAGAGCATTGGTGGAGTTATATACGCGCTGTTTGCAGGCTCTCCTCTTGTCA
TCCCACTAACTACAGCTCCGCTTGCTATCTTCATTAGTGTGATCCGTGGCATCTGTGACGACTACAACCTGGACTTTGATGCCTTCTACGCCTGCATTGGTTTATGGAACAGTCTCTTCCTTATCCTCGGGGGCCTATTCAATGTCAGTCTGCTGATGAAGCTCTTCAAACGCTCCACAGAAGAAGTCATTGCTCTGTTCATCTCCATAGCATTTGTCGGCGACGCGGTGAAAGGCACAGTCAAAATTTTTGAACACTACTACTATGGACCTACCCTTGCTACCTCCAACAGTACAGTGGTGCTCCAGCAGATTAATGAGATTCTGGAGCGGGCAAACAACCACACCTCCACCAATGGCACTGGGTCAGAGACTGGACACTCAAACCTCCTCCTCCTGCCTGAGTCTCTTATCGTGTGCACCAGGGAGAGACCCATCCTATGTCTGCTGCTCATGCTCGGGACACTGTGGCTGGGATATGCTCTCTACCTCATCAAGAGAAGCCCATATCTGAATGCCAAAGTGCGGGAAGTGGTGTCGGACTGTGCTTTGCCCATATCAGTCGTCATTTTCTCATTCATTGGGTCCTACCTGTTTATCGATATTCAGCTTCCTCAGTTTAGCGTCCACAATGGTCCAGTTTTCAACTTCCCTCCCTTTGACAGGCTGAGTGGCATGACAACATTAAGTGCAGTAGGGCTTGGGTTCTTACTCGCTCTGCTCATCTTCATCGATCAGAACATCGTCATCTCACTCACACATGTACCTGAACACAAGCTGCTAAAGGGCACCACATTCCACTGGGACTTAGTGCTGACCGGCCTCATCAACATCCTCATGTCCTGTCTGGGGTTGCCATGGATGCACGCCGCTTTCCCACACTCGTCTCTGCACGCCCGTCAGCTGGCCAAAATGGAGCAGCATGTGGAGAACGGACATGTCTACTCTACCATCGTAAGTGTGAAGGAGACTCGGCTAACGGCGCTGGTAGCAAACATCCTGATCGGCGTGTCTGCCTTCATGCTGCCCGTTCCCCTGCAGTGGATCCCCAAGCCTGTGCTCTACGGCCTCTTCCTCTACATCGCTGCCACTTCTCTTGATGGGAACCAGATGGTGGACCGCATGGCTCTACTGCTGAAGGAGCAGACGTCGTACCCTCCCACTCACTACATCCGCCGTGTCCCCCAGAGGAAAGTGCACTATTTCACCGGGGTGCAGATGGTTCAGCTCGTGATCCTGTGCGCGTTTGGCATGTACCCTTTGCCCTATATGAAGATGGTATTTCCTCTCCTCATGATCCTGCTCGTTCCTGTCAGGACAAGTCTCCTTCCGAAATTAATTGACGCCAAATATCTGGATATCATGGACGCCCAGCACATGTAG\n>XR_545375.1 PREDICTED: Equus przewalskii uncharacterized LOC103553015 (LOC103553015), ncRNA \nCGTCTACACAAAGACTTGCACACGAATGTTCACAGCAGCACTATTTGTAATAGCCCAGAGTGGAGACCACTCAAATGTCCCTCAGCTAGTGAACGGATAAGCAGGGTGTGGCCCTTCCACACAATGGAATGTTTTTCAGCCATAAGAAGGAATGAAGTACTGACACAGGCTGCAACGTGGAGGACCCTTGAACACATTCTGCCAAGTGAAAGAAGCTGGCCACAAAGGACCACATGTTGTGTGATTCCTTATATGAAATGTCCAGAACAGGCAAATCCATAGAAATGGAAAGTAGATGAGTGGCTGCCTAGAGCTTGGGTAGGGAAAT\n>XR_002766617.1 PREDICTED: Eurytemora affinis uncharacterized LOC111708265 (LOC111708265), ncRNA 
\nCTGGTGAATTATAGCTGAAATTGTGATAAAGTTACGCATCTATTTTGTATCAAAAATAGCCGATAATTGTTTGTGAAAATTTTCAGATGTCGTCAAATATTTTTTCTGAGGTACTATGGAATGGAATTTTAGGCGATGAAGAAGAGAGGGGACCCGAAATGTCCAATATTATAAACGGTCTGTCAGTGCCAATCAAAGCTCCAACATGTATAATACAGAGCTGCAATCCAAGAGTATGAGGATCACGGTTTAGATTTCCAGCAAGAAAAAAATTGTGGCTGAAGGCCCTTCATTTAAATCAAGAGTATATCACAGTAAAAGATCCAAGAGTATGTGAAAAACATTTCAAACCCTCTGATTTTAAAAGTAATTTATAGTATAATAAATATTACGACGTTAA\n>XR_006947954.1 PREDICTED: Xenia sp. Carnegie-2017 uncharacterized LOC124444429 (LOC124444429), transcript variant X1, misc_RNA \nGCTTAATTTTAAAATCAAAGTACTTTCAGAAAAACGCTATTGGTTTTGAATTTGTAAAGATCATAATTTTACCAATTAACTTGTCTCTTAATTGCTTAGAAATTTAAATATATTCCAAATTGCGCTGCGGTAATTAATTTTGAGGCACCTCAGATCCTCCAAGGGTTTACTACATACAATTTGGGACATCTTTTCGTAGGTTGCCACCGGCGGGCAGTGACGCATTTGACTTTATCACTCAATCGTTTTAGCTGTTTGAAAAGTACTTGACTCCTTTGAGAAAAAAAGTTCACATCACGTTGGGTAAAGATAGTCATCTTGGCCGTTATGAAACAGGAAGGTGGTGGGGAACTTTGATTGTTGCTCTCGTCGTTCTGTTCACGTCAATGGCAACGATGACAAGTGTCGCAGTAAAGCAAACGCAAAATTTGTTTCGTCGACGACCTATTGTGGAAAAATTGACAAAATGGTATTCGTCGTTGTCTCGGAAACTTTTTTTAAGTTCAGTGATCGCACAACTGCTTATCATCGTCATTCTCAACGCATGCGCAGGAATAACATTCCTCCTGGCATCCAACATGTCTCTTGTGTGTGACGTCACCTCTCATCATGAAAATATTGACAGGATCTTCGATATTTCAAGTGTGTTACCAAAGTCTACAATGCTTCCCAGGACAAAATCAATACAATTATTCAAGAAACTTAGCGAATGTCCCGAGAACGGCACTCTCTGGACGATGTTGGATCTGGATGATAAAGTGGACATCAATTCTGGTATTAGTCAATTACGTAAACTTCCACATTTTGCTGAGCGTCTGTTTCTCGTCGGTGACACATTCCATGATTTCCAAGCCGATAAAAAATATGCAAGACTTTTTTTGAAATGGAAACGGTTCATGTTGGAAAGCCTCGAGATTGATTCTATGGTGAATGAGACTATAGAATCGTTCAAAACGTACCGAAAGAAGGCTGTTAAAAATGGGAATGCAATCCGGAACGTTCATATTGAAATTTTTCCCATATTGTTGAAGCGACTTCGGCAAGATTTCAAGAGATTCCAAGAATCCAGAGCTCAAATTTCCAAAAGCATTAAAGAAATAAAAGACACTTATTTTGATATTACTTCAAATACTTCAAAAAAGGTCGGTCTTCAGGCTTCCAACGGTCTCGCCGTCCAAACTATCGAATCACTGAAGTCGTTTATCAACGAGGGTGTTTTCAAGATCAGAAGTCACGTGGGAAAATGTTTGCCAATGAAAAAAGCCTATTACAACATCACGTGTCTGTTATGCCATGACATCTTCCGATCTTGGAATCGCTATTTTCTGTTGTTTTTTGCCTGCGCCTTCCTTACGACAATCTCCATCATCGTTTCCATGGTTACTGTGATCTGAATAATCGTGTTTTATCGCTGGAAAGTTCGCGTAGACTGGTAACGAATTAGGACTGAGCTCTGAAATTCGCTT
TGGAGATCGAGAACGAGACGAGGGAAAGACAGCTCCTGCTCAATTCCCGAGATGATTTG\n>MW805831.1 Corticium thailandicum isolate MG242 TYPE large subunit ribosomal RNA gene, partial sequence \nTCTAGCATATCAATAAGCGGAGGAAAAGAAACTAACAAGGATTCCCCTAGTAACTGCGAGTGAAGCGGGAAAAGCTCAAATTTAAAATCTGGCGTCCTTAGGGCGTCCGAGTTGTAGTCTGGAGAAGCGTCTTCCGCGCTGGACCATGCATAAATCTCTTGGAACAGAGTATCATAGTGGGTGAGAATCCCGTCTTTGGCATGGACTACCAGTGCTTTGTGATGCGCTCTCAAAGAGTCGCGTTGTTTGGGAATGCAGCGCAAAATGGGTGGTAAATTCCATCTAAAGCTAAATATTGGCGAGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGATGAAAAGCACTTTGGAAAGAGAGTTAAACAGTACGTGAAATTGTTGAAAGGGAAACGCTTGAAGTCAGTCGCGTCGTTCGGGACTCAGCCTTGCTTCTGCTTGGTGTATTTCCTGTACGACGGGCCAGCATCGATTTTGATCGTTGGAAAAAGTTCAGGGGAAGGTGGCACCTCCGGGTGTGTTATAGCCCCTGTTCGCATGCAACGGTTGGGATCGAGGTTCGCAGCACGCCTTTATGGCCGGGGTTCGCCCACGTACGTGCTTAGGATGCTGGCGTAATGGCTTTAAACGACCCGTCTTGAAACACGGACCAAGGAGTCTAACATGCCTGCGAGTGTTTGGGTGTAAAACCCATCCGCGTAATGAAAGTGAAAGTTGAGATCTCTGTCATGGAGAGCATCGACGCCCGGTCTTGAGCTTTGGCGACGGATCTGAGGTTGAGCATGTATGTTGGGACCCGAAAGATGGTGAACTATGCCTGAATAGGGTGAAGCCAGAGGAAACTCTGGTGGAGGCTCGTAGCGATTCTGACGTGCAAATCGATCGTCAAATTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCTGCCGA\n>XR_004926052.1 PREDICTED: Halichoerus grypus uncharacterized LOC118553476 (LOC118553476), ncRNA \nGCCCAGACAGAAGAGGCAGGCGCGTGTAACACAGAGCCTGGCCCTGGCCTGTCACGGCCTTCCTGTCTCTGCAGCTGGGCTGGGGCAGAAGCCGAAGTGAACTCGGGCCTGCAGACAGAGGCTTACCGCCAAGGTTTTCCAGAAGAGGGAAGTCCACTCTTTCAAAGACACAGCTGGAGTCAGACGGGGCAGGACAGCCCCTCTGAGGCTGACCCCTGCACAGTGTCCCTTCCTGACTCAGGAAAGGTCTACTCCTGCGCTGTCCCAACATGCCGGCCGCCAGCCACGCGGGGCTCCTGGGCACTTGAAATGCGGCTGGCGTGACCCTAGGTGTGCTACAAAGTACCAGTACACCCCAGGTTTTGAAGACTTGGTATGGAAAAAAAAAAGTAAAATATCTGTAATAATTTTCTGTATCGACTGCATGTTGAAATGACAGTACTTGGAGTAA\n>XM_028734882.1 PREDICTED: Podarcis muralis zinc finger protein 341 (ZNF341), transcript variant X4, mRNA 
\nACATTAGTCCAGGGGAATATCTTAGTGAGTGATGAGGTCTTGATGTCAGCTATGTCTGCTTTTACAACCCTGGACCAACCAATGTCCACAGTACAACCCTCTGTGCAGCCTGAATATGCATACTGGAGCTGGCTACCTTTCTCAACCACCACCTCCTCCTCCTCCTCCACCACCACCACCTCAGCCTCCTCCTCCCACACCTCAGTCTCTTGGAGCACCAGGTCAGGCCAACTCAGGCAGCAATGGAGTGGTGGAAGTGTACAGTGCATCAACCCCCATGACTGGGAATAGCACAGTAGAGATACAGAATCTGGGGATGCAACCCTACCCACCTATGGAGGTGCCCAATCAATGTGTGGAAACCCCAGTGTACCCCTCCCCTCCAGTATACAGTCCAGGGAAGCAAGGTTTTAAGTCTAAAAGCCCCAACACTGTTTCTCCCTTGAACAATGCCTGCGGAGGAAATGTGACCAGTTTTGATCCGGCTTCAGCTGCCAAGAACCGTCGTCTTAAGACAGACAGCAGCCTGCTAGAAGGGAAACCCAAGTCACCAAAACTGAAATGCACATACTGCGATAAGGCATTCACCAAGAACTTTGACCTGCAGCAGCATATCAGAAGTCACACAGGGGAGAAGCCATTCCAGTGCATCGTATGTGGTCGTGCCTTCGCCCAAAAGTCCAACGTGAAAAAGCATATGCAGACGCATAAGGTGTGGCCACCAGGAATTGGGTGTACCATCTCTCGGAGCTCTGTCACTGTGCAAGTCATGGCACTCAACCCCAACCAGCAGGAGGAGGAGAATGCAGGTTTGAACACGGTTCCCAGAAGCAGCCCCCCACCGCCACAGGTCATGCCTCCTGCAGAAGAGCATGAGGCTTGCAAACTGGAAGCTAAGCAAGTGGTCTTGATAGACAGTTCTTACCAGTGCCAGTTCTGCCCCAACAAATTCTGCACATATTTCCAGTTGAAATCGCACATGACCCAACACAAACATGAACAGGTTTACAAGTGTGTTGTGAAAAGTTGTGCTCAAACATTCCAGAAGCTGGATTCCTTCTTGGAGCACATCAAGAACCATCAGGAGGAGCTGAGCTACCGTTGCCACCTTTGCAGCAAGGACTTCCCCTCCCTCTATGAACTGGGTGTCCATCAGTATTCCCACAGCTTGCTCCCTCAACACAGTCCCAAGAAGGACATTGCCATTTACAAGTGTGTCAAGTGTGTAAATAAATATTCTACCCCAGAAGCCCTGGAGCATCACTTACAGACAGCAACACACAACTTTCCCTGTCCTCACTGTCAGAAGGTGTTCCCTTGTGAGAGGTACTTACGGCGACATCTACCTACACATGGGGGTGGAGGGAAATTCAAATGTCAGATCTGCAAAAAATTCTTCCGCCGAGAACACTACCTCAAACTACACGCTCACATTCACTCGGGTGAAAAACCTTTTAAATGCTCTGTGTGTGACTCAGCCTTCAACAGGAAAGATAAACTCAAACGGCATATGTTGATCCATGAGCCTTTCAAGAAATATAAATGCCCCTTCTCAAATCATACAGGCTGCAATAAAGAGTTCAACAGACCGGACAAATTGAAAGCTCATATTCTCTCCCATTCAGGGATGAAGATCCACAAGTGCCAATACTGCAGCAAGGCCTTCAGCCGGCGAGCTCACATGGTGGAACACCAGCGCTCTCACACTGGAAACTATAAGTACCGCTGCCCTACATGCAGCAAAGGCTTTACACGCCAGAAGTACATGAAGGACCACAAGTGTAGACTGAGTTCAGCCAAGGACAAAGAGCTGCCAGTGAGAAAATCCCAGAAGAAGTGGGGGACTCGTGGCCGGAAAGTGGGGCTTCCTGTTTCAGCTCAGTTGACCTTGACAGAACTGAAAGACAGTACAGATGGAGGAAACCCTCAGAAAGGTGGTCCCAATAAAGAACAGTTTCCAGTGTCTGACACAGTCCTGTCCATTGTGGTTGGCAGATC
AACGGCCGTGTCGGCAACAGACTCTGATCTTGGCAACCCTACCCAATGCAGTGGCATTCCATCCAACCTTGCTCTGGCCGAGTTGCAGCCTGGCTCGGAGAGTCCATGCGCCATGCTAGCAGTTCCTGTATACATTCAGGCTACTGAATAACTGAATAGTACTGTGACTTAATGGGGGAAATAATTCCTCTGCTGTTTGATGGAGATACGCTGCTGCAGGGGATTGGAAATGAATGAAATGTGTATGTGTACTGTATGTGTGAGTGTATGTTTCAGCTGCCGTGATGCAGTGATCAGCATTCATAAAGAATTTTGTTGATAAAA\n>XM_046012474.1 PREDICTED: Meles meles microfibril associated protein 5 (MFAP5), transcript variant X3, mRNA \nCAGCCCCCTTCTCATTCCCGCCTCATCACACTCCTCTAGCCTGGCTTTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCCCTCGCTCTCCCTCATCTCATTGTTTCAGAGTAGGCCGAATTTGAAGTCCTTCCCAGGGAGTGGCCCTGTTCATCTTATTCGCCAGCCAAAGTAGAAACAGTGTGAGAAGGAGAGAGGCCCATTCGGCAGCCAAAGGACTCGGTGGAAAAGAGCAGAGGAAAAATACACAATATGCTGCTCGTGGGACCCAAGGTGCTGCTGTTCCTCACCGCCCTCATCATCCCCTCTGATGATGTGACTCCAGTGACTCCAGAGACATTCACAGAAGATCCTAATCTGGTGAATGAGCCTTCTACAGATGAAACAGTTCTGGCTGATATGGAGCCTTCCACAGATGACCTGGCTTCTCCTGCTGATAAAAATACCACAACAGACTGCCGGGATGAAAAATTTGCTTGCACGAGACTCTACTCTGTGCATCGGCCAGTCAAGCAATGCATTCATCAGTTATGTTTCACAAGTTTACGACGTATGTACATCATCAACAATGAGATCTGCTCTCGTCTTGTCTGTAAAGAACACGAAGTTATGAAAGACGAACTTTGCCGTCAGATGGCTGGTTTACCCCCAAGACGACTCCGTCGCTCCCACTACTTCCGACTTCCACCCTGTGAAAATGTGAATTTGCAGAGACCCAGCGGTCTGTGATCACCAAGGAAGAGGAAAGAATAATGTGTGGGTGGGAGGAAGAGAATGCTCTAACAAGAGGGAACTCCTTCTTGTCCAACCATTGTCCACTAACCCATAGACATTAGGATTTCTTAAACCAATCCCTTTGCAGCGCCTAACTTTTGCCTCCATTCCCTGACTGATAACAAAGTCTATATTATTGCATGGTTTTGCTGTTTCTCAGTATCATAGATGTAGATTAATGATAACCATGTGGCTTATATACAAACATCCTACACACAATTTCAAAGGAAAATAAACTTTAGGTTAATATTTA\n>XM_052001689.1 PREDICTED: Antechinus flavipes supervillin (LOC127564871), transcript variant X20, mRNA 
\nCTTCCCATCCTATTCGTCTTCCCTTTTGTCATGATTTTTCCTTTTTTCTGTTTCCTTTCTATCTTCTTTATTTTTCTCTTCCTGATTTTCCCTCTCCCTTTTTGTGTTTTTTCTTTCCTTATCTCTTCTCTTACCTTTATTCATCTTCTGAAACCAAAATCAAGATCTCTACTCATGAATATCTATTTCAACAAGAAAAGATCAGACCTTTTCCAGCTACCACATCAAAGAAGAATATCAAGCTTTCAGAGAGAATTTTCACTTGAAGAAAAGGAACAACTTGTCAACAATAGAAAGGATATCGATGCTAATCTTTTAACTGTACTTCCCAAAGTTGCAGAACTAAGAAAACTCTTTGAGCCAAAGAGAAAAGAAGTTTTAGAAATGAAGAGAAAAGAACGGATTGCCAGACGCTTGGAAGGCATTGAAAATGATTCGCAGCCCATACTCTTGCAGAGCTGTACAGGATTAGTTACCCACCGATTACTAGAAGAAGATACTCCCCGATATACGCGAGCTACAGACCCTTATAGCCCCCATATTGGTCGATCCAATGAAGAGGAGGAAACTTCAGATTCTTCTGTAGAGAAGCAACCTCGATCCCGATATTGCATAGAAACTACCACCCTCAATACAGAGTCATCCTACAGCCCAGTGACGATGGACACCCAGGGACTGGACTCCAAAGCTGAGAGAATAGCCAGATATAAGGCTGAAAGAAGGAGACAGCTTGCTGAAAAATATGGGCTGACTCTGGATTCCGATGCAGACTCTGAATATATGTCGCGTTATACTAAGACCAGGAAGGATCATGATGTCGAGAGGAGGGGAGGTAAAAGTGAGAAGCAGGAGGAGGAGAGCAAAGACTTGACTTATCATTATTCTAGGACTGAGACTGTGGAGCCCAGGAGCACCACAGCTGAATCCAAGGACTATAGCTTTCATGGGAGTGATGGTGTTATTGATAAGGAGGCGCTGTTGAATGTGGAAAACCACAGAAGAGCCCAAGAATTGAGTGCAATTGGCCAGATCCGTGACTTGCCACCTGCAGCTGATGGTTCCCCCTCCTTTTCCTTTTCTGGACGAGAATCCTCATTCAGTGACGTGCCAAGGTCTCCCAAGCAGACCCGCAGAGTATCCCTTTCTTCACCTAAGCAGCCAGCATCACCAAGTCATTCACTTACTGACTCATCATTACACGGTGATTCCAGAACGAGATCCACTTCAAATTCAGAAATGCCAACTGCTGAGGATGAAGAAAAATTGGATGAACGCGCCAAGCTGAGTGTTGCTGCCAAAAGGCTCCTTTTCAGGGAAATGGAAAAATCATTTGATGAAAAAAATATTCCAAAGCCACGTTCCAGAAATGCAGCCGTGGAGCGACGCCTTCGCCGTTTGCAGGACAGATCTCACACACAGCCCATCACCACTGAGGAAGTGGTCATTGCAGCAACTTTGCAGGCATCGGCACACCAAAAGGCACTAGCTAGAGAACAGGCAAATGAGGCCAAAGATTCTGCTGAACAAGGTGAACCTGATTCCTCCACTCTGAGCTTAGCAGAGAAGCTGGCCTTGTTTAACAAATTGTCCCAGCCAGTCTCAAAAGCGATTTCTACCCGAAACAGAGTGGATGCTAGGCAGAGGAGGATGAATTCTCGTTACCAAACTCAACCAGTCACCCTTGGAGAAGTGGAACAGGTTCAGAGTGGAAAACTCACTCCTTTCTCTCTTACTATTAACACATCTGTGTCTACTGTGGCATCGACAGTTGCTCCAATGTATGCAGGGGATCTACGGACAAAGCCATCGGTGGAAGAAAATGCAGGTGCTGCCGACTTTGGATTCCATTCACCAATGGAAAATGCAGACTGTTCAGTGAAGAGCATCCTAAAGCCACAAGGGTGGCAACCTTTGGGGGAAGATATCAGAAGCAAGCGAGGATCGAGGGAATTTGGGGAGATGGAAACTGAGAGAATCTTAGCTCAAGAGGAGAGGGAA
GTGAGAAAGAACAGGTCCTTTGAGGAAGAAGGGAGTTCCTCCCTTTTCCTAAATAAAACTGGGGAAAGGGACAACCAAAGAAAATATACTCCAAGAAAAGGCAGCATGGAACATGCTGACCTCCTAGTGCCATGTCATGAAGAAATACGGGAGTTTTCAGTCACCAAAAGCACTGGACAGAGCAAACAGGACCTGAAGGAAGTGCAAACCTTGGAGGAAAAGATGGATTTGGAGAATGTTGCAAAAAGCAGGTTCATGCTACGAGAGCCTGCTGAGCCCACGTCCGAACTTCCTGGCACGATAGCTACAAAAACTGTTTCTCAGACCACATCCCTGGTCTCCAGTAGACGAGAGTCTTCAGAGCAGTCGGAGGAAAGACTTTCCAAGAATCCATGTAGGATGTTTGCTGGTGGAGAGAGCAAAATATCAGAGGATGCCCTTGATGCATCTAGCAAAACCATGTCCATCAAAGAAAGGTTGGCACTATTGAAAAAGAGTGGAGAAGAAGACTGGAAAACCCGGATTAGCAAAAAGCAAGACTACAGCAAAGTGTGCGTCACTGAACGAAGCACGAGGCTGCAAGAGGCTGAGCAGTCCTTCAAGAAGAAGGAAGAAGGAGGATTTACAGATGATAATGCCATTTCTAATCTGCTTTGGGAACCTGTATACGCTTCTACTTATTTTCCTGCTATGCCTGCTGTCCATAAATACCAGTCTTTTGTACCCATTAATCAGCAGAGGATGGCAGAAAGTCATGAAAGCCAAATGACAATTGAAGAGAGGAAACATCTTATTACTGTAAGAGAAGAAGCCTGGAAGACCAGAGGAAAAGGAGCAGCCAATGATTCCACCCAATTTACCGTTGCTGGCAGGATGGTAAAGAAAGGTTTAGCATCACCTACTGCCATAACTCCAGTAAGCTCCCCCTTTAGCAATCGAATGAAGGGCACTACACCGATCTCCAAACCCCTTGAAGATATAGAAGCCAAACCCGATATGCAGTTAGAGTCGGATCTGAAGCTAGATAGGTTAGAATCATTTCTGGGGAGACTGAATAACAAAGTCGGTGGTATGCAAGAAACCATTCTCACTGTTACTGGAAAAACTGTGAAAGAGGTGATGAAACTGGATGACTATGAGACCTTTTCCAAATTTTACCGCAGCGTGGATTCTGTGCCTCTAGGAAGAGTAGAGTTGGATGAGGATTTTGATGCAATTTTTGATCCTTATGCTCCCAAGCTGACATCTTCTGTGGCAGAGCACAAACGTGCTGTTAGACCTATGCGCAGGGTTCAATCTTCAAGAAATCCCTTGAAAATGCTGGCAGCAAGAGAAGATATTCTTCAAGAATATACTGAACAGAGATTAAATGTTGCTTTCATGGAGTCAAAACGGATGAAAGTTGAAAAAATGTCTGCCAACTCAAATTTCTCAGAAGTCGCCCTCGCCGGTTTAGCTAGTAAAGAAAATTTCAGCAGCGTCAATCTACGGAGTGTCAACCTAACAGAACAAAACTCCAACAATAGTGCTGTGCCCTACAAGAAACTTATGTTGCTACAAATTAAAGGAAGAAGAAATGTGCAGACAAGATTAGTGGAGCCACGAGCTTCATCGTTGAATGGCGGCGATTGCTTTCTCCTGTTAACTCCCCATTACTGCTTCTTGTGGGTAGGAGAATTTGCAAATGTCATCGAGAAAGCTAAGGCATCAGAGCTTGCAACTCTAATTCAGACGAGGAGAGAACTCGGCTGTAGAGCTACTTATATTCAGACCATAGAAGAAGGAATAAATACGCATACCCATGCAGCAAAAGACTTCTGGAAACTCCTGGGTGGCCAGACAAGTTACCAGTCTGCCGGAAATCCAGAAGAAGATGAATTGTATGAAACTGCCATCACAGAAACTAATTGTGTTTATCGCTTAGTGGAAGATAAACTTGTTCCTGATGACTACTACTGGGGCAAAATACCAAAATGTTCTCTTCTGCAGCCAAAAGAGGT
CTTAGTGTTTGATTTTGGCAGTGAAGTTTATGTATGGCATGGAAAGGAAGTCACATTAGCACAGAGAAAAATAGCATTCCAATTGGCAAAACACTTGTGGAATGGAACCTTCGACTATGCCAATTGTGACATAAATCCTTTAGATCCTGGAGAGTGCAATCCTCGTATACCCAGAAAAGGACAGGGGCGACCTGATTGGGCAATATTTGGGAGACTTACTGAGCACAATGAGACTATTCTCTTCAAAGAAAAATTTCTTGATTGGACTGAAATGAAGAAGCCTTGTGAAAAGAACTCAAGTGAACTCACCCCACAGAAGGAAGAGCCAAGGTCTGAGGTTAAGGCTTACGATATCATGCTGATGGTCCCCGTGCCCCAAGTGACCGTCGGCACCATCTTGGATGGAGTCAACGTCGGCCGTGGCTACGGGTTTATCGAAGGAGATGACAGGAGGCAGTTCGAGATTGCCAGTGTTTCTGTGGACGTCTGGCACATCTTGGAATTTGACTACAGTAGGCTCCCCAAACAGAGCATCGGGCAGTTCCACGAGGGAGATACGTATGTGGTGAAATGGAAGTACATGGTGAGCACTGCAGTTGGGAGTCGGCAGAAAGGCGAGCACCCGGTCAGGACGGCCGGCAAGGAGAAGTGCGTCTACTTTTTCTGGCAGGGCAGACATTCGACCGTGAGTGAGAAAGGCACGTCGGCGCTGATGACTGTGGAATTAGACGAGGAGAGGGGGGCCCAGGTTCAAGTGCTTCAGGGAAAGGAGCCACCATGTTTTCTGCAGTGCTTTCAAGGAGGAATGGTTGTACACGCAGGGAAGCGAGAAGAAGAAGAAGAAAATGCACAAAATGACTGGAGATTGTACTGTGTCCGAGGAGAAGTTCCCATTGAAGGAAATTTGCTTGAAGTTGCCTGTCACTGTAGCAGCCTGAGATCCAGGACTTCCATGATTGTTCTTAGTGTCAATAAAGCACTCATGTACCTTTGGCATGGGTGCAAAGCACAGGCCCATACAAAGGATGTTGGGAGAACTGCTGCAAATAAAATCAAAGAACAATGTCCCTTGGAAGCAGGATTGCACAGTAGCAGCAAAGTGACGATCCATGAGTGTGATGAAGGGTCAGAGCCACTGGGATTCTGGGATGCGTTAGGAAGGAAAGATCGGAAGGCCTACGACTGCATGCTACAAGATCCTGGGAAGTTTAATTTCACGCCCCGCCTGTTCATCCTCAGTAGTTCATCTGGAGATTTCTCAGCCACGGAATTCATGTATCCTGCCCGTGATCCTTCTGTGGTCAATTCCATGCCCTTCTTACAGGAAGACCTGTACAGTGCCCCTCAGCCAGCACTTTTCCTCGTCGACAACCACCATGAAGTGTATCTCTGGCAAGGGTGGTGGCCAATTGAGAACAAGATAACGGGGTCTGCCAGGATTCGCTGGGCCAACGACCGAAAGTGTGCCATGGAGACGGTGCTTCGGTACTGCAAAGGAAAAAATGTTAAGAAACCCCCCAAGTCCTACCTTCTTCATGCTGGGTTAGAACCTCTGACCTTCACCAATATGTTTCCAAGTTGGGAACATAGAGAAGACATTGCTGAAATCACAGAAATGGATGCAGAAGTTTCTAATCAAATAATTCTTGTGGAAGACGTGTTAGCCAAGCTTTGTAAAACCGTTTATCCGTTGGCTGATCTCTTAGCCAGGCCCCTCCCTGAAGGAGTGGATCCTCTGAAGCTTGAAATCTACCTTACTGATGAAGACTTTGAAATTGCACTAGAGATGACCAGAGAAGAATATAGCATGCTGCCATCTTGGAAACAGGTGAACCTGAAGAAAGCGAAAGGGCTCTTCTAAGCATCGATGCTGCCAGTGGAAGATGAGGCTGGAGAAATCTCTGTGGTCACTTTCAATACCGTTGGGCCAGGAAGATTGACATCTATGTGTCCTGGTCTTCAAATTGTTTAAAAGTCAAAGTAGAAATGATTTGAAGTTA
TTAGATACTGCCTGAGCTGGAGTTGTGTAATTTTGTAAATGTGTAAGAGAACTCTCTGAAAACTTTCTCCTCCCCGACTCAGAGGGTATTTCCTGTTTGTAAACTTGGCTCTCCCGTGCACTTAAAGCAGTAGCACCTCACAGCTGCTGCTCAGCCCTCCTGGCTCCATCCAGCCTTCGCCTATTCATTTTTGAAGATGCTCTCTTTGTAAAGTGTTATTTTGTTAGCTTGTGGATTATTAAAAAAAATTATATTTATATAAACACCATATAGTTCAAGTATGTATTTAACAAAACAAAATATGTATTCACTTAAAAAAAAATTTTTTTTTGGTGTCAAAACAATACCGAGAAGTAGATGGAGTTGCTTCTACTGAATTATCTATTCCACAGTCTATGTATCTTATACACGTTCTGAAACGTTTCCTTTGGCAGTGGGCAAGGGGCTATTCTAAGGAGTACCACCGGTGCTTAAAGGAACAAAACTTTTATACTTAGGGCTGGAGACTCTGGAGAAACTCTGTGACCTTCATACCTTAATATCCAAAAACAAACAAAAACATGTATAGTGCCTTGTTTTGTGTACAGTTTATATACAAAAAAGTTTGGGTCTGCGTTTTTGAAGATGGTTTGGAACAGTATCAACAATTTTACTTTACAATGATCGAGGTTTAAAAAAAAAAAAAAACATCTCAGTTTATAATACTTGTAAACACATCTTTTTGTGATATAAGATTCCAAAGTACGAGCTTCAGAATAAAACTTTGGCAATGA\n>XR_003381398.1 PREDICTED: Zonotrichia albicollis uncharacterized LOC113459830 (LOC113459830), ncRNA \nTACTATGATGATGAAGATGCTCTAAAAATATACAGAATCTAATCTAGTTTAGATTTGACTGAAATAAACATGGACAAGGATATGTTGGGAGATGATCCTTTTACTTGGAACTTTCACCTTAGTGTGGGACTGTGCAGATTGATCTGGAGGATTTCTATTTTGGATGCCATTAAGCCATCTTGTATCTTCTAGCAGGAAGTCAGAGTAGCATCTCGACTGCATCTTCAAACAAGACTTTTGCAAGCTGATGCTCACAAGGGGCTCTGTTTAGAGGTTTGTTCCTGTGGGGAGGCAGGCAGCTCCTCCTGGTTGCTTCTGAAAGCTTCTCTTCATTGCACTTTCCATCTGCACTGGCTTCTGTTTTAGCCACTAAGGTCAAGTCGGTGTGGTTTTCCCACTCTGCCTGTTGCATTAGTGGCACTCTGGAAGTGAGACTTGCACTGGATGGGAAGTGTTTGGTGAATTTTTAAATACCATTATTGATTTCACATTAATTTTCTTTATGAACCGGGCAAAGCTCTTATGCGAGGGTATAACAGCCAAGAAATATTTGACAAGTTGTTTAAAATCTATTGCCTGGAAGAAGCCTGATAGATCAATTAATTTATTTCCCTGCTATTTCAATATATCCTTTAAACATATTTTCACTGATTGTTATTACCCATCCTGAAGTATACAGCACAAAAGCAATCATATATTACCTGCAGCAGAGGGGGCTGCCTCCTGGATCTCTGTCCACAAGAGATATAGATATTTTGCCCAAAGTTGGTTTTTTCCTTGCCTTCAATGAAACATGATTAGAACATAATGATTTTGCCTCTGCATCAGTCCACACCAACTCTATGGTGTTTTAGGGCATCAAACCTGTAAAAAGGGCAGATTCTTTTACATATGCAAACTCCTCTACCTGTTACATCAGTTTATTTCACATTCCACCAGTGTTCCTTTGGATACAGATTATTGATTGCTCCCTAGTGAATACCTTTTTAGTCATTCTTTGGCCTCAGAAAATTACCTTTGAATGTTTTATGCAAGAGTATTCATTATGAACAATTAATGTACTGAAAATGTCAGCACCTCAAGCAGGCATTTTATAAAAGATGAGTAAATTTATGGTAATGC
ATCATTCAAACTTCCTGCACTTTTCATTCTTTTAAAATTTATGTCTTACATTGCAGTTCAATAGCCTGTAACAATTTGATGACCTGAGTGGAATAATGTCAAAAATGTCTGTGTATTTTAGAAAAAATTTAGAAATTAAGATTTTTATTTTTGCTATTACTGTTTTTAGGTATGTCACAGCTTTATAGTAACGCGAAGTATTTGCTTTATGACAGCTCTTCACATGCTTTTTAATCAGAAGTGAAAAAAACTTGGTTCAGAGCAAGCTTCAGTCTACATAGATCCATTCATAGAAAGTGAGGAAAGTCTTTTGTATCAAGTGGAGGGTGAAAAGACTACTTGTACCCATTTATATTGATATTTGTTAAGTTTTATAATATAGAACACCCTGAATTTAAACCTCTTAAACTTTTCCCTTTGACATGTGGAAGGATCTCAGATTGTTTTGCTTAATTTAGTAAGCTTTAAGCCTCGAAAATGATGCGTGTTTCACATCGCTGTCCAAACGCTCTAAAAAAGTATTTTTAAGGCACTGCCAGCTAATTACCCAA\n>XM_020665074.1 PREDICTED: Amborella trichopoda ABC transporter G family member 11 (LOC18430567), mRNA \nTAATCTGTCTCGATCTCTTCAAGAATTGGGTTGATCTCTCTCTCTGTGTCTCAATCTCAATGGCCTCACTCCATTCTGTCCCAAAATGGATGCCGAGCTCGAGCCCAACACAATCCACAAACCCTCTCCTCAGCCACCCTCCCTTCCAACAAGAATCCGAAGACCACATCTCTCTTGATGAAATTACTCCGAAACCATTGCAAAGAAACCCGAGCCTAAAAATCTCTGACATTGATGAAAATGCATCGGGCACCAGCAAGCGCTTCTTCCACCTCCATGCACCAGCTCTCCAACCAGGCAATATTCGCTCCGAGCCCACTTCTGGGAGGAGTGTCGAAATGGGCAGGACCCAGCACAAGTCGGTTCAAGTGGATATGGATCCACTTGGCTCGGCTGGTTCCGGTGTGTCACTAACGTGGACCAACCTATGTGTCATGGCTGATGGGAAAGAGGGTGGAAGCACAATTTTAAGGGGGCTCAATGGGTGCGCCCAACCAGGCGAATTTTTGGCTATCATGGGTCCATCAGGCTGTGGAAAGTCGACCCTTCTCAATGCACTTGCTGGGAGGTTAAATTCTAATGTAGTGCAANNTATCAACGGTCGTAAACAAGCCCTGGCATATGGAACCTCGGCTTATGCGACCCAGGATGATACACTCATGAGCACTCTAACAGTATGGGAAGCGGTGTACTACTCAGCCCAGCTCCGATTGCCAAGCTCCATGTCGAGCTCTCAAAAGATAGAGGGGGCTGAGATAACCATTCAAGAGATGGGTTTACAAGATGCAATACACACAAGGATTGGGGCCTGGGGGGTTAAGGGACTCAGCGGTGGCCAAAAGAGAAGAGTGAGCATTTGCATTGAGATCCTCACGAGACCTAGCCTTCTCTTTCTTGATGAGCCCACTAGTGGGCTCGACAGTGCTGCGTCTTACCATGTCATGACTCGAATTGCCCGTTTGGCCCTGCATGATGATCGAACTGTGGTTGCTTCGATACACCAGCCTAGTGCTGAGGTCTTCGGCCTCTTCAACACACTATGCCTCCTCTCCGGTGGGAAGACACTGCATTTTGGCCGGGCTTCCGAAGCCAATGCCGTTTTTACACTCAATGGCTTCCCTTGCCCTTCATTGAGAAACCCCTCGGATCATTTCCTCCACACCATTAACACCGATTTTGACAAGGATATTGAGCAAGGTTCCGATGCCGAGGCAACAGAAGCTGCTAAGGCGATTGATATCTTAGTCAACTCTTACAATTCCACCATTGCAAACCAAGTCTTTGCTCATGTAGCTGATATCTCCAAGAGGGAGGGAGAAGCATTGACAAAGAAAGGGAGCCA
AGCAAGCTTCTTTACACAAGCGTCCGCCTTAACAAGAAGATCTTTTGTGAATATGTATAGGGATTTCGGTTACTACCGGTTGCGCCTAGCAATCTACATTGCGTTGTGCCTGTGCATAGGTACCATCTTCTTTGACATTTGCCACAGCTTTGGCTCTATTCAGGCAAGAGGGTCCATGCTCATGTTTGTTGCAGCATTCTTGACGTTCATGGCGATTGGAGGCTTCCCCTCCTTTGTGGAGGACATGAAGGTCCCTTTTAATTACTATATTTTCATATAG\n>XM_457077.1 Debaryomyces hansenii CBS767 DEHA2B02508p (DEHA2B02508g), partial mRNA \nATGTACGATTCGTTCGCTAGTTATCCGCATAATTACTATACTAAAAGTGATGATGAGACAGAAATTCCTCCAACTACTTTTCCTGGTGAAAATTTGTTGACCAAGGACCATTTGCTAGAACAATTGCAGCCAATATTAATCATCAGTGATCCATCCGAATGTAACAATAACTTAAGTCTTTTTATGAAGTTAATCGTTGAGAATATATATGACCAAAATGAAGAAACTACACATAATTATCAAAAATTATCATCTTATGCACTTAAATTGTTGACCCTGAATTTATTTATCAAGAACTACGAATTGTGCCTCGGTAAAATATTAGGATTATTGGCAGCTTTAAGTCGGGACACATTGTGCTCAAGTGAAGGTATCGATGAAGATGTGAAGTTTGAAATCGAGTCATTACGGGAGTTCATTTGCATTATTTTACTTTTACTTTTGAAGTTGACTAATAGCCCAGGAGAGAAGAGCGAAAGATCAAAAATATTGGAAACAGTCGATAGAAATGAGTTGTACGAGATCTTGTCCGACCTTGGAATTATACCTATCATCGCTAATGTTATAACAAATCATATTGTGACCACCGATAAATCTAAATCCCCGTTCTTGTTATTGAAATTTGGTGGGGATATTATATTTGAATATCTCTACAATTGTGAATTATTGTCTGATGTCGAGTTTAATAGTTTGACTAGCGAGACCAACTTAATCCCTACCATTATTAAGCATTTACTAACAAACGACGATTTTGATAATTATGATACTGATGCTGACGATTGGGAGGGTGAAAATAAACTATTTATATATGAGGAGTTTAAGTTATTGTTACTCATCAATGAACAATATTTGATGAAATCATATTCGTCCAAAGAATCAAAAAATAAAGTTTTTGATGGCTTAATGATGGGAGATGCTCATCTATCCTCAGAAAATTCACAACCAAGTAATAAACAGATTAATGGGTTTATCAACTTGTTGATTTATTACATTAATCGTGAGGAGTCTCAAATTATTAAAATCCTTATCTTAAAATTCTTATACCTTATATTTACAACTTCCTACACTGCAAAATTGTTTTATTTGAACGACCTAAAGATTTTGTTGGATATAATCATTCGTGAATTGAACAATCTAGACTATAGTGGGAATGCGAATGGAATATTGATTGTCACATATTTAAAAGTTTTGTATCCTTTGTTGATGTTCTCTCAATTAAGTGAATTGCCCGAAGGTTATAAGAATGAAGGTATATTAGAAATTTTGAGAAACTTGGTTCTTAATTCTGAGTCAGGTAATCGTAAGACAACTGAAATTTCTGAAGCAACCGACGAAAACCAAGCAGATATTATTGCAAAGCTATCATTACGGTGTATGTCTATACCTTGGTTGAGGAAGCCACAATTGAGTAAGAGAAAAAACCAAGACAACCCTAACTTGATAAATAACGTTTATGGAAAGTTATCTGCTGCTTCCTCTTCATCATCCTTGAATTCGAAACTGAGCTTTGTGGGAAAACGTTCTGAATTGTACGAGAGTTCTGATATTTCAAGTGAATCGCTTGGTAAGGCCTTCACCCGAATTGCATCCGTCAGAACTTCAGTAAGAAGCGACTATCATAAGCATGCACTA
GTGCATAACGAAAACGACCAAGTGGGCCCAAACGGTCTGAAGAGCTCTTATGTCGAAAATAACCATAATATTTTCTTAGATAATGATTTTAAGTCATTATCAATTAATACCACGGAAGATTTTGCTAATTCTCCTTGGATTCCAATATCAGATGAGTCGAATTTGCTAGATTTACCAAAAGAATATTTAAAAGATGAGCCAGTACAGCCCTTAAAAAGACCAGAGTCTGCATCATCCTCAATTAAGTCAGATTCGAGTCTAGCACAAAAGGCATCAAAGAAGAAGGCACCGCCACCACCTCTTCCACCGAAAAGTTTCCTGCCGAAACCTAATCATATACATTTCGAAAAGAGATCTCAATCACAAACACCACCACCACCACCACCTCCTCCTCCTCCAAGACGCAGGCGTTTGTTACATCTATGTGAGCATTAA\n>XM_042466471.1 PREDICTED: Sceloporus undulatus RNA binding motif protein 46 (RBM46), transcript variant X1, mRNA \nGGCGCGGGAGAGGCTCAGAGGCGCTGGCCTCTGCGTGGGGCAGTTGTTGTTTGTTTCTCCACGTGGGAGGAAGGAAGAGGGGAGGCATTGCTGCTGCTTCTTCTTCCCTCAAGGCGATATTTTCCCTGTCAGGTTTGTTGGATGTGGATGACTGACCAAGTCGGAATCTAATTGTGCACATTGTGGATTTGAAAACTGTTCAGATTTTATTTCTGAAGGCTACAGAACAGAGTAAATAAATTACAAAAAGTAGAACTCTGTAAGTTTCCATCATAGTTATTTCTTAACGTTTTCTGAAGACGGTAAAGCAATGAATGAAGAACAGACAGATGTTACAAATGGCTGCAGCAAAGTTAGAACGGGTACTCAGAACGAAGCTGCGTTATTGGCTCTTATGGAAAAGACTGGTTACAATATGGTTCAAGAAAACGGTCAAAGAAAATTTGGTGGACCTCCACCAGGTTGGGAAGGTCCACCACCACCACGAGGCTGTGAAGTTTTTGTGGGAAAAATTCCCCGTGATATGTATGAAGATGAACTAGTTCCTGTTTTTGAAAGAGCTGGGAAGATCTATGAATTCAGGCTGATGATGGAATTTAGTGGCGAGAATCGTGGATATGCATTTGTAATGTATACAACCAAAGAAGAAGCTCAGCTCGCTATTCGGATCCTTAATAATTATGAGATTCGTCCTGGGAAGTTTATTGGAGTTTGTGTAAGTTTGGACAACTGCAGACTATTTATTGGAGCTATTCCAAAAGAAAAGAAAAAAGAAGAGATCTTAGATGAAATGAAAAAAGTCACCGAAGGTGTAGTGGATGTTATTGTGTATCCAAGTGCAACCGATAAGACAAAGAATCGTGGGTTTGCTTTTGTTGAATATGAATCCCACAGAGCTGCAGCTATGGCAAGAAGGAAACTCATTCCTGGAACATTCCAGTTATGGGGCCATACTATTCAGGTAGATTGGGCAGACCCAGAAAAAGAAGTGGACGAAGAAACAATGCAGAGGGTTAAAGTATTATATGTTCGAAACCTGATGATCTCAACTACAGAAGAAACAATTAAGGCTGAATTTAACAAATTTAAGCCAGGAGCTGTTGAGCGTGTGAAAAAACTTCGAGATTATGCTTTTGTTCACTTCTTCAATCGAGATGATGCAGTTGCAGCTATGTCAGTTATGAATGGGAAGTGCATTGATGGAGCTAGTATTGAGGTAACACTAGCCAAGCCAGTAAACAAAGAAAGCACTTGGAGACAGCATCTTAATGGTCAAATTAGTCCCAGTTCTGAAAATCTTCTTGTCTTTGCAAACAAAGAAGATGGTCATCAGAAGTCTCTAGCAAAGCCAGCAAATCTTCCAATTCGCCTTAATGGACAGCATAGTCCTAGTCCTCCTGAAATTGAAAGGTGTTCTTACCCATTTTTCCCAGGAACAAAGCTTACT
CCAATTAGTATATTCTCATTAAAATCTAGTCATTTTAGTTCTGCAACAATGCAGCTAGATTATTATTGCAATAAAAATAACTGGGCACCTCCAGAATATTACTTGTATTCAACAACAAGTCAAGATGGAAAGGTACTACTAGTATATAAGATTGTTATTCCTACTGTTGCCAATGGATCCCAGAGTTATTTTATGCCAGACAAACTTTGCACTACAGTAGAAGATGCAAAAGAGCTGGCTGCACAGTTTGCTTTGCTGCACTTGGATTACAATTTCCGCCGAAGTTCAATAAATAACATTTCCCCAGTTAGTGCTACTCTTTCTTCTGGAACCACCAGTGTGCTGTCATATACATCAAGACCATACTCTTATCCAAGCTATCCTTTGTCACCATCAATTCCACTTGCTAGTAACAACCATGTTGGGCAGCGTCTGTATATCTCCAATCAGGGCTCATTCTTTTAAGGAAAAGAAAAACATGGATGAAAATAGTATACTCTTATTTTAATATTATGTAGTTTCAGTTTTAATTGTGTCCATGCAATTGGTTTTGATGAGTTCAGTATATCTATATATTTCAAATTACATATAAATTAACTGAATTTGGGTGAAGATAAAAGTTCCAAATGTGTTCTATCTTGGCAAGAAGAAATGCTTCCTAAAATATGGCACAGAATTTTATGATTGTCAAACAAGACAAGAAAACCCATTTAACATTTTTAAAGTAATTACTTTCCTGAATAGTAGCTTTAAAATATTTAAAGTGCATGCAATTGTTGGTTCTAATCTTGTTACCAAGGATCACCTCTGTTTTTTGGAGATGAAAAACAAAATAGTCAAAATGCATGTAATCAAAAAGCAAAGTATTATGTAAGAAAGAAATGATGCTGATGAAAGATTTTTTTAAAGAATACAAACTTTATTTAACTCCAGATTAATAACCTCTATACTACTGTGGTCCTTATAAATCACTTTGCATATTTTAGTTGCATGACAAATATTTGTTTTATGATTAGAATATATTATTTTGTGTTACTTTATCCATGTTAACACTGTTAATCTCTATTTGTTAAAGGTACTGTTCTGTTTACGTGTTGTCATGTTT\n>XM_019277554.2 PREDICTED: Larimichthys crocea E3 SUMO-protein ligase RanBP2 (LOC104918663), transcript variant X1, mRNA 
\nTTGACGGTATTGAGACTGCGCAATAGCATCATGGGGAGCTAACGTCAGTCGAGGCTCACATTAATGTCGGTTTGTTTTATAGTTTGTTAAATCCTCCCGCTGTTCGGTTGTGCCCGGAATAATCAGCCGTTTTTAGGGAGCCATGAGGCGGAGTAAGGTTGAAGTGGACCGGTACGTCTCCTCCGTGCAGAGCTCCTCTCCTTCACTCAAAGAGAAGCCAGTCAAAGGGTTTTTATTCGCTAAATTATACTTTGAAGCAAAGGAGTATGAACTTGCAAAAAGACACGTGTCGGAGTATCTGAAAGTCCAGGAGAGAGATCCCAAAGCACACAAATTCCTTGGACAGCTCTACGAGAGAGAGGGAGACCTCAACAAGGCGATAGGATGTTACAAGCGTTCGGTGGATTTGAACCCAGCCCAGAGGGACCTGGTACTGAAGGTGGCTGAGTTACTGGTCAGTAAGGAGGAATGTGACAGCAGAGCAGAGTTTTGGGTGGAGAAAGCTGCCAAGCTCCTGCCAGGAAACCCTGCAATCTTCAACCTGAAGGAGCGTTTGTTGAGTCGTCAGGGTCAGCAGGGTTGGAACCGGTTGTTCGACCTCCTCCAGGCCGAGCTGGCAGCGAGGCCAGCTGACGCTCATGTGAATTTGAAGTTGGTTCAGCTGTTCTGTCAGGACGGGCGGCTAGAGGAAGCCGTTAAGCACTGCCTGGCTGCTGAGAAAAGGGGTGTGCTGAACCACAGTCTGGACTGGTACACCATCGTGCTGCGCACACTGCAGGAGTATCTTGCTCAGCCCAGCGTCTCTAGTAATGAGAAGATGTGTCGACGTCTCCAGAGGGAGCTCCTGTTGGCCCACTGCAGCCTGCTGAGAATCACACTGTCTCAGAGCAGCGTGCAGCCCAGCCTCGATGCCCTCAGAGGTTTTGATGAAGCTATGCAGACGCTGAGCAGCGTTGCTGCTCGCCACATGGACGATCTTTGGGAGGTGTTTGTGGAGATGAGAGGTCACCTCTACATGCATGCTGCCACACTGCTGTTGAAGCTGGCTCAGGATCGCCAACAGACCTGGAGGGCTGTCATTGACCTGGCTGCACTATGCTACCTGTTGGCTTACCAGGTTCCCAGACCAAAGCCTAAAGTGACCAAAAGAGACCAGTCAGCCCCACAGCCACTGGAGCTGCTGGCCAACAGCCGACAGAGTCAGGCCGGCCACATGTTGCTAAACCTGAGCACGGATTCATCCACCTTGATCAGAGAGGTGGTGGAGGCGTTTGGGAACCGTAGTGGTCAGGACTCTCTGTTTGAACTCCTGTTCGGACCACAGGCCTCTGCTGCATCGTCCTTTATTGCAAATGATGACATTCATTCTGTTAACACCACGGCTCCAGAGCTCTCTCAACTGGCCAAATGGGACGCAGGCTCCATCTTGCTGCATGGTGGTAACTTGCAACATCTGAGCTGGCTGGGGCTTCAGTGGACCCTTCTGGCCCAAAGACCGGCCCTGCGAGACTGGCTACAGCAGCTCTTCCCTAGACTTACTCTGGAAACCTCCAAACTGGACACAAACACACCGGAGTCAATCTGCCTGCTGGACCTGGAGGTGTTTTTATACGGCGTGGTGTTCTGCAGCCACTGTCAGCTCCAGGAGACAGCGAAGCTCAGCAGCGGAGTGAACCAGCAGCAACAACAGCAGCTGTATGAACCACGCTGCCTCCCTCTTCCCCTCATTCGCCTCTTGACCACCGACAGACAGAGGGAGTGGTGGGACGCCGTCTACAGCCTCATTCACAAACAAGCAGCTCCTGGTACTTCAGCCAAACTTCGGATGATTGTGCAGCACGGACTGAGCACGCTCAGGGCTGGAGAGAAGAATGGGCTCCAACCAGCACTGGCCATCCACTGGGCTCAGTGTCTCAGCCAGACGGGTGATGGAGTGAACTCGTACTACGACCAGAAGGAATACATCAGCCGCAGTGTCCACTACTGGAAAGTTGTACG
TCCTCTGTTGGACAAGATCAAAAACAGACGCAGTATACCAGAACCACTTGAGCCCCTCTTCATGCACTTTCAATCCAAGGATATTCAGATTTCTTCTGTTAGGGGATACGAAGACGAAGCAAACATAGCGTATGCGGCTCTCCTTGACATTGAGGGCAAGACAGAGGAGGCTATCGCTACGTTGGAAACCATCAATAACATGTCATCCATCTGGCATTTGGCACAGATCTACCAGCGGCTATCAGAGGAGGCCAGCAACGGGGTTGAGGAGACCCAAGATAGATGCATAACATTTCTGAGAAAATTCAGGACGTATTTGTCAAAGATCTATAATGCTAATGCAGATGACATCGAGAAGCTGCCTGTTTCTATGGAGGACATTGTGGACCTTCTGAATGATGTGAACCAGCAGCTGGGAGAGAGTGGTGAGGCCATGGATGAAGAAGAAGAGAAGGAGGAACCGGGCCGAAGAGGACCAGCCCACTCCAGCCCTGCTCATCCCACAGAAACCTCTGCCACCATATCCCACATCAAGTTTTCCACTCCCTCCCCGAACAAAAGCCTCATCTCTCCCTCCAAAAGACACCTGATTTCTCCCAAGACACCACCTCACTGGGTCGAGGACCAGAAAAGTCTTCTCCAGATGCTGTGTCAGCAAGTTGAAGCCCTCAAGAATGAGGTCCATGATCTGAGACACAACTCTTCAGGGAACGCAGGTTCCCCTCATCACAAAATGTATGGAGAGAGCTATGGAGCCGAGGGTCTACAGGAGCCTTTTACCCCAGTTCAGTCTTATCATGGGGCCCCCCTAACAGTTGCCACAACAGGCCCCTCTGTGTACTACAACCAATCTCCTGCTTATAACTCTCAGTATCTCCTGCACACAGCAGCAAATGTAACCCCCACCAAGGGCCCAATGTATGGTATGAACCGTATGCCACCTCAGCAGCACATGTATGCCTACCAGCAGCCCACTCATACACCTCCATTGCAAACAGCCCCAGCCTGCATTTACCCTCCTCAAGAACAGGTCTTTGGTGCCCCTCTTCGGTTTGAATCGCCAGCCACAAGCCTACTTTCCCCATATAGTGAGGAATATTATGGCCAGAGTGTAACCCAACAAACGACTAACCCTCCCCTGCCTGAACCTGGCTACTTTACCAAGCCGTCTGTAGTCCCCGTTCAGCCACCAAAGAGCATCGAGGGCAAGCCTGGGAAGCTCTCCTTCAGCCAGCAGGCACCTGCTGAAGTCCCCAAAGTGCCTAGTTTTGGAGCAGGGGCAGTTGCTCAGTCAACACCCTCAAATGCTTTTAAATTCAACTCCAACTTCAAATCCAATGATGGAGATTTCACTTTCTCAGCCTCTCAGGCCAAGCACAGCGAAAGTCTGCTTGGTCTTCTTACATCAGACATTCCCACTAAAACTGACACCGTTCCAGACAAGCCTGCAGCCCACGAGCAGCCCCAAAGCCAAACAGGCATCTTCACCTTTGGCAATAAAAATATTTCTGGCTTTTCTTTTGTTGATTCCACGCAGAACACAGTCAACACTGGAAGTCTATTTGGAAAGGTGGACCAGCCATTTAAATTTGGTGTTGCAAAGTCTGCAGCAGAGGAGGAAAGAGCAGTAGAGAGCGACAATGACAGCACTCATGTTGAGGAGGATGAGGATGGTCCACACTTTGAACCCATTGTACCCCTTCCTGATAAAGTAGATGTGAAAACAGGTGAGGAGGAAGAGGAGGAAATGTTTTGCAACAGGGCAAAGCTATATCGATTTGACACAGAAACAAAAGAGTGGAAGGAGCGGGGCATTGGCAATGTTAAAATCCTAAGACACAGCACAAAAGGGAAGGTCCGCCTCTTAATGAGAAGGGAACAAGTCCTTAAGATTTGTGCCAATCACTACATCACTGCCGATATGCTTCTGAAACCGAATGCCGGCTCAGACAAGTCCTGGGTCTGGAATGCCATTGATTATGCGGATGAAGAACCTAAGC
CCGAACAGCTGGCCATCCGCTTCAAAACAGTAGATGAAGCATCACTATTTAAAGCTAAATTCGAGGAAGCCCAGAAAATTGTGCTCAAATCCCCAGAAAAGGACAAACGACAGGAGGAGAAAGAGGAAACTGTAAAAGTTCCTGAATCACTGGCAGCCCAGTTTGCAGCCAAAGCAGGGGAATGGGACTGCACTGTGTGCTATGTAAGAAATAAACCCACGGATATGCAGTGTGCCGCTTGTCAAACTGCCAATCCCAACGCTTCATCCAAGCCAGATATTCAGGCTACTGGTGAAACCAAAGCCAGTCCTTTTACTTTCAAATTTGGAACTGATGCGTCAAAACCCAGTAGTTCTGGCTCTACGTTTACTGGATTTGGTGCTTTTGGAGCTTCTATACCTTCGTCATTTACATTTGGCACCAGTGCCTCAAAGCCTGCTGACACAGTGACCAGTGCATTTGGTTCTGGCTTTGGGGCTCAGTTTGGCAAGAAGCCAGGGCAATGGGACTGTAACACATGTTATACAAGAAATGAGTCCTCTGCAGACAGCTGTATTTCTTGTAACGGTCTTAAAGCAGGCCCTAAAACAACTGTGACGGCACAAACGGCACCAGCTGCTCATGTACCTGATGCACCCTCTGTATCTGCTGTTGATTCTGGGTTTGGTGCCCAGTTTGCCAAGAAGCCGGGGCAGTGGGACTGTGATACATGCGCACTGAGAAATGAAGCCTCTGCTGACAAATGTGTTGCCTGTCAAACCCCCAACCCTGCAGCTAAATCAACAGAGAAGGTTCCCGTGGCATCAAATCAGCCTGCAGTGTCAGGATTTGGGGCAGATTTTGTAAAAAAGGATGGCATGTGGGACTGCAATGCCTGCCTGGTCAGAAATGATGCAACAGCTGTTGAATGTGTTTCCTGTCATGCACAACGTGACACTTTAGGAGCCATGTTTGCCAAGAAGGCTGGAGAATGGGATTGTGACACTTGTCTGGTGAGAAACGATGCCTCTGCCAATCAGTGTGTGTCCTGTCAGACACCAAATCCAAATGCTAAAAGCACAACTAGCACTGCTCCCTCAGCCTCTTCATTTAGCTTTAGCTTTGGAACAAAGAATTCATCAAGCCAGCCTACCGCAACTGGATTCACAATGCCTTTTGAAACTGGAAGCGGTTTTCAGTTTGGTCAAAGCAAAGATAAAAGCTCAGCGGCCTCTTTCAAGTTTGAAGCTCCTCAGTCTGGATCTAATACCACAAGTTCTTCACCCTTCTCTTTCTCAATGCCCATTCCAGCTGGTGGCTTCAAGTTTGGCATTCAGGAGCCTGCAAAAGAAACCCCCTCAACTGATACTCAAGCACCTCCATCAGGGTCAGCTTCCAGTTTTCTGAAAAGCATAGCTGACAAACACAAGGAGAAAGAAAATGTGCCCACACCCTCCGTGGCCCAAACAGAAGAAGATCAAAATCCAATAATTGCTGTTAAACCCAATACATTCAGCTTTGCAGACTTGGCAAAGTCCTCTGGAGGAGATTTCCAGTTTGGCCAGAGTGACCCAAATTTCAAAGGTTTTTCTAGAGCCGGTGAGCAGTTGTTCTCATCATTAGAGGCAACCCCCACCAAGAAGGATGCCTCAAATGAGCCGGAGGACGATGACATGTACAAAACGGAGGAAAATGACGACATTCAGTTTGAACCAGTGGTCCAGATGCCTGAGAAGGTGGACTTAGTAACAGGGGAGGAGGATGAACAAGTGCTTTATTCTCAGCGTGTCAAACTGTTCAGATTTGACTCAGGCACCAGTCAGTGGAAAGAGCGTGGTGTGGGAGTTCTTAAATTCCTGAAGAACAGCACCAATGGCAGGCTAAGGGTGCTGATGAGAAGAGAGCAAGTTCTGAAGGTGTGCGCCAACCACTGGATCACCACCACCATGAATCTGAAGCCCCTGGCAGGCTCAGACAAGGCATGGATATGGTTGGCCAATGACTTCTCTGATGGCGATGCT
AAACTTGAACAGCTGGCTGCAAAGTTTAAAAGCCCAGAGCTTGCTGAGGAGTTTAAGCAGAAGTTCGAAGAGTGTCAAAGACTTCTCTTGGACATCCCCCTACAAACCCCCCACAAGCTTGTTGACTCAGGCAGAACAGCACGCCTCATACAGAAAGCAGAGGAAATGAAGTCTGGTTTGAAAGACCTGAAATTCTTTTTGACGGATGAGAAAACTAAGATCAAAGATGATGACAGCCAGGCAGACATTACAAGCAATGTTTCAAGCCTTGTAATCAAGCCACACGGTGAGACCACCGGCCCCACCTTGGAGTGGGATAACTACGACTTAAGAGAAGAGGCTTTAGATGACACTGCCGACTCATCAGTTTATGCATCTCCCATTGCCAGTAGTCCACTGAGGAAAAACCTTTTCCGTTTTGGAGAATCCACTGGCGGCTTCAGCTTCAGCTTCCAACCAGGCATCAGCCCCTCCAAGTCTCCTGCTAAGCTAAACCAGAGTAGGGCCTCAGTGGGCACTGATGATGAGCAGGATGTAACCCAGGATGAGGAGAGGGATGGCCAGTACTTTGAACCTGTAGTCCCCTTGCCTGACCTGGTGGAGATTTCTACAGGAGAGGAGAATGAACAGGTGGTCTTCAGTCACAGGGCCAAATTGTATCGCTATGATAAGGCTCTGGGTCAGTGGAAGGAAAGGGGCATCGGAGACCTCAAGATCTTGCAGAATTATGACACCAAACGAGTCAGGTTGATAATGAGGAGAGACCAGGTCCTTAAGATATGTGCCAACCACTGGATCACATCTGTCATGAAGCTTGAACCTATGAAGGGTGCCGAAAAGGCCTGGGTCTGGAGTGCCTTTGACTTTGCTGAAGCAGGAGAGGGTAATATTGAGCAGCTGGCTGTGAGATTCAAGTTGCAGGACACTGCAAACACATTCAAACAAGTCTTTGAAGAGGCCAAAGTTGCACAAGAAAACAAGAAACTGATGACTCCAGTGACACCTCGGGTCACCACACCCCAAGACAGTGGACCCACAGGATCTGCTCAGACTGCTCCAACTGTATGTGGAAAGGCAGCCATCGCTGTTCTTGAAGAGACCACAAAGGAACGCACAGAGCTTTCCACCGATGGTAAGCCATGTGCAGCTGGGTCTCCGAGTCCAGCCAACCCAACCCAACCCAAGACAGTAGTGTCACCCCCAAAGTTTGTCTTTGGCTCTGATAGCCTTCAGAGGTTTTTTGGTTCTCCAAAATCTCACTCTGAGTCTGAGGAGTCTGCATCCAGCTTGAAAGCCAAAGATTCTGGACGTCCTGCCAAGGCTTCACCTGCAGCGCCTGCATTCAAAATCCCAGAGAGAGGGCTGGATTTTAGGCTTTTCAAAGATAACCCAATGGCTTTTTGGACCAGCACATCAACCACCCAATTTGAACCCCCAGGGCCGCCTCAGACAGAAGGAGGCAGTGCAGGGTCGGATGAGGACTCAGAGGTGGAGGTTGTGTATGTCAGGGAGCCCACTGCTGAACAGGCAGCTTTAGCCAGAAAACTCCTGCTGCCTCTCACATTCTTTTGCTACAAGAATGAACCGGGCTACACAAGCAACGATGAAACTGATGATGAGGACTACGAGTCAGCAGTAAGAGCCTTGAATGGAAAGCTCTACCTTGATCCTCCCGAGAAAAAGGCTGCAGCATGTGGTGGTGATGAGTCAGACTGTCAAGTTGTGTGGGAGAAGAAGCCGACGCCAGAGGAGGAGGAGAAGGCCAAAAGCCTTCAGCTTCCACCCACCTTCTTCTGCGGCCTGAGCACCACAGACAGCGACCCGGATCACGACAAGCCCGAAGACTTTGAGACAGAAGTCCGCAAGGCACAGCAAGACCTGGATGCTCAGTTAAATCAAGCTGACAAGGCCTCCAGCAGCGATGCAACAGCCACAGAGGAGCCAACGTCGAGCCTGGCATCAGGTAGCGCAGACGCTGATGGCAGCGTAGAAGCTGAAGG
TAGCACATCTACATCGAAAGAGCAGACCTCAGACCAGCCAGCAGAGACTCCGAGTGAAGCTCCCAGGAGCAGCTCTCCCATTGACCTGTCAACAAAAAAGTGCCCAGAGCCAGAGTCCAACTTTGGGACTGCAGCTGCAGCACCTACTGCTACGACTGCAGCAGGGCTTACTGTTACCACGGCGGCGTCTACTGCCACAACAGCTTTTACAGCTACAGCGCCTTTCACAGCCATGACAGCGGCGTCCACTGCTACAACAGCTTTTACAGCTACAACAGCTTTCACTGCTACTACAACCGCTAGTCAAGACACCTCCAACTTTGGCTTCAACGCATCAGGAGGCTTCTCTTTTGCTGACCTGGCCCAAAACACAGAAGGATTTGCATTTGGATCTAAAGACTCCAACTTTTCATGGGCAAACGCTGGAGCGACAGTGTTTGGGTCGGCTGTGGCCTCTGCACCAAAAAACAACGGCAATGAGGAGGGCAGTGATGAAGAAGACGCTCCTAATAATGTGGACATTCACTTTGAGCCAATAGTGTCCCTACCAGAGGTAGAGACAAAGTCCGGAGAAGAGGACGAGGAGATCCTGTTCAAGGAACGTGCCAAGCTGTACCGATGGGACCGGGACCTCGGCCAGTGGAAGGAGCGTGGCATCGGTGATATTAAGATCCTCTTCCATCCAGTCAAACGTTTCTATAGAATCCTGATGAGAAGAGAGCAGGTGCTGAGGGTTTGCGCCAACCACACAATCTCACCGACGATGGAACTCCAACCCATGAACGCCTCGGCCAACGCACTCATCTGGACGGCCACCGACTACTCAGACGGCACCGGCGTCGTGGAGCAGCTGGCGGCCAAGTTTAAAACCCCAGAGATAGCCGAATCCTTCAAGAAGACTTTCTGCGGGTGTCAGAGCCGAATTGGCAACACTGGTGACGATGCCTCATCTAGTTTCACACAACAGATGTCCAGAGTTCAAGAGCACTCCAGAGACACTAACCCGCGGGTGTTCCTCAAAGTGGCAGCCGATGGCGAAACACTGGGCACGATCACCATCGAGCTTTTCTCCCATATTGTCCCCAAAACTGCAGAGAACTTCAGAGCTCTCTGCACCGGCGAGAAAGGCTTCGGGCTTCTGAACTCCATCTTCCACAGAGTCATACCATCCTTCATGTGTCAGGGTGGTGACATCACCAACAGTGACGGCACAGGAGGCAAGTCCATCTACGGCAGCCAATTTGAGGATGAGAACTTTGACGTTCGTCACACAGGCCCGGGCATCCTGTCTATGGCCAATCGTGGGCGCGACACCAACAACTCGCAGTTCTTCATCACCTTGAAGAAAGCCGAACACCTGGACTTCAAACACGTGGCTTTCGGCTGGGTTCTGAACGGCATGGATGTGGTTCTGCAGATGGGAGAGCTGGGCACAAAGGGAGGACCGCCCACGAAGAAGCTTGTCGTCACAGACTGTGGACAACTCTGACTTTTTTAAATGTTAAGATCAAGATTCACAGCTTGGTTTAGGTTATAAAGACTTTGGATAATGATGCGTTCCCCGTGCAGTGCATACTTTCCTGATTATACTGAGTCCATAGTCATTAGACAGCTGAGAATCAAACACTGATCACACAGGCCTATTGATCAATCATAATAGAAATTGGCTACAGTAGCCTGAGATTAGAAAATATTTTGCTATCCTCTAACAGTCACAGATGGGAAACATGGAGTAGTATGCGGGAGGAGACAAATATAGTACACTTCTTCTGTGTTGCACTTGCATCTTCATCATCGTCTGTCAATAAATTCTGTTTATTTTGTGTACATAATTGTATATGAACTACTTTTTTAATGTTTTTTGTCTTGCATGTGCTCAATTTGAATGTTCTGGTCGTCTTCATAAGCTCCACTCGGGTATTTTTTTTTCTCCCCTTTTTTCTTTTGAAGTCTTAACTATAATTGAAAGGTGAGGCTGTTCTTTGAATGCACTTGTTGGT
TTATAACTGTGCCCCTGCCTTCACTCCAAATGCTGCCTCTGTGTACTGTTTACCGTAGGGCTCCCCCAGTGTTTTTTTTTTTTCTTTCTTTCTTTGTGTATGTGGATTTCACAGGTGAATTGGACTTCATACTTTCTCAGAAACTCGAGTCATCTCACTGTGTGGCTAGATGATGACGTTCCATCTGTTTTGAATTTTACCAGGCGATCCTCCAGAATTTGAGATTATTATTACATCGCTGAAGTGAAAAAATAATATGCTGATAAAGGAGAAATAAAGTTTGCTTCACAAGTAA\n>XM_051564479.1 Radiomyces spectabilis CAP domain-containing protein (BYT42DRAFT_497200), partial mRNA \nATGGTTTCTCCCACCTTCATTTCGTTGCAAGTGTTATTCATTGTGGCCGCTTTGATTCAATTGGTCTCGGCGACATCGGCCAAGTCAGCTCAGCACATTGTGGAGCTGCATAACCAGTACCGGGCCAAGCATCAAGCGCCTCCTGTCAAATGGGATCCGAAATTAGCAAGATTTGCTCAAAAATGGTCGAATCGTTGCATATTCGAGCATAGTACCAGCCCGTATGGCGAGAACCTGGCAATGGGCCATAAGAACTGGGCTTCCGCCATTGCTGGTTGGTACAACGAAGAGAAAGACTATGATTACAGCAATCCTGGCTTCACTTCGTCTACGGGTCATTTTACCGCCGTAGTCTGGAAAAGTACCACTCGCATCGGTTGCGGTGTCAAGAATTGCAACGGTGCCAAGCTCTACACATGCTCTTACTCTCCTGCCGGTAACGTTGTCACCACTGACAATCTTCGCTTCAAGCAGAACGTCTTGCCCCCTGTATAA\n>XM_043120008.1 PREDICTED: Carya illinoinensis HVA22-like protein k (LOC122307253), transcript variant X1, mRNA \nATCCTGAAAATTTCCATGATCGCCACTCTTAGGAACCTGCAAAATTCGGTGGGTTTGCGGTTGCTTCTTTGTCCTCTCGGTTCTAATATTGTAATACGGACAGCTTGCTGTTCTGTTGGGATTGCTTTACCTGTGTACTCTACATTCAAGGCAATTGAAAGGAAAGATCAAAATGAGCAACAAAGGTTGCTTTTATATTGGGCAGCTTATGGATCTTTCAGCATTGTGGAAGTCTTTTCTGACAAGCTTCTTTCTTGGTTTCCTTTGTACTACCACGTGAAGTTTGCATTTCTTGTTTGGCTTCAACTTCCATCCACAGATGGGGCCAAGCAATTATACATGAACCACCTACGACCATTCTTCTTGCGGCATCAAGTTAGAATTGATCAAATTATGGGTATTGCATATGGTGAAATGCTTAAACTTATAAGCGCACATCAAACTGAAATTCAATTCGCTAGGAATGTGTTTGTGAAGATTATGGGGGCAGCGGACCAAATGTTAAGAGGGGCTATGAAGCCCGATCAACCTCGACAGAACACTGCAATTGAAGGCCCGTTAAGATCCCCAGATACCCACTCAGATCATAACGATTGATTCCTCTTGTAAGTTTGCATACAACTGAATCATTTTTCCTTGCCGATGAATATAGTCAGCTTGTAGCTGTTATCACTCTTTTTCATTTCCTTGTAAGATGAAGGACCCTTTGCTGTATCTTATCCAGGGGATAGGTGGTATTAGTCTTTGAATGTAAATATTCGGCCATACATGTGGACCTTTAGCGTACATGCGGTTGATTAAAACTCGTATCTATTTGTTTTACCCTGTAATAACACTTCATTTTGTTTTTGTTTTTA\n>XM_007831313.1 Pestalotiopsis fici W106-1 hypothetical protein mRNA 
\nATGGATTCTCGCTTTCCAGTGTTTCGAGAAGAACTATACAATGTTCAGATGGACGTGAAGCAGCTTGCTCATGTGCAGGTCAGCCACGCTGAAAGATTGGCTCGGCTGGAGAAGCACCAAGCAAATGAGTCGGCTATCAAGTCTGCCTGGAACTCTCCATTCCCCAGCGCTATCGGTGGCACCCCGCAGCATGGCCCTATTCAAATGCCCCCAGTCGATTTATTCGATGACTTTGATGAGGAGCAGGGCCAGAACTTGCTAGGCAGCCTCCATCTCGATGCTGAAGAGGAGCCTGTCCGGCGCGGCGCGGCCTCAAGGGCGAACAGTGTTCGTTTTGACGAGAGCGCCCTTCAGGGCTCTAGCTGGGCTCAGAACGGCCGGCAGTCTGGCGAATTTGTGCCTATCCGACCTGGCAGTGGCATGGGAAACATGATGGAACGCACGTATTCCCACAAATCGGATGGCCGACATAGTTCTGCCGGTTATTCTGTGCACTCTGTGCATTCCCATCATTCTGTAGCTTCTGGTCGTGGCAGTAGTCTTGGTCTAGATACTAACTACGCAACGACTGGTTCCGAGGAGGACTCGCCCATTGATGCACCGGCACCGCCGCCCGGTTTTTTCATTCTGGGCTCTGTTCCGTCCATTGTTCGTTGTTGGCTGACAACAAATTTCGCACACGAGACGCTCTTGTATGCAGATATCTGCTCTGGCTCACAGCAATCAGTGCTGGACTATTCACTGATCAAGGAGCTGGAACTATCAGACGAAGTGCACAAGGACCTGGACGGAGTGTATCGAATTCGCTTGCCAGTCTACCTGACTGAGGCCACTGTCACCCACCCGAGCTCAAGAAATTCAAGCCCAACACCGCAGATGCCGAATTTGATTGTTGGCTTTGAAGTCGTTGGACTAGAGCAAGCAGAGTTTCCTGATTTGAAAAAGGGCATCCGCATTTTCATAGGAAGTGAGACTTTGCGAGAACATTCTGCTGACATCTTCTTCTCCCAAAACCGCATGACGCTGTACGGCAGTGAAAGAGAGAAGCTCTCCGTGCCCTTCGTGCGCCCGGAAGATCACAGTGTGTTCAAGTACATTCGTACAGTGGCTGTCCTGCCCGAGAAGCCGCGGCTGAATGCTACAGCGCGTCCTTTCGTCTTGGGTGAGCCCAAGGCGGCGGAAATCTCCAATGAATCTGTCAACGAGATCCAAGAGAAACACGAGCGAGGCGCGCTCGACAAGGAAATACAGTCTCGTGCGCCTGAGGTATCACAGCAACCGACGACTGACCGTGTTACAAGCAACCTGCCTGAAGCCGCAAACGACCGAGACACCCAGGGCAAAGAGGACACTGATGTCTACGAAGCTTCGAACCAAGACCTGTCCGTCTCTGGTGACAATCGCAGTGAGACCACCAGTGACAGCCAGCGCCGTGAGCCAACTGCTAGTGGCATATGGTCTTCTTGGAGACAAGGCTCTTCAACAAACAGTGGTGACCCGAAGGAAAATGCCCCATTGAGCGGATATCAACCACCTGGTCGAGTTCGAAACATGAAAGTCCTGAAGCCAAGCAAAGCCAGTACGTCTTTGTCTACCCGAGCTGGAGTCACTTCGGAGGCGCTTCCGAAATCCAACGGTGAAAATCGTCGTAAAAGTCAACCTGCGGACACTACTCCCACAGGTGTCCTTCGATGGGGCAAGCTTGATCGGGGTTCTGCTTCAGGATCAGACAAGGACTCCAAACCAGCGGCCATCAATGCGGTGCATCGCGAAACCCGGAGCGTGTCCAGCACACCGCGCACTTCTGCCAACCCCGTCGGCGGAGCCTCGGCTTTCTCATGGATGACGCCGATAACTAAAACAAAGCCTTCTACAACCACTGCAGATTAA\n>XM_047249926.1 PREDICTED: Schistocerca piceifrons uncharacterized LOC124775103 (LOC124775103), 
transcript variant X2, mRNA \nACAGCACACCACAGCGCGCGCGGTCCAGCTGCGACGCAAGCCCGGTGTCCGGAAGCGCCGAGGCCGACGCACACATCCCGGAAACTCACCTCTACGTACCTGCGAACACGCGCACCGTCAGAAGTTGCTTTTTCCAGAGCAGTTCGACCGGATCGGTGTTGCCATTCAGAGACACACCGCATGGTGGCCACCAAAACTGTGAATTGCTCGCCTCACGTGCTCCTTGGACCACGTCAGTGGTCCTTTATGTGCTCTTGGCCACAGTTATTGGGCAAATGTTATCCTATTACGAAGTTACTGCAGGGCTGGCCCAGACAATGGACAGAAATGGTGTTCAAAATCCCTCTAAATTGACTTGGTGCTCCAATGGTGGAAACATTAGGGAATGGATTTAAACAAGAACATAGAATTACCATGATGCTACAAGTTACCAATAACTGATCTTATTTATTTGCTGTTTCAAAATTCCTTATTTTTAGTGCATTGAGAAATAAGTGTATAAACAACCCGCTTCGTTATGGTGACTCCACCATCAGAGGAAACACCTACAGATGCATCACACCAGAAACGGTTGTCAGTGGATTTGTCATTGCCAGCCCGTTGCCATGGTGTAGATATTGCTTTCGATGTGAGAGAAATAATTCCTCGTGACAAACTAAAACAGGAATTTAATGGTAAACTGGCTCAATATGGCAACTTTCCAGATTTCAAAAACGATTTTAGAAATTCTTACCCATCTCAAGTGTCAGATACATCTCCAATCTTGGAGCCCATCTCCACCATTTCATTACACACTGACCAGAAAGCAGTCAGTGACACAGCAAATTGTGCAGTTAAATTTGAAGAAGGTACAAAATCATCAGCAGACAAAAATTCAGAAAAGGATAGCATCTGCAGCAGTAGCCCCTCCAGCAAGGATCATTCAGAGAAGACCAAAGTGCCGGATGGAGGTTGGGGCTGGGTGGTTGTGATTGCATCACTTGTCATCAGCATGATTGCTGATGGTGTAAGTTTCTCCTTTGGGTTATTGTTCATACAGTTGCTGGATCATTTTGGTGAGAGCAAGAGCAAAACATCTTGGATTGGAAGTCTGTTCATGGCAGTCCCACTTTTATCTGGACCGGTTGGAAGTGCTTTGGTAGACAGGTATGGCTGCCGTTGGATGACCATTATAGGAGGCATTGTTTCTGGCATAGGTCTTACATTGAGTGCGTTTGCTGATTCTGTGGAGATGTTGTACATTACATTTGGTCTGATTGCTGGCTTGGGATTAGGACTGTGTTACGTGACAGCAATTGTTAGCATTGCTTACTGGTTTGATAAGAAGAGGACTTTGGCGACTGGTCTGGGCTCATGTGGCACTGGAATTGGTACCTTCATCTATGCACCAATGACGACTTACTTTATTGAAGAGTATGGATGGCGTGGGACGACGTTGCTCCTAGCTGGTACATTCTTCAACATGTGTGTATGTGGAGCACTGATGCGTGATCCAGATTGGTTGGTACTTGAGCAGAGAAAGCAAGCCACAAGCCACTTGTACAAATCTGGACGAGCATCTTCAAGTTGTGCCTCTGTATCTGGCCGATCAGATAATGCTGGTGACTTCCCGGGTGTAGATGGGATCCGCAAAATGCTCTCAAGTGGCCATTCGCCAGAATATGTGCTGACGACATTAGCTGCCAATTTGCAGGACACAGACTTACCCCCAGGAGAATCGGAGGTGGATGGTACAAAAACTCCAGCTTATAGTTCAGTTGTAAATCTCCCCACATTCATTCATAGAAGTGAGAAGGTTCCACTGGAAGTGCTGGAATCACTCTGCACTAAGAGGAGAGTGTTCAGTGTAATAATGGAAAATTATCCAAGCCTACTTTCGTGCAGAAGTATGTCAGATAAAGGTATCAACAAGCTTCCTGTAACATCACACTCAGTTTCTCACCGTATCCCAGTGTCAATGGAGGTCCACA
TTCCCAAGAAAGAAGAATCAATTCCAGCTTGCGAGTACGAAGGAAACGATGCAGAAAAACCTACTCAGCAGGCTACATCACCACTGCTGCCTAATGGAGGAGTGACACAGCCAATGAATATAATTCCACTGGCTACAGGGCCATCAAACTACCTAAAAGGCATCCGTATGCACAGGAATTCTGTAATGTACAGAGGCGCTATGTTGAAAATACACAAGTATCGGTTGAGAGCGTCATCCTGCCCTGATATCTATCGTAACTCTATGACCACCATAGCAAAGGAAACAGAGGAGAAATGGTATTCTGATATACTGGACCTTTTGAGGGACATTGTGGACTTCTCAATGTTCTTGGAACTGCATTTCCTATTTACATCACTTTCAACTATCCTGCTTTTTACATGGTTTATCGTCCCGTACTTCTATTTGGCTGATTACATGATGCTCTATGGATACACTGAAAATGAAGCATCACTTCTGCTCAGTATTATTGGCCTCACTAACTGCATTGGAATGATTGCTCTTGGATGGGCTGGTGACAAACCCTGGGTGAATGTAACCAAGTCATATGCTTTGTGCTTAGTGATGTGTGGTGTGGCAACTGGATTAATGCCACTAGTCATTACTTCATACTGGATGTTGGCATTACTTTCAGCTCTATTTGGTTTATTTTTTGCATCTTCATTTTCATTTACTCCAGCCATTTTAGTGCAGCTAATACCTCTTGATCGTTTCACAACGGCGTATGGACTGATGCTGCTTTGTGAAGGAATTGGAAATCTTCTTGGCCCACCATTAGGAGGTTTGGTTTTTGATCTGACTGGTTATTGGGATCTTTCCTTCTACTTAGCTGGTGTTTGGATTGTTTTATCAGGCATTCTCATTGCCCTGATACCCATCACGAAGAATCAAGTTATATGTGGCAAAGGAACACTTGAATTGGAAAAAGAACAAGATCAGGACTCTGTTGATGTACCATAAAACTTCTTAAGGAAAAAAATCATTTTCATGGAAAATGAGGCATCTTGATTCATGTTTGAGGCACATAAGAACCTCAGCATCCTGTAATACTCTTATTAGGTTGTGACACCAATCTAAAAAAAGCTGTTGGGTAAATGTTATGTATGTGAAACTTGTTTGTTGCAATTGTAATAAATAGCTTTAATCTCTTCAGTGACTGACGACCTAATGATAAACTGGCTTAATATACACAATTTCCATCAGAGGAACTTCACTTTAATAGATTTTCACAGCCTGATTATCAGTAAGGAAGAATGCTAAATAGGTTATGTTCAATTATTAATTGTATATTTGTGTATAATATTTAATTTTGTCTTATATTAAGCGCAATCAATATGAACAGAGACTGACCATAACTGGAGAGGTTCTTACTGGATTTGATAGTATTTGGTTTCTCTTAAGGATAAGAACACTTACAACCACGTTTATGATTGCAGAGCTCCAGGATAGTCAAAATAGCTATTTTGTAGCCAATAAATTAGTGTCAAGTGTCAGAGGTTGATGTTCACAAGGGGATAACGTGCTAACAGCTCTGATTATAATATGCAGTTATGGTCTAGGCAACACCAAAACACTGACAGTAATTTAGTAGTGACAACACAAATTCTTTTATCATTTTAGTATTTGAAATCATAATCACAGAAATAAAAACAAAATCTTTTGACATACCGTGTCTAGTTGAGTAGAATGTATTGGATATTATTGTGTTCATACAGCATGTGAAACACATTTGACAATTATACAGTGTGTCTTAAACAGATTGAGGCTATGCTCTTATAAATGCAGGTAGCATTAATATTAATCCTTTAAATTGCTTGCCTGTAATTAAAAATTTAATATACTCCTTCTTTTTACAAAGAAAGAATTATAGAAGTTCCTGAACTTTTTGTGAATGTTGTAGTTGCACAATTAAGTGGAAAAAATTCGTAGCAGATCTACTTCTCTCCTACACACATTCTTAGCTTTGCATAGCATAACAGT
TATTGCTCCAAGTTTGACAGTTATTTTATTTTCATTGATAAAAAGTTATTGTTATCTAAATTAGTTGCACTTAAGTGTTAGATATGAGCAGTTAAAGTTAAAATGATCTGAGTGAGGAACAATTCCATAAATTCCCCAGAAAATGTGTCCAGACCTTAAATAAAAAGAGTACTCCATTAATTGGTTTAATTACATATACAGTTGTCACACCATAACCTACCGGAATCAGTTTTCTATTCTATGACTACTTATACCACATATATGCGAATAATATAATTCACCAAATAATCTGCGCACCCAAATTTTAAGGGGGGGGGGGGAGACTGGTTTTAATTTGTTTTTGTTTATACATTGTGTATCTTGCTGTTTAAGTGCAGCTTATATATCGAGTTGTTGCAGGATGGATGTTATGCCTCCGGGGGTAATAACAGCTAATTTTCCCTTTTTGTAACTTGTCTCGCACTTCCTCAATTCTGTCTCTAAAAGCTGCCCAGGACTGACATGGTACATAAATTCAGTAACGCTACAGGGTGACATTGCCAAACCATGCCACCCAGTCAACCGCAAGGTCATTGTCCATCCGCCCCTTCACGTTCACTGTCACCAATATGGCTTTCAGTGATCTTTTTGCAATAGTTTCTTTTACATTTTACGTTAGGTGGTAGCTATCATCCATTGCCAGTTACACACATCACTGTACACCTTTGCCACTCATTGCTGCCAGTTCGAATCATGACGCTGCAGTCCCCTTGGATCTGTATTAGCAACTTGCAATAATATAAAGGAATGTTTGCAGTGCAAATTTATCACTTAGTGATGAAAATTCACTACTTTTCCTCCAATCATCTGGCAGCTGTTGAGCAATGGTAGTTTTGCTCTGGAAGCCTAATCCATTGTGATGGAAAAATATTGATAGCCAGCCCTAGCTAACATTGAAACCGGTGATGCTTAGTTCTTTGGCTGAAGCCAATGCTTTGATTTGGCACCTTTCACTTGTCACTGGGCATCCACATTGTCACTTCTTGCCCACGTAATTGCAGAGCCTTTTTTCGAGATCCATATGCTTTGCTTTTTGGCTGTGAAATCGCTGGCGATTACAGTTTGTTTCTTGGAGGCGCATTTTGTTTTTTCACCATTCGCAAATAACACTTGCTCACATCCTACTTTATTCCCACTGCACGGTTTCCAATGTTCTCTGCTCCTTCAGTAATTTCAAGTTTTTTTTAGCTGTGTATGAGCAGTATTGAGAACATCCATAATTAATTAGTGGTTAATGCACTTCTAATGTGCTATTGATGTCACAGACTGAGGCCACGACAACACTATAGTATAATGGGATCTATTGTTGGAGGTGGACAGTACCAACCTTATTACAATTAATCTACACAACCCAGCATTTCATCCTTAAATTCAGGGTAAAAACGAAGCCCAGACTACTCATGTCTATACGGTATTTGAACTCTTCGATTTTGTGCTGAGATTGATTTCTAGATTCCTTATTCTAGTGAACATATAGCAGTAAGAGTACAAAGTGTATTTGGAATGGGATGTTGCATTCATTTGTCGTAGATAATTTTCTGAATGTTTTCCATTTGAGAATCCCTAACACAGTACTTGAAAGTCTGCTACAGTTTTTCTATAATATCTTCTGTTTTCATCAATGTGGAAGCAAACTATTCTTTACCCAAGTCTTTTTCGTTTGTAAGGATGATTTTTATCTTAGAATCATTAAAAGACTCATCCTAGGGCTGTGAAGAAAAATCTGTTAGAACGACTATTACAGTGGTAGAAAATTATTTATTTCATTTGACTGTTGTTGCAATTTGAAATGCAGCAGCTGCTTCTCAATTAGTTGGTTTGGCATTGTTATAGTTTTTCTTTGGTTCTTTTTTACTTCTGGAGAAAATTTTAAATTATCCATAGAAAAATATTTTAAAACATTGTGTTTGGAATATAATGTGACTTGTGGCTCCCAGTTTTGCAATAGAATTGAGAAAGAT
GTAATAGGATCTGTCTGCTTAATTGATTTTTCCCTCCTCTGCATTTCCTGAAATGGTTGATTGTATTAAAAGTGTGACGTTTAAGACTGTGAGCTATCAGTGAGTTATTGAGTTATCAAGTGAATTATTGAGTTATCAAGACAATGAAAATCTCAAATGCACATACTCATCAGTGGAAATTCACTTGGGAAACTGAATTAGTGGAAATAAGAGGTGAAATGAGCTTCATGTATGATAACAATATCTTAATGTCCATGAGTAAGGCATATGTTGAACAAAAGTAGTAGCTAATTGGTGGCTACTTGTCTCTAAATTACTGATGTAGTAAAATATGACGTTAACAATTGGATGTCGATTGTTAACCATTGTGATTAGAACTTCACAAGTGTATAGTAAATGCTGAAACCATGTCTACAATAAATCCTTTTGGATCTTCTGAATCTGTAACGACATTTTGCTTTCTTTTCTTAAGACACGAAATTTGAAGGATGTAGCAAAGAATTCTGCATCTTCGTCAATCATCCCGTTGAAAATTTACCTCCTGTGTAGGAGGCTTTTAGCAAGCTAGACAGTTCTGGATGTGATGTTTCTGGGTGTCCAGTCATATACTTCATTTAACTCATTTTTGAATGTCCTGTTGTAAGCATAATAAATTTGTTGTTAACTTTTGCATACAATAATTATTACACGCCATGCTGAATGACAGAATAGTGGTTTGCATCCTTGTGGCCTACAACGAACCACACCAGTATATTGATGCCCTTTTTCTGTGCAGTACAGGTGTAACAATTTGTACATACATGATTGTACACGATGACAATGTATTCATTCCAGCTTTTGCTGGAGATAATGAATGTGAATTTCCACACCATTAGAATTTCAAACTTTCCACAGAAAGTTATAATCATGCATGAAGTTTCTGATACAATTGATAAGTACTCCTATTTGACAGGGCAGATTTTTTTAAACATCACATAATTTTGGACTAATGATAAATGGTAGTATTGCACAAAATGATTTTTTTGAAATCTGGAGATGATCAGAATTCATTTAGACTGGTTACTCTCCTTCCTTGTGCTTCAATAATTATTAGTCTGTGGTAGCCTTAATTTCAGTTTATTGTGATCTTAAGAGATTAATATATTAGCATTTATACAAGGAAATTTGTAATTTTGATAGCATAGTTTGTCAAGCTGGTTATTGAAAGTGCATGAAGAAGTTCACAGAGAAAGTTTGATGCTGTATTGAAGAAATAGATCTTGTGCCTTTTCTTGTCTATATAGTGTATTGATTGATCTGTCTTCGCCAGTCATCATTCACATTTCATTGTTAAAATTAAAATTAATGTATTTACATAAGCAAATTGTTGTTTGTAGTATTCTCAGGACCATAATTGTATTCATTAGCTTTTTCATAGTGTCCTCAATTTATATGAAATGAGACATTACTTTTACAAATTTATTCTCAGAACTGTTCTAAAATTATTGCACTCAAATGTAGTGCTTCGTTGAATTTTGTAAAGTCTAAACTAAAGCAATAATGTTTATTCTACTAGCTATAATTATTTTTGTGTGTAATGTCTTTCATATGCTGTTATGGCATGTGATACATAGTGGTATTAATTAGGAAAGCTCAAAAAAAGGTAATTACTTGTGAAGATTTCATTTGATTTCCCAACTCTGTTTGAAATTACACATGACATGTACATAATCTGTGTCTTTCAAGTGAAGTGCTATATCTTTTAATTGTATTTATCTTGCTACAGTTTATCTCACTTTCACATTAAGAGTAGAGGAAGAGAGAAATTGAGACGAGGAAACCTTCATGCATGGAAATAAGATTCTCTCTCCCCTACATTACGGGTTATCAGACTGTTTATTTTTGGTAATCATGCAGTTACATTCTCTGCATTTGTTTAATACTGATCAGATGCTGTAAAGCCAAAGTGATATTATTTTACAGATGACATATTTCTTTATTTGATGAAGAGTCAGTGAAGT
ATCTATGATCAAACATTATTACGCCTACTTTGAAATGTAAATACATACTGAAATTTTGTTCTGATACAAAATTCAGCGACTGAAAATATTGTGGTTGTAATAATTATATATATCACTGAAATCATTTTTTTTAATTGTTCATATCATCTGCCATGTTCCTCTCACTAAGTGTTAGGCAGACTAGGCTGTGATTGTGAAGTATTGTTTGGTTTGTTGTAGAAAGTTTCTCTTTATTTCTGTCAAAGTACAACTTACATTACCAAAGTCCTGCTCAGTATTTTAAGTAGATTCTATTGAAAGTACTAATGTAAGTACTCACAATTTAAAGACTGTAGTAGTATCATAATTATACATTTATTATTAATTCATTTAGTAAAAAAAGAATTTATCTTGTAATTTGTTAAACACAAATTAAAGGGGGCTGTCAAGTTTATTGGGTGTAATGTAGTGCCTTTCAAAATGAAAATTTTAGAAATACAGGTTTATTGTGAGACTGATCTCTTGTCTTTTTTTGTGAAATAGTATTCATTGGTATTGACTTGTTTAAAATTACAAGAACTCTGATTGTGTATGTCGCATTTTTGCCAAGACATAAATTTCTCAAATGTAAGTAGTTACAGTAAATGATTGGTAAAATTACTAACAACAGGTTTCATTGTCTCAGAGATGATTATAGTTACAAATGAAGCAATAATGTTAAAAATTTATATATAAAAATTTTTTGATGGCCAGTTTGTACATATTTTTCTGTCCTCAGTGGAGCAGATGTGTTGAGTCCACAAGTAAAACAAGCAGCTACTGCAGGCCAGTTGCCTGGCCTCATTGAGTTTAATCGTA\n>MW362430.1 Lactobacillus acidophilus strain BCCS A50 16S ribosomal RNA gene, partial sequence \nATTCACTTCGGTGATGACGTTGGGAACGCGAGCGGCGGATGGGTGAGTAACACGTGGGGAACCTGCCCCATAGTCTGGGATACCACTTGGAAACAGGTGCTAATACCGGATAAGAAAGCAGATCGCATGATCAGCTTATAAAAGGCGGCGTAAGCTGTCGCTATGGGATGGCCCCGCGGTGCATTAGCTAGTTGGTAGGGTAACGGCCTACCAAGGCAATGATGCATAGCCGAGTTGAGAGACTGATCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGACGAAAGTCTGATGGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAGCTCTGTTGTTGGTGAAGAAGGATAGAGGTAGTAACTGGCCTTTATTTGACGGTAATCAACCAGAAAGTCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGAAGAATAAGTCTGATGTGAAAGCCCTCGGCTTAAC\n>XR_006102310.1 PREDICTED: Sceloporus undulatus uncharacterized LOC121923102 (LOC121923102), ncRNA 
\nTGGCGAGGAGAAGGAGGAGGGGGAAACAGGAGGAGGAGGAGGTACCAAGTATCAGGTTGTGGCTTGCATCAACAGGTCCCATGCACCTGACCAAGAGAACAGGCTTTCTATTGCTCAGGCTTGTGATATACAGATGAAGGTAATAGACTGGAACCGTGAAATGCAGTTGTGAACTGCTAAAGCCTCATCGAAAGTTTACGCCAACAACTGCAATTTTATAGGCACTTCAGGAAAAGAAGACAGCATTGGCCATTTAACATAGCAGTAATGTTTGTTTTCCTTCTGCCAAGTATACAACATTATGATTAAGAAAGAGAGGAGCCCATAATTTTTCTTGGTTAACATGGGAACGCAAAACAGGAGGGTGTGTTTATCTTGTTTAATGTTTTTTCTCTCCTCTGACCTCTAAAAGGCTTTAAGTAAATTTTGTGGTAAAGCAAAGCACATGAGCAGCGAGGGAGTCTCAGACAGTTATAGTGTCTGAATACACTCTTTGTGGTATTGGCAAAGATGCTGTGATTAAGAATTGGCAAGCTGGTGGCTTCGACTGATAGAACTTTTATTTTCCTTCCAAGAAACCTGCAACATGAGGATGGACAT\n>JF772131.1 Bacillus sp. NA-107 16S ribosomal RNA gene, partial sequence \nATACATGCAAGTCGAGCGGACAGATGGGAGCTTGCTCCCTGATGTTAGCGGCGGACGGGTGAGTAACACGTGGGTAACCTGCCTGTAAGACTGGGATAACTCCGGGAAACCGGGGCTAATACCGGATGGTTGTTTGAACCGCATGGTTCAAACATAAAAGGTGGCTTCGGCTACCACTTACAGATGGACCCGCGGCGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTTTTCGGATCGTAAAGCTCTGTTGTTAGGGAAGAACAAGTACCGTTCGAATAGGGCGGTACCTTGACGGTACCTAACCAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGCAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCCCGGCTCAACCGGGGAGGGTCATTGGAAACTGGGGAACTTGAGTGCAGAAGAGGAGAGTGGAAGGTGTATGGTAACCCTTGTTGTGTGGGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGT\n>XM_047969201.1 Xylaria bambusicola uncharacterized protein (F5B22DRAFT_156494), mRNA 
\nCACAGAACGACATCTCAGGTGAAAGAGGTGAACATCATCTAAGACATTATCGGATTGGACGTAACCATGTCACCAGATCGAGTCCCTAGTAATCGAGTTCCGCCTCGCCCGAAGACGCCTACAGACTACGTCCCTACGCCGATTCGTGCAAAAATAACCCCCTCAGAGACTTTCAGCCACCTCGTGAATAAGAAACAGAGATCCGCCAGAGTGCACGCGCTTGCTAAAGAGCGACTCACAAGTTCTAGGCCAACCACGCCTCGGACCCCTACTACCGTAAACTCCATTATCAAGTCCGCAAGAACCAGCCGGTCCGCTCTCAGTTCCGCAGGCAGAAATATAGCGTCCAGCCTTTCAAAGGCAAAGCCGGTGGTGGAAACAGCAGTCGCAGCCAGCAAGAAGGCTGCCGTCACAACTGCAAATCGCTTGACAAGAATGGCAACTGATGTGCCGAAAGTGGCCAAGCAGAAGGGAAAGGAGGTCGATGTATTGTCGACTCCATCTAGCTCATCATCGCAAAAATCACTGTATCATCGACCTAGGCTGCCCAAGCTCAAGATCCCCGAAGTTGATGCTGCAGTAAGAGACGCGTTAAATAGTGCATGTTCAACTGATACACAGAACAGCGAGAACTTTCGAATACTCCAAATTTCGCCCACGAGCCGAGAGCTCGAGTATGAATGGCAGAACGATGATAACCCACCTGACGTTGCTGCAGAGTTTCACAACATGTTAAGCGCACGCCGCAGAGTTCGTAAAGGTAAGTTTGGATCGAGGGTCACAAGATATTGCCGGGAGCGGCCAACCTGGCAAGACAGTTTCGTTGCCAGAGCCCATCTCGATAACCACGAGGATAGGGCGCTGTTGAAAGAGCTTACAGACGCTGTCCAGGAACAAAAGGATTACGCCGCCCGCCTAGTACAGAGAATCCCAGATCGTTTCCCCGGGCTCGAGGCTGTATCTGTGCCGGGGTCAACATTAAAATTATACTGGCAACACAAAAGCACATGGCCTAAGCAGTAAGGGCTCATGGGAATGATGGTCCATTCAGTTAATGATAGAACTGGCCGGTTCCAGGGGTCAAATATGGTCAAGTATGCGTACTCACTACTAATATAGATCTAGACTGTGATTTTGTGTCTA\n>AB726205.1 Uncultured fungus gene for 18S rRNA, partial sequence, clone: a70-1 \nAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAATTTCGGGATCAATTTATCGGTCGTGCCTATGGTATGAACTGGTACAATTGGTTTCTCCCTTCTGACGAAGCATGATGTCATTAATTTGGTGTCGTGGGGAATCAGGACTGTTACTTTGAAAAAATTAAAGTGTTTAAAGCAAGCATTAGCTTGAATACATTAGCATGGAATAATGTAATAGGACGTTTGATCCTATTTCGTTGGTTTCTAGGATCGACGTAATGATTAATAGGGATAGTTGGGGGCATTAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGGGATCGGATGATGTTAATTTTTTAATGACTCA\n>KX928124.1 Williamsia sp. 
strain AC048_ELMA209 16S ribosomal RNA gene, partial sequence \nGCTGTGGATTAGTGGCGAACGGGTGAGAACACGTGGGTGATCTGCCCCAAACTTTGGGATAAGCCTGGGAAACTGGGTCTAATACCGAATATGACCACTGGATGCATGTCTGGTGGTGGAAAGCTCCGGCGGTTTGGGATGGGCCCGCGGCCTATCAGCTTGTTGGTGGGGTAATGGCCTACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGCGACCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGAGGGATGACGGCCTTCGGGTTGTAAACCTCTTTCACCAGGGACGAAGCGAAAGTGACGGTACCTGGAGAAGAAGCACCGGCCAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTGTCCGGAATTACTGGGCGTAAAGAGTTCGTAGGCGGTTTGTCGCGTCGTTCGTGAAAACTTGGGGCTTAACTCCAAGCGTGCGGGCGATACGGGCAGACTTGAGTACTACAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGTAGTAACTGACGCTGAGGAACGAAAGCGTGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGGTGGGTACTAGGTGTGGGTTCCTTTTCACGGGATCCGTGCCGTAGCTAACGCATTAAGTACCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGCGGAGCATGTGGATTAATTCGATGCAACGCGAAGAACCTTACCTGGGTTTGACATACACCAGAAAGCCATAGAGATATGGCCCCCCTTGTGGTTGGTGTACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAAC\n>XM_023377893.1 PREDICTED: Centruroides sculpturatus glutamate receptor 2-like (LOC111633339), mRNA 
\nTTATAAATCTATTCATGCCACAACGGAACTTCAAAGGCTAGCTACGAAATACGAAATTACACTGCTTTCTATTCAGAGATTTCCTTTGTCTGACTCAAAATCTCTCGATGTAACACCACAATTAAACGCCATTAAGGAAAAGGACGTGAGAATAATAATTCTTTATTGTGATATAACGATAAGTAAAACTGTTATAAAGCAAGCTGAACGCATGAACATGTTTCGTTCTGGATGGACCTGGCTCGTCATGGATAGCATTACATCGTTCAGTCTTAAATACTTATCGGACGATGACGGATATATACCATCTTCTTTAGTCGGATTAATAGGAACAGCATTTGTAGTTCCTGATACCATTTTGTATTTAAAATTAATGAATCAATTAAAAGCGAATAATTTGGAAAATCATATAGAAAATCAGCAAGCTATCACTCGTGTGTATGATGCAGTGTTAGCAATTGCCAACGGACTTCACAGAATTCTTTACGAAGAGAAAGTATCTTTCGAACTTCCTACTTTCCAAAAAGGAAGTTGCGCAGATTCTGTCAATGACTGGAAATGGGGTAGAAATTTGTTGGAAAGTATTCTTAATTTGAATAACGTTAATGGAAGTTTAGGGCCTATAAAGTTCACGAAATTTGGTTACCATCATCTCACCAGTTTTGACATCGAAAACCTTCAAACGAGAGGTTTCGTTAAAGTAGGAAAATGGTTAGGAAACGAAAAACACTTGACAATTAATTCAGAAATCATATTTCCTGGGCAAACTGTGAAACCTCCTGATGACTCTCATCACAGTCTTCACGGAAAAACTCTTAATATTGGAATAGTTATAGATGAGCCCTTTATAATGAAAATCCCTTATTATAAAGAAGGAGATCCTATACATTCTAAATACGAAGGATTACTTATAGACCTTCTTTTGAAATTACAAGAAATGCTTAACTTTAAATTTAAATTTCACGAAATAAAGGAATATGGAATTGAAAATCCCAAAACAAAAGAATGGAACGGATTAGTTAGACAATTAATGGATAAGAAAATAGATTTGGGCCTAGCTGCCTTCACGGTATCTTGGAAAAGACAAGAAGTTATCACCTTTACAGCTCCTTACTACGATTTAGGTTTGGCTATATTAATGCCAAAATATAATGCAAAAACTAAACAAAATTATTTTGCATTTTTATCACCTTTCGAAACAACAGTGTGGCTTACCATTGCTGTGTCGGTGATTTTTACTTCTCTAGTGCTTGCAATATGTGTAAATTTAACACCAAGTAATTTTAACAATAGAAGAAAGGAGATAAGGAAAACAAGTCAAAGCGTTAGAGATTCTTCTTGGATCACTTTTCCACAAGCACTTTGGTGGAGCTTCTCGTCGCTTGTAGCCCCGGGAACAGAATTTGAACAACAAAAGAATCTTCCGGCAAGAATTGTAATGGTGACATGGTGGCTAACTACGGTTATTCTTATTGCAGCATATACAGCAAAATTGGCAGCATTTATGACAGTCCAGAATATGAAACAAGAAATTAATTCTCTGGAAGATTTGGTGAAATTGAGTTCAATTTCATTTGGAAGTCTGAATGATTCTTATGTTGAGAACTTCTTCGCCAACAGTCACTGCGAAACGCATAAAATAGCTTACAAACTGATGAAAAATTATAATACATTCATAAACGATACTTTCGAAGGCGTAGAGAGAGTTAGAGCATCGTATTATTTGCCAGAGGGCCACAAGGATCGTTTTGCTCTTATTTCTGATTCACCACTTGTGGATTACGCTTCTATGCAGAGGCCATGCAATGTCGAACGAGTTGGAAGACTTTTTGGATTAGTAAATTATTTTTAA\n>XR_004836665.1 PREDICTED: Folsomia candida uncharacterized LOC118438235 (LOC118438235), ncRNA 
\nCTGAGAACAAGGCGATGGGGATGAGCAGCATAATACTGGCTTCGTCGGGGGCGAGGGTTTTAATTCTACGGTAAACTTGTACTTTCGTTTCGAGCACAGGGTTTGGAGTGAAGCCAAAACTTTCTTCGGGCTAAGGTCTGTCATGAAACTTTAAGCAACTGTCGGTTGCACCACAGTCGGAGAACAGAACAACAGCAACCATCAACATGATACTGGCTTCATCCGGAGCATTGGTCCGAATTCTTTTGTGAAGTTGCATTTGCATCTCTTTCACCCCGTCGGCACAATTACAGGCACATTCGCCACCCTGCACAGAAAAATACACATATTCAAAAAGTGTACACAGATTTCTGAAATTACATATGTAACTTCTTAGTGGAAAACCAAAATGTGTATAAATTTTGAACCAAATTAAAAATTTTGAGGATATTCATCATGTTATAACATGAAATGTATATATTTCACATTTATCTTGCGAATTAAAAATGGTGTAAAAATTATTAATATGCA\n>XM_039871033.1 PREDICTED: Pteropus giganteus Scm like with four mbt domains 2 (SFMBT2), transcript variant X6, mRNA \nCATATCTCCTTCTGCAGACTTCGACCAGTTGGTTGGTGTCAAGAGAATAAATACAGAATGGACCCACCTTCAGAAATCTATCCTTTGAAGATGGCCTCTGAATGGAAATGTGCTCTGGAAAAATCCCTTATTGATGCTGCAGAGTTTCCTCTTCCGGTGGAAGTGTTTAAGGATCATGCAGATTTGCGAAGCCACTTCTTCACAGTTGGGATGAAGCTCGAAACAGTGAACTTGAGCGAGCCCTTTTCTATCTGTCCTGCATCAGTGACCAAGGTTTTTAACAATCATTTTTTTCAAGTGACTATTGACGACCTGAGACGAGAACCTAGCAAACTCTCAATGCTCTGCCACGCGGATTCCTTGGGGATTTTGCCCGTGCAATGGTGCCTTAAAAACGGAGTCAATCTCACGCCTCCCAAAGGCTACCCTGGTCCGGACTTTGACTGGGCAGATTATCACAAGCAGCATGGAACAGAAGAAGCACCTCCCTTCTGCTTCAAAAACACGTCATTCAGTCGGGGTTTCACAAAGAACATGAAACTGGAAGCCGTGAACCCCAGGAATCCAGGAGAACTCTGCGTGGCCTCTGTCGTCAGCGTGAAGGGGAGGCTGATGTGGCTTCGCCTGGAAGGCCTGCAGACTCCCGCTCCGGAGTTTATCGTTGACGTCGAATCCATGGACATCTTCCCAGTGGGCTGGTGTGAGGCGAATTCTTACCCGTTGACCACACCGCACAAAACGGTCTCACAAAAGAAGAGAAAGATTGCAGTTGTACAACCAGAAAAACAGTTGCCATCCACAGTGCCTGATGAGAATATACCTCATGATCTTTACTTATTCCCTCACTTGGACAACACAGGTACTGTCAATGGGAAGTACTGCTGCCCTCAGCTGTTCATCAATCACAGGTGTTTCTCAGGGCCCTACCTGAACAAGGGGAGGATCGCAGAGCTGCCTCAGTCGGTGGGGCCAGGCAAATGTGTACTGGTGCTCAAAGAGGTTCTTAGCATGATAATCAATGCAGCTTACAAGCCTGGAAGGGTCTTGAGAGAACTGCAACTGGTGGAAGATCCACACTGGAATTTTCAGGAAGAGACACTGAAGGCAAAGTACAGAGGCAAAACGTACAGGGCCGTGGCCAAGATTGTACGCACGTCTGACCAGGTAGCAGACTTTTGCCGACGGGTTTGTGCCAAGCTGGAGTGCTGTCCAAACTTGTTCAGTCCTGTGCTGGTTTCTGAAAACTGCCCAGAAAACTGCTCCGTTCATACCAAAACCAAATACACCTATTACTACGGGAAGAGAAAGAAGATCATTAAGCCCCCAATCGGGGAAAGCAACGTTGAGAGCGGATGCCCGAAACCAGC
CAGGCGTCGGAAACGGCGAAAATCCATTTTTGTGCAGAAGAAACGGAGGGCTTCTGCCGCAGACTTTGCCGCAGGCTCGGGGGAGGAGAGTGAGGAGGAGGAAGCGGATGCCGTGGACGATGACACAGGGAGCGAGGAGACCGGCTCCGAGCTCCGGGATGACCAGACGGACACCTCTTCGGCCGAGGTCCCCTCCGCCCGGCCCCGGAGGGCTGTCACCCTGAGGAGCAGCTCCGAGCCTGAGCGCCGCCCACCTGTGGACAGGGCACGACGGGGCCGTCGCGTGCAGGCCACCTCCTGTGCCGTGGGCGACAAGGGCCCGGCAGCCGGCCAGGACACGGCAGAGGAAATAAAACAGGAGGAGGAGGGGAGACTGGTTCTGGAGAGCAACCCGCTGGAGTGGACGGTGACTGACGTGGTGAGGTTCATTAAACTGACGGACTGCGCCCCCTTGGCCAAAATATTTCAGGAACAGGACATCGACGGGCAGGCGCTCCTACTGCTGACACTTCCCACCGTGCAGGAGTGCATGGAGCTGAAGCTGGGACCCGCCATCAAGCTGTGCCATCAGATCGAGAGAGTTAAAGTGGCTTTCTACGCCCAGTATGCCAACTGATTCTACCTTCAGGGGATGTGGCCCATTGTGTTGGTGATGCCGCGTCTTGGGAAGGTTTTCGGGACTGGAACTTTTATTTTTCTGGGTTATGAGAGATGGTTCATATACTGTTACTGAAAAGCAAGAAGCGTGAAGGACCTCCTTCACTTTCATCCACCAGCCTGTTTCATAGTTTCATGTTTTAAAGCTCATGCCAGGACCACAGCAGTGGCCTCTGGAGAGTGTAAATTAAAGTTCTGTGTCAGA\n>XM_028176078.1 PREDICTED: Bombyx mandarina disheveled-associated activator of morphogenesis 1 (LOC114244323), transcript variant X2, mRNA 
\nGGACGCGATGCCTGGGTCGCTCAAACGTACGATTCCGACGAATTGACGATTTTGGGCTGAATACAACGAGGACGCAGTGCTTTAAAAAACAAAACAAAAATTTTGACAGTTAAAATTACGCGCGTTTTTTAATCTGTGGACAGTGCTTTAATGGTATTTGTGGGAAAAGTGTGCATAGTTTTTCGGACAAATACTTCGGTTGTAAAATGATGATTGAAATCGAGTGATAGATGTAAAATGTGATAAAGTGAATAAATAGTTAATTGATAGCAACAAGACAGCAAAATGTGCAGCAAGGATCAGATCAATCACATACTCGGGAAGATCAATGTGGGTCTGCCGTCGTGGTCCCGCGGTGTGGAGGCGGTGGAGGCGGCCCGGACGCGTCTGGTGCGTTGGGCATGTGGCGACCCACCTATCGAGCCTGACCCGCCAAGGAAGAAGATGCCGCATGCGCTAAGACGGAGGTGGCCGCTCTGTCCTTGTTTACAGAATGACGAACCGCCCGAGATCACGTACTGCGTGGTGGGCGGCGAGGGAGGTCTCGCCCTCCAAGCGGTCACCCCCACGCATCCCATGCCCCCGGAAGATGAGCTGGACGCCAAGTTTGCGGAGCTGGTCGAGGAGTTGGACCTGACAGCAGTTAACAAGGCCGCGATGATGGCGCTACCGGCTGCCAAGAAATGGCAGATCTACTGCAGTCGTAGGCCGCCACCGGGCCAGGCGCCTCCACTGGCCACCGCACCACAAGTCGAGGAGTACATCAAGGCTCTTAACGAGATCGCTGATGCATTTGCGTCGTCTGAAGGCGTCCCCCCGACGGAATCCTGCGGCCTACTCGAGGGCCTGAAGACAGCGCTCAGGACGAGGGCTCACAGCTTCGTCCTCCGGTTTATCAAGCAAGGAGGACTCGGTGCCATATTGGACGCGTTGCAGAAGGCGCCCAGGGACGATGCTGTCACGAGACATAACCTTATAGCTGCCATAAAAGCCTTGATGAATAATTCGACTGGTCGTGCTCATGTATTAGCTCATCCCACGAGCATCGATCTGATCGCTCAGTCCTTGGACACGGAGAACGTGAAGACGAAAGTCGCAGCACTTGAGATACTCGGCGCTGTATGTCTTGTCCCCGGGGGACATAAAAAGGTGCTAGAAGCGATGGTCAACTTCCAAAAGTATTCCGGCGAGAGGGCCCGCTTCCAGAGCATCGTCAACGAGCTGGACCGCAGCACCGGCGCCTACAGGGACGACCTCGGCCTGAAAACGGCCATCATGTCGCTCGTCAACGCCGTGCTCAACTACGGGCCCGGCGAGGAGAGCCTCGAGTTCAGGCTCCATCTGAGATACGAGCTGCTCATGCTGGGGCTTCAACCAGTGATCGAAAAACTCCGCAAATACGAAAACGAGACGCTGGACCGGCACATCGAGTTCTTCGAGATGGTCCGCGGCGAGGACGAGCGCGAGCTGGCGCGGCGCTTCGACCGCGAGCACGTGGACACCAAGAGCGCCTCCGCCATGTTCGAGCTGCTGCGCCGCAAGCTGGGCCACTCCGCCGCCTACCCGCACCTGCTGTCCCTGCTGCAACACCTGCTGCTGCTGCCGCTGGAGTACGGCCCGCAGTCCCAGCACTGGCTGTTGCTGGACCGTGTGGTGCAGCAGGTGGTGCTGCAGCAGCCGGCGGCGGGGGCGCGCGCCGACAGCGAGCAGGGCAGCGAGGGCGGCAGCACCAGCGACCAGACCAGGATATACGATCCGGACGTGGCTCCCCTCGAGATAAACGTCGGCGAGATAGTGCATTTGCTCGCCAAGGAGGAAGAGCTCGTCGCCGCCAGGACCAAGGCCGAGAATCTGGAACGGGAGAACATCGACCTGGCCACAGAGCTGGCTAAGAAGTTGACCCAAGAGAGAACCGAGAGAGCGAGATTTGAAAAACTAGTCAGCGAGGGAAGCATACCTGATGATGCTAAGGTGAACAATCTGAAGAACGCGGTGATC
GAAACGTCATCGGTACCTCCCCCTCCTCCGCCGCCGTCAATGTTCCCCGCGCCCCCCGCCGTGCCGGCTCCTCCCCCCGCGCCGCTCGCGCCTCTCGCCCCCCTGGCGCCGCTCGCCCCCGCCCCTCCCAAGCCCAAGAAGAACGTCCCCACTCCCGGGAACCCGCTCAAGAGCTTCAACTGGAGTAAATTACCTGATACCAAGCTGCACGGCACGATATGGCAGGAGCTGGACGACACGAAGCTGTACAACGCGATGGATCTGCACACCATCGACAAGATGTTCTGTGCCTACCAGAAGAATGGCGTCCAGAACGAGGGGTCCGTCGAGGACCTCCGCCAGCTCGGGTCGAAGCCCAGGACGAAGATACTGTCCGTGATAGACGGCCGCCGCGCCCAGAACTGCACCATCCTGCTGTCCAAACTTAAAATGACCGATGAGGAGATTTGCAGAGCGATCCTCAAAATGGACAGCGGCGAACAACTGCCCATCGATATGTTGGAGCAACTCCTGAAGTTCACGCCGAGCGCCGAGGAGGCCGCCATGCTAGAAGAGCACCAAGATGAACTGGACAGCATGGCGAGGGCGGATCGCTTCCTCTACGAGATCTCCAAGATCCCGCACTACTCGATGCGGGTGCGCACGCTGCTGTTCAAGAAGCGGTTCGCGGCGGCGAGTGCGGAGGCGAGCGGGCGCGCCACCACCGTGCTGCGCGCCGCGCGGGACATGACGCGCTCGCGCCGCCTGCGCGCGCTGCTCGAGCTGGTGCTGGCGCTCGGGAACTACATGAACAGGGGAGCCCGCGGCAACGCGTCAGGGTTCCGGCTCTCGTCACTGAACAAACTCGCCGACACCAAGTCCAGTGTTACAAGAAACACCACGCTCCTGCATTTCCTGGTCGAAATGTTGGAGACACAGTTCAAAGACATACTGCTGCTCGAGGAGGATTTACCGCACGTCCGAGCCGCGGCTAAGGTTTGCGTGGAACAACTGGAGAAGGATGTGGGTGCTTTGAGGAGTGGCCTCCGTGAAGTCGCGAAGGAGGTGGAGTACCACGCGTCGCTGCCCTCTCCGCAGCCCGGTGACGCCTTCCTACCAGTCATGAGGGAGTTCCATGCGCATGCTGTTTGTACCTTCACACAACTGGAAGATCTTTTCCAGGACATGAAGAGTCGTCTCGAAGCATGCGCCCACGCCTTCGGTGAAGAGACAAGTGCGTCCCCGGAGCAACTGTTCGGCGCCATGGACGCGTTCCTCACGCAGCTCGCGGAGGCGCGCGCCGAGTGCGACGCCATCAGGAGGCGCCGCGACGACGAGCAGCGCCGGACCAGGCACGAGCAAGAGTTGAAAAAGCGTACAATGGAACGTAAGCAATCAAACTCGCTAGGCTCGGTGAGCAAATCCCTAGCGAAATCCAACGGGGATTGCAACGGACACTCCAACGATAGCTCCCGGGACGGCACCATGAGTAACGGACAAAAAGGAGAGTTCGATGACCTTATATCCGCATTACGAACAGGAGATGTCTTCGGAGATGACGTGGCCAAATTCAAAAGATCAAGAAAGACTTCCAAAGTCACTCAGAAGGGTCGCGACTCTCCTCCCAGGGGCGTGTGCAGGGAAGACTCTAGGGAGAGACAGAAGAATTGAGATTGACAGCAGTTATTGATGTGTCAAAGAACGTGAGTACGGCTCTATGCGTGAACGTTGCTTGTAAGTACAGAAATTTGTTACACCAACTTTTCTGTTACTAGAATCGACCACATGTTTGTCAATATTTCGAAATACCCTCAAATAAATAATTAGGCATTAAACTGTAAGTTTTGAAATAGTATACATGTACTTATTCGTCGATGCTAATTAAAGTTTGGGAACGGAGAGCCGATGACCGTCATACGTCGGAATATCGATTAGAATGACTGCTTTAAAATAATCGATTAGTATAATTGTAACAAGTGATATTTTCGAAGTAGATTAGTTTGGACGGTGATGGTGTGTAC
GTCACAAAATATTTAGAGATTTATACAGAATAAAAGATAGGACGTTTAATGTGCTAAATACCAATTAATTAGCGTGATCGCTTATATATTAAATCGATTAATAAATAATCGATATTAAATCGACTAATAAATAATCGATATTAAATCGATTAATATATAGCAGAGTTAATTTAATTGTTACACAAATGTATTAACTATAGACGATGGAATAATTTTAAACGAAGTCAGCATTAACTATTAATTTAGACCTTAAATTGCAGTGGATAAGGACTGATCTGTGATTTCACAAATTGTTTACCTTGTGTCTGTTTTTAATTATCACAGGTATATGTTTGCGGCTTGGTCTTAATTAATTAATTTCATAATAAGTAGCGTTTTGCCTTTAATACTTTGTAATTTTTGTATGCATTTTACCACGTATTTTAGTGGTGTTTTTTGGTACTAAAATAAAGTATTTTGAAGAGTATTTTTTTTGTAATAATTTTTGCAAAAATTGAAATAATTGTAGATTGAGATACAGTTTCAATGTTTTGTATTTTTTCGTAACGACTGAAGTAGTGAAAAGGCTGCAAATAAATGATTCCGTAAACAATTTTTTTTGATAGTCTTAATCTTACTATAGAGCTATATGTGTTTGTATTATCTATGTACGTAGTATTTAGATACTGTATTTAATGCGTTCGATTTGACACCGTACCCGGTGTTGCCAACACACAAAAACAAACCTAACATATCCCCGTTAGG\n>XM_042445786.1 PREDICTED: Sceloporus undulatus transmembrane protein 258 (TMEM258), mRNA \nGAGAGAGGAGGCGAGAGGGGACTTTCATTCTGGCCTGGACAGGAAGTTCCCGGATGGATTTCCGGCGTCTCCGCCGAGGAAGAGACGTGTCCCTGCGTGGCCTGGGAGGAGGAAGAGGAGCCTGAGCTGACTAGAGAAGGGGCCAGGGAGCAAGATGGAGCTTGAGACGATGAGCAGATACACCAGCCCAGTGAACCCGGCTGTGTTTCCACATCTGACCGTGGTGCTCTTGGCCATTGGCATGTTCTTCACTGCCTGGTTCTTCGTTTATGAAGTGACCTCTACTAAATATACTCGGGATATTTACAAGGAACTGCTCATTTCCCTGGTGGCTTCACTTTTTATGGGCTTTGGAGTACTCTTCTTACTGCTCTGGGTTGGAATCTATGTTTGACAATAAGCCAAGAGCTGTTTCAGGTTCCAGAAGAATTGCTGAAGTTTCTTTTTTATTTTTGTACTTAATGTAGCTCATCACACCTGTAGTCTGTGTAAATCCTGACACATTGTTACAGCCCAGAATATCGTAACATCAGATGAATAAAGCTGACTGTGATGACATGAA\n>XM_024284361.2 PREDICTED: Oryzias melastigma peptide Y (LOC112153899), mRNA 
\nTCTCTCTTCCTGATAATGTAATCAACCGCGCGCGCGCGTCAGGTGTCCGTGGCTCTATAAAAGCCTCAGATCCGCGAGGAGAGGAAGAAGAATCCACGGAGACACCAGTCCAGCTGACGATGGCCAGAATCCTGAGGTCGTGGGCGATGCTCGCCGCGCTCGTGCTCTGCCTGCTCGTGTGTCTGAGCAGCCTGGCGGACGCCTACCCGCCCAAACCGGAGAGTCCCGGGAGCAACGCGTCACCGAAGGACTGGGAGAACTACCAGGCGGCGGTCCGGCATTATGTCAACCTCATCACCAGGCAGAGGTACGGGAAGAGATCCTCCCCTGAGCAGGCCGCGGCTTGGCTGCTGTTTGGGGCGGATTCAAGTCAAGATGCTGAGCCCCGGTCTGACTACGTTGAACCGTGGTAAATGAGCTCAACTCTACCCTGCACTACTGGACAAGTCCTCTAGATTTGATTATTTAATGAGCATGCAAATTTCTTTCTCTCTCATCCTGTTTGTCTGCTGCTGTCAGTAAATGTTTGTCCTTTTCTCAAAATTTGTAAATAAATTCTTGTATGTAAAATAATCTCTTTACAATAAAGATTTAAGTGGA\n>XM_004989695.1 Salpingoeca rosetta mitotic checkpoint protein BUB3 (PTSG_08955), mRNA \nCGTTAATAACCGCCAGTGCCAAAAAGGAAAGGAAGCACAGAAGACCGTGAGGAAGCACAAGCACACGACACCACACCACACCACACCACCGCACGCACACCGACACACCACACCACTCGCCAACATGACGGACACTGAGCTTGTGTCGCCACCCCAGGATGGCATCTCCTCTGTTGTGTTTTCTCCGACCAGCAACTTGCTTCTCGTTGCTTCCTGGGACAAGACGTGCCGGCTTTACGACGTGGACTCCAACACGCTCAAGTTCACGTTTTCGCACGATGCACCGGTGCTGGACTGCGCCTTCCTCGACGACACAACAGCTTTTGGTGCGGGGATTGACAAACAGCTGCACAAGTACGACTTGACGACTGGCAAGAGCTCCGTTGTCGGGTCGCACAGCGAGGCCATCAAGTGTGTGGAGTGCTCGATCAAGCACGGCGTGGTCATAACCGGCAGCTGGGACAAGACCATCAAGCTGTGGAATCTCGAGTCCCTCGAGTGCGTCGGCGAATACGCCCAGCCAGACAAGGTGTACACGATGGCGTTGGCTGATGACCGCGTGATCGTCGGCATGGCTGGTCGACACGTGTGGGTGTGGAACCTCAACAATATGAGTGCGGTGGAGCAGCGACGAGAGTCGAGTGTGAAATTCCAGACCCGGTGCATCCGTGCAATGCCGGACGCCCAAGGGTATGTGCTCGCGTCGATTGAGGGCCGTGTTGCTGTGGACTATCTCGACCCGTCTGAATCGTCGCAGAAGCGCAAGTTTGCGTTCAAGTGCCACCGCTCGAAGGAGAACGGGCGTGATGTCATCTACCCGGTCAACGCCGTCGCCTTCCACCCAACCTTTGGCACGTTTGCGACGGGCGGGTGCGATGGGCTCGTGAACGTGTGGGACGGCGTCAACAGGAAGCGCGTGTACCAGTTCCACGAGTACCCGACGAGCATTGCGTCGCTGTCGTTCAACCACGACGGGTCGCTGCTCGCCATTGCCGCATCGTACACATATGAGGAGGGCGACAAGCCCCACCCGCCCGACGCCATCTTCATTCGTCGAATCACGGAGGAGAACGTCAAGCCAAAGCCACGCTCATAGACACACACGCGCGCACGCACACACACACGCACACGCACACGCACACGCACACGCACGCACACTCAAATCAACACACGCACCATATGTTCCACGTTTTTTTCTGGTGTTGTTTCTTCACTGACTAACAATACAATCACGTTTCGTTTCAAACAAATGAACAAGAAACAAGCAATAGC\n>XM_002366755.1 Toxoplasma 
gondii ME49 hypothetical protein partial mRNA \nATGTTCCATCTAGCCTGGGTTGTCAGTCGAGAGATCCCCTTCTGTTTCGTCTCAAGCGTCTCAGCTACTTTGCCTCTCGCTCTGTTGCCTGTAAAAACGCTTTGTCAGAAACGATCTCTTCAGATGCAGAAGGAAGTTGAACAGAGAGGCTTGCTCCGTCTTGAGCAGTCACGTCTCATCCAAAAGGTCAAAGAGGAAAGCCAACTCATGGAGGAGTACGTGGTCGAAATCGACCGGCTAAACAACGTCATCAACGTCCTTGAGAAAGAAATGCTCAACACCAAGAGGGTGTATCAAACAGCGATTGAGTCGCGAAATCTCACTGGCATTCAGCTGATTGACAGGCAAGCGCAAGACAAGGACACAGAAAAGAAAAGCCAGCGCGCCCTCCACGAGAAAGAGCAGGATGTCAACACGCTCCGGCTTCAACTGCAAGAAGTCGAAAGGCAACTGCTTTCGAAAAAGAGAAGGGCGAAAGAGGTGCCCATTTTGACGGCGGAAGTCGAGAACTTGAAGACGCAACTTCAGGAAGAAAAACAACTGGCAGAAAACATCAGTCGCAAACTAGAAAACCCAACTGAGGGCAGACAGTGGCAAGAACTTGGAGGGGAAGATCCAGATATGGAAACATTGGAGGCGAAATATCGGGTGATTGAGCAACGTTTCAGAAGTGTAAAGAGCGAGCTCATTGATCAAGACTTGCGCCTTGAAGACTTAACGGAGTTGACAGAAAAACAGAAAGCGAGAGCCGCAGAAGAGCACTCGGACGCGATTCGAATTCGCAGCGAAATTCTTAGACTCCACGGCAAACTGATCGAAATGAACCGGCGCATGAAGGTGACGATGTCTGAGTTGACGCTCTACAAGGAGTATTTGCCGAGACTTAAGCAGCTTCAGGCAGAAATAGCACAGAGCGTGGAGAACGCCCGTGAAAATGTCTTCTTCGGTAGACCTGCTACACCAAACGCAGAGGAAGAACTTGCCGATATGCTCAAGAGAGAGGTGGCTAGAAATCAGATCCTCTACGCAGCTAAATTGCGCACTCTCGAAGAGCAGCGTGAGGTAACAACATTACGGTAA\n>MW050496.1 Uncultured Ascomycota clone OTU1949 5.8S ribosomal RNA gene, partial sequence; internal transcribed spacer 2, complete sequence; and large subunit ribosomal RNA gene, partial sequence \nGAAATGCGATAAGTAGTGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCCTTGGTATTCCATGGGGCATGCCTGTTCGAGCGTCATTTGTACCCTCAAGCTCTGCTTGGTGTTGGGTGTTTGTCCTCTCCTTTGCGATTGGACTCGCCTTAAAATAATTGGCAGCCAGTGTTTTGGTATTGAAGCGCAGCACAATTTGCGATTCTATCCGGTAATACTGGCGTCCATAAGCCTATTTTACACTTTTGACCTCGGATCAGGTAGGGATACCCGCTGAACTTAA\n>XM_053179842.1 Colletotrichum chrysophilum uncharacterized protein (COL26b_007034), partial mRNA 
\nATGGAGCCAGAAGGCCCATTGAATGATGAGGACTCGGATGAAGACTGGTTCTGTGGATCACCCGCATTCCCAAACCAGTATGCCTGTATCACTCTTCGCGGTGGCTCTTGGAATGGTCCTCCGGAGTGGGAAATCCCTGACGATGGCGAAGGGCCGGTTTTTGAGGGACCGGGAAGTACTCCCAGTCTCTCCATTCTGGAAAACCCAGCCTCGCCGCCCACAAATATGCAAGAAGGCATCGCGTCTGGCTGCAACCGCTACGTCCAGGCCAACATCACGATTGCCTCATGTTGGAAGATTACCAATGATGGCGGCACCTTGCAAGCACGCTTGTTCGAGGTCGACCTCGTTGTCGGCAAGCCGGGCGAGCGCTGCGATACGCAGGTGTGGCTTGGCTACTAA\n>XM_012089747.1 PREDICTED: Cercocebus atys germinal center-associated, signaling and motility-like (GCSAML), mRNA \nAGATGCAACGTCCTGCCTCATGCATTTTCCTCTTGGTGCTTTGGTCAGAACTTCCCCAAGTGGAGTGAAACTCAGGAGCTGAGAAACCGAGTCACTGTGAAAAGATGGGAAATTATCTCCTGCGAAAACTCAGTTGCCTGGGAGAGAATCAAAAGAAGTCCAGGAACGGAAACCCAGATGAGGAAAGAAAACGGCAGGAAATGACTACATTTGAAAGAAAACTTCAAGATCAAGATAAGAAAAGCAAAGAAGTTTCATCCATTTCTAATCAGGAAAACGAGAATGGCAGTGGTTCTGAAGAAGTGTGCTACACTGTCATTAATCACATCCCCCATCGGAGATCTTCCCTGAGCTCCAATGATGATGGCTATGAGAACATTGACTCCCTCACAAGGAAAGTGAGAGAATTTAGAGAAAGGTCAGAGACAGAATATGCCCTTCTTAGGACTTCTGTTAGTAGGCCTTATTCCTGCACCCATGAGCATGATTACGAAGTTGTGCTTCCACACTAAAACCCTCAAGCCGCTTTATCACCTTGTAGCAATGAAGATGATGCAGAACAGCAGACTCTGGAGAAGTTCTTCACCCTGAGCAGTGCATGAAACATTCCTTTCTGGCTAAAGTTTAGAAATATTATCTTATTATATATCCTTAGGCAACTCTGAAATGTGGCATCTCTGTGGTTTAGGTGGAATCATAGAAATTGAAACAATGATCTAAAATATTCTATGTGTTTTTGCTTGCAAAGTTTGAGGACATGGAGGTGATAAAAAAACTTTCTTAGGACAATAATGTAAAATGAAAATAAATTCCTAATCCCCCTGACTAACTGAATGGACCACCTTCTGGGCCAAGGAGACCTCAGATGATCTTGAAAGACTGAATTCTGGCCATGATAGGAAGGGAGATGAGACACACCTTGTTATACCCCTTCCCTTTTGGAGTTTAGGCACAAGTGACCAGGATGAGTCATAAGACTGATGAAACAGACTGATTGTGGCAATAAGAGTCCAAATTCCTACCTGACTCTGGTGTAGATCACACGCTGTCTGAGGGGTTCCATCTATGAGACTTTGTCTACATAACAAAGACCTTGGTTTCCACAACCCCTTTATTTTAGCTAAAGCATTCTTCTCTACTGACTTCTTAAGTCTTTAGACAAAGCTTAACTCTTTCAACCAATTGCCAATCAGAAAATATTTGAATCTACCTATGACCTGTAAACTCTCTCCTGCTTCAAGATCTTGCCTCTTTAAGCTGAACCAATGTGCACTTTCCATGTATTGATTTGTGTCTTTGCTTGTAACTCCTGTCTCCCTAAAATGTATAAAACTAAACGGTAACCTGACCACCTCAGGCACACTTTCTCAGGACCTCCTGAGAGTGTACCCCAGGCCATGGTAACTCATATTGGCTCAGAATCAACCTCTTTAAATATTTTACAGAATTTGGCTTTTGGTTACCAATAAATCTCCACA
AATAAATGTCCAAGAATCTTCAATTCCAACCCTGCTCACCAAAGTTCAAATGCCAACATCTCCCCATCCAATTACCTATTTCATTTTTGAGGTGTAATCTACTCAATAAACTGTATAAGACCAGTGACCAGACCCTTTGCTAACCTGATATTTACTTCAATTTTTCTTTTTCTGTGTACTGGAGATTTTTGCTTATAAACTTACAGTAATAGTTCAGAAATTAATAGTTTTTGACATTGGCTTTTCTGAGAAGAAAATTGAAAGTGTCACAAAATAAAAAAAAAAGATGAAATGAATCATATATAATTGTCCATTTTTTCAATTTTCTAGCCAGTAGAGGATTGAAGGATTCTGTTTAAAGATTAGTAAAAATTGAAAATAAACTTGTGCTTATACTTTGTGTGCAACACACTAGTTAATTTAACCTGTGACTAGTTATCTCTACTGAAGGTGGATGTATAGTTTCTGGTTTTAAAATTCAAGCAAACTGGAAAATGATCCATCTAATTATACTTTCTTTCCCAAGAAATTTTTAAATGATATGCCAGCTTCCTAATTTGGAGATAAAAGCCTTAATTGACAATGCATTTATGATATATATTTTTTGTATAGTTACAGTATACAAGTTGAATATCCCTTAGATAGATGCTTGAGAGCAGAAGTGTTTTGGATTTAAGATTTATTTTTGGATTTTGGAATATATCCATACACATAATGAGGGAGTTGGAAGATGGGATTCAAGTCTAATCATAAAATTCACTGACAGACTGGATTAAGAAAATATGACACATATACACCATGGAATACTATGCAGCCATAAAAAAGGATGAG\n>XM_028615259.1 Sodiomyces alkalinus F11 hypothetical protein (SODALDRAFT_392700), partial mRNA \nATGATGGGAATGCACCCAAGCCACGAACTATCCGCCATCGAGGAAGTTCTCTCAGATGAAGATGAAGATGATAACAACAAGAAGCTGAATGATGTTGACCATGAAGTCTCGGACCAACCGTACCCTGCCCTTGGTTCGGGTCCCATCGCCGAAGAGAGTCAGAATGGCCAACAATTTCCGCCGGAATCTGCTGAACATGACACGAAAGACTCCCACCGCTCGCAACAGGTAGATGCTCAGCATAGCCCTGATGCGAACACGGTTGGCTTGGCCATCTCGGAGCACGAGGACGGCCAAGTTAACCAGTCTGGTTTCTTTGGCTATGTCCAACGGAACGACGAGGGGCACTATGCTAATGCCCATGATACCTCCGATGGGGATTCGTATGATCCGATGGACCTTGCTCCGCTTCAAGACATGGTCCGTAGCGTTCCCAGCTCGGGGGGCTGGGAGCCCGAGGAGCAATATGAAGCCAAGGCTCTTGAGGGTCTTCAACGGGAAGAAGAGGTTGTCCATACTCGAAAACCAGTCCGTTCAGCCTCCCTGGAAGAATTATATAAACTTACTACCGAGGGGTGGCTGGATGCCAACGAAGGATCGAACGGTTGGTATCCTATCAATGGCCGTGATGATCCAGAGGGAGACGAGGTTGTTCATGCGAATCAACCCACCCGTCCAGCCTCCCTGGAAGAGCTATACCGGTTCACCACAGAGCAGTGGCTAGATGCCAATGGAGAAGAGGACGGCTGGTATCCTATCAATGGCAGTGGCCGTTTATCGGACCCTCCGGCGTCCGAGTCTCGTCAAGATGACAGCCCAGTTAACTTCGACCTATTTCACGCGGTGGTTAATTATGTTCCTCCTTACTTCACTACCAATTACCAAGGGAGACAGGCCGGAGACCGTACTGGTCAGCCTGAGGCCACTGGCGGTGCTGTCTATTCCCCGAACACCCGTGACTGGGCCGATTATGGAAGCGCTCTCGTCGACTACGCCCCTGAGACGGCGATTCCCAAGGTTCCTGGTTGCACAGCTGGCCAGCATCATGCCCAGAATTGGACCTTCGGTG
CTTCTGCCTTCATAGCATATGCTGCCATGCGTGGTTCGGGCATGGATACGGGCAACCCGCTCCAGACCTGGATGGGGGTTAAGGGTATAGAGCGTCACGGCCATGACCACGACCTCGACTACGACCACAACAACTCCCGGGCCACGGACTCGAAGGCCGACGACTTCAAATTCAAGCAACTAAGAAGTTTCACCGCCGAGGTTGAAGTGGCCCTTTGGGAAAGACCCTTGGTCATTGATGAGAACCGTCAGCAGCGAGTTGAGATCCCCCGACCCAAATACAAGCACCTGAACCCTCCCGAGGGGTTTGAATATCCCCATCACCTCGCGTCGTCGATCAACGGCATCGCCGCGGATAGCTGGGAGAGAGCGAAGACTTTCGAAGAGGAGTACGATATCTCGGATGACGAAGGATCGCCTCCCTCTGGTCGTATATCACCTTGCACATTCCGCGTCCTGGCCGAGGGTTGCAAGCGCTGGGAAGACCCGGCCAAGGACCACAGAGTCGAGATGCCCCCTGAAACGAAACGACTTCGACCTGAGACTCCTCCCCCGACAGACATGCCGACATATCATCGCAACCGTATGGGCCACAAACGCACCTTGCAGCAAGACGTGGAAGACGGTAGCTGGCTCTCTCCCATCTACTCTGTGACTGAAGACCCGAGTATCATCTACACGCCTCCCGGAACCCAACGTCATCCGACAAACTTTGCCATATGTAACTGGCAAGACAACGTCCACGAGGTCATGGACCCTCTTGGCGCCCAACATCTGCGTGAATTCCAGCCCACCAGCCATATCGCCCCTAAAATCACCACGCCCAACGACCTGGCCCCGGCCCGCATAGCCTCAGCACACACCGCCGCGACGCGAAGCTCAGAGAACCGGCCCTACACAGCAGCAGAAGTGCAAGCAGCCCTGCTCTCCCCGCAAGCGCGACCGCTAGTAGACGGCAGCATAGCGCCCGAACACGCAGCGGCGGTGCTCGGAGCCCACTGGCAATGGGCATGCCAGATGCGCGACGCCGCGGCGCAGCAGTCACAGCGCAACGAAGAAGCGCGGCAGCGCATCAATTCTCTGCGCGACGAGCTGCGCGACATGGAACTCTGCGTCGACCACGTCCTGCAGAGGCGCGAGGAGGAGGAAGAAGAGGTGGTGGAGGAGGAGGACCAGCGCCGCGTCGAGCGCCGGAACCGCCGCATCATACGCCAGGTCAGCGCACACCTCCGCGAGGTCGCGTACGAGGTCCACCGTCGTAGGGAGCAGCTCTGCGTTGTCCTCGGCGAGGCGGCGCAGCTGGAGTGCGAGGAGCAGGTCCTTACTGCCGATGTCCGGGCTGAGATTGCGCGGTCTGGTCTTCCCGATGCTGATGCCGTTCGTGCGGAGGCTGGGCGGGAGTTTCTTGAGCTTGCAGGAACTACGTGA\n>XM_017399093.1 PREDICTED: Daucus carota subsp. 
sativus histone deacetylase HDT1-like (LOC108224459), transcript variant X2, mRNA \nCGAAATTATAGTGGTCCGCGATACACAGTATCCTCACCCCCTTCCTATATAAACATATGCATTCTTCATCTTCTCCGTTAATTAGCCCTAGCTTTTACTCGAAAAATTACTCGAATTAGCATCAACACAGCTGCAATGGAGTTTTGGGCTGCTGAGGTCAAAGCTGGAGAATCTTTCAAGGTGAAAATTGATGAAAATAAGGCGTTGCATCTCTCACAGGCTTGTATTGGTGATGTCGAGAAGGACATTCCTGTGTCCATTTGTCTCTATGTGAAAGTCGATGAGAAAAAGCTTGCCCTTGGAACACTTAACTCTAAAAAGTTATTTCAGCAGAGCTTTGACTTGGTGTTTGATAAGACATTCGAGATATCCCACAACTGGAAAAATGGAAGTATATTCTTCCTTGGATATACAGCTGATAATGAAAAATCTGATCGAGCTTCAGATGTGGATGATTCTGATGCTGAATCGGATGAAGATATCCCAGTTATTGCTGCAAATGATAAACAAAAGGATAAAGAAAAGGCGAAGATTGTAGAACCCAGAAAAGCTGCGAGTTCAGATACTACTGATGACTCTAGTGAAGATGATGAAACTTCAAGTGAGGATGACCCGAAGGTTAGTGTTAAGAAAGATTCTGCTGCTGGAAAACAGAAGGCGAATATTGTAGAACCCACAAAAGATGTGAGTTCAGATGATACTGATGACTCTAGTGATGATGATGAAACTTCAAGTGAGGATGACACGAAGGTTAGTGCTGAGAAGGTTTCTGCTGCTGGGAAACAGAAGGCGAAGATTGTAGATCCTAAAAATGATGCCGACTCCGGTGATGATGATGCAATGTCTGAGGATTATTCAGAGGAAGCTGATGAGTCAGATGAAGATAGTGACAGTGATGAGGATGAAGAGACACCAGTGCAAGTTAAATCTAGCAAGAAAAGAGCTCTGACGCCTGCTAAAAAAGCTCTCCCCGAAAAGAAAGCTAAATTGATTACTCCTCCAAAAACTGATGGCAAGAAGAGCAGTGTCCATGTGGCTACACCCTATCCTTCAAAACAGACTGGAAAAACTCCTGCTAATAAGCTGAACCAGCAGACTCCCAAGACTGACGGGTCTCATACTTGCAACTCCTGTAAGAGGACATTCAAATCGGAGGTTGCTCTGGAATCTCACAACAAAGCAAAACATACTGGTGGAAAGTAAATAGGATGCGAACATTGATTTTTGGTGATGTACTTTAGAATTGCGATGAACTAGGTATATGGTAGGCTTTTGGTTGTTTGTGGTGAAGTAGTTTGTTTCCTTGTCTCTTCAAGTTGTTTTCAATTGGATGCTGTGCCTCTGTAACTGAAGAAACTTGGAGGGTATGGAATTTGAAAGACTATGTTTGATGTTTCTTGTTTGTCTTTTTA\n>XM_009911451.1 PREDICTED: Picoides pubescens F-box only protein 15-like (LOC104310052), mRNA 
\nATGGACTTGCTCAGAAATCCTCTGCCATGTGAAAACAAAGAAGCCATGAGAGCTGCTGGCTTGAGCTGGATGCTTGTCCTGAAAGAGAAGNNAAAGGAACACCTAAAGGAGAAGAGAAAAGTATCATTTCAGGATGCATTTCTTAACATATTTTGGTATGGTATCAACTGGCCATGTCTGGATGTCCTCGCAACACTCAGGCTCTATGGAGTTGCGCCTTTATTTCCTTAGAGCAGGAAGGGACCTCGCTACCATTCCCTGGTTGCTGAATACCATCTTGCTGATCTGACAGCACCTGGTGCTGACAACATTCTCCAGCTCTTCACTCTGAAGCCAGGACTCTTAGTAGGCCTTTGGAAGGACACAAAGGAGATCGCTTCTGTCTCAGCCAGTCTTCATTATCATCAGTTCATGGAGAGAAGCATCTTGGGTTCTGCTGCTTCTTCTTATGCCCGTCCACTTCATCAGCCTCTACTGGGTGATACTGACCCAGAGTATGGACTGCATGGCTACTGTCTACACTTTGAAATCCACAATGGAACCTGTGCCTACATGTGTGCAACATTCAGGGACCTCTTCTGCAAAAAAGGTGAGATTGCAGATGGGTATGTGAGGCTCACAGCTGTCAGCAGCCTGCAGGACAACATGGACCACTGTCTTTTAGCCACCATGCCTGGCTTGCCCTGTCAGCTGGAAGGCACTGTGAAGGAGTGCTGTGTGCTGGATGTTACTCTCTTGTATGAAGACGGAAAAGCCTTCTGTTGTTTCAGTGGCCCAGTCTCTGTGGGACTGTCTTCCAGGACTTCAAGCTGTTATGACTTGCTGGGTCACAGCTCCAGCAGAGAGTATTGTGAACCTTCAGAAGGCGGAGTCCGTGCTCGGTTCACCTGTGTGAGTGAAAGCAGGCAGCACCTTGGAGTCGTCTTTGCTGTCTGTCCACCTAACTCGTGA\n>XM_019704704.3 PREDICTED: Aedes albopictus 60S ribosomal protein L29 (LOC109428867), mRNA \nATGGCCAAGTCCAAGAACCACACTAATACACACAACCAGAACCAAAAGGCCCACAAGAATGGGATCACCAAGCCANAGCGCCAGCGTAACGAATCGACCCGCGGTATGTGCCAGAAGTTCCTGCACAACCTGCGATTCTCCAAGAAGGGAAACCTGTCCCGTGAAGAATCCCTGAAGCGCGCCGAGGAACGCAAGGCCAAGTTTGCCGGACAGCCAGCTCCGGTCAAGCTGTAAACTGCTTCCTTCTCGATTCCGCTTCGGATGATGATGATGATGGTTGGGTGGTGTATCCGTTTTGATCCGTGATCAACATCAATTCCTAATCTGGTACGCGTTACGATATCCAATGATACCGTGCAGTTGATGAGTACAAGTGAGTTCAATGCGGAATGAAAATTCAGTTGGA\n>XR_007260822.1 PREDICTED: Pyrus x bretschneideri uncharacterized LOC103942768 (LOC103942768), ncRNA 
\nCAATTATGGAGGCCAGAGAGAGAGGGGGTGCGGCATAGAGAGAGAAGAGATAAATGTGTAATTGTGAGATAGACGGTTCTATGCTCACATAATTTTCTGCTTGGTTCTTCAGATACCTTCCGTGCAACATTTGATGTGGTATGGTTTTCCAATTTCCCCTTTGCAACAATTTCTTTTTGGTTTTTGGAGTATGTATGATTTATTTTTAATTAGAGAAGAAAAATTAATAAAACACAAGAAGCAATTGGAAACATGGCTGCAAGTGATAAGCCAGAGTCTTTTTTTTCAATTAACTATATTACTTTTGTAGTATATGCATGCGCAGGAAAAATCCAAATCGTACTACAAGATCTTAGGGCTCTGTATTTTGTGTCAAACCAATGCATTGAGAGAATATGAACTATTGCGTCTGGTTTGGATATGTGTCTATGGTGGTACCCCTATTTCAAGGCAACTGAGAGCGCTTGACTATGGTAACCCAATGGCTTTCTTTGTTGTTTTTCCTTAAGAGGTTATCGATTCCTTACTTTTTTAACTGAGTTTTTGACTATCAATATTTTGCATTTCTGAGCTTAAAGGCACAAAATGATTATTTGTTATTGGGTAGATGGGTTGCTAAAGGCAAGCAAGACACATAAAAATGACCATTGGGAACGAAAAGTCGCTTCTTCGGTGTATTTATACTTTTTTTAGTTGTATCATGCGAAATTAAGTATCGATTTGCTATGTGTATTTTGTTGAAGTTATGTTTTGATGAGCTTGGATTCCTGAAACGTTTGATACTAAAATGACATGAATAAGCATAATGAATGGTTTGAAAGATGCTATTAATGGTTTTGCGAGTATATCGTTAGTCGTTTGGTTGTATGATTTGTTTTTGTTTTTTCTTTCAAAGCACTTTGCTCTTAATTTTTTGGGGCTGCAGCTTTCGAAGCCCTTTATGCTCAAGGTAAACAATTTTGGATTTCAGCCTTCCAACAATTTTTTTATTTATTTGAATATTGTGAAAGTTGTGTTTTATATGCTATGAAAGTTGAATCTGTGAATTTTTTTTTTTTTAATTCATGGTATATATTCTATTTCATAGTTTTGGATGATGTTGGATTGAAAAGCTTTTCTATAGAACTTATAGTTATTTAAAGTGTTTTATCCATTCTTACATTTACTCTCATAAATTATAGCTGATTTGTTAATCTCTTACCAAAATACGCAAATTATTTTGTAAATTTGTTCTTATTCTAGCAGGAACAACAAATGCAGAAGGGGAACACATATATAATCAGTGTTATTCTAGCCAAAACCTTTATTCTCACAACATTGGGTACGATTGTTATAAGTTTCAATTCATTGTACCTAAATTGAAACAATTTACTATTAGCACAAACTTTTTTATATTTTAAACATGATATTTCATGCATTTTCTAATCCTGCAGCAACGTGCGGGTAGTACTTTCTAATATCTTCTATACATCAAATACATTTCCTTGGCTCCA\n>XM_022304284.1 PREDICTED: Myzus persicae uncharacterized LOC111026242 (LOC111026242), transcript variant X2, mRNA 
\nATTTCAAATTTTTCTATATAGTATGAATACAGAATATATGATAATATTTAGGAATAAAATTACCTATGTCCTATATTAATATAAACATATTTAAGTACAAATCAAAGTATAAACGCATGTCGTTAAGTTAAATAAGGGTTTAATTTGGTTTATCTGCTGATATTATTTTTTTTACTAAGTATTTTATTCTAATTTCTGTGTATCATGTCGTCAGTAAAGGAAGTTTTCAAAATAAGTTTTCAATTTTTGGCTCAACAAACAGATAATGTTATCAAGGATTTCTTGAGGCTCACCAAAGATTTTATGGACAACGGACCTAATTCCAGTCTTTATAACAAAGCTGCAGAAAAAATGCAGGTTGATGAGGACAAAATAATATCAGTTGTAAAAAGCATATGTCTCATGTGTGTGCAAAGCTGTAAGCATAAACTAACTGATTTGGAAATAAAAGAATCACTGACAGAATATGGTTTTAGTGAAACCAAATTAGATATGATTATATTATTTTTGGAAAACCAAAAACCTCATTTACTAGATATTTTGTCATTAAGTGCGTTTGTATTCCCACACTTCAAAGAACTGGAGTGGCGATTTGAAACCGATATGGGATCCAGATCTTTATTACATCAAACCGTGCCAGTTGTTACATTGAAATTAGATTTAGAAAAAAAGGATATTTCCGAATCGTTATTCCTACAAACAAATCCATTAAACTTGGTTCATATCAAAGATACACTAGAGACTGCTTTGAAACAGAACCAATCTCAATGGATAAGGAAAATACGTAGAAAATTGAAATAAAGGTATAACTGTTATAAACAATATAAAT\n>KY530257.1 Liriodendron chinense AT4G19003 mRNA, partial sequence \nATGGCTCCTGGGAAAGCCATAGTAGGGGCTGCTGCTGCAGCAATTTCCATGTCTATACTCTCCATCTTCCTCTGCAAATCTCTCTGCAATCTATCAATGAGAAAATTCCAAAGACCCATCTCAAAAACCAAAGCTAGAAAAGGCCTCATCGACGCCATCGGCAATACCCCTTTAATCAGAATCAATAGCCTTTCAGATGCCACTGGCTGTGAAATTCTGGCGAAAGCTGAGTTCTTGAACCCTGGAGGCAGCGTGAAAGATCGAGTAGCGGTTAAAATCATAGAAGAGGCTCTGGAGTCTGGTCATCTTGTTCGAGGCGGTGTAGTGACTGAGGGGAGCGCTGGAAGCACTGCCATTAGCCTTGCTACGGTGGCTCCTGCTTATGGATGCAAATGTCATGTGGTTATACCCGATGATGCTGCTATTGAGAAGTCTCAAATACTCGAAGCTCTTGGAGCTACTGTAGAAAGAGTAAGACCCGTTTCGATTACACACAGAAATCACTTCGTCAATATTGCAAGGAGAAGGGCATCTGAGTTTACCGAATTAGCATCAAGACAGCGAGAAGCCGAACGCTCCGTACATGTCAACGGTCATGTCTCAGAAGAAGGAGACCGCCCATGCGCTTTCGCTAAAGATTGCAAAGGTGGTTTCTTTGCTGATCAGTTTGAAAACCTGGCTAACTTCCGTGCTCACTATGAAGGCACTGGCCCTGAGATCTGGGAACAGACTGGTGGCTACTTGCATGCTTTCGTTGCAGCTGCTGGTACAGGTGGGACCCTTTCCGGCGTTTCGCGTTTTCTTCAGGAACAGGATCCTAATATCAAGTGCTTCCTGATCGATCCACCCGGTTCGGGTCTCTTCAACAAGGTGACAAGAGGGGTGATGTATACACGGGAGGAGGCTGAGGGTCGGAGGTTGAAAAACCCGTTCGACACCATAACTGAGGGGATCGGAATCAACAGGCTAACCAAGAATTTCATGATGGCAGAATTGGATGGAGCTTTCAGGGGTTCAGACATGGAGGCCGTTGAAATGTCTAGGTTTCTTTTGAGGAATGACGGGCTATTCCTCGGGAGTTCTTCAGCCATGAACTGT
GTTGGAGCCGTGAGGGTCGCACAGTCGTTGGGCCCCGGGCACACGATTGTGACCATCCTGTGTGACAATGGGATGAGGCATCTGAGTAAGTTCCATGAT\n>XM_052888826.1 PREDICTED: Bicyclus anynana jerky protein homolog-like (LOC112047489), transcript variant X2, mRNA \nCGCACTGTACGCGACGGCCGTAAACCCGCGCTCCATCTGAGCCCGCGTGCAGAAGGCAGTCAACGTCATAGGGACTTGGTTCCGCCTTTGGCGGATAGAAGTCAACCCAGAGAAGAGCGCAGCTGTGCTCTTCACTGGCAAACCGTTTTGCCAGAACAAACTCAAAGAAGTCTCACTCTACGGAGCTCCCATCCCCTGGCAACGTACTGCCAAATACCTAGGCGTGACCTTTGATAACCGCATGAGCTTCTCCATGCACATTAGGGAAGCTAGAAAAAAGGCTGCATACGTAATGCACCGCCTCTACTCGATGATTAACGTTAAAAGTAAATTGTCCCTCCGCTTAAAACTAACGCTTTATAAAACTACGATCCGTCCGATCCTAACCTACGCTAGTGTAGTGTTCGCCAACCGTCCCAAAGCGACCCTTAAGCCGCTTCAAAACTCTGCAAAATCGATTCCTACGGCAAATCACGGGCGCGCCGTGGTTTGTACGTAATAACGACCTCCATAGAGATTTAGAACTACCTTCAATAGCTAATCACATGAAACAGCTCTCTCAAAACTATTTTGAAAGAGCTGCCATCCATCCCAACCAACTAGTGGTTGAGGCTTGCAACTATACTCTCAACCTTAACGCTAACTCCAAGCAGAGACGTCCCAAAAACATCCTTTACGATCCTGACGATGACATGACAACTGACAATGCTTCTCAGGCAACACAATCACAAGCTACACAGCGTCTTCGCCGGCGAAGACGAGGTCCCCGATATCTAACGTCACCCGGAAGTGGGTTTTCTAACTCACGATCTCGGGGGCGTCCGGACTGATTCACTCAGGTCACGGTCAAACCCTCCCGAATGGCCCTCTAAGCCGAGGCCCGAGTCTCATAGGAGACGACCTTACAGAGCCGTTCCGTCCTCTGTTTTTATTTCAGCCTTCGTGCACAGGCGATGCTTCCGCGCTCGCCCACCCCCTACCGGTGACGTCGTAGTGGTTCCACAGGGAGCTAAACGGCATTTACTCAACAAAAAAAAAAATATTTTCATTTGTGGTCTCGCGCGCAATAGATGATACTTACGCCTTCTCTACAGTACTCGCGAAGTTGAACGTATTTCTCAAAGCAAAACAATGTCGGAAGTAAAAAAGAAGAGACGGCAATACTGTGCGGAATATATTAAATTCGGATTTATTGAAAATCCCACAAACCCATCGTCGCCTTTTTGTCTTCTATGTCTAAAAACATTTTCGAATGAAGCAATGAAGCCTTCAAGGCTGCAAGATCATTTGAATAAAATGCATCCAGATAAGAAAGACAAGAATGTAGCATATTTTCAAGACCTAGAGAAGAAGCATAATACACAGCCAAGTGTAGCAAAACTATTTGTCCAAGCGCAGACGTCGGACGACTACGCGGGTTGCGGGGTGCGGGGACACCGCGCCGGCCCGTCGTGCCAGCGACCGACGCGCGGACACTTCGAAATTGATTCGCACGGACTGTGTGCGCATACACAATACAATATTGTTGTTTGGTCTTTTATATACTTAAATAAAATTCACGAAGAGCACCAGTATTCATATTTACAACCACCAGCTCGTTAACACATCACTATTTTTGGTCTTTCGCCCTTCTAACTTTGTGGATTTGGAAACAAGCCATACGACAAACAAGAAAGGATTTCTGCAAATGGGAATACCTACAACACACAGCTGTGAAGAATTACGAGAAGAACACCACGGAAACAAAGGACGAGGGACACGATACTGAGTGAGTTCGTTCCA
TTTTCCTTCTTATTTTTCCGTCTTCCTTGCGCCTTCCTTTCGATTTTTCAAAATTAGAATTTCTTCACACGCTTAAGGTAATCATTATTACGTAATAAACTTACATCTAATTCTTATAATAATCATAATCTTCATATGTACTTAAATACTTTTATTGAGAATTATAATAATCATTCATTATGCTCCAAGCTAATTTTTTTAATTAATTGCTTGCTTATTCATTTAATATTACACGTAGTTAACTACCTACACGTATTCAACTCGCTTCGACCGCTCGGCCGCTCGGCCGCTCGGACAAAAAACCGGTTCCTTATCGCTAGCGACGTAGTTCTCATACCTATCTTGCAGTCAATTTGCATCGTAATAATATAATATGAATGCATCAAATAGGTAACTACTCATCACGCGCGGCTTTTTAGCTGTTTTCGGCGGCTGCTAAGCAAGTTGACGACGACCTTCGAGCTTCGTACAATATCTCTTTGTTAATTGCTCAAAAAGGCAAACCACATAACATCGGAGAAGAGTTAATATTGCCAGCAATAAATCAAGTTATAACTACAGTGGACCCCCGGTAATCCGGCCTCTGACTAATCCGGCGCCCCCTGTAATCCGACATGACAGAATTATGTTTGACAATTCTTGCTAATATCACGCAAGTTTGAACAGGTCACAACTCGTACGCGCCACCGCTATTGTGCTCGACGCGTATGCATTGTTTTACTTAGTTTGAATTTGACTACTAGTGATAGCGGTACGGCTTAGCGTACGTTCATTGTTTACTACTTATTTATTCATTGTGTATTAGGTATATGTAGTACCTAGTAATGTCGTCATAAACCCACAAGCGAAAGCACAAAACGTTGACAATTAAAGAAAAATGTGATATTTTAGATCGCTTAAATCGCAATGAAACTTTCAGTAGTTTAGCAAGTGAATACGGCGTAGGCCGATTTACAATTTATGACATTAAAAAAAAACCACGAGAAGAAGTTCGTGTCAACTACTGACTGCGGGCCAGGTAAGAGATAGACACTCAAGGAAGCTGAACATCCAGAAGTGGAAGAAGCTTTGTACATGTGGTTTCTTCAGGAAAGAAACATGCATGCACCAATTTCGGGACCCATGTTGGCGATGAAAGCTAAGTTTTTTTATAAGGAAATAACAAAAAAAGATGATTTTGTGGCCAGCAAAGGATGGCTAGAACGTTTTAAAAGTCGTCATGGCATACGTTTAATGACTATTACAGGAGGGAAACTTTCTAACGATGCCACCTGCATAGAGCCCTTTAAATTAAGATTTTTGCAAAAGGTGAACGATTTAAATCTTGGCCCGTCACAGGTGTATAATGCAGACGAATCAGGGCTTTTTTTGCGTGTGATGCCTAACAAAACTTTCGTTTCTTGTAACGAAAAAGACGTACCTGGACGAAAAGTGAGTAAAGAGCGTGTAACCATACTACCATGTGCTAATGCTGCAGGTACACACGCGCTTACGATGGTGGTCATTGGGAAATCTAATAAACCAAGGGCATTCAAAAACATTGATTTACCTGTACACTATTACGGACAAAAAAGTGCATGGATGACAAAAGACCTTTTCAAAAAGTGGTTTGATGAATGCTTGGCACCTGAAGTTAGAAAATGGTTAAAAGATCATAATTTTCCTCAAAAAGCGTTGTTGCTTCTTGATAACGCTCCCGATCATCCGTCTGAAGAAGAACTGACAACTGAGGATAAATGCATCACTGCGATGTTTCTTCCGCCAAATTGCACTGCACTGATTCAACCAATGGACCAGAACATCATTCAGTTTGTTAAGCAAGACTATAAAAAAAACCTACTTTTAAGAGCCGTATCAAAAGACCAACCAATAGAAAAAACTTTAAAAGAATTTAATATGAAAGACTTGGTTTTTGCTCTTAGTCAGTCGTGGAGTGCGTTACCGTCATCAACTATTAAATCGTCTTGGAAAAAGTTATGGCCAGATATAATCACCACTCC
TAGCAACGATCCACAAATCAGTGTAACTTCGGAAGTTATAGAACAAGTCTCTACTGAAACACAGATAAGTCCGGAAGATTTGGAAGTCTGGTGTCGTGGAATGGATAAAGAAGAAAATGTTTTTCTTGAAATGCCTGACGAAGATATTATAAAAGAGGTTTCTAATAATACAACAAACGATCAGGAAGATAACGACGACGTGATTGCAACTGCTCCACAAGTCACAGATCAAGACGCAGTTAACGCTTTTGAGCTAGGTTTTGTGACGGAGTAAAGCGCCATCTGTTGGTATGATGACGAAATCCGTAGAAAACGCGCTCATAAAAGGTGCGAAGAATTGATTATATTATGGGTCGCTAGTGAATGGCCGTCTAAATCATAGATGGCGACAGGATCGTGTCTCTTCGTGTGAAATTGCGTTTCGTTTCAGGGTCGGGGTGTGCAAATTGGCAATTTTCGGGTAAAACAAACTTCGTGGGGGTTCAAAAACATAAAATAAGGCACTAGAATGGTGTTGGCAAGCTTATGATTTGTGAATACAAAAATAAAAGGGATAAAGATTTTCTATTGTTATAGTTAAGATTTGTATGAACGAACGAATTTTTTGATGCGTCGAACGAAAACGTGTGAGCAAAGTTCTCGCCGGGGACAGGGTTTCGGTGATTTTCTGGAAACAGCCACCATGAGCTGAACAAAAATATCCGGGGGGAAGGATTTAATGTAGCAGGTCTGCTGAGACCAAAAACCTTAACTAAAATATTATGTTCAGCTCATTGAAAATATAAGTTTTATTAAGTCTTGGGAAAATCACAGGAGTCTTCCTTCCCGTTGGCAATGAATTCGTATAGCGACTAAATTTAATATTCGGGGGGGTGGGCCAGAGAGAACTGATATTATCAGGTAAGAAATATTTTTCACTTTACGGGACATTGTGCGGGGTCATTGACCACGCCGGTAGAACTTGACAATGACGTGTCATTTTTTTCGTTTCAGTGGGAAAAACAAGAAAGAAATATATAAGAATGAGTTTCGAGAACCTTTGAGAATGTAAAAGGGTAATTTATGAGTTTTTACGAGTTTCGAAGAGGTTGTACGAATCCGTCGTGACGTCGCGGGATTCGTGGAAGGCTTTAAGAAGATAGTCATTTGCCGGTTACAACATCCGGGAACGTCGCAAGCTGAGGCAGACGGAGTAGCCGTACCAGGTCAAGGGAGTCCGGCAGGACATATAACCGGGTAAATACCCAGACAAGGTCAGTCCTAACCTGTTTACCAAGCTTGCGTTGATCTTCGGTGTTATGGACGAGAACATATCTATACAGTGTTAATTTCGGGGGGGGGGGGGGGGGATTTTTGGATATTTGGACATTGGATCTGAACCGTGTTCGGATATAATTTAAAGTTTAGTGCTTAACGATTTATGGTGGTATTTTGTATGTGGAATTTTGTATTTTGTACGCGGTATTTTGGTATATTATGATACTTTGTGTAATTTTGTCCAACAGCAAATATTATGCTGTTTGAGGATTCTATAGTAGTACATGCTTAATTAAAGGTTTGGTTATGCTTTCTCTTACGGAGGTGGGATTGTGGGAAAATAAACAAACTTTCCGTTTGGTTGGTTAGTGACCGGTAGTGTGATTTGGACCCACGGGCTCTCAATTCAACGACTGAGATACCGGGACATTAGAGCCTTTGAGTCCGGTCCAAGTAACCCACATCTTCTTTCCTCCGTGGGACGAGAAAA\n>XM_029190890.2 PREDICTED: Osmia bicornis bicornis bromodomain-containing protein 7 (LOC114877834), transcript variant X1, mRNA 
\nCGTTTCTCGTCACTTTTAATTGTCTCGTAACATCATCTTGACATCGCCAGGTCGTCGCGTTATGTGCCGTCTTATATAAATAGTCGTTGTACTTCGTGCTGTACAGTGTGTTCCAAATGAGCTCGCTACGCGCCTTCAATTCAAACGTTTCGATTGTCGCTTTAGTGCGATATTTGTTTTTATGTTCGCTGATCAAATCATATCCGCGATGACAGCTCATTGCTACGTTATCAGGTGTTCTCATTGCATACTGTTTTCACAGCTTTTTGTACTTGAATGCATACATACGTTCATCGAAGCAACGGCAGAAGGGCACTATACAATCACGGATAAACCCCGTACCTTGAAGTTAATTTTAAAGGTGGGGGGTAGTAGTGGCACACCTGAATACGGCAACGAATCTCCAAGTCAAACAACAATGTTGTCTCAACATTTAGGTGTGTACCAGCAACAGTTGGGTCTCAACTGTTCCGTAACGCAGGAGTCTGAATACGATAGGTATTTGGGGCATAAGAAACTCAAGAAGAAAAAGAAAAAGAAGGATAAAAGACACAAGCACCATCATAAAGATAAGAAAAGACGAAGAGAAGAGTCAAGTCAAGAATCCGTAGGAGATGCGGATGAAAGTTTCGCAGAAGTCCCCAAAAAGATTCCTAATCACCAGTTGCTACCTCCTAGACCCCCATCGAGCGGAGAGCACAGAGTTGGCATTACTAGCCATATTAGCTCTCTGTCTCCGCATCGTGAGCCTCGAACTTGTGTGCTTCGAAAAATTGCCGAGCGTACACCCCTTCAACGATTGTTAGAACATCTTCTCAGGTCAATGGAAAAACGTGACCCACAGCAATTTTTTGCTTGGCCAGTCACAGATAGCATTGCGCCTGGTTACTCTCAAATCATTACTAATCCTATGGATTTCAGTACCATAAAACAGAAGATAGATGATAACAATTATCAAAATTTAAACGAATTTATAGACGATTTCAAGTTAATGTGTGATAATGCTACTACTTATAATCACCCAGATACAATTTATTACAAGGCAGCTAAGAAATTGTTACACGTTGGTCTAAAAATGGTTACACCCGAGAAGCTTCGTCAATTAAGACCCGTTTTAACTTATATGCAGGATATTTCAAGAGAGGAACTTGGATTCGAATTAGGTACAGAAGATCCTAACAATCCAGATGTTCCAGTAACGGAAGAGCAAATCGAACGGGAACGAGAACAGGAGGAGCGCAATGAGGAAGCGGAGGAACTTAGAAAGGAGAATCAGAGGAAAATGAGATTAGCGAATTTAGGTAAATTCGAAGCTATCCCGGACGATTTGACTCCTGAAGAGATCTTGAAACAAGCGCGAGGTGCTGCTAAAGCAGCATCCGAAAAGTTAACGTTGAAAAGGTTGAACTCGAAGATGGGTTTCCTTAGACAAAAGAAAGATGGAACTACTAGTTTACAGATAATAGTACCCGGAGATGGAGTGATTCCAGGAACCAATCAAAGACCGGTATCGTTAGGTCAACTGATAGGAAAATTGAATCATGGTACTGGGGCATTAGCAGGATTTCGTGAAGACAGGAGAAATATGTCTAAACCAGTAAAACCTTTATACTACGGTGCCTTTGGCTCATACGCGCCAAGTTATGACTCTACGTTTGCCAATCTTACAAAAGAGGAAACAGACTTGGTGTACCAAACGTATGGCGATGAGACGGCTGTACAATACGCGGAATCTATTTTAGACTTTGCTAAAGACTGTGATTATACTCTGACTATGGTCGACGATTTACTGGATATATTGACAGGAGGTGATCACAGAAAGACCAAGAAGTTCCTCGAGGAAAAACGAAGGCTCAAAGAAGAGGAGGAGAAGATAAAGCATTTACTAGAGAAACCTATGCAAGATATAATTCGAAATATCTCAACTGTTGACAACGTTAAAGTTGATATTGATCAGTTGAAAACACTTTCAGAGCTAGGAATCGATGTCAATTTCTT
GGAAAATCTAGATGTTGATTTAAAGACCACTGAGGAACGTACAGCCTTGCAAAGTCGTTTGGACGATACGTCGCAAATGTTGAATCGTTTGAAGCAGGTACAACACGAACGACTCTCGGCTCCACCACCCCCTCATTTGTCGAATGTTCCTAAACCATCAGAAATCGAGGTGGCGATAGCTGACAAAATCACAGACAATTTAACGGAAATAGCTAAGAAGCTTCCTCCTTCGGCTATCGCACCCGTGGAAGGTTTGAGAAAGGCCATGGGTATAGCACCTCTTGGAGGACCAGAGCCTATGGAGGTTGAACCTATCACTCATAACCCGACTATCGTCGCAGAAAGTAATCTATTATCGCAAGCTAACGCTAATCAAGTTCCGCCGAATTTGTTGCCAACTCCCTCACCGATTCCAAACACAAATTTACTCAGTTCAACGACTAGCCAACAAGCTCAACCGATCAGTATCGTGAACGCGAATCAGCCACCTATTCAAATACAGATTGGCATGGCGCACAGTCAGACGCCGCCATCTTTACTTGGTACGACAGAAACATCCGCGGTTCCCGATTTGGAAACCGAACTTCGTGAATTTCTAGAGAGCGATCCTACGTTAGGACACTCCCCTCTTCACGACGATAAAACATTGGAGGACATTTTATCTGAGTCTTAGTGTGTACGATTCGCGATAATATATTTTTCGTTTATATACCTCCCACAGGTTGTACATTTTTCTTACGTATCAACAGCAATAGGTTTAATGCGAAAATGCGTACTGTTTAATAAATATAAGGTCGTGTCCCCATATCGTGTTGTCATGCAATCAACACCGTGCTTATTTTATATAATTATTTATGAAGTTTGCGTAACAAATAATATTAATGGAACACTTGTAAAATTTTTATGAGATACACATGTAATGCGGAATATTGTTTCATTATAAATGTTGAAGAGATTTTAATGAATTATACCCAAAGATAAATCAAATGGAATTTACTTTATTCTTACTTTTGTTTTTAATCCTAAATTTTGATGTTAATCGTTTGTCGAAATGTTACGCAAACGCAAATACGTATTTTAAGAGCAAGGAAAATACTTTGTATTCGAATAAATTCAGACTTTTCTGTTGCACA\n>XM_028730195.1 PREDICTED: Podarcis muralis actin binding LIM protein 1 (ABLIM1), transcript variant X39, mRNA 
\nACAGTTGCCATAGATATGCCATCTTTCCCCAGTCTAAACAGTTTTGGGAAGCTTTGTGGATCAGGGAAAAGCAAGAGGTTGGTGTCTGAGCGGATAAAGTACAAAAACTCTATCAAAAGGATGTCTATTATAGAGGACGGTGATATTGCTGAGGTCTTGTACCTCATCCCCAAGCAGTCTGTGATGAAGCAGCTGCCATACCTGAATCCAGATGACTACTATTTGTGTGAATGGTTGTTTGATTATCCAGAAGGTTCAGTGGCACATCCTCAGGAGCCTCACCATTCCACAGAGAAGCCAGTCATCCACTGCCATAAATGTGGGGAGCCATGCAAAGGAGAAGTTCTTCGGGTCCAGGCCAGGCATTTCCACATCAAATGCTTTACCTGCAAAGTGTGCGGGTGCGACTTAGCTCAAGGTGGCTTTTTCATTAAGAATGGAGATTACCTTTGTACTGTGGATTACCAGCGGATGTACGGGACCCGATGCAATGGCTGTGGGGAGTTTGTGGAAGGAGAAGTTGTAACTGCTCTTGGGAAGACCTATCATCCTAACTGCTTTGCCTGCACTGTATGCAAACGTCCTTTCCCACCAGGAGACCGGGTTACCTTTAATGGAAGAGACTGTCTCTGTCAAATGTGTGCTCAGCCTATGTCATCCAGCCCAAAAGAACTCTCCAGTTCCAGCAATTGTGCAGGCTGTGGAAGAGATATAAAGAATGGACAAGCATTACTAGCACTGGATAAGCAGTGGCATCTGGGATGCTTCAAATGCAAGGCCTGTGCAAAAGTCCTGACTGGAGAATACATCAGCAAAGATGGTGCACCTTACTGTGAAAAGGACTATCAGGTTCTCTTTGGTGTCAAATGTGAAGCATGCCACCAGTTCATCACTGGGAAAGTCCTAGAGGCAGGGGACAAGCATTACCATCCAAGCTGTGCACGATGCAGCAGATGCAATCAGATGTTCACAGAAGGAGAAGAAATGTACCTGCAAGGTTCTACAGTTTGGCACCCTGACTGTAAACAGTCCACAAAGGGTGAAGAAAAGCTAAGGCTGTTTTCACCACCTTGTATAATGAACTCCATCAAAAAACTAAGGCAGCCTACAAGAACATCTTTGGAAAGTATTTATTCCAGGCCTGGATCCAGTATACCTGGCTCACCAGGCCATTCAATCTATGCAAAAGTAGACAATGAGATCCTTGATTATAAGGATTTAGCAGCCATTCCCAAAGTCAAGGCCATTTATGACATTGAGCGTCCAGACCTAATTACTTATGAGCCCTTCTACACTTCCGCCTACGAGGAGAGACAGGAGAGGCAGAGTCTTGGAGAGACTCAGAGTTCAAGATATGGCAGTTCTCCTGTGCACGATGAAAGTTCTCCAAGGACACTCTCTCCAACTCCATCTGCAGAAGGATATCAGGATCTTCGGGATCGGATGATACACCGGTCTACCAGCCAGGGGTCCATTGGTTCTCCTGTGTACAGTCGTCACAGCTACACTCCCACAATGTCACGTTCACCACAACATTTTCACAGACCTGATCAAGGCATCAATATTTATAGAAAACCTCCTATCTACAAACAGCATGTACTGTTGGAAGGCATGTTTTTGTAATTCCCTGAGCAATGAGCCAAGATAGCTGCTCCTTATCCATTAAAGGCAGGGATGGGAAACCTCCGATCTGGGCATCAAATGAGACTTCTCTTCTGGCCCTCAGGACTCTCCGCAAGCTACACACCCTCCTCAGTCACCCACCCCTGCTCCCCAGCCACACCATTCTAGGACTGATCTTGGCTGGCTGGAATGTGTCCCTTGCTTGCCTGGGTGGAGGATAGAAAGGGGTATATTCAGTATGTTTAGAAACTGACCTACTGTAAACAGGTTAAATCTACATTCATTGCTCTGCCCACTTTTGCCTGTGAGCCCCCCCACCCTTGGGAGGCTGCCTAGAAGGGAATGTGCCCTCAGTCTGAAAAAGGTTCTTCACTT
CTGCATTAAGACTTCACAGTTTTTCAGGAACTTTTCTTGTTCATAAGCCCCCTTTGAAATGAAAGAGAGCTGCTAGTCTGCACAGGATGAAACTCTTGTGCAGCTTTCATTTGTTTCACTTAAGCCTGTGCACAAGATATTTCCAGTTAGTTACATCTCTTATGAACAATTTTTATTATATTTCAAAATAGTAAGGGGGCTTCTGCAAGTAAACATCTTTTGTTTCTTGTTTGCTCTTCCCTAAAAATTCTACATTTTATTATAACTTGCAAACTTTAAAAAGTTAGTATTCTTTCACTCTGCTTTCTCTTCTTCTGGAGAATGAATCTAGTTAAGGTTTTAACTATGTAGTAGCATCTGATAAAGACTTTCCCTTCCATCATGCATGACTAAATAGTTGCAGGACTTTCATTTAAAAATGTACTTTAAGAAATGTTAAAAAGTCTTAAAATATCATGGAGTTGCAGTCTAAGGCTGAGATGGCCATGGTTTAGGGGAAAGGGTCTTAAGGGTCAAATTGAGAACCGTTCAGGGCCTGATTAGGTCCATTGGCTGGTGGTTTCCCACCTCTCCTCTAAGTGATCACAGGTAAAATGGCCAAATTCATTTGAACGGAGCATTAAAACATTGAAGTATATTTATATAATATGCAGATGGACAATCAATATCTGGATTTACCCTTTCTCTTCTTATGCAAGCATGGCCCTGTATAACTTTCTAACATTTTCTGATACAGGCCTCGGTTTTAGCTAAGTTTGTGACATCTGAAAATACTCTTTGGAGGCTTTCAGAAACACAAACCATAAAATAGTAAAGACACAAAATATATCTTGGGAAATAGTTTTTTCTAGTTCACATTCTTTTCTATCTTTTTTTAGTTGCTTCATACACAGTGGAATCAGCCTAACATTTGGTTATTGAAAACAGCAAAGGGTGAAACTACACTGTCATTTTGTATATGTAAAACTCTGCCCTGAGGTGATGTTTTTTCTTTGTTATTTACTGGCATTAAATCTGCCTTCTTCTTTTCAAATATACATGAATCTTAAGAACAGTTGCATGCATCTCATGGCGATGTTCCCTCATACATAATGATAGTATAATTTCACCCTAAGTGAATTGCCAGGATAAATATTACACTATTACTATACCTTGCTTTGGGATCAATTTCACATGGTGATGACAATGCTCTGAAGTAAACATCAAGGATGCTTAATAAGAGATTTAACCAAAATAAACTGAAGCTAATTATTATGTAGCA\n>XM_030853958.1 PREDICTED: Globicephala melas ubinuclein 2 (UBN2), transcript variant X2, mRNA 
\nGAGGAAAAGAGGAAAACTGAGCCACAGCCACGACGGTGGATGTGAGCGTCTCCTGTCTGCGCATGCGCCCGCTCAGCGGCCTGCTTCTATTTATGTGGGGGATCCAACATGGCGGCCGCAACGATCCTGGCGATGGCGGTGGAGCCCATCAGAACATAGTGGCGGGGAAGGGGGGACAGTCCGCACTCACGGTGGCGTCGGCGGCGACGGCTGAGGGTGGTGGAGGGAAGAAAAGCGACGGAGAGCAAAAGGAAGGGCAGGCAGGCAAACAACTCGGCGTAGAACCGAGCGCCGGCTCGAGCGAAGGCAGAGGGCCAGAACAGTGGGGATGGCGGAGCCACGCAGAGTAGCGTTTATTAGCCTGTCACCGGTGAGGCGGCGCGAGGCCGAGTTCCCGGGGGCCGAACGCGAGCCCGACTACCCTCGCGAGCCCCCCCGACTGGAGCCGCAGCCGTACCGCGAGCCGGCCCGGGCGGAGCAGTCGGCCCCGCGGGAGGTTGCCCCCCGGTCGGACGCGCAGCCCCCGCCGCGGGAGAAGCCGCTCCCCCAGCGCGAGGTCAGCCGCGCCGAGCCGCCCATGTCGCTGCAGCGCGAGCCCCCTAGGCCCGAGCCGCCGCCGCCGCCGCCGCTCCCGCAGTTGCACTTGCAGCCGCCTCCGCCACGAGAGTCGGCTTCCCGGGCCGAGCCGCAGCAGAGGCCGTCGAAGGAGACAGTGCGCCTGGAGCTGGTGCTCAAGGATCCCACCGACGAGAGCTGCGTGGAGTTCAGCTACCCGGAGCTGTTGCTGTGCGGAGAACAACGGCAGAAGAAGCCCATTTACATGGAAGACCCGTTCAATGATGATCATCAAGAGAGGCAAGAAGTGGAAATGTTGGCTAAGAAGTTTGAAATGAAATATGGTGGGAAGCCCCGTAAACACCGGAAGGATCGGCTACAAGATTTAATCGATATAGGCTTTGGCTATGATGAGACAGATCCATTTATTGATAATTCAGAGGCTTATGACGAATTAGTTCCTGCTTCTCTAACAACAAAATATGGAGGGTTTTATATCAACACTGGCACTCTCCAGTTTCGCCAAGCTTCAGATACTGAAGAAGAAGATATTACAGACAACCAAAAGCACAAGCCACCCAAAATTCCCAAAATGAAAGAAGATGATATTGAGATGAAGAAGCGGAAGCGGAAAGAGGAAGGGGAAAAGGAGAAGAAGCCAAGGAAAAAAGTACCGAAACAACTGGGAGTTGTGGCTCTAAATTCACACAAATCTGAAAAAAAGAAGAAACGTTATAAAGATTCTCTTTCTCTAGCTGCCATGATAAGAAAATTTCAAAAAGAGAAGGATGCATTAAGGAAGGAGTCTAACCCTAAAGTCCCAGTGAACTTCTCGACCTCCTCTCTGCATAAAACCCCCTCTGCTGCTGTGGCATTGGGGAATGATGTCTCGGACTTAAATCTGAATAGTGCTGATCCGGACCTCCCCATTTTTGTTAGCACAAATGAACATGAACTATTTCAGGAAGCTGAAAATGCCCTAGAGATGCTAGATGATTTTGACTTTGACAGATTACTGGATGCTGCTTCTAATGGTAGCCCCCTGTCTGAGTCAGGAGGAGAGAATGGAAACACCACCCAGCCAACCTATGCCTCTCAAGTTATGCCCAAGGTGGTACCTACACTCCCAGAGGGTCTGCCTGTCCTTCTTGAAAAACGTATCGAAGACCTCCGTGTAGCTGCCAAACTTTTTGATGAAGAAGGAAGGAAAAAATTCTTTACACAGGATATGAATAATATTCTTCTGGACATTGAGTTACAGCTGCAGGAACTAGGCCCTGTCATTCGTAGCAGTGTCTACTCCCACCTTGAAGCTTTTGTGCCATGCAATAAAGAAACACTGGTAAAACGTCTAAAGAAGTTACATCTCAATGTCCAGGATGATCGTTTAAGAGAACCTCTGCAAAAACTGAAACTGGCTGTTAGCAATGTCATGCCTGAACA
GCTATTTAAATACCAGGAGGACTGCCAGGCTCGTAATCAAGCTAAGTGTGCCAAGTTTCAAACAGATGAAGAACGAGAAAAAAATGGATCTGAGGAAGATGATGATGAGAAACCAGGGAAACGTGTCATAGGACCAAGGAAGAAATTCCACTGGGATGACACCATTAGAACTTTGTTATGTAACCTTGTTGAGATCAAATTGGGATGCTATGAGTTAGAGCCAAATAAAAGCCAGTCTGCTGAGGATTATCTTAAATCCTTTATGGAGACAGAGGTGAAACCATTGTGGCCTAAGGGCTGGATGCAGGCAAGAATGCTTTTTAAGGAAAGTCGGAGTGTACATAATCATCTTACTTCTGCTCCGGCAAAGAAAAAGGTGATTCCTGCACCTAAACCCAAAGTGAAGGAGTGTAGTCCAAAAAAGGACCAGAAAACTCCTGCATCCTTGGTGGCTTCAGTTGGTGGCCCTTCAACGAGCTCTAGCACATCTGCTGTGGCCTCCACCAGTTCTAGCTCTACACCGGCCCAGGAGACGATCTGCCTTGATGACTCACTAGATGAAGAACTTTCTTTTCATCCACCTGCACTGGATCTTGTTTCTGAAGCTTTAGCTGTTATCAACAACGGGAACAAGGGCCCTCCATCTGGCTCAAGGATAAGTATGCCAACTGCAAAACCTCGTCCAGGACTGAGAGAGGAAAAATTAGCAAGTATCATGAGTAAACTGCCACTGGCTACTCCCAAAAAACTAGATTCTACTCAGACCGCACATTCATCAAGTCTTATTGCTGGCCACACAGGGCCAGTACCAAAGAAACCCCAGGATTTAGCTCATACTGGCATCTCTTCAGGCCTTATTGCTGGTTCTTCAATTCAGAACCCTAAAGTTTCCTTAGAACCTTTGCCAGCCAGGCTACTTCAACAAGGACTACAGAGGTCAAGCCAGATTCATGCTTCTTCCTCTTCGCAGACCCATGTCTCCTCTTCTTCCCAAGCCCAAGTTGCTGCCTCCTCTCACGCTCTGGGAACATCAGAGGCCCAAGATGCTTCTTCGTTAACACAAGTAACAAAGGTGCACCAGCATTCAGCTGTCCAACAGAACTATGTGTCTCCATTACAAGCAACTATTAGTAAATCACAGACCAATCCAGTGGTGAAATTAAGTAATAATCCCCAACTTTCCTGTTCATCCCCACTTATTAAGTCTTCAGATAAGCCACTTATGTACCGCCTTCCCTTATCTACTCCCACACCTGGAAATGGTTCTCAAGGGTCCCACTCCCTGGTTTCTAGGACAGTACCTAGCACCACTACCTCCAGTAACTATTTAGCCAAGGCAATGGTGTCACAAATCTCCACGCAGGGTTTCAAATCTCCCTTCTCAATGGCTGCATCCCCAAAACTTGCCGCATCTCCGAAACCTGCCACGTCTCCTAAACCCTTGCCCTCACCTAAGCCTTCTGCCTCACCCAAGCCCTCTCAGTCAGCTAAGCCTTCAGTATCAACTAAACTTATTTCTAAATCCAACCCAACTCCCAAACCTACTGTATCCCCAAGTTCTTCCAGTCCAAATGCACTAGTGGCCCAGAGTAGCCACTCTAGCAGTAACAACCCAGTCCATAAACAGCCCAGTGGAATAAACATCAGCAGACAGTCTCCCACCTTGAATTTATTGCCCTCTAATCGCACTTCAGGCCTTCCATCTACAAAAAATCTTCAGGCCCCTCCAAAGCTAACAAACTCATCATCCACTGGAACTGTCGGCAAGAATAGCTTGAGTGGAATTGCAATGAATGTACCGGCCAGCAGAGGTAGCAACCTTAACTCAAGCGGAGCTAATAGGACTAGTCTATCTGGGGGAACAGGAAGTGGAACACAGGGTGCTACTAAACCGTTGTCTACTCCACATAGACCATCCTCTGCCTCAGGGTCGTCAGTGGTAACAGCCAGTGTGCAGTCCACAGCAGGAGCATCATTATTGGCTAATGCCTCACCTCTGA
CTCTCATGACATCACCTTTGTCTGTAACAAATCAAAATGTGACTCCTTTTGGGATGCTGGGTGGCCTTGTTCCAGTGACCATGCCCTTCCAGTTTCCCTTGGAGCTACTTGGCTTTGGAACGGACACAGCTGGAGTGACAGCCACCTCGGGATCTACCTCAGCCGCTTTCCACCATAGCCTAACTCAGAATTTACTAAAGGGTTTACAGCCAGGAGCTCAGCATGCAGCAACACTTTCCCACTCACCTCTGCCTGCACATTTACCGCAAACATTTAATGATGGAGGCCAAAGTAAAGGGGACACTAAATTACCACGGAAATCTCAGTGACTTCCAGCAAGCAAAGGAGATGACACACTTGGCTGGCTGATGGAATCTACCTGATGGAAAAGTACTCATGTGGTCATAGGGCTGCTGTTCTGTCGATGTTTACATTCTCTCGTCCCAAGCACTGTGTTTCACCAGAAACCCCAAAGGCTGAGAACAAAACAGTAGGTGCCAAGTCCATCCACATTCTAAAGGGAAAAGGAGCTAGATCACCTGTGCGCCACATGCTAAGAGATTGTGAACTAGATACTGGGAAGCACTGGCTCAGTGCTGGGAAGGAAGAGCTCGGCACCCACCTTCAGGCTCTGTGAGAGAATGTGAGAAGATTCCTTTGGAAGCAGCTGTCAGTATGCTGGACGTTTCCATTCCGCTCCCCAAGCAGGAGAGGGTGGAGGTGCTTCCTCTTCACCTCATGCCAAATGAGGAGGCTGCTAGAGGACCATTGGGAGAGCGTGACACATCCTGTGGAGTATGAGGGACACAGAAACTGGTGTCTGACTCACTCCTAAAAGTCTAAAGACAAATGAGGAGTAGGTGGCTAGCTCCTGGAGAAGACAGAAAAGGAGAGAAGGCTGCAATGGGAATGGTTTACACTCCCAAAGTTTCCGAGTTCCTGTGGGCCTGATGTGGTTCTCAAGAAAGGGAGCCAGATTTGGTCATTTTAAGAAGGAACCCAGCCAAAGGGAACACCTGGACGGATGGAATGACCTCAGTGGAGGGGAGGCTCCTGGAAACTAAGGGGCCGGGGAAGGAATTCTAAGTAACTAGAGAAGGCATGGCCTACAAGGGAACTACAGCTGAGAGATCCCCAGAGAAGGAGAAACTATTGAGAACCTATAAAAAAAGAAGCAACACTGGAATCTGCTGCTCCCGGAGGACACGGACACCAGCTTATCTCTACCAACAAAGAAAGCTGTGTGAGCCACCCACGATTTCATGCCGGAGAGGAAGAAATCCACAAGCAGCAGTGGAAGGAGGAATAAATTGCTCTCTGCTTGTATCTAGCAAGTCCAGCTTGCTGGGTAATAGTCACCTCTACTTCTGAGTATTATAATGTACTGCAGTCTATATGCTACAGGATGTTATCAGTAAGGTTAATTTGCTTAAGAGTAAGACATTTAAATGGCAGAAACTACTATGTAATGGGAAGTAAACGACATAAAAATCTGTAAACTACACAGATGGAATGATTATCTTGCTGAAAAGTATTTACAAGAGTTGTCAAACTTAAAAATTACCTATTTTTCTTTTGCAAAAGAGGCAAGTGTTTCTCATTTGCTGTCCTCCTCTGTGATGACAAGAGGGTATGAGGAGTATGCTGCTGTGTGGTCTGCAGTCTGGTTTTTGGCAGCCAGCATTCATTCCCATATCCTTATGTATTACAGGGGCTAGATTTATGGAAACATTCCCAAACTCCTTGCCTTCAAGGTTCTGGATGTGATTTCTTTCTGCTAGATGTATTCATGAGGTATTTTGTAGGTGGGAGGAAAAAGTGATATTTTTTCTTCTGGCAGCACCTAGCAAAACGGGCAGGCCATGGGAGACTTAAAGTTCTGCCGTAGCTCCCAAGTAATCTCCTATCAGCCCCTACGTGAGCACTTGGGGACCAGCTCTGATCAGCAGTGGGGGGACCTGTATTTTTCTGACCTAGGTGATAGCAGCAACCTCCCAATA
CTCTGAACTGCTGAACGTTAGTGGCAGCTTTCCTTAACTCCTGCAGCTCTTCTAATAGTGCCGTCAAGCGTCTACTGAATTGAATGCCCTGCACTCAGTTCCTTTCTGCTTGAAAAGCCTGCAGTGGTTTCTCTTTTTCTGACTGAGCCCTGATGGATACAGGTGCATAGCTGATCTTCTGAAAGAAATGAACATACTTAATGGGTCCTTTTAAGCTAAAAGTGATATTTTAAAGCTAAGTGAGGCACTGACTGCCTTTTTAAAAGAAACTCAAGCAATGAAGAAATTTGAGAATGGATGTTTAGAAATGTTTTATCACTATGTGATTTTGTTGTCCCAAATGATGTGTTAAACCAAGATTTTCAAAATAATAAAACATACTGTATTACATTGCATTTTCAATAAAATAAAGAATAATAATCTTTCTTTACTGAGAGAAATTAGTACTTTTTTACTGTTAATAAATAAAATAAAAATATTTTCAAAA\n>XM_011942543.1 PREDICTED: Colobus angolensis palliatus ADP-ribosylation factor-like 2 (ARL2), transcript variant X3, mRNA \nCGTCGGCGAGCGTGATAGCCAATAGGAACCGGGAGCGGGGTCCCGGGACTGGGAAGAAACGGCGGCCGGGAGGGGCTCCAGGGACCATGGGGCTCCTGACCATTCTGAAGAAGATGAAGCAGAAAGAGCGGGAGCTGCGACTGCTCATGCTTGGCCTGGACAATGCTGGAAAGACAACCATCCTGAAGAAGTTCAATGGGGAGGATATCGACACCATCTCCCCAACGCTGGGCTTCAACATCAAGACCCTGGAGCACCGAGGATTCAAGCTGAACATCTGGGATGTGGGTGGCCAGAAGTCCCTGCGGTCCTACTGGCGGAACTACTTTGAGAGCACCGATGGCCTCATCTGGGTAGTGGACAGCGCGGACCACCAGCGCATGCAGGACTGCCAGCGGGAGCTCCAGAGCCTGCTGGTGGAGGAGGCCCTGGAGCTGGACTCCATCCGCAGCCACCACTGGTGCATCCAGGGCTGCAGCGCCGTCACCGGGGAGAACCTGCTGCCAGGCATCGACTGGCTCCTGGATGACATTTCCAGCCGCATCTTCACAGCTGACTGAGCCACTCCAGATGTCCCTCCACCTAGCAGTCCAGGTCCCCCAACCCTCACCAAACACTATCCATGGGGGCATGGGAGTCAGCCAGCCAAACTAACACTCCCCCTCCTCCATCCCAACCTGCTGCTGCTACTGCTGCCCGCTGCTGCTCTGTGGCCACCCAGCTCCTGTGGCGGGAGGGCTGTGCCCTGGCTGTTTCCCTGGCTCCTGACCTGGCCTTTGGCTACCATACCAAGAAGAGAGGACTGGGCGGGGAGGAGCTGCTACTGCTGCTACCGAGGCTGTGGGCCTCATCCTTCACTCAGCGGTGAAATAAACCACTCCTTGCCCTGA\n>XM_021957819.1 PREDICTED: Prunus avium uncharacterized LOC110756391 (LOC110756391), mRNA 
\nATGCATTGACTTGGAGTCTTTGATAACATTGACTTCGGGTCTTTGAGTCCATGAAAAACCGTTCGCATTTTCCATGATCTTTCTTTCTGTCTGTGACCCAAACCTGCTTCCCGAGTATATTCCAAAATCGCCATTTCAACCTCGAAGTTATAATCAATTTACGAATCAAACCATCGGTTTCAAAAAGAATCATCAACGCACCGCTCGTTTGTTCATTGTCGCGTTACGATTTTCCATTTCAATTGGACGCTTTGAAACTGCTCATACTCGAAGATTTTCCGGTTTTTGAGCATTTCATTTCATTCCATTGGGTTAAGAGTTGGAATGGGGGTCGTAGGGGCGACGAAGCATTTGGAATCATCGAGAATAATTGCTGCGCTTGATGTAAGTCATTCTGAGGAAAGACTGGGACAATTTACCATGGAAAATGGTGAGTTATTTTTCCATACCAAGTCAACTAAGTTCAAGAGGCAGATAGTATCTGCTGTTCGTGATTTCCCCCCGGGGTGTGGACGATTTGCTCATTTGAACTCTTTGAGACATGCTAAGGATGCCACTTCTGTGGGTACTTCAACAGAAAGTTTGCTTAGTGGGGGTAAAAATGTTGGTGGACATCGTGGGGTTGAAAAGCTGATGCTCTCAAATGGTCAGGGAGACGAGACTGACTTGATGAATGGTAATGATGTGGATTCTGTGGAGACAGTTGAATCAGTAAGCGCCTTAGAGCATGAAAGATCTGATTCTCTGAAGAATCTACTTCAGTTAAACAATTCGAGAACTGTTGAAGAGGCAGCTTCTGTTGGTACTGAGGAGAGTTTGATCAGCAGGGATACTAATGTTCATGGAAAAAGGGTTGAAAACTTAATGCTCTCAACTGATCATGTGCATGAGACTGACTTGATGAATGGTAAGGCTTCTGGTACTGTGGAGACAGTTGAACCTGTGACAGATTTGGAGCATGAAGCATCTGATTTGCTGAAGAGTATGCATCAGTTGTCAAACAATTTGAGACCCGTTGACGAGATAGCTTCTGTTGGTACCGCTGAGTATTTGCTGAGAAGGGGTAAGAATGGTGATGGGCAGGAGATTGATAAGCTGATGGTGTCAACTGGTCAGGTGGATGTGACTGTCTCGATGATTGGTACGGCTTCTAGTACTGTGGAGACGGTTGAATCTTTAATGGCCTTACAGAATGAAGTATCTGATTTGTTGAAGAACCCATATCAGCTTGGTGTGGCTACTCCAAAGGAAGAGATGGTTGCTGTTCTTTCAGATAGAAATTTTTGTTCGCCACGTGATGGATCCATTTCTGTTTCTATTGGAAATGGTCTTGAGAAGACTGCAGCGAAGAAATGTCCTTCTCGAAGACTAGTATCAGCTGTTCGGGACTTCCCTCCTCTCTGTGGAAGAAATGCTTGTAAGTTTGGTCAAGTGAAGTCGTGTATGGGTGATGAACCAACACAATCGAACACAGCGAAGACTAGTGTAAAACAAATAAGAGAGGATTTTCAAGAAGAGTTTCATAAGAATGAATTGGGAGGGAATGTTTCTGAAGTTATTAGAGACAAGGTTCAACCTAAATGCAAGGGGCATGCTGTACAAGAAATGGAGAGACGGGATAAATGTAAACCAAGTTATAAGCTGAAGGCGGTTTGGAAAGATACAAGAGAAAAGTGCATTGAGAAAAGTCCGCAAGAAAGTTCACAGCTTCCGTCGAATAGAGTAATTGTGCTGGCTTTGATGGCTCCGTCAAATTCTCAATTTAGGAAGGGGAGAAGGGTCCGCAAGCATATACCAGATTGCATTTGATGAAAGGAAACGAAAGAAACTTCGTCTTAAATGTTAGCTAGAAAGACCTAAAACTGCTTCCAGGACAGAAAAGGCAGCTAAACTCATCAGAACCATTCATCAACAAATGAGCCTTCAAGTTTTGACGTGGAGGTTGAACGCTGACATTTTTCAATGAGCCGGCTGCCCTGTTTTTGCCTAAAAGCTAAA
ATGATCTGTTATTGGCACTTTGAAAATTACACGTGGAGGAGCATGATGACTTTTGTGGAGTGCCAATAACAGCTTCCGTTTTTTTTATTTTTGTAAAGTGAAGTATGAATCCTGGAAGCATGCTGTGGAGCATCACAATAGGAGTTGGTTAATTGTTACATCTGTTCTTTTTTACACCATGAAAATTTCCCCAAGCTACGGATTTCTAGCATGAAATTTGGCTTTA\n>JF936918.1 Taeniopygia guttata clone F5CD66-14 T cell receptor alpha chain (TCRa) mRNA, partial cds \nATTGCTCGAGTAGAAAACTCAGCAAACACGCAGCTCGCTCTCGGCATGCACCTCGCATGTCTCATCCTCAGCGTCCTGCTGGCCCAGCTCCTGGGCACCTCGGGGCAGGACACGGTCACCCAGAAAGATGGAACCGTCACGGTGAAGAAGGGACACCCCTTCCACACCACCTGCAAATACCAGGCCAGTAATTTTGGGGGATTGCTCTGGTACCAGCTGCAGAAAGGCCAAGCCCCACAGCTGCTCTCCTATCAAACAGGGACCGGCCGCAAGCACAGCGGCCGGATCACCACGTACCTGAACACCACGGGCAAATCCAGTGTCCTGCAGCTGGAGGAAGTGGAGCTCTCTGACAGTGCCTTGTACCTCTGTGCTCTGGTAAATGTGGCAGCCAGAGTCATTTTTGGCAAGGGGACGGTGCTTTCAGTCCTGCCAGAAATTACTCCATCTCCCTCAGTCTACAGGCTGACCTCCAAAGATGACCAGGGTCTGGAAATGTGCCTTATCACAGATTACTCCCCTGAGAAGCTCACTCTGAACTCAGCTGAGCAGCACACATCTGCTGTTGTGGAGGTGGCAACCATGGAGAACAGCGAGGA\n>XM_041785118.1 PREDICTED: Cheilinus undulatus N-sulfoglucosamine sulfohydrolase (sulfamidase) (sgsh), transcript variant X2, mRNA 
\nGTTGAGGAACTGCGCTGTGTTTTCTTAGATTTTAATGTCAGCTCTATCAGTCAGTAACTGTTCACCATGCATTGATTTAAACGAATACAATGACTCTATTTAAATGATGTATTTATTATGAGTTAGACGAAATGTTTAAAATCATAACCAGCGCAGTTTTTCAGCCTTTATAGACAGGTTTTAGGGAAGGTCTGAGAGAAAATCATCATGGTCAAGCTGCTTTTTCTCATTTTGGCATCATGTTGCATCGGAGAGTCAAAGAGGAGAAATGTCCTGTTAATAATTGCTGATGATGCAGGCTTTGAGACGGAGGTGTACAACAACTCTGTGGTCCATACTCCACACTTACGATCTCTGGCCCAGCGCAGCCTGGTGTTCAACAACGCATTCACATCTGTCAGCAGCTGCTCCCCCAGCCGCTCCACCATCCTCACAGGACTTCCACAGCACCAGAATGGCATGTATGGGCTTCATCAGGGTGTTCACCACTTTAACTCGTTTGATGGAGTACAGAGTCTACCGCTGCTCCTTGGCCAAGCAAACGTACACACAGGTATAATTGGGAAGAAGCATGTAGGTCCTGGATCTGTTTACCCGTTTGATTTTGCCTACACAGAGGAGAACAACTCTGTGCTACAGGTGGGAAGAAACATCACCCGCATCAAACTTCTGGTCCGCAAGTTTTTCCAAACCCATAAGGAGGAAGACCATATAAAAGATGAAGAGAGGTCGTTTTTCCTCTATGTTGCCTTCCATGACACCCACAGATGTGGACATTCACAGCCTCAGTACGGGGCTTTCTGTGAGAAATTTGGAAATGGTGAAATGGGAATGGGAAGAATACCTGACTGGACTCCAGAGTATTACACCCCAGAACAAGTGAAGGTTCCTCCTTTTGTGCCAGACACGCCTGCAGCACGAGCAGATTTGGCTGCACAGTACACAACAGTTAGTAGGCTGGACCAAGGTATTGGTCTGGTCCTGCAAGAGCTCAGGGACGCTGGATATGAAAACGACACTCTGGTCATCTACAGCTCAGACAATGGCATCCCTTTCCCAAACGGCAGGACTAACCTGTATCACTCTGGGACTGCAGAGCCCATGCTGGTGTCCTCTCCAGAGCACCGGGAGCGATGGGGCGACATTAGCCAGGCCTACGTCAGCCTGCTAGACATAACTCCCACCATTCTGGACTGGTTTTCTGTCCCCTACCCGTCCTACAGCCTCCCCGGCAGCCCTTCAACCCCCGTCCACCTGACTGGGCGCTCCTTACTGCCCGCCCTTGTCTCTGAGCCCAGCAGCTGGCACACGGTCTACGCCAGTCAGTCCCTCCATGAGGTTACCATGTACTATCCAACCCGCTCTGTCCACCAGGGGGCGTACCACCTCCTCCACAACCTTCACTACCGCATGCCCTTCCCCATTGACCAAGATCTGTACGTGTCACCCACCTTCCAAGACCTGCTGAACCGCACCCACCTCAGAGAGCCCACACACTGGTTCAAAAGCCTGCAGCAGTATTACTACAGAGAGCGCTGGGAGCTGTACGACTCCAGGGCAGATCCACTGGAAACAAAGAACCTGGTATCAGACCCCTCCTACAGCACCGTGCTGGAGAGCCTGAGGCAGAGTCTGCAGAAGTGGCAGTGGGAGACAGGAGACCCCTGGGTCTGTGGACCTGACTACGTCCTGGAGGACAAACTGGAGCCGCACTGTAGACCACTCTACAATGGACTCTGATGATATTTGTACATTTCTGACCGACTCAAAGTCTGCTTAAAGTGACACATTCTTCTAATGAAATAAATTACTTTTATAGGCATTTGTATTATATTAAAATGTTGCTGCTTTGTTCAGAAATAAAAAAAACTTGAATTA\n>XM_026823756.1 PREDICTED: Diaphorina citri dipeptidase 1 (LOC103509407), partial mRNA 
\nGCACAACGATCTACCGTGGAACATTCGTAAGTTCATTCACAATCATCTGGTCAATTTCAACCTCTCCTCGGATCTCAGTGTGACGGAGCCGTGGTCCAAGAGCAGCTGGTCTCACACCGATCTGCCTAGACTGAGAAAAGGTATGGTAGGAGCCCAATTCTGGTCGGCCTATGTGCCATGTTCGTCACAACATATGGATGCAGTACAGATAACAATGGAACAGGTGGATGTTATACGCAGGTTCACGGAGTTGTACAGCGACGACCTTAAGCTGGTCACCTCAGCACAAGAAATCCGAGCGGTCCATCGGGAGGGTAAAATCGCCAGCATGATAGGCGTGGAAGGTGGCCATTCTTTGGGGAACTCGATGGCCGTTCTGCGCATGTTCTACAAGCTCGGGGTCCGATATTTGACCCTGACCCACGCCTGTCCTACACCATGGGCCGGATGTTGCAGTTCTCTTTTCTCTCCCTCCCCTGGTTCCCAGCTGGTGGTGCGGGAATGCAACCGGCTCGGCATGCTCATAGACCTCTCCCACACCTCCGTGCAGACCATGCGACACGTCCTCAACATCAGTTCCGCCCCTGTGATTTTCTCCCACTCGTCTGCCTTCGCCCTCTGCCCTTCTCCCCGAAACGTGCCCGACCCTGTGCTCAAACTAGTGGCCTTAAACGACGGAATAGTAATGGTTAGCTTCTACTCTCTGTATCTCACCTGCAGTCTGAACTCCAGTATAGATGACGTTATAGCTCATCTGGATCATATCAAGAATGTAGCGGGTGAGGATCATGTAGGTCTAGGTGCTGGATATGATGGAATTAACTAG\n>NM_001168050.1 Saccoglossus kowalevskii cripto-like protein (LOC100313583), mRNA\u0001GU075970.1 Saccoglossus kowalevskii cripto-like protein mRNA, complete cds \nGGCAGAATAAGCTATATAAGACATCTTGGCGTTATCTGGTCACTTGTAGCGTGGACTCACAACTCCGCACACTCTCTATCATAACCTTGGATCTTACACTGTAGTCTTCCCCAGTACCCTAACTTTGAGTTGACCATGAATTGTCACCTTGCCAATTTGTTAGCAGCGATTTTACTGCTCGTGATGGTCACTAACGTTTCGTCAGTAAGTCTAGGAGAATGGACTAACACCCGATCTTCCGCCAACATCTGCCATAACGGAGGGATAATGATCCTTGACAGTTTCTGCATATGTCCCATTGGATATGGTGGTCAATACTGTGAAAGCAAGCCTTGTGGCGCAGTTGCCCACGATGAAAAACTCACCGTACAATGTAATACCTGTCTGTGTCGAGACGGGAAACTCTACTGTGTACCACTGGGATTCCCTGCTTGTGAAACTACAGATGAAGTGATTATTGTGATTACGTCAGCCCCGATCACCACCAGCACCTATGCGCCGACGGAGGCCGAAGACGTCATAATGTTTTCTTACGGTGAATTCGAGGCGTTGTCATCTGTTGCAGCAATCACTCCCCGTTTTATACAGTTAGTTCTGCCCGCATTGGTGTTGCTTATGACACTGTGGACATGAGTTGCATATCTGAGAAAAGGGACAGCGAGGTTTATTGGATCCAGGCAATGATAGTTCTGATAAGACGACCGAAATCCCCGACTTCGCGGATTTACAACCATACAAGATGGTAGTTTACCGTCCAACAGCCCGGATAGGGTGATTGAGAAATAACAGTGGACGCACTCCATGTTTCCTCTGGGCCAAGAGGCAATACAGTATACATTCAATGTATCTTCCTAATTCAGGCATTATGCTGTTTAATTGTGATACAAACCGGGAAATGTACTAGGGCCTGTGCTATTATATTATCATCAGAAATTATGTTTATATATGCAGTATTGTGAGTTGTATTGTAAGTTGTATTGTAAGTTATTTGTAAATAAGCTACATA
TATTTGTAAATTATGCATTTTTATATGAAAAAAATAACAAAAGACAATACAAATATAGAGGAATGAGATTTTAATAAATAATTTAACATAATTATGTAATTTTATATTTTTAAACTGGGTATCACTAAATAAAATCATAAAATCACAAAAAAAAAAAAAAAAAAAAAAAAAAA\n>XM_053452891.1 PREDICTED: Spea bombifrons zinc finger protein 217 (LOC128471049), mRNA \nAGAGAGGATGAGAGCCTCACACCCAGGAAGTGCTTTCCCAAAATGACTAGAAGAAGAATAAGAGGCAGCAGGTACAGCGGCCAGAGGTAGCCCCAGCTCCAAGTGATGGACCTTTTGGGTTTCCCATGACGATGCGCAAATTCAGTCCTATTTACATCTGAAGGAAACGTGTGCATTGTTCAGGGGTTCTTCTCTCATCCATTATAACAAAGGATACATACCAATGTCTTCACAGAATTGACAAATGAAGAATTGACAGCTAATCTTCTCTGGAAGGAAACTACGAGCAGTACTTGAGATCTACAGTGGCATTCACATGTATGTGTCTTTAATTGCCCACAGCTTTCCTTATGTTCCTAAGGAACTTCTAACTAAAAAGTTGGCCCGCAGCACTGGAATTCTAAATCTGGCAGCAACCATGCCGGTTCAATCAATTTCCGATGGTTCTGATGTCTTGGGTACTGGCTTTAATTCCCAAATGGAAAGTTCTCATTCATCATTGGCACTCCAGCCTGCAAACACCCTTTCCAATGCAGCATTGCATGAAAAATGTTTAATGCAGACAGAGGGGGACATGCTGTTCGATTGCATGTTTTGTGACAAAACCTATACCTTTCATGAAGAACTTGGGAAACATGTCTTGGTCCAACACAGGCCAATACTGTGTGAGCCAGCCGTTCTTCGTGTGGAGGCAGAGTACCTCAGTCCCCAAGATAAACGCAGGAAAAGTGGAGAGCTTTCAACGAACGATGAACTTGATGAAGCTGAACATAGACTAGGCTTTGACTGCGAAGTATGCGGCCAGACCTTTAATGATTCTTCAGATGTGGAAGGTCACATGAAGAAGCACAAAGATTCGTTCACGTACTCTTGTGATATCTGTGGACGGAGATTCAAGGAGTCGTGGTTTCTGAAGAACCACAAGAGAACACACAGTACAAAGTCTGGAGGCAAAAACAAGCAACTGATAATCAGCGAGATGCCTATGACCATTAATGAAGTGGTATTGGAGCAAGTGGACAAAAATGTCCTGTGTCCTTACAAGCTGTGTGTGGTTTGTGGATTCTTTTTCCCCAATAAAGAATGCTTAATGGAGCACAGTAAGATACACCTTAAGGAATCTACCTCATCCGAAAATGGCTTAAATGAGCTGCCACCTCCAACAAATAATTCTGTACAATCTGAGGCTAGCGAAAATGCAAAAGGAGATGCTTCAAAAGAAGCCTTAATGAGGATGTTAAACTTACAACCTAGATCTGCAGGACCAAAGAACGCTGAAACATCTAGAAGATGGATTGGGGCCTTAGATCCATTCAACACCTACCAAGCCTGGCAACTGGCTACCAAAGGTAAAATTGCACTTGCCCATGGTAGAGTTAAAGAACCTTCGCATGAAGTAAACTTTCATATAGATCCATGTTCGGACAAGGACAAACCCAGTAAACTTTGGAAAACGGGAAAGGTTAGTCGTGCTGGAAGCACCCATCAGACCAAGAGTGAGGTCTGCGAAGGACACACGACTTCCCAGGATGGCCAACATGTACATCTGCAAAACGAAGCCAACGACGTGCCTTACGTAGACGACAAAGACAGGCCAACGTTTTGTGACGATTGTGGGAAAACGTTCAAGACCTACCACCAGCTTGTGTTACATTCACGAGCGCACAGAAAAGAGAGGAGCGATTCCGAATGTTCCGCGATGAGCGGGGAAGTCCTCTTGCCTAAGGTGGCCTCG
CCGGATATCGCCAGCAGTTTGGAAGACGCTGATGCTATGAAAATGCACGATGATTCCGAGGATGGGTCAGAAGATCCTGGAGGCGATCCTACACAGATTGATGATAAAAATGAAGACGATCTAGAAAGGGGGAAAGCAAAAGGCCTCTCTGTATCTCGGAACTGCAGTTATTGTGGAAAGAGTTTCCGCTCAAATTATTACCTCAATATTCATCTCAGGACTCACACAGGTGAAAAGCCATACAAATGTCAGTTGTGTGACTATGCCGCAGCACAGAAGACCTCGTTAAGATACCATCTGGAGAGACATCATAAATTTAAACCAGGAGATTCCAACGCCATGGTGAAAAGCATCAGCAAAACCGTACAACTCGCTCAACAATCTGGCGAACATGCGTCTCTTACTTCCAACCTAACAGAAACAAAACCTCTGAAAAAGCTTGAGGCAAACTCTAAAGAGGAGAGCCCACCATTAAAACCGAAACGTGTTTCTTCTTCGCGTAACAAGTTTGTGACCGCAGCTCAGTCTCCAGAAACCGAAGAAGCCGTCGTTGATGGATACCCAATCTTTCCAAACGACTCCAATGTGAAAGAGCTACCTCCTTCCCAATCTGTGACCAAAGACAATGTGCCTGTTGATATGGAAGTTGACCGAGAAAGCCATACCACCATGGATGAAAGCTTTGCCGAGCAGGGTCATTTTGAAATCACTCCTATGCTGGCCGAGGAGTTGGTCCTATTAAACTTGTGTTTAAAATCGGATAATGGCCTTTCAGCACCTCTGGATACCAATGCCTTGCTTTTTAAGACCTGCCCTTATTGTACTTTCAAAACCTTGCACCCAGAAGTGCTGGAAATTCATCAGAAATTGACTCACAAACCTAATCTTGCCGAGAAGAATGGCGGCAAACTCAAATCTGTGCTGAATGCCATTAAAAAGAGGCGTACCGGCTGCCCTCCTGCACTTAACGGAATGGACATTTCTCCTGCACCTTGCAGTGGTCTTAAAGCCAAAGCTCCTCTAACGCAACCAAAAACCCTCAACAATGAAAAGGTGAAACGGGCGGCTTTTTTGCCTGCGAAAGCCGTGCCCTTGGATCAAGAGAATGCAATGCTTGCACATAAACACAATGGGGCTTTGCTGAACAATTACACGTACGTGCAACCTGACTTACAAGGAATTTCTCACCTGCTTGAAAGGATGCAACCGCCTGAACCAAGTAGGGCTTCTTGGAATGCGCCAACTACCAGCAGGGGGAATTCTACCGCTGCAACTACAGAATACGCCTATCAGACATCCCAGGCCTGGCCTGGCGCTCAGAATCTGTTTGCCAGACCCCTGAACTCAAATCACGAGCCGTGCCCAAAGAAGGCCAAGTTCAATATTACGACAAAGGATGACATGTTCAAAAAACCGCTTCCACTTGGGCATACTGGGATGTTTCCACAAGATATGGCAGCGGCAACTGGAAGCTCATTGCTACCTAACAAGGGCTATAACACCTGTGAAGCTGGTTCTTCAAAAGCAATGAAGCCTCCTGCCCAAAGCACTGCTAGATTTGCATGCGTTAATCCGGGATCTACCTCCGCCACCGACGGAAGAAGTCCACCATACCGTCGTGTATCCAAGAGAAGCTTGACACCAAATGATAAACGGGTGTGAAGGATACCCTTTGTTTAAAAAGGGTAAGCAATGATTTGCTGTTCTTTGAGCCACTGTAGCGTGAGTGAGTGTGGGATCGAGTATTGTATAAAAGAGAAGTGGAGCGATTCTATCCAGCTGCGAGAGCCTGTCTC\n>XM_039175744.1 PREDICTED: Hibiscus syriacus profilin (LOC120166485), transcript variant X2, mRNA 
\nAAAAGACAGAATTTCATCAACGGAAAAATAATATATTCGAGAGAAGTAGAGGAAGGAGAAAATGTCGTGGCAAACGTATGTAGATGATCACTTGTTGTGTGAAATCGAAGGCAACACTCTCTCTGCCGCCGCCATCATCGGTCAAGACGGCAGCGTTTGGGCCCAGAGCTCCAATTTCCCTCGGTTCAAGCCAGAAGAAATCTCTGCTATTATGAATGACTTTGTTGAACCTGGATCACTTGCCCCCACCGGATTGTACCTTGGTGGCACAAAATATATGGTGATCCAAGGAGAAGCCGGAGCTGTTATTCGAGGGAAAAAGGGGCCTGGAGGAGTTACTGTTAAAAAGACCAATCAAGCCTTGATCATCGGGATCTATGATGAACCAATGACTCCTGGCCAATGCAACATGATTGTTGAAAAGCTCGGTGATTATCTCATTGAACAGGGTCTTTAATTTATTTAGCTTGCCTTAATTGTCGCAGTTCTTCTTGGCTTCTTTTTTCTATACGAAAGTGCACCTGCCACCTCCCGTAATAATGGTTGGATCGAGTTAAAATAACAGTATTAGTAGTATTAAAAGTCAAGGGGAACCTTTTTCCAGAAACAATAAGCTTGATGTTTGTAATAGTGATATGCTTGTGATCCTCTTGCTTTGTTTCTGTTCTTGTTTGATGAATGGTATTGTCAAGATTGTGGAGCGAGGTACTTTTGTCTACATTT\n>XR_004882887.1 PREDICTED: Helianthus annuus uncharacterized LOC110916910 (LOC110916910), transcript variant X15, ncRNA \nTTGTGTACTCTCCCATGGTTTGTGGCCCATCTTCTCCACTAGGCACGGTTGCTAGGACGTGGGTAGAATGCAGTTGCCCAGTGGTCTTATATAATATAGACCCTTGCATCCAAATATTCACCTCCATACATCTTTCAGTTTGTAGCAGATATGATATATGCACATAAATAAACACACCGTTGGTACCGCGTTCTTCAATCGTGATCTCAAACTTACATTCAATTGTTCTTCATTCAAGATCTGCCCTTCTCCTCTACTCGCCGCCGCTGTTGTTTGAGTCGGACATCGGCGCCGCCTCCGTTCTACACCCTTTTGTCATTTAACACACCCTGGCGCCACAAAATTTCTGAAATCAATCACAAGGTCGTTGATGTTCTTGGATAGGTTACTATCTCAGTTAAGGCTTAGTGGAGATAAATTATTAGTTGCAGAAGATCCTAAAGAGAAAGACATATCAACTTGAAAGTCCCAAGTGAGAGGAGGACAAAGGTCATTACTTGAGGCTAGCAATCTGATTGTTCTCAAGGGATATAAAAAGTAGTTGAGTGGAACCCATACACTAAAATTACTAAGTACTAATTACACTAGATAATGTGAGTTTGGAAGAAGGGGGCAAGGGGCCATGTGTAAGCCACTTAATGCTGGTATCCATGCCTATAGGCGTGTCGATATCAACCCAGACAATAAAGTTTCGATCTTTGGGGATGGACCCATCTCCACTTTTACACGGCAGGCTGAGCTCACGGTACTGGTTGGTTATTTTGGGACACAACAAAGTATGCCATGAATGGTTCAGCAAAACTTGATGCCAATCTTCAAGAGATATTTTTAATGGAAATTTGAAGGCTATTCAGGGATTGGGATAGTTTCAATAGCACCAAACCATGAGGGCTACTAACGGGCCAACCAACCCAACCCTTCTGAACTTGTGCAGAATTCTTGCTTGAAGCAATAAATGGACTTCTTTCGGACACCAGGTTTCAAATATGGCATTCAGAAAAGTGTACCCGTTGTCTGGATGAATACCCACCATTGTCGAATGAATCATTTGTCAATGAATGATGGGTATTACGTTCTTCAAGAAGGCTTTTGTAATGGTGTCAATCTTGATTCTGTTAGCTCTCAAGGTTGCCTATTATTTGAGTATATGG
AATGGAATCAGCCTTGGGGTAGAGAACCTTTAGCTGATAAGGTTAAGCCTTGCCACACGCCATCCTATTTACGAGGGTTACGCCTTGCCACATGCCATCCTCCGGTTAGATCTAGCAGGACGTTATCTAACCGTCTGGTTGATGAGATTCTACCAGAACGTAGAACGTGGGTATACATTCACCAGAACCGCAAAACGGGAAATTGTTAGAGACATGAAAGAAAAACGGGCGTACATCGCTCTAGACTATGTTAGAGACATGAGAAGAGTTTCGAACTGCCCGGCGAGCAGGTCATTACCATTGGTCAACAATGTTAATATTCCTAAGAATCAATCCAGATTCTTTGAGCAACAATCAATCCAGATTCATATTTCACTAAAGATGTAAACAACTACTTCCAATTCTTTAATTTGCAAATAGAGTTTGAAATTGTTTATTAGTTTGATTTCATAAACTTGAAACGATACCATCATACAGATTCTAATCATTGTATTT\n>XR_007968113.1 PREDICTED: Xyrauchen texanus putative uncharacterized protein FLJ46204 (LOC127624086), transcript variant X2, misc_RNA \nCACACACACACACACACACACACTCACACACACTCACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACATGTTGTGTTTCCATGTTTTATGGGGACTTTCCATAGACATAATGGTTTTTATACTGTACAAACTTTATATTCTATCCCCTAAACCTAACCCTACCCCTAAACCTAACCCTCACAGAAAACTTTCTGCATTTTTACATTTTCAAAAAACATAATTTAGTATGATTTATAAGCTGTTTTCCTCATGGGGACCGACAAAATGTCCCCACAAGGTCAAAAATTTCGGGTTTTACTATCCTTATGGGGACATTTGGTCCCCACAAAGTGATAAATACACGCTCACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACACAGGCTGGTGATTCTCAACGGATGGGTCTCAGGTCTCATTTAAGAGCAGACAGCAGGTTAAAACAATTCAATGCAACTAACCATATAATCATTAATAGACAAGATAGAGAAACAAATAGACTTTATCGACTTTTGAAAGGTTGGAGTAATCACTTCCCATATCAG\n>XM_026403930.1 PREDICTED: Urocitellus parryii CUGBP Elav-like family member 3 (Celf3), transcript variant X37, mRNA 
\nATGAAGGAGCCGGATGCCATCAAGCTGTTTGTGGGGCAGATCCCGAGGCATCTGGAGGAAAAGGACCTGAAACCCATCTTCGAGCAGTTTGGTCGGATCTTCGAGCTGACTGTCATCAAGGACAAGTACACCGGGCTGCACAAGGGATGTGCCTTCCTGACATACTGTGCCCGCGATTCAGCCCTGAAGGCCCAGAGTGCCCTGCACGAACAGAAGACGCTTCCAGGGATGAACAGGCCGATCCAGGTCAAGCCCGCCGACAGCGAGAGCCGAGGAGACCGGAAGCTCTTTGTGGGGATGCTAGGGAAGCAGCAGACAGATGAGGACGTCCGGAAGATGTTCGAGCCCTTCGGGACCATAGATGAGTGCACTGTGCTCCGGGGGCCAGATGGCACCAGCAAAGGCTGCGCCTTCGTGAAGTTCCAGACCCATGCTGAGGCCCAGGCCGCCATCAACACCCTCCACAGCAGCCGGACCCTGCCTGGTGCCTCATCCAGCCTGGTGGTGAAGTTCGCTGACACCGAGAAGGAGCGAGGTCTGCGACGCATGCAGCAGGTGGCCACCCAGCTGGGCATGTTCAGCCCCATCGCCCTCCAGTTTGGAGCCTACAGCGCCTACACCCAGCTGATGCAGCAGCAGGCGGCCCTGGTAGCGGCCCACAGTGCCTACCTCAGCCCCATGGCCACCATGGCTGCCGTGCAGATGCAGCACATGGCCGCCATCAATGCCAACGGCCTCATCGCCACCCCCATCACCCCCTCCTCAGGAACCAGCACCCCTCCTGCCATCGCTGCCACGCCCGTCTCTGCCATCCCTGCTGCCCTGGGCGTCAACGGCTACAGCCCGGTGCCCACCCAGCCCACTGGGCAGCCTGCCCCCGATGCTCTGTATCCCAACGGGGTTCACCCCTACCCAGCCCAGAGCCCTGCGGCCCCCGTGGACCCCCTGCAGCAGGCCTACGCAGGGATGCAGCACTACACAGGCCCAGCAGCCTACCCGGCAGCCTACAGCCTGGTTGCGCCCGCGTTCCCGCAGCCTCCTGCCCTAGTGCAGCAGCAGCAGCGAGAAGGCCCTGATGGCTGTAACATCTTCATCTACCACCTGCCCCAGGAGTTCACGGACTCAGAGATCCTCCAGATGTTTGTCCCCTTTGGCTTTGTGAGTTTCGACAATCCGGCCAGTGCCCAGGCGGCCATCCAGGCCATGAATGGTTTCCAGATCGGCATGAAGCGCCTCAAAGTCCAGCTAAAGCGGCCTAAGGATGCCAACCGGCCCTACTGA\n>XM_034920330.1 PREDICTED: Acipenser ruthenus E3 ubiquitin-protein ligase TRIM52-like (LOC117972083), transcript variant X1, mRNA 
\nCAAACATCAGAAACAACCATAAATCTAGAGGACCACTGTCACTGTCATTGTGAAATACACAGCGGGAAATGAACTGACTCATACTGAGACTGAGAGAGAGAGAGGAATTGAAATCAGCAATTAAGGTTTGAGAGATTTTCAGCCTGTCCTCAACATAATGATGTCATCGTCTCCGGAGGCGGAGCTGGCGGAGAGCCTGACCAATGAGGTGACGTGTCCCATCTGCCTGGAGCTGTACTGCGACCCTGTGCGGCTGGAGTGCGAGCACAATTTCTGCCGTAGCTGCATCAGTAAGTACTGGCTGCGGGGCGGGGAGGAGGGCAGTGCCCCGGAGGGGCAGAGCCAGGCCTTCACCTGCCCCCAGTGCCGCGAGATCTTCCCCCAGCTCCAGCTCAGGACCAACCGGCTGCTCTGCAACATCGTGGAGCGCGTGCGCAAGCTCCGAGTGGACTCCTGGGGCACGGCTTCGGCCTCTCCACCAGAGGGCAGCGGCGCAGCAGAGAGGGGCACTCCGGCGGGGTTCTGTGCGAAGCATGGCGAGAGACTGAAGGTGTACTGCCAGGATGAGCAGGTGGCAATCTGCGTGGTGTGCGCTGTGTCCAGAGATCATAAAGACCACAGCATGGCACCCATACAAGAAGCACTGCAAGAGTGCAAGGAGAGGTTTGAGTCGGCGCTGACTGAGTTTGAAGAACAGAAGGAAAAAATCCGGACTATGCACTCGAAACACGAGAGAGAGCTGAATGACCTAAAGGACTCTGCTGCCTCTCTTGAGAGGGGGATCTGCTCCCAGGTGGAGGAGCTCCTGCAGTTCCTGGAGGCTGAGAAGAAGGCGCTGTGCTCCCAACTGCAGGCTGACCTGCGCAGGCTGGAGCAGCAGAGAGAGGGGGTGCTCAGCGCAGCACAACAGGAAGTGACCCACCTGCAGCAGGACGTGACCTCACTGCAGGGCAGGCTGGCAAGGGAGGGGCTGGAGAAGGATGGGCAAGAAGTGGGCGACGCCCCAGCGCTAATTAAGGAAAGTGACTTCCTGTTTTTTTTTATTATTATTATTATGGAAGTTTATGTAAGTTTGTTAGCGTGAAGGATTGCGATTCTTTTAACTTTTGAGCAGCTTTTTGGCTGGATTTGAAAGTGTGTATACAGCTTCATACCTGCAGAGGAACTGAACTGCTTGACTCAGTTTCTTCTAGTTTCTGTAACACTGATGAAGGCACTCGCTGAAACGCTTGTCTGC\n>XR_007189094.1 PREDICTED: Ursus arctos uncharacterized LOC125282004 (LOC125282004), transcript variant X1, ncRNA 
\nTTTTTTTTTTTTTTTTTTTTAACACAGATAGAGACAGCCAGCGAGAGAGGGAACACAAGCAGGGGGAGTGGGAGAGGAAGAAGCAGGCTCATAGCGGAGGAGCCTGATGCGGGGCTCGATCCCATAACGCTGGGATCACGCCCTGAGCCGAAGGCAGATGCTTAACCGCTGTGCCACCCAGGCGCCCCGGAAATTTAAATACTTTTAACATATTTTTCCAGTTCCTTGGTCCTTCTCTCCCCAGTCATTCAATGGGAAGTAACGTAGATTTTTTTAAAAATATTCAAATTATACGTACATATATATCTATCTGTGTATACGTGTGTGTATTCAAATTAAACATACATATATGTATATATGTATACATATATATGTATATGTGCATATGCATGTATTGTGTGTATATATGTACATGTATGTATGTACACACACGTTTTAAGTAACTCTTGTATTATAGGAGATCCACTGTTTCCCCTTAGGATCAGATTTTGAATGTGTTCAGTTGTTGCTGTTAATTATCTTTCCATCTGTTTATGATGTTTAGTTTTCCTGCTTTTAGTGACCACTCTTATTATCTATAAGATGCATGGAAAGACTGCATCCCAGAAGAGCAGTAGTCAGTATTATAATGGTTTTATTTAATTAACTGAAAAAGGTTTTTTTCCTAAAATAATATCTTTCTAGGAAGTTAAAAAAATGTTCTCCAGAATACCTTCTATCTTAATGGATTGAAGGCTGCAGGTACAGGTAATTTTTTAGATTTCAACCTTTTATGGGGCTTAAGTTGAAAATGTTGTATAGTGTTTCAGCTTATAATTTTGCCTACTTTTCAAATGTAGTACACTAAAGGGCATGACTGTGGGACTGGTAAGTTTTGAGTTGCTTTTTTACATTTGCTCTTGGAGGTGTGCAGAGGCCTTATAAGGAGTTTCAGTTTGGGAATTAGGAACAGACAGACTGTCCTTGAGGTAGGTCAGGATCTGATCTTCTTCTCAGGTCAATTAAGGTCCCTCAGTGGGACAGGCGGAGGCAGGAAGGTGCCCACAGTTCGTGTCCCAGGTGAAATGGATTGCCAGCCGGTTGCTCCTTTTGTCTTGGTTGGGGTGTCTTTTCCAGCACGGCTCCCGACCCGCTCCCCAGTCTTACCTGTTAGCCACTTGTAGACTTTGTGATGCTCTGTGCATTTAGCTGTAAATGTTGCTTCATCTGTACGTGTTTTTCTTCTGTTGACCTCCTCAGGGATTTTAGATTTATAAAAAGTAAAATGCCCGTTGCGTCTTCTGGTTTGGCCACTGTTGATTGTATTAGTTAAAAAAAGATTTGAATTGAGAAAGGTTTGACCTACTCTGAAAGGATAAAGACATACTGAGAATTAAGATTACATAGATTGTCAGCACATTAAAAAAAAGTACTTCCCTTTTGTTGGTTTCAAATAACAGAGTGAATCTGAGATAGGGCTTCAGAAGCCGGTTTAGAACTGGATCTTGGCTTCAGATCCCTGAATCCCTCGTAGTCCGCCCAGGATGAGATAACCCTGTATGAGCAGGGAGGTAACTTCCTTATGGGAGGACGTGTCCAGTCAGGGGTCCCTGCAGCCAGAGAGTCATGGATACATCCGAGTCTCCGTATTGTTTATACTGAGAATCTGTCAGGATAAGTTATGATGAGACCTACCTGCTCACCTCTGCACCAGGGGAGCTGCACCTTTGGTGAATTGTAATCTTGATTCTGGATCCCTTCTCAAGACATTCATGTGAACATTTTTTCCCAGAGTAGCCTGTGCTATAATGTGTGTAATAGAGCAGTTTCCTGGAGCATTGCACGGGTGGGAAATGTTGCTTCTTTCTTCATTTTGGTTCTCTCAGTTGTGGATGGCTTGCCTGGCAGACATGCAGAAAACATCTGTATACTGCTGAAGTTGTTCTGCCCCCACACTTTCCTTTAAAACTCTCTGGATTCTGATTGGCTCTACACGTTAAACATACTGACTTCTGATTA
CGGGCTTAGGGTGTGTGTGACAACGTTGTATTTACAGTGCTGCTTCATCTTTAACTCAGTTGGGTGTTAGAAAAATAAATGTGTGTGGTAGGTGTTCCCTCAGTTCTTTTAAAAGACTTTTTGTGGAAATTTTGGAAAAATTGGATAATGAACCCTTTTTCAACCTTCTGCCCTTGTTTGTCCTATTTCTTCTCTCCCAGACTTTTGTTTCCTGGGGTATTTTATTACTTTTAAAAATTTTTTTATTTTTTAATATTTATTTATTTGAGAGAGAGAACACAAGTAGGGGGGAGTGGCAGGCAGAGGGAGAGGGAGAAGCAGGCTCCCCACAGAGCAGAGAGCCCCATGCGGGGCTGGATCCCAGGACCCTGGGATCATGACCTGAGCTGAAGGCAGACGTTGAACTGACTGAGCCACCCAGGCACCCCAGATTGACTCCTTTCAATATGATTTATTGCCCAGTTTGAGGTATACTATGTGTGTCAGAACATGCCATCTAAAACATACCTGTCTATATGCAGAAAGTCAAACATAATATAATCATTATGTAAGATAGTGTTGTTCCCCAAGTACTACCATTAATAACAAAGTTCTAGCATTTTTTTCAAATGTTTAAGAATTAAAATATACCAGGATAATTAAGAATAATGTTTGGCTCTTTATTTAATTCAGCCTGAGGATAAACCTGAAAGATTAGGGGCCTTAAGATATTTTTCTTTTTTTTCTTTTTTTTTTTTTTTTTTTTTAAGGATTTTATTTATTTGTCAGAGAGAGTGTGTGCGTGCGTGCTTGAAGGGGGAGTGGCAGGCAGAGGGAGAGCAGGTTCTGTGATGAGCAAGGAGCCCAATGAGGGACTCGATCCCAGGACCCTGAGACCATGACCGGAGCCAAAGGCAGACACTTAACTGACTGAGCCACCCAGGTGCCCCTGTTTCGCTGGAGTATTTTAGAGCTAATCCCAGACATTGTATAAAGTTTCACCCATGAAAGTTCATTGTATGTCCCTAACAGATAAAATATATAACCATAATACCTTTACCATGCCTCACATAGTTAAAAGTAATTTAAAATCTTTTCTCTCAGGGCACCTGGGTGGCTAAGTCGGTTGTGTGTCCAACTCTTGATCTCAGCTTAGCTCTTGATCTCAGGGTTGTGGGTTTGGGCCCTGTGATGGGCTCCACACTAGGTGTGGAGCCTACTTAAATTAAAAAAAGAAAGGAAGAAAGAAGGAAAGAAAAAAGTAATAAAATCTTTTCTCTAATAAAACTCGGTAATGTTTAATTTTCAAATTTCCCCATTTTTTTAAAAAAGTCTTTGACCTATCAGTTGGCATATCTCTAACATTTCCCACTCCTGCCTTGCACCCTTTCCGTTTTATTTTTAAATAACAGCTTTTGTTGATGCTCTGGAAGAAACTGTCATTTATCCTATAGAATCTCCCACATTCTGAATTTGGCTGATTGTATTATGTGATGTCATTTAATTCATAAAGTTTAAAACTGGTTGCTAGAAGTCCAGCTAGAATGAGCTTCAACTCTGGGGGTAAGAATACTTGCTGTTGGCTTCACCTCTTAGGGACGGTGACATTAATCATTTGTTCAGATGGTGGTGTGATCCTTCCACCTTGTGGCTTTTGTGGGTGTTGATGGTGGCTGCCTGGGTACTTTGTATCAGAATTGCAGACACGGTGACGATCTGATTCTGCCTTCTGTATTTGTTTGCTGGAGCCCGTGCAGAAAAGGTGGGATAAATGGATAATTCTTGTATTTACTAGCTTCAGAATGAGTTTGTTCTCTACAAGTGAAAATTATTTTTAGTCTCATAAATGCATAGATGTTAAGATGACCTATATATGTGTATGTGTACACACATACGTAGATGTTAATTTACAGCATTCTTTCTGATGGTCAGATTGCCCTTCAGAGGTATCTTCTGTGTCATATGCAGACAATGAATCATTGCCACTAGATCAAAAACTAATGACGTACTGTATGGTGACT
AACGTAACATAAAAAAAAAAAAAAGATATCTTCTGTGTCCTTTGGAAATGGCTCCAGTAATGTTTTTATAGTTTTCTTGTTTATGGGCACTATAAAATAGTTTCAGACTCAGTTTGTACCCTTATTGCCGCAGACCTGAAACCAGCCATCTCTCTAAGGAGCCTTGATTCCTTGTCACGTTTTAGTGGGAAATGGTGTTCAGGGACTAGAATCTGGATACTGTGATAGGTAATGCTGGAATCTTATTTCTTCTGGGCTTTTTTAGGGTATAGAGATAGGAAGTGTGTATTTTTCAGAAAGAAAAAAAGTCATGAGTTTATCTCGATACTTCCAACTTAAATTTAAGATTACAGTGGGGCGCCTGGGTGGCTCAGTCAGTTGGGCACCTGCCTTCTGCTTGGGGTCATGGTCCCAGGGTCCTGGGATCTGCCCTGCGTCGGGCTCCCTGCTCAGCGGGGAGTCTGCTTCTCCCTCACCCTCTGCTGCTCCCCCTGCTCGTGCTCTCTCTCTCTCTCTCTCTCGCTCTCAAATAAATAAAATCTAAAGTAAAAAAATTATAAGATTAAAATGGTTTACTTCTTTGATTTTATGTTTGTATGTCATTTCTCTTTTGCTTAAAATCTTGGTTCTTAACACTAACACGTTTGTGTCATTGCTTCATCATTCATGTCTGTGAAACTTGCGTGTCATTTCAGAATAACAGTGCCAGTGTTGTCACTAACAAGACCTCTGAACGTGTTTGAACGTGGTTTCTCTGTTTCATCTTGGTTTCAGTGATGCTATTACTAAAAGCAGTGTTAGACTTCATTATAGCTCTTGTACGCCATAGGGTGTAGCACACTGGGATGTACGGTCAGATTACAGCTCCGCGCTGAAGTTACACCACGCTTTGAAAGTTAGGCTTATTTCTTTCGTTTTTGAAGGGTAAGGAGCAGTGGGAACTCTCAGACACAACTGATGGGAGTATCGTTTTGTACGTCCACTTTGGACAGTAGTTTGGTGGCACTTACTACAGTGGAACGTGCACACTGGCCTCGTGGTTCCGTTCCAGGTGGACACACAGCAGAGATGCGTGCACGCGTGTACCAAGAAACAAGTGATTTGTACTAGTCCCAGACTGGAACGGAGAGAGAACTGGGGTACATTCATATGATGACGTGCTCTCCAGCAGTGACTGTGAAGCTCCAGGACACAGCGTGGGTGCTTTTCACAGCATACTTTGTAAAGAATGGCTAAGCCCCAAAGGATACATACTGTGTGATTTTCTTGTAAATTAAAAAAAAAAAGGATGTTTTTGAGTCTCCATGTTCTAATGTACACGCGTGCATATTTCTCAGTGTAGCTCATCTTGACCGCTTTATTTCACGCTGCAGCCTGCATTCCCCTGCGCGCCCACTTCCTGTCCCTCCGACCCTGCTGAACTTAGTAATTTTTAAAATAACACCACTTGACAATATACCGTATAATTTAGTTATTTATGATTTTATTGTTGTCTGTCTCGCCTAATAGAATGTAAACTCCATGTGGGCAGAAAAAATGTGTGTGTGTGTGAGAGAGAGAGAGAGAGAGAGAGAGAGAGCTACAGAGTCGGTGGTAGCTGGTTGACGCCATATTGGTAGCTTGAAACCGAACAGGGTGGGTGTATTTATACCACAGAAATCAGCACACACCACAGAGCGGGGCTGCCCCCACTGACTCCGCACAGAGCCAGTTGTTACACACTCACCAGGGCGTCCTGGTGCACATCTCTGTCTTTGCACACACACTGAGGTAGGGATTCATGGTATCGGAACAGTGCCCGGCATGCAGGAGGTGCTCACTAAATTCTGAGGTGAATTTTATTATTGAAGAAATGTTGAGGTGCAAATGGCAGAAACTTACACTAGCTAAAGTGAAAAAAGGGAATATATCATTTTATGTAACTTGGAGTGTATTTAACGAATAAGTTACCGGTTGGTATCTGGAAATAAGTCTCTAGAAAGTCAAATGAGAAAAAGAAG
TACCAATAAATCCTAAAGGAACTGTAACTACCGTGGAAAATAAATAAGTCTAATAGTTCTTTGATGTAGCCTTGTTTAAAATTACAAGAAGTTAAACATCAACTCCCAGTCCGCCCAGCGCCGCCAGCCGCACACCCGCTGGTAGTTGCTGCATCCGTCTTTCTCCCCAGCCCTCGGCAGCCGACCACTGAGCTCTCTGACCCACAGATGTGCCTGTTGTGCACATTTCATGTGATCGGAATCCCGCATCCCGTGCTCTTCCGTGTCCAGCATCTCACTTAGGCTTCCATCCACGTGGGAGCACGTGTGGGCACCGTCGCTTTTTGTCGTGAGTGACGTGCAGCCGTGAAGACGCTGCGTTTGCCTCTGGGTGTCCGGCCCGCCGGAGCGTGCGAGCTGCCCTGGCCTCTGGCGGCAGTCGTGTGCGCGGAGCCCGGGTTCCACTCGTTCCCCAAGTTGACAGATACGTGGCAGAGGTGGACGCAGCTGCGGAGGCCCAGCCCAGCTTCTCGGCTCTTCACCCTCTGAAGCTCTCGCGGCCTCTCTTGTCCCCACTGCCTCAGCGGCTCTCTGAACGGTGTATTTTATGTGCTTTTCACCATTTTCTACTGCCAGCTGTTGCATCCGTCTTGGATTCAGAAATCTCACGTCTCTTTTTTTCATTTTACCTGTTAGAGACTAATTTTTTGATTTAAAAGAAGGAGGAAGGAGGAATGTTTTAATAAGTCAGCCATTTACAAATGTCCTTTTGTGTCAGTCTGGCCCTGATGAGGTTCAGCGTGGCTTGCGGAGTGGAGGCATTGCTGCTGTCAGTCAGGCCCTTTGGACCGAAGTAAGAAGGAAAGAACTACGATTTCTGCCATGTCAGGGGACATGGGAATATCCACAATCAAGCATTGATTTTGCTAACAGATTTTTAGGACTTACCTCCTTTATTTAAATTCAGACATTTATAAGTCATCGAGTTTTCTGGTCTAATGTAAAAAATTCATTATAACTGTTTCAAGTAAGATAAGGCTCTGACAGTTGAGTTACTGTAGTTCTGGTCCTTGAAAAAGAAACGTTAAGTACCTTTTTTGTCCTCAGAAGAGAACTTTAAAAATTGAGTGATTGTATTTAAGATGCATTGGGCAGAAATGTTTCTAGTTTTACAGACCCCTTAGGTGATAAGGCCTGGACGTGGGGAGCCTTGGAGTTGAGGTGGACGGAGCCACTGGGAGAGAGTGAAATATGGGGAGGACCAGGATTTTGGGGAGGCATTGGTGGAGCCAGTGAAAACCTCGGTAGTCAAGATAAGTAATAGCTTGATGCAGCGTTTAAAAAAGAAAAAACAAAAAAAAACCTTAATGCAAAAAATCCATGGTGAACAAGATACTAAAATTTTAAATAAAGATAAGAGCAGTATTTTTCATTTTTCCTTTAGCCTTATGTGTTAGCTAATGTGCAGCATTGCTCCTTATTCTGTCTTTATTTCTACTTAGAGTTTAATTTGCTCTTATTTTTCTTACCTCTTTAGACAGTTGATGTTTTTACCTTTTAAATAGAAGCACTTGAAGTTTGAAATGTCCCTCTAAATACTCTCAGCTGTGTCCCAAAGATTTTGATGTTCTAGTTTTATTATCACTGTGTTCTGAACATTTTCTGATTTCTTTTTTGATTTGTTATTTGATGGGCGTGTTACTTAGAAAGGATTGCTTTCTTGGGAAATAGTGGGGACTTCGCTAGGTACTGTATCTTTAAAATAGTTACTTTTTATGTTCACTTATTATTTTGAACAGAAATATAGATGGCACAATATTCAAATGGGCAGGCAGGGAACCCTAACCCTCCCCCTCTTTAACCCGATTTCTGCTGAATTCTGTCTGGAAGAGTCACTGTTCATAATTGTGTAAATGTCTGTGGGTGATCTGTGCATATAACAGGAAGCACATATGTGCATGTATTTTTCCTTTACAATGAAATACCACAGTCTACATACTCTTCTATACCTTTTTATTATT
TGAAATATATATCTTGGGGTTCCTGGTGGCTCAGTCCTTTGAGCGTCTGACTCTAGATTTTGGCTCAGGTCATGATCTTAAGGTCGTGCGATCGAGCCTTGTGTAGGGCTCTGCTCTGGGCAAAGAGCGTGCTTGGGATTCTCTCTCTCCCTCTGCCCCCAACCCCTAGCTTGCATGTGCTCTCGCTTGCTCTCAAAAAAATTTTTATATAGACAGGTATATATCTTGAAAATGTATGCATTTTAGGACTGGGAGTTACAGTTTTCTTTTATACTATGTGGACTTTTTTCATTGATGAGTGTTTTCCAGTGTCAGTGAAGAATTTTCAGTGAGTATCTTTTTCCAAACTTTATTTACTCATTTCTTTTCTATTGACATGTAGGCTGTTCCTAGTTTTTTAGTTTTGTGAATGAACCTATGATTCATTTAAGCCTCAAACTGCCTTAAACCTTAAAGGGGATTACTGGAGGTTTCTTGGACCAGTCTGACGGAAGCTGGATCTATGGGTGCAGTGACTTAAGTGCTTGTCTTCTTGTGGGCTCTGAACTCCTTAGGGGCCAGACCTCTGTCCGTATTGTCTTCCAATCCCTGATGCTTAACTCGTTGCACCAACACAGAAGATGTGGAACAGTGCCCTAGGCACGCAGCACTCTCAAAGCCCTTGATGCTTGTAATACTTAATTCTCATAACAACTGTTTGTAACTTTATTTAACTGATGAGAAAACCAAGTTCTAGAGAACAGTTTTTTAAGAAAGTGCCCAGAGTCCTATATCTAGTATGTTGCCACGTGGGGATTCAGGGAGTACTTACCAATAAGCTGAATGGACAACACTGGACTTTCAGGTTGAAGGTGGTGGAAAGATGAATGAGTTTGAGCTTTGGGGTCATTGATTTTACAAGGTCCGATCTTAACTCCAAGTCCTTTATCTCTGTCAGCCTCAGCTCCCTCTTTCTTGAAAATAATGTTGTTAACCTTGAAAATAAAACTGCCAGTCATTTTACCAGCGAAAATGGGTTTATTTGGGAACAGCAAAGAATTGCAAAGGCAGGCAAGCAAGCAGGGAGGCAGCACAAAGGAGAGGACTGCTCTTTTATAGAGGAAAGGTGGGGAGTTGGGAGGGAGGAGGAACCTTCCTCCTGCTGGGTTAGTCAAGTGGTATCCGCCTGCAAGGTGCACCTCTCCTTGTTGGGCCTGCAGTGGGGGAGGAGTGGGGAGGTGAGAGCTACCCCTGCTGGCCTCCAGACTCCATCCTAAGTGGGGCCTCCTGTTATTAATCTTCACGACGTATTGGTAATGACCTCAGAGTTTATTAAGGAGTTAACTTTTCCTCGTAGTATTGGACTAGTGTCCTGTCTTTACTCAAGGACCGGTGGTTGTCATTCCCTTTTGCTGCTGCTTGCGCTTTGGGCAAGTTCCTAGCGTCTCAAGGCTTTTTTCCCTCATCTACAAAAGTAGACATAATTATATTCGCCAGCTTGTTGTAAAATAAGCAAGAGACGCTCCATTAAAGTGGTTTTAGCATTCTTTGAATTTTTATTGTGGTAAACAAAAAACAACATAATTTATCCTCTTAACCATTTTTGTACAGTCGTGTTACATATATTTACATTGTTGGGAACCAGATGGCTGGCACTTTTTATCTTGCACACTGAAGCTCTGTCCCCATTGTTTTCTGAGGTGATAGCACCCTGGGTCACACCATTTTATATTCCCACCCATGGTGCACAAGGGTTCCGGCTTCTCAGTGTCCTGGCTAACGCTTGTTATTTCCTATTTCCCATTTAAAAAAAAAAAGAAGAAGTAATCATCCTGATAGGTGTGAGGTTATTTATAACATTTTTTAATGATAAAAATTTTAGGGAGAATTGGAAAAATGACTTTAAATTTCTTGCTAAATCGGAATAGTATCTGTTGATACCAGTGTGAGAAAACCAAAAGCATAGAGGAGGGCCTTTGAGCAAGAGGACCCACGACTGTGTATCTGTGTTTGGGAAGAAA
AGTCGCCTTCTTCAGGGCTCTCCTTAGGATACAGCTGGGGGAGGACTGGACCCCTACGATGCTGCTGATCCTTCCTGAAAATGGGCAGTGTAGGTGGTAGAAGGGACCTGCTCGCCAGCAGGGCCCCCTGCCACCCACGGGCCTTCCCGTGTGGCTGTGTGGGTGTCACCGCACAGCCGATATCCCGCAAGCCACCACTGTTTTCTCAGCCGCAGTCCCAACAGGGCACTCTGCTGTTTGCTCGGTCAGGTGAGCGATCACACTGGGGGTAAACTGGATTTACTGGGTAAAATAAGAATTTACGGTGACAAAATGATAAAGTAAGTTGGCTGTATATTGATGTTCACTAAAACAGGAGTTGCAAAGTTTATTCGAATGGTGTTAACATTCAAATAAATAATGGCTTGTTTTTCAGTATTTGTTACTTGGTCAGTATACGCCAAGAAACCCCACTCTGTTTTATAACACGTACAGTTAGGGTGACAATTTTGGTCAGTTTCTGGCCCCGTGCTGTGTTATGCCTCTACTAGTATATTTGAAAAACTCAAGTGGCGTCGTCTTTGAGATTTCAGGAGCCTTTTTTGGTGGCAAATAACCTCCCAGCAGTTTCTAAACCTAGAATTAGCTTTCATCTCCTCTTTGGCAGAACACATGAGAAATGGCCATTAGTGTCTGTGAAAATACTCTAGTTGAGTATTGTCTAAATTGATAAGAAGTTCAGAATTTTCTGCCTCTTGCGGTTGCAGTTGCCCTTCTATTTTATGTATCTTATTTTGCTTAATTCATTGCTACGTGTATTTCCTGGTGATTGTGGTGCATCTCCCCGGTCCCCGCTCCATGTCCAGCATGTACTGTGTTGGCTTGTATCCGCAGTCGGGGGATCGCGGACTCGGGAGGACTGTCATGGGAGCCGCAGAATTTAGTGAGTTGGAGTGCTGCATGGGGATGAGAGCAGCCTGTCTGTCTCATATTCTTTCTGTGATTCAGTCATCCTTTGTAAGCCGAGGGAGGCCTGTTTCCTGGTTCTCTGGAAGCCTTTGCAGCCTCCGGAGGTGGTGTCGTTACCGGTGGTGGCTTGAGTGTGTGCTCTGGCAGGTGTCCCAGTGCTGGGGCCAGCTCTGCCGCCGACCAGTTAGCTGTGACGTCAGGCACGTTGCTTCATTTCTCGGTTCCTCGGTGTGTCCGCCTGTCAGGTGTGCCTTGTGAACTTGCTGGTTGTTGGAATTATTGATTGAAAAAATAGGTGAAGTCCTGCAGTGGGTTAGCGAAGGAGCACACGCTGGAGGCTGACTGCTGGAGCGCGATGTCCAGCTCGGCTCTGCAGGAGGTCTGTGACCTCAGACAAGTTACCTAGCGCCCCATGCTTCTGTTTGTCATCTCTTACACGGGGGTAGTAGAATCTACCTCATCAAGTTGGTTATTAATACCTGAGTCCATATGTTTAAAGTATCTAGGATAGGGCTTGGCACAGAGTAAGCATTAACTTGGCATCCCCATTGTATCATTATCATTATCTTTTCTTTGTCATTAGTGTTGCTATTATGCTATTTGCTGACTGCCACGTAGTCCCTACTCACGTGATAGGTATTGTCATTGTCCTTGTGGAAGTTCAGGATGGCGAAACGAGTCTTTCCTTGTCTCACAGATGGAACCGGGGTTCCTTTGTATCTTCCAGTTGCAAATTTAGTGCCTTCCTCAACTTCCCCAGAGTTCCTTCAGAGTAACAGAAGGGAGGAGGTATAGTAATTGTTAGAAACTCTGCAAGAACGGCGAATAACACCGTCCCCTTTTGGAGTATGTTGTATTTTGATACCTATTATCTGTTTGTCTTTGGAATATGCTTATATCCATTCTTATGATTAAATTTCTTTAGTCCTTATCAAGTCTTAATTTTTGTTGATAGATTAAAATTTTCAGAAAAGTTACTTCTGTTTTGTGGTGGAAACAGGCACAAAGACATAGGAATGATAACTCTGTGAATCGTAATAGAATTAAGTTTG
GGATAGCACACCCAGCTTTTGGAAGTCAGGGTGTATTGTAGTGATCAGCTGCTAATTGGAGCTATCGTAGTCTAATAGTGTTGATTTTACTTAGATCTAGAACTCTTGATTAAAGCAAACATAAAAGAAGTAAGAGAGGTAAATTTTGAATTCTGTATGTGTAATATGAATTCCAGTTTTCTTTCACATTCCTCCTGTTAGCTGACTTGGAAGCATTGACTAGGGCTTTCCTCTTCCCAGAAGTACTGCCCTCAAGTATTAAGGCCAGCAAATAAAAGCATACAACTGTATGAGAAATGTGCGAGTCAGACTTGGATTTGTGTGATTTGCTTTTGGTGATATTTATAAGCAGCTTTTTTTTTTTTTTTTTTTAAAGATTTTATTTATTTGAGGGAGAGAGAGAAAGTAAGCACAAGTTGGGGGCAGGGGCAGAGGGAGAGGGAGAAGCAGGCTCCCCTGACATGGGACTCGATCCCAGGACCCTGAGATCATGACCTGAGCTGAAGGCAGATGCTTAACTGACTGAGCCACCTAGGCGCCCCTCCCCCACCTTTTAAAAGATTTTATTTATTTGCGCGAGAGAAGCAGTTTTTTCCTTAATCATTCTTTCCGGTGACTTTCTCACCTAAGACCAGGTTTCTGTAGGGAAGCTGTAGTGGACAGTACTGCACAGTGTATGAAGGGCTTTGGATTCCCTTTTCTCTCCCTCATCTTGCTCATCACCTTGTTTGCTGGCCTTCTAATGATTTCTGTCTAATCTTGCACAGTATTGTCACTTTTGTCATCCTGAAATTTGAAGTGGAGGTTCTCATGGGAGTACCAGAATACTACAGTTGTGTGATTTATTTTTTATGTGGGATGGGGAGAGGTGGTGTGCATGGTCTTCCTAGATTTTGTGTCAGTTTTTCTTTTCCAATTTTTATATTCTTGAAAAAGCAACATTTTCATATGGTTTACTTCTACTTATTCGGTGAATACTTACCAAGCACCTGAGCTGAGTGGGGTCTCGGAGGTAAAGCCGTGCCCAAGACTGAGGCAGGCCATGCTGCCACTGAGCTTAGTGCCAAGTCCTGACATCTAGAACGTCTAGATGCTTTTTTTGTGACCACGGCCTCTAAAAGAGAAGAGAAATTCCCTCTGTCCTCTCCTTGTTGCCTGTAGGTGACTGATGGATGTGTGGGATGTGGCCTGTACCTCTTCCTGGTCACTTCAGTAAGAAGGCCTGGAAGACAGTATGTGCAGAACAGATCAGATTCTTTCCTATTGTGGAGATGGGGTTGTAGTGGGGGCAGCTGGACAGCAAACGAACGTACTGTGTCAGTCAGTCCCGTGGTATTTGAGAAGGTGTAAGTGCCGTGGGAAATGAAGCAGGGTAAGGGCATGGGGCAGGCAGTATAAAGGTGGGCACGGGCCTGGTGTGGGCAGAGGACAGCAGGGAGGTCAGTGTGCAGTGTGTGGAAGGCCACGAAACAGGAGCCAGGCCGTGGCGAGACAGAGGGTGTAGGTGCGAGGGGAGCCACCTGTACAGGGCCTTGCGGACCATGCTGAGTATGTAGTTTGCACTGCTTCTGGCAGAATTGGGGAGCTGTCGGTGAGTTTTAGCGGAGTGAAATGGTGTGACGGGCGTCACGCAGGGAACTGGTTGGGAACAGAGTATAGGGCAGTGAGGCCTGTAGCCGCGGCCTGGTGGCACATGGCAACAGCTGGGCTGGTGGTGGCAGCGGACGTAGGGGCATGTGCACGGTCCAGATTGGGGTCCAAGCAAATCGTAGTCTCTTTCTTGTAAGTTTTAATGAGTTTACCTGTGAGGGAGGACTTCCCAGAGTTGCTTTTAACTATACTGATACGATAAAGAGTTTTTTAAAGAAACTAGAACTTTTTAAGGAATGATGGCCTTTATGTTAGTGCGTGAGTTTCTTATTCGGAGCGCATAAAGGGACTGCTCACCGTTTTCACTTAGGCCACCATTAATGTAGGCCTTTCCCGCTCTTTTCAAGACC
TCACCGGCTCGAGAATCTAAGAGCCTCATTGGTCTTTCCTGTTTATCGAGAAGCAAACAGGAGTGGTGCCGTCCCAGAGTGACGTGTCCTCGTGTAATTTCTCAGCCCTTTGGCCGTAGGCCCGCGCCCCACTGCCTGAACCACACTCTCCTCTTCGCTGCACGCGGGGAACGAGCTGCTGTGTGTCGGGAGTGACGTGCGGCGGTTTTCTCTGTGACAGCGCCCAGCGCCCTAGCTTCTCCTCGGTGTGGCGGAGCCCCGTCCTCTCCTGCCCGCCCGCTCTTCTCAGTGGCCCGAGTGCTTCTCGGCTCTTCCGGGCTGCTGCTTCCGGCGGGGCTCTGCTTGGTGGCCTGGAGGGGTCTTGGCCTCTTTCGTCTTGTCATCTTTTGTATCCTCAGAACTCTGCACATGCGGAGGTGATATTTGGATATTGAGATAAATATAAATTAGCTCGAGGGGTGGGAGAGAAAGCTGCCGCCCACTGGTTACTTTGCAGTCAGAGAGTTGGCTTCTCCTCTCTGTCACCTAAAGAGCTCCCACGTCTGTCCTCTCGTCACCTCCTCTACTGCTGTGGAGGCTCCAGCCGCCGTGCCACTTGCTTGCACCAAGCCCTCTCTCTCCCGTGCAGGTGGTGCCGTGGCATTCATTCAGTCTGGCTCAGAAACCTTTTCTGGGTGTGTGCGTACAGGAAGACCTCTGGCTTCTTGGATGACAGGTGGGCTCTGCGAAGCCGTGTCTCTTCCTAGCTAAACGACTCCATCTTTAACTCCTCTTTCAAAGATGTGACAGCACTGGGGTGCCTTCGGCTCAGGGCGTGATCCTGGCGTTACGGGATCGAGCCCCACATCAGGCTCCTCTGCTATGAGCCTGCTTCTTCCTCTCCCACTCCCCCTGCTTGTGTTCCCCCTCTCGCTGGCTGTCTCTATCTCTGTCAGATAAATAAATAAAATCTTAAAAAAAAAAAAAAAAGATGTGACAGCACCGATGTTCCTCAGAAGACGTGAAAATTGGGTGTGTAAAATATCGTTGGCAACTAGTAAAGGTAGCTTCTGTTTTTTAAAGTCTTGAGTCGTAAGTTCCAAGAGAGACTCCGAGTTTGCCTTTGTGGTTGGCATGTCTGTTACTTGATGGTTCAGATTAAACCCGAAGCCATTCTCAGGGGCCTGGGTCAGATACCAGACTTGCTGCTGTGGCGTGCTTGGATTCCTCCTATGATGAGAGTAGGCCTTTGTGTCCCGAGTGTCCTCAGTAATGGTGATCTTTCTGCTTGTTTCTTCTGTTTCTTTCCTAGCTTGCTTGCCTGTGTTTTTCTGGAGCCCCTTTTCTTCCCAGTGTTGCCTGGGGTCAGAGTTCCTTCTGGTGAATGATATGTTTTCACTGGGGGCATCTAGGAGGTTATTTGAGCTCTGACTGCTATTAGGAGGCTGAATGTAACGCCTGGAGACAAAGCCATCATCGAGAGTAGTATGTCAGAAATGAAACTAGCTGTCCTGGGGCATCACTGGACACAGATAGGCCTCTTGTTCCCCTAGCCTTTTTCAGCTCTTGTTTTCACAAGTTAGTGAATTCATAAAACCCTGGTCGTGGTCACAGTTAAGCAGAGGACTCGATTTTTTCTTCGTTAATGGGATTTGCTACGGACAGAATTACCCGCGTAGTAGGAGAGCTGAACTGTCTATGTCTTGAATGTGTATCACATGTGCTCAGACAACAGAGGCTGTAGGAGCCCAGTTTCTTACTGTCTTACTGCCAGAGTGGAGTGTGTTTAAATAGCTACATTTTAGAGATGACCCAGACTATCTCTCAGTTTGAATGGAAAAAGTGTAAGTAGCTTTACATTTTTTTGAAAAAAACTTACTCGTACAGATTGTTAGAGTGTTTTTCTGTCTTCCTTCTTCAGTATGAGTTTCCTACTCACTCATGTTTTGAAATTAAGAAATTGGGCATCTTGTATTCCTCAATATTCCCTAAGCTAGTTTTAAAAGAATCTCGCAACTTCA
AATTCTTGTTCCTGTGTGTTTTCTAAATACTTTTATAAATTTGCAGACTTAAAACTATCGATCTGAAAAAACCTTTACCTTGGAAATATCTGGGTTCCTATAGACATAGTTTCTACAGATTTGTTTTTAATGTTGATCAAGATGTTTTCCCCTGCATTATTCATTTTTCATCAAGACAATTACCTTAAGTCTTAAGGTCAGAATTAGGCTGGAAAAAGGCCAAAGGCATGAGTTTGAAAACAAAAATAGTCGGAGGAGCCATCTACAGACATGATCTGGGTCAGACTTGATTTGCAGCTTACTCAATTTTAGAATCGCCTGTTGGTTTTGTGAGCAGAGGTCTGCCAGATGAATTGAGCAGAAGGGTGGGATTAGCATATTAATCGGGTGCTGGCTACTGGCCTTCTTTTTCTCCTCCCTCTTTCCCCTCCCTCCCTCTCTCCTTCCCTGAATGAATCTAGGAACACAGGCCCCTGGGGTCACATTACTGGCTGGTTTCCTTCTGCTCTGGAGCTTAATCTAGCCAGGATGGTCTGTGTTTCAGATCGCAGAAGCAGAAGATTCTGTAACTGAGAGGCATTCTTCAGGCTGCCGGAAAAAATTACAGAAGGAGCACCTCCCAAATTTTGCTTCAAGCTCTGAGAAAAGGAGCACACAGGGGAAGCTTAGTGTGGCTGTGGATGGAAGCGAACGCTGTGGGAGCGATGAAAGGGGACTTGGTGCGCGGACGCCTGGTCTGATCTTGAGGCCTGAGTTTATGTTGCTGGAACTGGCGGGCCAAGAGGCCCTGAGACCAGCAGGTGCCGTCTGTATGGGGAAGAGCGGCTGTAGTCCCATTTCCGATGTGTTGGGCTAAAGGTATAGGTAACTTAAAAATCTGTTTGGTTTAAATTTTATTCAGATTCATGCTTTTGCATTAAAAAGGTGGATAAGAGTTTTTCAGACCTTATTTCAAATAGATTTACAACGAAATTTAAGGAAAAATGGAAATTGATGTACTACAGGTTTGCAGCTCTTGGCATAAAACCAACTAGATAGCTTTTAGAAGTAAATAAAAATATTTTTATCAAAGTGCATTTTAAGTAAGTTATCTTTTCTGTTCTGTGTCTCTTATAGTTTTATGTTTTATTTCGTGTGTTTTAATTAAGGCACCCATATCCGTTCTGTGATGTGGAAGTACGAGGCTAATTTTAACTTCAATAGGATTGGAGGGAAAAAGTGATGTGGTTTTTCTTTTTTCAAAAGTTGGTTCTCTTTACTCACTGTAAAGATTGTGCATTTAATTTGCAATTCCATATTATCGTAAGGTGGTCTTATCACTAAGGGTCAGTAATACTTGGATAAACATTTTCCAGTTTAATGTTTTTAGGGTTTTTATTTGTATAAAAATATAAAATACAGCATTTTCATTGTAACATTCAAGACAGTATTTGGGAAGCATGTTTAGAAGTTAAAAATGCCATGTAATCCATGTATGAATAAGACCAAATAATTTATCTGCTTCTCTTAAAGTATTAGTGAATATTATTCCCGGGGGATGAAGTCCGTAATAAAGAATTTAATACAGATACTGGTATTTTAAAGAGTATATTCAAGTATCACGTTAACCTACTCAGGAAAGACTTTTACAAGGAAGAAACCTGCGCTGGGTGAAGACCTGAAGTATTATAGTAGACCTTCAGGCTGATTCGGTTCAGTGTTTAGCTTGGAACTTTCAGAGCCGCCAGGATGTGGGGGTGCTCGCGCCCGCCAGACCACGGTTTAGATCGCTGTCAGATCGCGTCTCATTTACCAAGTTGTCGGCATCATCTAGTCATTCTTGTCTAGGCTTTTAAACATTTCCCCTTCCTTCCTTCCCTTCTCTTCCCTTCCCTTCCTTCCCTTCCTTTCCTTCTTTTCCTTCTTTTCCTTCCTTTCTTTGCTTTCTTTCTTGCTTTTTAGGTAATCTCTACACCCATCGTGGGGCTTGAACTCACTAACCCCAAGATCAGGAGAGTCGC
CGACTGAGCCAGCGCCACTTTTAAACATTTCTAAAACATGTGACGTCAGACCTCAGATGTCAGACCAAACAAAACGCCTGTCACTTTATTACCTAATTAAGTATTTAGAGTAAAGATTTTGCTGAGTTAAATTCAAATTGTTGAATTTTAAAGGGCTTTGGGTATGGAAACTTCTGAAAACTGTAATTTCTCACCTGAGGACTGCACAGTATAATTGAGCATGACCAGTAACGAGTGCTCAGAGGCAGAGAGCTCTTTACTATTCTTGTTGAAGATTTTGGTCTCTCCCAGACTTGTTGGGACCTGTATGCACAATGCTGCCTCCGTGGTGTGACAGTCCTCTGTTAGCCCTGATCCTTAGCAATAAGGCTCTGATTTCACTAAGTCTAGGCTAGATTCATGTCTATGAATCCAGTAGCAATGGATATTAAATAGTTGGCTACTGGGTTTTTAAGAAATTCAAGGTGACTTTAGAAATATGAGCTTCAGAAGGAAAGAGAGACTGAGGTGCTTTTGCTCATCCCAAAGCAATTGATAGAAGCAGCTTATTTCCCAGTATGTTTACTGACTGGCAGAGCTCGTGAGGAGAGGCGTTTTTCACTGAGACGTCATTTCGATAGCGGTCAGGGTTGGGTAGGAGAGCAGAACCACGTGTATGAAAGAGGGGAAGAGGTAGGGACAGCATCAGGCTTAGATCATTGCATTTGCAGGCTGGAGCAGGCCGTCACCTCTGACGCATGGTCTTGTTTCTGGATTGTGCAAGAGGAGTTTTCTGACAACACTAAGGAGGTTGTCACCCTGTCCCCTTCTCAGGGCTGAGTACACCATCTCCCCAGGGGCACGCAGTGCTTATTGCTGTATTGGGATCAAGTGCCATTTAAAAAGTCCAGTCTCATTAAGTGTATGAGTTTCATGAGTCATTGAGTTTTATGGCTTCACAGGTAGGTGAAGCTGGTTACTCCCACCTAGTGAGATGGCCTTTGTCAGGAGCTAGGGAATTACAAAACAACTAACATGTATATAATGCCGAAAGCACTCTGACAAGCTGATTTTATCCCCACGGGAGTCCTACGCTGTAGGAACCATTGATGGCCCTATTTCTGAGATTGAAATTGAGGCAGAGAGTGCTTAAAAAAAACTTGTCCAAGGCCCTATAGCTTCTAGACTTTAGCCAGGCAGTCTGCTCTGGACGTTTTTGCCCTCAACCTTTGCTATTGCCTTTCAGCTAAATAGGGAGAAATAATTGTCAACAAGAGGTTTTAGCTGGACAAAGGAGAGGGAGAGGGTAGCTTTTGGTGTGGTTTATAGATTATTTTCTGGATAAAATGTAAAAATAATAGGAACGGTTTATTGGCTCTTGCTTGGTGGTAAAGGAGAATGAGAAATTAAAGATTTCTTTAAAAATTCAGGAGTGGGGGAGCCTGGGTGACTAACTCTACTAAGCGTCTGCCTTGGATTCAGGTCATGATCTCAGGGTCCTGGGATCCAGCCCTGCATCAGGCTCCCTGCTCAGCGGGGAGCCTGGTACTCTCTCTCCCTCCTCCTCTCCCCCAGCTTGTGTTCTTTCTCTCTCTCAAGTAAATTAAAAAAAAAAAAAAAAAAATTCAGGAATGACCCCAGCTCTGTAAAGGTATCTGCTGGTTGTTTCTCTGTGGTTAGTTTGAATGTACTTCTCTGGGGTTCGTGATGATAGTAAGGCAGTGTGCTGGTGTGTCTGTGCCCAATGCTGAAAATCACCACCCCAGAGGCAGTTTGAGGCCTGAGCTCGGTTGTTCAGCACTTGTCCCCCGTCTCTACTCACCACGAGTGCTATTTGAGGGAACTGCAATGAGCTCCTTCACAGGAAAATTGGCAGTTTGACGTTCAGTGCCACTCACTCCCATCATTTCTCACCTGACTACTTATCTTCCCACTCTTGCATTCCCAGGGTGATGCTTAGTTTTTTCTGGTTTTGATTTATTCGCCCTTGTCTCTGAGGCCTTTGTGTGGTTCAGATTTGA
GTTGGGAGGCCAGATAGGAGTTCTGCCCACATCTCTGACTGACTGTGTTACCTTGGGCAGGTCACGGGAGATCTAGAACCCGTGGTTTCTTTATCTTCATTGCACCTGCGCCATGTACCTCACAGGGTTATGGGTGAGGGCCAAAAAAAAAAAAAGAAATTCCTGAAAGTGTCTTTTGAAGTATAAATGTATAGCATTATTAATGTTCCCAACCTCCCCAAGTTTCTTTGTCTACTCCCTGCTTTGATGCCATGCATAAGCTTTGGTCATGGTACCTTTTGCATTACTTGTTTACCTCTGTACCCTCAAAGGCCCTGTGTCTTACTGTCTTTGAATTTCCTAGCACTTGGCTCAAGGCACGTTGGAATGGGTACTGGCTCAGTAATGTTCAAATGAATGAGTAAAGAATGTCTGTCTAAGGGATGTTTCTGGTCATAGTTGTTTTTGTCGTTGTTCATCGTTTTTTCTGAATGAAGACTTCCTCCTTGTCTCTATGCTTCTTGAAGTTAGCCTTGTTAAAAATCTGCCCTTTCTTACTTTCTTGTGTTCCCTTTTGCAGGATGTTAAATTCCAGTATCTGTGGCCTCCTTCTTCAAGGGCTAGGCTTACTTTTAAATATTCATCTGATGAGTCTTGCTTTTAAACAATCAGATAAACAATCAGATAAATCAGTTCTTCCAGCTATTGACTTAGAGATAGAAAATATTTAATATTTATTGTTTGTGTATTCATTTAACAAATACGCCTTGAGTACCTTTTGGGTACCAAGCTCTGTTCCTGGGGCTAGGAACAGAGCAGTGAACAAATTGGATGAGATTCCTGGCCTTATGCAGCCTCCGGTCTAGTGGCGTGTCAGTCAGTGAAGAAGGAAATGAATACATAAGAGAATTTCAACGAATCTTAAGAGCTGTAGGAGGGAATCACGTGAAGAGGGCTTCTAGACCAGTGAGCAGTCGTCATATTTATAAATAAAACTGAATATGTTACCGATGTCGTGCTCTTAGTTTCCCTTTGTATCGGGTTACCTGAAAGGTATCTAATGGTGTTGATGGTGAGTACTTGAAGCTCTAGCCCATCCATGCCTCATCCACAAGAAAGATACAGAATGGCTGAGGAGGAAGGTGGCTATTCCCTGGACTTTTGGTTTCATGAGAGCACCTCAGTCTGTATGAGTGCTCCTCAACCTTGACTAGAACCCTCTTTGTTCAGGTAGCTCTTTTTGAGTATCTCTGATGGACCAAGGGGGACCCAGGAAAGATAAGGGAGTCATCGATCACCCAGTAACTTCGCTGTGCCATCTTGCTGTGTGTCAGTGCACCCACATCCTCAGTGCCAGGGAAACTGCTTGCTTATGGCATTGTGTGTCCACATTCGTTCTCCACATTGTTTACAATGTGCTCTGGATTATAAAGAAACAGTACAAATAAAATATGCCCAAGCCAACACCAGAGTATTTCATTAAGTACATAAGGACTTCCTAAAAAAATTTACTTTTACATGAGTAATTAAAGAGGAATAGACTTCTTCTGACAAAAATTTTTAACAGAAACTGGTAATAGTGACTTCCCCCCACCAAGAAAGAAACTAGGAGGGTAGGGCACAGAATTTGGGATCACAAATTAGCAAATGTTACAAATATAGCAAATAACAGGAAAATCATTCTCTTCCTGGACTAAGGCCTGTTAGGCCACCTCCTAAGTAAATATGTCTTTAATCTGTTCACTTTCTATTTAGTCCAGGTCACCTCTGCTGTCACCTGCATGGCCAGCATGCCTCCCTCTCCTCTTGATCCCCTTGTCTACTGTCCACGCAGCAACTAGGGTGATCTTTTAAAACACAACCATGCCACCAGCAGCCTCACGTGCTTGAAATTCACACCTGGTGTCACCCTTTGCCTGTTTGCTAAGCTTCGGCCATACTGCCCTTCTTTAACTATCACTGTCCTGAGCACCCCACCCTCCTTCAAAGCTCAGGGCCTTTGCATATGCTGCCCCCTCCAC
CTAGGACGCTCTCTGCCTCACTGAAGCAGGCTTCTCCTTTAGATCTCAGCTGAAATGTTTCTTCCTTGGAGAGAACTTCCCTGATTCCTCAATCCAAGTCTATCTTTAATTAATTATTCTCTCTCGCAGAACTCTGTTGTTTTCCTTCATGGCATGTATTCCAATTTGGTGTATCTGTATTTATTATCTGTCTTCTGCATTAGATTGTGAGGGCTATGGGGGCAGACGTCTTTACTGTGTTGTTTACAGCTGAAATACCAGAGCCACTTATTAGCACATAATCATTTAGTACATATTTGTTACGTGAATTAATGAATGAACAAACTGCTTGGGAACTTGAGTTCAGGACTTTATATCTGCCTTACGCATACTGTAAACCTGCTATGGTTCCGTTCCTCACTCCATCGGTGAAGATTTTGCTGTATCTCTCCTTAAACATCGCAGTTGGAAAATGCTCCCATTATTCATGTGCTCCACAGATCTTACCAGCATGTTACTGATTTCTATGCCCAAGTAACTGATAAAAACACTGTACCTAACAAAGCCAAAAATGAAACATCAGGTCACAGACTGACGTCTCTCTAGGTTGAGAGCTGAATATCTCACTTCTGATCCCGGAGTTGATACTCCTTTGTGTCTTACTCTTCGCCAAATCAAGAGAACCTATGAAGTTTGTCACACAGCCACATTGTCCACTGTGCCACCACCACGCTCAGCTCTCGATGTTCTCTAAACCTAGAGCCCTCTCACACACCGCATCGTGGCCTTCTGTAGCACGGATTCTCGGGGAGCTCCACTCAAGCTGCTGGAAATCACTGCTGCTCCTGTTAAGTGTACACATCTCCTGTTATCCCTTTACTGCGCTAAGGTAGCTAGTAGTGAAAATGAGCAGGGGAAACTATAGGTTTCACTTTGTTAGGATTTTTATTTGCTCCTGTCTCATCTCTTTTAGATTCACTCTAATATCTTGCAAGTCGTATCATTCAAATAAATATTTACTGAGCATCTGCTGTGGACCATGCACTATTTGAATCCCCATAGATTTAGGGCGATCAACACAAACCCCCTCAGTCCTGTATAGCTACAGTATGATCAGGCGCACAGAGAATTAAAAAAAATCATATCTAAAAACTGATGGAACATTATCTGATTTCAGTATCCTATTTCTTAAGTTGCTTTAAAATACCAATCTCATTAGGGTGCCTGGGTGGCTCAGTTGGCTGGGTGTCTGGTTCAGGTCATGATCTTGAGGTCCTGGGATTGAGCCCCATGTCAGATTCCCTGCTCAGCGGGGAGCCTACTTCTCCCTCTCCCTTTGCTCTTTGCCCCTGCTCGCGCTCTCTCTCTCTCAAATAAATAAAAAATCTTAAAAAAAAAATCAATCTCATCAAAACTTACACATCAGACTGGTTTTGTTCATATAAAGCTTTCATCTCCTCCAAAACTTGCCTGAGTCCATCCTCCTAGAACATACAAAATGATATTGATACACGTCCATTAATTCCACCAAGTCTGTAGCAATGTCTAATCTACTCTATGTTTATCTTTGATTCATATATCTTATCAAAAAGCAGTACCTGTGGGAATGCCTAGAACAAGTGTTGGTGAGGATGAGGAGAAAGTGGAACCCTCATACATTGTAGGGAGGAATATAAAATGGTGCAGCCCTATGAGAAACAGTCTGATGGTTCCTCAAAACGTTTAACATAGAATTACCATATTATCCAGCAATCCCACTTGTAGGTATATACTCAAAAGACTTGAAAACATATGTTCATTCAAAAACTGTGTATAAATGTTCAGAGCAGCATTCTTTATGGCAACCCCGAAGTAAAAACACCCAAACATCCATCAGCTGATGAACTAATAAACCAAATATGGCATATCCGTTCAATGGAATATTATTGGGGCATAAAAAGGAATGTAGTCCTGCATGCGTCAACATGGATGACCTTTGGAAACATTATTCTAAGTGAAATAAGCCAGACACAAAAGGATAA
CTATTGTGTGATTCCACTTACCCGAAATATCTAAAATAGGCAAATTCGTGAAGACAGAAAGTAGATTAGATGTTACCAGGGGCGGGGGGAAGAGGGAAATGGGGAGCTATTGCTTAATGGTTACAGAGTTTCTGTTTCAGTTGATGAAAAAGTTTTGGACAGAGGAGTGATGGCCGCACAATGATGTGAATGTAATTGAGGGCACTGAAGTGCACACTTAAAATTGGCTAAAATGGCAGCTTTTATGTTATATTTTACCACAATAAAAAATAGAGGAAACAAGCAATAAAAGGAATGAATTACTGACAACGTAAGCAATCAACATACTGATGAAGGATATTCTCAAGTACACTGTACTCAGCAAAAGAAGTCCGATACAAAGGAGTACATACTGTACGATCCCTACTGGCCCTTCCCAGAAAAAGTATGCAACTCCTGGCACCCTGAATCCAGACACCTCCCCGCAAAAAAAGACAACTATAATCTGTAGTCGCGGAGAGTACATCAGGGCTTGCCTACGGCTACAGAGAGTAGGTAGCTACAAAAGGGGAAAAGGGAACCCTTGGGGTGACAGAATCCTTGACTGCGGCACTAGTTATAAGGATGTATAAATTCGTAAAAAACTAAAAAAATCTGCTAAATTTGTATTTTGTTGTATATAAATTATATCTCAATAAAATTAACCAAAAAAACCCACCACTCCTTTAGAAGCAATAAAGCATGACAAAAGTATGTAAATAACTTTAACGAAAACAGATCTTAAAAAATTACTACAAGGGTAGTAGTGATACCTAGTCCTGGGATCAAGTCCCCCATCAGGCTTCTTGCTCAGCGGGTGTCTGTTTCCCCCTCTCCCCCTGCCCCTCCCCCTGCTTCTGTGTATGCTCTCTCTCTCAAATAAATAAATAAAATCTTAAAAAAAATCACTACAAAAAATGAACACTTTGGTTTGCAACAACAGAAGGACCAAAGGTGTTTCTCTACTATCCACCTTGGGGCAAATTTTTTAAAAAATTTCCTTTCGAAGGATAAAAATATTAAAATTCTGAAGTTCATAGATATTACACAGTAGGTCTGTCAGCAATCCAAAGATAAGTGACCCAACTACTTTTAGGGCCAACATACATGTAGCAAAAACATTTTGGCGCTATTGGTATAACTACAAAATCAAGAACTTAACCCTCTTCAAACATAAGAAAATACGTAATTCCCAATGAAAAACGTAAGCATGTCTTCTATCTTCCCTTTCATCAAGTAGTTAAACAGAGATCATGGAAAAGTCTGATTTATTAGAATTCAGTTAAATATTCCTATTATCAGCAAATACTATTTTAAGGAATAGCTGAAACTCCTGTATGATTCATAGATCTGCAGGTATACAAAAGACATGTGTGAAATAATTTTATAAAAATACACACATGGGGGCACCTGGGTGGCTCAGGCGGTGAAGTGTCTGCCTTCAGCTCAGGTCAATCCCGGAGTCCCAGGATTGAGTCCCACACTGGGCTCCCTGCTCAGTGGGGAGTCTGTTTCTCCTTCACCCTCTGCCCCTCCTCCCTACTTGTGTTTTCTTTCTCAAATGAATAAAATCCTAAAAATAAAAACACACACACACACACATATGCTGGGGCCCCTGGGTGTCTCAGTTGGTTAAGTGTCTGCCTTTGGCTCAGGTCATGATATTAGGGTCCTGGGATCAAGCCCCATGTTGGGCTCCCAATTCAGTGGGAGTCTGCTTCTCTCTCTCCCTCTCCCTCTGCCCCTACCCTCTGCTCGTGTTCTCTATCAAATGAATAAAATCTTTTTAAAAAATTAAAAAAAGATAATACACACATGCTTTCAGATTTAGATTTATCTATAGTAAAAATAGTACTGTTTTGTGTTCCCACCTCAGGCTGGGAGCCCAAGATAATTTTTCTAAAACCTCACTTAAACTATTAGCAGTTCTGCATATAGAAAGTGGACAATTATTTCAATTTGCTGAATACAGCACCTAACCT
TGAGGTCGTGGAATGAACAAGGCAGAGTCCCTCCTCTAGACCCAGTGACTATCATCTTCCTGGGAACAATGATTCTTGAAAGGTCCTGTGGGTCATGGGCCTATCAGCCCTCACATCAATCAGATAGATTGGCCTGTCCCCGCTTGGCTGTGTCAGAGACTGGCCAACCTCCTCAGGCCGAGTCTTCCAGGCCGCTGAGTCACCTGAGCAGACGGGTTTGTTAGTGGAAGGTGCCTGTGCGGCAAAAAGCTGCAAAAGGTGCTCTGCCAAACTAAAACCTAGAAAAAGGAGTGATTTTATAACTTTTAAGTTTGCCTCTGAACCCCCCAAAAGTGGTAACTTAAGATTTGAGTGAAACAGAGAGCTGCATGGACTGAAGGTCTGAAGAGCCAGTCATAAGGCCGGGGCGGCCAGCTCCTGCTGGACGAGTCTGTGTCTCTTTGGGCTTGTCTCCTCATATGTTACATAACCTCCAAAGTGCCTGGTTGTCTGAGTGCAGCGTGGGGTCGTATTTTAGAGCCTGCGTGCCTTGGCATTCTGGCATCTCTGCTGCCCGTCCCACCACTGTCTCCTAACTTTTTAAATGAAGTAACTGTTCTGAAAGAACAACAGACAGGAAATCTAGGAAATCTGTGTTCAAGGTGAGGCTTTGCTCCAATATGCTGTAAGTTCAGACAAGTCCCTGAAGTTGATCTATAATTTCTTTTGGCTCAGTCTCATTTGCAAAATGACCTAACTGTTCGACCAGCCACTCTCTAATGTTCAAAACAAAACTCACCTTTCCCCAAACACTCTTCCTCCTGATCTCTGATGCTGTATCTGAGAGAGAATCCCCTCAAGATCCTCTGTGATTCCTCCTTCATTCATTACCCATCCCACCTCCACCCCTGTTCTAACAGTTACAAGTCCTGTTTGCCTCATCTCTGAAACCCAGACACTGATTTCTGGGCCCAGCGACCAGACATAGTTTGGACCATACGCAGCTCTCACAGTAGGTCTGTCAAAGAGCGATCATAAGCACCCCTGCCACTGTTCTTTCTTATCTCCAATCTATTCCATGTAGTGCTGCCATCACCACCCTCAAAACGTAAAAAACTGTCCTGTCACTTCCCTGTCTAAAATCCTTTACCAGCTTCCAAATGCCTTATACATGAATACACAACTCTCCTAGGCCTAGAACCCACCTTTGTAGCCTCTGCACACACATCAGTCCCCCCTTCCTATGTGACCATGAGTCTCTGCACGGCTGTATCCTTCAGCTGCATTGCCTATCTTCCTTCTCAGAGTGGGGACCTCATCCTTCCAGGCGTGGCCCCAACGCCCCCTCCTCTACCCCAGCTCCTACCAGCATTTCTCCTTATGCTCCTGTGTACACCTCTCTAGTGTCCTCACACTGCATTCTAATACTCACATTTCGTGCCCCTCTACCAGCAGAACATGCCCGGTATCCACGCAATGGCTGCCCTGTGTTAGGGAAAGTAGTCAAGGATGGAATTTAAAGTGCAAGTTTGAAACCAGACTGCCATGGTTTAAATCCTAGTTTCACTTCCCACTGGCTATGGCCAAGATACTTAATCTCCCCAAGCCTCTGGATACATGGCTGGAAGAAATGGTTTAAATCTCAAAGTGTTCTTATAAGAACAACGGATAACATAGGCCACGTGCTTAGCACCCTTTTGAGGTAGTAAGAGAAAAATAAGAATAATGGTAATAAGTAGTAGTGAGTAAGGGACAGGCAGGGCTAGGTAGGGAGAGAGAGGTAGGGGGCTACGGGATCAAGCTCATACAAATCTCAAAAATTCAGAGATATAAGGAAACCAGAGCTAAGGGAACAAACCAGACCATCCTGTCCCAGGTGTGGGAGCTGGGGTCTTATTATGACAGCTACGTGTGACCAACAAAGAATTACAGGACGCTAAAAAGGAAGCAAGCCACTGACGATGTTATCACTAGTCCTTACTCAAGGGTGCTATCAACAGAGAAGTAAAAAAGATTTAAGT
TCCCTGGTTAGCTTTCTATAAAAGACCAACCCTAAAAGCCCACAAGGGTAAACCTGTCAGGACCCCTCCCCCTCCTGAGAGCTTCTTCTGTTTCATCACTTACTGAACCTCTATCGGTTTACTCTCCTTTGTCTGAGAGATTCAGTCTTCGACTAGGTGAGACAAGAACCTCGCTGGTCTCCCACTTCAATAGCAGCGGCAGTGGTAGACAGAAAATTAATAGCGAAGACTGACGTCGCTGCTACTTGTATGTCAGGCATTGTCCAGAGAAGCTGACATATATATATACCACTCCTAGGGCCCTCGCGACAGGAAGAGTTGAGTACTATTATTATACTCTTTCCCATTTCTGCAGAAGAAACGGACAGCACAGAGAGTCTGAGTAACTGCCCCGAGGTCACAAGTAGGCTCCATGCCCAAAATGGGGCTTGAACTCAGGACCCTAAGATCAAGAGTTGCAGGTTCTGACCACTAAGCCAGTCAGGCACCCCAACCACTGAACAGATAACTTATCCAAGGTTACTCAGCTTCTAAAGTGGCAGACTTTGTATGTAAGCTTTCAACCCCACAGAAGCTCCTTTGATTTTAGAAGAGTTATTTTAAAACATTTGGAAAATAGCTCTAATGGTGAAGTCTACAAAGGGGGGAAAATACCCAGATTCACACGAATTCACACAGCCATAATTTACCTATATGATTATGGAAATTTTCATAACCATAGAGAATCAAAGGTGGAAATTACTGCTATAGAAACAATTTGTTTTACTTGGTTACCTTTTAAAAAGCAACATTTCTAAAAAGAAAATAGGACTGCATTCTAGCTAACCCCAGAAACTATGTTCCTCTTTTGCAAATAAAGATACAATAGCTGTGTAATCTGAATTGAGTGACATTTCCTTTTCAGCTCTACAGTCAGGGATAATTTAGCTAAGTTTTATTAAATACACAGATCTATAGTGGACTGTGCTACAGAACTGTATTCCAAAAATCACCAGTATCCACAACCTTCCTCATATACCTTTTTAATTTCAGAATCTCGGCCTGAGCTTCATTTCCTTACCTGTACAATGGGGCCAACAGTACACACTTCTAAGGGGCTGTGGTGATTGATTACTCTTTAAGCAAATATTCATGAAGTGCTTACTCTATACTGCATATTGTTCTAGACACTGAAAATAAAGTAGTGAACAAAGTACTTGTTCTCAAGTCTACGTTCCAGCGTGGGATACAGATATACTGATGATAAATATATTAGTGAAAAGTGCTAAGGAGAATAAGCCAAGGCAGGTCAATAGAGTGATGATGAGAGGACCTGAGGGTTTTGTTGGTGTTCAGAGAAGGCACAGACCTGCAGTGTGGAGCGAGTAAGGCATGTGGAAACGGGGCCATAGGTTGGGTAGAGAATTACGGGCAGCAGGAATGTAAGTACAAAGGCCCCAAGGAGGGGAATGGGTGGCTCACACACGTGCCACCCACACCTCTCCTTGGGGTCCCCGCATCAGCAAGGAGGCAGTGACACTGGAGCAGAGTAAGGGAGGGAGACCCTGGTGGCTGACATCAGAGTGAGGACTGGAGGCCATGTCAGGTAGGACCCTTGTAAGCCCTCTCACAAGTTTTCTGTTTTATTTTCAGTGAGATGGGAAACCATACAGGTGTTTTGAGCAAACAAGTGACAGGATTGGAGCTACGTCTTTAAAAAGAACTTTCCGACGGCTGAGTTAAGTAGACAAAAGTTGGCAATGGTGGAGGCAGGAGACCACTTATGCTATTAAAATAATCCAGATTCTTCAGTGATCTGCACACCCGACCTAGGACTGGCACCTGCAAACCCAGATCAAGAGTCCTGTGCTCCACCAGCCAGGCGCACCTCCACCAGCGACTACTAACTGCTTTACACAAATCTAAAGTCATATACAGATTTTAAGAAGTTTTTTTCCAAGTGGAGATGTTTTGACCTGGAAGTTTCATTGAAGAAAGGTGACTGTGATCTTGCTGCCCTA
GGCCAGAGTTTTCTGCACAGCCGTATTTCCTCTGACCCTCTAAGGAGGCATGGAAATCTGCCAGGGAACAAAGCCACACAGACAACCTCCTCACGTTAAACCCAACCCCCTGACAAGGGGTGGTGAAAGGCCAACCAGGCAGAGCAGCCTGAACAGCCGAGCAGCAGGCCCCTCCCCCAGAAGACAGACCGGAAGAACAGGAGCTGTTCAAGAAGCTGCTGCCCCATCAGTGCCTGGACTCCGTCTGGTCCAAGCGCAATAAGCCTGGCAATGAGCACCTGGCACCCACAGTCCGGGCCACTGTCGCCCAGTTCAACGGTGTGGCCAAGTGTGTCATCACCACCTGCCTTGGCAACCCAAGCATGACAGCCCGGGACAGGGCCATGGTGGTGGAGCACTGGATCAAGGTGGCCAAGGCCTGTCAAATCCTGCAGAACTACTACTCCCTGAATGCCATCGTCTCGGCTCTGCAGACTGTCTCAATATACCACCTCAAGAAGACATGGGAGAAAGTTTCCAGGAGCAACCATCTAATAAATCTGCCACCCTGGTGATGGCCCTCCGGAGAGCCTAGAAGAAGAGGCTGCAGAAGAAAGGTGTTGTCCCCTAACTTGGCACTTTCCTCACTGAACTGGTGATGCTGGATATTGCAATGGAGGACTATCTGGAGGTGGGTGAGCCTGAGGATTGTGGGGGAGGGACCAGAATCCGGAGGTTTGGGAGCAGAGCGCCCCTGTACTGAGCCCTGAGCTCTCAGGACTCGGCAAACCTCCCCTCATGACAGCCTCACGGCTACCCTGTGAGCCTGGGGGCTGTTGCCCATCTCAGGGATGAGCGAGGTGAGGCTGCAGTTAGGCCACGGCTCCCGGTGCCGAAGACTGGTGAAGCAGCAGAGCTTCCTGAAGGCAGGGCTGCATTAGGTCTGTCTGACTGGACCTCAGCCTCCCCCGGTGAGTTTGCCCGTGGAGGGAGAATGAAGTCAGGACCCTCCACGTCAGCAAGCACCTCAGTAGCCGCAGCAGCCCCTTCCTGCCTGAGGCTTCGGCCTCCCCCACTGTCTTCCGAGAGGGTGGTGCTGCAGGGTCCCGACCTGTAGCCAGTCCATCTGCCCCATGTCCTCCTTTCTCTGGACCCCAGAGCCTGGCCTACATCCCAGGCCCGCTATCTGTGTATGCACGGCCCCCTCATGGGTCCTGGCCATGGTGCAGCATGAGAAGGGATGGGAATCAAGTGCTCCTAAGAACCAGGGGCCTCATTCTGATGGACTTTGTCTGCTTTCCAGGGGAATGAGATCAACGACCACAAAAGAAATAAGAATGCAGTGCAAGACCCATCCCATTAGGAGATGGGGACAGACGCATGGCATCCAGGAGAACTTCCCGGAGGAGAGGCTACTGATATTCACCTCTGAGAA\n>XM_012612283.2 PREDICTED: Gossypium raimondii prefoldin subunit 5 (LOC105786035), transcript variant X1, mRNA 
\nAATAATAGGAACATAAACAAACCACACAATTTGAAAGAATTCAAAACCAAACAAACAAATAAATAAAATAACGAAACTAAACAAATAAAATAACAACCCAACATTGAGCAGGCATCCACTTTCCCTTTCCATGGGCAATCAGCAACACCATGGAATCCAAAACGGCAACCTATGTTCCTAGCCAACATCATACCGTTCATCTCCCCTGATCTCAACCGAAACCCCCCAAACATTGTCGAACACTCAAAGAATTTAGCAACCCATCACCACCTCAAAAGTAACCCACCGGTCTTCGTACCCCCACCCTAGATAGTAGTAGCCCTCAATACCCTTCCCCCCTTCAAACCCCATTAAAGTTTCTTGCGATGCCATCAGAGAACATCTCCACCATTTCTTCCCCCAACTGTCATTCGCGCCGATCGTTGTCCATCGCATCCCTCGCAAAGTCCAACACACACCCTTCCAGATAAGTGCTCCCACCTCTCATCAACCCCTCTGTTGATAGTATATGTGCAACTCTATTCGCATCCCTGGGAACATGTCTAAATGAGCATCTTGTGAAGCCTTCTATTTTTTTCTTTGCATCGTATATATAAGCCCCTATAACCGGCCCATCTTCATTGCAGGACCTCATCTTTTTTATCACTGACAAGGCGTCCCCTTCTACCATCACCTATTGAATCCCTAAATCTATCCCCAAACTTACTGCCTGAAGACATGCAAGGGCCTCTGCTGCAAAACTCGTAGGGAAGAAAATGTCGGTTCCTCTCACTGCTTCCCTTTATGTTCCTGGCACACTCGATGATGCCGACAAAGTTCTTGCCGATATCCGCACCGGATACTTCGTTGAGAAAACAATGGATGAAGGCAGAAATTATTGCGAGCGTAAGATCAACTTAGTGAAATCCAATTTCGATCTACTTAATGAGGTTCTTTCCAGCAACTCGAGCAACCGAATTAAGAAAAGATATTTTCAAAATATGACAAAAGGAGACTGAATATGACTTCTGGGAACGATACAAGAAGTTATGTGCAATCTGCCTACAACACGACCTAACTGAACAATCATTTCTTCAATACTTCTATGACGGGTTACTTTGTATGAAAATGAAGATAATTGATGTCACCAATAGAGGGGCACCTGTTGGCATGACTCCTCAAAGAATAAGGGAATTAAT\n>XR_008246896.1 PREDICTED: Vigna angularis uncharacterized LOC128195426 (LOC128195426), ncRNA \nTTCAGTGGAATGAAGGTTTCATTCATGCATGATGTTGTTTGTGGATGGTTTTGCTTATGTATGAAATGTCTCCCAAGTGCATTTTGTTGTGTTACTGATTTGTATACTTGTTGTTTGCTTAATCTTACATTGTTGTTGTAATTTTTTTCGATTGGTAGTCATGGACCGCGTTGGCCTTGCTGTGAAAAAAAACAAGCCACCTCAAAATGAGAGTGGTGAACCTAGTTGGCCTTGCTGTGAAAAAACTTGAACCCAATTACCCAGTTCATTCGGCTTTGGTACGAGTTATGTTGGTGAAGCCAGGGTCCTAGAAAATGTATTTTTATGTGACACGAATGTTAAGAAATTGTTCCCAGATTACTTAGAAGTAGCTGAAACGAGGGAAAACAAACAAGGCACCCCAAAATGAGAGTGGTGGACGTAGTTGGCCTTGGTGTGCAAAAATTGGAACCCAGGAAGAACTACAACAAGTTAGGGAGCAATATGTTTGTCAATGGATTTTGGATGTGGACAACGTGCGGAGGAATCAAGTGTTGGAAGATTTAGGCATTTTGTAGAATGTTGGAGATTATTGATGAAAGAAAACTTGTTACTTTTCATATTTATGTATTGGTTGGACATCAAATCTGATTTCAGAAATTGTTGAGAAATATATTTGGCAGTTGAAATTCA\n>XM_017185738.1 PREDICTED: Drosophila 
ficusphila calphotin (LOC108088083), mRNA \nCAACGAGTAGTCGGTCGCTGTGAAGAACTATTTTACTGTTCGATGTCTACTGACCATGAAAGGCTGACCATGAAAATTTGCGTTCACTAATCACCGGATAAGTGAAAAGCTCCGCAAAAGGGCAAACGAGTTTAACCGTGAGAGAGGCCTGAAACTAGAAGGACATGGAACCTGCAGCGGCACCAGCACCTGCTTCTGCCCCAGTGGCAACGCCTGTGGCCCATGCAGCAGCAGCTCCTCCTGTGCAAGTTGCTAGCCCCGTGGCAGTGGCTCCTGCAGCACCGTCGCCGGTCGTTGCAACACCAATTCCTGCTGCTCCCCCCACTGCGAGTGTTCAGACAGTTACTGCTCCTCCTGCTGCTGCTCCCCCTCCTGCTGCTCCGGTTGCTGCTGCTCCTGCCCCGGTTGCTGCCACTCCCGTTGCTGCTGCTCCAACCCCGGTTGCTGCCACTGCAGTTCCTGCTGCCCCCGCTCCGGTTGCTGCCACTCCTGTCGCTGCTCCTGCAGCTGCATCTCCTGCTGTTGCAACTCCCGTCGCTCCAGTGGCGCCACCTGTTGTTGCAGCTCCCGTCGCTCCAGTGGCCACTCCTATTGCAGCAACAGCAGCTCCTGCTGCAGTGGCGTCAGAGCCTCCGGCTCCTGTAACTCCTGTGATCGCTGCTCCTCCTGTTGCAGTTGCTCCTGTGATCGCAACACCACCTGCTGCGGTTGCTGCGATTCCGGTGGCAGTTGTTGAGACACCAGTCGCTGTTGCTCCTGTGATCGCAACACTACCCGTTCCTGAGACTCCAGTTGCTGTTGCTCCTGTTATCGCTGCATCACCGGTTCTAGTCGCTGAAACACCAGTTAGTGTTGCTCCCGTGATCGCTACACCACCAGTTGCTGCGACTCCAGTTGCTGTTGCTGCCGAACCTGTTGCTGTCGCAGAGACTCCAGTTCCTGCGACTCCTGTTGCTGTTGCTCCAGTCATAGCTGCATCACCAGTTGCAACCCCGGTGGCAGTTGTCGAAACACCGGTAGCTGTTGCTCCTGTAATCGCTGCGACGCCAGTTGATGTTGCTCCGGTCATCGCTGCGTCACCAGTTGTTGTTGCGGAAGCTACTGTGGCTCCTGCTGCTGCTCCTGAGATCGCAACCCCACCTGTTGCTGTTTCTGAAACTCCGGTTGCTGTTTCACAGTCTGAAGCGCCTCCTGTTGCTGCAACACCGACACCTGCACCAGAAGCCCCTGCCCCGATTGCACCAACTGTGGAATCTCCAGTTATTGCAGCCCCTGCAGCAGATATTGCTCCTGTCGCTGCTCCAGTTATCGTCGACACTCCTGTTGTCGTGGCCGCACCAACACCTGCAGCAGCAGAAGCGGCTGTCATTGCACCACCAGCTGTTGTGGAGATCGCAGTTGCTGCTCCTGTGGCTGTCACACCGGAAGTTGCTGTTCCTGAGACTCCTGCTATCGAAGCTGCCACTGTTGCACCAGAACCAGTTGCTGTTGCACCACCAGAAGCTGAACCAGCTCCCGCTGCACCAGCGGCTGTTGCAATTGAGAGTGCTCAGCCAGCTACAGTTCCAGAACCAGTTCCTCCAGAGCCAGCAGCTGCAACCGTTTCCGAGCCAGTTCCTCCAGAGCCAATTGCTACACCAGTTCCCGAACCAGTTCCTCCAGAGCCAGCTGCCACAACAGTGGAAGCTCCAGCTCCAGTTCCGGAAACTCCTATAGTCTCTGTGCCATCGGTTGAAACACCTGCAGCTATACCAGACACACCATCCCCTGCACCAATTCCACAAGTTTCAGCCGCAGTTCCAGAGCCGATACCCACACCAGAACCAATCGTTGTCACTCCTGTGGATCCTTTACCAGTGGAGACTCCAGCTGCGAGCCAGGACCCACCAATTGCCAAAGAGGAACCACCAGCAGAAGCACCAGTTTCTGTGGCAGCAGAGATCCCACCAGATCCAC
CAGTTGTTAATGAAGAACCAACAGTTGCTCCTGTGACAGCAGAAGTTCCGCCGGAAACTGTTACAGAGGTTTCCGCTCCGGCCGAGGATGCTGTTCCGATCGCAGCTCCTACAACGACATTGGAAGCAGATACTACTACAATCGCAGAAGCTTCACCTGCGTCTGAACTTGCAACACCTGAAGTTGAAGCCGTTGCTGCGGCCGTCGCCGATCCCGTCGCACCTGCACCAATTCCGGAACCAGCCGCGCCGATCCCCGAACCAACGGTTCCTGAACCAACCGTTGCAGCTGCTGAACCAGAACCAGAAAAAGCGGAAGTCAGTGAGCAAACTGTTCCAGCAGCGGAAGAGATTACTGTATCTGAAGTAACAGAGACGGCTACAAAACCTGTAGAGGATATAGTTCAAGAGAGTACCAATGTAATTGACGAAGCAACTCCAACCACAACTGAGTCCGCAGTTATAGTTTCTGGAGAAGTATTGGAAAAACCTCCAGCAGAAGAAGTGGTTGCAGTAGAGTCTGGTCCTGAGGTTGTGGCCTCAGTAGTAGAAACTATTGAAGCTCCAGCTGCAGTAGAAACCACCGAAACTTCGCCAGAACCAGTGATTTCAGAAACACCTGTTGTTGCAGCTGAAGAGCCAACTGCAGAATCAGTAGAAACTATAACCAGTGGTGCGGCAGGTACTTCTGAAGAAAAACCAACAGAAGAGGTTCCCGCAGATCCTAGTTCCGTTCCCGTGGCAAAGATAACGCCCCTGCTGAGGGACCTTCAGACCACCGATGTTTCGCTGTTGGCCATCGCGGCCACTTTGGATGCAATTGGAGAAAAACTTAAGGACCAAAAGGCCAGAAACCAGCAGGTGATGGACAGACTCTGCGAGATCGAGAAAATTCTTGGACCACCTAAATCAAATTAGCTTAAGCTGAAGGAATAATTCATGGTAATGTTAAACTAAAATATCAGTCGAAAATATAAAAATTAACATTGAAATAAACTTATCAGTTTAAATTTCA\n>XM_043518673.1 PREDICTED: Dermochelys coriacea RNA-binding protein 14-like (LOC119858569), transcript variant X5, mRNA 
\nGCTAGGGCGGGTCTCGCGGATTGTGACGGATGCAAAACAAAGGTTACAGGCGGTTGGGGCTCAAGTGCGCCCGCGCAACGACGTTGCTAGGAGAAGAGCGGAGGCGCGGATACAGAGGCAGGAGTGCGCAAGACAACAGTAGCACGCAGGCGCGGCATTAGCCGAGGGTCTCTCTTCGCAGGCGCAGTTGCTCGTAGGCGGTGGCAGGTAGCGCGCTGCGCAGGCGTGTCGACGGCTGGGTGGTTCCTTCCTCTTTCCTTCCTATCTGAGCGTTCGGAGGGTGTGAGGTGCTGCCGCCATTTTGTCAGGAGTCCCGGTGCCAGCTCGGCCGCGGCCATGCGTCCTGGAGTGAAGCTGTTCGTGGGGAACGTGCCCGAGGAGGCCACGGCCGAGGAGCTGGGCGAACTGTTCACGGGCGCGGTAGGCCCGGTGCTCGGCGTGGCCCTCATGAAGCAGTTCGCCTTCGTGCACCTGCGGGATGAGGCGGCCGCTGTCCGCGCCATCTCCCAGCTCAACGGGCACCAGCTGCATGGCCGCCGCATCGTGGTGGAGCCGTCCCGCCCGCGGCCCACCAACACCTGCAAGATCTTCGTGGGTAACGTTTCGGCGGCCTGCACCAGTGGAGAGCTGCGTGCGCTCTTCCAGCAGTACGGGCCCGTGGTGGAGTGCGACGTGGTGAAAGGAGACACAATCATGGAACAGGGGTTGGTACTCCTTTCCATTGCACCTGCAGAGCTGTTTCAGGTGATATGGACCTGCCACCAGATGCAACATGGGTGGTTGATAACAGTCCAATATGGTGTAATCTGCACAGCCAACTCAAGTGTGTTGAGATGTTTGCTGACTTCTTGAGAGACTTTGAGATTTATTCTTCAACTTTTTTTAGCTGCCTAGATCTGAGCAAGTCATTGTGATTCGTATTGCACTACTCTATTTGGACTAGGGATGTGGGAAATTCTTCATCAGTTGGAGTCTCTATGTTGAAATT\n>AY571475.1 Uncultured bacterium clone RsaHf359 16S ribosomal RNA gene, partial sequence \nACCTTACCTGGGTTTGACATGGTAGTGAATGGTGCAGAGATGTATCAGTCCCGCAAGGGACGCTATCACAGGTGCTGCATGGCTGTCGTCAGCTCGTGCCGTGAGGTGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTACTGCCAGTTACTAACAGGTAACGCTGAGGACTCTGGCGGAACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTATGTCCAGGGCTACACACGTGCTACAATGGACGGTACAACGTGACGCGAAACCGTGAGGTCATAGCGAAGCACAAAAAGCCGTCCGTAGTTCGGATTGAAGTCTGAAACCCGACTTCATGAAGTTGGAATCGCTAGTAATCGCGCATCAGCATGGCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATCCGAGTTGGAGGTACCCAAAGCCGGTAGCGTAACCGCAAGGAGCGCGCTGTCTAAGGTAAATTTAGTGAGGAGGGTGAAGTCGTAACAAGGTAACCGTA\n>XM_017212262.2 PREDICTED: Drosophila eugracilis peripheral-type benzodiazepine receptor-associated protein 1 (LOC108105593), transcript variant X5, mRNA 
\nATGGGGTTAACAGAGAGAACGGGGCTCTGTTAGTGGTTAACAGGGTAAAGTAATAGTAAATCGTAACTAACAGCCCCAGAGCATGAACTTACCCACTTGCAACCCCAAAGGAGCCCGTGAGCGGGAGAAAATTACCCGTTTTTCAGTGTCATTTCACAGAAAAATCGATTCCCCGCACACTGGGTACTGGGCATTGGGTTCTGGGTTCTCTGGGCCACTCTGCTCTGGCACACTGAGCACCGAGCTCTGGCAGTTGGGTAGAAATCAGAGTACAAACCAGCAGCGCGACCGAGATGACCCACTTTTCGGTTTTCGCACTGAGACCCAACTGCTACCCACAGAAAGTGGACAACTAGGCGGAGTTTTTTTCTATATAAGTAGCAGTTTAAACGATCGCGTTTTTCGGATAATTATGTACAGCCTACGTAGCCTAGTGTAAACTCTATGCATTTATGTGAATTTCCCAGCGCAAACGTGGAAGACGAAAACAGGCGACCTGAAAAAGCAGCAGCAGCAGCAGCAGCAGCGAGCAAGAAGCAGAAGCACAAGCAGCAAAAAAGTCGTCCGAGGGGCAGCCACAGCATGCCGTACGAGTCGATGCACCATCATCAGTCGGCGGCCGCTGCCGTGGCCGCTGGCACAGCCCCCAACGGAATGCTGGACGCCCTCAGTCTGCAGCTGCGCGATGCGGAAATGCGGCGCACAGAGATCGAGCGGGCGCATCAGGAAACCCTGGCACAAATACGAAATCTAAGCGGAAGCGCACGTCCCGATGCCGAGGCGGTTGAGAATCTGCAGTCGAGAGCCCGGGAACTGGAAAAGAAGGTTGCGCTGGAAAATGTGCGCTGCGAGGAGCTGCAAATCGAACTGACCTCGGCTCTGAAGGCCAAACAGGCGTCCCGCTCGGTCTGCTCTGGAATGGTCGGCGTGTCCTCCGGAGGCGGAGCCACCATTCCTACATCAGCCAGCAGCTCCACCGTCACTTGGGCACCGACAATCAGTCACCAGGACCAAGGCTCCGAGATTGATATCATAATGGCAAAGATTGAGCAGGATAATCGCGTGCTGGCCGAGCTGGAGCAGCCTCGCACCTCGGCCAGCGCCAGCATGTCAGCATTGCCGCCCAGTTCCATGTTGAGCACGGTAAATAGCGAATTTAGAACCATATCAAAGAGTGAACTCGAAGAAGAACTGAACCGTTATAAAAGGGCCGTTCTTGGCGGAAGTGGCGGAGGTGGTGGCGTTTCAGCTCTCTCCTCCGGCTATTCAAGCCTGCCGCAGTCGTTGGCCTCTACGCTGCCCAATGGCGGGGCAAGCACCAGCCTAAGCGGTACCAGCCTTGGCTCGCACAGCGTGGCCGCTGCTGCTGCCGTTGCCTCTGCTGGATCGGGGGGTGTGACTGGGGGTGGTGGAACGGGAGGTTTATCATCCATATCGGCCCTGGTGCCCAACTCAATCAGCGGCATATCCTCGAGTCTAAGCAGCCATGCCATACAATCGATGCAGTACGGAACCGGACAAACGTCCGTGGAGAAGCTGCTGAGCGGAACTAGTGGAATCACTGGGATTCCACCTCTGCCGGTAAATATTCACACGATGAAGGCTATGCCAACGGCATTAAGTCAGCGCGGAACAATACAGCTGTACAATTTGCAGAGCACAACCATGCCCCTCCTGTCACTCAACTCGCATAACCTGCCGCCCGCCGGCTCGACCAGCTACTCGGCCCTGGGCGCCGGCGGCGGCACCTCGCTGACGCATCCAACCAATCTGGCCAATCTTGGCCTGCTGGACACTGGCGCCCTCTTGGGTGCCACCGGTCTGAGCGGTTTGGGCGTGGGACCCGGTGCCGGTGGCATTACCGGTGCCACATCACTATACGGTTTGAGCGGCGGCGGAGGTGCCAGTGGTCTGGGCAGCTCCTATGGTCCGCCCTTCCTGGACGTCGCCTCGAGCGCCTCGTATCCATTCACTGCGGCAGCCCTGAGACAGGCTTCC
AAAATGAAGATGCTAGACGAGATCGATATACCGTTGACGCGGTATAACCGCAGCTCGCCCTGCTCACCCATACCGCCCAGCAATTGGGGACTGGACGAGTTCACCGACGGCCTCAGTGTCTCCATGATGCACAACCGCGGCGGCCTGGCACTGGGTGCCCTTGACTTGGACACTCGCAATCATGGGTTAAATGGAGCCAGTGAACCGCAGGTGGATATGCTGGATATTCCTGGAAAGGGGCGCTGCTGTGTGTTCATAGCCCGTTTTCCATATGATCCGCCAGATGTTCATAATGAATTCCTTTCCATGCCTTGCAGGGAGGCTGAGGGCGAGCTCTCCCTGTGCGCCGGCGACTATCTGCTGGTGTGGACCAGCGGGGAGCCACAAGGTGGCTACCTGGATGCCGAACTACTGGACGGACGACGCGGCCTTGTTCCGGCCTCTTTTGTGCAGCGTTTAGTAGGCGACGACCTCCTGGAGTTCCATCAGGCGGTGCTGTCGACGCTGCGCGATGCCGAGGACGGATCGATGCAGTGCGACACCACATCGCTACCCTCCTTGCCGCCGCACAACCCATTGCTCACACACACCCACGAGGACCTGGCACGTTTGAGTGAGACGCACACCGATCTGGAGCACGACCAGGACGACATTAGCGACAATGTTCCAGCACCCAAGCACTTGACGCTGGAACGGCAGCTGAACAAGAGCGTGCTCATTGGCTGGTCACCGCCGGAGCCAGTGGGCTACAACCTCATCGACAGCTACCACGTCTACGTGGACGGCGTGCTCAAGGTCACCGTGAAGGCCAACGAACGCACACGAGCGCTTATCGAGGGCGTTGACTCCACGCGGCCGCATCGCATCAGCGTGCGGAGCGTGACTCAAAACCGACAGACCTCGAGGGATGCCGCCTGCACGATGATCATTGGGCGGGATACCGCCCACCTGGGCCCCTCGGCGGTGCGCGCTTCGCACATAACGTGTTCCTCGGCGGTCATCTCATGGCTGCCGGCCAACTCCAATCACCAGCATGTGGTGTGTGTGAACAATGTGGAGGTGCGCACCGTCAAGCCGGGCATGTACAGGCACACGATCACGGGCTTGGCGCCGAGCACCCAATACCGGGTGACCGTGCGTGCCAAGCACCTGCGGGCCGTGGGCCAACATGCCGCGAACGTGGGCCAAACAGGTGTAGCCGGCAGACCTGGTCAGGAAGAGGCGCCCGGAGCGTACGCTGACTTCCGTACCCTGACCAAGGGACTGCCCGATCCGCCACAGGAGATTCAACTAGAGGCCGGCCCGCAGGATGGTACCATTCTGGTGACATGGCAGCCGGTTAACAGGCCCACCTCGACGGGGCCTGTAACCGGCTATGCTGTGTATGCCGATGGTAAAAAGGTCACCGATATCAACTCGCCCACCGGTGACCATGCCCTCATCGACATTGGCAAACTGGGTGTCTTTAATCCACGCGCCGTCACCATTCGCACCAAATCCCGCGACTCCCAGTCGGCAGACAGTGCGCCCATCTTGATACCAAATACCGTGCGAAATGCCGTGGCCCGAAGGGTGCCTAACCAAATGGGCATGGGTCCACAGTTGCCGCAGGGACCGCATGGGATGCAGGTGCAGCAGCAGATGGGTGGAATGCCTGGACTGCCGGGTCAACAAGGTCAGAATATGATGGGTCAGCAGGATCATGGCCAGTACGATCCCAATCAGATGCAGCAGCAGCAGCAGGGCATGCAACCGCAGCCGGGTCAGCCGGGTCATCAGGGCTATCAACCAGGGGCACCAGGAGCGCAGCGGGGCATGGTCCCGATTCCGGGCAGGGCGCAGGGACCACAGCAACAGCAGCAGCAACAGCCCTACGGACCCCAGGGTTCCATGGGTGGGCCACGCTTTCGAGGACCAGTTCCGGGCCAGCTTAATATGCAGGGCCAGCAAATGCAGGGTCAAATGCAGGGTCAGATGCAAGGTCAGATGGCGGGTCAAAT
GCCTGGACAGATGCCTGGACAGATGTCTGGTCAAATGCCTGGTCAAATGCCTGGACAGATGCCCGGACAAATGCCCGGACAAATGCCCGGACAAATGCCCGGACAAATGCCTGGCCAGATGATGGGACCACGAGGACCGCTCAATCAGCAGCAGCAACAACAGCAGCAGCAGCAGATGCAGCAGGGCCAACAGATGATGCCAGGCCAACAGCCTGGACAACAGCAGACACAACCCGGACAGCCGGGTCAGGCCGGCCAAATGCCCGGGGCCCAGAAGAAACCCCGCTATTTCGTGGCCATGTTTGACTATGACCCATCCACGATGAGTCCCAATCCCGATGGCTGCGACGAAGAGCTGCCCTTCCAGGAGGGCGATACGATCAAGGTATTTGGTGATAAGGATGCCGATGGCTTCTACTGGGGCGAACTGCGTGGTCGCAGGGGATATGTACCGCACAACATGGTCTCGGAGGTGGAGGACACTACTGCCTCTTTGACAGCCGGCGGACAGATGCCCGGCCAGATGGGCCAGGGTCAGGGTGTCGGCGTGGGTGGTACTGCCCAGGTGATGCCCGGCCAGGGAGCTCCGCAGCAGAGCATGCGCAACGTAAGCCGCGACCGCTGGGGCGACATCTATGCCAATATGCCGGTGAAGCGGATGATCGCGCTCTACGACTACGATCCCCAGGAGTTGAGTCCCAATGTGGATGCCGAGCAAGTGGAATTGTGTTTCAAGACGGGCGAAATCATACTCGTTTACGGTGATATGGATGAAGACGGTTTCTACATGGGCGAACTGGACGGCGTGCGCGGCCTGGTGCCGTCGAACTTCCTGGCCGATGCGCCCGATCAGTACAACAACCAGATGGGTCCGGGCGGTGTGGCCGGCAGAGGTGGTCTCAGCCAGCGGGGCAGGGGTCAGGGGCCAGGAGCGAGGGGTCCACCGCCCCCGCCACGTGACAACATGATGCCCGGAATGGGCGGTCGCGGCCAACCGGGCAAAAATGCTCGCCCTGCTTCCCCTACACTGTTAGACAACACGGGCCATCCTGCCCCCGATCACCAAACGCAGGGGATGATCGGTCGCGTTGGTAATGTCGGCCTGCAGCAGCAGCAGCAGCAACAGCAGCAGCAGCAGCAACTCCAACAGCAGCAGCAGCCGTATGGTCAGCAACAGACGCAGATGGGACAGCAGCAGCAGCAACAACAGCAAATGGGACAACCTGGAATGATGGGTCAGCAGATGGGTCAGCCGATGGGTCAGCAGATGGGCCAGCAGATGGGACAGATGGGTCAAATGGGTCAGATGGGTCAACAGCAGCAACAGCAGCAACCGCCGGTAACGACACAGGCGCAAACGGGTGGCCTCTTCTCCGGTGCGACTAGCCTGCTCTCTGGTGCTACCTCGGCTGCCACCGGTGGTCTATTTGGGTCGAAGCAACCGCCCAAGACGGATCCAATGCAACCACAAGGTGGTGTGCAGCCAGCGCAGCAACAAGCAAATGCCTTCGGTGCCCAGCAGCCCGGCATGGGTATGCAGCAGGGGGGAATGCAGCAGGGGATGCAGCAGGGGATGCAGCAGGGTATGCAACAGGGGATGCAACAGGGGATGCAACAACCGGGCATGCAACCCGGTATGCAACAGGGTATGCAACCCGGTATGCAACAGCAGCAGCCACAGCAACAACAAGTGCCACCGCAAGCCCAGGCTCCGCCACAAGGACCGGGCGCCGGTCTGCTGGGCGGCCTTAAGGGTATCGCGGCAGCGGCGCCCGGCGGCGATGTCCTATCGAAAGGCAAAGACCTCTTCGGAAAATTCGGGTTCGGCTTTGGCAAATAACCCCGGTCATTCTATAGGGTCCTGTTATATTATTCGTAGATTAGACTTATTATTACTATTATGATTATGATTATTGCTATTGATTACGGATTACTAAGCTAATATATAAAGAAAAAAAAAAACACAGACGATGATGATTAGATCGAGGAGGACAGACAAA
CCAATGCTAAAGTTAAAAGAAAAACCCATACTTTTAGGCCCAGGCTGTGGGCCAATGTGTGTATGTTGTTGTTGTTGTTGTTGATATGAATATGATATGATATGACTAATAGTACTAATGGTAATATTTTTTATTAATTAAATTGATAGAAATATTATGAGTGACCGACAGACAACAGCAGCATCGGCCTAACAGCTGGGCCAAAAAAAACCAAAAACAACAAAAAGCCACAAGCCCAGATAAATTGTTGTAAAATTATTTAACAAATTGCCTGCCGGTTTAGGTGACTGCAACTCGATAAAAGATTCCACTAACCCATTTAAAGGATAAAGCTCTATATAATGCATAAACCAACACACACACACACACTGAGACACATACAGATGCAATACACACTCACATAGATACTGAGAACACAGATATATTATACAAAAAAAAAAAAGAAAAACCAATACAAATACAAAAGTAAGGGAGGAGAAATATATTATATACATACATTATATTTACAATTATTTGTTAACGCACATTGTTAAATTTGCTACTGTTGCTGACCAGTTTATAAATAAAAACCAAACCGGATGGTAAGGAGGAGAAGAGAAAAGGAGTATAGAGGAGAGAAGATAAAGCAAACACATAAGGTAAACTAAAACCAAAAAAAAACATAAACATAAACATACATATATTATATGTATATATTTCAAATATATTGAAAACTAAATTGAGATACACTATAAAACTTACATTTATAAATCAAAAAACAAAAACAAAAACACAACCGAATGTTGAGCAATGTCAGGCAGGCGAAATGATGAGGCCGAACCAAAAAACAAAAAACCAAAAAAAAAAAACAAAAATATAAATAATGAAGAAGAAGACGATACATACATTAAAGTAAAATAAATAAATCGATATGGTACATATTTACATATATTCGCATATACTAAATACGATTTCGCATTCAAAAGCCAACCTCCAATCGGGCGCATTTCCAAGACAAGGCGACCTTGACTTCCAGTCCAGCACAAGAAGCTAACTTTAATCCCTTGAACATCCCCACCCCCCATGCCTTCTTTTCAATCCAGTGATAGCCGAAGCCAAAATTTCTATCTCTTAATTCCTAGTAAAAACTTTCCCCCCTTTTCTCACGACTGCTCGACTCAAAAACTTCTCTTTATTCTATGCAACCGAAAGAAATTTTGTTCAGTGTTTGATGTCCATAGAAGCCATATGCGATAAAATATCAGTGTAACTTAAAGCAAACCAAAGACCAAGAGAGAGATCTACTCCTACATACATATATATATATATATATATATATATATATATGGGATACCCAACAAAATGGCAAATACAAAGCAAATATAATGTACTAAGCACAAGATCGTAGCATTAGACCCTGGAGACATGTTCACTAAATTCAGCAAAAAGGAGACTTTTCCACAACCTTCTTTAGCCACTTAAGCCGCCGCCCCTATTGCTTTTCTTACCAACTTTCTATCGCTATCTAACCCTAACTTTTACCTAACCAAAAGTACACATACCTTTTCGATTGTTATTTTAAATACTACCAATTAACAGATAGTTAGTTACTCGCCTATGCCGCATACTTACGACTACTTCTGTTCTCCTCTCGTGGAAACTTTATGCTTTATTATCCGATACGATCCGATCCGAGAGAGAGAATGAAAATTTGCAGATAGTCAAGGTGTTTCCTAATGTTTGAAAATTGCTTTGACTCAGCCCTCATGATACACACTCAGCATAACACAGACAAATACATTGCGTACCTCTTGCTTTACGAAAATACAAAATACATTCAAGAAATGGAAAGTATAAAGATAACAAAAACCAAAAAAAAACAATTATATTAATGACAAAATTTACCAAACAAATATATTAAACAAGGCATATTTAAAGAGCGCATAGAGAGTTGCATATGTACATGTGCTTGGCCGGCAAACAAGACAACATAATTGTGAGCAAATGATTACTTTAGACAC
ACACACTTACCACAACTGATACATAGTTACACTGCAAAATGCAAATTGCAAATTGCAAACTGCAATACCGAACACTGTAAATTGTAAACTGGCAAAAACAAAAAACATATAGTAGAGAAGGGCTGTTATAGCCAGAAAATGTTGATCGAGAATGACTTACCGAAATCGAAACAAGCGTTAACTTTTCCCACGTAAACGATTTAAATCTAACAATCAAATCAAGTCACTGTATTATTCAGCCACATCGGATAGACAATTACAATCTACAAGCCTAACTTCGGCAACCACCGAAGCCGTGATGCCTACGTAAACCGGAAGATATATCATATTCGAATTTACAAGGGCACAGCGGAAATACACACACAAATACAAATACAAACAGCAGACAAACACACTTACACACACACTCTCTCTATAATCATTTACTAGACACCTACCTATACAAGTATACAAGAACAGTTTATTTCCTCGGAAACAAAGCGAACAATATAGAATAAATGAAATTAAATTCCCATTAAACACACACACTGGCAAAAAAAAAAATGATAATGGCAAAAAAACGAGTACTATGCAATATGAAATGGATAAAACAAAAACCAAAAAAACAAAAAAAATACAAATGAAAACCAACTAAATTGTTATACTGTATTATTATACTTTTTCTATAAATTATAATTTCCTTATTGAACGACAAAAAAGCGAAAAAAATAATAATTAAACAACAATTTCAAAGAAAAAAAAATCAAAAACGCAGCATTTCAATTGCCTTAATGAGGCGTTTCTTCAATTTCAGTGATATTACTCATACGACACGTA\n>XR_003431942.1 PREDICTED: Lagenorhynchus obliquidens AVL9 cell migration associated (AVL9), transcript variant X2, misc_RNA \nCGGAAGCGGATGAGGGAAGCTCGGCTGCGGCCCGGGGGGGGCGGTGCAGAGCTGCAGGAGCCTCGGCCTCCTCCTCGGTCCCTGCGAGGCTCTCATGCGACGCCCTCGCTGACACCTGAAATCCACTGCTCGCCTCCTCCTGGGGGTCACGGGGTTGCTCGGCTTGCCGCCCTCGGCGGTTGCAGTCATCGTCTTGCGGGCCTGCGGCGGTCGCCCATGGAGAAAAACGGGCGCGGCGGCGATAGCGCCCCCCGTGGGCCCGTATTGCACATCGCGGTGGTCGGCTTTCATCACAAGAAGGGCTGCCAGGTTGAATTCTCTTACCCGCCCCTGATTCCAGGAGATGGACATGACAGTCACACTTTACCTGAAGAATGGAAGTATTTGCCCTTCCTTGCCTTACCAGATGGCGCACACAACTACCAAGAAGATACTGTGTTTTTTCACTTGCCACCCAGAAATGGAAATGGAGCCACTGTATATGGTATCTCTTGCTATCGACAAATTGAAGCCAAGGCATTGAAGGTACGGCAAGCAGATATCACCAGAGAGACCGTTCAGAAAAGTGTCTGTGTTCTAAGCAAGCTGCCTCTCTATGGCTTACTTCAAGCAAAACTTCAACTCATTACGCATGCATATTTTGAAGAGAAGGATTTTTCCCAAATTTCCATTCTAAAGGAGCTCTATGAACATATGAATAGTTCCCTGGGAGGAACTTCATTAGAAGGATCCCAGGTATATCTTGGTTTATCTCCTCGAGATCTTGTGCTTCATTTTCGACACAAGGTCCTAATCCTGTTTAAACTAATTCTTCTTGAAAAGAAGGTTCTCTTTTATATTTCTCCAGTGAATAAATTGGTGGGTGCCCTGATGACAGTGTTATCCCTTTTTCCAGGCATGATTGAACATGGTCTCAGTGATAGTTCTCAATATAGACCCCGAAAGAGTATGTCTGAAGATGTTGGGCTTCAAGAAAGTAATCCCACTGAAGATGAGTTTGTTTCTATGCCTGCTCCTGACATTTCAAATACCAACTTGGAAACTGTTGAGAAAAT
CATGATGAGAAACCATGGAAGAGATGCTGCCATGAAGACTGAAGAGCCTTTTTTCCAGGTAGATGATGACAGCAGTGAAGGACAGGAACCCAATGACAGCAATCAATATTTGAAACCTCCTTCTCGCCCATCTCCAGAGTCTTCAGAAAGTGACTGGGAGACCTTGGATCCTAGTGTCTTAGAGGACTCCTCCTTGAAAGAAAGAGAACAGGTGGGATCAGAACAGACAAACTCATTTCTAAAGGACTCTTTGCCCTCAGACAGTCCTCCGATTACTGTACAACCTCAAGCTAACACAGGCCAGGTAGTCCTGATACCAGGGATAATTTCTGGTTTGGAAGAGGACCAGTATGGCATGCCCCTGGCCATCTTCACAAAGGGATATCTGTGTTTGCCTTATATGGCATTGCAGCAGCACCATCTTCTCTCTGATGTCACCATTCGAGGATTTGTTGCTGGAGCTACTAACATCCTTTTTCGACAACAGAAACACCTCAGTGATGCCATTGTGGAAGTAGAAGAAGCTCTGATCCAGATCCATGATCCAGAACTCAGGAAGCTGCTTAACCCAACCACTGCAGACCTAAGGTTCGCAGATTACCTAGTGAGGCATGTGACCGAGAACCGAGATGATGTCTTCCTGGATGGCACGGGCTGGGAGGGAGGTGACGAATGGATTCGAGCCCAGTTTGCAGTCTACATCCATGCACTGCTGGCCGCCACGCTGCAGTTAGATAATGAAAAGATCTTATCAGACTATGGGACGACCTTTGTTACAGCATGGAAGAACACTCACAACTACAGGGTCTGGAACAGCAACAAGCATCCAGCACTTGCAGAAATAAATCCAAACCATCCTTTCCAAGGCCAGTATTCAGTGTCAGACATGAAGTTAAGATTCTCACATTCTGTTCAAAACAGTGAACGTGGCAAAAAACTTGGAAACGTCATGGTCACAACGAGTCGGAATGTTGTGCAAACAGGAAAAGCTGTTGGCCAGTCAGTTGGAGGAGCTTTTTCCAGTGCAAAGACAGCCATGTCTTCATGGCTTTCTACTTTCACCAGTTCCACTCCACAGAGTCTCACTGAGCTGCCTGACGGGAAACCCTGAGCGGAGCAAGCCACCCAGAAGCTGCTGTCGCTTTCTTAGGTTTAAGCATCCCCTGTCTGTCTGCTGCTCCCAGACTGTTCCTCTTCATCGACCACAGGTCCACAGCAGGGACCAATAGGTCGAACTGTTTACAGGGACGGTTGCCCTCTGTGTAAATGAATGTCACGGGATGCTGAAAAGACGAAACCACAAGCGTAGCAGGGACGGCTTCCCAGTGGACTTGGCCTGTTTTTCTAGAAGTACCCTTCATGTTGTCAGTGTGGTTTCTGGCCTGCTTCACAGTTGGAGAGAAGGGCCAGCTTCGTTTATTAGGAAACCAGCGGAACTAAAGGACTCATTGCTCGTTTTTTTTTTTTTACTCTCTCATTTTGAAAATACTTGTGGTGCTTCAGTTTGTGAGGTGGTGACCCTCGCAGCAAGAATGTTTAGTGCCTGGGGCTGCACAAAGTACCACCAAACGGAGTTTGGTCGTGCAGTAACATCTTGTCACATGCTCACGGACAGAAATCCCCAGGGGACTAGGATATTGCCCCAAGCAACCCATTTTTCCATCCGTACTGGTGAGCTTCAGAATAACCTTGACATTTCCACTGAGGACTCCTAGCACATTTTCACATATGTATTTCCATGTACCATGGTTTCCTTATAGCTGTTTTGCAAAACAGCTTCACAGAAGAAGGAGACAAATTTCTTTGTTCCCAGGAATGTGCGCTGCCTTGAGTACAGGGTTAAATTTAAGGTACCAGTGTTCTTACAACGTGGACTGTTGCTGCCTGGAGCTGACAAGGTGACTCGGGCAGTAGAGCTCGACACCGCCAACATCTCCCTTTTCCGAGGACCTGTTCCAGCTGCACTTCAGGCTCTGCCGTGGTGAGGGGATGGTCCCCCA
TTGTCTCCCAGGTCAGAGCTGCCTTCTCTTCATTCTGATAGAATGGGAGTTGCAATGATCAAACCTGGCAACATCTGGAAAGAGCAGGATTATAGAGGCAGTTTCTTCCAAGGAACCACACTTTGTGAAGGGCTCATCTCCTCCTGTGGTAATCACAGGCTTAGGGAACCGCTCTGCAGCAGGACTGATCTGTCCAAGTTCACAATCGACAAATCCCCAGCGGAGCTTCCAGTCGCGTGACCGACAGCCAACTCCAGTCGAGGCAGCTAAGGTCTAGTCATCCAGCGCAGGTCCTGTGCAAAACTTTGCCTCAGCATGAGTTTTTGAAGACAGAGGAGGGAACCCAATTTTTTTTTACTTTGAAGGGCTGATGTTCTCCAAGTCTAGCAATCACATAAATGTCCGGTGTGTCCGGAACTGTCCTGGGCAGCCACAAGCCCTAAGGACTTTTAGCACCGAAGCAGAGACTCACACTGGCCTCCAGAGATCCAAGATGTGCACATCTTTGGCTACTTGCCCTGGGAAGTCACTTTCAGAACTAACCCATGTCCCTCACACTGCATTTTAAACCCTACCTTCTTCCCATCAAGTATTTGAGTGCCTACTGTGTACACACACAGTACATGCCACCCACATAGCAGGGGGAGAATGGATGGTTACCATAGTGGGTAAAGAGGCTGGGTCAAAGGTCAGCCCAGTGTGTTTGAGCAGGTGGCCAGCTCCTTTTTGGCAGGGGTGAGTAGATGTTTCTTCCCCTGAAGGCTAAGTGATAGTTTTAGGAGTGAGGTGGGTTTAGATACAAAGGGCTCCAGGACCTAGGAGAACAACATAGGCAAAGACTGGGAAGCAGTGAATGTTCTTTGGTGTGACTGGAACCTAAATGGCAAGGGGGGATGGGCAAGAGATGAGGCTGTAAGATAAGGCCAGGTTTGGAAAAAGAGATACCTGTCAGCCTGGCAGAGGGGGGGTGGACTTGATCTAAAAGGGCAGGGGAGAACCTTAAAGGGCTCTCCAAGGGCAAGTGGCAGGTTGGGTGCTGCATTTGAGAAAGTTCATTCTGGGTTGGGCACCACTGCATTTGCATGGCCATTAGCTCTAGTGATGTCTCTCTGAACTCAGCCATCACCGCCTTCCTTTTCCTCAAGGGCCCAATCTCTTAGCTTTGTACCAACTTTAAATCCCATTTGCCCCAAACAATGGGCCCCAGAACAAAACTCCTATGGACCCAGCCCTCAGTCAAAAACCAGTCACCCTGATGTCACCCTAAGAACTGTTTTCCTTTGATTTCTCCAGCCGTTAGACTAGCGGGGGTGGGGGGGTGGGGGCTTGTGAACGAGGAGCGGCTCTAAAGTGATTGTGGGCGGTGCCGGGAGAGCCCGGAGGACACTTAAGCATCTGCTGAGGTTACTCTTTTTGGCAAAGGGGAGACCCAAGAGACCCGTGCCGCCACCACCATGTTGATAAACCTGGGCGAAACTCACTGTTTCTTCCTAAAGTTTACAAGCAGGAAGGGAATGCTTCGTATGTTCTAAAAGTCCATCTGCAGTTAACATCCGGACTTTCATTTATATTCGATCTAATCCATGGAATTTTTATTCTGATCAGCGTTACCAGATGAGCCATGTGCACTGAGGAATGATTAGCCCAAAGTAGGACAGAAGAGAATCTGAAAAGTAGCCTTTCCACCTGCCCCCTGGCTCTGCCCTAGAAAACAGTCAGTCAGCAGCACTTCCTAGAAACCACGGAGACAGAAGTTACGCTGCACCGTCTTCAGCTGCAGGAATCCTGAATTGGTTCTTTGTACAAGATCATCCATGAAACGCCAAAGCCTCAGTGCCCTCGATAGATCATTCACTCCCACTAAATGCCTTAGAAATGGAAATTCCAGAGGAACTTGACCACCTGCTATATAGATGTCATTATCGGGAGTTACAACGGTTCCAACCTTATGTAAATCAGCTGGTGGGCTGCATAGCTTGTAAACTTTTTCTGCTTGGGGG
CTGTAACAGACAGAAGA\n>AB179100.1 Macaca fascicularis testis cDNA clone: QtsA-12801, similar to human tetratricopeptide repeat domain 3 (TTC3), mRNA, RefSeq: NM_003316.2 \nCAGATGTAAAGTCTACACCAGTGTCAGATTCATCTTCAGCACCAGCTTCTGAAGATGTGAAACCCAAACCTGTGTCTGCAAATTCTCCTGAGCCAGCGTGTGAAGATGTGAGGGCCAAACCAGTAGCCGACAATTCTTCTAGACAAGTTTCTGAGGAAGGGAAACCCAAAGGGGCCTCTTCCAATTCTCCCACACCAGGCTCTGAGGATGCAAATTACAAGCGATTCTCCTCTAATTCCCCCAGACCGGTTCTTGAGGATGTGAAACCAACTTACTGGGCTCAATCCCATTTGTTCACAGGATACTGTACGTATCTTCCTTTCCAGAGATTTGATATCACCCAGACACCGGCAGCATACATAAACGTGTTACCAGGTTGGCCCCAGTACACCAGCATATATACACCCTTGGCCAGCCTTTCTCCTGAATATCAGCTACCAAGATCAGTACCAGTGGTGCCGTCTTTTGTAGCCAATGACAGAGCAGATAAAAATGCCGCTGCCTATTTTGAGGGTCATCATTTGAATGCTGAGAATGCTGTTGGTCACCAGATTGCCTCTGAAACACAGATCCTTGAAGACTCTTCGGGAATATCTGTAAAGTCACACTGCAGCACAGGGGATGCTCATACAGTCCTGAGTGAGTCTAACAGAAATGATGGGCACTGTGGAAATTCTAACAACAAATGTGAAGTAATTCCAGAAAGCATCAGTGCAGTAACAAACATTCCACACGTGCAGATGGTTGCCATACAGGTATCTTGGAACATAATACACCAAGAAGTCAATACTGAGCCATATAATCCTTTTGAGGAACAACAAGGGGAAATTTCACGGATTGAAAAGGAGCACCAGGTATTACAAGAGCAACTTAAAGAAGCATATGAAAATTATGAGCAGATGAAACTTAAGGGCTTAGAAGAGACCAGGGACCTGGAAGAAAAGTTGAAAAGGCACTTAGAAGAAAACAAGATCTCAAAGACGGAATTAGATTGGTTCCTTCAAGATTTGGAAAGAGAAATTAAAAAATGGCAGCAGGAAAAAAAAGAAATCCAAGAAAGACTAAAATCACTGAAGAAGAAAATTAAAAAAGTTTCAAATGCCAGTGAAATGTATACCCAGAAAAATGATGGAAAGGAAAAGGAACATGAATTACATCTGGATCAGTCCCTTGAAATCAGCAACACACTTACAAATGAGAAAATGAAAATAGAAGAGTGTATAAAGAAAGGAAAAGAGGATTATGAAGAGAGTCATCAGAGAGCTGTGGCTGCAGAGGTATCCGTACTTGAAAACTGGAAGGAGAGTGAAGTGTATAAGCTACAGATCATGGAGTCACAAGCAGAAGCCTATCTGAAGAAGCTGGAGCTGATTAGCTGTGATCCTGCAGCATATCCTGACATGGAGTCTGATATATGTTCATGGGAACTGTTTCTTTCTAATGTTACAAAAGAAATTGAGAAAGCAAAGTCTCAGTTTGAAGAACAAATTAAGGCAATTAAAAATGGTTCTCGTCTCAGTGAACTTTCTAAAGTGCAGATTTCCGAGCTTTCATTTCCTGCCTATAACACGATCTTTGCCTGGGCTGTTCCCAGCCTGGAACACCGTCCCCGCTCTGCATCCTGCCTTCCCCTGAAACCCCATCAGAGGCTGCCCTCTTTTGGCCTCCCACTGTGGCCCTTCTCTCACATGCATTAGATCTCAGCCTGGCCTTGAATGTCTCTTTCCCGCCAGTACCTTGCACAGTAAACATCCAAACTTACTGTGAATTCATCTGAAAAAAAAAAAAAAAATTAAGTATGGAAAAAGTGTGACCACCCTGAACTGAGTAA
AATATTCTGTTGAGATCCAGTTTTTTTCTCTCCATTGAATGTGCAGTTTTAGTTAGAATTACACTAAAGGGCGGCCGGGCGCAGTGGCTCAAGCCTGTAATCCCAGCACTTTGGGAGGCCGAGACGGGTGGATCACGAGGTCAGGAGATCGAGACCATCCTGGCTAACACAGTGAAACCCCGTCTCTACTAAAAAATACAAAAAAACTAGCCGGGTGAGTTGGCGGGCGCCTGTAGTCCCAGCTATTCGGGGGGCTGAGGCAGGAGAATGGCGTAAACCCGGGAGGCGGAGCTTGTAGTGAACTGAGATCCGGCCACTGCACTCCAGCCCGGGTGACAGAGCGAGACTCCGTCTCAAAAAAAAAAAAAAAAAA\n>XM_018370368.1 Pneumocystis carinii B80 hypothetical protein (T552_01802), mRNA \nCTTATTTTGCTTAAAACTAAATACATCTGGACACTTTTCTATCTTAATGGATGATATTTTGGATATTACAGTTCAATTTTCAGGAGGGTTACAGACCCTATTTGGTAACAAAAATACTCATCATATTCAAATATTACTATCCGATCCTGCTTTAAAAGGTAACCCTCCTAACATTGCTTATTTGATACAATTTTTATCTGAAAACCTCATGAATGATGCTCGAAAAAACTTTTTCATTAAAGATGATACTGTACGTCCTGGTATTCTTGTTCTTATAAATAATGAAGATTGGGAATTAAATGATGAAAAGTATTATATACTTCAACCTAAAGATGAAATTACTTTTATCAGCACATTACATGGAGGATAATTATAAATAAATAAATAAATATCTCTTGAAAATTATTTTATTA\n>XM_028690088.1 Plasmodium gonderi protein phosphatase 2C domain containing protein (PGO_140940), partial mRNA \nATGGGTAATTGTATGTCCATTATTAGTTATTCCAAATTCAAATTAAAAAAAAAAAAATTGGAGGATTCGGATGTGCATTCAAACCCAGATTACGAGAGCGCAACTGATAGCAATATCCGTGATAAAGATGAAAAAAACAGAAAAGGAAAAGACTTAAAGCATAATCCAAATTTAAACAATTCCAATTGCGATAAAAAAAGTTTTAATGTCATCCATGAACATGATACAAATTCCATATATTCAAGCAATCCTGGTAACTTTGATCAAAATGAGAAAGATGAACAAAAGCAGCCTGTTTCCAATGAGGACATTGGTTACCTACGAAGGGAAGAATCGGATCATCATATGATAATCCAGAAAAACAAAAAGAAGAACAAAAATAGTAACAATGTGATAGGAAATGACGAGATGAATCAAAACGAGGGAAACCAAAACGAGGTGAACCAAAACGAGGTGAACCCAAATGAAGTGAACCCAAATGAAGTGAACCCAAATGAAGTGAACCGAAACCAGGTAAACCAAAGCGAAGTAGACAGAACCAAGGTGACAAAAAAAACGAAAAAAGAAAAAAGCGAATCCAAATCTAATATAAATGGAAAAGTAAAACGGAGCACGTCCAAAGACAAAAATACAAAAGACATAATTCCCAATAGTACGCATAACGACAGAGATAATTCAAAATCAAACGAAACACATGATTATAAAGGAGATGTGTTTTCAAATAAGAATTCCTCATTTAATAGCGAATCAGTTAATAGCAAGGATTTGCAAAAAAGAAACAAAAGAGAGAACTTACTGAACATAAAATACAGCAATATGATATTAAATGATATAAGAGATGTAGACATTATTGTCGTTTTTTTATTTAGTCTTTTCCTTTATTTTAATGCCAATAATATAGTAGACATGTTGGATAGAAATAAAAAGGATAGATATTCTCTTAGGAATTCATTGAATATAAATCATGATATCATAAAATTCCCAACGTTTCCCAAAGAAATTATTGACAGTTTT
TTGAAAAATGATTTTACTTTATTAAAAAAATATATAAAAAATAAATGTAATAAGTTGAAGAAGAAGTATAAAAGTACATATTTAAAAAAAGTCACAATAAGTAACGAAAAGGGTGAAAAAGTAGAAGCAGGAGAACAGAATCAAATCGGAAAAACAAATCAAAAGGATGAAAAAAACACAAAAAAGAAAAGTTTTAAATACGAATTAAAAGAAAAAAAAGAAAAATGCACTTTTTCAAAAATTATTGAATCTGTTGATAGAAATGAATGGATTCATAGAGACATAACCGAAATACCATGTGATCAAAATTTGCCAGATCTGAAAATTACTTTTATAGTTATGGGGGCATATTGCTTTTACCAAAAAAACATGAAACCATTTCAAGATAAAAATACTTTTTTTTACAAATCCCCATCATATGCTTGTGATGCAGAAATTTCTGTTGCATGTAAAAAAGGAAGAAAATTAGATTTCCCAAATCAGGATGATTTTACAATTATACAAACTAATGAATGGATTTTAATTATGGTATTTGATGGACATGGGCCATCTGGTCATGACATCAGTAATTTTGTACATGTAGTACTCCCTTTACTTTTTTCATACAATATTGAAAGAATATTTGAAAACCCTGTTCGAACAATGAAAACATTATTTTATATGATAAACTGCTACTTAGTTAATTATTCCTACTGTATAAATAATAATATAAATCCAATTAACATAAATTTTATTGATTATAATTTAAGTGGAACAACATGTACAATCATACTCTACAATTTTCTAACAAAAAAAATTTATTCTGCCCACACAGGGGATAGTAGAGCTGTTATGGGAAAACAAAATGAAAAAACAAACACATTTAGAGCTTATAATATTACTGAAGATCACAAACCATCTTTAAAATTAGAAAGAGAACGAATTGTTGCATTTGGTGGAGAAGTGAAAAAATTGCAAGGAGATGTTTCATACCGAGTTTTTGTTAAAAATGAAATGTACCCCGGATTAGCCATGAGTAGAGCTATAGGTGACATTACTTCGTCTTTCATTGGTGTTACTTGTGAACCTACCATAAAAATATTTGACAAATCTGATGAAGACAAGTTCATTATTGTTGCAACAGATGGTATCTGGGAATTTATAAGTAGTGAGGAATGCGTTCAGATGGTTTCTCGAAAGAGGAAGAAGAAGGTGCACGTTGCCATGGAAGAAATTATCAAGGAATCTTGGAGAAGGTGGGAACGAATTGACACCGTCGATGATATGACACTGGTTATTTTATATTTCTAA\n>XM_024490585.1 Echinococcus granulosus hypothetical protein (EGR_01336), partial mRNA \nATGCATGGAGCGCTTCAGATGCTGCATCGTGAGGACGATATTTATGGCGGTTTTCCTTCAGCCGTCCTCCTCGCTCCCTCTACTCTTACAAATGGTAGAAAGCTGCCCATTATCGCAACCTCCAGTGAAGGCACACCAATCGGCTACATAATTACGCCTAATCCTACCAATGCTGATTCAAAATTTGTCGCTAATGAGACAACGGTCCAAAAGCAACAAATAGGATCTGATGATGCTTCTTCCAGCTCTACCGGTCACGTAAAATCCACCTGCAATGGTCTTCTGTACCGACTACCTGATGGAGGCTATGCAAAGGTGGAAAAGAATTACATGACAATCAACCCCAAGCTCTATCAGCAAAGCATATATCGAAAGCTCCATGTTCATGAAGAATGGAACGGACCTATCACCCAAGCAAATAATGCTCAGGAGGATAATCACGGCATTAAGAAAAAGGTTGTTGTGGCCCATGAATCGTCGCCTGTTTTGGAGGGAGGAACGGGCCACGAGGAAACTGACGTCGACACACCACAATGA\n>XR_004086260.1 PREDICTED: Quercus lobata vacuolar sorting protein 3-like 
(LOC115966022), transcript variant X5, misc_RNA \nATTTTTGAACTTTGCTCTGTACGTAGGGTCCAAGGAAACTGATGAAAAGGCTGATGAGGTTCTAAAGTAGGATATTTTGGATTGTTGGACGCCAGAAAATCACTATGGATGGACTGAATCTAAGTGTTAAACATTTCTAAATTTAGACCATCTATAGTGATTTTCTAGAGTCCAATAATCCAAGATATCCAACTTTAGAACCTCATCAGCCTTTTCATCAGTTTCCTTAGACCCTACCTCTGAGGTCCACGAAAATGGAGGTGTATCATAAGAAGTCGGGTAGGTGTATTCAATCGATAAGTTTTGGTGGGGAAGGAGTTGGAGCTAGCGTTATTGCTGATGAGGAAGTTGGGAGTGGGAAACTTGTTGCTGTTGGAACACCCAACAAGGTTATTTGCTATCGTAAATTACCTTCTGAAGAACAAATCAAAGACGTTTTGAGAAAGAAGAACTTTAAAGAAGCCATTGCCTTGGTGGAGGAACTTGAGTGTGATGCTGAATTGTCAAAGGATATGCTCTCCTTTGTTCATGCTCAAGTGGGGTTTCTATTGCTGTTTAACCTGCATTTTGAGGAAGCAGTAAATCACTTTTTGCTGTCAGAGACAATGCAGCCTTCTGAAAGATAAAGGTACCTCCAGTGGTTGATTGAAGATCAGGACTGTGATGATACTCAATTCCATACATTATATGCTCTATCACTTGCCAAATCAGCAATTGAAGCCTTTCAAACTGAAAATACTTATCAAAACAGTGACATTGGAAGGGTAGATGAGACAGTAATTTCTGATAATAGAATGAACTCGATCTTTGAAAGTCCTCTTCGAGAAAGACTGCAGATATTTTTGTCGTCTTCAGACTTGTATGATCCAGAGGAAGTTCTTTACTTGATCGAAGGATCGGAGTTATGGTTGGAAAAGATCGTTTACTGCCTAATGATTTGCATCATTTCTTTCAAACTGTTGTTAGGCAATTCTTTACAGTAAACTGGGTCAAGAGGGATTAGTGCTCCAAATTTTGGCATTAATCAGCACTGAAGAAAATGAAGATGAAGTGACTGAAAATGAAGAAAATTCGGGTTCTGCTTCTACTTCTGCCAGTACTGAAGAAAGTATTGAACTTTCACCAGCAAGAGCAAGACCTCAAAGGGTGAACCGTGCACAAACAAGACTCATGTGTTCATTTCTCCAAGCAAGTTGAGGGTGAAGCTCATAGGGCCTCACCATCTTAGAAAGAAGGATGGATCAAACAGTAACTCTTCTAGACACAATTTGGTTTGCTGAGGAAGGTAGTGCATAAGCCATGGTTCTTGACAGCATTCTATCTTCTCCTCATCGTAGGTCACCATCATTCAGGAAGCAATTCTCGCGGGATGATTCATTAAGCTGGCCAACACTCCTTCAAAGGCACCGCTTCCTCTTAATAGCTCTAATTCTCCTAGCTTTCCTATGCACTATGTATCTTTATTTTGCTGTCACTTTAGGTGCTTCTGGATCATGTTCTGATTTAAAGGGTGCTCAGAAAGCGTCAGGTTTGGATGCAAAAGCTTCTGTGGGCAATGGAAAATTGAAATTCCTTTGACATGTAGATGATAATTATAGTTGGAAAGCATTTCCGTCCTTGGTTCTTTTCGATTCTAAGGAGATTGAATTTAACCATACTTTTAAAATTGCAATAGGTTGTTTGCTGTTTTTGAACTCAATTGTCCTGAATCTTATATATGAGAAATGTAACAAAATTTTCATTTGGAGACTATATAGCAAAAATTTGATTTGGA\n>XM_033023418.1 PREDICTED: Amblyraja radiata transmembrane protein FAM155A-like (LOC116974698), mRNA 
\nAACTCCCGTGCCGTCTCCTGTTCAGTGCATGCTCCGAATTGATGAAAAGCCGCAGTTTCAGATGTATACTGCAGTAAGGAGACTGCACCGCAGCAGGATTGTGCTCAGCAACGGGCGGCTGTAAAAGGAACTAGTCTGGCACTAAATGCGCACGGCGGCACACGATACAATACTATTACACCTTTCGCCTCTTGTCCCATTGCTTTAGGCAGCGGCCGGGGATACATCTCACGCCAGAATGTGAACTGGACGATCGCCGCGAACACCGAAGACAGGATCCAAAGTGCCACTTTTTGGTGCACGGTTCGAAACTTCGCTCGAGGATTTGTTGTTGTTGTTGTGAAAATAGCGAAGGGCAGCTGATATTTGTGCGTGGCTGTGGCTGTGCCGCCGCAGACACGGCTGGGACGCGCCTGGTGCACAAGTGGATGATGCAGCGCCGGTGTGTGGCAGCGCTGGAGATGTGAGTCTCCCCTTCTCTCCCCTCAGCTCAATGTGCCAGGATGGAGCGATCTCGGTGCTGGGATGACGCAAACCACCGTCCTCAACCGCAACCCTCACCCCCCGCCCAAAAATAATAATAAGAGGTGTTTCTGGGCGAAGATGGCCGCAACTTCCACCCAACATGATGAACGCTGCGTTGCTCCAAACGCCAGGGCCAGCGACGTTTCGTCGGCATCAGGAGAAATAGTTCAACTTTTCTCTGCTTGCATCTGGTGAATTTGTTGGCGCCGATGTTGGCAGGGTCGGATGTGTGAGGCTGGTGTGATGTGAATCTGCAGAGAGTGGGCAGGGGAGAGAGGAGCTCGCTCGCCGTCGCCAGGAGCAGGCTTTCCCCCCGGAGTGCCATGGATAAGTCTGGTGTGACTCTCCTTGCTGCTCCTACGGATTGGATGGCAACAGTTGACCACCCGTACATGCAACCCAAGTGAACGCTCAACAGAATAGCAACGCGGCTGATCTAGCAAGACAAACCCGGTCAATGTATATCGAGGCAAAGGTCCGTTCGCCGCGGAGCCAGCCCGAGCCGCACTTGTCCACAATATGACCAGAGGCGCCTGGATGTGTCGCCGGCAAGACAACGGATTACAAATCTGGTATGTCCCCCGCCAGAACGACAAACCCTGCACGGATTCAGAGCGGGCCCAGAAATGGCGACTGTCTTTAGCATCTCTGTTGTTTTTTACCGTCCTGCTATCTGATTACTTGTGGCTGTGTGCGGATGCGAATCTCACCAGAAGCAGAGACCAGGAGCGGAGCACTTCAGCCGAGCCGACGGGGGGGAACCGCTCACTGTCCCCACTGTTCCTCAGCGCTGATCAGCCTAGGAGCACCGCCAGCAGTGACAAACGTGCTATTTTTCTAGGTAATACCACTAGCAGACCCATCTGCCAACTGGAACCGTGTCGCCCATATTATGTGTGTGAGCAGTGTGTAAGTATTGAAGATGCAGAGACTGTGTGCGGGAGCGCCGGCGAGGATGCGTCCAATGGGTCTCCGCCGCTGTCCTTCAACAATTTCCACCTTTCCTTTTGTGAATCCTACACCCTTTCTGAACTGTTCGCCGGGATGTCGAGACCAGAGGGCTCCAATTGCGATCTGAGCCTTGTGCTGGACGGCGACGCCACCGTCTGCATTCAGTGCGTTGAGATTTATCAACGTTTGGACCAACATGCCCAAGAGAAATACGAGGAGTTCCAGAGCTTGTTTCAGAAGTATTTACAGTGGGGAGATTACTCTGTGAAAAGTTGCATCGATGACTGCAAGGGACAGATGGTGCAAGGTGCCAGCAAGTTCACGAATTGCACATATGAATGTGTTTGCAGAAGTTCGGAGACTGCTGACACTTTTAAGGAACGGTAG\n>XM_033152434.1 PREDICTED: Lacerta agilis small nuclear RNA activating complex polypeptide 2 (SNAPC2), transcript variant X3, mRNA 
\nAGCGACGGCTTTTCACTAACTAGGCGGCGTTGCGTTTGAGGTGAGGACTACCGGAAGATAACGAGCAGCGTTGTGTCGCCTTAGAAGCCAGGAACGGGTGGCTAGAGCGCCATGAAGCCGCCTTCCAGGCAGCGTTCAGCCCCTGCTCGCTACAGGATGGCCCCCACGAGCCAGGCTTGGACGGACCCAGAAAAGCGACGCCTTCTTCGGGCCTTGAGAGCTCACGGCCAGGGTCCGTTGCGGCCCGAGCTGTTGAAGGAGTACCTGCCTTCGAGGGATGAAGAAGAGATCATGGCATTTGTGGAGCACCTGAAAGAGCGTGTAGCAAAGGAAGCGGTCAAGGAACAATATCAGTATCGCCAGCGTAAACAGAAGGATGCTCCTATTCCAGCACCTATTGAGGTTTGGACAATTGCATCTACTGAGCCACTCACCTTGCTCCATTCCGTGCCTCCAAAGTCAGTGGTGACAAAGAATTCTCAATGTTCATCCCAAAATCTTCATAGTGAGAGTAGGAAATCCAACGAAGAATCTCATGAACCAACTGTATCATCCAGTGTAGAGGAAATAGCCCCTGCAGAAAACAGTGGGTTCCATGTGGACTTTGAAAAGATCTACAAGTACCTTTCTGTGATCTCACGTGGCTGTAAGGCACCTGAACTCCCACCAGGTGAGTCAGCTGTGGTCCTTGATTTGCTACTGTCACTGCCAGAAGAGCTGGGCTTTCTGGACTATAAGAAGCTGAAGAGTCACATGCACAAATGTTATACAGAGTTGAACACCCACTACACAGGTGAAAGAAGCAGAATGAAAGAGGGCAACCAGCCTGTAAACAATAATGGAGAGCTATTCCTGCATGTGCAGCCAGCTACTAGTGGCTTACCACAACAGGAGAGTAGTAGTTCTCCTACCACTTCCCAAGATGATGCAACTTCTGCCTCTGCCATGGACTGGAAGACTCTGGGTATCTGCCCTTTGAATTCATTCTTGATTCCTTTGGATATCCTTGCACGTAAAGAAGAAATCTTTGACTGAGGGAACTGGATTCTGTGCTGCCCAGTAATGAACTATGTGCTCTCATAACATGTGAGGGAAGACTAAACAAGCTTGCCGAGCCTACCTTAGCCATGCTCCCCCATCATAGCATGGAGTTTAAGCAGCCTGACCTGCTCTTTTACACCTTGGCTCATGAGTATGATACTTGTTTTGTATTAATACTATATGTACACTGATGTCTGGTCTTACTACTCCATGACAGCTGCTAGATCTTATTTAGCCAGTTGCTATGTAGCAGCTCATAGATGGCCTTGAGTGTTAATCTTGACCTTGGTCTACAGATCATTATGGTTAGTAAAATAAGTGATGTTAGATATCATTCCTAAGTCACAGAATAGTCAAATTATTTTGTAATAACTTATTTTTAAATATATATA\n>XM_011762108.2 PREDICTED: Macaca nemestrina family with sequence similarity 192 member A (FAM192A), transcript variant X3, mRNA 
\nGGGACTCTATTGTGGCGGTGAGGAACAGGAAGCCCTGAAGGGTCAAAAGGAATACAAAAGCAAAGGCTATTTTCTTTTTTTTTTTTCTTCTTTCATTCGTTCCTTCCTGTTTCTTTCTTTCTTCCTCTCATTTTTGTTTTTCTTTTTTAAGAGCGAGCGGCTCTGCGGTGGCGGTTTGGGGTAGGCGCCGCCGAGGTGAGGGCGTCTCGCCTCCCGCGCGCCGGTAGAATAAACAGCCATTGGACTCTTCAAAGAAATACGCTGTCTGCATCAAGTACTGCTTTTGCAGATTGGTTGTTTCATTATGGATGGAGGGGATGATGGTAACCTTGTTATCAAAAAGAGGTTTGTGTCTGAGGCAGAACTAGATGAACGGCGCAAAAGGAGGCAAGAAGAATGGGAGAAAGTTCGAAAACCTGAAGATCCAGAAGAATGTCCAGAGGAGGTTTATGACCCTCGCTCTCTGTATGAAAGACTACAGGAACAGAAGGACAGGAAGCAGCAGGAGTATGAGGAACAGTTCAAATTCAAAAACATGGTAAGAGGCTTAGATGAAGATGAGACCAACTTCCTTGATGAGGTTTCTCGACAGCAGGAACTAATAGAAAAGCAACGAAGAGAAGAAGAACTGAAAGAACTGAAGGAATACAGAAATAACCTCAAGAAGGTTGGAATTTCTCAAGAGAACAAGAAGGAAGTGGAAAAGAAACTGACTGTGAAGCCCATAGAAACCAAGAACAAGTTCTCCCAGGCAAAGCTGTTGGCAGGAGCTGTGAAGCATAAGAGCTCAGAGAGTGGCCACAGTGTGAAAAGACTGAAACCAGACCCTGAGCCAGATGACAAGAATCAAGAGCCCTCATCCTGCAAGTCTCTCGGAAACACTTCCCTGAGTGGCCCCTCCATCCACTGCCCCTCTGCTGCAGTCTGTATCGGCATCCTCCCGGGCCTGGGCGCCTACTCTGGGAGCAGCGACTCCGAGTCCAGCTCAGACAGCGAAGGCACCATCAATGCCACCGGAAAGATTGTCTCCTCCATCTTCCGAACCAACACTTTCCTCGAGGCCCCCTAGTTTCTCTGTCCTTAACAGGGAGCTCCTCCCCAAGGGTAGATTGGACCGTTCATGCTGCCTTCGGGCATTACGTCTCAAAAAAAAAACTCCTTTGCCTGCATCCTGTGCACAACATGACACTTTTAACCAATCCAATCTAAAAATGTGCCAGAATCCACCTGTGGCCCGAATTGTGTTTGGTTTCTCTTTCTACTGCAGTGCACATGAGCAAACCTATCCCGCTGCCACTTTCCTCACTGATACTGGGAGGAGGGCAAGGCCCAGCTGAAGTTCCACTAAAAATGCCCTAGGAGAATAGGCACCGGCTGGCTTGCCAAAGGGTTTGGGTTTTATTGCTTTCTGTTTTTTTCTTTTCCTGACAGCACAAAGAAGTAAGGGCAGATATAAGTAAGAAGTAAGGTGTTATTTAAACATTCTATTGTAGGTGAACGTGTTGTTTGGTTCTACTGCATTGTGGAGCATGCGGGGGAAGAGAACTGACCCAGGTGATGAAATGGAGCCCTTCCCTGGAACTAACCAGTCCTTGATGTTGTGTGACTAAGTAAAGATGATAAACCCCATCTGCTGGGGGTGTCACTTCACACTCGGCATGCATTGTGAAAGCTTTCCATACCCTTGGCCATTCTCTCTCCCCTCTTTATCCAACCCCGTTTATGCAGGAAGGGACTGCTAACAAGAAAGCTTCCATCTCAGACCTTTTCTCTGCCTGGAAAATTATTTTATGTTTGTTTTTGAAATAAAGGATTTAGTTTAAGATTCTAAA\n>XM_030051840.1 PREDICTED: Myripristis murdjan protein DDI1 homolog 2-like (LOC115359395), transcript variant X2, mRNA 
\nACATGTCGAAAACATCCTGAAATGCGGCACTAGCACTGGTAGTTGATGTTAGTTGTTGAGATAAGAGAGGAAACTGTCCGAGCAGACCTGGACTTAGTGAGTGTAAACCAAGGCGTTGTGTTCAGGGGGGCAACACCAGTTTCCCTTTAATGAGAGTTTCACCAGAGACCGTCTTCACACCGGGTCACACTAGCTGTTTAGCTCAGCGGGAGAAGGAACTCCAGCAACGGCGCTTGTGTTGCAGCGGGCTCGTCAACTGATCCTCCCCGAAAACAGCGATGCTGGTCACCGTGTTCTGCGCGCCGAGGGACCGCCCGGAAACCACTTTCGCCCTCGACGTGTCTCCGGAGCTGGAGCTGAGAGACTTCGTAGCACTTTGTGAACTAGAATCAGGGATCCCGGCGGGAGAGATCCAGATCTCATATGTAGAGCAGCCCCTAAAAGACCCCACTCGTGCCTTGGGGAACTACGGCGTGAAGGATGGAGATGTGGTGGTTCTCAGACAAGCAGACAGAAAGCCACCACCACCAACTCAGCCAGCCTTCCCAGGACTGCCCCATATAGACTTTCGCTCCATCACAGTCCCAGGCACGTCTTCTTCGACCAGTCAGCAAGCTGCCACAAGGCAGCAGCGTCAGGCCCCACAGCAGCAGCAGCAGCAACAGCAGCAGCAGCAGCAGCACACCGCACAACCTTCTACGCCAATGGCCTTCCGTGGCTCTGGCTCCTCTCCACAGGGGCTGGATGACCCTGCCTTACTCCAGCAGATGCTGTTATCCAATCCACATGAGCTTTCACTCCTCAAGGAGCGCAACCCACCACTGGCTGAGGCCCTACTCAGCGGAGACTTAGAGCGTTTCACCAAAGTGTTGCTGGAGCAACAACAGGATCGGGCACGAAGGGAGCAAGAAAGGATCAGACTCCTGACTGCTGATCCGTTTGATTTGGAAGCCCAGGCGAAGATTGAGGAGGACATCAGGCAGCACAATGTGGAAGAAAATATGACCATTGCAATGGAGGAGGCTCCAGAAAGTTTTGGACAGGTGGTTATGCTCTACATCAACTGCAAAGTAAATGGGCACCCTGTGAAAGCTTTTGTTGACTCAGGAGCTCAGATGACAATAATGAGCCAAGCGTGCGCTGAGCGCTGTAACATCATGCGTCTAGTGGACCGACGCTGGGCAGGGATTGCAAAGGGTGTAGGCACCCAGAAGATCATTGGCAGAGTTCATTTGGCTCAGGTCCAGATCGAGGGGGACTTCCTACCTTGTTCTTTCTCCATCTTGGAGGACCAGCCGATGGACATGCTTCTTGGACTTGATATGCTGAAGAGACACCAGTGCTCTATTGACCTGAAGAGGAGTGTGCTGCTGATTGGCACCACAGGCACTGAAACTCGCTTTCTACCTGAGGCAGAGCTGCCAGAGTGTGCCCGGCTGGCATACGGGGCAGAGGGTCGTGAGGATGCCCGCCCAGATGAAATAGCTGACAGAGAACTGGCAGAAGCACTTCAGAGATCCATACAGGAAAGCGGACAGCACTGATGCATTTGGAGACAGCTGGAGAGGGCCCTACCAACCAGACACTGCAGATGGACAAACTACCTCACCAAAATCCCCACCATTCCCATTACCCATACCCTTAGACCAAATGTCTTCATCAACCTCCCCTTCCCAAAGACC\n>XM_042461403.1 PREDICTED: Sceloporus undulatus damage specific DNA binding protein 2 (DDB2), transcript variant X4, mRNA 
\nGGAGGCTGATGGTCCTGGCCACTACCCTTGGCTCCCTCCCTCCTCCTCCTCCTCCAGCCGAGAATCAGGGCCCTGGAAATAGCACTGAATTGAAAACCGTTTGAAAGGTTTTAAAACGTAATAGATAAGATGAAAAGTACAGCACCACTCCTCCTCAGTTAAAAAAAAGTTGAAGCAGATGAACCCGGATTCCTAAAGGCAGGCGTGAAACCTCGCAAGAAGACTCATCATAGCACCCTTGAGGCTCTGGGTGGTGCTGTGCAGGCATACCAGATCCAGAGCCCAGAAGACAGGAAGGAAAACGAAAGACAGAGACTTGGCCAAGAGTTTGTGTTGTGTCCTGTTAAGTGTGTAAAAAACAACGAAGACAAGCTCCACATGCTCTAGGATGATAATCTACCAGCTGAAGCCAGTCATTTTTGGTTTTCATTCCAATCGCCATTGTTCAAGATACAGTGTTTTAATATAATGCATCCTGGGAAGGATTCAAAGGACAAGAAACATCTGAGGATATCTGATAGTGCATCACAAAAAGAAGCAAAATCAAATGGAAAAAGAAAGCGAGACTGTGAAGACCTAGAAAATGAGCCACAAGCAAAAAAAATACATCTGAGGAAAGCTCCCAAATGTCTGGACAAAACCGGGCAATCTTTCAATTGCTCCATGATCCGAAACAGAGGGGTATTCGTCCATCAGCTGGAAATGCAGAAAAATATTGTCCATTACATTTATCAGAACATGCTGGGAAGCACAATCAAGACACAGCTCAGAAAGTGTCTACAGGTGCCCTTTGTACGTTCTCTCTATTCATACCGCCTCTTCCGAACAGCAAGTCCTTTCGATAGAAGAATTACATGCTTGGAATGGCATCCAACATACCCTAGCACAGTTGCTGTGGGCTCCAAAGGTGGAGACATCATTCTGTGGGACTATGAAGTGCTAAACAAAACCTGCTTCATAAAAGGAATGGGAGCTGGAGGGGCCATCACAGGAATGAAGTTTAACCCTTTTAATCCTTGTCAGCTGTACACATCATCAATTGCTGGAACTACTGCCCTGCAGGATTTTAATGGAAATACAGTCCAGGTCTTCACCAGTACCAACGACTGGGATTTCTGGTACTGCAGTGTTGATGTATCTCCAACACGTCAGTCGGTGGTGACAGGTGATAATGTGGGCAATGTCATCCTGCTTAGTACTGAGGGTAAAAAGATATGGAACCTGAAACTGCACAAAAAGAAAGTTACTCACGTGGAGTTTAATTCTCACTGTGATTGGCTCCTGGCTACAGCGTCAGTGGATCAGACAGTTAAAATCTGGGATCTAAGAAACATAAAGGACAAATCAAGCTGTCTTCATATACTTCCACATGACAAACCTGTCAATGCAGCTTATTTCAGCCCAACCGATGGTGCTAAGCTACTGACTACTGATCAGCACAGTGAAATCCGGATTTATTCATCTTCTGATTGGTCCAAACCACAGCATTTGATCTCACATCCTCATCGCCAGTTTCAGCACCTTACGCCTATCAAGGCAACATGGCATCCTCGTTATGATCTCATTGTGGCTGGTCGTTACCCAGACCCTCTTTTCCCAGGATACACAGCAGATGAACTGAGAACAATCGACATATTTGATGGAAACAGTGGGGAGATGGTGTGCCAGTTACATGATTCAAATGCATCGGGCATTATCTCGCTCAATAAGTTTAACCCTATGGGAGACACACTGGCCTCTGGAATGGGCTTTAATATTCTTATTTGGAGCCGTGAGGAGATGGTGACCAAAAAGCAGGAGCATCTCATGCAAGCTATGACAGAGGAGGGAATTGGACACAGGAGCTTATCTCGACAAGGAGGTAGAAGGCAGAGACAGTCAAACCCAGGAACAAGCAAATCTAAAGCTAAACTACTCAGTCTTGAATTAGAGAGCTCTAAAACTCAGGCCAAAGAACACAAATTGCAAGAGAAAAAGAAAAGAAAGCATCCAAAGGAC
TAATCAGGCAAGCTTTTCTGTAATGCTGGTTAAAAACAGCCGGTGCAGACACAGTGGGCTGAAATGGCTTCAGAGGTGGCATGCCCATTACTCTCACCCAGCTTCTCCAGATCATAAAAACTGAGTTGTCAAAACAAGGCATCCTTTATTAAAGGCAATAATGGATAAATGTTCACTTGAATTTAAGTGAGCTGAAAGAAGCACCATATTTGTGCATAGCTGCTGATTTTTAATTGCCTAGGACATTGTACAGAGCAGCGATCTGGAGTATCCTGGCAGTTAAGATTGTATTTTCAGAACATTATTATTATTAAGTTTTATTTATATAGTGCTGTAAATTTACACAGCGCTGTACATACAGTCTTTTTAATTAGACGGTTCCCTGCCCTCAGGCTTACAATCTAAAAAGACATGACACA\n>XM_022360255.2 PREDICTED: Drosophila obscura nurim homolog (LOC111069978), mRNA \nCCAGCGATATTTTCAATTGCGTCCGTCCAAGCAGTCAAAAAAATATTTATTTTGCAATTAATTTATAGTGTTTTTTTTTTTGTGTAAATCATGGCCAGTTTTGCCAAGGTTTTGCTGCTCCTGAGCTCGCTGGCCACTTTCGTGTATACCTTTTTCGTGGTTGGCAAGCTGGTGCTGTTCCTCTCCACACCTCGCTCGATTTCGAAGGCACACACGTGGATTTTCAATTTGCTGGACAACAAGTCCCGGCTGGAGACCGCCTATGGGCCCATTGTGTTCGACACACTCTACCTGATAGGATTCATCTTCCAGCACAGCTTCCTTAAGTCAGCGCTGGTGAAGAATTTATTGGGCAAATTGGGCTTGGCTGCAGCCGAGCGCACTATTTATAGTTTGACATCATCGCTTTGTTTACATTATCTGCTGAAGAACTGGCTGCCAGCCCAGTCGATTGTCTTGTGGCAAATTGATGTGGACGAGAGTGCTCCACTCTGGTGGACTTTTGTGGTCACACATGGCCTTGGCTGGGCCGTCATCTTTGGCGGCTGCCTTATAATGGATCTGCCCGAGCTGTTGGGCGTCAAGCAGGTCTACTATGACCTTAAAGAGTATGGGGAGCCCATTGCCTACAAGTCGAGCGAGCTGCGTCATCTGTACTCTCATGTGCGTCATCCGTCCTTTGTGGGTCTCTCCTTGATCCTGTTTGCCACGAATGTCATGAGCCTGGATCGCCTGCTGCTGGCCTCGCTGCTCACCGTCTACATGTACGTGGCCTGGTCCACTGACGATAGGGACGTGGCCTACCAGAAGCAACAACTGCAGTGCAAGAAACACGAGCTGAAGGCTCAGTAAATCGAATTCTTCTCATTTAGCTCTAGTTCCTATTTAAGCTGAACGTATAACACATTAAAGACTAACTCATCCTAACAATGGA\n>XM_017911197.1 PREDICTED: Eufriesea mexicana RING finger protein nhl-1 (LOC108555529), transcript variant X6, mRNA 
\nAGGCGGAGGAACAGAGCGGCGAAGTAGCTGGCCAGAAATAACTAATAAGACATTCACTCTAAGACGGGCGGCCAACCGGCCCGGACAAACGCGCTGTCACAGCGCCGGATATTGGTGAACGACGAGTGCGACCACTTGGGGCCCCCATAGAGAGGGCCCCCAACCGGAAGAGGCCGCCGCAAGGCGGTCGATCTATCAGGCATGGAGCAGTTCGAGCAACTGCTAACGTGCGCGATATGCCTGGACCGATACAGGAACCCGAAGCTACTGCCATGCCAGCACAGCTTCTGCATGGAACCGTGCATGGATGGCCTCGTTGACTACGTGCGTCGACAAGTGAAATGTCCAGAATGCCGCGCGGAACATCGCATCCCCTACCAGGGTGTGCAGGCCTTCCCGACCAACGTGACCCTGCAGCGATTCCTGGAATTGCACATCGAGATCACCGGGGAGCTGCCGGACCCGACCAGCGGCCAGACAATGGAACGTTGCGGCGTCTGTTCGGAAAAAAGCTACTGCTCCCTCTGCGTCCACTGTGAGAAGAAGTGCTGTCCCGAATGCAAGGACGCTCACATGGACATCCTCAGGCGCGAAATTACGCGTATCAATTCCCAGATTCGCAGGGGACTGCACAGGTTGCAGGACGCGCTGGCTTTGGTGGAGAAAAACACGTTGGGTCTGCAAACAAACTGCGCCTCGGTCGCGGAAGAGGTGGACGAGATTTATCGGAGGCTGAGCAAGGCTTTGAAAGACCGTACGGAACATCTGCGTAACGAGGTCGATCGATACCTGAGCACCGAGCTCAGAGGGTTGATTCAGCTCAAAGAGAATCTCGAATTGGAAATCGCGAATATCCAGAGCAACTGCGATTTGGCGGAGGCTCACATCAATGAAAACGTGCCATGGGACGATTCGGAACTCCTCGACACAAAAGAGCTCTTCCTGCGTACGGTGGAATTCATCAGGAACTTCGAGTACGAGGCCGGGGATTACAGTCGGCGAGTGCGTTTCGTGATGGCACACGATCCGAACCAGCTGGTCCTCCATGTAGCAGGTTACGGCGAACTGAATATTAAGCCAGAAACCGGAAGCGGAGGATTGCTCGGTAGCTCGAGCAGTCTAGCACCTCCCGGAGGATCACCGGGCCTCATGAGAAGCAAAAGCGACCATCGTCTGGCCTCGCAGTACCGGCAGCAAGAGGAAGAGCGACTGGCGAGAAATCGATACGTGCCCGAATACGAGTACGACGCGCCAGAGTACGAAGTACCGAGGAACAAATCGAGGTACAGAAGTCGATTCATGCGACATCGGGACGGAGACGATTCCGATGGCGACTCGAGGTCGACCGTTCGGTTCACGTCCACGCCGCAGGAATCCTCGGGACTTCGTGAACGTGTTCTGGACACAGAAGACGCGGCACGTGGGCCACTTTCCGGGATTTTTCGACTCACCGACTCGCCGCGTATCATGAAGAAGCTTCAAGAATACGAGAGAGCCGGGAAAAGGAAGAAGGAGGAACCGGCGATACACCCTGCTCAACAACCTCAACCACCGAAACAACCTCAGGTACAAGTGAGAAAAGTGCCGACAGCGATGGCGAGGCAGACCAGCGAGGACGACGAGATTTCTAGGATTAAAAAGCAGAACAAAACAGCGGCCACACCTGCGACCGAAACGGTGGAAGAACGACAACCGGCGCCAACACCTGCACCTGTACATCCACCTCCGAGGGAGACACCCTCCGAACGAGAACCGGAGGAACCCGCGCGGAGACCGATGCCCGCGAGGAGAACTTCGACGGATACCCACACTCCTGCGACGAGAAGCGCTTCATCAGACTCGAGCACGGGCTCCGAGAGCTCGGGAGGATCAGGAATCCGCAGCACCGGTGCACCATTCACCGCCGAGGAAATGAAGCAGAAGTACTTGTCGAGGGCACCGGCGTCGAACGCAACATCCACGACCTCGTCGCCGCACAGCGGGACGCCACCGACTGCC
AAAGACACCACCGCCAACGCCACCCCCGCGTCCCGATCCTTCCAGAGCCGTTTTTTAGGCACAGGTAACCGCGCAGCCCCACCACCGCCCACGCAACCCCCAGCGGCGCGAGAAGAGACCGCCGTAAAGAAGAAGGAGGAAGAGGAGGAGGAGGACGAGGAAACGAGTAGCTCGTCGGAAGAGACGGAATCCGAGACCGAGGAGGAATCGGAAACCGATGCTCATCCAGCGGGCACGACCACGTCCACGACGCCCTCTACCCCGGCTCAGGATCGTCAGAGGAGCGAGTCCGCGATGGCGAGGACAGACATAGGGCCTCTGCTCGCTAGGAGCGCGGAGGCGAGACGCGGCAGCAAGGAAAACTCACCTACGACCAGGTATTCGTCGCCGAGAGGAAGTCCCGCGCATTCGGTGACGAGCCCGACAGCGACGACGACGACGACGACAACGAGCGGCGCCGCGACGTTGACAACGCCGGCCGGCTACACCAGCAGGTTCCTAAACAAGAGCAGGAGCCAGGCGGCGATGATGGCGAGCCGGGAACGGGAACGGGAGCGCGAAAGAGAACGAGAACGCGAACGGGAGCGAGAAAGGGAACGCGAAAGAGAAAGAGAACGGGAGAGAGAACGCGAGCGAGACATGGACACGGAGGTCGATTCGCCCCTGTCGACGAGGTCACGGTATGCCGCGTTGAAGGAAAGAAGACAACGCCTGGCCCGGTCCAGAAGCTCGCACAACTTCGGCGGCGATGACCTCGACCTAGACGAGGAGCCACCCTCTCCGACTACCCAGTCGCCGAACGCTTACTTGGCAGCCAAGTACGGAGCCGGCTCTGAACTGGCCAGAAGTCGGAGTACTCATGCTCTAAAGTCGAGAGAACCGAGTCCAGAACGAGACAGAGTAGGTACCGAGAAGGATGGCGCCGCCTTGAGTTCCTGGGCGCGGTACTTGAAGAACAAGTACGGCAATCGTACCACCAAAGACAAGGAGCCTTCGTCCTCTGCCTCGACGATTCCGTCATCGAGTGGTAGCGCAACCTCGAGGAGGTTATCCCTCGGACTACCTCTCAGGCACGGTGGTCAAACATCCTTCGAATCCTCTGACGACGACCAAAAAAACCCGTCAGGCTCCCCCACGTCCCCTACAGCAGCTCCCGTTATACCCGCGGCAGCAGGTTCCTCCACTAGTAATGGCCGGAGGAGTCACTACTTGCTGAAGCGGCGGCAGCTGTTTAAGTTCGGGATGCGGGGGAGCGAAGCCGGATGCTTTACCTGGCCGAGAGGCCTCGCGGTTGGCCCTGACAATTTCATCGTCGTGGCTGACAGCTCTAACCATCGTGTTCAAGTATTCGACTGTAATGGGAACTTCCTGAAGGAGTTCGGAACGTATGGCAGCGGTGAGGGTGAATTCGATTGCCTCGCCGGGGTGGCCGTGAACAGGATCGGACAGTACATCATCGCGGATCGTTACAACCACAGAATTCAGGTTCTCGATCCTTCCGGTCGTTTTCTGAGAGCCTTCGGCTCCCAAGGGACCGCCGACGGTCGGTTTAATTATCCTTGGGGAATCACCACGGATGCTCTTGGATTTATTTATGTGTGCGATAAAGAGAACCATCGCGTACAGGTGTTTCAATCGGACGGCACGTTCGTGGGCAAATTCGGTAGCTGCGGAAGCGGACGTGGCCAGCTGGAACATCCTCATTACATCGCGGTGAGCAACACGAACCGCGTGATCGTGAGCGACAGCAACAATCATCGTATCCAGATATTCGACGTGAACGGCCGCGTGCTGACCTTCTTCGGATCCGAGGGCTCCGACGAGGGTCAGTTCAAGTTCCCAAGGGGTGTCGCTGTGGACGATCAAGGCTACATCATCGTCGCCGACTCCGGCAACAACAGGATACAGATATTCAGCCCTGAGGGGACGTTCCTCAAGTGCTTTGGCGGATGGGGTAGCGGTGACGGTGAATTCAAGGGCCTAGAGGGTGTCGCTGTCAC
GTCGGGCGGTAACATCGTCGTCTGCGATCGCGAGAATCACCGTGTTCAAGTGTTCTGATTTCGTTCCGCTTCGTTTCGTTTTATTCTCTCTTATTCTCCTGTGATTCGTCGACCAAACTCAAACGCGTCGAGCGATCTCAGAGGAGGCTCGCATTTCGACGAAAATCGATGCAGTATTTCTCGCGATGCTTTCGATTCTGGTTTTCTTTTTCTGCCTAATTGGGAGGAGAAATAACTTTCGACGGAGAAGGGTTTCCACGAATCGACGATGGGCGAGACGTCGCGTTAATAACCGCTTGCTTGCGTTAGAAATTAACATGTAGCTGTTTTGTGCTGAGCTAATCTTTTCATTCGGAAGCCCTTTCATGAGAAATGTTAAATAACGTAAGATATTCTGGACGATTGGTTGGAAATTTCGTAACATATATTCTACGTATATACATAGGTTTATATATAACATAGTTACCTTCGCTGTTTATGCATCTCACCGAGACGAATCGATAATGGAACTGAAAAGATACCCTTGGACGTCGGTTAATTGCAGATTGCAGCTTAAAAAATGAAAAAAGAGAGCAAAAATATCGTTTATCTGTTCTTCTCTCTCGTCTTACCCCCTTTCTCTCATTCTACCATCTTCCCCGTACGCACGTCATACTCGCGTAACTTAATTTAATTTATACTCGAAGTGACAACAATACAGTTTGTACCGTTTGTATGCTTTAAATAAATTGTTGCGGAAGTAATAAAGGAGAAACGAAAAAGAAAAAAAAAAAAAAGAAAAGAAAAAAGATATGAAAAAAGGACGACACGCGTTTTATTCGCTTCGACGCACCCCCGAACCCGCGTT\n>XM_042027756.1 PREDICTED: Corvus kubaryi hydrocephalus-inducing protein-like (LOC121664448), mRNA \nATGGTCTTCAACCTCCGTATTCCTGAGGACGGCTCGGGAGAGCTCAGTGTTTGCAGCTTCGATCAAGTGACCCTGTGTTCCAACACCGTGATGGAGTGCTACCAGTATATCCTGGTGGACGTGGAGGGTATTGGCGAGGGAGTGTTGGCACTGACCGTCATGGGCAGATGCATCGTTCCTAAGCTGACAGCGTACCCCTACATCCTGTGCTACGATGAGTGCCATCCGAAGGAGCCGTACGAGAGGAAGTTCCTCGTTGTGAATAACAGCCACATTCCTGGCTGCTACGGGCTTATTGCCCAGGTTTGGCATCACATCCGCCTCCTCCTCGCGGAGGAGATTATTAGCGGGGAAAAAAGGGTTTGGTTTGCTGGTTTCTATTCAATCTTAAAGATCTGCTGAGAACAAGATCCTACCGGAATGTAAAGTTTAGGGTGCAGTTTAACCTCCTGAGG\n>XM_036088610.1 PREDICTED: Halichoerus grypus CD300 molecule like family member f (CD300LF), mRNA 
\nTTTTTTTTTAGGTTAGGGCTGGAATGGAGGCCCTGCGCCATGCACGGGCACTGCACCATACCCCCTGGTTCCCCAACACCCTGCCTCCACCTTGTGGGAAGTGGCCAAAGGAGGAAGTTCAAGGGTGGGGAAAGCAGAAGGTTGGAAGATGCCGGAGCTAGGTCGGAGTTGACTGGCTCCATCAAGGGGGGCTTGTGTGAAGAGAGAATGAACCTGCTGCTGCTCTTCCTCCTCTTCCAGCGTGCAGGCTCATCTGCCCTCGTAGCAGTGTCCAATGCAGTGAGTGGCCCAGTGCGGGGCTCACTGACCGTGCAGTGTCGCTATGAACCTGGGTGGGAGACCTACAGTAAGTGGTGGTGTCGAGGAGCTGAGTGGAGACGCTGCCGTATCCTCGTTCGAACTGATGGATCAGAGCGGGACAAGAAGGCTGACCGAGTGTCCATCAAGGACAATCACAAATTGCGCACATTCACTGTGACCATGGAGGAGCTCAGGTGGAACAATGCAGACACTTACTGGTGTGGGATTGAGAGAACTGGACCTGACCTTGGGGTTGAAGTTAAAGTGACCATTGACCCAGCACCAGCTACAATATCAACCACCACCACCTCAACCACCATGTCCGCAGCACCAGCAGAGACCAAAGGCCCCCCGACTGTGAGCCACCACTCCAATGGCAGCGCTAACTCCATGAAGCTCAGCATCCTGATTCCCCTCATCTTGGCTGTGTTGCTGCTTCTCCTGGTGACGGCCTCACTCTTGGCCTTGAGAAAGATGAAGCAGCAGAAGAGAGCTGCTGGGATATCCCCAGAGCAGGTGGTCCAGCCCCCAGAGGGGGACCTCTGCTATGCAAACCTGGCTCTGGAGCCAACCAGCACCTCCCACAACTCCTCCCAGAAGAAGGCCTGTACAAAGTCCTCCTCCTCTGCCCTGGATAATCAGCAGGAAGTGGAATATGTCACCATGGCCGCCCTTCCGAAGGAGGACATTTCCTACGTGGCTCTGTCTTGGGAGCCTTTGAATGAGGAGTCAACCTATTACAACATGAACTACCATGTTGCCCACGTTCCCAGCAGGAGCCACGAGGAATCCATGGAATACAGCAGCATTAGGAGATCTTAGCCTGAGCTCCAGGCTCCCCTCTTGAACCCCACATGAGGCCTGTGAGCATGTTCCTGCCCTGTCTGCTTTCTGCCCCCATTCACTTCACGAGGACCAACCAGGGACTGAAGCCTCGGCCTTGTCTCAGGGGGCTTTCGGGAGGTAGATAGGGGTCTCTCTACATCTCTTTTTCTCCCATACAGCTTAAGAGGGGTTGGGGATATGCTCTGGAGTTGCTGAGGGAGTAATAATGATAATGATAATAATAATAATTAACCTTTATTTATTGCTTAACATGTGTGGTGGGCTGAATAATGGCCCCCAAAGTTCTCTGTGTCCCAATCCCCAGAACCTGTGAATATGGCAAAAGGAGCCACGTGGATGTATGAAGTTGAGGGTTTTGAGATGAGGAGAGTATTCTGGATTCTCCATGTGGGCCCTAAATATAATCACAAGGGTCCTTGTAAGAAGGAGGCAAGAAGGTCATAAGAGGAGAAGGCAGCCGATGACAGAGGCAGAGGTTGGAGTGATGTGGCCAGAAAAGGCAAGCAATGGATTGTCCCCTGGAGCCTCTAGAAGGAACCAGCCCTGCCAACACCCTGACTTTAGTCCAGTGAAACAGATTTTGTCCTTCTGGCCTCCAGAATTATAGGAGAATAAATTGATGTTGTGTTAATGAATTCA\n>XM_028783841.1 PREDICTED: Grammomys surdaster transmembrane serine protease 13 (Tmprss13), transcript variant X3, mRNA 
\nATGGACAGAGGCAGCCACCGGAATGCTTCTCCAGCAAGGACACCTCCAGCAAGGACATCTCCAGCAAGGACATCTCCAGCAAGGACACCTCCTCAGGCTTCTCCAGCAAGGACACCTCCTCAGGCTTCTCCAGCAAGGACACCTTCTCAGGCTTCTCCAGCAAGGACACCTCCTCAGACACCTCCTCAGGCTTCTCCAGCCCAAGCGTCTCCAGTCCGGGCATCTGCAACCAGGGCACCACCTTCCAGGTCACTGTCAGGCAGGTCTTCATCTGCCAGGTCAGCCTCCACGACATCCTCCCCAACGAGAGTGTACCTTGTTAGAGCAACACCAGTGGCGGCTGTCCCCATCCGGGCATCTCCTGCCAGGTCAGCACCAGCCACCAGGGCCACCAGGGCCACCAGGGAGAGCCCAGGTCTCAGTTTCCCCAAGTTCTCCTGGCAGGAGACCCAGAGACAGCTGCCACTCATCGGGTGTGTCCTCCTTCTCATCAGCCTGGTGATCTCACTCATCCTTCTCTTCTACTTCTGGCGAGGCCACACCGGGATCAAGTACAAAGAGCCATTGGAGAGTTGCCCTAACCACGCGGTTCGCTGTGACGGAGTGGTAGATTGCAAAATGAAGAGTGATGAGCTGGGCTGTGTCAGGTTCGACTGGGACAAATCCCTCCTGAAAGTCTACTCTGGGTCTTCTGGTGAGTGGCTTCCTGTCTGCAGCAGCAGCTGGAACGACACGGACTCCAAGAGGACCTGCCAGCAGCTGGGCTTTGACAGTGCTTACCGAACGACTGAGGTGGCCCACAGGGACGTCACCAGCAGCTTCTTACTCGCTGAATACAACTCCACCATCCAGGAAAGCCTCTACAGGTCGGAATGTCCTTCCCAGCGGTATGTCTCCCTCCAGTGTTCCCACTGTGGTCTGAGAGCTATGACCGGGCGGATCGTGGGAGGGGCTCTGACCTCAGAGAGCAAGTGGCCCTGGCAAGTTAGCCTACACTTCGGCACCACCCACATCTGCGGGGGCACACTCATCGATGCCCAGTGGGTGCTCACCGCTGCCCACTGTTTCTTTGTGACCCGGGAGAAGATTCTGGAGGGGTGGAAGGTATACGCAGGCACCAGCAACTTGCACCAGCTGCCTGAGGCTGCCTCAATCTCCCAGATCATCATTAACAGCAACTACACGGATGAACAGGATGACTATGACATCGCTCTCATAAGGCTGTCCAAGCCCTTGACCCTGTCAGCTCACATCCACCCTGCCTGCCTCCCTATGCATGGTCAGACCTTCAGCCTCAATGAGACCTGCTGGATCACGGGCTTCGGCAAAACCAAAGAAACAGATGAGAAGACATCTCCCTTCCTCCGAGAGGTTCAGGTCAACCTCATTGACTTCAAGAAATGCAATGACTACTCAGTCTATGACAGTTACCTTACCCCAAGGATGATGTGTGCAGGGGATCTTCGAGGAGGGAGGGACTCCTGCCAGGGAGACAGTGGAGGACCTCTCGTCTGTGAGCAGAACAATCGCTGGTACCTGGCAGGTGTCACCAGCTGGGGCACAGGCTGTGGCCAGAAAAACAAGCCTGGTGTGTACACCAAAGTGACAGAAGTACTTCCCTGGATTTATAGAAAGATGGAGAGTGAGGTACGCTTCCGGAAATCTTAACCATGCCCTTCTCACTTTGGTGATTGCTATGAAGATTCTGGCTAAAGGGACAGGCC\n>AY335457.1 Uncultured Sphingomonadaceae bacterium clone B101/6 16S ribosomal RNA gene, partial sequence 
\nCGTAACGCGTGGGAATCTGCCTTTAGGTTCGGAATAACTCCTCGAAAGGGGTGCTAATACCGGATGATGTCTTCGGACCAAAGATTTATCGCCTTTAGATGGGCCCGCGTTGGATTAGCTTGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCATAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAAGCCTGATCCAGCAATGCCGCGTGAGTGATGAAGCCTTAGGGTTGTAA\n>XR_002992789.1 PREDICTED: Selaginella moellendorffii uncharacterized LOC112347534 (LOC112347534), ncRNA \nGTGGCTCATAGGACGATGATTTGGAGTTGGATACAAAGTGACAATCAATGTGTTGGTGGTGGAATGGCTGTTGCTGTTCTTGCAGCTCCACTGTGCTCTGTCGTCTCTCGGAGACACTGCTGCCCTTTCTACTGCTCTGAGAGCCAGCACAGACGAACAAGGACTTCATTCTCCCCGCCCAGCCTGTAAAAGCTAAAGTTTGATCACAAAAACCATGCCACGAGTTTAATCAAAGACGAGTACATTGTGTTGGAGTGCTTCGCTCAAAGAAGATCTACTCGCGGTGTAAGCATAGAAGTGAAAGTACTTTGCGGACAAACTTAAACATCCTTTCAATCCATAGCTTTGCTTCTCAGGTGGAAGAAGTATAGAAGCTATTGGAGATCAAAAGTTCTTTACGGACACACTTAAAAAATTCTAACGAGAAGCTCCTCTCTTTGATTTGTGCTCTA\n>FJ727014.1 Uncultured bacterium clone A72h_1235 16S ribosomal RNA gene, partial sequence \nTTTGATGGCGACCGGCGCACGGGTGAGTAACACGTATCCAACCTGCCGATGACTCGGGGATAGCCTTTCGAAAGAAAGATTAATACCCGATGGCATAATAGAACCGCATGGTTTGATTATTAAAGAATTTCGGTTATCGATGGGGATGCGTTCCATTAGGCAGTTGGTGGGGTAACGGCCCACCAAACCTTCGATGGATAGGGGTTCTGAGAGGAAGGTCCCCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCATG\n>KY281550.1 Uncultured bacterium clone CP_Otu6690 16S ribosomal RNA gene, partial sequence \nTACGGAGGATGCAAGCGTTATCCGGATTCATTGGGTTTAAAGGGTGCGTAGGCGGAATGGTAAGTCAGGGGTGAAAGTTTGCGGCTCAACCGTAAAATTGCCTTTGATACTGTCATTCTTGAGTACATACGAGGTAGGCGGAATGTGGCGTGTAGCGGTGAAATGCTTAGATATGCCACAGAACACCGATTGCGAAGGCAGCTTACTAGACTGTAACTGACGCTGATGCACGAAAGCGTGGGGATCGAACAGG\n>XM_017287255.2 PREDICTED: Drosophila miranda peripheral plasma membrane protein CASK (LOC108156021), transcript variant X3, mRNA 
\nGTTAAGTCCGCGGTCACACTGGGTTCGTGTTTTTAGCAAAATTAGTGAGAAATAACAAATTAATTAAAGAATTAAGCGTTTCTATGTGTTGACGTCAACCCAGGCGCGATCTATGAATGCCGCTGCTGTGTAAAGTACTCCGTCGCTGAGGGGCAGGGCACACAAAATTTCGGTGCGAGGCTGCGAACAGGGCCACGAAATGTATCTTTAACATCAGCACCAACCAGCGAGGAAACGAAAAACAACAACAACTACCATAAGAAGAACAACCCACAAAGAGCCAAATTTTTAGTTAGTTTTTTTGTGTTTGCTTTTGGAGGGCAGTAGGCGAACAGGGCCAAAAAACATTGGACACGGAGTAACACGTACATCTAGGACCCAAAACCAAACCCGGAGCAGCCAGGGACAGGGGACAGGGGACAGGGGACCGTCCCACTCATCAATATTCGAAAAAGCAATTGAGACGCGAACCATCAGCAGGCATCAGCATCAATTCATCAATTATTCAAAATGACCGAAGACGAAATTCTCTTTGACGATGTCTACGAGCTGTGCGAGGTCATTGGCAAAGGACCCTTCTCCATTGTGCGACGATGTATACATAGGGAGTCCAGCCAGCAGTTTGCTGTTAAAATCGTTGATGTGGCCAAGTTCACAGCGAGTCCAGGACTGAGCACAGCGGATCTGAAGCGCGAGGCCACAATATGTCATATGCTGAAGCATCCACACATTGTCGAGCTGCTGGAGACCTACAGCTCCGAGGGCATGCTCTACATGGTGTTCGAGTTCATGGAAGGCTCCGACCTGTGCTTCGAGGTTGTGCGTCGCGCCGTTGCCGGTTTTGTCTACAGTGAGGCGGTGGCTTGCCATTACATGCGGCAGATACTGGAGGCGCTACGATATTGCCATGAGAACGATATACTGCACAGGGACGTGCGTCCCGCCTGTGCCCTGCTCGCCACCGTGGACAACTCGGCGCCAGTGAAGCTTGGTGGCTTCGGTTCGGCCATCCAGCTGCCGGGCACGAGGGAAACCATAGAAACACACGGACGCGTGGGCTGTCCGCACTATATGGCGCCGGAGGTTGTCACCAGGCGGCTGTACGGCAAGGGCTGCGATGTCTGGGGCGCTGGTGTAATGCTGCATGTCCTACTATCCGGCAGATTGCCCTTTCTGGGCTCCGGGGTGCGACTGCAGCAGTCGATAGCGCGTGGCAGGCTCTCGTTTGAGGCGCCTGAATGGAAATCAATTTCGGCTAATGCTAAGGATCTAGTCATGAAAATGCTGGCGGCCAATCCACATCACAGACTTTCCATCACCGAGGTGCTCGACCATCCGTGGATACGAGATCGGGACAAGCTACAGCGAACACATCTCGCAGAAACGGTGGAGGAATTGAAGCGCTACAATGCTCGGCGCAAGCTCAAGGGTGCCGTTCAGGCCATTGCCGGCGGCACCACCATGGATCCCGTTTATGTCACCGATGCGGACATGCCCATTGCTGGTGCACCCGACGAATGGGCCGACGAGGAGGCGGGCATCGAAGCGGTCCAGCGTATTCTGGACTGCCTGGACGATATCTATTCGCTGCAGGACGCGCATGTGGACGCGGATGTGATGCGGGATATGCTGCGGGACAGTCGCCTGCATCAGTTGCTGCAGCTCTTTGATCGCATCACCTCGACGGTTGTCACCAGCAACGGCCGGGCGCCGGCCGCAGAGGCGGTCACCCGCAGTCGGGATGTCCTGGAGTCGCTCTCGTCGACGGCCGGCAGTTCGGTGGCCAATAAGTATGCCAAGGATGAACTAATGCTGCTGCTGGCCGCCCCACACATGCAGGCCCTGCTCCATAGCCACGATGTGGTGGCCCGCGATGTGTACGGCGAGGAGGCGCTGCGCGTTACCCCGCCACCGATGGTGCCCTACCTCAATGGCGACGAGATGGACAATGTGGAGGGCGGCGAGCTGCAGCATGTGACCCGAGTGCGGCTGGTGCAG
TTCCAAAAGAACACGGACGAGCCGATGGGCATAACGCTGAAGATGACCGAGGATGGGCGCTGCATTGTGGCAAGGATTATGCACGGGGGTATGATACATCGACAGGCAACGCTGCATGTGGGCGACGAGATACGGGAGATCAATGGCCAGCCGGTGCAGCATCAGTCGGTGGGCCAATTGCAACGAATGCTGCGCGAGGCACGCGGTTCTGTTACCTTCAAGATAGTTCCTTCGTACCGTAGCGCTCCGCCACCCTGCGAGCTTTTCAGGATCAGACCCGCTCCGGTGCTTATTTTCGTGCGCGCACAATTTGATTATAATCCGCTGGATGATGAGCTTATACCCTGCGCCCAGGCGGGCATATCATTCCAAGTGGGCGACATACTTCAGATCATTAGCAAGGACGATCATCACTGGTGGCAGGCGAGACTGGACACGGTTGGCGGCTCGGCGGGCTTGATACCATCGCCGGAGCTGCAGGAGTGGCGCATTGCCTGCCAGACGGTCGACAAGACCAAGCAGGAGCAGGGAGAACCGGGTGCTGGATGTTCCGCTCACGCAGATGGGTGTGATGGATCAGCAGTAAACTGTTCGATATTCGGGCGCAAGAAGAAGCAGTGTCGCGACAAGTACTTGGCCAAGCATAATGCCATATTCGATAATCTAGATGTGGTCACATACGAGGAGGTTGTCAAGGTGCCAGTTGGTGATCCGAACTTTCAGCGCAAAACGTTGGTGCTACTGGGAGCCCATGGCGTGGGCAGGCGGCATATTAAGAACACCTTGATATCCAAGTATCCCGATAAGTACGCCTATCCCATACCACATACAACGAGACCTGCCAAGCCCGAGGAGGAGAGTGGACGCAGCTATTACTTTGTCTCGCACGACGAAATGATGGCGGATATCGCCGCCAATGAGTACTTGGAATATGGTACGCACGAGGATGCGATGTATGGCACCAAGCTGGACACTATCCGACGCATACACACAGACGGCAAGATGGCCATATTGGATGTGGAGCCGCAGGCACTGAAGATACTACGCACAGCCGAATTCACGCCCTATGTGGTCTTCATAGCGGCCCCCTCGCTGCAGAATATCGCCGATTACGATGGCAGCCTGGAGCGTCTGGCAAAGGAATCGGAAATGCTGCGTCAAATGTATGGCCATTTCTTTGATATGACGATTGTGAACAACGACATTAGCGATACGATTTCCGCGCTGGAAACGGCCATCGACCGGGTGCACACCACTCCCCAATGGGTGCCAGTCTCGTGGCTCTACTGACAAGACAGTGAACTGGAATGCCCCGATTGCCTCGAGGGTTGCGATTGCGAGTGGGATGCATATACACAGGCCTCCAATGTGGCGCTCTACTGAGTGCAATACCACAGTTACATCACACCTACTATACACCACAAACACCATTTAAGTATTACCAAGGCACAAAAATATACAACACAGCAACAGCAATAGTAGCAAAAGCAAAAGCAAAAGCAACCGAAACAGAAACAGAAAGACATGAAGACAGAATGCGCTTGGCGCCGAGATATATGTAGGTATGAGGATACAGGAGAGGGTATTGTGGGTAACTGCGGTCGCAACGTAAACACAAAATGTTAATTGTAAAACGAGCTGTATTTTGCCTTATACTTTGTTAAATCCTAAGTGATTAATTTTACATTGTATTTGCCATTCCAATGGGCTGCCCTCAAACAGGCAGCCTGTGTCATTATGTTTATTGTATTTATGATTGTTTGTTCTGTTAAAGTTTTTGTTTGTACCCGTTCTCGTACTCGTACTAGTATTTATTTTGTTTCTTTCTGTCAGACAGCATTAAACGCTTATGTTAATCTTGCACTTGTTAGTGTCTAAGTTAACTAAAACACAAACCGAAATCGAAACAGAAACAGAAACCGCAACTAAAAAACACTCTAAATTGTTTTAATCAAAGATTATTTCCATAAACACATACGAAAAAAAAAAAAATAAAAAAC
ACACCCAAAAAAATGAAGAAATAGAAATCCGAAGAATGTTTGAAGAAAACGAGTTAGTAAATTATAGCAACAAAAAACTACGTAATTAGTTATAATTAAACATAACAGCAAACCAGAATAAAAACCAACAAGAAGAGAAGTTCAGGAAAACGTTAAAAACAATATGAGATGAGAGCAATTTCAAGTGTTTCAAGCCCAAAAAAAAGTATAAAAAAGCAAATTAATTACATATGGAAGAGCAAATGGGGACAAGCGATCGTAAAGTGTACGTTTTAAATGCAATAAACATTAACAAAAGGACCCGTATAACATCACTTACACACGAAACAAACAAACAAAAAAATACACTAAAATATTACCAAGAAAGAAAACAAAAAAAAACCAAATTGTTGACGTTTAAATAAATTCAATGGGAAATGATTAATAATGCAATCATAAACGAGTTAATAATAATAAGAAGCAGGCGCGTTTAAATCAAGCAAAAGCAATTAAAGGACAAAACATTAAACCAACAAAAAAAACATAGAGTGAGCACAAAAACAACAAAAAGAAAACACATACTAACAGCAATTACAGCAAAGAAGTAAATCAAATAAGAATTAAACTATTTAGAGGCCAATGAGAACTGGTGGAAGAGTGCGCAAGGGGCACAACAGGACACGTATAAATATAGAAAGACACGCAGGAAAAAGAGAATGAATGAATGAAAGAAATGATTAGTACAGAAAATATGTGGTGTATGCAGAACATACAGACATATATAGGTATATTTTTCGAACAACTCAAAACTCAGGTTGGATACATTGAAAATCAGTCAAGTTCAATAAGATAAATATAGCGGAGCGCTTCCTTTTAACCCACAGCCAAAAAAAAAGCAAAACGAAAACCTTAACAAAACCCAATCGAAGTTTACAATGGATTAAACAGAATCGAATCGAAATGAATTGCAGTTTACCCACAAGCCACAAGTTACCACCCTAGCAGCAGCAGCTTCTGCAGAAATCTTTTCTAAATGCTTTACAAGTACAAAACATGTCTTTAGCAATCAGATTTTTAGCCCCAAAAAACCCCAGGCTCGCGCTCATTAGCTTTCTCCTCTTGCTCTCACCGAAGCTTATCCTGCTCCCGTTTGATTGGCAAAATCTTATCCAGGCTTGGGCTTGATTGCGCTTCTCCAGAGCAGGACCTAAGCTGAATCTAGACCTAACACTAAGGAGTGCACATGCAATCACAACAAAGAAACAAAAACTGGTTAGAATTGGAAAATGTGGTTGAACAAGCAAAAACCACTTACGATTAATATTAGACTAAAAAAAAACATTTGACATTTGACTTTGTAATTCCTACCACCTACAACCCTCCAGCCCCACAAGCACCTCACTCCTCACTCCATTTAAGCCAGAGCTTAGTTCAAGCCTAACCACAGAACCCACATCGATTTCCACACACACACACACAAATGAACTACCAGAACAATTCTATGGTTTCAAAACGGTTGAACAATTTTTGCATAGAGAATTATTGTTGAACGCTGGGCTATGACTTTTTGGTTCGGAGCGTATGACAGAACAGACAGGCAGCAGGCAATGCAAATCATAGAAGTATCCCAATGAAAAACCTACCCGAAACTGAAGAACTAAACTACCTACCCACAACCAGATACAAAATAAAAGAAAAAACCGCAAAAAAAACAAGCAGCCGAGTGGCCAAATTAACTAAGTATTTTACCCTAAAAAAAAGAAAAAGTCAAAGAACAACCGGAAGTGGAAGTGTATGTATATGTTGCAGCTATCCCCCTCCCCCCCAACCTAGGCAGGGTGTGCCAGATAAAAAAAAGTCTAAGGAAAATTGCTCAAATCAAAAATCAAGTATTTTATGGTATAAAAACCGTGAGGAATGATCAGGATTAGAATGAAGGGGAAGTCGCGTGTAAGAGTTGGACATTCCAAGAATGAGCTAGAATTTCGAAGGGATTCGTTTCTTATTTTTAACTGATCCTT
TTTTCTTAGCTGATGCGAGCAAATTGTAGCTGTACACTAAGAATAATTTCACACTAAGATTAAGCGAAAATTTATTGTTGATATTACATAAAAAAAAGAAAAGAAATGGAAAACGGATATTGGAAAAAAACCAGAAGACTCATTGAAGCAAGCCAAATGGATTAGAATTTTTCTCTAATTTGATAAGTGGTAGACGATGATGAAGGAGCTAAGGATAATGAAGATGGTGACGAGTTGATAATGCTTATGATCTCCAAAAGTCAATATGTGTAGGATTGACACGATTTGAGCAAATTGAGTGAATTGTTATTAAAATAATAAATGAAATGAGTGGCTCAATGGATCGATATCGATCCATTGATGCTGAAATAGGTCAAGACGTTAGAAAATATCATTTAAAGTAAATGATACAAATGTCATAATATATACATAGTTTAAAATGAAAATAATAATAACAAAATCAGAAGAAAAATGGGAAAAAATGGGAATAATGCGAATTAAAAACAGAAACAGAAAAAAAGAAAAACAAAAACAACCAGTAAACACTGAAATACCGAATTTTAAATACATAAGTTTTGAATCATGCATGCCGCAAAGACAAAGAAAACCCAACACAGAAAAAGAAATTAATAAAAAGAA\n>XM_006681305.1 Batrachochytrium dendrobatidis JAM81 uncharacterized protein (BATDEDRAFT_27075), partial mRNA \nATGCAAGTTTGCAACACTCGCTTGACTCGTTTGGCTCGGATTCTGGTTGATATTTACGATATCGATGCAAAGTTACATTCCAGAATGAACGTGCATAATCTGATGTGGTCAATCGTTTGGTTTCATTGTTATCGGTCATTGACACCAGTGATTGCATTGATTGCAAATAGTAGTCCAAGACTGACAAGTGTGTCTGAATTGATGACAGATGATACAGTCTATCCAACAAAAAGTAATACATTGATCGTGTCTGTGTGGCCAAGTGTAGATAGGTCAATAGGAGTAAAAGTATTTCCCACTGGGGTTGTAAAAGAGCCGCCAACAGATGCAAGTACCAAAAAAAGTGCCTTGAGTTGGGGCAACAACAGACTTGACTCTTACGACACTGACCAACTCTCACTCTCGTTGACTGATGGTGGAAAAGCTTTGCAACCATACGGCCCAGTTCCAGCATCAGTTAAAGAGAGTAAGATTTGGTCAGTGTCGTAA\n>XR_006867874.1 PREDICTED: Ischnura elegans uncharacterized LOC124171616 (LOC124171616), ncRNA 
\nTCCCTAAATCCGCCAATGGTTATTAATCTCCTTTATATTGCCTCAAAATAACTACGAAGTTGAGTCGTTGCAACCCGCCATTTTAATTGCATCATAGGTAAATGGCCGGTTATGTAGTAGCATAGGCGGAACATCAAACGGGTGCCGGTTTTTCCTTTTTGTAATTGATTAATTTGGGATATGTGCGGTTTTTCTGCAACTAACTGTTCTAATAACTGCAGGAATGAGTTCCGTGTTTTTTCCGTAACCTTAAGAAAAAGGCGACATGACTACAAATGTGCCGGAGGAATCATTGGCAACGAACACCATATTCCACAATTTGTGAGATTCATGCCTGTTGCATCATGCTTTGCTGAATTGATGGCCAAATAATGGAACGACTCCTATGACGTCAAGAGACAATTTTTTCATTGCATGTCCAAATAACCTAAGCAGCAGAAGCATCCAGTAATCTTGTACTGCTCTGGTATTTTGGTGTCACCATCTATTTTGCTTGAGGAGAGAATTTATCTGGAGCAGTGTAATTCGGATTATCTACTGATGAGCTTCTCATGAGTGTTTGACGTTCTACACAGCTAGTTATGAGAAAGTCACACCTGTTAGTGTCTACTGTGATTGTTATTTTTATAGAAGAGTAATTTTTTACTTGATTACCTCTGAAATTTCCCATTATTAAATGTAGTAATTCAAAGTTATGGTTACAATGTTGTGTCCTTTCCATCAAATTTTAT\n>XM_008649455.4 PREDICTED: Zea mays evolutionarily conserved C-terminal region 5 (LOC100502368), transcript variant X2, mRNA \nAGAAATCCCATCGTACGCGACTTCGTATTGGTAAAAGCCTTTGAGTTTGATACCCATGACATCTCTAATCGCTCTCATCAAATCACGATTCACATAAAAAAGGTGTGGGAGCCCGATCCGATCGCCAGATCCGCCGGCCTGTGCGCCGACTCGGGCGTCCTTCCACAGATCCTCTTCCTTCTATCGTAGGCTCGCCCTCGCCGCTCGCTGGAGCGGAGGTCTCTCCCTGCAGCCCATACTCCTTGATTCATTCTATTGCCTCGCCGCCGGCTCTATGGATAAGCAGGAGCCAGTAGCCAATGGTGAACAAACGATAGGTCTTGCTGAGAAGCCGAAGGAGCTGCCTGTTGCCAGTAAGGATGAGAAAGCAACTGTGCCCCCGATTTTAGTTGATTCAAATGCTTTCAATCTACCAAGTGAAGGCCAAACCCAAGCTGGCACATCTAACATGGATGGGGGCCATAATGGTGCACACAACTTTTATGCTTCTCAGGCACAACCATTCTATTACCAAGGCTCCGGTTCTGAAAACCCTACACAAGCATGGGATACATATCCTCCCTACATGAGTGTTGAAGGATTGGAAGTGGGTCCACCAGTTGTATACAATGAGGACCCCTCATTGATGTTCCATGGTGGCTATGGTTACGACCCATATTATTCTCCTATTGCAACACCTGTACCAAATGCTGTTAGTGGAGGTGGTCAGCTCTACTCCCCTCAGCAGTTCTTCTCGGCTCCTTACTACCAGCAGTCAGTACCACCTGACATGCAATATTTAAGCTCTCCTACTCCAATATCACAGGGTGATACAATAATGCCGATTGACCCAACACAAGGAGCTTTTATCGCTGATACCCTGAGTCCAAACAGCTTCCTGTTTGGCCCAAGACCTGAATGGTTCAGATCTTCAGAAGGAACTGGGTCATTTCCATCACCTGCAGCTTCACCTCAACCTTCTAGGGGTGTTCCAGGGTCCTATGACCAAAACAACTTTCCAATGGCTTCAAGAATGTCATCACCTCACCAGAAGCCCTTCTATGGTTTGAGATCCACAACTGACTCCTATGGAAGGGGTTTTTCTCATGGTGGAATGTTCCCACAGGCCAGTAATTATGGGGGATCCGTCACCAGCTTT
GGCCTTAATGGTAGAAGTTTGATCTCAACCGAGAAAGGGCGCAGGAGGGGAAGGGGCAATGCACTTATTTGCAGCTGCAATGGTCCTCTTGACTTTCTTAATGAGCAAAGTCGGGGTCCACGTGCAACTAAGCCTAAGAAGCAACCAGAGGTTGACAGTAAGGATGAGGTGCCTACTACAGGAGTTGGTCGTGAGTTATACAACAAGCCTGACTTTGTTATGGAGTACACGAATGCGAGGTTTTTCATCATAAAATCGTACAGCGAAGATAATGTGCACAAGAGTGTCAAATATGGTGTTTGGGCTAGCACCACAAATGGAAACAAGAAACTGGACTCAGCCTATCGCGAAGCTAAGGAGAAAGGAGAGCACTGTCCCATTTTCCTGTTATTTTCGGTGAATGCCAGTGCACAATTCTGTGGTGTTGCTGAGATGATTGGACCAGTGGACTTTGAGAAAAGTGTGGATTACTGGCAGCAAGATAAGTGGACTGGTCAATTCCCTGTGAAGTGGCACATAGTGAAGGATGTTCCCAATAATCTTTTCCGACATATAATTCTTGAAAACAACGACAATAAACCTGTAACAAACAGCAGAGATACACAGGAGGTGAAACTAGAGCAAGGAATGGAGATGCTGAAGATCTTTAAGAACCATGATGATGATGCATCAATCCTTGACGACTTTGAGTTTTACGAGGAGCGTGAGAAAGCGCTGCAGGAAAATAAGGCACGCCTGCATCAGCAACATCTACCCAGTTCTATTGTTATTGAGCCCAAGAAACCCTTGACTGCACCCAGTGACCTCGTGGGCCATATCACCAAGAGTTTTGCTGAGGCTGTGCGGCTTGGTGAGGCCAAGACTGTAAGCCATTTGACTGAGAAGGTTTCTGGGGGTGATCCGTCTATTCCTGTGAAGCATGTTGAAGTTAAGCAGAGTGGTTTATCTTAGGAACTCTTGATCGATGTGAATGAACTGTACCAAAAATTCACCCATACGCTTCCTGATCAAAATGTCGGGAATGCATATGCAGATGGATGATGATGAAACCCAAGACATCGGCAAAAGCATGCATGCACACTAGGGTAGGTCTTTGCCAACCTTGGAAGCATAGTTTCTTGAATAGTTTCTCTCTTTTTTTCTTCTTTCTTCCTAGTATTTTCTCCCCTTCTCTTCGCATCATATGATGATTCCTTAGTGTCTAGCCTCAAGGAGAGTTGCTGTTTTTGTGTAAGCCTCTGTAAGTTTCCTGTTCCATCACATATGAGTAAGGCCTTTTTGTTTCTTTTTATTTAAGTAAAAGATCCATCTTTTATGTACTGTCGTGGCAGTTTTATTATACTATGTCTGAACAAGGCCTATTCACTATGTAAGCAAAACATAAACGCTATCCAGGTGACCTGGTTGTGATGACTACAGTAATAAGTAACTGAATAATTTTTTATGTT\n>XM_312219.5 Anopheles gambiae str. 
PEST AGAP002709-RA (AgaP_AGAP002709), partial mRNA \nATGGATTATAATTATGATACCGACGAAGCGTGGTACGCGGCCAGCCTGGGCGCCGGGCCCTGTACCGACGTGTCAACGCTGAGCGTGGCGCCGCTCTGCTCTAGTCTGAATCGGTACGGCACGCTGCCGAGCACGGTGCCGATGCCGACGCTGTACGCTTCCGAGGGCCAGCGCAAGCCGAAGCTTTCCATCATCGAGCTCGTGCTGTACAACATGGCCTCGATGCTGGCCAGCATTGCTTCCGGGTACGATGTGCGTGTGTCGAACGTAACGCCGCTCCATCCGCGGCTACACCCGGGACCGTTGCAATCGTACGAATCGTACTCCCAGCCCGTGAGTCCGTACCACCACCATCGGCACCAGCTGCCGCCAATGGTAGACCCACATGCGCTGCAGCTCGAAGGTATGGTACGGTTGGACGGGATGCCGCCATCTTTAACAACCGCGCCACACACGGTGGACAACGCTCTGAGCCAGGAGGCGTACGAGGAGGAGCTGGCTCACCAAGCTCAGGATGATAGACTTTACGCACAACACAGCACACCGTACCAGGAGACGCCGGAGAGACAGCGGCCGAGGAAGGTGCATACTCAATCGACCAGCCCAAGACAAGACGAGCGGGCGCTGAAGTACACGGACTCACCGCAACACTATCTACCATCGACGATGTCGACGACGAGCGGGCTCGGCTCGAACTACACGCCCTCGGGACCCAGCTCGTCCTTCAGCGTGGGAGCGGGAACGCAACCGCCAACGCCTTCGCCCCGCCGAAAGTCTAGCGCCGCGTCGTTCATGGATTTTGGCGATCTGCCGGAAGAGCGCGAAAGTAGAGCGGGCCTCTACATACCGGGCGAGTACGACGGGTACACGCAGCACAATCCAATCTTTAACGCGGGTACGCGCGGTGCCACTAGTAGCTACATCGGATCCCATTATTTCCCCTACCGGCCGGCGATAAACTTTGCGTTCGAGCGGGAAACGAAATCGTACGGCGGGGAACCGGTGTACGAAGACCATCACTACGACAGTGCCTCGTACCATGATTACGCGTACGAAGGTCCCGCCGGGGGACCGTCGGGAACGGCCAGCGCTAGAGCAACGGGTACGCGCGTCCCAACGATGGGCATCAGTGCGGCGGGCCATCGCCGGACGCACTCCAGCATTTCCAGCACGCTGCACAGTAGCAACGTTAACCAAGGGTTTCACATGGAGGGCGAAGAGATGGACGGTGCCGGAACACGCCTGATTGATGACGTGACGTACAAGCTGGGCGATCTCTACCTGCCCGGGGGCGGTACGGATGCGGCTAGCCGCTTACCGGCACCGAGCACCGCGAAGCTGCACGAATCTCCCCTGCCTGCTGCCTTTCATGCGTCGAGCCGAATGCATCAGTACGAGAACGTGCCCAACTTCTTCCGGCGGCAATCGAGCCTGCAGCAGGCGCACTACTCCCCCAGCAGTGCGCACAGTGGACATCTGTCCGGCGATTTTATGTCCGGTGGTGCAATCCCGGAGCCGGAGGAGCGTCCGTACACGGTGCTGGGGCTGACGGAGCACGGTGCCGACGGTGGATTGCTGTCCAGCAGCTTAAGACCCCAAACGAAGCTGCGCTCCAGCATGAAGAAGTACACGCACTCACATCCGACGCATCAGCAGGCCACCGCGTCAGCTGGCGGGCAGGGTAAGTACGGGGCGGGCTACGGTATGCACGGGACGACCAGCGCCACGAACCAAACACCGCCCGACAGTCTCACCAGCGACGACAGCTCGTACCTGAGCGCGAAGGACAACTCGTCCTCGATTTCCTCGCAAAGCCGGGTGCGCTTTACGCCGGAAATTGTGCTCGACGTGGACTCGCCGCTCCAGTCGCCGACGTGCTACACGGGCGGAGCTGCTGCGGCGGCTGCCCCGTCCGGCCATGGCTTAAAGGACAGACGCAGCTCCTCC
TCCGGCAGCACGATGCTAACGGCAACGCCCGGTTCGGGCACGTCCTCGACGTCGATTTCGGGCCGGCGGTCGAATGCCTGCGACACGAGCCAATCCTAG\n>XM_025275219.3 PREDICTED: Bubalus bubalis NPR3 like, GATOR1 complex subunit (NPRL3), transcript variant X9, mRNA \nTTGCCTCATACAGTCGCGAAGTCTCGCGAGCCTCTTGCGAGTGTGGGGTGTGGGACGGGCCCGTGGGCTCGGTGGGTCTGGCTCCGCTCGGCCCCCCCGCCTCCAGCCGGTCCTCCTCAGGGCGGTGGGTCCCGGGTCCTCAGCTCTCCCCCGGGCAGCTCCTCCTCAGAGCCCCACCCGCCCCTCGCCCCCGACCCGTCCTCCTCAGGGCGCTGGGTCCCGGGTCCCGGCCCCTCCCCGGCCCGACGTCCTCGGGGCCCCCACCCAGGCCCCGGGCCGACCCCTCCCCGGGCTCCCGGCAGGATGGGGGACAACACCAGCCCCATCAGCGTGATTCTGGTGAGCTCGGGGAGCCGGGGCAATAAGCTGCTGTTCAGGTACCCTTTCCAGAGGAGCCAGGAGCATTCGGCGTCCCAGACGAGTAAGCCTCGTAGCAGATACGCTGTCAACAGTGCCGGAGAGCATGCTGAAGACCAGGATGGGGACCCCAGGTTTTCAGATGTCATTCTGGCAACAATTTTGGCAACCAAGTCTGAAATGTGTGGCCAGAAGTTTGAACTGAAGATCGACAACGTGCGGTTTGTTGGGCACCCGACGCTGCTGCAGCACACGCTGGGCCAGGTCTCCAAAACTGACCCGTCCCCGAAGAGGGAGGCTCCCACCATGATTCTTTTCAATGTGGTGTTTGCACTGAGGGCCCACGCGGACCCGTCGGTGATCAGCTGTCTGCACACCCTCTCCCGCCGCATCGCCACCGTGCTGCAGCATGAGGAGCGCCGCTGCCAGTACCTCACGCGGGAGGCCAAGCTGATCCTGGCGCTGCAGGACGAGGTGTCCGCCACGGCTGACGCAAATGATGGGCCTCAGTCCCCATTCCACCACATCCTGCCCAAGTGCAAGCTGGCCAGGGACCTCAAGGACGCTTATGACAGCTTGTGCACGTCTGGGGTGGTGCGGCTCCACGTCAACAGCTGGCTGGAGGTGAGCTTCTGCCTGCCCCACAAGATCCATTACGCGGCCAGCAGCCTCATCCCGCCAGAGGCCATCGAGCGCAGCCTGAAGGCTATCCGCCCGTACCATGCCCTGCTGCTGCTCAGCGATGAGAAGTCCCTGCTGGGTGAGCTCCCGCTTGACTGCTCCCCAGCCCTGGTACGCGTGATCAAGACCACGTCCGCTGTGAAGAACCTGCAGCAGCTGGCCCAGGACGCAGACCTGGCTTTGCTGCAGGTTTTCCAGCTTGCGGCCCACCTGGTGTACTGGGGCAAGGCCATCATCATCTACCCGCTGTGTGAAAACAACGTCTACATGCTGTCTCCCAACGCCAGCGTGTGTCTGTATTCCCCGCTTGCCGAGCAGTTCTCACGCCAGTTTCCATCTCACGACCTGCCGTCTGTCCTTGCCAAGTTCTCCTTGCCTGTCTCCTTGTCAGAATTCAGGAACCCCCTGGCCCCCCCTGTTCAGGAGACGCAGCTCATCCAGATGGTGGTGTGGATGCTGCAGCGCCGGCTCCTGGTGCAGCTGCACACCTACGTCTGCCTGATGGCCTCGCCCAGCGAGGACGAGCCCCGCACCCGCGAGGACGACGCGCCCCTGGCCACCAGGGTGGGCGGCCGCAGCCTCAGCACGCCCAATGCCCTCAGCTTTGGCTCCCCAAGTAGGACTTCCTGCCCCTGGGCATCTGTCTGGAGGGGGCCAGCAGCGATGACATGACCCTCACCAGCCCCAGCATGGACAACTCCAGCGCTGAGCTGCTCC\n>XM_017686507.2 
PREDICTED: Pygocentrus nattereri complement C1q-like protein 3 (LOC108413828), transcript variant X2, mRNA \nAGCAGGCAGAGAGAAAGCAGCTGACCTCCTCAGTGGTCTCCTGTGACAGCAGACGTTGAAGATGTTTGGGCTGGAGGTGTTTCTCCTGATCTTCCTGTGGAGCACACAGGCTCAGGACGTGCTGACCCCCAGTGTGGACATTATCAGGGAACTGGACAAGCTCAGAGCTCTGGAGCGAAGAATGAAGGCCATGGAGGCTGAAATGGCTGAGCTGAAGATGATGAACGAAGGACTTTCCAGGAGCCTGGGGATCATTACGAAGACCATCACAGATCAGCCCAAAGTGGCGTTCTCCGCTACGCTGTCCAACCTGCAAGATGGTTTTAAGTTCCTGGGCCCGTTCCAGAACACGGTCACCCTGGTGTACGAGAATGCCTTCACAAACATTGGCTATGCCTACGATCCACAAACAGGAATCTTCACGGCTCCCCTGGGGGGAGTGTATTATTTCAGCTTTTCACTCTTCCACCCGGTCGGACCTGGTCCTCAGGCCAAGACCGGGGCGTCCTTGGTGAAAAACGGGGTGCTGGTGGTGGCTGCCACAGATAACGCCCCGGGGGCGGATTCTGAGGACACTTCTGGAAACTCCGCCTCCATCCGGCTGGAGGAAGGAGATCAGGTGTACGTGCAGCTTTGGGAGAAGCACAGGGTCTACACAGACGGAAACAAGCGCAACACCTTCAGTGGGCATCTGCTCTTCCCAGTGTGAATCTCACCTCACTTGGCTGTGGACGCCTTCAGCTGATGCTCTAATGCTGGGCGCCTAAAGTTGTAGCGTTGTAGTTCAGGTTAATTCAAATGTACTATTAGTAGAGCTTCTATGAAATAAAACAGTATGACTTCAGTTTACTTCTTATGTACTACACCGCTTCCAAAAAAGCTGTGACGTTCTGCAGAATGTAAATAAAAACAGGATGGTCTGCAAA\n>XM_029369271.1 Trypanosoma conorhini pre-rRNA-processing protein TSR3 (Tco025E_02343), partial mRNA 
\nATGGGAAAGCCAAAAGGCCACCCCAACAGAGAGGTGGGGCAGCGCAGCAGGAAAAGTGCGCCCCGAGGTGGACCTCGCGGCCATGCGCCGTGCAACAACCCTTGTAGTGTGCCGCTGGCGATGTGGGACTTTGAGCAGTGCGACCCCGACGCCTGCTCGGGTCGGCGCTTGTATCGGCACAATGCATTGCGCCTTTTAAAGCTGCGGGAACCCTTTCATGGGGTCGTTCTCACACCAACAGCCACAGAGGTTGTGAGCCCTGCCGATGCGGACCTCGTTGCCCGCTCCGGTGCCGCAGTGGTGGACTGTTCGTGGAAGCAACTGCATGCGGTGCCGTGGCGGCAGATGAAGATGGGTGCCCCACGTCTGTTGCCGCTTTTAATGGCCGCAAATCCCGTCAACTACGGTCGGCCGTCAAAGCTGAACTGTGCCGAGGCACTGGCAGGGGCTCTCGCCGTTGTTGGCCGCATGGAGGACGCGAGGTCCGTCTTGTCGTACTTTTCCTGGGGAGAAAGTTTTTTTGACGTTAATGCGGAGCTCTTGGAGGGCTACAGCGGGTGCGCCAACGCGGCAGACGTGGTGGCTTTTCAGGAGCAGTACGTGGCAACTGAGGTGAGCAAAAGTGCGGCACGGCGGGAGATTGACTTGAATAGTATGGATCTGATGGATGCGGGTCCGCTAAACCTTAAACGAGGCAAACTAAGGAGTCGGCATACATGGCAGAAAGACGATGACAACGAGGAAGAGGAAGAGGAAGAGGAAGAAGGGGAGGAGGAAGAGGAAGAGGAAGAAGAGGAAGAAATAAAAAAGGATGCTGAAAAAAAGGAGGTTCAGTTAGGGAAATTGGAGACGTCAGGTGATGGGGGGAGTCTGCGTTCTTAG\n>XM_037232021.1 PREDICTED: Pollicipes pollicipes tyrosine-protein phosphatase 99A-like (LOC119108450), mRNA \nGGCGGGCGCGTGGTGTGTATGCGCGCCGGGCCCAGCGACTGCGGCAGGGGCACGTACACCAGAACCACCCTGCGCGGTTGGTAGATGAGCCGGCTCCAGGAGGTAGACGTGCGGCCGGTCGGGTAGACACGTTTTGAGCGTGTCTGCGGTGTTTAATCACTACTGTGAGTGACGAAGACTTTCTGTGTGACAGTCGTGCCATCTGGTGTCACACCAGTCAGAACCATGTTGAGAAGACGGGCTTTGGCAGTGACAGTCGTGCTCCTCGTTCAAGGCTGCTGCGGGGCGTTCGACACGCTCTTCTCGAGATCTAAAGCGAGCGTCATCCTGCCCTGCGACGGCATGACCGACCTTGACCCAGCCCAGGTCACCGAACTTGCCTGGCTCTGCTACGGCTGCATGGAGAGCATGATCGTGTCGGTGGACGCGGCGATCGAGACGAGGCTGCTGGAGTTCGTGGACGGCACGGCCACCGTGTTCCACAACCACGGCCGCATCAGCCTCCTGCCCGACACGCTCTCGCTCAAGTACGACCCGGTCGAAGTGAAGGACAGCGGCGAGTACCACTGCCAGGTCAACGGCCGCGAGCCCATCTCCGGCCTAATCAAGCTCGTCGTGCAGGATGTTCCTTCGGCACCCGGAAGGCCTCTCATCACCAACTTCACGTCTCGGTCAGTGTTTTTATCCTGGACTCCGGGCAGCAAGCAGAACAACAGCCCCATCAGACACTACATCATCCACGTCAAAACTGGCGAACATGGCGAGTGGAGCCAGCAGCCCATCTCCACGCCAGATAACCAGACATCGTTCGTGGTGGCAGACCTGCAGCCGTTCACCGCCTACAGCTTCAGGGTGACAGCCGTCAACGGCATCGGCGCCTCGCCAGACGGCATCGCCTCCTACCCCATCATCACGCTGAGAGAAGCCCCAGCCGGGAAGCCGGCGATCCTGGCGGCGCATAATACAAGCTCCACTTCGGTCCGGGTCCGCTGGAGGCCGCTGTC
CAAGGAGGAGCTGCGTGGAGAGTTTCAGTTCTACAGGATCACTTACCGGGAGCGGAGCAACGTCAGCAGCCGGATTCGAGAGCTTCGGATCAAGGATGAACGTGTTCAGAGCCACACCATCTCCGGGCTCCGTCCGTACACGCAGTACATCATCTCGATACAAGTGGAGAACCCGGCTGGCCTGGGTCCCAGCTCCACGGTCGTGGTCACCACGGACGAAGGAGTTCCCGAAGCGCCACGGCAAGTGTCTGTCGTGAACGTGACAGATACCACGGTCACCATCTCGTGGCTGGCTCCGAATCGCCCCAACGGCCTGATCGAGGGTTACCGTATCTACTTCACTACCGGCAACTTCACCAATGCCACTTGGCTCAAGCTGCCCGTGGATGACATGCAGTACACGCTGAAGAATCTAGAGCCCTTCTCCAACTACTCGATCGCGGTGAAGGCGTTCACGCGGAGCGTGGAGGGCCGCGAGTCGGCGGCGCTGGCCGTCACCACCGACGTGTCGGCGCCGGCCGCACCGCGGCTGACCTCGCTGGCATGTCAGCCGGACGCGGCCCTGCTGCTCGCCTGGCGACCGCCGGGCCGCGTCCGGGGCCGCATCGACTTCTACGTGGTCGGCTACCGGACCGGCCAGGCGACGGCGCTCACGGAGCTGCAGGTCACCGCCGACTCGGCAGAGCAGGAAAGCATGCTGCGCTTTCCTGCTGGCGCTGCTGGCCCTGGCCATCTGGAGGTGAGGTCACTGCTGGCCCTGGCCATCTGGAGGCGGTACTTCCAGTCGTCCTACTACTACAGCCTGGATGAGCCGGTGACGGCACGCGCGCCCGTGACCTCTGACCCGGGCTGGGAGCTGGACGGTCCGAACGGTTCGGCCGGCCCGATCCCTGCCGATGCCTTCCCGGTGCACGTGGCCAGCCTACACGCCGATTCGGACATCGGATTCTGCAAAGAGTATGATGAGGTGCTGGCGCACACAATGAAGTTGGAACTCTCTTCGAACGTGTCACAGACCGAGGAAAACAAGCAGAAAAATAGATACCAGAACATTGATGCCTACGACCACACCCTGGTGCCCCTGAGGCCCCTTCCGGGCCAGCGGCGGGGAGACTACATCAACGCCAACTACATCGACGGCTTTCTCGTGCGCAACCAGTACATCGGCGCCCAGGGCCCGCTGACCGGCACTTTTGCGGCCTTCTGGCGGCTCATCTGGGAGCAACGCATCCAGATCGTGGTCATGATCACTAACCTGGTGGAGCGGAACAGGAAAAAGTGTGACATGTACTGGCCGAAGGAGGGCACTCAAGTGTATGGAGTTATACAAGTGGAGCTTTTGGACCAGAAGGAGCTGTCGACCTATACGATAAGAAAAATGCTCATCAAACATACAAGGCACAAGAAGAAGAAGGGCGTGTGCAGTGAAAGGATCATATACCAGTACCACTACACCAGCTGGCCGGACCACGGCGTACCAGACCACCCGCTTCCGATCCTCAGCTTCGTCAGAAAATCGGCCGCTGCGAACGGCGCCGGCGCGGGACCCATTCTGGTCCACTGCAGTGCCGGGGTCGGAAGGACGGGCACCTACATCGTCCTCGACGCCATGATGCAGATGATGAAGCTCCGGGGCGCCATCAACGTGTTCGGCTTCCTCAAGTACATCCGCACGCAGCGCAACTTCCTGGTGCAGACTGAGGACCAGTACATATTCGTGCACGACGCGCTGTTAGAGGCCCTGGAGGCGGGCGAGACGGATGTGCGAGCCACGCGGCTCACCGAGTACCTGCACCAGCTGCGCTCCTACGACCCGAACCAGTACCCCCGCTACACGCTGGACCGCCAGTACCAGCTGGTGACATCATACCGGCCGACGGAGAATGACCTGGCAGGGGCCTTGGCTCCGTGCAACCAGGCGCGAAACCGGAGCGCCCAGTTTGTGCCGTTGGACCGGTGGCGGGTCCACCTCTCTCCCCGGCCGGGCGTCGAAGGCAGCG
ACTATATCAACGCCACTCCCCTGATAGGTTACGAGAAGCTGTGCGAGTTCATCATCACTCAGCACCCGCTGCCGCACACGGTGGACGACTTCTGGCGAATGGTGTGGGAGCAGAACGTGCAGACCGTGGTCGTCCTCTCGCCCATCGACGACCAGCATTACCCGCGCTTCTGGCCGTCGCCGGACGATGACATCGACGGCGACAGCTTTCGGGTGCGGTTCGTCGACGAGCCGGCGTCGGCGGCGTACGCCACCGTCGACCTGGTGCTGCAGTCGGCGCAGGACGACTACCAGGTCACGGTGCGCGTCATCTCGTGCGCCGCGTGGCCGCACGGTGCCGCCGCCTCGCCGCACCACCTGGTGGACGCCGTGCAGCAAGCCACGCTCCAGTACCAGAACGGACCGGCGGTGGTGGTGGACAGGTTCGGTGGAACTGAGGCGGCCACCTTCTGCTGCCTGACCACGCTGTCCAAGCAGCTGGTGAACGAGAACTCCCTAGACGTGTACCTGTACTCCAAGCTGTACCACATGAGGCGTCCAGGAGTCTGGCAGACCCAGGACGATTTCACCATGCTGTACCACGCCATGGAGGGATTGGTCCGCCCAATACTGCCCCACTCTCCCAGCAGCCAATCAGAAGCCGAAGCCCTTCTGCGTCCACCCAGCCTGCGCACGAGCACTATGAGGGTACCTCCCGACGGAAGAGAGTGCTATGTGCCTGCAGAGTGTGTCTGACGTTCTGTCAGAGACCGTACGTGACTGTCACAGCAGAGGGTGCTCCGAGCCCGCCGAGTGCCTCTGACTCTGTCAGAAGCCGTGCTCCGTTTTGAACTGCAGGGGGAACCACGCA\n>XR_005812777.1 PREDICTED: Oryza brachyantha uncharacterized LOC107305249 (LOC107305249), ncRNA \nGGAACTCACTAAAACCGCTCGCCGTTCGCTTCTACACCTGACAACCCCCGCCGTGCCTCTATCGACCCTCCCTCCTCCGCCTCGAGCCTCCGCCGCCGCTCAGCAGTTGCGGACCTCTCTCTCTCTCTCCCCGGTGCGAACCGGCCGTCACCGTCGGGAAGGATGGGGTGCGTGCCATGCCGGCACTCACCATCTCAGCATCCTAAGAACCGCAGTTTTGGGAGCTGGCCGAGTTCTTTCGGTATGTCACCAGAAAATTGGCAGCCAACAACGCTCCTGACATGCACAAGAAAAAGCTTTCAAGGTTACTCAAGGATCCAATGGTCGATGGAAGTGGACCGCTCAAGTTGTTGTAAGATAAGTCCCTGCAGATGATCTTAATAGATTTATCACAACCAAACAAGGTAAAAACTTTCACAGGTAGATTCAGCAACATTAAGGAAGAGTCCATGTTGCAGCTCTTGTTTATAACACTCAAAAGCTTTCTGTAAAATTGACAAACTTGTAGTACATACAGGTACTGTAGTTCTGACAATGACTGTACATCTCCTGAAAGTGACCCAGACAATCCAAAACTTGACAGCCTACTGTAAACCACAAGAAAAAAGACATCATTTAAATGAACATAGAAGAAACAGCATCTTGATTTAATGAAATATGTGTGTGTGTGAGAGAGAGAGAGAGAGTTGATTCAGATAAAATGGTTCTAACATCGAGGTGACACGATTCTGGATGCAGGATACTCCTGGCCATTTTTGTCCACAAGGATCATTTCCAACCCAATCCGATAGCTTGGACATGGCGTTATCCCAGGAAGCTGCTATGCCTTTGAGGGCAGAGGCTGTAAGGCAATGAGAGTGAAGAAACATCATCATGCAACAAAAGCTAGTTTTTACAGCAAATTAACTGGAAAACACAAGGAGGCTGATGAAACACTTACTATCTTGTGGATCTGTATCTGCTGATATGATGAGAGCACGGTGAATAATGATCAGGGAGACTAGCAGATGGATGATCCTCCAAGAAGTTGGAGGATGCGCCATGGTGAACT
TTATTTCAGGTTGCTGAGAAGCCCTTTCTTGTGTTACCAACTCTCCACTACTCAATTCTGAGCACTTGCAGTGACATGATGTTATGAAGGCTGAATATGCACATCAATTGTGAACTGGTCAATGGAATCAGTCAAGAATGTGGCTTTCATCTCCTCTCAATGGATTGCCTTTTCAAATTCATCCAATTAATGGTGAAGTCCCAGATTTTAAAAACCAAGAGAGAGCTCACAATGGGAGTCAACGGTGAGCTATTGGTTGGCAGGGAGCATGAAGTTCTCTCCTATGAAATAGGATCCGAATGATTCAAATTATTTTTACCATGTTTGAAGTATCATTCCAATTGAATATAAAATAATTGCTGCTCCTTCTAAGACACTTGAATGTTTATTGCATGCATATTATGTTTTGTTGAATAGTGTAGATTTTAGTTGTCGTATATTCATGGTGGGATTGACTTTAGAAAACTATTGGGACCATTTTGTTGTGTACATGTGCTGAATCTGAGGTTTATTCGAATGATTTGCTAAGAAATGGTCTGGTTTGAACACAAAACATCTGATATTTCTAGACATAT\n>XM_034077493.1 PREDICTED: Pseudochaenichthys georgianus non-SMC condensin II complex, subunit G2 (ncapg2), partial mRNA \nCGCGGGCTCTTATGGCAGACTGTCGTTCTGCGGCTGTCGGATCACAGCATTATTAATACAAAGGAATATTGGTGTTGTTTCACGTCTTTTGGAGAACCACAAACATGTCGAAGCGAGAGGCTTTTCTAGAGTCCTGCTGTACGGAGAATGTGGACGATTTCCTCCGCTTTATTCAGCTTAATCGGAACAAGACGGAGCCCTTCGATGTGGAGGAAGTTCTGCAGGAGATGAACAGAGACCAGAGGCAGACGCTGTGGGGGAAACTGTCCTCTCTCCTCCAGGACGTCCTGCAGGAGGAAAGGAGAGAGGAAGGGAGTGAGGAAAGGAGAGAGGAGGCCATGGAGGTGGAGGCAGCTGCAGACCCCAGTCACGTGAGGTCTGTCGTGGACGGTGTGACTCTGGTTGCTGCCGAGTCCCTAAAGGTCCTGCAGGACGGAGAAACCTACAGTTCTCTTCTGGAGATCATCCACAGGCTGCATGATATGTTGGAGCTGCAGCCGGTCTCCGAGGCTCCGCTGCAGCTCCAGATCCTCAGACTTTGTGACGCCTGGTGGAAGAAGGATCTGAAGGAGAAGGAAACGTTCGGTCGCAGCGCTATGATCATCGCTCTGACGAGGAGCTTCGACCTGAAGAAACCGGGCACAGAGATCCAGAGGGTGTGGAGTCTCCGGGAGGTTCTCCTGGGTCTGGATTACACGTCGGAAGACAACAAGCAGATGATGGATCTGCTGCTGAAGTGCTTCCAGCGCCCGGCCTTCCTCAGGAACGACGATGGAAAACGCTTCCTGGTGTTTCTCTTCAGCTGGAACATCAACTTCATCTCGGTCATTCACGGCACCATCAAGAACCAGCTGGAGTTCTTTAGCATGATGGTAACGGCTCACATCGCTGAGATCTACTTCAGAGCCTGGAAGAAAGCCGGCGGTGATTTCCTGGAGAAGATCGAGAGCTCCTGCGTTCAGGATCTAATGCAGAACGCCATCTTCCTCCACAGATCCTCTCCTGTGTACGCCAAAGTCCGAAAGATCGTGAGCTACTTCCACTCGAGGAAAGGCTGTGAGAAAGTGGACAAGATGCTCTCCAATCTCTACAAGCCCATTCTGTGGAAAGCTCTAAGTGCGCCAAACTTCGAGGTGCGAGCGAACGCCACGCTGCTTTTCACCGAAGCTTTCCCGGTGCTTGACGTGGAAACCGGCAACAAGAGCACGGACGAGGCCATTCAGAAGCAGCTGGACACGGTCATGGTGCTTCTGGACGATCCTCACCCCACAGTTCGCTCTAACGCCATCTTAGGAGTGTG
TAAGATCCTGGCTAAATACTGGGAGGTGCTTCCTGCCGCCATCATCACCGACTTCCTGAAGAAGCTTGTGATGGAGCTGGCGTTCGATTCGAGCTCTCCTGACGTCCGCTGCTCCGTCTTCAAGTGTCTCATCATCGTGCTGGACAACAGCCTCAGCCATCCCATCCTGGAGAAGCTGCTCCCGACTCTGAAATACAGTTTGCACGACAACTCGGAGAAAGTCCGCATCGCTTTCCTCGACATGCTCATTAAAGTGAAGGCTGTGCGAGCTGCTAAGTTCTGGTCCGTGTGCAGCATGGATCATCTTCTCGCTCGCCTCGCCATCGACTCGTTATCCGCGTCGAAGCGCATCGTGGATCTACTTTTCAAGTCCTTCTTCCCCGTGAACGAGTCGGATAAGGAGTGGTGCAGCCGCTGCATCACGCTCATCCAGATGAACCCCGCCGCCGCCAGGAAGTTCTACACACACACACACAAACACACCGCGCCCACCAACATCATAAAGCTGATGTTGGCGATTCGCCGCGTTCTGAACTCTTGCCTCCAGGCCCAAGGTGACCTGTCTGAGATCAACGACACCAACAAGGAGAACAGCGCA\n>XM_013920937.2 PREDICTED: Limulus polyphemus tyrosine-protein kinase Abl-like (LOC106461142), mRNA \nAGCGGCCCCTATGGACGGCGTAGAGGCTTGCTTTGAGAGTGTTCGGTCATTCGTTTCAGAGGTTTTTCAATATGGCTACTAATGAAATTGTTAGTGATTAAATTATTGATAGTCACAACTTGCTAACATGCTTGTACTTTTTATAATTGGCATATTTACGTAGTTTATCAATAATGCTATTAAAGGTCTCCTAAATAAAAGTTATGTTCTGAAAATATACTGCATAGTAAGGATCCCGAATAGCCTGAAGGTCGTTTTGACGTTAGGCTATGGGAGCCCAGCAGGGCAAGGAAAACCGTGGAAGTGGATCTTCGGTTGGCAGTGGACATGGTGGAAAGACTGGGAAGAGCTTTAAAAATAGATCTAAGGACTCTAGATTATCATCAGTTTCTGGAAATATATTTACAGAACACAATGAAGCCCTGATGCAAAGCAGGCCTTTGCCAGATATTCCTGACTTTGGAGATCATATTAGCAACTTATCCATCCCTAATGATGGGTCATCCCGGTGGATGTCCAAGGAGAATCTCCTGGCTCCTGAAGACTCTGATCCCCAATTGTTTGTAGCACTCTATGATTTCCAATCTGGTGGAGATAACCAACTTTCTCTCAAGAAAGGGGACCAAGTACGAGTGCTATCATACAATAGAACAGGTGAGTGGTGTGAGGCACAGTCACGTTCAGGTCAAGTTGGTTGGGTCCCTAGCAACTACATCACTCCTGTCAACAGTTTGGAGAAACACTCCTGGTACCATGGGCCCATCTCTAGAAATGCAGCAGAGTACCTACTAAGCAGTGGGATCAATGGGAGTTTTTTAGTCAGAGAAAGTGAAAGTATTCCTGGTCAAAGGTCAATATCTCTCCGTCATGATGGACGAGTATACCACTATCGAATTAATGAAGATGGCGAGGGTAAAGTGTATGTGACGTCTGAATGTCGATTCAATACTTTGGCTGAACTTGTCCATCATCACTCCATGCATGCCGATGGTTTGATCACCATGTTACTCTATCCAGCTCCTAAGAGAAACAAGCCTGCTGTATTTGCTCTTAGTCCAGAACCAGATGAATGGGAAGTGGACAGGACTGGTATTGTCATGAAACACAAACTTGGAGGAGGACAGTACGGAGACGTTTATGAAGCTGTCTGGAAGAGGCATAACATGACAGTAGCTGTTAAAACACTGAAAGAAGATACAATGGCCTTAAAGGATTTTCTAGAGGAAGCAGCTATTATGAAAGAAATGAAACATCCAAACTTGGTCCAGCTAATTGGTGTTTGTACAAGAGAACCACCA
TTTTACATAATCACAGAGTTCATGCCCCATGGAAACTTGCTGGATTTTCTCAGGAACGCCGTTCGCGATGATATCACGGCCGTGGTGCTAATGTACATGGCTACACAGATAGCTTCAGCAATGGCTTATCTAGAATCCCGTAGTTTCATACATAGGGACCTAGCAGCAAGAAATTGTTTGGTGGGAGAAAATCATCTCGTAAAAGTTGCTGATTTTGGTCTAGCTCGACTGATGAGAGATGACACTTATACTGCACATGCTGGGGCCAAGTTTCCAATTAAGTGGACTGCTCCTGAAGGCCTTGCTTATAATAAGTTTTCTACCAAGTCTGATGTTTGGGCTTTTGGCATCTTACTGTGGGAGCTGGCCACATATGGAATGTCTCCTTACCCTGGGGTTGAGCTAACAGACGTTTATCATATGCTGGAGACTGGCTACCGAATGGAGTGCCCACCGGGATGTCCACCAAAGGTTTATGAACTAATGAGACAGTGCTGGTTGTGGGAGCCTCTTGATAGGCCTACTTTTAAAGATGCTCACCACACTTTAGAAACTATGTTCCAGAATTCAAGCATAACAGAAGAAGTGGAGAAGCAGCTAGAAAGGCAGACTCCTGCACCGTACAGGTCCTATGGAGAGAGTTCGCCAAATATTTTTCAGCGTGATGAAGAAGGAGATTATCCACTAACTGAACAAGGTTGTCATAGTGGAGGTTCAACCAAACACCAGACCATTATCTCCACTAGATCTACTTTGGTTCAACTTCGAAGACATGGCCCTCGAAGTAAACAGGCACCTGTACCACCAAAGAGGACCAGCACTTTTCGGGATAGTGTCTATCAAGACAAAATGTATGGAACAATCGGACAGGAAACTAATAAAAATATTCTCAATAATGGTGGTGAGAGAGCCTTTGAGACTAGTAACAGGAAAGCTCAGGAGATGAACAGCAATGAAGAAGGGGAATGTGAAATAAGAGAGAGAACTCCTGATACTGAGGAATCTGATACTCATACAGCAGCTTCAGTTGCTAGTGTTCCAGCAATGTCGCTAAACCAGCAACATTCTCAGCAAAAATTGAAAAAAGCAAGGACCTACCCTCCTAATATTCAGCAACATAATAATACAAAAGAAAACAGTTCTTCAAATAAAGCAAGAGAACCCAAGAAAGTACAAGTTGCAGCTCTAGAAGTTCAAAATGTGAAACGAGCCATTAATCGATATGGGACACTTCCCAAGGGAGCAAGAATTGGTGCATATTTAGATTCACTCAGGGAGCATGGTCTCCATACTGGAGCTAAGTATCCTGAGCCTGTTGTTGAAAGTGAACCACAAGCTTTTAGTGACATAGGATGGGAAAGTGCAGCTTTAGATCCACTTTCCCAGAAACAGAATTTTAGCAACATAAATAATACTCATAAAGGAGAAACTGGAAGCCATTTCTCTTCTAGATATCCTCCTCCAAGTCGGCATAGACACGAATATGATGGGGTTCATCATTCACCTCATGCCTTTCTACAAAGGCAAAAGTCAGATCTCACGTACTCCAAGAACAATGACACATTTGAAACAGGATCTATTCCAGACTCTAGACACCTTAGTTCAAAGCCTATTCCATCTCCTAGACTTCCTAGAAGTCAGAGGGTGGATCGAAAATCCTCTCGTGATGGAAGAATTGAAGGACCACCTTGCATACCCCAGGAGATAAGAAATATTCACGATGTTGGTACTAACAGTGCTTCAAATGCTGGTGGTGAAACCAGTTTTCGAGATTATTCTGGTAGTAGTTACCCCCGGAATAATATTATTTCAGAATCCAGAAATGTTGATTCTCAGTCATTCTCATCTCCTTTTAGTTCTAATGTCTTTCGAAGGACACTCACTAAAAGACCAAAAGAAAGACCTCCAAGTCCTCCAAAGAGCCCACTTGTAAAAAGTGGTTCAATTGATGATCAGTTAGGATGGAAACCTGAGAGGATTTTTGATCAGAGTCCATCAGA
AAGTGCACACACTGTGACTCCACTAACTTGGAGTGCTAGTGTAGACAGCCCACTTCCTCCTGGAAAAGTCAAAGTCCCATCGGGGAGTCCAAAGTCATCATGGAATATTGTATCTCCCCCTCCACCACCTCCTTGCCCAGAAGGTTTTCCTCCTCCTCCTGATTTTGTAAAAGATTCTCTGGAATCTTGCTCTGAACAGCAGACTGTGATTGAAGTTAAAGCTCCTTTAGTTGCCAAGGCATCACATAATAATCAAACTGCCAAGAACCCAGCAGCTCAGCTAGTCTCAGAACTCTTTGAGAGTCTTAAAATGAAAGCCAGAAGAAGAGCTGTAGAGATGGGAGATGCTTCTTCTCAAACCACTGAAGAAGTAGGAAGCTCTGCAGAAATATCAAAAGATCAGTCAGCTGTTGCACTGTCTCCTAAAAAGCAAATTCCTTCTGTAGACTTACCTGTAAAATCTGAATCTGTAAATTGCTCTAAGTTAGGCTATCAACAAGGAAATGAGCTTTCCAAAAGAATCAGCTCAATATTTGAAGCCAGCTCAAATAGGGAAAAAACAACTGGAGAATCACAGTCACAGTTTTATGTGCCCAGCAATAGACTCAAAAAGAAGACTCAAGATAATATAGAAAAAAGTGTCAGTGGAGATCTTGGCCAAAAAAATTTAGTTATACCAAAACTCAAAAGCAAACCTCCTGATAGAGATTTGGTAGAAATCTGCCAACCAGATAGATGTGAAGAAGAAGAAAGAAGACATAGTTGTGGAAGTATAACAAGTTTGAAGAAAATCTGGGAGAAAGAGAGCTCAAAACAGGAGTCGGAGCTAAATGCTGATGGTTCATGCATTGACAGTCCAAAAGTTGTGGCACGTCGACCAGAATCACTGAAAATAGAAAGAACACAGACTTTGGAGCTTGGAGATGATACTTTTAAAAGTGGAAACTATGAAACTGAACCTGTACAGAAAGCATCGCCAACCTATGTTAAAGAAAGTACTACGTCAAAAGCATTGTCTCAAGCATCATTAATAGGTGAACAAACAGAAGAACTAACTAATCAAGAAGATCAACAGAGTCATTTAAAAACTTCCCCTCAAAATAAAGAAACAGGAGGACAGTTATCCCCAGCGATTCCTAAACCAGCAGTTCCATTGAAACCACCAGTAAAAGGATCTCGAGCTGTTTTGCCTCCAGGTACCAGACCCTCTAAAACAAGTAATAAGCCCCAGGTTTTTCCTCGAGGAGGTATAGGGGGGTCTCCATCATCGCAGGCTGATGACGAAACACACGATAGCATAAGCAGCAAAGAAACTATATTGGAAATTTCTACAGCACTTGAAAATAGTATTCAGTTACTGAAAACAGCTACATCTCTAAGCAGTGGAAACGTAATGCAGCTGTCGGATAAAGTGCAACTTTTTCGAACTTCTTGTGGCAACTATGCAGAAAGTATCCCTCCACATGGGAGATTTCGCTTTCGAGAATTGTTAACAAAGTTAGAACGACAGGGTGAACAGTTGCGCACATGTAGCAGTAATAACAGTGCGTTCAGTTCCAGACTTTTTGAAGAATTACAAAACACGGTGAGGGACTTGGTAAATATGGTCCAGAGGTGAGCAGTGTGGTCAATATGTATAAAAACGTATATCAACTCTCATTTATATATCATGATATGTGTATGATTAGTTTCTTGATTTACTCATGAATTCCAGCATAAGAAAGTGGGATACATGGTCATCTAGTCGTAACTTTTGCTCATTAGTGAAATGGTGGTGAGAAAAGCTGACAAACTTACTTATAGTTACTACAACTTCAGCTGAGAACTGTCGTATGTACGCTTTAAATTTGTGATTTACACATTGTCCATGAGAACCAGCCTAAAAGATCTCTACTACGTGAATTAGATCCCTTAAAGTGCTTTTGAGAATGGAGTTCAACTAATACTTGTCATGTTAACACAGGTGTCATTTTTATCCTTAGAAAATAGTATTGTAAAGA
TATATTGATAATCCAGGAGAAGTGTAAGATACAAAATGTCGGGTATTTAATAAAAGTAGAGAGCAAAGCTATACAATTATTCATTCAGGGTTTGGTACAATATTACTCTTTATTCTCAAAGAAAATTAGATGTGTGTGTGTGTGTTGAGTCAGTCATGGTTCCTTTCATCTGTGAACAGTTGTTAACATAGTGTCACAAACAAATATATTTTGTAGTTTAAAAATTGATGTGTGTCGTTGTCCCCCCCCCCCTCCAAGGTAAATTTGTGGTTTGGACACACTTGCCTCGCAATGAGACAGTTAAGTGCATATTTCTAGGCTAAAGCTACATTGAATCCCATTTAACTTTCATTGTGAGTTAATGCTGGTCATAAGGTAAACTCTGTTGTACGTTTTATGGTTAAGAGTATTTAAGAATTGAATGTTTACTAATGTGGCTCTATCAGATCCAGCCCATTGTTGTTTTTGCCCTTATAAACAAATATGTGGATGTATTATATCTGTGTATTTAACTTAACCTTGTGCTACAGTGTCTGTACTAGTTTTTGTGACAGGGGTTAGTGGATGAATTCCTAATATGTATAGCAACATTTGCATTTCCTTTCATAATAAAGAAAATTCAGGTTTCGAAATTTTATCTCACTCAATTCAAATTATCTTAACTTTGTGGGTGGGAATACAAATTCTCATAGGGTTGGCAGTACAGGTGGAGTCGTCCAGTTAGAACTTTGAGCCATATTACTTACTTCCATTGGCTTTACGTAATGATAATAGGACATTGAGGGCACTTTCTATTTGATGCCTATCCTTTACCTTTGTCTTGGGGGGAGATTTCAGCTTATATATGTCATAGCACCTTTTTTATGCACAGTTCGCCCTTTAATTTCTCTTTTGACCTGTATTTGACCTGTACATATTTCGTGGTTTCTTTTACTGCAATATAAAATGTGAAGCCAGAATTAAGTTTAGTGTGAGTATGGTTTTATATGTATATTACAGGAAATATTTTGTGTTTTTTTGTTGGTTCTTTTGTAAGTTTCAAATAATTTTAACTTCAAGCAGTAGACAGGCCCATTTAAGAGAAATTGTACTTAGTATGAGAAGATTTCTTGGGAAAATAGATGAATTTTTTTTTTAATATTTATTGATAGGAACCTGTAGAAAACTGTTTATATGAGCCACTGTTTTGCTCTGAAGACTTCACTGGGACCGAAAACCGTTGTGTGTCTCGGAACTTTACATATCCTTTTAGCCCTGAGCAAAATGATGTTATGACTTTCTCATGTCTGTGTTCTTTATTTAGGCCTAATGAAACTGTAATGGCAAAATGTTGGCTTAAGTAAACTCTATCGTCTGGAGTAATAAGCCCTATTTCATTTATCCTAGAAGTTGGAAATTCGTCAGTCTGCTCCAAAAATCTTCATTGTAATGTTTTCATTAGTGGTAAAAATTTAACTGTTGAACTATCATTCACACCAAAAGTGTTTCAGAAACGCGTGTTATGTAGTTCTGTGTCACAAACACGTGCTATGCAGTACCAATATTTTGAAAATTAAAAGTGCTCTCTATCAGTGAAGTCGTGAACTTTTGATCAGTATATATATATATGTGTGTAAAGAGTGTGTTAAACGTTCATAAGTAACAGTTATGAGGAAATTGGATACAGTGATTATGGCGACTTGTTTATCTGTTCGTTATATTGTTGCTTGCTCATTAAATAATCCCTTTTTTTTAGTTCGCTTTTGTCTGCGACCAGTGTATGCAAACTTGTACACATTATTAATCACCTTGTTAAAACTTTTTCTCTGTTTTTTTTGTATTTTTTTATATCAAGTCTGTTAAAAGCGATTCATCTCTGTAACTTTGGCTAGATGGTGTTGCGTGCGTTTATTATGAGTGAATGTAACATCATCTAACTTTCTCTGTAATATGATAAGACAAACTGCCACAAAAGTATCGTAATTCAAAAATCAAGCCTTGTTTATTGGATGGAAGTTTTG
AAAAAATGTCTTTGTCTAAAAACGAACATACGCATTGGACTGTTTGATACGTGAAAATGACGCTGAAGAAACGAGTCGTATTTATGAGTGATTGCCTAAGTTAACATTAAACATGGATTATGTTATAGCAGATATGTAACTAAATTTGTATTTTAATGTCAGAAAGCATGTGAATTTTTGGTGTATTTTAACTGTATATCATGGAAGGTTGTTTGTGAAATGTAGAGATAGGTTTGTTCTCTGTGCCTTGACCTGTAGGCGTGTCTTGTACCGATGTTCAGCACTATAATTATCGGCATTCTTTCCTCTTTCAGTACTTTCCCAAAGCGACTAATCAAGACTCGGTAAAATGGCAATAATCCACACTTGGAATATGTTGTAGGAACGTGAAGGTTAAGCGTGTGATTGTATATAGAGAGAGCAAACTTCCTTCTCAAAACGGTCTTCAATAAACTCTTCTTGAGAACATATCAGTTCTTATGTTGCTTCAACAATCCCTAATGCTAGCGAAAGGTATTTTGCCTACTTAATACATTTCTCCACTGTTAATGTGTTGCCATTATTTTAGTTCACCTTAGTTTCGTTCTATAAGATACCGTTTATAAAGCTTTAGACAGCTTATCCTATTTCTTGCATCGTATACAAGAGAAAGTTTGAGGCCTGGAGCTTTTGTTATTTTACAGGTATTTAATTATATTAATCAAGGACCAATGTTTTAAAAACGTGGTTTTAGGTTGAAATGTTTGTGCTCAGGATTGTACTCTCTTGGTGATCTGAAGGTGTCTTGTTGTAAAGCAGTCTTTGCGTTGAGTTTTTTACATTTAATCCTAACTCGTAATGTTTATAATTGATTAAATTGAAACAGAAAAGGCTATTATTTAATCGTTTTTAGATGAATGAGAATCACTGACTCTATTGATAACAAAGTAGCGGTGTCAATTTCGTATGAAAGATTCGTATTTTTGAAATTAAAATGGGTCATAGTAACACACTTCATAAACCTTACATTTTACCAGTGTGTTTGAGTTAAGAACAAATGACTACTAGACCTAGAATTACCTGTTAAGTGTGTTGCACATTCGCGTATCTAAAACTATTTTATGTGTATTGGAGTTTTCTCTTGTGTTTGTCTGTGTGCATAACAGTATTTCTTTTAACCCTTACTCAAATCCTTGGCAGATTGGTGTTTTTTTTAAGTATTTATTCTGTATGTAAACATAATTGAAACGTTATTTTACGATTTATGATATTCAGGTTCCATAACCCACGCTTTCGGTCGTCTTTTAGAATATTCGTGAAATTTACGATAATTGTAGTGGTTGTACTATTTTATATTTCGTGTAAATATATTGTCTTTTATCTTTTCTTCCTACTTCTCATCTCGCGTGTTTTGATCAGGGGTAGAAACTAATTATACTACTTCTACATTTCATTCTAATGTGTGCTACTGTGTAAACATTTCTTCAAAACACGCTGTCATGACTTGTCACATGTCTATACTTGAAGACCATTTCGTGTATGTAAGAACGCGGTTCCCACCCTACCGGTAGCACTTTTAATCGTGAAACTCCACAAACTGGAAAAAGAAAAATAGTTCTCTGCACCACCAGAGAACTACATAAAACTACAAGTCCAACACGAGTATATCGCAATGGATACTACTAAATAAACAGGAAAAAAAGTTTTTTTTATTGAAAGTACAGTGTGTGAATGATAAATCATAAATCATTAAGACAGTCTAATACTTTTGTTGTAGGTAGCTTAAGTATATAAATAAATAAATATATATATATATATATATATATAGCTATGTAGCTGACTAATTTAATGTAACATACCTTTATGAAACAAATTGAACATTTGTATATAGTTGAAGTGTCTAATATACTAATCAGTAAATGTTTCTTATGGATGCCTAATTTTGACTCGCGCTGTAAATTGTAGATTTTTCTAAGTATTAGTTCCCATCAGCGTAATAATTTAAGATTAAATCAAATGAG
AAGTTAAGTTACAACGAATTGATTTTGTTTCAGCACCACGAAAGTGTTTCTTATTTATAAATTTCTTTTGCGTAAAAAAATGAATGGCTTGTATTGGACTTTTTTTAAACGTCTGGTATGGATTTTTTTTTATTTAGTCCTCTTTGAACAGAATAGATAATGCTTGATATAAATACGTCATATCAAAGTAAGAGATTGAACACTTCCGTAATACTTAGGCAGCATAACGTCGACCACCATGTTTGTTTATCTTTCTGAACACAAATGGAATTCCACCGTTATCACAATAGACTGTTTGTTTCAAAGTATGTTCATTTCAAGAAGTAACTGTGATTGTTTTATTTTTATTTTTTTGTTAACTATCGTTGCTCATATTAGACAGCAGATATTAAATAGTTGTGAATAAAATATACGACACCAGTTTG\n>HQ716622.1 Uncultured bacterium clone T2WK15F91 16S ribosomal RNA gene, partial sequence \nGTTTGATTATGGCTCAGGATGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGGAGTTAATAGTGAATGAGGCTTCGGCCAAAGGAGCTATTAACTTAGTGGCGGACGGGTGAGTAACGCGTGAGCAACCTGCCTTTCAGAGGGGGATAACATTTGGAAACAGACGCTAATACCGCATAAGATCACAGTACCGCATGATAGAGTGATCAAAGGAGCAATCCGCTGAAAGATGGGCTCGCGTCCGATTAGATAGTTGGTGAGGTAACGGCTCACCAAGTCGACGATCGGTAGCCGGACTGAGAGGTTGAACGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCAACGCCGCGTGAGGGAAGACGGTTTTCGGATTGTAAACCTCTGTTTTCGGTGACGAACGAAATGACGGTAACCGAGTAGGAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTACTGGGTGTAAAGGGAGCGCAGGCGGGATAGCAAGTCAGCTGTGAAAACTATGGGCTTAACCCATAAACTGCAGTTGAAACTGTTATTCTTGAGTGGAGTAGAGGCAAGCGGAATTCCGAGTGTAGCGGTGAAATGCGTAGATATTCGGAGGAACACCAGTGGCGAAGGCGGCTTGCTGGGCTCTAACTGACGCTGAGGCTCGAAAGTGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACACTGTAAACGATGATTGCTAGGTGTGGGGGGTCTGACCCCCTCCGTGCCGGAGTTAACGCAATAAGCAATCCACCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCAGTGGATTATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCAACTAACGAGATAGAGATATGTTAGGTGCCCTACGGGGAAAGTTGAGAGAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTGCCATTAGTTGCTACGCAAGAGCACTCTAATGGGACCGCTACCGACAAGGTGGAGGAAGGTGGGGACGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTAATACAATGGTCATAAACAGAGGGAAGCAAGGCCGCGAGGCGGAGCAAATCCCCAAAAATGATCTCAGTTCGGATCGCAGGCTGCAACCCGCCTGCGTGAAGTTGGAATTGCTAGTAATCGCAGATCAGCATGCTGCGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTTTGTAACACCCGAAGTCTGTTGTCTAACCGCAAGGAGGGCGCAGCCGAAG\n>XM_041020936.1 
Aureobasidium melanogenum CBS 110374 alpha/beta-hydrolase (M437DRAFT_44633), partial mRNA \nACTTTGAGACATATATACCATAAAGGCTCTCATCAGTATCCGCATCTCTTACGGAAAGTCGATATCAACAAGGACACACTGCTTGAGTACGAGAACGAAGCTGGGACAACCATTCTTAGACCAGCTTGGGATGCGTTTTCTGTGCAGTCGGATACGTTGATGATACAGCGCCTTGCTGATCGCAGACAACATGTCGTTGACGGCTTATTAGAGCATGGAGCTACCTTCGGTGAAGCCAAAGCTCTCGATGCAGAAGCCTGGACTCTAGACGAGGTCTCCAGCCCTGATGTGACCGATAAGAAGACAGTCCTAAGCTTCGCCCACATGGCGGCAAACGCCTACGTCTCCATCCCTCGTAAAGGCGACTGGATCGACATTGGCGGCGGCTTCAACTATACCGAAGATTTCGGCTGGGAGTCCGATGGGCTCCGCGGCCACATCTTCGCCGACACGCACAACAAAACCGTCGTAGTCGGGTTGAAAGGCACGTCCCTCTGGTTCTTCGATCCTCCAGAGACAACAAACAACGACAGAGTAAACGACAACCTATTTGGAAGTTGTTGTTGCGGGCAAGGAGGCCAATATGCATGGAAAAGAGTTTGCGAATGCCAGACTGATGCAAAGACTTGCAATGCTACTTGTTTGGTGAGTAGTTTGAGGAAAAAGAGTAGTTATTATCATGCTGCGAGGGCGCTATATCATAACGTGACGGCTTTGTATCCGAACGCTGATGTTTGGCTTACTGGACACTCGTTAGGAGGTGTGGTATCCTCTCTTCTTGGTGCTACTTATGGTCTACCAACTCTGACTTTCGAGACTTTTCCTGATGCACTTGCTGCTCATCGATTAGGTCTGCCAACACCACCAGGTCACCAGATTGGTCAATCTGGTAGACAACATTATACCGGCACGTTTCATTTCGGTCATACTGCAGACCCGATATATGTCGGAAACTGCAATTCGTATGACTCGTCTTGCACGCTTGCGGGATATGCTTTCCAGAGCAAATGCCACACAGGGTTCAATTGCACATACGATACAGTTGGTGATAAGGGTTGGAGGGTCTCAATCGGCACACACAGAATCAGCAGCGTCATCAAAGATGTCCTAGAAGCTTATGACACGGTCCCGGTATGCACACAAGATGTTGGTTGCAAGGACTGCTCTGAATGGTCGTTCTTTGAGGGCAATGGGACAAAGACGACGACCAGCTCAACAAAGACTGCTTCTTCGACGGAACTCACTACTACCACGACTACGACTTGCCGCACTCCTGGCTGGTGGGGTTGTCGGGATGAGTCTACTACTACGAAGACAACATCGACGTCGACGAGTGTCTCTAGCTCAACGTGTTTGACGCCAGGCTGGTGGGGCTGCAAAGATGCTTCTACGACAACAAGCTCTTCATCGTCTCATAGCGCTGAGATGAGATCGACTGCCACGCCGATACCATGA\n>XM_012484966.2 PREDICTED: Apis florea spindle and kinetochore-associated protein 1 (LOC100864548), transcript variant X2, mRNA 
\nAACTTATTGATAAGAACGCCATTTGTAAACGATATCGAATGAATTAAATTCAAAGTTTACAAACGGCGCCAGGAATGACCGTTATTTGTAATGCTATGTAAAAATGCAATTAAAGAAGAATTCCTTAAAATGCGCATAGTACTTTCACAAATGTGTAATGGTATTGAACAGATAAGGAAAAAATTAGTTGATATGAGAAAACAAAATAATCAATGTAGAGAATTATTGTCATTCATTGAAACTTTGGATAAAAGAATCATTCATATGGAAAAAAATATTCCACATGAATTAATTCGTGACTATAATGAAATTGAAAATTCTTTATCAATGAAAAGTATATGCAAGAAAGAGCTTATACAAAAATCACCTATAATAATAAGAAATAAGAATGTAGAAAAAGAAAAGACTCCAATAAAAGATTGTAAAAAAATATTATTTAACGAACTTGAAGTTTGTCCTACGATATCTTTGATAAGTGAAGATGAGTTCAATAAAGTTCCAAAATATATTATTGGAAGACAATCTTTAGAAACTGTAAATGATTTCATAAATACTATTAATCACATTTTAAAAACAAAATATACATTTTTATCATTGGGAAAAGCTCATGCAAGAAAGCAAGGAGATTTAAATCTTTATTTGCACTATAAAAAACAAGAATTAGATTTATGTAATGATTCTGAATACATATATTTCTTTACTGGTGAAGATTATGAAAAACAAATGAAGTCTAAATTAAATAAAATAAAATTAAATCTAATAACAGTTTTACGACATTGCAAAAGATTAAGAGAACATAGGATAAAAAACGACTTGCGATATGTAATATTAACAAAAAAATAATTGCTTAAGTTTTAAATTAAGTAATAAAATAAAAAGATTGCATAATAAATTGTTTCATTGTACAAAGAAGTTAAACATATAATTTTATATATTTTTTTTATAAGTTTTATAATAATTTAAATGATACATATTTTTATGTGTAATCAATACTATTGTAAAATATATTTCTATTATTCCAT\n>XM_047672130.1 PREDICTED: Vanessa atalanta protein claret segregational-like (LOC125064848), mRNA 
\nATCACGAACAAGCGTAAATATTCGAATTTTAAATTATTGCGTCCGTTTACTAATCTGACAAACGAAACAATTGTTCGTGTTTCAAGTGAATGTTGTTTTAATGTAATATTTAAATAAATAAATAAGATGTCTCGCATTCCGAAATTTCCTTCTACTGCTACAAAAGAGAATAAACCCACATTTACAAATGGGCGTAATACAACGCGAACATTAGGCATTGGGCTCAGTGACGCTGATAAAAAAAGCTTACTATTAAATCATACAAAACCAATGCGAAGTACAACATCCGCCAACACTGTAGCTGCGCCCCGCCTTAAAAGATCAGCTACAGCACCTTCCTCCGCTACGGTACCTAATAAAACAACTAAAGTCGAAAAAAAGACGACTACTGTAGCACCTAGGATTGCTCCTTATGATTACAAAGCCAGATTCAATGACTTGGTGGAAAAACATAAAGCCATGAAAAGTGAATTGAATGATTTAAGGGACAAACATTTGGAAGTATCAGACGAATATGAAAAAGTTAAAGAAACAGTTGAAGGAAGTATTACTGAAAGAGATACATTGAAGGATAAATTATTAAACACTCTCAAAGACTTGAGACAGAAGTCTAATGAATATGAAAGCCTAAAGCTGGATTATGAAATACAGAAACGGGAGAATGAGGAATTAAATAATAAAAGTAAACTTTTAGATGACGTAACTAAAAGCTTGAAGTTAAAAATAATGGAATTTGATAAACTTAAAACAGAATTTGATGATTTGACTCGACGTCATAAAAGTCTTAATGAAGAAACTGAGGCTTTAAGGGTTTTGACTGATCACCTTAAGAAAATATCTGTAGAATATGACAAATTGCAATTAGATTATAAGGATGCAGTTTCCACAATAACAAAAAATAAAACAGACTCTGAGGCTTTGCAAAATATTTTAGCGACTATGTATAGAGATCAAAGAGTTTTACGGAACACAGTGCAAGATTTAAAAGGTAATATTAGGGTCTACTGTAGAGTACGACCTCCACTTGAGTCAGAAGCATCCAAGCCTTTGTACAATCTTAATGTCCTTGATGCATGTTCTATAGAAGTTGAAAAGATTGAACTTCTGAATTCTGCAAGAAAAGGAAAATCACAACATTCTTTCTCATTTGATGGGATATTTACACCACACTCCTCTCAAGAGGATGTCTTTGCTGAAGTGTCTCCAATGGTACAATCTGCACTAGATGGTTATAATGTGTGTATTTTTGCATATGGTCAAACTGGCTCTGGAAAAACTTATACCATGGAAGGTGGTTGTGGAGTTGAACAGTATGGTATTATACCACGAGCAATAAATATGATATTCACATGTATGGAAGATCTTAAAAGAATGGGATGGGAATTGACAATTAAAGCATCCTTTTTAGAAATTTACAATGAAATAATTTATGATTTGTTAAACTCAAGTAAGGAACAAGAAAGTCATGACATAAAGATGGTTAATTCGAAAGGCACAGATTTGTATGTATCCAACTTGAAAGAAGAAGAAGTGAAGAGCTCTCATGATTTCATCAGATTGTTGATATTTGCTCAACGTAACAGACAAACTGCGGCTACATTGAACAACGAGAGGAGCTCCAGATCTCATTCAGTTGCACAAATTAAAATAGCAGCTATTAATGAAAAGCGTAAGGAAAAATTTACTAGTAATTTAAATTTGGTGGACTTAGCTGGATCTGAGAGTGGGAAAACCACTCAAAGAATGGATGAAACAAAACACATTAACAGATCACTTTCGGAACTTTCAAAGGTGATATTATCTCTACAGACTAATCAGTCCCATATCCCATACAGAAATTCTAAGCTTACACATTTACTAATGCCAAGTCTAGGTGGCAATTCAAAAACTCTTATGTTGGTTAATGTTAATCAATTTGATGAAAGTTTCAATGAGACTCTTAACTCCTTAAGATTTGCCACAAAAGTTAACAGCTGCCGAACTGTAAAAGCCAAGAAA
AATATAACAATGGTTGACTCATTATAATTTTTACATTGACAATATTTTGCTTTAGAATGTAGTACACATGAACACCTATAGTTATACCATCTACTGTGAATTGAATATTATCAGTATTCTGCTTTAACATACATATTTGTATTGAATACTATTAATAAGTGGTATAACTAAATGTGCTTTACTATTTTGTTTTATAGTTAATTTTTACATGTAGTACTAACTTCCCACTGAATATTCCACCGATAAATGTTTTTACTGTTGTTCTATAGTATTTTGAAATATTGTGGGATTTTAGATAATCAAGAGCTCTTATAGTTTTAATTATTCAAATGACCTTAAATAGCTATTACAAAATAACAAGTCTCATTATTTTTATACAAAAGTTTTAGAAGCATTTTTTTGGATTTGTTACTATAAATGTGGAATTCGATATATTATTAAATAAAATAAATAGTGTGAAAGTTCATATACATTCTAAAGAATGTGAGTTGATATTGAAATATTTTGAAGTATTGTGTTAACTGAACTAAAATAATGACAGATTAATTTACTTACTGTTTATATAAATACTATGGCAATAAAATAATATAATTTTACAAATTGTCATAATTTGAATTTGATCCTTTTAAGGCAGGTCTTTGAGTACCATATACAGGTGAAGTTCTAACAATTGACTCACTTTAAATTCCTACTTATAAAATGCCTAATTGACTTATTTAGGAAATTATTATTGTTATTTTTTTACAAATTGGCAGGTTGAATTTGACATTTTAAAGTTTAATTTATTGGGTAGATCAAAGAATATCATATCTGCTTTTATGAAATATCTATTAGGTATGTTTATTACTACTTTTCATTTATATCCTATTCAATTCAATTGAATTGTATTTCTAAAAACACATTATCTTGAAGTAATCTGTTCAGTAAGGTGTTATTTTTAATTTT\n>XM_025561023.1 PREDICTED: Sipha flava GTP-binding protein 2 (LOC112688017), mRNA 
\nGCTAGTTTTTTCGCGTCCGAAACGGTGCCCGATCGTTGCGAACGTCCCGAAATTGAATTTTATGTTTGTTCGCGATCCGTCAGCGTTTGGGGCCATTCGAGTGTTTTTCGTACCGACGCGGAAAAGCGGAAGCGACGGGAAAAACACCTGTTCGACGACCTTGAAAACCAACATCGTTAGTCATCGATTATTATTGTTTCGTTTCCCGTTGCGGGTCTCCGTCCCGCGATAATGCCTTGATAACGCTTGCCGCTATCTTATCCGCCGCTACTACGACGAGACTTCACTGACCTTTGGCTCTCGTTTTGTTTATAAATATAAGCCCGTCGCCGTACGTTGTTGCCGCCGTCGGCACTCCTCCGTGTCGCTTGGCATCGGTCGCCAACAGATCAACAGCTGTGACCCATCTGTCGAATGATCGTTTCAAGAATCCCGACGATTATCACCGCGCATCGTATACGGCCGTCGACGCTCAACGACGATGGATTCGTTCCTGGACCTGTTCGATCCGGGCACCAGCCCTCCGTCTAATTGCGACGTATGGCCAGCGGAGGACAATGACGATGTCACCGCAAGGCTACCGCCGGAGCCTCAGATGGGCAATGTCGAGTACAAACTGAAGCTGATCAATCCGTCCAAGTTGCGCTTTGAACATCTGGTCACGCAGCTGAAATGGCGGCTCAGAGAGGGTCACGGCGAAGCCATTTATGAAATCGGCGTTGAAGACACAGGCATGCTGACCGGCTTGTCTGCTGAGGATATGAAATCTAGTCTAATCACCTTGGATGAAATGGCCCGTAAATTAGGTGCTACTACGTCGGTGCTGCGAGAGAGATCAGTAAAAAAAGACAAAATGGTTGCTGAAGTTCTAGTTCGAAAGGTTCCAGATGACCAAGAATGTATAGAAGTGATGGTTGCTGTATTAGGAGGTGCTGATGCTGGCAAGTCAACTCTTCTTGGTGTATTAGCACATGGTGAATTTGATAATGGTCGTGGTAGTGCTCGATTAAATGTTTTAAGACATTTACATGAACTACGATCTGGTCGAACTTCTTCCATATCTCATGAGATTCTTGGTTTTGATACTGAGGGAGATGTTATCAACTATCAAAAAGCCCGTACAGCCGAAGAAATTCGAGATCGCTCATCAAAGCTGATCACATTCCTCGATTTAGCTGGACATAAAAAATATCTTAAAACTACTGTAGCTGGTTTGAGCGGTTACTGTCCGCATCATGTTATGTTGGTTGTGAGTAGTCCAGCTGTAACTGTTTCTAGTCCTACTCAATTGGATATGACCAAAGAGCATATGGATTTGGCATTAGCACTTAGACTTCCATTTTGCATTGTTGTTACAAAAACTGATATCACTCCAGCAGATAACACAATTAAATGGTTGGAGTCTATATTGAAATCCATTGGATGCAGAAAAGTTCCTTTTGTTGTTAAATCTGATGATGATGTTTTAACAGCGAGCTCTGCACAGCCAACTCAAAATGTTGTGCCTATATTTACCATTTCTAGTGTTACTGGTGAAGATTTAGACTTACTCACAAAATTTTTATATGTTTTACCACCAAGTATTAGTATAAAAGATAAAGAAAGATTGGAGCAGGAGTGCTGTCAGTTTCAAATAGATGAGATTTTTAAAGTACCTGATATTGGTACAATTGTTGGTGGTGTACTTGTCCAAGGTGTTGTTAATATTGGTACAGAACTAGTTATAGGCCCCTTTGATAATGGAACATTTGTTCCAGTAACTGTGCAATCTATACATAGGAATAAAGCTCCACGTCGAGTTGTAAAAGCAACTCAAAGTGCTTCGTTGAGTTTGGAACAAAGTATTCCTGGATTACGTAATGGAATGGTGCTCTTGGGATCGGGTGTGAATCATAGTGCTTGCATATTCTTCCAAGCTAGAATTGTTGTACTATATCATGCAACATCTATTCATAATGGATTCCAAACCACTGTACATATTGGAAACATACGGCAAAC
TGCGGCTATTGTTGCTATCATGGAATGTGATAAACGAGGTATGCATACTAATGACACAGCATCAGTAATATTTAAATTTGCACGTCATCCAGAATATGTCACTGAAGGTATGCGGTTATTGTTCAGAGAAGGACAGACTAAAGGAATTGGAATTGTTACTCAAGTATTTGCTTTGCAAGTAGTTGCTGGATAGATAACATTGTTTTTATTGACTTACAACTTTTATTTATATAACCAATAGAGGTAAAATGTACACAGTTACATAATTTAAACTTATAAAAATCACTTTATACACATAAGAATATATATATATATAT\n>XM_036413688.2 PREDICTED: Pipistrellus kuhlii TATA-box binding protein associated factor 8 (TAF8), transcript variant X2, mRNA \nAGAAGCATCACCTGGAGAGGTGAACAACACGTGGTCTCGGCCCCTCCCGCAGACAGCGAGGCACTGATCCTGGGCGGGACCTAGCCAGGTGTTGCTAACAGTCACGTTTGGGGCGCTCCAGGGGGGATGCTCTTTATGAGAAACGATTTCAGGGGGAAAGAGGTGTGCAAGCGAGGACGCATTTCCCGGGCCAATTCCGAGGGTCACAGCAACCCGTCGCTCAGTGTGGGTCACGTGCCCAGGGTCATCAGAACCCCCCATCCCCCGCCTCGGCAGGGCTTTGGAAAACCCAGAGGTGCGAGCGCCGCCTCGCCCCGCCCCTCCCCGCCGGGCGACTACAAATCCCATCCTGCCCTGCGCTCGCGCACGTTACGCCAGAGCAAGATGGCCGACACGACGGCCTCTGCGGGGGCTGGCAGCTCCGGAATGAGATCAGGAAGTAAACAGTCCACTAACCCTGCTGACAATTACCATCTGGCCCGGAGGCGAACCCTGCAAGTGGTTGTGAGCTCCTTGCTGACGGAGGCCGGGTTTGAGAGTGCTGAGAAAGCATCCGTGGAAACACTGACAGAGATGCTTCAGAGCTACATTTCAGAAATTGGGAGGAGTGCCAAGTCTTACTGTGAGCACACAGCCAGGACCCAGCCCACGCTGTCAGACATTGTGGTCACTCTTGTCGAGATGGGTTTCAACGTGGACACTCTCCCTGCTTATGCAAAGCGGTCTCAGAGGATGGTCATTACTGCCCCTCCAGTGACCAATCAGCCGGTGACTCCCAAGGCTCTCACTGCAGGGCAGAATCGACCCCACCCGCCGCACATCCCCAGCCATTTTCCTGAGTTCCCCGACCCGCACACCTACATCAAAACTCCGACGTACCGCGAGCCTGTGTCTGACTACCAGGTCCTGCGGGAGAAGGCTGCATCCCAAAGACGTGACGTGGAGCGGGCGCTCACCCGCTTTATGGCCAAGACGGGCGAGACCCAGAGTCTGTTCAAAGACGACGTCAGCACGTTTCCACTGATTGCTGCCAGACCCTTCACCATCCCCTACCTGACAGCTCTTCTTCCGTCTGAACTGGAGATGCAGCAAATGGAAGAGACGGATTCCTCGGAGCAGGAAGAGCAGACAGACACAGAGAACCTCCCTCTTCATATCAGCACGGATGACTCTGGAGCCGAGAAGGAGAACACCTCTGTCCTGCAGCAGAACTCCTTGTCCGGGAGCCGGAGCGGGGAGGAGAGCCTCATCGATAACCCCTACCTGCGCCCCGTGAAGAAGCCCAAGATCCGCAGGAAGAAGCTGGACTGGGGCATAGGAGCAGCTGGTGACGACCTCATTCATTATCACAGGACCTCATTCCTTTGACCTGAGAGACCAGGGAAGGCAGCAGAAAGAAGGGGCTGTGCCTTCTCTGCTTACTCCAGAAGGACTGTTCACCTCGTTTCTGTTTCAGGCTATCCCGGTCCCTCTTATTGACTCACAGACAATGTGTAGCATCAGTTTATCACTTGCTTTGCCTTGGTGGGAACCTCATTCTTATTTCTCTTC
TCACCTGGGCGCCGAGTGCCCTGCTGAGATGACGGAAGGTGACTTTGCCTTCCCACATGGCACTCCTTGACCTGGGCCGGCAGGAGTCGGGAGGGGTGAGCAGGCATGTCACGTGGAGGAGGGTGGTGCATCACAGCACACCAGCTCTCTCATCGCATTTGGTGAACTCTTCCTTCAAGGCAGCGCCCTCTCTGGGGGATTGGTATTTATCGTCCCTCTGTGGAATGTGTGCTTTGGGCCACTGAGTCCTGCCCCGTCCAGGAAAAGAGCTTTCTCTGACAAGAGCCTCTGCAGGATCTATTCTGCTGTGACTTGCTGGAGGAATCCGACCTTAAAGAGCAGGAAAGGGATTGGGGGGGAACGGGGGAGAACTTGAGGGCTGGATGGCCTGTTTGCTGGGAGCCGGGAGCCCGGGGCGTCTGCTGGAAGCCGGCACAGAAGGGCGCCGTGCGTGGAAGCCAGTGGGCCAGGCCACGGAGCTCTCCCAGAAGGTCTGAGTCTGTTCAGCCGCTTTGCATCCTGGGGAGAGATTTCATCCTGCCTGAACCTACAGATCAAAACAAGTGTTTAAGGAAGATGCTGGACAAGCTGATACCCTTTGGCTGGTCTCTGAAAGAAGAGATT\n>XM_042281434.1 PREDICTED: Peromyscus maniculatus bairdii phospholipid scramblase 1-like (LOC102915703), transcript variant X4, mRNA \nTTTGAAACTGTTAACAAATACAAAATCAAGGACAAGCTTGGTCAGAAAGTTTACTACGCAGTCGAAGAGTCCAATTGCTGTGCACGCAATTGCTGTGGGGACTGCAGGTCTTTCTCTATGAGGATTCTTGATAACTCAGATGGAAGTCCAAGCTCCTCCTGGTGTGACAATAGGTTACGTTGTTCAGAACTGGCACCCATGTGTTCCAAAGTTTACAGTTCAAAATGAGAAGAAGCAGGATGTTCTCAAAATTGTCGGTCCATGTATCATATGCAGCCTTGGAGGAAACATTGATTTTAAGATCAAGTCTCTTGATGAAAAAATTGTGGTTGGTAGGATTTCCAAGCGCTGGTCTGGTTTTCTGAAGGAGTTACTGACAGATGTGGACAATTTTGGGATCCAGTTCCCGATAGACCTTGATGTAAAGATAAAGGCTGTGATGCTTGGAGCTTGCTTCCTCATAGACTTCATGTTTTTTGAAAGCAGGCCAAATCAGAAATGAACACTATTATATTCATGAATTGATGAACGAGTCCTCAGAATATGTGAAGCTGGAACACTGATTGAGAATAAAAGGCAACATAGTGATTTCTTTCATTGAAATCACTCATCTCTCCTTGAATTAAACTAGGATGTACATAA\n>XM_019798545.2 PREDICTED: Ailuropoda melanoleuca pleckstrin homology domain containing A6 (PLEKHA6), transcript variant X5, mRNA 
\nTCCCCCCACCCCTGCGGGCGGGCGGACAGTGGGGGCCGCTGGGCAGGAAGCCCTCCCCCCTCCCCCGCGGCCCGGGGGGCCCGGAGCGAGCGGGGCTTCTGGACGCCGAGATGGCCGATGAGATTGACTGGCTCGACTTGCCCGGCCGGTGGGCCTACGGCGTTGACCGCGGTGGGAGAGTCTTCTTCATCAATGATGAGGAAAAGTCAACCAGCTGGGTGCACCCTAGCACGGACTCCCCCATCCAGAGTGGACACTCCTCCAGCCCAGAATTGCCCAATGGCTGGGAGATGGATTCTACCCAGGAAGGAGCTGTGTATTTCATCAACCACAATGAAAGACGGAATACATTTCTACACCCAGTGACTGGCCAGGTCCCAGAAGAAAACAAAAAATTTAACTTGAAAACATCGGCCTTGGACATGTCCAATAAAGCAGGTGGGAAACAACCGGCTATCACCAACAGTGACGTACCCAACCACAACATGGTGTCTGAGGTCCCCCCAGAGCGGCCCAGCGTCCGGGCAACCCGAACGTCCCGCAAGGCCATCGCCTTTGGGAAGCGCTCACACTCCATGAAGCGAAATCTCAATGCACCTGTCACCAAGGCGGGCTGGCTCTTCAAACAGGCCAGCTCCGGGGTTAAGCAGTGGAACAAGCGCTGGTTCGTCCTGGTCGACCGCTGCCTCTTCTACTATAAAGATGAAAAGGAGGAGAGCATCCTGGGTAGCATCCCCCTCCTGAGCTTCCGGGTGGCCGCGGTGCAGCCTTCGGACAACATCAGCCGAAAACACACCTTTAAGGTGACTGCGTGCTGGGTGGATGAGGCCGGGGCCAGTTCCACGCACTGCCTCTCCCCACAGGCCGAGCATGCCGGGGTCCGCACCTACTTCTTCAGCGCCGAGAGCCCCGAGGAGCAGGAGGCCTGGATCCAGGCCATGGGGGAGGCTGCCCGAGTACAGATCCCCCCAGCCCAGAAGTCCGTGCCCCAAGCTGTGCGTCACAGCCACGAGAAGCCAGACTCTGAGAACATCCCACCTAGCAAACACCACCAACAGCCAACCCACAACAGCCTCCCGAAGCCCGAGCCCGAGGCCAAGACTCGAGGGGAGGGTGATGGCCGGGGCTGCGAGAAGGCCGAGAGGAAGCCCGAGAGGCCCGAAGTCAAGAGCGAGCCTCTGGTGAAAGCCAACGGCATTCAAGCTGGACCGGAACCAGCCTCGGAGCCCGGCAGCCCTTACCCCGAGGGCCCAAGGGTCCCAGGGGGGGGCGATCGGCCCGCTCAGCCCAACGGCTGGCAGTGTAGCTCCCCAAGCCGACCAGCAAGCACAGCTTTCCCGCCTCAGGACTCAGAGAGCGGAGGACACCAGCGGAGCTTCCCCCCACGTGCCAACCCCGACAAAATCGCCCAGCGCAAGAGCTCCATGAACCAGCTTCAGCAGTGGGTGAACCTGCGCCGAGGGGTGCCGCCACCTGACGACCTTCGGAGTCCCTCTAGGTTCTACCCCGTGTCCCGCAGGGTCCCTGAGTATTACGGCCCCTACTCCTCCCAGTACCCAGACGATTACCAGTACTACCCCCCAGGGGTGCGGCCCGACAGCGTCTGCTCGATGCCTGCCTATGATCGGATCAGCCCACCCTGGGCGCTGGAGGACAAGCGCCACTCTTTCCGCAATGGAGGCGGCCCTGCCTTCCAGCTGCGGGAGTGGAAGGAGCCCCCAGGCTATGGGCGGCAGGATGGCACCGTCTGGCTCCCCGGCCCCTCCCCCTCCCGGCAGCCAGTCTATTATGATGAGATGGACGCCACCTCCGGCTCCCTGCGCCGCCTGTCCTTGCAGCCCCGCTCCCACTCTGTGCCCCGCTCGCCCAGCCAGGGCTCCTACAGCCGTGCCCGCATTTACTCCCCCGTCCGCTCACCCAGTGCCCGCTTTGAGCGCCTGCCACCTCGCAGCGAGGACATCTATGCCGACCCTGCTGCCTATGTGATGAGGCGATCCA
TCAGCTCCCCCAAGTATGATTACCTGGGAGACAGGCGACCAGTCCCTGCAGGACTGTTCCCCTACAACTACCCACCATCCCCCACGGTCCACGATAAGATGGATGAACTTTTAGATCTTCAGTTGCAAAGAAACCTAGAGTATTTGGATCAGCAGATGAGTGAGAGCGAGACTCTCATCAGTATGGTGAACCGCATGGTGGAGAACTCCTCCCCCAGGGCCCAGATCTTCATGCAAGTCCCTCCGTACCCAGAAGTGTTCCGGGACGGTCTCCACACCTACAAGTTAAACGAGCAAGACACAGATAAGCTGCTGGGAAAATTGTGTGAGCAGAACAAGGTGGTGAGGGAGCAGGACCGGCTGGTGCAGCAGCTCCGAGCTGAGAAGGAGAGCCTGGAAAGTGCCTTGATGGGGACCCACCAGGAGCTGGAGATGTTTGGAAACCAGCCCGCCTACCCGGAGAAGCTGCTGCACAAGAAAGAGTCCCTACAGAACCAGCTCATCAACATCCGGGTGGAGCTGTCTCAGGCGAGCACGGCCCTGGCGAACAGCACCGTAGAGTATGAGAGCCTTGAGTCAGAGGTGTCTGCCCTGCATGATGACCTCTGGGAGCAGCTCAATTTGGATGTCCAGAATGAGGTGCTCAACCGGCAAATCCAGAAGGAGATCTGGAGGATCCAGGATGTGATGGAGGGGCTGAGGAAGAATAACCCATCCCGGGGCACAGACACGGCCAAGCACAGAGGAGGACTTGGCCCCACGACCACCTACAGCTCCAACAGCCCCGCCAGCCCTCTCAGCTCCGCCAGTCTCACCAGCCCACTAAGCCCCTTTTCACTGGTATCCGGCTCACAGGGGTCCCCCACCAAGCCTGGGTCCAGTGAGGAGCCCGGTCCGCCGCGGCCCCCCCTCCCCAAAGCCTACGTACCCCTGGAGTCTCCTCCAAACGTGCCGCCGCTCCCTAGCGAGAGCCGCTTCTGGCCCTACCCCAGCTCCCCTTCCTGGCACCGCGGGGGCGAGCCAGCCAGGGGTCAGCCCAAGGCAAGCCATGAGCAGAGCAAGAAAGACACCCCCCAGACGTCACCCCTGGACACTGCTAGAGACATCAGCCTTGTGCCCACCAGGCAAGAGGTGGAGGCAGAGAAGCAGGCAGCTCTCAACAAAGTTGGCGTTGTGCCTCCTCGGACAAAGTCGCCCGCTGATGAAGAGCTAACTCCGTCGAGAGTGGTGAGGAGGAGTGCCAATGGGCTTACCAATGGACTGTCCTCCCGGCAGGAGCGCCCCAAGAGTGCCGTGTTCCCCGGCGAGGGCAAGGTCAAGATGAGCGTGGAGGAGCAGATTGACCGCATGCGGAGGCACCAGAGCGGCTCTATGAAGGAGAAGCGGAGGAGCCTGCAGCTCCCGGCCAGTCCGGCCCCCGACCCCGCTACCCGGCCTGCCTACAAAGTGGTGCGCCGGCACCGTAGCATCCACGAGGTGGACATCTCCAACCTGGAGGCAGCCCTGCGGGCAGAGGAGCCCGGGGGGCAGGCCTATGAGACGCCGAGAGAGGAGATTGCCCGGCTCCGCAAAATGGAGCTGGAGCCCCAGCGCTACGACGTGGACATCAATAAGGAGCTCTCCACGCCCGACAAAGTCCTCATCCCCGAACGGTACATTGACCTGGAGCCCGATACCCCCCTGAGCCCCGAGGAGCTGAAGGAGAAGCAGAAGAAGGTGGAGAGGATCAAGACGCTCCTCGCCAAGTCCAGTATGCAGAACGTGGTGCCTGTCGGCGAGGGGGACCTTGTGGACGTGCCCCAGGACTCAGAGAGCCAGCTTCAGGAGCAGGAGAAGCGGATTGAAATCTCCTGTACCCTGGCGACCGAGGCCTCCCGCAGGGGCCGCATGCTGTCTGTGCAAGCCCTGGCCGAGGCCAACGCTGCGAAGCTTCACAGAGCCACGTTCTGAAGGCCTCCTTCGCCCCCTGAGGTCGCAGTTCCCCACCCTGGCCCCCTGCCC
CTGCGCTCCCATGGGCATGCTGCAGGGAGCCAGGCTGGGGGCCGGGGGTGCTGCCAGGACGTTACCTCCGTGTCCACATGCCCACCACGCCCGGCCCTGAAGCCCTCGCTGCTCAGATGGCGACCCTAGGCCGGGGCCTTAGATGGTGGGCAGACAGCAGCCCACATCCCAGGGGCTAGGCCTGGCCCTGGCTGGTGGTGTGACGGCCCTACTGGAACATTCCCAGATGAAGAGGATGCCCTGGTGGGGAAGACGCTCTGGGCTCTCTTAGGTTAGGAGGAGGGTGAGGAGAAGATGGACACTCGGCCTCTTCCGGCCCCTCCTGACACCGAGGACGGCACCTGCCATCAGGTCCTTCCCCCATCGACCCCACCCTGCTGCCCCAGCTGCACCCGGGGCTTTGACATGTCTCTGCTTATGGGTGTTCCTTTGGGGTCCAGTGGAGACTGACCACCCTGCTTGAGCCAAAGACAAGATGACAGGAGCTGGGGAGAGGCACCTCAGCTCCCGGAGGGGACAGTGCTGGCTGTGGGTAGAGAGCGGCACGCAGGTCTGCGCAGCGTCTGAGGACAGGTTGAGAAGGGGGAGAAGAGAGAAAGGGAGAGATGCAGGCAAGTGGGAGGACAGGGGAGCGGCAGGACTCCTTTGCAAGTAAGAGGGTGAGGCGGAGGTGGAAAGGGGCTGTGAGAGGGATGGGTTTCCCCGGGAGGGAACCTTAGCTTAGTGCCAAGTACAGTCCAGACTGTCAGCCCTGCTCCTGCACCGGGTACCCCCGATCCGCGGGCCTGCCCACACACTGGCTCCAGGAGGACCCACCAGCGAGCACATGGTGACCGTCGCTGCAGCCATGGGGACGAAGGTGTGGGGATGCGGGTGTGGGCAAGTAGGTGGGAAGGTGGCCCTTTCTGGGTCTGGGCCTGGTGTCTGCCTCCCCCACCTCGGCTCAGGGGCAGAGAGAGGGACCTGTGTCATGTAGGGTGTTGTCAGCCTTGGGGCCTTTCCTAACCATGTTCGGGACATTTTCTTGTCCCCCTTCTCCCTGGAATGTGCTGTGAGCCAGCTGAGAGAGTGCCCCGGAGAGGAAACACAGCCTTAATCTGGGAGGCTAGATTCTAGGGCCCCATCCCGCGTCCCAGGCATCCCCAAGGAGGACCAGGTGAGGCTGTACGGAAGGACCCCCTTCTGGTCTGGCTCTCTCACCATCTGCCTACCCGGGGAGGCCAGTGAAGGAGACACAGAAGCAAAGCTCACTTTTCCTCCTTGCCTCTCATCTGGGGGGGACGGTAGCCAGGGAGGAGGGAGGGGAGAGAGTGAAGCTGGACACACCGGGGCCCCTAGGCCTTCTCTTTGCCAGAGTTGCTGCCGGGAGACTTCAGCCTCCAGTGGCCCCAAGAACAACTACTTTATCTTCCAGCACTTCTCCACTCCTTCACAGCTGGGCCAGTGAGTGGTTCATATGCAAGTAAAGATGGCAGTTCATTCAACAAATATTTATCGAGCACCTTTTACGTACCAGGCACTGTTCTAGGTGCTTAGGGTATTCTCGTGCTTCTGAGGGCTTGCAGACTGGGGAATTCCTCTTCCCTTTTAGCAGACGTTTGGAACATGGCTACACTTCCCGTCTGTAGCATCACTCAAGCACCCTGTCCCTGTTTCCCCCCCCCACCAGACTGGCAGGTGGGATTGGCCCTCTCCCTCTTTCCAACACCTTTCTCCATCCTCGAGAAATGGCTCTTTCGGGGCCTCCATGCCTTTCCCCTTTGTCTCCCCTTTGTTTTAAGTGATGTTTGTAGACGTACGTGGAAAATACCAAGGGTTAAGGTCTGCATCTCTGCCACGTCTCGCTCTCATCTCATAAAGCTGGCTCTTTATGTTGCTTTACATGCCTTAATATATGTTTTATGAAGATTATACATATTATAGATATATACATAATATATATATTTGTTTGGACGTCTGATCCTTTCCCAGAACTCCTGCCCAGGCCCATTTTCCCTCCT
TTACTTTCCACACCATTCCTAGCATGTGTCGGCCACACCCCACGCCTTTTGATCCAAAGAAGGGGAGAGGACGGTCTTATTTTAAGACAGATCTATTTTACGCTTTTGTTACAAAAGCAAATCTATTTTCAAAATGTGCAATGTCTGAATGGAATCAGCAAGTAATACGAGGAGATTGGGCGGCTGCCTCTAGGTCCAACCCTGTGTCCTTCCCTCTCCCCGCCCCCCCGCAGCTTCCTCCTCCCATCCCCCAGTCTGCAAAGGGCTGGTCCCCAGAGCTCACCCAGAGAGCATCTTACCAGGGCGGGACGTTCTCTTAGAAGTCCTGGTCTAAGGATTTGATTACACTGTCAACTCTTGACGGCCCTCTAGGGTTACGGGATGTGAATCCTCTCGAAGGAAATGTTTATAGCTGTGTGCACAAAAATACACCCCTGCGGGCAACCCGCCCCCCAAGTGTACTCCTGGACCACCTCCCGTCACCAATCTGCTGGAAAGGGCAAACAATTTAATGACAGCCTATGCCAAGTGGCACCAAGAACTCCACTCCCTGACGGAGCCAGGATACAGTACAAAGGCCAAAGGAAATGGTTTGGGACCACAGGTCCTTCAGCACAGACACATTTGAGTTCCTTGGACTTCTCACACTCCTTGATCCCTTTCTGGTCTGGGTCACATCTACAACATCTGTCTCCCTCTGTTACCCTTCCTCGGGGGGCTGTTGTTAAGGGGGACGGTTGCTCAGTCTGGCATCCAGACTGCACAGTCAGCTTCTGGGCTGAAGCGGGTCCCACGGATGAGGTGACATCTCAGCCTTGCCCAAGAAGCCCCTAGGACTGTCCTCTGGCGGGCTGCCACCGGGACGCTGAACTCCGCCAGCTCAGCCTTGCAAACTGCTTAGCAGCTGACGTAGTAGGCAAGGGGCTCTTGCCTCACAAGGATCTGGGCAGAATGGAAGTCTTTTGTCCAGATCTGAAATCAAGGGTTTGGGACTGTCACAGAGCTCCTGGCCAGCACTTGAAACCTGACCTCCCAACTTTGACATGTACTGGCGTCCTGTTCCCAGCCTAGAGCGTCTTGTTATGAAAGAATGGGGCCCAGATGGAGGCCCAGGGCTAAGTGACCCAGCGGGGACAGCCCTGGTTGCTATTCTGGGGCCTTGCCAATTAGCACATTACCTCCCTGATCAATAACCAAGAGGCTGTAATCAAATACGGCTACTGTCACTTTAAAGATTTTTCTGAGGTCGCAAGCTGTGCTCACTTGCTCTCCTGCCTTGGTGAGAGGCATGTTCTTGGGGCAGGGCTGACCATAGCAAGACGGAATCGATTCCTTTCCCCTTTAGGCACCCCCTACCTGGCAGCTCTTAAAACTAAGGAAAATACAAAATATACATATATATACATATATCTATTTATGCACATACTGGGGCCAATTTGATCTGCTAGTATTAGACAATAAACCATACAAGGAAATGTATGATCTCAGTGTCTTTATTTAGTATAAAAGTGACCTTAAAAGAAAAGTTAAGGTTAGCTGAACAGAGGGCATCTCTATTGGGGGACCAAACATCTGTAGCCACCCCATAGCATCTTTTTAGCCAACAAGCCCCTACCCAGGAGGGGCATCCTGACTGATAGGTGAGCGCCTGCTTCCCCACTCCCCAGCATTCTTTTCAGATATAGTAGGTACTGAAGAACCCCAGTGAGCTCTGCATTTGTATCTTGCAAGTTTGTATAAACCCGATGCAGGAAATAAAATGAA\n>XM_053554548.1 PREDICTED: Nycticebus coucang SH3 and cysteine rich domain 3 (LOC128560913), transcript variant X2, mRNA 
\nCCTGTCATTTCAGCTCTGACACCAAGGCAAGAGGCTAGGAGGTCTACAAATATCGTCTAGGTAGCTGGTGTGAGTACAGAGGGTACTGGGGGGGCTTAGCCCCCAAGGAAGAGGACCAATCCTTACCCAGCACCACCATCAAGGCCCCAGGGCCTCCCACTTACTTCCTTCCACAGACTGTGGACTGACTTAGGGAATCCCAAATCTGCAGCGACTGAAGCAGTTATTCAGGAAGGGGTCTACGGGGACAAAGGAGATGGAGATTCCCTCAGAACCCCAGGCCAATGGGGAGGCAGTGGGAGCTGGGGGTGGGCCCATCTATTACATCTATGAGGAAGAGGAGGAAGAAGAAGAGGAAGAGGAACCACCCTCAGAACCTCCTAAGCTTGTCAACGATAAGCCTCACAAATTCAAAGATCACTTCTTCAAAAAGCCAAAGTTCTGTGATGTCTGTGCCCGGATGATTGTTCTCAACAACAAATTTGGGCTTCGCTGTAAGAACTGCAAAACCAACATCCATGAACATTGTCAGTCCTATGTGGAGATGCAGAGATGTTTCGGCAAGATTCCCCCTGGTTTCCGTCGGGCCTATAGCTCGCCACTCTACAGCAATCAGCAGTACGCTTGTGTCAAAGATCTCTCTACTGCCAATCGCAATGACCCTGTGTTTGAAACTCTGCGTACTGGGGTGGTCATGGCAAACAAGGAACGGAAGAAGGGGCAGGCAGATAAAAAAAATCCTCTAGCAGCCATGATGGAGGAGGAGCCAGAATCTGCCAGACCAGAAGGCAGCAAACCCCAGAATGGAAACCCTGAAGGAGATAAGAAGGCTGAGAAGAAGACACTTGATGACAAACACAAGCAGCCTGGCTTCCAGCAGTCTCATTATTTTGTGGCTCTCTATCGCTTCAAAGCCCTGGAGAAGGACGATCTGGATTTTCCGCCCGGAGAGAAGATCACAGTCATTGATGACTCCAATGAGGAGTGGTGGCGGGGGAAAATCGGGGAGAAGGTTGGATTTTTCCCTCCCAATTTTATCATTCGGGTCCGGGCCGGAGAACGCGTGCACCGCGTAACGAGATCCTTCGTGGGGAACCGCGAGATAGGACAGATCACACTCAAGAAAGATCAGATCGTGGTGCAGAAAGGAGACGAAGCCGGCGGCTACGTCAAGGTCTACACCGGCCGCAAGGTGGGGCTGTTCCCCGTGGACTTCCTGGAGGAGATTTAGGCGCTCGCCTGCTGGCGGGAGACACCCACGCCCCCATTCTGGGCGGGCCCAGTGGAGCTTGGGGAGGCAAGGGCAACAGCAACTGGACTGCCGGGTAGGCAGGGGCGGGAAGGCCCGCAAGAGCCTGACGGCTTCTGCGTAGGGGCTGGTTTCCGCCCCTTCCTGACCTAGGGCCTGGGGCCCTGACGCCCAGAGCAGCCGCACAGGCCTCGGACCTAGCCTTCGAGAGCTAGAAAAAGAAAATATCTCACTGGGGGTGGAGGGACGGAGGCACTAACTGTCGAATGTTTCGAATTCACTAAAGTTTTGACAAAAGTTAGAAAAGTTA\n>XM_027475688.1 PREDICTED: Abrus precatorius basic 7S globulin (LOC113846927), mRNA 
\nAATAAAAATGGTGACATATCCCCGCCCACACAGATGAAGATAGAAGATAAGCACACACAGTGACACGCTTGCCATAAAAAAAGGTAAAAGACTTAGAAGAGAGTGAGCAAGAACCTAGACGCAATTTCATTCTTCTTCAGCAGCAAAACGTACGACCCTCCCAACAACCCTTCTCTTCTCCCATGGCTTCCTTTCCTCTCCTCTTCTCCTTTCTCTTCCTGTCCCTCGTTCATGCTCAATCTTCACTTTCTTTCCACATCCCAGTCACCAAGGACGGTTCAACCCTCCAATACTTGACCACCCTCTCTTACGGAACCCCTCTTGTACCCACCAAACTCGTGCTTGATCTGGGAGGCCCTTTTCTCTGGCTTCATTGTGCATCGAGAAACACCCCTTCATCTTCCACTCTCACTACTCCTCACCGTTCAATTCAGTGCCTCACTGCAAAAACCCACAAACCCGATGACTCATCCTCCTCCTCTTCGTTTCTCTCTAGCCCCGTGGACGAGGACCAGTACCAACCATGCCAAGTTCTCCCAGAAAACAGCATCACAGGCACAGTGGCCACAGAAGGAGAGCTTGTAGAAGACCTCATGGCAGTACAATCATCTCACTTAGAAATCATTCACCAAGTTAGCTTCACCTGTTCCCCCACCAGCATGCTCTTAAACGGCTTAGCAAAGGGTGCTAGAGGCATGGTTGGTCTTGGTAGGTCTCGCAGTTCCCTTCCCTCTCAGGTTTTCGATTCCTTCAGCACACACAGGAAAATCACTCTCTGCCTCTCATCATCAAAAGGGGTTGTCCTCTTCGGCGACATGGCCTATTACGAGTCTTCTCCAGCCGTAACTGAGAGTCTTAAGTCTCTTACATTCACACCCCTTGTTACCAATTTCCCATCTCAGGAATACTTCATCAACGTTAATTCAATCAAAATCAACGGCAAGAGGTTGTCGTTGGACACGTCATCACAGTCCCTCGAGCAAGAGAACAGTGGTGGGGCTCTTACTTTGTTGAGCTCAATTGTACCCTACACCACCATGCAGAGCTCGATCTATGCTACTTTCAAGGCAACTTTTTTGGACGCTGCTGTGGCTTTGAACATGACCATAGTGGCTTCCGTGGCACCCTTTGAGCTTTGCTTTGAGGGCTCGCACGTGGGGGCAAGTGTGCCGGCGATTGAGCTGGTGCTGCAGAGTGAGATGGTGAAGTGGAGCATACATGGGAGAAACTCCATGGTTAGGGTAAGCAGCGAGGTTGTGTGTTTGGGGTTCTTGGATGGAGGTGTCAACCCAAGAAATCCCATCATCATTGGGGGGTATCAATTGGAGGAAGTAATAGTACAGTTTGATTTAGCTACTTCCATGGTGGGGTTTAGTTCTTCCCTTTACACTAAGAACACTGGCTGTTCCCATTTTAGATTCGGTTCCATGCTTGCAGACTCAGTTTGACTATTCGTTATAACTTCGATTATAGTACTGATTATTAAATTTTCTTCTTCAAACTATGTTTCTGAACTTTCTCAATTTTGTACGAGCTTGATTTTTGTGAAGCTTTTTTTGTTTATTTTTTTGGGGGGGGGGGTTTACTATTTAGCTGTACTAATCGAGGCTGATGAGATATTATGATCTTGTATTTTGATGGGACTTCTGCGTCAATTTGAGTTTTATGATATTGGAATACTAGTCGACTTTCAAGATGCTCGATTGAATTGCGAAACCTGAAAAATATCACTGAAAGATTCGTTTCCTTTCCTCCCTCTGTTTGATAAGAAGTGCATCCCACTGGGGAATTTGGACAGTGCCGAAGGAATAATCCTTTATGTACTGCAAAAGAAAAGGGTATGCTCACATAATTTGTTATGTATTTCTTTTTTTCGTTTATTACATCAAGATCTT\n>XM_023724909.1 PREDICTED: Trichechus manatus latirostris CKLF like MARVEL transmembrane domain 
containing 5 (LOC101347816), transcript variant X5, mRNA \nGGTTTCTTGGACCTTCCTGCTTCTGTCTGCTTCCTCATCCTGCCAGGTTTCAGTTTCCCTTCCAGGCTGCTGGTGGTGGTGTGGGGGGCTGTGCCTGGTGGGTCCCATGGAGATGCTTGGTGCTCGGGACCGCCTGGACTGGCCCCCCGAGGAGGGGACGGCTGCAGGGCTCCAGGCCTTCGCTGTGGACAAGAACTTCCTCTCCTCCCTCAGAGGCATCCTACTGGAAACCGAGCTGGACTTCCTCCGCTGTGTCAGTGCTATCGTCATCTTCCTGGTGATCTCCATCGCTGCTGTGACCTCCCGGGATGGAGCTGCCATTGCTGCTTTTGTTTTTGGCATCATCCTGGTTTCTGTCTTTGCCTATGATATCTTCAAGATCTACCAGACTGAGATGGCACCCAGGGCTACCGAGGCTCTTGGCCCGCAGCTTGTTGACCTGGGACTCAGCGATATCTGCCCGCTCCTCTGCCTCATCCAGCTCGTGCTGCACCTTGCGGAACTTGGAAAGGCATTCCTGGATGGCGAGAATGGTTAAGCACTTGGTTGTTAACTGAAAGGTTGGTGGTTTGAGTTCATCCACAGGCACCTTGGAAGAAAGACCTGGTGAACTACTTCCCAAAAACCAGCCATTGAAAACCCTATGGAGCACAGTTCTACTCTGACACACAAGTTGGAATTGATTTGACAGCAACTGGTTTGGTTTGGTATTTCGTTTTTAACAACAAGCTATGCTTTTAGGATATTCTTTGTTTTGCACTTCTTTTCCTTTTTCTATGAAAATGGGTATGTTCTAGACATTGCAGCTAAAATGACTCAGCTTTGAAGAAAGATTCCAAACAGCAAAGTTCTACTCCTGAACTCTTTAGTAACACGTTTATATGGGAACTATTCCGAGGAAAATGGAAACAACTTTTTTTTACTAGGGCAATATTCTTGAAATGATTGTAGTTGTAGAAAGAATGTATGTTGGGTAAGGAAGAGGGGACCAGGTCAGTGGATGGTGTCATCCCACATATATGTGCTAGATTATGGAACAAAACTCCACAGGGTAGTGCAATAGTTGGTCACAAAAACCCATTGCAGAATATAATTGAAGGGACCATGGTCTCAGGGAACATCTAGCTCAACTGGCATAACACAGTTTATAAAGACAATGTTCTACATTCTACCTTGGTGAATAGCATCT\n>XM_006974484.3 PREDICTED: Peromyscus maniculatus bairdii ArfGAP with coiled-coil, ankyrin repeat and PH domains 2 (Acap2), transcript variant X7, mRNA 
\nTGGCCGCGGCTGTCACTCCGGGGCGTTTTCCCCGGCCGGCTCTCAGCTGGGGCGGAGGAAGAGGCGGCCTGGGCCTGCCGAGCCGTTGCAGTCTCCGCGGCTGCTATGCCCAGGGTGCGCGGCGCCCTCCGCAGCTCCGCGCAGCGCTAGAGGCGGCCGAGCGCTCGCCGACGCCGCCCGGATCCCCGGTGCCTCCGCTCTCCCGCTCCCGCAGCTCCCGCGGCTCCTCCGGCGTCGCCTGCGAGGCCAGGCAGAGGCAAGATGAAGATGACGGTGGATTTCGAGGAGTGTCTGAAGGACTCGCCCCGCTTCAGGGCTGCCTTGGAAGAAGTAGAGGGAGATGTGGCAGAGCTGGAACTAAAACTCGATAAGCTCGTGAAGCTTTGTATCGCAATGATCGATACCGGCAAAGCCTTTTGTGTGGCAAATAAACAGTTCATGAATGGGATCCGAGACCTGGCACAGTATTCTAGTAATGACGCGGTGGTTGAGACAAGTTTGACCAAGTTTTCTGACAGTCTTCAAGAAATGATAAATTTTCACACAATCCTGTTCGACCAAACGCAGAGATCAATTAAGGCACAGCTTCAGAACTTCGTTAAAGAAGATCTTAGAAAATTCAAAGATGCCAAGAAACAATTTGAAAAAGTCAGCGAAGAAAAGGAAAACGCACTAGTGAAAAACGCCCAAGTTCAAAGGAACAAGCAGCATGAAGTGGAAGAGGCCACAAACATCCTCACGGCCACGAGGAAGTGCTTCCGGCACATAGCCCTGGACTACGTCCTTCAGATTAATGTGCTTCAATCAAAGAGGAGATCAGAAATCCTGAAATCAATGCTGTCCTTCATGTATGCACATCTGGCCTTCTTCCATCAAGGGTATGACCTGTTCAGTGAGCTTGGGCCCTACATGAAAGACCTTGGAGCACAGTTGGATCGACTGGTTGTGGATGCAGCAAAGGAGAAAAGAGAGATGGAGCAGAAACACTCTACTATCCAGCAGAAGGACTTCTCCAGTGATGATTCCAAGCTAGAGTATAATGTAGACGCAGCGAATGGCATTGTCATGGAAGGGTATCTCTTCAAGCGGGCCAGCAATGCCTTCAAAACGTGGAACAGGAAAAAGCCCGATCATATCAGACGCTGGTTCTCCATACAGAACAACCAGTTGGTTTACCAGAAAAAGTTCAAGGACAGCCCCACTGTGGTGGTGGAGGACCTCAGGCTCTGCACCGTGAAGCATTGCGAGGACATAGAGCGGCGCTTCTGCTTCGAGGTCGTCTCTCCAACCAAAAGTTGTATGCTCCAGGCCGATTCGGAAAAGCTTCGCCAGGCCTGGATTAAGGCAGTTCAGACCAGCATTGCCACCGCCTACAGAGAGAAGGGCGATGAGGCCGAGAAGCTGGATAAAAAGTCATCTCCATCAACAGGAAGCCTAGATTCTGGAAATGAGTCAAAAGAGAAGTTACTGAAAGGAGAAAGCGCACTGCAGCGTGTCCAGTGTATCCCTGGCAACAGCAGCTGTTGTGACTGTGGTCTGGCAGACCCACGGTGGGCCAGCATCAACTTGGGCATTACCTTGTGTATTGAGTGCTCTGGGATTCATCGGAGTCTTGGGGTTCATTTTTCGAAAGTACGATCTTTAACTTTAGACACTTGGGAGCCTGAGCTTTTAAAGCTTATGTGTGAATTGGGAAATGATGTTATAAATCGTGTTTATGAAGCTAAACTGGACAAAATGGGAATAAAGAAACCACAGCCAGGACAAAGACAGGAGAAAGAGGCATACATCAGAGCAAAATATGTGGAGAGGAAATTTGTGGATAAATACTCCATGGCATCATCACCTTCTGAGCAGGAGAAAAGGGTTATCTCCAAAAGCTGCGAGGAGCAGAGGCTGAGCCAAGTCAGAGCATCTGTCCACACCGCAGTCAAAAGTAACGACAGTGGGATCCAGCAAGGCTCTGATGATGGACGGGAGTCTCTACCTTCCACCGTG
TCAGCCAATAGCTTGTATGAGCCTGAAGGAGAAAGGCAAGAGTCTTCTGTGTTTCTGGACTCGAAACATCTTAATCCAGGACTTCAGCTTTATAGGGCTTCATATGAGAAAAACCTTCCCAAAATGGCTGAGGCTCTGGCTCATGGTGCAGATGTGAACTGGGCTAATTCAGATGAGGACCAAGCGACAGCACTCATCCAGGCTGTTCTGGGGGGCTCTTTGGTGACGTGTGAGTTCCTCTTACAGAATGGTGCTAATGTGAACCAAAGAGACGTCCAAGGGCGGGGCCCGCTGCACCATGCCACTGTCTTAGGACACACAGGGCAGGTATGTTTATTCCTGAAGCGAGGTGCCAATCAACACGCCACTGATGAGGAGGGGAAGGACCCCTTGAGTATTGCTGTGGAAGCAGCCAATGCCGACATAGTGACCTTGTTACGTTTAGCAAGAATGAATGAAGAAATGCGGGAATCAGAAGGACTTTATGGACAGCCAGGTGATGAAACTTACCAGGACATCTTTCGTGATTTTTCTCAAATGGCATCAAATAATCCAGAGAAACTCAATCGTTTCCAGCAAGATTCACAGAAGTTCTGAGCCTTTTAAGAGGGGAAACTATGAAATTTGGTGAATTCCTAATGTGTACAACCAAAATCTCACCCCCCCCCTTTTTTTTTTACTGCTTTAATTCTGCTTGATTTTGGTGGACATTGAATTGTTTGGAAAAAATGGTACCCATTCATTGGTATTTTTGAAAATGAAAACAGATCTTTCATAATTGGGAAAGGGAGAAATCCACTATAGTTCTTCTTTTATTTAAGAAGAAAAAAGCCTATTAATGGGTTGTGCTTTTATATAAAGTTGTATCCAGAGCTGGACCATCCTCTCTTAAGTTCTGAGATGCTACACTGTTAGGCCCCTGCACCCTTTGCCATGGGTGGTACACGGTTCCCCCAGGAACATTGAGTCACTATGCCTGCGTCAGGTGGGAACCAGTTTTCTTACCTGTATCAAGGATGTTTCTTTCCTATAGCTTCCCTGATAGATGCATGTGTGTTTTCTGGTAGCTTCGCTGTGGTACCCACGGTATGTGATGTAATTGCGAGGACTAGTGAGGGTGTTCCTCATTTGCTCGGACAGGCCATCGCACTTGCGGACTTGACAGACATGGCTGCTGCACAGTGGACCACACATTAGTCTTTAGACTCATTTCATCTTACGGTGCAGAGGAGCGCTTCCTTTTTCTTCTGTCAATCTCCACAAGACTCCCAGCTTGCTTTTTATTGTTGGATTGGTTTCCTAAAACCTTGACAGATCATCAGTGCAATAAAACGATTTCAGAGGTTGACTATTACAAAATTGGGCTTTCATCAAAACAGGGTGATTTCAAAGATAATGTAGGGCATTTTTATATTTGGAATTTATCCATTTATATATATATATATATATATAAAATTTATATATATATAAAATTTACTGTTACTCCTGGTGGAAGATGTAAGGAAAAAAAAGCTAATTTTTTTCTGTTTATATTAAAATTTACCAGCAATAAATTCCTTTTATTTTTTTCTACATTTATCTTATTTACTATACAACAGTATACATTCTTTTAAATTGTATCCTGTATATAGCTTTAGAATTAAGTAAAATATGTCATTGACCTTTGAGTTCCAAAATTATGAATATGTGATACAGTTTGGTGAGATTCCATCTCTGATTGACATGTCTTGTCAGAGTATGGAATGAATAAGTAATTACCTTATGGGTCATTTCCAGTACTGTTGATGACGTTCAGTCTTTTAGAAATTATTTGTAAGATACTCAGCTTCACAGAAACATTTTTAAATGTATATAAAATTATAGTTAATTAAATAAAAATTTTTAACATTTTCCCCACAGTATGTAGAGCCTTACTTTGATTGAATATAAAATCAGAATCTAAGCAGAAATCATATGGAAATAAATTCACAGCACAGATAAAGGCCCTGTCGTTCAGTCAG
ATTGCAAGCATGCAAAGCTTAGTAAGTCCCCACACATTAGGGATACAGAGCTATTGTGATTTGTTTCCAGGGAAGTGCAAACTTCCACAGGATGAGAGGAATTTTGTCTCTCCTGTCTCACCTCAAGCTTGCAGACCATCTGGCCTTGTAGGTATTTTGTTAAAGACAGAAGTCTAACTTTAACTGGCGTGTGTTGTAAAATTTATTGTCCTAAAACATGTTGAGGGAGGACCAGGCTACAGAAGGGCAGAAAGTCCGCCATGTTTCCCTCTGCTGGGCTCATTCTCGGTGACTGCTGGAGCGCCCCCCCCCCCTTGTCTGGAGGTGCTGACGGGCTTCCCTGCGGTCCAGCTGCCAGGAGACTGTCCCCCGGGCCTGCCTGCCTCCCCACCTCGTGTCAGAAGTTCTTGGTGTGGTGGTCAGTAGTGTCTGCTGCCCTTTAATGGCTAGTGTTTTTGAAATAAGCCTTAAAGATTCAGTGTATTTGAAATGCCTTAAAGGTTATTGTGGTTCTGAGTATCGTTAGAAAAAGCTACACCTTTTCGTATTGCATGGAGGCTGGCAATGCAAGAATATATTTCTACAGCTTAATTTCCTCAACGTGCTGAGAAATTGAATAGCAGAAAGGAATGGAATAGAGCAAGGCTTTAAATTCATAGTTACAAAGTAGCTTGGCTTTTAGATGAGTTTTGCTATAATAGCTTATGTGGCCTGTTGTGACGCCTTCTGTGCATTAGGAGAGAGGAGTATACGCAATGCCAGTTGCACACTCAGGCTGCTCTTTCTGATTGCTCTGTTTTCTCTCCAGGACAGACATGCTGAAAATAGTGTGATTCTTTATTATTAGTCTGTTCACTCTTTTTCATGCTCTCAGTAATGTCAAAATTGTATTACTGCCAAGAGAAGAATAGGGGTGCTATGAAGATTCAGAAAATGCAGGCGTAACATGGGCATAGATAAAGGTGATTGAGTAGCCGTTCACCAGGCCTCATTGCAACACTTACATGTTTAAGATTTCCAAGATTTCCAATTTATTTTTATTCATTTTTAAAAGTTTCCAGCATTCCAGTGTGCTTGACTAATTGATGCTGGTGTTTGCTGTAGTGGAGTGAACTTTGGTGTTACTGCCCCCAAAGTAATCCAGCTTGCAACTTGTACTTTAGAACGTCATAGGTGCATTTTTGGGGAAAAAAATTATACATTCACATTTTAGAGAATTTAAGTTTGTGATCATGTTAGCAGTATTTAAAAATAAAAATTCCTGCATATTAGATATGATCATAAACCAAGTTGTTTTATTTAAAACTAAACTCGCTACCCACTTGGAATAATTGAACATTCCTAGACCACTCATTCTCAAATTTTTTTGTGTGGTTGCATTTTGACCATGGCTAGAATTTTTTAAAATGAAATCTTATGTCCATAATAACTTCAGTTTATATCCTTCTTGGATCCAGGGCTCCTCACAAGTGAAAGGATGAAACAAAGGGAAACTCTAAAAGCTCCCCTCGTGTGTGTTTCATGACTTAGAGTGTTCTTCACACTACCTTTCCTCACCTGCTGCTTACAGGACTCCTAGATCCTAACCACGAGCATCAGCCTCGTCCGTCCGTGTCTCCATCCGAGCCCACTCCTCTCGTTTTACAGAGAGCGTCACTTCCTTTGCTAGTTGGAGGCCGAGCTGACCCAGGTCTGCCATAGCTTCGAAGCACTTGTATCATGGAAGGATTTGAAATCGCCGTAATGTAAAGCAGCAGCTTTCCCTGTGTTTGATAAGAAACTCCAAATACTCTGGAGAACCTCATGATGAAGTTTGAGGGACTAGATTGGGATTTGAAAGCATCAAATTGTAGAAAAGTCTCCAGATTTTACAATAGCAAACATTAATAAAAGCAAAGTATTATAAAGTTAAACTCACCATTTATTAACTTTTTGATGTTTTCAAATGAAACATAACCATGGAAGGGACTTGGATTCAGTTTGGCTGAGTCCTAACACCT
AGAAGGATGATTTTTGTGGGCGTCTTTTCCTGTTTACATAGAGGGGGATCATGTGGACAAAGAGAGATGGAATGAAATACAAATTTTCTTTGCATTGCTGTTCTCACTATCTTATTTTCTAGATTTTTCTCATTCTCCAGTTTTATTTTGGGTTATTAATTTTTAACAGGGAAAGCTTGCTGCAGTATCAAGGTTGTTAGCACCATTTAATACGAAGGCTAAAGGTTAACTTTTGGAAATGACCAGCTCCTTTTTAAATATCTGTTTACGTGCGCTTTGTGATATTTCTGGATCATTCCGGTCATAAAGACTGATCACGTGTACTATTTCTTGCTACCTGTGAAAAGGGTTTTAAGAATGTATAACCAACACTCCATTAGTTTTTATTAGTGTGTAGAAGATTTGTATCTAATTCATGAATGTAGTTTTACTGTAGTTTGTCATTGTAAATGGAGCAAAGTACATTATCTTTATAGTTCTTCTAAAATGTACATTATGTAAGAATTGTAAATATACTTGATTACTTTGTATGCTGAAAATTTACAATAATAAGTCAATAAAAATATCTCACTTCTGGCACA\n>XM_038145225.1 PREDICTED: Motacilla alba alba chromosome 9 C2orf72 homolog (C9H2orf72), transcript variant X3, mRNA \nTCTCGCCCCGCTGCCCCGGGGTGTTGCTCTTCGCGGGGCCGGGGCTGGTGCAGGGTGGCGGGGCGGGTGCGGGCCAGTGGGCGGTGCGGAGCCGGGGCCGGGGAACATGCGGATGCAGGCCGGACAGGGAGCACGGCGGGGGATGGCGGCGGCAGACCTGCAGGAGCTCCGGGCGCTGGTGGAGCGGGCGGGCGGGCGGCGGGCGGTACTGCTGGTGGCCGAGGTGGCGGAGGGGGCCCCGGCGGCGCCCGCGCTGGCCGCCTTCGCCCGCGACCTCCTGGACGACGAGGCGCCGCGCGCAGCGTGCCCGGGGCCGGCGCCGGTGCCGGGGTGCCGGGAGAGGCGGTCGCCAGGCGCCGGGCGCCGGGCGCTGGGAGCGCGGCTGCTGCTGGTGCTGTGCGGCGGCGGGGCGGCGCGGGACCGCGGGGCGCGTACTCGCCTGCGGGAGATGGTGCGGGACGTGCGCGGCCGCCTTCCCGCGGGACCGCCGCCCGCCGTCGTGGGCGTCCTGCTGCCCGGCGGGGACGGAGAGGACGCGGCGGTGCTGGACGCCGCGCTGCGGCGGCACTTCCCGGCGCCCGGCACGGTGCAGGCGGCCCGGTACAACCCGGGCAGCCCAGGCGACTGCCGAGCCGCAGCCTGCCGCGCCCTGCGGGCTGCCCTGCAGCACCCCGCAGAAGACATGAAAGACAGGGAGAGGTGGAGGCTGCCATCCTTCCTGCAGTGCATTTCTTGGAACCAGGGGAGCTGGAGAAAAGATTACAAAGTGAAAGCTGAAAACAACATTCATGAAGGTCTGCCTTGACCTCTCTCTGCTCCCTGCAGATGACCTGCAGGACCCTGAGGAAGAAGTGGCTCTGGCCAGCCTTTCCCCCAGTGGAAACTGTGAAGAAGCTGCTGAAGGCACAGGCACCTAGAGCTGCTGGGCATCCAACACAGTCCACATCCCAGACCTGCCCAGTGGATTTGGAGCAATGGGAGGAGGAGCTGGTGCAGGCCCTCTCCTCCAAGGACCCACAGCTCCAGGGAAAAGCTGCTTGGCTGAACTTGTCAGGGTATTTTTAGCTGCCACCAACACAGAGGGTCTGTGCCAGAGAGCCATTCCCTGCTGCCCCGGGGCACTTGGAGCTGCTGCTGGACACTGGGCTTCTGAGAAGCCCTTTGGGGATGTACCCCACATCCCGGGCAATATGACATTGGGACTTTGAGTGTGAAATGCAGCCACCTGTTTGAAGAATGAGAAATGTTTTCAACTTCTGAGCAAAGTTCCCTGCTGAGGTTGCTGGGACCGGCCTCCC
TGGCAGACTGATTCTGCTGCCTTGTTTTCCTACTTTATTGGTGCTTGGAATTTCCCACCCTCTTTGCCGTTAAAAACCAAACCAAACCAAACCAGAACAAAACAAAACAAAAAAACAAACAAAAAAACCCCCACAAAAGAACCCACAAAAAACCCCCAACGAAGTAATACAGCAGCTTGGAGACTGCAGTAGGACTAAATGTGAGTGCCGGGATCTACCAGCTACTGAAAAGGCATGAATGTAACAGTGTAACAAGAAGAATGCAGTAACAGCCCAGCTTGAGTGGCAAGAATAACATGAAAGATACTGATAGTACTGGCATCTGGACCAGAGTGGGGTTCGGGAGCGGGATCTGTCCCTCTGGCTTGTCCCGGTGCTCATAGGCTAACTGAGGGATGCCTGGGTTGGAGGGGTGGCGGGTGGGCTCTAAGGTGTGGCTGCTGCTAGATGGGGCTACAGGAGAGAGCCATCTTACCTGGGAGATCTCCACAGGCATGGTGGCACAGTTTGGAGGTGGCCTGCAGCACAACAAGAGGTGGCTGTTTCATAAATAAACATAAAAATATAAAAAAATATATTTAAGTAGTTCCAAAGGGTTGCCGGTAGCCTGTGGGGCAACACAACTAACCAGAAATCATTGGTTTACAAGGAATATTACTTTAATGTTAAAAATATATTTTTAATTCTTTATGCAACATCAAAGAGGTCTAGTTTTATTTTGAGCACAAGCCTGGCTTTCCTTTAGGAGTTTCCTCCAGCTCAGATCAGAAATTTCAACCTGCCTGCCTCTACTTTGGGTGAATTGCCAAAGTGCATCCTCTGTGCATGTCTGTCCTCTCTCTGGCTCCTTCTTCCCCACTGGCAGCAGAAGTGTCTGGAGTCCTGCCAGCTCTGGCCAGCACTCTACCCCAGCAGTTTGCCTTTGGCATCCCTCTAGCTCTTACCTGGAGCAGGGGATGCTGCTCTGCAGAGAGGGCACTGACCCGCTCTCCTTCCAGCCTCCAGGATTTCTGGAGAAATGACCTGTGGAAAACACAAATGTAACCAAGTGGCTCGCTGTGGGTGGCTGTGTCACTGGCCCAAATGTCAGCACTGAGCACTCAGTGCATCTTGGTGAGATTAAGGCTCCCTCCTGCTCCATCCCTGCATGGCCCAGGTGGCTGTGCAGGTCTGTATTTCCCAGCAAAGCCCTTGGTTAGGTGGGTCAAGCAGGACTCACCAGCAGGAATCTTTATTTTCTTGCAGCATTTAGCCTTTGCTGCTAAGCATTCTCCAATGAAGAGGTGATCCAAGAGCACAGACTGGCAGTTAAACCTCCCTTAGTGCTGCAAATCCACTGGATTTATTTACTGGTAATTTTGAGGTAAATCATGCAAGTTTATCCCTGCAAGAGACTGCTGGAAGTGGATGAACTGCCTGGGCCTTAGGCAGTGTGAGTGAGAATATATTTGACCAAAAGTATTGTTTTTCTTTCACTGAGGAATAAAAGTGACTTGAATTACTTTTTTTTTTTCCCTTTTCTCTTTTCACTATCTGTGCACTTGGAGGTGTAAGCAGATAGTTTTACGTGTTTAATTAATTGAATAATTTAAGGGCACTATCACATGCTTGTAAAATAAAGACACTTTCCAAATTGGAATGTGCTTATTTGTTTGCCATGGTGTTATCCTTGAAGCAGCATTATGTATAGCTTAACTCATATTTATCTTGGCTTGAGAAAAATGGATATTGGGATGGAATGGAAGTGACCCCAGTGTTTGAAATGCAGAAGATCAGAACTGAGTGCAGTCCAGGTGGAGCAATGGAGAAGGCTGGACATCTTCCCAGTTGTCCAAGAGCAGGGCAGTCCCTCTTGGCATTGTGGGTCGGAGTTTGATAAGCTTTCATTAGTAACTTTCATTAATAACTTTCACTAACTGATACCATTATGCATCCTCAAGGAATTCAATATATACCCTTCATAGGGTATTTCTTCCTAGTCAGTAGCATCAAGGAGAAAT
GAATGCTGCCGAGGTCTGGGCACTTCAGTCTCTTGTTGCTCATCGTTGCTCCTGAGCTGGACTTTCCCTGGTGCAAATCCACCACCCTGGGTATCCCATCCGTCTTGTGCCGCAGAGGCGGCCGGCACGTGTTAAACCCATGGGATAAAATCGCTGATCCTTGCCCTGCCCTGGGACACGCTATGCCCCTACAGATGCCCACCCCCTGCGGGCGGCCTGTGCCGGCGGGGGAAGCAGCCGCTTCTCTGGGCACGGCACAAACGCGGGCACCGGCGGGGTCACTCGTGGGGAGCTCACAGCCGCGGTCCCGCTCGCGCCGGCAGCGGTGTGGGGTCTGCGGGCGCGGGAGCCCGCGGGGGCAGCGGGGGAGCCCCGGGAGGCCGCGGGGGAGCCCCGGGAGGCCGCGGGGGAGCCGGGCAG\n>XM_030524043.1 PREDICTED: Scaptodrosophila lebanonensis synaptic vesicle glycoprotein 2C-like (LOC115628070), transcript variant X7, mRNA \nATAGTTCAATTATTGAATGTGTTGTACATATTTAAAAGTGCTTAAAAATATAGAAAAACTATGTTCTGAAAAAACACCTCTTTCAAGTAGTAAAAAGTGGAAAGAGAGAAATCATTCTAAATGGGTGTAATATATAGTGTACAACCAGAATTGTGATATAGTGCCTTAATGATAAAAAGCATTGACATTCAACTTGGAAGTTTGCGATGTTTCAAGGCATGCATATGTCTTGACTTTTTGGAGGATTTAGGAAGCGACTATGAAGATGCACTTCTACAAGCTGAATTTGGAAAATTTCATTTTCTTTTACTTACGATATGTGGTCTTATATACCTAAACACAGCAATAGGAATAACTATAATATCATTTGTTCTTCCCACTGCAACTTGCGATTTTGATATGACGTCTAAAGATAAAGGCTGGCTATCTGCTTCTCCAATGCTGGGAATGCTGATAGGATCATATTTTTGGGGATGTCTCGCAGATACAAAAGGTCGACGCATTGTATTAATTGTAACTCTCTTAGCAGACGGTATATGTGGATTGGTATCATCACTTGCACCTTATTACCTCATATTCCTGTTTATTCGTTTTGCGAATGGTTTCAATGTGGCTGGAACAATGGGCATTGTGTTTCCTTACTTGGGAGAGTTTCAACCAACGAAGTACAGAGAAAAAATTTTATGCTGGATGGAGCTTTTTTGGACATTTGGAATCATTTTACTTCCAGGAATCGCGTGGAGTGTAATTCCATTGCAAATAAATCTCCAATTTAGTGTTTTTACTTACCACAGTTGGAATCTCTTTGTTGCAATATGCGCAATACCCAGTATTTTGCTGGGTCTTTGGCTTTTTTCATTTCCGGAAAGCCCAAAATTTCTATTAGAGCATGGGGAAACAGACAAAGCGCTGGATATTCTCGTTTGCATGTTTATACAGAACACTGGACGTAAACGTGATGACTACCCTGTAAGACAAGCAAAAACTCTAAATAAGCTAATGTAAGAGTCTACGTGGCCCAGACCGTTCTAATAAGAAAAATGGCGAAAAGGGAATTCCTAACCTTCGATTTAGAAGACCGAATGAGTTAAAGATATTAATATCGGAAATTTGGACACAAACTAAAACGCTTTCC\n>XM_040248511.1 PREDICTED: Oryx dammah pre-mRNA processing factor 18 (PRPF18), transcript variant X3, mRNA 
\nTTGCAAAAAAAGAAGAGGAAGCATATTTTGAAAGATGTGGCTACAAGCCTATAAATGAGAAGCCACCTGGAGAGAGCAAGGATCAAATAACCCTGTAAGATGATTTTCTCAAAGAGGAGAAGCAAGCTGATTGTTTCCAAGAAGAAAGTAAAAATCTTGGAGTCTAGGGAGAAAATACAGCCAAAAGATGAAGACCAGAAACCATTAACTTCATCGAATCCAGTATTAGAACTTGAACTGGCAGAGGAAAAATTACCCATGACTCTTTCTAGGCAAGAGGTTATCAGAAGATTGAGAGAAAGAGGAGAACCAATCAGACTATTTGGAGAAACAGATTATGATGCTTTTCAACGTTTAAGAAAAATAGAGATCCTCACACCGGAGGTTAACAAGGGATTGAGGAATGATCTGAAAGCAGCTTTGGATAAGATTGATCAGCAGTACCTCAATGAACTTGTGGGTGGCCAAGAGCCTGGAGAAGAAGACACCCAGAATGATTTGAAAGTTCACGAAGAGAACACCACAATTGAAGAATTAGAGGCTCTGGGAGAGTCTTTAGGAAAAGGTGATGATCATAAAGACATGGACATCATTACCAAATTCCTTAAGTTTCTTCTTGGTGTTTGGGCTAAAGAGCTGAATGCCAGAGAGGATTATGTGAAGCGCAGTGTGCAGGGTAAACTGAACAGTGCTACTCAGAAACAGACTGAGTCCTATCTCAGACCCCTTTTCAGAAAGCTACGGAAGAGGAATCTTCCTGCTGATATTAAAGAATCCATAACAGATATTATTAAATTCATGTTGCAGAGGGAATACGTGAAGGCTAACGATGCCTATCTTCAGATGGCCATTGGAAACGCCCCTTGGCCCATTGGTGTTACTATGGTTGGCATCCATGCCAGAACTGGCAGGGAAAAGATTTTTTCCAAGCACGTTGCACATGTTTTAAATGATGAGACGCAGCGGAAATATATTCAGGGACTGAAGAGGTTAATGACCATTTGCCAGAAGCACTTTCCTACAGATCCATCAAAATGTGTGGAGTACAATGCACTATGAGATCTGTGTGCGGTGTGTAAATATCAAGAGAAACTTAAGGAAGCCTGTCACGGACTTCTGGAATTACCACCAGTTGCAATGAGGGAAGAAGAAAAAAGGAGTTTGTGGTCTCTGAGTTCTACCTAATGCAGCTCTTGGTTTTAAGAACGTGTGTTGGCTCTCATGTCACATCTGACTACAGAGTGATTTTTGTGTCTTACTTTTTAAGTAGTCAAAAAATTAAGTACTAAAGACTTTCCCCAGTAATTTAAATGTGTAAATTTAAAACAGTCACAGGACACGGTTTAAAATAACTTTTCCCCTCTAGACCTAAAAGTTGAAATGAGAGGATTAAAGAGGAACATTTGAGGATGGACTTAATGATTTCTATAAAATATGGTAATTTTCATGTTGCCTTTTATGTTGTGTTTATAGAGAAATATTTTTATATTTTTCAACAAAAATATGGAACTATTTAGTGAAACTTGATCATCCTTAAATGTTGCTTGACTTTTGCCACCTTGCAATATATTTGAATGTAAATGTTTTTACTATTGTCTATCTTGCATTTTAAAGCTTTTATCCTTTAAAGATA\n>XM_027406478.2 PREDICTED: Cricetulus griseus probable global transcription activator SNF2L2 (LOC100770307), transcript variant X12, mRNA 
\nGGGCGGAGCCCGAGTTTAGGAAGAGGAGGGGACGGCTGTCATCAATGAAGTCATATTCATAATCTAGTCCTCGCTCCCTCTGTTGCTGTACTCTGGGTGACTCAGAGAGGGAAGATTCAGCCAGCACACTGCTCGCGAGCAAGTTTAGTGATACTCTGCTGACTGGCAGAGCCAGGAGAAGTAGATGTCCACACCCACAGACCCAGCTGCAATGCCCCATCCTGGGCCTTCCCCGGGGCCTGGACCCTCTCCTGGACCAATTCTGGGGCCCAGTCCAGGACCAGGACCATCCCCAGGTTCGGTCCACAGCATGATGGGGCCCAGTCCTGGACCGCCCAGTGTCTCACATCCTATGTCAACAATGGGCTCTGCAGACTTTCCACAGGAAGCCATACACCAGATGCATAAGCCCATGGACGGGATACATGACAAGGGAATTATAGACGATGCCCACTGTGGATCCATGAAGGGCGCCAGCATGCGCCCACCACACCCGGGAATGGGCCCTCCACAGAGCCCAATGGATCAGCACAGCCAAGGTTATATGTCACCACATCCTTCTCCTTTGGGAGCCCCAGAGCACGTCTCCAGCCCTATATCTGGAGGAGGCCCAACCCCACCCCAGATGCCACCGAGCCAGCCAGGGCCACTCATCCCAGGAGATCTGCAGGCCATGAACCAGCCTAACAGAGGTCCTTCGCCTTTCAGTCCTGTCCAGCTGCATCAGCTTCGAGCTCAGATTTTAGCTTACAAAATGTTGGCCAGGGGCCAGCCCCTCCCTGAAACCCTGCAGCTTGCAGTCCAGGGGAAAAGGACCTTGCCTGGCATGCAACAGCAACAGCAGCAGCAGCAGCAGCAGCAACAGCAACAGCAGCCCCAGCAGCCTCAGCAGCAGCCCCAGCAGCCTCAGCAGCAGGCGCAGCCACAACCGCAGCAGCAGCAGCCTGCCCTTGTTAGCTACAACAGACCATCTGGCCCTGGGCAAGAGATGCTGATGAGTGGCCAAAGCACCCCACAGAAGCTGTCAGCACCGGCACCCAGCGGCCGGCCGTCGCCCGCACCCCCAGCCGCTGCCCAGCCCACCGCCACAGCTGTGCCCGGGCCCTCGGTGCAGCAGCCTGCCCCAGGGCAGCCGTCTCCGGTCCTGCAGCTGCAACAGAAGCAGAGCCGTATCAGCCCAATCCAGAAACCGCAAGGCCTCGACCCCGTGGAGATCCTGCAGGAGCGAGAGTACAGACTGCAGGCTCGCATAGCTCATAGGATACAAGAACTGGAAAGTCTGCCTGGCTCTTTGCCACCAGATTTACGAACCAAAGCAACTGTGGAACTGAAAGCACTTCGGTTACTCAATTTCCAGCGTCAGCTGAGACAGGAGGTGGTGGCCTGCATGCGGAGGGATACCACCCTGGAGACGGCCCTCAACTCCAAAGCATACAAGCGGAGCAAGCGCCAGACCCTTCGAGAGGCGCGCATGACGGAGAAACTGGAGAAGCAGCAGAAGATAGAACAGGAGAGGAAACGGAGGCAGAAGCACCAGGAATACCTGAACAGTATTTTGCAACATGCAAAAGATTTTAAGGAGTATCACCGGTCTGTGGCTGGGAAGATCCAGAAGCTGTCCAAAGCAGTGGCGACTTGGCATGCTAACACTGAAAGGGAGCAAAAGAAGGAAACAGAGCGGATCGAGAAGGAGAGAATGCGGAGGCTGATGGCTGAAGATGAGGAGGGCTACAGGAAACTCATTGACCAAAAGAAAGACAGACGCTTAGCATACCTTTTGCAGCAGACCGATGAGTATGTGGCCAATCTGACCAACCTGGTTTGGGAGCACAAGCAGGCCCAAGCTGCCAAAGAGAAGAAGAAGAGGAGGAGGAGGAGAAAGAAGGCTGAAGAGAATGCAGAGGGAGGGGAGTCTGCCCTGGGACCCGATGGAGAGCCCATTGATGAAAGCAGCCAGATGAGTGACCTGCCCGTCAAAGTGACGCACACAGAAACTGG
CAAGGTCCTCTTTGGTCCTGAAGCACCCAAAGCAAGTCAGTTGGATGCCTGGCTGGAGATGAATCCTGGGTATGAAGTTGCTCCCAGATCTGACAGCGAAGAGAGTGACTCTGATTATGAGGAAGAGGATGAAGAAGAAGAGTCCAGTAGGCAGGAAACGGAGGAGAAGATACTGCTGGATCCAAACAGTGAAGAAGTTTCCGAAAAGGACGCCAAGCAGATCATTGAGACTGCGAAACAGGATGTGGACGATGAATACAGCATGCAGTACAGTGCCAGAGGGTCGCAGTCCTACTACACGGTGGCCCATGCCATCTCCGAGAGGGTAGAGAAGCAGTCTGCCCTCCTCATTAATGGGACCCTAAAGCATTACCAGCTCCAGGGCCTGGAATGGATGGTTTCCCTGTATAATAACAATTTGAATGGAATCTTAGCTGATGAAATGGGGCTAGGCAAGACCATCCAGACCATTGCACTCATCACATATCTGATGGAGCACAAAAGACTCAATGGCCCCTATCTCATCATTGTTCCCCTCTCGACTCTGTCTAACTGGACATATGAATTTGACAAATGGGCTCCTTCTGTGGTGAAAATTTCTTACAAGGGTACCCCTGCCATGCGACGCTCCCTTGTTCCCCAGCTACGGAGTGGCAAATTCAATGTCCTCCTGACTACTTATGAATACATTATAAAAGACAAGCACATTCTTGCAAAGATTCGGTGGAAATACATGATTGTGGATGAAGGCCACCGAATGAAGAATCACCATTGCAAGCTGACTCAGGTCTTGAACACACACTATGTCGCCCCCAGAAGGATCCTTTTGACTGGGACCCCGCTACAGAATAAGCTCCCTGAACTCTGGGCCCTCCTCAACTTCCTTCTCCCTACAATCTTCAAGAGTTGCAGCACATTTGAGCAGTGGTTTAATGCTCCATTTGCCATGACTGGCGAAAGGGTGGACTTAAATGAAGAAGAAACTATCTTGATCATCAGGCGTCTGCACAAGGTGTTGAGACCCTTTTTACTGAGGAGACTGAAGAAAGAGGTTGAATCCCAGCTTCCAGAAAAGGTTGAGTATGTGATCAAGTGCGACATGTCAGCTCTGCAGAAGATTCTGTATCGTCATATGCAGGCCAAGGGGATCCTCCTCACTGACGGTTCTGAAAAAGATAAGAAGGGGAAAGGAGGTGCCAAGACGCTTATGAACACTATCATGCAGCTGAGAAAAATTTGCAACCACCCATATATGTTCCAGCACATTGAGGAATCCTTTGCTGAACACCTGGGCTATTCAAATGGGGTCATCAATGGGGCTGAGCTGTATCGGGCCTCAGGAAAGTTTGAGCTACTTGATCGTATTCTGCCCAAATTGAGAGCAACTAACCACCGCGTGCTGCTTTTCTGCCAGATGACGTCTCTCATGACCATCATGGAGGATTACTTTGCTTTTCGGAACTTCCTTTACCTGCGCCTTGATGGCACCACCAAGTCTGAAGATCGGGCTGCTTTGCTGAAGAAATTCAATGAACCTGGGTCCCAGTATTTCATTTTCTTGCTGAGTACACGAGCTGGGGGCCTGGGCTTAAATCTTCAGGCTGCGGACACAGTGGTCATCTTTGACAGCGACTGGAATCCTCATCAGGATCTGCAGGCCCAAGATCGAGCTCACCGCATTGGCCAACAGAATGAAGTCCGGGTTCTGAGGCTCTGCACTGTCAACAGTGTGGAGGAAAAGATTCTCGCAGCTGCAAAGTACAAGCTGAATGTGGACCAGAAGGTTATCCAGGCGGGCATGTTTGATCAGAAGTCCTCCAGCCACGAGCGGAGAGCATTCCTGCAGGCCATATTGGAGCATGAAGAGGAGAATGAGGAAGAAGATGAAGTACCAGACGACGAGACCCTGAACCAGATGATTGCTCGCCGGGAAGAAGAGTTTGATCTTTTTATGCGCATGGACATGGACCGGAGGAGGGAGGATGCCAGAAACCCAAAGC
GCAAGCCTCGCCTGATGGAGGAAGATGAGCTGCCCTCCTGGATTATTAAGGATGACGCGGAAGTGGAAAGGCTTACCTGTGAAGAAGAGGAGGAGAAGATATTTGGTAGGGGTTCTCGCCAGCGCCGGGATGTGGACTACAGCGACGCCCTCACCGAGAAGCAGTGGCTCCGGGCCATCGAAGACGGCAATTTGGAAGAAATGGAGGAGGAAGTACGGCTCAAGAAGAGAAAAAGACGAAGAAATGTGGAGAAAGATCCTGTGAAGGAGGATGTGGAAAAGGCGAAGAAAAGAAGAGGCCGCCCTCCAGCTGAGAAACTGTCACCAAACCCCCCCAAACTAACCAAGCAGATGAACGCCATCATCGATACTGTGATAAACTACAAAGATAGTTCAGGGCGACAGCTCAGTGAAGTCTTCATTCAGTTACCTTCCAGGAAAGAGTTACCAGAATACTATGAATTAATTAGGAAGCCAGTGGATTTCAAAAAGATAAAGGAAAGAATTCGTAATCACAAGTACCGGAGCCTGGGTGACCTGGAGAAAGATGTCATGCTTCTCTGTCACAATGCACAGACATTCAACTTGGAGGGATCCCAGATCTATGAAGACTCCATTGTCCTACAGTCAGTATTTAAGAGTGCTCGGCAGAAAATCGCCAAAGAAGAGGAGAGTGAGGAAGAAAGCAATGAAGAGGAGGAGGAAGATGATGAAGAGGAGTCTGAGTCAGAGGGTAAGACCCTGCATCTGGCCCCTTCCACCTATCGGGCTATTTCCACAGCCAAATCTGTGAAGGTGAAAATCAAACTCAATAAAAAAGAAGAGAAAGGCCGGGACACAGGGAAAGGCAAGAAAAGGCCAAACCGAGGCAAAGCCAAACCTGTTGTGAGCGATTTTGACAGTGACGAGGAACAGGATGAGAACGAACAGTCAGAGGCAAGTGGGACTGATGATGAGTGAGCAGTGTGGACTTGATCTGACTGTGGCAGAACTGAACACTTTCTCCCCCTTTCTCCCTTCACCCCCAGTGAGTTCATTTGCCCTTTGGGCACTGGGTTATTCCTCCGTCCTCATTGTCATCTAGAGCTAGCTTTAGGATAGTGCCAGACAAACATATGATATCATGGTGTAAAAAAAACAAAACATGCATCTACACACACACACACACACACACACACACACACACACACGAATATTTGTAACATATTGTGACCAAATGGGCCTCAAAGATTCAAAGATTAAAAACAAACAAAAGCTTTTGATGGAAAAGACGTGGGTGGATAGTATATTTCTACAGGTGGGTCAAATTTGGTAGCCGTTTGATGTGCTTGCTTCCATCATCTATCCTGATGAGGAGATTTTTATCTTCTACAGCGCTGATGACCGGGAGAAGCCATTAAAAGCCACTGGTTATTTTATTTTTCATCAGGCAATTTTCAAAATTTTCATTTGTTCGGTATTGTTTTCTTGTTTGTTTGTTTTTTACACTGTGGTACATATAAGCAACTTTACTAGGTGACAGATGTACAGTAGTTAGAAATCACCTACATATACATTTTTCCATTTTATGCTCTATGATCTGAAGAACAAACAAAAAAAAAGCTTTTTGACTTGTATAAGATTTATGTCTACTGTAAACATTGCGGAATTTTTTTTTCCCTTTGGCTCTTGTTTTATTGACGCTATTGACTATTACAGTGTCTAGAGTGTCCCGATGGCTTCTTTTGTCCACCTGAGCTCCTGTGTTACCAATGGGTATGGTCTCCTTCTCCCTAAAGTGTACTTAATCTTTGCTTTCTTTGCACAATGTCTTTGGTTGCAAGTCATAAGCCTGAGGCAAATAAAATTCCAGTAATTTCGAAGGATGTGGTGTTGGTACTTTCCTAATAAACCGATAACTTACCTTGA\n>XM_016163448.2 PREDICTED: Rousettus aegyptiacus junctional sarcoplasmic reticulum protein 
1 (JSRP1), transcript variant X3, mRNA \nAAATATCGAGCCTCTTACCACATTCATTGTCATTTTCAAGCCTGGCCACTTCTGCTAAGTTATTCTTGGGAACAAAAAGTCTTGAGCCAGCAGCAAGGAAAAAGAGAAGTCAACAAGGGCATGCGTCAAACAGCCCAGGGCAGAAGCAGCCCAGCAAGGGCTTCCAGCCCTGCCGTGAGGCCACAAATCCACGGGCACATCTGCTGGCGGGTGATAAAGTGCCAGTGGCCTTGTGACAGCTCCCCGAAGACTCACAGGCCCCAAGGATGTGAGGGCGTGGCCGGATAAACAGGGCTTATCTCACACCGGAGGCCGTTTTTTTGTTTTTTTTTGTTTTTTTAACCCAACTTATATATTTTTTATCTTTTATGCTTCTCAATAGACTTTTCAATACTTTGTGATAGTTCAAATGCTTTGGCGAAGGTTTCGTTACGGAAAAAAGGGAGGCGTGGCGGGCTGGGTCTGAGCGCTGCGGCCCTGCAATCCGCTTCCTGCCTCACCTCGCCCGCGCCTCTGGGGTCGCCAGGTTTCGTCTTCGTTGCGACAGCATTTCTGTTGCCGGATGGAAGAGTGACGGGTGCTCTTGGAGGACACTAAGTGGATGTGGGTGTATCCTCGCCAGATCTTTTCTCTGTGTATGTCTTTTAGCATCTGTGGTCAGACTCCGTGTGCGTGTGAATAGCCAGACACACAGTGCCCCACGGCGTGCGCCTCCCTCCACATGACAAGTCCAGAACAAGCACGTCCCCAGACAGGAAGTGGGGGCCACCGTCCATCCCGTCCGCCAGGCCCAGCAAGGCGGCTGTGGACCCCGCAGCAGCCCGAGTCTGGACCCAGGCTTCTCAGACATCTCCATGACAACCAGGGCCCTGGAGGAGCTGGATGGAGGCCTGGGCAGCTGCCAAGCGGTGACACCCAGGCTGGCCGACTCCAGCAGCTGGCCCCACATGCTGTTGCTGGCGAGGCAGGTGCCCCTGCACCTGTCCCTGAGCCATGGGCCCCACCTAGTTCATCCCCCCAAAAGCCAGCACCGCACTTGTCGAAGCCCGTGGCCCGGGCACCCCCATCGGTGCCCCCTGCGCCCCAGGTGGAGGCAGAGGAGAGGCCCGAGGTGCCCGCGGCGGCTGCGTGGAAGGACGAAGGGGAGTCTGGGGAGGCCGCCGAGGAGCAGCGCGCACCCCTGGCCCACGGAGGGCCCAAGGAGAGGCCGCGGAAAGAGAGTCCGCGGAAGGAGAAGTCCCGAAAGGAGGAGAGACCGCGGAGGGCGGAGAAACCGCGGAGGGCGGAGAAGCCGGGGGCTGCCAGGGAGCCCCCGGGAGCCCGCCCCCGGCGCTGGGAGGCCCGCGAAGGGGGCCGCCGGCCCTGGGTGCAGGAGTCCCGAGACCCTGAGCACAGGAAAAGGCAGGCCTGGGCCTCTTTGCGGCGCCCCAGCGAGGAAGACCGGCCTCCGGGCCGCCAGAAGCACCGCGCCGGCAAGGGGCGGGACTGAGCCGCGCCAGGGGCTCGCGCTGGAGCCCCAGGCCTTCCCGGCGGGCCCCGGGTCCAGCCAAATAAAGAG\n>KR839926.1 Uncultured bacterium clone OTU_8642 16S ribosomal RNA gene, partial sequence \nTACGTAGGGGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCACACAGGTCCGTTGTGAAAACTCGAGGCTCAACCTCGAGACGCCGATGGAAACCGTGTGGCTAGAGTCCGGAAGAGGAGTGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAAGAACACCTATGGCGAAGGCAGCACTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTGGGGAGCGAACAGG\n>XM_032296798.1 PREDICTED: Sapajus apella PTPRF 
interacting protein alpha 2 (PPFIA2), transcript variant X20, mRNA \nTAATTACATTGATATTTATGATGTTCTATAGGAGTTCAGAAAAGTGGAAAATATTTAGTACATTTTGTTTGATAGTACTCCTAGTATATAGAGTCTTACTGAGTTGTATGCAATTGCCTCTCAATGTCCTAGCCAGCTGTAACAGCTGTAATATACTTTGATCTATAAATTATAAAATAACTATCTACTTTAAAAAAAAAAAGGCTTTGTAAAAAAAATCGCATCTTGTTGAAAAGTCTGGGAATGACTAAAAGATTTAGAAAGATGCAGAATCAAGAGCGATAAAACAGCAATTTGTTACTAAATAGAGCTTTAAACAGTATATGAAACATACTTCAGGTTAGTCAGAAGAGGTCCTCTGAATTACACTGTGCATGCTTCCCTGAAATGAAACTGTATGTTATTGGTTAACCAGGATATTTAGCATAATCACTCTGCTAGACTGTGGTGGAGGGAGGTGATTATCACTGAGAACAGATGGGCAGGTCCACAGCACTGCCAGATTCTGCACAAGCTCCATTTATCGTTGGTTCTTGCTTTTTTCCTTCTGTGTTTTAAATTTTTTTAAAAAACATTGTATGTTCTAAAGAACTAGCTTCACAAAAGGCTGGTGGCTGATGATCTTTCAGCTAAGATTTCAAATGTAGAAGAAAGATTTAAAATGCTGTCACTGTGTATCTAAGAAGGATGGGGCAGATTTCATTTTACCCTGTAGTCTCCCTCAATGCATGCACGGATTTATCTGTACGCTAAGCTCTCTGCTCTGCATCTGTAGCTCCTTGTGGATTATATTGTCTCTGTGATCAGAAATGATTTTCTCGGATATGAACACCGTTTCTGGCTCCCCTAAAGTGCATCCTCCTAATGGGACCCGGTTTTACACTTTTCAAGAATTTGCTGCACTGACAAAAGAATTAAATGCCTGCAGGGAACAACTTCTAGAAAAGGAAGAAGAAATCTCTGAACTTAAAGCTGAAAGAAACAACACAAGACTATTACTGGAGCATTTGGAGTGCCTTGTGTCACGACATGAAAGGTCATTAAGAATGACGGTGGTAAAACGGCAAGCCCAGTCTCCCTCAGGAGTATCCAGCGAAGTGGAAGTTCTCAAGGCACTGAAATCTTTGTTTGAGCATCACAAGGCCTTGGATGAAAAGGTAAGGGAGCGACTGAGGGTTTCTTTAGAAAGAGTCTCTGCACTGGAAGAAGAACTAGCTGCTGCTAATCAGGAGATTGTTGCCTTGCGTGAACAAAATGTTCATATACAAAGAAAAATGGCATCAAGCGAGGGATCCACAGAGTCAGAACATCTTGAAGGGATGGAACCTGGCCAGAAAATCCACGAGAAGCGTTTGTCCAATGGTTCTATAGACTCAACTGATGACACTAGTCAAATAGTTGAACTACAAGAATTACTTGAAAAGCAAAACTATGAAATGGCCCAGATGAAAGAACGTTTAGCAGCCCTTTCTTCCCGGGTGGGAGAGGTGGAACAGGAAGCAGAGACAGCAAGAAAGGATCTCATTAAAACAGAAGAAATGAACACCAAGTATCAAAGGGACATTAGGGAGGCCATGGCACAAAAAGAAGATATGGAAGAAAGAATTACAACCCTTGAAAAGCGTTACCTCAGTGCTCAGAGAGAATCTACCTCCATACATGACATGAATGATAAACTAGAAAATGAGTTAGCAAATAAAGAAGCTATCCTACGGCAGATGGAAGAGAAAAACAGACAGTTACAAGAACGTCTTGAGCTAGCTGAACAAAAGTTGCAGCAGACCATGAGAAAGGCTGAAACATTGCCTGAAGTAGAGGCTGAACTGGCTCAGAGAATTGCAGCCTTAACAAAGGCTGAAGAGAGACATGGAAATATTGAAGAACGTATGAGACATCTAGAGGGTCAACTTGAAGAGAAAAATCAAGAACTT
CAAAGAGCTAGGCAAAGAGAGAAAATGAATGAGGAGCATAACAAGAGATTATCGGATACTGTTGATAGACTTTTGACTGAATCCAATGAACGCCTACAACTACACTTAAAGGAAAGAATGGCGGCTCTAGAAGAAAAGAATGTTTTAATTCAAGAATCAGAAACTTTCAGAAAAAATCTTGAAGAATCTTTACATGATAAGGAAAGATTGGCAGAAGAAGTTGAAAAGCTGAGATCTGAACTTGACCAACTGAAAATGAGAACTGGCTCTTTAATTGAACCCACAATATCAAGAACTCACCTAGACACCTCAGCTGAGTTGCGGTATTCAGTGGGATCCCTTGTGGACAGCCAGTCTGATTACAGAACAACTAAAGTAATAAGAAGACCAAGGAGAGGCCGCATGGGTGTGCGAAGAGATGAGCCAAAGGTGAAATCTCTTGGGGATCATGAGTGGAATAGAACTCAACAGATTGGAGTACTAAGCAGCCACCCTTTTGAGAGTGACACTGAAATGTCTGATATTGATGATGATGACAGAGAAACAATTTTTAGCTCAATGGATCTTCTGTCTCCAAGTGGTCATTCTGATGCCCAGACTCTAGCCATGATGCTTCAGGAACAATTGGATGCCATTAACAAAGAAATCAGACTAATTCAGGAAGAAAAAGAATCTACAGAGTTGCGTGCTGAAGAAATTGAGAATAGAGTGGCTAGTGTGAGCCTGGAAGGTCTGAATTTGGCGAGGGTCCACCCAGGTACCTCCATCACTGCCTCTGTTACAGCTTCATCGCTGGCCAGTTCATCTCCCCCCAGTGGACACTCAACGCCAAAGCTCACCCCTCGAAGCCCTGCCAGGGAAATGGATCGGATGGGAGTTATGACACTGCCAAGTGATCTAAGGAAACATCGGAGAAAGATTGCAGTTGTGGAAGAAGATGGTCGAGAGGATAAAGCAACAATTAAATGTGAAACTTCTCCTCCTCCTACCCCTAGAGCCATCAGAATGACTCATACTCTCCCTTCTTCCTACCACAATGATGCTCGAAGTAGTTTATCTGTCTCTCTTGAGCCAGAAAGCCTTGGGCTAGGCAGTGCCAATAGCAGTCAAGACTCTCTTCACAAAGCCCCCAAGAAGAAAGGAATCAAGTCTTCAATAGGACGTTTGTTTGGTAAAAAAGAAAAAGCTCGACTTGGGCAGCTCCGAGGCTTTATGGAGACTGAAGCTGCAGCTCAGGAGTCCCTGGGGTTAGGCAAACTCGGAACTCAAGCTGAGAAGGATCGAAGACTGAAGAAAAACACATCTGGGCATGAACTTCTTGAAGAAGCTCGGAGAAAGGGGTTACCTTTTGCCCAGTGGGATGGGCCGACTGTGGTTGCATGGCTAGAGCTTTGGTTGGGAATGCCTGCATGGTACGTGGCAGCCTGCCGAGCCAACGTGAAGAGTGGGGCCATCATGTCTGCTTTATCTGACACTGAGATCCAGAGAGAAATTGGAATCAGCAATCCACTGCATCGCTTAAAGCTCCGATTAGCAATCCAGGAGATGGTTTCCCTAACAAGTCCTTCAGCTCCTCCAACATCTCGAACTCCTTCAGGCAACGTTTGGGTGACTCATGAAGAAATGGAAAATCTTGCAGCTCCAGCAAAAACGAAAGAATCTGAGGAAGGAAGCTGGGCCCAGTGTCCGGTTTTTCTACAGACCCTGGCTTATGGAGATATGAACCACGAATGGATTGGAAATGAATGGCTTCCCAGCCTGGGGTTACCTCAGTACAGAAGTTACTTTATGGAATGCTTGGTAGATGCAAGAATGTTAGATCACCTAACAAAAAAAGATCTCCGTGTCCATTTAAAAATGGTGGATAGTTTCCATCGAACAAGTTTACAATATGGAATTATGTGCTTAAAGAGGTTGAATTATGACAGAAAAGAACTAGAAAGAAGACGGGAAGCAAGCCAACATGAAATAAAAGATGTGTTGGTGTGGAGCAATGACCG
AGTTATTCGCTGGATACAAGCAATTGGACTTCGAGAATATGCAAATAATATACTTGAGAGCGGTGTGCATGGCTCACTTATAGCCCTGGACGAAAACTTTGACTACAGCAGCTTAGCTTTATTGTTACAGATTCCAACACAGAATACCCAGGCAAGGCAGATTCTTGAAAGAGAATACAATAACCTCTTGGCCCTGGGAACTGAAAGGCGACTGGATGAAAGTGATGACAAGAACTTCAGACGTGGATCAACCTGGAGAAGGCAGTTTCCTCCTCGTGAAGTACATGGAATCAGCATGATGCCTGGGTCTTCAGAAACATTACCAGCTGGATTTAGGTTAACCACAACATCTGGACAGTCAAGAAAAATGACAACAGATGTTGCTTCATCAAGACTGCAGAGGTTAGACAACTCCACTGTTCGCACATACTCATGTTGACAAGCCACTCAAAGGAGGCAGCACTGACCTGCTATGTCGTCTTTTCAGTCTACTCTACCTAAAGTGCACTACCATCTAAGAAGACAAGCAGTGAAAATATTTGTGAAAACTGAATTCTAAGAAACTAATGATGTCATGATTTATTAAAAGCTGAAAAAAATGTGATTTTGGGGGGAGTCAGATGTTACATTTGATTAGTTTACTACAATTGTAATAAAATGCTTAAGTCATTTGAATAATAAACATCATCTACATCATAAACTCTGTACAACAGATGCTTTTATGAAATGAAGCCACTTGTTTTTCATGTTTTATTGTAATATACTAGGCATTTATGTATTACTGTGCATTTCTTTTTAAATGTGTAAGTCTTATGTAAATGGATATAAATATGATTTTTTAAAAAATAAAATATATGGTTCATGGAGTCTCGAGTACAAACATTTGACAATTCTAAGTACTGTTTGTATTTTACCATTCCACCATTTTTACAGTTTTTGAATTGTTAACAGTCAAATCAATGTTTCCTTGAAGCATGTTCCATGCTTCAACATGTTTCTCCTTCAAGTCTGTCAATACTTACTTACTTACTTAAAGCTGAACAACCTGCCTCTGATCATGTAAAAAAGAATGATTTAACCTGGAACTGGAGCCAAAAAATAGAGCTTTAAAGGCAATCAGGGATGTCCTATATCTTTAGAAATAGCACTGTGATGGCTCGATCTCCTTTTCAATACAAAACAAAGCCAACCTGTTTACAAGGGTCAAAAGCAATTATTTAAAAATTTATATTAAAAAACCATTATCTTCTCTTGTTACCTGTGGACCAAGAAAAAAAAAAAAAAAAAAAAAACTTCTTTACTAGAACCACATGTTCATTTAAGTATCTTGAACTGCCAGCCAGTACTGGACAGCGAAATGTCAACCGCCGCAGAGTCTGAGGCTCATTTCCACGAGAAAACAAAACCCAAGAAACCCTTCCCTTTTGTCAATGGAACAGGGCATTAGCCAAACTCATGTCTAATGTTATAAGCTTTCAGCCAAGATGGCCTTGTTGCGACTTCCCTGAAGTCAGTTTATCAGAGGAAATAAATGAAAGACAGAACAATTAACACATATAGTGTATAAAATTATGGAAGAGTAATCTCTTTCCCTGTGGCTTTATTTGGTGGTGTTACTGTTGTTTATTCTTTGTTTATATGGGAGATTCAAAGTAAAACCTATTTACTAATACCATTTATCTAACTGCGGATTTTCTGCTGCTTGATCTTATTAAGCGCAAGACCTGTCATTAGTAATTTTTTTTGTATTTTAATTTGCTATGTTTGCACGTACATTACATTTGTTTCGATGTCTATTTTTGTTTAACAGATTCAGTCAAAAGGTAATGGTAACAGAAACCCTTTCCATTGTCAATAATAAAAAAAATACTTCCA\n>XM_021543360.1 PREDICTED: Lonchura striata domestica calpain 7 (CAPN7), transcript variant X2, mRNA 
\nCGAAAGTTTGTCAGGCTTCGGAGGAGCCGCGTTCTTCGGGGCGAGTTGCGAAACGCCTTTTCCCTGCGTCCTGGTTTTAGGAAGCTGCACAAGCCTTGATTTATGCTGGGATGGCTGGGTCCAACTTGGAAAATATTCAAGAAAAGATAAATGAGTACTTGGAGAGAGTTCAAGCTCTCCATTCAGCAGTTCAATCACAGAAGACAGACCCTCTGAAGTCAAAACAACAGTTGGACTTGGAGCGTGCTCACTTCCTAGTTACACAGGCTTTTGATGAAGATGATAAAGGCAATGCAGAAGAAGCTATAGAGTTGTACACAGAAGCAGTGGAACTCTGTTTGAAAACAGCTACTGAAACCTCAGAAGCCAGCCTCCAGTCCAAACTGAAACAACTGGCTCGACAAGCACTGGATAGAGCAGAAGCACTGAAGGAATCTATGTCAAAGTCATCACAGAAAGAAAAGTCAACTGCAGCCAAACCAAATCAGCCAGTCAGAACGTTCTTTCCACTGGGACCTGATTTTTCTTTAAATGATAAACCACAGACAATCAGAGCAGTACAAGCTAGTGAATCTCAAGGTCAGAGATACACTGCAGAGGAGATTGAAGTACTCAGGAAGACTTCAAAGATTAATGGCATTGAATATGTACCTTTCATGAGTGTTGATCTGAGGGAACGTTTTGCCTTCCCTATGCCTTTTTCTGATAAGTGTGGGAAGCTACCATTATCCCCCAAACAGAAAGCAATGTTTGCCAAGTGGGTGCGACCAGATGACATAACAAATAACCCTACAATGATCTATACTGTATCAAGTTTCAGCATAAAGCAGACAATAGTGTCAGACTGTTCTTTTGTGGCATCACTAGCTATCAGTGCAGCATATGAAAGAAGATACAACAAAAAACTGATCACGAGTATAATTTACCCTCAGAATAAGAAAGGAGAACCAGAATATAATCCATGTGGTAAATACATGGTGAAGCTTCATATCAATGGTGTTCCTAGAAAGGTAATCATAGATGACCAGTTACCTGTTGATCATAGTGGGGAACTTCTCTGCTCTTACTCCAATAATAAGAATGAATTATGGGTGTCACTAATAGAAAAGGCTTACATGAAGGTCATGGGAGGATATGATTTTCCTGGATCAAATTCTAATATTGATCTCCATGCACTGACAGGTTGGATACCTGAAAGAATTGCTATGCACTCTGACAATCAAGCCTTCAATAAAGATAGCACTTTCAGAATGCTTTATCAGAGATTTCACAAGGGAGATGTCCTTATCACAACAGCAACAGGGGTGATGTCTGAAGAGGAAGGAGAGAAGTGGGGTTTAGTTCCAACCCATGCATATGCAGTCTTGGATATAAGAGAATATAAGGGACTTCGATTTCTTCAGCTAAAAAATCCCTGGAGCCACTTGCGTTGGAAGGGACGATACAGTGAAAATGACACAAGAAACTGGACCCCAGATTTACAAAAATACTTGAACTTTGATCCCAGAACAGCTCAGAAAATAGACAATGGCATTTTCTGGATTTCCTGGGAGGACCTGTGCCAGTACTATGATGTTATTTATTTGAGTTGGAACCCAAGTCTTTTTAAAGAATCTACATGTATTCACAGTACGTGGGATGCAAAGCAGGGCCCGGTGAAGGACGCCTACAGCCTGGCCAACAACCCTCAGTACAAGCTGGAGGTGCAGTGTCCACAGGGTGGTGCTGCCGTCTGGGTCCTGCTCAGCAGGCACATCACTGACAAGGATGACTTCGCACACAATCGGGAATTCATTACAATGGTTGTATACAAGACTGATGGTAAAAAAGTTTACTATCCAGCTGATCCTCCTCCTTATATTGATGGTATTCGGATTAACAGTCCTCATTATCTGACCAAGATAAAGCTGACCTCTCCAGGTTCCCATACATTCACCTTAGTGGTGTCCCAGTATGAGAAACAAAACACCATCCATTACACCATCAGGGTGTATTCCT
TGTGCAAGTTCACCTTTTCCAAGATTCCTACGCCTTACACCGTTTCCAAACGGGTTAATGGACAGTGGAAAGGTCACAGTGCTGGAGGATGTGGAAACTTCAGAGACACCTACAAAAATAACCCCATTTATCAATTCCAGCTAGACAAGAATGGACCATTGCTAATTGAACTACGGGGGCCAAGGCAATACAGTGTTGGCTTTGAACTTGTCACCGTCTCAACAGTGGGAGATCCTGGTTCCTATGGCTTTCAGAAAAAAAGCAGTGGTGACTACAGGTGTGGATTTTGCTACTTGGAGGTGGAGAACACATTTGCTGGAGTTTACAACATTATCCCCACCACATTCCTGCCTCAACAAGAAGGGCCTTTTTTCTTAGATTTTAACAGTACTACTCCTCTTAAGGTGTCACAGCTGCAGTGAGGAGACAGAACTGTGTAGTGTTGTTTAAGGAGATGGTTTTGATCTGTCCAGCAGCCTGAGAACAGGTGAAGAACCCTTACTACACATGCACAAAAGAAAATTACATCCTGATTTATAGCCAAAAGCATGGAATCACAGATTGCCAGTTAATTATGGCAGGGAGTTGGCTGTGGGTTTGCTGCTGTGGTCTAGGAGTGAGCACTGTTCAACAGGCTTGGGAATAGGCTAAAATGCATATATTCAAATGAACCAGCAGAACTCACTCAATTTATTGCAGTTTTTCCACACTTTGAATCAAAGTCTACTGAGTTACAAGAAAAACTAGCATTGAAATTCTCTCCTCCCCACATACAAGGTATAGGAGCTAAAGATTCTATTCTTAAAAGTAAACATGTAAGAAAAAATATTCTTGTGTATTCTGCTTATTCAGTCTCAGGACCAAATAGCTTTTATTACACATTTGTGCTGCTATCTGTAATGTTTTCAGCACTGAACGGGTTCTCAAATCTAAATGTAAATGTACTACTGCTGAGTCAAGAGTATTCCATGTGTCATCTTATCTGGAATATGTATATAGGAATAAAGGAAAAAGAAGGTTCCAGCTTTAGCTATTTCTAAAAGCAAAGCAAGTGCTTTGCTTATGTTATGTGTACCTTGAGAGCTGTTACTTCATATCTGTATGACTTTAGCACATAATACAGCATGAGGTTCTGTGGCTTTCTTCCTGCTATCTGCCAGACCTAGGTTGATCCTGAGGAGCAGGAAAGACAGGAGATCATCCAGCAGTAGTGATCAGGCAGTGCAGCACAGCCTTCTATGAGCAGCTGTGAAAGGTTTTCATCTGAAGATCCCCTGTATGATTCACTGTATCCACTGAGGGTAGTCTCAGTTACTGGTGCAGGGAGATGGGGAACTGCCCACCATCAGCAGCTCAGCAAAGAAATGTTTTATTTTCATCACTTTTGTAAGTATGTGTCATGTAGGGAAGGATCATTTAAATCTCTCTCCCAATACACCACAGCTTCAAGGAAGGCACTTGCTGATTCAATTATACAAGACATCTTTGAAAATATACTTTTTTCCTTTTAAAATGACACCAGTGAAGGAATTGAGCACAAGGCCAGTGTCATCAATAGAAGCAGGGTCACAGTTCTTAAGAAAATAGTGGAGGTGGGATTAATGCAGAACAAGTTATTTTTTTAGAAGTTCCCCCTGTATGTGTTCTTCCTCTAGATCTGTATAAATTGTATCTGAAGTGAATTCAAGATGAGCAGCTTTTATTTAATACCAACTGCCTGACAGATCCCAAAATTGATTAAATTTTGTCATTTTTACAAAATTTACAGTATTTCACAGCTGAGGGAGAGGGTGTTTTTAAAACAGCCATGGGAATTTTGCTGCCATTCACATTGGTTTGGCAGTTTTCCAAGCAAAAAGGTAGCATTTAAATCTTGCTTTAGATTACAGGTGTCACTTAGCCACTGGGAAACTGAACATACATTCTACAATAGCACCAGAAATAGCTGTGGGCTAAAGTTATTCCCACAGAAATCTGCTATTAGTCCTCTCCTCTCCTTT
TGTTTCATTTCCTTCATCAGACAGCTGCTTAACAAGTATCTGGCTCTGAAAGGGCAGGGATAGCTCCTGCCTTGGAAAACACATGCCTTGCTGACTGCAGTTCTCTCAGAGACCATCTGGGCTAGGGAATTCATGACAAGTTTGTCACAGAGTGACTTACCTTCTTTTGCAGGGAAGTCTCTGATGTTTAGTGCAATAAATCAACAGAAGGAACAGCATGGTTGCAAGCTGAGAAGAAAACAGATTAGGTTCTTTGTGGTTATGCTTGGCTTTTGGAGTATGTGCCAAGGACTGCTTCATCCATAAAATATGAAAATTTCATTCAACGCCCATTTTCCCTACAGATTTCTGTTAAGTTTTTAGCCGAGGCTAAACCAGAGTAGCAGGAGAGTCCTCCATCTTATCACCTCTAAAGTTGGAGGTAGTGGGGAAGTATGAACCGAGTATCTTTTTGGCAGTACAAAAGGCAGATGCCAGAAGTGCCAGCTTTCAGCAGCAATTTCTTGCACATTCTCTGCTGTTTGAGATCAAGCTGGTAGACTTGCCTACAGGAAAATCTGTTGTTGTTCTTCAGTAGTTGGTTCCTACTCGGAAGGAAGGAGTTTTCCTTTCTCTTTCCCCCTGAGCACAAGTTAGTGCCAAAGCTTATGCTGCATGAAATGAGCAGAAGGCTCAGCTTCCATACTGTGCTGAACTTAAACTGAACTGAACTAAAAAGTAAGAAATGTACTCACTTTCCTAATGCCAGGCAAAAACATTAAGGCCAAAGGATCCTGTCCCCACCAGGATATGCCAATATTTCTTACGCATTCAGAACAGTCAGTGGATTGGGCTTATCCCCATTAGTGCATAGGACTTAAGCTTACTGTCAATCTTATATATATAAAGCAAATTCTATTCAAATATTGCATCTGGATAGGCTACTAGAATGCCATCACTGTGCACTTCCCTTCAGATACAGGACAGAACACTCAGGTGAAGTATTTCAGAGGTACTACAAAATATCCATATAAATTGCAACCTAGGGATTCTGGTTATGGCAAATTTATTTTACAACGAAATTTTCTTGTCCTTTTTTCTTAAGAAAAAGCATTGATATAAGCATTAGGATTTGCTTTAATATTTTCTGTCAAATATATACTTTTATATATTTTCCACAAGTAAGTCTAGAAAAATTATTGCAAAGTGAACTGATCCTTAGATTTTAACACAAACTCAGACCACTAAGTTAATATTTTCTTTTCCCTGTACTGTTTAGCACTTTTTGAACCATACGAGAGAGAACGTAGTTTGTTCTGTTAGGAAGACACAAGTTAGCCCTTGGTTGATCCAATCTCTCCGTTCTCAAAGATGCAGTGAGACATTGTACCATGGATGAATGGTATCAACACCTGCCCCAGACTGTGAGTCTGAGTTCAGTCCTAGTCTCCTGCTGCAAGCTTCATGTAACTATTTTGTACAGTAATTATGCATTTAACCACACAATGTCTGCAGCCTTTGAACAGCCACCTATTTAGATCTAAGTGTGTGTACATACAGTAGAGGTTTTCATTGCTTTATCTAAAAGGACATTGAAATCGTTTGATAATACCAAAGAGAAGTAGAACTCCTAGGTTAATACTGGCTTTATACATTCTCACATCAGGGCAGATGAAGCAATCATGTATACTTTGATACACCAGAGGCTTATTTTTATACCCATGAAGGCAGCTACCATCATGTTACACTTCAGAATCCACGAAGAGCTTAAGTAAAAACTAACTGGAGAAAGCTTGTTCCCTTACTTGTACTACATAGCAATGTGTGTTCATTTAAGTCTGTCATATTTATGATTATGGCTTTTATGAAGTTTAAAATAAAATGAGTTTTCCATTAATTTATTAGACA\n>XM_017957302.2 PREDICTED: Papio anubis enhancer of zeste 2 polycomb repressive complex 2 subunit (EZH2), 
transcript variant X5, mRNA \nTGCTTGATTGGGTTGGGGGGGCCAAATAAAAGCGATGGCGATTGGACTGCCGCGTTTGGCGCTCGGTCCGGTCGCGTCCGACACCCGGTGGGACACAGAAGGCAGTGGAGCCCCGGCGGCGGCGGCGGCGCGCGGGGGCGACGCGCGGGAACAGCGCGAGCCGGCGCGCGGGACGAAGAATAATCATGGGCCAGACTGGGAAGAAATCTGAGAAGGGACCAGTTTGTTGGCGGAAGCGTGTAAAATCAGAGTACATGCGACTGAGACAGCTCAAGAGGTTCAGACGAGCTGATGAAGTAAAGAGTATGTTTAGTTCCAATCGTCAGAAAATTTTGGAAAGAACGGAAATCTTAAACCAAGAATGGAAACAGCGAAGGATACAGCCTGTGCACATCCTGACTTCTGTGAGCTCATTGCGCGGGACTAGGGAGTGTTCGGTGACCAGTGACTTGGATTTTCCAACACAAGTCATCCCATTAAAGACTCTGAATGCAGTTGCTTCAGTACCCATAATGTATTCTTGGTCTCCCCTACAGCAGAATTTTATGGTGGAAGATGAAACTGTTTTACATAACATTCCGTATATGGGAGATGAAGTTTTAGACCAGGATGGTACTTTCATTGAAGAACTAATAAAAAATTATGATGGAAAAGTACACGGGGATAGAGAATGTGGGTTTATAAATGATGAAATTTTTGTGGAGTTGGTCAATGCCCTTGGTCAATATAATGATGATGATGATGATGATGATGGAGACGATCCTGAAGAAAGAGAAGAAAAACAGAAAGATCTGGAGGATCACCGAGATGATAAAGAAAGCCGCCCACCTCGGAAATTTCCTTCTGATAAAATTTTTGAAGCCATTTCCTCGATGTTTCCAGATAAGGGCACAGCAGAAGAACTAAAGGAAAAATATAAAGAACTCACCGAACAGCAGCTCCCAGGCGCACTTCCTCCTGAATGTACCCCCAACATAGATGGACCAAACGCTAAATCTGTTCAGAGAGAGCAAAGCTTACACTCCTTTCATACGCTTTTCTGTAGGCGATGTTTTAAATATGACTGCTTCCTACATCCTTTTCATGCAACACCCAACACTTATAAGCGGAAGAACACAGAAACAGCTTTAGACAACAAACCTTGTGGACCACAGTGTTACCAGCATTTGGAGGGAGCAAAGGAGTTCGCTGCTGCTCTCACTGCTGAGCGGATAAAGACCCCACCAAAACGCCCAGGAGGCCGCAGAAGAGGACGGCTTCCCAATAACAGTAGCAGGCCCAGCACCCCCACCATTAATGTGCTGGAATCAAAGGATACAGACAGTGATAGGGAAGCAGGGACTGAAACGGGGGGAGAGAACAATGATAAAGAAGAAGAAGAGAAGAAAGACGAAACTTCGAGCTCCTCTGAAGCAAATTCTCGGTGTCAAACACCAATAAAGATGAAGCCAAATATTGAACCTCCTGAGAATGTGGAGTGGAGTGGTGCTGAAGCCTCAATGTTTAGAGTCCTCATTGGCACTTACTATGACAATTTCTGTGCCATTGCTAGGTTAATTGGGACCAAAACATGTAGACAGGTGTATGAGTTTAGAGTCAAAGAATCTAGCATCATAGCTCCAGCTCCTGCTGAGGATGTGGACACTCCTCCAAGGAAAAAGAAGAGGAAACACCGGTTGTGGGCTGCACACTGCCGAAAGATACAGCTGAAAAAGGACGGCTCCTCTAACCATGTTTACAACTATCAACCCTGTGATCATCCACGGCAGCCTTGTGACAGTTCGTGCCCTTGTGTGATAGCACAAAATTTTTGTGAAAAGTTTTGTCAATGTAGTTCAGAGTGTCAAAACCGCTTTCCGGGATGCCGCTGCAAAGCACAGTGCAACACCAAGCAGTGCCCGTGCTACCTGGCCGTCCGAGAGTGTGACCCTGACCTCTGTCTTACTTGTGGAGCCGCTGACCATTGGGAC
AGTAAAAATGTGTCCTGCAAGAACTGCAGTATTCAGCGGGGCTCCAAAAAGCATCTATTGCTGGCACCATCTGATGTGGCAGGCTGGGGGATTTTTATCAAAGATCCTGTGCAGAAAAATGAATTCATCTCAGAATACTGTGGAGAGATTATTTCTCAAGATGAAGCTGACAGAAGAGGCAAAGTATATGATAAATACATGTGCAGCTTTCTGTTCAACTTGAACAATGATTTTGTGGTGGATGCAACCCGCAAGGGTAACAAAATTCGTTTTGCAAATCATTCGGTAAATCCAAACTGCTATGCAAAAGTTATGATGGTTAACGGCGATCACAGGATAGGTATTTTTGCCAAGAGAGCCATCCAGACTGGTGAAGAGCTGTTTTTTGATTACAGATACAGCCAGGCTGATGCCCTGAAGTATGTCGGCATCGAAAGAGAAATGGAAATCCCTTGACATCTGCTACCTCCTCCCCCTCCTCTCTGAAACAGCTGCCTTAGCTTCAGGAACCTCGAGTACTGTGGGCAATTTAGAAAAAGAAAATGCAGTTTGAAATTCTAAATTTGCAAAGTACTGTAAGAATAATTTATAGTAATGAGTTTAAAAATCAACTTTTTATTGCCTTCTCACCAGCTGCAAAGTGTTTTGTACCAGTGAATTTTTGCAATAATGCAGTATGGTACATTTTTCAACTTTGAATAAAGAATACTTGAACTTGTC\n>XM_028016850.1 PREDICTED: Xiphophorus couchianus intraflagellar transport 27 (ift27), transcript variant X1, mRNA \nACCACAGGGAACGGTTGCTAGGAAACGAGCTTTGTCCATTTTTGCCGAGGCGAATGGAAGATTAAAGCTGCTAGCAGGAATGCTATTTAATTTATTAACAGACACTTACAATATTTCTCACGAGGTTTCGAATGTACGCCGAATAATGGTGAAGTTGAGGGCAAGATGTCTGCTTCTCGGGGATGCTGCAGTGGGGAAAAGTTCTCTTTTTCACATCTTCTACAATGATGGATCTCTGTTCCAGAAGAACTATAGCTTGACAACGGGAGTGGAGCTGGTGATGAAATGTATCAACATTCCAGAGACCAACGACTCCGTGGAGCTCTATATCTTAGACTCGGCGGGGAAGGAGACGCTAGCGGAGGGCTGCGAGAAAATGGTCAGAAGCTGCTCTGGATTCTTCTGTTTTCATTTGCATGAAACTAATCAGTGGGGGGAGCCATCTTTGCTGTGTCTGGTGTTCGATTTGACCAGTGAGCAGTCTTTTGCTAACTGCGCATGTTGGATGGAAAGAGTCCAAGCACACTGCAAAGGCCTCCGTGTGCCAGGTGTTCTCGTGGGAAACAAGTCGGATCTGTCAGCTAGAAGGGAAGTACAGGCGTCCGTGGCCGAGGAGTGGGCCCAAAGCAAGGGACTGGAGTACCACGAGACATCAGCTAAAGAGATGGTCAACTGTGATGCCCCCCTCCTCAGTTTAGCACAGTCCTTCTATTCTCTCTACCAGGAGCAGCGTGAGATCATGCAGAACCTCGGGCCCGGCTAGACTCCTCTTCCTTCACCACAGAGCTCACAGCCGTTTGAGACGAACCACTGCGAAGGAATTGCTTTAGGAGAATAGGATTTTCTGGCAAGGATACTGAAAGGCTTTCTGATTGTTTTTGTTTTAAATAAAGGACTAAATAAGGAGCAA\n>XM_015847342.1 Paracoccidioides lutzii Pb01 hypothetical protein (PAAG_11752), partial mRNA 
\nATGCAAGGACCAGAATATGTTTTAGATGAGCGGACGGAGCAATTGTTAACCCAGGGGACCAAGGGCGGATATGAGAATGGGTTCACATTTAGAAAGTTGCGGCTGGAAATCTCCTTTATTCGCAATCACCCATGGATGAAACGTCTCACTCCTTTTCCCTTTGGCCCACAACAGATGCTCAAAAATCAATTATGGGGAGTGTCTCCGCTATCATTTTCTCGTCCACAGACAGAGGAGGTCCCTTTGGATCAGAAGGCTCAAAATAATAGTGGATCCCAATCCCGCATCTTGGAACAGCGTGCCCGAAGGGTCAAAGCACTTGCTATCGCTTGTGGCGCTGGAGATGGCTGA\n>XM_018786474.1 Plasmodium gaboni hypothetical protein partial mRNA \nATGATTTTTAAAAGGTTCTTCCATAAGTATCCTGGAGGAAGTAAAATAAAATGTTATATAGAAAAACGAAAGAAAAAGAAATTAAATATAAGTTTATTTCATCAACCTCTATATTCTAAGAATTCGAAAAATTTTATTGATTGGAGATATAGTACTCCTAAGTCAGGGTATGAATATATGTATATATATGGAGAGAACACTATTGAAATAACGAATTTACCGAATAACAAAACTAATGAATATATTCAAGAACGTCTAAGAAAAAGTTTAAATAAATATGGAAGATTAAAAATTATCAGATGCTTAAGTCATAGGAATGATCCATATATAAATAATAATATTTGTTATGCTACATTTTATAATAGAAAAGATATGTATAAATGTATACGTAATATTAATATAAGACTTCCAATATCTTTACAGTATAAAATATTAAAATTTAAAAGTTTACTTTCCAATAAATGTAATGATTATAATTATTTTTTTAAACAAGACCATTATAATTACAGTGCTATAAATATAGCTTTGAATTTGTTTAAATATTTAGAATATAATAATTGTAGTATGAATATAAAGGATATCTACAAGCATGTATTTGAATATTCGTTTTATCCTCATAAAATTATTTCTTCAGGAATATCAGTTTATAAAATATTTAAAAACTGGACAAATTTTATATATTTTTTTGATAACTTATTTCATATTGTAAAAAAAGATGATGATATTTTTATTACAGCCAAAATTCTTAATGATCAAAATTTATCTATTTATTTAAACAACAAATTAATTGAATTAAAAAAAAAAACGGAACAGAGTAATTCCGTGTATTGGAGGGAGCACTCTTTACAATTACCCGAAGAAATTGAAAATAGAATAAATAACGATCGTCCAAAAAAGTTAAAAGAGGAACTGCAACTTTTGTCCAAGACAAAAGATTTTTACAAGATTCATGACGAACGACACTTATTTAAACTGAAATTAAACAAGGAGCGAAAAGAAAAAAAAAAGATGTTAAAAAAAAATAAGCAACAAGAAAAGGAAGAAAAGGAAAAGGAAAAACAACTTAAGAAGGAAATGTACTGA\n>XM_046923823.1 PREDICTED: Gallus gallus integral membrane protein 2C (ITM2C), transcript variant X1, mRNA 
\nGGCAGTGAATGCGCTCGGCTGCAGATGAGCACTGTAACTTTCCATGGAAACTGCTGCATTGATTCTCTGCCTTTGGCTGCAGGAGGAGCAGGCTCCCGTGGTGCAGGGCCGCAGGTCATCGCTCAGCGGGGTGTGCTACCTGACCATGGGTCTCCTTGTGCTGCTCCTCGGCTTGGTCTTTGCATCAATGTATGTCTACAGATACTTCTTCATCACGCAGCTTCCCCGTGAGAGCGTGTTTCATTGCGGCGTCCTTTATGAAGACTCGCTGTATTCACCGTTCAAAGGGCAGCTGGAACTGCACGAAGATGTCAAGATTTACATCGAGGAGAACTACGAGCAAATCAATGTCCCGGTGCCCCAGTTTGGAGGGAGCGACCCTGCAGATATCATCCATGATTTCCAGCGAGGTCTAACAGCTTATCATGACATAACGCTGGATAAATGCTACGTCATTGAGCTGAACACCACTATCGTGATGCCTCCACGCAACCTCTGGGAGCTGCTGGTTAATGTGAAGAAAGGGACGTACCTGCCTCAGACATACATCATCCAGGAGGAGATGATTGCGACCGAGCACGTCAGCGACATGGAGCAGCTCGGCTCCTTCATCTACCGCCTGTGCAGCGGCAAGGAGACCTACAGGCTGAAGCGGAGGAGCACCAGGAGACGTATCAGTCGACGTGAGGCTGGGGACTGCCACCGTATTCGTCACTTTGAAAACACTTTTGTGGTTGAAACTGTTATCTGCAAAAAATCATGAAGCCCCTGTCCAGCTGTAACCTTCCGTGGCTTTGCTTGCACACACATGCTCTCAGCCCTCTTTTTAGACTTGGTAATCTGTCTTACTTTTTTTACGCCCTCTCCTGCTTGTGCAGCTCTAAAGCCTTGGGTCTGTCGTGGCCTCGCAGTTGATTCTCTTCTCTTTTCTCCTTACTGAGATGTTTTGCTGGGCTTAAATTTATGCAGCGGTCACAGATGGCCTTGGAGTGGATGCAGCCTCTTCCACCCCACAGGGTGGGGATCTGTTTTGGGAGCAGGTTTTGGGTAGAAGGGACGACCAAGAAATAGGATGCTGGAAATGGGCGCTCTTCTCATGTCTGAGCAGTTTCCTGCTGGCGCTGTTGTGAGGCTGGGGCAGAAGGTGTACTACAGGAGGAGAATTACCATTCTGATGCTGATGTAACGACCAGAATATGTCATCAGATGGACTTAGAATTAGATGCGAGGTTACAAACAGGGTGATTTGGAAAGCTCAGCAGGAGAGTTTCTGCCCACGCTGAACTGTGGTGCTCACAGTTTGTTGTCCCAATGAAGGCCAAGTTTTTGAACAGTGAAAGCAGCCCATATGCATTGTTTCTGTGTCTAGCTCCTGGCTGATTTGGAGTGGCATACCTGGAACCAGCCAGGCTACCCTCCCTCAGCCTTCAAAATAACAAGCAAGTGGTATCTGCTTGGGGCTCCTGAGCTCATCTGCTACGGCTTTGCCTGAGTAAATAGAGGTGAGCCGTCAATACATGCTGCCAAAGCTCAGCTGATGTCCCATCCTATGGGCTGCTGATGAAGCTGGATGCTTTATTTCAGCTCACCTCTCCAGGCCAGCTCCTCCTGCCTGGAAGATGAGTTATGTGAGTTATGTTCACATAGATCTGTCTTTCTGAGTTGTCAGGATCCCATCTGTGTGTGGATGGGTGCCATGCCAGCATGCAAAGCGGTATCAGCAGCAGGATCAGTAGTTACTGGCATCTGCAGAAACAGGGTGGTTTTTTTTGTTGTTGTTGTTGTTTGTTTGGGGTTTTTTGAGAGCATATTTCCACAGAACTCCTCTGAAGAAAGCCATTTTGATCATAACTCCTGTAGCCCAGCTGTGTGTTGTGTCATCTGTAGGCACCGCTAGAGAGCAGGTGTCGATGCAAGGCAAGATTCAGTGCATCAATATACTGCAGAGAAATTGTATGAACAAAATTGTGTTTCTATTGATCATCAGAAAGAAAAATT
GCAGGGTACTTAAACATTCTTCCCTCTGTTCCATAAATATAGTAAAAACTAATGAGGTTCTTAAAATGCAGGCAGTTTTTTGGCTTGAAAGAACAGCTTGGCACATTCTTGTTAATTGGTTTTCAGCAAATCTGGACTTGTTCATCTGTTGAAATGAGCTTGTTGTTTCGGGAAGAGAAAGGATAAAGTAAATGCAAGAACAATCATTAACTCAGCAGGACCAAAAAAATTAATGTATTTGAGAGTCAAACTTCTATTAGTAATACTGTGAGCTAATTATATGAAAACAAAACAGAACCTTAAAATGATCGCATAACGCAGTAGCAATTAGTATGTCCTTAGAAGCTGAGGTTCTTATTTTTTTATATAAAAATAGAGTCAACCATAAACATTAGATTTTAATAGGTAGAGGAGGAGGTGCTGATCACCTGCTTTTTAAGGTGGATGTGAAATGTGAGATTGCATGTGTTTCGTGCAGACCAGTGAGGAAAGTTTCCCACTGCCAGAGGAGTATTTGCTTTTATAGTACAGCTGTGTTTTTCCACTACAACTTGCTATTAGTCCTAACCTTTCATTGCAAAGTGAATGATGAGAGTCAGAGAATCGGTTTGCTTGGTGGAAGTAGCACAAACTGGTAAATTTATGCCCTGCATTTCTCTCTGTTTCCAGGATCCTAAGCCTGCACTCAGGTGAGCGCTCAGACCTTTCCCCTTCCCTCTGATGCTGCATGAATTAACTGGTCATTGAATATGCTAACTCTGTGCAACCCCGCAGCTGTAAGGACAAGCCCTGATTCTTTAAGGTGAACTAACATGGTCGCTGTTTCATAGGGTGAGAATGCAGTTGTCTAGAAAGAAAACACAAAATGCTTTGTATATTTTGTCTGGTAGAACCTTTACCTCTTAGGAAACATTCATGGGATAATAAAATCTTTTACCTCTGATA\n>XM_008488083.3 PREDICTED: Diaphorina citri protein rogdi-like (LOC103523006), mRNA \nGCACGATGAAGTTCGAACAGTACCAGGCCGAGAACTCAATACCATGGCTGAATGAGGTGCTCGTGCTGTTCACCGTGGCACTTCAACTGTGCCAGCAACTCAAGGATAAGATCAACGTGTTTGCCCAATACAAGGACTTCATCGTGTCACCTAATCTCTCCACACCTAGTGCTACCTAGTGGTAATTATGTAGATTAAGAAAGTGTGTACAGGGTGGTCCCATTGATGAGAGAGGGTTCACTGCAGATCATGGTTCACACAGTATATTATTATTGCACAA\n>XR_001166349.3 PREDICTED: Fundulus heteroclitus uncharacterized LOC105928738 (LOC105928738), ncRNA 
\nCGTGTCTTGCACGTCGTCGCGAACGTTCGCTTGCTTCCGGCTTCCGTAGTCACTTCTGTGGCCACCAGGGGGGAAAATGACGGCGTGGAAGATGTGCGGTAAGCAGATGCATAGCTTTACCCTCGTGGGAACTACAGAAGCCGACGTCACGTAACTGCGCTTCGCTGAACGGCTGTTGTTACGAAGAAGCAGGGGATGATCGTCCGGTAAGGGCCTTCCAACGCCAGAGGAGGAGCAGGACAGATGTGCTTCCGAACGCATTTCAGTTTGACTGGGAGTCGTATGAAAATGCAGCGGAGCTTTTTGTCCCCATTGGTAAGGTTGGTTAACGGAGGTTAAAGAATATTAAATATATTGAGGAATTGAAAAAATAACGGGGATAAAACCTCGCGTCTACCTGAACGCAGCTTTACTTATTTCTCTTTTGTTCAAGCATCAAATGTTAGCTTCAGATGGAAAATAAATGTGACAATATGGGGGAATTCCCCCTAAGTGTGGACACTTTAAAAATGTGTGTGTTTAAAGACACATTTCCTTATTATAAGAGGAGCCGTGTGAAATCCCCAAGTTGTCTTCAGCACGTAGCAAGTCGCTTTCGGTTTTATCTGTTTATGATGACTTCCTTGTCATCGTCTCTTTGATGAAACAGCCATTTACTTTAGCGCTAGCGGCTAGTCCAAGTGGGCCCTAGGTCAGTATGTTCTGGGAAATCAATCCAATATCAGAAATATCCTAATGGTTCATGTGAATTCTACTTCATGAACACAGCTGTCAGATTTACACTAGAGGGTTATTTCTAGAGAACCGTATGGTTACAGCAGATAAAATTAGAAATGGACACAGGAACAATTTTCTCAGTAAATGTATTTCTAATACTTCTATTGAGGCCACCAGTAAATATTAAACCTTGTGATATTTATTTGCACATAATGGCTGGAATATTTTCTAAATACTAACAAGCCTTTGGCTGGTTTCTTGGCTTTCAATGCCTTTTGGTACATCCTTTTCTCATCCACCCTTCCACTTTATTACACATGACTCGAATTTATAGACTAATTTGCTTTGATTTCTGCATATGTGAGGATTACTTTGTGTGTTGCTAATATCCGTTGTGAATTTCATCTCAGTAGAAAGTAGGGGCATCCCGATACTGATTTTTTTTTTTTTCAGACCGAGCACGAGTACTTTAGTTCAGATACTTGCTGATTGCAAGTGCTGATACTGAGTATACTGATATAGCTTTATTTGATCATAATCAACTGGATTTTGGTCTTTTTGGTATAAGCATACAACGTGGCTCTATACCTTTAAAGACAATGTGCATATATATTTGAGAGTGGATATGTTTTAACGTAGTAGAAGACCGTTTTGGAACTTTGGGATTTTAGCGCTTAAGCAGATCAGCTTTAACACTGGAAGAGTTATGTACTACAGGCAAGGCATGTTCATAACCTCTAACAGAACGTGACAAACCTGAGCTACCCCTTTAAGGTCGCTCCATGAATGATAATATTTAAGTTGGTGGAACCTTCACAGGTGTTAGCTAAACGTTTTGCTTTTTAAACCCTTTCCAGAAAATAATCTGTGGATGTTTAAATAGATCCTATGTTACTCCTCCTGAGGAACCTGCCTGCAGCCTACACCCAGCTCCATGCCTTTGAGTTAAGTCCGTGGCAGATATAGTTAAGCCCAAAATGATTTACAGCCCTAGAAGACTTATGTTAGTATTTTTAAAATATTACTTTTAAACGAGTTTCTTCTGGCAGGAAGTAATAGCAACGTTCTTGAGCGACTCGTCCTTAGTGCTGGCTTTAATCTGGTAGAGAATCAGCGGAAGCAGCTAAAGATTAGGGTGATTGCTTGGAGGCCTTTCAACCTTGGAGGCTTGGTGCTAATCACCAACAAAAAAATCTTTGAAATATGAGTGGAAAAATACAAAAAGATGGTCAGCAATTTTAGGACAGGTTGAATTGCTGTGATGCCAATGAAGATTAGACC
TTGGGCTATTGAGAAGGATGTGCACATTTGGCATAATATTTTGAATAAAATGTAAAACAAGAATGAATTGAAGCCTTCCATTTACATTTTTCAGTATATTTTGGGAGATGCCGCTCTCATTTTTTATCAGAAACAAATGCAAATGATTTAAAATCAAAATCGTCCAGGGGTCGGAATAATTTAGGTTTAACTCTTATTGTCTGTAAAAGTGCTGAAAGCCTGAGTTCTTTTAAATCAAGATTAAAAACACATTTGTTTAGGATTGCCTTCGACTGTTCTAGTTAAACTGTTTCACTGAAATATAATT\n>XM_024809453.1 [Candida] sorbophila hypothetical protein (B9G98_02896), partial mRNA \nATGGATCAACCATCTTTTACTATGGCCGAGCGGCTGTATAAAAAGGCGTACTCTGCTTCGTTCTGGAGCCAGAACGATTCTAAACACGGGTTTGACTCAGAGACCACGACTATTGTGCCGCATCTTGCCGATGCGCCCTTGTCTTTGAGACAGAAGGCACACATTTTGCTAGGGGTTTGCAAAATCATCTCGTCAAATGGGCGAATACTGAGTATAGAGGTTATACGGACCTGGAAATCGATGAACATTGTCAAATCTAAACCTAAAACAGACCCGCTACTGCTACCTGCTCGAAGGTCTCGCTCCCACACTCTCCCAGAGAACCCGCTCATCAACTTAGAGCTGGAAAAGGACTGGCCACCTTATAAACTGCCCAAACTCGCCTACACCCAGACACCGTCGCATTCCATCAGCGATTCTATTCGGTTAACAGACTTCCCCTTGGACCAAACCGAGTCCGACTACTCTTCTGTCACAGAAAGTATGCTTTCATACCAGAGTGATTTATTTGGTAACGCGAATCAGGTCTTGTTTGATCTGACGGAACATTCCGATACTCCTTTCAACCAAGTAACGCCAATTGCTTCGCCAGTTACGTTCAGTGAACCAGTCTACCCCGATGAACCGATCGAGCCTTTAGATTTCAGCGAACCGGATGAAACAGAGGACCCTACAGAAGCAAGACAAGATCCCTCAAGGAAATCTAAAGTGACTATTCAAAAAGAGATATTTTATTCCCAAGATAAACTAAATGAGTGGTTTGATGGCTATGATGAGTTCTGCAAAAATGCCTCTCGGCCATCGAAGAAAATAACATTTGAACGATTGTTTTGGGGTCGAGAAACTTGGTCTGCTAGGCATAATCGAAAACGCAGAGAGGCTGAGCTGCTGAAGAAAAACAAAGCAGCACCACCGGCCATGCCGACACCAGACCTGATAACACCAGACCAGAGCTCTGATGCGGATGAATCCCCTCATCTAGACGCTTTCGACAACCAATTTGATATAATGGATGATGCAGACAACAGTGATATTGAATTTGATGAGACACCGGGAAGTCCAATGCTGGAACTTCGAAAGGGGGAGTTTGAACACACCCTGGATACAGTGGGTCTTCTTCCTGAATCGTGGGATGAATTACCGCCACACCCACGTATCTCTGGGAGCTTTCAAAGAGACCAAAACGAACTTCAGGGTTTCTTACAACAGTTGACTGGCCAAGATGCGTTGATGGCTGGCCGAGTCACAGAAGAGGACGATGTGGCAATATTGGAAAAAGTAAACACCCTTGGTGGGAAATGTCTGTTTGATCAAGTCCACACAGCAACTCGTCTGAGTAAAGGGCATGCGTTTTTCTCGGTTTTGCGACTCGCTCAACAAGGCAAACTATCGCTGAACCAACCAGACGTGTTCGGAAAAATAACGATCCAGTCCTCATTTAGACCGCATTAA\n>XM_044046427.1 PREDICTED: Solea senegalensis ret proto-oncogene receptor tyrosine kinase (ret), transcript variant X1, mRNA 
\nTGATACTGAGGAGGACTTCATCTCTCTGTGTCTGCCCAGACAGAGAACCGCGCACTCGGGACGCACACTGGTTTATACATCGCCCTTTTTTGACTCTTGTGGCTTGATTTTTTTTTTTTAACTATTTAAAGATTTTTTGTATTCTTTTTGCCAAAGGAACTTTTTTGAAGTCACGTTTCATTCACAAACCTTTACTTATGGTGCGCGAAAATGGGGTTAAGTTCTGGTTTCTCTCGTGGAAACATCGCCGTGTTGATGCTGCTGCTGCTGCTGCTTGAAGGAGTGACAGGGTTGTACTTTCCTCAGAAGGAGTACATTGAGACGGTATACGTGGGCCAGCCTGCAGGTACACCGATCCTCCAGGTCCACGCTATGCTGGACAACGACTCCGAGCGGCCGCATTTCTACCTGTGCTGGAGCGCGCTCAAACGTCCACCCCACAACTCCTGGTTCCACATGGACATTAACACTGGAATATTGTCCTTAAACAAAACCCTTGAGGAGAGCGACTTCACCTTCCCAAATCAACATTCGTGGTCAGTGAAGAAGTTGGTCCTTCATGCCACAGTCTTACCCAACGTCTCCAGGAAACCTCACTGCATGAACAAAAACGCCCCTCGGATCACTCTGGACTTTGTCAACGCCACATTGCCACAGTGTGCTCAGACAGATATGAAGGAACTGTGCTTCCCCCACAGAGACACCGCCAACCCTCACATAATGGAGAACAGGTTCCCCGGGGCCATCAGGCAACTCCGACGTCTTACCAGACTCAACGTTTGTCCTAACTACACCATCTCTTATAATGTGGAATCAGAGACCCCAGCGCCATTTGCTGTGAACGACAACTCCACAGAGTTGGTGGTGACCGCTCCATTAGACCGCGAGGAGAGCGAATGCTACAGACTCCTGCTGGTCTGTACAGTCCGAACAGAAACAGTCATCACCAAGGTGGAGACTTCCCTGGACGTGTTTGTTATGGACGAGGATGATAACGCACCATATGTAAATGGAACAGACGCAACAGATATTATCATCAGCTTCAATCGTACAAAGGGTGGCTCCTTTGGAACCTTGTTTGTCTTTGACAGGGATTTAACCCCCATTTTTCACATTGACAAGAGTCACAGTAAGTACAGGGGGACCTTGCTCAACAGTGATGCATGGATAAATAAAACGTTTGACATAAAAGGCACCTTCAGTGAAAAGAAAGCTGCTCATGGAGGCATTCGAGAGACCATTCACGACTACCAGCTTGTCCTGAAGAGGAACCTGTATGTGAATGAGAATCGCTCCGTGCAGCTGGACTACCTGGTCAATGACACAACCTACCCTGGTGTGGAGGGAACAGTGTTGCTGCACTTCAACATCACCATCTTACCAGTGCACATCCGCTTCGCAAACGTCACACACACGTTCACACTGACACGTAGAGCTTCCGTTTATGCTCAGGTTGGCAGAGTGTGCGTGGAAAACTGCCAGCAGTTTGATGGCTTCAGTGTCACGTACCGCCTCGAGGTGCCAGATAGGAACGCATCTGCTGACTTGCAGTTCTGCTATGGAGCCATTAGCATTACCCAGTCTCCTGGCGAGATGTGGGGACTGCTCTATGTGAACGACTCGGAGGCTTTGCGCAAGCCCGAGTGCCAGGACCTGCAGTACTTTGTTGTCGCCCAGGAGGAGCACACAAAGCAGGAGGCCACCACACAGATCCACATCCAACTGGATAGTGAAGTAAACAAAGGCAGCCAGGAGAGCCAGCAGTTCCTGTCCTGTGCCGAAAACAGGCGACGGGGAGACTGTGAGTCTGTCCGAGGCCTGGGGGCAACCACAGGGAGCTGTCAGTGGAGGCAAGGCACAGAGAAAGGAATATCTGAATATTACTCAACCTGCTCGCCTGATCTGCGGACGTGCCCAGATAGCTTTTGTGATGCAGTGGAAAGCAAAGACCCATTAATATGCCCACAAGACTGTACAAAGGAGACCGTAATTGGAGGT
CATGAACGAGGTTTAGGGAACGGGATTAAAGCTGGATATGGAACCTGCTACTGCTACTCTGAGAGATGCTTCTGTGAGAAGGAAGATATTGAGGAGGCGATATGTGATGACATGTGCAAGACCATCATCGCCACGTCTCTGCTGCTCTCCTTTGTCGCCTCCATCCTCCTGTCCTCATACTTCATTCACCGGTATCACAAGAACTCGCCGAAACCACCGATAGCCTCTGCAGAAATGACGTTCCGTCGGCCAGCTCAGGCTTATCCCATCAGCTTCCCTGCAAACAACTTACGCCGGGGCTCACAGGACTCTATTGAGCCTGATACCTTTAAAATCCCTGAAGATCCAAAGTGGGAGTTTCCTCGTAAAAACCTTGTACTTGGCAAGACTTTAGGAGAAGGAGAGTTTGGAAAAGTTGTCAAGGCTACAGCTTTCCGGCTGAAAGGAAAAGCAGGTTACACCACTGTGGCTGTGAAAATGCTTAAAGAGAACGCCTCACACAGTGAGCTGCGTGACCTGCTGTCGGAATTCACTTTACTGAAGCAAGTCAACCATCCGCATGTTATAAAGATGTATGGAGCATGCAGCCAGGAAGGACCATTGTATCTGATTGTGGAGTACGCCAAATATGGGTCGCTCCGCAACTTCCTGCGCGAGAGTCGGAAAGTTGGCCCGAGCTACATGGGCAGGGACGCCAACCGAAACTCCAGCTACCTGGAGAACCCAGATGACAGGGCGCTCACCATGGGCGACCTGATCTCCTTTGCATGGCAGATCTCCAGAGGCATGCAGTACCTGGCTGAAATGAAGCTCGTTCACAGGGACCTTGCAGCACGAAACGTCCTCGTCGCTGAGGGAAGGAAGATGAAGATCTCAGACTTTGGCCTCTCCAGAGACGTGTATGAAGAGGACTCGTATGTTAAGAGGAGCAAGGGCCGTATTCCTGTTAAATGGATGGCAATAGAGTCCTTGTTTGATCACATATACACAACCCAAAGTGATGTCTGGTCCTTTGGTGTGCTGCTGTGGGAAATAGTGACACTGGGAGGAAATCCATACCCAGGCATCGCTCCTGAACGCCTCTTTAACCTCCTCAAAACTGGCTACAGAATGGAAAGACCAGAGAACTGCTCAGAGGAAATGTATAACCTCATGCTTCGGTGCTGGAAACAAGAACCAGACAAGAGGCAGACATTCTCAGACATCAGCAAAGAGCTCGAAAAGATGATGGTGAAAAGTCGGGATTACCTGGACCTTGCAGCTTCCACGCCTGCCGATGCTCTGCTGTACGATGACGCCCTCTCTGAAGAGGACACTCCACTAGTGGACTGTAATAACGCCCCTCTCCCTCGAACCCTCCCTTCCACATGGATTGAAAACAAGCTCTATGGCATGTCATACCCGAACTGGCCTGAGAAGAGCCCGGTACCGCTCAACAGACATGATGCCACTAATCCAGTCTTTACAAGATATGCCAATGATAGTGTTTATGCAAACTGGATGGCTTTGCCTTCACCCGCAAAAGCTGTGGACAAGCTTGATAGCTAAAGACAAACCGACACTGTAGAAAAGATGACTAATTGGTAGATGTATATATTTCTATAAGACTGTATATATATACGATCTGATGCTAAAGTTGGTTCCCTTTTATTTCTGTTGCATGGGTTGCATTCAAGGTTTAAAGCTGAGGTGTTTTGGCTACTAAAACTGGCTGGATCAACGTAGACCATGCTTCATTCTGCTCTTCAGTATGTTAATTATTACCTCATGGGTCATGTTGGCCAAGTTGTATCACTGCATGACTAGTGTACCAGATTGTATGTCAGTGTCAATGTCTTTAAGTGCCTGTGCCGCTTCTACAATACCCTCCAATTGTTAATGTGCGACCGTGAAGATCTTGTTCCAGCCCAGGAATTAAAGGGGACGTCTTTACCATCACTGTTGTAGACAGCTGGGATTGAGTGGACAGAAAATGCTGAACTTGTTCTGCAAATGTAAAG
TTTCTACTGTGGAGAATCCAGCTCCTCGAAATGTCAAAGGCCCATTTTGTGTTTCTCCCACAAGATTTTTCAAAGCTGTTGTTGCCAAAGAAAAAAGTAACACAGACATGTTCAGTGAACGAGTTCATATTCTTTTTTTTCTGTTTTCTGTTGCTTTTTTTTACATGACAAATATCAACTAGAGAGTGTTACTGCAGTGTGAGGACATGAGATTTAATGTAGATCGTGACAATGTTCTTTCGTCAGACTATGGTTCACTTTTTTTTGATTCACTGTAATTGCAATCTTTGTGGAAAAACCGTACGGTGATGTAAAGTAAGGAGTGTTATCATTGTCCTGTTATTATTTGATTATGTTACCATTAATAATAAACATTCAAAATGTGCAGTTTGTCTAAAGACGGATAAGTTTCTGTATGATAGCTTTTTTCACAATTGAAA\n>XM_029888545.1 Pyricularia pennisetigena uncharacterized protein (PpBr36_01358), partial mRNA \nATGGAATCGTCGCTGAAGTGCAACACGCTTCTGTGCAGGACAGAGCTGAAGGACGAAGCTGTCGTCACCAGCTGCCTTCATGTTTTCTGTATTGATTGCGCTTCTCGCGCCAACTTGATCACTCCAGGCGCGGAGCATCTTCGCCAGTGTCCCGCATGCCGTTCGCCCTTGCCGGGTCCAGATCACGCAGTCCATGTCAATCTAAGACCTTCTGATGACTACAAAGGCAGCATTTTACGTGGATTAAGTCCGGTCGCTGTGATTGACTGTGCCAGTGCTGCCTTGAACTTTTGGGAGTATCAGATGGCCCAGGAGATCGTCTATCATGCCTACTTTGAGCAAACATTGACAGACAAATACTCACAATCGAGAGCCGAGCTGGACAAGATTACAGGAGAAGCAAATGGCCAGATAGGAATGCTGTCTGACAAGCTATCCGCGGTCACACTAGAACGTGACTCTGTGCGCCGAAAGAACGATGAGCTGATCGTCATGCTAAAAGAAAAGAACAAAAAGCTCATGCAAGTCCAGGAGCTATACGACAAGCTGAAACGCAAGGCTATGCTAGGTTCACTGCAAGACGGTGCCTCAGAGGCGGTTGATACAACCTTGGATCGAGTTGCAGCTGTTGGTGCCACGCCTGTAGCCGCAGATCGATACCAGCGGCTGGGGTTTTACCAACAACAGGCCGGCGACGTTAGACCTCATGGAGGTTTACAACCAAGAACAGGAAACACGTGGGACCAGCAGTTTAGACGCGATCGCATTGCAGCAACGCCAGAGCACAGAAACCATTCAAACAACACCGCTGGAATTAGACTTTCGAATATACCGGGCTTAGTTGTTGGCGGCGCGCCTCTGCTCAACCAGGACCGCCGTCACGGCTTGAGGTCAGAGCATCAGCACCTAAACGGTGTCCACGGTAACTCTGGGTATGGCGGTGCCAGTACCAACAACGGCCTTGGGCTGAACACAAGTGGTACAACTGGTGCTCTCCCGGGCGGAGCTGTTGGACTCTCATCCGCACAGAAACCAAGCTGTATGGACTCTCAGGATCCTTTTTCGATCATACTTAGAGCTGACTTTGGATATCTTCTCCAGTAA\n>XM_033983629.1 PREDICTED: Periophthalmus magnuspinnatus butyrophilin subfamily 2 member A1-like (LOC117386288), mRNA 
\nGAGGCGCTGTCAGAGTCTGATCCTGAGATCCGTGGACTTTGCACTGCACTTAACTGAAGGAATTTGACCTCAAACAAAACAGAGTTTCACTATGGGTGTGGAGATGCTCTCTGTGTTTTTACTCATGCAGACTCACTTTTGCTGGGGTCAGAACACACTGGTCGTTCCCTCTCAGCCAATCATAGCGCCCGTTGGTAGTGATGTCACTCTGCCCTGTCAGTTGGACCCTGTTAAAGACCTCAGGGACATGGTGGTGGAGTGGTCACGGCACGACCTGACGCCGCGCTACATCCACATCCGCCGGGACGGTCTGGACTTCCTCATAGACCAGAACTCCCTGTACCTGGGCCGCACCTCTGTGTCCGAGAGCCGACTGCAGCAGGGGGACATGTCCCTGAGTCTGACCCGAGTCAGGGCCAGTGACAGGGGCAAGTACAGATGCTACATCCCCCTGGTTAACGTCAAAGCAGAGGTCACTCTGATGGTCGTGTCCGTGGCCCCTCCCTCGATGAGCCTGATCAAAGAGCGCTCGGGGTCTCCCGTGCTGAGGTGTGAGTCCAGGGGCTGGTACCCGGAGCCGGAGCTGGAGTGGCTGGACTCAGAGGGGACGGTTCTGCTCAGGACTGAGGCTCAGAGAGGAGCGAGCGAGGAGCTGTTCAGTGTGAGCAGCAGACTGAGTGTGGAGCAGAGGCTCGGCAACACGTTCACCTGCAGAGTGAGTCAACAGGAGAGCGGCCAGAGCAGAGAGGCCCAGCTCAGCATCACAGATGAATTCCTGGAGGCCTGTCCCTCGTGCTCTGTGGCCTGGGTCCTCTTTAGTTTGCTGCTGTGTCTCGTTGCTGCTGCTGTTGCCTTTGCCGTGTGGAAGTTTCAAATCAACAAAACCAAGACTATGGAGAACAAACTTAAAGACTGTGAAGAAGGTGTGCCAATGATGAGGGAAAAAGAAGATGAGAAAATCCACAGAGGAGACGACAAACACAGAGGAGACGACAAACTGACTGAATACAAGGAGCAATTAGAGAAGATTAAAGAAGAGCAGACGTCTGCTGCACAGTTGAGTGAGGAACTAACAGGAACAAAGATGTTTCTAATGAAACTAAAAGAAAAACTAAACCAATGTAAGTATCAACTCAGCACTGACATGAAGGAGAAGGAGAAGACAAAGTATGACTCTAAGAAAGAGGAGAAAATTAAGAAAATGCAGCAGCAAATGGAGGAGTTTAAGAGCATTATTAAAGATGTTGACACAGAAATGTCTAAAATTGAGAAGCTTCTTTCAAAAACCAGTGAGAAGAAAGGGAAGCTGGATGAAGACGTCAGGCGTTTCACAAAACTGGTGCAACAACAGGAGGCAACAGAAAAGAAGAAACAGGAGGAGAAGAAACAGGAAACCAGGAATGAGGCTCATGATGACACCAGTGGAGGAGAGAATATGAACCCCAGTCCTCAAAAACCAGTAAACCCTCAGGAGCAGACAGAGGAGCTGCAGGCACAGGGGACGGAACCGGAACAAACAGACACAAATACAGAGCACTACTGAGAGAGAAGAAAAGTAAGTGGTACAGCATACCAAACAAAAAATGTAAAAATCAATAATCCATCAAAATAACTAAGTTTATTATTGACTACACGCACACGCACACACACACATTCATAATAGACAAGTGTCTTGCCTAAGGACACAACATTCTGTCACTTCTGTCCCGCTGTGGCTCCTGGTATCACACGTCGTCTCATCCAAACACTGACCAGGCCCCTGTTTATCTTCTGACGTCTGAGGAGATCAGGTTTTGACAAAGAGGTTTGGTCAAGTCAATAAACTTCATTATAATTTACAATATAAATAATATCTGAATAAAACACTGAAATACAGGTTTGAAGTCAGTGATAAATATTTACATTTGTCAGACTAATTGTGCTGTTTTCATCTCAGTGAAAATGTGTCTGAATGTGACAGTTCTGTTCATCAGTGTTTTACTCTGTTTATGTGGTGTC
TATGACTGTGACATTATCCTCAAAGTTTGAACTGAACACAAAAATACAAACGTGACAGAGCGGATGAAGAGAAGTAATATTTTTTGTAGGACATGGCAAATAAGCAACTTTTATATCTTATTTTGTAACACTAATCCAAGAAATATGACTAGTTTTATACACTTAAGTTTGTGTTTGTTTACTGCTTGTTACTGTGGATAAAGTTTAATGGTTTGGTTCTTGTCATTCCATTCAACTAAACTAAACTTTTTAAAACGAAAAACTATGAATTATTTTTTTTATGTATTTGAAATGACTGTTTAACTGTGAAAAAATGTGCAATTGTGCCATCTGTTGGTGTTGAAAAGTAACTACATGTCTAAATAC\n>KJ347058.1 Uncultured bacterium clone Evans.12.9_05674 16S ribosomal RNA gene, partial sequence \nTACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGGCGGCCATGTAAGTCAGAAGTGAAAGCCCGGGGCTCAACCCCGGGACTGCTCTTGAGACTGTGTGGCTGGAGTGTCGGAGGGGTAAGTGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTACTGGACGATCACTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGG\n>XM_027695588.1 PREDICTED: Neopelma chrysocephalum KIAA1217 ortholog (KIAA1217), transcript variant X7, mRNA \nCTCCTAAATCGCCTTTATCTAGAAAAGAAGATTTTAACAGCCGATCACGAAAAATTAGGCTAGGTGAAAAGATTTTGAGAGCTGGCAGCGAAGGAAATCTGGTTAAACAGCATCAGCAGGAGCAGGTGGAAATCACAGAAGGGCTTGTGCCACGGAGGGCTCCTTTCCTGAAAGACCAGGCAAAAACCAGTTTGCATGTAACATCACTAGACGATGCAGAATGTCTCCGATCTAAAGAGCTCCTTTCGACCCCGAACAGTCACACCTCTTCTAATTCAAAGTCCACCCGCAACATCCCTCGAAGACATACAGTAGGTGGCCCTCGCAGTTCCAAAGAAATACTGGGAATGCAAACCTCAGAAATGGACAGGAAGAGAGAGGCTTTTCTTGAGCATCTGAAACAGAAATATCCCCACCATGCTACAGCAATAATGGGACACCAGGAGAGACTGAGAGATCAGACAAGAAGCCCAAAGCTGTCCCAGAGCCCACAGCCCAATTTGGGTGACCAGACAGAACACCTCTCTGAAGCATCTGCGGATTCCTTAGAGGCCATGTCTGAGGGTGATTCTCCAACCCCCTTTTCGAGGGGCAGCCGCACGCGGGCAAGTCTTCCAGTTGTGCGGTCAGCAAACCAGACAAAGGAAAGATCACTGGGTGTATTATATCTTCAGTATGGAGATGAAACAAAGCAGTTGCGGATGCCGAATGAAATCACAAGCACAGACACAATTCGTGCCCTTTTTGTAAGTGCCTTCCCCCAGCAGCTGACAATGAAAATGCTGGAATCGCCGAGTGTCGCCATTTACATCAAGGATGAGAGCAGAAACATATACTATGAATTGTGCGATGTGAGGAATATTCAAGACCGATCTTTCCTTAAAGTTTACAACAAAGATCCTGCACACGCATTTAATCACACTTCCAGAGCTGTAAATGGAGATATAAGGATGCAGAGGGAAATTGCTTATACAGGACGAGATGGCCCAAGTGGTTCCCGCCCTGGATCTGCCACGCACCCTCTGCATGCGATGCCCAGCTCTCCACCCTCCACCCCAGTGCCCCACTCCATGCCTCCCTCTCCGTCCAGGATTCCCTATGGTGGGGGCCGGCCCATGGGTGTGCCAGGCAATGCCACCATCCCCAGGGACCGTCTCTCCAGCATGC
CAGCCTCGCGCTCCATATCGCCCAGCCCAAGCGCCATTTTGGAGAGACGGGACGTGAAGCCAGATGAGGACATGAGCAGCAAAAACCTTACCCTGATCCGAAATGAAGGTCTGTACGGTGACCCCTACTTGTTTCACGAGGGGAGGATGAGTGTGGCTGCACCGCACTCCGGACACCCCCTCGATGTCCCCGATCACATTGTAGCCTACCATCGCAGTGCCATGAGGTCATCAAGCACTTACTGCAACCCTTCAATGCAGCCTGAAATGCTGGAGCAGTCCTTGTACAGACAAAAGTCACGGAGGTACACGGAGAGCCATTTGCCCACTCTCGGCTCTAAAACACCTCCTGCCTCGCCCCACAGGGTGGCTGACATGAGAATGGTCGATATTCATCCTCACCATGGGACTCACATTCCCCACCACACCATCCAGCCTGACAGGTCTTCCCCCAGCCGCCAGTCCTTCAAAAAGGAGCCAGGACCGCCTGTGTTTGTGGATGCGAAAGCACGGAGTGCTGTTGGCCTCCCGGGCATGGCCGAGGCAATGCCCTCTCCAGCTGACAAGCAGGCTTTTGGCTATGGGTCACCTACCATGCCCAAGGACAAGGAGACAAGTGAGAAGATGATGTTGAAAATTGTGTCCAGCAAGAGCAGCGTTGACACTGCAGGTGTTTCTAACATGTCTGGGGGGAAGAATGCACTGGCAACTGTGGAGTCAGCTGTCGTCCATCACCCTGCTGGAGCCCTATCAATGCAAGTCAGCCTGCATGGTATGAAACGCAACGTGTCAGACCTGCGGCTGCAGCTGCATCAGATGAAGCAGCTACAGCTGCAGAACCAGGAGATGCTGAGGGCAATGGTGAAGAAAGCAGAGCTGGAGATCAATGGCAAAATGATTGAAACAGTAAAGAGGCTTGAAGATCCTGTGCAGCGACAGCGCAACCTGGTGGAACAAGAAAGGCAGAAATACCTCAACGAGGAAGAAAAGATTGTAAAGAAGTTATGTGAGCTGGAGGCATTTGTTGAAGACCTGAAGAAGGATTCTGCTGCTTCCAACAAGACAGTTACACTGAAAGATGTTGAAGATGGAGCCTTTCTTTTACGTCAAGTGGGAGAAGCTGTTGCTACTCTAAAAGGAGAGTTCCCAACACTGCAGAATAAAATGCGTGCGATCCTCCGAATTGAGGTAGAAGCTGTGAGGTTCCTAAAGGAAGAGCCACACAAGCTAGACAGCTTGCTGAAACGTGTGCGCAGCATGACCGATATCCTTACCATACTCAGGAGACATGTTACAGAAGGACTGCTGAGGGGTGTGGATCCATCCCAAGCCGTGCAATCCTCAGCTATGGAAAAGTCCACTGCAGCTGACACTCTGAAAAACCAGGAGGAGCACAAGTCTGCCCAAGGACATGCACAGCAGAATCTCACAGCAGTCACATCAGAATCCCAGGTGTCATCAGTGAAGTCAGAAGTCATCCCCTTCTCAACAATGACTGTCCATCACGTGCAGAGCTCGCCAGTTGTCATCCATCAGTCTCAGCACTCATCAGCCCTGGTCAACCATGCCCAGGGCTCACCCACTGCAGGCACTCACAGCGAAGGTGTGCCAGGTCATCTCTCAGCCACCCCGCCAGCCCCCCTGCAAGAGCCCACAACAGGATCCCAGCCCACACAAGCCACACCAGCACCACAGGTCTCTGTCAATGGCACCACCATGCAAAGTCTTTTCATTGAGGAAATTCACAGTGCAAGTACCAGAAACCGAGCTGTATCAATTGAGAAAGCTGAAAAGAAGTGGGAAGAAAAAAGACAGAACCTTGATCACTATAATGGAAAGGAATTTGAAAAGCTCTTGGAAGAGGCCCAGGCCAATATAATGAAGTCAATTCCTAACCTGGAGATGCCTCCCCAGCCAGCAGCCCTGCCTAAAGGGGATGCAGCAGAAAAGCTAGAAGTCTCAGAAGAACTTCCTGATGGAGAACAGGATAATGACAAGCTG
ACCAAGTCTCCACCTCCTCCACCTCCACGGCGCAGTTACCTGCCAGGGTCAGGACTAACCACGACGAGATCGGGAGATGTTGTCTATACAGCCAGAAAAGAGGCTGCTGCTGTCAAGGAATGCAGTGAGGATGCTGGGCAAATAGCACAATCCAAAGCCCCTAAAGAGGATCAGGCATTGTCTCGGAGCACAGGACATGCTATAGCATCAGCTGCAAAAGATGAAGAGGAAGAGGAAGGGGATAAAATAATGGCTGAATTACAGGCTTTCCAGAAGTGCTCTTTTATGGATGTAAACTCAAACAGTCATGCTGAACAGTCCAGAAATGATACACATGTTAAAGACATAAGGCCTGGGACTTTAATGCATCACAAGGAAAAGAAGGTGTATGGGGCTACAACAGGATCTCCCACAGATAGTGATCATCCTAAAGAGAAGAGGGAAGGGAAAACTGAAGAAGAATTGGGTTCTGATTCATCCAGTACAGCTGACAGTAAAATTGGCTTTTCAATGAATGACAGTCCTACATTTAGCAAGGGTTTGTTTGTAGACAGTACAGACTATTCTAACAAAAACCTTCAGAATAAGAGCACAAACCTGTCTGGTGTCAGTTTGCCAGAGGATGACAGACGAAGAGGGGCTCAAGATATTTTAGGATCCCATATTCCAGCTGTTGAAACTGGAAAACAAAAGCCAAACTACAAACTCTCAAGAGATGCTCACCAGGGCCTGCCACAGGGTGAAGTCTTGCAGAGCACAGGCAAGCACATCCCTATCAGCAGCGTTGCCCCTCTCGTGAGGCAAAGCCAGGAGGCCACAGGGCCTCAACCTGCCTTGCAGGAGCAAGAAGGTTCTGCAGTGAACTACAATCAGGTTGTGCTAAGACCCAAAGTGTCCAGAAGTAATAGTGTGAACAGCATTGAAGAGACAGACTCTCCAGCCACCTCTCCAAGTGAAGATGGCCCACCCACAGAAAACATCGCCTTCATGATTACCAAAACAGCTGTGCAGGTCCTCTCAAGTGGAGAAGTTCACGATATAGTCAGCCGGAAAGGAGGAGATGTGCAAACAGTGAACATCGATGCGAGGAAGGACGTAGCATCAGAAAAGGGTATCCCAGAGAACACAGACAGCGAAGAGCCAGTGGTGTGTCTGGACAAAAAACCTGTCATCATCATTTTTGATGAACCAATGGATATCAGGTCAGCATATAAGCGGCTTTCTACAATTTTTGAGGAATGTGATGAGGAGTTGGAAAAAATGATGACAGATGAAAAGATAGAAGAGGAAGAGGAGGAGGAAGACAATGAAGCACATGATGTCTCTGAGAGCCAGAAGGAAGAGTCACCAGTAGTTAATGACAGAAAAGCAACTGCAGAGCATTCAGCAGCTCACAGTCTCCAGGAGCCGTACCTGTTTAACCTTCAGTCTGACTCTGCAGAAAGCAGACCTCCTGCAGAAGAGGAAAGCACAAAGACAAATTTGAACAAATACCGTCAGATCTATGGGCTAAACACAGAAGCAAACTCAGACTCTGCCGATCAGTTTGGAAGCAGGCAGGATTCTAAGAAAAAATTTAAGTTTAAATTCCCTAAAAAGCAGCTGGCTGCTCTGACGCAGGCGATACGGACAGGGACCAAGACTGGGAAGAAGACCTTACAGGTTGTGGTCTATGAAGAAGAGGAGGAAGATGGGACCCTGAAGCAGCACAAGGAAGCGAAGAGATTTGAAATCACTAGGTCTCAGCCTGAGGAGAGTGACAAAAGTCCTTCTGGGAAGCAAGAGGGACCCTCCGGAGCTGCAGCGCCCCTATCTAGGACTGATGAAATTCGACAGAGCACATACAGGACACTAGACAGCCTTGAGCAGACTATAAAGCAGCTGGAAAACACCATCAGTGAAATGAGTCCAAAACCTATCCCTGAAAACACATACACCTCTGAGGGAAGTACTGTCCCCTTCTCTGCCCAGATAGTAGCAGAGACCCCATCCCGAGAGCG
TGTAGTGCTGGATGAGAACCTTGCTGGTGTAGAGCCCCCTGCGTCCATCCCAGCCACTTCACGTAAGGGCTCCAGCGCTGCCTCCCAGACAAGCCGGATGCCAGTCCCCATGACTTCAAAAACTAGACAAGGAAGCATGGAGAAATCCGGCAAACAGCACAAGCTGCAGGATCCACGCCAATACAGACAGGCTAATGGAAGTGCTAAGAAAGCTGGTGGGGACTGTAAGGCTACTTCCCCTACCCTACCTGCTTCTAAGATCCCAGCCTTTTCTCCCACTTCTGGGAAAAGCAGCTCAGCACCTGCTTCTAGCGGTGACAGCTCTAACTCTCTTAATCCACCTACTAAAACCTCCATTCCTTCCTCCAACCTTCTTGGTCCTCAGTCAGGTCGCATAACTTACTCTACCTCCCTCATCCCCTCTGTCTCTAACGGCTCCTCCAAGTTTCAGAGCCCCACTTACCCAGGGAAAGGTCACCATCTCTCCTTCTCACTACAGACTCAAAATGGCCGGCCACCCCCTCCTTCCTCCTCTACCTCCCCCCCCTCCTCTCTGTCCCCCCCTTCACTGAACCAAGGTATGAAGAGCATCAGGACAATCCACACACCTAGTTTCAACAGCTACAAGGCACAGAATGGAAATGCCAGCAAGTCCACCCCATCCACGGTCAAGGAGCCATCCTAAAGGCTAAGCACGGCACACCTGCCAGGTCACCAAGGCTTTTTGTTCATTTTCTGCAGCCAATATTTTAACCAGGGAATGTAACCATTTAACTGTATTGCTGGAGGCTTAATACTAATCACGTGCTAAATACTGAATTACTACACTAGATTAGAGTGAAGCTTTTTGGAAAACTGTTGCTGTTGTACTGATAAAAGAGCATTTTCTTCCTATAGGCAGCACCTCTTACAAAAAGTGTGAAGGTGTGTGAGTGAACTTGACTGCGCGTGCACAGCGGTGTACTGAGCATGGGGAATTGTATGGTTAAAAATTTAGTAAGTTGTTTTGTATAAAGCTATTTTTCATTATGGGGTCTAGAAGTGAACAGAGATATACTAAAGTGTGATTATATTCAATTGTAAAACTGAAACTAAAATATTTTTCTTTTATTTTGGTGTTATTTAGCTTTGTTACAGATTTCTATTTTTGTCAACAAATGTCATGGTTCCTTTCGAGATCTTTTTGCCAAAACATTTTGATACTATTGTAATGTACATTTGAAAGTAGTATGCTGGACAGTAAACCTCTACACAAGAAACAAAACAAGACTGGTCTTATGTGTGTATGAGGCAACTCAAACTATTGCACTGCCATTCAGATTATATTTAAGAATTTGCCAGCCAAGAAAAAAATAAATTGTTTTACACATATAGATAGTTGCTGATTACTTTTTTTCTTAGCTAAATCCACCCTTTTTCCTTCAGTTTTATTTTACTGAGACCTGGTAGCCCATTAATGCATTGCATTGTGGATTTTAAAATGTACACTTCAGTACTGTTCTGTATACTGGCAAACTTTTGTACATATCTATAAATATCTATAAATAAAGAAATACTGTATGTGGCTGGGCA\n>XM_001989357.2 PREDICTED: Drosophila grimshawi DNA-directed RNA polymerase II subunit RPB11 (LOC6562570), mRNA 
\nCCATGAAATTGCTTGTGAACACAAGCCAAATATAGAAGAAATATTTCGCAAACAGTTTTAAACTTTTTATATTGACTTTTTCATTATCGATATGTAAAGAGGGCTTCATAACTAGACAGCACATTGATATAAATACCACAAACATCGCGTACATGCGATAGATCGACTGTGCAGTGTTGTTAAGCATGTGCGCACTTCAAGCGTTTAACAGCACATACTCAGCGCATTATTTTCGTGTCTGCAGTTGATTTTCACAAACAATTGCAATTTTATAAAACATAAATAAATAAGTAAATTAAAACAGCAAAATGAATGCACCGCCCACATTTGAATCGTTTCTGCTGTATGAGGGCGAGAAAAAAATAATCAAGGAATTGGATACGAAGGTGACAAATGCGGCGATATTCACCATCAACAAGGAAGATCACACGCTGGGCAACATGATTCGCAACCAATTGTTAAAAGATCCAAATGTTCTGTTTGCCGGCTACAAAGTGCCGCATCCGCTGGAACATAAATTCGTGATTCGCATTCAGACAACGGCCGATTATTCACCACAGGAAGCATTCATGAATGCCATCACTGATCTGCTGGCGGAACTATCGCTCTTCGAGGAGCGATTTAAGGATGCTATTAAGGAGAAAAAGGAGGGCGGCGATTAGTTTTACACATTTTTATTTTCGACAAGAAATTTACGAAACAATAGAAATATATATATTTTCACTAATTTGTATAAATAAATAAAAGTAATATATGCTATTAGTGAAATGTAATAGTTTCTCAGCTGAGGTAAAAGAAAAAAACAGA\n>XM_027211675.1 PREDICTED: Coffea arabica probable tocopherol O-methyltransferase, chloroplastic (LOC113693095), mRNA \nAGTGCCACATTGTTCCCTCTCCCTCTCTCTCGTTCTTCTCACAAGTTGTCTTGCGTGCTGCTTTGCTTCTCAGGACACGTTGAAGCTTTTGTTCTTTGCTAGCTAGGATTGTGCGGTACAACCAACAATAATGGAGGGGGAGAAGACGGATACCGAGGGAAAGGTGGAGACAGAGAAGATGAACAAGGAATTTGCGATGACATATGATGTCCACTCTAAAATGTTAGAGGATCTAGTTGGGGATCACTTCCATTTGGGCTTCTATGACTCTAGCTCCGTTATCCCTGGTTCTGATGTCAATTCTGCTCAGACTCGCATGATCGAGGCGGCCCTCCGTTTTGCCTCTGTATCAGAGGATCCATCTAAGAAACCAAGAAACATACTTGATGTTGGATGCGGTATTGGTGGCAGCACCAGGTACCTAGCAAGCAAATATGGTTCTCAATGTAAAGGCATCACCCTTAGCCCTTTTGAGGCTGAAAGAGCTCGTGTTCTAACTGCTGCCCAAGGATTAGAAAGCCAGGTCTGTATTGAAAGATTTGCAAGAAGTTATCAATTGTTAAATCACCCTTTATGCAAGTGCACAATGAGTAAAAATTTTCATTCTTCCATTTCTTAA\n>XM_018222954.1 Mollisia scopiformis ARM repeat-containing protein (LY89DRAFT_786121), mRNA 
\nCTCTAAACTGCGACCAAGGAGCCCACGAACGCGAAATAAGGCGCCAGGACTGCTTGGTCATGACAATATTCTCGATTCTACAATATGACTGAGGTGGAGGTCAACGGGATAGCGGCGGGCGTGGTGGACCTAGATCTCAAAACATCACTCTCTTCTTCATCAACTTCAAGGCGGATCAATACCCTCGCAATCTTGCAGGAGAGGCTCTCAAAGAATGAAATCAGCCCGAAATTATTCCCCCCTCTTCTACAGCTGTTATTTGACACGCATGCATACTATCGCGACCGCCCCTCTCGTCGAGCTGTTGAGCAATGTCTAAGACTTGCTTTTCGCTCAGGCTGTGCTCCTCCAGCATTAGCGGGCTTCATCAAGAATCTAGAGGCCGAGTCTTTGAAGCTAGGGATCGCCCCCAGCAATGCTTTTGTTCTGGTAGAATGGTGTAGCATGCTTCTGCAGGTGCTGACTGGAACCGACTACTGGGATATCTGGGGCTTCCAAGTTCTCGAGAGCCATGCTCGATTGCTGGAATTGTGTGTTGGAGAGTCTCCGCGGGACAACATTAGACAAACCGCACTGCGCGTCACATGGCGAGGACTCCGGGAGGCATTCTCTATACCCGAGAAGAGGCAAAATGTGATGAAAGGAGCTATCCAGAAACTTGCGTCAAAAGGTGCTCAGTCATCTGCGAAGAATGCTATCATGCTTGGAGCTATCGCTGGAACATGTGCGAGGAATTTCCAGAAAGAGTCCACGAAATCGTCAGAGATGAAAGAATGTCTCACGAACAAGAAATCCGAATACTACGCATTCTACATTCGAGAAATCATTGGTTCGCGGACTCTTGTACCAAGCCACATATCGAATGCTTTACATGACTTCTTTGCTTCGTTCGCAACAAAGGAGGACATAGAGAGGGAGATTGTTCCTGCTCTGGAAAAAGCTCTGCTTCGTGCACCGGAGATAGTGCTCAATGATCTCGTTACGCCACTGTTTCGTTCCCTTCCTGATACGATAGATCTTACAAGTATTCTTAAGAACAACCTTCTCAAACCTCTGCTTTCCAATATCAAGTCAAGCAATGCTACTATTCGCTTAGGAGCGCTTTCGGCACTTCGTGCTGCGGCTCCCAAGTGTCACGAGGTGAATGTTATTGCTGAGGTTGCAGAAGAGATTGTTACCCCTCTCAAAGCTGGAAAATTGCCTTCCGCTGATCAGAGAGCTAACCATGCCGAGATGCTTGCTCTACTCCCTGTCACAGAGACAACAGCTACCAAGATTGGTTCAGCTATTACCGCCGTTGTCGGCAAAGAAGCAAACGAGGCAGCGCTTACATCGGAGACATCAGCCCTCCTGCATTATGTAAGTTGGGCAATACAGCATGGAATGGATCTGGATAAGCAAATGACAGATGCTTTCACCAAAGGGATCTCGGATAAAAAGGTACCTTTCAAGAGTCTTTGGACCGGACGACTGGGTGAACTGTTCTGGGCCACGGATGATCATGAGATTTTGCGAGGCAAATTAGCTAAACTCGCTGAATGCACAATCTCACCTCTTATGGATATCTGGCAGGAAGTCACGGCGAACCCTTTGGCTGCAGCACAGTCTGGTCTCGTCGCCAGCGCTTTTGTGCTTACTGCTATTGCCTTTACGAAGCTACCACATGTTTCGAATAGCAAGGTTGATACGGCTCTGAAGAAAGCTCAGATAGGAAGACAAGCCTTGGTTATGGAGCCAAAACCTTCCTTCCTGTTGAACCCACGCATTTATGGGAAGCTTACAAGTGAGGAGGATTTCATCTGGCTTCTTCGAGCTCTTGCATCCACTGCACAAGATGTCGTTACGTCTGATACAGTTTCACCTAGCTCTATTGCCTGGTCTCAAGCCGTAATATTCTGCATATGCTCTTCAACCGTCAAGCCGAGTGTTAGAAAGAATGCTTCCGAAACCTTGACTAAGCTCTACCTCAATTATCCTTTAGCAATTGTCAAAGTTATC
GTGTCGGGACTTTGGAGGTGGCGAGACTCCATCGAATCAGGCGACAAGGATAGTGCTGCTGTGTTGTCTAAAACAGAGAACAGCAATATTCACCATGTTATTCGAGCCATCTGTCTATCCCCAGCAGAAGTCACTCAGCTTGGTGGTCAAGTCGAAATGTCTGTCCGGATGGAGCAGATGATTTTACTGTTGGTTCTATCTCGACAGGAATTGTTACCGCGAGTGAGCTGGATCCAGCTGTGTCTCAAAGTTGAGGTAGATCCTGGCAACCTTGCCAGGAAATCTGGAGATGCTCTGGTTCAGCAGATACTTGATTGCACTAGATTTGACGAAAAAGCGACCTTCCAAAGATCCGACAATGTCAAGATCGCTGCTTTCCAAGCAGCAGCAGAACTTGCCTTTGTGGCCCCCGATGCAATGACCCCTAGAATTGTAGAGCTTCTTGAAAATGATCTGGACTCAACTCAATTGACTAACATCGGCCCAACAGAGGCGGCTATCTTCAGAACAGAAGAAGGCACGGCTTTTGTCGATGTGCTCGCGTCCAAGTCCCAAAGCTATGTTCCCAACAAAAATACAAAAGATTACGACACTTTGAAGTGGGAAGAAGAGTTACGAGCTCAGCTCGCACAGAAGAAAGGACAACAGAAGAAACTCACTTCCGAAGAAACTGCCAAGGTTAATGCTCAGTTGAAAAAGGAGTCTGCTATTCGTCTGCAGATTCGCCACCTTCAAGCAAAGCTCCTCCGTGGGTTTGGTATCATCAACAGCCTAGCCACAGGACCGCCTACTGAAGCAGGTCTTTGGATGGGGCCGGCTGTCAAGGCATTAGTGGAGGTAATTAAGGCTGGTGCTGGGCTCATCACAGGCAATGCAGCTCCCGATGCGTACATTGCCTGCGCAGAACGACTTCCGAGCCGCGTTGGTGCTCTGAGGCCATTCATAGGTATCGCGACATTGAGAGCTTTAAATGTACCACACCTTCCAGAGCATCTAGAGGAAGAGCCTCTAGGTGCGTTGATTACCAGAGTCCTTTATCGACTTCGCTTCTCTGGAGAACAACGACCTTTCGATACAGTCTCCTTGATCTACATTCTCCCTCTTGTCTTTCTCGTCCTGCGCGAGAAAGGCTTTGGAGAGTCTGATGACGCTGAAGCTCAGATTGTCTTAGCTTTAGAATTCTTATCTTACCATACAGATGCCTGCTCTGACGAGCTGGTACCACGCGAGGAGATCTTGTCTGTGCTAATATCATCGATGCAAAACTATAATCAGCATTACAAGATGATCAAAGATTGTCTGGCAGATCTTTGCCGTTGTATTGCGCCGAACATAACTGAGATCGAGCTGTCAATCCTTGCCCGCGGAGCAATTGTCCCGCAAGTTTCGGTTCGTTCCTCAGTCCTACAATCAATTAGTGCTGAGATCGATATGAGTGATGTAGACTTCTCTGACGAGATATGGCTCGCTTGTCATGACGACGTGGAAGAGAATGTCGAGCTTGGAAAAGAAATTTGGGAAGAGAGCGAATTTACAGTCTCCGAAGATGCTCCCTTCAGGATGCTGCCTTATCTCGAGATTGTGGACAAGCAATTGAGACGAGCGGCGGCAAGATCGTTAGCGGCAGCTGTGAAATTACGGCCATCAACATTTCAAGATGTGTTAGAACGCTTGAAGTCGACATATCAAGAGCTTGCAAAGCCCCGTGTGCCCCAGCTCGACGAATACGGCATGCCCAAAAAGATGGATCTGTCGGATCCCTGGGAGGCTAGAAACGGTATAGCTCTTGCGTTCAAAGAGCTAGCTCCCATTTTCGAGATTAGCCTACTTATTGCATTCTTGCAATTTCTGATTGAAGCTGGTCCTCTTGGCGACAGAAACCCAAATGTGAGAGAAGAAATGGTAGAAGCAGCTACCAGTATTATCGCACTTCACGGCAAAGACAAGGTGGAGGAACTAATGAAAACCTTCGAACAAACTCTTGAAGCTCCAGACAAAGG
CTCCGAATTCGCGGATCGAGTCAATGAAGCTGTCATCATCATGTACGGAGCTCTCGCTCGACATTTGAAGGCGGGAGATCCACGAGTTCCTAAGGTAGTGGAGAGGCTGCTAGAGACTCTGAGTACACCTTCTGAAGCAGTGCAATACGCTGTTGCTGAATGCTTGCCGCCACTGGTACGTGCGTCGAAAGAGCAGAATCCAGAGTACATCAGGCATGTTCTCGATCGCTTGTTCAATTCCAAGAAATACGCTGCTCGTCGCGGTGCCGCCTATGGACTTGCAGGTATTGTTCATGGCATTGGTATACTAGCTCTGAGAGAATATCGTATCATGTCAACGTTGAAAGGTGGGATTGAGAACAAGAAGGATGTCAATCATCGTGAGGGTGCATTGTTGGCATATGAATTATTCTCAACGATTCTAGGGCGAAACTTTGAGCCTTACGTTATTTTAATCGTACCCCAGCTCCTTTCCAGCTTTGGAGACGCCAGTGCGGATGTACGTGAGGGTTGCTTAGCAGCCGCAAAGGCCTGTTTTGCAAGTTTGAGCTCATACGGTGTCAAGCGAATATTGCCTACGCTCTTGGAGGGCCTTGATGACCAACAATGGAGAAGTAAGAAGGGAGCATGCGACCTTCTGGGTGCTATGGCCTACCTTGATCCTCAACAATTAGCCCAGAGCTTACCTGAGATCATTCCACCATTGACTGGGGTACTCAACGACAGTCACAAAGAAGTTCGACTTGGCGCAAATCGAAGTCTGAAACGCTTTGGTGAAGTCATCAGCAATCCCGAGATCAAAGGCCTTGTGGACGTACTGCTTAAGGCTCTTAGCGATCCTACAAAGTACACAGACGATGCTTTGGACTCTCTCATAAAGGTACAATTCGTTCACTACCTGGATGCACCATCACTTGCACTTGTAGTTCGCATTCTAGAACGTGGACTAGGGGATCGCTCGGCGACCAAGAGGAAATCATCTCAGGTCATTGGCAGTCTGGCCCATTTGACGGAGCGAAAGGATTTGATCTCGCATCTGCCAATTTTGGTCGCTGGTCTCAAAGTTGCTGTGGTTGATCCTGTGCCCACCACACGTGCAACTGCCTCGAAAGCCCTTGGCTCACTGATCGAGAAGCTTGGCGAAGATGCTCTACCTGATCTTATCCCAGGATTGATGCAAACACTGAAATCAGATACTGGTGCTGGTGACCGACTCGGATCTGCTCAAGCTCTGAGCGAGGTCCTTGCTGGTCTCGGTACCAGTCGCTTGGAAGAAACACTGCCCACAATCTTGCAAAATGTTGCTTCCTCAAAGCCTTCTGTCCGAGAAGGTTTCATGTCACTCTTCATCTTCTTGCCTGTTTGCTTCGGCAACAGCTTCGCAAACTATCTCAGCAAAATCATTCCACCAATTCTAAGTGGTCTGGCTGATGAGATCGAGTCCATTCGTGACACCTCCCTCCGAGCTGGACGTCTTCTTGTCAAGAACTTCGCAACTAGAGCTATCGATCTCTTGTTACCCGAGCTGGAACGAGGTCTTGCTGATGACAGCTACAGAATTCGTCTTAGCTCTGTGGAATTGGTGGGCGATTTGTTGTTCAACCTCACAGGCATCAACGCCGGTACCGAGCAAGATGAGGTAGAAGAAGGTGCCCAGGAAGCAGGAGCCTCGTTACTGGAAGTCCTTGGAGAAGAGAAGAGAAACAAGGTCCTCTCGTCTCTTTACATTTGTCGTTGCGATACGTCTGGCTTGGTTCGTACCGCCGCAGTCAATGTTTGGAAGGCTCTTGTGGCCAGCCCAAGAACTCTTAAGGAGCTTATCCCAACATTGACCCAACTTATCATTCGCAGACTAGGAAGTTCCAATATGGAGCAGAAAGTTATTGCGGGCAACGCACTCGGCGAGTTGATTCGAAAAGCTGGCGACGGAGTCCTATCCAGCTTGCTTCCTACACTAGAGGAAGGTCTGCAAACATCGACAGATACCGATGCCAAGCAAG
GTATCTGCATTGCTCTTCGAGAACTAATCTCATCTGCTTCTCCTGAAGCTCTGGAGGATCACGAGAAGACTTTGATATCAGTAGTCCGAACCGCTCTTATCGATTCCGACGAGGAAGTCCGAGAAGCTGCCGCAGAAGCTTTTGACTCTTTGCAGCAGATTCTTGGCAAGAGAGCTGTCGATCAAGTGCTACCCTATCTTCTTAACCTGTTACGCACAGATGAAGACGCAGACAACGCTCTATCTGCCCTCTTAACGCTACTTACCGAGACAACAAGATCAAACATCATCTTGCCTAACTTGATCCCAACCCTCACGACCTCTCCAATTTCGTCTTTCAACGCCAAAGCTTTAGCATCCCTATCCACTGTCGCTGGCTCTGCCATGACCCGAAGATTGCCTACGATATTGAATGCGTTAATGTCCAACATCATCTCCTGCAATGACGAGGGCTTACTCGAAGATCTCAACACATCATTCGACACCGTGATCCTTTCGATTGATGAATTTGATGGTCTGAACACGGCTATGAGTGTATTGCTTGGGCTCTCGAAGCACGATGACCACCGCATAAGAGCAGCTACTGATCATCATCTCGCAAAGTTCTTCGCTGCGGCCACTGTGGACTACTCTCGCTATAACCAAGATATCGTAAGAGCTTTACTTATATCTTTCGATGACCGGGATCCGGACGTAGTTCTAGCCGCCTGGACCGCGTTGAGCGAATTCACTAAACACATAAAGAAAGAAGAGATGGAAGCTCTTGTGTACTCCACACGACAAATCTTACAACATGTTGGAGTTGCTGGATCAAATCTGCCAGGCTTCAATTTGCCTAAGGGCATCAATGCCATCCTACCTATATTTTTACAAGGTCTCATGAATGGCACCGCAGAGCAGAGAACACAAAGTGCTCTTGCCATCTCGGACATTGTAGATCGTACAAGTGGGGATGCTTTGAAGCCATTTGTCACTCAGATAACTGGACCGTTGATCAGAGTGGTATCCGAACGCTCAGTCGACGTAAAAGCAGCGATTCTGTTGACTTTGAACAATCTCCTCGAGAAGATTCCTACATTCTTGAAACCCTTCTTACCTCAACTTCAGAGGACTTTCGCCAAATCCCTGGCAGATACATCAAGTGAAGTTTTGAGAACTCGAGCAGCCAAGGCACTAGGCACGTTGATCACACTCACTCCTCGAATAGATCCACTCATTGCTGAGTTGGTCACTGGATCAAGGACTTCTGATTCAGGTGTTCGTAACGCCATGCTGAAGGCCCTCTACGAAGTCATCAGTAAGGCAGGAGCGAACATGAGTGAGGCATCTCGAAGCGCTGTTCTTACTCTTATCGACACTGACCCAGAGGATAATGATGTTTCTATGGCAATCACAAATGCTAAGTTACTTGGAGCTCTGATTAAGGTTGTCCCCTCGGAGAGTGCTGTTGCCCTCATCAAGAACAGAGTCTTACCAAGTCACTTCACTCAGTCCTCTGTACTGGCTCTGAACGCTGTGCTGCTAGAATCCCCAGCGACTTTAACGGAGACTGCCTTCGCCGATAGCTTACCACAAAGCATCTGTGAAGGCATGCAAAACAAGAACAACTTCATTTCTGACAACTGCGTCCTCGCGGCCGGAAAATACCTTCTATCCGACTCACGCAGCAGTGACTATGAGACGATCAAGCCAATATTCGAGACACTTGCCACATTGATAGGACCTGGACAGTCGGCTGACACTCGACGTCTAGCTTTGGTGGTGGTGCGAACTGTGTGCAGACATCACATGGAGCTCGCTCGTCCTCATCTTCCACTACTCGCACTTCCCGTCTTTGCTAGTGTTCGAGATACCATCATTCCTATCAAGCTGGCGGCAGAAGCAGCATTTATGGCGCTATTCAATGTCGTAGATGAGGAGAGCAAAGTATTCGACAAGTATCTTGCATCTCAAGATCTAGCTGCCAACCAAAAGCGGAGCATGCAGGATTACTTTAAGCGT
GTTGCATTGAGGCTGGGAAATACTGCACGAGAGAGGAAAGAGGCAGAAGGTGGACAGGGCGGCTTGGGACTCTCTCAAGATGAAGTTGATGATGAAAAGGAGATAGCTTCGGTAGGAAGAGTCGACCTTGGAGAGGGAGCTTTTGATGAGTGATGAGTTACGAAAAGGCATGGGAGGTGGTCAAAAAGCGTGCATTGTATTTGGAGGGATCGTTTTTAGACGAATGAATTCTTGCG\n>XM_047966548.1 Annulohypoxylon maeteangense uncharacterized protein (GGS22DRAFT_23129), mRNA \nCCTGAATCACGGTCATTTTACATCATCTACATAGTCTACAAATCGTAACCATATTCCGCAGACTCAGTCAATTGTTTTCTTAACGAAATAAATATGGCCGATCAACCTCGTCGGCGTCGGAACCGCCCCGATAGCAAACAGATGTGGGATGAATCCGACCGTCGCAACCGCAACGAGCCCAACGCGCGCGACAAACGAGACGACCGCGGCCGGGATCGAGACGAACCACCCCGCGAACGAGAACGAGACCGCCGCTATAGATCCAGATCCCGATCTCCTCGACGAGACCGACGGGACAAGAACCGCGACCGTCGAGACAGGGACCGCAACCTTGATAGGGGTAGACCACGTGAGAACGACGAAGCGCGGCCTAGAGCAGACGAGCGTCGCGAGAAGAATAAGAATAAAGGAGATCGTCATCGCGATAGAGATGAGCCTGCTCCAAAGGGTCCGGCTCGAGATCGAAGTCCCCGACGCTCTGCATCGCCAGCTCGAAGCCCGGCTGGGAAGGTAGATCGCAACACGCACAACAACTCACCACTCCCAACGCGACCAAGACCCGGCGGAAAAGCTGAATCAGGGTTGGGATCCTCGCTTCAGTTTAAGGTTGGAGGAAAACATGACGACGATGCGAACCGTGGAGGGAAGAGTGCGGCGGGAGGCAAATTCTACGATGCCAGAGGTTCTACTGATGAGGCTGAGGACCGAAGACGACGAACCGAGACGCCAAATTCCGACCGCGGGGATGCCATGGACGAGGATGTCGACGAAGAGGATGTTGTTGTCGAGGATGACGGACTAAGTGCCATGCAAGCAATGATGGGATTCGGCGGTTTCGGTACCACAAAGGGAGCCCATATACCAGGCAATAATGCCGGCGCAGTGAGGAAGGAGAAGAAGACCGAGTACCGACAGTACATGAACCGTATCGGTGGTTTTAATCGCCCGCTGAGTCCATCGCGGTAATCGTAATACCTACCTACTGTTTTTTTATTGCTTTTTTTGATACACTACGAATCAGACTATGGAGAAGATGAGTTTCCTTGAAAGGGGCGTAGGGAATACACGGACCAGAGGTTAGGTGCTCTTAATTTGATGATCATTATAATCCTTGTTG\n>KF726604.1 Pseudopachylus alticola voucher MZUSP:59952 16S ribosomal RNA gene, partial sequence; mitochondrial \nGCATAATCATTAGTTTTTTAATTGGGAGCTGGAATGAAAGATAGAGACTGAAAAGATAGTTTTTTTTAATTAGTTTGAATTTAAATTTAAAGTAAAAATGCTTTATTTATTTCTTGGGACGAGAAGACCCTAGAAGCTATAAATTATAAAATAATTTTTTATTGGGGCAATAGTTAAAGAAATTAATTTTTAATTTTGGTTTATGGAAAAAAAAAGTTACTCTAGGGATAACAGCGTTATATAATTAGTGAGTTCTTATTGAGAATTATGGTTGCGACC\n>XM_033398930.1 PREDICTED: Drosophila miranda uncharacterized LOC117194359 (LOC117194359), transcript variant X1, mRNA 
\nCCAACGCATGAGCAACATCTCGCTGTCCTCCGGCACGGACTCCGTGGGCCACATGGATCGCGGCAGCAGCTCCAGTCTCGCTAGCAGCGCCACCGTAGGCACCAACACCATCACCAGCGGCATTTCCAAGGAGTGCGCCAATTACCCCGTCGGCAGTCAGTCGGCCCGTCCATACGTCCAACTGCCGGGCATACACATTTCCAACCCTCCCCAGTACGGGCCAGGGAATATGCAGGAAATAGACGCTGGCAAAATGGCGCACAACGGCAAGGCACTCACAGGGCGCTACAATGCCACGCCCACCTATGGCTTCGACAACGAGCAGAACTACTGCCTGAATTCCCAACAGTTGCACAACTTCGAGCTCGAGAACCACACACCGCCGGCATGTCCCGGCTCTGGACCCATTGCCATGACGAACGGCACCATCCAGTTGCGCCTCCGCGATGGCGTGCGCATTGACATGACTCTGGACAAGGCGGTGCGCGTGCTCAATCAGCGCAGCATGGTGGCAAATGCTCTATCACGCAACTGCAGCAACTCGGCTTTGATCCACCCCAATGGACGCATCTTGCAGAGCGGCGCTAAAGTCGAAATAGTCACCTACGACGGCATGAAGGGCAATAACTTTGTTCGCTATGCCAAGATGTGGTACAAGGTGTGAGCAGTGTTCTATGA\n>JF368683.1 Uncultured soil bacterium clone GO0VNXF07IAPWG 16S ribosomal RNA gene, partial sequence \nAGATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGGCAGCACGGGTACTTGTACCTGGTGGCGAGCGGCGGACGGGTGAGTAATGCCTAGGAATCTGCCTGGTAGTGGGGGATAACGCTCGGAAACGGACGCTAATACCGCATACGTCCTACGGGAGAAAGCAGGGGACCTTCGGGCCTTGCGCGTATCGAGATGAGTCCTAGGTCGGATTAGCTTAGGTTGGTGAGGTAATGGCTCGACCGAAGGCGACGATCCGTAA\n>XM_052578998.1 PREDICTED: Carassius gibelio triosephosphate isomerase 1b (LOC127975165), transcript variant X1, mRNA 
\nCCTCGCTGTCTCTTCAACCGGGGGCTGTCTGTCATTTCTACTGTTTTTTTTTTCTCTGTATTTTCTGGTGAACGCAACACGTTTCAGTCATGACTGGCAGGAAATTTTTCGTCGGAGGCAACTGGAAAATGAACGGAGACAAAAAGAGCATAGAAGAGCTCGCCAATACACTGAATAACGCCAAACTCAACGCAGACACCGATGTTGTGTGTGGTGCTCCATCCATCTATCTGGACTACGCCAGGTCCAAGCTGAATCCTAACATTGATGTGGCTGCACAGAACTGCTACAAGGTTGCAAAGGGAGCGTTTACTGGAGAGATCAGCCCTGCGATGATTAAGGACTGTGGAGTTAAATGGGTTATTCTGGGACACTCTGAGAGACGCCATGTTTTTGGAGAGAGTGATGAGTTGATTGGGCAGAAGGTCGCTCATGCTCTTGAGAACGGTTTGGGTGTGATCGCCTGCATCGGTGAGAAGCTGGATGAGAGGGAGGCCGGAATCACAGAGAAAGTTGTTTTTGGCCAGACAAAGTTCATCGCAGATAACGTGAAGGACTGGAGCAAAGTGGTCCTTGCTTATGAGCCTGTGTGGGCCATTGGCACTGGTAAAACCGCATCACCCCAGCAGGCTCAGGAGGTGCATGACAAGCTCAGGCAGTGGATGAAGGCCAATGTCTCAGAAGCTGTTGCCAACTCGGTCAGGATCATTTATGGAGGATCCGTCACTGGAGGGACCTGCAAGGAGCTTGCTTCTCAGAAAGATGTGGATGGCTTCCTGGTCGGTGGCGCTTCCTTGAAAGCAGAGTTTATTGACATTATTAATGCAAAAGCATAAGGAGATAAAGCCACCATCTACCTAAAGCCTAAGGCTTAGGTCTGTTCCCAAACACTGCTCTTCTTTAGAAAGTGTTGTTGTGGTTTTGTTGCTGTCGCTTCATTTTTTTTTATATTACAAAGGGACAGATTGCCACACACTGAACACTCAGCTGAGTGTGTTATTGGCCCTCCAACTAGTTTAGTGAACTACATGACTGTAATGAGAACCATCACGGGGCTTAGAGCCCACACCTTTACTTGAATAATATTAACCAACATTCTCATGTATACAGTGTCAAAAATCTAGGATTAAGTCAATCAACCTCAGTGTCGTTTTAATTCAAGCGAAAGTACTTTCCATGAATGTGGTTGTCCTGATGTTTTCCTGTCCCTCAAAGAGTGTTTCTCTGAGTGACCTATCCTGAAGGTGCTCACATGAAACCAATATGTTTTGGTATAAAGGATAAGACAAAAAATATTCTAATAAATGTTTCAGAATCATAGACTTAA\n>XM_007110546.3 PREDICTED: Physeter catodon golgi transport 1A (GOLT1A), transcript variant X1, mRNA 
\nTGTGAGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGAGCGTGTGTGTGTCTGTCTAGGGGGAGTTAATGATTTACCAGAGGCTCATTTCACAGCTTACCAAGGGTCAGCTTCCCTTGGGCATGTACAAGTTCGACCTTCTGGGCTCCTCACCCCTTGCCAGCTTCCACCTGGAAGGTCCCCCAGGCAGCCCGCAGCATGATCTCCATCACCGAATGGCAGAAGATTGGTGTGGGCACCACCGGCTTCGGCATCTTCTTTATCCTCTTTGGAATGCTCCTGTACTTTGATTCGGTGCTCCTGGCCTTCGGAAACCTGCTGTTCCTCACCGGCCTCTCCCTCATCATCGGCCTGAGGAAGACGTTGTCCTTCTTCTTCCAGAGGCACAAGCTCAAGGGGACCAGCTTCTTCCTGGGGGGCGTGGTCATTGTGCTCCTGCGCTGGCCCCTCCTGGGCATGTTCCTGGAAACCTATGGCTTCTTTAACCTCTTCAAGGACTTTTTCTCTGTCGCCTTTGGCTTCTTGGGCAATACCTCCAACATCCCCTTCCTGAGCATGCTGTTCCGGAGGCTTCAAGGCACCAGCTCAATGGTCTGAACAGCAGAGATAAGCTGCTTGAACTTGGATCATTGGTTGAAGGGGCTGGAAAGGAAATGGGGGCCACCCCCTTAGGCCCCCACCCCACACTGACTCATCTCCCCATCATACCCGGACCTCTCCAAGTCCAGAAGGAAGGATGGAGCCGAGTGACTGACCTCAAATCCCCAAGTCAACGCAAGAAGCTATCAGGACAGTTGGGAGCAGAGATCCAGGTCCCACGGATATTGAACGGGGATCACACCCCACCCTGTATTTATCAGAGGAAAAGCAAAGATTAAATCCCCAAGCTGGGGCTTCCCTGGTGGCGCAGTGGTTGAGAATCCACCTGCCAATGCGGGGGACATGGGTTCGAGCCC\n>XM_009871050.1 PREDICTED: Apaloderma vittatum myosin VC (MYO5C), partial mRNA 
\nTACAATAGGGTTTGGATCCCTGATAATGATGAAGTTTGGCAGTCTGCGGAAATCACGAAAAACTACAAGGCTGGAGACCGTTTTCTCCATGTGCAATTAGAAGATGGAACTGAACTGAATTACCCTGTTGATCCAGCTGCCTTGCCACCCCTACGAAATCCTGACATACTCGTTGGCGAAAATGATCTCACCGCGCTTAGTTATCTCCATGAACCAGCTGTTCTACACAATCTTAAAGTTCGTTTTATGGAATCTAAGCTTATCTACACCTATAGTGGAATAATTTTGGTTGCAATAAACCCCTATAAACAGTTGCCGATATATGGAGATGCTATTATCCATGCATATAGTGGGCAAAACATGGGGGACATGGATCCACATATATTTGCTGTGGCGGAAGAAGCATACAAGCAAATGGCAAGAAATAACAAAAATCAGTCTATTATAGTCAGTGGAGAATCAGGAGCTGGAAAGACTGTGTCTGCAAGATACACTATGAGGTACTTTGCCACTGTGAGTAAGTCAAGCAGCAATGCACATGTGGAGGATAAAGTGTTGGCATCCAATCCAATAACTGAGGCTGTCGGCAACGCAAAAACCACACGGAATGATAATAGCAGTCGATTTGGAAAATACACTGAGATCAGTTTTGATCGGAGTTACCAAATCATTGGAGCTAATATGAGAACATACCTGCTTGAAAAATCCAGAGTTGTCTTTCAGTCAGAGAATGAGAGAAACTATCATATATTTTATCAGTTGTGTGCATCTGCTATGCAACCTGAATTTAAGCATCTTAAATTAGGAAGTGCAGAAGAATTTAACTACACAAGAATGGGTGGCAGCCCAGTAATAGAAGGAGTTGATGACAGAGCAAATATGGTGGAGACTCAGAAGACATTTGCCTTGCTGGGTCTGAAGGGGGATTTTCAGATGGATGTTTTCAAAATGCTGGCAGCAATCTTACACTTGGGCAATGTGGAAATAACAGCTGTTGGAGATGAAAGATCATCCATCAGTCTGGAAGATAAACATCTCAATATATTCTGTGAACTCCTGGATTTAAAACGTGACAAAATGGCACAGTGGTTGTGCCACCGAAAGATTGTCACTACCTCCGAGACTGTAATAAAGCCAATGACAAGAGCTCAGGCTGTTAATGCAAGGGATGCCCTGGCGAAGAAGATCTATTCACATTTATTTGACTTCATTGTGGAAAGAATTAACCAAGCTTTGCAGTTCCCTGGCAAACAACATACTTTCATTGGTGTTTTGGACATTTATGGCTTTGAAACATTTGATGTGAACAGTTTTGAACAGTTTTGCATCAATTATGCCAATGAAAAGCTGCAGCAGCAGTTCAACCTGCATGTCTTTAAACTTGAACAAGAGGAATACATGAAGGAAGATATCCCATGGACTTTAATAGACTTTTATGACAACCAGCCTGTCATTGACCTTATTGAAGCTAAAATGGGAATTTTAGAACTTCTGGATGAAGAGTGCTTGTTACCTCATGGAACAGATGAAAACTGGCTTCAGAAGCTCTATAATAATTTTGTGAATAAAAACACACTCTTTGAAAAGCCGAGGATGTCGAACATGTCTTTCATCATTCAACACTTTGCTGATAAGGTGGAATATAAAAGTGAAGGATTTCTGGAAAAAAACAGAGATACAGTACATGAAGTATTGATTGAAATCTTGAAGGAGAGCAAGTTTCATCTGTGTGCAAATTTTTTTCAAGACAATCCAGTGTCCGTTTCACCTTTCAGTTCAACTATAAACATCAAATCTGCAAGACCTGTTCTCAAGCCACCCAACAAACACCTCCGGATGACAGTTGGCAGTAAGTTCCGGAGCTCTTTGTCTTTGCTTATGGTGACTCTTAATGCAACAACCCCTCACTACGTACGATGCATAAAGCCGAATGATGAGAAGTTGCCTTTTGAGTTTGATTCGAGAAGAGTTGTTCAGCAACTGCGAGCGTGTGGTGTT
CTGGAAACTATTCGAATTAGTGCACAGAGCTACCCATCCAGGTGGACTTACATTGAGTTTTTCAGCCGTTACAGCATTCTTATGACACAGCAGGAGCTCTCCATAAATGATAAGAAGCAGATTTGCAAGACTGTTTTGCAGCGGCTAATCCAGGATCATAACCAGTATCAGTTTGGGAGAACAAAAATTTTCTTCCGAGCAGGGCAGGTTGCTTACTTAGAAAAACTGCGATCAGACAAACTGAGATACGCATGCATCACGATCCAAAAGAGCATTCGAGGCTGGCTGCAGCGGAAGAAATTTCTTCGCATAAAACAAGCAGCTGTTATAATCCAGCAGTATTTCCGAGGGCAGCGGACTGTGCGGCAAGCTATAACTGCAAGAACTCTGAAGCAAACGTGGGCAGCTATAATTATTCAGAAATACTGTCGAGGTTACTTGGTCCGTAGACTTTGCCAGCTCATCCATGTGGCTGCTGTAACAATTCAAGCTTATACAAGAGGATTTCTAGCAAGAAAAAAATACCGGAAGATGCTTGAAGAACACAAGGCTGTGATCCTCCAGAAATACGCCCGTGCATGGCTTGCCAGGCGCAGATTTCAGAATATTCGTCGGTTTGTATTGAATATCCAGCTTTCATACAGAGTTCAGCAGCTGCAGAAGAAGATAGAAGAGCAGAGTAGAGAAAATCATGGTTTGCTGGAACGATTGACCAGCCTGGCTTCGACTCACGTGAATGACATGGAAATAATACAGAAACTCGAATTAGATCTTGAAAAGGCAACTGCTCAAAAGAGAACGTATGAAGAGAAAGGGAAAAAATATAAAGAGGACAGTGAACAGAAAATCCTAAAACTCGAGAATGAGAATAAAGAATTACAACAACAGAAAGAGACCTTGGAAATAAAGCTCCAAGAGAAAACTGAGGAAATGAAAGAGAAAATGGATGATCTCACAAGGCAACTGTTCAGTGATGTACAAAAAGAAGAAAACCAGAGAATGATACTTGAGAAAAATTTCCAAAATCAGAAGCAGGACTATGAAAAGGAAATCGAAATGCTCAAGGGAGAAATTAAAATTCTGAAAGAAGAAAAAACTCGGCTACAACATCAAATTCAGCAAGAAATTGTCATTCAGGACAGCTTGAAAATGGAAGTAGGACAACTTACAAAACAAGCACAGAAAATACCTGAGTTGCAAAAGGAAATTGAACTGCTGCAGACACAAAAATTGGATATTGAAAAGCAGGCCCAGTCACAGAAGCGAGAACTGAGGGAAAAGATGTCAGAAGTTACAAAACAGCTTCTTGAAAGTTATGATTTTGAAGATGTAAGAAGCAGACTCTCCACAGAGGATTTGGAACACTTAAATGAGGATGGGGAACTGTGGTTTGCTTATGAGGGCTTGAAAAAAGCTACAAGAGTATTGGAAAGTCATTTTCAGTCTCAGAAAGAAATATATGAAAATGAGATCGAAGGCTTGAACTTAAAAGTTGAACATCTTAGCCAAGAAATTAATCATCTACAGAAGTTATTTCGAGAGGAAAATGACATAAAGGATGGCATTCGATTGGAAGTTAGCAGGCTAACTTCAGAAAACCTGGTGATCCCAGATCTTAAGCAGCAAGTTTCTGAACTTGAAAATCAAAAATTAGATCTTGAAAACCGTCTTCAAGAGCAAACTGTAAAGTTGAAAGGTAAAGTAACAAATGATGTAGATATAAAAGAAAAAGAGAGACTGAAAGTCACAACCCAAGAAATTAAGGGGCTGAGCAATGGTCTAATGCAAGATGAAACCCAGGATGAAGTACAAAGCAAGATGAAGCAAGAGACAACTCGACTTACTGTGGAAAACATGGATCTTGAAGAAAAACTAGACATGAAAGACAGAATAATAAAAAAATTGGAGGATCAAATCAAAACTCTTACCAAGACTATTGAAAAAGGAAATGAAGCTCATATGCCACCTTTGTCCAGAGAGTACATTGGAATGATGGAGTA
CAAAAAAGAGGATGAAGAAAGGATCATCCAAAATCTGATCCTCGATTTAAAGCCACGTGGAGTTGTAGTTAATATGATACCTGGCCTTCCAGCTCACATCCTCTTCATGTGTGTGAGGTATGCAGATTATCTGAACGATGCTGACATGCTGAAATCTTTCATGAATGTAACCATTGATGGTATCAAACAAGTTGTTAAGGAACATTCAGAAGACTTTGAGATGTTGTCCTTTTGGCTTTCCAATACATTTTATTTTCTTAACTGTTTGAAGCAGTACAGTGGGGAAGAGGAATTTATGAAGTGTAACACGCCACGTCAGAATAAGAACTGTTTGAAGCATTTTGATCTCTCAGAATACAGACAAATTCTTAGTGATTTGGCCATTCATATCTATCACCAGTTCATTACTGTAATGGAGAACAACATTCAGCCCATGATCGTACCAGGCATGCTGGAATATGAAAGTCTTCAGGGAATTTCTGGCTTGAAACCTACAGGGTTCCGTAAACGGTCTTCTAGCATAGATGACACGGACACCTATACAATGACCTCTATCCTGCAACAGCTCAGCTATTTTTATAGCACCATGTGCCAGAATGGCTTGGACTCTGAGCTGCTGAAGCAGACAGTGAAGCAGCTTTTCTTTCTGATTGGAGCTGTCACCCTCAATAGCCTCTTCCTCCGCAAGGACATGTGCTCATGTAGAAAAGGAATGCAGATAAGATGTAATATCAGCTACTTGGAGGAATGGCTTAAGGACAAGAATCTTCAAAGTAGTAATGCCAAAGAAACTTTGGAGCCGCTATCTCAAGCAGCCTGGCTTCTGCAGGTCAAAAAGATCACAGATGAGGATGCCAAGGAAATATGTGAACACTGCACGTCTCTTTCTGCTGTGCAGATAGTTAAGATCCTCAACTCGTACACTCCAATAGACGATTTTGAGAAAAGAGTGACTCCATCGTTTGTTCGTAAAGTCCAGGCTATGCTAAACAATCGTGAGGATGTTCCACAGCTGATGCTTGATACCAAATATGTCTTTCAAGTGACGTTTCCTTTCACCCCCTCTCCACATGCCTTGGAAATGATACAAGTCCCCAGCAGCTTCAAACTTGGCTTTCTCACAAGGATTTAA\n>XM_020048109.3 PREDICTED: Esox lucius basic helix-loop-helix and HMG box domain-containing protein 1 (LOC105026992), transcript variant X2, mRNA 
\nCCGCAGCTTGGTAATAGACTGGTTGTTAGTTATTGCACACATGTAGCATTTCTATGTAGCTAGCTAGTACTCTTAGCTAATTTATATTTTGCTGGCTTATCTGCTCGCTCTCGCTGTCACAATTGGCTACTAAGCGGTTTTACAGGTGTGGGTGAATTTTGAAGTGGTCTATTGTCCAGCCTAACTGCATGTTTGATCCCGATGAAAGATTTGAGCCATGGCACCTGGATCCAAAGGCAGAGACGGAACTCGAAAGAAAAGAAGGAGACTCTGGTCCACATGCTGCGCTATTTTGACTTCCTTCAGAGTAAAATACAGACCTTGCAGAGGTGCTTGCCCCCTGAAAGCATCCCCAAGCAGGAACCTGACACAGGATCTGAGAGTGAAGAGAACACCCCCTCTGAGCCCTGTACACCCTCTCATATTCTAAAGGCTAAGCGCAAGTATGTCTGCAACCGTTCCCATAAGAGACTACCTGCCTCCAGCTCAGAGGTGAAAGCAGAGCTTCAGGGGAAAAGAAGAAGATTGTGCACTGCAGATGTCAGTAGACAGAAAGCTGACCCAAAGGAGGAGGATGTGCCTGTCCCTATGTGGGGTGTGCATTTTGATTGGTCAGAGTGCCATTCCAGTGATAGTTATGGGGATTGGCATGTGCGTGAAAGTGACTCCCAACCAAGCTCCCTGGATTCGGGCTTCAGCTTCAATCAGTTGCTTCCCCTGAGCACCCCTTTGGAGGGGTGCAGTGGGACTCTGAGGACTCCATCCACTCTTCAGGGAGGCCACTGCTCTGCCTGTGAGGACGGCAGTGAAAGCAGCCCAAGGAGCGGTGTCCTCCATACCCCAACTACTCCAGTTACTGGGCCAGGGTCACTTTTCCTGAAGGATCACATGGTTGGGGTCATCCCGTCCACAGGAGGCCGATGGAAACCCTTCCTGAGCCCTGCTGCTACACCAAAACGGCCCATCTTTCTGCCGTTTGGAACTGAGGACAGTCTGAACTTGGGCGAGAGTCTGAACCTTAGTCCGTCTCTCCTCACATCACCTGGCCGGGGCCTCAGCCAGTGCCTGCTACCTGAGGGACCGGAGGAGCTCCATGTGCTGTTTGAGGATGTTTGGGTCACCCCTAAAATGACCCAGGCCAAAGTGTCCCACCTATCCTACCATGACCCCACTGACACGCTGTCAGATGGAGAAGCTGTGGTGAGGCATAGCGGTGGAGGGTGGTTGTCCTCCCACAGTGAGGGGGAGGAGGAGGACGTCACCTGGACCCCCAAGCAACAACAAGTCTCTCTGAAGTCCAAGACCAGTGGGACAAGACGCCACCGCAGAACCAACGCCTCCACCAGGGGGCACCCTCTCCTCCCTCCCAACCTGAAGAAGAAGTGTATTAACGGCTTCATCATGTTCTGCCGCATCAACAGGAAGACCTACCTACGCACCCACCCAGGCACGCCATCCACCGTGGTCACCAAGGAGCTGGCCAGCCTGTGGCACGACATGCCCAAGCAGGAGAGGCGTGTGTACTGTCTGAAGGCTCGTCGCTTCAGCCGTCAGCAGAACCGTAACGTGAAGCCTCAGCCGGCGGAGGGGGAGGAAGAGGACTTTGTGCCCAGTCCACTCCACATGCTGCTGGCGCAGAGAGACCTGAGGGCTTCAGCCAGAGGAGACTCCTAGAGCAGTTCCCTTCACACACACTGGCCCTTCGCCAACCATATGCATGGGATGGATATTGATATAGATGTCCATATTAAAATCAACAACTTCTCTTTTTAAGTCACTTACTGTACTAGTTAATTATGGAGTTGTTTAGAGATTTATCTGAAATGCAGACACACTTTGTGTGTGTGTCTGGCACGTCACATTTTAACTGTTACTGTTTACTGCTTCAAGTTGTTTCTAGACAATGTTCAGACTTGGTTTTACAGATATCATTGAGGAGCCTTTTAGACAGGGTTTATTGACAGAAGTCTTTCTGTGGGTTATAATGCCAAGGCATTG
TTTTGCTATTCATGTCAACCTGACGTTGAATTCACCAGTCTATTTATGATCATAATGCAAAGGACCAAATAAATGACAGTATGTGGCTGACAGCTTTATTTATTACCTATTTATACTCAGAATATATTCATATGTGGGGAATGTTAATGTGTCTGTGTGAAGTCCTTCTGTACAGGACAGATGAGAACCAAAGTCTTACCGTTTGGAGTTATTCACACTGGTTGGTTGATGTTTTTATGCGGTGTGAAAATGTTTTGATGTTTCGTGAATAAAAGTTATTACTACTTAGTAGTGGGTTATTTGAGACACATCAAATAGTTTGTTTA\n>XM_034078853.1 PREDICTED: Pseudochaenichthys georgianus glutamate receptor interacting protein 1 (grip1), partial mRNA \nGACGGGCGCGATCCACGTTGGGGATCGCATCCTGGCGATCAACAGCAGCAGCCTGAAGGGGAAGCCTCTGAGCGAAGCCATCAGTCTGCTGCAGCAGGCCGGAGAGACGGTCACGCTGAAGATCAAGAAGCAGGGCGACCTGGCGAGCCCTAAGTCCTGTTTGATTGGTTCAGGCATGGGGGCGGGGCTTGTGAGGGAACACCAGGACGGCGTTGACGATCCGGTCATCGTGGTTACGCCGCTGTCGGGTCAGCGAGCGTTCAGCACCCTGCCGTCGGTGGACAGCGCCGTGGAGTCCTGGGACGGATCCAACGTGGACAGCTTCACCCCCCCGGCTCCTCCCTTTCAGTCGTCTCCGTACAATTTCCACGACTGGCGCAACGCAAAGACGACAAACAGCCAATCATCTTCCTGCGCTCGCCAGAGAGCCAATCAGCTGTCAGACCTCGGCCTCAGCGACGACGAGTGGGACCGCCCACCAATGGGAGGAGCCTATAATCTGCCCAGCGGTTTGATCACCGACTGCAGGTTCAGCGTGGGTCATGATGGGACGGAACCGGATCAGGAAGAGAACTTCTGGTCTCAGGCTTTAGAGGATCTGGAGACATGCGGACAGAGCGGCATCCTCCGAGAGCTGGAGGCTACCATCATGTCCGGTTCCACGCTCAGTCTGAACCACGACCCGACCCCTCTGCGCAGCACTCTGGGACGCCAGGCCAGCTTCCAGGAGCGAAGCAACTCCAAGCCATCGGTAAACTCTCGGTCCAACACCTTGCCCTCTGACCCCACGCGCCGAGCCTTCGCCATGAGGAAGATGAGGCAGGAAGTCAACGAGATCCTAAACCAGAACCCCGTGGAGCTCCACAAGCTGACTCTAGAAAAAGCCACAGATCTGGAAGATTTTGGGTTCAGTGTTTCTGACGGCATGTTGGACCGCGGCGTCTACGTGAACAACATCCGACCGGGAGGACCAGCAGAGGGCGGCGGCCTCCGAGCTTACGATCGGATACTACAGATTAACCACGTTCGGACTCGGGACTTCGACTGCTGCCTCGTGGTTCCTCTGATCGCCGAGTCTCCGAACCACCTGGAGCTCGTCATCAGCCGAAACCCGACTTCCTCGTCCACCACGCTGTTGACCAATCACACTGACGGCATCTACAACAGCGGCCACTCCCCTCAGCCAATCGGCAGCGACCTCGGACCTTTGGAGCTCTCCATTGGCCAGTTGGAGGACGGCGGTCCAATCAAGTGGAGCCAACCGGGGGACATGTTGGTGGCGGGCCTTGGGATGGGTCAGGTCAATAATAATTCCGTATAGCAGACAAACAATGGATTCAATTAACCAGATTGGACTGGAGAGGCCGACCAAACAGCAAAATGACTGGTTTTGACCAGTCCAAACTGGTTTAGAGTACCCTATGGTGCTACACACACCCTCTGGATGACCTTTGAACTGTTGAGGCAGCCTGAAAGCACACTGATGGACCGGAGCAACTCCTCACCTTTTCACAAGAACCAGTTCTGCATACTGGTCCTTTATTACTGGA
GTCACTGGAACTATAACTACTGATCCTACTGGAACCACTATGAGAGAGCTACTGGTCTGACTGGTCCGACATTAATGGGTACTCGAGTCATGGATGCTGATTCTTCTAAAGCCAATGGTTTTACTGGTTTTAGATTAATGGTTACTGGTCCAACTGAAGCCAGAGCCACAGCCAATTAATGGTCCTACTGGCCAAGACACATCGGCTCTGGTCTTATGGTGAGTTCACACCAAATGCAGAGCTGATGCACTTTGGGTAAACTGGCAAAAGATGGGAAGGCAATTGGTTTGAACTCGGCATAAGTGGGAACAAAACCAATCTGAAGCCAAATTGATTGGTCTTTTTGGTCTAGAAGACTCGGGTTCTGGTCTGAGTGGTGACAGCATCACGAGTACTGGTTCAACTGGTCCAAGACATGGTTGTTATGGTCAAAGAATCATGTGTACCACCAAGCAAGATCCATGACTACTGTGGAACTGGGTCTTCTGGGCCATCTGGTCTTACTAGAATCAGAACCATGGCTCTAATGGCTGTACTGGCCAAGGACCACAGCAGCACAAAGACTGATGGGAACCAGAACCTGCTGACGGACACACGGGTTGCCATGTAGACGAGGGACGCCCCGATCTAGAGCCAATCCAAACCATACTGATTACTGACTGGTTTCTGGTCTTACAGGTTCATTTATGTCGACGGTATAGGTATACATATCTATATTCGGCGCAGTGTGTTGGGTTTAGGCGCACAATTAAAACTAGTGATGGTTAAATACAAGTCTGAAAATGGTCAAATGCAAGTATAATATTGACAAAGTTGGTTTAAAGATAAGGACTAAGGACGTGGATGGTGTTAGGTGGGGTTTAGGTGTAGTTCAGTTTGTTCTAATACAGGGCTGTCAAACTCAATTTCATCACGGGCCACATCAGCATTATGGTTGAACTCAAAGGGCCGGTTGTAACTTTAAGACTATATAAAAATACATATATAAATATTTTATATATTTAAAATAATGTATTATATTACTTTATTGCCTCTGCTTTGGATTATTAAAAAGCTTCATAGATAACTACGTCTGAAAGAAGAAGTCTAGGGCAAATAAGTGCAAGTCTCTTCA\n>XM_046869510.1 PREDICTED: Silurus meridionalis nucleolar protein 9 (nol9), transcript variant X4, mRNA 
\nGTATATTAAGAACATGAAATAATTCGTTTTAAACCCCGGGATATTTCGTATTGTCCATCCCCTTGTTCGTTCCATACCGCTTTTGGAGCATACGCTAGACAACGGGCTGTGTTTAGATTTTTTATAATATTTTAACAACATGGTCGTTTTTGTCTCACTTTAGTGTAGGAGCGTTTGCAAAGCATAAAAGGGGGTTAACGTTTGTCTTCGTTTGAGGGTTAATATTATTGTTAACGTTGACGTTAAAGAACTGCAGGACTGCTCACATGGAGAGATCCTAGCTGTGAATTCCTGTTTATGGCTGCAGATTCTTGAATATTTTTATCAGCTAGCCATTTAAAGAGGTGGTTTTTCACACCATGAGCCAGTGCCAATGAAAGTTCACAAGCCACAACCATGAAGGTGCATAAAGTCTCCTCTCGCTCCAAACATGAGAATCGAAATGCTACGAAACGCCACTCCAAAAACAAGTGGCGCACTCACGGGAAGAAGAACCAGCACGTGGACCCTTCTGGCCAGAATCCCAGGCCTTCGACGGCAAAGTTTGAGAATGAGCTGGTTAACAGACAGAAGCCCAAGGTGAAGCGCTTACAGAAGGCTTACACCAAGGCTGCAACTGTGACGTCCAAAGACAAATGTTCATCTCAGGCTAAAGGCAAGGCTCTGTCTGCACCCTGTCCTCACGTCCACACCAACGGGGGTACTGAGCTGGAGACGGAGAGCGACTCGGAGGACTCCCAGGTCTGGAGGTCTTACGCCAAGAGCGTTCTTCAGAACGGTGCCGAGAAAGAAGGAGAAGGGAACTCGGTTTTAAATCAGTCTGAGGAAGTGGAGGTGTTGGAATACCACGCGCAGTATGAACGCTCCCAGAACCACACAGTGTTAGTACTGAAGCAAGGCCAGTCCCTATGTTTCCGAGGAACGTGCCTGCTGATGTGCCTGAGCGGTCGTGTGGAAGTGATGGGCTTTACAATCGAGCAAGGCCAGCAGCCGTATCCGCTCTTCTCCCCATCGTCCCACTGTCCGCTCACCATCAAGGCCATGGTCGAGTGCACATCCTCAGCCAAAAGCAGGAGGGAAACTCGATTAGAGGCCAAAGCCATCGTCCGCAAGTACCTCCTGCCAGGCGGCGCCGTTGCCGAGGCTCGTACGAGACTGCTGAGCGAGGTGGATGCAGATTCATGCGTGGTGCTGCTTCAGCCGCTGGACACGCCCCTCACACGCTTCCTCTCCAGCTTCGGCAGCTCCTTCAGCCATCTCTTCGACCTCAGCTCGAAGGAGCTGCACTCCCAGGCTGCCGTGTATAACCCAGCTCTCTCTGCCGTGGGCGTGACGGCGCTGCAGGGCCCCTGTGCACGTGGTCTGGTGGCATCAAACAGCTATAAAGAGGCGCTCAGTCGCCTGCTCAGTGCATGGGAAGGGGATTTTGATCGCTGTCCCATTATTCTCGTCTGCGGGGCCAAAAACTCTGGCAAGTCGACTTTCAACAGGCATCTCATCAACAGCCTGCTTAACCACACTGCAAGCGTGGAGTATCTGGAGTGTGATCTTGGCCAGACGGAGTTCACGCCTCCCGGGTGTCTCTCTTTAATCACTGTGACCGAGCCACTGTTAGGCCCTCCATTCACACACCAACGAGAGCCAGAGCACATGGTGTTTTACGGCCAAGCAGAATGCCAGTCCGATCTAGACCGCTACCTGGACTCACTCAAGACCCTGTGGAGACACTACAGCGGAGAAAACCCGGTCATTATTAACACCATGGGATGGGTTAAAGGGCATGGCTTCCAGGTGCTGGTCGACCTCATTCGCTTATTCTCCGTCACCCATGTGGTGCAGCTGAGCTACGGTGACACGCCCCAGTGCCATACTCTCAACCCCGACTTCCTGCGCTCTGCCCAAGGCTGGCACACTCATCCACCGGCGCAGTCTGCCCTCGCGGAGGAACCGGCCAATCAGCTCTCGGCACGGGGTCACCTCCTCCTCAGCATCCACTCG
GAGTTCGAAGGAGCCGGGACATCCGGGGAAATGCGTCATCAGCGCAGTAACGAGCTGCGTGAGCTGGCATTGCTGGGATACTTCAGCCAGCTACAGTCTGCAGAACCCGGCCCTATCTGCCCCCTGCACTGCTTCACCCCCTACCAGGTGCCCCACTCGGCTATCGCTCTCGGAGTCACTCACTGTGACGTGGCACCCAACCACATCCTGTACGCCGCTAACGCCGGTTTAGTGGCTCTCTGCTGTCTGAGTGAAAAAGTGGCAGGAAGAGGTGGACCTGTGCTACTGCCTCAAACGCCCATCTGTCAGTGCGTAGGCTTAGGTGTCCTCCGAGGGGTGGATATGGCCCGAGGGCTCTACTTTCTAGTCACCCCAGTGCCTCCGGCGACCCTGAGGCAGGTCAACTGCCTGCTGCTCGGGGAGATCACACTGCCGAAAATCCTGCTCACTGTCCAGCATGGTGTTGAGACGGAGCTTCCTTACGTCACCACAGATTACAGCTTTGAGATCACGGGCGCAGGAAAAGTCCACGTTTTCAAAGGGCTCGCGAGGTCCGGTTTCGTCAAAACTAAAACAAATAACTAAGCTCTCTTATACGGATTTCACTTTCAGCGAACGATGTTTGTATCCCTGTACTTGTTTTTTAGACCAAATAAAGAGGCTTCAGCTGCCACCGAATGTA\n>XR_003057350.2 PREDICTED: Ziziphus jujuba var. spinosa uncharacterized LOC107427618 (LOC107427618), transcript variant X2, misc_RNA \nGTAACTTGCAAGCAAAATAGGGCTGGTTATATATATTACACTTTGCTTACCTCTCTTTGAGATGGTCTTAGGCTTGAAGCGAGACCATTTCTAAGCAAATTAAAACTACGTCATCCCTTGGCGTGTTTGTAGTTTGAATGTTCATTTTTTAGTGTTTTTTGGCTTCCAAGAATTCTCACATACCCATATGAAAAAGCACATAAAACCCCCTTCATAAATAGATGAATAAGAAACTATATATAATTCCAGAGATCAAATTTTCTTGGCTTAACATTATTATTTATATTTTTTTCTTATTGGTGAATTCAAGAAATTAAAGATCAATTATGTGGCAGATACGATCTTGGGCTTCTTACAAATTCCGAAGTATGCTTGAGTTAATTCGTCCCGGTATATCTGCTTTCTCATCCTCCATGAATACTGTCTATCACAGAAACTCTAATTCATCAGGTATGCCGATGGCTAAGTTTGGATATGGTTTTCCAAAGCACCAAGGACTGCAGTTGTTCGGCAACACCACCGGTAGCAAAACTTTGACAACATTTGGTACCAACATGGTAAAGGATGGCAATAAGGAGCAAGTTCCACCACCAGTGCCTCCTAAGAACAACATTCTTTATTGGGCAAGATGGGTTTTGGGCTCTATATTAACATTGCTGCTGCCATTTTGGAAGCAATATTGGGGAAAACTACAAAGAATAGAAGGAAAGGTAGAAATGGTTGCTGAAGAGGTGGAAAGTGTGGCAGAGGTGGTGGAAAAGGTAGCAATTAAAGCAGAGAAAGTGTCATCAGAGGCTGCAAATGTACTTCCAGATAATGGAAAACTGAAGGAAACAGCTTTGATTGTAGAACACATTTCAAAAAAAGCAGCCCAAGATGCTCAACTAACTCTGGATATCATTCACAAGGTTTATATATATTTTCCAAACCAATTAATTCTAATTAATTTTGACAAGTAATTCTATGGTATTCCAGGAATACATACCCTCAAACTCATAATAGAATGGACTCCACGTATGTTTACGAGTGTGGATGCATTAAAGCATGACTTCGAAGAATTGGAGACTTTAGTTGAGCCTGTTGTCGATAAGATTGTGGTAAATCATGAATCTGATGGAAAGTAATTAATTTGGGTATTGATCATAATATCATTTTTTTCCTTGTAATGTATTTTCATAATT
TGGGCAACCGCATTTTGCCCATGTGAATCGTACAACTTTTGCGCTTTGTTCTTTCTA\n>XM_010349232.1 PREDICTED: Saimiri boliviensis boliviensis guanylyl cyclase domain containing 1 (GUCD1), transcript variant X2, mRNA \nGGATTGGGCGAGGGGGCGGGGCCACCCGACGCAGAAGCGGCAAATGGCCAGGGCGGGCTTAAATTGGGAGGCTGGGGGCATCTAGAATCAAAGTTTGGGGCGGGGCTTCTAGAAGGGGCGGGGCCTCCAGATTCGAGACCTGGAACGACCGGGGCGGGTCTCGGGGCGGCCCAGCCGCCGCCTCCAGTTCTCCCCACCGCAGCGGCGCCGGCGGCGGTGGCGGCGGAGGAACTCGATACGCACCGACCGTCCTCCCGTCCTAGCCGAAGCGGAAGCTGTAGCCCGCTCTGGGCCGGGGCCATGGGCGCCCCGCGCCGCCCGGGTCATGAGGACGGAGGCGGAGGCAGCGGGGCCGCCGCTCGAGCCCGGGGACTTTGTGCAACTGCCTGTGCCCATCATCCAGCAGCTCTACCACTGGGACTGTGGCCTGGCCTGCTCCAGGATGGTTCTTCGGTACCTGGGCCAGCTGGACGACAGTGAGTTTGAGAGAGCCCTGCAGGAGCTGCAGCTGACCAGGAGCATCTGGACCATTGACCTGGCCTACCTGATGCACCACTTTGGCGTGAGGCACCGCTTCTGTACCCAGACCCTGGGCGTCGACAAGGGCTACAAGAACCAGTCCTTCTACAGGAAGCACTTTGACACAGAGGAGACCCGGGTCAATCAGCTGTTTGCACAAGCCAAGGCCTGCAAGGTGCTGGTGGAGAAATGCACGGTGAGCGTGCAGGACATCCAGGCGCACCTGGCTCAGGGCCATGTAGCCATCGTGCTGGTGAACTCGGGGGTGCTGCACTGTGACCTGTGCTCCAGCCCTGTCAAGTACTGCTGCTTCGCCCCTAGTGGCCACCGCTGCTTCTGCCGCACTCCTGACTACCAGGGCCACTTCATCGTTCTGCGTGGCTATAACCGAGCCACTGGCTGCATCTTCTACAACAATCCAGCCTACGCCGACCGAATGTGCAGCACCAGCATCAGTAACTTTGAGGAGGCCAGAACCAGCTATGGCACAGATGAGGACATCCTCTTTGTCTACTTGGACAGCTGACACCAGGAGCCTGGTGTGCCCAGGCCCTCGGACCCCATCCCCACCCCAGCTGGGCCCACTCAGGATGCCCTGGCCCAGGCCTGGGGCTGCTGGGGCTGGAATGTGGAACTGCAGCCTCAGCCCATCTGGCAGGGCCCCGGGAACTCTGGGAGACTGTGGCACAGCTGCTTTGTCTGCCAGTGCCCTGTGTTGTCATGTCGGTCACCCCAAGCACTTGCTGGCTGCTGGAAGCATCCCCCAAGACCCCAAGCCTGACTCCAGCTGTACCCACAGAAAGTCCAGCTCCAACAGTGCCCTTGTTGCCTTTGAGCCAGACCCAAGGCAAGGGAGAGGCTTTGTCTCCCCACAGACCGCAGGACTGGGCCTGGAGAGAGAAGTCGCTTGACAGATGCCACTTGTCAGGATAGTATGTGAGTGTCTGGAGACAGCATAGCTGACCCCAACCCCCCCAGCACTGAGGACCCCTCCAGGCTCTTCTCTCCTGGAAGTGCTGAAGATGCCTCTGTGCCCCATGGTTGATGACACCACCACTTCCTGCCTACCCATGGGCCCAAGTTTCTGTGGCTGGTTTCAGAGCATCTGGTCCCTGCCACCCAGCATAGACACACCTCACAGCTGCTTTGCCATGCAGAGCCCTGGCCCCTGGGGACTCTTAAGCCCCCCACAGTCCTCCAGGTCCTCCAGCTCTGTCAGATGGAGGGGTCTCGGGTGTGACCTGGGCCTGGATCCCACTGGTAGGCCTGATGGCTGGCAGCAGTGTG
TGCTCTGGAAATAAACAGCAGCTCTAACCCCAGAGGGATCCCTGCACCCAGGAGGCCTCCCAACAGCAGCCTAAATCCTCACAGTGGGGTCTGCCCTGAGATGGGGACCCCCTAGTACTTTAAGGTTGCCTGCTAGGGCCTGTGCTCCAAAGCAACGGGCAGGGGCAGCCTGCAGCTGCCCACCCAGCCTGGTCTTCACACCAGGTTGCACAGGATACTGGGTCTCTTCTATCTTGATGGAGAAGAGGGGTTCCTGCCCAGGATCATACAACACAGCAAATAGCATAGAGCTCTTCCTTCGGTTTTGGTTTTTTTCTTTTTTTTTTTTTTTCCTGGTTGGGATCAGGGGTTGTTTCTTTGAGATTTAAGTTTTCATTTTTGAGGGGTAATGACCTTTAAGTAAAACAGTAATAGCAAGAGTGAAGGTACTTTGGAACCACCAATACCTCTGCACAGGGCAGTTAGCCAGCTCAAGTTCTTTTTTAAAGAAAGGGACTTGGCTGGTGGTTTGAGTACCCACCCCTTCACTTCACAGACAAGGCAGTTGGCCCAGTCTGGGGAGTCTGCCCAGGACAGTGGTGGGGCTGGGCCTTAAACCCCAGTCTATACCTAAAAAACTAAGGGAAATGGATCATTCTCAAAGGGGCAACAGTGACACCATCCCTGCACTCCTGGGTCCTGGTCTTACAGTGCCCAAGGCATGGCATGGTGGCAGCTGGACCCTCCCCCATCAGGTGGCTCTGGTGGTAGAGGTGGGCTCTTTTTAGGAGGGTGCTCGGACCACACAGCCAAATTGCTCCTCAACCCTAGACAAAGCCTTGACCAAGAGGGAGGTGCTGTTAGCTGGGCAGCCCTTCTGGGTTTCAGAGACTCGTGTGGGCTCCAGTCTGGTCTCATCTCCATTGCCTTAATGACAGGTGGCCCAGGAGTACCCATGCACAGCAGCTGTGGGGTGTGGGCATCTTCAGATGTTCTGGTAAAATTGTGAGATTAGCTGTATGAAGGAAACCAGTGGGAGGAAAGGAAGTTTTCAGGATGGCAAGATTTGATTCAGACACAGTGCACATGCTACTAGGGCTGTCACTGGGCAGTGGCCTTCATGGAGAGTGGTACCAGCACCTCAGTCCATCCAGGATATTTAGAAACACTCAGTCTCTGGTCCCAGAGGATGGCTTCTCAGGGCATGCCACAAGTTAAAGTCACCTGCCTGGAAGATGAATGAGAAAGCTGTCCATTCTCAAGACCCATCTGCCTAGGGAGGGTCACAGAGGCAGGATGTAAGCCACACTGTATTGCATTCTTGCATAAGTCATGAAAATGGGGCCAGAGAGGGAGCCTGGACATCAGGGACTTCTGCCCACAGCACATGGCACCCACAGCTGCCCAGCCTGTCTACATGCTGGGGCCCAGCACAGCCCCTGAAGCCACATGGGACAGTGGGCTTTGTTCACTATAGCCACAGGGGGATGAAAGGGATCTTTTACATTGCAGAGATTTTATATATATTTTGTTTGTAATGAGCCATTCTCAATAAATTCTCGCTGCAAAA\n>XM_053281253.1 PREDICTED: Hemicordylus capensis transmembrane and coiled-coil domains 4 (LOC128338576), mRNA 
\nTCCCTCCCGCGGCTGCCGGCCTAGTCGCCTTTTTCTGAGCCTCGGACTGGAGTGAGCGCTGAGCCGGCCCAGAGTGAAGGCAAGGCGGGGGCCGGTCGGAGCCTCGATGCGGCCCCTTTCTCCCTCGAGGACGGGCAGAGGCCGGTGAAGATGGCTGCCGGTCACCACCAGCGCTGGAGGCCTTGGAGAAGGGGGCCGATAGGAGAGCCGGAAACGGAGGAGCCGTCTGCACACGTCGGCCGGCAGCTGGGCGAACCGGGGAAGTTTGCCTACGCCGCTCTTTGTGCTGTATCCTTGGCATCGCTGTTTCCAGAGCAAGCCGAAAGCTCGTATCGGACGGGATTCGTCGAGAGCCTGGTGCGGTGGCTAGACCTCCCGGAAGGCGTCTTGCCTGCGATGCAGGCCTTTGCCGGCGGCTTGGGAGGCGAAGGGACAGACACCTTTGCTCAGATCCTCTTGAAGGACCCCGTCCTGAAAGACAACTCTGACATCATCACCCAAGATCTCGTGGCCTTTTCCCTCAAAGATGGCTACTATGATGCCCGAGCAAGAGTGCTCCTCTCTCACGTCACCTGGCTTTTAAGAATCCCGTTGACTGAGCTGGAGGCCTCGGAGGAACGACTTCTTGAATGCTTGAAAGATGAAGAAGAAGAAGAATCTGCAACGGCGGAGGCATCGCGGAAGAGGAAAGAGAAGAAGAAGAAGCTAAAGCGGTACTTGCTGATCGGTTTGGCGACTATTGGAGGAGGGACGGTGATCGGTCTGACGGGAGGCCTCGCCGCCCCTCTGGTGGCGGCCGGAGCCGCGACCGTCATCGGAAGTGCCGGAGCGGCCGCCCTGGGCTCGACAGCTGGGATCGCTGTCATGGCGTCGCTCTTTGGAGCAGCGGGAGCCGGTCTCACCGGTTACAAGATGAAGAAGCGTGTGGGAGCCATTGAAGAGTTTGAGTTTCTCCCGCTAACTGAGGGGAAGCAACTCCACATCACCATCGCGATCACTGGTTGGCTTTCTACGGGCAAATATGGGAGTTTCACGGCCCCGTGGAATAGCCTGCTGCAGTCGAAAGAGCAGTACTGCTTAGCCTGGGAGTCCAAGTACCTGGTGGAGCTTGGAAACACCCTCGACGCCTTGCTGAACGGGCTGGTGAATGTGGTGGCCCAGGAGGCCCTGAAGTACACGGTATTGTCGGGGATCGTCACCGCCCTGACCTGGCCTGCTTCACTGCTCACAGTCGCCAGCGTGATCGATAACCCCTGGGGTGTGTGTCTTCATCGCTCGGCCGAAGTCGGGAAGCACTTGGCGCAGATTCTGCTCAAGCGGCAACAGGGCAAACGGCCTGTTACGCTGGTTGGATTTAGTCTTGGTGCCAGGGTCATCTACTTCTGCCTCCAGGAAATGGCCAAGGAAGAAGATTGCAAAGGGATCATTGAAGATGTGGTTCTGTTGGGGGCACCCGTGGAAGGAGAAGCCAAGCACTGGAAACCGTTTACCAAGGTCGTTTCGGGCAAGATCATCAACGGCTACTGTAGGGGAGACTGGCTGCTGGGCTTTGTGTACCGGACGTCCTCCGTCCAACTCCACGTTGCCGGACTTCAGCCAGTTGACCTGGACGACCGGAGGATGATCAACGTGGATCTCTCCTCTGTCGTCAGCGGCCACCTGGACTACATGAAGCAGATGGACACGATCCTGAAGGCCGTGGGCCTCAAAACCAAGCAGTGCCGTCTGGAAGAGAGGGGAGATCTCACCCTCCTCTCCGCTGAGCCCAAGGAAAGCCAGGAGGAGGCCCCATGTGTAGACACTCGGGAAGAGCAAAACCTGCTGGGAGGAGGAGAAAGTGGCAGCCATGACGGCGGCAGTGATGACTGCTGGTCATGGGAGCCAGTGCCCAGCCGCGGATCGTGCCCAAGGGAACCTCCAGAGGGGGCAGATTCTGAGCCGAGCAGTCTCCTCGATGCCGAAAGGGACCCACAACTTCCTGGCTTGGAAGACCCCTTC
CCCACCAGCTCCTCAGGAATAACTGGCCACTGCGACCGCTCTGCAAGCCCTCTTTCTCCAACCGTCCGATAATGCACGAGGTGGCAGGGCATGATGGTGGTTGTAGTACTTGCACAGAGTCTGCCATAAATCTCCCACGGGGCTGGCGCCTCTTAGTGCTTGATGGTGGCGAGACCGATCGTGCAGGATTGGGCCAAAGGACTTATTTTTGTAAAAAAAGTATTTCTCCCCCCACAAAACCATGAATTGGGTACCACTGAAAATCTCGCGAGCATGACGGAGGTGCCCGTCCCTTTTATTCTTTTCTGTGGCTTCTGTTAATAGGAGATGCTAGTCCTGGAAGCCAGCAGTTAGTAACTACTGTTCTTCCTCCATGAGCATATCTGGGCCTTTAAAAAGGCCGTCTAAGTTACTTGTATATTGCATTAATTCCTTCTTATGTGATTTCCTCAGTTGATTTCCCCTTAAGTTCTGATATAAACAGAGAGGGGAGAAGGGTATCCTGCTTCCGAATATGGAGGTTCTGTTCTATACTGTCAGTTTTTCAGAACTGTTAGTTACCTAACTAACATATTGACTGTTTTATGTCAGTGTATGTAGCCTAGGGCTGTCTGCTCTGGCTGGCAGACAGGGTCAGATCATTGGCCCATCTAGTTCAGTGTAGCCTACCCTGACGGGCAGACCCTCTTGAGGGTCAGGGGCCTCTTTGAACTGGAGAGGGAACCTGGGAGCTTCTGCATGCAAAGTGTGTGCTCTCCCCACACTCACAGATCTATTACCCATCGCCATATCTTGTGGCAAAGAGTTCCTAAGATTTCCTAAGAACTCTTGTGGCAAAGAGTTCCTAAGATTTAAGTTCAGAGTGAGAAGGGAGAGAGCTTGCAGGAGACTTAACAAGGTCTGTGTAACCGAAAAAGACACACCCCTATTTATTTACAAATTCACAGGGTTCTGTACGTGGCAGAAAGGTGGGATATAAAATGCAACAAAGCTTTGCTTGGCTTATGGGGCCAAACCAAATAATGCATGTGAAGTATCCTTGCGTACTAAGGAAAGTCCTGTAGTCCTGATCCAGAACTTGATTCCGATCCATCGGTAGATCTCGTAGCTAGACCTCCAATCAGAACTCTGTTTCCCCAGCCCCCCGTATGGCAGATCTAGCCTTGCCATTGGACCCAATTTCCATTTGCAACCCACTTGTTGTCATTTCATCCTTCGGGTCTACCTGGAATGCAAGGCGGGACCATGGCAGCTTGGGCAGGATTCCTGTGAAGCTTTGTTAAAAGCAATTCCAGTTTCTGTGAACTGCGAGCGGAAGGTGGGCTTCCGGTCCGCTACTGTTTAAGAAAAATATTTATTTTGTCAGGAACACTGAAAGGTTGGGCATTAAGAGGATTTGCAGGAGAGATGTGTGGGTGTGCCTGCTGGGAAATAAAGCAATTGTATTAAT\n>XM_029611915.1 PREDICTED: Rhinatrema bivittatum neurofibromin 1 (NF1), transcript variant X2, mRNA 
\nACTTCCGGTGTGGTGTCATGGCGTCTTCGCTGTGATGGCTGAGGAGAGGCTGCGATAACAGGGGAGGGGGGGAAGCGAGAAGAAGGGGAAGAGGGAATTAAAATAATAAGAATAACCACCCCCTCCTCCAAGCAAGCCAAAAAATAAGAGCCCTTCCAAAAACAGCAAAATAAAAAGCAACGTAGTCGCGGAGGTGGGGGGTGAAAACCTCCCACCCCTTTCTTCCCCTCCCCCGAGGGAAAGAAGGTACTTTTAAACAATATCTAAACATATATATTATATATATATGTAATATAGGAAGGTCGAATCCAGGCGGCCCCGGGGGTGTTTCCACTCCCCTGCCCGGGCTCTCCCCGGGCTGAGATGGCGGCGCACAAACCGGTGGAATGGATCCAGGCCGTCGTGAATCGGTTCGATGAGCAGCTTCCAATAAAAGCGGGACAGCAGACCACGCACACCAAAGTCAGCATGGAGCACAATAAGGAATGCCTCATTAACATTTCCAAGTACAAGTTTTCTCTGGTCATAAGTGGACTCACAAATATCTTAAAAAATGTAAACAACATGAGAATATTTGGAGAAACTGCTGAGAAGAATCTCTACCTGTCCCAGCTGATTATATTGGATACTCTGGAAAAATGTCTTGCAGGGCAACCGAAGGACAGCATGCGGCTAGATGAGACGATGCTGGTGAAACAGCTTCTCCCCGAGATCTGCCACTTTATCTACACCTACCGTGAGGGAAACCAGCACGCAGCCGAACTCCGCAACTCCGCCTCTGGCGTCCTTTTCTCTCTCAGCTCCAATAACTTCAATGCTGTCTTCAGCCGCATTTCTACCAGATTACAGGAACTGACCGTGTGCTCGGAAGAGAACGTTGACATTCATGATATTGAACTGATGCAGTATATCAACGTGGACTGTGCAAAGTTAAAACGATTGTTACAGGAGGCAGCGTTTAAATTTAAATCTCTCAAGAAAGTTGCTCAGCTGGGAGTTATAAACAGTCTGGAAAAAGCATTTTGGAACTGGGTAGAAAATTATCCAGATGAATTTACAAAGCTGTATCAGAGACCACAGGCTGATATGGCGGATTGCTCAGAGAAGTTGTTTGACCAGGTGGACAGCTTTGCTGAAAGCACGAAACGCAAAGCGGCGGTTTGGCCCCTTCAGATCATTCTCCTCGTCTTGTGTCCTGAAATCATACAAGAAATCTCCAAAGATGTGGTGGAGGACAGCAAAATGAACAAGAAGTTGTTTCTGGAAAACCTTAGAAAGGCATTAGCTGTGCATGGTGGAAGCAGACAGCTGACTGACAGTGCTGTCATTGCCAGTGTTAAGCTCTGCAAAGCATCCACCTACATCAACTGGGAAGATCACTCCGTCATTTTCCACCTTGTACAGTCCGTTGTGATAGATCTAAAGAATTTGCTATTCAATCCAAGCAAACCTTTTTCCAGAGGTGCCAGCAATCAGAATGCCGATGTGGATCTAATGATCGACTGTTTGGTTTCCTGCTTTCGCATTAATCCTCACAATAACCAGCATTTTAAGATCTGCTTAGCACAGAACTCCCCATCACCATTTCATTATGTGCTTGTGAATTCTCTACACAGAATCATTACAAATTCGGCCCTGGACTGGTGGCCCAAGATCGATACTGTGTACTGTCACTCAGGAGAGCTCCGCAGCATGTTTGCAGAAACCCTTAAAAGTGCCATGCAAGTCTGTGGCACGCATACCACCACCCGCCTGACTCAGAGTCTTCCATTCAAAGACAAAAGAACAAATCGTAAATTTAAAGACAAACCTACAGACTTGGAAACCAGACTTGGAAACCAGAAGTACCTGTTGCTGTCCATGGTGAAGTTGATTCATGGAGATCCAAAGCTTTTGCTTTATAACCCAGGCAAGGTAGGACATGACACCCAAAACAGCACTACTGAGTTAATTACCGGACTTATGCAGCTTGTACCACAGTCCAACATGCCAGAAATA
GCACAAGAAGCCATGGAGGCCTTGTTAGTCCTTCATCAGCCAGAAAGCATTGAGCTGTGGAATCCAGAGGCACCAGTAGAAACGTTTTGGGAAATTAGTTCAAAAATGCTTTATTATATCTGCAAGACATTAATTGGTGCCAACATGCTGAACAGCACAGAAATTCTCAAGTGGCTGCGAGAGATTTTTATTTGCAGAAACAAATTTCTGCTCAAGAACAAGAGCGCCACAGCGGGCAGCAGCATTCCAATCTGTCGCCAGGCACAGGCCAAGTTAGAGGTTGCTCTCTACATGTTCCTGTGGAGTCCTGACATCGAGGCTGTCCTTGTTGCCATGTCCTGCTTCCGTCACCTCTGCGAAGAAGCGGATATCCGGTGTGGGGTCGACGAAGTGTCTGTGCATAATTTTTTGCCAAACTACAACACTTTCATGGAGTTTGCATCTGTCAGCAACATGATGTCAACAGGGCGAGCAGCTCTTCAGAAGAGAGTGATGGCATTATTGAGGCGCATAGAACATCCAACAGCTGGAAACACAGAGGCTTGGGAAGATACACATACGAAATGGGAGGTGGCTACCAAACACATTCTTAACTACCCGAAAACAAAATTGGAGGATGGCCAATGCACTGAAAGTCTTCACAAAACCATCGTGAAGAGGCGAATGTCTCATGTTAGCGGAGGTGGGTCAATAGATTTGTCTGACACGGACTCTCTGCAGGAATGGATCAACATGACAGGCTTCCTATGTGCTCTGGGCGGTGTCTGCCTGCAACATCGCAGCAGCGCAGGCTTGGCCACGTACAGCCCGCCCATGGGACCCATCAGCGAACGCAAGGGCTCCATGATCTCCATGGTGTCCACCGAAGGCAACACAGAGACACCCGTCAGCAAATTTTTGGATAGGCTGCTTTCCTTGATGGTGTGCAACCATGAAAAAGTGGGAATTCAGATTCGGTCGAACATTAAAGATCTGGTGGGCTTGGAACTGAGCCCTGCGCTTTATCCCATGCTATTTAACAAAATGAAGAATAATATCAGCAAATTCTTTGACTTACAAGGACAGGTTTTGCTGACTGACACCAATACGCAGTTTGTAGAGCAGACCATAGCTATATTGAAGAATTTGCTTGATAATCCTACAGAGGGCAGTTCTGAGCACCTGGGACAAGCTAGCATTGAGACCATGATGCTGAATCTAGTTCGATATGTTCGTGTGCTTGGAAATTTAGTGCATGCCATCCAGATAAAGACAAAACTCTGCCAGCTCGTAGAAGTGATGATGGAAAGGCGAGACGATCTTTCCTTCTGCCAAGAAATGAAATTTCGGAATAAGATGGTGGAATATTTAACAGACTGGGTTATGGGAACGTCTAACCAAGCAGCGGATGAGGATGTAAAATGCCTAACCAGAGACTTGGACCAGGCCAGCATGGAAGCAGTAGTCTCTCTCCTTGCTGGTTTACCTCTGCAACCTGAAGAAGGAGATGGAGTAGAGCTGATGGAAGCCAAGTCCCAGTTATTCCTCAAGTATTTTACTCTCTTTATGAATCTTCTAAATGACTGCAGCGAAGTTGAAGATGATGGTACTCAGACTGGTGGAAGGAAACGAGGGATGTCTCGGAGGCTAGCTTCCCTGCGACACTGTACTGTTCTTGCTATGTCAAATTTACTGAATGCTAATGTGGACAGTGGTCTCATGCACTCAATAGGTTTGGGCTATCACAAGGATTTGCAGACAAGAGCCACATTTATGGAAGTCCTTACCAAAATCCTCCAGCAGGGGACTGAGTTTGACACCCTGGCAGAAACTGTGCTTGCGGATCGTTTTGAGAGATTGGTAGAATTGGTCACTATGATGGGCGACCAAGGAGAACTGCCCATCGCCATGGCTCTAGCCAATGTGGTGCCTTGTTCACAGTGGGATGAGCTAGCCCGTGTCCTTGTGACCCTTTTTGATTCACGACATCTGCTTTACCAGCTTCTCTGGAACATGTTTTC
AAAGGAGGTTGAACTGGCAGACTCCATGCAGACCCTTTTCCGGGGAAACAGCTTGGCCAGTAAAATAATGACTTTCTGCTTTAAGGTGTATGGTGCTACATATCTGCAAAAGTTGCTGGAGCCTCTGCTCAGGGCCATTATCACATCACCTGAGTGGCAGCACGTCAGCTTCGAAGTGGATTCCACAAGGCTGGATGGGATGGAAAGTCTGGATGAAAACCAGCGCTGGCTGCTGCAGATGACAGAGAAATTCTTCCATTCAATAATTACTTCCTCTTCAGAGTTTCCTCCCCAGCTGCGAAGTGTCTGCCACTGTCTGTACCAGGCAACTTGCCACTCTCTTCTGAGTAAAGCTTCCGTAAAAGAAAAAAAGGAAAACAAAAAATCAGTTGTCAGCCAGCGATTCCCCCAGAACAGCATTGGGGCAGTCGGCAGCGCCATGTTCCTCAGGTTCATTAACCCTGCAATCGTCTCTCCATACGAAGCAGGAATCTTGGACAAAAAGCCACCACCTAGAATTGAACGGGGCCTAAAGTTGATGTCAAAGATCCTTCAGAGTATTGCCAATCACGTCCTGTTTACAAAAGAAGAACACATGCGCCCTTTTAATGACTTTGTGAAAAGTAACTTTGATGCAGCTCGAAGGTTTTTCTTTGACATTGCTTCGGATTGCCCAGCTAGTGATACAGTCAATCATAGCCTGTCCTTTATCAGCGATGGTAATGTGCTGGCTTTGCATAGGTTGCTTTGGAACAATCAGGAGAAAATTGGCCAGTATCTCTCTAGCAACAGGGACCATAAAGCAGTGGGCAGGAGACCTTTTGACAAGATGGCAACTCTGCTCGCATACCTGGGACCTCCAGAACACAAACCTGTAGCAGACACACACTGGTCCAGCCTAAATCTCACCAGTTCCAAATTTGAGGAATTCATGACCAGGCACCAGGTACATGAAAAAGAGGAGTTTAAGGCGTTAAAAACTCTCAATATCTTCTATCAAGCAGGGACATCAAAAGCTGGAAATCCGGTATTCTATTATATTGCCAGGCGATTCAAGACTGGCCAGATAAATGGGGACTTGCTAATATACCACGTGTTGCTGACTTTGAAGCCATACTACGCCAAGCCATATGAGATTGTAGTGGACCTCACCCACGCTGGGCCCAGCAATCGCTTTAAGACTGACTTCCTTTCCAAGTGGTTTGTCGTTTTCCCTGGGTTTGCATATGAAAATGTGACAGCAGTTTACATCTACAACTGTAACTCTTGGGTGCGGGAGTACACAAAGTATCACGAGAGACTGCTCACCGGCTTGAAAGGCAGCAAGAGACTAATTTTCATTGACCCCTCGGGGAAGTTGGCAGAGCACATTGAGCATGACAAGCAGAAACTACCAGCTGCCACTCTAGCTTTGGAGGAAGACTTGAAGGTGTTTCATAATGCTCTCAAACTGGCGCACAAAGACACCAAAGTTTCTATTAAGGTTGGTTCCACAGCAGTTCAGGTGACATCTGCTGAGCGGACAAGAGTCCTGGGTCAGTCAGTTTTTCTGAATGATATTTACTATGCCTCCGAGATTGAGGAGATCTGCCTCGTGGATGAGAACCAGTTCACGCTAACCATTGCCAACCAGGGAACACCTCTGACTTTCATGCATCAGGAGTGTGAAGCCATCGTCCAGTCTATCATTCACATAAGGACTCGATGGGAGTTGTCACAGCCCGATTCCATTCCACAACATACTAAAATCCGTCCAAAAGATGTGCCTGGAACATTGCTCAACATTGCATTGCTTAACCTAGGAAGCTCAGATCCAAGTTTAAGGTCTGCTGCCTATAATCTTCTGTGTGCCTTAACATGTACCTTTAATTTAAAGATTGAAGGCCAGTTACTGGAGACTTCAGGTCTGTGTATCCCTGCCAACAACACCTTGTTCATTGTCTCCATAAGTAAGACTTTGGCAGCTAATGAGCCCCATCTCACCTTAGAGTTTTTGGAAG
AGTGCATTTCCGGATTCAGCAAATCCAGCATTGAACTAAAGCACCTTTGCCTGGAGTACATGACCCCCTGGTTACTAAATCTGGTGCGCTTCTGTAAACTCACCGATGATGCCAAACGGCAGCGAGTCAGCGCTATTCTGGATAAGCTGATAACCATGACAATCAATGAAAAGCAGATGTATCCTTCCATTCAGGCAAAGATATGGGGAAGTCTTGGACAGATCACAGATTTGCTGGATGTGGTTCTGGACAGTTTCATTAAAACCAGTGCCACAGGTGGTTTGGGATCCATAAAGGCTGAAGTTATGGCAGACACAGCTGTAGCTCTGGCTTCAGGCAATGTGAAATTAGTCTCAAGCAAGGTGATTGGAAGAATGTGCAAAATAATTGATAAGACCTGTCTGTCGCCTACACCTACATTAGAACAGCACCTGATGTGGGATGATATTGCCATCCTGGCCCGGTACATGCTAATGCTGTCCTTCAACAATTCACTGGATGTGGCAGCGCACCTTCCCTACCTCTTCCATGTTGTCACTTTATTGGTGGCCACAGGTCCTCTGTCTCTGAGAGCTTCCACCCATGGCCTGGTCATCAATATAATTCATTCCCTGTGTACCTGCTCACAGTTGAACTTCAGCGAGGAGACCAAGCAAGTTTTGAGACTCAGTCTGACGGAGTTCTCATTGCCCAAATTCTATTTGCTGTTTGGAATTAGTAAAGTGAAGTCAGCCGCTGTCATAGCCTTCCGATCCAGCTACAGGGATAGGTCGTTCTCTCCTGGCTCCTACGAGAGAGAAACGTTTGCTTTGACGTCGCTGGAGACGGTCACAGAAGCTCTGCTGGAGATAATGGAGGCTTGTATGAGAGATATTCCAGCATGCAAGTGGCTAGACCAATGGACAGAGCTAGCACAAAAGTTTGCATTTCAGTATAATCCATCCCTGCAGCCCAGGGCGCTAGTAGTCTTTGGCTGTATCAGTAAACGAGTGTCACATGGGCAGATAAAACAGATCATCCGCATCCTTAGTAAGGGACTGGAGAGCTGTCTTAAAGGCCCTGATAATTATAACAGTCAGGTTTTAATAGAAGCCACAGTTATAGCTTTAACCAAACTACAGCCACTTCTGAATAAGGACTCCTCTATGCACAAAGCCCTCTTCTGGGTGGCTATGGCGGTGCTGCAGCTGGACGAAGTGAATCTGTATTCCGCAGGCACAGCCCTCCTCGAACAAAACCTACACACATTAGATAGCCTTCATGTGTTCAATGACAAGAGCCCTGAAGAAGTATTCATGGAAATCAGGAGGCCCCTGGAATGGCACTGCAAGCAAATGGATCATTTCGTCGGGCTCAATTTCAACTCCAACTTTAATTTTGCACTAGTAGGACACCTTCTGAAAGGTTACAGGCATCCTTCTCCTACCACAGTAGCACGGACGGTCCGCATTCTACACACATTGCTGGCGCTAGTTCACAAACACAGGAATTGTGACAAGTTTGAGGTGAATACCCAGAGTGTGGCTTATTTGGCAGCTTTACTCACAGTGTCTGAAGAGGTCAGAAGTCGCTGCAGCCTAAAGCACAGGAAATCTCTCTTATTGGCAGATGTTTCACTGGAAAATGTTCCTATGGATACATATCCCATGCATCACAGTGACCCAAGCTACAGGACATTGAAGGAAAACCAGCCGTGGTCCTCCCCAAAGGGTTCAGGCATCCATCTTGCTGCAAATTACCCAACAGTGGGGCAGATTAGTCCCCGAACCCGAAAATCTATGAGTCTGGATATGGGGCAGCCATCACAGGCTAACACTAAAAAGCTTCTAGACTGCTGCTGTAACTCTGTTAAGTTTTGGCTAGGCGTGGCTGAAAACGGGATATTTGTTCCAGTCCACTTTCCTGGTACAAGGAAAAGCTTTGATCATTTGATATCGGACACCAAGGCTCCAAAAAGACAAGAGATTGAGTCTGGGATCACTACACCTCCCAAAATGAGA
AGAGTTGCAGAGAGTGACTACGAAATGGAAACCCAGAGAATAGCATCGCCCCAACAGCACCCTCACCTGCGCAAAGTCTCAGTGTCCGAGTCCAATGTGCTTCTGGATGAAGAGGTCCTAACAGACCCCAAAATCCAAGCTCTGCTGCTTACCGTCCTTGCTACACTGGTAAAGTACACTACAGACGAATTTGACCAGCGAATTCTTTATGAGTACTTAGCAGAAGCGAGCGTGGTCTTCCCTAAAGTTTTTCCTGTCGTGCACAATCTGTTGGACTCCAAGATTAATACCCTTTTGTCACTGTGCCAAGATCCAAATTTACTGAATCCAATTCATGGGATTGTACAGAGTGTGGTTTACCATGAAGAGTCCCCGCCCCCATACCAGCCATCCTACTTACAAAGTTTTGGTTTTAACGGTTTATGGAGGTTTGCTGGGCCATTTTCAAAGCAAACACAAATTCCAGAAGATGCTGAACTCATTGTAAAGTTTCTGGATGCCTTGATCGACATGTATTTGCCTGGAATAGATGAGGAAACCAGCGAGGAGTCCCTCCTGACTCCCACATCTCCTTACCCTCCTGCCGTGCAGAGCCAGCTCAGTATTACTGCCAACCTGAACCTTTCCAATTCCATGACCTCGCTTGCCACCTCCCAGCATTCCCCAGCTTCTCTGCCTTGCTCTAAATCAGCAGTTTTCATGCAGCCCCTCGCTCATCAAGGAATCGACAAAGAGAACGTGGAACTCTCACCCACGACGGGACACAGTAACAGTGGCAGGACGCGTCATGGATCTGCGAGCCAGGTGCAGAAGCAGCGGAGTGCTGGCAGCTTCAAACGGCATATCATTAAAAAGATTGTGTGATGTTTGCATGGGGGAGAGGGGTTTTAGAGAGAAAAAGCATACAAGAAACCAAGAAAAAGACTTCTGCTTGTGAGCTTCTCACCAGTGACCCCTACCAGTCAGGATGCTGCACTTAACTTTTAATGTCACCGTACAGTCAGCCATGTTGCCAAAAGAACAACTCTTTGATGTATTGCCTGAATTAACATAGTTTAATGCCTCCTTCAGGTTTCTTCTGTTTCTCTTTGTTCTTTTCATTTTAAAGCAGTGTTCCAGAACCATTGTAGAAAAATTGTTCGTAGATCCCAAGGTTCCAGAATGAAGAACTTTGCAGCTAAAGAAAGCACTGAATCTGCTTCAGTACCTAAACTACAGAAGCCATTTTTTTTTTATTTTTTTTTTTTAGAGATGGTTCTCTGGCTTTTTCTTCCTTGCCTTGCTTTTTTAATTTTGTTTTTGTTTATAAAAAGGAAAGTGTTAATGCTGAATTATTTTTGCACACTTTTCAAAATGGAAAAAACAATAGAGGGATAAATCCTGTTCTTAATGGAAACCCCTTTTAGACTTTTTAGTAGTCCTCTTTTATTTCTTTTTTCTTTTTTACCTGGAAATGAATCTGTAAAAGTTGCAATTGTTCAACTGTGGGCCTAACTAACCAGAGATTGTGCACCTTTAAATAATGTAACTACTTTATCATTTATGGTGGAATTCATGGGAATATAAAACTCTGGCATCAACAAAATCAGCATTTACTCCTTGATACCTGTCAGTTTCTCTAGTGTTCATTTATATAAGGCAAAACTGTTTGTCCCCCTGTTTTTATTGTCTGTAACATTTTAATGGAAAATTGCAGGGTTTTTTGAAAGAGTGAGGGGTTCCAATTTTCAGTGTTAGTTGCTGAGCTGTTTCTCTTCCTGAGTTTGTAGATAATGGTTAGGGTTAAGTCTCAACGTACCCTGCTGCCAGAATGGAATGGTTTGTTAATGCAGGTGTAGAGAATTCAAGTAATTTTTTTCCAGCAATTTCTGAAAACTTCTCTGTGAAGACCTGTTATGACAGCCTCCTGAAGGGAGATGGTAGTTTAAATTTTCTATCTGTGTTTTCCTGGGGGTTCCCCTCAAAACAAAAATAACTACTGGGAGAATTTAGTTCAAAAT
AACTAATCCCCCTAAATTAATTATTTAATAAGCTTGAAAGCAAGGAGCAAAATACTGATTTTATCATGCCTCTGTTCATGTGTTCTGAATGTAGATGCACCTGCCTGAAGCAATGCTGCGCAATCTTGTTTTTTTTTAAGCAAACTAATCTGTTTTAACCAATTTATATCTGCACTAAAACACATTAGAAGGCGAGAACTGACATCTGTGGTGACACTTTGAATAGAAAAGACATTTGAGACTATTTGTTCATCCAATGTCGTCCTGGGTTTTTTTTTTGTTTGTTTTGGTGCCCCTTAAGTTTAATAGATTCTTCCCCCGGGGACATTGCAAGCAGAATAAATACAGGATTAGGCAATGTGGGAGTTAGAAGCATTACGTCCATGCAGCTCAGCCCAAAAATCAACGCATGTATTATGCCCACATAAATGCAAGATGGAACGGTACATGACCGGAGCGGGCTTAACAAAAAATCCGCTTCATGATGTCAAGCTCTCCCAGTCAAGAATTCTGGCAGTACAGTTTGTCTTATCGCCAGACTTTCCAATCAACATCCACTTATGCTGTAGAATAATCAGAAATTCTAAGAATCACTTTAGAAACATTTTGGGGGTTTATAATTAAACTGAAAACCACATTCTATCACTGTGAAAGCCGTGTCAACCTAGCATAGTATAATGGCAGTGGATGACTGTCCTGGTATACTGCTGTTAAGGTTAATATGTACTATGGAATAGGGCAAGTGGTTAAAATGCTATAATGGACGAAAATGTAAACATTCTGATCATGGAGATAAATACACGTTTGACAGCTATGAGTCAAGGTCATGTTATTTAGGTGCTCATTTTTAGATTGACTGTATTTACTGCTTTAACAACATCTATTCATGGCCCCAGTATAGTACTAAAATTACAAAAAGCTTTAAAAAAAAAAAAAAAAAAAAAAAAAGTATATTGTTAGTGTATTTCAGTAAATCAAATTCCACAGCTAAATTACTAGAAAAAAGGTACAATAAAGTGTTCAGATTGTATTTCTATAGCACATAACACACTTATTCAGACACAGTAATCAGTTTAACATTTATGAATGTAAAAAAATGCCTTTATTTTATTGTCACAAACAAATAACTTAATTTCTTTTTAATTTGTTTACAGTCCTGGAAAAACTATGAACAGAAACATAATATGCAAATATAGTTTGCCAAAATAAGTTTTAAAAAACAAACAAAAAACCCCGTAGTATTAGTTGTGGCTATTTTGAAGTAGCTGACATGTTCAAAATATTGAAGGTTTGTGCAATTAACCAAACTTTTTGTTTTTTATTATTATTATTATTATTACTGTTATTGATAATGTAGAAGTTGCAAAATAGAAATAATTAAAATGCTACAAAATGTATGAAGGGTATTAAAAGGTGAATGAAGTTAGGAATAGAGCAGGGACCCAGTGGCAGGTGCTATACCCATTAGTTTATTTTCCCCAGTCCTGAGATTTCACATGTGAAAACCTACTGTACTGTACACGAGATTCTACTGTAGATTGAATCAAAATTTATTGAAAACATGTACCAGTTTAGCTCGTAAGTGATTGCGTACCAAACTGTATTTTCTCTTTTTTAAAATTTTCATTTCAAATTGAGCAGGAAAGAAAGCAGGGGGAGAAAATGTAATAGATGCCTTGATCTGATTTTTCAAAACACTACAATTTTCTGAAACTGTTGCAAGATTGGATTTCTTTAGTAACCTATTCAAATCATTGACTCTTTCCATTGTGATTCTTAGTGTTAAAAGTGCACGTTGCTTAATCATAGGCTGAGTTGCACAAAAAAATGTCAATTTGGAATGTACACCCTCCACCCTTCCTCCCCCCTCTATGAAATTTAAAAAATATCAGACAACTAAAATTGCTTCTCACTATTGGAATCCAAAAAAATGACCAGGAAATGTTTCACTTGTCCTAACAAAACTTGTACAAAACAAAATGCACACAGCATAACTAACA
TTTACTTAAAAAAAAAAAAAAGCAAATGAACATGTCCATTACTGGTACCTGAGATCT\n>XR_005095104.1 PREDICTED: Pollicipes pollicipes uncharacterized LOC119106218 (LOC119106218), ncRNA \nAAGAAATGAACTTCAACTGCCTGATCTGTGGAACCAGATGCAAGCTTCACAAGAGCCAGCTTAGTTCCAGGCTGGGAGAGTGGCAACAGGAGTGGTCCTCCAAGGAAGCTGATCAGGGACTCGTTTGGATACTGGATCTGGATCTGAACTGCTTGGACGAGGAGCAGTGCCTGTGTCCAAAGTGCTCACAACTCTTGCGTGATCTTCGGAGCTATGAAGCTAAGGTCACCGAAATCCGAACTGAGCTCATTCAGAGACATGAGGGTTGCATGCATACAGACACTCCAGGATCTGTAGACATCACTGTCACAGAAGCGTCTGTGAGGCATAAGCCGAACTCGGCGAGGCCAGAGCCGGAGCTGGAGCTAGAGCCAGAACCAGATCCAGAGCCGGAGCCAGAGCCAGATCCGGAGCCAGAACCAGAGCCAGAGCCAGCGCCCTGCCTGCGGCGAAGCTCTCGTCGTTGTGGACGACCGCCGGCGCCGGG\n>XM_024031699.1 PREDICTED: Quercus suber uncharacterized LOC111999568 (LOC111999568), partial mRNA \nAGTGCAGACCTGCGTTGGAAGCCACCTGACTTGGGTGTCTATAAAGTCAACTTTGATGGGGCTTTATTTATGGATCAGAGGTGTGCTGGTTTAGGGGTGGTTGTTAGGGATTCAGCTGGGCTTGTTATTGCTGCTTTAAGCCAGAGAGTGAGGCTGCCAGGATCGGTTGATGTGGTGGAGGCCTTGGCAGCTCGTAGGGCAATGTGTTTTGCTCAGGAACTTAGCCTTCATCATGTGGTGATTGAAGGGGACTCTTTGCGAGTTATTCAAGCCATTAACAACACTAGGCCAGTGCAGACTTTGTATGGACACATTATTGACGAAATTAGACTTTTATCTTCGTCAGCTAATTGTAGTTTTTCGCATTTTAATCGGAATGGCAATAAGTTAGCTCATGCCCTTGCTAGACGAGCAATTTTATCTGCTGATACTGATGTGTGGATAGAAGAACTTCTATAG\n>XR_001602060.1 PREDICTED: Miniopterus natalensis uncharacterized LOC107525510 (LOC107525510), ncRNA 
\nTCACGGGCAGCGGGAGTAAAACCGCGGGCGCTGGAAGGGGCAGAGTGGTGAGGGCTTCTGAAGGCGCAGCCGCGCTCCCCGCGGCCCGGCTGAGCGTCCACCAGGAGCTCGCGCCAGGCCTTCCCGGCTGGGCCGGCCGAGGGCAGCCAGAGCTGTGTGATGACCCGGTTCCAGCTCACACCGCCTCGTGCGCCCGGTGTCGGTGACTGAGCAGCTGCCACAGGGCTTCCCAGTTCTGGAGGCTGGAAGTCCAAGATCAAGTGTTGGCAGAGTTGGTCTCTGCTCACTCTAGCGAAGGTTAGCCACCCTGTCATGAGGACATTCAGCACCCCCTTGAGAAGTCCATGTGTGCCAATGTCCATGTGTGCCAACGTCCACGTGGAAAGGAGCTAATTCACCAGCAACAACTTTCCAGCCAGCTGCAGCTCCAATAAAGGCGAAACCACCGGCCACCCTCCCTCTGGATCTGAATGCTTTCAAGGAACTATTTATTGAGACTGAGCAAGGACTACTTTCTCTGGTTTTCAAATATGTTTAACACACCAATCAATGTGGCACCTTGTTAATCATTTCACTCAACCAATCCTCATCGAGCACCGAAATACACAGAGCACAATCCCCAACAGTGAGGTTCAAGGTGGTGAAACCCCATCACTGCCATAGGAGCTTCCTGCCCAGTGGATTCGAATTACAGAATACAATATAATCAGGTAATAATCACCAAAAACATCAGGTCTAGTTTTACTCATTTACCAAAGGCGTGAGAAAGCTGGGTGTGCCCTGGGA\n>KP885581.1 Homo sapiens isolate SLS040 tRNA-Pro (trnP) gene and control region, partial sequence; mitochondrial \nATTCTAATTTAAACTATTCTCTGTTCTTTCATGGGGAAGCAGATTTGGGTACCACCCAAGTATTGACTCACCCATCAACAACCGCTATGTATTTCGTACATTACTGCCAGCCACCATGAATATTGTACGGTACCATAAATACTTGACCACCTGTAGTACATAAAAACCCAATCCACATCAAAACCCCCCCCCCATGCTTACAAGCAAGTACAGCAATCAACCTTCAACTATCACACATCAACTGCAACTCCAAAGCCACCCCTCACCCACTAGGATACCAACAAACCTACCCACCCTTAACAGTACATAGCACATAAAGCCATTTACCGTACATAGCACATTACAGTCAAATCCCTTCTCGTCCCCATGGATGACCCCCCTCAGATAGGGGTCCCTTGACCACCATCCTCCGTGAAATCAATATCCCGCACAAGAGTGCTACTCTCCTCGCTCCGGGCCCATAACACTTGGGGGTAGCTAAAGTGAACTGTATCCGACATCTGGTTCCTACTTCAGGGCCATAAAGCCTAAATAGCCCAC\n>XR_003958643.2 PREDICTED: Taeniopygia guttata SFT2 domain containing 2 (SFT2D2), transcript variant X1, misc_RNA 
\nGTGGGCGCGGTGGTTGCCGGGGCTGGTAGTCCCTGGGGAGGGCAGGGCATTCCGGCCGGCCGGGCGGGGTGCGGAGCCATGGACAAGCTGAAGCGGGTGCTGAGCGGCCGCGACGCGGAGGAGCCGAGCGGCCTGGCCGAGGTTATCGATGCGACTTCCTTAGGTTGGGGCACCCGAGTGAAAGGTTTCATTGCGTGTTTTGCGATCGGATGTCTGTGCTCGATCTTGGGTAGTTGTCTGCTATGGATACCAAAGAAAGGGCTGGTATTCTTTGCGGTGTTTTATACCCTGGGGAATATTGCATCCATTGGGAGCACCATGTTTCTTATGGGACCAATGAAACAATTGAAGCGGATGTTTGAGCCCACACGTTTGATTGCTACTATTGTTATGCTATTGTGCCTCATACTAACACTGTGTTCTGCTTTCTGGTGGCGTAAGGCAGGACTCGCGCTGCTTTTCTGCATCTTACAGTTTTTTGCCATGGCATGGTACAGCATTTCCTTCATACCATATGCGAGGTTGGAAAGATGGAAAGATGTGTCAGTGGTGAACTCTGCCTTCTGCTACATACAACATAAATTGCTCTTAGGCTGAACTCTTAGAGTTGAAACAACCTTCCCCATGCTGAGAATAGTAATTGGGCTGTTCCCACTAACCAACTACAGCTCCTTCAGTTAGAGTCTGCACCAGCATGAATGCAATTTCCATGCATTGTTTCAGTCTGGAAATGAAACAATTTTCATTAATGG\n>KJ543947.1 Bacterium AM0179 16S ribosomal RNA gene, partial sequence \nTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGAAAGTCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAACTCTGTTGGTAGAGAAGAACGTTGGTGAGAGTGGAAAGCTCATCAAGTGACGGTAACTACCCAGAAAGGGACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTCCCGAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGTGGTTTATTAAGTCTGGTGTAAAAGGCAGTGGCTCAACCATTGTATGCATTGGAAACTGGTAGACTTGAGTGCAGGAGAGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAGGAACACCGGTGGCGAAAGCGGCTCTCTGGCCTGTAACTGACACTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAGATGTAGGGAGCTATAAGTTCTCTGTATCGCAGCTAACGCAATAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATACTCGTGCTATTCCTAGAGATAGGAAGTTCCTTCGGGACACGGGATACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATTGTTAGTTGCCATCATTAAGTTGGGCACTCTAACGAGACTGCCGGTGATAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGATGGTACAACGAGTCGCGAGACAGTGATGTTTAGCTAATCTCTTAAAACCATTCTCAGTTCGGATTGTAGGCTGCAACTCGCCTACATGAAGTCGGAATCGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGG\n>XM_007779277.1 Coniosporium apollinis CBS 100218 hypothetical protein partial mRNA 
\nATGTCGGGAATCAAATCCGCCGCTGCCGTAGGACTTACTCTCCTTGCCAATCTTGTTTTGGCCCAAGAAGTTATCATCAACGGTGTAGTCCAACAAGATGTCTTCTTCTACGGTCAGAGTCCACCGGTCTATCCATCACCTGATGCTGAGGGTGACGGCCGCTGGGGCGACGCCTTGTCAAGCGCTCGGGCGATCGTTGCTCAAATGACACTTGAGGAAAAGGTGAACATCACCGGAGGGTTCTCTAACACCACGAATGGATGCGGTGGAAACATCCCGGCCATCGAACGCCTGAACTTTCCTGGAATGTGCTTGCAGGATGGCCCGAATGGTGTGAGAGAGACTGATTTCGTCAATGGCTACGCTGTGGGCATTCACGTTGGTGCAAGCTGGAATCGGAATCTGACTTACGCGCGCGGTTCTGCGATCGGTGGCGAATTCAGAAGGAAAGGTGCCACAATCGCCTTAGGCCCTATGGTCGGACCGTTGGGAAGGATTGCTCTTGGTGGTCGCAACTGGGAGGGATTCAGCAACGATCCCTACATCAGCGGTATCCTTGCTGCTGAAACAGTTAGGGGAATCCAAGACAGAGGCGTAATTGCTTCCACCAAGCACTTTGTTGGAAACGAGCAAGAGCTTCTGCGAAACCCCCGCCCAGATCTCAGCAACCGCAACAAGACTATTGAAACTTCGTCTTCGAACATGGACGATGCGACGATGCACGAACTATACATGTGGCCTTTCGCGGACGCTGTACACGCTGGTACAGGCAGCATTATGTGCGCATACCAGCGCCTTAATAACAGTTATAGCTGCCACAATAGCAAAGCTCTGAACGGTCTTCTAAAGACCGAGTTAGGCTTTCCAGGTTTCGTGCTGAGCGACTGGGGTGCTCAACACACTGGCATTGCCAGCGCATTGGGCGGTCTCGACATGGTCATGCCTTTTGGATTCCGCTTCTGGGGCCCCAATCTCACTGAAGCAGTCCGGAATGGCTCGGTTCCAGAGTCCCAAATCAACAACATGGCAACGAGAATCATGGCAGCATGGTACTTTGTGGGCCAGGACAGTCCAGACACGCCTCCTTTAGCAGTTGGCATGGCACGCAGCCACTTGCGTCCTCACACTGTGGTCGATGCCCGAGATCCCGCGGACGACGCCGTCAACCTCCAGGGAGCTATTGAGGGCCATGTCCTTGTCAAGAACATCGACAACGCCCTACCTCTACGAAATCTCAGCATGATGTCAATCTTTGGCTACGATGCCAAGAACCCTAACTACAACAGTCCGGCAGAAGGATTCAGTGCTTGGTCCCTGGGTCTCCAATCCCAGAATTACCGCTCTATAACCGGAGGCGGCTCAGGAGCTATTACCCCTTGGTATATTGACGCACCGTTCGAGGCCCTGTCCCGACGCACACGTGCAGACAGAACCGCCCTGTTTTGGGATTTTGACACCAACGGAGCGAACAGCACGATTGACACCAACAGCGAGGCCTGTCTCGTGTTTATAAATTCAGCCGCTTCTGAAGGTGTTGATCGGCCATCCCTACGCGACGACTTCTCGGATGCATTGGTAGAGAACATTGCCTCCTCTTGCAACAACACAATTGTTGTGATCCATAACGCTGGCGTCCGTCTAGTTGACCGTTGGATCGACCATCCTAACGTCACAGCACTCATCTTCGCTCAACTGCCGGGTCAAAACTCAGGCGAGGCGATCACGCAGATTCTCTATGGCGACGTTTCCCCCAGCGGCAAGCTTACTTACTCTATACCACGGAACGAATCTGACTACGGGTCGCTACTGGCACCCGTCAATTACACTGGCTGGGACCGCTACTTCCCGCAGGACAACTTCACAGAAGGTGTCTACATCGACTATCGCGCTTTTGATGCAGCAGGCATTGAGCCCAGGTATGAGTTTGGCTTTGGCCTCACCTACACAACCTTCGAGTACTCTGATCTCAATATTCAAGTTACAAGCGATGGGAACCTC
TCGGAATACCCTGTTGGGCCAGTAATTCCCGGAGGGGAGGCGGACTTATGGGACAACCTAGCCACCGTGACAGCGGAGGTCACCAATACCGGCGATGTAGAGGCGGCCGAGGTGGCCCAGCTGTACCTTGGGATTCCAGTTGCCGGCCAGCCTGTTAGGCAGCTGCGGGGCTTTGACAAGGTGATGATCGCGCCGGGTGAGACGAGACACGTTCAGTTTGATCTGAGACGGCGCGACTTAAGCGTGTGGGATACTGGTGCGCAACAGTGGAGACTTACCCTCGGAACCGAATATCGTGTTTGGGTGGGAGCGAGCTCCAGGATTCTGCCACTGAATGGAACCATGGTCTTGTAA\n>XM_034834249.1 PREDICTED: Vitis riparia plasmodesmata-located protein 2 (LOC117917828), transcript variant X2, mRNA \nGAAACCCAAAAACAAAAATCACCCAAAAAAAGGTTGGAACCCCACAACGCTCCTGAGCTTTTCTCAACCAGAATCCATCACCCTTGCCTTGATTTCAACCAAAACCCATTTCTAGAGACCACCAAACCCTGCAAAAACCATTCATGCTCTGAACGATTTCATGTTTCCTAGATGGGTTTGCCGCCAAAACCCCTGTCTCTCCTCTCCCTCTCTCTGACTTTCCTCACAATTCTTGGCTTCTTCCCATCTGCCAAACCCTCCACAGATTTCACAAACTTGGTGTATAAAGGCTGTGCCGACCAAAAATTCCAAGACCCATCAGGGGTTTACTCCAAAACCCTCAAACCCCTGTTTGATTCTCTGGTTTCACAGTCCTCCACAAAGAATTTCTCCACAGCCACCTCTGGTGAGGGCCAATCTTCCATCACAGGGCTGTACCAATGTAGAGGTGATCTCTCCAATTCCCAATGCTACACCTGTGTGGGAAAACTCCCAGGCCTCTGCACCAAGCTCTGTGGCAAAGCTATAGCCGCCAGAGTTCAACTCAGTGGGTGCTACATGAGGTATGAGCTTGCTGGGTTCAAGCAGGTCACTGCAACTGAGCTTCTGTACAAGGTGTGTGGATCAACTCAGGCAAGTCAGAGTGGGTTTGAAGAGAAGAGAGACACTACTTTTGGGATGATGGAGAAGGGAGTTGAAGGTGGGGATGGATTCTACACTGGGACATATGAGTCTGTGTATGTGTTGGGGCAGTGTGAGGGGGACATGGGAGGTAGTGATTGTGGAGATTGTGTGAACACTGCAGTTGAGAGAGTCAAAACCGAGTGTGGTGACTCAATTTCCGGGCAGATTTATTTGCACAAATGCTACATCAGCTATAGTTACTATCCAACAGGGGTGCCCAGCCAATCTTCAGCAGAATCAGGTCAGAGTACAGAGAAGACAGTAGCACTTGTTGTGGGAGGGGTAGCAGCTCTAGGGTTTGGAATTGCTTGTTTGATGTTTGTTAGAACAGCTTTCAAGAAACATCATAGTAATTACTGAAAATTTTGAGATATGGGTCTAGAAGATGCCACTGTTTTCTGTAGTGGGTCTCCTCTTTTCTTTGATAAAGAGGGTGGGAAGAGGGTGGTAAAGTTAGGTGAAGTATTCATTGAATCATTGGGAGTGTTGTAAATGGGAAAGGAGAGAGGGTGGGAAGAGATGTTTTTTCTCTCCTTACTTCACACTTAGACTCTACTAGTATTTTGTCATTTTCCATTTTCCTTGTGCATTACATTCCCACACATGAAATTGATACATATGATTCAAAGTATTTTGCTTTCCAATGAAGTTTCCCACTTTATCACTTTATCA\n>LN615563.1 Uncultured Glomus partial 18S rRNA gene, isolate ACyCA VTX00247, clone GAMF284 
\nAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAATTTCGGGGTTAGTAGGTTGGTCATGCCTCTGGTATGTACTGGTCTCACTGATTCCTCCTTCCTGACGAGCCTTAATGCCATTAATTTGGTGTTTCGGGAAATTTGGACCGTTACTTTGAAAAAATTAGAGTGTTTAAAGCAGGCTCACGCTTGAATACATTAGCATGGAATAACGAAATAGGACGTTTGATTTTATTTTGTTGGTTTCTAGGATCGACGTAATGATTAATAGGGATAGTTGGGGGCATTAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATTGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGGGATCGGATGATGTTAATTTTTTAATGACTCATTCGGCACCTTA\n>XM_026558135.1 PREDICTED: Papaver somniferum 60S acidic ribosomal protein P0-like (LOC113309662), mRNA \nTGCTCATCACTTTCTCTCTCAACCAACTCTTTCTCTCTCCTCTCTGAAATAGTGAAAAAAAAATCTTTACAGTTTTTTCGTCATGGAAGAGTAATCTCTAGGCAAACCTTCGGGTGATTAACGGGTCAAGAGCTGCAAGGAGCGGATCTGAATGTTTTCGGATTGAAAAAGTGGTGATGAAATTTTAGGATTTTTTAATCTTGTTTTTCACTTTTCTTGCTTTGTTCTTAATCCTCTCTTCTTTCCGGGTTTGAGAAATACAAGCTATGGTTCCAATTGACACAGGTATTCCCTTGGATTGTTGTTCTTTTTGGGTTTTGTATTGATTCTTCTCACTTCGGGTAAGTGAAATACAAGTTGTGGTTCCAATCGAGGACCGTGGCTCCTTTTTATGATCTTGATTGAATCTTTTCTTCCTTTCTTTGGGTTTTTGGGGGTACTGTTGTATTAGGTACAACAACAACAGGGGATCTAAGATTTCTCTTTCAAATTTCTTTTGTGTTCTGATTAGATTTGCCACTGCATATAATTATCAAGCTGTTTTTCTCATTCCTCCCCTTTTAGGTTGTTCTCGGTATGGTAGTGATAAAAAAAAAACGAGGATATAGAGGGTTGAATCTACCTTTGGTCTGATTCTCTTAAGCTTGCAATTATTCTTTTTTTTTCTTTCATGTGTAACTGGATTGTAGACCAATTAAGTAGTTGTCGGTATCCCAATTGAGATTGGGTATGTGGATTCGAATTTTGCAATCTAATTTCCTTTGCCGTAAATACCAATGTTGATTGGGTCTGTTTATTTTTGTTGCCTCTAAGCTGTTTGGTGAAAGTCCTGAACTGTCTTTCTCCTGTATTTGGCCTCTCTTGCATCCTATCTTGAATGATTCATTCTAAAATTTTAGGTTTCTTACATCAGTTTGGTCAAATTTTCGTTTTGAAAACTACTTTCAATCTTTAACCTTTGCCTTAAAATTAGTATAAATTTATCAGTTAAATTTTCTTTGGTGTTGTTAAACACTTGGGTTGACAATTTTGTCCCAAAAGTGGTAGGTATCTTAAAATAAGTAATTCACAACTATTATTACCTGTTCAGGTGTATGTGCAGATGTTCGTGTTAATTTTTAAAAGTCATCTCCGTTAGGTGTGCTTTATGAACCAAGTGTATGTGCATTGGGTTTTAAAGGAATCGTGTTTAATTTCGAAATTTTCTGATCTTAAAAGTGCTTTCATAGTTCTTAGATGAATAATAGGGCCTAGCACTTCGGAAAAGGCGAAGTCACTTATTAAAAAACAATTTCTTCATTTTTATGCACTTTCACTTATAGTAGTGGTTTCTTTTTAAGATGATTAAGAGTTCTGTTATGTCTTTTATT
AGAAAATTTTAGAAAATGGTTTTGATCATTCGTTTGGGTTAATTTTAAAAATCCATGTTGGTCTAAACATATTCAAGAAATCTAAGGAGTTAATATTGGTAGGATCAAAGTCGTTGTTCTTACTAAGTAAATTGTTAAAAGTAAAATTGATAGGTTAATTTTTGGGAGGCTCGTTGATCTGTTTCTGGTTATAAGATGGTTTTAAGGGTATTCACATATAGTTTCTTGGAAGATTAAGGACTAGGATATGATTAATGAGAATTATCTAGCGATAAGGTGTTTCCATCTCTAGTCAATTTTGTTCTATGTATTGTTAAACTTTCGAGGCATGTCTTCGCCTTTGCTTGATTATTTTCCATTAAGAACCAGTGGTAGCCCCATTGTTTTAGTACCCTTATCTCTGCGTCTTTACAAATTAATTTGAGTAAAATCATCATCACTTTTTTGCGAGTCATAAAATCATATCTAAACCTCCGCTCCTCTGTCCCGATAAAACCCAAAGGTAAGCTGACGTCATCTCTTGATTTCTCTCCTTCTTTTATCTCCCGTCTTAACCTTCTTTTATTTCGTCGTATCTTCTTATATTCAAGATATTTTGTGTATGTTTCTGGTAATTCAATTTGAAGTTATTTCTACTGTTTCAACAAACAAGATTTTACAGCAGGAATACAGGTAGCAAAAGCTTGAGGGATTTTTCCACTCAAGCTTTTGACTTACATCTTTTTTTTTAAGATAGTCTTTTGTTTTATCTTGAGTTACGTTTTTACAGAATTCTTATAATCTATTGCATACATGATTAAATCTTAGTTGTTGCTTTAATTCCTAAAACATATTTAGCTTGTTTTTTAGCTTAGGATTATAAGCTGAGGTTTCAATACTTTTTCCTCAACATTCCCTGATGTTTTTAAAACCCCTGGTTATCTTAAAATCAAGCATATCATTAGTTTATATTATGTTTTCACTCATAATTTGTTGTTGTTATATTATATTATTTTGTTTTCTAATACAGAACTTGCTAATGAAAATATTGGCCTGGAACACACAAGGGTGTGGTAAAAAAAAACTAGGCAACAGCTAAACCACTTAGTAAATACTAAAAAAAACAGATGTTCTTTTTTTTATCTGAAACCCAATCTCAAAGGTGCTTAATGAAGCATGTGCTTAATTTTTCCCAAACACCCACATTGTTGACCCAGATGGAATCGCTGGGGGCTAGCAATTGCTTGGGTAGATGGTTTTCATTTTGAAGTGGTTCAATGGAACCTTAACATGATTAATATCATTGTTAAAAACAATTTTCATTCAAATGAATGGCTTCTAACTTGTTTTTATGGTTCTCCGAAGAATGAATTTAAACTAGAAATAATGGGTTACTTAGAGAATATTGCTAATCAAATTAATATGATTTCAGTGTCATGGTTAGTAATAGGAGACCTGAACATTATCTTCAACAGTGATGAAAAAGAAGGATGTCTTCCTTTCAATAGGAAAAAACTGGAACCAATCTTAAATTTAATCCAAAGAACTGGATTAGAGGATATAGGTTTCCGAGGTAATATTTTTACCTGGAATAACAAAAGAGAAGGGCATGCAAACATTAAGCAAAGGCTTGATAGGGGCTTAGCTAATGCAGAGTGGATTCTTGAATTCACAGATGCAACTGCAGAGTGGATTCTTGAATTCACAGATGCAACTCTTGAAAATTTGGTGGAAATAGGATCTGATCATAGTCATATCTGTCTTAATCTCATCTCTTGTAGTTTACATTTAGTTCCAACTTTTAAGTTCTATGACACCTGGCTAAAAGAACCTTCTTGTATAAAGGTTATAAGACAATCCTGGAAATGTTTTTCTGATTCTCCGGCTTTGAAATAATTTGGGAGAAAATTTGAAATTTTGGAAAAAAAAATATGTTTAGAAAGCCAAATAAAAAAATTAAGCATATAATCAAACGAATTGAGAATCTCTCGGCTAAAACATCTCAGGGGAGTATTAGTGAG
CTAATAAACTAAAAAACTTTGGAATTAGAGGCTTTGTACGACACTCAAGAAGAAATAGCTAAACAACAATCTAGGAACAACACAATTTCCTAAGGAGAAAGAAACACAAAAATTTCATGTCACAACTTTAAAAAGAAGAAATAGGAACAATATAGATTGCATTCAGGATAGAGATGATAAAGTCGTTACTTCTAGACATGAAATTGAAGATGTTCTCACATCTTACTTTTCTGATCTTTTTTCTGAAAACTCTGTTAATACAGAGGATGAAATTTTTAAACATATTATGTAACACCCCAATTTTCGGGCCCGGATCCTGCTCTGATACCAAACTGTAACACCCCGAATCCTTCCCGGATCCCATGCCTGAAAATCGGGGTGTTACATATTAAGCCTTGCATCTCTTTGGAAGAAAATATAGCTCTAACTGCTATCCTAACTTCAGAAGAAATTTGCGATGTAGTGAAAAAGCTTAAGTCTAATAAAGCACCTGGGCCCAATGGCTTCACAGTGAGCTTCTTCAAACAAAACTGGGAAACTGTAGGAACACAATTGATAACAGTAGTACAAGATTTTTTTCAAAACTAAACAACTACATGTGGATCTAAATAAGACTTTCTTGTTTTTAATTCCAAAAATTAAAAATCCCAAATCCCTTTCAGATTTTAGGTCAATTGGACTTTGTAACACTCTTTACAAAGTCATAGCTAAATTAATGGCTAACAGGTTCAAAATATCTTTAGGAAAAATCATTTCCCCCTTCAATCTGCCTTCCTCTCTTCTAGACAAATCTCAGACAATATTATTGTTGCTCATGAGATTGTCCATTCAATGAAGAAAAGTAAAAAGAAAACAGGAAACATAGGAGCAAAAATTGACATGTCTAATGCATTTGATAGAGTTAATTGAAACTTCTTGATAAAAACTCTAGAGGCCTTTGGTTTCTCTAGCCATTAGAGTGAATTGATTTATCAATGTATCTCTACTTCTTCCATATTTATTTTACTAAATGGGAACCCCTGTAAGGAGTTTAAACCAACTAGGGGAATAAGACAGGGGGATCCTTTATCTCCATATTTATTCATCCTATGTATGGAGGTTCTTTCTAGACTCCTCTGTCATTTGGAATCTGTGAAACAGGTAATAGGTATCAAACTCATCCCAAAATCAACACTTATTTTTCATTTATTCTTTGCAGATGACCTTTTGCTTTTCACTAGAGCTGATTTAGGCAGCTGTAAAAATCTTCTGGAAGCTATTAATCTTTTTAGTAAAGCCTCTAGGCAAGTAATAAATTTTTCAAAATCTGGTCTGTTTTTTTAGTAAAAAAGTTCATAATAAACACCAAGGTATTATTTCTAGGTTAATGAAAATCAAAAAAATAAATATCAAAGACACCCATTTAGGAGTACCTTTATTCATAGATAGATCAAAACTTAAGTTCTTTGATAGCATTATAGAAAAAATGGAACAGAGAGTTAAGAACTGGCTAGCAAAAATCTTATCCCAACCAAGTTAGATTGTTCTAAATAAATCTGTTCTTTCTTGTATGCTAATTTTTAGCATGGGATGTTTTGTTTTGCCTAAAAAAAATACCAAAAGAATGAATGATATTCAGACAGATTTCTGGTGGGGAAAACATACTAATTCCAAAGGTATTTACATAAAATCTTTTGATTTCTTATGTAAACCAATTGACCAAGGGGGTTTAGGTTTTAAAGAGGATAACAAAGTGAATCAGGCTATGATTAGCAGGATATCCTGGAGATTGGTGAGTAATCCTGATAATTTATGGGATCAAATTTTAAAAAGAAAATACTTTAAAAAACAGGAGCTCTTCAATCCAAAAAGAAATCAACAACTTGTTAGATTTGGAAATGCATTTTACAAGGTATTGAGCATATCAAAAAGTATAGTGTTTGGGATGTAGGAAATGGATTCCCTATATATTTGATGATAAATGGTTACCAAACATGGAACAAACTCTAGCTAGTTTTGTC
CCTAGAAACTCTAATATAACACTTGTGTCTGATTTGATAAATCATGACACAAAAAAGTGGAATGATTCTTTGTTACTTTCAACTTTTGATAGATCTTTGGTCAGTGAAATAATGAACATAAGATTATACACACAAAGTGATGAAAAACTGAAAAAAGATAAATTGAGATGGTTACTTGCTAGAAACGGTGAATTTTCTGTTAAATCTTTATATGCAAAGTTACTGAATCCATCTAACACCATCCCTGACTAAACAAAGAAGTTTTGGAAAGGATTGTGGAGCATTAATACTTCGCAGAGAATCAAAATGTTTATTTGGAAATGACTGCAAGATGCATTACCTACTAAACAAAAGTTAAAATCAGTGGACAACAAATGCATTTTCTGTAAGACTGAGGTGGAATATACTTTTCATCTGTTCTTTGACTGTGACTATGCTAAAGCTGTGTGGAATCTACAACCAATGGAAGTTCAGAGAGTACCTCACAACTTAGTTTCTCTTAATACTTCTTTCTTGCATAAATATAATGGATGGTTAGCAGGAGATTCGAATTCCATCTCAATGGCACTAGCTGCAACAAAGTGTTGGTTTATTTGGAAAGAAAGGTGTCTGAGGATATTTGAAGATAAATCTATAACACCAATTCAGTTATCACTAGATATATCAAGACACTGTGAGTACTGGCATCCAATGACTTTGAACAGTTTGAATTAAACACAAGACAGAACTATCAAACCAAAACCACAATGGACCTTCCCAATCACAAATACTTTCAAACTAAATTGTGATGCTTCTTGGTTGTCTGAAAAAAAATATAGGCTTTGGTTTTGTTCTTCATAATTGGACAGGAACCTTCAAGGGGGCAGAATCAGGCATCTTCAGGTCTTCCACTGCGGAAGAAGCAGAAGCTATAGTTCTCCTTCAAGCAGCTAAATGGGCTAAAATACATAACATACAACATCTGGTCGTAGAAGGAGATAACAGGGCAACAATTAAGTATTTACAGGGAAAGGAATCAACTATCCAATGGCAAAGCATTGTAATACTAGATGAAGTTAAGAAGCTAGTAGAACAAATGGTATCTTTTTTGGGTTTCCGGTACGTAGACAGGTGAGCAAACAAAGTGGCAGACCAGTTGGCAAAGAAAGGAAGAAAAGGTAACATTGCAATTTCTTGGTTAGACCAAGCTCCCTTTATTTTGATTCCAACAATTTCTTTTGACATGGTCAAAGCTTATGAATCTTGTAATATAAGTACAAACCTTGTATCAATTCAAAAGAAGGTTAATCTTACATATTCAGTCATCAACAAGACAACTCTATCTGAGTTCGCTCCTTATGAGACTGAATCAAATGCTTAGCCTTCTTTGTTTCCAGTAATATATTTCTATTTTCAAAAGAAAGGAAGTCGTTGCTCCTCAGTCTCCCTTCGGGCAGGAGCGGAAGCACAACCATGCTTCCCCTGGCTGGAGCCACCCACAAAGGCCCAAAACACATTTCTTTGTGTCTAATTCATGTTGGACCACAAAAACAGTAGGAACAGTATGGTCAAGCTCAGGGTGAAAATATGGTCAAGCCTGGCTGCCTGGGGTAAGGAAGGTTTCTGGTTCTGCCACTGCCTCCAGCTCTAGTTTAGGTTCATCGGCACATCAAGTTAGATTCATCGGCACATTAAGAAAGGTAACTTAGCTGGTGCCGCGTTGGAATTGGTGCGCCTTTTGTTTTTTGACGCCGCAAAGGAAAGTATTTAGGAATTCTGTTTCTAGAAAGAGGGTATATATGGAAATCGCACAATGAGATATTCAATGCATCTCGCATTATAAATAGAACAATAGAGTAAACCCCGTTACTTGCATAACACACGTAAAGATTATTTTAGGGTTTCATTAGGGTTTCAAAGCAGCAGCTCAAAACATGGCACCCAAACCTTCCAAGGCTGAGAAGAAGATCGCTTATGATAAGAAACTCTGCAAGTTTCTTGATGAATATGGTCAGATCTTA
GTTGTTGCTGCAGACAATGTTGGATCGAACCAGTTACAAAACATCAGGAAAGGTTTGCGTGGCGATTCAGTTGTTTTGATGGGAAAAAACACTATGATGAAGAGAACTGTTCGTCTTCATGCTGAGAAAACTGGAAACAATGATTTCCTTAACCTCATTCCTCTTCTTGTGGGAAACGTTGGGTTGATCTTTACTAAAGGAGATTTGAAGGAAGTTAGTGAAGAAGTCAGCAAATATAAGGTTGGAGCCCCTGCTCGTGTTGGACTTGTTGCTCCTATCGATGTTATTGTACCACCAGGCAACACAGGATTGGATCCATCACAAACATCCTTTTTCCAGGTTCTCAACATTCCAACCAAGATTAACAAGGGAACCGTCGAAATTACAATCCCAGTTGAGCTTATCAAGAAAGGTGACAAAGTGGGTTCTTCCGAAGCTGCCTTGCTATCAAAGCTAGGCATAAGGCCGTTTTCTTATGGTCTCGCTGTACTCTCGGTGTATGACAATGGTTCAGTCTTTAACCCAGAGGTGCTTGACCTTACTGATGACGATCTAGTTGAGAAGTTTTATGCCGGTGTATCGATGGTTACTTCACTCTCATTGGCTCTCTCGTACCCTACCCTTGCTGCTGTACCTCACATGTTTGTCAATGGATACAAGAATGTTCTTTCTGTCGCTGTTGCCAGTGAATACTCCTTCTCTTATGCTGATAAAGTGAAAGAATACTTGAAGGATCCAAGCAAGTTTGCAGTTGCAGCTGCTCCAGTTGCTGCGGCTGCTGCTTCTGGTGGTGCACCAGCTGCTGCTTCAAAGGCAGAAGAGAAGAAGCCAGAGCCTGAAGAAGAGTCTGATGAGGATATTGGGGGGCTGTTTGGTGACGACGATTGAGAAACTGTTCCCTGATGATTTTTCCTGCTTGCATTTGCATCTTATTATCTTTAAACTCATCTTTAGTGTTTATACAGTTTGTTAGAACTATCACCCATAATCAGTGTTTTGTTGATATATTGCCATTTTATTGGGTGCGGTTGTTTTTCACTCGTATGGTAGGAGAAATAAAATCATTTTGGAACTCAGAAATCTGTGTGTGTGTTTTGTTCTACCTTTTCTTGTGTTCAATGTGAGTATTATTCGAAGGGAGTACAAGTTTTTACA\n>XM_034856521.1 PREDICTED: Etheostoma cragini testis associated actin remodelling kinase 1 (tesk1), transcript variant X2, mRNA 
\nTAATAGGCCGCAGCGTCACTGAGGCAGCTCTGTGCGCACTGGAAACCCGGAATTCAATTGGTGGAACCAGGAGGGAAGCCCCGGCCTTTTCTACTGCAGAAGGAGCAGTTTGAAAGAAACCGTGAGAGAGACGCCGCTGCCAAGACAGCAGCAGGAGCAGTCTGCGCAGTTTAGAAAACGGCACAGCCTAATCTGCTGCACGGCATGATGGACTTTACCAAAACTGCGTACTGACTCTGCAAGATGCAACGCTGCAGCTTCGTAGTTCGTTAGACACAGATAGAAACAAGCCCGTTCCGGACGTGTGCAGGAATTTGACAGAGGAATTAGGCCTAACCGGTCGCTGACCACAGCTGCGACATTTGGTTTTCCCACTGAGAGTTTATCACTCCTCCCCTCCGTAGAGCCCTGCTCTGTGGCCTTGTAGCGGACATGGGAAATGTAAACAGTGGTCGGGCTGGATTTTAAACTACGCACACGTCATACGTCCTCCTCTCGCCTCCACCTCCTTCTCCTCCCGGGGCGCCTGAGATGGAGATGGAGACGGAGAGGGTCGAGCAGGGAGAGGCAGAGCTGCCCATGCACAGCGTCCACGGAACCAACCGGATCAGACCGTCCTCTTACCGGGCACTGCGCAGCGCCGTGTCCAGCCTGGCCCGTCTAGATGACTTCAACTGCGAGAAGATCGGCGCTGGGTTCTTCTCTGAGGTGTTCAAGGTGCAGCATCGAGTGTCGGGCCAGGTAATGGCTCTGAAGATGAACATCCTGGCCAGCAACAGAGCCAACATGCTCAGGGAGGTCCAGCTCATGAACCGACTGGCGCACCCCAACATACTCAGGTTCATAGGAGTGTGTGTCCACGAGGGACAGCTCCACGCCCTCACAGAGTACATTAACGGTGGCAACTTGGAGCAGCTGTTGGGGAGTGACGTGTACCTGTCGTGGAGTGTGCGGATGATCCTGGCCCTGGACATCGCCCGGGGACTGCAGTACCTGCACAGCAAGGGCATCTTCCACAGGGACCTCACCTCCAAGAACTGCCTGGTGCGCTGGGAGGGCTGTGTGTGCTCAGCCGTGGTTGGAGACTTTGGCCTGGCGGAGAAAATACCAGATTACAGTGAGGAGGAACAGGAGCCTCTGGCGGTCGTCGGCTCTCCCTACTGGATGGCCCCGGAGGTGCTCAGAGGAGAGGTGTATAATGAGAAGGTGGATGTGTTTGCATACGGGATTATCTTGTGTGAGATCATTGCGAGGATACAGGCCGACCCCGACATCCTACCACGCACTGAGGACTTTGGTTTGGATGTGGACACCTTTCAACAGATGGTGGGAGATTGTCCTCCTGACTTCCTGGAACTGGCCATTGCCTGCTGTAATATGAATTCAAAGCTCCGTCCATCCTTCTCCCAAATTGTGGTAGAGCTGGAGAGGAGACAGGCTGAAAGGAAACAGAAGGATGAACCATCAGTCAAAGCCGTTTCTCCAGTCATTGGTCCTCTACGAAGACGATCCCTCTGCCTCCTGTCAGATCCTCGACTCTCCCGTAGCAAATCCGACATGCTCCACCCCCCAAACATGTCCCCCTCTGTTACTACGGCAATTCCTGCTCGGGTCAACCCCTTCTCTCAGAGGGAGGACCTTAAGGGAGGCAAGATCAAGCTGTTCGACACTCCCAGCAAGTCTGTCATCTCCCTTACCTTCACCCTGCCTCCTCCACCTGACTGCGATGACCCCTCTGTCTCCGAGTCTGACAGCAGTGAGGTACCAAGGAGACACAGGCGCTGCCACTCGCTGCCTTGTACGCCTCCTCCGCACCTCACATCAGCGCCGAACACAATCCTTACAGAGCAGGAGTCCATGTCCAAGATGGACACTGTAAATGGAGAGACAAACCGAGTGAGTGAAGAGGAGAGATTGTTAGAAGAGATGGCAACTATGGAAGGGAATGGAACTGATTCAGGCCTTCCTCTTTCCATTGAGCCCCTGTCGCTGGACCAA
GAGAGGGAGGAGGAGGAGGACAACGAGGAAGAGGAGCCCATGGACTGTACCAGCTCCCCAGACACACAAGACAGCACATCATCTCCTTATTCCAAACTCTCCTTTCCTCCGTCCGACTCCTCAACTCCCATCCAACCCTCCACTCCTCCCTTCTCAAATGGCTGGGGGTCAGCAATCTCCAACGGGCCTCCTTGCCTACCTCCCCTCTCTCATTTGGACAACAACAACGTGGTCATCGGTCGACCCTTGGGATGGAGCGCCGCCACCACCACCACCAGTGCTCCCACAGCAAGAACCACCAACAACAACGGCTACCACTTCCCTTCCAGCGACCCCGCTGGATCGTCCCCATTTGGCTCTGGCAGCGGACATTCTCTGGACCAGGAAGAAGTCATCTCCTGTCCCGGCTGCTGCATTGCCGGCCTTCGCTTTCCTTCGATGTGTCCCCGAGCTCCACCGCGCAGAAACCCCTACAAGAACTTGAACGGGGACCATGCAGCTTCACGTGGGCTGCTTGGTCCGGGACCCAAGGGTCTGCCGCCCTCCCCTACCACCACCACCAACCTGGAGCCAGGACTTGCCTTGCCGGAGGCACAGACATGAACCCCAGCAAACTGAAAAGATTTGTGTAAACTCTGCACCAAAAGCTCATCCCTGGAAATTAAGTGGGTCTTGGAAGAATTTGCACAGATTTTAACTCAGCAATACCCTGATTTTTTTTTTTTTTTTTTTTTCAGACAATCTTTTTGGTGCAAATCAGTTTACTAAAACACACTCCAGGTTGACTTTTTCCGTGAAAGCTGTAGGACAAGGTGCTGGTGACTTGTTGCACGTCGCCCTCTGCTGGGCTGAGGGCGACATGCTACGTCAAGAACTGTTAAGCATGGAAACACTCCAGTTTGGGGTCCATTTGGTTTGATCCTCTAAATGTGCATATGTAAAGATTCTTATGACTGATAATATTGATGATGATGCTCAAATGAGGAATGTTAAGCTTAGTTAAGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTTCTGTTTTTTGTTGCTGTGTGATCTCTAATGGCCCTTCTGGTCGCCTGGTTAAGCACTTCAACTGTATTACTGAAACTATTGATGTTATTATTTTTGGGAATGAATGGTCAAAGACCTGTATAAGAGATGTACAGATTCATATTATTTAAAGGATGCATTGAATAAAAAAGATAGAAT\n>XR_001760135.2 PREDICTED: Cynoglossus semilaevis uncharacterized LOC107988670 (LOC107988670), transcript variant X2, ncRNA 
\nAAAACTCCCCCGCTCTTTGGGGGCATGTCCAAAAGGTGCAGCCCACTTCTCCTGTGTGACTGGGGGGTGTTTCAAGAATCTGTTAAATGCAGAGAATGTTTGGAATTTCTCTTACAGAAAAGTAGAGAATTGAAAAATACATTTAAATAGAGACCTGGACTTCTGGCAGGACAGTCAGGCAGATGAACTCCAACATGATTTTGTCATTTGTACAGAATTATGCTGTAAATGATCCGGGTAAAAATCCTAGATCTGGAGTTCTAGAATGAATGTTTTTAAGCCATCGATTGTACATTGTTAACATGATGCAGCCCTACCTCGACACAGATGATTGATCACTCAGTTGATCAACTGTTTTTTGGGCAAAACGGACTGTTATCAACGTCACATTTGTGTGCACTAACGACTGTATTTGTTTTTTGCAGCACTGATGTACGGCTTCCTCGTTGGGTAACGCACACTCTCAGGGAGGCGTTCTCCAGGTAGGCAGACTGCGTTTAAGCAACAATGATTTTCTAAAGTATTCCACACCCTGTGCCTATGAGCTTGAAGGTTATACTCATTCAGCAGCAATGTTTTTCCCTTTTACTACAACAACATAGATTTCCCCAGACTCCCTGGATCGTTTCACAACAATATTAACTCTTGTTGGTGACAGACCTGATTTTTCTCCAACCTTTTTCTAACAAACACTTTTTTTATCTCTAAATAAATTTCTGAAGTCGAACATAAAGTTCCAAAACATTTTTACTTAAGGCCGAGTCTTGAGCAACTAGTCAAACTAATAAGGTGATTACTGAATGTTATTATTATGACATTTTTAATCCCTTAAAACAACTTTTGGGAGTTTGTTGCAGTCTTTTGGTTCTTCATTTGTTTATGTTAAATAGACAGAATTATGATGGTCAGTGGTCAGTTTTTTTGATTTGAGGGTTTCGTGCACTTTAAGAAGTGTACCAACTTTCTGGAAATAGGATTTGTATTGTATTCAACAGTCACACAAACAACCAAATGACTGTCCTCTTCATTTGCACTGTTGGCTGTTGTAGGTTTGGGCTCATGCCACATGAAGAGCTGTTACATCCATGAGCGGTAGAAAAGGGCGAAGTTTCCTCCCAGATCCAATCCAACAAGTGGCCAGGCCTAAATGTCAACCCGGGGGTCCTCAACCTGCGGCTCCACTACCACATAAGATAGAGATCGGCTCCTCTCGTACCTTGCTCTCTGGGACGCCAGCTCCGACAACCAGCACCAGACCACAGCCACTATTACAATCATTCCTATGAAGGGGATGGAGAGAACAGGGTGCTCAGATGGATGGATGAATCTCTGAGGAGGGAAAAAGAACAAACACACGGGACGTGGAGATGAAGGGAACAGATGAACTGATGGATTAAAACTGGAGACTTCACGGACAGTCGGAGAACACGGACATGAGCAGAGGCACGGGCAGACAGTTTGACAAAACGCTGAGAGACATTCACAACAGGGCTGTTGTAGACGAAACACATTCCAGGGCATCACTGTCACACAGAGGCTTGGACACAGACACAGTCAGGCAAGGATTCACCACTTCAGGCCACACAATAATTTCTGATATGTGCTGACAGGTCCTGTCAGTTCATATCAAACACACACACATATATATATATACTGTATATATATTCTCCTCACAATGAGAGACATATAAAGAGGTGCTCGACACACAGGAGATACAGCAGGTGTGATGTCGGGTGTTGTTATGTGTTAGTTGAGGACATGAGCAGAAACAAAGCTGGAAATAGCCAAAAGTTTAGCAAATTTCTTTTTCAGTCCTAATGATTGTAGCTACTTAAAACCTCAGTGGTGTATCTTTTAGATAACTTTTTTTTTTT\n>FJ579386.1 Uncultured Methanobacteriaceae archaeon clone KR-H08-A02 16S ribosomal RNA gene, partial sequence 
\nGCTCAGTAACACGTGGATAACCTACCCTTAGGACCGGGATAACCCTGGGAAACTGGGGCTAATACTGGATAGATGATTTTTCCTGGAATGGTTTTTTGTTTAAATGTTTTTTCGCCTAAGGATGGGTCTGCGGCAGATTAGGTAGTTGGTTAGGTAATGGCTTACCAAGCCTATGATCTGTACGGGTTGTGAGAGCAAGAGCCCGGAGATGGAACCTGAGACAAGGTTCCAGGCCCTACGGGGCGCAGCAGGCGCGAAACCTCCGCAATGTGAGAAATCGCGACGGGGGGATCCCAAGTGCCATTCTTAACGGGATGGCTTTTCTTAAGTGTAAAAAGCTTTTGGAATAAGAGCTGGGCAAGACCGGTGCCAGCCGCCGCGGTAACACCGGCAGCTCTAGTGGTAGCTGTTTTTATTGGGCCTAAAGCGTTCGTAGCCGGTTTGATAAGTCACTGGTGAAATCCTGTAGCTTAACTGTGGGAATTGCTGGTGATACTGTTGAACTTGAGGTCGGGAGAGGTTAGCGGTACTCCCAGGGTAGAGGTGAAATTCTGTAATCCTGGGAGGACCACCTGTGGCGAAGGCGGCTAACTGGAACGAACCTGACGGTGAGGGACGAAAGCTAGGGGCGCGAACCGGATTAGATACTCGGGTAGTCCTAGCCGTAAACGATGCGGACTTGGTGTTGGGATGGCTTTGAGCCGCTCCGGTGCCGAAGGGAAGCTGTTAAGTCCGCCGCCTGGGAAGTACGGTCGCAAGACTGAAACTTAAAGGAATTGGCGGGGGAGCAC\n>XM_007564720.2 PREDICTED: Poecilia formosa hexokinase-2-like (LOC103146708), transcript variant X3, mRNA \nAGAAGATGATAAGCGGGCTGTACATGGGGGAGCTGGTGCGTCTCATCTTGGTGAAGATGGCCAGAAAGCAGCTGCTGTTCCAGGGACAGACCACGCCACAGCTTCTTACCTCTGGATGCTTCAGCACCAACTACATCTACGCCATTGAGAGCGACAAAGATGAAGAAGGCCTGGCTAGCGCCGAGAAGGCGCTCCGCAGCCTGGGCCTGGACCCGTCTGCTGAAGACTGCGCCGCCACTAGGAGGATTTGCCAGATCGTTTCAACCCGGGCTGCACATCTGTGCGCCTCTACCCTGGCGGCGGTGATGCGACAGATCCGGGACAACAAAGCGGCCGAAAAGCTGCGCATCACCATCGGAGTGGACGGCTCAGTCTACAAGGGTCATCCAGAATTTTCCAGGAAGCTCAACAAAATGGTGCGGCGCCTCGTGCCAGACTGCGACGTGCGCTTCCTGCAGTCGCAGCACGGCAGCGGGAAAGGCGCGGCCATGGTGACGGCGGTGGCCTACCGACTCGCCACCCAGCACGCCGAGCGGCAGCGCGTCCTCGACACCCTGCGGCTGAGCCGCGAGCAGCTGCTGGAGGTGAAGCGGAGGCTGACGGAGGAGATGGCACGGGGTCTGTCCAAGCAGACGCACGACCAGACCAGCGTCAAGATGCTGCCGACGTACGTCAGGTCCACCCCGGACGGAACAGAACAAGGAGATTTCTTGGCTTTGGATCTTGGTGGGTCCAGTTTCCGTGTTCTTCTCGTTCGGCTGAAAAATGAGAAGAAGCAGAAAGTGGATATGCACCAGAAGATCTACAGTATCGATCAGGACACGCTGCAGGGCACGGGGGAGGAGCTCTTCAACTACATTGTGTACTGCATTGCTGACTTCCTGGACTACAGGGGGATGAGTGGAGCGTCCTTACCTCTGGGGTTCACGTTCTCTTTCCCATGTGATCAAACCAAACTGGAAGAGGGAATCCTTCTGAAGTGGACGAAGGGCTTCAAAGCCAGCGGCTGTGAGGGGAAAGACGTCGTGAAGCTGCTGAAGGAGGCGGTCCAGCGCAAGCAGGACTTCGACACTGACATCATGGCAGTGATCAGCGAC
ACGGTGGGGACCATGATGACCTGCGGCTTTGACGACCGTCACTGTGAAATTGGCCTTATAGTGGGAACGGGCACTAATGCGTGTTACATGGAGCAGATGAGGAACCTCCAGCTGATGGACGGCGATGAGGGGCAGATGTGTGTGAACACAGAGTGGGGAGCGTTTGGAGACGACGGCGCCCTGGAAGACCTGCGCACCGACATCGACCGGGAAATCGACGCTGGCTCGCTGAACCCTGGCAAGCAGCTGTTTGAGAAGATGATAAGCGGGCTGTACATGGGGGAGCTGGTGCGTCTCATCTTGGTGAAGATGGCCAGAAAGCAGCTGCTGTTCCAGGGACAGACCACGCCACAGCTTCTTACCTCTGGATGCTTCAGCACCAACTACATCTACGCCATTGAGAGCGACAAAGATGAAGAAGGCCTGGCTAGCGCCGAGAAGGCGCTCCGCAGCCTGGGCCTGGACCCGTCTGCTGAAGACTGCGCCGCCACTAGGAGGATTTGCCAGATCGTTTCAACCCGGGCTGCACACCTGTGCGCCTCTACCCTGGCGGCGGTGATGCGACAGATCCGGGACAACAAAGCGGCCGAAAAGCTGCGCATCACCATCGGAGTGGACGGCTCAGTCTACAAGGGTCATCCAGAATTTTCCAGGAAGCTCAACAAAATGGTGCGGCGCCTCGTGCCAGACTGCGACGTGCGCTTCCTGCAGTCGCAGCACGGCAGCGGGAAAGGCGCGGCCATGGTGACGGCGGTGGCCTACCGACTCGCCACCCAGCACGCCGAGCGGCAGCGCGTCCTCGACACCCTGCGGCTGAGCCGCGAGCAGCTGCTGGAGGTGAAGCGGAGGCTGACGGAGGAGATGGCACGGGGTCTGTCCAAGCAGACGCACGACCAGACCAGCGTCAAGATGCTGCCGACGTACGTCAGGTCCACCCCGGACGGAACAGAACAAGGAGATTTCTTGGCTTTGGATCTTGGCGGGTCCAGTTTCCGTGTTCTTCTCGTTCGGCTGAAAAATGAGAAGAAGCAGAAAGTGGATATGCACCAGAAGATCTACAGTATCGATCAGGACACGCTGCAGGGCACGGGGGAGGAGCTCTTCAACCACATTGTGTACTGCATTGCTGACTTCCTGGACTACAGGGGGATGAGTGGAGCGTCCTTACCTCTGGGGTTCACGTTCTCTTTCCCATGTGATCAAACCAAGCTGAATGAGGGAATCCTTCTGAAGTGGACGAAGGGCTTCAAAGCCAGCGGCTGTGAGGGGAAAGACGTCGTGAAGCTGCTGAAGGAGGCGGTCCAGCGCAAGCAGAAATTCGACCTAAGCTTTGTGGCGGTGGTGAACGACACAGTGGGCACCATGATGACCTGTGCCTATCAGGACCCCAAATGTGAGCTGGGCCTTATTGTAGGCACAGGGACCAACGCCTGCTACATGGAGGAAATGCACAACATCGAAACGGTGGAGGGAAATGAAGGCCGCATGTGTGTCAACGTGGAGTGGGGAGCATTCGGCGAAAACGGTGAACTGGACGACTTTTGCACAGAGTTTGATTATGCTGTCGACGAAGCCTCCAACTACCCTGGGAAGCAGAGATATGAGAAGATGATCAGTGGGATGTACCTGGGAGAGATAGTGAGGCATGTGCTGATGGATTTCACCACCAAGGGTCTGCTGTTCAGGGGCAAACTGTCGGAGCGCCTGAAGACCAGGGGCATCTTTGAGACCAAGTTCCTGTCACAGATTGAAAGCGACCGGCTGGCCATGCGTCAGGTCCGCTCCATCCTGCAGCACCTGGGCCTCACCGGCTCCACGTGTGACGACAGCGTCCTGGTGAAGGAGGTGTGCAGCGTCGTGGGTCGCCGCGCGGCGCAGCTCTGTGGCGCCGGTTTGGCCGCTCTCGTTGACAAGATCCGGCAGAACCGCAACCTGAACCAAATGTCCATCACTGTGGGAGTGGACGGTACCCTTTATAAGACCCATCCTCATTTCTCGAG
GATCATGCAGGAGACCCTGCAGGACCTGGCCCCGCAGTGCGAGGTGACGTTCCTCAAGTCGGAGGACGGCAGCGGGAAAGGAGCGGCGCTCATCACGGCCGTGGCCTGCAGGTTGAAGAGCGAGCAGTCGCTGTGAAACCTGCGAAAACTTCTCCCTGTGGGTCAACACGCGCACTGTGTTCAGTCGGTTGTCATTCTTTTTTCGACGTGAGCGCGTTCACACGAGAGTGTCCGCTTAACGGCGCGAGGCGAAGCTGTGACGGAGGTTCGGTCGGGCGCGAACTGAGCTCAGAAATCACAGTTCTGCTGGTAATGAACCTGCACCTTCAGTGAGACCCGACTGTTACGAGCTCGTTGCTTTTCGTTTTTACACTCTGTCGTTGTCTTTTACTTTTATATTAGTTCTGTTTTTAAGTCAAGTCTGTGAAAAATAAAACTTTTTAGCACATTTACTGTCTGGCAAGTTTAGAAAAGCACATTCCTGAACCAAAGAGAAGCAAACCAGTACATTCAGCAGGTAAATGAAGCAATAGTTTCTTTCCTTTTTTTACATTTTATTTAAGTTTTAAAGCAATTTTACTTTGTTACAGGAAACTTCAGAAAAAATGCAATATTGTGATGAAATGTTTTTAAAATGTAAACACTAGTCCATGCATCAGAAACATAAAGATGTTTTAGAAATTGCAGAGGCTCCGTATAACTGGAGGTATAAATAATTCAAACTGTGTAGTTCTGATTGCAGCAAGCTTATTATGATGTGCTGTGAAAAATATCAACTCCAAATAAAGTGAGAAATCACCAGGGTCTATTTTTTTTATTATTATTTATCAATAAAACCAAGATTACTCCAACTTGGACTCATTTTATTACTGGGGTGTTGAGAATAAAGAGGACAATCTGCACCTCCATAATTGGACCAATCAGTTTAATTTGTAGTTTTTCTCACAAAGCATATTTTCATTGGCTTTTTTTTTTTTTTTTTACAAAATCATTACCTTACAATGGAAAACTACCCTGAATACACATAATCAGACAGCTCTGAAAATACTGTAACATGTGATCTTCATTTTCACTGTTTTTCATCCAACCAAACCCAATAAATCTTACTTGGCTATGTTGTT\n>EU380792.1 Rickettsia sp. 
GDM18 16S ribosomal RNA gene, partial sequence \nGCTTAACACATGCAAGTCGAACGGACTAATTGGGGCTTGCTCCAATTAGTTAGTGGCAGACGGGTGAGTAACACGTGGGAATCTACCCATCAGTACGGAATAACTTTTAGAAATAAAAGCTAATACCGTATATTCTCTGCGGAGGAAAGATTTATTGCTGATGGATGAGCCCGCGTCAGATTAGGTAGTTGGTGAGGTAATGGCTCACCAAGCCGACGATCTGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCAATACCGAGTGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTTAGCAAGGAAGATAATGACGTTACTTGCAGAAAAAGCCCCGGCTAACTCCGTGCCAGCAGCCGCGGTAAGACGGAGGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGAGTGCGTAGGCGGTTTAGTAAGTTGGAAGTGAAAGCCCGGGGCTTAACCTCGGAATTGCTTTCAAAACTACTAATCTAGAGTGTAGTAGGGGATGATGGAATTCCTAGTGTAGAGGTGAAATTCTTAGATATTAGGAGGAACACCGGTGGCGAAGGCGATCATCTGGGCTACAACTGACGCTGATGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAGATATCGGAAGATTCTCTTTCGGTTTCGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGGGGCTCGCACAAGCGGTGGAGCATGCGGTTTAATTCGATGTTACGCGAAAAACCTTACCAACCCTTGACATG\n>XM_045299987.1 PREDICTED: Echinops telfairi calcium voltage-gated channel subunit alpha1 G (CACNA1G), transcript variant X9, mRNA 
\nTCGAGCGCATCAGCATGCTGGTCATCCTGCTCAACTGTGTGACCCTGGGCATGTTCCGGCCGTGTGAGGACATCGCCTGTGACTCGCAGCGCTGCCAGATCCTGCAGGCCTTTGATGACTTCATCTTCGCCTTCTTCGCTGTGGAGATGGTGGTGAAGATGGTGGCCTTGGGCATCTTTGGGAAAAAGTGTTACCTGGGGGACACTTGGAACCGGCTTGACTTTTTCATTGTCATCGCAGGGATGCTGGAGTACTCACTGGACCTGCAGAACGTCAGCTTCTCCGCTGTCAGGACCGTCCGTGTGCTGCGGCCACTCAGGGCCATTAACCGGGTGCCTAGCATGCGCATTCTGGTCACGCTGCTGCTGGACACGCTGCCCATGCTGGGCAACGTCCTGCTGCTCTGCTTCTTCGTCTTCTTCATCTTCGGCATCGTGGGTGTCCAGCTCTGGGCCGGCCTGCTACGCAACCGGTGCTTCCTGCCCGAGAATTTCAGCCTCCCCCTGAGCGTGGACCTGGAGCGCTATTACCAGACTGAGAATGAAGATGAGAGCCCCTTCATCTGCTCCCAGCCTCGCGAGAACGGCATGCGGTCCTGCCGGAGCGTGCCCACGCTGCGTGGGGAGGGGGGCGGCGGCCCACCATGCGGCCTGGACTACGAGGCCTACAACAGCTCCAGCAATACCACTTGTGTCAACTGGAACCAGTATTACACCAACTGCTCCGCCGGGGAGCACAACCCCTTCAAGGGGGCCATCAACTTCGACAACATCGGCTACGCCTGGATCGCCATCTTCCAGGTCATCACGCTGGAGGGCTGGGTGGACATCATGTACTTTGTGATGGATGCTCACTCCTTCTACAACTTCATCTACTTCATCCTCCTCATCATCGTGGGCTCCTTCTTCATGATCAACCTGTGCCTGGTGGTGATCGCCACGCAGTTCTCAGAGACCAAGCAGCGGGAGAGCCAGCTGATGCGTGAGCAGCGGGTGCGCTTCCTGTCCAATGCCAGCACCCTGGCCAGCTTCTCGGAGCCCGGCAGCTGCTACGAGGAGCTGCTCAAGTACCTGGTGTACATCCTGCGCAAAGGTGCCCGCAGGCTGGCCCAGGTCTCCCGGGCGGCAGGCGTGCGGGCCGGGCTTCTGAGCAGCCCAGTGGCCCACGGGGGTCAGGAAACGCAGGCCAGTGGCAGCTGTTCTCGCTCCCACCGCCGTCCATCAGTCCACCACCTAGTGCACCACCACCACCACCATCACCATCACTACCACCTGGGCAACGGGACGCTGAGGGGCCCCCGGTCCAACCCGGAGATCCAGGACAGGGAAGCCAGCGGGTCCCACCGCCTCATGCTGCCACCGCCCTCCACACCCACCCTGTCTGCGGGCCCTCCGGGGGGCACAGAGTCTGTGCACAGCTTCTACCACGCCGACTGTCACCTGGAGCCGGTGCACTGCCAGGCACCCCCTCCCAGGTCACCATCGGAGGCGTCAGCCAGGACGAGGGGCAGTGGGAAGGTGTACCCCACCGTGCACACCAGCTCGCCGCCAGAGGTGCCAAAGGAGAAGGCGCTGGTCGAGGTGGCTCCCCATGCTGGGCCGGCCACCCTCACCAGCCTCAACATCCCCCCAGGGCCCTACAGCTCCATGCACAAGCTGCTGGAGACGCAGAGCACAGGTGCCTGCCAAAGCTCCTGCAAGATCTCCAGCCCGTGTCTGAAGGCAGACAGCGGGGCCTGTGGCCCAGACAGCTGCCCCTACTGTGCCCGGGCAGGGGAGGTGGAGCTTGCCGACCGAGAGGTGCCGGACTCTGACAGTGAGGCGGTTTATGAGTTCACGCAGGATGCTCAGCATGGTGACCCCCGGGACCCTCGACGCAGCCTGGGGCTGGCTGTAGGGCCCAGCTCTGTGCTGGCCTTCTGGAGACTGATCTGCGACACCTTCCGGAAGATCGTGGACAGCAAGTACTTTGGCAGGGGCATCATGATTGCTATCCTGG
TCAACACGCTCAGCATGGGCATTGAGTACCACGAGCAGCCTGAGGAGCTCACCAATGCCCTGGAGATCAGCAACATCGTCTTTACCAGCCTCTTTGCCCTGGAGATGCTGCTGAAGCTGCTGGTGTACGGGCCCTTTGGCTACATCAAGAATCCCTACAACATCTTTGACGGGGTCATTGTTGTCATCAGCGTGTGGGAGATCGTGGGCCAGCAGGGGGGTGGCCTGTCGGTGCTGCGGACCTTCCGCCTTATGCGGGTGCTGAAGCTGGTGCGCTTCCTGCCGGCGCTGCAGCGGCAGCTCGTGGTGCTCATGAAGACCATGGACAACGTGGCCACCTTCTGCATGCTGCTCATGCTCTTCATCTTCATCTTCAGCATCCTGGGCATGCACCTGTTCGGCTGCAAATTTGCTTCTGAGCGGGACGGGGACACGCTGCCAGACCGGAAGAATTTTGACTCCCTGCTCTGGGCCATCGTCACAGTCTTCCAGATCCTGACCCAGGAGGACTGGAACAAGGTCCTCTACAATGGGATGGCCTCCACATCCTCCTGGGCCGCCCTTTACTTCATCGCCCTCATGACCTTTGGCAACTACGTGCTCTTCAACCTGCTGGTGGCCATCCTGGTGGAGGGCTTCCAGGCGGAGGAAATCAGCAAACGGGAAGATGCGAGTGGACAGTTGAGCTGTATTCAGCTGCCTGTCGACTCCCAGGGGGGAGATGCCACCAAGTCCGAGTCCGAGCCTGATTTCTTCTCGCCCAGCCTGGACGGCGATGGGGACAGGAAGAAACGCTGGGCCTTGGTGTCCCTAGGAGAGCACCCGGAGCTGCAGAGGAGCCTACTCCCTCCTCTGATCATCCACACGGCCGCCACCCCCATGTCACTGCCCAAGAGCTCCAGCACGGGCCTGGGGGAGCAACTGGGCCCCGCCTCCCGCCGCACCAGCAGCTGCTGGTCTGCAGAGCCTGGGGCAGCCCATGAGATGAAGTCACCGCCGAGCGCCCGCAGCTCCCCACACAGCCCCTGGAGTGCCGCCAGCAGCTGGGCCAGCAGGCGTTCCAGTCGAAACAGCCTGGGCCGTGCCCCCAGCCTGAAACGCAGGAGCCCTAGTGGGGAGCGGCGGTCCCTGTTGTCTGGCAAGGGCCGGGAGAGCCAGGATGAGGACAGCTCGGAAGAGGAGCGGGCCAGCCGGGTGGGCAGTGCCCGGCACCCTGGGGGCTCCCTGGAGCAGGAAGCCAAGGGATCTTTCGACCTGCCGGATACCCTGCAGGTGCCCGGGCTGCACCGCACGGCCAGCGGCCGCAGCTCGGCCTCGGAGCACCAGGACTGCAATGGCAGGTCGACCCCAGGGCGCCTGGCCCGGGCCTCACACCCAGACGAGCCTCCACTAGATGGGGATGACGCTGATGACGAGGGCAACCTGAGCAAAGGGGAACGGATGCGGGCGTGGATCCGAGCCCGGCTCCCTTCCTGCTGCCGTGAGCGGGACGCCTGGTCAGCCTACATCTTCCCTCCACAGTCAAAATTCCGTCTCCTGTGCCACCGGATCATCACCCACAAGATGTTTGACCATGTCGTCCTCGTCATCATCTTCCTCAACTGCATCACCATCGCCATGGAGCGCCCCAAAATCGACCCCCACAGTGCCGAACGCATCTTCCTGACTCTCTCTAATTACATCTTCACCGCCGTCTTCCTGGCCGAGATGACAGTGAAGGTGGTGGCGCTGGGCTGGTGCTTCGGGGAGCAGGCGTACCTGCGCAGCAGCTGGAACGTGCTGGACGGGCTGCTGGTGCTCATCTCCGTCATCGACATCCTGGTGTCCATGGTCTCCAACAGTGGCACCAAGATCCTGGGCATGCTGCGGGTGCTGCGTCTGCTGCGCACCCTGCGCCCACTCAGGGTTATCAGCCGGGCGCAGGGGCTGAAACTGGTGGTGGAGACGCTGATGTCCTCCCTGAAGCCCATCGGCAACATCGTGGTCATCTGCTGTGCCTTC
TTCATCATTTTTGGCATCCTAGGGGTGCAGCTCTTCAAAGGGAAGTTCTTCGTGTGCCAGGGCGAGGACACCAGGAACATCACCAACAAGTCCGACTGTGCCGAGGCCAGTTACCGGTGGGTCCGGCACAAGTACAACTTCGACAACCTCGGCCAGGCCCTGATGTCGCTGTTCGTGCTGGCTTCCAAGGACGGCTGGGTGGACATCATGTATGATGGGCTGGATGCTGTGGGCGTGGACCAGCAGCCCATCATGAACCACAACCCCTGGATGCTGCTCTACTTCATTTCCTTCCTGCTCATCGTGGCCTTCTTTGTGCTGAACATGTTCGTGGGTGTGGTGGTGGAGAACTTCCACAAGTGCCGGCAGCACCAGGAGGTGGAGGAGGCGCGGCGGCGGGAGGAGAAGCGGCTGCGGAGACTGGAGAAGAGGAGAAGGAATCTAATGCTGGACGGGGTAATTGCTTCCGGCCGCTCAGCCAGCGCGGCACCAGAAGCCCAGTGCAAGCCCTACTACTCGGACTACTCCCGCTTCCGGCTGCTCGTCCACCACCTGTGCACCACCCACTACCTGGACCTCTTCATCACAGGCGTCATTGGCCTGAATGTGGTCACCATGGCTATGGAGCACTACCAGCAGCCCCAGGTCCTGGACGAGGCTCTGAAGATCTGCAATTACATCTTCACCGTCGTCTTTGTCTTGGAGTCGGTGTTCAAGCTCGTGGCCTTTGGCTTCCGCCGCTTCTTCCAAGACAGGTGGAACCAGCTGGACCTGGCTATCGTGCTGCTGTCCATCATGGGCATCACGCTGGAGGAGATCGAGGTCAATGCCTCGCTGCCCATCAACCCCACCATCATCCGCATCATGAGGGTCCTGCGTATCGCCCGAGTGCTGAAGCTGCTGAAGATGGCTGTGGGCATGCGGGCGCTGCTGGACACGGTGATGCAGGCCCTGCCCCAGGTGGGGAACCTGGGACTTCTCTTCATGTTGTTGTTTTTCATCTTTGCAGCTCTGGGCGTGGAGCTCTTTGGAGACCTGGAGTGTGATGAGACACACCCGTGTGAGGGTCTGGGCCGGCATGCCACCTTCCGGAACTTCGGCATGGCCTTCCTGACCCTCTTCCGCGTCTCCACTGGCGACAACTGGAACGGCATCATGAAGGACACCCTGCGAGACTGCGACCAGGAGTCCACCTGCTACAACACGGTCATCTCCCCCATCTACTTCGTGTCCTTCGTGCTGACCGCCCAGTTCGTGCTGGTCAACGTGGTGATCGCCGTCCTGATGAAGCACCTGGAGGAGAGCAACAAGGAGGCCAAGGAGGAGGCCGAGCTGGAGGCCGAGCTGGAGCTGAAGACACTCAGCCCACAGCCCCACTCGCCGCTGGGCAGCCCCTTCCTCTGGCCTGGGGTCGAGGGCTCCGACAGCCCCAAGCTGGGGCCCCTGCACCCTGCAGCCCACTCCAGGGCAGCCTCCCGCTTCTCCCTCGATCACCCCACGATGGAGTCCCAGGCTACTGAGGTGCCGGTCACCCTGGGACCAGACCTGCTGACCGTCCGAAAGTCTGGGGTCAGCCGCACGCACTCCCTGCCCAACGACAGCTACATGTGCCGGGATGGGAGCACTACTGCGGAGTCCCCTGGGCGCAGGCCCTGGGGCCTCCCCAAAGCTCAGTCAGGCTCCATCTTGTCTGTGCACTCCCAGCCTGCGGGGTCCAGCTACATCCTGCAGCTGTCGAGAGATGGGGCCCATCTGCTACATCCCCATAGCGTACCCCCCTGGGGCGCCATCCCCAAACTTCCCCCACCGGCCCGCTCCCCGTTGGCTCAACGGCCACTCAGGCGCCAGGCAGCAATAAGGACTGACTCCCTGGATGTGCAGGGCCTGGGCAGCAGGGAAGACCTGCTGTCAGAGGTGAGTGGGCCCTCCCCGCCGCTGGCCCGGGCCGCCTCTTTCTGGGGCCAGACAAGCATCCTGTTGCAGCAGCAAGCCCAAGCCTG
CAGCCAGATCTCGAAGCACACACCACCTCTAGTCCCCCATCCAGGCCCAGAGCCCACCCGGGCCAGGGTCCCCCGAGAAACCAGCAGCAGCTTGGAGCTGGACACGGAGCTGAGCTGGCTTTCCGGGGACCTCCTGCCAGCGGGCAGCCAGGAGGAGCCCCCCTCACTTCGGGACCTGAAGAAGTGCTACAGCGTGGAGACCCAGAGCTGCCGCCACCTGCCGGCCTCCTGGTTGGACGAGCAGAGGAGGCACTCTATAGCCGTCAGCTGTCTGGACAGCGGCTCCCAGCCCCACCTGGGCCCCAGCCCCACCAGCTTTGGGGCCCAGCCTCTTGGGGCACCAGGGAGCCGGCCCAAGAAAAAACTCAGCCCACCCAGTATCTCCATAGACCCTCCAGAGGGCCAGGGCTCTCGGCCCCCACCCAGCCCTGGCGTCTGTCTCCGGCGTAGGGCTCCGTCCACCGACCCCAAGGACCCCTCGGCCTCGGGCCCCCCCGACAGCATGGCTGCCTCGCCCCCCACAAAGAAAGACGTGCTGAGTCTCTCTGGTTTAGCCTCTGACCCAACAGACCCGGACCCCTGAGTCCTGCGCCCACTCTCCCTTCCTCCACTGGGGGCCAAGTCCTAGCTCCCCCTCCTGGGCTGGTGCCCTGAAAATGTCCACACAGACACGGAGGCGCCCCTCCTCGCCTCAGTGATGCTGGGCCACGCCACACAGGAGTTCCACCCTGGGCCGCCGAGCCAGGGCACAGAGAGGCCCCATGCCGCCGAGGTTCCCGACACCAGGACTTGCTGGGAGAAAGCAATACGTTTGTGCAGAATCTCTATGTATATTCTATTTTATTAAATTAATTGAATCTA\n>XM_020899216.1 PREDICTED: Odocoileus virginianus texanus LCA5, lebercilin (LCA5), transcript variant X2, mRNA \nGCGGAGAGAAGGCAAGGCGGCGGGCGCCGCGTCGGCGCTGAGGAGGGGCCGGAGCGGGTTGGAGAGGAAAAAAGTGTATCTTCTGGTTGCTATTGTGAATTGTGGACTAAAGGTACATAGAGAAAACGGATTGCACAGACTTGAATATTATCCCCAGGATCTGAAGACTCAAAATTGCTCTTCAGGCTTATTTTGGATTTTTCTGAGAAGACTCTGTGAAATTATGTGAATAGAGACTATTTTTCAAAGCCATGGGGGAAAGAGAAAGAAGTCCAGTTACTGATCGAGAAAGTAAGACAAGCAGACCCTATTACTCTTACTGTTCATCTGAATTTGGAACTACTCCACAGTCTTCTGGCCGGTCGTCGCTGGTGCATCCCTCCCCACCTGCAAGTGTTAAGGAAAAACATCCTAAGAAACAAATTTCAGATAGCCAAGTGCATCATCACGCCCCTAGGAAACCAAGCCCTAAGGGTTCACCAAACAGAAAGAGAGTCAGAGCAGGATTTCGCTCCCAGAGCCTCAATAGGGAGCCCCTTCGGAAAGATCCTGATCTTGTTACAAAACGGGTTCTTTCTGCAAGACTGCTAAAAATCAATGAATTGCAGAATGAAGTAACTGAACTCCAGGTCAAGATAGCCGAGCTGCTAAAAGAAAATAAGGCTTTGAAAAGGCTTCAGTACAGGCAGGAGAAAGCCCTGAATAAGTTTGAAGACACAGAAAATGAAATCTCACAACTTATTGCTCGTCATAACAATGAGATTACAGCACTCAAAGACCGCTTAAGAAAATCTCAAGAGAAAGAACGGGCAACTGAAAAAAGGGTGAGAGAGACAGAAGGTGAACTGCTTAGGACAAAAGTTTCCTTACAGAAACTGAAAACGATCTCTGAAGCTAAACACCTACCTGAACGAGATGATTTAGCAAAGAAACTCTCTTCTGCAGAGTTAAAATTAGATGACACTGAGAGAAGAATTAAGGAATTATCAAGAAACCTTGAGCTAAGTAGTAACAGTTTCCAACG
ACAGTTGCTTGCTGAAAGGAAAAGGACATGTGAGGCTCATGATGAAAATAAACTTCTTCAAAAAGAACTACAAGGACTATATGACAAATTAAAGGAAAAGGAGAGAGAACTGGACATAAAAAACATATATTCTAATCGTCTGCCAAAGACTTCTCCAAAGAAAGAAAAAGAATTTACATCAAGAAAAAATGCTGCATGCCAGAGTGATTTTACAAACCAGTGTACAAAAGGAGTACAAACCAGTGAAGACTTCAAGCTGGAGGACTATCCTATAACACCACAGACAGTTATGTGTTATGAAAACAAAAGGGAAGAACCCGAACGTCTTTCTTTGGATCTGGAATCTCAAAAGAGAGATAATCTTGGAGAAGCTGGGATTCTAAACCCAACTGTGGAAAGAGAAGACAAATTTGCTAAAGATCAAGGACTCCATGTTGTGAAACAGGATGTTGAGAAGCTGGATAATGGGTGGGAAAGAGAAGAACTTGCTAAAAAGCCAAAGGAAAAGACATCTTTGTTGGAGAGAGAAGGAAAGCCAGTGTTGGAAACTGGAAGATATCAAGTGGAAATGCACCAAGTTCAGAAAATTGATAAACTGGAAGAAGAGGAAGAAGAAAGGCTAAAAGAAATGCTACTTGCTAAACTGAATGAAATCAACAGAGAACAAGACTCTCAGAATGTAAAATATCCTTCTCTGCCATTGCTTCCTGACGTGAAGCCAAAACTGCATTCCCCAGAGAGAAACCCCAGAACACACACGTCCTCTGGATCCTCAGAGAGATTATTTAACGGGCATTATTTGCAAGACCTCAGTCTTTCAACAACGAAAGGAGATGGTCAGAATCCAGGCCATACTCGAAGCCCAGCCTCTCCAGATGAGCTTGTGTTTGGTAGCTATGTGCCTTCATTTGCAAAAACATCAGCGAGGTCAAATCCACTTAGCCAAAAAAGTGACCTTTTGGGTTTCTCAGGAAATAATACAGAGAAATTTAGTAAAGACAGTGTAGATTCAATTACCAGACAAGAAAGAAAAGCCACCCTGATGGAACAGCTGTTTGGTACCAGTGGTGGCAGCAGCCTTTCCTCTAAAAGCAGTGACCCAAATTCTCTGGCTGTCACTAAAGAAGACTGTGACCCTCTAAATTATCTCCCTGGGGATAAAAACAGCTGGGGTAGGGAACATAGTGATGATGATGACTTTTTCCTCAGCGAAGGAAGAAGTTTTAATCCAAGTAGACACCGATTAAGACATGCAAACAGTAAACCAGCAGTAAAAGTAGTTGATTCTGTAGAAGATGAAATTGAAGAAGTAGTGCTGAGATGACTGACTAGAATGTTTTTTTCCAATTGTAATTATTAGGATATTTTAATACAGTATTTATTATGAACATTTAGACTTTCTAATATTAAAAAGTCATCATTAACGGATAATTTTTAGTATATAAATACAGTGAAAAGTAGCTGATACCACTAGTAGCTACACACATGTAGCTAGTTTGCTAATAAGGAAGGAGGCTCTTTTGAATGAAACCAGAAATAGAGATGTATCTTACTTTCTTTGTGCAAATAAAGATGTATCTCACTTCCTTTTTGCAAATAGGTTTTACCTCTTGAATCAACTCTATGAGGAGTTTTACTCCATTGGCATACACATTCATTTTCTGTGTTATCCCTATTATTTTTGGTCTTATCCTCACTGAGCTAAGTACAGTTTTCCCGCTGATGGTTGTGTGGAAATGGAGAGATGCTGTAGGGAGCTGGTGCTACTAGGAACCTCTCCACTGTGACTAGGAGTGAAGGGGGTCCCTTTCTTATATGCCAAGACTGAGCTACTCTTAAGTGGAAACAGTGACAACGTGAGAATTTCCCATTCTTCTGGAAGTAACCACAGTTAAATGGTACTGATTTCGCAGTGACAGAGTCTGATTATATCACTTACCTACAGCTGTGCTAACTCATTAGGCTGAATTCCGAAGACGTCTTTCTGTTGGCATGAACAG
TGCCCTCCCTGTCCTGGCTTCCAGAGGTTCCAGTGCAGTGTAATCGGTAATTCCTCTCCTTGAACTCCTAATGCTATCTGTATCTCAGTGACTGGTTGTGAGAGGTCATACCAAATGCACAGAATGGAAGAAATTTCACCCCACTAGAGCAGGATTTTCAACTCAATTATGATTCCAGAGTAACATAACTTGGAAATTTTAATATGTACTTTAAGATTTGAACTTACTGTCAAACCAAAGAGACAATGATCACATGATACCATTGGACTTAAGCGGACTAGTTTTAAAGCAGCCTTGGTGAAAAGTGTTTTACAGATGGAGCTCCTCCCTTGCTGAGTAGGGTGGAAGATGTTCTGTTGAAAAGTGTTAGTTTTTTTGCTGTTTCATAGCTCACTTCAGCTCCAGAGAGGAGTCAGGGACCTTGGATTATGCTGGGCATGAGTGGTCTCTAAGAAGCAGAAATATGCCAGTGGCCTAGGAGAAAACTCAGTGCAAATGAAGAGTGGTGGGAACAGTGTATCAGGGCAAGAATAAGTGGTGATTGGCACTTGTTCTGAAATGAACTGTTGTTTTCTAGAATTTGCTACATATTTGTTCATAGTAGGATTTCTGATGCCAGGCATACATACTGATCAGGGGATTCGAGTTACTATCTTGAGTTCTTATAAATGCTAATTATTGAATATAATTTCATAATTATCTGACAAGACTTACTGGTTAGGTCTCTAATTACAAGATGTACTACCTACATCTTCTAAATTGTGTTCCTGTTACCTACTAGGAACCGAATCTCTCAAAAGTGCTAAACTATATCAAATTTTTTTATAAAGAGATTTTTGGATTGATATAAATAAGCATTTACTATGTTGTAAGTCATTCTAATATATGTAAACCACAATATTTTTGTAATGCAGTTCTTGATAAAATATTATATATTAATTTTTTTCATAGCTGCTAATTTTTCAGCCAAAAGTATTCTCATTTTTAGGCTGTTTTTGTATTAAAGGTTTTTTTCTTTCAAAAGTCCTTTAGTAAAGTTTTAAATTCAGATCATTTTAATTAGTCTCTTTTTTCTACTTGATGTTTTCCAATCTTTTTAAACAGATGTAATAACACAGAATTGTTAAAATTAAATCTAAAATTAAGTTATAGACTTGAAGCATTATGGAGTTAAGCATTAAAATTGGAGACTAAAATGTACAGAACAAGTTATTCTTTATGAACAAACCTTAATGGATAACTTTTTTTTCTAAATGTCAAGTTAAATTTATCTGTACTCCAAACTATTACTAATAAAAATTTAAAATA\n>XM_045922658.1 PREDICTED: Maniola jurtina cleavage and polyadenylation specificity factor subunit 6 (LOC123876410), transcript variant X5, mRNA 
\nGGTCACACTGGTACTACACTTTTCTTCAATTCGCAAAATGGCGGATGGAGGCGTGGATATAGATTTGTACGCCGACGATATTGAATCTGATTTTAATAGACAGGATGACTTTGGAGGTGAAAATGTCGATTTGTACGACGACGTGATCGCAGCCCCGTCGAAGCCCGAAGACGGCGACGGGCCACCCAACTCCGGACCGCCGCAGCATCAGCATCCACCGGAGGAAACCAACGGTTCAGTTCCGTACCACCACAACACCGTATCAAGCCACGGCCATCATGGCCGCCGCTTCCAACTTTACATCGGCAACCTCACCTGGTGGGCGACTGATCAAGACATAGCTAACGCGGTCGCCGATATCGGCGTAACGGACTTTCAAGACGTGAAGTTCTTCGAGAACAGGGCAAATGGACAGTCGAAAGGATTCTGCGTCATATCGCTGGGTTCCGACCAATCCACCAGGATGGTCCTCGATCGACTGTCCAAGAAGGAGATTCACGGTCAGCATCCCGTTGTGACGCTGCCAACTAAACAGGCGTTGAATCAGTTTGAGAGTCAGTCGAAGACAAGGTCAACACCGCCCGGACCCAACAACCCCGGTATGAGAGGTCCTCACCCTGGGGGCATGCCTGGCCCACACCCTGGAGAATTCTTTGGTGGCGGACCAAATGGACCGGGACCAAATGGCCCACGCATGATGATGCCTGGGCCAGGCCCCCATCATCAGCTTCGTGGGCCCCCACCCGGACCCCATGGCCCCCCACCGCACCACATGCAGCAGCACCAAGGCCCCCCACCGCACCATATGCCGCCTCATCAGGGCCCGCCCCCGCACCAGGGGCCCCCACAACACAGGCCACCGATGCAGTTCCAAGGGCCGCCGCAGATGCAACGCGCCCCCGGAGGCCCTCCAGGAGGCCCGCGAGGGGGCCCTGACTGGCCCAGGCCCCACCACATGCAGGCCCCAGCTCCACAATACGGACCCCCGCAACACCAAATGCCGCACCAAATGCCCCCGCCGTCACCGCATGGGCCGCCCGGGCAAGGCATGCCGCCGCCTCACCATCAGATGCCGCCGCACCAGCAGGGCCCGCCCAGGGGACCCGCGCCGATGCCGCAACATCCAGGCGGGGCTCCAGCGCCGCACGTGAACCCGGCGTTCTTCAACCAGCAGCCGCCCGTGCAGCCCGCGCCCGCAGTGCAGCCGCCGCCGCAGCCCGCGCCGCCCGGACCAGGCGCGCCCTACGGCCACCCGGCGCACGGAGGCCCGCCGCCCGCACAGGGCCCGCCGCCCGGCGCGCGCCAGCCGTACGGAAGACCACCTGCAAGCTACCCCGGCGGTGCCGAGGCGCGGCCCGCGCACCACCCTTCGCCGCTGGGCCCGCACGCGCCCCCGCACGCGGCGCACCCCACGCACCCCGCGCACCCGCCGCACCCCGTCATCAGTGAGGCGGAGTTCGAGGAGGTGATGGGCCGCAACCGCACCGTGTCGTCCAGCGCCATCGCGCGCGCCGTCAGCGACGCGGCCGCGGGCGAGTACGCGTCCGCTATCGAGACGCTGGTCACCGCCATCTCGCTCATCAAGCAGAGCAAGGTGGCACATGATGACAGATGCAAGATTCTCATCTCCTCACTCCAAGACACATTGCACGGCGTAGAGACCAAGTCGTACGGGGGAGAGAGACGGCGGTCGCGGTCGAGGGAGAGGGATGCGCGCGTGCACCACCGCGCGCCGCGTCGCAGGGAGCGTTCCGCGTCGCGCTACAGGGACAGGTCGCGTGACAGGGAAGAGCGAGACAGGTATTACAGGGACTATCGTGAGAGGGAACGCGACCGCTCAAGGTCCAGGGACCGCGAGCGTGCAGAGCACTACAACAGGGGACACAGCCGGACGGAAGAGAGGCCTCGCAAGTCGCCCGTAGAGCCAGCGGTGGAGAGTGGCGCCGGAGATACAAGCACGAGCAAAAGTCGTACAGCGGCGACGCCCTACTACGACGA
GCGGTACCGCGAACGCCGCGAACGCGACCCTCCCACCGCGGACCGCGAGCGCGACCGCGAACGCGACCACCGCCGGGACGCTAGGCATTAAATGACTAATAAACTAAAACTAGACCATACCATAGTCTAAATAAAGTACAGTACTACCACTTTCAGAAGTAACGCTGATGTACATTCAAAGGCCGTAATTTGTTTAGCACCTTAATGATCATATTCGCGTGGCAAGGTTATGCACATGCGTTAGGTGTGTGTAGCGTGTTTATAGAAAAAAGCCATAAGTGCGACAGGTTTTTGATGCAATAGTTTCGCGGAATTGCTACTCGAATTCTGAGGCCGACCGTACCTACGCAGATATTATATTATATATTATGTATGTGACATTGCCATTACGGGATAGTGGGAGCAAAATTCTATTTTGTTATTCTGGGACTTTGAACTTTCTCTCTTCTGATTGGTCCACAAACATTCGTATGTCTTGTTTTTGCTCATAGGTAGTGATGTAAAATAGTGCCACTCGGGGCCAAAATTTTATGTTTAAGGGCGACGTATATCAATTCCTCTCTCATAACCCCATGTTGATTCCACAGTTTGTATGTGCGTGGAAAAAAGGATCTGGCACAACGGGCGGTCGAAGTCACCAGGCACCCAGGTGGTTAGGGTGAA\n>XM_034343108.1 PREDICTED: Prunus dulcis protein DECREASED SIZE EXCLUSION LIMIT 1 (LOC117614330), transcript variant X3, mRNA \nCACCCTCACACCACTAGTACTCTGATACAAGTCTGTCTACATCTACATCCTCTCTCTGTGTGTCTGATGAGAGAGCACAAAAAGTTGAAAATTATTCTTCTATCTGACTATTTTCCCCTTGCACGGGTTATCATCGTCTTCCGCGAAAAACAGGGTTTCTCCAAACTCTTTCAGTCTCTCGCCGTCTCTGAATCGGTTTGTGTGTTGACCAGAGGACGAAGTCAATTTTAAGTTCGTTCTTCTGTCTTGACTAGTCCAATGGAACGTTGGTTTAGTACAATCTGTAATAGCACCTCCTCTTGAATAAGTCGTAAGAATAACACGAAGAAACCCCTTTCAACCCCGTCGGGTCGTGTACTCAGCACCTCCCTCTAGTGCTATAGCGGCAGTCTGTGACTCTGTCTGTGACTGCCGCATTGCTTATTGAAGAAGCAGGTCCAATGAGCAAACAGAGACTGCCACCGGACCCAGTGGCTGTGCTGAGAGGTCACCGCGCCTCTGTCATGGACCTCTGTTTTCATCCATCCCAACCTCTCCTATGCACCGGTTCCGCAGACGGCGAGTTGCGGATTTGGGACACTATCCAGCATCGGACTATATTATCAGCAGGGGTGCATAATGCTGCACAGGGGATTGCTTCTGTTGCTTGTAGTTCTTCAATTGGAGCCAATAAAGTGATCAGCCAGGGTAGGGATGGAACAGTGAAGTGTTGGGATATTGAAGATGGAGGTCTGTCCAGGACACCTTCTGTTACAATCAAGACAAACTCTTACCACTTTTGTAAACTTTCCTTGGTGAAGAGACCTCATTCTAGTTCTAAGCGAGTTTACGGGACTACGCATAATGACAGTGATGAAACAAGGGTTACGGAGAATGCTGATACGGATGCTCTAGACAATAGCAGAGAAAAGTTTCAAGAGTATCTGCCTGAGCAGTCCAGCACCTTTGAAGAAAATACTCAAGTTGAGGGATCTAAATGTGTCGCTGTAGCAGGGGAGCAGCCTTCTGAGGTTGAGATTTGGGATCTTAATACTGCAGAAAGGTTTGCACGGCTACCTCAAAGCTGCGTTGCTGGTTTCTCAGGTATATCTACCACAGAGAGAGGAATGTGCATGGCGGTTCAAGCATTCTCACCATCCGAATCACAGGGATTCCTAAATGTCTTGGTGGGTTATGAGGATGGTTCCATGCTTTGGTGGGATATTAG
AAATCCTGGGGTTCCATTGACCTCTGTCAAGTTTCATTCAGAGCCAGTTCTAAGTCTATGCGTTGATGGGTCATGCAATGGTGGTGTCTCAGGAGCCGCAGATGACAAAGTTGTGCTGTACAGTTTGGATCATTCCATGGGTACATGTGTGATCAAGAAAGAAATTAGTTTGGAACGACCTGGCATATCGAGCACTTCTATTCGACCTGATGGTAAAATTTTTGCAACAGCTGGCTGGGACCACAGAGTGAGAGTATATAACTATTGCAAAGGCAATGCTCTGGCGATATTGAAGTATCACCATGCAACGTGTAATGCTGTTTCTTATTCACCCGATTGCAAGCTAATGGCATCTGCATCAGAAGATACGACAGTGGCACTGTGGGAACTTTATCCTCCTCGAACTTGAAATGATATGGTAGTCCTGAAGTGGAAATGAGTTTGTGTTCCCTATAATGTAATAAAAGAGCATCAATAATCAATATCATTACCGTTTGTGTGCATAAGGTTAGATTAAATTCATTTAAATTATGGATTATTGCTTCTTTAGGAAAAAGATAAGATGTTAGACCTTCAATTTAGCAATAAGAGAAGATGTTACTCGCCTACAAGAACCGTGTGCTGGGATGAAATATGTGTTCTCCTTGTGTAATTTTCAGTTGTTTCAGACAAAGCCTAAGAAAAAATCGACATTTTGGACTGTTATGTAATTTGATGGCTGCCTGCAGGTTTGTAATTGAAAAACAGAACCAAACTCGCAGGCTTTCAGACGCAAAAGAGAGGGCCAAGTCGCGTTGATTTGATTTGGACATTTAGTTTGGTGGCCAGCCTCCAATCCAATGGTATCGAATAGAGGTGCCACATTCTTAGCCTCTGATCTACAAAGCAATGATTGGCTTGGCTATGCCGGGGATTATTGCTTCAAAGCTCCCAATTTGATCTCTCTTACTTTGCACTAGAAAAAGATGACCCGTTGTTGACTTTATCAATTACTCTTGAAATATTTTTCAATATAGCAGCCGGGGAAAGAAGTTGCACCTA\n>XM_035481792.1 Colletotrichum scovillei uncharacterized protein (HER10_EVM0012396), partial mRNA 
\nCGGAAATTTAGATCATTGTAAAAACTGTTCGTTGAGTTGTTCTCGGGCGTTTTTTTCTTTTCTTTAAATAGCGTACAAGTCTCGCAACTCAAAGCGTCGGGCGCTCTTCCGTTGATCAATCGGAACGTGGCCAGAGACCAGACGATGTCGAGGGACGGGAACCCCGCAATTAGTTCATAAATCCTGTTCAGCCGCGGGCTAATTCCGATGAGCATTGCACACTCATTCGCAGACGACCCATATCACGATTATCGGGGCCATGGGATTTCGACAGCATGTCAGAGGGGAAGGTTCAAAGAGGTGCTGCTGAGTCTACTGGGGAAGTGCCCGCAAAGCAGCTCAAGGGCTGCGCCAACTGTGAGCGTCGTCGAATTCGCTGCGATCGACGGCGACCCCATTGCGCCAAGTGTGACAAGAAAAGACTTTCATGCCCTGGCTATGACCGCCGACTTCGATGGGTGGAAGGGGTTGCCGCGAGGGGACATCTGCGGGGTCGAACGGTCCCGACGAGGCCGTCTTCTGAAGATAAGGCCGCATTTCGAGAAGAGGACTCGAAAGACATCTTCACCGAAAGTCCACAGCTACACAAAATAAAAGACTTCACGACTTCGGTCGTCATTCTCAATGCGCCAACCGCCCAAGCAAGTCAAGCTTGCGAGTACCCCGACTCCCTGACAAGGGTGTTCATGGACTATTACAGACGGAACTTAGCCGGTCTGATGGTATGGATGGACTCAGACCAAAACCATTACCGTACACAGGTTGTTCCTCTGGCCGCGAATCAACCAGCGATCGGCTTCGCCATCATGGCTTTCGCGGCTCAACACGGCGCCATGGCGTTGCCTGATGAATCTATCGCTGAGACTGCTCGCGATAGGTGCTTGCACCTGATACAAACCCGCGCTCAGGATATGACGGCACGGCTTATCGAGGGCGATGACTTGGACAATCATGGTGACTTGGCTGATGCGGAATGGATGCTGGCCTCGATTCTCATCATGTGCAACTACGAGAATGCCCGTCGCCGCCTTCAAATCGCCGATGATCACAGGCGCGCGGCAAGGACGATTGTCAACCTTTTCAAAAGCCAGAAGTCAATCAACAACCGAGATCTGTTTGCGTTCTTGCGAAACCAACTAGCTATAGATGATGTACTGGCAGCTACGACATCGTGCGACCTGCCTCTCATTCGGAGCGCCGTCACGCCAGCACCTGGCTCAGATTATCTCCTCTTTTCGAGATATCTGACTTTTTTGCACCGTGTCACGCTCATTTCGGCAGATGCTGTTGATTCTTATCCTTCAATCTCGCGCTTACGCAGCGGCCTCACGGTGCCTCTCATCCAATCCGAGTTTGAGCAGGCAAGAGGCGCCACGCTGATGGCAGCCGGACGACTCGGACTGGCAGGATCAAGCATGTCTCGTGACTTCATACGCTTAGTCGAGGTTTATCATAACGCGGGGTTGCTTTACTCGTTAAGATGCCTCGACTACGCCATCGAGCACGCCTCGGAGCGCCTTGTGGCCGCTGCTAGTCTGTTCGACCAACTGACCGAATTGGAAGACCTAGCTGCTTTCGTTCAGAATCTAGCCTGGCCGACGTTCATTGCCGGTACCGAATGCCATGGAGATCGGCATCGACAAGATATCATTGCGGGTTTGCTCACGGCAATTCATGAGGGCACGCGCTTCAGTTATTACTTGGACGCGGTGAACTTTCTCAAGGAGTTTTGGGCCGGAGAAGACAACGACTGGCGTCCTCTCGCTCGCATGAGAGAAGCCATAGGGCAGCGAGTCCTTGTGGTATGA\n>XM_006964907.1 Trichoderma reesei QM6a uncharacterized protein (TRIREDRAFT_61223), partial mRNA 
\nATGGAGACGTACCACGGCTATGTACGGACTCCAGCTGATGCCATCAAACTGTTCGAAGCCTGTCGGCTAGGCCATCTGCCTCGGGTCCAGAGGCGACTCTCTGAAAAGGAGAGGCAGTCTATCAGATCCGGCTCAGTCTTTGTGTGGGACGAGCGCGAAGCAGGCATGCGGCGATGGACGGACGGCAAGTCTTGGAGTGCTAGCAGAGTGTCGGGCAGCTTCCTGACGTACCGCGAAATGGAGGGCAAGCGAGGAGGCGGCTTTGGAGGAAGCAGACGGGGCAACGGCAAGACGCCCGAATCTGGGCGCGGTAGCGACGAGGACCATGACGACGGCGAGCCGGAAGGATACCGATACAAGGCCGACGGCCTTATGAAGCAGTCGTTCAGCATCACCACGTCGACCGGCCAGCACCTCCACCTCATCTCGTACTACTCTCGGCCTCAGCCGGGGCAGCCCGAGCTGCCTCAGCCGACCAACGATCCGATGCTGCGATCCATCATCCCGATGAAGGGCATGTACCCGGAGTCCAGCATGGGCGAGACGAACCAGACGCCTGCACTGACGAGGGCGCCGATGCTGCAGCAGCCGCCTTACATGATTGCTCCTCAGCATCAGCACCACCACCCTCCTCACCCGGCGCATCATCAACCGCCGTTTGCGAGCCATTACCAGCCCGGGTATGGCTGGCCTCCGTCGCCAGTCGCGACCCCTCCGTACAGCCATTACACCTATAGCCATCCTCCTCCCGTCCACCATCTGCCTCATCCGTATGCCCCCCAAGGTCCGCCGCCGCCTCACCACGGCTATGCACCGCCTCCGCCTCCTCCGCCGCATCACTACCAACAACATGGCGCGCCTAGTCCCTACGACCGGCCTTCATTACCGCCTCTGCAAAACACGCCAAAGCCGGCCCCTCTGCCTCCGTACCATGGCCCGCAGCATTCCCAAGGACCGACGCCGCCCCGTGGCCACGAGTCTCCCCACCAGCCAACCTTGCAGGCTGCCGCGCAAGCCGCCATGGGCGATTCACGGACCCCGCCCGAGAAGAAGCCTCAGGGGCCTCTTCCAGCTCTGGGGACTGTTGCCAACGGGCCTCTTGTCTCTGCCCACAGCGGACTGCACACTCCTCCCACACGGACGCTGAGCCCGAGTCCGCCTCAAAGTTCCCATGTGGAGACGCATACTAGCACCAGCACCAGCAACAAAGCAAGCCTGTCCGCGCTGCTGCACCCCACGACGTCTTCCTCCACAGAGGCCGGTGCAAACGGCAGCGCTCACAGCAGCCCAAGGACGGCCAGTATCACCATGGCTGAAAAGGGAGGCGCCAGCGAAGACGCGCGAGCCCTGCGGATGCTTGACCGCAAGTTTTGCATCTAG\n>XM_032861574.1 PREDICTED: Lontra canadensis endothelin 1 (EDN1), mRNA 
\nTCAGACGGCGGGCGTCTGCCTCTGAAGTTAGCAGTGATTTCCTTTAGAGCCTGGCCTTATCTCCGGCCGCACGTTGCCTGTTGGTGACTAATAACACAATAACATTGTCTGGGGCTGGAATAAAGTTGGAGCTGTTTACCCCCACTCTATAGGGGTTCAATATAAAAAGGCGGCGGAGAGCTGTCCAAGTCAGACGCGCTTCTGCAGCGGCGCTGGGGCGAGCGCGCACAGGGTCCTCGGTCCGCGCTGCTGTCCCCGCACGCCACCGCCGCGTGCGCCCGCAGACCGCTCCCACTGCCGGCCCTCCTGGCAGAAACTTCTTTTTTCTCTCCGTTAAAGAGCACTTAGGCTGAAGGCTCACTTTGAGATCTGAATAACCAGAAGAGCTTTGAGGGACCCGAAGCTATTATTTTTCTTCGTTTTCCTTTGGGTTCAGTTGGCAGGGGAGGACTTTGATCCCCACTCCCTCCCCCCTTTTTTTTTCAGAATGGATTATTTCCCCATGATTTTCTCTCTGCTGTTTGTGGCTTTCCAAGGAGCTCCAGAAGCAGCGGTCCTGGGCGCGGAGCTCAGCACGGGCTTGGACAGCGGAGGGGAGAAGCCCGCCCCCAGTGCACCCTGGCGGGCCCGCCGGTCCAAGCGCTGCTCCTGCTCCTCCCTGATGGATAAAGAGTGCGTCTACTTCTGCCACCTCGACATCATCTGGGTCAACACTCCCGAGCACATTGTTCCCTATGGACTCGGAAGCCCTTCTAGGTCCAAACGATCCTTAAAGGATTTATTTACCACAAAGGCAACAGACCACAGGAAGAGATGTCAGTGTGCCAGCCAAAAAGACAAGAAGTGCTGGACTTTTTGCCAAGTGGGAAAAGAATTCAGGGACCAAGATGGTATGGAGAAGAGCTGGAATGACCCTAAGAAAGGCAAAGACTGTTTTGGGCTTGGAGAAAAGTGTGTTCATCAGCAGCTGGTGGCAGGAAGAAAAATGAAAAGGTTGGACGCCATCAGCAACCGCATCAAAACAGCTTTTCGTGTTGCAAAGCTGAAGGCGGGGATCTACACAGAGAGGCAAGTGACTCACAACCGAGCACACTGATGGCAGGTCACCAGGGCCCATGGCTGGCCCGCCCGAAAGCCTTCTCCTCCGAGGAGGGAACCCTGTGGCTGATTCTGCACTCTCTCCCCATGGCTGGGATCAGAGCAACAGCATCCTCCCTGCTTTGACCGACCATTTCTTGCTCCAACTGGCAATGGACCAGTGCCCTCGCTCTAAACATTCCAGGGAAGGTTAAGGAGTCCCCCAATCCATCTTCATTTGCCTCCATTGGTGATAACTGCTTTCGTCTCTCCTCGTTTGGGGTGACAAGAGACTACTCAGAAGGCAGAGAGACACACAGTGACTTGTGATTTCGGGTGTCACCATCCAGAGGGAGGACAGGAGATTCCACACATGGTGGAATTTCTGAAGAGGGTCCGAAGGGAGTGTTTGTGTCTCACTCAGGCGCCTGGCACATTTCAGGGAGAAACTCCAAAGTCCATGCAAAGATTTTCTAAGGAATGCACAAATTAAAAACACTCTCGAAGGACACTCAAGTTAAAAAAAAAGAAAGAAAGAAAGAAAGAAAAAGACTTTTTTTTCTTTTTAAATTCACAAAATGCAAAACTAAAAGATACTGCTACTACTGTAAATCAGGATGGGTTTGATGAATCTGAGTCTACCTCACCTCTATTGCACTCTGGTAGAAGTACTCCCCCCCGCCAAAAAAAGAAGTACTTCCCCACCATTAACTATATCCCCCCC\n>XM_030076989.1 PREDICTED: Myripristis murdjan Ras and Rab interactor 1 (rin1), mRNA 
\nATGCAGGAGGTGGGCTGCTCCCAGCAAGGCTCCCAGAGGGCCTTCAGCGTCTTGGACCGTCTGCTCCTCACACACCCCGTCTGGCTGCAGCTGTCACTCAACCAAGACTCCGCCCTCTACATCCTGCTGAGAGAGCCGGTCGGGACGTTCTTGGTGCGTAAATGCAGCTCCACTCAGAGAAAGGTGCTGTGTTTGAGAGTGACAGCGGACCGAAGTGCCTCCTCTGTGAAGGAGTGCTTCATCTGTGAGGAGGACTCCACTTTTGCCTTGGAGAGCTCTGCGCTCAGCTTCCCTGATTTGTGTCGATTGGTGGCCTTCTACTGTATCAGCAGGGATGTGTTGCCGTTCCCGTTGCAGCTACCGGATGCCATCGCTAAAGCCACGTCCCACAGGCAGCTGGAGGCCATCTCACATATGGGACAAGAGTTTTGGAGCCCGCCCACTGCCTCAGAGATGCTGAACGGACCAGTGGACCAGTTGGCATCGACCAGTCAGGACCAGGCGGCGCTGACCCAGGACCTGTGCAACCTGATGGCCCGAGGCAGATACAGCAAACTGTGCTTCATAAACCCCCTCTTCATGCAACTGGAGCAGCCACAACATTCAAACCACGGTGCCTCCAGTAAACGGCACCGCTTAAAACGCAGCATGAGGCTCCGGCTCTCCAACGAATGCTCCATGAATCTGTCTCTGGAGGGCGTCGGCTCCTTCTCGCCTCCCTCCTCCTTGGAGGTGCCCGGCGGTGGAGAGAGGCTGCAGAAGGCCAGTCCTAACCCACAGAGAAGAGTTCATCCCGGGGCAGGGGTCTTGAGGCGAACCCCTGCTGTTTCCCCCGGCTCTGCAGAGGAAGATGACATCATGTCGACCTTTGTACCCCAGGTAAGAACCAAGGCTGGCGTGGACGAACCTACAAGGCCCCAGCATGGTGTCCGAGCGGAGGAGCCGAGCATCGAGGTGGCCGTGCTGGCCTTGGAGAGCCGTCCCGCTCCCTCCCTGGTCGAGCTGGACAGCAACAGCTCCTTCAGCAGCATGGACGACTCGGATTCAGATTCAGAAACTATGAGTCAGCCGCGAACGCAAGCCCACCAGCGCCCGCCCCTCGTGCGCTCGCGATGCCGCGGCGGGCTTCACCGCATGAGCGCGGCGTTTGTGTGCTTCTTCGCGCCGGAGAAGCGCCTGACGCGGCTGGTGGAGGAGCTGTCCCGGGACAGGCGCTCGATGTTTGGGGCCATGGTTCAGGACTTCATCGCGCAGCAGATAGAAGTGCTGAAAAAGCTGGATCCCTCTTCATCCTCTTCCTCTCCATGCGTGACCTCGGTGGAGCTGCTGCAGGGCCTGCGTCTCTTTCTGTCCCAGGCTAAGTGCTGCTTGTTGGACAGCGGAGAGTTGGAGCCTCCCATTGAAACTCTGGTGCCTGAGAATGAGAAAGACCTGGCGCTGGAGCGGGCCATGTTCACCTGTGTGCTCCGGCCGCTCAAGTCCCTGCTGGACCAAGCCCTGGTCATGCTGCACATTCAGGATGGCTCCAACCAGCGCCTCAGCAAGAGCCTGCTGCAGCTGAAGGGGGACAGGGCCATGGAGCATCTGGGGGTGCAGACGGGCGTCCCGGACAGCCGTGACGTGGAGAGGGTGAAGCAGAAGCTGATAATGATGCAGAGGACGTACTCACCTATTGATAAGGTGCTGCTGCTGCTGCAAGTGTGCAAGTGCGTCCAGAAGGCCATGGGGTCCTTACACGGCCAGCCGGTGAGCTGGGAGGACTTCCTGCCTTCGCTGTCGTATGTGATGGTGGAGTGTAACCGGCCCCACATCCTGATAGACGTGGAGTACATGATGGAGCTGCTGGAGCCCTCCTGGCTCTGCGGAGAGGGTGGCTACTACCTGACCAGCGTCTACGCCAGCCTGCGTCTGATCCAGAGCCTGGAGGGAGACCAGCCGCCCCCCGCCGGTCTGACCCAGGAGGCCCAGGAGGCGCTGAGGGAGTGGGGCTGCAGACGG
AACCGAGAGGCCCAGAGACACAAGGAGAACCAGCAGACTCAGAGGTACGTTCGGATACTGTTCCAGGACGGGGAGCGAAGTGCGGTGCGGACGTTGCAGTGGAGAGCCGGGGAGACCAGCCAGGCCCTGGCACAGCTGTGTGCCGACACCTTCGGCGTGTCGGACCCCCAGCAATACACCCTGTACTGGCGCAGCGGCGGTGAGATGAGGGCGCTGCCGCCCCAGGCCCAGCCACAGGACCTGGCCAGCCACAGCGAGGGCGGCCCCTCGCTGTCCTACCTGAGGACCGACCACGACTTCAGCAAGATGCGGCGGCTGACCAGAGGCGGCGCTGTGGACCTGAGCGAGTCGGTGTGTGAGGAGTGAGTGGGAGGGATGGAGGAAGGAAGGAAGG\n>XM_013321598.1 PREDICTED: Papilio xuthus rab11 family-interacting protein 2 (LOC106124683), mRNA \nTGATGCGACTGAACGGTGAACGGACTTAACAAACAAATGGTGACGGGTGACGGTCTATGATTATTGACTGCGACAGCTCATCGTTTGTATAACAGTAGTTTTTTTGTACATTCCATCAACAAAAATATTGCTTTATTATTACTATTTCTTTTAATAAAATGTGGGATCCGACACATGTGCAAGTAACAGTCCAAAGAGCCCGTGGATTATTAATTAAAGGTAAAAACGGTACTAATAACTGTTTTGTTACTATTGCCCTCGGTAAAGAAAAGTTTCAAACTTCCGTGAAACACAAAGCTACTGAGAACGTCGAATGGTTAGAAGAATGTGAACTACGTATTCCATCTCACGGCAACACTGCTGAAATCGTTTTGAAAGTTTACGACGAGGATTTTGTAAAGGATCACTTACTAGGTCAAGTATCGATTCCGTTAAAAGACCTCGATGTCTATGAACGTCCAAGAAATCGCTGGTATACATTGCAAGGTAAAACTGGGAAAGAAAGTGATAAAAAAAGAGGCGAGCTTGAAGTTAAAATAGGTTTTACAGTAAAAGAAGGAAGCCTGACAGATCTTAGCAAAAAGGAAAAACATAAATCATCTTTGTCAAGTATTGCTCAGAATGTAGGCGGAAGCCTTATGAGTATCGGAAGCATTGAAAAACGTAAAGGTATCAAGAAATTCGCTAAGAATCTTGGTTCCAAAATTAATCTGACAAAGAAAGATAAGAAAAGTGATACTTTATCACTTGATGGCAGTGTGGGGAATCTCAAAACTCCGACTTTGCTGACGCCCGACCATTCAACACCAAAAAGATTGTCAGGGGAAGCAGACCCTGGTGTAATTAGTGAAGATGAAGATGAATTTGCTTTTGATGATCTGTCCCATAAAAGTTCTGGGAGTTCACTCAATGTCCACACACTACCAAGAGGGCATAAATATACTCCATCGCCAGTTAATGCTTCCCTTGAAAACCTAGGAGGTGGAGAATTCTTAAGAAGATCAACAAGCAGTAACTTAGCAGTACCTGATAAGTTAGCACCTCAAAAACCTGTCCGCTTGAGTTTAGACACATTCACAGCTCCGCAGCTGCCTGCTCAAGTGATAGATAAAAATGATGAGTGGTCCCAAAAACTTTATTCCCGTCCAAAATCCAATAGCCAGAGTACTATTGACAGAGAAAAGTCATCAAGTCTAGAAAGAAATAAGAAACTGGATAGTCCCAGTTCTCTGAAAGAAAAGCCTAGCCCAAAGTTCTTTAAAAAGTTTGGTAACAATAACAAACCAAAGAAATTGTTAGAGGAGCGAATTATTGTTGGTGAAGAGAACATTGTTGAAGAAGATGCTATCAATCCAGCCTTTAATAACATTCCTAAGACGGTCTTGCAACAGTTTGATGGAAAGACAAGAGAAGATTTAATTGTCATGATCTACAACATGCAAAAAGATGCAGAAGCTGAAAAGAAGAAGAATAAAGATTTAGAAAATTATTTAGATGAATTGTT
GCTTCGAGTTATGGAAACAACACCAAGAATCTTACAAAACCCATACACAAGAAACAACAGTATGCATATGAGAAACAAGTGAATTTAAAACTTTCTGAAATCAATATTTACAATGTCAGGAGTGAATTATATTAATATGATAATCACTGTTTTGAAAATTTTACAGAATTGAGTCCATCCAAAGTAAAATTATTAATGCAAAGATTGTGTCATAGTGGATTAGTATGTCTAAATATGGTATAATTTAAAATTAATAAAAATTTAAATGGATGCCTTGAGAACTGTGGCACAGTATTATAAAATAAACTTAGGTAAGTACTTGTCAGTTCAGTTATGAGATTTCTAGTTATAAACATGTTACATTATTTCTCATTATTTATTATGCAGGTGAAATTAAAATGTACTTCCTTATGTTCATTAATTGCTAGTAAGATTTCTTCAACCTAGTGCCTTATAAATTTTACTAAATCTGTGATAAAAGCAAATTTGATTTGATACAGAAATATATTGCTTATTTGATAAATTACTATGAGAATTATGAAACTATTAGCTACTAAATATTTCAAACATACTCAATTTATACATAATATGTCTATGTTATTAACTCATCTATATATCTATATTTTTATATCATTAAAAGCAAACATGCTAACACATCACCTATTGTTATGTGACCACTTTAACCTTGGTGCCAAATTTTGTTGTTTGAAAATTGTGGATAATTTTACTACCAAATCAAGATTTTTATTTTTGTATTATCTGATATGATATGGAATGTATTCATTTGTAAATCTACAATCTACAAGTTTTACAACCCTAAAATATAGTAACTTTTTGCTTCTATGGAAATATTATTAATCCCATGGGTGCGGAGTTATTTGAGAATATATTTGCATGTGGAACGGAATAACTTTTGATTGCTTGGAGTATTATGTAAAGGCAGTACATTTAATTTAAGAATGTTATTTATAAAATATTAAAAGTTTAATTTTTGGTTTGACGTCTTAAACACGTCATCCGTTCTTAGGGGGGAAAAGCAAATGACGTAAATGTAATGAAACAAAAAGAAAAGCAAACTGGAAACCATATGTGTGTCACAATTATTAATATCTAAATATAGAAAACTATTAGTTGATTTGTGAAATACTATTATTGCATTGCATATATTTTATGAATGTATATATACTTTATCATTTTTATAACTACAGTGAACCTTTGCTAAATAAGTTTTGGGCAGTATTGAAGTATTTAGGTGACTCTTTCAATTTGTCTGGGCGAATTACAAACAGACGACATTCACAATCGATCAGTTACATAAATATGAGTGGGTGAATCATGTGTTTAGTGATTCACTTATAATGAAAACTCTTAACGAGTCATGTAATAAACCATAGACATACCGGTTTAAAAGAGTTGACCATTATTATTGTTTATATAACTTTTTTACAAAAAATGTAGCTATTTCATAGACAAAACTGAGTTTCAAATTACTTCATAATATGTGCAATATGAATTAGCTCATAAGTAATTATACATCTCATTTATTAATGAAAGGCAATTTAGGTGTAATACATATCAAGGTCCAAGTTGTTATGTCTGAAACATGGAGAAAAAGTTCATATTACTTTGGTACTAGATGAACAAGCCTTTATTTACTTAAATTTATATTAGTGTTATTATTCTTATGTAGTTGTGTTATTTCAGTGCAGTCAGCAAAAAACATCGATGATTTTTAATCTTCCTTCACTTACACTTATGTTCACCAATACACACAGCTGAGCACTGGGCTCTCTGACCTTTTTAAGACTTGGACTGCAGTGAGAATCACACAACTATTATATTTATGGTTGCATATTGAACAATGTAACCTTGATTATATTCTCCACTGAGTGAGTTGATAAATTGTAATTTTAGAAATAGGATACTATAAGCCTTACTTGTAATTCAAAGATTTGTTTAGTGTTTATTTATTTTTTATTTCATTTAAATACTAAAATTGA
TTTTATTTACTTCCTTTACCATTTTTCATTAACCATCAATTGTTTGATTTTGAACTTATTTTTTATTAACAATTAAACTACTAACTCTTAAATTATTTAGTTCATGTATCTAATAGTTAAGAGTAAAGTATGTTTATATTCATTGATT\n>XM_031377017.1 PREDICTED: Mastomys coucha olfactory receptor 2A12-like (LOC116095757), mRNA \nATGAGGATGTTTTCAGGACAGAACCAAAGTTGGGTTTCTGAGTTCATCCTGCTTGGTTTCTCCAGTGACCCCATGACCAACAGCATCCTCTTCATTGTCTTCCTTCTCATCTACCTGAGCTCAGTCCTGGCCATGAGTCTGCCATATTGTGGGCCCAATAGGGTCAACCATTACTTCTGTGAAGGTCCTTCAGTGCATAGCCTGGCTTGCATAGATACCCACCTCATTGAGATGGTGGATTTTGTATTGAGTGTTTTTGTGGTTGTCATTCCCATTTCCCTCATTGTGGCTTCCTACATTCATATTGCCAAGGCAATTCTCAAGATCAAGTCCACCCAGGGCCGCTGCAAGGCTTTCTCTACCTGTGCCTCCCACCTGACTGTGGTCACATTCTTCTATGCTCCAGCCACTTACATCTACATGAGGCCCAACTCCAGCTACTCTCCTGAGCGAGACAAGCAGATCTCACTCTTTTACAATGCCTTCACAGCCTTGCTCAACCCTGTGGTCTACAGTCTGAGAAACAAGGACATCAAGAGGGCATTTCTCAAGGTGATGGGACATGGTAGGCTGGACCAGTGA\n>XM_021109787.1 PREDICTED: Arachis ipaensis putative amidohydrolase YtcJ (LOC107613187), transcript variant X3, mRNA \nAACTTATAACAGACATTTAGTTTCCGATCATTGGAGATGCTTTAACTCACCTCTTCTCAACATAGTTCCCCCATTTCTCTTCCACTTCCTCTCCCGCTGTCGTTTGTCAGCGCCGCCAGAAACGACTCTTTAGCCCTCCTCGACGTCGTTCCTCTGGTTGAGCTTCGTGCTGCCGTTTCATTCACTGTGTCTGTTATTTGAAATTTTTTACGTCGTTGATGCTGCTGTTCCGAATAACATTAGCACATCAAGACGTGAATTTCATGATTTGCTGAGGCTATTTTAGGAAATTGCTACAGTACTCCTGGATATTACATTGGGACAGAAGAGTGCCCAATGAACTCTTTTCTGAAGCTGCTCTCCATTCCCATAGCTCTCCTCTCCATTCTTTCTTTCTCCTTTCTTCACCCAACTCATTTCTTGGGTTGGAAGGCACTAATGTCGTCTCAGCAAGTGGCAGATTTGGTTGTGAGGAATGGGGTGATATATACAGGTGATGATTCTCTCCCGTTTGCAGAATCCATGGCAGTGGCCAACGGGAGGGTTGTCCGTGTTGGAAACCATTCCTATGTGCAGGAGTTGGCCAGCTATGGAACTGAAGTGTTGGATCTTGGTGGGAAAGTTGTGGTTCCGGGGTTTATTGATTCCCATGTGCATTTCATACCTGGTGGATTGCAGATGATGCAGGTGGATCTGACAGGTGTGAATAATAAGGATGAGTTTATCAGAAGGATCAAAGATGCAGTACAAAGTACAAAACGAGGTTCTTGGATTTTGGGTGGAGGATGGAACAATGATTTATGGGGAGGAGATCTGCCAGCTGCATCTTGGATTGACGATTTCACTCCTTACAATCCCGTATGGCTATCAAGAACAGATGGTCACATGGGCTTGGCTAACTCAGTGGCACTAATGTTGTGCGGCGTGACAAACTTAACAGCTGATCCGAGTGAAGGGACTATAAAGAGGACTCCAGATGGAGAACCTACTGGATTGCTGATCGAATCTGCAATGTCACTTGTTATGTCGCAGATTCCAGAGGATTCAGTAGA
TAATAGGAGGGAGGCACTGCTTAGAGCAAGCAATCTTGCCCTGGAAAGGGGTGTGACAACAGTTGTTGATATGGGAAGATATTATTCAGGGACTTCAGCAAATCTTTCTTGGGAGGATTTTACAGATGTTTATCAATGGGCTAATTCTATGTCAAAAATGAAAGTTAGAGTGTGTTTATTTTTTCCAATGGAGACATGGTCACGTTTAGTGGATGTGATCAACAAGATGGGTTATGCCTTGAGCGAATGGGTGTACATTGGTGGTGTCAAAGCTTTTGCTGATGGCTCATTGGGTTCCAATAGTGCATTGTTTTATGAGCCGTATGTTGACGATCCAAACAATTATGGCCAACAACTTATAGAGTCCGAAGCTCTTTTCAACATGGCTTTGGAGTCAGATTTATCTGGTCTGCAGATTGCAATCCATGCTATAGGGGACAAAGCAAATGACCTGATCTTGGACACATATGGCTCAGTTGCCTCTACAAATGGACCGAGAGATCGAAGATTTAGGGTAATATGGTTACTATTGAGCATGCTCAGCATCTGGCTATGGGAACTCCACACCGATTTGGCAAACAATGGGTTATTGCTTCTATGCAGGTATACCATTTCCGCTGCTCGGGCAAGCTTCCTTGACAATGATCTGGGATCCTTATCTCCAGGGAAACTTGCAGATTTTGTCATACTAACCACTCATTCCTGGGAAGAGTTTGCTGAAAGTGCATCTGCATCTATTGCCGCGACATATATTTCCGGTGTGAGAGCATATCCTTGAAGGTATTCCATAATCTATTTCAAGTTTTACAATCAAATTTGCATCAGATGTGCAGAAGGAAAGAAGTGTTGTAGCGCCAGTCCTCTGAAAGGTTTTAAATACAGTCATCTTATTTTTTATTTTTTTAGGAAGATTAATACATACGCATGAGAATGTGAACATTATTTTAATTCCATATTGGTGTATTAATTATTTCATATTTGTTCTTGTCATGTGAGTTTTTCTATATTTCTTTTATACGACTAATACTAGGCGTACACCAAAATCAACTATAAAATCAGCCATTGTATTTTTATACG\n>XM_010548157.1 PREDICTED: Tarenaya hassleriana uncharacterized LOC104818540 (LOC104818540), mRNA \nATGGGAAGAAAAAGTTCGAGAGGTGATAGCGTTGCCGAACGGTTCTTCAAATGCGCTGAAGCTTATACGTTGAACGAATTTGAAGACCTGTTTAATGATATAAAGGACAGGTATCCCAAAGTTGCGGAGTATATGCAGAAAGAAGAACTTGATCCCGAGAAATGGGCAAGGTGTAAATTTAAGCGTCAAAGGTACAATTTATTGACAACAAATGCAGAGGAATCAATAAATTCTGTAATGAAGAAGGCCAAAAGGTTTCCGATGCTGGGCCTTCTGGATATGTGTGTCTCCAAGACCGTGGAATGGTTCAATAGATATAGAGTTGAAGCAGGATGTGCCGATGATTCACAAAAAATGACACCGCATGTTGACAAAGTGCGCCATAAGAGGTATGAGACTGCATGTACGTATGAAGTCATTGTGCTAAACACTGTTACAGAGGAGTTTGAAGTGATGGGTGAAAAGGGTAGAAAACACTTTGTTAGCATTGAATGTAGAACGTGCAGTTGTAGGGTGTTTGATATCGATAAGATCCCATGCAGCCATGCAATTGCAGCACTTCATAAGGTTGGTAAAGCGAATGTTATACTAGACTTATGTTCTCCATACTATACACGGGAGGCATGGCGTCTTGCCTATCAGGAAACCGTGTATCCGGTCCCCGATTGCTGTGAATGGATTATCAATGACCCGGATGTTACAAATCTTGTGGAAATGCCTCCTATCATGGATGAGAAACGATAA\n>XM_032257218.1 PREDICTED: Sapajus apella replication termination factor 2 
(RTF2), mRNA \nAGCGGTTTGCGTCACTGCGGTGCGCCGGAAGTGGCTGCAGATTCCGTCAGTAATCCCGGAAGTGGCTTCTTTAGGGTTTTGCTGCTGGCTGTGACTCCTGTTCTGCGATGGGTTGCGACGGGGGAACTATCCCCAAGAGGCATGAACTGGTAAAGGGGCCCAAGAAGGTTGAGAAGGTTGACAAAGATGCTGAATTAGTGGCCCAATGGAACTATTGCACTCTAAGTCAGGAAATATTGAGACGACCAATAGTTGCCTGTGAACTTGGCAGACTTTATAACAAAGATGCCGTCATTGAGTTTCTCTTGGACAAATCTGCAGAAAAGGCTCTTGGGAAGGCAGCATCTCACATTAAAAGTATTAAGAATGTGACAGAGCTGAAGCTTTCTGATAATCCCGCCTGGGAAGGGGATAAAGGAAACACTAAAGGTGACAAGCATGATGACCTCCAGCGGGCACGTTTCATCTGCCCCGTTGTGGGCCTGGAGATGAATGGCCGACACAGGTTCTGCTTCCTTCGGTGCTGTGGCTGTGTGTTTTCTGAGAGAGCCTTGAAAGAGATAAAAGCGGAAGTTTGCCACACGTGTGGGGCTGCCTTTCAGGAGGATGATGTCATCGTGCTCAATGGCACCAAGGAGGATGTGGATGTGCTGAAAACCAGGATGGAGGAGAGAAGGCTGAGAGCGAAGCTGGAAAAGAAAACAAAGAAACCCAAGGCAGCAGAGTCTATTTCAAAACCAGATGTCAGTGAAGAAGTCCCAGGGCCATCAAAAGTTAAGACAGGGAAGCCTGAAGAAGCCAGCCTTGATTCTAGAGAGAAGAAAACCAACTTGGCTCCCAGAAACACAGCAACAAATGAGAGCTCTTCTGGAAAAGCTGGGAAGCCTATGTGTGGAGCCACAAAGAGGTCCATCGCTGACAGTGAAGAATCCGAGGCCTACAAGTCTCTCTTCACCACTCACAGCTCTGCCAAGCGCTCCAAGGAGGAGTCCGCCCACTGGGTCACCCACACGTCCTACTGCTTCTGAAACCCACCCGGCCACTGCTCCTGCCCCAGAAGGCTGTCTGGTTTCCACCTAGGCGGGTCGCTGTGCACGCTGCTGTGTGTTCTTTCTGTACATCATAAAGCTGACCTGGCCAGCCTTGGAACTGGTGTGGCCACTCTTGTTGTGAGGTGCGTGTGTTCCAGGGGGGACATAGGACGGGCTGCACCGTGCCTGAGGTCTTGCTTGCTTCCACCTGCAGGTACGCTTGGTCGTTTCTATGGCCAGGAAGCCCTGCAGGCCGCACTTTTTATGCTTCCAGTAACGAGAGATCCCGGAGTCTTCACGAGAGCAGAGTTGGCACATATTAACTAAAATTATGATTTTGCTACCAGCAATAAATTAAGTAGGCCAAGTGAAACTGGGCTTTAGAAAGGGTGGATTTCAAATACACTGTGCCCACTAGAAGCTTTGAAGGGCCTCATCCCTCTGCTCCATCCCTGGGAGGAGTCCGGATCCTTGTTGGTCTAGCTAAGTACTATTAGGGGAGTCTGCCCCTAGCTCATCATTTGAAGACAGCAGAGTCTCAGTTGGGCACCAGTGATTGGGTTCAGAAATAAAGTTGGTCTGCCTCTTCTC\n>MG651402.1 Priestia aryabhattai strain FJAT-46583 16S ribosomal RNA gene, partial sequence 
\nTGCAGTCGAGCGAACTGATTAGAAGCTTGCTTCTATGACGTTAGCGGCGGACGGGTGAGTAACACGTGGGCAACCTGCCTGTAAGACTGGGATAACTTCGGGAAACCGAAGCTAATACCGGATAGGATCTTCTCCTTCATGGGAGATGATTGAAAGATGGTTTCGGCTATCACTTACAGATGGGCCCGCGGTGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCAACGATGCATAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGCTTTCGGGTCGTAAAACTCTGTTGTTAGGGAAGAACAAGTACGAGAGTAACTGCTCGTACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGGAACTTGAGTGCAGAAGAGAAAAGCGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGGCTTTTTGGTCTGTAACTGACGCTGAGGC\n>XR_007238697.1 PREDICTED: Ziziphus jujuba var. spinosa serine/threonine-protein kinase ATG1t-like (LOC125420078), transcript variant X3, misc_RNA \nAAAAATAAATGGAACGCGTAAGTCAATCCTGTTGTAACCTGCGAGGTTGTTGATGGAAGAAGGGGAAAATGGAAGAAGATGGAACAACTCTCTGCAACTGCGACGGCATTAGAGTGGGAGACTATATTCTAGAATCAAAGCTTGGAGAAGGCTCTTTCTCTGTAGTTTGGAAGGCCCAGCACAGTCTCACTGGCCAACAAGTGGCTCTGAAGCAGGTCTATCTTTCAAAGCTCAATAGGCACCTCAGAAGCTGCTTGAACTGCGAGCTTACCTTCTTGTCCTCTGTTAACCGCCCCAACATAATTCGTCTCTTCCATGTCTTCCAGGCCAATAGTCCCCATCCTCCGGGAAAAAGTTGCATCTTCCTGGTCCTGGAATTTTGTGCTGGTGGGAACCTAGCTTCTTATATCAATCAGCACGGGAGAGTTCAAGAACAAATCGTTGGAAGATTTATGCAGCAGCTTGGGGCTGCTTTAGAATTACTTCACTCTCACCACATCATTCACAGAGACTTAAAACCAGAGGTAACATCCGTACTATCAGGGGCACTGAGGTTCATTTCTTCAATGCTTTTTGGAAGCTTGTTTTGGGAGTTTTTACAATTAAACAAGTACTTACACCAAGTGCCAACCTTCAGTTTGAAGATTTTAGAGCGCAAAGTTTGGAAAAATCTAAGGATTTTTAACAATTTCATGATGAAGCTTTGGTAAAATTTCGAGCTAAAAAGAAAAAAGCCTACCAAGAAGAAAAGAAGCAAAAGGGTCGTGCAACTTTATTCTAGGCACTAAGGCTAATTTCTTCAATACTTTTTCAAAGATTGTTTTGGGAGTTTTTACAGCTAAACAATTACTTGCATTCAGGGTTGTTGAGCTTCAATGTGTAAAAGATGGAGTAATTTGGGTTTATGGTAAAAGAATTAAACAATCTTTTGAGGAGAAGAGCTTAAGCATCCAATTCTTTCATCACTTAGCTTTATCTAGCGAGAGAGGTAAAACCAAGCTCTTATTAGGATGCAACCCAAATGTCTCTTACAATTTCTCTTTATTTTTAAGTTTAAGTTTTTATTTTTGAAATTTAAAGTTTGAGTTTGATCATTTTAGTTGTTTTCATAATTAGTAGAATTTATATTTTTG
AATTCCATCTTGTTTGACTAATTTGGGTTTATGGTAAAAGAATGAAGCAATGTTTTGGAGGAGAAGAGCTTAAGGATCCAACTTTTTCATCATTTGGCTTTGCCTAGCCAGAGAGGTCAAACGAAGCATTTCTTGAGAGGCAACCCAAGTGTTTCTTACCATTTCTCTCTATTTTAAGTTTTTGTTTTTGAAATTTGAAATTTGAGTTTGATCATTTTAGTTGTTTTCATAATTAGTAGCATTTATATTTTTGAATTTCATCTTTTTGGCTAGTAAATTGGGAGTTTAAAACCTCAAATTTAGATGATTAAGTTGGTCAATCAAGAAGTATTCAAGAATGGCACAAAGTTAATGACCAAGGTGATCTAAATGGGGGTCATCTCACTCATCCCCGGAGAAACAACCTGGATGGGGC\n>XM_053020070.1 PREDICTED: Gossypium arboreum probable pre-mRNA-splicing factor ATP-dependent RNA helicase DEAH9 (LOC108487114), transcript variant X2, mRNA \nTATTTGGGCTTAGAAACCCTAAACCGAAGCGAGAGCGAAGCTAAATAAAAAGCCCGTTTAGTTACATTACTGAATTTTGATTCAATTTCCCTCGAATCGGGAAAAGTAAAACTGAGCTTAAAATTATGGCGCAGTTCTGGAAACCGGGAACCGAGAAGCCCCGCCTCCTCGAGGACGAGGATGGCGGTGTTATTTTCTTGTCATCTTCTTACTCTTCATCTTCTTCTGGATATGGGTATGTGAGCATTGAGAAGCAAAGACAGAGGCTTCCAGTTTATAAGTATAGAACTGCTATTCTTTATTTAGTGGAGTCTCACGCTACTACCATTGTTGTTGGTGAAACGGGTAGTGGTAAAACCACTCAAATTCCACAGTTTTTAAAAGAAGCTGGTTGGGCTGATGGTGGGCGTGTTATAGCTTGCACGCAACCAAGACGACTAGCTGTGCAGGCAGTTGCTTCAAGGGTAGCTGAGGAGATGGGGGTCAAACTTGGAGAAGAAGTTGGTTACACAATCCGGTTTGAAGATATCTCTAGTCCAGATCTTACTAGGATCAAATTTCTCACAGATGGAGTCTTACTTAGAGAAATGATGGATGATCCTCTTTTGACTAAGTACAGTGTCGTTATGGTGGATGAGGCGCATGAAAGATCCATTTCAACAGACATTGTACTTGGTCTTCTGAAAAAGATCCAGAAACGTCGACCGGAGCTGCGACTGATTATATCTTCTGCTACGATTGAAGCGAAATCAATGTCTAATTTCTTCCTGTCCAGTAAAAGGCGCCAAGCATTGGAAGGTGAGGAGCTTAGACCTAGGTTGGAGCCTGCTATCTTATCCGTTGAGGGTAGAGGGTTTAATGTGCAAATTCATTATGTGGAAGACCCTGTACGAGACTATGTTCAGGCTGCTGTTTCAACAGTGCTATTGATTAATGACAAGGAACCACCAGGTGATATTTTAGTATTTCTTACTGGTCAAGATGATATTGATGCTGCTATTAAGTTGCTTACTGAAGAAGCTCGAAGCAATGGGAAAAATTCCTCAGGGTTGATTATTTTGCCTTTATACTCTGGACTTACACGTGCAGAACAGGATTTGATATTTTCTCCAACTCCTAAAGGCAAGAGAAAAGTAGTGATATCAACAAATATAGCAGAGACATCATTGACTTTAGAGGGTATTGTCTATGTTGTTGATAGTGGCTTCTCAAAACAACGATTCTACAATCCGATCTCGGATATAGAAAATCTTGTGGTGGCACCCATATCCAAGGCATCTGCTAGACAAAGGGCTGGTCGAGCTGGTAGACTTAGACCTGGGAAGTGTTACAGATTGTATACAGAAGAGTATTTTCTCAATGAAATGTCTATTCAAGGAATTCCTGAGATCCAAAGGTCAAATCTTGTTTCTTGTGTGATTCAG
TTAAAAGCATTAGGCATTGATAACATTCTGGGCTTTGACTGGCCGGCATCTCCATCTCCTGAATCAATGATCCGAGCACTTGAAGTACTTTATTCACTTGGAGTCCTTGATGATGATGCTAAACTTACTTCACCAGTTGGTTTTCAAGTTGCAGAAATTCCACTGGAACCAATGATCGCAAAAATTATTTTATCTTCAAATGAGCTTGGGTGTTCTGATGAAATCATAACTATTGCTGCTGTTCTCTCTATCCAGTCTATCTGGTTTTCTGCTCGAGGAGCACAAAAGGAACTGGATGAAGCCAAATTGAGATTTGCTGCTGCTGAGGGTGACCATGTTACTTTCCTGAATATTTACAAAGGGTTTCTCCAGTCTGGCAAATCTTCAAAGTGGTGTCACAAGAACTTCATAAACTACCATGCCATGGTGTGTATTTTTATTTGGGCATTTTTGAGAATTTAAGATACTGTCCAGTTTCACTCTGTTACCTGTCTTCAAGTACAAGAACATTAAAAAGGTAATGGAAATTCGGGAACTACTCAGAAGAATAGTGCTGAGGTTGGGCATAGTCTTGAAATCTTGCGAAACAGATATGCAG\n>XM_020956221.1 PREDICTED: Drosophila serrata CTD nuclear envelope phosphatase 1 homolog (LOC110186899), mRNA \nAAGCCCTGGCGATCATTGTCAGTTTTTCAAATTCTGTAAACTTGTAGAAAAATAATTAAACTCTTTTCAAAAAACCTCACTAAATTAGTTTTGAGATTATTTAAGATTCTTAATGGTATTAAGTTAATTGGTTTCAAATTTAATCATAAGCTGGTTGAAATCTTAATAAAACCATGACTGGCGACTCGTTTATGTTTTTCTCATATGGACTGATTACTTTGGCCCTGCTGCTGGCGATCATTTGCCTGTTTTTGCCCAGGGTGGACAGGTTCATCAAGTTGTCAGCGGGCAGGATATACAAGATCTATGCAGAGTACACTCCTATAGGATACATGATCGATGATTCCTTGACTCCTGTTTCCCGACGCCGTCTGCAGCGGGTGGCTAAGAAGACACTGGTGTTGGACATGGACGAGACCCTGATCACGGCCTGGATTCAGCGACAGGACAAACGTCGGCAGTCACCACCCAACGTTCCCCACGACTTTAAGTTCGTGCTTTCGGATTCCAAATATAAGGGCAAGGTCTATGTTTATAAGCGTCCCCATGTAGATCACTTCTTGAACTGCGTATCCAGATGGTATGACCTGGTGGTTTTCACCTGTGGAACGGAGCATTACGCAGCACCTATTCTCGATTTCCTTGATAATGGCCGTGGGATTTTAACCAAGAGGTTTTACCGTCACAACACCATCGATGTCGCTGGCCTAAAGGCCAAATATATATCGCTGTGTTCGCCTGACATGGCAAATGTCCTGCTGCTAGACAATTCCAATACAGAATGCAGCTTCAATGTGGGAAACTGCATCCCAATCCCATCGTATAAGATTGGGAAAAAGGACGAAGCCCTTCTCGACCTCCTGCCATTTCTGGACGCCCTGCGCTTTACAAGAGACGTGAGATCGGTTCTGGGAAAATGCACTCGCTTCGAGTGCCTTACCACGCTTCTGGAGAGTCTCGGCAATTACGATTAA\n>XM_046865945.1 PREDICTED: Silurus meridionalis translocase of inner mitochondrial membrane 29 (timm29), mRNA 
\nTGAATGGGACCTGCACCCTACGTAGCGCCCAGTATGTCCACTAGATGGCGATTTGGCTTCCGTCCCGGACGCACGCTGTGACTGAGACGCTAACATGGCGGCCTTGAGGAGGTGCTGCTCCAGTGTAGCTGCTGCTGCTGTCAAGAGCAAGGGGACGAGATGGGAGAGACTGTGGGACAGCCGTGCAGGTGTGTGGTGCCGCAGTCTTCTGAATGATTACAAGGAGGCGTGCCGTGAAATATTTGTTGGAGCATATGAGCGCCCTTTGAAAGCCAGCCTTTACGCGGCTTTGCTCGGAGGCACCTACGCCTGTTGCTACACCAACCCGGATGAAACTTCCTTCCAGGCACGGATACTAGAGACCTCCAACCAGCTCGCCCTCCTCTCTCCGTGGATCCGTAGCGGCACGTCTGACGGGCACGTGCAGAGCTTGGCCAAGCTGCGCAACGAGGGCCGTTTGCGACACATCAGCCTGGGTATCATCTCATTGGCATACGAGGCCGACTACGACCCTGAGTCCAGCCTGTACGAGGCAAGGTGCTCTGCGCTTTACGTACCCTGGGCACAGTTGCGAGAGCGGGTGCTGGACGTAGGCTTTGCAGGCCGTTGGTGGGTGTTGAAAAAAAAAATGGAGAACTATGATATAAATGAGGAGGAGTTCAAGTATCTTCCGCCTGTCCTGCTGGCCACAGCCCCGCCTACGGTACAGGAGACCGAGAGAAACGAAAGACTGCACCAGGAGTCCTTGAAGGCACTGGTGATTGAGGGAGAAGAATAGATGGGGGAGGGTAGCAGGTGAAGGAGAAGAGAGCAGTACACAACAGAACATTTGGTAATGTGAACAGTTCCTGATTGAGACCTGTGGACATGTCCTGTATGGTCAAATAATTTGATGTATAATGGCCTAAGAGGACGTTTCTGAAATATTTATTGTGGTGAAACATAATGCTGTTTATCCGTTTGTCTTGTGAGAAAATGAATCTTTGGAATCTTTGA\n>XM_039776918.1 PREDICTED: Perca fluviatilis serine-rich and transmembrane domain-containing protein 1 (LOC120543720), mRNA 
\nAGGGAGGGCAGAGACAGAGGAAGTCACAGAGGGAATGAGATTAGAGCGAGCACTACTCCCTCTCTTCTCTTCTCTCTCTTCTTTTCTCTTCACCACTTCAGTAAAAAAACCCATAATTCATTAGTTACAGCCTCTCAATTAGAGACCTTGTGTATGTGTGTTTCCTTTTGTATGTGAGCCCATTCATAGAGAGAATCCACATCTGACAGTGTCTACTCCAGCTGTAGTGCATGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTTTGTGTGTGTGTGTGTGTGTGTCAACCTGAATGACAGAAAGAGAGAGGGAGAGGGAGCGGACAGGCTCATAGGGAAGATCTCAGCAGGGGCAACAGATCTGGATTTGCTCGGCTGAAAACACCAAACACAACAGGATGGATTTCTGCACGACGTGAACGCGACCGAGGAACACCCGCATCACACATTAAAAAAGCCAGGATGTCAGGAATGGACGCGCTGTTGGTGGACCGTAATGAGACTGAAATCTCTCCAATAGACAATGGGACCTTCCTCCGTTTCTCCCCAACCTCTGCTTCCACATCTGCGGCTGCCTCGTCACCAGGACGTCCGGGCAACGTTTATGTTTACGTGTGGCTTTTTTTCGGCCTGCTGGTATTCCTCCTGACGCTGCTCATCATCTCCCTCCACAGGCTGAAAAACATCATCTCCTCCTCCTCGTCTGTTCCCGACTGCAGCAGCGAGGGAGGGAGCTCCTTCACCAACATGGAAATCTGTAGCATCTCGTCCCAGAGGTCCACCATCTCCTCACTGTCCACCTAAGGGAGATGGGATGGAGCACATACAGACACATAGACATACAGTATATGTCCATGTGCTTACATGGTAAGCATGCACACACACAAAGCCCATGGAGGTCCAGTGCCTTCTCACTGTGACATACAAATACAAAAACACTTTTTCAGCCACAAAGAAGCGGACAGCATGGCATTATAGTACATTCCGTGCATGTATATTCTATTTCCGGTGGTCCAGTGAGTCAGGTATGTCCATGCGATTTGCATAGGCACAGGTGAAATATAGCTCACAATGTGATGAAGAGGTATTGAGGGTTGAGACTGACTGAACCCCTTTGAGCCTTATTTCAACGACAAAGACAGATGAACCTGAGAAACTGCTCTTCCTCAGCAGGAAAAAGCATTGGAACTATTGTCTTTCTTCACTGTTTTTGTAAAGGTAATTTATTGTACTGTACTTGTCATATTTACTGTGGAACAAATAATATTGCTTTATAGTGCGTACAGCATGTCTCATAATGTCTGTAGACTACAGTACATTGCCAAATCAGAATTACAATAATATTTAAGACCATACATTGTACAGAAATGCATGCTTGTGTCTCAGTTGTTCAGTAAGGCTTTGGGAACTTTTTTTTTTTTTTTTTACCACTTGGCAAATTTCTGTATGATGCCCCTGGGGAAAGGACAAGACATACTGCTGTGGATGTAAAGGTGAGAAAGAAATGAGGGCTGTCTCTTGGACTCTTGACAGACAGTCTGACTGCAGCTATAGACCAGGTCAAAACTGGCATAAACAACAAGATGAAATTCTGGTCCTGAAAGACAGTTGCAGTCTCCATAGTGACTGATGCTCTGAGAGCTCTGTGCAGCTGTCAGCCTTGTCTGTATTCCAAGTATAACTACAATAATGGTTGTTTTGGCTCAACATACATCATTTTTGTTTTAATACCGTAAAATGTTTCTTTGACATGGCAACAAAAATACACACTCGAAACAAATTATTAGAAAAAGATTCATTCATCTTTGTCACACTTTGCCATAAAATTCAATATGAACTGATGGCTTGTAGAGCAGCGATGACGGCTACGAGGCCACGGACAATACAAGGAGTCATATCTGTCAGTGTTCTTATCAACAAATCCTAATTTTTTTCAGTTGATGGTACTGTGTCAGCCAAACTCTTTGGT
TCCCCAATCACAGTGTTGACTATTGGTTCATTATCTCAGCTGTTGACAAACATGTATGGTTATTATGTCTAGAACCTGTTTGGTTTAAAGTACAAAAGATGTTTTAAATAATAGCTAAATGTTGGTTTTCAAGTTAACCAGGAAGTAAACTCTTTGTTTTAGCCTGGTGATGTTAAAAGAATAACCCCCTGATTGAACCCCCTGACTGTGTTTTGTTATATTAAAGCTCACATTTTCAGTTCTAGTCCTGCAAACACAAATCATTCAGTGAAAGTAGATTCAATTATTTTCCTTGCATGATTTACTGTACTGGATGTAACTGCAAAGCTGACTTTTGTCCCTGGATTAAATGAATGCAACTAAGGATTCCATCCTCTCTTACACATTGTACATATTCTCTTTTTTCATGCTTGTAAGGGATGTGTTCCTACTTGTATCTCTATTTGATTACTGGGTCTGCTGCATAAGGTGCTTTAATATCCTGTTAACGGAAACTCCCAGCACCATGAGCCCAACAAGTCTACAGCAACTTGTGACGCATGCAATTAACCAAACTCACACCTGAAACTTTACACAGTTTATCTTTAAGAAGCTCCACAGGAGAGGCTTTGAGTTACATGACTTGCTTAAGGGAACTTGAGTTCTTTCATTGATTCGATTTAAGCAGGAGACAATGCAGGACCAGATCCTACAGATGGAAAAAACATACAGCTAGTGCTGGAAATAGAAACTGGACACGTTGTTAAACTAACGCTGCTCTGTACGTCTTAGGTCTGTGTTCTTAGGAGGTGCTGCAGAGAATGACGGACAGTAACAGACTGAAATGTGTTTCTTGAAATCATCTGAAGAAGACTGGTGTCTAGTGAATGCAACAATAACACACCCTTGTGTGTTAAAAAGGAACCTTTTAGTGAAAAAGCATATTTGACCAATAAAAAGTAAAGTCATCAAA\n>XR_006253100.1 PREDICTED: Puntigrus tetrazona uncharacterized LOC122362386 (LOC122362386), transcript variant X1, ncRNA 
\nGTGTGTGAGAGAGAGAGAGTAAGAGTCCTATCATGCCTGTGTGCTGAAGGTAAGGGTTATTCCAGTCAAGCACTGAAGTCACTGAGGGGCTTGTACATGTCGGTTCTTGTCAGACGCAGCAGCTTTTTCTATCTCTCTTTCTCCCTTTCTTCCCCTATTCTTCCTGCCGGCCCGCTTTTCTTTTCTTTCTGTCTTTGTCTCTTTCCATCTTTCCTCTCCCTTTGAGTCCTGCTCCAGTAGACCTGCAGGTTTTAATGGCTCTGTGAAACAGTATAAAAGCAGCGGGTGCATTGAGTCATTTTAGCCTGAGGACTCAGACTGACTCTGTTTGTCTTTCTGTTGCAGCTGTCACTCTGCAGCCCTCCACATTCACAGCTTCACTTAAACGCCAAAATAGAGAGATAAAATGGTCGTGGTCATTTTATTGTGCATGGAATAGCCCTCGCCTGCATCCTCGTATCAATCAGTTAAATGAGGTGCTCAGACAGGAGCACAGCATGGCAGTAATAATGGAGTAGATTCTAGAGTTGATGGCCATAAGACAAGCTGAGAGCTCACTGTGCTATGGTCAGCTACATCATTAAACACACGCATGCACTCAGCTCCGAACGCATCTAATTTGACAAAATTGCTAGAATAATAATGAATGATGTTTGCTAGACACGTCTTATCACATCATATCCTTCCTAGTATACAATTTGGTGAGGTCGGTGCAGTCAGTACTGGACTGGTGAACTTTTCCCCTTCATGAAAGCACACAGAAAGTACTTAAATTGTGAAACTTGTGATTCATTAGCCACTATAGGCCTTAGTCTGAGAATGGCCATATTTAATTTTTGACAGCAATGAACAGGAGGCTGAGGGTTAGTACATCGTGTTCAGTGGATTGTACTGTTTAACAATATACCAACTGTTCGGCTGACAAAACAACTTTCCAAAAGACAGAGACTCCAGTTTTAGTTTTAGTTGTGAACGTAATCTAGGAGCTTTGAACAGATTGTAATCTCCCACATTTCATCCTGGGAAAATTCAATATGGCATCTGCCCTGATTAAAGTGTACATGTAAATAACTAGAAATGCAGTAAATTTGGTAAGCTGGTTAGCTGTTTTGAGCTGGTCAGCAGGCTGGTTTTAGTCGGGTTTTGCCACATTTCCCAAATCATGCCAGGCTGGTCTTAGCTGGGAGACCAGCTTGAACGACCAGCTAAAACCAGCCTAGCCTGCTGGGAGACTAGCTCAAACCAGCCACTTCTAGCTTAAACCAGCTAAGACCGGCCAACCAGCCTTTCTTTTCTTCTTCAGCAGGGCTACCACTTCACAATAACAAGCTGCATAACTGACTGTTTCTTAAACGTTGGCTGTGACCGCCTTGCACAATCAAAATAAAAATGGAAGTGCCCATTCTTACTTTAAAAATAAGGACACACTCAGACATGTTTGGGTCAACTCTGGAATGTAGTGTCGCCTTAAATTGAACATTTAAACATGTTGTTGTTTTTTCAAACCGTGCAGTAGTATGTGACATTTTCTATTTGAAAGGAATGACATTTAAAAGAAATGTGTTGCCACTGGCTTTAGCATTTCAAGAAATATGTTCAAGAAACAAAATAATATTTTAACCATTTATCAGAATTTAAAAAGGAACAAAAGGCGATTTTGTTCTTGTTTTCTCAAACTGTCTAAAGTAGATGTATTAATTAATCGTCAACTCGTGAAAATAATCACGAAAACCACCAGTGACCATTTCGCTATTAAAATGAGTAAAGTGAAATGGCGGCGTCCATAATGCTGGATGGTGTTTTCACGGTTGATCCCACTTCAGTCGAGTCTAATAAGGCTTAAACGCAGGAACGCAGAACTTCGGACACCACATTTTTTTGGAGTAACTCCTCTAGAAGACGGACCGGATCCAAAACCTCCGAATAACACACGGTTCCTATCTCCGTCTATATCCAGCACCCCAGACCAGATGCTTCACAATTACCCACAATTCCCCT
GGAATTGTTCCTGCCTCATTGAGTCTTCAGCCAAAGTCAGGCAACTGCAACTAGTCAAAACACACACATACACACACACTACAGGGCACAGCCTGATGTGACCGCCTCTCCCCACCCCATCTGTCAGGATGACGTCAACTCTCTTCCGTCAGACAGGTGGTATCACCTAAGACCCCCCAGCTCTGCCACTCGACACAAAGTCATCCATCACCACAGCAACAGCTCCTGTCATTGCCTGGGAAGCGAGGGACTGCTAGGGCAGATGGGAAGAGAGGCAGCCCAACTGGTCTTCCAGCATCAGGTGGTCTGGGAATGATAAAGAGAGACTGAAAGAGAAAGAGGGCATCTTCCTTTGACACCAAGAAGTTTAAAATGGGGAAAAAATAACTTTCTTTTTGACACACAGACAGTAATGACAGGTGTGTCCGTGACTGGAGCTCCCAGCTGGAAACTCCAGAAAGAAATGTCCAAAGCCTCCTCAAAAATAGTCCGAGCTGACCCTTTTTGTGCAAAACCTCTGGCCCACAACATGGACAACCCGGAGATGAAGGGTAAGAGTTAGATGTGCTTCCTAGGAAGGTTTTGACTGTGCGTGACTGGTGTTGGCTGTAAATGCATGGAAATGTTTCATCACAGGTCAGTGGCATCTTTTCTGCAAGACAGCAGTACCGTATGAATGCAAGTGACCTGAAGGAAAAATTTCAAATCTTTCAGAGTTTCCGTTGACATACTGGAGACATTTAAAGAGAGAACACTTATCAAGCTGTATTCAGGCATAGAGAATGCGTCCCACATCTTAACGACACAATGATGAAACAAAAGAGCATATTCAGTACATGTCTGATTGCACTAAAATGCCATAAAGAGAGACAAGGCATCTTTTGTTCAATTCTGTCAGGCATCAAAATGTCTGGTCCATTGCTTAGCTAAATATAGAATAAAGGAGGGCAGTTATAACACTTCTTACTGCAGTGGATATTTCTAAAGGAAGGTTTATTTTATTGAGTCTTTGTGTTGAATTATGTTGCATTGACACACACAGTCTTTTGAACATTTCCACAATTATCACCCAAATGACAAAAGTTTGTGAATATGTGTAGAGCGAATGAGAGAGAGAGAAAACTATACTATAATTGCAGAACTTTTGTATAATTGCGTACCTTAGTAGTATAAACATATATGGCTAGGTTCGTATATATTTGGACACTATACAATTTTAAACATTTCAGTTCTGTATGCCACCAGAATATAATTATAAAATAAATTAATAATAAAATATTAATAATAAGGAAAACATCAATATGAAACTGAAGTGCAGACATCAAGCTGTGATTGGAGGGGTTAAACAGAAATATAAGATGTTTGGGAATTACAACCATTTTTATACACAGCCCCCCCATTTTCTGGGGCTTAAATGGAATTGGACAAGTAAATAAATAAAATATATAAAATGTTAATTTTTAATATTTTGTTGAGAATCCTTTTCAGGCAATGACTTCCTTAAGCCTTGTTTGTTTGTGGGTCTTTTCTGCCTTTAGTTTTAACTTCATGGAAATGGATGGAAATCAGGAGATTGACTTGACAATTACAGAATACTCCACTTTTTTTTTTTTTTACCTTTAAAAGCTCCTGGGTTGCTTTTGCAGTATGTTTTGGGTCATCATCCGTTTGTACTATGAACTGCTGTCCAATCAGCTTTGCTCCGTTTGACTGAATCCGGGCAGAGAGTATATTCCATGCATGCTCACGCCATCACACTACTCCACCATTAACAGATTATATTTTATGCTTTGAATTGTGAGCTGTATCAGAGTGTATACTACAATTGCACTCCTGTCGGCAACAATACATTTGCATATTCGAGTTTTGTACTATTTAATCTGCTTCATGATTCAGGGTTTGTGTAGCTCAGTTCGTAGTGAGTTGTGCTATAAGATGAGATGCAATCATGCGAACATGGGTTTGAACCAAGAGAATGTGTGGCCTCATAAAAGGTATAT
GTCCTTAATTTATGGTTTTACACAATTTTTTGTAACTGGTAGGTTTGGGGGTGGGGCCAGGTGTGGTCATTGGAATGAATTACACCTAGTAAAATCTGTTTTAATCACTGTGACTTTGGTGTAAAAAGTTCACACACTGCATTTAAACAAAACAGGCATTTTGACTAGTAAGGACAGTCATATAAGTCATTTCATGATGACAGATACAACACAACACTTTTACTTTTTACGCCTGCTACAAGGACGCTTAACTTTTAAACATTAAAAAAAGGTCTTAATAAGGTACTTCCACAAACAGGCTCGTAATTGAAATATATTTTGGTCAACAGATAAAATAATAAAAACTGTACCTGTGTACAAATATGCATTGACCTAAATGTATAATTAAGAGTGCAGCTTGTTATGAATTTCTATCAAACTTATTACCGTTGTTAATTGAATTTTCTTTCAAATTTGGGATTAAAAATCACTAAGTACACTCCTCAGAAAATAGTCGTCTTTTAATAGGCACAAGAAGTGATAATTACAAATTCTAAAACTTTTTTTTTTTCAGTGTTTGTTTGTTTGTTTTAAGAACTTGAAACCTGCAGCACCAACATGCTTCCCATGAGGTAATAAAAGAATGTTTTATTTGAAGCCTTTTTATGTGTAGATCAAACCACACCATTAAAGCACGGCTTTTTTGCCTGTATGTTTCATCTCGGGTTTACACATCAACAAAGCACTAATTAGCAGATGACAATCACATCAGTCCTGTTGTCACCAGTTTAAATGACACTGACAAACATTAGGGACCAGATTATATGCTTTAAACAAACACCACTTCTGTTATTGTAATGACTTCAGAATATAATAATTGCATGCTCCCAAAAGCTACACCAAATGGCACTTTGCAAATCTGCTGGGACATTTCTATGGGTAAATTCCAGGCTCTCTGATAACCATGTAATGAAATGTCTAATGTAAGATTTACTGTAAGTTCTTATTTCTAACAACAAAAATAATATAAAAATAGCTATATTGTGATTATCAATCTAGTAATTATTCTTAAGAAATGGTGGGGGAAGATGTAA\n>XM_001704125.1 Giardia intestinalis Myotubularin-like protein (GL50803_008210), partial mRNA 
\nATGGTGCTTCTTGACGGGGAATTTATCGTCTTTCAACCGTTCTTAGCTGCTACATCCATACCATCTTACACAGAAGGAAATCTATGGCTTGATCCTTCCGAATACGCAACTGCCACAACCAACTTGCCTCCTTCAAACGGGCACCTTCTGGTTGCAGGACAGCTGTATCTGAATATTGTGCTGACGAACTACCGCATGTTGCTCTTTAGAGCAATTAGTCCAACGGAATTTACTCCCTTTGCAAGTATACCCCATTTTATGGTCGTTTCTATTTCTAAGATTGGAGGAAAGAAGTCACGCGACGCCTATGGTGTGCTAATTAGCCTCATTACACCTCTACAGTTTGCCGTCTTTTTGCCTCGACATAACAAACAGCGCACTATCTTTATCGGTACGCTACTAAAGTACGCATCACCCAGGCTCACTCTGACACACCTGTTTCCTTGCTTTTCTCTTTTCACGTCTCCTAAGGCAGAGAAAGGCTGGTTTATATACGATCCATTTGCAGAGTACTGTAGGCAAGGCGTGGGGACGCCGCGTTTAGATCTAGAGAAATTCATGAAGCCCTTTGATCTATCGGTGGTCAAGCGGCCACTAGGGACGCTTGGAATCAAGGCCTCAGATGTCAAAGACGGCATGTACCGCATTGTGACCGGAAACCCAAAGCTCATGGTGTGTATTCACGAGTATGAAGAAATGAGAAAGGAAAAGGAGCGGGCGCTCCCTTGTAATCCTGGACACGTTCCCTTTTGGTCGCTCACCGACGCAAACTTTGATTACTCAGTTTGTAACACTTATCCTTTCTTACTAGCAGTTCCTAGTCGTTACTCAGGAGAGAACAATCTTGACGCACTTCAGCTCGTTGCTGGGAATCGTTCTCATAGGAGACTCCCAGTGTTGGCGTGGAAGGACAAGGATGACCGCTACGGGGTCATTCTGCGTTCCTCTCAACCCTATAACCCAACAAAGAAAAGCGATAGCAAATTTGTGGCTGATAGAGCATACCTGCAACACATATGGCAACACTACGGCGCCCTGCATAAGAAGGAGAAGCTCTTAGTGATTGATGCTCGGACAAGAGCTAACATGCAGATGAACCAGTTTGTTGGTAGGGGAACGGAGGGGTATCCCTTTGTGCATGTGGAGTTTCTTGATATACCAGGATGTCAATACATTCAACAGAGGCATATTGCAGACTGTGCATTGTTTGCCTCCACACAAGATAATTTTCAATATCATCGCTTGGGGCGCGTCGGTGGCATTACTGAGGTACTCGGAGTTGATCCGCGTAACTACATATTGCAGGACACAGAGTGGATGAAGGTAGATGAAGTACAGACGACAAGGAGTCAGCAAGATTTCGTGGCAGATAATCAGCCACCTGCTGAACTTGTTAGTAGGGATAGAATCAGGGAGGATGGCGTTGATCATGAAAGCTCCGAATGTGATATCTCAGGGGTAGAGCAGCTATCTCCAAGTATAGACTTTAACACGATTGCAGTACCGCAATATGTCGGTAATGAAAATGTTGACCATAGCTGTCAGGCGGGCTCCTCCGTTGTTATGATTAGGACAAAATGGACTAGCACACGTCAGCTTGAAGAAGTACACAGACTTGTCATTGCAGGAGCCGTTTCTATATGCGAAAACATCATTCGAGGAACTGTGGTTCTTGTTCACTGTTCGGATGGCTGGGACAGGACCGCCCAGTTAGTCGCTCTTGCGATGCTTATGCTTGACCCCTATTATCGATCTATGAATGGCTTCTTTGTCTTAATAGAAAAGGAGTGGTGCTCGTTTGGACACAGGTTTTCTTCACGGTGCGGAATTCTACAAGTTAGCAATCAGGACCAGGAATCTCTTGAAGACGCTGATAGAGGAGACCTCTCATCGAGTCTATGCAGCCCTGTCTTCCTCCAATTTCTGGAGCTCGTCTACTACCTTTTGAGCGCATATCCGTCAGAGTTTGAGTTCACCGAAGAGGTTCTCAAGTACCTT
GCCTATCACACCTATAGTGCTCGATTTGGGACCTTTATCGGCGACTGTGAGCTAGATAGGCTCTTGTGCCAGCTTCCTATACGGACCGCCAGCATATGGGATCATCTGTTGGCATGTAAAGATCACTATACAAACAAAGGGTACTCGCCAGAGTCTATTCTGAAGAAAAATGGATGGGTGTATCTCAAGCTCAATTGCAACAGACAGCTTCCTGCTTGGCCAGGCTATTGGGAGCAGCACATACCTAAGCCTTAA\n>XM_022698119.2 PREDICTED: Brassica napus long chain acyl-CoA synthetase 1-like (LOC106386204), transcript variant X3, mRNA \nGGTTTGTACTTTGGTATTGTTAGGTTGACCGGGCTGGTCGCAATAAATGCCATTGTACCAATTACTCATAATAACAAAACTATGCAACTTATGTGTATATATAACAAAATTCAAGTACGGAGTACGCAGTCAGATTAATCAATGAAACTTTAGTATCTGTTTTCGCAACGATTATATATATTGTTCACAAATAATTCAATTTTATGAACATGCAAAATACGATAAAGACCCTCATTTTTAAACCAAGTTATTTCCTTTAATGATCTTTACCTATTTCACGTTTTTGTACCTAAAATTTTGAACCATTCGTCAGCTACGTCGGCGTTGGCTTCATTGTATATCTATCTCATTTATCCATCATTTCCGGTTTTTCTATCTAATACATTTCTTTAACATAAAGAAAATAGCTTCAGAGAGTTTCTCTTCAAAAAACGGAAAACAAAGAGAGAATGAAGTTTTTCGCGGCGAAGCTGGAAGAAGGAGTTAAAGGAGGAAACGGGAAGCCGTCGGTAGGTCCGGTGTACCGGAATCTTTTGTCGGAAAAAGGTTTTCCGCCTATGGATTCTGATATCACCACTGCTTGGGACGTTTTCAGTAAATCAGTGGAAAAATTCCCTTACAACAAGGTGCTTGGATGGCGTCGAATCGTCGATGAGAAGGTTGGACCGTATATGTGGAAAACTTACAAGGAAGCATACGGAGAAGTTCTGCAGATTGGTTCTGCAATACGTGCTCTGGGAGCTGAGCCTGGGTGTCGAGTGGGGATCTATGGAGTTAATTGTCCTCAGTGGATAATAGCAATGGAGATGACACATGAAGATGTGTATCTTTCCTTCTTGCCGTTGGCTCATATTCTTGACCGTATGAATGAGGAATACTTCTTTCGCAAAGGGGCTTCGGTTGGCTATTACCATGGAGATTTGAATGTGTTACGCGATGACATTCAAGAATTGAAACCAACTTATTTAGCTGGAGTTCCAAGAGTGTTTGAGAGAATTCACGAGGGAATTCAAAAGGCTCTTCAGGAACTTAATCCTAGAAGGAGATTTATCTTCAATGCTCTCTACCAACACAAGCTTTCATGGTTGAATCGTGGATACTCTCATAGTAAAGCTTCGCCCATGGCTGATTTCATAGCTTTCAGAAAGATTAGAGACAAATTGGGAGGTCGAATCAGGTTGCTAGTATCTGGAGGAGCACCATTGAGCTGTGAGATTGAAGAGTTCCTTAGAGTTACTTGTTGTTGCTTTGTCGTCCAAGGGTACGGTCTAACGGAGACTCTTGGAGGAACGGCTTTGGGTTTCCCGGACGAGATGTGTATGCTAGGGACAGTTGGTATTCCGGCCGTTTACAACGAGATACGACTTGAGGAGGTGGCTGAAATGGGCTACGACCCACTCGGGGAAATTCAGGCAGGCGAGATCTGTATAAGAGGAACATGTTTATTTTCTGGTTATTACAAGAACCCTGAACTTACTCAAGAAGTCATGAAAAACGGATGGTTCCATACAGGAGATATAGGTGAGATTCACCCAAATAGAGTACTCAAGATAATTGATCGCAAAAAGAATCTTATCAAACTCTCTCAAGGAGAGTACGTTGCTCTTGAGAACTTGG
AAAACATCTACGGTCAAAACTCTGTTGTCCAAGATATATGGGTTTATGGAGATAGCTTCAAATCAATGCTTGTAGCAGTGATTGTTCCAAATCCTGAAACCGTGAACCGGTGGGCTAAAGATCTCGGCTTTACTAAGCCATTCGAAGAACTATGCTCTCTCTCGGAATTACATGATGAACACATCATTTTAGAACTGAAGTCCACGGCAGAGAAAAACAAGCTAAGAAAGTTCGAGTATATAAAAGCAGTGACAGTGGAGACAAAACCTTTTGACGTTGAGAGAGACTTAGTGACTGCGACCCTCAAGAATCGAAGGAACAATCTTCTCAAGTATTATCAGTCCGCCAACGTTCCGTTATACAGGTACAAGTCGACGAAATGTACCGAAAATTGTCGTTGAAGAAAATGTGAAAGTGTTGCATGACCATCGATGTGTGTGTTATTATTGGTAACTATGTTATGTACGTATGTGTCAATCATTGATTAAAAAAGCCTTATGCGTTCTGTAATGTTTTAATTCTAAGCTATGTTGAATAACCATTGACATCATTAATTATTATTTTTTCTTTTGTTAA\n>XM_040148298.1 PREDICTED: Xiphias gladius tensin 1b (tns1b), transcript variant X3, mRNA \nGAGGCAGAGTGAGCACAGAGGAGAGGCTGTCAGGATCCAATTTAGGTTTAGAGGAGAGACACAGGAGGAGAAAGCAAGTCAGACAGTGAGGAAAAGGGAGAAACAGGAGCCCGAGGTGAAAGAAAGTGTTTATGTTCAGGATAGTCATGGCTCTGCAACGTTGGGAAACTCTTCTCCTGCCTGGATTAGACTTAAGGAAGACCAGTGGTCTGTAGCAGCAGCAGCAGCAGCAGCAGCAGCAGCAGCAGCATCATCACCAACACTCCTGTCCGTCAACATGCCGTCTGTCTCTCTCAGCCTGCCAGCAGCTCTGGCTGGACCTGCACGCACCTGGGTCTGCCTGTCCTGCATGTTCTGGCCAGAGGAGTTGGAGGCTCTTCATTCCCATACGTTCCGGGTGAAGACTTTCAAGAAGGCCAAGCACTGCAGCGTTTGTAAACAGACCATCATCCAGGACGGACTCGTCTGCCGAGTGTGCCGAATACCTTGCCACAAGAAATGTGAAGTCAAGGTGTCTTCATCTTGTGTTCCAGCAACAAACTATGAGCTGGCCCCAAGCGGTGACCTCCCTCTCAAACATGTAGACACCATGGGCTCAACAAAATCGTCAAAGAGCATGGAGTCACGGCGCAGACCATCAAGGAGTGTGAGTTTGCTGCAGGCTCTGGAAGAGAGCTACGAGTTGGACCTGATCTATATCACAGAGAGAATCATCTCCGTCTCCTTCCCCAGCAGTGTGGATGAGCAGAGTTATGCTGCTAACCTGCAGGAGGTCGCCTCCATGCTGCGCTCCAAACACGGTCACAACTACCTGCTCTTCAACCTCAGTGAGAAGCGTTATGACATCAGCCAACTTAATCCAAAGGTCTTGGACTTTGGCTGGCCTGACCACCATGCTCCAGCCCTGGACAAAATCTGCAGCATCTGCAAGGCCATGGACACTTGGCTGAGTGCGGACAGCCACAATGTGGTGGTTATACACAACAAGGGCAACCGGGGCAGAACGGGAGTGGTGGTGGCGGCCTACATGCATTACAGCAATATATCTGCCAGCGCTGACCAGGCTCTGGACAGGTTTGCCATGAAGCGCTTCTATGAAGACAAAGTGCTTCCTGTGGGCCAGCCATCACAGAAAAGATATGTAGAGTACTTCAGTGGCTTGCTCTCTGGACACATCAAGATCAACAACAAACCCTTGTTCCTTCATCATGTTATCATGCATGGCATCCCAAACTTCGAGTCTAAAGGGGGTTGTCGTCCTTTTCTCAAAATCTACCAGGCCATGCAGCCCGTCTACACATCTGGGATCTATAATGTTCAGGGCGACAGC
CAGACGAGCATCTGCATAACCATTGAACCTGGTCTTCTTCTGAAAGGGGACATCCTGCTGAAGTGCTACCACAAGCGCTACCGTAGCCCGTGCCGAGATGTGATATTCCGGGTGCAGTTTCACACCTGTGCCGTTCATGACCTGGGGATCATCTTCGGGAAGGATGAGCTTGATGAGACATTCAAAGATGAAAGGTTTCCAGAATATGGAAAAGTAGAGTTTATTTTCTCGTTTGGGCCAGAGAAAATACATGGTCAAGGTGTGGACCACCTGGAAAACGGGCCGAGCGTCTCGGTTGACTACAACACACAGGATCCCCTGATCCGCTGGGACTCGTATGAAAACTTCAATCAGAACTGTGAGGACACCACAGATGAAGTCATCCATACCCAAGGACCCCTGGACGGCAGCCTCTACGCCAAAGTTCGCAAAAAGGAGTCTGTTGAAGGAACAGTCACAGCAAATGGCCTGCCACCCACTGCTGTTGAACATGCCCTACCTGCGGTTGACCATGCCTTATCAGTAAGCAGCGACTCAGGAAACTCTACTGCCTCCATCAAAACTGACCGAACTGATGAAGCAGCAGCAGTCCCTCAGGTTTCCAGAGTGAGCCAGACACACGTTCCTGTGGTTGAGGAGTCACCATCAGTCCATCACCAAGCCCCACCTGCGCAACAACCAATTAGTCCCCAAGAGAAACAGGAGCTGGAGCAGCTGCTGAGTGGCTTGGAGGGGCCCATGCACCAACAGGGCTACCTGTCCACCCCAACATCAGCTGTTGGAGGGATGCTTCACCTGGTGCCTGCTCAGGTCCATGTCAATGGGCACACTAGCATTGACCGTGAAACAGACATTTTAGACGATGAGCTACCTACCAGTCAAGAGGGCAATAGTGTGGACAGTCTAGGAACATTCTCCTCCACAGATGGTAGGGCTACACCAGCTGATCTGTACTACCAGACTGAGTCCCTTGTCAATGGCCAGGACCATGTGCCATATCTAGAGCGCAGCGTCCCCGAAAAGCCTCTGGAAACCGTCCAGCCACATGTTGGCATATCTGACAAACCTGTCACTTTGACCCAAAGTGATTTAGCCAAATCATCTGGTACTTACATGGCCACCCAGAATGGCAGTCTGTACCGTTCTCAGTCATTTGGTGCAGAACCAAAATCTATGCCACAAGCTCCAACCCGCACCACCAGTAGCAGGGATGCCGTCCAGCGTGGTCTTAACGTTTGGCAGCAGTTTGGTGTACCTGATGAGCCAGTAACTGAAGGGTTCACTTTTAGTCCACCTCCTTCTGTAGCAGTGATGCCCAGCCACCACAGTCTCCCACAGTTCCCTCATCGCCACAGCACCTCCCAGCAAGAAATTGAGCAATCTATTGAAACCCTTAATCTCCTCATGTTGGACCTGGAACCAGGGTGTTCGCTGGTGCCAAAGTCCCAAAGTGCTCCACTGCGGGAAAACAGTGTTGTAGTGACCACCCAGCCGTCCTTTTCCCAGAGCCAAACCAGGCCCACCTACCAGGGTGATGCCGCCATTCATACCCACTTTTCGGGTCCCATGTCCAGCCTGGCAAGCCACTCGTCAACAGCTCAGATGTCACCTGGGAAGCCTAGAACACCAGAGCCTGCACCTGCCCAGGGATCTCTGAGTTACAGCTCTGAAACCTCTGGAACTAGTCCTCCCTCACAAGACTCCCTTCCTGTAGCAGGCCACGTCCAGCTGAAGCCCATCAACACCTACCCTCCAAGCACACTGTCCCATTCTGCAGACATCTCTGAGGCCCAGAGAAGCCCTAGTGCTGCGTCAGCATCACTCCAGCCAAGGGACAGTGAGCCCGATGAAGTCTTCAATGTTGAAGGTCTGGTGGCTCAAAGAGTGGCTGAATACTCGGCTCGTGCCCAAAGTGTCATCCCCAGCATGACCTCTTCTCAGTCTGAGCACCGCCGTTCTCACTCCCTCCCGGGTGTCCAGGCCCGTGCAGTGTCCTTGGA
TGAGCCTGCAACTCTGCCTCGCCATCGCATCGTCAGTGACGGCCATTATCAAAATGGCCCTGACGACAGTCCCTCACCTGATATCCTAGTTCGTTCCCCCATTCGATGCGTTTCTCCAGAGTTTGCCAATGCCATAGCGATGAACCCCGGAGGACGGCCTAAGGAGAGAAATATGCACAGCTACCGGGAGGCCTTTGAGGAAATGGAAGGAGTCCCCATTAATCCTACACCCACAGTTGGTGGTGAGGTGTTTCCCCAAACCCCTGCCTTCCCCATCTCGCCGCAAACCCCTTACTTCAACCTGTGTCGGTCCCCTCCTGGTCTTGCCAAGACTCCGCTGTCAGCCCTGGGATTGAAGCCCCACAACCCAGCAGAAATCCTCCTGAATCAAACAGGCTCAGATGATGAGAGCAGTGAGGGTGAGGAAGCACCAAGAAGCTATGTTGAGTCTGTGGCGAGGTCGGCAGTAGCAGGTGGAGAGCAGCCCACATCACCTCTGAGCCTTAGCCCACTGGGAGAGACTACAAGCCAGCAGAGAGGTCCAAGTCAATCGACCCACACACTGAACCCACCTTTGTCCAGCAGCAGTCCCTTCCAGAGCTCACAGGGTGAACACCCCTCAGCACACTGCAATGTTAGCACTCCGTCCCAACCCACTACTGATTCGAGCTTCCGCTCCCAGGCTACAGAGAGTGCCTACCCCACTCCAACCCCCTCATGTCCAGCCGTGAATACTCCCACCTCTTCCTACCTGGATTCCAGCTCTCCAGCCTCTTCCTACCTTGGCACTACTACCCCCACACTGTCCTACCTTGGCCCCAACAACCTCCTGGGAAACTATGTTGCCTCAGATCCAAGCCTGTCCACCTCAGAACCCTCCCAGACCACACTCAGCCATGGAAGTCCCCATGCACAGCACTGGACCAACACCCTTAGCTCCACTCATAGTCCTGTCCTCCAGCAGCGCTCGAGTGCTAATCAGGATGGCTCCATCATGGGTCAACAAACATCAACAGCTAATGGCTTTGATGTGGGCATGCCAGGCCTCATGACAGGTGGCAGTCCCATCCTCGGTCATCGTCTGTCTCAGGGAGCTCAGAATAGCCCAGTCCTCAGCAGACAGGCCTCTTTGGGACAGGGGTCTCAGCGGAGCCCTGTCTTCAGCAGACAGCCGTCCCTGGGTCAGCCCATACAGAGCAGCCCTGTGCTCAGCCGACAGCCATCTATCACACACCCCCAAGGAAGTCCGGTTTTGGGCCGTCACCCATCTGTGTCACAGGTGTCCCAGAGAAGCCCCAGTTTGGACCGTCACCCCATGCACAGCGGTTACACCACCCCAGATGAGAGACATGGGAACCTGTCGAGACAGAGCAGCTCTTCGGGCTACCAGGGGCCACCCACTCCCTCCTTCCCCATCTCGCCTGCAGGCTACCAGGATGGGGGGATGATGGGGACGGGTGTAGGGTTCAGGCAGGGTAGCCCAGCCCCTGGTCTCCAGCCCCAGCTTCCAGAGAAGAGGCGCATGTCTAGCGACGACAGACCAAACGGAGCTCTGTCCTATGGCACGCTAAACGGAAAAATAATGTCCCCAGTGAGTGGAGGAAGCACTCCCAGCTACTTCCACACCCTCTCAGACTTCTCCAAGTTCAATATGCCCGACGAAAGCCCTGAGAGCAGGCTGAATGTCAAGTTCGTCCAAGACACGTCCAAGTTCTGGTACAAGCCAGACATTTCCAGGGAACAAGCTATTAGCCTGCTGAGAGAGAGGGAACCTGGAGCCTTTGTTATTCGGGACAGTCACTCGTTCAGGGGGGCGTACGGCTTGGCTATGAAGGTGGCCTCTCCCCCGCCCTCCGTGCATCAGAACAAGAAAGGTGACATCGCCAATGAGCTGGTGAGGCACTTCCTGATCGAGAGCAGCCCGAAAGGAGTGAAGCTGAAGGGTTGTCCAAACGAGCCTTACTTTGGCTGCCTGTCTGCTTTGGTCTACCAACATGCTA
TCACACCATTGGCCCTGCCCTGCAAGCTGCTCATCCCTACCACAGATCTCATTGAGGAAGCACCAGAGGTCGCAACAACAAATCCACTGGCTGAGAGGCTGAAACAAGGAGCAGTGCAGAGGGCCCCTGCTGATTCCCATGCATGCAACGTGCTCTACATCAACTCAGTAGAGATGGAGTCCCTGACGGGCCCTCAGGCTGTTGCCAAGGCCATATCTGAGACACTGGCTGCCGCCTCTCCACCTACAGCCACCATTGTGCACTTCAAGGTGTCTTCACAAGGCATCACGCTGACTGACAACCAGAGGAAGCTTTTCTTCCGACGCCACTACCCCGGCAACACTGTCACGTTCTGCGATATTGACCCTCAGGACAGAAAGTGGAACAAGCCTGAGGGAGGCACAGCCAAGCTGTTTGGGTTTGTGGCGCGTAAGCAGGGAAGCACAACCGACAACGTCAGCCACCTCTTCGCTGAGATGGATCCCGACCAGCCTGCCAGCGCCATCGTCAACTTCGTCTTGAAGATGATCGCCTCGCAGAAACAATGAGAGCTGTCAGCAAACCCTGGCGCTTTTTTTTAATGCCTTTGGTTATTTTCTTTCCTTTTAACCACAGACACTTTCTGTTTTGGAAAATTTGCGTTTGACGCACCACCTTGTTTTTCCTGCTCTTTTACATTTAGGCAATTGTGTAGCTGTGTGTGTTTGTGTATGTAAGCGAATGAAAGAGAGCAAGACAGAGTGTGTGTGTGCGTGTGTGGTGTGTTCGTGCGTATGCGGCTTGCATTCATGTGCTTTTCTTCTTGGATGGACTCCAGAATGGACCAGAGGAAGTGCAGGATGGGGAAGTGGCTGTGTGTGACAATGGGATGGGAGGTGATTTTAATCTCCCTGGCAGGGTAACTCATGGACAGGAAGAGGGAATGAAATTGTGTGTGCAAATGTTATTTTTTTAGCAATTGTTTCATTTTTATTTTTTTAAAGAAGAAGTGAAGTTGTGTGATGTAAAAGTGGGTTGTATATCTATCAGGCTTTTGACTGGTCAACCAAAGATTTTAAAAAAGTTGTCAGGGCGTGTATAGTGTGCCATTGTCAGAGGGTCAGAAGTATTTTGTAAAACAAATATGGCTGCTTAATCAAAAATACTGAACTGTTTCTTTCTGTATGTACTGGTCAATTCTGCATCTTGCAAACAATGTTTTCGGACATTTTTGCAGCTGGTGAGGTCTATGTAAATATTCTAGATTGCTTTATGAGTAGGACTGTTCTAGATGACATTTGGTGCCTGACTTTTTTTCTAATGCAGAGCTTTTTAAGAAAAAAGAAGAAGATCAATCTCACCCAGGCTGTCTTAAATATGCAAATAGCCAAACTTTGAAATAAGGTTGTTCTCCCAAATTCCACAGGTCCTTCCCTGTTCGACGTAGTAGCGTAGCTAAAGATGCAACTGATGTAATTCCTCTGAAGTGCAGCTAGAGTCTGACAAAATCGGCTAAACCTGTTTTTCGTGAATTTGCTGTATCCAAGTGAGCATCAGTAAGAAGGCCACTGAATCCTCAACAATCACGTCTCGGGATTCTGTTGGTCAGACAAGCTTCCTGTCTGCCACCATCCTCTGTTCAGTCTGCACAGCACATAGCCACACTATTTTGCTCATGATTGAAGGGCCAAGGGTTGTTTTATGGGGACAATCTTAATAGAGAAGTGTTGTCCTGCTATACTGCTCTTCAGTTTTCTGTGTTGAAAGTTTCCGTCAATAGAAAGAAGCTCTTTGCGTCAGCCGGCCAAAACTGTTAACACTCACACCCTACCCAAAAGTAAGCTATACATATAAATAAACATATATAGATATATATAAAAACTTCCAAACAGTGACTTAAGATATTTATTTTTTTGCTTTGTTGCTGTATCTTATCTTGTATACATGTATTATAAAGCATACACCAAGATTACTGAACGCGTGAAGAAAAAAAATGCTTTTTATTTTGGCTAAAGTCAAGA
GCATTGACATATATAAGGTGTAAAGTGTGTGCATTTAAAAGTGTATCACTGTTGTTTTTGAATGTTTTTATTTCACATTATTACTTCCTTTTGTTAACCTTTTGTTTTCTTGGGGAGGCTTTTTGTTGTTTTTTTGTTGTTTTTTTTTTTTAAGAGAGGGGAAATATTTTGTATGACAGATTGTTGTTACTGAAGTCCAAATTGGAGTTATCCTAAAGTGATGCCAACAAAATTGTTTTATTAACTTAAACCTGCCTAGAAAATACGTTGTCCAATTTAAGCACTTAAATGTTGAGCTATTCTCATTGTGTTTCTACAGAAAGACGAGATATGGACGTTGACAGACCCATTTCATATCATCACTGCATGTGTGGGGGGAAGACTTGCTAGTTCCTCAATCCCCACAGCCTGGGACTGATCCTTGTACATGGAACATTATTAAGTTCAGTCAGTAGCTGCTGCCCTCATGTGGTGTGGAACGCTCATTACAAAGGAACCACTTTTATTCTAATACAGTGTTTTAGCTGTGATTACGGCAGGTCAAAGGGTAAATGTTTGAGTTAAATTTGATCACTGAGAAAATGAACTAAAACTACGTTAATTTAAATGCTGATTCTTATGCTAACTTTCTTAGAAAATTTGTTTTTTGTTTGCATTTCAAAGTCCCATTCAAGGATTGAGTGTGTCGAGATCACATCTCCTTTCTTTACGCCTGATACACTAGGATCAGTTGGCAGCATGATGTAAAATAATTAGATAAGGGTTAGTTTTTTGGGCCTACATTGACTCAAATGTACTCCTTCAAAAATATAAAAAAAATAAGAAATACAGCACTTACAGGACTTTTATATCTGACTAGAATATTCCATTATTTATTAGCAGGCTCCTGCACGCTCAAGTCAGCTTGCCACCTTAGTGCTGCTGACTGTAATGTGTACACAGTATCCTCAAGTCTTACACGACCAGTCTTTTCAGAAAGATGCCCATAGTTAGTTATCATCAGGTTTTGATTATCATGTGACGACTGTGTCTTGACTCTGCTTATGAGACAAAACAATCTATATTTTTGCCTACAAAATGCTTGTTGAGAGGACTCCCTCTTCTTCAAACTGAATGTTAGCCATTTGTTTGCCAAGATGGAAACTCCAGTGGCATCTGCCCACTTTGACAGATCAGTCTGGACTGTAGAATGTGTGTGAATGAGCTACTATGTCTGTACAGAGCTTTGTCATTTTTGATTTGCTACATTGTATGGCTTTTACTATTTCTGATGGAAAAAAAACACATTAAAAAGCAGTACAAATCAAAA\n>XM_044234934.1 PREDICTED: Neovison vison P2Y receptor family member 8 (P2RY8), mRNA 
\nGCCAGGATGGATATGAACATGACCCGGCCGGACAACGCCACCATCGTGATGCTGCGCGACCCGACCATCGCGGTGGTCCTGCCCGTCGTGTACTCGCTGGTGGCGCTGGTCAGCATCCCGGGCAACCTCTTCTCCCTGTGGGTCCTGTGCTGCCACATCGGGCCCAAGTCCCCGTCGGTCATCTTCATGATCAACCTGAGCGTCACGGACCTGATGCTGGCCAGCGTGCTCCCTTTCCAGATCTACTACCACTGCAACGGGAACCACTGGGTGTTCGGGGAGCTGCTGTGCAACGTGGTCACCGTGGCCTTCTACGCCAACATGTACTCGTCCATCCTCACCATGACGTGCATCAGCGTGGAGCGCTTTCTGGGCGTCGTGTACCCGCTGGCCTCGGCGCGCTGGCGCCGGCGCCGCTACGCCGTGGCCGCCTGCGCCTGCGTCTGGCTGCTGCTGCTGGCCGCGCTGTCCCCGCTGGCGCGCACCGACCTCACCTACACCGTGGAGGCGCTGGGCATCGTCACCTGCTTCGACGTGCTCAAGTCCACCATGCTGCCCAGCGTGGCCATGTGGGCCATCTTCCTCTTCACGCTGTTCATTGTGCTGTTCTTCATCCCCTTCGTGGTCACCGTGGCCTGCTACACGGCCACCATCCTGACGCTGCTGCGCGCCTCGGACCCGCACGGCCGCGGCCAGCGGCGCCGCGCCGTGAGCCTGGCCGTCGTGGTGCTGCTGGCCTTCGTCACCTGCTTCGCGCCCAACAACTTCGTCCTGCTGGTGCACATGGTCAGCCGCCTGTTCCTGGGCCGCAGCTACTACCACGTGTACAAGCTCACGCTCTGCCTCAGCTGCGTGAACAACTGCCTGGACCCCTTCGTGTACTATTTCGCGTCCCGCGAGTTCCAGCTGCGGCTGCGGCGCTATCTGGGCTACGGGCGGCTGCAGGCCTGCGGCCGGGACGCGCGCAGGGATCCCCTGTTCTCTGCCCGGACGCTGTCGGCGCGCTCCATGTCCAGCGGCCACGGCGACGGGCTGGACGGCCCCAGCCGGCCCTGCCTGCAGAGGCAGGAGAGCGTGTTCTGA\n>XM_006814478.1 PREDICTED: Saccoglossus kowalevskii uncharacterized LOC102803486 (LOC102803486), mRNA 
\nATGATATCAGATAACGCGTCTACATATCTGTCTGCTGCTAATGAAATTAAACGATTATTGGATTCCCCTGAAATTCAAACCTATCTTACGAACAGACGCGTGCAATGGTCATTCATACCCAAACGAGCACCGTGGTTCGAGGGTTTTTGGGAGCGTTTGATTGGCCTCGCCAAAACTGCTATAAAGAAAGTCTTGGGTCGTTCATTCGTAACATACGACGAACTCAATACTATCATAACTGAAATCGAATCTACTCTAAACGACCGTCCCCTGACGTATGTGTCTACGGACATTGACGACGCAACCCCGCTCACTCCGTCACATTTATTAATTGGTCGCTTGGTTACGCCACTTCCGCATTTCGTCGTGGACGACGATGAATTATCTGACCCGACATTTGGAAACCGACTAGATCTCGAGAAACGCCACGCTCATATATGTAAATTACTAGAACAATTTTGGAAACGTTGGACTAGCGAATACCTCACGTCTTTGCGAGAACGACACAACAATACGGTTGGTGCAACGGACAATACAATTAAGGTCGGTGATGTTGTGTTAATGCATAGTGATATCGCTCGTCGTGTAAATTGGCGTTTAGCCACCGTTCAAAGATTAAATGTCGGAAATGATGGACTTGCACGTTCTGCTGAACTCAAGACTACCAGTGGATTTACAAACAGACCGATTACGAAACTATATCCCTTAGAAGCATGTGGGAACAACGCGCCCACGCTATCTATCGAAAAATCTCTTGCTGTGAAGTCTGTTCTACCCGGAATTAATGAAACTGTTACTCGCTGTCCACCCAGAACAGCCGCGACTATAGCCCGACTACGCATTCAGGACATGAACGATATGTGA\n>XM_026561538.1 PREDICTED: Papaver somniferum uncharacterized LOC113312801 (LOC113312801), mRNA \nATGTTACACCATAAGTGTACTAATGGGTTGAGTAACAAAGCTTTTGACGAGTATTGTACTATATTACAGTCCACGAAAGCTTTTCTAGATAGCAGTATCCCTAAGAATTACTATGAAGCAAAAAAACAAATTCGAGATCTTGGTGTGGAATGTATTAAAATAGATGTATGCCCAAATGATTGTATGTTATATTGGAAGGATAATCGTGATAAGGAAAGGTGCGACGCCTGTGGTGAGTCTAGATGGATATCAGGTACTTGTCAATCTGGAGAAAAAGAAGCAAGTGGAAAACAGAAAGTCAAGAGAAAAGTTGCCAGGGTTTTGAGATGGTTTCCGTTAATACCACGGCTTCAAAGGTATTATATGGACCCTAAAACCGCAGAGGATATGATATGGCATGATAAAGAGCGTACCAAAGATGGTGTTTTAAGGCATCCGGCAGACTCGCAATGTTGGAAAACCTTGGACGAAAAGCATCGGGTATTTGGTTCAGAACGTCGCAATGTTAGACTCGGGTTGGCAAGTGATGGGTTCAATTCTTTTGGTGTTATGGGTACTGGTCACAGTACATGGCCAGTCTTTGTTACTTCTTATAATTTGTCACCAGAGAAGTGTATGAAGCAACCCTATTTTATCATGTTTCTGCTTATTCCTGGGCCTAAGGGTCCTGGGAATAATATTGATGTATACTTACAGCCACTAATCGGAGAGCTAAAGGAATTGTGGGAAATGGGAATTGAGACGTATGATGCTTATTCCAAGCAGAACTTCCAAATGCGTGCAACTCTCTTATGGACTATTAATGACTTTCCAGCATATACCAACCTGTCAGGATGGAGGCACCGGAGATTCTTACCTATTGGTCATCCGTTACGAAGAAACCTGAGCTCTTTTAATGGCCGCAGAGAACATGATAGTGCACCAAAACCTTTAAGCGGTGAGGATGTTCTTCGGCAGTTCCGTGGTTATCATCAAATCACTTTTGGCAAGGAAGAACATGCTGTGTGTGGGGAGAAAAGAAGGAGGGATGACAA
TGAGCTGCCTTATAATTGGAAGAAGATAAGCATTTTCTTCGAACTACCTTACTGGAAAGATCTTCTCTTACGACACAATATTGATGTGATGCATACCGAGAAGAACAACAGTGAGAGTTGGATAGGGACACTGTTGAACATAGAAGGTAAGACAAAAGATAACTTGAACGCTCGGGAAGATTTGAAAGTAGTGGGTATACGTGGACCACTTCACCCTGAAGCTTTGGGGAACAACAAATTCTACCTTCCTCCAGCAAAGTATACCTTGTCTTTGGCGGAGAGGAGGAAGATTTGTCAATTCTTGCGTGACATAAAGGTACCCGATAGTTATTCATCGAATATTTCGCGGCACGTTCAGGTACAAGAATGCAAGATTCCCGGGCTAAAGAGTCATGACTGGCATGTTCTCATGCAACAACTTTTTCTTGTTGCGGTGCGTGGTATCTTACACGATGACGTGACTAGAGTTTTAGTTGAGTTTTCTGATTTTTATACTCAATTATGCTCCAAGACATTGAGAATCGAAGATTTGGAGGCGCTTAAAAAAATGTATCTCACTTTGTGCAAAATGGAGATGATATTCCCTCCTTCGTTTTTCGATATTATGACACACTTGCCTGTTCATATAGCAAGAGAAGCTATAATTGCTGGACCTGTTCATTACCGGTGGATGTATCCAATCGAACGGTACTTGTACACCTTGAAAAAGTATGTGCGAAATAAAAGTCAACCTGAGGGATCGATTGCACAAGGGTATCTTGCTGATGAATGTCTGACATTTTTCTCCAGATACTTGAGTGCTGAGATTAATACAAAGTTCAACCAGATAGGGAGAAATAGTGATGGTGATGGTGCGACGACATCTAGTCATGAATCGCCTATCTTTGAAGACGCATGTCGTTCTTTAGGGAAACCAATTTTCCGAACTTTATCTGACAATGAGTGGGAGGAAGCCCGAATGTATGTGTTGAGTAATTGTGATGAAATTCTTCCGTTCATCGAGTAA\n>LC340153.1 Symphorichthys spilurus mitochondrial gene for 12S rRNA, partial sequence, specimen_voucher: KAUM:I:93808 \nCACCGCGGTTATACGAGAGACCCAAGTTGTTTAACAACGGCGTAAAGAGTGGTTAAGATCTAAACTTATATTAAAGCCGAACGCCTTCAGAGCTGTTATACGCATCCGAAGGTATGAAGTCCAACCACGAAAGTGGCTTTATAACATCTGAACCCACGAAAGCTACGGCA\n>MF223903.1 Uncultured bacterium clone denovo5551_560_46813 16S ribosomal RNA gene, partial sequence \nTTTTTCCTACGGGGCGCAGCAGTGAGGAATATTGGTCAATGGGCGGGAGCCTGAACCAGCCACGCCGCGTGAGGGAAGAAGGTACAGCGTATCGTAAACCTCTTTTGTCAGGGAACAAAGGCGGGGACTAGTCCCCGGATGAGGGTACCTGAAGAAAAAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATGCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGCAGGCGGCCTGGTAAGTCAGCGGTAAAAGCCCGGGGCGCAACCCCGGCTAGCCGTTGAAACTGG\n>XM_024271454.2 PREDICTED: Oryzias melastigma visual system homeobox 2 (vsx2), transcript variant X2, mRNA 
\nTCCAAGCATGCTGAATATCCTCCTCATCCTCGTTCCCTGCAAAATGCAATAGGAGAGGGAGTAACTGCATCCATGATCCACTGGAATCCTGAATCCTTGCAGCTGATTGGCTGCTGCGGGCTGCCTCTTGTTGGGATGGACCTGTTGGATAAAAGGAGAATTTTCTAAAGGACTATGTGATACAGAGGATGTTGTGCGGGGGACAGTCCAGTTAGACGCTTTTTTTTCAGAAGAAAAACAAACAAACCATAACGTCATGACGGGGAAACAGGGCGCCGCGCTGTCGGAAAGTTTAGAGAAAACCTCTCTGGTCGTGAACGGCGGGAGCCTCCAGCCCAAAAGCAGCAACCCTCCACCCAGATGCACCGGCTTTGGCATCCAGGAGATTCTGGGGCTGAACAAGGAGCCGGCCAGCGCGCCGAGGAGCCCTCTGAGCGCGCTGCCGGCCGGGGCGCACCTGATCGCGGCGCGGTCGGTGCTGGGACCCGCCGGCGTGGGTGTCGGGATGGGATTAATCGGCCCCGCCGGGATTCCGTCGTTCTACAGCCAACCCGCCTTTCTGGAGACGGTGCTGGCGGACGGACACGACATGCGCCTGCAGCCGCACAACAGGTCTGCGAGGCCGCTGGACGCCAGCCAGTCCGTCAGCTCAGATTCCGAAGATTTATCTTCCAGTGAACGGAAACTTTCCAAATCATCAGTAAATCAAAGCAAGAAACGCAAGAAAAGACGCCATCGAACCATTTTTACATCATACCAACTGGAGGAACTGGAAAAGGCCTTTAACGAAGCGCACTACCCGGATGTTTACGCGCGAGAGATGCTGGCTATGAAAACAGAGCTGCCTGAAGACAGAATACAGGTCTGGTTTCAGAACCGCAGAGCCAAGTGGAGGAAGAGGGAGAAGTGCTGGGGCCGCAGCACAGTCATGGCGGAGTACGGCCTGTACGGAGCCATGGTGAGGCATTCCATCCCTCTGCCAGAGTCCATCCTCAAGTCTGCCAAGGATGGCATCATGGAGTCCTGTGCTCCCTGGCTGCTCGGGATGCATAAAAAGTCCATGGAAGCAGCAACTCTCCCGGCAACAGCAAAGTGCGATGCCCCCCAGCAAGCAAGCACACAAAGGCCGGAGGACGTTGAGGCAGAGGAGAAGAGGTCGGACGGCAAGTCCAGCATATCTAAAGAGGAAATGAGGGAGAACAGCATCGCTGCACTCAGGGCCAAAGCACAGGAGCACAGTGCCAAAGTGCTGGGGACAGTTTCTCATGACAAACTGCTGGAAGGCAAACAGGAGAAACAGGCGGTTGGGGAGAAGGTCAGTGACCCACCGAGCCCGTCAGAGGAGCAGAAAAGTCCCTAAAGAAACACATTTTGTGAATACTGTGGACCGACAGCTGTCGAAGCAAAAACAGACTCAATGATCTCCACTAAAGATATATAGCCCGCATCCAGACCGCTCTGAAGGAGAACTTTGATGATTCTTCTGCTGCACAGAAGTTGAAATTCGCACTTTTTCTGGTTTGCTTCTGAAACCCACTCTTGTCTGCAGTAGAGGAGACTGAATAAAAGTAGGAAATGATGTACAGAAATGAGACAATTAAAGGTTGAATCAATGGATCAGCTTAAGCACATACAGGAGGAGGAATTAGAAATTAAAGTGTGCAAAAATATGTTCCATTTCACATTTATTCTAAACCTGCTTGTACAATAAATGTGACATTTTAGAGGAGACCCATCCCACTGACAGTAAGAAAGTCAATGTTGTCTTACATGCCGCTGTATAAAAGTGATTTACAACGAAGGCACAACTTTTAAAGAACATTTTCTTCTTGTCTTAAAATGTCTGTGTTTTAATTTTAAATATGTAGAGGTCAAATTTCAAAGCATA\n>XM_039993337.1 PREDICTED: Panicum virgatum casein kinase 1-like protein HD16 (LOC120708211), mRNA 
\nACGGGAAGGCTTCAAAAAGCCAGCACTCCTCCTCTCCCTTCCAGACAGCCAGCCAGCCAGCCACAGCGCAGCGGTGTGTGTCTGCGGGAGAGACCAAACACCAACCTCCCACCATCCCGACCCATCCCTCCCCGCATCCCCACCTCGCCGCCGCCGCCGCTGCCGCCCGCACGGTCTCTTCTCCCGAGATTCGTTGGCGATTGGAAGTGCATGGGGAGAAAGGATGCCAGAGTTGCGTAGTGGAGTCCGGCAATCTCGGTTGAGGGCAAAGAAGGTTCAGGATCTCGTGGCACAGGACCCTACGGACAACTTGGTTGCTGCAGCACCTACGGTGGCAGGAAGGCGTGGTAGAGGAAGGGGTGGTAGGGGTGGAGGGAGAGGAGCAGCACGGGGAAGGGGAGGAAGAGGGCGAGGTGTTCCGGTGATTGACTTGGACCCCGACCAACCTTGTGGGGTTTTTCCAGGAGCTGCTCTGGGTGGTCGTGCTGCAGGTAGGGCACAGCCCATTGAGGAATTTGCTGATAGGGCTTTGAAGATGGATGGTGGGAGTGCTGAGAAGATTGCTGGCGGTGAAGATGATGGGACTGTAACCCCTGTCCCAGAGAAGGTTCAAGTAGGTCATTCTCCGCAATACAAGGTAGAGCGGAAGTTGGGCAAAGGTGGTTTTGGTCAAGTTTATGTTGGCAGAAGGATTTCTGGAGGAACAGAGCGTACCGGACCTGAAGCTTACGAGGTTGCTTTGAAATTTGAGCACCGCAACAGTAAGGGTTGCAATTATGGCCCTCCATATGAGTGGCAAGTTTATAGTGCTCTGAACGGTTGCTATGGTGTACCTTGGGTTCATTACAAAGGCCGGCAAGGGGATTACTATGTTCTGGTGATGGATATTCTAGGACCTAGCCTTTGGGATGTCTGGAATTCATTTGGGCAGACGATGACAGCTAATATGGTCGCTTGCATAGCTGTAGAAGCAATTTCTATACTTGAGAAACTCCATGCAAAAGGGTTTGTTCATGGAGATGTTAAACCTGAGAATTTTCTACTTGGCCAACCTGGATCACCTGATGAGAAAAAACTTTTTTTAATTGATCTTGGATTAGCATCTAGATGGAAGGAAGGAGGACCATCTGGGCAACATGTTGAATATGATCAGAAGCCAGATATTTTCAGAGGTACAATAAGATATGCTAGTGTCCATGCCCATTTAGGACGTACTGGTAGCAGAAGGGATGATCTGGAATCATTAGCATATACGTTGATATTTCTTCTCAGAGGGAGGTTACCGTGGCAAGGCTATCAGGGTGAGAACAAGAGTTTTCTTGTTTGCAAGAAGAAAATGGCTACGTCTCCAGATCTACTATGCTGTTTTTGCCCACCTCCATTCAAACTCTTCCTGGAGTCCGTGACAAATATGAGATTTGATGAAGAACCAAATTACTCGAAGCTTATTTCCCTTTTCGATGAATTGATTGAGCCCCAGCATTTGAGGCCTATTAGAATTGATGGTGCATTAAAGGCTGGACAAAAACGTGGAAGATTGCTTGTAAATCTAGAAGAAGATGAGCAACCGAAGAAGAAAGTTAGACTTGGGAGCCCAGCAAACCAGTGGATTTCAGTTTATAACGCTAGAAGGCCCATGAAGCAGAGATACCATTACAATGTAGCAGATGCCAGACTTCATCAACACGTAGAGAAGGGTAATGAAGATGGATTGTTCATTAGTTCAGTCGCATCTTCAGCAAACCTTTGGGCCCTCATTATGGACGCAGGAACTGGTTTCACATCTCAGGTTTATGAACTTTCACCCATATTCCTTCATAAGGATTGGATTATGGAGCAGTGGGAAAATAACTACTACATCAGTGCCATAGCCGGTGCAACGAACGGTAGTTCCTTGGTGGTCATGTCAAAAGGAACTCCATACACTCAACAGTCTTACAAAGTTAGTGAATCATTCCCCTACAAATGGATCAACAAGAAATGGAAAGAAGGTTTTCA
TGTTACATCAATGACAACTGCAGGAAGCCGCTGGGGTGTAGTTATGTCGAGGAACTCTGGATATTCTGAACAGGTAGTAGAATTGGATTTTCTTTATCCTAGTGAAGGTATCCACCGACGATGGGAAAACGGGTATAGAATAACTTCTACAGCAGCCACTGGTGATCAAGCTGCTTTTATATTGAGTATACCCAAAAGAAAGTTGATGGACGAGACACAAGAAACCCTTAGAACATCAGCTTTTCCAAGCAACCATGTGAAGGAGAAATGGGCCAAAAATCTTTACATTGCTTCAATATGCTATGGCCGGACAGTGTCATGAGGCTTGCTCGGCACTTCATCCCAAATCGGGAGAGAACATATTCAGATGAGTAGATATCAGAAAAATCAGCAATTTTTGTTGCTGGTCTCTGTTACTCTGTATGTGTAGGTAAACTGGTCAAGATGAACCACCTTACCATGGCCAGAGTAGGAGCTCAAGAAAGAAAAGGAAGGTAGGTGGAAAGCAAGCAGCCAATAAGCAGGCGTGGAGGATGTACCCGGCTAGTGGCGGTGCAGACGCCGATGGTGTCAACTGTTTTGCATCAGCGTGTTTTGCACTTTTGCTTCGCTCCTGACTGCTGTGCAAGAGTAGACAGCTTGTAGCCTCCGTTCGGAGGCAAGTCAATCTGAGAACCCATTGTGTATAGCGTATCATGTCATTGCATTTTGTTTAGTGGAAGCCAAGTTCCACGTTTCTGGAACTCAGGAAATGCTAAGTTATTGTGTGAGGAGAACAAGTGTACTGATAAAATTCGGTGTATCGATTCCATTATTTGATAATTCTCATTGCAGTAATTAATGCAATAATGTTGCATGACT\n>XM_003142805.1 Loa loa hypothetical protein partial mRNA \nATGCTGAATGATACAGAAAATGAAGAAATTAAGGAAGATGGAAATGTTGAATTAATCATAGAGATTGATGAGAAGAAAATTGATTACTGTAGATATGATGTCGTAAATGTGATATACTATTTATCAGTGGCAGATTCCAATAATTATACAATTATTTGCATCAACCTGCTTAGTTACGGTAAAAGTCGTTCTCTAGACCGACAACACGAAGTAAATCGATGTATGAGGAATGTATCTTTTTGTGTGGAGCTTATGCAGGGGGAAGATCCTCGAACAGCAATACATATTGCTAGACAAGGAAAACAGCTCGTCAACGGTGTGATTTTGTTGGCCATAGCTGCTTTCATTGATCTACGTGGAACACGCGTTTTCCGTGGTGTAACTTTGATCAAAACATTGAATTTCTCGGAAATTGGAAACAAATTAGTGGGAAGACTAGATTGGCATTTGCCGATAAAAATGCGTACATAA\n>XM_050796503.1 PREDICTED: Macaca thibetana thibetana RPGR interacting protein 1 (LOC126958262), transcript variant X8, mRNA 
\nAGTAGGACTCAAAAGTTCCAAGGCAGTTGGTAAATGACAGTTATGAATAAAGCAAGGGGCAGAAAAAAACATGTAGGGGAATGAATGAGGAACTAGGTCCAGGAGATGCTGAACCTGGATAATAAAGACGTCATATCACACACCTTGGGGTATCCATCTGAGAGCTTGCTTTCTGTTGTCAGCATGCTGGACAGCAGTAGTCAGCCCCACTGGAGCAACGAGCTCATAGCAGAACAGCTGCAGCAGCAAGTCTCTCAGCTGCAGGATCAGCTGGATGCTGAGCTGGAGGAGAAAAGAAAAGTTTTACTTGATCTGTCCAGGGAGAAAGCCCAAAATGAGGATCTGAAGCTTGAAGTCACCAACATACTTCAGAAGCATAAACAGGAAGTAGAGCTCCTCCAAAAGGCAGCCACAATTTCCCAACCTCCTGACAGCCAATCTGAAGCAGCCACTCACCCAGCTGTGTTCCAAGACAATACTCAGATCCAGCCAAGTGAACCCAACAACGAAGAAGAAAAGAAACTGTCCCAGGTGCTAAATGAGTTGCAAGTATCACATGCAGAGACCACATTGGAACTAGAAAAGACCAGGGACATGCTTATTCTGCAGCGCAAAATCAACGTGTGTTATCAGGAGGAACTGGAGGCAATGATGACAAAAGCTGACAATGATAATAGAGATCACAAAGAAAAGCTGGAGAGGTTGACTCGATTACTAGACCTCAAGAATAACCGTATCAAGCAGCTGGAAGGTATTTTAAGAAGCCATGACCTTCCAACATCTGAACAGCTCAAAGATGTTGCTTATGGTACCCGACAGTTGTCATTATGTTTGGAAACACTGCCAGCCCATGGAGATGAGGATAAAGTGGATATTTCTCTGCTGCATCAGGGTGAGAATCTTTTTGAACTGCACATCCACCAGGCCTTCCTGACATCTGCCGCCCTAGCTCAAGCTGGAGATACCCAACCTACCACTTTCTGCACCTATTCCTTCTATGACTTTGAAACCCACTGTACCCCGTTATCTGTGGGGCCACAGCCCCTCTATGACTTCACCTCTCAGTATGTGATGGAGACAGATTCCCTTTTCTTACACTACCTTCAAGAGGCTTCAGCCCGGCTTGATCTACACCAGGCTGTGGCCAGTGAACACAACACTCTTGCTGCAGGATGGATTTGCTTTGACAGGGTGCTAGAGACTGTGGAGAAAGTCCATGGCTTGGCCACACTGATTGGAGCTGGTGGAGAAGAGTTCGGGGTTCTAGAGTACTGGATGAGGCTGCGTTTCCCCATAAAACCCAGCCTACAGGCATGCAATAAACGAAAGAAAGCCCAGGTCTACCTGTCAACCAATGTGCTTGGAGGCCGGAAGGCCCAGGAAGATGAGTTCAGATTGGAGTCTTGGGAACCTCAGAACGAGCTGCAGATTGAAATCACCAAGTGCTGTGGCCTCCGGAGTCGATGGCTGGGAACTCAACCCAGTCCATATGCTGTGTACCGCTTCTTCACCTTTTCTGACCATGACACTGCCATCATTCCAGCTAGTAACAACCCCTACTTTAGAGACCAGGCTCGATTCCCGGTGCTTGTGACCTCTGACCTGGACCAATATCTGAGACGGGAGGCCCTGTCTATACATGTTTTTGATGATGAAGACTTAGAGCCTGGCTCATATCTTGGCCGAGCCCAAGTGCCTTTACTGCCTCTTGCAAAAAATGAATCTATCAAAGGTGATTTTAACCTCACTGACCCTGCAGAGAAACCCAACGGGTCTATTCAAGTGCAACTGGATTGGAAGTTTCCCTACATACCCCCTGAGAGTTTCCTGAAACCAGAAGCTCAGACTAAGGGGAAGGATACCAAGGACAGTTCAAAGATCTCATCTGAAGAGGAAAAGGCTTCATTTCCTTCCCAGGACCAGATGGTACCTCCTGGGGTTCCCGTTGAAGCTGGTCAGTATCAAGCAAGGAGAAAATCTCCTCATAGGGGAGAAAGA
AAGGAAAAGGAGCACCAGGTTGTGAGCTACTCAAGAAGAAAACATGGCAAAAGAATAGGCGTTCAAGGGAAGAATAGAATGGAGTATCTTAGCCTTAACGTCTTAAATGGAAATACACCAGAGCAGGTGAATTACACTGAGTGGAAGTTCTCAGAGGCTTACAGCTCCATAGGTGATGGCTTTAAAAATGAGCCAGAGGAAGAGGAAATGACATTATCCCATTCAGCACTGAAACAGAAGGAACCTCTACATCCTGTAAATGATAAAGAATCCTCTGAACAAGGTTCAGAAGTCAGTGAAGCACAAACTACAGATAGTGATGACGTCATAGTGCCACCCATGTCTCAGAAATATAAGGCAGATTCAGAGAAGATGTGCATTGAAATTGTCTCCCTGGCCTTCTACCCAGAGGCAGAAGTAATGTCTGATGAGAACATAAAACAGGTGTACGTGGAGTACAAATTCTACGACCTACCCTTGTCGGAGACAGAGACTCCAGTATCCCTAAGGAAGCCTAGGGCAGGAGAAGAAATCTACTTTCACTTTAGCAAGGTAATAGACCTGAACCCACAGGAGCAGCAAGACCGAAGGCAGTTTCTGTTCGACGTGCTGACTGGACAAGATCCTGATCAAGGACATTTAAAGTTTACAGTGGTAAGTGATCCTCTGGATGAAGAAAAGAAAGAATGTGAAGAAGTAGGATATGCGTATCTTAAACTGTGGCAGATCCTGGAGTCAGGAAGAGATATTCTAGAGCAAGAGCTAGACATTGTTAGCCCTGAAGATCTGGCTACCCCAATAGGAAGGCTGAAGGTTTCCCTTCAAGCAGCTGCTGTCCTCCATGCTATTTACAAGGAGATGACTGAAGATTTGTTTTCATGAAGGAACAAGTGCTATTCCAATCTAAAAGTCTCTGAGGGAACCACAGTAAAAAGTCTTATAAAGTTAACTTGCTATAACATGAA\n>XM_032861595.1 PREDICTED: Lontra canadensis mitochondrial calcium uniporter regulator 1 (MCUR1), transcript variant X2, mRNA 
\nCGCAGCTGCTGGTGTGGACTCGGGCCGGCGCGCCGCGCGAGCGGGATGAGCGCGCGCCCGGGCCTGTGACCGCCGTGGCGATGGACTGCGGCTTCGTCGCGGGCGGGAGATCGAAGCGCCCGCCGGGCCGCCGGCGGCTTGTGCTCTTCCTGCCTTCAGGCGGCTGCGGAAGCCCGGGCGGCCGCGGCGTCCCGGCGCGCTACTGCCTGTCAGCGCTGTCCGTGGGTCTGGGGGCGCTGAAGCCTCGCGCCCCGGCGGCCCCCCGCGGCGCGTCACGTGCCTCCCCGCTGCTCCTCCTCCTGCTTGTGCCCTCCCCGCGCCTGGCCACCGTCGCCCAGCGCCGGCCCCTAGCGGACCGGGAGCGCTCGCGCCTGGGGCCCTCTGTCCCCGCGGCTAGCCGCGGCGGCGCGGGAAGGTGCCTGCGGGGCCTCGCCCCGGGCGTCGCCTGGGCCGCCGGCGCCCTCCACCTGTGCCGCGGCCGAGTGGCCGCCATCACTTCGTCCAGGAGAGAGCTAAGCCTCTCGGCTGGGAGCCTGCAGTTGGAGCACAGGAGAGATCTGGAGCACAAAAGGCGAGATTTCACCTCTTGTGGGAACAAGAAGCTCTACTTTGACACCCACGCCTTAGTGTGTTTACTGGAAGAAAATGGCTTCACCACCCAGCAAGCAGAAATCACTATCTCTGCATTGGTCAAGATCACGGACGCCAACATGGATATCGTCTACAAGGATATGGTCACCAAAATGCAGCAGGAGATCACTGTTCAGCAAATAATGTCTCAGATTGCCAATGTGAAAAAGGATATGATTATTTTGGAGAAGAGCGAATTTTCGGCTCTCAGAGCAGAAAATGAGAAGATAAACGTGGAGCTACATCGATTAAAACAACAAATAATGGATGAAGTGGTCAAAGTCCGAACAGATACCAAGTTAGACTTCAATCTAGAAAAGAGCAGAGTGAAGGAATTGTACTCGTTGAATGAAAGGAAGCTGCTGGAAATGAGGACAGAAATGGTGGCATTGCATGCCCAGCAAGATCGGGCTGTCACCCAGACAGACAGGAAGATAGACACTGAGGTCGCTGGCCTCAAAACCATGCTGGAGTCACACAAGCTTGATAATATTAAATATTTAGCAGGATCTGTATTTACGTGCCTAACAGTAGCTCTGGGATTTTATCGCCTATGGATATAATAAAGTGTCTATTTAAAGA\n>XM_032539735.1 PREDICTED: Etheostoma spectabile DNL-type zinc finger (dnlz), mRNA 
\nCACGAGATTTGACGTCATCGGTCCGCGACACACACCATGTTGATGAAATCGTTAGTAACGTATACATCTACGCGTGTATGTCCTTCAAAACCTCACCTGTCGTGTTGGTTTTACAGACGTGTTTTGATATTTTACCTCCGGCCGATTCTTTGAGGACGATGTTGGCGGTTAACCGGTTGTTTCGCTGTTCTCGCGGTCGTTCAGCGCCGTCTGGACTCTGCGTTGTGCTCCACTGCCGTCGTCCAGGACCACCGACGACCACAGCCAGGTCGGGGCTTCTCTCCTCACAGGACCAGCGTGGTTGTCATACTTTGTTACCTGCAGACAGACGTGAAGCTCATCTTAGCGGTTATAGGGAGTTCTCAACCTGCCAGAGTATCAGAAGTGACGCTATTGGACAGATCCAGTCAAAACATTATCGACTCGTTTACACATGCAAGGTTTGCTCTACCAGGTCCACACAGAAAATATCCAAGCTGGCTTATCACAAAGGTGTTGTGATTGTGACATGTCCAGGGTGTAAGAATCACCATATCATCGCTGATAACCTCAACTGGTTTTCGGACCTGGAAGGGAAGAGAAATATTGAGGAAATCCTTGCTGCCAAAGGAGAGACTGTAAAGAGGATTGAAGGAAGTTCCGCTTTGGAGATTGTGGTGGATGAATCTATCAAAGAAAAGTCACAACATGGTGAAGACACAGAGAAATCAGACAATGAGCCAGAAAAACAGTAATGCTGTGTTCATACTGTATATGTATTTTGTAAGATGTTTATATTGAAATCCATAATAAAAACAAATATTTATATATAAATAAATGTCTTTATGAATTCTAAGCAAGGAAAAAGGGAACTGATCAAGATAGCTTTTAATATCAGGAATAGAATAGATGGAACTATAAATCCAGCTAACTGATAAA\n>XM_027304875.1 PREDICTED: Coffea eugenioides probable LRR receptor-like serine/threonine-protein kinase At4g37250 (LOC113761756), mRNA 
\nCCTTTTAGCCTTGTCTTCGTCCCCCGTCTCTCCTTACCATCTCTCAAACTGACTCCATTTACAATATCTCCTTAGTTTTGGTCCTTATATTTTTGGTCACCAAAACAACATCTGTGAAGTTGGTTACCGTCTCAATCGTTCTTATTTTCTCCACTTCTTCTTGCTTATGAATAGCAATGACCATCTCGGACTTCTATGAGCGCCTAATACCAAGAAACCAATGAGCAGCTGGTTTAGAATGAGAAGTTTTTTTCACATACTTTGGTGCTTTTCCACCCTGTTTTTGCGTCTTTTGCTTCCTTCTCTGGCTCTGAACGTAGATGGAACGCTCTTGCTTTCCTTCAAATACTCCATTCTCAATGACCCTTTGTCAGTGCTTGATAACTGGAACTATGATGACGAGACGCCGTGTTTATGGACTGGTGTGACGTGCGCGCAAGTTGAAACGCCCTTTGGCACGCCGGCTATGTTTCGAGTCATAAGCTTAGTTCTTCCGAACTCTAAGCTCTTGGGTTCAATTCCTGAAGATTTGGGATACATCCAACACCTCCGTACTCTTGATCTCTCTGGCAATTTCTTGAATGGGACCCTTCCCAATTCGCTGTTCAATGCTTCAGAGCTCCAAGTGCTGTCGCTGTCCAGCAATGCAATAACTGGCGGGCTACCGGGGTTCAGCGGAGGAGGACTGAAGAATCTCAAGCTCCTCAATCTCTCTGACAATGCTTTAGCTGGAAATCTCCCTCCGAATTTACCGTCTCTGCAGGAGTTAACTGTGGTTTCTCTGAAAAGAAACTTCTTTTCGGGTACTATTCCAAATGGGTTTCTGTACGTTGAAGTACTAGATTTGTCTTCGAATTTGCTGACTGGATCACTACCACTTGAATTTGGTGGAGAAAGATTAAGGTACTTAAATCTTTCTACCAACAAGCTCTCTGGCCCGGTATCTCCAGAATTTGCGAAGAAAATCCCAGCAAATGCAACTATTAATCTCTCATTCAACAACCTCACTGGAGAAATCCCTGAATCAATGGCATTATCTAACCAGCAAACAGAGTCCTTCAGGGGAAACATGGACCTCTGTGGCAAACCGCTCAAGAAACTTTGTACTGTTCCTTCAAGTTTATCGGCACCACCCAATATATCCACAACAAATTCCTCTGCTCCGGCAATTGCGGCCATACCACAGACAATCGACTCGACCCCCCTGCCAAGCTCACCGGGAGCAGCAGCAAATGCAGCCCAAAATCAAGGACAACACAGGCTAAAACCAGGAACGATAGCTGGAATTGCAATTGGAGATTTAGCTGGCATTGGAGTCCTTGCAATTATCTGTTTGTATGTCTACCAACTAAGGAAGCGAAGAGCAGATGAAGGAAGCAAAGAGATTCCACTTCCAGTAGCAGTAGATAAACAGCAGAAAGATAACGTCAAAGATTCACAGCTCTCAACAGCGAAGGAGACAACTTCAAGAAGCCTGCCCTCTTGGTCGTGCCTAACTATAAGAAATGGTGAAGAAACATCAGAGGCTACCGCCTCGGACTGCGATGATGAAAACAAGAACATGGACATTGGACATCAAATAGATCAGTATCATGAGAAGGAGCGGAGCACTAAGTACAAGAGCGAAAGGTCACTTGTGATGGTTGATGGAGAAACTGAACTTGATATCGAGACTTTATTGAAGGCTTCTGCATATATACTGGGGTCTAGTGCTGCTGCAAGCATAGTTTACAAAGCTGTACTTGAGGACGGTTCTGCATTTGCTGTTAGAAGGATTGGAGAGAGCGGTTTTGAGAGGTTCAAAGACTTTGAGAGTCAAGTTAAAGCTATCGCAAAGCTGCGCCATCCAAACTTGGTTCTGCTCAGAGGGTTCTACTGGGGAGACGATGAGAAGCTTGTCATCTATGATTACATCTCCAACGGCAGTTTAGCTAATGCCGGTTACAGAAAGGTTGGCTCATCACCTTACCATATGCCCTTTCAAGTCCGGCTAAAGGT
AGCAAAAGGAGTTGCTAGAGGACTAGCATACGTCCATGAAAAGAGACATGTGCATGGCAACATCAAGCCTAGCAACATTCTTTTGACGCCAGAAATGGAGCCAATAATCAGCGATTTTGGGCTTCATTCGCTTCTACATGGCAAAAATAGCTACAAAACAGATGCCTTTTCATCTCGGCATTTCGGTAGCATGAGAAGCAGTACTAGTACTGCTACTGCTGCTACATCATCTTCTCGCGATGGGCTGCACGACCACTCTATCAATGGCAGCCCTTGCATTGCACCTGCAGGCTTCATGGGTTGCACATCACCTTATCACGCCCCAGAGTCGCTCAATAACCTGAAGCCTAATCCCAAGTGGGACGTTTACTCCTTTGGAATTCTACTGCTCGAGCTTTTAACGGGCAAAGTGTTTTCAGACCGGGAATTGGGCCAGTGGACCGCCGGCCTGCTGATGGAAGACAAGAACCGGGTGTTACGGTTGGCTGATGTGGCAATTAGAGGAGACGTGGCAAACAGGGAGGATGCCATGCTGGAATGCTTTAAGCTAGGCTTTAGTTGTGCTTCATTAAACCCGCAAAAGAGACCTTCCATGAAAGATGCGCTTCAAGTTCTTGATAGAATCCAGACTTCTCCTTCGTACTAATCATGGTGCTGGGCAAAAGCTTAAATATAGTGGAGAAAAAAGAGAAAGAGAAAGAGAAAAAGGGGCGATCGCCTTTGGTCTTTTTGACTTGGAAGAATGTCTGGCGGGAGGAATGCTTTTGTTGATAACTCGTACAAGTGTTGCAAAGTTTGACTGATGATGAATGAAATTGGTATTTGTGTAAGACAGAATTCCGACGGTCTATCATATGATATGGTGCATTTTATCTTTACTTTGTTGTTAAGAAAGTGAGCACCATAATGAGAACTTGCTTGTCTTGATAAGCGTTTGACATGCTCAGAGAAGCAGAGTAATTGCTCACTAAAGGAAAGGAGATTACAAGGAAGAATCAAGGAGCTGCAATATGAA\n>XM_019217988.1 PREDICTED: Vitis vinifera uncharacterized LOC104878060 (LOC104878060), transcript variant X2, mRNA 
\nCTTTAGTCTTGAGACTTTCCTCTCTTTCACCACTTTTTCTTCTCCTCTTCTCTTTTATGTACCTTATTGTCGTCACAATCTCACCTTCTCGTTCCAAACAAATTTTTTCCCCTGCTAGCTTAGAAAGTGAAAGAAACTGGAGGTAGGAAGACGAGGCTTATGGTGGCGTCTCCCCGAAGTGGAATCTAGGGCGCGGCGGAAGCCATAGGCTTGAAAGAAGGGGAAGTGAAAGGCGGAGGACTTTCGAGTTTTATTGGCCGAGAGGCTAGGGCACGGTGTGATTTGGTTCGATCTCGGTGTGGAAGCTCGGGGAATCAGCTTATTGCGTAGTGGTTTTGTGGTTGTGGGATTTTGGAAACCTTAGATTTGGGTCAGGGTTGTGTGGTTGGCTGATTAAGCTAGGGGCGGGGCTGCCCTTGCGATTGACTGGGTTTTCATGCTGTCAAAACCACTGCCTTGGGATCGGAAGGACTTCTTCAAGGAGAGGAGAGGAAGCACGAGAGGTTGGAGTCTTTAAGTTTGCTGCAAGATAGAGGACTCGCATCAGGGTTCTTGGGAGTTTGCTCGCCGGAATCGGCAGACTTGCGCCGTCCTACAGAAGCACGAGAGGTCTGAGTCTTTAGGTTTGCTGCAAGATAGAGGGACTCGCATCAGGTTCTTGGGAGTTTGCTCGCCGGGATCGGTAGACTTTCGCCCCCCTACAGGGACACTTTTCTTTGCCATGAGCAATGTTGGTGAGGTGGGTAAATATCAATACACTTGAATATGATTGTCACATCATTTGGGGGCTTTTGACTCTGGAAGATTTCTGATTAATGTCATTAAATTTTTTCTTTTTCTTTTGAAACAATATGCCCCTTGAAGACTTGCTTTGAATAAATAAGATTTTAACTTGTTTAGCATTGTCTATTGTTGTCTTATTGTATTAGAGAGAAGAAAAAATTACACCTTGATTCCATTATTCTCCTTTTCAATTCTATCTAGTTTATCATCTTTGAAAACTTGAAGACCTTCTACTTCTAGCTTTATCTTGCAGAAGGACAATGATTCCTGATCTATCTGAATGAGGTTTAACACCAAGAACCAGATCAGGCCTTGGACAACTCAGATGGAAATTAAATCTTGGATAAAGCGTCCCTGTGAGTGTACCATTGCCCATGATATATCACTGGAAAATGTTTCAAGAATGCATGAGCTTTCAGAAGCCTTCCATGCTATTTCCTTAAGACACACATGCCTCTTGTCTATCTTGGAGCAGTTTAGTAAACTGAGTTCTAGGGCCGGTGAACTCAACTTACAGGTGGAAGCTGAGAGATCTTATCATCAAACTGTACTTGCTACTTTAGAGAAACTATTCGATGAGATGATTATGGAGAAGAAACGAAATGAGTCTTCATCTCAGCCAATAACTATGGAGAAAGATGTTTGCGTTCCTACCACATCCAAGGATGCAAATTCAAATGGATTTGACGATCATGGACATGCAAATCAAAATGGTTCATACTTTATTGCAAAAGTTATACACCCATTTGATGCTTAAGCAGATGGAGAGCTCGGTCTTTCTGTTGATGATTATGTTGTCGTTCGCCAGGTACCACCTGCCTCTATTGCAAATCCATCTAGCAATAAGAGGAATGTTTGAGACCTTTTAACAGCTTATTGGAACTTTCAATGTTTTGTATTTC\n>XM_024297971.1 PREDICTED: Oryzias melastigma barrier-to-autointegration factor (LOC112162223), mRNA 
\nTGACTCCTCTTTCATACAAACGATCTCAACGCTCTGCCTCGTGACGTCACAAGAGGAGCGTCAACCGCCCCAGCAGCGTCCGGGTTCGGTTTAAAGTGTCCGGGGCAGAGAGCAGCGCTGACGCCTCTCAGGTGGTCACGTTCCAGTCGCCATGTCGACCACGTCGCAGAAGCACCGGGACTTTGTCGGCGAGCCTATGGGAGACAAACCTGTGATGGCGCTGTCGGGTATCGGAGACACGCTGGGGAAGAAGCTGGAGGAGCAAGGCTTTGATAAGGCCTCCGTGGTTCTGGGTCAGTTCTTGCTGCTGAAGAAGGACACAGAGATGTTCACTGACTGGCTGAAGGACGCCACCGGCGCCAACTCTCGCCAGGCCGGATCGTGCGCTCAGTGCCTGAAGGAGTGGTGCGACGCCTTCCTCTGAGACCCCGCCCCCTTTCCTGCTCCACCTGGTTCTGCTTCTGTTCTGCTCTCCGTCAGAACTGGTGTTCTCTGGATTTCTGTGAGAGAGCTCGCGGCGGCGACGCGTGTTTTATACCAATGTTTGCAGTTCACATGAATAAAAGGTTTGAATGTTTGAA\n>XM_006985027.3 PREDICTED: Peromyscus maniculatus bairdii WT1 interacting protein (LOC102927739), partial mRNA \nGCAGAGCGGCGGCTGGAGGCGCTCACGCGGGAGCTGGAGCGCGCGCTCGAGGCGCGCACGGCGCGAGACTACTTCGGCATTTGTATCAAGTGTGGGCTTGGCATCTACGGAGCGAGGCAGGCGTGCCAGGCCATGGGGAGCCTGTATCACACCGACTGCTTCGTCTGTGACTCCTGCGGGAGACGACTCCGCGGGAAGGCCTTCTATAACGTGGGTGAGAAAGTGTACTGCCAGGAGGACTTCCTGTACTCCGGGTTCCAGCAAACAGCTGACAAGTGTAGCGTGTGTGGACACCTTATCATGGAGATGATCCTGCAGGCCCTTGGCAAGTCCTACCACCCCGGTTGCTTCCGCTGCTCAGTGTGCAACGAGTGCCTGGATGGGGTCCCCTTCACCGTGGACGTGGAGAGCAACATCTACTGCGTTAGAGACTACCACACGGTGTTTGCACCAAAATGTGCTTCCTGTGCCCGCCCCATCCTCCCTGCGCAGGGCTGTGAGACAACCATTCGCGTGGTGTCCATGGACAGAGACTACCATGTGGAGTGTTACCACTGTGAGGACTGCGGGCTCCAGCTGAGCGGGGAGGAGGGACGCCGCTGCTACCCCCTGGAGGGGCATCTGCTCTGCCGCCGGTGCCACCTGAGGCGCCTGGGACCCGGCCCGCTCCCCTCGCCGGCTGTGCACGTGACTGAGCTCTGAGAAGCAGCCATCAGGAGAGACGGGGTGACCCACACCCCCCTCTCACCCCCTCCACCGAGCTGCTGTCCCTTACGCAGGGGCCGGACCCCTGCGACAAATAATCGATTTCTATTTATTCACCGTCCGTGCCTCAAGCTACTCCCCTGCTGGGTTCCAGGACACCCGCACCCTGCAGCCTCGGGACAGGCCCAGCTCCTCTGCCCAGCTCCTCTGCCTGACCTCGGCTCCCAGAGGGGCAGGGCTTGGAGGGCCTTGGTGCCATGGGGGAAGGGTGCCTTGTTTGTGTGTGATCACAGCCAGGGGGCAGTGACAACCTGGGAACACCGCGGTTTGGCCTTGATGGGTGTTTTCAGCCACAGTCCTCCACCTCTCGGGATCCAGTCTGGGCCGGTGCTTTTCCAGCATCAGTCTCAGAAGACCCTGAGCGAATTCAAAGGCAGAGAGAAAGCCCACGAGAGCTCCCAGCAGACCCCGGGAGCATCTGCGCGCACTGTATCAGGCTCCACCACAAAACTATGTGATTTGACTTAAATTAAGTTCCCCCCAAGGAGGATGTTGACATTTTCTTGAAAAGAATATAGTTTTCTTCTAAAAACTTGG
A\n>XR_005799689.1 PREDICTED: Rosa chinensis OVARIAN TUMOR DOMAIN-containing deubiquitinating enzyme 12-like (LOC112165159), transcript variant X19, misc_RNA \nTAATTGTGTCCCATAGACCGAGTCACATCTCGACCTAATTGCAAAGTGGAAGACAAAACCTCTCGACCCTCTCAGTCATCTTCTTCACCACTTTCTCTTCCCCTTCTTATCCAAAATGAAAATCTTGTGCCCTCCTCACTGCTAATCCAAACCACTAATTCAATTCCTCAAGTTCCTTTCAATTTTTCGAAATCCATACCAAATCCGAGCGTCCTGACCTTGAGAAGCAGCAGCAGCGTGACGGAGGCGCCGAGGCGGTTACCTTAATTCCTAATTCTTCTTGCGTTGAGACAGGGGTTGAGTCTAGCCATCTGCGTTTCGACTTGTTCTGGGGAATCTCGAGCCTCTCATCGTCACTGTCGAAGACCTCGATGTATAGCAACAGATTTATTCCATGCCAATCGTCGTCCAGGCTCCACCAGTTTGGGCTGAACGACAAGGCGTTGCCGGTGAAATATAGTGGATTCAGAGAAGGCCAGTAGTCCTCTCCAGTCATTGTGTTTCTTCGCTCTCTTTCTCTCTCTAAATTTCCAAATTTGATTCTCACACTCTCTCTCTCAAAACCCTAACCCCCATTCTCTAGACCACAAGACTTCCGCTTCTCATTGCCGCTCGCCGTCGACCTGCCACGGCGTCGTTTCGGCTTCGTGTCGCATTATCGGTATTTCTCGGCGTTGTCGGTGATAGCCGGACGGAAGAAGGAGGGAGAGTGGGGGTTTTGGCTTTATGGGACTTGTACGACGGCGTTGGTGATTGGTCTTTGTTTTGATCAACATTCTGGCGTTTTGGCTCTCCGGAGAAGAGCTATTGGGGTATCGAAGGCTCTGTGGGAAAAGAGGTTTGTTGAGTGAAACTGCGAAGATGCTTCAAGGCTTTCCAAAGAGCAAAACATGAGCATGAGGCATTAAAGAGGCAGCTTGAAACTTATTTCCAGCTCAAGAAAGCAACCACAATCTCCTAAAAGCTGAGCTGAGAGGTACACACCAAGATTGAAATGGGGGAAAGGAATTGTATTAAAGATTTCATCTTTAGTAATTTTACTAATATCCCATCAGCTAAACTGAGTTTCAGGGATGTGTGAGCTGTTTTTTTAGTTGGGTAGTATGAATGGAAGCTATAGCAATGCAAATGTGAGCTCAAGCTCGAGTTTGAATAGCAGCTCTCATGATACCGAGGATGACCTGACCATTGCAACTGTTTTGGCAGAAGAGGAAAAGCAGAAAAATGATGGCAAGCTGGGGAAAAGACTCTCCCACTTAGATTTGATTCCGCACACTCTCAGGGTGAATGGGGAGATACCTGACGTGAATGATGCTACTCAAGACCATAAGAGGCTTTCAGAAAGTGTAAAAGTTGGAGCAGCTCAAGTCAAGTACGCTCAAAGAGATCATTCTGAAAAAGAAGTTAAAACTGGAGGACAAGCTGCTGGATGCTCCACCCGACACATTAGGTGCTGCTGTCTTGGCACTACACTATGCAAGTATGAGAGAACTTTAGTGGCAAAATTTCTCTCAATCACATTTGATTGTATCAACTTTTGCTATCTTTCAATGTAATTAGGTAGAATGCAGTAGTCATTAAACTAGCTAGAATGCCTTTTGTACGGTATGGATACAAGAATGTATATATGATTGACAAATGCTAGCTCCTTTGGTACATTAGATGGTTGAATTAGAATATTTCAATGCCTAAATCTTATATTAAGCATTATTTTTGTGCAAA\n>XM_031791253.1 PREDICTED: Oncorhynchus kisutch protein-tyrosine sulfotransferase 1-like (LOC109884214), transcript 
variant X2, mRNA \nAGACTCTAGTAAAGTAAGGGTGACGCGTTTGCAGCGATACAATTGAAAAGAAAGCAGTAACAAGTAATCTTGTGTGTCGGATCAGTGGAACAACAAGGGAGCAAATTGAACGGATGGAATTTACGAGTAACGGTGTTCACCTATGAGATAAGCAGCTTGATCAACTCTCTCCCGCGGTGGATCCTCTACATTTAGGCCTGATGGAGCTGGGCACGCGACAAGCGTTGACCACCGGGGAACACACAACACGCTCTGCCCCCCATCGCCGACCTTGAAAGGAGGGACACTCCGCTACTCCCAACCTTCCCTCCTCTTCCACTACCTCCTCTGGTACAACTCCCCCCTTCCTCCCTCCCTCCCTCCTCCCCGGTTCTGAAATGGTGATGGTGATGATGATGAAGCTGAAGCAGAACCTGCTGGTGGCCTGTCTGGTCATCAGCTCAGTCACAGTCTTCTACTTGGGTCGTCACGCCATGGAGTGTCACCACCGCATCGAGGAGCGCAGCAGCCAGCCTGGGGACCAAGGGGTTCTGGGGGGCCTTCAGGGGTCAAGAGGGTTGCTCCTGGGGGGTTCTTTGAGCTCCTCCACCATCCTGCGGGGCTCTGGTCCCGGGGGCCATAACCTCTCCGCTCCATTCGTCTACAACAAAGACATGCCTCTAGTATTCATTGGAGGGGTTCCCAGGAGTGGGACCACATTGATGAGAGCCATGCTGGACGCTCACCCCGAGGTTCGTTGTGGAGAGGAGACCAGGGTTATTCCACGTATCCTGGCCATGAAACAGATGTGGTCGCGGTCTGGGAGGGAGAAGATGCGTCTGGACGAGGCCGGGGTGACAGACGAGGTCCTGGACGCCGCCATGCAGGCCTTCCTCCTGGAGATCATCGTGAAGCACGGCGAGCCCGCCAACTTCCTCTGTAACAAGGACCCCTTCGCTCTGAAGTCCCTCTCCTACCTGGCTAAGATCTTCCCGCACGCCAAGTTCGTGCTCATGATCCGGGACGGACGCGCCTCGGTCCATTCGATGATCTCGCGTAAGGTGACGATCGCTGGCTTTGACCTGGGCAGCTACAGAGACTGCCTGACCAAGTGGAACAGGGCCATAGAGACCATGTACACTCAGTGCCTGGATGCCTCAGACAAGTGCCTGCCAGTGCATTATGAACAGCTGGTGCTCCATCCAGAGAAGTGGATGAGGACGCTGCTCAAATTCCTGGACATTCCCTGGAACGAGGCGGTGCTTCACCATGAAGAACTCATAGGGAAAGCAGGAGGTGTTTCCCTCTCCAAGGTGGAGAGGTCTACAGACCAGGTGATCAAGCCGGTCAACGTGGAGGCCTTATCCAAGTGGGTGGGCAAGATCCCTGTGGACGTACTGCGGGACATGCCCGTCATCGCCCCCATGTTGTCCCGTCTGGGGTACGACCCCCACGCCAACCCTCCCAACTACGGCCGGCCAGACCCCAAGGTCCTTGACAACACCAGGAGGCTTCAGAAGACTCCAGAGAAAACAAACCCCAGTTAGGAGGAGCAACCAACATGCCACACAGACAAGACGGGGCACCGATGGACAAACATCCAATACAACACCACTTTTTGGGGACCTCAGTACTCTTCCATGGACACACACACACAAACACATACGCTATATATACAAAAGTATGTGGACATTACTTCCAATTAGTGGATTCGGCTATTTCAGCCACACCCGTTGCTGACAGATGTATAAAATCGAGCACACTGCCGTGCAATCTCCATAGACAAACATTTGCAGTAGAATGGCCCCGAACTGAAGAGCTCAGTGACTTACAACGTGGCACTGTTATAGGATGCCACCTTTCTGCCCTGCTAGAGCTGCCCCGGTCAACTGTAAGTGCTGTTATTATGAAGTGGAAACGTCTTGGAGGAATCAACGTCAAAGCCACGAAATGGTAGGCCACACGAAGTCACAGAACTGGACCGCCGAGTGCTGAAGCGCGT
AGAAATCGTTGCAAACACTCACTCACGAGCCCCTGGAAGTAACTTCAGCACAATAACTGTTCGTCAGGGGAGCTACATGAAACGGGTTTCCGTGGCAGAGCAGCCGCACACAAGCCTAAGATCACCATGCGTAATGCCAAGCGTCGGCTGTAGTGGTGTAAAGGTTGCCGCCATTGGACTCTGGAGCAGTGGACCAACTCCATATTAATGCCCGTGATTTTGGAATGAGATGTTCTACGAGCAGGTGTCCACATACTTTTGGTCATAGTGTATAACATCATGACTGGATATAACCGTATTCCACACTGGCTTTGTGGAGAAACTCTCTTGGCCTTTTGATGTTCGTACTGTAAACAAATGATGCATTTGTCACAAAATGGTGACCAGAGAATGTCTATGTTACTATCTTTCTTGTCGAGGGTTGCAACATTTCCCCAATTTCCTAGATTTTCCAAAAAAATCCCAGTTGGGAGATTCCTGAGATCCTACAACCAGGATTTCTGGAAAAACATGGAAATATTTAGAAAGTTACCAGAATTTTTAAAAACAATTCTCGTGACACCAAATGTTTTTTTCTTCTTTTAAATGATTTCTCCTGTAAATATAAATATATAAATCTGTGATTCTGTTGTAAGAAAATACAGTGGACTTAAACATCAAAAAAAGTGAATAATGTATTTATGGATGACATTTTGCTTTTTGAAGATGCAATATCTATTTTAATGTTTGTTTTTCATGCCTTTCTATAGTGCGATTCCATGGGTACGGATGTACAAGATCTGTTTTTAAGTATTGACAGTGATAAAAGATGGCATTTTGTAAA\n>XM_031379489.1 PREDICTED: Mastomys coucha kinesin family member 1B (Kif1b), transcript variant X9, mRNA \nATGTCGGGAGCCTCAGTGAAGGTAGCTGTCCGAGTGAGGCCCTTCAATTCTCGAGAGACCAGCAAGGAGTCCAAGTGCATCATTCAGATGCAAGGCAACTCGACCAGTATTATTAATCCAAAGAACCCAAAGGAAGCACCAAAGTCCTTCAGCTTTGACTACTCCTACTGGTCGCACACCTCGCCTGAAGATCCCTGTTTTGCATCACAGAATCGTGTGTACAATGACATTGGAAAGGAAATGCTCTTACATGCCTTCGAAGGATATAATGTCTGTATCTTTGCCTATGGGCAGACTGGTGCTGGGAAATCCTACACGATGATGGGGAAACAAGAAGAGAGCCAAGCTGGAATCATCCCACAGTTGTGTGAAGAACTTTTTGAGAAGATCAATGACAACTGTAATGAAGAGATGTCTTACTCTGTAGAGGTGAGCTACATGGAAATTTACTGTGAGAGAGTACGAGATTTACTGAATCCCAAAAACAAGGGTAATTTGCGTGTGCGTGAACACCCGCTGCTTGGACCCTATGTGGAGGATCTGTCCAAGCTGGCAGTCACTTCCTACACTGACATTGCTGACCTCATGGATGCTGGGAACAAAGCCAGGACGGTGGCAGCTACCAACATGAACGAGACAAGCAGCCGTTCCCACGCCGTGTTCACCATTGTCTTTACCCAGAAGAAGCAGGATCCTGAGACGAACCTTTCTACTGAGAAGGTCAGTAAAATCAGCTTGGTGGATCTAGCAGGAAGTGAACGAGCTGATTCAACTGGTGCCAAAGGAACAAGATTAAAGGAAGGTGCAAATATTAATAAGTCTCTTACAACTTTGGGCAAAGTCATTTCGGCCTTGGCAGAGGTGGATAACTGCACAAGCAAGAGTAAGAAGAAGAAGAAGACTGACTTTATTCCCTACAGGGACTCTGTGCTCACTTGGCTCCTTCGAGAAAACCTAGGTGGCAACTCCCGAACTGCAATGGTTGCTGCTCTGAGCCCAGCAGACATCAACTACGATGAAACGCTGAGCACGCTGAGATATGCAGATCGTGCAAAACAAATTAAATGC
AATGCTGTTATCAACGAGGACCCGAATGCCAAGCTGGTTCGTGAGCTGAAGGAGGAAGTGACCCGACTGAAGGACCTTCTTCGTGCTCAGGGGCTGGGAGATATTATTGATACATCCATGGGGTCCCTTACTTCATCTCCATCTTCATGCTCACTTAATAGTCAGGTGGGCTTAACATCTGTGACCAGTATTCAAGAGAGGATCATGTCTACACCTGGAGGGGAGGAAGCCATTGAACGTCTGAAGGAGTCAGAGAAGATCATTGCTGAGTTGAATGAAACCTGGGAAGAGAAACTTCGTAAAACAGAGGCCATCAGAATGGAGAGAGAAGCCTTGTTGGCTGAGATGGGAGTTGCCATACGGGAAGATGGGGGAACACTTGGTGTTTTCTCCCCTAAAAAGACTCCACATCTTGTTAACCTCAATGAAGACCCACTGATGTCGGAGTGTTTGCTTTATTATATCAAGGATGGAATTACAAGGGTTGGCCAAGCAGATGCTGAGCGGCGCCAGGACATAGTGCTGAGTGGGGCCCACATTAAAGAAGAGCATTGTATCTTTCGGAGTGAGAGGAACAACACTGGTGAAGTTATTGTGACCTTAGAGCCCTGTGAACGCTCGGAAACATATGTGAATGGCAAGAGGGTGGCCCATCCTGTTCAGCTGCGCTCAGGGAACCGTATCATCATGGGTAAAAACCATGTTTTTCGTTTTAACCACCCTGAACAAGCACGAGCAGAGCGGGAGAAGACTCCCTCTGCCGAGACCCCCTCTGAGCCCGTGGACTGGACATTTGCTCAGAGAGAGCTTCTCGAGAAACAGGGAATTGATATGAAACAGGAGATGGAAAAGAGGCTTCAGGAAATGGAGATCCTTTACAAAAAGGAGAAGGAGGAAGCTGACCTTCTTCTGGAGCAGCAGAGACTGGACTATGAGAGTAAATTGGAGGCCCTGCAGAGGCAGGTTGAGACTCGATCTCTCGCTGCAGAGACAACGGAAGAAGAGGAGGAGGAGGAGGAAGTTCCTTGGACACAGCATGAATTTGAGTTGGCCCAGTGGGCGTTCCGGAAATGGAAGTCTCACCAGTTTACTTCATTAAGGGACTTACTCTGGGGCAATGCCGTGTACCTGAAGGAAGCCAATGCCATCAGTGTGGAACTAAAGAAAAAGGTGCAGTTCCAGTTTGTTCTGCTGACTGACACACTGTACTCCCCTTTGCCTCCTGAATTACTTCCCACGGAGATGGAGAAAACTCACGAGGACAGACCTTTCCCTCGGACAGTGGTGGCGGTGGAAGTCCAGGATCTGAAGAATGGAGCAACACATTATTGGTCTTTGGACAAACTCAAACAGAGACTGGATCTGATGCGAGAGATGTATGACAGAGCAGGAGAGGTGACCTCCAGTGCCCAAGATGACAGTGAGACGACCATGACCGGCAGCGATCCGTTCTATGATCGGTTCCATTGGTTCAAACTTGTGGGAAGGGCATTCGTGTACTTGAGCAACCTGCTGTATCCGGTGCCCCTGATTCACAGGGTGGCCATTGTCAGTGAGAAGGGGGAAGTCCGGGGATTCCTTCGTGTGGCTGTGCAGGCCATTGCAGCCGATGAAGAAGCTCCTGATTATGGCTCTGGAATTCGACAGTCGGGAACAGCTAAAATATCTTTTGATAATGAATACTTTAATCAGAGTGATTTCTCTTCAGCTGCAATGACTCGTTCTGGTCTGTCCTTGGAGGAGCTGAGGATTGTGGAAGGTCAGGGCCAGAGTTCTGAAGTCATCAGTCCTCCAGAAGAAGTCAGTCGAATGAATGACTTGGATTTGAAGTCAGGCACTTTGCTGGATGGGAAGATGGTGATGGAAGGGTTTTCTGAAGAGATTGGTAACCACCTGAAACTGGGCAGTGCCTTCACCTTCCGGGTCACGGTGCTGCAGGCCAACGGAATCCTCCCAGAGTATGCAGACATCTTCTGTCAGTTCAACTTTTTGCATCGACA
TGATGAAGCATTCTCCACTGAACCCCTCAAGAACAATGGAAGAGGAAGTCCCCTGGGCTTTTACCATGTACAGAATATTGCGGTGGAGGTCACCGAGTCATTTGTGGACTACATCAAAACCAAGCCCATCGTATTCGAGGTCTTTGGACATTACCAGCAGCACCCACTTCATCTGCAAGGACAAGATCTTAATAGTCCACCTCAGCCATCTCGAAGATTCTTCCCCCCACCCATGCCACTCTCCAAACCAGTTCCAGCTACTAAGTTAAACACCATGAACAAAACCACCCTTGGGCAAAGCATGAGCAAGTACGACCTTCTGGTTTGGTTTGAGATCAGTGAACTGGAGCCTACTGGAGAATATATTCCAGCTGTGGTTGACCATACAGCAGGCTTGCCCTGCCAGGGGACATTTTTGCTGCACCAGGGCATCCAGCGACGGATCACAGTGACTATCATCCATGAGAAGGGCAGTGAGCTCCACTGGAAAGATGTTCGTGAACTGGTGGTAGGTCGGATTAGGAACAAGCCTGAGGTAGATGAAGCTGCAGCTGATGCGATCCTTTCCCTAAACATCATCTCCGCTAAGTCCCTCAAGTCTTCCCACAGCTCCAGCAGGACCTTCTACCGTTTCGAGGCTGTATGGGACAGCTCCCTACATAACTCCCTCCTCCTCAACCGAGTGACCCCCTATGGAGAAAAGATCTACATGACCTTATCTGCTTATCTGGAGTTGGATCATTGCATCCAGCCAGCCGTCATCACTAAGGATGTGTGCATGGTCTTCTATTCTCGAGATGCCAAGATCTCACCACCACGTTCTCTGCGAAACCTCTTTGGTAGTGGCTACTCAAAGTCGCCAGACTCCAACCGAGTAACTGGAATCTATGAGCTGAGCTTATGCAAAATGGCAGACACTGGGAGCCCAGGCATGCAGAGGCGGAGGAGAAAGGTCTTGGATACCTCCGTGGCGTACGTGCGGGGGGAGGAGAACCTAGCGGGCTGGAGGCCTCGTGGAGATAGCCTCATTTTGGAACACCAGTGGGAGCTGGAGAAGCTGGAGCAGCTGCACGAGGTGGAAAAAACTCGCCACTTCTTGCTGCTTCGGGAGAGACTTGGTGATAGCATACCCAAGTCTCTGAGTGACTCGTTGTCTCCCAGCCTCAGCAGTGGGACCCTTAGCACCTCAACCAGCATCTCTTCTCAGATCTCAACCACCACCTTTGAAAGCGCCATCACACCGAGCGAGAGCAGTGGCTATGACTCAGCTGATGTTGAAAGCCTGGTAGACCGAGAGAAAGAGCTGGCTACAAAGTGCCTGCAGCTTCTCACCCACACTTTCAACAGAGAATTCAGCCAGGTACACGGCAGCATCAGTGACTGTAAGTTGTCTGACATCTCTCCAATTGGACGGGACCCATCTGTGTCCAGTTTCAGCAGTTCCACCCTCACACCCTCCTCCACATGCCCCTCTCTGGTGGACTCCAGGAGCAGTTCTGTGGATCAGAAGACCCCAGAAGCCAACTCTCGGGCCTCCAGTCCTTGCCAAGAATTTGAACAGTTTCAGATTGTCCCAACTATGGAGACACCCTATTTGGCCCGAGCAGGAAAGAATGAATTTCTCAATCTTGTTCCAGACATTGAAGAAGTCAGAGCAGGCTCAGTGGTATCTAAGAAAGGATACCTGCATTTCAAAGAGCCGCTTTCCTGTAACTGGGCTAAACATTTCGTTGTGGTTCGTCGCCCTTACGTCTTCATCTATAACAGTGACAAAGACCCAGTAGAGCGTGGCATTATTAACCTGTCTACAGCACAGGTGGAGTACAGCGAGGACCAGCAGGCCATGGTGAAGACACCTAATACTTTTGCTGTATGCACAAAGCACCGTGGGGTCCTTCTGCAAGCTCTCAATGACAAAGACGTGAATGACTGGTTATATGCCTTTAACCCACTTCTGGCTGGCACAATAAGGTCAAAACTCTCTCGAAGATGCCCGAGCC
AGCCAAAGTACTAAGCGGTTCTTCTGAGCCTTGCTCACCTGTGACAGATAAAGAAAGTGTTACCTCTCATTCTCTCTCTTTGTGATTCTTGACGGTTATTCTTGTATGTAATCCTGTGGCTTAATGACTTTTCCCTCCCTCGTCATCCCGCACTTCTCTAGTTCTCCTGTTCCCTCTCTCCATGGCTCTGTACTCTTCTTATTCTTGTGCTAAGACTTGTAGCATGTGGCCTAACAAAGGGGAACAAAACCACTACACATTCATATACACTCACACCCACGCACCCTGAGGGGATCCAGCACATCTCCAAATGATTTTCCTGTGTACGTTAGCTTCCTTTTGGATGATGGGTCCCCTTCATGGTCACTGTCCCCCTGTTGTTTCTGTATGGCTCTGGTTTTCAGGGTAACTTCTCTGTCTCTCTTTTTTCCCTCCTTTGTTTATGATAATCTACTTTTTTCTGGGTGGTTTAGATACTAAGGGAGGAGACGTTTGGTATTGTCAGCCAGGAGAAAAAAACTTGCTTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTGTCTCTCTTTGTGTGTGTGTGTGTGTCTGTGTCCATGTTTCTCTCTCTGTCTCCGTCTCTCTCAATGTCTCTGTCTTTGTCTCTCTCTTTGGTTGCTAATCCATGTATTTCCATTCAGGGAAAGCACTGTGGGAAGCTCAGAATTGGGATTTTAAATTCTCTGTCTAAATCAGGGCGCAGAGCATGGGCTTATAGAGAGGAAGATGCAGAAGGGCCTTTGTGATCAGCCTGCAGCAGAGGCTGCTGCAGTAGACTGCTGGAGCTCCTCACAGCCGGGTCCTGCAAATGTCTCCTCCCTGGGAAGGAAGCTTTTGTCTAGGAGTTCCCCAGCCCTATTCTCAGCATTACTGTTTAGAATTACGAGATGTCATGAACAGATTTCCCACAAGAGGGATTGGGGAATGTTTGACTTTCTAGTGATAGACTGGACCATTGTTGCTTTGAGAGTGCTGAGTGCAGCTTGTGATTGTTGTAGCTCCCTTTGATCAAAGACTTGTAGCTTCAGCATAAATCTTGAGGTCTCCATCTAAATCCAGTGGCCATTTTCAATGTATGAAATATGAGCAAACATGGCATTGTTTTTTAGATGCCAGAACTGGCCGGTCCTTACCACCACTCCAAACAAATCACAAGATATTTAGGGTTGAAAAAGATTGTGGATTGTGACATGCCTCCTGTGTGACATGCCCCTGACCCCACTATCCCCATGTGGTTTGGAAATACTCCCTTAGGAAGAATTCACTGCTCCCAGTTTCTGTGGCTTCTAACAAACCAGGTCTCTGGATTCAAGAAGTTATCATAGAAAATAACACTCTCCCTCCACCAGCTAGTCAGTGTTGGGGACTGAGTAGGGCACAGAATGCCCGCTGGAGCTACTTGAGTTGTGTGCCAGCGACTTGAGGCTCATTCACACTGCTGTGTCCTGGCTTCGCCAGCCTGCTTCAGTGCCACTCATGCACCCAGGAAGGCATCTGCTCACCTCCACTCTACAAAGGCTCCTGGCTACCTGAGGGTAGAGAAGGAATGGATTGCCTTCTGTTGGGAGCTCATCTCCACTGCAGAGCAGCCACCAGGGAGGCGAGCGAGCATGCAGCCCCTTGCTGCTGACCTCTCGGCAGGGCTTCTCTCGGAAGAACTGGTCTCCAGCTCCTTTTGTTACAGCTGCCTTGCAAAGAAAGGGAAAGTGGACATGGAGAAAAGAAAGGGCAGAAATCAGACTGTTCTTATCTAAAAGATGATCAACTCCAGTAGACTTGTAAAACTTTCTTTCTCTCCTTAAAGTATAGGTTACTAACTGTAATGTTACTTGTTTTCTAAGCATATATATGAGATTTTTAATGTAGTTAGAAGTCTCTGTTGTCTGATGGACACAACATGTCCTTCTGGTGTATACTCAAATTCAGCAGGCTCTGTCTATGCTTGTA
GACAGTTTCCTGGACCGGAACTAAATATAATTTCAGGGAAACAAAGATCAAAGGTCGCTTTTAAACTGAGTCACTGATGTTGCTGCTGTTAGAAAGGTAGATGGAAGGATCCGCGTCTGTGCGAGGTGAGAAGCCTGAGGGAGGGTGAAGTGTGCGGTACACTAAACCCTGCGATGACTTGTGTTTTCTTTTAACTCAAACAAAACTGGTTTAGAAAGTCTTTGCTTTGCAAATATCAAATATTAGCATGAGCCAAACTGGACTGCCCCTTCATCAGAGGCGCCCCCCCATAAGGAGGCCTCATTAGGAAGCCAGGGAAAGGAAGGTTGGAGCTTGGGCACGTGTGCTGCTACCTGCCATCATTGGGGCCCCCCCTGACTGTAAGGCCCATGGTCAGATCAGAATCAGAGCATTTGGGGGCTTTACTTTCTGTTTCCAGACAAGGTCACCTCTGCTTCGAAGCTCTGCAAGAGAAAAGGTTTTATGGCAGGACCTGTTCATGAGATTTTTGTGGTTGCCATAGTAGCAGGAAAGTTAAGACAACTAACCTTAAAGAAACTTTTTTTTGGGGGGTGGGGGGTCTGAGACAGGGTTTCTCTGTGTAGCCCTGGCTGTCCTGGAACTCACTCTGTAGACCAGGCTGGCCTTGATCTCAGAAATCCGCCTGCCTCTGCCTCCCAAGCGCTGGGATTAAAGGTATGTGTCACCACCACCTGGCAAGAAACTATTTTTAAGGTAATTTTAAAAAAAATTTCAAAGCACTCCTTTAAACAAAAAACCTACAAGGAAAACATACAGATTACAGAAAAGTGAGTGCTGGTTGAAATGAATTAGCCTCCCCCTTCCTTCTTTATCCTCCTTCCTCCCAAGCAGATATCACTCCTAACTGTCCCCCACGCCAGTGCTCAGGCCCAGCCTGCTTCTGGGGCTCTACCCTGGGAGTCAGCCAGCTCTCAGCCCCAGACTGTCAGGGACCAGGCAGTCCCTGCACAAGGCTAGGCAGGAGCACAGGCCAGACTGCTTCTGAGCAGGCCCCTGATCTCCATCCATAAATGAGGCGAGCTAAAGCTTCCTCAGCTAGGAAACCTTTCCTCCCCTTCAGCTATATGGAATGTATATATCTATTAAATTTTTATCTTGTTTTGATGAAAGGATGAATGGTTGTGAAAGGTATTTGGGGTCTAAAACCATGATTTTTTCCTGGCACATATTTCAAAGCATAGACTTTGTTACCTGCTGCTTCTTGTCTAATTTACAGGGATATTTAATTTTGTAAGGTATTTGTATATTTATACAGCTGTAATGAATTGCACATTGGACTGGAAGGGGAAGGCTCTGCCCTGTGTGGCTCCTACTGGAACTCTTGCATTTTCCTCTTGGGCGCTGTGCTTTGGCCCATCTGAACAAAATCAGGGGTGTGTGGTTTGTTTAGCGTGGGTCCATCATTTTCATTTGGGTTCCTTTTGGAAAATGTAATCTTTAACTTGCTCTGTGAGAAGAAAAGAATAATTGTGTTGCTGCTCTTGGAAGGTCTGCTGAGTGCATTTGAGTGAACTCTGGCGCTGTGTACTGCAGCCATCCACCATGACCTGTGATCCACCAAGAGTGAGTAAGACCACGACCATGGAGCAAGTCAGAGATTGTCAGGCGAGAGATTATTGCTGTTACTGTTCAAAAGGCCATTTATGAAGTAGATATTTGAGCTCTTTAAAAAAAAAATCTTAAGAGAGCCCCTAATTACTTAAAGAAAAAAAGAAATTTAAAGAGTTAATACAGAACTGGTATTAAAAACTTGCAGGCAGAGGTTAGAGCACTTGGCAATTTTACGTGATGCCTTTGGTTCAATCCCGGTGCTGCAGATCAGACAGAAAGCCAGGAGGCAGAGAGCTGCGCAGACAGAAAGTCTGTTATATGTTGTCATGTCTTTAATTGATTCTTTTCATGCTGTGTATTCTGGCATCAGTTCACCTAAGGGACCCACCAGCCTCCTCATGTTTAAG
CATTGTCGTAGACTTTGTGGCTCTAACATACTTGTCTGTTGAGAGTGGCGTCTCTTGTCACCATCCCCATGCTATAACAGAACCCATGAAGCATAAGTGGCCTTTTTGAACCAAGACTTTGCAAACTGATCTCTCCCCAGGGAAGGAGTTGAGCACAAGCAACAATGTACATTATTAATTTTGGATTTCATTTTCATGTTTTATTTTGTAAATATCTAATGTTTGGAGCTTGAGTATACAAAATGTAAATACAGTTCTCGTATTTGTACTAATCCTGATTCTTTTGCTGTATAGCCCTAGCTGTGTAATGCAGACATTATCTGACTGTGTATGGTAACCTTGCATCACAGAACTGCTAGTGAACGAGCTAAAACAATAAAGGTACAACCAGTGCA\n>XM_039680831.1 PREDICTED: Pimephales promelas family with sequence similarity 49 member A, like (fam49al), transcript variant X3, mRNA \nAGATGAGCAGCTGCTAGGCAGGACTGTCTTGAAAGCAGAGAGACAGTGAGAGAGACCATTTGGTGCCTGAACGCGAGCGAGGGAGGGGGCGAGAGAGACGCACACACTCAGCGTGAGCCTCTGGTTTAAGTAGACACTAACCGTGCGTTTAGGGAAACCCACAGTCTCAGCTCCCTGGGATACAGGAGTTTCTGGCCCTGCTCTTTTTCCCCTTTTCATTCTTTTATTTTACTCCCTCCATCTTTTCTCTTCTTCCCTTTGCCTACGGAAAGCGCTGGACCACTGTTTTCTCCCTGAAACACGCCAAGCCGGTAGTGGAGGCTGATGCTGTGATACACTGCAGGAGAAACATACAGGCTCTCATTTGATGCAGTGAAGTGCTCTGTGAGGAAAATCGCAAGCAAAGGTTTGCCGGCCATGGGGAACCTCATTAAAGTCCTTGGCAAGGATTTAGAGAACTGTCCTCATTTTTTCCTGGATTTTGAAAATGCTCAGCCCACAGAGGCCGAGACAGCCGTGTATAACCAGGTTAGTGCTGTTCTGGAAGAGGCCCATGGGATACTGGCAGAACTACAGTCTTACAATGGAGCAGGACAAGAAATAAGAGAGGCCATTCAGAACCCCAATGACCTCCAGTTGCAGGAGAAAGCCTGGAATGCAGTCTGCCCTCTGGTGGCCAAGCTCAAGAGATTTTATGAATTTTCTCTCAGGCTAGAGAACGCCCTGCGGAGTCTATTGGAGGCCCTAACAAGCCCACCCTACGCTCCCATGCAGCATCTGGAGAGAGAGCAGGCCCTCGCCAAACAGTTCGCAGAAATCCTGCACTTCACTCTCAGCTTTGATGAGCTTAAAATGACAAATCCAGCCATACAGAATGACTTCAGCTACTATAGGAGGACCATCAGCAGGAATCGTCTGAACAACCAGCAGTTAGAAGCTGAGAATGAAGTAAATAATGAAATGGCCAATCGGATGTCGCTCTTCTACGCTGAAGCCACACCCATGCTCAAAACCCTGAGCAATGCCACGACTAAGTTTGTGTCGGAGAATAAGACTTTGCCAATCGAGGACACCACAGATTGCCTGAGCACTATGGCCTGTGTGTGCCGTGTCATGCTGGAGACTCCGGAGTACCGGTGCCGTTTCACTAACACAGACACCATGCTGTTCTGCATGCGTGTGATGGTGGGCGTCATCATCCTTTATGACCACGTTCATCCAGTGGGTGCCTTTGCCAAGACCTCCAAGATTGATATGAAGGGCTGCATCAAGGTGTTGAAAGAGCAGCCTTCAAACAGCGTGGAGGGACTGTTGAATGCACTGAGGTATACCACAAGACATTTAAATGATGACAGCACCTCAAAACAAATCAGGGCTCTGCTTCAATGAGAGCAGGAGGAGAGGGAGGAGGACCCACAGAGACAGGGACTGTCAGAGAACAAGCGATGGTGGCTGGCAGTCCTCT
GAAACCTGTTTGTTTACAAGAGCAACTTGATCTCAAATGAAATAAGATATTCTAGAAAAGAAAAAGGAATACGAAAATAAATATATATATAGAGAGAGAGATTGTTGATGGTTCATCACCGTGTGTCATTTTATAAAAGCAGGAAAAATAGAGATATATATGTATATTAAAATTCATTACTTAAAACTACCTGGGTGTGGATATAAAAGTCTTTCAAAAACATATTAAATATTTAAGAATTGAATTTAAAAGCGGTAGTTAAAACCACCAACAAAACTGGTTCATATTCCAAGTTCCGCCTGAGAGTATTTTTGCACACTTGAAAAGGAATCCCACCTCACAGGAAAGACATTAACATGGCTTGAAACTGTATAATTCAGATCCCTTTTCACGCGTTTTTAGACTTGATTTGATTTGCAACGCCTCGTTATTCCCGTATGTGCTTCGTCCAATGCATTCTGGGAATTAAAACCGGAGTCCTTGGCATTTCAAGTCTGTTGAAGGATAAATGTAAAGATCACATACTTGAGACGCATCTCTGCTGACATCGCCAGAAATCAAACTATAATCCTCTAGCTGTATATACTCGGAAAGCACAGGATAGTTTTGTAAAGAAATGAAGCGTTTTGTTAGACTTCTTCACTAGTGCTGTACAGCAATACTCTATACCACCAATGTGACAAACCCGTTCATTTGAAATGCCTTCATACCAATGTATGAGACGCCGGATAATGCTAACAGTTCATCTGTGGAGTTGTACATATCATCAGACGAACAATCCTTTAAAAGTTACGTTTTTGCTCTTGTAAAGTTGACGTTCAAACGGAGCGAGTAAGCCATGAAACTGTAATTCAGACGCAAACACACATTCTGCCCTGTGCCATAGCTGCTTCCTGTACCACTGCGTCAGAGTGACGTATAACAAACATCATTCGTAGAAACCAAAACACACCATTGAGAACAACACAGCGATGTGGATTTGCTTTCCTCTGTATCCAAAAGCAAATCATTGCCAAATGGGACTGCAACTTTGCCTTTCAGATAAATAGAAGTGAGACGTTTGGTCATGAACACAATCTCAAAACAACAGGCTTGAAGGTGCAAAACACTTGACTTGGTGTAAATAAGAGGATTTTTACTAAACAAACGTTCCATCGAGACTCTTTGTTAGAATTACAGATGCATATTAAAAAAAAAAAA\n>KC305230.1 Stachybotrys sp. 
HGUP 0107 internal transcribed spacer 1, partial sequence; 5.8S ribosomal RNA gene and internal transcribed spacer 2, complete sequence; and 28S ribosomal RNA gene, partial sequence \nTCGTTGCTTCGGCGGGAACGCCCCGGCGCCCTGCGCCCGGATCCAGGCGCCCGCCGGAGACCCCAAACTCTTGTGTTTTTTTCAGTATTCTCTGAGTGGCAAACGCAAAAATAAATCAAAACTTTTAACAACGGATCTCTTGGCTCTGGCATCGATGAAGAACGCAGCGAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCGTTAGCATTCTAGCGGGCATGCCTGTCCGAGCGTCATTTCAACCCTCAGGGTCCCCGTTCCGGCGGGGAACCTGGTGTTGGGGATCGGCCCGCCCCGTGCGGCGCCGTCCCCCAAATTCAGTGGCGGTCTCGCTGCAGCCTCCCCTGCGTAGTAGTTACAACCTCGCATCGGAGCTCAGCGCGGCCACGCCGTAAAACCCCCGACTTTCTGAACGTTGACCTCGGATCAGGTAGGAATACCCGCTGAACTTAAGCATATCAAT\n>XM_052206935.1 PREDICTED: Mytilus californianus uncharacterized LOC127702642 (LOC127702642), transcript variant X2, mRNA \nAGGTTAATAGATGTAGTATTTAAGCGTATATCAGAGCAACGTTACCCAACATACCACATACGAAAAAAAAAAAAAAAAAGGGATAGCATGCTTAACAAATTACAAGTATTCGTATGTTTTCTGATTGTCAATTATATATTTTGCGAAGACACCGATGATTGCAAGGATGAAATATGTAGGAAGTCGTTAGCAATGCCACTATTGAACAATCTGAAAGCACCTCTTGTTGCCAATTTGGATATAACTCAGTTTAACAAGCAGCTACGAGGGTACATTACAGAACAGATCAAGCAATGAGTAGAGCAGGCAAAGAAAGAAATAAGGGGCGAAATGGTAGAACTCGTCGACACATTCGAAGACGCTCATGTAAACGTTACACAAGACCTTAGCAAAGATTTGAACGAAATCAGGCGTCAACAAATGCAAATGGAAGATCGTGCAACTAAAGAAAATGAAATATCGGGTAATTTTACGTTTGAAATTATCGATGGAATGAAGAATATAGAACGACATCAGAAAGATATTCTGACAGATGTGGAGCAGTTGAAACGTTATAAAGAATCAGTAATTACAGCAAATGAAGAAAAAAACAATTTCACAGCAGAAGTCAAAGATACACTAAAGAATTTAAATCAACAACTGAATGAAACTCATGATGAAATTCATCACTTGAAAAGTTTTCATGCATCTTTAAACTCCAAAATTAATTCAGCCGACAAGAGGATATCTGCAAATGAAGAAAAAGTACCAATTGTCAACGAAAAATTACGTAATTTAAAAGGAGAGCTAACTTCAATTCGATCGGACATTAATAGTGTAGAAAGTCGTCAGAAATCATTGTCCTCTGACATCAGCAGTGCTTTCAGTCGTCTTACAGCAAATGAGAAAAGAGTTGGTTTTACTGCTTGCGTTAGTAAAGATGATGGATCAACCATATCAGCAGGTCATCCAATACCATTTACCACTGTTACATCTAGTTATAATGTTGATATGTCAAGCGTTAAAAGCAATGGAAAGTTCACCGTTAAAATAAGTGGTTTATATTTTATATCGGCATCAATAAGAAGTAAAACAGACCATGGATTCTTTGCAATATATGATGATTCGTACTTTTTAGCTTATGGATACACAGCTGAGCATGACGGTAAAGATACATATGATCACAGTGGTACAGTAGATGCGGTGCGATA
TTTTAATTACGGTGATATCCTAGCAGTAAAGCCGTGGAAAACTATGGACATTGGTGCTTGGTCTTGTCTGACTTTTGTCAAAATAAAATAGAAACAAATTATAATTAATATCTGACATTTTGTATTTTTGCGCAATAAGATATCACAATTGAACATTATATTTTGAAACAATACTATAAAGGAACTGTTCTAATTATTGGAAGTACTAAGTACGTACAACAAAAGGTGTTTCTACTCACAACTTGACATTCTGTATTGTCACCAATTGGAAGTTTTCATGTTTTGTTTTAACAATTATCGCTTTCAAATAGTCAATTAGCTTATAGTAATTCTAATGTTCAATTATTTATTATTTCTTCATTTATGAATAACAAAATAATAAACTGATATGATATTTCAAAAA\n>XM_050245764.1 PREDICTED: Anopheles aquasalis tyrosine-protein kinase Fer (LOC126581837), transcript variant X1, mRNA \nGCGCGTGGTTGTGTGAAGCTGCGGTGCGTGAGCTTTCTTTTGCTTGTTTGTTCTGTGTTGTGTTGTTCTCCGTGCATCGCGGTGATCGTGCAGCGTGATTTGTGTGCGTGTGCACGTGTGTTCAGTGCGCCTCCTCCACGCCGTGATTACAGAGGTACGCCTTTACCTGCGCTACGTGTTTGCTCCTTGCTAGTTTACAACAGGAAGGAGAAAGAAAAGATCAAAGTGTCGGTGCGTTGTGCGTATGCTTATGCTTGAAATACGAAGATAAATACAACCGCCTGCTGCGTGTGTGCTTTTTCGGTGTGGCGGTTTGTTGGTGGCACCTGCAATAATCGCACGTTTTATCAATTCGATAGTGTTGGGTTAAGGATAAGATACAACATATCGCGCAAATCATCAATATCAATCCCTACCTACTGACTTGGTGGATAGTGTCGTTCCTCCATTTTCCAAAATGTAACGGATATTACTACATAAGACCGGAACGAAACGGCTACGAATTAACGCATTGAAAAAGTGAAATCCTAGTGCTAGAAACGGATTCAAAATTGCTTCAACAAATTAGAATATCCCTTTTGCATTTGTATCGCTTAATTGCTGTGTTTTTGTGTTACTAAAGTAGTGTTAGTAGTGTATGGCGATTCGCCAGGGGATGGCTGCGTGTAGTGTCGTGTAGTGTCTAACGCGCGAAGCGTTAGAAGTGGAGTGAACAATAGAGCCAAGAGAAGAGGTCAATCAAGTGCATAGTGCCTTTTTTGTTTTTTTGGTTGATTTTTTTTTCCTGCGCGAGAGGAAACCAATTCTCTCAGTAGGCAGTGGCAAAGCAACGGGGGGAAACCATCATGGGCTTCTCGTCTGCGCTGCAAGGCCGAGCGGCACACGACGCGCTGCTCAACCGGCAGGAAGCGGAGCTGAAGCTGCTGGAAACCATGAAACGGTGTCTGGCACAGAAGGCAAAGTGTGACCGGGAGTATGCCGTCTCGTTGGCGGCCGTCACCCAGCAAGGATTGAAAATCGATCGCACCGATGATCTGCAAGGAAGCCACATTATGCGTGCTTGGCGGGGTTTTATGGAAGAACTCGAGCACACTGCCAAACAGATTCGCTCCAATGCCGAGCAGCTGGAAACGGTTTGTCACGAGAAGCTGGCCAGCCTCTACCAGGAGAAACGCCGGGTCCGCAAGCAGTACCAGGAAGAGCACACCAAAATTGCCACTCAGTTCAGTCATCTCACAGAAGACGTCGCACGGAAGAAAAGCGAATATCAGAAGCATTTAGACTACTACAAACTGCTGCGAGGTCGATTCGAGGAACATATCAAATCTGGTCGGTCTGGGCGAAAGCTGGACGATGTCATCGACAAGTATCAAAAAGCCTGCCGGAAGCTGCACCAGGCCCACAACGAGTACGTTCTGCTCATCAGCGAGGCGGTCGAGGTGGAGAAAGATTTTCGAACAACGCTACTGCCCGG
CCTTCTCGAACACCAGCAGACGCTCCAGGAAGGATTCATCCAGGCATGGAGCAATCTGCTGTCAGAAATTGCAAAACTCAGTGACACCACATCGGAAAAGTACGTGGAAATACAGCGACGCATTGATACGAGTATATCGAGCATCAACTCGACGGAGGAGTATCGCGAGTTTACGGATAAGCACAAAACATCACCGACCACGCCGGTCGTCTTCCAGTTCGACGAAAGCCTCGTCGAAGACAGTCTCGGTAAACTCCAAGCGAACACGTTGACCGTCGACAACCTGACGGTGGATTGGTTACGCGGTCGCCAGGTGGAACTCGAAGGTACGATTAAGGATCTGCAAGAACGACAAGCCAAGCTGCTCGCCGAACCGAACGGAACCGGTACACTGGCCACTAGCAGCTCACCCGCTTCCAGCAGCCCGGTCAGTACACCGGGAACAAAGCCATCCACACCGATTCTCAACGGTACCGGAAACAGCAACGGGGCATCAGGCAAGGACTCTCAGCAGATTGCGGCCAATAAATCATCAAAGGAGTTGAACAACCTGCGGTGCCAGGAACGCCAAACCATGAAGCTGGTCGAGATGATACGAACAGCACTGAACGAGGTCGGATGCGAAGAGCTACCTTCCGGATGTGACGACATCGCGGTAGAGCACCTTATCGAGAACAAAAAGTCTGTCAGTCAGGATCTATCGCTGGACTCGCAACATAACAATCCATCGCAGGCGGGAGGATTTTTCACACTGCGCACGGGTAACGGTGGCAGTGGTGGTGGTGGTGGTGGTGGTGGAGGTGGTGGTGTGATGTCAATGTTAATAGATCAGTTGCGACGCAAATCAGGGCCTCCGGGAGCGGCGACTAGTGGTGGTACTGGTGGTAAGGCGGCACCCCGATCGGTGGGTACCACTCCAGCTCAAACACCCAAACCAGGACATCGCGCGACAGCAGCGAGCACGGTAAATAGTGTTTCTAGTCCCGCTACTATTACGTGTGAGCGTGTGCAAGCTTCTTTGGATGGCTTTCCGCCGCACGCTACTAACCACTACCAGCAACAACAGCAGGAACAGCCGCAGCTGCGACCGTTAGCTCCCTGTTCATCAGCAAGCTTGTACGCTGAGCTCCGTTCCGTTAATCCAGAGATCGATGATGAGCAATCCTTTCCATACCCCGAAAACCGCATTTCAAACGTTTACGTAGACATGGAAGCGTATCTTGGGATGCGGGAGCTCAGCCCCGATGAGAACAGCAGCGAACATGCATGTGCATCGTACACTAATATCAACAGCGACCATCTTCCTTCCCTCCGCCATGAACAAAGTTCAACCGCACACAACTCGCAAAGCAGTCCAATGGGCGATCTCCCTAATTCACGCACCCCCATGCTAGGGGACGATGATGGCGAAAGGCGAAAGTATCGTCGACTACGAACCATGGGCGATCGTATCGATGATGAGGATGATGATGCCGATACTGCTGAGGAGTTGAACGATTCGAAAAACAATTTACTACGCGAAGAGAGCTACGATGGTGGGGATCAACTAGATGAAGGGCCGACGGAATCGGAAACAAAGTATCTGACGATGAGGAAACGTTCATCGCCCCGCGCTGATACGACGACCCGCTGGAAGTCCTCCATCGAGCAGCACCTGGATGTGATAGATGCGCTGAACATCAAGCTGGACGAACATCAACGCCTCTCGGCCCGCCTTTCTGAGGATTACGAATACATACGGGTGCAGACACTGCGCCGTGAAGCGGAGCTGATAGCAGCAGCAGCAGCGGCAACAGCAGCATCTTCAACATCCTCTACCGCTGTACCGCAGCGTGCAGCAGCAGGAGGGACACCGTTCGAAAAAGCAAATAGCTTCCGCGAGAAGATCAAACGGCGCATCCGAGGAGCAAAGAGCTCGCAACTTAGTGAACCGGTAGAACCGGAAACACCGGATAAGGTGGCGAATGTGGTTGAAAGTTTTTCCGGCCGATTGCGCACAC
GCATTGCTTCACAGCGGCAGTTTCGGTTGATGAAGGAAACGGACTCGGCCAGTCCTTCCACCGATCGTGGTTCGATCACCACAAATGGCGGCGCCTCTAACTCGGCGGGTGGACGCCAGAAGAAAAAGAAGCGTAAGTCGTCCAAAGCGCACCGTGCCTTCAAGCAGCAGCAGCAGCAGCAGCAGCAACGAAGTGGTCTAAAACGGGATACCGAGAGTGAGCAAGAGGTGTATGACCAACCGCAGCAGCTGCTCCACCCGGCAAATACCTTCTCCGAGGATGAGCTGTTAGTAGACGAGCCACCAAGAGTCGGTTCACCGGAGCAGATGGTTAAACCGAGTGGCCAAAAGTTCTCGCAAACCGTACGCGCCACGTGGCGGGAACTGTTGCACTCGACGAACAAGGTCAAGGATTCGTCAATTAATCTCACCAACCAGCAGCAGCAGCACGATCGTATGGAAGAAAAGTTAGATCTTATCCCCAATCAGGACCGTCCCGGGTTGCTAGCAATACGGTTTACCTTTTCGGACACTGAGACACCCGAACATCACGGAAGCCGCCAGCTCGATGCAACATCATCAACAACAGGCGAAGGAGGAGAGTATTGTGTACCATTGCTTTTATCGCAATCGAGTGACGATACGAAGGCTCCTCAAATTCTCTCTTCCGGCGATAGCAGCCACCCGGCTGGTAGTAACAGCACCACCAGCAAGCTGGCTATGAACCTGAAAATCAATCTGAAGGAAAGGCTCACCAAATTGGTACACAAAAGGGCACTGATGATGGGTGGTGGAGGGACAGTGCCAGGTAAAAGCAATCTTCTGCCGCTCCATCAACCATCGGGCGAAATATGTAGGTCCTGCTCCAAACGTATCGTTCGCCCGGGAACCATACACCCGAGCCAGACGGTGTTGGATTTTGTAAAAGAATTTCCTGGCCTCGATATCTGCAACGGTGGCCACGATGAGGACGACGAAAACGACGATTGCGATGGCGACGGTGACAACAAGAAGGCAGACACCGCCCGTCCAGGCCGTGCAACCGAATCGGAAATGATCAATCTCGAGTATGAGGATATCGATGTGATAACGATTAAGTCCCACAAACTAACTGACCATTGTGAGGGTGGTGATGATGATAATGATGATGATGGTATGACGCTGTCCACAAACCGGCCACTGCATGAGGAAGAATGGTTCCACGGTGTGCTGCCGCGGGAAGAGGTGGTGCGGTTGCTAAGAAACGAAGGTGACTTCCTGGTGCGCGAGACGACGCGAAACGATGAAAGCCAAACCGTACTCAGTGTCTGTTGGAACGGTCACAAACACTTTATCGTGCAGACGACGGCGGAAGGCCACTACCGTTTCGAAGGACCGGCATTCCCCAGCATACAGGAGCTGATCGTGCACCAGTACCAGTCGGAGCTGCCGGTGACGGGCCGGTCAGGTGCGGTGCTGCGTAAGCCAGTGTTGCGCGAACGCTGGGAGCTGAGCAACGATGACGTGATACTGCTGGACAAGATTGGCCGGGGCAATTTCGGCGATGTGTACAAGGCGAAGCTGAAATCCTCCAAAAACACGCTGGTCGCGGTGAAAACCTGCCGCATGACGCTACCGGAGGAGCAGAAGCGCAAGTTTCTGCAGGAGGGACGCATCTTGAAGCAGTACGATCATCCCAACATCGTCAAGCTGATCGGTATCTGCGTGCAGAAGCAACCGATCATGATCGTGATGGAGCTGGTGGCCGGCGGATCGTTGCTGATGTTTTTGCGCAAAAATGCAACCACCTTGGGCCAGCGCCAGATGATGGGTATGTGCCGAGATGCGGCCGCCGGGATGCGCTACCTGGAGTCGAAAAACTGCATCCACCGTGATCTCGCGGCTCGAAACTGTTTAATCGGGAGCGAGAACATCGTGAAGATTTCTGACTTTGGAATGTCCAGGGAGGAGGAAGAGTATATCGTATCTGGCGGTATGAAGCAGATTCCAATCAAGTGGACT
GCCCCGGAGGCGCTTAACTTTGGAAAGTACACCTCGCTGTGTGACGTCTGGTCGTACGGGATCCTGGTGTGGGAGATCTTTAGCCGTGGCGATACGCCCTACTCAGGAATGAGCAACTCGATGGCTCGCGAGCGAATAGACGAAGGCTACCGGATGCCATCGCCGGAGGGTGCTCCACCGGAGATGTACCGGCTCATGCTCAAGTGCTGGTCGTACGAGCCCGAAAGCCGGCCACACTTTGACGAAATCTATACCGTGGTCGATGCCCTGATTCTATGCACCAAGGACTGACCGGAT\n>XM_009229646.1 Gaeumannomyces tritici R3-111a-1 hypothetical protein partial mRNA \nATGGAATGGAAAACTCAATATCTTGACGACACCGGAGGAAACTCTGAGATGAGGGGGTCGGGCTGCGACATTTACAGCCTGGCCGAGGGTGAGGGAAGAAGAGGGGAGGGGGGGGACGTGACGGGATACCAGAAGCGGCTCGCACCATGCACAGCACCCCGCCGCCGGCCTCGAGGACAGCACAGTCTGACCAGAGTGCCGAAAGCGATTACTGTAGATGGAAATGCAACAGAGGCGGACATGAGACGTGTCGCCGTCGGACAAGAGTTCAGACGAAGTCGCCTCAACATCATGGAGAGCCGACATAAGTATCTGCACGTGAGCATTAGCCATGGGAGGCGCTCCGGCTGA\n>XM_014964222.1 PREDICTED: Calidris pugnax CCR4-NOT transcription complex subunit 4 (CNOT4), transcript variant X8, mRNA \nACCTTCAAGTGCTGACCTTCTTGGTCTATTAAGTTATTATAAACTTTTGCTGCTCTGCGAACATATAAAGATGTCTCGCAGCCCTGATGCTAAGGAAGACCCTGTGGAATGTCCCCTTTGCATGGAGCCTCTGGAAATTGATGACATCAACTTCTTCCCTTGCACCTGTGGCTACCAAATCTGCCGTTTCTGTTGGCATCGTATCCGTACTGATGAGAATGGACTTTGTCCTGCTTGCAGAAAGCCATATCCAGAAGATCCAGCAGTGTACAAACCACTCTCCCAGGAAGAGCTGCAAAGGATAAAAAATGAAAAGAAACAGAAACAAAATGAGAGGAAACAGAAGATATCAGAGAATCGCAAACATTTGGCCAGTGTACGGGTTGTACAGAAGAACCTTGTCTTCGTGGTAGGACTGTCTCAGCGCTTAGCAGATCCAGAGGTTTTGAAACGACCAGAATATTTTGGGAAGTTTGGTAAAATACATAAAGTTGTCATTAATAACAGCACATCATATGCAGGCTCACAGGGTCCAAGTGCCAGTGCATATGTAACCTACATCCGGTCAGAAGATGCTCTTAGAGCCATACAGTGCGTCAATAATGTGGTGGTAGACGGCAGAACACTTAAGGCATCGTTAGGTACAACAAAATACTGCAGTTATTTTCTAAAAAATATGCAGTGTCCAAAACCAGACTGCATGTATCTACATGAACTGGGAGATGAAGCAGCCAGTTTCACAAAAGAAGAAATGCAGGCGGGCAAGCACCAGGAATACGAACAGAAACTACTGCAAGAATTATACAAACTAAACCCCAATTTTCTCCAATTATCTACGGGTACAGTTGACAAGAACAAGAACAAAGTGACAGCACTGCAGAGCCCTATCGACAAACCTTCAGATTCCCTCAGTATAGGAAATGGTGACAGCTCCCAGCAGATAACAAACAGTGACACACCTTCACCACCGCCTGGTTTAACAAAACCCAATCCAGTCATACCCATCAGTTCATCTAATCACAGTGCACGGTCTCCTTTTGAAGGGGCTGTAACAGAATCACAGTCGCTCTTTTCTGACAACTTTCGGCACCCTAACCCCATCCCTAGTGGGCTTCCTCCATTCCCCAGCTCTCCACAGAC
TTCAAATGACTGGCCCACAGCACCAGAACCACAGAGCCTCTTCACATCAGAAACTATACCAGTATCCTCCTCCACAGACTGGCAAGCGGCTTTTGGGTTTGGTTCCTCCAAACAGCAAGAGGACGACTTAGGGTTTGACCCCTTTGACATCACCCGCAAAGCCTTAGCAGACCTGATTGAGAAGGAACTGTCAGTCCAAGACCAACCTTCCCTCTCGCCCACATCTCTTCAGAACCCTACCCCACACACTACAGCTGCCAAAGGGCCAGGCTCTGGATTCCTGCATCCTGCTGCACCCGCAAATGCCAACTCTCTCAGTAGCACCTTTCCAGTCATGCCACAGAGGTTCCCACAGTTTCAACAACATCGAGCAGTTTACAACTCCTTCAGTTTTCCAGGCCAAGCAGCTCGCTATCCTTGGATGGCCTTCCCACGCAATAGCATCATGCACTTGAACCACACAGCAAATCCCACCTCAAATAGTAATTTCTTGGACTTGAATCTTCCACCACAACACAGCACAGGTCTTGGAGGGATCCCTATATCAGGTATCCCAGCCTCCACAGGAAACAGTTTAGACACCCTTCAAGATGACAATCCTCCACATTGGCTAAAATCTCTTCAGGCCCTCACAGAGGTGGACGGCCCCAGTGCAGCACCATCACAGACGCACCACAGTAACCCCTTCGGCACACAGATCCCTCTGCACAGAGCCAGTTGGAATCCCTACTCTCCTCCTTCAAACCCCACCAGCTTCCATTCCCCACCCCCAGGCTTTCAGACAGCCTTCAGACCCCCCAGTAAAACCCCCACAGATCTACTACAGAGCTCAGCGCTGGATCGTCATTAGGAAAGGAGGAAAAAGAAGAGGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAGAAAAAAAAGAAAAAGAAAACCCAAAACGTTAGAAATGCAGGAAGTGTCCCACCCTGACTCCTCCCCATGCCCACCTACTGTTCCCTGTCATATCTTTCTTTCTGAAGAATCCAGTTCCTGATCAAACCTCCCCCCCAAATGCAATGCCATCACAGGGTCGTGACCGTATCTTTTTGTTAAGTTTCTGCTGAGCCAGTGTTTGAAATACACTGTTTGAAATATTTTCTAACCGTTCTAAGGAAAAAAAAAAAGAGAGAGAGAAATCAAAATGCAGTCTCAATGCTTAAGGAGAATATTACTGTCTTATGTCTTTTGCACATGAGTATTTCTGCCTAGTGGAAAAGTGTCAATCTGCAGTAGGGGAAAAATTGCAATGCAGAATCAAATGCAGAAACATGAAAAAGGTATTTAATTTAAATGAATTTACTGAACATGTGGGGCAAGCAGTGGCCTAGCATTTATTTTGCATTCAGTGTGGCACTACACAGGGAAATTGCTATGTTTTTTTTTTTTAAGGGGGATTTTGTGTCAGAGTTTGACATGAAGTGTGTTGAAAGACAAAAAACACTTATAGCTACGAGTAAGTGGCATGTTGCTAAAGAGTGATTTAAAGAGGGGAGAATAAGATTTTTCTTTAATTTTGGCTTTAGATTTAAAGTAAACTTTAATGTTTTAAAAGTATTCACAGATTTAATACCTAGCGTATACATAATATAATTATAAGCAGCTGAAACACGAGTGATATTTACTTCAGTCTTTCTGTCTCCTCTGTCAGTCTCTCTTTCTTTTTTTTTAAAAAAACAAAGATTCACCTGATTAGGGCACTCTGGGATAGCACTGCATTGGGGCCACATGATCACCATCAGGAGCAACCTCTGACCTCCTCTGCCTGCAGCTTTTACTTAACCCTGTAGTTTCTGGACGTTTGTGCAGTATTGAAAAGACAGGAAAAAAGAAACAGATAAATAAACATGGTTATAACCTGACTCTAAAACTAAAACCAAGGAAATGTACCTCTTTCTTCAGAATTAAAACTAAAATCTTAAATAAAACAGAAAACTTGATGATGA\n>XR_005915111.1 
PREDICTED: Gossypium hirsutum xylose isomerase-like (LOC107963207), transcript variant X1, misc_RNA \nATTTTGCAGGGTTTAGTTTGATACTTTGAGTGATATCAGTAAAGAAGAGTATGGCAAGGAAGATTTCATATATATTTCTTTGTATGAATGTGATCCCCCTTTTAGCGGCTGCTGCATCACAAGCTTGCTCTGCTCAATCTGATGCAAAATGTTCTCAAACCGGTGAATGGAATGGGGAATTTTTCCCTGGAATTCCCAAAATCAAGTATGAGGGTCCTTATACCAAGAATAAATTTGCATATAAATGGTATAATGCAGAAGAGGTGATTCTTGGGAAGAAAATGAAGGACTGGTTGAGATTCAGTGTGGCATTTTGGCATACATTCCGTGGAACTGGTGTTGATCCTTTCGGTGCACCTACGAAATTTTGGCCATGGGAAGATGGTACCAATTCCATTGCTATGGCAAAAAGAAGAATGAGAGCCAACTTTGAATTCATAAACAAGCTTGGTGTTGACAGGTGGTGTTTCCATGACCGGGACATTGCTCCCGAGGGCAAAACACTTCAGGAAACTAATTCAAACTTGGATGAAGTGGTGAAACTTGCTAAAACACTTCAGGGAAACAATATCCGTCCACTGTGGGGTACGGCTCAACTATTTATGCATCCTCGTTACATGCATGGTGCTGCTACAAGCTCTGAATTGGGTGTATATGTATATGCTGCAGCTCAAGTCAAGAAAGCCATGGAGGTGACACACTATCTAGGGGGAGAAAACTATGTGTTTTGGGGTGGTCGTGAAGGTTATCAAACACTATTGAACACAGACATGGAATTTGAACTTGATCATATGGCAAAATTTCTTGAAGCTGCGGCTGCCTACAAGAGGAAGATTGGATTCACCGGAACTCTACTGATTGAACCTAAGCCTCAAGAACCTACAAAACATCAATATGATTGGGATGCTGCAACAACAACTAATTTCTTGCGAAAATATGGGTTGATCGGGGATTTCAAACTTAACATTGAGTGCAACCATGCCACACTCTCTGGTCACAGTTGCCATCATGATGTTGAGACTGCAAGAATCAATGGATTGCTAGGAAATATTGATGCAAACTCTGGCGATGCTCAGACAGGTTGGGATACAGATCAGTTCTTGACAGATACTCGAGAGGCAACTATGATCATGCTAAGTGTGATTAAAAATGGACACTGAGCTTCTTATCGTTTGACCCAACAGACCTTTGGTGTTCGATGAGAATTTATTTATCATATTTGGTTCACTTTTGTTTATGACAGGGATGCAAAATTACGGAGAGAGAGCACAGATGTTGAGGACTTGTTCATTGCTCATATTGTTGGTGTTGACACCATTTTTTTTGATGAAAAACGGTGGCGACTTCCGTTTTTTTCGAAATCATTTATTAAAAACAACCACTTTTGGAGGTGATCCGATCACACCTCATCAAAAAGGATCGGTGGCGACTCCCGTTTTCGTTTTCATTTTTCAAAACCCAAGTTGATCCCGTTTTTCATCCAAAAAAAATGGTATCAACAGTTGGAATGGACACCTTAGCCCGTGGACTCCGATATGCTGCCAAGTTGATTCAGGTAATACCAATACGAACATAAAACAAATACATATATGTAAAATACTTTAAACATGATTATGACACGATAAATTACATGAATACGATATAGATACATGATATTAATGAACTTGATGATTATATAGGATGGTTCTTTGGCTAAGCTTAGTCATAAACGATATTCAAGCTTCTATAATGAACTCGGTGCCCTCATTGAGGCTGGTAAAGCTGATTTTGAAATGCTTGAGAAGAAAGCAATGGAATGGGGCGAACCTACGGTTGCTTCAGCCAAGCAGGAACTTGCGGAAATGATCTTCAACTCTGTGCTATAAGAGGGACCTTGGCTAGCAATGTCTTTTGCAATT
TAGCATTAGGAGTAATTGATGATGTTCAATAAGTACAGTTTATGTAATTTTCATTTTTTTTTTTAGAAATCTTTTGTACCTAAATTTCACTCTCTCTTTTTTAATTTGGTATTTAATTTTTTTATGTCCAATTTGGTAGA\n>XM_033267273.1 PREDICTED: Anneissia japonica uncharacterized LOC117121888 (LOC117121888), transcript variant X1, mRNA \nCAGGCGCTGACATTGTTATTAACAAACCTACTTGGTACTTTGTAGATTTTTTATTTATTTGTGCTCGGAAAATTACGAGAACCTGGGATGCAATTTTTTTGTTATGACCCACCCTTTCTACTGAAAATGAATTCCCTAAGATTATTTTACACCATCATTATGTTTGTGGCAGTCAAAGAAGTAGAGTGTGAGGTGAAAACAATATATTTTTGTCCTGAACAGAGTGCAACAATATATTGCAATGTTACCAGTGATTTCACCAAATTATATTGGAAAAACTCTACAGATTATGTTGTAGCATCACAGACTGTTAATAATTGCAAAATTACCAAAAAAAGTCCAAATAAAACATACTCCTCATCTGACCGATTTGAAGTCCAAGGATTATCATTGAAAATAGCATTTCCAAAGGATGGTGAACAATTCTATTGTGATGTTGTATCGAGGAAAAAAGAAATAAAACAGCATTTTACTCTAGACGAGTACAGTGAACCTTATCCTGATGATGTGTGCAGTTCACCAAAAGACACTAACAAAACAAAAAGCAGGCAGTTAAGAAGCGGTGGAACCAACAAAATTACCCGGGAAATCAATGAAACAAACTTTGTATGCATAAATGGAAGAACTGTTTTAAAATGTGATAACGGGCAACACGATAGGCCTATCGCAGAGTACTGGGAAGATAGATATGGCAAATTGATTGTGTCTAATGTGGATGGGAGACTATCAAATACGTCCGATGCCAGATATGTATTTAACCATATGAATTCCACATTGTTAGTCCAAAATCTATCAGAATGGGATCATCTATTTGTTTGCAAAACTGTCTACAAAAATGAAGATATCATAAAATGTTTCAATTTACAGGAATATGGTACACCAAAAGACAGCTTTTTTGAGGGATTTGAAAACAATAAATGTGAAGTAGATGCAAATGAAAATGGCCAGGTCATTGTACCATTCACGGTGGCTTGTTTCAGTCCAGTGAATGCAGTAACTGTAGTTTGTGAACTGAATGGAGAGTGTAATGATACAAACCCGCAGTATAATGTAACCGATGACGGGAAATTTAATTCACAAATTTGTATAGATAGGAAAATCGAAGTGAATAAAAATTTGACATGCACATTGACTGGTCCTGCTATGTGTAACCATTCTCAAGAATTTGTTTGTCACTTCAAGTTCAAGGAAAACAGTTCAAGCAGTATCAGAAATTTAGTTATTGCTATTTTGTGTCCTATTGTGGGTCTTCTTGTGATTGTATTTGTGTACTTACGTTGTTGTCAAAAAGAGGAAGAGGAACATAGCAAATCACAAGTTAAGATGCCATCTGAGATTCCCCCCATCCAATACATCACAAGCTCCGACCAAGTAACAATAACTGCACCTCAGGAGGTCACTTAATTGAGGCATGTCGTGGTGAAATGGTTAAGTTGTCGCACAGACCAGTACTGAGTAAATGAGCTATAAAAAATGGGAGCTCAAAAAATTTCCTGAAAATCCAAATTTGTTTTCCACTATTATGGATCAACAGTTTAATGTCTTATTAATCATGTCCCAAAGTATTAGTTCTGGAAAAGTTCATCAAATTGTTTATTTAACGTTATTTTGATATTTAATTGTATTTAACAATGCACAAATAACTTCAGAAGGCAATACTGTACTCAAAATTATGTTTATCTTGGCTATAAGAGTGCTGTACATTCACTTACCAATAACTTGGGCTTGAAATTTCCA
ATTTTAATGAATGACCCCCCGTTTTAAAGATTCCTCTTTTGTCTTTCATCTTTTGTGATCTGTTGGGCTTTGTCCCCTCCCTTGTCGTTATTTTAAGGACGTGACCCTAGAGAGTTTCATTTATATTTTCCTTTTATTATTTTTGTAACATGTTCTTGTTGGTTCTGAATAAAACTGATTATATATATATACTCAGGTATCTTAAAATATGGATATTTTAGAGGAGTCTTGAATTGGTGGGTGCATTGTACTATCTTCACTCCTTTAATCCCGACATGTCTTCAACATGGGGATTTCTAATTGTCAACATGGTCTTGTCAAATTGATCCTGCATAACTTCTCCTTGGCTGTGTTCTCCACCACAGGACACAGAATCTTGATGAGAGGGAACCAGCTCCTCATATTGATGTCATTTTCATTGATTGGAGAGGTGTATTTTATCTAATTTGATATGCTTCTTTCTAAAATGTGCAATTCAATGCTATTAACTTTTCGTTTTATATTTAATCTAACTTTTAGTAGATTTTTAACTGTTAACTTAATTCAATCTTATATATATTTTATCTACACTTTTTAATGTTTTAAAACCATTAAAAAGTAATCGTTTAATGTGCAATGTATAAATGCCAAGGTCAACTTTTTAATTATGATGCAATATATTATTACTATTACTAAAACTCTATACGGCTATGTTTGCTCTATGCTCTATGTTATAATGTAACAATACCTTAGAATAACTCTGTACAATATTTATATTCTTCTAACTTTTATGAGCTTTGTCAGTTGTGGAGACTGCATACACTTTTTAATGTTACATATTCTTCATCAATACCTCCACACCAAAGTTCATCGTCGTAATTTTGTTACCGTCAATCCCGCGTTTCCGATCTCTGTATTTGTTATGATATCACTAAGATTGATATAATCAAATTTTCTCCATTTCTATCATATTGATAGTGGACTAGAATTACTGTTGTTGGTTTTACTAACATGTTTAAGGGCAAATTTAGACAACACTGGGTTGAAATTTTTCATATTTAGTGTTATTATTGTACTTTGTATACTAGGCTCCTAAGCCTCAACTAGTGGAGTAAATATGCTCAAACAAACTGACACCATTCAAATAATTTAATTCTCGAACTCTAAATAATATGGTAATAAAGAGGGCTTAATTCCCACGTTTGCCATCATTACTATGTTTGCCATTCATCACTACAACTGAAATCAACAATAAATTCACCACAAATAGATGAGATAGTAAAAAATGATTATGTCTGATTCTATTTAATTTGTTATTAATAATAAGCCTGAAAAAATGAAAAGAGAGAAAGTATATATTGTAGTTTAAAATGTCAACTGTTCATAGTAGGGCCTATCAAATAGGGCCTAGGCTTAAATTAAATGACCAATCAGAACGTGTTATTTTTTTTTTCTTGTATTGCATTTTACGAGAAGTACCAATACTGAGTATGATGGTATGGCTACATGATGAATATGTAACATTAAAAAGTGTATGCAGTCTCCACAACCAAGTTCGTCATCGTAATTTTTGTTACCGTCAATCCCACGTTTCCAATCTTTGTATTTGTTATAATATCACTACGATAGAAATAATCAAATTTTCTCCATTTCTATCATATTTACAGTGGACTAGAATTACTGTCGTTGGTTTTACTAACATGTTTA\n>XM_004993437.1 Salpingoeca rosetta uncharacterized protein (PTSG_12341), partial mRNA 
\nATGTCGCGGTTTGTGGTGGCGCTGCGGCCGTGTGGACAGCTGCGTGAGCGGCTCACAGAGCCCTTGGAGCTGAGTGCTGGAGTGCACATCCTGGGGCGAAGCCCACAAACCAAAGTGAAGCAGCAGTTGTGCAGCCGACGCCAGATTGAGCTGGATGTCGACACCGCCCGCGGCACCGTCACCCTCAAGCAGCAGCTTGGCCCAAACGCATGCTCTGTGAATGGACAAACCATCAGCCGAGGGAACAGTGTGGCGGTTTCGCGAGGCGCCCGCATCTCCATGTTGGCAGACAGTCCAGACGAGACCACGTTCACCCTGGACATCCACGAGTACGCGCCCTGTGGCATGACAACGCCCGAATCAACGCCGCTAACCCAGTTTGACACGTCAGCGTCCAGCACCGCGTCTTCTGTACGACCTGACGCGACTAGTTTTGACACAAAGCCAAGCGCACATGCCCCAGCCATCACCATCAATCTCACAAGCAACACTGGCGCCGCCACAATCACCATCACCAACAATATCACTGCTGCAGACGATGCTGATTCATCGCGCTTGACGACACCAGGCGGTGACGCCGTTACTGAAGAAGACACTGGACAGCCCAAGCAGCGCAGCGACAAGCAGCAGCGACGTGTCACCAGCGAGTGTGTGGACCACTGGGCAAATGCGCTGACGGAGTTGGTGCGTCACCCGGAGCGCCATGCTGATGACATTGTCTACGAGACCGTCGACACGCTCGTCATCAACGACAAGTACCCAAAGGCGCGGTACCACTTTCTTGTGCTGCCCAAACGCGTGATCACGGATCTGACGTGCCTCACCCGACATGACCGCCACCTCATCCAGAGACTGCAGGAGACAGCCATGACCTTTGGCAAGATGATTCAGGAGGACAAGCCAGGCGTCAAGTTTCATACGGGGTTTCACGCCGTTCCCAGCATGAATCAAGTGCACCTTCACTTGATTTCGCAGGATTTCGACTCTGTGTCCCTCAAGAACAAGAAGCACTGGAACTCGTTCAACACGCCGTATTTCGTTCCTGCTCGCAAGGTGTATGAGATGCTGAAGAATGAGGGCCGAATCCACTTTGATGAAGCAAAGTACAAGGAGTATTTGAAGAAGCCGCTGGTGTGCCACCGGTGTCGCCAGGAGATGCGCAACATGCCCACCCTCAAGCGGCACCTTAAGGAGCACCTCACCAACCCCTAG\n>XM_046397594.1 PREDICTED: Scatophagus argus UbiA prenyltransferase domain containing 1 (ubiad1), transcript variant X2, mRNA 
\nTGCACGATGTTGCACTTCTGGAAGAGGAAATGGCGCCCGTCAGGTGCAGCAGGATTTACAGTGGCCAACCAGTCAAGTCCCCTCGTAGTTGACACGTAAGCCACCTAACTGCCTCTCGCTGCATCAGGCTCATCGGACACAGAAGTATGATTTTAAGTAGTGAGAAACCCAGTTTGTGTCGGATGGTGAAGACGTAACGGAGCGCTGCTGGTACTGCAGACCCCTTGCATCGGAATGGCCAAAGAGCAGAAACAAAGCAGGGCAGAAACATTTGTGCTGGCTGGATCTAATGGTCACAATGGCCAGCAGTGGCAGACTGGTATGAATAACTTGGTCACTCACTCTCCTGGCACTAACCACAAGTCGAGGATGGCTCGCGTTGCCTCGGACATGAGGCAAAAGTGTGCGGCCTATGTGCTAGCACTGAGACCGTGGAGCTTCAGTACCTCGCTGACGCCGGTGGCCCTTGGCAGCGCTTTGGCATACAAACTGGATGGCTCTGTGGACTTGGTCATCCTGATGGTGTGCGCTGTGGCTGTTCTTGTTGTCCATGGGGCAGGAAACCTTGTAAACACGTACTATGACTTCTCCAAAGGGATAGACCACAAGAAGAGTGACGATAGGACTCTTGTGGATGAAATCTTGGCACCGCAGGATGTTGTTATGTTCGGAGCATTGTTATATTCTTTAGGCTGCTTGTGTGCCACTCTGCTCTACTTCCTGTCAACACTTAGACTGGAACACCTAGCCCTTATTTACTTTGGGGGACTCTCCAGCTCTTTTTTATACACTGGAGGCATCGGCCTCAAGTATGTGGCCCTAGGAGACTTGGTAATCCTCATTACCTTCGGTCCTCTGGCAGTCATGTTTGCCCACGCTGTGCAGGTTGGCTACCTGTCAGTGCTGCCGCTGGTCTATGCCGTCCCACTGGCCCTCAACACGGAAGCCATCCTCCATAGCAACAACACCAGAGACATGGACTCTGACAAGCAGGCAGGGATTGTCACCCTGGCCATCCTCATAGGCCCCACACTGTCCTACGTCCTCTATAACCTCCTGCTTTTCGTCCCCTACGTGCTCTTCTGCATCCTCGCCACACGTTACACCATCAGCATGGCGCTCCCTCTGCTCACGCTGCCCATGGCCTTCCCACTGGAGAAGCAGTTCCGCAGCCGACGCTATGCCAAGATACCCCAAAAGACGGCCAAGCTCAACCTCCTTATGGGACTTTTCTACGTGTTTGGGATCATTCTGGCACCTCCTGGCAGCTTGCCGTTACTGTGATTAATTAGCTTTGATATTTCAAATTTTGTTGTTTTAATACAGACTAGTTTATGCACCTCTTTGTATTTGTACAACGCTGAGGGCTTTTCAAAGGCTTTAATTTATTGTCTAATTTATACATTGAACAGAGATCTAGTTTAGGTCCTGCTCTGTCACACTGAAGGCATAATCAGATGTATTTTTTCAGTATTAAGCCTGCTGTAATGTGTTGGTGCAAGTAAGAAGTGTTGGTGTCATTTTGTAGAGGTAGGCAGCATTTTTATCATACAAGGACAGACAGTAAACCTACAGTTGCCATATTTGCTGTTCTTAAAAACACAATACTACAATGT\n>XM_045050371.1 PREDICTED: Felis catus zinc finger protein X-linked (ZFX), transcript variant X5, mRNA 
\nCTCGGGTTGTTCCGCTTCCAACTACCACATTCAGAGTTGGCTATCAAGTGGACGGATTGCTAGACTCTTACGTTGATATTCACACTTACGTATCTTTTTGTCCTGTATCTTTTTGGCCTCCATTGGTTAAGGGGAGCACATTCTTATTCCCTTCGTTAAAAACCTGGTTCCCTCATAACCAACACTCCTATTCTTGTCTTTGACAGCAGCGGTCTCAAAACGTCAGTGTCCTCTTCAGTTAATCTCTTGCCCATTTCCAGCACTGAGTCCTATTATTTCTCCCTTGCTTACATCTCTTCCTTCTACTTTCTGCCACATGGACAGGCTCCGTCATCTCATTCTTAGTTTGCGGTAACTTTTATTTTCCTTACCCTTAGTCTCTTTTGTCTAGCCCAGCAGTTAAAACACTCATCATAAGATAACATGTGGATTGTGTCATTTCTCCATTTTCCGTTCATGACCCAGCAGTTTTTCAGAACACTTCCCATACATTCCCATTTGATCATCACAACAGTCCTGTGAGGAGCTGATGCTACACACATGGATGGTGATCAAATTGTTGTGGAAGTACAAGAGACTGTTTTTGTTTCAGATGTTGTGGATTCAGACATAACTGTGCATAACTTTGTTCCTGATGACCCAGACTCTGTTGTTATCCAAGATGTTATTGAGGATGTTGTTATAGAAGATGTTCACTGCCCCGATATCATGGAAGAAGCAGATGTATCTGAAACGGTCATCATTCCAGAGCAAGTGCTGGACTCAGATGTAACCGAAGAAGTTTCTTTAGCACATTGCACGGTCCCAGATGATGTTTTGGCTTCCGACATTACTTCAGCCTCAATGTCTATGCCAGAACATGTCTTGACGAGTGAATCCATACATGTGTCTGATGTTGGACATGTTGAACATGTCGTTCATGACAGTGTAGTAGAAGCAGAAATTGTCACCGATCCTCTGACAACGGATGTCGTTTCAGAAGAAGTACTGGTAGCAGATTGTGGCTCTGAAGCAGTCATAGATGCCAATGGGATCCCTGTGGACCAGCAAGATGATGACAAAAGCAACTGTGAGGACTACCTTATGATTTCCTTGGATGATGCTGGCAAAATAGAACACGATGGTTCCTCTGGAATGACCATGGATGCAGAGTCGGAAATCGATCCTTGTAAAGTGGATGGCACTTGCCCTGAAGTCATCAAGGTGTACATTTTTAAAGCCGACCCTGGAGAGGATGACTTAGGTGGCACCGTAGACATTGTGGAGAGTGAACCTGAGAATGACCACGGAGTTGAATTACTTGATCAGAATAGCAGTATTCGTGTGCCAAGGGAAAAGATGGTTTATATGACTGTCAACGACTCTCAGCAAGAAGACGAAGATTTAAATGTTGCTGAAATCGCTGATGAAGTTTATATGGAGGTGATCGTGGGAGAGGAGGACGCTGCTGCCGCGGCGGCCGCCGCCGTGCACGAGCAGCAGATGGACGACAACGAAATCAAGACCTTCATGCCAATAGCGTGGGCGGCAGCTTACGGTAATAATTCTGATGGAATTGAAACCCGGAATGGCACTGCAAGTGCCCTCTTGCACATAGATGAGTCTGCTGGGCTCGGCAGACTGGCTAAACAAAAACCAAAGAAAAGGAGAAGACCTGATTCCAGGCAGTACCAAACAGCAATAATTATTGGCCCTGATGGACATCCCTTGACTGTCTATCCCTGCATGATTTGTGGGAAAAAATTTAAGTCCAGAGGTTTTTTGAAAAGGCACATGAAAAACCATCCCGAACACCTTACCAAGAAGAAGTACCGCTGTACTGACTGTGATTACACTACCAACAAGAAGATAAGTTTACACAACCACCTGGAGAGCCACAAGCTGACCAGCAAGGCCGAGAAGGCCATCGAATGCGATGAGTGTGGGAAGCATTTCTCTCACGCTGGGGCTTTGTTTACTCACAAAATGGTGCATAAGGAGAAAGGAGCCAACAAAATG
CACAAGTGTAAATTCTGTGAATACGAGACAGCTGAACAAGGCTTATTGAATCGCCACCTTTTGGCGGTCCACAGCAAGAACTTTCCTCATATTTGTGTGGAGTGCGGTAAAGGTTTTCGTCACCCGTCAGAGCTCAAGAAGCACATGCGAATCCATACTGGGGAGAAGCCGTACCAGTGCCAGTACTGCGAGTATAGGTCTGCAGACTCTTCTAACTTGAAAACGCATGTAAAAACTAAGCATAGTAAAGAGATGCCATTCAAGTGTGACATCTGTCTTCTGACTTTCTCAGATACCAAAGAGGTGCAGCAACATGCTCTTATCCACCAAGAAAGCAAAACACACCAGTGTTTGCACTGTGACCACAAGAGTTCGAACTCGAGCGACTTGAAACGACACATAATTTCAGTCCATACGAAGGACTACCCCCACAAGTGTGACATGTGTGATAAAGGCTTTCACAGGCCTTCTGAACTCAAGAAACACGTGGCTGCCCACAAGGGTAAAAAAATGCACCAGTGTAGACATTGTGACTTTAAGATTGCAGATCCGTTTGTTCTAAGTCGCCATATTCTCTCAGTTCACACAAAAGATCTTCCGTTTCGGTGTAAGAGATGTAGAAAGGGATTTAGGCAACAGAACGAGCTTAAAAAGCATATGAAGACACACAGTGGCAGGAAAGTGTACCAGTGTGAGTACTGTGAGTATAGCACTACAGACGCCTCGGGCTTTAAACGGCACGTTATCTCCATTCATACGAAAGACTATCCTCACCGTTGTGAGTACTGCAAGAAGGGGTTCCGACGACCTTCAGAAAAGAACCAGCACATAATGCGACATCATAAGGAGGTTGGCCTGCCCTGATAGTCCTTCTACAGACATTTATGGAGATGTTGGCCTTGAAGCAGAAATCTCATTTTAAAGCCAGTCAGTCTCGTTCACATACAATACTGTATATTGATTTATGCTGTGTACAAATAGAATTATTGCTTCTAGTTGAGTTTTGTTGTTTTTTTTTTTTTTTTTTTTTTTTACATTTTGTTTAATAGTGTGTTCTGAATTCTATTCAGTTTGTTTAATAAATGGGGGAAAGCAGCAACAAATAAGTTGCTTTTAATAAAGTAATCCTTGATGCTATACTGGATTTTTCTATCTTACAAGTTTTATATTTATTTAAATATTTACCTTGCTTACCTTGATGGTACTCTTCTAAGACCATTTAACTTAAAGTTAAGGTAACTTTAGATTGGTAACTCTGAAAGTATTCGTGTTGACTCATTTTTTTTTTTTTTTTCCCCATGAATTTCTCACAATAAAATTGTCAGAGACATCTACTAACATAAACGGGAGATTTTACAGTCAGGTCTAATTATCCTAACATGGAAGTCCTTGACTTGTCTTGCTTGCTCTTCTCAGACCACATGACAGTGAAAGTTTCCATTTGAGCTTTTGCCACCCGGGCATCGCTGAGGAAAGAACAGTGGCTGGGTTCGTCTTTACTTTTCATTTCGTTGAGCAGACAAGCTGTACTTTTTGCAGGGAGGGGGGGGTGGGGGGGGGGCTTTCTTTGGTGTATTTACATCTTTTGTCAGCATAGCAGACTTCTAGAAAACTTCCTTGACAAATTTTGCTTGGTCATGTTGTATTTTGATTATTCCGTCTGTGCTGCTTTGTCTCGGAATGGTTGTGTGTTACAAATGAGATTATCGAGGACTGCATTTTGGAATCTCCTTGAGGTAATTCGTGGCTCGTAGGATCTTTTGCGACTTTATATATGTAAATGTACCCTGAATTATATATATGCACATATATAGAGAACATGTATCTGTGTGTATTGTTTATTTTACATATTTATACACACAACCCCAGTAGTAGTTGTTTAAGATCTATAATGAAAAGTATTAAATTTACAATAACACGAAAGATGCAGGGATGCATGAGAGAGCATTTTGTAAATCATGCTCTTCAGAGAGACTACTCAGGTGAAGAATTAGAAGGAA
AATAAGGACACTAGTATTTTTAAAGAGTTAAAGGTATTTTCTTTTAAATATCTTTGGTAATTGAAAAATAGACGTTACGATGTTTCTAGATAGAATGTTTTCATACAACTTCAGCTCCATGCCTTTATATTTTTCTGAAAAGCTAATGAGCATCCAGGCAGAACTCCCTCCGTTCTCTCAGAGAAACTCTTGAGGGAACTCTGTGTCTGTCACCCAGTGAAGGGGGATTAAGGAAGCCACAGCTCCGTGTCCCAGAGATTGGGTGCTAATGATGACTTCCGCTTGGCAGGTCCAGCCTGCTCTGTTATGTCTTAGTTACAGTTAGCAAACTTTAAAAACCTGAACACCCAAATTGGCTTTGGTTAGAAGATAAAGGTGTGTTTAAGTGCATGAGGAAAATCTGAGGCCTTATTTGGAACATCCCCAAGTCTTTCACGGTTTCGTTTTTCTTTGAGAGTTGGTATTTTTTAAACAGTTCTGAATCAGTTCAGAAACGCATACACTGAAGTCAGTTACTTAGAATTGGATCATGCGAAGATGGGTCTTGGAAAATGGAAAACAGTTTTTGGGGTCCTTTAGATGGGATGTCAGCATGTGAGTATCCGGCACGTTGTAGGAGATTTAGTAAGGACTTTTCTTCCCACCTGATAGCTGCCTTGCCACTTCATGATGGTGCTCCTTCCCCTTTGTGCTGTTCGGGTTTAACCTTTCATCTTTCTCTTTGCCATTGATACTTGTATTCAAGAATTCTATTTATAGGGTTAGAAATCTAAATATTTGGTGTTTGGCAAGCCTCTGAAGTGCTAGATTGATTTCATCCACTTGGAAATCAAGTGCTTTAGGCTGGTATGAACTCCAGCCTGAATGCCAGTTAAAGCCAAGGCATGGGCCTATCCCAGCGGGAGCTCCTGTGCTCTCTTGGCCCCATAAACATTCTTTTTTTTTTTTTTTTTTTTTTTTTAAGCGTAACTTACAATTGTGTGATTCATTGCCCTGCAGTACTATTCTTGAAAGCTCTGTCTGTTTTTTTGTGAGAACCTTTAAAATCTCCCTTAATTTCTTTTTCCCAGAAGTCATGTAAAAGAAAACACTTAAGTGAAAGTGGAAAGTTATTAACTTTAAAACATGCTGTAAAATTAGTACAGAAAATATAAAGAATTGGTCATTTAACTATATTTTTTTAAATAAACTGAAAGATAAAGAACACAACACTGTACACACTTTATATTTCTCTTACATAGTCTGGAATCATACACAGCTATTTTCTTTTTAAAGCACAATATTGAAACCTTTAAAAGGTATTTAAGGGTTTGGTCAAGTGAATATGATAAGATGTATTTGTCTGTATAAAGAGAAAATGAACTTGTAGTCACTGTTATGTACTGACATTAGTTACAACCTAGTTTTAATTCTTAAAACAATTTTGATTAGCAAAGCTAAAAAAAATGGATGTTTCAGTTAAATGTTTTAAAGAGGTACAGATTTTTACAAGGACATAATATAAGTTATTGTTCTGTAGAAATATCCTATTAAATATTGTATGTCCCTCCCTCTGTACACTTTGTAAAAAAAGTAAAATACATAAAAAGAAAATCATATAGGGATGTGTGACATTATTGTAATTGTGTACTTGAGAATAACGTGCAAAAATAAAAATCAGAATATTTTCCTGTTAATGGATGTTTAGTCTATTTGATACCAGTACTAAGTTAATGCTTTTTCTTAAGGAAAAAAATGTACAGTTTTTGTAAACCTAATAAACATCAAAAGCAGTGGATTA\n>XM_008507523.1 PREDICTED: Equus przewalskii developmentally-regulated GTP-binding protein 1-like (LOC103540855), partial mRNA 
\nATGAAAGATGAAGAGTCATGGACTCTGACAGGCATGACATGGAGAACGGCCCAAGGTGTGGTCCCACCAAGCACTAGGGGTCTTCAGGTCCCCTCCCCGAGAAGCCTGATGACCTACCTCAAGGGCATGACTGGACCTGGCCACCAATCTAGGGCAGGGTGGGGAGACAGAAGCTGTTCTGTCCACCTAAGCTCCTCTCAGCCCACCCTTCGTGGCCCCCAGCTCTGTCAGCTGCACCCTGGCAATCGGATAAAACTGGCTTCCCTCCAGGATGGGGACGGAGGGTGGTTGGCTGAGAGGGAGAGGACTACTCCGCTCTGTCTCTTGCGAGGAGTAGGACGTACGCACCTGCGCACTGCAGTAGCGCCTGGTGGTCGTTGGCCGGTCCACTGGTGGGTGAGCCTCCAGGGACTCACCGCTGTCAGCAGCACCTTAGCCAAGATCCTGAAGATCGAAGCCAAGATGGCTCGGACTCAAAAGAACAAAGCCACAGCACATTACCTCGGGNCGGTTAAGGCTAGCTTTGCTAAGCTTGGCAGAGAACTCATTACTCCAAAAGGTGGTTGTGGTGGTGGGCCAGGAGAGGGTTTTGATATGGCCAAGACAGGTGACACTAGAACTGGGTTTGTGGCTTTTCCATTTATGGGGAAGGCAACACTGTTCAGTAAGCTGGCAAGGGTATATTCCGAGATGGCAGCCTATGAGTTCACTACTCTGACATCTGTGCCTGGCATCATCAGATACAAAGGTGCCAAGATCCAACTCCTGGATCTCCCAGGTACCGTAAAGGGTGCCAAGGATGGGAAAGGTAGAGGCCATCAAGTCATTACAGTGCTGCAAACGTATAACTTGATCCTGATTGTTTTGGATGTCCTGAAACCCTTGAGACATAAAAAAGTAATTGAAAATGAGTTGGAAGTCTTCGGCATTTGCTTGAACAGCAAACTCCCTAACACTGGCTTTAAGAAGAAAGATAAGGGAGGGGCTGGCCCCGGAGGCATTTATCTCATGGCCACTTGCCCTCAGAGTGAGGTGGATGCTGAAACCGTGAGGAGCATTCTGACTGAATACAAAATTCATAATGCTGATGTCACTCTGCTTAGCAATGCCACAGCGGATGACTTCACTGATGTGGTAGGAAGAAGCAGAGTTTATATCCCCTGTATCTATGTGTTAAATAAGATTGATGAGATTTCCGTTAAGGAATTGGATATCATTTATAAGGTGCCTCACTGTGTAGCCATCTCTGCCCATCACTGCTGGAATTTTGATGACTTGTTGGAAAAGATCTGGGCCTATCTGAAACTAGTGAGGATTTACATTAGACCCAAAGGCCAGCTGCCAGATCACAGATCCCCAGTGGTGGTGCATTACCCCAGGACCATGGTGGAGGATTTCTGCTTGAAGATTCACAAAAACCTTATCAAAGAGTTTAAATACACTCCAGTCTGGGGGCTTGCTGTGAAACACAATCCTCAAAAAGTGGGTAAAGACCATACGCTGGAGGACGTCATTCAGGTTGTGAAGTGGAACCTTTCCATTTCCCCATCTGCCAGGCCAAGCACAGCAGCTTTCCCGGTGATCACCCTACTCCAATCCCCTTCTGGCTTTGGCAGCCTCTTGATCAAGATTCAGGGGAGGGAGATGGAGACACTCAAAGTGGAACTTCACTTGTATTATCTTGGTGTCATCTTGTATATTGAACTGCATAAAGGACATGACAGGAAAAAAAGAAAAAATAATGACCACATTCGCTTAGTTGCTCTGCGATTCTCCATGACTACACCAACAGTTGGGACTATGAAAATACAGGGCCCACAGCTGATGCTCCATAAGAGAGATCTTGGATACCTGATGCTTCAAGCCCA\n>XM_052662140.1 PREDICTED: Budorcas taxicolor EH domain binding protein 1 like 1 (LOC128068878), transcript variant X12, mRNA 
\nAAACGGCGCGCTCGCCGCTCAGCGCTCCAGCGACCCGACGCGCCCCAGACGACCCCGCCGAGGCGGCCAGATCATCGGCGGGCCCTGCGGCGGCCGCGGCGGAAAGAGCGGCCCCGGATCCCGCGCCTCGGACCCCTCCGCACGGACGGGGCGGGCGGCGCGGATAGGATCCTGGAGGCCATGGGGACCTGGGCCGGGCCAGCGGTCGCGGACTAGCGGGAGTCCCGGGTCTGAGGAGCGGGCGGCGGAGGCGGCGGGGCCATGACCTCAGTGTGGAAGCGCTTGCAGCGCGTGGGCAAGCGGGCCGCCAAATTCCAGTTTGTGGCCTGTTACCACGAGCTGGTGGTGGAGTGCACCAAGAAATGGCAACCGGATAAGCTGGTGGTAGTGTGGACCCGGCGGAACCGACGCATCTGCTCCAAGGCCCATAGCTGGCAGCCGGGCATCCAGAACCCATACCGGGGCACCGTGGTGTGGATGGTACCTGAGAATGTGGACATCTCTGTAACCCTGTACCGGGACCCCCATGTGGATCAGTATGAGGCCAAAGAGTGGACGTTCATCATTGAGAATGAGTCCAAGGGGCAGCGGAAGGTGCTGGCCACGGCCGAGGTGGACCTGGCCCGCCACGCAGGGCCCGTGCCAACCCAGGTCCCGCTGCGGCTGCGGCTGAAGCCCAAGTCAGTGAAGGTGGTACAGGCCGAGCTAAGCCTCACTCTGTCCGGGGTGCTGCTGCGGGAGGGCCGTGCCACGGATGATGACATGCAGAGCCTTGCGAGCCTCATGAGCATGAAACCTAGTGACGTGGGCAACTTGGATGACTTTGCCGAGAGCGACGAGGAGGAGGCCAATGGTCCAGGAGCCCTGGAGGCACGGGCACGTGTCCCCCAGCCAGGCCCAGGCAGTGCCCTGAGGCTGGGGCATTTCCCAGAGACCCCTCGGGAGCTGAAGACACTTTGTGAGGAGGAGGAAGAGGGCCGACTGCGGCCTTGGCAGGCAGCTGCCAGCCCTTCTAGTGCTGAGGATACCAGCCCAGCCCCTGTGAGTGCCCCTGCACCCCCAGCTAGGGCCTCCCGGGGCCAGGGCTCAGAACCAGCTACTGTAGCAGGGGGCCAGGTAGGGCTCAAGGCCCCAAGGCCCCCTGGAACCCTGCCAGAGACAAGGTCCCCAAGACAGCCAGGCCAGGACGTGGCCCCCACTCCAGCCCCTCGGCTCCAGAAAGGCTCTGATGCCCCCTGGCCCCCAGTCCACCAAGGAGAGGATGAGGCCCCCAAAGCCTCCAGGGCTCCCCCAGCAGGAGTGGATTCTGCTGTGGAGACCCAGGCTCGGGCAAGCCCTCAGGAAGGGACAGAGGCCCAGGGAGCTGGGCTGGGCCCAGGCATTGAGAACAGAGACTCCAGCAACTCTTTGGAAGGGCAGAAACCCAAGGTTGAGGAGGGGCCCGCTGGAGACAGGGCAGAGGCTAGTGGGGTGGATACTGGGCATGGGCCAGGAGTCAGAGAGGTGAACAGTCAGAGGTCAGTGGTCAGACCTGGGGAGGTTGAAGAGAGTTTAGAGATCGGTCACGTGGATGCGGAGCAGAGGTCAAAGGTGAAACCTGTGGACACTAAGGGACCAGAGGCCACAGAAGTGACATCTGAGGCAAGATTCAAGGGGACTCCCGAGGCTCCTCCAAGGGGCTCTCAGGGGAGAATAGGGGTCAAGACCAGGGATGAAGCTCCCACAGTCTTGAGCCCAACGCCAGCAGAGCCTGCGGGGCATTCCAGGCATCTTGGTGACCAGGCGGCCAGGGCTGCTGCAGGCCAGGAGAGAGAGTGTGCAGAGGTGAGGGGCAGAGCCCCTGGTGTTGGGGGGACAGGCCTGGAACAGGGGCCCTCTGCTGGAGCACCAAGCGCTGGGCCCCAGGTGAGCTGGTACGAGGGGCCCCCAACAGCAGCTGAACAAGGGGTGATGTCCAGGGATCTGAGGACCTGGGAAGTAGAAACTGGGGATTCGAGG
GTCCTGGGGACAGAGCCTGGGGTGGCAGAGTCAGAGTTATCGGGGACCCAGGAGATCTCAGGGTCCCCAGAGATAGTGTCTGAGGCAGCAGAAGCGAAGACCTTGGGGACCCAGGAGACAGAGGCAGTGAGATCGGGGGTCCTGGAGTCAGAGACTGCTGAGATGGCAGAGTCTGAGGATCTAGGGATCCAGAAAACAGGGACAAGCATTTCAGGGGCCTCAGGGACAGAGGGTGGGACGGCAGAGTGTAAGGCACTGGGGATCCAGGAAACAGAGGCTGGGGGCTCAGGAGTTCTGGGGACAGAGACTGGGGTGTCGGAAACTGAGATGTTAGGGACCCAGGAGATATCTGGGTGCTCAGGGATACAGAGAAAGGAAGCTGAGACAGCAGAGTCTGAAATACTTGGGGCCCAGGACACAGAAGTGGGGTGTTCAGGGGTCTCAGAGATAGAATCCAAGATAACAGGGAGCCAGGAGACAGAGGTAGGGAGTTCAGGGGTCCCAGGGACAGAGACTGAGGTAGCAGAAGCTGAGATACTGGAGATCCAGGAGATTGAAGCTGGGGGTTCAGGGCCCCCAGAGATGGACACTGAGACCCTGAGGACCCGGGAGACAGAGGTGGGGGGCTCAGGGGCCCCACAGATGGACACTGAGACCCTGAGGACCCGGGAGACAGAGGTGGGGGGCTCAGGGGCCCCAGAGATGGACACTGAGACCCTGAGGACCCGGGAGACAGAGGTGGGGGGCTCAGGGGCCCCACAGATGGACACTGAGACCCTGAGGACCCGGGAGACAGAGGTGGGGGGCTCAGGGGCCCCACAGATGGACACTGAGACCCTGAGGACCTGGGAGACAGAGGTGAGGAGCTCAGGGTTCTCAGGGTCAGAGGCTGGAATGGCAGAGGGTGAGGGACTAGGGAATCAACAGACAGAAACTACAGTTTTAGAGGCGGAGAAGGGAAAGGCTCGGACTTCCGGGGTCCAGGAGGCAGAGACTGGACTTGGGGAGACCCTCAAGTATGAGGCTTTAGGGGTCCCAGTCGTAAAGCATGAAGTTTCAGAATCCCAGGGAACAGAGGCAGAAACTACAGTTTCAAGGGGCCAGGAGGCGGAGATTGGGATTTGGGGGGTTTCAGAGGCCAAGTCTGGGGTTTGGGGGGCCAAGGAAGCAGAGGTGGAAGTTTCAGGGGCTTCAGAAAACCCATCTGGTATTTTTGAGGCCCAGGAAGCAGAGGCTGGGGTCTCAGGAGCCGAGAAGGGAAAAGAAGCTGAGGGAAACCTCCCAGAGGCCAGCCTGATGGAGGTGCAGGTGGCCAGTGGGGCAGGGGCTGAGGTGTCCAGGCCCTCCGGGGCCTCTTCCCCAGAGGAGCCTGAAGAGGACAGGAGGCTGCCGGGCAGCCAGGCACCACCTGCCCAGGTCAGCTTCAGCCAGTCCCTGTTGGAGTGGTGCCAGGAAGTCACTGCAGGCTACCGCGGTGTGCGCATCACCAACTTCACCACGTCCTGGCGCAATGGTTTGGCCTTCTGTGCCATCCTGCACCGATTCTACCCAGACAAGATAGACTTTGCCTCCCTTGACCCCCTGAACATCAAACAGAACAACAAGCAGGCCTTCGATGGCTTCGCGGCCCTGGGCGTGTCGCGGCTGCTGGAGCCGGCGGACATGGTGCTGCTGTCGGTGCCCGACAAGCTGATCGTCATGACCTACCTGTGCCAGATCCGCGCCTTCTGCACGGGGCAGGAGCTGCAGCTGGTGCAGCTGGAGGGCGGTGGCGGCGCGGGCACGTACCGCGTGGCCAGCGCCCAGCCGAGCCCCCCCGACGACCTGGACACCGGGGGCCTGGCGCAGCGGCTGCGTGAGCACCGGGCCGAGGCGCCCCAGCAGCCCCAGGAGGCCGCGACCCGCGTGGACGCGGCGGCCCCCGAGGCGGCCTCCAAGGACCGCGGGGCCGCAGCCGCCCAGGAGGCGCGCTCCGCCGAGGCCCCGGCCGACGGTCCCGG
AGCCCGGGCGTCCGTGCCCCCAGCAGAGGGGCTGGTGAACGGGGTGGGGGCGCCGGGCGCCGCGGGCGGCGTGAGGCTGCGGCGGCCGTCGGTTAACGCGGAGGCCGGGCCGGTGCCCCCGCCCCGCGCGCACGGCTCCTTCTCGCACGTGCGCGACGCAGACCTGTTGAAGAAGAGGCGCTCGCGACTCCGGAACAGCAGCTCCTTCTCCGGGGACGAGCCCGACTCCGGAGCGGCGGGAGCGGCGGCGGAAGGCACGAGCCCTGACCCCAGCCCTGCCCCTGGCCTTCCCGCAGCCTCAGCCCCACAGCAGCCCGCTGGTGGGACTCCTCCGGCGGAAGAACCGCCCCCAAGCCCAGGGGAGGATGCTGGGCTGCAACGGTTCCAGGACACAAGTCAGTACGTGTGCGCGGAGCTTCAGGCCTTGGAACAGGAACAGAGGCAGATAGATGGGCGGGCAGCCGAGGTGGAGAAGCAGCTAAGGACCCTCATGGAGTCAGGTACCGACAGGCTGCAGGAGGAGGTACTGATCCAGGAGTGGTTCACTCTGGTCAACAAGAAGAACGCTCTCATCCGGAGGCAGGACCAGCTGCAGCTGCTCATCGAAGAGCAGGACTTGGAGCGGAGATTTGAGCTGCTGAGCCGGGAGCTACGGGCGATGCTGGCCATTGAAGACTGGCTGAAAACGGCTGCGCAGCAGCGCCGAGAGCAACTCCTGCTGGAGGAGCTGGTGTCGCTGGTGAACCAGAGAGACGAGCTGGTCCGGAACCTGGACCAGAAGGAGCGGACCGCCCTGGAGGAGGATGAGCGCCTGGAGCGCGGCCTGGAGCAGCGGCGCCGCAAGCTGAGCCGGCAGCTGAGCCGGCGTGAACGCTGCGTGCTGAGCTGAGGCCACGCGGGCCCAGAAGCCTTCGCCCCTCCCGGTCCGCAGCCTTTCTCGCCGCCGCGCCGGATCGCCGCTTTGGCCCTGCGCTCGGGAGGACCGGACCCTCCCTGGTGCCGCGCGCGACCAGTAGGGGCCGCCGTGACCCTTTACCGGGAAAGGAAGCGCAGCCTTTCGGGCCCCGACGGACGAGGGCGGCTGGCTGGGCGGCCGCGCCGTCCGGGCCGTATTTATTAGTCCGTGTGAGTGAGTGTGCGTGTGTGTTCGTGGTGGACTGAGGGTCCCAACCGTGCCCACCCAGAGCCCGTACCCAATGGCCGGACCCCGCTGGCGAGCTCCAGGGGTGGGAGGGACGGATGGTGAACTGCCGCGCTCAACACCCCGCCCCCTTCCTGTTCCTAGCGAGCAATAAAGTTGGAAAAGGCCACGCCAACGCGCCTGGGCTTTCTCAGGGTGACCCGGGCTTTCAATAGACGGAAGGGGGTGGGGCCTTGGCCGATACGGCGGTCTGCGATCCTCACGGGGACTGTGCAGGAATGGGGAGGTTTTCAGATGCCAGCCGAGGCAGGACCAGAGGCCTGACCTCTGCCTTTAAAGGATGATGGGGTTTGGGTTGTTGATGGCTGTAGGGAAGTCCCGTTTCGAAAGAAGAGACGAGAACA\n>AY338304.1 Uncultured bacterium clone BREC_93 16S ribosomal RNA gene, partial sequence 
\nTGAGCGGCGGACGGGTGAGTAACGCGTGGGTAACCTGCCTCATACAGGGGAATAACAGTTAGAAATGGCTGCTAATGCCGCATAAGCGCACAGGACCGCATGGTCTGGTGTGAAAAACTGAGGTGGTATGAGATGGGCCCGCGTCTGATTAGGTAGTTGGCGGGGTAACGGCCCACCAAGCCGACGATCAGTAGCCGACCTGAGAGGGTGACCGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGAGGAAACTCTGATGCAGCGACGCCGCGTGAAGGAAGAAGTATCTCGGTATGTAAACTTCTATCAGCAGGGAAGAAAATGACGGTACCTGATTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGACGGACGGGCAAGTCTGATGTGAAAGCCCGGGGCTTAACCCCGGGACTGCATTGGAAACTGTCCATCTTGAGTGCCGGAGAGGTAAGCGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTACTGGACGGTAACTGACGTTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAATACTA\n>XM_053628787.1 PREDICTED: Ictalurus furcatus calcium/calmodulin-dependent protein kinase (CaM kinase) II delta 1 (LOC128609903), transcript variant X2, mRNA \nGAAGAGGCGAAAGCGGATCATTTACGTCTGAGCAGCCGCAGGAGCAGATCGACGCTCTCAACTTCACTCAAGCGCGAGCCATCTGCAGAACACAGACACAACACACCTGCGCGAGCGGAGAGCTGACAGACTGGACTTTTTCTTCTCTCCGCAGCATTTAGGCGTTTACTTTCATTCTGTGAAGCACAGCTGAGGAAGCGAGGCATTAGACTTGATTGCTGTTCAGATTTGTCCTGGCTGTCTTTCTCGGCATGGCTGCGACCACCTGTACCAGGTTCACCGACGAATATCAGCTCTATGAAGAACTGGGCAAAGGAGCCTTCTCAGTGGTGAGACGATGTATGAAAATCTCCACTGGACAGGAGTACGCTGCCAAAATTATCAACACCAAGAAGCTGTCTGCCAGGGATCACCAGAAGCTGGAACGTGAAGCTCGCATTTGCCGTCTGCTTAAACACCCCAACATTGTGAGACTCCATGACAGCATATCTGAAGAGGGATTCCACTACCTCGTCTTTGATTTAGTCACAGGAGGGGAGCTGTTTGAAGATATTGTGGCCAGAGAGTATTATAGTGAAGCTGATGCCAGTCATTGCATTCAGCAGATCCTTGAGGCCGTTCTCCACTGCCACCAGATGGGAGTGGTCCATCGCGACCTGAAGCCTGAGAACCTGCTTTTAGCCAGCAAACTTAAGGGAGCTGCAGTGAAACTGGCTGACTTTGGCTTGGCCATTGAAGTGCAGGGAGACCAGCAAGCATGGTTCGGATTTGCTGGCACTCCTGGTTACTTGTCTCCTGAGGTGTTAAGGAAGGAACCCTATGGGAAGCCAGTTGATATGTGGGCTTGTGGTGTGATTCTCTACATCTTGCTGGTGGGCTATCCTCCATTCTGGGATGAGGATCAACATAGACTTTATCAGCAGATTAAGGCTGGTGCCTACGATTTTCCTTCTCCTGAGTGGGACACAGTGACCCCAGAGGCCAAAGATCTGATCAATAAGATGCTGACAATCAACCCTGCCAAACGCATTACTGCTGCAGAGGCCCTCAAACACCCATGGATCTGTCAACGCTCTACAGTGGCCTCTATGATGCACAGACAGGAGACTGTGGAATGCCTGAAGAAGT
TTAACGCCAGGAGAAAGCTAAAGGGAGCAATCCTGACCACGATGCTTGCCACAAAGACCTTCTCAAAAGGGAATCCATATAAGAAGCCTGATAGTGTTAAGATCAACAACAAAGGCAACGTAGTCACCAGCCCTAAAGAGGCAGTCCCCTCTCCTGCTCTGGAGCCTCAAACTACTGTTATCCACAATCCGACTGACGGAAGCAAGGTAGAATCCTCCGAGAGTGCCAACACCACCATCGAAGATGAGGATGTGAAAGCACGGAAGCAGGAGATTATAAAAGTGACCGAGCAGCTGATCGAGGCCATCAACAATGGAGATTTTGAAGCTTATACCAAGATCTGTGACCCTGGACTGACCTCTTTTGAACCTGAGGCTTTGGGGAACCTGGTGGAGGGAACAGACTTCCACAGGTTCTACTTTGAAAACTCTCTCTCAAAGAGCCACAGGCGTACCGTCCACACCATCTTGCTGAATCCTCACGTGCACCTGCTGGGAGAAGACGCTGCCTGCATAGCTTACATCAGACTCACCCAGTACATCGATGCTAACAGCATGCCTCGCACCATGCAGTCAGAGGAGACTCGGGTGTGGCATCGCCGTGACGGCAAGTGGCAGAATATTCATTTCCACCGCTCAGGCTCGCCAACCGTGCCCACCAATTAACGTGGTGTCCTGACCAGCGCAGTTCAGTGTAAAGGACTTAATGTCAGATGGCCACTGAGTGTCTGCTTTATTCAAACCCCACCTTTACAACTTCTCCACCCTGTCAGTCTTGTTTACATATCGTCACTGCTGGACTTTAGCCTACACACAGGTGGGGAATTAATATCATTTTGTATTAGGATGTGTGTATGCGTGCGACTTGCACGCTCTCCTCATAAACCATTGATGTTAAAGACTTATGTATACATATTTTTTTTTTCCCTTTTTATAATTTAATGTTCTATTTTCTATGGTGTGAAAGTAGGGCGTCACACTTGCTGATATATCTTTGGGTGTGTGGGTACATCAGGAAAAGAAATGCTTGATCTCTGTACACAGTCAGATACAAAGTCAAACAGTACATAGACGAATCTGGGCGCACGTGTGACATGTTCATATTAGAGTGATTAGTAATCTAGGCACAATATCCGTCACTGATCTTGAGGATATGATTAGCAGCAAATCAAAGCCAATTCAGTCTTGTTTCAGTGCTTTTCTATTTTAAGTGCAATACAGCTGAAAAAAATTCATTATGAATCTGACAAATGAGCTCGCTTTTGTTTTTTTGGTGAAGTTTTTGTGAAGTTGTGTGAAGTGCTATTCCTGCTTTATCTTTTAGAGAATTGACAGTTGACCGTGATCTTAGTTCTGCGAGCTTTGTTCGGTTTTAGGTTGCTATGGCCTAATGGGTTTAGCAACACTAATGTGCAAAACTGACAAAGGAAGCACATTTAGCCTACAGTTCGCTATTTTATTCTGATGTTTTCCACAGCATCACATGAACACAGTAGAAAAAGTGTAAAAATTTCAATTAAAGAATGTACTTTATCAATCAACACGAATAATTGGTAAACCAAACTATTTTATTTTATTCAGTTGTTGTGAGAGTTTTATGCTTCTGTTTTCATTTTTATATTGTTTACTAACATTTGATGGGGGTATTCTTTGGAAAGAAAAAAAAACGAGTTTTCTCTATTTTTCACACCTTCCTTAATTAATTAGCATTAGCTGTTATGTATTGCATGAAACATCTTTTATCAACTTTTATGTACTTTTATGTACTTCATGTTTATGATCTTGTGATGGTTCCCTTCTCAAGGGTGAAGTAGAATAAATGGTTTATGCTTTGTATTCCATACTGTCCATTTAAACCGAAAAAGAGATGAGTAGTTAGTGCAGTTTGAAAATGATTTATATTTGCAAAAACTATTACGATTATCAATGCAAAATCCAAAAAAAAAAAAAAAAAAGAAAAATAGGAAAATTTGAAATGGGAAACATTTGACAGATTAATAT
AAAAGATGATTTATTTGTAGCACAGTTGATATTTGATTTAAATAAAGCTTGCCTTTGTTTACTCAAACTTTGTTTAAGATCGACTGTAATGCTTCATAACATCAGTTTGTGGAAAGCATTGGGAGGAAACCTGAATTTGGGACTGATTATTAATCAGTCTGATTATTAATGATTGTTTAATTTGGATTCAGTGTCTGAAATGCTATCAGCGGTTTGAGACTTAAAGATTATCAGTTGTTATCTAGTTCCATTTTATTTGCTTTGCATTTAAAATTTTTTGTTATTTTTGTTACTTTTTTTTTATTCTAGTCCAGTTCCCTTTGTACTTTTTATTGCTGTAACTAGATGAAAATCCCCAATCCCACAAACCTGTACACTAAACAGAAGTACAAATACTCGAGCAGTTAAAAAGGACACGATAAAGCAAATAAATAAACTGTGAAAACATCCTCTTTTTTTCTCGGTTAATACATATTCATTTTGAGATTAAGAAAATTAAGGAATTTAAATAGTTTGTATATGTGGATACAGAGAACAACATATTACTGTGCACAGAAAAACATATTACCAACCCAATGCATGAATAAAATATTTCTGCCTATTTTTTGTTGTTGTTGTTGTTGTTGTTGTTGTTGTTGTTAATCTTAAATTGGGTTTAAAAGTTAAGTTTAATGGAAAACTATTAGCCATTTTGTGGTTTCTGTACATAAAAAAGGTTGGGGTTTTTTCCTCCTTTGTTTTTTTGTAAAAACTTTTTACAAAGAAAGTGTCCCATGTTAAATAAAAAAGCCCCAGGCACCAGCA\n>XR_003317481.3 PREDICTED: Ursus arctos uncharacterized LOC113259124 (LOC113259124), transcript variant X3, ncRNA \nGGGCCATCTGCAGAGCCCTCTATTGGACGAGCCATGCTGAGGGATCCCTCTGGGAACCAACCAAAGGCGTCAATCTGGAGCCGAAGAGGCGTTATCGCCCGGCGGACCAGTTTTGGAGGTCAAAGCTCCGCGGGGCGCAGCTAGTGGCGGAGCGAGCTGTGAAGGGAGGGTCTTCCACTTGTCGCCAGCGTGAACTCTGGTGCCCCGTGAGTGTTCGGAATGAACCCCCAACTCCGGACCCTCAAATCCGCCCACGCCCAGGCGTGCTTGTCTCTGCTTCGACTTTGTCATGTAACACTTTCTCCTTTTTTCCCCTGGGATCCTTTTGGTCCCTCCCCGTCTCTTCGCGCTCGGAAAGCCGAATTTCGCTGATGCTCTCAGCTTAGAGGAAAAAATTTTGTGCGGAATTCAGTCCTTCCTTCTGTTAGGCAGCAGTCGTTGGATGGGAGGGACTAAAAATCACTTGGTGCCCTGACAAGATTTGTTACTGTTGCTAAAATCGTCAACTCTAATGCTTTAAGGGAGATAACTTCCTGCAAATCCAGAACTTTCGGATTACTTCCGAGCTTAAAGAGCACGCCACATGAAGATGAAGGCAGAGATTGGGTTGATGCTTCTCCAAGCCAAGGAAGTCCAAGATGGCCAGCATACTCTCAGAAGCTATGGGAAAAGCCTGAAACAGATCTTTCCCTCACAGCCATCAGAAGAAACCATTCATGCTGATACCACGATCATGGATTCTAGGCTCCAAAACTGAGCTGCTTACAGAGTGTTATTAAATATGTGGATACATTTCGGGCACCTGACTGGCTGTTGGAATAGCATGAGACTCTTGATCTTGGGGTCATGAATTCAAGCCCCACACCAGAGGGAAAATACAGACGTCCATTAACTTCAATCCCTGGAGTCAGAATTCAACTTGAGACATATGGATGGGAGCTATGCTCCATTTGTGGGATGGGAAGAAACCAGTTCCCCTTTTCTAGCCTCACATCTGTTTGGATTGTATCTTAGTAGGCAATAATGAGAAGGCTGCCTAGGGCTGACTCAACCATAAATATTAGAATTAGGAGAAGTA
TTAGAATTGCGAAGCCATGTTTTTTTGTGAATGGTGCTCCCTATTCTTTGATTAAGAGCTTAAACCTCATTCACACTCATGACTTACAGGCTGAGCCAGCAGGAAGGTGGACACTAACTCTAATCTCCTAGGAATGAGGAATGAAAAACCAAGACAAGCAGACACTGTAAAATTGTTTTTGTTTTTTTAATGCAGGTCAAATATCCTGAAACATACATGTATTTTGATAGTCTTCTAATGCCACTTTAGTTCAAATATTAAAGTAACACACACGAGCTAAGAGAATTCAATATTGTTCCAAGGCACTTACTGAATCTCCATGACTAGATGAAAACAAGGACAATTAAGATGAACAATTAGTATATAATATAAAAATAACTTTTTGCTTACAATTTACAAAATGTATTATTATTACAATCTTTGATCTCTGATAACCTGCAATGCTGGCTGCATGAATCCAGCAATTTTAAAATTCAGAAACTATTTTCTAAAACTTCAGGGCAAATAATTTACAAATAAGGTACACAAAGATTTAGACCATGCAGAAATTTCTTACATCTTCTGTTAATAATATTTTATGACTGCAACTTTATCAAATTATATACCTACTTGCCCTGTACATATACAAAATAATGCATACATGATAAAACATTAGCAAAAGAGTAGTCCTTAAATTCAATTTATCATAAAAGTATTACTATATTAACATGTCTACAAGCAGCGTGTAACAGGTTAAGAGACATTAAGGCAATAATACTTGAAGTTACAAAATAAACCAATGTAATACTTTCCTAAGTGTAGTATAAGGCAGGTAGATGGTCCAAGCAAAAAAATACTAAGGTAACAATCTACACTGCTGTTAGTCCCACATTTTTAAGATGGAATACTATAAATCTGGCTTTCAGTGGCACTTGAATTTTCCAGTATAATTTAAAGTGTCTTTTAGCTCCCTGAATCATGTCCATTCTGAAGGTGGATCTCTTGGTCCTTTGGGTTTTCCACAGCGATTACGAAAACCTGTAATCAAAAGACCAGAGTAATTGGTCAGTGTTCAGAAATGTATTTTAATGTACTAGAAACTCTTAATTTGCTTTGGGTAGTTCATTTAAGAACCTAAATAAATCAGCACAAAGTATGGTAAACTCTGCCTTCAGGAAAGCCTGAAATGATGGCAAATAACCGTTTCTCATTCTTGCCAGCACTAACTACATAACTAAAGTTTTAAAATTATTTAGTAAACAAATTACCAATATCTGTGGCCTCTGTTGGACTTTCTGATATTTGATCTTTCTTGTTACTGAAAAGAGGCGGACATTCTGTACAAGTCTCTGTGTGAATACCTCCTGCTGGATGATCTAAAATGCAAAATAAAGCCATTGTTAACCACC\n>XM_011504069.1 PREDICTED: Ceratosolen solmsi marchali transmembrane protease serine 3-like (LOC105365808), mRNA \nTTTTCAATTTAAATTTTTGCTCTTCAGATACTATGAAAATTATTTTCAAAACATTAATTGCACTTCTACTGGTGCAAGTCAGTTATGTAAATTCGTGGGATCATCTCAGGCACGCCAGTCCTGGTCAGTTTCCACATCAAGCAGTATTGGTATGGATCGGAGCATTACCATTTCCTCCATTTCACTTATGTGGTGGTGCAATCTTGAACGAATTCTGGATTTTAAGTTCAGCGTACTGCGTTGTTGATATATTACATTTAAATAACGTACGTATCAAGGTTGGTAGTCACAATATTTCTTTAGATGACGAGCACGTACGAAACGTTGAGGTGGCAAAGATTATCGTTCATGAAAAATATACTAGGTGA\n>XM_048344465.1 PREDICTED: Perognathus longimembris pacificus LRR binding FLII interacting protein 1 (Lrrfip1), transcript 
variant X23, mRNA \nGACGGCCCCGCGGCGGCGGCGGCGGACGGCGGCGGACATGGGCACCCAGGGCTCGGGGCGCAGGCGGCTCCCCAACCGGGAGCGGCTCACGGCCGAGGACGACGCGCTCAATCAGATCGCGCGCGAGGCGGAGGCCAGGCTCGCAGCGAAGCGTGCGGCGCGGGCGGAGGCGCGGGAGATCCGCATGAGGGAGCTGGAGCGGCAGCAGAAGGAGGTTGAAGAGAGACCAGAAAAGGATTTTACGGAGAAGGGGTCTCGCAACATGCCGGGCTTGTCTGCGGCCACGCTGGCCTCGCTGGGCGGGACTTCCTCCCGGAGGGGAAGCGGAGACACCTCCATCTCCATGGACACCGAGGCTTCTATTAGGGAGATTAAGGACTCCCTAGCAGAAGTGGAAGAGAAGTATAAGAAGGCCATGGTGTCCAACGCCCAGCTAGACAACGAGAAGACCAACTTCATGTACCAGGTGGACACGCTGAAAGACACGCTGCTGGAGCTCGAGGAGCAGCTGGCCGAGTCCCAGCGGCTCTACGAGGAGAAAAGCAAGGAGTTGGAGCGGGAGAAGCACGCGCACAGTGTCCTGCAGTTCCAGTTCGCCGAGGTGAAGGAGGCGCTGAGGCAGAGGGAGGACATGCTGGAGAAACACGGAATAATCCTAAATTCAGAAACAGCTACCAATGGAGAGACTTCGGACACACTAAATAACGTCGGATACCAAGGCCCGACTAAGATGACAAAAGAAGAGTTAAACGCCCTCCAGTCAGCCGGCGACGGGACACTGGATATTAGGTTGAAAAAGCTCGTGGATGAGAGAGAGTACTTATTGGAACAGATTAAGAAACTCAAAGCGCAGCTGGAGGGGAAACAGAAGAACAACAAGCTAGACAATCTGCGATCTGAAGATGAGGTCTTGGAAAACGGGACAGATGTGCACGTCATGGATCTACAAAGGGATGCCAACAGACAGATCAGCGACCTCAAATTTAAACTTGCAAAGTCAGAGCAAGAGATAACTGCATTAGAACAAAACGTAATAAGGTTAGAGAGCCAGGTATCGCGTTATAAGACAGCTGCTGAAAGTGCAGAAAAAATAGAAGACGAACTTAAGGCAGAAAAGCGGAAACTCCAAAGAGAGCTTCGCTCCGCATTGGATAAAACGGAAGAGCTTGAGGTGAGCAATGGCCACCTAGTGAAGCGTCTGGAAAAGATGAAAGCGAACAGGAGTGCACTTTTGTCCCAGCAGTAAGCACCAGCCTGCGGGGCAGCTGCGCGTGTGTGTGTGGCCCCTGGGCTTTTCCCTGTCCTATGAGAGCGCCGCTTCCCCTATGCCTCCGCAATGCCTCCGCGGAACGCTAGGGGGAGCCCCTGGCCCTTCCCACCCGGGCCACATCCACTCCAGAGAAGCCCGCAGCCGCCGGGGCGGCCTGGTCTGCAGCCGCCTTCTCCAGGCTGGGCCGGCTCTCAGAACCTCCAGGTTTCTTTGTAAGCACACTGGGCCTCGTGGAAGCTCGGCGTCTCCGTGGCACAGCTCGGGCCGACCGAGGCCAAGATGAACGTGGAACATGAGTTGTCTTTTCATGTGTCTTGCTGAAGGTTAAGGGGAAATGTTACCGTGTGGGGACTCCTCCAGGGCAGAACTACAATTTGAGTGACTTCCGTAGTATCTCTTAGTCTATGCTTTTCATACACGAAACACTGTGGAACCACAAGCCATTACCAAGCGAAACTCTCACTGCGAACAAGAGGATGGTCTAGGCGTAAAAGTGACCTTAAGAAAACTCTTTACAGGCAACAAATGAAGCTTTTCTAAGGGATTTTTTGCATCTGTTCAGTCATGAGAATACTTTTTTCCAGGGTAATTAGGCAATAGCTTCTCTGAAAAATGACAGCTTTTCATTTGCATTATATTTGGAATTGAAGTTGTTAACTTCTTTTAAAGAATGTACTATTAGGAAAATAAAATATGAAATGTTAAAAGAC
TTGAGCAATGTGGTTTTTATTTTTTTC\n>XM_005356914.2 PREDICTED: Microtus ochrogaster leucine rich repeat containing 71 (Lrrc71), transcript variant X2, mRNA \nCAGTTGCTGGCCAACTGGGTCTGGTGAGTGGCGATCCTCAGGGCGAGGCCCACAGAGTCCTGTCTCATCTTGCCTCTCACTCAAGGAGTCCAGAGCCACCAGAATGTCAAATGAGCCGAGTGCCACGGGGACCTCACCTAGGACACCTCGTCCTGGGGCCCAAAAGTCATCCGGTGCGGTAACCAAGAAGGGGGAGCGGGCTGCTAAGGAGAAGCCAGCAACTGCCCTGCCTCCAGTGGGTGAGGAGGAGCCAAAAAATCCCGAGGAATACCAGTGCTCGGGGATCCTGGAGACAGACTTCGCAGAGCTCTGCGCACGGTCAGGCTACACGGACTTTCCCAAAGTCGTCACCCGGCCACGGCCCCATCAGAACTTTGTCCCTTCTGCCTCCATGTCAGAAAAACCCACCCAAGACGACCAGCGGCTGTCGGCATCCTGTAGCCAGAACAGCCTGGAGAGCAAATACGTGTTCTTTCGGCCCACCATTCAGGTGGAGATGGAGCCAGAGGACAGCAAGGCAGTGAAAGAGATCTACATCCGAGGTTGGAAAGTTGAGGATCGGATTCTGGGTATCCTCTCCAAATGTCTACCCTCCCTCAGCCAGCTGCAAGCCATCAACTTGTGGAAGGTGGGGCTGACGGATAAGACCCTGACCACGTTCATCGCCCTTTTGCCTCTCTGTTCCTCCACACTCAGGAAGGTATCTCTGGAAGGGAACCCACTGCCGGAGCAGTCCTATTACAAGCTCATGGGACTGGACAGCACGATCGCTCACTTGTCTCTGAGGAACAACAACATCGATGACCATGGGGCGCAGCTCCTAGGCCAGGCACTGTCCACACTGCACAACAGCAACAGGACCCTTGTTTCACTGAATCTGGGATTCAACCACATTGGAGATGAGGGCGCAGGCTACATTGCGGATGGCCTGAGGCTGAATCGCTCTCTCCTCTGGTTGTCCCTGGCACACAATCGTATTCAAGACAAAGGAGCACTGAAGCTGGCCGAGGTCCTGCGCCCCTTTGAGCTGACCCACAGGGAGGTGGTGGAGAGGAGGCGCCTGCTGCTGGAGAAAGGATCGCAGGAGCGGTCACGATCGCCTTCCTCCTCCCGACATGGGGACTCCAAAACAGAGCGTGAGAAGTCTCAGACAATGGGGATCAGCAGTGTTGCTTTGGCAGACAAGCCAGAAAAGATGCAGACAGTGAAAACACCCAAGGGCCTGGGCAAGAAAAAGGAGAAGTCAGGGGAAGTTGTAAAGAAGGAGGAGAAGTCAGGCTCCGGGCAGTCACCCACACAAGGAACCCCTAAGAAAGAAGATGCCACAAAGGCAGGCAAGGGGAAGGTCACCATCCCCGAGCAGAAGATGAGCAAGGGAAAAGGGCCCAAGACGGGGAGCAAAGAGAAGCGCAGCATCCTCCTGGAGTCTGAGCTGGTTGTCGAAGCTACAGAGATGGTCAACCCTCTCCTGGAGCCTGTGGAGCACCGAGATGGGAAAGTTTTCATGCCTGGGAACAAGGTCCTTTTGCACCTCAACCTCCTCCGAAACCGAATTACAGAAGTGGGGTTGGAAGGTTTCCTTACTGCCGTGCAATACCAGGTTCAGGTCTCCAAGCCCAAGAGTTCATCCAAGGGTCCCTTGGGGCTGCTGTGGCTATCCCTGGCGAAAAACTGCTTTGACCCACAGTGTCCAACATACACCATGATTCAGGAACTGATGCTGCCAAGGGACCCTGTGAAGGCCAAGGTCAGGGAGGAGGAGGCCACAGCTACCTAGGCTTCCCATGGGAGACACCTTGGACCATTATCAGCCTATTGCTGTGCTATTCTTTGAAAATCACTTCAGAAC
TGTTGGGAACATTTGGGCTCCTGAGTCTGTTCATATTGCCTGGTTAGGCATGGCAGAGTGGTGGCCTGAATCACACGGTATCTGTTGGGGGGATGAACTGAGCTCCTGGCTCCACCTCCCGAGTGCCCCAGCAGCATCCCCCAGCCCCTCTCTGCCAGCATGCACACAGCTGATGATGGAACTAGGACCCATCCCCCAGCATCCTTGCTGCTTATCTCCAACCCATGTGTTTGCCTGGCTTGTGAGACAAATGCACTCTGGAGAGGGTACTGTAGCCATATTTGCATAGCAAAGGCCAAACATTAGACATGGCAGGTGAGCAACCTGAAATCATGGACATCCAGAGTTGGGACTGCCAGGCTGCCTCTAAATTCTGGAGAGCCCATGCTAACCTACAGGGAATCTCCAACCTCTTTCATCTCTTGGCCCTCCGCACTGGCTGCTGAGTGGCTCCAGGGACATCTTTCTCCATTGCTCTGAGTCC\n>XM_030788246.1 PREDICTED: Chanos chanos meiotic nuclear divisions 1 (mnd1), mRNA \nATGGGCGGACAGTCTAAGAAGAAAGGATTGAGTTTGGAGGAGAAGAGGAGTCGCATGATGGAGATATTTTTTGAGACTAAGGACGTGTTTCAGCTGAAGGACATTGAGAAAATTGCCCCCAAAGCCAAAGGGATCACGCCCATGTCGGTGAAGGACGTCCTCCAGAGTCTAGTGGACGACAACATGGTGGACTCAGAAAGAGTGGGAACCTCCAACTATTACTGGGCATTTCCCAGTAAAGCTCTCCATGCCCGTAAACGCAGACTGGAAGAACTGGAGAAGCAGCATTTGGAAGGGAAGCAGAAGAAAGCCAGTCTACAGCAGGCCGTGGACAAAGCCAAAGTGGGACGCCAAGAAACGGAGGAGAGGAGTGCTCTGAGGCAGGAGTTGCAGACCCTGAGGGAGCAGCGGGACCAGCTCAGGGAGGAGGTGGAGAAATACAGGGAGTGTGACCCTGAGGTGGTGGAGGAGATCCGCAGAGCCAATGTGACTGCCAAGGAGGCTGTCTCACGGTGGACAGACAACGTCTTTGCCATCAAGTCTTGGGCCAAGAGAAAGTTTGGATTTGAGGACGCACGGCTGGACAAGGCCTTCGGAATACCGGAGGACTTTGACTACATGGACTGA\n>XM_051990939.1 PREDICTED: Antechinus flavipes zinc finger protein 665-like (LOC127557627), mRNA 
\nATGAAGTACTACCCACCTGCCCCTCCCATCGCCTTGCCCACCAGACGCCCCTTCCCTCTCCGAGAACACCCGCCCTCTCCGAAAACACCCGCCCTCCCTGGGCACACCCGCCTTCTCCGCATCCCCCTCTTAGGCGCCATCATGCTTGCAGTAACCAACGACACAAGAGTCAGCCGCTGGGAGAGGGCAATCATATGCCCACCCACCTCCCCCGGCACGCTCACCCTCCTCTGCTCTCCTGGTCTCCTGCAGCTTTTCTCCCCCTCTTCTGGCGAACCCGTCTCTTCTGTTGCCCTTGGTTACGACCCTGGTGCCCACACACTGCCCCTCACCCACATTCCCCCTCCGCGCCATACCTGGGCAGCCCCTCGACCAAGCAGCGAAGGAGTCGAGCTCCACGCCCGCTCGCTGTCCGTGTCTCTGGGATCAGGGGCTGCGAAAGCTTCCGGTCTAGCCAAGGAGGACAACATAGGGGGAGATAGGTACAAGGAGTGCGGTGACACTTATGGACTCTGGAAGGGCAAGGTGGCCCGCCTGAGCAGTGGGGATGATCAGGGGGACATGAGGGAAGGTGAAGTTGTGGAGGGCACAGGGCAGTGGAGCAGGAGAGTTCCTCGTGACCAACTAGTGAGGCCCCGCCTTTGCAAGCGCAGCCCTGGCCACCTCCTGGAAGAATCCTTTGTGGCTCGCAGTGGGATCGCATCTCTGGCTGGCCCAGCCCGGGGCCCAGCCAAGAGCGAGCCTACGTCCTGCCTCGCCTCCCTTCCCGTAGCCCCAGGGGCCGCCCGCCTCCCCCAGCCCACTCCTCTGTCTTCCTCCTCTCTGCTCTCCAGTTTAGCCTTTAGGATGTCCAAGCCTGGCCCAAGAGAGAAGCTTGGAGCCAAGGGAATGGCCCCTGAGACTCAGAGGACTCCATCCCAGAAATGTGTGACATTCAAGGATGTTGCTGTGTTCTTCAGCCGGGAGGAATGGTGCTCCCTGAACTCTTCACAGCAGAAGCTGTACAAGGAGGTCATGCTGGAGATCTCTCAGAACCTGCTCTCTCTGGATGGAAAGAATAGACCTAAAACCCAGAAGTCTACTCCAAAGCTGAATAGTTCCTGTGACTTTCATTTGAGAAAAATCAAGGGTAGTGAAAATAACTCAGAGAAGAAGCAAGGCAACTTGAAGAGTCATTCCAAAAAATTAAATATTATCATCAGGAAAACTCCTCAAGAAAAAAAAGATGATGACCATAATAAGTCTGAGAGTAGTTTTACTCCACAGTCGACCAATGAGGGTAATCAACTTGAGGGGAAGCCAGATCTTACTAAAGATCAGAAAAATCCAAGTGTCAAAAAGCCTTACAAATGTAATGAATGTGGGAAGACTTTCAGTCGAATCTCATACTTTAATGGACACAAGAGGATTCATAATCCAGATAGATTTTACGTTTGTAATCATTGTGGGAAAAAGTTCTCAAGACCCTACAAACTTGCCGTACACCAAAGGGTACATACTGGAGAGAAGCCTTATAAGTGTAACAAATGTGGGAAGTCCTTCTCCCAGACCTCATCCCTTACTCTGCATCAGAAGATTCATAGTGGGGAGAAGCCTCATAAATGTAACGAATGTGGGAATACCTTCAGCCAGCGCTCAACACTCACTGCACATCAGAAAAGACATACTGGAGAGAAGCCCTATGAGTGTGGTCAGTGTGGGAAGGCTTTCAGCCGGAGCTCGAGTCTTAGTGTCCATAAAAGGAGCCACACCGGGGAGAAGCCCTATGAATGTACCGAGTGTGGAAAGGCCTTCAGCCAAACCTCATCCCTTATTGTGCACAAGAAGATTCATACTGGAGAGAAGCCCTATAAATGCAACGAATGTCAGATGGCCTTCAGGGAAAGCTCAGCCCTTCATGTACACAAGAGGTTACATACTGGCGAGAAGCCCTATCAGTGTAATTACTGTGGAAAAGCCTTCAGTCAATCCTGCAGCCTTGCTGTACATAAGAGAATA
CACACAGGAGAAAAGCCTTATAAATGCAATGAGTGTGGGAAGGCCTTCTGTGAGAGCTCATCTCTCAGTACACATCGGAAAATTCACACCGGAGAAAAACCCTACAAATGCAAGGAATGTGGGAAGTCTTATTGCCAAAGCTCGACGCTCAGTGCTCATCAGAAGACTCACACCGGGGAGAAATCTCACAAATGTCATCAGTGTACAAAAACTTTTGTAAAGCCCTCCCAACTTGTAGCCCATCAGAGAATTCATACTGGAGAGAGACCCTATAAATGTGACGAGTGTGGCAAGACCTTCGGCCACACTAAAACCCTTCATGCCCACCGGAAGATTCATGCTGAGGAAAAACTTTATAAATGTGATCAGTGTGAAAAGTCCTTCCAGTGCAGTTCCTACCTGGCTGTGCACAAGAAGATTCATACTGGGGAGAAACCTCATCAGTGCAACGAGTGTGGAAAAACTTTTAGACAAAACATATCTCTTATAGTACATCAGAGGATTCATACTGGAGAGAAACCCTATAAATGTAATCAGTGTGAAAAGTCCTTTCACGGCAGCTCGTATCTGGCTATCCACAAGAAGATTCATACTGGAGAGAGACCTCACTCGTGTAATCAGTGTGGAAAGGCTTTCAGAACCCACTTGAACCTCGTTGTGCACCAGAGGATTCATACTGGAGAGAAACCTTATCAGTGTAATGAATGTGGGAAGTTCTTCACCCAGAGCTCCAATCTTGCCGTACATCAGAAAAGCCACACTGGAACCAAATCTTCTAAATCTAATTAACGTATGAATCACGGACTTGATGACACAGAAAATTCATGTGAATGTAATTTTTTTCTCCTCTTCTATCAGTGAAGAAAGGAGGAAAAAGCAGATGGGACTTTATATTTCCTGTAATTTTATGTAAAGATATATAGGAAGGGACAAGGGGAGAGAGCACAAGATGATCTGTACTTTTAACAGGACAAAGGAGGGTTGAACACATGCACACACACACAACTTTATCGTAGGAATAAATCAGACTCAAATCAATAAGCAGGGATGAGGAGTAGGGTTAATGTGGAGAATAATGGGGAGGGAATTATCAAAAGCACAATGAATGTTCACTTGAGGGAAGTGAACACTGAAGGGGATATTAAAAGTTAAAAAAGAAATCAAAGAAATGATACAAAGAGGACCCCATTATTTGGATAATGAGTAGGTAATGCAGTGGAGACAGTGTGAAGTCTGGAGCTGGAAAGATCTGAGTTAAAAAATGGCCTTAGATACTTAATAGCTGGATTACTCAGAGCAAATCACTGAATTACTTACCATCTGCCTCTATTTCCTCATATGTAAAATGGGATTAATAATAACACCTCTTTTTCAGGGTCGTTTTGAAGATCAAATGAGTTAATATTTGAAGTGATTTCTAGATCTTAAAGTATTTTATAAATGCTAGCTCTTAAGAATATCTGATAGGATAGTATTGTATCATAAGAACTGATGACAAGGACAGGTTCAGAGAAACTTGGGAAAACTTGTAACTGAGGCAGAGTAGTGAGCAGTACCAGGAAAACAATTTATGCAATAGCAGTATTATTTTTTTAAAATTTTAATAGCTTTTTATTTACAAGTTATATTCATGGCTAATTTTACAGCATCGACAATTGCCAACCTTTTGTTCCAATTTTTCCCTTCCTTCCCCCACCCCTTCCCCTAGATGATAGGATGACCAATACATGTTAAATATATTAAAGTATAAATTAAATACAAAATAAGTA\n>XR_004154822.1 PREDICTED: Punica granatum luc7-like protein 3 (LOC116196428), transcript variant X3, misc_RNA 
\nCAGTAAGTACAGTTGATCGCCCCTCCACCTCCACCGTCGTCAAAGGGATTTCTTGCTTCCCCCTCCCACTCCGAACCCTAGAAAGTAGAGGAGCTCTTCCCCTCACCCACCATCGCAGCTTCCTGCTATTCCATTTGAGGGAAAAACCTATTGTTCCCAGCTGAATTATCCATCTGTTCCGAGCTCTTACACTACGCGATAGCGAAATCTTATCCATAAGCCATGGACGCGCAGCGAGCTTTGTTGGACGAGCTCATGGGCTCAGCTCGTAACTTGACGGAGGAAGAGAAGAGGGGATACAAGGAAATCAGATGGGACGATAAGGAGGTCTGTGCATTCTATATGGTCCGGTTTTGCCCTCACGATCTCTTCATCAATACTCGAAGCGACCTCGGTCCGTGCCCAAGAATCCATGATTTGAAGCTGAAAGAAAGTTTTGAGAACTCTCCAAAGCATGACGCCTATGTGCCAAAATTTGAAGCTGAACTCGCGCAGTTCTGTGAGAAACTGGTGATGGACTTGGATAGAAGAGTTAGGCGCGGGCGGGAGCGTCTTGCGCAAGATGCTGAACCTGTGCCACCTCCTCCTCTTTCTGCTGAAAAATCTGAACAACTATCAGTGCTCGAGGAGAAAATCAAAAACCTGCTGGAGCAGGTGGAAGCCCTTGGTGAATCTGGAAAAGTAGATGAAGCTGAAGCACTCATGAGAAAGGTGGAGATGCTTAATACTGAAAAGACTGCTTTGACACAACCTACCCAAAATGAGAAGGTTCTGATGCTTACACAGGAGAAGAAGATGGCTCTTTGTGAGATATGTGGCTCGTTTCTGGTGGCTAATGATGCAGCAGAGCGGGTTCAGTCTCATATCACAGGGAAGCAGCATGTAGGTTATGGCATGGTTAGGGATTTCATAGCAGAGTACAAGGAAGCTAAGGAGAAGAGAAGGGAGGAGGAAAGACAAGCAAGGGAAAAAGAAGCTGAGGAGCGGAGGAAGCAGAGAGACAAGGAACATGATAATCAGAGAAGAAGTGAATCAAGAGACAAGGATAGATCCCATGATAAGGAGACAGACAGGGACAGGGAGCGAGACCGCTACCGGGAACATGATCGCTACCGTGAAAGGTCACGAGATCTCAATGGTAGAAGTGGTCGGGATGGAGGGAGGGGGATGGATTGGAGATCTAGGAATGGAAGAGATGGAGGCAGGGACAGGTACCGGGACAGGAGCAGGTCTCGATCCCCTGGTAGACATGGATACTGAAGGTCATCACAAAGTCCAGTTCACTAATATTATGGATCTTGTAGACAGATGAAGATCTGGACTTGTTGAGATTTCTTGAAAATATGTGATCTTCAAGGGTTGAGGTAGGTATTACCTTGGCGCTAGTCTGTTAATTTTACTATGCGGGTTTGGATTTTGTTTTTGGACCAGATTCATTGTCTCTGAAAGGCCCCTTTCAGAGTCTTAGCCTTTGCCTGAGCATGAATCTCAGCTGCTCTGATGTCCCAAGCATATTAGAGTTAATATTCTTGGAAGAAACATGCCTGGGCTTCAAGGAGATGCATTTGGAGTTGGGTTTTATGATGATCATTCTTAAGGCAAAAGACAGAGCACTGCCCTTATTCACGTTCAGTGTCTGGGGATCTGGTTATTGGGCTGGTTTAGCATGGATGAGAAAGAGTGATATATTTTGCTGGCTTTTTGCTGTCGGCTTAGAAACAGAACTTTATTTAGCTGATGTGCCATTCCATGATCAAGAAAAGTGGTAGCATTTCCACTAATGTCAAGGTATAAACTCGTGTCTCTATTACGCAGTGTTTTCAACTATGCAGGAAGAGAATGGTATCGTGGTGTATTATAGACTCGTAGATGGTGGAAGGGGAGTGAGGAGTAGTTCTTGCTGGGCGTTGGCAGACTTAATTTACTCTTCGGTTCCTAGCTGTCTGTAATGAATGAAACTGTAGGAGGGTGATTAAATCTAGAAAAGTCTCCATTTAT
GGTGGTGGCTTTTACAATCTGTTCTGCCCATTGGCTTGAGACTTGTTCGGTTGTTCCTGAACTTTCTAATGATTGTACTTGTGGTGTGAATGGTCCAACAAGCAGGCAATTCTGGACATTATACACTTTACCGGCTTTGAAGGGTATTCCGAACTCAA\n>KX758048.1 Babesia microti Trx1 mRNA, complete cds \nAAAAAGTATTGACAATGGTGAAAGAAGTACAAACTACTGCTGAATTCAAGACTCTAATTTCTGAAAATGCCATCGTTGTTGTGGATTTTTACGCAACATGGTGTGGACCTTGCATGAGTTTTGCCCCCAAATTTGAAGCCCTTAGTGCTGAGTTCCCCAACATCTTATTCATAAAAGTGAATGTGGATCAAAATTCGGAACTACAAGCACTATATTCCATCACTAGTATTCCGTCATTCAAAATTTTCAAAGACGGGGCTGTTGTAGATTCGTGCACTGGAGCTAATGATGCGATTTTGAGGAGCACTATCAAGAAGCACGTCTAGCAGTTATATGCAATGGGGACTAATACCTCTGGGTATCACCTAGCCCTGGGACTTCTGGGTTTGTCCATAATTTTATTCAATTTAAAAAAAAAAAAAAAAAAAAAAA\n>XM_027775713.1 PREDICTED: Tupaia chinensis melanoma-associated antigen B4 (LOC102498282), mRNA \nCGTTGGGGGTGAGGTGTCTGTGGAGGAGGTGCAGCCTCAGGCCGTTGCCGGAGGCGTCTGATCCGTGTCTTATCAGTTCTGAAGACTGTACACAAGTGGAGCCGAATAAGGACAAGCTGAATTGTTCTGCTTGGCTTTTAGGTGCCTGCCTTGTCAGCCCTCCAGCTGTCCCTGGAAAGACACCATGCCTCGCGGTCAGAAGAGTAAGATCCGTGCCCGGGAGAAACGCCAACAGGCCCGTGGCATGACCCAGAGCCCCAGGGTCCCTCAGATCACCGCAGAAGGGGAAGAAGAGTCTTCCCCGTCCGCCTCTCCTGCCTGTGGAGGACGCAGCTCTCCTTGCAGCTCTCCTGCTGCCTGCTCTCCCCCAGAGTCTCAGGGAGACCCACCCACTAGCTCCCCTGATGCAGGTGCCTCAGGCACAAAATCTGATGTAGGGGCCCAGAGCCTGGAGGAGGCAAGTCCAATAACCTCTCAGGCAGCANTTTGCTGCCCTATGGTCATGCAGAATAAGCAGCACTTCCCTGAGATTTTGAGGAGAGCCTCAGAGCGCATGGAGCTGATCTTTGGCCTAGAGTTGAAGGAAGTTGACCCTGTCAGTCACTCCTATGCTCTTGTGAGCAAGCTAGGCCTCTCCAACGAGGGAAGCGTGAGTGGTGACAAGGGGCTACCCAAGACCGGTCTCCTGATGACGCTCCTGGGTGTGATTTTCATGAGGGGTAATCGTGCCACTGAGGAGGAGATGTGGGAATTCCTGAATATGTTGGGCTTATATGCTGGGAGGAGCCACTTAATATTTGGGGAACCCCACAAGCTCATCACCGAAGATTTAGTGCGGGAAAAGTACCTGGTGTACCAGCAGGTGCCCAACAGTGACCCTCCATGCCATGTGTTCCTGTGGGGTCCCCGGGCCTATGCTGAAACCAGTAAGATGAAAGTCCTGGAGGTTTTGGCTAAGATCAGTGACACAGTCCCTAGTTCCTTCCCTTATCTGTATGAAGAGGCTCTGAGAGAGGAGGCAGTGAGGGCAGGAGGGAGATTTGCAGGCAGGATTGGCACTGTGGTCCAGGTCAGGCCAGGTCCTAGGGCCATGTCCCACTGCTCTACCCACATCTAG\n>XM_046141267.1 Boeremia exigua Molybdopterin synthase sulfur carrier subunit (C7974DRAFT_388246), mRNA 
\nCAGACACACACAATTGATGGTAAGCATCAACCATTTTCTTCGCACTCAACCCCCCTGTCTTGTGATGTTTTCCAATAGCATGTATTATCCGACTGTCGCTTCGGTGACGGCCTGCGGAACACCTTTTTTGGCTGATCAGAAAATTTGCTCACCCTTGTTGCACACTGTTCCTAGGACACAAAAGCTAACAAGGTCCAGTCATTGTTGCTGTCATGGTAGCCTCAAACCCTCCAGCGGGGCACTTTACCATCTTGTACTTTGCGGCCGCCTCGACCTATACAGGCAAGACCACGGAGCATCTGCCCGCACCCCTCCGGGTGCGCAACCTGTTTGCACAGCTCGATGCCGCATATCCTGGCTTCGGACTGAAGGTGTTGAGCAGCTGTGCTGTGACTGTTAATCTCGAGTATGTTGATCTAGACGATAGTGATGCTCTCGATGTGGATGCCGAGATAAAAGCAGGCGACGAGGTTGCTATCATACCGCCTGTAAGCTCAGGCTAGGGCCAGCAGTGCTGCAACGGAGTGGGTGCAATGTGGACCGAGGATCGCATGCCTGCTGTCTGGTTGAATGGGTCACGTGAGGAGGCCGGCCGCGGCTGCTGTTGACCTCACCGCACGAGGACTACGATTAGCGAGTAGCGACCGAGGACGGACGGTGGCTGGACAGTAGAGAATGTTAGCTCGCGTGTTAATTGTGATTGTGCCTCAACGTTCTCGCGTCACGCGTCACGCATCACGTAGCACGCTCTCACGTTGCAAAGTAAATGGCGGACTATGAATGAGCCGGACATCCTACTACGCGACAGTAACGTGGGGAGAATGCACAAAAACTCTACAGAATATTTTTTTGTCTACAATATAAGTAGTTCTTATACAAAGTTTAGCTTTTAGTATTGTGATAGCTACAAGTTCTATATGAAAGTTAGTGAGCTCTGCTTATCCACCGTTTTTTCTGAAACTTG\n>JX990552.1 Uncultured thaumarchaeote clone H7_Parch519F_24 m 16S ribosomal RNA gene, partial sequence \nCAGCCGCCGCGGTAATACCAGCACCCCGAGTGGTCGGGACGATTATTGGGCCTAAAGCATCCGTAGCCGGTCCTGCAAGTCCTCCGTTAAATCCACCCGCTCAACGGTTGGGCCGCGGGGGATACTACAGGGCTAGGAGGCGGGAGAGGCAAGCGGTACTCGACGGGTAGGGGTAAAATCCACTGATCCATTGAAGACCACCAGTGGCGAAGGCGGCTTGCCAGAACGCGCTCGACGGTGAGGGATGAAAGCTGGGGGAGCAAACCGGATTAGATACCCGGGTAGTCCCAGCTGTAAACGATGCAGACTCGGTGATGGGCTGGCCTTGTGCCAACCCAGTGCCGCAGGGAAGCCGTTAAGTCTGCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTTAAAGGAATTGGCGGGGGAGCAC\n>XM_020038344.1 PREDICTED: Musca domestica GATA zinc finger domain-containing protein 4-like (LOC109613490), partial mRNA 
\nGTGGAGACACGTGCCTATCCCGAATTAAGCGGTCAGCAGCGTGACACAGCCACACCCCTGTGGATTATCATATTGGCCATAATTGGAGGCCTGCTGCTGCTGGCGCTCTTCACCTATGCCATGTGGAAGTGTGGTTTCTTCAAGCGCCGAAGACCGGATCCAACGCTTAGCGGAAATTTGGAGAAAATGAACGAAGAGAAGCCATTCTTAAATTCATCACAGAAAAATAATCCTCGCGGTTTCTAACAAGAAGGAACAGTTGGGTGGGATTTAATGCAGCAACAGAAATTGAGACCGGAAACGGTTGAGCCACCCAAAAATTGCTGTAGCAAAACAACAAAGAAGGATAGCGATACTTATGATTTTTGGCAAACATTTCAACAAGAGAATAATAACAATAACAACAACAACCACAATACATCTAACAATATCTATCAGCAATTGGGTGCCCATAATAGTAAATCAATAAATGAAATTAATTTGGCCGAGGTACGTAATGCCCTGGACCGGCGAACAATTGCAATGGCGAGCAATAATCAAACAACAACAACAACGGGCAATAATCATAATCACAATAGCAATAACTCAGGAATACAACCGATGGGCGGTAGTGCTGAAATAATATTCACCTCCAATTTTCAATCATCCCCCTCGCCCAACAATCCTCATGGTGGCAATACATCAATGTCCACCGGCAATAATGTGGGTAGCAGCAATGAAAATCTTCTAGATATCTATAATGGAAATGGGAAATTTGCAAACTCCCCCAGTGATCTATATAAACAAGCGCCAGCCATATCGGCTAATGGTGCTTTGGTACCACCACCCTACAGAGATCCACCGCCACCACGTAATAGTCCTTTACAACAGCCAGCAATTAATGCGAATGCTTCAAATGCCCTCTATTCAAATCAACCACCACCACAACAACAACAG\n>XM_019441788.1 PREDICTED: Panthera pardus solute carrier family 51 beta subunit (SLC51B), transcript variant X2, mRNA 
\nCTACTCTGTGGAATTCCTCCTCTCTGGGTCACTTGCCTTGCCTCCCCCAACACTTAGCCCTCCAAAGGTCTTGTTTTACTGCTTCTTGTAGGGAATTTACATAAGACCATGACCTTCACTGTGAGAAAGCACAGGCTATAAAAGGCCAGGCTTGGCTCCCAGCTCTGTGGTTAAATATTGATAATAGCAGGAAACAGAGGCCTGGGGCGGGTATACCACATATCCCCCTGCAGTAATGGAACACCCAGACTGAGGGTCTTCCCCAGCCCATTGCCTGGGCTGGAAAGACAGTCCACATGTTTTCTCTTTACTTCAGATCAACATATAGGAAGGAAAGTATGGAGCTGCTGGCTCTTGCAGATCGTGAAAGCCAGGCGGAGCCTGTTTGTCATCTAAGGCCACTCATTCAAGAGGTCATTCACCCTGGAGTGACAGAGGAGGTTCCAGGCCTGGGCGTGTGCTAAGGGCAGAGCTACCAGCTGGGCCCCACTGCCACAGGCTCTACAGCACTGTTCCCCCAGGTGACGGCTGTGACGGGTGCTCAGGCACAGAGACCATCCAGTGCTCCGGTAAGGGGAGGACATAGAAACCAACGCTGCTCCCAGCAGCAGATCAAGGCAGGCCCAGGAAGTCAGATCCCAGGTCTTTAATTTTGGTGTCTCAGTTTGCTGTTTGTTAGATGTGCACCTCGTCTTCCTTTTCTTCATCAGTAGCTAGTTTCCCTGACATCATCCACTGAACAATTCCTCCTTTACCTACTGGGGTCTTCAGGGCTTTGCTCAAGGGCCAGAACCTAGGAGCCCAGGCGGGCAGCTCGGGAGCAAAGGGGCCTAAGGATTTCATTGTCAGAAACGTATCCCAACCGTGAACAGGGGCATGGACCACAATGACGGTGTCATCCAAGCTCCAGCTGGCACCGTGGTGCCTCAGGAACTGCTGGAAGAAATGCTTTGGTTTTTTCGGGTAGAAGATGCATCTCCTTGGAATTATTCCATCTTTGCCCTGGTGGGTGTGGTGATTGTGATAAGCATCGTCCTCCTGAGAAAGAGCATCCAGGCAAACAGAAATCAAAAGACACTGAGGAAAAACAAACTGGAAACAACAACTCTGGAAGTCCAAGACTTGGCTGAGGCCGGAGCCAGAGAGGACAACAATCTGAACATGCTAAGAGAGACTTTGCTCTCAGAAAAGCAAAATTTGGCCCAGGTGGAAACTGAGTTAAAAGGGAGAAAGGTGCCACTGGTTCTCCTTCCAGACCCACAAGAATCCGAGAGCTAGAAGGGGTCCAGAGCACCGCCCCATGTTGTCAGCAGATTCAGTGAATGAACTGCAATCAAAATATTGTTATGAAAAAAAAAACCCTCCCTTTTTATTAAAATGCATCTGAAGTGGGCATTTGGAAATGCAGTTTGTTCCAATGGGGGTGGTTCAACACAAGGGGCTTGGAGCAAAA\n>AY749834.1 Labidiosticta vallisi 16S ribosomal RNA gene, partial sequence; mitochondrial 
\nTGCAAAGGTAGCATAATCATTAGTCTTTTAATAGGAGGCTGGAATGAAAGGTTTAACGAAGTACTAACTGTCTCATTTTTATATTAGAATTTAATTTTTAAGTGAAAAAGCTTAAATTTTGTTGGAAGACGAGAAGACCCTATAGAGCTTTATAACCAGTTTTCAAAATATTTTTAGTTAAATATTTTATTTTTATTAAATGGGTTATTTTGTTGGGGTGACAAAAATATATAATTAACTCTTATTATTCTATTGACCATAAATTTATGATTATTGGATCCAATAATATTGATCGTTAGTCTAAGTTACCTTAGGGATAACAGCGTAATCTTCCCTCAGAGTTCAAATTTACGGGANGGCTTGCGACCTCGATGTTGGATTAAGATAATAGTTGGGTGTAGAAGCTTGATTAATAGGTCTGTTCGACCTTTAAATTCTTA\n>KR841045.1 Uncultured Stella sp. clone OTU_9761 16S ribosomal RNA gene, partial sequence \nTACGAAGGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGGGCGCGCAGGCGGCCTTTGAAGTCGGGCGTGAAAGCCCCGGGCTCAACCCGGGAATGGCGCTCGATACTCTTGGGCTCGAGTTCGGGAGAGGAGGGTGGAATTCCCAGTGTAGAGGTGAAATTCGTAGATATTGGGAAGAACACCGGTGGCGAAGGCGGCTCTCTGGACCGATACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGG\n>XM_050429574.1 PREDICTED: Quercus robur uncharacterized LOC126725075 (LOC126725075), transcript variant X1, mRNA \nAAAAAAAAAAAAATCCCTTACGCCGTTGCCATTGTCTCCACACTGCAAAGTTTCAACACTTTGTCTCCACAAGTTGCTGTTTTGTGACCTCAATTGTGGCTGAGCCATAGCTGGACTTGACAAGCATGCCCAATGGTAGTATCTCTCTCTGTTGGTCTGTTTTGGCCCTTTTGGGTTTCCCGTTTCTGTGGTTAGTTTAGGATTTTATGTTTATTTGTTTATTGACTACTTTATTGATATTTGTGATATATTGATATATTTTATTATGTTTATTATATTTACAAGTGGTTAGTAGCTATCATCATTTATAATTTACAATTTGTATTTTATTTTTTAAATTTCATAATGGTGGCGCCGGCTTGTTATGGTTTATTTGATAAAATTGTTTGAGTATTTGTATATATATAATTATATTTGAACAAGTAGCAGTCTAATTATTTTATAGATACGAATTTACACCTTAGTTGCTTGGTTTTGTCTGACTGCACATAATGAAAGTACTAAAAAAACACTTTAGAATCAATTATAAATTGTCAGAAAGTCTTATAGTTCAGTAAATATTTGTTGGTGTTTTCAATACAGTCTAAAGCTCAAATCTTTCGTCCCCAACTATTGAATTGCCAAATTATAAAGAATTAATTATTAATTATTTTGGTATAGCACCCAAAAACATAAGCCAAAACTTTAGAGTTAATTTAATTTCTGAAATAAAACTTTTTTTTAGTTATGAAACTTTTTTCATACTTAGCTTGGCCCTCCCCAGGAAAAATTTATGGCTCAGCCATTGCCTAGTTGACTACATCCCAACAAGACTTAGGATTATTGAAGGGGTAGCAGATCATCACTTAGATGATCTCTGCTTTCCAATTAGACTATGCAACAAAAACACACTAGGAGCCCCTATTGTAGTCCCATTGCAACAATCTGTCCCAGGTAGACAAACTATTGTTGAACACAAGCCAGCCAATAACCGCATGCTTGCACACAACTAAAGGAAACTAGACTATTTCCCAATATGGAGTTTCTTGCTTCTTCAATCTAACTGCATTCCAGTCTTCAGTAGAATCAAATTTTCTTGATTAGGATGGCAACC
ACAGAAGCCGAAGAACTTTACCACCAACTTCAACCAAGCTTATCAGGCCTTGATGTACATTTTCAGATTTTAATTTAAAAAAAAATAATAAAAAAATAAAAAAATAAAAACTGTGAAATAGACTCTTTCTATTTCAAATGAAACCAAGAGAATCTTGTGATGATGTGGGTGTGTTTTTAGTAAGTGATGTTCATAACAGAATGGAATGGAGTCCATAAGGAAAGTGGTATTATGTACTCAACCAGGGACAAACAAGGACGTGTGAGTAAAATTGGTACAAGAGCACATTTCTAGGAGGAGAGAAATTTGAGTAAAGCTTCAAAGCTATCACTGAATCAAAAATGGGATAAACAAATATTTAATATTGATTTAAGCTAAAAATGGGATTGAGATAAAATAGATAATTTTTAAGCAGCTGGGGTTTTTTTTCAACAGGTTTTCTTAATGTATGGGGTTAATTTTACATTTCAGAGAACTCAAATGGCCTATTCATAAACCCACAAAAATTCCTAACCTTTATCTAAAACTTGGTCTGGAGTTTGAAATTGCTATTAAATATTTGTCTTTTTAACTAATTTGTCAAGTTTTTGGAAATTGCAGTTTGTGTTCTACTTTAGCTTATTATCCATTTTTCATCGCATTATGGCCTTTGTTATTGCAAGGGATTGTTCTAATTGCTCTGTTATAATTTCCAACTACTGAGTGGGTCAAGGGGAAGCAATTGGAAGAAGCTATAACCATTAAGAACACTTGCAGAAATGGCCAAAAAGGGCAAAGACACTCATAATAAAATAATGAAATATGAGATGGAAAGAGCACAAAGAATCAAGCAAAATCAAGAGAAAATAAATGCTTTGGGATTGAAGCATCTGTCAACTTTTTTGCCTAAATATGCAAATGTGGGAAGAAAGAGAGTAAGTGCTCAGGTAGATGACGACGATTGTGTACCAACTATTGGTGATGATGAGTTATCTAGTTCTTTACATAATGAGATGGCACCAAGATGTAGCACTCATTCACGCCGTGAGGAATTTACCCCAACAGTCCAGCATAAGGGCCCATTATTGAGACTACTTTGCAATGGAGATTCTGAGATGGCTCATTATAGGCGTGAGGAATCTACCCCAGCAGTCTAGCATATCGGCCCATCATCGAGCACACATCTTGGTAGAGATTCTCTTGTCGAAATTTCTACTAATGTAGAGGCACAGCTTGTGGGCACACCGTCTACCACAGATACATCGACTAGTAGACGTGCCCGTGGCATGACTCGTGGATTAAGGGTACGAGGACTTGTTGAGAAACATAGGAAGCTACCGGTCCTCATTGCCCCAGAGTTTTGTGCTCCTGTTGGTGAACATGCAGGGAAATTTGCTAGCCAAATTGGTGTACAAGTGCGTACGAACTTGTCCACTATGAATGCTTATAGTTGGAAGAATATTGATAGCGGTGAAAAAGAGGCGATCATTCAAAATGTGGCGGATCAATTTGATATACAAGGAGAATCTGTACTTGTCAACAAATCTCTAAATACAAAGTGTGGTAAATTATTGAGCAGCCACTACTACAAGTTGTTTACAAAATATAAAAAACTTGTAAAGGATGAAGGAAGCACATATGCAAGAAACCACCCACCAAAAAATGTCACACGAGAAAAATGGATTGAACTAATTGATGGAAAGTGGAGTGATGAAGATTGGCCGGCAATTAATACTTCGAAAATTTTAATTACAAGTGAAAAAGTCTCAACAAGAAATGCTAGAAACAGAAATAAAGAGGGAATGCTTGACAAACACATTCATAGATGTGGAAACAAGTCACTTGCAATTAGAGTGGATGAGGCAAGACGGAAAAATGGAGGTCATATTCCTAAGCTGGCACAAGTCTACTATGATACTCACTTCAATTTAAAGACAAAACAGTGGGTACACCATGATTGCGAACATACATATCAAGAGATGTTGAGAGTACAAGATGAGCATTGTAGCACTCTTGAAGCA
CAACCTTTGACCGAAGAGGAGATATCTATGATGGTTCTTAAGTCGAGATCTGGCTATGTAAAGGGACTTGGCATGAGGCCTTCCTCGTCTCTTAGGACTCTTGCCTCATCTTCCTCAACTCCGTATACTCAACAACTCGAAGGTCGAGTAGAAGAGTTCCAGGATGCAAACTACAAGCTGGAGGGCCGAGTAGAAGAGCTCCAAGATGCAAACTTCAGGCCAGAGGAGAAGATGGATTGCATCATACAATATTTGAGGAGCAAGGGCGACAATGACATTTGTGGTAGTGGGGGGAGCTCATCTACTAACTAGAACACACCTTGATATGGGATTGGTGACAGAAAGATAGCTTTTGTGGGACTACTTGAACTCAAATAATTTTTTGTAAAATTTGGAAGTTAAGACATCATTTGTATATAAATGGTTGTAACTTTGTGAACATCTTTATTACGTTTTTAGATTGTATGGATGTATTTTTTATGGATTTGGTTAGAAATGAATGGATTTTTATTTATTTTTTT\n>XM_035972485.1 PREDICTED: Aplysia californica uncharacterized LOC101852208 (LOC101852208), transcript variant X5, mRNA \nGCATGAGGAGTGAATTTTACTTTTAGTTTTAGTGAATTTAGTCGCTATTCCTCTTGACAAACTTGTTTTACAGTGATATAGTTCAATAAACATTAGGTCGTGCACTTGACTGTATGTTACATGAAAGGATAAAAAAGTAACTAGAAATCTTCCCCCTTTCTGTCCTGAAAAAAAAAAGCTCTTCACTCCCATTCTATTTTCCCTTTAACAACAATTAATTAATAAACTCAAGCCAGCCCAAGCGGATTTCTTGTTTCGTAAAATTATACTAACCCTAATCATACATTTTTAGAGAATTAACAAATAGTTACTTCCATTTCTAAAGAGCAGTTTGGGTATTAATGCGCTCTCTTGGATACCAACAAAACAAGTGACTTAAAATAAGAAAAATAGATATGGTGTCAACGTTTTAAATATTGATATCGACTTATTTTATTACTAATAAGATCCATTTTGGATCGAGAAATGAACATATTATATTGTATTTTATTAAATTTCTTGGAACTATTTATGTCCTTCTGAAAGGCGCAGTACCACATTGTTTATGATGAAGTAAAGTGGCGCCTTTCATTTTTTTTCCTATTGACTAAACGGTGAAAGCAATATCGAGTTTTTATAATGTATAGGGTCTTTTGATAGTCAAACAAATGTGCCAAGGATGTCTTCGAACGAAGTTGTAAAGACCGTTGCCAAAAAGTTGAAATACTACTTTGAGATCAAGCGTCTAGAGGATGGCTTTGATTTATCAGATGTGCACCAACCCCAACTGGATCACCCTCCTTTGAAAGCGCGTCCAGCACTTCAGTATGAGGGCCTCCATGACCGTGCCCTCAAGCACTACTTCAGCCAGCCTGAGGTGCGCGTGCAGCTCACACAGATGCACGGGCCAAATGGAAGGGGCACATTGCATGGGCGGAGGGAGCAACAAGTTCGCAAGATGCTGGACAACTACATGAAACATTACTCCTTCCAGGAAGAGTTTCTGAATGCCTCCCCAAGAAAACGTCCGGCCAGCCCAAAGAAGAACACACTGCCCAGCTGCTACTACTACCACACACCCAAGGGCTGTAAGATGAACACCAAAGCCACTGGAGTCCTCCATAGAGCCAAAAAACCGAAAAATCTGATTGGAGGCTGGCCTACCCTGAGGTCTGTCCCAGACCAGCACATCTCCAGAGGGGAGGCCACCAGGCTGGTCAACTCAGCCACCAAGATTCTTGTGGCCTCAGCCTATGATGACTCCTACATCGATAAACCCAGAGCCACTTCAGCCCAATCTCGGCCAAGATCACCAACTCCATCCCAGAGCACAGCAACAACCACGTCAGCGACAACTGCCACAAGCACGTCCACCG
ATGATCACCCACCCGTGCGGCCGCAGTCAGCCAAGTACCGATCACGCACAGTCATCAATGTGCCACAGCGCAGGGCCCAGGAGGAAGTGGCTGTGATCAGGGCTACTCAGACGGCGGCTGATTTTGACGTGGGAACCAAGCATGATCGGCAGCTGCTGGAGAAATATGACAAGCTGGAGGAGGAGGTCGATGATGGAGCATGGTGTGAGTACCAGGTCTATGTCTGCACGGGCACGCGTATTGGCTCCAGCACAAAGGCACCCATCAAGCTGACAATGTACGGGGAGAAGGGCAGAACAAAGGAGTTCATTCTCAATGACTCCAAACGCCACAAAATCCCATTCCAGAAAGGGAAGGAAGATCTTTTCATGCTGGCGGCGCATCACATTGGTAGGATCAGGAGAATACAGATTGGCCACGACAGGCCTGAGCTAAGCTATGCATGGTATCTGGAAGGGGTCACTGTCTACGACATGCATGCAAGGAGGATTTTCCAGTTCCCCTGTGAACAGTGGCTTTCTGGACAGGCCGGGGATAAGAAGACATACCGTATGCTTCAAGTTGATCGTGAGAGAGAGTTTATTGATGCACTGGGGGATGAAGCTGGCTTGGAGAAGTCCACGAGAAAACACAGATACTCTGCAGAGCCAGAATCATCGACACCCAGTGAGGCGTTCCGGTACCAGCCGAAAGGAGAGGACAATGTGAGCACACGGGTGCGACCGGGCGATGACTACAGCGACACCGACAGCTCTGACAGCTCTAGCTCCGGCCGCTCACAGGACGCCGAAGTTCCTGTCAATGAGCATGGCTCTACGCCACGGCAGAAGAAAAAGGTGGCTAAGGACGACTACGAGGAGAAGACACGGGCTGGGACTGTGATAACGCTCCATTCTGCCACTGACTCCCAGCAAGTGGACGAGATCTTCATGGAGCCCAAGGGACGAGCCGCTAATGCCAAGTCTGGCTCTGATTTTCTAGAGGGATATAAGACAGCACTATCTGCATCAGAAGCTGAGAAGAAGAGAGGGCTTGAGCGAGAAAGAGAGATGGAGCGAGCATTGCTCCAGGGCAAGAGTATTCACGAGGCAGTGCGGGATGGGGATGTGGACAGAGTCAAGGATCTGCTGCACCATTTCCCTGAGATGAGAGATTTTAAAGACGAGAGCAGCTGGACACCTTTGCACCTCGCAGCTGCCAGAGGAAACATCGAACTTTTGAGATGGCTACTGACCAGTGAGGCGGACATCAATGCAGAGACGTCCACAGGCTACAACGCTATGCACATTGCTGCCATGAATGGCCATGTCAGCTCCATGATGTTGCTTCAGGCGATGGGATCCTCCATATTTGGCTTGACAGCAGAGAAACAGTCGGCTCTGCACTTGTCTGCTAAGAGTGGTCATCTGGAGTGTGTCAAGTGGCTTGTGGCCAACCGTGCCTCTCTGCCAGCTGAGGATGCCTTCGGTCGCACGGCTCTCAAGTTGGCCGAGGAGTTCCGTCACGATGCCTGTGCTGACTTCCTGCGCATCTGCCTCCGGGAGCTTGCCAACCCCCGCAGCACGTTTGCCATGATGCAGGGACAGAGGTTGAGCCAGAGTGGCCTCCCTCCTATTGAAGAGGACACAGGCTCTGCCTCCAGCAGCTCACAGTGGAAGGACGATGTGAAGGGACACTCAGCCTCAGAGGATAGTGAGAATGAAAAGAAGAGCCAGAGAAAGTCCAAGGCTGAAGAAAAAGAGCTGGAGGAAAAACGGAAACTGTACAAGGAGCAGCACGAGCTGATGGAGGACAGAGGGTTGTCTTTCCTTGATAGCATCAGACAGGACGCAAGCAAGGCATAAAGCAGGAAAGCAGGAGTGAAGGAATGGAGGAGAGAAGGA\n>XM_048336008.1 PREDICTED: Perognathus longimembris pacificus SH3 domain containing kinase binding protein 1 
(Sh3kbp1), transcript variant X4, mRNA \nTTTCGTAATTTCCACTCACGGAGAGCAGGAAACCCGGTGCAACCGGGCGCAGCGGGCCGCGATGCAGCAGCAGCAGCAGGAGTCGCCCCAGGGCAGCAGCGGTAGCAGCAGCAGCAGCAGCAGCAGCAGCAACAGCAGCAGCGGGCGGCGCTGAACCCCCCACCGCCGCCACTGAGGAAGAAGCCCGCCCAGTCGCCGCCGCGTCCTGACGCCCGCACCCGGATCCCCGCGCCCCGATCCCGGCGCCCAGAACCTCACGCCCGCCTCCGCCAACTTTCAAGCTGCCTCGGCGGCCCGACCCGGCTCGGCGCCAATGGTGGAGGCTATAGTGGAGTTTGATTACCAGGCCCAGCACGATGATGAGCTGACAATCAGCGTGGGTGAGGTCATCACCAACATCAGGAAAGAGGATGGAGGCTGGTGGGAGGGACAGATCAACGGCAGGAGAGGTTTGTTCCCTGACAACTTTGTAAGAGAAATAAAGAAGGATGTGAAGAAAGACCCTCTCACCAGCAAAGCTCCGGAAAAGCCCATACACGATGTGTCCAGTGGAAATCCTTTGCTGTCTTCTGAAACAGTTCTAAGAACCAATAAGCGAGGTGAACGACGGAGGCGCCGATGCCAGGTGGCATTCAGCTACCTGCCCCAGAATGATGATGAGCTTGAGCTGAAAGTCGGGGACATCATAGAGGTGGTAGGAGAGGTAGAGGAAGGATGGTGGGAAGGTGTTCTGAATGGGAAGACTGGAATGTTTCCTTCCAACTTCATCAAGGAGCTGTCAGGGGAGTCGGATGAGCTCGGCATTTCCCAGGATGAGCAGCTTTCCAAGTCAAGCTTAAGGGAAACAACTGGCTCCGAGAGTGATGGGGGTGATTCGAGCAGTACCAAGTCCGAAGGTGCCAACGGATCAATGGCAACTGCAGCCATCCAGCCCAAAAAAGTGAAGGGAGTGGGCTTTGGAGATATTTTCAAAGACAAGCCAATCAAACTGAGACCAAGATCAATTGAAGTAGAAAATGACTTTCTGCCAGTGGAAAAGACTATTGGGAAGAAGTTACCTCCACCTGTGGCAACTCTAGACCCATCAAAATCAGAGATGGATAGCAAGACTAAGACCAAGGATTACTGCAAAGTAATATTTCCATATGAGGCCCAGAATGATGATGAATTGACAATCAAAGAAGGAGATATACTGACTCTCATCAATAAGGACTGCATTGATGCAGGCTGGTGGGAAGGAGAGCTCAATGGTAGACGAGGCGTGTTTCCTGATAACTTCGTGAAGTTGCTTCCAGCAGACTTTGACAAGGAGGGGAGTAGGCCCAAGAAACCACCTCCTCCATCCGCTCCTGTCATCAAACAAGGGGCAGGTACCACTGAAAGAAAACATGAAATGAAAAAGATACCTCCTGAAAGACCAGAAACCCTTCCAAATAGAACAGAAGACAAAGAAAGACCAGAGAGAGAGCCAAAACTGGATTTGCAGAAGCCCTCGGTTCCTGCCATCCCACCAAAAAAACCTCGACCACCTAAGAGCAATTCCCTTAGCAGACCGAGCGCGCTGCCTCCGAAAAGGCCGGAGCGACCAGTGGGTCCGCTGACCCACACCAGGGGTGACTGTCCCAAGATTGATTTGGTGGGAAGTACTCTGTCTGGAATTCTGGACAAGGATCTCTCTGACCGCGGCAATGACATTGACCTAGAAGGTTTTGACTCTGTAGTGTCATCTACTGAGAAACTGAGTCACCCTACCACAAGCCGACCAAAAGCTACCGGAAGACGCCCTCCATCTCAGTCGCTCACCTCTCCAGGAACCATGGCAGCAGGCAGTGGCCCAGCCTCGCTGACTTCACTGGCTTCAGTCCCCCTGTCATCTTCTATGGGAGCACCCGGACACCGAGCCAATTCCCCATCTCTGTTCAGCATGGAAGGAAAACCAAAGATGGAGCCGATAGCCAG
CAGCCAGGCGGCTGTGGAGGAACTCCGGACACAGGTCCGCGAGCTGAGGAGCATCATTGAGACCATGAAGGATCAGCAGAAACGGGAGATTAAGCAGCTACTGTCCGAGTTGGATGAAGAGAAGAAAATCCGCCTTCGTTTGCAGATGGAAGTGAATGACATAAAGAAAGCTCTTCAATTCAAAGTGAATACTTGATAATTGAGATTTTGCATTTTTCATCATGAGTCCAAGACTCAAAATTTTCTGCCCCAGCCAAAATGAATCCTGTGCCAAAAGGTTACAGATTTGCCATCACATGTCCCTGTTTAAAAGATTAGCACAAAAAGTCTTGATAGCACAACACAAATTCCATCCAAGAGGAGAATCTTCCCCATGGTTTAGGCCTGGGTCTGGCACTGGTTGTGACTTAGAGCAAATTGTGCTAAAAAGGCTTTTCTACCTTGAGATCTCATGTGAAACGAAAACTCAGGCAGTTTAGTCCATAGTGGTACTATTTTGATGATCTTTTCCATTAATGAAATGTAATTTCAGATTATTCTTTACAAGCTTTATAATTTTATGATTTTTTTAACCGTGTTTTGTCACAGAAGCCCCTAGCGTTTGTATTACACCTAGTCAGAAGCGAGAGTCTTGGTCTTTTTGCTTCAGGCAGAAAGCTGCCTGGCTTTATGTTCCCTTTAGGATTCTATTTACATATGCAATTTTAGGTCCAACCCTCCCTTCCCCTGCCAGCAGACCCACCCCCTAAGAGAAATTTAGCTTATATATGATGGTATATTTACAAAAAGAGAGAGAGAGAAAAAAAAATCTGGTATTTGCAATGATCTGTGCCTTCTTTTTACCACCCTCTTGATTGGAGTTTTTGTGATGCAGCTACCATGATTCAACAAATCAAAAAGAAAGAAATGAAAATCTACCACTTCTCCAAGTCCACTAGAGGCCGCTGTGTTCGCAGTTTCTCTCACCCTAGCCAAAGGTCCTAAGAGGAGACAACTGAGATGTCAGGCGTGTGCTGGATCAGACCACCTGTGACTTCTCAGTTTCTCCTACTTTGAGGTTGTTCATGAAATGAAAAATGGCATCCCTGCTTGATTTTTTTTTTTCATCAGCCAAGTGAAATCCCTGCTTCCTGTCCTTTGGCGCCTTTTTTTTTTTTTTTCCGTGAACAGCATATGCATTATTAAAGCAAAGCTAAATAAAAGTTCAAATGCAAATGAAAACAAGGGGGGGAAAGTTGTATTATTTCCTGCACTGGGTAATCCATGTGTGTTATTGTTTAAAACTGTATTCACACAATGTCATTTTGCCTTGCTCACTTGTAACCCCCCTTCCTCGGGTCCAAACGAATGGGACGAGGGTCTTGTTGAAGTGCAGCCAATGGATCTTTCTTGCATTCATGGAATTGCTTTTTTTTTTTTTTTCCTTTCTGAGGGAATTGATGTTTGCTTGTCTGATTTAATCTTTGTAGCACTTGGAACAGTTCAGCCTTAGATTATGTAACTGTTTTTCCTCATCCTCTGCTGAAAAACTATGGGGCATACCTTACTGCAAGATTGTTCAGGGGTTAGAGGTGGAGGGGCTGGTCCCTTAATGGCCCCAACAATGTCTGATGTGTTTCTAAGCAGCTGCTTTGTCTATTTCTTGCATTTTATAGTGAAAACTACTCAAAAAAATGTCATAGATTTGCACAACTATGAAGAATGAGAAATGATGTCACTAAAGGAATGATGCAAAAAAAAATCACATTATTCATCCTTGAAAATAGAACAAGTGTCTCTTTCCTTTCTCTTCCTCTCTCCCTCCCCTTTGCCTTGCTCTTGCCTGCATACTCCTTTCTTTCCTGAGAGTATTTACAGAGCCCAACGCCCTAGTCTTCCTTGGTGGGGACACAGTTAAGGGAAGGGAGTGTGTAAGGAGCCAGGCACCTTTTGCTCCGAGTGTGGCTATATGTACGGCTTGTGCAGCAGCCTTGGCCTCAGTGTGCATGGGGCTGGGAACA
GCAAGTTTCTAAGGGCAGCACAAAACATTCCTGTCCCCCTTGAACTGTTCTAAGCATTTCTGCATTACACTTGAAGCCTTCAGAGATTTCCCACCACCTAATAGAACAATGAAGATTGGATTCTTTGGTGTTTGAATTTCTCATTTCTACATCAAGAAAATCCCAACTGATATAGCTTTATCAAAAGTGCATACAGAGTAAGATTGTGGACAAGGAAACGGCAAGGTGGAGGTATCCTCGGTGGGGCATTGGCAACCTGGAATGTGTAGGGCTGATGTCAGCGCCTCAATAGAGGCCATTGGCTTTCTTCATTTAAAGAGGGGAGAAGTAAGTGATTGTAAAAAGAAGTTGCCATTTTCCAGCCTCCTTATTGTCCCTCGGGCTAATCAGCAAAGAGGATTCTGCATCATGGGACTGGGTGAGCCTCTGCTTGAACGGCTACCATCTTTACTCTTGTCCATATGAATCCATCAAGGAAAGCTTG\n>XM_001582328.2 Trichomonas vaginalis G3 uncharacterized protein (TVAG_2v0998720), partial mRNA \nATGAGTGAACTCGCTGTAGACGCACCAAAGGTTGTTGAAGCTTTCAATGGCGGCCTCACATGGCTCAACAGAAAATCAAACTCCCTCCAGAAGTTCCAACTTGACAAGATTTTAAGCGCTAAGGAAGAAGCAAACGGCGAGCTTATTATCGAGAGCAACCTCAAGATGTTCAACAAGGATCACCACTTCAGATTCGTTATCGATACATCCTTGGCACCAACAAGCCCAGAATACTTGAAGGACTTCAAGCAATTATCTCCATAA\n>XM_018438955.1 Phycomyces blakesleeanus NRRL 1555(-) hypothetical protein partial mRNA \nGCAAAAACTCCCCCCCTCTTTTTTTTTTTTTTTCTTCGTACTATTTTTTTTTTTCATTTATTATTTTTTATTTATTTTTAAATACTAAATGAATGTACCAGAACAACAGCTCCATGATGACCTTGTCAAGGACTGGATTCTTTCAAGTCGTAATGAAATCGATGCGTCCTTCATGGCTCACGTTTTATTAATGACAACAAAAAGCTCGACAGGGTTATCAGATCTTGTCAAGTTTCTCTCAAATTATTGGAAGGATGAAATTCACCGAGGAAAATGTGTCGAATTACTTACCCAGGTCACAACTCATAGTCGTTCCTCTCTTGATTATGAGACAGTCGAGGTGTTGATGTCATTCTCATGCGACCGTTTAAATGACTCTACATCAGTTCTCCGTCTTCTTGATCTAGTTGATGTCCTATGCTCAACACCTCATTTCGATGGCCATTACGCTGTCATGTTATGTCAATCAATCTTTCGACACATTGGCCAGAAAAAACAACCTCAGGGAACTCGCCACAAGATATTCTCACTACTCAACAAGCTTCTTCAGACTTACACTTCCGATCTACAACGTGCAAGAGTGAACTTTATTGGTAGCTTCGTAGCTTTTATGGATGGTGAAAAGGATCCACGTAATCTTGTGATTGCATTTGAAATTGTTCGATTCATCATTGAAAAATTTGACATTTCACAGCATGTTGAAGATTTATTTGACGTGCTCTTTTGCTATTTCCCAATAAGTTTTAACGCCCCGATTAATGACCCGTTCAGTATCACCACCGAAGACCTGAAGGACAGCCTCAGACGTTGCTTGGCTGCCACACCTTATTTTGCAAACTATGCTACTCCTTTACTAGCAGAAAAACTATTGAATACGACTGGAAGTGCCAAGAAAGATGCCATGGAAACAATTGGCCTTTGCGCTCCCGCGTACGGTGCACACGCTCTCTTACCACACGCAAAAGATATATTCGATGCCCTCGTAAACGAAGTCTATCATGCAACCGAGACCTCAATGGAGGCCACAGCTCTCAAGACCATTCATAATGTTGTGGCTACT
CTAGGAACTGGTGTCAGCATAGCCAACATCAGAGATCCTGTAGAGAAAACCATTGATGCCTTACTATCCCAATGCGTCGAGAAACTTAACGAACCCGAACTCAAATATGCAAAAGCTGCAGCATTGATTCTACGTTCTGCCGCCTCTGCATCAGATCCTGCTTGTACATCTGTAGTACATACGACCTTCCCTATCCTTCACAATATGTTTAAAGATGCCAATTCTCTCAGTCGACAGCTCGCTGTTCTTGATATCTTTATCGAGATTCTATTTGCAAGTAAGAGTCTTTATGGCTCAATCGAGGATATTGGATTTGATCGAGATTTCCAGACCCCTTTGCTTTCTTACAAGAAACCGCTGTTGGATATCTTTATCACATCTTTGAATATTCGTTCTGATGAAGGACGTGTCTGTCGAATGTCTGCCTTGAAAGGAATTCGCCAAATGGTTGTTATGAAGCAATTCTTGTCGGCAGAAGAGATGGAGAAACTTGTATTGCATCTCACCCAGTTGATTCCAGACACAGACGGTGAATTAAGAGCGCTTGTTCTCTCTTCCCTTTCTGTATTAGCAAAGTTGAGTCTCCCTGCACTCTCCAAATACACCTTCCCACTCCTGTGGAGACTACTTCCAGGACACCAGAAACCAGACAACAGCAACTACCATAGTACCCTTGAAGCCGTCGAATACTTGACGATCAACCCCACCATTTTCAACACCATCGTTGCCTCTTCTCTATTGGACAAATTTGATAAGTCCTGCCGTCTATCTGACCAGTCGCGAGACTACGTTTCCGCGTTGGCTAAAACTATGCTCAATTTATTTCAAACTATGGCCCCAAAAGACCCAAAAACTATGCAACTAGGACAACGTATTTTTTTCCCTCACATTATGTCAGAGTGTATCAAATCTACTCTTCACTATCCAGGTTCATGGCTACTCGATACCCAACTTGTCGATATATTGTCGCTCTTTGTGGCTGGAGTCGTAAAGAACTCCAATTCAAGTCATCAAACAGCACTGACTGCAATTGCGTTCCGTCTTTTTGTTAATGGTGATCTGACAGCTGTTAACCTTCAATCTACAAGTGATCCTACCCTTCGTCTCTTTCCTTTATCAACCGTTGTTCTTCCTATCCCATCTTATAGTGAATTCATCCAAGGACTTGTCCAGGCTGCGTTAAATACTCCATGTAGTGCCAAGAGTCTAGCGTTGACAAAATCCTTTGCCTCAATTGTAAACAAGTGGGGAAATGAAAGTGTAATGTCTTGTGTGGACAATATTATTCCTACCTATCTTATTCCTGCCTTGGAATCCTCGGATATCAAAGTAAAGAAGGCTGGGTTATTGCTTCTAACATGGTTGGCCAAGGCACTCGTTATTCAAGGACATGCTTTGGGTTTCCAGATACTTGACATTATTGCAAACCAATGCCAATTACCTGATGTGGGGCGCGAGGCTGCAAATCATTTTTCTACTATCCTTCAAGACGACGAACTTATGCTCAACAAAAAATCCTATGCAAATGTTTCTATTCTTTACAGACAACGCGTCTTCAACTACTTGGCCCCAAAACTCATCGAGACAGCAAATATATCTTCTGCAGACTCCAAAATCAATTACTTTACCGCACTCTCTTGTTTGCTCGTGAACGTACCTGATTCTGTAGTTGCTAGTGAATCATCAAAGCTTATTACCTCTATCAATGCCTCCCTTTTATTGTCTGACTCCAACCTCTCCTTGTCTATGATCAAAGTAACACGCGTCATTATTGCCACTTCTCCAGAAAAGATCGAACACGCCACATCACCCACTATCGATGGACTGCTACACTCGGCTGATCCTGCTCACAACCTCTCCTTGCCCGTTCGAATCGAATCTATCCAATGTCTAAAGGATATCCCAGATAAATTTAAGCCAACAACCCTATCGCCACATGCACCCATTGTAGTCAAGCGACTTTGCAGATCCTTGGATGACAAGAAGCGGCTTGTTCGTAA
ATATGCCGTTGACTGCAGAGAAAGATGCTCGCTTTTACGGTATCTTCTCGGAGCATTTTCTCAGCCACTTTGCATTAAAAGATATATCAATAATAGAATGACAAGCCTTCTGTTTTACGATTGTATTACCTTAAAACTCGAGATTTTATGTGTCGGTGATCCTACATAA\n>XM_023978471.2 PREDICTED: Salvelinus alpinus phosphatidylinositol glycan anchor biosynthesis class Q (pigq), mRNA \nCTGTCTGTCTGTCTGTCTGTGTGTCTGTGTCTAGCTCCGCCTTGTGGTAGTGATGGTCCAGGGAGTGGTCCATCTCAGTGTTGACTTCATCAACTCCTTCCCTCTGTTCGCCATGGGCCTCCGACTCTTCAGATCCTACAGACTGGCAGAGGGGGTGAAGTTCAGAGTGCTCTGTGAGGAACCAGGAACACCTCTACACCTCATGATGGATATTAACCCTCTGAAGGTGAGCAGTGTGGTTCAGACCTACAGGACCCCCACCTACAGCTGCTACCCTAAAGACTCCTGGCTGGCCCTCTGCAAGAAGCTGTTCCTGGGAGAACTCATCTACCCCTGGAGACACAAGACTACCAAGATAGACTAGGACCAGGGGGGAGAGACAAAGGGGA\n>XR_002711448.1 PREDICTED: Cucurbita moschata uncharacterized LOC111448527 (LOC111448527), ncRNA \nACCAAATACATTGATCGAATGGCGCCTTCTTCCTCTAGTGCCGCCGAAGCATCGTGAAATTCTCCCCTCCTTCCTCCTGTAATGCCGCAGGATCGTGAATTCATTCTCTGTCTCCTTCACTGACTCTTCGACGAGCTGACGATTCGAGTTGTAAGAAATCCGCTTCGAGCCGTAGTCCTAGTCCTTTACGAATTTGGAAATCATTGAAACTTATCATTCAGACTAGCATTGTTGATTGAAAATCCGAGTCGCAGAGGATAATCCAAAAGCCTTGTTTAGTGCACCGATGAACAAATGTTCGACGCATTAAGGCTATTACAGACAGGATTTTAGTAAATAGACAGGATTGTATTAAGCACTGTCTTTTTTCTATGACGGAGATGTGATGATCTTTACTCCAAATGGACTTCCACAAGTATACAACGTTCTTCGGACATCGTTACGAGCGTTAATTGAGATTGTTCGTTATGAAGGATTAGGAAAGGAGGGAAAGAAGATGCAGGAGAAGAAGATGGAAGTAAGAGGAATGGTGAGTTACAACCCGAATGAGCGAGAGTTGACCAGGCTGAGAATCATCATTTATTATTGATGTGACTCGAAAGTCGAAGACTGAATTATAAGGAAATTCACTCGATGATTATTACTCAGTAAGCAGGTAAGTCTTCTATTCTTTTGTTATATAATCTGTTGCATCCGCTACCATCTACATTTCTCGTTATGATTAATCATCATTACTCAGTTTTTGTTGGATGAAATTTGTTGTTTGCTGT\n>XM_041901937.2 PREDICTED: Coregonus clupeaformis protein lin-28 homolog A-like (LOC121585613), mRNA 
\nGGAAAATACACTATTTTCCAAAGAGGGATTACCGAAAAACGTGCACCGATAAACCAGAGTTTATTGCCTGATTCTTCTGGAGTTGTATGAGGCCCAGGAACCCCCCAAACCATGGCAGAAGGGGGCTGTGCAAAGACCGAAGAGGAGGAAACCACGGGCTCCGAGGAGGATCTGGGTTCGTCTCGTGGCAGCGGCGTGTGTAAATGGTTCAACGTCCGGATGGGTTTCGGGTTCCTGTCCATGACCAACCGAGATATGACACCGCTGGAGGAGACTGTCGATGTATTCGTTCATCAGAGCAAGCTGCACATGGAGGGCTTCCGTAGCCTGAAGGAGGGCGAGGCGGTGGAGTTTACCTTCAAGAAGTCGTCTAAAGGCCTAGAGTCTGTTATGGTGACGGGGCCAGGGGGAGCACAGTGTGTGGGCTGTGAGAAGACACCCAAGGGGCAACAGAAACGACGCTCCAAGGGGGACAGATGCTACAACTGTGGAGGACCTGACCACCATGCCAAAGAATGCCAGCTACCTCCTCAGCCCAAGAAGTGTCATTTCTGCCAGAGCATCAGCCACATGGTGGCCAACTGTCCAATCAAAGCACAGCAGTCCTTCCCTGGCTCTCAGGGAATAGCATCATCATTGAGGGATGAGAAAGAGGAGCAGAGCCACGCCCCCTTGCTCCAGAGGGAGAGCACTGAATGATCCATTCAGGGATTCAGCCAATCACAAGGTTTCATTGTAATGCTGCTTTTGGAACTACATCAGGCTGTCTTTATTCATCGAACTAACAGCAAGAAAATGGTAAATTTATTGATGCGATAGTTGAGATTGAGAGTTAGCTCTGTGTTTTAATGCACAGAGAGACACATCTATCCACCTTCTTTGCAACTCAAATACTTTAAAGTAATTCCTTTTCTGTCTATGAAGTTATTATTTCTGCATTAGATACTGAAATAATCTAAACTCACTGTGTTTACAAACTGCAATAAGCCTTGTATTGTCAGTTTTTACCACTGTACGTAT\n>JN498124.1 Uncultured organism clone SBYZ_7200 16S ribosomal RNA gene, partial sequence 
\nGTTAGCTTTGGCTATATGGATCAAAGGTGGCCTCTGCATGCAAGCTACTGTNTGGGGATGAGCCCGCGTACCATTAGCTTGTTGGTGGGGTAAAGGCCCACCAAGGCGACGATGGTTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGGAACACGGTCCAGACTCCTACTGGAGGCAGCAGTGAGGAATTTTGCGCAATGGGGGTAACCCTGACGCAGCAACGCCGCGTGAGTGATGAAGGCCTTCGGGTCGTAAAGCTCTGTCAAGTGGGAAGAACCCATTCCGGCACAACAAGCCGGGGTGCTGACGGTACCAATGAAGGAAGCACCGGATAACTCCGTGCCAGCAGACGCGGTAATACGGAGGGTGCGAGCGTTATTCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGCCGATTAAGTCAGATGTGAAATCCCGGGGCTTACCCCCGGGAAGTGCATTTGATACTGAACGGCTTGAGTATGGGAGAGGGAAGTGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCGGTGGCGAAGGCGACCTCCTGGACCAAATACTGACGCTGAGGCGCGAAGGCGTGGGGATCAAGCAGGATTAGATACCCTGGTAGTCCACGCAGTAAACGGTGATCACTAGGTGTAGCGGGTATTGACCCCTGCTGTTCCGGAGTTAACGCATTAAGTGATCCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGACGCAACGCGAAGAACCTTACCTGGATTTGACATCTCGGGAATCCCGCGGAAACGCGGGAGTGCCCTTCGGGGAGCCCGAAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATCTTCAGTTACCAGCGAGTAAAGTCGGGGACTCTGGAGATACTGCCCCGGTCAACGGGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCTTTATGTCCAGGGCTACACACGTGCTACAATGGGCTGTACAGAGGGAAGCGATCTCGCGAGGGTGAGCCAATCCCAAAAAGCAGTCCTCAGTTCGGATTGGAGTCTGCAACTCGACTCCATGAAGCTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGCGCTACGTTCCCGGGCCTCGACACACCGCCCGTCACACCATGAGAGTTGGCTGTACCAGAAGTCGTCGG\n>GU967443.1 Rosa rugosa putative MYB transcription factor (MYB4) mRNA, complete cds 
\nACTTTGTATAACCAGCCTCTTTCTTTCTTTCATTCACTCTCCCTTCCTCACAAACACATAACACACTACGGGAGCAGCCATGGCTGGTGTTGCAGACAGTGAGTACACAAGTCCTAATGAAGAAGAGAATGAGATGAGAAAAGGGCCATGGACGCTTGACGAAGACACCCTGCTCATACATTACATTGCCAACCACGGCGAAGGACATTGGAATGCCTTAGCAAAATGTGCAGGATTGAAGAGGACAGGAAAAAGCTGCAGATTAAGATGGTTGAATTATTTGAAACCTGACATCAAGCGTGGGAACCTCACTCCACAAGAACAACTCTTGATCCTTGAACTCCATGCCAAGTGGGGTAACAGGTGGTCGAAAATAGCACAACATTTGCCAGGAAGAACAGACAATGAGATTAAGAACTACTGGAGAACAAGGGTGCAAAAACAAGCGCGCCAACTTAATATTGAGTCTAATAGCAAGAGGTTTCTTGATGCGGTTCGATGTTTCTGGATGCCGACTTTGCGTCAGAAGATGGAGCAAACTTCTTCACTTAGTTTAGACCCACCTTCTTCTTCTTCTTCTCATTCTAATTACTTGACTTCTCAGATCTCTATAGCTCCTTCTCTGTCGACGTCTCCTCAAACTTGCTCGGTTCCTTCTTCTCCACCAAGCAAAGTGGTCTCACACGTATCTGATTATTCCCCAATTGGAACTTCAAGCCCAAGTCATAATAGTCTTTCCTCGGATTCTCTTATTTCACAGCTGCCTCAAATTACAGAACAACCAGCAAGTTCATCCTATGCCTTTGAAGCTCTAAATGACAATTATTATGTGGACTATGACATGGAGGGTTTTAGCCTTGACCCTGTTTCAGAAATGGCAACTTTTGACACTTCACAGTTTGATTGCCAGATGGCAGAAAGCGATTGGATACCAAGCAATTACATGACTGACACTTTATGGAACATGCAGGGGATGTGACAATTTGGGGAAAGATACAAGATCAGATGGGGCATCAACGACTAGAATTCATAATTCATATTAGGAGTCTAAGGGTGTGTTGTAATCTGAGTGACCCTTTCATCTATAGGAACCTTTAGTTATATA\n>XR_007259806.1 PREDICTED: Pyrus x bretschneideri uncharacterized LOC103929507 (LOC103929507), transcript variant X5, ncRNA 
\nCATTCTTTTCCCTCATTGGTACCCATCCTTTTCGATCTCTATCTCGCAGAAGCCTTTCTTCCTTGTGAAAGTGTTGCTCATCGTGGAAGGAGAGAAGGATGAAAAATGGGGCTCTTCCATTTGCTTCCAGAACAGATTTCTCAAGCTCTCTCACTTAAGCCGCGAACTCCTGGCCTCCGTAAGAAGAAAAGCTTGGCTCCCGTTCTGATTTGAGGAGATTTTAAACCCATAAAAGCTTGGGTTTCCAGCTTTGAAGAAGAAGATAACTTCTTTCACTGCAAGGACTTTAGACCTCTGATCTTCTGGCCTTCACGCAATCTAGATCTTCACCGTCAATCTCACTTGGGCTCTGCATTTTGTGAAGACAACTTCGTCGCTAAGATTAAAATAGAGATTGTAGTGAGCAAAGACCGGGAACCCAGAAGAGTCCCGAATTCAGTTTCCACTCTGACTGAAGATGGAACTTGGTGCTATTAAGCTATCATCCTCAGCTTCAGAATTCAGGCCTTGTCCATGTAAGGAGTTGCAAAACACCAACCAATGATATGAACATGGTAGGGTCTTGAAGCAATTCACCATTGTAAGGAGCAAGTTTAGAAGCACATGAAGGCGATGCACATGGTTTGGAATCTAGCATGTTGGCTTTTGTTAGGAGATCCTCGACATACTTGGTTTGAACCAAGAAGAGCGTGTCTGCCGATGAGCTTGAATACCAAGAAAAAAGTGCAATGGACCAAGATTCTTCATAGCAAACTGAGTACTGAGCTTGTTGATAAAAAATTCACAATGAGAAGAAGAGTTACCTATAATCAGAATATCATCAGCATAAACAAGTATAAAAGTGAGTGAGTGATCAACCTTGATAAAGAGTGAAGGATCTGCTATAGAGGAACGGAATCTGAGAGCTACAAGACTACGATAGAGCTCCTCATACCAAGCTTGCGGGGTTGTTTGAAACCATATATAGACTTGTGAAGCTTGCACACAAAATGAGGTCTGGGAGGATCTATGAAGTGTGCCATGAAGGAAGGCATTGGAGACATCCAATCGAGTAATCTGCCAATTGAATTGGATAGCTAGAGATAAAACGAGTCTAATAGTTGTTGATTTAGCGACTGGACTGAATGTTTCATGGTAGTCAATACCATGTTGTTGAAGAAACCCTTTAGCAACAAGTCGTGCTTTATATCGA\n>XM_014803901.1 Moesziomyces antarcticus ANTH-domain-containing protein partial mRNA 
\nATGGCGCGCTTCGACGACCACATGCCCACGCGGCCCGTCGACCGCGACAAGGCCGAGTCCGAGCTCTCGATCCACATCAAGAAGGCCACCAGCACCGAAGAGACCGCTCCCAAGCAGAAGCACGTCCGCAAGTGCATCGTCTACACCTGGGACTACCGCACCTCCCAATCCATCTGGACCGGCCTCCGCGTCCAGCCCATCCTCAGCGATGAGGTGCAGACCTTCAAGGCGCTTATCCTCGTCCACAAGGTCCTCCAGGAGGGTCACCAAGTCGTGCTCAAGGAGGCCCAGGCTCAGATCGGATGGTTCGAGACTTGCGCCCGCACCGTCGGCGCCGACAGCATGCGCGGCTACGGAGCCCTCATCCGCGCCTACGTCAACTTCATCCTCGCCAAGCTCCGCTTCCACCGCCACCACAAGGAGTTCAACGGCCTCTTCGAATACGAAGAGTACATCTCCCTCAAGAACATCGACAACCCCGACGAAGGCTACGAGACCATCATGGACCTCATGAACCTCCAGGACCAGATCGACCAGTTCCAGAAGCTCGTCTTTGCCCACTTCCGCGGCTCCGCCAACAACGAGTGCCGCATCTCCGCTCTCGTCCCCCTCGTCAAGGAGAGCTACGGCATCTACAAATTCCTCACCTCCATGCTTCGCGCCATGCACCGTCGCACCGACGCCAGCGACGCTCTTCAACCCCTTCGCGAGCGCTACGACTCGCAGCACCATTCACTCCGCAAGTTCTACTACGAATGCGCCAACCTCAAATACCTCACCTCCCTCATCAACGTCCCCAAGCTCAACCACGAGCCCCCCAACCTCTTTGAACTCCCCGAAGAGGGTCCCTACCTCCCGCCTCGACAGACGCCCAAGGCGCCAACGCCGGACCCCGGTCCATCCCAGGCAGAGATCGACGAGCAGGCGCGCTTGCTCAAGCAGTACGAAGACAAGCAGGCCTCACTCAAGGCGCAGGAGGAAGCAGAGAGGCAACGACAAGCCGACCTCGCCGCAAAGCAGCAGCGCGACTTTGAGGAACAGCAGCGTCAGCAGGCCGAACAGCAGCGCCTCGCACAAGAGCAGCTCATGCGTGCACAGATGGACCAGATGCAGGGCGGTCGTCTCGCCGAGCTCGAGCGCGAGGTCTTAGCCATGCGCGGACAGTACGAGCGCGACCAGCTCATGCTCGAGCAGTACGACCGTCGTGTAAAGGCGCTCGAAACCGAGCTCGCCAACATCGGCCAGAACTTTGGCGCCCAGATGCAGGGCAAGGACGACCTCATCAAGCAGCTCCAGGATCAGGTCACTCTCTGGCGCAACAAGTACGAGGCGCTCGCCAAGCTCTACTCTCAGCTGCGTACCGAGCATCTCGAGATGCTCGGCAAGTACAAGCAGATGCAGATCAAGGCTGGAAGCGCGCAGGAGGCCGTCGACAAGATGGAGCGTATGGAGCGCGACGTCAAGGCCAAGAACCTCGAACTCGCCGACATGATCCGCGAGCGCGACCGCGCCCGCTTCGACCTCGACCGCATCAAGGCCAGTCAGAAGGAGGAGTTCGACCGACTCAAGCGCGACCTCATGTTTGCCAACGAGCGTGCAGAGGATGCGACGCGCGCCAAGAGCTCCGAGCTCTCGGGCATGATGTCCACGCTCAACCGCCAGATCGCCGAGCTCGAGGACTCGCTGCGCGAGAAGCGCATGGAGCTCGACGCTCGCGACGCCGAGCTGGCACGCATCCGCGACGAGAAGGATGCCGAGCTCGCCATCATGCAGGAGGGTATGGACGCCACCATCAAGCAGCTCACCGACATGCAGCTCAACCAGGGCGAGAGCGACCAGGCGGTCAATGCACAGATCGACACGCTCATCCTCGACAACTCCAAGAAGCTCAACGCCATCATCGACTCCATCCTCCAGGCGTGCGTCGACAAGGTGGACGATGCGCTCTACGAGCTCGAGTCGCCCTCGGCCTCGGGCAACACCACCGCCACGCCCGAG
TACGTGCTCTCGATGATCGAAAAGGGCACCACCTCCACCAACGAGTTTGCCACCGTCTTTTCGCTCTACCTCTCCGGCGAGGTGGGCGGCGAGCACGTCGAGGTCATCAAACGCGCCAATCAGCTCGCCCAGACCATCAGCGACACGCTCACCAGCACCAAGGGCATCACAAGGTTGGCGCAGAACGACGATGCTGCCGACAAGCTCATCGGCACCGGTCGCGAGACGGGCAACGTGCTGCTGCGATTCTTCAGCAACCTGCAGTCGTACCGTCTGGCCGGCGTCGCACCTGCCCAGCGCCGCGATGTGGTGGCACGCCAGAACATGGAGGCGCGCGCCGCGTTTGGCAACCTCAACAGCGTGGTCGAGACCATGGTCAAAGCGGGCAACACCATGCTTGCCAACGCCAACGGCGACATTGGCGACATTGTGGAGCGCGAGATGATGAATGCTGCGAGCGCCATCGATGCTGCGACGGCCAAGCTGCAGGCGCTGCTGTCGAGGCCGAGGGACCACAACAAGTACTCGGCGGTGGATCTGCAGGTGCACGACGCCATCCTCGAGGCTTCGCTCGCCATCACACGCGCGATCGCCGGCCTCATCAAGGCGGCGACCGAGTCGCAGCAGGAGATCGTGGCCAAGGGACGAGGCTCGTCGACCAACCAGCAATTCTACAAGAAGAACAACCGCTGGACCGAGGGCCTCATCTCGGCGGCACGTGCGGTGGCGTTTGCGACGACCATGCTCATCGAGGCGGCCGACGGCGTCATCATGGGCACGCACTCGCTCGAGCAGCTCATTGTCGCATCCAACGAGGTGTCGGCTGCGACGGCGCAGGTGGTGGCCGCGTCGCGTGTCAAGGCCGAGTTCATGTCCAAGACGCAGGACCGGCTCGAGCGGGCGGCCAAGGCGGTCACGGACGCGTGCCGTGCGCTCGTCAAGCAGGTCAAGACCATCACCGACAGGCAGAGCAACGGTGCAGCCGACTTTGACTACTCGCAGATGGCCGTGCACGAGTTTAAGGTCAAGGAGATGGAGCAGCAGGTCGAGGTGCTCAAGCTCGAGAAGGAGCTCACCCAGGCACGCCGCGTGCTCGGTGCGATGCGCAGGGCGGGCTACCACGCGACCGAAGACGACTAG\n>XR_001875487.1 PREDICTED: Lepidothrix coronata uncharacterized LOC108499283 (LOC108499283), transcript variant X2, ncRNA 
\nTATGGGCTTTCTGAAAAGGTAACTGTTGTAGAACTGCTCCGCTTCTATCCGGGTAAATCCGGGGCAATGATGGTCCTCGATGACGGCTGGAGAGTGAAATAAGGGCGAACATTCTGTGTTGTTACTTGAACTAAGATGGAACAAGAAAAGTTGAGCCCTGTGAAATGCTGTTTGCAGTTTGTCTTGGAACCTACAGAAAAAGGTATGTAATTCAGCATCCTGGACATAAGCAGGAAGGTAAGTCATCCAATGAAAAACACTCCTTAAAATGTATCAAAACATCAGGTAAAGGAAAAACAGTGATGTGGCTTTTGTCACATGAGGTGTGTCTGTACAGCAGTGACCACAGCTCAGCAATGCTACCTTGTTTATGTTTGACCTAGGTAGCTGGCAAGAGATCTCTACAAGCAAATATTTTAGTAGAAGTAAAAAGTTAAGAGTGTTTTTCAGCTGTTTTTGACCTGGCTCTGTCTTAAACTGTGAGGCTTCCCCCGTGATCAGCACGGTGACTGTGCTGCCTGGGCTAATGAGCCTGTTTGTGGAGGGGTAAAGCAATGCCAAGCTGCAGTCAGAGACATACATGTCATATGCTGTGTCCTGGCCAGGTGTGGACCTCAAAGCTCTGAGCTGTGCAGGCACTGGACTTATACTGCAGTTTCAATTACAAAAATCTGTGAGTGGACACTTGGTAACTGGTGAACTACCTAATAAATAATAGAAGAGTTTAAGGATCACTTTGATAAAACTGTATGAAAACCAGCATTAATCTTAGATGGGTTTCTGAACTTCAGAAAATGCAGTCTGTATCTTGCCAGTTGCTAGTAGGTGCTGGAAGTTTTTTCCTGTCTGGCTCAACAACTGTATGAACTGTTTAGCCAAAATCACCGTAGAAGTCTCTGTTATAGATAGTGGCAAGATGATGAATCTGCAAGATTTCCAAAGACATTGCCTGAAATTTTGTTTTACTGTTGTTGCCTTGGACCTGACCCAGTTAACCACGAGCATTGGGAAATGCTCATCCCATACACTCAACTATTTAGACACGAGAAAGAGGTTTATATGAATTAGAAGTATGACAGAGTTTTGATTAAGTCAGATATTTGTGGAAGTCTCAGGTTTTTTTCATAGTGTGAGTTGGTGGCCTGTAAAAGTTCAGCCTTTAAGGATTTTCCTTTTAATTACCTTTTCAGAATGAAAGATGGAAGAATTTTCACTTTTCTGGCCTTTTCCTGATGACAGTGGCTTTGACTGGGGGCCCTGATCTCCCAAACACTGATTGTCTTATGTTTCTCAATTCTGAAAACCTTCAAGCATACAGTCAGGTATCCTGCCAGCAGCTCTGCAGCAGTCAATGCTTTTGCAATACCGGGCTCTGCTCATTTCAAAACTGTGAAGCAATCCAGCTTAGCAGTCAGCAGAGTGTAAAACTGAATAGTAGGAAGCATCGGAGAGCACCTACTCCAGTTTCAAGCAGAAGAAAGCCTTAAAACTTCAAGGATCAGAATGCTGGGGCATCTCCACTGACAGGTATCTTTCAGGAGCTGCCTTATCCTGTACCTGTCATAAAGCCAAAGTAGGAGCAACTGTTCATTCTAAGATGCATAAATCAGCTTTCCGAGATGATGCTCTAAGGAGAGCGCTGAAGAGCTCTGAAGAGCTTGAAGCTGGCAGGTACTGGGTGGCACACCTGAACTGCTCCTGGCTGCCCTGGAACATCCCACTGAAGATAACATTTATGGAAATGCAAGGAAAAGAATTGCTCCACCTTGCAGGTACAAAACAAGATGCCACGTTCCTCACAGCGGCCAGAGTTGGCATGGATGAACAGCTCTCCCAGAGGGACCTGCTTCCCTGTGGGAAGATGCTGCCCAGGACAGTAACATTTCTGCTACTAGAGCTGAGGGGAAAGGTCATATTTGGGACCTGATGTTAGGTCAGAATTGGAGCTGGAACTTTGCATACATTTTTTTTTCCCCCAAAATGGTCCTGTACTCTACT
CTCTCAGCCTTGTCCTCAGCTAACGTGTTGCAGTATTGCTTAGGGGTGAGCTGTGCTGATGCCACTGCTGTACTCTTGCTGGTTTGGAGCATGGGGTCTGCCTGGCCAGGTCTGGGAGGAGCTGGGAAGATGGACTGGCTTGCAGTGCTGTTTGAAAGCAGCACAGACCCCTTTCCTAGCAGAATGTTTAATGGAATCTGCTTCCTTGAAACCAAAATGAGGCAACAGCTGTGATTGCAGCAAGCTGTAACATCTCATTACTGGATGGAGGCACGTCCTGTTACAAGTGGTGGTGCTGCAAAACCTCAGCAAAAGAACCTACTGAGACCTGCCTGGCTGGGGGCTGTGAACTCCCCTGAGGCCTCAAGAAGAAGCTTGGAATGTGGTGCCAGCACAACAGCAGACAGTGAGAGAAACTGAGGCAAGCACCTCGAAGATAAGTAATAAATGATAATTGTTATTTCCTATTATTCATCTGAATCTCTACTCCTGAGAATTTGAGTTAAATCCTAAATTTTCCTTTATTTTTAAGCAGATCATCCAGCAAGTTAAAAAACAGCAACACAAGGAGGTCCTAAGATAGGGTTTGCTCCAGTTTTCCTGCTGAGCATCTGTTTAGGAATTGCTGCTAAAAAAAGTCAGAGGGGATGGTAGTTGCTGTGCTGTCACATGGGCTGATACAGAGCAGAATCTGCTTAGCATTCTTGAAGGGAAATTATCCAGTGCTGTAACTCACAATTTATAATTGGTTGCATATTAATATCTAAAAAAGGCAATAAAATCCACTGTGTGTTTAAAAAAAATAGTAAGTAGGAGTATTACAAGCTGAGCAGTGAAAATCTGGAAGACTTCTTGGCTAGAGCAAGGCTGTGTGCAGTGCTGTTTCTCCCTTAATTACAAGCAATTTTAAATCATCTCCTTCCTTCAAAGAGGGATTTTGTTCAGGGTGTGTGTTAATTTTAATCTTGCTAACGTGATACTCTCTTGGAACCTCTCCCTTGTGTCATAACAGTGAGATGTGCTGCCTCTTTTGTCCCTGCCCTTTGGGAAATGCAGTTACTGCTGCTCATTGCCTCAACCCTGCCGTCGTGACTATCAGTGTACCTCCCTTGAAAGGAGAAGAAAACAAAACCCAACAGCAGCATTGCTTTTTCCCCCCCAGAGGTTCACTTTTATTTGTACTATTTAAGCTAGACTGTGCAAGTACTTCATGAAAATCAGGGATTTAAAATGTATGGTACTGTATTATGCTGTATTATTGTGGAAAGCTTGTTATTCAGCACACTAATTATTTCTGAGTCACTATATTTATGAAATGGCATGTAATAACTACTTCACCACCACGCAAAGTAAACAGTATAAAAGCAGGCATTTTATGATTTTGACATTTTAGTGTATAAACATATTCCTGAATCTCCTGGGGGGCTACTGGAAATCAGATAATGTTTTTATGACTTTTAAAAAATGACATTGAATTTCACAGTCTGTAACGCTCCATATATATGGTTAATGTTGCATATTTTATTACAGCCTCAGTGGCTTATGTTACAAGTGTCAGCTGCAAAGAGAAAATGTACAAAGGCGGGTTTGTGGAACTGTGGGGGAAACAACATCGTAAAACCTTGCAATGCACACATCAAAGCCCTTGGACAAGCTGTAATGGCAGGTCCTGGGCCATGCTGGGACACCAGAATACACCCTCTGCTTTTTTTCGTGTCAGGATGGATTACAAAGCCCTCGCTGAAGGAGGGTTTCTGCCCACACTTGTCACTAGAGGATAACTAAGTTTGGGGTTTTGTCAAGCCCTGTGTGAATGACCCGTTAACTCCAGAGGAACTGGGACGCCTTGAGTGACACTCTGCGAGCTGGACTGCACTGAGACTTCTGCATTTCAGGAATGTGACTCCTGTCCTTGACCTCGTCTGCAGATAAATACAACATGCCCCGTAGTGCTGAGTGGTTTGGGAAGAATGTCAGCCAGACAAGAGAGGGGAGATAAT
GGAAAGACAGGCTAGGATAGGAACTGGGCTGTCTGATTCTGCAATGTGGGAATCGCCTTTTCTCAGCTGCCAGTGTCAAAGTCAAGCTTGCATTGCACAAATAAAATGGGGTATTCCACACACACACCTGCACCCTTTCAATTCTCACTGATATTTAGCAGAGGGAATATTCAAAACATTATTCCCTCCAATACAGAATGGCTGTTGGGTGTTACCAGATCACGTAAAAAGACATCTGAGTGGAGTTTTTCCAGCAACAAACAAGAAACAAAGGGAGGATTAAAAAAATGTTTTGCTACGTATACTGTTATGATTTTTTTTGGTGAATATATATAAAAAATTAATGTTGGGATGTGAAGAAACAAAGAAAAAGAGCAGGCAAGTGTGCTACCATAAAATGTAGCATGACTTGGTACAGAACTGAATGTTACAGGGTCAAGCATCAGGTAGGGACATGTGTTGGGGACTAGGATGGTACTTACACTTATTACTGAGGTCAGTGCATATTTTCCACTACCTTATTTATGGGATCAAAGGTTTGATGGGATCTAGAAATCCAAACACATTTAAAACGTGGCAGATGTGGGTAACCTCAAGTACACAGCCCATCGCCTCAGAAAGAGGAATGTTCTTGCAAATTTGACATAATCCAATTAGTTGATTCCCTCAGTGACATTTCTGCAGGCTCATGTACAGAGGGACAAGGAAAGGGAGATTTATGACAGCTATTCCTAGCAAAGGTCATTTCTTTATTAGTGAACAACCTGTCCTTAGTCATGCTGATGATGAGGCGTTGAAGGATAAGGGAGAGGCTGTGTAGCTTTAAAACTTGACAGGGAATAACAGCAATAGAGCATAGATCATCTCTCTACTTGGACCAGGAGGACTGAAATCTCCCACCATCAGGCCAAAGCCAGAGAGCAGGAGGCAAAATCCAGGAAAAAAATAATACATGGGGATTTCTGTGGAGATTGTGAAGGAGTTTGGATGGTTCAGTGTCAGCACAGCAGGGGGGAAAGAGGAGCCACAGAGCATGAGTATGTTTTTGGATAGGATAAGTGTCCTTGGTGGAACCAGCTGCTTATAAAGAACCTGGTCTGGTTGCTCTGGGGAATCCCTGGTCAGCACTGCCAACTTCCCAGTTTGAGCAGCTCTCAGCATCCTGTTCCATGCCATTTCCAGAACAACACAGATGAGAGCATGCTCAAATATCTACAAATACACTTCCTTGGCTGTCCTTCCATAGGCAAGGAAAGCACCAGATTTGACAGGAATATGGTTTCAGTAGATTGTGACATACACATTATGTATTTTTAAACAATAAACCAGTATCTACCTATTCAAGTGACTATTTTTCCTGCTTGCAGAAGAGAAGGTATTTGACACTGTACATA\n>XM_039434265.1 PREDICTED: Nilaparvata lugens aminopeptidase N (LOC111044204), transcript variant X4, mRNA 
\nGTCTCTGCTATTTTTAACCGTATTCAGCTGAATTAGTCGCTAGCTTGGAATCAATTAAACATGGGTGCTCAAACTTTTGTCCCTCGTTCAAATTTCTTCAAATCCTGACTATAATTATTAGATTGTCACGTGTGACAACTTACAGTTTAAATTTTAATTTGATTTAATTTTGATAAGTTCAATTTCCAGAATTGTTGTTATTATTGGGATTCATTTTTAATCAAGTAAGCGTTCAGTCATAATAGTTCCTAAAATGGGGTATTTTATGACGTCATTGATAGTATCTCTCTTGCCCTACACAATGAATTTGGCTGATTCGAAAATGCTAACTGGATCTCCTATAGCATTTCAAAGATCGACTCATTTCAATAACCAAAGACTACCTCTTACCATCTTTCCAATACATTATAGATTAAATTTGTCAGTGCCATTGATAGATAACAATTTCACCGTAACTGGGGACGAATGGGTTTTTTTGAATTGTACAGTAACTACAAGGGAAGTTGTATTCAATGTGAAAAACATTGACATCGATAAGGCTAAGACCAGGCTTTATGATTCTTTTGGTGGATCGTTCGTTCGAATTATAGAACAAAGATATGAAAGTAGCCGAGAAATGTTTGTGATAAGAACGGCAACTCCATTGATTTCTAGACGTCAGTATGAGTTGGGACTTCAGTTCTCCTATGTTCTCAATGATGAGCTGATGGGATTCTATCGAAGCAGCTATATTGATCATGCTACTGGAGAGAAACACTGGATAGCAACCACCCAATTCTCTCCCACGGCAGCCAGGCGGGCTTTTCCTTGTTGGGACGAACCATCATTCAAAGCCTACTTTTCCATAAGTATTGCTCATCACAACAAATACCATACTTTATCCAATATGCCTATCAGCAATTCAATACCGGCCCCTGGAATGAACAATGATTGGATCCAAGATGTTTTCAAAACGACATTACCGATGTCAACATACCTTGTGGCTTTCATTGTTTCTGACTTTGTTCCTTACAAAACAGTCATCGATAACAGCTCAGGTTGGAAGTTCACACTATGGTCAAGAAAAGACATTCTATCACAGACTGAGTATGCCGCCGAAATGGGACCCAAATTGCTTAGTTTTCTGGAAGAATATTTCTCCATAAAATTCCCTCTTCCGAAACAAGATGTGGTTGCCATTCCCGATTTCGGTTTCAGCGCGATGGAGAATTGGGGACTTATCACATTCAGGGAAACATCCCTTCTATATAAGCCCGGTAAGACAAGTGAGAAGAGCAAACTGGACATAGCGTTTGTGTTCGGTCACGAGTTGGCTCACCAGTGGTTTGGCAACCTGGTCACCCCTGCCTGGTGGAACGATCTCTGGCTAAAAGAAGGATTCGCTACTTTCATTGGATACACGGCGATAAATCATATGGAGCCATCATGGAAAGTGCTGGATCAATTTCTTCTGCAACAAGTGCTGGGATCGATGAAAATCGACTCACTCAACGCAACACATGAAATTGAAGTTGAAGTGGAGGAGCCCAAAGACATTGTGCAGATCTTCGACAACATTTCATACATGAAAGGCGCCTCGATAATCAACATGATGAGCCAGTTTCTGGGTGAGCGGGTGTTCCGCGCGGGTCTCAAGCGCTACCTGACCGAGCACGCCTACTCGAATGCATGCCAGGACCAGCTATGGCGAGCGGTCACGGTCGAGGCTGCCTCGAGTCTGCCTCAGGGTGTCGACGTCAAGCAGATCATGGACACTTGGACCCTGCTGCCTGGCTTCCCTGTCGTCACGGTGCACAGGGATTATGAACAGGGAACGGCTAGTGTCACACAGGAGCGATATTTCGTGCTGAATGAATTCACCAGTGAAGATAAGTGGTGGGTACCTGTTTCATACACCACACAAAGTGAAATGGACTTCAACAACACCCAGCCAAAAATTTGGTTAGAACCATCCAAACCGACTAAGAAAATTACAAATATTGATCCTGATGACTGGCT
GCTGATAAATTTAAAACACACTGGCTACTATAAGGTGAACTACGATGAAGAAAACTGGCGTAGATTGCAGGAATCGTATCTGAAAATGCCAGAAACGATTAGAGCTCAGCTGTTGTCAGATGTGTTTAGTTTGGCAGCCACCGGAAGGACCAACTACTCGACTGCCCTGGGCTTCAGTCTGCATTTGCCCCGAGATAATTCCTATTTTCCCTGGTCGATTGCTTCCGAAAAATTGTCGTTTATCGGAAAACTCATGCGGGATACGGATGCTTCTGACGATTTGAAGAAATACATGTTGCATTTGGTGGTGAATACCAACAAAGAGCTCACTTTCTTCCCAAAAACTCCAATTACTGGTTATTTGAACCTATTGCTTCAATTGAATTTAGTTGGAGTGGCGGCGGACAGTGATCACCAAAAATTGGTTCATGAAGCGAAACAATTTTTAAATGATGAGATTCTCGGTAAAAACGTCAGTATAATGGCGGATTTCAAAACCAAGGCATATTGTACGGCAATCAAACATGGTGGCTATGAAGAGTGGAATTTTCTATGGAAAAAATATCATGAGACAAATATTGCCTCAGATAGAGTGGTCATTCTCATGGCATTGGGATGTAGTAAAAATAGCACCATCCTTTCAAGGTATTTGAACAGAATCCTAGATCCAGACAGTGAGATAAGAAAACAAGACGGGGCGTTTTTATTTGAAGTTGTAGCCAATAAGAATCCAGTCCTGGCTTTCGATTTTCTCAAAAAGCGGTGGGAGAATCTCCAGTCATATTTTGGACTGGGATTCAGACAAATGGCAAAAATAATTGAGTCTCTTGGCACGCACTTGAATATGGAGCAGCAACTGATAGAGCTGGAAAAACTGCGATCAGACCACATGCAAAGCCTTGGGTCCACAAGCAACAGTTTCAAACAAACCATCGAAAGAGTGAAGTTCAACATACAATGGATGAACAACCATTACGAGTCTGTTACAACTTGGCTGAAAGAAATGCTACCAAAATTGAAAAAGACGTGATAAAGTGTTCCTTCCTCTCAGCTATGATCAATACTGGAGTATTATTAGTTTAAGGGAATAAATGTGTCGAAAACTTGAAGATTCAAATCGTTGAAGGCTTATCTAGCTTTTAACATTATCAAGACTATCTCCTATCAGACATTTTTCATGTCAAATAATAATATTTCAAATTTAGAACTTTTAAGCTAGTACACTCTTGAGGAGAATGTTAACAAGTTTTTTATTTTTTCAACAATAATCTACGTTTTCACTTATTGACGTTTCACTTATACACGAATTAATGAAAAGTTTGCATTGGAACAGCATGAGAAACTCCAATTTCTCCAGCAGTTTCAGTACAAAAATTTTATTGAACCGAGTGCTTTGAATATTTTCTGTAAAATTTAAAAGTTTAACTTGTATGTAAGAAATCTACAAAGCTCTAGTGAAGAAGTGCCATTGTTTGAAAGGTGCTATTATTATAGTCAATATTATTGCAAAGTCAGTTCTGACTTAATTGTGCTAAAGTAAGATTAAAAGTTGTGTGTTCTCATAAGTTATTGAGGAAATCTTTTTTTTCTGAATAGAGTATGCAAAAATATAGTCATTATTCGA\n>XM_028248081.1 PREDICTED: Camellia sinensis pentatricopeptide repeat-containing protein At2g13600-like (LOC114302958), mRNA 
\nATGGGGTGTGCTAGCAGGTCCGATGTGAAAGAAATAGCCGATTACATGACACTTCTTGAGGGATGGATTTATGAGCACTTTCGTGGATTCCAACCACACTTGAATATGAATTACACTCGAGACATGCCACATGTTTACCGTTGGACTTCTCGGAGAGAGTCTGGTGAAGAGAGACAGTTGCAGGCTTTTCGAGAGGAGCTTGATAGGTTAGGGTATTTGGAACCCATACTAGAGTTGCAGAGATGTCCATCCGTGTCACCCAGCTATGTTCTATCACGGTTGCCTAAAGTGTTTGGAAGAAATCTTGTCCCAGATGATGCAGTTGATTATATTGCTTCTGAGAATAACATTGCAGAATTTTTTAAAGTGGATAGCACTATGTTTGTGCCTCTTTTGACTGTATGCACAGAGCTCTTTTTGCTCAAAGTCGGAAGACAAGTCCATGGCTTTCTTATTGCTTTCTCTAGCTGTCATTGTAATAATTATTCATTGGATGATGGCGATGCAATTATTGGAAGCGCTTTGATCAATATGTACAGCAAGTGCGGTAGCATTGGTGAAGCTCGAAAAGTTTTTGATGCTTGGCTGCCTGCCCAACTTGTGGCTCTTTGGAATTCGATGATATCAGGTTATATGTATAATGGTTTAGTTGAAGATGCTAGGACACTGTGGGAAGAAATGTCAGAGAAAAATGTCATTTCATGGACGAGCATGTTATCTGGGTATGTACAGAACGATATGCCACGAGAAAGTTTAGATTTACTAGCTAAAATGTATTCTAACGGGGATGGATCTAGAGTAGAAGGGAACTGCTTCACTTTTGTAGCGGGTCTTGAAGCATGTAGCTATTTAACAAACTTAGAAATGGGAAAACAAATCCATGCAAAGCTCATGAGGACATTAACTAGAGCTGATACCAATAATGTGGTTGTTGGAACGGCTTTGGTGGATATGTATTCTAAAGCCGGCTATTTGTCCTATGCACAAACTGTTTTTGATTTGATGGTGGAGAGAAATGTAGTTGCATGGACATCTATCATTATGGGGTATGCAGTTCATGGGTTTGGTTTTCGAGCCCTTGATTATTTCCAGCAGATGATGGAAATGGGCGTGGAACCAAATGAGGTGACATTTGTGTCTGTCTTAACTGTTTGCAGCCATTGTGGTTTGGTGGTTGAGGGGTTACAATACTTTAAACTGATGAAGGAGAAGTATAGATTAATTCCAAGGGAAGATCATTACACATGTTTGGTTGATATGTTGGGACGCGCTGGAAGGCTTGAGGAAGCATGGAATTTGCTGGAAGAAATTGATGTTGGAGAAATGAGTTCTAGAGGTACCATTTGGGCCGCAATGCTTGGGGCATGTCAATTGCATGGGAATGTGGAAATGGGAAGGAGGGCAGCTAAGAAGATGTTAGAGACAAAGAAACAAATTTTGACGACTCATATTGCACTTTCTAATGTTTATGCCGGGGCAGGGATGTGGAATGAAGCGTATAGAGTGAGAGAAAATTGGAGCAAAGAAGGTGATGTTAATGGGGAGCCAGGTCTTAGCCACATCTGCACAAACCTTGTGGTTTCTTGA\n>JX292766.1 Haloferax sp. 
SSIN2 16S ribosomal RNA gene, partial sequence \nCGCAAGTGCGATAAGGGGACCCCAAGTGCGAGGGCATATAGTCCTCGCTTTTCACGACTGTAAGGCGGTCGTGGAATAAGAGCTGGGCAAGACCGGTGCCAGCCGCCGCGGTAATACCGGCAGCTCAAGTGATGACCGATATTATTGGGCCTAAAGCGTCCGTAGCCGGCCACGAAGGTTCATCGGGAAATCCGCCAGCTCAACTGGCGGGCGTCCGGTGAAAACCACGTGGCTTGGGACCGGAAGGCTCGAGGGGTACGTCCGGGGTAGGAGTGAAATCCCGTAATCCTGGACGGACCACCGATGGCGAAAGCACCTCGAGAAGACGGATCCGACGGTGAGGGACGAAAGCTAGGGTCTCGAACCGGATTAGATACCCGGGTAGTCCTAGCTGTAAACAATGCTCGCTAGGTGTGACACAGGCTACGAGCCTGTGTTGTGCCGTAGGGAAGCCGAGAAGCGAGCCGCCTGGGAAGTACGCCCGC\n>XR_004551154.1 PREDICTED: Pseudochaenichthys georgianus uncharacterized LOC117439437 (LOC117439437), transcript variant X1, ncRNA \nGTTTGGTGATGTTGTGTGTGAATTCCAAAAACAATGTGACAACAATAATGGAGTTTCCATGCACTAATGGATACTGATTCAACAAGCTCCGTCCATATAAACTGATGGTGAACAGAAAGTCTGCAGTCAGCTCCTTCACCACAAGAGGAGAGAGACAACAATGATTTCCATGCAGCCGGCGGAAGAGAGAGAGGGAGAGAAGAAAGCCACCAGCGGGTTCCCGGTCCAGAAGATCCAAAAGGTCCAGAAGATCCAGAAGAGCCAGAAAGCCACCAGCGGGTTCCCGGTCCAGAAGATCCAGAAGATCCAGAAGAGCCAGTGTGCTGGACCGACTTGTTTGACTGTGACAATCCCAGTGGCTCAGGGGACTGGGAGCTTTTGAAGGACCTGAGGAAAGAAAACCCAGGAAAGATCTGTGAAAACCCTCTGTACATAAAGGTTGTTATCACTGACACGATGACCCCAGCCATCTCCACAGGGCAGACCTTCTATATCTTCAATCCGACTCAGGGATTTGTTTTCCGCAACAAGGACCAGAGTGAGGGCATGTGCCGTGACTACAAAGTTCGCTTTGGGTGCCCGTGCAAGAATTAAGCTGCAACTCCACAGCAAACATCCAACAAGAATATGAAGCTTTGATTGCTTTAAAATGTTGTCCTTTTCACTTTACCTTTCTATTTTATATCTTACTTTGCCTGATGGAAGAAGTTCAATGGACCTTTTTTACGGCAGACATGTTGACTTGTAGCAGGAACAGGACCATGAAGCCTCATCAGTTGATTAAAACTGAGCTTTATATCGGAGTATGTTTTACGCCTGTACGTTTACCAACATGTCTTCCGAGTTAAGATGCATCATGTCATGTGCTTTCTCAAAAAAACCTTTTTCTAGTGATCATGAAATCATTGTCTAATGTAGGAAATA\n>NR_045871.1 Mus musculus RIKEN cDNA 4930428O21 gene (4930428O21Rik), long non-coding RNA 
\nACAGCAAGAGCTTCACTGCTGCAAACCAAGTATGGCTCCCACTGTCACCCAGCACTTGGGAGGCTGAGGAGAGCCCACGGATTTGGCAAGTCTGGATAGCCAGCTTGTCCCTGGGATCCTCTGCTCCTCCCGCCTGAGATCTAGCACGGCAAGTGGACTGCCACATCTGCCTGTGGACCTCCACCACATCTGCCTGTGGACCACCACCACATCTGCCTGTGGACCACCACATCTGCCTGTGGACTACTACATCTTCCTATGGACCTCCACCACATCTGCCTGTGGACCACCACATCTGCCTGTGGACCACCACCACATCTGCCTGTGGACCACTACATCTGCCTATGGACCTCCACCACATCTGCCTGTGGACCACTACATCTGTCTGGATTTTATTGCATGGTGATGCTCTCGGCTTGGGAGTGAATCACAGCAAGAAAGCCCTGCATCGTAGGTAGCTCTCCTCGGTACATTCCTGACTCTCTTTGGCCAAAGGATGGAAATCTCTGAAGATAATGACTCTTCTGTGACTTCTCTCTTCCTACTTACTTCTGTTGGGTTGAGTTCCCTTGTGGCCTGCTGATTGGCCCTGGCAATGTACCTGTTAGTGGTGGAGGGCAGTTTGGAGAGTTACTTCCACTAAGTTGATAAATGCCCTCCCCCACAACGGTTTTCTAGACTCCAGTCACAATCAACACCTTCTTTCCAAATTCCCCAACCACATTGTTCAGGAAGCAGAAGCATCTAGAAGCCACAGGGAACTGTTGGACTCAACCTGTAGAAAACTGGATGGAGGTTAGCTAGCCCTCCCTCCCGGGAGCTCCGACCTACTCCAGGGTGAAGAAAGCGAACTTGTATTGTGTAAATTGTACCCAGCACTGTCTCAGGAAGTACCGTAGCTTCCTGATTGTGAATGCAGATAATAAAGTGTAAGGCCGTAGCGGCTAAGGACGAAAGCCACCAACCCACCAAAATGTAGAAAATGACATTTCTAAGCCTCAGGTGCAGGAGAGTCACTATAATGGTTAGGAGGCCTCAGGCAAGGAATTGGTTTCCTGTCTTAAGCAAAGATCACTGGGAGCTTTGAGAATGGCAGGGAAGGGTTGGGAGACCTCTCCGCTGGTCTCACACAACCGTTGGGTTTCCAGGGAGTCAGGACTGCTACTTGCCACTTCCGCTCCCCTATTTTCTAAGAGAAATTATGAAACAGAACTTGATAAAGAAAAAGTAAATTTATTTACAGCTGGAAAAAACTGGGGAGAAAGAACCTAGTTTCTTTCCTCAGTGTCTATGGTTAGGATTTTTCAAAACCCCTAAGACACAGGCCAGAATATTGCAGATTTACCTCTGACAGTTAGGCTGGTCTTGATCTAGGGGCAGAGTGACTCAGCCCTGGGTTGCCCGTACTCCCGGCAGGCTGCCTGGTGCTGCTTCTGCCTCCTTCATACACACAAGCATACATGCACATGTATGTATTATATACACAAACACATATGAACATATATGTATTATACATATAAGCATACATGCACATGTATGTATTATACACACCAACATATATTAACATATATGTATTATACACACACGCACACATATGTATTATACACACAAACATACATGCGCATATTTGTATTACACATACATGGTTATTAGACATTTGAAATATGAAGAGTGTGAGGAGCTGGTTTTAAAATTTTAAAATGAAAATTTATCATTTTAAAATAAAAAAATTATTTTGAG\n>XR_004558147.1 PREDICTED: Thalassophryne amazonica uncharacterized LOC117501971 (LOC117501971), ncRNA 
\nCCCTGAGCCTGGTTCTGCTGGAGGTTTCTTCCTCATAGACAGTTTTTCCTTACCACTGTCGCCTGTGTGCTTGTGCCAGGTGTTGGTAAGGTTAGACCTTTTTTGTGTAAATCGCCTTGAGGAAATTTTGTTGTGATTTGGTGCTATAAAAATGAAA\n>XM_018405618.1 Kwoniella dejecticola CBS 10117 hypothetical protein partial mRNA \nATGGCACCTGTAAAACCGGTGAATGGCAGTGACAAGCAAGTGAAGAAGAAGCGGACTTTCTTCGCGTCGAAATTAGCCATACCAATCCCTCCAGCAAGTGCGACGGAAAAGGGCAAACAAAAGGCAGTAGTGGTGTCTACAAAGACGGTACTTAGTGCTTTGGATGGATTGGAATCTGTGTCTAGATCAACACCTATCAGTAACGGTAACAGGAGGGATCAAGAGAAACGCCCCACTGCAACTCACACTCCATCTCGCGCGCAGACCGTAACATCGAAGCTAGTACAAGATCCCAAGATCTACACGAGGAGAAACAAACCGAAGGTTCAAGCCACAATCACCCGGAGCTCAGAGGTCGGTGGGAATGTCAAGAATGGCGTAGATGGTAAAATCAAAGTGAAGAGTGAGCCTTCAAGCTCGGTATCAGCTTCGTCTAGTAGGCTCGTGAACCGGAAGAAGGATGTCATCAATGACACGGGAAGGGTTGCGAGTGCTATTGAGCCGCAATCGAGTTCATCGTCCTCGTTTGTTGTGGGGAAGCATAAACACCTCAACGTGAAAACGAAAACCAAGTCGAACTCAAAAGTGGGTCCCAGTGCTAAAGCCAAGATCATTACCATCAAATCATCTTCGTCTCGCAGAATACCACATACCACCCTCAAATCCTCTTCCAAAACCAAGAGCGCAAAGACGACCACGCGTTCATCTGGCTCTGCGAAGACTTCAAATAAAGCTACACAGGTGCGGGCGATCCTGTCGAGGCGAATCATCAGAACTTATGAAGCCAAGTCTCAAACCAAAAGCGAACCCAGTCAAATAAAAGGAGGAATCTCTAGTGGGAGTCCAGAAAAGCAGGAGAAAGGGAAAGAGAAAGAGAAAGAGGGCAAACCGTTGAAAAAGGATTACATGTCAGCTGGATTCTATTGCCAAGATCCCCATCCTTCGTCTTCAAAGCAATTACACAACAAGATCTTAGCTATCCGTTCGGCGGAGAACAAAGCCTCAAAGTTGTTAGATGCAAAGGCAAAGGCAAAAGCAAAGGCTACTCCGACCATAGTGCGCCAAACGAGAAATAACGTCAAATCACATTCGAGCGAAAGTCAGAGTGCGAGTGCGAGTACGAGTACGTATACGAGTACAGCTCAATCCAGTAAGAAGTCAGTCGATCAGGAGAGACCGAGTTTCCCGCCGTTACCGTACGATCATGGCTACGACCTGTTCTTCAAGCAGGAGCACGAGTTCGTGTTGCCGTACCATATCATGAAGGAGAAAGAGGATGGAAAGCTGGTGGCGAAGAAGAAACCTACTCAATTTACGAAGATACGAGGGAACATATACCCCGAACGACCAAAAGTCATGACTGATTTCCATGCGATATGCAAATGCTCGCCGGAATCGAAATGCGCCGATCAATGTATAAATAAGTTGATGAGTTATTTATGTGGGAAAGAATGTCCTGCAGGAGATGAGTGCACGAATAAGACTTTGACTAAGAGGAAGGCGGCGGCCTATAAAGTGGCTGATACCGGGACAAGGGGTTTCGGGATCATACTGCTGGAAGACGTCAAAGAAGGGGATTTCGTAATGGATTACAGAGGAGAGGTGATATCGATAGACCTTTTCATGGACCGCATACAGGATGAGTATAAGGGCACGAAGAATTTCTATGCGCTAGCGTATGATCAAGATGAAGTGATTGATGCGGGGATGAAAGGGAATGATGCTAGATTCATCAATCACGGCTGCGCGCCCAAT
TTGGAAGTACGGAAATATCAGACCGCCGGGGATGGGTGGGACGAATTTGAGGTGGGCATGTGGGCTATTAAGGATATCAAAGCGGGAGAAGAGCTGTTTTACGACTACAACTTCGAGTCATTCGGAGTTGCCGCTCAGTCCGACGAACTACGCACGAAATGTCATTGTGGAGCGCCCAATTGCGTCGGGTTCTTAGGTAGAAAGGCAGGAGAGAAGTCGGCGAAAGAACTTGCAGCGGAATTAGCTAGGAATGCCAAGATCCTGCAAGGAAAGAAGGCGTCCATCAAGAAGCTTAAAAGTAAATTAGCGGAAAAAGCTCAAGCTGAATCTCGAAACGCGGCGAAGCTGGGTACGACGGTATTGGGTTTGGAAGATACCCCATCTATCATTTCTAATGCCGATACAATCACTACCACTTCTATCAAGACGCCTTCTCAAATATCGCCTTCTCGACCGCAGATTAATGCAAGGATGCCTTCGTCTTCCCCACTTTCCGAGCTGGATCCCGTCGAAGCCGAAAGCCAAACCAAAGGTTTGCCTAAGGACAAAAAGAGGAAGAACGAGATTTTAGCCACAACGGAAGCGGAGACTAAGAAGAAAAGAAGGAAATCTGAACCTTTACCAATACCCAAGAAAGCGACTAGCAAACCGCGCAAATCTGAGCCTTCCGCAACAAGTGCATCGACATTGAATTCGGCAGTGCGAATCAAGAGTGTGGGTAAAAAGGCAAGGAAGTCAGAACCGATCCCTACGTCTACCGTGAAGAGAGATGAGGATGAGAGCGAGGATGAGGCAGAGAAGAAACCATTCAATAATCCTCGAATCTGTATGGATGCCGTCCGAGAGGCTGCTCGAATCAAGAAGGCCGAAGTCGTGAAAGCTAGGAGGGGGGCGCCTAAGGGATGGACAATCGTTTTACCGGGACATGAACCGCCACCTAGGGCCGCACCGCTCGTCGTGTCGACTAGGAAACCGCCCAGAGATAGGTCGAGCTTGGGGTGA\n>GU637646.1 Uncultured bacterium clone RW2302 16S ribosomal RNA gene, partial sequence \nATTGAACGCTGGCGGCATGCCTTACACATGCAAGTCGAACGGTAACAGGCCGCAAGGTGCTGACGAGTGGCGAACGGGTGAGTAATACATCGGAACGTGCCCGATCGTGGGGGATAACGGAGCGAAAGCTGCGCTAATACCGCATACGATCTGAGGATGAAAGCGGGGGACCGTAAGGCCTCGCGCGATCGGAGCGGCCGATGTCAGATTAGGTAGTTGGTGGGGTAAAGGCTCACCAAGCCGACGATCTGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGAATTTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGCAGGAAGAAGG\n>XM_023804680.1 PREDICTED: Paramormyrops kingsleyae potassium voltage-gated channel subfamily H member 2-like (LOC111840147), transcript variant X3, mRNA 
\nAAGGCCAGAGTCGCAAGTTCATCATCGCCAATGCGCGTGTGGAAAACTGCGCCATCATCTTCTGCAGCGATGGTTTCTGTGCCCTGTGCGGCTACACGCGCTCGGAGGTCATGCAGAAGCCGTGCACCTGCGACTTCCTGTACGGCCCACACACCAAGCGGCTGGCCGTCGCACAGATGGCCCAGGCGCTGCTTGGCTCAGAGGAGCGGAAGGTGGAGATCGCCCTCTACAGGAAAGACGGCGTGTGCTTCCTCTGCACGGTGGATGTGGTCCCGGTGAAGAACGAGGATGGCATGGTGATCATGTTCATCCTGAATTTCGAGGTCATGAGCGAGGAGAAGCGCAGCGAGTCCAGCCGAGAGCTCAACCACAAGCTGTCCATCCCTTGGCTCTCCGCAGGCCGCTCTCGTGGCTTCAGGGTACGCCTCCCGCTCCTGCGCTCCCTGGCCAACAGCAGGCAGTCCCTCCAGGACGACCCCGAGGCAGCTTGTGTGCCAAGGGCCTCCCACCCCAGCCGGGACTCCCTGATGCTGGACGAGCTCATCTCCCTGCCCGAGCCGGCGGGCCGGAGGGCACTGCTGGAGAGCCAGCCCCCAACACCACCACCGCCACCGGCTGCCGACTTCCCCGTGCATCCACACCACCTCGACCCAGACGCTTCCGTGTCCAACTGCAGCCTGACTCAAAGCCGCTCGCGGGAGAGCTTCCACAGCATGCGGCGCGCCTCCTCCGTTGACGACATCGAGGCCATGAGGCCCGAGTGGGAGCGCAAGGTCCGCTCTGGTAGCACAGGCGCAGTGAACAACAAATCAAACATCCTCAACTCTACCTCGGACTCGGACCTCATGCGCTACCGGACCATCAGCAAGATTCCACAGATCACCCTCAACTTTGTGGAGTGCAAGCCGGACCCCCTTATTGCCCTACCTCCTGGGGACAAGGACATCATCGCTCCCTGCAAGCTAATCGACCGCACGCACCACGTCACAGAGAAGGTTACCCAGGTGCTATCACTGGGTGCCGATGTCCTCCCTGAGTACAAACTCCAGGCTCCCCGCATCCACAAGTGGACCGTCCTGCACTATAGCCCCTTCAAGGCGGTGTGGGACTGGTTAATCCTGCTGCTGGTGATTTACACGGCCATCCTGACTCCCTACTCTGCCGCTTTCCTGCTGAGCGACCAGGATAACGTGGCCATGGAGAGCTGCATCTACACCTGCACTCCGCTTAGCATGGTGGACCTCATCGTAGACATCATGTTCATCATCGACATCCTCATCAACTTCCGCACCACCTACGTCAACATTAATGACGAGGTGGTGAGCCACCCCGTCCGCATCGCAGTGCACTACTTCAAGGGCTGGTTCCTCATCGACATGGTGGCGGCCATTCCCTTTGACCTTCTCATATACCGCAATGGGGAGGAGACGACCACTCTGATTGGCCTGCTGAAGACTGCCCGCCTACTGCGGCTGGTGCGGGTGGCTCGCAAACTGGACCGGTACTCGGAGTATGGTGCGGCGGTGCTCTTCCTGCTCATGTGCACCTTTGCCCTTATCGCCCATTGGCTGGCCTGCATCTGGTACGCCATCGGCAGCGTGGAGCGCAACGGCTCCATTGGCTGGCTGCACTCTCTGGCCGACCAGCTGGGGAAGCCCTACAATGAGACCATCCAGGGCTCGGGCCCGTCCATCAAGGATAAGTACGTCACAGCACTCTACTTCACCTTCAGCAGTCTCACCAGCGTGGGCTTCGGCAACGTGTCGCCCAACACCAACTCGGAGAAGATCTTCTCCATCTGCGTCATGCTCATCGGCTCCCTGATGTACGCCAGCATCTTCGGCAACGTGTCGGCCATCATCCAGCGGCTGTACTCGGGCACGGCGCGCTACCACACGCAGATGCTGCGGGTTCGGGAGTTCATCCGCTTCCACCAGATCCCCAACCCCCTGCGCCAGCGCCTGGAGGAGTACTTTCAGCACGCCTGGTCCTACACCA
ACGGCATCGACATGAACGCGGTGCTGAAGGGCTTCCCCGAGTGCCTGCAGGCCGACATCTGCCTGCACCTGAACCGCACACTGCTGCAGAACTGCAAGGCCTTCAAGGGCTCCTCCAAGGGCTGCCTGCGCGCCCTGGCCATGCGCTTCAAGACCACGCACGCCCCGCCCGGCGACACATTGGTGCATGCCGGCGACGTGCTCACCGCCCTCTACTTCATCTCCCGCGGCTCCATCGAGATCCTGCGCGAGGACGTGGTGGTGGCCATCTTGGGTAAAAATGATATCTTTGGTGAACCCATCAACCTCTACGCACGTCCTGGGAAGTCAAAGGCAGATGTGAGGGCACTGACCTACTGCGACCTGCACAAGATCCACCGTGAGGACGTTCTGGAGGTGCTGGACATGTACCCTGAGTTCTCTGATCACTTCTGGAGTAATCTGGAGATCACCTTTGACCTGCGCGACACTAACATGATTCCCGGCTCTCCGAGCAGCGACGAGTCGGACTGCATCGGCTTCAACCGGCTGCGCAGACGGAAGCTGTCCTTCCGGCGCAGGACCGAAAAAGATGACGAGAAAGCAGGTGAGATAAAGAAGTCTCAGAGGCCAGTCCGCCGGGCAAGAAAGCAGACTGTCAGCAACCAGACAGAGGGCTGTAAGGTAGAGTGGGAGGGGCCACGCAGTTCCGTGTCTTCTCACTCCAGTGGGGAAGAGGGGGAGGAGTTACTTCTCACCTGCCCCGCCCCTCCCTCCGCCCTCCTGGAGTTGCCAAGGGAACTGGGGACACACGTCAACGTGAGCAACGCTCCGGAGGTGGACGGGGATCCTAAGACTGGCAGCACCTGCAATGCGCTCTCTGGTGCGTTTTCCGGAGTGTCAAACATCTTCAGCTTCTGGGGTGACAGTCGCGGCCGGCAGTACCAGGAACTGCCCCGGTCCGGTCCGGCCTCCTCTCCCACATCGGCCACGCCGACCCACGGCATGGCCCGCTGGCAGCGGAGCCAGGTGGAGAACCGTCTAGAGCTGCTGCAGAAACAGCTGCACAGGCTAGAGATACGCATGTCCACCGACATCAGCACCATCATGCAGCTGCTGCAAAGGCAAATGGTCCTGGTGCCCCCTGCCTACAGTACGGTGACGTCCCCCCCTCAGCCCTCGCCCTGCTCCGGCCCCGGGGAGAGGCTGGTCCAGCCGGTCCCCCCACTGGAGCCCGACACCCTGCAGTCGCTCTCACAGATCCTGGTCTCCCAGAGCTCTGAGGGACCCTCTGCCAGGTTATGCGAGTCCCAGAATAGTACGGTGGAGCCTCAACCCCCGGGTTCCCTAGGAACCAGGAACCAGGAGGCAGGGCTCTCTGGCCTGGCCGGTCCCCAGTACTGGCTGGACGGGGTGACGGGGACCTCCGCGATGGACCCCGAGGCACAGCGGAGGCTGTCGCTGCCGGGGCAGCAGGTGGTTCTGGATTCACGGACGCCGCAGAGGCACATCTCTGACCCGGGGAGCTAGGTCCTCCTTGGAGCATCTCATCCAGGTCTTCCCTGTAGTCCCTCCACGCCGAGGAGGAGACCACCAGTGCTCACCACTTCCTACTCGTATTTCCATCAGCTGTGGGAGTTTCCTAGGGTGCTTCCCACCTACCTTGCACAACACTACCCCACTTACCCCTCTTCTTGGCTGACTTGAGGAACCACTGGAGATTAGAGTTTAGACCCATCCATCTCCAGCTCATTGTCCTTCACAGCAGGTCAAGACACTGCAAAGCGTGTAGTGAAGCGAAAGGCTACACTGGATGGACTTTCCCTTTACTGCTGAGACTGGCGTTGGAACAGTGAGACAAACGTGCACAGCGTAGGCACTCAGCCCACCTCTCGTCCACGTTGCTTCCTGACATTGTTAGTGAACTTCTGCGTTAGCTGGCCTAACAGATGTGTGGCTGCTGCCCCCTGGAGTCCATTTCCCAAAGCGCATCCACCAGATGGAATGTGGTTTCTAACTGTT
GCTGTAGGGGAGTGGGGTGTTCAAAGCCATTAATTACTGGTGAACATATCACATTCTTAAAATAAACCTTGTACAGATTTTGAATGACAGAATCCTCGAACCATATGCAAACTCAGCAAGAGAAATGTTAAATTATTACAGGAGTGTGTCGATTTTCAGTCCAAAGGTTTGCTGAAGTTTGCTAAGGCCTGTGGATCGCAATTCGTCCGCGTGGTGATCTGCTGGATCCTACTACAGCAATATAATATATAGAGAAAGAGTTCTTGCTCATGAAGACTGTAGTTTTCTGTTAATCACCTTCCATGTCTTCTTGATCCATTCTCTTGGGCGGGTGGTCCTTCTCCCTACCTCCTTCTGGAGATAGTCTTCAGAGTGGCATAGAAGAACTCCTCTGGTGTTCATCTTGGTGAGTGGATGGCAGGTTGTACTTTGAAAGATGGTTGATTGTAATGTACTGCGTTGCACAATGAAATGAAGGTATGTATTGTATGTTTTTTATTTCTTGGGTGTTGTATCTTCTTCAGTAATCAACACGTATTCTTCTGTCGCAAAGAAAAATATCAGAATTTCTCTTCTGATGGAAGAATATGCACTGGATTTTTGACAGTCTTGTGGATCCTTTCCCAAATCCATTTCTGTGTAGTGAAAACATGGCAAAGCAGCTTTTAATTGGACTTAATCCTCACCAGAGATTCCATTTGGTCGAGTTACACACCTCAGTTTGTAATGAACTGTAACAAGGTAAAATTTGAGCTGTCAATCTACTGTATGACCACATATTTGCCAAACCCCAAAATCTATTGGAATTATGAATATTTTTTCCTGTGTATTAGTATGTATTTTTACAAAGTTCCTTACCCAGACTGAACATGAGTCTGAAAATTCACAGCTTGTCCATTATAAAAATAAGCATTGATTTGCATTACTAGTCCTGGGCATTGATATTAACATTCAGTCCAAAGCTGGGCTGTCGAATTCCAGTCCTGACAGGCAGCAGGTTTTTGTTACAGAAGAGATTTTATTAATTAACAATTCATCGATCCTCCCCATCTATGCCAGGCAGCATAGGGCAGATGCCAGGGGTACAGCCTCGATGGATAATCACACTCTGTGGGTGATGTGAAGGTGACACAGAAGTATCAGGTGACAGGGCTGCCTAATAATTTTACAGCAACTGATTTCCTAATTTAGAAAAAATAAAATAAACACGGTTCAAAAACCAGCATCTTGGTTTACAAACTAAACACATTGCTTGTAGACCCACTGCAGTTTAATTTGAATGTGTCTGTGATTTCATTTGACCCTTTGGTCAACAGTAAAGTTGATTATAGTAAATTTACGGTAAAGTAGTTTACACAATTGAAACTGAACAGTAAACCTCTATTGGAACTTAAACCAGAGTACCCTGCAATTCCGTCCAGGACTTAAGTTTCACAGCCCCTTGCAGCAATTCCAAATGCCTTGCCAGTCCCAAAGTAGAGTTTAACTGTTTATTTTCAAATGAGCATATTTTGTGTTTTTAAAGACTTTAACCAGACCTTTACAGCCATTATTAGCATAACCTGTTAATCCCATGAAGCTGATTCAGTTATTCTTGGCAGGTATGAATTTTAGTGTTGAAAGACGATGGGGGTGAGGTATTAGTGACCCCCAGTGATATAGTATTGCACAGTGGACATGTGTAAAGTGTAAGCCAAGTGTTTCTCCCATGTCTGAGGGTCACATGGACTTCTGAGGCACTGTATAACATGATTTACCAATTAACAGAAACCTCAGTCCTCAAATTGTGTTTTAACCTGTGTATATGTACTTAATGTAAAGACATTAATACTGCTTTAGTCTGTAAGAAAAAAAAACATTTAAGCACATGACAGTAACACCACTGGAGTTTTCTATCCCTGATGCCAAACTGAGGGATGATTTCACTTTCCACTTCAACCTTCACGCAGTACTGTAAGATGTCCACTGTTATCCTGTGAATCAGATTGTCTTGTTTCCTC
TGATTCAGGTCCATTTCCTTTCTGTACTGCTCTGATACTTGCCCTATTGTTGGCAAACCGCTTACAACTGTAAGTCTCAGCTTAATTTCTGTCATAACCTCGGACCTGTATCATAAAACAGGATTTCTTGGTTAGCTCGATGACTTGTCAGATTTAAGGTAGTCTGGGCTAAATGTATGTGAACAAAGATAAAGTCCATTTAAACTGGGCTACCTCAAATCTGACAGGCTATCCAGTTCAGCAAGAAATCCACCTTCATACAGGCCCCTGCTGTAAAAGTAGCTTTGTTCTGAAGTATCCTCACACGAGGATGTTTTGCTTCCTCAATTCATTCAACTGGTTCGCTCAGGCATTTGAAAACCGTACTGGCTGTCACCTTAACAAACAAAACCTAGGAGCTGTAACGCAAAAAGCAGGATTTCTTGCTTAGCTAGATGACTTGTCGGATGTACCCCGGTTTAAATCGACTTTATCTGTGTTCACTTACATTTAGCCCAGACCACCTTAAATCTGACAAGTTGTCCGGCTAAGCAAGAAATCCAGCTTCGTGATACCAGCCCGCAGTCTTCATCTTAGTACAGGTATCTGCAACAAATCACCTGTAACATAATTCTTACACTGCCTCCTACAAAGGCACACTGCACCCTTTAACGTCTGGAAGATTGTCATTTAAACCTGATGCCTCTCAGTAGACGAGACTGTTTTCATATCGACGGATGTTTCTGATATAGGTCTGGCATTTGTAGATACTCTGACAAATATTTTTCCCTAAAGTAAGTCTACACTAGATTTTTTATTGCCTCTTCCCTGTATATGAGAATCTTGTAATTGAATCAGCCTTGGCACTCTTGTAGCCAGCACTATGCAGAAACTGTCATATCCGTGGCATGCTCCAGAATGCAAACTGTAGAAGCGTTTGTCCAGTTTTTAATAATCATATTCATGATTATATTAATATTAATAATAACGGTGATGGTGCCGATCAAAATAATGAAGATGAAAAAAAATAAATAAACGTTGTGCACATTTTATTTGCATGCTGCACTGAAAATGGAGGGACGAGATTAGCTCTGGGCCACTGGTTTCTGGATCGCCTGATCGGCACGCGTTAAGATGCTGTGTCAGAAAGCAGTAAATGCATACTAACATGCCAGAAGGAGACCTGAAGAAGAACAGTGAGCCCAACACCTCAAGGAGAATTAATTCTATAGCCATGTTTATATCAAGCACCAGTGAATTGGAGGAAATAAGCTATGGGGTCTTGACTGTGTGATGGTACCATAAACGGATGAAATGTCCAACTTTTCCTTCAATAAACCTCTTTGAAAGCAA\n>XM_035091360.1 PREDICTED: Chelonus insularis ras-related protein Rab6 (LOC118071888), transcript variant X2, mRNA 
\nCGTCACTTCCCAGTCAAACGTGGCGGCCGCGACAGGAGAACGAAGGAGTGGCTGTACGATCTGTCAAGTTGCTCAGTTTTCATTGTGTATTTAATGTTTTTTTTCGTAACTGGATTAATAATTGTGTAATTACAAGTAGATCCAGTAGTATTATTAATAAAACTCATTAGAAACATGTCGTCGTCGGGTGATTTTGGTAACCCGTTGAGAAAATTCAAGCTTGTGTTCCTAGGTGAACAAAGTGTTGGGAAGACTTCTCTTATTACACGTTTTATGTATGACAGCTTCGACAATACTTATCAGGCTACAATAGGGATAGATTTCCTGAGTAAAACCATGTATCTGGAAGATAGAACTGTTAGACTGCAGTTATGGGATACAGCTGGTCAAGAGAGATTCCGTTCTCTAATTCCAAGTTATATTAGAGATTCTACCGTTGCTGTCGTTGTTTACGATATTACTAATGCTAATTCATTTCACCAAACATCAAAATGGATTGATGATGTACGAACGGAGAGAGGCAGTGATGTTATTATTATGCTTGTTGGTAATAAGACGGATTTGAGTGATAAACGACAAGTTTCAACTGAAGATGGAGAGCGTAAAGCTAAAGAATTAAATGTGATGTTTATTGAGACTAGTGCTAAGGCAGGATACAATGTCAAACAGCTATTCAGAAGAGTTGCTGCAGCATTGCCTGGTATGGACTCCACAGAAAATAAACCTCCAGAAGACATGCAAGAAGTAGTTCTCAAGGATACACCAATTGAACTCAAAGCGTCGGAGAGCAATTGTTTATGCTAAATCAAGATAAGTCATAATAGACAGACTTACATTTCTACACTCCATAGACACGAATTAAACAAAATTATAAACAAGATTCGTCGTCAATTGGTGCGCTAACGATCTTGACAGATCACAATTGTAACAATAATTTTTACCCACATATTAAACAGTGCGATTTTTTAAGAGTGGTGCACATATCCAATATTTTGTATAAATTGCTCATTAATTTTTATTTCCGGGAATCATTCGTTTTTATCAGCATTTACAAATGATGAGATCAATTCTTTGTACTCATTTTTATCGCTTTATCCATGCTATTCATCGTGACAGCCACGGCACTAATAATTATACATTAATCATTTATACAAAAGCAACGATTAACTATTTTCAAATTATAAAATTCTTATTGATCACTTTCGTTATCAATTTATATACATTTTCATATTTACAACAAAA\n>XR_006035448.1 PREDICTED: Aricia agestis torso-like protein (LOC121725853), transcript variant X2, misc_RNA 
\nGTCAGTTGTGCCGCGGGGCGCGTGTTGTCGCGATGTTTCTGTCGCGTCGTGCTGTCGTGTTGCTGTCGCTGTGTTGTGTTTGTTGTGACGAGGACCTGGGATACACTCTGACCATCGGCAATGCTATTGACGTGTTTGCCAACTACGGTGACCTGTCCCAGGTGACGCAGGTGGTGTCAGCAGACTACGATGACAACGAGGGCTCGGAACCCTTCAGGGAGAAGAACATCAGACTGTTTGAGAACATCAGCAGCCGCCAGACGCCGGGGGATTCCCACTTCGACATGAACATACAGCTGTGCGAGACCTTCGATGACTTATTGGCAGTGTACTTCAAGAACTTCAAAATAGAAGGTACAGACAAACCATGGAAGGCTTTCTTAGGAGATTGGATACTGGACGAGATCATGCGGACTTTCGGTATCGAGTACGACGCGCGGCCTGACAACTGCTGCTACGTGCTCGTGAAGTTGACCAAGGTCCACACTGCGGTGCAGGTAGAGTCAATGGAACGAGTCCGCGTGCGGGAGTACGTACAGCGCGCGGTGAACAGCCTCAACGTGAGCGACGGCGTCGCGATCAGACAGTTCATGAAGAGCTACGGCACGCACTACATCGAGTCCTTCGCGACCGGCAACTTTATATACCAGGTGTTTAAGTACAAGCGGTCTGGGTACAACCGTCTGAAGGCGTACATCAGGCTGCGGGAGAAACACCAGATCAACTCCGACAGTCTCAGGTTCTACTTCTCCTCGTACTTCCTCAAGCAAGTCGGAGATATCCGAATAGCAAGCGGCAACAAAGTAATAGAGGAGTGGGCGCGAGACAATCTCAGAGACAGCCAGTATCTTTTCTCACGACCGAGTCTACTCCGACTGCACTTCAACCCAATACTGGCGTTCAAACTCAACGAAATGCTGGACAACGGAGCGCTCCTATCGTTGAGTTTGAGAACACTCAAACCGCTATTCAAAGACGAATACAAAGGAAGGGTATTTGCGGAGTACGTGGAAAACGATATGAGGCTATGGGAAATCAATGCTTAGATTTGAAATTTTGTAGAAAGAATGACATGGAGTTAATTTTCAAGATGCAGGTACGGTTAAATAGTCAATACTTATGACGAGAGTATGAAAGAAATACAATGGTGAGAATTATAATAATAGATTTTAAATTTTTAATGTTGGTGAAATATTTACTTAAGTTCACCAATAGATGGCGTAACGTTCATATAGAATTAAAAAGT\n>XM_009873997.1 PREDICTED: Apaloderma vittatum cytoskeleton-associated protein 4 (CKAP4), mRNA 
\nATGGGGGTTGCGGTCAGTTCGGTGCGTTCCCTTCAAGCAACTTTTGGAGAATTTGAATCCATGATGAAAATTGCTCAGCAGAAGCAGGAGGTTACTGAGAGGGCTGTTAAACAAGGGGAGAGTGAAATAAACCGGATCAGTGAAGTGCTTCAGAAGCTGCAAAATGAAATTTTGAAAGACTTGTCTGATGGCATCCACATGGTGAAGGATGCAAGGGAACGAGATTTCACGTCTCTGGAAAATACAGTGGAAGAGAGACTAACAGAACTAACCAAGTCTATAAATGATAACATTGCTGTATTCACAGAAGTCCAGCAGAGGAGCCAAGATGAAATCAACAATATGAAAGCAAAGGTTGATTCACTAGAAGAAGCAGATGTGTATAAACAGGAAATTAAGGTGCTAAAAGATGCTTTTGCTGAGATGCAAGCATCCATGAAAACCAAAGAAAAGGACATAGAGACCTTGAAGAGTACAATAGACTCCATGGAGTCTGATGTGTACACTGAAGTGAAAGAGCTAGTCAACCTCAAACAAGAACACGAGAAATTCAAAGAGGCGGCGGACACTGAACACCTTTCGTTGAAAGCTTTACAAGAGAAAGTTCTGAGAGCTGAGGATTCTATCATGCAGCTCCCTGGTGACATTAAAAGACTTGATGAAGACTTACTGCAAGTTAAAGCTGACCTTAACAAATGGGAGGAAAATGAACTCTTCAGAAAAGCACTAGAAACTTTCGGAAAGAGCAGTGAAGGGCTGGAATCTCGATTGAGGCACATAGAAGACAGCTTGGAATCTCTAACATCTGTTGCTGCTCAAAACAGTGAAAAGATGCAATCCTTCCTTTCTAAGGAGGCAGAGTACGAGAATAAGCTCACTACCTTAGAACAAAGCGTTACTGCTCTTCAGGGAGTCTTCAATATGGACGTAACTTCAGTCACAGACACTTTGAAAAATCTCGGTGAATCGCAGACCTCACTGTACAATGACGTGGAAAACTTGAGGAAAAGCATCAGTGACCTGCCATCCTCTGGTGTTCTTCAGGATGTCCAGAAGCAAATTAGTACTTTGCTGGATCAAGGAAATCTTCAGACAGATCAAGCACATTCTCAAGGTTATCTTGACAAATTTTCTTCTGTGGAGGGCTCTGTAGATGAACTGAGATCTTCTGTCAGCCAGGTTGATTCCGATTTGAAAATGATAAGAACTGCAGTGGATAGTTTAGTCTCCTACTCGGTGAAAATTGAAAATAACGAGAACAACTTGGAGTCTGTGAAGAGCTCAGTAGACGACTTGAGGAATGATCTGGAAAGGTTGTTTGTGAAAGTAGAAAAAATACATGAAAAAGTTTAG\n>XM_014296803.1 Sphaeroforma arctica JP610 hypothetical protein partial mRNA 
\nATGGGTCAGAGAACGTCAACGCAGGTAGATAAGCTAGCTAAAGCATTCAAGAAAGGGTTAAATAGTAAGTTACCTGAAGCTCAGAATACAACCCTCGAGGCGTTATTGAAGGACATGCCAGAAGTTCACGATAGACTTATGACATTGTTTAGTGAAAGTAATGCTGTATCAGCAGCATCAGCAAAACGCACTTCGACGGGCGAACAAGAGTTCAATGATGATGAGCAAGGTCAAGAGACTGATATTGAGGGAGAAGACGAATCTCCCTTACAACGTGACATGGATACAGAAGAACTGATAAGGAGAAGTGTTAACGATGGGTCAGAGAACGTCAACGCAGCATCAGCAAAACGCACTTCGACGGGCGAACAAGAGTTCAATGATGATGAGCAAGGTCAAGAGACTGATATTGAGGGAGAAGACGAATCTCCCTTACAACGTGACATGGATACAGAAGAACTTGAAGTTCACTATTGGGTTGTACAAGATCACAATCTAAAACATGTTAGTGAACGACCTACTCTACGAGATGCCCAAGAAGAAGGGATTGATCATCCCAGACTCAGGGCGATAATACGTAAAAACTACAACTCCTGTAGGATTGCGAATATAATCAGATCAAGCGTTATGGATTCGCGCCACTAA\n>XM_018329607.1 Xylona heveae TC161 zf-DHHC-domain-containing protein partial mRNA \nTCAAAAAGGCACACTTGGTCTCAAACATCACGCTTTGCATCAAAGGCCAACACTTCTTTGGGGGGTGTCACCACCGGAAGCGAGATAGGGACAGAGTCAAGGAGACCTCAAAGTTCGGCGAGTAAAACGCATGTGCCATCGCTTGCTTCACATGCTTTCTTCCGTCCACTGAGCTCGCAGAGGCTTCAAGCTCAGCGAGGGCGTCCTTCGCCAGCCACCTTCGTTCCAGCTAAAGAAAATGTGCCTTTAAAAGACGCAGACTCTGAGATAGCGCATGAATTGGATTCAAAGATTAATCAGAAAAGGAACTCCGCTGTCCTTCTTGATAGTGAAAAAGCGCAGCCACCGTCAAGGGGTACTGAGTGCACCGAGTTCCATGGGCAGGAAATGATCACAGGCGAAGTTAGCCCTGCTGCTAATCGCACAGGCACAAGCACTGCCGGCAGTGCGCATCCTTTGACCCAAGCTTCTCTGGCACCCAATGAGCCGACCGGGACGGTCTTTCGAAGAGGCTCCGCCTTTTCGTCACCTCTCGAGAAAGATCAAGGCTCGTTTCGCTCAAATTTCCTTTTACCAAGTCAGAATTTAGAGCTTCGAGATAATCAAATCATCGGTCGAGAAAAGCTAGCTTCTGCAGATTCTTCGCCACAACTTGGGCCCTACGAGACAAATAATCACGTGAGGAGAGATTCGGAGCGCAATTATCAATATTTTCCTGGAAACACTGTCTTCTGCTTTGGCGGGAGGCTTCAAAATACCAAAGATCGACCAGTTAACATCGTCACTTTCGTCTTGGTCATTCTGCCCTCGGCTCTTTTCTTTGGTTTCTCTGCTCCATGGCTCTGGCTGCATGTCTCGCCCGCGATACCAATTTTGTTTGCGTACCTCTTCCTCATATGTGTTTCCTCCTTCACTCATGCCTCTGTTACCGACCCTGGGATACTACCGCGAAAAACCCAACCATTTCCTCCTGCGAATGATGCAGACGATCCTCTTACCCTTGGGTCGCCAACGACTGACTGGACTCTGATTAAGTCAGCTGCGTCGCCCACCTCTGCCATGGAGGTTCCAACAAAATACTGCAAGACTTGCAACATTTGGAGACCTCCTCGGGGACATCATTGTCGAGTTTGCGACAACTGCGTGGAAACGCAAGATCATCATTGCGTGTGGCTCAATAACTGCATTGGTCGCCGAAACTACCGATTTTTTATATCCTTTGTGGCTTCCTGCACGTGTTTAGGTCTCTTTTTACTCGGCGCCAGC
CTTGCTCATATTCTTCTATACGAATCCAGAGAGAGCATCTCATTTCGGGACTCAATCAGTCATCTGCGAGTCCCCTTTGCTATGGTTCTATACGGAGCCCTAGCGACGCCTTATCCCGCATCTCTTTGGGGTTATCACTTATTCCTGATGGCACGAGGCGAGACAACAAGAGAATATTTGAATTCTCACAAATTTTTGAAGAAGGACAGGCATCGTCCATTTACGCAGGGCAATATTCTGAGAAACTGGTTAGCGGTCGTCAATCGGCCGAGGCCCCCAACCTACATACGATTCAAGGAAAAACACGAGGCCGGTGACCAAAGGTTTAATCTTCGGAGA\n>AB364225.1 Uncultured bacterium DNA, ribosomal RNA intergenic spacer, clone: Amplicon22-5 \nCCGGAAGGTGCGGCTGGATCACCTCCTTTCTAAGGACGAAAAGCGGAAGCGCCGCGTTCGGCTCTCGAAGCCAAATGTTCTTCACCCGGAGGGGTGCTGGCACCCCGAGGGGGAAGGTTATTTGGCAGAAGAGAGCCAGGCGCTGGAGCTAGACAAGACGAAAAGTGGAGGCCGCAATGGCCAACTGTCGATACACAGCGCTTCTGTTTCGTTCAGTTTTGAGGGAACGAGTCATGTTCTCTCAATGACAAAAATCGTTCCTTGAAAACTAGATAACCGGAAAAGCGGAGGCGAGTGTTTCGCCGCGATGGGCAAATGTTCTTCGCCTGCAAGGGTGCTTGCACCCGGAAGGCGAAGGTTATTTGCCCCCGAGCGGCGGCGAGCCGACGCTAGACAATAAGGAAGAAGCCGAGAGCGCTGTAGGTTAAGCTAGAAAGGGCGCAC\n>XR_002421788.1 PREDICTED: Columba livia uncharacterized LOC110363588 (LOC110363588), transcript variant X2, ncRNA \nCTGCTCTGGGGATGTTCTTTGTGCCCTTCGTGATGTGCTGCTGGGAGATTGTGATGTCAGTGGATGTCGAGATGATTTTCCCAGCTATCATCCCACTGCACATTGGACTTCTTCCCCAGGATCTGCAGCACCTTTCTGTGAGACATCACGCTTGATGAATATTGACATGGAAATAATGACTGCCCATTGCTACAGTGCCACTTGTGTTATCTGTTGGAACTAAAGCCTTCACTTCTTAATAAAAATAAACTTATAAAATC\n>XM_031706046.1 PREDICTED: Actinia tenebrosa lysosome membrane protein 2-like (LOC116297758), mRNA 
\nCACCTGATTGAGTTTGAAGGCCATTCAAGGTTCGGCATCTGGTGAAGTAAAAACTGAAGGACTGGAATCTTAGCTAGCAAGCTTCATTCAGCCATATTTTAAACTTTMCACCACATAAAAGCTGCATTTCTCCATCAATAATGGAAGAGAAATCAGAAAAACAAACAAGCTGTATTTACGGGGGAAAGAAGATTGCAGTTCTTTTGACTATTGGAGTGCTGCTAATATTGGTTGCCGTCACTTGTTATCCTCTGATCGATTCTTTGATTCAGAACAAGATCGATTCAACTCTGGCGTTGAAGCCTGGCTCAGATAGCTTCAAACAGTGGAGGGCACCAAAAGTTTCGATTTAYCTTCAGTTTTTTATTTTCCATGTTGTTAATTATGAAGAAGCATCGCTTGGTTTACCTCCTTATGTTGTGCAAAAAGGACCTTACTCGTACAAGGAGTACAGACGAAAGGACAACATTACTTGGCACGATGAGAACTCTACTGTGTCTTACAATGAGAGGCAGTGGTTTGTGTTCGACCCAGATACCTCTTGTGCAAAATGTGATCCTGTTAGAGATGTTATAGTAAACGTGAATATTCCCTTAATCGCGATTGCTAATCTAGTGAAGAACTTCCCAGATTTCTTASGCTGGAAAGAGCTGTTATCTTTGATATTGGGCAATTTCAATGAAACGCTTTTCGAAAATAGAACAGTACAGGAACTTTTGTGGGGATACGATGATCCTTTTCTTGCAGAATACGCTAAGTTGAGGAAAAAGCTCMATCTCACTAGTATTCTTCCAGATGTCGATCCTCTCATAGCTTTGCAAAAGAATGATACTTATTCAGGATTCACAAMAGTCCACACTGGAGTGAAAGATATAAACTTGATAACTAAATGGACGGAATGGAAGGGAAAACCAGATGTGGGTGTATGGAACACGACCTACGCCAACATGCTAAATGGCAGCGATGGTACTCAGTTTCCTCCGCAACAGTCAACTGATAGTACACTCTATGTTTTCGTAACTCAGCTTTGCCGTTCATTATACTTGACATATAATAAACAAATAGCAATTCACGGAATTGATACTTTGCAGTTCACGACTCCAAAAGAGCTTTACTTAAATGCCTCAATGAATCCAAAAAACAAGGCATTTTGTACAAAGGAGTGTTACCCAACTGGAATATTAGACATTGGTGTGTGTCAGGATGCACCCATAACAATCCCATTGTTTGTGTCTGCACCACATTTTTATCTTGGAGATAAGTCTCTCACAAATAATGTGAAAGGTCTCTCTCCGAATGAAAAAGACCATGGAACATTCCTGGACGTTGAGCCACACCTTGGTGTACCGCTTAAAAGCAGCAAGCGACTCCAGATCAATGCTCTCATTGAACCAGTCGACGACATTAAACAAACTCAGAACCTTCACAAGTTATTCCTTCCTGTCATGTTTATTAATGAGACAGCCACCATTGATAATAGTCAGGCGCAAATGATCAAAGACAAAGTGTTGATGCCATTCACAGTTGTTCATGGTGTGGAGATAGGACTGGTTGTTCTTGGGGGCGTGCTTTGTTTGGCAGGATTGATTTTATTGGTGCTTTTGATTGACAGAAATAGGAAACTCAAACAGGTGAAAAACATACTATCAAACCCTGATGAAAACTCACCTCTTGTAGTCAGCACTTAGTAACATCATCTAGATTATGATCTTTTAGTTTAATATTATTAAAAGATCATWTCTATATTTAAAAAATGTCAAAAAGGCTAAGCTGAG\n>XM_028718607.1 PREDICTED: Podarcis muralis ubiquitin specific peptidase 4 (USP4), transcript variant X3, mRNA\u0001XM_028718608.1 PREDICTED: Podarcis muralis ubiquitin specific peptidase 4 (USP4), transcript variant X4, 
mRNA \nAGAAGGAGGGATTCCCTGCCTCCCTGCCCTTTCACTTCAGCGGAAAGCGGCCCCTTCTTCCTCAGCGTCAAAACACCGCGCTCGGCCCGGCGCTCCCTGCCCTCCGAACGCCCGGAGGCGTCGCCGCGCCTGCGCAGTGCCGTTCTGTGCGCGCGGCGGCGGCGGCGGCTGGGCGAGGAAGGATATCCGCAGTTGGGGACGGCCGGCCGGGCGAAAGCGCTTGCAGTACTGTCATGGCGGCAGCCGAAGTAGGGTTAGACGGCGGGGGAGGCGGCGGCGCCGGCCTGAGGCCGGACGCCGGGACGCAGCGGGCGGAACTTATGCCGCTGCTGGGGACGGCGCTGCGGCCGGGAGAGTCGTGGTTCCTAATTGACAGCCGGTGGTTCAAGCAGTGGAAGAAATACGTGGGCTTTGACAGTTGGGACTTGTACAACGTTGGAGAACCTAATCTCTTCCCGGGACCCATTGATAACTCGGGGCTTTTTGCAGACTCAGAAGCTCAGACTTTGAAAGAACATCTCATTGATGAGTTGGATTATGTGTTGGTTCCTACTGAAGCCTGGAACAAATTAGTAAATTGGTATGGTTGTATAGAGGGACAGAAACCAATAGTGAGGAAGGTTGTGGAGTATGGCCTGTTTGTGAAGCACTGTAAAGTAGAAGTTTATCTTTTGGAGCTGAAGCTGTGTCAGAACAGTGATCCTGCTAATCTTACGAGCTCTTATTTCAGCAAAGCAGACACTGTTGCTACTATTGAAAATGAAATGCGAAAGCAATTTAATATTCCTGACGGAAAAGAAATTAGACTGTGGAGCAGATACATGAGTAATACTTATGAGCAGCTAAGCAAACTCGACAGTACTATACAAGATGCGGGGCTCTATCAGGGACAGGTAGTGTTAATAGAAGTGAAGAATGAAGATGGTACGTGGCCCAGGCAATCTCAGACAAAAGGTTCTAGCTTTTCCTGCAACTCCTACAACAACAGGGAGAGCCCTCCTCAGTCACAGCCTGGTCTCTGTGGGCTCAGTAACCTAGGAAATACATGCTTCATGAATTCAGCTTTACAGTGTTTGAGTAACACCCCTCCACTGACTGACTATTTCTTGGAAGATGAGTATGAACCTGAAATAAATCAGGAGAATCCTCTGGGAATGAGAGGAGAAATTGCAGAAGCATATGCAGAACTCATCAAACAGATGTGGTCTGGGAGAAATTCTCACGTGGCCCCCCGCATGTTCAAAACCCAGGTTGGCCGCTTTGCTCCTCAGTTTTCAGGGTACCAGCAACAAGATTCCCAAGAGCTCCTGGCCTTTCTTTTAGATGGTTTACATGAGGATCTAAACAGAGTAAAAAAGAAACCTTACTTGGAGTTGAAGGATGCTAATGGCAGGCCTGATTCGGTGGTAGCAAAAGAAGCTTGGGAGAATCATCGATTGCGTAATAACTCTATAATTGTAGATATTTTCCATGGTCTCTTCAAATCCACATTGGTCTGCCCCAAATGTTCTAAAGTTTCCGTGACTTTTGACCCTTTTTGCTACTTAACCCTTCCATTGCCCTTGAAGAAAGATCGAACCATGGAGGTTTTCTTGGTTTTTGCAGATCCACAGCGCAAACCTACTCAGTACAAGGTAATTGTGCCAATGATGGGGGCTGTATCTGACCTGTGTGATGCACTCTCAAAATTCTCCGGGGTTCCTGCAGAAAACATGGTGGTGACAGATGTTTATAATCACCGATTCCACAAAATTTTCCAGATGGATGAAGGCTTAAGTCAGATTATGCCAAAGGACAACATCTTTGTATACGAAGTTTGTAAGTCAACGGAAGATGGTGCTGAATGCATCACTCTTTCAGTTTACTTCAGAGAAAAGAAAGCAAGACAATCCAGTGCTGCTCCGGGGACTGTTCTCTATGGGCAACCACTACTCATAGCTATACCCAAACACAAGCTTACTCTAGATCACTTGTACAATGTTATATTGGAGCG
GATTAGTCGCTATGTTAAAGTTTCCTTAAAAGAAGAATGTTCTGAAGGATGTCCAGATAGTGAGAATTGCAATGGCTCCAGTAATGTGTCTGAAGGTGATGTTGAAGAAATGGAACATCAGAATGGAGAGGAAGACAGTAAGGAGAAAATATCAGAAACAGATGCCTGCAAATCAGAGGACTGCATCCAGGATGACCTGGAAAAGGAAGGCCTGCATCACAGAAGGCATCTCTTTAGCTTCAGTCTTGTGAACTCTTATGGAACATCAGAAATAAACTCCCTTAATACAGATGGGAAAATCCTCAAGTTGAGTTCTCATGCAACTCTTGCTATTGATTGGGATTCTGACACCCGAAAGTTGCTTTTTGATGAACATGAGGCACAGGCATTTGAAAAACACAACAGTATGTTTCAGCCACAGAAGAAGAAAACTACCGTAGCTCTGAAAGACTGCATAGAACTGTTCACTACTATGGAAACACTTGGTGAACATGATCCATGGTACTGTCCCAATTGCAAGAAACATCAACAAGCCACTAAGAAATTTGATCTCTGGTCACTTCCACGTATTTTAGTAGTACATTTAAAACGCTTCTCATATAACAGATACTGGAGGGATAAGCTTGACACTGTGGTTGAATTCCCTATCAGGGATTTGAACATGTCTGAGTTCGTTTGTGACCCAGCAGCAAGCCCATATGTGTATGACCTCATTGCTGTTTCCAATCACTATGGAGGCATGGGTGTTGGCCACTATACTGCATATGCTAAGAATAAAGTGAATGGCAAATGGTACTACTTTGATGATAGCAGTGTGTCTCCAGCATCCGAAGAGCAAATAGTGACAAAAGCGGCATATGTCCTCTTCTACCAACGTAGAGATGGCATGCTCAAGGGAAACCCCGCTCCTTGCATAAGCACTGAGCTGAAATCTGAGGAATGTGATGGCATGGATACCAACTGAACCTATGTGGTGGGGTTTAAACAAGTCATATTGCTAATTTTAAAAAGCATCCAAGAACTGATTTTTGTAAGAATCAAACAGGAGTTTCAGTACAGAAGGACTCAATGAGCAGTAACTATGGATAGCATAGGGAAGCAATAAGATGTCAAGGACTTGGGTATATCATAGCCAAAGAGCTTTTAAACAAATAGTTATTCAATAAAGTGTTATCTAAATCTGACTGTGTAGTCTGGCAGAAACTGTGTGGAAGCAGGAGCTTATGCTGTATGACTGGAGCAATGCATGAAAGTGCGAAACAACATTTGACTGTAAGTAGAATTCTGGTTTGAGCTCTATGCATTGCAGAAGATGCCTGAGTGCTTGTGTTTCCAGAGTAAAAGAGAAGTGAACATTTGGCACAAGTTCCAATCTCGCACAGCACATTTTGGCACTATGTTGCTGTCAGTCCCTTGCTGACATGGCATGGTGAGCTTGTGTGTGCTTTTAAGAAAAAGAGAAAATTGCATATTTGTTCTGGCTCATTGTGTCCCATACAGGAGTCACAATCCCCACATTTTCTTGTTCCGTTCTAATAAAACAATTATTTAGGATCCGTCCCAAAGATTAACTTTCCCCCACCCCCAGCCTTTCCAGCAGCAGTATTCATGGGGCCTATTCTTCACACCAACTCACATGGAGCCTTATATGCTCCTGATCTAGTTGGTAACTTACATATTGTGCAATCACAAGGCTTCTTTATTCAAGTGTCTCATTGGGGAGCTAAAATAACTTTCCCTGGTAGTTTTTTTAAATTCCGCTGTCAACTGTCTTCTATTTCTGTGCACTTTCAGCCACACCAGGAAAAGTTCAGAGTCCATCTCTTGAAGGCTGCATAGGAATCAGTGTCCAGTGGAATATGTCCTTTTGGGTGGTCTCAGACACGACACACTATTTTTCTTTTTAGCCATTTTATTTCTCTTTTTGTAATCTTTTGCTATCCTCATACCTCCTTAGTATTTTTTCCTCATTGGCTGAGAGATGGCAAGAGTAAATGTTG
TTTGACTTCTTCCTACCCACAGCCTCCTCCTCCACGGAGGATGATAGACAAGAACCTTCTAGGAAAGGAGCTTTCAGGTAACACCGTGGAATTCCCATGCACACTGCTATGACACCTTAAGACATTTCCCATTTAGTGTCATGGCTTTGAAACTATCTTGGCACCTGTGTAAAGGTGTTTCACTTTTGTGCTCTGAACACATTCCCACGGATTCCCTTCAGCAAACTAAGAAGTATTCCTCTCCCAGACTGCTTCTGTGCTGATCTTTATCGGCATGACGTCAGGCAAGTGGTAGCCAGTGGTATCGTCAGGCCACACCATTTTAGCAGAACTGATTAAAAGTGATCGTGTTCTTTTTAACTTACAGAGCAGAAGAGTCCTCATTGCTGTCAGCTGCATTTTCCTCACTATTTTCCAGTGATTACTATTGCGTTCTCCAGGATAGTCCTTTTAAACACTGAAATTTGAGCTGTTTGGTTCAGTTGCTAATGCTTCCAGGTTCTTTAATTGATTTGAGGTCTTGTCTCAACTGGATATTATTTTCCTGCACACTTGGGTTGGTGGGTGGGGTTAGGGCTGGAATTATTTAAAGGCTAAGTTCAAACTGTAGCATTGCACTGTTTTGTTTTTTCCTGTTTTTCTGGGTTATATTTTCTTTGGAATGTAACATTTGGACCGATAAGGAAACAGATATTTAAAAGCAAAGAGCAATTTAATGTAACCATATGTATTTCTGTTCCATACTGTTGCAGCAAACTTTTCACTGCTCTGTATGGTCAGATAGTGTGCACATTTGTGTTTGGGTGATTTTTGGGCTCCTGAACTAAATTTCTTCTAAATGCTGTAAAGATGGTATTAGGAACCTGGATTTGCCTCTGACCAGGCTGGATCCTAGCTGGTGTGTACATTCTGTATAGTGTCAAAATCTGTTTTTAGACTAGCACTTTGTAAGTGACTGGCTTTACTGTATAAAAGGAAAAAAAATTAAAAAGAAGTGGATTGCA\n>XM_029695648.1 PREDICTED: Salmo trutta inaD-like protein (LOC115151590), transcript variant X3, mRNA 
\nCCTCCCTTCTCTCTCCTCTCTACGTTTGTTCTCTGTAGATTCTCACCATATTTCAGTATGCCTGCTCAGCCTTGCTCAAGGCAGCGCTGCCAACCAACACCACGAGGTTGACAACGGACAAACACACACACAAACACACACACTGGCGCATGGGGATGTTAAACTCAGGATTGCTGGGAGAGTGAAGCATGGACCATGCTGCCAGAGCGGATCAGGTTGCGTTACGGGGAGCTGCGCGGGGAGCTGCTGTGTGTGGAGCTGGACAGGGAGCGCCAGGGCCTGGGTCTGAGCCTGGCGGGGAACAAGGACCGCTCCTGCCTCAGCATCTTCGTGGTAGGCATCAGCCCTGGGGGCCCCGCCGCCAAGGACGGACGCATCCGCATAGGGGACGAGCTGCTGGAGATCAACAACCAGGTCCTGTATGGCCGCAGCCACCTGAATGCCTCGGCCATCATCAAGAGCACCTCGTCCAAGGTCAAGATCACCCTGATCAGGAATGAAGATGCTATCAACCAGATGGCCGTTCCCCCCTTTCCAAACCCTCCTGCTGTCCTCTCCTCCACTGAAACCCATCCCCCCAAACCAGCAGCAGTAGCATCCCCGGGCCCCACAGAGAAGTCTCAAACCCCAGAGAGCCTGGCCCTCAGCAGGGGACCCCTGGAGGCCTCCATCTCCATCAGCGAGGTGAAGTCCAGTGTTGGGTCCAGTGGGAGCACAGCTACAGAGCTTGTTTCCAGAGAAGCAACACTCAAGATCCTCCGAGAGACTTCCTCAAAGAAGGCCTCAGAGAACGAGGCTGAGTCTTCAGAGAGCGTGACTGTGCCGGCTGCCAAGGCCCCCCTGGAGCAGACTGCTCTCCTGTCCAAAACCTGTCGGCTGTCCTGTAAGCTGCCTGTGGTGAGCTCTGTGAAAGGGGGGCTGGTGCCCACCCCTGCCTCTTCCCTGCCTTCCTCCTGCACCAGCCCAGACTTTGAGTACTGCAACAAAGACCCAGCCACGTGCCCTATCGTTCCAGGCCAGGAGATAATCATAGAGATCGCCAAGGGTCGCTCTGGCCTGGGTCTCAGCATCGTAGGGGGAAAAGACACCCAGCTGGATGCCATAGTGATCCATGAGGTATATGAGGAGGGGGCGGCGGCACGCGATGGACGACTCTGGGCTGGAGATCAGATCCTGGAGGTAAATGGTGTGGACCTGCGTAACGTGGCCCATGAGGACGCCATCACAGCCCTAAGGCAGACCCCGGCCAAGGTGTGTCTTAAGGTTCTGCGGGACGAGGCGAGGTACCGCGACCAGGAGAACCTAGATGTGTTCAGTGTGGAACTGCAGAAAAAGGCCGGCCGTGGCCTGGGCCTCAGTATCGTCGGCAAGAGGAACGGCACAGGGGTGTTCATCTCGGACGTGGTGAAAGGAGGCGCCGCCGAGCTGGATGGCCGGCTGATGCAGGGGGACCAGATTATCTCTGTCAACGGAGATGACATGAGGTCTGCCTCGCAAGAGACGGTAGCTGCCATTCTCAAGTGTGCCAGGGGGGTGGTACTCCTAGAGCTGGGCCGACTGAAGGCTGCCTCCTGGATCTCTTCCAGACGTACCTCCCAGGAAAGCCAGCAGATGAGTCACGTGAGTGCCAACAGCACTATCGTCACGCCCCACCCCCCGCTAAACTCCACCCCTTCCACCTCTCAGCTCCTCAATAACGTCAGGAAGCCAATGACGGTGGGCATGACATCATCACAGAGCGCAGAAACAGGGATGCGCACTGTGGAGATCACAAGGGGTCCTACTGATGCGCTGGGGATCAGTATAGCTGGGGGGAAGGACAGTCCTCTGGGGGATATCCCCATCTTCCTGGCCATGATACAGGCCAACGGGGTGGCAGCCAAGACGCACCGGCTCAAGGTGGGTGATAGGATCGTGAGTATCAACTCCCAGTCTCTGGAAGGCCTGTCCCATGGGGATGTAGTCACCATGCTGAAGAATGCCTACGGCAGCATCATT
CTGAAGGTGATTGCTGACACTAACATCAGTGCTATAGCCAGTCAGGTGGAGAGTATGTCGACTAGCAGCAGCCCCGAGACACAGCCAGGGGAACCAGAAGCCCCCAAGCCCAAGAGTATCTGCCTGGAGAAGGGTTCTGACGGCCTGGGCTTCAGCATCGTAGGAGGCTTCGGAAGCCCTCATGGAGACCTGCCAATCTACATCAAGACTGTCTTCAGCAAGGGGGCAGCAGCGGTGGACGGGCGTCTGAAGAGGGGTGACCAGATCTTGTCTGTGAATGGAGAGAGTCTGGAAGGGACCACACACGAGCTGGCTGTGGCCATACTGAAGAGACAGAAAGGGGCCGTCACCCTGGATGTGCTGTCCTAGCTCACACACTCTCTACCCCTTCAACTCTCTACCCCTTCAACTCTCTACCCCTTCAACTCTCTACCCCTTCAACTCTCTACCCCTTCAACTCTCTACCCCTTCAACTCTCTACCCCTTCAACTCTCTACCCCTTCAA\n>XM_046072427.1 PREDICTED: Micropterus dolomieu transcription factor ETV6-like (LOC123985072), transcript variant X4, mRNA \nTAACAGCATAGGTTTCAGGTTTGCAGCCAGTGTTTTGGAGCAGGGAGGACGTGGCCCAGTGGCTGCGATGGGCCGAGAAGGAGTTTGCCCTGCGGCCAATCACCAGCGGCTCCTTCCAGATGAACGGCAAAGCTCTGCTGCTGCTCACCAAAGAGGACTTCCGCTACCGATCCCCTCACTCCGGGGACGTCTTGTATGAGCTGCTGCAGCACATCCTGAAGCAGAGGAAGCCCCATGTGTTTTACCCGTCTGCCTACTTCCCTGGGAACTCCTTCCACTCGCTGCCTGAAAGCGCTGTGCAGCACCTGAAGCTTGAAGAAACGGTACGGCGGGCACCACGTGGTACGGAGCCACTCCCCCAGCATCCACCAACCATTGAGCTGCGGCACCGCTCCCGCTCCCCCCATCATCCAACCACCAGACGATCCCCTCCGGAGCCAAACCACCCCCGCCAAGCCAATGAGGACCCCCTCCAGACCTTCTCCCAGCTGCCCGACAGCAACCACCACCTGCCCGAGGAAATGTACCCTCTGTCGGTGTCTCCGGCTGCACCCAACGGCCGCTGTGCGACGCCCCGGGAAGCCCCATGTCCGGGCAGCCCTGGGGGCCAGGAGGCGGGCCCTCCTCGCGTCATCCAGCTCATGCCCAGCGCCATCATGAACCCCCTGCTCCTCAGCCCGAGCAGGAGCGGCGGGGGTGCCGCCATGGACTTCAGGCACAGCCGTGGCGGACCCCCCTCTCAGGTGACGCTCGAGAACGGGCGCGAGGGGAAGGTCCACGCCCACCACCATCAAATATCACTCTCCCAGCAGCAGCAGCAGCAGCAGCAGCACCACCTACTGCAGCAGCAGGAGGAGGTGCTTTACCGGAACCAGGTCATCATGCCCGTGTCTCCTCCAGAGGAGCAACAAATACCCATCGGACGGATAGCAGACTGCAGGCTGCTCTGGGACTATGTCTACCAACTCCTGTCAGACAGCAGGTACGAAAACTACATCCGCTGGGAGGATCCAGAGAGCAAAGTCTTCCGCATCATGGACCCCAATGGCCTGGCCAGGTTGTGGGGAAACCACAAGAACAGGACCAATATGACCTACGAGAAGATGTCACGAGCACTGAGACACTACTACAAACTGAACATTATCCGGAAAGAGCCTGGACAAAGACTTCTATTCAGGTTTATGAAAACTCCCGATGAGATAATGAACGGGCAGACGGACCGGCTGGAGCACCTGGAGTCCGACACAGACGAACAAATCTACATCAAAGAGGAATGCTGAGGAAATCTTGGGGGAGGGGATGAGTCCATGAACTACTTACTACTTACTACTACTACAGCCGCTGATGCCTTTCAGAAGCAGCCTGAAC
AATCGTTGTTGAATCTGGAGCACGTGGATGTGCGCTTGTATCAGTCCCACACAGATGGATGTGAAATGTGGTCTCCCGTAAGATTGCCTTAGGATGACGTTTTCCTGAAGTAAACAGATTTTCCTGATGGAGCGAGCTGAGAGCACTTTCTAAGTGTTCCCTTTTTATTTCTGAATGAACTGCAAAAAAAAAATCACTTTGTGCTTAAGTCACTTTTATGATTTTTATTATTTTTTTGTCCCCTCACATGCATTATACAATGGAATTTTGCTGTTTGTAAAAAGAAAATCGCGTGTGTGTGTGCGTGTGTGTGACAGGAATGTTTTCACCATGGAATAAACATTTTTTGATCAAACTGTA\n>MG257935.1 Paenisporosarcina sp. strain SC-Apr-C3 16S ribosomal RNA gene, partial sequence \nGCCTAATACATGCAAGTCGAGCGGAATGAAGAAGAAGCTTGCTTCTTCTGATTTTAGCGGCGGACGGGTGAGTAACACGTGGGCAACCTACCTTGTAGATTGGGATAACTCCGGGAAACCGGGGCTAATACCGAATAATCCATTTTGCTTCATGGCGAAATGTTAAAAGGCGGCTTCGGCTGTCACTGCAAGATGGGCCCGCGGCGTATTAGCTAGTTGGTAGGGTAACGGCCTACCAAGGCGACGATACGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGACGAAAGTCTGATGGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAACTCTGTTGTAAGGGAAGAACACGTACGAGAGTAACTGCTCGTACCTTGACGGTACCTTATTAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTCCTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGAGGACTTGAGTACAGAAGAGGAAAGCGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGG\n>XR_003604399.1 PREDICTED: Vigna unguiculata uncharacterized LOC114183599 (LOC114183599), transcript variant X4, ncRNA 
\nGTAATACCTTTTCACACATTTTTCCAAAATTTTCCTATTCTAACTTTTTTTACTTAAAATTGAAAACCTAAACACCTTCTCCCTCATAGAAAACCTAAACACCTTCTCCCTCAATCAGTCGCATCTCTAGCTTTGTCGCTCACTCTTTCACTCATGATTCTAGCTCAGTTGCCCACTCCGTCACGTGTCACTCTATTACTCCGTCGTAGGCAGCCCTATCATTCGTCGGAGTTGTTCGCAACTTTTAGGAGCTTCCACTTCCGATTGTTTTCCTAACATTTCACTTTCGATTTGCTTGCACTCATGATCATGGCAGGAAACATGTCTGATCCAAGTGGGAGCAAGGGTGCAAATATTTTCATTGTATCTTCTTCCTTGTTTTGAAAAAATTATGGAAAACGCCCTTACATTACCATGATTTTTCTACAAAACTTCTGTTAATAAGGATAGTTCTGAGAAGTTAGAAGGGACATTCTCATTGTCAATTATGCCTGATCGGTTTGTATTTTACTTGGAAGGACATGCTCCTAGAGTTGACCTGCCCATAAGATCAGTAGAGATAAGCTGGTCCACTCCAAATAATAATGTTATAAAAGACTCCAATGGTGGCAACCTTGTTGATATGGAGCCTAGGATGCACAGTTTTGGAAATGGCTACAACTAAACCTCATTGGAGTCAGCATGAAAGGGTTAGTAATTTATGTATGTCAATATATTGGAAGTTTTAGCTAGCTTTTTTATATTTTGTTTCCC\n>XM_043838092.1 PREDICTED: Telopea speciosissima uncharacterized LOC122644689 (LOC122644689), transcript variant X2, mRNA \nTCTTCTTAGCTCTTTTTGGAGTCTGTAAAGTTGAGGCATGGGAGTAAAGGTTGCCGCGACCTGTTTACAATGGTCGCAGCCAGTAGCTTCACACTCTCCTTCATCGGCTCAGACGCTAGCCTCTGCAATTTCATCTCCTTCGACGAAAAAACAGAGAGGAGGCGATCGAGTTCTTGTATGCCGATTCGTCCATAAATTGGCTTTCTTGGGAACGTCATCGACGAAGCTTTTGAGATCTCGATCTTGCGATAATCTGAAGTCTAGAGGCCAATTCCTCAGGCGAGCTTGCAGCGCCAACTTAGATGGATACCCTGACGAAGAGTTCACGGAAAATACTCGGGAATTAGCACAGAGGTTCGATCTTTTAAGCGATGGTGATGAAGAACAGAACAATAATTACGACGCGGAGGATGTAGAATTGGATAATTCTGCTGTTGATTCCGGGGAAAAACAAGGCGAGAGCAGCAGCAGGAACATCGACAATTGCAGCACAAATTCGGTACGAATATCCAGTTCTTTTCAGCCACCGAAGCTGGAGTGTGTGCAGCCTCCATGGCTTCATGTCAAGCCGGAACCACCAGACTGGCCAGGAAGGGATGAGATTGATCAGGCGAGTATAGAACGAAAGGCAAATAGCGTGGACCTTCCCTTATCTCTTAGAATGATAAAGAAGAAGATGCAATGGCAAGAAGGTTTCAGACAAGCAGGGGAATCTGCCTACTGCTCGATGAAGAAGGCCTTCTCGTCGATGGTGTTTATCATTCGTGAGCTTCAATGCTACACGTTGCATATGCGAGAGATTCTCTTCTACGAAGACCTCCAAGGTATCCTGGCACGAGTACAGATGGAGATGCACGCCTCATTTGTTTGGCTTTTCCAACAGGTCTTCTCACACACGCCCACTCTAATGGTCTACGTGATGATCCTTCTTGCCAATTTCACCGTGTATTCGATGGGAAACAACGCAGCAATCGCAGCTCCGCCACCGGCGTCGGCTGCCACGGAGATCGTATCGGTGAATGAAAACCAACCCAAGAGTTTTGATTCTTCTTCGGTAATGAACACGTTTTCAGTTTCGTCTTCGACCGGGAAAACGGCCTTCGTGGGAGGACACAATGG
CGGCGGCGGTGGAAAGTTCCGGCGTGTGATGAGTGGGACTGAGGGAGATGGACCTTCCGATAGTTCGTCATCGTCATGGAACTATCAGTCTCTGTCTCATCAGGTATCGTCGTTTGGGAACCCCAACCCCACGACGACGGAGGGAGCAGAGTCGGAGTCGGCATCGGTGGTAGAGGCAAATCCGGATGGTTTTGTTGGAGGAGTAAGGAGCGAGGAAGAAATGAAACTGTGGAATTCGATGGTGGATGAAGCTATGAGAATGCAATCGGAGGTGAGGGACGAGTCTCTCGATATCCACACGATAACAAATTTCGTTTCTCCGATAAAGGCAAACATTGAAGAGGAGGACCAATCTGATTACTTGAGGACGGAGCTTCTGTATAAGACGGCCGTGTCTCAAGAGCCCAACAACCCTTTGCTACTTGCGAATTACGCGCAGTTCCTATACGTCGTCTTACACGATCATGACAGAGCGGAGGATTACTTCAAGAGGGCAATAGAGGTGGGGAAGAAAGGAGGAGGAGGAGGAGATGCAGAGGCGTGGAGTAAATATGCAACATTCCTGTGGCTGGTGAAGAAGGATATAGAGGCGGCTGAGGAGACATATTTAGAGGCGCTAGCGGCGGAGCCAGGGAACACGTACTACGCCGCTACCTACGCTCATTTCTTGTGGAACACTGGTGGAGAGGACACTTGTTATCCTCTCGACTCCCCCGACAACGACTTCGACAATATGGTTTAACAAGAAATAGG\n>AY015863.1 Lepidium latifolium chloroplast tRNA-Leu (trnL) gene, intron sequence \nTTKAKCCTTGGTATGGAAACCTACTAAGTKATAACTTTYAAATTCAGAGAAACCCTGGAATTAACAATGGGCAATCCTGAGCCAAATCCTGGTTTACGCGAACAAACCGGAGTTTAAAAACGAGAAAAAAGGGATAGGTGCAGAGACTCAATGGAAGCTATTCTAACAAATGGAGTTCACTACCTTGTGTTGATATTGTGTTGATAAAGGAATCCTTCGATCGAAACTTCAAATCAAAAAGGATGAAGGAGAAAAACCTATATTTAGACAATATAGGTAACACAAAAGATCTCAAAAATGACGACCTGAATCTCGATTTCTATTTATTTATAAACAAAATAGGAATGTTGTGAATCAATTCGAAGTTTAAGAAAAAATCAACTATTCAGTGATCAAATGATTCACTTCATAGTCTGATAGATCCTTGGTGGAACTTATTAATTGGACGAGAATAAAGATAGAGTCCCATTCTACATGTCAATACTGACAACAATGAAATTTATAGTAAGATVAAAATCCG\n>XM_014048373.1 Monoraphidium neglectum hypothetical protein mRNA 
\nATGGAGGCAGCCTTGCGACAGCTGCTGTCATGCGTCGACAGCGGCCGCCGCGACGCCGCCAGCGCGGCGCTCGTGAGGCTGCAGCACGCGTGCCGCGCAGCCGCAGAAACTGGCTGCGCCGCGGCGGTTGAGGTGCCCGGCGAGCGCTCCTTGGACCGACTGCTGCGGCACCTGTCCTTGGCCGGCGGCAGCGCGCGGGCGACCAAAGCGGACTTCAACACATCCCTGACCGCCAACCGGGCGCTCCTGATCCTGCTGAACGTGCGAGCAGTGGCGGACGCCTTTCTGACGGAGGGTCGCGTGGCCGCCCTGGTCGACACACTCGAGGCGCTCGATGGCGGCGAGGAGGGCGGCAGCGGCGGCCGCGAGGGCATCTCGGAATTGCGGCTGTGGCTGCTGACCGCGAATCTGGCAGCCGCGGCGCTGCACTTAGGTCTTCAACGCAACGGGCCCACGGGTGGCGACGTCGACGGCGGCGGCGGCCCCATCAACCCCGCGCAGCTCGCCCTGGCTGGAGTCATTGCGCGGCCGGCTGCCGTGCGCGTGCTTGTGCGGGCGGCGCACACGCAGCTGTCATCAGAGCTGTCTGCAGGGGACCTTCTATCGCCGCTTGAGCAGGCATTCTTGGCTGCAGCTTTCTTGCGAGAGCGGGCTACGCCAGCCCCCCACGACACGCCGTCAGGGCCCTCGTCCTGCGCCGCTGACCTGTTTGCCGCAGCGCGCGCGGCGTGGCAGGGCGCCGACGCCAATTGGCTCTGCGAGGCGCTGCCGCCGCTGCTGGCGATGCGACTGGAGGAGGCCAGGCAGCGGCAAGGGACAGGGCCCGGCGGAGAGGCGCTTGAGCCGCACGCTGCTCTGTTCGTGGCCTTGCACTTGTGCGCCGTGGTCGGTCCCCTGAGCAGGGCCCTGTCTTTGCACGCGGCCGCCATGCGCGCGGTCGCAGCGTGCATTTGTCGGAGCGGAGACATCCGCCTGGCCAGGTCATCGTTGGTCATCCTGACCGGCGCGCTCGACGCCTGGCCCTGGGGCCACGAGGGCGCCGGCACAGCGCTCGCGGCTTGCTGCCAACCCGACACTCTCGGGGAGCTGCTGCGCACAGCCGCCCTTCGCGGCACCCGCGGCGGCAGCGGGGTGGCGGCCGGCACGCCGGCGAACCAGGAGATGTTTCCGACTGTAACGGATGGTGGTTGTGCAGCGCAGCTGCTGGCATCGATCGCGGCCCACGAGGCGCTGTCCACGCGGCCATCCAGCATTGCTGCAGTGCCAGCGACCGCGGCTGCGGCGGTGGCGAGCCTGCGCAATTGGCTAGAAGTGGACGGCGCGCAGATGGCTTATGGCAACATGCCGCGACTCCATCAAGTCTGTGTGATGGTGCTCAGCGTTGTTGCTGGCGGCGGCGCCGATGGCGACGCATGGGCGGCCACGTTGTTGCGCCTCGGAGCGCGGCAGCTGCTGATGCGCGCCGCGGCCGAGCTAGGGCCAAGGGCACCCGAGTGGTCGGCGGCCGCATCAGCAGCACTTTACGCCGTCACACACGCAGCGCACGCATCACATCAGCAGCAGCAGCAGCAGCCTGCACAAGGCGGCACCACCAGCGGGCTTGAGGAAGGTGAGGAGGAGCAGGGCGCTGTCGCCGCCTTGGTGGATGCTGGGGTTTACGCGGTCCCGCAACTGCTCTTGCTGGCGGCCCTGCGTCCCGGCTGGCGGTCCTGGCTGATCCAGGAGCCAGACATACTGGAGCTGCTGTCGGCCGTGGCGGCTGCCCCTGACCAGGGCGAGTACAGCCACAAGGCCCTCCGCACCCTCTGCCTGCTGGCTGCGGGCGCGGCGCCGTCGGAGCGCCTGCCAAACTTTGCGCGGGCTGTGCTGGAGGTGTGCAATGAGCGGCCGGCGGACGTGTGGGCCGGAGTCCCTGAGCTGGACAGCGATGGCGGGGCCGTGGAGGAGGTGTTGGGGTGCCTTGCGGGCTGCCATGAGGCAGGCAGCAGTGTGGGTGAG
CGCGCTGCCCTGGCTCTGACCCAGCTGAGGATCGGCAAGCTTGGGTTGGTGCAGCCCCCATCGCAACAGCAGCAGCAGCAGCAGGAGGAGGAGGAGCAAGACGTGCAGCAGCAACAGCAGCAGCACCAGCCGCGGCCACAGCCGCAACAGCACCAGCAGGAGGACAAGCCAAGCATGCAGCAGGCGCCAAACACAGGACATGCAGGGGCTATGAGAACGGCGCGCCCACATAGTGCATGCGCTGTCTGCGGCAGGACGGCGCGAGAAGGCGCCAAACTGCGGCGCTGTGCCGGCTGTGGCCGTGTCACGGGGACGCGGTACTGCAGCCAGGAGTGCTGCAGGACGGACTGGGTGGTGAGGGGGCACCGCGCGGTGTGCGAGGCGGCGCGGCGGGGCCAGGAGCCGTGA\n>XM_031652239.1 PREDICTED: Papio anubis mab-21 like 3 (MAB21L3), transcript variant X1, mRNA \nTGCAGATATTCTTTAGTATTTAAAAATGAGCAAATAAACAAAATGAGGCAAATAAATGAAGAAAATGAGTTTCTGAGGCACTGCTTAAGTGACCATAAATCAGACACATATTTTTATGGTGGGCAAATTGATGAAGATACTTTTAGTAGGCGATTTATATTCATAACAAATACATATTGAAATAATGTCACTACTGTATCAGAATTAAGAAACAGCCTCGCATTAGGACTTCTCCGTACAAATTCTTTATCATTGGTTCTTAAATTGGAAAAGTACCTATAAATGATTACATTTTTTAACTAAATAAAATGCAGATATTTTGGCTTCTTGTGAATTTAATAAAGAATCATAAAACATAGGCCTTTTTTTTGTTCTCCCAGAATGTCTCAAAAGCTACAGTAGTAGCTTTGACAAGTTGGGCAAATGCAGAACCTGCTAATGAGTTAAGTAATATGTGGACAGGGGTTGTAGCAAAGTTGTAGACTGATGGACACAAAAGTTAACTATCCAAATACTTCTAGAATGAGGAAAATGCAAAGACAGTGCATTGTGGAAAATCCATCAATGTAGAATATCAAAGGAGAAAGAGCTTATGATTACCTCAATAGAAAAATAAACATTATTTGACAACATTCAACATACATTCAAAATAAAAGCTATTAGTAGAGTAGGAATAAAAGGATGCTTCCTTAATAAAATAAGAGATACTATAGTAGATATGGTAAATTGGCACACAGCATCTCTTCACCTTCCTGGTACCTTGGCCTTTAGCCTTTTTTTTTTTATCATAACCCACAGTAAGAAATGTGTTTTATATATTCATCCTGTCATACTTCCCCACTTACAAATATATATGTACATATAAAATATCTATGAATCATAAAAATGTGTATATTTTATGCAATAATACTTAATCTTGCTAGGTACACTAATAACTTATGTTCTATTTCACTTTTTAAAATGCCATTTATGACTCAATAAATGGATATCATGACCCGCTAATAGGTTCCAACCCATAGTTTGAAATCCACTGTTCTACTCTATCTTCTTGTACTACAGAAGCTTTGAAGCTAAAATGTACATTTTCTGAATTTCTTGCAGATAAGTTTACCCTTTGCAGCCAGGTGAAGTTTTGTTTCCTTCAATCAGATACAAATGGAACTTGGAAGGTAGAAGCAAGGTGGAGGCCATACTTTTGATGAGTCTGCATTTTTCTTCACAGTGGTGGAGCCATTTGGTTTTTTTGAGGCAGTATCAGCCAGAGATGTTGTCAGTTGAGCAATAAGATCTTAAGATGTTTTGATAAACCTGGAGTAATACTTCTAGTATTCAAATGGAAAAGCAAAGATCCAAAAATATTCAAGACAACTCTGATAAAGAAGAGCACACAGAAGCTCTGAAGTCAGACTACGAAATGAGTCCTAAGGGGCCTGAATGAAGATGTCAGCAGAGCTGGTTTCTGGATTCCTTTTCTGCAATAAAAGAGGAATGCCTG
TAATCTGCCTTCTCCTCCCACTTTTCTGAAGAATCCCTGGAGCAAAATTGGGGAGGAGGCCGTAGCCTCCTTGTGGGAGGAGTTGGAGAGACTACATGATAAAACAACTTTCTGACCCTAGACAAAAGACCTTCTCTCTTCTGTTTTTGGAATCGTTTTGGAAGGATGACAGATGGATTTTCACAATTTGGAAATAAAAACATGAGTGAAGGGTTCAGAAGGCAAGTCTCTGGTCCATTACACACTTCCAGAAAAATTTAGTACCCAGAGACTCACATTACTGGGAGTGCTGTTTACTCACAAGTGTTGCACTCCATTGAGAAAAAAAAAAAAAACCAGGAAGTTGCTGTTCTACTCAGGACTGACCAAGAAGCCATGAAATCCCTTACTGTGGGAGGCTTAGAAGATTGCCTACTGAATAAGGTGGACTTGAGGCGCCAGCAGATTTCCCAGGCTATGGAGGAGGTGCAGAAAGTCGTTCATCATTTGACCACAAACATCAGCAACCAAGACATTAGATTTCAAACTGTGCCTTACTCTGACACATACAATGAAAATATTAAGGTTTTGGCCCCCAGTCAGTTCCTTGTCACAGTCCCAATAAAAGGCCTGGCTGGCTACAGGGAGGCCAGGGAGCAGCGCTGGAGGTACTACACCCTGCAGGGCACCAGGCTGCCCTGCCCGTTGCGGGACCCTGAGGGTCTGCAGCAGTGGCTGGAGGTGGAACAGTTTATGAAGAGCCTGTGGCAGTGGCATGAGACAGACGTGAACATCGACGGAGACATTGTGCCCGCTAAGGTCCTCCTGGTGTTCCGGAAGCTGGTGGAAAACGCAATTAGAACCTGTCACCTCTCAGGTAAGGTCAGCATGCTAGGAAACCGCTCTGCAGTTTGGATTGCTGTGGAAACATCTGCATATCAGGTGGAATTGGAGCTGGCCCCCGCGGTGGAGATCCCCACCACCTGGTCCGAGAAAGCCCGGTGGCCTCGATGTCTGCAGCGCTGGCCTTCCCAAGAGAGAGTGGAGTGCATCAAGTCGTTTGGGTTTAACTTGTTGCCCTGTTCAAATTATCACTGGCAGCTGAGCTTCCTCCGTGCTGAGCAGGTGTTGCTAGAACAGCTGGATGAGGATGGGGGCTGCCGTAGGAAGTGTTTTCAGGTCATGAGGCAGCTGAAGGAGGACGTGTGGTGCCCAGGGAACAGGCCGGTCATCACGTCCCACCATCTGCAGACGGTGCTCTTTTGGACCTGCGAGAAATATCCCCACTTTAAAGACTGGAAGGTCTTCAGCAAAGCGTTTCTGCGCCTGGTGAGGAAATTGCACAAGTGTGTGAGCCAGCACTTCCTGAAACACTATTTCGTCCGGAACAGCAACCTCTTTCAGTGCACCAACCCGATCGAACTGGACGCTGTGGCCCAAAAACTGGCCACCTTCCTGAAGAAGCCCCAGATCAGCCCGCCCTGATGGCTGCCCCAGCCTGGGAGGCTCTTGGACATTTTATTCTGGCTTAACCTTGTTCTTTGGATGGTTCCTAAGTCAGGTGCCAGGATCCTGCCTAGGAGAAAGGCCATGAATGGCAGCGGAAATTACATCAAACCAGTAACACTTCAGCAGGGAGGGAGGAAACTGTGCCCCAGGCTGTCTGGCCCAGGCCTCCCTGGAGCCCAGCAAGCATTTCCACCCTAGCTACCTCTCCTGGAGACGGCTCTCATCAGGCTGCCTCAGGCACAGATTTGGAACTGGTGACAGTTCTGAACTTAGTTTCCCTTGTTCAGGCTCTGATCGCCTCACAGTGAAGATGGAGACGGAACCCCTGGAAGACATGAGCCTGCTGGCCAATACTGTGCCCAGCCCACCGATCATGGGTGCATTCTCCTGCCATTTGTAAAATGGGAATGTTAACGTGCCTACCTCTGAGCAGGGCTGTGTGTCTATGAGACTGTGCTGGCGCCTTTTCAAGGGGAAGACATTGGATCAACACAAAGTGTTCCTGGTTGGTT
GAGCAGCTGGTGTTTGCATCCTGGATCGGTACCCACAGCACTGACGCAAAATTGCACCTGTTGAGTTAGCGAGCCTGTGCTTCCTTGCTGCCCTCCAGCTTCCTTAGCATGTGGGTCAGTGGCTCCTGAGGTTCTGTCTGCTTCTCTGGTATTCTCTAAGCAGGGACGGGAGTGGTTTTGATGACAAGTTTAAGTCAAAGATGAAAGCACAGCTGTTGGCCTGATCCCAACCGCAGCCCTCTCTTTGCTTCCCAGGCCATAGGCCATGGATGGAACTTCCTTATATATTTATGTAAATAACCTAGTACCATGATCTGCATGGAGTGACCTTAGGTGTCTGTCACCACTCATTGTGTTCCTTTGCTCACTTCATTCACTCACTCACTCATTGACAAATAATGCTCATTAGGCACCGGGAACACAGCAAAGAGCAAAGTGGATGAGGACCTCCCCCTGGGGATGCCGCCTAATGGTGGAGACAAGAAATGAACAACGGATAAACATGCACAGTTATTACAGATGGAAGCAAATGCTCCGAAGGAAATAAACAGAATGTTGAAGTAGAGTCCACAGAAGGGTCCCCAAAGGATGAAAATGCAAATAGCTGAAGGGGAAGGAAAAGTGACCAAAGGCAGGCCTGGCAGAGCTGGCATGAGTCAGAGCACCTGGCCTTGTAAAGCCAGGAAGGAATCAGTATTTTATTCTAAGATCAAAGGTGTGACATTTGGCCTCTGCAGAAGCGGAGGAGTATCACCATCTGACTGCATTTTAAACAATTGTTCTGGTAACTGCATGAAGAAGGTCTGGGGACTCACACGTGAGCCAGGAGCTCTTGAGCCACCCATTTGGAATTTCACAGAGGCCCACAAGGCAGCATATTCTGTGTAGCACAACTGATCAGGATTTCTAGGAGTTCTCGGTGAGATCAATGGTTTTTTTCTGGCGTTTACGTAATGCTTCTCAACTCAAGGGGCTCCTTTATTACTTTGGAATGTTTTTGCCCAAATATCTATACCAAAGATAAATTTCTAAAACATGAGCTACTGGTTTTGTTTTGATGAAAATTCACATTTGAAAATAAAAATGATTATTTTTCAAAAGTACTGTAACCAAATGGTGGGGTCCCTAGGCTATCGCATAACAAATAATGATTTTTAAAATATTGAAAACAAGTATTTCCAAACCAACAATGAGTTTACAATTTTTGAAAACATAAAGGCCTGGTGCAGTGGCTCATGCCTGTAACCCCAGCTCTGTGGGAGGCTGAGACAGGAGGGTCACTTGAGACCA\n>XM_033668712.1 Dothidotthia symphoricarpi CBS 119687 RTA1-domain-containing protein (P153DRAFT_369234), mRNA 
\nGATATCGACCATGAACATGAGACTCCGGAAAAGGTAAGATAGACGAATGCGAATGTAGAAACAACCAATGCGAGATTGTCAGACTTTGTCTACTCCATCGTTGGAATGTATTTAAGATGCTTTCTCACCTCCTTACTTTCCATGCACAGCTTCTCTTCCTGACGACGTACTGTATCCACTACTTCTACACTTGATCTTTAGTGTTTCATACACTCTCCACCGTTCCTAGTCTTTGGTACTATTCAAGCTGCAAGATGGCCAATCCTCCCAGCAGCAAATATTTTGACTGGAAGATGTACCGTTACGTCCCGTCCCTTGTCGGCGCAATAATTGCTATGATCATCTTCCTTATAATGGCTCTATTGCATTTCTGGCAGTTCCTAAAGCTTCGGAACTATATTGTCATCTTTGTGGTCATAGGAGCTATGTGCGAGGTTGGAGGGTTTGCAGCTCGAATTGGATCCCACTACGACAACGAAGAATGGGCAGCATACATCATTCAGGGTGTTCTACTCCTCGTTGGACCCCTATTCTATGCCGCGACAACTTATATGATGCTCGGAAGAACCATCCTACTCGCTGGGGGAGAAGATGTCTCTCTCATCAAACCAAAATGGTACACTCGCATCTTTGTCGCAGCAGATGTTAGCACTCTCATCATTCAAGGCCTTGGTGCCAGCATCATGGGCACCATGAAATTGAATCTCGCAATCGCAGGCGAGAAAGTAGTCATCGCTGGTCTCGCTCTCCAAGTCTTCACCTTCGTTGTCTTCCTCGTCGCGTCCGTCGATTTCCAGATCCGCATGAATCGCAAAGTCAACAACTACACGGCCACCGAAGATCTCTCGAACAACTGGAGAAAGATGCTTTGGATTTTGTATAGCGTCAGCACGCTCATTCTCTTCCGCTGTACTCTTCGCTTGATCGAGTATGCTATGGGTAACTCCGGCTATCTGATCGCGCATGAGTGGGCGCTGTATGCATTTGATGCTGTACCGATGTTCTTGGTGTTGATGCTGCTGCTGGTTCTGCAGCCGTCAAAGTATGTCCCGCAAAGTGACAGCAAGAAAGAGCACGGGAGTGATGAGGAGGTGGGAGTCGCGCAGAGTCAGTGACAGATCTATGCATGTTATGCTTATGCAAACTTTTAATATTGCTAGGGAAAAGGGTATTCTCATATTTCCTCAGTAGGAGTT\n>XR_003329731.1 PREDICTED: Papaver somniferum uncharacterized LOC113287130 (LOC113287130), transcript variant X3, ncRNA 
\nGCGAGAAGATAAAACCAGACATTCTCCCTCAAACCCCAAAAAGGAGGTTCCCCTACTACCAAAATCACCAGAGACTAATCTCTTCTTCTCGTCGTCTCTTGGATTGTGTATGCATTCATACTTATAAAGATGCTATTGAGGAGCATCAAACATTTATAGTAAGCAAGATTAATTTTGAAGAACACCGCCTACCTGCAGGTGGTTAAGGATCACAGTAATCATTGTTTGAGTCGTCAATTCGTGTTTGACGATGAGAGTGAAAAAGCTAATGCTGGCGCATTTACCAATTTGGAAGCGCTCAACTTTTTACGAGCTAGAGGAGCCTCAACAGATCCTACGAGTAGTTTCTCCTGTTTCTCCTTTTGAGTACCAGGTTTATGATTATTTGGTCAAAATTGCTGCTTATAGTCAAAGTACAAACACAAGAGAGTATCAATGAGTTCTTGAAGAGCTGTGAGAAATACAAACTTGCAAAAGCGGAGAAGCTCAACATCATTAAAACATTAGGCCGTCAACTCAAGAGGAAATTGACCCGGTATGTTTACTTTCAAAATCCCCTTTCAGTTCTTATTATATGTTTATTATTAATCATTGTTAGACACTCTTCTTTACGTATTAGCGTCCATAAATGACATCGTGCTTGTTTTGGTTTTCCTTTGTATTGACTAAATAAGGCATTTCAGAATTCTCTTGTGCATGCTGTAATTGTCAGGCTTAGTATAGACAGGAATAAATGAATAGAAATTCTTATGATCTGTCTACAGTTTTAACTGTTTCAAGATTCACTATCTCAGGAATTGGTGTGCAGACACTTCCACGCCTCCCAAATGTGTTTAAAATCTTGTTCCTTTATGCTTTAAAGTTAGTGTATCATCTAAATCTTTGTTAACCAATTTTAGATTTATGAACTCTTCTTGACGACCTCACCAGTCCCTGGGGTCTATATATTGTTTGAAATATGACCTAGTAGGCATGATTGTCTGAACCCTTACTTTTATCAAAATTGGCAATAAACGAGAGATCTTAAGATTCATCAATCTGGTAGCGAGACAACATAGATGATTGCCTCTCAATTGCGGAATCATAATTGTTCAGCATGTGTAGGCTAAATATGTTATACCTTCTGATTATATTAGATACCTTAAAACTTCCCACTTCCTAGATTCTTCTGCTTTTTAGCGTCTTTGAATTTATAGGCTCTGGCAAGATGTTTTCCATTGAGCAGATTATTGAAGAGTGTCAGAAATGCTTGGGAGATGAAGAAGTTGAAGAGTTGGTGGAGCTGATATCAAATTTATTTTGTCCACCACTCTGAAGGTACAGATGAGGGTAAAGGAATTCTTGATGGTTTCTGAATGGAAGGTAAAGATGATGTCAAAGGAGCTCCAGATGAGGAAGATACAGAAGGATTTTTTGACGGCTTTCTACTGAAAGATATAGATGCGGGTATAGAACTATAAATCTCTATCAACTTTATGGGAACTCTAAACGATCAACCAACTGCTATCTTTCTCAACCTTTTCATGTCATCTGTCTTGGTATTAAGAGGCAGAAATCTTTGTGAATTGAGACCTGAATTAACTGAACTTGTGCAAAAATATTCTATTCTTCATGTGAGCAGTTTCAGTCCAATTATGAGACCTGAATTAACTTGTGCAAAAATATTCTATTCTTCATAGGGAGGAATGTTTACATTCTGACGACAATGGATCAGAATGGTCAAGGACGCAAGAGCGGTGAACAGGATAAACTTTGGGAATTTGTTGATCCCATTGATAATCTTTTTCAAATCCCATCCGGAGTCATTCAGGTGTTACCTGACTTGCCCATGATTTGGGAGAATAATGTTCTTGTTCAAGGCATGTGGAGCAGCGAATGAAACCTAGAATGGATGCATGCAATTCATGATTTCCTTAAACCCTACAAACCCCTTCTCAACTCTCACGTCATCTATTTCTTCACTGATAAACTTTGGAAATGCATGTTGATCAACAACGT
CTTCATCATGACCCCATTGCAAATGTTTCTTCAAATTTTGAATCTGAGCTTGGGGTATGGATGCAGTTGAATTCAATCTTGTGTAGG\n>XM_053220790.1 PREDICTED: Acinonyx jubatus zona pellucida like domain containing 1 (LOC106972235), transcript variant X3, mRNA \nGAGACAGAGAGACAGAGAGAGCGTGAGCCGGGGAGGGGCAGAGAGAGAGGGAAACAGAATCCAAAGCAGGCTCCAGGGTCCCAGCTGTCAGCACAGAACCCGATGCATGGCTTGAACTCACAGACGAGATCGTGACCTGAGTGGAAGTCGGACGCTTAACAGACTGAGCCACTCAGATGCCCCTTATATTTCATTTTCTTAATGATGTCTTTTTTTTTTTTATAGTGAATGGTGTCTTTTGAAGTGCAAAGCTTTTAAGGTTTTATGAAGTCCAATTTATCAATATTTTCTTTTATGGATAGTGCTTTTGATATCATACTAAGAAATCTTTGTTTTCCTTAACCCAGGTCATAAAGATTCTCTCCTATGTTTTCTTCTACAAGTTGTATAGTTTTAATTCTTTACTATTTTGAAGGAGAGATAGAGAGACAGAGTGTGAGCAGGGGAGGGGCAGAGAGGGGGCAGAGATAGAGAGGGAGATACAGAATCCGAAGCAGGCTCCACACTCTGAGCTGTCAGCACAAAGCCTGGCCCCAGGCTCGAACTCATGGGCTGCAAGATCATGACCTGAGCCGAAGTCAGACACTTAACAGACTGAGCCACCCAAGCACCCCTTAATGCTTACATTTGGTAAGGGATTTTTGGTCTATGATTCACGTGGAGTTAATTTTTGTGTATGGTGTAAAGTAAGCGTCTAAATCCTTTTCCTTATGGGTATCTAGTTGTCTCAGCAGCATATGTTGAAAAGATGGCTCGTGTAATTGTTGACTCTGCTTTTACTACATTTGTGTCTTTAAAGAAAAGCTGAAGTAAGTAGGGCATAGAGAATTAATGTATTAATGAAGATGAAGAGATTCTTCTGTGTTGAGGTTTTAAGCACTTACATTAGATAAGGAACATCTGGTTGATGTTTTAAAGAATAACTCGAACCATAATTTCATTTCGTTTCCTTCGTCTCCCCCATTCCCTCCCCAGCTCTCCACTGAACATCTGCTTCTCTTATGTGAGGGGAAGTGAAAGATTTAGGTCAGGCATAAACACAAACTATCTTTACTGTATTGTTCCCTTTTAAGACCAAAATACCCACCCTGCCGGGCCAGTTTAGCACTACATTACCCTATATCAACAGATCTACTGCAATTTTTGGAAGCTGGCTTTCCCCAGGAAACAGAACTGCTATTGTTACTTCTCGGTGTTATGTAATAAATCTGGTGGGTCACTTTCAAGGATGTGAACAGGAATCGAGAAACACTGTCCTTCAAATATCACTTTTCTTTATGTTAGCTTTATTGATGAATTTCTCACAAGAAGTATCTTAAGAGACATCACTAGTGTTGTGAGCCCTCCGCATCCAGATCTCACATGTATCTATGGTGCTGGCTAGAGGTAACCCCAAATAAAAACAGTTTCCGTTGACTTCTGGCTTCACTGATGCAAGATAGCAAGACCTTGGGGAAGTCTATCTCCCCAAAATACCATCCATTTTGCTATCTTAAATCTTTGCAAAGAACAGGATGATTACATTTTCCTCTCTGGGAATTTACTGAGTTCCTCTGTTTTATGGCACTGACCTAGCAGCTCTAATTGGGGCACTCTTCTACCCGTGGCTTTGCTAAAAATCCCTCACAATCAGGACTGCAGTGTAATAATAATAATAATAATAATATAATGCAATAGCTCATATGTGTATAGCACTTATTATGCACCAGACCTTCTTTTCTTGCCTTACATATATTAACTCATTTAACTGTTCCCTGGAGGCGTACATTAAAGCTGGCATT
GCTGGAGGGTAATGAGTATAGAAGCAATTTAGTGTTTGGAGTATGATAAACTTCCATAAAATAGAAGGAAAGCCTTGAGATGATGCCTCAGGGATAAAATTGAACAGCCTGGTCCTTTTTGGGGTCTCATAATTTTTTCAGCTGTAGAACTCATTTGAGGGAAAAGTAACAGGTAGGAAACATTGGTTTTCATCACCTCGCTTTGGTTAGACATATGCTTTGGATATTCTTCCTCAAGCACCTTCAGAATCCCCATCCACTTCCATGTCTAGGCACTCACTTCAGTAGCCTGGCTCTGGGCCACTCTAGGGCTATCCAGCCTTCTCATTGTGAGGCTGGGTCCCTGTTGGTGCTTTCCTGTCCTGTGTTTCATTGTGGGAGCCGTTTGCTGGGAAGGGGCAGTTTCACCAACAAGGAGGAGGTCTTTTAAAATTCTAGCTCACTGTTGATCAGAACCAGGAATTTCCCTTAGTTTAAGATTTAGTTAGTAGACAGGGGCTCCTGGGTGGCTCTGTTGGCTGAGTGTTCGACTCTTGATCTCAGCTCAGGTCTTAATCTCACAATTTAGTTAGTACACAAACATTCTGGCTTTCTCTAAGTTTTTAGCCAGTTTTTTACATTTTAGTAGAAGATTCAGGAACACGTTTCTTGGGAGGAAAGAAAAGAAGAGGAGAGATTCTGGGGGCATAGCAAGGGGGAACAAAGAAGGGAAGAAAAGTTGGAGAGCCTCTGTGTACCTCAAAATTTTGCCGAGGGCCTTGCCTTGACAGTGGGGTGCAGATAGGTCCTTCATTGCTGTCCCCCAAATCTCACCAGCACTGTAACAGTGGCCTTCTATGAGTTGTGCACTCACCTTTGTCATCTGACACAGGGGAATGACTCAAATGGTTGGAACGTTCAGACAGGTAAGAAAGGAGACAGGTTATTACAGATGGGGGTGGGGAACTTGTTTTGGACAGGTAGTTCCTGGTGGCATCAGGGAAAACATGCCTTAGGTGGCTCTCTCTGACTGATACATTGACTGATCCTGCTAAGTCAGGAACATGACCAAGATGGCCTTATTTTCCTCAGCTTGACTAAACTTTAGACAGGTTTCTTAGTGACAATAGGTCACTGACCTCCCTTGTCTTAGAGCATTTACTTTAGAAAACTTACAATTGTAAATTCTTTATTTGCCCATCTGAGATGTAAATCTTTTCCTAGCCTCTTGCCCCTTTTACAACTGAGAACCATCTGTTTCAGAGACCTGGGAGACATCTTTTGAAATATTATCATCAAGAAAGGTAGCATCCAGGTCTCCCAGTTTCTGTAGGAGGGTAGGAACCTAGACTGGTGTCAGCAAACACAGATGGCCTAATCACATTGACCAAACTAATGTCCTCCAGTACTTTTCAACTAGCTAACCTCGGCCCTTAGAAACCTTCCTGCTTTTTTTTGTTTCTAGGGAAGTTAAGTTCTCTCTCCCCTTGAAGAAGACTTGAATTATGTCTTCTTCTTTTTCAGCCAAACTCTGTTCTGTGAAATTTTTCTTTGACATACAGACACTTGTGCAATATTTTATCTAAACTGACTCTCAGTGTGTTTGGAAAGCCATTAACCAAGAAGACAGGATAACTTTATCATGGTGCACTGTTTTCTGGACTCATTATTGGGGGTCTGACACCCACAGCATTTCATATGCTATTAATCACCTCCTCCAATAAACCCAAAACCCAAACCAGAATGCTTCTCATATTTCTTTGCCATAAGATACCTTATATATACACACGTATGAAAAGTATACATGCACAATGTTATATAGACAGACACACACAATTAGTAATAGCTATCATTTTTTTGTAGGTCTACTGTGTACTTTGTATACATACACATAGTACTTCATACATATTTCCTCATTTGATCCTTACATCATTTCTATGAATCAGGTATCATTTATCTCAAGATGAGGAAGCCAAGGCTGAGAGAGTGAAGTGACTACTTCAAATTGCTGTCAGAAGTGG
GATTTGAACCCAGTCAATCAGTCTACAAATCATGATATCAGGTTTCCAATTGTCTTTCAAAGATTCACTGAGCTACCTTGTTAGGATTCTGGTCCAGAGGGAAACCTGTATTTCCAGAAGGAATTAAGGAAGAACTTCTGTCACTGTCCCTTCATCCCTCCTCCCAGAAGCATTATAGAAGATTTTACTATTCCTTAGAGAACTTCATCTCAAAGTGTGTCCCAACTCTCACCTGTCACCTGTAATTTCTGCTTTGGGGTCTAGCCCCAAATCTTGAGGAAGACATTTTTTTTTCCAGTTAATTCATTTTTGAGAGAGAGACAGAGTGTGAGCAGGGGAGGGGCAGAGAGAGAGGAAGACACGGAATCGGAAGCAGGCTCCAGGCTCTGAGCTGTCAGCACAGAGCCCCACATGGGGCTCAAACCCAAGAACCACGAGATCATGCTCTGAGCCCAAGTCATCCGCTTAACTGACTGAGGCACCCATATGCCCCTTGAGGCAGCCATTCTGATCTTCATTTCAGGGTTGCTCTGACAAGGATAGTTGGGGATCTGCCCTGGTGCTTCCAGCACAGAGGATATATTCCTTCAGTGGACAGAGAAGATGGTAGCAACTTCCTCTCTGAGTCACGCATATTGTCTGTCATTCTGTCAACCATCTGTCCTATTAGCCACGCTTGGGTGATGAATAGAAAGAACTCAACGTACTGTGAGGTTACTAGGTTACAGCTTGTGACATCAGAATGCACAATGAACAGAGCATTAGAAAGTAGACAGCAATGGTTTCTACTTATTTCAAAATATCCATGATGCCAGAGAAATACATCCCTGTTAAAAAAACCTAGGTCTTTGTAGCTCCCTTTCCTTCTTTGACATGGAATGAAAGAGATGTTTCCAGAACTGGTCAACTTCAGTAACTTTTATATCAGAGTCTGTGCTTAAAAGTATCACAAACAAAACTTCAGAACAATCACACTACCTAGAAAAAGTATTTCTAGGACTCTGAGATGGTCCTTGCCCTGAGGAAGGTGGCAAGTCTTGTGTTTACTATGGGGCCTACCCCCTCTCCTATGGAACACAGTGAGGTTTTATTCTGTGAAAGCTGTGGGAAGCTCACCGTAGGTTGTGTACCTGAGCCACTTAGATTCAAGGCAGCAGTGGTGAGGTCACTAAAGTGACCTTCTCCTTTCTCCCAGATGGAGGGGCTCCTTCTCATGAGGACTCTAACACATACAGCTCTACACATACATAAAAACTTCACTTCCATTTATTACTGGATAGATTTTTTTCAGTGTTGATGAGATGTTTTGTAGAAATCAACATATACTGTCCACATAAGGAAAGTTTAAATGATTTAAAATATGTTTCCTAATTATAAGCACTTGTGGGAAATTTGGAAAGTACAGAAAAGAAAAAAAAATTACAATTGCATCAACCCGGAAGCAACCATCACTAACAGGTTTTTTTGTTTTCCTTTTGGTCTTTAATTTTGTAGCTCTGTTTTTGTTTGTTTTTTTCTTTTTCTTTATTATTATTTATTTTTGAGAGAGAGAGAGAGAGAGAGAGAGACAGACAGACTGTGTGTGTTTGGGGGGCGGGGGGAGAGGGAGACACAGAATCGAAGCAGGCTCCAGGATCCCAGCTGTCAGCACAGAGCCCCATGTGAGGCTCAAACTCACCAATCGCGAGACCATGACCTGAACCGCGAGATCATGATCTGAGCCGAAGTCTGCGGCGCTTAACAGACTGAGCCACTCAGGCGCCCGTTGGTTTGTTGTTTTCAAGTGAAGACGCTCCTGCCCAAAAGGAACTTACAACTTTAAGGGCAACACAAATGAGAAAAATGAAGACAAAATAAGACTGAAAACCAGAGAACATGATGATAATGATGATGGGCTCACTGATTTCTCCAAAGTGTCTCTGAGACACATACTGCCTGGAATCAGTCACTTCCTGCCTTGTCTGCCACCCATTGTGTAGCCACAAAGAATGTGTGTTCTG
TCAGCAGCTATAAAAGTACAGATCTGGGTGCTGATCAAGAATGTGAAGTGAGGCCTGAGAAAATGCAGAACTGAGTTGAAAGAAATGCAGAGTCATTAGCGTCTTAAGCCAATCATCACCCTAAAATGGTTTGAAGGGAGATATGGTAAACCCAAATCACTGTTTTAACTATAATGAAAGGTCAACCCAGCAATGGAAAGCAATGGACACATTTTATTTCCAAATGGTGATGCTGATCCATTTCAGTGTCTTCCTTCTGGGACAATGCAGTGAGAGCCAGTTGTCACTCAACACAAAGGTGTCTGTATTGTAGCTGCAAAAGAGGGTTATGGGATGGAGTGCCTGATAAGTTCCTCTAGATTGAGCTGTCAGCTGTGACCTCTCTGAGGAGGTGATCTAAGCTGCAATCTGAAAGGCAAGAAGGAGTCAGTGTGTGAAAATCTGTGAAAAAGTAACATCTGGCATAGAGATCTTAAGATTACATGGAGTATTTGCTTCCTGATCCTTCTTAATCTCTCTAGCCTGCATTTCTGAAAACTTGGGGAAGGCATACAAGCTTTGAAAAGACGGAAAATTTCTTAGCATAAATATCAGTAAAACAACTCTTTCCTATGGGATTTTGATGTCTCACTGAAGTAGCAATTAAAACTGGACTCTTTTGAAGTTGTTTATTCCAAGAATGCACCTTCTTGATTTTAAGGATGAAAAGATAGGAGCTGGAAGCAAACTGGATTCTGCTTCTCCAAACCTGAGCATATGTAAAAGAAAGCCTTTGCCCAGCAGAATTAGCAGATGGTCTAAATCCCCTTGGAGTACATGGGCTCAGTTCAACACTGATTTGGGATTATTCATTCAAAGTCCTTGGTCTTCTGGAACTTTAATAAGGCTTTCCCTCATCAGGCTGACGATGGCTCACTTCACACATAACCACTCAAGACTTCTGTGCAGCATAAAATAGAAGATCAAAAGCAGGGTTGAATCTTTTTTGAAAGAGTTTGGTAACACCAGGCATTTGAACACTCAGTCACATGCAGCAGAACCAGGCACATGGAGAACAGCTGATTCCACGAAACCAAGGGCTTGGGTTTTGCAATGGAACGAATATGGTTGCTGTTGCTTCTAACAAGTAGAGTGCTTCTGGGGTCTGCTCAGTTTAATGGCTACAACTGTGACGCCAACCTCCACAGTAGATTTCCTGCTGAAAGAGACATCAATGTCTATTGTGGGGTGCAGGCCATTACAATGAAGATTAATTTTTGCACAGTACTTTTCTCGGGTTATTCTGAAACAGATCTGGCACTGAACGGAAGGCATGGGGATTCCCACTGCAGGGGGTTCATCAATAACAACACCTTTCCCGCGGTGGTCATTTTCATCATCAATCTCAGCACCTTGGAGGGCTGTGGAAACAACTTAGTGGTATCCACAATTCCTGGAGTCAGTGCTTATGGGAATTCAACTTCAGTACAAATAGGAAATATTTCGGGATACATTGATACTCCAGACCCACCAACAATCATCAGCTATCTACCTGGGCTTCTTTACAAATTTAGTTGTAGTTATCCATTGGAATACCTGGTTAATAATACCCAGCTTGCCTCATCCTCAGCTGCTATTTCTGTGAGAGAGAACAATGGTACATTTGTCAGCACTTTGAACCTGCTCCTTTATAATGATTCAACCTACAGTCAGCAGTTAATTATCCCAAGTATAGGATTACCTTTGAAAACCAAAGTGTTTGCAGCTGTACAAGCCACTAATCTGGATGGCAGATGGAATGTCTTAATGGATTATTGCTACACAACCCCATCAGGGAACCCAAATGATGACGTTAGATATGATCTCTTCCTTAGCTGCGACAAAGATCCTCAGACCACTGTCATTGAAAATGGCAGAAGCCAGCAAGGCCGGTTTTCCTTTGAAGTGTTCCGATTTGTGAAACACAAGAATCAGAAAATGTCCACCGTCTTCCTGCACTGTGTTACCAAGCTCTGCAGAGC
TGATGACTGCCCCTTCCTTATGCCAATTTGCGGCCACAGAGAAAGGAGGGATGCAGGGAAGAGGACCACTTGGAGCCCCCAGAGCACGTCTGGAAATGCAGTCCTCTCTGCTGGTCCCATCATTACTCGGAGTGATGAGACTCCAACCAACAATTCACAGCTTGGTTCTCCAAGGGAACCTCCCTTCCAGCTGAATGCCATCACCAGTGCACTGATATCAGGAATGGTCATCCTGGGAGTGATGAGCTTTTCCCTTCTCCTGTGCTCACTGGCCCTTCTATACAGGAAGGCACCCACCAGTTTGGTGTTGAATGGCATAAGAAACCCAGTCTTTGACTGACTTTAACAGGTCCCTTCTCTCAGGAGGACTCACTGACTATACCCTGTGTTACTGCAGTCAGTGTTTTCATCCAAATTGAATGCCAGCCAGCATTTGATATTTGTAGGTTTGATAGATTTCACAGTGTAGTTCGTCAGCATGATGATAGTGAAAGAATTTGGGTGGTATTGTTCTCGTCGCGTAAGTATGTGGTCAGCCCTATTTGTATGGCACCAATGGGTAGAATGACAACAAGCCAACCATATTCAGGACTCAGATCTTACAAGATCAGTCATATTTCATTTTATTTCAATTTTCTTTTGATAATTGGTTGTTATAGAGATAAAAGGTGGGCATAGAAAAAATATACATTTGTTGCATTTTTCCCCCTAAGCATTTATATCCAATGTGCTGGCATTTAGATTGTTTATGTGGTCCTAAATTGAAAGTTACTTTTTTATTTGT\n>XM_019449735.1 PREDICTED: Panthera pardus microtubule associated protein RP/EB family member 3 (MAPRE3), transcript variant X4, mRNA \nTTGCAGATTTTCCAGACAGCTGGGGTATGGCCGTCAATGTGTACTCCACGTCCGTGACCAGTGAAAATCTGAGTCGCCATGATATGCTGGCATGGGTCAATGACTCCCTGCACCTCAACTATACCAAGATAGAACAGCTCTGTTCAGGGGCAGCCTATTGCCAGTTCATGGACATGCTCTTCCCCGGCTGTGTGCACTTGAGGAAGGTGAAGTTCCAGGCCAAACTAGAGCACGAATACATCCACAACTTCAAGGTGCTGCAAGCAGCTTTCAAGAAGATGGGTGTTGACAAAATAATTCCCGTAGAGAAATTAGTGAAAGGAAAATTCCAAGATAATTTTGAGTTTATTCAGTGGTTTAAGAAATTCTTTGACGCAAACTATGACGGAAAGGATTACAACCCTCTGCTGGCGCGGCAGGGCCAGGACGTAGCGCCCCCTCCTAACCCAGGTGATCAGATCTTCAACAAATCCAAGAAACTCATTGGCACAGCAGTTCCACAGAGGACGTCCCCCACAGGCCCCAAAAACATGCAGACCTCTGGCCGGCTGAGCAATGTGGCCCCACCCTGCATCCTCCGGAAGAACCCCCCATCAGCCCGGAATGGCGGCCATGAGACCGATGCCCAGATTCTCGAACTCAATCAGCAGCTATTGGATTTGAAGCTGACGGTGGATGGGCTGGAGAAGGAGCGTGACTTCTACTTCAGCAAACTTCGAGACATCGAGCTCATCTGCCAGGAACACGAAAGTGAGAACAGCCCTGTTATCTCAGGCATCATAGGCATTCTCTATGCCACCGAGGAAGGATTTGCACCCCCTGAGGACGATGAGATTGAGGAACACCAACAGGAAGACCAAGACGAGTACTGAGGGCGGCCCCAGCCCTGGCTGACTGCACGGCTGCCGTGCCTCCCCGCCCTGCTCCTGCCCCACATTATAATCCTTTCCTTACAGC\n>XM_044229603.1 PREDICTED: Neovison vison NOVA alternative splicing regulator 1 (NOVA1), transcript variant X2, mRNA 
\nGAAAAGAAAAGAAAGAAAGAAAGAAAGAAAAGAAAAAAAAAGAAAGAAAAGAAAGAAAAAAAAAAGCCAAAACAAAAGGGAGAACCTTCTCCCCGTAGCAGCGGCAGGAACTGCAAACATGATGGCGGCAGCTCCCATCCAGCAGAACGGGACCCACACTGGGGTTCCCATAGACCTGGACCCGCCGGACTCGCGGAAAAGGCCGCTGGAAGCCCCCCCTGAAGCCGGCAGCACCAAGAGGACCAATACGGGCGAAGACGGCCAGTATTTTCTAAAGGTTCTCATACCTAGTTATGCTGCTGGATCTATAATTGGGAAGGGAGGACAGACAATTGTTCAGTTGCAAAAAGAAACTGGAGCCACCATCAAGCTGTCTAAGTCCAAAGATTTTTACCCAGGTACTACTGAAAGAGTATGCTTGATCCAGGGAACAGTTGAAGCACTGAATGCAGTTCATGGATTCATTGCAGAAAAAATTCGAGAAATGCCCCAAAATGTGGCCAAGACAGAACCAGTCAGTATTCTACAACCCCAAACCACCGTTAATCCAGATCGCATCAAACAAACATTGCCATCTTCCCCAACTACCACCAAGTCCTCTCCATCTGATCCCATGACCACCTCCAGAGCTAATCAGGTTAGACTATTTCCACAGGTCAGAGTGGCAGACTGTAACTACAGTAGTGGGTCTATAATAATTTCCCCCTGAAAATTGAAGGACAGTCGCAAAGAGAAGTC\n>XR_007719743.1 PREDICTED: Macaca thibetana thibetana uncharacterized LOC126937484 (LOC126937484), transcript variant X3, ncRNA \nCCCTGCTTGCAGTTCCCCCTTCTGTAGGGCCCCCATGCTCCTGTCCCACCCCCTCTACTCGGCGTCCGGGTGCTGGGTCGAGACGTGTGTGGGTGTTGGGAGGTGGATATCTCTTTTCCGAGCCGTAGGCGTCACCCCTACGCCCAGGCCCAGGCCCAGTGCTGGATCCTGCACTTTCCCAACCTCCCCCTCCCAAGTTACAAGGTTGCCCTCTGTTCCCCTCCCGAGCGCAGGTGACGAGCTGCTGAGACAGTGTCTGATTCACCGACAGCTGAACCAGCTACTGGTACTTGGGGAGACAGAGTCTTGCTATGTTTCCCAAGCAAATTTCAAACTCTGACCTGAAGTCGTCTTCCCACCTCAGCCTCCCAAAGTGTTGGGATTATAGGTGTGAGCCACTGCAACTGGCCCAGAACTGGAGTATTTATCCACCCAATCCTTGAACAAACCAGCAGACCAATTCAGAGTCCATTTCAGTGGTGCAGGTGAGAGGTATTAGAGACCTGGACAAGGTGGTGGCAGATGAAGATGGAGAGAACAGAGATAGGATCTCACTGTGTTGCCCAGGCTGACCTCCTGCCTTATACACCACCTCACCAAGCTTAACAGGGTGAAAATATAGGAGATGACGATCCATTCCTGGGTGGACGGCCAGCGTTCCATCTTCACTAACACGATATAGTTGAAGAGCATCAGGTATCCGATATACGCCAGCTGTAAGGAAATACAATACAGTGGTCTGGCTGTTCAGGCCCAGGAGCCTCAGCGTCAGCCACGGCCACTGCACAGCAGCACAAAACAAGGCCCAGTGACATGCACATTCTTCCAGAACCTCTGCATTTTAGTACCCACTTCACACCTTGAATTTGAATCCTCTCCAGCCGGATACCTGAAATAGGCTCTCAACACAAGCAGGGTCGAGGAGCCAGCTGGACCCCTGCCTGCTTTCTTCTCGGACCAGAAGAGGACCCAACCTACTCCTAGAGAAACTTGCTACAATGCAGAAGTGAGGTTACATGGAAATGAGGTGTGTCCTACCTTTCAGAAACTTGGGAGAGTAGGACACACCATTTTTGGAAATCTGGTGAGAAATACTCTTACAGAGAAAAACACAGCCCCAAGTAAAGT
ACATGGGACCTTCAATCTGAAACTGAATTGTATTGTTAGGCATGTCTGGTGATTCAAAAGACTGGCATACCTCATTTCCGATCACTTCCTCGAGGCCTGGGCTTTGTCGATACGTGAAGATGAATTTTGGAGAATCATGAAAACACAACTGAACGGATCTGGGGGATCCAGTCTGATGGGTTTACTGAGGCCAACTCAGCCATGCAGAAGAGTGCTGGACACACAGGCCCCACCCCCCAAAGAGGCAGCCTCCCAACAAGCTGCCAATGACATAAGCAAAGCAGCGTGTCTCAAGCATCTCTAATCACAAGTTTCGCCTGGGAAGCTAGTTAAACTAACACAGCCTCTTAGGCTCCTTCATGAAGATTTGATTCCATGGGTCTATGATGGGGCTAGAAATTCGCATTTCTAACAAAACGCCCTTGTCATCATGGAAGTTTTAGAAATGTTGATACTATTACGTCTACTGATTTCTGCTCTCAGCAGTCTGTAAACTTTTTCTGCAAATGGCCAACTGGTTAACAACTTTTAAGGCTTTGTAGACCTGATAGTCTCTCTCTGTCTCTCACTACTCATTAACTCGATGTGGTAGTACAAAAGCAGGCAGCCTACTGGTAATGTTAAATGAGGTTTAGCCTAAAGCTGCCTCCTTACATATTTTAAGTTCGGCCTAAAGTTTTCTCTGTACATTGTGAACTATAACAAATGAAGGTGTAACAAGACCAATCACTGAATTTCAGTCAATCAAATGTAGCCAACTGCTCAAAATGTGTTCAAATAAGGTAAATGCTGAGCTGTAACCAATCCAGCTGTTTGTGTACGTCACTTCCGTTTTCTGTCCATAATTCTTCCACCACGTGGCCCTGCTGGAGTCTCTGAGCCTCCTCTGGCTTGGAAGGCTGTCCCATTCACGAATTGTTCATTGCTCAGTTAAATTCCTTTAACAGAAATTAAGAGTCTGCCTGTGCTCCAATTCTTTATGGACACTACAATTTGAATATATGTCTCAAGTATTCCTTTTTAAATTTTATTTTGACCCTTTAAAAATGTAAAAACCATTCTTAGTTTGCAGGCCACAGTCATAGGCCATGGGTTGAATTTGGCCCGAGAGCTGTAGTTTGCCAAGCGTTGTTCTAAGCTAACAGTTGGGGTATCATAATATTAAAGGAAGGACAGACCTGGGTGTAAAATAGCTCCAAAAATATTATCTTAGGCTGGGTGCAGTGGCTATTGCCTATAATCCCAGTACTTTGGGAGGCTGACGCAGGCCCATAGATC\n>XM_032774723.1 PREDICTED: Chelonoidis abingdonii docking protein 5 (DOK5), transcript variant X4, mRNA 
\nGTCAGCTGATGCAGAAGGGTCCTCTAGCCTCTTCCCCCCTCTCCTGAGTGGATTAAAACTCTGGCCGCTGAGTTTCTGGGTCAGGAGGATTATTCCAAGTGATGTGAATCATTTCAGCTACCGACTGGATTCAACTTGGGCTAGCGGCTCCTCCCCACAAAAAGGATGGCTGCCAATTTTAATGACATAGTGAAGCAAGGGTATGTAAAGATTAGGAGCAGACGTTTAGGTATTTATCAGAGATGCTGGTTAGTTTTCAAGAAAGCTTCAAGCAAAGGGCCAAAACGACTGGAGAAGTTTTCAGATGAGCGTGCTGCCTATTTTAGGTGCTATCACAAGGTCACGGAACTCAATAATGTGAAGAATATATTACGACTGCCAAAAAACACGAAGAAACATGCTGTAGGCATTTATTTTAATGATGACACATCCAAAACCTTTGCTTGTGAATCAGAACTCGAGGCGGATGAGTGGTGCAAAGTGCTGCAGATGGAATGCCTAGGAACTCAGATTAATGACATAAGCCTTGGAGAGCCTGACTTGTTGGCATCTGGTGTAGAAAGGGAGCAGAGTGAGAGATTCAATGTGTATTTAATGCCATCCCCTAATTTAGAGGTGCATGGGGAATGTACCTTGCAGATAACATTTGAGCATATCTGTCTTTGGGATATCCAGAATCCCAGAGTAAAACTCATCTCTTGGCCATTAAGTGCCCTCCGGCGATATGGACGAGACCCAGCTTGGTTTACATTTGAAGCAGGGAGGATGTGTGACACTGGGGAAGGACTATTCATCTTTCAGACAAGAGATGGGGAGGCGATCTATCAGAAGGTTCACTCAGCTGCTTTGGCCATAGCAGAACAACATGAGCGCTTATTGCAGAGTGTGAAAAATTCAGTGCTTCAAATGAAAATGAGCGAGCGAGCCGTCTCCCTCAACACCATAGTGCCCCTGCCTCGGAGTGCCTACTGGCAGCACATTACACGGCAACACAGTATGGGCCAGCTCTATGGCCTACAAGATGTTTCAAGCCCCCTGAAGCTTCATCGAACAGACACTTTCCCCACTTACAGATCAGAGCATTGATAAGACTGTAAAGGATTTGAAAACTCTCTCTGTCTTGTGACAGCTTGGCCCAGCGGATAATAATGATGACAGCAAGCAAACAAAGTTGGAAATGCAGAAAAAGTCGGCTTGGATTGAATTAAGTCCTTGAATATATATATTTTTTTTTAACCTTGGCAAGAAAGGAATGTATTCTGTAGGTATTTAAAAAAATGCCAAACCAACTATCACACAGTTATTTAATATTTTACACCGGGAGGGGACAGAAATCAGCCCCTAAATGTTACTGAATGTTTTTATATGATAGATATATGTTGCAAATATATGAATTTGTCTTATGATGTGGGGTACTGTGATACCACTTAGTCTGTTTCAGCAGTGTTTGTGTTGACGTCAGCTGTGCCAGCAATCTCATGGTTCCTGTTTGCTGTAACTCATACCCTTTAGTTGTTAACATTATTGATTAAGACTAATCTTTGACTATAGTACTGATGGCCAGTTTTAAGCAGGAATTGTATCTGTTTTTCTTGTGTGAAGTCTCCTTGAGTCCTGATAGACTTTTAAAAGG\n>KF434600.1 Uncultured bacterium clone SNGUT_M7 16S ribosomal RNA gene, partial sequence 
\nCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGCGGGGAGGAAGGCGGTGAGGTTAATAACCTCATCGATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTCTGTCAAGTCGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTCGAAACTGGCAGGCTAGAGTCTTGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTTAGATAACCCTGGTAGTCCACGCCGTAAACGGATGTCGATTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAATCGACCGCCTGGGGAGTACGGCCGCAAGGGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCACAGAACTTTCCAGAGATGGATTGGTGCCTTCGGGAACTGTGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGGTTCAGGCCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGCATATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGACCTCA\n>XM_052950715.1 PREDICTED: Mya arenaria nephrin-like (LOC128235928), mRNA \nATGAGGGAACAACAGATTGTTGGTATCACCACGGTGACGTTATCTCCCGGCACCGATCCTATCAACGTGATAGAGAATACACAAACGACACTGCAGTGCCGAACATCGGGCGGGTTACCGGCAGCCTCGGTCAGATGGTTCATCCAGGGGTCAGGGCAGGTGCAAGACGTAACGTCGCTCTCCGCGAACACGTACCAAGAGGAGGACAACCTTAACGTGACGCTTAGCACACTTAACTACACCCCGTTAACAGCTGACCAGAATGGCCAGATATACTGTTCAGCAAACAATATGGGAGTGAGGAGAAATTCCACAAAGCTTTATATAAATGTATTTTACGGACCTGATAGACCGCTGTGCAAAACAAACAACTTCAACATAACTTCAGTATTGAAGGTCATTATTAGTACCACATTCACCATCTCCTGCACAGTTGACAGTAATCCAGCGCCATATTCGTGGCAGTGGTCACCTTCTGGAGGGAGCAGTCAACAGTTAGGCTTCACAAACATACAGAGGATACAGGGCGGAGAGTACACACTTCAGGTTTTGAACAGAATGGCTGTCACTGGGAGTAACAGTTTAGTCGATGGCAGTAACGCGACGTCTTTTACAGTGGATGTTTTGTTTCCCCCTGCTGTGCCAACATTACGCATGAGCGGTAAAGAGGTTATGGGTACGGTCAAGGTCATCGAAGGTAACAGCAAGACGTTCAACTGCAGCACAGAGAGTAACCCGACCAGTAGCTACAGCTGGACGTACCCACGAGGCTCAAGTTCTAACAACATCTTGCAAGTGAGCGACTTCCAGCCAGGCTCCTACGACGGCGATTACACGTGTCAAGTTCAGAACAGAATGGAGCCATCGTTTGGCAATTCAAAGGAGAATGTATCCCTGAAAACTATATCTGTCGATGTTTTGTATGGCCCGAAAACGGGGAATTTGCCGAACGCAAGTAAAGTTCGCGGGGAAAACCTTGTTTACCAGTGTTTGTACATACCTGGCAACCCTCC
AACTGTTGACTTTGAGTGGACGAAATCCGGAACAGAGGTCTCCTGGGTCAAACAGAACACACAGAATTTGACCATTCTAAACCTGCAGCGCTCTGACGAGGCCAGTTACACGTGCAAGGTGTCCAGTGTTCTCCAGCCGACGTTGACATTAGCGACGACCACACAGTATGATACTGCAACATTTTTTCTAGATATTCTTTATGGGGCGGAAAATTTGCTGTTGCAACTCAACAACGTTTCCCAATCGTCTGTACAAATTGATGAACATTCATCAAACCATATGCGATGTTCGCTAGAAAGTGATCCCGGCTCGAATATGGCCCTTACAAAAGACGGTAAAACGATAATTGCACGATCTGGAGTACATCAACTCACACATGGAATACAGGCTGAATGTTCGGACGCAGGAGTGTATACGTGCTCAGGATACAACCAGTACGGAGCAGCAGATAACGCGTCAGTGCAGTTATTTGTAAAATGTTCCGCGAGGCGACCCACTGGGGTGGAGGTACAGCTTAATTTCACCGCACGCAAACATGAAAATGCAACATTAGTCTACAAAATAGTCGCCTACCCTGTGCCCAAGCCCCAAGAGTTTGTTTGGACGCGCTGTACGAATCGCACTTCTTGTGAACTTGTGCCGGATGAAATGAACAAATTTGAAATTTACACAGAGGGTCTATCAAGTAAATTAACGATTCTGGACGTTCAGATTGAAGATTACAGACTATACCAATTGTTAGTGTATAATGGAGTTGGTGATACACTAGTCGAATGGTTACACCTCAGACCCATCGGAAAATCGGATTCGCCAATGGACTTCCACGTTATTCAAGATACAATACGCGAAACAAGTGCTGTATTGACCTGGATTGCCGGATTTGACAACGGGTCTCCTCAGGAATTTCACATCTCCTATGGAAAGGTTGCTGATGACACTGGATATATTACACAAAATGTAAAACATGACAACAGAGTCGAGATGAATTACACAGTTGTAAATTTAAAACCTGGAACCGAATACTTTGTCTCACTAATTTCGGCAAACGAGGAGGGTTCTTCTGCACCGGTGAACGTTACATTTTTAACTCTAAAACGTATTAATGATCAAACTCAGACTAGTCCAAATACTGGTCCTGTTTTTGGAGGGGCAGTTGGCGGAACTGTTGGTGCAATAGTGGCAATAGTTGTCGTCGTTATCATTCTCAGGCGGAACTACGCACTAAATTGCAACGTAACCTGGACAAAGAGAGGTGAACCTTCCGAGCATTCCATATCCGGAAAAGACAACCCCGGATATAACGCAGCCGAGACGTACGAGGTCGTTTCCAGGACAACGGATACATCGGCATACAATGATCTAAAAAATGATGACAGCGGAGCCGATAACTCGCACGTGTATACGTCGTTGGAGGAGTCAAAGGCACCTGTTTACTACGAAAATGTAAAGAAAGATGATCCCATATACAACAATACTGCGCTGCAGAATCCGGTGCAAACAGTGCTTTAAATGTACACATCCATACAACAATGTGAAGATATGGCATTTTACAATGTCATTTACTTACCCAGTGAAATATCGAATACTAAACCAGCACTATATCAACGAAGTATGGATTGCATAATATTTGTTATCAAAATGTTTCATACTTCATAAAATTATATTGATT\n>XR_003276401.1 PREDICTED: Carassius auratus uncharacterized LOC113048120 (LOC113048120), ncRNA 
\nTTTTGAACAATTCTTGAGAGAGAAAAAAAACAGTGATTCTTTTACGTCCTGACGCAATAACGTCCGTACGTCTTTGCCTTGCGTGCTTTAAAATATTCCGATAAAGCCATATTAGGTTTTTGTAAAACCATGTCATTTAGGATACGCGTTAATAAAATTATCAAACAATCGTCGTAAATACATTTATTTTGTAACATTACTGCTCTTTGGCCACTAATGTAACTTTTAGCGCGGTAAAAATAAATAAATAAATAACAATAATAATTGTAAGCACGAGCTTTTGATTCGGGAACAGCTTGGACCGATTAGTGGAGCCAGGAAATGATCAGACTGGTTTTGGGAACCGCGTTAAGTGATTCAATGAGAAGATTAACCTCAAAAGAAACCACGCTTTCAATCGCGGGAATTTCTACAAACGCTGGAATCTCCCCCTTCACACGGAGGGATTTTATATGATGTCATGACGCGGGAAGGCAAAACGCACACATCCACTGACACAGCTGTAATACATTCCCACGCAAGCGAGACCACCATCCCGCCTGAAAAGCCTGGACATCCGTAGTGAAACATGTCTGGAATCGGCTTTCTGAAGATCTACTTCATTGGAACCGCGGTTTCTTTTCTGGTGGCTCTGTTTGGACTGGTTGATTCAGTCGGGGGTCTGATGTATCCTCAAGCCCCAGACTGGGCAGACGACAGCTGGACAGAGAAGCATCCGACCGTGTCTCCATCACAGACTGCTGCTGCCAGCAACACCAAGCGCAACGGATCGACATGATCTTCTCCGCTACCGTGGCTCGAGAGTCTAGCCTCGGGAATAATAGCCTCGGTTTACTGACCTACTAAAGCCTACTGTGGAACTACAATCTTCTACAATTTTCACTACTGCGGTCTGTGTCGTGTGAAATATGAGACATGAACACAATGGCTTGTGAGGTGCCAGCTCTTCACACTCGTTACGTTTTTACTTTGTTATTCTGGTTTCTGCAAAAACTTTAAATGAAAAAAGGGAAAAATTCTTCCGGAGAGGTTGAAAGCATAAAAATACTACAAATATGCAACATGAATTTGCTGGGCTGCCTTGGAATATTGAAATCCCTCTGTGGTCGATTGTTTTTGTAATGGGTTTTAAGTAGTTTTTGTAATGTTTGTTCCTTTTTTATATGCCGTTTATATGAAGATAAATGTAACACTCAGAATGTAAACATATGTGTAAGATGCTGTTTACCATGAGCAACTGTGGCATTAGGCAGCAAAAAGTGCACTCCCAATATGGCTAAAGGGTGTCTAAAAGATATCAGCTAGATATCTTTCAAATAGATAAGTTGGGTTATGTTACTGAAATTCACTGTTTTGTATTGAACTGAATACAATGTATACAGTTGCATTGTACATCACTAAAGCAGCCTGTTTTTGTGCTCTAAAAAGTTGTCAATTTTAATTAGAAAAATTTCCATTTGCTAAACTTTCAAATTACTTATTTCTAGTCATATTTTTGCTAAACTTTGTGTGTTGTGAACTTGTGATCATAACTGTTTATTGTGAAATGTTGTTAATGGTGTGGATTTTCCATTGAAATACTCTCGTCTTTACCTTTTACATGTCTTTGAAAAGCTGTAAATTGCAAATTGGCAGCTTTGGAAAAAAAAAAAACCTGTCATAGATGATTAAACAACATTACTATA\n>XM_017265421.2 PREDICTED: Drosophila elegans E3 ubiquitin-protein ligase Ufd4 (LOC108141837), mRNA 
\nATAATCAATTTTCGAGCTGCTGGACTGGATATTTGTGTGAATAAAAATAGTGTGGTGTATTGAGTAATTGTAGAAAAGCTTTAAAAAAGCAGCTTTAAAAAAGCAAGCACCAGCAAAATATTCAATATAATGCAAAAAAGATTTGGTTAAGCATAAATCAAATTTCGATTTGCGATGGGCGATGTCGATCCCGAGACGCTGCTGGAATGGTTGTCCATGGGACAAGGAGATGAGCGGGATATGCAACTGATTGCGCTGGAGCAGCTTTGTATGCTGCTCCTGATGTCTGATAATGTAGATCGTTGCTTCGAAAGCTGTCCTCCTCGAACATTTTTGCCGGCGCTATGCAAGATATTCCTAGACGAACTGGCACCTGAAAATGTACTCGAGGTCACTGCGCGAGCCATCACCTATTACCTGGATGTGTCGGCGGAGTGCACCAGGCGCATCGTTTCGATTGATGGAGCCATCAAAGCCATATGCAACCATCTTGTGGTTACGGATTTGTCATCGCGAACATCTCGCGATCTGGCCGAGCAATGTATCAAAGTGCTTGAACTGATTTGCACCCGAGAAGCGGGCGCCGTCTTTGAGGGCGGTGGCCTCAACTGCGTCCTGTCCTTTATTAGGGACTGCGGATCGCAAGTTCACAAGGACACCCTACATTCGGCCATGTCCGTTGTATCCAGGCTCTGCACCAAGGTGGAGCCCAACACGCCGTGCATTCAGAACTGCGTCGAGAGTCTGAGCACTCTGCTGCAACACGAGGATGCCATGGTATCCGATGGCGCTTTGAAGTGCTTTGCCTCCGTGGCCGACCGATTCACACGAAAGTGGGTTGATCCAGCGCCGCTGGCAGAGTACGGTTTGACCACTGAGTTGCTCAAGCGCCTCAAGAGTGTCGGCGGAAACACACACTCTTCGCTGTCTGCGGCAGGAGCCCAGCCGACTAGCTCTAGCCAACCCGCTGCGGCCACAAACTCGGATGCAATCAATGAAAACGTAGCGGGCAATGCAACCATTTCCAGCAGCACCAAGGTCAAGGCATCCGATGTGGCCGCATCGCCACAGTCGATATCGACTACAATTTCCTTGCTGTCGACACTTTGCCGCGGATCTCCTTCCATCACCCATGATATTCTGCGTTCCCAGTTGGCTGACGCCCTCGAAAGAGCCTTGCAGGGCGATGAGCGATGCGTGCTGGACTGCATGCGATTCGCAGATCTCTTGCTTTTACTTTTGTTCGAGGGGCGCCAGGCCTTGAACCGAGGAAGTAACAATCCCAATCAGGGACAATTGGCGCCACGACCCAGGCGCAACAACACCAACACCGATCGCACGCATCGCCAGCTTATCGACTGCATACGATCGAAGGACTCGGAGGCGCTTCGCGAGGCCATCGAATCTGGGGGCATAGACGTCAACTGTATGGACGATGTGGGTCAAACCCTTCTCAACTGGGCTTCAGCCTTTGGCACACTGGAAATGGTGGAATATTTGTGTGAGAAGGGAGCGGATGTCAACAAGGGCCAGCGGAGTTCTTCCCTTCACTACGCCGCATGCTTTGGTCGACCGGCCATTGCGAAAATCCTGCTTAAATTCGGAGCCTATCCGGACCTGCGCGATGAGGATGGTAAAACACCATTAGATAAGGCACGCGAAAGATTGGACGATGGACATCGGGAAGTGGCAGCTATTTTGCAGTCACCGGGAGAGTGGATGTCTCCCGATCACTCGCTGCTCAACAAGGACGGAAAAAAGTATACGTTGATGGAGCCCAGGGGTGATCCTGAAATGGCGCCCATTTACCTCAAGGTACTGCTGCCCATATTCTGTCGGACCTTCTTGGGCTCCATGTTGGGCAGTGTGCGACGGGCCAGTTTGGCCCTGATAAAGAAGATTGTACAATATGCGTACCCAACGGTGCTCCAAAGTCTCAGTGAAACCAGTTTTAGCGAAGATGAGCCGTCAACATCGAGCCAAAATGGTGGTAACCTA
CTTATCGAAGTGGTCGCTAGTGTCCTAGACAACGAGGATGACGACGACGGGCACTTAATTGTTTTAAATATTATTGAGGAAATTATGTGTAAGACACAAGAGGAATTTCTCGACCACTTTGCAAGACTAGGAGTGTTTGCTAAAGTTCAAAACCTGATGGACAATGATGCAGAGGAATTGTATGTGCAATTATCAGGAAACCCCGATGAACCAGCTGTCGTGCAGAGATCATCGACCAGTGTTGTAGTCTCCCCAAGATCAACTTCAGATGATCCTATGGAGGACGCAAAGGAGATATTGCAAGGAAAGCCTTATCACTGGCGAGAGTGGAGCATTTGCAGGGGTCGAGATTGCTTGTACGTCTGGTCGGACTCGGTGGCTCTAGAGCTTTCCAACGGCTCTAACGGGTGGTTCCGTTTCATAATCGATGGAAAGCTAGCAACGATGTACTCCAGTGGAAGTCCAGAAAACGGAAATGACAGTTCTGAAAATCGAGGAGAGTTTCTTGAGAAGCTTATGCGTGCACGTTCCTGCGTAATTCCAGGAGTTGTATCCCAGCCCATTTTGCCCACTGCAAGTGCTCTACGATTGGTTGTTGGTAACTGGGTCCTGCAGTCGCATAAAACAAATCAACTTCAAATTCACAACACCGAAGGCCATCAGGTAACCGTGTTACAGGACGATTTGCCTGGCTTTATCTTTGAAAGCAACCGTGGAACGAAGCATACCTTCACGGCTGAAACTGTCTTGGGTCCCGATTTTGCCTCCGGTTGGTCAACGGCTAAAAAGAAACGCAACAAGTCCAAGACCGAGGGTCAAAAGTCTCAAGTTCGCAACTTATCCCGCGAAATTTACAACAAGTACTTCAAGTCTGCCCAAACGATTCCTCGCGGAGCGGTGGCAATACTTACGGACATTGTGAAGCAAATTGAATTATCCTTTGAGGAGCAGCACATGGCACCAAATGGAAACTGGGAGACAACACTCTCGGACGCCCTAATGAAGCTGTCTCAATTGATCCATGAAGATGGTGTCGTGAGCGCCTACGAAATGCACTCGTCGGGATTGGTGCAAGCGTTAGTGGCCGTTTTGTCGGTTAACCATTGGGAAAATAATTCACCTCGATGCAAACGAAATAAAATGCAAAAACAACGAGTTTCCGTATTCAAGAAATGCATACTGGAGGATAACGTTGAATCCGCAACGAATAAGCCGCGAACTAAGAGCACTGCAAGTATTTTAATACAGAAACTTGTATCGGTTCTGGAGAGCACAGAGAAGCTACCAGTGTACTTGTATGACACTCCATGCACTGGTTACAGCTTGCAAATTCTGCAGAAACGACTTCGCTTCCGTTTGGAGCGAGCAGAATGCGAGAGCACTTTATTCGACCGATCCGGTCGAACTCTAAAAATGGAACCTTTGGCCACAATTGGACAACTATCCAAGTATCTGCTGAAAATGGTGGCCAAACAATGGTACGACCTCGATCGGTCCACATATTTTTATTTGAAAAAAATACGCGAACATCGGACCGGCACTGTGTTTACGCACTTATTTGACTTTGACGAAGAGGGTTTGTTGTTCTACATTGGCTCTAATGCAAAGACTTGCGATTGGGTCAACCCAGCGCAATATGGACTTGTGCAAGTGACCAGCTCGGAGGGGAAGACCTTGCCATATGGCAAACTGGAGGATATTCTGTCTCGCGACAGCATCTCACTCAATTGTCACACCAAGGACAACAAGAAGGCCTGGTTTGCCATCGACTTGGGCGTGTATATAATACCCACTGCGTACACGCTTCGTCATGCGCGCGGTTATGGAAGGTCGGCTCTGAGGAACTGGCTTCTCCAGGGATCAAAGGATGGCCTAAGTTGGACAACCCTCAGCTCACACGTGGATGACAAGAGTCTCGTGGAGCCCGGTAGCACAGCGACTTGGCCCATAACGTGTGCAGCTGACGACTCGGTTAGATATAGGCACATCAGAATCCAGCA
AAATGGACGCAATGCATCTGGCCAGACCCATTATTTGAGTTTGAGTGGATTCGAGATCTATGGTCGCGTCGTCGGAGTTGCCGACGACATTGGCAAGAGCGTCAAGGAGGCTGAGGCAAAAATTAGGCGCGAGAGGCGACAAATAAGAGCTCAGCTCAAGCATATGACTACCGGTGCTCGAGTAATTCGAGGCGTCGACTGGCGGTGGGAGGATCAGGATGGTTGTGCCGAGGGCACAATAACCGGTGAAATTCACAACGGCTGGATCGATGTGAAGTGGGACCACGGCGTACGCAACTCGTATCGCATGGGAGCCGAAGGGAAGTACGACTTAAAGATGGCCGATTGCGAATATCTTTCCGTATTCGAAGGAAACCAGTCGATGGTTACTGTGAACGCGGCTGCAAAAATAAACGATAAATCAAACACGCTCACCTCGCGCAAATCAAGTTCAACTCCATCCCTGCCCGAAGCCACTGAAAAGAATCAAAACGCTGAAGGTGCGTCCAATCAAACCGTTTCGGCTGATAACTTGGCCTGGAAACAGGCGGTGGAGACGATTGCAGAGAACGTGTTTGCTTCGGCAAAGACACAGATTATCTCAAATCAACTGGCTATGAACACGTCATCCTCTCGGGAAGTTCGAACCAAGCACAAGGAGTCGGCTGCCAACCAAATGCATAAGGATAACATAAGTGGACCGTCGCCATTGAGTCGCGAGCTGGAGCACATATCGGACTTGTCGGCCATCAACAACTCGATGCCGGCAATTAACTCAAATATTGTTTCCGATCTAGCTACCATTTCGGAGAACCTATCCCTAGCTGAATTGTCCAAAGAAAACATATGCAGTGTCCTTTCGCCTTCATATAAGCCCGCTGAGGCTGTTGCTGCGAGTCAAAGCTCAAGCCTTCCCGATGTACAGAGTTCGTCTCCGTCTCCGCGAGAGAGTGATATAAAGAACATATCCAACATTGAAGAGAACAATAAGATGAATGCAAACAACACGGTGAATAAGATATCAAAGGATCTGCTTGTGAATCTCCGAACATCGAACATTGCAGGCTGTCAACCGGTGACACAACTTTCGACCGAAGCCCTCGAAATGATCGACAAGATGCGTGATGGCGTGGATATGATACGGAATAACTCCAACAACATTCTTTCCACAGACACTTTCCCCATGCCGCCATGCACAAACATGGGAGTCGGAGTTAAAAAGACACCCAAGGCTCAGGCGCTGATAAATCCCGAAAATGCGAATCAAAAACAAATCATAGTTGCAACAGAAGAATATCCCAGCAAGAGTTCAAAGAAACCCAGTGTAACGTTGAAGCCAACACAGCAGCCAAATGCCGTGCTTTCGATCGTGGACATCAAAGATCCGCAAATTTCATCCGAAAGCGTTTCGGTGCCCAGCCAGATGAGTATAAGTGTTCCTAATCTGACAACAACTTCAGCATCTGAGGTTCCCTCCACCTCAGAGGTGGCTACCCACACGGGTCTGCTGGAGACATTTGCGGCAATCGCTCGTCGACGCACCTCGCAGGGCACCAACATACAGGATAATCAGATCATGAATGCGGAAGTGAATGTGAACGAGCACGGGGATCAGAACGCATCGGGCTCATTCCTCGGCCACTCGGTAACCAGTTTGGTTAAGCTGGCATTGTCCAGTAATTTCCATTCTGGACTGCTCAGCACCGCCCAGAGTTATCCGAGTTTATCGTCGAATAATAGTGAAAACATAGCCCCATCAAACCCGTCAAATACGTCGACGGGACAGCAATCGGCATCCACCATAAATCATACACTTACAATGAGTCTTACATCCACGTCGAGTGACAGCGAACAAGTGTCACTGGAAGACTTTTTAGAGAGTTGCCGAGCTCCGGCTTTGCTGGGCGACTTGGACGATGAGGACGACATGGATGAGGACAACGACGAGGAGGAGAACGAAGACGAGTACGAAGAGGTGGGCAACACTCTGCTCCAAGTGA
TGGTCTCCCGGAACTTGCTCACCTTCATGGACGATGAGGGTTTGGAGAACAGACTGGTGGGTGTTACGAAGCGCAAGTCCTGGGACGATGAGTTCGTCCTAAAGAGACAGTTCTCCGCGTTGATACCTGCATTCGATCCGCGACCGGGTCGCACGAATGTTAACCAGACTTCGGATTTGGAAATTTCCCCCATTGGCGTTGAGTTACCCAAGCCCCAACAGAGCGGCCAGGAGACTATTGAACAGCCGATGCTGGGTCTAAAACTACGTGGTCCGGGAATTGGCGGAATTCCCGAAGTTGAAATTGACCTGAACAACACAGACTGGACCATATTCAGAGCCGTGCAGGAATTGCTGCAGTGCAGTCAGTTGAACAAGCTGGACAAGTTCCGAAAGATATGGGAGCCCACATACACGATTGTGTACAGGGAGGTGCCGCCTGAAGCGCCAGAAAGCACTGGCGTGGACTCGGAGGAGTTTGCCCAAACACCGGATGTGTCGTCAAAGAGTGGCGCCTCCACTTTGTCCCCCAACTCACCCATGCACATCGGATTTAACGTAGCCGATAATAACCTGTGCTCCGTGGACGATGTGCTTGAGCTGCTCACTCAAATCAATGGTCTCAATCAATCGGAAATCGATTCGGATGGCAAGGAACTTGGTGTTTCCGTGTTGTCCGAAGATCTCTTTATCAGCAAGAAAATAACTAACAAACTGCAGCAGCAAATCCAGGATCCACTAGTGCTGTCCAGCAACGCGCTGCCCAATTGGTGCGAAAACCTAAACCAATCTTGCCCCTTCCTGTTCCCATTCGAGACCAGGCAGTTGTACTTCAACTGCACATCCTTTGGAGCCTCTCGCAGCATAGTATGTCTGCAATCGCAGAGAGATGTGACTGTGGAAAGGCAGAGGATTCCCATCATGAGTCCGCGCCGGGATGATCACGAATTCCGCATCGGTCGTCTTAAGCACGAACGCGTTAAGGTGCCTCGAAACGAGAATCTACTTCAGTGGGCAATGCAGGTTATGAAGACGCACTGCAACCGAAAGTCCGTGTTGGAGGTGGAGTTCTTGGACGAGGAGGGAACTGGTTTGGGTCCTACACTGGAGTTTTACGCCTTGGTGGCTGCCGAAATTCAACGCGCCGACCTGTGTATGTGGCTGTGTGACGACGATTTGGGCGAGGACATCGACAACTCATCGGAGAATACGCAAGGCAATTCGAAACCCGTAGGGTATTACGTAAATCGCAGAGAACACGGAATTTTCCCAGCACCTCTGCCGCAAAATACCGAAACATGTGAGAAAGTACTAAAATACTTCTGGTTTTTCGGTGTTTTTGTGGCAAAAGTATTGCAGGATATGCGTTTAGTGGACATACCCTTATCAACATCATTTCTTCAATTGCTTTGCCACAACAAGGTGCTGTCACGTAATCTCCAAAAAGTTATTTCGGATAGACGAAATGGCGATCTCTCTGTCGTGTCAGAAGAATCGGACATAGTAGAAACCTGCACTAAGCTATTGCGCACTGATTGCAATAAGACCAATGCATTTGGGGGAATTCTTTCCTTAGAAAACTTAAAAGAAATAGATCCAACTCGTTATCAATTCCTACAAGAAATGCAAAACCTCTTATTGCGAAAGCAGTCAATTGAGTTTGACGACACCATAGACGCCGAGAAGAAAGAAGAACTAATAAACGAGCTTAAGCTGCACACCCAAAACGGCTTAGAGGTATCCCTTGAAGACTTGGCCCTTACGTTCACGTATCTGCCAAGTTCCTCGGTCTATGGATACACCCAGGCCGAACTGCTGCCAAATGGGGCGTCAGTGAATGTCACCATCAACAACCTGGAAGCGTATTGTGAACTGCTTATGAACTTCATCCTGCAGGACGGAATCGCTCAACAAATGAAGGCTTTCAGTGATGGGTTCAACGAAGTGTTCCCCCTCAAAAAGTTGGCTGCCTTTACGCCCTCAGAGGCCCGAATGATGATT
TGTGGCGAGCAGTTCCCCCATTGGAGCCGAGAAGACATTATTTCATATACTGAACCAAAACTTGGTTACAACAAAGACAGTCCTGGGTTCCAACGCTTTGTAAATGTTTTACTAAGCATGTCGGGCGACGAAAGGAAAGCCTTCCTTCAATTCACAACTGGTTGCAGTAGCCTGCCGCCGGGAGGACTTGCAAACTTACATCCCCGACTGACAGTTGTTCGAAAGGTAGATGCTGGCGTCGGAAGCTATCCATCCGTGAACACGTGCGTTCACTACTTAAAGCTTCCGGACTATCCAACTGAAGAGATCATGAAGGAGCGCTTGTTAACAGCAACTAAAGAAAAGGGGTTTCATTTAAATTAAACAATTTATTGTACTCGATATTCAAGTTAATAAAATTTGAACCTTTTGTTATTTAAAGCGTACTTGTTGTGTAACGTAATAAGCGATACTGTAAATATTTCAACTGTTCAAACCCAATCTTTATATATAAGTTTAGATTTATTGCTTACACCTAAAGTCTCGGCCTATTGTTTCAAATTTAATTTAACCATTAAAATGGTAGCCACTGCAAA\n>XM_004521695.3 PREDICTED: Ceratitis capitata heat shock factor-binding protein 1 (LOC101452289), mRNA \nATTGTCATTTTCTGTTAAAATTTTGTTGTGTCTGGTTTCCAAAAGCGGAAAGTGTGCAAGATATATTATTTTTATACTTTTATAAAAAAGTTAACACAAACAATTTAGAACTAATTTTAATCGAAAATAAACCACAAACATGGCGGATATAAAGAATGATATTGATAGCGATTTGGATCAGAACTATTCGCTAAGTAGTAATGCGGATCCAAAAAATATGCAGGAATTGACAATTTATGTACAAAACCTGCTACAAAATGTTCAAGATAAATTCCAGACAATGTCGGACCAAATTATCACACGTATTGATGACATGGGCAACAGAATAGATGATTTGGAAAAAAGTATTGCAGATCTGATGAATCAAGCAGGTGTTGAAGGGCCAGAGAAGTAAAACGAAGCGGTTCGCGTAAAAACCTCATATTTTCCCATGAAGCATACTTATAAATATCGCTCATAAATGCAATAATCTTAACAAAATTAAGACATTTATTTAAATTCCTAAACAAAAATACATAATATGTAAGTGCACACATACACACAGCGACATGTACGTCATGTTAAACACAAAAGCGCACGAAAATGCAACCTTAAATGCTGATAAGAAGAATAATTGGCTCAAATGTGACACAAAATGTTTAATTAAGTTACAAACAATACTTATTTTAATTAAGTGAATTTTAAATATATAATGATTAAGGAATCATTTTTGAACATATTTTAAAGTTTTTTTTTTTTTTGTTATTTATATGTAAACAATAACCAAATGTGGGAGAAAAAGAAGTTCTTTGATATATGTGAATTTCTTATTAATTATTGTAATAATTATTAAATATTAATTATTTTTCTTAGTTTCCATACACTATGCATAATTCGGTATAATAAATGAATTAGTAATTTTAAATCAAAACATGAAAAA\n>XR_004389653.1 PREDICTED: Rattus rattus uncharacterized LOC116914019 (LOC116914019), transcript variant X1, ncRNA 
\nTTTTCTCTCCTGGGAGCGGGCCGAGGGGCGGGGGAGGGGCCACCGCTCCGCCTTCTTCTTTTCGCAATGTTGACGCAATCTATAAATAGTGGAACAAAAGGACCAACTTCCTCGGAGCTTTGCTGAAACTGCACAAAAAATCGAGCTGGGGGGTTCCCTGGTCCCCGATGTTGGGGCGGGGAGCTCGGCGCCGAAGGAGGGGGCGGCGCAGACCGGCCTAGGGGGACACCTGGCCGAGCGCAGTCGCCGCTCCGCTCGAGCCCTGCGCTCCAGTGCCCCCACTGGCTGGAGAGCTCGCCCAGACCCGGGGTCTTCCACCGTCTCTGACAGATTTTAACCTTTAGAAGAGAGCCAGTTGTGGAAAACAACCAGTTTTTTGATCGAATACCCACGTAATACATTGGAATATGATAGGAGATTAAGGTTTAACAATGATAAAATGAAGATATTACTAAAACAGCCCTCTAAGTAGCCCAACAATTATTATTTTTGCTAGAGATGAGAACCAGAACCATACAAGGTCCAAGACGAGCACTTTCTCTGTGCATATGGATGTCCTAGAAGTTGTGGCATAATGGTATTAATATGCTAGACGTACTGAATTGAA\n>XR_003957782.3 PREDICTED: Taeniopygia guttata uncharacterized LOC115492501 (LOC115492501), ncRNA \nCGTGTCCGCCCCCAGCCCCGTGTCCGCCCCCAGCCCCGTGTCCGCCATCCGTCTGTCCGTGCGCTCAGACTGAGCCCGCAGCGCCCGGGGGAAAGCAGCGGCCGCCTCCCCGCTCCTCCCGCGCGTCCGCCGGCGCCCGCTCGGACTGGCCACGCACGGCAACACGAGATGGTGGGAGGAGAAGCTCCTTACTTCAAGGAAACGAGGCCATGGTCAGAGGCAAATTCTCCAGGGGCTGCAGAGCCCTGTGAGCACAGGGTGACCCCGCACTGGGAGCAGCAGCTGGGGGTTTCTGCACATGGGGAAGGGAATTCCCAGAGCACTCGAGCCTCAACACGGACAAATATTCTGCAGTCTCCAGCAACAATTGGCTTTGGGATTTACGCTGTTGCAGCTCTTCTGGCTGTGAGGATGACCTGAAAATGTGAAGCAAGTGCATCAGCTCTTTCCAATGGCTGTGGCAGCACCAGGGTTTGGGTTTTTTGGTTGGCACAGGAAAATGAGCTGTGAGCAGCATCTGTGCCAGGGAGGAAAGTGCCCCTGGAGCTGGGGCTGAGAACCCGGGGTCGATGTGAGCACCTGTGGGTGGGAAGGAAGCTGGCAGAGCGCTGAGTTTGCTTTTCCTGCAGGCTCGCGCTCTGATGCGGCACAACGGGCCCCCGCAGCTGCAGGAGCCCGGGCGCCTGTCGGCTCTGCTGCGGGACTGCCTCGAGTGCAGCCTGGAGCCGGACGAGGAGCGGCGCTGCTCTGCCCAGGAGCTGCTGCAGCACCCATTTTTATCATCAGCCAAGCCTCTCTCCAGCCTGACCCCTCTGATCACCGCAGCAAAGCAACTGAGGGAGCAGCGGAGGAGATGAAGCACTTGAAAACAGCTGTTAGTTACAGTAGTTAGTGAGGACAACTAGTTAGTGATGGTAGTTGGCAGTGCTAGTTGGTTATGTTGGTTAGGACACCCTGTTTGTTACAGTTCTTATGACAGCCTGTTTGGCATGGCAGTTTTTTGAATAAAAACTCTGTTAAACCACAACTCCCTTGGCGTGTCCCTTCCTCCTCCCTCTGTGACTCAGCTGCCCGGAGCAATGTGAGGGGAGAGCGGGCCCAGCCTCGCCCAGAGCTGAGCCCCAGCAGAGCCCTGGCAGAGCCCAGAGCAGCCGGGGCATCTGCAGAGTCAGCCTGGGAGGAGGCGCTCGGAGCCTTCTCGGCTGCACCGACTCTTGGGTACAAACTGCGTGTGCTGGAAAATGCCCCCGGCTCGGCCAGAGGGCAGAAGGGGCCCGGGGAAGGCCCCA
GTGCTCCCTGCAAGGGAAACACCTGCCCTGGGTTTGTTATAAAGGACTATGTAGTTGTGGCTTTTGCTGTGATGTCTTGGCTTCTGCAACTTATTCTTAATCGCAACGATTTAGATACAGTACAGCTTGTAATCACTTTTAACTGCTTTTGCTGTAGTATAATTTGTCAGCTTTTTGTGGTCAATGCCCTGGCCCCTGTGTAGCTCATATCCTCAGAACATCATTCATGGATGATAGTTTAGTTTGTGCACAGTGTGAAAAACATACATGATAGTTTTGGCTTTTACAAAATATTGAAGTGGATGCCATGTGTTGTGCATTAGAATGTTAACTTTTGCAGAAGTAGCTGTAGTTGTGAAATAATAACTAATGCTTTTCTTTTTGTAACTAACTGACAATAATAACTCAGAGATATTTGTGAAACAGCCAATGTTGATTTAAAGTACTTGTGGAAGTAGCTAAGACCGTCTGCATGGCCAGATAACGTTTAAGGAACGGGTGTGATGAGGACCCTGCCGCTGACCCTTCGACTGTCAGTAACTGTCGCCTGCTGATGTGGAAACCCAGGGCACCGGGAATATTTCTCTGTCTGCTCTGGGGTGTCCTGACCCCCAGGGGAGCACTGACTTTGACCCTCATTCATGGAGAAAACTTCCAAAGCTTCAAAGTAAGCTAGAAACCACAAAAGTGTGAAATAGATTGTAGAGATTGCAGAGAGTAGTGGAGTATGTCATATGGGTGAAAAATTTAGGTTTTAGAATTTTTAGTATGTTATAGATGGGTTCAAGATGGAGGATATAGGGTGTTGTCTTGAGTTCCCTTCTTCTTTCTTCTTCTTCTTCTCTTTCTTTTTGGGTTTATGTGGTATCCTGTAATTGGGTAGAATAATCTGCATTGTGGGTCTTTAGGGGTCAGTTACTGGGTTAGAAAGAAAACTAATTTAGGTGTCACTTCTTAATTGGGTAGCTTAGTTTTTGATTAGACTTACAAGGCCTTGTAACAAGAGATTGTTGGCCATTTTTGTGCTGTTTTCCTGCACGCAGAGTCTGGTGCAGACAGTGTGCTGAAGTTTTGATAAGAATAAACAGAAGCTGAAGACCGAAAAAGTCCAATGCAGCTCTGGTTCCTGACACAGAACTGCTCCAGGAGGGTCCCCCTGCCAGGGGAGCCGCCAGGGAGTTGCCCAACTTGGGGCCTGCAAACTCCCAGCTGAATCGGGGATCAGGGGGCTGTTGTGAGGAAGTGACACACAACCCTCAAAACAACAATCCATGATTCCTGCACGGACTCTAGAAAGGCGGGTTGGGGGTCAAACCAAAAGAGTTCCTGGAAGAAGTAAATGAGTTCAAAGAAATGTTTGAATGTGTATAATCTTTATGAATATGTTTTTGGACAATACAATGGAAAAAGTAGATAAGAAGAGTTGCTATGGCTAACCAGTGTGCCTCTGGCCATTGCCAAGCACCCAGCGCTGTTATTGATTTGTCTCTAATTATCCCTTCTTAAAGTTTTAAAAATCGTCTTGCTCATTTTGCCCCTCTTTGGCTTCTTCTCCAGGAGCAGAGGGAGCCGGGGCAGAGACCGCTGTTCCTTCTGCCATCTGCGGCAAGAGAGAAGCATGAGGGACAGGCCGTTACCTCTCATTTATAACCTCGTTCCTCCTCGGATCCACAAATACCACTTCCAAGGAGAAATCAGCAACTCTGTTAGCGATGGGATTCTAAGTGACTCTGACCAGATTAAAGTGGGTTAACTCAACAGAACTCTATTTGATGAACTCTATGAATTTGATAGTCCTCCCTGGCTGCTATCAGCAAGCAGCGGTGCCTCTGCACAATGCAGCTTTTAGCTCTTGAAAACTCTGAAATGGAAAAGTCAGAGATAGCCAGCACGGACTTTGTTATTGCTGCAGCAGACAAGGAAAACTCAAACTGGATCAGAATCCCATGCAGTGCACGAAAAGGGCAGGAAAGGTTGCGCAGACGCCTCTTTGCTTGCTG
GAAAGAGAGAAAATGAGCGGGGCTTCTCCTCCTAGCAAACCAACAAACCACAAGTCGGAAGTGTCCCCTCCTCAGGTGGCTAAAGCACTTGGATGCAGTGAGGGCATGTCTGGCAGGGAAACAGCCCTGGTGGTGAGCACTGCCATGTATGGATCCATGGATCTGAAGGTCCCTCACAAGCCTCCCGTTGTCCAGGCTAAAGCTCCCTCAGCACCTCCTCCTTGGCCTTGCGCTCCACAGCCTTCCCCAGCTCCCGTGTCCTTCTCTGCACACGCTCCAGCCCCTCGAGGACTTTCTGCTTCAGAGGGGCCCACAAGTGGACACAGCACTCCCAGCCATGGCCGCAGCGCTGCCCAGCCCAGGGGGACGGTCACTGCCCTGCTCCTGCTGCCCCACTGCTGCTGACACAGGCCAGGGCATCCTTGGCCTTCTTGGCCACCTGGCCACACACTGGCCCACCTTCAGCTGCTCTTGACCGGCACCCCTGCGTCCTTTTGGCCCACGCAGCTCCCCCACCACAAAGTTGCCCGCTTGACTTCAAATAGAGCATCCCCAGTTCCAAGATGTCCTTCCTCTTCTCAGCAACACAAGACAGCAGTCAAGGACTTGCAGCTTCCCCCCCACCCTAGGCACTAATGCCATTCCCAAAGCTGCAGGCTGTGTGCAGCTGTCCCTGCAGGATGGCCCCAGGGCAGAGCCCAGCCGGGCTCCCCCTGCAGCCCCTGAAGCTTGGGGCAGGCAGTGGTCCCAGAGCTGAGGTTCACGGGGAGCACCCGCAGCTGTGCCTCGCACTCTGTTGCCGTGTCACCGTGCAGGCTGGCTTGTACGGGGTGAATGTACCAGCCCTGGTTTGACTGACAGGGGCCTGGCCCATCACAGCTCTCCCAAGGCTGCAGGCATTCCCCAGGCCAGAATCTGAAGGGGCACAGAGATCAGACCAGTGAAATCATCCAGACTGGGTTTTTCAAAGGCCCTTTAGAAGGAAGGGCTTGAGAATAAACGTGCTCTGTTTGCCACAGGAA\n>KP156844.1 Uncultured bacterium clone garden_soil_51834 16S ribosomal RNA gene, partial sequence \nAGTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGGCAGCGCGGGGGCAACCCTGGCGGCGAGCGGCGGACGGGTGAGGAATACATCGGAATCTACCCAGTCGTGGGGGATAACGTAGGGAAACTTACGCTAATACCGCATACGACCTGAGGGTGAAAGCAGGGGACCGCAAGGCCTTGCGCGATTGGATGAGCCGATGTCCGATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCGACGATCGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTTGGGTTGTAAAGCACTTTTGTTCGGGAAGAAATCTTCCGACCTAATACGTCGGGAGGATGACGGTACCGAAAGAATAAGCACCGGCTAACTTCGTGCCAGCAGCCGAC\n>XM_050191817.1 PREDICTED: Dermacentor andersoni protein FAM136A-like (LOC126544480), mRNA 
\nAAGCTGCCGGGCGCTGGCGGCTGCATGGGCGGCTGGCGCAAACACGAGGCGATTGTTGGTCTGCTTGGTTTCCTTCCTGTAAAAGGAGGTATTATACTAGTACTGGGAATACTACTGTAAGTGTTGAGCCGAACAACGCGATACAATGGCCGAAGGAGCTGCTCTGCGTGTACAAACTGCCGTAGACAACATGGTCAAGGAACTCGACAACTCTTATCTCCGCAAAATATTGGGCAATGTGCACAGGTGTGCAGTTAAGTGTTGTGACAATTCCAGCTTGTCAATGGATGGTGCTCGCACGTGCATCATGAACTGCTCTGAACCTCTTAACAAAGCCCAGAGTAAAGTCGAAGGTGAACTTGGAAACTTTCAGGAACGCATACGAATGTGTGTTATGCAGTGCGAGAATGACGTGCGGGACCAGATGAGCTCAACGTTAACAGAAGCAGAAGCCTCCAAGTTGAAAGGCCAATATGAGTCGTGTGTTGTGACGTGTGCGGACAAACATATTGCTCTTTTGCCACAGATGCAGCGAAGAATGAAAGAGTTGTTAAGTCAACTTTAGAGGCCAGTGTACACTGTTGTGTACATAGTTCGTACCGATCCTTGTATTTCTAGGATGAGTTAACATGCCATGTAGCTCCGCTCGTTGCCTTCTACCATAAATGTTTGATGAAAGGAC\n>XM_014783154.1 PREDICTED: Ceratotherium simum simum ATPase, class VI, type 11B (LOC101400597), transcript variant X4, mRNA \nGTGGGCGACATTGTTCGAGTAGCCAAAGATGAAATTTTCCCTGCAGATTTGGTGCTTCTGTCCTCAGATCGACTTGATGGTTCTTGTCACGTTACAACTGCTAGTTTGGATGGAGAAACTAACCTGAAGACACATGTGGCCGTTCCAGAAACAGCAGTATTACAAACAGTTGCCAGTTTGGACACTCTTGAAGCTGTGATAGAATGTCACCAACCAGAAGCAGATTTGTACAGATTCACAGGTCAGATGATGATAACTCAACAATTGGAAGAAATTTTAAGTTATTCCTTCTCGTTTTATATCTCCTTAATGGAGAGAAATTCAAACACCAAGAAGACCTGTGCTCCAAGAAGTGTACAATACCTCTGGGGCCAGAGAGTCTCTTGCTTCGTGGAGCCAGATTAAAAAATACAAAAGAAATTTTTGGTGTTGCTGTATACACTGGAATGGAAACTAAGATGGCATTAAATTATAAGAGCAAGTCACAGAAACGATCTGCGGTAGAAAAGTCAATGAACACATTTTTGATCATTTACCTCATAATCCTTATTGCTGAAGCCATCATCAGTACTATCTTGAAATATTCATGGCAAGCTGAAGAAAAATGGGATGAACCTTGGTATAACCAAAAAACAGAACATCAAAGAAATAGTAGTAAGATTCTGAGATTTATTTCAGACTTCCTTGCTTTTTTGGTACTCTACAATTTCATCATTCCAATTTCATTATATGTGACAGTAGAAATGCAGAAATTTCTTGGATCATTTTTTATTGGCTGGGATCTTGATCTCTATCATGAAGAATCAGATCAGAAAGCACAAGTCAATACTTCTGATCTGAATGAAGAGCTTGGACAGGTGGAGTATGTGTTTACAGATAAAACTGGTACACTGACGGAAAATGAGATGCAGTTTCGGGAATGTTCAATTAATGGCATAAAGTACCAAGAAAGCAATGGTAGACTTGTATCTGAAGGACCAACACCAGACTCTTCAGAAGGACCCTTTTATCGTAATAGTTTATCCCATCTTAACAACTTATCCCATCTTACAACCAGTTCCTCTTTTGGAACCAGTCTTGAAAATGAAATTGAACTAATTAAAAAACATGATCTCTTCTTTAAAGCAGTCAGTCTCTGTCACACTGTACAGATTAGCAATGTTCAGACTGATGGCATTGGTGATGGTC
CCTGGCAATCCAGCCTTGCACCCTCCCAGTTAGAGTACTACGCATCTTCACCAGATGAAAAGGCTCTAGTGGAAGCTGCTGCAAGAATTGGCATCGTGTTTATTGGCAATTCTGAAGACACTATGGAAGTTAAAACACTTGGAAAACTGGAACGGTACAAACTGCTTCATGTTCTGGAATTTGATTCAGATCGTAGGAGAATGAGTGTTATTGTTCAGGCACCTTCAGGTGAGAAGTTTTTATTTGCTAAAGGAGCTGAATCATCAGTTCTCCCTAAATGTATAGGTGGGGAAATAGAAACAACCAGAATTCACGTAGATGAATTTGCTTTGAAAGGGCTAAGAACTCTATGTATAGCCTATAGACAATTGACATCTAAAGAGTATGAGGACATAGACAGACGCCTCTTTGAAGCCAGGACTGCCTTGCAGCAACGGGAAGAGAAATTGGCAGATGTCTTCCAGTTCATAGAGAAAGATCTGGTATTACTTGGAGCTACAGCAGTAGAAGACAGACTACAAGATAAAGTTCCAGAAACTATCGAAGCATTGAGAATGGCTGGTATCAAAGTATGGGTACTTACTGGCGATAAACACGAAACAGCTGTTAGTGTGAGTTTATCATGTGGACATTTTCACAGAACCATGAACATTCTTGAACTTACAAACCAGAAATCAGACAGCGAATGTGCTGAACAATTGAGGCAGCTTGCCAGAAGAATTGAAGAGGATCATGTGATTCAGCATGGGCTGGTGGTGGATGGAACCAGCCTGTCTCTTGCACTCAGGGAGCATGAAAAACTATTTATGGATGTTTGCAGAAATTGTTCAGCTGTATTGTGCTGTCGTATGGCACCGCTGCAGAAAGCCAAAGTAATAAGACTGATAAAAATCTCACCTGAGAAACCTATAACATTGGCTGTTGGTGATGGTGCTAATGATGTAAGCATGATACAAGAAGCACATGTTGGCATAGGAATCATGGGTAAAGAAGGAAGACAAGCTGCAAGAAACAGTGACTATGCAATAGCTAGATTTAAATTCCTCTCAAAATTGCTTTTTGTTCATGGTCATTTTTATTATATTAGAATAGCTACCCTTGTACAGTATTTTTTTTATAAGAATGTGTGCTTTATCACACCCCAATTTTTATATCAGTTCTACTGTTTGTTTTCTCAACAAACACTGTATGACAGCGTGTACCTGACTTTATACAATATTTGTTTTACTTCCCTACCTATTCTGGTATATAGTCTATTGGAACAGCATATTGACCCTCACATATTACAGAACAAGCCCACCCTTTATCGAGACATTAGTAAAAACCGTCAACTAAGCATTAAAACATTTCTTTATTGGACCATCCTGGGTTTCAGTCATGCCTTTATTTTCTTTTTTGGATCCTGTTTTCTGATGGGGAAAGATATATCTCTGCTTGGAAATGGCCAGATGTTTGGAAACTGGACATTTGGCACCTTGGTCTTCACAGTCATGGTTATTACAGTCACAGTAAAGATGGCTTTGGAAACTCATTTTTGGACTTGGATCAACCATTTTGTTACCTGGGGATCTATTATATTCTATTTTGTATTTTCTTTCTTTTATGGGGGGATTCTCTGGCCATTTTTGGGCTCCCAGAATATGTACTTTGTATTTATCCAGCTCCTATCAAGTGGTTCTGCTTGGTTTGCCATAATCCTCATGGTTGTGACATGTCTGTTTCTTGATATTGTGAAGAAAGTATTTGACCGACAACTCCATCCTACAAATACTGAAAAGGCCCAGCTTATTAAAACAAATTCAAGTGTCAAGTGCTTGGACTCCATGTGCTGTTTCTCAGAAGGAGAAGCAACGTGCGCATCTGTTGGAAGAATGCTGGAACGAGTAATAGGAAGATGTAGTCCAACCCATGTCAGCAGATTATGGAGTGCATCGGATCCTTTCTATACCAACGACAGGAGCATCTTGACTCTCTCCACAATGGAATCATCCACTTGTTAA
AGTGGCAGTAGTACTTTGTGGGAGCCATTTCAACTCCTTTCCTAAAATTCAGTGTGATCATCCTGGTAATGGCCATACTGGCTCTTCAGATTTACTTTCTGAAATCTCTGGAGTAGTTCATACCCACTCAGAGTTATAATGGCAAACAAACAAAAAGCATTAACGGGAACCCCTCTCAACTCCCTTATGTTAAACTTTGTGAATAAAGAGACATTTTGCATCT\n>XM_027489590.1 PREDICTED: Abrus precatorius vicilin-like seed storage protein At2g28490 (LOC113857560), mRNA \nATGGGAAACATAGCTACCCTTTTGCTCTTGCTCTTTGTTTTTTGCCATGGAGTGGCCATAGCAGAAAGTCCTTCAAGTTCATCAACCAAATTGTTCTTGATGCAAAACTCCAAGAGAGTGGTTAAGACTGATGCAGGGGAAATGCGAGTTATGAAAAGCTATGGTGGTAGGATTTTGGATAGGCACATGCAAATTGGTTTCATCTCTATGGAACCAATGTCCTTGTTCATTCCTCAGTACCTTGACTCCAATTTGATCATCTTCATCCGAAGAGGGGAAGCAAAATTGGGATTCATATATGATGATAAACTAGCGGAAAGGAGATTGAAGACAGGAGATGTGTATATAATTCCAGCAGGTTCAGCATTCTATTTGGTGAATTTAGGGGCGGGTCAGAGACTTCACATCATTTGCAGCATTAACCCCTCTTCAAACTTAGGAGTAGATACCTTTCAGTCCTTCTATATTGGCGGAGGAGCCAATGCACCCTCAGTGCTTTATGGATTCGAGTCTGTGATCCTTGAAGCTGCATTTAATGAATCAAGAACCGTGCTAAGGAAAATCTTCACCAAGGAACTAGATGGGCCAATTGTGTACGTGACTGATACACATGCACCTAGATTATGGACTAAATTCCTTCAACTGAAAAAAGAAGACAAAGTGCAACACCTGAAGAAAATTGTGCAAGACCAAGAAGAAGAAGAAGAGGAGGAAGAGAAGGAAACAAGTTGGTCATGGAGGAAGTTCATGGAAACTATACTTGGTAATGTGAATGAGAAGATAGAGAACAAACACACTGCTGGTTCTCCTGACTCTTACAACCTCCATGACAAAAAACCTGATTTCAGAAATGCTTATGGTTGGAGCAAGACACTTGATGGAGCCGAGTATCCTCCACTCAGAAAAGCTGACATTGGCATTTTTCACGTCAACCTCACCGCGGGATCCATGATGGCACCCCATTTGAATCCAAGAGCAACAGAGTATGGCATAGTGCTGAGGGGTTATGGTAGAATTCAAATACTATTTCCAAATGGAAGCAACGCGATGAACACCGAAATCAAAGTAGGGGACGTGTTTGTTGTACCAAGATACTTCCCCTTCTGCCAAATAGCATCAAGGAATGGACCCTTAGAGTTCTTTGGGTTCTCAACCTCTGCCAGGAAGAACAAGCCACAGTTTCTAGCTGGAGCTGTGTCCCTTGTTACGACCATGATGGGGCCTGAGCTCGCAGCTGCTTTCGGGGTGAGCGAGGACACGATGCGGCGCACTGTCGACGCTCAACACGAGGCTGTAATACTGCCATCAACATGGGCTGCACCACCGGAAGATCCAGGGAAAATGGAAGAAGAGAAGGTACACATGCAGCCAAAGGCTATTAGAAGCTTTGCTAAGGATATAGTTATGGATGTTTTTTAA\n>XM_036746150.1 PREDICTED: Trichosurus vulpecula N-6 adenine-specific DNA methyltransferase 1 (N6AMT1), mRNA 
\nATGGCCCAGGGGGGCTGGGCCCCGCCACGTTTTGCCACTCCATTGCACCGACACGTGGGACGGGGTGCTTTCCGGGAGGTATACGAACCTGCCGAAGACACGTTCTTGTTGCTGGATGCACTGGAGGCAGGGGCCGCGGAGCTCGCGGGAGTAGAGATATGCCTTGAAATAGGATCAGGATCTGGCATCGTATCTGCATTCCTGGCTTCAGTTATTGGCCCTCGGGCTTTGTATATGTGTACTGATATCAACCCCAAAGCAGCCGACTGTACCTTGGAGACAGCACTGTGTAACAAAGTTGACATTCAGCCAGTAATTACAGATTTGGCCGAGGGCTTGCTACCGAGGTTACTCAGCAAAGTCGATCTTCTGATATTTAACCCACCCTATGTAGTAACACCTTCTGAAGAGGTAGGAAGTCATGGAATAGAGGCAGCTTGGGCTGGTGGCAGAAATGGCCGAGAAGTCATGGACAGATTCTTCCCTTTGGTTGCAGATCTACTATCACCAGGAGGATTTTTCTATTTAGTTACCATTAAAGAAAACAATCCAGATGAAATTATGGAAACAATGAAGAAATATGGTTTACAAGGCAAAATTGTACTTTCCAGACAAGCAGGACAAGAAATTCTTTCAGTCCTAAAATTCACCAAGTTCTAATATACGTAATGTGAAATGTTCAGTCACTAGTATACTTTTAAAGCCAAAGCTATTCCAAGAGCCAGGTAAAAATGTGAATTGTAATTTTTTAAGTGTTGAGAACAATTTAGGCAAACTAAGTTAAAAATCAGTGCTTTTCAAAATGTAATCTGTGGCTTTTCAAGAAAAGTCTCTCTGGGCTTTAAGCTAAGTCAGAGTGGTTTATTGAACAGTGTTCATAAACATTAATAAAAATGTTATGTCATAGCAAATGTCACTGTCACTAAGTAATGAGAGAAGGGTTTGACCTATATGTTTATTGTTCAGTCATGTTCAGCTCTTTATGTCCCCATGGACCATAGCACGCCAGACCCTTCTATCCATTATCTCCTGAAGTCTGTCCATGCTCTTTCTTTTTTTTGCTTCCATTACAATATCTATCCATCTCATCCTCTGCTATCCCCTTTACCTTTTGCTTTCAGTCTTTCTCAATATCAGCCTTTCTTCCAATGAGTCCTGTCTTCTCATTATGTAGCCAAGGTATTTCAGCTTCAGCTTCAGTATTTGACCTTCCAATGAGTAGTCTGAATTAATTTCTTTAAGTACTGACTGATTTGATCTCCTTGCTGTCCAAGGGACTCTCAGAAGTCTTCTCCAGCAGAATTTGAAAGTGTCGATTCTGCAGTGCTTAGCTTTACATATAGTACACTCTCACAGCCATATATTGCTAGTGGAAAACCTGTAGCTTTGATTATATGGACCTCTGTCAGCAAGGTCATGTTTCTTTTTTTTAGTATGCCATCCATGCTTGCCATAGCTTTCCTTCCCAGGAGCAAATCTCTTTTAATTTAATAGCTGCAATGATCTTTGAACCCAAGAATATAATCTGACATTTTCCATTTCTTCTCCTCCTATTTGCCAGGAGGTGATGAGACCAATTGCCAAGATCTTCATAGTTTGGGTTTGGTTTTTTGATGTTTTTAAGCTTCAAGCCAGTTTTTACATTCTCTTCTGTTTTCACCCTCATCAAGAGGCCTCCTTATTCCTCTTCACTTTCTGCCATCAGAGTGATATCATCTGCATGTCGAGATTGTTGGTATGTCTCCCAGAAACTTTACTCCTGGCTTTTGATTCATCCAGCCTGGCATTTCATATGCTATTCTCTGCATACGTTAAATAAATAAGATGACAATATATAGCTTTGTCATACTCATTTTCCTTTCTTAAGCCAATCAGTTGTTCCATGTTCAGTTCTAACTGTTGCTTCTTGGCCCACATTCAAGTTCCTCAGGAAACAAGGAAGGTGATCTGATGCTTCCGTCTCTTTGAAGACTTGTCCCATTTTGTTGTGATCCACAC
AGTGACAGACTTTAGTGTAGTCGGTGAAGCAGAAATAGATGCTTTTCTGGAACTCCCTTGCTTTCTCCATAATACAGCAAGTGTTGGTAATTTGGTCCCTGGTTCCCTGCCTCTCTGAAAACCAGCCTGCTCTTTCAGTAATTGTCAGTTTACATATTGTTGAAGCCCAGCTTGAAGAATCTTAACTTGTAACATTGCTGAAGGGTGAAATGAGCACAGTTGTTCAGTTGCTGGAACATTCTTTGATCTCGTTCTTCAGGATTTGTATGTGAACTGATCTTTTCCAATCCAGTGGCCACTATTGAGTTTTCCAAATTTGCTGCCATATTGAGTACAGCACTTTTAACATCATAATTAGGATTTTAAATAGCTCAGATAGAATTTCCTCCCCTCCACGAGCCTTCTTGTTAGTAATGCTTCCTAAGGCCCACTTGACTTTATTCTCCAGGATGTGTGACTCTAGATCAGCAACCACACCATTGTAGTTATTGGTGATATTAAGATCTTTCATATATAGTTCTTCTGAATGTTCTTGCCAGATCTTCTCAAGTCCCTACCATTTTTTGTTTTTTATCATGCCTATTTTTGAAGGAAACATTCCTTTGATATCTCTAATTTTCTTGAAGAGATCTCTTTGTCATTCTAGTGTATTCTTCTGTTTCTTTACATTGCTCATTTAAAAAAAAAACCTTTCAGGGCAGCTAGGTGGCGCAGTGAGCAGAGCACCAGCCCTGGAATCAGGAGGACCTGAATTCAAATGCAGCCTCAGACACTTGACACATGTACTAGGTGTGTGACCTTAGGCAAGTCATTTAACCCCAATTGCCCTGCCCCCCCCAAAACACCTTTCTCCCTGTTATCCTCTGGAATAATGCATTCAGTTGGATATATCTTTACCTTTCTCCTTTATACCTTTCACTTTCCCTCTTTCCTCAGCTATTTGTAAAGTCTCATCAGACATTTTGCTTTCTTGTTCTTTTTCTTTGGATTATTTTTTATTGCTCCTTCCTGTACAGTATTGCAAACCTCTATCCATAGTTCTTCAGGTACTCTATTCACCAGATCTAATCCTTTAAATTTATTCATCACTTGTATTTCATATTCATAAGGGATGTTATTTAGGGCATATACCTATACAGTCTGATGGTTTTCCCTACTTTCTTTAATTTACATGGGAATTTTTCAGTAAGAAGCTCATGATCTGAGCCACAGTCAGCTCTGGCTCATTTTAACTAACTGGATGGGACTTCTCCACCTTTGGCTGCAAAAAGTATGTAACCAGTCTGATTTTGATATTGACCATCTTATCTTGTGATGTCCATGTGCAGAATCACTTTGTGAGTTGTTGGGAGTTTTTGCTATGACCAGTGAGTTATTTTGACAACTCTATTAGTCTCTACCTTGCTTCATTTTGTACTCCAAGGCCAAACTTACCTGTTATACCAGTTATCTTTTGATTTCCTGCTTTAGCATTCCAGTCCCCTGTGATGAATGTGATATGGTTTTTTGGTGTTACTTCTAGATGTTGTAGTTCTTCATAGAACTGATAACTTTGGCCTCTTCAACATTAGTGGTTGGAGCATAGACTTCTATTGCTGTTCAGTCACACATACAAATGTACTTTCATTAGAAAAATAATTTTTAAATCTCAGCAGAAAATATTTTCTCTCTCCTGAAAGAAATCACTTCCTTTTAGAATTTTATTGTGGGTTTTCCTACATGGTTCTTTTAAGGGATGAGTGATAGGGTAGGGATAGGGATAGGGTCTAGACCTTTGATTTCAATGTAATAGAGAACTCCAGAATGAGGAAATTCTGTGAATGCAGGGTAGCACCATCTTCTTAAGTTTAGAAATCTTAAGAGAGTTGCCTAGAGCATTGAAAGGTTAAGTGATTTTTCCAGGATCACAGAGCCAGTATATCCAGCTGGATTTGAATCCAGTTCACTGTACTACACTGGCTCTCATTTGATCAATATGAATTATAAAAAAATGTTTTGTG
AATGCCAAATCATGATTTCAGAGGACCAAAAAGAAAGCACATTACCACCCATATCCTGCCAGAAAGGTGATGGACTTAAAAGGGGTTTTTTGTTGTTGGTTTTTTATTATTTTTATCATTAGCAATTTGTTGGGGACTGGGGGGTGGTAGCTAATTGGAAAAAATACTAAAATTTAGTTTTAAAAAATATTTTGCAACAAGCATGTATACTTTCTAAAATGGGCAGCATAAGATTGATGGCATTTCATGCCACCGATATGACAAAAGGGGACCTAATATCCACATATCGTATTGAAAGTAATTTGTTCCCACACCAAGAACATTTGGGTTTTAGTTCTTTGGACTTTGGTTAATAGACTTTTAGTATCATGAGATTTAAATGTTCTTGTATTTATTGTTGAAACTTTTGGGTTATTTGTATAAACCCTTTAACACAATTATACAAATGTTATTCTTGACCAGAAAAATACTTTTTGTCTTTACAGAATGAGAGGATACACTATCAAATGTTGGTCTAAAAATAAAACTGCTATATTGCTATTAAAGCCTTGAAAAGTAGGTATTCCATTCATTACATAAATGAACTGTGAAAAGTGAATCCCAGAAAGTTATTTTAAAAATTCCTTTGACTTCTGAGGTCAAACACAAAATTAGTAAAGATTCTGGGAGAATTCTTCCCCTAAATATAATTTTCAAACTACTATAAAGTTGTGGTTGTAAAAGTGCTATATGTTATATATGGTTTATTACCAGTGTATGACATTTTTGATCTTGAACTTAAGTAACTATGACAAGGTGAGACTGATTTATGCCATTGTACAAAGTAGTACTTCACTAACACCTGAAGACTGCTTATGCACTTTGATTTTTTTTTTAAGTTTTAGCTAATTTATGCTGCTATAAGTTGACAAAATTATTAGGCTCTTAAATTTTATTTTTCCTACCTTGATCCCAGTTTTTGGTAGGTAAGAGAAAACTTGACAATAAAATTGGAGGTCACATTGTA\n>XM_015642795.3 PREDICTED: Parus major Rho GTPase activating protein 17 (ARHGAP17), transcript variant X8, mRNA 
\nCGGGGGCGGCCGGGGCACAGCGGCGGGGCCCGGGCAGGCCGGGGCAGCGGCCGCCGCCATGAAGAAGCAGTTCAACCGCATGAAGCAGCTGGCCAACCAGACCGTGGGCAGGGCTGAGAGAACAGAGGTACTCAGTGAAGACCTGTTGCAGATCGAGAGGCGCCTGGACACGGTGAGGTCCGTGTGCCACCTGGCCCAGAAGAGACTGATCTCCTGTCTGCAGGGCCAGCATGGCACAGACCCTGACAAGAGACACAAAAAACTTCCTCTAACAGCTCTGGCTCAAAACATGCAGGAAGGATCCATCCAGCTGAGTGATGAAACTCTGCTGGGGAAAATGCTGGATACCTGTGGGGATGCAGAGAGTAAACTGGCAATGGAGCTCTCCCAGCATGAAGTACAGATTGAGAGAGAAGTTATAGACCCACTGTGCCTGCTGACAGAGACAGAGATCCCAAATATCCAGAAGCAGAGGAAGCAGCTTGCAAAGCTAGTGCTGGACTGGGATTCTGCAAGGGGAAGATACAACCAAGCCCACAAGACTTCAGGAACAAATTTCCAAGTGCACCCTTCAAAAATAGAATCTCTTAAGGAGGAGATGGATGAAGCTGGAAATAAAGTAGAGCAGTGCAAGGATCAGCTGGCTGCAGACATGTACAGCTTTGTGTCCAAGGAGGGGGAGTACGCCCGCTGCTTTGTCACGTTATTAGAAGCACAAGCAGATTACCATAGAAAAGCATTAGCAGTCATAGAAAAGGTCCTACCCGAAATTCAAGCCCATCAAGACAAATGGACTGAAAAACCAGCTTTTGGAACTGCCCTGGAAGAGCATCTGAAGCGCAGCGGGCGGGAAATCGCAGTTCCTATCGAAGCCTGTGTCATGATGCTCCTGGAAACGGGGATGAGAGAGGAGGGCTTGTTCAGAATTGCTGCTGGAGCCTCCAAGTTAAAAAAGCTGAAAGCTGCCCTGGACTGTTCCACCTCCCAGCTGGATGAGTTTTACTCAGATCCCCACGCTGTCGCAGGTGCCTTGAAATCCTATTTGCGGGAGCTGCCAGAGCCTCTCATGACCTACAGCCTGTATGAGGAGTGGACACAAGCTGCAAATATTCAGGACCAGGATAAGAAGCTGCAAGAGTTATGGAGGATTTGTAACAGATTACCTGAGCATTACCGTGTTAACTTCAGGTATTTAATCAAATTTTTAGCCAAGCTTGCCCAGAACAGTGACGTTAACAAAATGACACCGAGCAACATCGCCATAGTCTTGGGCCCCAACCTGTTGTGGGCAAAGAATGAAGGATCCCTGGCTGAAATGGCAGCAGCCACTTCAGTGCACGTGGTAGCAGTTATTGAGCCCATTATTCAGCATGCAGACTGGTTCTTCCCTGGAGATGAAGATTTCAACGTGTCTGGGGCGTTTGTGGCAGTTCCTGCTGTTAATTCCAATCACTTGTCACACACTGGGAATGACTATGAATGTGGGACCCTGGAGAGGAAGAGGCCTCTGAGCATGACTGTGATGGAAGGGGATTTGCTGAAGAAGGAGAGTACCTCAAAATCCAAGGACAGCACATCTTCAGCCACTCCTCCACCGGTGAGGAACGGCAGCCAGGCAGGCCCTGCCCCGGGCCAGGCAGTGCCCAGCACGTCCCAGCTCTCTGTCACCCAGCCCCAGAACGCTGCTGGTCCCAGTCCCCACGCCCTGAGGAGAGCTGTCAAGAAGCCAGCACCAGCCCCCCCCAAACCAGCCAACCCCCCTCCGGGGCAGCCAGGAAGCCAAAGCTCTTCCCCAGCTGCTCAGCCACCTTCTGTCTCTCCCAAACCACCAGCCAGAAGCTCCTCTCCTCCTGCTCAACACGCAAACCAAGGAGCAGCCCAGACCTCCTCCCCTTGCCAGGTTTCTGCACCTCGGAGATACTCCAGCAGCGTGTCCCCAATCCAAGCCCCCAGCCACCCACCCCCGCAGCCCCCAGCACAGGCAACTCCTCCCCTGCA
GCCCAAGGGCAGCAGCCAGGGCTCTGTGGAGCAGGGGGCAGAGCAGAGCCCCTCGCTGTCCCAGCCGCAGACCCCCACTCCCCCGGGCAGCCCCCCGGCCGTGCCCCCCGAGCCCTGCCAGGCTCCCTGCGGACCTCAGAGCGGCTCCCTGCCCCGGCCACGGCCCGTGCCCAAGCCCAGGAACAGACCCAGTGTCCCCCCTCCTCCTCACCCTCCCTCGCAGCTGCCTGCAGACGGGACGGCTGCAAACCCTGCTCAAACGGCGTCCAAAATAGTCACAGACTCTAATTCCAGTATTCCAGAGCCACCTCCAAACCCTCCTCCAGAGCTTCCTGCAGAGCCGGCGGGCAGAGAGCTGCACAACCACGTCCTGCTGGCCATCGACAATGACACGGAGAGCACGGCGCTGTGAGCGCTCCCTCCCCGCGCTCCTCTCCTCAGACCTCACAGGGAAAAGCTTCTTCTGGCAACGTGGCACAACGGTGTGGAGCTGGGGCTGCAGCCTGCTGGGCACAGGGATCTCCAGGATGGCCGAGGTTGGAGAAGACCTCGCAGAAAATCCAGCCCAGCCTTTGGCCCAGCTCCGGTTTCGCCCTCAGAAGAAGTTTAATGATCTGGGTCTGGACAACGGTTTTCAAACTCTTGGATGGAAGGAATGAATTCCTGCAGGAACTCGCCTAGGAAGCGTGGTCAGTGCTGATACAGGTGGTATTAGCAGAGATTCCAGAAGAATAAGAAGCAGAACATTAGTTATTTAAAGTGCATGTCTGTATTAGGGGAATAATCCTTCCCATGGCACGGTTAGAGGTTATTTGTAGTTCTTAGCCCGTACCAGGAGCTGCCTCCCAAGGGCCATTCCCTCTCGGATTTGCTGCAGATTCCCCCCAAGCCATGAAGCAAACCCTGCCCCAGTGCTGGTGGTGACTGCTGGTTCTCAGTCACCCTGTGGAACTGTGGATGCATCCCGTGCCTTGAAGGACTGTCGTGCTGTAGGAGGATCTTCCTGTCTCTTTAATCATTTCATTGCTACTTAGGATCAGTACTTACCCTGATTTCATAGTTATTTGTATTAACCTGCTTTGTTCATGTGCAACTGGCAACTGTTTCACGAGGAAACCGTGGAAATGGGGTTTGTGCTTTTGTTGAAAACGGTTGAATTTTGAAAGAACTTTGAAACAGCTGTTAGGATTCAGCAGTTGAGTGAACATTTATAAAATTAAAGATTGGTTTTTGTCAACTTAA\n>XM_039807938.1 PREDICTED: Perca fluviatilis tubulin, gamma complex associated protein 6 (tubgcp6), mRNA 
\nTTTTGTCGAAGCCCCGCGGTAGATTGTGAATCAAGCGACTAGAGAGCAATTAGCTAGCTAGCGACAACATCTAATATGCTGGAACAAGAAACCTTTCAATAATAAAAATACATTTTGAAGCAGTGTAGGGGACCCATCTACTGGGTTTCACATGCTTGGTACACACAAGCTAGTTAAGCAGGACAGCTAACGTTAGCGTTAGCTGGCTAGGTGATCCGTGGGGGCTTGCTAATAACAAACGTTAGCATGCACTGGAAGGAACCTTTTGGGGTGGATGCAAGATTGAAACTGTCTGAATCAACGAAAAATACACCATCTCGAAGGCTGAGGTAACAGTGCCACCATGTACTCGAGCCTAAACAACCCAATGAAGTCCAGCTGCAACAGCAGCAGCATCACTGAGCTGCTGGGTGCCCTGTGTGACTGCAGCCTGTCTGGGGTGTCATGGAAACGCCGTGCCCTGGGTGGAGTTTCAAGAGAAGGTTTCCGCAGAGCTCTCAAAAAACGTGCCTACGGTGCCCTGCTGTCTAAGCTATTTCAAGATGACACCAAAGGGTCTGCCTCAGGACTGAGTGCCACAGCCAATACACCGCCCAAAAACAAAGTTTTGATGATATGTTTTGACTTGCGGGTGGCAGGGTGCCGAGAGGAAGCAGAGCGTTTGGAGGAGCAGCTGGGGATGCTGTTGGATGGAGCATCCTCTGGCCTAAAGGAAGTAGACGCTGTCCTTGAGCTCTTGGTACATCTAGCTGGTTCGGCACCTCCACCCCCTACCTCTTTCATTAGGGACTATATGAGACGAGAGAGGCCTGTACTGCGGAGGCCTCAACCCTGGGGCTACCAGAGCGAGGAGCTTCAGAGGCTAGAGGCCCGGGCATGGAGTCTAGTGTGTGGGGAGGAATGGGGGACTTTAGAGAGTTTGTGTGGAACTCAGAAGTTGATGGATGCTCCTCCAGGCACAGGACTGCTGGCTCTGAGAACTAAATTAGAAGTGGAAGAAAGATTTGAGAGGGAGACCAGGATGACACTGTTTGGAGCACTGCAGCACACTCGCACCTCAGACATAGACATAAGACTGGACCTGCCTCCTGTTCCCAGTAATATTGATGTAACTGGGCTGGCTATACGGGTCCCCCCATGTATAGATCAGTCTGAGGATGAAGGTTTCCAGTCAGCTTCCAACATGACCCCAGACTCTCAGTCAGAGACCAGCCCCATACCAGACGTTGATATATGGGAGGCTCTTCGCACATTTGAGCCTGGAAGACGTCGCTGCTGGGAGTCTGTTGGCTGCCCACCAGGGAAAAGCGAGTCACTCTATCTAACAGAGGGAGGCAGGGAGGCCTTTGACCAGCTCTATCGTCTGTGGGAGGGGGAGATGAGGGTGGTCAGCACTGCTACACCTTCTCCTCTCCTCCCGCTGCCCCTGGACTCTCAGGCACTACTGGTATTTGACCTCCTCAACGTCTTGATCGGGGTGGCATCCACGACCTTCCCTCTCAACCAGAGTGTTCAGTTTGATGTCAGACCTGGTGTGTGCGTGTCCGGAGCCTCTCCAGAGAGTGTGTCTCGTCTCTTGGGGGAGCTGGCCCAGTACGGCACCCACTACTTGAGGCTTAGTCGCTTTTCTCTGCCGAGTGCTGGAAAAAAAGGCCTAGTCTTTCAGGCTTTTACAGGTGGTCTGCGGAAGTATCTGCATTACTACAGGGCTTGCGTTCTCAGCACTCCACCCACCCTCAGCCTGTTGACTATTGGCTTCCTCTTCCGCAAAGTGGGCCGCCAACTAAGGTACCTGTCAGAACTGTGCTGCGTAGATGGGCCTTTGGGTGCAGGCCAGGCTACCTTCCCTGTGGGTGTTAAACTGCTGTCCTACCTGTACAATGAAGCACAGAATAACTGCAGCAACGAGAACTGCGCGGTCCTCCTGTCGCTGCTGAAGAGCAGCTGTGAACCTTATACACGGTTTGTGTCTGACTGGGTGTATAGCGGCGTGTTTCG
GGATGTTTATGGAGAATTCATGATCCAGGTTAATGAGGACTATCTCGTCTTCAGAGACAAACACTTCTGGGTCCAAGGCTACACTCTGATCTCAAAGGATGTGGAGGATTGTGTGCCCATCTTCCTGAGAGACATTGCCAACGACGTGTATGTCTGTGGAAAGACCATCAACCTCCTTAAGATCTGCTGCCCGCAGCACTACATCTGCTGGTCGGAGCTGCCGGTGCCTCGCATTGCTGTCACCTTCTCCCTCCGGGAGGTGGAGGACATCGAGAGGGACTGTGCTGTGTACCGCGGACGCATGGAGCGGGTTGCTAAGCACAGCGCCATCAGCAGGGAGGAGCAAGCCCAGCGAGCAGAGCAGGCACGCCAGGAGCTGATCAATCAGGTCAGAGAGTCAGCGGCCAAAACCCTGGAGAGCATCCGCGGGCGCCAGGTGTCACAACGTCTGGCTGAGGAGGCCAAGAAGAAGGAGCGTTTTGAGGAGCTGAAACAGCACCTGGAGCAGGAGCAAGAGTGGCGAAGCGTAGCCACAAAGAAGCAGGAGGAGGATGACTTCAGCTTTGCCAGAGAGCTGAGGGACAGAGAAAAAAGACTACAAGCCCTCGAGGAGCAACTGGAGCAGAGAGCCAGGAAGGAGCTGATAGCTCAGTACAGCCGTCTGTCAGAGGATGCAGCTCGCAGAGAGAGACGGGCCATGTGGCGGGTGCAGCGAATGAGACTTGATGAACCCCGGGCTCAGTTCTTCATGCATGACAGGCAGCAGACTCAGGCAATGCTAGAGAAATATCCTTTAGGCCAGAAGAGACCTCCCATCAAAGTGTTTCCACCTGTTACCTCAGCACAACAGACTGCACTACAACCAACACTGGAATCTCCCACTCAGCATCTGTCTGAGCAGCAGCCAGCGGAGACTCAAGAATCTGATGGTGTATCACCTGACCCATCTTCACCTACCCTCACCCACCTTACAGTTAACCTCGCACTCATCTCTGAGAACGTTGACGTCAATGATTTTCTTCCTAAGTCACCAAATCCTAACAGTCAGCAGGTAGACATCGCCCTACAGGAGATTGGCTCTGACCTACCTGAAGTGTGTCCTACAGCACAGCTAGTAGACTATGACTTCAGTGCCCCCTTTAGTCCACTTGAAGGTATCACAGGTCAAGCCTCAGTCCAGCCCCAACCTCGCTGGGGACCTGCAATCCAGCCTGACTTGATCCAAAACCATCCCTCTTTTTCTCACATCCTCATAGGAGAGAACATGTCTCAAGTCCAGGATTGTCTCCCCAAAGCTAGCCCCTTTGGCCAACCCTCCAAATCCAGCTTTACGCTAGGCCAGTACACCCCAGAGGAGCTTCAGAATACATCTAAAGCAAGCATTTATGGACATCCCTCTCAAGCCTCAGTGCAGTTAGTAGATGGGAGTGGCTCTATGACTGACAACAAGCAGGCGGAAATTGCATCTGTGATCATTGAAATGGGGAATTTAGAAAGTAAAGAGGCAAATAAAGACAATGATGTGCTTGATGCAGCTTTGTCCACCACACCAGAAGAAAGTGGCAAGGGTAATTGTCGTTACAAAGCAGTGACAAGTCTTTCTGACTGTGGTGGGATTGAGCCACCTGATGCAAATCCTAACCCAAGCACTCAAGACCGCAGCTCAGATGCTCAAGATAAAGCTGGTGATAATAATTATTTGCCAAATGTTCATCTCCCCAGTGCTCGCCTTAAAGCTGGAGAGCTGGTTTTAGATGTCGTTGCCCAGCATTCTTTACCTAGAGTCCATGGGCATTCCTCTGATGCTCGCGTAAAGGTTGGACAACTTGTATCAGAGGTAACTGCTCCTCTTCCATCCCCTAACGTCCACGGTTATGCCTCAGATTCCCATATCAAAATTGGAGAACATATTTTGGAAGTTGATGCTTCTCTACCTTCCTCCAGTCTTCACAGTCAATCTTCTGATGCTCACATTAAAGTTGGGGAAAATGTTTCAGATA
TAGTTGCCCCTCTGCCCTTTCCAAACGTTCATGGTCACAGTTCAGATGCCCACATTAAAGTTGGAGAAAATATCTCAGATGTTGTCGTGCCACTTCCTGCTCCCAACATCCACGGTCACTCCTCTGATGCTAATATAAAAGTGGGCGAGTTTCTGTCTAACATACCTGAAGCAAGGCCTCGTGAGAGTAAACATGGGCATGCCTCAGACTGCATGCTTCAATCAGGCTGTGTGGTGTCTGGAACTGAACCCGCCTTGTCTGTTCTACCTGGAAGCTCTTATGGTCACTCCTCAGACTCAGGGTTAGGTGGTGGATGTGTAGTTTCAGGAGAAGAACCCAAACGTTCTCCTCTACCTGGCAGTGCTTATGGTCATTCTTCAGACTCAGGGTTAGGTGGTGGATGTGTAGTTTCAGGAGATGAACCCAAACGTTGTCCTCTACCTGGCAGTGCTTATGGTCATTCTTCAGACTCAGGATTGGGAGGTGGATGTGTAGTTTCAGGAGACGGACCCAAACGTTGTCCTCTACCTGGCAGTGCCTATGGTCATTCTTCAGACTCAAATTTAGGCGTTGGATGTGTTGTGTCCAAAACTGAACCACTTCCATCACAACTACCCGGCAGCACCTACGGCCACTCCTCTGATTCAACCCTGGGGGTGGGTTGTGTGGTGTTGGGGACAGAGCCACAAGCCTCTGCACTACCAGGCAGCACCTATGGCCACTCATCAGATTCTTCACTCGCAGTTGGGTGTGTGGTGAAGGGCAAAGGCAGCTTAAATCAGCAGAAGACAGACGACAATGAAGATGGCAGAGGTTCTAAGTCGGACAGCCCTGGTGAGCAGCTGGTTGAGTTCATGGGGTCCTGGGCAGCAGGCTTCGGTTTGTCCCCTGGAGAAAAGTCTGAGCAGGAATATCTCTTGGCTTTGTGTGCTCAGTACGAGGTGGAAAAATACGAAGACTGCTACAACCTAATGGCTTCGTCCCCAGAGTGTCAGCTGCTGAAGCAGGTAACTCGGGGACCCTGGGGCCTTCCTATGGACCACACACTCCGCAGAGCCACAGACACCACTGTTGTCCAACTCAGCGAGATGGTTTCTCTGCCAGTTCTGATAAAACAGGCCGTCACTACCCCACTGATCACACATGTGTCATTGGTGAACAAGGCGGTGGTGGACTACTTCTTTGTGGAGTTGGGGGTGGAGAGACACTTTGAGGCACTGCGCCACTTCCTGCTGATGGAGGATGGCGAGTTTGCACAGTCCCTCAGCGATCTGCTCTTTGAAAAGCTGGGCAGTGGCCAGACTCCCGGTGAGCTGCTGACCCCCCTGGTCCTGAACTCCATCCTCAGTAAGGCCCTGCAGTACAGCTTGCATGGGGACACCCCCTTAGCAGGTAACTTTACCTTCGCCCTGCGCTTCCTCCCGGAGACCTTCCACCCACACGCCCCCGATTCTCTCAACTGTCTGGAGCTCCGCTACAAGCATGAGTGGCAGCTTAATCGCATCATCACGTACTGCGCCGAAAACAAGTACAACCGTCTGTTCTCGTTCCTGCTGCAGCTCAAACACATGGTGTGGAGCCTCCGTGAGGTCTGGTTCCACCTCAAGAGAACAGCGCTGGTGAAAGGTGCAGGTCGCTCGGTGCAGTTTCGGCAGCTGCAGCTATACAGACACGAAATGCAGCATTTTGTCAAGGTGATCCAGGGATACATCGCCAACCAGATCCTGCAAGTGTCCTGGAGCGAGTTCACAGCCAAGCTGGCCACTGCCAACGACCTGGACGCCATTCACCGTACACATGCAGACTACCTCAACAGAGCCATCTTCAGGGGTTTGCTGACAGAGAAGGCAGCTCCGGTCATGAACATCATCCACAGCATCTTCAGCCTGATCCTCAAGTTTCGGGCCCAGCTGATCGCACAGCCCTGGGGCAGCCAGCAGGGGGAGGCAGTGCACCCAAGCTTTATTGCCATGCAGCAGTCGTACAACACCTTCAAGTAT
TACTCTCACTTCCTTTTCAAAGTGGTGACCAAGCTGGTGAACCGAGGCTACCAGCCTCATCTAGAGGATTTCCTTCTTCGCATCAACTTCAACAACTACTACAAAGACTCCTGAGCTGTGTACTGGTGTGTATGTTGTACATGAGCTTAGTGTGAGTACTTGACATAATACAGGCCATTTGTTAGATACTTGCAATGCACTGTTTACATCTTAGAGTCCCCTGTATCTGTCTATAAGACAGATAATCAGAAATATATAATACAATAAATGTTAGTGTCGAAAATACATTAAGAAACCCACCTGTACTTTATATTAGGCCATGAATTTGAAATTTAAATTGTATGCAATTATGCAAAGTTTATGCAATCCATGTGCAGGATTTAATTAATGGCTAAAACTGTATGCTGCCAAAGTTTGTAATTAAGGTGAAGCTGATGCCTACTGTAATGTCTCACGATTACGTGTGCCTCCAGCTATGTAGATTTTAAGTGCATATAAATGAAGTGTCAATTGCATGTAAATACAATTGTTAAATAAATGCGCTATGTTCCTGTGT\n>XM_050218304.1 PREDICTED: Anopheles maculipalpis sensory neuron membrane protein 2 (LOC126561926), transcript variant X2, mRNA \nGAGTGTGGGTGAGTGGGTGCAGTGAACGGTGTCACGGTGCTGCCAGGCGACGGCGATCCTCCAAACCACCAAGATGGTGCAATGCACTCTGATCTGGGCCGGCATCGGTGTGATGATGGCCGTATCCGGCGCACTGCTCGGTTGGGTCGTTTTTCCTCGCGCCGTGCACGAGAAAGTGATAGAGGCTACGGAACTACGTCAAGGGACGGATCAATACAAGCGATGGGAAGCATTGCCACAGCCGTTAGATTTTAAAGTGTACATATTCAACGTCACTAATCCGTACGAAGTGATGCAAGGACGACGGCCGAAGGTGGTTGAAGTTGGACCATACGTTTATTTCCAATATCGCCAGAAGGATAATATACGGTTTAGTCGAGATCGGTCCAAGGTGCATTACAGTCAGCAGCAGATGTATGTCTTCGATCCCGAATCGTCCTATCCACTGACGGAAAACGATGATCTTACAGTGTTAAACATGCACATGAATTCCATACTGCAAATAGCCGAGGATGAAACGTACGACAGTTTGCGACTGATCAATGCCGAGCTGAACCGTATCTTTGGCCGACCGGACACAATGTTCCTGCGGACGACACCGAAACAGTTTCTCTTCGACGGTGTACCGTTCTGCGTGAATGTGATCGGCATTGCGAAAGCAATCTGCAAGGAGATCGAGAAGCGTAACACCAAAACCATTCGCACCATGCCGGATGGAAGTTTACGGTTTTCGTTCTTTAGCCACAAAAACATGACAGATGATGGTATGTTTACGATCAACACGGGAATTAAGGATCCGTCGCGGACGCAAATGATTGAACAGTGGAATGGCCGAACAACGCTCGAGGTGTGGAACAATCGGAGCAGTGGATTGCCCTCTGCCTGCAACAAGATCCGGGGTACTGATGGGTCCGGCTATCCACCGTTCCGAACCGGTGTCGAACGAATGACGATCTTCAGCACCGATATCTGCCGCACGGTGGACATTAAGCTAACCGGGGCATCATCGTACGAAGGCATCCCCGCACTGCGGTACGAGATCGACGGTAACTTCCTGCATGAAATAGGACCCGAGTACGGCAACGAGTGTTACTGCGTGAACAAGATCCCGAAGTCGATCGTTAAAAGCAATGGCTGCCTGTACAAGGGCGCACTGGATCTTTCCAACTGTTTCGATGCACCGGTGGTTCTGACGCTTCCTCATATGCTGGGTGTAGCCGAGGAATATACAGCACTGATTGACGGCATGGACCCTGAGCCGGACCGGCACCAGATCTTTGTGGATGTAGAACCGTACACCGGCACACCCTTG
ACCGGTGGGAAAAGGGTACAGTTCAACATGTTCCTGCGACGGATCGACGCCATCAAGCTGACCGATCGGTTGCAGCCGACCCTCTTCCCGGTCATCTGGATCGACGAAGGTATCGCACTGAACGAGGACATGGTGAAACTGATCGATGACAGCCTAATGAAAGTGCTCAGCCTGCTAGACATTGTGCAGTGGGTACTGATCGGTGTAGGGCTCCTGCTAGCCATCCTGATGCCGATCGTCTTCTTCGTCAAACGCTGTCGTGGCAACGATAGCCGTACGGTTAGTCCTGCCGTAACGGCTACCACGAGTGCGGCCAGCCTATCGATGGCGACGGGCGTTACCGGCGAGCGGAACAAATGACCTTCGCTGACAATGCTAAGTCTGGACTGATGAACTGCTAGCACCAACTAGCGATCAACATTTAGAAGGTGCCAATGAG\n>MK538674.1 Uncultured bacterium clone OTU_1300 16S ribosomal RNA gene, partial sequence \nGGGCCCGCACAAGCGGTGGAGCATGTGGTTCAATTCGAAGCAACGCGAAGAACCTTACCAGCCCTTGACATCCCGGTCGCGAGCACCAGAGATGGAGCTCTTCAGTTCGGCTGGACCGGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGCCCTTAGTTGCCATCATTTAGTTGGGCACTCTAAGGGGACTGCCGGTGATAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTACGGGCTGGGCTACACACGTGCTACAATGGCGGTGACAGAGGGATGCAAAGGAGCAATCCTTCGCAAATCTCAAAAAGCCGTCTCAGTTCGGATTGTGCTCTGCAACTCGAGCACATGAAGTTGGAATCGCTAGTAATCGCAGATCAGCACGCTGCGGTGAATACGTTCCCGGGCCTT\n>XM_023646352.1 PREDICTED: Equus caballus chromosome 7 C19orf24 homolog (C7H19orf24), transcript variant X1, mRNA 
\nGCACTCGTCCCTGCCGGGCCCTGGCCGTCTCGGCGGAGTGACCGGGCAGCCTCATCGGTGTTGCGGGGCCGAGCCTGCTTCCCGGGCGGGCTGGTGGCCTCCTCGCTGGTCTTGGGGTGCAGCTGTCTTGGGGCCGAGCGGGTCCCCTCAACTCCCCCGGGGTGGGGGCGGCGCAGCGGGCGCAGGGCCCTGTCGGTGTGGTCAGCGCGGTCAGGACGGCGAGGGCCCCGCGTCTGCCGGCGGTCCGGTCTGCTGGTCCTGGCTCTGCGGGCGCCGATGCCGTGGCCTCGTGGACGGCGCGGGCCACGGCACGGCCGCCCTGCTGGCCCACCGGCCCCCGGGCTGCACGGGCTGCGGGAGGGCCCACCGGCCGAGAACAGCGAGTCGGGGCCCGGACCGGAGGGAGCCCAGGCTCGGCCCCAGCCGTCCTGCGTGGCGTGGCCTCGTCCGTGCGGGTCCTTGGGCGGCGACCCTGTGGCGCGCCCAGCTGCCGTGACCCGGTCTGGCCCAGGGCAACTGAGGCCTGGCGCGGCGGGCCCGCGGGGCCGGGGCGCGGGGAGACGCCCCGGGAGCGGCCGGGGGCGGGCGTTTCCGGAGTCGGGCCCCGCCCCCGCGGGCCATTGGCTGGCGCCGGTGAGTGACAGCGCGGCGAGGGCGGGGCAGCCTCCGCTTCCGGCGGGCCATGGGGCCGCGCGTGCTGCCGCCGCCGCTGCTGCTGCTGTTGCTGCCGGCGATTCTGCTGCCGGCGTTGCTGTGCGGGGCCCAGGGGACCACGCCCAGGTCGTCGCACCCCGCGTACGCCACGCTCTTGCCGTCGCCCGCCGTGACGAACGGGAGCCAGCCGGGCGCGCCGCACAACGGCACGCACCCGCGCTCGCCGGCCGCGCCGGGCTCGCCGCTGCTGCGCTCCTTCTACGTGCTCACGGGCCTCAGCGGCCTGGTCGCGCTCTACTTCCTCATCCGGGCGTTCAGGTTGAAGAAGCCGCAGCGGCGGAGGTATGGCCTGCTGGCCAACACCGAGGAGTCCGCGGAGATGGCCTCGCTGGACAGCGACGAGGAGACGGTGTTTGAAAGCAGGAATCTGACATGGTGGCGTTTCCAGCGGCCCTGGGGGAAGGACAAGACGCGGGGTCACCCCCAGTGCCTGGCGCAGTCGCTGATTCTTTTGTTGGCCTGGCTGCACCGCGACAGCTCGTGTGGGACCTGCCCAGCCTCCCTGAAGACGCTTCAGCCCCCGCCTGCACAGGACCACCCGAGATGGCCGGTAGAAGCCAGAGAGGCTCTGGCAGCCCCTCCCAGGACTCAGGCCGCCTGGCCGGACTGTGGCTTGTGCTGCTTGCTCTTTGCTGTGGGGACGTGGCTGGCCTGAGCCGAGGCCTGGGGGGCAGGGGGGCTGAAGGCCTGTCTGGGAGCACCTTCCCCCTGGGCTGGGGACAATAAAGGAGTGGTGGCTCTGTC\n>XM_035641279.2 PREDICTED: Scophthalmus maximus zinc-binding protein A33-like (LOC118314697), mRNA 
\nTGGAGCTGGAATATTTTTCCTATAACCTCACTTTACAGGAACACTTCAACCTCACCATGGCAGCAATGAATTCGCCCCGGGAGGAGGACTTACTTTGTCCCCAGTGCTGCGAGATCTACCGACTCCCTGTTCTTTTGAAATGTGGCCACAATGTTTGCAGAGTTTGTTTACAGAAATTCTGGGAATTGAAAGGATGTCGAGAATGCCCAGTGTGTCGCACTGTGGCTGAGCCCGGGAGGCCTCCTATCAATCTGCCACTAAAGATAGCTGCAGATGAATATCAACTGCGACGGAGCAGCAGGAATCGAGACCTTTGTTTTCTTCACGGTGAGAAGCTGACACTTTTTTGTCAGAACGACGAAGAGCCCGTCTGTGTCGTCTGCCACACATCCAAACAGCATAAGGTGCACGAGTGCTGCCCAGTAGAGGAGGCTGCCCAACAGAAGAAGACAGAGATTTCAACCATGCTGGAGTCCCTGAGGAAAAAGCTCAGAACCCTGAACAAGACCGAGGAGCACTGGAAGGAAACAAAAACCTATTTACAGACCCAAGCTCGTCAAAATGAAGAAGGGATAAAGGAGGAGTTTCGGAAGCTGCACCTGTTCCTCCAGGAGGAGGAGAACGCGAGACTAGAGGTTCTCAAACAGGAAGAGGAAATCAAGACCCAGGTGATGTGTGAGAAGCTGGACAACATCCAGGAGCAGATCACAACCCTCTCCTCCACCGTCAGTGATACGGTGGCCACGCTCACAGCGAAGGATTTGACCTTTTTACAGGACTACAAGAAGACAAAGAAAAGGGTCAAATGCAACGTTCGAGAACCGGAGTGCATCAGAGACATCCTGATAAACCCTGCAAAGCATCTGGGATCGCTTAAGTTTGGAATTTGGAAGAGTATGGCCAAAATGGTCAAATATGTCCCCATCACTCTGGATCCAAACACAGCCCACTCCAACCTGGAGTTCTCTGAAGAGCTGACCTGCGTGCAGTACAGCAGGAAGCAGCTCCTGCCCGACAACCCCGAGCGCTGCACCAGCCGTCTGTGTGCGCTGGGAGCGACCGGCTTCACATCTGGAAAGCACAGCTGGACAGTACACGTGGGCCAAAGCAGAGACTGGTACATCGGAGCGGTCCGAGAGTCTATCAAGAGGAAGAGCGCCGTCTTCCTCAACCCTGCCGAGGGCTTCTGGGTGATCGGCCTGTGCGGCGGAGACTCGTTCTGGGCTCAGACGTCGCCTCGCACCAAGCTGGTGTTGAAGCAGAAGCCCGAGAGGATCACTGTGGAGCTGGACTGTGACAAGGGAAAGGTGGTGTTCACCAACGCTCAGGATTCGACGACAATACACACATTCAGAGACAGATTCACAGAGAGGATCTTCCCCTACGTCTCCACCGGATTGTACGGGGAGGGGAAACTCTCCAGCCCATTGACGATCTGCCCTCTGACCGTAACACTGGAAGTAAAATAGACTCACACAGCAGATGAAGAGACACCGTTTTAAATTAGATGTGCGCGTTTTAACTTTTGACTGACATAAAAAATAATGATAAAGCCATGATTCACACATGAAATTCAGCAGCCAACTGAACGATACCATACTTTATTGTATGACTTATGTACAATTTATTAAACAAGACTATAAACACTTTCAA\n>XM_041090641.1 PREDICTED: Gossypium hirsutum uncharacterized protein At4g17910-like (LOC107939771), transcript variant X6, mRNA 
\nATAAAAAAAAAGAGTAAAGCCCATCAAAATCCCTAAAAGCTCGTTCCCATGTCTTGCCACAACAATGGTAAAGCCTAACCCATTTATAATCGTCGAGTCCACCAGGTTTTCGGCTTTTGACCCATCCAAGGTGAAAAATATTGTTTGGCTAAAAGCTCTGATCTCCTGTAATAAATTCACAACTGCGTTTTCAAACTCTTCGTCAATGGATTCCTTCCCAAGATCTTTGAATCCCAACAAGCACCTCAGAGAACAATTCGTGAGCAATTTGCCTGGATCTTCCATGCTTGAAGTCTCTGCGCTTTTGAATAATGTAGCTCTTCTAATGCTTTTGCGGCACACTTTCTGCTCTCAAACAGTGAATGATGCTTGTAGGAGTTTAAAGTCTTACCTAGCCTCAGTAGCTTTGGATTATGTCTTCCTTGTTCTACCCACACTTTTAATTTTCACTGTTCTAGCAGAGTGGGTATACATATGCTTGATTGGGTTATTGTTATTGCTGGTCTTCTTTACTGCAGTCAAAAGAACTTACTCTTTGCCTTACATGGAAGGACCTAATGCTTCAAGGGCAAGCATATCATCTTATAGGGTTGTTACGATGTTTATCACATGCTTGTGTATCTTGGCTGTTGACTTCAGAATATATCCTAGAGAATATGCTAAGACAGAGACTTACGGGGCTAGCTTGATGGACCTTGGAGTTGGCTCCTTTGTGCTAATGAATGCTGTTACTTCACGGCAAGCACGAAACATCAAATCATCAATGAGTTGGTGGAAGGCAGCCTTTAAATCTACAACTCCGCTACTACTGTTAGGATTTGCTAGACTTGCTTCTACATTGAGTCTAGACTATCAGGTACATGTGGGGGAATATGGAGTCAACTGGAATTTCTTTTTCACACTTGCTGGTGTATCTATCCTTACATCCATTTTAAATGTTCCCGCAGAATATTCTGGAATTCTTGGTTCAGTAATTTTAGTTGGGTACCAAAGTTGGTTGACTAATGGGCTAAATGTTTATCTTCTTTCTAATGAAAGGGGTACGGATGTCATAAGCAGAAACAAGGAGGGAATTTTTAGCTTATTTGGATACTGGGGTATGTATCTTGTTGGTGTTCAGGTCAGCTACTATCTCTTCTTTGAAAATCATACTACCAAGCAGAGAAGCAAGCATGAAACACGAATCAGAATCTGCCTTCTTACTATTATGTTTTGTGCAACCTGGCTTATGTTACTTGGGTGGTGGCTCAAAATCTACAGGTATCTGAAGATTGACTATCAACCATGACACTGCTAGGAATTTTTGGGTTCGAATTACCATGTTTGTTCTCTATTAGCCTCTCAAGAAAAGTTCACTCAGAAACTTTGTTATACAAATTGAACCCTTGCCTGTGTACCTTGTTTGGTTGTCTTTGGTTATTTTGCTTGTATTTGGATATTAAGAGACGGAGCAACATAGGTTTTTGGTATACTTGATGAACATAGATGCAATTACTTACACAAGATAATCGAAATGCTTGTTGGTGTTTCAA\n>XM_015948335.1 PREDICTED: Nothobranchius furzeri homeobox containing 1 (hmbox1), transcript variant X1, mRNA 
\nTGTAGATCCATCGGCTCCCTGTCGCTCTCGTTGCTGGGATTTGTAGTCTTTGTGTCGAAGAGCGCCGCCGCGTGTCGGGGGCTTCGGTGGGAGTGAAACTACAGTTCCCTCTGAGCTGCTCGGAGGTGTTAGTTGTCAGTATGGCTGTTGTCAGACAGACAAAGCAGAGAGGCAAATAATTCGCCTCTGATTAGAAATCCTTGGAAGAGGGTCGCGCGGGGCACCGCCATCAGATTCGCGTCGTTGCTCGGCTGCGGCAGACCGCGCAGCTGCTCTCCGCTCTAGTTTTAAAGTTAGATGGTTACGTGGACGTCTGGAGCCGAGCAGGATGTCTGACTTCAGCGAGGAGCCGCGCTTCACCATCGAGCAGATTGATCTGCTGCAGCGGCTGCGGCGCACCGGCATGACCAAGCAGGAGATCCTGCATGCGCTCGACACTCTGGACCGGCTGGACCGGGAGCACGGCGACAAGTTTGGCCGCCGCACCTCTTCTTCCTCCTCCTCCTCCTCCTACCTAGTAGGCGGGGCAAACAGCTGCACCAACAACTCTGCCTCCAACACAACCGCCACGTTCAACAATAACACCGCTGCCTCGGCAACCACCACCTCTTCTGCATCGTGTAACGGTAGCAACAGCGGCGAAGGCGGCACCGCGGATCAGTCCGTTGCCGCCGCCGCCTCTTCCACGGCCTCTAAAATCTCTACAGCCACGCAAACTCAGTTTAGTACTGGAGGGGGACTTTCTCCGTCTCCCAGCTATGACACCTCCCCCCCTCCAGGGCCGCCGCCGCCCTCCGCCATCCTGCCGTCACCGGTGTCTCTGGTGGCGCTGTCTCAGAACGGCCGTGACAGCCTGGCTGCCACGCCCAACGGGAAGCTGTCCCCTCCTCGGTATCCGGTGAACAGCGCCGCAGCGTCCCGAGCGTTCGGGTTTGAAGCTGCAGAAGAAGACCTGGACATCGACGATAAGGTGGAGGAGCTGATGAGAAGGGACAGCAGTCTGGTGAAAGAAGAGATCAAAGCTTTCTTGGGGAACAGGAGGATTTCTCAGGCTGTGGTGGCACAAGTGACTGGCATCAGTCAGAGCAGGATCTCCCACTGGCTGCTGCAGCACGGCTCCGACCTGAGCGAGCAGAAGAAGAGAGCCTTCTACCGCTGGTACATCCTGGAGAAAACCACCCCAGGTGCGACTCTGAACATGCGTCCGGCTCCGCTGCCTCTGGAGGAGATGGAGTGGAGGCAAACCCCGCCGCCCCTCAGCACGGCTCCCGGAACCTTCCGGCTGCGGCGCGGGAGCCGCTTCACGTGGAGGAAGGAGTGTCTGGCTGTGATGGAGAGCTACTTTAATGACAACCAGTACCCAGATGAGGCCAAAAGGGAGGAGATAGCAAACGCCTGCAACGCCGTTATCCAGAAACCAGGGAAGAAGCTGTCGGACCTGGAGCGGGTCACCTCTCTGAAGGTCTACAACTGGTTTGCTAACCGGCGCAAAGAGATCAAGAGACGGGCCAACATTGAAGCCACAATCCTGGAAAGTCATGGGATTGACGTCCAGAGTCCGGGGGCACACTCCAACAGCGATGACATCGACGGGAACGACTTCTCAGAGCAGGCCTGTGACCTGCCGTACTTTGACAAGAGACCTCTGAGCCGACCGTTTGGCCTTTACCGCCTGGAGCCCACCTCACCCACACAGGATGACGGCGCCGCTCACAGCGAGCACCAGGACCCCATCTCTCTGGCTGTGGAGATGGCTGCAGTCAACCACACCATCCTGGCCCTGTCCAGGACCGGGGGGGTCCCCAACGACATCAAGACCGAGTCCCTGGAGGACGAATGAACTGGAGCAGGATGCAGCCGGGGACAGAGGAGACGACGGTGGATTTAAAAAAGAGACCAAAATAATCCTACTTAGTAAAGCTGC\n>XM_031476826.1 PREDICTED: Photinus pyralis uncharacterized 
LOC116163007 (LOC116163007), mRNA \nATGGATGAATTTTGTTCAGCAGAGAAAATACTCACTGCAGAACAGCAATACTGTGAGGATTATTTCAATCAAACTACTAAACGTGATTCTTCTGGAAGGTTTATTGTTAAAATACCTTTCAAACCTACTTTAAACAAATTGGGCGACTCTTATGACACTGCTTTAAATAGATTTTATGCCTTGGAGAGAAGGTTAAACAACAATCTGGAATTAAAACTTTCATATTCTAACTTTCTTAATGAATACATTACCTTAAATCACATGACAAAAATTGAGAGAGATAATCAGGTAGCCTTCTACATGCCACACCATTGCGTTCTCCGAGAAACAAGTGAAACAACTCGTCTCAGAGTGGTGTTCGATGGGTCATGCAAGCTTACGAATGGACTGTCCATTAACGATGTTCAATGGGTAGGCCCAAAGTTGCAAAATGAAGTAGTTTCAATTATTGCTCGATTTAGACTTTATTCTTATGTTTTAACTGGGGACATTACAAAAATGTATCGCCAGATTCAAATACATCCTGAACACAAAAAATATCAAAGAATTTTATGGAGGGAAAATGAAAGTGACGAATTATCAGTATATCAGTTAAACACTGTTACATACGGTACGGCGGCGTCTGCGCCATATTTGGCCATTAGATGTTTGATTCAAACTGCACTAGACAATGAAAAAGAATTTGGTTTAGAAGCTCAAATAATTAAGGAAGACTTTTACGTCGATGGCCTTATAACAGGGTCCGACAATCTACAGACATTAATGAGAATGACTATTAAACGAAATATACAACAAATTCTATTTACTGCAGGGTTTTCTTTGCAAAAATTTAAAAGTAATGTCAAGGAACTTAGGGATGATACTGATAATAAATCATTAAAACTGTCTGATAATCAAAATAAAGCATTAGGGGTAGGCTGGAACCCGAAACAAGATTCATTTTTTTACTGTTTTAATTCTTCTGAAATACCAGGACAAATTACCAAACGCACAATTTTGGCAACTACTGCACAAATGTATGATCCTCTTGGTTTACTGGCTCCAATAATCATTACTGCAAAATTGATGGTCCAAGAATTATGGCAAATTAAATTAACATGGGACGAATCAGTTCCTGCTTATTTGCATACAAAATGGTTGACGTTCAAAAACAAATTACATTATATCAATGAAATAATCATTCCGAGACAAGTTCTCATATCCGATTATAAGGTAGTTGAATTACATGCATTTTCGGACGCATCTCAAAGGGCATTTGGAGCGTGTCTTTATCTAAGGTCTATCGATGGTTATGGTAGAGTAAAGGTAGCACTTTTAGCCGCAAAATGTAGGGTAGCGCCATTAATAAATGTCAAATTACCGCGACTTGAGTTGAGTGGAGCAGTTTTGGCAGCTCAATTAACCGATAAATTTAAAAATATATTACGAATAGACATAAACAAACAATATTATTGGTGTGATTCCATGATTGTACTGGCGTGGCTAAAAAATAATCCAAATAAATGGCAAACCTATGTTGCCAATCGTGTTGCTGAAATACAGAGATTTAGTAACCCGGAAAATTGA\n>XR_005729805.1 PREDICTED: Ictidomys tridecemlineatus uncharacterized LOC120886716 (LOC120886716), transcript variant X8, ncRNA 
\nGACTGGGCTGGATAGCCTGGAGGAGGGCCAGCTGGGAAAGGCATGATTACTGTCCTCAAACACCTAGAAGAGCATCGCATGCGGCCCCGGGGGAAGGGGCTGTTAGGGGGAAGCAGACGACTGCTCCTATAAAAAAGGGACTTTGAAGAGGTGGAGCTGGCCAAAGATGGAAGAGGGGCCTAGAAGACGGCCAGCAAGGCAGGACACAAGCACAGTGGATGCTGGAAGGGGACTCAAGCCCCCACAGACAACTGCTGCCAACAAGCAGAAAAGGAGAATGTTTATGCAGCCTAGTCACAAGGGAAATGACATGAGGACATGAGGACCTCAGACGGCAAAATCAAGGCTTCAACACCTTTGGGGAATCCACAGCACAAGAGCCCCTATTTAAGTTCAACCCCAGAATGAGATCAGCTGACACTTGTTCACTCCTCCCTGCGCCCAGGAAATACTTGGTTATGTGTTACTGACTGAAGATTTGGAGTCCCTGTTTCCCATGTTCACTCAGCATCTGACTTGGGCTCCCTGGGCCTCAATTCCTCCATCTATAAAATGAAAGTGATAAAGTGATACTGGCTTACCACGAGAACTATCTAAAGCTCCTGTGAGAGTTCCTGAACAGTCAGGTCTGTGCCAGCATCACTCCTCCAAAAAGCCTTCCTACAGTCTCCCCAGGACCCTCTGTGGCTCCTCACTGGGCTAGCACCCGTGTTTAGGTGACCCACAGCTCCCTGTCCATCACTGTGTGTTTATACCTATTTAATGTTCCTGCATCTGCCTTTAGACCCTGAGCTTCCTGAAGGCAGGGACCATGTGGTTCACATTTCTAACTCCATCCCCGGACCAGAAGAGGCACCAGGTTCAACAATGCAGGAGCTTCTCAGGCAATGTTTTAAATACAATAATGATGGGAAAGCAACCTCTAAAAAGTCTACTGTTCTTTGAAAGACTGACCAGCAAGGAATACTAAACCTACTGAGGACTCCAAGCTGGATGGAAATCAATCTTATTCTCTACTCTCACTGGCTCCCGGAACAGCACCTGGTACTCTAGGAAACTGCCCACACGAGTGATGACCCTCTAGAGACAAACCCCAGCTCTCGGTGCCCAGCAGACCGGCCTTGGACGATCCTCTCCAGCTGATCTTGCTTATCTTGACTCCTGGACAGCCTGCCCCTTGTCTCCCCTTAAAATTTCTGTCTACTTGAGCCTGCTCTGCTTGGATATCCTGAAGGTCATCTCGTCCCTAAAGTCTGCCTTGACTCCCTCCATATTCCCATCACAGTCCTATCCTCTAAACAGCCCATCTAGTCCACCTACATCTTTCCAGGCACGGGATGCAGGCAGGCTTTAGCTACTTTTAAGTCTTCTCTCCCCAGGATGTCAGTAATAGCAGCAGCTGACCCTTAATGCCTCCTCCCTACCATGTACACCTTTCTTCCTGCTAAGACTATAGTCAGGATATCACCACTTCTGTTTGCAAGTGAGGAAACCGAGAGGTTAGCACCTAGTCCAGTCTCACAGCTCTAGTGGCAGCCTGGGGTCTGAACCCCAGCATTCTGACCCTGAACTATGCTCTAACTACAGGTCTGTATGACTTCTGGGGTGTGGGCTTCTCATTGTGCCTAGCTCAGCCACACCCATGTAGGCTTAATAAACGCTATTCTTTTGCATTCCAAGGAA\n>XM_021191354.2 PREDICTED: Mus pahari transmembrane protein 140 (Tmem140), mRNA 
\nACGCCAGTGTGGGTCATGTGTTCCCGTGAGCAACAAGAAGTTGTTTACACTCTTCATTTCTGAAAAGTCATAAGACACAGGCAAGTTAAAGAACGAAAGTGAAATCAGCTGGTAGTGACATCAGTCAGCACAAATGTACCAAAGTTCAGAGAGCTGTTTACTTGAACGCGGCTGCCTGCGAGTGCGGACAGAGCCCAGGAGCTCTGAGCTGTCTGCTTGCAGCTTCTCTCCTCTGCCCTGCTTGCTGGAGCCTGACTTTAAAAAGCAGCTCAGGAGAGGATCGACTCCCGGACAGACAGACGCTGATTTCCTGTGTCACCTTTTGATGAGTGTTCCTGGGCTCTGGCGCTGGTTTTCGCCTCCCTGCAACAGCAGAAGATATGGCTCTCTCCAGGCTGTGGCGGAACAACCACCTGCCCTTCGTGGGCATCATGATCCTCTTGGCCGCCGCCCTGTCCCTGATGTTCTACGCCCTCCTCTGGAAGGCTGGCAACCTCGCTGACCTACCTAACCTGAGAATCGGCTTCTACAACTTCTGTCTGTGGAAGGAGGACATTGGCTCCCTAGAGTGTTACAACTTCCCTGAGCTGGAGATGCTGGGCATTCCTCAGGTTGGCCTAGCCCTGGCCAGGCTTGGCGTGTATGGAGCCCTGGTCCTCACAATCTTCGTCCCTCTGCCTCTCCTCCTTGCCCAGTACAACAGAGATGAGGGAGAGTGGCGGCTGGCCATGGGCTTCCTGGCGGCATCCTCGCTTCTGTTGGCCTGCGGACTGAGCCTCTTCCTCTCCTTCGTGTGGAAGTGGCTCAGGCTCTCCTTCCTGGGGCCTGCCTTGCCAGCTCTGTGCCTAGCCCAGCTGTTACTCATCTTCTTACTTGTGGCCACGGTTAGGTTCCCGCCACGGGACAAGGAGGACAAGAACCAGTGGGAGAGGTGTTAGTCCGGTCTTACACAGGCTTATTATGGGATTGCAAGGGTTTGGTTCCAACTGTGCTCCAAGAAGGGGCCAGAGGACCTGTGGCTGGGTGGGTCCTCTCAACCACCCTGTATCATAACCAATGTTGATCTCCAGCACAGCAGCGGGAACCACCCACTGTGCAGACGGCTGTGGTGTCAAGGAAGCCAGAGGCGGCTTGGAGGGCTAGGGTACCTGCAGTTTCTTAGGGTACCACGTAGCTCATTAGCAGAGGGGTTCCTATAGCCCCAGGCAGGTGGGAGTCGTCAGAGGCCAAACTTCCAAGCTATCTTGGCAAAGTGTCAAACTAGAACTCTGTGACGGTTATGGCAACAAATGGAACAGTTAGGGAAAAAACAAAACAAAACAAAAACTGCTTTAACACCGAGTCCTGACAGCACAAAGAGAAGCCTCACTGACTTTTCAGGGTCCCCTGAATGGGTCCCTGGACCTGACAGCAAACGGTAATCAGCTGTTAAACCATTCTTGTGACCCAGGGGATGCAGACACAAAATGTGTCAAAGCCTGGAAGGTGAACAGGACTGAATAGTCGTCACAAACACACAACGCGTCCCCTCACCTTACCCAGAACTGGAAAGGCAGAAGCATGGTCTTTATTATGCATTGTGGCATCCTTATATATTTTGTTCAGTGTCTATGTATCAGAAAACCTACGTGCCAACGAGTTCTTCATTCTGTGCTCATCAGAAGCCAAAGTGAGTATAAAGA\n>XM_051505439.1 Emericellopsis cladophorae uncharacterized protein (J7T54_008404), partial mRNA 
\nATGCCTTCTGCCCCTGCTCTCGGCGCCCTGGGCGTGACCTTTACGGCCATGCGCGTCATGGAGGGCATTGCGCTCCTCACCATCATCGGCCTGTCTGCCAACTTTATCAGTGACGCCGTCAACGCCGGCTACGTTGCGCCTCCTCCGCTGGTCGGCACTCTTGTCGTGTCCTGTCTGGCCACCCTGTACATTGCCATCAGCTACATCCTGTACTACGACTCGATGCTGCCCATGCTCATCGCCACGGGCGCCGACGCGGCGGTCCTCATCATGGTGATTGTCGTGGCGGTGCTGCTCGGCAAGCCCGTCAGCTACCTCCAGTGCGAGTCGTACCCGTCCAAGGGCAACACGGCCAACTTTATCCACTCTGTCTACAGCAACGTCAAAAAGACCAACTCCAACGTCTTCCTCTGGGTGGACCCGGACAAGACGGCCTGCTACGAGGTCAAGGCCGTCTGGGGCCTGAGCACCGCCCTGTGCATCATGTTTGCCATGTCTGCCATTGTCTCCGGCGTGGGGGGACAGGCTTCTGGTCCGAACGTGCTGCGAAAGGGCCGGAGTCTGGGCACCACGGCGGTGACGGGGCCACAGGAGCGCAAGCTCGCATCGCAGGGATCCGTGGCGTCGTCGTCGTCGTCTTCTGGCGGGTCCAACGTCCACGAGTCCTTGCCCCTGCCTGTTCCTGTTCCCGTTCACCGGGCCTCCCCGCCTCCCACGGCTTCTGAGCGACCGTCACGGTTTGGAGAGGTGGCCCGCCCCGTGGAGAGCCTGCCTCGGCTTCAGATCCCACCGCCACCGCCCATCCCGGAGGATCCTTCTCCTTCTCCTTCTCCCCAGCCGCCGCCAAAGAGTCCGCTGAGCCCGCTGCTGGCGAGGGCTCGGTCGAAGAGAAGGACCATCATGTCTAGGGTGGAGGGCTGGTGGGATCTGGGGTTGCTGGACAGACGGCAAACACTGTTTGGCAAGAGGGGTTGA\n>GQ040491.1 Uncultured bacterium clone nbw955c02c1 16S ribosomal RNA gene, partial sequence 
\nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACAGACGAGGAGCTTGCTCCTCTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATATTGAACCGCATGGTTCAATAGTGAAAGACGGTTTTGCTGTCACTTATAGATGGATCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACAAATGTGTAAGTAACTATGCACGTCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGTTTTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGAAAACTTGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGCAGAGATATGGAGGAACACCAGTGGCGAAGGCGACTGTCTGGTCTGTAACTGACGCTGATGTGCGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAATCTTGACATCCTCTGACCCCTCTAGAGATAGAGTTTTCCCCTTCGGGGGACAGAGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTAAGCTTAGTTGCCATCATTAAGTTGGGCACTCTAAGTTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGATTTGGGCTACACACGTGCTACAATGGACAATACAAAGGGCAGCGAAACCGCGAGGTCAAGCAAATCCCATAAAGTTGTTCTCAGTTCGGATTGTAGTCTGCAACTCGACTATATGAAGCTGGAATCGCTAGTAATCGTAGATCAGCATGCTACGGTGAATACGTTCCCGGGTCT\n>FJ241711.1 Uncultured bacterium clone E53LV6Q02JNG4U 16S ribosomal RNA gene, partial sequence \nTGCGTAGGCGGCGCGGTAAGTCGGGTGTGAAATCCCTCGGCTCAACCGAGGAACTGCGCCCAAAACTACCGTGCTCGAGGAAGATAGAGGTGAGCGGAACTTAGGGTGGAGCGGTGAAATGCGTTGATATCCTAAGGAACACCGGTGGCGAAAGCGGCTCACTGGATCTTTTCTGACGCTGAGGCACGAAAGCTAGGGTAGCGAACG\n>XM_033909212.1 Saccharomyces paradoxus Par32 (SPAR_D00700), partial mRNA 
\nATGGCTACGTTCAACCCCCATAACGAGATGGAGAACCAGGCACGTGTACAGGAGTACAAGGTTTCCACCGGCAGAGGCGGAGCCGGCAACATCCATAAGTCTATGTCCAAGCCGTCTCCCGTACTTCTTCCTTTGAAATCCAACTCAAAGCCAGCAGCAAACAACAACAACAATGGGAGCACACAGGAAAAGGTTCCGCGTTTTGCAATTGGCAGGGGCGGTGCTGGCAATATCTTTCATGATCCGCACCTGACGAGATCCGCCCAACAACTAGACTCCAACGATAATATCAACTATAACGATGTGATTGATGACATTGACGATTATATCTCCCCTATAACTTCAGATATGGTCGATGAAGATGGGCCAAACGCGGTGACAAACACCAGGTCTCGTATCAGCGCGACAAGGAGCCACCAATCTTTGCACGCTTCCACTTCGTCTCCCAACAACAAGGCCCCAATTGTCGTTGGTAGAGGCGGGGCAGGAAACATTTTCTTTAACAAAAAGAAGGTATCCAGCAATGGTGGAAACGAAGAGGACGAGATACGAGGCGGTAATGTTGAGGATGAGGATACGATCAATGCAAACGAGGACAATTTGTTCGTGGTGACTTCGAACGGCAATGCATTGGCGGCAATAAAGTCTACATCCAAGAAACCCAAAAATAAGCACAAGGGCAAAAGCGTGCCGGAAAAATTTGCCATTGGAAGAGGCGGCGCTGGGAACATAATTTCGCCCAAGTCGAGCAGGAACACTATAAACCACAACTCAAACGATGATGATGAGGATGAAGTTAATCTGAAAGACGACAATAGTAAAGAAAAGAAGAAGAAGAAGAAGAAAAAGAAATCGGGGTTTTTCAATTCTTTGAAAACTATGTTTAATTGA\n>XM_008090460.1 Glarea lozoyensis ATCC 20868 hypothetical protein mRNA \nATGACCGGCACTCGATTGTTTGACAGTTCCTTACCCGTTGGGAACAGGTCTGTCGTGGTCAGAGAGCACTACACACTTGAACGCTGCAATGGCTGCTTTGACTCTGATGTACACCGCTGGGGTCAATTCGAGCATTCAGCCCGTGGTGGACAACTCCTTTGA\n>XR_006437666.1 PREDICTED: Triticum aestivum uncharacterized LOC123078769 (LOC123078769), transcript variant X30, ncRNA 
\nAAGGACCAGCGATGGAAACCCTAGACTATCGTTTCCCCAGTCCCGCCGCCGCACGCTCTCCCTCTCGCGTGCTCATTCTCCCACCTCTCCACCTCCAAGCCCCTGCTTCCGCACGTCATTCTTCTCCCATCCTCGCGTCGCCGGTCTGGAGGCTAGAGCTTGTGGCCGACGCCTCCGCTCGCCATTTGCCACGCCTCCGGATCTGAACTCGCCCGCGGTGGCAGCGATTGGTGGATGAGAGCCGAGTCCTGAACGGGAAGCAGCGCCTGTCCCTGTCCCACTGCCGTTGGAGAGGCAAGGATGGTATCGGCCGTGCCGCAGCAGCTCGGCGGCTGCCACTTCTTCACATCCCCATCGAGTCGGCGAGTCGCCCTCTGTCGGGCCCACGGAATCGGCTCCCATGACTACACGTTCTTCCTCGGCCTGTTGTAAACCATGGTTCTTCTCAAGCGCGGGCTAAGGTGGCACCATGGCTCGTGCCAAGGAGGCAGCAGCGACCTGCAAACCCTGCAACCAGCAGTAACACGACATGCTGATATTTCTTCAGGGCGTGGCTGGACTCCCCTCCCAGGATCTCACTCCACCACGGGGCCTTCCTGCTGTGAGCCTCTCTGGACGGGAGCTACAACGCCCGTCCCCATCTCACCTTAGGCAAGATATGTGTAGAATTTGGAAAGGACTTGCGAGCTAGGAAAATTTGGGAAAGGACGTTGGGAAGATAACTAGGTTTTCAGTGTGGAGGAACATGACAATTTGAACCAACTAAGATGCAAGGGCATGCTTCACATGGATTCAGACACAATTTTTTTTGGGAATAGATGGTTTTACTAGCCGATGGCATCAGAGGAGCAGCTGCAAGCGCCGAGTGAGGAATTTTCCTTTTGCTCGCATGTGTCTTGTGGTCACTTGAAACAGAGCACTACCTCTGCTTGCAAGTGTCAGAACTACAGGTTTTTGGCTGAACATTCAATTGTGGCAAAATTTTATTGATCCTCATGATTTTGAGATCTAGTGTGCCTTGTTAGTTTGGAATCAGAAGATGCATGCATGCTGCAACCTTCCTGCTTATCAATTAAGTTCTCTGCATCCTAAACTCGCTGACCTGGTATGATCCGTGTGATTAAGAGATGTTTCACCTTTTCTCCATAACAATTCTACAATGCCCCACAAGAGGGATCCACCACGCCGGTGGACTTCACTTGCCACTCCGGGAAGGGTTTTCACATTCCATTTCCATCCATCAGCTTTTCAGTTCTTGTTAGTTTTCACATTTACATTTCACCATATCGGGGATTTAGAGGGCAGCACTTCTTTCTTGGTTATATTAATCAGCCGCATTGTTTTGTGATTACAGAGAAGAAATGACTTCAACCAGGGCAAATTGATAGGGAGGATAGATTACGGCGAACTGTCTATGTCCCAAACATTGATCAACATGATGCTAAATAGAAGCTTGCTCAGGTTTTCTCAACTTGTGGCCAAACCCTACTCAAGCATCTACACCCTCTTCAGCGACCGACGCCCTGTCTGATGGAAACGAGAGACGGGCGGTCGCTCTGCTTGAAAAGAGAGACAAACGGTCTCTGAGCGAGGGAGGGGCGGAGGTTCGTCTTTGCCGGCCGTATGACATTCCTGGTTGCTGGTGGAGGTGCAGGGCGCTCACCTGATTTAGGGAAGGCACCGTGGCTGTTCGGTGAAGCGGGTTGATGAAGCTGATGTGCTTTGTTCCTAAAAACAATGCATCATCAGTTCCTGGAAGAGTTCAGTACATGCACGTGTATATGTTTCTCTGATGCTCTCCTGTCGCGTTCTTACTCCGGCAGCAGAATCTCAAGCAACTATGGTTCTCGGACTAGGTGGCCCCTCTATCTTCATTTTTATTCTCCAGTACGATCACTTCTTTGACCCAACAATTCCGTTGTGCTATTTTCTTTCCAATCTCAGAATTGTACAGTTGGTTTTCATCCTAGTTCTTCAGGCAAAATTTGAAGTTTTGCT
CCCATTTTTGGTTTGAGGAAATTTAACTTGCAAAGCTACCGCCAGGTGAATTAATTAGGTCCCATGGGTTTGGATACCTCATCTCTTCACTGACTGCATCTCTTCATGTTTCCAGATTGTGCATTGGTCTAGAAATACATACTTAACTCGGTAATGTGGACTTCACTACTGTGGTACACTGTAAATGGCAAGCTTTTACATGAAGCACTTTTGGTGATCCTAAGGATTTGCTACAGAAAAGTATAATATGATATTGAGTTTCATTCTCTTCCTTTCTGCATTTCCTTGAATATTGTGCGTTCAATTAGCTCAACCGGATAGCAAGAAATGTCAAGGGTTAGCTCTTCTGAACATATTCCTCATGGTAGAAATGGCTGGTATACATGCCGACACGCCCATCCGTGTGTTCAAGACTGGCTGATTCACACCATGGCTGATGTGTACACACAAGCTAACCAAAAGGAGCAGAAAAGGGGTGCACACAACATGTCTGCTCGTTAATAACAAGTCAGGAGGGGGCTATCCAAGGACGAGAAAGCTGGGAAGCTCGCATTGCAGCTTTGGCTTAAGCTGTGAGCACTTTTTCGTCAGAGAAGCTGTAGTTTGATGTTTTGGCCAAGCAATGGGCTGTTGTACCACAATGGTGTTCCTAATTGTTGGCTCTTCCATATAGAAGCTCTGAAACAAAATGAGATGGCCTCAAATTAAGGACAGTTAAACCAGCTGCTCCGAGAGGGGATGTTGAGGATAACGACAATGACGAGCAAGTCGGTGTTTGTGAAGCTTCGCCTGAGCCATTCCAGCTCTTCCAGAGGCACAAGGAGAGCCTAAAGTCAGGGTACGTTCAATCGAGGACACTTGATTCTCCAAGAATTTGTTGAGGATAACAATGGCAACGAGCAAGTCGGCATTTGCGAAGCTTCATCAGAGCCATTCCAGCTCTTCCAGAGGCACAAGGAGAGCCTAAAGTCAGGGTACGTTCAATCGAGTACACTTGCTTCTCCAAGAATTTGTATAATCATTAGAAGTCCAAAGAATGAGTCAAGCCAAAGATATGAAAATGGAACACATTTGCGCTCCTACGAGAAGAAGGTCGCGCAACTGAGGATTCAGGACGCCAACAGTGCGGAGCTGTTCGCCATTGAGAGGACCAGGGCTGCCATCAGGGACATCTGGACCAAGTTCAACATCTCCCTTGCCTCCGTCAACGCCGGCGACCGACTCTACAAGCGTCTAGCTGTGCTTTATGACATGATGAATGCTGCCATCGCTTGCTTTTGAGCACCTACAAGTTACCCTGTTGCATGTAATCTCTAAGACTGCCACTCATCAGGCTTGCATGCGCCTGTTAATACCAGGGCTATAACAACACTTTTATGTGTATATACTCAGTTCTGCTTCC\n>LN810097.1 Uncultured bacterium partial 16S rRNA gene, clone HWB-4 \nCGGACGGGTGAGTAATGCGTAGGAAGCTACCCGATAGAGGGGGATACCAGTTGGAAACGACTGTTAATACCGCATAATGTCTACGGACCAAAGTGTGGGACCTTCGGGCCACATGCTATCGGATGCGCCTACGTGGGATTAGCTAGTTGGTGAGGTAATGGCTCACCAAGGCGACGATCCCTAGCTGGTTTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGTAGGGAGGAAGCGTTGAGTGTTAATAGTACTCAGCGTTGACGTTACCTACAGAAGAAGCACCGGCTAACTCTGTGCCA\n>XM_029018326.1 Cryptosporidium ubiquitum uncharacterized protein (cubi_01314), partial mRNA 
\nATGGAAAACGAAGCAGAAGAAAATTTCTCAAAAATGATTAAAGCTGTAAATCCACTTTCTAATGATCAAAAGGTATTTTTGGATTTGGGACAAGAAGGTAAGGCCATTCCAATTGATGCTACAAACACAGGTATTTATGAGTATAATATTACAAAACCAATTACAATCACCAAAAGTGGTTCTTATGTTGAGGATGACGATTCATGTTTAACAACTACTATAACTACTAACGAACTTTGTGATTCAAATAGTGTTCTCTCTGTTGCTGGAGCGAATAACTCAGAAGATATACAAACAGAAGACTCAAAAACAGATGTTCTGGCAAATAAAGATTCTAAAGAAAAACTAGAAGAGCAATCTGCTTTTGATATTCATCCTATTAATATTGACACAGGAGCTGAGGAATTGGTACAATCCGCACAAAGTACCTCTAAATCAGGTCGTCGTTCATCAGCAAATCATGAAGTTGGTTCAAGGCAACTGAAATACAATCAAATTGGAGTATATTGGAAAGATAAAGAAAGCAGAGTTTATGCTAGGTTTACATGGGCCACTAGAAAGTATTCTAAAAGCTTTTATGTGGGCCCCAATAAGCCATATGCTACTGTTAGGGATGCAGAAAAGGCTGCTATCAGATTTTTGTTGATTAATAGTCCATTACATAGAAGAAGCCACTTAAAACATTTTAGATTTTCAGAAAGTGATGAAGAAGGAGAAGAGCCTTATGTTGGTTCTCAAGCACTTAAGGAGGCAAGAAGGACCAAAGGAATCATGTTACATTTCCCTGCTCCTGAAAGTGATGATGAGGTTTGGTCTCATTATAACACTTCCAATATCAATCCTGCAACCTTGTATGGTGAGATTATTAAGAAAATGGATAATAGTGAAGGAAATGCCGCTGGAATAACTAGCCCAATTACATCTGCCAGAGAGTATGTTACAGCTAAGCATAAGCAGAATACCAATACAAACCAAAATGAATCCAAATTTTCCGCTTCCCTTCCAGTAAATTCTACAATTGGAGAAAATGTCTCTTCTGATGACTTATTTTTGGCATTAATGGCAAACCAAATTGAATCCGATAGACTAGTAGAGAGGCAGACTACGGGAACATATATGAACCCATCAGCCAGTTCAACTACTGTTTCCTCTAAGAGATTTAAACCAAATTCCAAAACAGAAACTCTTGATTCTTCTGAATTAAACTTTTTCCCCACGAATTCGAATCAACTTGGATCGGCATTTATGGATCAAAGCTCTTCAACTACCTCCACTAATCCTTTTGTTGGTATGGATTATAATACTTTGGTCGCTTTACAACATGCTCAAATGGCAAATTATTATTTGCAACAGCAAGTGGCATATGCAGCTGCTGCTAATCTTGCAATATCATCAAATACTAGTGGGAACTATGCTAATGCTGCAATACGTACAAACCCATTCATAATTCCACAATATTGCTTGGCACCTGTTACTGGATTAGAATCCAATAAATCTGAAGAATCAGAAGTTGATAAACTCCAAGGTGTTACTTTAAATGTTGGTGGTCTTAAAGGTTCTACTCAGTCTAATGCTTCTAACTCTGTTAAAAACATTGCAGAATCTACACTAGATCAGTATGGTGCAATAATGCCAGGACAAGAAACAAAGGCAATGCCTTCTTCGAATATTACTATTTGTGGTACAAACATTCCAAGTAATTACCATACGGATTATATGGCTGTTATGGCTGCTGCATATTCAGGTTGGTATTCGCCTTATGGATACACTATGCCTTTTATGGGATCATACACCCCAATGATGCCTTCGATTATTCCGAATCCAAATGTATTGGGAAGTCAATTTCATAATAATATAAGTCTATCTACAAATACAACTAATGCAGGTCAGGTTCAATCAAGCAGTGTTAATAATGCTGTTCGATTGCAAAAACAGGTAAATAATAATGTTAATTCCATTGAATCTCTGGTGAACACTCGGGTAGAAAAGGAATTACAA
TCACAAGGTACTTCAGAACAGGAAAATAAACAAGTACCCTAA\n>XM_027495983.1 PREDICTED: Abrus precatorius uncharacterized LOC113862782 (LOC113862782), transcript variant X4, mRNA \nTGCAATTGTACCTTCCCTATGTGAACAGTGATTTCTCCACAACAACCCTTTTTCTCATTCTTCCCAGTGTTTAGCTTTCTCAATTCAGTTGGTGCTGAATGGAAGGTATATTCTTTCTAGTTTGGAATCCTTTCAACTTTGTCTGAAGAATGTTTCAGAATCCTTCTCCAGATTAACATTTTGAGATGGTGTTATATGAGCATTCAGATGTTTTTCAATGGGGTCTTAATATTCTTGACGGTGACCCTGCTTATAGTCCTGGATACTATGGCAACATAATTCAACATGATAATGGTGACATCTATAATGGACACTACTTTCATAGCCATTATGGTAATGAATGTAACCATGTAGAGAATGATGAGATCATTGCCCGCACACTTCAAGAAGAGTTTTCACAGCTGGAGATTGCTGAATCTTCAGGATATTTACAGGCAGGTGAAGAGCAGTTCCATGTTTCTGAGACTGAGCCTGCATATGATTGGCATAACTCTTCAATGGTGAACTATTGTTCAGGAGGAGTTGGTGATGAAGAACCATCTAGCTCATGTTCAAGTCCTTGTGAAAAAGAGGAATATTCATTAGAGCTAACTGACAGTTATCCACTTGATGATGAAGTAGGGAGGAGATTGAGTCAAATGATACCAATTCCTCATGTTCCAAAAATTAATGGAGAAATTCCTTCAATCGATGAAGCAACTTCAGATCATCAAAGGCTTCTGGATAGATTGCAGTTATATGACTTTGTGGAGCACAAGGTACAAGGTGATGGTAATTGTCAGTTCCGTGCTTTATCTGATCAATTGTATCATGCACCTGATCACCACAAGTTTGTGAGACGACAAATTGTCAATCAGCTCCAATCGAATCCAGACATATATGATGGATATGTTCCCATGGAATATGATGACTACTTGGAGAAGATGTCTAAGAGTGGAGAATGGGGTGATCACGTCACTCTTCAAGCAGCTGCAGATTCATATGGTGTGAGAATATTTGTGATGACTTCTTTCAAGGACACCTGTTGCATAGAGATTCTTCCTCATTTTGAGAAGCCAAAAGGAGTAATTTTCTTGAGTTTTTGGGCAGAGGTGCATTACAACTCCATTTATCCCCAAGGAGATATACCTTCAAGTGAGTCGAGAAAGAAGAAAAGGTGGTGGAACTTTGGGAGCAAACATTAACTACACCCCTTTTTAACACATTTTTCCATGTTCAGGAATGAATTTATATCCCCATGTTTTTAGCCGGTCA\n>XM_035510062.1 Lasiodiplodia theobromae Gaba permease (LTHEOB_1369), partial mRNA 
\nATGGCGCGCTCCTCTACCGAGCTAGATGTGCTGCCCGCCGTCTCTTCCGGGAAAGAGTATCACAACATGTCCTCACGCGAGCTGTCTGCCGGCACCGACGATGATCTCCATGAACAGAAGGGCATTACTCGCCATGACCAAGCCGATATGTCGAGAATGGGCAAGGTTCAGGAGCTGAGGAGAAATTATCGCCCGCTGTCCGCCATTGCTTTCACAGTAATTCTCCAGGGCACGTGGGAAGTGCTGATGACTGCGACAACCCAAGGTTTGGTTGATGGCGGTTTGGCTGGCCTGATCTGGAGCTATGTGTGGACCTTTGCTGGCTTTAGCTTTGTTATGGCTTCACTGGCTGAGATGGCTTCCATGGCCCCTACTTCCGGAGGTCAATACCATTGGGTCTCTGAATTTGCGCCTGCAAAGTATCAGCGCTTCCTGAGCTATTTTACGGGATGGATGTCGACCATGTCATGGCAGGCCGGAACCGCGTCCGGCCCATTCCTTGTCGGCACGCTGATTCAGGGCTGTGCTATCGTTGCTTATCCTGACTACTCTCCGACGAATTACCAAGGCACGCTCATGGTTATTGCCGTGGCCATAATCGTCTGGATATTCAACGTCTACGGTGCTCACGCCATGCCCATTCTTCAAAACCTGATGCTCATCGTCCACGTCCTTGGATTCCTCACCATCATTATCGTGCTGTGGGTTTTGTCGCCGCGCAACACTGCTGAGACAGTCTTCACCGTCTTCACCAACGATGGCGGCTGGAACTCCATGGGCCTGAGTTTGATGGTTGGCCAGATTTCAGCCATATATGCTTGTATCTGCTCCGACGCTGCCGCTCATATGTCCGAGGAGATTAAGGATGCCGGTGTCGTCGTTCCCCGTGCCATGGTTTGGTCATACGTCATCAACGGCGGCCTCGGCTTCATCTTCCTCGTGACATACTTGTTTATGATTACCGACGTGGAGGCTGCACTTGAGGACTGGTATCCCCACATCTGGGTCTTCCGCCAGGCCGTCAATGATGCTGGCGTCGTGGGTTTGAACGTGATTCCCACCGTGCTCATCTTCGCCGGCACCGTCTCCTACAACCTGTCCACCTCGCGCCAAACCTGGTCCTTCGCCCGCGACAAGGGCGTCCCGTTCTCCAACTGGATCGCTAAGGTCGACCCGAAGCTGGAAGTCCCCATCAACTCCGTCACCGTCACGACGCTGATCACCATCGCACTGTCGCTCATCAACATCGGCTCCGACGTCGCCTTCAACGCCATCATCTCCCTCAACGTCGTCTCGCTGATGATCACCTACATGACCTCCATCGGTTGCGTCTTGTGGCGCCGCATCTACCACCCGGAGACGCTGCCGACCTGCCGCTGGAGCTTGGGCAAGTGGGGCGTGCCCGTCAACATCTGCGGCTTTCTGTACTCGACTCACGCTTTCTTTTGGTGCTTCTGGCCGAATGCTACGCCCACGGATGCCGAAAACTTCAACTGGGCGTCGGTCATGTTCGTGGCTGTGTTCATTTTGAGCAGTATTTATTATGTCTTTAAGGGCAGGAAGGCGTACGAAGGCCCAGTTGTGTTGACCGAGGGCTGGAAGGGCGAGTGA\n>XM_020885145.1 PREDICTED: Odocoileus virginianus texanus zinc finger protein 300 (ZNF300), transcript variant X2, mRNA 
\nGGTCAGGTGCAGGCCTGTTCGTATGCTGCTGCCGCCATCTTGGGTTGCAGGGCCTGTGCAGGCTTCTGCTCACCACAGGCGGAATTGGGGTTCAGCATAGCGGTTCTGCACCGGGAGCTGTAATGTGATGGGTTAGGTGCAAGGCCTCTGCAGAGTGTCCTATACAGATAAGCAAGTTGCAAGTTGGAGAGTCCTACATGGCAAGATATTGAGGGTGGCTTCCTTGCAACAATCAGCAAGGACATGAATGCCCTTAGTCCAGCAATCTTTGAGGCATTAAATTCTACCAACAATCATATAATTGAGCTTGGAAATGAATCTTACCCCATTTGAGTCTTCAGATGAGAGACCCCAGCCTGGATCAATACCTTGATTATAGATTTGTAGAACACCTCAAAGCAGAGGATTCAGATAATCCATGTCCAGATTCCTGACCCACAGAAACTGTGAAACAATAGATGTGTGTTGTTTAAAACCACTAAGTTTGGGGCCCAGACAAAAGCTCTGAGTAAACTGAATTCCTCTGCTTGTACGGAACTGACCAATCTAACAAGATGGCGGCTCCCACTGAGCCACATAGCACGGGAGTGGCCATATTGCCTCCTGAACAAAGCCGCCCAGGGTGCAGAGTGGGTAAAACTCCGCTGTACGGAACAGTGCACGCCGGGGAGCCCCGCGCTTTGCTCACCCAGACAGGAAGCGGGAGAATTCACCACTATGGATGTGACAGCTGTCTTGGATTGAGCCGTGATGGGCGTTTCTGGAACTGCAGGAAACATTTATTGAACACCTGCTGGGTGCCTGGAGACTGGTGAATATAGAAACTGCATTTTGCAGCCCATCTGTGAAAATACCCTTCTGATCACCAATTTTGCCTTTTCAAGCATCTGCCATTTTAGAGGAGAGCAGAAAAAGATGAAGTCCCAGGGATTAGTATCTTTCAAGGATGTAGCTGTGGATTTCACCCAGGAGGAGTGGCAGCAACTAGACCCTGCTCAGAAGACCCTGTACAGGGATGTGATGCTGGAGAACTATAGCCACCTGGTCTCAATGGGGCATCCAGTTTCCAAACCAGATGTCATTTCCAAGTTGGAGCAAGGAGAAGATCCATGGATCATTAAAAGAGACATACCAAATTGGATCTGTCCATATGAAGACCAGACAGATGGGCGACTAGACAGGAAGAGTAACCTTGACAACCCCCAATCATGTATTTTGGGGTCTGTTTCCTTACATAATAAGATATTGAAAGGATTCACAAAGGATGGTTCATTATACTCCATTTTAAAAGTCTGTCAAAGTGATGGCCAGTTACAGAGATGTCAGAAAAACAGACTTTCCACAAAAGTAACAGTCATCAACAACAAAACAATGACTGTAGAGTCAGACTACAAATATGAGGCACTGAGGAAAATATTTCAAGAGTGCATAGAGTCAGATGCTTCAAGACAAAGACCCTATAACTATGATGCCTTTAAAAAGAACTTGAAATCTAATATTGACCTACCTAGTTGTAATAAGAACAATTCAAGAAGAAACCTTGAGGAGAGTTCTGGATGTGGAAAATCATTCATCCACAGTGTGGCAAATTCTAACCTTGAGAAGATTCACAATGGAGTAATTCCCTGTAATGATATTGAGCATGGAAACATTTTCGGCAAGAAGCAATCCATTATTCATTATCAGAATGTTGAAACCAAGGAGAAAACCTGTGTGTGTGTTACATGTGGAAAAGCCTTTGCTAAGAAGTCACAGCTCATTGTACATCAACGGATTCATACTGGGAAAAAACCATATGATTGTGGTGCATGTGGGAAAGCCTTCAGTGAGAAGTTTCACCTCATTGTACATCAGAGAACTCATACTGGGGAGAAACCTTATGAATGCTCTGAATGTGGAAAAGCCTTCTCTCAAAAATCATCTCTTATTATACATCAGAGAGTTCATACTGGAGAAAAACCATATGAATGTAGTGAATGTGGAAAAGCCTTCTCCCAG
AAATCACCGCTCATTATACATCAGAGAATTCACACTGGAGAGAAACCTTATGAATGTAGAGAGTGTGGTAAGGCCTTCTCCCAGAAGTCACAACTGATTATACATCATAGAGCTCATACTGGAGAGAAGCCCTATGAGTGTACTGAATGCGGGAAAGCCTTCTGTGAGAAGTCCCACCTCATTATACATAAAAGAATTCACACCGGGGAGAAACCCTACAAATGTGCTCAGTGTGAGGAAGCCTTCAGCAGAAAGACAGAACTCATTACACACCAGTTAATTCATACTGGGGAGAAACCTTATGAATGTACTGCTTGTGGGAAGACCTTCTCCCGAAAGTCACAGCTCATTATACATCAGAGAACACATACTGGAGAAAAACCCTATAAATGCAATGAATGTGGAAAAGCCTTCTGTCAGAAATCACATCTCATTGGACATCAGAGGATACACACAGGAGAAAAACCTTATGTTTGTACTGAATGTGGGAAAGCCTTCTCTCAAAAGTCTCACCTCCCAGGTCATCAGAGGATTCATACAGGAGAGAAACCATACATATGTGCTGAATGTGGAAAGGCGTTTTCTCAGAAGTCAGATCTTGTTTTACATCGGAGAATTCACACTGGGGAAAGACCCTATCGATGTGCTGTATGTGGGAAAGCTTTCATCCAGAAATCACAACTCACTGTACATCAGAGAATTCATAGCAGTGGTAAAAATCATAGTGAACTAAAAACACAGACAAGCTTTCAGTATTAGCTCAATGCTTAATACGTAACAGGAACTTGATTAATTTGATAACTTTGTTGAAGCATCTTTATAGAGAAAATTTTACAAGAGAATACATATCTGTAGTGTGGTGATACCTAACTCAGCAGACATGATGGAAAATAATTACATAAATGAAGGCCATTTTCACCATAGCATGTAGAGCTTTTAAAGTTATGAATTGAATGGTTAGTAGAACAAATTATGTATATAGAATGTTGTCAAAGTACATATTCCTTATTATGCCCCATAACAATAAACATTGTGAAATTGCTAATATTAACTTGGCATCATTTTGGTCATATACATTAATTGCCTATAAAGGACATGAAGAATGCTTGATTTAAAAAAATCAATTCCAAGAAACTGCATTAACAAGGAAAGGCTTGGGAGTTCCCTAATAATAGGACTCAACAATTTCACAGC\n>HQ038014.1 Uncultured Syntrophus sp. 
clone F2M5Y2A01B2QEH 16S ribosomal RNA gene, partial sequence \nGAGGAGGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCGCAACGAGCGCAACCCTTGTCTTTAATTGCCATCATTCAGTTGGGCACTTTAAAGAGACTGCCGGTGTTAAACCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCTTTATGCCCAGGGCTACACACGTGCTACAATGGGTGGTACAAAGAGATGCAATCTCGCAAGAGCAAGCAAACCTCAAAAAGCCATCCTCAGTTCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGGCCTT\n>XM_048223246.1 PREDICTED: Ursus arctos SEC16 homolog A, endoplasmic reticulum export factor (SEC16A), transcript variant X12, mRNA \nGGCGGCCGGAGCCGGATGTGCCAAGATGGCTGCTGCGGCTGTCGTGTCTGCGCTCGTCGCCGCAGCCGGGCCGGCTTCCGCCGGCGGCTCCTGAGGGGCTGGCCCAGGGGTCGCGGAGGGGCCGGGCGGGAGTCTCGGCCGCCCTGTGGCGCGCCGTTCAACTTAAGGAACCTATATCCTGCTTCTATCCGTAAGGAGCATCTAATTGTGCAGAAGATCAATCATGCAGCCACCACCCCAGGCAGCCCCATCAGGCGTGGTTGGGCCACCTCCAGCTGGGACTCCTCAGAGCATGTTCTGGTCCAACAGACCGTATAGAAGACAGGCAAATAACAACGCACCGGTGACTCCAATAACTTGCCCACTGCAGCCAGTGACCGATCCGTTTGCTTTTAGTAGACAGGCGCTACAAAATACATCGTTAGGCGGTTCGTCCAAAAGCAGCCCGCCCATTCTGCAAGGCCCGGCCCCACCAGCGTTCCTTCAGCGCCCTGGTCTGCCTGTGCCTCACACAGATGCTGGGGATACCCCCCAAGGACCAGTGTCGCAGCCCAGAGCAGATGGCAGTCTGTTTTCCAGTGTGTTGACCCCTTCAGCACCATCGGAGCCCGAGGTGAACAGGAGTGCTGAGGTTGCTCCCAGCTCAGAACCCGAAGTTCAGACTCTGCCATATTCTCAGTACATTCCAGGAGCGGGTGCTGACAGTTCTCACGGGGGCCATCCGCACACAAATATGCTTGGGCCTGATAGGCTCCTGAGTAGCCAGAACCCGCACGACAGTGCTGCGGCGTTAGCACCATCCCCTTTCTTCCCTCAGCCTCGTCAGCAAATGCCAGGGCAGTGGGGACCCGGGCAGGGAGGCCCACAACCCTCAGGTCAACATTATTGGCCCCGCCCAGAAGGACCTGTTCAGAACGCGGTGCCTCATACCTCCATCGTTTCTCAGTTCCCTGCTCCATCCAACCCGCATCTTGGTCCTGGCCACGAGCAGCTCAGCTCACTGGTGTCTTTGCCAGGACCCTTAGCCAGTGATGGAAGCAATGAGGTGGCCTACCTGCAAAGTGGAAACCATTCAACAAATAATTTTGATCCTGAAAATGCATTCAGGCAAAATTCTAGGGCTGGGAATACTTGGGCGAGCCAGGAGCTCAGGCCAAGTCCAGGAGTGAATAAAGAGCAGTTGCCAGACCTTGCTCTCGTTAATCCCCTCGCTCAGGGAAATAGCCCAGAAAGCCATTTGCACTACCCCCCAGGGGCTGGGACCAGCCGAGCCCTGTCAGAAGTGGACTCGGGGGCTCTCTCCATGTTTTTTCAAGGTGGGGAGACAGAAAATGAGGAGAACCTCTCATCTGAAAAAACAGGCTCTGCTGGTCAGTCTGACTTCGACGGCTTCTCCCCCAGCCCCGCGCTTGGTCATCCTCCTGTACATGTGGGAGCAGGCGGCATT
TACCAGGCCCTTCCCAAAGGTTCCAACAGTGAGGCCATGCAGCAGGGAGGACACCCGCAACCTTATTTTTCTCAGTCTGCAGGCCCCCAGCCTGATCGACCCACCACGGCCAGTGCTGCCATTGCTGCGTGGGGCAGTGCAGCAAGTGCGGGGGCGCACGCAGCCAGCAGCTCGCAGTCTGAGAATGTGGAAGACCTAGAATTCATTCAGAATCAAGAAGTTCTGCCAAGTGAGCCCCTGAGTTTGGACCCTTCCTCCCCAAGCGATCAGGTCAGATACGGGCCCCTTCCTGGGCCAGCCGTCCCCAGGCTCGGTGTTGTGGGCCACGCTGGAGGTGGGGGTCCAAATCTCGAGGCCCCGGATTCAACGCCACACCCTGTGCGGTCTGATAGCGTGTCATCCGGTTACAGCAGCAAGAGCCACAGGAATCTTTCGAGTGCAGCCAGGCCCCAAGACGTAGGCACTTTCATTCAGCAAGAAGTTGGAAAACCTGAAGATGAGTCTTCGGGGAGTTTTTTTAAGCAAATTGATTCTTCCCCTGTGGGAGGAGAGGCAAACGAGACCACCGTGAGCCAGAATCACCGCAGCAGCCTGTCCCAGACCTCAACCCCAAGCCCCCCAAAACCCACTGGAATATTTCAGACAAGTGCAAATAGTTCTTTTGAACCAGTGAAATCCCACTTAGTTGGAGTAAAACTCGTCGAGGCCGATCGCGCCAACGTGGTGGGTGAGGTGAGAGGGACCATTGCCCACCAGAAGCAGCGCAGACCCGCTGCTGCCCCACCCGACACTTCCCCCGGCAACCTGGAGCAGCCACCGGACAACATGGAGACCCTGTTCACACTCCAGGCCTGCTCTCCGCCCTTTTCCATACCTGTGGAGCCCGGGTACGGGCTCGTACATGCTGGGGGGCCGCCCTTGGAAACTGTGCCCCTGGCAGCTGAGAAAAGGCCTTTGGCCAGAGCCCAGGGAGCCGTGAAGTGTGAGAGCCCAGTGACAACGTTGTGGGCACAGAACGAGTTGCCAGATTTTGGAGGCAACGTCCTTCTAGCCCCAGCTGCTCCTGCGTTGCACGTGCCTGTGAAACCACAGCCATCCGAAGTGATCCAGCCGCCAGATGAGGGCGCGTCCGCTCTGCAGTCCCAGCAGCCAGGCTCTGGCCTCCCTCTGCACAGTGGGGACAGCATTGGTGCTTCTGAGAACCTCGAGAACCCTCCCAAGATGGGAGAAGAGGAGGCCCTCCCGTCACAGGTGACAAAAGACGCTCAGGAACAGCGTGGCCCAGAGAGAGCCCAGCAGGAGCCAGCACCACCTCCCCCACAAGGGCCCAAAGCAACATGTACAGATCCTTCAAACCCAGGAGGTCCACCCGTGCAGGGACAGCCCCAGAACTCGGTCCCACCACCCACAAGCCCAGCTCCAGCTGACGCAGGTCAGCCACTGCCGCCTCGGCCACCTCGGTCTTCCAGCGCGTCGGTCGTGTCTACCAGCTCGAGCCAGGCAGCCGTGCGGTCAGACCAGCACTGGCTGCAGCCGCCTCCTCCAGACCTGGCATCTTACTACTATTACAGACCCTTGTATGATGGCTACCAGTCCCATTACCCCTCGCCATACCCACCGGAGCCTGGCACGGCCCCCCTCTATTATCAGGACGTCTATGGCCTGTACGAGCCCAGGTACAGGCCCTATGACAGTGCGGCGTCTGCCTATGCTGAGAGCTACCGCTATTCCGAGCCTGAGCGACCCAGCTCCCGAGCAAGTCACTGCTCAGACCGGCCGCCTGCCAGGCAAAGGTACCCTGAAGGTTACTACAGTTCCAGAAGTGGGTGGAGCAGCCAGAGCGACCACTATGCGGATTATTACCCCGGCCAGTACGATTACGCAGACCCAGGTCACTGGGACCAGTACCACTATGGTTCCAGATTCAGGGACCCCCGCGCCTGTGACCGGAGGCATTGGTATGATGCTGAGTACGACGCGTGCAGGAAGGACAGCTGTGC
GTACGGTGACAGGCCCGAGAGGTACGACGACCCCTGGAGGTACGACCCTCGCTTCACCGGCAGTTTTGACGATGACCCCGAGCCCCACAGGGACCCGTACGGGGAAGAGGCGGACAGGCGCAGCGTGCACAGCGAGCGCTCGGCCCAGAGCCTGCGCAGCAGCTTCAGCTCCCACTCACGTCAGAGTCAGATTTACAGAAATCACGGCGTGACTGCTGCTCCCTATGAGGCCCCACATCCCCCAGGCTCCTTGCCTGGAGATTACGCCTACGGGGCCTATGGCAGCAATTTTGGCAGTGCCCAGGGCTTCCCAGAGTACGGCTACCCTGCCGAAGCTGGCTGGCCCTCCACGGAGCAAGCTCCGTCAAGACCAACTTCTCCTGAGAAGTTCTCAGTGCCTCACGTCTGTGCCAGGTTCGGGCCTGGGGGTCAGCTCATTAAAGTGATTCCGAACCTGCCTTCGGAAGGACAGCCGGCGCTGGTGGAGATGCACAGCATGGAGACTTTGCTGCAGCACACGCCGGAGCAGGAGGAGCTGCGCTCGTTCCCAGGACCGCTCGGCAAAGATGACACCCATAAAGTGGATGTTATTAATTTTGCACAGAACAAAGCTACAAAATGTTTGCAGAACGAAAATTTAATTGACAAAGAGTCTGCAAGTCTCCTTTGGAATTTCATTGTTCTCTTGTGCAGACAGAATGGGACCGTGGTGGGAACAGACCTCGCAGAGCTTTTGTTACGAGACCACAAAACCGCGTGGCTTCCTGGGAAGTCACCCAACGAGGCCAACCTGATTGATTTTACTAACGAGGCTGTGGAGCAAGTGGAGGAAGAGGAGTCCGGGGAAGCCCAGCTCTCATTTCTGACTGACAGCCAAGCAGCTAGCAGCAGTGCTCTTGAAAAGGAGACGGAGAGGTTCCGGGAGCTGCTGCTGTACGGCCGCAAGAAGGATGCTTTAGAGTCTGCGATGAAAAACGCCTTATGGGGTCATGCTCTGTTACTTGCAAGTAAGATGGACAGCCGGACACACGCCCGCGTCATGACCAGGTTCGCCAACAGTCTTCCGATCAACGACCCTTTGCAGACAGTGTACCAGCTGATGTCGGGGCGGATGCCTGCTGCGTCCACGTGTTGCGGAGATGAGAAGTGGGGAGATTGGAGGCCACATCTTGCTATGGTTTTGTCCAACCTGAGCAGCAACGTGGATGTGGAGTCCAGGGCAATGGCCACCATGGGTGACACTCTGGCTTCGAAAGGTCTCCTAGATGCTGCGCACTTCTGCTACCTCATGGCCCAGGTCGGACTGGGGGTTTATACAAAGAAAACCACAAAACTTGTCTTAATTGGATCAAACCACAGTTTGCCGTTTTTAAAGTTTGCCACCAATGAAGCTATTCAGAGGACAGAAGCCTACGAGTATGCCCAGTCTCTCGGGGCACAGACCTGCTCCTTCCCCAGTTTCCAGGTGTTCAAGTTCATCTACTCCTGCCGCCTGGCCGAAATGGGGCTGGCCACGCAGGCCTTCCACTACTGCGAGGTGATTGCCAAGAGCATCCTGCTGCAGCCCCACAAGTACTCGCCCGTGCTCATCAGCCAGCTGGTGCAGATCGCGTCCCAGCTGCGCCTCTTCGACCCGCAGCTGAGAGAGAAGCCGGAGGAGGAGGCCTTTGTGGAGCCTGCCTGGTTGGTCCAGCTGCAGAGTGTGGACAAGCAGGTCAAGGAGGGCGCCGCGGTGTGGAGTCGGGGCGGGACCTTCCCCCAGCGCTGTCCCAGCACCCCGAGCTCAGAGGCGGGTCAGTATGACGGGCCAGCACTCTCCCAGCCGGGGGGCCCGGGCACCGGCAATCCGCTGCTGGCACCGCCTGTGCCCAGCGCTGAGCACTTTGGCCAGGGGGTGCGGCTGCTGCCTTCAGCTCCGCCGACGCTCCCCGACAGCCATCCGGCCCTGCCCGCCAGGGTGCCCTTGTTCCCGGTGCCCTCGCCCCCGGGCCCTGTTGAGC
TGGGGCCTGGCTGTGGACCCTCGGGGGCTGCCCTCGGCTTTCCGGAGCCCTCTGGGCCTGACCCCGTGGCTCCGTACGCGGCTCCTGGCCTGCCACCTGGCGCACCATCTCCGCAAGAAAGTGAGCACGCGCCCCAGGAGGCCCGGAGCCAGGACCCAGGGGTGATGCCACCGGAGGTGCTTGGTAGAAACTCGCTTCTGGAGCTGAGAGAAGAGGGTCTTGGCGGAAAATTTGCTGATCTGGGCTCCTCCATGATGTCACAGGACTCCGAGGTCCCCCCGGGGTGGGAATGTGCTGGCTCCAGTGTTCTGCAGCCACCGACGTCCACTCCCGAAGCGAAGAGACCTGCACCAGCAGCCAGGAAAGAGGCCAAGGAGCCCAAGAAGAGTGGCGAGTCCTGGTTCTCTCGTTGGCTCCCTGGGAAGAAAAGGACGGAAGCTTATTTGCCAGACGACAAGAACAAATCGATCGTCTGGGATGAGAAGAAGAACCGATGGGTGGATGTGAACGAGCCAGAGGAGGAGAAGAAGGCTCCGCCCCCACCACCAACCTCGCTCCCCAAGGCTCCACTCACTGCACCCCCCGGTCCTGGAGGGCCCCCGAGGGCCTCTGTGAACATGTTTTCTAGGAAAGCAGCTGGAGCCAGAGCACGCTACGTGGATGTTTTCAACCCGGGGGGGCCCCAGCGGAGTGAGCCGGCTCTCGCTCCAGCAGAGTTCTTTGCTCCTCTTGCCCCGCTCCCGATTCCTGCTCACTTGTTCGGACCAAACACAGACGCAGAGGAAGCTCCGCCTGCAGAGGGGGCTGGCAGGGAAGGGCAGGCGCCCGTGGGGGGTCCGGCCAACCCAGAGCCGGCCTCGGAGCCCCAGGTGTTCAGCTCGGCGGTGGCGCTCCCTGGCCCTGAGCTCCCACCCGCCCGCGAGGACGGCTCCCAGGGCGGAGAGCTGTCGCGCTGTAGCTCAGTGAGCTCGTTATCACGCGAAGTAAGCCGGCACTTTTATCAGGTACCTGTGGCCGGCGGCTCTCACCGGACGCGAGTTGAACTGGGTCGCCTTTGTGTTCCTTCTGAGAGCGCTGTGCTGGCTGGCCGTCGTGCCCTTGTCACTCACGCGGCCCGCTGCCTCCCCGTCCCCCTCACGCCAGAGGATGCAGTGTTCCTTTCTCCCAGGGTCCTCGGGGGGTCGGGAGCCGTCCACGTGCACTGATGCGCACGTGGACCCCAAAAGGTTCCTAGTGAACGAATGCAGTTTGTAATTGTGTTCTTTCCAGATTGGTTTGTCCACACGGCAGCCGTGGGCGTAGCCTCACCGTGTGTGAGTGGGCTTCAGAAGCCCGCCAGGGGCAGGAGGGACTTGTGTTCTCTGACCGAGCGCGAGACGGCGTCGCGTAGGCCCGGCAGAGAGCGGCGGGCGGCTGTCCTTTGGCCAGTCTGGGCGGGAGAAAAAGGAATGCGTCATCTTTTATGTGTATCGTGGCACAGCGTTTCCGTTGGCTCAGTAGAAGGCTTTACGTGACCTTTTTATTTGCGTACTAAAACGCTGGATTTTGTAGCTGGATACTGGAGTCTGAAGTAATCAAAAATGTCTACTAACTGCTTCAAGCCGACGCTAACGGGCCGTCTTGGTGCCGTGCACTCCGCGTTCCTGCATGTTCTGGTTTTAAGGCATTTCTCTCTGCATGCTGCTTCATGTTTTCCCATTTTCCTGTGAACCTTGGCGTAATTAAATCCAGTGTTGCGAGAAGTGTCTGCCAGCTGCTTCCGTGGCTTACTTAGAAGCGCTGTAAACGGTTCCCGGAGACCAGTGTCTGTTCACAAGGGGAGCAAAGCGCTGGGATGGCGCTGTGTTGACGCGTGCTCTCTGTGGT\n>XM_012078672.1 PREDICTED: Cercocebus atys galectin-7 (LOC105594508), transcript variant X1, mRNA 
\nGTTGCCCTGTCTGGCACTATCGCTGTGGTTGTAGCCGCTGTTGCTTTAGAGACATAGAAGCAGGGATTTCAGCGCAGACATTTCCAGTCCAGGCAGGAGGTTCTTAGCTGGAGAGAAGGGTCTAGAGTTCCCGCTGGGCTTGGCTTCTCAGGACCCAACATGTCTGTGTATAAAATAAGCATGAGACACTCTCCGTGCGCCAGGCAGTGGGAAGGCAGGGCTGGAGGGGCGGTGGCACGAGGAGCCTTCTCTGCTAACGTCCCCCACAAGTCCTTGCTGCCCGAGGGCATCCGCCCTGGCACGGTGCTGAGAATTCGTGGCTTGGTTCCTCCCAATGCCGGCAGGTTCCACGTAAACCTGCTTTGCGGGGAGGAGCAGGACTCCGATGCCGCCCTGCATTTCAACCCCCGGCTGGACACGTCAGAGGTGGTCTTCAACAGCAAGGAGCAAGGCTCCTGGGGCCGCGAGGAGCGCGGGCCTGGCGTTCCTTTCCAGCGCGGGCAGCCCTTCGAGGTGCTCATCATCGCGTCGGACGACGGCTTCAAGGCCGTGGTTGGGGACGCCCAGTACCACCACTTCCGCCACCGCCTGCCGCTGGCGCGCGTGCGCCTGGTGGAGGTGGGCGGGGACGTGCAGCTGGACTCCGTGAAGATCTTCTGAGCAGAAGCCCAGGCGGGCCCGGGGCCTTGGGTGGCAAATAAAGCGTTATCCCGCAGCG\n>EU356148.1 Uncultured bacterium clone 053.F4 16S ribosomal RNA gene, partial sequence \nGAAGGGTGCAAGCGTTACTCGGAATTACTGGGCGTAAAGCGTGCATAGGTGGTGAGTTAAGTCTGTCGTGAAAGCCCCGGGCTCAACCTGGGAATGGCGATGGATACTGGCTCGCTAGAGTGCGGTAGAGGGTGGTGGAATTCCCGGTGTAGCAGTGAAATGCGTAGAGATCGGGAGGAACATCAGTTGCGAAGGCGGCCACCTGGACCAGCACTGACACTGAGGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGCGAACTGGACGTTGGGAGCAACTAGGCTCTCAGTGTCGAAGCTAACGCGTTAAGTTCGCCGCCTGGGGAGTACGGTCGCAAGACTG\n>XM_036526509.1 PREDICTED: Megalops cyprinoides Janus kinase and microtubule interacting protein 3 (jakmip3), transcript variant X3, mRNA 
\nAATGGTAAAATGCCTGTGTGTGAGGAGACGCGCAGACGGATTCTTTTTAGGATGTGCGCTTTAGCCCACAGCAAATGGTTCTTCACCGGATGCTAGGGGAGCTACACAGCTAAAGCAAGCAGACAGCATTCAGCCTAACTGGATCATGGCTTTAAGGTGGGAGAGAAGATGTAGGTGAGGATTCGCAGGGGGGAAGAGAAGCCTGACACCTCCCATCCTCAGGTTCTTCCTGTGGGGGCGGGCCGGCCCGAGCCGGGATCAGTGCCTCACCATGTCCAAGAGGGGGTCCGGCGGCCGAGCCAAGGGGGAGCGGCCCGATGCTCTAGCCGCCCTGCAGGCGGCGAATGAGGAGCTGAGGGCCAAACTCACAGACATCCAAATCGAATTGCAGCAAGAGAAGACTAAGGTCAGCAAGTTAGAGCGGGAGAAGTCCCAGGAGGTGAGGCAGGAGCAGCACAAGTCGACGGTGGTGGTGACGGAGCTGAAGGCCAAGCTGCACGAGGAGAAGGTGAAGGCCCTGCACTGCGTGCGTGAGACGCTGCTGCGGCAGCACGAGTCCGAGCTGCTGCGGGTCATCAAGATCAAGGACAACGAGATCCAGCGGCTGCAGGCGCTGGTCAACGCCCTCCGCGACGGCTCCACCGACAAGGTCAAGACGGCGCTCTTCGCCGAGGCCAAGGAGGAGGCCAAGCGCGGGTTCGAGAGCGAGAAGAGCAAGATGCAGCAGGAGATCTCCGAGCTGAAGGGCGTCAAGCGGCAGATGGAGGAGGCGCTGACTCTGGCCGTGCAGGCCGACAAGATCAAGGCGGCCGAGATCCGCAGCGTCTACCACCTGCACCAGGAGGAGATCACCCGAATCAAGAGGGAGTGCGAGAGGGAGATCCGCAGACTGATGGATGAGATTAAGGTAAAAGACAGAGCAGTCTGCCTGCTGGAAAAGGAGCTGGGCGTCCAAGCAGGGCACACTCAGAGGCTCCAGCTCCAAAAAGAGGCTCTAGATGAGCAGCTTGTCCAGTTCAGGGAGGCTGAGCGACATCTGGCCAGCCCCAAACGAGAGGCCCCTTATGCAAGTGGTGCAGGAGACGCCTCTGATCATTCAGGAAGCCCTGAACAGCAGCTGGACGAAAAGGACGCGCGGCGCTTCCAACTTAAAATCGCTGAACTGAGCGCCATCATCCGCAAACTGGAGGACCGCAACGCGCTTCTTTCCGAGGAACGCAACGAGCTGCTGAAGCGTCTCCGTGAGGCCGAGAGTCAGTACAAACCTCTGCTGGACAAGAACAAGCGTCTGAGCCGTAAAAACGAGGAGCTGGCCCATGCCTTCAGACGCATGGAGAACAAGCTGAGATTCGTCACCCAGGAGAACATCGAAATGAGAGAGAAGGCGGGAAGCATTCGCCGGCCCAGCTCCCTGAACGACCTGGACCAAACTCAAGAGGAGAGAGAGATCGAGTTCCTCAGGCTGCAGGTGCTCGAACAGCAGAACATCATTGACGATCTGTCAAAGGCGCTTGAGACAGCTGGATATGTGAAGAGTGTAATAGAGCGGGACATGTTGCTGAGGTACCGGCGGCAGAGAAAGAGAGTCATCAAGCCCTGTAAGCCGGTTGTGGAGACGTTCTTCGGGTATGACGAAGAGGCGTCTTTGGATTCAGACGGGTCCTCCATATCCTACCACACGGACAGAACACCCTGCACGCCGGACGACGACCTAGAAGATGGCCTGATCAAAGAGGAGACGGAGCTGAGGTTTCGTCAGCTGACCATGGAATACCAGGCTCTCCAGCGCGCCTACGCACTCCTACAGGAACAAGTCGGGGGGACGTTTGATGCAGAGAGAGAAGTAAAGACAAGAGAACAACTACAGGCAGAACTCATCCGGTACCAAACAAGAATAGAAGACCTCGAGTGCGCTTTGACCCAGCAAGGCCTGGACGTGAAGTGGATCGAGGAGAAGCAGGCCTTGTATCGCCGAAACCAGGAACTTGTGGAAAAGAT
CAAACAGATGGAGATGGAAGAATCCCGCCTGAAACATGACATTCAGGACGTCAAAGACCAAAACGAGCTTTTAGAATTCCGTATACTAGAACTAGAAGAGCGGGAAAGGAGGTCCCCAGCCGTCAACTTCCACAACATCCAATTCACGGAGGGCATGAGCCCCCTGCAGGTATACTGTGAGGCAGAGGGCGTCACGGACATCATCATCACCGAGCTCATGAAAAAACTGGATATTCTGGGGGATAACGCCAATCTCACCAACGAGGAGCAGGTGGTTGTCATTCACGCGCGGACCGTTTTAACTTTAGCAGAAAAGTGGCTGGAGCAAATAGAGGTCACCAAATCAGCTTTACAGCAGAAAATGCTGGACATTGAGAACGAGAAGGACCTGTTCAGTAAACAGAAGGGGTATTTGGATGAAGAGCTGGACTATAGGAAACAGTCAATGGATCAAGCACATAAGAGGATCCTGGAGCTGGAGGCCATGCTGTTCGACGCGCTGCGGCAGGAGGCCGGGGCCAAGATGTCGGAGCTGCTGTCCGAGGAGGAGCGGGAGACGCTGCGGCGGGCCGTGGAGCAGTGGAAGCGGCAGGTGATGAGCGAGCTGCGAGAGAGGGACGCCCAGATCCTGCGGGAGAGGATGGAGCTGGTCCATCATGCACAGCAGGTTACATCACTGAGATGGCAATCAAGCGGACACCATTGCTTGGAGGGAAAAATGAACACATTTTTGTTACACAGTGCAGTTACACAAATGTTAATGTATTGCAACCTCCTTGTTAGGTTACAAGTTATATGCTGTTTCCCAGCTGAAATGTGTTCAAATATTTACTCACTCTGAACTGAATTCAATAAGGTAGCTGCAAATCACCACCCCCTAGACTGAGATAGAGTGTAGAGCACTCGTGATATATTTGCTGATATTTATGACTCATTTCAGTAGTA\n>XM_041210960.1 PREDICTED: Carcharodon carcharias tbl1x receptor 1a (tbl1xr1a), transcript variant X1, mRNA 
\nGGGGGGGAAGGGAAGGAACAACAAGAGGAGGCCGCCCAGCAGCCAGGCGGAGGAGGCCAAGTGTGTGCAGATCCCGGTTCTGCAGTGTTGTTAAGTACTGACATCATTACACCCTTTGCTGGACCTGAGATTTCGCACAGTCAGTGTTTGAAGCTACTATACCACATGCCCAGTGATCTAAGGTGACGTGATACAACCATCCTTAATTGGTCCTGAGGGTTCAAAATGTGTTAATAGCCTATTCATGAAAGGCTTACCCTGTAATGACCTCATGGTTTAAGTGGGACTGAAGATGAGTATTAGCAGTGATGAGGTCAACTTTCTGGTATATAGATATTTACAGGAGTCTGGTTTTTCCCATTCAGCGTTCACATTTGGTATAGAGAGTCACATCAGTCAGTCCAATATTAATGGTGCCCTGGTGCCACCAGCAGCTCTCATCTCGATCATACAGAAAGGTTTGCAGTATGTGGAGGCTGAAGTCAGTATCAATGAGGATGGCACACTATTTGATGGGAGGCCCATTGAGTCCCTTTCTTTAATTGACGCTGTAATGCCTGACGTGGTGCAGACAAGACAACAAGCTTATAGAGACAAGTTGCAGCAACAACAAGCAGCAGCAGCTGCTGCTGCTGCTGCAGTTAGTCAACAAGGGTCTACAAAGAATGGGGAGAATACTGCAAATGGAGAGGAGAATGGCGGACACGCAGTTACGAATAATCATACAGATATGATGGAAGTTGATGTAGATGTGGATATTCCATCCAATAAAGCTATGGTATTGCGTGGCCATGAATCAGAGGTTTTCATATGTGCCTGGAATCCAGTCAGTGACCTCTTGGCATCTGGATCGGGAGACTCAACAGCACGGATATGGAATCTTAGTGAAAATAGTAGTGGTGGCCCCACCCAGCTAGTACTTAGACACTGCATAAGGGAAGGAGGACAAGATGTACCAAGCAACAAAGATGTTACATCTTTAGACTGGAATAGTGAAGGCACACTTCTAGCAACAGGTTCGTATGATGGATTTGCAAGAATATGGACAAAAGATGGTAACCTTGCTAGTACGTTGGGTCAACATAAAGGACCGATATTTGCATTAAAATGGAACAAGAAAGGAAATTTTATCCTTAGTGCAGGAGTGGACAAGACAACAATTATTTGGGACGCGCATACCGGAGAGGCCAAACAGCAGTTCCCTTTCCACTCTGCTCCAGCACTAGATGTTGACTGGCAAAGCAACAACACGTTTGCCTCTTGCAGCACAGACATGTGCATCCATGTGTGTAAACTAGGTGCAGATAGGCCCATCAAGACATTCCAGGGACATACGAACGAAGTGAATGCAATCAAGTGGGATCCAACTGGGAATCTACTCGCATCTTGTTCCGATGACATGACCCTAAAGATCTGGAGCATGAAACAAGATACATGTGTTCATGATTTACAAGCGCACAACAAAGAAATCTATACCATCAAGTGGAGTCCAACAGGACCTGGTACTAACAATCCAACCGCCAATCTTATGTTAGCAAGTGCATCATTTGATTCTACTGTACGACTATGGGATGTGGACCGAGGTATCTGTATCCACACTTTGACCAAACACCAGGAACCTGTATACAGTGTAGCGTTCAGCCCAGATGGCAGGTACCTGGCTAGCGGCTCTTTTGACAAGTGTGTTCACATCTGGAATACTCAGACAGGTGCTCTTGTCCATAGCTACAGGGGAACAGGAGGAATCTTTGAAGTGTGTTGGAATGCAGCTGGGGATAAAGTGGGTGCAAGTGCATCAGATGGTTCAGTTTGTGTGTTAGACCTCCGGAAATAGCGCTGCTAGCTGGAAGCCATGGACCGACAATGAATGTGTACATAGCCAAAACGACTGTCCCTGCCCCATGCACTGCTACAGTCTCACTTGAACCATGGCCAGTCCACTACAGCCAAAACAAGTCAGAATGCAAAACCCAGGACAACTGAGCCCTGATGTGAAGA
GTACCCTGACTGCTTAATGCTGGAAGCTCCACCCACAAAGAAAAGTCAACCTTTCTTGAAGGTTTAAAACAACTTGAAATAAGACTTGACATGAGACCATATGTGTACCAAAATGGAAAGATAATATCAGAGGACAAAAATATCTTTTATTTTTTTGGTCCAGAGTCTATGTAGAATGAGTTATCTTGTCAGCAGTTCAGCAGATCTGTGTGCAGACATATCAGCTTCTTTCAATCAGCAGCAAATAGTTTGTTCCCTTGTTTTAAACATTGTTTTATCACTTTAGTTTACAGTTGCATGATGTAGGAGAGTGACTGTATCTTGTTTATCTTGTTTTTTTTCCTACTGACACTTAACACACAACTAGAAAAAAACTTTTTTATGGATACTATAAGCAAAATAACAGTGTATTTGGTATGTTTTTGGTACATTTTGTGGCTCAACAAACTAATATGTGGGGAAACATGAAACCGCTCCAAAATTCAACATAAAATTAGTTTCATTATACATCAGTCATAGGTAACAAGCTGTGGTTTACAGGTGATGTGGCTAAAATGTAGTAGTTTCTTAATGGGGACATGATTCTGCCGATTTATGAGAATTAAACAAATGGGCACAAAGAAAGAGAATCGATGCAGGGATGCATCCCATTGCTTTAAGACCATAGTTTGCATATGGTTGGATTGTGCACTATTGATAGAGCAGCTTATAGAATTTTGAAAGATAACTTTTCTGGACAGAGAATTATTACTGTTACTCTACTTATTCTTTGGTAGACCTACAGGCATAAATTTCACAGCAAGGTTCCAGTATTAAGGACTGATGTCTCGTAAGCAATGTTTTTAAAAACCTATCCAGTGCAATGAGATAAACCTCCCTCCCCCTCCCTCTGCCATTGGGCAGAAATCATGCAGGCATATGTTTTATGTTAATGCTAAGATAAGGGTTGACTTTGCTTTAATTTTCTTTCCTTGGTGCTCGTGTATTACACATGGGTTCATCTTGGCTCAGCCCTCTAAAGTACTTGCACTTGCTGTATTGTTCAGTAAAGTACAGGTAGTATAATTGCAATAGCTTTTTTTAGAATAAAAGTATATTCTATAAAGTATAGCATATCTGAGCTTTTAAACCTCAGGGGACCCTTCTTCAGATGATGAAGTGGTTAAACAAATATTTCTGCTACAAGATGCTCAATTACTTTTTCACACGAAGAAATGACGTTTGAGGTTTCAAATCCTTAGATTTAATGCATTGTAAAATGTTAGTCTAAAAAAGGTATTCTTCTATTTCCCATATCCCATGCAACAACAGATCAATGAAATGAAGTTACTGTTGCAAAGGCTTTATACCACCACTTCAAACTTGATCTGTTTTCCAACTCATTAAAAATGCAAGGTTAGTTGCTTTTTTGTTTAAATAGAAACATGAGTAAGAATAATTTCTGCACAAATGTTGGATTTTTTGTCCTTGGAGTAAAGTCTGTTGTTAATCTGAATCTAATCTAATCATTTAGAACTGATTATAGGTAACGTGGTATAATCAAATAGCTGCTATTCCAGATATTCCAGTGTCTGCATCACTGAAGTTGACCAACAAGTTCAGAACAGCTCCTAGATGTTCATTATGGGCTATTTGTCAAGTAGAGTAACAGTTATTAGGCAGCTTTATCACATTTCTAAGAAAAAAAACCATTGGTTATGTTATTTACTAGCCTTTTGTTAAATTGCGTCATATTAAGGTGATGAATGAGATTGGTTTTATCATTCTTCCAAGCTCTGCCCTTTGCAAGTTTGTTGCGAAGTCCAAGTTAAATTAAAAACCCTTGCATTCCCCTCCAATTAAAAAGGACTCATAAAGCATCTGCTACTATATGTTGACCTAAAGAACTAATGCTTGGAAAGGTGAGCCCTAGCCAGTTTTTAAATGAGCAGTTAAAACTTTTCATTTAAATCTTTTAAAAAGTATACATCGATGGCACAACATTTGAGAGCTCACAAATA
CAGTGGTAAATTTTTAAGAAGCAATTTTTTAAAAAATGAAAACAAGATATAAGTAGCTTTCCAACTGCTGTTTTTTGACCCTGCCAAGGGTAGAGGTGTAAGAGCAATTTTGATTACCTAATTTAATTATCTAACTTCACATTTTGGATTGGAAAATTAAAAAAAAGTTGGCAGTTACCTACACTGGACTTAAGTGACAGTCCAAAAATGGGGTAGCAGTAGAGCCTCTCACCTGAAGGTGAAGATTTATTTGAATGGGAATTTACAGCAGCCAGATATTGTATGGATGGCAACACTTACTTTTCAAAAATAGGTCTGTTCTTACCAATTGTTCTAAGGGCATCCATACTTTAATGATCTGAGGCTCTTATTCACATCTGCTAGAACTTTGGGAAACTCATAACAGCAAGATCATCACAATAAATTATACACACAACATTGTTTGAACTAACTAAAGTCAGACATTATTACACATAACACATTGAGCAAATGCATAACCATTTCCAATAATATGAATTAAAAGCTGCTTCCCTTGCTCAAGTCAATATTGATTGAAGACTCTGATAAAACTGTTGCTCATTTGTTCCATTGCAAGTGCTGTTTTAGGAAGGGCTGCAAATGAAACTAGATAGTTGAAGCAAGTGAAGTATTTAGGTTGGTGAAGACAGCATTAGGTGCATTCAGTGCTCAAGAATGAATAGCATAAAAGGATGATTTCAGGGGCTAGCATTACAGCTCTAGCACTGGATTTACATGTCTGCATCATTTCTACAGTTCTCACAAATTAAGATTTTAAAAATTGTGAACCTGTAAACCAGGCCATGAAAGTTTTTTTCTACTCTTTGAACTCTTTATTGTTCTGTTTTTATTTGTACCTGTTAAAAAGACTGATTTTTGATGTACCATACTGTCCTGGACCATGTAAATATCACCTGATAATGTATTTAGGTTCCACATTACATTAATAATTTTCCCTTTTCCACTCTCCCAACCCTCCTTCCACCACCTCACCTTACAAGTATCACCACCAAGGCACATCTTCTGTTGCAGCTTCCCTTTGCATCGTATTGATCTGACAACCATAATTTGCATCAGATCTGAAAGAGGTCCAGAATAAAATATATTTTGATATTA\n>XR_005699604.1 PREDICTED: Hirundo rustica beta 3-glucosyltransferase (B3GLCT), transcript variant X7, misc_RNA 
\nGGGGAGGATCATGATGGAGGAGGAACCTTGGGGAGCATGAAGGAGGGTCTCATGAAGCAGGATTTCTGGGGAGAGAATCACTGCTGTGAGCTTTTGCTGTAACTGTAATTTCTGAAGGTGCAGAAGATGAGACTGAACTACCAGTGCTGCAGAAGCCTGGAAAAAGTAATACAATTAGTAAAATAGGCAGAGAATTAAAAGGAATTGTATTTGTCATCCAGAGTCAAAGTAATTCTTTTCATTCCAAGAGAGCAGAAGATCTAAAAAGAGATATTTTGAAACAGGCTGTAGATCTTGGAAAGGAATTGCCTACAGTTCTACTTATTCATCAGATCGACAGGCATGAAGGTGCATGGACAATATTGCCGTTAATGACAGACTTCTCTGTTACCTATGGTAGGAACACCTCATGGATTTTCTTCTGTGAAGAAGATACAAGAATACAAGTAGTAAAACTGCTAGAAACACTCAGAAGATTTGACAAGTCTAAGGAGTGGTTTTTAGGTAAAGCATTATATGATGAAGAATCTACAATAATTCACCATTATGCCTTTGCTGAAAATCCTACAGTCTTTAAATTTCCAGATTTTGCTGCTGGTTGGGCACTTAGCATTCCACTTGTTAACAAGCTTGCAAAGAAGCTGAAGAGTGAACCACTCAAATCAGACTTCACAATAGATTTAAAGCATGAGATTGCCCTGTACATTTGGCAGAAAGGGGAAGGACCACATCTTACTCCAGTGCCTGAGTTCTGTACAGATGATGTGAATTTGTATAAGGTTGATCACTGTGCAACAACATTCAGTAATTTTCTGCCACTTTGTGGAGAGCCAGTGAATAAGGAAGATGTTTTTGTTGCTGTAAAAACGTGTCGAAAATTTCATGGTGACAGAACTTCCAGTGTTGTGCAATAGAGGATAATCTTACTCCAGATTTTGAAAGATTAATGGATGGCAGCTTCAGAGAGCTCTTTTTACCTGTACCAGTTGTAAAGCAGACTTGGGAGAGAGAAGCCGCCCTTATTGAATACTACAGTGATTATGCAGACATCTCCATTCCTACTATAGACTTAGGCATCCCTAACACTGACAGAGGTCACTGTGGCAAAACTTTTGCCATTTTGGAAAGGTTTTTGAATCATACTTCTGCCAGAACACCTTGGTTAGTTGTAGTGGATGATGACACACTGATAAGTATATTCAGACTCCGACAATTGCTCAGCTGCTATGACCCAAACGAACCAGTTTTCCTTGGAGAGCGTTACGGCTATGGCTTGGGAACAGGAGGATACAGCTATATCACTGGTGGAGGAGGGATGGTTTTCAGCAGAACAGCTGTTCAGAAACTACTTGCTAGCAAATGCCGGTGTTACAGCACGGATGCACCCGATGATATGGTCCTTGGGATGTGTTTCAGTGGCTTGGGAATCCCTATAACACACAGTCCACTTTTTCATCAGGCGAGGCCAATGGACTACCCAAAAGACTACCTTTCTCACCAAATTCCAATATCATTTCACAAGCATTGGAATATCGATCCAGTGAAGGTGTATTTCACATGGCTGGCACCAAACACAAAAGAGTCACATAACGACAAAAAAGTTGGATACAGCAGAGAGGATTTATAAGCAGTAGAAGAATGTAAGTGTTAATTACGATTTTACAGCTGAGAGACAGACACTACTGACAATTTTGTTTTCACATTGTTCCTCTGTTCATGACATAAAAAGACAGTGTTTTGTTCCTGTTGGTGGAATCCCTTCAGAGCAACGGAAGAAGGCACTTAATGACTTTTGGATTCTTTTCCTCTGCTTGGTTTCTTTTTAGAATGCTTTTGGGTTTTGTATACCAATGAACTTGACTCACATTTAAGAGTCTTGTACAACCTCACCTGTGTTCTGCTTTGGACTTGGTTCAAAAAGCATCGCTCTCTCAAAAGCTGAATTTATGCATTTGGGAGCTTAATACTGAATAAGTGTAGAACATCTATTAAACATCA
TCTCTCACTGACTTACAGAAAGTAGTTCTCTAAGAGGCTCTAGAACAGGTTCTTGATAAATCAGAGGACACTTGACTTTTTTTCCGCGTCCAGGAGCTAGATTGTCGGAAGGCTGTGCTCCTTTATGCTCATTTCAGATAGAAATACTGTAGTTTCCTGGAGTAGCAGGACCAGGCATGAAACCACTGTTGTACCTTTTAAGTTTGTTGGCATTTGTGTGGAATGTCGTGTACAAAATGGAAAAAAAGGTTAAGGACGGGGATTTCTTAGGTGGCCACGGGAGGTCACTGTGGCTCCTTCAGAAACCGGAGTCGGTGTACATCAATTTGGCAAATATAAAAGTGACTCTTAAGGATTTTGGAGAACTAACATTTCAGTATTTCTGATGTGTGCATTTCAATAGCATATGAATGCCAGCTTTAAAAAGTTTTGTAGTATCCCTAATTTGTATCATCAAAATAAGTAAATTGATGCCTACAGCATGTGAAGTGTGATTCTTATTTAAAACGTTCTTGAATTTTTTTTTAGTAATTCAGTTTTGTAAAAATGTTTGTACAAAACCTGGCTTTTAGTATGTTCTAAACTAATTTTTATATTGTAAAACTACTTCTTTTAAAATGATGTTGTATGGCACTTGTATGCTGTTATTTAACTTGGCTTGCTATATTGTAACCAAATACAGGGTCTTAAAGCCATACTGCTGAATTAATTTGTGTTTTGGTTTCTTTCAGTAGGTTAAAAATTGATTCCACTCCAAAGAAAAGCAATATTTCCTCTAGAGTTGAAGTAGGGGGAGCCACTGATTCCTGTCTCTGTAATTACCAAACTTGTATAAACATTTGTTTGCAAATGTAGCTTGTGGGTTTCTAAGCATTGAATAGCAAGCACATATTCATAATAGATTCAAATTCTGATTAATCAAGAGCAATCCATGTTATGTCTCTTTTCTTCCCACTACCAGTGCCTTAAACAGTAGACATTTTACTGATACCAGGACTATGTTCTCTGACACCATTGGTGAACTGTTAATTATGTTTACTGTTTAGAACTGTGAAAGCTGAATAAAAGCCTTCTTTAACCTGT\n>XM_020777834.1 PREDICTED: Pogona vitticeps XK related 6 (XKR6), mRNA 
\nATCCGAACCATGTACCTGGGGATCCAGAGCCAGAGACAAAAGGAACACCAGCGGCGCTTTTACTGGGCTATGATGTACGAATATGCAGACGTCAACATGCTGCGTCTCTTGGAAACTTTCCTCGAGAGCGCCCCCCAATTGGTGCTACAGCTCTGCATAATGATCCAAAAGAACCGTGCAGAAACCTTACCTTGTGTGTCCTCTGTGGCCTCCCTGATGTCCCTGGCTTGGGTGCTAGCGTCCTATCACAAGCTCCTTCGGGACTCTAGGGATGACAAGAAGAGCATGAGCTACAGAGGGGCCCTTATCCATCTCTTCTGGCGCCTCTTCACCATCTCATCCAGAGTTATCTCTTTTGCCCTCTTTGCTTCCATCTTCCAGCTCTACTTTGGGATTTTTGTCGTGGTCCACTGGTGCGCCATGGCCTTCTGGATCATTCATGGCGGGACGGACTTCTGCATGTCCAAATGGGAGGAGATCCTCTTCAACATGGTGGTAGGGATCGTGTACATCTTCTGCTGGTTTAATGTCAAGGAAGGCAGGACCCGATACCGAATGTTTGCCTATTACACCGTAGTCTTGACAGAGAACGCGGCCTTGACTCTCCTCTGGTATTTTTACAGAGATCCCGACACCACTGACTCCTACGCTGTGCCAGCACTTTGTTGCGTCTTTCTTAGCTTCGCCGCCGGGATCGCGCTGATGCTCTTGTATTACGGCATCCTGCATCCCATGGGCCCGAGAGCTAAGATTTTTGCCAGCTCCTGTTGCGCCGAATTGCTCTGGGGCATACCTTTGCCCCCTGACGTTGAACCTATGGATCCTCAAACGCCCGGGTACAGGGCGGACCAAGTAACGCCCACCAGAGTGGTCACGGAGCAACAGGAGGAACTTACTGCTGACACTTGCTTGCCCGTTTTCCAAGTGAGGGCCATGGTGCCATCGACTCCGTTGGGGAGACCTTACCACCCAGAAGGCCCTCTCATTAAAATAGACATCCCAAGAAAGAGGTACCCGGCTTGGGATGCCCATTTTGTAGACAGGAGGTTGAGAAGGACTATAAACATTCTCCAGTACGTCACCCCCACTGCTGTAGGAATTAGATATAGAGACGGACCTCTCTTGTACGAATTGCTACAGTACGAATCTTCACTTTAAAAGCTCCTTTAAACACAAACCCACATACACAGGAAACAAACACACACACATACACACACACACACACACAAAACTCAACACACGGTCACAGGCAAACAAGCAGCAACAACAAAAAAATTAAGAGAGGGGATTTGGGGTGGGGGGTG\n>XM_018564101.1 PREDICTED: Nanorana parkeri transmembrane protein 72 (TMEM72), mRNA 
\nCTGGAGTCATGGAATGTACTGAGGAGGTGAGAACAGCAGCATTAACTGGATGTTTGTGGACAGAGCCTGTTGCTTCACGGTCACATACACTTTGGGATTCTTGTTTTCAAAACACTCAGAAGCACAGCTTTCCACCGCGTGAAAGCTTGTGATGTCTGTGATGCTGAAGGTGGTGTCAGTACAGTGTCATTAGCCAGTAGTTACAATGCAGTGCCAGGCAAGCTGGGTGGTATTAGAAGGCATCTGTAGATTCCTGGGGGTGTGTACAGCTGCAGTGCTAATTGGTGTTGGGATTGAAACTCTGCAAAAGGGACAATTTCCAAGTCTGGCCTATTATTTACTGTTTTCATCAGCAGCCGTGTCATTCTGTGAAGGTGTTTTCTTCATACACATGTTTCTCATGCACTGTATAAGATGGCAGTCAGAACCCCGTCTGTATGTATGCTTACGGAAAACAGCACGAATGGGAGGATTTCAGAAGTTCCTTGGGTATGGCATACTGTCAGTGGCCTGCTTCCTTCACCCAGTACTGGTCTGGCATGTCACAATTCCAGGAACCATGTTAATTGTTACTGGGATTGCCTATCTTTTTTTGAGTAAACGAAAGAAGACTAAGAGCAAGGATTGCGTTTTGCAGGCTGAATATTACACAGACCCATCTACCACAGCCATTGCTATGACCAGAGCTGGAGACACAGAGCAAACTTACACTTTCAATGACTCCCTGCGCCAGAAGAGAGAATCTCTACTCACCCATATGAGAAGCATCCTCAAAGTAAAGAAGGACCGCCAACCATCTAAGAAAGACCAAGGTCGCATGGATGCTTCTATAGACTTATGTGCTAAAAAGAAACAGGTTCACTTTGAGGAAAAGGTTATTAAAATCATCCCCTTGGAGGAAGGCATTCTTGAAGACCAGGACAGTGAGTTGGAGGTGACAATTTCAGATACTATTCCCATCATACCCAGTGAGCCCAAACAGGTTTTGAACACCACACCCATGACATCTGGCATTTTTTAAAGG\n>XM_025751866.1 PREDICTED: Arachis hypogaea uncharacterized LOC112701064 (LOC112701064), mRNA 
\nATGGCAGATTTTCTAGTAGAAGTAACGGGGAATCCGACCGAAGAAACAAGCACACGGTGGAAGCTCCACGTGGACGGAGCCTCCAACCAGACGTCCGGGGGTGCCGGGATCATCCTGGAAAGCCCGGTTGGAGTCGTATACGAGCAGTCGATCAGGTTCAAATTCCCCATTTCAAACAACCAGGCAGAATATGAAACCCTTATAGGGGGCTTAACCATAGCAGCGGAAGTCGGAGCAACAAGGCTGAAAATATGCAGCGATTCCCAGGTCGTCACCTCCCAGGTCACGGTCCACCACGTGCCAAGAGAAAGGAACACACGGGCAGACCTTCTATCAAAATTGGCCAGCACTAAACCGGGAGAAGGCAACCGATCTCTCATCCAAGGTATGATGAAGGAGCCGGCGGTCACCTTGCATTTGTCAAGGCTGGGCTCTTCATGGCTAGACCCCATCACCAGCTTCCTAGAAAATGGCAAACTCCCTGACAATGAAAAGGACTCCGTGAAACTGAGAAGGGAAGCAGCTAAATATGCAGTCATTCAAGGACAGCTATTCAAGAAAGGGTTCAACCAGCCCCTACTGAAGTGCTTACACCCCGACCAAACGGACTACGTCCTCAGGGAAGTCCATGAAGGCTGCTGCGGACACCACATAGGAGGCAAAGCCCTAGCAAGAAAATTAATTCGAGCCGGATACTATTGGCCGTCAATGATGGCAGACTCCAAGGAGTTCGTCAAAAAATGTGTCAAGTGTCAAGAGAACGCCAATTTCCACAGGGCGCCGGCCTCCGAGTTAAGCCTGTTAACGTCCTCCCGACCATTCTCCCAATGGGGAGTCAATCTCTTGGGGCCCTTCCCAGTGATAACGCGATTCGCGATTCCAGAAGTTGTCATCTCGGACAACGGCACACAGTTTACCGACAAGAAGTTCACGGAATTCCTCACCGGCCTAGGCATAAGACAGAAGTTCTCCTCGGTAGAGCACCCCCAAACAAACGGACAAGTGGAGTCCGCGAACAAGATTATCCTGATAGGGCTCAAGAAGCGATTGGATAATAAAAAGGGTGCTTGGGCCGACGAGCTAGCCTCGGTGCTCTGGTCTTATCGAACAACTGAACAGTCCTCCACCAAGGAAATTCCTTTCCGACTAACATACGGATTAGACGCGGTAATACCCGTGGAAATTGGGGAACCGAGCCCCCGGCTACTTTTGAAAGGAGTAGAGGAAGCCGTGGAGAAGGACCTAATAGATGAAGCCAGAGAAATGGCCCATTTGACGGAGACATCGCTAAAACAAAGAATGGCCCTACGCTACAACACCAAAGTGCTCAAAATAGAATTCGAGCCGAACGATCTCGTCCTAAGGCGTAACGACATCGGCCCACCGACCCCAGGAACAGGCAAGATGGCGGCAAACTGGGAAGGCCCCTATAGAATAAAAAAAGTGATGGGCAAAGGCGCTTTTAAGTTAGAAAGGCTCGATGGCAAGGAAGTCCCAAGAACATGGAACGCGAACAACTTGAGAAGATTCTACTCCTAG\n>EU583709.1 Uncultured Tulasnellaceae isolate S2.12h internal transcribed spacer 1, partial sequence; 5.8S ribosomal RNA gene, complete sequence; and internal transcribed spacer 2, partial sequence 
\nAACGTCTTGTAATAAATAACGTACAACTATCAACAACGGATCTCTTGGCATCCCACTCGATGAAGGACGCAGCGAATTGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACCTTGCACCTTTTGGTATTCCGAAAGGTATGCCCGGTTGAGTATTATGAACATCTCAATCCTCTGGCTTCTGATCGCAAAGGTCGCACGTTCGGCGAAGTCGTCTGTCGGGACGACGGTAGCTGAAGTGCGACTTGGAAGCCTGTTGGACTTGGACTTGAGCGACACGTCGGTCCTCCACGATCGACCCGCTTGAAATGTATTAGCTGGCGACCCGCCTTACGGTTCCACTCGGCGTAGTAAGTTCTATTCGTCGAGGACGCCTCTTTCGAGGTGGCCGAAAAGCGCGCGATTGAAGCCGCTTCCAGTCGTCTTTGGATGCTTTGAATCTTTAATCTCCACCC\n>KC809930.1 Bacillus sp. EK-CH-I9 16S ribosomal RNA gene, partial sequence \nAGCGGACAGATGGGAGCTTGCTCCCTGAAGTCAGCGGCGGACGGGTGAGTAACACGTGGGCAACCTGCCTGTAAGACTGGGATAACTCCGGGAAACCGGGGCTAATACCGGATAATTCTTTCCCTCACATGAGGGAAAGCTGAAAGATGGTTTCGGCTATCACTTACAGATGGGCCCGCGGCGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGANACNCGGCCCANACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCANCGCCGCGNGAGTGATGAAGGTTTTCGGATCGTAAAACTCTGTTGTTAGGGAAGAACAAGTACCGGAGTAACTGCCGGTACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCANCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTTCCTTAAGTCTGATGTGAAAGCCCCCGGCTCANCCGGGGAGGGTCATTGGAAACTGGGGAACTTGAGTGCAGAANAGAAGAGTGGAATTCCACG\n>XM_041467909.1 PREDICTED: Pyrgilauda ruficollis lysosomal associated membrane protein 3 (LAMP3), mRNA 
\nCTCGGCTCGCTCCGCAGCGGCTCCCGGGGAGAAGCAGAGCCCGCAGCCCGCTGGCCATGGGGAGGAGCGCACGGCAGCTCATCTCGCTGACCCTCGCCTGTGCATTTTCCTCCTGCTTTGCTGAAGTGGCCCTGGGGGTCGAACTGTCTCCAGAAACCACATCCTTCCACCAAATGGCTACTTCTGCTCAGCCACTTTCCCTTTATCATTCTTCACCCCATCAAAGCACTGCAGTTCATTTTACCAGCACAGGCTCTCTTCAAACAACACCCATGGGCCACAGAACAGCTGAGCAGACAACGGAGCAGCTCAAGACAACATCAGCCGCAGGCCAGCACACGGCAGCCCAGGCAGGAGCAGGCACTGTACCCACAGCCCCTGCAGACAGCCCCAGCCCCGGCCGGGCCACCACCCCGGCGATGCCCTCGCTTACAGCGGTGGTCAAGAACACAACCACTGCCCCTGTGTCCTCCACCAGGCATGGCAAGGGACCACGTGTGACCACAGGAACTGTGGCAGTGGCCACCAACACCTCCCTGAAGCACGAGACAGCGAGTACCCCGGGGGCAGCTGCCACCTCCGCCTCGGCAGCCCCCAGCACGCCGAGGGCCGGGCCCAGCACGCGGTCACGGAGACAAACAGCAGCCACTGGTGCTCCAACAGCCACGGCCGTGACCAACACAACAGGCACCCATGCAGGGACACAAACAGCCCCCACATCCCCTGCCAGCACAGTGAGACCCCGTCCCACCCCACAGCCCTCTGCCATCCCCACAGGCACCTACACCGTTTCTGATGGCAACAGGACCTGCGTCAAAGCCGTCATGGGTCTGCAGCTGATGGCCCGAAATACCCAACAGGAGCAGATGGAATATGTGACTGTTAACCCAAATGCGACAAAGATATCTGGAAGCTGTGGGATGGTGCAGTCTGAGCTGAACTTAACTTTTAGTGGAGGATTTGTAAACATCAACTTTGTAAAGCAAGCTCCAAGTTACTCTGTGACTAAAATTGAGAGCAGAATACTGTTATCTTCTGAAGGTATGCTTTACTATGCAGCCCTAAATGAGAAGCTGTTCACAACAAAGCTGGGGAATTCCTTTAAGTGTGCCAGCAGGCAAACCTTCCCCTTGGAGAAGAACTTCCAGATCCTCTTTGTTCATATGCAGCTGCAGGCGTTTGACATTGTGGGTAACCAGTTTGGAAAAGAAGAAGAATGTTTTCTTGATAGAAACGGCAGAGTAGCTCCCATTGCAGTGTGCCTGTGTATCCTGGGATTGTTTGTCATTGTGTTTGCCACCTTCCTGATCTCCAGGAGGAAGCCACAGAGAGGATATGAACGCATCTGAGGTGCCCCTATGCTTCCAAGTGTGTGCAGCAAGCAGAGAAGTCACAGGAGTTTTTGCTTCTGCCTGGCAATCTCTCTGCCCTGAAGCCACATTTTTAAGTGAGATGACACTGTGTGTTTACAGCTAATGAATGTTTCTGGAAGGAGTTCTTTTAAGGTGGGAAGGAGAGAACTCACACCTTCTGCTTTAAGCTATTCTTAGCATCTAATTTAGATGTAGTCCAGAATGAGGAGCCTAAATTCTCTCTGTTGTCAACAAAGGAGGTCATTCAGATCACTTAAGCCAGATTCCTAAAAATAGCTTAAAGCAAGCAGTATCACTATCTCCCAGAAAATGCATCAGGTTTGTTAATGATGGTGTTCAGATTTATCAAAAGACATAAGTCTGACCTTCAGGTGAAAAAACCTCAGGCCCACAGCTACAGACAACCCTGCTAAGTGAGAGCTCACTGAAAGCTTTT\n>XM_023176141.1 PREDICTED: Drosophila willistoni uncharacterized LOC6643128 (LOC6643128), transcript variant X4, mRNA 
\nTTCATTCACTATGTCCAAGGGACTTTTGGGCCTTTGGCTTCTGCTGGCAGTGCTAAATAGGCTACAGTGTTCGAATGCTTATCAATCTGGTGGCAGCTATTATGATGCTGGCCAGTCCGGGTTATCAGCATCAACGCAATCATCTTATGGCGGCAGTGCCAGAATTCAAGAGCAGCCCATCTATGAGCGCGAATCGGCTTGTCCAGCGGGTTTTACGGGTCTAAAGCCATATCCTCATGATTGCCATCGATTCGTCAATTGTTTCAATGGACGTCCAACCATTCAGACCTGTGCACCGGGCACTCTATTCGACGCCAGAAACTTGCAATGTGATTCACCCAGCAAGGTATCCTGTAACGGAGACATTGCTGAAGCAGCTGCAGCAGCAGTGAATTCCAATCAATCCAGTCGTTCGGCTCGTTTGAGACAAATCAACACTGAACCCAAGTGTCCAGCTGGTGTTAATGGATTGCATCCGCATCCTTTTGATTGCACCAAGTTCCTCAATTGTGCCAATGGTCAAACTTTTGTGCAGAGTTGCGGACCAGGCACAGCATTTAGTGCATCTCTTCTGATCTGTGACTACAAGAACAAGGTGGATTGTGGAGCTGGTATCAGTGGTGGTGTTGCTGCATCAGAGGCCTACGAGAGTCGTCAATCGAAAGCCTACAATGAAGGCAGGGGGGAAAGTGCCGGTGGTAATCGTTGGAGCTCCATGAATATGCAGCGTCCAGCTGGCATTGGCTTCACAAATTACCATCAGCAGCAGCAGCAGCAGCAGGTTGGACAAGTGAATCAGCAATATGGCGGCGAAGCAGGAGGCTGGTCTGGTCATGGCACCTCTTTTACCCATCGTATACCCACACAGAGTGTGCTCTATGTGGAAGGATCCCTACAGCCGAATCGTAATTATCCCAGTTATAAGACTCCATTGGCACCCATGGCTCCTGCCTCTACAGATCATGTGTATTACGCTAATCCAGTTGTGGAAGAGGTCGAAGAGGAGGAGGAGGATCAGCAGCAGCAGCACCATAACCACCACCACCACCAACAACCACAACCACATCAGTCACACTACTCACCCAATAGTTTGTCACGTCAAGACTTTAGTAGAGATTTGGTTGGAGCTGGCCAACAATATCCCAATCATGACTTGCCACCATTGGCTCCTTTAGGCGGACAGCAACCTCTTGATTTAGATTATACACCAGATGCTGGACAGCAATCAGTTGACCTAGACCAAAATCTCACGCCACACAGTCCATCACATGACCAGTTTCCCAGTGAAACACATCAGGAACCTGTAGATTTATATGACCCGCCCGTTAAGGGTTTCCCTACGCCATCCTCTCCGTTGCCTCACCAACCAGTTATAGACGAGTCAAATTTGTATGGAGGCTTGCAACCTCCACCACCACCAGCACCAACTCCAGCAGCACAACCTTCTACCCCATCCACAACACGTTTGCCTACAAATCTTCGTACATTTCCCATCTATCCACCCATGGCCAATGTTAGCTCACCGAAAGAGGTCAGGCCACCACATTATAGTCCTGGCTATGCAGCTGTAGCTCATTCCCATAATACATCTTGGCAAAAGATTCCGCCGCCAACTACTACACCAAAAGCTCATGATCCTTTCATTCCTTCCGAGGATATCGATGATAATTTGGATGAGTTTGGAGAGAGCACAACTAAGAGGCATGATCTTAGTCCGCCTCCTTTTGATCATAAATTTTACAATCCCACATTAAATTCTAGAGCTGCTAAAGCAGATTCCAATTCCGATCCTTCAAATGATCAACGGATTTTCGGTGAGGCTTTGCGTCTAATGCTGCGTCCCTATTTCAATCACAGTGGCAATGCCCCGGAGATTTTAGCCAAACAAACTGAATCAGCCATAGCTACGGTGATAAGCAAGCCACCTACCTCTAGAACTATTGCATCCACATCCACAACAACCACTCCCAGAAATTCCATACGACCCGACGATGATGT
TGAACTCATTGTGGCCGGCGAGCAGGAAAGCCTGGACATTGAAACGAACGAATCTGACAGCGACTCTGACTCTGTTGTTCCAGATGCTGAGGAAACGACACACACTGAGCAGACCATAAATCCTACAACCTATGCTTTTGGTGATACACAAAATGATTTTCATCGTGGCACACGCAAGGTGGACATCGATTCAATGACGACCACAACCACCACATCCAGCACAACTACCGCCACAAACAACAAAAACAACAACAACAACAATTGGCATACGCCGCACAATCGTGATTTTCATAGGCGTCATCCAAATTTGCCCGATCCATTTGAGAAGCCGCATTCTCACCATCAGCATCAGCACCACAACAATCACCATTACCATAGTCCCCTCTATCATAGCCAGCATCCCGAATTGCTCAATCCCTTTCGGCAAAATCCCGAACAGAATAGTCCTGACACGACGACTCCTGACATAGTTCATCATCAGCATCATCACCCCGATCAACGTTTGCCCAAATCTTTTGACTCGCCAAAAGATCAAGATGAGGATGAGGATGAGGAATATCTACCCAATCCTAACGCTGAGGAAACAACACCTAAATCTCAATATCAGATATCCATGCGTAGTAATTTCCAGGATAATGACTGCGAATTCGATTGCGGCAATGGCAAGTGCATTAAACAAAAGGAAGTGTGCAACGGAGTGAATAACTGTGGCCCGAATCGCCGGGACGAGAGCCAGTGTCAACATTTGGGCTATCAGGTGCGGTTAACTGGCGGCGAGAACTCTCACATGGGACGCGTTGAAGTTAAGGTCAACGGTCAATGGGGTTACGTGTGTGATGACAAGTTTGGTTTACGGGATGCCGATGTTGTTTGCCGCGAATTGGGCTATAAAATGGGCGCACAAGAAGTGCGTGGCAATTCGTATTATGCCCCACCTGATCGCAACTTCAACTATATGATGGACAAAGTGGAGTGCCAGGGTAATGAGACAATGCTCAAGGATTGCCAATTCAAGGGCTGGGGCATTCACAATTGCGGTGTCGATGAAGTCGTAGGAGTAGTCTGCAAAGTTCCCGTGCTCAAGTGCCCGAACAACTATTGGCTGTGTCACACCTCTAAGGAATGCATCCCACCAGCCTTTGTATGCGATCATACAGAGGATTGTGCCGATAAATCGGACGAGAGTGAAGCAGTTTGTAAGGCTCCCATTGAGTATCGTTTGGAGGGTGGACGCAATCCAAGTGAAGGTCGCCTGGAGGTGAAGTACCATGGTGTCTGGGGTAGTGTTTGTGATGACGATTTCAGTGCAAAGTCAGCGCAAATTGCCTGCAATTCTTTGGGATACTATGGATCAGCCAAAATCGAGAAAAATATCTTTGGTCCTGCAAGTGGACCCATTTGGCTGGATGAGGTCATGTGTCATGGCAATGAAAGTAGCATCGATAAATGCAGTCACTGGAATTGGGGCGAACATAATTGCAATCATACTGAAGATGTAAGTTTACGTTGTACAGCTGGGCCACCACCAACCCGGCAGCAGCGTCAGCAGAGTGTTCGCCTTCACTCAGTGGGTGGTGGCAGCCACAACATCAAGGGAAGCCCATCCGGGCAAATTAGTCATCCCGCCTTTACTTTATCGGACATTGGACTGTGGGAACGTTCCAGCAAGGCTCTACATACGCCACGCCGTTGCGGCATCTTCAAAGATGATCTAACCGATGAGTATGCCCATCCTGAGGAGCGTGTGATTAAGGGTAATATAGCGCGTCGCGGCCGACATCCTTGGCAGGCCACCATACGTACCCGTGGTCGTGGCGGCATCTCAAGTCATTGGTGCGGCGCTGTTGTCATCTCTAAGCGTCATCTTCTGACTGCTGCCCATTGCCTGTACGGTCATCCAAAGGGATCCTACTTTGTGCGTGTCGGTGATCATTATGCCAATATTGCTGAATCCTCTGAAGTGGATTCGTTCATTGAGAACTGGTATACACATGAGAAAT
TCCGCGATGGTTCACACATGAACAATGACATTGCAGTGATTGTGCTTAAAACTCCGCTTAAATTTAGTGACTATGTCCAGCCAATTTGCTTACCAGAAAAGAATGTGCCTCTTGGCGAGAATCGAACCTGCACCATATCAGGTTGGGGCTCCATTAAGTCCGGTTTGTCCACTCCATCCCAGATTCTTAGATCAGCTCAGTTGCCCATTTTATCTGATGCCACTTGCAAACGCTCAAATGTCTATGGCGATGCAATGACCGATGGAATGTTCTGTGCCGGCTCCATGGATGAGAGTGTAGACGCATGTGAGGGCGATTCTGGTGGTCCACTTGTCTGCTCTGATGAAGATGGCGAAACTCTATATGGCATTATATCATGGGGACAGCATTGCGGTTATCAGAATAGACCGGGAGTTTATGTACGGGTTTGTCACTATATTGACTGGATCTATGAGAAAATCAATCACAGCTTGACGAAATTCTAAAAATCACATTTCGGATTTTTCAAAAAACATTTAGAATTTAGGACTATGAACAAGAATAAAGTCAATTTGCTTAAAATATA\n>XM_044890485.1 PREDICTED: Coccinella septempunctata spastin (LOC123307970), transcript variant X2, mRNA \nCCAGAAGAGGTCCTGTTACAAGTGTTCTGTGCTTGTTACTCTTTGGTCCTACGCTGACATAACACGTCGTTTTCCATTATTTTTTTAAGGATGAATACGAGTTCAATAAACTGAACATTGACTTAAAATGTATATTTGAATTTAGCTCCTTAATGGTTCGAAAAACACAAAGTGGAAAATCCCCTAAAAAATCTAGAAAAGTTGACCCTGAATCAGATAAAGATGTTATGTATATGACTTATGGGGACTCGTCTGTTCATAAAAGGAATCTGTGTATTGTTTCGTTTCCCATTATTTTTCTTTTCAGTATATTGAGAGCATTATTGTACCAAATTTTCGTTATACTTCGATTTCTCTACTGTCGTTCGTCGAGCTATTTAATTAAGCCACGTAAATTGCAGAATGGAAATATAGAAAGTAGTTGTGCTATTGAAGAAATTCAAATGTCACATAATATACAAAAAAATTCAGGTCCTGGTCCAGGGGACCCTCTGCTAGCCAAGCAGAAACATCATCATAGAAGAGCATTTGAGTATATTTCTAGAGCCCTTAAAATAGATGAAGAAAATGAAGGTCAAAAAGAAACTGCCATCGAATTATATAAGAAAGGAATTACAGAACTCGAATTGGGTATTGCGGTACACTGCTGGGGAGGAAGAGGTGAAGTTTGGGAAAGGGCTCAAAGACTCCATGAAAAAATGAAAACTAATTTGTCCATGGCAAAAGATAGACTCCAATTTTTAGCATCTGGGAAGAAATTAACTGTAGCTACTAGAAGACCTGGTAATTCACCTTTGTCTAAAAGCCAGACATTGCCAAGATCAATGGGTTCCCGCACAACACCTGTACAGCCAGTTCGTCCTTTTAATAAGCCAACACAGACTCCACCTGCAATTAAGAAGCAGTTATCTGTTCCTGGAAGTGGATCTCCAGCCAGAAAATTCTTAGCTAGTCAAGGTACCAGTAAGCAAACTTGTCGAGGCAAGTCTCCATCTCAACTGAAAGGAGTAGATCCAAAATTGGCTCAAAGTATTTTGGATGAAATAGTGGAAGGAGGTCCAGCTGTTCAATGGGATGACATAGTGGGTCAAGAAACTGCCAAGCAAGCTCTTCAGGAAATGGTTATTTTACCCTCCCTTCGTCCAGAACTCTTTACAGGACTGAGAACACCCGCAAGGGGGTTACTTCTGTTTGGGCCCCCTGGAAATGGCAAGACTTTATTAGCAAGAGCGGTAGCAACAGAATGTCAAGCAACATTCTTCTCAATAAGTGCCGCAAGTTTAACATCAAAATATGTTGGTGATGGAGAAAAAATGGTTAGAGCGT
TATTTGTTATTGCAAGGGAGTTGCAGCCTTCAATAATTTTCATTGATGAAGTTGATTCTTTGCTTTCTGAACGCACCAATAATGAACATGAAGCAAGCAGAAGGTTGAAAACAGAATTCCTTGTTGAGTTTGATGGATTACCATCTAACCAAGAAAGTGAGAAGGTTCTTGTGATGGCCGCAACTAATCGACCTCAAGAACTAGATGAAGCAGCTCTTCGTCGATTTCCCAAAAGGGTTTACGTTACACTACCTGACATGGAAACTAGAATGGAGCTATTAAGAAAATTATTGGCTAAACAAGGTTGTTCTTTTACTCAACAAGAGTTGAAAAGGTTGGCTACACTAACAGAAGGATACTCTGGAAGTGATCTCACTGCACTTGCTAAAGATGCTGCTCTGGGACCTATACGAGAATTGCAACCTGAACAAGTGAAACAGATGGATCCAAGTGCAGTCAGAAGTCTTACGATGAACGACTTCCTGGAATCTTTGAAGCGTATAAGAAAAAGTGTTTCACCTCATAGTTTAGTGGCTTATGAAAAATGGTCATTGCAGTATGGAGATGTCTCTATTTAGAAGTAATACTTTGGTACATTTCAAACTTGTCTTTTATATTATTTGGTCTTGTTTTTTATACTTTGTCTGTGATAATTGATGTAATTGTAAGTGTTTATCATTGCTGCCAAGGATGAGTTTTGAAGGTTATATGGTTTATTCGATACTAAATTATATTCATAGCGATACAACTATGCAAACTGGATATTTTATGTTTGTTAGCTTCTTTAACTATTGAAGCAATACTTGCTATTAATAATTGAATTTCATTACGCTTTTTATTGCTATTATGTAGACTTAGTATCATGGACATTAATATATTCACTTATAACTTACAAAA\n>XM_040825979.1 Metarhizium album ARSEF 1941 uncharacterized protein (MAM_07181), partial mRNA \nATGTCGCCACGGCCGGCCCGGACGGAACATCATTTAAACGTCGACAAGCCCAGCATCCGAGCTTCGCCTCTTCCGCTTCACACCAAACCCCTCTTCCAACGAGAGGTTCGAGCACAGCCCAGCATGGCACTCCCCAAAGTCCCGACCGCGACCGGCTTGCTGCGGCACAGCACACGCCCGGCGGCCTCGCGGGCCAGCCTGCCTCAGCTTCGACGCAAGGTGACACGAGGTGACGGCGATCTCGGCGGCCCGGGCGGACAGCAGCCCCCGCCGCCCAATCCAGGCGGTCCCGAAGCCGTCAAGAGAAACTGGGTGCCCATCGGCGGCGCGGCTCTCGCTGCTGTCGCAGCGTACGCGTATCTCACCACCCCCAAGGTGGATGTGGACAGGGCCAAGCAGACAGACGCCAGGAACCCGAGCCAGGCGGAATTGCGCGACCTGGCGGCCGGTAGCCAGGCGGCGGAGGAGGTTGTCCAGCAAGTTGCCGACCAGGCGACCAAGACGATGAAGGAGATGAGCGGCAGACGCAAGACGGACCAGGGCAGTTTCCGACACGATTGA\n>XM_034374830.1 PREDICTED: Thrips palmi deubiquitinase DESI2 (LOC117639294), mRNA 
\nACACACCGTACAGTGCAGTGCGTCTGCGCGCGCGCTCGAGGGGTGGTGTTGTGTTGAATGAATGTTGACCTGTGTCCAAAATCTTTTGTTGTCGTCAGCATTTTAACTTTTCGCTTTGTTCAAAGAACCGTTTAGGCTTTAGTTTAGGACTTTGGACATCTAAGCCTGTATCTGACTCTTCGTTTGTCGCATGTGTTATCAGCAGGGTTTTCAGCAAGAAGATGTCGTCAGAGCCAGTTATTCTCAATGTTTATGATATGTACTGGACCAATGAGTATACTACTCCTATAGGATTAGGAGTATTCCACTCTGGTATACAAATATATGGCATGGAATATGCTTACGGAGGCCATCCCTATACCTTTTCCGGTGTGTTTGCAATTGCTCCACGTGATGCAGAAGAATTAGGAGACCAATTCCAGTACAGGCAATCAGTTCATGTTGGGTACACAGACTTTACTGAAAAAGAAGTAAAAAAAATAATTCAAGAACTGGGAAAAGACTTCCGTGGGGATCGTTATCATCTTATGAATAAAAACTGTAATCATTTCTCTGGGGCATTAAGTCAGATTCTCTGTGGCCGCGACATTCCCTCATGGGTCAATAGACTGGCATACTTTAGTTCTTGTGTGCCTTTTCTTCAACGGTGCTTGCCGAGAGAATGGCTGACTCCGGCAGCCTTCCAGCAATATAGCACACCAAATGCCCTGCAGCACACACTTAGTGCACGTGATAACAGTCCTGATGGTCCTTCCTCATAACATGAGGCTGCTGGGGCGGATCATGAAACACATCCTCTCTATGAAGATGACACTCAGTCCGTCTCCCAGCTTCCCTTGCTGTACACCCATGATCAGCCAAGTTCATGGCTGGGCAACCCCAAAGAACCACTGCCGTCCAGCTCTAACGTCAGTGATGAAGATTGAATGTACTTCTGTGTTATGCTTAAGTGGGTAACAGGAATGTTCAACATATATTTCTGTGTTATATTAAGTGAAGATGTGATTGGGTTATGAAAAGAGTGCTTCCAGAGGAGTACAAGAAGCACAACATTAAAAACTTTCAAAAACTTGAATCAAAACTTTCCTGTAAGTCATTTGTATAGTATTAAGCCTGTTGTCTCACATTTTTATTCTATTTTCCTGTTTGGTTTGAATGTTTTTAAAGCTTGTGTGGGACTCCTTCGGAAAAAGTGTTTGTGCATGAAGTCTACTATGACCTGATTCCCTTTTTTCTCTGAACCCTGAAATATTATTGGTTAATGGTGAAGCAAGTATTTCCCTGCAAAAATAAAAATTACTTGTTATCTTGTTGTAAGAAATTCTGCACTCTTGTGCAGTTAAGTTTTAAGAAACGATCATTCATCTTATATGGCCCTGTTTTATCATACCTTTGTTGATAACTCCCCCTTTATTACATAACAAAACAATTTTCCTTATGGTTTCTTTCATAAAAAGTGATCAATTTTTTTTTTATAATGTTATACCATGGTGCTTTTTGAAACTGTTGGGAAGATATCTTTGGGATTTTTCCAGACTCTAGGTATCTGATGTCATCATAACTCTTGTTTGACATTCTGTAGAAATATTTCAATTGATGTATCAGCATGTTGTCACTATTTGTATTTGTCAGGAGATGTGTTAATGCTTACTACGTATGAAATTTAGTGTTGTTGAGTCTTTGCTGGCCGCTTTTTATGTGCCACTGTAAAATTATTGCCTTATCCTAGGAATTAAAATTTGCTCTTCAAATTTGACCTCAGATCTCAATTTTTCTTGCCACTTCCTTTTTTAAAAAATTCAAAGTTCACATTTACTATGTCAGTGATTCCTCCCTGTGAAGAGGAATGCTTTGGTTTGAGTCTGTAGTTCTCTCAAATATTTGTATGTATTTAAGTTATTCATGAATCATCATAGCGTGACAGGTGACATTTTGAGACAAGCATTACTGTAGACTCCTTTGAGAGAACCGACTGCTTTTTTATTATTCAATAATCTG
AGTGCGAATGAAATAAACCTTGCCTCTGTCTATGAATGAACAAACAGTTATAATTCCACATTACTTGAAGTTTTTGTGATTCTGTATATTTGGTGCTTTATAATCACTAGTTACTTACTGTACAATTGGATTTGATACGGAGGTGGCTATGCCTTGCCTAACTTTGTGTTTCAACATTTTTTGTAAAAAAAATTTGCAATATCAGCACAGTACGTTTGTATTTACTTTACAGGTACAATGTACATAATGTGAATTGTTCTTGTCATGGATCCTTGTATAACTAGTGGCAACCTGAATGTAGAAGGCATAACTGAAGGCAGAGTTCAAGTTTCCAGAATTAAAGTGTTGTATTCAGAGCCAAAAA\n>KC066956.1 Uncultured bacterium clone G4RKN2Y13H4BNZ 16S ribosomal RNA gene, partial sequence \nTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGTCGTGAGGAAGGTGTTAAGGTTAATAACCTTAGCAATTGACGTTAGCGACAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGGGCACGCAGGCGGTTAATTAGTTGGATGTGAAATCCCCGGGCTTAACCTGGGAATGGCATTCAAGACTGGTTAGCTAGAGTCTTGTAGAGGGGGTAGAATTCCATGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAATACCGGTGGCGAAGGCGGCCCCTGGACAAAGCTGACGCTCATGTGCGAAAGCGTGGGGAGCAAACGAGGGATTAGATA\n>HQ143338.1 Uncultured bacterium clone 19-239BM 16S ribosomal RNA gene, partial sequence \nGCCGTGAAAGTCCGAGGCTCAACCTCGGATCTGCGGTGGGTACGGGCAGACTAGAGTGATGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCAGGTCTCTGGGCATTTACTGACGCTGAGGAGCGAAAGCATGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGTTGGGCACTAGGTGTGGGGGACATTCCACGTTTTCCGCGCCGTAGCTAACGCATTAAGTGCCCCCCCTGGGGAGTACGCCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGCGGAGCATGCGGATTAATTCGATGCAACGCGAAGAACCTTACCAAGGCTTGACATGTGCCAGACCGCCTCAGAGATGGGGTTTCCCTTCGGGGCTGGTTCACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGTTCCATGTTGCCAGCACGTAGTGGTGGGGACTCATGGGAGACTGCCGGGGTCAACTCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGTCTTGGGCTTCACGCATGCTACAATGGCCGGTACAATGGGTTGCGATACTGTGAGGTGGAGCTAATCCCTAAAAGCCGGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCCCATGAAGTCGGAGTCGCTAGTAATCGCAGATCAGCAACGCTGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCAAGTCACGAAAGTTGGTAACACCCAAAGCCGATGGCCTAACCACCTTGTGTGGGGGGAGTCGTCGAAGGTGGGACTGGCGATTGGGACTAAGTCGTAACAAGGTAGCCGTA\n>KT815871.1 Uncultured eukaryote clone 41c_79369 18S ribosomal RNA 
gene, partial sequence \nCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATTTCTGTTGAGAGCAGCCGGTCCACCTTTTGGGTGAGTATCTGGATTGGTCTCGGCATCCTCACAACGAATGTTTCTGCGCTTGATTGCGTGGTATAGGCGTTGTGACTTTTACTTTGAGGAAATTAGAGTGTTTCAAGCAGGCGCACGCCTTGAATACATTAGCATGGAATAATAAGATAGGACCTCGGTTCTATTTTGTTGGTTTCTAGAGCTGAGGTAATGATTAATAGGGATAGTTGGGGGCATTCGTATTTAACTGTCAGAGGTGAAATTCTTGGATTTGTTAAGACGGACGTACTGCGAAAGACATTTGTCCAACGGAAGTGTTTTCTATTGTATCAAGAACGAAAGTTAAGGGGTAGTCGAAGATGATTAG\n>XM_033019624.1 PREDICTED: Amblyraja radiata GREB1 like retinoic acid receptor coactivator (greb1l), transcript variant X1, mRNA \nGCGGAATCTAACGCCACATGCGTGAAGGGAAAATACTGCAGGCGGGAGCTGCGACACCGTGCCTTTGATCGTGCTGGTTGCTAATGGGGTCGCTCGCTACATTTGTATTGAGCGCGGTCGATGTCATTTTCTTTCCTCCAATTTCTTTGTGCTTGGACCTTGAGTGGAAGCTAGGTTACTGCAGGACAAGCGTTGAATGTGGAGAGATTTGTGTTTCTTCCATGGCCGGAATAAACTGATTTATACCGACGCCAAATTTAATGTCCTTAATTTGAGTGTGGACCAGTTTATTTTTCATCTTTGGTTATTGCACGTCTGCGAGACAATTGAGCCATTGTTTCTATCATTGAGAGGATTGCTGACCACACAAACTCCGGCATCATTTTACCTCTTGTCAGATAAAAATGAATGCATTTCCAGAAGGGTAACTGACAGAAAGGAGACCATGGGAAATTCATATGCTGGGCAATTGAAATCTGCGCGTTTTGAAGAGGCTCTTCACAATTCAATCGAAGCATCACTTCGTTCCAACAGTATTTCTCCTCAACCAATTTTCTCTCAGCTTTACCTTGAATCCGATAAACCACCTCTGTCCCCTCAAGATGTCAAACCAAAGATAGAGGAACTTAATAAAGAAATTGAAGTGCATCGTTATACGCAGAGTAGCTCTTCTGGATTCCCAGCTATACAAGTTGGCAATGGACTGGATAATGAGGAGGAGGAGGAAGAAGAGGAAATGTCTGAGTCAAACAGCCCACCTATTGCCTACATGCAGAAACATGTTCCAGAGGGATCCTGCACTACTGATGGTTATTGCCAGGCTGGCAAGGACTTGCGCTTGGTATCACTCTCTGCAGAACAAATTGACATTCCACCAGGCTTTGTGTTGGTGGGAGCCAAATCTCCAAATCTTCCTGAGCACATTCTGATCTGTGCAGTTGATAAGCGGTTCCTGCCAGATGACAATGGAAAGAATGCACTTTTAGGTTTCTCGGGAAACTGCATAGGCTGCGGGGAGAAAGGATTTCGGTACTTCACTGAGTTTTCCAATCACATCAACTTAAAGCTGACAACCCAGCCGAAGAAGCAGAAGCACTTAAAATATTACCTCGTCAAAAACTCGCAAGGTGTTTTCTCAAAGGGACCTTTAATTTGCTGGAAAGAATGCCGGACTCGTCAATTGCCCAGCAGTTACTCGTCTGCAGTAACTTCAACCAAGACAGTTACCACAGTCGTTGGATCCACCACATCTTCTCCGAATATTGACACCGTCTCATCTAGTGTTTGCAGTACCACCATTGCCAGCTGTCAGACAGAATCAACATTCAGCCATGGTTCAGCAGCATCTTCTGCCGGCTATTCTGGATGTCAGGACCTGTCCAGGAGTGGAAATGTAGCAAAACCTGTTACAATAGCT
GCACAACAACTTGTGAAGCCTCCAACTTCAGCTCCCTGTGCAAATAACCAGCCACCTGGGTCTATGCGAGTTAATGGTAATCCCAATAGTAACGGCAATAGTGGAAAATCCAATGTTTTCAATGCTGCTCGACCTCAACCTCTCTCAACATCATCAAGTCCTGGCTTGGCATCAGGAGAAAATAGCATCATGACAAGCTCTGGACCACCTAAGAAGCGTCATCGTGGCTGGTCACCTGGTTCCCCCATTGCTGCGCCTACAGTAGTCCCTGTTCCAGCTGTGAGACCAGTGATGCGACCTGATGTTATGGCACCCATGCCTGTTCTTCAGACAATGTCACCTGGAGTCTTGCAGCCTCAGGCAATACCTGCAGGGGAGACTGTTATCATCCCAGACAATTTATTAAACAATTCTGGAGTGAGACCTGTTATTCTGATGGGTTATGGTTCTTTGCCATATTTTTATGGCAACGTTGGTGATATTGTAGTGAGTCCCCTACTTGTGAATTGTTACAAATTTCCACAGCCGACATCAGCTGAGCTGGAACAACTGGGAATTTCCAACAGCCAGATACTGTCAGTGGAAAACATGATCCTCTTAACAATACAATATCTGATTCATCTTGGTCCAGACCAAATGCCGCTCAGGGAAGAATTTGAACAGATTATGCTGAAAGCTATACAGGACTCGAGCCTCAAAGACCGATACCTGCAGCTGGGAGCCCCTTGTTCCACTGTGTCTCCAGGGCAGTTACCCTGGCTGGCCCGCCTTGCCGCCAGTGTGTCGAGAGATCTGGTGCAAGTTGTTTTTTCTCAGAATTCTCTAGCAGAGGGCATCTCGGAGACGTTAAGAACATTTGGTGATGTGCATCTTCAACAGAAAGTACCAAACTATGTGGTCGTCATTTGTACGTCAAAGATCAGAGGCAATGAATTTTGTGTGGTGGTTTTAGGTCACTATCAATCCAGAGTTTTAGCCGAGAGTATGCTCACCACCACTGAGTTTCTGAAGGAAATCAGCTACGAACTAATTACAGGAAAAGTCAGTATTTTGGCATCCCATTTCAAAACCTCCCCCTTTGGAGATAACGTAGACAAATTCCTGGATAAATTTCAGCAAAACAGAAACAACAGTGTTGCCATTCCATTCAATGGAAATGTTTCGGAATACATTCCGTCAAATGAAGCGGCAGCAATGACATCAAAGCAAGGAATTGATTCACTTACGGAAGTGTTCCAGATTCATCTACCTCAGCTCACTGTCGCTCGGAATCTGTTGTCTCAGGTTTGCGCCATAGCCGACTCTGGAATGCAAAACCTAGATTTGGGCCGTTTTGCAAACGTTGACTTCATCATTTTAGTTCCTGCATCGGAGGTTCTTTTCCACCAGACTCTGCAACGTATTAGACATTCAGGAGTACTTGTAGATTTGGGGCTTGAGGAAAATAATACAGCCGACCAAAAGGCTGAGAAATATATTATCCGACTAGACCATGACATTCAGAACAAATTTGAGGCTTTCATGAAGAAGGTCAAACAGAATCCATACACACTCTTTGTTCTTATTCATGACAATTCTCATGTTGATCTCACAAGTCTTGTTCCAGGCTCTACAACTCACGGGGAAGCCAGCCAAGGTCTGTCAGATAAGTTTATTAATTCACGTGAGGCACTTGAAGCGTGCAACTTACTTATGTTGCAGGTCAGCTCCTTTCCTTTCACTCTACAGACACAGCAATCCCGTGTTAGCTCAGACAATGAAGTACATTGGCTATTATCCAGCAATCCTGAGGAACTCAGCAACGAAGAGTTGGTATATTTTGGTTTGTCCGATTACAGCAAGTCTTTGCAATGGGGCATAACAAGCCCAATACTGAGATGTGATGAGGCTTTCGAAAGAATGGTGAATACATTGATGGAAAGGTATCCTAGGTTGCACAGTATGGTGATCAGATGCTACCTGCTGATTCAGCAGTATGCTGAAGCCATGATGGCTGTCAC
ATCGATGAACCTGTTGAGGGAGCACACCACCCCCGAGACCCTGAGCATCGTGGATGACTTGATCAGCTGCCCCGGGAAAGACGAGATTGGCCGCGGACACATGCTCCTGATACGGGTCCCATCAGTACAGCTGGCGATGCTTGCCAAGGAGCGGCTCCAGGATGTCCGAGACAAGCTCGGCCTGCAGTATCGGTTTGAAGTCCTTCTGGGCAATCCAGCCGGGGAGCTCAGCGTTGCCAAGCACTTTGTCGCACGGATGAAGGGATGGAGAGGGTGTGAGCAGGATGACTGGACACCACTCACCTATCAGGATCTGGAGGGTCTACCATGTATTGTCATTTTAACTGGTAAAGATCCACTTGGGGAATCATTTCCACGGTCCATGAAGTACTGTGATCTTAGGCTAATTGACTCCAGCTACCTTACACGAACAACCCTTGAGCAAGAGATTGGCCTTGCTTGTGGCTATGTTTCTAAAAGTGCTGTCAGAGAAACCATGGCAATTTTCGAAGGAACGGAGAAGGAGCATGAGAAGTTTCTTACCAGTGAGAATGAATCTGATGAATTACAGATCGATCTAGAGAGACCACAAAGTAACAGCAGTGCAGTCACTGGAACTTCAGGGTCCTTGGCAGAGAATGGTGTGAGCTCATCCAGTGTGCTTGACTCATCACAGAGGCCTGCTTCATCTCTTAGCTTCCAGAATATTGTGAACAGTTCAATTGATGAAGGCACGTCAACACACACTTCACACATCTCGACCACTGTGGGCAGTGAGGGCTGCAAGCAGGAAAATGACTTGGAAGGAAAGGAAACAGCAAGCAGCACAGTTTCAAAATCTTCCTCATCCTCTGGGAATTCTCGGCAATCCATACTGGTCAACAAGGACCTGAGGACTCCACGTCTCATCTTTCCAAGAACTGTAATTTTATCAAAACCAGTGTATCATCTCCTTGGTTCAGCAAGAAATGAGCACCTGTGTTCTGCCTCTTTGTTGCCCCATGCTGATGTGACTTGGACAAGCCCACTGAGATCACTTTTCCACAAGGAATTGAGCAGTGAAGAGCAGTCACTCTACTACAGACAGTGGACATTTCCCAGGCAACATCATGCGGACTATAGCAATAAAAGCGAGGGAAGTTCTGGAAATTTCCACCGACGCCGATTGTTATTGACTGGACCTCCACAGGTTGGAAAGACTGGTGCTTACTTGCAGTTCCTTAGAATTCTTTTTCGCATGCTAATAAGGCTCTTAGAGGTTGATGTATACAATGAAGAAGAAATTAACGAAGACACGAAAGATTCAAATGAGTATGCACAGGGTATTAATGCACAGTGGCCTGATATTGAACTCTTCAGTAAAATGACCTTTGATTACACGGTACATGATCCAAAGTATCGCCATATCAGTGCTGTCTACTCAGCCAAGCTGCCAAAGATTAAGCTAGAAGGTGGTAAAAAACGCAGCCTGATCGAAGGATCAACAAAACGAGAGACAGTCTCGATAATGCTAACTAAATATGCTGCATACAACACATTCCATCATTGTGAGCACTGCCACAACTACATTGACTTCAACCCAGCCACACAGGTGTCTGATTCCACACTACATGCATTTACATTTTCTTCCTCCATGCTGGGAGAGGAAGTTCAGCTTCACTTTATTATTCCAAAGTCAAAGGAGCAGTATTTTATCTTCAGCCAGCAGGGTAAACATCTGGAGAGCATGCGTCTACCTCTTGTCACAGATAAGAATCCAAAATTAGTGAAGAGTCCCATCTTTACACCAACTACAGGACGGCATGAGCATGGTCTTCTGAATCTCTACCATGCCATAGAGGGTGCAAATCACCTTCATATCCTTGTGGTTAAAGAGTTTGAAATGCCACTCTATCGAAAGTACTGGCCCAACTACATTATGTTGGTATTACCAAGCATGTTCAATGGAGCAGGGGTCGGTGCTGCCCACTTTCTAATCAAAGAACTTTCATATCACAACT
TGGAGTTGGAAAGAAATCGCCAGGAAGAGATAGGGGTGAAGCGGCAGTGTGTGTGGCCATTTATACTTGTCATGGACGATTCTTGTGTCCTGTGGAATGTCCACAATGTGCAGGAATTGAGCAGTGAAACAAAAGATTCTGCAGTTTCCACAAAGAATGTTTCCTTGAAGTTCGTAATGCAGCACATTGAAGCCACACCAAAGATCACTCATTATGCACTCTGTGGGATTCGAAAGTGGAACAGCAAACTGAACACTAGCAAACTGAGGACAGCATTCTCTCATTGTCACATGCATGACTTTATATTCCTCAATGTCGACCTGACACAAAATGTACAGTATGATCTGAGCAGATATATCTGTGAAGACATTGATTTCAACTTACGGACAAATAGCAGTGGTTTGCTCCTTTGTCGATTCAATCACTTCAGTTTCATGAAGAAATGCATTCAGGTTGGAGGGCACAAAGATTTTGTTATAAAGCCTAAGATTATGGTGATTGAAAGCCTGAATATTATTTCAGCCTCGCAGTACGTCTGTGCTCCAGACAGTGAAAGCACAATGCTGGCTGCACCTGCCCAGTTTCTCCTGGAGAAGTTTCTGCAACACACTAGTTACAAACTCTTTCCTAAAGCTATACACAACAGTAAGAATCCGGTGTTGTCCATTGACTGTTACATGAACCTGGGTCCTGAGATTTCTGTATGCTACGTAAGCTCACGGCCTCACTCAGTTAACATAAAATCCGAGGAGGTATTGTTCAGTGGACTCCTTCTCTACCTCTGCGACTCGTTTGTTGTTGCTGACTTTCTCAAGAAATTCACGTTTCTTAAAGCTGCCACACTCTGTGTGATTTGCCAAGATCGAAGTTCATTACGTCAAACTATCGTACGTCTAGAATTGGAAGACGAATGGCAGTTTCGGCTACGTGACGAGTTTCAGACGGCCAACAGCAGTGACGATAAACCACTTTATTTTTTGACCGGACGACATATTTAAGTTCAGTTCACAAGACAAGAAATAGCAGGTGAGGGTTAACGGGTGCCATAAGTGAGAGCCTGACGGAGCACAATTTATAATTCCAAGCGAAAGGTGAAGTGGCACATGCGCAGAAACAAATATCGGATTTTTTGTTTGGTTACCTGACCACCGTCACTTCATCGAACATCTACATCAGAACAGAGACAGCGTGATCAGTGCATAAGAAGGGTCTATGACCTGCACTCTGTTACTTCTGTAACTCCGGGAGAGAGTTTAGTGTGCGACTTGCAGGGAAACTGGCATTGCACATGGTATGATATATCAACCCTTTCAATGTGGGGAAAAAAAGGCAGTGCGAGCTGCAGAATGTATTTTTTTTTCAGAACCGGTCAAACCTATGATTATTCCAGAATATGTCCAAAATAGACCTGGATCCAAAAAAAAAGGAACTACTGTCAACAAAAAGACTTCACTGAAGGAATGGAACCAAAGCAGTGGAGCATAAAACAATTGATTGTATGTTGAGGTTCTTCAATGTCACCATTCTGACTGTATGTAATTGCAGTTCAGCTCAGGGTTTTGCAAATAGGTGGCAATGGAGAAAGAGTTGTCTGTATTCGTACTAACTATTACCTTATTTTTTGGTGGGTTTTGTAGTGTATGGTTTCATGCTTATTTGGAGTAGTTCTTAACCTGGCATTTTTTTTAAAGCATGTTCTCATATTTTATGGACATTTAAATCTAAACATGATACATGGGGAAATGCAAAATACATGATGCTTTCAGTGGGACTATTGTTGAAATTTTTAATGGCACGCAACTTATCCAGAATCTTTTTCCTACCGTTGACAATACAGGCTTTTGTTAATTTTTAATTTCACATAATCTAATTGTTTGACTTCTCTCTTGCATTGTCTATAAAACCATTTATCACACGCAGTTACATGCTTGTACTTACACTTCTTATTTTCATACAAATGATTACCATAGTGCATTGAATCAGATTTTGAAAAGTAAAAT
GCGCAGCCTTGATTCTCAAAGACATCAATATCTTTTCAATGTTAACATGGTAAAGATTAATAATGGACGATGGAGACCATATGATTTTTGGTTTCCTTTTTTGTATGATATATGAAAAGAGTAAATGTGCACAAATATCACACATCCAATGGTTCCCTGCTTTGTGCCTGTAATGTTATTTTTTTATTTACTTGTTTTAAGGAGATAATCTGAGGGGGATAAACAAATGTCACATTTGTTTCAGTTATTATTCTTTATTACTGTGCCATTTCATAACATTTTTGGCCAGTTTTGTATACATCTACAGCTATCCGCTTGCAAGGGATGGATTGATATACTCTCATGGGCAACTAAATAAAAATGTAGAAAGATAGCAATTGTATAATGATGTGAAATTTCAGCTGCTCTTTTGCTACCACTCTTCCCCGGTCAACAGCAATATTAAAATCACAACGTAAATTGGTCTAGCGATCTTTCCAAAACAAAAGTGATGATTTGGCCTGCAAGTACAAGTTAGAAATTCCATATTGACAAATAGGGAAGGAACAAAATAAATCATCCAGTTTTGATGACAGTTTTCAGTTGTAATTTAAGTGTAAACGTAATGTTAAGCAGGCAGCAGCAATGTGGGGGTGCTCTGGTATCAAATGTAATCATGGGAATTGCAAATGAATGAGCAAGTGTTTGTTTGCCTTCTCACTAATAATCACTTATCAACGATAACTATTACTGTAAATATTGCTAATTAAAAATGAACAAGATTTA\n>XM_053163347.1 Puccinia triticina uncharacterized protein (PtA15_15A169), partial mRNA \nATGCCTTTTACACCGAAAATCGAAAAGGACGCTGGAAGACTTCAAGAGTGGAACTTCCACCATCGACGATCAGGTTCGATGGATTCTTCAAAAATCGCGCAAAAAACTTTCGAGCTTGAAAACCATATTCAGCCTTTGGAACAGGATAAGATATTCAAATACAACGCGGAGGAACAAAAGACGATCCAGAAAGAAGCGAAATGGAGGAAAGATCCTCACTACTTTAAGAAAGTGAAAGTCTCTGGTGTCGCTTTGATCAAGATGGTTATGCATGCTCGATCAGGAGGGCAATACGAAATCATGGGGCTCATGCAGGGCAAGATCGATGGAGACACTTTCGTCGTAATGGACTCATTTGCTTTGCCTGTTCAAGGGACAGAGACTCGAGTCAATGCGGCTAGTGAAGCCAACGAGTACATGGTCGATTTCCTCGAAAGTTCAAAAAATGTTGGCCGACTGGAGAATGTCGTGGGATGGTATCACTCTCACCCGGGTTATGGTTGTTGGCTATCGGGAATCGATGTCAGCACTCAGCTGACAAACCAAACTTACACAGACCCATTTGTCGCGATCGTCATCGACCCCAATCGCACAATTTCAGCCGGGAGAGTCGACATTGGCGCCTTCCGCACCTTCCCTGAAGGATATACCCCTCCATCACTGGGAAAGAGCAAGGACGACGAATACCAATCGATTCCATTGTCGAAGATTGAAGACTTCGGCGCCCATGCCAACTCTTATTACGCCTTGGAAATCGAACACTTCAAATCTAGTTCAGACTCGAAAATATTGGACCTCTTGTGGGAGAAGTATTGGGTCATGACTCTGAGTCAAAACACATGGCTTTCAAATCGAGTATACACGACAAGCCAAATTCAAGAAATGACCGACAAACTCACCAAATCAAGTAGCTCGCTAACAAACAGCAAGCGAAACACGCTAAAAACGTTGATACCCACTCACTTGCGAACTGCGATCGAGAATGAGAACGGTCATATCGGCAGTAACAACCATCCGGAAAACTCGACTCAAAATAACAATAACAATCAGCTGTTCCATGACGTCTTGAAAGATGTCGAGAAGTTAGAATGCGAGAACCTATGCGGCATGTTTGGTCAGATTATCAAAAATGTCTTGTTTAAT
AACAATTCTCATAACTGCCAACTTGAGTTCCCCATGTAA\n>HQ319463.1 Uncultured bacterium clone RMAM0533 16S ribosomal RNA gene, partial sequence \nGAGTTTGATCCTGGCTCAGGATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGGAGGTTTAAAGCGGAAGTTTTCGGATGGAAGCAATAAACCTTAGCGGCGGACGGGTGAGTAACGCGTGGGTAACCTGCCTCATACAGGGGGATAACAGTTAGAAATGACTGCTAAAACCGCATAAGCGCACATTGTCGAGTGACAGAGTGTGAAAAACTCCGGTGGTATGAGATGGACCCGCGTCTGATTAGCTAGTTGGTGAGGTAACGGCCCACCAAGGCGACGATCAGTAGCCGGCCTGAGAGGGCGACCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGAAGAAGAAAGACGGTACCTGACTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATC\n>XM_029801181.1 PREDICTED: Octopus sinensis homeobox protein rough-like (LOC115231097), partial mRNA \nTTCAAAGACGGAAAAGGAAAGAGAACCGTCCCCGACGTCAGCGTACGACATTCACCAGTGAGCAGACACTGAAGTTAGAACTGGAGTATAACCGAACTGAATATATCACACGACCTCGGCGATTCGAATTGGCTGAGATGTTGAACTTGACAGAAACCCAGATCAAGATCTGGTTCCAGAACCGAAGAGCGAAAGACAAACGGATCGAAAAGGCACAAATGGATCAGCAGATGAGCCTATCTAATTTCCAAAGAAGACAAGTTGTTGGAGTTCGGCCCGATCTCTACAGCGCTGCTATTAATTTTGTTCTCTGTCCAGAATTGTGTTGTGGACAAGGGTTAGAATGCTTAGAATACTGGAACTGCCGCATTGCTGTGCCCGCACCTGCAATTCTAGCATTCCGTTCAGCCTTCTGCTTCCCATCACAAGAGAACGG\n>XM_043204581.1 Ogataea angusta uncharacterized protein (KL928_003939), partial mRNA 
\nATGGTCCAAATCCCCAGATCGTACGCGGAACTGAAGCAGAAGGTTCCAAACATTGGAATCATTTTTGCCGCAATAGCTTCGTGGTTTTCGTTTAGTTTACTTATCTCGCTTTACAACAAATGGATGTTTTCAGATCCTACTTTGAACTTCAAGTTCCCCGTGATAATTACAGCCTGTCACCAATTCGTGTTATTTTGGCTCAGCTGTTTGACGCTCACCTTTTGGCCCAAGTTCAGACTGAACTATGTCGATCCTTCCAAAGGCATTGCGTCCTCCGAAAATCTCAGCTACTTTATCAACCCTAAAGTGTACATTACCAAGATCTTGCCGTGTGCGCTGGCTTCCGCCGGTGATATTGGCTTGGGCAACTCTTCTTTGAAGTATATCACCATCTCGCTATACACCATGCTCAAGTCCTCTGCAGTGCTCATCTTCACGCTCTTCTGGGGTTTCCTTCTCAGACTGGAGAAAGTTACGTTGAAGCTTTGTCTGATTACGTTCATCATGACTGGTTCGGTCATGATGATGGTGTACGGACAGGGAGAGACCTCGGCTGAGACCAGTCCTTCCGCTGTTGAGGAGGAGGCTGGAGAAATGAAGCTCAGATTCGTCAAGCACCTCGTGAAAAGAGCAGCTTCTCTGTACCTCGGTGTCAGAGACGAGGAGCAGGAATCCGACGACTTGGTTTCCTCGTCCTCCTTCACAGGTTCTACGGCCAAAGCTTCTGCTGCCCTGGACACACTCACCGCATCCTCCATCATCATTGGCTGCATCCTGGTTCTGCTTGCATCTTGCATGTCTGGGCTTAGATGGGCTTTGACTCAAATTGTCTTGCGTGGCAACAGATACACCAAAAACCCAATTTTGACCATCTTCTATCTGAGTCCCGCCATGTGCGTCTCGCTGATTGTCATGGGCTCGCAGGTCGAAGGCTTAGGCAACTTTCTAGGATCGCAGGTCTGGGAGACGTATGGTATTTTGGGAACCTGTTTGCTGCTTTTGTTCCCAGGTTTCCTGGCCTTTTGCATGACCCTGTCTCAATTCATCATTCTGCAGTACGCTCCGTTGCTCACGCTCTCTATTGCCGGTATTGTCAGAGAGCTCATTACTATATTCCTCGGATGGCTGATCTTCGGCGACCACCTGAACGCGATCAATATGCTGGGTATATTGATCACCTTGGGAGACATTGCATGGTACAATCTCTACAGACTGGAGCAATCTTCGGCCAAGCCGGCTTCTGCTGCGTCTTCTGAGGACACAGAGAGGTTTGTCACCGAGGAGCACGAGCTTGAGTCTATCGACAGACGCAAGTGA\n>XM_004287821.2 PREDICTED: Fragaria vesca subsp. 
vesca putative F-box protein PP2-B12 (LOC101291663), transcript variant X1, mRNA \nAAATATTTTGTGAATTTCTGAGATTCATCAGAAAAGTTAGGATGCTTTCTCACCAAGAAAGTGAAAAGAAGTATATATACACAGCTTCATGATTGATTCCTCTACAGAAGGCTGAAGCAGTGTTGTTCTTTCACAAGGACCTCTAGAATTGTGTATATTCTTGTCTGATACTTTAGGTTTTTCTCATCATTCAAGTTGTCTTGTAGAGGTGTATAACTATATATACAGTAAGATGAATGCAAGAGAAATGTTTGTCAAAATAGCAGAAGCATTTGTGGAGTTGTACAATTATGTTAGAGGGCCTATGGTGCCGCAAGCAATTCAGTTAAGGGATGCAGTAGTGAAGATTCATGAAAGCTTGGCTGGTCAAATTGCAGACTCAGAATTGATAAGTAGTGTTATCGAATGGTTTAATACGTTTCATAACATTTATGTCGCACTAGGATTGGTTGGTTTGGTGATCTCCTTTGTTCTAGGATTGCTTTGGAAAGTTTTAGCTGTGGTAGTTTCTGCTTTAGGTGTATGGATTTCCTATTTGATTTGGAGAGACCATAATTGGCACAAGCTGTTCCTGACAGACGAAAAAGGATTAGCATTTTTTGCAAGTACTTGGCTTGGGTTATTGCTACTCTACCGAGCACAAGGTCTGCTTGGCAAAGTTTGTCTTTTGGGAATAGAAACCCTAGTAATATGGGTGATGCAGTATTCCATGTCGACGACGACGAATATGGAAATCCCTTGGGATGATTCTAATATCCATGAAATTATCTCCCGAGCTGTTCCACCGGTGCCCCATTATTCTTCTCCGCATGACCTCTACCGCAGTCTCTGCGCTTCCCCCATCTTCCTTGACGATGGCTACTTGAGTTTGGCGTATGATCGGGCGACTGGTAAGAAATGCTGGATGATGGGAGCCAGGCTTTTACTTATTGATTTGGCAGAAATTCCAGACTACTGGAACTGGATATCTCTGCCTGAATCCAGGTTTTCCCAAGTGGCTGAGCTCAGATTTGTACGTCGTCTTAAGATCAAGGGATCCATTTCTACCTATATGTTGTCACCAAGAACAACCTATGTAGCTTACTTTGTATACAAGTTTTCAAATACATCTCGATCTGGTTTTCATGAAAGGCCTGTTAGCTTGCGTGTAGTTCGTGTTGTTAATACTCAACGCCAAGTTGTGGCGCATCATAATCGTGTGTTCCTGATAGGAGAGATGGCTTCACAAGCTCGAACGAGAAGTGATGGATGGATGGAGATTGAGTTCGGTGAAATCTCCTACATTGATGATAGTGCTACTATAGAGTGTATACTAGAGGGATCTGAAAGTTTTGAGGGAAAAAGAAGTCTCATTGTGGAAGGTATTGAGCTCAGGCCTAGATAGAGGAAATTTATCTCTCTGTATATATATAATGGATCTTTGATCTTTAGCAAATCTTCTTGATGGCATGGTTGATGGAGATCCAAGCTCACAGTTTACTATATATATTGGTTATGGACGTGGTTTATGGACGTGATCTTGCTAGCTTCCAGCCTTCCAGGCTGGTTTACCT\n>XR_008327014.1 PREDICTED: Panonychus citri uncharacterized LOC128397849 (LOC128397849), ncRNA 
\nAATTACTGGATCATCTTTGATTTGTCATCTAATAGTCAATGGAATTGTAACTTTGTTAATTGTTAGTTCTTAGAATAGATTCAATTAAAATCGATGACATCAATCAGCAACAATTTATCAATCGTTGTAACAATTAACCTTAATGCGAAAAGTGAAAAACAAATCTAATCAAAGTAAATTGTTTACAATTAGAAAAAGAAATCAAATTAATTGTAAACATACCTACGTGATGAGATGCAAATCTAATTGTTAACAATTAGTCTGGGAAAATTACTTATCATTAGAAATTAAATTTGTCTGATCAACAATTAGTCAAATATGATAACAAGGATCACAATTAAACTTAATTGTTACGGAAAAACCTTCAACAGATTCTAATTATAATGTAACTATATTTACTCATTATAAAGAAAGTTAATTATAATGTCGATACATTTGCAATTAAATTTGACAAATCAATCAATTAATTACACATTTATGATGATTATGATTAATAATTAATGAGAAAATGATTAACTTTTGATTAGATTAACAAGAAGGAAATTATTTTAATTGTGTTTACCAGAAACGGTATCAATAGTAATTAGAATTACTTTGTTTACCATTTAGCTTTAACATAGAGAGAAATTGATTAGTAGTTTATCAACAATTAATTTAATCGTAATAATCAATTGATTAGTAGAAGAGAAATCAACGAAAATAGACAGAGAAATAGACAGAGAACAAGAAAAAGAGAGACGATCAAGTGAGTGAGAGAAAAATATAAAAATCATTTTCTCTTCAACGAATCAAGTGAATGTCACATTTTCCTTGGAGACTTTGAGTTTGCTAATTGATTTGATTTTTTGATTAATTGTCTTCATCTTTAAGAATTAATTACTCTTTGATTGTTGTTCTTTGAAGGTGTTGAGTTAATTTGGATTCGTTTTAATTGTGATAATCAATGACAACCATTAAAGATCAACATCAAATGCCTAATCCCAAATGGATCATCTTTTGTTGCTAATCTGTAAAGTGGTCAACACATTTTGTGACTATAAGTGTCTTAATTGTTCAAGTGATTTATTGTTAATAAGAACGTTTAAATTGACTAAAAGATGCCAGTTTACGCTGCTATCAGTCGATCAAGGAAACGAAGTCAGGAACGGAAACTGTCCCTTAGTTCCTGTTCCTCTGAGTCTTCATCTATTTCCTCAAGTGAAATTGATATAAAGGTGGATCAGAATGTGATCTTTGTGGATTATCACTTAAATCGGTCAAACAACATTACATTTGTGGACATAATTTTCACATCGATTGTATTTGGAGATACAAAAGATTAGCCCCCAGTAACCATGAGTATTGTCCAGTTTGTGGTATTCATCATCCACCAAAAACAATTAGAAATTACTAATTATCATCCTCATCACCATCATCATCGTTGGGTCATCAATATTTATCCACATCTCATACTTGCGACAATTTAAATCTAATTGTTTGCCTCTTGCTCTCTGTCTCTCATTATCCATCAAAAATCATTGTAATTATTTAATCGATCATAACAAAGTCACAGATCATGATTAATACCAATCAATACGAATATAAAATACAACTAAATCAATCAAAACAGCTCAAAACAATTAAATTGTAATCGAAACAAAAAACACGCTGATTAAACAAGTGTATCTTTGTATTATAATCATCACAATCAAAAATCAAA\n>NM_001096323.1 Xenopus laevis zinc finger DHHC-type containing 1 L homeolog (zdhhc1.L), mRNA\u0001BC106577.1 Xenopus laevis hypothetical protein MGC131347, mRNA (cDNA clone MGC:131347 IMAGE:7766144), complete cds 
\nCAGCAGATTCCGTAAGGATCATCCCTTCCCTTCCTCTCTGATTTCTACTCTGCTTCTTAGTTCAGACTGCGCCCGTTGTATATTCATAGCCTCATTCCATCAACCGCAAAGAGACATGGGCATTTGGAAAAAGCTACTTTGTATACAGGGTTGGAAGCAAACAACATGAGCTGACTTTCCTGTCAAGGTTCAAGACAAAGTCTTCCTATGCTGAACACATTTAGAAGCCATCTTAAAATACATGAATTATTAGTTCTGGTACTGTCAGATGGGCATTCAAAAAGATGTCAGTCTGCAAGAAGCAGTCTGCTATGAATGTGCCCGATAAAGAGAGAGGGGAAGTCATTTCAGATCCACCTCAACATTCAAGAAAAAATGGCTGGAGTTGGCCCCTGCACCTGCTGCAGCTTGTTGCCTGGTCCACTTTTCTCTTCTTTGCTGTTATAGGACTTGGGATCTTGGTCCCTCTTTTACCACAGCATTGGTTGGCAGCTGGTTACATTTGTACTGGAGTCATGTTTACTTTCCACTGTGTTGTCCACTTTCTGGCTGTTACCATTGATCCTGCTGATGACAATGTGCAGGCCAAAGGTTCTCTTGGGCCTCTACCAGCATTTGATCGCAACAAGCACACTCATGTAATTGAAAACATGCATTGTTATATCTGTGAGGTGGATGTGTAAGTAAAAGATGACCCTTCATGTTGTAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA\n>XM_051729581.1 Alternaria postmessia uncharacterized protein (J4E82_003292), partial mRNA \nATGGATGAGGAAAATGTTGCCAACTTCTGCGGCATCACGTCCTGCAGCCCAGAGCAGGCTGCTCAGTACTTGCGCCTAACAGATGGCAACTTGGAGCAGGCCATACAACTCTTCTTCGACTCTCCTGGACTTGCCGATGCTCCTGCTGCGCCATCACAGCCCTCAGCAGCCGCCTCCGCACAGAATCCCATCAATATCGACTCCGATGATGACATGGACTTTGATCCCGCACCACAAGGCAACGCGCCGTCCACACGGGCACAACCAGGCGTGGAAGACGATGAAGCCATGGCACGGAGGTTACAAGAAGAGATGTATGGCGGCGGCGGCGGCGCCGCCGGTGGCGCTGGCAATGATGAGATTCGCGCGCCCATAGAACGAAGAGTGGAAACACTTGTTGGCCCAGGCTCAAACTGGGGGCCTGCCGATGACGAAGAAGATCTTGATGCTATGGTCCAGGAGCAGCTTGCTCGTCGGCGGACAGGCCGCGCCGGTATCTTCAACCAGCACACAACCCATACCAATGTCTGGGATAACACGACCGATTCGAGCACCCGGCGACGCGAGCTTGCGACCGCGACTGGCGGTGCTTCAGAGCAGTCTTCTAAGATGAACATGCTCGCAGAGCTATTCCGACCACCGTTTGAGATCATGTACCAAGGATCGTGGGAAAAGGCGCGAGATATGGGCAAGGACGAAGAAAAGTGGCTGCTTGTCAACATCCAAGACCCGGCAATCTTCGACTGCCAGCGCCTTAACAGGGATATCTGGAAGAATGACGATATCAAGGCAACTGTGCGAGAGAACTTCATCTTCATGCAGTATGCAAAGGATGATCAGCGTGGACAGCAGTACATGAACTACTACTTCCACGCCCGTGACAGTTCTGACGCCTACCCCCACATCGCCATCGTTGACCCACGAACAGGCGAGCAAGTCAAGGTCTGGTCGGGACCACCGATACCCGAACCAGTTGAGTTCCATGCTCAGCTTCATGAGTTCCTCGACCGTTACAGCCTCAATGTCAATGCGAAGAACCCTGTAGCGAAGCGGAAGTCTGAGTCTAAGAAGAAGGATGTCGGTCGCATGACAGAAGAGGAGATGCTGGAGATGGCG
CTACAAAACAGCATGGATAACGGCAAGGGGCCGAAGGACGATGACCCAGATGCTCTCACCAAGTCTACAGACAACATCAAGGGCAAGGGCAAGGCCGAAGAAGTCGCTTCTGAGCCGCCAGCTGAGCCCGAGGCAGCTCCTTCGAATCCTGTCTTCGCTGCCATCTCCGCACATGCTCCTCATACCGAGCCTACCGTTACTGATCCCAAGGTCACGACTCGCATCCAGTTCCGTGGCCCGTCAGGCCGTCCGATTGTGCGCCGCTTCAACCTTACAGACCCTGTTCGCCGTGTCTACGAATGGATCAAGTCCGACGTGCCCTGGGAAGGCAAGCAAGGAGCTGAGTTCGATCTGGCGTTCATGGGCAAGAACCTCCTCGACCACGTCGACGACACGGTCGAAGCCGCCGGACTCAAGGGTGCCAGTGTTATGGTAGAGTTCTTGGATAATGAGTAG\n>XM_006724281.5 PREDICTED: Homo sapiens eukaryotic translation initiation factor 4E nuclear import factor 1 (EIF4ENIF1), transcript variant X2, mRNA \nAGGGGCGCGAGGCCCGCAAGGCGGCCGGCGGGTAGCCGGCGGGCTGGCTGGCGGGGACCGAGCCGCCGGGCCGGGGAGGACGGCTGCGGGCCTGCGCTAGCTCCAGCTTGAAGCGCCCGGGCCGGGAGATTCGGCCTCCCTCCTCCCTGCGGCCGGCCGCCCCTCAGTGAGTACGGTCTCCGCCCTTCCTCCGAAGGAGGCCGCTGGGCCCGGGCCTGCGTGAGGGGCTGCGGGTTGGGGTCGCGGCCCGGGGAAGCCAAGTTTCGGAGCTGAAGCCGGTGCTCGCCCTTTCCTTGCCATCGGCGCCCCTGACATGGCCACAGGTGCGGCTGGCCTGGCGAGGGGCGCTCGGGCCCCGTCCCCAGTCCCTGATCGCCGGATAACAAGGGGCAGCTGGCGCCGTCCATTGGTGCAGAGCATTGTAGACCAAGGAGCCATGGATAGGAGAAGTATGGGTGAAACAGAAAGTGGAGATGCTTTCCTTGACCTGAAGAAGCCTCCTGCCTCCAAATGCCCCCATCGCTATACAAAAGAAGAACTCTTGGATATAAAAGAACTCCCCCATTCCAAACAGAGGCCTTCATGCCTTTCTGAAAAATATGACAGTGATGGTGTCTGGGACCCTGAGAAGTGGCATGCCTCTCTCTACCCAGCTTCAGGGCGGAGCTCACCAGTGGAAAGTCTGAAGAAAGAGTTGGATACAGACCGGCCTTCCCTGGTGCGCAGGATAGTAGATCCACGAGAGCGTGTGAAAGAAGATGACTTAGATGTTGTTCTCAGCCCTCAGAGACGGAGCTTTGGAGGGGGCTGCCACGTGACAGCCGCTGTTAGCTCCCGGCGCTCAGGAAGTCCATTAGAGAAAGATAGTGATGGGCTTCGTCTGCTTGGTGGACGTAGGATTGGCAGTGGGAGGATAATCTCTGCCCGGACCTTTGAGAAGGATCACCGTCTTAGCGATAAGGACCTGCGGGACTTGAGAGACAGAGACCGAGAGAGGGACTTCAAGGACAAGCGTTTCAGGAGAGAGTTTGGAGATAGTAAGCGTGTCTTTGGTGAGCGTAGAAGAAATGATTCTTACACAGAAGAAGAACCAGAGTGGTTCTCTGCTGGACCCACAAGTCAGTCTGAAACCATCGAACTGACTGGCTTTGATGATAAGATACTAGAAGAAGATCACAAAGGGAGAAAAAGAACAAGGCGACGGACAGCCTCTGTGAAGGAAGGTATAGTAGAGTGCAATGGAGGAGTGGCCGAAGAGGATGAAGTGGAGGTCATCCTTGCACAGGAGCCTGCGGCTGATCAGGAAGTGCCAAGGGATGCTGTCTTGCCTGAGCAGTCCCCAGGAGACTTTGACTTTAATGAGTTCTTTAACCTTGATAAGGTGCCATGCT
TGGCTTCGATGATAGAAGATGTTTTGGGAGAAGGGTCAGTCTCTGCCAGTCGGTTCAGTAGGTGGTTCTCTAACCCGAGCAGATCAGGAAGCCGATCCAGCAGTCTTGGGTCAACACCACATGAAGAGCTAGAGAGACTTGCAGGTCTGGAGCAAGCCATCCTCTCTCCTGGACAGAACTCGGGGAATTACTTTGCTCCTATACCATTGGAAGACCATGCTGAAAATAAAGTGGATATTTTAGAAATGCTACAGAAAGCCAAAGTGGATTTGAAACCTCTTCTTTCCAGCCTTTCTGCAAATAAAGAAAAACTTAAAGAAAGCTCACATTCAGGGGTTGTGCTTTCAGTGGAGGAGGTAGAAGCAGGTCTGAAGGGCTTGAAGGTTGACCAGCAAGTGAAGAATTCAACTCCCTTCATGGCAGAACACCTAGAAGAGACCTTGAGTGCCGTAACCAACAATCGACAACTGAAGAAAGACGGAGACATGACTGCGTTCAACAAGCTAGTGAGCACAATGAAGGCAAGTGGGACTTTGCCTTCTCAGCCCAAAGTCAGCCGAAACCTTGAAAGCCATTTGATGTCCCCTGCTGAGATTCCAGGCCAGCCTGTCCCTAAGAACATCCTGCAGGAACTTCTGGGTCAACCAGTTCAGAGACCTGCTTCTTCCAATCTTCTGAGTGGCCTTATGGGGAGCTTGGAGCCTACAACATCTTTACTGGGCCAAAGAGCACCCTCTCCTCCCTTGTCACAGGTGTTTCAAACTCGAGCAGCCTCAGCTGACTACCTTCGCCCAAGAATACCATCACCAATTGGTTTCACACCAGGACCACAGCAGCTACTCGGAGATCCATTCCAAGGCATGCGCAAACCCATGAGCCCCATCACAGCCCAGCAGATGAGCCAGCTGGAGTTGCAACAGGCAGCTTTAGAAGGGCTGGCCTTGCCACATGACCTTGCTGTACAGGCAGCAAACTTCTACCAGCCTGGTTTTGGCAAACCACAGGTGGACAGAACCAGAGATGGATTCAGAAACAGGCAACAGCGAGTGACCAAGTCACCAGCACCCGTGCATCGAGGGAATTCCTCTTCCCCTGCCCCTGCTGCCTCCATCACAAGCATGCTTTCTCCTTCCTTTACCCCTACCTCAGTGATTCGTAAGATGTACGAGAGCAAAGAGAAAAGCAAGGAGGAGCCAGCATCTGGAAAAGCAGCTCTTGGTGACAGTAAAGAGGATACTCAGAAGGCCAGTGAAGAAAACCTCCTGTCATCCAGCTCTGTACCCAGTGCCGATCGAGACTCTTCTCCCACTACAAATTCCAAACTGTCAGCATTACAGAGGTCTTCGTGTTCCACCCCACTGTCCCAGGCCAACCGTTACACCAAAGAACAAGATTATCGACCTAAAGCAACTGGGAGAAAAACACCCACCTTGGCATCCCCAGTTCCTACAACACCTTTTCTCCGCCCTGTCCACCAAGTTCCCCTTGTCCCCCATGTCCCTATGGTTAGGCCTGCTCACCAGCTTCACCCAGGGTTGGTACAGAGGATGCTGGCCCAGGGAGTACATCCACAGCATCTTCCAAGTTTGCTCCAAACTGGTGTGCTTCCTCCTGGGATGGACTTGAGTCATTTACAGGGAATATCTGGCCCCATCCTGGGTCAGCCCTTTTACCCTTTACCTGCTGCTAGTCACCCTCTCTTAAACCCTCGTCCTGGAACACCTCTGCATCTGGCAATGGTGCAACAGCAGCTACAGCGCTCAGTTCTGCATCCTCCAGGCTCTGGTTCCCATGCAGCAGCTGTCAGCGTTCAGACAACCCCTCAGAACGTGCCCAGCCGGTCAGGCCTGCCCCACATGCACTCCCAGCTGGAGCATCGCCCCAGCCAGAGGAGCAGCTCCCCTGTGGGCCTTGCCAAATGGTTTGGCTCAGATGTGCTACAGCAACCCCTGCCCTCCATGCCCGCCAAAGTTATCAGTGTAGATGAATTGGAATACCGA
CAGTGAGCAGGGCAGGCAGACTCAACTAAGCCCGGACCTGTGGTGGCACACTGGGCAGGACCCTGCTTCATCTCGGGTTGGTTTATGGGCTTTTACTTTGGAGCACTCTGTGTGAAGCTGTTTGGTGGAACCCATGCATCTGGTGTGGTCCGCATTATGATGGAAGGATCTTAACCAGTCGAGTGGAGTGTACATTGTCTGAATACAGGATGCACAATGTTGTCAATCCTGGAAATGGTCTTTCTTTTTTGTAAGATATGTGAATGAAGTGTTGGTGTCCTCACCAAGAGGTGGCACCTAAGGGTTCTGAGGAAATAAATGTATAGACCCTTATGTACAGACCTGTGTATAAACAACTTTTGTATATACATATAGGATAGCTTTTTTGAACTATACAGCTGTACATAAAAGTAGCTGATATTAGTTAGGCCTGTGTCAACAGTTTGGATTTTTTTCACTTGTACATTTGGGATTTTCTTTTGGTTGATTAAAATTGCATATGCTAAGTGTGTGAATGAA\n>XM_003017089.1 Trichophyton benhamiae CBS 112371 phosphotransferase enzyme family protein (ARB_04011), partial mRNA \nATGGTTTCCGTGAGACCGCGACTATTTCTAAGGGGTCTCAAGCACAGAATCCCGGAAGAGCATAGTACAACAGACCTTTTCAACTATACCACGGGGCGATGGCTTTGGAGAGAGAAGGAGCAGCTACTTGAACGATACCGGAGATTCAATGTACGAGAGCTACAGGCCATAACTGCACATACACTGGGCTCTCAAGCATGTGTTTCAATGTCCAAAATTGGAGAAGGCAATTTCAACAAAGTCTTCCGACTTGTAATGGATGACGGAGCAGTGGCAATAGCTCGAATCCCCCATCCAAATGCTGGTCCGCCTCGGTATACGACTATGTCGGAGGTTGCTACTATGGAATTTGCAAGATCAATGCTTAAAATACCAGTTCCTAAAGTGTTAGCATGGTCTTCATCTTCTGATAACTCTATAGGTGCAGAGTATATCATTATGGAAGAGGCTAAAGGCACCCAGCTCTCTCAAACATGGGATGAAATGAAATTACATGATAGGAGTGAAATAATCAATGATATTGTTTCCATAGAGCAGAAACTTCTCTCCGTGACCTTTGGCTTGTATGGGTCACTATATTTTTCCAAAGACGCTTTCCCTGGCTGTCAGCCGGCAGATATCAGTGGTGACGTCGCACAAGGGATTGAGGATGAGGTTAGAAAGCAATTCGTCATCGGCCCTACGACTCGCCGGGAGTTTTGGGAAAAGGAGCGAGCACTGATGGATCTGGACCGAGGACCTTGGAAATCTGCTAGTGGATATGTGGAGTCCATAGCCCATCGCGAGACCGCTTGGATTTCCCAGTATGCACGGAGGGATTCCATCATATCTGGCTACCCCAGGGGCAAAGGAAGTCAAAAATCACCCCAGGACCACCTCGGCTTATTGGAGAAATACCTATCTGTTGTTTCGAGGCTCCTTCCCGATGATACCGAGCTTGTTCGCCCAGCACTCTGGCATCCTGACATCCACGATGGCAATATATTTGTCCAGGATGGGAGGATTTCCAGCATTATTGACTGGCAGTCTGTCTGGATTGCACCTTTGCTTCTCCAGGCCAGAACCCCTCGACTGATCGATTACCATGGAGAGATCCAGTTGAGACTTCCCGAAGACTTTAAAACGCTGCCCGAAGAAGAGAGGGATCGCGTCAGAGACCAGGTCCAACGGTCTATCCAGGTATACCTTTATGAGGACCGGACGGCAAGAGTCAACCCTCTTCTTGACAGGGCAATTAGGAAACCCCATGGGAAAACATTGGCTCAGCTCGTGAGCTTTGCTGGAAACTCATGGGATGACCACATCGTACCCCTGAGGGACACTCTGATTGACGTTGAAAGGTATATAGCAAATTGGTCAT
GA\n>XR_008008321.1 PREDICTED: Arachis duranensis uncharacterized LOC127746577 (LOC127746577), ncRNA \nTCTTATACGTAATCCTTTTCGTGAGCGATTGTCTCTACTCTCTCTCTCTCTCTGGAATAAAGTAAATACGGTATGTTATACAAAAACTGTCAACACTATATATAGATTATAACTAACTTGTCTCACAAAACTTCCAATAATTTCTCTCTCTCTTTCTCTCTAAAGCTCTCTCCCTCTCTGAATGTTTGAGTTGCAGGTGCTTATTAAAAACATGGCTTGGTGTTTAAAACAACGCGTGTTGCTCCCTGTTATGGTGGTGTTATTGTTGTTGGGAACAAGTCCTTCCATAGCAGAGCTTCAGAAGCTGAAACACACTCCAACAAAAGCAGATCAACCTCTGAACATTCTGGTGGTCGGAGACTGGGGAAGAAAAGGAACCTATAACCAGTCCTTGGTCGCTTATCAGCCCAGAATAGGCTGAGCTAATAGGTCCAAGAGGCAGTTCTAATTGGGTTGGTTGGCTATCATGCTGTCCCAAGGTATGGATTTTATTTTTTGGAATAAAAAAAATTGTTGGGACACATTTCTCAAGAAACGTAAGGTTTACTA\n>XR_003114846.1 PREDICTED: Melanaphis sacchari uncharacterized LOC112597600 (LOC112597600), ncRNA \nATTTCTCGGGCTTGTTCCACGGCGTCATCTTTCTGACTCTTCGTCTGTCACAAACAAATTTGTTCCTGAATAGAGCTGAACTCTCTGTTCCGCTCCGAATTTCTCGCCTTTGATTTGTCGTTAGCCCGATTATGAGGGCTAAGTGGCGTAAGAAGCGTATGCGTAGGTTGAAGCGCAAGAGGAGGAAGATGCGTGCAAGGTCCAAGTAAACCTCGTGGCCTGCACAAGACAATATTATCATGTTTTGGTAAACATTAAACGATATTGAAACTTTTATATTAAATCATCTAAACAGTAATAAACTCTTTCTGTTCAACTTATAAAA\n>JX816942.1 Uncultured bacterium clone HC1::G9RA0RH03HINL4 16S ribosomal RNA gene, partial sequence \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGGTAAGGCCCTTTCGGGGGTACACGAGCGGCGAACGGGTGAGTAACACGTGGGCGACCTACCTTCAGCTCTGGGATAAGCCTGGGAAACTGGGTCTAATACCGGATAGGACCGCATGTCGCATGGTGTGTGGTGGAAAGTTTGTTCTTAATTGGACACTTCGGCTGGGGATGGGCCCGCGGCCTATCAGCTTGTCGGTGGGGTGATGGCCTACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGCGACCGGCCACACTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGCGGAAGCCTGACGCAGCGACGCCGCGTGGGGA\n>XM_053359157.1 PREDICTED: Podarcis raffonei calpain 7 (LOC128398277), transcript variant X5, mRNA 
\nAAGATTGCGCTCCTATCTCTCTCCAGCGAGAGGTGGAGGGGAGGGAGGAGCGTTCTCCCGTATTGCGCAGGCGCATCGCGACGGCGACGCCTCCGCCACAGGGGCTGCCGGGAAGTCCCTTCCTGAGCGGGAGGCCATAGGCGGAGACGTCGGGGGGCTGCCGTGACGTCAGCGAATAAGGAAAGGAGCGCGCTGAGGCGTCTGCTGCCCGGACCCGGCCATGGAAGCGGCGGAGCTGGAGCAGGAGGCGGTGAAGTTCGCGCAGATGGCGGTGCAGCGGGACCAGCGGGGCCACTATCACGAAGCGGCCTTTTACTACAAGGAAGCTGCACAGTCTTTGATTTATGCTGCAATGGCAGGATCAGTCTTGGAAAATATTCCAGAGAAAATAAGTGAATATTTGGAAAGAGTTCAAGCCTTGTACTCAGCAGTGCAAAGAGTCGACCCCTTGAAGTCGAAGCAGCAGCTGGACTTGGAGCGGGCCCGTTTCCTGGTTACGCAGGCTTTTGACGAAGACGAGAAAGGCAACAGCGAGGAAGCGATAGAGCTGTACACGGAAGCCGTGGAACTCTGCCTGAAAACGGCCAATGAAACTTCAGAAACAGCTCTCCAGGCAAAACTGAAGCAGCTGGCTCGGCAGGCACTGGACAGAGCTGAAGCGCTGAAGGATTCAAAGCCATCTCAGAAAGACAAGCCGGTCCCAGCGAAACCAAATCAGCAAGCCCGGACTTACTTTCCATTAGGGCCTGATTTTTCCTTGAACGATAAGCCACAGGCAGTCAGAGCTGTGCAGGCCAGTGAACCTCAAGGTCAGCGATACACCGCAGAGGAGATTGAGGTGCTCAGGAAGACGTCAAAGATCAATGGCATTGAGTACGTCCCTTTCATGAGCGTTGACCTCAGAGAGCGTTTCGCTTTTCCAGTACCTTTCTCAGATAGATGTGGCAAGCTGCCGTTGTCTCCCAAGCAGAAAGCAATGTTTTCCCGCTGGGTGCGTCCCGATGAGATAACAAACAGCCCCACCATGATCTACACAGTGTCGAGCTTCAGCATAAAACAGACAATCGTGTCAGATTGTTCCTTCGTAGCTTCTCTTGCTATCAGTGCGGCATACGAAAGACGATACAACAAGAAGCTGATTACCAGCATTATTTATCCGCAGAATAAAAAAGGAGAGCCGGAATATAATCCGTGTGGAAAATACATGGTTAAGCTGCATATCAATGGGGTTCCTCGGAAGGTGATAATCGATGACTTCCTACCAGTGGATCACAGCGGAGAACTTCTCTGCTCTTACTCCAACAATAAAAGCGAACTCTGGGTTTCCTTGATAGAGAAAGCTTACATGAAGGTCATGGGAGGTTATGATTTTCCAGGATCAAATTCTAATATTGATCTCCATGCGTTGACTGGCTGGATACCTGAAAGGATTGCCATGCACTCAGGCAACCAATCGTTCGACAAAGACAGTTCCTTCAGGATGCTTTACCAAAGATTTCGCAAAGGGGACGTGCTCATTACAACGGCGACGGGAGTGATGACTGAGGAGGAAGGAGAAAGGTGGGGTTTAGTACCAACCCATGCCTACGCTGTTTTGGATATCAGAGAATACAAGGGGCTTCGATTCCTCCAGCTGAAAAATCCCTGGAGCCACCTCCGCTGGAAGGGAAGATACAGTGAAAATGATATGAAGAACTGGACCCCGGAACTTCAGAAATACTTGAATTTTGATCCCAGAACGGCCCAGAAAATAGACAACGGGATTTTCTGGATTGCCTGGGAAGATCTGTGCAAGTATTACGATGTTATATACTTGAGCTGGAACCCAAGTCTTTTTAAAGAATCAACATGCATTCACAGTACCTGGGATGCAAAGCAGGGTCCTGTGAAAGATGCATACAGCCTAGCTAACAACCCACAGTACAAACTGGAGGTTCAGTGCCCACAAGGTGGGGCTGCCGTTTGGATCCTGCTCAGCAGACACATTACGGACAAGGA
TGACTTTGCTCACAACCGGGAGTTCATCACAATGGTGGTATACAAAACAGATGGGAAAAAGGTTTACTATCCTGCCGACCCTCCTCCGTATATCGACGGGATTCGAATCAACAGCCCCCACTATCTCACCAAGATCAAGCTGACCTCTCCGGGAACCCATACGTTTACTCTGGTGGTTTCTCAGTACGAAAAGCAGAACACAATTCACTACACGCTCAGGGTGTATTCAGTGTGCAAGTTTAATTTCTGCAAGATCCCGACACCGTATACCATATCCAAACGGGTAAATGGGCAGTGGAAAGGTCAAAGCGCTGGCGGGTGTGGGAATTTCAGAGAGACCGCCAAGAACAATCCTATTTACCAGTTCCAGTTGGACAAGACCGGCCCCCTCCTCATTGAGCTACGAGGACCAAGGCAATACAGTGTTGGCTTTGAAGTGGTGACCGTCTCTACAGTGGGAGAGCAAGGCTTTCAGAAGAAAAACAGCGGCGATTACAGTGAGCCTGAGGCCAGGGACTGTCTGGGAGAAATATATATTTAAATGGCTGAAATGCTTTTTAATTCTGCAACTTGGATGCTCAAGGGAAGAGTCTACGGTGCACACAATAATATTAAATCCAGAGCTTTGGGTGGTTTTCTTTTTACTATTTATCACTGTGCCACAAATGGGACAAACAATTGTACCCCTTCGCTCTGACTTCCAAGCTTGAATCTTGCCATGTATCAGAGAAAAAAAGAAAACACACACGACAACTGTTTAGTTTT\n>AY736006.1 Aedes aegypti inositol-1 monophosphatase mRNA, complete cds \nGGGGAGTATTATTCAACTCGTAAAGTCATTCAGTCCAGTTTTTCTAATCATTATTTGAAACATCCGAAGCTCCCTCGATAATTGAAAGCAAATAGCCGAAATGTCGCTCGATTTGGACGAATGTTACGAGCATGTCCTCGGATTGGTAGAACAAGCTGGACAGATTATCGCATCGAGGAATTATGGGGAGAAAACGGTGGTGGAAAAGTCCAGCAACATTGATTTGTTAACCGAAACAGATCAGCAAGTCGAGCGACTTCTGATGGATGGTATAACTGAGAAATATCCCGATCACAAGTTCATTGGTGAGGAAGAAACCAGTGCCGGGAAGAAGGCAGAGCTGTCCGATAACCCTACCTGGATTATCGATCCAGTGGATGGCACCATGAATTTCGTTCACAGTTTTCCCCATTCATGCATTTCGATTGCGTTGCTGGTCAATAAGCAAGCCGAAATTGGAATCATCTACAATCCGATGCTGAACCAGAAATTTACGGCTCGCCGAGGCAAGGGCGCATTCATGAATGAGAAAGCGATTCGGGTTTCGGGAGAAACTCGACTGGAGCATGCTTTGGCAACGACCGAGTTCGGCACTAGTCGTGACGAGGAGAGGACGGCTATCGTTTTGGAGAACATTGGGAAACTGATTCGAGTTGTTCACGGGATGCGAAGCTTGGGATCTGCTGCCCTAAACATGGCCATGGTTTGCCCTGGGGTGGAGCTGATTTTCAACTATGAAGTGCGGGTATCCACGCCCTGGGGATATTGCCTGCGGGGGGAATTTGATTTGTCCCGGGAAAGCAGGCCGGGTGTCTGTCTGGATCCAGCTTGGAGGACCTCCTGGATCTGATGTTCTCCCCCCCGGGTGGCTGTGTGCCAGTTTCGCCAGAGCTTTGGCCGGAATAAAGGTGGTTCCATTTGGGTTGAACGCCAGTACTTTTCCGCCAGCCCAGAAGACTTAGGAAAAAGTTCCCCCGAATGGGTTGGGATAAAGGATTT\n>BC169882.1 Xenopus laevis signal transduction regulatory protein SAP-2, mRNA (cDNA clone MGC:196609 IMAGE:9041516), complete cds\u0001BC170158.1 Xenopus 
laevis signal transduction regulatory protein SAP-2, mRNA (cDNA clone MGC:196885 IMAGE:9093539), complete cds \nTCTGCGGTGTTGCCTGTTTTAGATTTCATGACTCAAATGCTTTAGATAATCATGATGGAAATTATTTCCACTTTATTTTTTCCTATTATTGTTGTAGTCCTGGCAAGAGTCATTTCACTTCAGCCTACGAGTGTCTATTCGTGTGCTTGTGGGATGGTTTAGTAATTAACACGTTTATGTCTCCACCTGTGGGATCCTGTCTCGTCTTTGCTGCATTTACTTTTGAAGAGTTTAAAGGCAGCTTCTTCCTCTCCAGCTTGTCTAGAGGTGCATCTGCCATTGCCACTCTTTCATCACACTGTTCTGCCCGCAATGGAGAAGGTATCCGTTTATCATGGGAACATAAGCCGTGAGATGGGCGAGAAGCTCCTGAGTGATGCCGGGAAAGATGGGAGTTACTTGCTACGGGATAGCGAGACCATGCCGGGAATGTATTGCCTCTGTGTTCTGCACAAAAATTTGGTCTATACATACAGAGTTCATCAGACATCAACTGGTTCCTGGACTGCTGAGGCTGCACCTGGCGTTACAAGAAGGCTGTTCCGGAAGGTGCAAAATTTGATTTCTGCATATGAAAAACCAAACCAGGGAATTGCAACACATCTGCAGCACCCAGTGGAGAGGACGGTGACAAAAATTGTTTAAGGGTGATTAATGGATGGATGCTTAAACAAATGAGTCATTTGCAGATCAATTCATTCGACGCTGCCTTGAAGAGAG\n>XM_040760640.1 Sporothrix brasiliensis 5110 uncharacterized protein (SPBR_02337), partial mRNA \nATGACTCCTCGCCAACCACAGAGCGACAGTGGTCGTGCCTGTACGTCAATTGTCACAGAGTACCACCGCAAAAAGCCGAATCAGGAAGCGCCGTTTTTGATCGAGGTCGAATACTTGAACTCTGCCGGCATAAAGGCCCACTTACAAGAGCTGCTTTGGAACTATCGCCGCATCTACCGTCCGGATATTGACCCAGAGGCATTGGGTGATGCCGAATACAAGCGACTCGAGGCTACATCCAGCACGGCGTGGTCGACTCTACAGACAGCGTTCCGCCATGAACGTGGCTTTAGTTCCTCGTTTGCCCTGAACATGGACGACGGTTCCGACGAGCGCATCCTGGAACAGCTTGTCACATGGGCGGGCCGCATTGAATGGCCACGCGGAAGTGACGAGGGCTTCTGGACAACTACGGCCCTCTCCGTGGACGAGTGTTGTGATGCTACGCGGCCATTCATGGAGGATAAGTTCTGGCCGTTTACCAATCTTATCAGGATATTTCTCAGTGCACGTGTGCTCGACTCCGGTATCATCCTAGCCGACCTCCCCGGACTCCAGGACGTCAACCTGGCTCGAGTCCGTGCGGCCCACGAATACGTTCTGCAATGTGACAGCATTCTTGTCGTGGGCCGCATTGCGCGGGCAATCTCTGATCAGTCTTTGCGGTCATCACTCTACACGTCCCTTGCAAGTCACGCCCCAAACGAGTGGCAGGAACAAGGCGCAGCCCGCCTAAACATCGCCGTTGCACTTTCGCATGCGGAAGACATTAATGTTCGATCTGCACGGCGTGAGATCCAAGACCCAGAAATCAAGGCCAAACTGGATCGCCTCGACATCGAGATAAACAATGCACAAGCCGCAGGTTCCCTTCGAACGGAACAAAATATGAAACTCATGCGAAAGCGACTGTTGGTCGAGGAGAGAAACAAGAACGTCACGAAAGGCTTGCAGGATGCTTATGCCTCCAAGATGATCAACCAAAACAGGCAGTTGCCCGTTTTCTGTATTTCCAACAAGTGGTACGAAAAGTTTACGGCCATTGGAAACACAGAGCTCGTGCGGGAA
AGTCAGATTCCCGCCCTCCGACGACACTGCCAAGCCATCGCAGCGGATGCCCTACTGGGCGAAGCAAGGCACTACTTACGAACAAGTCTTCCCTCTCTCGTCACCTCGCTCGACCTCTGGGTCACAAATTCCATTGCCACGCAGGCTCTGCAGGGAGACGGCCGACACGACCGATCTGATCCCTCCGTAGATCGCGTCCGCCAAGTGGTCCGCGGAATCGACGACGAAAATTTGCTAGGCCCGGAAAGTGACTGGGTCGACAACGTCGAAAGTTGTTTCAACGAGGAAATAATGGAATTTTTCGCCAATAGGGGTGACATATGGAAGGATCAAGCTGTCAACGAAAGCAACAAGTGGACTGTAAAGTCAGGTCCTAACTACTGGCATCAAACCCATTACAATTCATGGTGTCTTCATGATGGCGATTGGAGCACACCAAAGAAGCCACATGTCAACTGGAATGCCGAGTTGATCTGGAAGATGCGGACCGAGCTCGAGCTGCAGTGGGACATTTTCGAAGAGCAAACGCATGACGAGTTCAAGGCCGTACACGAGAACCTTGGTGCAAGCCTCGTTGAGCTGAAGGACGCTATTGGGTCTGCAACTAGCGTCCCAGGGCGTGAAGGACTGGTGCGCTTGATCAACTTCAGCTTGCACGAGTTCAAGCACTCCCTGGACCAAAGAGAGCGACGCTTCCTCGTGACGCTGAGGGCTACGCGCAGCAAGACCAGTGAAGCCACATGCGCGTCGTATATTGTCGAGCACATGCTTCCGGCATACCGCGACGCGTCGCTGGAGTTTGGGACCGGACGGCGTATCAGGCAGGAGACGATCATCGGCTCAAAGGTAAGCAGAGGTGACATATTTCTCAGCATGGGCAGTGCATTGGCGCGTGATATCCAAAGTCTTCTCCGACACACAGAGGAGGAGATCGAGCGCGCCATAGAATCGATGGCTGAACACATTCTGCGGAATGTCAAAATGGCATTTGGGGCCGATGAGACTCCTCACACGTCTGTGCCATCAGCTGCCCTGCGGAATGCCGAATACAACGAGCGCCTGCAGCACTTTTCGAGTATGGTCTCTGTCTGGAGAGAACAGTACTCGCTTTTGTTTGCGAGCGAAGATGGGGCGTTGGACTCTCTGTTGTGA\n>XM_027854401.1 PREDICTED: Vombatus ursinus myo-inositol oxygenase (MIOX), transcript variant X2, mRNA 
\nCTCAGACAGATCACACACAAGCCACGGGTGACACTCTACACACCCCCTTCCCATCCTGTTCACTGCTAGGCCTGTGGTCAAGATGAAGGTTTTAATGGGTCCAGATCCTTCTCAGATTTATCGGCCTGATGGGGGCAAAAATAAAGAGGACTTCCGAAACTACACTTCAGGACCCCTCCTGGATCGAGTCTACACCACCTACAAGCTCATGCACACGCACCAGACCGTGGACTTTGTCAGGAGGAAGCACGAGGAGTTTGGTGCATTCTCCTACAAAAAGATGAGTGTGATGGAGGCCGTGGAGCTGCTGGACGGGCTGGTGGATGAGTCTGACCCCGACGTGGACTTTCCCAATTCATTCCATGCATTTCAGACGGCTGAGGGCATCCGGAAGGCTCACCCTGACAAGGACTGGTTCCACCTCGTGGGGTTGCTGCATGATCTGGGGAAGATCCTTGTCATGGCTGGGGAGCCTCAGGATAATCCTGACACCAAGGACCCTCGATACTGCACTGATTATGGAATGTATGAGCCCCACTGTGGCCTGGAGAACGTACTGATGTCCTGGGGCCATGATGAGTACATGTATCGAATGATGAAGTTCAACAAATTCTCCCTGCCTCCGGAGGCCTTCTACATGATCCGTTTCCATTCCTTCTACCCTTGGCACACCGGTGGCGACTATCGGCACCTCTGCTGCCCCCATGACCTCAGCATGCTGCCCTGGGTGCAAGAATTCAACAAGTTTGATCTCTACACCAAGTCAGAGGACCTGCCAGATGTGTCCATGCTTCGGCCATACTACCAGGGCCTCATTGACAAGTATTGCCCCGGGGTCCTTTGCTGGTAACGGCCTCTGCTCTGGTCTGAGCCAGCTTCTTGGCCCTCATACAGCCGGTCAGACTCACTTGCCTCACCAGGGGCAGCCAGCCCCCTCCCTTGTACACACCAACCTGTCCACAGGCCCCTTTCTCCCCCTTCCTATGAGCTGGGGATTATCAGCCCAGAGACCACCCCGAGCCACTGGCCACCCCCTTAGCTGACCTCTCCATCCCACTAGCAGCAGCATCCATGTCTTCATTATCTCCATACCTCATTGCCAACTCCATCCCCGTTACATCATCATTGCCAGTCAGCAGGTGCCCATCACTTTCCTGCTTACCATTCTCACCATCATTTGCAGCCGTCTGCACCACATGCTCTGGGGGTCCCTGGGCACTGCTCATCTCTCCAACCACACCCGCAGATTCTTAACACTCCTGCCGAGAAATAAAGACCGTACAGAACCCTG\n>XM_044147674.1 PREDICTED: Aphidius gifuensis vesicular integral-membrane protein VIP36 (LOC122849090), transcript variant X1, mRNA 
\nTAGGTTGCTTACGCAGCTCACTTTTTTATCATTATCATGTCATAAATATTAAATATCCATTATATCATTTACCTATTGTGATGTGTCGTTTTACACGAGCTAATCAGCGCTCATTTTTCCATTCGTGACTTGGCAAGATAATTATCGACCTGTGGCCCAATAAATTTGATTAAAAAAATCTTCAAAAATTCATTCAGATCTATAAACAACTAATTTGATTGCGTTTGAGTGGTTTGAAATAAAATTTTGATCACAACCGGTCAAACCATCAAGAGGTGCTTGTTAAATTGATATCAAGATGCATTCATGGTTGTTGTGTGTTGTGATTATTGGATCTGTCAATGCAGAATGGAACACCAAAGATTTTATGAAAAGAGAACACTCTCTTGGCAAGCCATATCAAGGTATGGGAATGTCAGTACCATACTGGGATTTTATGGGCACCACAGTGGTCACAAATGACTACATAAGGCTAACAAGCGATATTCAAAGTCAACAAGGATCACTCTGGAACTCTGTGCCATGTAACCTCAGAAATTGGGAAGCCCATATACATTTTAAAACTCACGGTAAAGGACGTGATTTATTTGGTGATGGTTTTGCAATATGGTATGCATCGGAAAAAATGATGCCAGGTCCTGTTTTTGGTTATAAAGATTATTTTAAAGGTCTTGCTATTATTCTTGATACATATAGTAATCACAATGGCCCACACAATCATCAACATCCATACATATCGGCCATGATTAACAACGGCACATTACATTATGATCATGACAGAGATGGTACACATACTCAGTTGGATGGTTGTGAAGCCAAATTCAGAAATCTTGATCATGATACGTATCTGTCCATCAGATACGAGGGAGACACCTTGACCGTTTCAACTGATATTGAAAATAAAAAGGCTTTCAAAGAATGCTTTTCAGTAAAAGGAATTCAACTACCAACACATTACTACTTTGGTATTACTGCCACAACTGGTGATTTATCGGATAATCATGATATTTTGTCATTTAGATTATATGAACTGGACACACCAGTCGATCCGAATGATATCCAGGATCGTTCCGCAATCGTTCCATCAGCAACATACTTTGATTCTCCACGAGAACACATCGATGATCCAAAGCCATCGTCTATGAGTGGATTTAAGATATTCTTCTTAATGCTTGTTAGTGCAATTGCACTCGTCGCCCTGGTCGTCGTAAGCATTATGGTTTATCAAAAACACCAAGAAAACAGTCGGAAACGTTTCTACTAATAGAAAAAAAATAATAATAGATATTAAGAATCTTCCAAGACGTTATTAGAATAATTCAAGAATCAAAACATTGTACACAATTACATATTTCATAATTTTTTT\n>XM_025922904.1 PREDICTED: Puma concolor solute carrier family 30 member 8 (SLC30A8), transcript variant X2, mRNA 
\nATGGAGTTTCTTGAAAGAACTTATCTTGTGAATGACAAAGCCACTAAGATGTATGCCTTCACCCTAGACAGCGTGGAACTCCAGCAGAAATCCTTGAATAAAAATCAATGTCCTGGAGAGAAGCCAGAGGAGCTGGACTCAGGAGCCATCTATCACTGCCACAGCAACTCCAAGGCCACAGAGAACAGAGCAAACGAGCAAGTCTATGCCAAGTGGAAACTCTGTGCTGCTTCAGGAATATGCTTCGTTTTCATGATTGCAGAGGCCGTGGGTGGGCACATTGCTGGGAGTCTTGCTGTCGTCACAGATGCTGCCCACCTCTTAATTGACCTGACCAGTTTCCTGCTCAGTCTCTTCTCCTTGTGGTTGTCATCAAAGCCCCCTTCGAAGCAGCTGACGTTTGGATGGCACCGGGCAGAGATCCTTGGTGCCCTGCTGTCCATCCTGTGCGTCTGGGTGGTGACGGCTGTGTTGGTGTACCTGGCATGTGAGCGCCTGCTGTACCCTGATTACCAGATCCAGGCGACTGTGATGATCATCATTTCAGGCTGTGCGGTGGCAGCCAATATTATACTAAGTGTGATTCTGCACCAGAGACATGCTGGACACAATCACAAGGAAGTGCAAGCCAATGCCAGTGTCAGAGCAGCCTTTGTGCATGCCCTCGGAGATCTATTTCAGAGCATCAGTGTGTTAACCAGTGCACTTATTATCTACTTTAAGCCAGACTATAAAATGGCTGACCCAATCTGCACATTCGTCTTTTCCATCCTGGTTTTGGCCAGCACCATCACTGTCTTAAAGGACTTCTCCATCTTACTCATGGAAGGTGTGCCAAAGAACCTGAACTACGATGATGTGAAAGAGCTCATCTTAGCGGTGGATGGAGTGGTGTCTGTGCACAGCTTGCACATCTGGTCTCTAGCAATGAACCAAGTGATTCTCTCGGCTCATGTTGCTGCAGCAGCCAGCCGGGACAGCCAGGTTGTTCGAAGAGATATTGTAAAAGTCCTCAACGATAGCTTTACTGTGCACTCACTCACCATTCAGATGGAATCTCCAGCTGACCAGGACCCTGACTGTTTTTTCTGTGAAGAACCCCGGGACTAG\n>XM_025582792.1 Aspergillus brunneoviolaceus CBS 621.78 hypothetical protein (BO95DRAFT_367563), partial mRNA 
\nATGCTCGGTCGACTATTGAATACTGCAGCGGCCACTCTCAATCCGACGGCATACTCCGCGAAGAACCCCCAGCCACTGGAATCGGTCACAGAGGAGGAACATACATCGGGCTTGCTTTATCCTGACGTTAGCCTTCTTCGCCGCTCCAACTCACACGCGTACCCCCTTCATACCGCTTTCAATTCCCCGAATACCTCGACGGCCGGTGGATATGATGATCGTGGTGGCGGCGTCGAATTGGACCACCTGAAGGATTTCCGTGTGATAATCGCCCAGAACGCGCTGGGAGACCGGGATGCCTGCGTGTTACTGGATACCCGGGCCACGCCGCAGGGACAAGGCTCACATGGTCTGGGCTTGGAGCCACAGGTGTTTGAAAATACTGGTACCCGCCATGCCCGCACGCTCTCCACGTTGACTCGCGGCCCGCGGCGGGGTTATCTGCCTCAGTCATCGGTCGTGGAATCAAGCCCGCTGTCTGCGGCCGCAGAGACACGGCGATCCCCGCCCATGTCTTCTGGCGCGTTCATGAGGGCACGGGTTCGTAGCTCTACGCTGGCGCCAGGTGGGAACTTCACCGAAGGTGGCCATTCCCGGGGCACGACGGATGCGAACGATTCCGGGTTGCTGAACTGCATCTTCGGGAGCAGTGCTTTCAGCTACAAGGGTTCCTCCACCAAGATGCATATCATTTCCGCCGATGATGAACCGAGTCAAACCTCGCCAGCCTCGCCGGCGGCACGTAGCTCTCTATCACGAGCATATACTACAGGAAGTTCTACGACGTTTGGCGGTTCTGATCGTGGTAATGAGTCTAAACCGCCTGCCAAGGTCACTATCCTGTTGACAAGGATGTTCAGTGTGCATCTGCCCGAAGGCGGAGATGATGACTCCTCTCCGGACAGGCCTGACTTGTCATCTTCAGTCTCCCACGACGCTCTCCCGAGCCCAGGGTTTCCCTTCCCGGATGTCTCGAAGCGCAAGAAGATCAAGGAGAAGAAAACTCCCATGTATGCGGTCGCTATCACAATCCAGATCCCGCTCTTATCCCGAAATGGTGGGCGGCCGGTTTCTCGGTTTGCGCAAGGTCCAGACTCTCCCAAGCCAGGGCTTTCGTGCTCATTGGACTCGGACTACCGTTGGCGTGGAGGCTTCTTCGAGGACAGTCTGTCCCATGCATCCCCTCCTGCAAGTTTGGATGAGCGTATTGATCTGCTGGTTGATCATTGGGACATCATCAACCGGACGTTGTCCCATTTGGAGAGGCTGTCTCGGAACGAGATCCTGTTCTTACTCAAGAAAGTAGACGCCTCGGCAGGGCCGCATCCGAAACCCGCCAAACCTCCAAACATGCAAAGGACGAATCAGACTTTTGTTCATCTGCCGGTCAATGTTTTGTCCATCAATTCCAAACTCCGCGACGAAGCCATCCGCAGCACTCGTCGCATTAGCACGGCTCTGCAGATGCCGTACGTTGTCACAGGCCAGAGCCGCTGGGGCGTCTGGCGTGAAGAAGGGCGGTCGATAATCCGTAGCCTCGGAGACAAAGACCACAGTTTCTTTTTCCTGGTCTTGGTTACTGCCTTCTTGGGAAACCATACGGAGTGGCTCAATGCTGTGGGCCCGGAGTGGTACCGTCGGCGGCACTACCTACAACAGAAGGCTCAGCAAGACGCCGACCCGATGCTGGCGAATCGCACCGTGATCATCTCACCGGATAAGATGACTGCCAGAAGACTGATTTTCTTGCTGGCGGCGTTTTTGCCGCCCAAACAGCGCTTCGAGCCCCTGCCGTCTCCGATTCGCCCTGGCACTGCGGCGTCGACTCGTGCTGTCTCCCAGAGCCCGCCTAATGTTCCTATCCTACGACAGGAGGCATTGCGGAGGGTGATGGAACGACGGTCTCGTGCGCAGCGCCTCAACCTCAATGAGAGAGAGCAGCACCAGCGTTCTGTGAGTGCTTCATCGAATGAGACGGCCCATCGTTCGGCGGAAGAA
CCCGAGCCCATGATTCCGCCTGATTTTGGTGCGAAGCGCAGGGGCTCAGATGCCCGCTCGATCCGAGCCTTAGGGGTTCCTATCCATACTAGAGACATGCGTCCGAGGAATACCAGTGCAGCCACCACCTCGACCACTACTCCGAGTAGTACCGTCCCCGTCCCGCACTTCGCCTCGCAGAGCCGGTCTGAGCGGATGGGATCGGATCCAAGTGTGGCTGAAGGACGTGACAGCCTGGCGTCGGAAACTCTTCTAAAGAATTTGCGGCGGTCCGAAACCTCGGCAACCTGTGCCAATGGCCAGATGCCTCCCGCGAGTGGCCGCTGGGGCACATTGTTCTCTGGCTTATGGAGCTCTCGTCAGGAGTCATCAGACGCTGGTGACGCCCCTGCGCCATCTGAAGCGCGCAAGCGATCGGTATCTGCTTATACGAACCCAGCCAGAAGGAACCCTCCGACACTTGCCCAGATGGTCAAAGAAGCATCAGAGGAACCCATGCCGGCGGCACCCAAAGCTACTACGAGCGGCAACATCTCTATCCCTCCGGCGACAAACAGTCATATCTCATTCGAGGAGGACGCACCGGATTTCTCGTCGACCACGGACCAGACCAGGGAGTCATCCTTGAGGATGGCCGTTCGTGGAGATGACGGCGTGGTGGATGTGGACCTGCCGCTCCCAGGGTTCCTGTCGCTTTCGTCGTCTGGGGACTCCACGCTGGCTTCTCCCAAGAAGACCCGCACCTCGGTTACTAGTATGGATGCAATGGCATCTACGCAGAGCAGTGTCTCCGGGTTCCACGGCAGTCTCAAGGACAATGATGGACCTAACACCAACGTCGCTGGCTGGCTGCGAACTTTCCATGACGATTTTCTCCTGCAGGCCGTGAGACCATACGCTTCGCTGGAAGCCGATATCAAGCGCGCCATGCAAGCCGAGCCTACACCAAGCCAAGCTCTGTGTCTCAACGCTGATGGTTCCGAACGATGGGTGGATGTTGCGACCACCGTGATTGCGGATGTCCGGAACTTCACCGTGAAGCGACTGCGACTGAGACGTAAACTTGTGGGACATGGGTCGTCGCGCAAGGCGTATACGCCGTCTTTCCCGTCGCAGCCCGGCACTCCGCGGTACGTGTCCAACGGGTCTGTCTCGGCCTCGCAGCTCACCAGCTTCTTCTCGCACGCCACTGGGTCGAGCAAGACATCGAACAATTCCTCCATGGACGATTTCTATCCTACCGAGGTTGAAGAACGGTTCGTGGAAGAGCCCGTGATGGATCTGGATGGCACTCTTGTCGATGCTCTTGAACGGGTGCTTGCACAGAGTGGACCGTCGTCCATGGTGCACTCTCGCGCGCCGTCGCCATCCCGTGGTCGTCGCGGAGAGGATAAGCAGGCATCGGATGCCCCCGTGCCCACACGGGAAGAAATCCGACCTGTCGAGGTGCCTCGGACTGAGTGTCGCAAGCTGGTCCTCGGGGCGCTGGAAGAGGTGGTGCGCAGTGTGACGGCGGAGCATTGCCGCGAGGATGTTGACGGGGAGCTCGGCCTAGCAGATCGCGAGCGCAAGCGTACGTTGGCCGGGGCGGATAATACGCTGCGCGAGGGAGTTCGCAAGTGGCTTCTCGATGTTGAGGAGGCGTGGTAG\n>XM_046049963.1 PREDICTED: Micropterus dolomieu ArfGAP with GTPase domain, ankyrin repeat and PH domain 1 (agap1), transcript variant X1, mRNA 
\nGCGGAGGAGGGAATGGGACCGAGCCCAGCGTCGCTGTCAGGGAGGGTAAAGCTATCGGAGCAGAGGAGGGGAGGGCAGGCCCGGGTCCAGGGCTGTAAATCCAGGGACATTTGAATCACAATTGAATCCGGTCTGAGGTGAAAGAGGCTCGGCTGGCTGGCTGGCTGCGCTGCGCTGCGGGGGATGTGCGCACACAATGGGAGACGACGCGCTGGCTCCGTCCGGGACGCGGCGGCAGAATAAAATTCACCTCTCTGTTTGTTTGTAATGGAGACGCGGACACCGGAGCAGGATCCAGAGACGTCAGCGGGACACACGGCGGAGGACTCCCGGGGGTAAGGACTTGTGTGAAAGTGTTTCTTCATGCCGGGACGGAGCGCTGCTGCGAGCCCGGAGAGAGGAGCTTGGGACGCGCCTGCTGCCTGTTTGTCTCGTTTGCTGCCAGTTTAAATTCCGCTGGGATGAACACGGAATGTATTTCCTGCGTCAAAGTCCGCGCTGTTTGCACATCTGGATAAGGGGAGAGTCGGTTATTGCCCCGTAGCGTCCCCCCCCCGGTGCGGTTGAACCCGTTTGTGGAGAAACGTTTCAAGTCAATTGACCACTTCCATGTTTTAGACCCTCAGACTGCAGAGCTCAGTGTGAGCAAAACAACAGAAACCCTCTTTTTAGTTTAATAAAGACATCATAAAGGAGACGACAGGATCATTTGAGTGATTTTTCTAATGCAATAAAGCCTCGTTAGAGTTTCTGTTGGCTGCTGCAGACTTTAGATCAGAGCTGAAGAGGAGCTCTTTCATCAGGGATGTACCTTCTGGACAGTAACTGCACTGAAAGGATGGAGAGGGGCACGCCTCAGAGGAAAACTGTCTACCGCATCTCGCTCACCTTGGTGAAGAGGGAGAGTTTAGATGGTGAGGATGAAGGCTCAGGCCCCCGGCGGGCGGAGAACCCCAAGGTGGGCACCATCCGGCGGGAGAGCTCGGTGGAGATCCAGCGTGGCGGCCTGCTGGAGCAGCTGAAGGAGGTGGAGGACGAGTCGGACGACTTGTCGTCGTCCCGGGGCTACATGAGGAACTTCAGGACGTTCAGCACGGGGCAGCTGGAGCTGGGGAGGCTGAAAATCTCCAGGAAACAGCAGCTACAGAAAGAGCCGAAGCAGAAGGCCTCCAGCCCGGTGGCAGAGCACGCCGCGGAGGCCCCTGAGAAGATGTCGGCACAGAGTCAGGAGCACACTCGGGGGGAGAGCAGAGAGCAGGAAGCGGAGGACTCAGACAGACTTAAAGAGGAAATCTGCTCTGAAACTCACAAACAAACAGACGCTGCCGTGGAGACGAGCGGCGTGAAGAAGAAGAAGAGGCTGGTGAAGGCTCAGAGCATGGAGGAGAGGAGCTCCGACCCTCCTCTGAACGGTGATGGGTCTCACTCCAAGAGCAACGGCAAAGCAGCCAAAGCTCCCTCCCCTGAGACGCCCCCTCTGAAGCGGCCGCCCGGCCTGCTGCGCCGCAGCTTCAGCTTCAGACACTGGAGCGGCGGCGAGCTGCTGCGTCTGCGAGCGCTCTCCAAAGACAAACACCACAGCAGCTCCAGCTGCATCGGGCGTGACGCCGGGCCGGGCGGCGGCGAGAAGGAAGCGGAGGCTCCTGTCGCGCTCCCGGCTTCCCGCCTCGCCGACCCCACCAGAGTGAAGAGCAGGACTCTGGAGGTCGGCGCCGTCCTGAACAAGACGGACTCCATGTCTGAGCTGAGCCGCTGGGAGAGAGCGCGGGGCAACAAGAACCGGACGCTGGACAACAGCGACCTGCAGCGGCTGGCGGCTGAGAGGGACGGGTCAGGAGGGGGGTTCCTGCTGAGGGGAGGGGGAGGTCGCTCCAGCGAGAGGCGTCTGGTTCGCTTCTTCAGCGGGATCTTCTCCAGGAGGGACGGGGCAGCCACCTCGACCCCGGTGGGAAGCCCCAGCAGCCTCCCGCGGAGCAAGAGGAGGGTTCTGTCCCAGTC
CAGCACCGAGAGCATGAACGGAGGAAGCTCTGAAGATGCGTTTGTGAACAGTCAGGAGTGGACGCTGAGTCGATCGGTACCAGAGCTGAAAGTGGGCATTGTGGGTAACCTGGCCAGTGGTAAGTCGGCGCTGGTCCACAGGTACCTGACAGGAACGTACGTCCAGGAAGAGTCCCCTGAAGGCGGACGCTTTAAGAAGGAGATCGTGGTCGACGGTCAGAGTCACCTGCTGCTCATCAGGGATGAAGGGGGCCCCCCGGAGGCTCAGTTTGCGTTGTGGGTCGACGCCGTGATCTTCGTCTTCAGTCTGGAGGATGAGATCAGCTTCCAGACCGTTTATCACTACTTCAGCCGCCTCGCCAACTACAGGAACACCGCCGACCTGCCGCTGGTCCTGGTCGGCACGCAAGACGCCATCAGCTCAGCCAACCCGAGGGTGATCGACGACAGCCGAGCCAGAAAGCTCTCCAACGACCTCAAACGCTGCACCTACTACGAAACCTGCGCCACCTACGGCCTCAACGTGGAGCGGGTCTTCCAGGACGTCGCCCAGAAGATCGTGGCTACCAGGAAGAAGCAGCAGTTGTCCATCGGGCCGTGCAAGTCGCTCCCCAACTCGCCGAGTCACACGTCCGTCTGCGCCACACAAGTGTCAGCCGTCCACATCAGCCAGACGAGTAACGGCGGCGGCAGTTTGAGCGACTACTCGTCGTCGGTGCCGTCCACGCCCAGCACTAGCCAGAAGGAGCTCCGCATCGACGTGCCGCAGACCACCAACACGCCAACGCCCGTCCGAAAGCAGTCCAAACGCCGCTCCAACCTCTTCACCTCGAGGAAGGCGAGCGAGTCGGACAAGGACAAGAAAGGCCTGGAGGCTCGAGCCGACAGCATCGGCAGCGGGCGAGCCATCCCCATCAAACAGGGCATGCTGCTGAAGAGAAGCGGTAAATCCCTCAACAAGGAGTGGAAGAAGAAGTACGTGACGCTGTGTGACAACGGACTGCTCACCTACCACCCCAGCCTGCATGACTACATGCAGAACGTCCACGGTAAGGAGATCGACCTGCTGAGGACCACGGTGAAGGTCCCGGGGAAGAGGCCGCCTCGCGCCGTGTCCACCTGCGCGCCCGTGCAGAGTCCCAAAACCAACGGCCTGACGAAGGACATGAGCAGCATGCAGCTCGGACAGACTCCAGGTTCGGTGAGCAGCAGCTCGTCGGTGTCTCAGATGGCGAGCGGCGTCAGCTTGGTGTCCTTTAACAGCCGAGGTCTGGAGGGGATGCACCAGCGCTCCTACTCCGTCTCCAGCGCCGACCAGTGGACCGACGCCACCGTCATCGCCAACTCCGGAGTCAGCACGGATACCGGCCTCGGAGACTCGGTCTGCTCCAGTCCCAGTATCTCCAGCACCACCAGTCCGAAGATGGAGCCGCCGCCATCGCCGCACGCCAACCGCAAGAAGCACCGGCGGAAGAAGAGCACCAGCAACTTCAAAGCCGACGGCCTCTCTGGTACTGCGGAAGAACAAGAGGAGAACTTTGAGTTCACCATCGTGTCGTTGACGGGGCAGACGTGGCATTTCGAAGCCACTTCGTACGAGGAGCGAGACGCCTGGGTGCAGGTCATCGAGAGCCAGATCCTGGCCAGCCTGCAGTCCTGTGAGAGCAGCAAGAACAAGTCTCGTCTGACCAGCCAGACGGAGGCCATGGCTCTGCAGTCCATCAGGAGTATTCGAGGAAACGGCCGCTGTGCCGACTGTGAAGCCCAGAACCCGGACTGGGCGAGTCTGAACCTCGGGGCCCTGATCTGCATCGAGTGCTCGGGCATCCACAGGAACCTGGGCACCCACCTCTCCAGGGTTCGCTCTCTGGACCTGGACGAGTGGCCGCTGGAGCTCATCAAGGTCATGTCGGCCATCGGCAACGAGCTCGCCAACAGCGTGTGGGAGGCCAACGCGCAGGGACGCCTCAAACCTGGGCCGGACGCCAGCAGGGAGGAGA
GGGAGCGCTGGATCCGGGCGAAATACGAGCAGCGTCTGTTCCTGGCGTCGCTGCCCGGCACCGACCTGTCTCTGGGCCAGCAGCTGCTGAGGGCGACGGCCGAGGAGGACCTTCGCTCCGTCGTCCTGCTGCTCGCCCACGGGTCACGACAGCAGGTCAACGAGACCTGCGGAGAAGGAGACGGACGCAACTCGCTGCACCTGGCCAGCCGCAAGGGCAACGTGGTCATCACGCAGCTCCTCATCTGGTACGGCGTGGATCTGATGGCGAGGGACACCCACGGCAACAGTGCGATGGCATACGCTCGGCAGGCCAACAGTCAGGAGTGCGTGGACACGCTGACTCAGTACGGCTGCCCCGACGAGCGGTTCCCGCTCATGGCCACGCCCAACCTGTCGCGCCGCAACATCAACCGCAACAACAGCTGCAGCAGCGCCGGGAGCGCCGCGCTCATATGACGAGGGCATGTCACCGTCTGACTCTTTATGACAAACAAACAAACAAACGCCGATTTGGGAGAATCCTGACCGTTTATTTTGGGAACCACTACCTGTTGCGACTCTAAGCCCCGCCCACCTCACCTGAGAGCCACCACTGCCGCTGTCGGCTCGTTAAGACTGATTAGAGCTTATCACGGGTCAGTGGTGGCGCTGTTTGTTTGGGAGAACCCTCAACGGGTGGGGAAACCCTAAAACACGGTGGGAAATGTGGTCCACAGTCGCCGATGGCTCATCAGAGCTCTTTGGGAAATAATCACGTGACTTATGACAGCCAATGACGGCCAGTCTGAAAGCTCTAGGGAAATCATACCTCATCACACAGCTATACTTTAACGCTACGCGACCAGCTCCCGCGCAACCTCGCCACGCATCATCCGGCCAATCAAAATCTGTCTAGCCAAAACATATGGTCACAACATAAGGAAGCAAACTGTGAGACAAAAATATCAGGAGGGGGGGGGGGCGGTCTTCATAGCATGCTCACACACAGGAAGCCATCTGAACTGCACATCATCTTCATCATCTTCACCAGTCGAGGACTCCTCTCTGTTGGATCCCTGCAGCTTTTCTCCTCCTCCCACCTGTACTTTTTATTATTTTATGAATTATGTGAACCCTCCTGCCTTTACACCTTCTTTTTTTTTTAAATGTGAACAATATCTCGATGTAAAACTTTAAGAGGAAAAAAAAAGATATCAGATCTTAGAGGTGAAAAAGAAGTGTGGTAGATCGCATGTCCTAGACACTTTTTGCTATTTTAATTTAAGGATTTTTTTTTTCCTTCTCCTGGATTGTGTATATTGTATCTCGATGTGCATTGCTGGACCAATCGTTTAATAATGTCAACACGGTAAGGGGATTTATTTAGTTTGTTTCCGGGTGTATAAAGTCGTTAAGTGTACAGAAGCTCTTGCCAGGCTCAGGGACCGGAGACTCTTGATCATGAACACCCCATCGTCTTTTCCCAGAGTCCTTAACCCAGCGTTCAGAGCGTTTCATTTGTTTTCACTTCACTCAGCTCAGAATCTAACAAAATTTATACTAACGTTATAAGGGAATAATACTTTCTAGATCGTTCCTCAGCTATTCTTGAGCTGGACGATATGATTTAAGATCCATGTCATGATGTATTGTCACATTTCTTCCTTGAACAATAATAAATATAACGATTTGTATGTTTTGGGGTTACAAATAATAATGTTTTTCAGTCATCAAACAATCTGCTGATTATTTTCTTTAGTTTTCCCCATAAAATGTCGGAAGATCTTCTAGTTCGTCTTTTTGTTAGACCGCCAGCCCAAAACCCAAGACCCCAGAAACTAAATATGTACTAAACTGTTCTTGTTCTTCTTCACATGTTGGATTTTTAATACTTTTCTGAACTGAGTGAACTGTGAGCATCTTAAACCCGAGCCTGATTTTACATCCTGGTCAAATAACATTTCATTTAAAGTGTCCCTGAAGTGAATTTAATTGTTTTAACTTGTAAAAAAGAAAAAA
TGGAATAGACAAGGAAGCAGCTAAGAAACTAACGGAGCGAAAAGGGAATTGATCTGCTTCTCCTTGTTCAGGTGTTTTTGTTAAATCTGTGAGTTCAGTTCACAGAATCTGCTGTCAGCTCAGACACATCACGGTGGTGATGAGAGGGAGGAAACTTTTTTCTTTGTTTCATTTCAGCTGGTAGAAAACTTTTCCTTTTAACAGGCGTAAACGCTCAGTAGAATGAAAAGAGTCAGTGAACGTAACACAAGTTCAAAGTTTCATGGCCACAAAATAGTGTTTCTGTGTATAAAAATCCGTTTGTAATGCTAGAGAGCCAACGCCCTCCAGTCCTGTCCCGTCCAATCAAACAGTCTCCCCGATCTGCTCAGCGAATCACTAAGAAGGGCTTCTTCTTCTCTGGTCTTGTTGTAAATAAACTTCTCTTTCTCTGTCACTCTCTCTCTTTTAACGGTGACGCCATGTAAATTAGAGAGCACAGGAAGTACTTACTGGATGTCGGGTTGCAGAGTGGAAGTGAAATATTAGAATGTGTGTTTGTTTGGGGGGGAAAAACGATATCAGCATGGACTGAATGTTGCGTGTTTTGGCTCAGTGTTGCGCTGATCCATCCAAGGCAGGAAGTTAAACTTTTGCGGCTCACTAGGCGTCTGAACCAATGGTTCCCAACCTGGAAATGTTTGCAGAACTACGATTCCAGTCCGAAGGGTCGCAAGAAGGTTTACAGGATGAGAAATAAAAAAATTTAACATTTACATGGTACAAAGAGGGCTAGAGTCAAGGCGACTAAAGGCCAGTCCAAGACTATTCCAAGTCTGCGCAGTTTTCAGAACGAATCAAGACCGTGTCCAAATGCAAAAAGTGTTCTGTTGAGACAAAGTCCTAGTGTGGTCAAGGTTGAGTCCAGATGTCTGAAATGTGGTCAAGACAAAGAATAAATGGACTTCAGTCCAAATGCGGTCTATTGTTCTGTCGAGACCAAGTCCCAATGTGGTCAAGGTTGGGTCCAGACGGCCGACATGTGGTCAAGAATGAGTCGACCCGACACCAAATATGGTCACGGTTTGAGACGAGACCAAGTCCCAATGTAGTCAAATTTGGGTCCAGGCGGCAGACATGTCGTCAAGAAAAGATCAACTTGAGTCCAAATTAATCAAGTTTGGGTCAATACCATGAGGCCTAAGAAAGCAAACTATTGAAACCAAAACAGTGCCAACTGGGTATTCGCCATACTGTTGTCTCACTTACAGTACAGTCATTTGGAAAATAAGCTTTACCTGGACTTTATTGGCCGAAGCTGGTGGCTGTGCCTGAGACAGAAGTCCACGATGAAACTGGACTCTAGTAAAGTCCACAAACATGCCTACAGTCTTTGCTTGCTTTCCTTTTGCTTAGTCATCCTAGTCATAACTCCTGCAATGATGAGCGGGGATGAAGTCAGTGGCGTGGACTACTGATGCAAACACGGTTCTGTTTACATCGGGTGTTGGCGTACGTAGATGTGAGAACTCGCGTAGTCGGTGGATACAGTCCACATGGTCATAGCTTTTGGACTAAACCCTTGGAATTTAAGTCGTTGGACATTCAAAGCTACTTAGATGCATAAAGGATGGTAAGGTTGGGATCCACTGGTCTAAAGATGCGCTGGTAATTTTAAGCCGTCACACAAGATTGTAAAGAAACACACCTTTCTCACCCTGATGACGACGACGTAGATTTGACTGAGCGTTGATTTCTTTCGTCGACTGAACGCTAATCGATCGTCGGGATAAAAAGCTGCTTAACCTCGACATTTGTGTGTGATGATTTTCACCTTCAACACTATGCTGAGCATCACCTGCTCGTCTCTTAGTCTTTGCTCTCTCTGCTGTTTTCGTGCTCAAATTGTAACGTAAAGGTTGAGAAGCAGCTCTCAAACCGACTGTGTATCCAAGCAATATTCATAAACTCATCAGTCACCGTCACATGGTGACTTCACACGCTGACGTTGCTGCAATATT
CCCGTTAAACCACAAACACACTCATGTTTGTAGACTTGTAAGAAACAGTGAAAAGATGAAGTCATCATGAACTGAAAATATTTTCTCCTTCTGCCTTTTTGTTTTAAACGTCTGCCTTTACGTTCCTAATTTCGTCCGACCTTGTAATTGTACGTGCCACGCCCGTTTGCCCTCCCAGTCATCTCAAAGATGGCATTTTATCTTGCATAAATACTAAACCAAGGGGTTTGACCGCAACTTGTGTTTTCAAACTGTTTATTTTATGTTTATATCCGACTCTGTCCTAACTCTACCCATGACAGCAGGACAGGGCAAAGACGTCCTTTTATTTATGACAGAAATGCACTAAATCTGATTCAGTCTGTCTTAAGCTCAACACTTGCCACTACAGCTTTCTTTTATTCTCATATTGGCACTAACTGACGTTTGCTTATTTCTCTAAGCGGTGGCGGCTTCTGGCGGTGTCCTCTGACCTGATTGGTGCTCTCATTTTAACGGCATCTAAATTCTGAGCAACTTGGGAATCCAGAATCCATTTATTTAAGTTCACATGAGGGGAGAAAGCTCAGTAAAATCTGCTTTTAAATGACTATAGGCACCAAAATAATCCGTTGCAGGGTCAATGATAGCGCTGACCGCTAGCGGTGAACAAGCTAGCAACAAGTGTTTTCATTCTAAGGCTAAACCAAGCATGAAAAGTTGGGAAATGTCTAGATTATAGAAACATTGTGTTGGACAAGTCCGCAAAGTCAGTTTATTTAAGTTGTATGGCGCAGGAGAAGTTCTGTAAGGTTCTAACGTTAACCCTTGTTGCAGCTAGTGGTGAGCACTTTAGCATGGCAGCATTGTTTCAGCTTGCAAGCAGTTTCTACTACTACCAGTAAAAATCAAAATCAAGCTGCAGTTATCTAAACACGGCTAATGGAGAGAAGCAGGGCTGTGTACGGCCCAAGTCTGTTTATTTAATCTCAGAATAAACTCTGTAATGGCTGCTTTTAACTGTTTGAATCATCTATCGCTGAAGCTAACTGTAGCTAGCGGTAAACAAACCAGCATGGGCAGCATTGTTTCGGCTTGCAAGCAAACTATAAATGACTTAAAATTGGAAAATGTTTAGAGAATGGAAATGTCTTGTGAATCTCCAGCCCCAGCTAATGATCAGTTAGCTAAACCCAGCTAATGAAAACTGCTTGACACCGACTCTTTTCAGAACAGTTTTGTTTGTTTGTTAATGCATTAGCTGACACTTGAATCCAAAATCTGATGATTTAATCCCATTGCAGCAAAGAAAGCTCAGTAATATCTATTTGTAGTCACAGAAACTGCTGAGTCTGATCTGAAGCTAATTGCCGCTAGCGCTGAATACGTTAGCATGGTTATTTTCAACTTTATCTAAGCGAACTTTACTACCCGTCTTTCTTATTCTTAAAACTAAACATGAACAGTTGGAACATGTTTAGAGACTAGAAACATCCTGTGAATCTCCAGTTGCAGCTAGCAATCAGCTAGTTAATCTCCGCTAACGGAGCGAGGCGAGGCGCAATATATTCTCTAGTGGCGTTAGCACAGATATAACAAGATTCACGCTGCAAACAAGTGAAGCTGCCTGCTTGTAAATGAATCACGTCTGCTTTGAAAGATCCGGTGAACGAAGAAACCGCGCTAATATTGCAGCTCTGCGCCACCTCACCTGTACATAGACTTCAAACTAAAAAACGACTCAGTATGATCAACGTTTGGTTTGTCTGGTTGTGTTATCTCTTGTAGCCTTTACCCCTAAGCTCCACCCACCAGGGCTGTCCTCCACATTATTTATAAACGAACCCCGTGAGGAAGACTCCGCCCCCTCAAACCTACGTTTTTGTATATTTTTCTCCGACTTCTCCACTTTTATTATAATTGTTATAATTTCATCCAGATGCATTATTGTTCTTATTGTCATTGTTATTCTAATTATTATTATTATTGTTATTGACTTTTTGTTGGCTGTACAGTACCGT
TGTTGAAAAATTTTACTTAATACAGAGTCTTCTACTGTAATGTGTCTCTTTTCAATAAAGACAAGAATAATGCTTCTTAATATAA\n>XR_002412069.1 PREDICTED: Columba livia uncharacterized LOC110358026 (LOC110358026), transcript variant X1, ncRNA \nGGAGGTGTAGGGGCTTACCATACTGTTCATGACAAGATTGAAAAGTATCTGAATGAGATCCAGAACAGCCAGCACACTGCACTGAGTTGCCAAAACTGAGTATATATATATCACAGAACCACGTTGAATTAGTCAGTGGGAACACTGAGGACTTGAGTGCTGAGAGCGACCTCCAGGCACCTTTGCCTGTGACAGATCAGGACTGTGGCCACATATTCCTCCTTGCCACGCTGGTCTGGCTGACTCAGGGAGACATTTACACCAATAGTTGATCCACTCACCTGTGATATTTTCAGCTGATTGACTCAACTGACATGCAGCATATTGTCCTCGAGGAATGACAGCTCAGGAATGCACGAGCCTTGTTCTCCTCCTGCAGCACATCTTCCCCGGTCAGCTGTGTCCCACCTCCAGCCTCACCTCTGCAGCAGCTCCTCTGGTGAGTCCAGCGTGATGGGGACTGACTGTATCATGGGCACATAATGGAAAATTAAGGCAGAAATAAGACTACGAGCACAGGATTACGAGCTCCCTAAGGTGGACACGAAGATTTACAAAGACAATATGTCATTTGGATTTTTCTGATAGAAACGTTTAACAAAAGAATATTCTTTCTAATGGCAATTTTCAATGAGATCCCACTTTCCTGTGGGGGTCTTGTGTGTAAAATTTTTACTATTTCCTTGATATTATTTAGCTTTGCAGCTAATCCATTATACAAAAGGAAATAAGAAAAGAGGGTAAGAAATGCCTTCTTCTGCAATGACATGGTTCTATGTTGATTTTTACATTCCAGGTAGGATAGCTACATAAGGACAGACAGG\n>XM_006834443.1 PREDICTED: Chrysochloris asiatica PDZ and LIM domain 3 (PDLIM3), transcript variant X3, mRNA \nATGCCCCAGAACGTGATCCTGCCGGGTCCAGCGCCCTGGGGATTTAGACTCTCAGGAGGTATAGACTTCAACCAGCCGTTGATCATCACCAGGATTACTCCAGGAAGCAAGGCTGAGGCTGCCCACCTGTGTCCTGGAGATGTCATCCTGGCAATTGACGGCTATGATACAGAATCCATGACTCATGCAGACGCGCAGGACAGGATTAAAGCAGCGGCACACCAGCTGTGTCTCAAAATTGACAGGGCGGAAACTCGCTTATGGTCACCACAGGTATCTGAAGATGGGAAAGCTCATCCTTTCAAAGTCAACTTAGAGTCAGAACCACAGGATGTGAACTACTTTGAACACAAGCACAATATTCGGCCCAAACCTTTCATAATCCCAAGCCGAAGCAGTGACCCGGTAGCCTCGGTGCCCCCACAGTCAGATGTGTACCGGATGCTCCACGACAGTCGGGATGAGCCTACTCAGCCTCGCCAATCAGGCTCCTTTCGAGTGCTCCAGGAGTTAGTTAACGATGGCCCTGATGACCGTCCTGCTGGAACTCGCAGTGTGAGGGCTCCAGTTACAAAAGTCCATGGCAGTGCTGGTGGCGCACCAAAGATGCCGTTCTGTGACAAATGTGGCAGTGGCATTGTTGGTGCTGTTGTGAAGGCACGGGATAAGTTCCGGCACCCGGAATGCTTCGTGTGTGCTGACTGCAACCTCAACCTCAAACAAAAGGGCTACTTCTTCTTAGAGGGAGAGCTGTACTGCGAAACTCACGCACGAGCCCGCACGAGGCCTCCAGAGGGCTATGACACAGTTACTCTCTATCCTAAAGCTTAA\n>XM_020957015.1 
PREDICTED: Drosophila serrata uncharacterized LOC110187620 (LOC110187620), transcript variant X4, mRNA \nCTATTCAAAAGTGAAATTCTAACATTTTTATTCAAACAAAATTTTAAGTTGAAAATAGCAAAAAATGCGTGGTATTCTTGGCTGCTTGCTAACTTACCGCATGGAACCGCGTCTTTTGCAGATATCACGTTGTTTCAGCTACCATGCTCCGCATTTCCGTCCGCGTAGTGTGCTCGGTGCCAACAAGCTTTTCGAGCTAGCCAGCTCCACTTCCCCCGGTTGCCAGGCGACAAAGATTACAATATCGACGAGTTCCGGTCAAATTCGGGTACAGAGGTACTCGCAGACGACCTCCAATGTCTTTAACATCACCGAAAATGTGGACATGCTGCGCAAGCGGATTAGCTTTACTGGTGCACCCAACACTACTGCTCAGATCCTGCCCATTGGATTAATCACACCAGAAGCTGGTGGCGAGAAGGACCTTAAGATCGTGATTGTTCCTTTAAACTTGGCTGGCATGGATGCCAACGCCCTGAAGGAGACGCTTGAGGCCATTAACCAACTGCGCATGTACGCGCACCATATCGAGGCCTTTTCCAGCAGTATGGTCGACGACTACAATGCCTTGAATGAGGCCTTCCAGGAGGTTGAAGCGAAGAAGGAACAAGAAGCAAAACCGGAGGTTACCGCCGAAGATAATGCAGTCTGGGAGGACTTTGCCACACCCGATGCCACAGCCGATGCCGTGGCCACTCCAGCGGTCGATCTGCCCCTTCAGACCGACACGCCATTGCAGCGCCAGGAGGCGGTTAGCTTCCTAATTGATACCTTGACTAATGCCACTCCAGCAGCTGCCCCCCCGCCGCTGAAGACCACCAAAACTATATCGGCCGTGGCTCAGCCCAATCCGGAACCACCTAGCCCAGCCTCGACCATGGAAACCGACCTTCAAGCAGCTATTCAGGGGGGCGATGCCATTGATGAGGTTCAAGTGGATGTTCCACAGGACCTAAGTGATCGCCTCAACTGTATGGCCGTCTCCTCCATGGAGCTCTCATTCGAGATGGACATGACCAACCTGCGCGAAGCCCTGTCCAACAAAGACGCCAATGCTGTTAGCAACCAAGATCCCATGATTTGCATGCATACCAAAGTGGAAATGGAGAAGCCTACAGAGGGAAAACAAACTGTTCCGCTCAGGTTCAATGGCTTGATTTCGGGACTTGTGGAGCTCGATGCCCAAAAGCTGAATTTGACGGACGAGCAGATGACCGGCTTTAACGATAGCCTCACCGCGTTGGCGGCCAACCTGTGCAGCACAGCCTTGGATAAAGGCTTCTCCAAGGACATCAATCTAACGTTAAAAGCGGATGACACCACCATGAGCCTAGCGCCTAGTGCCGAACTGAAGATTGCTGATCAGCCTCAGGCGAATTTTGCGCTTCCTTTGGAAGTGCCGGTGCCGACTGATAAAGATGGGTGCAAGCATCCACCTGTAAAGCCGAAGCGGAAGTGTCCTGGCAAGTGTCCTCTAATTGATGATCCCTGCAAGGAGAATCCCTGCAAGCGACCCGCCGAAAAGCAGAAGCCGCCTAAGAAAGCTGAGAGTACCACGGAGATCATAGCTTTTGCCAAGGACCCCTGTGAGAAAAAGGATCCATGTGCCAAGGACGACAAGGATGCCAAGAAGGACCCATGTGCCAAGGAAGGAGGCAAGGATGGCAAAGATGGCAAAGATGGCAAAGATGGCAAAGACGGCAAGGGTGGCAAAGATGGCAAAGACGGTAAGGGTGGAAAAAATGGAAAGAATGGGAAGGGTGGCAAAAATGGCAAGAACGGCAAGAAAGACCCTTGTGCCAAGTTCAAGAAGGATGGCAAAAGTGGCAGCAAGTTTTCGACTTTCGCCGCACATCATAAACCCAACAAGCGCTACCTATCCACGGCACTGAATC
AGGTTTTTAAAGAGACTGGATCACATTCAAGTCCTAAGGGTCCACGTTTCCTTGTCCACTCGACACTTCTGCGTCGTCACTATCGTGGCACCGTTCCAAAGGCCCCAGAATCTGACCTCAAACAACGAATGGTGCACAAGGCTAGTCCTCCTGCCCGCTTTACCATACACTCGACCATTCTGCGTCGAACCTATTCAAAAAAAAAGAAGTCTGGTAGCGGCAAGTGCTCTAAATTGCAGACCAAGTTTCCTACAAGTAGGGGCAAGGATATCAAGGAGCGCACGGGTATTCGCGACGACTGCTTCAAAGATGACGCTGACAGCTGCCCCTTAAAGACCTGTAGCGGCAAGTGCTCCAAGGTCAAGTTCCCCAAGAAGAAGTGTGACCGCAGTAACAAGGACAAAAAAGAGTAGACAGGCTGTTGGGCCAGGGTGCTCCAGTTCAGCTGCCATCGCAGCAACGATCATTCAGCAC\n>XM_019302128.1 PREDICTED: Ipomoea nil putative late blight resistance protein homolog R1C-3 (LOC109154305), transcript variant X2, mRNA \nGTTTCATTAAGCTACAAGTACTTACCTTGTGATTTGAAGGATTGCTTTCGTTATTTTGGTGTGTTTCCAGAAGACAATGACATACCTGTTAAGAAATTAATCAACTTATGGGTTGCAGAGGGATTTATAAAGCCACATGACAATATGAGTTTGGAAGAAGTGGGAGAGAGTTACTTGCATGATCTCATTAATAGAAGTCTTGTTCAAAGTAATGAGCTAAGTATTGACGGCAAAGTTAAATCATGTAGCATTCATGATCAAGTGCACAAGGTTTGTGTGAGAGAAGCAATAGAGTGGAATGATTTGTGCATTATCAATGACAATCATGCTCCAAACGCTTGTTGTTGGTTAAGCTGTCAAACAAGTCATTGGCCAATCACTCGAGCGAGTTACGAGAATTGCGGTCCTGATGAAATCCATTCTGTTCTCTGCTTTGGTAAAGATGTAAACCATTCAAAATGCAGGTTTGTATACCCATCTTTGAAATTGCTAAGAGTATTGGATTTATCATTAGTTAAATGGTCAAGAGGCATGCCTAGAGAAATAACAGACTTGGTTCATTTGAGATACTTGGCTTTAAGTACCATTGGTTCTCTTTACCAGTTTCGATTTTTCAAGCTTAAGAATTTGGTAACTCTCATAGTTACTTCATGGATGGAAAAATGTCCTTTGCAACTGCCATGTGATATTTTGGATTTGCCACAATTGAGGCATTTGCATGTTGACAAGAGATGTTCACAATATCTCCGTAGCTTAGTAAAAAAAAAACTACAAACTCTTTATTGGTTGAAGGTTGCTAACTCTGATCAAAGCCCAAACTTCGAAATGGTTCCAAACCTAAGGGAACTTGGGATTTACATTGAAGGCCAACTGGCGCCTAGATATCTAGGGAGCCTTGTGCATTTACATCTACTTGAGAAGTTGAAGTTTGAAGTAGGAAGAGTTGAGCGCTTTTATCTACCAATTGGTTTTCCGCCAAACCTAAAGAAGTTGACACTTCGTTATACTTATCTTCCATGGAAAGAGATGGACACAATTGGCAAGTTGCCACACCTTGAGGTGCTTAAACTAAAAGATTTCGCATTCTATGGCTCAAAGTGGGAACCATCAAAGCAGGGCTTTTTGGAATTAAAGGCACTTCTCATTTCACGTTCAAATCTCAAATATTGGAATGCAAATTCTAATCATTTCCCAGTTTTGGAGCGCTTGGTCTTAAGATATTGTTGGGAATTGAAACAAGTTCCAATTAATTTTGCAAATATTGGAACACTGAAGTTAATTGTGTTAGAAAGTTGTTATTCTTCTCTTGTGAGTTCTGCAATGCAGATTTCCTCTGCAAAGAAGTTATTGTTTGAGGGAACGACAAATTGTCCACTTCGTGTTCG
TGAAGTTAGAACTAAGGTTGAATTGCCAAATAATGAAAGCTCTGAAGAAGAAAGTTGTGGAAAACTTTGAAGAAGAAAGTGTGAA\n>EU813087.1 Uncultured bacterium clone DP1_95 16S ribosomal RNA gene, partial sequence\u0001EU813284.1 Uncultured bacterium clone DP3_43 16S ribosomal RNA gene, partial sequence \nATTAGATACCCTGGTAGTCCGCACGGTAAACGATGGATGCCCGCCGTCGGCATATGATGTCGGCGGCCAAGCGAAAGCGTTAAGCATCCCACCTGGGGAGTACGCCGGCAACGGTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGAGGAACATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCCGGGCTTGAACTGCAGGAGAACGATTCAGAGATGATGAGGCCCTTCGGGGCTCCTGTGGAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCGGCTTAAGTGCCATAACGAGCGCAACCCCTCTCGCCAGTTGCCATCGGGTGATGCCGGGCACTCTGGCGACACTGCCGCCGCAAGGTGTGAGGAAGGTGGGGATGACGTCAAATCAGCACGGCCCTTACGTCCGGGGCTACACACGTGTTACAATGGGGCATACAGAGAGTTGGCCATGCGCAAGTATGGCCGGATCAAGAAAGTGCCCCTCAGTTCGGACTGGGGTCTGCAACCCGACCCCACGAAGCTGGATTCGCTAGTAATCGCGCATCAGCCATGGCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCAAGCCATGAAAGCCGGGGGCGCCTGAAGTCCGTGACCGCGAGGGTCGGCCTAGGGTGAAACCGGTGATTGGGGCTAAGTCGTAACAAGGTAAC\n>XM_043073989.1 Brugia malayi Uncharacterized protein (Bma-cdh-5), partial mRNA 
\nATGATGATAACAACATTTGCGCTACAAACGATTCAAAACAATATCAAAATCTCTTCTTTACATTCGCCAACATTAAAGGCTTCATCGCATGAAGGTTATATACCGGAGTCAGCACAAATGGGTACCGCGGTTCGAGTTTCTCCTTCTGCATTTTCAGATTCACTTCAAATAGACATTTATGATGATGACCTGAAACCTGGAATGTCTCCAGTCAGTTATGAATATATATTAACAGGACTAGGCTCGTCCATATTTGCTGTTGACCAGAGAGGTTATGTCTACTTAAATGTACCATATATTGATGCTGATCCTCCGAATCCATCAACATATCAGCTTCATATAGAAGCTCGAGAAGTAAACACGACCCCAACTCGTAGTAGTGAACCAATATCAGTAATAATACACGTTATGGATATCAACGATAATCCACCCCGCTTCAGTTCCTCTATTTATACTGCCAATGTCAGTGCTAATGGTACTATTGATCGCCCTGTCATAAAGATTCATGCAACGGACAATGATACTGGCAAAAATGCACAAATAAGTTACCATTTGGTGTCAATAAGTGATGGAGCGTACAATAATTTTTGGTATGACAGTAAAGCGCATCAATTAAATGCTGTTGGAAACTTGAAAGCTGGTGAACGATATGAAGTTATACTGAGAGCAACTGATGGTGGCGGCCTCTCAAATCAAGCATTAATAATTGTTTATTCTGTACCTGATAATTTTCCAAAAGTAACAATGCTTGACCAGAAAAAGGAATCATTCGGACGGAACCAGATAGCCGGTCTATCTAATTTTTTAGTGGCCAAGTCATCGATTACATCTACATCTGAAAGTATTGATTCACCTGAAATGATCCAAACTTACGTTATTGAAATAAGCGAAGCAATTCCACCTTACTCCATTATCATTACACTTGGGGATGATTCAACGAAGGAACAAGTATATCACACGATCACCGGTGGTAACGAAGATAACAAATTTGCTGTCAGAAACGAAATTGGGGCTTTAATTACGGTGAAGTCGTTTGATAGAGAAGAAACGTCACTTTACACTTTAGAAATCGAAACACGCTCTTTAAAGCTAAATCAACACTTGCATTGGACGATTGTCCAGGTTGTTATAGCGGATATCAACGATAATGCACCAATATTCACTGATCCGCAGCCAGTGAGGTTGCGTGTTAATAAAAGTGGTGTAGTCAATTTTGCCCCAAATACGTATTTGGGGCAAGTGAACGTAGAAGATCCAGATGACGGTGATAACGGACATGTGGGACTCAGAATAGCATCTCCTATGAATAAATTGTTTTCAATAAATGACAGCGGTGCTGTTATGGTAAATGGTGATATGTTAAGTGGACATTTTGGTGAGCATCGAATGACTGTTATTGCCACTGATCACGGTGATCCACCTCTTGAAACTCGAGTCAATCTAATCATCAATATTGAAAATACCGCACAAAGTGTGCTATCAAATTCCATTCAGTTATCAAAAGAATCGAATAGTTTGGAACGTACGAATTTGATGCTGAATAGTACTGGTTCTGTGCAAAATGTACAATTCACATTCGATTCCTTTATACCAGCAACCATGCAAACAGCAGCAGAAAATCCAACACTGCGACTTGCGCCTGTGTTCGAGCTGTCTGAGATTGAAGTTATTGTAGAAGAAAATCAAGCAGACATTGAACTCGTCAAGCTTCATGCTTATTATATGGATGGTAAACCTGGAAGCATCACATATATCATGCTTGCAGGAGATTCATCTCTTTTTAATGTAAACAGTTTCACCGGATCGCTCCTTTTGCTGCGCCCGTTAGATGTGGAAAAAGAAATGTCTTATGAAATTCAAGTTGGTACTGCCGAGGCGACTGTTTTGTTCACCGAGCAAAATTTCCCATATACGGCCTTGGTTCATGTGAATGTTGTAGATGTCAATGACTGGATACCAAACTTTGAGCTTGATAGCTACCAATTTAAAGTGAATGCA
GATGCCAAACTCGGCACAGCTATTGGCCAGATTGTGGCATACGATCAAGATAGAACCGCACCGAATAACGAGATTCGTTATCGGATCAAAGAAAGGGACACTAATGAATCATACGTCAATGTAGATCCCAAAAGCGGTTTACTAACTGTCGAGAAAAACCTTCGTCTACTTGCAAATAAAAAAATTTCGTTAAATATAGAAGCAGCAGATGACGGTACGCCGAAACGGTCTAACGAAACGCTTGTTTCAATTGATGTTGAACCTGTAGAAACTATCACTACCATTTTAACAAGAATGCCATCAACGTCTGATGCAATGTTTTCTAACAATAAATTGCAGTTCTCGCAACGGAATTACTTCACTTCTATATCGGAATCGATTCGTTCGCCACATCTGTTACTTGTTTTACCAGTACTGAACAAGTCAGCAAATGAGCGTTTCACAACTTGTTCAATCATTTCTGGTGATTACGGAGGAATCTTTAGCATTTCGACTAACTCCGAAGGTAACTGCGACCTTCGAATGCATGCGTTACTGGACCGAGAAACAGTGGACTCCTATCAATTAAACGTAAGCGTAAAAACAGAACAACAAGTAGACCATGCAATTGTCCATGTAACTGTTCTTGATACATACGATAATGGTCCGAAATTCATTTATAATAACGATGAATACAATGGATATTTTGCAGCTTTGTCCACTGATGCCTCTTCATTTGCATTTCTCACCACCGTGCAGACTAAGAATGTCGGTTTAAAAAACAACAGTGTTATTGTATATTCGTTGGATTCGTTTTCAATGGACTCGAAATACTTTATGGTTGATTTGAGCGGAAAAATCCAGACAAAAATGAGTGCATCACAAATGATGAAAGATAGTCAGAAAAATTATTTTAATTTCCGAGTGATCGCTTGTGACTCTTCTTATACTGTAAAGAAACTGTGTTCCAAAGCGGAGATATTCGTGAATATAATCAGTAATTCAAACCGATTCATTCTATCAGTTCTCAATACCGAACCACATCATCTCATAATTGCTAAAAGGGAGATTGCAAAAATATTGCGAGAATTCACTGGTCCTTGTAAACTACTTCTCTTGGAAAGTATAGAAGGCCGAACTAATATAAAGAAGCAGAAACACGTCGACATGCGCTGGTATGCTATAAATCCAACAACAAAAAGGAGTTGCGAATTTGATGAGTACAGCAAACTTTTCGATAATTCAACGATAAGAATGGTTGCTGAAAAACTAAAACAACGACTTATTATTGGTGAAATCCGTATTAACTTAAAAAATGTGTTTAGCGAAAATGCGTTGTTTTTAACAAATTTCAAAACGGTTTCTGCTGCAATAATTGTACTAGCAGTGGCCATAACAGTTGGAGCACTCCTTGGGATATGCGTAATATGTTTGTACTACATGCGTCATCGGGTGAAACGACATTCAAAACATGAATATCCAAACATTAATCAAATTCCAAAATTTGATGCCATATTTCTACCCAATCCACCAACCGGAAACACCCATGATATGCTTTATGAATCTCAAATGCTCGAAATGCCAATGGGAGAGGAAAACAGTATGCTCAAACCAGTAGGAAAGATAAACGGAATATCCGCTGCTGCATACGGTTCCAACAGCTACGATTTGGATCTAAAGCAGAGTTATCAGAATTATGCTCAAAACGCATTGTCTGATAAAAAAATTTTCGTTGAAGAAAAAATGTTTTCGGTCAGTGAACGAAGCGGGCTACATCCGCAAAAGAACAAGAATTGTGCATTCACAGCAACAAGATTCCCAGTGCAAAACTTTTTCTAA\n>XM_040515260.1 PREDICTED: Rosa chinensis uncharacterized LOC121051827 (LOC121051827), transcript variant X7, mRNA 
\nGTTATGAGTCATCTAATTCTTTCTCAATCTCAGGTGCTATGCCTCCTAGACGCCGGACTCGTGGGGAGACCCCTCCCATTCCAGGAGATGAGAATACTCCTGGAGGAATAGCGGAAGCTTTGGGACGTATTGTGCAGCAGTTGACTGCAGCGCTTCCGGGCTCCAGAACCGACTTTACCATGGAGCGAGCGAAGAGGCATGGAGCTTATAGCTTCTCCCATGCTCCTGATGCTATGGATGCCCAGAATTGGTTGAACAAAATGGAGAAGGTCTTCACTCAAATCCATTGCCCAGAGGATCGAAAAGTGGGTTTAGCAGTGGATTTTCTTGATGGTGTGGCTTTTGATTGGTGGGCTTTTACTAGCAGGGATTTAGAGAATGATGGCCCAATCACTTGGGAACAGTTCAAAGAACATTTTACTGAGAGATATTATGGTACAGCTATCCGTGACAGGATGAAGTATGAGTTCTTGCATCTACAGAAAGGGGACATGACCGTGACAGAGTTTGAGCAGCGGTTCACCCAGCTAGCCCAGTTTGTGCCTGATCTGGTTGCCACTGAGAGGGAGCGGATCTATAGGTTTGTTGATGGATTGGGGGGTAAGTATTGTGAGCAGTTGACAGGAGTGCCATTTAGTGATTATGCTGAGGTAGTTAATGCTGCTCTGCGACTTGAGACTATGTATATGTCTGGTGTCCGACCTCGAGATGTGGGTGGCCCCAGTCAGGGTCCATCCAAGAAGGCTGCTTCTACCTCTAGGACAGGATCTTCAGCAGGTTTAGGGTTGTCCACTTTTAGGGGAGATTCTGACGAATTTTTCCGAAAAGTGGGCCCCGCAGGTCCATTTTGGAGTTAGGAGGGTAATTCCGGGGTGGGTCCTGACAATATGTTACTTTATGCAATGGAGATCATCTCTTCTATATATGCTGAACCTGCATCTGGAAATACCAAACTTGGCACTGTCATGGACAAAAGCATTTGCGAAGATGTGTCAACTTTAAATGTTTGGGGGCATAACTAAGTTCTTTCCTCTTTAAGTATGCTGCAGTCTGCATGCACTATACTAGGATAGACCAGGTGTACCCTCAATCCCCGGAATAGAACGATCCCTACTTACTTAT\n>XM_048494676.1 PREDICTED: Sphaerodactylus townsendi CD200 receptor 1 (CD200R1), transcript variant X3, mRNA 
\nGGAAAGTTAGGGATGTGAACAGGAAAACTGAGATGCCAACTGGACAGAAGTAGACTGGTTGAAAAGATGTTCATCATAAGAGTGGCTAGATGTCTGCCATAATGGATGTAATGGTGAGAGAACTATGTGAGCCATGAAATCTGACGTTCATTTTGTTATGAAAGCCACAAGTGCCAGAATTCTGCTTGCTGTCATAGTAATTATGATACCAGTTGGGTCATTCCCAGCAACAGGCTCCATTCAAAACAGGTCTGCACAGTATCTTTCCAACCATTCAGCTAGCACAGTGACAGTGACCAAGACTGCAACTCAGCTGGCAGAAGAAAAATCGAGTCTATCTGCAGTGGTTGGTTCATCACTCACACTGAAGTGTCCCTGGCAATGGCAAAGAACCTTGTTAACTGTATGGAATGTGAAATTTATAAATGGGACAAATTGTCATTTATCCTACAAAAGTGACCGAAACCTGTCTGTTACAAACTGCAATGAGAACGTTAACTGGTTATCGAGACCCGATCAAGAATATGCTCTTCTTATAAAGCCTGTGCAGATTTTCAATGAAGGATTTTATAAGTGTTCTAGTTCAATTGATAAGGGCACTTTCATTCATGAATATGCTCTAACTGTGCTAGTGCCTCCTCAGGTGCACCTGACCCATGACTACAATGGAACTGCTGTGTGTACGGCAGCTGCAGGAAAACCAGCTGCCCAGATCTCATGGGGCCAGAAAGGGGATTTTATCACAGTGAATGAAACTTTGCCTAATGGCACCAAGACCGTCATAAGCAAATATAAGATCACCAGTGCTGAAGAGAACAATTTAACTTGCTACATTTCCCATCCAGCTTGGACGAACTCACAAGTCTTAAGTTTCCTGTCAGGCACAAGAAAGTCAATACATCTAAAAGTCCAGAAACAATTTCAAGAGGCAGCATTCAGGAGAATGAGATGGAACCCTATGCCACCTTTGTGCAAATGGAAAATGTGATCTACGATACAACGTTTGACACCTCAATGGGCAAACACTTCCCACCCGGGCTTTCACCTTCCACATAAGTTTCAATATGACTCTAGCTTTCTGTGCAAAGGAGACAGAGAAACACAGCATAATAGGAAGAGGAAAGACAGCTGTTGCCTTTTAAAAATGACCTACCAAAAAACGTGGTCAAATGTT\n>XM_046460927.1 PREDICTED: Marmota monax MIA SH3 domain ER export factor 2 (Mia2), transcript variant X18, mRNA 
\nAAGGGTACAGGATGTATTAGAATCTGAAATCTTTCTCCAGGATATGAGGTGCTTAGAAGAACTTTATTTACATCTAAGGTTATCTTAACATGAGCCATTTAAGGAATGGAATTGAATGATCTGGAGGAAGAGGTTGTGGAAGCATTGCCTGAAGATATGAGACCAGGCCCTAATCCTTATGGCCTTCCGTGGGAGTTGGTGATTTGTGCAGCTATTGGATTTTTAGCTATTTTCTTGTTTTTGTGGAGAAGTTTTAAATCTGTTAGAAGCCGGCTTTACATGGGAAGAGAAAAAAAGCTTGCTCTAAAACTTTCTGGACTAATTAAAGAAAAATGTGAACTACTTGAAAAAATTAGCCTTGTTCAAAAAGAGTATGAAGGCTTAGAGTCATCTTTAAAGGATACCAGTTTTGAGAAGGAGTCAACAGAAGCACAAAGTTTGGAGGCAACATATGAAAAGCTGGATAGGTCCAAGTCTAAACTTGAGGATGAAATACTCTTTCTAGAAAAAGAGCTAAAAGAAGAGAAATCTAAACATTCTGAACAGGATGAATTGATGGCAGATATATCAAAAAGGATACAGTCCCTAGAAGATGAATCAAAATCTCTCAAATCACAAATAGCTGAAGCTAAAACAACCTTGAAAATATTTCAAATGAATGAAGAACGACTTAAGGTAGCAATGAAAGAGGCTTTGAATGAAAATTCCCAACTTCAGGAAGGTCAGAAACAGCTTTTGCAAGAAGCTGAAGTGTGGAAAGAACAAGTGAGTGACCTTAATAAACAGAAAATTACATTTGAAGAATCTAAAGTACATGCAGAACAAGTTCTAAATGATAAAGAAAATCACATTAAGTCTCTGATTGAATGCTTGCTAAAGATGGAAGACTGGGGTGCTGTGCTTGGAGAAGACCTAACAGATGATGGTAACTTGGAATTGGAAATGAACAGTGAATCAGAAGTTGGTGCTTACTTAGATAATCAGCCAAAAGGAGCTTTGAAGAAAGTGGTTTATGCTGCTAAGTTAAATGCCTCCTTAAAAACCTTAGAAGTAGAAAGAAATCAAATTTATACTCAATTATCTGAAGTAGATAAAACAAAGGAAGACCTTACAGAACATATTAAAAATCTTCAGACTGAGCAAGCATCTTTGCAGTCAGAATATACACAGTTTGAAAGTGAGAATCAGAAGCTTCAGCAGAAACTTAAAGTAATGACTGAACTATATCAAGAACATGAAATGAAACTCCACAGGAAATTAACAGTAGAGGAAAATTACCGGTTAGAGAAAGAGGAGAAGCTTTCCAAAGTGGATGAAAAGATCAGCCGTGCAGCTGAAGAACTGGAGACCTATAGAAAGCGAGCCAAAGATCTTGAGGAAGAATTGGAGAGAACCATTCATTCTTATCAGGGGCAGATTATTTCCCATGAGAAAAAAGCACATGATAATTGGTTGGCAGCTCGGGCAGCTGAAAGAAACCTTAATGATTTAAGGAAAGAAAATGCTCACAACAGACAAAAATTAACTGAAACAGAGTTTAAGTTTGAACTTTTAGAAAAAGATCCTTATGCACTTGATGTTCCAAATACAACATTTGGCAGAGGCTCAAGAGGCCCAAAGAATCCTCTGGATCATCAGATTAGCAATGAAAGGGGAGAATCAAGCCATGATAGGTTAACTGATCCTCATAGAGCACCTTCTGACACTGGGTCCTTGTCACCTCCATGGGAACAGGATCGTAGGATGATGATCCCTCCACCAGGTCAACCATATTCTGATCCACCTCTTCCTCCACAAAGGCAAGATAGATATTATTCTAATTCTGGTAGATTATCTGGACCAGCAGAACTCAGAAGTTTTAATATGCCTTCTTTGGGTAAAGTGGATGGGCCTATGTCTTTAGAAATGGAATCCAGTACAAATGATACCAAAGATGATCTTGATAATTCAAATGTGCCTGATTCATCTCTGCCTGCTGAAAACCAAGCAACTGGCTCT
CGCTTTGGTTTTTCACCTCTTCCTCCAATCCGAGGTCCATTGTTTCCAGTGGACCCAAGGAGTCACTTCATGAGAAGAGGACCTTCTTTTCCTCCACCTCCTCCACCTCCAGGAAACATGTATGGAGCATCTAGAGATTATTTTCTACCTGGCCCACCACCCCCTCCATTCCCAATGAGAAATGCTTATTCACCGAGGGGTTTTCCTCATTATCTTCCCCCAAGAGCTGGATATTTCCCCTCACCCCCACATTCTGAAAGTAGAAGTGAGTTCCCTTCAGGGTTGATTCCGCCTTCAAATGAGCCTGCTACTGAACATCCAGAACCACAACAAGAAACCTGACAATATTTTTGATCTCTCTTCAAAATGGCAAAAGACAGAAGATTAAATATTCTTGAACCACAGCAGTGATGCTTTTATAATTGGAACACTTCATGCTAGCATTTCCCAGACGTTATTTGGAACCCTGGTCTTGTGAAGTATTTCTTTTCTTCTTCCATTACCATCCCCACCTTAGAGAAAAAGGGTAGAAAGAAAGATTGGGTAAATCTTGGGTAAAATAAATGCTTTGCGTAAAATATTAAGTGAAATGAGAACTGTAGAAACATGATTACATTAAAGTTTGTTTGCTGTGGTCTAAA\n>XM_053649385.1 PREDICTED: Ictalurus furcatus tubulin cofactor a (LOC128622690), mRNA \nTCCATTACACGTTGGGCAGTCGGGCATTTTGGAAGTTTAGGGAAGCTTGTATTTCAGCTGCTGTGTTTGTGCGTACTTACGACTCTGCACTTACCACACTTCTCAGAAATCATCTTTATTATGGCGGATCCAAGAATACGCCAGATAAAAATAAAGACTGGAGTCGTGAAACGGCTCGCTAAGGAAGAGGTGTTATACATAAAGGAGGCAAAACAGCAAGAGGAGAAAATTGAACGCCTGAAAGCAGAGGCAGGGGACGAGTATGTCATCAGGAAACAGATGGAGGTGTTGCAGGAGTCAAGAATGATGATTCCAGACTGTCACCGCCGTTTAGCCATGGCTCATGCTGATCTGCAGCAGCTGTTGGAAATGGAGGTGGATGTTGAAGAATCGGAGGAATACAAGGAGGCCAGAAGTGTTTTAGACTCTGTCAAACTGGAGGGATGATGTAAACACACATGCGCAACAAGTGTCCATTCCATTATTCAGGACTTCTTAAAAATGTTGATTCGGAAATAAGTCTGGTCATCGTCTCATTGTTGTATTGATTTGTAACACTACGAATAGTGTGCCTCTGCGTTCTCTGTTGATTGTTCACAAAACTAAATAAACAATCTTATTATTCAA\n>MT512057.1 Pythium aphanidermatum strain Sala1 internal transcribed spacer 1, partial sequence; 5.8S ribosomal RNA gene and internal transcribed spacer 2, complete sequence; and large subunit ribosomal RNA gene, partial sequence 
\nACCATAAAAACTTTCCACGTGAACCGTTGAAATCATGTTCTGTGCTCTCTTTCGGGAGGGCTGAACGAAGGTGGGCTGCTTAATTGTAGTCTGCCGATGTATTTTTCAAACCCATTTACCTAATACTGATCTATACTCCAAAAACGAAAGTTTATGGTTTTAATCTATAACAACTTTCAGCAGTGGATGTCTAGGCTCGCACATCGATGAAGAACGCTGCGAACTGCGATACGTAATGCGAATTGCAGAATTCAGTGAGTCATCGAAATTTTGAACGCACATTGCACTTTCGGGTTATGCCTGGAAGTATGCCTGTATCAGTGTCCGTACATCAAACTTGCCTTTCTTTTTCTGTGTAGTCAGGGAGAGAGATGGCAGAATGTGAGGTGTCTCGCTGGCTCCCTTTTCGGAGGAGAAGACGCGAGTCCCTTTAAATGTACGTTCGCTCTTTCTTGTGTCTAAGATGAAGTGTGATTCTCGAATCGCGGTGATCTGTTTGGATCGCTTTGCGCATTTGGGCGACTTCGGTTAGGACATTAAAGGAAGCAACCTCTATTGGCGGTATGTTAGGCTTCGGCCCGACGTTGCAGCTGACAGAGTGTGGTTTTCTGTTCTTTCCTTGAGGTGTACCTGAATTGTGTGAGGCAATGGTCTGGGCAAATGGTTGCTGTGTAGTAGGGTTTTGCTGCTCTTGGACGCCCTGTTTTCGGATAGGGTAAAGGAGGCAACACCAATTTGGGACTGTTTGCAATTTATTGTGAACAACTTTCTAATTGGACCTGATATCAGGTAAGATTACCCGCTGAACTT\n>XR_007174521.1 PREDICTED: Salvia hispanica uncharacterized LOC125211483 (LOC125211483), ncRNA \nAGGCTGCACAACACACAAGTATCATCAACAGTTAGTCAGGCGGGAGAATTACATATATGTTCCATCAAGAGAGTTTGACAAAATGAAATACTGGGGGAAGAAGGAGCATTTCAAACCAGCTGTGACTATGAAGCCATACATTGTTGGACGATATACTCAAATCACAAGAACACAGAAATATCTAGGATATCTTATAGCTACCCATATCATATCATATTTTGTACAGATATCTAATAAGATTAGGATTATGTCGCACTTGTAACCCCAAATATCCATCAGCACCCAAATATCTAGGCTTAATGCGTCTGTCAATTGTTCATCATCAATATATAGTCCATGTCCCAAAAAAGGAGAAAATATACGTTAGCAGAATTGCAGAGATAGAGTTGTTTGTCACATCTATAACACACAATCACATATTCACATAAAAAATCTAAAACAAACTCAGAAAACCTACTTCAAAATGGAACTACACATACTTAACAATTCAACATAAACTTCACCAGAGAATAATCCTATACATTTTCTCACAAGTACTACTTGATAGAAAA\n>XM_021335350.2 PREDICTED: Helicoverpa armigera UTP--glucose-1-phosphate uridylyltransferase (LOC110376763), transcript variant X1, mRNA 
\nTCATGCGAGCGTGACGTGTGCGCGGAATTTTAAAACAACATTTTTAAAAGACGTTTTTTTTAAATAATTTTAAGTGTTTTTTTTTGGTTAAATAATGGATAGTGAGGCTGAACAGTGTCGGTCATGGGTACGTGATATGTTAAGAAATAAAAATGGGAGTATCCGCAGTCACCAGAGAACTCCCTCAGGTTCAAGGGACTTCAAAGAGGCGACCAAGCGCGATGCTCTCACCCGGCTGGAGGTCGAACTGGAGAGACTCCTGGCTTCAGTCCACGAGACCAGAAGACCACTCGTTGAAAAGGAGTTCAGGGGTTTCAAGAACTTGTTCAGCAGATTTTTGGCGGAACAGGGTCCATCAGTAACATGGGAGAAAATCCAGAAACTCCCAGAGGGTGCTGTCATAGACTACTCGTCACTCACCACCCCCACCACAGACAATGTTCACCACATGCTAGACAAGCTTGTGGTGGTCAAGCTCAATGGTGGTCTGGGAACCTCTATGGGTTGTAAGGGTCCTAAGTCTGTGATACAAGTCAGAAATGATTTGACCTTCTTGGATCTTACTGTACAGCAGATTGAGCACCTAAACAAAACGTACAAATGCAACGTGCCCCTAGTTCTAATGAACTCGTTCAATACCGACGAGGACACGCAGAAGGTCATCCGCAAGTACCAGGGCCTGAAGCTGGAGATCCACACCTTCAACCAGTCCTGCCACCCGAGGGTCAATAGGGAGTCACTGCTGCCGGTGCCCAGGCATGCTGACGTACAGGCTGACATTGAGTCATGGTACCCACCCGGTCACGGAGACTTCTACGAATCATTCTACAACTCAGGTCTTCTACAGAAATTCATCAAAGAAGGCAGGACTTATTGCTTCATCAGCAACATTGACAACTTAGGAGCCACCGTTGACCTGAACATTTTGAACCTACTCCTCAATCCTGATCCCGTGAAGACCGTCTCCGAATTCGTTATGGAAGTCACTGATAAGACCAGGGCCGACGTTAAGGGAGGTACCTTAATACAATACGAGGATAAACTAAGATTGCTTGAAATTGCTCAAGTACCAAAAGAGCATGTTGATGACTTCAAATCTGTTAGCCAGTTCAAATTCTTCAACACAAATAACTTATGGGCGAAATTGGATGCTATTCAGAGGGTGGTCGAACAAGGTTCTTTAAATATGGAGATTATTGTGAACAACAAGCATTTAGCTGATGGTCTCAACGTTATACAGTTAGAGACAGCAGTCGGAGCCGCAATGAAGTGCTTTGAAGGAGGCATAGGAGTAAACGTGCCTAGATCTCGATTCTTACCTGTTAAAAAGACCTCGGATCTTTTACTAGTGATGTCCAACTTGTATAGTTTGTCCCACGGATCTCTAGTGATGTCTCCACAAAGGATGTTCCCATCGACACCTTTAGTGAAGTTAGGGGATAACCACTTTGCGAAGGTTAAGGAGTTCCTGAACAGATTTGCTACGATACCTGACCTGATTGAGTTGGATCATTTGACGGTGTCCGGAGATGTGACTTTCGGCAGAGGAGTGTCTTTGAAGGGAACAGTAATAATAATAGCCAACCACGGAGACAGGATCGACATACCTTCAGGAGCTCTGCTTGAGAACAAGATCGTCTCCGGCAACCTTCGTATCCTCGACCATTAAGCAACAACTATTTAGCTAATATACCTTTACTAAAGGTGGATTTCAATACCCTTATCCATCCGTTGATTTTATGACGGATACGTTATTGGAATTTAAAGTAAATTGTAATACTTTTAGGTCTAGATTTGTTGAAATGGAACTTCTTTGAACATGGTGAGGAGTAAATTTGTACTACGTTTTTGTTTGTATAATAACATGATATGGTTATGCTCCGAAGTGTTATAAGTTTTTTTGTTACTAAAAGTTGTTATAAATTAAAATATATTTTTTGTGGATACTATAAAAATGAAGATTGAGTGAAAAGTTAGGGTTTAAAAGAATGAAGTTGA
AAACTTTGTGGTTTTTAAAGAAGTTCCATTTCATTTGCGTCTAAAGAGGTGCGCGTTCTTTTTTATACGTCTATGTATTTGTCTATTACATGTGCATTAGTTGCCCATAGACTAAGTAGTTCCATATTCAAACAAAACAAGAGTTAAACTTACGAAATTGCTTAAATTGAGGATTACCTATGTATCATGAATTATATGGTTGTTTTTTGGTTTTAATTGGTATAATTATTGAAATTGAGATTTAAAGCGTTTGAAAACTTATTATAAACATATTTATTAGGTCGATTTTTAATATAATTGTAAAGTTTTCTATTTATTCACTTTTTATATTTAAACTTTTGCTATAAAAGTAGAGATAATAGCACAATTATATAGCATTGAAATTTTAGAATTTAATATTATGTAATTGCTAATATTGTGTTGTACTAAGATATTTCTTAGTAACAATTTATTTATAAACCAGAATACTTTTTTTTACAAGAAATATGTTTTATGATCACAAAAAAATTTAAGATTTGAGTATCTAATCTTTATTTATTGATTTATATTTAATAAAACGTATTTTTCTACACTTTTAATATGGGTTTTTAAAACCTTTGATTTTTTTATGAGCCAAGTTGCCAATTGTTGTTGCTTTATTAATTATTTATTGCCAAAGTGAAAAATTAATATATTGGGTTTATTGTCTGCTAAAAATTGTTTTTAGGTATATTACTCTTTTATTACTTTTATACTACTTACCAGTTAATATCATAAATATGGTTTGAAGAATATGAAAAAGAAAAAATATTTTTCATCATATTATTATACTTAAATATGGCCGATTTATTACACTTATTTCCAAAATATGCGACTTGTATTTGTAAAATAGATTTTTATAATTACTCCTAATAGTGATTAAGTTCATTACATTCATAGATTTCAGTCAAATATGTATTTTAGAAGAGAAATCATAATTCATACAATAAAATTGTTCTTTAAAAAAAATGAGCAATTTTATTACTCTGTTAATGAGTGTAAAGTGGCACCTTACAAAAAAATACTTATCGAATCGTAAAAAATATGATTCAGTTATATCGATAAAATATCTGTCGAGAGTGACATCACTAGGAAGGTTACTCAGTGAAGAATAAATACTGTACTATTAAGTAGTTTTAATCTAAGCAAGTTAGTGCCATTAGCTAAGTAGGTAAAACTGTTGTAATAAATATTATTATGTTTTCATTTCAA\n>XM_021074111.1 PREDICTED: Sus scrofa fibrosin like 1 (FBRSL1), transcript variant X15, mRNA 
\nTGCCGCCGCCACCGTCGCCTCACGAGCCCAGGCTCCTCAGCTCCGGTCCGCGCCGCGCCCGCCCGCTCGCTGGGCCTCTTCCCAGCCTTTGCCCGCCGCCAGTCGCCCATGGGGCGTGCCCGCGGGTCCGCGGCCGAGAGCCGCTGAGCGCTGGCCGTCACGCTGATGTGCGCGGCTGCTCGCGCCCGGGAGCCCAGGCCGCGCCGGGCCCGGGGCTGAGGCCACCCTCGCGGCATGTCCGGCCCGGCCCGCCGCCCGCCGCCGCCCAGGGCCCGAGTCCGCGCGGTCCGCACCGAGCCCGGCGGTGCCGCGTAGCACAGCGGCAGCGGAGCGGGAGCCCGACGGCACGGCCGCAAGGTCACCGCGCGCCATGGAGGCCAAGGTCCGTCAGAGCCGGCGCTCACGCGCGCAGCGGGACCGCGGCCGGCGCCGGGAGGCGGCCCGCGAAGCCCGCGACCAGAGCGCGTCGTCGGGTGACGAGCCAGAGCCCGGGCCGGGCAAGGAGAACACGGGCCTGCCCCGCGCACCCCCACCCCGCGCCGCCGCCGCGCGCCCCCCGCGCCGCCGCCGTCGTGAGTCCAGCTCGCAGGAGGAAGAGGTCATCGACGGCTTCGCCATCGCCAGCTTCAGCACGCTAGAGGCCTTGGAGAAGGACATGGCCCTGAAGCCACATGAGCGGAAGGAGAAGTGGGAACGTCGCCTCGTCAAGAAACCTCGCGAGTCAGAAAACTGCCCGACTGCAGAGCCGAGTGAGAACGGGCGGCCCCTGGAGGCAGGCAGCTCTGAGCAGGACCTGGAGCCCACCTGTGACCGAGGGAAGAAGAAGGTCCCATTGCAGCCCACCAAGCAGATGAAGGTCGCGGTGTCCAGAGGGGGCGACCACAACAGTGACGGCGACAGCTTCCGAGAAGCCAGCAGCTCCCGGAGGAGCAGTTCCCGGGACCAGCTCAGTGACAGCTCGGCGCAGGCGGTCTCAGGCAGAGGTTACTCCTGCGACAGCGAGAGCGACGGGGATGACAAGGCATCTGTGGGCTCTGAGAAGCTTTTTGCCCCAGCAGCGGATAAAGGGCCCACGTTGGGCGAGAAGTCCGAGGCCAAGGCCGGGGCAGCACCCAAGGTCTCCGGTCTGGAGCGCAGCCGCGAGCTGAGCACCGAGCCGCCCTTCCTGCCCCCTGTGCGCAGTCCTGTGCCCGCCCTGCCCTCCGGTGCCCCGGCCAGCCCACTGGTTAAGAAGGAAGCCCCGGCCCTGCCCCGCCTCGCCCCACAGCCGCCTCCTGCGCCCCCGCAGCCCCGGGCCCCGCTCCCGACGCACGTGCCTCTACCCCCGGGCGCCTTCCCCGGCCACGGCCACGGCCACGGCCCAGCAGCGCACAACGGCCTGCACAGCCTCAGCAGGAGCAGCAGCGCCAGCAGCGGCGCCAGCCTGGGGCTCGCGAAGCACGCGTCCCTGTCGCCTCACGGGCCGGGCCCCCACCTCTCTACCTCACACTTGGCGCTCCGCTCGCAGGCCCAGCACCAGCACCACGCGGCGGCCATGTTCGCCGCGCCCCCGACACTGCCCCCGCCCCCGGCGCTGCCGGCCAACAGCCTGGTCATCCCAGGACACCCCGCCGATCACGAGCTGCTCAGTTTGACAAGTTCACACCCAAGCTGGACAGCCCCTACTTCCGACATTCCAACAAACCCCCGGACTGAGGATGTGGTGGGAGGCCAGGCCTCCCGCCCAGGAGGCGGTGTGCAGGGCCCCACAGGCAGGGTGAGGCGGGCACAGGCGCCTGGGGTCTCACGCCCTGTCTCTCTCTCCCCTCAGACTTCAAACCCACTCGAGGTAACGGGCCGGGCCAGCGCTGTTCACACCCTCCTGCAGAAAGCCCCAGGGGTGTCCGACACGTACCGGACAACAGTCAGGAAGCCCGGGAAGTGGTGTGCGGTACACGTGCAAATTGCCTGGCAGATATTCCACCATCAGCAGAAGATCAAGATGCAGCTGGACCCCCA
CAAGCTGGACGTGGGCACCAAGCTGGACTTGTTCAGCAGACCCCCTGCCCCAGGCATATTCGCTGGCTTCCACTACCCGCAGGACCTGGCCCGGCCCCTCTTCTCCAGCTCGGGTGCCGCCCATCCCACTACCAACCCGTTTGGACCCTCAGCCCATCCTGGCAGCTTCCTGCCCACTGGTCACTTGACAGACCCCTTCAGCAGATCAAGCACCTTCGGGGGCCTGGGGAGCTTGGGCAGCAACGCCTTTGGAGGCCTGGGCAGCCATGCGCTGACTCCCACAGGCGGTATCTTTGCCCCCAAGGAGGGCCCCACGCTGCACGGCCTGACCAGCCCCCATGAGGCCTGGAACCGGCTGCACCGGGCGCCTCCCTCCTTCCCCACGCCACCCCCGTGGCCCAAGCCCATAGACACGGAGCGGGTCTCAGCCCTGACCAACCACGACCGAGAGCCGGACAAGGGCAAGGAGGAGCGGGAGCGGTGTCTTATCGCTCCCAGGGACCTCCTGGAGAAGACGCGCCTGCTGAGCCGGGCCTCGCCCGCAGCCCCCTTAGGCCACCCGGGCGGCAGCCTCCTGCTCCGCGGCCAGGGCGAACCGGGCCGGCCCGGAGTCCCCGCCGAGCGCGAGGCCGAGCCCCGCGTCAAGGAGAGCCGCTCCCCAGCCAAGGAGGAGGGCGCCAAGCTGGCCGTGCGCCCGCCATCTCCTCTCAGCAAGGCGGCCCTGGGGGACAGTCTGCGCCTGGCTGGCCTCCTGGGGAAGCCGCCCGAGGCGCCGGCCGAGCGGCCCCAGAGCGACGTGAAGGTCAAGGAGGAGCGCGGGGAGGACGGCGACGCGCCCCCACAGCTCGCTCCGGGCCCCGCGAGCCGCGAGCGCCTGGCCTTCGCGTGGGAGCCGCTGCGCGACGCATACCGCGGCCTGGAGCCGCCCCGCCGCGGCCCGCCCGGCCCCGGCGCCCTCTTCGAGCCCCCCGAGCGCCCCTACCGCGACCGCGAGCCGCACGACTACAGCCCCGAGCGCCTGCGGGAGGCGCGCCGCGACGAGCTGGAGCGCGCGCGGCCCCCGCACCTGCCCGCCGGCCCTGCCCTGGACGGCGCGGCGCTTCTGCCCGCGCTGGGCGCCCTGCACTACCCGCGCCTCGCTCCCGCCGCCGCCGCCGCGCTGCACAACGGGCTCCTGGCGAGGCCCCCGCCCGCCGCCGCCGCCGCCGCCCTTGGCGCACCGCCCCCGCTGGTGGCCGCGGGCGGGCCCCCCACGCCTCCCGGGCCGCCGCGGAGCAGGACTACGCCGCTCGGGGCCCGCGCGCCCGGGGAGGCCCGCGACTACTCCCCGTCCCGCAACCCCCAGGAGGTGGAGGCGCGGTAGTCCCCGCGGGGCCGCGCCCGCCGCATGTACAGAGGCCCCTCCACGAAAGCACTGCTGTCAACTTTTTTAACTGTACGTTGTTTCTAGAACCTAAGCACAGTTCCATCGGTCCTGGGGTGACGCCCGCTCCTCCACCTGCAGCCTGCGGAGCCAGGGATTTCAGACACGGTTTTGCCAGGAGTGATCTTTTGCTTTCCAAGCTCGACATTAGGCAATTGGAGAAAAACTTCAAGTTTGTACCTTTTTTCCCACAGGTGATAAGCGTTTTTAACAGATTTGTATTTTTTTCAATTTTGTGCTCTTTGGACGTTTAAAAGAAAGACTTTTGCTTTTTTATTTTTAGTTTGGATTTGCAATTTAATGGCCTCAGATCCCTCTCCAGAGCCCCAGGGGTTTTTTTTGTCTTATTTATGAAGAAAAAACAAAAAACAAAAAAACGGTCATTTTGTCCAACGCACTGTGAGGCCCCCACTCAGGCCCGGCCCTGGCCCTCCCTTGGTACTTGGAACAGAAGTTACAGATATATATTAAGATAATTAATAATGTACAAAACTTTTTTTGCCTTATTATGCAGAAGTGTAAAAGGGTTTCCTTTTTGGTTTGTTTTTTTTAAAAAAACAAATGAAACCGTGTACAT
AGTCTGTTAATATAAATATATGATGTTATTAAATTCTTAACCTAGGTAGACTTTATAAAAATCGTTTCTAGAAATTCCTCTGGTTATTTGTTTAACACGGTCACAAAAAAAAAAAATTCACTGGCTGTCAGTTGGAAACGCCCTCAGATGGTTGACTGCAGCAGCATCCTTCAACTATGCAAGCGCTCGGGACGGCCCGGGCCTGGGGGACCACGGCGCGCTCCCTGGAGTGTCTGCCCTGGTGCTTTCTGTGCAGTGTTCACAGAATCACACCAGACAAGACTGGGGAGGTGAGGAGTCCAAAGGCTGATTACAAGGGGAAGAGTAGCTGTCTCCTCCGCGGAGCCACCGGCAGACATGGTCTCATGTTCTCCCACCGGCCAAGGCCTTGGCGTTACTTCCTTTGGGTTCTGGTTTGCTTTCATGACCCCGTGAACGTCACTGTGCCCTGTCATCAGTGTTCCCTGTTTCCTGACGTCCATACCTGTGTCCTCAGCGTTTGAACCTCAGTTCACCCATCTCTAGCCATTTGCTTTGTTTGGTTCTGTATTTCCAACCCCACGTTTCCACTGTAGGCTCCGGTTATTTTAAATATTTTCACATCAACCAATGAAGATAAATACAGCCTTGATTTTGGATGAAAA\n>XM_006877835.1 PREDICTED: Chrysochloris asiatica histone-lysine N-methyltransferase PRDM9-like (LOC102837583), partial mRNA \nGCACTGTGCTCTTGGGCTGGAACTGTCAGAACCTGTGGGTGATGCTGACAGCATGAAGCTCACCAAGAGCCATGGAGGAGAGTATGGGGAGGACACCCACGATTGTGAGGAGTGTCAGAACTTTTTCACCGACACCTGTGCAACTCATGGGGCCACAGCGCTTTTAAAGGGCAGTGCCATGGATACAGAGCACCCCCGTCACTCAGCTCTCACACTGAATCCCGGGCTAAGGACTGGACTTGGAGTACACAGTGAGGCATCTGAGCCGCTGCTGGGCCTAGACTTTGGCCCCTACGATGGTCAGCTGACAGAAGATGAGGAGGCAGCCAATAGTGGCTACTCTAGGCTGAAATTCCTCCATCAACAAGTGCAGCACACCCATCCCTCTCAGTCCTCTCCAAGAACTCCTGCGGAAAAACACCTTCACCTAGAGCACCGCCATCCAGGGGATGGGAAGGAGCCGCATTCTGAGCAACTCGCCAGGAATGACAGAGCAGAAGGTCTAGAGATGGGAGATGGGCCCAAAGCCATGTTTGAAAGGACAAGACAGGGGGGCATTTTAAAGACCTTCTCTAGTCTACCCAAAGACCAAATGGGGAGTTCTAGGGAGGCTAACAGAATGACGCAGACAGACCCATGCTCAGGCCAGAGAGTGAATGCTGCGGACACAGGCAAATTATTGCCGGGGAAAGGAATCCCAAGAATTGCAAAAGTTACATGTAGAGAGTGTGGGCAAGGCTTTAGTGCTAAGTCAAGCCTTATCACACACCTGAGGACTCACACAGGGGAGAAGCCCTATGTCTGCAGGGAGTGTGGGCAAGGCTTTAGCCAGAAATCAATCCTCATTAGACACCAGAGGACACACACAGGGGAGAAGCCCTATGACTGCAAGGAGTGTGGACGAAGCTTTAGCCGGAAATCACACCTAATAAAACACCAAAGGGCACACACAGGGGAGAAGCCCTATGTCTGTAGAGAGTGTGGACGAGGCTTTAGCCAGAAATCAGTGCTTATCACACATCACAGGACACACTCTGGGGAGAAGCCCTATGTCTGCAAGGAGTGTGGGCGAGGCTTTAGCCAGAAATCAAACCTTATTAAACACCAGAGGACACACTCAGGAGAAAAGCCCTATGTCTGCAGGGAGTGTGGACGAGGCTTTAGCCAGAAATCAGACCTCATTAAACACCAGAGGACACACTCAGGAGAGAAGCCCTATGTCTGCAG
GGAGTGTGGGCGAGGCTTTAGTCAGAAGTCAGACCTCATTACACACCAGAGGACACACTCAGGGGAGAAGCCCTATGTCTGCAGGGAGTGTGGGCGAGGCTTTAGCCGGAAGTCACACCTTGTCACACACCAGAGGACACACTCAGGGGAGAAGCCCTATGTCTGCAAGGAGTGTGGGCGAAGCTTTAGCCGTAAGTCAGACCTCATTAAACACCAGAGGACACACTCAGGGGAGAAGCCCTATGTCTGCAGGGAGTGTGAGCGAAGCTTTATTCAGAAGTCACACCTCATTAGACACCAGAAGACACACTCAGGAGACAAACCCTATGTCTGCAAAGAGTGTGGGCGAGGCGTTAGCCAAAAGTCAGACCTCATTACACACCAGAGGACACACTCAGGGGAGAAGCCCTTTGTCTGCATAGAGTGTAAACGAGGCTTTAGCCAAAAGTCAGATCTTATGAAACACCAGAGGACACACTCAGGGGAGAAACCCTATGTCTGCAAGGAATGCGGGCGAGGCTTTAGCCAGAAGTCAGACCTCATTAGACACCAAAGGACACATTCTGGAATGAAACCCCATGTCTGCAAGGAGTGTGGGAGAGGATTTAGCCAGAAGTCAGACCTCGTTAAACACCAGAAGACACACTCAGGGGAGAAGTCCTATATCTGCAGGGAATGTGGGCGAGACTTTGGTGATAAGTCACACCTCATTGGACACAGGAGAAGAAAATACTGCCAACACACACTGCCATCTCCCCAGCTTTGA\n>XR_001644210.1 PREDICTED: Nicotiana tabacum uncharacterized LOC107768680 (LOC107768680), transcript variant X6, ncRNA \nCCGGCAAAAAAAATGACTGGCCACTAAAAGCAGCTAATTCAAAAGAAATTTTAGTATTTTATCTTACCCTCACCTAATATTCCCTCCAATTTCTCAAAATAACAAAATGAAATTTGAAAAATTTGGGAATACATCACAAAGACTCAACCTATCTAACCGCTGCTGAAACCATTACCGCCACTGCAATTGATTTCTATCTCATCGCCGGCAACCAATTCCAGTTGCTAAGGTGATTTTCTTATATCTAGGGTTGGAGTAGTTCCCCTTCATTATTTTTTGAGAAAATCAAATGGCCGCTCCACCTGCTCTAGCCCATCACGACTACAGATTAGCTCATCAAGCTCCTTTTGATTAGCAATAGCAGTATACTTTTTATCCAGGACATTAGTTAACGTTGTTGGTTTAATATCGTTGTGATATTATTGACTACCTCTACTATTTGATTGAACAAGGAAGGAAGATTACAATAAAATAAGACCCTTGAGGCTTGAGCTATCATGGGCAGATGTATCTAGAATTTCAGACAGAAAGATTTCTCGCTAGCAAGCACAATTACAAAAATGTCTCCAAAAAAAGGTGATATATTGTGATGTTCAGAGATATAGCATGTGAAAGTTCATGTGATCAAGAGTTGGGAGAATCTGTCCGATGTAATTTATTATCGAGCTTATAGCTACTTGATAAAATAACTAATTAGATGCGAAATATTATTGGATTCAAATAATTTAGCATTTTTATGTTGTTTGCACTCTCAAATTATGGATTTAATGAAGTGCATTGAGCTGTTTGAAGTGAATTAATATTATTA\n>XM_026966869.1 PREDICTED: Rhopalosiphum maidis uncharacterized protein PF13_0277-like (LOC113560796), transcript variant X2, mRNA 
\nTTAGTGTTCGTATTGCTTTTCCATCACCGATATTATACCGATCGTTTGTGCGTAAACCGGGTTTTTTATCGGTGACAAATCAGTTTCGTTGTCAATACGGCCATGTATATGCACTTTTTCCGGACAGGTCGCCTTGCAATTGTGTCGTATTAGATACGTCCGTCGTGCATATTATTATTAGTATATGAATGTGCTTAAAGTTTAAACGTGACATAATATTATATAATATGTAGTATTATTGTCAATCAGTGACCGATATGATAATGTGCTTGTGACCCGTCTTGGTTATCGGTACGGTAATATCGTCTTGGTACGGTTTTATTTTTAGTGGTTGCGACCCCCCTTCAATTCGTTTTTCAACTACTTAAGTAAATCTGAATATTATGTTTTTTTATATAATTGCCGGTGAAGTAGATTATTCTTGTATTTATATTTCTAAGAGAAATTTATTTTTCAATTATTAATAAGACATATTGAACTAATATTTGACAAAACACAACGAAAAATATATTATTAACTCGTATCGGTGTTAGCCGGATAGATGGAATTGTAAACGACAAAAAAATAACTATCGATGTGTATATATTAAATATTAAAAAATATAATAGACATTATGTAAAGGACGATCGAAAAAACATGAATAAATACCAACAACCAGCAATGAATATGGATATAAAAAAATAATATATGATATCATATTAACCATGTCAGTGAGCAATATAATTCAAATTATTCTTGCAATTAAAATGGAAAACTGTCGGGCACATTGAATACTGCTCGATGAAATGAGGACGGATAAAAATGGATATCTATTATACAGAAGAAGACAAAACTACCAAATTAATGACAACACGGCCAATCCAAGTCAGATCGATGATGAAAATAATAACCCAGATGAAGATATTCAAGGCGACCGCAATCTTATTACATCAAATGTTAATAACCCAACAGGAAATAACAGATTAATAAAAAATGATCTTATAAAAAACGTTTTTAATAGGATGAATTCGAATGGAAAAAAACCTTCTCAAATAGAATCAAGTAGAGCAGATGCTGTTGAAGATCAACAACTAGAAGAAGAAATAGAAAACGATCCAACTAAAATGTCACTCGGTTTAGATTCTGAACTAGAAATCGCTGAAGACACTGACCTAGAAGAAGCAGACGATAAAAATATTGAAAAACCAAAACCAAAACCAAAAAAAAAAAAAAAGAAGAAGAAGAAGTCGAATTCGAAGAAGAAAAGTAAGAAACAAAAACAAAAAAAAACTGAAGATGATGAAACTAAATTAATTGAAATTGATAATAATGGAAATCAATTTAATTATTTTGACCATGAAGAAAAAGATATACGTGAATCAGATAATATTAAAGATCAGCAACAAGAACTTGATAAAGAAAACGATCCAACTAAAATTCTACTCGGCTTAAGCACTGAAAGAGAAGCTGAACTAGATAAGGAAAAAACAGAAAAAAATTTACAAAAAGAAGAAACTAATTTAAAATCAGCTGAATCCAAAGTCACTGGAAGTGATAATATAGAGTCAACGATAGAACAAACATCCAAATCATCCGATCCTGAGAATATTAAAGATCAGCAACAAGAACTTGATAAAGAAAACGATCCAACTAAAATTCTACTCGGCTTAAGTACTGAAAGAGAAGCTGAACTAGATAAGGAAAAAACAGAAAAAAATTTACAAAAAGAAGAAACTAATTTAAAATCAGCTGAATCCAAAGTCACTGGAAGTGATAATATAGAGTCAACGATAGAACAAACATCCAAATCATCCGATCCTGAGAAAAATCCCATCGAAAATATTAAAGAAGATACAACAAAAAATACAATTACGGAAGTTGATCAAAAAGACTTAACAGTATCTTCACTGGAGAATGTTGAAATCGTAAAAATTAAAAAAAAGGATAATGCAACCAGCGAAGCAATAAGAAAAGAAAAGAAAAAAACGACATTTAGAGAATTCACACATTCAGAAGGAA
ATGCACGCATATATTGTACATTTTTGGGAGACTTGTTAAAAATGTACAACAAAGTAAAAAAACGTTTTGTTGGACACTTTTGTCATGCAATTGTTGTTGGCACTCCAATTATCTTAAAACAAAATCAAGTACACTTAAGCAGTAACATGAAAAGTCACCTGAATAAAATAGAACCACATAAACAAGAAAGTCTTCTTATCGTCATCATGAAATATTCAAGCTATAAAGATTGGAAACATGCGTTAAAAAAATCTAACATCAAACACTTAATTACAAATATAATGCATACGGTCAAAACTTATAAAATCGATGGAATACAATTTTCAAATTTACAACCAATAGCGGGGAAAGATCCAGACAATTCAGTGGATACACACACGATGAATAATCTATTAAAATTCTTTGAAAAACTACTAAATACTGCAAAACATAATCATAATTATGATTTAAAAATTGGCATAACCATTCATTTGAACAGTCAGTGGATCACATCAAGTTTTACTTCATTCGCTGAATTAAATAAACTAGTCACTTGGTATACATACGAAACAATTTCCATGGTAACATGTTCACCAGAATACAAAGATACAGGCACTTCTCCATTAGAAGGAGACGTGAGCTTGATGAATGCATATAATACATTAACGGATACCAATATTGAAATGTCAAAAGTAGTAGTTGGCATACAATTATTTCCAAATAAAGTTAATAAATTAGAACCATTTACATATGAAGAGTTATGTTCAACACCAAAGAACACTTGGAACGAATGGTGTGCTGCATACCCTGAAAAACTTCGGTTAAAGGGTATATTTTTACGGAACAATGAAATCGGAGGCGTCCAACTATTTTACATGCACTCAGACGATTACAGGTCAACATGCGGCTGTTATTCTTTCCCGTTGACTCGAGCACTTCTTCGTGGCTTGATTAACACTCAGACGGAAGAACAGTGTAATTTTATTACGGCACACAACTAAATAGAAAATACCCGCAATAAAATCAAGAACCATTATAATAATATTAGTATCGTTTTCCTCATTAGTGCATTATTAGTAATTATTTTTTAGGCACTTGGAGTATGAACATTTTAATATTTTATATATCATTACTAAATGAATGTATTCTATAACAAACGCGGGTTCGTATACGACACATTCGTTCATTTTAATTAGCTAAACATATTGTTGTATAATTATTTTTTTAACACGCATAAAATACTGAATATATTTTATTAATTTAGTTTTTTTTTTATTATTCTTGCATTTTATTTTATCTTATAACACAGAACAAGATACTTAACTCCTATAAGTTGTATGAGTATAGACTGTAAGTATTTACTATATTTATTCGTACCCATAGTAACTATGTTAATATCACGACCTCGAGAGTTTATAATCATCATATTCACTCCTTTATTTTAATAAACCAAAATTTAAATAGTATAAAGTACAGTGGACGCCGCTTATAAGACTTACTTTGGGACCAACACAAAGTGAGTCTTATAACCGAATGAATCTAAC\n>XM_048102724.1 PREDICTED: Salvia hispanica GDSL esterase/lipase 6 (LOC125204156), transcript variant X2, mRNA 
\nAAGTTTTATTTAATAAATAGGAGTTTCAAATGAAGAAGAAAACTACAAATTGGTGTTGAACAGTTGAAGAAGAGTTGGCATAAAACAATATGGTGATCGAAGCCATGCATGCATTTAGTTAGTGTTGCTATGTCGTCTTCCTCGTTTTCCCGACATAACACCTCTCTCTCTATATATGTGCAAAATTCACAACAACTTTACTCAACTAATTGATTAATTTAATTTCTACAAAATCACTGGTAAAAATGGAGACACGGTTGCTGCTCGTCTCCGTCATTCTATTTCTTCTAGCAGCTTCCGCCATCGGATCTAAAATTCCGGCAATTTTCATATTTGGGGACTCGCTCTTGGACGCCGGAAACAACCCCTACATCCCAAATTGCACCGTTCAGGCGGATTTCCCGCCCTATGGATCCAGCTTCTTCGGCCGCCCCACCGGAAGATTCACCAACGGCAGAACCGTCGCCGACTTCATCTCTGAGTATTTAGGCATTCCACTGCAAAAGCCATACATGGAGGTGATGAACGGAACGGAAAAGAAATTTCCGGCCAACGGAATCAATTTCGCCAGCGCCGGCAGCGGAGTTCTTCCGTCCACCAATACAATTTCTGGAGTGACAGCAATCCAAGTCCAATTGCAACAATTCAAATCACTAGTCCAAAAAAATCAAATAGACAGAAAAGTCGTAAAAGATTCCTTGTTCTTGATAGAATCAGGATCGAACGACATATTCAGCTACTTTGATCCATCAACCTCAACACCCGAGGCCTATATACAAACCATGCTCGGACAAATCCACAACTTCGTCGATAACATCGTTAGCCTAGGGGCCCGCTGTGTCGCCTTGTTCGGACTAGGCCCGGTCGGCTGCGCCCCGGCTAGGTCCAATCTGCCCGGTGCCCCCCTCGGAAAATGCTACGACAAGTTGAATAAAATGGTCATGAAATACAACATGGGGTTGCAGAATTTGGTGAACGTTTTGCCTCGCACCCATCCCGGCACCATCGCTGTTTTTGGACGTGTTTATGAAACTATCCAAACCTATCGAGCACATCCTACGCGTTATGGGTTTGTGGATGTGGAGAACGCTTGTTGTGGATCTGGGAAACTAGGAGGACAGGTGCAATGCGGGAAGGTGGGCTACAAATTGTGTAAGAATCCAAATGAATACTTGTTTTGGGATTACTTTCATCCATCGGAACGGACTTGTGAGCTCATTAGCAAGGCCTTGTGGGCGGGCGGCCCGACTTCTATTATGCCCTTCAATCTCAAGCGGCTTGCCAATATGCCTGTCGCCTAATTGTTTAGGGTTCATATTTCATTGTTATCGTCATCTAAACGGTTTATGTTATACCGAAATGTTATTGGATTTTAGTTAA\n>XM_042583618.1 PREDICTED: Zingiber officinale exportin-4-like (LOC122024892), transcript variant X3, mRNA 
\nCCTTACTCAGGTGTTCTTTTCATTTCCAGGAAGGCGCACACACAGGGGGAAGGCGGCTTGAAGGGCTACCAGGCCCTCCGATCGCTTCCCTTTTCCGCACAATTTTATCTGCCGACTTTGAGAAAGCTCGCAGCTCACTCCCGTTCCTGCATCCCCATCTCCTTTTGATCGTCTCTTCCTCGTCGCTCCTAATCCGACACACACAGTACCCTAGAGAATAGAATCGGACGAGATTGAGTTGAAAAACAAGAGGCAATGCAGGGGTTCCCAGGATCAGTTCCGGATTTGTCCCAGCTTCGGTCCACCATGATTGCAGTTGAACAGGCTTGCTCCATGATCCAGATGCACATGAATCCAACTGAAGCAGAGAAAATTATTGTTTCACTGCGGCAATCCTCAATGCCATTCCAGGCATGCCGATTCATACTTGAAAATTCTGAATTGCCAGCTGCAAAATTTCAAGCTGCTGGAGCAATTGGTGATGCTGCAATTAGAGAGTGGGGAATGCTTACAGATGAGAATAAGAAAAACTTAATAGTATTCTGTCTACACTATGTTATGGAGCATGCAAGTGCTTCTGATGCTTACGTCCGATTAAAGGTGTCTGCAGTTGCAGCTCAACTGTTAAAACGAGGATGGTTTGATTTTGTTGATGCTGAAAAGATTTGTATTCTCTTAGAGGTGAAGCAAGCCATTCTAGGACCTCATACATCAGATGTGCAATTTGCAGGGATTAATTTCCTTGAGTCCTTGGTATCTGAATTTTCACCTGCAACTTTGACTCCGATGGGCCTTCCTAAAGATTTTCACACCCAATGTCATTTGTCAATGGAATCTAATTATCTGAAGGAGTTCTATTGTTGGGTTCAATCTGCTGCGTTTAATGTGACTGAAAAGATAGTGAGCTCATATGCAAGCATATCTGATGAGAAAGCATGCTCTGCAGCACTGCGGTTTATGTTTCAGGTTTTGAACTGGAACTTCCAAAATAGTTCCATTTCATGGGATACCTCCAGAAATAAATCAAATTTAGTAACATACGGTATCAGACATGATGTGGTTCAGTTGAAAAAGTTTGAACGGTCATTGGTTGAGCCAGGACCCTCATGGCATGGTGCTATATTATCAAGCGGACAAACTCTTTGGCTTTTGAACTTGTATGCAACAGTTCGCCAGCAGCATTTATCTGATATTTTGTGGTTTGATTCTCCCTTATCAGTCTCTGCCAGGCAGCTAGTAGTGCAGTTATGCTCTTTGTCAGGGACTATATTTCCTTCCGACAATGGGGAAACACATATTAAGCACCTAGTGCAGATTCTGTCAGCTGTTATTGATTGGATTGAGCCGCCTAACATAGTCTCAGGAGCATTACGTGGGGGGCGAAGTGAAAGTGAGATGATTGATGGTTTTCATGTATTACTTTCCATGGCAACCATGACTACAACTGTGCTTTTTGATAATCTTCTTAGGTCTTTAAGACCTTTTGGTACAATTCAATTATTGTCTGCCTTGACTAGTGAAATTGTTAAAACTCATGTGAGAAGAACTGATGTTGATCAAACATGGACATCAGAGGCTCTTGATATTCTCTTGGAGATATGGACCCTCATTCTTGGGAGAAATGACAATGAAAGAAAGGTTTCACCTGAAAACATATCATCATTATCGAATTTATTCAAAGCTATTGTGGAGTCGCATCTTAATGCTGCTGCCCAATCTGCATTTGAAGATGATAGTGATGCTGAGTATTTTCATGTCTCTGTATCAAAACGAGATGAAACTTTGTATGCATATGCTCTTATTGCACGAGCTGCAGTTGAAACCAATATTTCCTTTCTTATGAAACTGTTTGCAGAACGTTGTGCTCTTCTCAGTCAGAATAATGAAAGTTGTGATCCTACACAAACCTTAGAAGAACTCTACTGGCTTCTATTGATTACTGGTCACGTGCTCACTGATTCAGATTCCAGAAGCAATACAAGACGGGTTTGCTGATGT
ATCAGATGAATCACAGCATCCAGTGGTTGTTTTTTCCTGGTCAATACTAAGTTTTGCTAGGCAAAG\n>KM122633.1 Uncultured bacterium clone LNH_9_9_11_Pumice.146514 16S ribosomal RNA gene, partial sequence \nCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGGGGAGGAAGGGAGTAAAGTTAATACCTTTGCTCATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATCTGATACTGGCAAGCTTGAGTCTCGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACGAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCGACTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAGCGACCGCCTGGGGATACGGCCGCAAGGTTAAAACNCAAATGAAATTGACGG\n>KF304776.1 Cystobacter minus strain Cbm6 small RNA Pxr-2, complete sequence \nAAGTGAGGCTGAAGGAGGTTCCCCCCCACCGCCTTCAGCACTTCCGGTGAGCTTCCTAAGAAGAACCCGAGGCCCGGTCCCTTTCTGAGGTGACCGGGCCTCCTTCTTTT\n>XR_007867290.1 PREDICTED: Lolium perenne uncharacterized LOC127325588 (LOC127325588), transcript variant X4, ncRNA 
\nTCCGGATCCCGTCCCCTCTCCGCGTCCAGACCTCGATTAATTTCGTCATGCGCATGGTCCTGCCCCGTACGTGCAGGTAAGCGGAAGCAGATCAGGGACGGCCTGTCCCCGCTCGACGACCACGCAAAAGGGCTCGTCCACTCCGGCCTCGACCAGGAGGAGCTCTTCCGCCCACCAAATTAAAGGTCACTTTATCCTTTATATGGAGCTCATGACTACAGCCATCAAATGTCTCAGTCTGCTCCTCAAGCGGAACCTTATGGTGACAATCTTCCACACATCGATCCCTGGGGCCTACCGAAGCTGAGAAGAAAGAGATGGCGCCACGGTGGCTCTTGGCGACTTCTGGTGACATTGGCCGGCTTGGAGGCTTGATGGGAGAGCTGCAGGTCTAGCTGCTCTGTCCCAAGTTTCACCTCGGTGAGCTCGACTCATAAAGATCGATGGGTTTAAGCTGGATAGACGGTGGTGGTTATTGTTGCAAGAAATAGAAAAGAAGACCTTATCAGTGCACCCCATGCCCATGATTATTCATTGCTGCTGCTTCACCACACACCCAAGAGGAGCAGGTTCGGGAGAAAGAAAGGGACCCAAAATAGAAACAAGAAAGGGAAAAGAGAAGAGATGGGGATTCTGCGAAACTTCCTCGAGCTCGCCATCAATTCATGTCTCGTGCTGCCATGGTAACCTTATAGTTAGTCCTTTGATTACAGATTGGTGGATGTGTTGGTAGAATTTACCCGGTTGGTTTAGCTTTACGACAGTATATTGTTTACCCGATTCCGGCGAATGGTTTGGAAAGGGGAGCAAAAACAGTACAGTTGAACATGCAGTTTTCTGTATAGTGAGTTATCATCTTTTTTTATATTAAATCAAATACGTTTTCAACATAACAATCGAAGAAGTTGTCTTGTAGGTACCAAAACTTATATTGGTTTACAGATTTAGTTTTCTCTATTAATTTGTACTAAATGACTTAATAGTTTGCCCAGTGTGGACATATTTGCCATCAAAGCTGAGATTTGGTGCTTATGTGTGCTTTTTGAAACATGTGCTTTTGAAGTTCTAGGCTTCCAGCTGCAACTTTCAGAGTACACCTGGGTAAATCATTAACGATACATCACTCATTTTGCATCAGCTTTCACAAAAAATAAACTTATTTGGATTCTTAGAAACATGATACTGTTTTCTGAAGTGTAAGCCACCACCAGGTTTCTTTATGTCTCGCTTCAGAGTTCGGGCTTGAAGGTTTAGCTAGTGACTGCAATCTGGTTATATACTCTCTTATGACGAGTTAACGTCAGTTTTGAAGGTCAAACTGTGTTGATCTGAAGCTTTCTGGATGTATACATATTAGCTTGAGCACGCTGATTTTGAGGAGTAGCCTGCTTTTGCTATGTTTGTAGTCTTCTAGTGAGAATTGACTTGAGCTTCTCTCGTGTGCTTTTTTGTGTCTAGGAGTGCTATTCTGTACATCCAGAATTGTCATTGATATATAGTTTCTTTGCAAATACCTTATGTGTTGGATTTCTCTTGAGGATCTTCTCCTATGCTTTTTAAAAAAAAAATTATTTGTTGTTCATTCATCTGGGAGTTATCTTAGGTATTGATGAGGATGGGTTGGAATGTGGGATCATGGAACATTATTTTCCATTGGTTTTGACTTTTTTCTCATTGATGAAAAGGTTTATTACACAAATGCATGGTCTTGTTGCTGTCGTCTTAGAGCTTATACTCATGTTCCTGATTCTTGTATATACCCAATTTGGGTCTTTCACTGTTAATTATATGATAGTATTGATCTGGCATTTTAGTTGATAAACATGTAATTGCCACCACTTATGCTTATTAGGACAGCAGCTAGATTTAGTGGTTTTGGTTAAAATATTTACTTGCTCTGCTTTAGTGGTTATGGCTAAATATTGACTTGCTCTGTTTGAGTGACGAAAAAGTTCGGACAAACTCCGTTTTGTTTTTATAATCTGCTTGGTGTTACTT
GGGAGGGAAACGGGAAGGAAGCCGTTGAGCACCTTACCAAGGCGATCCTAGTGAACCTCAACAACCATGTATGGTACAAAGAGGTCAGTCACAATAGCAGCAATGCTTGCAGAGCTTACTGACTTGAAAATGTCGCTACTCTTTGTATGTGGAGCTGTCCCCCGAGGAGCTGGATGCAGAGTGAATGAACTTCTCGATCTCGACATGTGGAAGAAGGCAGTAGTTGATAGAGGATATGTACAATGTCACCCATGATCCTCGCAGAGGATCCATCCATGGTGGCATGATCAGGATGGTGTGAGTGAAGCTTTGAAGGCCAGTTCTCTACCGATGTGCGTAGCATATGTGCTATCCCTTGTGACTTCCTTTTTTTGTAATTGCTTCACAGACCTGGAGTTGTAATAGTGTCACATCTGTCTTTGTTGCTTATTTACGTTTGGACTTGTGATCTGAGTTGGATGATGTGGGGTTTTGGATGTCAATCTGTGCTGTTGTGATACATATGAAATTTGGACTGTTGATTATTTCA\n>XM_025161730.1 PREDICTED: Tetranychus urticae CXXC-type zinc finger protein 1-like (LOC107366317), mRNA \nAAAAGTAAAAAACTTTGTTAGTGAAAAGTTTTTACCATTTTTTTAATATCACTCTCAATGTGATCAATTAATAGATGTCCTATCAAGCCCTGGTGGACAAGCTAGTTTCAATGGTCAAATTTTTGGCCTTGGTTTGGACTTAGTGCTAGTATTGGTGCCCGAACTACTAGCACCGGATCATCTGGTGCCTCAGCCTCTGGTAGAGCTGCAGTTAAGGCCGTTGTCTAAGTGAAGACTCAAAGGGCTTAAAATGGTTTTCTGTGGTGAAAAATATCTGTGATCGTCAAGTTTCAAGGGAAAAGGGTAGAGGAGAATCACTGGACTGTATTAATCGTTTAAGCTGTAAAATAATGATTTGCTTGTATCAAAATTTAAATATCTCAATGTTTTTTCACTATGAAATCAGGTTCAAGCGTATGAGCAAATAGTGATGAATTATTAACAGCTAAAGTAATTTTACCATATTAATTATCGAAATATAATTACTGTCATAGGTTTAAAATTTTCTGGTTTACCTAACAGACCTACCTTTAGCTAAGAAACACCTACTTAACCGTGAAATAGACCATTGGTTACTCTCACTACGTCTAACTTACAAGAAACTAATTACTTGTTAACGAGATGTTAACTTGTTGACTGTGTTTAAAATAAACAATAAACTTTTATTAAAATGAGTGAAGACATTGCTTATTGTATTTGTCGCTCTTCAGATATAAGTCGATTTATGATTTGTTGTGATAATTGCGATGAATGGTATCATGGAGATTGTATTTCTATGACTAAGGAACGCGCTTTTACCTTTTTAAAATTTTACTGCAGTAAGTGTCGTGATCGTGATCCATCCTTGAAAAATCAACTTGTTAAAGAATCTAAAAAATATGTGGTATACACAATATCCTCTTCTGAAGTGACCAGCAAATAGGGAACAGTTCGGAAAAAGAGCCCATCACCTCAGAGGTCTAATAAAGTGGCTCGTTATGAAGATGATGCAGCACCTGAGAAGAGGAATTATGAAGATAAAGACGACGATGATAAAGATGAAACTTCAATAGATAAGAATAATTCATGTGAAAAAAATAATGAAAAAAGTGAACTCAAATCTAGATCAAGCCGAAAAGAAGCAAACACAACACCAGCTGACAACGAACGGACCAATGAAAAAACACATAAAGACAGAGAGGAAGAAATCTCCGAGATTGATGATGGTTTGGGTCAATTTTTTCAATGGATGTTTGAATATGAATTTTTATCGTGGCGTAGTCTTGTACTTTAAGTATAGAAGATCTTAATTGCCCGTGTTGGATAATCTGGTGTTTTTAAACCAGGTAAAACTGAAGGCGAATCCTAAATCTTCACCACTAC
TATTACAGTATTTCCTTGAATTTTTTGCTTTTTTCAAGTGCTGACATCTATGTCAACTACAGGGGGGAATAATTCAATTTTACAGTTAGTCTATTCTAACGATTCCCCCTTAAGGGAAAAGGGTAGAGGGGAATCACTGGACTGCATAAATTGTTTAAATTGTAAAATAATGATTTGCTTGAATCAAAATATAAATATCAATCAATGTTTTTTCACTATAAAATTAGGTTCAGGCGTAAGAGCAAATGTTGATGAATTATTAACAGCTAAAGTAATTTTATCATATTAATTATCGAAATATAAATACTGTCAGAGGTTTACCTAATAGACTCTTAAAATAGAATAGAATGATCTTTAGCTAAGAAACACCTTCTTGACCGTGAAATAGACCATAAGTTACTCTCACTACGTCGAACTTATAAGATACAAATTACTTGTTGACTGTGTTTAAAATAAACAATAAACTTTTATTAAAATGAGTGAAGACAATGCTTATTGTATTTGTCGCTCTTCAGATATTAGTCGATTTATGATTTGTTGTGATAATTGCGATGAATGGTATCATGGAGATTGTATTTCTATTACTGAACAACTTGCTAAGACGATGACCAAATTCTACTGCCTTATATGTCGTGATCGTAATCCATCTTTAAAAATTCAATATCACAGTGTAGTCCTAAATACTGTAGCATCTAGTCCTAAACCCACCAGCAAACATGGAACTGTTCGGAAAAAGAGCCCATCACCTCTGAGGTCCAATAAAGTGGCTCGTCATGAAGATGTCACTCCATCTGAGGAAAGGGATTGTAAAGATAAAGACGACGATCATCAAGATGAAACTTTAAGAAATAAGACTGATTCATGTGAAAAAAATAACCAAAAAAGTGAAATCAAATCTAGATCAAGCCGAAGAGAAGCAAACACAACACCAGCTGACAACGAACGGACGAATGAAAAAACACATAGAGAAAGAAAGGAAGAAATCTCCGAGATTGATGATGGTTTGGGTCAATGTTTGCGATGGATGTTTGAATATGAATTTTTATCGTGGCGCAGGCTTATACTTTAAGTATAGAAGATCTTAATTGCCCGTGTTGGATAATCTGGTGTTTTGGAACTGAAGGCGAAACCTGAATCTTCACCACTACTATAAGGACAAGTTAAAATGTTTTGTTGTACTGACTAAATCAACTATTTGCAATTCCCTAACATTAAAATAAAAAAAATTAAATTGTAAGTGAAATTTTGATATCAATAAGAATCAGCTTTAATTGTTCATTTTTGCTGTGAGATGACATGCAATTTAAGTTAAGACCTCAAGAAAAAATATCCAAAAGTAAAATTTTAACAATTTCTGAGAGTTTTATCATAAATGTTCCGAGTTAGATTATGCTCAACTTGAAAAGTGAAAAACCTTTGTCAGTAGAAAGTTTTACCATTTTTTGAATCTCCCTCTCTATGTTATCGAAAAGTAACTGAGTAACCAGTTTTTAAAGTCTGTTTGACTGGTTTCGGTAATTTTACATTTGTTTACAAACTCTGTTTATCTTCAATTTCGGCAGTTTTTATCCTTACGTCAAAGTTTTATTATTTAAATGTTTTTCTTATTAACTTAAGTGATATCAACATGGGTGAAGACACTTCTTACTGTATTTGTCGCTCTTCAGATACAAGTCGTTTTATGATTGGTTGTGATTCTTGTAATGAATGGTATCATGGAGATTGTATTTCTATTACTGAACAGCTTGCTAAGACGATAACCAAGTTCTATTGCCTCATGTGTCGTGATGCTAATCCATCCTTAAAAATTCAATATCACAAAGATTCTGGCTCTAAATCAACTAGCAAACAGGGGACTGTTCGAAAAAAGAAACAACCAACTTCTAAGTCCAATAAAACGGCTCGTTTTGAAGATGATGCCTCACCAGAGAAGATGGATTTTGAGGATGAAAACGATGAAGAGTTTGATGACGATGATGATGGAGATGAAACTTTCAGAA
TTGAGAATGAATTATCTGAAAAAAATAATCGAAAAAGTAAACCAAAATCTAGACCTAGCCGAAAGAAAACAAATACAACATCATCTGACAACAAACGTGGAAGTAAAAAAACACATAGACAAAGAGAAAGAGAAAGAGATGTCTACGAAGTTGATGATGGTTTAAGGCAATGTTATGGTCCTGGATGTATCAATATAGCTCGTCGAGGCTCCAAATACTGCAGTGATAATTGTGGTATCAAATTAGCAACCAACAGGATAATAGAAATTTTACCTGAACGTATAAGGTTTTGGCAAAGTACACCATCAAGTGCTGATGTTTTCAGTAATCGAGAATTAGATGCAATTCGAACAGAAGGAGAAACAGCCAAAAGGCTTCTTGAAGAACTGGACGGTAAACAAAAAGAACTAGAAGCTATGATTGCCGAGGCCAAGAAACTACCACCAATCTCAGAAGATGAAGTAGACGAAGAGACTGGAGATGAGCTGATGACTTACTGTGTAACCTGTGGACATGAAGTTGCATCGAGAACTGCTTTGAGACACATGGAAAGATGTTTT\n>XM_043408227.1 PREDICTED: Colletes gigas uncharacterized LOC122404294 (LOC122404294), mRNA \nATGCATATGATAACAAGACAAAGGCTTGGTCGCCCGAGAGGACCAAATGCTAACCGCCCTAGGGAAGTGGTTCATGATTCCGCTTCTCCGACATCAGAAGTGAGATATCCTCGGCTACAAAGCGAGTCAGATGCAAATTGCGAACATCAGCCGCATGAAAATGTGCCCATTCAAGACAGCGCGTATACGATGCCGCAGTCGGCTGCATATGCAGCGCGGCTTATGGCCATGCTCACCTTGCGATGGCAGAGTTTCTCTACAGAGCAGATTGCTGTAGCAATGGTTCTGGCGCACACGGCTCAATTTGATAGACGACTCCAGAGATTAGCCTTTACCACAGAAATCAATTCAAGGGACAAGCTACACCGTGCAACTGGTCACTATGCTTCCAAGTGTCACCAAGTAGCTGGCAAGGGTAGCGGCGGTGCTAGCAGCAGCAGAGATTTTAACAATGCAGTTACGTCAAATACGGTTCAGCGACGGGTTGATGTTTGTCAGATAGGTAACCCTAGTGGAAAACTGGTCTGCAATGATCAGATAGCTAGATTAGGAGGTGCTCGGTGGTACTCCAGTTTTGATATGTTGAGCGATTATCACCAGATCCCTGAGGAAGCCAATTCTATTGAGAAAACGGCCTTCGTTACTCCTGAAGGTCAATGGGAATATTTGACCATGCCATTTGGGTTAAAGAATGCTAGTTCGGTCTACCAGCGAGCTATTGTAAAAGCCCTCAGAGATATGGCATTTAGCTTCGTTTTATGA\n>MZ269370.1 Colletotrichum fructicola isolate 25640 internal transcribed spacer 1, partial sequence; 5.8S ribosomal RNA gene and internal transcribed spacer 2, complete sequence; and large subunit ribosomal RNA gene, partial sequence 
\nGAGTTTACGCTCTATAACCCTTTGTGAACATACCTATAACTGTTGCTTCGGCGGGTAGGGTCTCCGCGACCCTCCCGGCCTCCCGCCTCCGGGCGGGTCGGCGCCCGCCGGAGGATAACCAAACTCTGATTTAACGACGTTTCTTCTGAGTGGTACAAGCAAATAATCAAAACTTTTAACAACGGATCTCTTGGTTCTGGCATCGATGAAGAACGCAGCGAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCGCCAGCATTCTGGCGGGCATGCCTGTTCGAGCGTCATTTCAACCCTCAAGCTCTGCTTGGTGTTGGGGCCCTACAGCTGATGTAGGCCCTCAAAGGTAGTGGCGGACCCTCCCGGAGCCTCCTTTGCGTAGTAACTTTACGTCTCGCACTGGGATCCGGAGGGACTCTTGCCGTAAAACCCCCCAATTTTCCAAAGGTTGACCTCGGATCAGGTAGGAATACCCGCTGAA\n>XM_036071201.1 PREDICTED: Halichoerus grypus sequestosome 1 (SQSTM1), transcript variant X2, mRNA \nCCCGCCGCCGCCGCGGCCCGGCTCCGTCTCCTGCTCTCCGACCGGTAGCGATGGCGTCGCTCACCGTGAAGGCCTATCTTCTGGGCAAGGAGGACGCGGCCCGCGAGATCCGCCGCTTCAGCTTCTGCTTCAGCCCCGAGGCCGAGGCGGAGGCCGAGGCGGAGGCCGCGGCCGGGCCCGGGCCCTGCGAGCGGCTGCTGAGCCGGGTGGCCGCCCTGTTCCCGGTGCTGCGGCCCGGCGGCTTCCAGACGTACTACCGCGATGAGGATGGAGACTTGGTGGCCTTTTCCAGTGACGAGGAACTGACCATGGCAATGTCCTATGTGAAGGATGACCTCGTCCGTATTTACATTAAAGGTCTGGAGGGCAGGGCCAGGGGCCCGCTGACTGAAAGCCCCCCAGTCGTGACGAGCGGTTCGTGTGGGGTCCCACCTGCAGAGAAGAAGGAGTGTCGGCGGGACCACCGCCCCCCGTGTGCTCAGGAGGTGCCCCGCGGCCTGGTGCACCCCGGCGTGATCTGTGACGGGTGCAATGGGCCCGTGGTGGGGACCCGCTACAAGTGCAGCGTGTGCCCGGACTACGACCTGTGCTCCGCCTGCGAGGGGAAGGGCCTGCACCGTGAGCACAGCAAGCTCGTGTTCCCCGGCCCCTTCGGGCCCTTCTCCGAGGGCGTCGCTCACAGCCGCTGGCTCCGGAAGCTGAAACACGGGCACTTCGTGTGGCCCGGCTGGGAGATGGGCCCCCCAGGGCACTGGAGCCCGCGTCCTCCCCGGGCAGGGGACGCCCGCCCCGGCTCCGCAGCCGAATCAGCTGCTGGTCCGTCGGAGGATCCCAGTGTGAATTTCCTCAAGAACGTAGGGGAGAGTGTGGCGGCCGCCCTGAGCCCTCTGGGCATCGAGGTGGATATCGACGTGGAGCACGGCGGGAAGAGGAGCCGCCTCGCCCCTGTCTCTCCAGGCAGCTCCGGCACCGAGGAGAAGTGCGGCTCCCAGCCGAGCAGCTGCTCTTCGGACCCCGGCAAGCCGGACGCGGACCCGGAGGGCGCGGCGCGGTCCCTGGCGGAGCAGATGGACAAGGTGGCCCTGGAGTCGGTGCCACCGGAGGAGCAGATGGAGTCGGATAACTGCTCGGGGGCAGACGAAGACTGGACTCACTTGTCTTCCAAAGAAGTGGACCCGTCCACGGGGGAACTCCAGTCTCTACAGATGCCCGAATCCGAAGGGCCGGGCTCTCTCGACTCTTCTCAGGAAGGGCCCACGGGACTGAAGGAAGCTGCGTTGTACCCCCATCTGCCACCAGAAGCTGACCCCCGGCTCATCGAGTCCCTCTCCCAGATGCTGTCCATGGGCTTCTCTGACGAAGGCGGCTGGCTCACCA
GGCTCCTGCAGACCAAGAACTACGACATCGGGGCGGCGCTGGACACCATCCAGTATTCGAAGCACCCGTTGTGACGGCTTCTGCCCCCTTGTCCCACCCCCTTCTTGTCTCCTAGTTGTGTTGAGCTAGTGTAGAACAGCAGGGCCTCTCTAAGGGCCAGTTTCTCTGCATTCTTCTTCCAGAATCTGGGGGGCGGGGATGCACCAAGCCATCCAGGGCAGTGGAACAAGTGACGGGGGGGGGGCCCCGTGTGTGGCTGCCCATGTCGGAGAAGCGTCTGCTGGCTTCCAGGGGCGGACGCGGGGCCCAGTGGTGTTCTCCTGCCCTCCCCCCACCAGGATCACACCAGCAGTCCAGAATGTCTTGCCTAATGGCCTTTTTTTTTTTTAATGACTAATAGTAGGCTGACA\n>XM_050309850.1 PREDICTED: Myiozetetes cayanensis ring finger protein 111 (LOC126636998), transcript variant X10, mRNA \nGCAGGCTCACCCGTGTCTAGGCCTTCCTTAAATCTTTCCATGTCTGAATGGACTCCTGAATGTAATATAGTCTATACTCCAGAAGCGGATATGAAGAGTGAAGTTCCTTCTGATGCACCAAAGAGCCAGGAGAGTCTGAAGGGGATCCTCTTGAACCCTGAGCCTATTGGGGCGGCCAAAAGCTTCAGTGCAGAAGTTGAGATGATTGCCAGTAAAGTAGGGAATGAGTTCTCCCACTTATGTGGTGACTCTCAAAAGCAGAAGGACATGAATGGCAACCATACAGACCAAGAAAAAAGTATTGTGCGAAAAAAACGCAAGAGCCAGCAGGCTGGTCCTTCCTACGCTCAGAACTGTCCTGATAAGGAAAACAAAGGAATCTTGGGATTGAGGCAGCATCTAGGAACACAGAGTGAGGACAATGACTCTTCTTTTAGTGACTGTATCTCTTCACCTTCTTCTAGCTTACACTTTGGAGACTCTGACACAGTAACATCTGATGAAGAGAAGGATGCTCCTGTCAGACACCCTCAGGCAGTGCTGAATCCTGTGAGCAGAACTCACAGTGCCCGGTCACACAAGTGGCCTCGCACTGAGGCAGACTCTGTGCCCGGATTACTCATGAAAAGGCCCTGTTTTCACAACAGCTCTTTAAGAAGGCTCCCATATAGGAAAAGAGTTGTGAAAACAGGCTCATCCCAGCGGACACAGAACCAAAAAGAGCGGATTTTAATGCAGAGGAAAAAGCGGGAGGTGCTGGCTCGCAGGAAGTACGCACTGCTGCCCAGCTCCAGCAGCTCCAGCGAGAACGATCTCAGTAGTGAATCTTCCTCCAGTTCATCTACTGAAGGGGAGGAAGACTTATTTGTGTCACCTGGTGAAAACCACCAGAACACTACAGCTGTTCCTTCAGGAAGCATTGATGAAGATGTTGTGGTGATTGAAGCATCCTCCACTCCCCAGGTCACTGCTAATGAAGAAATAAATGTTACCTCAACAGACAGTGAAGTGGAGATTGTCACAGTTGGTGAAAACTACAGGTCTCGTTCTGCACTTGGACACACAAGATCCCACTGGGGCCAGAGCTCTGGCTCTCACGCTCCACGACCTCCGGAGCAGCGGAACCGCAGCAGGATCTCCACGGTCATCCAGCCCCTGAGGCAGAATGCGGCTGAAGTTGTGGACCTCACGGTGGATGAGGATGAGCCAACAGTTGTGCCAAGCACATCAGCTCGAGTGGAGCCGCAGGTCGTGAGTTCTGCTTCCAGTAACAGTTCCAGTACCTCTACCTCAGAGCAGGCCTCTGATGCAGCTCCCACCATCTCCACCAGCCAGCCCTCTGCAGCTCCAGAGACGACTCCCAGTCTTCCCAGTGGCAGCACTGCTGGTACTTCAGCTGGAGATGACATAAGAAGAACTTCATCTAATACAACACTGGAAACTGGCCCTCCGGCCATGCCAAGGTTA
CCGTCGTGCTGCCCTCAGCATTCTCCTTGTGGAGGACCTTCACAGACTCATCATGCCTTGGGGCACCCACATACGAGCTGCTTTCAGCAGCATGGCCACCACTTCCAGCATCACCACCACCACCACCACAACCCTCACCCGGCTGTCCCGCTCTCCCCTTCGTTCAGTGACTCCAGCTGCCCTGTGGAAAGGCCTCCCCCGGTGCCTGCCCCGTGTGGAGCAAGCAGCAGTTCTGGCACCACTTACCATGATCAGCAGGCACTGCCAGTAGACTTAAGCAGCAGTGGTATAAGAAGTCATGGAAGTGGTGCTTTTCATGGAACATCTGCCTTTGATCCTTGCTGTCCTGGTTCTTCATCCCGAGCGACGATCTATGGGCACCAGGCTGGGGCTGGGCCGAGCCAGTCCCTGACAATAGATGGATACGGATCAAGCATCGTTGCTCAGCCACAGCCCCAACCTCCTCCTCAGGCATCGCTCTCCTCCTGTCGCCATTACATGCATTCTCCTTTACCTGATGTTTTCATTGCAGATGCTTCCTTGACCAGACCACTTCACCATCAAGCTTCTGCATGCCCTCACTCTCATGGAAATCCCCCTCCACAGCCACAACCTCCACCTCAAGTAGATTATGTTATCCCTCATCCAGTGCATCCCTTCCATCCTTCAATCTCCTCTCATGCATCTTCTCATCCTGTTCCACCTCCACCACCGACTCATCCTTTAGCCAGTGCAGCTGCTCCAATCCCACAGCATCTTCCTGCAACACACCAGCCTATATCCCATCACATCCCTGCAACAGCACCTCCAGCACAGAGGCTACATCCTCATGAAGTGATCCAGAGGATGGAGGTCCAGAGAAGAAGGATGATGCAACACCCAACACGTGCTCATGAGCGACCTCCTCCACATCCTCACAGAATGCATCCCAATTATGGGCATGGGCATCACATTCATGTGCCTCAGACTATGTCTTCCCATCCTCGACAAGCTCCAGAGAGATCTGCCTGGGAACTAGGAATTGAAGCTGGTGTGACTGCAGCTACTTACCCTCCAGGGCCTTTGCATCCTCACTTGGCCCACTACCACGCACCTCCTCGACTGCATCATTTGCAAATAGGGGCACTCCCTCTAATGGAGCTGATTCACTTGGAGGAACGATTAGGCAACGTGAATCGTGGAGCAACACAGGGAACTATAGAAAGATGCACATATCCACATAAATACAAAAAGAGGAAACTGCACTGCAAACAAGATGCGGAGGAAGGAACAGAAGAAGACACAGAGGAAAAGTGTACCATCTGTTTGTCTATCTTGGAGGAAGGTGAAGATGTCAGGCGCCTTCCGTGTATGCACCTTTTCCACCAAGTCTGTGTAGATCAGTGGTTGATTACTAACAAGAAGTGCCCCATTTGCAGAGTGGACATTGAGGCTCAGCTGCCCAGTGAAAGTTGACACTGCTTTCCAGAACTCTTGTCCTCCCGCTCGCTCCCTCTCATCCCTCCTGGTACTGCAGTCAACCAAAGATGGCATGACTTACCTGCGCAGATGTGGAACATTGAACCTTAGAGTGCTGGCTCTGCTACATGGTACAACTAATGCTAGACCTACAGTTTATTGTAGAAGACAGTTGAGTTTCAGTGTATTTATAATTTTTTTAAAATTTTTTTAGGTTTTACTTTTTTTTCTTTAAATTCATTACTGTATTTTTGCATGGTTCCTTGTATTGCATTTGTTTGCACATATTATGGGCTTTGTGACCCCAAACTTGCAGGCAAGATTAGCTGCTTTAGTAAGTAGAATTGTGTGGTCTCTTTTTTTTTGGTTTGTTTTATGTAGTATCAAGCTTTGAAAGTATGATTTCACTCATTACTAACCTCGAATTCCTTAATTTAATCAATCATATTTTAGTTTAAATGTATAAAGATCATCTAGAAAAGGATAATATTATGTATTGAGACATTCCTTAATTAGGAAAAAATGGCTGCTGTATATTTACA
ATATCAGTTCTGAGTCAAATAACATCCTTAATACTGGGAACAGAATATGGACTATATTCAGTTTGACTGATACATATAGCATACTCATCACCAGAGTTTTTGTCTGATCAGATTTTTGTGTTTGTTTTAAAAATTTCAGCACAATGCAGATATATTTGAATGTCAATATTAAACATTTAGACTGCTGTTCAGATTGTATTTATCATTTTCTTCTATGTCTAGAAATTTGAATCCCTAACTTAAATATATGCTGCTGTGAAACAGCTCTAGTGAACACTAAATGTTGATTTCAGTTAGCTGGATTGTAGATACTTGCAGATTGAAAGACTTATTAGGGAAATGGAAAAAGAGCTTAGAATCTGTTTGGTCTTCTGCTAACTTAAGTTGAAGTATCTGCGCACATTGAGAGTTGGTTTGTTTTTTTTTTTGTTGTTTTGGTTTGGTTTTGGGTTGGGTTTTTTTGGTGGGTTTTTTTTGAGGGGAGGGGTTGTTTGTTTTTTTTTTTCTTTTTGTTGTTGTTGCTGTTTGGGTTTTGTTGTTGGTTTGTGGGTTTTTTTTTAATATAAAACCATTCAGTAAGGACTTTAAGCTACAGGGTTTTTGTTTGGGTTTATATACATGCATTCATAGAATTTCTAAGGATTCCAGGCGTGTCTTGGGATTTTTATTAGATTTAAAGTTAATAAAGTTAGCTAAATCCACTTGTCTCTTGTTTTTATTTTTCATTAGTAAATTAAAAGCCTGTAAATTTCTGTAGAAACTGAGACACAAATTATGTGGTTACCTAGTTTTTGCCTTGATCATAGGTTCCCTCTTTATAAATTACCAACAGTCCATCACTGATTGAAGTATTTTCTATAGTTAAGATTTGCTGCATAATATAGTATATAGAATTAATAATGTACTAACATTTTGCCTTTGGAGGAGGTTTTAATCCACATCAGGATTCAAGTTGCTTCAACATTCTTTCACATATAATAGATTATAGTTTATTTAAATGTGCTCAACATTGCAAAATGCAAATGTGCAAAAACATTGGGACAGTATTACTGTCACTTTGGAAAAGATGTTCCTCGGGGATCATAGATAAATATGTCAATTAGCTTGCATTAAGCCACCTGCTTTGTAAGTGAATTGAATAATAAATACCTTCAGTTTCTCTTGTCTTTGTCTTTCATAATCAGATGATATGTACAATGGTTTACAGTAAATCTAGAAGATGAACTGTTATGTTTACACTAAAAAATGATCCATTTATAAATATTACCTTATCTAATTTGATGCCTGTTTCTGTCTGGTTCAAGCAGCTTCCTTTTTATTATTTTTTTTTTTTTTTTTGTCAACAAACTTAACACCTCTGGCACTGAGGCTTTTAGTGGAGAGAATTTTTATTCCAGTATGTATGTGATAAATGGACCTTCTCAAGCTTCCTTGTGTTGCTAGAACTGAACTTAAAACCACTTTGTGCTTGTAAATGGGGGATGAGGGAGAGAGGCAGCCCAGGATCTGACTGCTCCTGTGGGTTTCTGCTAAAGCTTTTGGACATGGTGGCTGTAGGAAATTCAAAGACTGGAGTTGGAGCTTCATTGCTAAAAATGAATAAAAGTAGCTGGAAGGACTGACCAGACACTTTGCTTTCCCATGACTGAAAAGAAGGGAAGTTAGTTGACTGCTAATGTTTGAAGACTGATATTCACTGCTAAAAGGTTCCAAGAAGGTACTTGAGAGACATGGGACAAAAAAACCCAGGGCCTCTAAAATAATAGACCCTGGGGTAGAATCTCTTTTGGCTTTGTTACTGGACAAAGAAGCACAGATTTGGGGGATTTTTTTTTTTAATTTTTTATTTTGTTTTTAGGAAATATTTTATGGGTCTGATTTGAGTGCGTGGTACTAGAGGTATTTTAGTGGTCCATGATTTGATTTATTAGAGCTACTGATACTGTCTTGCTTTTAAATGTATGCATAACATTGTAATGTGATGTTGAACACTTTTGTCA
GGAATCACGGTATTCTGATCTTAATGCTATTGCAGGGGCTAAAAAGCTGCAGCTTACTTCTGTTCCGGAAGGTTGTGACTTAACCGTAATTTAAGAGAAGGAGAAAGATTAGGCTTTTCATTTTGAAAATTTCCACCACTTACTGTGCTTTATATGCTTAGATGCATTGCCTTAAGTTTTCTGCAGCATCTTTGACTTTGAAGATAAGATTCTCAACAGTATGCATCAAATTACTTTTCATATGAAACTCCATTGTCAAAAGAAATCCTTTTGTATGCAATAAATAAAATGTTAGACTGGTATCATTCAAAA\n>XM_033409705.2 PREDICTED: Orcinus orca olfactory receptor 2J3-like (LOC105748649), mRNA \nTTCAACATTCCCTATCCAGTTCCTCTGTTGCATGTAAGTTCATGAACCAGCATTAAGTTCTAAGCAAAGGATAATCAGGCTTCAAAATTCTGACTGTGGTGTTTCCAGCAAGTAGTGTTAAGCAATGAGAAAATTCAGTAACACTTTTCATCACTCTGATGGCTTTGTTCTGGTGGGCTTCTCTGAATGGCCCAAACTAGAAATGGTTCTTTTTCTGGCCATCTCTGTTTTCTACATAATGACCCTCCTTGGGAATTTAGCCATCATTATCTTGTCATGCCTTGATGCCAGGCTCCACACCCCCATGTATTTCTTTCTGTCTAATCTCTCTTTTTTGGACCTTTGCTGTACTACTTCCCCTGTCCCCCAAATGCTGGTCAACATCCAAAGCCACTGGAGAAATATCAGCTACCTAGGATGCATAGCTTAACTTTTCATATTCCTTAGTTTAGGATCCACTGAATGTGTACTTCTTTCAGTAATGGCCTTTGGTCGTTATGTAGCTATCTGCCAGCCTCTCCATTACACAGTTATCATGCACTCTTGGCTATGCCAACAACTGGCAGCAGTGGCTTGGGTAACAGGTTTCAGCAACTCTTTGGTGCAAATAGTGTTGACCTTCTTGTTACCTCACTGTGGTCCATATCAGGTGGAGAATTTCTTCTGTGAGGTACCTGCCATGCTTCAATTATCATGTGTTGATACATGGATCAATGAAGTGGAGATGTATGCTGCTGTAGTGGTCATAAAAGTCTCTTAAAATTTTGATTATAAGGAATTTCACTTATTCAACAAATATTTGAGTGCCTAATTGTGTGCCAGGCACTGTTCTAGGCACTTTGGATTTATCAGTGGACCAACAAAGAACTTTGCACCATGGAACTTACATTTTGGTTTGGGAGAAATCAATGATAAGCAATAGATACTAAATATCATGTTAGAAGATGGTAAGTGCTCTGGAAAGGAAAAATGTGGAGTATGGTAAGAAGATGGGGATTGTGGGGCAGGAGGCATACATTGCAAGTTTAAATAGAGTGGTAAGAGTAGGACTCACCGTAGCTGTGGCATTTGAGCGAAGACTTGAAGGTGAGAGGAGACAATGCAGATATTTGGGGTAAAAATGTTCCAGGCAGAGGGATCAGCCAGTGCAAAGGCCCAGGGATAGGAGTGTGTTTGGCTTGTCCGAGAGATAGGAAAGAGGCCAATGAGAATGGAATGGAGTGTGTGAGAAGAGAATATCAGAGAGATTACACAGGGACCTGATTGGTTAGGGCAGGGGTTGGCAATTTTTTTCTATACAGGGCCAGATAGTAAATATTTTAGGCTTTGCAGGCCATATGGTCTCTGTCACGACTACTCAATTCTGCCTTTGTAGCACAAAGGTGGCCATAGACGATACTTAAAGCTTTACTGGAATATAGCCATGCTCATTTGCTTATTTATGGACTCTAAATTTATTTTATATGTCATAAAATATTCTTTTTCTTTTGTTTTCCACCATTTAAAAAATGTAAAAACCATTTTTAGCTCCCATTCTTAGCTCATGGGCCACATAAAAACAGGTATCTGGCTGCATTTGGTCTGTGGGCCATAGT
TTGCAAGCCCATGGTGAAGGGTTTCCAGGGCCCTTATAAGATCTTTTGTTTTGGGACTTCCCTGGCGGTCCAGTGGTTAAAACTCCGCGCTTCCAATGCAGAGGGCACTGGTTCGATCCCTGGTCAGAGAACTAAGATCCCAGATGCCACGTGGCGTGGCCAAAAGATTTTTTTTTTAAAAAAAGATCTTTTGTTTTTACTCAGAGTTTAAAGGGGGAGCCATTAGCAGGTTTTGAGCAGATAAGTAAAATGATTTGATTTATATTTTTAAGGGATCACTCTATGGAATGATGTCTAAGATTTGCTTCAAAATAATCTGGAGGGCAGGGTACTATGGGGGTTAAAGATGAATCAAGATGGGTCATACATTAATAATTATTGAGTCTGTATAATGGGTATATAGGGTTTAATATAGTATTCTCTATGCTATTATGTAGGGTTTTCCATACTAGAAGGTTAAAACAAAAATAGGCACTCTGGCTGCTTATTTGGAGCAGACTGTGAGGAGGGAAGGTTAGGAATGAGAAAAGCAATTAGGAGGCTATTACGGTAATCCTTGAGAGATGGCAGTGGTGGCTTTGTCTGGAGTGGTAGCCCTGGAGGTGGTGAAAAGTGGTTGGGTTCCAGGGCTTCCCTGGTGGCGCAGTGGTTGAGAGTCCGCCTGCCGATGCAGGGGACACGGGTTCGTGGCCCGGTCCGGGAAGATCCCACATGCCGCGGAGCGGCTGGGCCCGTGAGCCATGGCCGCTGAGCCTGCGCGTCCGGAGCCTGTGCTCCGCGGCGGGAGAGGCCACAGCGGTGAGAGGCCCGCGTACCGAAAAAAAAAAAAAAAAAAAAAAGTGGTTGGGTTCTGGATGAATATTGAAAGTAGAGCCAAGAGGATTAACTGTGTATCGGGTATGAGGTGTGAGAGAAAGATAGGAGTTGGGGAGGCTTCCAGGTTTTGGCCTGAACAGGGAGAAGGGTAAAGTTGCCATAAACTGAATGGAAAAATCTGCAAGTAGAAGAGATGTGGGCGGAAAGATCATCATGAGTTCAGTTTTAAACATTTAAGTTTGAGATGTCTACCAGATATCCTAGTGGAAATATTAAACCGACAGTTGTCTATGCGAGTTTGGAGTTTGGGAGGAAGTTTTGGACTGAAGACATAAATTTGGGAGTCATTGTCATGTAGGTATCTTTAGCTTGGACTGGGTAAGATCACTGAGTGAGGGAGTGTAGATAGAGAGGAGAACAGTACCAAGCACTGGGCCTTGCAGCATTCCAGTGTTAAGTAGTCAGGAGAGTAGGGAGAGATAGCAGAGGAGACTGAGAAGTCACCAGGGAGACAGGAGGAAAACCAAGAGAGCATAGTAGCCTAGAAATCAAGGAAAGAAAGCGTTTCAAGGAGAGGGGAAAGATCAGTGATGTAAAAATACTGCTTGAGTAAGACGAGGACAACAAATTGACCCCTGAATTTAGCAATGTGATTATTGGTAATCTGGATGAGCAGTTTAGGTGGAGTGATGATGGCAAAAGCTACATTGCCAAGGGTCAGGGCAAAGAAATGGAGTAAGAACAGTCCGGAAAAGTGAGGGAAAGAAGTCCGCTCTTTAAGATGGAAGAAATAACAAGTATGTACAGTCAGCCCTCTGTATCCGCAGGTTCTGCATCTGAAGATTCAACCAATTGCAGATTGAAAATATTTGGAAAAAAATTCCAGAAAGTTCCCAAAAGCAAAACTTGAATTTGCCTTGCACAGGCAACTATTACATAGCATTTGCGTTGTATTAGGTTTTATAAATAATCTAGAGATGATTTAAAGTACGGGAGGATGCACGAAGGTTACATGCAAATACTATGCCATTTTATATAAGGGATTTGAGCATCTGTGGATTTTGGTATCCACAGGAAGTCTGGAGCCAATCCCCTGAGGATACTGAGAGACTATTGTATGTATACTTGTTAACATATAGAACATAACAGTATGCATGCAAAGAGAGTGACCCATGAAGAGGAAA
\n>XM_042525726.1 PREDICTED: Zingiber officinale uncharacterized LOC121974587 (LOC121974587), transcript variant X1, mRNA \nTTGATCAACGTTTGACGAATTAGAGAGTTGAGGCCTCTTTTGTTTTGAATTTAAAGGAAATGGCGTCGTCTTCCAAGAGATCTGGCAGACCGGTGCTCCCTTTTCGGAGATCTGTCTCTCCGGCTGGCGGCTTCGCCTCCTCGTCAGCCAGCCTCTCTGCTCCCTTCTTGCATCACCGATCGGCCTCCCCTACCCGCGTCCACCTGGCCGGTGCTGGGTCTTCCGGATCTTCCTCCGTTCGCTTCTCCCTCAACCGATCTGCCTCCCCCGGACGCTCCATCGCTGCGTCCGACAGCCGATCATCTCCCGCCCCGGCCCGGCGCACCTGCCTCTGCTCTCCTTCCACTCACCCTGGATCCTTCCGCTGCCACCTCCACAAGGGCCTCAACGGCGGCGGATCCGCGGCCGCTTCCTCGCCGTCGAACAGGCTCAATGCGCGGAGGTCCGCGATGGCGAACTCGCTGGTCCGGATCGGGGCCGTGGAGGGCGAGTGGGTGAAGCGCGCGCTCTCGGCGCTCATCCGTCCCTCCTCCCACCAACAGCGTCGGCGGGGAGCCTTCCAACCCCGCCCTAGCCGCCTCTCTCGGATGTCCAACGCTGCCGATCCTAAATCTCCGTCGTCCGATCCACCGATCTAGAATCAGTAATGGGAGTAACGTTCCCTCGCTCCGTTACGTTCCCGTTGGGCTTCAAGTTTGGATTGCGTCGCCGTCAAGTTCTCATCGTTCGCCGGTACGTTCCGTCATCTGCGAGGGAATTGCCTCAGGAAGCTACTTGATTCAGTGACTCGGCCACTGGTGAGATGAATCGTAAGAATTATTTATTTAAATCATTTCGATAAATAGATAAAGGACATAAAATATGATGACTAGGTCTCAATTAAAACTATAATATTAAATCACTTTAGTATTAGAACCATTCACTTAACACAATAATCATGTAATGATTTTGAAATTCTATCAACGAATTTTAGAAAATAGAATAACTTCAAAGTTCAGAAGATAAAGTGAAAGTTTGGTAGAGGAAAACATTAGGTGAGGACAATGGACAAGTCCATGTGGAAGCCATAATTGTGGTGGGAAAATTGTTAGTGGAACTGAACCACCAAGAACCTAATTCACCTTCAAATTATTTCAACATCAAACGCATATTTAAAAACTACAAAAGTGAAACAAATAAAGAAACGTTGGGTGGGTTAGTTGGATTAGCTAAGCATCACCATTTAATATAGCACGCATATTTTACCATTACATTATTTTATTTATCATTTTAAATTTTAGTCTATAAAGGTGACGCAACAAAATTTAACATGTTATTTTTTTATCCTTTTAATTAAGAATAATGTACCTAAAAGTAACATATTGGATGTTATATTAATAAATATATCATTTTATTGTTTTCAAAGGGTCATCCCTTAGTGACAAGTGGGAATAATCACAATAGTTGAAATCATAAGGAGAACTTGTGATGGTGGAGATTGGATCTAGATGGTGAGGAAGAAGCTCCACCAGATTTTGTGATGACAAAAAGGACAGTTTGGATAATGTCTATCAACATAATATAAGCATTCCCTTTCAAATTAATTAATTATAGATATTGTTCTTATTAAAGAGTCACGGAACCAAGGTTATCATCTTGAAATATTGGTTAGTGGCTAGCAGGATCTTGTGTATCCCATGGGCTTTGACTGGAACAGTTGGCCACAGTTTATTATTAAAATTTGGGAAACCTAAAGATTTTTTCTTTTTTTTGTAAAATTTTACAAAAGAAGTATTAGAGGGAGATATAATTAATTACAATGATGAATTTATAAATTATTAAAACAATTAGAAAATGTATACCGGCCAAATTAATTAACACAACATTATGTGTATTC
ATCTGTTCCTTGTTTATCAAAGACAAAATTAATACAAAAGTGCGATTTGAAATAGTATTTTAGTTGGGTAAGTGTGTAGTGGGAATTGTCCCGCTTGCTATGGGTATTCAGATTATGGGGAGATCGTAGAGAAAAGAAAGAGAGAAAGGGAAGATGAGAAGTAAAACAATTTTAAAAGAAAGCGAAAATAATGATAATTCTTGCTTTTGTTCTCTTTGTCAACTCATTTTTCCATCCCATGGGCATTGCAGTTGGAAAATTTGCTACAAAGGAGGTTTATATTATATATTTCTGTGAAAGTCTCATTTATAGATAGTTATTGGATCAAAGTATAGTTAAAGAAAAAAAAACTTAATTACTAATTAATTAATATCCAAGATCTATTCTGCTCATATAAAAGAGTTATTCAAAAGATCGTACTGTAAAAGTTTCTTCCAGACTATTTGTTTCCCGATCCACTGATTACAATCATATCAAGTAGTAGCTGTGGGCAACTATAGCAATGGTTAGTGGTCGTTTTTTTTCCTGGTTTTTGATGGATGAATTTTAGAAAAAAGAAGAAATGTTGACCAATGTAACTGATGAACGAGCCACTCTCTAGAAGAGTGACAGATAAGAATCAAGCGAGGTTGAAAGGAAAATTTTGACCGGAACAAAAGAGGCTGCAATTGTCAAATTTACTTCTAAGAAGTCCTTTTAAAGTGGTCATTAATCCGAGCATCAAGTTTAAGACATTGTTTTTAGAGAAAGATGTTGGGCGTGGAAGCAAAGGCGACGGCACTGACATGGAAGATGATAGAAGTCAATTATGGCACAGGACTTTGTAAGAATCCATCTTCTCATTCTAGAAGAAAAAGGATATTTTTCACCGGCGCCTGTTTGATTTCCCGTACAGATAGTTAGGCGTAGGGTCGATCGTATGGGATAGTTATGACCGTTTGCAGAAAAAGAAAAAAGAACATTTTTCCTATTTATAAAGTGGTATTTCGAAATAGATGATAAACAATCGAAGATGATAAGAAGGATTTTAGGCAA\n>XM_039010113.1 PREDICTED: Salvelinus namaycush gamma-aminobutyric acid receptor subunit delta-like (LOC120060710), mRNA 
\nATGGACATGATAACTTTCATGTTGGCGAGCCTTGCCCTCCTGAATATCAGGGACAACATTTTCACCAGGGCCATGCTGAGTGACATTGGGGACTATATAGGTTCAGACATACAAATTTCCTGGTTGCCTAATCTGGATGAGTTAATGAAGGGCTATGCGCGAAATTTTCGCCCTGGGATAGGAGGCTCACCCGTGAATGTTGCCATGGCTATTGAAGTAGCCAGTATTGACCACATCTCTGAAGCCAACATGGAGTACACCATGACCATTTTCCTGCGTCAGAGCTGGCGGGACGACCGCCTGTCCTACAACCACACCAACAAGACCCTGGGACTTGATAGCCGCTTCGTGGATAAACTCTGGCTGCCCGACACCTTCATTGTCAACGCCAAGTCTGCCTGGTTCCATGACGTCACCGTGGAGAACAAGCTGATTCGCCTGCAGCCTGATGGGGTCATCCTTTACAGCAGCCGGATCACCTCGACTGTGGCGTGTGACATGGACCTGACCAAATACCCCATGGATGAGCAGGAGTGTATGCTGGACCTAGAAAGCTATGGCTACTCCTCAGAGGACATTGTGTACCACTGGTCTGAGAGTCAGATACATATCCACGGACTGGACAAACTGGAGCTCTCCCAGTTCACCATCATCGACTACAAATTTGTCACGGAGACGATGAACTTCAAATCCGCCGGACGTTTCCCGCGGCTCAGCCTTCGCTTCCAGCTGAGACGAAACCGAGGCGTCTACATCATCCAGTCCTACATGCCCTCCATCCTACTGGTTGCCATGTCCTGGGTGTCCTTCTGGATCAGCCAAACAGCAGTCCCGGCTCGGGTATCCCTGGGGATCACCACTGTGCTCACCATGACGACTCTGATGGTGAGCGCCCGCTCATCTCTCCCTCGAGCCTCAGCCATCAAAGCGCTGGATGTCTATTTCTGGATCTGCTACGTGTTTGTGTTCGCCGCGCTCATCGAGTATGCCTTTGCTCACTACAACGCCGACTACAGGCTCAAAGAGAAGGCCAAGAGCAAGGCCAACAAGATGAGCTCCGAGTCAGTCGTAAAGAATGGGAAACAGGCCATGGTGCTCTTCTCCCTGTCCGTGGCTGGAATGAACCAGGGCCTGATGGTGTCCAGCCGCCGTCCGCAGCGCTCCGGCGCCGAGACCGCCGAGGAGGAGGACGTGGAGCACAGGAGGGGGCGGGGGACCACAGCGTCAGAGGAGAGAGAAGAGGATAAGAAGTGCTGTAGTTGTTGTTCCAAGTGTTGTTGCGCTTGCAAGCCCCTCCAAGCTGATACCATAGATGTCTACGCCAGGGCCGTGTTCCCTGCCACCTTCGCCATCGTCAATGTGATCTACTGGGTGGCGTACACCATGTGA\n>XM_010916034.2 PREDICTED: Elaeis guineensis potassium transporter 7 (LOC105039769), transcript variant X2, mRNA 
\nTTCTCCCTGCTTCGCCATCTATGGGCTTTCGAGAAAACTGTCCTAAAATCTCACGGTTTTTCTCAGCTTTCTCCATCAGGTCGATCTCTCCTCGATCTAAGCTTCGTCGGTTTGCGGCCGATTCCTTTCCACTTTCCATCGGAAGTTCCTTTGTTCTTCATCTATGTCGTAAAAAGTTCCAATTTTAGATCAATTCTGGTTGAGTTCTCCATGGCGGAAAGCTCGGGGAGGGCGAATGGGTGGTTGGCGAAGATGGATTCCTCCGAATCGAGGTGGGTCTCTCAAGGTGAGGAATATTCTAGCGAGGAAGAGGAAGAAGAGGAAGAGTTGGTTCGCCGGGCTGTTTTCGAGTCGGAGGAAGAGGACAGCGGGACCCGGAGGTTGATTAGGACCGCCCCCCGGCTCGATTCCTTCGATGTCGAGGCGCTCGACGTCCCCGGAGTTCAGAGGAATGAGGTCGAGGAACTTGACTTGCGCAAGAACTTCATACTTGCTCTTCAGACTCTTGGTATTGTGTTTGGGGATGTGGGAACGAGTCCATTGTATACTTTTGATGTTATGCTTCATCAATCACCAGTTCGTGTGAAGGAGGATGTCATCGGAGCGCTGTCTTTAGTTCTATATACTTTGATTCTGATACCGCTGGTGAAGTATGTGTTGGTGGTCATTTGGGGCAATGACGATGGTGAAGGTGGCACATTTGCTTTGTATTCATTGATATGTAGACATGCAAAGGTAAGTCTTCTACCAAACCAATTGCGTTCTGATACCCACATATCAAGTTTCCGCCTCAAGGTTCCATCACCGGAGCTAGAGAGGTCTCTAAAAGTTAAGGAGCATCTTGAGTCTTCATTGATGCTGAAGAAACTGCTTCTTATTTTGGTGCTTTTTGGCACTTCCATGGTCATAGCGGATGGAGTTGTCACCCCAGCAATGTCAGTATTGTCAGCTGTGGGTGGTCTGAAGGTTGGAATAGCTAGCTTTGAAAAAGATGAAGCGGTGATGATTTCAGTTGCATTTCTTGTAATCTTGTTCAGTGTACAGAAGTATGGAACCAGCAAAGTGGGGCTTGCAGTTGGCCCTGCTTTACTTGTATGGCTTTGCTCCCTAGGGGGCATTGGAGTTTACAACCTTATAAAATATGGTGTAACAGTTTTGAGGGCATTCAATCCTGTCCACATCTATTATTATTTTGAGAGGAATTTAACTCAGGCTTGGTTATCTCTTGGTGGTTGTCTTCTGTGTGCAACAGGTTCTGAGGCAATGTTTGCAGATCTTTGCTATTTCTCTGTAAGATCTGTTCAGCTAACTTTTGTGTTTTTGGTTCTGCCCTGCCTTCTGTTGGGATACCTTGGCCAAGCTGCTTTCCTCATGGAAAATGTAACTACATCTGAGCAGGTCTTCTTTTCGTCTATCCCAAGCACTGCAGAGCTTGGAATAATGATGATGACAACAATTCTAGTAACCATCATTATGCTTCTAATATGGCAGATTAACATTTTCATCGTGCTTTTCTTTGTCATATTCTTTTTGGGGGTGGAATTAGTTTTCTTCACTTCTGTTTTGGGTAGTGTGGAGGCTGGAAGCTGGGTTTTATTGATTTTTGCAGCAATATTGTTTATGATAATGTACATATGGAATTATGGGAGCAAGCTAAAGTATGAATCTGAAGTTAAACAGAAGCTTTCAATGAATCTGATGATGGAGTTGGGCTGCAACCTTGGGACCATTAGAGCCCCTGGTGTTGGCTTAGTTTACAATGAGTTAGTGAAAGGAATTCCAGCAATATTTGGACACTTTCTGACCACCCTTCCAGCAATCCACTCTATGATCATATTAGTGTGCATAAAATATGTGCCGGTTCCTGTAGTTCCTCAGAGTGAAAGGTTTCTTTTCCGGCGTGTCTGCCCAAAGAGCTATCACATGTTCCGTTGCATTGCTAGGTACGGCTACAAGGATGTAAGGAAAGAGCAGCACCAAATATTTGAACAGCTACTT
CTTGAGAGTCTTGAAAAGTTCATACATCGAGAAGCCCAAGAACGCTTATTAGAGAGTGATGGAGATAGTGATTCAGATGCGGAAGAAGCGGCATCACGTTCAAGAATTCTTATAGCACCAAATGGCAGTATGTATTCCTTTGATGTCCCTCTCTTGGCTGCTTACAACAGTACTGAGAAGCCAAGCCCGGAAGCAAGCACTTCATCTCATGAGGCTCGAGATGAAGCCATGCCAGATGCTAGGCAGAGTCTTGAGCAGGAGCTTTCATTCATAAACAAGGCTAAAGAGTCAGGAGTTGTCTACCTCCTTGGCCATGGTGATATTAGGGCCCGAAAGGACTCTTGGTTTTTCAAGAAACTGGTCATAAATTACTTCTATGCTTTTTTGAAAAAGAACTGCAGGAGAGCGATAACAACATTGACTGTTCCCCACACAAATTTAATGCAAGTTGGCATGACTTACATGGTTTAG\n>XM_035180460.2 PREDICTED: Hippoglossus stenolepis sperm associated antigen 9a (spag9a), transcript variant X14, mRNA \nCCAGGCGCCTGTGAACGCAGCATTTGACGAGGAAGAGGAGGAAATCCACGTAGCTCGTCTCGCGTCGCGGGGTCCGGTCGTGTTGTGTCCTCGATGTGTCGGCCCGTGTAAAGAAACGCTGCTTTTCTACTCGGCGGATAAAGGCGTCCATAGTGGCGGGGTGACGCGGGGCTGCCCACACCGGTGCTGTTTGCTGAAAGCGGGGGAGAGGACAGCGGGGAAAATGGAGCTGGAAGACGGAGTCGTGTACCAGGACGACCCGGGGACGTCCGCGATGATGTCGGAGCGGGTGTCGGGCCTGGCCAACTCCATCTACCGCGAGTTCGAGCGGCTCATCGGGAAGTACGACGAGGACGTGGTGAAGGAGCTGATGCCGCTGGTGGTGGCCGTGCTGGAGAACCTGGACTCGGTGTTCGCGGAGAACCAGGAGCACGAAGTGGAGCTGGAGCTGCTGAAGGAGGACAACGAGCAGCTCATCACCCAGTACGAGCGGGAGAAGGCGCTGAGGAAGCACGCGGAGGAGAAGTTCATTGAGTTTGAGGACACTCACGAACAGGAGAAGAAGGACCTGCAGAACCATGTGGACAGAATGGAATCGCACTCCCGACAACTGGAGCTCAAGATCAAGAACTATGCAGACCAGATCGGCAGGTTGGAAGAACGAGAGCTGGAGATCAAGAAGGAATACAACTCCCTCTATCAGAGACACTCAGAGATGATCCATAATTATATGGAGCATGTAGAGAGGATCAAAATGCAGCAGATTAACGAGACTTTGGAATCGAGCGCGGTCGGCCGAGTCAGGAGAGAACGGCCTCTTTCTTTGGGGATTTTCCCCTCGCCTGGTGGGGCATCTCTACTCATCCCAGACCCGCAGGCCAAAGCGGAGACGCCGGGCACAGACCGCTGGAGGTTCACTGACTCAACACAACCACGGTCCAACACTAGCCTCAAGCAGTTGGACTATGTCGACCCCCCAAGGGACAGGGAGGGTAAGAGTGCGCAGGACTCTACTTGGGGAAATTCACTGGCAGACGACTGCAAGGATGAGCTGTCGGACTTCACCGGCTCCAAGTCGGCCACACCAATGTCCACGACCGCCTCTGACATGGAGAGGGAAAATGGGAACAGTAAGAGCACTGAGGTGCAGGCGGCTCCAGGGACCAGATCCATATCAGTGGGTTTGCCTGAAAACAAAGACAGCTCAGACGTGCAGGACATCATTGAGTCCACCCCTGAACTGGACATGGATCTCGCTGGATACAAGCTCTGCAGTACTCCTACCAAAGGCATTGAGAACATGGCCTTCGACCGCAATACAGACTCTCTGTTTGAGGAGCTGTCATCTGCGGGCACTGGGATAATAGGGGATGTGGATGAAGGGGCAGATCTGCTGGTGGAGTACTC
TGACCTTAGTTTGATTGGTATGGGCCGGGAAGTTGAAAATCTCATTCAGGAGAATTCACAACTGCTTGAGACAAAGAACGCCCTGAACGTGGTGAATAAAGACTTAATATTGAAGGTGGACGAGTTGACCTGTGAGAAGGAGATGTTGCAGGGAGAAATGGATGCTGTGATGCAGGCCAAGGCCAAGCTGGAGGACAAGAACAAAGACCTGGAGGAGGAACTCAAAAAAGTGCGAGTGGAGATGGAGGAAGTGAAACACAAAACTAAAGATGAAGAAGATAATGATGTACCTACAGCCCAGAGGAAGCGTTTCACCAGAGTGGAAATGGCCCGAGTGCTGATGGAGAGAAACCAGTACAAGGAGAGACTGATGGAGCTACAGGAAGCGGTGCGGTGGACAGAGATGATCAGGGCCTCGAGGGAAAATCCAACACTAACAGAAAAGAAGAAGTCCAGCATCTGGCAGTTCATTGGCTTCAGCAGACTGTTTAGCTCCTCCTCCAGTCCCCCCGCTGGGAAGAAGGTGGAGTCCCAGTCCAACGTGAAGTACAACGCCCCGGGCGGCATGGTGAAGAGGAGCAGCACCTTCTCCCAGTTCCCCACAGAGAAGTCCAAGACCTTTGACTTCCTCAATGAAGAAAAGGACCAGTGTAGTTCACCATCGCGTAAAGAGCAGAAACGAGCCCAGTACAGACAGGTCAAGGCCCACATGCAGAAGGAGGATGGACGAGTCACTGCGCACGGCTGGAGCCTGCCCAGCAAATACAAGGTGGCAAATGGTGGACAGGTGGAGAACAAAGTGAACTTACCTGTACCGGTGTACTTGAGACCTCTCGATCAGAAAGATGCTTCTATGAAGCTGTGGTGTGCTGCAGGGGTCAACCTGTGTGGGGGGGGGATATCAGAGCTCACGAAGCAGACGAAGGGTTCTCAGAGTAGCCTGGACCAGCTGGAGCAAGAGAATAAGGATCAGGAGAAAGTGGAGCAGGAGAAGGAGCTGATACTTCAGGATGAGACGTCCAGTCGGGTGTGGGTGTGTACCAGCACCCACTCCTCCACCAAGGTTATGGTGCTGGATGCAAGTCAGCCATCTGACCTACTTGACAGCTTCTATGCCTGCAACACCCACGTCGTCTGCATTGCCAGTGTGCCTGGGGTGTTGGAGTCAGATTTTTCGACAGGTGAGGAGGTACCACAGGACGTGGACGCTAACCAGGGTGATGTGGTGTCACTGGCCGGCAGTGTGGCCAGTGTGGGGTCTACAGGCAGCGATGGAGCCATGGCAGCAGAAGGGACCACCGCAATCCCACAGATAGCCAGCTCAGTTGAGCTGTCCAGAGAGTCGAGTCCAGCAGAAGATGGGATTCCTCCGGCGGAGGAGGCAACAGAAGCAACAGAAGCTAACGCTGGTGTGGGTGAAGAGGGAGAGGAGGACCAGGGGGCAGAACACAACCAGCCGGGAATCTACACAGAGCATGTGTTCACCGACCCGCTGGGGGTGGGACCCACTGACTCCTCGCCTACTGACGCACAGAGGGGCACCGGGCAGGATGGAGTGGATTCCTTGCCTCCAGACTCGGACCCGTCGGAGGGGGATGTCCTGAGGATGAGCAGCGCCCTCCCCACCATGTGGCTCGGAGCTCAGAATGGATGTCTGTATGTCCACTCGTCCGTGGCACGATGGAGGAAGTGTCTGCACGCCATCAAGCTCAAAGACTCCATCCTCAGCATAGTGCATGTTAAAGGGAGAGTCCTGGTAGCGTTGGCTGATGGGACATTAGCAATTTTCCACAGAAGCATTACAGACGGACAGTGGGACCTAACCAACTATCACCTGTTGGATCTGGGCCGGCCCCACCACTCTATCCGCTGTATGACCGTAGTCCATGACAAGGTGTGGTGCGGCTACAGGAACAAGATCTACATTGTCCAGCCCAAGGCCATGAGGATAGAGCAGAAGTCCTTTGACGCTCATCCTCGCAAGGAGAGCCAGGTGCGGC
AGCTGGCCTGGGTTGGAGACGGTATCTGGGTGTCCATCCGACTGGATTCCACCCTTCGCTTGTTCCACGCCCACACCTACCAGCACCTCCAGGATGTGGACATCGAGCCCTACGTCAGCAAAATGCTTGGTACTGGTAAACTGGGCTTCTCCTTCGTGAGAATCACAGCTCTTGTGGTGTCCTGCAGTCGTCTGTGGGTGGGGACAGGAAACGGTGTCATCATCTCCATCCCGTTGTCTGAAGCCAACAAGACAACGGGAATAGTGCCAAATCGGCCCGGCAGCGCTGTACGGGTTTACGGTGATGACGGTTTAGACTGTGCCATGCCAGGCAGCTTTGTGCCATACTGCTCCATGGCCCACGCCCAGCTGTGTTTCCATGGACACCGAGATGCTGTCAAGTTTTTTGTCACCGTGCCAGGTCAGGCAATGCCTCCTCCATGTAGCGCAGATTCAGGCTCCGATGAGCCCCCGTCTGAATCCTCTGACACAGCGACCTCCGAGCCCAAAACACACCTGGTCATGAGTGGAGGTGAAGGCTACATCGACTTCAGAATGGGTGATGAAGGTGGCGAGTCGGACGGTTTATCAGAGCCGACAGCCGACCAGCAGTCGGCACCAACCAAGGCTGAGCAGAGCCACCTCATCGTCTGGCAGGTCACAACTTCTAATGATTGAAAAAAAAACAACTGACATACTGTTGTCAGGGCCTCCCTCCAATCCTTGCATGTCCTCCTCTAAGTTTTACATTTGATATTACTGATTGTTCTTAATGCCTGAGTAGTTGACTACTTTGTAAAAAAACAAAAACAATTATTTTTAGTCCATGTTTTGTACAGTTTATTGTTTATGAATTTGAAAAAAGTGAGGATTATGTCGGTTTAAGGAAAACGTCCACGGTCCGAGTGTTTCCTTCTGCCGGGGCGCATGTTGGAAAAGCAGGTGCACGCAGGAAAAAGTTCAAGTCAGTTCAGGAGAAGGTGCGAGATACTGTAAGTGTGATCGTTTGTTTCTAAAACGTCAAAAACGGGTTTAGATGTGAAGGACAAAAAGGAAAAAGTACTTGAAGGATTCAGGAGAAGTCGTTGAAAAGGGACCAGGGAGTTTTCATTTGAATGAAATATATTTTATGTTACACACATAAGACTTTTACATTTGTAAACCACATGTGAGAATGGAGTCATGAATTCTATCCTGTGTTAAGCATTTTTTTTTATTATCCATACTATTCGGGCTGGGTGTGTAAATGTGACACCTACAGGTCAGAATACATTCATGCAGACAGGCTGATACTGGTCGGTCTGCTAAGTAGAAAACCAGTTTTCACAAACAAGCAATCCACAAACAAACATTTCCTCTAAACTAAATGTACTTTTATTGAGTAAAAGCTGTACGATAAAACATTATCTTAGAGGTCTTATTTAATTAAAGGAAACCGAGCCGCAGGATTATGTTTAGGAATGTTAATCATATCAAAGCAGTTAGGGTACTGTAAGGTTTCCTGTGAATAGAGGACCCAGCTTACTGTACTGTAGGTTAGCATTAACCGGAATGAAGGGAATCCTGTATCCTTGTGTGTGTGTGTGTGTGTTCGCCTTCTCGGCCATTTTACGGCTCAACCCTCATCTATTTGCGCGAGAAGAATCCACCCGTGCTTCCTGTTTGCTTCCGCTCATCGGCACTTTAAGATGTTAGATGTTATTCGCGTGACATTTGGAAGAACACTCGTGGTGATGCACACTGCACTGCCATGTGCTACATTTATTTATTTATTCGGTTTAAAATAACAGGAACAATGCTCATTAATAAACATTTTTGTAAAAGGGAACATAACGGACAAATCTTTATAGGGAGGTGACACCCCAGTAACCAAAGGACGAAAGAAGATGCACCGTGAAACTATTTGTTTTTTGGTTTTTTTCCATCTTTTAAACGTCTCATGAGTAATAATTTGAAGGTTTTAAATGTATGTTTTGTTGAAAAATAGGCTTGAATAAGGGA
ATTGGACTAAAAGTAACATTTCCGTGTGGCACCTTCTAACGGACATGCACACAGCACTAAAGAGTGTCTCTCCTGATTGCCTCATCATTCCTTGTTTTGTTGTTAAAAATACATTTTGAGGCCTGGAAGGCAAATTTTGTCATTATTTTTCTGTTGCTTTGGGCATCGTGCGTGTTTTGTATTCATCTGTGAGACACTTTCATTAAGTGAAGACTATTTTGTTGAAATAACCGAAGGATTCCAATATTGAGCAAGTGTTTTAATTTGTTTTTATATCTGAAAACTTGGACCACTGTTGGTCTTCAGTCTATTTCAAAATATTAACTTTATATTGTGCTTTATTTTTCTGCCATTCCAGTATTTATTTCCTTTGTTATGGAGCCTATCTGGGTTCAGAATGTAACTTTCTACATAAGTATAATAGGAGGCTATTGTAAACGGAATAGTCCAATGCGTTTACACGATTGTTAATAATGGCTAAATAAAAGAAATCAATGTTA\n>XM_041364600.1 Suillus fuscotomentosus uncharacterized protein (F5891DRAFT_1130999), partial mRNA \nATGCACCCCTCAGAATTAGATGCTAGGATTAGAGTGCTCCCACCCTGCTTTGAGGTTTGCCATTTCCAGAATGGTTGGACTGTGCTCTCTCAGATCTCTGGTAGAGAGAGGAAAGAGATGGTGTGCATCTTATTGGGATGCTTAGTGGGAAAAGTTCCTCGACAGGTCATACTTGCATACCGCTCCTTACTGGACTTCATCTATTTAGCTCAGTACCCCACTCACGATGATCAAACCCTAAGCTATCTTCAAGATGCTTTGGACATGTTTCACAAGCATAAGGGGGTGCTTATTGAACTGGGCGTAAGGGACCACTTCAATATTCCAAAAATACACAGCCTCACCCACTATATCAACTCTATACGCCTATTTGGTGCCATGGACAATTACAATACAGAGGCATTTGAGCGCCTTCACATTGATTTTGCTAAGGACGCCTGGAGGGCAACTAATAAAAGGGAGGAGTGCCCTCAAATGACTTCATTGGAGATGACTCAGCTTCCATTTGACAAGCTTGACATATACCATGGTTTCAAGTTTGTTTTGGAGGAACTAGGGGAGGATGAAGTTGACAGTAGTAGACAAACTGACTGGATAAAGGCCTGTCCAAAGACTCATGGTTCCCATGGTCAGAAACACTTTGATACAGTTGTGGCCATGAGGACGGATGAGTGCCAAGCTACTGGGGTTCAAGGCAAAATCGGGCGACTTAGGTTATTGTTCAAGCTACCCCAACAATGGTATACTATGCTCAAAAATGTGCCAGAGAAAGAACACTGTATGTATGAGGTGAAGAAGATGCCACTAAGGAGCGGTAATGTAGTACCAGCAGATATCATTCCTATCAGCACCATATGTCAGACTTGTCAGCTAATTCCTTGTTTTGGTACTGCTGATGTTTCCAGAGAATGGAGATCAGAAAATGTACTGGATCTCTGTGACAGGTTCTTATTAAATAATTGGTCCACCAAGTATGCATACAAAACACTGTATTAG\n>XM_041096011.1 PREDICTED: Gossypium hirsutum uncharacterized LOC107900440 (LOC107900440), transcript variant X1, mRNA 
\nATCTTCAATTGTCATCAGTTCCGTCACACCCCAATTCTCACAGTCAAACACTTGGAACCTTCTTTCATACCCCACTGCCATTTTCCCTTTCATTTTTAACCGTAATTTTTCCATTTCCTCCTCACTCAACTTTCAATCCTTCTTCTTTGTACATAAAAGAATTCGCAAAATCAAAAAAAAAAAATTGAAGAAAGAAAGGAGATGGGTTTTTCAAAGGAAGAGAAATCGAGAAGAATTTGGAGGGTATTGAAAACAGTGTTTTTCTTGATAACAATGGCGATTTCGTTCCTCGTATTTTCTGCGCCGGTTTTTCTCGTTCTAGCCGATGCTCTTTTGCCTTCCGCTTTGCTCTCTGCTTCGCTTTCTCCTTCTTATTTATCACTCCAATCCCTTTCTTCCCATTTCGATAACTATGATTTTAGATCTTCTCTCATAGATATTCCCCTCATATCCATCATCAGATCAGCTGTTATAATCGTTGTTTACAGTTTTTGTGATGGGCCAAAACTTTCGAGGGGACCATACCTGGGAATCACAATGATTTGTTCGATTTCATCGTTGGTTTTTGTTTCGATAAAAGCTTCGTTTGTGTTCGGTTCGAGAATTCCTAAAGAAGGGACATATGTTACAGCCATGGAAACCGCTCTTTTCATTTCTTCATTGGCTTTGGCAATTGCACACATGACTGTGGCTTATAGGACAAGTTGCAGAGAAAGAAGAAAGCTCCTTGTCTACAAAATTGACATTGAAGCTATTTCAGCTTGCAAGAATGGGTTTCCAAGGTATCATAAGATTCTCCAACAAGAAAGGGTGAAGTAAATGCAATATTACCAACACTGAACGATTTTCCTCTCCAAGAAACCTACCCTGTTCTTGGCTCATCACATTCTTCTTTCTCACATTTCAGATTTAACCAAAACCAATCAGTCACTTGAAAATCAAAGTGTTAACAAGCAGATCACAGCCAGCAGATACAGACATACATACATACATACATACATACATACATACATATATATATTATATTTCGAGGAAATGATCGAACATGCAATGATTTTGAGTGTACAGTTTGTATTACATCTGTAAATATTAATTTAAAAACAAAGGAAGAAATGGGCCAAAGGTCTTTTCCATACCCCAATTTTTTTTTGAAATATTTGAAAAATATTTATTTTAGTTATTATTTTGGCCGAACGATTTAGGTTAATTATTTTTGGTTCGAATAAAAATATTAAGGTTAAAATATGTTTTAACTCTATATGCTCTATTTTTAAGAATTTCGTCTATCTGTCCCTTGCCGATTTCAATTTAATTAGTCTAACCAACTGATTTGATCCAGTTCAAGTTTTTATGTTTTTTTTTATAATCTTTATAAGATTATATTAATTTTAGTACTTTTTATGATTTTTATAGAATTTTAATATGTTTTTTAATTTCAAATATTTTAAATTTGTTTTATTAATTTTATAAAAATATTTTAGAATTTATTAGAATTTTATATTTTTATATTTTTTATATCAATTTTCATAATTTTTATTTTTTATATTTAATATTTTTTAATTATTTTTATTGGAAAAATATTAGATTAAACTAGAAGCTGCCATCTGTCAACATCTAATTAGTCCGCCAATTTATTTTGACAGTCAACATGGTTAATGATAAAAATTGTTAATGTAGGAGCTTAATTGATTATTTTAGTTAATGATAGAGGCTAAATTGAATATGAATTTAATACATGGGCTTAATTTATCTTTTTTGCAGCTTTTTAAATATATAAGTCACATAATTTAAAAACAACAAAGGTTGTGACATAAATCCTATATATAAACATAGTAACTTGAATTTGACTATTTTTTTTGGACTAAAATAATATAAACCTAGACTTGCTTAAGATATTAGAGTATAGGAGGAAGGGTTGTATGAAACTGTGATTCCATGTCATTCTTTATCTCTTTCCATTCTCTTATTATAAAGAGATAAAAATGATATGAAATTACA
GTTTCATACAATCCCACCAAATTAAAGAAAAAAAATGAATAAATAAATAAAATTCATTTTTTTATGATTCGATAAAGGAATCAAAATTCAAAGTTTTTGTGTGTTTGTTCTTCAGCTTTGTGCAATGAGAAATTTGGTGAATTTCATTTAAATAAATAGAATTTAGATGCCAACATTTGGGGAATTTTTACAAGTTGGAAATAAGGATCAAAACAATGCCCACTGCATCTCTATTACCTGAACAACATTTTTATCCCTCACTTTCAAATCCAGGTAAAATAGTGATCGTAACCCCAACTTTGGAAATGATTACACCTCCACTCCATCTTCTTTACAATGGCTAAGATGCCCAGATTTAACGCCGACGCTGCAGATTGATCGGAAATCGCTTTTGGGTTCGGGTTGTGGGGAAGAAAACTAGCTTATCTTCTTCAGCAGGTACCCAACTGTATCAGAAATATAAACTCAGAATGCAACAAGCTTCTATTTTTTAACTCAAGTTCTAAATAAAACTCGGTTTGATTACCTGAACTGAGTTACAAGGTGGTGTAAGAAGACTGAGATTTCTACTCTAGCAAGCTCATATCCAGGGCACAATCGAGGCCCTCCTCCGAACGGCGTGTAAAAATTCCCGGAACAGCTCGTCCCCAAGTTATTATTCTGTTCAATTTCATCCAACACTTCTTTGTAACTTTCGTCGTGTACCATGAACTATAATGTTGCGTTACATCTTATACTTAAATTTACCTTCCATCTCCATGGATTGAAAGTGCGAGCATCTTTAAAGTGATCATGATCAAGATGTACAGCACGAAACGATGCAAAAACCTTCCAACCCTTTGGAATTGTGTAACCTGGTCGAGTTGAGTTACCAGTAAGCACACAAAAAATGAGTCTAACAGGTTTCGGATTCGAATTCTAACA\n>XR_004848542.1 PREDICTED: Amphiprion ocellaris uncharacterized LOC111577915 (LOC111577915), ncRNA \nATGGCTGCACAGTAAATGTGTTTGATGCTGCCAGCTGAGCTGCAGATGGATGTTCATTTTTGTTTCTGTCTTGTGTTTCAGTAACAGCTGTAGCTATTGCAGCAGGCGCTGGTGGAGCAGTGGTCTCTGCTCCGTTTGTTCTGGGAGCCATAGGTTTCACCTCAGCTGGAATAGCAGCAGGTTCCTACGCTGCAGGCATGATGTCCACTGCTGCTATTGCTAATGGAGGAGGAGTTGCAGCAGGGAGTCTGGTGGCTGTTTTGCAGTCAGCAGGAATGGCTGGTCTGTCTGGGACTGCTACTGCAGCCGTGGCCAGTGCTGGAGGAACGGTGGGATTTTTGGCTACTCTCATCTGAGATGAAGCTGGAAATCATGAAGGAATAATACATACGAGACAATGTATTTGCTTTTGTAAATTAGAAACAAATGCCAACAATATCAGTGAAGTCGAACTTTATCTGTCAGTAAAGTAAAACTTGACTGAAATCTGTGGGCAAAAAATGTTTCTGTGTTTTTACAAAGCACATTTATATTGTCAAATTGTCCAAAATAAAGAATAACAATGAAGGAA\n>XM_034416225.1 PREDICTED: Pantherophis guttatus spondin 2 (SPON2), mRNA 
\nAAAACCAACCACTGCCCCGCTTGGACTAAAGGGACTTTTGCAGGCATAAATAGCAAGATTTCCTCTCTTCCCCTTGCAGATTTTCCAGCTGGGAGACAAAGCAAGTTCTTCTCCTAACAACCTCACAGCCACCGGAACACCCGAAATGGGAAACTCACTACCTGTGTCTGGTTCTGACAAGACAATCGCAGCACTGCTGGTTGCACTCTTGAGTTGCGTGGATTGTGTTCCCCTCGAGGGAGAGACCCTGTGTGGTGCAGAGGAACCAACCACCTACAGCATTGTCTTCACGGGGAAATGGAGCCAAACAGCTTTTCCAAAGCAGTACCCGCTCTACAGACCCCCAGCGCAGTGGTCCTCCCTCCTAGGTGTGGCCCACAACTCGGACTACGTCATGTGGAAGGCCAGCGGCTATGCCAGCAACGGCATGCGTGAGTTGGTGGAGAAGGGGGAGCCCTGGATGCTGATGAAGGAAATTGAAGCAGCTGGAGAGAAAATGCAAAGCGTTTATGGAATCTTCTCCGCTTCTCCTGTGGTTACCGGAACAGGACAGACCTCAACTCTCTTTGAAGTTGACCCGGGTCATCCCTTAGTATCCCTTGCAGTACGAATCGTGCCCAGCCCTGACTGGTTTGTGGGGATTGAGAATTTTAATTTGTGCGACAAAAATGGCTGGAAGCGCCACGTCTCCATAGATTTATTTCCATATGATGCTGGAACGGATAGCGGCTTTACGTTTTCCGCACCCAACTTCGCCACGATCCCTCGCGATACGATCACGGAAATCACCTGTTCCTCCCCAAGTCATCCTGCCAACTCATTTTATTACCCCAAGCTTAAGACTCTGCCGCCGATTGCCCGGGTGACCATGGCAAAACTCAAAAGAAAGAAATTGGGCTTTCTCATCTCTCAACCAAACGTCACAACCACCCATAACGAAGTGGAGGATTCAGTCTCGGAAACACCTTTGGATTGTGAGACCTCTCTGTGGTCTTCGTGGGGCCTTTGCCGTGGCACCTGTGGAAATTTAGGAACGAAAAGACGGACTCGGTACATACTACTTCAGCCAGCCAATCATGGGACCCCCTGTCCAGATCTGAGCGAAGAAACACACTGCGAACCAGATAATTGTGTCTGAGATAATTTCTTTGGACCATCGTTTACCTCGTGTAATTTGGGGGATATTTAAGGTATCTCTGCGTTGATATTTTTTATAGCTCATGAGCTGTCCATCTATCCATCTATCCATCCATCCATCCACCAATCCAATAGATAGATCTACTTAAGGGATCTGAGCTTTCTACACGTTTATTGTGAACTCCTACAGTGCCACCTAGCGGTCAGAAATAGTAGTAATAGTAGTAAACTCGAATAGTAAACTTAGTGTTACCAACATCTGCACGGAGAAAAGAGGCAGGCGAGAATCTTTTCATTTCTGCTACTTCTGGAATGTATTTAATGCATCTGAGGAATAATGAGCTAGTTTCTACTGACTTACGAAATGCTGGAGAATTAAATGTATAAGTTTTGAGGGAGAATCAACTTGAAGGAAAAAGAAAACCAAGTTTTTCTCAAGAGTACGAGAAAAAAGCCGAGATTTATTTGGGTGTGTGTGTGTAATTCTAAAAATTTTAAGCTGTTGTTTGAAAACTCTTGGGCTGGCTATGGTGAAAGTTGGCAAGTTTTATCTTTTATGCAGATTTCTATGAATTTTGTCCTGTTCTGTAAAGAGCTAAGAAGGCCTAAAAGGAGAACTGTAATAATAATTTGCTAAAAAGTTTGTGTACCAAGGCGTAGAGTATATACGTCCTTTACTTACAGTGTTCTATATTTCTGGATTTTTTTTTTCTAATTAAAAACAAACATTTTCCCTCCGGTTAAATAATA\n>XM_047217565.1 PREDICTED: Lolium rigidum uncharacterized LOC124682972 (LOC124682972), mRNA 
\nCACACGCCTAAGTGCCATTGATGGCCACGAAAGCCTGGAGCGGCTCCACCCGCTTCAGATCTCCGGCCAGCGCCGTCTGGTTCCTAGCGGCCGCCATCCTCATCCTCATCTTCCTCCTTCAGCGCCGCCCGCCCATGGACCCTTACGCTACCCCAACCCCTCGGACCTCCGTGTCGTCCCGGCGCGCCGAGCTGTACGGCAGGATGGCGCGGGATCTCGACGAGCGCGGCGCCGCGTTCTTGGAGGGCGGCGAGACGTCGCAGTCGCTCACGCTCTCGGACCTCTTCGACGTCAGAGACAGCGCCGTCGTGCCCAGACTCAAGGCCGCCGACCCACCGGTGCGCGCGAACGTGCTCTACCTGGACCCAGAGTTCGCGGCCGTCATATCGAAGGCTGTGAAGGAAGTATTTCTTCCTTATTTTGACAAAGTTATCTGGTTCCAAAATTCCAGTATGTATCACTTCAGTATGTTTCATGCCTCCCATCACCTGGAGCCAATCTTAGCATCCAAGGCCGAGATTGAAGCCGAAGTCGATGCTGTAAAAAGAGTTACTAAGGCTATTTGTCCCATTCAAATTGTCTTGGATCAAGTGGTCTTGACATCAACTGGAGTTCTTCTTGGCCTGTGGCAGGTTGAATCTGGTACTGATCCTGCCGACATCCGCTCAAAATTGAGAGAGGCTCTCCCTCGAGCACCTCAAAAGCAATTGTATGACCCTGTTCTGCTTCACACCTCCTTTGCACGAATTTTGGGACCTCCTAAGCTTCCACAAGAGGAGAATACGACATCTTTTGATCACATCAAATTCTTCCATGACCTCGTTGCACAAGTTAACGGGAAGATCCGTGGGTTCCAGGCGAAGGTAGCGGAGCTGTGGTATGTAGAAGAGTACGACGTCCTCGCACTAGCGCTGAATGGAAAGATGAAAGTTCGGAGGCTCAACCTTGGCTGCAATGAAGAATAGAGCAACTGACGGAGGACAAAGAGAACACCACGGGGATATTAATCCATCGCGTCCAAGCATTATTATGCAACGCTTGGAATGCTTTCGTGATTCGAACATCACATCCATGGCAACCTTTTGTTCTGCGAAGATTGGGACCAGGCAGCGCCGAGGAAATAGCAGCTGGGTGCCCCCAATAGAGAAGTAGAGATCGAATGTAATTGCTTTCACACCACAGTATTTGAGTACTGGTGATTCGTGAATATGTGGATGAAAATCAAACCTGTATTTGTAACACCTCTCCTGTTACTCAGAAAAACTTCCAACTTA\n>XM_017403287.1 PREDICTED: Daucus carota subsp. 
sativus GBF-interacting protein 1-like (LOC108227900), transcript variant X2, mRNA \nAATAACAGTGAATGGGCTGGTCTAGTGAGCATCAGGAGGTAATTTGGTTTTCAAAACCCTTGTTTGCGTCCCATAACTCTTTTTGAGCCGTTCTCAACTATTATATATAAACACACACAATCACTCAAAACCCATTTGAAATCGAATGCAACTCGCTCTTCTATTGGCTCTGTTAAACCCTGTTTTGATATTGGATTACTATCCCAACTGGGTTGTTTTCAAGTATCTCAAAGATGGTGTCTTCTTCCTCAACTTCAAGAATTGATGGGGGCCCTCAAATACTGTCTGCTGGCGTGAGAAAAACAATCCAATCCATAAAAGAAATCGTGGGTAATCACTCTGATGCTGAAATTTATTCCACCCTTAAAGAGACTAATATGGATCCTAATGAAACTGCCCAGAAATTGCTCAATCAAGGTCCCCTTTTTTTTCTTGATCCATTTCACGAGGTCAAAAGAAAAAGAGACAAGAGGAAAGAGGTTACAATGAACGTGGGGCATACTGCATCACAACAGAAAAAGCACAGTGAATCATTAAATCAAGGGAGCAAACACACTGCACATTCTGATCACAGTGTCAGTGGCAAAGGAATTATCCGGAATTCTTTGCCGGATGCAAAGGCTAGCAGAGAGTTCCGTGTTGTGAGGGACAATAGGACTAATCATAAGCCAAGCAGCAAGATAAAGCCTCCCTTGCAAAGCCAAATATCTTCAAATGAACTAGAAGTCCCGAAGTTTGCCAATAAGAGCTTGAACGTGACTTCTAATGAGCAGAAACAGACAGTTGTGCGTCATCTAACTAAATCTTCAAATGGAACGACTGAGACACAGCCTAGGCAGCCAAGGGTTGTTCAGATTAATAATAAGAAAGAATCATTGGAGGATAATCGATCCGCAGTTATAAAGCCTGTTACACAGATTCAAACTAAGAGCACAAATGATTCCCATCTATCTGCAACTTTATCTAACAACTCTGTGGCAGGGGTATACTCTTCATCTTCTGATCCTGTACATGTACCTTCTCCTGATTCCAGACCAGCTGCTAACATTGGAGCAATTAAGCGTGAAGTTGGGGCTGTTGGTGTACGTCGTCTGTCTACAGAAGTTTCTCCCAAAGGTTCATCACCACAATCTAATTCTTTTCCTAATACACATTTGGGACGTGATGGTCCGTCAAGAGATTCATATCGATCTTCTGCTTCCCTGTCTAAAAGCAGCCATCCTAGTCAAGCTCCTGTTAATGACTCGACTTTGAAGAATATTCCAGTCAATAGGCCATCTGTTAATAATCAGCAGGTTAACAGACAGCATCAATCTGGTGGTCATCAAAAAGTTTCTTCACATTCTAACAAGGAGTGGAAACCTAAATCAACCCAAAAACAAAGCACCGGTCCTGGAGTTATTGGAACACCATCAAAATCTGCTTCCCCTCCTGCTGATGCCTTAAAGAATTTGGAAACAGAATCAACTCAGTTGCCATCACATGTAGACATCTCGGACAATGAGAATGTAATTATAGCTCCACATATACGAGTCTCCGCAACTGACAGGTTTCGAGTGACTTTTGGCAGTGTGGGTACAGAGTTTGAACCTTCCAGAAACCCGGGGTTCGAAGCAGTAAAAGTTGCAGAGGAGCCTTTGATTGATCCTTCAGGAAGTGTATCAGTTGCTACTCCTGACTCTTCTGGTGATGAATCTTCTGGAAGTAAGCAAGAAGACTTGAGAGATGAAAATGTTCGCAATTCTGGTAGCAGTTCCCCTGCGTCTGCAGCAGTATCTGAACAGCAATTGACCAGTAGGATAGAATCATCAGGTCCTCAGGATATAGACAAGGGGGCAGAGGTTGAATTGGTGCGTAATAACAGTCAGTCTCACACTCCATCTCAGTCACAACCACACCAGGATCCTTCCCAGTT
ACCAATATTTTCTTCATATGATCCCCAGAGTATGTATGACATTCCGTATTTTCGATCATCAGTCGATGAAACTGCAAGGGTGCAAAGTCTGCAGTTTCCTCAGGAGGCTATAAGCTCACATACAGTAAATAACATCCCATCATCTACGGTAGCCATGGTGCAACAGCCGCAGTTGGCGCAGATGTACCCGCAAGTTCATCTTTCTCATTATGCTAATATGATGCCATATCGTCAATTCCTCTCTCCAGTTTATGTTCCACCAATGGCTGTGCCAGCAGGCTATACTAGTAACCCTTCCTATCCTCATCCATCAAGCGGCAACAGTTACTTGCTGATGCCCGGAGGTAGCTCCCATCTGCCTGGAAGTGGGGTCAAGTATGGAATCCAGCAGTTCAAACCAGTCCCCACCGGCAGTCCAACTGGGTTTGGCAACTTCACTAATCCAAATGGTTATCCTATCAATGCTCCTACTGTTAGTGCGACAGGACTTGAAGACTCGTCTAGGCTGAAGTACAAAGATGTGAATCTTTATGTTCCAAATCCACAGGCTGAGACCTCTGAGATATGGATGAATCCGAGGGACCTACCTACTATGCAATCAGGTTCATACTACAATATGACTGGACAAACACCTCATGCTGCATACTTGCCATCCCATACCAGTCACGCCTCGTTTAATGCAGCAGCACAATCTTCTCACATTCAATTTCCAGGCATGTACCATACTCCACAACCTGCTGGAATCCCCAGTCAGCATCATCCTGCTGTGGGCGGTAATGTTGGAGTTGGATTGGCTGCAGGCGGGCCAGCAGCCCAAGTTAATGCCTTTCAGCAACCTCAGCTGGGCCACATGAATTGGACAGGGAACTTCTGAAGGCCTTTCTAATCCTTGAGAATTTTATTAAAAGGGATTGGAGCTGATTATCTGTGGAAGTCCTCTCCTCTCTTTGCCCCTTTTCTCCTCAAAACAAAACTTAATCTACAAATCAATACATTGAGTTGTGTTCAGTCCTTGCTGGTTTATATCTGTGATTCAGGGGACGGTATGTCAACCTTTATATGGTTGTATGCAAGTTTATTAGGATTAGAGCAGGCTTTCGTTTATAAGTTCGGCCCTATGTTTTTATAGCCCGACTGAAAATATATCTCCAAATGGTTTAATTGTTTTGGAGGTTTATCAGGTCAGGGCAGGCTCTTGGTTTATAAGTCTGCCCTCATTTTTTCAGCAGTCTGTTTTTTCTGATAAATAATCTCAAAATATATCAGTCAGCCCAAATTGGGACATGTAGTTCTAGCATTTACATAACAATGCATTATTTTTTTTGTGTGAACCAAAGTGTCTGTGCAGGAATTCTGTAGTGTAGTATGACTTATGTTTTGAGATAAATGAATCATACTTTGTAATCCCAGTTTCTGAATTATTGGAAAAATAACACTTTTGATGACA\n>XM_006679287.1 Batrachochytrium dendrobatidis JAM81 uncharacterized protein (BATDEDRAFT_11902), partial mRNA 
\nAGACATTTGACTGGAAAAACACATGTTGCCGGCAGTGATGGTGATAATCAGTTTGCTACTTACATCAAGGAGAGATGGGAAGCTGCTGGTCTTCCCATGACCCATATCGATTCGTACTATCCATTGCTCAACTACCCCATCTCTCGCTCGCTTACTTTATTGGAGCCATTTCGATACGATGCAGTGCTGAGAGAACCAGCTATTGCCGAGGACACTACAAGTGGGGATCCAGATGCTGTTCCTACCTTTCTAGGCTACTCTCCTTCTGGAAACGTCACTGCAGAGCTAGTGTATGCCAATTTTGGTGGTATAGAAGACTTTGCTATGCTAGCTAAAAACGGCATTGATGTCAAGGGGAAAATTGTTTTGGTCAGATATGGTGGTGCGTTTCGTGGTTTAAAGGTTCGAGCTGCTGAGCTCTCTGGAGCTGCTGCTGTTTTGATCTTTTCGGATCCTGCCCAGGATGGTTACAAAATGGGTGCTACGTATCCTGACGGACCGTGGAGACCACCTCATGGTGTACAAAGAGGTTCTATCCAGTATCCAACATTTTACCCTGGTGACCCACTTACGCCTTTTATTGCTGCGACAAAAGATGCTCCTCGTATTCCAATTGAGGAAGCACCCATTCCCAAGATTCCTGCAATTCCAATTAGCTACGCTGATGCTGCCCCTTTTTTGAAAGCTCTTGTCGGTCACGGAATTCTTGCCAGAACCTTATCTCTCAATTGGCAAGGAGGTCTTGACATGGATTATTGGACAGGACCTGCTGCAAAAGTAAATATGTATGTCAACAATGATTTCAAAATCAAACCTATTTGGAATGTTTTGTCCATCATTGAGGGTAAACACGAACCCGACCAAGCCATTATTCTTGGCGGACATAGTGATGCATGGGTATATGGCTCAGTTGATCCATCTTCATCCAATTCCGTGATTGTTGAAACTGGTGTTGCACTTGGTAAAATGTACAAGTCTGGCTGGCGACCCGATCGCACCATCATTCTTGCAAGCTGGGATGGTGAAGAATACGGTTTATTAGGCTCTACCGAATGGGTTGAGGATCATGTCGAAGTACTAAATAGAACTGCGATCGCGTACATTAATCTTGATATGGGTGCTTATGGACCACACTTTCATGCTGCTGCTAGTCCTTCTCTCGCTAATCTTATCCGTGATGTAACCAAGGGCGTAAAAGATCCCAACTCGGGAAAAATGGATACACCTCAAGGTCGTGTTCCACGTATTAGCCCACTTGGATTTGGATCTGATTATGTTGCATTTTTGCAATTTGTTGGTGTTGCTGCTATGGATATTAAATTTGAAGGCGACTATGGTGTGTATCACTCCAACTATGATAGTTTTCATTGGATGGAAAAGTTTGGAGATCCCACTTGGGAATATCACAAGACACTTGCTAGTATTGTTGGTCGCATTGTTCTTTCGCTTGCACACGATGAAATTCTTCCATTTGACTATGCCCCTTATAGTTATGAGTTGACTCGATATGCTACAGATGTAAGCACTGCGCTCCAGACTGCTGAATTTCCTATCGAATGGGCAAGTAGTTTGCACGAAGCCATCCAACTTTTTTCAAAAGCAGTAAATAAGTTGAACAAGGCTATTGACGGATTGTCTGATATTGAAACCAAGACGAATGCTGAGCAAATGGATGAGCCCAAGCTTGTTGTTCAAGGAAACGACAACAACGAAATAATGATGATTACATCTTTTGATGCAGACTTGTCAGCATCCAAGAAACACAAAAAACGACCCAATGCCAAGAAGCTTAACAAGATTCTTGGATTTGGGGAGCGCGCCTTTATCAATAAGGATGGCATTCCTGGTCGACCATGGTACAAACATGTTGTTTATGCACCAGGAGAGTGGTCTGGATATGGTGCAGAGATGTTTCCTGCAATTCATGAAGCCATTCGTGCGCATAATGAAACTCGAGTGCTAAATGCGATCGCAGTTGCTTCGCATCAAATTCAACAA
GCTGCAGAGATGCTTTCTCCTTGA\n>XM_023773343.1 Ramularia collo-cygni uncharacterized protein (RCC_08091), partial mRNA \nATGGCGCAAGGTCCAGCCAAGAAGCCAAAGGCACCAGCCGTAAAAACCACGCAGCGCAAGCAGACCGGAAACCGTGTAATCAAACCGAAAAAGGCCGTCCTGATCAAGCAGAATACGATGAAGAAGGCGCATTCCAGTGGTCTGGCAGCCCTGACCGAGAAGTCTCTGGCCAATAAAGCGGGACATTTGGAGCTTTTGAAGGGCGGCAAGAGGGAGAAGCGGGTCGCGATGAAGGAGGCGGCAGAGAAACTAGCGAAGAAGAAGTGA\n>XM_001417720.1 Ostreococcus lucimarinus CCE9901 predicted protein partial mRNA \nATGCTGGACGTGTCGTGCGGACCGGGGCTGATACTCGACCTCTTGGCGCGCCATTCGGCGCGCTCGGGGAAGTGGGAGCGCGTGGTTGGTTTAGATTTTTCTCGAGAGATGGTGACACTGGCGCGCGAGGCGTGCGGCGAGCGCGCGACGGTGGTGGTGGCGGACGCGTGCGATTTGCCGTTCGCCGATGGCGCATTCGACGTCTTGCATTCGAGCGCGGGGGCGCATTGTTGGGGCGATTTGAACAGCCGTGGCGTTCCCGAGTCGGCTTTTCGCGAAATGTATCGAGTTTTAAAACCGACGGGGGAGATACTGGTATCGACTGTCGTCCTGCTGAAGCCGACGACGGTTGAGGAGGAGTACTCGCGAACGCCGAACACGCCATTTTTCGACGAACGCGCGGTGTGCCGGATGATTCAAGACGCTGGGTTTCGCGATGTTGAAGTTATAGCAAAGGATAAGTGTTTCGTGGCCGTCAAGGCTGTTAAGTGA\n>XM_048826826.1 PREDICTED: Caretta caretta laminin subunit beta 3 (LAMB3), mRNA 
\nGCACCCACCCCACAGGAACTTCCTTCCTCAGGTGAGGCTGCATTTAAAAGCAGAGAGTGAAAGGAGACAGCCCATGAGGACTCAGGTGAGAATTCGTATCAGCTGCTCAATAACGGAGGAAGAGGAAAGAAAAGTCTAGCCCCTGAACCAGGTGAGTCCTCAGAAGTATGGAATCTCCCCCCCGGCCCATTGTATGGACATGTTTCATTCTCCTGGCTTTGCCACGACTCCTGGATGCACAGGGCTCCTGTTCCTATGGTGCCTGCTACCCACCTGCGGGAGACCTGCTGGTAGGAAGAATCCATCACTTGAAAGCCTCGTCGACATGTGGCCTTGTGAAGCCTGAGACCTACTGCACATCGTATGAGGAATGGAGGATGAAATGCTGCCGATGCGATTCCCGACTGCCTCATGCTTACAACAGTCACCGGGCGGAGAACATGCTTTCCTCCAAAGGACACATGCGCTGGTGGCAGTCCCAGAATGATGTGAACCAGGTCTCCTTGCAGCTGGATCTCGACAAAAAGTTCCAGCTCAGCAGCATCTTGCTGGACTTCAGGGCGCCTCTGCCCGTGGGGATGCTTATTGAGCGCTCCACCGACTTTGGCGAGACCTGGACGATCTATCAGTACCTGGCCTCTGACTGCGCCGCTACCTTTCCACGGATCCCCCAAGGCTCCCCCCAGAGCTGGCAGGACGTGCGCTGTCAGGAACTGCAGAGCCACCAGGGGCACCCTCTGCACGGGGGGAAGGTCAAATTCAACCCCCTTGACCTGGCATCCGGCATCACCACATCTCACAGCCAAAGCATCAGTCACCTGGGAGAATTCACCAACCTGAGAGTTAACTTTACCCAGCTACCTCGCCTCCCACAGCAGGGCTACCGCTCACCCAGTGCCTTCTATGCTGTGACCGAAATGCAAGTGCAGGGAAGCTGCTTCTGCCATGGACACGCAGACCGCTGTACTCCCTCCAGAGACCCCAATGCCGTGATGCAGGTTCACGGACACTGTGTGTGTCAGCACAACACGGCCGGCCCACACTGTGATCGCTGTGCAGCTTTCTACAATGACCAGCCTTGGAGGCCGGCAGAGGACCGCAACCCCAATGAATGCCGGAGGTGCAATTGCAACGGTCACTCGGAGACGTGCCATTTTGACCCAGCTGCGTACCAAGCCAGCGGTGGGGTGAGTGGAGGTGTGTGCGACGACTGTCAGCACAACACAGCGGGGAGGAACTGCGAAAGCTGCCAGGCCTACTTTTTCCGCAACCAGCGGCAAGATGTCACCCATCCGGAAGCCTGTCTGCCTTGTGAGTGTGACCCGGACGGCACGGTGCCTGGGTCCAGCTGTGACCCTCTGACCGGACGCTGCGTTTGCAAGGAGAACGTGCAAGGGGACCGCTGCCATCTCTGCAAGCCTGGGTTCACCCAGCTCACCAATGCCAACCCTCTGGGATGCCACAAATGTGCCTGCAGCATCCTGGGGACCCGCCAGGACGCACCCTGCGACGACGAAACAGGGAGGTGCTTCTGCCTGCCCAACGTGATGGGAGCCAATTGCGATCAGTGCTCTGCCAATCACTGGAAGATTGCCAGCGGCCAAGGCTGTCAGCCGTGCAACTGCGACCCTCGCAACTCCTTCAGCCCACAGTGTAACCAGTTCACAGGGCAGTGTCAGTGCCGGGAAGGCTTCGTGGGGCGTACCTGCTCCGCTGCCCAGCTGCGGGTTTGTCCAGATGGGTCCTATGGTGACGTCAGGACAGGATGCAGAGAGTGTGACTGCAATTTCCAGGGCACGGAGGGGATGGGGTGTGACAAGACCACAGGCAGCTGTCTCTGCCGCCCTGGCTTTACCGGGCCTCGCTGCGACCAGTGCCAGCGGGGTTTCTGCAGCAACTACCCCCATTGCGAGACGTGCCACCCCTGCTTCCAGGCCTACGACAGCGACATTCGCCGGTTCGGCCTGCGCCAAGTCAGCCTGAGAAACTCCACCTCAC
GACTGCAGCTGGGAACAGGGGGCGCTGGCTTCAGCACTCGTGTCTTGGAAGCAGAAGGCAATGTTCAGCAGATTCAGGGGATCCTCGGCAACCCCCTAGTGACGCAGCAGGGCCTGGGTCAGGTGTCCAGCATGCTCACTGCAATCAGACAGCAGGTCCAGGGCATAAATCCTGACCTACCCTTTGTGAATGACACCTTCTCTCTAGCCAATGATCTTGAAGCCCTGGACAAGAGCCTGCTTTTCGTTAATGGGCAGTACCAGATTAAGAAGACCCAGTTTGAAGCCAGCCGCCACACAGACCTTTCAGGAGCCTTCAAGACTGTCAGCTCTGCGTACCAGAGCTCCACCAACGCCAGCTACCGCATAACGGGCACTTCCAGCCTGCTGGCTCAATCCAGAGAGAACCGGAGAATGACTGAGGGGCTGGAAAGCAGCTTTACAGACCACCCCTCCAGGCTGGAGGCCCTCCAGGGCGAGATGGCCTCCTCCCCCAACTTGACACCAACTATAAATAAGATTTGCAGTGGCGTCAGATCCAAGGCCTGCACCCCTGGGCACTGTGACGGGGAGCTGTGTCCACAGGACAGCACAACGGGGTGCGGAACGGGCCTCAGCTGCAGAGGGATCATTCCACTGTCAAGTGGCGCAGTCAGAACTGCTGAGAAGACCACCAGAGAGCTCGATGGCATAAAGACTCAGCTCCAGCGGACCATGCAGATGATCAGGGCAGCAGAAACGGCTGCAAACCAAATCCAAAGCAATGCACGACGTCTCGGGGACCAAGTGAGTGTAACCAGGACCCAGATAGAAGGAGACGTCCGACGCATCCAGCAATTCATCCAGCAAGTCCGCAACTTCCTGTCAGACCCAGCCACCGACCCTGCCACCATCCAGGAGGTCAGCGACTATGTGCTCTCGCTCCGCCTCCCAACGGACACTGCTGCCGTCCTGAGGAAAATGACTGAGATCCGAAACCTGGCTGCTAAGCTGCAGTGTCCTGAGAGCATCCTCACCCAAACAGCTGGTGATATCGCTAAGGCCAAGAGGCTTCAGCAAGAGGCTGAACAGGCAAGGAACCGAGCAAATGCTGTAGAGGGCAACGTGGAAGAAGTGGTGGAGAATTTGAGACAAGCAAACACAGTGCTCCAGGAAGCCCAGGATGCTATTAGTGGCTCCAGCTATTCCCTTCGGCTCATCCAACTCCGCATTGATGAGATCCAGGCTGTCCTTGGTCCAACGGAGAAGAGTATGAGAGACATTACTGATCAGCTGGACAACTTCACCGAGAGAATCAGCCAACTGCGGCACAGGGCGGAGCAGAATCAGTTGCAGGCCACCGATGCTCAGCAGAGAGCAAAAGAAGCCATTGAGCAAGCAAGGAGCACTCAGCAGGGATTTGAACGGGTAAAACAAAAATACGATGAGCTAAAGAGGCGGATGGGACAGAGTTCGACACTGGGAGTGCAGGGCAGCAGGATCCAAAGTATCGACAGGGAGGCAAAAGCGCTCTTTGAAGAAACCTGGGCTATGATGCTCAGGATGGAAAGTATAGAAATGGAAATTCAGAAAAGCAACAATGCATTAATCATCAAGTCAGCCAGCCTTGCAGGCCTGGAGGAGCAAGTGGAAAAGATCAGCAGTCATATCCATGAAAGAATCGCCTACTACACCGGTTGCTAATCAATCAATGAGCTGCTGGGACTCCATCTTGCCCTGTAATTGCAGAGTCTGCCTTCTGTTCAAACACTGACTGGGGTAGTTAGCCCCCTCTCATAGAATTTTCTTGTTCTCACACTTAGTGTCTTTGGTAACAGAACTGCTGTAGCTTTAGAAAATGCTAGCATGGAGCCCAAAAGGACAAAAATGCCTCTGGAGAGAATGAATGTTATATGGCCTGGCTGAAGCAACCCTGGGAGGCTCTAGGAAAGGGGGAAGATATAACTAATGAAAAAAGCCTTTTGGAAGGAGTTATTTCTGTATGAGGTTTGTTAATGTGAC
CGGGGATGTTTGTTTTAGCACCTGGATTTTACCTTTTGAATGACAAAGACCAGAGTTGAGGTTTAACTTTTCTGGTACAGTGCATTTAGTTCTTCTAAGGGAGTCATAAGAGGAGTAGAACTAAGGCTACAGATAAATATAGGACCAGATAACTGAATAAGCCCTATTTATACAAACGTAAGAGCAGTTGTGCTCTCAGGTGGAGTTAGATACTATCCAGTTGGACTTAGACAATATGTTGCAAACTGAAGCCTGTAGGGAAC\n>XM_019557682.1 PREDICTED: Lupinus angustifolius nucleolin 1-like (LOC109325361), transcript variant X10, mRNA \nGTCGCATATAAAATCATTGTTATCAGCCGTAGCCTCATTCTCTTCCTAGCTTCTCAAAACCCTAAACCCCTTTCTTTCGTTGATTCATTCCTCTCTATTCGATGGCCAAGTCCAGCAAGAAATCCGCTTCCAAAGCTGATGCTGCTCCAGCTGCAGCAGTTCCACCTTCCAAGTCTGCCAAAAAGAGCAAGAGGCAGCCAGAAGATGAAATTGAGAAGCAGGTGAGTGCTAAGAAGCAGAAGGTAGAGGTGGTTGCCCAGAAGCAAAAGAAGGAAGCAAAGCTGCAAAAGGTTAAGAAGGAAAGTAGTTCAGATGATTCATCATCAGAATCTGAAGATGAGAAACCTGCTGCAAAGGTTGTTGTTCCTTCAAAAAAGCAACCAGCTGCTGAGAAACCAAAGGTGCAGAAGAAGGAAAGTAGTTCTGATGATTCCTCTTCAGAGTCAGAAGATGAGAAACCTGCAGCAAAGAAAAGCAAGCCAGCACCCCCTTCTAGCTCTTCTGATGAATCATCTGATGAGGATGAAGCTCCAAAATCCAAGGTGGCTGCTGTTAAGAAGGGCTCTGCTCCCGCAAAGAAGAATGTGCAGCCTAGTGAGAGCTCTGAGTCATCTGAGTCTGACTCCGACGACAGTTCTGATGAGGACAATGCAACTAAACCTTCCAAGAAATTGCCTGCCGCTGCTGCTAAGAAATTGCCTGCCGCTGCTGATAAGAAATTGCCTGCTAAGAAGGCTGAATCAGACTCATCCTCTGACAGTAGTTCAGATGAAGATGATAAAAATGCTGGCAAGTCGGTGCCTGTTTCTAAGCAGCCCACAAAGAAGTCAAAAAGTAGTTCTGATGAGAGTGATTCAGATGATGAAGAGAAGAATGCTAAAGCTTCTAATGGTAACAAGAAACCCACACCTGTTGTGAAGGTGGTGAAAACTGAGTCCAGTGATAGCTCATCAGACGATGAGGTAAAGATGGATGTTGATGAGGATGATAGTAGCTCTGATGAAAGTGATGAGAAGCCTCGAAAGAAAAAGCCTGTAAAAGACTCAAAAGAAAGCTCTGATGATAGTTCAGAGAGTTCAGATGATTCAGAGGATGAAGATGACAAGAACAATTCCAAAACTCCCCAGAAAAGTGTTAAGGATGTGGAGATGGTTGATGCCTCATCTGGAAAGAAAACTCCTAATACCCCGGTAACACCGAAAGGAGAATATGGTGGATCAAAGACACTATATGTAGGCAACCTGTCATATAGTGTGCAGCGGTCTGATGTGGAAAATTTCTTCCAAGATTGTGGAGAAGTTGTCGATGTTCGCCTTGCAATAGATGATGATGGGAGATTTAAGGGCTTTGGACATGTTGAATTTGCAACATCAGAGGCAGCCCAAAAGGCGCTTGAGTTGCGTGACCAAGAACTGTTGAACCGTCCTGTCCGGCTTGATTTAGCTCGTGAAAGGGGTGCATATACTCCCAACAGTGGGCCTAACAGCGGTAACTGGAACAACTCATCCCAGACTGGTGGAAGAGGCCAGTCTCAGACATTATTTGTGAGGGGTTTTGATAGATCCCTTGGAGAAGATGAGTTAAGGTCTAGCCTGGAGGAGCATTTTGGTACATGCGGGCAG
GTTACAAGGATATCTGTGCCAAAAGATTATGATTCTGGTGAAATTAAGGGGTTTGCTTACTTGGACTTCAAAGATGGTGAAGGCTTTAGCAAAGCTCTAGAACTCCATGAATCTGAACTCGGAGGTTATACATTATCAGTTGATGAAGCCAAACCTAGAGACAGTCAAAGCTCTGGTGGTAGAGGTGCAGGTAGGAGTGGTGGTGGCCGCTTTGGTGGTGGAAGAGGTGGTCGATTTGATGGAAGAGGCAGTGGTGGACGATTCGGCAGCGGTGGTGGTGGTCGATTTGGTGGTGGTGGCCGATTTGGTGGTGGGCGTGGTCGTGGAGGACCAAGCAGACCAAGCTTTGCCCCAGAAGGGAAGAAGACCACTTTTGCTGATGAGGATTAGAGTGTCTGGAATCTGAAGTTTACTATTTTATTATGTGCTTTTAATTTCAGTTTTTTGCTCCAGTTTTGGTATTTGTTTGTATGAATTGGTAGAAATCAAGTGTATTTGGGATTTTCAGACAATGTCTTATGGATTTGTAGTTCTGCTACCTATCCAAACCATGTATGCAGTTTGTTAGGTAAAGACATATTCAGAAATATATATTTATTATATATTTAA\n>XM_039356821.1 PREDICTED: Crotalus tigris PTPRF interacting protein alpha 1 (PPFIA1), transcript variant X7, mRNA \nGAGTTTGCAGCACTTACTAAAGAGCTCAATGTATGCAGAGAGCAACTCCTTGAAAGGGAAGAGGAAATTGCAGAATTGAAAGCAGAAAGAAACAATACAAGAGTCAGTTCATCTTCTGTTACTACTAGAACATTTGGAATGCCTTGTCTCCCGGCATGAAAGATCTTTAAGAATGACCGTAGTAAAAAGACAAGCTCAATCGCCAGCTGGTGTTTCTAGTGAAGTTGAAGTTCTCAAAGCACTAAAGTCTCTATTTGAACATCACAAAGCCCTTGATGAAAAGGTAAGAGAAAGGTTACGAGTAGCACTTGAACGATGTAGTTTGTTGGAGGAAGAACTAGGTACTACACATAAAGAGTTAATGATTTTAAAAGAACAAAACAATCAGAAAAGAACACAAGCTGATGGAATGCCTGATATTAATCATGATCAGGAGAATATACCTAGCACTAATGGGAAGAGATCTTCCATTGGCTCTTTGAATCATGATGAAGATCTTGCTAAAGTAATAGAACTTCAAGATATCATAGAAAAGCAAACTAAAGAACAGTCACAAATGAAAGAAAGAATTACTGCCCTTTCTAATAGAGTAGCAGAACTGGAAGAAGATCTTGATACTGCTAGAAAAGATCTAATCAAATCTGAGGAAATGAACACCAAGTTGCAAAGAGACGTACGAGAGGCAATGGCTCAGAAGGAAGATATGGAAGAAAGAATTACAACTCTTGAAAAACGCTACCTCGCTGCACAACGTGAAGCTACATCTGTGCATGATCTTAATGATAAACTTGAAAATGAAATTGCTAACAAAGATTCATTGCATCGACAGAGTGAAGACAAGAATAGGCAGTTACAAGAACGATTGGAACTGGCTGAACAAAAATTGCAGCAAACTCTGAGAAAAGCTGAAACTCTGCCAGAAGTAGAGGCTGAATTGGCTCAGAGAGTTGCTGCACTTAGTAAGGCTGAAGAAAGACACGGAAACATTGAAGAACGATTGAGACAAATGGAAACACAGCTAGAAGAAAAAAATCAAGAACTATTAAGGGCCCGTCAAAGAGAAAAGATGAATGAAGAACATAATAAACGTTTATCTGATACAGTTGATAAACTTTTATCTGAATCTAATGAAAGACTTCAGCTTCACCTTAAAGAAAGAATGGCAGCTCTGGAAGATAAAAATTCCCTTCTCCGTGAAATTGAAAGTACCAAGAAACAAGTGGAGGAGCTTCAAAATGAAAAGGATCAGTTGGTAGTAAACGTTGAAGCAAT
AAGGGCTGAAAATGACCAGTTGAGGATCAGAGGCCCTGCTCTTCATCATAGTAGGCCACATTTAGGTAGTGTACCAGATTTTAGATATCCACTGGCACCTTCAGTTATAGCAGACAATCAGACAGATTCCTACAGCACCTCAGTTCTACGACGTCCACAGAAAGGACGCTTAGCAGCTCTGCGAGATGAGCCTTCAAGGGTTCAGACTCTTAATGAGCAAGATTGGGAACGTGCACAACAAGCAAGTGTATTGGCAAATGTTGCACAAGCCTTTGAGAGTGATGCTGATATCTCAGATGGTGAAGAGGACAGAGAAACTATATTCAGCTCAGTTGATCTCTTGTCACCTAGTGGTCAGGCAGATGCCCAGACCTTAGCCATGATGCTTCAGGAGCAATTGGATGCCATCAATAAAGAAATTAGATTGATCCAAGAAGAAAAGGAAAACACTGAGCAAAGAGCAGAGGAGATAGAAAGTCGTGTTGATAGTGGGAATTTAGACAATCCTGGTCGATTCCGATCAATGAACTCTATCCCACCTCCCTTTCCTAGTGGAAACCTTTCTGGTTCCTCTCCACCAGGAAGTGGGCTTTCTACTCCTCGAAGAATGCCACACAGTCCTGCTCGAGAAGTGGACAGACTAGGAATTATGACATTACCTAGTGATTTAAGGAAACACCATAGAAAGTCTCCAGTTTCTAGAGAAGAAGTTAGAGATGACAAGGCTACAATAAAATGTGAGACCTCACCACCTTCTTCACCTCGATCACTGCATTTGGATAAATCTTATAAAGGAGCTTTGCATACAATGAGCCAGGAAGATATAAGAGATCTTCGAAATTCTACAGGCTCTCAAGATGGACAGATAAGCAATCCCAGTAGCAGTAATAGCAGTCAAGATTCTCTCCACAAAGCTCCTAAAAAGAAGGGGATCAAATCCTCAATTGGCCGCCTATTTGGTAAGAAAGAAAAAGGTCGATCTGGACAGATGAATAAAGAGATCCTGGGACAAGTTAGTGTATTAGAAGCAGAAAGTTCAACTCAAGATGGTTTGGGGCTTGGAAAACTTGGAGGACAAGCAGAAAAGAATAGAAAACTGCAAAAAAAGCATGAACTTCTTGAAGAAGCTCGGAGGCAGGGTCTGCCTTTTGCTCAATGGGATGGCCCCACAGTGGTTGTCTGGCTAGAGTTATGGGTTGGGATGCCAGCTTGGTATGTGGCTGCTTGCCGTGCAAATGTGAAAAGTGGTGCTATAATGTCAGCCTTATCGGATACTGAAATACAGCGTGAAATTGGAATCAGTAATCCTTTACATAGGTTAAAACTGAGACTTGCCATACAAGAAATTATGTCACTAACGAGTCCATCGGCTCCTCCTACATCAAGAACGACTACAGGAAATGTCTGGGTAACGCACGAAGAAATGGAAAATCTTACATCTACACCACAAACGGAAGATGAGGAAGGAAGCTGGGCTCAGACTTTAGCCTATGGTGATATGAACCACGAATGGATTGGCAATGAATGGCTTCCTAGTTTGGGGCTTCCTCAGTATCGCAGTTATTTTATGGAATGTTTAGTTGATGCTAGAATGTTGGACCATTTAACTAAAAAAGATCTTCGTGGTCAACTTAAAATGGTAGACAGTTTTCACAGAAATAGCTTCCAGTGTGGCATTATGTCTCTCCGAAGATTAAATTATGACCGAAAAGAACTTGAAAGAAGAAGAGAAGGAAGCCTGAATGAAATTAAAGATGTCCTTGTTTGGAGCAATGACAGGATGATTCACTGGGTGGTATCAATTGGCCTTAAAGAATATGCAAATAATCTTATAGAAAGTGGAGTTCATGGTGCACTTCTGGCCTTAGATGAAACTTTTGATCACAATGCATTAGCTCTGTCTTTACAAATACCCACTCAGAATACACAGGCTCGTGCTGTCTTGGAAAGGGAATTTAATAATCTTCTTGTGATGGGTACAGACAGAAAGTTTGAAGAGG
ATGATGATAAAAGCTTTAGACGTGCACCGTCATGGAGGAAGAAGTTCAGACCAAAGGACATAAGGGGTTTAGCTGCTGGATCAGCAGAGACCCTCCCTGCAAATTTTAGAGTTACCACTTCAATGTCTTCACCTTCTATGCAACCAAAGAAGATGCAGATTGATGGCAATGTATCAGCAACACAAAGATTGGATTCTGCTACAGTAAGAACTTATTCATGTTAAAGACTTTCGTTGTTTATCCCCACTATTTCTACAGATGAACTGAACCATTTTGAACCCAATGACCACATTTTGGAAACAGCTGAAATCTTTAATCTGTTAATACTTGTTAAATCAACACTTTGAAATATTTTATTACAGAGTTTTTAATTAGCAGGTGAATTTGTGAGTACTATAAAAAGTATTTTAGATTAAATGTTTCTTATGTGGGTGTATGTGTGTCCCATTACTTAATTTTCTATTAAAATTGTCAATCAAGTTATTACTTTATGTTAATTTTAGTATTTTCATCTGAATGTACTGTAATGCTTGTATGTATCTGTCCCTGTAAGCAATATAGGGCTTTATTGTAAATTATGCAGTTATTGTAATTACCAATAATGAATTTAATAAAGTGAAGGTGAATTTTTTTTTACAATCTTTGTAAAGACATCATGACACCAAGCAATATCAATATATATATATTGCTGTTTGAAAAATGCTAGCTAGCTCTAAAAATTGAAATAATTCCTTTTTTTCAGAGAGGCATATGTTTATTAACAAAACAGGCATGGTACCTGATTCCATTTCCGTTAGAAACTGTACCTTTTAAACTTTTAACATTTGATTATTTAGTGTGTATTCTTATTTAAGGCTTTTGTTTAGTATAATTTGCTTTATATTCATAAATGTGGGAATTTGTAGAACATTATGAAACATATGAGACCTAATGAGGTCATTTATAACTACTTTTTGTGGCTGTATTTGTACAGTCTATGTTCATTGATTGAGCATAAGCAAGCCATAAGCGGAAATATTTTCTGTTAAGCAAGAATAGTTACTACATATTTTCTGTTAAGCAAGAATAGTTACTACATAAGAGTACTTGACAGGCAACATGGAGTGCTCCCTTTCTGGGTTTTGATGTGAAAATGTTTGTGAAAAGATATCAATGCAGTTCTTTTAATGGACCAATCATGATGCACTGCTGCCTCATGACAAAGATGTTAAGAGCATAACATATGGAGGCATGTGGTAGTGCAACTATTAAAAAGGCCTTACTTTTCTTATGTCATCTTTTAGATATATTTATAAGCTTGTTTTTAAATCCAGGCAGATTTTTTAGTTGTTAATAGTTTGAGTCATTGCAAACAGTATAAGTAGAAAATGCATCATTCATTTTTAAATAGCATCTTATGAAGCCAGCAAGGAGGAGATTCAGATCATGGTGCATTATTTATTATACAATAATATACATGGCATGTCTTTTTTCTGTATTTGGTTTTGGCTCTTTTTAAATTGTACAACTTGAATTCATTGTTACTATTTTTTCTATTAACCTTATGTGTACTTTGAATAATGTAACAAATTATGTACAGTCTAAGTACTTTGAACTATTTTTATCACAGTATTATTTATTGCTTTCAATAAATTTCTGAAGCATTTTTCCACTGCCAATAAAATGTTACTATCTTGTGATGAGGCTTGAGATGTTTTAAAATGGTAATTCAGATATTAATGCAAATGAAATATCTTGTGACGTATTAATGCTTCCTTTGGCAAAGACAGTTTTATAAGATCCTTTTCACTTTAGAAATCACACTCTGTATATTATATGTAAGATATACTATTACTATATAAACTTATCAAAATGATTTGTGCAAAAAATTTAAATTCTGAATGTTAATACATTCAAAGAAGATATATTCCAAGGAATGATTGTATGCATTAAATCTACCAGATCTCAGGTCCATAAATCCAGATAAGACTATCAGATAGCAGCAAAGAAATGTGGAAGAC
TCAATTTTTTTTACTGCTCAGTATTGATTATATGCATGCATATCTTAATCTGAATTTTAGATACTAAGACTAAGGAATTTAATCTTCATTGTGATTATACTGAAGCTATATATAAAATGATCAAACAGA\n>XR_002477788.1 PREDICTED: Aotus nancymaae transcription initiation factor TFIID subunit 9-like (LOC110567331), misc_RNA \nATTACGGTTCTTCTTTTTCCAAGTGAATATCTTTTTCCTTCTGTTCTTTAAATTATAATGTAATACATGATCACAAGAGACAAATCAGAAAATACAAGGAAGCAGAAATAAAGAAATCAACTTCATTTGCACTCAAGGAAAAGAAACTGTCATCTCTCAATGCAGGTCCTTCAGTATCCCTTTATTCTGTTCATTCATTGATGTAAAAAGGATTTGTGAGTTACCGATGTGCCAGGTGCTATGCAGGTGTTACACATAAACTCATCAAAATACAGTTCCTTCCCTAAAACAGATCAACCAAGTGGAGGCAGAGAACTGAATAAACAATTATACCTAAAGTTTTCCTACATATACAGCTATCTATATATGTAGATACAGTCTTTGCAAAAATTAGAATATATCATGAATGCTATTAACCTAATTTTGGGCCTAATACATCAGAAAAAAATTTTCCTGTCAATAGATTCAATCCTTGCTCATAGCCATTACTGGAGGTAATAAAGAGAAAAAAAAAATAGATTCAATCCAGAACAACAAAACAAACTCTAGAGCTAAACCTAATAAGAATCATAGTCGGGGGAGCAGTTGCAGCGAGGACCATGTTGCTTCCGGACATCCTGCTCACCGGTACACCAGGGGGTTGTAAAAACCACACTAGGCAAAGAACTTGCGTCAAAATCAGGACTGAAATACATTAATGTGGGTGATTTAGCTCGAGAAGTCTGATCATAGGATATCATGGAGTCTGGCAAGATGGCTTCTCCCAAGAGCATGCCGAAAGATGCACAGATGATGGCACAAATCCTGAAGGATATGGGGATTACAGAGTATGAGCCAAGAGTTATAAATCAGATGTTGGAGTTTGCCTTCCGATATGTGACCACAATTCTAGATGATGCAAAAATTTATTCAAGCCATGCTAAGAAAGCTACCGTTGATGCAGATGATGTGCGATTGGCAATCCAGTGCCGCGCTGACCAGTCTTTTACCTCTCCTCCCCCAAAGAGATTTTTTTATTAGATATCGCAAGGCAAAGAAATCAAACGCCTTTGCCATTAATCAAGCCATATTCAGGTCCTAGGTTGCCACCTGATAGGTATTGCTTAACAGCTCCAAACTATAGGCTGAAATCTTTACAGAAAAAGGCATCAACTTCTGCGGGAAGAATAACAGTCCCGGGGTTAAGTGTTGGTTCAGTTACTAGCAGACCAAGTACTCCCACACTAGGCTCACCAACCCCACAGACCATGTCTGTTTCAACTAAAGGTGGGGACTCCCATGTCCCTCACGGGACAAAAGGTTTACAGTACAGATGCCCACTTCGCAGTCTCCGCTGTAAAAGCTTCAATTCCTGCAACTTCAGCAGTTCAGAATGTTCTCATTAAATCCATCATTAATTGGGTCCAAAAACAATTCTTATTACCACTAATATGGTGTCATCACAAAGTACTGCCAATGAATCATCAAATGCATTGAAAAGAAAACATGAAGAAGATGATGATGACGACGACTATGATAATTTGTAATCTAGCTTTGCTGCATGTAACGTGTACTTGATCTTGAATTTATTATACTGATATTAAACATGCATGCTGGATGTTTTCAAGTTGTGTTTTAGAAAACTTTAATAATATTTAATGAGTAAATACAATTACCATACTTTTCAATTTAAATGAAGGTTCAGCCTTAAAAGTGTAAGAAAAATAAAGTTGTCATTCATTAAAAAAAAAAAAAAAAAA\n>XM_0
35574191.2 PREDICTED: Spodoptera frugiperda proline-rich protein 36-like (LOC118262654), mRNA \nGTTGGACAGGCAGCGGCGCGCCACCAACATCCGCGCCGTGTCGAGGCGAGAGAGCAGCCACAGTCAGTCCGGCGCCGACAACCGCCACGCGAACACGTATTCTCCAAATAATGGCCGCCGCCCACACGCACCCGGCCCCCGCGCCCTCAGACCGTCGCTCAGAGGGCCGTGCCGGTTCCCGCCGTATATTCCCACCACAATTTAAGCTGCAAGTTCTCGAAGCGTACAGGCGTGACGCTCAATGTCGCGGAAATCAACGAGCTACAGCAAGAAAATTCGGAATACATCGTCGTCAAATCCAAAAGTGGCTTCAAGCGGAACCTGCACTTCGAGCAGCACTTCTGAGGCGAGCGCCGCAACCAGCGCCGTCGCCACCGCCTTACGCAGCTGGATCTCCAGAGAGCGCACGGCTGCCTTCGCCGCCACCAGTGACAGTAGCCACACCGGTGCAAGTGCCCACACCTTTACCAGTACCAGTGCCCGTTCCTGTGCCTATGCAAATTTCTGAGCCCATCGACCTGTCAGTACGTCGACCTACACCACCACCTGCGCCTCAACCGGCCTATGTGCCACCTACGGCACCTTGTCCGACACGCAAGCCTTTCAAACTATTCCGGCCGTATCTACTTGAAGACGAAGAAGAAAAGCGACCATCGCTGGCATCGCTGCCTGTGTCTAGCGGCGTTCATGTGTCAGCGTTTGTACCGGTGCAAAGCGCGGCGGGTTGCGCGCTCGCTGCGTGCTCCGCCCCGCGATGGTGCTCACCTATTCCCTCCTTCCCGGCTCCACTCAGATGAGAGTGTGCCGTCGGAGCCCTGCTCCGTAACTCCTGTGATCTAGTCGCTGACGCCCGCCTGGCGCCGCCTGGGGCGTAGCCCTTTATCATCGTGCCTTAATGTTCACGCCGCCATAGTGCATTATGCCGTCATCACCCGATGACAGATATTTTGTGTATAAAGTTTAAGATTGTATTTTTATATGTGGGGTTTATGAAGCTTACCTACATTTATAAAGAATATAAATATTATAACGTCTATTATTATTATTATTGAATAAATAAAGAGGATTGTTTACTAAAA\n>HQ100547.1 Uncultured Brachymonas sp. 
clone F5OHPNU07HZVCK 16S ribosomal RNA gene, partial sequence \nTGGATGATGTGGTTAATTCGATGCAACGCGAAAACTTACCACCTTGACATGGCAGGAATCCCGAGGAGATTTGGGAGTGCTCGAAAGAGAACCTGCACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGCCATTAGTTGCTACGAAAGGGCACTCTAATGGGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTACATCCCGGGCTACACACGTGCTACAATGGCAGGTACAGAGGGCTGCGAAGCCGCGAGGTGGAGCGAATCCCAGAAAACCTGTCTCAGTCCGGATTGAAGTCTGCAACTCGACTTCATGAAGGCGGAATCGCTAGTAACCGCGAATCAGCAGGTCGCGGTGAATACGTTCCCGGGCCTT\n>XM_030296100.1 PREDICTED: Lynx canadensis ADP-ribosylation factor 2 (LOC115501167), transcript variant X3, mRNA \nGCCCCCGCGCCAGTCGCCATTTTGCAGAGGGGAGCCGAAATCCGAAAGGCAGTGGTGTGGGTAACGGTGCCCTGTGCGGCGGCAGGTAACAGAATTCAGTCACAATGGGGAACGTTTTTGAAAAACTGTTTAAAAGTCTATTTGGGAAAAAAGAGATGCGGATTCTTATGGTGGGTTTGGATGCGGCTGGAAAAACCACCATCTTGTATAAATTGAAACTGGGAGAGATTGTGACTACCATCCCTACAATAGGTTTCAATGTGGAAACGGTAGAATATAAAAATATCAGCTTCACAGTCTGGGATGTTGGTGGCCAGGACAAAATCAGACCTTTGTGGCGACATTATTTCCAGAACACCCAAGGTCTGATTTTCGTGGTTGACAGTAATGACAGAGAGCGGGTCAATGAGGCCCGAGAAGAACTAACCAGAATGTTGGCAGAAGATGAGCTCAGAGATGCAGTTTTATTGGTGTTTGTAAATAAACAGGATCTTCCGAATGCTATGAACGCAGCGGAGATAACAGACAAGCTCGGCTTACATTCCCTCCGCCAGAGAAACTGGTACATTCAGGCCACTTGTGCCACCAGTGGAGATGGGCTTTACGAAGGCCTGGACTGGCTCTCCAACCAGCTCAAAAACCAGAAGTGATCGGAAGCGATCCCTTCCCCGTGTGATGGAGGTCGTCAGATAGTACACACAAACTGATGATACGCCGTGGAGATGAATTTTTTTTTCCCTTTGAAAGTTTCGATATTCTTCTCACCTTTTTTGGTAGCAGCTTTATTGAGACAT\n>XM_052553176.1 PREDICTED: Carassius gibelio lipopolysaccharide-induced TNF factor (LOC127953842), transcript variant X2, mRNA 
\nTCAGATTGTCTCAGATAAAAGCACCCATCAAGGCCATGGCAAGCGCACCCCCGCTGGAGTCATCCACTCTTGTGGGACACCCTCCTCCTCCCTCGTATGAGGAGGCACTGGGATCAAACCCGCAGTACCCACCAATGCCCTACGCTCCTGCTCCTGCTCCAGACATGAAGACATCTGTGCCTCCGTATCCAGCACAACCCTACTGTCCCATGTATCCACCACCACCAGCTCAACAAGGTCAACCCATCACCAGTCCTGTTGTATCTGTGCAGACCGTGTATGTTCAGCCTGGGCTGGTGTTTGGGAGTGTCCCGGTGCAGGCACATTGCCCAGTGTGCTCACTGAATGTGATAACTCGCCTGGAGTATACATCAGGAGCATTAGCTTGGCTCTCTTGTGCAGGCCTGGCCATCTTCGGTTGTATCTACGGCTGCTGCCTGATTCCCTTCTGCGTGGACAGCCTGAAGGATGTGATACACCACTGTCCGAACTGCAGCAGCGTTTTAGGAGTCCACAAGAGAATCTGAAGCAGCTGCAGAACATATGAATGAGTTGTGTAACATACCACTCTGTGTTTATAATGGGGAAACGTTACAGTCAATTCATCTTTTTAGCAAGAGTTAATTCAATATCTGTTGCACCGACACACACATATTCAAATGTATGCGCGCACGCGCGCACACGCACACACACACACACACATATCTTAACATACTTGTCTATTCAATTTAAAAACTGTTATTTGACCAAAAACGAACTCTTTTTTTTTTTTATAATTGTATCACAATTGTGAAGGAATCTTTATAACATTAGATTTACGTATAAACAGTGCAATTATTCTCAATTATATTTTCTGTAATCAAACTGATGTAGGGAAATATTATACAAATAAATATGTATATGCTTTTCACACTTAAA\n>XM_030451652.1 PREDICTED: Calypte anna neurexin 3 (NRXN3), transcript variant X4, mRNA 
\nATGGGCTTCACTCTGCACTCCATTTACTTCACCTTGAAGGTGAGTTTGCTGCTGGGCTCATTGCTGGGTCTCTGTTTGGGTCTGGAGTTCATGGGAATTCCCAATCAGTGGGCCCGCTACCTCCGCTGGGATGCCAGCAGTAGGAGTGAACTCAGCTTCCAATTCAAGACCAACGTCTCTGCTGGGCTGCTCCTCTACTTTGATGATGGTGGTGTCTGTGACTTCCTCTGTCTGTCCCTTGTTGATGGGCGCATCCAGCTCCAGTTCAGCGTGGACTGTGCAGAGACTACAGTTATCACAGACAAGCAGGTCAACGACAGCAACTGGCACTTCCTGATGGTCAGCCGCAATCACCTTCGGACAGTGCTGGTACTGGATGGTGAAGCCAAGCCAGGTGAGGTGCGTCCACAACGCCAGTATATGAACATTGTCAGTGACCTTTTTGTTGGTGGAGTCCCACTGGACATCCGTCCTGCTGCCTTGACTCTTGATGGTGTTCTGAGTGAGCCTCCATTTCAAGGATTTATCCTGGATCTGAAATATGGCAACTCTGAGCCGCAGCTCCTGGGCAGTCAAGGGGTGCGACTGGAAATGGAAGGGCGATGCTCAGAAAACCCCTGTGAAAATGGTGGCACATGCTTCCTCCTGGATGGTGAGCCACACTGCGACTGCTCAGCCACTGGATATGCTGGCAAACTGTGTTCTGAAGATGTCAATCTTATTCCAGGACTCTCACACCTGATGATGGGTGAACAAGGTAGAAGTAAAGCACGAGATGAGAACATGGCCACTTTCCGTGGTTCCGAATACCTTTGCTACGACTTGTCACAAAACCCCATCCAGAGCAGCAGCGATGAGATCACTCTCTCCTTCAAGACCTGGCAGCGCAACGGGCTCATTCTGCACACCGGCAAGTCGGCCGATTATGTCAACCTGGCCCTGAAGGATGGCGCCGTCTCGTTGGTCATTAACCTGGGATCTGGGGCCTTCGAGGCCATCGTGGAGCCAGTCAATGGCAAGTTCAATGACAACGCATGGCATGACGTTAAGGTGACACGCAACCTGCGGCAGGTGACAATCTCTGTGGATGGCATCCTTACCACCACGGGCTACACGCAAGAGGACTACACCATGCTGGGCTCAGATGACTTCTTTTACGTGGGAGGGAGCCCCAGTACAGCTGATTTACCTGGCTCTCCAGTAAGCAACAACTTCATGGGCTGCCTCAAAGAGGTTGTTTATAAGAATAATGACATTCGTCTGGAGCTGTCTCGCTTGGCACGGATTGGCGATACTAAGATGAAGATCTACGGGGAAGTGAAGTTTGTATGTGAGAATGTGGCTACACTGGATCCCATCAGCTTTGAGACACCTGAGGCATATATTAGTCTTCCTAAATGGAATACCAAACGGATGGGTTCCATCTCATTTGATTTCCGAACCACTGAACCCAATGGACTGATCCTTTTCACCCATGGCAAGCCTCAGGAGAGGAAAGATGCCAGGAGCCAGAAAAATACCAAGGTAGACTTCTTTGCAGTTGAGCTTCTAGATGGGAACCTCTACTTGCTGCTGGACATGGGCTCAGGGACGATTAAGGTTAAGGCCACTCAGAAGAAAGCCAATGATGGGGAGTGGTATCATGTGGATATTCAACGAGATGGAAGATCAGGTACTATATCTGTGAACAGCAGGCGCACCCCGTTCACCGCTAGTGGGGAGAGCGAGATCCTTGATCTGGAAGGTGATATGTACCTTGGGGGGCTGCCTGAGAACCGGGCAGGACTCATCCTTCCCACCGAGCTCTGGACAGCAATGCTGAACTATGGCTACGTCGGCTGTATCCGAGACTTGTTCATTGATGGCCGAAGCAAGAACATCCGCCAGCTGGCAGAGGCACAGAACGCTGCAGGAGTCAAATCCTCCTGCTCCCGCCTGAGCACCAAGCAGTGCGACAGCTACCCCTGTAAGAACAACGCCGTCTGCAAGGACGGGTGG
AACCGCTTCATCTGTGACTGCACGGGCACCGGCTATTGGGGCAGGACATGTGAGCGAGAGGCTTCTATCTTGAGCTATGATGGCAGCATGTACATGAAGATCATCATGCCTATGGTCATGCATACAGAAGCAGAAGATGTGTCCTTTCGTTTCATGTCCCAGCGTGCTTATGGTCTGTTGATGGCAACCACCTCGCGAGACTCTGCTGACACCCTGCGCCTGGAGCTGGATGGAGGCCGTGTCAAACTTATGGTCAATTTAGACTGTATCAGGATAAACTGTAACGCCAGCAAGGGACCTGAAACACTTTATGCTGGGCAGAAACTCAACGACAACGAGTGGCACACTGTGCGGGTGGTACGGCGAGGAAAGAGCCTCAAGCTTATGGTGGATGATGATGTTGCTGAGGGTACGATGGTTGGTGATCACACTCGCTTGGAGTTCCACAACATCGAGACAGGGATAATGACAGAGAAACGATACATCTCTGTCATCCCCTCCAGCTTCATTGGCCACCTCCAGAGCCTCATGTTCAATGGGATGCTCTACATTGACCTCTGCAAGAATGGTGACATTGACTATTGTGAGCTGAAGGCACGCTTCGGTCTCCGCAACATCATAGCTGATCCTGTGACGTTCAAGACCAAGAGCAGCTACCTGAGCTTGGCCACTTTGCAGGCTTATACATCCATGCATCTCTTCTTTCAGTTCAAGACCACCTCAGCTGATGGTTTCATCCTCTTTAACAGTGGTGATGGCAATGACTTTATTGCAGTTGAACTAGTCAAGGGGTATATACACTATGTGTTTGACCTTGGAAATGGACCTAATGTTATCAAAGGCAACAGTGATCGTCCTCTTCATGACAACCAATGGCACAATGTTGTCATCACCAGAGACAACAGTAACACCCACAGTCTAAAAGTGGACACTAAGGTGGTCACTCAGGTTATCAATGGTGCCAAAAATCTGGATCTTAAAGGTGATCTCTACATTGCTGGTCTAGCTCAAGGCATGTATACCAACCTCCCAAAGCTAGTGGCCTCACGTGATGGATTTCAGGGCTGTTTAGCATCTGTGGACTTGAATGGGCGTCTTCCTGATCTGATCAACGACGCTCTGCACCGCAGTGGGCAGATTGAACGTGGATGTGAAGGACCAAGCACTACCTGCCAAGAAGATTCCTGTGCAAATCAGGGCATCTGTAATCAGCAATGGGAAGGCTTCACCTGTGACTGCTCCATGACTTCATATTCTGGGAGCCAGTGTAATGACCCTGGTGCCACATATATATTTGGGAAGAGTGGAGGTCTCATCCTGTACACCTGGCCAGCTAATGACAGACCGAGCACAAGGACAGACCGGCTTGCTGTGGGCTTCAGCACTACAGTGAAGGATGGCATCCTGGTTCGGATTGACAGTGCCCCTGGGCTTGGTGATTTTCTGCAGCTGCACATAGAGCAAGGCAAGATTGGTGTAGTCTTCAATATTGGCACAGTGGACATCTCTATTAAAGAGGAAAGCACACCTGTAAATGATGGCAAATACCACGTGGTACGTTTTACCAGGAATGGTGGCAATGCCACACTGCAGGTTGACAGCTGGCCAGTGAATGAACATTACCCAACAGGCAACACTGATAGTGAACGGTTCCAAATGGTTAAACAGAAAATCCCCTTCAAATATAACCGGCCCGTAGAGGAGTGGCTGCAGGAAAAAGGACGACAGCTAACGATCTTCAACACCCAGGCCCAAATTGCCATAGGAGGAAAGGACAGAGGGCGTCTCTTCCAAGGCCAACTCTCCGGTCTCTATTACAATGGCTTGAAAGTGCTGAACATGGCAGCGGAGAACAACCCCAACATTAAAATCAACGGCAGCGTCCGACTCGTTGGGGAAGTCCCTTCCATCTTGGGAACAACACCCACGACCTCTGTACCACCAGAAATGTCTACTACGGTCATGGAAACCACAACTACGATGGCCACGACTACAACCCG
AAAAAATCGTTCACCACCCAGCATCCAGCCTACAACAGATGACATAGTTTCATCAGCTGAATGTTCCAGTGATGATGAAGATTTCATTGACTGTGAGCCCAGTACAGCAAACCCCACAGAGCCGGGAATCAGACGGGTTCCGGGGGCCTCAGAGGTGGTCCGCGAGTCGAGCAGCACAACGGGGATGGTCGTCGGCATTGTGGCTGCTGCCGCCCTCTGCATCCTCATCCTCCTGTATGCCATGTACAAGTACAGGAACAGGGACGAGGGGTCCTATCAGGTGGACGAGACACGGAACTACATCAGCAACTCAGCCCAGAGCAACGGCACACTCGTGAAGGAGAAGCAGCAGAGCTCAAAGAGCGGCCACAAGAAGCAGAAAAACAAGGACAAAGAGTATTATGTGTAAAAAAAAAAAAAAAAAAAAAAAAAAAAAGAATATTTATATATAAATATATAAATACTTAATGAGATTTAACTGAAATAGCAGAAACATTGCAGCGAACAAGATTGGGAGATCTATCGTTTGTGGGAAAAAGTATTGGGAAAAAAAAATTCAGCAGTGACTGTTAATGTCTCAGTCATCGCTTGGAGTCAGCAAACTGCCCTAATGTATTATAAAGCACACTTAGAGTTCTGGAGATGGCGCGCACAGCTCTGCCCTGATAGTGAACTTGGACGTCTCCAAATCTCCTCCTCCGCTGAACTTTCTGCAAAGGTAGAAGACATCATGGCTTACTTGTTTCATACCTCCAAGTGAGTCTTTAACAATGTTCGTGATCCCTGACTGTATCAATAATTTTTCGGTTTACTTATTTAAAAAAAAAAAAAAA\n>LR784286.1 Phallusia mammillata mRNA for cytochrome P450 10-like (Cyp11b1-001 gene) \nGAGCAGATGAAATACCCACCATCAAGAAAGTGGCACCACAACCATTTAATTCAATTCCCACCCCAAGCACCTCTGCTCAAGTGAAGACCCTCCTAAAACTGTTAAGAAAAGATTTTAACATGGTAGAGCACATGTCCAAAAGACACCAGGAACTTGGACCAGTATACAAGGAGAACATTTTACCTGGAATTGCCGATGTAACTGTGTCTTGTTGTTCACCTGCTGACACAGAGGCTATGTTACGCTGTGATGGTAAATATCCTGTCCGTCCCCAACTTGGGCCACTGGAAAGTATTAGAAAAGAATTAAAATTGTACAAAGGCATTTCTGAGGCCAGTGGTGAAGAGTGGTACAAAGTGAGAAGTGTAGTGAACAACCATTTTCTACGAAATCGATCAGTGTGGTCATATGGAGAAAAGCATTTAAAGGTTTCTCGGGACTTTATGGAGTACATTGCCAAAAATTTGGATTCCAATAATGAGGTGCCTGATTTTGAAAATGCCCTAAAATATTGGTCTTTGGAAGCAGCAGGTGTATTCAGCCTAGACACAAGACTTGGTTTGTTTGACGATGAAGTGAATGAGACATCACTGGAATTAATTAAGGCAATGGATTTGTTTTTTGAAAACCTTTGCAAGCTAGTGTTTGGTGTTCAATTTTGGAAAACTTTTGAAACATTTACATACAAGGATTTAAAGAATTGTCAAAAGGAAATTTACAATGCGGTTTCTCTTCATCGGCAAGCAGTACAGCACAGCAGTAATGGAAAGGAAACAAATCAGCTCCAATCCTTTCTCAACAGCAGCCTGCTCACTGACAAATATGGTGATGGTAGACTTTCTATCTGGTGGAATAGAAACCACAGCAATGAGTTCAATTTTTCCTTTGTATCTCCTTGCAATACACCCTGAAAAACAGGATATTTTACGTCAAGAAATCAAAAAATACATTGGTGATTTTAGTATTGACAGTGGAAAGGTGCTTGCTGAAATGCCATACCTAAATGCTGTACTCAGGGAAACTCAACGTATTTTTCCTTTTGCACCTTTCTACAGTCGAAAATTCAAGAATGGCATTG
TTCTTTCAAACTATCAAGTTCCCCCAGACCAACTGGTTATTAGCTCAGCAAATGTTGTCAACAACAAAGACCCTGCATACTTTCACGAACCAGATTTATTTAAACCTGAACGATGGCTTGATCCTGCACAAAGAAAAAAGGCAGCATTTGCTACTGTAGGGTCGTTCGGGGCCGGTGCCAGAAAATGTCCTGGTAGGAAGTTTGCACTCCAAGAAATCCATTCTCTTATTCCACTCATATTAAGTCAGTACCGTATTGAATACCACTATAAACCAATTAGAGCCAAATTGCGACTTTTGAGCTATCCATCTGAGAAGCCAAGATTTACTTTTATACCCTTGGATGAGTAAGATCGA\n>XM_047789995.1 PREDICTED: Phacochoerus africanus uncharacterized LOC125132573 (LOC125132573), transcript variant X1, mRNA \nGGGATTGAACCCGGGCCATACCAGTGACCCAGGCCGCTGTGGTGACAGTGCCGGATCCTTAACCCACACGCCACAAGGGAACTCCCCGACTCTTCTCTACCACCTCCTTTTCTGTCTCCATTCCCATCTTCCCATCATCTCTGGGTCAGTAGCTCTCTTTCTGTCCCTGTCTCTCACTCACTGTCTCTCACCCCTTCTTTTATCTATTTCTTTCTCATTCATCAACGTTCTTTCCACACCCCTGTCCTTTTTGCTAAGTATTTCCCTGTGGGTCCCTCCTCCGCCCACCCCCATACCCAGGTGGAAGTTTTCAGCCAAATCAAAGGCAGGCAGGCCAGAAGAAGCCGAAAGGGACTCCTTCAGCACATACCGGGAGGGAGGCCGAGCGGGGGGATGTCTGGAAATCGTTACCCACCCCCTCACCACCCCCATCCGCCGCCGCCGAGGTGGGCTGAACTGGCAGAGGGAGGAGGTGGCCCAGAGCACTGGGACCCTATAGAAAAGGGGGATGTTTCTGGTGGATTCCCTGATGTTCTGGGTGACTCCGCCCTTCCTCACACTCTCTTCCTTTATTTCTGGGTCTCTGTCTCCCCTATCCTTGGGGGGGGGGGGTTCTCTGTATCTCAAACTCTCTATACTCTGAGTTTCTATTTTTCCCTGCCCTCCCCCCTTCCTGCTGTCCTCTTCCTCTAGCCACCCCCCCCCACCCCGTCTCGCTTTTTCTCTGAGTTTTTGTGCCTCTTTTGAGGTCTCTACTCATTCGTCTCTCAAAGTCCCAGTCCCTCAGTGCCTGGATCTCTTTCTCACTAGAGTGAGATCTAGCCATCCACATGCCTGCAGGCCCTGCAATTGGCTAGGCTCCGTGTGGGCGGGTTCTGTCACCCCGGGCAACGGCAACAACAAGCCGGCTTGTCCTAGGCTCTGGGGCGGGGCTGGGACCATGGCGGGTCGGACCCTAGCTCTGCGCTATGGTCCTCCGCAGTCCCCCGTCTCCGAGACCGAGGTGTCTGGATCCTGGCCCAACTGGCATCTCACCAGCAGTGGCGTCGCCCACCACTTCATCCCGCCTGTGCCCTTTCCCCCGCCCACTGTGCAGTGCACGGTCACAGAGCCCCTGCCCCCGGCCCCAAAACAGGATTTGCATATCTGGGCTTTCGACGAGGTCATCAGCAGATGGGAGACAACCTCGGGCTCAGCTTACACGCCCAAGACCCTCGGCGGGCCATACGCGCAGCCGAAGGCCCCAGAACCTGCGGACCCCACGCGGGCTGTGGGGATCAAGGATTTGGGGGAAAAACTCAGACACCAGGGCTGGCGCCTCCCTCGGATCACAAAGCACCAGTGCAGTGAGGCCAGGGCGCAGTACACCGGCTGGCCCGGCCTGGACGGGCCTACAACCTTCCATATCGGGCCCCAGCCCCCAGAGCTTGCGGACCACCACCGCGGGGGCCCTTCCCAGGCTCTCATCCCCTGGACGAAGAACCCCGAGCTGAGCGGCCGGCCTTTCGCAGCATCTG
ATCAGGGCATCCTGGACTGCCATCAGCTCTATATGACCACTTCCGCTCGGGACTTCCGAACCTACTCGAAGAAGGAGTTGTCAGGATACCCTCGCAAGGACTCGCTGACCTACTGGAGCTTCAAGGAGACGCCCCAGGCCTGGGGCCACGGCCCAAAGCAGCCGTCCTATCCGTATTCCTCTTGGCCACCCGGGCCGCCGAAAACCCGCGTGCCCCGCGCCCGCCCAGTGATGCCCGCCGTGCCGCACCGCGGGGCGCAGTCTCTGGCTCAGGAATCCTACGGCCCCCCGCTGCACCCACTCCGCCGGCTCGACCGTTTCTGCCCGCTGAAGCTCCCTTGGGGAGGCCCCCACTGCAAGCCCGTGTCAGGCATTTACACCGTGCCGCAAGCCTACGGCACCGAGAACTCCAACTACGGCAGCTTGAAGCCGGCGCTCGTCTGAGCGGGCGGGGCCGGC\n>XM_035987257.1 PREDICTED: Helianthus annuus cysteine protease RD19A-like (LOC110876098), mRNA \nTTTCTCACCACGTTAATGGCAGTTTGCAGATTACGAGTCTCTCATACGCTCCGACTTTCCTCTCACACAATCGTTGCAGCGGTTGTGTCTTTCTCTCTCATACGCTCCCCTAACTTCTCCCACTATAAAACTATCACCAATAACATCCTCTCCATTATACACCTTCATCTTCTCGAATTTTCTCTGATCTTCTCTCCCCTAATAAACCCAAATCAATAAACGGGTTTGTGTTTTCATGGTTCGCATTGCTGAAATTGGGATTCTAGGATTGAGATCTCGTCTCCGGTTTCCGGACGATGCTAGAAAAGCTCCGATTCTTCCAACGACTGATCTGCCGGAGGATTTTGATTGGAGAGATCATGGTGCAGTTACTGATGTCAAGGATCAGGGTTCGTATGGGTCGTGTTGGTCATTTAGTACGACTGCGGCGTTAGAAGGTGCAAATTTCATTGCTACAGGGAAGCTTCAAAGCCTTAGTGAACAACAACTTGATGATTGTGTCCATGAGGATTTCGGTGAAGGGTATAGGGGGAAACAGGTGGTGTTGGAGAATTTGAGGCAGCTTTGTGTTCACAGATTTGCTAATGAGACCAACAGGTGGTGTTAAAACACTACTACCCCAACTTGGGGATCGGAGTTGTTGTTACCTTTGTGGGATTTGTTTTTAAAGGGCATGATGGTCTTTTCAGCATTTATGTTCATAGTTCCGGTTTGTCTTCCAATTGGACAGAGCCAGAAGAGTCGGTTTTTTTTATGGCCGGAGAATTCCCAGCAAGGATGTCGAATGGGGGAAAGTAACCATGGTTGAAGCGGAGCGTCGGCTACTAGCTAACGCGCTACTCGATTTTTGAAACCAACGATTCGTTCTCCTCTCGGAGTCATGCATTCCGCTATTTAATTTCTCGACGATATACTCTTATTTAATCAACTCTAAACATAGTTATTTCGAGTCCTATGATTTGGCAGGACCAGTTGGCCGAGGGCGGTACAACTGGAAAATGCACCCGACGGTTAAATTTCATGAATGGCGAAAAGGGTCACAATGGTTTGAAATGAGCCGTGAGCTAGCAATTGAGGTGATATCTGACAAGACTTATTTTCCGGTCTTTATAGACTATTACAATGGTTCATGTTATGCAGACGAGCACTACTTGCCTACGTTTGGTACACTTAAATATGGGGAAATGAATTCAAACCAGACTTTGACTGACGATGTTCTCCTACAAACATGCAAAGTTCAACTTGGTGATTCATAAATAACCCCCCCCCCCCCCCCCGCCCAATAAATATAATCTACGTTTGGTTGTCATTGATAGTTTTTTTTAAATACTTTTGTAAACATGTAACATTGATAGATCTCATTTATCTTCATTTAATGGTTTTAGCAATT\n>XM_040865634.1 Pseudomassariella vexata 
uncharacterized protein (BCR38DRAFT_77744), mRNA \nCTGGGGCCCTTGGCAAGGGCTGGAGTGCCACTCGGAGATTTCCATGAGGCTGGGAGAGACCCTGAAAAACGCGAACGCGCTCGAGAACCTGGCCAATCATGGCAGACTGTCCCACCAAAAAAGCTATTCCCTTTTCGATTTGCCATCTGAATCGCACTTTTACATGCTCAACTATCTCCCACATCACGCCCCGGTGAGCTGAACAGCATGGCAACCCAAGACGCTGCGGGTATTCCTCTCACGCATGCCGCGGATGGAGTGGGCTACAAGCTGTTGGAGCTACCCTCGGAACTGCTGGCTCTTCTCGAATCCGAAAACCCCCCTGTGTTGACCTTAGAGTCGTCCACAACCTCAGCTGTCCTCAAACACGGTAGCCAGACTTGGTCTCTTCGGCAGAAGAACACATCCAATGCCCTCATGCTCCTGTCCCCTTGTGAGACTGCGGCGTCGTCTTCAGATATTCCTCAAGCCGGACTCAAGATTATATCCACAGTCCATGACATGGTGGAGCTTACCACCGAAGGCGCGTCCGGCGCTGCTCCTGTTGCCAGGGGAAAGTGGCATGAGATGTTTGCTCGAGGCAGGTGACAGACAAGAGAGAATATGGGCAAGTCAAGTACCGGTTTTTTCTTCAAATGGTAATTTGAATAAGTCTTGGTGCTGGTGTGCTTAATGGCAATGATCTTTTGCTGCTCAAGATTGTTCATGGATGAGCATGGATGG\n>XM_013015936.1 PREDICTED: Dipodomys ordii single-stranded DNA binding protein 2 (Ssbp2), transcript variant X1, mRNA \nTGTTCCCGGGGAGGCTGTGATGGGTTGACAGGTGCGTGACAGTGGGAGCTGCTCTCGGCACAAGCATGTACGGCAAAGGCAAGAGTAACAGCAGCGCCGTCCCGTCCGACAGCCAGGCCCGGGAGAAGTTAGCACTCTATGTATATGAATATCTGCTCCATGTAGGAGCTCAGAAATCGGCCCAAACATTTTTGTCAGAGATAAGATGGGAAAAAAACATCACATTGGGGGAACCACCGGGATTCTTACATTCTTGGTGGTGTGTATTTTGGGATCTCTACTGTGCAGCTCCAGAGAGACGGGAAACATGTGAACACTCAAGCGAAGCAAAAGCCTTCCATGATTATAGTGCTGCAGCAGCTCCCAGTCCAGTGCTAGGAAACATTCCCCCAGGAGATGGCATGCCAGTAGGTCCTGTACCACCAGGGTTCTTTCAGCCTTTTATGTCACCTCGTTACCCTGGAGGTCCACGGCCCCCACTGAGGATACCTAATCAGGCACTTGGAGGTGTCCCAGGAAGTCAGCCATTACTCCCCAGTGGAATGGACCCAACACGACAACAAGGACATCCAAATATGGGTGGCCCAATGCAGAGAATGACTCCTCCAAGAGGAATGGTGCCCTTAGGACCACAGAACTATGGAGGTGCAATGAGACCCCCACTGAATGCTTTAGGTGGCCCTGGAATGCCTGGAATGAACATGGGTCCAGGTGGCGGTAGACCCTGGCCAAACCCAACAAATGCCAATTCAATACCATACTCTTCAGCATCTCCTGGGAATTATGTAGGTCCTCCAGGAGGTGGAGGGCCACCAGGAACACCTATCATGCCTAGTCCAGCAGATTCAACCAACTCTGGAGACAACATGTATACTTTAATGAATGCAGTACCTCCTGGACCGAACAGACCTAATTTTCCAATGGGTCCTGGGTCAGATGGCCCCATGGGTGGCTTAGGAGGAATGGAGTCACATCACATGAATGGCTCTTTAGGCTCAGGAGATATGGACAGTATTTCCAAGAATTCTCCCAATAATATGAGCCTGAGTAATCAACCTGGCACTCCAAGGGATGATGGCGAAATGGGGGGAAATTTCTTAAATC
CTTTTCAGAGTGAGAGTTACTCCCCTAGCATGACAATGAGTGTGTGATCCTTTACGCGTCTCCTCATGAAAACCACAGTGAGTCAGCCCTTCACAGAACTACTACGGAAGAAAATTATTCATCACAGTGTACAGTAAAGGAATCTCAGTCACACCAAACCAACCTTTTTATTTCCTGCTCTCTCCCCTATTTTGTGAAGAAAGCGGGTCCAAACGTGATTCAAACAACTGTACGGAGTGGCACATTAGAATTGCCCTAATCTGAACTGCAAATAATTATCTGTGTATGTATATGTGTGGGAAGGAGATTGTATCGTATATGTGGATGTTATATGGACATATACGCATACATGCATTGACCCACAGGACATTGTAAAATATTATCACATGACATCTTAAGTAGAAATAGGTAGGGACTTTTATTCCATCCTTTTTTTCACGTTTACATTTTAATTATTAAAAGTTGCTCCTGTCCCCTCCCTGAACTATTTTGTGCTGTGTATATCACTGCTTTATATAAGTTATTTTTTAAGGTGAACTCAGATGTTATGGTTTTGTAAATGTCTGCAATCATGGATAGGAATAAAATCGCTTATTTGAGAGCTTTCATTAAATTGTGTCTGATGCAAGTTATCCTGTGAATCCTAAAGTGTACTGTCTCAAGTAATGGAAGAAAGTATGCCTTTATCCTTATGTCAAATCAAACAATTTCTTGGTTACCTTGAGTGAAAAGTATTTTTGTATTTTTTTTTGTTTGAGAAAAACACTTCAGATCAACAAAAGCTTAACTGGGGCTTCAACAGTATATTTCTGCAATAACTACTTTAAATGGAATTCTTGATTTGTTTGTCTTAGATGATACAAAAATCATTAATTAGCTCAAATTACCTAGATCACAGCAATAAAGTGACAGGGGTTGTCAT\n>XR_006051903.1 PREDICTED: Salvia splendens uncharacterized LOC121807657 (LOC121807657), transcript variant X48, ncRNA 
\nAATTAAAATTGCCTAGAAACCCTAAATTAAATTAAAAATATCCCTCTCCATCTCCCTTCCCAACGGCATCTCCATCTCCATATCTCAATTGGCAGAAATGACTCGTGTTTTCCCCACACCAAGAGTCATAGCCCTCGCAGATTTCACGCCGCCGGCCTGCTTGCCCGGAGAAGAAAGCCGAGGACTTGGCTGTCTCGGAGTTTGGTCCCCGCCGCGGCTGCTACTCGCCATCATCAGACGCCGTCGTCTCCTGCAGCAGGTCGCTGGTCCGGATTCGTGGGCAGCGTCACGTGGCTGCTGACTCGCGGCCTTGCCGCCGCTGCCAACTGCGCGAACCCATCGCCGTCCGCCCTCCCATCGTTTGATCCAGCTGAGCAAAGTGGTGACTTATCAAGATCCATGGGCATCCCAACTTTCAATCGAACTATGGCCTTCCTGAAATCCACACATATAGACTACAATGCCACGGGCTTATACTGGTGTTGGGAAATGAAGCTTTGGAAATCATAGAATATGCTTTTTCAAAAGATAGGTTGTGAAGACTTTTGACTTCAGCCTCACTGGTGCCTCTTCAAGATCTTGTAAATATGTCATGGATACTATGATGCAGACTTTTAAGAACAAGAGGCTTGCTTATGCAGTTAAAGAGAGTACTCTTGATAGTCTCATCATGGAACTATTGCTCCGGCTTTTGGATGATAGTAATCCCCAATGGATGATGGAAGTCAACTTTTAAGAGCTTTGAATGTTCTGATGTTAAAGATTCTGGATAACGTAGAATGTATTTCATCATTTCCTGTGCTTATATATCTGTCAAGACCTGGATCCATCAAGATGGCCATCTCCATCAAATGATCTCTTGAAATCAGGAACCAGAAGTTCTCTGATTTGGTTGTTAAATGTTTGATCATGCTCACAAAGGTTAAGGAGCCAAAACCAGAAGCTGTTCCTTAGGCTGTGGGTTCAGTACCCACTTAAGAGTGTAGCTGATGCACCTCAGGACCTTATCGATCCAGTTGATATATTAAAGCCTTTGGAGAAGTCTGGATTTTAGGAAGCGGTTAAAGCTTCAAAATGGTGGGAGAGGAAAGAGGCTGTTGCTGAACTAGCCGAACTTGCTTCAACCAAAAAGATTTCTCTTGGAGATTTTTCAGAAAGTTTGTCATACATTAAAGAAGGTTATCACGAATGTAAAGGTTACTGAAGGAAGGAAAAAAAGGAAAAAAAAAAGAAAACACATTGTTGTTGCAGCTGAAGCTATTCAAGCTCTGGGCAACCTTGGCATGAGAACCCTTCCTAAAAAAAGAAAAAAAAAAGAAAAAAAAGGAAAAAAAATGAAAAAAATAATTGCTGATGTATTTAAAGCTATTCAAGCACTGGGCAACTGTGCTAGAGATCCGAGAGCCCATTTTTCGGCCAATTGTTGCTTCTTATTTGCCTGTAAACCGCACCTCAGGACCTTATCGATCCAGTTGATATATTAAAGCCTCCTTTTTATAAGTTTGGATTTTGGGAAGCGGTGAAAGCTTCAAAATGGCATGAGAGGAAAGAAGCTGTTGCTGAACTAACCGAACTTGCTTCCACCAAAAAGATTTCTCTTGGAGATTTTTTCAGAAAGTTTGTAATACATTAAAGAAGGTTATCACGAATGTAAAGGTTACTGAAGGAAGGAAAAAAAGGAAAAAAAAAAGAAAAAAACATTGTTGTTGCAGCTGAAGCTATTCCAGCGCTCGGCAACCTTCCTAAGGGCATGAGAACCCTTCCTAAAAAAAGAAAAAAAAAGAAAAAAAGGAAAGTAAATGAAAAAAAGCAAAAAAAGGAAAAAAAGGAAAAAATAATTGCTGATGCATTTAAAGCTATTCAAGCACTGGGCAACTTTGCTGGGGATCCGAGAGCCCATTTTTCGGCCAGTTGTCGCTTCTTATTTGCCTGTAAACCGCACCTCAGGACCTTGTCGATCCAGTTGATATATTAAAGCCTCCTTAGGAGAAGTCTGGA
TTTTGGGAAGCGGTGATAGCTTCAAAATTGCGTGAGAGGAAAGAAGCTGTTGCTGAACTAACCGAACTTGCTTCCACCAAAAAGATTTCTCTTGGAGATTTTTTCAGAAAGTTTGTCATACATTAAAGAAGGTTATCAGGAATGTAAATGTTACTGAAGGAAGGAAAAAAAGGAAAAAACATTGTTGTCGCAGCTGAAGCTATTCAAGCGCTGGGCAACCTTCCTAAGGGACTGAGAACCCTTCTAAAAAAAAGAGAAAAAAGGAAAAAAAGGAAAAAAAGAAAAAAAGTAAAAAAAGGGAAAAAGAGAAAAAAAATAATTGCTACTGCGTATAAAGCTATTCAAGCATTGGGCAACGTTGCTAGACTTTTCAGAACAAGAGCCTTGCTTATGCAGTTAAGGAGTGTACTCTGATAGTCTCATCAATGAACTGTTTCTCTGGCTTTTGCATGATAGGCTTCCGGAGATGGATGATAGACGTCAAATTTTAACTGCTTTGAATGTTCTGATGTTAAAGATTCTGGATAACGCATAATATACGTCATCATTTCCTGTGCCTATAAATCTGTTAAGTCCTCTGGATCAATCAAGATGTCCATCTTCAGATCAGAAACTTAAAACCTAAAGTTCTCTGATTTGGTTTTTAACTGTTTGATCATGCTCTAAAGGAATCTGCAACTCCAAAGAAGGTTGTTAAAGTAACTTAACTGGTGGCATAGATGGACTTCCACGTGAAGATATAAGTGAAAAGGTCACCCCCACTTTGTTAAAAGGCTTATAGAGTTCTGATTGGAAGGTCCACTTGGAATCTATTGAAAATGTAACCAAAATTCTGGAAGAGGAGAACTGGAATTGGAAATCTATTTGGAGCTCTATAAGGGCGTCTACACGACAGTTCTAAAATTTGATAATTGCTACTTTGTCCACAGTTGGTGCTCTTCGGACTACAATGGGACATCCGGTTGAGAAGTCAAGCTAGCTCCTGTGAAGGCTTGATCATTTACACGAATGTAGCTCGTGCAAGGGATTCTTTCAGATTTTTCTGATGTCTTGAAATGCCTTGGTGACAACAAAAAGCATATGCATGAGTGTACATCTAGTACCTTAGATACTTGGCTTGAGTGTATATCTGGCCAATGTTGTCAAGTCACCACGTAGCCAAAGGTCGAGGTTCTAGGTTTTGTGGGAACCCAATTTATGTGCATCACTGATTCTGACCAACCATCTTAAGCTTTAATGAATTGAAGCTGCCTTTGTAAATGCTCCTCAGGACCTTATCGATCCAGTTTATATATTAAAGCCTTTGGAGAAGGCTGGATATTGGGAAGCGGTGAAAGCTTCAAAATGGTGGGAGAGGAAAGAGGCTGAACTAGCCGAACTTGCTTCAACCAAAAAGATTTCTCTTGGAGATTTTTTCAGAAAGTTTGTCATACATTAAAGAAGGTAATCACGAATGTAAATGTTACAGATGGAAAAAAAAGAAAAAAAACATTGTTGTTGCAGCTGAAGCTATTCAAGCGCTGGGCAACCTTGGCATGAGAACCCTTCCTTAAAAAAGAAAAAAAAAAGAAAAAAATGAAAAAAATAATTGCTGACGTATTTAAACCTATTCAAGCACTGGGCAACTGTGCTAGGGATCCGAGAGCCCATTTTTCGGCCAGTTGCTGCTTCTTATTTGCCTGTAAACCGCACCTCAAGACCTTATCGATCCAGTTGATATATTAAAGCCTCCTTAGGATAAGTCTGTATTTTGGGAAGCGGTGAAAGCTTCAAAATGGCATGAGAGGAAAGAAGCTGTTGCTGAACTAACCGAACTTGCTTCCACCAAAAAGATTTCTCTTGGAGATTTTTTCAGAAAGTTTGTCATACATTAAAGAAGGTTATCACGAATGTAAAGGTTGCTGAAGGAAGGAAAAAAAGGAAAAAAAAAGAAAAATACATTGTTGTTGCAGCTGTAGCTATTCAAGCGCAGGGCAACCTTCCTAAGGGTTGAGAACCCT
TCCTAAAAAAAGAAAAAAAAAAGAAAAAAGGAAAGAAAATGAAAAAAACAAAAAAGGAAAAAAAGGAAAAAATAATTGCTGATGCATTTAAAGCTATTCAAGCACTGGGCAACTTTGCTGGGGATCCGAGAGCCCATTTTTCGGCCAGTTGTCGCTTCTTATTTGCCTGTAAACCGATGTCTTCCCTATCAGCACCTCAGGACCTTGTCGATCCAGTTGATATATTAAAGCCTCCTTAGGAGAAGTCTGGATTTTGGTAAGCGGTGATAGCTTCAAAATGGCGTGAGAGAAAAGAAGCTGTTGCTGAACTAACCGAACTTGCTTCCACCAAAAAGATTTCTCTTGGAGATTTTTTCAGAAAGTTTGTCATACATTAAAGAAGGTTATCACCAATGTAAAGGTTACTGAAGGAAGGAAAAAAAGGAAAAAAAAAAGAAAAATACATTGTTGTTGCAGCTGAAGCTATTCAAGCGCAGGGCAACCTTCCTAAGGGTTGAGAACCCTTCCTAAAAAAAGAAAAAAAAAAAAAAAAAGGAAAGAAAATGAAAAAAACAAAAAAGGAAAAAAAGGAAAAAATAATTGCTGATGCATTTAAAGCTATTCAAGCACTGGGCAACTTTGCTGGGGATCCGAGAGCCCATTTTTCGGCCAGTTGTCGCTTCTTATTTGCCTGTAAACCGATGTCTTCCCTATCAGCACCTCAGGACCTTGTCGATCCAGTTGATATATTAAAGCCTCCTTGGGAGAAGTCTGGATTTTGGGAAGCGGTGATAGCTTCAAAATGGCGTGAGAGAAAAGAAGCTGTTGCTGAACTAACCGAACTTGCTTCCACCAAAAAGATTTCTCTTGGAGATTTTTTCAGAAAGTTTGTCATACATTAAAGAAGGTTATCAGGAATGTAAATGTTACTGAAAGAAGGAAAAAAAAGGAAAAAAAACATTGTTGTCGCAGCTGAAGCTATTCAAGCGCTGGGAAACCTTCCTAAGGGCCTGAGAAACCTTCTAAAAAAAGAGAAAAAAGGAATAAAAGGATAAAAAGAAAAAAAGTAAAAAAAGGGAAAAAGAGAAAAAAAATAATTGCTACAGCGTATAAAGCTATTCAAGCATTGGGCAACGTTGCTAGACTTTTCAGAACAAGAGCCTTGCTTATGCAGTTAAGGAGTGTACTCTGATAGTCTCATCAATGAACTATTTCTCTGGCTTTTGGATGATAGGCTTCCGGAGATGGATGATGGACGTCAAATTTTAACTGCTTTGAATGTTCTGATGTTAAAGATTCTGGATAACGCATAATATACGTCATCATTTCCTGTGTCTATAAATATGTTAAGACCTCTGGATCCATCAAGATGTCCATCTTCAGATCAGAAACCTAAAACCTAAAGTTCTCTGATTTGGTTTTTAACTGTTTGATCATGCTCTAAAGGAATCTGCAACTCCAAAGAAGGTTGTTAAAGTAACTTAACTGGTGGCATAGATGGACTTCCACGTGAAGATATAAGTGAAAAGGTCACCCCCACTTTGTTAAAAGGCTTATAGAGTTCTGATTGGAAGGTCCACTTGGAATCTATTGAAAATGTAACCAAAATTCTGGAAGAGGAGAACTGGAATTGGAAATCTATTTGGAGCTCTATAAGGGCGTCTACACGACAGTTCTAAAATTTGATAATTGCTACTTTGTCCACAGTTGGTGCTCTTCGGACTACAATGGGACATCCGGTTGAGAAGTCAAGCTAGGGGATTTTTTCAGATTTTTCAAATGTCTTGAAAAGCCTTGGTGACAACAAAAAGCATATGCATGAGTGTACATTGAGTACCTTAGATAATTGGCTTGAGTGTACATCTGGCCAATG\n>XM_013088457.2 PREDICTED: Aplysia californica ubiquitin carboxyl-terminal hydrolase 5 (LOC101848919), mRNA 
\nGAAGTAATTCTGTTGTACCGCTTCTCTCAGTTTCAACATGGAGTCCGGTCTGTCCGAACTAGCTAAGCGATTGCCCGGTATCAAAGCCCCTATAGGGGGTGAGAAAGTCTACAAGGATGAGTGTGCATACTCATTTGACAATCCGGAGAGCCCTGATGGTTTGTATGTTTGCATGAATTCCTTTCTTGGAATTGGAAAACGTCACCTACAGCAATACTATGAGAAAACTGGGAATGGGGTATTCTTGCACATCAGACGTTTAAGAAAAGAGGTGCCCAAAGATGAGACGGCTGAGGAGGAAAAGCCAACCAAGATGGCCATCGGAGTGGAAGGTGGCTTCCAAACAGATGAGAAAAGATTTGAGTTTGAGGAGAAAACGTCCATCACCATCTTGCCCCAGTGGCACGAGATCGCCTTCCCCAACCCACAGATCCCTGATCAGGCCCAGCTGTCAGCCACCATGATTATGATGGCAGAGGATGCAGCCAAACAGGAGGAGGCCGCGGCCATGGCGGGAACGTGGGAGGGGGAAAAACTGAGGGTGTCGAAACACGCGGAGAACCTGCTTCAGCTGCCAGTGGAGAAGAAGATCCCCCCGTCGGGCTGGAAGTGTGAAAAGTGTGATCTGACCTGTAACCTCTGGCTCAACCTGACGGACGGCTCCATCCTATGTGGCCGGAAGTTCTTCGATGGTTCGGGGGGCAACAACCACGCGCTGGAACATTACCGGGAGGTGGGCTACCCTCTGGCCGTCAAACTGGGCACCATCACGGGCACAACTGCAGATGTGTTCTCCTATGAAGAGGACGATATGGTGGAGGACCCATACCTGGCCAAACACTTGGCGCACTTCGGTATCAACATGGCCGCGCTGGAGAAGACAGACAAGACCATGACGGAACTGGAGATTGACATCAACCAGAAGATCGGGGAGTGGGATGTGATTCAGGAGGCCGGCAGCGTGCTCACCCCAGTCTACGGGCCTGGCTACACGGGCATGCGTAACCTAGGCAACAGCTGTTACATGAACTCGGTCATGCAGGTCCTCTTTACGCTGCCAGACTTTCAGAAACGGTACTTCAGTAACTGTGGACAGATTGTGTCCAACGCCCCCCAGAATCCTGTCTCTGACTTCAACACACAGATGACCAAGCTGGCAGATGGTCTCCTCTCTGGTGTATATTCCCAATCAGTAGATACCAAAGAGGCTTCAGAAGGGGATGCCAAGTACATTCCACCCCCCAGCGGAATCCGCCCTCAGATGTTCAAGACGTTGGTGGGCAAAGGTCACCCGGAGTTCTCCACCAAGAGACAGCAAGACGCGCAAGAGTACTTCCTACACATGGTCTCCGTTATACAGAAAAACAGCCGGGGCGGCGCGAATCCTTGTGAGTCGTTCCGGTTTGAGGTGGAAGAACGCGTTGCTTGTTCCTCCTCCCAGAGGGTTCGCTACACTCGCAGAGAGGACTTCTGTCTATCCCTGCCCGTGCCCATGGAGGCTGTGTCCAATAAAGAGGAAGTAAGGAAATACAACGAGTCCAAAGCTGCTGGGGCAACCATTGTTGACCCAAAGAGCATTGTGCGTCCAGTGATCGCGTTCTCCGAGTGTGTTCGAGCGTTCACAGAGGCAGAGACGGTGGAAGATTTCTACAGTTCTGCCATACAGGGCAAGACCACAGCTCTCAAAACGACGCGTCTTTCATCGTTTCCTGATTACCTGATGGTGCAGTTGAGGAAGTACACCGTCGGCGATGATTGGGTGCCGCGGAAACTGGATGTGTCGATCCAGGCTCCAGATGTACTTGACCTTTCCTCCCTGAGAGGTCGCGGTCTGCAGGCTGGGGAGGAAGAGCTGCCCCCAGGGGATTCCCCGCCAGAAGCCCCGGTGGAGATCCAGGAAGGCACGGTGACCCAGCTGGTGGACATGGGGTTCCCACGCGAGGCGTGTCGCAAAGCCGTGTACTTCACCAACAACACAGGCGTGGAGGCAGCCATGAA
CTGGGTCATGGAACATATGGACGACCCAGATTTTGCTGCTCCCTTTAACCCTGCCCCTGCGGGCGGAGGTGTGAAGGGAGGCGCGTTCGAGCCCAATCCAGAGGGACTGGCCATCCTCGTGTCCATGGGCTTCTCCTCAGAGCAGGCAACAGTGGCCCTCAAAGCAACCAGCAACAATGCGGAGCGAGCCGTAGACTGGATCTTCAGCCACCCGGACGAGCTGAGTCAGCCCATGGAGACGGAGGAGGCCAGCGCCCCGGTCACTGCCGCTAACTTTAAAGATGGGTCAGAGAAGTACCGACTGGTGGCCTTCATCAGCCACATGGGCACGTGCACCAGCGTGGGTCACTACGTGTGTCACATCCTGAAGGAAGGTCGCTGGGTCATCTACAACGACGAGAAGGTGGCACTGTCGGAGCAGCCGCCCAAGGACCTGGCCTATCTCTACCTGTACCAGCGCATGTAGGACATTGAGGGGGGGAGGTGAGAGTGTGTGAGGGAGGAGGACATTGAGGGGGAGAGGTGAGAGTGTGAGGGAG\n>EF220307.1 Uncultured alpha proteobacterium clone FB-2_C04 16S ribosomal RNA gene, partial sequence \nAGGGTACGGGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGTTACCGACGCTCAGGCGCGACAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGGATGCTAGCCGCTGGTAAGCATGCTTATCAGTGGCGCAGCTAACGCATTAAGCGTCCCGCCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGACGCAACGCGCAGAACCTTACCAGGGTTTGACATCCCGCGCTAAACTCAGAGATGGGTGGTCCCCGCAAGGGGCGCGGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCTCCTTTAGTTGCCATCATTTAGTTGGGCACTCTAAAGGGACCGCCGGCGACAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTACACCCTGGGCTACACACGTGCTACAATGGCGGTGACAGTGGGCAGCGACCACGCGAGTGGATGCGAATCCCAAAAAACCGTCCCAGTTCAGATTGCACTCTGCAACTCGAGTGCATGAAGGTGGAATCGCTAGTAATCGCAGAACAGCAGGCTGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTTGGTTCTACCTGAAGACGGTGCGCTAACCGCAAGGAGGCAGCCGGCCACGGTAGGGTCAGCGACTGGGGTGAAGTCGTAACAAGGTACCAATCCCGCGG\n>KU308505.1 Uncultured Alphaproteobacteria bacterium clone 0107 16S ribosomal RNA gene, partial sequence \nAATGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGAGATCTTCGGATCTAGTGGCGCACGGGTGAGTAACGCGTGGGAACCTACCTTTTAGTACGGGACAACGTTTGGAAACGAACGCTAATACCGTATACGCCCTCCGGGGAAAGGCTTGCCGCTAAAAGAGGGGCCCGCGTCTGATTAGCTTGTTGGTAAGGTAATGGCTTACCAAGG\n>FQ227369.1 Rattus norvegicus TL0AEA13YJ12 mRNA sequence 
\nCAAAATAGTTAAGATGTAGATCTCCTCTTTTACTGAAGTAATTTATAATTTCTGGCTTTTGGACTGACTGTCAGCCATCAAAGGTTTGAAATTAGACTTAGTTAAATGGTTCTTACCGTTGGAGCTCCCTGGCCTCCTAACCCAATTAATGAGCTCCGTGTTCACATAGATGATAGAGGACCAGTTGCTGAGGACACTGCTGTAGCGCATGCAGCAGCACCACATTAAGAGTCACATGGAGACAACATCACTAAATAGATACGAATCTTACGTAGAAATAAAGGGCAAGTGAGTCGAGCCCAGTGTCTGTTTTAACAGAAATGATCTGCTCTGCAGTAGTGGTATAGGTCTTTAATCTTAGCACTTGAGAGGCGGATTCAGGTGGACAGCCATGGCTACACAGAGAAACCCTGTCTCAGGAATGGAAAAAGTCAAACATCAAGGATGTTTCATGTGATTTTGGTATGTATTCAATTTTGGAACTCTCTTCTGGTGGTGTAACATACAGAGTTGACTTGGTTTTTTATTTTTGTTTTCTTGAAGAAAACAGGGTTTATCTGTGTAGCTCTGGCTGGCTTCTATCTATTGGATTAAAGGTGTTTCCACCTCTGTTCGACATCAGTTTGGTTTTAGGATGAGGCATATTAACATAATGTTTCACTGGGCTTTTTCGTTCCAATGGGAAATTAATAAAAACCTGTGGATAAGGGTTGGGGATTTAGCTCAGTGGTAGAGCGCTTGCCTAGGAAGTGCAAGGCCCTGGGTTCGGTCCCCAGCTTTGAAAAAAAAAAAAAAAACCTGTGGATAAGCAGCACAAGTCAGATTTGAGTAGTTTAAATATGACAAAAAGGACGCAAGACGGGTTGGACATAGTTAGGAATGAGAGATGGATATTTTAAAATGTTAGGAAATTCTCAAGGAATAAAATTACTTTAAAATTACTGATAACAATCAGACATTCTTTAGTATGATTCTCCTTTGATACTGTAAGCAAGCACAGAAGTTTAAGAAATAACATAAGGGGCTGGAGAGATGGCTCAGCAGTTAAGAGCACCCGACTGCTCTTCCAGAGGTCCTGAGTTCAAGTCCCAGCAACCGCATGGTGGCTCAACAACCATCTGTAAAGAGATCCAATGTCCTCTTCTGGTGTATCTGAAGATAGCTACAGTGTACTTATATATAATAAATGAATAAATCTTTTAAAAAAAAAAAAAAAAAAA\n>JX483172.1 Uncultured prokaryote clone Cluster11712 16S ribosomal RNA gene, partial sequence \nCGTCAAATCATCATGCCCTTTATGACCTGGGCTACACACGTAATACAATGGCGCTTAACAACGGGAGGCAAAATCGCGAGATGGAGCAAAACCCCAAAAAGCGTCTCAGTTCGGATCGCAGGCTGCAACCCGCCTGCGTGAAGTCGGAATTGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGGCCTT\n>XM_030995465.1 PREDICTED: Strongylocentrotus purpuratus uncharacterized LOC105441690 (LOC105441690), transcript variant X2, mRNA 
\nATAGCAATGGCTGTCGACGGCCTGGCGATTCAAACTATTTGGATGAACGTAGCTGCATTTTGTTCCCTGAGTGATCTTGGAAGATTACAGTCAACATGCAAATATCTCAACGCGATTCTTTCATGCAATTCAGTTTGCTGTGGCGCAGGGCCGAGTCCTCGCGGCACATCCGTTTGCGCTCGGCGTTGTCTACAGTAGTTCCTCTTCGCAGACTGAAGGCGTGTGATGCAAGGTTCCTGGATGCTGCAACAGATCACATGCTGCTTGGTGGCATAGCTCAGAAAGATAACAGTTTTGCTGAACTCTGGCCTTTCCTGGAGTCTGAGAAGAAGGCCTTCTACAACCATCGAATCGCGATGCTACTGAGGAAGGGGCGGAAGGGGAGAGAGAAATGCTTCTCACAGGTCTCAGGGTTGGAGTGTGGCATGCCGCTGCAGTTCTGCTCTCTGAACCTGCTGGGAAGCGGATGGAAAGTGCGGAAGAGGGTTCTGCAAGCCCTTGAGGACACCACCAATGCTGCCATCAAGATCGGTGGAATCAAGAACTCTGAGCTGAGGTGTAGCCTGCAGGAGTTATTCCGTCCAGGATTGATCAGAGACTTCTCTCAAGAAGCGGAGCCGATCTGTCTCCGAACCCCCATCAATATGATTCCAAAAGACCTGGAAATAGTCAAGGACCTCTTCTTTCGTGTCCTGGGATACACTTGCATCTTACCGTTCAACGTAGCATCCCATGTCAGCGACAACGCCAGAGCAGAGACATGCCTCATTATAGAGAGCTACGTCCATCACACTGTCATCACACCCATCATCGATGGCATTCTGTGCTCAGACCTGGTGAGATGCAAACCCATCGGCTTTGCTCATGTCCTGGATTATCTGGTTCTAAGTTTGGTAGTGAAGAACCCAAACCTCAGTAAGATCAGAGCGCCATCCCTCATGCTGAACACGAATCCTGAACGCATGACCCTTGCCCTTTCACCTGCTCGTGACCTAATGGCTGCCGTCCGTCCAGAAAACCCTTCAGAGTATGCCTACAATTCACAGCTTGGTGTTTTGCAGTCAGGTACTGCACTTCAGCTCAAAGAGAGCATCCTATGCGTCTTCCAAGGAATCGACTCGTGTAAGCGCTCAGAGTTCCTAGTCCTTCTGGCAACCGAGTACATGTACAAGTGCCTTGACCTTGTCTCCATGGTAACCGAACTCCTCGGCCAGTTTGACCTTCTCAACGTGCGGCGATTGGTGAGTCGCATCTTCTTCGTCGGGGAGAACACGCGGATCGGTAGCTTCCGGGAGAGGTTCGAGAGGGACCTGCGGGTGAGTCTCAACCGGTTGGGGGCGGTGTTCGGAGGAGAGTTTGCCAGGCAGCAGCGATGGCCGATACACTGCGTACACGCAGAGGTGGAGGACAGACCAAACTGTCTGTTTTCTGATACCTTCACCACCATGGACTATATCCTTCAAGGCCCTGATTTCTTCTGAATCTCCCTTTATTTCTTTTTTAATTATTTATTTGGTACTTTCAAGAAATATAACAATAAAACAATATAATCATGGTGTTTACAAAATTAGAATGACAACAATTATACAAATACAACTGTTTGTAGCAATATTCTAAGTGCAAAAGATGGCAGCCAGGGAAAAACAGAGCAAACTTAATTACTGTAACCGTAATGGTCTCTTTGCCAAACCAACTGATGCACTCAGATGGTGCCTCCTCCCCAATGAACACCCTATACAAAGGGTAGTTAATATGAGGATATGCAATTGACAACCATGAACAATACTTTCCAAATCACAATTTCTGCAGGATCTTCCTTTCAATGCACCCATTTGAGGCTTGCCTCTAAGGAACATGCATGTCTACATCCTATATAAAGAAAAGTCAGCAGAATCTGCAGTTTTACAAAATAGCACATATCTTTCAGGACCCTAATTTCTTTTAGGTCTCAAGGAACATGGATGTTTTGTCCTATCCAGCTGATAGAAGGGCTAATGT
GCAATTTACCGTCATCAATATATTCAAGGCCCAAATTTCTTTTGAATCTCTCTTTCAGTTCATTCATTTGAGCCTTGTTCCATAGGAACATGGAACATTTTTTTTATTATCTAAAATCCAAAGGATAGTTGAATAATTCAATTTACCTTCATGGGCTATATCTTTTAAGGTCCTAAACCTTTCCCAGCATTCATTCACCTATTCATCCACCCTTCCTTCCATCCATCTGTTAGTATCATATCCTTAATACCGGAGTTACATACTAGTTATATTTAAGAGGCCTAAATAACAAGATGTTACACAAAGGTTCTTCATTTACTGCATGTATTTCACTTTTACAAGTCTGCCACAAGGTAGCGCCATTTCACTATCAATATTGGGATATATTAATAATCTCATTACACCTTTCCTTCTTTAAAGAAGCATGTCATTATATAAACTAAAATAATACCAACAATGTTGCTCAGAATTAAGCAGTACTGAAACATTTGAGTATCTTATATAAACTTTCAAAACCTGTTCTTTGTATTGTAAATATGTACATGTATGTGTGTATTCCTAAAAAACCAGCTCACACATTTTGGATATAATAACAAGTGATTCAATTATCACTGAGGTATAAAGCTACTGAAGCGACTTCAACAAACTTATATTTAAAACTTAATATACACAGCAACTCCACAGATGAACTTCCTTAATTCTTACTTACTATTAAGCTGTTCTTTGTTCAGTTGAGTTTCTAATCTTTTAGATATGCTGGCTGTTTTGTCTGCCACTGACTTCTGCAGAATTGATCCGAGTTCTGCCCGGAGTTGTCACTACTCGATGTCGTGTTTGTTGGTGATGTGGTTGGAGATGTGTTTTGAGGATAGTCCGTTACGGAAGATTGTTGATCCACAACCAAGTCACTATTATCGTTGAACTGTTCATTTGATTTTCGATGTTCAGTTCTGATGGAGTACGACCGAATACCGACTTTCTTGAGTACAATGGCACTTTCCCAGGCCCTGGCATCCTTTTTCGGCTTGACTATTACGGTATCTCCAACTTTGAGTTCAAGCAGATCTTTGGCACTGCGGTTATAGTATTGTGCCTGCTTTTCGCGATTCTTCTCTTTTCGTTCATCAATGTCTGTTTGCAGCTATACGAGGGTCCATTGTCAGCTAGGACCGTTTCCGGGATTCGTCAAATTCCTCTGCAATCTAGTTATCACAGCTGGCGCATCCTTCTTCCCGGTCCCAGTAATCCGAAAAATAGTCCACTGTACATAGATAGTCATGGCCATCTAGCGCGAAAATGTCACATCCATTTTCTGCCATGGACGCGTTGGTAATTCATGGTGTATGAGGGTTTCCTTCCTTTGTGATGAAGCATATATGTTGCATGCTTCACACCACGATAAGTAGTCTTTCATGTCGGATGTCATATTCGGCCAATAGACACATTCCCTCGCTCTTTGTAGTGTGTTCTCGAGGCCTGTGTGACTGGCATGTAGTTTCTTGCGAATTTCACCTCTCATGTCCGTGAGGATGACACATCTCAGTACTTTGAACATGATACCGTTCGCGCTTGTTCGTGACGAATGCTGAAGAACGGTTTTGCCTCTGACGTACAAGCCTGGCTAGTGCTCGGCCATCCTGAAGCAATATAGTCCATCACTGCTTTCAGGGCTGTATCGCGTGCGGTAGATTGGCAGATCTCTTGTTGCGATATCTGAGATACGGGAATTGCATCAATAAGGTGAATACACTCGACCTCTTCTTCAATGCCTGATCTTTGAGGTCACTAGTTTTATTTCTGAAAAACTTGTTTTAATCGATTTAAAGATATTGGGTATTGTCGTAGTACGTGATGAGACAGTAAAGGAAGCCCAAGAGACATTTGTTAGTGTAACTGGTGCTTTATTTAAAAAACGTTAATTCTCGGTGTCCACACACAGAAATGAAATGTCTACAGCAAATAACCCACTGAAGCCCCCAACTACAGTCCGGCATCCTCAA
GGAAAGAAGGAAGACACCATGCAGCCATCAATCTACTCAGCAACACAAACTGCAAGTCCTCTTGCCCTCATAAAGACTGCCAAACAGTTGAACTAAAACGTTCACCAAAAGTAACTGCAAGTTTCTCTAGCACAGGCACAGCCAAAACATGCACTCTACCCTTGAACGTGACAAAATGTGCTTCAATACAAACATGTGTGTTAAGACATTAACGTGGGCGGTGTATTACAAAATCAATTACCCATCCGCGAAACCATGTGTAACATGTGTAGTGAACTAATTTGCATAATCCACCTGATCTTGATAGCAACTTCCACACAATCCTCAATTGGTACTTCAATGTCACGAACACCTCTTGGTACGCTCGAAAAAGGAAGACCGGGCTAGATTTCCGCTTTGTTGTATAAACCCAACAATATGCCAGTTGAGTAAATTTATTCAACCTGTAAGTAGAATAAAGATAAACATCTTCAGTATACATCACGCAAAATATATATGTATGCATTTACTCTGTTCATGCATAATTAAAAGCGTTAAATTGCAATCATTGGCGGATGCTGATCTGGGCCCCTGAATCTAGGAGCACATTTCCTTCTCTCTTTAGCTGGTCTGTTCAAGTAAACCTAGCATGGCTTCCATCCCTCTTACATGGGCTACTCCCACTGCATTGTTGTCCATACTGGGGTGTAAAAGCGGATGATGGAAGAACTTGCACGGTTGCCCTTTTTATGTCTCTGGACACTGTCTCCTTTTCTTACAAGTAGCCATCCGATGCTCTGTACCGGCTTGCCTTAAACAGCTATAACAAGCTCGGCTGCTCTTCACCAACTCCAATCTCTCTGCTGTAGACTTATCAAGGAAAGTTTTGCATTGATCAGTCCAGTGCCATCCTTACTCTTGCAGATCCAGCAGCGATAATCTTGCTGTCTTTCCTCAACTGTTGTGACCTGATTAACAGCGGATCTGGACTTGGAGGTTGAATCATTCCTCACTGGAGCAGATGATCCTTGAGGATTCTCTCCTCCCTGCATAAGACTTTCTCCTTGGCCACTCCTCCCAAATGATCGACTAAGGACGGGCCTTTGCAGCATCTTTCAGCTGGTAGTGCCGACAATAACTATCGAAGTTGTCCAGCCACCCCTGCAGAGACAGATCACCAGCAACCTGTGGAGAACCCTTAAACTTGCCCACCTTAACTGGTGGTGGCGCCTTCTGTACATTAAGTCCTTGCAGAACACTGATTAGTGTCTCTAATATCTGCACCACTGATACGGCCATCGTTACAAAGGCTGTAAAGGTACTAGTGGGACAAAACAGATAAGTTACAAGTTACTATACTAAAAGTACATAATAATAATACAAAACAAACAAAATACAATGATAAACAATTACATATCAGACATAACAAAAATTACAAATAAACCTACAAATTA\n>AK346643.1 Sus scrofa mRNA, clone:MLN010029B10, expressed in mesenteric lymph nodes 
\nTAGCTGAGACACTGCCATGTTTCTCATGTACTTAGAGAAAATTCACAAGGTTTTATTTTATTTCTTAGGTTTTGCAAATATACATATAGGGAAAAATGAAAATATAGAAAAATGTGAAACGTAACCAATTCTGTCTATATGGTGGGATGGGTTTTTTTTTTTTTTTTCAGAAACTAAGTTTACTGACAGGATTTTACTTTAATTTTAGTAAATATGACTAATTTAGAGGCGTTAATCCCTTATGAGGTCTTGGGATTCCTAAGTCATTGTGTTGGAAACTGTCTGGGAAAGACAAATAGTTAAGATACGTAACTAGGATCTCATGTTTTGGATTTGTACTGAATGACGTCAGAAGGAATGTGGTAACTGTAGTCTCTCCATATTTGAAGCCTGTCAGAAAAAGGAGAAATTATAGAATTTTGTTCATTCGTTTTAAATTTCAGGAGGCAGTGTCGGTCACTGGAACGGAGGACAGTGGTGAAGGCAGGTGTAAGTGAGGGAAGGAGGATGAGGAATGCCGTGAGTGGAAGGAGGCAGCCTGGCGTGGAGGTAGATTTTAGCTCATGTGAAGCGAGATTGCTTGCTGACCGGTACAGAATTATCCAAGGATTAAACTACTTGATGAAGTCATGAGCCTTTCCATCTCTACAATGGTTTTCTCTTTAAAATATAGGTTGCCGAAGGATCTAAAAATGTACGGCTAGGTTCCCTCATTGGGTTGCTAGTTGAAGAAGGAGAAGATTGGAAACATGTTGAAATTCCCAAAGACGTAGGTCCTCCGTCACCAGTTTCAAAACCATCAGTGCCTCCTCCCCCCTCACCACAACCACAGATTTCTACCCCTGTCAAAAAGGAACACACACCGGGAAAACTGCAGTGAGTATACTTACTTGAATGATGTTAAAAAAAAAAAAAAAAAAA\n>XM_010884186.4 PREDICTED: Esox lucius IQ motif and ubiquitin domain containing (iqub), transcript variant X3, mRNA 
\nGGGTGGGGGCGTATGAAAACGTTACGCCAGTGCTTCTTAGATCACATGGATGTTACCATGGGAGCGCCCAAACACTTGCAGCATTGAATCAAGTGAATGGTACTGTATGCATGCGGCACCAAAGACACGAGCTAACGTTAACGTTAGCCAGTTACCCATGTCCGAACATGATGCAGAAACTTCGGGGATCAAAACTGATGAGCAAAATGAAAAAGAAGACCCTTTGTACCACAGATTAACCGAAATAAGTGAGTCTCAGTTAGAAAGCAACGCGACAGAAGAACCACCTACAGATGTAAGTCTTACGTTACATTTACAAGATAGCGATGCTGGGGGAAAGATTGAAACACAAAATGTGATGATGGAGGAAGAGGTATGCAAGTCAACCTTTTTGACTGAGAATGGGAACTCGGTGGAGGCTACAGCTCCAGCAGACCCTCTGGAGGATAACAGGCAACAAGGAGCATTACCAAAGAAAGAGTCCTTCCCAAATGCTGTTGGGAACTCAACAGCCACTGTGAAGATCATGCTGATGCCAGAGGGACACATGATGACAATGGCCTTTGCCATTGGGCTCTCCATCAAAGAGTTGAAGTGTAACTTCTCAAATGAGCTAAAAGTACCAACAGAAGTCATACAAATATCTCTGAGTGGCAGAGTGATAGAGGACCACAGAAACCTGATAGAGCTGGGAGTGCAGCCTCATAGCACCGTCCAGTTGGAGATGACCTCCTCTGACCCTGACAACCACCCCATCCGTCCTATGAAGCCCCGGCAGGACTACAACATGCCTGACGTCCTCACTGTCCGAGTCCAGACAGACTCGGAGACAGACACATTCCAGGACGTTGTGGTCGAGGTTGAGAGGGTCACCCACAGGAAGGCTTTTCTGGGGGGCTACAGGCACAAGGCCACAGGGACGGAGTACCACCACGCTGCTGTACAGACTATAGCCAAGAAAAAACCAGACGGGGGGGTGGAGACTTTCAGCCGCGACACACAGACTGTGACGGTGAAGAGCCAGTCCCAGCAGTGCACCAACAGCACATCCACCCAGATGACCAGGATCGGCTGCTACGTATCCAACATGGAGGACAAGCTCATCTCCCCTGGGGCCTACGTCACCGCCGCCCAGTACCACGCCAAGAGACTGAGAGCTGTGATCACTCTGCAGACGCACACGCGGCGCTGGCAGGCAAAGCGGATGACTGACCAGCTGAGGGCCGACAGGGATCTGCGTCTGGCCTGGATGGAGCGAGATGGGTGTAGGAAGAGGAGGGAGAAAGAGGAGCAGATCAAGGCTGAGTACAACAGGAGGATGAACCCAGAGAGCAGGGATGACTTTGCACTGCTCTACAGCGCCCTGGAAAAGTGGAAGAAAGAGGAGTTGGAGCGAATCAATGCCACACTGGAAGGTGCTGAGAGGAAGGCTGCTCTGTGTGCGCTACTGGAACAGGAAACGCAGCTAATTGCATCCATTGGACGCCACCGAATAGCTGCTGGGGAGAGGAATTACCACAAGGCCGTTCAGGCCTTCCTTGAAAAGTGTGCTGCCCCTAAGAGGTGGTGTGCATTTGATGGGAAGATGACCCAAATGGAAACCCAGTACACCATCAGAGCCAAGAAGCTGAAAGAGCTGTACACCAGCATCAACCTGCACTACTTCAACCACGAGGAGAGGCTGGACGTGCTGCTAACACTTAAACACACCGTCAAGGAGCATGACTGCAAACTTACCCAGGACATTGTGGAGTTGATTGACAGAGAAGCAGACCTGCTGTTGAGGGGGGTGAAGAAGTCCAATCTGGAGGGGCTAAGGAAGAGAATTTCCACCCTCTTCCTCCAGTACATCAAAAGCCCTACCTTTAACCCTGAGGCGGCCAAACTACTGAAGGTCCCCCAGGACCCAGCTCAGCTGAGGAAAAACATCTACTTCTGCCGTAGCTGTTGCCGCCATTTGCAGTCCACTGACTTTACCCTGACGGTCAATGCCCGCCT
AGTGGGCCAGTGCCAAAGCTGTTCGGAGCTGGACAGCGAGGCCCGCGGCCGCGAGAACCTCTCCCACTACAAAACCATCCTCAGCAGGCTCCGCAAGTCAGAGGCCCAGAGGGACAAGGAGGCCAAGATTACCTTCCTGCTTCAGGAGCAGGATCTGAAGTACCTGGTAGATGTAGTGTGGGGGGCCCAGTCAGCACTCAGTGCGTGGAACGACATGCACGACCTGGTGATGGTGAGATGGGAGCGCATGTGGGAGTGGAGTCCCTGGAACTGCATTCTGCTCACCAAGGAAGAAGCTCCTGTTCATGACAAAGTGGAGGACAATGAGAAGGCCTACGGAGTGGTGTTTATTCAGAATGTCAAACAAAAACACACGCTGGCAAAGAAGTACTTCTCCCAGATTCCAGTCATGGCCAAATACCTCCAGGACGTGCACTCACAACAGGCCGCCCACGGAAACTTCTTGGTCGCCAAGCCCATCAACACGTTGACAGCCAAGGCCCTGCCTACAATTCCACAAGCCACTGGTGGAGAGGCTACCCAGTGAAGGCCTCCTTATCCACCTGCCTGCCTAACTGTCTGTCTCCCTCTTTCTCTATTCCTCATACTCTGTTGAATGTCAAATAAAAATAGTATTCTTGAGAGGTATTGAACTGGGTAGAAATGCAATTTTGAAATGGATGTGTAATAATTTTGTGATAAACGTGAAGATATTAAATGTAAAATA\n>XM_003665021.1 Thermothelomyces thermophilus ATCC 42464 uncharacterized protein (MYCTH_54167), partial mRNA \nATGGCCTCATCAGCTGCCGCTCATGGCTCCCGGCGTCCACCCACGAGACCAATAATCTCCGCAGACCGGAACCACCACCGCATCATCCAACTCGACGACTTCTCCTCTCACATCGCAAGTGCAGAACAACAACCACCGCCAGCAGGACCAGTATCGGCAGCAGCCAAATCCTCCTTCAAACACCTCTTCACATTCACCCCCGCACGGCACATACCCTTGGTCGCCCTCTCGTTCACCACCGCCGCCCTCGTCGCCGCCGGCCGCACTGCCTACGCCGTCCTCCTCGGCCGCATCTTCGACGTCGTCACCCGCTTCGGCACCGGCCTGCTCTCGCCCGCCGACTTCCTCGCCCAGATCTCCCAGTGGGCCGTCTGGTTGTGCGTCCTAGGCGCCGGCATGTGGGTCGTTTCGACCGTCGACGCCGCCGCCTGGGTCGTCGGCGGGGAGCTCAGGGCGCGGACGGCGAGGCGGGAGGTGTTTTGGCGGTTCCTGATGGGCAAGGAGGTGGGTTGGTTCGAGGCGCGGGAGGAAGGGGTTGGCGGGTTGACGGCCAGTGTTGCGACGCAAACGAGGGAACTGCAGACGGCCACATCCCAGACGCTTGGCTACATTGTCTGCGACGTGTTTGTGTTCGCCGCCTGCCTCGTCGTCGCGTTCGTCTACTCGTACAAGCTGACGCTTGTCATGCTGGCGACTGGTGTCCCCTCGGCCCTGATACTCTGGCGCATCAGCAGGTTCCTCGACCCGGCGATCGAGGCGCAGAAGAGAGAGCTCGCGCAGGCCGCTAAGTACGTCACCGCCGCCTCCACCGCCATAGACCTCGTCAAGGTGTACAACGCGGCCGACCACGAGGCGTTCAACTTCACTTCGGCAATCCGGAGGTCGGCGAGGTATTACTCGCGCCAAGCGATGTGCAACTGCGGGCAGATGGGCTACGTCAAGTTATGGATGATCACGTTGTTCGTGCTGGGCTTTTCATTTGCCGTCGTTCAAGTCAAAAATGGCGAGCTTAGTCCGGGCGATGCGTTGACCACCTTCTATGCCGCCCTTATCGCGTTCCAGTCGATCGAGATGCTCGGACCGCACTGGCTCGTATTGGCGAAGGGCATGGCCGCAGGACAGCTGCTTCGAGGACTGGTGGATGAGAGCGGCAGTGGTCA
ACTCGAGAGAACTGCTGGCTGTCTAAAGCCCTCTGGGTGTCGGGGAATCATCGAGATGAACAATGTTAGCTTTGCGTATCCGTCAAACTTTGCCAGGGCAGTCATACGGCCATCGAATCTTCGTTTCGAGCCTGGACGGCTCACCTTTGTCATTGGCAGAAGCGGCTCTGGTAAGAGCACCCTCGGCAGTCTCCTCGTGCGGTTCTACGAACCCCTCACCGGACAGATCATGCTGGATGACAACCCCATCACGGCATTCGATCTCAACTGGCTTCGACAAAACGTTACGCTTATCCAGCAATCCAGTTCGATCTTTGGTGACAGCTTCTTCAAAAACGTCGCCCTTGGCGCCATGGAACCAGACAATGTCCCCCTCGACGCCGTGCAAAGCGCTTGCTCCATGGCCCTCCTCCAGTCCACCATTTCCAGCCTACCCAACGGACTCGACACCACGATCGGTCCAGGCGGCTACGGCTTGAGTGGTGGACAGAGGCAGCGTCTAGCTCTTGCCCGAGCCAAATTACGCGATCCACCCGTTTTGATTCTTGACGAGATCACCAGCGGACTCGACCCCGTGAGCCGAAATCTGATCATGGAAGGCATTCGCGCGTGGAGAAAGGACAAGACAACAATCATCGTCACTCACGAGGTCGGCGACATTAAGGACGATGAGTATGTCTATGTCCTTGCAGATGGATCGGTGGCTCAAGAGGGTCTCAAGCGTGAGGTTGCCAAGGATGAGAGCGGCCTCTTTGCCTCGTTCGTTGCCTCTGCCGAGACTGCCTGTTCCGGCACTGACAGCGAGACTGAGAGCGAGACTGAGAGTGAATCCGATTCCTCTGACGACGGTCCTCTCCAGGAGTCCCAATATGCTAGGTCGCCCCGAGGTGCGCTCATCAGCAACCAAAGAATGCCTGTGGGCCTGTTCCAGCGCATCTCGCTAGGACCCCGAGCAACCATCGCACAGGAGTCCATCTGCCGATCCATCACTCACAAGATGGCCACGGATGATGAGCCTGTGACTGTCAACATCAGCCGCCCCTCTAGTATCCGGATCATAGCGCAGCAAGGATTAGCAGCTCAAAGAAGTAGGACTCTGAATGCACGCCAGGCTTTGCGGACCGATCTGGACCCGGAGCTCCAAGTGTCTCTCGACTCACTAGACCGTTTCTTTCTCGAGCACCTTGCCAAGCCCAGGGGCCGCGAGAGCCCATCTAAGGGGACCCAACTACCTTCACTCGCGGCCATTTTGAAGACTGTCTGGCCGACGCTGGACAGGACGGGCAAGGCTCAACTGATCGCTGGTATTGCTCTGTGTCTGGTTGTCGCAGGCAGCAACCCCGTCTTCTCCTTCTTCTTTGCCAATCTTATCGGACAATTCTGGAACATGGAGGGCCAAGAGAGCTCAGTCCCCAAGTGGGCTGGCCTCCTTGCCGCCATTGCTGCTATCGATGCGAGCGCTACCTTCTTTGGCTACTTCCTCATGGAACAAGTGGCCCAGAAATGGGTCAATAATCTGCGCGCAGAGGCGATCAAGCGCATCCTTAGACAGCCCAAATCGTGGTTCGACAGGGCAAACCATTCCCCGGCTCGCATCACCCAGTGCCTCGACCGCAACGCCGAGGAGATGCGCAAGCTTGCCGGCATGTTCGTGCCCCTCCTTTTGACCATCTCCACCATGATGCTCTCCTCGCTCATTTGGGCGCTGGTTGTCCGGTGGGACTTGACATTGGTGACGCTCGCCGGCGTGCCCGTGGTCATCGCAGCGGCGCGCGCCAACTCGCTGACGAGCGACAAGTGGGAGGCCGCCTGCGATCAAGCTGCTGCCGCGACCAACGCCATCTTCAGTGAGGCCTTGGCCAACATCAGAGTCGTGCGCGCCCTGACACTGGAGCGCTACTTTAGCAACAAATTCAGCCGCTCCGCAGCTGCCACCTACCATCTCGGGGTGAAGCGTGCAGGCTTCATCGGGTTCTTCTACGGCTTGCACCAGTCCATCG
TCTTCTTCCTGACCGCTCTCGTCTTCTTCTACGGTGCCAAGATACTCGGCGAAGAGGGTACCACCGTGACCGACGTCGTCAGGGTCATCAACCTCTTGCTCTTCTCGCTCGGCACCGCGGTTGCCATGCTGGGCAACGTCCCGCAGATCGCCGCCGCCAAGGCCACGGCGGTGCAGATGCTCTACTACGCCAACCTATCGCACGCCGCGAGCCACGAGTCTCGAGGCGAAAGGCGGCTCTTCACCCCGCTCCCCGTCCGCATGACGAACCTGCGATTCGCCTACCCCAGCGCGCCCCAGACCCAGGTCCTGCGCAACATCAACCTGCAGTTCGACGCCGGTACGTGCACAGCCATCGTGGGCGCCTCGGGCTGCGGCAAATCCACCATCGTGAGTCTACTCTTGCGGCTATACGACCCGCTGCAAGAAGAGACGGACCCGGCACGCGCAGCGCACCGAAGCGAATCCGGAGCCCCCATCTCCCCGACCCCGGAATCCCCTAGCACTCCCCGATGCCAACGCTCCTCCCCCTTCCCCTCTGCCACCGCCACCACCAACACCACCACCAACACCCCACCCCTGACCTACGCCTCTGTCCCCTCCTCCCACGTCCACACCCCTTCTCTGCGCGCCCGCATCGCCTACGTGCCGCAGACCCCGGTCCTCTTCCCAGGCACGGTGCGCGCCAACCTGACCTACGGGCTGCACGAGGGGTCGCCGCTGCGGGCGGAGGCCAACGTCGTCCTCGCCGCGCAGCAGGCCGGCATCCACCCGTTCGTCGCCTCGCTGCCGCAGGGGTACGACACGCCCCTCGGCGGCGACGGCGGCGGCGGCATTGGCGGCGGCATTGGCGGCGGGGGGCCGGCCGCCGTGTCGGGCGGGCAGGCGCAGCGGCTGTGCATCGCGCGCGCCCTCGCCCGCCGCCCGCGCCTGCTCGTGCTCGACGAGCCCACCAGCGCGCTGGACGCCGAGGCGGCCGCCGAGGTGAGGCGGCTCCTGCGCCGCCTGGTGGAGGGCGGGGGCATGGCGGTCGTCGTGGTGACGCACAGCAAGGAGATGATGCGGATGGCGGACCGGGTGGTGATGATTGAGGGAGGGGTCGTGGCGGAGCAGGGCGGGTACGACGAGCTGATGACGGCCCCGGGAGGCAAGTTCCGGGCGCTGGTCGAGGGCGGGGTCTGGACTGCCGGCGAGGGCGGTTATGCTGAGGAGATGGAAGGGAAGGGGAAGGGGAAGGGGAAGAGAAAGAAGAAGAAGGAGAAGAAGGAGAAGAGGGGTGCTGCCGGGTGGAGGGACGTGGAGAGGTCGAGGGAGGAAGCGCTTAGGCGACTGGAGGGTAAGTCGGACTAA\n>HM739632.1 Uncultured bacterium clone GB7N87002DK33B small subunit ribosomal RNA gene, partial sequence \nAGAATCAACGCTGGCGGCGTGCCTAACACATGCAAGTCGCACGAGAAAGGGGCTTCGGCCCTGAGTAAAGTGGCGCACGGGTGAGTAACACGTGACTAACCTACCCTCGAGTGGGGAATAACCTAGAGAAATCTGGGCTAATACCGCATAACACTTACGAGTCAAAGCAGCAATGCGCTTGAGGAGGGGGTCGCGGCAGATTAGTTAGTTGGCAGGGTAATGGCCTACCAAGACAATGATCTGTATCCGGCCTGAGAGGGCGCACGGACACACTGGAACTGAAACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGCGCAATGGGGGAAACCCTGACGCAGCAACGCCGCGTGGAGGATGAAGTCCCTTGGGACGTAAACTCCTTTCGATCGGGACGATAATGACGGTACCGGAAGAAGAAGTCCCGGCTAACTTCGACGCCAGCAGCCGC\n>XM_026799137.1 PREDICTED: Zonotrichia albicollis erythroblast 
NAD(P)(+)--arginine ADP-ribosyltransferase-like (LOC106630292), mRNA \nATGGCCATCAAGGTGGTGCCCCTGGACGTGGCCTGGGACTCCTTTGATGACCAGTACCAGGGCTGTGGCCCTGCCCTGAATGCAAAGTGGTCATCCCTCTACAACTCCAAGTCCCAGAAGAATCGTCCCTTTGCCTGGGGCCGTGGCTCTCATGGCCTACACATCCTGTACATGTACGGGGACTTCAATGCAGTCGTGTGCGCTGCCGGGCGCTCCCGCCAGGAATACCAGAACAACTTGTGCTTCAAAACGCTGCATTTCCTACTGACCCAGGCCCTGGTGACGCTGAGGCAGGGTCAGAACAGGCAGTGTCACCATGTGTTCTGGGGCATGCGTGATGTTCATTTCCAGGCATGGCAAGGCCAGAGCATCCGGTTTGGTCAATTCACATCGATGTGGCTGCGTAAAGAGATTGCTCTGCACTTTGGGACAGACACAATTTTCGAGGTGCACACGTGCCATGGCGTGGACATCCAGTGGTTCTCCATGTATCCAGGGGAGGAGGAGGTGCTGATCCCACCATATGAGACCTTTGAGGTCACCAAAGTCACCCAGAATGGGAAGAGGACATGGATCAGTCTCCGTTCTGCTGGGACTTTCAGCAAATATAACTGCGAGTGGCACTGA\n>XM_047886733.1 Psilocybe cubensis uncharacterized protein (JR316_0000919), partial mRNA \nATGTCGCTCGCTCGTCTCATTCCAAGGGCTACCACCGTCTCTCGCATTGTCCGAACTGCCCCAACTCTCCAAACCAGATGGGTGCCCCGCGCCATGTACTCTGCTGGCGGTCCCTTGTCCAAGGACGTCATCACATCCCGCGTTCTCGAGACATTGAAGGGATACGAGAAAATTGACCCGGCCAAGTTGACCACGTCCGCATCTTTCCACAAAGACTTGGGGCTCGACAGCTTGGATGCAGTGGAAGTGATGATGGCAGTTGAAGAGGAGTTCTCAATCGAGATCCCTGACGCTGAGGCTGACGAAATTACAACGGTCCAACAAGCCATCGACTATATCGCAAAATCTCCTGACGCTATTCTGGAGTCTCTTGACTTGAGAGATGATCGATGTGACGCGAGTTCCGTCAAATCATCTGCTTTAGCGGTCGCATGA\n>XM_023773741.1 Ramularia collo-cygni uncharacterized protein (RCC_08491), partial mRNA \nATGGCGGCCCCCGAAAAGACTCCCACATCCCCAGATGCCCACCGCGCGCTTCCAGACAAGAAAGCCGTGGAAGCGGCTGGCGAGCTTCTAATCAAAGACGAAAAGGGCAACGAGATTGCCTTTAAATCGCTCTACTCCGACAAGCCTGCCGATGAGAGACAACTCATTGTTTTCGTTCGACACTTTTTCTGCGGCTCCTGTGAACTCTACGCCCAAGCACTCGCACGGGATCTCCCCGTAGAGGCACTGGCAGCCAACAAAATCACACTCACAATCATCGGATGCGGAGAGCCCATTTGCATCGCTGATTGGCGAAAGCGAACGGGATGTCCTTATCCCCCCCACACGGAGCCCAAGCACCGACTACAAGACACATTGGGCCCCCCCAACCCCCCCAGAGCCATGCCCGATAAATTCCCCGAGTACCACTCCAAAAGCCTGTTCCAAGTAATCAAAGATTCCACATGGCATGCACTCTCCTCCGGACCTAAAAAGGCCTTGTCAGGCGGTCCCGCATCGCAGCAAGGAGGCGAGTGGCTTTTCCAGAATGGAGAGGTTAAATTCGTGCACCGTATGAGGAACTCGGCCGATCACGTCGACACCAAAGAGCTGAAAATGGTTCTTGAAATCAACGAGTAA\n>XM_048709217.1 PREDICTED: Triticum 
urartu serine/threonine-protein kinase Nek3-like (LOC125545316), mRNA \nTTACGAAAAAAGACCTACAACAAAAAATCACACGACTCGCACGCACGAGCGAGTGCCCTCCAGAGTGCGCTCGAGCGAGGCCTCCAGATCGCTTCGCCGCCGCCCTCGCACTCCCATCAGGCGACTCGCAATCCAGTCCTTCGTTACAACCCTCGCGCTCGCATCAAGGATCGAGGCCTCCAATGGCCGCCGCCGATCCCTTCGACGGCGCCGAACCACTTGAGGAGCCGCCGCCGATCCCCTTGAGGAGCCGTTCACCGATCCCCTTCAGGAGCTGGCGCTGATCCACGCCGCTGCCACCTATGCAGAACCCCAGGGCAGGGCGCTAGGAACCACCGACAAGAGCATACTCGCCCTCGTGGCCAGGGTCTCCGCGGTCGGCATCGGCGTCGGCGTCGTCTACGGCTCCATCAGGCTCGACATCCTCAAGGCTTGCTCAGAGGATAGTGCAAGGAGATGTCCCACAAGCACTGACAAATTGTCGACTAATTACCAATTGACATGGGTGCTTTGATTGCCGGTGCAAAATATCGAGGAGAATTTGAGGATAGGCTTAAAGAAGACGCAGATTCTGATGGACAGCTTGTCAGAGATGGCAAAGCTGTTCTATGCAGGGTACGCCTCTGAGCTAGCCGATGCGTACTGTATCCAGTGTTCTGTTGCATCCGGTGCGACCTCAAAGAATACCTTCTTCTACCTGGGCGTTGAGCGCCTCAGGGACGACGAGGTGCAGCGCCTGGGGCGGAAGCAGTTCAACTACACGATGATGAATTTTTGCAGAGAAGTTCAGTTGCTTTGCGTATGGATTTACCAACAGTTCTTTTGTGCAGTTGACACAATGGGCCATATGATTCTTGGCAGGGAAGAAGCTATTTGGGCTGAATCAGACGAGGTGCTGGAGCAGATTGGGAAGGGCTCCTTTGGCTCTGCGCTCCTAGTGAGGCACAAGGTTGAGAGGAAGAGGTATGTCTTGAAGAAGATCCGGCTCGCCTGTCAGACCGTCAGGTGCCGGCGATCTGCGCACCAAGAGATGGAGCTCATCGTCGCAAAAGTAAGGAGCCCTTACATCGTGGAATACAAAGATTCTTGGGTGGAGAAGGTGGGGTGCTATGTGTGCATCATGATTGGTTACTGCGGGGGAGGGGACATGCTAGAGGCCATTAAGAAGGCTAACGGCAACCATTTCTCGGAGGAGAAACTCTGTGTGTGGCTTGTGCAGCTCCTGATGGCGCTTGATTACTTGCATGCCAATCATATCCTTCATCGAGATGTCAAGTGTTCAAATATATTTCTTCCAAAGGACCAAAATATACGGATCGGCGATTTTGGGCTGGCTAAAGTGTTTACTTCTGATGATTTAGCTTTGTCGGTTGTAGGAACTCCCAGTTACATGTGCCCTGAACTTCTTCCTGACATTCCATATGGCTCCAAGTCCGACGTATGGTCGTTAGGATGCTGCATCTATGAGATGACTGCGCTGAAGCATGCATTCAAAGCATTTGATATGCAGACACTGATAAACAAGATTAACAAGTCTGTTGTCGCCCCTCTACCGACTATATATTCTGGCGCATTGTAA\n>XM_027425389.2 PREDICTED: Cricetulus griseus phosphate cytidylyltransferase 2, ethanolamine (Pcyt2), transcript variant X10, mRNA 
\nGCGTCGGGGGCGGGGCCGAGGCAGTGCGAGTCGCGGGAGCAGCCCCGGGCTTGCGGGGCCTGTGGTGCCATGATCCGGAACGGGCACGGGGAGGCCGGCGCGGCTGGGCGCAGGGGCCCGGTGGGCCAGCGCGCCGTGCGGGTGTGGTGCGATGGCTGCTATGACATGGTGCATTATGGTCACTCCAATCAGCTTCGCCAGGCACGTGCCATGGGGGACTACCTCATCGTGGGTGTGCACACTGATGATGACATCACGTTGACAGTAGATGGCCGAGATACCTACGAGGAAGTGAAGCAGGCTGGGAGGTACAGAGAGTGCAAACGCACCCAGGGTGTGTCCACCACAGACCTCGTGGGTCGAATGCTGCTAGTGACCAAGGCCCACCATAGCAGCCAGGAGATGTCCTCGGAGTATCGGGAATATGCTGACAGTTTTGGCAAGTGCCCCGGGGGGCAGAACCCCTGGACAGGGGTGTCCCAGTTTCTACAGACATCCCAGAAGATCATCCAGTTTGCTTCTGGGAAGGAGCCCCAGCCTGGGGAGACAGTCATCTACGTGGCCGGTGCCTTTGACCTGTTCCACATTGGGCACGTGGACTTCCTAGAGGAGGTGTACAAGCTGGCCAAGAGGCCCTACATCATCGCCGGCCTACACTTTGACCAGGAAGTAAACCGATACAAGGGCAAGAACTACCCCATCATGAACCTGCATGAGCGGACTCTGAGCGTGCTGGCTTGCCGGTATGTTTCAGAAGTGGTGATTGGGGCGCCATACTCGGTCACAGCAGAGCTCCTGGGTCACTTCAAGGTGGACCTCGTATGTCATGGGAAGACAGAAATTGTACCTGACAGGGATGGCTCTGACCCTTACCAGGAGCCCAAGAGGAGAGGAATCTTCCGGCAGATCGACAGTGGCAGCAACCTCACTACAGACCTGATCGTGCAAAGGATCATCAAGAACAGGTTGGAGTATGAAGCTCGGAATCAGAAGAAAGAAGCCAAGGAATTGGCCTTTCTGGAGGCCATGAGGCAGCAGGAGGCACAGCCTGCAGGGGACACTGCCTAGCTTCTGACCTGGAGGATGTTACTCAAGCCCTCGCCCTGTGCCCACCTCTTCTCGCCCCGCCCTGCCCTGCTGCTGTGTCTTGGTGTCAGCTCACACAATTCCAGAGGAAGCTGCCTTGCTGGAGGGTGAGCTGCCCAGAGAGGGTGGCTCACACAGTGAAGCAGCCCAGTGGACAGGATAAGCAGAGGGCACCTGTGACTGGAGGAGTATTGCTATGTGTCCTTGGCATCCACAGTTCCAACTGCCACTGCCCTAGTCTTGTCTGGGACACACCCCTCCCGCCTGACTGGAAGCTGCCCACCCAGCTTTGGTGAAAAGGTTCAGAGGTTCAGAGGGATGACTTTGGGGACCTCTTGTCCTGGGTCACCCTGCAAGTGGGTACCCTCTACTTTGGGGCACGTTCTAGCACCCCATTCCTGATTCCTAGAAGACGCACTTGCCCCGGTGGCTGGGCCAGCTTGACTGTTCTCTGCACAGACTTCTGGTCCTCATTTTGTACCTCAGTGGCTGCTGTAAATCTTTTTGGCACAACTGAATAAATCCTGGTGGGAAGTGCTCTGTGGGCTCCAAGCCCCCGAAGAAGCAGGAAA\n>XR_002678113.1 PREDICTED: Setaria italica uncharacterized LOC111257591 (LOC111257591), transcript variant X4, ncRNA 
\nCCGCACGCCCCCCGCCGTCTGGACGCCTCCCGTCGCTCTCGCTTGGGCCACCGCCGCCGCCAGCTCTTTCATGTCCGCCGCCGCCTCGTCCTAGTCCTCGTCCTCCTCCCTCCTTTCCAGTTCGCTGCCACCACCGCCGCCGCCGCTAGCCCTTTCCAGTCCGCCACCTCCTCCTCCTTGTCCTCCTCCTCCTCCCTCCTTTCCAGTTTGTGCCGAGCGGACTCTGCACCGCGGTGAGCTGTGCCGGATCCTCGCGGAGCTCTTCCCAAAGTACCCGATTCAGACGAGCGCAGACGGTGAGGACCAGGAGGAAATAGGTGCTGTTCTAGACCTGTAGGGCAGTTGGTGTGTCCTGACAAAAGTTAAACTACCTTGAGGTATATGATATGTTCCTATTAACATCTAAACTAGGGATCTGCACATAGAAATGAAAATAACTTGATTGGTTTGGAATACTCGATCATCATAGATAATGAAGTGAAACACGGAAATAATGGAATGTAATCTATTTTTCATTGTCTTGCTTCGTGTATGTCTCCTCGGCATCGGTAGCTTTGTATCCTGGACTTCCCTTCACTTTGTTCCAGGCATAGTTAACCAATGTGACAGCTAGCTTGAGCCTGAAATTAGTCATATCCTTCTGCACATAACAAATACAAATGCCTGTTAGCCTTAATGTAAGATGGGCATAGATTGGGTTGCTGAATTTATGTTGTTCAACTTACCTGTGTGAATAAGGAAGATAATTTGTTTCCGGTCCAAAGCTCCATGAATTTAACCGTGAATAGTCCACACGATGCACTGCGAGTTTATTTGTATTTACACAAGTTAGGAAGAACTAATTATGGGAACCCGAGTATATTGACAGGTGTTGATGTGCTTGTACTTGTCAGTCTGGATTGTCTTTTTGATGCATTCAATGACTGGCCATTCTTTGACTTGGGTGTCCTTCCACCTATGTTCTTTGATCAATTGCAGGTCTACAAGGCGTGTCATACGGTTCTGCAACCCTTGCAACTGAGTTCAATAGAATCATCAGTGGTTGAGGCTTGCCTATATGTGTCTCCATCGCCTGAAGCACGACATTTCTAGGTTCTACCACTGCCCTTGATTCCTGCAAGTTAGCAACGGCTGCAAATTATGGTAGTCGAGCTCGGAACTGAATGAAGGCAAGTGGTGGTATATGGAGCATTTCTCTTATTGATCCAAACAATGAGAATATCCAATAACACTTGGAACAATTCTCAGCTTGCAGAATACAATTGATCGCTACCTGAACCACACCAAAGGCACACCTACAAATGAAAAAGTTCACGAACCAGGTGTAGAGATGAGATTGAACTTACTGGATTGAATGGGAGAGATGTAATTGGATCAATTAGCGCAGGTGGTGCATGCTCCTTCTGTTGCGCAGGTGGTGTATGGTCCTGCTCTTGTGTGTCAGGATTGATGGGTGGCACCGAAGAAGTAGCTCCGTCCACATCCATGGTGGCTGAGTTGTCTGATGTGAAGCAAGATGGTAAACTGCCGCTGCCTGCTGCCTTCCTGCCGCTGCAGCTGCCAAGTTTGTTGTTCATGTGAGTCCGTGTGAAGCAAGATTGTTTTTATTATCTAACGTCAAGTGTTAGTTTAAATTAGGTGCTATGATATCCAAACGTGTAGAGTTTGTTTAAATTAGGCCTCACGTGAAGAGTTTGTTTAAATTAGGCCTCACGTGAAGAGTTTGTAAGCTAATACATGCCTCCAACGACGGGATAGCACAGTTTCCAACTAACGTTTTTCTGTCAATGCTTTCCAAGCAAATTACTGATACCTTGTCAATGCGACGGGATACTCTAA\n>XM_050703260.1 PREDICTED: Spodoptera frugiperda RNA binding protein fox-1 homolog 3 (LOC118266813), transcript variant X21, mRNA 
\nTCTAACCAATGCCCAGCATTGACTACTATTCTTAAATAAAAAATGTTGTTATTATGGCTTGGTTAGGTTGTGACCGAAAAGTTAAAATCATCTGTAATTTTGTGTAAAAGCAACGGCAACATTGTTTGTCACGTTTCGTCCGCCGAATCATGCCGACTGTATCTCCTATCCTTGTCTTTCTCACGGTGATCCGCACGGGCGAGGCGACTCGGTGAGTAGCCACGCGTGCTCGTACCCGTCCGTTGTTGCACATCGACATTAACCGCTTTCAGTGCTAGAGCGCGTTCCTCCGCGCTATACTCACATAACCTAAAAGTTAAACAATCCTGATAATTTTAGTACTATTCATTGTAAAACCATTAAATACTCATGATTACCTCGAATTTATAAGTTAGTGTTGTGGAAGTTTACGCCCAGCGAAAGGGCGTACGTGGAGTGTATTTTTGTGCAACACAAAGTAAATACAAACGGCAAGCTGTGGGGTTCAGGGGCCTTTTTTTTGCCGCCGCAGGGGATGTACTATCCTGTGAGTAACGGCAATGTCATCGATACAGGAACACCAACCTTGCTGCATATGGTGGGGACGGGTATGGCGACCCCGTTCCCGGCGGCGGCGGCGGCTGCGGCAGCCGCGGCACAGTTCGCAGCTAACGGCGACGCACTCGCCGGCGTGAAGGCTGAGGCTGCCGGTCCGACAGCTCCACCTCAACCCCCGCTCGTTAAGAGCGAAGGCCCGCCACCGCCCGCGCCTCTACCGCCCGCCAATTTCTCCCCTCAACCGCCTCCTCAACAAACACACACACAAAATTCAGTAGAAAATCAAAACAACAATAACAATACGCAAAGCGAAGGCGAAGCAAATGAAGAGAGCACACCAGTAAGTGTGGCGGCGGCGGTGGTGGCGCAGCAAGCCGCGGCCGTAGTGGCGCAGCAAGCGGCGGCGGCGCACGCGGCGGCCGCGGCCGTCAGCGCTGCCGTCGCTGCCGGCAATGTTAACGCTACCGGCACTCCTGAAAAACCGACACTCGTACCCGTCTCACAAGCGTCACAACCTAAACGATTACACGTCTCCAATATACCCTTCAGATTTAGGGACCCAGATCTTAGAAATATGTTTGGGCAATATGGCACGATTCTCGATGTAGAAATTATCTTCAACGAACGTGGTTCCAAGGGATTCGGTTTTGTAACATTCGCAAATAGTGGTGATGCGGAGCGAGCACGAGAGCGTCTTCACGGCACCGTGGTTGAGGGCAGAAAGATAGAGGTTAATAATGCGACAGCGAGAGTGCAGACAAAGAAACCTCCGACAGTTCCCAACGTGTGTGTCCAGTGGCCGGAAGGTGAGAACCTTCATTACGATTTTGCGCTGCGCCGCGAGCCGCGCGCCGCGCCGCACGCCGCCGCCGCCCCCGCCCCGCACGCCCCGCCCCAGCACGCGCTGTCGCACGCCGTGCTCAACCGCGCCGCCGCCTACGCCTCGCAGATGCACGCCTACGCGCCTGTATATTACGACCCGTTCTTAGCAGCCGCGGCGACGGCTGACTCCAACTACAGACTCCAGGCGGCAGCTGCAGCAGCAGCGGCAGCGGCGCCCCTGCTGAAGTCTCCGCTTACTTCGCCGCCGTCAGCGCCGCGCCCGCGCCCGCGCTCGCGCCGCTCGCTGCCACGTACGGCAGAGAATATGCAGATCCATATTTAGGCCATGGAATCGGACCAGTATCAGGATATGGGACTGCAGTGTACAGAAGTGGCTACAACAGATTTGCGCCATACTAGAAAGCCAGTGGATGGATACGATTGAACTCGAATACCTTCGTCACCTTCACCTTAACATGACAATGAACTCTCTTTGTAAACGTACAAACATAAATCATAAATTTAAGGATCAATAATAAACGCTAGCAGACTACCGTGTAAGTATCTAAGCTTGGGTAGCAAACTAACGAAGTAACGAGCGAGCGTGGAGTCGTGCAGTCGTCGAGTCGTCGAGTCGTC
GGCGTCCACAACTTATGAAATACCAAAGTCATTAAAATTTCTAACAGAATACTTTATAAGTTGAACTTAATGTAAATTATTGTGTACCTAATGCTATACAAGTGCGAGCAGCTAAAGTGATTGCTTTCGTTCTATTTAGATATTCTAGGAGTTACTATAATTTTAACAGAAGTGAATTCATCTTACGATCATACGTACCGTACTGTCTAGTGTAGATGTTACACTTTGTTCATCGTGGACAATAGAAGAAATATTTACTATATTGTAATGATATATTTAGTGAGCTTTGCACTTGCATATCATAAAATTGTAAATACTTGTTTGGAAACATTTAATTCGGTCTTGATATTTTATTTTTAAATTCAAAATTGCCAAATGGTGTTTCCTGAATACATTTTCAGCGATCTTATTCTAAATAATAATATACTCGTTAACGTTAAATGGTCTCCATTTTTAATTATTAAATAGAATAAATTCGATTTGTAAACGCGAATTAGTTGGCGTTGCGGTTTATACCTAATATATCAATTTTAGTAAAATCGCCGTTATTATCTTGTAGACATGTATGTACGCAGAGACAATAGAAATCTCAAATCAACTATTTTGGAGTAAATACGTTATTTGGTGCGATATCAATGTGGTGCCATTTATTTGGTTGTTATTTTTACATCGTATTATATATTTTCTAAAGTTACCTTGTACTCTATACAGTTTATGTGACCTAGTTGTAGGCTGTCCCTCGGAGAACGCGACCAACGTCTCGGGTGTGCAATGCTCTGCCTCGCGTCGCTCCGCTTGAAGCGTGTCTCTTGAACTTTTGGCAGTGAACGCGAGGAGAGCACTTGTATACGTGTGTTGTTAGTCGGTAGAACTAATATGGCGTCGTTTCGGTTTGTACATTTCGCTTGAAGCTTACGTTGTCGACAGTCCCCGTTCCTTCCGTCAGCGCTGTGTCGCAGTCTGAGCCAGGCGTTTTCTCGTGTTCCTGGTTACTTGTAAATCGGTTGCTAGTTTATAAATAAGCTAATGTTTTACAGAGTGTAGGCGAAACGCTTTAGCTGTAGTCTATAAGGAAGAAGGGAACTCCGTCGAGTTCTTACATATCATTGAGATTTTCTCCTTGTATGTAGTTACGTTTATTCAATAATTATTCTATTGTCTTTTAACGATGTCTTATTTTTACAATGCTATTTAATATTTTTGTCTGGCGTACGGACTTTCATTTTTATAGAACAAACACGCATACGGGTCCAACCCTTTTAGAAGTTGTAAATTTTAGATCTAACATTTGCATTAGGATTTTAAAGTATTGTAACATCTATGAATTCGCTCAACGTTTATACCAAAGCACAAAAACCCATCGATTCATACGTATTCGGAGAAGTGTTTCATGACATTAACCCCTTTTCGATAGATTTAATAGTCTTTCAATGAGAAAAACTTGGGAAATCTATAAGTCGTGGTGTAGATAGATGATAACTAGAACAAAACTACAGACTTTATTTTTTACTTCATTTGTTGAAAGTTTTCATTAATCCTAAGTAATTTTTTTCTAAGGACATATCTACATGTTTGCCATCTAGAGTAGTTTAATCTTAACGTAGTTCAATGACTATATACATACATAAAATATAGATCTGAATTAAATCATAGTTGATTGTCAATCTTCTCATGTTATTGTAAATTCCTAAGGAATATAGTACACATTGTGTTACAGATGTGTCTGTATGAGAGGTTGCGTCGACGTCGACGTATTAGAGCTTTGTCAGTTTATTTTTCAAACCTTTACGTAGCAAGTAGAGATAGAGTACCGAATACGTTGGGCTGGTGCAGGGGCGCATGGCTCTCGTCACTGCTCGGTGTCGTCTGATGATGATAGCTTTAATTAATTAAAGGTGTTAAGGTGATGTTCTCACCCAGTTGTGTCATCTTGTAACCACAATTAGAATAACTAACTCAAGTAGCATTTCCATGACATTATTATTATTATTTGTCTTGCA
GAATTCTAGTCTTCGCGCACAATCTTTTATTAAAATAATAAATAAATAGTAAAGGTGCTTACTCGTAAAGGTTTCATGTGATATTTACGGAATTAGTTGTCGAATCTTTGTCTCGATTTTTATTCTATTATTTCCGTACGATATGTAATAAGCAGTTCGTGTCATATTTTCCTTTTACTGATTATTTTTATAATTATTACTCTCGCCTTTTAGTGCCACTGGCTTTTATATAATAAGTTATATTTACTTTATCGTACGTTATTGTAGTCTCGTTGCAGCTTCGAACAATATTTTGTGCTTTACTGCTGAATACTCATGCGTGGATGCGTTATTTTAAGTAATTCTTAGGTTTGTAGGAATTGTCTGATTAATGCAAGATTTTGTATCTGAGTACAGAAACAAGTACATGTGATTCTATTTGATGATTTTATTGTTTAGTTTTAGTATTTTGTATCAATTAAAGTCACAAATATTTGTGAGTGTTATATTTTTAAATCATCATATTTTATAACAAGTTAACAGGACTTTATTTGGAAATACAATAATTACTTACGAACTTTGATATTAAAAATTCGATCAAATTCTGACCAAATCTCGTCTTGTTTACTTGGAATTTTAAAATGTACCTACATAATTTTTGATTATGTTATCTTTATAGTCTTTATGTATGATTTTAATGATAATTAAATAAATCACAAAAGCAAAATACCTAAGTTTTGTATAAAGTTACATAATATAAGCCAAATTGTTGTTACTTGGAGAATAATCAGAATTTAAATTACATATCTGACAAAATGGTTAGTGTGCTACAATAAGATTGAAAAAAAAATAACATCAAGAACAATGTATTATAAATATTATAATCATTAAATTAAGGATATGTATTTTGTAACGCAGTTTGTTTCTCAGTTTTTATGAGATGTTAAATTAAAGTTTCATACTACTCTTGTTTCATGCTGTGCACAACTTATACGATCGTCGGCTTCGATATTGTATTCATTAGATAAAGCGAATTGTTATATTGTGCATAATAAATCATATCAGTAGTGGTGTTAGCTAGTTGCGAGCCGGCGGCAGCGTCCACTGTACATAGGTATACTTAGTGTTACCGGCGGCCGTATTACTGTGCCCTCGGGTCATATTGTTAAAGTAGCCAGAGTTGATAAGTATCACTTGTTCGTCAATTGCACTCGTCAAAGCTGTTCAGTTGGTGTTGTAGGTTATTCAGATATTAGCGGGGTTATTGTTAGCTCCTGCGTGGCAAACTCGCAACTTGTGGCCGTGCATGACACTCATTTTATTGCACGACATCGCCACACGGCACGTCTACAAATTGCTGGTTTGTTTGCGATTAACCCCAAAACATTTAGATGGTGTAACGCATACTGACTATGGGATCGATTAGTTGCTGGTCTACTATCCGGAACGTAAATAAGTTTAACGTTCTAAGATCCATATTATCACTGTTAACTTAATTATAGCTATCGTTTGTAATTACTATTTGTTATGCATTACTTTTGAAGTTGCTTGTAGTGATCAAAGCAGTCAGTATGCGTTGCAGCTGCATTGTGGGCTAGTATGCGCGTGCGCATAGTTTCCGAGCTAGTCTCGAGCACACTTGCAGCCGGCCAGTATTTGAAATACTATTACAATACCGTGCTCAATTCCTGTATCTGTACATTGTAAGTATAATGTTGACAAAATGTTTTTGAAGTTTAATGTAAACTACATACAATAGGTTTGTTACATAATGAATGTCTTCCGTTTGGCACATTTTATAGATATACCTACTTTGCACATTTTATTAAAGCACGGATCTACATAGGAATACTAGTTCAATATTATTTAACAGAGATATTTTCAAGCCAAGTGCACAGCGAGCCCCTCATATACAATTTGTGATACCTAAAGTGAAATACGATTTTCCTTTTTTTTTGTGTGGCAATTTTTAATGGATTGCAAAGCTGATTTTCTCTTTTGAATTGTAAATATTTTTTTCT
AATGAAAAATATTAAATGAAGTGAATCATTTTAAAGCCTTTGGCATTGTGTACTCATTTACGTTATAAATAAATTATAGTATAAAA\n>XM_050906876.1 PREDICTED: Gymnogyps californianus immunoglobulin lambda-1 light chain-like (LOC127022987), mRNA \nATCGCGCCATGGCCTGGGCCCCTCTCCTCCTCGCGGTGCTCGCCCACAGCTCAGGTTCCCTGGTCCAGGCAGCGGTGACTCAGCCGGCCTCGGTGTCAGCGAACCCGGGACAAACCGTCCAGATCACCTGCTCCGGAAGCAGCTATGGTGTTGGCTGGTACCAGCAGAAGGTTCCTGGCAGTGCCCCTGTCACTGTGATCTACAACAACGACAAGAGACCCTCGGGCATCCCTTCACGATTCTCCGGGTCCAAGTCCGGCTCCACTGGCACATTAACCATCACTGGAGTCCAAGCCGAGGACGAGGCTGTCTATTTCTGTGGTGGCTACGACAGCAGCATGTGTGGTGTATTCGGGGCCGGGACCATGTTGACCGTCCTAGATCAGCCCAAGGTCTCCCCCACCGTCCACCTCTTCCCACCATCCTCCGATGAGCTCTCGGCACAGGGCAAAGCCACCCTGGTGTGTCTGCTGGGAGACTTCTACCCCGGCGCCGTGCAGGTGGCCTGGACGGCCGATGGCCGTACCCTCAGCAGTGGCATCGAGACTGGCCAGCCCCAGCGGCAGACCAACAGCAAGTACATGGCCAGCAGCTACCTGACGCTGAGTGCCGCCGAATGGAAGAGCCACGAGACCTACACCTGCAAGGTCACGCACGAGGCCGGCAACGTGGATAAGAGCCTGAATAGATCCCAGTGTTCCTAACCCTGCTGGGACCTCCCCGCACCCGGCAGCCCCTTGCCGGCCCCTTGCCGGCGCCCTCCCTCTTCCCCGCTGCTGGGGGCAGCGGCTCCCCCCCCACCGCAGATGTCTCTCCCCATGTCCCCCTGTCCCCTGCTCCTGTCCCCCCGCCCTGAGTGTCACACGAATAAACACCGACACTGAACTAG\n>JF646645.1 Uncultured bacterium clone GDIC2IK01BM6IP 16S ribosomal RNA gene, partial sequence \nGATCCTGGCTCAGGATGAACGCTAGCTACAGGCTAACACATGCAAGTCGAGGGGCATCATGTTGGTGCTGCAACCAATGATGGCGACCGGCGCACGGGTGAGTAACGCGTATCCAACCTTCCCCTTAGTAGGGGATAGCCCGGCGAAAGTCGGATTAATACTCTATGTTCTTCAATGCGGACATCTAAGTTGAAGCAAAGATTTATCGCTAAGGGATGGGGATGCGTCTGATTAGGTTGCAGGCGGGGTAACGGCCCACCTGGCCTACGATCAGTAGGGGTTCTGAGAGGAAGGTCCCCCACACTGGTACTGAGACACGGACCAGACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGGCGCGAGCCTGAACCAGCCAAGTAGCGTGCAAGGACGACTGCCCTATGGGTTGTAAACTGCTTTTATCAGGGAATAAAGTGAGGCACGCGTGCCTTTTTGTATGTACCTGATGAATAAGGACCGGCTAATTCCGTGCCAGCAGCGGC\n>GU634984.1 Uncultured bacterium clone HF9475 16S ribosomal RNA gene, partial sequence 
\nATTGAACGCTGGCGGCATGCTTTACACATGCAAGTCGAACGGCAGCACAGGGAGCTTGCTCCCGGGTGGCGAGTGGCGCACGGGGTGAGTAATACATCGGAACGTGTCCTGTTGTGGGGGATAACTGCTCGAAAGGGTGGCTAATACCGCATGAGACCTGAGGGTGAAAGCGGGGGATCGCAAGACCTCGCGCAATTGGAGCGGCCGATGCCCGATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCGACGATCGGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGGACAATGGGGGCAACCCTGATCCAGCCATGCCGCGTCGCAGGGATGAAGGCC\n>MG192940.1 Homo sapiens isolate HD19_NN14_F4 T cell receptor beta mRNA, partial cds \nGTTGTCTCCAGATCCAAGACAGAGAATTTCCCCCTCACTCTGGAGTCAGCTACCCGCTCCCAGACATCTGTGTATTTCTGCGCCAGTGGGAGAGGACAGGGGATCTACGAGCAGTACTTCGGGCCGGGCACCAGGCTCACGGTCACAG\n>NM_001252006.1 Homo sapiens poly(A) polymerase alpha (PAPOLA), transcript variant 2, mRNA \nAGTTCTAGAACGTTGCTGTGGTAGCGCTCGGGCGCCATGTTAGGACGAAGGGGAAGGAGGAGAAGCGCTTAAAGCGGCGGGAGCGGTGCGGGAGAGGGGTTGGACCCAGGGCTGAGGCAGGCCCCCCCCTCCCTCCCGCCTCAGTGGATCATGCCCAGGGCGGCAGCGGCGGCGGTTGCGGGGGGGAAGTGACTGGGCGGTGCCGGCGCCGGAGACGATGCCGTTTCCAGTTACAACACAGGGATCACAACAAACACAACCGCCACAGAAGCACTATGGCATTACTTCTCCTATCAGCTTAGCAGCCCCCAAGGAGACTGACTGCGTACTTACACAGAAACTAATTGAGACATTGAAACCCTTTGGGGTTTTTGAAGAGGAAGAGGAACTGCAGCGCAGGATTTTAATTTTGGGAAAACTAAATAACCTGGTAAAAGAGTGGATACGAGAAATCAGTGAAAGCAAGAATCTTCCACAATCTGTAATTGAAAATGTTGGAGGAAAAATTTTTACATTTGGATCTTACAGATTAGGAGTGCATACAAAAGGTGCTGATATTGATGCGTTGTGTGTTGCACCAAGACATGTTGATCGAAGTGACTTTTTCACCTCATTCTATGATAAGTTGAAATTACAGGAAGAAGTAAAAGATTTAAGAGCTGTTGAAGAGGCATTCGTACCAGTTATTAAACTCTGTTTTGATGGGATAGAGATTGATATTTTGTTTGCAAGATTAGCACTGCAGACAATTCCTGAAGATTTGGATCTACGAGATGACAGTCTGCTAAAAAATTTAGATATAAGATGTATAAGAAGTCTTAACGGTTGCAGGGTAACCGATGAAATTTTACATCTAGTACCAAACATTGACAACTTCAGGTTAACTCTGAGAGCTATCAAACTATGGGCCAAACGCCACAACATCTATTCCAATATATTAGGTTTCCTCGGTGGTGTTTCCTGGGCTATGCTAGTAGCAAGAACTTGCCAGCTTTATCCAAATGCAATAGCATCAACTCTTGTACATAAATTTTTCTTGGTATTTTCTAAATGGTATGTGTTTAGATTATATTAAAATAAAATTGATTGTAGACACTGAAGTTTAGTCTTATTTCTATGACATTTCTCAGCTTGGTTTCAGATTCAAATTTTAGTTCATGATGTAGTCATGTAGGCAGCCTTGGAGATCACATTGTGTATAAAATGGCAAACTGAAACTATTTTTTTTCCCTAGTTTGGCCAGGATAGTAAGGCAGATTCTATTTGTACTTC
CTTGCATAAACTTACCCTCTGAATAAACTCTGAATTTTAGCAGCTAAGATCCAATTTATTGATAGGTTGGGAAATCAGTTACTATACTTTTGGATAAAACTTGTACACACTACCTCTTTCACTCTTTTAATTCTCTATCTATAGGCCATTAGTTTCTTGTGATTGTTTTTTTTTTCTTTTTGCTTTCAGCATTTATTTGGCCTAATATTAAAGATACGAATTTTCATAAGAAGCTTTTAAAGAATAAATTAACATTAAGTGCTTCGGGACAAAAAAGGAATTTGAGATTAGTCATTAACCCAGATTTTTTTAAGTTTCTTCGTTTCATTTCCACATATGTCAACTATGATTTAAGAAAAAGTAGAATAAAAGATTACTGCCATTTTATATTAATTGCCTTGGCCCAAAAGGTGAGGGTTCTTGGTTTTTAATCAAATTAAGATAAATCGTCCATTCCTGTTCTTATGAACTCCTGCTCCTCCCTCTGCAAAAGAGATGTTCTTTTCTAGTAATTTTATAAAAATTAGTTATTTGAGACAATTTAGAGCTGTGTTCAACTGGAGGAAAAATAAAAAAAATTTAGAACCATGCCACACTTTTCAGTACACATTCTGGCTGTTTTGGGATTTAGTAGCACTTATAATCAGGTGTGATAAGATTAAAGAATGTCAGAATTTCTTTTTTTTTTTTTTTTTTTTTTGTTTGAGACGGAGTCTCACTCTGTCACCCAGGCTGGAGTGCAGTGGCACGATCTTGGCTCACTGCAAGCTCTGCCTCCTGGATTCATGCTATTCTCCTGCCTTAGTCTCCTGAGTAGCTGGGACTACAAGCGCCTGCCACCACGCCTGGCTAATTTTTGTATTTTTAGTAGAGACGAGGTTTCACTGTGTTAGCCAGGATGGTCTCGATCTCCTGACCTCATAATCCGCCCGCCTCGGCCTCCCATAGTGCTGGGATTACAGGCGTGAGCCACCGCGTCCGGCTGTCAGAATTTCTTTTAATGCTACACATATATAAGCAAATAATGTTTTTAAGAAGCTAACCTTGATGTTAAGAGTGGCAGGTGTTCTCCAGTTTTTACCTCTTTCATATGGGACCAAAGTAGCTAGTTTATGGAACACATATGAAAATGTGGTTATGCCACCAAGTTTTACTACTACACTTGTCTTACCACTTTTAAGTCATGAATTCTATAATTATTCATACCCCTTTGCCTGTGATCAGAAGTAACTTTTAAAATTATCACTTGACTTTGGATGGAACTAGTATAAAGGCAGGAATTTTGTCTTTCAGTGGAGATTTATTCTGTTCAAGGTTGAAGTGGACACATCATTATCTTGGGATGGTACTTCTTTATTTAAATAGTCCTTTAAAGTTCTTTGAGTGGCAGAGAACGTTTTTGGTTTCAGTCTGAGAAGGCTACCAAATGGTTTAAGTTCATTTCATAGTTAGGAGAAAAAGATTTTGAGTAGTCTAATGTCGTCAGAAAGGATTAAAACGTTGTATGTACCAAGAAGGCAGAATGAAGAAGGATCACGTTCACAAATGCTGTATGTTTAACAAAATACGTTTAGATGGTAATATCCAATAGTCTTATCAAGTGCTACAATCTTTTTAAACAGGGAATGGCCAAATCCAGTGCTATTGAAACAGCCTGAAGAATGCAATCTTAATTTGCCTGTATGGGACCCAAGGGTTAGTGTATTATTTTTTCCCCTACCAATTCACACTGTGCAATAACAAGTAAAAATCATCTGCATAAACTCCAGGGAGACTTCCAGCCTTTTACTTATGAATGGTCATGTCCGTATTACACTTTCTTTTAGATAACCTCAACTATAATTGTCCTCAACTATAATTGATGTGAGAAGCATAATTATGTACCCTGTAAACCACATTTAATTGTACATAGTTTTTAATACAGATTTTACTAACATTTTAATTTATTCTATATAGAACTACCTTGTAAGTCAAAGTTGTGTGGGCATTTGTGCTTTAAA
AAAAATAAAAGGATACTAAAAATCCCTGTATTTTTTATTTTATCTAAGTATTATGCTAAAGTTGGGTTGTTATAGGAAAGCTGTTACTTAATGTTTACATGTGGCATATAACTTCTAAGCATTTTCACTTTAATTACCATGATGTAATTGTAAAAAAAATTGGTTTAGATATTTTAGAGATTATAAAAACATGGTTGGGCTAAAGAAGACCTTCCATTCTGTTTCTTGGGAAGTTACAACATTTACCGCTTACTCATTTTAAATGTTAACAACATGCACTTTATAAACTGATAAAAGAAATTTAGGTTTGAATAAGATTTCCTAAGTTTATGAAATCCTTTTTTTCTAAATTATTACAATATCAAAAATTTTAAATTCTGTTGAATTACATCAAGCTATGCATTTTCAGGTTTTCCGAACCTCAAGGCATTTACTTTTAGAGGATGTGAATTTACAACTTACTTTGTGGAAATGTGCCACTTACTGATATACAGATTTAAAATTAACAGTATATCATTTCATTATCTCCTAACATATCAACATGGATAATGTAGTTTCACCGCGTGTTAATAAGCTTGAACTCCTTAATAGTTTCAGGGTATATTAAGAACTTAAGTTTCTATCTTGTTGAAAATTAGCTTACAAAACATTGTAGCATGACATGTCTCTAAAGGTAATTGTATGTGCATCCCCATTTCTGTTGTTGAATAAAGAAAAACTAAACATCAAAAAAAAAAAAAA\n>XM_018797717.1 Schistosoma mansoni hypothetical protein partial mRNA \nATGGGTTGTGGTGCAAGTGGATTGAAAGATTGTAAATCAGAAGTAGCTCAATCGACAGATGACAGTCATTCCAATAATGCAGAAATAGAAGTTGAAGAACATAAAGAAACAGACACAAATCATACAGTTCCTGAATTATCAAGTGAACAATTGGATCCTGTATCGAACGATAGACTACATGATGAATCTAAAGAAGAAATTCCACAAAATCAAGAAATTCCAGAAGTTTCAGTGATTACTGAAGAAAAACCAGATGTAGATTTGGCAAATGATGCGGGACAACCTGAAGAATCCAATACAAATGAAGGAAATACATCAGAAAGCTAA\n>XM_040902855.1 Laetiporus sulphureus 93-53 uncharacterized protein (LAESUDRAFT_536661), mRNA 
\nGCAATCGGAAGATCACGCCTCACGAATGACCCGACCGTCTCATCGACGGTACTTGACTGACCTCTCCGCGCTGAGTGCGTCAATGCCGAATCATCGAACGCGCCGCCTCGTACCGAAACCAGACCGCGCGTCGGGGCCACGCCGCTGCGATAGAAGACGAAGACGTGCCTTGCGCTCACCGCTGATGCAAACGGACCGCGGCGTGGACCGTGATTTGACGCGATGCACAGCAGATGCTGGGAAACGGTTGACACGGTGAGCATTGCACTTCCCTACACACCTGCTACTAGATTCTTCGCGCGTACATGTCGACTAGGGCGGTCTCTACGCTCAATCGCCCTGTTCGCGTTGAGAATGCTGTCGACCTCGTTAGATGTGTGGATGACCAGAGCGTACCGAGACGCAGGCGAGATGTTGACTACGCGGATACTACAAATGACGAGGCGCACGACGAGAGACGGCCAAGACCGATTGCAACCGTCATTCGCGCTCACCCGCATCGCACTCGGGCTGGACATGCCCTCGTGCGCTCGTCGCCGTCCTGCTGTCCGTGGCTTTGGACTGCGAAGCAAGACAGCATGATCAAACAAGTGCGCAAGAGAAACGGGGGGATGGCCTACCGCATGCCAAAGCCATCATTTCACGCAGTCTCCTTCGCCAGAACACGCGCAGGACTGGCGCTTTCACGACAGGGCTTGAGGCTCGTGCCACTATCCAGCGACCGGTCGGAGATCACACCTGACGTCTCAGAAATACCCGCATCCGATGCTGTCTGATGCAACTGGGCTATTCCGGCGCACTTCAAGCGATATTCGAGCAACAGAAGCTGCGACGGTTGACTCGCAGGCCGCAGAGGCCGACCATGACCTGCCGCAGACGGTAGACCGACCTAGGAGAGCATCTCGCGTTTCGCGTGTGGTATAGAGG\n>XR_002312254.1 PREDICTED: Odocoileus virginianus texanus uncharacterized LOC110131716 (LOC110131716), transcript variant X2, ncRNA 
\nGGACGGCCCACCGCGGCCCTGCCCAGCTTCCAGCCACAAGGTCTCTGGCTGATGAGTAGGCGGTGGTGACACCCTGATGGCCCAGAGGCCGGAGCCCACTCAGTCACCCGGTCTGTGCACGGGCCTGTGTGTGTCCCTCCCCACAGGAGGGCTCGCAAATTAAGGGACTCCGGCTGGAGGAGGGCTGAAGGGGAGCCCTGTGCTTCTGTTTGTCGAGACTTTGCCCATACCATCGCAGCTCCAGCCCAGCTCTGTGGGAACAGCCTGTAATAAAAATAGAAATTATTGCTAATCAGGAAAATCCTCCCAGCCCAGCCATGCTCTTCAGCTACAAAACACCTCTGTTTTCTGGTATTAACCTTCTCTACTGCTACCCTCCAGTGTTTGCAGCCTCTATTCTGTAAGCAGGGAAACTGAGGTCCAGAGAGGCGAAGCAACGAGCTGAAAGCTACTGTGAGGGGCAGAGATGAAGCCAAGGTAAGGTCATTGCCAGATCTGTTCTAGTGGGAGGTTGCAGAGAAGTCACTGAGGGCTTCCTGGAGGAGGTGGCAAGAAATCTAAAGGAAGGAGGACTCAGATCAGGAGATAAAAAAGGTGAGGACAATTCTGGCAGAGAGAAACATGTGAAGCTTGAAGTTGGGGATATTTCAGCCACATTCGTTCGTTCCACAAACGCATTGACATCTGCTGTGTGCCATGTCCTCTGCAGGAGGCTGGGGACACACAGAGGACAAGCCAGATCGGGCTCCTCCCTAGTGGGGAGCCCACCTACATAATCGTCCCAAGGGACCGGCAGCAGTGGGAGCTCCAAGAGGGTGCCTGACTCAGCTTGGGGCATCAGGGGGAGTCTGGGGAGGGTTCTTAGAAGAGGAGGGAACACAGAGCTATGACCAGGAAGGTGAAGAGACCACAGTCAGATAAAGGCATTCTAGCTAGAGAAACAGGATGTGCAAAGGCCCTGAGACAAAAGTGTGTCTGGTCTGCTGGACAGATTGATCTCAGGGTAGAGAGATCTTGGGGCTCAGGAGAACGGGTACCAGGTGGTCCAGGGCTTGGGCTGTCTCCTGAGGGCAATGGGGAACCGCAGAGCATGCGTGAGGAGTGGTGGGTCTAGAGGGGGCGCTGAACAGAAGGAGCCAATCCCAACCTGGGCACTTCTAGTGAAGCCTGTCCCCTGATGCCTGTGGCAGGGCCGTGAGCTCACCTCCTGTTTCCCTTGGCATTCGGCACCCCTGGGGGCCGCTCCTGGCTGGTGCTGGGGTTCTTGGGAAAACCACGGCTCCAGGAGGGCCTCTGGGCTTGCGTGTGCCTCATGCAGCTAGGACAAGGGCACATGGAAGCCAAGCCCCTGCCACAGGCTTGGCATGGGGCTAGAAGTGTGGACACACATGGCCTTGTTCATGGCTGGGCCATGAGGAGTTGTGAAGAAGAACATTCTAGGCAGAGGGAATGGCGAAGGCGGCAGTCCTGAGGATGTCCCAGTCTGCGGATCAGACAACAGAGGCCTGGAGCCAGGCACTCTGGTTTCATGTTCCTGCTTTCTGGATCCCATTAGCTCTGAAATCCCACTTCTAGGCAGCAGCCCCCTCCACCCTTGCACACCTTGGCAGCCTCTCATTACACACTTACTCACTCTGGGTGAACTTCCAGCCCTTGTACCTGCTGTTCCCCACCATCCCAAATACCTTCCTCCTTCCTCCAAGATCTGGCTCTGATGCCCCCTCCTTCAGGAAGCCCTCCCTGCTCTTCTTGGGCAGGGCTTAGGGGCTGTGCGACATTCCCCTAAGATGCCAGAATATTTCTGGCAGAGACAGGATGACCTCACCCGGGGGACTGGGGATGTCTGTGTTTTGTTCTGTTCCCCTTTCCCGGGTCCCCCCTGGGCCTGCAGAGAGCCCTGCCCCGATGAGTGTCACATGGTTCTTAGTTCTTATAATTCATGTACCATCGTTACTATTAATAATAGTAACCCCTGCTACCGCTGTGCTTTATGACAGA
CTCAGGAGCCGCATGGCCTGGGTTCAAGTGTCAGCTGGGCATAGCCTCACTGTGTGACCTAAGGCAAGTTGCTTGACCTCTCTGTGTCTCAATCGCCTCACCTAGAAAGTGGGAGTGATCACTGCTGAGAGGACTGGATGAGCTCAGCGTCTACCTCCAGTGTTAGCCTCATTATACAATATGGAACTTATACACGATGTCGGTTATACCTCAGGCCGTTTTTACTCACATTTTCCTCAGAGAGGGAATGAGACAGCTCAAGGTCACACAGCCAGGATTAGACCTGGAGAAGGCAGGACCCCTGAGGCCTTCACACCACCCCTCTCTGCCCTTGGCCACAGATTGCAGGGGAGAAACGCTAACCCAGGCCCCTCATTAGCTGTGAAGACTGCTGCCTGGGACCTCCTGGCCTGAGCCCTTGGCTGGCGCCCCAGCCAGCCCCCCTTCCCACCACGCTAGACCCAGCGGTTCCAGGAGCCTGGCCAGACTCGGGCAGAGGGGCTGGTGCCTGTGTGATGAGGCCTCGGAGCCCTCCCTGGCAGAGTTCTGCTGGGCCAGGAGACATGTGGGCGCCCCCCGCTTGCCCAGCCGCCTCTCCTGTGAATCCAGAGGGAAAGTATGTCGGGAAGGCAGCCGCCCTGCCCTGGGCGGGCCCAGCCACAGGCTCAGGGTCTGGGGAATTCATTAGAGCAGCGAGGGAGGCCACTTAGCCACTGCTGGATCTGCGGCTGAGGAGCCTGACCCAGCCTGCCTTGGACGGCCCGGCTGGACCCTGCTCTCCAGAAGGACCAAGCAGTGGGGTGAGGGGCAGTGGGGCAGAAAGGGTGCCATCCGGGCACTGGAATCTGGCAGAACCCCCCGACTTGCTCTGTGAGTTCTGGCAAGCCCTGACTCTTTCCCCATCCTTCATTTGCTCTGACTGTGTCGTCATTTGCCTCAGGCTCTCCAAAAGGTATGATAAAGAAGAAAATAACAATAAATATAATGGCTACAATTTTATTGAGCAAGTGCCAAATGCTCGAAAACTTGCCACATCACTTTTGTGGGTTTTCCCTTTTTGTCCCCTCTCCTCACGGCGCCACGGGGCAGGAACTGACCATCATGGGAGACAGCAGGAGACTGCCAGGAAGTCTTGGTCTCTGGCACCAGGAGCCTGAGTTTCATATCCCACCTCTGCTGTGCAGCTTCAGACAAGTTGCTTAACATCTCTGTGCCTCTTTTCTTTTTTTCTTTTTTATGGGGTAGGGGAGGGTACCTTCAAAGGTAGATTTACTTTTAATAATAATGTAGATTTTTGCTTCTCCAGTTTAGAGAATGGACTGCAGAGTTGCCTCAGGGGAGAAAGGACTTCACTAGGAACCAGCTGGAATTTAATGATGTGGCATTCAATGGGCATTGACTTCTGAGAATGGTTTTACATCACTATTATCTTCAGAATTTTCCAGGGATAACTGTGGCTGGACAAATGACCACTTTACTTTTTCCTCCTCTCCTCTCACATTTAATGAGAGTTTTGTAGGTAACAGTAAAACAAACCAGTGTCTGTGTTGCAATAAGAGAGACTGCCTACGGGCTCACTATAGAAGTTTTCTTCTCTCCCTCAGTCTGTCTGTGTTTCTCTCTGTCTAATGAAGTGAAACATGAAAACGTCTAAAGTTGTTTGCAGTTTATCAGCAGCACTAAAAACCCAAGTGAAACGAGGACGATGAGAGCCCCAACCTCTGAGGCTCATCATAAAGCCCGAATACATTAATTCGTGAAAACTACACTCGGCACTTTTTTTTTAGAGATGGGACGATGGTGGTCTGAGCCTCTGCGCCTGGCGGTAGGTGACCTTGGAGGTGGACAAGTGCATACCAGCTGCGGCAGGAGCCCCGGAGTCAGGGAGACCACTCTGCCAGGGAATGTTAGTGTTGAGACCTGAACAGACAGGAAGTTCCCGTGAATCCAGGCATCCCAGGACCACAGAACAGGACGTACAGAACAGGGGGTCACAGAAC
CAAGGTCACAGCGCTGCGTCACGGCACTGTGAGTTAATGGAACCGTGGAACCGCAGCATGCTCCAGCCGTGGCACTGTGGGATCCTAGGGCCACGGGACCACAGTGCCAGAAGCCCACAGACTCAGGGGATGTGGCCACTATCAACAGGAGCTCAGAACCGTGGGATGGCAGAAGCCACAGAATCCTAGGGGGCCTGAGACACAGCACCCAGAAATCCCACTTGGGAGGTGCCATAAGATGGAGTCTCAGAACTGAGCCCATCAGAAACACCGTCTCAGCTCCACCTTCACCTGTTGGCTGGCCAGCGAGTCTCTCAGAGGCCACGGGAGCTCGGAGGCACTCTCTCTCCATCCCTGGGGCAGCCACCGGAGAGAAGGACCATGCTGTCATCAAGGCCTGGAGCCAGCCAGCCGCCAAACACTCAGCGAGTCCCCTGTTGCCAGGGCCAAGTGAGGCTGTCCGGGTGCCGAGAAACAGTGCCAGCCTCCGGCCAGGCGCGCCGGGACGCCGAGTGCTCAGCAGCAAGTGGAAAAAGAATCAACGGGTTCCTTCTACATCCACATCCTCTTAAAAGCCAACAGAAACATGACTCGGAGGGGAGGTTGTACCCTGGCTGCATTGCCTCCGGATGGCGGCAACGGGAAGCAGCCCCCCAGCACTGCCTCCGCCCACGCCAGGAGTCACAGCCCGGCTCAGGTTGCACCAGACACATCCGCGTACTAATGAACTCTCCAGGGACTGTTCACCCAGCAGACCTGACACCTGATGCTCAGAATAACCAATCTGTTTTGGAGAGGGGAGACTGAGGCCCAGAAGTGAAGACTCCTGGCCCAGATCACGAGGGTGAGAGCTGAGACCCAAACCCAAGCATGATGGATGCTAAGAGTGAGCTTGCCACCACCCAAACGGGCTTGCTCTCGGGCTTCCCCAGCCCCATCCTGTTTCTAAATGTGATCCAGCATGGAAGGTGGGAGGCTGGGCTTCGGCAATTCCTTCCCTTTGCCGAACCCAGATCCTCTTGTTCACGGGGCTGCCATGGGGACGAAACATGATCGTGGTGAGTGCTCACTGGAACCTGGTATTGCTGTCATGAAAGGACTT\n>XR_005956344.1 PREDICTED: Pyrgilauda ruficollis uncharacterized LOC121361499 (LOC121361499), ncRNA \nCGCCTCAGGCCGGGATATGCCTGGATGGGGCAGTCCTGGGATGTTGGGGGCTTATCCTGGAGATCGTCTGGTCACAGCGCCCGCTGCCAGGGGAGTAGTTCTGCTGGTTGCTGCCATGCTCCACAGGAGGAACTCAAAGCTCTGGCTAGGATTTTTTTGCAGAATTCTACAGTCATTGCATCCTGGTGGAGAACGCAGGGATTCCTGTTACACTGCTAGCACATAGAAAAATTCCTGGAGGAATGCCACAGGTTGCTGCTCTGCATCTGCTCAGAGAATCAACTGTGCCCAAAGCCATCAATTTCCCCCAGCAGTTCAATGCACAGGAAAACTACCTGGAACTTGTATGTTGCAGTAAGTCATTGAGAACTTGGGGGTTTGTGTTCATCCTAACACAGACATGTGATGGCAGCTGTGAAAATAAGTGCAGTTCCCCGGAGGCAAAGCAGTGCTATGTTTGTGCTGCAGCAGCCTGGGCCAGAGGAAGGTGAGAGAAACCACAGTGGGACAGGTGAGGCACCAAAAATGCCTTTATCTTACCTGTGGCCTTTTGGACAAACTCCAGTTGTATCAACCCACAGCATCAGACAAAGCTGCTTTTAAGAACACTGATGCAAAAATGAGATCTTGGGTGATCATTTCTGGTTCAAGTAGCGGTTTATATATTTATTATAATTATACACAACCTTGACAATCTGTATTGCCATTCAAAAATAAATCCAAGTCTTGTCAA\n>XM_003890613.1 Puccinia graminis f. sp. 
tritici CRL 75-36-700-3 hypothetical protein (PGTG_20695), mRNA \nATGGCGCAGCCATCAAGTCCGTTGCTCCACATGCGGCCTCCAAACAGCATATCTCTGCCCACATCTTTCTTAAACATTTTTCTTTCTTTAAGCAGTGACGCCACCTCCCTCAACAACACAAGCAAACTTGCTCTTGGAGCAAGCTCCCACTCTAGTCACCATGATGATTCTGGCGAAACCGTCCTACCTCAGCCCGTGATTTATATCATCATCGCAGGGATCGCTTTAGCAGTGATATTGGCGGGATTTGCGATGTGGTCATGTGTTCAAAAGCGCAACAGACGTCGTAGCCGAAAGGCATCATTCTCGATGTCCCAAGCTTCTGAAAAAGAATGGGGCACCACTCGCGAGATGGCTGGCGGCATGGAGAGCGTTTACCGGCACTCCGTCATCACCTATGACGCCAAGGCTCAACCCAAGCTGCTCTATGAAGACTTGGATTTCGGTCCAATGGTCACCTCGCAACTTCCAAGTCAAAAAGAACTGAATCAATACAAGAAAGATACCATCGTGTGTCTAACCGACGTCTATGGAAGTACCAAAGGATGGGACGGCTCAGAATTTGACTATATGTTAAACTCGCCAAATCAATTCCCACCTGCGAGAAGCAGTCCCGATCTCTTATCCTCGCTTCCCAAAGCACTTTTAACTGGGAACCATACGGGTCGACAACCGGCTGTCCCGGGGTTTCGCCCATACCGGTCACCATCCGGCCAATTGATGGTCAAGCCGTTCTCTTCGACCAAAATGAGCCCCGCTGAAGCCTCTAACGAGCTGCAAAAGATCATCAACGCGCATGCCAACCTTGAGAACTTCGATGACTTGTTCGACCACGGCGAAAGCTTCGATTCTTCCAACCTCACAAACTCCTTTGATGGCACTCCAATCCATTCAAACCCTGAACATTTCCCTATCCTCTTAGGTAGCTTCCCTGCTGCCCGTAAACTCTCCTCTTCCTTCTTACCCGGCGCTGATAAAAGCTTGCCCAAAGAAATCGTCCAACTTCCCCTTCCCCGGTATAACTTCAAGCAAACCACTGCTTGA\n>XM_051686607.1 PREDICTED: Myxocyprinus asiaticus autophagy related 9B (LOC127434116), transcript variant X2, mRNA 
\nCGTCGAGCGATGTTTGTTGTGATTTCTGTTATTGTTGTGAAGCGCAAAGGCGAAGATCATCGTTAGTCGGATGGATCTATGGTGAACATCATAGAGAGGTAGAATGTAAAACACGATGGCTGATTTTGAAACGTATCAGGAGTATCAGCGTATAGAAGACTATGATGAAGACTCACCCCAAGGAGAGGAAGACTTACTTATTCATGTGCCAGAGGGTAGAGGAGACCCATGGCATCATATCAAGAACCTCGACAATTTCTTCACAAGAATCTATCATTTCCATCAGAAGAATGGATTTGCCTGCATGGTGTTGTCAGAGTTTTTTGAACTTGTGCAATTCCTGTTTGTGGTCACGTTTACAACTTTCCTCTTCAACTGTGTGGAATATGATGTTCTCTTTGCCAACCGAGCGGTCAACCACACGGGCCAGAGTCTCGGTCCCCTTGACAGAAACAAGGTCACCCTTCCTGATGCTATTTTACCCAGGGAGCAGTGTACTGAGAGGATTGAAGGCAACAGCTGGATCATATTTCTCTTGATAATGGCAGCCATTTTTTGGGTCTATCGGCTCGTGAAGGTGATCTGCAATGTCCTCAGCTACTGGGAGATCCGGCAGTTTTATATTAAAGCACTCAAAATACAGATGGACGAGTTGTGTAACTTCTCATGGCAAGAAGTTCAAGGCCGTTTGATTCACCTGCAGCGTGAGCAGCCCATGTGCGTCCAAAAAAGGGAACTCTCCGAACTGGACATCTACCACCGCATCCTACGCTTTAAAAACTACACCGTCGCCATGATCAACAAGTCTCTGCTGCCCGTCAGACTGCGCGTGCCCTTTTTCGGAGACATGATTTTCCTCACGCAGGGCCTAAAGTACAACTTTGAACTTATTCTTTTTTGGGGCCCCCTCTCGCTTTTTCAGAACAAATGGAGTTTACATCCCAAGTACAAACGAGCTGCGAACCGCCAAGAGCTTTCGAAACAGCTCAGCCGTGTTATATTGCTAACTGGCATGGTCAATCTTCTGCTTTGCCCATTCGTGGTGGTGTGGCAGGTGTTGTATGCGTTTTTTAGCTATGCCGAAGTCATCAAACGGGAGCCAGGCAGTTTGGGTGCGCGCCGCTGGTCGCTGTACGGCCGTCTTTACCTGCGACACTTTAATGAGCTGGATCATGAGTTGCAAGGCAGGCTGGGTCGCGGATACAAGCCGGCCGCTAAGTACATGAACGCCTTTGTTTCTCCCCTGTTGACGGTGCTGGCGAAGAATGTGGCTTTCTTCTCCGGCTCAGTGCTGGCTGTGCTGATTTTGTTGACAGTGTATGACGAGGACGTATTGACGGTGCAACACATCCTGACGGCCATCACTGTGCTGGGCGTGGTCATCACGGTCTCCAGGTCATTTATTCCAGATGAACATATGGTGTGGTATCCTGAACAGCTGCTGCAGTGTGTCCTGGCCCATATTCACTACATGCCGGATCACTGGAAGGGCAATGGCAACAAGAGCGAGACTCGCGACGAGATGGCACAGCTTTTCCAGTACAAAGCGGTCTTTATCTTGGAGGAGCTCCTCAGCCCCATAATTACCCCGTTCATCCTCATCTTCTCCCTAAGGAACAAGTCTCTAGAAATCATCGACTTCTTCCGTAACTTCACAGTAGACGTTGCAGGAGTAGGTGACATATGCTCATTCGCTCAGATGGACATCAGACGGCATGGCAACCCACAGTGGATGTCCGAGGGTCAGACGGAAGCTTCGGTGTACCAACAGGCTGAAAACGGCAAGACAGAGCTGTCTCTGATGCATTTCACCATCAAAAACCCTCACTGGCAGCCGCCGCAGGAGAGCTCTGTGTTCATCAGTCACCTGAAGGAGAAGGTTCAACAGGATGCACAGACAGGACCATCTCCTCAGCTGCTGCTGTCTGAAGCACCTCTTTGTACCTCACTACTGTCTAATGAGTCTGCCACTGGTCCTGATAACCTGTTAGCCAGCGT
GTTGGCTCACCCCGTACTGACTGCATCCGGACTGCCTGGATGGAATCATCGTTTTATCCCACAGAACAGCGCAGCCTCAGCAGCCGCCAGCGTTCTGGCGTCCCTGTCTTCATCCCAGCAGCCCCATGCTGGGCGTTCACGTTCACACACTCTCCTACCCTCCAGACAGCATCAAGATGGCCCTATGTACTACAGTGAGCACACTGTGGGCGACAGGCCTGCACCCCTGAGTCTTCTCTTTACTGTTGCACATGAAACTGGTGTTGAGCGGGTAGAATTCAATGAAGCTGTCAGCTGAGGACATCATGTCCGCAAGTGACTCCAAGATGCTCAGCCAGTCCAAATCAGCCCTTGCATCAGAGTTTGCATCTGCTGAGATGAGCCTGCATGCTATATACATGCACGAG\n>XM_028933362.1 PREDICTED: Prosopis alba uncharacterized LOC114745209 (LOC114745209), transcript variant X1, mRNA \nATCAACGGCCAAGTTCAGGACCTCAATTTCAATTCTCCTCCCACCAATTCCCACTAATTGAAGCCCAACTAAGGCCAATATGGGCGCGGCGGCCGGCGTCGGAGGCTACCCTGTCGGACTGGACGAGTCGTACCGGCCACTTCCGGGGCTTTACTTCGCCTTCTTGTCCATCTGGCTTCTCTCTGCTTGCTCTTGGACTCTTAATACCTACAAAAAGCGCCAGTTTCAGTCAAATAATTTGCAGTGGGCACTAACCTCAGTTCCCTTTATAAAAGTATTGCAGCTCCTGCTGTCCTTTCTCTTCTGGTATTCATGCTTCTATTTTCAGGCATGTTCCTTGTGGATGTCATTTGGGGTGTATGTAACTGGGGTGCTCTTTCAGACTGCTGCCTTTGTCTCCTTCTTGCTCATTGCTCATGGCTACTGTATCATGTGTGAGCATCTTTCTTTAAGTGAACGCCGTACAACTGCTGCACTTGGATGTGTCTTTTACTTAACGCTAGTGGGTTACAAAGCTTGCGTACCATACTTCACGGTTCTTCTGCTACTGAATTATTTCATTTCATTCTATGTTATTTTCCGGCATATATCACAAAACCTATTGTTGTTGCGGGAACAACTGAGTATTGTTGAAAATGAAGATGTTCGGACAATGCATGATGCTCTGTATACGAAGTACATGATGTTCAAGAAATTCCAGGTTGCAATGCAGATAGTAGCTATGGCAGAAACTATGATATACATGAACATGGATGACTCTTCAGAGAATTACTGCCTTCGGTTACTAGTCAGAGAATGGGCACAATTCTGCATTTTTTCATACATTGGGTGGACTTTCAGGTCACAGGACTTGGCGCCACGCTTCTCTGTTATGCCTGCCACCAAGTGTAAAGGCGATACTTTGGTGCCTCCCATCTACAGTATTGAAATGGATGCCGCTACTTTTAAAGATTTCAGTAGTCATGAATGGCACATTGGGGTGCCAACTTCTGCTTGCCGTGATGAAAACTCAGAAGGTGCAGTTCTAGTGATCATTGAACATCCCCACTCACAGAGGCTAAGAACGCCTGATACTTCCTCTTCTCCTATTGTGTCAAATCTCATTTCACAGACATCTTCATACCGAATATAATCAATCAACATTAGCTCTACCATCTAGTCATCTATTGGTTGCCCATGCCTTTTCTCCTGCAATCTGGCATGGGCATGCCAGTACACTCACTGCTTCCGGGTTTAGAAGGTAATTTGAACGTTTCAAGCTGAGAGGAAACAAGAAGAGTAGAAGTATATATTGGGTATAGTCTCCCCTCTTTTTCTTTTTCTTACCAACTCTTTCTTTCTTTGTTTCTTTCCTTTTTTTTTTGCCCTCTTCTTTTTTAAATACTTTACAAACTTTTGCTTTAGAAAATGCCATGAGTTAGTCATGAGCTGAGGGTAGAATAATGAGTGTTATCTTGTTTAGAGGCAACCACAAA
TATGTATTCTGTACACCATCGAAGCAAATGGTAACTGTATATTGTTCTTCCTTGTACTGTTGTTCTCTCATTGATTATTTCCGACTT\n>XM_003035727.3 Schizophyllum commune H4-8 uncharacterized protein (SCHCODRAFT_02607625), mRNA \nACCACCATGAGCTCCAGCGACACCCAAGAGCGACGCTGCTGTGCGATCTGCTCCTATCCTGCGCCCAGCCAATGCTCTGGCTGCGGACAGGCGTTTTACTGCTCGAAAGAGCATCAGACACTGGCGTGGTCTAAACACAAGCGTCTATGCAAGATCTATCAGCGCCAGGCTCGAGGGGAGCCCGTCCCTTCCCCAGATTCCTACTGCGGTCTGTGCGGGAAGGAGAACGGGCCGCTCCGTCGGACAGAATGCTGCAACAGAACTATCTGCGACGACTACGGGAACTACACGATGTTCTCGTTCAGCGCCAACAGCTGCTCCCGAAACCATGATCGATATACGCGCTGCTGCTACCATTTCAACGAAGGTCACCCCGGCAGCGACCCTCTGCAGTGCACTAAGTGCTCTACTAGCCACGACGCGGAGAAGGAAGCGTGGTACATGACGAACAATTACAACTTCCAGGAGGACATACTACGGGCCAATCCGGCATCCTTCGCACCAAAGCACTGCACCGGGTGCGGCAGGCAGGTCAAGCAGAATGCCGAAGCCGTTTCGTATGGGCCAAGTGGTCTGCAGTGTGGCCGATGCACGGAGAGGATGGCTCCTTCTGTGCTGCCTCAAGATACTTACCAGTTTGACTCTTGAAAGGTAGCGACGTACGCGCCAATGTAATACCCTGATCTATGTTTGTGACCAAGAGGTTCATATCATCAGAGTCGACGCAACGAAGTGCGCTCGTTGTAAGTAATCATTTCAAGAATGTTGCAGCGCATACTGTATATTCGCGAGCGCGGGAACAGGTAGAGTTCATGAAAATCCTATCTCAAGTACTGGAAACATGTACTACGGCGCTGGATCTCCTTGTCGTCATCACAGTCCGATGTACTTATGTGTGTAATGGGCCCTTTCCCTTCAC\n>XM_019346602.2 PREDICTED: Oreochromis niloticus filamin-C (LOC100698591), transcript variant X4, mRNA 
\nCTTTTTAATCGACTCAACCCACTAGAATCATCACTGTGGACATTTTTTGTGTATAAAGACTATTTATATGTGTTTCTGTACAGCCAGGCTGATGTTCAACACAGCTGGGATAAAACCAGCAGCTCTTATAAAGCTCTAACTGCACACATCTGTATGTGATTATTGCAGAGCTGATCTTGGGCTTCACTCTGGGTCAAGTTCAGCTTGTTTCACGTAGAAGCAGACCGTGCTCAGCAGGGGGCGCTGCTGTTTACGTCAGTAAATCTCTTCAGTTTGTTTTATTCTTCAAAAAACTTGTATTAAACGCAGCATGAAATTTTTCTTCCTCTCTCGCTTGCTCCAGTTTGCCGCGCCTCCATTTGCCTCCATTTGGCAGCCAATGGAATTGCAGGAAGCAGCAGCACCTCATTCAGTTAACTGTAAACACCCAACCTCCATTGTAGTTACCATTAATTGTCATTAATCATTATCACAGAGTCTATTGTATTTTCAGATCTGATATGTATTTCCAAACTGAAGTAAACTTCGATGTTGTTTATTTCTGCTTTGTTATTTAAATGTCACGCAGTGATTTGATTGGCTGCCTGATGGTGATGTCATGTCCCTCCTCAGGGTGTCTCTCCAGGTTTGAGGACTAAAAATACCCGGAGGTGTCAGAGCGGCTGTGGAGCCCCGGGTCCGGCTGTCGGGGTGGGGTAGGTGGGGGTGTCCTGGTTGGGGTATCCAGCGTGTCTCCACCCCCTGCTCCGCGCCCGACCAATGATCTGCGGTCTCGGTGTCCTGCGGCTCGGAGGATGCCCGGGTCGCAGTAGTATATGGTCATGGCAGGGGCATTCCTGGAAGTCCTGCGCAGTGACGCCGAGCCTTTAAACCTCGCTTCACGCTCCCGCAGCTGCACAGCCCCACTCTGTCCACGCCGCCGCCCGTGCGTGACCACAGCCAAGCCAGCCGGAGGACAAAAGCAGACTATTCTTCACTCTTCCTCCTGAGCCTCCTCTTTCTCTGAGAGTGTGAGTCCGCAGGAGTGCCCGCGGGTCTGCATGCGCGCCTCTTTACGCACAGCTCCGTGAAGCTCCCTCCCCGCGCGCTGGGCACTGCCCCTCCGCTTCCACTGCCCCGTTTCTCTTTTTTTTCTGCCTTTCCTTCTCTTCCCACTGCGCTCGGTGCTATAAAAGGCATGTCCATGATGAGCAACAACAGCTACTTGGAGCCCCAGCAGTTCTACCAGAGCACCGCGGACATCGGCGAGGAGGAGGAGGAGGAGGAGATGCCGGCCACCGAGAAGGACCTGGCCGAGGACGCCCCGTGGAAGAAGATCCAGCAGAACACCTTCACCAGGTGGTGCAACGAGCACCTGAAGGTGATCAACAAACGCATCAACGACCTGCAGAAGGACCTGAGCGATGGGCTAAAGTTAATAGGGCTGCTGGAGGTGCTGAGCCAGAAAAAGATGTACCGGAAGTACCACAGCAGACCCAACTTCAGGCAGATGAAGCTGGAGAACGTTTCCGTGGCGCTGGAGTTCCTGGAAAGGGAGCACATCAAGCTGGTCTCCATCGACTCCAAAGCCATCGTGGATGGGAATCTGAAGCTGATCCTGGGTCTGATCTGGACCCTGATCCTCCACTACTCCATCTCCATGCCCATGTGGGAGGATGAGGATGACGAAGACGCCAAGAAACTGACTCCTAAACAGCGTCTGCTGGGCTGGATCCAGAACAAGGTGCCCCAGCTCCCCATCACTAACTTTCACCGAGACTGGAGGGACGGCAAGGCGCTGGGAGCTCTGGTGGACAACTGTGCCCCCGGTCTGTGTCCCGACTGGGAAACATGGGATCCCAGCCAGCCGGTGGAGAACGCCCGGGAAGCCATGCAACAGGCTGACGATTGGCTGGGAGTGCCACAGGTGATTGCTCCTGAGGAGATCGTCGATCCTAACGTGGATGAGCACTCTGTCATGACCTACCTGTCTCAGTTCCCTAAAGCCAAACTGAAGCC
CGGTGCCCCCTTGAGGGCCAAATCGCTACACCCCAAGAGGGCTAAGGCCTACGGACCAGGTATCGAGCCTCGAGGTAACATGGTTCTGAAACCAGCAGAGTTCCTGGTGGAGACAGTGGAGGCTGGACTGGGAGAAGTTCTAGTTTATGTGGAGGATCCAGAGGGACACACAGAAGAGGCCCGAGTCATCCCCAACAATGACAAGAACCGAACCTACTCTGTGGTCTACCTGCCCAAAGTGGAGGGGCTTCATAAAGTAAAGGTGTTGTTTGCTGGTCAGGACATCGACAGAAGTCCCTTCATTGTAAATGTTTCAAAAGCCATGGGCGACCCAACCAGAGTCCAGGCCCGCGGGCTGGGACTGCAGCCAATGGGAAATGTGGCCAACAAACCTACATACTTTGATATTTACACTGCAGGAGCGGGTGCTGGAGATGTGGGCGTCATCATTGTGGACTCAAATGGCCGCAGGGATACAGTGGAGATTGTCCTGGAGAACAGAGGCGACAGTGTATTTCGGTGCACCTATGTCCCTGTCCTGGAGGGGCCTCACGTCGTCTGTGTGACTTTTGCTGGGCAGCAGATTCCCAGGAGTCCTTTCACTGTCCACATCTCCGAAGCCTGTAACCCAAACGCCTGCAGAGCATCTGGCAGAGGTTTGCAGCCGAAGGGTCTGAGAGTGAAAGAAGTGGCAGATTTCAGAGTTTACACCAAAGGAGCCGGCAGCGGGGAGCTCAAAGTCACCGTTAAAGGACCAAAGGGCCTGGAGGAGCCGGTGAAGGTGCTTGAGATGGAAAATGGCCTGTATGAGTGTAATTATTACCCCATCATGGCAGGAAAGTACATCGTAACCGTCACTTGGGGCGGACACAGCATCCCTCGCAGCCCATTTGAGGTTTATGTCAGTGAGGAGGCAGGGCTTCAGAAAGTGAGAGCCTGGGGTCCAGGTCTGGAGACCGGTATGGTCGGGAAGAGTGCTGACTTTGTGGTGGAGGCCATTGGAACTGAAGTGGGAACTCTCGGTTTCTCTATCGAGGGGCCCTCCCAGGCTAAGATTGAGTGTGATGATAAAGGCGATGGATCATGTGATGTTCGATACTGGCCGACTGAACCAGGCGACTACGCCGTCCATGTTGTTTGTGATGACGAGGACATCAAGGACAGTCCCTTCATGGCCCACATTCTCCCTGCTGCCAGTGACGTCTTCCCTGAGAAGGTGAAATGTTACGGTCCAGGTCTGGAGCCTTTGGGCTGCATTGTTAACAAACCTGCTGATTTCACCATTGATACCCGTGGAGCTGGCATCGGAGAGCTGAAGCTCTATGCTCAGGATTCAGATGGTTTCCCCATCGACATCCAGATCACAGATAATGGAGACAGCACCTACTTCTGTGTTTACATTCCCACAAAACCCATCAAACACACCATTATCATCACCTGGGGTGAAGTCAACGTCCCTAACAGCCCGTTCAGGGTGACTATTGGAGAGGGCAGCCATCCAGAGAATGTGAAAGTTTATGGTCCAGGTGTGGAGAAGACAGGACTGAAGGCCAACGAGCCGACTTACTTCACTGTGGACTGCAGTGAAGCCGGACAGGGTGATGTCAGCATTGGCATCAAGTGCGCTCCAGGTGTAGTTGGACCTGCCGAGGCCGACATCGACTTTGACATCATCAAGAACGACAATGACACATTCACAGTGAAGTACATGCCTCCAGGTCCCGGACAGTACACCATCATGGTGCTGTTCGCTGATCAGGAAATCCCTATTAGCCCCTTCAGAATAAAGGTGGATCCTTCCCATGATGCAGCCAAAGTCAGGGCAGAGGGACCTGGACTCAACAGGACAGGGGTGGAGGTGGGTAAGCCCACCCACTTCACCATTTATACAAAGGGAGCTGGTAAAGCCAAACCCGAGGTCCACTTCACCGGAGCAGCTAAAGGTGATGCCGTCCGAGACTTTGAGATCATCGACAACCATGACTACTCATACACTGTCC
GCTACACGGCGGTGCAGCAGGGGAGCATGTCCATCATTGTGTGTCACGGAGGAGACCCCATCCCAAAAAGCCCATTCACCATCGTTGTGGCCCCCCCACTGGACCTCAACAAGGTCAAAGTTCAGGGACTGAACAACAAAGTAGACGTTGGGAAGGATCAGGAGTTCTCCGTCTGTACTCGAGGTGCTGGAGGTCAGGGCAAACTAGACGTGAAGATCACCTCCCCTTCGCGTCGACCAATCCCCTGCAAGGTGGAGTCGGGGACAGCCAATGAGGTTCATACAGTGAAGTACATTCCTCCCGAGGAAGGACCATACAGAGTGGACATCAGCTACGACGGGAATCCTGTCCCAGGGAGTCCATTCACTATGGAGGGTATCATGCCCCCTGACCCTTCAAAGGTGCGAGCCTATGGTCCAGGCCTTCAGGGTGGTGTGGTAGGCAAACCAGCCCCCTTTGCCATTGACACAAAGGGTGCTGGTACTGGTGGTCTGGGTCTGACAGTGGAGGGGCCGTGTGAGGCCAAGATTGAATGCCAGGACAATGGTGATGGATCCTGCTCTGTGTCCTACCTGCCGACTGAGCCTGGTGAATACGCCATCAACATCCTGTTTGCAGACCAGCACATCCCCGGTTCTCCCTTCAAGGCTGTGGTCCAGTCAGTGTTTGACCCCAGCAAGGTGACAGCCAGCGGCCCCGGGCTGGAGCGAGGCAAGGTCAACGAGGCTGGAACCTTCACGGTGGACTGCTCCAAAGCCGGGGAGGATGAGCTCACCATCGAGATCATCTCTGACTCTGGGGCCAAAGCTGAAGTTCACATTCAGAACAACAGTGATGGGACCTACTCCATCACATATATCCCCCAGTGCCACGGGATGTACACCATCACCATTAAATATGGAGAACACATGGTGCCAAAGTTCCCCATTCGCTTGCAGGTGGACCCAGCTGTTGACACCAGCGGGGTAAAGATCTATGGACCGGGAGTGGAACCCAGAGGCGTCCTGAGGGAAGTAACCACTCATTTCATCGTGGACGCTCGAGCTCACTACAAGAGCGGTGGCAGCCATATCAAAACCTCGATCTCAAATCCGTCGGGCACCAACACAGACGCCTACATCACCGACAAGGGAGATGGGACATACAAAGTCGAGTACACACCCTACGAGGACGGTTTGCATCTGATTGAAGTTCTTTTGGATGACGTCTCGGTGCCGAAGAGTCCGTTCAGGGTGTCCGTGAGCGAGGGTTGTGATCCCAGTCGAGTCCGAGCCTACGGTCCAGGTCTGGAGGAAGGACTGGTGAACAAACCAAACCGATTCACTGTTGAGACCAGAGGTGCTGGCACTGGGGGACTTGGCCTGGCCATTGAGGGTCCATCAGAGGCAAAAATGTCATGTAAGGACAACAAAGATGGCAGCTGCAGTGTGGAGTATATCCCCTTCACGCCTGGAGAATATGATGTCAATATCACCTTTGGAGGCTTACCGATCCCAGGGAGCCCGTTCCGGGTCCCAGTGCGAGAGCTGGTTGATCCCAGTATGGTGAGGTGTTCAGGTCCTGGCCTTGGAAGTGGAGTCCGGGCTCATGTTCCTCAGACTTTTACTGTAGACAGCAGCAAGGCAGGGGTGGCTCCCCTGGCAGTTCAGCTATATGGACCAACAGGTGTAGCTGAGCCCCTCAACATCACAGATAATGGTGATGGCACTCACACGGTCAACTATACTCCTGCAAACGATGGCCCATATACAGTGTGCGTGAAGTATGCCGACCAGGAAGTGCCCCGGAGTCCTTTTAAAATCAAGACATTACCGGCTCATGATGCTAGCAAAGTTCGAGCCAGCGGTCCCGGACTGAATGCATCCGGGGTTCCAGCCAGCCTGCCAGTGGAGTTCACCATTGATGCCAGAGATGCTGGAGAAGGACTGCTCACCGTCCAGATTCTGGGTCCGGACGGCTGCAGTCGCGAGGCTTCATTGTTTGTGGAAGACTGGGGCAGG
AGGGTGTGGGAGACTCACATAGTAAAGAAAACCATCCCCTTCAGTATTCTTAGGAGAGGCTCTGATCCAGAGGGAAAACCCAAGAAGGCGACCATTCGAGACAACAGAGATGGGACGTACACAGTGTCCTACGTGCCGGACATGACGGGGCGCTACACCATCACCATCAAATACGGAGGAGATGAGATCCCGTACTCACCTTACCGGATCCACGCCCTGCCCACCGGAGACGCCAGCAAGTGTCTGGTCACAGTGTCAATCGGAGGACACGGACTCGGTTCAGGAATTGGACCAACCATCCAGATCGGAGAGGAAACTGTCATCACCGTGGATGCAAAGGCTGCAGGGAAAGGTAAAGTCACCTGTAAGGTGTCAACGCCGGACGGAGCGGAGCTGGATGTGGATGTAGTGGAGAACGCAGATGGGACGTTCGATATTTATTACACGGCTCCAGAGCCAGGGAAGTACGTCATCACCATCCGCTTCGGAGGGGAACACATTCCCAACAGCCCCTTCCATGTCGTGGCAAGTGATACCATCCCAATAATAGAGGAACCATGTGACAAGCTTCAGTTACAGCAGCCCTACTCTCCCTATGCGGCCTTCTCCCCTCAATGGGCCACCGATGATCCCATCAGCCCTGTGGACGGGCTGGAGCCGATGCTGCGTCCCTTCAGTCTGGTCATTCCCTTTACGGTGCAGAAAGGAGAGATCACAGGTGAAGTCCGCATGCCTTCCGGCCGAACAGCCCAACCTAACATCACCGACAACAAGGACGGGACAGTTACTGTGAAGTACTCGCCAACTGAACGAGGCCTCCATGAGATGGACATCAAATACGATGGCAACCACATCCCAGGAAGTCCACTCCAGTTCTATGTTGATGCTATTAACAGTGGTCATGTGACAGCATACGGTCCCGGCCTGAGCCACGGCACCATGAACCGACCAGCCACTTTCACTATAGTTACAAAAGATGCTGGAGAAGGAGGTTTGTCTCTGGCGGTTGAAGGTCCATCCAAAGCTGAGATCAGCTGTAAAGACAACAAGGACGGGACGTGCACAGTGTCCTACCTGCCCACGGCACCTGGAGACTACAACATCATCGTCAAGTTTGATGACAAACACATCCCTGGCAGCCCCTTTACCGCCAAGATTACCGGTGACGACTCTATGAGAACATCCCAGCTTAACGTTGGCACGGCAACAGATGTTTCCTTAAAGATTATGGAGACAGACCTGAGCAGCCTGACCGCGACGATCAGAGCTCCGTCAGGAAACGAGGAGCCCTGCCTGCTGAAGAGGCTGCCCAACAGACATATCGGAATATCCTTCACACCAAAGGAAGTTGGTGAACACGTGGTCAGCGTGAAGAAGAACGGGAAGCATGTGACCAATAGTCCGTTTAAGATCATGGTGGGTCAGTCGGAGATTGGAGATGCCAGCAAGGTGAAGGTTTACGGTCAGGGGCTGGTGGAGGGACACACGTTCGAGGTGGCCGAGTTCATTGTGGACACGAGGAATGCAGGTTATGGAGGTCTGGGTCTGTCCATCGAGGGTCCCAGTAAGGTGGACATCAACTGTGAGGACGTGGAGGACGGGACATGTAAAGTCACCTACTGTCCCACAGAACCAGGAAACTACATCATCAACATCAAGTTCGCCGACCAGCATGTGCCAGGAAGTCCGTTCACGGTGAAGGTGTTTGGTGAAGGTCGGATGAAAGAGAGCATCACCCGGAAACGTCAGGCACCCTCCATTGCCACCGTGGGCAGCACGTGTGACCTCAACCTCAAAATACCAGGAAACTGGTTTCAGATGGTTTCAGCTCAGGAGCGTTTGACCCGGACATTCACCCGCAGCAGCCACACCTACACCCGGACCGAGCGGACAGAGATCAGCAAAACCCGAGCCGGAGAGACCAAGAGGGAGGTGCGGGTGGAGGAGAGCACGCAGGTCGGAGGAGATCCCTTTAGAGACGTATTCGGAGATTTTCTAGG
GCGAGAGAGTCTTAGCGGCTTCGGCGGGATGCCGACTGGCAGCCGACAGCCGCTGCAGAACGGTGAGGCAGCTAACCAGGAGATGACGGCTCAAGTGACGAGTCCTGGAGGAAAGACAGAGGACGCAGAGATCATTAAAGGAGAGGACAGCACCTACAGCGTCCGCTTCATCCCTCAGGAGATGGGACCTCACACTGTCAACGTCAAATACCGGGGCCAGCACGTCCCTGGGAGCCCCTTCCAGTTCACTGTGGGGCCCCTGGGAGAGGGAGGGGCCCACAAGGTCAGAGCAGGAGGCACTGGACTGGACCGCGGAGTGGCAGGAATCCCAGCGGAGTTCAGTATCTGGACCAGAGAGGCTGGTGCTGGAGGTCTCTCAATTGCTGTAGAAGGACCCAGCAAGGCTGAGATAACATTTGAAGACAGGAAAGACGGATCCTGTGGAGTCACCTACGTAGTGCAGGAACCTGGTGATTATGAGGTCTCCATTAAATTCAATGATGAACATATCCCAGACTCCCCCTTTACCGTCCCCATCGCCTCACTGTCAGACGACGCTCGCCGCCTCACCATCACCAGCCTGCAGGAGATGGGTCTGAAGGTGGGTCAGGAGGCCTCCTTTGCAGTGCAGCTCAATGGAGCAAGAGGGCTGATTGATGCCAAGATCCACACGCCATCAGGAGCCACAGAAGAGTGTTACATCACTGAGCTGGACAGTGATCAGCATGCTATCAGGTTCATCCCAAAGGAGAATGGAGTTCATTCTATAGATGTTCGTTTTAACGGCAGCCATGTGCCCGGCAGTCCCTTCAAGATCCGAGTAGGAGAACCGGGTCAGGTCGGAGATCCAGGAATGGTGTCTGCATTTGGACCAGGTCTCGAGGGAGGAACCACAGGCGTGGCATCAGAGTTTATTGTCAATACTTGTAACGCCGGCTCAGGAGCACTGTCCGTGACAATTGATGGCCCATCAAAGGTTAAGATGGACTGTCAGGAGTCTCCTGAGGGGTATAAGGTCTCCTACACACCTATGGCTCCTGGAAGCTACCTGATCTCCATCAAGTATGGAGGACCCCAGCACATTGTAGGCAGCCCCTTCAAGGCCAAAGTATCAGGACCTCGTCTGTCAGGTGGCCACAGTTTGCATGAGACGTCGTCTGTTCTCGTGGAGACCGTCAGCAAGTCGGTAGCAATGGGCAGCCCCTTTGCCTCTTTGCCTAAATTTTCCTCAGATGCCAGTAAAGTCATCTCCAGAGGCGCTGGCCTTTCGAAGGCCTTCATTGGTCAGAAGAACACCTTCACAGTCGACTGCAGTAAAGCAGGCACAAACATGTTGATGGTCGGTGTCCACGGGCCGAAGACACCCTGCGAGGAAGTGTACGTCAAACACATGGGCAACAGGATGTACAATGTCACGTATACTGTTAAAGAGCAGGGCAGCTACATCCTCATTGTGAAGTGGGGAGATGAGAACGTCCCTGGCAGTCCGTTCCATGTCACCGTCCCTTAAAACTGAACTCTTCACTGTCTCCAGCCTCTTCAACATCTGCAATGCACTGACGATTTTTCACTTACTGTTTTCTGCTAAATACGAACATCAGAGCACAGCTTCAGTAACCACAGGTTGTTCGTCGAGGCTTTTCTTCTGTCAGTTGCTCTTTTAAACATCGTCCCATTTAACTTCAAGAAAAGAGAATTTAAAGAGTTCAAACTGACAACAGCCCACACGCCTCAGAATTTGACCTGTTTTCATGCGTCCTTTATTTGAGAAGATTTGTTTCCTGCCAACATGTGGATAACTATGCAGGTGTAAACATCTGGTTCATAGCAGCTAAAAACAAACGTGCAGGATGCAAACATTAAGACTGGATTTAAATGTGATCTGCAATATCTGGACTAGTTTATTTTCTTGATGACAGGTTTTCTGTTAGTATTTCTGAAGATATGCAGCACTCAAAGAGGTCCAGAGGTGTCTGAGAAGGTCACCATGAAGGGGAGAC
TGCATACATTTCCATCTTTTTTGTGTGTGTCCAGTTCCCTGAAATTTTTCATCACATCTCATATTGTGTACAGTATGTGCATTAATTCACAAACACAATCTCATATTTAGTGAAAAATTCAAGCCGCAAGTTGCTCTTTTGCTCCCACAAACCAAACAATTCAGACAACTTAGCTTAAACAGAAGAAACAGTTTTATCTTCAGTGAGGAAAAAAGTGCTTCAGAGTCCCTTGTTTCTTATCTCCATCTGTAAAAACCGGAAACGATAAACTTTCTCTAAGAATCCTTATTTCTTACTGATGCTCATCCAATAAACACTAACACTTCTGACCCTCGGACTGTCTGCACTCCAGCCGTGGTGACTATCATCCAAAAATCTGATTGGTCAGTAGATGGTGATCTCTTATCTGCAACATAACCTGGAGCAGCTTTGATCTGTAGCATCAGTTACCATGGTGACATACCACCTTCATAACCCTGAAAAGACAGAGTTAAACCCGAAGTTAGCTTGATAACTACAGATCCCTAAAAGCATTCATGTTTTCTCATGGATGAGTTAAATGTCTTTCAAAGATATTAGTGTCACATAGTTGGAATAAATCTCTGAGTGAAAGATGGTGTTTAGTTAGCCTCAGCAGGTCTCCCTTTCCTCAGGATTCAGTTTCAGGTGAGCGAGAGACTATCTTCCCTCCAGGTTGAATCAGATGCACTCGGCAGGTCTCTGTATGTCAGGGTTTGTCCCAATTGCTCATGTGGTGTGGGCCCAGCTGTGGGATGTGGAATGATCAAGATGAGCTGTGCTGTGAGATTAACAAACTTTTCTGTTTTTATTTATTCTGCAGCATTTTTCTCTCCTTTGATTTTCTTTGACAGAAAATGGTCTTACTGTTGAGAGAAGCAGGTGATAATGGATTTTTTTTTTTTTACCACAGGAAGGAAGTGCAGTGGAGTTTCCTTTGTGAATGTTGGAAAAACAGCAGCAGATATTAGAGTGACATTTTATAGTGATTTTATATGTATGAGTGAAGCAAAGTTTAAGTGTTTGATATGTTAACCTTCTGTATTGCAACACTGTGCAGGCATAATAAAAGTTTATCTGTGAAATCTCCA\n>XM_002992450.2 PREDICTED: Selaginella moellendorffii UV-stimulated scaffold protein A homolog (LOC9662154), mRNA 
\nATGGCGGGGCGATTGAGCGATCTCATCCTCGCGGCCACGAATTCCCCGGGCAAGGAGCTGGAGGAGCCGCTGCTCAAGGCGATCAAGGCGCTGGTGCGCGCCTCAGATGACAATGTCAAGGCGGCGGCAGACCTTCTCATGGACCGGCTAGGGAAGAATCACTCCCAGGTCAGGCTTCTCGCTCTGCTGCTCATCGATCAGCTCTTTACGCGATCGAAGCTGTTTCGCGGCCAGATCGTGGCGGTGCTCGAGAAATTTATGGTTCTCTGCCTAGGGCACCGCACCGACCAGCCGCTCCCAGCTCCCGCGGATCGAGCGGCGCTGCTCAAGGCTAAGGCGCTGGAAATCGTGGAGAGATGGAACGAGACGTTTGGGCCTCACTACAAGGAGCTCCAGCTTGGCTACGAATACTTGAAGTTCACGCTACGTCTCGACTTTCCGGGTGTTCGAGAGGCCGCGAATCGAGCCGAGGAAGAAAAGAATGCCAGGGACAGGCGCACGCAAGATCTTCTCCGGTGCCGGCTGCTCCAACTCACGGAGAATTTCCCTGGCTTGAGGAGAGATCTCGAGTCGACGATGAGTCAGCTGGAAGAATGCTTTGCCATCTTGAGCGAGGAGGAGGAGGTGGTCCAGGACGAGGATGGATTTTTGGAGGTGGACAAAGATGAAGAGGACAGTAATGAGGTGTTTGGGATCCAAAGCTTGCGGTCCATGCGTGATCAAGAGGAATTGATGGTCACGGAATCTCGCGACAACGGGGCCATTTTCGACATGGCCCGGGATTTGCTCAAGTTGGTGACAACAAGACATCTTCCAGCAGCGCAGGAATGGCTGTCGGTTTTGATGCGAGTCGACCCGGAAGATCGACAAAGCCGGGATGCTCTCATGAAGGAGGTGATCGACTTGAGGAACCGCCTGGTGGTCTTAAAGGATAAGTGTCAGGAGCTCGGGATTGTCGAGGTGGCCAAATCCAAAACCACCACTGACGACGATGTGGAATGGGAAGAAGAAGAGATATTTGACAGGAGCAAGCTGGATGGTCCACGACACAAACTAGAGCAAGAACGAGAACGAGAACGAGAACGGGAACAAGGTGGCGAAATAAAAAAGAGTTCCTCACCTCAGGCTACAGCAACAGGAACGGCTTCGTCATCTAACGCAACCATGTCCGAGCTTAAGCAGAAGCTGTTTGAGGAGGCTCCCGTGCTGCCGTGGGGATCGTTTCTCGACGCCTGGGGCTCCGACGCTGCGGTTCCTGCAAACAACAGGGGACTGGTTCTCGACAACCACTGGGGAAGAGTGGATCCGGACGCTCTCATCTCTACCGAGAAGATGGCGGAGATGCAAGTGAGAGCATCGTACTACCAGCCTTTAAAGTCGGAGTTACGTCCTTGCTCGGCACCGCTGAGGAATGGAGGCCTTTGCCAGAGACGAGATCTCCGAAAGTGCCCGCTTCATGGCACAATAATTCCGCGGGACGATAGAGGCAATCCTCTCGAGGAGAAAAGGGCTGTCGAAGCCAAGGGGAAGGAGAAGGCGGCGGTCAGTCCGGCAGCTTTGGCTGCTCAAGCCGTAAGGAACGTGAGAGGCAGGGATGAAGCCAAAAGGAAACAGAATAAACGTTTGCGACAGTCTCAAGCCAGGACAGACAGACAACACAACGAGGCCGTGCTGAGAACTGCCGCGCTTGCTCACGACACGCAGACGATTGAAGCAGGCCTAGAGAGGAAAAGCCTGGATGAAGAAACGCCAAAGAAACGAAAAGGTGGTCTCAGCGCTATGCTCCGTAAGAAGGAGACTCCAAAAGACAGAATTGCCAGGAGACTGCTGCGCGGCCGGGCAGTGGACGCTATGGTCGGCAGCATAGCTCGAGACGAGGATGCCAAGTACAGGGAGTCTTTCCCAAATCAGTGGTGATTCCACTCGGAAGCTGGCGCCGCTGATTCCCGCTTTAAGCAGTCCTTTTGCTGGCAGTCTGGGACGAGCTTTACAACTGGA
CATCATCAAAGCAAAGCCGAGCCGAGGAAAAGAAAAGAACGAGTCATCCGCAGCTCGAAAAGAGAGTTAAATTGTTCGAAGGAAGAAGACGAAAATCGAAGCAGCCTGTCTTTATAGA\n>MF497935.1 Uncultured bacterium clone Ant5 16S ribosomal RNA gene, partial sequence \nAGTGGCGGACGGGTGAGTAATGTCTGGGAAACTGCCTGATGGAGGGGGATAACTACTGGAAACGGTAGCTAATACCGCATAACGTCGCAAGACCAAAGAGGGGGACCTTCGGGCCTCTTGCCATCAGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAACGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGGGGAGGAAGGGAGTAAAGTTAATACCTTTGCTCATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATCTGATACTGGCAAG\n>XM_053485329.1 PREDICTED: Clarias gariepinus hook microtubule-tethering protein 3 (LOC128512176), transcript variant X3, mRNA \nGCTGTAGCTGTGGCTTCGCCGGTGGAGCGGGTTGCGTGTGTCTCCACGTATTTGTTCATCAGAAGACGGATTTTATTGTTTTATATTGAAAGGTGCGATAAGGGAACATAACCGGAACGTGTTAAAACGTGTTTAAATTACTCGGGGATATATTGTGATATTTGTTTCGTTTGATCAAATCGTTCCTAGTGATTTTTTAGAGGTGCTCTCTCTGTTTGTTTGTGTGTGTGTGTGTGTGTGTGTGTGTGTCTGGGTAAAGTCACGGGCGGATTAAAAGCGAGCTGCGATGAGCACTTTGGACGCAGTGGATCGGGTCGAGCTGTGTGAGAGTCTCCTAACATGGATCCAGACGTTTGGCGTGGAGGCGCCGTGCAAAACCGTGGAGGACCTGACGAGTGGCGTGGTCATGGCGCAGGTTCTGCAGAAAATAGACGTGGTGTACTTCAGCGACAGCTGGCTGAGCCGTATCAAGCCCGAAGTGGGGGATAACTGGAGGTTAAAGATCAGTAACCTGAAGAAAATATTAAAAGGCATCCTGGATTACAACCATGAGATCCTGGGGCAGCAGATTAACGACTTCACTCTGCCCGATGTGAATCTGATCGGGGAGCACGCAGACGCAGCAGAGCTCGGCCGCATGCTGCAGCTCATCCTCGGCTGCGCGGTCAACTGCGAACAGAAACAAGAGTACATCCAGACCATCATGATGATGGAGGAGTCCGTGCAGCACGTCGTCATGACGGCCATTCAGGAGCTCATGAGCAAAGAGACGCCAGTTTCAGCCGGGAGCGACTCCTACGCCGACCTGGACAGACAGCTGAAGAAGACGGCGGAGGACCTGAACGATGCTCTGGCTTCCAAAGAGGAGATCGCTCAGCGCTGCCACGAGCTGGACATGCAGGTGGCGGCCCTGCAGGAGGAGAAGAGCAGCCTGCTTGCCGAGAACCAGGTCCTGATGGAGCGCCTTAACCAGTCCGACTCCATCGAGGACCTGAACAGCCCGGCAGGAAGGAGGCACCTCCAGCTCCAGGCACAGCTGGAGCAGCTGCAGGAGGAGACGTTCAGGCTCGAAGCGGCCAAAGACGACTACCGCATCCGCTGTGAGGAGCTGG
AGAAGGAGCTCCTAGAGGTCAAAGGTCAGAACGAGGAGCTAACGTCTCTGGCTGACGAAGCCCAGTCACTCAAAGACGAAATGGACGTCCTGAGACACTCGTCTGATAAGGTGGCGAAATTGGAGGCGCAGGTGGAGTCGTATAAGAAGAAGCTGGAGGATCTGGGGGATCTGCGGCGGCAGGTGAAGCTGCTGGAGGAGAAGAACACCAGCTACATGCAGAACACCGTCAGCCTGGAGGAGGAGCTACGCAAAGCTAACACGGCCCGCGCACAGCTGGAGACCTACAAGAGACAGGTGGTCGAGCTCCAGAACCGTTTGTCCGAGGAATCCAAGAAGGCCGACAAGCTGGAGTTTGAGAGCAAGCGACTGAAGGAGAAGGTGGATTCACTCCAGAAGGAGAAAGACCGGATGAGGACGGAGCGCGACTCTCTGAAGGAGACGATCGAGGAGCTGCGGTGTGTTCAGGCCCAGGAGGGTCAGCTCACCTCAGGTCTGGTTCCACTGGGCAGCAGCGAGGCTGGTTCACTAGCGGCACAAATTGTGACCCCAGAGATCAGGGAGAGGTTTATTCGACTGCAGCACGAGAACAAGATGCTGAAGCTGAATCAGGAAGGATCTGACAACGAGCAGATCGCACTCCTGAAGAGTCTGCTGGAGGACGCAAACGCCAGGAAGAACGAGCTGGAGTCGGAGAACAGGTTGGCGAATCAGAGGCTCATGGCCGGTCAGAGTCAGGTGGAGGAGCTGCAGAAGAGTTTACAGGAGCAGGACTCGAAAGCAGACGACTCGGTTCTGCTGAAGAGGAAGTGCGAGGAACACTTAGAGAAATTGAGAGACGCGTCCAACGAGCTGCAGAAGAAGAGCGCCATCATCGAGGAACTGGAGCCCAAATATCACGCTGGTACTCAGAGGATTGAGGAACTGGAGGAGGCTCTGAAGAAGAAAGACGACGAGATGAAGCAGATGGAGGAGAGATATAAGAAATATCTGGAGAAAGCAAAGAGTGTCATTCGGACTTTGGACCCGAAACAGAACCAGGGTTCAGCTCCTGAGGTTCAGGCCCTGAAAAACCAGCTACAGGAGAAGGAGAGAATGCTGCACTCTTTAGAGAAAGAGTACGACAAGGCGAAGTCTCAGCGAGACCACGAGGAGAAGCTGATTGTATCCGCCTGGTACAACATGGGCATGGCTCTCCAGAAGAAAGCAGCGGAGGAGCGTTTAGCCAGCACGGGTTCGGGTCAGTCGTTTCTGGCGCGTCAGAGGCAGGCCACCAGCACACGGCGCTCGTATCCGGGCCACGTGCAGCCCGCCACAGCCAGTGATGTAAAGGCATGAGGTCGAGGCGGCGCGGCTGCATGACGGCGCTCCTTGCATGACCGATTTTGCTCTTGAATAACACCTCAACCAACACTAACACCTCTCGCTTTCTTCCGTCCCCCGGTCCCGCCGTTCCGTCTGCATGCATACGCTGCGTGTGTGAACGTCCGCTGTGTCCCAGCATGCAGCAGTCTGTGGGCGGGGCTTGAAGGTTACCGGAGAGTGACGTAATAATGATGATAATAATAAGTGTTGCGCTGTATTAATACGACAGTCTCTTAGGTCAGCATTTTGTTATTAACTCTTGTCTTCTTTTTCATATTTATTATCACTTTTTTGTTTCCTTTTTTATTTGAATGCAGTGTTATTTTAATTTCATGACCCGCGTGAGCAAACGGTGAGCCTCTGCACGGCACGGCTTCACTTTATTTATTAAATGTTTATTTTCCCAGAGCTCACAGCGCCACCGCTTGGCGGAAACCACGCACGAGAATTACGTTACATTACGTTTCTGTTTTTTCTTTCTGACAGGGAACAGTATTAGGAGGTCGAAAAGAACAGAAAAAAAAGAAACAAGGTCAATAAGGAGCTTAGAAGTAAAATATAAAGTATTTAAGTCCTGGGTGTGCGTATCAGAGACCTGGCAACAGGACAGAAACCACACCTCGTACCAGGGCTCTT
TGTTTTTGTTTTTTTTCATAAATGATTCTATAATATTCGTTTATTAAACATTTATTAACCATCAGATCTGATTGAACAAAATGTTTTGTTAAAAAAGTTAACTATGCCAGGGTTTAGGCTGCTTTCACAGGGTTTTATTTCCCTCCCAAAGAATTATGGTTTAAAATAAGGTGATTTTTTTTTTTTTTTTATCATTATTTTTTTTTTTTTTATAAAAAGAAAAAAAAAGTCCTTTCAAAAGTATGTTTAAATTAAAATAAATGAATGAATGAATAAATAAATAAATACATATATATTGTTTTTTTGACCAATCTGATTGCAGTTGAGCAACTAAATCACGCACAAATTGTTGGTTTCAAATGAGCTTTATTAATAAAATATAGTGTAGTAATATTTAGAGATTTGTCACATTTTAAATGTATTTTTATTATTATTATTATTATTATTATTTATTTTGAGTAATTAGATGCAAATCAGAGGTCCAGACAAGAAAGAAAAATTACACGAGTGTGGGAAAAAATGCATAAGTGAAAATAATGTGAACTATATGAAGCTTTATGATGCTAAAAATAATGAAAATATATAACTCTTTTTTTTTTTATAATTATTATTATTATTGAGCCAATTAGCGGAAATCTGGGACGTCCCACTTCTTTCTCCCACCAAAAAAAAAAAATACTACAAAAGCAAATAACTTGTTTGTTTTTTTTACAAATAATTACTGCTTATCATGTTCAATCTAAATGAATCTTTCGTCGATTACTAGTTACCATGCGTTTATATAAATTAGCTAGCTGATACTAGCAGAGGTTTATAAAATCGTTGTTATGGTTAACGTAATATGACCAGCCTGAAAAAACAAAACAAAAATGAAAGCAGCCTAAAATATCTAGGCATAAAAACCAGTAAGCTGAACCACAGTTGGCTCGATCACAAACCATCGAGTGCTTTTGCGTTGTTACATTTTACACAAGGACACAGAGAGACGACCGAATGACATCATCAGGTCTCTAGGTCTCTAACATGTGCGTCTGCGATACTAAAATATCGTTTCCGCATCCGCTAAGAGGCGTGTCCTGTTTTATTATTATCTATTTACTTTTTTTTTTTACCTCGGATTGATTGATTGATTGATTGATGACTCTGTGGACTAACACACTAAACCGTGTGCTGTTTATTAGCCCTTAAACTTCAAAGTCTTCTGCTGCTTCTTTTCTTCATCACGTCATGACGTCCATTCTTACGCGCCATTTTGTACTGTTTAACGACTTTTTGTTTGAATCTATATTTAGCTTAAGTACATTTGTAAGGGTGTTTGTAAGTCGAGGAACGCACAACGCGTGGACTAGACAACAGTGTTAGCCTATTTAATATGAAATTTACAAAGAAACGTTCACGATAAGAACCGTCCATTAGGAGAGGACCTGCTCTGATCGGACACCTCAAAAGAAAAAAGAAAAAAAAAGAAAAATGACAATGACATTTTGGTTTTTCGAGTATTATTATGGTTGATGTGTTTTTTATGCATAGAAAGATGTTACGTTTAAGTCAAAGTAGCAAATAATCTTTCCATTTGCCAAGTTTTATATTGCTTGTGTACAGTATGTACAGACGCTCTGTGTAAGGAAGAGAAGGAAATTCCTGCTCATTAGTTTGTATAATTATATATATTACCAAAAAAAGAAATTCATCAAGAAGGTGATTGATTTTAGTTTAATTATGTGTTGCGACTCGACGGGAAAATGTGCTTCCTTTGCTGCAAAACTGTACAGTTGGTAATCAAGTTGTAAATAAAGCTTGTATAAAATTCTGA\n>XM_052168617.1 PREDICTED: Apodemus sylvaticus canopy FGF signaling regulator 4 (LOC127673070), mRNA 
\nTTTTAAAGCTTGCTGCCCGCTGCACCTAAATTTAAAGGGCCCGCTGACTTCCAGAAGTTGGTCTGAAGGCAAACGGTGGTTGTATGGGTGGACTGCGTTTTGTCATGGGACCTGTGCGGCTGGAAATACTGCTTTTCATCCTGGCAGCGTACGGTGCTTGGACTGGGGCGACGAAAGAGGAGGAAGATGACACAGAACGTTTGCCCAGCAAATGTGAAGTGTGTAAGCTGCTGAGCATGGAGCTACAGGAAGAGTTGAGTCGAACTGGTCGATCCCGGGAGGTGCTGGAGCTGGGTCAGGTGCTAGACACGGGCAAGAGGAAGAGACACGTGCCTTACAGCCTCTCTGAGACAAGGCTGGAGGAGGCTTTGGAGAATTTGTGTGAGCGGATCCTGGATTACAATGTTCATGCTGAACGCAAGGGCTCACTGAGATACGCCAAGGGTCAAAGTCAGACTATGGCCACCCTGAAAGGCCTGGTACAGAAGGGAGTGAAAGTGGATCTGGGAATCCCTTTGGAGCTCTGGGACGAACCCAGTGTGGAGGTCACGTTCCTCAAGAAGCAGTGTGAGACGATGCTGGAGGAGTTTGAAGATGTTGTAGGAGACTGGTACTTCCACCATCAGGAGCAGCCGCTCCAGCATTTTCTCTGCGAACGTCACGTGCTTCCAGCCTCTGAAACTGCTTGTCTACAGGAAACTTGGACTGGAAAGGAGAAGATCAGTGATGAGCAGGAGGAAGCAGATGAAGAGGAGGAGGAGGAGGAAGAAGAAGAGATAACCAAGACTCCAGGCAGTCCCAAGCATGACCCAGAAGATCTTTGACCCTTACTTTTGAACCCCAAGGATGGGTCATGGAGAGTTGTCTAAAGTCTTCAGCTCTCCCTTCCCCATCCGTAGGCTGTAACTGTCCTTCTCGTATGATCCTGGGGACCCAGAATGGCCACAGGAAAGGAGGAGAAGGGGGGAGAAGCGGAAGCAAGTTTTGCCTTCAGAGATGAGTCACGTGCGGCCACTCAGTGGACCAAGTGTGTGGTGACAGCACTGAAACCTTTCTCTCCCTTTTACTGGCCCTCGCCTGCACCAATTGGTCAGTGGTGTTATGACCTGTGGGAAGGTCACTTTGCTTTTTAAAGGCTCTATTTTAAACCCTTTCAAGAGGTCAGAGAAGAGCTAGAGCTCAGTTGGTAGAGTGCTTGCCTCTTCCGGGCAACGATGGGAGTTGGACCTGATGTGGTGGCACACCCCTGTAATCTGCAGCGCTTGAGAAGTGAAGGCTGGAATATCAGAATACCATCCAGCTACATGGCAGGCAGCTCAGGACCAACCAGAGCTACGTGAGACCCTGTCTCAAAGTAAGAAGCCAAGAAGGGACCCTCAACCAATACGCACTGCGAACACGAGGCTGTGTACCATTAATCTGTCAACAAGAGCAGGACTCTGGGAGCGAGTGCAGTAATACTGGGGTTAGGTGGGGTAGACATGTGGCCTATTTCCTATTTCACAGGTGCCATATTTTCTATATTGCTATTAAACCTTTTATATGTACATCA\n>XM_024925133.1 Trichoderma harzianum CBS 226.95 glycoside hydrolase family 78 protein (M431DRAFT_99295), partial mRNA 
\nATGGGTCATTCGGTGTCTCCAGTCTTGGTTCTTCCACCGACTTTTGAGCAGCATCACAATGGGTTTGGAGTTCAATGTGTGCACCCAAGGCTTTCATGGAGGTTTTCATGCTCGAAAGAGCAAATACGCAATTGGAAACAGACTGCATACGATATCGCAATTTCCTCCAATAGCACAGAGCCTGGCCAAGTCTTTCACGTAGAGAGCGAAGACAACGTTCTAGTACCGTGGCCGAACTCAGAGCCACTCAACTCACGAGCGCGCCGGTTTGTGCGCGTCAGGTGCTATGGCAAATACTCTCTATTCGATGGGCGCGATAATGATTCCGACCATGAGTCCGTGACCGAATGGTCTGCATCGTCTCTTTTGGAAATTGCATTGCTGAGAAACAGCGATTGGAAGGGGAGTATGATCACAGTGTCGGAGCCGTGGCCTCTGGGTCCGGACCTTTCAGCCCGCCCCCTGTGCTTTCACAAGCGGTTTCATCTTTCCCTAAAAGACGGGATGATTGACAGGGGCCGGCTATATGCCACGAGCTATGGCGTGTACAGCGTGCGGATCAATGGCAGAAAAGTCGGCGACCACTGTTTGGCCCCGGGTTTCCAAAGCTACCATAAGAGACTGCATTACCAGATTTACGATATTAAAGATCTTTTGGTAACGCCTGGGTGGAACAAGATCGAGATAGACGTGGCCGCCGGCTGGTTTGCCTCTGCCACCAGTTGGGCCAGGAAACGATTCACCTACGGCCAGAAACTCGGTGTCCTACTTCAGCTAGAGATTTGGGCTGCAGACTCTTCCTTGCCGATTTTGGTGAACACCGACGCGAGCTGGAGCGTCTCCAACACGCCTTTGGTTAGCAGTGAAATACTGGATGGTGAAATCTTTGACCAAAGTCTGAGTGTGGGCTCAAAGCTGGACGACGCTTTCTCGGTCCGAGAGTCGCCTCTTGCAGTGAGCCGGCTCATCTCTCCGGAAGCCCCGCCAGTAAGGGTGGTGGAGAGGCTGGAAGCAAAAGACATATTCAAGTCGCGGTCCGGAAGCGCTGTCATTGTGGACTTTGGACAAAATATCGCCGGTCGTATTTGCGTTAAACAAGTGCAGAAACCTGCTGGCTCTAGAATCACGTTTCGCCATGCCGAAGTCATCCAAGACGGGGAGATTATGTGTCGTCCCTTGCGAACAGCAAAAGCCAGGGACATTATAATATGCGATGGCCGAGAACTCCTTGACTGGCATCCGCAACACACGTTCCACGGCTTTAGATATGTCGAGATTGCGGGATGGAGCCCTGATGACAAGAACTGCCCTCTCACCAAAGCATGCATTGTCGCCGAGGTGATGCATACTGACATGCTGCGTACGGGTTGGTTTTCATGCTCCAACGATGATGTCAATCGACTACATGAGAATGCTCTCTGTAGCATCAAGAGCAACTTTTTGAGTGTGCCCACAGAGTGCCCATCAAGAGATGAGCGCTTTGGTTGGACGGGAGACCTGAACATCATTGCACCTACTGCCAACTTCTTGTATGACACGGCTGGCATGTTGGGAAACTGGTTGCAGGATCTGTACCTCGATCAGATGGAGGGGACCGAATACTGGCGCCAAGGCGTGGTGCCCTTGTTCATTCCCAATTTTTTACTAAGAAATGGCGACGGGGGCCACGGGTGGGATCCGATGCCAAATGGCGTTTGGGGTGACGCTGCAGTTATGGTTCCCTGGGGCCTGTATCGTATGTCTTGTGATGTTAGTTTCCTCTCGAGGCAGTATGATAGCATGGTTAAGTACCTGGAAAATGGCGTGACTCGAGGTCAGGATGGACTCTGGGATCCTGAGCAGTGGCAGTTTGGCGACTGGTTAGACCCAAGAGCGCCCCAGAACGATTCCGGCAGAGGGACCACGGATGGCACATTTGTCGCCGATTGTTTCCTCATTGCTTCCACTCAGATCGCTGGGAAGGTAGCCGCGAAGCTAGCCAAACCGGTTGACTCCTCT
CGCTTCAGAGACGCTGCACTGCGCCTAGTTCATGCGTGGCGGGACAAGTATTTGACCGCGGCTGGTCTCGTGGTTCCAGATACTGCAACGGCTCTTTCGCTCGCCTTGTCGTTTGATCTTTTGCCAGAATGTGGAGACAACTCAATAAAGGCACAGGCGGCCGCTCGTCTGTTCCGACTGGTACGTCTTAATGACTTTAAGCTTACCACAGGATTTGTGGGCAGTGCATTTCTTTCTCGGGCACTCACCCAGTCCGGTGGCGTCGAACTAGCCTACGCTATGCTGTTCCAGAAGAAATGTCCTTCGTATCTGTATCCCATTACGATGGGAGCCACCACGACGTGGGAGCGCTGGGACAGCATGCTCCCTGATGGGACTGTTAATCCCGGTTCAATGACAAGCTTCAATCATCATGCTCTCGGGAGCATCGCAAATTGGATGCACGCTGATGTAGGCGGACTCGAGGCGATTGAGCCCGGCTGGAAAGTATTCAGAGTGAAGCCGCAGCCCAATAAGGAGCTGAGCTGGGCGGATACCGCATTCGAATCAAGGTACGGCCGGATTGAGCTGAGATGGACCTTAAAGGGAGACCTTTTCCGCATGAGATTACGGGTGCCTCCAAACTCTACCGCCGTCGTCAGCCTTCCCAGTGACGGCCGAGAATCTGAGGTGGGGAAGCGGGAAGCTAAAGAGCAAAGATTTGGGTCGGGAGAATACGACTTAAGGTGTCAATTTGTACAAACACAGTGGCCACCAAAGGCACTGCTTCCACCATGGGGAAGAGCAGAGTTCTAG\n>XM_036290224.1 PREDICTED: Monomorium pharaonis uncharacterized LOC118646716 (LOC118646716), transcript variant X3, mRNA \nTGGACATTTTCATATAAGAAGTAATCTCGCAGTTGCGCTGCGTCCGACTACAGCTATCGAACGTATCGGATACGTTCCGTGTAATCGTGTAACAGAGTGAAGATAACGAAAGGGAAAGCGGAGAAAACAAAGAGGATTTTGCACGATATCGCCGCGCCGTTTTTATCCGACCAGTAAAGTGAGCGGATCGAATTGTTCACAAGACCGTTTAAGATCATTTGGGATCTAGCGTGATATATGCGCCGATAACTAGGATTCGATAACGAGCATTTTACGCTCGTGTATAAAGAAAGAAAGAAAAAATAATCGTTCTTTTATCATCGAGGTGTGGCAAAGAGTCGCGTGCTGGGCAGAATTATACCCGTTCGATTCCCTGTGCCGGCGATTTGAAACAAAGTTTAGATCTGTTACTGCCTCTGTTGTAAGGAACAAAATAAGCAACATCCGCTCGATCTCCCGGAGATAAAAGGCATCGGGCGAACAGGAAAGGCAAGGGGAGAAAAAAATGGCAGAAAACGAGAAAATCGTGTCGGACGAACGATTGTATGATTATTTGCGTACGTATGCGAAAAGCATCCAATTGAGATCCCCGAAATTTCACGTAATCGAAAGCAATAAAGGCGATAGTTACATTAGTGTCGTTTATCGCGTCACGATCGAGGGAATCGAGGAATGGAACGAGGCCAAGAAACTCGAGCTCGTTCTCAAAACCACGCGGAACTACGGCATCGACAATATTTTGACCAGCGGCAGGGTCACAGAGCTATTCCAACGCGAGGCATCTTTCTATCAGGACGTGTTGCCTATTTTCAAAGAGACTATGAAGGACCACGGCGGAATGCACGACCGCTTCCCCATTTTATACGACGTCAACGATGAATCCGGAAAAGAGATACTGCTGTTAGAAAATCTAACGCCCCAAGGTTTCGTGATGTCAAAGTCAAAAATTATGGATTACCCGCATCTCAAGTTAGTGATGCGATGTCTAGGTGAATTTCATGCGTATAGCTTCATTACGAAAGCGGCAAATCCGACGGCTTTTGAGAAAATGAGGCAAATGAAAGAACACATATTTCTAGA
AGTAGTAAATAGTGGCGAACAATTAGAGGCTAACGAGAGAATGAAAAAATTGGGAAAAATGCTTTTTTACATCGTGCTTAAAGCTTTAGCAAACGAAGACAAACATTATTCCGAAAGGTACCAACGATTCATGGAGAATATGCCGCAAAATATGTTTGCCGCAACTAATGGAAAAGAAGCTGAACCATACGCCGTTGTAAACCACGGTGATTGTTGGACTAACAACATGCTCTTCAAATACGACCAAGAGAAAAATCCGTGCGACTTGCGTTTCTTAGATTTTCAGTTATGCCGTTATGCATCTCCCGTTTTAGATCTAGTTCATATACTCTTCTGCTGCTGCACGCAAGAAACAAGGAGTAAATGTTTTGATCAGATAATTAAAGACGTATATTACAAAACACTATCTGACACTATAAAGAAGGCCGGTTACGATCCTAATGTACTCTTTTCTTACGAGATATTATTACAACATTTTACCAAATTCGGGAAACACGCAGCGGGAATTGCTACTTTCACTGTACATTATTATACTACTAATGACGTAGACTTCACAAGTGTATATGACACTAATAGGCTCGAAGAAAGAATAGAAAAAGATAGCTTTTACAGAAATATGTTAATAGAGACCTTTAAAGATATTATTGATAGAAATTATATTTAAATTACTACTTTCACAATAACATCGACATATTGTGATACCAAAAGAAAAAAAAGGACTCTTGTAGTTAAAACAAAATGCTTTATATTAAACTTAGACACCAATGTAGCTAATTACATATATTCATACAAGCCTACCGCATCAGGTTAAGAGAATTTCGTTATGACTTATCGTGAATGACTTATTCACATAAATATAATTTATAAAAATTGTATATTTTATGTTTCTGAACAGTTAGAAATATCGGACATTTTATTGTCACTTTTATCAAATAAAAATTTATTAAAATTACTAAATTTTTCTTTATAAATACTTCATTTTGGTCACTAAAAACAATAAGGTGCAATAATTCTTTACACTAAAGTGCCTAAAAATTAACGATGAACAATTTCATTCGGAGAAAGACAAAAATTGTATAAGAGATATATTTTTAAAAAAATGTACAGTCTCAAATATACAAAATAAAGGTAATCTATTACATTGTTTGATAATGAAAGGAATACTAGTTTAATAGTAATGTATCTTAGCTCTTAGTAATAAAGTCTTCTTGGATTATTTTGAAAGAAATTTGTAATAATAAACCAGATAATATTTTCTACTTAA\n>XM_017386452.1 PREDICTED: Daucus carota subsp. 
sativus histone acetyltransferase MCC1-like (LOC108214453), transcript variant X4, mRNA \nGAAGGTTTGTTGGTTATTTTTTAATTTTCTTAAAAATTCTTTATAGTACTCCCGAGAAGAAAAAGAAGCCCGGTTGCTTTGTTTTGGCGAGGGAAGATTGAAGAACCAAAAAACAAGAGCTGCATCGAATTCTGCATATACACAACAGATTCATCTACTCGACATCTTTCAAGTTGTTAGATCAAACATCAATCGGATTCATGAGCAATCCTTACATTTCCCCCAAATTCAGGTTACTAATTAGTACAAATTCACTTCATCTCTGAATTTCAATCGCATCGATGGTGAACCTGTATAAACCGCCTTGTGCTAGTATCTTTTATAGGCCTATTAGGCCCTCTGATTTGCAGCTTCTCGAGAAACTCCATGCCGATCTTTTTCCTATCAGATATGAGTCGGAATTCTACTTGAATGTTGTTCATGGTCGTGATATTGTCTCCTGGGGCGCTGTTGATCGGAATCGCTCGGATGGTCTAAGTGATCAGCTTATTGGATTTGTCACTGCCAGACTTGTTATGGCAAAAGGAAGTGATGTGGAAGATATACTCAGATTCGAAACGTCAGAAGCAAACCAGACTCTAGTTTATATTTTGACACTTGGAGTGGTGGAATCTTATAGAAATTTTGGCATTGCCACTTCATTAATCAAAGAGGTTATCAAGTATGCTTCAAACATTACAATGTGCCAAGCAGTTTACCTACATGTGATTTCCTACAATAATTCTGCCATCCATCTTTACGAGAAAATGTCCTTTCAGTGTGTACGGAGATTGCACGCTTTCTATTTCATCAACGGGCAGCATTATGATTCATACCTGTTCATATATTATGTAAATGGTGGTCGATCTCCTTGCTCGCCATTAGAACTTGCGACGATTTTCATTGCTTACATAAGGTGTGGATTTAAAGCAGCTGCATCAAAGTTATGGAGGAAGAAAGATAAGAAGGTACCTGTGTGGATGAAGTGTAAAGAAAGCAGTGGCCTACTACCAACAACGCAAAACAAGAGAATCCTCACAAGTCACAACTGAGGTTATTGTGTCAGATTGTTTTAACTTATAATGATCTTTTCACTGCTGTAACACAAGATCAAATCCCGATAGTCAATTGTATCTTGTTCTTGGAAGTTTGTTTCTTTTATTTATTTGATCAACTTCATAGTAGCCTTGACCATGCTCTTATGTTGCAAGTGTATGTAGTTGTTCCTCCTTTTCCCAGAGTTGGACACTTAAATTTCTATCTAGACAGCAAAGCTCAACAGTAGATTTTTATTCTTCAGTTCCATTGTCTCCGCCACCCTCTTTGCAATCCCTAGTGAGTGAACTAAGAAAATGGTATTTAGTGTTGCCCCCCCTTCTTTCTGTGCTCCACTTTCTTTAATAATCACAGCAAGGTAGATAAATATATCAGATCGGTAAAATAATTTCATATATTTGGCCCTATGGTACAATAGTGAAGCATTTTTTCTTGACTCGTTCCATAAGCATGACTATACCATTGTGCATTATGTTTGTATTAGTAAAGATATCTTTATCTGACTGATTCTGCATAGATTTCTGTATATAGAATATAGAATGCGAGAGGTTGATTCCATATGAAGTACGCTTGTTTTCATATTTCCTGGAATGTTAAATTGAATAAATCAATTTTGGATACTTTATGCCCACAACTAAACAGGAACACCCGTGAAAAAAAAAAGGATTTTGTGAAATTCATTTATGAAAGAAAATTGAAAAAATGGACAGATTTAGTTCTTTTCAGTTGGTACTTGTTCTCTCCCTTAAACCGAGCCTTGATCGTTTGTCTTTGAGCGCATTTGTTGGTAATATTGAAAAGCCTGTCCTACCACAATTGTCCTATACTTGCTGGTAAAATTAATTTGTCAATCCTATGGTTTGGAAATATGAATG
AGCAGCAAAAGTCTTGCCTGAAGTTCTTTATTAGGGTATTCTGTTAGAGCCATGAGTGGCTGATTGGTGGCTTATGTAGAGACTAGAGAGAGATACTAGCTCGTGGTGACCAAGAAGTTAAAGAGCATTCCAATTTTCAATGGATGAAAGTGACCGTGCTCAAGGAAACAAAAGAGGCCGCTCAAACAACTCTTTGGAATATTCATTTTGAAAGATACGGCAAGGCAAAGCTGCCTGTGCTGAAAGCAAAAGTGTGGCTGTAATTGCTATGGACGAAGGAACAGAATGGAAGAAAGCATGAAATGCTTTGTGCATAATTTTGATGGTGAGCAGCTGGTAATTGTGGAGGTTGACTTATTGGATGAGTTTTAAAGGGACTGTGCACGCCTTTTTCTTCAGGAGGAGTAGGTAATGTCCGGATTATTAGTACCTTTACCACCAAAGAAGATAGTTGAGAACTTGAGATTATATGGTGATTCATTTTGTGGCAGCATTAGCCGAGACTGTAACAGATCCACAACGTTTAGGATTTTCTTTTAGACTGATGATCAATGCGGGGAAGTTCTGACTTGAAACTCGGGCACAGGCTTCCATGCTCGTGATATTTATGAATGATATCATTATTCATTTTTGATTTACAACTGTTGTTATTATA\n>XM_052334290.1 PREDICTED: Diospyros lotus succinate dehydrogenase assembly factor 1, mitochondrial (LOC127799971), transcript variant X1, mRNA \nATGCCCACGGAGAGAACACACGAGAGTGAAGATTTGGAGGGAAGAAGAGTCCTGCACCGCCCGGTGAGCCCCTCCGTCGCTGCCGCTCACCTCCGTCGCCGGTCTCATCTCCATCGCCGGCGAACAGTTTAGTACCGCCACTGCCGACTGCCACCGCCACCGCCCCTGCAAACAGCCAAACACAGGATTGCTTTATTTTGTGGAGTTGCGGAGAAATTATCTTCAGTATTTGTGCTGTGTTAGGGTTCACAGAAGAAGCAAAATAGATACGCAGTATTCCCCAAGCTGCATACAAGCAGAACCGTTCATCTACAACAATACAATACACTGTGCACCATCATATGGTTAAGCAAACATCAGGGGCATTATTTGAAGGGAATTCAGGCTGCGGAACACCAGGGGACAAATCAACTTCTGCCCTAATTTCCAGATCCCCGTTTCCTTCTTTTGGCTGAGCAAACAGCAGGGGAAAAATCGAGAATGGCTCGAAGGGAATTCAGGCCGCTGAATACCATCTCTGAATTCCAATGGTTTGTGTCGTTCTTCGCATTCTGCAGTGGCATTGATTTATTCTGGTTGGTGGCTCCTTGATCTCCTGTGAACTCCAGAGCTTTCAGTGGAAGGCAAAGAAATACAAGAGAGATTGCAATCAGGAGTCAAGAAGTGAACAAGATGCAATGGGAGGTTCTAGTGGGCCAAAGCTTTCTGGAATGCAGAAGCAAGTGCTTGGTCTATACAGAGGGTTTTTGCGAGCAGCGCGTGCCAAATCCCCTGAAGATCGATCCCGAATTGAATCAATCGTGTCAGCTGAGTTCCGTCGCAATTCGAAAATAGTAGACCGCAAGAATTTCACCTACATCGAGTACTTGCTTCGGCTTGGTAAGAAACAGCTTGAGCAGCTTCAGAGCCCGGATACCATTGGATTGTCACACTTGAATGTAGAACTCTCCCACACTAAGAAGTCCTAATCCCACACTAAGAACTCTTGTACCTTACCTTAGGATGTATCCTAAAGTTTTGTCATCCTCTGGTCTCTGACCGAATGTTTTTTTGATTACTCAAAACTCATGCTTCTCCAACTCCAAAATTCAAAATAAATGTTTTATATGAGAGCTGCAA\n>XM_028897914.1 PREDICTED: Prosopis alba SWR1-complex protein 4 
(LOC114713302), transcript variant X2, mRNA \nCCAAAAAAAAAAAAAATCCCCACCCGGTGTTTTGTTTCACCATTTCCGACGTTCTTCGTCGTCTCTTCCTCCCTCCTCTTCCTCTTCGTCGGCAGCTGTCCCACGTCGGCCGTCTTCGTTGAACTTCGCTGGCTTTCATTACTCTCCTCTCTTCCGCTGCTCCGTCTAAGTGCCTCCCGTTGATATACTCCAAGTTCACCAGCTAGGAAAAATATTGAGAAGACCTCAGTTCCTGAAACTGAAGACTGAATTCTTGAATCGAAGTATTGGAAAAAGCCAAAATTTTGACAAGATTTAGAAACCCTGTTTTACATTTATGAGATGTGCTTTTTTAATTTATGTTTTTTTGGTTGTACATAAATAAGGTGGATTAGCTTGGCCCTAGATTTCCTCTGAAACTCCCATGGATGCCAAGGACATCCTTGGTTTGCCCAAAACCTCCTTGCCAATTCAAGAGAAAAAGTCTAGGCCCCAAAAAGATTCACAGAGAAAACCAGATGGCATTTCACGGGAGGTATATGCACTCACTGGTGGTTTGGCGCCTCTTATGCCTGCAATTGATTCGTCTCAATTAAAGAAAAGGCCTCCATCTGACGAGAAGATCACTTGGCAGTGGCTTCCTTTCGCCAATTCTGCTCGTAAAGATAATCTTCAACTATACCATTGGGTCCGAGTTGTGAATGGTCTTCCACCCACTGGGGACTATTCTTTTGCCAAGTATAACAAGTCTGTAGACATTATCAAATACACAGATGAGGAGTATGAGAAGTATCTGACGAATCCAATGTGGACCAAGGAGGAGACGGATCAACTCTTTGACTTGTGCGAGAGGTTTGATCTTCGGTTCATTGTGATAGCTGACAGGTTCCCATCATCACGAACTGTAGAGGAATTGAAAGACCGATACTACAGTGTATCTCGGACTCTGTTAATTGCTAGGGCTCAATCTTCCGGGGATGTTGCAATGCATCCTTTAGTTAAGGAACCATACAATGTTTCACAAGAGGTTGAGCGGAAACGAGCACTGTCTATGTACCTCTCTCAAACAAAGCAACAAGAGCGAAAAGATCAAGAGGTTCTTGCTGAGGCAAAAAGAATAACTGAATCACGCATGCCTGCTAAGGTTGCTGAAGAGTCTGAGGCTGCTGCTGCATCAAATGCTGGTGCGGAAGAGAGAGCTGTCTCCGGTGATCCTCCATCAAGTGTTCAGCTTCCATCAACGGTTGTTCCATCCACAACAGCAGATAATGCAGCCACTCTTGCTTCCCTTCGCATGCTTCGTGTGTATCTAAGAACATATGCACTTGAGCAAATGGTCCAAGCTGCAAGCTCATCTGCTGGACTACGGACCATCAAACGGGTGGAACAAACACTACAAGAACTTGGGGTTAATTTAAAACCAAGGGTTCCAACCAAAGCTGTTTGTGCAGAACATCTTGAATTAAGAAAAGAAATACTAACTCTGCTCAATCTTCAGAAGCAGCTGCAGTATAAGGAGGCAGAAGGTCGTGATGGTTCATACACTGAAACACCTGGCACACCGAAGGATAGGACATTTATTCCAGATTCTATGAGTTTTGGAGGTGAGAGGATTGGTAAGAGGGACCAGAAACGCAAGGCGCCTGGGAGGATATCAGAAGCTCCATCATCACCGGCTCAGTCTAAAAGGCCTAGAAAACTGAAGGCATCTGATCTATAGTCCGGTGGTGTAATGGGAGAATATAGAGTTACAGAATTCTGCTAACGAGGATGAGGAATGCAGGGTAAAGTAGGTGTAAGCTCATGGCCCAGAAATTCAGAATTTCCAACTGAAGTACTTTGTTTCCTTTTGGGCTGTTGCCGGTCACAGTATCTAGCGTAAGATGGAGCACAAATAGTGATGGAAATTCTGGGTTCTTCTAACTTTTAGGTACCTCGTGAGCTTAACTTTATTTTTATGCTGGCAAAGCTTTGT
ACGGTTGTTAGGTTTTTCTGACCAAATTGTCATTGAGAATTTTTATGTAAATAAGCATTCAGGTGAGGATTGTTCGAACAAATATAGGGCCTCTAAAAAACATGTATTTGTGCCTCGTGAATGGATTCATATCCTAAACTTCTTCAACTAATCGAAGGCTGATATTTGAATGAAA\n>XM_012572725.4 PREDICTED: Taeniopygia guttata EPH receptor A7 (EPHA7), transcript variant X1, mRNA \nCGGGCTGCAGTCGGGGCTGGCGGGCGGCCGGCCCGGTGCGGGAGCCGGGCAGCGGCGCGGAGGCGGAGGAGAAGGAGGCGAAAGAGAAAGGCAGCCTGGAGGGAGGGAGCGCCGAGCCACAGACTAGCACAGCAAATTCTCCACCGTCCTCTAGCACCCACCAAGCGGCGGCAGTGGCAGTATCTAGGAATAGAGAGCTAGAAATATAAAATCACCCCGCTCCTGCACCATGGCTTTCCAAAGTAGGCTCCCTTCTTGGATTATTTTGTGCTCCGTCTGGCTGTTCCGCTTTGCACACACGGGGGAGGCACAGGCTGCAAAAGAAGTAATACTGCTGGACTCTAAAGCACAACAGACAGAGTTGGAATGGATTTCCTCTCCTCCCAATGGGTGGGAAGAAATTAGTGGACTGGATGAAAACTACACTCCTATACGAACATACCAGGTATGCCAGGTGATGGAATCAAACCAAAACAACTGGCTTCGGACTAACTGGATTGCAAAAAGCAATGCACAAAGGATTTTTGTAGAACTGAAATTCACTCTGAGGGATTGTAACAGTCTTCCTGGAGTTCTGGGGACTTGTAAAGAAACCTTTAACTTGTATTATTATGAAACAGACTACGACACTGGCAGGAATATCCGAGAAAACCAATATGTAAAAATAGACACTATTGCAGCAGATGAAAGCTTTACCCAGGGTGATCTTGGGGAGAGAAAAATGAAACTTAACACAGAGGTGAGAGAAATTGGACCTTTGTCCAAAAAAGGATTCTATCTTGCGTTTCAGGACGTAGGGGCCTGCATTGCTTTGGTCTCTGTCAAAGTCTACTACAAGAAGTGCTGGTCCATCATTGAGAACTTAGCTATTTTTCCTGACACAGTGACTGGCTCAGAGTTTTCCTCTTTAGTTGAAGTGCGAGGAACTTGTGTCAGCAGCGCGGAGGAGGAGGCGGAGAACTCGCCAAAGATGCACTGTAGCGCGGAGGGAGAATGGTTAGTGCCTATTGGAAAATGTATCTGCAAAGCAGGATACCAGCAGAAAGGAGACACGTGTGAACCTTGTGGCCGTGGGTTCTACAAATCCTCCTCACAAGATCTGCAGTGCTCCCGCTGCCCTACTCACAGCTTCTCTGACAAGGAAGGATCTTCCAGATGCGACTGTGAAGATAGCTATTATAGAGCACCTTCTGATCCACCATATGTCGCGTGCACAAGACCTCCATCTGCACCACAGAACCTAATTTTCAATATCAACCAGACTACCGTGAGTTTGGAGTGGAGTCCTCCTGCTGACAATGGGGGAAGAAGTGATGTGACCTACCGCATTTTGTGCAAGAGGTGCAGCTGGGAGCAGGGCGAGTGTGTTCCCTGTGGGAGTAACATTGGATATATGCCCCAGCAAACTGGATTAGTAGATAACTATGTCACTGTCATGGACCTGCTAGCTCACGCTAACTACACGTTTGAAGTTGAAGCTGTGAATGGGGTTTCTGACTTGAGTCGTTCCCAGAGGCTTTTTGCAGCTGTCAGTATTACCACTGGCCAAGCAGCTCCCTCGCAAGTTAGTGGCGTAATGAAAGAAAGAGTGCTGCAGAGGAGCGTGGAGCTTTCCTGGCAGGAACCAGAACATCCCAATGGAGTCATTACTGAATATGAAATCAAATATTATGAGAAAGATCAAAGGGAGAGGACCTATTCAACAGTGAAAACCAAGTCCA
CTTCAGCTTCTATTAATAACCTAAAGCCGGGAACAGTGTATGTTTTCCAGATTCGTGCTTTTACTGCTGCTGGTTATGGAAATTACAGCCCCAGACTGGATGTTGCCACACTGGAAGAAGCCACAGCCACAGCTGTTTCCAGTGAACAGAATCCTGTTATTATCATAGCTGTGGTTGCTGTGGCAGGAACTATCATCCTGGTCTTCATGGTGTTTGGATTCATCATCGGACGAAGGCATTGTGGCTATAGCAAGGCAGATCAAGAAGGGGATGAAGAACTTTACTTTCATTTTAAATTTCCAGGCACCAAAACCTACATTGACCCTGAAACCTACGAGGACCCAAATAGAGCTGTCCATCAATTCGCCAAGGAGCTAGATGCCTCTTGTATTAAAATTGAGCGTGTGATTGGCGCAGGAGAGTTTGGTGAAGTGTGCAGTGGGCGTCTAAAGCTTCCTGGCAAGAGAGATGTTGCAGTAGCCATAAAAACTCTGAAAGTTGGCTACACTGAAAAGCAGAGGAGAGATTTTCTGTGTGAAGCAAGCATCATGGGGCAGTTTGACCATCCCAATGTGGTTCACCTAGAAGGAGTTGTTACCAGAGGGAAACCAGTCATGATCGTAATAGAATACATGGAGAATGGGGCCTTAGATGCATTTCTTAGGAAACATGATGGGCAATTTACTGTCATTCAGCTAGTGGGGATGTTGAGAGGAATTGCTGCTGGAATGAGATATTTGGCCGATATGGGATATGTACACAGGGATCTTGCAGCACGCAATATTCTTGTCAACAGCAACCTTGTTTGTAAAGTATCAGACTTTGGCCTTTCCAGAGTTATAGAAGATGATCCAGAGGCTGTCTACACTACAACCGGTGGAAAAATTCCAGTGAGATGGACAGCTCCAGAGGCCATTCAGTACCGCAAATTTACCTCAGCCAGTGATGTGTGGAGTTACGGAATAGTTATGTGGGAAGTAATGTCTTATGGAGAACGGCCTTACTGGGACATGTCAAATCAAGATGTTATAAAAGCAATTGAAGAAGGCTATCGTTTGCCAGCGCCCATGGATTGCCCAGCAGGACTGCACCAGCTGATGCTGGATTGTTGGCAGAAGGAACGCGGTGAAAGGCCAAAGTTTGAACAGATAGTTGGCATTCTGGACAAAATGATTAGAAATCCAAACAGCTTGAAAACCCCACTGGGAACCTGTAGCAGACCAATTAGCCCTCTTCTGGACCAGAACACTCCCGATTTTACCACTTTCTGCTCCGTAGGCGAATGGTTACAAGCTATTAAGATGGAAAGATATAAGGATAATTTCACAGCAGCAGGCTACAACTCTCTTGAATCAGTTGCCAGGATGACTATTGAAATCAAAAACATGCCAGGTGCTTTGCAAAACAGAGAACAAGAAAAATCCCTTTCCAGAAGAGATGACAGCCTGAATAGAAATGGCATAATGGCAGGAGACAAAGGAAGCAGAAAGGGGAAGCAAAACAAGAGTTATAACCATAAGATCATGAGATTGGTTTGGAGGCACAGTGAACGCTATGAGGCATTTTTTTAAAGCCCATAAGGACTGTAGTTGGGATTAGAGAATGGAAATATAGAAAAGAAGCATGGAAAGGAATGGAGAAGAAGGGAGGAACAGACTGGCAACAGGAGGAAGAGTAAACAGAGGTGTATGGGAGAGGCCAGAACACACATCTGACAAACTGAGGATTATGACTAATGACAAGAATGAAAGACCACATCTGAAGAGCATGATGATTTCAGGAGGATGGCGAAGCAGGACATGGCGATGCTGCTAGGGAGAGAAGAGCCAGCAAAGCTGCCCTGGAAGCCTGCCCTGGAAGCTCCTCACACTAACATAACCCTGCTTCCCCATCTTCTTTCTCGCTCCCCTCTTATACATAAAATATGTATATAGAAGAGCAAAGGAGAAGGAGAAGCAGCTAAATAAACTTTTCCAAAGATCGTGCTGGGGAAGAAGTTT
AAGCTGGGATGATACAGATTTGCTCCTCCTGATTATGCTCATGGTAGCGAGAGGAAGAGAGCATTCTGTTAGTCATATTCCTGCAGATGAATCTATATGAGTCTTTGCCTCTGGTTACAAATAGGCCTTGTTGAGAAATAGTCAACAAAATTATAATACTCCAGCCAATCTGGGACATTTTAAAATGTCCTTTCATTCTAGAACAGAAATAAATTACACCACTGACAGTGAAATGGAAAGAGGAAAGAAGAATATTTTAACAGTTTTGGTTTTTTTTTTAATGCTGAAAATAATCATTTTAGTATTATGGAAAAAAAATATAAGGGGGATTTTTCTCATTGTGAAAAAAATAAAGCTTTTAATGAAATTTCTGATAAAATTGGGAATTATTTTAATTATGTAGGACTGGTTTTTCTGTTGGGTTTTTTTTTTTTAGAAAATTGGTATTTTTAGAAGGAAACAGGAAAATTGCTGTGTTCATTCTGTCAGACATTTTAAAATACCCTGATTTCCAAGGTAAGAATTCTTCAGGAGTAAGAAAGCTGAAAAGTGGCCAGTCTAATCTCTTCCTCACTTCCTTCTCCTCTGCTTCTGTGATCAGACGTGTCTAATGATAGTCTGCAGATAGCAAAACCAGTTTCTATGTCTCCCTGAGAAAAGGCATTTTGCCAACTTTAAGAATCTTTAACTGGATCTACTTACAGGAAGTCACTGTTTTGCTGCAGACTATGTGTCCACTTAAATCCCCCTCAAAGCTCTTCCATTTTGCCTGGAAAGGTTTATCAGAAAGCATGCTGGAAAGGCTCAGATCTTTCCATCTCCAGTGAAACTGTTTCTGAACATACTTATAGCTTAGCAGATGTACTGGTATGACAGTTGAGAGACTACTGCTGTTAATGAAGTATTCTATTACCTTGGCATATATAGACACTTTTCACTTGGTACTTCTAACTGCAAAGTATTGATGTTTAGGCTATTATAAGTACTTGTGCGTTATATTTTTTTGGTAAGTTTTAGAGGACAGAACTGCGTAAATATTTCTTCTCTTCAGGGTAAAACAGTTTTCATGAGTCTTGAAATGTTTACATTCATCTTGAATGTACACCAGAGTGATATCAAGTTTGTTGTTGTGACACCTTATCAATATGATGCCCATTTTTAGTTTCTTCTAGCAGTGGAATGATTTAAGTATTGTCTCATGGAGACAACGGCCTTGTTTAAGAATGGTGACTCTGGATAAGATTCAAATAATTTGTCTGAGTGAAGAGGAGGCAACTGAAAGTCATCGCTGAAATATTACCAAAAATCCTTAACTGGTTGGATTTGTCCATCACTTGCTTGAAGATTTTGGTAAATGGTGGTTTACTAGGTTCCCAAATGCCAGCAATGGCCAAGCACTTTCTTTTAATTTTCTTCAATTTGGACTTTGCTTAAGTTAATTAAGCTTTTGTCATCTCAGGGTTCCATTTTAGCAATGAGGTTTACAAGACCTTCTCTGTCAATGTAAAATCTTCCTATACTTAAGAACATATGACATACGGAGAGTAAACTCAATGCTCAGCAGTGCTTGAAGAATGATTCCCACCTCAGTAATTTCTCTCCATTTTTATCAAAATAATACTGGATTTAAATCCTATAGCCATGGTATCAATTTACCAAAATCTTCTCTGCCTAAATTATTCTTCAATTAAATGTAGCTCAAAGTTTTATTACAATCCACCTATCATTTAAAAAATGGGATTGCAAAGTAGTTTCATAGTATCACCCCATAATACAGATTTTTTGCATATTATTTTTACATATTTGAAAGAACTCCATTACTCAGTTGCATATAACTTTTTGCAATAAGAGGCACAACGTAAAGCAATATCAAAACACAGGTAGTATTTCTACTAATTTTATTTAGCCAAGCTCCAGATTTTGCATAATTTTGCCACTGCTTCTGGCATGATAGCAGATATGGAGGTTATCCATGCCTGCCTACCTTTTGGTGCTGAGAT
AGGATTCATCTGTGTGGCACCTTACCACCCTCCGCTACCAAAAAAAAAAAAAAAAAAACCAACCAAAAAAACCAACAAAAAACAAAAATTCCACTGGGAAATTTGGCATAACCTCTGGGAAATTCAGTTTGACCTACCTTCTGGGTTCAGCAACTGAACCGGATGCATGATTTGGGAAGGGATTTAATACCAGCTACCTCAGTAGCCACAAGGTGTTACGGGAAAACGACTGAAAAAATCCAAACTATTATAATGTATCCTGAGACGGAAGGACAGCATGGTCATTTGCCTATATATTTATTTCTAACCTTGCCTACACTTTTCCTCAGAATCCTTCCCTGATATTGTCTGTCAGCTCTTTCAAGAAGACACTTGGTTGTGCATAAAGTAGGAATGGCTGCACTGACTCAAGCCACGAGCCCACATAGTTGTGTGTACCTGACTGTGTGCCTTGGTAGGGGTACAGTCTTGTTATAAGGCCTCCACTGATCCCTACAGATTAGGGAAACCTTCAGCTGTTGACTTCCAGACATCTTCAGGGCTCTATATCCAATATGTACAGTTCAAATGCTTCCCAAATCAGGGTGGTGCACTATGATGAGTAGTCTGAATTTGTCCTATATTCTGTGAATTTACTTCTTTCTTCTGTCAATCTTCTCTCTCTGTCTTGCCCTTCTTTCTCCTGAAGTAGAATGACCAGGGTTGCATGAATTATTCAAAATAAGAGTGTATGATGTATTTATACAGTGATATAGCGATACAGTGTATTTATACTGTGATATATATATATATATATATATATGTTTTCTATTTTGTTTACCGTTTCTTTCTTAATCATCCAAATATCCTGTTTCACATTTTTACTTGATACTGGGTGCTTGACTTGATGTTTTCAGAGAGATGTCTGATGTTATTCCTTATTTTTCCTTCTCAAGCAATAGTTACTTTGTAGTCCCTGCCTGTGTGTGTATAGTTAGACTTATTTACCCCTTGTTCAGTTCTTTCTGTTTTATCAGATTTCATCACTCCTTCATGGCCAAGGGCATTGAAAATTGTGAAATCATTTTGCAGTCCTTTCCAGACAGTTCCTTACTGATTTAACTTACAAAAAACATTTTGTATCAAACTTTCTCATCTGACAGTTCTTAGATATCACGTTTCCCTTTACTACTAATAAAAGTACTTTTGCTTAAA\n>XM_033125297.1 PREDICTED: Rhinolophus ferrumequinum 5'-nucleotidase, cytosolic IB (LOC117033240), transcript variant X2, mRNA 
\nATGAGTCAAACATCTCTGAAACAGAAGAAGAAGAATGAATCTGGAACAAAATACCCAAGAGACAGTCTAGAAGCAGAGAAAAAAAGGGAGTCTGAGAAATCAGGAGTTCGTCTGAACACTCAGATGACGCATGCAGTCACACCGAATCACTCGCTGAGACGTTGCCCCATGCATGGTCACCCGCCGTGTAGAAACTGCCTTAGTGCAGCTGAGGGAACAGTCCTTCTTGGTCCCTGCCGCATAATACACATTTATATTCACATGTGCCTGTTGTGGGAGCAGGGCCGGCAGAACAGCATGATCAGGGGATCACAAGAATTATCATTGCCAAAGACAGATTCTCGTGGGTACATCGTGCGAAGTGAGTGGTCCCGAACTTCACGGAGCCCATCCAACAAAGCCCCATCAGTAGACGAGAACAGAAGCAAGTCTGCCAATCTTAAGGTCCCCAGTAGCTCCACCACGTCCCGCACTTCATCTGCCTCCCCCAGCCAGCAGGACTCTCAGCAGGAACTGTCCACGCAGCCCTTCCCGCCCACCCCACCCGTGCCACCCACACCACCAGCGCCTACAGACTCCTTCCCTCCCACACCCCCGGAGCCCCAGCCCCAGTCCGTGTCCCAGCACAGCAGCAAGATGCATGAGAACACTGACACCTGGCCACATGGCATTCCGCGGGAGATGCGGGACCCCCGGGACCCCAGGGACCCCCGGGATCCCCGGGAGATGCAGCAGCGAGAATATCCCCGTACACCCCCCACTGAATGGAAGCCCTATGCCCAGCGCAAGGCGCACTACTCCTCCCAGCTGGACCGCGACTGTATGTCTGACCTGCCCCGGCAGCGGGAGGAAGAGGACGACAATGAAGAAGCCTATTGGTCATCCGTGAGGACACTGTATGAGAAGACCCCAAGCTGCTCGCGACCCCGGCCGCCCAAACCCAAGCACGCCATCACCATCTCTGTGTCATCCCGAATTCTCTTCAACATGATGGACGGCAGGAAAATCTACGAGGAAGAGGGTCTGGAAAAGTACATGGAGTATCAGCTCACCAACGAGAACGTTATCCTGACTCCAGGACCCGCATTCCGCTTTGTCAAGGCTCTGCAGCATGTCAATGCTAGACTCCGAGATCTGTATCCTGAAGAACAGGACTTATTTGATATTGTACTGATGACTAATAACCATGCCCAAGTGGGAGTGCGGCTTATAAACAGCGTCAATCACTATGGCTTACTAATTGACCGCTTCTGTATGACTGGTGGAAAAAGCCCTGTTGGCTATTTGAAGACCTATCTTACCAACTTGTATCTTTCGGCGGATTCTGAAAAAGTCCACGAAGCAATTCAAGAAGGGATCGCCTCTGCAACAATGTTTGATGGAGGCAAAGACATGGCTTACTGTGACACACAGCTCCGTTTGGCTTTTGATGGAGACGCTGCCATCTTCTCAGAAGACTGCGAACATCCTACCAAAGACCACGGGATGGACAAATTCTTTCAACAGGAAACACAACATGAGAATAAATGCACGGCTCAGGGTGCCTTGAAAGGCTTTCTGGAAGAATTAGGCAGACTGCAAAAGAAGTTCTATGCCAAAGACCAACGGTTATGTTGCCCCATCAGAACTTACCTGGTTACAGCCAGGAGTGCAGCCAGTTCAGGTGCCCGAGTGCTGAAAACCCTTCGCTGCTGGGGTCTAGAGATAGACGAAGCTCTTTTCCTTGCTGGAGCCCCCAAAGGGCCCATCTTAGTGAAAATACGGCCCCACATCTTCTTTGATGACCGCATGTTCCAAAGTGAAGGCGCACAGAAATTTGGCACAGTCGCAGCTTATGTACCTTATGGCGTTAATCAAAAAATGAACAATTAG\n>XM_037725972.2 PREDICTED: Dermacentor silvarum acetylcholinesterase (LOC119465175), mRNA 
\nTGCTGGTGAAACACGCAGTGTCGCAGGAATCCCGGCTACCACTAGCGCATTGTCGGTTGTACTGGCCCAGAGCGTTTTTTATCTGGATAGCCGCTCGGGTCCCGGAATCGATATTAGAGGACGAGGCTAAATCCTCAACGACCATAGAAATGGCGACCAGAGCAGCCCTCCTGGCGGCCATTTTTCTCGCCGTCATGCTCATTGCCATGGCCGACGATGCATTCGTCAAGAAGCAGACCACGGAAGGCATGGTTCGCGGCAACGTGATCCGCGCCCTGGGCAAGACTGTCGAAGAGTACCGCGGCATTCCGTTCGCCGAGCCACCTGTAGGAAAGCTCCGGTTTCGGCCTCCAGTTCCAAAAAGACCTTGGGAGGGCACCATGGATGCAACCGCTGGAAACACAGCCTGTCCTCAGGTGCTGGTGGAAGGAATCCCGCTAGGCAACCTGAGCTTCACAGAGGACTGCCTCCAGCTGAACGTATGGGTCCCAGAGGTCGCGATTACCCCAGGTTCGCGTCGGCCTGTACTTGTGTGGATCCACGGAGGAGCCTTCACCTTAGGCAGCGCGAATATGGCGAACAGTAGCGGCGTCTTCCTCGCCGCGCTGGGCGATGTAGTCGTCGTGTCCGTGAATTACCGTCTTGGCATCCTGGGCTTCATGAACGCGAACTCTCCTGAGGCGCCAGGCAATGTTGGCCTCCTGGATCAGAACATGGCTCTGAAGTGGGTGCAGCGGAACATCGGACATTTCGGAGGTGACCCCGAGCGAGTGACGTTGCTCGGGGAGAGCGCAGGCTCAATGAGCGTGCACGCGCAAATTATGTCGCCATTAAGCGAAGGCCTCTTCAAGAGGGCAGTTTTGATGAGCGGTACCATGTATAGCTTAGACACGTGGGACACAGTTCCGGAAAGCATGGTCAAGGCAGACAAGGTCGCTAACGCTGTTGGCTGCTCCAACGGTAGAACCATCGAGCTGTCATCTAATGCGGAAGAAATCGTGGACTGCATGAGAAACAAATCCGCTGATGAGCTCGTCATGGCTTCTAAGGAGGTGACGGTACCAAAGCTGGCCCCATTTGCGCCTACTTATCACAACGAGTTCCTTCCCCGAAATCCATTCTTGGCCCTGAAGCGTGGTTTCTTCTCATCTGTGGACGTCTTAGCTGGCGTAACTTCAGACGAAGGAGCTGCGTTTCTCCTGTTCCCGTTGGTTCACGAGCTTTTGGTGGAAGACATTCGAGGTTCGCCACCAGAGGAGCTTATTAGGTCTCTTCGCAGCGCATTATGGCGAGTGCTTAAAGATGACATACCGAATACATTAGAAATGTACACCGAGGAAGCACCAAAGGACGATAACAACGCACTGAGACGCCAATACATCGACTACGTGTCCGACAGATTGTTCAACTGCCCTCTGCAGTTCTTCGCGGAAAATCACAGCCGAAGGGGCAACAAGGTTTTCACGTATGTGTTCGCCGACAAGCCGGAGATGTTTCCACTGCCTGGGTGGATGGGAATGCCCCACGGCATCGACGTAGCCTTCATGTTTGGTCACCTCTACGCAGCAAATCCTGATTCGCCAGATGGTCGCATCTCTGAGGTCTTTATTAGACTGCTGGCCAGCTTCAGCGAAAACGGGATTCCCGAACTTCCCAACAATGAGACGTGGCCACAATACAGCAAGGACTTGCCAAGCACAATCGTTATGAAGAACGGCCTATTTAACGAGACACAGGGATTCCGCTCAAGCTACTGTGAACGCTGGAGGCCTTTGTATTAAATGTGTCACTCCACAA\n>HQ089085.1 Uncultured Arthrobacter sp. 
clone F5OHPNU07H9DXX 16S ribosomal RNA gene, partial sequence \nGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGTCCTATGTTGCCAGCGGGTCATGCCGGGGACTCATGGGAGACTGCCGGGGTCAACTCGGAGGAAGGTGGGATGACGTCAAATCATCATGCCCCTTATGTCTTGGGCTTCACGCATGCTACAATGGTCGGTACAGAGGGTTGCCAACCCGCGAGGGGAAGCTAATCCCACAAAGCCGATCGTAGTCCGGATCGCAGTCTGCAACTCGACTGCGTGAAGTCGGAATCGCTAGTAATCGTGGATCAGCATGTCACGGTGAATACGTTCCCGGGTCTT\n>XM_026579881.1 PREDICTED: Papaver somniferum tRNA-specific adenosine deaminase TAD3-like (LOC113333371), transcript variant X2, mRNA \nCCAAAATATTGCGATGAAGAAGTGGGAAATCCTTCACATCCCAGACAAGATTCCGTTTAAACTTGATGAACAACCCACGATCGACGTCTTTGCTTCAGTTATAGAGCCAAAGCTTACCGATACTCTTGAAGTTAAATAAAGTTGCACCAATGGAGATTTATCGACATATTAAGAGGGTGTGGAAGAAGAAATCCGCGGAAGGAGGGGATTTTCAGTTAATACTGATTTTATGTCTTGTTGGTGAGAATAGGAATGAGTTGGAGAGTATACCTGATGATGTACTTGAGTTGATAAATGCCCACCAGTTGAATCCATATATTACAAAGGTCCATAGGTATGCCGCGATATCAAAAGAAGAATGGAGAGAACAATGCAGACTTTGGCCAACATCTTATCATCCGCCAACCTACAATATTGAGGGCATTACAGGATTTAATGAGGAGGATTCAGAATCAATATTCCACTTCATGAAGATGGCTCTTGAACTAGCGAAAGTGGGCCATTGCACCGATGAGGTAGTCAATGCAGCAGTTATAGTAGATCCTTCAACTAGGCAGGTGATTGTTAGGGGCAATGATCAAACATGTCAGCCAAGTACATCCACAGTGAGTAATACCAGCTTCGAATGTGGTTCCGTTGAACAAAAGGGTTTTGCTACTTCCCATCAATCCGATGCAGATGCTGTAGCAATCAAGGAGACTCTGTTTTCCATCTCCAGTTTTGCAGTTGCTGAAAATAAAGAATCATATACTGGCGTTTCTTGTCTATATCCTTGGAATTGGACTGAGCAAAACTCTATTGCTGGAAACACATATTCCTGGCATCCTCTGCAGCATGCAGCTCTTGTTGCCATTGAACATGCTTCCTCTAGGGATAGGCGCCTATTTCCTGGGCCGGTGGATCCTGAAGATCAATCTATCAATCAAGTGGATCACACAATCTCTTCTCCCAATAGCTCACCAGCCAAAAGACAGAAATTTGATTTGACAAAAGATGTCAAGGTTCTGAAAGCTTGCTCTAATGGTGATTCTCATTCTGAAAGGGGTGAAAGGCCTTACTTGTGCACTGGTTGTGACATTTTTGTCGCTTGGGAGCCCTGTACGATGTGTGCAATGGCACTTGTTCATCAAAGAATTCGGCGAATATTTTATGCTTTTCCGAACCCTAACTGTGGTGCACTAGGCAGTGTTTACAGACTACAAGGAGAGAAAAGCTTGAATCATCACTATGCTGTTTTTAGGGTTCTATTACCGGAGGAATCCTTGGAAACATGACATGGAAACCACATCTCGATGATGTCCAACAAATGTTAATCTAATGTTGTTCTACCATACAGTTTTTCCAAACGAAGGATGGTAAAGCTGAAGTTTATTGGAACACCCTTATGTCTGCAAGTGAAGGTTTTGATAGAGAGGTGCTTGGAACTTGCCATTATTTATTTTTCTTTGTTTTGATGTAAACTTATGTTGTGTTG
TGCTATTATATAAACATCAATGTTCATAGTTTTTCAGAATACACCGTTGTAACTGTGACCGTTAATGCTTA\n>XM_020573339.1 Polysphondylium pallidum PN500 hypothetical protein partial mRNA \nATGAATAAATCTATAATATTGTTTTTATCTTTTCTAATAAATATAATTGTTGTTGTTAATGGCCAATGGCATATTGAATTCGAATATTCAGCTGCTGGATGTGGTGGAGTTCTGAATAGAGCCTCATCATTTTTGAATAATATGTGTTATAATTACGATAATGGTGGTCCATATTCACATAGATACATTGTATCTGGATCTACAACACTCCGTCAAATATTCAGTAGTACTGACTGTTCAGGAGCTCCAACTACACAAGCTACTTTCGCTGGAAATACATGTTATGATAATTTAATGAAATATGCAATAGTAAATGAACCTGCTATTTCGCCAGGTGGTTGGATTTCATTAGAACGTACTCCTGGAAATGCTTTATCTGGTTGTGGAGTTTATGAAAGTGAAAGACATATTTTTAGATTGGCTACTTGTGTCAAGACCTATGATCTTCCTAATTTTCCTTTCAATACTTATTTTAGTAGTGGTTCGGTTGGCCATGTTTACAATTTAGTGTGTCCCAATACTCTTTTCAACTTCCAACCGTGTAGTAGTGATCCCCAAAGAATTACATCAATATTAACACCAACCATTTCCTATTCAATAACCAATCCAACTCTTATCAATTCCAATACAATTCTTTTAAATCCTTTTACCAGCAACTTTAAATATACATACAAATTCCTTACTGAATATTTTAACCCCAACACCGGAAGTTTTGTCGTTGCATGCAATCAATATTCATCACTGGCATGTCAATTCTCTGTTCCAGCTGGAATTCCTTACACCTATGTTAGAGTTAGAGCTAACGGTGATGAATCATTAACTGCTGCTCCTATTTATACATCACCTAATTTTAATTTACCAATGCCACCTGTTATGAATGCAATTAATTCAATCATTACCACTACAAAATCTGTACAATTTTCATATTCTGCTACCAATTCCCCAACTTCCTATACTGTCAATGTGAATAGTGTTCCTCGTCCTGAATGTTCTGGTTTAACTACTTGTAAAATAAGTGGATTGACACCAGGTTCTCCCTATTCTATTTCTGTCTCTGCTACAAATGGTTATGGAACATCAACTCCTGTTTCTGCACCCGCTGGTAATCTTTATGCCAGTATCAAAATTCAAACGATAACTGCAACTCCATCTGCTGGTCAAATAGTGGTAGACTATACTTCTTTAAATGGTATCCCAGGTCAAACCACTTACACAACCACATTAAATAATTATCCAGGTGGTTGCACAGGTATTTACACACTCCGATGTATAATTAGTAATCTACCAGCACAATTTTCTACAACTGTAACTGTAGTTGCTACTAACGATGGTGATTCAAATAGCGATGTAAGAAGTATTGACTTTTTGGCACCAGCCATGAATCCAATTGTAATGTCCTCAGTCAAAACAAAATCTATTACTTTCACATACTCAGCATCGAGAACACCTACTTCTTATACTGTTTTGGTTAATAATATTGCACACCCAGAATGCTCGGCAACCACTACTTGTATAGTCAGTGGCTTAACATCTGGTTCCCTCTTTTCAATTTCCATAACTGCTACCAATGTAGCCGGTACCTCTCCTGCCACACAAACTAGTGGAACTTTATATCCAGATGTTGTTGCTCCAACTGTAACATTAACTCCATCAACTAGTACCATAGTTGTTGACTATGAGTCTTTGGGTGGTATAACTGGTCAAACTCTATACACTACAAAACTTGATAATACACCAGTATCTACTTGTACCAATATTGCTGCTTTAAGATGTACTATTACCGGACTTCCAGGTCAATTTGCAAATGACGTGACTGTTGTAGCAATTAATGATGGTCTTTCACA
ACAAACCACTCAAAGAGTTGAGTTCTTAGCACCTGTTGTTAATCCAATTACAATAGTTGAAAAGAAAACCAAGTCTATTACCTTCTCCTATTCTGCTTCTCGTTCACCAACTTCATATGATGTCAGTGTAAATGGACTTTCCAATCCACAATGCTCTTCGAAAACCACCTGCACATTTACTGGTTTAACAGCAGGTTCATCATATACTATTCAAGTAACTGCTACTAATGGTGCTGGTATTTCTCTACCAATTACATCAACAGGAATTCTTTATCCATCAGTTGATAATTTATTCTTGATGTCTACACCAACTTGGAATAGAATGTTAGTGGAATACAATTCAACAGGTGGTTTCCCAAATAACACTGTTTATACTACACAAATCGATGGAGTCAATGTACCTGGTTGTATTCAAATTGCTTCATTGGAATGCCAAATCAATGGTTTAAAGGCACAATATTCACATAATATTACCGTTTTGGCTTTCAATGATGGTGATACCATTCAATCATCTTTAAATGTTACTTTTAATGATATGGTTCCTATTACATCATCTCAATTTATTCATGTTGAATCAACTCAAAATACAATCAATGTCAAATGGAGTGCTTCAACTGGAGGTGTACCTGGTTTAACTGTCTATGATTTGTCTTTATCAATTGATAATTCATCATGGATAGTAGAGTTTAAAAATATTACCATCACTGAAGCTACCATTTCAGACTTAATTCCATCGGTCAACTATTACTTAAGAGTATCAGTGAAGAATTCAGATAATCCACCAATTCATACCTATACTAATACTCAAACCTTGGGACTTGGAGCAGAGGATTGTAAATGTACCAATGGTATCTGTGATGCCAGTTTTAAATTCTGTTTATGCAATGCTGGCTGGACAGGTTCACGATGCGAATTTAAGCACGATGTCGTTGAAGGTGAGATGAAACCACCAACTATAACACCAAACCCCACTAGACCTGAGGTAATTATCGACAATGGTGATTCCCAATACACTTTCAAAATAAGTACAATCATTGAAAGAAGTGAACTATTAGAAGAGATCTCTAGAATGGACCTTTCAAGCTTGAACTGGGATCTCCAATCAAATCTTAGTACTATTATTAAACATCCCAATAGTTTAATGAATGTTTCAATGAACCAATGGATTTACTCGGCTAAAATCCAGAAAGCCGAAGATTTAATTATCAAGTTCACTCAAATCAACCCGATATCCAATGAATCAACTCCTACCTTCCCAATGGAATTTGCTGGTGAATCGTTCAATTTGACAATTGGTTCACTTAAATATCAAATTGAAGTTAAGAAATGGGATTTTACAACCAAACTTAACCACTTGGAAATTCAATCGACTGTTGAATCTAAACTTGATGACTGTGTTAACCCAGAATCTCAATTTTCAGATGGTACCGGAATTTCAGATATTGCAATTCGTCAACCTTCTGGTTATTTCTTATTTGGCAGAGTCTCCAAGAGAATTCTTCTTGATAAAATCCCTAGAATGTCTACCATTAAATATAATCAAGTAAATGTTTCAACTGCCACTATTTCAACATTGGTTAGCCATTTCCAAGATAGTTTGGTTGTAGATCCAGATTTCTCTGTACTTTTAGATCTAGATAGAAAATCAGATGTTAAGTGTGGTGGAGAAAAGAAAACCAATGCTGCTGTTATTGCAGGATCCGTCGTTGGTGCAGTTGTTGGAGTAAGTTTAATCACAGCCAGTGTAATCTTAATCAAGAAAAAGAAGATTGCACAGAGATACAATAATTATTTGACTCAAAAGTTGAAACCAAAGATGATGGCAGACAAAAACAACAATTTGATGTACCTCTTAACCGATCTAGGTGTCTCTAATTCACTATAG\n>XM_030616062.1 PREDICTED: Syzygium oleosum uncharacterized protein At1g24485-like (LOC115689878), mRNA 
\nATGGCAGTCCAGATGTTCTTGTTGATGCTTCTCTTCATTGAAGTATCTCTTTCTCAAGCATCACTGTTGAGAATTGATTGTGGGTCTCAAACTGGGTATGAGGCCAAAGATGGCAGCTACTGGAGCACCGACGATGAATTTGTCAAGGTCGGCAACGACATGCCGATCTCAGCCGGTAGTTTCTCCAAGTGGACCCAACTCAACACTCTTCGAGTCTTCACAAAAGAGAAAAAAGTTTGCTACAAATTGCCTGCGCAACCGTCGGTCCGATACATGAGCAGAGCGACATTTTATTACGGCAACTACGACGGCCTTTCGAAACCACCAACTTTTGACTTGGAGTTTGACGAGAATAATAGGAAAACTGTTGTCACCTCAAATACAGATCCGCAAATTTATGAATTGATTTACACATCGGGTGCGGACGACATTAAGGTGTGCTTGATTCGAACATCGGATGCTCAGTTCCCATTCATCAATGCGCTGGAATTGTGGCCATTAGATGATAATATGTACGATGGTATGACCCGAGACATGGCTTGGCTCAGCAATTACCGCTACGACTATGGTGCAGTGGCGGACACTGTCGATGATTGGATTTTAGGGTACCCTACTGATTCGGCCAACAGAATATGGGTGCCAACAACTCCATCCGACCTGAATCAGACGAAAGCCTCCGCAACTTACTTCTACGACAACGGCGATAACAACGTGCCCAACGTTGTCATGTCCCAAATGGTCGAGGCGCCAAATTTAACGTACCCAATCAGCTTAAGCTTCAGCATCAACGACGGGATCAATCTAGTTCACTACGTGACCGCGTATTTCACCGAGACCCATTCACTAAACGAGAACGAAAGCAGGTCGTTCGAATTCAACGCGAACAACAAGTTCGTCTCGACCATGAACCCGAGGTACGAGTACTGCACGTCGGTGTGGGCATTCGTGCAGTCGAACGGTACTCTAAATGTTCAGCTGCGCGCAAGCGGGAATTCGACGCTGCCTCCTTTGATCAGCGCCATTGAAGTGTACACGGGCCAAGCCGTACATTATCCTAAGACAAGTAAGTGGAAGGAAGTCGGCGGCGGCGGCGGCGGCGTGCTCTTTCTCATTTTGATTGGCTGTGGGTACTATTTGTGCTCTAAATCGAGGAACGACGGTAGACCAAACGGCGGTGGACCAAACAACGGTGTTATAGAAGAAGCCCCACCTCGGCGCCGTTTTTGGTGGAGAAGAACTCGCTACGTTGAGGAGGAGGTTGTTGAAGCTCACGCGTAG\n>XM_031145784.1 Lachnellula hyalina Eukaryotic translation initiation factor (SPBC4B4.04), partial mRNA 
\nATGGCAGAGCCTACGCAGTTTGCATACAGGACACAGAAGACGGTGGGCATCGTGGATGCAGCGCCCGTCTATGAGCCCTTGAGCGGGTTCCAGAGACCGGATGTTGCCTCTCGCTGCTGCACGTACTCGCCGTGCGGGCGGTACTTTGCCTGGGTCAGTAACGAGGCAGTCACTGTAGTCGATGCCTCCGTCGGACACGTCATCACCACTCTCTCCATACCCAACGTGTACGAATTGGGTTTCTCGCCGCGGGGCTCATATCTCATCACATGGGAGCGGCCGTCCAAGGATGAGAATGGGGATGCCGTGAAGAATCTAAAGGTCTGGCGCACGGTGGAGGACATTGCAGAGGGCGCGGAGAAGCAGGTTGTAGGGCGGTTCGTGCAGAAGTCGCAAACGGGGTGGAACTTGCAGTACACTTTCGATGAGAAGTACTGCGCCCGCGCTGTCACCAATGAGGTGCAGTTCTACGAGAGTGACAACTTGGGGTCGGTCTGGAACAAGCTGCGCGCCGAGGGCGTTACAGATTTTGCTATTTCACCTGGCAACAACCAAGCTGTTGCCGTCTTCATCCCAGAGCGCAAAGGTCAACCTGCTACCGTCAAGGTTTTCAACGTCCCTCAATTCGCCAGCCCGGTTTCACAAAAGAATTTCTTTAAGGGCGACAAGGTCACGTTGAAGTGGAACCAGCTGGGTACAACCCTTATTGTTCTTGCACAAACCGAAGTCGACAAGACGGGCAAGAGTTATTACGGAGAAACTACACTATATGTGCTGAGTGCAAATGGTGGATTTGATTCGAGAATTACTCTGGACAAGGAAGGCCCAATTCATGATGTATCGTGGTCCCCTAATTCGAAAGAGTTTGGAGTGGTCTACGGATACATGCCAGCCAAGACAACCATCTTCAACCAAAGAGCTGTTGCAACGCATACGTTCGATCTCAGGCCCAGAAACACAATCTTGTTTTCCCCCACCGGTCGATTTGTTTTGGTTGCTGGTTTTGGTAACCTTGCAGGGCAGATGGATATCTATGATCTCGAAAAGGATTACAAGAAGATCTGCACTATCGAGGGTGGCAATCCAAGTGTCTGCGAGTGGAGTCCAGACAGCAAATTCATCCTGACTGCCACTACTAGTCCCCGTCTTCGTGTTGAAAATGGAGTTCGGTTGTGGCATGTTGGAGGAGGTATTATGTACAATGAAGATATGGTGGAGTTGTATCACGTTACCTGGAGACCTCAATCACTGGACAAGCTTACGGCTGGGGATCCTTTGCATCCAGTCCCGACTCCTCATGCATCGGCTCTAGCGTATCTAGGTACTGTCAAGACGCCTTCCAAGCCTGCGGGCGCTTACCGGCCACCTGGAGCTCGCGGAACCTTAACACCATCGCATTACAAGCGTGAAGACGAAGGAGGGGCCGCACATGTTGTTAGTAACGGCACTCAGCTGGTAGGATCCAACGGATTTGGCAGAGGTAAACGACAAATCCCGGGAGCGGAAGCAGTGGAAAATCTGCCACCTGGAGCGGATCCTAGCAAACCAGTCCCAGGAGGTGCCGAGGGAGATGAGAATCTCTCCAAAGCAGCTTTAAAGAATAAGAAGAAGCGAGAAGCAAAGAAAGCCAAGGAGGCAGAAGCCAAGGCCCAGGGCCTAGTCCCTTCGCCCGATGGAGGAAATGCCGCTCCCCCCGATGTCCGCAGCCCTGAACGCAGAGATAGGCGCGACCATCAACGTAGCCGATCCAAGGGAAACCAAGACATACGCACCCCATCTCAGCAACGATTCCGCAGCAATACCCAGCAAGGCAAACAGCCACAGTATCGTCAGCAGAACGGCGGAGCTCCCACGGGAAATATGAACAACCTCTCTATCAATTCCACCCCACAGCCGCCAAAGCCGGTGCCTGCGCCTGAGCTCTCTGTCACATCACCTAATGGTGGCAGCCCAGATGCGAAGAAATTACGAGGACTGCAGAAGAAGATCCGCGCGATT
GAGGATTTGGAAATGAGGCTCGCAGGAGGTGAGAAGTTGGAAGATACTCAGCTTAAAAAGATTGGCACGAAGTCTCAGGTGCAGGGAGAGCTTTTTGCTTTGGACCGTGAAAGTTAG\n>XR_007275131.1 PREDICTED: Beta vulgaris subsp. vulgaris uncharacterized LOC125498264 (LOC125498264), ncRNA \nAAGATGATCTCGGGGGTCGTCCTGGGAGCATTGTGCAGAATTATGCAACAAAGGGTGGTTCCGAATTTTTTTTCATAGTGAACATACAGGTCCCTGGATAAAAAACGTACAATTTAGCACTGTACTATATGACGAGTAATCTGGAAGATGCACCTCTGCTGCAGAATTTCGTTGACAGAGACGATGCTTACAGAAATTCAAGGTTCAAACTTATTCTATACATATCTAAGGTCGGTAACATTCTGGTCTGAGGCTTGGGAATTATGCTATCTTGTCCCTCTTATGAAATCGATAGCTCGTATTGAGCATGCATTGGAATGCTTTAAAGGATTATTTCCTGGACATACAATATGTTTTCCAACTGCCTTCTCATATTTGAAGTTGCAATCACACAAATTTATTGGCCAACATTAAA\n>XM_022542561.1 Aspergillus glaucus CBS 516.65 hypothetical protein (ASPGLDRAFT_163897), mRNA \nCCGAGCTACATGCTGGGAAGTTTGGAGCAACTCCCTCTGGAACTCATTAACATGGTGCTTATACAGCTCGAAATACAGTCACTGACAGACTTCCAACGCGTCAATAAACGAGCTATGCAAGTAGTAGACTCGATTCCACAATACAAAAAGATCATCCTCCATGCCCCTGCCTCAATCCGGGGGAGCCTCAGCATCAGCACTGGCAGTTTGTTTTCTTGTCAGGAACTGTACGAGAAGCTCTGTACGGCGGAGTGCGACAGCTGCGGTGACTTGGGTGGATACCTGTACTTGGTTACATGCCGCCGCATTTGTTTTCTCTGCTTCACCAAGAAGACCGAGTACCTCCCACTACTACAGGCGGACACGATACGGAAGTTTAGACTTCGCCGTGAGGATATAGCAACTTTACCTTCTATGAATAGTGTCCCCGGCCGCTATTCACCACGAGAGATCAAATGCCGTACTCAGCTTACCTTAATCGATCATGACGCTGCGCGACAAGCTGGAATTACTGTGCACGGGAACATCAATGCAATGGAGCAATATGCCTTGGAAATGACATCTAAAAAACTGGAGCAATACCAGTCTCGAAAATCAATACACATAGCAGATTGCCCGAATCTGCGTCGACCCAGATCTGAAGACATTTTTGATGGGCATTCACCTAATCTCAAACGCTTCTTGGGAATTATCCGTGCGCCATTTCTTAATGCTCGTACAGGGTCTCTGGAATGGGTCTTCCATTGTGCCGCATGCAAACCCCATCATTATAACAGACCGCTCCATTGGCGCCGAAGGTATACAAGGAAGAGTTTCGAAGATCATATTAGGGAGTGTGGAGAGATTATACATGGGAAGCACAACCAACGCGTGAGATGAAAAGAATAAGCAATGAGGATACGAAATATAATGGAAGGCAATTGCCCTGTGTCAGGTGATAGAAGATAACCGTCGGTAGAAATAAAAGAAACCAAC\n>XM_031654791.1 PREDICTED: Papio anubis FA complementation group C (FANCC), transcript variant X2, mRNA 
\nGCACCGCTCACACGTGTGCGCGCGCAGCCCCGCCGCCGAGCCACCGCGGGAAAATTCCAAAACCCTCAAAACAAAAAGCCAATCCGAGGCAAAGCCAAATTTTCAAGCCACAGGTCCCGGGCGGTGGCTTCCTTTCCGCCGCTGCCCAAACTGCTGAAGCAGCTCCCGCGAGGACCACCCGATTTAATGTGTGCCCAGCATTTCCTTCAGTGCTGGACAGGCTGCTGTGAAGGGACATCACCTTTTCCCTTTTTCCAAGATGGCTCAAGAGTCAGTAGATCTTTCTTGTGATTATCAGTTTTGGATGCAGAAGCTTTCTGTGTGGGATCAGGCTTCCACTTTGGGAACCCAGCAAGACACCTGTGTTCACCTGGCTCGGTTCCAGGAGTTCCTGAGGAAGATGTATGAAGCCTTGAAAGAGATGGATTCTAATACAATTTTTGAAAGATTCCCCACAATTGATCAACTGTTGGCAAAAGCTTGTTGGAATCCTTTTATTTTAGCATACGATGAAAGCCAAAAAATTCTAATATGGTGCTTATGTTGTCTAATTAACAAAGAACCACAGAATTCTAGACAATCAAAACTTAACTCCTGGGTACAGGGTGTATTATCTCATATACTTTCAGCACTCAGATTTGATAAAGAAGTTGCTCTTTTCACTCAGGGTCTTGGATATGCCCCTATAGATTACTATCCCGGTCTGCTTAAAAATATGGTTTTATCATTAGCGTCTGAACTCAGAGAGAATCATCTTAATGGATTTAACACTCAAAGGCGTGCTTTATCATCATTCTCTTACCACCAAGATGGTTTTAGATCTAAAATTCATGTGTTTTTGAGTCCATCATCTAAGTTGTTAACAAAAAGACACATTTACCGTGAGTTAATGACTCCCGAGCGATTGGCGTCCCTGTCACGAGTCTGTGTCCCACTTATTACCCTGCCAGATGTTGACCCCCTGGTGGAGGCTTTGCTCGTCTGTCACGGACATGAACCTCAGGAAATCCTCCAGCCAGAGTTCTTTGAGGCTGTAAACGAGGCCATTTTGCTGAAGAAGATTTCTCTCCCCATGTCGGCTGTAGTCTGCCTCTGGCTTCGGCACCTTCCCAGCCTTGAAAAAGCAATGCTGCATCTTTTTGAAAAGCTAATCTCCAGTGAGAGAAATTGTCTGCGAAGGATCGAATGCTTTATAAAAGATTCATCGCTGCCTCAAGCAGCCTGCCACCCTGCCATATTCCGGGTTGTTGATGAGATGTTCAGGTGTGCACTCCTGGAAACCGATGGGGCCCCGGAAATCATAGCCACTATTCAAGTGTTTATGCAGTGCTTCCTAGAAGCTCTGGAGAAAGAAAACAAGCAGCTGCGGTTTGCACTCAAGACCTACTTTCCTTATACTTCTCCATCTCTTGCCATGGTGCTGCTGCAAGACCCTCAAGATGTCCCTCGGGGATGCTGGCTGCAGACACTGAAGCACATTTCCGAACTGCTCAGAGAAGCGGTTGAAGACCAGACTCATGGGTCCCGCGGAGGTCCCTTGGAGAGCTGGTTCCTGTTCATTCACTTCGGAGGATGGGCTGAGATGGTGGCTGAGCAGCTCCTGAGGTCCGCAGCCGAACCCCCCGCAGCCCTGCTGTGGCTCTTGGCCTTTTACTACAGCCCCCATGATGGGAGGCAGCAGAGAGCACAGACCATGGTCCAGGTGAAGGCTGTGCTGGGCCACCTCCTGGCGATGTCCAGAAGCAGCAGCCTCTCAGCCCGGGACCTGCAGACAGCAGCAGGACAGGACACAGAAACAGACCCCAGAGCTCCTGCACAACAGCTCATCAGGCACCTTCTCCTCAACTTCGTGCTCTGGGCTCCTGGAGGCCACACGATCGCCCGGGATGTCATCACCCTGATGGCTCACACTGCCGAGATAACTCACGAGATCATTGGCTTTCTTGACCAGACCTTGTACAGATGGGATCGTCTCGGCATTGAAAGCCCTAGATCAGG
AAAACTGGCCCGAGAGCTCCTTAAAGAGCTGCGAACTCAAGTCTAGAAGGCACGCAGGCCGTGTGGGTGCCCAGCATGAGGGATCAGGCTCGCCAGGGTCACAGGACAGATGATGACCTATGGCCACGCATTTGTGGAGTAAGTAAGTGCCCTCTTTGGGCTGTGAGAATGAGCCATACACGTCTTGGGAAGATCTGCTAGTATCTATTTTAAAAAATGCAGAGCCAGGTCCCTCAGCCCAGACTCAGTTGGACATGTTCACCAATGACTTGAGTGAGCCTTCAGCGCTCCTGGTGCCCGCCCGGCCAGACTGTCAGCTAGAGAATTACTAAAGCAAAGGCTTGGGTGGGAGAACAGGTTTCTAGTTTTTACCCAAGTCTAGATGCACATCTATTATTTAAAGATTCAAAGCCTTAGAACCAAGAATTTGGTGATGAACCATTGAAGAATTTAGAGAGAACTCAGCTCTTTTTAGACTCTCTTCAGGAGTCAGGGATCTGGGATACAGCCACGCTGTCGTGCTGTACGGAGAAATCTCCACGGGGAGTCAGCGTCCCTCAGGCTTCCCTTGCGTCTCCCTGGACCTGCCCGATAGACCACAGGAGCAGACAGAGCACACCCAAGCCTGCGTCTCCTGCACACGCTTTCCACTCTATTTGCTAAACGCTGACTGCCACCAAAGAGCTCCTGGGACATGAGAGGGGCCGGCAGGTGAAGGTGGAGGACGTGTTGCAGAAACATTCAAAGGCAGGATTCGTATCAGTTAGTTCTCTTGTTAAACGGAGATGGGAATTGGAAATTCCTGATAAAGAACTGACGTGGCTGGGCGCGGTGGCTCACACCTGTGATCCCAGCACTTTGGGAGGCCGAGGCAGGGGGATCCCTCCAGCCCAGGAGCTCCAGACTGGCCTGGACAACATGGCGAAACTCCATCTCTACTAAAAATACAAAAATTATTGGGGTGCCGTGGTGGGCACCTATAATCCCAGCTATTGGGGAGGCTGAGGCATGAGGATCCCTTGAACCCGGGAGGCAGGAGTTGTAGTGAGCCGAGATCATGCCATTGCACTCCAGCCTGGGCAACAGAGTGAGACCTGTCTTTAAAAAAAAAAAAGGCATTGTTGGTGTAATCTCAAAGTTAACGTTTATTTCACGTCAGCAGAGGATGCTTTTTCCTGTCAGAGACATTCTGGAATTGTACCGATTGTACATTCTTTTGTGCCTATTCTGTTTGTCAAGTGAGTCAAGACTTGCTTTTGTCCATTTTGATGTACGTGTGTTAGTCGGAGTCTTGGCTCCGTTTTGAGGCATGAGCAAAGTTTCACTGGATTAGAGGTTAACCTTTAGGGAAATTCCTTTTCTTGGTATGTGGCAATGCTAATAAAGCCACCTGAAGATCTGGAAAATTCCAGGAACTTTTCACCTGAGCTTTTCTTCTGAGAAATGCTGCAGTCAGAAGGGTGTGCTGGTAAAATATTTTGGTGGCAGCTGCCATCGTGATCATTGCTTTCATATAAGACGCTCTGTGCCATCATGATCCTTACCCTCATAAAACAAACACACTTCGTCAGAGGCGTCGGGGTTGAAAAAGGAGCTGCTTCACTGGAGTTGAGGGCCTCTCTCCTGTTCTGACTTTGAGCCAGAACTTGTGGCTGGCCCTGGAAGCTGACTCCACTGTGGACACGGTGGCAGCAGGGAGCCCCTAGAGGGAGGGTCACTGGGACCAGGCCTTCTGTCATCAAGGGGATTCTGGGACAGTCCCTCACCCTGTCCTGTGGTCCTGTTCACGGGGCTGGCCTTTCCCTCCTCCCCGGCCAGGCCTCTGACCATGCCCCTTCCGTCTTCTCCACTGGGGACTGGTGAAGCTGGGCGTCTGGAAGACTTCCTGGCCTGGAAGCCCTGAGCTCGGCCTGTCTGTAGAATCTCCCAGTTCCTTCACAGCTGCCGAGTCCTCTTGTGGGCGCGGTGGAAGCGGCTTTCCGGGCAGCCAGGGGTTCCCG
GATAGGACTGTCCCTCTGGGGATGTGGCACCGAAGTGCCTGCTGGCTTCATGTGGCCCTTTGCCCTTTCCCGGCCTGAGAGACGCTCAAAGGTGGAGAGCCAGGGGAGCCACCCCTCGGCTGGTCCCTCCACCTCTGGGACAGGTGGCAGCCGGGCAGGTGAGGGCATGTGAGGGCCGCGGCTTCGCTCCTAAGCCCACGTCCTCCTCCTGTTGCCATCGATTTTTGGCAAAGTCTGGGCAGGTGCCACCGGGAAGGAATGGCGTCCGAGATGCTGGGCACGGCATGGTGCGGCCGAGGGGGCCTTGACATCGCTGGCGGGGCCTGGGCACAGGGGCAGCCACAGGGAGGCAGGGATGCCAAGGCCTGGAGCCACCGTGGAAGGAACTGCTCGAGGTCTGCAGAGGTGCCACAGGGCCCAGAATCTGACCTTACCTGACCTCTTCTAGACTCTCCCTGATAGTTTTTGATGAAGCATGTTGGTAAAACCACTACCCTCAGAGAAAGCCAAAAATACAGATGAGGCGGAGCTCGCCCCTCCAACCTGGCTGTTACTCACCTGGACTCCACGACATCTGTGGAATTCGTAAGCTCTTTAAAATCTGTAACTTGTTGTCTATTTTTTCATTCTAAATAAAACTTCAATTTGCACCTAA\n>XM_047252959.1 PREDICTED: Schistocerca piceifrons cuticle protein 79-like (LOC124777512), mRNA \nCGTTTCGCTTGGTGAGAATCTGGATGGTATATAAGGAAACGGCTGCGCTAAGAACTCTGTCAGTCATTCGTTGCCCATCTACCACCATCGCAAGAGCAACAATGAGGATCACGGTGTGCGCAGTTTTGCTGGCGGTGTGCTGCCTTTCTGCCGCGGAAGAGAAAGCGCGTGCCAAGACGGAGAAGCGAGGCCTGCTGGGGCTCGGCTATGGTGGCTTCGGCGGCGGCTACGGGGGCGGGTACGGCTACGGAGGCGGCTACGGGGGCGGGTACGGCTACGGTGGCGGGTACGGCTTTGGGGGCGGCTATGGGGAGGTCAAGGCCGTCACCATCACCAAGGAGGTGCCGGTGCCGGTACCGCAGCCGTACCCGGTGCCGGTGGAGAGGAGCGTGCCGTACCCGGTCAGCGTGCCCGTGAAGGTGCCCGTGGACAGGCCGTACCCCGTGCACGTGCCGCAGCCGTACCCCGTGCCCGTGGAGAAGCCGGTGCCGTTCCCCGTGAGCGTGCCCGAGGCCGTGCCCGTGGCCGTACCTCACCCCGTGCTCGTCAAGCAGCCCGTGCCCGTCGTCGTCAAGGACGTCGGCTTCGGCGGAGGCTACGGGGGATTCGGAGGCGGGTACTCCAGCTTCGGTGGCTTCGGGGGTTACCACCACTAAACGTCATCCGTGCCGTCGCAGCCACTCATCTGACAGCCATCTTCACAGCAGGACTGCCCAACCACCTATTTCCATTCGTATGTTTCCATTTTGTTAGATCGAGATCTCTATGTACCAAAAATTTGCAGATTACTGTTGATTTCAATAAAATATTGCAATAAAATT\n>XM_046236555.1 Lentinula edodes uncharacterized protein (C8R40DRAFT_884233), mRNA 
\nGGAACTTTCAAGTTATCAGACCTTCGATCTCGGTCCGTGATTACAGACAGATACATTCCAACCCCAATTTTCACTGCTTTTGTCTTATCACAACATTCATGAGTGGTGTTCAAAAGACTGCCATCGTCACTGGTGCCTCTTCAGGCATTGGACGATACACTGCTATTGCCCTCCTGAATGAGGGATGGAACGTTGTTGTCACTGCTCGGAGATTAGAGGCCCTTCAAGAAACACAGGAAATGTCTTCAAATGCTGAAAGCTGTCTTTGCGTGGCTGGTGATATTACCGATGAAACCTTTGCGATAAATCTCTTCGAGCAGGCAATTGCTAAATTTGGGCGACTGGATCTTTTGTTCAATAATGCTGGAATATCGTCCGCCCAGGTTCCAATTGAAGATGTCTCCTTCGACACGTTCCAAAATGTTCTGAACATCAACTTGGTAGCGCCTTTTATCTGCACTCGGGAAGCAGTCAAAAAATTTAAAGCTCAAACTCCCCCTGGAGGTCGCATCATCAATAATGGTTCCTTGTCAGCCCATGTACCGCGTCCGCACTCTTATGCATATACGATGTCAAAGCATGCGATGAACGGTCTCACCAAGTGTACTTCTCTCGACGGACGCGCATTTAACATTGCCTGTACCCAAATCGATATAGGAAATGCGGCTACAGATATGGGAGGACGGCATGGATTAGGTGCATTACAGCCAGACGGACGCATAATTCAAGAAGGCGTGCTTAATGTCCAACATGTCGCCAGCACGATCGTGCATATAGCCAGTCTTCCGCCTGATGTTACTGTTCTCCACGTCAACATCATGCCCACCAACGTCCCATATGTTGGACGAGGTTAATAGAGTCGAAGCGTAGGATTCAATATCATTCCGACTTATACAGAGTTTTCCTTCTATTTCCCCTTACAAGGTTCATATAAGTACATAGGCCTCGTGAAATAATTTGTCCGTATCCGACAAGCCTCTGATTA\n>XM_053458426.1 PREDICTED: Spea bombifrons corin, serine peptidase (LOC128482252), mRNA 
\nTGTTCATCTTCAGCACGTGGAAGCTGAGTGGAGCCGCGATCCCTGCGAGGGGAGAATGTGAGCGAGGAATCGCGCAGGGAAAGTGTTTGGGAGAGAGCCGGGCATGTCAGCCCACTGAGCATGCTATCAATGCAACAGTTTGCTTCCCTGCCTCCGGAAGACAGCTACCGGCCGGTCATCTGCGCTGACAGGGTCTTTGGAGCAGATGAAGATAATATGGGGGATGGCTGTTCTCAGAAGCCGGCATCTGCCAAGTACCTCCGTCTCTTGCTGCTAATACTCATCCCATGCATCTGCGCTTTCATTCTTTTGCTGGTTGTTCTGCTCACATTTGTTGGTGTGATAGACAGACACTGTTTTGACTTTAATAGGAGTGATCCGCTAACCAGCAGTATTGGAATCGGATCTCCTGACATTCCATTCATAAAGATGGATGACAATGCATCAGAAGGGACATTAATGAAAGGCTGGGAACCCCATCCCGCACTCTGGAATACTTCTGCTGTTGTAGCTGACCAAAGCTCTACCAACTTTAGTGAAATAAAAGACACTCCCCAGCAGGATCCCTTATACCCCTTTCCTTATACCACAGTAGATTATAAACGCTCAAGAAATAACGTGACACTGACCAAAGAGCATGACGCCAACCTATTGGAAAGCACGGGCGTTTGGACCACGCCATTGCTGAGTGACGCCACCATGTCTCCGACTGTGGAACCAATTGGGCCTCAATTTGTAGTCAGGGAAGATGCCTGTGTGAACATCTCATACAGCCAATGCCAAATGCTGCCATACAATAACACCGTCTCAAAATCAGTGTATTCGTTCGTCAAGAGCATTGAAATGGAAATGTTTCTCAAGTTCTTCAGCTATCTCAACCGCCTCAGCTGCTATCAGCACATCATGCTTTTTGGCTGCAGCCTGGCTCTCCCGGAATGCATCAGTCATGGCGATGACAGTTATACTCTCCTGCCGTGCAGATCATTCTGTGAGGCTGCGCAAGAAGGTTGTGAACCAGTGCTTGAGATGGTGAATTCTTCCTGGCCAGAGTTCCTGAGATGCTCCCAGTTTCGGAACAAAACAGACAATAACAACACAAGCCGAGTGTGTTATTCTCCGCAGCAAGAGAAAGGAAAGCAATCGCTTTGTGGAGAACATGACAGCTTTCTGTGTAACAATGGAATCTGCATACCTAGACAGTTGATGTGCAATGGATACAATGACTGTGATGACTGGAGCGACGAGGTACATTGCAACTGCAGTGATCATCAGTTCCGGTGCAATACAGGGAAATGCCTTAACCACAGCCTTGTATGTGATGGGTACGATGACTGTGGAGATCTAAGTGACGAGCAGAGTTGTGATTGTAATCCATTACATAGCTACCAGTGTGGAGATGGACGATGCATAACTTTAAGATGGGTCTGTGATGGTGACCATGACTGTGTAGACAAGTCTGATGAAGTCAACTGCTCATGTCATAGTCAGGGTCTCACCGAGTGCAGGAATGGGCAGTGCATTCCTAGTGCCTTCCGCTGTGATGGAGACAGTGATTGTAAAGATGGCAGCGATGAGGAGAACTGCACTGTAAGTAAGGGACAGGTATGCCAAGAAGGAGATCCAAAGTGTATTTCTCAAGCCTGTTCAGGAGCATGTGCCAATGATCCCAACTGTGGAACGCCTCACAACAAGACAAACTGCAGTCAGTGTGAACCAATAACCTTAGAGCTGTGTATGAACCTACCCTACAACTATACCCATTTCCCAAACTATCTTGGTCACAGAACTCAGAAAGAGGCTTCCATAAGCTGGGAATCATCTCTGTTCCCAGCCCTTGTTCAAACAAATTGTTACAAATATCTCATGTATTTTGCATGTACCATTCTAGTACCAAAGTGCGAACCGGAGACCAGTCAGCGGATACCACCATGCAGGTCACTTTGTAAACATGCCAAAGAGCGATGTGAATCTGTGCTTGGTATTGTGGGATTACAGTGG
CCAGAGGATACAGACTGTACCCAGTTCCCAGATGAAAAATTAGACAACCAAACATGCCTTATGCCTGATGAGGATGTAGAAGAATGCTCCCCTAGCCATTTCAAGTGCCGTTCTGGACGCTGCATCTTGGCTTCCAGAAGATGTGATGGAGAAGCAGATTGTGAAGATGATAGTGATGAGGAAAATTGTGGATGTACTGAGAGAGGTCTTTGGGAATGCCCAGTGAACAAGATGTGCATCAAACATTCAATGATATGTGATGGATTCCCAGATTGTCCTGATGAACTGGAAGAGAAGAATTGCTCATCCTGCACAAACGATGAGTTAGAATGTGCCAACCATGAGTGTGTATCTCGTGATCGCTGGTGTGATGGCGTGGTGGATTGCAAAGACAGCTCAGATGAATGGAACTGCGTTACTCTGTCTAAAGGTGTGAGGTCCCTCCTAACCATTCACAGGTCTGCATCTGACCATCACGTATGTGCCGATGCTTGGGATGATGAGCTTACTCACTGGGTCTGCAAGCAGATGGGTTTAGGCGGCCCATCAGTGGCAGAATTTGCCCAAGAAGCTGATCATTTGGAACATAATAAAATGCTGCATCTAATTAAAGACTGGAAAAAGAAAAATGGATCTACATTTCACGAGCTGCTCATGAAAGGGCAGACTTGTGAAAGCAGAGCTAAAGTATCTCTGACATGTACCAGAGAAGATTGTGGACATCGTCCAGCCGCCCGAATGAGCAAGAGAATTCTTGGTGGCAGGACGAGCCGACCAGGACGTTGGCCTTGGCAGTGTTCTCTCCAGAGTGATCCCAGTGGACACATCTGCGGCTGTGTTCTCATTGGGAAAAAATGGGTGTTAACGGTAGCTCACTGCTTCGAAGGAAGAGAAAATGCTGCCGTATGGAAGGTTGTATTTGGTATAAACAACTTGGATCACCCATCTGATTTCATGCAGACTCGCCTTGTGAAGACTATTATTCTCCATCCACGGTATAACAGAGCAGTGGTGGACTACGACATTAGTATTGTGGAACTGGATGAGGACATTGTGGAGACTAGCTATGTGAGGCCAGTTTGCCTCCCAACTAAGGGCCAGTTGGTCGAACCAGATACGTATTGTTACATCACTGGATGGGGACATATGGGCAACAAAATGCCATTTAAGTTGCAAGAGGGAGAAGTTCGGATTATTTCCTTGGAACGCTGTCAGTCTTATTTTGACTTGAAAACCATAACATCCAGGATGCTGTGTGCTGGGTATGAGTCCGGGACAATAGATTCCTGCATGGGAGATAGTGGCGGTCCCCTTGTCTGTGAACAAGAAGGAGGACAGTGGACGTTATATGGACTGACTTCTTGGGGATCTGTATGTTTTTCCAAAGTTATGGGACCTGGAGTTTATAGCAATGTTTCCCACTTTATTGACTGGATTGAAAGACAGATATACATTCACAGCTTCTTAATCAACTAAAGACGTATATATATATGAATAAAATACACATATTTAAAGGCAAACAGCAAAAATTGCCTTAACCACCAAGGAGGTTTTAATGAGTGGAAATCCTTGCCCTGGGTATTAATGAAAATGATATCTATATATTTTTGTTCTAAACGTTAGGTGTTTTAGTCTAAAGCTTTTTGACTTTTTGTACATATCTGTTCACGGTTATGTTTTGCTGTGTAATCATTTCTTAATGAACACAGACTTTCAAAAAAATGTAACATTTGTTGTTTGTTTTATATGCGGGCATTGAGTGGGTGATACCGGGCTTGGGTTTGCCAGGAGTCATTTACAGGGACTGACAATTGTAAATTACCACACATGGGACAGGTTACATTTGTAGCATAATACACTAAATTCTGATTTCAGCTACCGAGACAGGTAGGTAAAGCTCACGTTAGCTTTGAGATGTCTTAAATACCAATAGAGATGCCAGTTCATTAACTTTACTGGATATTAAGCTTACGGACTACAATGGTCCCTGTAATGTTTCC
ATAGACTTCAAAACATCACAGTCTGACCGCCTAGTTTATTCACCCATGTTTGATTGCTCAGGTTTAGAGGGGTTACACATGCATTTACTATAATGAACATGTAATTTGGTAACAACAGACCCCACAATGCAGTCTACAGATCAACTGTTACTACTACATGATGATTGTTTCTTTAATAAAA\n>XM_051514774.1 Durotheca rogersii uncharacterized protein (GGS23DRAFT_536457), mRNA \nCAGCTAGGCACGTGAAGTCTGCCTCTCTTTTAAACCCACGACGAAACGCCAATTCTCCCTTCGCACCCGCCGTCTTGGCTCCTCGGGCCCCGCAGTGCAGCGTCAACGAACACTCAGCCAAATCGTTCCTCCCACCCCGCCATCGCCATGGGTGAGCCAGTCAAGACCCCCGTGGTCGCGGAGGCCCATCTGGTCGACACCTACCATCCCCCCCACAAGATGCTTGAGAAGCATCCAAGCAAACCTCATCTGAATGGCCTCGAAGATTACCAGCGGCTGTACAAGGAGTCCATCACCGAGCCGGAGAAGTTCTTTGCGAGAAATGCTAGGGAGCTGTTAACTTGGCAGCGGGACTTCCAGACCGTCCGAACCGGGACTCTGACCGACGGGAATGTTGCATGGTTCGTTGAGGGCCAGCTCAATGCCTCCTACAATCTCGTCGACCGGCACGCCTTCAAGGACCCGAACAAGGTCGCCGTTATCTACGAGGGCGACGAGCCTAACCAAGGCCGAAATCTGACCTACGGCGAGCTCCTTCGCGAGGTAAGCCGGGTCGCCTATGTCTTGAAGAAGATGGGCGTCCGAAAGGGCGATACCGTCGCGATTTACCTACCCATGATTCCGGAGGCCATTGTCGCTCTCCTGGCCATTAGCCGTATCGGCGCTATCCACTCCGTCGTCTTCGCCGGCTTCTCCGCCGATTCCCTGCGCGACCGTGTCATCGATGCTCAATCCAAGGTCGTCATCACCACGGACGAGGGGAAGCGAGGTGGCAAGTTGATCGGCACCAAGAAGATCGTGGACGACGCGCTCAAGCAATGCCCCGATGTCACCGGCGTGCTCGTCTTCAAGCGCACTGGCGCCGACATCCCCTGGACGCCGGGTCGCGACCTGTGGTGGCACGAGGAGGTCGAGAAGTGGCCGACATACATTGCGCCCGAAGTCATGAACTCCGAGGATCCCCTCTTCCTGCTGTATACCTCGGGCTCGACCGGGAAACCCAAGGGCGTTATGCACACTACCGGCGGATACCTGCTCGGCGCCGCGCTAACCGGTAAATACGTGTTCGACATTCACGACGGAGATCGGTACTTCTGCGGCGGCGATGTCGGCTGGATTACCGGCCACACGTACGTCGTCTACGCGCCCCTTCTCCTAGGCATATCCACGGTGGTCTTTGAGGGCACTCCGGCCTACCCGAACTTTTCACGTTACTGGGAGATCATTGCGAAGCACGAGGTCACGCAGTTCTACGTGGCGCCGACGGCGTTACGGTTGTTGAAACGCGCCGGCGACGACTTCGTCAATGCCGACATGCCGAAGCTGAGGGTTTTGGGATCGGTGGGTGAGCCTATCGCCGCCGAGGTTTGGAAGTGGTATTTTGAAGTTGTTGGCAAGGAGGAATCGCAGATTGTCGACACGTACTGGCAAACCGAGACTGGCTCGAACGTAATAACGCCCCTGGCCGGCGTAACCCCCACGAAGCCGGGCAGTGCCTCGCTGCCTTTCTTCGGAATAGAACCAGCCATCATCGACCCCATTTCCGGCGAGGAAATCTACGGAAATGACGTTGAAGGTGTGCTGGCGTTTAAGCAGCCGTGGCCTAGCATGGCTCGGACTGTCTGGGGTGCCCACAGGAGATATTTAGATACATACCTGAATGTGTATCCGGGCTACTACTTTACCGGCGACGGAGCTGGCCGTGATCACGAAGGATTCTATTGGATCCG
AGGGCGAGTCGATGATGTCGTCAACGTTAGCGGGCATCGTCTGTCGACTGCCGAGATTGAGGCGGCCCTCATCGAGCACCATTCGGTAGCCGAAGCCGCCGTCGTCGGCGTCACCGACGAGTTGACCGGCCAAGCCGTCAACGCGTTCGTGGCCATCAAGAACGGGAACGAAGCCTCGGACGCCTTGAGGAAGGAATTCATTCTGCAAGTGCGGAAGAGCATCGGACCGTTTGCCGCCCCCAAGGCGGTGTACATCGTACCCGACTTGCCAAAGACCCGGAGCGGAAAGATTATGCGCCGTATCTTGAGGAAGATTCTGGCCGGCGAGGAGGACCAGCTCGGTGACGTATCAACGTTATCGGACCCGTCGGTGGTTGAGAAGATTATTGCTACCGTTCACGAAGCTCGGAAGAAGTAATGGTTGGATACGGATATAAGTGGGTAGGTAGGCGGCTCGATTGGAGAACACCTGACAGGGCCTTGGATCGCAAATGCGGGGAAGGGTCCCAAGACATCGGATAAGTTGGAGAATTATGAGTATAGTATGCTATTTGACGGCAACATTGTGGTTTGGCACAGCCACAGAGCGGAGGAAGACGGTACGCCACCGGCTCAGCAGCTAGTGGCGCGCGCCCTTTGGTGTGGAGGCTTTGAGGAATCGCTCGGCCAAGGGTGGGATAGTTGCGCTGATATGGACGGCGTGTTTTTTATTGATTTGTCAGCTTTAGAGCCACCTTATATCAGCTTGATTGTACATTCCTATAACGCGGCGGCTTTAACGCCGAGGGTGATCAAACAGGTCGTGGTTTGCCGTTGGT\n>XM_037547025.1 PREDICTED: Pygocentrus nattereri leucine rich repeat transmembrane neuronal 4 like 1 (lrrtm4l1), transcript variant X2, mRNA \nAAAGGAGCCAGTGCATCCTGGTGGTGCATGGTGCAATCATTGCATTGCTGTCCCAAACCCTTGGAGGAGAACGACAGGCTCTCTGAAGCTCAGGTGTGGGTGGCAGGAAATTTAAGGTGCTATGGTTTGTGCTACGAGATTAGCATGCCTCCTCCCTCTCCTTGTCTCCACTCTTCTGTTGCTCTGCTCTGGGGAGAAAACATGTCCCTACAACTGCCGCTGTGAGGGTAAAATCGTCCATTGCGATTCAGCGTCTTTCATGGATGTGCCAGAGAACATTTCAGTAACTTGCCAAGGTTTGTCCCTGCGCAACAATGACCTGCACACAATGCTCCCATACCAGTTTGCCCACCTTAACCAGCTCCTCTGGCTGTATCTGGATCACAATCAGATCTCATTTGTAGACAGTCGTGCTTTCCAGGGCATACGACGGCTTAAGGAGTTGATCCTGAGCACCAACAGGATTTCACAACTCCATAATTCCACCTTTCATGGAGTGCCTAATCTCCGCAGCCTGGACCTCTCCTACAACAAACTTCAGGAACTGCAACCGGGTCAGTTCCATGGTCTTCGCAAACTCCAGAATCTGCACCTACGCTCCAACGGGCTCACAACAATTCCTGTCCGGGCATTTATTGAGTGCAGAAGCTTGGAGTTTCTTGACCTAGGGTATAACCGACTACGTGTCCTCACACGCACTGCATTTCTGGGTTTGTCTAGGCTGATGGAGCTGCATCTGGAACACAATCAGTTCTCTCGGATCAACTTCTTTCTCTTTCCACGCCTCGCAAACCTGCGTGGTCTGTATCTCCAGTGGAATCGTATTCGGGCAGTGAACCAAGGCCTCCCATGGATTTGGTATACCCTGCAGAAGCTTGACCTGTCTGGCAATGAGATCCAGACTCTGGATCCTGTTGTATTTCAATGCCTACCAAACCTACAGGTTCTTAACTTGGAGTCTAACAAGTTAGCCAATGTATCTCATGAGACTGTAGCAGCCTGGATTTCCCTGACTACAATCAGCCTTGCAGGAAACA
TGTGGGACTGTGGGCCAGGCATTTGCCCTCTTGTTGCCTGGCTAAGGAATTTCCGAGGAACTAAAGATACAAGCATCATTTGCAGCAGCCCCAAAAATCTTCAAGGGGAAAAGGTTATGGAGGCAACAAGAAATTACATAGACTGTGAAGATTTCGAAATCATTCCACAAACACCATTTCCTCACCACACTCTGGAACCAACTATGGAAACTACTTCTGCACCACCCTTACCTCCCACTACTCCCCCACCACCCCTGCCTCCACCTGCCTCTGAGGCACCCATCCCACCACCCCTAGCTCAACCCCTTCCTCATCCTACTATCTACAACCTTGCTGAGACTCATCCTAGAAACAGCCCTCCACAGACACCTCCACCTTCCAACAGCCTGCTCGTCACTCCATCCCCAGAACAAGAGAACTTGGCATTCCATAAAGTTGTGGTGGGGGCTGTGGTGCTTTTCTTCTCAACATCACTCGTCTTGACAGTGATCTATGTGTCCTGCAGACGGTACCCTGGTGCCACCAGGTTGTTGCAACAGCGTTCAGTCATGGGACGAAAGCGCCGGAAAAAGAGTCCCGAGCCAGAGCAGAACCTGAGCTCCCAACTGCAGGAATATTACATGAGCTACAATCCTGCCGCCACACCAGAAGCCATGGATGTGCTGGCCAATGGGACTGGTACTTGCACCTGTACCATTTCCGGCTCCAGGGAATGCGAGAATGAATACACGTGTCCCAGGCCACTCCCTGGAGCCTGGATCGGCGACATCCCCACCATTCACTAGGAATGTTTTCTCCACCAATGAGATTTCAATAGGCAACAGGGTTCCAGCCTACAGCCTCTGCATCCATCACTCTACGGCCTACGCTGCCATTTTTTTTCTTTTCCCTGTCATTTATGGAACGTTATCCACCATGGACATGTGAAGGGACATCTAAAAAGACAGCAGGAACGCCTCCATCACGCATTTTACTAACACGCACGTCACACTTCTTCAAGACGCCTCACTTTATCCACTCTCTTTTTTGCCTAGACAGCTCTTTCTCTAGATCTAAGCCTGACTAGGCCTTTGGTCGAGTTGAACATACAGGAACAGGATGAACTATTCTATTCTACGAACAAAGCCACTGTAACAGCAATGAGAGTGCATGGGAAGATATCTCCTGGACTTTAAGGAATATCCTCAGCATCAGAGCGTATGGATTTTCCATATGACAAAACATCATCCATCAGACAACCATTGACTGCCAGTCAACTGATACATTAAGCCTATTGCTGGACTTAACTTATTTGGTCACACTTTATGTGAGGGCTACCTACATATGGACCTTATAACACACTGATAAGCATTGAATAACATGTTTATAAAGTAATGTTTGAGTATTTATAAACAGCTGATATGAGTAATCACAGAATGTGTAGGCACTGTGTTGACATAAGAGGTCTTAAACCAATATAATGGATGTTTTTTTTTCATTTGTATCATTCCCACATAATGGATCTTAAATGCCAAGACCACTGTTTATGAGTTTTAAATATTTCTTCTTGAAGTCCAATTGTACAATTTCTATAAAGGAAAACCAGTATGGCTGCAGATACTAACTCCTTAAAGTAGAATTTTTCATTCAAATAAAATAGCATAATAAATCAAAGTGCTTTTACTCATAGTAAACTGCATTTAAGCAAGCAAGCAAAGTTTATTTATATAAAGCTTTTTACAACAGATGTTGTCACAAAGCAGCTTTACAGAGCAATCAGTATTATAGAAAGAAAAGAAAAGAAAATCCGGGACCAAGCCCCCATGAG\n>XM_023033177.1 PREDICTED: Olea europaea var. 
sylvestris ferredoxin, root R-B2 (LOC111404360), mRNA \nATGAACATAGGATTTGAGAGAGATTTGTGTTTGCTGTTTGAGATTTGGATCAACGATGGTGGTGGTTCGCGGTGGCGGCGAGTGGTGATGGAAAGGAACGGATCCTACATCCATGCTTACAAGGTACTAATTGAATATGAAGGTAAAACAACTGAACTAGAGGTTGAGCCAGACGAGACAATTCTGTCGAAGACACTGGAAAGTGATTTGCCAGTGCCATATGACTGTNAATGCATGACATGCCCGGCTCAANGAATGGACGACCAAAGTGATGGGATGCTTAGTGAGGATGTTGAGGAGAGAGGTTATGCTTTATTGTGTNATTGTCACATTAGAATCATACCCGAGGAAGAATTGCTCTCTCTGCAGCTAGTTACTTCCAATGACTAATAAATCTGTTGGTTGTTAAAATTTTCAGTTTTGAGGCACTGCTAATTGTTACTGTTTTTCTGCATTAAATCTATAAGAGGAATGTGCAAAGTGAGATTCTGAAGGCAAAGGTTAACGATACCTTGTATTTACTTGCTGGAATTTCTATTGTTTGAAGAATATTTAGGCTTCCACGTTTAGATTTCTCTAAAAGCGTTCTCTCTGACAACCAAGAATGATAAAATCATTCGCATTCAGTCTAAAATTTAAGCACAAGAAGATTTAGTTGGAAACACCTGCTACCATTAAACAAAGTTCTTCATAGATAAAAGTAGCAAAATAGGACATGTATTGAATAAATGCATTGTGCGTGGCTGGTATCTATCTATTATTACGGGTTCAATACTACTTCTCAGAGTTGAATGTAGACATATAAGGTCATATAACAAATTTTGGAAGTATGGTCAAATGTTAATGAACAGTAATTCATCCATGCGTGTATAACAGTAATTGGACACAATGTGAGTTCAGAGGTGACTAACAATTAAAAAGTAGACACTTCTCCATATCCATGTGGAAGTATGCTAACAAAGCATTCAACACTTATGTTCAGTGAATAAATATGATCGTATCAAAAATGTACTCACTGACTCCATTTGATGTTGATGCAGACAGCAAGCACTTCAGAGTAGCTCCCGCAAGTGATAAATAAACTCGGTCTTCTTCAAAATTTAGATCCTAGGACATTATCAGAGCCCATAAATCCAGTATAGCATATGGCTAACCACATTTTGTATCTCAATGAAGGCCATAACACGCAGTATTACTGCTGAGTTCTCAGGGCAAGGCTCTGGATTTTCTCTGCTCAAGTTTCAACTTCACATCAATTCCATTTATCAATTATGGACTTGAGTACAATCTGAAGCTTCCCTTCCAATTTCTCCCCTTTCCTTGGAGTATAAACCACATTATGGATATCATCAGCCAAGGCCCTCTGAGCCAACAATTCCCCAACCGCAGCACAAGCATTTCTATTCTTAGTCGAACCCATGGCCTTGGAAATAGAATGCACCACAACCAGAGGTTTGCTAGAATTTCAGATCAAAAGAATGCTCTTTCATTCAATATTCATTGAGACTCGTTTGTTGACAGCCTATTGCACAGCATTGTGTTTGAACCTTGTGAAAAGCGAGGAAACTCATCTAATCCTTACTTCCCCATCTGTTTCTCTGGATCTTGAACAGGTTTCCTAGGTAATCCCCAGCTCCGTAGATTGTTCTTTTGCACAGGGCCAATTCTTGGTATTCCTTCACTTTCCCCTTCATATAAAAAATTACAGTATCCGAAACCAAAAGTTCATGATGCATATTTCTCTTAACTGGTGGTTTTCTGGTCACGACGGTTACAGTTAAAGTTCCATTAAAGAGCATTTCCACATGGTAGAACCTTCTCAAGGAATATAAGGTTTTCAATAGGCTGATCTTGAAGCTGCCCAGTCAACACAATTAAAAGCAGAGTACACAGCACGTGCAACAAACCCAGCCGTTCTTTGCTTACAATGGTAAGTACCTCATT
ATAGATTCTTTGGTCGACTATAAATGCTTCACAGCCTTGTTAAATATTTGGATTTTTATACTTGGTTCTAGCTACCAGAAAAAGGACTTCGAAACGAAGACTTTAATATTATTGGTCGCATCATAATACGCATAATATGAGTTTACAATCTCCACCTGAATGTAAATGATTGAAAGGAGAATGCTACCAATCAGGACAAATTTGACCTTAAAGAGGATAAACAAAACTTCTACTTCAGATTCTTTCATA\n>XM_017942333.1 PREDICTED: Habropoda laboriosa cyclin-T (LOC108578915), transcript variant X2, mRNA \nACAAGTATGAGTTTGGAGTGGAGTTTCCGGTTAGCGTAGTGACGTGAAGTTTTCAACGTGTTGCTGTTGTGCGTTGTGCGCCCGCCGCCACTATCGCGACCGCCGTGAAGTGCGCATCGTTAGTACCGAGTTGTGTGTACATATAAATGGCGGCTGACGAAAAATGGTACTTTACGAAAGAACAGCTTATAAACACGCCGAGCAGAAGATGCGGCATCGACGCGGATAAGGAACTGAGCTACCGACAGCAGGCAGCGAATTTCATTCAGGATATGGGACAGCGGCTCGTGGTGACACAATTATGTATCAACACAGCAATAGTGTACATGCACAGGTTCTATGTATTCCACTCGCTGTCACATTTCCACAGGAACGCAATTGCAGCAGCAGCACTATTTTTAGCAGCAAAAGTAGAAGAACAACCGCGCAAGTTAGAACATGTTATCAAAATGGCACATATGTGTCTCCACAGAGATCAGCCCCCACCTGATGTCAGGTCTGAGCAATACCTTGAACAAGCTCAGGATCTGGTTTTCAATGAAAATGTCCTACTACAAACTTTGGGGTTTGATGTCGCCATTGATCATCCCCACACACATGTTGTTAGGTGTTGTCAACTGGTTAAAGCGAGCAAGGACTTAGCCCAGACTTCATACTTCATGGCATCTAACAGTTTGCATTTGACAACCATGTGTCTGCAGTACAAGCCAACCGTAGTTGCCTGTTTTTGCATACATCTTGCGTGCAAATGGTCCAACTGGGAGATACCACAAAGTACTGAAGGGAAGCACTGGTTCTGGTACGTCGATAAAAGCGTAACGTCTGAACTTTTACAAGAGCTTACAGCAGAATTCCTCCATATATTTGATAAGTGCCCGTCAAGATTGAAACGAAAAATAATGAGCATATCCGCCAATCAAAGTCCAAGCATTAATCATCCTAGTTTACCGAATTCACCCTTTGATGCGGAACCTCGCAAGGTACAATCTCCTGCGACGACGGCCGACGGTGGACCTACATTCCATTCGAATCGACCTCATCAGATGGAGAAGCAAGAAGAGAAGAAGCAAATTGCACCAGCATCCTCAAGACCCCCTGTCGATTATCGGGAGTATAGAGAGAAGAAGGAACGCGAGCGTTTGGAAAGGGAAAAGGCGTCGGTTACAACGACAGTTGCCCAGAGTCATGTGTCAGATATTAATAAGCATCATTCGCATCACCACAAACTCGTATCTAGTACAAATGTGCTAAACAAACATCCACTGCCCCCTGGACAGAAGGCGCTTCACCACAATCATCACCACAGACCAGATATAAAGGTTGGACAACCAGTACCTCAGAGGCACTCAAGTAGCGCTCAAGCTAGGGAACCAAATCGCGATCCCAATAGGCAGAGGTTACAAAGAGAGTACAATTCGAATACTGGTACAAGTAGCAGTAGTAGTAGTAGTGCTCTTCATTCTCATAGTCACGCGGTATCGAAGGAGTCAAGTTTGGATAATTCATTGACGGATTCCGCCACTCACAGATCGGATGTCGGAGCATTGCAAGAGCCAACGTCCCATGGAAGTATACAGGAGAAACTTAGTAATAATAACCATAGTGTGCACAGATTAAGTGCAGTAGAAAGCAAATACCAGGGTCATG
ACAAACGAATGTATGATCCGAGGCATAAACCTGTTGAACATAGGAAAGATAGTGAACAAAAGCCATACAAATATCCCGATCCAACAAGAGAATATCGACAAAAAAAGTCTGATACGTTAGAGCAGAGGTGTGAAGAGGTGAGGAAGCTTATCGAGAAGCCATTACCTCCGCCCAAGCCTCCACTCGACGTACCGTACGCTTCGAATACACAGAAGCCACCACATCATACGAAATACAATCAATCGGAGAAACTACAGGCTAGCAGTGGCGCAGTTTCTACCGACGTGAAACTTCCCACTGGCCAGAGTTCGTTTTCACAGGAAAAATCACCAACCAGTTCCAGTTCGACCTCGTTGCTTACACAGAAGTCGTTAACCTCGAAGACGGTGTCCAGTCAGCACACAGCTCACGGTGTGTCCCAAATAATAAAGGATACGATTAAAAATGGTAGTTCTCAGTCGTCGAGTTTGTCATCTTTGAACAATCTCGACGATCAAAAAACTGAAAAGCGACCACGGCACGATGACATAGAGAAAAATTCGTCTGACATGCAGCAAAGTGTGTTACAGACACCTCCTAACAAGCCGAAATCGCTATTCAGTCCAGAGAAAGTACCAACGCCTCGCGAATCTCATTCGCAGAGGCCTAAGACTAAGCAAAAGACGCCGCCTTCGGCTGCAAAAGTTCCTAAACAAGAACGCGTACCAGATACGTCGATAGGCTTTAATTTAGTATCGCCGTTCGCGAGCCCGCCAGGCTTGCAACAGCAAGAAACACAAACAGTTAAACGATTGGCCAGTGATGTTTCCACAACATCCTCTCACAAAAGGCATCGTACAGGCAGCACCACCACCGAAGTAGGACAACAGGTTCAAAAAGTGAAAATAGACGATACTTCGAGTTTCGAGGCTGCTAAGATGCTCGGTAGGGTACCAGAACTGATACAACCTATCAGAGATAATCCATCGGCAAATGGTAGAGCCACTCAGATCGCGAACGACATGAAACCACCGGAACTCATCAGACCGTTCGACTCTGAGCCAACGATATCACGCTTCGGTACAGTGTCTACACAGCAACAAGTTTCGTCGAATCAACAAGGTCTGACCAATGGTCTGGACAACAATTTAGTGAAGCAAGATTCTCAGGAGTTTCTAATTAAGAAGGAGCCTACGTACAAGACGGACTTGTCAATGAAAGTAGAACACTCCCAAGCTAAAGGCGAATATTTGTCGCCAATGAAATCCGCTCAAAGTATAAGTGCTCTGCTTCAAGAGCCTTTAGCACCAATGCCATCGTTGTTGCAGAACATGCAGCAATTTAGTCAAATACCGTCGCAGCAAGTTCACCAGGATCAATTCCAGCAACAGCAGTTACAACAGCTTCAGCAACAGCAATCATCGCAACAACAACACCAGCCATCTATATCACACTCGATGCTACTCACACATCAAGAACCCGTTCAAACTCAATGCATGTCTTTGTCATCGGTCAGCGAGCCTGTTATAGCGTCGACCGTTGACATAAGCGCTCTCTCTATTCCCATACAGACCAGTACAGAATCCATACTATCTGTACCAACGTCGACAACCATAACCGTTCCACCTCCCGCAGAAGAAAAGAGATCGGAGCATCACAAGAGCGAGAAGAAGAAGAAGAAAGAGAAGCATAAACACAAGGACAAGGATAAGAGCAAAGAGAAGCACAAGCACAAGCATAAAGACAAGGACAAGGAGAAGCACCGGGAAAAGGACAAAGAGAAGGGCGATGAGACTGTACCTGCGGTACCTATTAAAATCACTATTCCTAAGGACAAATTGAATCTGAGCACAGAATCGACAAGTAGCACCGGCGGAAGTACAATTCCACCGGATAAGAACAAATCACCCCAGAATACAAGCATCAAGATCATTATCCCGAAGGAACGGTTAAAAGGTACCGACAGTGTGTCAAGTTCACCGGCTCAGTCGATGGTCCAGGCACCGTTGAAGATCAAAATC
CGTACGGATGGAATCTCAAGGAGTTCAGGTGCTCCGTCGACGACGAGCAGTACGAGCAGTAGCATCGTGCCGGAGTTCACGAACGAGAGTCGTAAACGTGACCGTTCGGAGATAAAGGAGAGCCCAACTACCAGTGTTCCACCAACGAAGAAGCAATCGCAGGTCTCGTCGGCGGGTTACGGACAGCATCGGCCTGGAGAACGGCAGAACGGCAGACACTATAGTTCAGGCAGCAATAACAAGGAGAAACACACGTCTAGCCACCACAAAAGTTCCAGCAAGCTATCGCAGTCACAGCAGTCTCACACGTCGTAG\n>XR_004353595.1 PREDICTED: Danaus plexippus plexippus uncharacterized LOC116771400 (LOC116771400), transcript variant X1, ncRNA \nTCCTCAATACCCTCACCGGGTAATGCACGGCTCTCAATTAAACTCTAATTTGTTAATAATTAATACATAATGTTTATTGGGCATACTAAAATCTGCTCTAGACATGCAATATAGACAATTATAGGGGAGCGGTAGACTGGCCACATCTCAAATTCTGAACGTACTCCGCTCACATGGACTGCATCGTAATATTGACCCGCGTTACACGCACTGGAATTCGTCCTCATTTACCGCCCACTTGGAATTATTGAGGCGAGAAATGGATGATGTCTCTAACTTGAAAATATCAAAGTTAGAAGAGTCAAAAGACGGGTTGCCGAAACCAGAAACGATTGAAGATTTTGAAAGAACGAGCAATTGGAGTCCTGAAATAATTAATTTATAAAAGAAAAATTTTGCTTCCTTCGAATATTTTTGATTACTTTTAAGAACTTGATGAAATACACACAGAGATGGAATTCATAACGAATTTCCTTATTATAAGAGCTTTTATTTAGTTTCCAAAGCAAAATACACTTTTCAACATACTATGCAGATAACTGGCTATTGAAATAAACATTCAGTTCGCGAGCATACATTGTAGTTCAAACAAGCGACATATGG\n>XM_004253934.1 Entamoeba invadens IP1 hypothetical protein (EIN_093680) mRNA, complete cds \nATGATGAGAATCAAAGATGCATTGATCAATACTGGAGGAAACACATCAAATATAAATAAAATGATTGAAGATGTTAATATTGCTCTTCAAGCAATATCCATTGAATTAACAATTCAACAACCTGCAATAAATGAGCCACACTTTGTTTCACAACAAATCTGTGAACAAAATCCAAACATCATGATAAACACTTACAACGATAATGGTATCAATGATGAGCACAACGATTCATCTTATCCAGATAGAACAGCACAACCCAACACTGCTACGCCCCCTATGATAGACACAACACAAACACCAATAGGTGTTGTTGATCAAACACCATTTGATCTTGAAACAAACTTAGATAAGAAACAGACCACTTTTGGTGATATCATGGGTCATTATGACCTTGTTTATGGAAACGATCCAATTGATGGCAGCCTGGAAACTGAGCACAGTGGAGGCGAAGATGAAGCTCATGAAAATGAAGAATATGAAGGAAGTGAATGCAATGAATGTAACGAAATAGAAGACACACGAGTCCATGAAATAATGAGTCAAGCATCCGGGATATGGCAACAGTTGTCTTCTTCGCTTATTAAGTCACACGCATCAAAAAAACCTCCCGGAAAATATCGAGGTTGCAGATGA\n>XM_004439747.2 PREDICTED: Ceratotherium simum simum succinate dehydrogenase complex assembly factor 1 (LOC101397205), mRNA 
\nCGGATAGCCGGAGGCGGGAGGCGGGAGGCGGGAGGCGGAGGCGGGGGCGCGCGGGGCGGAAGTGCCTGCTGCCTGGCTGCTGGCGTCTGGCGCCGGGCGGCCGCGCCGCGGTTGGTGGGGCCTGCGCTGCGTGCGACCGCGGCCCCGCCGGCACCATGAGCCGGCCCAGCCGGCTGCAGAGGCAGGTCCTGAGCCTGTACCGCGAGCTGCTGCGCGCCGGGCGCGGGAAGCCGGGCGCCGAGGCGCGGGTGCGGGCCGAGTTCCGGCAGCACGCCTGCCTGCCGCGCTCCGACGTCCTGCGCATCGAGTACCTGTACCGCCGCGGGCGGCGCCAGCTCCAGCTGCTGCGCTCCGGCCACGCCACGGCCCTGGGTGCCTTCGTGCGCCCGCGGGGCCCGACCGAGGAGCCCCGCGGCGCGGGGGCCCCGGGGACCCCGCCTGAAGATGGTGACGGCCCGAGAAGCCCGCCCGACGGCATGGGGTCACCAGAGACCTCGCGCGATGGACGGTGACAGGCAGAAGAGCTCACTCGATGGTGCAGGGAAGACGGGGGGCCAGCCTAACTGCGTGGGGGGACCAGGGAGCCCGCCTGATGAAAGGCGAGAGGTCTTGAGAGACTAGCTCGATGG\n>XM_013238176.1 PREDICTED: Biomphalaria glabrata uncharacterized LOC106077421 (LOC106077421), partial mRNA \nAGAAATTCTATATTTGGTCAACATGCTTCTAATTAATTCTTCAATATGCTTATTATTGATACTTCTTCTGCTTATGTTTTTGTACAATTCCTAAGGAAGAAAGAAACTGATACAAGGCTTCAGAATGGATACGCTTCATTTGACAACAGTGGGAAGACAACTGACAGTGTCAAACTATCAACTGGAGAAAAAACACCCTTACTGAACAGAAGATCCAATGTAAGGACATCATTAGCCGACGAAACTGCCAGAACTAGTGCTAGTGAGAAAGAAAAGGATAATGAGGACCATCTAGTTCAAGCTTCATTATTTAAGGTGTTGGTGAAGACTTATGGGATAGAATTACTTAATGCTCAAGTCTGCAAGTTTGTTTATGACTTGCTTCAATTTGTTAGCCCTCTGTTACTTAG\n>XM_016498712.1 PREDICTED: Sinocyclocheilus anshuiensis protein FAM150B-like (LOC107697862), transcript variant X1, mRNA 
\nGTCTGAGAGCCCCAATAAATTGACGAGAATCGACGGCGAATGTCTCGAGGCGTTGAAGACGCGCGCGCACAGCGTCCTCAGGAGCTTTGACTGGAGTTTTCTCAAGTCTCGGAAACATCAGAAGGAAGTCTGACCACTATAACTTCCCACGCTTGAGCACATTAAAGAACGATTCGCTTTAAAGGGTAGCGCTCTCTCTCTTTCCCAGCGCGTTCTGCGAGCCTCGCGTGGGGTTAAATAGGCACCGGACGCTCAGTCGCCTCAGGCTGTGTCGACTGAGGGAAAGAAACGCGGCGACACAAGCGCCCTCAGACTGCGTGATCCAGGACTTGGGCAGTTCGGGAGCGATGCGCGCGCTGCGGGCTCCGGTTCTAGTAATGGGGCTCGTCATGTTAATCTGCACTACTGCACAAAGCGACGCCAGCGCGAACAAGGTCGAGAAAACGTTCAGACGGATAACGGACATCATGAGACTGGCGGAAAACAGCGTTGACGACGCGAGCGTGCCAAAGGACACTCATCGTCTCAAAACGGAAACCGGGGAAACAATTTTAAAAATCTTTCCCAGAGACCTCAGAAAGAAAGAGAAGGTTATCAAAGTCTTAACAGGTCCTCTTTATTTCAGTCCAAAATGCAGGAAGGACGTCTACAGGCTTTATCATAACACCAGAGACTGCACCATCCCTGCATACTACAAAAGGTGCGCACGACTCTTGACGCGACTGGCAGGGAGTCCGAGATGTCAAGAGGGTTAACTGTACCAGATTCAGAGAGGACACATGCACTTAAAGCTTTTATGACTGAGAACACATTCTAGGATTAGATAACTTATCCAAGCTATTACAGATAAACCTGCGTGTCTTAGCAAATAGGATGTGATTTAAGCATGTAAACAAACTTAAGTCAGTGCTTTACATTTCATGGTGGGTTTTTCCCCCCCCAAAGACCACTTCAGAGGAAGCACATGTAACAAAACCTGTTTCCCAATTTTTCACAGATGCATCCAAGTGCACACATGTATGCGAACACAGCCAAGTCTGAAACAGCACTAAACTTCACTTCCTTTATCAAGCAGGTTGAAGCCAAACCAGAGTGACCCAAGGAAAAAAAAAAACAGCAGTCAAAGTGCCTTTGGACAAGAGAAGAGAATTTAAACCAACACACAACAATCCACATAATCAGCACATCTCGTCCAGAACACTGCTCTGCCTCTCTGGAGAATAGATGTGGGAAAGTATTGACAGAGAAGTAAACGGACACGGAATAATGGGATGCACTTGCCCAAGGACAGTCTGATGGACTCAACATGGAGCCAATGTTAAAACACAGGACGACAGAGAAAGAAAACAGAAAACGTATCTGGCATAGTGCGTTCTGAACCTGTCTGCCAAAAAAGAAAACCATTTTTCCATCGTTTCATCATGAAAAAGGGATAGCCATGGTTTTGCGTTTCGATATCAGATTATCGAGACTCGTCATTGCTGATGTTTCGCACGACATGCCTCGATGGGGTTACAATTCAGAGCCACGATGACAAATTGAGTTAGTTCGCGGCAACGAGAGAGCTTTGCTTTTCTCGGTGCTAGAACTGAAAATCATTAATTGCATGAACGTTTCCTTTTGCTTCTGTTTGCCAGCAGACAGGTAGATTTTTGCAGTAAATCTGTGACCAAAAGCTTTTAGTTTTTGTGTGAGACTATGAGTGTATGACTGTGGAATATATTCAATATATTTTGATATGTAAATGTTGTACAAATGAGACTTAAAAATCCCTATAACAAAACATATAAGCA\n>XM_010619662.2 PREDICTED: Fukomys damarensis sorting nexin 31 (Snx31), partial mRNA 
\nGCGCTGGGGGGTCGCTACGTGCTGTACTCCGTGTACTTGGACGGGCTCCTCTTCTGCAGGGTGCGCTACAGCCAGCTGCACCGTTGGAACCAGCAGCTCAGGCGGGTCTTTGGAAGCTGCCTGCCGCCCTTCCCACCGAAGTACTATCTGGCAATGACCACATCTATGGCAGAGGAGAGGAGGGCCCAGTTGGAACAGTATTTGCAAAACGTAACTGCAGACCCAAATGCCTTGAGGAGTGATGTCTTCATTGAGTTTCTACAGCTGGCACAGCTGAACACGTTTAACATCTCTGCTGAAAAAGCTTCTCTAGATATATTTCTGCCCAATGGAAGAAGTGTTAATATAGAAATTCTGACATCAGATACTGCTGAAAGAGTCCTAGAGGTGGTGTCACGCAAACTCGGACTGAGTTGGGAGCTCTTGGGCTACTTCGGCCTCTTTCTCATTCGGTTTTACAAGGAGGGCAGCCTGTCTGTTGTGAAAAAGTTGGCAGATTTTGAACTCCCTTATGTTAGCCTTCGAAGTTCTGAAGAGGAAAACTGTAAGGTTGGACTCCGGAAGTGGTACATGGACCCAGCCCTCGACTCTGTGCTGATGGGCTGCAGAGCGGCCGTGGAATTGCTCTACATGCAGGCAATGCAGGACATTGAGAAAGAATGGATCAAGCCCACACAGGGACAGAGGCAGGAATTAGAGGCTCTTCAGAAAGAAAACAATCAAACCAAGTTCCTGGAGCTGTGCCGGGAGGTGCAGTGCTATGGATACATGCAGCTGGATCCTTGCCGCTGTGATTCCCCAGAGCCAGGCTGTGGGGCTGTGCTCTCTGTTGGCAAAGATGAGATCTGCTGCTGCGTGACCCTGCCTGACAGCCGGACACAGGATGTCATCCTCCAGATGAGCAGCGTGAAGTGCTGGCAGGTCACTTTCCTTGGGACTCTGCTGGATATGGATGGGCCCCAGCGAACTCTCAACCAGAACTTAGAACTCAGATTTCAATACAGTGAAGATAATCACTGGCAGTGGTTTATCATTTACACCAAACAGGCATTTTTGCTGAGTAGCTGCTTGAAAAAGATGATCTCAGAAAAGATGGCAAAGCAAGCTGCTGAGAATACAGAAATGCAGATGGAAGTTCCGGGAACAAGAAAAAGTAAAACATGGCACATTCAGCAAAGCAAGCAAAAGAAGCATTCTAGTTTTCTATCAAGAAAACACAAGATCAAGAGAGCTGAAGGTGTCTGTGTGTTTGGAACCATAAAGGAAGAAGATCTTTGAAGAAAAGTCTCACCTTTGAAATGTCCCCTAAGACATCTCAAGATGGTGAAAGAGCTCGGTGGTGGGGGGTGGGCTTCCTGCTGTCAGGAAATAATTGACTTCTTCCTGTGTCTTCTAATGTTAAGATAGACTCTAGTCGTCAGGACTACCACAGCATTCTATGTACATTTCAAGAGTAAAAAATGTAAGAACTAAAGTTATAGAATTTGTTTTTACCAGCTCATCAATCACAAATTGCTGAATCAATTAAACAAATACGAACTTCACTCTCTTCCCCCCAAGAATCCATTCTTCTCTGGCTTCATGAAGTCCTCTGAATGGTCCCGTATTACGTAATGAAAGTCTTGCTCCAAAATGTTACCAGCGTTTTGGGCTCAAGTTCTAAAGACATGATTCATTAGCTAAGGAAAGCTGGGCTCTATCTAGGAAGTGGAATCACTGGGGAAGAAACCCAGACTTCTCCGACCTGTCCGCAGAGCTGCGTCAAGGAGGCGTGCAGTGCCGACTTGTTTCCTTACCTAGGTCGGAGGTACCATATGGGCAACCTCAGGGTCATATGCTGTTTTGAACATTTCTATTTGGGAAAGCAACACTGCCTTGTACTTGACATAAAATGCCTTTTAGGTCC\n>XM_017738153.1 PREDICTED: Corvus brachyrhynchos solute carrier family 23 member 1 
(SLC23A1), partial mRNA \nGCCACCGCCCGGCCGGTGACTAAAGTCCTTCCCACGGCCATAAAACCCCCCCGAGCAGGGCCATCGCCGCCGGGGACGCGTCGCCGGAACATGGGGACCCGCTCAGGAGACCTGGCTCAGCCCCAGAATGGGAACGTGGCTCTGGCCCCCGCTGGCTCCCCGCAGACCCCTGGGAAGGAGCTGCCTGCGGCGGGCAGGCAGGACCACGGGGCGGGCACCAGGCCCCCCCGGCCGGAGATGGACATGCTCTACAGGATCGAGGATGTGCCCCCCTGGTACCTCTGCATCCTGCTCGGCTTCCAGCACTACCTGACCTGCTTCAGCGGCACCATCGCCGTCCCCTTCCTGCTGGCCGAGAGCCTGTGCGTGGGCAAGGACCAGCTCACCGTCAGCTACCTCATCGGCACCATCTTCACCTGCGTGGGCATCACCACCCTCATCCACACCACCGTGGGCATCAGGCTGCCCCTCTTCCAGGCGAGCGCGCTGGCTTTCCTTGTCCCCGCCAAGTCCATCCTGGCCCTGGAGAAGTGGCGATGCCCATCTGAAGAGCAGATCTACGGCAACTGGTCACTGCCCCTCAACACGTCCCACATCTGGCAGCCCCGCATGCGAGAGATCCAGGGGGCCATCATAGTGTCCAGCCTGGTGGAAGTGGTCATCGGGCTGCTGGGGCTCCCCGGGGCACTGCTCAGCTACATCGGGCCGCTGACCGTCACCCCCACCGTGTCCCTCATCGGACTCTCCGTCTTCCAGGCGGCTGGAGACCGGGCTGGCTCCCACTGGGGCATCTCTGTGCTAACCATCTTCCTGATTGTCCTGTTTGCCCAGTACCTGCGGCAGGTCGCCATCTGCCTGCCCGGCTACCGGCGGGGCCACGGCTTTGTCCTGCTCCGCATTCAGATCTTCAAGATGTTCCCGATCATCCTGGCCATCATGGTGGTGTGGCTCATCTGCTACGTGCTGACCCGCACCGGAGTCTTCCCCAGCCAGCCCGGGGAGTACGGGTACAAGGCCAGGACGGACGCCCGGGGCGAGATCCTGTCCGTGGCGCCCTGGTTCCGCGTCCCCTACCCCTGCCAGTGGGGGTTGCCCACGGTGACCTCAGCAGCCGTGCTGGGCATGTTCAGTGCCACACTGGCGGGCATCATCGAGTCCATCGGGGACTATTACTCCTGTGCCCGGCTGGCAGGAGCGCCCCCGCCCCCTGTGCACGCCATCAACAGGGGCATTTTCACCGAGGGCATCTCCTGCATCATCGCGGGGCTGTTGGGAACCGGCAACGGCTCCACGTCCTCCAGCCCCAACATCGGCGTCCTGGGCATCACCAAGGTACCGGGGCCGGGGAGGGTCCCGGCTCGGCCG\n>XM_007330897.1 Agaricus bisporus var. 
burnettii JB137-S8 hypothetical protein (AGABI1DRAFT_85928), mRNA \nCAACGATCGATTTGCTCATCGACACTGACATCCTCAAGACATGGCCCCCGCGAACACCAAGAAAAAGACTGGCGGCAAGACTCGCTCTGCGCTGCAAGACGTCGTCACCCGCGAATACACTGTCCACCTCCATAAACGCGTGCATGGCCGTTCCTTCAAAAAGCGTGCTCCTTGGGCCGTCAAATCCGTTGTCGACTTTGCTCAAAAAGCTATGGGCACGGCCGACGTTCGTCTCGACCCGAAGCTCAACCAGGCTGTTTGGGCCCAGGGAATCAAGTCTGTTCCTCACCGGATACGTGTAAAGCTCGAGCGAAAACGTAATGATGATGAAAACGCAAAGGAGAAACTCTACACCTACGTCTCCCATGTTCCCGTGGAATCTTTCAAGGGTCTTCAAACGACGGTCGTCGATGCAGAGTAAAAGCTTAGTTATATAGGTTCTGCCGGTCTTCTATTCGTGTTGTCGCCTTGCACCTCATGCCAGTCACATATGCATGTTCTACGTCCCCCATATGCCATGCCACCCAGGTTTTTAAAATCAAGGAACAAAAACAAAACAAACCTTTTCACATGGGTGCTTCGTGTCAATGTCATAATTCTGCGTGCAACACGCTGCCTACTTCTTTCCGGCCGTAATTCAGAAAAA\n>XM_027301384.1 PREDICTED: Coffea eugenioides uncharacterized LOC113758607 (LOC113758607), mRNA \nATGGCCATCAGGCAGAGGCCCGACGAGTCCCTAAGGAATTTCATGACCCGTTTCAATACGGAGAGCTTGCAGATCAGAGACAAGGACGAAAAAGTGGTCATGGCTGCCTTCATGAATGGGCTCAGGGTGGAAGACCTCTTCTACAAGTTGGCCGAGCAGCCTCCTGAAAATCTGGAGGAGCTCCTGAAGAGGGCGCACGCGGCCGCCAATGCTGAGGAGGCGGCCTGCCTGAAGAAGGAATCAGATCGGGAGCTCGGCGATCGGAGAGGACGGACAAACCCCCCCGAGAACAAAAAGGGTCTGGCCAAGACGAACGTATTTGACCGGCTCTCAAAGGAAAAGGCCCCTGCTCCGACACCGCTCCCAGAGAAAAGCTACACCCCCCTGACTCGGCCCAGGGCCCAGATCCTGGCCGTCATGGAGGCAGAGGGCCTGGGAGGTCGGCCACCTAAGATGGGAACACCTCGGAACAAAAGAAATCAGGACCGGTACTGTGCCTTCCACCGTGATGTCGGGTATAATACGGAGGGGTGCTGGGCCCTGCAAAGGGAGATTGAGGATTTGATCCAGCGCGGCTTCCTGGGACGTTTCGTTCAGCAAGGTCGGCTAGGTCGGGAGCTAGGTCGGACCTACCGTGGAGACAGGGACGAGGGCTAG\n>XM_036118028.1 PREDICTED: Halichoerus grypus purine nucleoside phosphorylase (LOC118551879), mRNA 
\nGATTAAGTTGTTAGCCCAGCCTTGGGCAGTTGAATCTGGGTGTGTCACCATGGAGATAGGGGCCGGCTTGCGTGTTCGGCTGCCATTGGCTGGGGACGCCGGGCTGGGATAGAAGCCAGCCGCGAGTAACTGTGCAGACACTGTGCACAGCGCTCCCGGCGAGTACAGCTCAGCGCGGCGCTGCTCAGCGGACCGGATCCCAGAGGCCAAGGGCGGGCTCCTCGAGAGGGCGGAGGCGGCACCATGGAGAAGAGATTTGCGTATGATGATTATCAGAAAACGAGTGAATGGCTTCTGTGCCACACCAAGCACCGACCTCAAGTGGCAATCATCTGTGGCTCTGGGTTAGGAAATCTGGCCGATAAATTAACTGACAGCCAGAGCTTTGACTACAGCGAGATTCCAAACTTTCCCCGAAGTACAGTGCCTGGTCATGCTGGTCGACTGGTGTTTGGGTTCCTGAATGGCAGGGCCTGTGTGATGATGCAGGGCAGGTTCCACATGTATGAAGGCTACTCGATCTGGAAGGTGACATTCCCGGTGAGGGTTTTCTTCCTTATGGGCGTGGACACCCTAGTGGTCACCAATGCTGCTGGAGGACTCAACCCTGAGTTTGAGGTCGGAGATATCATGCTCATCCGTGATCACATCAACTTACCTGGCTTCAGTGGTGTGAACCCTCTCATAGGGCTCAATGACGAAAGGTTTGGACTTCGTTTTCCTGCCATGTCCGATGCCTATGACCGGGATATGCGGCAGAAGGCTCACAGGGCCTGGAAAGAGATGGGGGAGCAGAGGGAGCTGAAGGAAGGCACCTATGTGATGGTGGCAGGCCCGTCTTTTGAGACTGTGGCTGAATCTTGGCTGCTTCAGAAGCTGGGGGCAGATGCTGTTGGCATGAGCACAGTACCAGAAGTTATAGTTGCGAGGCACTGTGGCCTTCGAGTCTTTGGCTTCTCCCTCATCACTAACAAGGTCGTCTTGGATTATGAAGCCCAGGAGAAGGCCAATCATGAGGAAGTACTAGAGGCTGGGAGACAAGCAGCAAAAAAACTGGAACGCTTTGTCTCTATTCTTATGACCAGTATTCCACCCCCTGCCAAAGCCAGCTAACCAGCCCTGGAGCGGTCTGGCCTCTCCATAATGGGATCCAAGTAGCTAGCTACTACATACTTCGGCCCCTTGCTGGTGTCACGTGCCTCTGCCCTTCAGTAGGAGGAGAAGAGAGAGGAAGATCCCTATCCTTCACCTCCCCCATTTCTCCCACCAGACCCTTCTGCACTGGCTCTTTTGCTCAGTTATCTCAAAGCAGTTATCATCTCCTTCCCCCTCTCCCCGCCCCCTCCCCCGGCCAAGAGCTGGAACCCAAGCCCTGCTGTGTCTATGCCCTGGGTGTGACTTGGCTGTTGAACTTGGCACGGTAGCTACTGCTGTCCTTTTGCTGTAACGCTTTCACATTCCTGGGGACTCGGTTCTGCCTCCTCCAAAGCACTAGAGCCCACACGGGGGCTGGCCCAGTCCAATACCCCTTGGAGTTTTGTATTACCCTATTTTAAGAATAAAAAGAAAGATGAAATAATATATTTTTTGTGCAGTTTGGGATGAGGGTAGGGGCACAGGCCGAGTTTGGCATGAAAGACTGAGATCCCATGTCTTGTGTGACTATCTGCTTCTGAGACAAGCAGCTAAGAACTGATGAGGTGGTGTGTGAATGCACGGAAGGAGGAAAGATACAGATGTTAGAAGATAAAGAAAGAAGGGCTAACGACTGGCACAAGAGGGCCCCTTTCCTCAGACCAGTCTTGCCTCGGTCCTTTGCCTTCCGATTGTTTCACGCCCTGTCTGTACTCTCATGAGTATCTGAACTGCTTCGCTGGTCTCGGCTGTCCCACAGTTGCTATTTTCTTCCTAAGGCCTGATGATATTTCCTGTTGGTTTCTTTCTTCTCCCCTACTCTAACTTCTGCCGTAATTAACGGCACCCCTACATTCCTTCTCT
GCATTCTGGCAATGCAGTGGCGAATACCTCTTTCTCTACTACAGTCACCCCGCTGCAGATTAGAGTCCTGCCAGGCCCAGGCAGACCTGTGAAGTTGGCTCATGCTTCGCTTCTCTTTGAGCCCCTCCTTCCGTCCTATTGCTTCATTTCTGGGTTCTAATCTTTCTCTTCACTTTTGCTTGATCAGAACCCGTCTGTGACACAGCATCCAGGCATTGCCCTTTGCTGGCTTGCTGCACTGTTCTATGCACTTATCAATTTGCATGCAGCTGGCCCGTGTGTCGCAAAACCACGCTACTCTCCCAGACCCCTTTGCCTTTTGAGAAAAGATCAAGTTGGATGAGCCACTAATAGTAGTGATATGTCAGTTGTCCATTGAAAACTTTTAAAAACCTCTGAAATCATCTTTTGTTTGATAACTGACCTACCTACCTGAGTCCAGCACAAAGAAAAAGCGTTCTGGAGTGGCCCTGTCCCCACTCTCTATCTCGTCAGTTCTTTGTACCTCCAGCAGCTCTAAAACCCTCCCTGGATCTTTAGGCGCTCTGCTAGCATTTGCCATGTGTCCATGAGAGCTGGTTTAGAGGGAAGTACTGTGTGTCCTTCAGATTATATGGACTCCAACTTGTTCGTTTAA\n>XR_007407767.1 PREDICTED: Canis lupus dingo uncharacterized LOC112644623 (LOC112644623), transcript variant X13, ncRNA \nATTATGACACACTGTTACCATGGAGACCAGAAGCTACTCAGCTCCTGCGTGGGTTGATTTTCCCCCTTTCTAACCAGCTGTTATTCCATCAGAGTAAAAGATTTTTACCAGGGTTTTTATGTTCATTGACCAATTTGGTCCTGTAAGACAAGCAGTCTTGGCCTTACTATTCCAGCAGCAAAAAGAGCACTGAGGCACAGAGGGATTTGTTCAAGGTCATACAAATAATGTTCTAAAAATGATATACTGAGAAGCACTTCCAGAAAGATGCAGTAAGGATCTCAAAAAATGCATTCCTCCAGAAAAACAAGAACACTGGCAAAAATTATAGAAATCAACTTTTTCAGAACTCTGAAAATCAACTAACAGCTTGTCACAATTTAAAGAGCATTTATTCAATAGAAACTTGTTGCAAGATAGCTGGAGGTTGCTCACTATCTGGGCTCCATGAAGGAAAGATGTGGGGAGAAGAGACCTTGATCCTAACACTTGGAACTGCCAGCAATCACTCACTTATACATCTCTTGCTGTTTGTGAAAGGTCACGATCTCGGGGTCATGAAATTAAGGATTAGTAACCTTAATTCCATTTGCAACTTTAATTCACATTTGCCATGTTACATAATATATTCACAGATTCTGGGACTTAGAACTTGGACATCTTAGAGTGGCGGACACAGAGTGGCCAGAGCTAGAGTAGCCATCTTGGACAATCAGGTGAATTTGACAATGGAAATCATGCCAAGTGAGCCACAAAAAAGAAGAATCTTATTGTATTTTCCTTGAGAGAGAAATAAACTTCTATTTATTTTTAAAGATGAAGAAAATGCCTTTCTGGGATACATTTCGGCAATCTTCTGAAGAAATAAAAACTAGATGACATAATGATCAAAACAAGGAAACAAACATGGCCCAGATGCTGTGATAAATGTGTGGGATTCATCCTATATTCTTGTAGGAACATTTGTCATGGCCAACTCTAATTTAAGACCAAGAAATGCTTTCAGCTGCTTTTATCCAGTTGCTAAATCAAATAACAGTATCAGAAAGAAATTCGAGGAATTTTGAGATGACTGCAGAGCTGTTATGTAATAAAAATCCCAGTAACGA\n>XM_029005051.1 Plasmodium malariae 40S ribosomal protein S18, putative (PmUG01_09035500), partial mRNA 
\nATGTCTTTACAAATAATCGATAACAACGATTTTCAGCATATTTTAAGAATTTTGAATACGAATGTTGATGGTAAAGAAAAAGTAACCATTGCCTTAACTGCTATTAAAGGTATTGGAAAGAGAATGGCTAGCGTAATATGCAGGCAGGCAAATGTTAACCCAACAAAAAGAGCAGGGGAATTAACAGCAGAAGAAATTAACAACATTGTTCACATTATGAATGCCCCCTCTCAATTCAAAATTCCAGACTGGTTTTTGAATAGAAGGAAAGATGTAAAAGACGGAAAGAATTTACATGTTATAGCAAATCAGCTAGATTCCTATTTACGTGAAGATTTAGAAAGAATGAAAAAAATTAGATTACACAGAGGTTTACGTCACCACTGGGGATTAAGAGTGCGCGGTCAGCACACCAAAACAACGGGAAGAAGGGGAAGAACTGTTGGTGTATCCAAAAAGAAAGGAGCGTAA\n>XM_007952246.2 PREDICTED: Orycteropus afer afer chromodomain helicase DNA binding protein 3 (CHD3), mRNA \nATGGAGTGGGGGGACATCAAGGAAGAACCAAACCCAGGCCTTCTGACAGAGACATCTGAGGAGAAAGCCAGGGACCTAACCCTGCTGAAAGCAGGTCAGAGTGTGCTGAAGGAGCCACACACTATGATCTTGCAGGCAAGAAGTGAAAATGACCAGCTCAGGCTTTCTTTTCCTCTAAGGCTATGTTGCGATGACAGGAGGCTTGATAAGGATGACATTCGGCTGCTGCCTTCAGCTTTGGGTGTGAAGAAGAGAAAACGAGGACCCAAGAAACAGAAGGAGAATAAGCCAGGAAAACCCAGAAAACGCAAGAAGCTTGATAGTGAGGAAGAATTTGGCTCTGAGCGGGATGAGTATCGGGAGAAGTCAGAGAGTGGTGGCAGTGAGTATGGAACTGGACCAGGTCGGAAACGGAGACGGAAGCACCGAGAAAAAAAGGAGAAGAAGACAAAGCGGCGGAAAAAAGGGGAGGGAGATGGGGGACAAAAGCAGGTAGAACAGAAGTCATCAGCAACTCTACTTCTGACCTGGGGCCTTGAGGACGTGGAGCATGTATTCTCTGAGGAGGATTACCACACACTCACCAACTACAAAGCCTTTAGCCAGTTCATGAGGCCCCTAATTGCTAAGAAAAATCCTAAGATCCCAATGTCTAAGATGATGACCATCCTTGGGGCCAAGTGGAGAGAGTTCAGCGCCAACAACCCCTTCAAGGGGTCAGCAGCTGCTGTGGCAGCGGCCGCAGCAGCGGCAGCAGCAGCTGTAGCTGAGCAGGTGTCAGCTGCCGTCTCATCAGCCACCCCCATGGCACCTTCCGGACCCCCCACCCTTCCACCACCCCCTACTGCTGATATCCAGCCCCCACCTATCCGAAGAGCCAAAACCAAAGAGGGCAAAGGTCCAGGCCATAAGAGGCGGAGTAAGAGCCCCCGCGTGCCTGATGGACGTAAGAAGCTCCGGGGAAAGAAGATGGCACCTCTCAAAATTAAACTAGGGCTGCTGGGTGGCAAGAGGAAGAAGGGAGGCTCGTATGTCTTACAGAGTGATGAGGGCCCCGAGCCAGAGGCTGAGGAATCAGACCTGGACAGTGGCAGTGTCCATAGTGCCTCAGGTCGACCTGATGGGCCTGTCCGCACCAAGAAACTAAAGAGAGGGCGGCCAGGAAGGAAGAAGAAGAAGGTCCTGGGCTGCCCCGCAGTGGCCGGGGAGGAGGAGGTTGATGGCTACGAGACGGATCATCAGGATTACTGTGAGGTGTGCCAGCAGGGTGGGGAAATTATTCTGTGCGACACCTGCCCTCGTGCCTACCACCTCGTCTGCCTTGATCCTGAGCTTGACCGGGCTCCTGAGGGCAAATGGAGCTGCCCTCACTGTGAGAAGGAGGGGGTACAGTGGGAGGCCAAGGAGGAGGAAGAAG
AATATGAAGAGGAAGGAGAGGAAGAAGGGGAAAAGGAGGAGGAAGATGATCACATGGAGTACTGCCGTGTTTGCAAAGATGGGGGGGAGCTCCTCTGCTGTGACGCTTGCATCTCTTCTTATCATATACATTGTCTAAACCCTCCCCTGCCTGACATCCCCAATGGGGAATGGCTGTGTCCCCGTTGCACATGCCCTGTGCTGAAGGGCCGTGTGCAGAAGATCCTGCATTGGCGGTGGGGGGAGCCACCTGTGACAGTGCTAGCCCCCCAGCAGGCAGATGGAAATCCAGATGTCCCAGCCCCTCGCCCTCTTCAGGGCAGATCGGAGCGAGAATTCTTTGTCAAGTGGGTAGGCCTGTCCTACTGGCACTGCTCCTGGGCCAAGGAGCTTCAGCTGGAAATCTTCCACTTGGTAATGTATCGAAACTACCAACGGAAGAATGACATGGATGAGCCCCCACCCCTGGATTATGGCTCTGGTGAGGATGATGGGAAGAGTGACAAGCGCAAGGTGAAAGATCCCCACTATGCTGAGATGGAGGAGAAGTACTATCGCTTTGGTATCAAGCCAGAGTGGATGACAGTCCACCGCATCATCAACCACAGTGTGGACAAAAAGGGGAATTACCACTATTTAGTGAAATGGAGGGACTTACCATATGACCAGTCCACATGGGAGGAAGATGAAATGAACATCCCTGAATATGAAGACCATAAGCAGAGCTACTGGAGACATCGAGAACTAATTATGGGGGAGGATCCCGCCCAGCCCCGCAAGTATAAGAAGAAGAAGAAGGAACTACAGACCGATGGGCCTCCCAGTTCTCCTACTAATGATCCTACAGTGAAATATGAGACTCAGCCACGGTTTATCACAGCCACTGGTGGTACACTGCATATGTATCAGCTGGAAGGATTGAACTGGCTACGCTTCTCATGGGCCCAGGGCACGGACACCATTCTGGCTGATGAGATGGGGCTGGGCAAGACCATACAAACCATCGTCTTCCTCTACTCACTCTATAAGGAGGGCCACACGAAAGGTCCCTTCCTGGTGAGTGCCCCACTCTCCACCATCATTAACTGGGAGCGGGAGTTCCAAATGTGGGCACCCAAATTCTATGTGGTGACATACACGGGTGACAAGGACAGCCGGGCCATCATTCGTGAGAATGAGTTTTCCTTTGAGGATAATGCCATTAAAGGTGGCAAGAAAGCTTTTAAGATGAAGAGGGAGGCACAGGTGAAGTTCCATGTTCTCCTGACTTCATATGAGCTGATCACCATTGATCAGGCAGCGCTGGGCTCCATCCGCTGGGCCTGCCTTGTGGTGGATGAGGCCCATCGGCTCAAGAACAACCAATCCAAGTTTTTCAGGGTCCTCAATGGCTATAAGATAGATCATAAGTTACTGCTCACAGGAACCCCATTGCAGAATAATCTGGAGGAGCTCTTCCATCTGCTGAACTTCCTCACCCCTGAAAGGTTTAACAACCTGGAGGGCTTCTTGGAGGAGTTTGCTGACATATCCAAAGAAGACCAAATTAAGAAGCTGCATGATTTGCTGGGGCCACACATGCTGCGGAGGCTTAAGGCTGATGTCTTTAAGAACATGCCAGCCAAGACGGAGCTCATTGTTCGAGTCGAGCTGAGTCCCATGCAGAAGAAATACTACAAGTACATCCTGACTCGAAATTTTGAGGCCTTGAATTCACGAGGTGGTGGGAACCAAGTGTCGCTGCTTAACATCATGATGGATCTCAAGAAGTGCTGCAACCATCCATACCTCTTTCCTGTGGCTGCTATGGAGTCTCCAAAACTCCCTAGTGGGGCTTATGAGGGTGGAGCACTTATTAAGGCATCTGGGAAGCTTATGCTACTGCAGAAGATGTTGCGGAAACTGAAGGAGCAAGGACACAGAGTGCTTATCTTCTCACAGATGACCAAAATGTTAGACTTGCTAGAGGACTTCTTAGACTATGAAGGCTACAAGTATGAG
CGCATTGATGGTGGCATCACTGGTGCATTGAGACAGGAGGCCATTGATCGGTTCAATGCTCCTGGAGCCCAACAATTCTGCTTCCTCCTGTCCACCCGCGCTGGGGGCCTGGGCATCAATCTGGCCACTGCTGACACTGTCATCATCTTTGATTCTGACTGGAATCCTCATAATGACATCCAGGCCTTCAGCCGGGCCCATCGGATTGGCCAAGCCAACAAAGTGATGATTTACCGGTTTGTGACTCGTGCATCAGTGGAAGAGCGAATCACACAAGTGGCCAAGAGGAAGATGATGCTGACACATCTGGTGGTGCGGCCTGGACTAGGCTCCAAGGCAGGCTCCATGTCCAAGCAGGAGCTGGATGACATCCTTAAATTTGGCACTGAGGAACTGTTCAAGGATGAAAATGAGGGAGAGAACAAGGAGGAGGACAGCAGTGTGATCCACTATGACAATGAGGCAATTGCTCGGCTCTTGGACCGGAACCAAGATGCAACTGAGGACACTGATGTGCAGAACATGAATGAGTATCTCAGCTCCTTTAAGGTGGCACAGTATGTTGTGCGGGAAGAAGACAAGATTGAGGAAATCGAGCGGGAGATCATCAAGCAGGAGGAGAATGTGGATCCTGACTACTGGGAGAAGTTGCTGAGGCATCACTATGAACAGCAGCAAGAGGACCTGGCCAGGAACCTCGGCAAGGGCAAGCGTGTTCGGAAGCAAGTTAATTACAATGATGCTGCTCAGGAGGATCAAGATAACCAGTCAGAATACTCAGTAGGATCAGAGGAAGAAGATGAAGACTTTGATGAACGTCCTGAAGGGCGTCGTCAGTCAAAGAGGCAACTCCGGAATGAAAAGGATAAGCCACTGCCTCCACTGCTGGCTCGAGTTGGGGGCAATATTGAGGTGTTGGGGTTCAATACTCGTCAGCGGAAGGCTTTCCTGAATGCTGTGATGCGCTGGGGGATGCCACCTCAGGATGCCTTCACCACTCAGTGGCTGGTGCGGGACCTGAGGGGCAAGACTGAAAAAGAGTTTAAGGCCTATGTGTCTTTGTTCATGCGCCATCTCTGTGAACCTGGGGCTGATGGCTCTGAAACTTTTGCCGATGGGGTCCCTCGAGAGGGACTGAGTCGCCAGCAAGTGTTGACCCGCATTGGAGTCATGTCTCTTGTGAAGAAAAAGGTACAGGAATTTGAGCACATCAATGGGCGCTGGTCAATGCCTGAGCTGATGCCTGATCCCAGTGCCGACTCGAAACGCTCATCTAGAGCCTCCTCTCCTACCAAAACATCTCCCACCACTCCTGAGGCTTCCACTACAAACAGTCCTTGCACCTCTAAACCTGCTACTCCAGCTCCAAGTGAGAAAGGAGATGGAATAAGGACACCTCTTGAGAAGGATGAAGCTGAAAACCAGGAGGAGAAGCCAGAAAAGGATAGCAAAATTGGAGAAAAGATGGAGACAGAGCCCGACGCCCCCAGCCCAGTCCCTTCACTTGGGGAGCGGCTGGAGCCAAGGAAAATTGCTCTAGAGGATGAGGTGCCAGGGGTACCTGGAGAGATGGAGACTGAACCTGGGTACCGGGGGGACAGAGAGAAGTCAGCCACAGAGTCGACGCCAGGAGAGAGGGGGGAGGAGAAGCCATTGGATGGACAGGAGCACAGGGAGAGGCCGGAGGGGGAAACGGGGGATTTGGGCAAGAGAGAAGATATAAAGGGGGACCGGGAGCTTCGACCAGGGCCACCTCGAGATGAGCCACGATCCAATGGGCGACGTGAGGAGAAAGCAGAGAAGCCACGGTTCATGTTTAATATTGCAGATGGTGGTTTCACAGAGCTTCACACACTGTGGCAGAATGAGGAACGAGCAGCTATCTCCTCTGGGAAACTCAATGAGATCTGGCATAGAAGACATGACTATTGGCTTCTGGCTGGGATTGTCCTCCATGGTTATGCACGGTGGCAGGACATCCAGAATGATGCTCAGTTTGC
CATTATCAATGAGCCATTTAAAACTGAAGCCAATAAAGGAAACTTTCTGGAGATGAAAAATAAATTTCTAGCCCGAAGGTTCAAGCTCCTGGAGCAGGCGCTGGTGATCGAGGAGCAGCTGCGGCGGGCGGCCTACCTGAACCTGTCACAGGAGCCGGCGCACCCCGCCATGGCCCTCCACGCCCGCTTCGCCGAGGCCGAGTGCCTGGCCGAGAGCCACCAGCACCTCTCCAAGGAGTCGCTGGCGGGGAACAAGCCGGCCAACGCCGTCCTGCACAAGGTTCTGAACCAGCTGGAGGAGTTGCTGAGCGACATGAAGGCAGACGTGACCCGCCTGCCAGCCACGCTGTCCCGAATACCTCCCATCGCAGCCCGCCTTCAGATGTCCGAGCGCAGCATCCTCAGCCGGCTGGCCAGCAAGGGCACAGAGCCTCACCCCACACCGGCCTTCCCTCCGGGTCCGTATGCCACACCTCCGGGGTACGGGGCAGCCTTCAGCGCCGCACCCGTAGGGGCCCTGGCCGTCGCAGGCGCCAATTACAGTCAGATGCCAGCAGGGTCCTTCATCACAGCCACCACCAACGGCCCTCCAGTGCTGGTGAAGAAGGAGAAGGAAATGGTGGGGGCAGTGGTGTCAGACGGGCTGGATCGGAAGGAGCCCCGAGCCGGGGAGGTGATCTGTATAGACGACTGA\n>XM_031808598.1 PREDICTED: Oncorhynchus kisutch rap1 GTPase-activating protein 1-like (LOC109896808), transcript variant X3, mRNA \nATGAGGATCTTTACAGTCAGGCACATGCTCACACAGATATAGTACATACAGACCTATACAAACCCATGCATTCTAATGGGCATGCAGACCTGTTAAGAGACCTGAGACGCAGCAGTTCTTGTCTTGTATTTAGGGGCAGTAGAATACAGAGTGTAAAGTGACAGTAGTAGTTAGACCTCTGACACTCCTCTGGTCAATATACACACAGAAACAAATATACCCATACTCTGTTTTTGGAGTCGGAGTTTTGGAGTTATGAGTGACTTCAGGATGACTAAGAGTGGCCATGTGTTCCTCAGTCCTTCGGTTATTACATGGGGCCAGAGGAGACGACACAGTGATACATCAGACCTATTTGCAAAGATCGAGAGGATGCAGGGCAGCAGAATGGACGAGCAGAGATGCACCTTCCCTCCACCCCTCAAAACAGAGGAGGACTATATCCCTTACCCCAGCGTTCACGAGGTCCTGGGTCGTAGGAGCCCCTTCCCCCTAATCCTGCTGCCTCAGTTCGGAGGCTACTGGATCGAGGGGACCAATCACAAACCCAGTGCCACACCTGAGCCTGAGCAGAGGCCCTGTGCGTCCTCCCACATCAAGCTGGAGACCAACAGCATGGCCAAGATCTACAGGAAACAGTTCATGGGCAAGGAACACTTTAATTACTACTCCATGGACATCGGCCTGGGCCACCTGGTCTTCTCCATGAAGTATGATGTCATCGGGGACCAGGAGCATCTCTGCTTGCTGCTAAGGACCAAATTAAAAACTCACCATGATGTGATTCCTATCTCCTGCCTGACTGAGTTCCCCAACGTGGTCCAGATGGCCAAGCTGGTGTTTGAAGAGGTAAATGTGGACAGATTTTACCCAGTCCTCTACCCAAAGGCTTCAAGGCTCATTGTCACCTTTGATGAGCATGTCATCAGCAACAATTTCAAGTTTGGAGTCATTTATCAGAAGTTTGGCCAGACCACCGAGGAGGAGCTATTTGGGAACAGCGACGAGAGTCCTGCTTTTGTAGAGTTCTTGGAGTTTCTGGGGGACAAGATTGAGCTCCATGACTTTAAAGGGTTCAGAGGAGGACTGGACGTCACCCACGGCCAGACAGGAACAGAGTCTGTCTACACGAACTTTCACAACAAGGAGATCATGTTCCACGTGTCCACCAA
GCTGCCATATACAGAGGGAGACTCTCAGCAGTTGCAGAGGAAGAGGCACATAGGCAACGACATCGTGGCCATCTTGTTTCAGGAGGAAAACACACCCTTTGTGCCAGACATGATAGCCTCCAACTTCCTGCATGCCTATGTGGTGGTGCAAGTGGAGAATGCCTGCTCAGACAATGTCACATACAAGGTGTCTGTGACAGCGAGAGATGATGTGCCTTTCTTTGGACCCGCTCTACCGGACCCGGCCATCTTTAAAAAGGGGCATGAGTTCCATGAGTTCCTGTTCACTAAGCTGATCAATGCGGAATATGCCTGTTACAAGGCTGAGAAGTTTGCAAAACTGGAGGAGCGCACGCGGTCGGCCCTGTTGGAGACCCTGTATGAGGAGCTACACATTAACAGCCAGTCCATGATGGGCCTGGGAGGGGACGAGGACAAACTGGAGAATGGGGCTGGGGGGGGAGGGGGCTTCTTTGAGTCCTTTAAGCGGGTGATCCGCAGCAGAAGCCAGTCTATGGATGCCATGGGCCTCAGTAACAAGAAGCCACACACTGTCTCCACTAGTCTCAGTAGCAGCTTTACCGAGACCCCCAAAACCCCAGGGATATCTCTGATCATTCCTGGGAAGAGCCCCACCAGGAAGAAGTCTGGGCCCTTCAGTGCCAGACGGAGCAGCGCCATCGGGATCGAGAACATCCAGGAGGTGCAGGAGAGGAGTCGGGAAGTGTCCCCCAGCACACAGAGGACTCCAGACAGTGGACACATCTCCCAGGACCCCAAATCAGAGAACTCATCTAATCAGAGCTCACCAGAGATGCCCACAACAAAGAACAGTTTGGCCATGTGTTGCAGGGCCCCTTCTATCCCTGAGGCCCAGGATCTGTCCCGCTCCTCGTCCAATGCCAGCAGCTTCGCCAGCGTGGTGGAGGAACACGATAACGAGGGCATCGAAGAGTACGACACGGGACTGGAGAGCCTGTCCTTTTCTGGAACACCACACAAGAGAGACTCATTTGCGTACGTGTCCTGGGTAGAGGATAGTTTGAGCAGTACTAGTGCCACCAGCCAGGGCAGCTCTCCAGCACCTGCACGGTCCCGGCAGCCTGAGGGGGGCAAAGGGGAAGAGCTCAAAAAGGCGGAGAGCCGAGACAAGACAGAGCGGTCACAGGATAAGTCATCATCGAACTGTTAGCCTCACCTCATTGATCAGTACATGGATGTCCATTAGCAGCATTCCCATAAGAGGCACCCCCTGCAGGAGATGAAGCAAGCGCACGTGTGTTCCACCACAGATGCAGAGGAGGAGCAGAGCTAGTCGCTGGGACAGACAGCTAGACCTGGTGTAAACTAGTCCAGTCTGAACAGCCAGGTCCATGGACATGCACTTACAGCCTTCCCTCATCCCAACTCTTTGTGGCTGACTCCCAGCATGCTTAGAGGGGTGAAGGAGAGGATCAGCCCACACCCATTCCCAAAATGAGTGCCACTCACACAGTATCGCTTCTGGCTGTTGTCTGTTGGCTCGCTTAGCCTGCATATATTTCTGCTCCATGAGCTCTGTGAAGCCTAAATCTGTTCATGTGGTAACTCATAGTATACTCTCCCTTGTCCTCTCTATGGCATTGTTTTTGTTTTGGTTCGAAGGTGGAGGGAGGGGAGGATCTTAAGCATTAGACAGATTGGTGTTGCAGGAGATCCGTTGATCATGCATTAGGGGAAGTTTTCTGTTAGGCTAAAGAGGAATGCATGAGGAGGATAAGAGGGTGTTGTCCTGTTGTCATTGTTGGAAGAACTGACATTATTGCTCCCATCAACCTCACGTCCCACCATGATACTGTACATTTGTTATTCTTGGTGTCCCGGATCCTTTGATGTCACACCAAGCCTTGTGTTTTATTAATGGTCAATTAAGAGTGTAATGGTGGATGTTGACTAGAAACTTTTAGTAAAATGTTACATGTTTTTGGTAGAAGGTACTTTTATCATCATGCTGCTGCTGG
TTTTGATTCCATTATTCATTTCCCCTGACAAACTGTACAATTACAGTTCACAGTTTATGAATGGACAATACTTTACTGACTCCATAATTATAGTCAACGTATTTCAGGCCATTTAAAGGGGTAATTTGCAGTTCAAACAACAACAAAGTCTTTACCCCGCCACTTTTTCGATAACCAGCTGAGTGATGGGGTTGGCGAAAAGTAACCACTCTCAAATTCCTAGACAGAGCTATGGATGCAAGGACTGACCATCCAGGATAGCAAAATTATACTTTTAACCATGTTGAGGCTATATAGTGTTTGTTTACAGTTACCTTGTTTACTAACTAATGAGTAAAACACATTTTGGGTTTTGATGGGGTACGACAGTTGAACTAAGCGCATGAAGCATTTATAAGTAATATTCTTCAAGAATCAATGGGTATATATAATTAATTTAAATGTAAAAAAAAGCTATGTAGCAATCGTAGATTGCCCCTATAAACTGAGGAAAAAAACATGAAGTATTGAATTACCGATAAGGTCTAGTGTTCAAACTAAATTACTCATCAGTCTTCACTGTCCCATACTGTAGATAGTACCACACAGTCAGACATTCCTCCAAGGTGACCTAACCAAAGCACACAGCCTCCAAAGCCAAGCTATTGTCCAGTGACTACTGTCTTCAGTTTATTTTTTAAAACCTCTAGTTTGTTTTAAAGTATGTGTTTGGATGTGTATGCATGGTGAATGGTGTAAATCTGCTTGCAAAACCATGTCAACTGTACAGTACCATACTGGAAAAAGATTGTTTCTTCAAACCAGTCCAACTTCTCTAGAAAAGCAGACAGTCATTATTTCTATAAATCAGTTTCGATAGAGAAATATGGCGATACAAGTGTAGATGTGGAAACTGGCACTACATTTTCAATTAATTGTTTTTTTTATTTTTATTTTTTTTAATCTGACTTGGTTTTTAAAAATAATTACACTGTGACAAGTTTTGAAGTGGCCTTTTTAATGATTGTGTTAATTAAGCTGCTTTGTAGGAGGGTATCCCCCTTCATATAAGGAATCTATCCCATGGTGGATATCGCCACTGGATTGAATGTAAAACTAAACAGATATATGTATTCATTTGTAGACATCTGCTCTCAATGAATGGAACCTTTGTATCTTGTTGTAATGTTTTACATTTTCCCTCATCTCAGATTTATATAATGAAAAGACCTGATATGAAGGCATAGTTTCCATTACTTTTTATTTAAATTAAATGAACAAAAGCTAACATGGAATTTAGTTGCACTTTGTCAGTTGTGGCATTAATGCATAAACCTTTTACACTCCTTTGGAAATCTTTCAGTTGAATCTAAAGGATCTCTGTAAGTAAGGAACACTACATCAAAATACAGTAAGTTTGACAAGTATTTATTATTAAACACCATTCTAAAGATTATGATTCAACAAAAAACTATTAATTGAAATTGTGATTGGAAAGATGAGAAAGTAACCTTTCATCAGCTTAAGAGAGCCTTTGGAGTCCGTGTGTATTCCAGGCACTGAAACTCTAAATATATCAAACACAATTTTCATCTCAAAGCTTAAAATAAATGTATTAAAACTCACGAGTCTTCAGAAATGCTTGAATAGTTGGATCACACCCTCTGGTGGCTCTAGATTATACTTACACATTTCTCTGTGGTCCTGTTCATCTGTACCTGTGTTTGTACATGTAAATGCAAGACACTTGGATTGAGCACCCAGCCAATCCAAACAACAGATTCTGCCTACAATGTGCTTAATTCAGATGATTGTATTTCTGTTCTCGTTGATATTCCGCTCAAGCCCTTGTTTAAGTTGGAAAGTCTTGTATATAAATATAGCTTTTCATCCTTTTGTAAAAAAAAAAAAAGGCAAATACATGTTTAATAAAGACAAAGGGGTAA\n>DQ727116.1 Mus musculus piRNA piR-142438, complete sequence 
\nTGGCAACAGTATTGCTCTGGCTCCA\n>XR_005158834.1 PREDICTED: Triticum dicoccoides uncharacterized LOC119328068 (LOC119328068), transcript variant X2, ncRNA \nCTGCGTTCAGCGCTGCCATCCTGTCTAGTGCGCTCCCCTGACCGGCGCCATGAGAGCGGCTGCGCCGGTGGCTCTCGTGGACAGCGCGTGCATCAGTAACGTCGCAAAGTTCTTCCTCGCGAACAGCATCGCAGCACCGGTCGGAGCGGCGGCCATCCGTCGTCCCCCTCTGCGTTGTGCTACGCCGTCTCCGCTGAAGCTGCAATCTCCTCGGACGACCGCGTTATTGAGCGGATTTTCCTCATCCAGCAGCGCTGGCGACTCGTATCCATCTACCAAAGAAATGAGCAGCATCTTATCCATTCACTATGCTTCTTTTTTTCCTTTTACCCAGCGTTTGTACGAACAGGGAAACCCTCAAACGACAAAGACCAGCAGGATAGGAAGGGTGACAATGAGATGGCAGGCGCTGGAAATGTTTCTGATGTGGATCTTGCTAGGAAAATGTTAGATACTGCAAGAGGTAATAATGGAAAAGAGCAAAGGCAACACTGCGGAGATATCAAGAATCCTTTCCGCGGAAAAGAGAAAGAGTGGAATTAATTTGACAAGTCACTCAGTGAAATGTTTAACCATCTTGGAGCATTTACCTAGCTGTGCTTGACACCAGGGGCAAAGGCTGCCCCTTTTTCTTGTTCAAGGGTGGCGCGGCGAACACAGATGCAACATCGGCGAGAGTCGTTGGGGACACTGATATTTACCCAGGTTTGGGCCGCATGGTAACGGCTTGGATGTTCGCGACTTGTTCATGGGAGCCCACGACTTGGGCGTTCCTGGGAAGAATGCGGATGTCTTGATATCTCCTTATACCTTATTGTTGGTGCGGAAGCCGAGGGTCACGAAGGTAGCACCTCTCGATGACCTGCCTGGATGTCTGTGCTTCACTTGTATCTCCAGGGAGGAGCCTTGGATGATTCTTGGATATGCTGATGCCTAGGTGATCTCCCGGCAAGGAGCCACTGTGTGCCGCACGCATGAGGGTTTGTGGGTACCCGATACCCGCGACACCGACAACCTAACTGCATTCTGTTTTGGGTATGAAACTGTCAATCGTCTGTCATATAGCAGTAGTATTTGCATCCTTCTGAGGTGGGTCTCTGTGGTTTTAGGAGTACTAAATTTTTAGTTAGATACGTGCTGGTATCTTGTAGATTTGGCTGGTCTTCCTGTTGCTTAATTATCCCCCTTAATTCAGTCCCGGGACTCCCTGCACCGGCTTGGTCTTGGAGCTGCCTCCATTATGTAAATTGTGTATACAGAACCATGAAAGTGCCAAGGAGACTCGGAAATTCCACTTGAGAAGATGAGATAA\n>XM_024744316.1 PREDICTED: Neophocaena asiaeorientalis asiaeorientalis ataxin 2 like (ATXN2L), transcript variant X4, mRNA 
\nATGTTGAAGCCTCAGCCGCCACAACAGACCTCCCAGCCCCAGCAGCCGCCCCCCACGCAACAGGCCGTGGCCCGCCGGCCTCCCGGGGGCACCAGCCCTCCCAACGGCGGCCTCCCGGGGCCCCTGGCCTCCACCTCGGCTCCCCCAGGGCCTCCCGCCGCTGCCTCCCCCTGCTTGGGGCCTGCAGCCGCTGCCGGGAGCGGGCTCCGCCGGGGAGCTGAGAGCATCTTGGCGCCGCCGCCGCAGCAGCAACATCAGGAGAGGCCAGGGGCAGCGGCCATCGGCAGCGCCAGGGGACAAAGCACAGGAAAGGGACCCCCACAGTCACCGGTGTTTGAGGGTGTCTACAACAATTCCAGAATGCTGCATTTCCTTACAGCTGTTGTGGGCTCCACTTGTGATGTAAAGGTAAAGAATGGTACCACCTATGAAGGTATCTTCAAGACACTGAGCTCAAAGTTTGAACTGGCAGTAGACGCTGTGCACCGGAAAGCATCGGAGCCAGCAGGTGGTCCTCGTCGGGAAGACATTGTGGACACCATGGTGTTTAAGCCAAGTGATGTCATGCTTGTCCACTTCCGAAATGTTGACTTCAATTATGCTACTAAAGACAAGTTCACTGATTCAGCCATTGCCATGAACTCGAAAGTGAATGGGGAGCACAAGGAGAAGGTGCTTCAGCGCTGGGAGGGGGGCGACAGCAACAGCGATGACTACGACCTGGAGTCTGACATGTCCAATGGATGGGACCCCAATGAAATGTTCAAGTTCAATGAGGAGAACTACGGCATAAAGACCACCTATGACAGCAGTCTCTCTTCTTACACGGTGCCCTTAGAGAAGGACAACTCAGAAGAATTTCGTCAGCGGGAGCTGCGTGCAGCCCAGTTGGCTCGAGAGATTGAATCGAGCCCCCAGTACCGCCTGCGGATCGCCATGGAGAACGATGACGGGCGCACCGAGGAGGAGAAGCACAGTGCAGTTCAGCGACAGGGTTCAGGGCGAGAGAGCCCCAGCTTGGCATCTAGGGAGGGAAAGTATATCCCTCTACCCCAACGAGTTCGGGAAGGTCCCCGGGGAGGAGTTCGATGCAGTAGTTCTCGGGGTGGCCGGCCTGGCCTTAGCTCTTTGCCACCTCGTGGCCCTCACCATCTTGACAATAGCAGCCCTGGCCCAGGTTCTGAGACACGCGGTATCAATGGAGGCCCTTCCCGCATGTCCCCTAAGGCACAGCGGCCTCTGAGAGGTGCCAAGACTCTGTCTTCCCCCAGCAGCAGGCCTTCTGGAGAAGCTTCTGTTCCACCTCCTCCTGCAGTAGGCCGGATGTACCCCCCGCGCTCTCCCAAGTCAGCTGCCCCTGCCCCAATCTCAGCTTCCTGTCCTGAGCCTCCCATCGGCTCAGCAGTACCGACCTCTTCAGCTTCCATCCCCGTGACATCATCAGTTGGGGATCCTGGAGTAGGCTCCATTTCCCCAGCTTCTCCAAAGATCTCACTGGCACCCACAGATGTAAAAGAACTCCCAGCCAAGGAACCTGGGAGAACGCTGGAGTCCCAGGAGCTGTCCCGGATAGCAGGGAAAGTCCCTGGCCTTCAGAATGAGCAGAAACGCTTTCAACTGGAAGAACTGAGAAAATTTGGGGCCCAGTTTAAGCTTCAGCCCAGTAGCTCCCCTGAGACCAGCCTGGATCCTTTTCCTCCCCGGATCCTAAAGGAGGAGGCCAAAGGGAAGGAGAAGGAGGTTGATGGTCTTTTGGCTTCAGAGCCCATGGGGTCCCCTGTTTCCTCCAAGACAGAATCCATATCGGATAAGGAGGACAAACCACCCCTGCCACCAGCAGGAGGCGCCGAAGGGCCGGATCAGCCCCCACCACCTTGCCCAAGCCAAACCAGTAGCCCCCCAGTGGGCCTCATCAAGGGAGATGACAAGGATGAGGGCCCTGTTGCTGAACAAGTGAAGAAGTCAACATTGAACCCTAATGCCAAGGAGTTCAATCCC
ACTAAGCCGCTGCTGTCTGTGAATAAATCCACCAGTACTCCAACTTCTCCTGGGCCCCGGACTCATTCAACTCCCTCCATCCCGGTGCTGACAGCAGGCCAGAGTGGGCTATATAGCCCCCAGTACATTTCCTACATACCTCAGATCCACATGGGACCAGCTGTTCAGGCACCTCAGATGTATCCATATCCTGTGTCCAACTCAGTGCCTGGACAGCAGGGCAAGTACCGGGGAGCAAAAGGCTCCCTGCCCCCCCAGCGCTCGGACCAACACCAGCCAGCCTCAGCCCCTCCGATGATGCAGGCCGCCGCCGCCGCTGGCCCCCCTCTGGTGGCTGCCACACCTTATTCTTCCTACATCCCCTACAATCCACAGCAGTTCCCAGGCCAGCCCGCCATGATGCAGCCCATGGCCCACTACCCCTCGCAGCCGGTGTTTGCCCCCATGCTTCAAAGCAACCCACGCATGCTGACGTCGGGGAGCCATCCCCAGGCCATTGTGTCATCCTCCACCCCTCAGTACCCTTCTGCAGAGCAGCCCACCCCCCAAGCCCTTTATGCCACTGTTCACCAGTCCTATCCACACCATGCCACGCAGCTCCATGCCCACCAGCCGCAGCCGGCCACCACGCCTACTGGGAGCCAGCCGCAGTCCCAGCATGCAGCCCCCAGTCCCGTCCAGCACCAGGCGGGGCAGGCCCCACACCTGGGCAGTGGACAGCCACAGCAGAACCTGTACCACCCAGGGGCCCTGACAGGCACGCCGCCTTCTCTGCCGCCGGGACCTTCTGCGCAGTCCCCTCAGAGCAGCTTCCCCCAGCCAGCCGCTGTGTATGCTATCCATGCCCACCAGCAGCTGCCCCACGGCTTCACCAACATGGCCCATGTTACCCAGGCCCATGTCCAAACTGGAATCACAGCAGCCCCGCCCCCTCACCCTGGGGCTCCCCACCCGCCCCAGGTGATGCTGCTGCACCCACCCCAGAGCCATGGGGGCCCCCCCCAAGGCGCGGTGCCCCAGAGTGGGGTGCCTGCACTCTCAGCTTCCACACCCTCACCCTATCCCTACATCGGACACCCCCAAGGTGAGCAGCCTGGCCAGGCGCCTGGATTTCCAGGAGGAGCCGATGACAGGATTCCTCCCCTTCCACCCCCCGGGGAACTGAAGATTGTCCTGGCCGCGACCTGAGACCTCCATGAGTGGAGGGAAGAGTGACCTATGTCTCTTCCCCCAGCAGCTCGGACCAGTCCCAGCCCCCCAATCCCCCTTTCCCCCCGGGGGCGGGGGGAGCTGGGGAATTCCTGCCAAGCACCTTGAATGGGAAGGGGGGCCTCAAAGTGGGCAGGGCCGGGGTCCAGC\n>XM_034818856.1 PREDICTED: Vitis riparia uncharacterized LOC117905960 (LOC117905960), mRNA 
\nGAGGGGAGAGGGAGAAGAGGTTAAATAATGAATGGGTTCTGAGGAATTGCTACCTTCTTCACCACTTTACTGTTTCTTTCAACCACGCTCTCCTGCCTTTCTTGAACCAGTCTTTGGTCCACGCATGCCTCTCTCTGCAGCCGTCTCTCTTCTCCTTATTTAGCTTTCCTTCTTAATTCCTTCTTTCCTTATATTGGATTTTTTTTTTTGTTGACATAGAGAAATCCAAAAGGAAAAACAGAAAAGCATCGGGTCATTTGGGGAGAAGGGATGTTGGGATGGAAGCATATCACGGTGGCTGCGGTGGCGGCCGGAATACTGACTGTGCTTCTGATCGTGTTATTTTGGCGATGGTGTTGTAGTAAAGGACATAAGGATTTTGTTGATGCTTCCAGGAATAAACATCAGAGCTTGCAAGCTGGGATTGCGAAACTCCACCATGTTAGCCTTCCTCCATATCACCATGATCTAGACAGCAAGAGAAAGGCGAATTACTATGTTTTTCGACGTGGGGTTTCATCCAGACCTTTGTTTAATTGGGCGCATCATCCATCGCTCGTCACGGATGCGGTTGAAAATGGGTGGTCTCGATTCGGTTTCACGAGCTACATGTCGTCTCCCTCGATGAGATCATCGCTGTTGGGATTATGCGCAGTGGGGGAACATGGGAAAGAAACGGGGGCGGAGATTAGCTGGGAAGTGTCTCAGGGATCGGCTGATTTCATGCAGAAGATCAGATTGAATTCTGGGTTAAAGAAGATGAATATGAGCAGTCCTTCCATGGCTGCTGCATCTGTAATTAGAACAGCTTTGCCACTGCCAGGCCCTCCCTTGGGGAATTCCTCGTTCCCGCAAGAAGCCTACTTCGAAATCACAATATTGTTTTCCGGTGAAGGTGATCCTGAGTCTGTTGGCCGGGTTAAGGAAGGTGAGAGAACGAAGCTCATCCATGAGAATTCCAATGCTAAAGCCAATTCAGAATCTATAATCCATCTTGAAGAAATGAAACTCGGCTCTAAGGACGACGGCAAAGGTGAAGTCGTAATGCTATCGGTGGGGCTCACCGCCGGAGGCTCTCTTCCTTTGAAACTTCCTGGCAGCTACCCGGGATCAATTGGATTTAACTCCAATGGCTCTGTCTATCTTGACGGAATTAAACTTGTATTCGAATCGGAGAAGGAAGAATGGGAAAGGGCAGACAAGGTTATTGGTTGCGGATTTGATCCTAGCCAGAAGAAGGTGTTCTTCACAATAGATTCAGAACTAGTTCATGTAGTCCATTGCAAGTCAGAGGAATTTGGGAGTCCCCTTTATCCAACCCTCGGGGCAAACACAGACGTGGAAGTTCTGGTTAATTTTGGACAAAGTATGTTCAGCTACGCACCCGCCAATGCACAAAGAACTCCGAACCCTTGCTTTATCGGCCCCCTTGTGAATTCCCCCGCTGCTGCTCTGGGGTATGAAGACAGCAGGGAGCTTTTCTCAATGGGGAGAATAGACTCCCAGTGGCTCAACAGATGCACAACCAAAAGCAGCCACAACAATGGCAGTAAAGCATTAGATTTCGATGAGGATTCTGAAGCTGATTTATTTGAAATAGTCTTGGACAGAAGTGGCCGATCACCACACGCAGTATTGTAGAAACAAACTATAAATATCACTAGGATTTGTTGCATATATGCCGCCCACATGCATTTGCTGAATGCAAAATTTTCATACATTCACAAGCCTCTTTTAGGGTTTCACCTTCGCTTCTCCTATTACATATACCAACAGGTTCTTCAGGAACTGCTGATACATTTTTTTCATCACCCCTGTAACTAGAATTTTCATTTATTTTCCCTCTGTATATATCATGACTAATGTTCCTCCTCCTGGTTGAGTGATACCAATGTTCTTTCAGTTC\n>MF368550.1 Uncultured bacterium clone New.OTU5316_1 16S ribosomal RNA gene, partial 
sequence \nTACAGAGGTGGCGAGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCGAAGTGTGTGAGGTGTGAAATCCATGGGCTCAACCCATGAAGTGCGCCTCAAACTGCTTCGCTCGAGTTCGGGAGGGGAGATCGGAATTCAGGGTGTAGCGGTGAAATGCGTTGATATCCTGTGGAACACCGGTGGCGAAGGCGGATCTCTGGACCGATCCCGACGCTGAGGCGCGAAAGTGGGGGGAGCAAACAGG\n>XM_050853872.1 PREDICTED: Eriocheir sinensis uncharacterized LOC126994540 (LOC126994540), transcript variant X10, mRNA \nACACACACACACACACACACACACACACACACACACACACACACACACACACACAACACAGATGCTATGAAGTTCGTACCAAAATACAGACCGAGGGAGAGGGCTAAAAAGGACTGGTTTAATACAAGATGTACAGAGGCAAAAGAAAAGATACAAAGCTTGGTCAAGATTGAAAAGAAACAGAAATCAATGAAACAAAGAAGAGGAGAAACGATACGAAAAGGATATCGTGGAAAAGTATAAAGAACAACCTAAATTATTTCATAGATTTATAAGTGGAAGAATTAAACCAAGAGAAACAATTGAAAGACTGACTGAAGAGAATGAAGAGATTGACGCTCCCAAAGGCAGGGCGGAAGTACTTAACAAAAAACTCCAGGAAGTGTTTACCAAAGAATCAATATTTAATGAACCACAAGAAAACAACTTAGATGTATATATGGAAGAGCTCAAAATAGATAGAGAGGAGATAATAAAACTATTTGGGGAATTGGGAGAAGGGAAGGCCATGGGACCAAATGGAGTTTCAGGTTTTATGCTTAAAGAATGCAGAAATGAGCTAGTTAGCCTGATATATGACATAATTACGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATAATTAGGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATAATTACGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATCATTACGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATAATTAGGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATCATTACGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATAATTAGGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATAATTACGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATCATTACGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATAATTACGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATAATTACGTGCTCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATAATTACGTGCCCAATTAAAAGAAATGAGCTAGTTAGCCTGATATATGACATCATTACGTGCCCAATTAAAACGGGCACAGTGCCTAGGGAGTGGAAGAGGCCAGGAGTGGAACTTATATACAAAAGTGGAAGAGAGGATGAACCCCTTAATTTACAGACCAGTGTCTCTGACCAGTGCGCAAAATATGTGAGAAATTAATAAAAGAACAATGTGTGAGATTTCTAGAAGAACATAATCTAATCACAAACAATCACTATGGGCTTAGGAGAGGCCGCTCATGTGTGACAAACTTGCCGAGCCTTTACTCAAGAGTGACGGACAAATTACAGGAAAGAGACGGATGGGTGGATTGCATTTACCTAGACTTAATGAAGGCATTTGACGAAGTTCTGTGGAAACTAGAAAATAGAGGAGGATTGAGAGGGAAGATGACGTGCTGGATGGAAAGCTACTTAAGAGGATGAGAGA
TGAGACCCGTGGTTAAGGGCGCTAGATCGGAATGGAGGGCTGTGGACAGTGGAGTGCCCCAGGGGTCGGTTTTGGCCTAGTCCTAGTCTATATTACTGACATGCCGGAGGGAATAAACAGCTACATGAGCCTGTTTGCAGATGAAGCCAAACTGCAAAGACAGACAAGAAACAGTGAAGCCTGCAAGAAGACCTAGACAAGATTTGGAAATGCAGTCAGAAATGGGAGATGAAATTCAACGTGAGGAAATGTCATGTTATGGAAATGGACATGGACTTATAAAATGGGAGATGGGGAGATATTAAAGAAAGTATATGAAGAGAGAGAGAGACCTGGGGGTAACAGTGAAAGATTATATGCAACCAGAAAGTCATATAAATCAGATCTTTGGTGATACGTTTAACATGGTGAGGAATATAGGCATAGCATTCCACTACATGGACAAAGAACACGGGAGCTTAGGGTCAAAGGAGCTGCCTCGTATAGGCCTACCGACCTCTTGCAGACTCCTGCGTTCGTATGTTCTTAAGAAATGATGGAAAACTTAATAACTACTATGATCAGACCTAAGCTAGAATGCGCGGAAACAGTGTTGTCTCCACATACGAAGAAACACAAATATATATGCTATTGAGTAGAATGGAAGTAGATAACGAGAAATTCCCACTAAGAGACGAACCTTCCAGCAGGAATAGTAGAGGACACAGTAAAAGGTTGAGGAAGGGAAGATGCTTGAGAGACATAAAGAAATATAGCTTCCCACAAAGAAATATAGAGGCTTGGAACAGACTAAGTGAGGATGTAGTATCAGCGAACTACTACTACTACTACTACTACTACTACTA\n>XR_005515939.1 PREDICTED: Hibiscus syriacus uncharacterized LOC120120851 (LOC120120851), ncRNA \nGATCTAATAGGTAAGAGAGAGCTTTCTTCAGTCCACCCATGGGTAGCGATGGGATTTAATTAGCTGCCGACTCATTCACCCAAATACTGAGTTAAAATGGACCGGCCTGCAAATAGTTACTCAGTAAATGAGTGAATGATGCGGGAGACAAATTGAATCCTAATCTTCCTGTGCTTGGACTGAAGGGAGCTCCTTCTGCTGTTATTTTATCAACACCTAAACTACTTTCATCCATGTTTTTCACGACGACCACTACCTTTATATATAGTAATAATTTGTGGCTGAGATATCAATGTAGGAATAATGATCGCTTTATTAGCTTGTTTGTTTGTTCTTCATTGACATTTATATAGATTATCTCAACTTCTTAATGGCGGTGCGTTCTCATTGTTTGACTACTACGAAAGGAAAGTTTCGTTTTTCGCTCCAGGAGGAAAATTTTGCAGCTGTTTCTGGAGTCTAGGGCTGAGGGTTTTACTGTGAAGCTGCTGTTGCAGTTTCTTGTTTAAAGCTCCACC\n>XM_049955181.1 PREDICTED: Schistocerca nitens uncharacterized LOC126253663 (LOC126253663), mRNA 
\nGTTTTGTTGAAGTATAATAATGAGTAAAAGTAAAGTTATTAGAAACCCTCTGAAGGCTTTTAAGAAAAGGAGAAATGTTGGAAAGCCAAAGGTATGTGTTATTACTGTAAACAATAAAGACGATGAAAATGCCCAACATAGCTTGTGTCCCAAAGAAGAAGACAGTTGGTGTAAATATAACAAAGGATTGCTAACTGGTGAAGTGTACACTCATAAGCATAGTCTGCCTCATGCAATAATGGAGGTGATAAAACCTATTTTCAGAGACTTAGCAGCACCTGAACTGTTGAAAAAGTGTATTCACGGAAAAACTCAAAACCCCAATGAAAGTGTAAATAGTGTTATATGGTCGAGAATCCCCAAGACTGTATTTGTTGGAATAGAAACACTTCACTTTGGTGTGTATGATGCTGTTGCGACTTTCAATGATGGCAACATTGTAAGGTGCAAGGTATTTAGAAATATGGGAATGAAGATAGGTTCTAACATGGTACGAGCAATGCTTGCTTTAGACAAGGAACGCCTTCGGGCTGCAGACAGGGCTGTAAAGAGTCTAGAAATACAAGCAAGAGTAAACAGGAGGAGGAACAAGAGGAAGCTGGAGGAGGAGTTTGCAGAGGATGAAGATAATCCATCCTATGGACCTGGAATGCACTAAAAAGTTAATCCAATCTTTGTCGCTCGATTCCCAAAACTTTTATTTTCTCATACTAATTACATGTTTTCTAAGGATCTTCCAAACATATT\n>XM_028358397.1 PREDICTED: Glycine soja membrane-anchored ubiquitin-fold protein 2-like (LOC114396422), transcript variant X3, mRNA \nATTATTATTGCTTTGCAAAACACTAACCAACCAAAACAAAGGGAAAAAAAAAGTATCCACTTTCCCTTCTTCTTCTTCCATTTGGGTTTTCTCAAAAGTGAAAAGCAAATTCCGTGACTTCCACAATCACCACTCGGATCAAACTCTTGAGTGATAGACTTTGAATGAAATCTTGTTTTTCATTAACGAGATTCAATTGAAGTGAAGTGATTATTCACTGGAAAACTTATTTTTCATAGTATTGGAGGTACAACTGAAGCTGTTAGATTTGTTTTAACTACACGAGTTCGTTGGATATTTGAGCATGGCTGGGAATCAAGATCAGTTTGAGATCAAGTTTCGGTTGACTGATGGTTCTGATATTGGCCCCAAAAGTTTTCCTGCAGCTACTAGTATTGCAACATTAAAAGAGAGTGTTCTCGCTCAGTGGCCAAAAGACAAGGAGAATGGCCCAAAGACCATAAAAGATGTGAAGTTAATTAACGCAGGAAAAATTTTGGAGAACAACAGAACAGTTGGGGAATGCCAGAGTCCGTTATGTGATACCCCTGATACTGTTACAACAATGCATGTGGTTGTGCAACATCCTGCTACGGAGAAAGAGAAGAAAGCGGCAAACAAAGCAACACAGAACAAATGCATGTGCGTTATTTTATAGCATCCAGATTGAATAGCAGATGTCATCTGTCTTAGTTGATTAGGGACAGTTCATTTTACATAACCTGCGTCGTCAAATATTTCAACATACACAAATTATTTGGTTGCATGCCCCATTCATACTACAGTCAAGGAGTACTGGACTATTTTCTTTATAAAAATGGAGTACTTGACTTGGTGAAGATTGTGAAGCTTGTAGTTCCCTGATTCCTCTGCGGCACTAAATTTCTTGCACAATTTCATAGGAGATGTTCTTCTTCTGGTTTCAACATGTATTAGGTGTTGCCTCATCAGACACTTGGTATAATTGTTGATTGAAATGAACTCTACTAGTTTGCCATCTTACCCCCTCATATATTTTACAATTCTTCTCTTTCGTGTATCTGATTCAACATACTTAATCCAGACATGTATGCGTTGAGTATTTGAATGTGTTTCAATTTTCTGGTTGTTTATAT
GGTACCATTGCTACCCACTCTTGTATAGCAGCTATGGCAATAGTGATTTAACAACATCTCTCACAAAATGGAGATTTGATGCTTGAA\n>XM_017886251.1 PREDICTED: Rhinopithecus bieti MAS related GPR family member E (MRGPRE), mRNA \nAAGGCTGCAGGGAGGGTCGGGGTTTCTCTTGCTGTCCACACCTGGGCAAGAGCTGAGCGGAAGAGAAGGGGTCCTCAGAGAGACGCCTTCCTCACCAGCCCCATTCCAGCCGGACACCATGTGACTCGGAGGAGCTGGTGGACACTGAACAGGAGCGGCCCAGAGGCTCTGGGGACTGGAGCCCGCGGCTGCAGCCAGGACAGATCCAAGGCCCAGGGTCAGAGCAGGCAGGGCTCGGTCGCGCCTCTGCCCCAAACGGGGCATCAGCAGAAAGAGCGAGCAGCAGCAGCACCCTCTGGCCCCCCACCCTACGATGGAGTCCAGAGAAGCTGGAGAGCAGGCAGGGGCTGCCGACGGCGCCCGGGAGGATGTGGCCTTCAACCTCATCATCCTGTCCCTCACTGAGGGGCTCGGCCTCGGTGGGCTGCTGGGGAACGGGGCGGTCCTCTGGCTGCTCAGCTCCAATGTCTACAGAAACCCCTTCGCCATCTACCTCCTGGACGTGGCCTGCGCAGACCTCATCTTCCTTGGCTGCCACATGGTGGCCATCATCCCCGACTTGCTGCAAGGCCGGCTGGACTTCCCGGGCTTCGTGCAGACCAGCCTGGCAACTCTGCGCTTCTTCTGCTACATCGTGGGCCTGAGTCTCCTGGTGGCCGTCAGCGTGGAGCAGTGCCTGGCCGCCCTCTTCCCGGCCTGGTACTCGTGCCGCCGCCCACGCCACCTGACCACCTGCGTGTGTGCCCTCACCTGGGCCTGTTGCCTGCTGCTGCACCTGCTGCTCAGCGGTGCCTGCACCCAGTTCTTCGGGGAGCCCAGCCGCCACCTGTGCCGGACACTGTGGCTGGTAGCAGCGGTGCTGCTGGCTGTGCTGTGTTGCACCATGTGTGGGGCCAGCCTTATGCTGCTGCTGCAAGTGGAGCGAGGCCCCCAGCGGCCCCCACCCCGGGGCTTCCCCACGCTCATCCTCCTGGCCGTCCTCCTCTTCCTCTTCTGCGGCCTGCCCTTCGGCATCTACTGGCTGTCCCGGAACCTGCTCTGGCACATCCCCCACTACTTCTACCACTTCAGCTTCCTCATGGCCGCCGTGTACTGCGCAGCTAAGCCCGTCGTCTATTTCTGCCTGGGCAGTGCCCAGGGCCGCAGGCTGCCCCTCCAGCTGGTCCTCCAGCGAGCACTGGGAGACGAGGCTGAGCTGGGGGCCGTCAGGGAGACCTCCCGCCGGGGCCTGGTGGACATAGCAGCCTGAGACCTGGGGGCCTCGACCCCAGCTGCAGCCCCCATGAGGCAGGAGGGTGACTTGGGGAAGGTGGTGGGGTCAGAGGCTGGGGCCAGCTGGACCTGGAGGAGGCCTTGATGGGTGGCCCAGTCATGTGCTGCCAAATCTGTGACCATCAGTCCGGAGCACGAGGCTCCCCTGGGAGGCAGCTGGAAAGGCGAGGTCTCCACATGCCCAGTCAGGTGGGCTGGGTCTCTGGGGAGAAGGCCCAGGAATGTGCATTTTTGGGAAACCTCCCCAATGGTTCATGCACTGGCACCCAAGCGCTGCTGCTGCTACCCATTCCGTGCTCAGCTGCAGTGAGGAGACCCCGGAAAGGAAGGAAGCAAGGCCAGACGCCAGGTGAGGGGCAGGTCCAGGCCCTCCCGCAGCCCACCTCCCCTCCCACTCCAGCTTCCCCAGTGCTGCAGGGGCACCCACAGAGAACACAGCCATTCCCTCAGCTCGCCATGTCCGCTCTGTGGAAGCTAAATTGACCCTAAAATTGAAGACTGCCCAAAACTTGACCCCCTCCCCCGACGAACTGTGTCCAAAGC
AGCCAGCAGCCTTTTTGTCCTGGGTCCGTTACGTTGTCGTGAGTTTTCAGCAGGAAAATGTGGTGATACCGCAAAGCCACTCATTCTATCGGCATAAGGGTGTGCATTGATCAAAAGCTGTACCCCCAACCCCAGCACAGATGCTGTGAGGAAAAGCAGGGGCTGAGGCTTCTAGAAGGCTGTGGAGCTGTCCTTGGTCATCAGGCCGTTGCTCAAGGCCATGCCACCCAGACCTGGACGATGCAACCCTCACTCGGAGCTTCAGAAAAGCCGGCCCCGTGGGTGACCCTGGATATTACAGGATGCTCCCTGGGCAGGTGGAGAGGCTCCTTACAGCCCTACCCAGCAGCCTGTGGCCCTGTCTCCCCACAGGACCCAGGCCTTCAGCAACCGGAAAGCTTCTTCCCACCGGCCCTATCTAAGGCAGTTCACCCGCCTCTGTCCTGAGCAGTCCCGCTCCAGAGGATCCCTCTAAGGAAGGAACCCAGGCTTCACCCCTCAACAGGTTTCGCGCTTCCCCTGAGTGCCGGGCCTGGCTGCCATCCAGGAGCATGTGCCAGGGGGTGCCAGAGCGGGGGCTTTGGAGCCCACAGCCTGGGCTGAGCCCTGCTAGCCACCCCACTGTGCTGCCAAGGCCATCTCTGAACATCCCTGTGCCTCTGCTTGCTCGTCTGTAAAATATGAGAACCCAGTTCTTTGAGTCTTTGAGGCCTGTCCAGCCTGTTGTGAGCCCGAGAGAAATGTCTGTCGATTCTACTGCCACCAATGCCGCCATCCAAGTCCACAGTACAATTCTTAGCCACAGACTAAGG\n>XM_051693489.1 PREDICTED: Myxocyprinus asiaticus WW domain-containing transcription regulator protein 1-like (LOC127438147), transcript variant X3, mRNA \nAAAGTCCGTCAGTGGACGCAGGAAAGTTGGGGAGCGGAGGAGGAATATTTCTGGAGAAATTCATATGAGGAACATTATGACATCAACTTTTTAAGCTTTATGACAACTTTTTAAAGACTTTAAAAAAAACTTTTTAGAAGGCCAAAACAACTTTTACCAAAGAAAGAAAAAACAGGCCTAACCAAAGAGGTTCAGGATTTTCATCGCCTATTTTTAATCGAATCTTTTTATTAGTAGGATTTGTTTTATTTGTTTGTATATCTAACAATATGAGCGGTAACCCTCTCCAGCCGTTGCCGGGCCAGCAGGTGATCCATGTCGCCAAAGACCTTGACACGGATCTGGAGGCTCTTTTTAACTCGGTCATGAACCCAAAGCCTAGCTCCTGGAGGAACAAACATCTGCCCGAGTCGTTCTTTAAGGAGCCGGACTCGGGCTCTCACTCCCGGCAGTCTAGCACGGACTCGGGCAGCCACCCGCCGCGGCTCCAGGCGCAGCACGTCCGTTCGCACTCGTCTCCGGCGTCCCTGCAGCTGTCGTCGGGCGCGCTGAGCGCTGCGACCCCCGGGCGTCATCACACTCATATCCGACACCAGTCGTTCGATGTGGCCGAAGAGCTGCCGCTGCCGCCGGGCTGGGAGATGGCCTGCACTCCCAACGGACAGAAGTACTTTCTCAACCACCTTGAGAAGATCACCACATGGCATGACCCCAGGAAGAGCATGACCCCGTCGGTGACCCAAATGAGTCTGCACAATCAAGCGTCTAACAGTGCTAACATACAGCAGCGCTCCATGGCCCTGTCTCAACCCAATCTCGTGTTAAATCAGCAGGCGCATCCACAGCACCTGCAGCAGCAGCATCAACAGCAGCAGGTGCAGGCGCAGACGCTTGGCTCGCAGCAGCAGCAGAACTCTCAGGCCAGCATGTTGAACATGAGCGCACAGCAGCACCAGCAGAAGATGCGACTGCAGCGCATACAGATGGAACGAGAGCGCATTCAGAGGAGACAGGAAGAGCTCATAAGACA
GGAGGTGGCGCTCCGGCAGCTGCCCATGGACTCTGATAATATGGCATCTGTGGCACCAGCCATCAGCTCTCCGGCCATGACACAGGGCAACATGCCCAACAACAGCACAGATCCCTTCCTCAACAGTGGGCCATACCACTCTCGAGAGCAGAGCACAGACAGTGGACTCGGACTGGGCTGCTACAGCATCCCCACCACCCCTGAAGACTTCCTTAACAACATGGAGGAGATGGACACAGGTGAGAACATGGTGCCGGTCAGTGTGAATGTACCGCAACAGAGTCGTTTCCCAGACTTTCTGGATTCCATGCCCGGCACCAATGTGGACCTGGGCACCCTGGAGGGCGCTGACCTCATGCCCATCCTGAACGACGTGGAGTCAGTCCTGAACAAGAGCGAACCCTTCCTCACCTGGCTCTAGACTCAAACAGGACACTATAGACTTTTATATATACGTACATATATATATTATATATACACAATCAGCCTCCTCCTGTAGTTTCACTTTGTAGACATCAGTTTTGTTTCCACACACTACTCTGAATTTCCTTTTCTTTTGCTGAGTCAAAGAACAATATTTACCAAAGTGTTTAGCCTGCGAACAAATATGCGAGTACGCGTCAGTAATAGCCGTAGTGTAGAAAGACTAATGTGTTTGTTTTGTAACTGAAATTGGATAGATTTGATTATGTTCAAAATTATCACATGAACACATCCTTTCCACAGCAGACATGCCTGGATAGTGTCCTAACAGTGGCTGTCAATCAATCTGCCCAATCATGTTTAACAGTGAAACATTCAAGAAAATGTTCAGGTAACATTTTACTCCAAAATCAAAAGAAACAAATAAGAAATGTTATTTTGCATAAAGAAAATGAAGGACATTTTAGGACCATCAAGTTTTTTTTTTTGTTTTTTTTTGCATTGTGACATTTTCATGACAATTAAGCATATTTCCCCCCCCCCCAAATTATTTTTAACCGCAATGCGAAAAATCTCATTCTAATTACCGTAATGTGAAAACATAATGAGGTATTAAACTTGTAAAGTATTTTTGTACATTATGGTAGCATTTGGTCTACTGCCTTTATGCTGATTTTTTTTTTTTGTTTGTTTAAATAATTTTATTTAGGGCTTTCAATTTAATGCACTAATTCAGTGCGATTAATTATATAAATAATAATGTGTTAAAGTAATATGGACACTGGCTACCACCAGTTCGCTAGTTCGAATCCAGGGCATGCTGAGTGACTCCAGCCAGGTCTCCTGAGCAACCAAACTGGCCCGGTTGCTAGGGAGGGTAGAGTCACATGGGGTAACCTCCTCGTGGTCACTATATTGTGGTTCGCTCTCGGTGAGGCGCGTGGTGAGTTGAGCGTGGATGCCGCGGTGGATGGCGTGAAGCCTCCACACACGCTATGTCTCCGTGGCAACGCACTCAACAAGCCACGTGATAAGATGTGTGGGTTGATGGTCTCAGACGCAGAGGCAGCTGGGATTCATTCTCCGCCACCAGATTGAGGCCACTACGCGACCATGAGGACTTAAGGCACATTGGGAATTGGGCATTCCAAATTGGGAGAAAAAAAAAAGAAAAAAGTAATGCAATTAATCATGTCTTGAGAAATTCAAGCTTGAAGTACCACCTGTTTTCTCCAGAGGGCAGTAAACGAAACTTCAGCTGTATAGGTAACACGAAGCTTATACAGACAACAAACCAACCCTTCAGCAGACAGCACAACACGAGGACACATTCTTGCATTCAAAACACAACTTGATGGAGTGCAAATCTGAACTTGGGGATCTCAAGAAGTGTTTTTCTAAGTATTAAACTACTTTTAACTTGACACAGTGACCTAAAAACGGTATGATTATGATGCGACGGAACCAAAGTGAGACGCTCCAAAAGCGTCCATCTGACGCAGGTGAACATTGATGCGTTCTTAGACAAGCCCTCATAATAAATCTCGGACTAATTGAAAAATTCAATTACAAAATGA
ATTGCTGTGAACTGTAGGACAATGATAGGCTTATATTCAATAATATGCAAATAAACAATACACACATTCTAAAGCCATATATATATATA\n>KU122020.1 Uncultured bacterium clone 26372 16S ribosomal RNA gene, partial sequence \nTACAGAGGGTGCAAGCGTCAATCGGAATTACTGGGCGTAAAGCGTGCGTAGGTGGATACCTAAGTCGAATGTGAAATCCCCGGGCTTAACCTGGGATCTGCATCCGATACTGGGTATCTGGAGTATGGTAGAGGAAAGTGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGGGAGGAACATCAGTGGCGAAGGCGACTTTCTGGACCAATACTGACACTGAGGCACGAAAGCGTGGGGAGCAAACAGG\n>XM_050382592.1 PREDICTED: Mercurialis annua probable xyloglucan galactosyltransferase GT14 (LOC126688031), mRNA \nGGAAAGTTGACAAGATTCCTTGAAATGTCACAAAACCTTCCATTTTTATTTTTTCTCTCAGATTTATTTCCACCATTCACTAACTTAATTATACACTCTCTTTCACCAACTACTTAACCCTATTACTTCTCTCAAATACTACTCCATTAGCAGCCACCATTTTTGTTCATTATTTCCACTAAACTAAGCTACTATACACAATGCTAGAGAAACAATCCACAAAACGGCAGATGGAAAAATCTGGTTTAGAGCATAATAGATCAGTCTGGTTTGTCGTTTTGATCATTCTGATACCTTTCTTCTTCTTCTTTCTTTATGCTTTTGATTATTTATCTTTATTTGCTAACATATCCAATCAAAAATACGAGAAAAATTCTGATGAATCTTGTTCGGGTCGTTATATATATGTTCACGATCTTCCTCCACGGTTCAACGATGATATTCTTGAAAATTGCAGTACCATTAACAGATTTGTTAACATGTGTCCTTTTCTGAAAAACTCAGGTTTTGGTGTTCAGGTTGTTGGAGACTATCCTGACGGGGTCGATTTAGGACAGAACTGGTTTGCAACTAATCAATTTTCTTTAGAGGTTATATTCCGTACTAGAATGAATTATTATGATTGTCTGACGAATGATTCTTCTTTAGCTTCTGCCATTTTTGTACCGTATTATGGCGGACTCGACGTGGTTCGATACCTGTGGGATTATAATGCTACAAGAGATTATTTAGGTGTTGATCTTGTCAATTGGCTAACTCAAAAGCCTGAATGGAATAAAATGTTTGGTAGAGACCATTTTTTTGTTGCCGGAAGAATTTCTTGGGATTTTCGACGCCTGAACGATCAGAATGACGGTTGGGGAAGTAAACTCATGTCGTTACCTGAATCTATGAATATGACAATGTTGTCAATAGAATCAACTGCGTGGAGTAACGAGTTTTCAATACCATATCCGACTCATTTCCACCCGTCAAGCGACGCTGAAGTGATCGAATGGCAAAACCGAATGAGAAAGCAGAAGCGGAACTATTTGTTTAGTTTTGCAGGCGCTCCAAGGCCTGATCAGAAAGATTCTATCCGTGGACAGATAATCGAGCAATGTTTAGCTTCAACAGGGTTATGCAAGTTGCTCAATTGCAGTTCGGGGAACACATGTGATAATCCTGTCGAGGTGATTAAGGTATTTCAGGATTCTGTTTTCTGTCTGCAGCCTCCAGGGGATTCATACACAAGACGATCAACTTTCGACTCGATTGTTGCAGGATGTATTCCAGTTTTCTCCCATCCGGGATCCGCTTACGCACAATACGAATGGTATTTACCGAATAACTATTCTAAATATTCCGTGTTCATACCGGTGGATTTAGTAATAAATGGAAGTGTCAGCATTAACGAGACTCTGATCAAGGTTTCTGATGATGAAATTGTGCAAATGAGAGAAGAGGTCATA
AAGCTGATACCAAAGATTATATATGCAAATCCTAAGTCAAAATTAGAGAGTACTGAAGATGCATTTGACATTGCAATTAAAGGAGTTCTTGAAAGAGTTGAAAAAGTGAGAAGCAAGATTGATGAGGGAAAGGATCCAGCCGTTGGATTTGCAGAACCAAATTGGAAGCTCAGATTTTCAAGAATGGGTCTACAACAAAATTGGACTCATTTCTTCACGTAAATGAAAATGTTGAAACAGAAAATGGTAAAATTAGTACAGTTTTATAAATATAAATTTTGGAAAGTTATTTTGAAATCATAAATGCAAAAATGTAGGACTTAATAAATTTTTGTGAAATTATAGCTTCTGAAAAGTAATGTATATTAGTGTGGTTAATTAGAGGTTCTAGCATTTGCATAATAGCATTTCTTCTGTTCACAATTCTCTATGTGATTAGATGATATAAGTTTTGGTGGAAATTTTGCAGTCCACCAATTTATA\n>XM_022914722.1 PREDICTED: Durio zibethinus uncharacterized LOC111313871 (LOC111313871), transcript variant X2, mRNA \nTCCATTTAAGATGCAGATAGTATGTTTTCCAATTTTCAGAGTGATACCTTACTGTATTGATGATTCGAAGCCAAAAATTTGCAGTCCAAGAATCTCAACTCACCATTTCACATTTCACTGTAATGAATTTTTACAGGCAGACTCCAAGCTTGGTCTCTTCAGCATCAAGATTCCCTTTCAACCAACTTTGTTAGAAGACTAATTCCTCAAATGGTCACTATCCATTCATGAATTTTAAATTCCAAGGTGACGTTTGCTCTATAATTGAATTCATTTCCTGGGTTGTTTTCATTTCGGAAAATCATATGAGATTTCAACTACATTTCAGTCCATCCTTGGGCCGGTTGATTAAGGTAAAAAACTTGAGCCAGAGTCCCAAACTCGACTAATCATAGCACAACACGTGTTAGTATTGAAGAATTTTTAATAAAAAAATAACAATTGAATTAAGTTTCAGGTTCATTATTGCGGTTCTGCAGATAAAAATTTTGGCAACTCTTCTACCTCTGGAGTTTCCCTGTTATCCAGCATTGCTGTTGTCATAGTCGGCATATCTTTATTAATTACAAGTGCTTTTAATTTCTTATCAGCCAAGATTTGGACTTGCAACTGCAACAAGAAATATTCTAGTTTGGCTTGACAAATCTTTGAATGCGGAAGAGTGGAGATGAGACAAGTTACTATGGGTTGTAGCAACAAAGACCAGGTGGTTTCACATGCAGGATTTAAGGACATGATGGAAAGTGAAATCAATGAATCCCCTTTTGCATCCATACCGAAACCACCTATACAAAGTAGCAGACCAAGTAGCATGGTTGTTAAGAAAGCACATACTGTGATTCCAGCTCATATTGTTGCTGAGGCTATATCAACACTCCTTGGTCTTGATCTCAGATGGTCAGGACCCATCACACAAACAGAAAGAGAATATGTTGAACAGTATGTATTGGCAAAATACCCAGAGTATGCAGGGCAAGTTGAAATAGAACATATTGACCTCTCTAGTCTTTGTATCAATGAAGAGTCGTGTGAGCCTGCAATTGATGATAAAAAGAAATCACCTAGAAGAGAGTCCTCCACACCTTCCTTTGGAAGCAATCTTCCCGACCTGGACAGGATTCAATTGGAGGCATCGAGACTGCTCGACATCCTCACCAAGAAATCTTCCTTTCCTGGAAGTTTCATTTCAATTCCTGAAATTCAAGCTCGAAACAAAGTTTTGAAGCATTGCGGATTACCAGATAATGACTATCTTGTTCTGTTCACTCCAAACTACAAGGATGCGATGATGCTAGTTGGAGAAAGCTACCCTTTTTTCCGAGGGAACTTCTACATGACCATCATTGGTGAAGAAATGGATTACGTACGAGAGTTTGCCAGTTACAAGGAAGCAAAA
GTGATCTTGGCCCGTGAATCTTGGTTGGATTTGAGAATCAAGGGATCACAACTTAGCCAGTACTTCAGGAGGAAGTGTAAGCACAGTCCAAAGGGTTTGTTCTCTTATCCAGCTGATGTAAAGGGGATGCGTTATTCCATGCATTGGATTTCAGAAGCTCACAGGAATTCATGGCACGTTCTGCTTGATGCAACTGCCTTGGTTGTTGGACAGGATCGATTGAACCTTGCACTTCATCGACCCGACTTTGTTCTTTGTAGTCTGGAGAATACGCACGCTGATCAACCATCAAGGATAACTTGCCTTCTGGTCAGGAAGAAATCCTTTGAAACTACAACATCTTCATCTCATGTCACCGAGTGAAAAGTGGGATTAGCTTTTGTGAATACGCTATATGTTTAAATTATTGAACCCAAATTTATGCCAATATATTTTGGAAGTAGGAAACTTCGAACAAATATAATTAGTTACATTTATACAATTGTGGCAAGTTTCTAAAGTTGTTTACAAGGATTCTTAAATCTTAACCTCAGCTGGTTCCTTTAAAGCTGGGGTTTCGTTGCTTCAAGCTACCAATTCGAAAAAAGAAAGCCTTTCAAGCCAACAGAAAAGGAAAAATTACATAAAGAGTTGAGTTTCTTTTTAACTTGGAAATTTGGTATACTTGAAAATTCTATTACTTGGAGAAGGCATGTTTCCACTTTATCAGGTCAAGGTGTATTTTCATACATTAATCAAGTTATTTAGGTGAAAAACTAGAAAAATTCAATGTCCAACGCATTAAAAGCATGGAGTCCAAGTGTCAGAACTAAGGACAATCATCTTTAGGGTAATGAAAAATTCATGGTTTTTTCAAAGTGGACCATGACATTTTTCATGCAAGTCTGGTAGGGTGGAGATGGTTTAAGGTTTAGGCCCATCACTGTTTCAAAAAGCCATGTCAAAAGTCTTCGCTCCCATCCTCCATGTTTTTCAAGTTTACTTGTTTCTGGATTTGCAAGTCACAATCTTCAAGCGATCAATTCAATCAAACAATTCCTCCATTGTTACTCGGTTTCTGGCTTAGCAATTTGTCACCTTTACCTTCATGTTAAATAGTCATAGTGAGCTCCAGCCTTTGGTGAAACTTACTATGGATATTTGGTTTGTGATTTTGGGTTCTGGGCTGGCAAGGCAAAATGATTTTCCATTTGGTTCCTTCAAAGAAA\n>XM_005089107.3 PREDICTED: Aplysia californica serine/threonine-protein phosphatase 6 regulatory ankyrin repeat subunit A (LOC101861246), mRNA 
\nGCGCAAGTTCACCGTCAAAGTGATAATTTTTTTTATTGGATCTGCCATTTTCTCCATTATAGATTTTTTTCTTCAGGGTAAGTTATGTGTGTAGATTATTGCTATATCCATAAGTGGCGACCTCTTACAGCCTGGCTGGTGTATTAAAATGGAGCCCAAACATTGGGCCCGGTAACCCGGCCTGGCACCCGCCACGACTGGACGCACAATAAGGCACACAATATACCCTCTAGATTGTAAGGCGAGCCGGGCGATCACGGGAGTTGGGGGTGTCAATACTGCCACAGAGGCGGCGTGCACACACCGCTACACCACAACGACCCCAGAACGAAACCCTGACCAGGTGAACAAAGGCGGACATAAAAAGATCGCCCGGTTTGCTTCTCAACTCGATCGATTTCAGGCTGACTGAAAAAAAAATTCCGATACGTTCAGTTGTAATTCTACATGCAAATCTTTGTGTGGTGGGATCAAATCAGAGCGGAGAGGCTCTTCGGATACTCGGCTTTGTTGTGTATTTGCTGGTTGACTGAATTCTGATAGCCATTAGCTTTGAGCGATCGAGTCGCCCCACTCCTGGTAGCTGTGTGTAGTGCAGTCTAAGCAACACAGTGCTCGCCTGGACGTACGTAAGCCTACAGTGAGAACACCGGTCCAAAGACAGGATTATTTGATCTGTGCAGACGGATAGTGCCGGATTAGTGAGATTGCACTCCTGCAGGATTGCTCCAGCCAGCGACTGTGCCCTCTTGTGGCTATGGAGATCTAAAGAGGACAAGCCTTACAGTGCCGGACCGTACAATACAATAGTGAGACAAACCCTTGCTGAGTTGGATACTTTTGGATTCTGTGTTGGTTGAATTTAGGTGGTCTCACATTCTTTTGATATACTACAAAACCCAGGAATCTTGAACTTACCAAAGATGTTGGTCTCATCTTTGATTTGCGACACCACACGACGATGAAAGACAGAGTCGCTGGTCAGACCTGTGTCCACATCATCTAGGCAGCCCCACAAGACGACTTTGCGCTGGCCACCACAGCCCGTGGGTTTGTAAGAAAACTTTAGGATAACATAATGGAGAAAATAGCCCTGCCACCCCCGCCGTCCAAGAGACTGGTGAAGACAGCGCTACATCAAGCAGTGTTAGATGAGCGCTTACATCAGGTTCGGCTTCTTGTGGACAAACATGGAGTTGGCATTGACACCAAGGACGTCCATGGCAGAACGCCTTTGATGCTTTCCTGTATCATAGACAACCATGAGTTAGGATACAGAATGGCGTACATATTACTAAAAGCAGGAGCGTACTTGAACCTTCGGGACGGAATGGGTCGGACAGCGCTCAGTTATGCCTGCATGAACGGCAGGGAAAGCTGTGTGGCTGTGTTGCTGAAGGAAGACGTGCTGGACATTAATGAACCAGATAATGACGGCAACACGCCACTACACCACGCCTCTACCTGCGGCAATCCTCGCATTGTGGACATGTTGGCCAAGGCATTTCATAAGTTCGGCCTGAACGCTGACAAGAGAAATAACTTGGGCTACACAGCTCTACTGCTGGCCTGTAAGAGCGGCCACTACGTGAGCGCACATCTGCTGTTGACCGTGGCCAAGGCATCCCCCGCTCTGAGAGATGGAGAATTTCACCTCAACGCCACTGAATGGGCACAGAGAAGTCATCAGATCCAGGCAAGGTTAACAGATCGGTCATTCTTAGCCTCAGCCCCTGCCGCCACTCCGCGGCCCCTCGCTGCGCTGTCGTTTGAGCGTGAAGACAGCATGTACCAGAGACCCTGGGTGCCCATCTGTCGCCTGTACCGAGTGCCCAACCCTCACTTCTCGGCGGACAACTTCAAGCTGCCAGACATCCTTCTTCCTCCACCGGGCATCAGGAGTGAGCTCTTCTTGGATGGGCTGGATGCCCGCCAGATATTGCTGAACGAGATCGAGCTGTCAGAAAGTAAGACCCGACCTGTCTCCACGAAGGCGAC
ATTGTCGAAGTGGAGCCATCCTCCAACAGCCAAGCTAAGGAACATCTCTCAGAGGAATGCCCCGTCCTCTGCTTCCGTGCCCGACATGGTGACGATGTTCAAGATGTACTGCGAGCAGTACCAGCCAGACTGGCGCACGATGAACAAACAGAGGCGGAAGACGATGGCCGTGGGTGGGCAAGGCATGACGTCCAACAACAGCAACCACTCCTTCTCCGACATAGCCGGGGCCGCCCATGGAGAGGGCGTGGAGATGCCTAGTTGATTACGTGTTGACTGATTTATTGAGGGCTGTGTCGTTGTGAACTGTGACATCTTTTTTTTTTTCAATCTTAGTCTCTGATGAGACGATTGATTATAACTATCGGACAAAACGTTGGTCAGCTGTTCAGAAATACTAAGCTCAAATTTCGTTTGCTTTTGTATAAAAATTTTATTTTTTTTAAAGTAAAGTACAGCAGCTTTACTGGAACTGATTGCATGAGCTCAAGAAGCACAATTTTGTCGAAATTCAAATTCTGTATGTCAGAAAGCAAAATTTAAAAAAAAGAAATGAAAAA\n>XR_006395823.1 PREDICTED: Acropora millepora uncharacterized LOC114972299 (LOC114972299), ncRNA \nTCTAAGAAGTGCATATTCTTTATAAAAAAATCAATGAAAGGAATATAACATAGTTCAAGTGCGCTTTCCGTTTCCGTACGTAAATTGTCAAGATTGCAAAGGACCGAGAGTAACTTGAAAACTGTACACGGCAAAGTCTCTGTATAGAAGTCTTAACCAAGTTGAACTCATGATTAAATTGGAACCAGCGCCTCTGAGAATACCCGATTGTTTGGATCTGCGAAGTCGATTCATCCGCAAATTGTCCTCTGTTTCAGGGGAGAGGAAGCCTAGCCAATGAGTAATTGATAACATTGCCGACTACACGATCGTACAAACGCTTCTCTTATGGCCAGACCAGCTTTATGGAAGTCGCCCGCTCTATGGAATGTTTGTTCGACATATAGCGTTCAGTCGAACAATTTCATCATTGACTCGGTTTTCCTTACCGATCGAGTTTAATTTGCAGCATATCAACGATGAGTCACGTTCACATGACGTAGTAGACATTGCATAATACGGCCTCATATGGACTCACGAGTTGGCAGGCGTCCACTCACCCACCCATAATCCTATTCTTGAGGTTTGTTTGTATTTTGACACAACTTTAGTCCTCTCTGACAAGCATGAAATCAAGACACAAGATACTGAAATAGATATTGAACTCATTTCAAGCTGACATCTTTTATTTGCTTAGGCTGTTATATAAATTAAAAGTTTACTGGTTTTATTCTTATAACATTATATAAAGATCAGCATAGTAGATCATGA\n>XM_002951530.1 Volvox carteri f. 
nagariensis hypothetical protein, mRNA \nATGCCCGCAACTGACGATCGCGCGGCGGACACCTCCTGGCTCCACGTCAGCAACACCATCGTGTACTTCCTCGCGTTCTGTATCAACGTCCTTGTCAACTCGGGTGCCGTATTTCGTACTGTACGTTCAGTTGACCGGCAGTTCGGACCCGTACTCACACCTGCCGGATGGTCGTACTACATCCGAGATCTGACGCTTTTCTTATGGGGTCTAGGAGTGACGTGTCAGAGCTTGGTGGAGCACAAGGGCTGGAAAGACGGACTCGTGGCGTGCATTGGCTACTCCTGTTTTCCCCCCCCCCCAACTCCCCGCCCGCGCCACCCCCGCCGCCTACTGACCCGGGTGGCAGTGCTGGTTCCGGAGCTGCAGAGGGAACTGCTGGCGGCGGGGTTTCGGGGTGTGCCCCCCCTGGCCTACCTAATCTACGTGTACCCAACTTCCCTGGCGTGTGGCTGGCTGCTGGTGCACCAATGCCATGTCACCGCGCTGGCAACTGGCCTGGTGACGAGCTCGCATCAGGCGGCGCTCAACGTTGGTTGTGTGACGTTGGTGCTGGCGACTGCATTGGCGCTCCTGCTGCTGGTTCGCCTCCGCGACGTGGTGTTTGGACTTGCCTTTACCTGGGGCTGCGTGGCGGTGTGGGTGGCTGGGTTCACCACCCAGGAGGATTACCGCCCGGACCAGCTGGTGGCCTTCTTCTGCGGCCTGGTCATGGGAATGTTGACGTACTGCGTAGCGGCAGGGCCGCAGGTCAGGATGGCGTGGGGGGGATGGACGGCGGCGGTGACGGCGCCGGCAGCGGCTCTGCCGCCGCCACCGCCGCCGCCGGCACCGGCAGCGGCTCCGCCGTCGCCTTTGGCTGCTACTGGTGGTATGACATCCGGAGCAATACCAGCAACGAACAACTAA\n>XM_041800643.1 PREDICTED: Cheilinus undulatus beta,beta-carotene 9',10'-oxygenase-like (LOC121518372), mRNA 
\nTTGCTGGTTAAATTATGGTCCATCTGGAAGCAGATGCAGACAGAAGAAGCTGTGTCCATCCATTACGACGTCGTCCATGGCTCCGGTGAAGTTCGACAGCTCAGATGCCGCCGTTCCTATTGAAAATGGGCCAGCCAAGGCATGTATCACCTCTGTACTGAAGGGTCTGGAAATGATCGCCCCTCTGGTCCGCTCTATGGAGGAGACCCCTGTGCCCATCCCCACTGAAGTACATGGGACCATCCCCTCCTGGATCAATGGAAACCTTCTCCGCAACGGCCCTGGGAAGTTTGAGTTTGGGAACACACACTACAACCACTGGTTTGATGGCATGGCCATGCTGCACAAGTTCAAGATCGAAGAAGGCCAGGTGACGTACATGAGTCGATTTTTACAAAGTGATGCCTATAAGAAGAACAGTGAGAGGGACCGCATTGTGATGTCAGAGTTTGGCACCCTCGCCATGCCAGACCCCTGCAAGAACTTCTTCCAGCGCTTTCTATCTCGTTTTGAGATGATTGAGGCCACTGACAATGCAAGTGTGAGCTTTGTGAAATACAAAGGTGACTACTATGTCAGCACAGAGACCAATTTCATGCACAGAGTGAATCCTGAGAACCTGGAAACATTGGAAAAGGTAGACTGGAGCAAGTTCATTGCGGTAAATGGAGCCACTGCCCACCCACATGTTGATCCTGACGGTACCACCTACAACATGGGAAACTCGTACGGAAGCAAAGGGGCCTTATACAACATCATCAGAGTACCCCCAGAGAAGAAAGAGTCCACAGACACCCTGCAGGGAGCCAAAGTACTCTGCTCTATTGTGCCTGCAGACAAGGCGCACCCCTCCTATTACCACAGCTTTGCCATGTCTGAGAACTATGTGGTGTTCATCGAGCAGCCGATAAAGATGGACCTGCTGAAAATAGTCACATGCAAGCTGAGAGGGAAGGCCTTGAGTGAGGGCATCTACTGGGATCCAAAGCTGCAGACTGTCTTCCATCTTGTTGACAAGCGCACTGGCGAGGTCAGCTCAGTGAAGTACCACACCAAAGCCATCTCAGTCTTCCACCAAATCAACGCCCACGAGGAAGGTGGGTTCTTGTTGCTCGATATGTGCTGCTCTGACGATGGTCAAGCAATCAACAACTACCTGATCCAGAACCTACGCAAGTCAGGAGATGCTTTGGATGAGGTGTACAACACTCTGTGCCGGGCTTTCCCTCGCCGTTTCGTTCTTCCTCTTAATGTGACCAATGAAACCCCATTAGACCAAAACCTGAACACTCGACCCATGAGCATGGCAACCTGTGTCAAAATCGGCAAAGACAAGGTGTTCTGTCAACATGAGGATCTACATGGAGAGGACCTGCAGGAGTATGGTGGACTTGAGTTCCCACAGATCAACTACAGCAACTACAACACAAAGCCATACCGCTATTTCTACGGTTGTGGCTTCAGACACCTGGTGGGCGATTCTCTGCTCAAGATGGACCTGAAGGACAAGTCGCTCAAGGTGTGGTATCAGAAGGGTTTCTACCCATCAGAGCCGGTGTTTGTCCCATCACCAGATGCTGTGGAGGAGGACGAGGGTGTTATCCTGTCTGTGGTTCTCACCCCCTCACAGGATAAAGGAACATTCCTCCTGGTTTTGGATGCTAAAACATTTGAAGAGCTGGGCAGAGCCAATGTGCCGGTGAACATGGCTTATGGCTTCCACGGCACATTTAACGCCTGTGAATGAATGATGTGATGTGTTACTGATGTTGACTATAACATGAAGAATACCAGTGCAGTGTCAACCATTATAACCACTATAATCCAGATGGTACTGACTCACAGCTCTACATGTTAAAGACAGATCTTCTGTTACTGAACAAATGCTCTTTTTCATTGGTTTCTGGTTTGAAATCAGACCCAAATGTGATGGTATTGATCAGTCCAATCATATTCAGGCAAACTGAAGATGAGTATTATAAATACATTCCTTTGGCA
TTAATTGTGCTGTCGTTATTCGCAACAGAGTGTTATGACCTCTTATTCTGCTGCCTTAATCCTGGTCATTGCAGGTTGTAGCATGTTTCAACCTTTAGGTCACTGAAGTGCCAAATGCTTTTCTTTTGTACTTCTTTTTTAATTGAGCAATACATTTTTGAGCTTGCATGAAATTTTGAACTTTTGTAAACTCTTCTTGGCATTAAATTTACTATTATATGAA\n>XM_003028818.1 Schizophyllum commune H4-8 Mg2+ transporter protein (SCHCODRAFT_01102597), partial mRNA \nATGCCAGGAAACGTCGAGACCGTGTCCGGTCATTTCAAGAAGTCCGATCTAAGCGCCGAGCATGGCCTCAATATACGAGATCTCCGCAAGATTGATTCTCGAATACCCAACCTCGTCCCCACTATCCTGGTCCGCAAAGAGTCCATTCTAGTCAACATCCTCCACCTCCGTGCCCTCATCAAAGCCGATGCCGTCGTCCTCTTCGATACGTATGGCTCTGTCGACTCCAGGCTACACTCCACTTTCCTCTACCACTTGCAGCACAACCTCCGCAGCAAGGCCACCGGCCTCCCCTACGAATTCCGCGCCCTTGAGTCCATCCTGCTCTCCTGTCTGAGCGCCCTCGAAGTCGAGATGGTCTTCATTCGCAACCTCGTCGGCACCCTACTCGCCGAGCTCGAGGACGACATCGATCACGACCGGTTCAAGCGCTTGCTGTACTACTCGCGTCGGCTGGACAGCTTCCAGAATCGGGCGAAGTTGGTGCAAGACTGTTTAGACGAGCTGCTCGACACGGACGAGGACCTGGCGGCCATGTACCTGACGGACAAGAAAAACAATGCGGAGCGGCCGGATGAGGACCACGAGGAGATCGAGTTCATCCTGGAGTCCTTCTCGAAGCAGGTGGAGGAGATCGTGAATGAGGCGCAGAGTATGCAGAGCAACGTCCAATCCACCCAAGAGATTGTCGAGCTCATCCTGGATTCCAATCGGAACGCGCTCTTGACGCTTGACCTCAAGGTCTCCATCGCCACCCTCGGCATCGGCATCGGCACGCTCATTGCAGGCCTCTTCGGCATGAACCTGCGCACAGGCTGGGAAGACGACGCGCACGCCTTCTGGGTCATGTCGGGCGTCTCGGGCGTTGTCGCGATCATGGTGGCGTGGAGGGGATTCAGAATACTTCGCAAGATCAGGAAAGTCGGCCTGTCGAGCACGCATAGCCCACGGCAAAGGAGGCGACCCTTTTTGCCTCTGCCTTTAGGGCGCGAGCGAATCGGCGACGGCTGGCCATAG\n>XR_007359457.1 PREDICTED: Ostrea edulis uncharacterized LOC125645827 (LOC125645827), ncRNA 
\nACACCCGCTGTGAGTCCTGTATCTTGATCATTTAAACAGAGTTAAATGGTTAAGTAATATAGATAGTGGCAAAATAACAGGTGTTCTTTTCATTGATCTTAGTAAAGCCTTTGACACTGTAAACCACCAGGTATTGTTACACAAGCTTTTATCATTTAGTATTTGTCAAAATTCTTTTAAATGGTTTCAGTCTTATCTTAGCGGAAGATCACAATGTGTTAGATGGAAAGGTGTTTTGTCAGATGAAAAAGATGTTACAATAGGAGTGTCTCAGGGGTCCATATTAAGTCCATTGTTCTTCATTTTATTTGTTAACGATTATCCTAAATGCCTAAAGCACTCAAATGTCTCTATATATGCAGATGATACATCTCAGGATGTTTCACATCAATCTATTGATGTTATTGAGCAAAGGTTACATGATGATCTTTTAAACTCTATGAAATGGGTGAAAAGTAATAAACTTACGATGAATTTAGAGAAAACACAATGTATGTTGATTGGCACTGCACAAAAACGCTCAAAGTGTAGAAAAATGTGTATTAAATTAGGAAATATTGTTTTAGATACTGTTAAAAGGGCCAAACTTCTTGGTGTACAAATAGATGAATGTCTAACCTGAAAAGGGCAGCCAGAATTATATTGAAGGTGAAAGTAACTCAGACTTCTACAGCTGATATTTTTAGTGTTCTTGAATGGATGCCTGTTCATGATTATGTTGTATATAGAAAACTAGTGCTTGATTTTAAGGTTCTTAATGACATGACACCAGAATATATGAGAGTTTTTAGTTTTGTCAGCCAAGTTAGTTTCAGAACAACAAGAAGTAGCGATAGTGGCATTTTATATTTACCAAAAGTTTGAACTGAATATTATAAATGGTCTTTTAAGGTATCCTCCACAATTTTATGGAATGAGTTGCCCGAGTCTGTCAGAAGCTGTGGTTCTATTACATCTTTTAAATCAGCATATTTGCAGCATTATTACTCAAATAAGTGATATATAGATATGATGTATATGTTTATTTTTCCCCAGTGATATGGTGTGTATATTGTATGTATATATTTCATATTATGTTATCTATTTTTCTATTCTTTCATTTATCTGTCTGTCAATATGTCTTATACAGGACCACAATGCAAACTAGTCATTTGTACTAATTGTGCTATCCTGTCTAAATAAAAGAATTTATTTAT\n>XM_011701982.1 PREDICTED: Wasmannia auropunctata histone demethylase UTY-like (LOC105457365), transcript variant X2, mRNA 
\nAGACAATAAGAAAAATTACTATTATCTTCTTTACTTTTCTTACTGAGGAAATAATCCTCCTCATTTATCCGATTTTTTGGGGTGTTCCGCGCTAAAAATAGTTTCAAATCTTGTCATACGTGAAATCTGCATAAAATTTTGTAAGAATTTTATTTCATATCTCCGTTTCGTATTTGCATAGTCATGTCTTAGATAGGGAATTATTTCGAGCATTTATGGCATAATAATAATATAAAAATATTGCCGGGCAAGTGATATGATTATTTGGGGAATAAGGAACGACGCTATGTCCGATGATTATTGTTTATCTGTAGTAGCAAAAAATTTCTAACAGGATATTTAAACCAAATAGCTTTAGTGTGTGTGGGGGGGGGGAGGCCGTTTATATTATTGAACCTATGTCCTTTGTATCCGCATCACTTTACCTTCAAATCCAATATCAAATGTGTTAGCAAGAACAGTCGCAGTTCGTTAGTGGTTGTGAGAACAATAGAGAATTTTAACTAGTATACACGTATTTCTTATCTTGCAAAGAGTCTGTATTTCCTGCTTTTTATAATTTTAATTTAATTATCCATCCAGACGGCAGTTGAAAGAGAAAATAAATCTCAATGAACGCCTCAGAGATTATCAAGCTGTGCAAAGAGCCGATCAACCAACGATTAACGGAAGAGCAATTGTCGCCGCCGGTACCGAGCTATCACGTGAACAGCAGAACGGATGCATTCCATCCGAAGCTGCAGAGAACCTGCCTGGATTGTCCCGTTGCCGTGATACGCAATCTCACGGCAACGCTCGAGATCAATCTGGACCTTTATTCGACTAAGACTCTGGTTGAGACACGGCCAAATACGAAAATCGACATACGCGAGCAGAGAAGATACGCTTTTGATGAGAATTGGGACGAGGAGAGGAGAAAGAAGAACTGGGCGTGCACCAGTAAAATGAGTTACATGACGATCAGCAAGTACGCGAAATATCAAACCGACAGGCTTCTCGAGGAAGATCAAACTCTACTCGAGGAAAATCGAAATCCCAACTTGTCTACTTTCGACGGGCCCGACAAAGTGACCGAACGCAACAAGACGGTGAAATTCGCTACGAATGTGGACCTATCGAAGCCATGCTGGAAACCGCAGTTGAACGAATTAACGAAGTTACCATCCTTGTTCAAGGTGGAATGTGCCGACAATATGCTTAGCTACATGTGCCGCGATCTCCTAGGGATGAATACCGTACAGTTATACATGAAGGTACCCGGCTGCAGAACGACCGGTCATCAAGAGAATAACAATTTCTGCTCCGTCAACATTAACATCGGACCGGGTGACTGCGAATGGTTCGCGGCGCCGCACGAGTACTGGGGCGTGATAAATTCACTCTGCGAGCGAAACGGCGTCGATTATCTGCGTGATCCCTGGTGGCCGCCGAACCTGGATGTTCTGCGCGAGAATAACGTCCCGGTGTACCGATTCGTTCAGAAACCGGGCGATATCGTGTGGGTGAACGTCGGCTGCGTGCATTGGGTGCACGCGATCGGCTGCTGCAATAACATCGCGTGGAACGTCGGCCCGTTCACCGTCAAACAATATCAGACAGCGATAGAACGTTACGAGTGGAACAAGCTGCGGCAGTACCTGTCGATCGTGCCGATGGTGGAGCTTTCGTGGAACCTGGCGCGCAAAGCTAAAGTGTCGAATCAGCTGTTGTATCAGCTGATCAAAAACTGCCTGTCGAACACGATGAAACAAAATTATTTGACGCTGGAGTTAATAGAGAGCAAGGGTCTGACAGTGAAAAAATACGCTGACGAGTGCGAAAACGATGAGACGGCTTATTGTGAAGACTGCGCTGCTGAGATATTCAATATAATAATCTGCAAGCGCAAGAGCAAGAAGACGAAGACACATCTGGTATATTGCCTGGACTGCGCGCTGAAGCAGTCTACTTCGCTGGAAAATTTTGTCTTTTTGGAGAAATGTTGTATGGAAAATTTGA
TGAACATTTACGATAAATTCGTATGCTACTAATTATCGGTGCTATCATCACCATTTCCTTATTATCAGCGTTGATACTTTGATGTCGCAGGTCGCAGACACAAACAGCTAATCTTATTGGTATAGCGATATTAGATATATGAGCATCTCCTTCCTACGAATATTCTTGTCGAAACATATTACAGTAGCGAGAATAAGCATCTTTTTTTGTGGAATTATCGAATTTCATTCTTCTTTTATACACTTAATTTTAAGACTGAAAAACTCATCGAACGTCTGTATTGTGAATTTAGAGTCAAACAAGGTTCCTAATCATGAACATTAAAATTATGTGCACTCTAT\n>XR_007367990.1 PREDICTED: Ostrea edulis endochitinase-like (LOC125669718), transcript variant X4, misc_RNA \nTACGTGTGTTTAAGTAGCACAGTCGAGCAGCACAAAGCGGAGTCCCGAGTAATGTGTGGCGTGCTCCTCTGCTTAGAAGAAGGAACTGTTATATTCACATTTGATGTCAATACACTAATCTGTCGAACTTACAAAGAGGAAGATTTTATCGGATGCCTCTTTCAAGCTTGTTCGACCTGTAAAACATACGGATATAATGAGTTGGAAACCACCACCGCCGCCAATGCTGGTACCACAACAGTACAAACAACCCAAGATACAGGACAACAAGGTTCTATAACAACAGTACAGACGACCCAAGACCCAGGACAAGAAGAGTGTCTCAGTCATTGTGAATTTCGTTGAAAAACAAAATATTTTATCTTTTATTCGAATCAACTGTATCCTGCACAGGTCTTCATGGAGCACTCCTTCCTCATCCTACCGACTGTTCTAAATTCTTCGAATGTGTGTACACGAATGCCGTACCACGTGTTTGTGCCGTCAGCCTTCATTTCGATGTCAACCGCAATTTGTGTGACTACCCAGCTAATGTTGACTGTCAGTCGTAAAGCAGATTTCAAAATTAATTCTCCACGCAGGACAATATCATTGTTATGCTATTAGCACATGTAGAGTTATAAGTGAATCTTCGCATTTCAAGATAATTAATATCATGGTGTTTGGCGTGTAACAAATAATTAATGATTAATTAAAACGGAGAGGATTTATATAGGCAGTGCCTGCTGCCCAATCCTATTATGAATTATCATAATAAAACAATATTTAAATCAAATTAATTATTTGTT\n>XM_024808092.1 [Candida] sorbophila hypothetical protein (B9G98_01534), partial mRNA \nATGAAGCTTTCACTCTGGACTTTGGCCGTCGCACTCCCCCTTGCTTGTGCCCAAAACAACAACAACAATGAAGATCACAATAATCACCATTCGGAAGTGAATGGTAATAACAACGACCAAAGCCAAGACCATAACCGCACCCGTGACTATAACAACTCACATGATCACAGTCACACTAACGATAACGACCAGGGTCATAACCGTACTCGTGATTACAACAACTCACATGACAATAACCACACCGACAATGACCAGGATCACGACCAGGACCATAATCGTACCCGTGACTACAACAACTCGCACCATAACGAGCACACCCGAACCAATAGTGCAGTATCTACAGGCACTTCGGCCAACGGAGGTAAGCCCTCTCCTATCGGTGCTGGTGTTGGTAGTGCTGCTGAGAGTACCAAAACTGATATCAAAACATCTACCGTGACTACAAGTTCTACTAAGATCGCTTCCACCACTGCCTCTGCCAGTCACAGTAGTACTACCAGTTCCGCTAGCTCTTCCAGTGTGTTATCCACTTCCAGCTCGACCAGCTCCACCTCTTCGTCTTCTAATGCTGGAATGGCCGTGGTCGTAGGCGGGTCTACTATTTTCGGTGCCGCCCTTTGTGCTATAGCTATTTTGTAG\n>XM_028677370.1 Plasmodium 
relictum conserved Plasmodium protein, unknown function (PRELSG_1111000), partial mRNA \nATGGATAACAGATATAAAGATGGAGAAAGTAATACTAATAATTTGGAAGAAAATGATGTGAATAATTTTGTTTTAAAAAATAAAAATGACATAGAAAGCAAATCAGAAAAGCAATTAAATGTGAATGAAAATTTAAGTATGTATAATTCTTATTATCAAAATGTACTGAATATTAATTATAAAACAATAAATAATGAAAAAAGGGATATAAAAAACGAGCAGAATGTGCAAATTAAAAAGTTAAATGATATTAATATAGAAAGTAACTATAATATGAATTCTGCTACTATTGGTAGTAAAAATACATTAAGTAAAAATAATAATAACATTAATGGTTTGTTTAATGATTTTAGAAAGAATAAAAATAATTTTTTCAATTCAGAATCTAATTATCTTGAGGAAAAAACAGATACAAATAATTTTGATGAAGAAATTAAAACTAATTCAAAGGATAATATGGAATGTATGTTATTTAATAAACTTAATCATAACACAAATAATAAAATTAGTTCTGATGAAAATAAAAATTTAAATAATATTTATTCAAATACGAACTTCTTAAGTGATACTTATAATAATGATTCTAATAATGATGTAAATAATTGTAACTATAATTATATTAATAACGATAACAGCAATAATATGAGTTGTAACATAAATAATATGAATAAAAATAGAAATAATATATATGATAACTTAAATAAATCAATTAATGTTAATGTTTCAAATAAAAACATTAATAAGTTTTGTAGCACAAATAATAACAATAACAATTATAATAATAATAATAATAGTATTTATAATAATGCAAATATTGTAAGTAATTCAAATAATAACTCTTTTAAAACTTATAATCCAAAAAAAAAGACGAAAAATATAAATAATTTTTTAAATATTGATGTAAATGCAAATTCAGAAAAAAATTCTTCCATTATTAAAAAAAATTGCTATATAAAAAATTATCTAAATCTAGAAGGTAATATAAAAGGTAGAACTGATATTGAGAATTTTAATTATATTAAAGAAAATAAGAAAAGTGTAACAAATAGCATAAGATATAATGATAAAGAAAATAATAATTCTATTTTAGAAAATAAGAATAGTACGAATGTAATTTTAAACACATGTATGAACAAAGTTAATAATTATAATGAAGAAAATATATTACAACTGAATATTAGCAATGAAGATTGCTTTAAATCATCGAAAAATTCAAAAAATAATGATTTAAATAATGATGTAGGTAAAACTTATATTACTATAAAAGAAAATTGCAATAAATCAGAAAAAAAAGAAAATTGTTTTAGTAAGGTAAATAGCAATAACTTTCATAATAATGATATATATGGAAATGACTATTATAATAATTGTAATAGTAACATTTTTACTTCTCCACATGAAAAAAATGAAAAACTACATAATAATTTAAGTTATGAAAAAAAGTATATGAATAATAATTTTTTGAACGATAGATATTTAAATTATATGGAAAGCGATTATAATGATAATTCATTTGATATATGTGAAATGAAGAATATAAAAAAGAATGACGAAACTAAAATTGAAAATAAGGAAGAATTAAAAGATTTTTCAAATGACTATTTATTATTTAAAAATAATGAAAATTCTTTTAATTATGATATCAACGATTATGTTTTACTGAATAAAAATTTTAAAAATTATAATGCATCAGGTGAAAGTAATGCAAAAGAAATGAAGACAGATTGTATGACAACTGATAGTACTATATATACGAATAATATTCTTAATCTACATAAAAATATAGAAGAAGAGAATGATGAAATCTATCAGAATTATAATTATTATGAAAATGATAATATTAATATAATGCAAAAAGAAATTGATGAGGAAAGTTTAAATAAAAAAATAAATATAGGTAGTAGGGAGAGT
ATTTTAAATGTAAATAGTTTTGAGAAAAATTATGATTTTGAAGAAAATTCACATATGTACAAGCATTTAAATTTTTCTGATAATTTAAATATGAACAAAAATTTATCATTTTTAAATTTTGATGATACACTTAATGAATGGAGGCGTAAGCAAAATAATGATAATTTTTTGAAAAAGGAAAATAATAACATGAACACATGTTCATTTTTTGAGAAATTAACTTTAAATGAAAATGAAAGCTTGGAAAATGGAAGAGAAAATAATGTTTCTATTTCAATGTATGATATGCAAGAAAATATAAATGAAAAAAATTGTTTTAAATGCACTATTGAAAACAGTGATCAATGCGATGATCGTATGAAGAAAAACATGCATAATATTATTATGCATAAGAATAACCTCAATAGGAATATAAATTTTGATGTTAGTGATTTTTGTAGAAATGCTAATAATATAAGCAATGATAATATAAATGCCAGCAATAATGATAATAGTTTATGTGATAAAAATATAAATAAATATGTTGATAATAATTATTTGAATAACCATGAATATAATAATAATAACAATAATTATAATCATGATAACGATGTAAATATCTCAAATAACGAAAATTCAATTAAAAATAATTCAAGTAATGCTAACAGTAATAATAATTTAAATAATAATACAGATAACATAAATTCAAATGGAAATGATCGTAATTCCTTTTTTATGAAAGAAAATGATTTTCCATATTTAAAATATAAAAATGAATATACCAAAAAATATATAGATGAAAATAATTTAATGTTTCACAATGAATTTGACACTTTCGATATAAAAGATAAGAAAAAGGGTTGTGAAAAAATGAAAAAGAATAATTATGATATGAAATGGATTAATAGTAATTTATCACCTAATAATAAAAATGAAATAAACAATGAAGTTATTTCCAATGTTAATAGTGGAGATTGTAATAATTATTATTTGATTTTAAATAATAAAGGGATATGTTATGATACTAATAGAAGTGATTTTCCAAATGATTGTGAGGAAAAGTTTGATGATAAAAAGAAGAAAAATAAACATAATTTAAATTATTGTAATATGAATAATAATAGTAGTAACAATAACATCAATGATAATAATAAGAATATTAATAATAACAATAACAACCAAAATAATAATAATATTAACAATAACAATAATAATAATAATAGCAATAATAATAATAATAGTAATAATAACGATAATAACAATAATAGTAATGATAATAATAATAATAAAAATGTTAATAATAACAATAACAACAATAATAATAGCAGTAATAATGATAATAGTAATAATAACGATAATAACAATAATAATAATGATAACGTTAATATGAGTAATAATAATAATATTAATATGAGTAATAGTAATAACAATGATAATAGTAACAATAACATTAATATAAATAATAATAATAATAATGATAATAGCATTAATAATAATAGTAGAAAAAAAAATGTAGAAATTGAAAATAATTTATATATGAATGACTTTAATATTGATCTACTGAGTTATAAAAATATTAAATTTGACAATTTTTCATATAAGGGTGATCTTATAAGTAATGAAAAATCTCCAAACAACTATTTAAAATTTTCTTCTAGTAATTTATTTAACAATGATTATAATGATTGTGAGAAAAATGCTTTTGGAAATGATGTATTTAATATTAAGGATAAGGAAAATAACAATTATGTTAATTATTCGAAACTAATGAATAAAGATAATAATTCAATTAGTAGATACTGTGATAACTCAAAGGAAGAAAATAATTTAAATATATGTTCTAGTGTGCTTAATGGAAATAATAATGATAAAATTAATTTGAAGTCTTCTAGATTTTTAAAAAGTAGCATTAATAATAATTCTTATTATTCAAATAACGAAAAAAAGGAAACTTATTGTTTGCCAATAACAAATAATATATTAGAACTTAATAAAAACATAAATTTAATAACAAATGAAAA
AGAAAAAGAAATCATTGATCCAGTTTTTTGTTTAAGTAAAAAAAGTTTTAAAAATAATTATTCTATGAATACAGAAAAATGTAGCAGCATTCATAATAATTTGAATGATATAAAGAATGATGAAATAATGTTTAATATTAATAACAAATACAATATGTATAACATAAATAATGAAAATAATATATACCATATAGATAATGAAGATAATATGTATAACTTGAATGATGAAAATGATATATATGATATGGATAATGAACAAAACATGTATGACAATATAGAAAATATGCACCCTACAGAAAATAACTGTGCGTATAATAAACTTAATAACTTAGAAAAAAATAATAAGAATTTATATCTTATGGAAAATGATTATATGTATAATAACATAGATAATGATATATACAATGATATGAATAACTTACAAAGTAATGAAAATATATGTGATAATAGAAATAACATAGAAAATAATTCAGATGTGTGTGGTAATATCGGAGAACATGGCAATGCATGTAACATGAATAGTATTGAAAACAATATGGATTTTATATTAGGTGAAAATGAGGAAGTGGAAAAAGAATCAAAAGGAAACGTGAATAATGATAAAATAAATGAACTTCAAAACATTATAAATAGTTTAAAATTTAAAAATAGACAATTGGAAAAGGAATTAACTGATATAAAGAATATGTATTTAAAAAAGAAGCAGTGTTTAATATTAAATAGTCTAAGTAATAAAAATGATGATATTAACAGTTATTCAACTTTTAAGGACGATACCAATAATTCTGACTGTGAAAGTGCAGTTCAATCAAGTAAATATATACAGAATTTTTTAAATGATAAAGAGAAGTATAATTATGATACAAAAATATCTATTCAAAAATTTCATTTAGCTTATACTAATAATTCAATTGGAAAATTAAAAATAGCAGCGCAAAGAGATATTAGTGGATCTTTTATGGGACCTAAAGGAATACATGTAAAAACAATAAAATCTTCTTTACATATTTCTGTTTATAAAAGTGCAAAAGATGTATGGTTTCCTGGATTTGCTGATAGTCATGTTTTTTTATTAAAAGGAAATATATTTGGAATTTTAAGAGCATGCCAGTTATTATATCATTATGTAAAATCGAAAATGTCTTCTTCGAAATGCTGCATTTACCTAGTTGCTCCATTTGAATGCGTGCAAAAATTATTAGCTGATGGTTGTAAGAGAATGGCTATTATAAAAGAAGAATGTGGAGCTGATGTAAGATTAGGAAATTTATATGTACAAGTTCATGAAGGTTTTACTGAAAGATTAATGGAAATAAGAGGAAACGAAGTTAGTGTTGATTGTGCTTTGGAAAAACTAGTTATTTTTATGCAATCATGTTTTTCTGTACAGTCATATGATTATGAACTGTTAAAATATCCATGTCGCTCAGTATTAAATTTACAATAA\n>HM928366.1 Uncultured Pseudomonas sp. 
clone GG5QJA201B0DXG 16S ribosomal RNA gene, partial sequence \nAGAGATGGATTGGTGCCTTCCGGGGACGTCTGACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCGTAACGAGCGCAACCCTTGTCCTTAGTTACCAGCACGTTATGGTGGGCACTCTAAGGAGACTGCCGGTGCAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGGCCTGGGCTACACACGTGCTACAATGGTCGGTACAAAGGGTTGCCAAGCCGCGAGGTGGAGCTAATCCCATAAAACCGATCGTAGTCCGGATCGCAGTCTGCAACTCGACTGCGTGAAGTCGGAATCGCTAGTAATCGTGAATCAGAATGTCACGGTGAATACGTTCCCGGGCCTT\n>XM_012845165.1 PREDICTED: Setaria italica wall-associated receptor kinase 5 (LOC105914170), mRNA \nATGGGAAGCTACAAATGCACGAACCAGCAGCACCAGCATCAAGCCATAGAAAGTATCATAACAAATTATACGCTTTCAGGTTTAAGCATCATTATAGGAGTTGGTAGCGCAGCAGGCTTTATACTTTTGGTTGTCATTATTGTCTTTATCACTCAAAGGTTTAAGCAGATGAGGGCAATGAAGCTAAAACAAAGAAACTTTGAGCAAAATCGTGGACAACTGTTACAACAGTTGATATCCCAAAGGACAGACATTGCGGAAAGGATGATCATAACATTGGATGAGCTTGCAAAGGCAACAAATAACTTTGACCCAGCCCGTGAGCTTGGTGGTGGAGGGCATGGTACTGTCTGCAAAGGGATTTTGTCGGACCTACATGTCGTAGCTATCAAGAAGTCAAATATAACAGTCCAAAAAGAAATAGATGAGTTCATAAATGAGGTCGCCATCCTCTCACAAATAAACCATAGGAATGTGGTAAAACTGTTTGGATGTTGCCTAGAAACTGAGGTGCCATTGTTGGTTTACGAGTTTATTTCCAATGGAACCCTTTATCACCATCTTCATATTTCAAGATCACTAGCATGGAACAACAGGTTAAGAATCGCAACTGAAACTGCTAATGCAATTGCCTATCTTCACTCATCAGTTTCAATCCCAATCATCCATAGAGATATCAAATCCAGTAACGTGCTCCTTGATGATACGTTGACATCAAAGGTGTCGGACTTTGGAGCTTCAAGGTACATTCCACTTGATAGAAGAGGGTTAACCACAGTTGTTCAGGGGATTATAGGATACTTGGATCCTATGTACTTTTACACAGGCCGCCTTACAGATAAAAGTGATGTTTATAGCTTTGGTGTTCTTCTTGTGGAATTGCTCGCTATAAAGAAACCATCATATTTGTCCTCTAACGGTGATGGTCTTATTGCCCATTTTTCTCGCATTAACTTACATGATGATGGCAACCTGGACCAAATACTAGATCCTCAAGTTATGGATGAGGGAGGCAAAGAAGTCGAAGAAGTGATTAAACTTGCAGTGTCATGCGTACGATTAAGGGCTGAGGACCGGCCAACCATGAGACAAGTGGACCTTACACTAGAAGGCCTTTTGTCATCTGAGAATCATGAGGAGAATAATACATTGGCAGAGGGATTTGAGGATATTGGTAATATGCAGATGGATTTTCCGTCGATTGATGAGGGGCAAAGCACGGGGGAGTCTAGTAAATGGCACAGTTTGGGACAGGATCCCTTGATGTTTTCTGGTTCTCGGTAG\n>XM_031547130.1 PREDICTED: Punica granatum sister chromatid cohesion protein SCC4 (LOC116212494), transcript variant X1, mRNA 
\nTTCCCCGAGTCCCCCATACACAAGAAGGAAGGGGGAAAAGAAGACGAGAGAAGAGAAGAGAAAAGAAAAGAAACTCTGGTCCTTGTTGCTGTTCTCAGTCTTCGCTCCTCAGGGTTGAGGGAGACGGTCGGTAAGGGACAACAAATCCGGTAAAGGACCTCCCCAGCAGTTGCAGAAAAGAGGTGAGACTTGCGGCAAGATAGTCCGGAGCACGAGGGCGTTGATCTGATTTAGAGTAGTCAGTGCAGCAGTTGGAGTAGGCTTGGTGCGGTGGGAGAGAGAGAGAGGAGAAATGAGAAGCTAAGCAGAAAATGGAAGAGGTGGCGGAGGGACTTTGGTCACTGGCGGATCACGAAGAGAAGAAGGGGGAAATCGGCAGGGCCATTAAGTGTTTGGAGGCGATATGCCAGAGCACGGTGTCGTTCCTGCCCATCATAGAGGTGAAGACGCGACTCCGCATCGCAACCCTGCTCCTCAAGCACACCCACAACGTGAATCAGGCCAAGTCTCACCTGGAGCGCTCCCACCTCCTCCTCAAGTCCATCCCTTCCTGCTTCGACCTCAAGTGTAGGGCCTTCAGCCTCCTCAGCCAGTGTTACCATCTCGTGGGCGCCATTTCTTCGCAGAAGCACATCCTGACCCGCGCACTCGACCTCATTGCTTCTGCTGCTGCCGCTGCCGCCGACCAGCTGGAAGTGAAGCTATGGGCTTGCAACTTCTACTCGCAGCTTGCCAATGCTCTCATAATTGAGGGCGACTATCAGAGCTCGATATCTGCGCTAGAGCATGGACGACTCTCTGCCACTGAGCTGCGCTATCCGGAGCTGGAGATGTTCTTCGTGACATCCACTCTTCATGTGCACCTGATGCAATGGGAGGACGAGAATGTGATTGCAAGTGCTGTCAGTAAATGCGATGAGGCCTGGGCCTCCATTCATCCTGAGAGAAGACCACAATGCCTTGGTTTGTTTTTCTACAATGAGCTGCTGCACATCTTCTATCGCCTGCGCATCTGTGACTACAAGAATGCTGCCCAGCATATCGACAGATTGGATGCGTCAATGAAGAATGAGTTGCAGCAGAGGCAGGAGCTTATGGAGGAACTCCAAGCTTTGAACCAGAGTCTCTCTAGCTCTGATCTGAGCCCCAGAGATAAATTGGCTCTGTCTGGAAAACAATCTCAGCTTCTAGAGCAGTTGAGAACAATGGCTGGTCAAGATTCTTTTGCACCAGGTAATAGTGGAACTGTCAAACAAGCATGGGGTGAGGGGCTTGAGTTGGCGCCATCCCCTATAAATGGAGAGTGGCTCCCTAGGAATGCTGTGTATGCACTTGTTGATCTTATGGTTGCCACTTTGGGACGTCCAAAAGGACTTTTTAAAGAATGCAGCAAAAGGATTCAATCTGGAATGCTTATCGTCCAAGAGGAGCTGATGAAGCTCGGTATAACAGACAATCTCAAAGAGGTGGATTTGCAACACTCTGCTATCTGGATGGCTGGTGTTTATCTAATGCTTCTTATGCAGTTCCTAGAAAACAAAGTGGCGGTGGAGCTTACACGATCTGAATTTGTTGGAGCACAAGAGGCTTTGGTGGAAATGAGAAAATGGTTCACTCGCTTTCCAACTATATTGCAGGCTTGTGAGAGCATTATTGAGATGCTTAGAGGTCAATATGCGCATTCTGTTGGCTGTTATAGTGAAGCTGCCTTTCATTACATTGAAGCAGCAAAGCTAACAGAGAGCAAATCTACGCGAGCAATCAGCCAGGTTTATGCAGCCATCTCTTACATTTGTATTGGTGATGCTGACTCATCTTCACTGGCACTTGATTTAATTGGGCCTATCTATAGAACAATAGATTCCTTTGTTGGAGTTCGCGAGAAGACTTGCATCCTTTTTGCTTATGGACTTTTGTTGATGAAACAACATGATCTACAGGAAGCAAGGAATCGGTTGGCCAGGGGCCTGCAGATGACACATGCACATCTGGGGAATC
TTCAACTTGTTGCACAATATTTGACTATTCTGGGAAGTTTAGCACTTGCCTTGCATGATACAGTGCAAGCCAGAGAAATCTTAAGATCTGCCCTTACCTTAGCAAAGAAGTTGTATGATATTCCAACACAGATTTGGGTATTGTCTGTCCTAACAGCCCTGTATCAAGAAGTAGGGGAAAAAGGAAATGAAATGGAGAATGCTGAATACCATAGGAAAAAGGCGGGTGATCTGCAGAAGAGACTTGCTGATGCTCATTCATCTATCCACCATATTGAACTGGTCGACAAAGTGAAAGTTGAAGCTATGCAATTCCAAGACCTTGATATGAAGCGTCTTCTTGGTGGTCCATCCATGAGGGCAAATCTTGACATTCCTGAATCTGTTGGTCTATCGGCTCCAGCCCCTAATACATATACTTCGAGGCTGGTGGACTTGGACTTGGATACAGGAAGACGCACAAAAAGAAAATATTAGTTGGAACTCTACTTTCTTTTCCTTCCACCTATATGGTGGAATGTTCATGGTCAAACTACATACGATATCAGCACTATCAACAACAATTTACCATGTTGTAATTCATGTAGGTATAGATAGATGTAATATCTAATTTGTGTATATGTAAATCTGCGAAACATGTTACTGGAATAGGCATTACAAGGTTCTTGGTTTCCGGTGCTAGGCTCTGCTAGCCGTATTGTTTTCAGTAACCTGACACGATTAGCGATCACAGTAAGTAGTTCAGTTTGA\n>XM_051656078.1 PREDICTED: Myxocyprinus asiaticus protein unc-13 homolog C-like (LOC127416634), mRNA \nTCCTCCAAGGGCTTCTCGTACTCTCTCTCAGCACACACACTTCCTGTGCATCCAGACAAGGAGCTTTCACCCGTTCCAGACACACTGTCTGCTGCCCAGCGTAGTGCTACGAATTTTGTCTGGAAGAGACAGGCAAAGAGGAGGGATATTACCCAGGATCTCTCCATGATTTGCAACAGCATGTGCCTGCCGAACAAGACTTCAGCCCAAGGTTGATCCGAGCACAACCGCTGCAGCACGAAACTAGGGAGAGATGGATCATATAGAGGGGAGGACATGGAACTGAGTCTGACATCTAGAGGCTTGTGAAAGGATGCTCGGTGCTCCACAACAGGACATTTAAGAGTTTAGTTGACTGTTCTGGAGCTCCGGTGCTGTAGTAAATGGATTTGGTGTGCTGTAGGAGTAGGCTGTGATTGAGAGATATGAAATTTCTTCAGAAGTGCGCATAGCATGTGCAATGATTTTTGCTTGGCACAATTGTCTCTGAGGACATCAACTCTTCTCTAGACCCTCTTATACCACAGAGTTAACTTTCAAAACTAGTAAGCTTTTGCGTGCTTCCTGTTAAGCACCTCTGGATCAAAGACCAGTTTTGCTTTGCCGCATCTAGAGTGCAAAACTGCTGAAATATCGCCATCCATGGTTTCTGCTCATTTCAAGAAGCTATCGTCTTACATTGTAAAGATTTGCAAAGGAATGTTTACAAAGAAACTGGCAAATACCTCAAAGAAGAAAGAAAGCAGCGACAACAAAAAAGAGCCGAAAACCTTCCCAGAACTGCATGCACGGAACCCAACGTTCTCAACTACATTGAAAAGCACAGTCAAAAAAATATCCAAATGCTCATCAACACGCAATATATCTCTTGAAGAGGAGGATGGAAAAAACGACTGTTCCTCTCTCTCTCCGACATTTAGTTATCGTGTAGCAATTGCCAATGGACTACTCAAAAATGACCTCTTACTAAACAATAATGAATTTCATGAGGTCTTGTCAGTTGACAGCGATTACTCAGACTGTCTAAACGAGACCAAACTTGTCCATAGATTCGATGAACAAAAAGCTTATACAATGCCAGTAAGAAGGAATAGGAAGAGCTTGATTAGTCTAGCACCCTCAGACGGCAGCTCAGAGGGAGAGCGG
GGAGAGCGCAGCAGTCTCCACACCCTTCGATTAGGTGCTCTGAAAAAGTTGAGGAAATGGAAGAAGAGCCAAGAATGTGTGTCCTCAGATTCAGAGGCAAGCAACTGGAGAAAGACTCTTGGCATCAGGAGCAAATCTCTGGACAGGGCTGGACGGCAACAGAAAACCACTACCCTGGAGCCAGGGTCCAGCTCAACAGGGTGTATCAGTCAGACTCAGGATGTGATGGAGATGATCTTCAAAGAACTTCAGGGAATCAGTCAGATTGAGTCTGAGCTCTCAGAACTGCGAGGGCATGTTAACGCCCTCAAAAGCTCCATCGACGAGATCTCCAGCAGTGTAGAGGTGGTACAGAGTGAAATCGAGCAGCTGCGTTCGGGATTCGTACAGTCCAGACGTGAGACTCGAGACATCCACGATTACATCAGACAGATTAGCCAACATACCAACAAAGCTACTCTAAGATTTCTAAATGTGCCTGAGGAGAAGTTTGAAAAAACCGAAGAGCTTATTTATCAGATTCTGAAAGAGAAAATGGGTTTCACTGATGCACGCAAGACATTTAAAATTGAACTTGCCCATCGACTAGGGCAACAAAGAGAATGTTACAATGCTAAACCTCGACCAATTGTAGTTATATTTTCAAGCCCACAAGATAGAAATTTAGTTTTGAAAAAATGTTATAAGCTAAAAGGGACTGGCATATCAATATCAACTGATAGTCTAGCACATGATTCAAAAGAAAGGAAGGACAAGGCAATGGCCTCCTCGCAGACATATGAAAGCATGGATATCAAGGTTTCAGCCAAAGATAAGGCTGAAAGTGATGAATGGGACTCCATGGAAAGTGACAAAGAGCTAGATGAATTAAATAAGAACAAATATGCAATTGTGTCCAAACCACCTCAAAAAAGTAAATCGGACAAGAAAAAGTCTCACAATCACCGACGGTTGGCTGATGACACTGCATATTCTGTGCACTATGCAGATAATATAGCCTACGATGACCCTGACAAGCAAAGCAAGTCTTACTACTCTGACCTAACACCTGGGTGGCAGTCTCAGAGTGATTATTCTACTCCCAAACTCAGTCGGTCTGAATCGGACTGTTCTAAACTTTGCCAGTCTTATTCAGAGGACTTCTCAGAGAGTCAGTACTTCAACAGAGTCAACGGCTGCTCCCTGCTCTCCTCCTCGGATCAGGAGCTTTGGCAAAGGAAGCAAGAAGACATGGCATCCTCCTGGTATGCTAGTCCTCCCAGTCAAACTCTGAGCCAAGAACGACCTTATGTGGAACATAATGAAGTTGACACCACAGAGACTATTGACAGTGGTGTAAGTAATGGTATTGTTTGCATATCAGGGGACAGGAGCCATTACAGTGGCTCTCAGCTGTCTCTACAGGGTGACCTCTCACCATGGAAAGATTGGCATCACCTCGAACAAGGTGCTGATTCAGGTTTGGATGCTTCAATTGAACAGAACATAATCTCAGAGATCACTAGCCCCTTCGACCCTGCAGCTAACCCAGGTTTCCCTGAGAAAATTACAAAATGCCTTGAGGTTGATTTACAGTTTGAAGGTGAGACCTTCTTGACACTAGATAGCACTCCTGAGACAGGCCAAGACCAAGATATAGATACAGAACCTGAACTTGTTCTAGAACCCGATCCAGAGCCAGAGCTAGAGCCAGAACAAGTACCCAGGCCAGGACCTGAACCAGAGCCAGAGGTTGTAATTGAACCCATATCAAAACCAGTACCAACACCTGTGGCCGAACCACAACCAGAAAAGAAGCCGAAAACCAAGAAAGCCCGTACTAAGCCTGAATCAGCTCCTCAAACTCTGCAACGACAAGATGTCAATGTGAACCACCTCCAACAGAACCAGAAATCTTCATCCATGTACCGCAGTCAGAGTGAGATCGGTAATGAGAAAGTGGAGGAAGTCCCTAAATCCTGGAGTAGTAGGCTCAGCATAGACCTCAGCGAGAAAACCTT
CAGCTTTGGATTCGGATCCACCCTGCAAAGAGCCAAGTCAGCTTTGGATTTTGTCTGGAATAAAGGTTCCCAGAGCACTAGTGCTCCAGTCGAAGAAACAAGCAACACCTCATTCATGGGCAGGCTCAGAACCTCGTCCCAGTCCACTGAAAATAGTTCCAGCACAACCATTGACTCTGATGTTTACACAGAACCTTTCTATTACAAGGCAGAGGAGGAAGAACAAGCCAGTGAACAACCTGTGGACAATGAGACACATTATGTTGAGGTAATGGAACAAGTGCTGGCGAATCTCGAGAACCGAACGAATACCAACGAGGCTGAGGAACAGTACCAAGAAGAGGAATATGATGTCTCGCAAGAATACGACATCTCACAAGAGGGTAATCCTGTCCTAGAATACGACTGCAGCCTTGATGAGCAAGATGATGAGGAATACAGTGAGGCGTATGACGACAATCCCATGACTGAAGACACGGCGGAGTATGAAGGGAGTTTGGTGGAGTATGTTGAAGTAACTGAGGAACAGGAAGAAGAATCTGAGGAACAGGAAGAGGAAATAGAGCAGACAAAGGAAGGTCAAGATACAACGGGAACAAAGGTAGCAGCTGAGGTAAAAAAGACAGTAGAACAAGAGGATGAGAATAAAAATGTTACAGAGGTTCCTGTGGAGCCAGCACCACCCAAAAAAAGGATACGGCCCACCTTCAAAGAGGCAGCTCTGAGAGCTTACAGGAAGCAGATGGCAGAGCTAGAACAGCAAATCCTGGCGGGAGACAGCACAGCTCTGGATACAGAGGGTTGTGCAAATATTCTGGATCAAGCCAAACTGGGGCTGAACGGTGGTGGAGTTGGCAGTATACTTTATGGCATTGACAGCATGCCAGATTTACGCCGCAAGAGGACCATGCCTATTGTCCGAGACCTGGCTTTGACCTTGGCTGCTCGAAAGGCAGGCATTGCGTTTGGCCTCGTGAACAGATCAACTCTAAACAATGAGGAGCTGAAACTGCATGTGCTGAGAAAGACCCTGCAGGCCTTGATCTATCCCATCTCCTCCACGACACCCCATAATTTTGAGGTGTGGACGGCAACTGCGCCCACCTACTGTCACGAGTGTGAAGGGCTGCTGTGGGGCATCGCCCGGCAGGGCATGCGCTGCACGGAATGTGGGGTGAAATGCCACGAGAAATGCCAAGACCTTCTGAATGCAGACTGTCTTCAACGTGCGGTGGAGAAGAGCTCAAAACACGGAGCAGAGGACAAAACCCAAAACATCATTATGGCAATGAAGGAACGGATGAAGATCAGAGAAAAGAACCGACCTGAGGTGTTCGAGTTGATCCAGGAGATGTTTCAGCTCTCAAAGGAAGATTTGACCACCCATCTGAAAACAGCCAAACAGGCAGTGTTGGAGGGGACATCCAAATGGTCTGCCAAGATTACCATCACAGTGTTGTGCGCTCAAGGTTTACAAGCCAAGGACAAGACAGGCTCCAGTGACCCTTATGTCACAGTACAAGTTGGAAAGACTAAACGCAGGACCAAAACTGTTTTTGGCAATCTCAACCCCATCTGGGATGAAAAGTTCTTCTTCGAGTGCCATAATGCCACAGATCGTATAAAGGTCCGCGTATGGGATGAAGATGATGACATAAAATCTAGAGTGAAGCAGCACTTTAAGAAGGAATCTGATGACTTCCTGGGTCAAACCATCATCGAGGTGCGGATGCTAAGTGGAGAGATGGACGTTTGGTACAATCTTGAGAAAAGAACAGATAAGTCGATGGTGTCGGGGGCCATCCGACTAAAGATCAGCGTTGAGATGAAAGGAGAGGAGAAGGTGGCTCCACCACACGGGCAGTACACATGTTTACACGAGAATCTCTTCCATTATCTGACGGAGGTGAAAAACAATGGAGTGGTTAAGATTCCAGAGGTCAAAGGTGACGATGCGTGGAAGGTTTATTTTGATGACGTGTCTCAGGAGATCGTAGATG
AGTTTGCGATGCGTTTTGGTGTGGAGTCCATCTACCAGGCCATGACTCATTTCTCATGTCTCTCATCGAAGTACATGTGTCCCGGTGTTCCCGCAGTGATGAGTAACCTGCTTGCCAACATAAATGCTTATTTCGCTCACACTACCACGGCAACCACCAACATCTCCGCCTCCGATCGATTCGCTGCATCCAACTTTGGGAGAGAGAAGTTTGTTAAACTCTTGGATCAGCTGCACAACTCTTTGAGGATCGATCTCTCCAAGTATCGAGATAACTTCCCAGCAGGAAATCCAGAGAGACTCCAAGACCTGAAATCAACCGTCGACCTGCTAACGAGCATCACCTTTTTCAGGATGAAGGTGCAGGAGCTGCAGAATCCTCCCAGAGCCAGTATGGTTGTAAAAGACTGCGTGAAAGCATGTCTGGACTCCACTTACAAGTACATCTTTGACAACTGCCATGAGCTTTACAACCAACTTCTGGACCAGGCTAAGAAGCAGGATTTACCACGAGAGGAACAGGGCCCGTCCATCAAGAACCTGGATTTCTGGCCCAAACTGATCACGCTGATGGTGTCTGTTATAGATGAGGACAGAACAGCTTACACACCCATTATTAACCAGTTCCCTCAAGAATTGAACATGGGTAAAATTAGTGCTGAAATCATGTGGAACCTCTTCGCTATGGATATGAAGTACGCAATGGAGGAACACAACAAGCATTGTCTATGCAAGAGCACAGAATATATGAATTTGCACTTCAAAGTCAAATGGTTCCACAACGAGTATGTTCGAGACCTGCCAGCCTTTAAAGGAATTCCTCCGGAATATTCCCTGTGGTTTGAGCCGTTTGTTATTCAGTGGTTGGATGAAAATGAAGATGTAGCCATGGATTTCCTTAATGGAGCTCTGGAGAGAGATAAAAAAGATGGGTTCCAGCAAACATCAGAACATGCTCTCTTCTCCTGCTCGGTGGTGGATGTTTTCACACAGTTGAATCAAAGCTTTGAGATCATAAAGAAGCTAGAATGTCCAAATCCACAAGCCCTCGCTCACTTCATGCACAGATTCGCAAAGACCATAAATAAAGTCCTTCTCCAGTATGCGGCGATCATCTCGAAAGACTTCACCAACCATCTGAGCAAGGAGAAAGTGGCCTGTATCCTCCTGAACAACATTCAACAGCTCAGAGTCCAACTGGAGAAGATGTTTGAGTCTATGGGCGGAAAACAGCTGGACGCTGAAGCCAGTGATCTACTGAAAGAACTGCAGAATAAACTGAACACAGTGCTGGACGAGCTCAGCGGGGTCTTCGGCTCCAGTTTTAAGCCGGTCATTGAGGACTGCATCAAACAAATGAACCAGGAGCTTGTGCAGATAAAAGGAAATGCTGGAAACAAGAGCAACGCAGCCATGGACGCAGAAATTGCCCTGCGACCACTCATGGACCTCCTGGACAAGAACTTGATTCTGTTTGCTAAGATCTGCGAGAAGACGGTTCTCAAACGTGTTCTGAAGGAGCTGTGGAAAATCGTCCTCAACACCATTGAGCGACAGATCGTTCTGCCTCCGCTGTCAGATCAGACACAAGGAGCTCAGATGATCTTCAGTGCTGCCAAGGACTTGGGTCAACTCTCCAAGCTTAAGGAGCATGTGATTAGGGAGGAAGCTCGGAGTCTGAGCCCTCGGCAGTGTGCTGCCATGGATTTAGTGCTGCCAACCATCAAGCAATATTTCCATGCGGGGGGAAACGGTTTGAAGAAGAATTTCCTGGAAAAGAGTCCTGATCTGAAGTCCCTGAAATACGCCCTCAGCCTTTACACTCAACCCACAGATGCCTTGATCAAGAAATATATATGCACCCAGACCTCTCAAGGTCTGTCAACGTCTGGATCCATTGGTGAGGTCACTGTCCAGGTGGACCTGATCTCACACCCTGGTACTGGAGAACACAAAGTCAGTGTGAAAGTTGTAGGTGTGAACAACATAAACTGGCAGACG
AATGTCATGTTCCGGCCATTTGTGGAGATCAACGCCATCGGACCACACCTAGCTGACAAGAAACGCAAGTTTAGCACCAAAACCAGGAATAACAACTGGTCTCCAAAATACAACGAATCATTCCAGTACGTGCTGAGTAACGAGCATGGCCCAGAGGCCTACGAGCTTCACATCTCCGTGAAGGACTACTGCTTCGCCCGAGAGGACCGTATCATCGGAATGACGGTTCTGCAGCTCAGAGAACTGGCTGAAAAAGGCAGTTTGAATGCAAGCTATCCACTCGTCAAGAACATAACCATGGACGAAACCGGTCTGACCATCATGAGAATACTCTCACAAAGGACCAACGACGAAGTGGCCAAAGAGTTTGTACGTCTTAAATCGGACACACGGTCAGCCGAGGAGGTGTCGTAAAAATAATCGCAGGGGGAAAAGAGCGGGGAAAAAAGCGGCAAGAAACAGAGTGAAATCCCAACAGCGCAAGATGGTTGTGTTTGTTTTTGTGCATGTGTGTGTAAAACATCTGTTGGAATGTTCATTTTAAACTACAAGTACGTACAAAAGTGTTTACCTACCGTATGCTCTATCAAATATTATATGCTACGAAGTTATGTTCAAGAGACGTTGAATACAGTTTTGTATGACGATTAGTCTTTTTGAACAGATAGTTAATTTGTTCAGATAAAGTGCCAAAACAGATGACAGAAAACAGAGGGAAAAAAAAACAATAGACACATAAACCCATATGAATTCTCGACGAAGTCTTTCTAAATTTGCTCGATCTTTTGTCCAGTGTTTATCATCCTCTCTTTAAGTGTGTAGCGGTTTTGTTTGTCTTTTCATTCTCACCCTACTTTTTCCGTTTTTGTTGCCTCGCCCTTTCCATCTTTCACAAAGGCACTTGGTGGTGCATGTGTTGTTTCCTTGGTGACGTCTCTCCCATGTGTTCACAGTGACTGTGGGCGTCAGGTCGAACCCTTTCCCCTCTAATGTTTTGTATTTTGAGCCGACTTTAAAAAGAGACCATTTTTTTAAATGGCGATGACTGCTACGAATCTCTTCATAAGTGTTTGTAATTTTATAGCTGTTGACAACGATGAAACCCACCTTCCGTCTTGCCGGTATAGGCAGAATGGGTGGAATTTTTTTTTTTTTTTTTTTTTCATATTTCTTGTTCATTTACATACTTTTTTTTTTTTTTTTTTTTTTTTTAAACATAGGCTTCCAGCCTTTCTGAATAATCACTGTGAACATGGGCTCTGGAAGGCAAGCGTACATCAGTTTTGCTGACTGTTTGATATCATCTTTTAATTTTTTCAAACAACTTTGATTCAAAAAATAAATAAATAAAAAAATGGCAGTTATATATAAAAAAAACTTTCATACAAAAGCAATCCATGATCTGTATGAAAATCAGTATATACTATGTACACGTGTTACATATGTACATGAATTATGTTTTTAGTTTTGCTAAATCATATCTGATTGTTTATGGGCCGGTTCTGAATTTAATTTGGGATGATCTTTGTGAAGTTGTTTTATCTGATATGAAATTTGTAAATGTTGCTTTACAAAAAAAGGTAAATCAATCGCCGTCATTTCATTTATTTTTGTTTACAGAGGAAAAAGTTTAACATTTGGTATTTATGCAACATTCCTATGTATTGCACTGATGGCAAATTGTATGTCATGTAAATATATTTAGTGAGATATTGTAATGAAAGTCTCGTTGTATTGCATTTTAATCAAGGAAAGCAACCTTTTCACACATTACACTTTTATAGTATGTATTAGTGTTGGATGTAATGCAATTACAAAATAATTAGTTACTATAATCTAATTACATTTTTAGTCAAAAAAGTTATGTAACATTACATTTAAAATTGTTTTAATCATATTACAGTTGCTAAATTTCAATTAAGTTCTAAAGACATTACTTAGGTAACACATATTGCTAAAAACATTTACACGGAATGAATTTAAAGGAATATTCTGGGTTC
ACTACAAGTGAAAGGTGCACTTAGTAACCTTTGTCTTTGTGTCTTTGTCTTGGACTTACACTGACACCTAGTGGTGTGGATGCAGCATCGTTTAAAATCAGTAGTTTTCAGTTTCAGATGCCATTGTAGAAATTTAGTATTCACAGTCAGCCATGATTACTTTAATCAATGAGTGAAAGTGTCATATTACAGGATGGTTACTGAGATTAAGCGAGTAGCATTCGGCTGGTCATGTGATACTAACATGGCAGCCCCCATGTGCGGACCCTCTCCATGTAGAATAAAACAGCTTTTATAAGCTTACTGATATAACTTGAGTCTCCATTTTAATGTGAGTGGTCATGATTTCCTACATATATTGCACAATTACAATTCATGTCTTTAGGAATTAAACTTTTTAATGAGGAAAAAATTACTGAGTGCACCTTTAAGCTCAATCAACAGCATTTGTAGCATA\n>XR_003260173.1 PREDICTED: Dromaius novaehollandiae ADAM metallopeptidase with thrombospondin type 1 motif 6 (ADAMTS6), transcript variant X8, misc_RNA \nCGAGGCTGCCAAGGCTCCCTGCTGCCGCCGCGCTCGGCTTGGCCGGGGGCCGGCAGCGAGAGGAGGTCTGGGGCTACTTCAACCAAACTTTCCTGAGTCCTTCCTGCTCTGCCTGCCTGTCTTCCCTTTCCCCCTTTCTCTCGCTCGCTCGCTCTCTCTCTCGCTCCCCCCCCTTCCTCCCCCCCAACTCAGATGATATTCACATGGTATTTTGCACAGAGGAGGCTGTTCAAGAGGAGGGCACCCACCCCCACCCCAATATAAGCCTGTTTTTCCTTCCTTCCTTCCCCCCCTTTTTTGTTGGAAAGACAAAATGTGCAGGGTGATAGGTTGGGTGAATTGATGGCATCCCTCCTCCTGCCAAGTCAGTCCGTTTTCTAAAACCCCCTTTTAGGAAGGCTAGAGAATTTTATTCTGTTGGAGAATATAACCCTGATGGTTGCTTGCACAGAGGGGAAAAGCAGAGAGGAATACGGGAATCGTCCTGTGCAATCTCTATTGTTTGAAACTTACTTTATATCAGAAATTGAAGATGAAAACGGGAAAGAAATGGAGAAAATTCACTAACTGCCAAGTCTAACGTCTTACAGATAACTTAAGGAATTTTACAAATGCTTATTTTTGCGTTGAGAAAATGACTGCTGATATAGAAGAAAGTATAGGTTGTTGGAAAAGAATACCTGTCAAAAAGTGGAACGTCCAATAGTTAATTTGGGAGTAATATAAATGTACTTGTTATGGTGCGATTCTGGAGTGGAGTTAACTCTATAGCACACAGGTAGCCCTCCAAGGAGAAGAAAAAAAAGCTTTCAGTTTTTCTAAATTATGGAAGTTTTTTGGAAGACGTGGACATGGATTTTGAGCCTAGTCGTTGTTTCATCGGAATTTCACAGTGACAGCAGGCTTTTGTATAGTTCTCAAGAGGAATTCCTGTCTTACCTTGAACACTACCAGCTAACAATCCCAATAAGGGTTGATCAGAATGGAGCCTTCCTCAGCTTTACTGTGAAAAATGCTAAACCCTCAAGGAGGAGGAGGAGCACAGACCCTTATGATCAAGAACTGGCAGCATCTAAATTATTTTTTAAACTTTCTGCCTATGGCAAGCACTTTCATTTAAACCTGACTCTCAACACAGATTTGGTATCCAGACATTTTACAGTAGAATACTGGGGGAAAGATGGACCTCAATGGAAGCACGATTTTTTAGACCACTGTCATTACACAGGATATTTGCAAGACCAACATAGTACAACTAAAGTGGCCTTAAGCAACTGCAATGGTCTGCATGGAGTTATTGCTACAGAAGATGAAGATTATTTTATAGAGCCTTTGAGGAATGTAACAAAAAATTCCAGTAACTTCAGTTATGAAAATGGTCATCCTC
ACGTTATTTACAAAAAGTCTACCATGCGCCAGCAGCATCTCTATGATCATGGTCGCTGTGGAGTCTCAGAAGACCTCACAAGAAGCAGTAAGCCTTGGTGGATGAGTGATGCATCTGCTTTTCCAACTTCACTTCCAGTCAATGACACATTAAGTAGTCACAGTCGGCAGAAGAGATCAGTAAGCCTTGAACGGTTTGTGGAGACGCTGGTAGTAGCAGACAAAATGATGGTGGGATACCACGGTCGCAAAGACATTGAGCATTACATTTTGAGTGTAATGAATATTGTTGCCAAACTTTATCGTGATTCCAGTCTAGGAAACGTTGTGAATATTATAGTGACTCGTTTAATTGTCCTCACTGAAGATCAGCCAAACTTGGAGATAAACCACCATGCAGACAAGTCCCTCGATAGCTTCTGTAAGTGGCAGAAATCCATTCTCTCCCACCAAAGTGATGGAAACACCATTCCAGAAAATGGGATTGCCCACCATGATAATGCGGTTCTTATTACTAGGTACGATATCTGCACTTACAAAAACAAGCCTTGCGGAACACTGGGCTTGGCCTCTGTGGCTGGAATGTGTGAGCCTGAAAGGAGCTGCAGCATTAATGAAGACATTGGCCTAGGTTCAGCTTTTACCATTGCACATGAGATTGGTCACAATTTTGGTATGAATCATGATGGAATTGGAAATTCCTGTGGGACCAAAGGTCATGAAGCAGCAAAGCTAATGGCAGCTCATATTACAGCAAACACCAACCCTTTCTCTTGGTCAGCCTGCAGTCGGGATTACATCACCAGTTTTTTGGATTCAGGCCGTGGTACTTGCCTTGATAATGAGCCTCCCAAGCGTGACTTTCTTTATCCAGCTGTGGCCCCAGGTCAGGTGTATGATGCTGATGAACAGTGTCGCTTCCAGTATGGAGCAACATCCCGCCAATGTAAATATGGGGAAGTGTGTAGAGAGCTCTGGTGCCTCAGCAAAAGTAACCGCTGTGTTACCAACAGCATTCCAGCAGCTGAAGGTACTCTTTGCCAAACAGGGAGCATAGAAAAGGGGTGGTGTTATCAGGGAGAGTGCGTACCTTTTGGCACTTGGCCCCAGAGCATAGATGGGGGTTGGGGTCCATGGTCAATATGGGGAGAGTGCAGCAGGACCTGCGGGGGAGGAGTCTCCTCGTCTATAAGACACTGTGACAGTCCAGCGCCTTCAGGAGGAGGAAAATATTGCCTTGGAGAAAGGAAACGGTATCGCTCCTGTAATACTGATCCGTGTCCTTCAGGGGCCCGCGATTTTCGAGAAAAACAATGTGCAGACTTTGATAATATGCCTTTCCGAGGAAAGTACTATAACTGGAAACCCTACACTGGAGGTGGGGTTAAACCATGTGCATTAAACTGCTTGGCTGAAGGTTATAATTTTTACACTGAACGTGCTCCTGCAGTAATAGATGGGACTCAGTGCAATGCTGATTCACTGGATATCTGTATAAATGGAGAATGCAAGCATGTAGGTTGTGATAACATTTTGGGGTCTGATGCAAAGGAAGATAGATGTCGTGTTTGTGGAGGAGATGGGAGTACATGTGAAGCCATTGAAGGTTTCTTCAATGATTCATTGCCCAGAGGAGGCTATATGGAAGTGATTCAAATTCCAAGAGGTTCTGTGCACATTGAAATAAAAGAAGTGGCAATGTCGAAGAACTACATTGCTTTAAAATCTGAAGAGGATGACTACTATATTAATGGTGCCTGGACTATTGACTGGCCAAGAAAGTTTGATGTTGCTGGAACAGCTTTCCATTACAAGAGACCAACAGATGAACCTGAGTCTTTGGAAGCCCTAGGCCCTACATCAGAAAATCTCATAGTCATGATTCTGCTACAGGAACAAAATTTGGGTATAAGGTATAAATTCAATGTTCCCATCTCTCGCACTGGCAGTGGAGACAATGAAGTTGGCTTTGCATGGAATCATCTGCCTTGGTCAGAATGT
TCTGCCACTTGTGCTGGAGTGGCCACCAATGCAATTCTTTACCTCTGGCTGGGAGAGCAGGACAGTTGGCTTCCTTCAAAGCCAACACCATTGCTGCTGCATGGACTGGTGTGCAGAAACAAGAGGTGGTGTGTAAAAGGCTGGATGACAACTCCATTGTGCAGAACAATTACTGTGATCCAGACAGTAAGCCTCCAGAAAACCAAAGAGCCTGCAACACTGAGCCTTGTCCACCTGAATGGTTTATAGGAGATTGGTCAGAATGCAGTAAGACCTGTGATGGAGGAGTGCGTTCACGAACAGTTCTCTGTATCAGAAAGATTGGACCTTCTGAGGAAGAGACACTGGAAAATACCAACTGTCTAACGCACCGGCCTATTGAAAAGGAGCCCTGTAACAATCAGTCCTGTCCCCCCCAGTGGGTTGCTTTGGACTGGTCAGAATGCACGCCAAAGTGTGGTCCAGGATTTAAGCACCGAATTGTTCTGTGCAAAAGCAGCGATCTTCTAAAAACTTTTCCAGCTGCTCAATGCCAAGAAGAAAGCAAACCTCCAGTCCGCATCCGCTGTAGTTTAGGTCGATGTCCTCCTCCTCGCTGGGTTACTGGAGACTGGGGACAGTGTTCTGCACAGTGTGGTCTTGGGCAACAGATGCGAACAGTACAGTGCCTCTCATATACCGGACAAGCATCCAGTGAGTGTCCAGAAACACTTAGACCTCCATCAATGCAACAGTGTGAAAGCAAATGTGACAGTACTCCCATTTCCAACACAGAAG\n>XM_009065832.1 Lottia gigantea hypothetical protein partial mRNA \nTTTCACCAATGGTTTTCTAATTTCCATGGTTATGCCAGTATTATAGTGTGTATATTTGGCATCAGCACCAATATATTCAATATATCTGTTTTAACACGAAAAGATATGAGAACTCCTACCAACATCTTGCTGACGTGGTTAGCTGTGGCTGACATTTTAACGATGGTGCCATACATTCCGTTTGCCATTCACTTTTATTGTCCGAATACATCACCATTCGAGACTCCTGAGAAATACACGTATAATTGGATACTTTATATGATCTTCGTAGTCAATAGTGCCGCTACAACTCACACTATTTCTAATTGGTTGGGTGTTTCATTATCAGTGTTCCGCTTTATGCAGATGAGATCAACGAGTCGAGGCGTTCTAGCCAAACAACGTCGCTTAAAACATGTGAAGGTAATAACCGTGGTTGTGTACATTTTCTCAATCATTGTTCTAATTCCCAACTATCTGACTAACAAAATCCAATCAGTTCAAGGCCCGCGTAATACGACCATATATGGATTAAAAGACATGACACCGAAAGATCCCAGCACCGACAAAATGGCTTTGATAAATACTTTACTTTATGCAGTGGTGGCTAAAATTGTACCGTGCCTTTTAATGTCTATATTTAGTGTGTCTTTAGTATATACAATACATTACAAAAATCGACATCGCATGCGCAGGCTTGTGGCTGCTGGGAAAAAATCGAGGGCCATCTCTAAACAAACAACTACAACCCGAATGTTACTAGTTGTTATAGTCTTGTTTCTTATTACCGAACTTCCACAAGGCATTCTTATTCTCGTTACAGCTGCCATCCCTCAGTTTCATAACAACGTATATAACCTTCTGGGTGATCTAATGGATTTTATTGCCTTATTAAATAACGCAATCAATTTTGTGCTTTATTGTAGTATGAGCCAGCAATTTCGCTCCCGGTTCATTGAAATGTAC\n>KU027247.1 Uncultured microorganism clone SZY.L801.1_Tag26405 16S ribosomal RNA gene, partial sequence 
\nCAGCCGCCGCGGTAATACGTAGGGGGCGAGCGTTACCCGGATTCACTGGGCGTAAAGCGGGTGTAGGCGGCTCGGTAAGTCGGGTGTGAAATCCCACAGCTCAACTGTGGAATTGCGCCCGAAACTGCTGAGCTTGGGGCCGGTAGAGGGAGACGGAACTGCCGGTGTAGGGGTGAAATCCGGAGATATCGGCAGGAACGCCGGTGGGGAAGCCGGTCTCCTGGGCCGCGCCCGACGCTGAGACCCGAAAGCTAGGGGAGCAAACCGGATTAGATACCCGGGTAGTCCTAGCCGTAAACGATGCCCACTAGGTGTGGGGGATTAATTCCTCCGTGCTGGAGCTAACGCGTTAAGTGGGCCGCCTGGGGAGTACGCCCGCAAGGGTGAAACTTAAAGGAATTGGCGGG\n>XM_042244958.1 PREDICTED: Ovis aries caspase 8 (CASP8), transcript variant X4, mRNA \nAAAAGTAAACTTCTTCCTGGAGGCGTTTCCAACCCCACCTCCTGTCTCCCCCTCCCGCTTGCCTCATTTCCAGGGATTTATCTCCAGCTGGGTTTTAAGAACGAGCCTCAGTAATACGAAGTGTGAAGTTAGGCAGTGTGGGGTCTTGTCGTCGAGAGTTTGGTGGCTGGGATGTTGCCAGGACTGTGTGGAGCAGGTCCCAGTCCATGGTGAGGGCCCTGGGATTTTATTTTTCCTTTGATGTACTGAGAGAAGAGGCCCGTGAAGTGGCTGCTGCTGTGAAGGTTCCAGGATTCGCCTCTGGTAACAACTACATTCTCCTAACACTTGAAAAGCATGGATCTCACCCAATGTCTCTATAAAATTGGAGAGCAGCTGGGCAGTGACGACCTGGCTGCCCTCAAGTTCCTAAGCCGGGACCACATCCCATATAGGAAGCAGGAACCCATTAAGGATGCCTTGATGCTATTCCAGAGGCTCCAAGAAAAGAGAATGTTGGAGGAAAGCAATCTGTCCTTCTTGAAGGAGCTGCTTTTCCAAGTGAATAGACTGGATCTGCTGCTTAACTACTTGGACACCAGCGAGGAAGAGATGAAGAGGGAGCTTCAGATACCTGGCAGGGCCCAGATCTCTGCCTACAGGATCCTGCTTTTCCAGATTTCAGAAGATGTGAACAAAGTGGAATTGAAGGACTTTAAGTTTTTTTTGAGCCAGGAGATTGCCAAATGTAAGCTGGATGATGACATGACTTTGCTTGATATTTTCGTGGAGATGGAGAAGAGGACCATCCTAGGGGAAAATAACTTGGACACCCTGAAAAGAATCTGTGAGCAGGTCAACAAGAGCTTGCTGAAGAAAATCTATGATTATGAAGAATTAAGAAAAGATATGTCACAATCGCTTCCAGAGGAGGGCTCCTCTGAGATGCTGGCCATGTCAGACTCTCCAGGAGAACAGGGCAGTGAGTTGCAGACATCCGACACAGTTTACCGAATGACAAGCAAACCTCGGGGATACTGTTTGATCTTTAACAATTATGATTTTAGCATAGCACGGGAGCAGGTGCCCGAACTTCACAGCCTTAAGGATAGGAATGGAACACACTTGGATGCAGAGGCTTTGGACAAGACCTTTCGTGAACTTCATTTTGAGATAGTGCACTACAGAGACCAAACAGCAAAGGGAATCTGTGAGGTTCTGAAATCCTACCAGAAGAAGGACCACAAAACCAAAGACTGCTTCATCTGCTGCATCCTTACCCATGGAAACAAGGGCACCATCTATGGCTCCGATGGGCAAGAAGCCCCCATCTATGAGCTGACCTCCTACTTCACTGGATCAAAATGCCCTTCCCTTGTCGGCAAACCCAAAATCTTTTTTATTCAGGCTTGTCAAGGGGATAAGTACCAGAGAGGAATAGCTGTTGAGACCGACTCAGAACAGAGGGAAGCCTATTTAGAAGCGGATTCGTCACCTCAGAAGAGATATATCCCAGATGAGGC
TGACTTTCTGCTGGGGATGGCCACTGTGAACAACTGTGTTTCCTACCGAAGCATCGTGAAGGGGACCTGGTATATCCAATCGCTTTGTCAGAACCTGAGAGAAAGATGTCCTAGGGGTGAAGACATTCTGACCATCCTAACCAAGGTGAACTTCGAAGTAAGCAAAAAGGATGACAAGCAAAACATGGGCAAACAGATGCCGCAACCTACTTTCACACTGCGAAAAAAACTCTTCTTTCCTCTTAATTGATGCTATTGTTTAGTTGTATAACTAGACAATAGTTATGCAACTGAACAATAGTTAAAATGCTGCTACTTTATTCTCTTTCTTCTTCTTTTTATTTTCAAATAGCTGGCATATCATGAGAGTCAGGACAACATAATTTTTATGCAAATTCAAGCCTAAATCTCTGGCTTTGTAGACAATAACAGTCATAGCTGTGGTCTTGATTTCAATTGTATTTTTAATTTGATGAAAAGGTTTAAAAATGAACTAAAATAAACACAAAAAACACAGTAAGTTTAAAAGAAATATCAAAGATCATGGAGGGAGATTTTTGTGATCTGACCTAGCTGAAAAATCCCCTCGACTATTGAGGTTCAGGGTATAAAGTTCCCACATCCAGCCTGATTGCTACTGATGTGTATGATAAGCTGTCCTGGAAACATGTGACCCTCCTCTCCTTAGCCATGAGCAGACTCTGATTTTCAGTGGTGAAAACCACCACTCTTTAGACTTCAGTTTCAAAAGCTTAGAGATTATTTTCCTTTTTTAAAAGAATTATTCATAAATGCGGCATTCAACATACTTTTAAGAGAAATGATGTTAATATTAACTCGTTTTATACTTCCAGTAGATCTTTTCCCAAGCTGTCCTTTATACTAATTTGCAATATTTTGTAAAATAAAAAAATTTTAAAATTCATATATTAAAGATTTTAAAAATACCAAATGATTTTGTTTTTTAAAGACTCTTTCCAAACTGAAAAGTTTTTATATACATGCTTCTGCAGTGCTGAACATGATTTGCTTTTTTACTAAAAATGCAGTATGCCTTTTATATGTTTGCTCTTTCTTTATATGTTCAATTCACTTTAAATCTTTAGTAATTAATAATTAGTAATGTAATAAATATTTTTAACAGAATAAAATATAATTTTATCATA\n>XM_012896071.1 Acytostelium subglobosum LB1 hypothetical protein partial mRNA 
\nATGGACCCTCAACAACCTACACAACAACAACAACAACAGAATGGTGGTGGCGGTGGTGATACATTGTCAGCAGCAGTGGCAGAGTTGGATAAGCTAGAGTCATTGTTGGCCAGTGGTTATCTGTCACGTCCATTCTCTGTGGATGTGTCAAAACAACAGCAACAGACGAACAAGTCGACGACGAACGAACCAGCAGCAAAGCAGACACCTGCACCTACACAAGCAGCTCCTTCAAAGCAACAACAGCAGACTTCATTGCAGACTGCACAGCTTACACAATTGCTTCAATCACAAGTGCAGGCACATCAACATCAACAAGCAGCAGCAGCAGCAGCAGCAACAGCACAGGTACCACCTGCAGCAGCAGTAGCAGCAGCAGCACAAGCTCCACCTGCTGCTGTGACTCAGCCACAACCTCAAGCGCCACAGCCACAGGCTACAATTCAGATTGCAACTCAGGCTCAGGTGGCCCCAACACAATCGCAACAACCTCAGACGCCACAGCCACAGGCAGCCAAGCCACAGGCCACTCAGGTTCAGGTGGCCCCAACACAAGAGTCACAGCCACAGGCAGCCAAGCCACATCCCACCCAGACACCAGCACCCCAGACACAGGCTCCTAAGCCACAGGCCATCCAACCTCAGGCTTCACAAACACAAGCACCTCAGCCTCAGGTGCCACAACCACAGGCTGCACCGGCACAGGTGACTCAGTCGTCTGTGACACCTAAGCCTCAGGCTGCTCCTGCTACACAACCCCAGCCACAACAAACTAAACAGGCAGCTCAGCAACAGAAGAAACAGGCGCAACCAAAACAGAATGATGTCAAGGACACATCACAGGTTCCGAAGACACAGCCTCAACCTCAACCTCAGGCGCAAGCTACTCCACAGGTAGCACAGCCTCAGACACAACCTCAGTCACAGCCCCAAACAAAGCCTCAGACTAAGCCTCAGAATAAGACTCAGACCAAGCCTCAAGCACAAACAAAGCCACAATCTCAAACTCAGCCACAGACGACACAGCCTCAGCCACAGGCTCAGGCTCAGCCACAGACAACACAACCCCAACCTCAGGCTCAGCAACAGACGACACCACCTCAAACACCACCTCAGGACAATTTGGAAGAAGATGTACAACGATATGATGATGACGATAACAACAACAACAACAACAATAGCAAGGAGTTGGAACTTTTGCAAGAGTTGGAAGAGATGGAAGCAGAAGTAATGATGCTGAGGCGAAAGGAATATCTCTCAATGTCAGGCGACATGAAACGCAACGAATCACTGCTGTTCCTCGAGCGCAAGGGTTTGGTCAAGGAGATCAGTGCCAAGTTCCAGACACCCGACACAGCCTCCTTCACCAAGTTCAATCCCAACACACATCTCTCCATCAAGGAGAGAATCCTGCACTTGAAGCGAGAGAATGAGCGCAGGAGCAAAGAGGTCGAGGCCATCAGACGAGAGACTGTCATCCAGCTCGCAGACGAGGACGAGACATCGACGATGGACTCGCCAACAAGCAGTCTTAGGGAGAGAATATACAAGTCTGTGTCCGAGCCACTCGCGCCACAGGACCCAAAGAAGACATCGCCAGCCGATGGCCACAAGTCGACACAGGTGGCCACCTCAAAGTCCCGCGCTGCTGACCCCGTGTCACCATTGCTGTTGTCAACAACATCAACACCAGTCACCAAGCCCAGCGGCAAGGGTAGCAAGATCATCATTCGTAGACGAAGGAATGCTGCGGCAGCAGCGTCCCATGATCAGATGAGCATGATGGCGCTCACACATTATCTCAACATCCCGCCCAACCCTGCCAAGCCACCAATCACATCCAACACAGCCAGCCTAACACAGCCGACCAAGGACTTTATCAAGACGCTAGTGTCGCTGTCCGACACTGGCAATGATATCATCCTGGACACTTCGCTGCCCACGCCCAACAGCTCACCGGACGCAGGCACCGCTCCCGATATTCAGTACACGCAACTG
CGTACCCGCGCCATGAAGGCAGCTTTCAACGTGCTCTTCACACTGCCCAATCAAACATCGGTGATCATGCCATGTCAGAACACTGACACTATCGAGGCCATCAAGGAAAGGCTTGTGCAGTACATGTTGAAGGCATTTTGTACTACTACTACTACCACCCCGGCCACATCAGATGCGGCCAATGGCGAATCATCAGAGACAGACGAGTCGGCCTCCAATCCCGCCACACCACCCTCCCCTCCCATCAAGATCATGCCCGAGAACTATGTAATTGTTGACTACTTCAACAAGCCTCTCGAGAAGTCAATGACCTTGACCAAGAGCGAATATATAATGCACAGGAGATCACGTGGATTGCAGCCAAAGCTGAAGTTGGTTGAGAAGGTCAACTTCTACGACGCCGATCCTTCAACGGAACTCAGTGAACAGTCATACGAGATCATCAAACAGATTATACCCAATGTCAAGAGTTGGCATGGAGAAGAAGTGGACTACTTCAGACGCATCGCTGCACGTCTGCGTTACGAACTGTTGCCACACATCAAGGGAACTGTTCACTCATCGCTCACTGAACGTCTGTCCCCACTGCCACTTCCAACGCCTCCCAACAACAACAAGTTCCTCGTCTCCATCTTCCTTCCCATCCTCCAAGTCACCAGAACTGTTGAGATTGAGATTAACGAGATAGCAGATGATGTAATCGCAAGGATATTCAATAGGAACTATGCCAAGCATTTGCCACCACAGGTTAGTGCAGGAGACTTCATTCTCAAGGTGATGGGACGATCAGAGTACATTCATGGCACACACAAGATAACTGTCTACGAGTACATCCGATCATGTCTGGTACAGAGCAAGAAGATACAACTCGTCTACGTTCAAAGACCAACCATTGAGATGGACATTGCACCATTCAAGCCAAGATTCAATCTATCCAAAGAGTTGCCAATCAAACATGAGGTTGGAGCACTGTCTCATCGCGCACTGCCTTGGGATCATATGAATCACATCTCTGTTCGAGACATCAAGCGACCATTTAGGATCAAGGTGGGCGGCGCCTACAACATCCCAACGAGCTATCTGAGCAAGGAGGACGAGAGCATATCGGTGATCGTGTCAATCTCTTTGTATCATGGTGTCGAGTGCATATCGACCTCGTCCACCAAGCTTCAGAACATACTCCCGCCATCATTCTATGCCACGCCACCCGCATCGCTCAACGCCACGTGGAATGAGAACGTGACCTTCTCCAACTTGGACTATGCCAACCTGCCAATGGAAACACGTCTCTGCATTAGTCTTTACGCGAGCACTTCGTTCAAGACTCCCACATCGCCCACTGCCGCCTCATCCAACACCGAGCTCGACCAACAGCGCAAGGAGTCCTTCCCGATCGGATGGGTCAACGTCATGCTCTGTGACTACAAGTCGCAACTGCGCACGGGCCCAATGACCCTGCATCTGTGGCCGGATGATGTGGCCAATCCCCTGGCGCCCTGCTCCAGCAATCGCCAGAGCGGTGTCGCGCTGTTCATCGAGTTTGAGCAGTTTGCGCTGCCGGTGGTGTTCCCCTCGTGCAACAACCGCGTTACAAGCACCCGTCCCCACACCATCAACCCCAAGGACATGGTTGAGTTCTTTGAATCGATCATCAAGCTCGACCCGCTCAGCGACCTACCCAAGGAGAAGTACCAGCATCTGTGGGCGTTGCGACACTACGCCACCCAGTATCCTCAGCTACTACCGCGTCTCATGCTCAGTGTACCCTGGACACAGCCATCGGCTGTGGACGAGATCCACGCACTGATCGACAAGTGGGCCATCCTGAATCCCTACGATGCACTGGAACTCCTGGATGCCAAACACGTCGATCGCAAGGTGCGCGAGTACGCCGTGCGCTGTCTCGAGTCGCTCTCTGAGGAGGGCCTGCAAGATATCCTGTTGCAGTTGGTCCAGGTGCTCAAATGCGAACCCTACCACGACTCCCCATTGGCACGCTT
CCTCCTTCGTCGCTCTATACTCAACCGCACGACAGGACATCACTTCTTCTGGTATCTCAAGTCCGACTTGCACGTCACCAACATTGCCGAGCGCTTTGGACTCTTGCTAGAGTCCTACCTCCTCGCTTGTGGCACGCACCGCAATGAGATACAGCGACAGATACAGGTCATCGACAGCCTGACCGAGGTGGCCAGGAAGATCAAGTCGCTGAAGGATCAAGATCGTCGCGAGACACTAATGCGCGACCTCGAGCGCATCGAGTGGCCCAAGCGCTTCCAGATCACACTGAATCCTAAGTTCGAGTCGAATGGTCTCATCATCCAAAAGTCCAAGTACATGGACTCCAAGAAGCTGCCGCTGCGGCTCTCATTCACAAACATCGACATGGATGCCGAGCCAATCGATGTGATATTCAAGGTGGGCGATGATCTGCGCCAGGACATGCTCACACTCCAGATGATCCGTCTGATGGACAAGCTCTGGCAGAAGGAGGGTCTGGATCTCAAGCTGTCGCCATACGGTTGCATTGCCACGGGTGATATGATTGGAATGATCGAGGTGGTGCTCAACTCTGAGACCACGGCCAAGATCCAAAAGAGTGCTGGTGGTGCCACTGCCGCCTTCAAGCTGGATCCACTCGCCAACTGGCTACTCAATCACAACAAGACCGAACAAGAGTATCAAAAGGCTGTGGACACATTCATTCTCTCCTGCGCTGGCTACTGTGTTGCCACCTATGTATTGGGCATTGGAGATCGTCACAATGACAATCTGATGTGCACAAAGCTTGGTAGACTATTCCACATTGACTTTGGACACTTCTTGGGCAACTACAAGAAGAAGTTTGGATTCAAACGAGAGAGAGCACCATTTGTATTCACGCCAGACTTTTGTTATGTGATGGGAGGCAAGGAGAGCCCCAAGTTTGCCCAGTTTGTAAACTACTGCTGCACGGCCTACAACATATTGCGTCGTCACGCCAAGTTGTTCATGAACCTCTTTGCAATGATGGTGTCCACTGGCATACCAGAGTTGCAATCGATGGAGGATCTCAACTACCTTCGCGAATCATTCTCACTGGAGCTCACAGACGACAAGGCCAGGGAGAAGTTCACATCACTCATACATGAGTCATTGACAACAAAGACCACACAGCTAAACAACGCAATACACATTCTGGCGCATTAA\n>XM_013042216.1 Blastocystis hominis mRNA 
\nGGAGAACACCGCTCCTCAGACACGCGAAGAAATGTTGGCCGCTCTGAAGAAACAGATTGAATATTACTTCTCTAAAGAAAATCTATCGAAAGACTCTTATCTCCTTTCCCTCATGGATGATTCTGGCTATGTTCCTTTAAAGACAATTTCGCGTTTTCACAAGGTCCTTTCTCTTAGCAGCAATATTGACGATATTATGGAAGCCCTAAAGAGCTCTGAGAACGTCGTGGTGGACGAAGTTAGCAAACAAATCAAGCCTGCGATTACTTTTGAACGTAAAACAGTCATTCTGCGTGACGTCCCGGCCGAGGTTACCGAGGAAGAGGTCCGCGCCTTGTTCGACGGAATGGGCGTTGTCGAAAGTGCCACTAAAGAGTTTGAAGGCACGTGGTTCGTCGTGATGGAGTCGGAGGCGGCCGCCGTCGCGGCGCTGGAGCTGCTTCGCCAGCGTTCTCTCCACGACCAGCCCGTGAAAGCTCGTCTGAAGAACGAGTCGTACCTGAAGAACCTCGTGAAGATGCTGACGACCTCCGAGGACGGCATTCCCGCCGAATATCTCCCGGTGGACCAGTCGTACTTCATGAACTTCGGCGGCCAGCCCCTTCTGGACTTCCAGCAGAGCCAAATGTTCGGCCAGAACTTCGCCGTCCAGGCGCCGGCGACCGGCGTGCCCGCCGAGAAGCGCGGCCGGAAGGGCCGGAAGGAGTTCAAGCATCGCGAGCGTCGTCCGCGAGCCGTTTCGAAGCCGAAAGTGGTGCCTGCGCTGCAGAGCGCGGAGATTTTCCCGCCGCTGGTGCCGACGACCGCTCCGGTGGTGGGGTCGATCGACGTGAAGTACTCGTACAAGGAGATCTGCGACATCGTGAAGGGCGTGAAGGATCTGTCGTGCCCGCCGATCGCGTCGGCAGGCGTGGAGTCGGCGCTGGTGGAGACGGCCAACCAGGAGTTGGTGCAGAAGGGACGAACGTTCAGTATCGACCAGGCGCTGCAGCGAGGATGTCCGCGAACGATGTCGGTGGACAGCATCGACTACACGTCCATGCTGCAGGGAGAGATGGACGAGGCGGTCGCGGAGTCGGCTCGCAAGGCGCGGCGCGAGAAGAAGCGCGCGATGAAGATGGGCGAGCGAGGCGAGGCGCATGCTCGCAGCTACCGCAACATTCTCAAGAATTCCCCGCCCGTGGGTGAGGCGGTCGCTCCTTCGACGAAGCCTGCCGCTGTGCAGACAGTGAGTGGAGCCAATGCGGCTAATGCGGCTAATGCGGCTAATGTGGCTAATGCGACTAATGCTGCCAGCACTACCACTGGTGCCAATGCTGTGAGTCCTGTAAGTGGCACGAACGGAGCGGAGGGAAAGAAGGAAGGGAAGCAGCATACAAAGAAGTCGCAGAAAAAGGCGGCAGAAAAGAAGGCAGCGGAGAAGAAAGCAGCGGAGAAGGTGAAGAATGAGGAGGACGGATGGAAGACGATTACGGAGAAGAAGCATTAGAGACACTCATTGTTTATTCTTTTAATGTGTGGAAGAGTT\n>XM_001589778.1 Sclerotinia sclerotiorum 1980 UF-70 hypothetical protein partial mRNA 
\nATGAGTAATCTCCTCTGGAAATATTACCTCGAAGATGACGTCGATAAATTTCGACGCCTACTGGCAAATACTGCCTATTCATCGCAGCATACACTGAAAAGTCATGGTGGAGGAGGGCCGGCATTCTCCAGCAGCTTTGGGAACAAAATAGGGAGTTCAGGCGGATTTGGAACATCACCAAAGACTTTCGGCAAGAACCGCAAAACACCCGGTCCAGCTGGAAACTCAAATGGGAATAAAGGACAGGGAAATGCGATCAGCAAGGCAGAATTGAATAGCAGAGATTATGCTGGGTTAACTGTCTTACACCGAGCTGCATCTTCGACATCTACGAATGCAATAATCTTTGCGACCTCTCTTATCGAACATCCTTCCATCGACCTCTATATACAAGATACGGAAAGTGGGTGGACAGCGTTGCATAGGGCTTTATATTTCGGCAACGTCACAATTGCTCGAGCAATTATCGAGCGAGACTCGAAGGATCGCGCCGCTGGAAATACAGGAGCTAAGCCGGACTCTTCGGTTATCAAGGTCAAGGATAGGGAGGGAAACACCCCATTTGATGTATACAATGCAACTATCGCAAGGCGATCTCTGCTAGACCGAGGAGAGCAGGGAGTACCTCACCGTTCAGATGATGATTCTGATGAGGAGTTATTCGATTCACCGTCGAGCGAATCGTCAAAGTTCAAAAGTATCGATGGTGACGAACTTTATGCATTTGGTAGTAACAAGAACTTTTCATTGGGTTTCGGTGATCAGGATGATCGTCAGTATCCGGAGAAGATAACGCTTAAACGTCCTGACCATTTACTCTTTCGATTTTATCAAGAATACTTGGACTCTGTCTATGATCATAACCCTATTGGAAACCCAAAAATGCCCAAGACAGTATCTGAACTTCCTTCCATGATTCAAAATAAGCCCATCATCATACAAGATGTTGCTCTGTCCAAACTTAGTAGCGCTGTATTAACTACGGATCCGGAATCAAACCTTTACATGTGTGGCTTTGGCCCTGGAGGTAGATTAGGCATGGGGGATGAAACCACTCGTTTCAATTACGTGCCAGTAGATCAAGGCGGTTTGGCAGGAAAGAAGGTCGTAACTGTTGCTTTAGGTCAAAATCATACGCTTGCAGTCTCGTCGGAAGGAGAGATTTTCAGTTGGGGTACAAATACTTGGGGTCAATTAGGCTACAATCTACCTCGACCTGCGCTGAAGGATGAAGAACCACTTTGTACAACCCCGCGCCAGATATTTGGACCTCTGAAAAGAGAAATCATTATTGGCATAGCTGCATCTGCTATTCATTCAGTGGCCCACACGTCTACCTCATTGTTTTGCTGGGGAAAGAATGAGGGACAATTGGGTCTTATGGACTCTGACTCACGATCTTTGGAAGCTCAACCAATACCTCGCAGAGTTGCCGCATCTTTATTCAAGTCATCAATTGTAAAAGTTTCGGCCATTAGTGGTGCAACTATATGCCTCTTGGCAAACCATACAGTCTGTGTTTTCACGAATTATGGTTACAACATGGTCAAGTTTCCGTTGTATGAGGGCTTCACAAACTATCATTTACAAAGTACCTCGCTCACGACTCGATATGACTCAGAGTCAAATAATATCACTACTATTGAGTCTGGCGGAGATACAATTGCGGCTATATCTGGTAGAGGTGACTTGTTTACCTTCAATGTAAGGAAAATTGATACAAAAGTTGCGGCGGCTTCTACAACGAATCCCTCCAAAATTAAAGATGCTTTATCACAGCCGCAGCGAGTCTGGTCACTTCGCAAGGGTAATTGGGATGGAATAAAATCTGTTGGTGTCGCCGAGAATGGGTCCGTGATAGTTTGTACTCAGGCTGGAGCGGTTTGGCGACGCATCAAAAGAGCTAAGAATAAGGATGCTTTCACTGGGATCAGTGGTTACGACCGGAAGGATTTCAAATTTCAGCGGATCCCGGGACTTACTAAAGTAGCTGCTGTC
AGAAGCAATCCTTTTGGTGTGTTTGCGGCCATCCGTAAGGACTGTGATGTGACCAGGACTCAAGTTGCAGTTGAAGATAAGACATTGTGGGATGATATTGCACCTTTGCTAAGTATCCGAGATCTTGTAGCTTCGGAGCATCCAGTAGAACAGGCGGGAAGTCTAGTAAACCCTCGCCTGGCAAATTTGGACATCGAATATGGCCCTGTCCTCGCGGCACTGATCATGTCTCCGGACATCGAGGAAGATGTCCAAGGCTTGCTCATGGGAGTGGATTCTGAGAGTGGTGGTTATGATGTTGAGATATGTTCCAGTACATCTGACATCGCAATACCTGTCCATGGCTTTATGCTGGCAGCTAGATCATCTGTCTTGAGATCACTTCTTGCCGACTCTCATGCCAACGGAACCACTTCACTGTCTAATATCCTCAACATTGAAAATAGTACGGGTGGTAAAAAGAGAATTATCTTTAACGGCATAGATTTTATCACCCTTGTCAATTTCGCTATCTTTCTCTACATTGACAAAATTGCTGATGTTTGGGCCTTCGCGAATTATCTCCCGAATATGGCCTTCAGACTGAGGCAGGTTAGGATTGAAATCATGAAGCTTGGTTCTCATTTAAATATTCCCTACCTAACTCAACCTGGACTTGTCAGAAGGCCCTCAGACAAATTGAACTCTGACATGGACAACGCTATTACAGACGAGAAATTCTTCGATAATTGTGATGCTATTGTTGAGTTGGATGGAGGAGAGATGCCTATTCACAGTGTGCTTGCATGTCAAAGATGTCCTTTCTTCGATGGTCTATTTAATGGTCGATCGGGAGGTCAATGGCTTGCTGGTAGACGCGCAAAAATCACAGATCCGATCAGCATCGATTTGAAGCATATTTCGCCTGATACCTTCGAACTGGTATTGCGTTATATATATGCGGATGTTGGACCTGAGCTTTTTGATGATATCGTCTCCACTAATATTGATGAGTTCTCGGAAATAGTTATGGACGTCATGAGTGTTGCGAATGAGTTGATGATTGATAGATTGTCTCAGATCTGTCAACAAGTGTTGGGTCGTTTTGTCAATACTCGAAACGTATGCAATATCATCAATGCCGTGGCACCTTGCTCAATCACCGAACTTAAAGACGCCGGCCTTGAGTATATGTGCTTGCAGCTGGAGTCAATGCTTGAGAATCGTTTACTTGATGATCTTGATGAGGACCTTCTCCTTGAATTAGATGAAGTCGTGCGTGACAATCAATTGAATTGTCTTCCATTCGCCAAAAGTGGACGAGCTGATCTAGATTTGCACGAGAAATATCCTGAATTGGCGGGGGACATTGATGAGGAAAGACGTCGCAGACTTGGAGATATGATCTTCCGTGCTCATCTAAGAGATGATGATAATCGAATATCTTCATCTTTCAAGGCACGTATGGGGAGTCTTGATGATTATTTACCCTCTCCAAGTAATGATAAAGCTAGGAGGAAATCAAGGGTGGTCAAGAACGAACCATTTAGCCCAAGTGTACGTCCTAAGGATGCAGCGGCTGATTTCATGTTTGATATGGATGACGATGAAGAGCCTGGTAGTCCACCTGAACTGAACTTGACTAACGACCTAACTTCTGCTTCCCCTGGTGGTCCAGTAACTCCAAGGTTCCCTACAACTGGTTCGACGCCTAAGGTTTTCGAGTCAGGATCTCCTACGGACTTTCGAAATTCTGTCGGATTAGGAATCAATCACAATCCAGACACCCCTCAAACTGGAAATAAAACTTGGTCTTCTCCTAATCTTTTAGTCAAGCTGGACATGAAAGATATTATGGCCCAAGCATCAACGAACCGTACTTCGAATTTATCAATGAGTCTCTCAGCTCAAAAGGCCAAGGATGAAGCGAATGCCAAATCATCTACCCCAAAACTTTCACAGAAAGAACGTAAGAAGCAACAGGCAGCTCTTCAACAAGCAATTGCACAAACTCCTGTGAA
CAAGGGTAAAGACAAGGCATCTTCTCCTTGGCAAATTGCAGGTGTGGGTTCAAAAACGAACCTCAAGGATATTCTTGATAAGGATAACAAATCTTCACCATCATCCTTAGCACCAAACCCAACAACCTCACCAGCTATCTCACCTTCAAGTACTACTTCAACTATACGTCGAGTCACGGCGCCAGATACTCGATTTGCTGGTCAAAAAAGGAATGATAATAACAGCATCACGAAAGCACAAAGATCTTCACCTGGTCCATCAAGGCCAAGCTTGTTAACACCAAGCAAATCGTCTCCACTTATTCCTCATTCGAAATCATATACAGCGCCAGCAGCGAAAGCCGAACCGTCACTACAGTTATCCATGGCTGATATCATAGGAATGCAACAAAGAGAGCAAGAAGTGATTAAAGAAGCAGTTGCAAAGCGAAGTCTTCAAGAAATTCAAGAAGAACAAGCATTCCAAGAATGGTGGGATCAAGAGAGTAAAAGGGCTCAAGAGGAAGAAGCTTTGAGGGCAAAGGCTTCTACTGGAGTTAGTAGAGGTGGTGGTAAGTCTGGTGGTGGTAGAGGAAAGGGTGGACCGAGAGGGAGAGGTGGAAGGGGAAGAGGTGGTGGGGAATCTGTTAGGGGTGGTGGTGGCGGAGGAAGGGGAAGAGGAAAATCTCAGGAAAAAAGTACTGGCGCGAATTAA\n>XM_051905607.1 PREDICTED: Ctenopharyngodon idella intraflagellar transport 88 homolog (LOC127518647), transcript variant X2, mRNA \nATAATTCGTTGGATTTTATCCCAGACGTTTATACGTATATTTAGAAATGTAATGTTAAAAGACAATATATAAAGACACGAACATAATCAATGTAATATCGAAACATTGTAAAATCTCTCTTGTGTGCCTAATGGCAACCCCTCTTTGTATCCTAGCAACCGATGTGTTGCTCAGCTTAGTTAGCGAGCTGTAGGTGCTGCTAGGCTACAGACACTATTTTTCGGAATATTTCAGCTTAATACGGCCATTAATTTGCATTTTTCTTAGATGGAGAACGTGCATCTTGTTCCAGAGGAAGAGGAGGATGATTTGTATACAGGCTACAATGATTACAATCCGACTTTTGACTCAGAGGACCTTCACAACGATGTGGGCTTTCAGCAGGCTGTCAGGACAAGTCATGGCAGAAGACCACCAATGACTGCAAAATATCCTGGCACTGCTATTGGAGGGCGACCGATTGGAACAGCTTATGGGTCTCGGATTCCTGTTGGCACTGCAATGGGAAGGCCTATGACTGGAGCTGTTCAGGACGGTGCGGCTCGTCCCATGACTGCAGTGCGGGCAGCAGGATACTCTTCATCTATAGCTAGAGGCTCGGTGTTTGATCCACTGGGACAAGCAAAAGGACCAGCCCCTCCATTAGAGAGACAGAACGAAGACACGCCAGAGGAAAAGATAAAGATCCTGGAAAAGAAGGTGAATGATTTGATAGAGGAGAGCTGTCTCGCTCATGCTCGTGGGGATCTTCAGCTGTCTCTAGAGAAAGCCAAAGAGGCGGGCAGGAAGGAAAGGGCTCTGGTGAGACAGAGAGAACAAACAGGCACTGCAGACCACATCAATCTGGATCTGACCTACTCTGTGTTGTTTAATTTAGCAAACCAATATGCCAATAATGACATGTACACTGAGGCCTTGAACACATACCAAGTCATTGTGAAGAACAAAATGTTCAATAATGCTGGACGATTGAAAGTTAACATGGCAAATATCTATTTCAAGCAAAAGAATTACACAAAAGCAATCAAATTTTACCGCATGGCTTTGGATCAGATCTCAAATGCCCACAATGCAATGAGGATCAAGATCATGCAGAACATTGGTGTTGTGTTCATACATATGGGCCAGTACTCAGATGCCATCACATCCTTTGAGTACATCATGAGTGAGA
GTCCCAACATAAAGACAGGCTTCAACCTCATCCTGTGCTACTATGCCATCGGAGACCGTGAAAGGATGAAGAAAGCTTTTCAGAAGCTCATTTGTGTGCCCCTCGATATTGATGATGAAGACAAGTATATCCCTGCAAATGATGACTCTCATGCAAACATGGTGATTGAGGCTATAAAGAATGATAAGCTTCACCAAATGGAAAGGGAGAGGAAAGCATTAGCAGAAAAATACATTATGACCTCAGCCAAGCTTATTGCTCCAGCCATTGAGTCGTCATTTGCAGCTGGGTTTGACTGGTGTGTGGACATGGTGAAGGGTTCACAATATGTGGAGCTTGCAAATGACTTGGAGATCAATAAAGCTATTACATACTTAAGACAGAGGGACTTCAAACAGGCAGTGGAGACGCTAAAGATGTTTGAGAAGAAGGACAGTCGGGTAAAAAGTGCCGCTGCCACTAATCTATCTTTTCTCTACTTTTTGGAAAAAGATTATGACCAGGCTGACCGCTATGCTGAGCTGGCCATGAGCGCTGACCGCTATAACCCTGCTGCCCTCATTAACAAAGGCAACACAGTGTTTGTGAAAGAGGACTATGAGAAAGCAGCAGAGTTTTACAAGGAGGCTCTTCGTAATGACTCGTCCTGTACTGAAGCCCTCTATAACTTAGGTTTGACCTATAAGAGGCTGGGTAGGCTGGAGGAAGCCCTGGACTGCTTCCTCAAACTGCACGCTATCCTCAGAAACAGTGCTCAGGTCATGTACCAGCTGGCTAATCTATATGAGATGTTGGAAGACCCTCATCAGGCCATTGAGTGGCTGATGCAGCTCACCAGTGTGACCCCCACAGATGCCCAGGTGCTGGCCAAACTGGGAGACCTCTATGACAATGAAGGAGACAAATCTCAGGCCTTCCAGTACTATTATGAGTCGTACAGGTATTTTCCCTCAAACATTAGTGTGATTGAATGGTTGGGAGCATATTACATTGACACCCAGTTCTGTGAGAAAGCTATTCAGTACTTTGAGAGAGCTACCCTCATTCAACCAACACAGGTCAAGTGGCAGCTGATGGTGGCTAGCTGTTACAGGAGAAGTGGGAATTATCAGAAGGCACTTGAGACCTATAAGGACATTCATCGGAAATTTCCTGAAAATGTTGAATGTCTACGCTTCCTGGTCAGGCTGTGCACTGATATGGGACTAAAAGAGGTGCAGGATTATGCCACCAAACTGAAGAAAGTTGAAAAAATGAAGGAGATCAGAGAGCAGAGGGTGAGATCTGGGAGAGAGAGCAGTGCTCGAGGTCGCAGGGAAGGCAGCGCTGGCAGTGACAGTGGACAAAGCAACCATGGCACCAGCGCCAAGGGTGAGAGGCTTAGCGTTAAACTGAAAACTCTTCCCGGGTCCAATGAACCGTATGAGGCCAGCACTCAGCAGGAAATAGATGCTTCTTATGTCGATCCATTGGGGCCTCAAATGCAGAGACCAAAAACAGCAGCGAGGAAACGCACAGAGGAAGATGAGTTTGCTGATGAAGAGCTGGGAGATGACTTACTGCCTGAGTGACGTGTGCAACAGAGATCAGTTCAGAGGAAAGTCTGATATATGTCCAGACACTACATTTCTTTGAATTTCAAGCTCAACCAATAGCACTGTAGATTAAAAATACTTCATTGTTACTTCATTAAATTCTTCATTATGCTTTACTATATTTTATAATAGCAATGTATTGTACTTGCATTTAGGGAAAAATGAATTCTGTGCAATAATTTTTTCTTTCTTTCTGTATGACAGCATAAGACCTAGATAACATAAAGCTGAAATATAGTTGTTTTGTGTGAAATATTAAAGCCCAGTTTTATAGA\n>XM_045586159.1 PREDICTED: Pipistrellus kuhlii protein SLFN14 (LOC118726237), transcript variant X2, mRNA 
\nAAAAATAGAGCTTTGAAATGAAATTGACCAGGATAGGAGGTGCTTGTATGATGTATGGAAATGACACGCAATCCCTTAGAGGTGAGCAGTGTAACTGGCTCTCATTTGAAAACGCCTGAATCTTCCCTTACTACCTAATTCACTCCAGAAGCCAAACTGCAGCCTTCGAATCTGCCCTGTCATAGGCTTTTCTTGAGTCCTTATCAGTCTTCCTCAGTGGGTCAATGTTATGAAGTCTGGGAGAGTCTGGCAGGGCTCCTGCTCCTCCCAGGCTGATATCAAAGAGCCACAGGACTGTGACAGAAAGCAAACATTCAGACCAAAGCCAGATGTGGAACTGAAACAACAAGAAGAGAAGCAAACGTATCAGCACACAGGGGCTGCTGAGATGGAAAGTCTCCAGACCAGTACGGAAATGCTCTATCCTGAGATAATTGTGGACGTGGGCACAGTGACTTTTGGAGAAGAGAACAGGAAGAACATGACCAATAATCAGTTGAAAAGGAATGAGAATTCTAAAATCATCCAAGCCGCCTGTGCACTGCTAAATTCTGGAGGGGGTGTGATCAAAGCGAAGATTGATGATAAAACCTACAGCTACCGGTGCCACGGGCTGGGTCAGGATCTGGAGACTTCTTTTCAAAAGCTCCTTCCTTCAGGTTCACAGAAATACCTTGACTACATGCAGCAGGGGCACAATCTCTTGATTTTCGTGAAGTCATGGAGCCCAGATGTTTTCAGCCTCCCCTTAAGGATCTGTAGCTTGCGTTCCAATTTATATCAGAGAGATGTGACTTCTGCTATAAACCTGAGTGCTAGCAGTGCCCTAGAACTTCTCAGACAGAAGCAGTATAGAGCCCAGAGAGGAAGACCCAGGGTGAAGGAGCGGCATCCTCAGAAGGTTCTTGACAGACACATTCAGGAAGAGGAAGATATGAGGCTGTCTGCTTCGGAATTTCTTAAAAAGGACAAACTCATGTATAAAGAGAAACTCAACTTTACTGAGTCGACACATGTTGAGTTGAAAAGGTTCACCACCAAAAAGATTGTCCCTAGGATTAAAGAAATGTTGCCCCATTACATTTCTGCGTTTGCCAACACTCAGGGGGGATACTTAATTATCGGGGTAGATGATAAGAGCAAAGAAGTGTTTGGATGTAAGAGAGAAAAAGTGAACCCCGACTTATTAAAAAAGGAAATAGAAAACTGCATAGAAAAACTGCCTACATTCCACTTCTGCCATGAAAAGCCGAAGGTGAATTTCACTACCAAAATCTTGGATGTATACCAAAAGGATGTCCTGTATGGTTATGTCTGTATTGTTCAGGTGGAGCCTTTCTGCTGTGTGGTATTCACAGAGGCCCCAGATTCGTGGATCATGAGGGACAATTTGGTCACAAGGCTGACAGCAGAGGACTGGGTGGCTATGATGCTGGATATTCCATCAGTGACACAGGAAGAGATACTATTTAAACCAGAATCCCTCTGTAAGACATTGTTCTCAGATCATAAAGAACTGGAGGAATTCATGAAGATGCAGATACGTCCTATCTCGCAGGGGATTGTGGTATTTTCTCGAAGCTGGGCTAATGATATTGGCTTAAGGAAAGAACAGAACGTCTTGTGTGATGCTCTCCTGATAGCGGTGAACAGCCCCCTGGTACTTTATACAATCTTGATACACCCCGGTGGGACCGAAGGGCCTGAATATGCCCGGAACACTGCTCGTCAGTTAAAGCAGAAACTGGGAACTGTTGGTGGTTACACAGGGAGAGTGTGTGTCATTCCGAGACTGCTGCACCTGCCCGGCACACAGTCTAGACCCTGTGGGACCCCTGTGCACTACCCTCAATCCTACCTGCTTGCTAACGAGGAGGAAATGGAAGACTTGTTGCAGGCCCTTGTCGTGGTGGTCTTGCTGTGCTCTCGTTCCCTTCTGAGTGACCGGCTGGGCTGTGAATTTTTCAACTTGCTCATAGAGGAGCAATGTGAGTTGCT
GTCAGAGAGCCTTCAGGAGACGCGAGAATTGTTCATCCACTGCTTCCCAGGAAGCAGGAAGACAGCCCTAGCCATAAAGATCATGGAGAAAATCAAGGACCTATTCCACTGCAAACCAAGAGAGATCCTCTACGTTTGCGAACATGACTCCTTAAAGGATTATGTGGCCCAACAAACCACCTGCCAGGCCGTGACCCGGAAAACCTTCATGCAAGGGGAGTTCCTAAAGATTAAACACATAGTGATGGATGAGACCGAGAATTTCTGCAGTGTGTATGGTGATTGGTACAAGAAGGCTAAGGGTATCACCCATCCAGAGGGGAGGGGAGCTGGAAGGAAAAACCTTCACCATGGGGTTCTCTGGCTCTTTCTGGACCCCTTCCAAGTCCGTCATGCTGATGTCAACGGCCTCCCCCCTCCATCTGCTCAGTTTCCTCGGAAAACAATCACTAAAGGGATCCACTGTTCTCTGGAAATAGCAATGGTCATGAAACAAGAAATGAGGAAGATCAAAGAAAATCCTCCCTCCAACATGTTTCTGGACACACTGGCACTCTTCAGGGAAGCTGCCTACGAGGCAGCAATGTGTGCCCAGGCTCTTCCTGGGGTGTGTGAAACGGAGACCAACCTGACAATAGAACAAATCGCAAAGTACGTGGCAGAAAGATGTCACCACCTGTTCCAGTGTGGCTATCTGCCCAAAGATATAGCAATTCTGTGCAGGAGAGGGGAGGACAGAGGACGCTACGAGCTTGCACTGCTAAAAGCAATGGAATTAATTGAGACCCGCAGAGCCGCAGAAGTTGTGTTCAGCCAGGCCTCTGGTGTTTTGGGCAGTCACATCATTTTAGACAGCATTCAGCAGTTTTCAGGCCTAGAGAGGAATATTGTGTTTGGGCTTAGTCCAGAATGCACTCCTTCAGAGGAAACGCATAAGCTCTCCTTCGCCTCAAGAGCCATTAAACACCTCTACCTGCTTTATGAAAAGAGAACAGCCTTCTGAAAACCATTTCAAACAAAACAGGAAGCCAAAGGAGCAGAGTCCCTTCTCCTAGGCAGGCTGCAGGTACTCCTTTTCACATATTACAAATGGGAAGATCAAGGCACAATCAGTATGGCA\n>XM_047948956.1 Puccinia striiformis f. sp. 
tritici uncharacterized protein (Pst134EA_017638), partial mRNA \nATGTACCCTACAGCCGAAGATGCGGTGCCGTCAGCGATCAGCCGCGGGTCTATTAATTGTGTGTCGACTGACATGCGAGTATCAGAAGATGTTCGCCCGGGTCGGCTAGCCGAAGCTCAACGGGAGATCAGCGGCTTTCCCGAATCAGTTCCACTGCCACGGCCAGCCAACCAAGATGCGATTGATTGGTCCAGGAACATTGACCCAAGGATCACAGGGCTCAAGGAACTCAGGAGAGAAGAGCTGAACAGTGTTACTGCACATTTAGAACAGCTCGATCAATATGTCCAGGCTCAAGCTGAAGCCACGACGGATGCTATCACCAGAGACCCTCAAACTCTGGTTGGCCCTTGGTTTCAAGTCACGCCTGCTCGTCCAGGTCCACAAAGATCGAGTAGACTTGCAGAATTATTCACCAGAAGATCCAGTAAAAAAGCTGAACTAGATGATGGGTTAAGAGAGATCATCATGACCGACGTGATCCCGGTTTGA\n>XM_046909055.1 PREDICTED: Gallus gallus pleckstrin homology like domain family B member 2 (PHLDB2), transcript variant X26, mRNA \nAGAGAGACTGACTTCTCTGGCTACTCATTCACAGAAAAGTTGTGCAGCTCAACAGCAATGGGCTTGAATTAAAAGCCTCAGGGAAATTCATAATGCACAGCCTGATAGTTTTCCCCCTCGCATGCATTTCAGAATGGTGCTTGCTTCTAATCTGGAGAATGCCCTTTCAGTACCTGCTGGCAAGTCACGCCACTTTAATTTCAGATTCCAGTAAGATTATGGCAGAGTATAACCACACACAAAACCAGATGGAATTACAAAATGCTAGTTTGGGAAAGGGTTCTGTGGTGAATTCCCTTGAAAACGGTCTCCAGGATATTATGGAAAACCTCAACACGAAGAAATATTCATCAAGTCTCAAATTTAAAACAAACGGGGACTGCGCCGGTTCTTACTTAACCCTTTCACAGCCTATGATGGCTAAACCCAGTCCTTCCACTAGTGTTAAAAATATACACTCTGTTACCAAAATTCAAGGAGGCAAGCTTTTCCCTTGTGAAAGTCCGTATCTTCCAGATAAAAGCTTCTCTGTAAAGCATTTGAGTTCCCTGTCGGGCACATCTCCATCCCTCAGTGGGTACAACTTAGGAAGGACAGACTTTGATATTCATGCCAACAGAGAAAATGAAAAAGCTCTTGGACACGCAGATAAGTTTTACTACTCTAAGTATAGCCAGAAAAACAAATCGTATGACAATGTCTACTTGCCAGGAATGCTGGACACAAAGAAGATCTCAGGCTCTCTTCTTACAATGTGGAACGGCAGCTCAGGGAGCGAGCTGATGCTTTCCCCTGTTAGCAATTCAGGGGCAGCCAGCATGCCTTCTAGTCCAAAGCAAGGTCGGAGGATGAATATTGAAGATGGCCTGGCCCTTCATGCAAAGCCAGTTAAACACAAGGATGTGATGATGGAGACTCTGGCCTCACGCCCTAGGAAATACTCTGGTGGATCTCTGAGTCATATGGGAATGTACAGTCGTTCCCTACCCAGGCTTCATAAATCAACAGAAAGCCAGTTGATGCCATTAAGTTTGCCCCCAAGAAACTCCTTGGGTAATACTAAAAGGAAAAAACTTGGAGAAAAGGATCTACCTCAGAATGCTTTAGATGCTGATAATTACCTGAATTTTTCTTCGTGCAGCTCAGGGGTTTTACCACATGCAAATTCGTTCTCTGGGAATAATCCCTATGTTAGTTCAACTCTTAGCGTTCCTGCAAGCCCTCGAATTGCTAAAAAAATGCTTCTAGCATCTTCTTCCTCGTATATTCCTGATGATTTTGATAGACTTGGACTCTCAGGAACGAGTC
CCAGTAGTTCGTTCTCCCCTGTGGATTTTGACAGATCATTCTCTATCAGAAGAAACCTCTCCACCAGTTCCATGGAATTCGATGATACAGACTTGGAAAGTTACAGGCAGACACCAAACTCACTGCAGACCTCTGTGAGAGAGCGTAAGAACAGCATCAGCTCCATTTCAGGGAGAGAAGACCTCATGGACTATCACAGGAGGCAGAGGGAAGAGCGGCTGCGGGAGCAGGAGATGGAACGCTTGGAGCGACAGCGGCTGGAGACGATCCTCAATCTGTGTGCAGAATACTCCAAGTCTGACAGTGACCCTGCCGCAACTACAACAGTTGCTGATGTTCAAAAGATTAACAAAGAACTTGAAAAACTTCAGCTATCAGATGAGGACTCAGTGTTTGAAGACTCGCAGATGAATCTAGAAACGAGGTTTAGGAACCACCTGAAATCGTCTGCGAGTGATTCGGATTTCTCAGAGCCAAGTAACCACAGTCGGAGCACTGCTTCTTTCCTTTCCTCCCGGGGGCTGAGAGCCGACGAGCACTTCACTGACAACATGAAGCCTGCACCTTTAGCTGCCCCTGGCTTCCTGAAGGATTCCACTGAGTCTTCGTATCTAAGCATCACGCCAAAGATACCAGAATGCACAAGTGATGATCAAAGAGGACAGGAGCTCACTCGGCTAGAAGAGGAACGCATAGTAATATTAAATAACTTGGAAGAGCTTGAACAGAAGATCAAAGATTTAAATGACCAGATGGATGAATCCTCAAGAGAGCTGGATATGGAATGTGCCCTTTTGGATGGGGAACAGAAATCTGAAACAACAGAGCTGCTGAAAGAGAAGGAAATACTGGATCATCTAAACAGAAAAATAGCTGAGCTGGAGAGGAATGTTATTGGTGAAAAGGCAAAGGATGCTGATCTACTGGACATAGAAAGCAAACACTTTGAAGACTTGGAGTTTCAGCAGCTTGAACATGAAAGCAGGTTAGATGAAGAGAAAGAAAATCTGACACAACAGCTCCTGCGTGAAGTAGCTGAATATCAGCGCAGCATTGTCAGTAGAAAGGAAAAGATTTCTGCTCTGAAAAAGCAAGCTAATCATATTGTCCAACAAGCACAAAGAGAACAAGATCATTTTGTAAAAGAGAAAAATAACCTAATAATGATGCTGCAGAGGGAAAAAGAGAATCTCTGTAATCTGGAGAAGAAATATTCCTCACTCTCTGGAGGAAAGGGATTTCCTGTCAGTCCCAATAGTCTAAAAGAGGGCTATATCAGTGTAAGTGAAATTAGTGAGCTGTATGGCAATTCCACGAATATATCCCCTTCCACTCAGCCCCCCACAGATGCTGACGCAGGTACCACTGAGCCTTCCACGGCTGTGCTGACGAGCCAGCCACAAAATAAAGAGCATTTCAGAAATCTGGAAGAGCGAAAGAAACAGCACAGGGAATGCATGTACATGAGTGATACTTTGCCTCGCAAGAAAACAACTCCAACTGTGTCACCACACTTCAATAGTTCTACTCTTGGACGAAGCATTACATCTAAAGGGCATTTACCATTAGGACAGAGCAACAGCTGTGGCAGTGTACTTCCTCACTGCCTGGCAACCATGACCAAAGAGTCAGAATCAAGAAGGATGCACAAAGGGTATAACCATCAACGTATATGTGAAAACCAAAGGCAGAAATCTCCTGAATTCTACAGCAGAACAGCATCCGAATCCAACGTGTATTTGAATAGCTTCCATTACCCAGATCGTAGCTACAAGGACCATGCCTTTGATACATTAAGCTTAGACAGTTCTGACAGTATGGAGACAAGCATATCAGCATGCTCACCAGATAACATTTCCAGCGCTAGCACATCAAATGTCGCAAGAATAGAAGAGATGGAGAGACTTCTGAAACAAGCACATGCTGAAAAGACTAGGCTGCTTGAGTCCAGGGAACGGGAGATGGAAGCTAAAAAGCGAGCTCTGGAAGAAGAGAAACGC
CGTAGAGAACAACTGGAAAAAAGACTGGAAGAAGAAACTAGCCAAAGGCAAAAACTAATTGAAAAGGAAGTGAAGATACGAGAGAAACAAAGAGCACAGGCTCGTCCATTGACTCGCTATTTGCCCATTAGAAAGGAAGACTTTGATCTACGAAGTCATATTGAAACAGCTGGTCACAACATAGAGACCTGTTACCACGTCTCCCTCACAGAGAAGACCTGCCGAGGCTTTCTGATTAAGATGGGAGGAAAAATTAAAACATGGAAAAAACGATGGTTTGTTTTTGACAGAAACAAGAGAACTTTTACGTATTACGCAGACAAACACGAAACTAAATTAAAAGGTGTAATTTATTTTCAAGCTATTGAGGAAGTCTATTACGATCATCTGAAGAATGCATACAAGAGTCCCAACCCACTACTTACTTTCAGTGTTAAGACACACGACCGAATATACTATATGGTCGCTCCTACACCGGAAGCCATGAGGATATGGATGGATGTTATTGTTACAGGCGCGGAAGGCTACACCCACTTCATGTTATAACAAAATGGGCCAATAGGGCATACTGCAATAATGTTAACATATGAAGTTAGCCATATATAGTAAAATCTGAAAAGCCACATAAAATACCAGTGAACACTCTGAAATATCCTCCTTATGATGTGCAGCCAAAGCCTCAGAACGGAAGGGTTTTCTAAATGCATTGAAAAGGGGGACTTGCTACTTATTTTAGTTGATCTTTGTAGAGACAAAAGAGCTAAAGCTGTTGAGAAAGTCATAGTGCTCCAAAACAAATCAACTGGCCACTTATGTGACAACATCTGGATTCAACAATAATTTTGTACCAGTTCTCTTAAACAGAGAATGTCTTCATCACCAGTTTATGAATGCGTGTGCTCTCATCAGTATGCAAAAATTCTAGTAGAGGAACAAAAAGGTGTAATAGCATATATTTTAATATGCAGCATTTGACATTTATAGACGATTAGGTGACTTTTAAAAACTTTTAGTCGAGTATTTTATAAAACTATGAATTAAAAAGCTGCCCTAAGGTACACACAGTTCTTGCCTTAGTAAAGTATTACAACAGAGCCAAAGAGTTATGTGACTCCCTTATTGTAATATTTCAGATTGTTAGCTGTATTTAACTTCCTGTAAGGGGACAGTGCCAAAACTCTTCATGACTTGTAAAGTAATTAAGTTTTTACAAAACTATGTTAAACCACCCAGTGATACTGACTGTCAGTTTAAAGTCTGTATCTATGAAGCTCAACAAGAAAAGGACAGCTTTATAAAGACGGATTTATCCACAAGGATATGAAATGGAAGCGTGGGTTAACTTTGTCATTAGGAGGGCTTTTGCAGTCTTCCATGCTGAATGGATTGAGCTGATTCTGGACCCTGCAGCGATTTTATGTAGTCAGGTCCCACCTGATGTGGTTCTGATCTTTCTCTGTGCCAAACGAACACTTTGCTGAAACCTCAGATGTTGGTCTCCATGAAGCAAGCACTGAAGTATCTACCTATCTAAATTCTTTGAAGCAATGTTTTTAGCCAAGGAGACTTTTTAAAAGTGTATCTACTCAGAATAATGCTATCAGAATAAAAATAGAAAAGCAAGCGCTAAGGGTTTACACTGAGCAGTGTATGGATAAAAAGCGTGAAAACTTTAAGTATCAGGGATTGAGATTCCTAAAACAACAAAAATAAGGAGGATACAGTGGTCTCCTATTTAAAAATCACTTACAAATTCCAAATCCTTGAGAAATATTGCAAAGCTTAAGTGAATTGAACTTCAAGAAAGTCTCTTATTCTTTGACTTTAATGAGGTTCTATTTCAGTCATCAATACTTGTGCTATGTAATTTGTTTGTGTAATAAGAGAAAGCACATTAGACATTTTTCTCGATGAAAAGCTAATGGCTTTTGATGAAGCAAGTGAAAAACTGAAAGCAAAACAAGTTTGCTGGCAAAATAATTTTGTTGTACTGTTTCAAC
CCTGTATCTGTTAAGAAGGGGATGCGTTCTTCCTTGTGTGGTATACACAGGCGATATGGTTGCTCTAGCATGACATTTGTCAGTTTTGACTTGAATCATGAAAGAAGGGACAGTTATCACAAGGTAACTGTTATCATCATGTGCAGATCACAGCTTATAATCCAACGATTTAAAAACACTATCAGAATAAATTGCTTTGGTATATGTAATTATTATTTTTTCCCTGACGTATCTTGATTTTACTTCTTAGCATAGTTATAAAGGTTTTCTAATCATGATTTTTGTATCCTGCATGATGCAATGAAGGCATTTCAATAAACGTTTTTAAAAACA\n>XM_010693631.3 PREDICTED: Beta vulgaris subsp. vulgaris 110 kDa U5 small nuclear ribonucleoprotein component CLO (LOC104905180), transcript variant X2, mRNA \nAAATAATTAAATAAAACAATATTGAAGAGAAAAGGCAAAAAAAAAAAAAAAAAAACTCTCCACCAAAAACAAATATTTGTACCACCTTAACCTTAACAGCTTAACTTGAGTGTTGAGTCCATCTAAAACCCCAAATAACCCCATTTCACTTTACTCCCAAAATTCTCTCTCCTCCATTTCATCTTTCTCTCCTCTTTCCGCCATGGATGATAGCTTATATGACGAGTTCGGCAACTACATAGGTCCCGAGATCGACTCCGACCAAGACAATAATTCAGACACCGACATTCCTTCCGACGATGACGCCGACAAACGTCCTTCCGACGACGACAACACTCCTTCCGCCGCCGCCGGTCCCACCAACGGTTGGATGACAACCTTAAACGACAACAACGATGACGACATCGAAATGTTCGACAACCAGGTTGTTCTCGCCGAAGACAAGAAGTACTATCCTACTGCTGATGAAGTGTACGGTGAAGATGTTGAAACCCTAGTTGAAGATGAAGATGAACTTCATCTTGAACAAGCTATTATTAAGCCTGTTAAAACCCTAAAATTTGAAGTTGGTGTTAAAGATTCGTCTACTTATGTTTCTACTCAGTTTATGCTTGGTCTTATGTCTAACCCTAATTTAGTAAGGAATGTTGCACTTGTTGGGAATCTTCATCATGGGAAGACGCTTTTTATGGATATGCTTGTTGAACAGACTCATCATATTTCTACTTTTGATCCTAAGAACGAGAGGCATATGAGGTACACGGATACAAGAGTTGATGAGCAGGAGAGGAGAATTTCTATCAAATCAGTGCCAATGTCACTTGTTCTTGAGGACAGTAACTCCAAATCATATTTGATTAATATTATGGATTCACCGGGTCACGTAAATTTCTCGGATGAGATGAGTGCTGCTCTTCGGCTTGCTGATGGGGCTGTCCTGGTTGTTGATGCGGCTGAAGGTGTCATGGTTAACACTGAAAGGGCCATTCGACATGCAATTCAAGAACGCCTTCCTATTGTTGTTGTTATTAATAAGGTGGATAGACTGATTACAGAACTAAAACTGCCTCCTAAAGATGCTTATCATAAGTTGCGCCACACCTTAGAAATCATCAACAACCTTGTAAGTGCTGCCTCTTCAACTGCTGGCAATGTTCAGAGTATTGATCCGGCAGCTGGTAACGTTTGTTTTGCCAGTGCAACAGCTGGATGGTCATTCACTTTGCAATCATTTGCAAAACTCTATGTTAAACTGCATGGGGTAGCATTTGATGCAAATAAGTTTGCTTCTCGTCTTTGGGGGGACATGTATTACCATCCAGACAGCAGAACTTTTAAGAGGAAACCTCCTGTGTCTGGTGGGGAAAGATCTTTTGTTCAATTTATCTTAGAACCTCTGTATAAGATATACAGTCAAGTCATTGGTGAGCACAGAAAGAGTGTCGAGGGCACACTGGCAGAACTTGGGGTTACACTTCCGAATGCAGCTTACAGGTTAAATGTTC
GGCCCCTGTTAAGACTTGCTTGCAGCTCAGTTTTTGGTACAGCAACAGGCTTCACTGATATGCTAGTTCATCACGTTCCTTGTGGCAAAGAAGCTGCATCAAGGAAGGTTGATCACATATATACTGGTCCAAAAGACTCGGAGATCTACAAGTCCATGGAAATTTGTGATTCATCGGGGCCAGTTATGGTTAATATCACCAAACTCTATCCAAAAGCAGATTGCAGTGTTTTTGATGCTTTTGGTAGAGTTTACAGTGGTGTGCTCCAAACGGGACAAACTGTTCGTGTGTTGGGAGAAGGATACTCACCTGAAGACGAGGAAGATATGACAGTGAAAGAGGTCACGAAGTTGTGGGTCTATCAAGCTCGTTATAGGATACCTATAAGCAAAGCTCCACCAGGTTCATGGGTTCTCATTGAAGGTGTCGATGCCTCTATCATGAAGACTGCTACACTTTGTAATGCTGATTTTGATGAGGATGTCTATATATTGCGTCCTCTCCAGTTCAATACACTTTCAGTGGTGAAAACTGCTACTGAGCCTCTTAATCCTAGTGAATTACCAAAAATGGTTGAGGGGCTTAGAAAAATCAGCAAGAGCTATCCTCTTGCTATCACCAAAGTTGAAGAATCTGGGGAGCACACAATCTTGGGCACTGGGGAATTATACCTTGATTCTATCATGAAGGACCTGAGAGAGCTTTATTCCGAAGTAGAAGTGAAGGTAGCAGATCCAGTTGTCTCATTTTGTGAAACGGTGGTAGAATCTTCATCAATGAAGTGTTTCGCTGAAACTCCAAACAAGAAGAATAAGATAACTATGATTGCAGAGCCATTGGAGAGAGGTCTTGCAGAGGACATCGAGAATGGTGTTGTGAGCATTGATTGGCCTCGAAAGAAACTGGGAGATTTCTTCCAAACAAAGTATGATTGGGATTTGCTTGCTGCACGTTCTATATGGGCTTTTGGTCCTGATAAGCAGGGACCTAATATACTGTTAGATGACACACTTCCCAGTGAAGTTGACAAGAACTTACTGAATGCTGTGAAAGATTCTATTGTTCAAGGCTTTCAATGGGGTGCTCGGGAAGGTCCCCTCTGTGATGAACCAATCAGAAACGTGAAGTTTAAGATAGTTGATGCTAGGATTGCTCCTGAGCCACTACATCGGGGAACTGGACAAATCATCCCCACTGCCCGACGTGTGGCTTATTCAGCTTTCCTTATGGCTACCCCTCGTCTTATGGAGCCAGTCTATTATGTGGAGATACAAACACCAATTGATTGTGTTTCCGCCATCTACACGGTTTTATCTCGGAGACGTGGCCATGTGACTGCTGATGTTCCACAACCAGGGACCCCGGCGTATATAGTGAAGGCATTTTTACCTGTGATAGAGTCGTTTGGATTTGAGACAGATTTAAGGTATCACACTCAAGGGCAGGCCTTCTGCCTCTCTGTATTTGATCATTGGGCTATCGTCCCAGGAGATCCACTGGACAAGAGCATAGTCCTACGGCCTCTTGAACCTGCCCCAATACAGCACCTGGCACGGGAGTTTATGGTGAAAACAAGGCGTAGAAAGGGTATGAGTGAGGACGTGAGCATCAATAAATTCTTTGATGAGGCCATGGTTGTCGAGTTGGCTCAACAGGCCGCAGATCTTCATCTACAAATGATATGAAGGATGTAGATAGATACTTTTGGGGGTTTTGAGATATACACCTGACCGTTCTGAATGTAGTTTCAATCAGTTACCCCAAATTCTTTATCACTTCATTGAAGCTGAGATGCTGCCATCAATTATATCATTCTTTCGCGAGTTTCAAAATTCA\n>XM_037769526.1 PREDICTED: Sebastes umbrosus plectin-like (LOC119488165), transcript variant X1, mRNA 
\nGTCTGGGAGGAACCGGGACCGAGAGGTGGACGGAGAGAGACTGCCTGCTTGCTGTAGTCTCAGAGTCGCTTTGGCTGCAGCCGAGTCGGTGTCACAATGAGTATGTACGGGTCTCAGAAGGCCCTGAACATGGGCCGCAGGAACGGGTCCAAAGGAGACTTGAGCGGGATGCAGCAGTACGCACGGAGCGAGGTGGTGCACATGGGAGGCGGTAACGGATACGAACCTTACCTGGACGGATACAACACCTACAACTTCTCAAAGTCCTCTGGAGGCGGCATGGGAGAAATGTCGAGCAGCATGATGAGACAAATGTCGAGCGGTATGGGAGGCGGCATGATGAGACAAATGTCGAGCGGCGGCATGATGAGAGAAATGTCGAGCGGCATGGGAGGCGGCGGAACGATGACCAGGATGTCGAGCGGTGGAGGAGGCGGCGGAATGGGAGAAATGTCCAGCAGCATGATGAGAGAAGTGTCGAGCGGCATGGGAGGCGGCATGATGACCAGTGTGGATGGCGGCATGATGAGCGGCATGGGAGGCGGCATGAGTGGCTCCAGCACCATCCACCAGAGGGCTATGATCCTGCAGGCCCAGTGCCAGGAGTACCTGAAGAAAGCCGAATACGCCCTTCAGTCTGGCGGCGCCTCCGGTGACGCGGAGCGCTACATGTCAATGGCTAAAGAGACCATTGAGCAGCTGAAGGGCTACGCGATGGACCTGAGACAAATGGGACAGCCCAATGACAACGTAGTCAGGACTTTGGAGATATGTAAAGACCAGCTGAAGGGGGTCCACATGGTCATGACCGGCAGCCTGAACAGGAGGAGGAGCACCAGAGGGAGCTCCGGAGGCTGGGAGGAGCCTCCGAGGAGCTTCCAAGACGCTATGGGCTGGATTGCACAGCAAAAGCGTCTGATTGAAACTGCTTCATGGGGAGACGATCCTGCTGCCATCGAGCAGCAGCTCATCAACCACTCGAACTTTCACAGCTCCATCCAGAGGAGCGTCGAGGTGGAGCGAGCCAGAGATGAGCTGATGAAGAAAGGAGACAAGGGAAATCTTCACGCTCTGGATCAGGAGTGGGACAGTCTGCAGCAAATGTCATTTGGTCGGACCGAGCAGCTGCAGAACCTCAAGCGGATCATTCAGGATATGTCCAAAGAGATCATGTGGGTGAACGACAGGGAGGAGGAGGAGCTGATGTTTGACTGGGGAGACAAGAACATTGACCAGTACATCCCACGGAAACAGGAGAGCTACTCGAAACTGATGAGTGCCCTGGAGGAAAAAGAGAAGGACCTGAATAAACTGAAAGCCAGAGTGGACGGCCTCCTGAAGCTCAACCACCCAGCTTCAGACAAGATCGAGGCTTACAGGGACACTCTGCAGACTCAGTGGAGTTGGCTCCTTCAAATCACCAAGTGCATTGATGTTCATCTGAAGGAGAATGCAGCTTACAACCAGTTCTTCAAAGAGGCCAATGAGACGTACAGCGGCCTGCAGAAGGAACATGAGACGGTCCGGATGAAATTCGCTTGTGACAAGAACACTTCACTGGAGGACCTGATGGAGCTCCTTCAGGGACTAGAGAGGGAGAAGGAGAATATAATGGAAAACAAGAGGCAGGTTCATCATCTGGTCAACAAGTCCAGGACCATTGTGAGACTGAAACCCAGAAACCCTGAAGAGAAGAGCAGCACCCCCGTCATCGTCAAAGCTCTGTGTGACTACAAACAAGACCAGAAGGTGATCTGTAAGGAGAATGAGGCGATCCTAAAGGACAACAGTCAACGCAGTAAGTGGGACGTTACCGGCCCGGGAGGACTGGATATGTTGGTGCCCTCCGTGTGCCTGATCGTACCACCTCCCAACCCACTCGGCATCAGTATGGCCAACAAGAACGAGCAGTACTATGAGGCCATCCTGTCAATCTGGAGTCAGTTGTACATCAATGTTAAGAGTCTCATCGCCTGGCAGTACTGCCTCATTGATATC
AGGAAAATCAACTCCCTCACCGTGACCATGCTGTCCCGCATGCGTCCCGAGGAATACCGCCAACTCATCAAGAGCCTGGAGTCTCGCTACGAGGAGTTCAAAATGACCAGCCACGGCTCCCAGATGTTTGCTGACGAGGACAAGAAGATGATTGAGAACCAGGTCACCGGAGCCCAGACCCACTATGACCAGATCGTGGTGGAGCTGCCTACTTACATTGCTCAACAGGAACACATAGAAGTACAGCAAGCGTCCGGCCAGCAATACCAACAGCAGCTGATCCTAGTACAGCAAGCGTCCAACCAGCAACACCAACAGCAGCTGATTCTATTACAGCAGCAGCAGCAACAACAAGCTGCCGCCGAAGCCGAGGCCAGGAGGCTCGAAGAGGAGGCCAGGTGGCGCGAAGAGGAGGCCAGGAGGCTCGAAGAGGAGACCAGGAGGCGCGAAGCGGAGGCCAGGAGGCTCGAAGAAGAGACCAGGAGGCGCGAAGCGGAGACCAGGAGGCTCGAAGAAGAAAGACGAAGAGCGGAGCTGAAAAGAGCAAAGAAAACGGAAGTGAAGTTGGTGAAGAAGGTGAAGGTGGTCACTTCTTCTGCTGCCCCTCCTGTCTCCTCCCACTCCTTCTCCTCCTCCTCCACCTCCACCTCCTCATCCTCATCCTCCCGCAGCTTAACTGAGCTGCATGCGCTCAGACTCAGGCTGGAGGCCTCCGAGGGCACGCTGAGTCAGCACGTTCACATCTGCCTCGGAGACGACTGGATGCACGACTGTGGCCTCAAGATATCTGAGCTAGAGATGCTTCTGCGTAATGTCGACTCGATGCGTGAGGAGCACTTGCGTCTGAGGGAGCATATCTTGAAGGAGCTGGAGGGCATGAATGATTCAGATAAAGCCCAGTTCCTCCGCAACGAGGTTGAAGTCATCAACCAGAGGCTGGGTAGTCTGGAGAGCAGCTCATCAGCTTACCTGGACCGGCTGAAGGCTCTAAGGGACATGCTGGAGAGTGTGGAACAAGCCGAAGACATAGTGAAAGTCCACGAGGCGAGACTGGTGGAGAAAGAGACCACCTCTCTGTCGCCCAACGAAGTGGAGGAATACATGTTGACCCTGAAGAATGTTAAAGCGGAGCTGGATCTGAAGAGGGGTATTCTGGCCACCATGGAGACGGAGCTAGCCAAGGCCAACCACTGGAGCGGCCAGCTGGGCGGGCCCTTCCAGAGGTGTGACATGATGCTGTCCAAATACTCTGAGCAGGTGGTTCTGCTGTCAGACCGCTGGAGACGACTCCTAGGGCAGATTGACACCAGAGTCCAGGATTTGCAGTCGTACCAGCCTCAGCTGGAGCACTACAAGCAAACCAGCACCTCCCTTATTGACTGGATTGATGCCACACGGACAAAACAAGACACCCTGCAGGCCACCAAGATAGAGAGCATCCAAACACTGATGGACCAAATTAACAACCAGAAGGCCCTGAACTCTGAAATCAAATCGAGGAGGGAGACAGTAGAGAGCGTGCTGAGGGACAATGAGGCCTGTGTGATTTCTATCAAGGATTATGAAACGGACCTGGCCTCTTACACCTCTGGTTTAGAGACGTTGCTCAACATCCCCATCAAAAGGACAATGCTGAAGTCGCCGTCGATGGACCTAAATTTGGAAGCTACACAACTGCAAACCCGTTACATGGAGTTGCTCACACATTCTGGTGACTACTACAAATTCCTGGGAGAGCTGCTAAAAAACATGGAGGAGCTCAAGATTCGTAACACCAGGATTGACCTGTTAGAGGAAGAACTTCGCCTGCTGAGGGAGGGCATGCGAGACCGCGACTCCAAGAATAAATCTCTAGAAGAGTCTGTTTCCCGTTATGAGCTGGAGTTGTCCGACTCGCGGGACAAGCTGCTGTCGATTGAGGAGGTGAAGCAAACCGCTACGCTGCAGTGCAGTGCCACTATGGACAGCCTGGACAGCACTCAGAGCCAGCTGGCAGACCT
CAACGATGAGGTGACACGTCTCAACTACTTGCTTGAGGAAGAGAAGAGGAAGAGGAGGCTGGCAGAGGAGCGCTACACTACGCAGCAGGAGGAGTACGAGCTGGTGCTGAGGAAGAGGCAGAAGGAGCTGGACACGGTCAGCTGGTCCAAGGTGGAGATTGAGAAGAGTGTGACAAACAAGGATCACGAGATTGAACAGCTGCGGCGGCAGCTGGCTGAGGAGGCGGCGAGGATCAGGGAGCTACAGAAGGAGATGTCAAAGGTAAGGAGCCAATGCAGTATGGAGATCAATAACTTAAAGCTCAGCTACGAATCCCAGATCCACGTCAGCTGCACAGACATGCAGAGGCTGGCAGCCCAGAGGGAGGAGGATACCGTTGATGTCCAGCTGCGGTATGACAGGATGGAGGCAGAGAGGAGGAATCTGGAGGAGGAGCTCAGGAAGCTCAGGATGTCTCTGAGCCAGGCTGAGGAACAAAGGAACAGGGCAGAAGAAGAAGCTCACAGTCAGCGTGCTGTCATCACAGAGGAAGGGCGCAGGAGGAGAGAACTGGAGAGTCAGGTGGAGGTGCTGATTAGGCAGAGAGACGAGGAACGCAGCCAGTATGCAGAGGAGCTGGCTGAAGTCATGAAGAGGCTGCAGGAGAAGAGTGACGAGCTGGCCTACATTACACACAGCCTGGAGGAAGAGACCCGCAGGAGGAGAACTATAGAGGAAGGGCAGGATGTGTTCGAACAGACTCTGGCCCAGCTGCAGGTGAAGCTAACCAGTTCATCAGTGGCTGCAACCCAGCTGGGGGAGTGCGAGGAAGAGCTCCAGAAGATACGTATGGAGCTTGAGAGGGAGAGCAGGGAGCGAAGCAGAGTAGAGCAGAACATGAGCAGGCTACAGAGTCGCATGAAGGACCTTCAGGATGTGAGAGGTGGGCTGGAGAGCCAAGTGGAGAATCTGAGGAGGGCCAACCAAGAGGAAGTGTCCAGAAGAAGGCAGGTAGAAACAGAGCTGGAAAACACCACCAAGGCCATGACTGAGTACATCAGCACCGTTACCACTCTAAGCCAGAGCCAAGAGCACGCCAGCATGTCAGAAAAGAGAGGTGAAGAAGAGCGCCTTAGGTTGCAGGAGGAGCTGGAGAGAAGCTCGAGACAAAACAAGACCTCTGCAGAGCGCATGACTCAGCTGAGCGCCGAGCTGAAGGCCCTGCAGCAACAGCTCCTCCAGGAGCAGGCAGGAGGCAAAGAGGCAAACCTCAGGAATGAGGGCCTTTACAGAACTATAGAGGAGAAGAGTAAGGCCCTGAATGAGCGCTCTGGTGAGCTTCAAAGGCTGAAGGAGATGGCAGAAAGCCAGACCAAAGAAAGGCTGAGGCTGGAGGAGGAACTAAGCGCAGCACGACATGATAAAGCGGAACTCCTGAGATCCAAACAGGGAAGTGATGATGAGCTCTCCTCCCAGATTACAGCCCTGCAACTGCAGCTTCAAGCCAGTGAGCGCAGCAATGTAGATTACCGCAACCTGGCCTCAGAGCTCTCCTCGGAGAGGGAGAAACTCAAGCTGGAGACTGAGAAAATACAAAAGCAGGCCACCGAGACAACCACCATGATGCAATCCATTCAGTCCCAGTACAATGAGATTGTGAATGAGAGAGATGCTCTTTTGCTGAGACTGCAATTGTCAGATAAGGACAAAGATCGCTACCAAAGGCTAGAGGACGAACTCAGTCGCATTAAATTGTCCCAAGACTCTGAGCTTCGCAGTAAGCAACGTATACAGGATGAGAACGAGAGGGCGAAGAGGGATTCAGATTACTGGAAGGACCAGTTTGATAGTAAGCAGGTCCTGATCAGGCAATATGAAACAGACAAGGAACGTCTGGAGAGGGAAAAGAACTCTCTGAAAAGTGAGCTAGAGAGGCTGATGAGGGATCTGAGGGAGCTTGATGAGACATATAAAATCAGGCTGTCAGATATGCAGAAAGAACTGCGAGAGGTGGCTGTTG
TCAGAAAAACCATGGAAACTGAGCTGATGAGAGTTAGAGAGCCCCCAACCTTGGATCCTTCCACTTTGGTCTTTGATGGAGTCCGTAAGCCAGTCACAGCAAACCAGTTGGTTGACTGTGGTGTTTTGGACAAACCAACACTTAGCCAGCTTGTGAAGGGGCATAAGACTGTGCCTGATGTCTCTGTCGACAAAAAAGTCAGTCTCAAAGGGACAGGCCCAATAGCCGGGGTGGTAATTCAAGGTCCGAAAGGTCCAGGGTCTTTTACAGGCCCCTTATGCAAAATGACTTTCACCGAAGCAAAGAAAGAGAATCTGCTACCACCAGATAGCGTAGACCTACTACTGGATGCTCAGGCTGCCACAGGCCACATAATTGACCCAAGAACTAATAGGAAGTTGACAGTTGAAGAGGCATGTGATCAAGGTGTGGTTGATGAAGAGGACAGAGAGAGGTTGTTGGCAGCAGAAGCTGCAGCTGTAGGATATTGTGGTCCTGGCACAAACAAACCCCTTTCAGTATTTCAGGCTATGACGAAAGGACTGATTGACAAGAACACAACACTGCGTCTGCTACAAGCCCAGGAGTCTGTGGGGGGCATCCTAGATCCCATACTCAGTGTGTTCCTTCCTAAAGACACAGCCATTGAGCGTAACCTAATTAATGATGACATATATCATGCTCTGAGTCGGAGGCCTGAGCTCTACCTGGACCCCGAAAGTGAAGATGGTGTAACCTATATGTCAATGAAGAGGAAATGTAAGGTAGAGCCACACACAGGCCTTCTGCTTCTTCCGATCCCTGAGAAGGTAGACCCCTCCAAAATTGTCTTTGATGGTGTTCGGAAACCTGTCACAGCCAAGCAGCTCCTTGATTGTGGTGTCCTGGACAAGCCAACATTTAAAGATCTAGAAAAGGGGAAGAAAAATGTCCCAGAGGTGTCTGTAGACAAACATGTTAATCTGAAGGGGACTGGACCCATTGCTGGGGTGGTAGTCGGACGTGAAGGAAAAATGTCTTTCTCAGAAGCCAAGAAACGGATGCTCTTGCCCCCAGATAGTGCAGATTTGCTACTGGAAGCCCAGGCTGCCACAGGTCACATCATTGACCCCAGAAACAATCAGAAGCTGACAGTAGATGAGGCATGTGACAGAGGAGTGGTGGATATTAAGGATCGAGACAGATTATTGGAAGCTGAAGCTGCTGCTGTGGGATACAAGGATTTTAGTGCAGCCAAGCCTCTCTCAGTGTTTGAGGCCATGAAGAAGGAACTAATTGACAGGAAGACTGGGCTACGCCTGCTGCAGGCCCAGGAGTCTGTGGGAGGTATTCTAGATCCCAATCTCAGTGTGTTCCTTCCCAAAAATACAGCTATTAAGCGCAACCTTTTGGATGAAAACCTCCGTCAAGCTCTAAACCAGAGTCCTGAGTGTTACTGTGACCCAGAAACTGAGCGTGATGCCAGCTATGGAGCATTGAAGAAAAGATGCAAGACAGAGCCTCACACAGGTCTGCTACTTTTGCCAATCACTGAGAAGCTAGACCCTTCCAAACTGATCTTTGATGGTGTTCGTAAGCCAGTAACAGCACAGCAGTTGCTTGATTGTGGGGTCCTGGACAAACCAACATTTAACCAACTAATGAAGGGAGAGAAAACTGTCCCACAGGTGTCTGTGGATAAGAAGGTCTTTCTAAAGGGGACAGGATCGATTTCTGGCGTGGCAGCTGGACCTTTAGGGAAAATGTCTTTCTCAGAGGCCAAAAAACAGATGCTCATGCCTGCGGAAAGTGCCGATTTGCTACTGGATGCTCAGGCTGCCACAGGACACATCATTGACCCCACAACCAATCAGAAGCTAACAGTAGAGGAGGCATGTGCCAGAAGAGTGGTGGAAAATAGGGATCGAGATAGACTCCTGGCAGCAGAAGCCGCTGCTGTGGGTTACCGGGACCCAAGCACAGCTAAGCCTCTTTCAGTGTTTGAGGCAATGAAAAAGGGA
TTAATTGACAGGAAGACTGGGCTACGGCTGCTGCAGGCCCAGGAGTCTGCCGGGGGCATTCTAGATCCCAATCTCAGTGTTTTCCTCCCCAAAGACACAGCTATAAAGCGCAACCTTTTGGATGAGGACCTCCGTCAAGCTCTAAACCAGAGTCCTGGGTGCTACATTGACCCAGACACTGAACGTGATACCAGCTATGGGGCTTTAAAGAAGAGAAGCAAAACAGAGTCTCACACAGGCCTGATACTTCTGCCAATCAATGAGAGGAAAGACCCTTCCAAACTGATCTTTGATGGTGTTCGTAAGCCAGTAACAGCACAGCAGTTGTTTGAATGTGGAGTCCTTGACAAGCCAACATTTGACCAATTAGTGAAAGGCGAGAAAACTGTCCCAGCAGTGTCTACGGAAAAGACAGTCTATCTAAAGGGGACTGGACCCATTGCTGGGGTAGTAGTCGGACGTGAAGGAAAAATGTCTTTCTCAGAAGCCAAGAAACGGATGCTCTTGCCCCCAGATAGTGCAGATTTGCTACTAGAAGCCCAGGCTGCCACAGGCCACATCCTTGACCCTGAAGCTAATCAGAAGCTGACAGTAGAGGACGCATGTGCCAAAGGAGTAGTGGACATTAGGGATCGAGACAGATTATTGGCAGCAGAGGCTGCTGCTGTTGGCTTCAAGGATCCTAGCGGAGCCAAGCCTCTCTCAGTGTTTGAGGCCATGAAGAAGGGACTCATTGAAAGGAAGACTGGGCTACGCCTGCTGCAGGCTCAGGAGTCTGTGGGAGGTATTCTAGATCCCAATCTCAGTGTGTTCCTCCCCAAAGACACAGCTGTAAAGCGCAACCTTTTGGATGAGGAACTTTGTCATGCTCTAAACCAGAGTCCTGAGTGTTACGTTGATCCAGACACCGAGCGTGATACCAGCTATGTGACTTTAAAGAGGAGAAGTAAAACTGAGTCTCACACAGGCCTCATACTTCTTCCAATCCCTGAGAAGGTAGACCCCTCCAAACTTGTCTTTGATGGTGTTCGGAAACCTGTCACAGCCAAGCAGCTCCTTGATTGTGGTGTCCTGGACAAGCCAACATTTAAAGATCTAGAAAAGGGGAAGAAAAATGTCCCAGAGGTGTCTGTAGACAAAAATGTTAATCTGAAGGGAACTGGGCCTATTGCTGGGGTTGTAGCTGGGAGTCAAGGCAAGATGTCTTTGTCAGAAGCCAAGAAAAAGGCACTCCTACCTGAAGATATTGCAGATTTGCTACTGGAAGCCCAGGCTGCCACAGGTCACATCATCGACCCCAAAAACAATCAGAAGCTGACAGTAGATGAGGCATGTGCCAGAGGAGTGGTGGATATTAAGGATCGAGACAGATTATTGGAAGCTGAAGCTGCTGCTGTGGGATACAAGGATTTTAGTGCAGCCAAGCCTCTCTCAGTGTTTGAGGCCATGAAGAAGGAACTAATTGACAGGAAGACTGGGCTACGCCTGCTGCAGGCCCAGGAGTCTGTGGGAGGTATTCTAGATCCCAATCTCAGTGTGTTCCTTCCCAAAGATACAGCTATTAAGCGCAACCTTTTGGATGAAAACCTCCGTCAAGCTCTAAACCAGAGTCCTGAGTGTTATCGTGACCCAGAAACTGAGCGTGATGCCAGCTATGGGGCATTGAAGAAAAGATGCAAGACAGAGCCTCACACAGGTCTGCTACTTTTGCCAATCACTGAGAAGCTAGACCCTTCCAAACTGATCTTTGATGGTGTTCGTAAGCCAGTAACAGCACAGCAGTTGCTTGATTGTGGGGTCCTGGACAAACCAACATTTAACCAACTAATGAAGGGAGAGAAAACTGTCCCACAGGTGTCTGTGGATAAGAAGGTCTTTCTAAAGGGGACAGGATCGATTTCTGGCGTGGCAGCTGGACCTTTAGGGAAAATGTCTTTATCAGAGGCCAAGAAACAGATGCTCATGCCTGCGGAAAGTGCCGATTTGCTACTGGATGCTCA
GGCTGCCACAGGACACATCATTGACCCCACAACCAATCAGAAGCTAACAGTAGAGGAGGCATGTGCCAAAAGAGTGGTGGAAAATAGGGATCGAGATAGACTACTGGCAGCAGAAGCCGCTGCTGTGGGTTACCGGGACCCAAGCACAGCTAAGCCTCTTTCAGTGTTTGAGGCAATGAAAAAGGGATTAATTGACAGGAAGACTGGGCTACGGCTGCTGCAGGCCCAGGAGTCTGCCGGGGGCATTCTAGATCCCAATCTCAGTGTTTTCCTCCCCAAAGACACAGCTATAAAGCGCAACCTTTTGGATGAGGACCTCCGTCAAGCTCTAAACCAGAGTCCTGGGTGCTACATTGACCCAGACACTGAACGTGATACCAGCTATGGGGCTTTAAAGAAGAGAAGCAAAACAGAGTCTCACACAGGCCTGATACTTCTGCCAATCAATGAGAGGAAAGACCCTTCCAAACTGATCTTTGATGGTGTTCGTAAGCCAGTAACAGCACAGCAGTTGTTTGAATGTGGAGTCCTTGACAAGCCAACATTTGACCAATTAGTGAAAGGCGAGAAAACTGTCCCAGCAGTGTCTACGGAAAAGACAGTCTATCTAAAGGGGACTGGACCCATTGCTGGGGTAGTAGTCGGACGTGAAGGAAAAATGTCTTTCTCAGAAGCCAAGAAACGGATGCTCTTGCCCCCGGATAGTGTAGATTTGCTACTAGAAGCCCAGGCTGCCACAGGCCACATCGTTGACCCTGAAGCTAATCAGAAGCTGACAGTAGAGGACGCATGTGCCAGAGGAGTAGTGGACATTAGGGATCGAGACAGATTATTGGCAGCAGAGGCTGCTGCTGTTGGCTTCAAGGATCCTAGCGGAGCCAAGCCTCTCTCAGTGTTTGAGGCCATGAAGAAGGGACTAATTGACAGGAAGACTGGGCTACGCCTGCTGCAGGCTCAGGAGTCTATGGGAGGTATTCTAGATCCCAATCTCAGTGTGTTCCTCCCCAAAGACACAGCTGTAAAGCGCAACCTTTTGGATGAGGAACTTTGTCATGCTCTAAACCAGAGTCCTGAGTGTTACATTGACCCAGACACCGAGCGTGATACCAGCTATGGGACTTTAAAGAGGAGAAGTAAAACTGAATCTCACACAGGCCTCATACTTCTGCCAATCACTGAGAAGAAAGACCCCTCCAAACTGATGTTTGATGGAATCCGCAAGCCAGTCTCAGCACAGCAGTTGTTTGAATGTGGAGTCCTTGACAAGCCAACATTTGAAGATCTAGAAAAGGGGAAGAAAAATGTCCCAGAGGTGTCTGTAGACAAAAATGTTAATCTGAAGGGAACTGGGCCTATTGCTGGGGTCGTAGCTGGGAGTCAAGGCAAAATGTCTTTGTCAGAAGCCAAGAAAAAGGCACTCCTGCCTGAAGATATTGCAGATTTGCTACTGGAAGCCCAGGCTGCCACAGGTCACATCATTGACCCCAGAAACAATCAGAAGCTGACAGTAGATGAGGCATGTGCCAGAGGAGTGGTGGATATTAAGGATCGAGACAGATTATTGGAAGCTGAAGCTGCTGCTGTGGGATACAAGGATCCTAGCGGAGCCAAGCCTCTCTCAGTGTTTGAGGCCATGAAGAAGGAACTAATTGACAGGAAGACTGGGCTACGCCTGCTGCAGGCCCAGGAGTCTGTGGGAGGTATTCTAGATCCCAATCTCAGTGTGTTCCTTCCCAAAGATACAGCTATTAAGCGCAACCTTTTGGATGAAAACCTCCGTCAAGCTCTAAACCAGAGTCCTGAGTGTTACCGTGACCCAGAAACTGAGCGTGATGCCAGCTATGGGGCATTGAAGAAAAGATGCAAGACAGAGCCTCACACAGGTCTGCTACTTTTGCCAATCACTGAGAAGCTAGACCCTTCCAAACTGATCTTTGATGGTGTTCGTAAGCCAGTAACAGCACAGCAGTTGCTTGATTGTGGGGTCCTGGACAAACCAA
CATTTAACCAACTAATGAAGGGAGAGAAAACTGTCCCACAGGTGTCTGTGGATAAGAAGGTCTTTCTAAAGGGGACAGGATTGATTTCTGGCGTGGCAGCTGGACCTTTAGGGAAAATGTCTTTATCAGAGGCCAAGAAACAGATGCTCATGCCTGCGGAAAGTGCCGATTTGCTACTGGATGCTCAGGCTGCCACAGGACACATCATTGACCCTACAACCAATCAGAAGCTAACAGTAGAGGAGGCATGTGCCAGAAGAGTGGTGGAAAATAGGGATCGAGATAGACTCCTGGCAGCAGAAGCCGCTGCTGTGGGTTACCGGGACCCAAGCACAGCTAAGCCTCTTTCAGTGTTTGAGGCAATGAAAAAGGGATTAATTGACAGGAAGACTGGGCTACGCCTGCTGCAGGCCCAGGAGTCTGCCGGGGGCATTCTAGATCCCAATCTCAGTGTTTTCCTCCCCAAAGACACGGCTATAAAGCGTAACCTTTTGGATGAGGACCTCCGTCAAGCTCTAAACCAGAGTCCTGGGTGCTACATTGACCCAGACACTGAGCGTGATACCAGCTATGGGGCTTTAAAGAAGAGAAGCAAAACAGAGTCTCACACAGGCCTGATACTTCTGCCAATCACTGAGAAGGAAGACCCTTCCAATCTGATGTTTGATGGAATCCGTAAGCCAGTCTCAGCACAGCAGCTGTTTGAATGTGGAGTCCTTGACAAGCCAACATTTAAAGATCTAGAAAAGGGGAAGAAAAATGTCCCAGAGGTGTCTGTAGACAAAAATGTTAATCTGAAGGGAACTGGGCCTATTGCTGGGATCGTAGCTGGGAGTCAAGGCAAAATGTCTTTGTCAGAAGCCAAGAAAAAGGCACTCCTGCCTGAAGATATTGCAGATTTGCTACTGGAAGCCCAGGCTGCCACAGGTCACATCATTGACCCCAGAAACAATCAGAAGCTGACAGTAGATGAGGCATGTGCCAGAGGAGTGGTGGATATTAAGGATCGAGACAGATTATTGGAAGCTGAAGCTGCTGCTGTGGGATACAAGGATCCTAGCGGAGCCAAGCCTCTCTCAGTGTTTGAGGCCATGAAGAAGGAACTAATTGACAGGAAGACTGGGCTACGCCTGCTGCAGGCCCAGGAGTCTGTGGGAGGTATTCTAGATCCCAATCTCAGTGTGTTCCTTCCCAAAGATACAGCTATTAAGCGCAACCTTTTGGATGAAAACCTCCGTCAAGCTCTAAACCAGAGTCCTGAGTGTTATCGTGACCCAGAAACTGAGCGTGATGCCAGCTATGGGGCATTGAAGAAAAGATGCAAGACAGAGCCTCACACAGGTCTGCTACTTTTGCCAATCACTGAGAAGCTAGACCCTTCCAAACTGATCTTTGATGGTGTTCGTAAGCCAGTAACAGCACAGCAGTTGCTTGATTGTGGGGTCCTGGACAAACCAACATTTAACCAACTAATGAAGGGAGAGAAAACTGTCCCACAGGTGTCTGTGGATAAGAAGGTCTTTCTAAAGGGGACAGGATTGATTTCTGGCGTGGCAGCTGGACCTTTAGGGAAAATGTCTTTATCAGAGGCCAAGAAACAGATGCTCATGCCTGCGGAAAGTGCCGATTTGCTACTGGATGCTCAGGCTGCCACAGGACACATCATTGATCCCACAACCAATCAGAAGCTAACAGTAGAGGAGGCATGTGCCAGAAGAATGGTGGAAAATAGGGATCGAGATAGACTCCTGGCAGCAGAAGCCGCTGCTGTGGGTTACCGGGACCCAAGCACAGCTAAGCCTCTTTCAGTGTTTGAGGCAATGAAAAAGGGATTAATTGACAGGAAGACTGGGCTACGCCTGCTGCAGGCCCAGGAGTCTGCCGGGGGCATTCTAGATCCCAATCTCAGTGTTTTCCTCCCCAAAGACACGGCTATAAAGCGCAACCTTTTGGATGAGGACCTCCGTCAAGCTCTAAACCAGAGTCCTGGGTGCTACATT
GACCCAGACACTGAACGTGATACCAGCTATGGGGCTTTAAAGAAGAGAAGCAAAACAGAGTCTCACACAGGCCTGATACTTCTGCCAATCAATGAGAGGAAAGACCCTTCCAAACTGATCTTTGATGGTGTTCGTAAGCCAGTAACAGCACAGCAGTTGTTTGAATGTGGAGTCCTTGACAAGCCAACATTTGACCAACTAATGAAGGGAGAGAAAACTGTCCCACAGGTGTCTGTGGATAAGAAGGTCTTTCTAAAGGGGACAGGATCAATTTCTGGCGTGGCAGCTGGACCTTTAGGGAAAATGTCTTTATCAGAGGCCAAGAAACAGATGCTCATGCCTGCGGAAAGTGCCGATTTGCTACTGGATGCTCAGGCTGCCACAGGACACATCATTGACCCCACAACCAATCAGAAGCTAACAATAGAGGAGGCATGTGCCAGAGGAGTAGTGGACATTAGGGATCGAGACAGATTATTGGCAGCAGAGGCTGCTGCTGTTGGCTTTAAGGATCCTAGCGGAGCCAAGCCTCTCTCAGTGTTTGAGGCCATGAAAAAGGGACTAATTGACAGGAAGACTGGGCTACGCTTGCTGCAGGCCCAGGAGTCTGTGGGAGGTATTCTAGATCCCAATCTCAGTGTGTTCCTCCCCAAAGACACAGCTGTAAAGCGCAACCTTTTGGATGAGGAACTTTGTCATGCTCTAAACCAGAGTCCTGAGTGTTACATTGACCCAGACACCGAGCGTGATACCAGCTATGTGACTTTAAAGAAAAGAGGTAAAACTGAGTCTCAAACAGGCCTGATACTTCTGCCAATCACTGAGAAGAAAGACCCTTCCAGACTGATGTTTGATGGAATCCGCAAGCCAGTCTCAGCACTGCAGTTGTTTGAATGCGGAGTGCTTGATAAGCCAACACTTAATCAGCTAGTGAAAGGGGAGAAAACTGTCCCAGCCGTGTCTATGGAAAAGATGGTATATCTACAGGGGACTGGACCCATTGCTGGGGTGGTAGCTGGACGTGAAGGAAAAATGTCTTTCTCAGAAGCCAAGAAACAGATGCTCCTGCCCTCAAATAGCGCATATTTGCTACTAGAAGCCCAGGCTGCCACAGGCTACATCATTGACCCTAAAACTAATCAGAAGCTGACCGTAGAGGAGGCATGTGCCAGAGGAGTGGTGGACATTAGGGATCGAGACAGATTGTTGGTAGCAGAGGCTGCTGCTGTTGGCTTTAAGGATCCTCGCGGAGCCAAGCCTCTGTCAGTGTTTGAGGCCATGAAAAAGGGACTAATCGACAGGAAGACTGTGCTACGCCTGCTGCAGGCCCAGGAGTCTGTGGGAGGTATTGTAGATCCCAATCTTAGCGTGTTCCTCCCCAAAGATACAGCTATAAAGCGCAACCTTTTGGATGAGGACCTCCGTCAAGCTCTTAACCAGGGTCCTGAGTGTTACGTTGACCCAGAAACTGAAAATGATGCCAGCTATGGGGCTTTGCAGGAAAGATGCAAGACAGAGCCTCAAGCAAGCCTGAAACTTTTGCCAGTCTCTGAGAAGAAAGACCCTTCCAAACTACTCTTTGATGGTGTCCGTAAGACTGTCACAGCACAACAGTTGCTTGATTGTGGGGTCCTGGACAAACCAACATTTAACAAACTAATGAAGGGAGAGAAAACGGTCCCAGATGTGTCCGTGGATAAAAAGGTCTTTCTGAAGGGGACAGGGTCAATTGCTGGTGTTGCAGCTGGACCTTTAGGGAAAATGTCTTTTACAGAAGCCAAGAAACAGAAAATTATGTCCTCGGACAGCGCTGACATGCTACTGGAAGCTCAGGCAGCCACTGGCAACATCATTGACCCCAGAACTAATGAGAGATTGACTGTAAAGGCAGCATGTGCCAAAGGAGTAGTGGATAAGGAGGATGAATCAAAGTTGTTCGCAGCTGAAGCTGCTGCTATAGGTTACAGAGACCCAAATACAGGCAAGCTCCTGTCGGCAGG
CCAGGCCATGAAGAAGGGATTGATTGACAAGGACACAGCTCTACGTATACTTCAGGCTCAAGAGTCTGTAGGGGGTATTTTAGACCCTGCCCTCAGTGTATTCCTACCCAAAGACATTGCAAAGGATAGGGATCTCATAGATGAGGACCTATACCGGGGCCTGAATCAATATCCTGAGTGTTATTTGGACCCAGACACCCAACAAGCAACTACCTATGTATCTCTGAAGAAAAAATGCAAAGCAGATCCAAAAACAGGTCTTTTGCTTCTCCCTGAACCTAAAAAGCCAATAACTGTACAGGGGCTCAGGGGTCAGGTGCCAGTCAGAGATCTAGTGGATGCAAACCTATTAGACCGGTCAGATATGGACCAACTGAGAGAGGGCAGATTGACGAGCCAGGACATTGAAGACCGCCTGCACTCCTACCTGAGAGGTTCCACCTGCATAGCAGGAGTTTATGATGAGGCCAGTGATAAGGTGATGCCCATCTATCAGGCCATGAAAGATGGACTGCTGCAATCTGGGACCACACTGGAACTGCTTGAGGCCCAGGCTGCCTCAGGTTTTATAGTTGATCCTGTCAACAACCATTACCTGACAGTTAGTGATGCTTACAATAAAAGACTGTTTGGGCCAGAGTTTAAGGACCATCTGCTATCAGCAGAGAGGGCTGTGACTGGTTACAAACTGCCTGGTACAGACAAGATTATTTCCCTCTTTCAGGCCATAGAGAGAGGTCTAGTGGAGAAAGGTCATGGCATCCGTCTACTCGAGGCTCAGATTGCCAGCGGTGGTATCATTGATCCTGAACACAGCCATCGGATTGACGTGAACGTAGCCTACAAGAGAGGTTACTTTGATGAAGAAATGAACAAGGCCCTGACTGATCAGAATGTTGATACCAAGGGTTTCTTTGACCCCAACACAGAGGAAACCCTAGCTTATCTGGAGCTTAAGAATCGCTGTATCACAGATAAGAAGACTGGCCTCATCCTGTTGCCTATCACTGACAAGAAAAGTCAAGAATCGACTTCGAAGAACACTCTGAGAAAGAGGAGAGTGGTAATTGTAGACCCGGAGACTAATAAAGAGATGACAGTACGTGTAGCATATGACAAGGGGTATATTGACTACGACACCTTTGTGGAGCTGTCCGAGCAGGAGTGTGAGTGGGAAGAGATCACTATCACTGCTCCAGATGGTTCCATCCGCTTTGTTATCATTGACAGGAAGACTGGAAGACAGTATGACATTAGCGAGCTGCTTGAAATGCGAGTAATCAACCAATCAGATGTAGATAATTACCGATCACGTACCATCACCCTTACTCAATTTGCAGATATCATCAGCAACAAGACCAAATATGGGTCATCCTCATTATCATCATCATCATCAGCTTCAAGATCATCAGCAGCCGGAGGTACATCTTCAGTGACATCATCATCAACTTCAAGAACATCAGCATCCCCGGGTACATCTTCAGTGATATCATCATCAACTTCAAGAACATCAGCATCACCGGGTACATCTTCAGTGACATCTTCATCAACTTTAAGAACATCAGCAGCCTCAGTTCCATCGTCAGTGACATCATCATTGTCATCATCAGTCCTGTCAAGACCCTTATCATCTTCTCTCTCAAAGATGACCACAACAAGAACTTCCACTGTCACAGAGCGAAGCACCTCAACCTGCAGTGTACCTCGAGACTCAACTGACTCCCGTAGGAATATATCCAGCATATCTGTCACTCTGTCCTCTCCTATTGAAGTAATAGATGAACAGGAACCTGTGGGTGCCGTCTTTGACACAGACTGTATCGAGAAGATATCCATCACAGAGGCTCTAGATCGTGGTCTGGTGGATTCCATCACTGCCCAGAGACTGCTGGAGGCTCAGGCTTGCACTGGAGGAATAATCAATCCCACAAATGGCCATAGGCTCAGCATCCATGAGGCCACCCGCCTGGGCATAATAAGTGACAACATGGGCCCAAAGC
TCAAGCCTGCCCAGAAAGCCTTCTTTGGCTTTGAGGATGTAAAAAACAAGAAGAAGTTATCTGTTCCTCAGGCCATGAAGGAGAGGTGGCTGCCATATGAGGCAGGGCAGAGGTTCCTAGAGTTCCAGTATGTAACAGGAGGGATTTATGACCCAGAAATGTGCTGTAGAAGAACCATAGATGAGGCTGTGGAAATGAAGTGGCTGGATTCGAGAGACGCCGAGAGGCTCCAAAACGTCAGAGACCACACAAAGAACCTGACGTGCCCCAAGAGCAAACTTAGGATCTCTTACAAGCAGGCTCTGGATAATTGTCTGGTGGAGGAAAGCAATGGGTTGAAAATGCTCCAGGCATCATCTGTGTCTTCCAGAGGGATCAGCAGTCCTTACAATGTCTCCTCTGCCCCAGGGTCCACCACCGGCTCCAGGAGTGGCTCACGACGAAGCTCCCGCAGGAGCAGTGTGGACCTTGGATCCCCCTCCTCCTCAGGAACTTATCACCACAGTGTTTCTAGCTTCACCACCTACTCTGCATCCTCCAAATAAATCAAGAAAATGATCTGCACATTCATGCTCTTTTCTTGCAAATGATTCCTTTTGTTAAAAATATACCGATTGTTCAGAAAATAACTTGTGTGTGTCGTATATGAGGAGAAAAAAAAAATTAAGATAATGTTCTTAAACTTTTTGCATAGTTTTAGATTTCTGCTTTGGTGTTGCTATGCTTTTAAAATGCTATAGTTCAAATGTTCGAGAAAATTAACACTTCCAAGATATTTTTTGTGGAAATGAACTAAAGTATTAATGGCAGCCATCTTATGGTATTTGGAATGAAAATAATGAGGATGTTAATATAATTTTTGGTGCCCCTAAAATAGGCTTAGAAATGATTACCATATTTTTGCATACAAAAAATAAGTTTTTCAAAATCTTCATGAAATGTAATTTCTTTTTAAGCTTTGCATTGGTCACATAAGGGTGCTATGTTTACATTTATTTGTCATCTGAAATACATGTTTTGTGAGGGGAGGGATACAAGGTTTGGTTACATATATTGGTTTAACTATTTGTTTTCTACTGAATCAGTTGTTAACTGTTGTTCTTTTGCTCTTTAGTGCTTCCGGTTTTGTAACAGTTTCTCAATATCTCCAAATAAAAGCGGTTGAGTCTTTAGCTCA\n>KJ343209.1 Uncultured bacterium clone Evans.12.9_01824 16S ribosomal RNA gene, partial sequence \nTACGTAGGTGGCAAGCGTTATCCGGATTTATTGGGCGTAAAGAGAACGCAGGCGGTCTTTTAAGTCTGATGTGAAAGCCTTCGGCTTAACCGGAGTAGTGCATTGGAAACTGGGAGACTTGAGTGCAGAAGAGGAGAGTGGAACTCCATGTGTAGCGGTGAAATGCGTAGATATAAGGAAGAACACCAGTGGCGAAAGCGGCTCTCTGGTCTGTAACTGACGCTGAGGTTCGAAAGCGTGGGTAGCAAACAGG\n>XM_018460662.1 PREDICTED: Trachymyrmex zeteki zinc finger protein 830 (LOC108730757), mRNA 
\nGTTGCGTTCAGAATCATCATCCGAGTGTGCACCAAGATGTTGTTTTATCCTTATGTAAGGTAGATAACAAGGGTAAAACGACATCTGAGTGCATCTGGACGACAATTCTGAACACTGCCCAGCACTGCACTGTAGCCAATAGCTTCGATGGTACGAAGCACGGAGCATAGAAGCGCGATCAAAACATAAGTAACTGAACATAACCTACAAATCATTCGTTGTACGTAGTGATTTAACGAGTGAAAATTGGTGAAAATGTCCTTAAAAAGGAAACTGACGCAGGACGATCTGCGTAAAGCAATGAGTGAACACAAGAAGAAGTTCGGAACCATTAAAAAGATCGACTCACCGTTGGCAAAATATACAGATTCAGGACAGCTTATGTGCATTTTATGTAAGTCAGTGGTACGGAGTGAAACAATTTGGCCTGTTCATTTAAATTCCAAGGTGCACAAGGATAATGTTGCGTTAGCGAAAAAGACTAAACTAGAAACAGAAAGTACTATAAATGTATCTAATGTTCAAACATTCAAAAGGCCTCCGTCTCCATCAAACAATTCCCCAAATAAAAAGATAAAAGGAATATTGAAAAACTCTAGCCAGCCAGTGGTACAGGTCAAGTCAAATTTACCAGCAGATTTTTTTGATGATAATTCAGAGCAAGTTAACAATCCGTCTGTTCTAACGCAAAAATTAGAGAGCAAAGAGAAAGATCCCATAGTCAATACTACAGATGTACAACATGCCAAAGAAGAAGAAAAAGAGAAAGAAAAAGAAAAAGTAAAGGATATGAATCAAGCTGTTCTTCCAGAAGGATTTTTTGATGACCCAGTGATGGATGCTAAGGTTCGTAATGTTGAATACAAAGATCCTATTGAAGAAGAATGGGAGAAATTTCAAAAAGAAATTAAGGAAGAAACTGCGCAATCTGCACAAATTATAGCTGACGATCAGGAGGAAGCAACAACGGAAAGACAATTAGATGAAATTGAGGAACAAATTAGGCATTGGTCTAGGGTAATGGATCTCGCAAAACGTATGGAACAAGTGCAGGGTACCGATAGAAAACAGGAAAATATCGATAATGATGTATCAAGTGGTGACGAAGCCGAGTTCGACGAGTTTCTTGACTGGCGAGCAAAGAATTCGTATAAATGAAAGATTTTATATATCTAACAATTTTGTAA\n>XM_003538860.4 PREDICTED: Glycine max probable serine/threonine-protein kinase PIX13 (LOC100777578), mRNA 
\nCGAAAACGACCCATGTTATGTAGCTAGCACTTGTGTTGTGTCTTTTCTCATTCCTCATCCTCAACCTTACGCAGCAGCCATTCTTGTAGAATTCATTTTCTCGAAATTGGTTAATTAAGTTAATTAACACTAAACACTAAACATGGGTCTTTGCTTTGCTTCCCTCGCTACCCACCAAACACCCTCCAATAATTCCCCTCACTATTCAGGTTCAGCGCGTGAGATGGGAATTACTGAAAGCACTAGTGTTAATGGAGGAAGCAGTAGCATTAATAGCAATAACATGGTGTTTCCGAGTGTGGAAACGCGGAACTTGAAGCAGTTCAATTTCGCGGATCTGAAAGCAGCAACCAAGAGTTTCAAGTCGGATGCATTGCTTGGTGAAGGAGGTTTTGGCAAAGTTTACAAAGGATGGTTGCATGAGAAGACACTGACACCCACCAAAGCTGGATCTGGAATGGTGGTTGCTGTTAAGAAGTTGAACTCAGAAAGTTTGCAGGGCTTTCGTGAGTGGCAGTCAGAAATCAATTTCTTAGGAAGGATTTCTCACCCAAACCTGGTCAAGCTATTGGGTTACTGTTGTGACGATATCGAATTTCTCCTTGTGTACGAGTTCATGCCAAAGGGAAGCTTGGAGAATCATCTCTTTAGAAGAAATACTAACAGTGAACCACTCTCTTGGGACACCCGAATCAAAATAGCTATTGGTGCTGCACGGGGCTTGGCTTTCTTACACACCTCAGAAAAGCAAATCATATACAGAGATTTCAAAGCCTCCAATATACTACTTGATGAGGATTATAATGCAAAAATTTCAGATTTTGGCTTGGCAAAATTAGGCCCTTCTGGGGAAGATTCACACGTGAGTACCAGGATCATGGGAACATATGGCTATGCTGCTCCAGAATACATTGCAACAGGTCACCTTTATGTAAAGAGTGATGTTTATGGTTTTGGTGTAGTGCTGCTTGAAATGCTGACAGGGTTAAGGGCACTTGACAAAAACCGCCCCATAGAGCAGCAGAATCTGATTGAATGGGCTAAGCCTTCTCTCTCTGATAAAAGAAAGTTGAAAAGCATCATGGATGAGAGGATAGAGGGTCAGTATTCAACCAAGGCAGCATTAAAATCAGCACATCTTATTCTAAAATGCCTTCAATGTGACCGTAAGAAACGTCCTCACATGAAAGATGTTCTTGACACATTGGAACACATCGAAGCTATCAAGGACAGAACGAAGTAATCCAAGAAACATTGTACTAAGTTTGCAACTATGTGCAATTTCCAATAGCCAATTTATCATCCTTATGTGTTGAATATGACAAGGAGCTCCAACATGTGTAGGCTGTAGCTAGCATACTAGTCACAGTTCAAGTTCAGTGTAACTACTAACTAACTTGGCTTACAGTTATTATAGGTAGTTAGACCTGTTACTGCATGAGTGTGTTTGTGGCTGTATTTGAGTAGTCGTACCTCTCTCATTCTAGCTTTGTTCCCTTGTCAATAAAAATGTGTAGCTCCTACTTGTATCATCATCTTTTCATTTAATTCAATAAAATGAGTTACTTGAA\n>XM_039254146.1 PREDICTED: Hyaena hyaena mitogen-activated protein kinase 15 (MAPK15), transcript variant X3, mRNA 
\nGTGCTGCGGGCGTCTGGAGGCCCCCGGGCGCCCACTCGCCGGCATGTGCGCTGCAGACGTGGACCATCACGTAGCCCAGCGATACTTGCTCAAGCGGCGGCTGGGGAAGGGGGCCTACGGCATTGTGTGGAAGGCAGTGGATAGGAGGACCGGCGAGGTCGTGGCCATCAAGAAAATCTTCGATGCCTTTAGGGATAAGACGGACGCCCAGAGAACCTTCCGGGAGATCATGTTGCTCCAGGAACTTGGGGACCATCCCAACATCATCCGCCTCCTGGAGGTGATCCGGGCGGAGAACGACAGGGACATTTACCTGGTGTTTGAGTCTATGGACACTGACCTGAACGCCGTCATCCGTAAGGGCAGGCTGCTGAAGGACATCCACAAGCGCTTCATCATCTACCAGCTCCTGCGGGCCACCAAGTTCATCCACTCGGGAGGCGTCATCCATCGGGACCAGAAGCCGTCCAACATTCTCCTGGATGCCAGCTGCTTGGTGAAGCTCTGTGACTTTGGTCTCGCCCGCTCCCTCGGCGGCATCCCTGAGGGGCCTGAGGGCCCGGCCCTGACAGATTACGTGGCCACACGCTGGTACCGGGCTCCAGAGGTGCTGCTGTCCTCGAGCTGGTACACCCCTGGGGTGGACATGTGGAGTCTGGGCTGCGTCCTGGGGGAAATGCTTCGGGGGAGGCCCCTGTTCCCGGGCACATCCACACTGCACCAGCTGGAGCTGATCCTGGACACCATCCCGCCTCCATCCAAGGAGGACCTCCTGGCTCTTGGCTCAAGCTACAGCGCCTCAGTCCTGCCCCGCCCGGGGCCCCGGCCACGGCAGACGCTGGACGCCCTCCTGCCGCCAGACACCCCCCCGGAGGCCCTGGATCTCCTCAAGGGACTCCTGGTATTTGCCCCGGACAAGCGGCTTAGCGCCGCGCAGGCGCTGCAGCACCCCTACGTGCAGAGGTTCCACTGCCCCGCCCGCGAGTGGACAATGGATTCGGCCGTGCGGATCCCGGTGCTGGAAGGAGCTCAGCTCTCAGCCCCTGAGTACCGCAGCCGCGTCTATCAGGTGAAGTCCAGCGTGAAGGGGGCGGCGCCCTCCCTGGCCTCGCAGGCTGCCGCCCTGGGGGCCGTCCAGGCCCTGATCCGGAGCGACTGGAACCCGGGCCGTGGGGCGACGGCGGCCGGAACGCGACAGGTCCCTCGCGGGCTTCCGGCGGATGCCCGGCCCGAGCCCCGGCCCGGCCGGCGGATGTTCGGCGCCCCGGCCTGGCAGGGGGCCCAGGGCGCCGCGAGGGCCGCGCTGGGGGGCTATTCTCAAGCTTACGGAACCATCTGCCATTCGGCGCTCGGCCGCCTGCCCCTGCTCCCCGGGCCCCGCGCGTGAGCCGCCCGCCAGCCTCCAGTCCGGCTCCTGTACTCAGCCCGCGCCCCTCGCCCAGCTCTGGATTC\n>XM_016250992.1 PREDICTED: Sinocyclocheilus grahami solute carrier family 7 member 2 (slc7a2), transcript variant X3, mRNA 
\nGGTTGAATAGGAAAATTAGCATTGCCTCCCTCTGTGTGAAGTGTCTCTCCTCCTCTTTGGCCAGACCAGCCCTCCTCGTGGGGGGCAGGGCAAGTTAAAGCAAACCAGAACAGAGTAAAGTAGGCAGTAAAACTAATGCGGTTGTGGGCTGACATGTCATTTGAGCTTGAGGAAGGAAGGGGCAAACTTTGGAAGGACTGAGCCTGTGAGCTTTTTAAAGAAATCAGTGGAGATCCCTGAGAGGTGTGTGTGTGTGTGTGTGTGTGTTTGCATGAAACCGTAAGACATTACGTCCATAAGGCAATTCTACAGCTGCCAGTCTCTCATCAGGTGTTTGTGGTAACAGGAAGAATGCTGGAACATTGCCTCGCATTTGGTCGCTCCCTTGTGAGGAGGAAGAATGTGGACCAGGACTGTCTGGAAGAGTCCAAGCTGTGCCGCTGCCTCTCCACTGTTGATCTGATTGCCCTCGGGGTGGGAAGTACACTTGGGGCTGGTGTCTATGTGCTCGCTGGGGAGGTGGCCAAAGGCAGTTCTGGCCCCAGCATTGTGGTGTCCTTCCTCATCGCTGCTCTGGCATCTGTGATGGCTGGCCTGTGTTATGCCGAGTTTGGTGCACGGGTACCCAAGACGGGCTCAGCCTATCTGTACAGCTATGTGACCGTGGGGGAGCTCTGGGCCTTCATCACAGGGTGGAACCTAATTCTGTCATACGTCATAGGGACGTCTAGTGTGGCGCGTGCCTGGAGTGGGACGTTTGATGAGCTTATAGGGGGCCACATTGAAAAGTTCTGCAAAATGTACTTCAAAATGAGTTTGCCTGGCCTAGCAGAGTACCCTGATTTTTTTGCTGTCTGCCTGATCTTACTACTGGCAGGCCTTCTCTCCTTTGGGGTGAAAGAATCAGCTTGGGTCAACAAAATCTTCACAGCTGTAAACGTGCTTGTGCTGATGTTTGTTATCATCTCTGGGTTCGTCAAAGGAGACTCGCTCAATTGGAATATATCTGAGGAATCTCTCATAAACGTTACCATTTGCAAAAGGAATCTCTCACACACTGCTAATGTCACTAGTGATTACGGAGCAGGGGGATTTTTGCCTTATGGCTTTAGTGGGACACTGGCTGGTGCCGCCACCTGCTTTTATGCCTTTGTGGGATTTGACTGCATTGCAACCACAGGTGAGGAGGTGAAAAATCCCCAGAGGGCCATTCCCATTGGGATAGTTATTTCCCTGCTGGTCTGCTTTCTCGCCTACTTTGGTGTTTCAGCGGCCCTCACCCTCATGATGCCCTACTACCTGCTGGATGAGAGGAGTCCCCTGCCTTTGGCTTTTGAATATGTGGGCTGGGGGCCTGCGAAATATGTTGTAGCAGCAGGATCGCTCTGTGCTTTATCAACCAGCCTGTTGGGTTCTATGTTCCCTCTTCCACGCATTCTGTTTGCCATGGCACGAGATGGCGTGCTATTCAGATTTCTTTCCAAAGTGAGTAAGCGTCAGTCGCCAGTGGCTGCCACTATGGCAGCGGGCACTACTGCGGCTATCATGGCTTTCCTGTTTGACTTGAAAGCGCTGGTGGACATGATGTCTATTGGAACCTTGCTGGCATACTCTTTGGTGGCTGCTTGTGTTCTAATCCTTAGGTATCAGCCGGATGCTGCGTTTGAGAGGTCTAGGATCAATGAAGGCAAGGAAGAGGTTGGTGAGTCTGAACTGACGGAGTCTGAGTCTCACCTGAACATGCTGAAGGATGGAAGAGTAACCCTGCGCTCTCTGCTCAACCCTCCACTGCTGCCCACTGAACAGACCTCCACTGCCGTCAACATGTCTGTTATAATCATGGTGTTTGCTGTGTGTGTTATTGGCGCACTCAACACATATTACGGACAGGCCATTATTGCTATGGAGCCTTGGGCCCTGGGGGTCTTAGGTGCATCTTTGTTCATCTTCATCATGTGCATCCTTCTGGTTTGCAGACAACCTCAGACGAGGAAGAAA
GTTTCCTTCATGGTTCCTCTGTTGCCCTTTCTACCCATCTTGAGTATATTTGTCAACGTGTATCTCATGGTTCAGCTCAGCGGCGACACGTGGATCCGTTTCTCCATCTGGATGGCTATAGGATTCTTCATCTATTTTGGATATGGAATGTGGCATAGTGATGAACGTAAGAGACATCTACAGAACTGTGGTGTTGCGATGGAGAAAAAGACACTGACAGGAAATGAAGGCACTGTGGAATATGTGACGCACATAGAGAAGACTAGCCCATGTTAAAGAACAGCAGATAAAACTA\n>CU677742.1 Synthetic construct Homo sapiens gateway clone IMAGE:100017471 3' read PBXIP1 mRNA \nGTACAAGAAAGTTGGGCAGCCCCGGTGGTGGTGGTGGTGGCTATGGCTGTGCCCCTCCCTGGGCCCCGCAGCTCTTGGGCTCTGTGAGTGCTTGTCCTTCTTCCCTGACCTCTTCTTCAGTGCTTTGTCTCCAAAGAAGTGGCTGAAGATGAAGTCCTCAAAGTCATCTACTTCATCATCATCACCTGTCTGTTGCACAGCCACCTCCTCCAAGCTGTCCTCCAGGGCATCCACAAAATCCCGGAAGCGGAGGCGGTCATGACGGAAGATGCCATCCTCACCAAAGAAAGCAGGTGAGAGGGGTAGCTCCTTGGTCAGCTGCCCAGCCCAGGGCAGCCGTGCCAAGTATGTTCTTAGCAGAGAGGCCAGCTCCTGTTGCCGCACTGGGGCTAGCTCTGTGCCAAAGAAAGTCAGGCCCTCCTGCCGGGCACACTCGTCCACACCTGAGCAGCCCTGGGGTGCCCGGTACTTGGGCCTCAACAGCTCTGCCCAGGATGGCAGGGGGTCATGGCTGTCCTTAGTCCCTTCCCTCCACCGAGGTTGCTTCTGCTTTTCTCCAGAGGAGTGGAAGCTACCACTTTTTCCTTGGGGGGTCCCTTCGGGCCCTGTCGCTTGCCCTCTTTCTTGCTCCCCCGACTCCTCCACCCTTGGCCTGCCCCTCCTTCCACCTTCCTGCTGGCCTCCTGTCCTTCTGGACCTCCCCCAGTCTTCTTTCTTTTCCCGGCCAAATTCTTCTTTTTTATGTTTCCGGTTTTAACCTTTCGGGTTTTTTGGCCCTCCCCCCATTTTTCTTTCCCCTCCCTCCCTAAAATTCGGAAGGGGAATTTTGGGGCCAGCCTTTAGGGTTTTGGAAAAAACCCGGGGTCTCGGCCCCGTTTCCCCGAGCCTGAATTATTGGGGCAAATTTGGGGCCCACTCTACACACCCAAAAAAAATGGGGCCCCCGGGGGGGATCTCGAAATCCCTTCCAAAATCTGGTGAAAACCCACGGCGGCTGCGGCCCTTTAATATTTGCATAAAGCGGGGCCCACCCACCAGGGTTCTTCTCTTTAGAAAGGAATG\n>XR_001314002.1 PREDICTED: Thamnophis sirtalis uncharacterized LOC106555578 (LOC106555578), ncRNA \nGGACCTGCTGGGGGAGAAGGAGAATCTGGACAAAGAGGCGACCTTGGTGAAGCAGGTTTGCCAGGCCCTAAAGGATCTGATGGCAATCTTGGTGAACCTGGCTCACGTGGGCCCGAGGGAATCCGTGGCATGCCTGGCATAGAAGGATTCCGTGGGCCTCCTGGCCCCCGTGGTTTGCAAGGGGAAC\n>XM_050835981.1 PREDICTED: Eriocheir sinensis PEST proteolytic signal-containing nuclear protein-like (LOC126983306), transcript variant X5, mRNA 
\nGCCCCCTGGGTCCCCATGGAGACGTCACTGGAGGACCAGAGGCTGCCTGCCCCCAAGCGGCCAGTGGAGGAGGAGGGGGAAGGGGAGGGGGAGGAGGAGCCTAAGAAAAAGATTAGTTTTGGGCTGAGCAGCAAACCTCAGGGCAAAAGTGGCCTCCCTGTCAAGAAGCCAATTGGTGGCATCTCCATCAAGCTGGGCCAGTCACAGGCAGCTGCACAGGCAGCTGGTGGTGCCTCCATCCTGAAGCCCAAGGTGGGTGCAGCAGCAGCAGTGTTCAGCACTGGAGATGAGGACGATGAAGATGAAGAAGAGGAGATGCCACCTGAGGCAAAGATGAGGATGAAGAACATTGGGAGGGACACCCCAACCTCAGCTGGCCCTAACAGTTTTGGCAAGACTAGGATGGGCTTCTGTGACTCAAAAAAGATCTACGAAAAGCAACTTAAGGAGGTGCAGGACAAAACTAACAAAGTAGTGCCAGACAGCGTGTAGGCAAGGTGACAGCCACTGCTGGCTGAAGCCCTGCACCTCACTTGGCCTGTAGCAGGGCAGGAGTGTGCCTGGCCTAGGCTGGCCTGTGCTAGGCTGGAGACTTGTTGGTTATTTGGACATCCCTCCTTTAGGCCTTAAGGTGTAGTAGTGCAGCCTGTCATCATCAGTTGTGTGTATAAATTGTAGCATAAAGCTCCAGGCTCGGGGTTGTAGCTGACTCACAGCACTGGTTGACATCTCGGGGGTTTGAGTGTGTGTGTGTGTGTGTAAACATTTGCTTGTATGTGTGTGTGGTGCATGCATGGTGGTTTTGGCTCTGCACCGGGAGAGTTTGGTTGTGTTAGAATGGGCTGTGTTTGCCAAGCAAGGAGTAGTGCTTTCCTCAGACAGGGACACACTGGTGTGGCCAGCAGTGTAGTGCTCCCCTCACTACTATGTACTGAGGCAGGACACACGGGAAACACCGGTGTTTATTTCAGCTTCTCGCAAGTACTGTGGTGTGCATAGAGTATTTCAGTTTCAACTGTTTCAGGCATGTACTTCATATTTCTTTGAGCGAACTTGTGGATGTTACTGACAGGGATTAACTCTATTAAACTCGACCATAGGCAGTGGTATGTGTCTAGAAGGAGTGAGGGATTGCCGACTTTTATAATTTGCCTGTGTACTTCAGGACATATACCAGTGATTAGGATTCAGGTTTTAGATTTTATCATGCATGCAAGCCAAGGAAAACTTGAGACTACATCTTCAACATCTTATAAAGGAGTATTGTGTCGACCTGTATGGATACTTTAGAAGCAGAGCAACGAGTAAGTGAAGATTTCAGCAGTTTATGTGATGAATGACTTTTATCATTATTACTATTCTGTGTGATAGTGCAGTTTGTGTATCTAACAACCTCATCCTACTGAGGGTCTCTGCGTACCCTCAGCAGCTGCATCACTGCAGAATTTATTGCCTGTCAGTCATTCCCTTGCCGTAGCGAAGGATGATGGCTGACTGGCTTGCCATCCATCTGGGGGCAGCATGGCTGAGTAATACATAGCATTTGTCTGCTTCATTTAGAAATTCTGTATAATGTTCTACATAGATGCATTTTCTGCTATCACCCAGAATGAGCCATTGTGACATTGATATCGAAACTGTAATATGTGTATAAAATATGTAGGGTGTTCTTAAGACTTTTGCACTCACAATGCATTTGGCTATGTTTATAACTACACATTTTGAGGATGTCCAGCTATAGACACAAACATGAGGCATCCACAGGAATCCTTGTAGGTGTGAATGATGTCTTGATTAAGGGAAGGCCAGAAAGGTAAGGTTCAAAAGTTATATTACAATTCATTACAGTAACATCAAAAAATATAAATACAGATTAGTCCTTGACTATACATCTGTCTAGTTTGGCAGTAAAGAAAAAGGCATTGGAAGCAGAGGACATCAACAACCCTCATACGGTATCAATCTTCAGTATTGTTTAAAATTGTAATACAAACATTA
ATTCCTCTTGCCTACTTTGTGGGTGCCTCATTGCTGGTTACAAGTAATCCTTCAGAGGTCTCATTTAATCCCTCAAAGGTGCCCTCCCAGCCAGTGTTTGCCGGCAGCACACAGAGCAGGGTGGCGGACACTTGGCCCCTCTTGGTGTTGCTGGCACTTGTAAATGTCCCAGCAGCAGTATTTCTAAATTGTTTGGGTTTGTTGTGTTGTAGCTGAAGTGTCCTCTGTTGGATGATACCACATATTCTTGCCATTCAGTTTTGTTTGTCTCTGCTATATGTGGCTGTTATTCATTTTATTTAGTCTGTCTGTGTAATTTAATTTGAAGTATGTGTGGTTGAGAGGTCATTCTACAATGTATCCATTTGTAATTTGTCATTCATCTCTACGGTCTGATGGATGGTTTTACGACTGTACAGAACCATGCAGTATTTCAAGGTTTCTTTCTGTTCAGTATTTGCCATTACTGTTGATTGTTTCTATTTGACCAAATCTGAAGTGGAAGTGGTGTACAAGATTTTAATTGACATACAGGTTGTCCACTTTCTTGAGCAAGTTGCATTTGTTCAGGACACCACCTGAGCTTTTTGTGTATTTTTACCTGAATGTTATTTAAGGGAAGTTACTCTCTGTATTCCTGGTGTTTCGGCTTCTTTGCCAACATCCACAGTCCATTCCTCTCAAGGTGACTTTGAATGTTTATCCTTATTGTTCTCATTAAGATTCACTAAACTGCCAGATGTAGGCTATCTGAGGCATCTGCTAAGTCCATGTATCATTATTACAAACTAACAGGGAGCATACGCCAGGGGGTGCATTTGCTTCACCCCGGCGGTCCCTCTGAGTGAACCCTCATGCAGTTACCTTTCCCATTCTAAGCCACTCCTGGCAGGATTGATCAAATTGCCCCACCCATGAGTTATGAGGATATAGGTTTTTTTTTATATAAAAGTTTGGTGTTCATTCAGAACAACATTGTTGTTCAGTTTTCTTCTGTCATAGCACTAGTGTTAATAATTGTGCCCATATTTTCTGTATTTTCTTATGGCTGTTCTGCTGTACCATTCCATGAAAGACAGCAGCTGCCAAGGAACAAGAGACTACCAAACAAATGAGCTGCACTAGATCACAGTAACAGCAGCACAGAGTAGCTGGCCAATGCAGGGTGCACCATCGCAGCTTCGCCAGGACCCCTTGGGGTCTTCATGACTCAGGTGACGGAAGCAGTGCATCCTGCCTGTGCTGCCCTGCGTCTTGTGTCCTGTGGTCTATACTCCAAACAACAACGTTCAGTCACTTGCGATGCCATACCAAACCTCTTCTTTCAACAAATAAAATTTCCCAAGATTTGTTAAAA\n>KP395388.1 Uncultured bacterium clone MISEQ01_89_000000000-A647M_1_1111_13864_15148 16S ribosomal RNA gene, partial sequence \nAAGGAATATTGGTCAATGGACGCAAGTCTGAACCAGCCATGCCGCGTGAAGGATGAAGGTCCTCTGGATTGTAAACTTCTTTTATCTTGGACGAAAACGGGATTTTTATCTCAATTGACGGTACCAGAGGAATAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAAGACAGAGGGTGCAAACGTTGTTCGGAATTACTGGGCGTAAAGCGCGTGTAGGCGGTCGTGCAAGTCGGGTGTGAAAGCCCAGGGCTCAACCCTGGAAGTGCATTCGATACTGCATGGCTAGAGTCCCGGAGAGGATGGTGGAACTCTAGGTGTAGAGGTGAAATTCGTAGATATCGAGAAGAACACCGGTGGCGAAGGCGGCCATCTGGACGGTGACTGACGCTGAGACGCGAAAGCGTGGGGAGCAAACA\n>XM_013051197.2 PREDICTED: Mustela putorius furo actin binding LIM protein family member 3 
(ABLIM3), transcript variant X7, mRNA \nGTGGCGGCAGCGAGCGGCCGCGCCCCCCGCGCTGCCACCCCGCGAGCCCGCATCATGGATGTCGAGCTCTCCTATTTCGCTTTGCTCGCCTTGGAATTCGAGACTCCAGACGAGGACCAGGATTCATGAGCCGGTCGCAGGGGCCCAGGCAGGGGCCTCTGGCTCCCGACGCCGGCCGAAAGGTGATGAGTGAGGTCGGAAGATCGCAAGATTTAAAAAGCAACCGGGTCCTCCGTATCGAATGAAAGACCCAGTGCAAAGGCATCACCATGAACACGAGCATTCCTTATCAACAGAATCCTTACAATCCCCGAGGCAGCTCCAATGTCATCCAGTGCTACCGCTGTGGAGACACCTGCAAAGGAGAAGTGGTCCGTGTCCACAACAACCACTTTCACATCAGATGCTTCACCTGCCAAGTATGTGGCTGCGGCCTGGCCCAGTCGGGCTTCTTCTTCAAGAACCAGGAGTACATCTGCACCCAGGACTACCAGCAGCTCTACGGCACCCGCTGCGACAGCTGTAGGGACTTCATCACCGGCGAGGTCATCTCCGCCCTGGGCCGCACCTACCATCCCAAGTGCTTCGTGTGCAGCTTGTGCAGGAAGCCTTTCCCCATTGGAGACAAGGTGACCTTCAGCGGGAAGGAATGCGTGTGTCAAACATGCTCCCAGTCCATGACCAGCAGTAAGCCCATCAAGATCCGTGGACCAAGCCACTGCGCTGGGTGCAAAGAGGAGATCAAGCATGGCCAGTCACTCCTGGCGCTGGACAAGCAATGGCACGTCAGCTGCTTCAAGTGCCAGACCTGCGGCGTGATCCTTACCGGGGAGTACATCAGCAAGGATGGCGTTCCGTACTGCGAGTCCGACTACCATTCCCAGTTTGGCATCAAATGCGAGACTTGTGACCGGTACATCAGCGGCAGGGTCTTGGAGGCAGGAGGGAAGCACTACCACCCTACGTGTGCCCGGTGTGTCCGCTGCCACCAGATGTTCACGGAAGGCGAGGAGATGTACCTCACAGGTTCTGAGGTTTGGCACCCCATCTGCAAACAGGCAGCCCGGGCAGAGAAGAAGTTAAAGCATAGGCGGACGTCCGAAACTTCCATCTCACCCCCCGGATCCAGCATTGGGTCACCCAACCGAGTCATCTGCGACATCTACGAGAACCTGGACCTCCGACAGAGAAGGGCCTCCAGCCCAGGATACATCGACTCTCCCACCTACAGCCGGCAGGGCATGTCCCCCACCTTTTCCCGCTCGCCTCACCACTACTACCGCTCCGGTGATCTGTCAATAGCAACCAAGAGCAAAACGAGTGAAGACGTCAGCCAGGCCTCCAAGTACAGTCCAGCCTACTCCCCGGACCCCTACTATGCTGCAGAGTCCGAGTACTGGACCTACCATGGGTCCCCCAAAGCGGCCCGAGCCAGAAGGTTCTCATCTGGAGGAGAGGAGGAGGACTTTGACCGCAGCATGCACAAGCTCCAGAGCGGAATCGGCCGCCTCATTCTGAAGGAGGAAATGAAGGCCCGGTCCAGCTCCTACGCGGATCCCTGGACCCCACCCCGGAGCTCCACCAGCAGCCGGGAGGCCCTGCACACGGCTGGCTATGAGATGTCCCTCAATGGCTCCCCTCGATCCCACTACCTTGCTGACAGCGACCCCCTCATCTCCAAATCCGCCTCCCTGCCTGCCTACCGAAGGAACGGGCTGCACAGGACACCCAGCGCAGACCTCTTCCATTATGACAGCATGAACGCCGTCAACTGGGGCATGCGAGAGTACAAGATCTACCCTTATGAACTGCTGCTGGTGACCACGAGAGGAAGAAATCGGCTGCCCAAGGATGTGGACCGGACGCGTTTAGAGCGCCACCTGTCGCAGGAGGAGTTCTACCAGGTCTTCGGCATGACCATCTCGGAGTTTGACCGGCTGGCCCTCTGGAAGAGGAATGA
ACTGAAGAAGCAAGCCCGGCTGTTCTAGGCAGAGGCTCTATAAATATATATGCATTTATATAAAGATACATGTAAAATCTCTATACTGAAGCTCGGTATAATCCTCTCTTGTGTAATGGGACACACTGCCAGCCATGAGACTTGCTTTTCTGTACTGTCAGGCAAGCCCACGTCATCGAGATATTTTTATGCTCCTTACTTTCTCTTTTCTAAGTGCTCTGGGGTTCGGGAAGGGATTTGAGGAGACTCCCATCCTTTTACTGGGGATCCTTTTTATACTGAAACATCTGTCCTAACCTGAGTCCCCCAAGGTCCAACTCTCTTTCCTAAAGGAGGTGCCTGAAGAAGTCTCTCTTCTCTCTGCTTCTCGGCTCTCTCCCCAGTCTCCAGGGTGGATGCTGACCAGGCAGTTTCCACACCTTACTGGCCCCAGAGGGGCCCTCCCACGGGAAGATCCACAGTGATCTCCCAAAGTCACCGAGCACCATGGAGAGCCCGTGAAGAATTCTCCCATCTCCCCCATTTAGGAGTTCGGTGCCCTCTGGGGGTGATGCCCTTAGCTGTGTGGGCCTTGGATCTACTCACTACAGCAGCAAATGAAGTGGTTCGGGCCTGGGCCTCTCTGCAGCTTCTCAGTCCTCCTCCTCCTGCCCTTGGCCCTAACTTCAACCCAAGTCACATGGTAGGAGGAGAAAAGTCATTTCCCTTCCCTCCAACACCTCCAACTGGTCCCTTTGCCTGGCCCCGATGTGGAGATGAGAGGGAAAGCGTGGGAGCCGGCCACAGGAGCCGGAGCAGGGCACCTGTTGGAACTGGAGCTGCAGGACCTTTTGCAACCCTCCTCTCACCCTCACTGCCCCCAGCACCTCCTAACCCTTCCCCCCTTCAGAGGAGAGGCCCATTATTACGCCTTACTACGATCTATGTGCCTGACAACTCAACACACCACAGGGCTAACTTTCCCATCACAGTTCCAACAGAACAGCTAGACAACCTCTAACTCCCCTCCAAACATAATACAGGCCATGTCCCAAAGAAAGCCGCCTGGTCTACATCTGCAGGCCCCTGGGCTAGAAGGGCAACCGAAGCTGTCCCTCACCAGTCAGTCATTGGCTCCCACTGCAAAGTTGGCCATGTTTCCTAGGGGAAGCCTTTGGAAGAATGGCTGCTTATGGAATTCCAAAATGAAGCATTTGCCAACAGTGCGCATGACCACCCTGGATTTCCCCAGCGGCTGCCTTTCCTGCCCTCTGGCCTTCTTGAACAGCGATGAAAGCTTGACTTTAACTTCTCTCCTCCCTTCCCCCAAACCTTTGAACCCCGGCCCCCAGTTGGCTATGTGTGGTGGGGTCTGTTCCTCCCTGGAGATGCCTTGATGTAGATCATGTTGAGGTCACGGAGGGAAGACGAAGAAGTGGAAATAACCATTATGACTCTCAAGAGGCTGGTGTCGTGACCTGGCAAATAGAGAACTGACTCCAATCCAGCGAACCCTCACTGAGCCCCTGCTAACGCTGAGCACCTGCTGTATCCTGAGCACCGAGGGGGGAGGGAGGTGGGGACACTGAGATGATCAGCACGGGATCTGGACTGGGGGGCACGCCTGCTAGCACTGGGTGTCGTCGGACATGGACTCGCATGTGATGGACGTAAGGCAGGAAGTGATGGAGATGGCATGAGAACGTGTTTGTGGGATTACCGAGAGGGCAGATGCAAGTTGGTGCAGACCAAGGAACTTTCTGGAAGAGATTGCATTTGAGCGACATTCAGGAAGGATCTCTGTAAACTGAGAGGAGACTGTAACTTGAAAGGGTGACAGGGTGAGGGGTCAGAAGGGGGTCTAATATTCTCTCACTTAAAACATCAACCCTCTCTGCAACTCTCCTTTTGGCCAGTGTCTTTCAACTGTCCTGACCCTTTAGAAATGTCCCCAGCCAGACGCAATCATTGAAACTGCCTCATTATCACCGGTTGAGAACTTGGCAAGATGAAGGGCTTTT
GTTATTGTTGTTGGGTATTTTTGTTTCCCATAAAAGCACATAATTCCAACCCA\n>XM_039549112.1 PREDICTED: Corvus cornix cornix chromosome 2 C8orf34 homolog (C2H8orf34), transcript variant X3, mRNA \nTCAACGGGCGCCGGCGGCCGTGGAGCTGACAGGAGCCCGCGGCTATCGGCCTCGGCAGCGGCGCTGTGGCGAGCACGGCAGCGCCCGTCACCACGGCGCTGCTTGGCACAGAAACACAGACAGAGACGGACTGACAGACACACGCAGCGCGGAGCGGCGCGGGCTCGGGGGCCGCCTTTGCAGCTCCTCTCCTCCCTGCACCATGCTCCGCTCTAGGCAGCGCCCGCCCGCTGCTCCCTAAGGGCAGCCAGCCCCGCGCCCAGCTAAGCGGGCGACTGGCACCCGGCTCTCTCCCCCCCGCCCCCAGTTACCTGAGTTAGCTCCGTCCCGGGGACTTTCGCAGCGCCTCCGCCCTCTCCCGCTGTGGCAGCCCTTGTGCGGCGGGGGAGTGAGCCGCCCGCAGCCGGAGGGACTGCAGCCGCCGCCGGGGGAGACGAGCTCAAGCCCCCGCCCCCGGAGCTCTTCATGGCGTCTCATCAGCAGACAAGGATCCAAGCCTACCTGGAGAAGAATAAGATCGGTCCCCTCTTCGAGGAGTTGATGACCAAGCTGATAACAGAGACACCTGACCAGCCAATCCCATTTCTAATTGATCATCTTCAGTCCAAGCAGGGGAACCGCAGTCAGCTTCAGAGAACATTGTCTGGCTCTGCTGCCCTGTGGGCAGAGAGTGAAACATCAGAAAATAAAGGAACAAGAAGAGATTTTAGAAGTTATGATAAGCCTTGGCAGGTAAATGCAAAAAAGCCTAAAAAGTCAAAGAGCGACCTTGCTGTGTCCAACATTTCTCCACCATCACCGGAGTCCAAGTCATTGCCAAGGTCAATAGAGCATCCTAAATGGGATTGGAAGACAAAACCGGAGAACCATGATTTTGATGAACTAAATCATATTCTTCAAGAGAGCAAAAAGCTTGGAAAAGCCCTTGAGAATCTGTCTCGCAGCATTGCTATTTCTGATGAACTTGATAAGGACACAGCAGGTTTCAACACCCCCCTTCTCAGACCTCGTGTGATTGGAGAATGGATTGGCCGTGAAGAGAATGATGCAGATCCTCTGGCTGCTGAGATGTTGCAGCCACCAATACCAAGAAATAAAAATGAGCAGTGGGACAGTGAGGATAGCAGCAGTCCTGGAGGAAGCTTAAAAATGGAGCCAAAGACCAAAGGATTAAAACATCAACAGCAGCAACATAAGAAACTGCTGGCTGCCATGCTTTCTCAGGACTCCTTTGATTCTGCTCAAAGCACAGCTCCATCTGTAACCGAAGAAGACATTGACAATGAAGATGATGCAATGGAACTACTGGAGGATCTTGATGATCTCAGAATGGAAGGAGTAACAAGTGTGGTATCCTCTGGGAGCAAATTCAATCAAACTCGAAGTGCTCATATGGCTGAGCCTCAAGCAAAGGTCACATTGAATATATGTGCAAGATGTGCCAGATTGCAAGGGGATAATTTGGCAGAAAGGCCAGAAGATGTCTCCATGGTATCTCAGACATCTGAGCCAGCAGTGTCAGACTCTGATGCTCAAGTACCTGGGGTTGAAACACTCACAGAAGATATTGATGAATTTCAGAGTGCCTCTCAAGTGGCAGCATCTTCTCAGACAGTTTGGACCTTGGATGCCATGACTGTCAGACCTGGAGGTTCCCCAAGGCAGAAACTCCTAAAGGACTCCTTAGCAGCAAAAGAACTTCAGACCATGGAAAAACACCTAGCTGACATTGAGAAGGACCTCGCACTGTGGGAAGAAGCAAGGCTTTCAAGAAGCCCTGGTGTCCAGCATCCCAGTGTGGTTACCTCTGACCATCCAGGCACTC
TTCAGGCTGCGCAGGGCCAAACCCCCAGGCCTCAGGTGCCAACTCCGATGGGGAAGAACATTCAGCTCCAAGGAAGCAAATCACCACCGCTGCCCACTAACAGCAGAACACAGGTCTCCAGTGTCACAAGCAGTAGACCTTCAACGCCTGCTGCACAAACCAACAGGCCATCAACTCCAGGGAGCAGACCTATGACCCCAAATAGCTTGTTGTCACGGCCTCTTACCCCTAGCAACCAAGGAAATAGGGAAGGCATTATTAGTATTCAAAGAAGCAGATCTTTGTCATCTAAGAGCCAAATGGGGAGGACCCTCAGTGCCGCTTCAGGGCTTTCTGTGCAAGATGAATTCTTACAACAGTTTCAACTTGCTCATCAACCTTGGATATTGCCAAGTGACACAGAAAGTGAAGGAGTGGAAGCTGACCAAGACAAATGTAAGTATATATGTAAGGACCAGATAATACATCAAAAACCGTCAACTTAACTTCTATTTTCCATATATTCAAATACTGTGGAGATGTCATGCCTGCTCACAGGAGCTTTTCTCACAAGTACCAATTACTTATTTGTCTGAGGGCTAGACCTTACAGGATTGATTTGCAGAAGCTTTCCTGCAGTCACTGAGCAATGACAAAATGATCACAGACCACACTTTACTTAATCTAAGTGAAACAATTTGTCCTGATGTGTTAAAGTAGCTATTCCAGAGAAGTAACCTGAACTTGAAATAGGCAGTCTGTTTAATAAATCTGTATTCACCAGCAAAAAAAAAAACAAACCCTAAAAAACTTCAGATCTGAAAAGCAGAGCCTCCCTTCTTAGGCCTGTCACTCTATTGTCTCTGTTTTGCTTGCATTCTTTTTAATTCATCTGTATTAATAAAAAAGTTCTTAATCATACAAGTAATCCTTAATATCCTACACTCTTTGAAGTATTTTTGTAATCATGGAAGTGAAGGTCAGCAGGATCAGAGCCTAAATGACAGAACAAGTAACTACAAGTAACAGGCTATAAATTGCAGTTCTTTCAAACTGTAGCAAGTTCCCCCTGCCTACAACATACCTGTAAATGATCTTACTGTTTCACATTTTCTTTAATTCACAGTAATTTTGTGATCTGCAAGGGTGAATATGCAAACTGTTTCCTAACAGATTTTAGGTGATACACTTGAAAAGAACAGATTATTTAATCAGCATGTTTAGAAAATTCAGTACTGGTTTAAACATGAAGAGTTAACATATGAAAAACACATTTTCTTTACAGAAGGGAACAATTCTATAAGGGATTAAGGATTCATAATAAACATGCCAGATAAACAGAATGTATTTTTACATTATGCTAGTTAAAAGAATTGTTTTCTACTCATACATCAGTTTCACAAATTCATACATAGCCCAGAGTTTGACTGAAATTTAAATTTATGCAGTGAGGTTCTGAAGAGCATGTGCCAGGTCTTTTTGAGCACTAGTAAAATGTTAAAATGAGATTGTGTGCATCCAGCTGATTTTAGTCCAAAGCCAGTAATATGACTTCCACCAGAGCCTTTCAGTTATCTTTGGACTGAAGCTCCCCTTAGGAGGCTCAAGAGATACCCTGTCACCTGCCTTTTATGTGCATGCAATTTTTCCTCTGTATTTTCTGTAATGAATTTACAGTCCTACAAACATTGGTTGGATTGGCTGTGCACACACAGACTGATGCCAATTATGTGACCAGGGAGACTGATGCTCCGGGACATATCAGGTACACAGCATGGTTTCTTATAGCTGCTGTACTTGAATTGTGTGGGTGTGAGGACTTGTGAGCACCTAAAATCCTGTACTGTAGTATTCCAAGAATCCTGGTAGGTCACTGTCACTGCCCAGAAAACAAAGTGTTAAGTTAAAAAAGTATGTTGTTAAGGTCAATGTCCAAATCCCTCTTGAACAGTGACAGACTTGAGGTAGTGACCATCTCCCTCAGATGCCTGTTCCAGTCTTTCATCCTCTCAGTAAAGGAA
TGCTCCCTAATGTCTAGTCTGAATCTCCCCTGGCACAGCTTTGAGCCATTGCCATATGTTCTGTCACTGAATACCAGGGAGAAGATATCAGTGCCTCTCTCTCCACATGCCCTCCTCTGGAAGCTGTGGACAGCAAGGTTGCTCCTCAGCTTCATTTTCTGCAAACTAGACAAGCCCAAAGTCCTTAGCTGCCCCTCACAGGTCATTCCTTCCAGCCCTCTCACCAGCTTTGTTGCCCTTATCTGGACACATTCAAGGACCTTCACATCCTTTTTAAATTATGGTGCCCAGAAGTGCACACAGTGCTCCAGGTGAGGCTGCACCAATGCTGAATACAGTGGGATAATCACCTTCTTGAGGAGCTGGTGGTGCTGCGTTTGATGTACCCCAGCATGGGGTTTGCCCTGTTGGCTTCCAGGACACGCTGCTGACTCTTGCTGTGCCTGCTGCCAGCCAGCACCCCCAGATCCCTTTCTGCAGAGAGGCTCTCCAGCCACT\n>XR_008192058.1 PREDICTED: Gossypium raimondii uncharacterized LOC128035582 (LOC128035582), ncRNA \nTACATAATAGATATATATACAGTTTTTCCCTACCCTACCCGTCATCCTCTTTTCTCTTTATCCTCTCCCTCAATTTTCCTTCTTTTCCCTTCACCGTGTCTCCCATCTACCCTTTCTTCTTGCCACCCTATTGTTTAAGCTTTGATTTTTGTTTTTCCACCTACCTTGCTGATCGTTTTACCCTCCTTAATTAGCCTTATTTGCTACCCTAAGTCACCTTAAAGCCGCCCCTATCAGTCTCTTTTATTGCTCAATTGTCGCCCCTCTCCATTGTTGAAGTAGTGCCACTCTAAGAATTCATCTTTATGGCTGACAAAGATTCCCTCTTGTCTCGCCCTGTTCTGCATTTTTCTGTCGCCGTTTGTGGTGTTGCCGCCCTTTAAGACACCACCAGTTTGGACAGTCGTTCCCTTTTCAGTTACCACCCTTATATCAGTGTGCTTTTCGAGTTATTCTTTATTTATATCTGGTCTAAACGTTCTAAGTTGGCAAAGTAACCTAGGTGATCAATGGCTAACTCAGATCTCGGTAACGAGTAGTGCAAAATGTAGATTTGTGTGAGATCTCGCACTGTTTCGTTTTGTTGTTAAGTGATGCTATGGTCGAATACCCTAAGGCTTGGATATGGAATTTCGTTGCGGATTTTTGGGTATTTAATGTGATTTAGGTGCTGATTTGAACATCCCGGATCAACAATAAAACCAGATTTCATCCATGCCCTCGTTTCGTAGCAAATCAGTGCAAGTTGTTCAATCGAATTGAACCTAAAATTTTTGGCATGTAGCACTGATTTGGCCGATCCATTAAAGGGTGTTTCAAGGCTGGTTTTAATGGTAGTTAATGTGGTAGTTATTGTTATTTGGTGTTAGGTTCGATTAAGGAGTTAAATTTGGAACACAAACTTTTTCAGCTTAGTGCTGCGGATTTTTGATAATAAGGTGGGTTCTAACTTGTTAAAAAGTGCTAAAATTATGCTTTTAATGATTAAA\n>XR_004466254.1 PREDICTED: Bombus vancouverensis nearcticus uncharacterized LOC117166512 (LOC117166512), ncRNA 
\nCCGTTTTTCATTATAATTACGATTATAATATATTCGTTTTAATTATAATTATGCTGTATTGTTGCGATATCAACGTACTACGTTGCGCTTTAAATTAAAACTTCTTTCTGTTAAAAAAAAGCATCGTTCCAAGTCGACTTCTTTTGTTCTTTCGCGGGATTCTTAGGCAAGCCGTCGCAGCCACGCTGCAGTTTACTAACCGAGCGTATATGCATGGATTTACCGACATAATCCAATAATATCGTAGGTTGCAGACACAAGATCGCGCTGCGTAATAAGTCTGGAAATTCTCATGGTACTCCGTATGAAAGCCCAGCGACTGTGGCCGTAATCTGCAACATTGCAGAATGCACAACTGCAGTGGAATAGCCTACAATTATAGAAAATCAAGCCGTAGGATTTATCAACACAGCCTTCACCAAATTATATCTGATTTATGCAGATTCGCAGAACATTTTACAGAGTCTAAAAATCTACTCCCTTAAAGCCGCGATAAATCAACACAATTTAAACAT\n>XM_049312721.1 Wardomyces moseri uncharacterized protein (JN550_001527), partial mRNA \nATGTCTAAAAATGGAGACATCAGAGGGTTCTTCGCCAAGGGAGCGCCGTCCAGGGCTCCTCCCCCGAAGGCATCGTCTGCTAGCAGCGTATTGCCTGCCTCCCCGCCGGCGGCCGAGCGGGCCCATCAGCCAACACCTACACCTTCGTCACAGCTGTCGATAGATCTCCCGTCGTCGCCTTTCACACCACAGAAGCAGCCCGTCAAGACACCTCTGACAAGGGATGACGAGATCAGGGGCTCAGACGACGAAGACGATGACTCGGATAGTTCTCTCGAGTCGCTCGGGGAGCTCCTGGGACGTAGATCTGGCCCGGCCACATACCAGAGGCCTACGGCGTTGACGACTACTCCCAAGGCCAAGAGGATTGCACCCAACAGCTTTCACCGGTCTCCTCTGACGCTGCAGCAGCAGCCTACTCACAAGTTCGACCTCAAGTCTCTCATCAAGCATGCGAGACAGGACGATGCTACCGAGCAGAGTGCTCGACGAGCTGACGAGCTCAGGGTGAAGGCGGACCAAGAGGAGCTCGAAGCTGGGCGTGATATGGCCGACAAAGCCAGGGACGTTTTTGGCGGCGAGGATGGGGAGAAGGGCGACAAGCTGGCCAGGGCTATTGACCGCACAGTAGGCGACGAGTCTAGACCGCGCTGCTATTTCTTCGCTCTGGAGGATGAAGCAGCCGCCGCAGGCGCTGGTCCCAGGCGGCCGTTCCCCAAAAAGGCAGCCAAGGTCAAACCGTGGACCTTGTTGCAGGATAGCAAGACCCGAGACCAGATGTTCATACGCGGGATGGTCAGCGCTGTGGCTGCAAAAGGGAAGGAGCTGCCAGACGAAATCTACCGGTGGATCCTCGACGAGATATGTATCGAGGAGAACCTTCAGCTGCGGAACCAGTATATCAGGTCGGCCGCGCTGTGTTGTGATGACACACGGCGTCTGGTTGACGAGAGGCAGCTCTATAAGATGCTGGAGAAGATAGGGGGCCAGAAGCATGAAACCTCGAAGCAGAAGTTCGAGCTATCGCCTGGGCTGCAGGACCCCTATTCGAGGAGAGACTGGTCTCCTCTTCGTCATTTCTTGCAACTACTGGCGGAGATGGCGCCCAATCTGACATCAAAAAATGCAACGAGCGCAGTGCAACTGCTTTTACGCTTAAGCCTCGACCCTGTGGTCGACAGGGCGCCGGGCGTTCGTGCCGAATACGCCAAAGCCATGGTCGCTCTAGAGTCGGCTCTACCTGCTCCAGAGGACCAGTGGGATACATGTTGCAAGAAGATATGCAATTATCTCCATCAAGGTGTAGACCAAGTGACGCAACGCCACATTGCCACCGTGATGCTGCCGACCTCTACGCCTCGACTGGCTGACTTGCAGCGTAGGCTGGCGACA
GTAGCCCTCTTCGACGACCCGGGCCTGGGCGCCATACATCCCGACGAGTCCGTCACCATGCAGGACCTCTTCGCCCGCCTCGGGGCCAAGAATTTCCGCGTAAGACACTCGACCGACTTTGACGAGCTCAACGCGCTCCTCTCGCTGTTCGACATGGTGCTGGACCGCGGCTCGCAGTTCGGCCGGGCCTACCTGTCGACGACGCCTCTGCCGGCCCCCACGCCTCAGCCCAGGCTCGCACCGGCGCTGCCAACCCCGGCCTCGTCCACGTCAACCACGACGGCGGCGAGCACGGCCACGACGCCGTCGCCGCGGTCGGAGGCCGAGGCGGCGGCCCTGTTCGACGCCGACGTCGACCGGCTGCGCGCCCACCTCAAGGCGCTGCACGACAAGATCGCCGACAACAGCCTCGTGTCCAGCAAGGTGGCCAAGGCGTCGCTCGACGGCATGATGAAGCGGCTGGCGTTCACGGTGCGCAGCCGGCCGCCGCCCAAGAGCAGCATCTTCGACGAGGCCATCTACGGGAGGGAGAAGGAGGACGCGCATCTGCCGCGGCAGCGGGATTTCATGAAGAAGTGGAGCGCGGCGTCGAAGGGTGGCGGCGTAAAGAAGGATGAAGCTGACGATAACGAGGGCGCCGCCTGA\n>KY685464.1 Uncultured Glomus clone M01338:4:000000000-A3V74:1:1101:10809:13957 18S ribosomal RNA gene, partial sequence \nCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAATTTCGGGATCAATACGTCGGTCGTGCTTCGGTACGTACTGGCGTCATTGATTTCTCCCTTCTGACGAACCATGATGTCATTAACTTGGTGTCATGGGAAATCAGGACTGTTACTTTGAAAAAATTAGAGTGTTTAAAGCAGGCTCGCGCTTGAATACATTAGCATGGAATAATGAAATAGGACGTTCGATCCTATTTTGTTGGTTTCTAGGATTGACGTAATGATTAATAGGGATAGTTGGGGGCATTAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCGTAGTCTTAACC\n>XM_032084393.1 Aspergillus pseudonomiae uncharacterized protein (BDV37DRAFT_269601), partial mRNA 
\nATGTCAAGCCTTGTCATCGGGACTGCGCCGGAGGGTCTGGACTTGTCCGAGGATAGAATCGCTCAGAATGACGCCACTGTTGGTGTTGTCATGGGAATTGCCACAATTTTTGTGGGTTTGCGATTCTGGGCGCGAACGACTAATAAGAGTGCCAATTTAGCATATGATGACTGGTTTGTCTTGGTAGCATTGATCATCTTCGCTTATGTTATTCTGTATGCCACGACAGTGCCTATGGTCAAATTGTCCGTGCTTCTTCTCTATCGCCGGATTTTCCGCCTCACCTGGACGTTGTATTTCTGTGCATTTCTCTCCATCGGATATACTATCTCAGTTGTTACTACCATCTCGCTGGCTTGCGTCCCCTCATCTTTCTTCTGGACTCAATGGGTATATCCTTTGAGTGGAGGCCACTGTCGGATCAACCTCTATCAATTCTATTTGTGGAACGGTGTGGCCAACTTGTTCACCGATGTCATCATTTTATGCCTGCCCATGCCGATCGTCTGGGGCCTGCAGATGCCCAAGGCGCAGAAATGGGCCATTAGCGGTATCTTCCTGCTCGGTGGATTTGTCTGCGTGGCCACGATTGTCCGCATCTCCGCCATCACGAAAATGAAAGATTCCGTCGACATCACCTGGGTAATCGGCGACGCCATGATCTGGTCCAACGTCGAGCCCTGCATCGGTATTGTCAGCGCGTGCCTACCGACTCTGCGGCCCCTCCTGCGCCAAATTCCCCAGCTAAGAGTCTGGGGGCTTTTCGGCAGCAGTGGACTCTCGGGCAATTACAAGATGACCGGCGACGGCACTTCCGGCACGGGACAGCAGGATACCGGCAACCGATCGGCATATCGGTCCTCGACTGGTAAGAAGCAGCGATTCTGGCCAGAAGATGACGAAATCTACCTGACTACCGACGTAGGACGTGCTGCCAGAGAGGAAGGCGTCATCCCGTCCAACGGCTCCGCTGCCTCCAGCCAGGAACCCATCGCTATGCAGATCAGGGTGAAGCAGAACTTCGATTGGAGGGAGGACCACCCATGA\n>XM_048215029.1 PREDICTED: Ursus arctos zinc finger and BTB domain containing 20 (ZBTB20), transcript variant X11, mRNA 
\nGCACCCAATGTGGGCCTTCTGCCGAAGAAGTAGGGGCGGGGGGAAGTTTAGGAGTTGAGGAAAGAAGATTAAAGAGCGCGAGGAGGAATCTTTTGGAGGATGTGCTACATCCAAATGAGGAGAAACTGAGAAGGAAAGAGGAAGACAGAGGATTCAGGAAATAGATGATGATAATGAGTCACACAAAAAGAAGTATTAAGGATTGCCTTTTAAGACTCTGAAGACTGAAGAGTGCCTGATAAATTGCACGTCTGTCTGTGCCCCCTAGCTGCACAGACTGCCTGAAGTTACATTTAGAGACTGAAATCACTGCACCTTAAAAACAAAAGATTGAGCTGCACTGCATTCCTAATGTATCGCCATCACTAACTGGATATTCCTCACAACTTTGCTGTCCGAGGTAAGGAAAAAGAGTCCAGAGAGCCCATGCCCCCTGGGTCTCATCCTGTGAGGCACTGTCGAAACCAGAGTAGAACTCAGGCCTCAGCTGCCGTTCCAGAGCTCTTTCTATAAGTTCCGTGACCATCAGTCTGTGGCCTGACCCTTCTCTTTATATGCAGCCGCTCTCTGTCCCCTGCCCCAATGAACATCTGCACTGCGCCCAAGCCTTGGAGTGATTTACCTGAAGAGTGACACCATTTCTTTGGAAACTACTATGAGGAAACTGAAGCCCAGAGAGGTGAAGTGAGGTGCCCAAGGCCACACAGCAAGTTAGAGGCACAGCTAGTACCATAGCTCAAGTCTCCTGACTCCCAGTCCAGTGCTCCTCCCATTACTCCACGGGTCCTGTGTCTAAGCTTCCTGACAAATGCTAGAACGGAAGAAACCCAAGACAGCTGAAAACCAGAAGGCATCTGAGGAGAATGAGATTACTCAGCCGGGTGGATCCAGCGCCAAGCCGGGCCTTCCCTGCCTGAACTTTGAAGCTGTTTTGTCTCCAGACCCAGCCCTCATCCACTCAACACATTCACTGACAAACTCTCACGCTCACACCGGGTCATCTGATTGTGACATCAGTTGCAAGGGGATGACCGAGCGCATTCACAGCATCAACCTTCACAACTTCAGCAATTCCGTGCTCGAGACCCTCAACGAGCAGCGCAACCGTGGCCACTTCTGTGACGTGACGGTGCGCATCCACGGGAGCATGCTGCGCGCACACCGCTGCGTGCTGGCGGCCGGCAGCCCCTTCTTCCAGGACAAGCTGCTGCTGGGCTACAGCGACATCGAGATCCCGTCCGTGGTGTCGGTGCAGTCGGTGCAAAAGCTCATTGACTTCATGTACAGCGGCGTGCTGCGCGTCTCGCAGTCGGAAGCCCTGCAGATCCTCACGGCCGCCAGCATCCTGCAGATCAAAACAGTCATCGATGAGTGCACGCGCATTGTGTCGCAGAACGTGGGCGATGTGTTCCCGGGGATCCAGGACTCGGGCCAGGACACGCCACGGGGCACTCCCGAGTCAGGCACATCGGGCCAGAGCAGCGACACCGAGTCGGGCTACCTGCAGAGCCACCCGCAGCACAGCGTGGACAGGATCTACTCGGCGCTCTACGCATGCTCCATGCAGAACGGCAGCGGGGAGCGCTCCTTCTACAGCGGTGCGGTGGTCAGCCACCACGAGACTGCACTCGGCCTGCCCCGTGACCACCACATGGAAGACCCCAGCTGGATCACGCGCATCCACGAGCGCTCGCAGCAGATGGAGCGCTACCTGTCCACCACCCCCGAGACCACGCACTGCCGCAAGCAGCCCCGGCCTGTGCGCATCCAGACCCTGGTGGGCAACATCCACATTAAGCAGGAGATGGAGGACGATTACGACTACTATGGGCAGCAAAGGGTGCAGATCCTGGAGCGCAACGAATCCGAGGAGTGCACGGAAGACACCGACCAGGCGGAGGGCACTGAGAGTGAGCCCAAGGGCGAAAGCTTCGACTCGGGCGTCAGTTCCTCCATAGGCACCGAGCCTGACTCGGTGGAGCAGCAGTTCGGGCCCGG
GGCGGCGCGGGATGGCCAGGCCGAACCTGCCCAAGCCGAGCAGACCGCAGAAGCGCCTGCCGAGGGCGGCCCACAGCCGCACCAGCTAGAGACAGGTGCCTCCTCCCCGGAAAGAAGCAACGAGGTGGAGATGGACAACACGGTCATCACTGTCAGCAACAGCTCCGACAAGAGCGTCCTGCAGCAGCCTTCGGTGAACACGTCCATCGGGCAGCCATTGCCAAGTACCCAGCTCTACTTACGCCAGACAGAAACCCTCACCAGCAACTTGAGGATGCCTCTGACCTTGACCAGCAACACACAGGTCATTGGCACAGCCGGCAACACCTACCTGCCGGCCCTCTTCACCACCCAGCCCGCGGGCAGTGGCCCCAAGCCTTTCCTCTTCAGCCTGCCACAGCCCCTGGCAGGCCAGCAGACCCAGTTTGTGACAGTGTCCCAGCCTGGCCTGTCAACCTTTACTGCACAGCTGCCAGCGCCACAGCCCCTGGCCCCATCCGCAGGCCACAGCACAGCCAGTGGGCAGGGCGAAAAAAAGCCTTACGAGTGCACTCTCTGCAACAAGACTTTCACCGCCAAACAGAACTACGTCAAGCACATGTTCGTACACACAGGTGAGAAGCCCCACCAATGCAGCATCTGTTGGCGCTCCTTCTCCTTGAAAGATTACCTTATCAAGCACATGGTGACGCACACGGGAGTGAGGGCGTACCAGTGCAGCATCTGCAACAAGCGCTTCACCCAGAAGAGCTCGCTCAACGTGCACATGCGCCTCCACCGCGGGGAGAAGTCCTACGAGTGCTACATCTGCAAAAAGAAGTTCTCCCACAAGACCCTCCTGGAGCGGCACGTGGCCCTGCACAGTGCCAGCAACGGGACCCCTCCCGCGGGTACACCCCCAGGTGCCCGCGCTGGCCCCCCAGGGGTGGTGGCCTGCACGGAGGGGACCACTTACGTCTGCTCCGTCTGTCCAGCAAAGTTTGACCAAATCGAGCAGTTCAACGACCACATGAGGATGCATGTGTCTGACGGATAAGTAGTACCTTTCTCTCTTTCTTATGAACAAAAACGACAGAAAAGAAACAAACAAACAAAAGCTATGGCACTAGAATTTAAGAAATGTTTTGGTTTCGTTTTTACTTTGTTTTTGTTTTTGTTTCGTTTCATTTTGTACTACATGAAGAACTGTTTTTGCCTGCTGGTACATTACATTTCCGGAGGCTCGGGTGAATGATAGTTTTCCCAGCCTCCCTCGGATGGTGGCCTTAAGGCCTGGTAGTGCTTCAAGAGGTCCACTGGTTGGATCTCTAGCTACTGGCCTCTAAATACAACCCTTCTTTACAAAAAACAAAAAACAAAAAAAAACAAAAAAAAAAATCTTAAAAAAAAGTAAAAAAAAAAATTTTTTTTTCACTTGTGAAGAGCACTACAAAAATATATAACAAAATCTAAAAGGCCTACTGTCTTTAAGTACACCGCTTGCAGTGTTTCAGTGGACATTTTCACAATTCTGGCCGCTTGGACTTCACAGTAACCAGTTAAAACTGTGGAATATCACTTCTGGTTGAAAACCCAGAGGAAAGGCCCTGCTGTTTTCCACCTACCACATTTTCTGATTTCATAAAAGGGCTGGGGGGGTTGGGAAGGGGCAGTGGGTCCGGTGGTGTGGGGAAGGCGAATGGCAGGCTTCTCCCCCAGATTTCTGCTCGCGTCCACACACCCTGGCCCACCTCCTCCGTGTCTCCCCCTTTCAGCAGAAGCCAGGAAGACTTGGACAAGCATCAAGCAACAGTGGCTATCGTATTTATTCAGTGTCTTCGCTGAGCCACAGCCTCAGCACAATCAAGAGGGACTTTCATGAAGGGCAGGAATGCAGATAAAACAAAGATATCAGAGGTTTGCACCTACGTTTCTAGGTACAAGAGAAGGATTATTTCCCACAATCTTTGCAAAAAACAAAAACAAAAAAAAAGTGTCAGGATATATTCTTGTGGAAGAGA
AAAAGAAAGAGAAATGGAGGGTGGGGGGTATAATAAAAAGTTCTTGAGGCTTTTTTAATTCAAAATTTTATAGAGGGGCAAAAGTGACGTTTACCAGATAGAATGCTGATTTTTTTAATATATTTACAACAGTATTTGTGTAAAAAAAAAACAAAAAAAAGTGAGATTGTTAAAAGTAATTTTCTTTCGTTTTGATTTTGCGTACACTGCCACCAATCCCTTCTCTTATTTTATTTCACACACATATATATATTTTTTGGTAAGTCAAGACTGTTAAGGTTAGCGATACTGCTTCCAGATAGAAAGAATAAAAGGCAATTAAAGTTATATTTGAAAGAGAGGAAGGATATTTTCTTCATATTTTTTTTATTTTTTCTTAATTTTTATTATTTTAAGTATTGCCTGGGTTGATGAGGGCCTCTGTGGCCAGCCCATCCCTGCTGTAATTTGAACTGCTGCTTTGTATTTTGATATGTAGTTCTTTGACTTTTAGCAAGCTTAAGTTGCTCCACTGACTTTTTTTTTTCTTCCAACTGATCCATCTAGAATTCTGTTCTTTTTCATGGGAGGACTTTATCTTTCAGAAACAGATTTCCTGCTTCTCTAAAAGTTCACTGAGGTCTTATGATTCTAGAATGTCTCTTGACTTGACTTCTTTTCTTGAATGAAACACTAGTAGTCTAGAGGTCGTGACAAATGGGTTTTCCTTCTGTGGTCAGCCAGGAGGAGGAGTTCATGCCTCCTCACCCTTCACAGCTGCAGAGAGCAGAAGCCTGGTACAGATCAGGATGCTTGATGCCAAAATTACTCTCCTCCTTTCAGATATCACCTTCTGACTATTTCCACCGTGGTTGAGAGGGCTAATGAGATGATCCTCCTTCAGAGGATGTAGTAACCCTTGCTTTTTGGAAAGATTTTAAGGAAATTAACAAAAATTTCTCAGATACCAACATCCATCATTCAAAAGGCCACCAGTTCATTGCATCATCCTGGATGCCACTCTCTCTTCCTAGTTGGGATTTCTCTCCTCGGTCCTGATCAAAGTATTGTAATAGGGATTTTTCCATTATAGACAGTGTCCTGAAGGGATTCCGACTCAATTATGAGAATTCTTACACTTAACAAAAACTCCAAAGGTGATTTTATTGCTGGGCATATTTTAACACTCTTAAAGGGGAAGAGTAAATCTTTAAACAAAGCAGAAACACCAAACTGTAATTTTAAAAAAGAAGCAAAGACAGAATTTTAGTTTCAAAATTACTTTGCATTTTAATTTTCCTGTCAGCAACTTATTTGCAAAAACTGTGCATCAAATGAGGAGACATCTTCCAAGGGAAGAAACTCTATAATGACTAAATTGGTTTTACTCATATATTTTAGATATTGGTTAACTTGGATCTTTTCCATACGTTCTTGGTGATGTTTAGTAGGGTTAGTGCAACTGGAGTACATGTGGGTTTTATTTGGTCCTCCGGTCCTCAATTCGGTAAATATTTTACTAGAAGTTTAATGTAGACTTGGATGGTTAACTGATTATTGGGTGTCACTCATCGTGATTTCTAAAAGGAGTCATATCAAGAACGGTGTGTCCAAAATTGACCTGTTTTAGAAGTTAGTGGGAAACAGCTTCAAAACTAAGAAAAAGTCCATTTTTCTCTTGCTGATTTTGCTTTTTAAAATAGCAGTGTGGAAGACTTTAATATTTCCACTTACTACCAACAGAGGGAGCGTTACTTAATTAACCACGTCCTGGGATTGTTTTGATATCTTGAAAAACAAGTCATTCAACCCAATATATAAAAAAGAAAAAATTAACATTAAGGAAAAAAGTTGTTCAATCTAGAGGGATAAATGACATAAACTCTCTCAGCATACTATACAAATGAGCTAAAAGACACTTAAAAATATTTTCAATTATTTGACAGTAGCTGATTTAAGATAGTGTCCTTATTCCAACCTTCGCAAAGTAAGCAGAATTTATAGTACCTCTAAAAAAATTG
ATCTTGGGTGCCATTTTGGGCCCCATTTAGCTATCTGCTTCTCAAATCAGAGGGAAACCCGTTTGCCTTAATGTTGATTTGCCATGTGAAAAGTGAAGCAGTTGGGTTAAAACGAAATCCATATTTTGTTATAGAACATACAGAGGGAAAAAATTCCAGTTGGGTTTGAAGCACTAATATTCATCCTTTCCCTTCAAATGAAGTATCTCTTTTTAAAAAATGTTGGAGAACTCCCAGAGAATTCGTGGTGAGGTGATGCAGTCATTATAACCACATGGACTCTCCAGGTTTGCATAGCAGTAGACTTTTTCCTACCGTATGTCTATTCCTCTCAAACACTCATAGTCTAAAATAGTTGACAGACTTGTACTCTGGAGAGAGGGAGAAGCTAGACTGCAGTGGAAGGTCTAATCTGGGGAGCAGTGAACTTGCTGTGGGGTTATTACAATATGTTCTGACCTCCTTAAAGGGCAACTTTCCCCACGGATCTAAACCAGACTGGACCGATTTCTAAAGGATAGAGATGCTTTTAGATTGCCAATCCTTACTTTTAAATTAAATAATTACCAACATCTTAGGAAATGGGGAAACATATTTTGCTTCAGGAATAGAGGATGAACATGAATCCTTTTATTTTTTAGTTTCAAATCCAACAATCTTCTTACATTTAGAACTTCATGCTAGGATGCTATGAGTGCTAAAAAAAATTTTTTTTTCAGTAGTCAGAGGAAAAAATAGATAAAATGGAAGCAAATGTTCCAGATTTAAGACCTCTTAGGATGAATACAGGGAACAAGAACTAGTTTGGAAAAGAACTTTTTTTTAGTAATTTATGATTTAAAAGTGGATTAGCTGAACAAGGGAAAGGAAAAAAGTCAAAGGGGAATATTTATGTCCAGACATTTAGATACAGTGTAAGAAAAATGAAATTTCCCAGCTCTGAAAACATTGGTAGCATCTCAGCATGGAAGGTAACTTTCCCCCTATTACTATAATAAATGCAAATATTTATACTAAAAAAACAAAAAAACAGAACCCAAGTGGTAAAATATGGCCCTCAAAAAGAAAGGAATTGGAACAGATGGATCTGATACAAATCTACACATGGGAAAAGATTAAGAAACAAGCCAGGCAAAGATAATTTGAAATGAAAGTCTTGATAGCAAAACGGTTTTTACTATATATTTTAATTGAGTTGTAAACTTCAGCTCCTGACAATAGTTTATAGACTTTTTCCTGCCCAAACTCCTAACTCTCTGAAACTGTTTGTGCCATGAGTAAGTGTGGTGGATAACTTCCTTCTCGTGTTCCAGCTTTAGTCCGTTCCTTCTTCATAGGCATTTTGGAGGTCACGGTAGCTCCCAGCCTTAGAAGAAAAGACTTGGATTTGCTTTGTTGAAAAGTCATGGGTTTTATTTTGTATCATCCCAATATTCTTTAAGGACCAAGAAAACCCTTTAACCCATGAATAGTTAGAATTTGTGCATTCTGATAGGAGAAGAACAAGATTTCCTCTGGGCGTGTGTGTTGCAAGTAAGTCCTAATGCCTTGACCTACGTGTACCTCCATCATATAAGCACGCCAACAGTGTGTGGCCAGCCCATACGTACCCCAAATCTGTTTTCCCTCAGCAGTTCCATCAAATGAATCGTGCCCCTTATAAAATCCCTCAGGTCCCTGACAGAACATAATAAAGGTTCATGTCGCTTCCTCCATGTGCTTCCTCCATAATGCTCCCAACACCTGTTGCCCCTAGGAAAGGGGGCAGTGAGCTAGATCTGGCTGGGATTCACACCCAACATGCCCATTCAGGAGCCCTCCTCTGCTGTTATGGAAGATGTTATTTAATTAGCTGAGGCTGGGAGCAGAGGGTACGTGATTCTGCAGCAAAGTTATCAGATAACCAAATCAGATCTGCCTCTGCTATGCAGAAAGAAACAAAATGAAGGTACAATGTAAGAGCAGACACAACCTGAGATGCCCTTGGGATTTGGGAGAAG
GGAGGGTGCCCTTTCTGTTGTGACCTGACTCTTAAAAGAAATCTCCTGAAAGAATTCTTTAATTTAGTAATGAGTTGAAGTCCAGGGTAATGGAAGCCCTGGGGAAGAGAACAAAAGGACTGCAAAGTGTATTCAGCACCCAATAATGCGAAACCAAAAAACATCCAATCACAACACTAGGAAGTTTGGCAAAAAGTATTTAGAGAAATCTCTGGGCTTTCCATGGGTAGTAGGGTCGACAGACTTTCTTTTGAGTGATTTCTGGCTCTGAGAAACCTCTTTACTCACTAGAAAAGAACTTTCTTTAAATGGCCAATTTTATCCCCCAGAAAAAGAAATTTAAAAAAAATAAAATAAAAATAGGACACTAAAGACAGAACCATGTGACCCGGTAACAAACAAAAGGAAGGGTGCACTAGAATTTCAATAGAGTCCCTAATTCCATAGAAAAAGCAAGGCAACCCAACGCCTCTCCATCTGCAGTGCTTGAAGAGAGTGCTTGCGCCGACCCCGCCCCCCGGGGCTTTCTGGGGCTCCACATAACTTCCCCATTGGGTTGGCGGCAGCCCCTTTCTCTTCTTGTTGACATGAAGGAAAGGACTGTTCTCTTAGGTGCCCAGGAAATAGATTGCATGGGGCAAACTTTCAAAAGCTATCTCTACCCTGGTGCTCCGGCAGCATATGGTGAGAAGAAAAGGGACACAGAAGAGCCCTTGCTCTTGAGTGAGAATATTCTCGTATCCCCAAGGGCTCTCCGTGTGGAGTTGCCATTTCTAAGACCGTTTAAACCTCCACAAGAGGAAAAGTTGTGGTGACTCAGTGTTCATATAAACACAAAACGTGGAAATTGCTAACCCAAAGCATCGTTTCTAGCGCTAGGGATTAAGCTGATTAACCTAACCAAAATTCCCCCAAAGATTTGTCTAAGTCTCCGAATACATTTTTTCCCCTTGAACCCCGAATCCACAGTGGTCAGCGGTGTACATTGACAGATCCCAGACAATGGTTTGGAACACCAGGGTTTATTTCCAGTTCTTTTCAGGATGAAGACGTAGAGGATGAGGGTTGTACCACACGGGTTCTTTTTCAGAACTGTGTATTTCACTGAAAAAGCGGTACAAATGCCCCGGGTTGAAGCAAGTGACTGCAACCCCTGGATTCTGGTGGTTCCTCAGGCCCAGCCTAGTGCTCCATAAACTGAAACCCTTCGGACTAAAATCTGATCTGAAGTGACCTCAGTTGAGGGATTTTCACCAGACACCACTTACAGTGTAGAATTATTGCCTTAAATCAGAAAGCCCAGGGAAGAGAACAGAGGACAGAGGGGTCGGAAGGGTGTGAAGACATAGACATTTCTTGTTTTTAATGGTTGCATCGTCATCAGAATGAGCGCTCTTCATGATTGAAGATGATGGAAACAGTGGCTTTGCAGGGACGCATCACACTTGTCCGGAACTGATGGTTCTTGGGAAGTGGTTGCTCTTTTTTCATATCCTATTTCAGTGACAGAGGTCTGGGCTGGGTGTAAAATAGGCATCATCTTAGTCAAAGAGCAAATCCCATAAGACATGGTCACAGGTGCCTGGGATGTCAGTTTTCTTCATTTCCTTCATAGGGAGAACAGTCTCTACAAAAGCTTTCTTTCTCTGTACGGTATATATTTCTAAACTCGGTTTTCCTCACTTTTCATAAGCATCTGCTTTATCTGGTGGTTCTTTGTTTAAGTGCAAACTCACGACTTTCAAATCTTCAAGGAAGGAGCATAATCTGCAGATCATAGAGGAAATCTAGCCACGTTTGCAGGAGTCCTGGCTTTTGAGATACTTAATTAGGGTAGAAAAAGTTGCTACTAGCCCTCTTTCAAATTCAGGGCTTTCCTTGGTTCAGATGCCTCCATGAGATTCTGATACACCTAGAATAGAAAAAAAAAAAAAATTAACCCCATCAGAGACATCTGTTTCTACTCCTGTTACAACAGAAGTTTGTTATTGCCCAGCAAA
ATCATTGTAATTTATATGTAGATTCCAGCAATGAAAAGGACCTAACCCAGCTACTATGTCACAGCTGCTGTGCAGAATGTCCGTAAATGAGCACACGTTCTGCACGTACACACGCAGGGTGAGGTGCTCTCAGTACAGAGCTGTTCCACGCTCGTATTGCCCAGGGACAAGATAGATTCTGGAACTTGAAATAGTCCGGGCTCTCACAGATCTCCTCTCTGCTTCTGCTCTGCCTTCTTTGGGTGCACCGGTGCCGTCCGTTCTCTGTGATGAGGTTCTGGGGCATTCTGAAGGAGCTCAACCAGCAGTAATTTCTATGTACCTGTTTCATGAGAAACTTGACTATGCCATGTGGAGGAGGGCGCTCTTAATGAACTCCGCACTTGCACTGGATTGACTGGCGTGCGTGGACGTGTGGTTTGCGTGTGTACGTGTAGTCTGGGAGTGTGTGTGCCTGTCAGAGGAAGCACACACAGGCCCAGGTCCTGGTGCGTAGATGCAGTTGCCTCTGCCTACCGTTGTGCTCCAGACTTGTGGCTCCCTTCCCGGGAAGCAGTCACCTGCCCACTCTGTTGCTTTTCAGAGTGTTTCAGAGTTGGGAGAAACAAAGGCAGCTTGTTGGATCCACAGCAATCCTACGGTGACAGGCTGTTTTCCTCCAGAAGAAGGTAGAACAGAAGTACTCAAGTGGCGAGCAGACACAGAGAGCAGCAGTCTGGGGCACCTCTCCGGGTCTTCTGGGAGGGAGGAACACCGAGGCCAGGGAGGCAAGACCCGCACAAACTGTGATCTGAGCCGTCCATGGCTGAAAGGCCTCCATTGCTCTCCTCTGTGCAGCCCAGCGTGTGCCCACAAACACTGCTCGGCTGTTAAGTCTCACTCCCAAACGGAAGCTTCCTGACCCTGCCTGTATCTGCAGGACGTCATCCTAATTCCAAACTGTGTCTCCGGAAACCAACGTGGCCTTTGCCCAAGTCTTTCCAGGAGTGGGTTGTTTACCATGTCTAGCAAACCAGTAGACTCTCGGGGGAATCATTTTTGGTAATCTCTAAGAGTTGATGGCTCTGGCCCATCTCACACATTAAAGTAGAACGCCATTCTTGCACACTATTCTGAACAAATGGACCTGGCTCTCGTAGCTGACCTTAGAGAACGGCCTGGAAACAGTCGGATTCAGTTTGCTCCCTCCCATGCCCTTCTTTTAGTAGGTGGCTTATTATTTTTTTTGTGACATGTAGATGATTTCTGCTAATTTACAGAATTCAGAGGACGTTTTCTTTCCTCTTCTACTTTGGTGACTTTTCCCCTACCCCATTAAGTAAGGCTACTTACAGTTAGAATCTTTTCATTGTTATTATTTTTTAAAATGTATATTGTCTTTCTATATCCAAAAGAAGTCTGTGACTGTAACCATAGGTATTTCTTTTTACTGGAAAAAAAAAATGAGGTTTTTTTTGTTGTTTTTAATTCACAGTACTAGTGACTCTGTGAAAGAACGTGAGTTACATTTAGGTATGCTTACTTAAGTACAGTACACTACGTTGCAGTATTTCTGAAAGCTAGAACATACACATTATATATAACAACTCTATATTGAAATATATATTACATTATATTCATTTTAACTTTTGAATCCGCCTATGATCATGAGTTGATTGACATATTATTTCTTCGCATTTATCACCCATCACCAACCTGCTGCAGTTAATCTGGTGCATTTAATAATAATCACGACTGCTCTAGTTTGCTTTTTATATTATCAGCTTCAGTATTGTCTTTACAGGATTTTAGAATTTTTTTAAGCTCAGACTTAGCAAATGTAGGAAAGTGAAAACATTTTTTTAAGAAAACTTTGTTTTTTTCAGTGTGGCCGATACAAAGAGGTTCATATTCGAAGTGGTCTTGTTTAGCTGACCCTCTCAATATCTGAAGAACAAAAGAAGTGCATATGAATGTATCTGTGATTTTCCCTTTGAGGACTGTCACTGTCTATATTTGCT
TTAGAAAATATGACCAAGGGGCTGCTTAACCTCCGTATGATCTGACCAACAGTTACAGGCTGCCGTTCAAAGGGCTGCTCATAAGGGAATGAAATGCCTAGCGTCCCAACTGGATTTCCAAACCTTGATTTCCATACTGCTTCTTTACGGACTACTGTTTGTTTTCAGTGTGCTTTACGATTATTTTACCTAGTCTTCAATGCTCCCCTGGAGGCAGCTTGACAATATAACATTCATTTTCCTAGGAGATTTTCTTTCTTAAATAAAACCAGAATTTGAGGAACGTTTTCATGACAGAGGCCGATAGAAATAGAACCGAGAAATAGCTCATTTTTTAGCCCACAGAATCCATAAAATGGTGGCTCTTGGGTGTCTGGCCCTCCGTATCGCCATTCGTCTGTGAAAGTGGGGATTTGGTGCCTTTCTTCTCCAGCCAGGTCATCATGGAAACTTCAGGAATGAGGCATCCTGTCTTCCTAGCAAGAAATATTTTCTAAGTAGTATTTTCAGATAAAGAGCTTCTTCGGCTTCTCTTAGCTACTCAACCCAGTGCCTGGAAAACTCCACTGTTGGGTAAACTTTACATCCATCCTGGAGACCTAGAGCCGGATTCATTCTCTCAGTTCTCCATTCAGGACAAAATGACAGCAGTTTTTGATACTCAGTATGAAAGCCCTTCCCATACTGGACCAATAGTAAAGCCTCTCAGTATGACTATAACACCAATTCCTTCCTTTCGTCTCTCCTAATAGATTTTTATTTCCAAATCCCATCCCATTCTGCTGTGCTCCCCCAACCGCAGCCCTGAAACAAGTCTTTCCCAACCTCCCCTTATTCAAGCTCCCAGCAGTGCCCCCCACTTGTGAAGCCTGGCAGACCTACTTCAGCCTACTTCAAAAGGGCAACATTGAGTCTAGTAGCAAAATTATGAATCTGTTTCTCCATGGTTTTCAACTAAATATATTTCTACAGGACGGACATAATTGTGATTTGGGAGTCAGTGAGGCTGCTCCTTTTCCGGTGATCACATAATACCCAAACTGTATCAGTTTCATTATTTTCCTCTTTCCTTTTCCTAACCACGTTCTTTTATTTCTTGTTTCTCTTTAGGACTACTTTAAATTACCTTTTCTTCTCCTCATCACCTGAGGAACTCGAGTAATTATGACCCCTGAGTGCTCATTTCCCTCCTTTCCCCCCACCCCCTTCCCGAATGTCCTTCTCTAAGTTTTATGCAGTTAAAGAGCATTGACAGGAGTCAGCTCATCAACTTGAGACTCGTAGGCAGAGTGAAGAAGAAGAATGTCTTCACTGTACCTTCAAATTTTAGAAGTTATCAATATTCTTTTGAGAGTGGGAGGACCTGAGTCACAGTTTTAAATGTCAGCTGTACTAGTGAGGTCATTAATTCCTTTCACCTTCACATTTGGCCAAAGGTAAAGAAAAAAAATATACTTTCTGGGTTTTTTTTCTTTAAATATCACAGCGTTCAAATTTCTGATATGAGTAGACCATTTCTGAGAGGAAAAAAAAATCATCAATGTTGGCTGTTTCAAGTCCTGCTAATATTTAGCCAGATGACATATTTACCCCATACTAGATTTACAGAAATCTGAAGAAAGAGGTAACATTGTAAGATAATTTTGATAACTGCTCAAGCCTTAGTAAACTCTTTCAAAACAAGTAAAGCCACTTCCACTGAAGTAGGAGGAAACAATTAGGAAGAATTTTTTCATTTGTTATCTTTTTGAAAAACAAATAATTGTTGATTGATTTGGAACTTCAAGCAGTAATTTACTGAGGGATGAAAAGATCCGTAAAGTGTCTAAAGTGTCTATTTTACAAACAGTTTTTTTTAGATATATATATATATATATATATACATATATATATGTATATATATATATATATCTGACTGGATACTTGAAGGGCCATGTAATGTACTCCCCAGTACCTAAACACTCAGCATATAATTTAGTCATCATGCTAGATCTCCTTTC
AGTGAGTCATAATTGTCTGGTTGGCAAAATGTTGCCCAAAAGACTGATACTGTTCTGGATCTGTCCGTTACAGAATGTTCATAATGTAATACCCGCTTTCCTCACTTCCAGTCCATGACTCTTGCCATGCTCCTACAGTGCCTCTTGGCTCTCAGGAAGACAAATTCTGCGGCATTTAGAGTACTACCTGGTTCTGAGTGCACAGACATGCGCTGTTTTATTTCTTGCTTTACCCACTGACAAACAGAATCAACATGTAGTATCAGAAATGTATTCCTAACGTGACGAGAGGCTTGACCCATCTCTCCTGCCTTAATTAAACCAATTTATAACATCAACTCACACCACAGAAAGCAATGAAATAAAGAGAGAGTTCAGAACCTTCCTGAGTTACACATCTAGTAGGACCCCAGCGTTTCTTCAAGCCAGTATTTATGTTGCCTACGGTGGCGATCTTCACTTGGCACGTTTTCCCCGTCAATCCCATCTTCCTCTCCTCCTTTGTCCGTTCTCCCTCTATCTCTTCTGTAGAAGGACTCTTCATCTAAAGTACTCTTCTCCCCAGGCTTTGGCTTCTGAAACAGTAGAAGACTCTCTTTTAAATCCTAATGACTAATGTTTAAGGTGTAATGTGGCGTAGGAGAGGATTCAGTTCTGCCACGTCCCGTTTGGTCCAGTTAATCGCAAGGATTTCTCCAGGATGCCTCTTTGACATTGTTCCTTCTGGTTCCCCGAGAAGAGCTCTAACCCTGAGACCAGGATTTCTCCCCACAACCTCTGCATTAGTCTAGGTTAATGTGCAAATCCTGCTAGCATTCTAGAGACTCCAGGATGTGACTCTCTTATTGCTTAGGAGCCCCCTGCTTTTCGAAACTGACATCTGTCAGGAGCAGCAAGAGCCCTACCAGTCACTAATGCAGCAACACGATGGTCAGAAACATTATAGTACATAATAGGGAGGATAGGAAGAGATTTCATTCTTCTTTTCCCCCATAAAAAACTTGCTTCCCCGCCCCACCACCACCATGCATTTCAGAAAGCCTGCATCTCATTTTACAGATATGTAGTTTTAGGATTCGCAAATATAGCTTAGGAAATGTTCTGAGATTGAAGCTGGTAGCGAACCAGTTTATTTTCTGCACTGGACTTTAGGACAAGTGTGCACAGATACAATTCCTTCAAAGAAAGTGAAACTGATATAGTAAAGCAAAGGGATAATACTTTGACACATTAAAACAGTTGTTTGCTCTCTGTAAACCTTGACTTAGGCATAATTATTATTTTTAGAAACCTGAAACTGGAGGAATGTGTATTTTAGTAAAGTTTGTTGTCAGTTTATTTGTTTCCCTTTATCTCTTTCTTCTCGAGATAGTGAAAGATTTTGATTCTTTAATTTGATACTGTCCCTGGCCATAGGTATCAGTCAAATAATGCCCACCCTTACCATACGCTTTTCCTTTTAGAATGAGAGCCTTCCTTCCTGCCATTAAAGAGTCTTTTCTCCTTGAAAACCTTATCTTCCTTTACAGTTAGCATGAGAGAGCTTTGAGGAGAGGGATTCTCTCTGCACTTTGAGGGTAGAATCGTTAAAATAAAAACTATTTCTTGAGATAAACCCCATTTACCCAAACTAACAGGTCTGAGGCCAAAGAATGGGAATTGATTGCAGATGAAGGTCTTGTATTTTACACTACAAATCTTTATTGCCTCCTCCAGTTTTTGGAGTAAGGCTGGGAATAACTGAATGAAAATCTGCTTTGGATGTTTCTTACTAATATCTAATGCAGAATACCCAGAAAAGACAAAGAAAGGGTGCTGCTTAAATGCACAATCAGTCCATAGATTTCTATAATTATTCAGATTTCTCTTCTACTCATTTCAAAAATATGTGTCCATGAGGTCTTCACTAGAGAAACATCCGCTTCTCCATTGTTCCTCATCTCCCCCACCTGGCACTGGAGGGGAGAGTCACAAGGGAGACCGGTGCCGCATCGCCAGCC
CTCCACCCATCTGTACCCCACCACCACCACAAGATAAGGAAAAACCAAATTAGAAACTTTTTTTGAAAAAAAAAAAAAGGGAAATTGTAGTGCTTCATTTGAAAGAATACTGTTTTTAACTCAATTTACAGATAGCCTGACAACCTTTTTATAACCTGTCTTTTGTGCTATAATTTGCATTTTTAGCTCAATCTTTAAAATAATTGCAATTTCAATTAAGTGAACAGAGGAAAAGCAAAGAGGGGAGACAGGGCAATGTGATGGGGCTAAATCTGATACAGTTCTGGATTCATAAGGCCAGTTCTCAGGGTTACCAGGGAAAGCTAACACCACTCACCCTTACCATTCTTGCCCATCCTTACTATTAGAGTCTTAAAAGTTGGTCAGAAAACCTCACTTCCTTATGATTGAAGACTTTTCTTATTACTGTCAAACCCACATTGAGAGAAATGGTACAAACCCCTGACGGCACCTCTGCCTGAGCTTCCTCCAGGGCGCGTGCGGAGAGATGCCGGGAACCGAAGTGTGGGCTCAAATTTGATACAAGACTCAGACATGGTCTCAAGTGCTTTGTGTATGTTCACTGCCAAGGGGTTCGTTGAAAAATAAGGCCAGTTTCTCTGCTCCTGCTGTCCTTGGGACAAACTTTGACTTGGAACCCTCTCTACAATAGATTCGTAGGAGAAAATTCTCAAAAGCATCGTCAGCAGTTCAGCTCCTTCCTTAATCCCATTGAGTTGAACCTCAGTTTTCCTGAGGAGCCCTACTGAGGTAGAAATCAAAGGTAACTTCCGTATATTGAATGAAAATTGGCTTTTTGCCCTATTTGTTGAAAGGATTGTGGTTTTCAGGAAAAATGAAAGCAGAATTTCTTAGTAATCCTCATCATGGCACACAAAGGCAAGAAGCTGATAGGCTAGAGAAAAACCTATGATGAACTTTTATGTTTTTAAGCAATCTGACTGTGCTGACCCCACTATGCCAAACGCCTTTGTTTCTACAATCTGTTCTCAACTATGGATTGATTCTCCTGAGACTTCCAGCACGCGTGTGTCGTTTGAGCAGACACACAGGTTTCCATTTGGAGAATGGAGACCCAGACAAGCCAAAAGCATCAACTCTCACGAGTATCAAATACAAATCATTTCTCCAGAATCACTCAGTTCTGCCGTATCCCAAACCAATTCCAGACTAATCTTAAGTGAGAAGTAAGCTCCATAAGATATCCTACTATGAATGTTTTTTCTTACAGAATAATACAAGAAGAGGTACAAAGCAGATTCTTAATTTGGGTGTAATTATAATTCACTTTTATATTTAATAGTTGTACTGTTTGTGTGAGTGTGTCGTTGAGCTATTAGTACCAATTTTCAATCTGTCATCCTGAGAGGGGCCTTGAGAATTTCTGCAATTTCTGCATATGTGTGTGTAGATCTGTATTTATGTGTTGTCAGAAAAACAAAATGAACGGGGGAAGAACGAGGGGAGGGAGAAGGTGGTCAATGTGAAGAAGGGACTGCTCCTAGTGTCCCTATTTCTGTTAGGTCAGGTGGCTGCTGCCAGAAGCCCTCCAGGAAGAGTTGATTGCACTATTCTAAAATAAGAGCCCAGCACTGTTAAATTTAGAACCATGTTTTGGGAAACAGGAAAGTTTTATCTTTTTCTGTACCCATTCTCTTTAGCATCAGAGCCGTTTGACATGATGAAAACCATTCAGTAAAAACCACTACTGACCTTTGCATTAAATAGCTGTTTTCCTCTTCTAAATACTAGCCCTGGTTTCAACTCATCTACTTCCCTTTATTTTCTGCCTATTGATTTTAACATTTTACAGAAGAATACAGAGGCGCATGCTAGTTGTTCCTCTCCTTTGAGCTGAAACAAACAGGGGCAACAAGAAATGACTCACTGAAGAGTGAGGTCAAGACTGAATTTCCCACTTGTGTGGCACTGGTAACCTTTAGCAAGAACTGTTTAGGGTTGACCTTGGGTCTATATTA
GGGCTTTTTTTGGGGGGGGGTTGTTTTGTTTTTTTGTTTTGGGTTTTGTTTTGGTTTTTTTTTTTTGCACTAAATATGACTGCACTGCATTGCACTACTGAAATGTATTTACTTGTGCTGGGAGAGAGTGTGTGAGGTATGGGGGAGAAAGAGGCAGTTATGAAACAGGAAGCATCACAAAAACGGAGAATTCTTTCCGCCGTGCTTGGTCTTAGCAGGGTTGGTGAGAATCTGTGGAATCTGCTAACTCTTGATCAGGCCCAGAAACTGCCATGCTGATAGGATCTGTTGTCTTATGGTCAAAAAGCTGGGCTGGTACAGTAAATTGGAGATGTTTAAGGAAAAGTTTGCCCAGTGTTGTCTCCAACTATGCTTCTGGTAAGAGTTGCAATGGGTGAGGGAGCCAGCCGAGGTGAGGTTGAAGCCTTCACCTTGGCCTCCACCACAAAACCCCTTGCTGACCCACATTCCAGTGTGGCAGAGGGCGGTGGCGTGTCCTGCTTTCAAAACAAAACAAAACAAAAAACAAAAAGACAGCCTTGTCTGTATTGGAGACATCCTTTCAGCCTGCGCATGCTTTTCTATCCCTGGGTGAGACCTAGATGAGCCTAACCAAAGAGGAAGGCCGTGCACGGGGTTAAATCCTTTAAGATGGCAGTAAGGGAACAGTGCAATAAACACTGAAAACCAGTGAGGTGAAGGGTTTATTTTGAAACAAGGTAGGCCAACTTTGAAACTGAAGGAAGGGTTGGAGAATTGATCAGAACCTACTTACTAGCTGCTCCATCGTAGACTATCCTTTATTAAGCAGAAGACCTTAACAGTGCCTAAAAGTTTAGTTTGGAAGTTGCTGAACTTTTTCAATTTTTTATTGGATTTCTTTTTATTGCCTTTTCAAACCTGAGAAGTAATTAGCGTGTGACAGCTCTTCAGTGACTATTAATAAAAGAATCTTGCACCACAGGAAAAACAATCAATTGTGTAGGGCACAATAACACCAGAGTGGAGATGCTGAAGAGCTCTCCCAGAATCCAAGGCGACAGCTTGGAAGATTCTGGTTCTGTGAGAAAGGGTCACAACACATATACATGGGTAATGTTGAATTTCTCTGAACACTATCACATGTGGGGACATCAATTTGGAAAACTGTCAGTTGAGGTCTCTTTCCTAAGATTACAATATTGATACTTCTCTCTCTCTCCTTCTCTCTCTCTCTCTCCTCCTTAGCATCCATCCAAGTCTACTATTACAAGGTAAAAAATTTGTAAGGGAACTGTCAGCCTTGTGAGTCAGAAAAAAACACCACTTAGGGCTTTCAGAACTAACGTAAGCAATCCCTTAAGCACTCAAAGCATTATCTCAGTTTTAAATAGGAAACTCTAAATTCAGAGCTATTAACAGGTACTTAGAGATGTGTATTGCGTAAGCACTAAGACGGTATTGACTGCACCAAACCAAAGGTATAGAAAGAAATAATTGACCTTTTAAGATACATTCACATTAACTGTCCTAGGATACTTCTCTTGAGGCTTTGGGGAAACAACTTCTTTTGTGAAACTTGCATACCCATTCCAGTTTTGTCACCAAAGATTTTAATCACCAGAGCCTAATCTCCTCTCTCCCAGATAAAAATAATATGACAGGCTCAAGGGGTATGCTTTGGTGGTCAAGGGATGACACTTTGGTTTTCACTGTATTCACGGTGATATTTACAGGACACTCGTTATTAGAGGAGCTACCGAACTGTCTTCATGACTTAGGGTTTGGCCAGAGGTTTAAAGAGATAGGTGAAAAATAAACAATAGTACCTTGACACTGTAAACTAGTCTTTAATAGAGTCATGACCTGAAGACTGATGGAGAGAAAGAAACTTCCAGGGAAGAGAGTGAGCTAAATCACATAGAACTAAACAAGGATCGTTGGTGAAATGTGGGGCAGTGTAAACAACAGAGCGGATCGCTGCTCTTTGTGGCCAGACCCACAGCAACGGCCGGGGGCGA
GTCAGACAACTGGCAAGTGAATTCAAGTATTGAAACAGCCGCGCTCTGGGTTTCGCTGTGGTTGGCGGAGCCCATGGCAAGGACAGTGCTGAGGCTGCCCTGTTGTGATAGTGCCTTTCTTGTAGCAAGTACTCGGTGAATAATTTGTTCAGTTAGGCTTTTCTGGACCATTACCCCCAGTCTTCTGAGGAGGTCTGAAGGGATAGTGTTCACTTAGGATGAAGGGACAGGATATTGCTCCTGGGATGATGTGATTTGATGATATTTGCACTAGATTCTAAACTCTACTTTAAACTGGAGCAACTGAATAGAGAAAAACCAAGGATGGTTCAATGTTAAAAGAAACCAAAAGCAGTATTTTCTAACTGATGCCTCTTCTTTTTCTTCTCCTTACTCTTGTTCTTCTCCTTCTTCTTCTTTTCCCTGGAAGGGAACTTCATACCTGCTGATTACCAAGCTCAACTCGAACCAATTCTTTTCCTTCCTATTTTTTCCCCACACTGAACCTTCAGTGTGAATTCGCCATCAGGTAGGCATGGTTAGTGTAAAGGGCGTCTGTCATTACAACTTTGCACCCGTCCTCTGCGTCATCAAGGGCATGAGGCAGTGGGGGGGGGGGGGGACGGCGAGGCTCCTCCAGAGCCACCAGCCCTTAGGACGGGTGAAAAGCAGAGATTTCCTATGGAGAGCTGAGCTGACACATATTTGTCCAGAGGACATTGGAGCCTGTAATTAATCCCAACGAATGCTTAGAAAGAGAAGGAAACCCACGTGTTGAAGAAAAACAAGGAAGGTGGTGCCCACAGTTTGCCTGTTTCCCCTCTCTCTCCTCTTTCCCACCTCACCCCCCTGTCCTCTCTCAGAATTGTATTTCATCTTTGTATTTATGTTACCAGAAGAATTATTTGGTTCCTTGGTTTTTCTCTTTATCAGTGGTCTGGGAACTCTTCCAAAATCAGAAACAGGTACCATCAGTGGCTCCCCTGTAGCCTACCAGTTTCTCAAATGCTGTCCACCTGGTCTTGACCCAGTCAACTAAGATAACTCGGAAGCTTTGGCTGGCTCAACCACCTGTCACTTTATTTTCATTTTGTTTTCATTTCCATTTGAATTCTGAGTGATCTTATGGGAAGGTGGAAATCACAGAAAAGGTTTAGAGGCTGCAATTCTAGGGCATAGCTTGTCAAGAGTTTGTATTATCCAAAATATAGCTTTCTACGCCTGTTTTTCTGTTGAATCTGTTGCCCTGATTATAATTTCTATTATATTTGCGGTTATTTTTATAAGAATAGAGTCCATTTGCTATGTCTATTTGAGTACTTTTTTTCTATTTTCCCCACATGGATGCAGTACCAACCTGTTAATGAAATATCTTTTTATTATATTATTAATATGTAATTCTACTGTAGACCAAAAATATAAAAACAAATTTGCTCATTTTAAAGATATAAAGAACTAGTGAGTTAAAGATGAAGAGTTGAAGGAAAGACAGAAGAGCAGTGGTTAACTATGTTGAGTTAGAAATCTAAGAGTAGCCTTACCTATTTTTAACCAGTGCTTGCCAGTCATACCATAGTTGGGATTATATAGTCTTGGCTCCTTCATGCTTATGTTCTATAATTTTTGTTTGTCTGTTTTTCTTTGATGTAATTGAGGTTGCACATCATGCTATTTTTGGCGATGCCTGATTTTATTATATTGTACTTTTATCAGTCATTTCCTTTAGAAGGATGGGGGGAAAAGTTTTATTTCTTTTTTTTTTTAATTTAAAATTTGTTTAATGCACTGGAAATAAAATTGGACACATTTCACTGTTCAAAAATTCAAAACCAAAACAGAACAAAAACCACAAAGAAAAAACCAGCAACCAAATAAGCAACAGAAAAAAAAAAAAGCTATGAAAAAACCACCTATTCCTACCGAATACACATATAAAATCTATCTCACACAAAAGAGAAATATCATCAAACAAGAAATATAAGTCCTAGAAGTTACAATGC
TGGAAAGAAGACAGCTGGGCTCAGTGGGGATGGGAGACATGGGGCATTCCTTTGAGATCTGAGATCTCGCCCTGGTTCCAGTGACTGCCAAAGGGGTTAAATGTGGGAGAGGCAACTATGGAGGAAATAAACCCAGCATTTCTGGAACTATCACCGTTTTATCCTATGCTTGGGCTCCATTGGGGGTGCGGGGGGAAGATGTGCTATGGTTGAGAAGGTGGCTTGTATGGAGGTATGGGTACAGTCCACAGCCGCACGCAGTTCAGGTCTCTGTCCACCAACTACCTCACGTGTTTCTTTTCTCCGTGAGGATTTCAGCGGACGGGCCCGAAACATGGGAGAGACCGTTCATGACTCGTTAGAACATCAGCCAATGCTAAAGAACCTCTTGACTGCAAGCTCACCCCCTTCTTCAGCATTCCCGGTACCAGCAGAGCCAGTCAACCCGTACAAACGCACAGTGAGAGGGAGACAGAATTTGCGTAGCGGAGCGGCTGTATCATTTGTTTAACGTTTGCTGGGTTTTTCTGGTTTGGTTCTGTTTTGGAGTCGGGGTGGGAGTGGATGTAAGTACACAATCCTAATACAGTAATTGTTTTGCATCTTCCATGTTTTATGCAAAAACAGACATTTAAATCAATAACTAATTGTGCCCTAGACTGAAAGTTAATGTTTAGGAGAGGAAAAAAATTGTTGGAATTTTTTCTACATTTTTTTGTGAAGAATCTTTTTTGGAAAGGAAGGATACATATTTTTGTTGTGTAATATTTTCTATTTTTGAATGCATTTTATTGGTACAAGACTGTTTTTTTGGTGAAGACATTATTTAAAAAAAAAAAGAAAAAAACTAATCGAAAAGTTTGCCCTTAAGGATATGCTGCAGTTTTGAGGTTAAAAAAAAAAAAATAACTGATTCAAGATGCGTGTTAAAAGTTGGGATTATATTGTTGTTTTTTGTAATTGTTACAAGAAGAAGTTTGTACCCACTGCTGTTTATTTTGTTTCAGATGAGTAAGTAAAGGGATTGTTCTTGTTTTATTCTTTTTTTAGAGAAAAAAAGCTATTTATGAAATGTCAAAAACACTGGACTGTGAGTTTAAGTGTGGAAGCATTTTACCACCCTGTGTCTTCGACCAATTATGGGAAACCCCTTTTCTCTTCCCCCCCGCCTTAGCCTTGCCAAATGAGAAAAAAATAGAACAGCTCTCAGATGATGCACACCACTGAAGCCCTGCTTTAATTTTTACGGTTCAAAAAGTCAGAAAACCAAAGTTCAATTTGTTTCTGAAACCCCACTGTCCGTGGCCCTTTTTTGTAGGACACAGCCAGTCGGCTCTGCCTCTCCGTCTTGGATCATTGCCTTCTTCAGGACAGGGGGCCAGCTGTGACACAAAGAGAAGCAGAAAGGTGGTGAGCCTGAGGGTTGAGGTCTCCTGGAGCAGATGTGAGTGGGACTTCAGCCTCTCAGCGGGCAACCAGGCTTCCCCGGCCTGTGGCCAGGCTGCCCCACTGCCGGAGGAGGAGAGAGGCTGCCCACGCCTCCACCCTCCGCTTCTAAGGCCCTTCTGTTACCGTCGCTCTCCAGAATGGCTTTGCCTTTCTCAGCAGCCCGCATTCCACGGACGGGCTGGGGGGAGGAAGGATCCAGTTGAAAGAAATGGGGAAGGTAGGACAAGGGACCCTCTAGCATGAGGGATCTTGTCCGCCTCAGCTTTGATTCTGTGGATCGTCCACCCATCTGCTCACTGTGAAGACGGAGAGGCAGAGTGCCCTACGGCTGTTCAATAGCTTTCTGTATTTTTTCAACATTGAAAAAATAATTTTTAAAAACTGTGATTTTTTTTTTAAATCATTTGGCTGGAGGGAAGGGAAAAGGGAAACACCAAAAGCTGTAACATGATTAACTGGAGATATTTAACTGGGGGCACTTTCTAGACCAAGACAAACGAATTCCGTTCTGGACCCTAAAGCAGCCAAATCTTGAGACTGTCAATGACAGA
AAGCTGAAGAGAGGCCTCCATTTCCTCCTTTCTCCTTTCTTCTCTCTGTCTCAAAATTCTCTCTCGTTCTCCTTTTCCAACTTCCCTTGGACTACTGACCCAATGGCCCTTGGACTCCCATTTCATGCGTGTGTGCACACGTGCGCGCACACACACACACTTGCAAAATACCATTTTTCTTAAGGATTGTGGGACCGAATAAAATCATGTGCCTTCATTTTTTCCTTTTATAGTTAGATGAACCTCTTCCTTTTTACAGTGCTTAAAAAAAATAGGGGAGGTTGAAGTGTTAGTGGGACTTGGGCATCGCTTGCGAAGTAATTTTCATTTAACACATTCCCCCTAAATATGAACACAGACACGTCAGCCCCTTCAGGATGCTCTTTGGCCATTTAGAGCATTACCTAACCAGATATGTGACAGCCTGAACCCATTTGACTTTAGAGCAATTCCTGACAATTCTCTTTCATACACTTCTTTCATTTTTACCACAAATGAGGTGAGCAATGGCAAGCAGCCTTGTTCTCCGGATCTGGTGCTTTTGCGTGTGGCATGGGGTGGGCCTGGGGGTGGGGGAGTGGGTGTGTTTCGATAAAGGGTGCATTCCTATAGATCTCTGGTGCTGAAGGGCCTCGAGTTCCTTCCAGAGACTGCATTTGACACACTTTAAGTACACACAAGTGAATGGTATCACATGCAATATTTTAATGGAGCAATGGGAGAGGCTCTTTGAAACGGGGTTTTGCATCTTTTTGTAACATTTTGATTTCTCTGGTGCCTTATTCCTACTTGATGCTGGCACTCACATACCCACAGGGAACGGACACAGAAGTCAGCCTGGGGAGTGGGGACCCTCGAGCAGAGCGATGCTCGAGTGTGTGGGCGCGGGGGGCGTTGGGAGGTTGGTGTCAGTTGGCTGGGAAGGGACTAGATGGCATCTCTTAGCCGAAGCCAAGCAGGAACTGCACAAACCCACACAAAGTGAACAATTCCGACCTGCAAACACACCGCAAACCCACCCTTCCTCATCTGAGCTTTCCTTCCTTCTTCCTCTTTGATCTCCGCCTTCTCGCAAAGGTGCTGCTGCTGCTGCTGCTAGGTGCCCGGAGTCCAGAATGCCCAGTAATCACTCAGGCACAAGCCTGGCACTGCCACGTCAGCCCCCGGCACGACCAAACCCAGGTTTCTCTTGCTCGGGGCTGAGAACTGTCAGATTTTTCTCATCAAAAATGTTTTCCAAGGAATCAGTGGATTACAGTCATTCTGCATTGAAAATGCACTTTAAAAAATAAATAAAAGCTCCAGACTGTTTAAAATGTACAGAGGGAGCAGGGGAAAGATAAACATGTGCTAGTGTCTGAACCCAGTTCAGTTTATCTCCAGTTGAAACAATATACACTATATTATGTATAAATGTATACACACTTCCTATATATATCCACATATATATAGTGTATATATTATACATGTATAGGTGTGTATATGTGCATATATACACACATGCACATAACAAATCCAGATGCTCATTACAGATGCTACACAAACAGCAGCAGAGGAAACAAGGTTGGACTCTTGCAACAGATCACAAAAAATAAAAACAGCCACTTGCAGTGATTTTGGTTACTTCTGTATGTTCACAA\n>XM_008328421.3 PREDICTED: Cynoglossus semilaevis SLAIN motif family member 1 (slain1), mRNA 
\nAGTGTTTTTTCCGTGTTTTCACCCAGAATATTCTTTTTAAATTGTCTCAGTACCATATAAATGTTCTTTTGTAAGGTTTTTACAAATACTTTATCACTGTATATATTATGGTTCAACGAGTGGTCGCTCAAATCTTAAAGTAGTCTTTTTTTTGTCTATCTCAAAGACAAATCTCATTTTAACGTCACTTTTACGAACATTATATTCATAATAATATTAATGTTGTGGCTGAATACAAAGACCAGCCTTTAAATGGTCGACCAGTACACTGGATTATTTTTGGTGTTTTTCTCCAAAAGAGGAGGTGCACACAGTCTTCTTTGTCACTTCGGTACGCGTGTGCATTTGGAGCGTAAACACTTCCTCAGCAGAGGAATGATGGGAAGTTCGGCTGACCAATCAGAGAGAGGCTGAGCAGTCACACCAGCAGCAGCAGCGGCGGCAGCATCAGTGTGTGAGTGTGTGTTAGGGTGAGTGTGTGTCGGTGAGGGGGGGGTAAAATCTGGACAGCCGCTCTGTTGTTGTGAATAGTTCCCTCTGCAGGCGGACACACACAGGGCCGCCGTGCGTCCTCCTCTGTTTGTGAGCCTCCCGTCGTCTCCATGTGCTTGTTACCTGATGGAAGCGGAGGTGCTGAGTCCCAGGCCGATGATGGCAGATGTCAACGGCAACAATAAGATGACCAACGCGGAGTTGGAGGTGCTGAAGCTGCAGGAGCTGGTGCGAAAATTGGAGAAGCAAAATGAACAATTGCGCACCAGGGCCAACGCTGTAAACAATTGCTCTTCCGGCGGCCCTCACCCTCACCCTCTCCCTCACCATCTCCACAATCAGCAGCAGCAGCATCTCCATCACATACATCCAGATGATGACTGTCTGAGTGGCACTTTCCCCAGTAAATATAACATATCCAGTCCTATTCGGTCCCTTTCGTCTGCGCTCGAAACCCGGAGTCCGTCAGAGGAGCCGTTCTCTTATTTCCAGCCGAGCTCCGCGTCTCCTGATGCCGCTGAGGAGCAGAGAGGAGCTGCTGCTGTAGGAGCTGCGGACACCACTGTTCTGGATGAGGTTGATATTCTGGACCTGAACGTCGTGCTCCCAGTTGGAGAACCTGATAGCTGGTTGTACGTGAGTAACAAATCCAAACAGCGCTGTGAGAGCATCCTCACTCCTCTGCAGTGGTGCAGGAAGGTTCTGGACCACCCAGGACCAGAGGTGGAGCTGGCCAGGATGACCCTCGGTCACAGACTGGACCAAGCTAAGCGTAGGCGAGGACTCTCCTCCATCCGTCCCTTCAGCTGTATTGAAGGTCTCTCCACCCTCAGCTGTCCTGTCCTGCCTTACACTAAATCTGCTTCACTAACAGAGTCTCCAGCTCCGGTGGCATCACCAGATCAGCCCAGTGCTCCAATCAGAACCAGCAACAGTCTGAGTGAGAGAGCTTCAACCTTCCTATCCAACACCGCCCTCCACAGCTCTGCTCGCAGACATGCAGCCCTCAGCCCTCAGTCTTCCCTGGACAGTGACGCTGGTGTGTCAGACCTGGACAACGAAACCATCTCTATGGGCTACAAACTGCAGGACATGACAGATGTGGAGGTCATGGCTCGACTTCAGGAGGAGAGTCTCAGGCAGGAGTACAATGCCTCTACCTCAAACACAGCCAGCCGTCGCAGCTCCACTCATCTCCAGGCTTTCNNCCGACATTCCCTGAGACGCAGTGCATTAGATCTGGAGGAAGAAGAGGAGGAGGATGAGGGGTACGACCAGCTCCCCCCTCCTCAGCCTGAACTCTTTCCAGCGGGCTCCATGCAGAGGACAGGACTGTCCCACTCTCACACCTTCTCCAGTATCAGAGACTGTAGACGCAGCTTGACCACCTCTCAGTTTTCACTCAGTGGACTCTCCCAGTTCTCTGGTCTCCTCACAGAATCACAGGCTTCTTACAGAAACAGCACAGACAAGCTACGGAAGAGCATGCCCAACCTGCTCCGAACT
CCCAGCATGCCCAGTGTTCCCAGTATGCCCTGCCTGGTTTCCCCTGTCAACCCACCCTCCCACGGCCCCTCCTCCCTGCCAACAATACCCTCCCTCCGCAGCAGCCAGAGCTTTGACTCCTCCAGTGGACTTGCACGACTCCAGTCCTCCTCCATTCCTTCTCCAGGAAGCCTCAGCCAGCGAGTCCACAGCGTGACCAACTTCTCTACCGCACCTCGTCACCCTCTGAAAGCAACAGCCTATGTGAGCCCCACGGTGCAGCAGGGTCCCACCAACACTTCTCTGTCCACTTCCACCAGCCTACACTCCATCCCCAGCAGCACTGCACTGCCTCAGCCCCTGAAACCCAGCAGCATTTTGGCTCCGCAGACATTAAAGTCCAACTCTAACCAGCAGCCCTGTGTCCCTCGCAGCTCCCTCCCTCGTCCTGCCTCCTTCGTGGGAACAGGTGGAGCTCTACGTCCAAGCAAACTCACTCCACCAACACGCAGTTTGCTGACCCCTCCAAAGAGCCTGTCTACACTGAGTGCCCTGAGGGACGGCAGCTGGAAAGATGGCTGCTACTAAGTCTTCAGGTTACATATGTAGCCCTGGTTCACTAAGTGGCACGAGTGAGAAATAAATGCTATGAGAGAACCAAATTTAAAGAAGTTCCAGTGGTGCACAGGGTAATGCTGCACAGCAGGAGAGAGAGAGAGTGACTGGTACTGTTTCTTCAAAGCACTTCTTGTTGATTAAGGACTAAGCAAAGACTGTGAAGAGTATGGTTCCAGCAGGCTGGATCTGTACCGACTATCTGCTGAAGAGACCTGGCAATACGTATTCTGTTAATAAGTTGTTTGATGTGAACTGAATCTTATTTGATGTGTATTTTTATTCATTTATAAAAGTTTAATTTGAAATTAAAACTTTTTTCCAGTTGAAATCTTACCATTAATAATCCACAGCTTTTGCACGCGCCTCAATCAGTTTCAATGCAATTTAATTTGACAACATTTATTTTCCCGCCATTTCAGAGCATCTTGTCAGATTTTAAGTCATTTCCTGTGCCTGTGAATTTGCAGTAAACTCCTGTCACTTTGGTTGCTGGACCTCATAGCACTTTTGTTGGAGGATTATAAACAATGTATTAAGAGGAAAAATTATCAGCTTGACTTTAAATTTAGGTAAGATATGACTTAAGTTCAAGTAAGTGTGATTTATAAGTGTGTGGCTTATTTTTCTTTTTCTTTTTATTAATGTTTACAAAAAAATGCTGTGATTTTCAATGTTCTTTATTAATAACATAATCGCTGCAATCATATTGCACACTGAGCCCAGAGGCTCTTGGTGGATGATAAGAAAATAAAGAGGAGGTGAATTTTTAACCAAATAAACACCTTTAAAAA\n>XM_048024951.1 Epithele typhae kinase-like protein (BXZ73DRAFT_88453), partial mRNA 
\nATGTTTGACGACAGCGGACCCCCGTCCCCCTCAAACAACCCCCTAGCTCTCGCCCCCGTCGATCACGAATGGCAGCCCATCCTCCATGTCTCTAACCAAACCGTAGCTCGCAACGCTCGATGTCCCTATTGTCACCGTGCTTTTTCTCCCACGCATTCGCGAGGTTTCCACCCCCACGACCAAGACCTGGACGCGGAATACGAGGGGGATGACATAGAGAGGGCAAGTAACCGGGCAGCCAACTACTTCCAGCTCCTCGAGATTGCGAACGAATCCTCGAGACCACCTAGTCCCACGCAAGATTCCTCGCGTAGATCGTCGCCACAGCCGAATGCATTCCGTGCAGAGAACATGGCCGAGGGATACTTTAAGGCCTTCTTCCAGGAGGTGTGTAGGCTCGGCATGGGCGCAAACGGCAGCGTCTACTTGTGTCAGCATGTCCTGGATGAGAACCCTCTGGGGTTGTTTGCCGTCAAGAAGGTTGCTGTTGGACAGTCACATTCTTACCTCTTGAACACACTCAAAGAGGTCCGACTTCTTGAGAAACTTCACCATCCAAACATCGTCACGTATCATCACGCTTGGCTCGAGTCGTCACAGTTCTCGTCCTTTGGACCACGGATTCCAACCTTGCACATCCTTATGCAGTGGGCTGAGGGCGGAAGTCTCGACGACCTCATCGACACGCGCCTTGGACGCCGTGCCCCGAACCTTCCTCACATTAGGACCACCGCTGATGGATCCACTGAACAATATACCAGTCCCCAGCCGACTTCTCCGATAGAGCAAGAAGCCAGCCAACCATACTCACGGAATGCCCGTATACGGGCCTTCAGAGCATTACAGCGAGCCCCTCCTGAAGAACGGGAACGATTACGTCACGAAATGGGTCTCAATGATAGCGGGCAAGCCAAGTCGACGGTAAACCTGAAGCCGGTGCATCTGCTCAGCGCAGAAGAGATACATGAACTATTTAAGGATGTTGTGGGAGGACTCGCGTTCTTACATGAACGATCTATTCTGCACTTAGACCTTAAACCAGGAAACGTTCTGTTGACTTGGGACGAGGGAAAGCTTGTGCCACGAGCGATGTTGTCCGACTTCGGCACTCACAAGACATGCAATACCGGAACCTTGGAGTATTCTGCACCTGAGTCTCTGCCCGAGCCCTCGACAGGGCGGCTTCTCCAGGTGGACTCGAAGGCAGACATGTGGTCTCTCGGCATGATCTTGCACAAGTTGCTATTCTTCCGTCTTCCCTTCCGGCACACCTCCGACAATGATGATCCTAGTCGGCCAAAGGACGGCCAAGAGTATTCGGATGAGCTCGAGGCTGAGATCCTCGCATACAAGGGGTTCAAGTCTTCCGCTTCGCATATGAACACATTCGAGCCCAGACGAATACCCAAAGCTTACCTCCTGTTGCTGGAGACTCTTCTGAACGTCAAACCTTCCGGACGACCTACTTCAGACCGCGTGCTCAGCGTTATCCAAGAGGGTGGGCTTCGCCCGACGAGCCGTCCTCCGCGTAGAAATGGGCAGGCCCCTCCGGGTACACTTGCGCTAGCACGTCCAAGCGCGGCTCTCAACCCAAACCGCCTTCGAGTCAGCCCCGACCGGACCCGTCGGTCGCGCTCGCCGTCGCGCGTCCCTTCCGCCGACAGTCGCTTTGAAGCCAGCTCCGCCAATGTCGAAGAAATCCAAGAACACGACGGCGATTCGGAAGCTCCGACGGACGAGAAGGACAGGCTCCTGCCCATCCCGAAGGGCTACGCATGGACTCTGCCTTGCATCGGCAGCCTGCGCATTCCCCCCGCACTCGCCGCTCAGGCGCAAGCCATCCACCGCTGGCAGCGGCGTGCACGAATACCTGCGCTCGGATGGCGCACGCTGAAGTCCTCTATTCTTGTTGCCAAGGTCGTTTCCCTCACAGGGCCGCACCTGCATCCTAGCACGAGCGTCCATCCCATTCTAGCGGGAGCAGCGCTAATGCTTGCG
GTGGTGGATACGTGGTTCGAGAGTATGGAGGCAACACTGGCGTTTGGTGCAGCGCATTTGGCGGTGCTTGCCCTTGGACAATTCACGTCGTGA\n>XM_020597508.1 PREDICTED: Monopterus albus apolipoprotein Eb-like (LOC109958668), mRNA \nATTTTATCTATGATATTCCAGGTGTGTGATTTCTGGTTATGATGAGAGTGTTTGCAGTAATCCTTGCACTGGCAGTCCTCTCAGGCTGCCATGCAAGAAGTGTGCCTCAGGATGATGGGAGTGACTTTGAAGATACCGTCCAGAAGTTCAAGGATTATTTAACATATCTGAACTCCAAGGTCGATGAGGTGGTGAAAGACATCCAGAGCTCCGAGACCGTCAGAGAACTGGACACCCTGGTCCAGGACAGCATGTCTGAGCTGGCCATGTACAGGGACGACCTGCAGAACAAGCTGGCTCCCTATGCCCAGGAAACTGCAGAGCGCCTGGGCAAAGACCTGCAACTGCTGGCTGGCAGACTCCACAACCAGATGGCTGAGACCCGGGAGCAGCTGGTGCAGTACACCCAGGAGGCGCAGACCATGATGGAGCAGGATGCTGATGACAGCAAGCTCCGGGTCTCCACCTACAGCCAAAAGCTAAACAAACGCCTCAACAAGGACATGGAGGAGATAAAGAAGCATGTTTCTGAGTACCTTGAGGAGCTTCAATCCCGGACCTCAGACAACATGGAGGACGCGAAGTCTCGTTTGCAACCTTATTTTGCTCAGGTGCAAGACAACGCCCAGGCGAAGGTCACCACCCTGAGTGATCTGCTGACGAAGCAGGTAGAGAACATGAAGGAGGAGATTCAGGGGGTGGCTGCGGGCATCAAGGACCAAATTCAGAAAACTGCTGAGGACATGAAGGAACAATTTCTTGAAACTGCTCAGAATATGCAATTCAGCCTGGGGGAGAAGGTGGAGGAGATGCGCATCTGGTTTCAGCCTCTGGTCTCCACGATCAGGGACAACATGTGA\n>XM_009083577.1 PREDICTED: Acanthisitta chloris achaete-scute family bHLH transcription factor 3 (ASCL3), mRNA \nATGCAGAACCTGATGGATGACAAAAGCTACTGTAACCTCATCTGTGCTGAGACTCAGCGTGTGCAGGTGGCCAGGCCTTTCTGTGCTGACCCACTGGTCACCTTTCACGTGTACCCAGAAACCCCAAACCAGGCCACTTGCTCTGAAGATTTCTCATTCCTTCCTTTCATGTCTGAGCACCTCCTCGCAAAGAACTTCTACAGTGAGCCCTGCAGCTTTCCTTACCAAATGCCCCATGCCAGTTTCCACAGAAATGACTACTCCTATGGGCCAGCTTTCATCAGAAAGAGGAATGAGAGGGAGAGGCAGAGAGTTAAGTGTGTCAATGAAGGCTATGCTAAGCTGAGGCATCACCTGCCGAAGGAATACTTAGAGAAACGGCTCAGCAAAGTAGAGACACTCCGTGCTGCAATAAAATACATTAGGTACCTACAGTCTGTTCTGTACAGTGATTCTGTGATGGCAGGAAAAAGTGTTGTGGAGCCAAGCCAAGCACCCAAAGCAATTAACAAACAAAACCAGTTTTTGAAGACCATCTAA\n>XM_017239098.2 PREDICTED: Drosophila bipectinata uncharacterized LOC108123788 (LOC108123788), mRNA 
\nCGCCAAAACCAAAACAAAAGCAAAAAACAAATAGAAATACAGCCAAAAAATAAAATATAAGAAAAAAATTAAATAAATGGCTACCGAAGTGGAGCCCGCAAATACGGCGGACAAGTTTTCGGCCAATGCCGAGGAGCTGGAGAGCTATTATCTGATGCTGGAAAACGGCAGCATTCCGGAATTGCAGTGGCAGTTTCCCGGACGGAGACCGCCATCTCCGGACGTTGGCGGCGGCGTCGGATCTGGCGCCACCAACAAGGAACTGGAGCAGACTGTTGGCGAACCTATAGAACAGGAGCCCCAAAAGGCTCAGAACGACTTTGATTTCAGCGACGATGTGGCGCCCACACAGATGCGAGTCAGAAGCCAGACATCTACGCCCAAGTCGGCCAAGAAGAAGACGGCCAACTTTGCTGGCGTTATGGAAACGCTGAAGAAGAAGAATGCCGAGAGCTCCTAGCATATGCTGAAGTTCTGATGTAATCCTAGCAAGGGTACATGGGAGTATATACGATTCTAGGCGAAGTTTCACCTTAAATAGGAAGGGGAATTTTCAAATTTTTAAAGAAATATTTAAAGAAAGATTTAAATATTATTCTATAAAATCAAAGGTCCGATTTTTGAGGGCTTTTTGATGAAGATTATGTTTTAAAGTTTTAAAGTAGATGTTAGTTGTCAAGTTAGGACTATTAACAAATTCTATAATCATTACATTTACAATTTTAAATTTTAAACAAAATAATAGCTAAGTTGTGCAATTTATAATTCTTTTATAAGATTTTGATTGAAATTATAAAACCAAAAATTTAA\n>XM_021934158.2 PREDICTED: Papio anubis ZXD family zinc finger C (ZXDC), transcript variant X4, mRNA \nTCCGAGCCGGACTCTGCGACGGGTCTTGGCGCGGATCGCGTCCCGGGGCAGTGCACGCACACTTGGGCGGGGCGCGGGCCGCGCTGCGTCCGAAGCGGGTCCGACGCCGTCGCTGGGCCCAAGATGGACCTCCCGGCGCTGCTCCCCGCCCCGACCGCGCGCGGAGGGCAACATGGCGGCGGCCCCGGCCCGCTCCGCCGAGCCCCAGCGCCGCCCGGCCCGAGCCCCGCGCGCCGCCGCCTGCTATTGGTGCGGGGCCCCGAAGATGGCGGGCCCGGGGCGCGGCCCGAGGAGGCCTCCGGGCCGAGCCCGCCGCCCGCCGAGGACGACAGCGACGGCGACTCGTTCTTGGTGCTGCTGGAAGTGCCCCACGGCGGCGCCGCCGCCGAGGCTGCCGGATCACAGGAGGCCGAGCCTGGCTCCCGTGCCAACCCGGCGAGCCGCCCGGAGCAGGGCCCCAGCGGCCCGGCAGTCGCCGCCGGCCCTGGCGTAGCCCCGGCGGGCGCCGTCACCATCAGCAGCCAGGATCTGCTGGTGCGCCTCGACCGCGGCGTCCTCGCGCTGTCTGCGCCGCCCGGCCCCGCAGGCGCGGGCACCGCCGCGCCCCGTCGCGCGCCCCAGGCCTCCGGCCCCAGCACGCCCAGCTACCGCTGCCCCGAGCCGCAGTGCGCGCTGGCCTTCGCCAAGAAGCACCAGCTCAAGGTGCACCTGCTCACGCACGGCGGCGGTCAAGGCCGGCGGCCCTTCAAGTGCCCGCTGGAGGGCTGCGGCTGGGCCTTCACAACGTCCTACAAGCTTAAGCGGCACCTGCAGTCGCACGACAAGCTGCGGCCCTTCGGCTGTCCGGTGGGCGGCTGTGGCAAGAAGTTCACTACGGTCTATAACCTCAAGGCGCACATGAAGGGCCACGAGCAGGAGAGCCTGTTCAAGTGCGAGGTGTGCGCCGAGCGCTTCCCCACGCACGCCAAGCTCAGCTCCCACCAGCGCAGCCACTTCGAGCCCGAGCGCCCTTACAAGTGTGACTTTCCCGGCTGTGAGAAGACATTTATCACGGTGAGTGCCCTGTTTTCCCATAACCGAGCC
CACTTCAGGGAACAAGAGCTCTTTTCCTGCTCCTTTCCTGGGTGCAGCAAGCAGTATGATAAAGCCTGTCGGCTGAAAATTCACCTGCGGAGCCATACAGGTGAAAGACCATTTATTTGTGACTCTGACAGTTGTGGCTGGACCTTCACCAGCATGTCCAAACTTCTAAGGCACAGAAGGAAACATGATGATGACCGGAGGTTTACCTGCCCTGTCGAAGGCTGTGGGAAATCGTTCACGAGAGCAGAGCATCTGAAAGGCCACAGCATAACCCACCTAGGCACAAAGCCATTCGAGTGTCCTGTGGAAGGATGTTGCGCAAGGTTCTCCGCTCGTAGCAGTCTGTACATTCACTCTAAGAAACACGTGCAGGATGTGGGTGCTCCGAAAAGCCGTTGCCCGGTCTCTACCTGCAACAGACTCTTCACCTCCAAGCACAGCATGAAGGCACACATGGTCAGACAGCACAGCCGGCGCCAAGATCTCTTACCTCAGCTAGAAGCTCCGAGTTCTCTTACTCCTAGCAGTGAACTCAGCAGCCCAGGCCAAAGCGAGCTCACTAACATGGATCTTGCTGCGCTCTTCTCTGACACACCTGCCAATGCTAGTGGTTCTGCAGGTGGGTCGGACGAGGCTCTGAACTCCGGAATCCTGACTATTGACGTCACTTCTGTGAGCTCCTCTCTGGGAGGGAACCTCCCTGCTAGTAATAGCTCCCTAGGGCCAATGGAACCCCTGGTACTGGTGGCCCACAGTGATATTCCCCCGAGCCTGGACAGCCCTCTGGTTCTCGGGACAGCAGCCACGGTTCTGCAGCAGAGCAGCTTCAGTGTGGATGACGTGCAGACTGTGAGTGCAGGAGCATTAGGCTGTCTGGTGGCTCTGCCCATGAAGAACTTGAGTGACGACCCACTGGCTTTGACCTCCAATAGTAACTTAGCAGCACACATCACCACACCGACCTCTTCAAGCACCCCCCAAGAAAATGCCAGTGTCCCGGAACTGCTGGCTCCAATCAAGGTGGAGCCGGACTCGCCTTCTCGCCCAGGAGCAGTTGGGCAGCAGGAAGGAAGCCATGGGCTGCCCCAGTCCACGTTGTCCAGCCCAGCAGAGCAGCACGGTGCCCAGGACACAGAGCTCAGTGCAGGCACTGGCAACTTCTATTTGCTGTGTGGCGTTGGGCTACCTCGCTTCTCTGAGTACAAATGGTGTGTGGTGAATGGGTCCCAGGAAAGTGGGGGCTCAGCAAGAACTGATTACCGAGCCATTCAACTAGCCAAGGAAAAAAAGCAGAGAGGAGCGGGGAGCAATGCAGGATGACCCCTCCGGCGAAGGTGTCCTGCCCTCAACCCGCGGCCCAGCCGCCTTCCTCCCCTTCCTCACTGTGGACCTGCCCGTCTACGTCCTCCAG\n>HE815016.2 Uncultured endophytic bacterium partial 16S rRNA gene, clone Dkk4A12.M13-F 
\nAACCGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGGGCACTAGGTGTGGGAGGTGTCGACTCCTCCCGTGCCGTCGCTAACGCACTAAGTGCCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCAGCGGAGCATGTGGTTTAATTCGACGCAACGCGAAGGACCTTACCTGGGCTTGACATGTAGGTGACCGCCATAGAAATATGGCCTTCCTTCGGGACACCTTCACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCCGTTCCATGTTGCCATCATTCAGTTGGGGACTCATGGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGCCCCTTATGTCCAGGGCTACACACGTGCTACATTGGCGCATACAAAGGGCAGCAATACCGTGAGGTGGAGCGAATCCCAGAAAGTGCGCCTCGGTTCGGATTGGAGGCTGAAACTCGCCTCCATGAAGGTGGAGTTGCTAGTAATCGCGGATCAGCAATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAAAGCAGGCAACACCCGAAGCCGGTGGCCTAACCTTTTGGAGGGAGCCGTCGAAGGTGGGGCTCGTGATTGGGGTGAAGTCGTAACAAGGTAACCGTA\n>JQ912969.1 Uncultured archaeon clone B22pf 16S ribosomal RNA gene, partial sequence \nTTCCGGTTGATCCTGCCAGAGGTCACTGCTATCGGGGTTCGATTAAGCCATGCGAGTCGAGGGGGTTCAGACCCTCGGCGGACTGCTCAGTAACACGTGGATAATCTGCCCTATGGTGGAGGATAACCCCGGGAAACTGGGGATAATACTCCACAAGTCAGGAGTACTGGAATGTCTCCTAACTGAAAGTTGCGGCGCCATAGGATGAATCTGCGGCCGATTAGGTAGTTGTTGGGGTAACGGCCCAACAAGCCCGTAATCGGTACGGGTTGTGGGAGCAAGAGCCCGGAGATGGAATCTGAGACACGATTCCAGGCCCTACGGGGCGCAGCAGGCGCGAAAACTTTACAATGCAGGAAACTGTGATAAGGGAACCCCGAGTGCCCGTAAACGCGGGCTGTCCCGGTGTTTAAAACACATCGGAAGAAAGGGCCGGGCAAGACCGGTGCCAGCCGCCGCGGTAATACCGGCGGCTCGAGTGGTGACCACTTTTATTGGGCTTAAAGCGTTCGTAGCTTGATTTTTAAGTCTCTTGGGAAATCTCACGGCTTAACTGTGAGGCGTCTAAGAGATACTGGGAATCTAGGGACCGGGAGAGGTAAGAGGTACTTCAGGGGTAGAAGTGAAATTCTGTAATCCTTGA\n>XM_036570612.1 PREDICTED: Colossoma macropomum myosin-10 (LOC118808147), transcript variant X1, mRNA 
\nTCCGCTGGGTTCGGTTGAGTAGAAGCGGCTGCAGCAGCGCGGAGGGAGACGAGACTGAGTTTAATATATTTGAAGAACAAAAACTGGATTCTTGTAAAACTGGAAGGCCTGGATTAGAGGTTTATTTCAGCTGCTCACAGTCAAAGGTTTTGCCCTTCGTGGCCTGTCTGTAGTTCCTAATGCCGGAGATGGCTCAGCGGAGCGGTCAGGAGGACCCCGAGCGGTACCTCTTTGTGGACCGGGCGGTGGTCTACAACCCAGCCACCCAGGCTGACTGGACCGCCAAGAGGCTGGTGTGGGTTCCCTCGGAACGACACGGGTTTGAGGCGGCCAGCGTCCGCGAGGAGAGAGGAGAGGAGGTGGTGGTGGAGCTGGCGGAGAATGGCAAAAAGGCTCTGGTCAACAAAGACGACATCCAGAAGATGAACCCACCAAAGTTCAGCAAAGTGGAGGACATGGCGGAGCTGACCTGCCTGAACGAAGCCTCTGTACTGCACAACCTTAAGGACCGATACTACTCCGGCCTCATCTACACTTATTCCGGACTCTTCTGTGTGGTGATAAACCCATACAAAAACCTTCCCATTTACTCGGAGAACATCATTGAGATGTACAGAGGGAAGAAGAGGCACGAAATGCCGCCACACATCTACGCCATTTCCGAATCCGCCTACAGATGCATGCTTCAGGATCGTGAGGACCAGTCTATTCTGTGCACAGGTGAATCCGGAGCTGGAAAAACAGAAAACACCAAAAAAGTGATCCAGTACCTGGCACACGTTGCTTCCTCTCACAAAGGAAGGAAAGATCACAACATTCCACCAGAATCTCCTAAAGCAGTGAAGCTCCAGAGTGGACTCCTGGTCTATGGGGAGCTGGAGAGGCAGCTGCTGCAGGCTAACCCCATTCTGGAGTCCTTCGGAAACGCCAAGACGGTGAAAAATGACAACTCGTCTCGCTTCGGCAAGTTCATCCGCATCAACTTTGATGTCACGGGTTACATTGTGGGGGCCAACATCGAGACCTATCTGCTGGAGAAGTCCAGAGCGATCCGACAGGCCAAAGACGAGAGAACCTTCCACGTCTTCTACCAGCTGCTGGCTGGAGCAGGAGAACATCTGCGCTCCGATCTCCTCCTGGAGGGCTTCAATAACTACCGTTTCCTCTCCAACGGCAACATTCCTATTCCCGGCCAACAGGACAAGGACAACTTCCAGGAGACCATGGAGGCAATGCACATCATGAGCTTCTCACACGATGAGATTTTGTCGATGCTGAAGGTGGTATCAGCTGTGTTGCAGTTTGGAAACATTGTGTTCAAGAAGGAGAGAAATACAGACCAGGCCTCCATGCCTGAGAACACAGCTGCGCAAAAGCTCTGCCATCTGCTGGGGATGAGTGTGATGGAGTTCACCCGCGCCATTCTGACCCCCAGGATCAAAGTGGGCAGAGATTATGTCCAGAAAGCCCAGACGAAAGAGCAGGCTGATTTTGCAGTGGAAGCTCTGGCCAAAGCCACGTACGAGCGGCTCTTCCGCTGGCTCGTCCACCGCATCAACAAAGCTCTGGACCGGACCAAACGGCAGGGAGCGTCCTTCATCGGCATCCTTGACATCGCTGGCTTCGAGATCTTCCAGCTGAACTCGTTCGAGCAGCTATGCATCAACTACACCAACGAGAAGCTCCAGCAGCTCTTCAACCACACCATGTTCATCCTGGAGCAGGAGGAGTACCAGCGCGAGGGCATCGAGTGGAGCTTCATCGATTTCGGCCTCGACCTGCAGCCCTGCATCGACCTCATCGAGAGGCCGGCAAACCCTCCAGGTGTGCTGGCCCTGCTGGACGAGGAGTGCTGGTTCCCCAAAGCTACAGACAAAACGTTTGTGGATAAGCTGGTGCAGGAGCAGGGCTCGCACGCCAAGTTCCAGAAACCGCGGCAACTAAAGGACAAGGCTGACTTCTGCATCATCCACTACGCAGGCAGGGTGGATTATAAAG
CGGATGAATGGCTGATGAAGAACATGGATCCTCTGAACGATAACGTGGCCACTCTGCTCCATCAGTCCACTGACAAGTTTGTGGCCGAGCTGTGGAAGGATGTGGACCGCATCGTGGGTTTGGACCAGGTGGCCGGTATGAACGAAACGGCGTTTGGAGCGACGTACAAGACCAAGAAGGGTATGTTCCGGACGGTGGGACAGCTCTACAAGGAATCTCTGACCAAACTGATGGCCACTCTCCGGAACACCAACCCCAACTTTGTCCGCTGCATCATCCCCAACCACGAGAAGAGGGCTGGTAAACTGGAGCCCCATTTGGTTCTGGACCAGCTGAGGTGTAACGGGGTTCTGGAGGGAATCCGTATTTGCAGGCAGGGCTTCCCCAACCGCATCGTCTTCCAGGAGTTCAGACAGAGATATGAGATCCTCACCCCTAACGCCATCCCAAAGGGCTTCATGGATGGGAAGCAGGCCTGTGAGAGGATGATCCAGGCCCTGGAGCTGGACGCTAACCTGTACCGGATTGGTCAGAGTAAGATATTTTTCCGTACCGGAGTTTTGGCACATCTGGAAGAGGAGCGGGACCTGAAGATTACTGACATCATTATCTACTTCCAGGCCGTATGCCGAGGATACCTGGCACGCAAGGCGTTTGCTAAGAAGCAGCAGCAGCTGAGTGCTCTGAAGGTTCTCCAGAGGAACTGTGCGGCGTACCTGAAGCTGCGGCACTGGCAGTGGTGGAGACTTTTCACCAAGGTGAAGCCTCTGCTACAGGTGACCCGTCAAGAGGAGGAGATGCAGGCTAAAGATGAGGAGCTGGTGAAAGTGAAGGAGAGGCAGGTGAAGGTGGAGAACGAACTGGTGGAGATGGAGAGGAAACACCAGCAGCTCCTGGAGGAGAAAAACATCCTGGCGGAGCAGCTTCAGGCTGAGACAGAGCTGTTTGCAGAAGCTGAGGAGATGAGAGCTCGTCTCGTGGCTAAAAAGCAGGAGCTGGAGGAGATTCTGCATGACCTGGAGTCCCGAGTGGAGGAGGAGGAGGAGCGGAACCAGACGCTGCAGAACGAGAAGAAGAAGATGCAGTCACACATACAGGACCTCGAGGAGCAGCTGGATGAGGAAGAAGCCGCGAGGCAAAAGCTCCAGCTGGAGAAAGTGACCGCAGAGGCCAAAATAAAGAAAATGGAGGAAGATCTGCTGCTGCTGGAGGACCAAAACTCCAAATTCCTGAAGGAGAAGAAGCTGCTGGATGAGAGGATCGGCGAGATGACCTCTATGCTGGCCGAAGAAGAGGAGAAGGCCAAGAACCTCGGCAAAGTGAAAAACAAGCAAGAGATGATGATGGTGGACCTTGAAGAGCGTCTGAAGAAGGAGGAGAAGACCAGGCAGGAGTTGGAGAAAGCCAAGCGTAAACTGGACGCCGAAACCACAGACCTGCAAGAGCAGATCGCTGAGCTTCAGGCTCAGATCGACGAGCTGAAAATCCAACTGGCTAAAAAAGAGGAGGAGCTTCAGGCTGTTCTGGCCAGGGGCGATGAGGAAGTGGCCCAGAAGAACAATGCTCTGAAGCAGGTCCGGGAGCTGCAGGCCCAGCTGGCCGAGCTGCAGGAGGATCTGGAGTCGGAGAAGGCTGCTCGGAACAAAGCGGAGAAGCTCAAACGGGACCTCAGCGAGGAGCTGGAGGCGCTGAAGACTGAGCTGGAGGACACACTGGACACCACGGCCGCTCAGCAGGAGCTCAGGACGAAGAGAGAGCAGGAAGTGGCTGAACTGAAGAAGGCGATCGACGAAGAGGCTCGAAACCACGAGTCCCAGATTCAGGAGATGAGGCAGAGACACGGGATGGCGCTGGAGGAGATCTCAGAACAGCTGGAGCAGGCCAAACGGTTTAAGTCTAATCTGGAGAAGAGTAAACAGACTCTGGAGGGCGATAATAAGGAGCTGGCGAGTGAGGTGAAGGTTCTGCAGCAGGCAAAACTGGACTCTGAGCACAAGAGG
AAGAAGCTGGAGGCTCAGCTGCAGGAGGTTCTGGCCCGCGTTACTGAAGGAGAGCGGACCAAGGGCGAGCTCGCTGACCGCACTCACAAACTACAGACGGAGCTGGAGAATGTATCTACTCTGCTGGAGGATGCGGAGAAGAAGGGAATAAAGCTGGCTAAGGACGCCTCCAGCCTGGAGAGCCAGCTGCAGGACACACAGGAGCTCCTGCAGGAGGAAACGCGTCAGAAGCTGAACCTGAGCAGCCGAATCCGTCAGCTGGAGGAAGAGAAGAGCGCCCTGCAGGAGCAGCAGGAGGAGGAAGAGGAGGCACGTAGAAACCTGGAGAAACAACTGGCAACCTTGCAGTCTCAGCTGTGCGAGACGAAGAAGAAGCTAGAGGATGACGTCGGAGTTGTGGACGCTCTGGAGGAGGTGAAGCGGAAGCTGCAGAAGGACATGGAGGCCACCAACCAGAGACTGGAGGAAAAGGCCATGGCCTACGATAAGCTGGAGAAGACCAAAACCCGGCTTCAGCAGGAACTGGACGACCTCATGGTGGATCTGGACCACCAGAGACAGATAGTCTCCAACCTGGAGAAGAAGCAGAAGAAATTTGACCAGATGCTGGCGGAGGAGAAGAGCGTATCGGCGCGTTACGCTGAGGAGCGAGACCGAGCAGAGGCCGAAGCGCGGGAGAAAGAGACGAAGGCACTATCGATGGCCCGAGCGCTGGACGAAGCACTGGAGGCTAAAGAGGAGTTCGAGAGGCTGAATAAGCAGCTGAGGGCCGAGATGGAGGATCTGATGAGCTCCAAGGACGACGTGGGAAAAAACGTTCATGAGCTGGAGAAGTCCAAACGTACGCTGGAGCAGCAGGTGGAGGAGATGCGCACTCAGTTGGAGGAACTGGAGGATGAGCTGCAGGCCACAGAGGACGCCAAACTGCGCCTGGAGGTTAACATGCAGGCCATGAAGGCCCAGTTTGAGCGTGACCTGCAGGCCAGAGATGAACAGAATGATGAGAAGAAAAGAATGCTGGTCAAACAGGTGCGTGAGATGGAGGCGGAGCTAGAGGATGAGAGGAAGCAGCGTGCGCTGGCTGTGGCGGCTAAGAAAAAGCTGGAAATGGACCTGAAGGATGTTGAGGCTCAGATTGAGGCAGCTAACAAGGCTCGGGATGAGGCCATCAAACAGCTGCGCAAACTCCAGGCTCAGATGAAGGACTATCAGAGGGAACTGGAGGAGGCTCGAGCCTCTCGAGATGAAATCTTTGCCCAGTCAAAAGAAAACGAGAAGAAGCTCAAGAGTCTTGAGGCAGAGATATTACAGCTGCAGGAGGACCTGGCTGCATCTGAGAGAGCACGGCGTCATGCAGAGCAGGAGAGGGACGAGCTGGCAGACGAAATCTCAAACAGTGCCTCTGGGAAGTCTGCTCTGCTGGATGAGAAGCGCAGGCTGGAGGCTCGAATTGCTCAGCTGGAGGAGGAACTGGAGGAGGAACAGAGCAACATGGAGCTCCTCAATGACCGCTTCCGCAAGACTGCCATGCAGGTGGATACTCTGACCACAGAGCTGACCGGAGAGCGCAGCGCAGCCCAGAAGAGCGAGAACGCCCGGCAGCAGCTGGAGAGACAGAACAAGGAGCTGAAGGCCAAACTGCAGGAGCTAGAGGGATCCATCAAATCTAAATTTAAAGCCAATATCACCGCCCTGGAGGCCAAAATCCTGCAGCTGGAGGAGCAGCTGGAGCAGGAGGCCAAGGAGCGGGCAGCGGCCAATAAGATTGTCCGGCGCACAGAGAAGAAGCTGAAAGAAGTGTTCATGCAGGTGGAGGATGAGCGTCGCCATGCTGACCAGTACAAGGAGCAGATGGAGAAGGCGAACTCTCGCATGAAGCAGCTGAAGCGTCAGCTGGAGGAGGCGGAGGAGGAAGCTCAGCGCGCTAACGCCTCCCGCAGGAAGCTGCAGAGAGAGCTGGATGACGCTACAGAGGCGAGCGAGGGGCTGAGCAGAGAGGT
TAACACCCTCAAAAACCGTCTCAGACGCGGAGGCCCGGTCAGTTTCCCCTCGGGTCGCTCTGGCCGCAGGCAGCTGCAGATGGAGGGCGAGTGTTCCGATGACGACGCCGAAAGCAAAGCCAGCGATGTGAACGAGACCCAGCCTGCCCAGCCTGAGTAGTTATAGTGTCCCCCTGTGGTCCTGCAGTGCTATTACACCTTCTACCCCAAAACAGTCAGCACGCCAGAAACCGTAACATGTAACCCAGTTCGTTCTGCTGCTCGCGTGGTGGAGAGCAGGACTGAGGGTCCACACACACACCTCTCTAAACACATTTATACACACATGACTCCTCCACACACCTGCGTTCTGTCTACAAGCCTAAGCTGCAACGAGCATGAGAACGATTCAGTACATACGGTCATTCCCTTCATATTCAGGGAACCTCAACTCTGCCTTACTCAATGCAGCAAAGCTTCAAGGTTGAGTGGAGTTTTGTTCTAATTAGCAATCTGTTGTAATGTTAGCCTTCAGAATAATTGCTTAAGGTGAAAACACTATAGGTACAAGTGCATTTTATATGTTCAGTTTTTTTGTGCACACAGTCATACATGAGCAGCAACTCGAGTCTAGTATAAATAAATAACGATAAAGCCACTGCTTAGCTAAAGCAAGACAGGTCTGGCGTTAGAGTACGATGTGAAATTCCAACGAAGCACAGGTTCTGAGTGTTTTTGGCTGGCGGAAGTATGTGTTAGAGATGCATGGACTTCTGTTTTCTACAAGTAATAGAGAAAAAACACAAAAATGTACATGTAACCGGCCGAACCTGTGGCTGCTTCGAATTGGATTGAAAAGTGAAGAAAAAAACTGTGAAAAAGCTACTGCTTAAGCTTCTGCCCACATTAGACAAACAAAAACACTAAGATGAAAGTACCTTCAGTCATTTCCGTTCATCCTCATTCTATTTGGGACACTTGATTGTTGAAGTATTGGGAGAGATTCCGATAAGTGATGGTATTAGACGTTGACGAAACTGGATGTAAATGCAAGATGCGAAATGCTTTGTAACTGCACATTTACTACAAGCCATACGAGGCAAAACTGGAAAGAAATCCGTACATTTTGGGAGAATGTGCACATCCACAAAAAAAAGAATAATTTTTTTGTGAAGGTTTCTTCGGAAAATATCTCATCAAATGTGTGAACTATTAGCTGCTTTATTAGACACTCCGAGAAGTGCTTTAGTACATGAAGGGAAACCGACAGAAGTGAAGGAATCATTTCGTTCAGTGGGATCATCTCGTTCACTGCTGATTTTGACTGGAACACTAACATCAAAACACATTGATGATTCACAGGCACTTAGTTCGATTTGAATCATAAACCTGAGCCCTTGAGCTTCAGCCCAAAATGTATAGAAGAGCCACTACAGTTCTCAAACACACTATTATTTCTCAGTATCAGTATTATAAAGATGATGGATTAGAAACGATACTCACCTGCTCCAATATTAGTATTTAATAATGTTTCTTTAAAAAGTGCCTTAGTCACTAATTAAGAAAATATCCATGAGTTAAATGCATTGTACATCTATAATGGTGTGTATACAAGTGCAACACTAACATGAAGGCAAAACTGGCAAAACAATATAAGAATAATAAAAAAAACACTACGTAACCCTTTCTGTTTTGTATTTTACTGTGCTTTGAATCATATCCGTTATCTAAGTCTCTCTTCCCTAGTCTTCTAGGTAAGCCATGGGCCAGCTTCAGTGTTATCTGTAGGAGTTGGAACCCTCTGCCTTGGCTGCAGAGGGAGTTGCAGGATTTTATTTGGTTAAAAGCTTTACCCCTCCACGATCTAGTTACTATTATTACAATTATCATTATTATTGCTATTGTTATCACTCTTATTATTGGGCTGGCTGTTGACAACCAGACATTCAACTGCAAATATATCTCTCCTTTTTTTCTTGTATACTGTTACTGTATTTCTAGACAACAGTGATTTTTGTAAA
GGAAAAAAAAATAAAACCTTCATTATAG\n>XM_017906153.1 PREDICTED: Eufriesea mexicana enoyl-CoA hydratase, mitochondrial (LOC108551834), transcript variant X1, mRNA \nCATATTGAAAAGAAAATAGCTTTCTCCACTTCATAAACATGCATTGTACTGCTCTGCTAACCTTCACAGCTTTCTTCTCTCTCTCTCTCCCTATATACATTCACCTCTCCCCGCTCTTTTTTAATCGTGTAGTCTGCTAGAATCCAGTCTGGATGATATGAGTCGGAACGAACTCGTTTTATCGTCACTCATCTCATCATTCGTTCTGTTGATTCCATAAGAAAAGTGTTTTTATTGCTATTAAAATCATAAGTTTAAACAGCATTATGGTAACTACACGTATTGGACATATTCTCCTAAACAAGAGTTTACAGATCGATCGAAAATTACCATATTGTGCGTCCAACGTAAAACATTATTGTTGCCAAGTTCAAAATTATGAATTCATCAAAGTCGAATATACTGGCGAAAACAAAAATGTGGCTTTAGTAACACTAAACAGGCCGAAAGCTTTAAATGCTCTATGTGATAAATTAATGATTGAATTGAATGATGCTATATCAAAATTTGATAGAAATGATTCTATCGGTGCCATAGTCGTTACTGGTAGCGAAAAAGCATTTGCAGCCGGAGCTGATATTAAAGAAATGCAGAATAATACTTATGCACAGAATGTGAGAGGAAACTTCCTTGCCGACTGGGACGGTGTTTCCCGAGCATCGAAACCAGTAATTGCTGCTGTAAATGGATATGCTTTAGGTGGAGGTTGCGAATTAGCAATGATGTGTGACATCATCTATGCTGGGGATAAAGCGAAATTTGGTCAACCGGAAATCGCCCTTGGTACCATACCTGGTGCGGGTGGCACACAAAGATTAACGAGGGTAGTTGGTAAGAGCAAAGCGATGGAAATGGTACTAACAGGAAATCAGATCACTGCTGAGGAGGCGGAAAAAAGCGGTCTTGTTAGTAAAGTCTTCCCAGCAGATAGACTTATTGCTGAGGCAATTAAGTCAGCTGAAAAAATTGCCTCCCATTCTCAATTAATCGTTGCCATGGCAAAAGAATCTGTTAATACTGCTTATGAAACTACTTTGAAGGAAGGACTTCACTTTGAAAAAAAGATGTTCCATGGCACATTTGCAACGGATGATAGGAAAGAAGGAATGACAGCGTTTGTTGAAAAAAGACCACCTAAATTCAACAACCACTGAGACCATTAATTCCATTATAGGAGAAGAATAAAAATGATGTAACATTTGTAAAGAAATTTTATTTAATTTTATTTAATTATTTCTTTACGTCTAATATCATAATCCATGATTATGATACATTTACAATTAACGGCTCATACCAGGTAAATATTTCTTAATAATAGCAATTCTAATGCTCTCGTAGAAGCATAGAAATGCCGTTGACATCGTAAAAGGTATCCAAGAATGGTAGGAACAATGGAATTTCACACCGACATCGTTATATAATAAATATCAAACTTTATAATAATGTGTATCTTGCTTGCTATTTGGAAATTTTTTTAATCCTGTTTTCAGATATTCTCGGAGAA\n>MH775349.1 Uncultured bacterium clone 2932 16S ribosomal RNA gene, partial sequence 
\nTGGGGAATTTTGGACAATGGACGCAAGTCTGATCCAGCCATGCCGCGTGCGGGAAGAAGGCCTTCGGGTTGTAAACCGCTTTTGTCAGGGAAGAAACGAGTTTCTCTAATACAGAGACTTAATGACGGTACCTGAAGAATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTGATGTAAGACAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCGTTTGTGACTGCATAGCTAGAGTACGGTAGAGGGGGATGGAATTCCGCGTGTAGCAGTGAAATGCGTAGATATGCGGAGGAACACCGATGGCGAAGGCAATCCCCTGGACCTGTACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACA\n>XR_003646050.1 PREDICTED: Camellia sinensis protein TPR1-like (LOC114310240), transcript variant X10, misc_RNA \nTAATCTCTCTGAATCGATCGAATCAACCTTCTTCAGCCCCATTTGATCTAATCTCAGAGCGATTGGTGATTCATCTCCGATCCAATCTCAGAGCGATTGGCAATTTCGATTTTGAGATTTTGAAGCTCCACCGCCTCCACCATCTGCACTGGCGAGGGGAGCGAGCACCATCATCTACTAAGAGCCATGTGCGGCAATTCTGTTTGGCGTTCACTTCAATGTAATTGTAATTTAAAGCTTCAATTTGTTGCTCTCTCTTTCTCTCTCTATCTGTACCCATTTGGCGTTGTCTGTTGCGTCCAAGTCACAGCAACCTCTTGATTTGCCTTTTGGTCTGAAGTTTATTTTGGACGCATTCTTGTGATTTCAACATTTCATTTTATCAAATTTGTCACAATTTCATCCAAAATTATAATCAATATCCTTAAAACAAATATGATCATATAATTGTGGTGATGATCTGACAGAGGTGCGAGTGGATTATGCTCTTCTATGGTCTGTGGATTCGGCTGCATTCAAGGTTCCAAATGCATAAGAACCACGCACTGTGACAAAGGTACTAAGGTAAACCATCCAATCATGCTCCGTAGAACTACTTTTGTGGCTCTGATCTTTGGGACCATAGCCATCTTCTTCATCAGCTCGAGTCTTGTCTTCTAGTATAAGTGGCTCCCTTATCTCTTCTTGCAAGCTGTTCTCACCTTGCTCCAAAAATTAGAGAATTCAAATTTATGGTCAAGAATTTAATGGAGAATGCTAACAAAAGGATTTTGTTCTGTGATGAAAGCCAGGATGCACCACACTATGAAGTCCTTGCCAAGAATATTGTAGATGCTATGCTGGTGGACTGTTTGTTGTGTACTTTGCTCTGCTGCAACAGGTAGCAGCATAAGAGATATTCAGTTGATTGCATGACCTTTCATCCTCTATATTTGATCCTCGCTGTCAACTTTTGCTTATGCATATCTCAGTGACTATTTTTTTGAAGTGATTCACTTATTCTTTTGAACAGGTTCCTCTTACTAATGAATTCATTACTAATGGTGCTCCTCTTGCCAGGTTACATATCCAACATCTCGTCAACATGCCACTTGGTCCTTGGATGACTTGCCAAGAACAGTAGCTTGTACCATGCATCAAGGATCTGCTGTTAACAGCATGGATTTTCATCCTTCTCATCACACATTGCTTCTTGTTGGTTTTGCTACTGGTGAAATAACGCTCTGGGAAGTGGGGATGCGATATAAATTGGTTTCAAAGCCATTCAAGATATGGGACATGGCAAATTGTTATATGCTGCTTCAGGTTCCTTTTCTTCCTTTTCTTTCCTTGTTGCTTGTTATCTTAGCATTCTATGATGTGATATATACCTATGATATGAGATATCTATGGAGGTTGTAAACAGCATGTACAAATTAATTGTGACCAGATTATTTCTTGTTTGATTTGGGGACA
TTTATAATACTAATCTTCAACTA\n>XM_016745472.1 Penicillium expansum Zinc finger, DPH-type (PEX2_082020), partial mRNA \nATGGCCGACGACGGACTGAACATCTACGACGAGATCGAGATCGAGGATATGACCTTCGACCCGAATATCCAGATCTATACATACCCTTGCCCATGTGGCGACCGATTCGAGATCGCAATCGACGATCTGCGCGACGGAGAAGAGATCGCCGTGTGTCCGAGTTGCAGTCTGATGATCCGGGTTATCTTCGACTTGGTATGTTTCCCTATCGTCCAACCAGACGCCGATCTTCCTAAAGCCGATGCGCAGAGTACGAGTGGCGTGGCTGTTCAGGCTTGA\n>XM_047872644.1 PREDICTED: Prionailurus viverrinus adenylate kinase 4 (LOC125173463), transcript variant X6, mRNA \nTGGTGCGGCTTAACCGCGCCCCAGGAGGGTGCCGAGGCTCGCCGGGAGGAGGGTGGGAGGTGCATGCTTCTCCTCTCCTCGCCTGGACTCCTCTTGCCTTGGGGAAAAGCCTGTAACCACCCAGCTGAGGGAGAACCAGACAGCTGAAAACCCCGAGCTTCCCTCTCGCCCTGCTTCCTTAAGGATAAGCCCTCCCAGCCCACGCGTCCCCGGGGAACTGGGGCGTCCCCCCGCTCTCGCCGCCCACCTGTGGGAGTCCGGTCCCGCTGCGCTCTGGGGAACCTGTGGCGCCGCGGGGCCCCCAGCCGCGCACTGTTCCTGCCCCTCTGCGTCACCCTGGGCCTCCGGGCAGAGCCCTGGTGGCTTTGAAAGGCCTGTCTGTCCGCTGCCGCCTTCTAAGAAGTTGGTGATATGGCAAAGCAGTACATAGAGAAAGGTCTTTTGGTTCCAGATCATGTGATCACACGCCTAATGATGTCGGAGTTGGAGAATAGGCGCGGCCAGCACTGGCTACTAGATGGTTTTCCTAGGACATTAGTACAGGCTGAAGCCCTGGACAGAATCTGCGAGCTGGATCTAGTGATCACTTTGAACATTCCATTTGAAACACTCAAAGACCGTCTCAGCCGACGTTGGATTCACCCTCCCAGTGGAAGGGTGTATAACCTGGACTTCAATCCACCTCATGTGCATGGGATTGATGACATTACTGGTGAACCATTAGTCCAGCAGGAGGATGATAAACCTGAAGCAGTTGCTGCCCGGCTAAGACAGTACAAGGATGTGGCAAAGCCAGTCATTGAATTATACAAGAGCCGAGGAGTGCTTCACCAATTTTCTGGGACGGAGACTAACAAAATCTGGCCCTATGTTTACACGCTTTTCTCAAACAAGATCACACCTATTCAGTCCAAAGAAGCATACTGAGCCCGCCCAATGAAGAACCAGGAAGATGTCATTCATTCAGTTGTATGTGTAGTATTGGTGCCGTGTCCAAATTAGAAGCTAGCGGGGATAGCTTGCAGCGTCTTTTCTAGTCTAAATGGTGAACTGAAATGAAAACAAATGAGGAGAAAGAGTTAATGAAGAGGCTCTTCTCTGCCTTTCTGATGAAGGGTCACCCACACATGTCTAGGATGTCTCTGCATGTCTCAAGCCCTTCACAAGAAAGCAAGTACAGGCTGGATTTCAAAGGGTGTATAACCCAAACTCTAGCTGATTTCTGACCATCACATTGTTGCCATAGTAGCCTTTTAACATGTGATGGTGTTGGCCTCTGGTTCTCCCTGCCCCCCAAAGGCTATTGAACCACAGCACCAGGTGGCCTGAGAATGCCAAGGGCAGTAGCCCCGGCCTTGTCCCAAGTTCTCTGGTATGTGCCCTTCCTGGTGACCGTGCGATTGAAGCCAGTTGCTCTGTGGTCACTTCTCTGGCCTTGAGTGACTGTCCACAATTAGCTTTTCTGTTCAGAGTGATACCTTTTTCTGCC
TCCATGCTCTGTAGAGTCTCTCCTTTTTCAGACATCCTGGAATGAAAGGATTTCGCTTCTAGTATTTTTATTAGACTGTATTTTGGTACATCTGTTTTCTCTCTTCCTAGACTATGAAGTAATAGATAGTTACTGCTTTTATCTCTCTCAGATTCCTTTCTAAGAGCCGAGAGTGAGGGGAGGGTGTCCAGATGCTTCTTGCAGCAGGAACTGAGCTCTGCAGAGGGTCTACTTATGCTGCTGGGCTGACCCTCATGGGTTGACACTGCTCTTTTCTTTTATCATGAAAAAATAAAATCCTCAAAGTCTTTGGGAGTCTTCAGAAAAATGGGAGATACTACATACATGTTAAAGAATCATATCTTGTGTATAGAAGTAATAAGACCATATGGAATTACTGCACTAAAAGAATAGTTTAGCTTTTTATTCAAGACAAAAAAAATGTATTTTGAAATGCTGCTAAATATTGATGCTGACAGTGTTTTTCTCCTGGGAGTGACCCAAACATATTATAAATAGTTGGTAAAGGGAATGGAGCCTGTGTGTTGAGGAAAATGTTGCACTAGCTGTGCCCAGACTGAGTATGACAGCTTTGTGATTATGGGAAAACAAATTCTTAATTTTTTTTTCTTTCTATTCCAAAGATGCTTTCTGTGGGGTGGCCATTAAGTCTAGAAATATAGATGATACAATTTTGTCATTCTTTGTAATGTAATATCAATAAACCATTTATTAAAGATTTGCCTGGTTTCCAGACTTGGTGGCCACCTAATGTAATTCTGGCTCTCCTCTGGGAAGGACAATGAAATTTATTCCTGTTGCCTTAAAAATAAATACCCCTCTTCATGCATCGTGATTGTCCCCAAGGAGGGTTCTTTGCTATTCCTGAGAGTGACTTCTAACTCCTCATACTGAAGAGAAGGGGGGGGGGGGGGGCGGGGAGCCTATTTCAGCACGCCTCTGGTGTTGCAATGCATTGTTTATTTTCTGAAGATGTCCTGGAGAATCTCCAGTCAATTCCCTGGCAGATGTGTTCTGTATGGTAATCGTTGCATCTTCCTTACAAATACTGCCCCACTCTTGACAGTTCCTCTCCTCTATACCTTCGTGAGAATGTTCTTTGACTACCTTAGTGGAAACATAGACTGGTCTCCTCCTCATTCTCTGAATCACCATGTTACTTTTTGGGTGTATGCAATGGAGGTGCCCAGTTCAGGTCTGTGAAACATCAGTGCATGATATGGACTTCTAGTGCTTTAGAAGAGCCGTGTTTGAATGCCGGTTGGTGGGGACAGGGTGAAAATCAGACCTGTAGGTAAAGCTCAGGTTTCCTGGGGAACCAGGTACGGAGAAAACAAACCTGATATGAAGAAAGTTGCACAATTTAGACTAGTACTGCCATGGAGACAATTTCTAAAAACTAGGAAAAGTAGAGAGTTAAGGTTGTTTTATGGGTAATTCAAGAGAGGAATGTGTGTGTCCTTTTGTAAGTGGAAAAATCTACATGACTCTTCCTTTACTTCTCTTTTTGTTTAACAGACTCCCTTTGGAGTTTTTGAGAGAGTTATGGGAAATGGCTGGTCCCTGGTGCCATACTCTAGTTCTCAATCCTTCCCTCCTCTCCTCCAGCAGAATAGATAGTTATAGTCAGTGTGGGAGCCTCTCAGTGTCTCAACAGCATTTGCTGTTTCTGTGCTTGGTGAGGGCCCTGTGCTTGGTGAGACCAATAAAAAAGACAAACACCTTTTCCATGCGTCTTTGAAAGATGATACTTATTTCATGTTCAGTGGCCTAAAAAGTCTATTTCAGATTTTCTTCAACAAGCTCTCTAGCATTTTCTCCAGTAATTTTGTAAAAAATTAAAATTCTCTTGAAAATATTTTGATAAAAGCTAAAGGGACATCTTTTCTTGGTTTTTCTTCTACTGCCACAGATACGGTTCCTTCACAGTTCTGCAAAGAGAGTAATTTGGGTGTCTATAAGATTCCTACCGGTCCACA
TATTCTGTGATTTAGCCAGTTGTGAATTAATTTTGCTTTTCATTGTCTGAACAGGCTTCCCACTTACTTAGAACTTGGAGACATTGCTGTGTTTAATATCCTTTAACACTAAGGCAGACATAAAATAAGTATCATTTACTGAAGGCCTTTGGGCGATAGGTAAAGTTCTAGGACCTTAGCAAACACTCATTTAATCTTTCAAGCATCCTTTGAGATAGGCATGAAGCCATGTTTATGAACAAGGAAGACAAGGGTCAGAGATGTGAAGCATCTTGCCCAGGCTCTTGCTGCCAACAGACAGTCCAGCCAGGACTCACACCCAGGTTTTCCTGATTCTGCAGCCTGAGTTTGCTCCTGGATGTTAACTATCTGTGTCCTGTCCCAACCAACCTAGGGTGCTGAGCCTGCTTGATTTTGCTCGTATTTCCAAGTGGCCTCATCAAAAGTAGCAGAAGTGACATTCAGCTCTATATGGGACTGTTCTCCCCCTCCCCGCTTTGCTTAAGCAAAGGGAGCTGCTAGAGGAAGATCTGAGCCTTTGATCTTCTTTCCTAACTTCTCACTTATAAAATGAAAGGCTGTTGAAATAGGCTGGGCTTGGGTCCAGGCTAATCTGTGGAGGGGTCAGGTTCCTTCATGTTCCTCACCTACCTAGGCTTTTGGTATCCATGGTATTGTACCCCTAAGAGACCTTAACACTTCAGCCGCCTTCAACTATAGGGCTCCCTGTAGATCTGGGCTTCTGGGAGTTAGATGCTACTCACTTTTCTTCCCTGATACCAGGAGAAATTACTCCCTTACTCCCACCCCCAAATAAGGCCCTGATGATAAACATCCTTCCTGAAGTGCTGGCAGGTGATGGAGCCCCCAGCATACCATCTTGCCTATGTCACATTGCGTATTAACATGATCCTGAATGCTACATTCACACCTTTGCGTGCCATCTGATGTGGCACTGCTTGTCATGCACAATTCTGGTGGAAACCAGGGGAGATTGGTTTCCTGTGTTATCCGCCCTGCCCAGGGTCACTCCCCACCACCCTCCAGCAGCCAAGCTCAGATGAGCTCCAGCTTTACCCAGGGTGTGCCCCTCCCTTTGGTAGGGAAGGAAAAAGGTAATAACAGCCAATGGATAAAAGGGATTCTTGGAAAGAGCTACTGCTGTGGCTTCGCCCACCTACCACTTAAAAATGTTGAGACAGGATGGTTTTAGATAGATGGGTGCCTGTGCAAAACCATAAATAGGACTGTTAGAAAATTTAGTTCACTAAACTGATTTCAGTATTTGACTTTAGCTGTTTAGCAGTTTAAACAGCTTACCAGCCTGCTGGGGGTCCTGCTTAGGTCATAAAGACCACAAATTTCAAATATGTTAAGACATATGCATTCCTAGTAGTTCCTGTTTATTGGTACTTAATGCTAAGTGCATTATGTGCATTGTCTAATTAAATCTGCAGTAGTTACCCTAACGTAATAGATGTTTTAGTTATCTAGCCTCTGTGTAAAAACTGCAATCATTCTGTTCACTTAAGTTTGTATTTTCATGTATCTATAGGGATTAATCAAGAAATCCAAAAGGGCCTTTTTTTGTACCTTTTCCTCCTTTGAGTTCCCCATTCTAATTAATAGGTAAAGCAGTGTTATTTGATTGTACTTGGAATCTTTGCTTTTGGCACTCTGGTGCTGAGGCAAGAAGTGGGCACTCAGTGGGTCTTGGTGGTAGTTGCACACTGTATATACAGAGAGCATATATCTCATCTGCACTCTGCTGAGTTACAGGATCTCGGGAGACATTCATATCTACCTGATGAATTTCATTTATTACCTTTCATTTAAAACACAGTATCTTTTTTTGCTGCATTTAATTTTGCCAGAGAGGCAATTCATAAGGCCAAGTTGTGTTCTTAGTATGAATTGCTTTCTATTTCCCTTGCATTTTTAGTAACTCCCTGGTCTATTTGGTGTCTCAAAAGGAGAACCTAGCAATGCAGCCTGTTTTT
TTTGTTTGTTTGTTTCGTTTTGTTTTGTTTTTTTTTTTTAATACGGGAGTGTGGTCTAGTCATAAGTTATCATCCCTTTCCACATATAACTGATCCAGTCTGGTTTCTAGATGAAGAGTGTGCAAGAGCCAGATGTTGGGAAACCCATGAAGCCGTATTTCAACTATGAAGAAAAATATACTTCCTGCATCTGTTGAGATATACTATAATTACAGTTGTTCATAAATGCCATACCTTATCTTTCTTTTAACAAATTGCACAATTCTTGCCAAAATAAATGCCATTATTCTGTATGCTTCAGGGAAATTCCCCCAATTTGATCAGTGAGCATATGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTAGGGAGAGGGAGGGAGAGATGGTGAAACATTTCCAAGGGGACAAGAGCCCTTGGATGGCATGGATGTGCATTCCTTCCGGGTAATAATTACGCTATTCCAGGAAACAGCATGTGTCTTCCTGGAAATAAAGATTTCCTGTCTGTAACTTTTGTAAGTTACACCAAGTGCACCTTGTGATTCTCCCTGGGGTTGGTGTGTGTCTAATTCCATTTCATAAAACCTTTCTTCATTTTAAAGCTTTGGCTGTGAAGTCAGAAATGTGCTAAATAAAAACAAACTGTTTTGTATTTAATTTAGAGAAGGGTAAAGGGAAGAAAAAAAAAAAAACTCAGTCTTTATGTAAGCTCCAAGGTGTTAGGGCTTAGAGGGTTTTTCTAGTTTTATGAGAATTTGTACTACTGATTTTTATATATTCCTGTTTTTGAGATGAACAGATCTCTGGGGAAATTGTTGCATTACAATGGCGTTTCACTGTGACCCCTCTCAAGCTCAAATCTGTTCTCTTAAGCCAATGACAACTTGTCACTTCGGTTTACTGTCCTGTGAAAAGTCAGCTCCAGTTTCCCAGAAGTTGTGTGTTTATGATGAGTCAGTGCTTTTCTTCAGTGAAAGTTGTCAGCCTTCTTGATTTGGGTGTATGTGCTTAATTCAGAGTATCTAAACCTGTAGTCTAATCTGTACATGCTCTCCTAACTGTTAATTGTTATTGACTATTTTGATTATCTTGCTTGAAGATTGATTCCTACTTTTTAATTTGATAGAAATAAAGTTTTTTTTTCCTGCTTATAACTA\n>XM_032280742.1 PREDICTED: Sapajus apella ubiquitin specific peptidase 32 (USP32), transcript variant X1, mRNA 
\nGGCTGGCGGGAGGGGGCGGGGGAGGGAAGAGGGCGTGAGGAGGGAGGAGAGAGAAGGGCGGAGTAGGAGGGAGGGAAAGGGGGGCGGGGTGGAAGCGGGTCACGTGATCCACCATGGAGGCGGTGGCGGCGACCGGGAGGAGCCGCCGGGGCAGAAGCCGCACTTGTTAGTGTGGGGGGAGGTGGGGGTGGGGGACGCCGACACCGTCACCCAGGGACGCCGAGGAGAAGGCGGGAGGGGGGTGGGGGCGAGATCAGGCTCCGACCCCCGGCCGAGGGGATGTGGGGAGCATGGGCGCCAAGGAGTCACGGATCGGATTCCTCAGCTACGAGGAGGCGCTGAGGAGAGTTACAGATGTAGAGCTAAAACGACTGAAGGATGCCTTCAAGAGGACCTGTGGACTCTCATATTACATGGGCCAGCACTGCTTCATCCGAGAAGTGCTTGGGGATGGAGTGCCTCCAAAAGTCGCTGAGGTGATTTACTGTTCTTTTGGTGGAACATCCAAAGGGCTGCACTTCAATAATTTAATAGTTGGACTTGTCCTCCTTACAAGAGGCAAAGATGAAGAGAAAGCAAAATACATTTTTAGTCTTTTTTCAAGTGAATCTGGGAACTATGTTATACGGGAAGAAATGGAAAGAATGCTCCATGTGGTGGATGGTAAAGTCCCAGATACGCTCAGGAAGTGTTTCTCAGAGGGTGAAAAGGTAAACTATGAAAAGTTTAGAAATTGGCTTTTTCTAAACAAAGATGCTTTTACCTTCTCTCGATGGCTTCTATCTGGAGGTGTGTATGTTACCCTCACTGATGATAGTGATACTCCTACTTTCTACCAAACTCTGGCTGGAGTCACACATTTGGAGGAATCAGACATCATTGATCTGGAGAAACGCTATTGGTTATTGAAGGCTCAATCCCGGACTGGACGATTTGATTTAGAGACATTTGGCCCATTGGTTTCACCACCTATTCGTCCATCTCTAAGTGAAGGTTTGTTTAATGCTTTTGATGAAAATCGTGACAATCACATAGATTTTAAGGAGATATCCTGTGGCTTATCAGCCTGTTGCAGGGGACCCCTGGCTGAAAGACAAAAATTTTGCTTCAAGGTATTTGATGTTGACCGTGATGGAGTTCTCTCCAGGGCTGAACTGAGAGACATGGTGGTTGCACTTTTAGAAGTCTGGAAGGACAACCGTACTGATGATATTCCTGAATTGCATATGGATCTCTCTGAAATTGTAGAAGGCATATTGAATACGCATGACACCACAAAGATGGGCCATCTTACTCTGGAAGACTATCAGATCTGGAGTGTGAAAAATGTTCTTGCCAATGAATTTTTGAACCTCCTTTTCCAGGTGTGTCACATAGTTTTGGGGCTAAGACCAGCTACTCCAGAAGAAGAAGGACAAATTATTAGAGGATGGTTAGAACGAGAGAGCAGGTATGGTCTGCAACCAGGACACAACTGGTTTATCATCTCTATGCAGTGGTGGCAACAGTGGAAAGAATATGTCAAATACGATGCCAACCCTGTGGTAATTGAGCCATCATCTGTTTTGAACGGAGGAAAATATTCATTTGGAACAGCAGTACATCCTATGGAGCAGGTTGAAGATAGAATTGGAGGCAACCTCAGTTATGTGAATTCTACAGAAGAGAAGTTTTCAGACAACATTTCTACTGCATCTGAAGCCTCAGAAACTGCTGGCAGCGGCTTTCTGTATTCTGCCACACCAGGGGCAGATGTTTGCTTTGCTCGACAACATAACACTTCTGACAATAACAACCAGTGTTTACTGGGAGCCAATGGAAATATTTTGTTGCACCTTAACCCTCAGAAACCAGGGGCTATTGATAACCAGCCATTAGTAACTCAAGAACCAGTAAAGGCTACATCATTAACACTAGAAGGAGGACGCTTAAAACGAACTCCACAGCTGATTCATGGAAGAGATTATGAAATGGTTCCAGAACCTGTGTGGAGAGCAC
TTTATCATTGGTACGGAGCAAACCTGGCTCTACCTAGACCAGTAATCAAGAACAGCAAGACAGACATCCCAGAGCTGGAATTATTTCCCCGCTATCTTCTCTTCCTGAGACAGCAGCCTGCCACTCGGACACAGCAGTCTAACATCTGGGTGAATATGGGTATGATGAGCCTGAGAATGTTTCCTCAGCATTTACCGAGAGGAAATGTACCTTCTCCGAATGCACCTTTAAAGCGAGTATTAGCCTATACAGGCTGTTTTAGTCGAATGCAGACCATCAAGGAAATTCACGAATATCTGTCTCAAAGACTGCGCATTAAAGAGGAAGATATGCGCCTGTGGCTGTACAACAGTGAGAACTACCTTACTCTTCTGGATGATGAGGATCATAGATTGGAATATTTGAAAATCCAGGATGAACAACACTTGGTAATTGAAGTTCGCAACAAAGATATGAGTTGGCCTGAGGAGATGTCTTTTATAGCAAATAGTAGTAAAATAGATAGACACAAGGTTCCCACAGAAAAGGGAGCCACAGGTCTAAGCAACCTGGGAAACACATGCTTCATGAACTCAAGCATCCAGTGTGTTAGTAACACACAGCCACTGACACAGTATTTTATCTCAGGGAGACATCTTTATGAACTCAACAGGACAAATCCCATTGGTATGAAGGGGCATATGGCTAAATGCTATGGTGATTTAGTACAGGAACTTTGGAGTGGAACTCAGAAGAATGTTGCCCCATTAAAGCTTCGGTGGACCATAGCAAAATATGCACCCAGGTTTAATGGGTTCCAGCAACAAGACTCCCAAGAACTTCTGGCTTTTCTCTTGGATGGTCTTCATGAAGATCTCAACCGAGTCCATGAAAAGCCATATGTGGAACTAAAGGACAGTGATGGCCGACCAGACTGGGAAGTAGCTGCAGAGGCCTGGGACAACCATCTAAGAAGAAATAGATCAATTGTTGTGGATTTGTTCCATGGGCAGCTAAGATCTCAAGTCAAATGCAAGACGTGTGGGCACATAAGTGTCCGATTTGACCCTTTCAATTTTTTGTCTTTGCCACTACCAATGGACAGTTATATGCACTTAGAAATAACAGTAATTAAGTTAGATGGTACTACTCCTGTACGGTATGGACTAAGACTGAATATGGATGAAAAGTACACAGGTTTAAAAAAACAGCTGAGCGATCTCTGTGGACTTAATTCAGAGCAAATCCTTCTAGCAGAAGTACATGGTTCCAACATAAAGAACTTTCCTCAGGACAACCAAAAAGTGCGACTCTCAGTGAGTGGATTTTTGTGTGCATTTGAAATTCCTGTCCCTGCATCTCCAATTTCAGCTTCTAGTCCAACACAGACAGATTTCTCCTCTTCGCCATCTACAAATGGAATGTTCACCCTAACTACCAACGGGGACCTGCCCCGACCACTATTCATCCCCAATGGAATGCCAAACACTGTTGTGCCATGTGGAACTGAGAAGAACTTTACAAACGGGATGGTTAATGGTCATATGCCATCTCTTCCTGACAGCCCCTTTGCAGGATACATCATTGCAGTCCACCGAAAAATGATGAGGACAGAACTGTATTTCCTGTCGTCTCAGAAGAACCGCCCCAGCCTCTTTGGAATGCCATTGATTGTTCCATGTACTGTGCATACCCGGAAGAAAGACCTATATGATGCGGTTTGGATTCAAGTATCCCGGTTAGCCAGCCCACTCCCACCTCAGGAAGCTAGTAATCATGCCCAGGATTGTGATGACAGTATGGGCTATCAGTATCCATTTACTCTACGAGTCGTGCAGAAAGATGGGAACTCCTGTGCTTGGTGCCCATGGTATAGATTTTGCAGAGGCTGTAAAATTGATTGTGGGGAAGACAGAGCTTTCATTGGAAATGCCTATATTGCTGTGGATTGGGACCCCACAGCCCTTCACCTTCGCTATCAAACGTCCCAGGAAAGGGTTGTAGATGAGCATGAGAGTGTG
GAGCAGAGTCGGAGAGCACAAGCCGAGCCCATCAATCTGGACAGCTGTCTCCGTGCTTTCACCAATGAGGAAGAGCTAGGGGAAAATGAAATGTACTACTGTTCCAAGTGTAAGACCCACTGTTTGGCAACCAAGAAGCTGGATCTCTGGAGGCTTCCACCCATCCTGATAATTCATCTTAAGCGATTTCAATTTGTAAATGGTCGATGGATAAAATCACAGAAAATTGTCAAATTTCCTCGGGAAAGTTTTGACCCGAGTGCTTTTTTGGTACCAAGAGATCCAGCGCTCTGCCAGCGTAAACCACTCACACCCCAGGGAGACGAGCTCTCCGAGACCAGGGTTCTGGCAAGAGAGGTGAAGAAAGTGGAAGCGCAGAGTTCGGCCGGGGAAGAGGATGTGCTCCTGAGCAAAAGCCCATCCTCACTTAGCGCCAACATTATCAGCAGCCCAAAAGGTTCTCCTTCTTCAACAAGAAAAAGTGGAACCAGCTGTCCCTCCAGCAAAAACAGCAGCCCTAATAGCAGCCCACGGACTCTGGGGAGGAGCAAAGGGAGGCTCCGGCTGCCCCAGATTGGCAGCAAAAATAAACTGTCAAGTAGTAAGGAGAACTTGGATGCCAGCAAAGAGAATGGGGCTGGGCAGATCTGTGAGCTGGCTGACGCCTTGAGCCGAGGGCATATGCTGGGGGGCAGCCAACCAGAGCTGGTCACTCCTCAGGACCATGAGGTAGCTTTGGCCAATGGATTCCTTTATGAGCATGAAGCATGTGGCAACGGCTACAGCAATGGTCAGCTTGGAAACCACAGTGAAGAAGACAGCACTGATGACCAAAGAGAAGACACTCGTATTAAACCTATTTATAATCTATATGCAATTTCGTGCCATTCAGGAATTCTGGGTGGGGGCCATTATGTCACTTATGCCAAAAACCCAAACTGCAAGTGGTACTGTTACAATGACAGCAGCTGTAAGGAACTTCACCCTGATGAAATTGACACCGACTCTGCCTACATTCTTTTCTATGAGCAGCAGGGGATAGACTATGCACAATTTCTGCCAAAGATTGATGGCAAAAAGATGGCAGACACAAGCAGTATGGATGAAGACTTTGAGTCTGATTATAAAAAGTACTGTGTGTTACAGTAAAGCTACCACTCTGGCTGCTAGACAGCTTGGTGGTGAGGGAGATGACTCCTTGTAGCTGACATTTGGCAGAAGCGTCACTGAAAGGCAAGCTAAATGTAGTTATTTTATCCTGTGACCCTGAAGCACAAAATAAAAATTCTAATTAAAATAGTTAACTTTAAGAGTAGTAATAATTTTATTTTGAAGTCTCATACAAGCTCTCCGACAGAGAACTTTCAGGCAGATCCCACCATTAGCCTGTAAACAAAGGGTTTGGCACCAGCCACCTGGGACCAAATAAGAATTCAACTGTGCTTGTCCAGATGTGAACAAATATGTAGTGAGTATAGAGTTTACCAGTAATCATAACAAATATTAAAGATTTCCTTGGAGTCAAAGTAAAAAACAAAAAATTATAATGTTGTCTAGGGACGACATGATATGCTACCTCCTTTTTCCTGAAGTTTTATTCCATTATATTGACAAGATGGAGAAAGCAAGATCATGAAGGTGTGCAAATGATTCTTATGGCATGGATGATGATTTTTTGATTTATTTTTTAAATTGTTTCCCTACTCTGTCTTTCTTGTTTTTTGTTTTTGTCATTGTGTTTGAGTTTGAGACACAACCAGTCATTGGTGGCAGGGGCATATAGTGGTTAGTCTGAAAGGGAGGCTTTCTTAAGAGCTATGTGCCTTCCACCCAGAGCCTTGTGGGAGACCCAGTAAAAAGGAAAAGCATCCTGGGAAATCCAGCTACCATGGCCCTCCCAATGGAGGCATCTTACATTTAGGATACTTCAAGTATCCTCAGAAATGTATTCTGCACCCCCGGCCCCACCCATGCTGAGGGAGGGGATGTTTGCCAATATT
TGCATCATCTTCACATGCACATGTTGCAACAAGAGCTTCTGGGAAGGTAAGCAGCATTGGAGCTAGATCAAGTTTCACAATTAGTGGTTCTTTTCCGTGTTTGTTTTGCACTTTAAAAAGGAGAGAACACATGCAAATGAATCTGCTTGTGTGTATTTGATGGCTCTAAGGGCTATAAATTAAAACAAAACACATCCCAGACATTGGGATTTCATAGATTTATTTAAGGAAGTTGGTAGTTTTAGGAAGTCAACTTTAGTTTTGCTTTATTTGCATGTCCACTAATTTTTTTATTTTGATATTTGTCTTTTTAAAAAAATTTGCAGTAGTTATTAAAAGTTATGTTTCTTTGCTTACTTCATTTTTTTCTCCAATTATTCAAGACTGGAACAAACATAAATATTATTTATTTCAGGTAGCATTTTTTTTCTGTGTAGTTTTTTAATATATATTTGAAGGAAATGTTTCATCTTGTTTTTGGTCTTTGTTTATTCATTTAGACCCTGCAAGTTGATTCTCATTAATTGTCAGATTCCACTACCCTTTCTTCCTCAGAGGTAGTAATTACCAATGTAACTAAGCATTTGTATTCTGATATCTGAGGCCAGTAACTATTAATATCTAGTTCTTTTCAGAGCATTTGGAATGGTTACCTTAAATGACTACCTAAATTGAAATCCTTTTCAGAAAAAATATAATTACAAGTAGAAAGGAGTGGCCTAAATTGTATAATGTAATAAAGTCAGACAAAATGCATACTTTATAGTTTCAGATTTTCAGTATATAAAATGTGTCCATTCCTACCTGGACATGTCCCATTAAAAAGTGGAAGATTTTAAATAATTTCTTTACAGATGTTTTATTTAAGCAGGTAGCACAATCTACTAATGTTGTTTGATCTGTGTTTGTTATACTGGTTGTAATTAATTTTTTTAATTCACGAACTAGCAGAAAGTTTATTAAATTAACTATTAACTACATTCACCTTGTAAATTACTGTATAAAACTTGTTGACAATGCACTGACTTTAGAAAGATGTTAATGTACATAAATAGAGTGTAAATAAAATAGTGTTGATGTACTGAAATATGAACTGTATAAAAAGTATTGGTAATTGTATATGGGGTGTACCTGTTTATCTGTAACTATTATCCAAACAAATTAAATACTGTGGATGCCTCTATGTGCTGTTTTGCCTCATACAAGTAAACACAGAAAGTCAAATTCTTCAA\n>HQ846933.1 Monilinia fructicola isolate HAG7 internal transcribed spacer 1, partial sequence; 5.8S ribosomal RNA gene, complete sequence; and internal transcribed spacer 2, partial sequence \nCCTCCCACCCTTGGGTATTATTACTTTGTTGCTTTGGCGAGCTGCCTTCGGGCCTTGTATGCTCGCCAGAGGATAATTAAACTCTTTTTATTAATGTCGTCTGAGTACTATATAATAGTTAAAACTTTCAACAACGGATCTCTTGGTTCTGGCATCGATGAAGAACGCAGCGAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCCTTGGTATTCCGGGGGGCATGCCTGTTCGAGCGTCATTTCAACCCTCAAGCACAGCTTGGTATTGAGTCTATGTCAGTAATGGCAGGCTCTAAAATCAGTGGCGGCGCCGCTGGGTCCTGAACGTAGTAATATCTCTCGTTACAGGTTCTCAGTGTGCTTCTGCCAAAACCCAAATTTTCT\n>XM_035415524.1 PREDICTED: Anguilla anguilla abl interactor 1-like (LOC118226150), transcript variant X7, mRNA 
\nTCAGTTTTTTTGTATGTAGCTGGTGAAAGGTCGCTGTGGTGAAATCGAGGCCAGGAATCCCACAATACTAGGCGAAGGAGCTCCTTTTCGGGGCTGAGCTTGTGGTTTTAATCAAAGGGAAGGCGAAGAAGCGATGCAGAGACATGTAAGATGGCAGAGTTACAAATGTTGTTAGAAGAGGAAATTCCAGCCGGCAAAAGAGCCCTGGTAGAGAGCTACCAGAACCTCACGAGGGTTGCGGACTATTGTGAAAGCAATTATGTTCAGGCCCAGGACAAGCGGAAAGCTCTGGAAGAGACCAAAGCCTACACCACCCAGTCTCTGGCTAGCGTGGCCTACCAGATCAATGCCTTAGCCAACAACGTGCTACAGCTGCTGGACATCCAGGCATCCCAGCTGAGGAGAATGGAGTCCTCCATCAACCACATCTCCCAGACTGTGGACATCCACAAGGAGAAGGTTGCCAGGCGAGAGATTGGAATTCTGACCACAAACAAGAACACCTCGAGGACCCATAAAATCATCGCCCCCGCCAACATGGAGAGGCCGGTGAGGTACATCCGGAAGCCCGTAGACTACACGGTGCTGGACGACGTGGGCCACGGAGTCAAGTGGCTGAAAGCTAAGCAGGGGAACAACCAGCCGGCCAGAGGAGGGACGCTATCGAGGACCAATCCGCCGACGCAGAAGCCCCCCAGCCCGCCCATGTCCGGGCGTGGCACTCTCGGACGCAACACACCATACAAAACCCTGGAACCCGTTAAGCCTCCTGTCCTGCCCAACGACTACATGACCAGCCCCGCCCGCCTGGGCAGCCAGCACAGCCCTGGGCGCACAGCCTCCCTCAGCCAGAGGCCCAGAACTCACAGTGGAAGCAGCGGGGGCAGCGGCAGTCGTGAGAACAGCGGCAGCAGCAGCGGCGTTGGCATTCCACTAGCGGTGCCTACGCCTTCTCCACCCACTATGGCACCAGCAGTGGCCCCAGGGCCCGGTCCAGGCCCGATTCCCATGTCCCAGTTTGGCACGCTGTCTCGGCAGATCTCCAGGCACAATTCCACCACCTCCTCAGTCTCCACGGTTTCGGCCACGGGGACGTACAGGCGGGCCCCCTCCGTCACGTCCCAGTTCTCAGTCCAGCAGCCGCACATTAACGGCGGCCCCCAGGTGTACCCCCAGAACTCAATCGCCGACACCCCCAGCCTCCCGCCCCCTCCTCCCCCGGACGATGTCCCGATGTTCGACGAATCCCCGCCGCCACCCCCTCCACCGCCGGTGGACTACGAGGACGAGGATGCGGCCGTCGTGCACTACAACGACCCCTATGCGGACGGCGACCCTCAATGGGCCCCCAAGACGTACACTGAAAAAGTGGTGGCCATATACGACTACAGCAAGGACAAGGACGATGAGCTGTCTTTTATGGAGGGGGCAATCATCTACATCATCAAGAAGAACGACGACGGCTGGTTCGAGGGGGTCTGCAACGGCGTTACTGGCCTCTTCCCTGGAAACTACGTGGAGTCCATCATGCACTATGCTGACTAAAGACACCCCTTTTTTCTTCAGTCATCCCAAGACCATTATAAAAAAAGCATAACACTGGTCTACAAAAGCATATGTATAAGTGCATTAGAAAATGACCGAATGTTTGTTCCTTATTGAATTGCAAATAAAATAAATTCTATTTAGTTTTTTTGGTGGGAAGATTGTGGGATATAATGTATTACTTTGATGAGGTCCAATGGCTTGGTTGATCACATGCTCATGTCTGTCAGTTGTCCTGTCAGTTAATTGTATATAATGTTGAGGGCTGCAATTGGGTTGTTGGTAGTGTTACTGTTAATATTGATAAATGTCCTGAGCAGTGGATGCCACAAGTGAACATGTTAAAGTAGGGATTATGTTTTATAATGAGTCCGGTTATAAATTGTGCCATTTTCCCCCCTACCTTATCTTCCTCAGAAGACACAAGACCAATTTAATGCATTTTGGATCCTG
AATGCAAACTTAACTGCTTGCCAGAATTGCAGACTTTTTTTTAGAACAGTGTTTCCTGGCTACTCGTAATTCCTGAAATGTACTTATCTTGCCGTGAAGCATGCACACAAAAGAACTGTAACATATACTTTATTTCCATTATGCTTCCAGTATGGTGTAATATTTACAGTGAGCACTCAAAATTAGTTTTTTTAAATGAAATGTCTGAAGCGGTTGTTTAAAGTCGTATTCTTTTTTCTGAAATGCTCTAATTTGTATTTAAAACATTTGATATGATTACATTTACATTAATAATTTCTACATTGAGTTATATATGTAAAACAAGGCTGTTTTGTTGGTAAGGTGTCTCAGAAGTCTGGAACCCTTGCCATTTGCTTGATACAGGTGTTGAAATGGTTTAAATTTCCAATCATTTATAGTTACAAAAGCAAAACCTCAAGTCATTAAAATTTCTGTGGAGAAAATACATGGTTCTAAAAACTTCAGTTAATTGGATGTTCTGTGTTTTAGTGTTAATGAGCTCTATCAAACATGGATATTTTAGATGTGGCCAAAATGTGCTCAGTTGGGTTATAACTGTTTCTCATCTGTCACCTAAAAAGCCATATGAATATTCCATTTTTAAAAATTGTAATGAAAACCAATACAACATATTCCTCTTCCTGAGAGGAAAAACAAGGGAGTTGCCATCCTGTCAAAGTATTGGTTTACTATTTTTAAAAATTTAATTACTCCATTAATTGTCTAGGTTCATAACTCAGGTCTAGTAATCTCCTTTGTTATTAAACAATCACTACAACAGAGCAAGGCAATGCCATCTTTTCATCTCTTAGTTTTGTACATTTTCTGTATTTTATAATGTATGAACATAAGTTTGAACCTTACCACTAAACCTGCTTTAAAAGGAAGTCACTCCTTCAAGTTTCACCTCTTCTTGAAAAATCCATTAGGTTGAAACTGACTGCTTACAGTATATTAATCACCAATGTGTGTTTCAGGATATTATCGCCAATTCCTTGATTCTTCAGTGTACGCTTTGGTATATTAAATGTGGAAAATTGCTAAATTCTTGCTTTCCTTTGGGAAGAACCCAAAACTTCTCTTCCAACCATAATTTGTATATATAAAAATGTTAATGAAATTTATGTACAGCTTTTTTATATAATAAATCATTCTCCTATATA\n>XM_017904422.1 PREDICTED: Eufriesea mexicana facilitated trehalose transporter Tret1 (LOC108550645), transcript variant X4, mRNA 
\nATTAAAAATCGAAGCAAGAAAAAATGGCGACATCCAAAACTCAGATAAATCATCTTTAGTGGAGTCAACATTACTTCCAAAAACCCAGTCAGTTAACCAGTTGGAAGATGGAAGACCTGAGCTTGCAACCAACAGTGGATACAGCGATGATGGAAATGGTCGAAATGTTAGTGGAAGTGTCATCAAACAAGTTCTGGCAGCAATAGTAGCGCAACTTGGGACCATTAACACTGGTATGACTTTTGGTTTTTCTGCCATTGCACTACCACAACTTCAGGAACAAAATAGCACCATTCCTATCGTCGAGGGATCATCCGAAGAATCATGGATCGCGAGTATGTCTTCCATTGGAACTCCCATTGGTTGTTTAGTGTCTGGATATATGATGGACGTACTTGGAAGAAAACGATCTCTCATTATTACTGAGATTCCAGCATTACTTGGATGGATATTAATTGCATTAGCAACTGATATTCGTATGATATATGCTGGAAGATTCTTCGTTGGACTTGGATCGGGTATGGTAGGCGCTCCAGCACGCGTCTATACTGGAGAAGTAACACAACCCCATCTACGAGGAATGTTGACTGCTTTTGCAAGTATTGGAGTCAGCACTGGTGTTCTGATCGAGTATGCATTAGGAAGCGCACTTACATGGAACGTCTGCGCAGCTATTAGTGGAATTATACCTCTTGCCGCTCTGCTGTTAATGTTTCTCTTTCCTGAGACACCTTCATACCTCATATCTCGTAGTAGACCTGAAAAGGCACGAAAAGCGTTACGACAATTTCGCGGTAGTACATATAATATTAATCAGGAAATGGAAACACTTATTAATTTTTCAAATAAGAATAATATTAAGCGTTTAACAGGATTCCGTGAGATAATTAGCGCCCTTTTAAAGCCTAATGCTGTCAAACCTTTTACTGTCCTATTCTTGTACTTCTTAATATACCAATGGTCAGGTACAAATGTCATAACTTTTTATGCTGTTGAAATTTTTAAAGATTCAGGAGCAACGTTAAATAAGTACTTAGCTGCAGTAATTCTCGGAATAGTAAGATTAATATCAACGGTTGCCGCTTGTATCTTGTGTAGAAAGTGTGGCCGAAGGCCCCTTACAATGATTTCTTCCATCGGTTGTGGACTTTCCATGGTAGGATTAGGTGGATATATGTGGCTGAAAAATAACTGGGATGCAAATAATTTTACACCTGTTGCTACTTGGTTCCCTGTCTTTTGTATATTTGCATATACTGTAACTTGCACACTTGGTTTTCTTGTTATTCCTTGGGTAATGATAGGCGAGGTATATCCAATACAAGTACGCGGTATTATTGGAGGTTTAACTACAATGGCAGCCCACTCTTTTATTTTTACAGTAGTTAAAACGTATCCGTTCCTAGCTAACGCACTTACTCGGCACGGTACTTTCATCCTTTATGGTTGTATATCTTTATTCGGCACGATATATTTTTATCTATGTCTTCCCGAAACTAAGGGTAAAACTCTTCAAGAAATAGAAGATTACTTTTCTGGTAGAAACAATAACTTAAGAACCGGAAGTATAGGTAAACATAAGCCAAAGGTATTAGAAGTAAAAAAGGGTCACATATTGCCTTGAATAACTCATACAGTGAACATCTTAATAAAATTAAATTAATAAATCTGTCTTCCATTGAACAAAT\n>XM_001378120.4 PREDICTED: Monodelphis domestica inhibin beta C (INHBC), mRNA 
\nACCCTGCTTTGTACTTTAGCTACTTATCAGTTGGCAGAGTCTGCCAAGTTCTAGTGTTGGTCTTGTCCTTCTCAAGCCAGATGTGCGGCCACCATCTCTCCCAAGGTAAAGAATCATGCCAGCTGGACACACACCTTTGGTGTGGACTCTAGCATTTAAAACTCAAGTGGCATAGTGGCTGAAGCCCTGAGCCCCAGATTTAAGGTGTTTCTTCTTCCAGAGGAAGACCCAGCTGAAAATGGTCTCTACTCTGCTCCTGAGTCTCCTGCTCTTGATTCCAGCTGCAGCAGGGACCGAATGGATTGATGGTCAATGTCCAGCATGTGGGGTGCCTGGTTCAGATCCTGAGAGACAGAGGGAAATACTGCTCAATCTGGCAAAGCAAAATATCCTGGATAAACTGCACTTAACTCAACGCCCGACACTGATCCAGCCTGTGTCCAAAGCCACCCTGAGAACTGCACTTCGACGCCTCCACGGTCTCCAAGGAGGAAGGATTGTGCCTGGTAGCACTTTAGGGGGTTCTGGGACTGGAGTTGAGGAACAGGAGTATGAGATCATCAGTTTTGCTGAGACAGGCTACTCTACCACCAACAGGACGGTGCTGGATTTCCAACTCTCCCCAGATCAAAGCAGTGGTAGCTTGGAGGTCCTCCAAGCCAGGCTGGGTTTTTTCTTGAAGATTCCTCCCAATGGCACATGGACTATGCACGTGAGGGTCCTGGGGCCTGGGCCCCGGGACACCAACCTCACTTTGACCACCCAACACCAGCTAGAGGTAGATGCCAGTGGCTGGCACCAGTTCCTCCTGGGGCCAGAGGCCCAGGCTGCTTATGGTCAAGGGCATCTGACCCTAGAATTGGAGGCCAAAGGCTGGGGAGCCCAGGGCCCAGTTTTCTTGGAAAAGGATGCCCATCAGCCCTTTATAGTAGCTCAGGTGAGAATAGGAGAAAAGCACCGGATTCATCGTCGAGGCATCGAGTGCCAAGGTGGGTCTCAGATGTGTTGTCGACAAGAGTTCTTTGTAGATTTCCGGGAGATTGGCTGGAATGACTGGATCATTCAACCTGAAGGTTATGCTATGAACTTCTGTACAGGGCAGTGCCCACTACATGTGGCAGGCATGCCAGGAATCGCTGCCTCTTTCCACACTGCTGTGCTTAACTTGCTCAAGGCTAATGGGGCCCCAGGAACAACTGGAGGAGGCTCCTGCTGTGTGCCTACTGCCCGCCGCCCTTTGTCCCTTCTCTACTATGACCGCGACAGCAACATTGTCAAGACTGACATCCCAGATATGGTGGTGGAGGCCTGTGGCTGCAGTTAATGTGTATAAAAGGGAAGGAGGACACGCAGAAGAGGACATTCACTTAGAGATTCCCTTCTCATCTCAGGCAGGTTGTTCACAAATTCTTCCACAACCCATAATGGGGAACCAAGGCATTTCTGGAAATCCTTCCACTCTCCCTCTGGACATTCTATTGAAGCATCTGGTAGCAGGGTAGACAGAGAGCACTGGACCTCAGCAAGACCGAGTTCAAAGTTGGCTTCAGTATGACCTGGAGCAAATCACTTGTCTTTATAGTCTCCTCAGCTATAAAATGGGAACAATAATAGTACCTATCTCACAGGATGGTTGCATGAATGAAATGAGATGTTTGTAAAAAAGTACCATAGTACTTGGTGCATAGCA\n>XM_017900195.1 PREDICTED: Eufriesea mexicana UPF0769 protein C21orf59 homolog (LOC108547609), mRNA 
\nATGGTCCGGATGCACGTGAAGAGAGGCGAGGAGAGCCAGTTTCTGTACGACACACACGTGGAGGCTCGGGTTGAAGACATTATATACGGCATTACTATTATTTACAACGGCCGGCTGAAGATCTCGAGAATATGTTATGAAATCGAGGAGCTGGCCAAGCACGGCACCATGCTGCCCCATAACATCATGGGCCTCACCGACGAGCAGGTAGAGGAGCTGAAGCTCAAGGACGAGTGGGGCGAGAAGTGCGTACCGATGGGCGGATGGACCTTTAACAAGGACGTTATCGGCCGCAGAAACGGCAGACAGCCTAACGCGAAGATGCAGGAGGTCTTGAACAAAACGATCGGGGAGGCACGAGCTATGGTTTCAAAGAAATTGATACAAGAGGAAAAACTGGTGACGCAGAAAACTGTGCAAGATGCACTGGATATACTGAGGGGGGCCGTAACGATTGTGTATCCGATGGGACTTCCGCCTCACGATACGATCCGACAGGAATTCGAAAACACCGAGGATCTGAGTGGCACTCAGGCATCTCTCGAAGTTATCGACGTACAACTGGCGCAACTTTGGTTCTCGGGAAAGGAAATGTTACCGGGAAGAAAATTAAAAGATTATTTGGGGATGAACGAGAAAACCAAGATTATCGTGAAGCTGCAGAAAAGAGGAGCCGGAAGACCTGCTCGTGAACCTCTGATGTCAGAGGACGAAAGGAAAGAACTAATGCTGCATGCATATAAACGACAAGAACAACTCAAGATTTCTATCGTGGATAGTGATATTATGTTAACACAAGCGGGTAAAATCAGTTTTCTGATAATTCTCTCAATTTTTCTTCGGTTATGCAGTGCCATGTGGAGAATATTGTGGTGCCTGGGTAAACCATATAAAGCTTAG\n>XM_007934287.1 Pseudocercospora fijiensis CIRAD86 uncharacterized protein (MYCFIDRAFT_46883), partial mRNA \nATGGCCGCGCCTGCACAAAATGGCCCTGTGCCCGCGGGCGCCCCTGCAAAAGCGACAGAAGCGCAACTCATCACTGCCTTTGACAACTCAATATGGTATCTACTTGACCTATGGCAACCGCTATCCATCGCAGTGGATAATGGCTGGGGCGGAGGGAATTCTTCAGACAAGCGCGACTGGTTCGCCGGCGCAGTTTCCGATTTCTTGAATCAACCGCAGTATATCAATCCTGCTCCGGGTGCTGTGCTCACCTTCGCCGACATGCAAGAAGATCTCGAAGTTTTCCTCCTACAAATCATGCAGGACGAGTTTGACTGCAACATCGAAGACGAATCGGAAGTGGAGCTTGCGAACGGCATCCTCAGAGTGCGAAAAGCCATGACTGAGACCTTAAGCACGGCTGCGGCGGACGAGGTGAAACAGAGATGGGAGAATCGAGGAAGCAAAAAGCATGAAAAGATTGTGGTTCAGGAAACGAACCAGGAAGTTGGCGACGACGAAGAGTGGGATGGTTTTGATGAGGACGAGGATATGGACGAGGCGCCACAGCTCCTGCAAGCGCCTGCACAGCCGCGAGAAAAGCCTATACCTGAGGTTGACGAGGACGGATTCACAAAAGTCCCGAGCAAGAAAAAGAGATGA\n>XM_007491848.2 PREDICTED: Monodelphis domestica cytochrome c oxidase subunit 6B1 (LOC100013297), transcript variant X1, mRNA 
\nCGTTCCAGGCCTACGCTTCCGCTTCCGGTCTCGGACCCTTAGTGCTGAGGGTCACATTGAATCTGCGGTGCCCGCGGGATTAGCAGCGGAGACAACTACAGTGACAGCGGTAGGAGCGGCCTCAGTCCAGGAGCCACCATGTCTGATGATATCAAGGCCAAGATCCGAAACTACCGCACTGCGCCCTTTGACAGCCGCTTCCCCAATCAGAACCAGACCCGCAACTGCTGGCAGAACTACCTGGACTTTCACCGTTGTGAGAAGGCCATGACTGAGAGAGGCGGTGATGTGTCTGTCTGCCAGTGGTACAAACGTGTCTACAAGTCCCTCTGTCCCTTGTCCTGGGTCAGTAATTGGGATGATCGCAGAGCAGAAGAAACCTTCCCTGGAAAGATCTGAGCGACTTCCTTTTCCTCCCTTCTCCCCGACCCCAATGTCTGGGGCTGGATCCCTTCTTCCCTCAGCGTGGGGGGAATGTGATCTGTGGCTACCCCTGCCCTGAGGGGCCTGAATCATGTTAAAATAAACTGTTGGAATC\n>XM_024666474.1 PREDICTED: Selaginella moellendorffii aquaporin NIP1-1-like (LOC112343293), mRNA \nCCCTGCGCCGCGCGCCTCTATACTCTCCCAAAGTCTCCACAATTTATGGCCGCTTATAAAAGCTTGCACGACTTCTCTGCCTCCTCGCGCACAACCATCTCTCCTCTCCCCAATTCCTCGCCTGATCGAATGTGATCGCTTCTTGGGCTGTGCTGCGACGACCTTCCTGACCCGATCCATGGCAGCAGCGGCGGCAGGGATGAGCGATTTCCAGCTCAACGAGATCCGGGTCACGCCAGCGCCCTCCATCGCTCTCCCCGCGAATGGCCACCAGATTCATCACCAGGCCTCGCCTCCCGCGGCCTCTAGGGGATGCATTCCAGTCGCCATCGTGCCCAAATCCACGCTCTTCCAGAAGATTGGCGCGGAAGTGATCAGCACATTCATCCTCGTCTTCGCGGGATGTGGCGCCGCGATGGTGGACGCCAAGTACAAGGATTCGATCACCCACTTGGGCGTCTCGGCGGCGTTTGGGCTCGTGGTGATGATCATGGTCTACGCCGTCGGCCACATCTCTGGAGCTCACATGAATCCGGCCGTGACTCTGGCGTTTGCGACCGTGCGCCATTTCCCCTGGAAGCAAGTTCCTGCCTACATCGGCGCACAGGTCACTGCCGCGATCACTGCCGCGTTTGCGCTGCGGCTGATCATCAGCCCCGTGGCTAACATCGGTGCCACAATTCCCGCTGGAAGCGATCTCCAGTCCTTCTATCTGGAAGCGATCATCACCTACATTCTCATGTTCGTCGTCTCCGCCGTCGCCACCGACACTCGAGCGATTGGAGAATTGGCAGGCCTCGCAATCGGTGCTACAGTGGGCTTGAATGCCATCTTCGCCGGGCCGATTTCGGGCGCGTCAATGAATCCAGCACGAAGCTTGGGCCCCGCGATCGCCGCGAACAACTACAGTGGATTGTGGGTTTACATTGTCGGCCCGACAGTCGGCGCGCTGGCGGGTGCGTGTTCTTACAACATGATCCGGTTGCCCGTGAAGCCGGACGAGCTCCCCAGGGCCGCTAGCTTCAAGAGATAGAACAAGGCTGTAAAAAGAATAGCAGCTTTTAGGTGACCACCTAAGTGATAACTCAAGTAAAAAAATAACTAGTTAGCCGTGTCTCGGTTA\n>FQ756522.1 16S rRNA amplicon fragment from a soil sample (ferralsol, Madagascar) resulting from a 16 days laboratory incubation experiment in the presence of 13C-enriched wheat-straw and a tropical peregrine endogeic earthworm, 
Pontoscolex corethrurus: Light-DNA fraction (DNA-SIP technique) \nTAGCCTTGCGGCCGTACTCCCCAGGCGGGGCACTTAATGCGTTAGCTACGGCACGGAACCCGTCGATAAGGCCCCACACCTAGTGCCCAACGTTTACGGCGTGGACTACCAGGGTATCTAATCCTGTTCGCTCCCCACGCTTTCGCTCATCAGCGTCAGTACCGGCCCAGACCACCGCCTTCGCCACCGGTGTTCCTCCTGATATCTGCGCATTTCACCGCTACACCAGGAATTCCGTGGTCCCCTACCGGACTCCAGCCATAGAAGTATCGAGTGGCCGCTCCAGGTTGAGCCTGGAGGTTTCACACCCGACTTTCCAAGCCGCCTACGAGCTCTTTACGCCCAATGAATCCGGACAACGCTC\n>XM_047971315.1 Xylaria bambusicola Gar1/Naf1 RNA binding region-domain-containing protein (F5B22DRAFT_384725), mRNA \nTCTTTTTGCGATACTCGAAGAGACAACTTGACATTGAAATACTACAAAGCTATATATACACCCCATGATCTTCTCAATTGTTCTCACCAGGTTTCTATGGTAGCTGCATCTCGCCCTGTCTACTTACTTAGGTTGGTATTCGGTGAGTTTGCTGTCTGGTATCAGTACCAGATCTACAAGAATCCATCGCCACAAGCAGCCTATCCGTGAAAGCAATAATCCCAGAATCAACACCTACATCACCAACACCGTCATGTCTGACGTCAAAATTCCTGGACTTGGCAACTTGCAACCCGCCGCGGATACAGAGAGTGGCAATGTCCAGCCTACTGCGGTGCCTGCGGTGCCGGCAGACGAAATGGCGGTTGATAATCCACCAAGTCCACCATCACTCACGTCGGGACTCGAAGCCCTCCTTGGTGGCCTAGACCCTCTACCAGAGCCAGTGCCCGCTTCATCAGAACAAAGTAAAGATACCACTGGTGCTCTACCGGAAACAAACAACACAGCTGTATCAGAGACTGAAAATCCAGCGCAAGCCAGCGCCTCCCAAGAAGCTGGTAATGATAACGTGCAAGAAGAGCATCCAGAGTGGGAAGTGGACTCATCTCCCTACGAGTCATCTTCCGACTCTAGCAGCTCGGATGACTCTGATGAGGACTCTGACGATGAGAAAGACTATAAGATTCTTGGGCCCGAGGAGACCGCCCGTATACTCATGGAAATGGATGGTGGGTCTGACGACGAAGGTGATGGCAAGGGAAAAGGTAGCAGTTCTGGTATGGTACGAACCAAAAATGAGCTCCCTGAAGCCATCGTCCCGCGACCCGAAGTTGAGATCAAACCTGAGATGGAGATAGTTGAGCTGGGTTCGATTGAGCATTTCGTTGGCAACACCGCTGTCATCAAAGCAAATACCGACGGAGAGTACCAAGTCCTCGACACAGGATCTGTGCTTTGTCTTGCAGACCGAACCGTGATAGCTGCCGTGGCGGATGTCATCGCGGCGGTGCGGGAGCCTCGGTATACCGCTGGCTTCCAAAACGAAGAAGAGATCAAGTCTTTCGGATTAGAGACTGGAACCAAGATCTTCTACCCACCTGCACTAGCAAGTCTTGGGTTCACAGAGATGCTCAAAGCCAACAAGGGCACAGATGCAAGTAACTGGCACGACGAGGAGGTCGCTGAAGACGAAATCGAATTCTCGGATGATGAGAAGGAGGCAGAGCACAAGCGCCAATTGAAAGCCAAAAAGCGAGGGGCACGTGGTGGTCGAGAGGGTGCGGCGAGTCGAGGAGGACGTAACGATGCTATTCCTGCGGGTGCCTCCATGGCCTCGGCTGAATTGAAGTACGATGATAATGACGATGATGACGGCCCTTACCGACCGCTAGCTCGTCCAGTAGGATTTGGGCAAAACCAAGCCTCCCATGGAAGCAGTGAGCCTCC
GAGTGGCTTCTCTGGCCATTCCGGTGGTCATTGGGGAAATCGAGGCGACTTTAGAGGCAGAGGGAGCCGTGGCCGGGGCGGACGTGGCAATCGTGGTGGCAATGTGCGTGGCGGATATTCACTACCACCAAGACCACAAGGTCAAGACGGCCAGGGAGCGCAAAGTTACCACCAACAACAACCACCTGCGCAACAGTACAGTCTACCTCCTATGGTGATGGGTGGTCAACCCTTTACAAGCTTAAGTCCTCCTCAACCCAACGCTCAGCAACCACATGGACCTGCCAACCAGCAGTTTCCCTTCCCCTGGCCACAAAATGCTCAACCAGGCTTTTATCCTCCTCCACCACCTCAATTCACAGGCCAGTCTGGTGCAAATGGGATGTATTTACCGCCCAATTTCTTGACAGCTCTACAAAATCAGATGCAAGCCCAACAAAATCAACAAAACAACCAGTGGCCCGGTCCACATGGCCAACACAACACTAACTCATGGCCTGGACAAGGAGGCCACGGGTAAAAATTTAGCATGTCGTTTGCTTGTGCTGGGGAAATCGGCACGTGGATTATAGGCAATAGGTTGTGGCATGGATCTAACATTTTAGGCGCATATACTCTGGCCAGCTGTGATGGCGAAAGTAAGGACAGGGCTGCCCAGCATGGACCTTGTTCAAAATAACGATGATGACTACCGTACTCTTGGTAGCACGTACGGCTCATTTGCTCGCTAACTGGCTATTGGCCTGAACTGACAGAGAAGAGAACGTCCCTCGGCTGAACTGTCGATCGCGCCTTATCTACATACTTTGTACGTGTGGTTGTGACTAAAAGTCGAGTCGCCCCGTTTCCGTACGATAATATATATTATATGCTCCCTAAAATATGATTATATTTGATGCCACTCTTGTTCTCAGGGAGGCTGACATGCTGTTATTTTGCTGCGTCTTGATGCGACTGGTG\n>XM_014964001.1 PREDICTED: Calidris pugnax family with sequence similarity 19 (chemokine (C-C motif)-like), member A2 (FAM19A2), transcript variant X1, mRNA \nTTTTTTTTTTTTTTTTTCCCCCACTCAAATACTCTGAGACCGTGCACGAGAAACACTTCAAGTGGTCCCTCCCTTCCTACTTCCTTCACCCTTCCTCCAGCGTCTCTTTACCGGATTCCTGGTGTATTCCAAGGGAGAGGCGGGGGGAGAGGCGGCGGAGGGCTGCCTGCCCCAGCCCGGCCCAGCCGAGGGGAGCCGAGCCGAGGCGGGCGCGGTGCCGCTCCATGCCCCCGGGCGCTGGCGGGGCGCGGGCCGTCTGCCGGCGATGCCCGGGCGGTGAGGCTGGAGCTGGAGCCGGAGCTCCCTCCCGACGGGAGGCGGCCGATCCCTAGGTGTTTCCAGGAGGAAGCGGGGCTGCAGGATGAATAAGAGATACTTACAGAAAGCAACAAAAGGAAAACTGCTAATAATAATATTTGTTGTAACTTTGTGGGGGAAATTAGCATCTGGGGCAAATCATCATAAAGCTCACCATGTTAAAACTGGGACCTGTGAAGTGGTGGCACTCCACAGATGTTGCAATAAGAACAAGATAGAAGAAAGATCACAAACAGTGAAGTGCTCCTGTTTCCCTGGGCAGGTGGCGGGTACCACCCGGGCAGCTCCTTCTTGTGTTGATGCTTCAATAGTGGAGCAGAAATGGTGGTGCCACATGCAACCATGTCTTGAAGGAGAGGAATGTAAAGTTCTTCCAGATCGTAAGGGATGGAGCTGTTCCTCTGGGAATAAAGTAAAAACAACGAGGGTAGGTATAATACCAACTTTACATGTTACCAACAGGTAA\n>XM_012986102.1 PREDICTED: Erythranthe guttatus probable polyamine oxidase 4 (LOC105961838), 
mRNA \nAAAAATCCCGAATTTACCCCTAGCCGAACAGAAAAATATCATGCACAAACAACAAACCGCGTACCCCTACGTCTCCTCTTTAAGTTAATCCGGACAACCAGCCTTTTTTCTTCTGCCTAACAAACAAATTTCTAGAGAGAGAGAGAGAGACAGACGGTGGTAGAGAGAGAGAGAGAGAGAAAGTAGGGGGAGAGCCAATCTATGCAACCGAGGACGAAGAATTCATCGGTTGGTGTAATTGAATCTTCTGGTTGTTGCCGTGAATGCAGCTCCTGCAATTGTTGCTATTATGATTATTATGAGCTTGTTTGACGATAACCTCCGCTGCGCTTCCAGTCTCAGCCGCCTCATTGCCGGACTTTTGCTTTTCCTCCTCTTTCATTCTTCCCAATTGATTTCTAATTTTCCGATTCCTATACACCCGTAATTTTTCGTTTTTTTTTTTTTGAAAAATTGTTGTTGGTAAGATCAGATTTGGTTCTCCATCAATTTTCATTCCCAGTTAGGGTTCTCTGAATTTGTTTGTGAGAGAGAGAGGTAGAGATAGAGAGAGAGATAGGTATTTTCAGTTGTCGATTAATGGAAGTCAAATATGGCGACGATTCGATCTCCGGCGAGTTTTTTGATGGCATTTACGGCTCCCTTGTAGAGAGGCCACACAATGCACTGCCTTCTGTCATCGTCATCGGTGGAGGAATATCAGGGATTGCAGCTGCACGCATGCTGCGTAATGCATCTTTTAAGGTGATCGTGATGGAGTCGCAAGATAGAATTGGTGGGCGCATTCACACCGATTACTCATTTGGTTGCCCAGTTGACATGGGAGCTTCCTGGTTGCATGGTGTCTGCAATGAGAATCCTTTGTCTCACGTGATACGTCGTTTGGGGCTCACGTTGTATCGTACAAGTGGTGATGACTCCATTCTGTATGACCACGACTTGGAAAGTTATGCACTCTTTGACATAAATGGACATCAAGTTCCCAAGAAAATGGTTATTGAAGTTGGAGTTGCATTTCAGAAAATCCTTGACGAGACGGATAAAGTGAGGGATGAACAAACCGACGACATATCTGTGAAGGAAGCAATATCAATCGTGCTGGATAGATATCCAGATTTAAGACAAGAAGGCGTCGCATGTGAAGTGTTGCAGTGGTACATTTGTAGAATGGAGGCTTGGTTTGCTGCTGATGCAGACATGATATCTCTGAAAGCGTGGGACCAGGAGAGAGTTCTTTCTGGTGGTCATGGGCTTATGGTGCAAGGGTACGATCCAGTCATAAAGGCCCTCTCAAGAGATATTGATATTCGCTTAAATCACCGAGTTGTAAAAATTGTGAACGGGTATAAGAAGGTGGTAGTAACACTTGAAGATGGGAGAAACTTCGTTGCAGATGCTGCTATTGTCACAGTGCCATTGGGAATTCTAAAATCCAACTTGATTGAGTTCGAGCCTAAGTTGCCAGAGTGGAAGCAGTCTGCAATATCAGATCTTGGTGTGGGAAATGAGAATAAAATTGCCTTAAAATTTGATAATGTTTTTTGGCCAAATGTGGAATATTTGGGCGTGGTTGCGAAAACGTCTTATTCGTGTGGCTATTTTCTTAATCTCCACAAGGCTACAGGCAATCCCGTCCTTGTCTATATGGCAGCTGGAGCACTTGCGGATGACCTTGAGAAGCTATCAGATGAAGCTGCTGTCGGTTTTGTAATGTCACAGCTTAAGCAAATGTTTCCTGATGCAACTAACCCTGTGCAGTACCTTGTATCACATTGGGGAACAGATCCAAACATTTTGGGATGCTATTCGTACGATGCTGTGGGGAATACAGAGGATATATACGACAGGCTTCGTGCACCAGTGGGGAATCTTTTCTTTGGAGGTGAAGCTGTAAGCGTTGATCATCAAGGATCGGTACACGGCGCGTATTCTGCTGGAATAATGGCTGCTGAAAACTGTCAAATGCATCTTATGCAGAGGCTCGGGGGTCTGG
AAAGAGTTTCTGTCGTTGCCTGTCGGGAGGATCTTGTCGAGGCTAACGTTCCTCTTCAGATATCGAGATTATAAGTTATTTGTAATGCCAAGGAAATAAAGATAGTGCAACTTGGTTTTAGGACCGGCAAATGTGTGAACAAAGTTTTCCTTTTTTTTTTTTTTTTTGCCTTTTCTTCAAGCAGTGTGGAAACTACATTGTTCCTTTTAACTTTTGTTAGAAGTGATGCTTTGGTAGTTGATGAGTGGTAGCGCCTTTTTAAGAACTCAATTACTACAAGCAGAACAATGTTATTGGTACTTTGTTTTCAGACCA\n>XM_030648245.1 PREDICTED: Cannabis sativa haloacid dehalogenase-like hydrolase domain-containing protein 3 (LOC115719273), mRNA \nGCATGAAAAAGGGGTTAAAAAAAAGAATCAAAAGGGTACGTTAGAGCGGTTTTAGGCCATAGTTTTTCTCCGCCTTTGTTTTGGTGTTCTTTAAAGACTTAGGTTCAGCTGCCCTCTACAATCTACATCTACTTCCTTCCTCCGAAGCCAAACTCGGTTAATGTGGGGAATAACACCATTGCTCTTACCCATATACCAAAGCTATTCAACCACCACACACACACACAAAGAGAGATATCATTGGAGCTGTTGAAGGAGGTTGTTAGAATTAAAGTGTGTCACTTTATGATTTGACCATTTCTTCATAACAAGAGTTAGATAGTCTCATCAATTATCATACTTATAGAAAACTTATTACAGTAATTCTATAATGTCAATTTTGTCAAAATTACGATGTATTACGGTGGATGTAACTGGTACATTGATGGCTTACAAGGGAGAGTTAGGAGACTACTATTGCATGGCAGCCAAATCTGTTGGTCTGCCTTGCCCTGACTATAAACGGGTACATGAGGGCTTCAAACATGCATATAAAGACATGGCTCAAAAGTATCCATGTTTTGGATATGCTGCCAAAATGCCCAACATTGTGTGGTGGAAAACTTGTGTAAGAGACTCATTTATCAGGGCCGGTTATGACTACGATGAAGAGACATTTGAAAAGGTGTTTAGACGCATATATGCTTCATTTGGTTCTTCCGCCCCTTACACCATCTTTCCAGACTCCCAACCATTTTTAAGATGGGTCCGTGAGCAGGGTCTTCAGGTTGGCATTATTAGCAATGCAGAATACCGGTATAAAGAAGTGATTCTTCCAGCATTGGGCCTGAACGAGGGATCTGACTGGGACTTTGGTGTATTTTCTGGTCTCGAAGGCGTTGAGAAACCGGATCCAAGGATTTACGAAATTGCCCTTGAGAGGGCTGGAAATCTTCCTCCAGAACAAGTACTGCATATCGGTGACAGTATGCGGAAAGATTATGTGCCAGCAAAGAGTGTAGGAATGCATGCATTATTGTTGGATCGATTTAAGACAACTGATGCCGAAGAATGGAGGAAATCTGGCGCAATTGTGCTCCCTGATTTGATGGGAGCAAAAGAATGGCTTCTTTCAGACAAGTCATGAAGAAGAAGCATGATTGGATTTTTCTCTCCCCCTTGAAAGGAAAGATTGGTTAGTGGCTAGCAGAGATTGTTTTCTCACAAAGTGAGGCTTCACTCTAATCTATATGTACACAAGTTAGAAAAGTTTGATGAATGAGAAAATGAAACCTGCTAGATTATGAAAATGACTCTAATAATTAAATAGAAATAAAATACAGGATAGGGGAAGAGTTGCACCATTTGCGTTTTTATTTTATTGAGTAATTTTTAAATATAAATATAGTTGAACAATGATGGGTCAAATTATAAACAAAAGTGTGAAGCAGACACTTTTATTAA\n>XM_012066938.1 PREDICTED: Cercocebus atys POU class 3 homeobox 2 (POU3F2), mRNA 
\nGGGGGGAGCGCCGAGCTAGTCAGAGAGTGAGCGAGAGCGAGAAGGAGGGAGAGGAGGAGAAAGAGAGCGAGGGCGGGCAGGCGGGAGGCGGCGGCGGCGGCAGCAGCAGCAGTAATAGCAGGAGCAGCAACAGAAGGCGTCGGAGCGGGCGTCGGAGCTGCCCGCTGTGGGAGAGAGAGGAGAAAGAGCTAGCGAGGAGAGGGAGCCCGAGGCGAAAAAGTAACTGTCAAATGCGCGGCTCCTTTAACCGGAGCGCTCAGTCCGGCTCCGAGAGTCATGGCGACCGCAGCGTCTAACCACTACAGCCTGCTCACCTCCAGCGCCTCCATCGTGCACGCCGAGCCGCCCGGCGGCATGCAGCAGGGCGCGGGGGGCTACCGCGAAGCGCAGAGCCTGGTGCAGGGCGACTACGGCGCGCTGCAGAGCAACGGACACCCGCTCAGCCACGCTCACCAGTGGATCACCGCGCTGTCCCACGGCGGCGGCGGCGGGGGCGGCGGCGGCGGCGGGGGGGGCGGGGGCGGCGGCGGGGGCGGTGGCGACGGCTCCCCGTGGTCCACCAGCCCCCTGGGCCAGCCGGACATCAAGCCCTCGGTGGTGGTGCAGCAGGGCGGCCGCGGCGACGAGCTGCACGGGCCAGGCGCCCTGCAGCAGCAGCACCAGCAGCAGCAACAGCAACAGCAGCAGCAACAGCAGCAACAGCAGCAGCAGCAGCAGCAACAGCGGCCGCCGCATCTGGTGCACCACGCCGCTAACCACCACCCGGGGCCCGGGGCATGGCGGAGCGCGGCGGCTACAGCGCACCTCCCACCCTCCATGGGAGCGTCCAACGGCGGCTTGCTCTACTCGCAGCCCAGCTTCACGGTGAACGGCATGCTGGGTGCCGGCGGGCAGCCGGCTGGGCTGCACCACCACGGCCTGCGGGACGCGCACGATGAGCCACACCATGCCGACCACCACCCCCACCCGCACTCGCACCCGCACCAGCAGCCGCCGCCCCCGCCGCCCCCGCAGGGTCCGCCTGGCCACCCAGGCGCGCACCACGACCCGCACTCGGACGAGGACACGCCGACCTCGGACGACCTGGAGCAGTTCGCCAAGCAGTTCAAGCAGCGGCGGATCAAACTGGGATTTACCCAAGCGGACGTGGGGCTGGCTCTGGGCACTCTGTATGGCAACGTGTTCTCGCAGACCACCATCTGTAGGTTTGAGGCCCTGCAGCTGAGCTTCAAGAATATGTGCAAGCTGAAGCCTTTGTTGAACAAGTGGTTGGAGGAGGCGGACTCGTCCTCGGGCAGCCCCACGAGCATAGACAAGATCGCAGCGCAAGGGCGCAAGCGGAAAAAGCGGACCTCCATCGAGGTGAGCGTCAAGGGGGCTCTGGAGAGCCATTTCCTCAAATGCCCCAAGCCCTCGGCCCAGGAGATCACCTCCCTCGCGGACAGCTTACAGCTGGAGAAGGAGGTGGTGAGAGTTTGGTTTTGTAACAGGAGACAGAAAGAGAAAAGGATGACCCCTCCCGGAGGGACTCTGCCGGGCGCCGAGGATGTGTACGGGGGGAGTAGGGACACGCCACCACACCACGGGGTGCAGACGCCCGTCCAGTGAACTCGAGCGGGGGGAGGGGCAGAGCGCGGGGCTCCCCCTCCCCTTCGGTCCTTGGCCCTTTCCCGGCCCTCTTGTTCCCTCTCTAACTTCTGATTGTTCTTTTATTTTTAATTATTATTTCCCCGTCCCTTAAAAAGAAAAAAAAAATAAGGAAAAAGGAAAGCAACTAAGACACTGGACTATCCTTTAAAGGTAGCAGGTGTAATGATGTGTTTTGACCTTTGCAGACGAGTAACCAGGCAATGGAGTGGAGTGTCTCCTGGAGAGAGTGAGGAGAGTGTGTGATAGATAGAAAGAGAGAGAGAGATAGAGAGATGGCAAGCACTGAGATAAATACCTGGCAAAACTAAATAAATTACCAAAAAGGAAAAAAATATCCACCAAACCATG
ATAAACACAAGACGCAGCTTCCTGATGCTTGGAGTTGGCACATGCTGCTGTGTTTATTTGATGTGGATTCCCATCAGGAAAGAGGAAAAAATACACACGTTCTTTGATATAGGCAAAATTTAACCACATAAATTTGCACTGCAAGAAAATTGAAGTTTACATGAACAAATTCATGAACATATTTTCTCTTTCTCCCCACCGTTAATTTGGGAATTGCCGTTTTGGGGGATTTTGTTTTGCTTTGCTTTATTCATCGGAGAGAGTTGAAGCCAGCTCTTGGCCTCTCTCCATTTCTAATGTTCTTGTGTTGCCCCTTATTCGTACTGTTTGTGAACTTTGGTTACCTTCAGATTCCCCTTACAAGGGTGTAACATCTATTTGTTCCTCTTACCAAAGCAAAACGATTGGCTTCATACAAAATAGACAATTCTCTGCTTTCAGGAAATGTGCGTGGTCTACCCGCTTTATCCAAGGCAAGAATCCAGTTTGCAATATAAAAATAAGCATTGGTTGTTGTTACGAGCCACAAAGTAAACTTCATTTTCAGGCAGTGTTTCTGGGGGAGGTTATGGAGGGAAGAAAAAGAAAAATCGATAGTGAGTGACTGATTGCTTCATTTTATCAGGCGGGCCCATTGTGAAAGAGCTCAGAGGAAATGTGGAGGTTAAATATATTTCCAGAGTTGTCCAGCAGAAAGAAAGTGGCACTTTGAAGAGAACTAGGGAAGTATATATCTTCAGATATCCCTATATAGTTCTCTACCTTCAGTTTTAGTAACAATTATGAAGAATTCTTTATGCTGACAGCAGCAGTTAAACTTTGTTTCTCTAATAAGCTTTTTTTTTTTTTAACATAAAAAAGGACCCACGAACTTAATAGTGTATGCATAAGGCTGTGTTTTTTAGCACATAAATACCCACAGCATACACAGACGATCTCCACGCAGTAGACAGGTTTTGTCTTCACTAGCTCATTTGTTTATCAAGTCATATTTAGGGTCCCACGCCCTCTTTTCCTGTAATTTATTGCAGAATATACCACTTTGACTTGGACAGCTTTCTCCCCCCTCTTTCACTAAGGAAGGCAAATGAAGGGGGAAAAAAATGCCATTTTCAATCCTTCCTTTCTCCCCTTTGTTAATAGTTTTAAGTGCATTTTTGACCTTATCTTGATGGAAAACGGTTAACTCCAAACACAAAAGACTCTACTGGAAAGTGTAGGTGAAAAAACTTGTAACTGTATTGAAAATAAATACCATTAAACTGTGATCAGTTAAAATTTAAAAGAAAAATCAGCACAAAAGGGCGCTAAAAGGGAAAACACTTTTTATTAATCTTAAAAGTTTGGGGTTTTTTTTTCCAGTTAGGTATTAGATAAATTTTTATTTTAAAAAATGAAAGTCTCACTACCATAAAATTATGGTTCAGCATCAGATTAGCATTGCACTCATTAGTCTTTAAGGTTTTAGGAAATATGCTTTATATTGTCTTTTCAAACACCTGTGATTGTTTCATTTTCAATGTTTTTGCAAGATAAATGGTGACTTATAATGGGCATATTTATTTGCCTGTATTTCATTTCCCCCAATGAATGTCACAAGGAGATGGGCACGGAGCTGCTTCGGGTACATCACGCTGCTCGTTCCTGAGGTATGGGGACTGGCCTTTAGTGAAGCTATCCAGAGCAGGGCAAATAGCCACTGGTGAAGGGAGGAAATGAATTTTCAGATACTTATTACCAAGTAGGTAAGGTCAGAAGCTGGAGTTCAGAGGATGTATCTACAGCTTCTCTGACTCTTATAGGTTTACTAAGATGAAAGTTACCACTGAACCTTACCACTATGTATATATGTTTAATATCTGTCTTTTGAAATGCAGAAATAGTTTAAATGTTTCTTTGTCTATTTTTCTTTTTTTTAATGCTACCCAGGGAAATATTTTCATATCATTTTTAAGTGGCCTGCCTCAATGTATATTTATTTCTTTTGAAGCAAAAAGGTT
CTGGAAACTGTTTTTCTGTAGCTTTAAATGAATAGGTGAGCAAAATCTATATGGGATGTAATTTTTTTGTTCAGTCTCTTAAAAAATACTTTGTTTTTGGTACATTTGGTTGTGCTTGTGGGGAAAATAAAAACGCAGAGATCCTTATATATTTATGTTAAAGTAATATTTTATTATCTACATAAAACAGAAATGCACAATACCTTCATAGTTTGTTCTAATTATTGAAATATCTTTATTTTATTTTTAAAGATAGTGCCATCAAGTTTTAAGGGGGGAAAACCCTAGACCTTAAATTGACTGAGTTGAGTTGTGTGTAAAACACTTCCCTTCCTTTATACTTCATAAAGTTTTGGAATAAATTTTATGCATATACCGCCAGATTTCATGTTCATAACTTTCAGAGGCTTTTTTTTTTTAAATGGAGACTACTGGTCTAATTCACTTTTCTTTGCAAAAACTATTAGTCCCAAATCTTTCAGCCACTATGCCTGTAGCATTAAATAGAAATGGTCATTGGGTTTGAGCTTCAATTTGTTGAGATGTTTGTCCCCTTTAAATATGTGCAGATATGCCTGCATCTTCTTTCCAGGTTAACTGTACTTTATTCAATTGTGCAGTTTTGGAGAACATCAGTGGAACTAGGTGGACTTTAATCTCTACCCACAGGTCCTCATATAATTTGGGATCTACAGAAAGGCAGGATTTAGGAGATTATTATTTTTAATAATTTACAAGTATCTCTTAACAAAGAATAACCCTGATAGTATGCTATTGTATGTTTACTAAATAATTAGAAGTAGATCCTATACATTATTCCTGTTTGGTTTGCATAAAAAGATGAATTTTACAATGGTTT\n>XM_053552187.1 PREDICTED: Mercenaria mercenaria high affinity cGMP-specific 3',5'-cyclic phosphodiesterase 9A-like (LOC123560979), transcript variant X1, mRNA 
\nGACAGAACGCCAGAAGAGTGTTTCCTAATGCGCATGCGTGTGGTTGCGTGAGAAACGTATGTGTTGTGGAAACGCCACTTTCTCTTAGATTCGCCAGCGCGCTTTAAAGTGGACGACATTAACTTGTGATTTTTTGTGTGTCTGAGATTGACAGTGTTTGGGTTTCAGCTAAGTGCGTCTACATTTATATGAATCCAAACAGATATCAGACATTTTATCGATCAAGCTTTTGTAGCCATCGCTGTTGTCTGACTATTTATATCTTCTCGAGCGCTGATAAAACTGAGGATGCAAAAGTTTTGTTTGCTTATTAATATATCGTAATTTCATTCAGTCATTGTACAATGTGGACTTCATAGTGCTTTCTTTGGAGTGGTTAGACGAGAACTAAGATGGGAAACGCTTCGTCAATAGATTCGTCTGTGGTCGTTTATCTAGAAGTTAGTGGAAAACAAGAAAAGATTGTATTCAGCAAACACTGTAGTTCCAGGGATATACATGACCTCGTGGCACAAGCAGCCGGATGTAGCAAGTATTGTATATTGACCCTTAAAGATCCAAATGGTGCCCATATTTCCATGTCTCCCACGATGCCAAGCAACACGCCCAGTGCGCCTTACAAGGTTCAAGTATCACAACCTACGTCAAATCAAGGCGATAGTGAGGTGCTTACACAACTTATGACGCATGTGGCAGATCAGTTCAACAAAGCTTTCAAAGTGGAGGAAATGAGATCGGAAATTTCAACCAGACTTACAGCACTGGAAAGGAAACTGGAAATGGAGGGACTGAAAGCTGTTGAAATTGAAAAGTGCAAAAAGGACATTTCGGAAATCAAGGATCAGATCTGGACAGCACAAAAGAAGTTTGTGGACTTCAACAGAATGAGACCCTTATTGTACGGTAGTAACACTCACGATCATTTTTATAGTTCGCTGAGTGATGAACGGAAGATCTGCCTTAAAAGGGATATTCCCTCATATCCGAAGTATACTTTGTCTCAGGAAACGATAGATTACTTAAAGCAGCCAACATTTGATATTTGGCATTGGGAACCAAATGAGATGTTGAGTCTACTAGAACATATGTACCACGAGCTTGGCCTTGTGAAGGAATTCAGTATCAATCCGATTACACTGAAAAGATGGCTGCTATGTGTCCAAGAAAATTACCGGAACAATCCGTTTCATAACTTCCGTCATTGCTTCTGTGTCACACAAATGATGTATGGGATGATTCATTTATGCAAACTCTGGGATTACATGACGAGGGAGGAAATCGGGATACTCCTGACAGCAAGCGTTTGTCATGATTTAGACCATCCTGGATACAATAATACCTACCAGATAAACGCACGGACGGAGCTTGCTATTCGGTATAATGACATATCACCCCTAGAAAATCACCACTGTGCTGTGTCTTTTCAAATTCTGTGTAATCCGGAGACAAACATTTTTGCTAACTTAGACAAGGACGGCTTCAAACGTGTGCGAGCAGGTATAACACAACTTATATTAGCAACAGATATGGCAAGACATAGTGAAATCATAGAGTCGTTCAAATCTAAACTGGAAGGCAAATTTGACTTCAAGAGCAAAGAACAGCTAGACACTTTGAAGATGGTTTTAATCAAATGTTGTGATATATCAAATGAGGTCCGTCCTATGGAAGTTTCTGAGCCTTGGGTAGACTGCCTGTTAGAGGAATACTTTAATCAGTCTGATCGTGAAAAAATGGAAGGATTACCAGTGGCGCCTTTTATGGACAGAGATAAAGTAACTAAACCAACAGCACAGATAGGTTTCATCAAATTTGTTCTCATACCAATGTTTGAAACAGTCTCAAAGCTGTTTCCGCAGATAGATGAGACAATGGTACAGCCATTAAGATTAGCACGTGATAGATATGAAGGAATGAAGGAGCAGACAACTCCTCCTAATCCAAAATCTCAAAAAGATCAGGCTGCGAAGAAAGACGGAGAGTGATGCCGTGTTGTAT
ATATATACTGGCACCTGTTGCTAAGTTAACATATCATCTCTGTGTTAAAATGTTACGAAGACCTGTAAAATAGACTCTAGTAGAATAATATCTTAACATTGTGGAAAACTATGTTTGTAGGATTTGAAAGCTTTGATAACATTATAACGGTTGCATATATTCAGGTCAAGTTTACAGGCAACAACAAAAATGTTGGGCCTTTCTCATGAAAAAAAATCTGGTGAAAAAGAAAATACTGGGTGAGTTTTGAAAAAAAAAGACTTACTCTTAAAGTGATATTGTTTTACATAAACAAACATCGAATTAAGGGTAACTTATCGTGTTGATGTATTTAATTCCTGTACATGTATGTGATTACATTGTTCAGTGTCTTGGTAAGGACTTTTAATGTTCAAATTTAAACAGCAAATTGCGTTATGTAGCAATGAGCTTGAAAGTATTTGTTCATACAGTTCAGACAGATACGGAGCTAGTGCTTGGTGACAATAGCTTTAATATAATGTTATTATTTGTGCATACAGTTTAGATAGACAAGGTGGCAATAGTTTGAACAGCATGTATGTACAGTTATAACTCGCTGTCTCGAATTCCAAGGGATCGAGCGTTTTAGCTCGAGATAACCGAAATACGACTTAAAATGATATTTTATACACGCGTTTTACCTCGAGATAACCGAAATACGATTTAAAAGGATATTTGATACACGCGTTTTACCTCGAGATAACCGAAATACAACTTAAAATGATATTTGAAACATGCGTTTTACCTCGAGATAACAGAAATACGACTTAAAATGATATTTTGTACACGCGTTTTACCTCGAGATAACCGGAATACGACTTAAAATGATATTTTGTACACGCGTTTTACCTCGAGATAACCGAAATACGACTCAAAATGATATTTTGCACACGCGTTTTACCTCGAGATAACCGGGATACGACTCAAAATGATATTTTGTACACGCGTTTTACCTCGAGATAACCGAAATACGACTCAAAATGATATTTTATACGGTGACAATAGGTTAAATGTTGTGGACCCGTAATGACATTCGGCAATTTCCGTACGATTACGAAACTTGTATGCTAGTTCGGCACCTTACGGCTGTAACATCAAATTGCTTTTTTCATAATCAAATCCTTGAGACGTCTGGTGGTGGTTGATTTTTAGCAGATTTACTTTCTGTTTTCTTGCAACTATTATGCACCTCAACAGCTAAAATAAAACGGAGAATACCTGAATTTACATTTTCTGTATTACAAATATCATGTCACCTGTACACAAACTAATTTTATACAACAAAAACAGGAAACAAAGAACATTTTTATGCAAATCATTTTCATTACATTTACTTATAAATATCTCACTTATTAGTAATATACTTTTGATCTATTTCTGACACTCTATTTTGTAACAAAACAAATATCCAACTATTAAAATACTTGTATAGGAAACGAACATAAACGTGCTTCGAATCTAAGATGAATTCTACGTGACCTCACATGAATCCAGAATTAACCCGCTTGAATTCAGTGATGTAACCATAGGCTTGAAAACCTTATCATCAATAGATCTTGTATAATCTAGCCGGTCAATGTGAATGGAGACAGGTTAAATTAGACTGCTTGATCATTGATAGTTCATCCGCAATATTCATGAATGGAACTATTTGGTGTAGCGCACGAACATCTTTTTGATGTGATTAGGAATGAAATAAAGATCCTGTGATTGTCAGAAATACACTTATAACTTTGATAGCGGGTAAACCCGCCCCACCCCACAAAAAACGGAGAAAGTCGAAAGTGCTTACGGAAAATACGTAAACGAACTGAAAATGCGATTGTCGTTACGGGTCCACGAAAAAGTAAGAACAGAATCGCTTGCAGCAATGAGTGCAGCAAACGCAACACACGCGGATTACATAAGAATGGACACTGTAGTAAAATTGCAACAGAAGTTTATGTATTTGTATTTACAGTATACAAGGTTCTTAGAGT
TTGTTATTGCGTTTGAGTATAATGTAAGTTTTATATCTGCAGTTTAGAAAAAATGAAGTTTTACATTAGAAATCAAGGAAATGTTGTAGATCTATACTAGAAAATATTCACTGAGTATAGCGATAAGCATTTTACTAACATTTGCCTATAAATCGTTTGGTTATACCAAACTTCTCAATGAAACAATACATTACAGTTTCTTCAATCTCTCTCTTTAGTTATTATACAATATGTATTAATAGCGGAAACGTGATATTTTTATATTATTTTTTTTTTACATTTGAGACGCTTTTTAAAAAAAAAATATGTCACAGAGATAATGGTATACGAGCTTTTCTGTTCAAAAAAGCATGTGTTGCAATTACAAAAATTGTGTCACTGTTCACTATACATATTTAATTTCATTAAGGTGTCGGCTATATCAAAAATATTTTTACAGCGTAGGGAGTTCTTAAAATGTTTTATGTGACATTTTTACGAACACACATTATTGATCAATAGCGAGATTTATTTCAAGATTTCATAATAAAAAAACATAATGATAATAAAAAAATATATTTGGGGAAATGTTTTATGATAAATGGCACTGTATATGTTGAACTTACTTGTGTAACAGTTGTTTGATCTGTCGGTTATTTGTTCTGAAATATTGTCTTGCGTCGAAATGTGAATAAACAACGGTTTCTTCATA\n>XM_050728021.1 PREDICTED: Bombus affinis sodium-dependent transporter bedraggled (LOC126919204), transcript variant X1, mRNA \nTTTTATTGTTTAATAAATAATTGATTAAATAACAAAAATTTACAAGAAGAAGTGAAATCGTTTATCAACGTTTGCAATGTTATATCTTTTGAGAACAGCTATACTGAAAATACTAAGATCTTAATTTTGTGATCCTTTGTGAAAATTTACATAAAATTTACAAGATATGAAAAATATTCAATATTTTACTTTACAAGACTTCAATCATAATTATTTTTAAACTTGATTTATTAAATTATATGTATTTAGTATTTAGTAAATAAAAAAATAGAAAAACAACAAATATGATAAAAAAAACGTTACGTGCTAAATCTTAAAATCATGTAGCTGTTTTTATGAATATGTAGTTGGCCTTCAAACATTGATAGCTATTACACGTTGTTTGTATGTAATAGAGGATATCATTAGTGTACTAGCTTAACCATATTTATAAGAAAAATGAAACTACTCTTACACAAACGACAAAACGAGTAGATCATTTGTCATCATTTTGTCAGTTTATTTATTTTTTATTATTAACTATTGATTGTACACTTTATTATTGATATTTTATCGAGGAGAATCAAATAAATATTGTACAACAAGTATTACAGGCTATATAGATGTATCTATATATAAAAGCAAGTATCACACAAACACACACATAGAAGAACATATTAATTATATGTTTCATGTAAAATAAAATTTCTTCATAGAAAAATAATATTGTGCAAGTACGTGAATAAGGAAAATGAATTAGATTATTTGGCTATAGTATTGTTTTTAGGATATTGATTAGTTTGAAACTCTATAAAAGCATTCTGAAGTTGTTGTCCTGGTTCATGATTCACGAATGAGTTATATAGAGCCGTAGCCAGCTGAGAAGGTCCGGTTACTGGTTACCTGTTACCTGGACAAGTGTGCTGGCAACGGGCTTGTCCTAAAGTATCGACCGTGACAGTCGTTCCAGTCGATTCCAGTCACAGCTTTTAGATCGATAGTTTTCCGACAATATCGATCGATAGCTTCCTTTTGACTTTTCCAATCATGCATCCATTATTAAAATATATAGAAGTGTAAAAATTGTTAAAAACGTTAAAAAGTACAAAAATTGTTACAATTTATTCTTTCTGTTACTAGTATTTCTCTACGAGTTTTGTAAAGGGACATTCGTCGTTCGGAAGAGTAATATTGCAGAAA
TGTTTCTGTGTTCTTCCCTTCCCGAGTACTAAAGGACATGAATCAATTAATGAATGAATCATATTTTTTACCAACTCTGATATGATGTACGTAATCAAATTTTTAATTTATATCGGTTATCAATTCTTACTTACTTCTTCACCTACTAGGTAATATCAGATAATAATTTGAACTATTATCAGTTGACAATAGATGCTAATGGATGATAATTGATACGACAATCGAATCGTTTTAGATGAAATGTTACTAAATAATAATAAAACTTAATGAATTTGTGTCAATAATACTTTTGATTGATATTGTATGCGTATTTTGGTAGGTATGAGGAATGATTCATATGTTTATTTCTCCATTTTTATCACAATCACGTTAGTATTGTGGTAGTAGGATTAGTTTATAAATAATCGGAGTTCGCAAATTGTCTTTAGCATTACATCGTTAATGATTCCTAATAATATAACACCGTGGTTGAAGCTGCAACTTATTTTCCTTAACGACCCGGCATTCATACGTGTTTCTTTATACCGTAAGGTTAAACATCCATTTCAATCAGTTATTGTTTTAAATCATGTCAGCTATATGGATATTTCATAACGTTGTTCAATATTTCCAAAATAGTGAGTCTGTCGTAGCATGTTCTACGGTTTACACAAAGAACTAAAGAAAGTAATTTGTGTGATAAATTTCTACGTGAAAGAGCGGTTTTAGAATCAGTTTTCACCGCATCGAGATAAGATGACGATATATATGTACTTAGTTTCCAAGTGAAGCGAACGTAGGAGAGGTTTAGACATTTCAAACGAAAAAGTATCGGTCTACTTTGTTCAAGGGATTAAGTTAGCCTGATCGTAGAAATTTAAACATTTAAAACAATGCATAGGATTGTTACCCTACTACAGATAAACGTTCATTTTCTCGTTGCAGTAGTTAACCATTACAGAATGACTTCGAGCGAAGATGGTGATTTGATCGATCTTGGAAACGATAGTTGTGTACCACGAGTATCGATTCAAGAATCATCGCCTGACGAGCAAGAACATCTTCTCGATGTGTGCCTACCGAAGTTAGAACAAGCATTGTCATTAACCAGGAAGCAAGAACAAGTACAATGCATAAATGACAACGGTGATGTATTAGTCACGTTAGGTCACGATCAAGTGGTACCGATTCGTAAAAGAATCGATGTCGTTTCATCCGATACGATAAAAAGGGTTCGTGACATTACCAGGAACTTAGAACCAGTTATAAGAAAGACTTGTTCCGACATTAATGAGGAGCATCAAGACACGGTTGATTATGGAAGTTCATCGGATAACAAAGACGGACATTATTCTAGTGAAAAGCTCGAAGACGATACGTTCGAGGCACAGGAGATCAATGATGCTTTCAATTTTCTCACAGAACACGATGACAACGATGATCCAGCCGAAGCGAAATGTAACCGTTATGACCAAGTTATAAATTCACATGGACTGATCCTATTAACCTCTCGTACCATAAAAAACGAAGATTTATTGAATTACCATGGTAAAAGTGCTTCACAAGCGCTAAACTGCTGGAAAGCAGACACAGATTTAAATGATTCAGGTTTTGAATTATGTTCGGGCAACCCGTCTGAAAGTATTTCGAGGAAACCTAGATCTGATCCTGTTGATTATGAACTTGGAGCGAGTAGCATTAATGTGGTTGAAAATCATTCCGAAGAACAAACGTTTGTACGAACAGCTAAAAGAAGATCATTTCAGCATATACATCGTAAATCTTGGACGGAAGGAACTACACTCAAAAATGCAACACAGGATACATTCTCTCGGTTCGATAGGTCAACTAGTTTAAGAGGATATAATTACGCGTCATCAACTTCCAATGGCATTCATCGGCAATCCAGTTTTATTTCGAGTTGTTCAACGGAGGAAGGATTGGAAACGAATGGAGAGGATCAAGAGGACGGATGTTCAGAATGTTCGGAAGTAGATTGGTCGTGGTTAGAGGAAGTAGAA
TGTCCGCGGGCTACGGAGTCGTTAGCACCCGGTGTGGTTGACGCGGTTCAGGAGAACCCCGAAGGAGGGAATGTATCCCCCACCAGTGAAAACGCAAGACGCAGGCGCGGTCGCGAGCATCGTGCTACCGAGGCGGGCTGCAGTGCCGCGATGTCTGTCTCCGGGACAGTAAAGTCCCTAGTGGTCGGTGGTTCGCGATGGTTAACTTCCGATCCGCCGTCCGACTGTAACGGCAATAATCAAGATGAAAATATACGTTGCAACGCGAGCAACGAAACCATCGATCGCGAAACACGTGACAATCCTACGCTTGTCAATTCTTGGGTACGGGCTTCGATGAGACGTTTGCGTCACCTGAGATTACCGGAAGAAACTGAACGACAACGAAACATTGATTTGAATAGTTGCCACGGAACTGTCGTATCCGCGCCAAATTCTTTGCCAGATATCGCTTTAATCGCTCCAGAGATATTAGCTGCCCAAACAAACGGTACTTCCGGCACCCTCCTTAGGCCATCCAGCGCTCCTGTAAGAAACTCGAATAATTCAAATGTAGTGCCATCGCGGAGAGGCGGAAGACAATTTAGAGCAAGTCGATCGCAAAGAACGCGAAGTCGCGACATTACTTCCAGGCAAAGCAGCGTTTTATCGTCGACTACGGGCAGTGATACAACTGCTTCAGGAATCACGACATGCTCCAGCTCTTTTGGCGGTGTTTCTACGAGTCCACCTTCTAGCACGGCGACAAGTCCGCAACGCATCGCTTCCAGACGAATATGTGACAGACAGAGAGACGTTGATAGAGATGAGGATAGAGGAGAGGATGAGGATGAGGATGCTAATCCATTGGGAAAATGGCCACATGCTCTTAGTCCAGCCTTGGCGTGTCTTAGTTGCACCCTTGGTCTTTTTAATATAAGTAGATTTTCTATTCTTAGTGTACAATTCGGAGCAAATTTCATTGTACAGTTCCTGATTTTATCTTTGGTATTGGGTATTCCACTTTTGACGTTGCACGTGTGTCTCGGTCAAAGATTGGCGGCTGGATCCGTGGATATGTGGAAGATTTCACCCCTCTTTCAGGGCGTTGGTATAGCTCTCCTAATTGCACAAGCATTCATCGGTATCTACAGTATCGTTGGTGTATCCTGGATGTTCGTCTACTTTAGAGATTCGTTTATAACGAAGCAGGATAAGTACCGATGGGCAGAACCGTTTTCCTTGTACAGAGAAGATAAACCTACACAGAATAATAGTAATTTGCATAAATTATATGAGACAGTACCAGATTATTTTAGCGGAGTTGTCTTGCAAAGAAATCATTTAAATGAATCAGATCCCGGTATCGTAACGTTAAAGTTTCAAGTGGCTTTCAATTTAGCTGTTGTATGGATGATCGTGTTCGTATCATTAAGCAAAGGTTTGAGATCTTATGGCAAAGTAGTATATGTTTTTACGTTGGTGCCTGTATTTGGTACACTAGTTCTTTGTACGAAATTACTTGGCCTCACGCCACCAGGCTCTGTACATCAACTTTTTCCTGCCACTGTGTGGACTGAGTTTTTCATTAATGGCAAATCGTGGGTAGCAGCATCCATCGAGGTTTTCCTCACTTGGGGATTACTTGGTGCAGCTGCTATGCAGATAGCTGCTCATAATAAGCACAAACATCTATTACAACGAGACACGAGTCTAGTAATCGTGTTAACCCTCGCAGTTCTACTTCTCGCAGCTTTTCTGGCAAATACTTGCGTGCAAGTTTTGCGACATCATGGATATATTTACATACCTAGCTCATTTGAAAGAATATCATCGTATATGTTTATGCGACCTGTGAACCAGCCGGCACCACCGGGATATAGCAGTACACCAGAAAGATTTATGGCACATGCGTCGTTTATTGTTGGAGAACGTGTAACTCGACCCGGTGCAGACTTTAGTGTTGAATCTGGTTATCAAGCCTTGAGATTTTCGACTGAATTGGTTCCTGCAACGTTAGC
GTTACTAGGCACTGAACAAGTGTCACCATTCTGGGCAGTTCTTTTCTATTTTATTCTTATCCTATTTGGAATAGCTCAACAGCTAGCAATATGGCATTGTGTAATAACTGGTATTATGGCAATTAATGCAAAAATGATGAAGTTATGGGAAACTACTATTACATTCTTCAGTTGTGCTTGTGCTTATATACTAGGCTTACCCATGGCTACCGAGTTGGGCATACACGTCGTATATTATCTAGACTACACAATTGGTGGTACGTGGTGGATAATGATCTTATACTTGGTGCAAGTTGGTGCTGTATTCGCAGTGCGCGGACGTCCACATAGTGGTGAAGCGGTAGTAGCCGAATTGTTTCCTCCAACTGGTCGATGTCTCAGACACTGGGCTGGTCCTCTTCTTTCATTCACGTGGAACGTTATACTGCCTGTTATTCTTATGGTACTTAGCATTACGGTATTTAAAAATGCTGGATTTCGAGAACTTTATTCTTACCGACGTACCGCTAGAGAGTACTGGACAGTTTGGGCAAAACAACTCGGAGCTACGATTCAATTAGTACCAATATTGACGATACCGGCAGTGGCGATTATACAAACATGTCGATACTTGAACAACGGTCCACCCGATATTTTTGATAACAATCAAGTGGAAGTTAATATAAATCACTGCGAACAATGTAATGGTAGAATTCAATTATTGTATCGACCATCTTTGGAGCCTGATGACCCACGAGATGCACAAACACATACTGGAAACGATATGAGTACCAGCATTCACGGCAATGGTATCGTACATACAACGACAGAAGTACCATTTGAAGATCCACCACCAAAATATACACCTCCTCCGAGTTACACTACAGCAACGGGAGCGAGAATAGCAAAGATGTTGCGGCAAAGTTTTCGAAGAAGTGTTCGTCGAATAGCGAATGTGCTCGGTGAGAGCAGTACTCCGAGACAGAGACCGGCGCTACAACCTCCACCTCCTGATTACGCCACTGTACTTGTAGAAATGAATCAAAGTAGGCAAACCCCAGATGTAACAATTCATATAACTGAAGCAAGAAACGAAAACATCAATTCAAACACTCAAAGTAATGCTACCGAAAGACATAGACCTAATACGATAGATAGATCAACAAGAATTGGTGTGGTAGAACGCTCGATAGAAAGAACGCATTCGACGCTCGAAAGACCTCGTCGACCTTGTATGACTTCATCGAGCAGTTCGAATTTAACTGCAGCCGATGTGGCTAATTTACTTCGTAGTAGCATTAGGAGAGGGACTTCGCGAACTCAACAGTCCCTGCGTAGGAGTTTCTGCCACGACGAATCAACGGTAGCAGCGTCCGTTGAAAATCTAGTCGAGGCTGCAGCGCCGATAGGTGAAGAATCCTTGGTCCTTCCAAAGGACGTGTCTCTAGTCTCTAATGAACAGGCTAACAATAATAGCGACGATAAAAAGACTGCCGAAGAAACGGATGATTCCGTTTCTGTGATATAGACTATATCTTTCTTTTGAGCATATAAGAAGAATAATCTGATGGTTATTTAATTTCTGCTGCATAGTGTTACGGTGATTTATTCCTTGTTTAACTTGTATTCAATATTCATTTTCACAAGCTATTCTACGAAAGATAAACAAGTTGCTGATGATTTCATCGATCAATGATCGAAAAAATAATTTTATCTCTCAGACTGAATTCAGTATTTTCTAATCTTGTCACACTTGACAAATAAGTGCATAATCTCATCACTTTAATTACCGTGACAATTGTATAACGCGCAAATGAAAATTGGATAGCTATAAGCAGTGAAACATATAATAAACTCCTTTTCTTACTTACTACGATAGACATCGATTTTATATTGTATATGTTGAACTTTATTGAGGTTCAATTTGCTTTCAATCAGTCTATTTTAGCATTTTGGCATTTTCAATCGAGACTGTGTAACTAAAATATTTATGTAATATATACTACTGTAACATTTTAGTA
GTTTTATGATATTAGTGTACATACTATTTTAACGAATCATAAATTCGCTTATTAAGCATTTTCTTCATTAA\n>XM_027781123.1 PREDICTED: Falco peregrinus polycystin 1, transient receptor potential channel interacting (PKD1), mRNA \nATGAATATTTTTGTCAAAGGATACATCAAACTTAGTAATACATTTGTCATGTCTGTAATTACTCTAGATACACTGCAGAATGTTGAACGAAAACTGAAAATTGTGTTTTCTTTCTCTAGGGATCTTTCCAATAACAAGATCAGTGGTTTAGATGTTCAGATATTCAAAAGCCTGACTTCTCTGGCAAAACTAGATATAAGCCACAACAAGATTTCTACATTAGAAGATGGAATATTTGATAATTTATTTAATTTAAGTGAAATAAACTTAAGTTGGAATCCATTTGTTTGTGACTGCAAACTTTCCTGGTTGCCCCATTGGGTGGAAGACAGACAAGTGAAAGTTATTCAGGCATCAGATACGAGATGCGCCCACCCCCCTGAGGTGGCAAACCTTTCCCTCTTTGATGTCTTGTTCGTCAATGCTACTTGCGGAGCTCAATACATAACGTGTCTGACAAGCAACCACACAGAAGGGACTGAATTTGTCATCCTCTTCACATCTGTTCACCCTGGGAACCTCACTGAGGAGACTTGCAGTGCCCTCTGTTATGCTGAAGATCAGGAATATGGAGGTTTCAGCACCCAGGAGCAGTGTTTGTGTGGTACTGCCCATGAAACAAACTCTTCCTACGGTTGTTTGCCATTTTGCACTGAGCATTTGTCCGGGCAGGCCTGTGGTGGCCCATCACTCGTCCCCTCTCCCTTCCAGGCACAGCTATCTGTGTCTTTCACAGGACTCCAGCCCCGGTACAGCCTACGCCAGGCCGTGCTCTTCAATGTCAGTATTCCCATTGCTGTCAGCACTTTACTGTGGGAATTTGGGGACCAGACAGAGGTTCTCAACACCACTGGAAATACAGCTGTCCACATGTATGCCTTACCTGGCCAGTACAATGTCACTGCCACCATCTCTGTGGGCACCAAGGTCTTATACGTGCAGGCAGAAATTGAGGTGGTGGCTTCACCCCAACAGTTAGAACTGCAGTGTCCTTCCTTGGTCAAGACTAATGAGAGCCTGGACATACGGATCCGCAACAGAGGTGGCACAGGCCTTGCAGTGTCGTACAGTATCACCGCAGAGGCTGGGGAGCTGGGCAGAGCCGTTCACCCCCTGTGTCCCCCTGATGGCTTGGTTTTCCCGGGCAATAACCACTGCTATCAGCTGGTGGTGGAGAAGGCTGAGTGGCTGGAGGCCCAGCAGCACTGCCAGGAGCATGGCAATGGAGAGCTGGCTTTTGTGAGCAGCCCTGAGATCCAGAGCTTCTTGGTTGCTCATGTCATCAGGAGCCTCGATGTCTGGATTGGGTTCAATGATTTTGCAAGCACTGGAGCACAGCAAAGAGGTGAAGGATTTAACCTGGAGAGCTGTCAGAACTGGCTGCCAGGAGAACCACATCCATCAAATGCTGACCACTGTGTCCGGATGGGCCCAACAGGCCAGTGTAACACAGACCTGTGCATGGCCAAGCATAGCTACGTCTGCGAGTACAAGCCAAAAGGAGTTCTCTTAAATGCCAAAAACTTCTTTGTGGGAGACCCTGTGTCAGACACACATGAGGCTGTGAAAAATGTGACAGAAGATGCGCTGTCAGCTCCATGGCAAGCTGTGGAGGTGATGGTGTTCCCTGAGCTGGCATTCAGGCACGAGGGATATTTGACTGCCCTGGAGTTTGTAACACAGGAACTGCATCAGCCCGTTCAAGTGAGGTTCCAGGTGCATAGACCGATAGATGGAGAAGACTACCAGGAGGAAAAAAATGCTACAGAACCATTCTACACTTCTCAGGATGATGGGAACTGGAC
ACTATTTGAATGTCCTCCTGGTTTCCAGTGGTGTCATTTGACTAATTTGTGCTCATCGCTAAACAACTGCTGCAACGCAACTGAGTGTGCCAACAGTTCTCTTGCCAGCAGCTCTACCCCCGTTTCCCTTCAGCACAGTGAAAGCCAGCTCAGCTATGAACTCATCGAGGAGTTTCTCTTTACAATACCAGCTGGCCCTTCTTCCCGGTATCTGGTCACGTTCAGAAAAGAAAATATATTTGTCAGGTCTGAGGATGTCTTCAGTATCCAGCACAATGCAGGCTTGGGCTTACTCCTCCAGTGCCAACCAAGTACCACATCCCCTTACAGAACCAACGTCTTAAGCATAAACTCTTCGGAGTCGGCACTTGGCTTGTCTGACGGCTTCATCGGTGCCACCTGGATGAACAACACTGTTTGTTCTCTCCGAGTTTGGTACGCTGAGGAGCAGCTGGTCCCGGTGATCAGCTCCCACAACACGGGGCTGGAGCATCCAGGTCGCTACACGGTCAGAGCCAGCGTGGACAACGGGGTCTTCAGCACCAATCTGTCCTGCAGTTTCTGGGTGGCTTCCCAGGTGTCAGGCCTGCGTGTCATCCACCCCGCTCCTCAGGGCGGCAGGGTCTACCTACCATCCAACCACACTACCCTGGTCATCAAACTCTCCTCAGGGGTGAATGCAACAGCTAGCTGGCTGGGAGACAACCGCACCTTCCCCTTCGAGGGGTCCTGCCCAGCGGCTGTGGCCCTGCTGACAGCAGACTGTGCCAGGGAGACCAATGACACCTGGTTTGCAGTGGTCAGCCTGAGCGGCCTCAGGGAGGGGATGAGCACCCACACGCTGGTTGCAGAGAACACTGTGAGCTCGCAGAACATCACTGTCACAGTGAAAGTGGAGGAGCCTATCCGTGGGCTGCGGGCCACCCCTGACCCTGAGAGCAGAGTCCTGCTAAATACACGAGTGAGCTACATCCCTGTGATGGAAGCTGGGTCAGATGTGACTTTCCGATGGACAGTAGATGATAAGCCATCTTTCACTTTTTACAATGTTGTCTTCAATGTTATCTACCAAAGCCCAGCTGTGTACAAGCTTTCGCTCACCGCCTCCAACCACGTCAGTAACTTTACGGTCAATTACAATGTCACGGTGGAGATGATGAATAAGATGAAGAACCTGACTGTGTTGGGTGTCCTGCCGGTCCTCCCGCAGAACAGCACCGTGGAGCTTACAGCAAGAGTTCAGGTTGATTCAGCTGTGGATGCTCTTTTCCTGTGGGATTTTGGAGATGGTGTCCAGAAGACATACCTGTTCCAACCTCCCTACAACAAGTCTTTCCTTGTTCCTGATCCCAGTGTGCATGAGGTTGTAATTGAGCACAATGTTTCACACGTCTATCAAGACCCAGGAGAGTATGCCTTGGTGGTTGTCGTGTCAAACCAGTTTGAGAACCTCACCCACTTGACCCCAGTTCACATCCACAGTTACCTGACTGATGTGAAGATGGAAGCAGAGGAGGATGTTTTAGTTGTGAACTGTCCGGTCACCTTCAGAGCTGATCCATTGCCATCTCCTTATGGCGTCGTGTACACCTGGGACTTCGGGGATGGGTCCTTGCTGTTCACAGAGAGCCAGTCTACAGTGACATACAGCTACCCCAGAAGAGGGGTGTACAACATCACTGTGACTGCCAACAATACCATAAGCAGCGTGGAGACAGTTGAGCACTACCAAGTGTTTGAAGAGATAACTGGGCTTCATGTTTCTGCAGATGAGGCAGCAGAGCTGGGAGCATCTGTGACCCTTAATGCTTCCGTGCAGACGGGGGACAGCATCACCTGGATATTCGATATGGGGGACGGGACGGTGCTGAGGACTCAAGTGCCAGTGGTAGAACACGTGTATGTAAAGGACATCAACTGCACTGTGAATGTGACAGCTGTGAATCCTGTGAACTCTGTCTCCCAAACTGTGCCCGTTAGGATATTTGTCCTGGAAGTAC
TCAAAATAGAGCCTACTTCTTGCATCCTTGAGCACCCGGACGTGCAGCTGACTGCATATGTGACAGGAAATCCTGATGAATACATCTTTGATTGGACTTTTGGAGATGGCTCGTCCAATGTCACAATCAGTGGGGACCCTGTGGTGATGCACAACTTCACCCGCAGTGGGACATTCCCCCTCTCCCTGACTCTCTCAAGCAGGTTTAACAAGGCTCACTATTTCACCAGCGTCTGTGTGGAGCCAGAGATTGTCAATGTCACACTTCTCCCTTCCAAGCAGTTTGTGAGGCTTGGTGAAGAGAGCAGCTTCCAGGTCAGTGCCGTGCCTCTCTACCAGTACCGCTACCGCTGGGATTTCGGGACCAATGAGTCCACTAGATCGAGTGGGACTGAAGTGACCTACACCTACAAGAACACAGGGGTCTTCCTGGTCACAGTGACTGTCTCCAACAATGTCTCTTTCAACAACGACACAGCGTTTGTGGAAGTCCAGGAACCGGTTGGGGTAGCAAAGATTGAATATAACGGGACAAGTGTTTTGGAGCTGAACCAGATCTACCTGTTCTCTGCCAGCATGAATGGAACCAAAGTGAGTTACTGTTGGGACTTTGGAGATGGCACTACCCAGCCCGGGCAAATCGCTGCCCACTCCTACAACAACACGGGCCATTACACTATTAGTGTGGTGGGCCGGAATGATGTGAGCTTTAATGAGACCGTCATTGATGTCACAGTGAAACGGCGGCTCCAGGGGCTGACCATCAATGCCAGCAGGACAGTGGTGCCGTTAAATGGTTCAGTGAGTTTTGTAGCCACACTTGTAGCTGGCAGTGCCATCCGCTACTCGTGGATCCTCTGTGATCGGTGCACTCCTATCCAAGGCTCGTCCACAATTTCCTACACTTTCCGGTCCGTGGGCACATTCAATGTCATTGTGACAGCAGAGAACAAGATCAGTTCGTTGCAGGACAGCATCTATGTCTACGTCCTGGAACAGATTGAGGGCCTGCAGGTGGCTAGCAGTGACCTGGTAGAGGACATCTATTTCCCAACGAACAAAACACTCCATTTGCAGGCAGTGGTGAGAGAGGGAACAAACATCTCTTACAGCTGGGTAGCCCAAAGGGATGGCAATGCTGTGCAGACCTTCACTGGGAAAACCTTCTCCTTGGTTGTCCTAGAAGCTGGAAACTACACTGTCTATCTGAAAGCCACTAATATGCTGGGATGTGCAACTGCTAACAGGACACTGGAGTTCATTGAAAGCATTGGTCTTTTAAAGCCTTGTGCCTTCCCCAACCCAGTTGCTATTAATGCCTCTGTTAACATAAGTACCACCATAACCAGTGGCACTGGCATCACATACATTTGGTACCTAGAGGATGGCTTCTCTCCTGTTACTTCTGAACCCTTTATTATACACTCCTTCCAAAGCCCTGGAGTGATAGAGGTCATCGTTGAAGCAGAAAACAAGCTGAATTCAACCAATGCAACAATTCCTATCTGTGTAGAGGAGGTCATAGAGGGGCTGAGTATAGGGACTGCAGAACTGGACTGTAGATACGTCTCATCCGGCTCCACAGTGGTCTTTGAGGGGGAGCTGCAGAAAGGGACTGAAGTGACATGGCTTTGGGAGGTGCCAAATGGAACGCTGACTGGCCAGTCTGTGGCAGTCATGTTCCCCACAGCAGGGTTTTATACAGTCTATCTGAATGCATCAAATGACATCAGCTGGGCTCTGGCCAGCAGGAANNNNNNNNNNNNNNNNNNNNNNATCTCAGTGCTGGACAGGATTCAAGGACTGGAAGTTCTTGCTAGCAAGAAGGTGGTGGAGCCAGGGGAACAGGTCACCTTTGTGATCAGGATGTTGTCAGGTACCTCTGTGAGTTACTTGGTGAGCATAAGTGGGGACTACTCTGTGGTGCTCAATGGGTCCAGGTACACGCATGAGTTCACCAAGAGTGGTGATTACTTGGTAACTGTGACAGTGCAGAACCAA
ATCAGCATCGCACATGCCCAAGTGCTCATCTCTGTCCTGGAGGCCATCCGTGATGTCAGGCTCCTGAACTGCTGTGAGGAAGGCATACCCACAGGCACGGAGAAGAGCTTCCATGCCCAGGTGGGGAGTGGCTCCCGTGTGGCATTCTCATGGCAGTTCTCCCTGTGGAAAGAGAAAGGACGATCTGTGGTCACTGTGGCAGGAGAGAGTGTTTCCTACACTCCAGAAGCTGCAGGGCTGCTTGAGATTCACCTCAATGCCTTCAATGACTTGGGAGGTATCAATATCACCAGAACCATCCAAGTCCAAGACCCAATAGTCCAAGTCTCCCTCACTGCCTCCAATGCCTTTGTCAACAGGACAGCACTGTTTGAAGCAGCACTGGTGCCCAGCAGCAGGAGTGTTGAGTTCTTGTGGACCTTTGGGGATGGCTCTTCCACTCAAATGACCAGGGTTGCAGTGGCCAACTATTCTTACGTGAGCCCTGGGGATTACCTGGTGGAGGTGAATGCCACCAATCTCATCAGCTTCTTCATAGCCCACCTCACTGTCACTGTCAAAGTCCTGGAGTGTGAGGAGCCAGAGGTGGAGTTAGCCTTGCCCCCTCAAGTAGTCATGAAGCGGTCCCAGAGGAACTACCTAGAGGCACAGATTGACCTCCGAGGATGCATCAAGTACCAGACAGAGCACCTGTGGGAGATCTACCAAGCACCCAGCTGCATGAACTTGGATGACTCCAGCAGGATCCGTCTGCCAAATGTTGATGTGAACAGGCCCCAGCTAGTTATACCAAAGCTTGCCCTGGAAGTTGGGAATTACTGCTTCATTTTTATTGTCTCCTTTGGAGACACCCCACTGTCCAAAAGCATCTTTGCCAATGTGACTGTGATACCGAGTAAGCTGGTCCCAATCATTGATGGGGGGTCATACCGTGTATGGTCCAACACTCAGGACTTAATCTTGGATGGGGAGAAGTCCTATGACCCAAACTTGGATGACGGTGAACAGACTCCGTTGTTATACGATTGGTCTTGTACATTCTCCTCCAAGAGCTCGGCTGCAGGGTGCTCTCTGAATTTCAGTGCCAAGGAAGGAATTGTCACAATTTCCAAAGCTCTGTTAGAAGCAGATGTGGAGTATACGTTCGACCTCACCGTCAGGAAGGAGGGTATGAGTCCTGAGGCAACAAATCAAACCGTATTCATCAAGAGGGGAGGAGTCCCTATCGTTTCCCTGGAGTGCGTTTCCTGCAAGGCTCAGTCTGTCTATGAAGTTAGCAAGAGCTCCTACGTCTACCTGGAGGGGACCTGCCAGAACTGTCACAATGACTCCAAGCTTGGGAGATGGGCAGCACACAGCTTTAAAAACAAGTCTCTCATCCTGGACAAAAAAACTACCTCCACTGGCGACACAGGCATGAACCTGGTCTTGAGGCAAGGGGCACTGAAGGATGGGGAGGGATATACTTTTACCCTTCACATCACAGACCTCACAACCGGGGAGGAAGGATTCGCCTCAATCGATCTGCTCCCCAACCAGCCACCTGTTGGAGGGTCCTGCCAGCTGTCTCCGGAAGGACCCCTCAGGGCACTGATGGCAAAGGTGCACTTTGAGTGTGCAGGCTGGCGAGACACAGAGGACGCGGAGGGCCCGCTGGTGTACATCCTGCTGGCGTCTCGCCACAGGGCTGGGCACTACCACGAGTTCTGCGTGTACAAGGGCAGCCGTGCAGAGCACAGCGCCTTCCTGCCCCCGGGCTTCCATGAGAGCGGCTTTATGGTGTCTGTGGCGGTCCTTGTTCAGGACCAGCTGGGAGCCACCGTGGTAGCCGTTAACAGCTCCATGGAAATCGGCTTACCTGAGGGGTTCCCCAGCCTCTCCCACTGGCTGTACAATCAAACTGACACGGTGCTCCAGGGCTTAGTGAAACAAGGGGATCCTCAGCAGGTCATTGAGTACTCTCTGGCCCTCATCACCATCTTAAATGAGTACGAGAGGTC
CATGCTTCTGGAATCTGAGGCTGGAAATGAATTTGAACTCCGGACCTGGACTCGCAATAACATCACAGAAACCCTGAACTCGTTGAATGTGAACACAGTTGATGACATCCAGCAGATCTCAGCTGCCTTGGCGCAGTGCACGGTGGTGAGCAAGGAACTGGTTTGCAAGTCATGCCTGACAAGGACCTTGAACAAGCTGGAGACCATGATGACCATTCTACAGGGAGAAACGACCCAGGGCACTGTGACACCAACTGGCATCGCTGACAACATCCTCAATATCACAGGTGACCTAATTCACCTTGTCAATACAGTTTCACAAGAGTCCAAGCCCCAGGAGCTGCTTGCTGATTCCCACAATTTGCTGCTAGCTCCCAAAGCCTACAACCTGTCTTCCAGCCTGATGCGCATCCTCATGAAGTCTCGGGTGCTGAATGAAGAGCCTCTTGAGCTGGTGGGAGGAGAAATTAAGGCCACAGGCAAGCGGTCTGATCCCTTTAACTTGCTTTGCTACGAAAACACACCAAACTGCCAGTTCTCCATCCCCCAGGCATTCAACACCACCCTTTCCAACCTGACGGATGTCATTCAAGTCATGTTCCAAGTGGACTCCAATCCTTTCCCTTTTGGTTACATCAGCAACTACACTGTGTCCACAAAGGTCGCCTCCATGGAGTTTCAGACACACAACGGGGTGCAGATCCCCATTGGGAGCCTGGACTCAGAGAAAGCCATCACTGTTATGGTGTCAAACAACACAGATGCTGACAATCTCTCTGCTGGCACTGAAGTCATCGAGGCAAGAACATCTGTGAACTTAATTGTGATTATGGAAAGCAACAACAGAGAAGCAGGGCTGCACTTCCAGCTCACTTACAGAGTCCTGAACGATCGCTACATCGCAAGCGAGCCTGAGCCATTCATTATGGCTTATCTCCATCACGAACCAGAGCCCAACGAGCACAACTGTAGTGCCTCTAAGAAAATCGGCCTGGATGCCCTGGCTGGAAGGGACCACAAGCTCTATACCTTCTTCACTTCACCCAGAACGGATGACACCATCCAGAAATACTACTTCAACATCACGAACCATTTCAGCTGGTCCCCAGTGGAGGTGACTCTGGGGCTGTACACCTCCCTCTGCCAGTACTTCAGTGAGCAGGAGAAACGGTGGAAGACAGAAGGGATCATCCCACTGGAAGAGACCAGGCCAGACCAGGCTGTGTGCTTAACCCAGCACCTCACTGCCTTTGGAGCCAGTCTATTTGTCCCCCCAAACTCTGTCCAGTTCATCTTTCCTGCTCCAGGTCCAGGTCTCAACTACATCGTTCTGCTGACATGTGCCGTCTGCTTTGTGACCTACTCGGTGGCTGCACTGATAGTGCACAAGTTGGACATGATTGACATTAACCGAGTAGGGGTGATACCCTTCTGTGGGAAGAACGGGCTGTACAAATACGAGATCCTGGTGAAAACTGGCTGGGGCAGAGGATCAGGTACCACGGCCCATGTGGGGATCGCCCTGTACGGTGTAGACAGTAAAAGTGGTCACAGACACCTGGATGGAGAAAACGCCTTCCACCGCAACAGCCTCGATGTGTTTCAGATCGCAACAGAACGAAGTCTGGGGAGCATCTGGCGCATCCGCATTTGGCACGACAATAAAGGACTCAGCCCCTCTTGGTACCTGCAGCACGTCATAGTCCGGGACCTGCAGAGCAGCAAGAGCTACTTCTTCCTGGTGAATGACTGGCTGTCGGTGGAGAGTGAAGAGAACGATGGCATGGTGGAGAAGGAGGTTTATGCTGCCAGTGAGACAGAGCTGAGGAGCTTCTCCCGGATCTTCATAGCAGAGCTGCAGCGAGGTTTCTTTGAGAAGCATGTCTGGCTCTCCATGTGGGACCGCCCGCCCCGCAGCCGCTTCACCCGTGTCCAGAGAGCCACCTGCTGCTCCCTCCTCATCTTCCTCTTCCTCTGTGCCAATGCTGTGTGGTACGGCG
TGGTGGGGAACGTACACCTCAGCAATGGGGCAGTTTCTAACCTGATCCCTGTTAACGTGGACACAGTGGCTGTTGGTCTGGTGTCCAGCGTGGTGGTCTACCCTCTCTACCTGGTCATTTTATTTCTCTTCCGGATGGCTCGTGGCAAGGTCTCCATCAACCACACCCTGACTCACTCAGACCAGCAGTCCTTGGAGATCGACAACTACCTGGACTCCTCAATCCTTGACAGCTCCTTCCCCACCTTCCCTGGGCTCCAGGCAGAGGCCTTCTCTGAGCAAACCAAAACAGATCTCTTCTTGGAGGACTCCAAAAGCCTCGTGCGGTGGCCCTCTAGCGAGGCCCTGCTCAGCTGGCCAGACCTCCTCAGCGACCCCTCCATCATGGGCAACACCATCCAGAAGCTGAAGAGGGGCCGGGCCAGCCGCCACCTTGGACTCGAGGCCCCATTGGCAACTGAGGAGGACAGCTTGTCGCTTGGTGTTCACCAGGGACAACCTCGATATTTCTCTGCCTCAGATGAGGATCTGATCCGGCAGATCCTGGCAGATGGAGCTAGTGGCATCTCCCACTCCCAGGACCTAGGGCCGTACATGAGGGCTGAAACAGATCTGATCTCAGGCCTGTCCAGCATGTTCGGGGAGAAGGTGGAGACTGTCATGATGCAGAAGCTGAACGACAAAGGCCAGGGCATGGCAGCTCCTCCCAGGGAAGTGAACAGATCCGCCAAGTCGACGTGGACAGTTGCAGATCAAACATTCAGAAAGCGCCTGCTGCCACCCTGGTGCTCCTACCTGGCTCATGGTATCAGTCTCCTCCTCTTTGCCACCTCCACGGGGGTCTCTGTGTGGATCGGGGTGGGCTTTTCCTCCAGCGTAGCCCTCATGTGGCTCATCTCAGGGATATTCAGCTTTCTGGCATCCTTCTTGGTCTGGGAGCCCCTGAAGGTTCTGCTGGAAGCCCTCTATTTCTCACTGGTTGCCAAGCGCTTGCACCCAGAGGAAGATGATACCTTGGTGGAGCATCCGTTTGTTGAGCATGTTTCCGAGAAGATCAGCAAAGTCCGACCACCACAGGGGTTTGCCCTTTTCCAGGCCAAGGAGGAGGCCAGGAAGGTCAAACTGCTACACAGGATGCTGAAGAATTTCCTCATCTACATGATGTTCTTGCTGGTGATCCTGCTCACCAACTACGGAGACGCCTCCCGCAACAGCAGGGCCTACCTTCTGCAGAGCTCCATCAAGCAGCAGTTGGGCAGCAACGAATTCCTCCTCATCAAGAGGTCAGATCAGTTCTGGGTCTGGATGTCGCAGGTCTTCCTCCCTTACCTCTACAACAACCAGTCAGGCCAGGAGAGCTACAGCACCACACTGGGAGCAGCCCGGCTGCGCCAGCTCCGGCTGCAGGAAGCTGAGTGCCAGCACAGTGCCCGGGACATCCTCCATAGCATGGGCCCAGCTGCCAGGAGCAACTGCACCAACTCGCACAGCTTTTCTACTGCTGACTATGCAGCTGGCTGGGAAAGGGCGGCCGTGAATGTGTCAGCTGCGTGGTCCTACTCACCACCTGACCTGACGGGGGTCTGGTACTGGGGTTACATCTCTTTCTACGATAGCAGCGGTTACGTCCAGGAGCTGGGGGCTTCGCTAGAGGAAAGCAGGGCTCAGCTGAATTTCCTTCAGCAGCACACTTGGATCGACAACATGAGTCGGGCAGTCTTTGTGGAGCTGATGCAGTATAACCCTAGCGTGGACCTGCATGCTGCCATCACCCTCCAGCTGGAGTTCCTGGGGGCCGGCCAGGCCATCGCCACGGTCACCATCAGCCCCTTCCCACTGCTGCGGCTCAGCAGGGGTGTCACGCTGCAGCTTCTCATGATGGTCTTCCTCATGATGTTTGTGGTCTACTTTGTGGTGTCTGAGTCGCTGTCCATCAAGAAGGAAGGCAGAGCCTACTTCACCCTGTGGGGCAACTATGGCCAGTGGGTCTTCATCCTCCTC
ACCACGTGCACCGTGGTGGTGCACCTCAGCCAAGCCACCCTTGCCGACCAGCAGTGGCTCAAGTACCTCAACAACCGCAAGGGTTTCACCAACTTCTACCAGGTGGCCTTTCTCAACACCATCTTCAGCACTTTGGCTGCATCCCTCCTCTTCCTTCTGACTGTGCAGGCTGCCCAGCAGCTGCGTTTTGTCAGGCAGTGGTCTGTGTTTGGGAAAACCCTGCGGAAGTCGGCGAAGGAGCTGGCTGCTGCAGGGCTGGCCTTCGCCGTCCTCATCCTGGCCTACGCTCAGCTCGGCTTCCTGCTCTTCTCCTCCTCCTCGGAGTCCTTCCGCAGCGTTGGCAGCAGCCTCCTGCTGCTGTTTGCCATGCTGCGGGGCAGCGGGACCCTCCGCCCCTGCCTGCCCGAGTCCTCGGGCCTCTACTGCCTGTTCTGCACCAGCTACATCGTCCTGGAGGCGTGGATTGTGCTGAGGCTGTTCACCGTGGTGCTTATCTACAGCTACCGGGAAATGCACTTTGAGCTGTACCGCCCCGCCTTCGAGCCCCAGGACTACGAGATGGTGGAGCTCTTCATGCGCAGGCTGAAAATGTGGATGGGCTTCAGCAAAGCCAAGGAGTTTCGGCACAAGGTGAGGTTCGAAGGGATGGAGCCGCTGCCTTCCCGAGACTCCAGTGACTCCAAATCCTTTCGGGGCCCCACTCCCAGCGCTGCATCTGACAGCTCCTGGGCTTCCACCTCCTCCAGCCAGCTGGACGGGCTGAGCCTCGTGCTGAGCACCCGGGACAGCCTGGAAGTGGACGCTGACATCCAGCGCCTCCTTTCCCTCTTTGAGATGCTGCTTGCCCAATTTGACCGGGTCAACCAGGTGACAGAGGACGTGTACCGCATCGAGCACCAGCTGGAGGGCTCTCAGAGCCGCCGCTCCAGGAGGAGGGGTACCCAGGTGTCCGAGGATGTCCCGAGCAGGTACTGTGCGGGCAGCACAGAGCAGGGGCCCTCGCCTGAGACCCCCTCCAACACGGACCTGCAGCCCCTGCGGGACGCCCCATTGTCCCCCCACTCTGCTGCCGCCCCACCAGGCACCAGGGGCTCTGTGCCCAGCCGGCTCCTTCGAGCTAGCAGAGGCATCGGCATGGCGGCTTCTGTGCTGCCCCCGCACAAACCCTACGCCGCCGTGGCTCCGGCGGTGAAGAAGAAACGGCCTCTCCGGGCCAAGAACAGGGTGCACCCCACTGTCAAGTAACAGGTGGCCTGCTGGGTATCGCGGGGAGCAGTGCCTCGGAGAGCCGGCAGCGCCTGGAAGTGGTTTGCATAGGGCGGGCTGTGCCTGCCCTGCAGACCTGGAGCCTCAGGAGCTGCCGCTTCTGATGGCTCCCGCCGCGGCGGCTGTGCCTGCCGGGGCGCACGGGGCTGCTGCCTGCACCGGGGTGGCACCGCTGCCATCCTCCACGGGCCTGACGTCCCCATCGGGTGTGCTGACCTCTCCGCTGGTGGTGCCCAGCACTGTGGGGGAGGCTGTGCAGGGCACGGTCAGTGTGCAGGAAATGCGTTAGCGTAGGGCAGTATTAAAAAGTTGTCTCTGAAATGGCTCCATCTGCAGACAGCCTGCACATGGTGACTGTCACAAGGACACTTTACTGGGGACTGGCACAGGGTGACCGGTACAAAGCTCACCTCCCTTCCCCACTGGCTGTGCCGGAGGGAAAGGGGGAGAGGAGAGCCCCAGGCCTTGAAGGTTTGAATTGAGTCTTGGATTTTTGTCGACCAGGCACACTGTGGAGGAAAGCTACAGCTTTCGAGAAGATATTTAACCCTTTTTTTTTTTTTTTAAAGCATAAATATATATAGATATAGATAAATGATATCTACACCCAGATCAGTTAATTTCCAGTATTGGCTACTTTTATCCTCCAGAAATTGGTACTATTATTTGTATTTAAAGAAATCCAATATTTAAGACCAATGACATTGGAAGCTGCAGCGAGCTGCCAGCCCTGC
TGCCCGGCCAGGTCGGAGGGGATAACAAGCA\n>XM_024348560.1 PREDICTED: Pan troglodytes SGT1 homolog, MIS12 kinetochore complex assembly cochaperone (SUGT1), transcript variant X4, mRNA \nAAAAAGTAATGTATTTCTGTATTTTGTACCTTCTGAATAGGGAAAAACTGAATACCTTGAGTAAAATTACATAGAAAATGTTAATGAGACAAGGAGGTGAATTTTGTGACACAGCTGTATTCATTGAAGAGCTTTAAGAAGGAAGCTAAATGTTAAGCCAAAAGGAAGTTGCTGTTGCTGATGCAAAGAAGTCTCTAGAACTCAATCCAAATAATTCCACTGCTATGCTGAGAAAAGGAATATGTGAATACCATGAAAAAAACTATGCTGCTGCCCTAGAAACTTTTACAGAAGGACAAAAATTAGATAGTGCAGATGCTAATTTCAGTGTCTGGATTAAAAGGTGTCAAGAAGCTCAGAATGGCTCAGAATCTGAGGTGTGGACTCATCAGTCAAAAATCAAGTATGACTGGTATCAAACAGAATCTCAAGTAGTCATTACACTTATGATCAAGAATGTTCAGAAGAATGATGTAAATGTGGAATTTTCAGAAAAAGAGTTGTCTGCTTTGGTTAAACTTCCTTCTGGAGAGGATTACAATTTGAAACTGGAACTTCTTCATCCTATAATACCAGAACAGAGCACGTTTAAAGTACTTTCAACAAAGATTGAAATTAAACTGAAAAAGCCAGAGGCTGTGAGATGGGAAAAGCTAGAGGGGCAAGGAGATGTGCCTACGCCAAAACAATTCGTAGCAGATGTAAAGAACCTATATCCATCATCATCTCCTTATACAAGAAATTGGGATAAATTGGTTGGTGAGATCAAAGAAGAAGAAAAGAATGAGAAGTTGGAGGGAGATGCAGCTTTAAACAGATTATTTCAGCAGATCTATTCAGATGGTTCTGATGAAGTGAAACGTGCCATGAACAAATCCTTTATGGAGTCGGGTGGTACAGTTTTGAGTACCAACTGGTCTGATGTAGGTAAAAGGAAAGTTGAAATCAATCCTCCTGATGATATGGAATGGAAAAAGTACTAAATAAATTAATTTGCTCTCATTGTATTGTGTATATTCACCTAATGCCCATTGTGTATTGATATTGCATTCTTGAATTTTGAACACTGAATATCTTTTTGAAAGATTATACTTCTTTACCTCTTTGTGCTTTAGAAATTATTTTCCTTCAAGTGTTCAAGTCTAATGAAGAATGAAGATAACATTTTATCACTTCTGTCCTTAAAGATTTCAGACATGGTGAAACTGAATAAAGCGTGTCATTTGCTCCTAGATAGATTCATTCTATCTAGTTGTGGGGATGGAGAAATCTTTAATGGTATATTTTTGGTTATTGCCTTATTTTTGATGCAGTATTCTGTCAGTAATTTATTAGACCTGGCAGCTTTGGGTGAGCTTAGATTTTTCACCTTCAGTGTTACATTGTGTTTGCTTTTAAAAACTGCTTTTGAATGGAGTTGTAAATACAATTTTTCTATGAA\n>XM_028429604.1 PREDICTED: Parambassis ranga ventral anterior homeobox 2 (vax2), mRNA 
\nATGTTTGATCAGGCCACGACTATGGGCGATGGGAGCCACCGCTGTGGACCCAACCCGCTGTGCCCGGACAGGATGGAGACAAAGTGTCGCGCCGAGATAGGGAGCCGGTCCCCGGTGCAGAGCTCCACCGACACCCCGGGGACATCAGCGTCCACGCCGACGTCCTCCAGCGAAGACGGGCATGACAAACTTTTGGGAGTGGACCCAGACTACTGTCGGAGGATATTAGTAAGAGACGCCAAAGGCACCATCCGAGAGATTGTCCTGCCGAAGGGCCTCGACCTGGACCGGCCCAAGCGCACCCGGACCTCCTTCACGGCGGAGCAGCTGTACCGGCTGGAGCTGGAGTTCCAGCGGTGCCAGTATGTGGTGGGGCGGGAGCGGACGGAGCTGGCCCGGCAGCTGAACCTGTCCGAAACACAGGTCAAGGTGTGGTTCCAAAACCGCCGGACCAAGCAGAAGAAAGACACCACCAAGGACTCAGACAAGCGCTCCTCTTCCACGTCCGAGTCTTTGGCCACCTGCAACATCCTGCGCCTCCTGGAGCAGGGCCGCCTCCTCTCGGGCTCCGCTCCACCTCCCAACCCCCTTCTAGGGCCCCCAGCTCACCCAGCAAATGGTTCGCTTTTGAGTAGCCCGGGCGGGGGCTCCTCCACCTCCCCTGGGATGAGCAGCAGCACTCCTCCCAGCTCTCTACCTGGAGGGACATTCGGGCTGTCGCTGCCCTCACTGGGCGGCACCCCGCCTTCGCCGCGGCTGGGCGTCCCGCCGCCGCACTCCCTCTGCTTCTCCATGCCACTGCTAGGTGGCGCTCATCACGAACTGACATCCGCCTACGGCTGCGGGTCCTCAGCTTTTGAGCCGTACATGCGGCTGGACAGGAAGGACGCAGATCTGGGAGGGAAGAAGACAGTTTCTTAA\n>XM_039793275.1 PREDICTED: Perca fluviatilis Rho GTPase activating protein 1 (arhgap1), transcript variant X5, mRNA 
\nGGTGTCGACGCAGATTGTTGCTGTTGCTGTCAACCGCACGTCTTGCTAATCAAGTCTACGGCGACTTCAGACGCCACAAAGCCCACTGGGTGACTACAAAGCAACTTTGCAATTACGGACTCTGGCTGCTACTCTGTGAAAGTCCCAGCTTTAAGAGTGTGTGGTAAACATCACTGTGCAGTGTGTCAGTGGGTGTGTGTAGCACCGTTTTGCAGAGTGAGTGATGTCTTCAGAGCTGCTGGTAGATTTGGGTGAAGACCCTGCGACTGCACAGTTAGGACAGCTGAAGCTGACCACGGTAGATGACCAGCAGTGGCCCGCTGATGAGTCTACTCTCAGCAAGTCAGAGACAGATATCTCCCAGTGCTTTGACGCTGGCTCTCCACACCTGCCCTGGGACCATCCGTTCTATGACATCGCCAGGCATCAGATCATTGAAGTGGCGGGTGATGATAACTTTGGAAGGAAGGTGATAGTGTTTAATGCATGCAGGATGCCTCCACAGCACCAACTGGACCATCACAAGCTGCTGATGTATCTTAAAGGAACACTGGATCAGTATGTTGAAAGTGACTACACTCTGATCTATTTCCATCATGGGCTGACCAGTGAAAACAAACCCTCTCTCAGCTGGCTACGAGATGCATACAGAGAGTTTGACAGAAAGTATAAGAAGAACATCAAGGCTCTGTATATCGTCCATCCAACCATGTTCATCAAGACTCTGCTGATCCTCTTCAAACCAATCATCAGTTTTAAGTTTGGCAGGAAGATTAACTATGTGAGTTATCTGAGTGAGCTGGAAGATGTGGTGAAGTGTGAGCAGTTGCTAATTCCTGCCCGTGTCAAAGAGTATGACAACAAGTTAAGAGCTTCCGTTAAACCAACCGTCCAGCCTCCCATGTCTCCTCCTCACAGCCCCCCCCTCCACAGCCAGGTGTTTGGGGTGCCACTTGCATTGCTCAGGCAGAGGAATCCAGATGGTGATCCTGTTCCCGTGGTGATGAGAGATACCATTAGCTTCCTTTGCGAGCAAGGTTTGGAGATTGAAGGGATCTTCAGACGGTCTGCCAATGTGACTCTGGTGAAGGAGGTCCAGCTCAGATACAACTCAGGTGCAACGGTGAATTTCAGGGAGATGGAAGACGTCCACTTGGCTGCTGTGATTCTGAAGACATTCCTGAGGGAACTTCCAGAGCCTCTGCTGACCTACCAGCTCTACAACGACATTGTCAACTTCACTTTATCCAGTGAAAGGCAGGTGGCACTTATGAAGACACTGATAGAGTCGCTGCCAGAAGAAAACTATGCACCACTGCGACACCTCATCACATTCCTGGCAAAGGTATCAGCCAACAATGAAGTGAATAAGATGACCAACAGTAACCTGGCTGTGGTGTTTGGTCCTAACCTGCTCTGGGGACGGGACAACGCCATGTCACTCAGCGCCATTGGGCCAATCAACAACTTCACTAGAATCCTGCTGGACCACCAGCATCTGGTCTTTACCTAAACCCTGCCCCTTTACCCTGCAGTCTCTCTTCCAGTCGGAAACACCCTTTTCCATTAAAACACCATACACTTTAAAAGGATCCCGTGGACCAATTGCATTTAATTTTGTCTCCCACCAGTCTTTACATTCTGATTGGCACATATTGTTGATGACAACAGCAGTGTGGACTGCTACTAGCTTCTGGCCAGCATTTCCATTTGCATGTGACTCTAGTAAAATGGCACATACATTAGACTGCAGACAAATAACCCTCAATAAACAATGTAGGCAGAGAGATTTAACTTTAAAGTGCCAGTTATTCTTGAAAGTCGTGTATTTTTGCAGCTTTGCTTTTTGTCATTTTGATAAGTCAACAGAGCTGCCTCAGTATCCAGTTTTGCAACCAGTGAGTTGGAGGAAATCACAGAATTTGGGGACAGTTTTGTGAAATCAAAATCAGGGAGTGGATCTTCACAATTACTACTACATAACAAAAAACTAGATGA
TATGAGGTGAAGATCTGTGCCTGTGCAGGTTATTCCAACTTGCAGAAATAGTTAACTCCAGTGATTGTCCTTAAAAAAGTCTGCCGACTCACAGAAGTGAGAATGTAAAAAAAATATACAGAATCGAAGAAGGTGGAGATAACCTGAAATTCAGTCTAGCTCCAAAAACACTGGAACCTTCATTTCCCATAATGCAGCTTATTAGAGTATTTCATCAGACCCTAGCTGCCTGGTTAACTAAGTCTTGTAACGTAAGGCTTTCTGTTATAGATTTGTAGTCCAAACATTACTTTCTCACATTTGACACAGCTCCCCCAGACACAACTGTCAGACTGAATAATGAAGTGAAAGGAAATGGTAGATCAATGTCCTATAATAATAATGCTATAATAAACATAATCAGGGAGTGTATATTTAAGGACATAATTGCACTCAAGTACAATTGATTATGTTGGTTCCAGTGTGAATGCCACTGGCTGAAGTGCAGGCAACCTACAGTTATTTCACATAGTACATTTCATCACCCTATTACACCCAACAACCCTTCAAAAAATCCTGTCCTAATTGCATATATATATATATATATATACACACATACATGTGCTGTGCTGTTGTCAGACTGTCTCTCTGCTGTTTTTTTATGTAGTGACAAAAAAAATAATAAAACTGGCCTCCAGCATTCACATGAATTATCACCCTGCTCTGCATGGTAATACATGATCAGTAATAAGTACAGATAATGAAGCAGTGCAGTTACTGTACAAAACGTATAGGATTCTGATCCCAAACTTAAAGAGGAGCGATAGTGGCCCTGTTCAGACCTGGCATTATAAGTGAACAGCTCTGAGGTTGTTAACTTAGATCATGCGGCAAAAACTGCAGTTCATTTTGAATGGTGATAGTGTGATCACCCGATACGCAACTTAATGCCAGTTCAGAACAGGGCATAAGAGAATGAAGGTCGGATTTTCCATGTCCTTGAAAGTCTCAGGATCATTTACAGTAGTAGTAAACTTGGTACCAAATGTTGTTGACAATCTTTTAAATGCTGTAATTATAGTAACCAGTAGAAAAGGAGCTGTGTGATTCTACCAGCAGATGAGTAAGTGTTTAGAACCCAAAAACAGCTGTGCATGTAGATGAAATAAGTGCTGGTCTAATATACTCTGTAATATCA\n>XM_035125527.1 PREDICTED: Zootoca vivipara cadherin 20 (CDH20), mRNA 
\nTCTACCTGTAACCTCAGCTGCAGCAGTAAGTGACAGGAGCTCAGAGGAAAGGCCAACATAGTGACATCAGTAAAAGAAAAAGGAAGGAAACTACTGTCCTTAATCTGGCTGGCTTCATATCACTGAAAGACTGCCCTTGGGAGTTTCAGAGGCCTTTCTGTTGGGTGTTTTAAAGGACCCGGCTACAACTTTTGGAAACAATCCTGGTATGGCAACGCGAACTTCGTGTGAAATGGATAGAGCCAGGAAGTGGCTCGGACTCAGTATATCTTTAAGTTGTTGCTTAATGATGAACCTCGTTACGGCTGTGTTATCTGGGAGCAGCAGACCACCCAGCAAAGGCCAAGAAGGCAGCCTCTCGGACAACTTGCTTCTGCATCTGCGAATGAAGAGGAGCTGGGTGTGGAACCAATTCTTCGTTTTGGAAGAATACACTGGAACGGATCCTTTGTATGTGGGAAAGTTGCATTCTGATATGGACAGAGGAGATGGATCCATCAGATATATACTGTCGGGAGAAGGAGCAGGCATTGTTTTTACCATTGATGATGCAACTGGAGATATCCATGCCATTCAGAGGCTGGACCGAGAAGAGAGATCCCAGTATACTCTAAGGGCTCAAGCTTTGGATAGACTGACTGGCAGGCCGATGGAGCCGGAATCTGAATTTATAATCAAAATCCAAGATATCAATGACAATGAGCCCAAGTTCCTGGATGGGCCATATGTTGCTTCGGTACCAGAAATGTCACCAATAGGTACCTCCGTTATCCAAGTGACAGCAACAGATGCTGATGATCCTACCTATGGGAACAGTGCCAGGGTAGTCTACAGCATTCTCCAAGGACAGCCATATTTCTCTGTGGACTCCAGAACAGGCTTGATTAGGACAGCGCTAATGAACATGGATAGAGAAGCAAAAGAATATTATGAAGTGATTATCCAGGCCAAAGATATGGGCGGACAGTTGGGAGGATTAGCTGGGACGACCACAGTCAATATCTCCCTGTCTGATGTCAATGACAACCCACCCAGATTTCCACAGAAACATTATCAGATGAGCGTTCTGGAGTCTGCTCCAGTTAGCTCTACTGTGGGCCGTGTCCTTGCTAAAGATTTGGATGAAGGCATTAATGCTGAAATGAAATACAGTTTTGTGGATGGGGATGGACTGGATGTTTTTGATATTGCCACCGAGTCTAATCGCCAAGTTGGTGTCATTACAGTGAGAAAGCCCTTGAACTTTGAGAGTAAGAAGAGCTACACTTTGAAGGTAGAGGGTGCCAATCCCCACTTAGAAATGCGCTTCCTGAACCTGGGCCCCTTCCGTGACACTGCTACTGTACACATCACCGTTGAGGATGTAGAAGAGCCCCCACTCTTTGAGCCTAGCTTTTATTTTGTGGAAGTCCCTGAAGATGTGGACATTGGGACCACCATACAAATGATTCATGCCAAGGACCCGGATGTGACCAACAACTCCATCAGGTATTCCATTGATCGAAGCAGTGATCCCGGACGCTTCTTTTATGTCGACATTGCAACAGGTGCTCTGATGACTGCAAGACCTCTGGATCGGGAGGACATTCCATGGCACAATATCACCATCCTGGCCGTGGAGCTGAACAACCCCTCGCAGGTTGGCAGTGTTTCTGTCACGATAAGAGTGCTGGATGTGAATGACAACGCTCCAGAATTCTCCAGATTCTACGAGGCTTTTGTATGTGAAAATGCCAAAGCTGGACAGCTGATTCAGACAGTGAGCGCGATTGACCAGGACGACCCACAAGAGGGACAGCACTTCTACTATAGCTTGGCTCCTGAGGCAGCTAACAACCCCAACTTTACTCTAAGGGACAATCAAGACAACACAGCTTGGATTTTAACCAGGAGATCAGGCTTCCGGCAGCATGAGCAGAATATATTTTACCTTCCTATCCTGATAGTTGATAATGGACGTCCCATGCTGAGTAGCACCGGGACAGTAACCATTCACGT
TTGCAGCTGCGACGACAAGGGTCTTGTGATGTCCTGCAATGCAGAGGCCTATGTGCTCCCTGTCAGCCTGAGTAGAGGAGCTCTTATTGCCATTCTAGCCTGCATCTTTGTCTTGCTAGTGCTGGTACTGCTGATCTTGTCCATGAGAAGGCACAGGAAGCAGCCGTATATCATTGACGAAGACGAGAACATCCATGAGAACATCGTGCGGTACGACGACGAGGGAGGTGGGGAGGAAGACACAGAGGCCTTTGACATCGCAGCCCTGTGGAACCCGAGGGAGGCTCAAGTGGTGCTGAAGAGCAGGCAGGACATGATGCCGGAAATCGAAAGCCTCTCCAGATACGTTCCTCAAGCCTGCACGATGGACAGCAGTGTTCATAGTTATGTGTTGGCCAAGCTCTACGAAGCCGACATGGACCTCTGGGCACCTCCCTTTGACTCTCTCCAGACGTACATGTTTGAGGGCAACGGCTCCGTGGCAGAGTCGCTCAGTTCCTTGCAGTCTGCGTCTACGGACTCAGAGCAGAGCTACGACTATCTGACGGACTGGGGGCCTCGCTTCAAAAAGCTGGCCGAAATGTACGGTGCCACAGAAGGGAACGGGGCCCTTTGGTAACAAAGAGGCGAAGGCAGAGTACTACTCGGGTACTCGGCACAGCCATCCGAATTTGTACTCAATCAGATATTGAGGACACAGGCGAGGTGGCCTCCTACAAATAGCAATATGGTGCTTGAGGGAGAATGCAGAAGAGGAGTGGAAATAAATAAGAGCTCTCTCTGGATCAGCTTTACTCAGTTACATTAAGCTACATTTGTAAACG\n>XR_003975245.1 PREDICTED: Gadus morhua 5S ribosomal RNA (LOC115538338), rRNA \nGCTTACGGCCATACCACCTTAGGCACGCCCGATCTCGTCTGATCTCGGAAGCTAAGCAGGGTTGGGGCTGGTTAGTACTTGGATGGGTGACCGCCTGGGAATACCAGGTGCTGTAAGCA\n>XR_008382064.1 PREDICTED: Nycticebus coucang U6 spliceosomal RNA (LOC128592852), ncRNA \nGTGCTTGCTTCGGCAGCACATATACTAAAATTGGAATGATACAGAGAAGATTAGCATGGACCCTGTGCAAGGATGACACGCAAATTTGTGAAGCGTTCAGTATTTTT\n>XM_035287433.1 PREDICTED: Callithrix jacchus URI1 prefoldin like chaperone (URI1), transcript variant X4, mRNA 
\nTCTTTATCAATGTGTCTGTCTCTTTACTGATGCCACTCTGTTTTGATTATGTAGCATTATAGTGTTCCTTAAACTTGGTGGTACAAATGCTCTAATTTGTTCTTTCCAAATTGTTTTGGCTGTTCTACCCCCTTTGCCTTTCCATTTTAGAAACCACTTGTTTATGTTTACAAAAACTCCTGGTGGGATTTTGATTGGAATTACGCTAAATCAATACATCAATTTGGGGAGAATTGACGTCTTAACTAATGTAAGAAAAACAATAGAGGATTTAAGAAAAGTGGTGAAAAATTTTGAATCAAGAGTTGAATTCACAGAAGATTTGCAGAAAATGAGTGATGCTGCAGGTGATATTGTTGATATAAGAGAAGAAATTAAATGTGACTTTGAATTTAAAGCAAAACACCGAGTTGCTCATAAACCACATTCCAAACCAAAAACTTCAGATATTTTTGAAGCAGGTATTGCAAATGATATGAAATCTAAGGATTTGCTTGCTGATAAAGAACTGTGGGCTCGTCTTGAAGAACTAGAGAGACAAGAAGAATTGCTGGGTGAACTTGATAGTAAACCTGATACTGTGACTGTAAATGGAGAAGATACGACATCTTCTGAAGAAGAAAAGGAAGATCACAACACAAATGTGAATGTGATGCATCAAGTAACAGACTCTCATACTCCGGACAGTTGTCATAAGCATGTGGCAAGTTCAGAACCATTTAGTGATCAGTTGAATAGTCAGTTGAACTGTTCAGTGAATGGTTCCAGTTCTTACCACAGTGATGATGATAATGATGACAATGATGACGATGATGATGACGACGACGATGGTGATGATGAGCATGAGGCTTTAGGAGTTGGATATAATTCTATACCAACAATATATTTTTCTCATACTGTTGAACCTAAGAGGGTCCGAATAAATACTGGAAAGAATACCACTTTAAAATTCAGTGAAAAGAAAGAAGAAGCCAAACGTAAACGAAAGAACAGCACTGGCAGCGGCCACTCTGCCCAGGAGCTGCCCACCATCCGGACACCTGCTGACATTTACAGAGCCTTTGTTGATGTTGTGAATGGAGAATACATCCCTCGCAAATCCATCCTGAAGTCTCGAAGTAGAGAGAACAGTGTGTGTAGTGACACCAGTGAAAGCAGCGCTGCTGAATTTGACGATAGGCGGGGCGTTCTGAGGAGTATCAGCTGCGAAGAAGCCACTTGCAGTGACACCAGTGAGAGCATTTTGGAAGAGGAACCACAGGAAAATCATCAAAAGAAACTTTTGCCCTTATCGGGAACACCTGAGGCTTTTTCTGGAACTGTTATAGAAAAAGAATTTGTATCACCTTCCTTAACACCACACCCAGCCATTGCTCATCCTGCGCTACCCACTATTCCAGAACGAAAGGAAGTTCTGTCGGAAGCCTCAGAAGAAACTGGAAAGAGGGTTTCAAAGTTTAAAGCTTCCAGATTGCAGCAGAGAAACTAGGCCCTGTGTAGGAAATGGGAATTTACATCTTAAAACCTAGTTGTTCATTTGTTTAGAATATCGATAGCAAAATAGGTTACGTGTAGTTTGACATAAGGTATCCCGAGTTACTTTGGCAACAAGTTCTTTTACCCTTACCAGCGGTATTTGAAAAAAATCACAGTAACTGTCTGAATACTTTAATATTCGCCTTGTTTTGTTAGTTCTCTGAATACTGTCAACACTTGTCTGAGTTTGCCTTTATGATGCAGTGGCAGCATTTTGAATTACTTTTCGAAGAATACTGTTCATACGCATTGTTTTTGTGTTTCAGACGAAATACAGGCAGTTTTGTGCCAGCTGTGATATTGTGCATACCATATGGACCCTTTTAAAGAAAATTTTTAAATTTCAAAGAGATTCAACAATTATATTACTTGCTTTTACATTTTAAAGGCACTTTAAAAAAGATCTACTTCGCCTGTAGGTTTTGCAGCTAGTGGGCTATTTAAGAAACCTCTCCCCTCTAA
ATGTCATACTGTAATCTATCAGAAAACTACATGAGTTAATTGTACTCTATGGAAAATTTCTTTGGAAAGATATTTTGTAAAACTTTTTTTTTTTTCCAAGTAAAAATTTTATGAAACTTGGTCTCAAAAATGTTGTGAACTTTATGATTCAAAATTAAGTCTAGATATGTCCTCGATTCATGATATATGCTACATGTATCACACAACAGATCTGCAATTCTTTCACTTCCCTGGACGCTTCTCCCTTAGTTTCTGCAGTTTCATTGGGGTTATGTTTTGGGAGACGAGGAAACGTCTAGATGCTTAAAAACGATTTTAAATAAAAATTCCTTACAGTTGAAA\n>XM_003139612.1 Loa loa hypothetical protein partial mRNA \nATGCGGTCTTCGACTGTTCCGTTATCAATAGTATTGGTGTGGTGCATCTACTACAAACTGAGTTGTGCAAAACAGTCAGAACTTGCGAATAATATGCAAATTTCTAATGTATTGAGTGAAAACGACGCTCAAAGCACCGAATTTGTTCGCACAGCTTGGAGCGCTGCAACTTATTCGAAACTCAGAATTTACAGAGAGTTTTTAATTATCTTCCTTGATAAAAAATCCATGAGGGTTCTGAGAACGAGTTGCTTCTTGCTGGAATTTTTCAAATTACATGTATGGAAACGTGCTTTCGGTAAAATCGCACTAGACATTACTTTTGGTCGAAATGCACAAATATCTATTTGGTTTGAAATGAAAATTTCTAAGCTTTCCAGTCTGCAATTAATTCTTAGAAAATTGCAAGAAGAATAA\n>LC592336.1 Uncultured archaeon gene for 16S rRNA, partial sequence, clone: m5-3 \nGCGAGAAACCTCCGCAATACACGAAAGTGTGACGGGGTTACCCAAAGTGTTCATTAGAACTGTGGTAGGTGAGTAATGTTCCCCACTAGAAAGGAGAGGGCAAGGCTGGTGCCAGCCGCCGCGGTAAAACCAGCTCTTCAAGTGGTCGGGATAATTATTGGGCTTAAAGTGTCCGTAGCCGGTTTAGTAAGTTCCTGGTAAAATCGGGTAGCTTAACTATCTATATGCTAGGAATACTACTATACTAGAGGGCGGGAGAGGTCTGAGGTACTACAGGGGTAGGG\n>XR_004309533.1 PREDICTED: Coturnix japonica uncharacterized LOC116654348 (LOC116654348), ncRNA 
\nCTTGCTTTTTGCCTTTAGCCTTTCTATGAGTCAGGAGACAGCAGGCTGCTTGCAAGTATAGGCTGGGGCTGGTTTTTTCCCATTTATTTATTTATTTTCCTAGGAAGAATGAAGAGCAAATAATGAGGAGGAAGAATAGATGATGAACCCAAAGATGAGCACGAGTTCCTGGGCTGGTTCTGACCCATCTAAGGGGTCCTGACTCTTAGGATCCTTTGGGGTTGGAGCTCACACATCCTGCTGCTTGTTGATGGAGGAACGATGACCCCATGTGAGTACTGCAGTGCCATACAGCCCTATTTGGGTGCATGGAGAGGCCAATTCGGCTGCAGCAGCAGTGAGAAAGCTGCAAGGTGCTGAGCTCTCTCCTGCCCTGGAGCAGCCCAGGGGATGTGGGGGCAGTCAGTGGCTGTTTTGGGGCTGTGCTGGGTGTGTTTTGGGGCTGTGCTGGCTACAAGCCTCGCTTCTATCTGCAGGCCAGCAGGCAGCATGTGATGCTGTGATGCTCACCAGCTCCAGCCAAGGGGAAAAGCCCCTTCAGCACAGGAGCTGCTGGCAGGGTGCCTGGCTGCACCGTGCCTGGCACCAGCAGTTCGGTGCCCCTCAGTGCAAAGCCTCCATCTGCTCCCCATCCTTCCCCCCCACCATGGGATGGGACTGAAGGTGGCACAGCCCCTGAGCGCTGTGCCTGCCCAGTCCCAAAACGCAATGTCACCAGGGCTCTGGGACAACCCTGCCGTGTTTAAATCCTCTTCCTAGGGGCAGCCGGGGCTGCAGACCCCTCAGGACGGCTACAGAGGCAGCAGCGTATCGCACCTTCAGCCCTCGGGGCTGCGAGCAGTCGGGTTGGAGCTGGAGCTGGCGAGCTCTCAGCACCCTCTGCCGGCTCTGCTGCCCGGCCCCGGCCCCTCCTGCTTGGGATGGAGCCTCTGTGAGCTCTAAGCTGCTGCTCTGCTTTGCTCTGCTCCCATTCTACAGCCCTGAGCCCAATAGGGGCCGTCACCCTCTGCCCTCGCACTGAGTGCTTTGCGCCCTGGGTTGAGCTGATGACTGCAGTGCTTGTGCTGAGGGTACGGGAAGGGGCCCAGCAGCCTCTCGATGTGGCTTTTCTCTGCTGTGAATGATCCCAAATAGCATCTCTGTGCTGTAAGGCAGCCCTGGGCTGACAGCAGTCTGTGCTGATGTACACGTATGGGGTATTCATGGGGCGGAAAAAGGCTGCTGCTCAAACAAGCAAACATTGACTGTCTGGTTTCCCAGCGCTGCCCCCAGCAGCAGCTTTCACATACCCTGCAGACATTCCTGCTGCTGGGCTCCCATCACCGGGCAGGGAGGAACCCCCACACTGCCTGCAGCAGCCCCTCTGACCCAGGAAAGCAAAGGGAAACCAGTTGACGTCGGGATTCTTTTAATGCAACAGCTCTTAAAATGCAACCTTCAAATGATTTTTATAATGGTCAACAATGAGAAACATCTGAGCTTTTCTACCTATGCACCCCAAACCCTTTGGGTGGAGGACTCCCTTGGGCAAAAAGGGTGAGGACAGTGTTCACATGGAGGCCCCCAACAAATGGCAGCACAACCTGGACCTTCCTCTCTCACACTTTACACTCAGGCACAAACCTACAAAGGCATCCAGCCCATCAGCTCCCCTCTTGTAGCACTTCAGACAACAGCTTCAGGCTCCTGGTTCTCTCTGCAGGTTTGTGCCTTCATGCTACGTAAAGCGATTTGAGAATGAATATCTGACTGTTTTCTGCCTTGATAGGATGGTGGTGGAGGAAGCTGATTTCCCATCACCTTGCTTTGTATGATATAATGCTACTTTATGCCTTTGTTCTGCAGAGCAGCAGGTGTTACAGGCTGCCACAGCTCGCCAATTCAAGTAACGTGGGAAATTCTGCTCCAGCCTAAACATCTGTGTAAGAATATCCCCCCACCGCCCCCTCCGCATCGTGCAGTGTTTATATGCTGTAACAGGAGAGCAGGCAATACTTG
CTGAAACACATTTAATACCTTCCAGTTGTTAGTCTCAGTTTCTGGTTCTGTGCAGTCAGCACACAGCCCTCGGGCTGCGCGTGCTGCAGAATAGCAATGCTGTTAGAGCTGTGAGTGCCTTTCTCCCATCTAAAATGCTCAGTGGTTTTCTTGTACCATTTACTGGCTCTGCCCTTCCAAGAGGGGAATGGTGAGACTACACACAACGTCCTGTTGGAGGAAGGTGATGCTGTGTCTGCTTTCATCAATGCTGTGAAGAGAAACAGCAGAAAGAACCACGAGGGTCTCCTGAATCTCAGTGCTGTGTGATGCTTTCCTCCCCTTCGTGTCAAGCCTGTATTTTACTACTACCAACTACAGAAAGCTACTTTGGTCTACAGAAATGCTATGCACTTATCTCCAAGTGAATTCTAACCAACCCTTCTTAAGGACAGCAGTTAACAGTAAGTCAGTGGGTTCTTTTGCCTTAGTCTCCAATACGAGTTATAAAACCTGGATTCAGGTTTGGACAGACTGGAGCTCTTTTAGAGTCTGAGCAGCAGCTCTTGCACAACCAAAGGTCACAATTAGAAACTGAGTGTAGAAAGAGTTCCCAGGGGG\n>XM_006448447.2 PREDICTED: Citrus clementina protease Do-like 10, mitochondrial (LOC18050602), transcript variant X1, mRNA \nTCATCAAAAGATTCAAAACCTAACAAAAGCGTTTTCCTTCTGATATTTTTGCCTGCAGCTTTGGATTAAGGCAAAAACCCAAAGCCGAAGGCAAAAAGAAGAAATGCAAATGCTGCTGGGTCCGTCACTGCGTAGTCTACGAAGGCAGCTATGGTCCTCTTCATCCTCTATTTTCTCCAATTACAGTAGTATTAATAGCAGTGGCTTATTAGAAACCTTCTCCAATACATTAAGATTAATTATTTTGCCTTCTACCTCTTCACTCTCCACTATTAGTACTAAAAATTGTAATTTTCACTATTTTTCAACATCAGCAGCAGTAGCTGCTAATTTGAGTACCAAGGAAATTGTTTCTAAAGTTACGCGACGGCGACAACGACGTCGTTTAGCTAAAACCTGCGGAAAGACTACTAATGCTTACGCAGCAATAGAGCTTGCTTTGGATTCTGTTGTGAAAATATTCACAGTTTCAAGCAGCCCTAACTATGGACTTCCCTGGCAGAACAAGTCCCAACGAGAAACCACCGGTTCAGGATTCATTATCCCTGGAAAAAAGATTCTTACAAATGCTCATGTGGTGGCTGATAGTACATTTGTGCTTGTAAGAAAGCATGGTTCTCCAACCAAATACAGAGCCCAAGTTGAAGCTGTGGGTCATGAATGTGACTTGGCTATTCTGATTGTCGAGAGTGATGAATTTTGGGAGGGAATGCATTTCTTAGAGTTAGGAGACATTCCGTTTCTTCAACAAGCTGTCGCTGTTGTTGGATATCCTCAAGGTGGAGACAACATTTCCGTTACGAAAGGTGTTGTTTCGAGGGTTGAACCTACACAATACGTACACGGTGCTACTCAGCTCATGGCAATACAGATTGATGCTGCTATTAATCCTGGCAACAGTGGTGGTCCAGCCATCATGGGCAATAAGGTTGCAGGTGTAGCTTTTCAGAATCTTTCCGGTGCTGAAAATATAGGTTACATTATCCCTGTTCCTGTAATAAAGCATTTTATAACTGGTGTGGTGGAACATGGAAAATATGTTGGATTTTGCTCGCTGGGACTATCATGCCAGACCACTGAGAATGTTCAACTTCGTAACAACTTTGGAATGCGGTCTGAAGTGACTGGGGTACTTGTGAACAAAATTAATCCTCTGTCAGATGCTCACGAAATATTGAAAAAGGATGATATTATTCTTGCATTTGATGGTGTGCCTATAGCAAATGATGGAACAGTTGCTTTTCGTAACAGAGAACGTATAACATTTGATCAC
TTGGTGTCTATGAAGAAACCCAACGAGAAGTCTTTGGTTAGAGTTTTGAGGGATGGCAAGGAGCATGAATTCAGTATTACACTACGACCTCTGCAATCACTAGTTCCCGTACATCAATTCGATAAGCTTCCTAGCTATTACATATTTGCTGGCCTGGTGTTTACTCCACTTACACAGCCATATCTTCATGAATATGGAGAAGACTGGTATAATACTTCGCCACGTCGTTTGTGCGAACGTGCATTAAGGGAGCTGCCTAAAAAGGCTGGTGAACAACTCGTTATCCTTTCGCAGGTGCTGATGGATGATATAAATGCCGGGTACGAGCGTTTTGCAGACCTACAGGTTAAGAAGGTCAATGGGGTGGAAATTGAAAATTTGAAGCATTTATGTCAGCTAGTGGAAAACTGTAGCACTGAGAACTTGAGGTTTGATTTAGATGATGATAGGGTTGTTGTATTGAACTATGATGTGGCAAAAATTGCCACATCTAAAATTTTGAAGCGTCACAGAATACCTTCTGCTCTGTCCGGTGATCTTAACGGTGAACAGATCTCCGAAATTGAGTTAGCTTCCAGACATAAAGAATGGTCACAAAGTTGAGGGCCCTGAGCCGGCTAATATTAAAATTTTGGTTTCCTAATCCACTTAGCTGCTTTTATTATTTGTCATTTATAATCGGATGTTGAGGTGCAAACACATTTTTGGCCTTTGTGTATTGTAAGCGATTCAGAGTATTAAAACCAAAAAGCGTTCTGTTGTTTGGTAAA\n>XM_037730203.1 PREDICTED: Cebus imitator glycosylphosphatidylinositol specific phospholipase D1 (GPLD1), transcript variant X3, mRNA \nGAGACTTGGTTTCCTGGGTCAGTGACCTGCTTAGAGGGAAGCAGCGGGTCTGCGCCTGGATTTCGGAGTCACGGTGCTGCTGCAGCTCTGAGCATTCCCACGTCGCCAGAGAGCCCGTGGGGAAGGAGAGCATGTCTGCTTTCAGGTTGTGGCCGGGCCTGCTGATCGTGCTGGGTTCTCTCTGCCGTAGAGGTTCATCCTGTGGCATTTCAACGCACGTAGAAATAGGACACAGAGCGCTGGAGTTTCTTCAGCTTCATAAAGGGCGTGTTAACTACAAAGAGCTGTTGCTAGAACACCAGGATGCATATCAGGCTGGAACCGTGTTTCCTGACTGCTTTTACCCTGGCATCTGCAAAGGAGGAAAATTCCATGATGTGTCTGAGAGTACTCACTGGACTCCGTTTCTTAATGCAAGCATTCATTACATCCGAGAGAACTATCCTCTTCCCTGGGAGAAGGACACAGAGAAATTGGTAGCTTTCTTGTTTGGAATTACCTCTCACATGGTGGCAGATGTCAGCTGGCATAGCCTGGGCATTGAACAAGGATTCCTTAGGACCATGGGAGCTATTGATTTTCACGGCTCCTATTCTGAGGCTCACTCGGCTGGTGATTTTGGAGGAGATGTGTTGAGCCAGTTTGAATTTAATTTTAATTACCTTGCACGACGCTGGTATGTGCCAGTCAAAGACTTACTGGGAATTTATGAGAAACTCTATGGTCAGAAAGTCATCACCGAACGTGTAATTGTTGACTGTTCACATATCCAGTTCTTAGAAATGTACGGTGAGATGCTAGCTGTTTCCAAGCTGTATCCCAGTTACTCTACAAAGTCCCCGTTTTTGGTGGAACAATTCCAAGAGTATTTTCTTGGAGGACTGGATGATATGGCGTTTTGGTCCACGAATATTTACAATCTAACAAGCTTCATGTTGGAGAATGGGACCAGTGACTGCAGTCTACCTGAGAACCCTCTATTCATTGCATGTGGCGGCCAGCAAAACCACACCCAAGGCTCGAAAATGCAGAAAAATGATTTTCACAGGAATTTCACTACATCCCTAACTAAGAATACTGAGAGGAATATAA
ACTATACTGAAAGAGGAGTGTTCTTTAGTGTAGATTCCTGGACCCCGGATTCTGTGTCCTTTATGTACAAGGCGTTGGAAAGGAACATCAGGACCATGTTCGCAGGTGACTCTGAGCTGTCACAGAAGCACGTCTCCAGCCCCTTGGCCTCTTACTACTTGTCGCTTCCTTATGCAAGGCTTGGCTGGGCAATGACCTCAGCTGACCTCAACCAGGATGGGCATGGCGACCTCGTGGTGGGCGCACCAGGGTACAGCCGCCCCGGCCACGTCCATGTCGGGCGCGTGTACCTCCTCTACGGCAGTGGCCTGGGCCTGCCCCCCATCGACCTGGACCTGGACCAGGAGGCGCACGGGATCCTTGAAGGCTTCCAGCCCTCAGGTCGGTTTGGCTCGGCCTTGGCGGTGTTGGACTTTAACCAAGATGGCGTGCCTGACCTGGCTGTGGGCGCTCCCTCCGTGGGCTCCAACCAGCTCACCTACAAAGGTGCCGTGTATGTCTACTTTGGTTCCAAGCAAGGAAGAATGTCTTCTGCCCCTAACATCACCATCTCTTGCCAGGACGTCTACTGTAACTTGGGCTGGACTCTGCTGGCTGCAGATGTGAATGGAGACAGTGAGCCTGATCTGGTGATTGGCTCCCCCTTTGCCCCAGGCAGAGGGAAGCAGAAGGGAATGGTGGCTGCGTTTTATTCCGGCCCCAGCCACAGCGACACAGAAAAACTGAACGTGGAGGCGGCCAACTGGACGGTAAGAGGCGAGGAAGACTTTGCCTGGTTGGGATACTCCCTTCACAGCGTCACCGTGGACAACAGAACCTTGCTGCTGGTGGGGAGCCCCACCTGGAGGAATGCCAGCAGGCTGGGCCATTTGTTACGCATCCGAGATGAGAAAAAGAGCCTTGGGAGGGTGTATGGCTACTTCCCACCAAACAGCGAGAGCTCGTTTACCATTTCTGGAGACAAGGCAATGGGGAAACTGGGTACTTCCCTGTCCAGTGGCCGTGTGCTGATGAACGGGACTCTGACGCAGGTGCTGCTGGTTGGGGCCCCAACACACGATGACGTGTCTAAGATGGCATTCCTGACCATGACCCTGCACCAGGGCGGAGCCACTCGGATGTATGCGCTCACACCCGCTGCACAGCCCCCGCTGCTCAGCACCTTCAGTGGAGACCGCCGCTTCTCTCGATTTGGTGGCGTTCTGCACTTGAGCGACCTGGATAACGATGGCTTAGATGAAATCATCATGGCAGCCCCCCTGAGGATAGCAGATGTAACCTCTGGACTGCTTGGGGGAGAAGATGGCCGAGTTTATGTATATAATGGCAAAGAGACCACCCTTGGTGACGTGACAGGCAAATGCAAATCATGGATAACTCCATGTCCAGAAGAAAAGGCCCAATATGTATTGATTTCTCCCGAAAACCAAGTCGTCATTGCTGCTGGAAGGAGTTCTTTGGGAGCCCGACTCTCTGGGGCACTTCATGTCTACAGCCTTGGCTCAGATTGAAGATTTCCCTGCACCTCTCCACTCTGCCCCCTTCTCTCAAGCTGAATCACATCCATGGTGAGCATTTTGGTGGACAGAGTGGCATATCCAGTGGAGCTATGGTAGATCCT\n>XM_003291721.1 Dictyostelium purpureum hypothetical protein, mRNA 
\nATGAATGAGCTATTATCATCTCTAATTAACTTTAGTGTAAAAGAAGAATTAAAAAACAGTAGTAATATTAGTGATAGATTATTATATATAGTTTGGAATAATATATTTTTAAGAAATGAAATTCATAAACATATTTTAAAGTTTATTGAATATAGTGTTGTAGATTTTGAAATATCACAATATGACCAGTTTAAAGATAAATCATATATAACAACACTTAATTGGTTTGGTGATACACTACCTGATAAAAATGAATTTCCACCATTTTTGACAAGTTTATATTTGCCCCATTTTTCTGAAAAGTTAACTCCAACAACTTTACCAAATACAATAACTACACTCACGCTCGGTCATTATTTTAACCAAGTAGTTCTACCCGGCACATTACCAAATAGTCTCACAACACTCACATTCGGTGATGATTTTAACCAAGTAATTCTACCTGACACATTACCAAATAGTCTCACAACACTCACATTCGGTTATAATTTTAACCAAGTAATTCTACCTGACACATTACCAAATAGTCTCACAACACTCACATTTGGTTATAATTTTAACCAAGTAGTTCCACCTGGTACATTACCAAATAGTCTCACAACAATCACATTCGGTCATTTTTTTAACCATATAGTTCCACCTGGCACATTACCAAATAGTCTCACAACACTCACATTCCGTAGTAAATTTAACCAAGTAGTTTTACCCGGCACATTACCAAATAGTCTCACACAACTCACATTCGGTTATTATTTTGACCAAGTAGTTCTACCCGGCACATTACCAAATAGTCTCACAACACTCACATTCGGTCATCGTTTTGACCAAGTAGTTCTACCCGGCACATTACCAAATAATCTCACAACACTCACATTCGATAAAGCTTTTAACCAAGTAGTTCCACCTGGCACATTACCAAATAGTCTCACAACACTCACATTCAGTTATTTTTTTAGACAAGTAGTTTTACCCGGCACATTACCAAATAGTCTCACAACACTCACATTCGGTCATCATTTTAACCAAGTAGTTCTTCCCGGCACATTACCAAATAGTCTCACAACACTCACATTCGGTAATTGTTTTGACCAAGTAGTTCTACCCGGCACATTACCAAATAGTCTCACAACACTCACATTCGATCATCATTTTAACCAAGTAGTTCCACCTGGCGCATTACCAAATAGTCTCACAACACTCACATTCGGTTTTTTTTTTAACCAAGTAGTTTTACCCGGCACATTACCAAATCGTCTCACAACACTCACATTCGGTGGTAAATTTAACCAAGTAGTTCTACCCGACACATTACCAAATAGTCTCACAACACTCAGATTCGGTTATGAATTTAACCAAGTAGTTCCACCCGACACATTTCCAAATAGTCTCACAACACTCACATTCGGTCATCGTTTTAACCAAGTAGTTCTACCCGGCACATTACCAAATAGTCTCACAACACTCACATTCGGTTATGATTTTAACCAAGTAGTTCTACCCGGCACATTTCCAAATAGTCTCACAACACTCACATTCGGTAATGATTTTAACCAAGTAGTTTTACCCGGCACATTACCAAATAGTCTCACAACACTCACATTCGGTTATGATTTTAACCAAGTAGTTCCACCTGGCACATTACCAAATAGTCTCACAACACTCACATTCGGTCATCGTTTTAACCAAGTAGTTCTACCCGGCACATTACCAAATAGTCTCACAACACTCACATTCGGTGATGATTTTAACCAAGTAATTCTACCTGACACATTACCAAATAGTCTCACAACACTCACATTCGATAATGAATTTAACCAAGTAGTTCTTCCCGGCACATTACCAAATAGTCTCACAACACTCACATTCGGTTATTGTTTTAACCAAGTAGTTTTACCCGGCACATTACCAAATAATCTCACAACACTCACATTCGGAACTAAATTTAACCAAGTAGTTCCACCGGGCTCATTACCAAATAGTCTCACAACACTCACATTC
GGTCGTGATTTTAACCAAGTAATTCTACCTGGTACATTACCAAATAATCTCACATCAAAACTCTCAAAGATTGTTTAA\n>HQ115669.1 Trichoderma koningiopsis isolate NG_05 18S ribosomal RNA gene, partial sequence; internal transcribed spacer 1, 5.8S ribosomal RNA gene, and internal transcribed spacer 2, complete sequence; and 28S ribosomal RNA gene, partial sequence \nAGGGATCATTACCGAGTTTACAACTCCCAAACCCAATGTGAACCATACCAAACTGTTGCCTCGGCGGGGTCACGCCCCGGGTGCGTCGCAGCCCCGGAACCAGGCGCCCGCCGGAGGGACCAACCAAACTCTTTCTGTAGTCCCCTCGCGGACGTTATTTCTTACAGCTCTGAGCAAAAATTCAAAATGAATCAAAACTTTCAACAACGGATCTCTTGGTTCTGGCATCGATGAAGAACGCAGCGAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTCTGAACGCACATTGCGCCCGCCAGTATTCTGGCGGGCATGCCTGTCCGAGCGTCATTTCAACCCTCGAACCCCTCCGGGGGGTCGGCGTTGGGGATCGGGAACCCCTAAGACGGGATCCCGGCCCCGAAATACAGTGGCGGTCTCGCCGCAGCCTCTCCTGCGCAGTAGTTTGCACAACTCGCACCGGGAGCGCGGCGCGTCCACGTCCGTAAAACACCCAACTTCTGAAATGTTGACCTCGGATCAGGTAGGAATACCCGCTGAACTTAA\n>XM_026575105.1 PREDICTED: Papaver somniferum aspartic proteinase CDR1-like (LOC113328005), mRNA \nATGAGTCGGAAAAATGTTGTTTCTTCTTCCATCAATTTTGTAACAGCAGTTGTTTATGTTTCATTTCTACTAAACTTGGCCACTGCAGTTAAACCAAGAGGGTTTAGCATGAAGATGATTCGCAGCGACTCTAAAAAATCACCTATGCATCTAAGGTATGCTAATTTAACTCAAGAAGAAAGATTTCAAAGACTCGTCGAACAATCCAAAGCTCGAGCGCGTTACTTTGCATCCGCAAGAGCTGCTGCTTATAATAGAAGCATCTCCATGAATCCCGATATTGCACGTATACGTCTAAAATACATGGAGAACAGACACTATTACATCGGTGAGGTAGGTATAGACGGGCTCTGTACGTACAAAGAAGGATACATTTCCGGACCAAAAATATCTGGTCATCTTGCTTATGAAACACTCACTATGAAGTCAAACACCGGTGCCCTTGGAAGTGTTGAAAAAATAGTCATGGGCTGCGGTATTGATCAAAGGAATTTCGGACCATTATTTGGTGTTCCTGAGATTCGTGAAGGCATTGCGGATTCACACACGTATTTAAGATTTGGTTTCGACACAATAATTGAAGAAGGACCTCCTAATGAAATACTTACAACTCCAATAATTCAAGACCCGAACTTCGGGACGCCTTACCATTTGATTCTTAAGGATATCAGTATAGGTAACAGAAGCGTAGGGTTTCAACAAAGTGATTTCGAGCTAAAGCCGGATGGAACTGGTGGGACTATCATAGATTCAGGGGCTCCATTTACCACCATGAGGATGCGCCATTTTGAAAGAGTTGAGCAAGTGCTGGTAGAATATTTTACAGATTCTGGTATTCGTCCTGCTGATCCTGAACCTGGCAGAGATTTCGATACTTGTTTTGATATACCGGTCGATTTCACTGCGTTTCCGGTGATGACATTTCATTTTCAGGATGCGGATTTTGTTATTCAACACTGGTCTGCCTATTACATACAAGAGCGCTTGCTATGTTTTGGTATCAT
TGGCTTGAATGACGACGATCCAAATGATGTTACTCTTGGAGCTATGCAACAAGCTAATAAAAGGATTTTACACGATCTTCATGCCAAGGTACTCAAGTTTACTGATGAGAGATGCGATGATGATGGTTCGTGA\n>XM_050131643.1 PREDICTED: Microtus fortis GEM interacting protein (LOC126494357), transcript variant X3, mRNA \nACCGCTCCTTAGCTCTTAACCCAGGGAAGTCCCACTTACTCCTGAGCTACCTGACAGCCGGGGAAGAAATCCTGGCAAGGGAAGGACAGGAAAGGTCTGTGCACCTTGGAGACTCCTGAAGCGCACAGGGCGCACGACTCCTGCCCCAACCCTCCGATTGCCCTGCAGAGCCGGCACCCCGGATGCCTGGGGGGAAGGGGCCCAGGAACGGGAAGTGGCCGCTTCTGCTTATTATACTATGGATGGGGGCAGGGTGTCAGGGCCAGGATCCCTGCAGGGCACCCCGGGCGGGGGTGGGGGCATAAAGCTAGAAAGTGGCGGCAGCAGAATTGTGACTAGGTCTAGGTTATGTTTCCAGCTGTCTTTGTGTGTGTGTGTGTCATTCAGTCCGGTTCCTCATGGTTTCAGCTGTACTCGCGTGTGTTTATGCCGCAGGCTAAGTGCCTGTGCGTCCCACGTGCGGTCCCATCTGTCTGCCCTGGGGTCCATGTGGCTCCATTGTCAAGCCAGGCCTCTACTCCATCACTCATGTGGCAGCTGCATCTGTATTCTTGCTTTGCCTATGGGTCCCTGCCTGTGTGGGTGTCTCTGTGACTGTGAGCAACCGCTTCTCTGATTTTGCCGGGGCCCATCTGTCTGGTCTGAAACAACCCCTCTGAAGCTCACTGTCCCGTCCCACACTAGTCTTAGATCAAAACTCACTTAGGTCTCTGTTTCTATCTCGCTTTCTCCCTCTTCCTTCCATCTCTGCTTGAGAGTGGTTGAGGTGCTTTGCTGCCTCCAAGGGTAGAGGGAGGGAGACAGTGAGTGGTTGGTTCATGTTTTCTTGCACTTCTCTCCCCCCAGAGCTGACCCCAGCTCCTGAGGGCAGGAAGAGGTACAGTGACATCTTCCAGAGCCTGGACAACCTGGAGATATCGTTGGGGAACGTGGCTTTCGACCCCTTGGCTGGAGACCTTGTACTCAGACAGGACCTGGAGCCTGACAAGACTGCCACAGCCGCGGTGAGCAGTGAAGCCAGATGGAGTGATCCCTCCCCAGAGGGTCCCGTACCCCTCACAGAGGAAGAACTAGATTTGCGACTCACTCGGACGAACGGTGGTGTGGATGCTGCCCTGGAGTATGCCAAGGCATGGAGCCGCTATGCCAAGGAGTTGCTGGCCTGGACAGACAAGAGGGCCAACTACGAGCTGGAGTTTGCTAAGAGTGTCATGAAGATCGCTGAGGCCGGCAAGGTGTCCATTCTCCAGCAGAGCCAAATGCCACTCCAGTACATCTACACCTTGTTTCTGGAGCATGACCTCAGCCTGGGAGCCCTGGCCGTGGAAACGCTGGCCCAGCAGAAGAGAGACTACTACCAGCCTTTAGCAGCCAAAAGGATGGAGATTGAGAAGTGGAGAAAGGAATTCAAGGAGCAGTGGCTGAAGGAGCAGAAACGCATGAATGAGGCGGTGCAGGCACTACGGCGCACCCGGCTCCAGTACATTCAACGCAGAGAGGACCTTTGGGCACGTTCCCAGGGGTCCCCTGAGGATCCTCCTCCCCAGGCATCTCCCGGATCCAGCAAGCAGCAGGAGCGCAGACGACGCTCCCGAGAGGAGGCACAGGCCAAGGCACAGGAGGCAGAGGCTTTGTACCAGGCCTGCATCCGAGAGGCCAATACGCGTCAGCAGGATCTGGAAACCACCAAGCGGCGGATAGTGTCACATGTACGCAAACTGGTGTTGCAAGGAGACGAAGTACTTAGGCGGG
TGACGCTGGGCCTGTTTGAGCTGCGAGGGGCACAGGCAGAGAGAGGACCTCGAGCCTTCTCAGCTCTGGCTGAGTGCTGTGCGCCCTTTGAGCCTGGCCAGCGCTACCAGGAGTTTGTGCGGGCACTGCAGCCTGAGGCCCCGCCACCGCCGTCTCCCGCCTTCTGCTTCCAGGAGTTCACGCCTGTGCTACACAGTTCCCCTCAGGACACAAAAAAGAAGTTTTTGGGGCCTCCACATGCCAGGCTGGAGGAGGGTTACTCTGAGCCTGGCCCTTGGGAGGATACCAGCTCAGGCAGCCAGGGCCCCACTCCAGTCAGTGATGTGGACAGTGTAGGTGGTGGCAATGAATCCCAGTCCCTGGATTCCCCTACTTCCAGCCCAGGTGCTGCTACTCGGCGGCTTGTGAAGGTGTCGTCTATAAGCACTGAGTCCTCTGATGACTTTGAGGAACGAGACCCTGATCTGGGGGATGGGATGGAGAATGGACTAGGCAGCCCCTTCAGGAAGTGGACACTGTCCACAGCTGCTCAGACCCACCGGCTACGGCGGCTGCGTGGTCCAGCCAAGTGCAGAGAATGTGAAGCCTTCATGGTCAGCGGGACAGAGTGTGAAGAGTGCTTTTTGACCTGTCACAAGCGCTGTCTGGAGACCCTCCTCATCCTTTGTGGACACCGACGGCTTCCAGCCCGGATGCCTCTCTTTGGAGTTGACTTCCTACAACTCCCCAGAGACTTCCCTGAGGAGGTGCCCTTTGTGGTTACCCGGTGCACAGCTGAGATAGAACATCGCGCCCTGGGCCTGCAGGGTATCTATCGGGTCAGTGGGTCTCGAGTGCGTGTGGAACGACTGTGCCAGGCCTTTGAGAATGGCCGAGTGCTGGTTGAACTGTCGGGAAACTCTCCTCATGATATCACCAGTGTCCTCAAGCGATTTCTTCAAGAGCTCACTGATCCCGTGGTCCCCTTCCACCTCTACGACGCCTTCATCTCTCTGGCAAAGACCCTGCATGCAGACCCCGGGGACGACCCTGGAACCCCCAGCCCCAGCCCTGAGATTATCCGCTCGCTGAGGACCCTCTTGGTGCAGCTGCCTCCCTCTAACTACAGCACTGTGCGGCACCTGGTAGCCCATCTGTTCAGGGTGGCTGCTCGTTTTGAAGAAAACAAGATGTCTGCCAACAACTTGGGAATTGTATTTGGGCCTACGCTGCTGCGGCCACCAGATGGACCCAGGGCCCCCGGAGTCAGCCCTGTGGCCTGTCTGCTGGACTCTAGTCACCAGGCTCAGCTTGTTGAATTCCTCATTGTGCACTATGAGCAGATCTTTGGAATGGATGAGCTCCCTCTGGCCTCTGAGCCCCTGACCCAAGATCCTGGCCTGGCTCCCACACTCCTCGAATCCAGTCCTCAGCACCCAGCCCCACTTCTTGCCCAAGACATACAACCCCTGACCATAGCCTCAGACTGCAGCCCAGATCCCAAACTCCACAGTGCCCCGGAGAAGTGTCTGGAGGTCACACCTTCTGAGGTAATTGCAACTCTGCAGAGGGACCAAAGGGAGGAGAAGGAGGTGGAAAACACCAGAGATGGGGCAGGGGAAGGGTCCGGCCACAACCCTGAGGACTTGCTCCTGGGAACACAATCCCGGGGCCACTTCAGTCGCCAGCCAGTGAAGTATTCACGGGGAGGTGTACGGCCAGTCACTCATCAACTGTCCAGCTTGGCTCTGGTAGCTTCCAAACTGTGTGAGGAGACTCCTGTTACTGTTTCAACAGTGCACCGAGGTAGTTTGAGGGGACGAAGCCTGGGCCCTGCTGCTGCCTCCCCTGAAGGCAGTCCCCTGCGCCGAAACCCTCTGCCCAAGCACTTTGAGATCACCCAGGAGACAGCCCGGCTACTCTCCAAGCTGGACACTGAGGCTATGTCCAGTGCTACCTGCTGTGCTGACACTGAGCCTGAGGGGTCTGAGGAACATCTCTGACCACCCACCATCCCAGGA
GACTCAGGACTGAGCTGATGACCCCATATGTCTCTCTTCTTGCCCCACCTGGTAACCAGACCAATTTAGTGGGGTGTGGGGAGAGACAGGTTACCAGAGAGTTGGGTAAGGAAGACCACCCATCTTGGGAAGTCCTCACCATCTCCCTGCCAGAGGAGGTTAAAACGGCCAGACAACACAGGTGCACAGGCAAATCAGGATCAATGACTCAGTTGAATCAGTATTCAATGGTCAGTACAGGTCCGAAGATCCTTGGGTTACCCCAGTCACAGCTGTCTGACTACTCTGATCATAAGAGCTCCTGGTTCTACCTGAGTAGGTGGGTGTGGTTTAGCCCTCACCTGCTTTTATATCTTCCTGGGTTTGGTTTGTTTGTTTGTTTGTTTTGAGATGGGCTCTATTGTAGCTCTGGCTGATCTGGAACTCCCTATGTAAACCAGGTTGTCATAGAACTCACAGAAATTCCCTCCTTTTAAGTGCTGGCCAAATCTGGATTCTTATAACCTCTGAATAAAGCCATGTCCTGATTGAATACAA\n>MH278833.1 Uncultured bacterium clone DEN-OTU-710745 16S ribosomal RNA gene, partial sequence \nACGGAGGATCCAAGCGTTATCCGGAATCATTGGGTTTAAAGGGTCCGTAGGCGGTCTTATAAGTCAGTGGTGAAATCTCCCCGCTCAACGGGGAAACGGCCATTGATACTGTAGGACTTGAATTATTAGGAAGTAACTAGAATATGTAGTGTAGCGGTGAAATGCTTAGAGATTACATGGAATACCAATTGCGAAGGCAGGTTACTACTAATGGATTGACGCTGATGGACGAAAGCGTGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGGATACTAGCTGTTGGGCGCAAGTTCAGTGGCTAAGCGAAAGTGATAAGTATCCCACCTGGGGAGTACGTTCGCAAGAATG\n>XM_020557668.1 PREDICTED: Prunus persica putative disease resistance protein RGA3 (LOC18785927), transcript variant X4, mRNA 
\nTCTCTTCAATTATTATATCTTTTTACGCCAGCCATATGCGCACCTTCTTGTCTACAAATCCCTCACAACCTTCTCAAAGATACATTGCGTCCTCAATTTTGCTCTACTTTTCTAACCCAAACTAAGCATTCTGCTCTCTGTCTTGAGCAACACTGAAAGAAAATATGGCTGCAGAGTTTCTTACTTTTGGTGCTGAGGGAATTCTGACGAGGGTGGCTTCACTTGCAGAGCAAGAACTCAGTCTTCTCTGGGGATTCAAAGGAGAGCTAACAACTCTACGAGACTCATTATTCAAGTTGGAAGCTATGCTCAGAGATGCACAACATTTACAAGTTCGGGGTGAGAGGGTGGAGATGTGGGTGAAGGATCTGGAAGGCATAGCTCATGAAGCAGATGATGTGTTGGATGAATATGAATATGAACTTCTCCGGCGGAAAGTGGAGATCCAAAATCAGATCAAGAACAAGGTGCTCAACTTCTTTTCACGCCACAATCCCATTGCATTTCGTCGCAAAATGGCACATAAAATTAAAAACATCAATGCATCTTTGGCAAACCTGAAGAATGAGGCAGCTAGTATTGGACTGGTTGATAGGTCAACACTGGTCAATGCAACATCTCATGATATTGGAGGACTTGACAGGGAAACCGTCTCAAACTTTGATCAAGATGAAAAGTACATTGTTGGAAGGAAGGAGGTTGCGTCGGACATAGTTACAACCCTGATCAACTCTGGCAAGAACCAAGACAATTGTCTTTCTGTTATGGCCATTGTGGCGATGGGAGGCTTGGGCAAGACAACTTTGGCTAAATCTGTATATAATGATCCTGAGATAGGTAGACACTTCGATCAAAAAATATGGGTATGTGTATCTACTCCTTTTGAAGTCAAAAAGATTTTAAGCGAGATCTTGGAATGTCTTAAACCAGAGAAAGCTGGGATAAAGGGTAAAGCAACAATATGTGAAAACCTGCAAGAAGATTTGAAAGGGAAGACATATCTTCTCGTGCTTGACGATGTTTGGAACGACGATCGTAGCAAATGGGACGATTTGATGAGTTGCTTGTTGAATGCTACAAGCACTAAAGCAAGCAAAATCCTTGTCACTACTCGCAATGTGAGTGTTTCATCAATTGTACAAACACTTCCTACATGTGTTCTGGGAAAATTATCGGAGGATCAATGCTGGTGCATATTGAAGTATAAAGCGTTTCTAGATGCGAGTGTTGTTTTGACTGAAGATCAAGAGAGAATCGGAAGGGAGATTGCCAAAAAGTGTGCAGGTGTACCATTAGTGGCAAAGGTTTTGGGAAATATGATGCGTTCTCAAGATATTGATGGATGTCGGTCAATTCTAGAAAGTAGAATATGGGATTTACCAGAAGGAGAAGAAAGAATCTTGTCGGTTTTGAAGTTGAGTTTTGATAAATTGAAATCACCATATTTGAAACAATGTTTTGCATATTGCTCAATGTTTGTCAAAGATTTCGAAATTGAAAAGGATGACTTGATCCAACTTTGGATGGCTCAAGGATTGCTTTACCCTTCTCCTCCCAACAGACGTAATCTAGAGATGGAGGATATAGGAAATGAATATTTTAATATTCTATTGAACAACTCTTTCTTTCAAGACGTTGAAAAGGATTGGTATGGTAATATTACAAGTTGCAAAATGCACGACCTTGTGCATGATCTCGCAGAACTTGTGTCAAAAACGAAGAGTAATGACTCCAATGAGACTCGACATATGGCACATATTCCTACCTCAGTGCTACATGGAGTTCCAGAAAGAGGTGCTCATAAATTGCGCTCACTTTTCTTGAATGTTGAAGTTCTTGGTGATATCTTACCAAACTTTAGAGGTTTGCGTGTCTTAAATTTATATCAAACTTATATGAAGGAGTTGCCAATTGCAATTGGAAAGTTGAAACACTTGAGGTATCTGGATGTTTCCTATACAAAGATCAAAGCACTCCCCAAATCCATTGGAAAGCTTT
ATAATCTACAAACATTAAGAATGAAAGAGGTCGAGCTTGAAGAGTTTCCAAAAGAACTGCAAAATTTGATAAACTTGAGACATATTTATTTTTATCCGTATGGTATGAAATTTCCAGCAAGGATAGGGCGATTGACTAATCTCCGAACATTAAAATATTTCATCGTGGGTAAGGAGACAGGTCGTGGAATAGAGGAGCTGGCTGGCTTAAACTTGTTAAAAGGCAGATTAACTATCTATAATCTAGAGCACGTGAGAGATGGAGAAGAAGCCAAGAAAGCAAAATTAGTGAAGAAGACAAACATAAGCAAGTTAAAGTTTCAGTGGGCAGAGGATAGGTCAAGCATCACCAATGATGAAGAGGTACTAGAAGGCCTTCAACCACACCCTAGTAAACTGGAATTTTTACAATTTTTCAACTTCATGGGTGATAAATGTCCATCATGGATCATGAGTAGTTCGTTTCCTGTATTGAAAAGGTTAAAGATTTACAATGCTAGGAACCTAACTGAATGGCCAGAAAGTGGGATCGTGGTCTTTCCTTGTCTCGAGGAGCTGGTTTTGAGGAATTGTGATAAATTGAGAAGTGCTCCTAGCCATTTCCCATCTCTCAAGACGTTGGAGATAGATTCCATGGGTAGCGGCATGCCAATAGCAAACATAAGCAATAAGCTGACCACTCTTACTTCGCTCGCAATAAGGAACATAAGCGGACTTGTTTCTCTGCCAGAAGGGATGCTTAAAAACAACAAGAATCTTGCATACTTGGAGATAAAAGATTGTCAGGAGCTAACTTGTATTGCTCTTGATGTAGTTGGCTCTTGCGCACTTCTTGAGTCAGTGCGTATTTCCAAGTGTCCTATTCTTGCTTATTTTCCTGATGGGCTACTCACAACATCTCTTAAGAACCTGATTGTGGAAGATTGCGGTAGTCTAGAGTTGATTCCAGTTACACAGCCCCTCTCATCCCTCTGTGAATTAAAGATTACAGGCTGTCAGGAGTTGTCAAGTCTACCGAGTGGGTTAGATTATTATACCTCTCTTCAGGAGTTGGCAATATCAAATTGTGATATGCTAACATCCGCTTTGATTCACAGCCTCCCATCCCTCCGGAAGTTGTCTATATTTCGTTGCAACAGGAGACCAAAGTTTGTTCCAAGTTTACTCGGCTTCACATGCCTTCGTGAATTGAGAATTAAAGATTCCCATGGATTGACAAGTCTGCCAATAGGGCTAGAATCATGTTCTTCTCTTGAGGTGTTGATAATAAGCAAGTTGCCGAATGTAGAATCTATTACAAGTTTAGACAACCTCACAAACCTCCATGAATTGGGGATATTTTCTTGCGATGGATTGAAAAGTCTACCCAATGGGTTAGCAATAACATCCTGCCTCACCCACTTGAAGACATTGGAAATCGGTGGCTTTTGGAAGGAGCTTGATTCATTCCCTGCTTTTCAGGTTACATCACAACTTGAAACATTGAAGTTATGGGGTTGGCCTAAGCTCAAGTCTCTGCCCGAGCAAATTCAACACTTGACTTCTCTAACATGTCTTGAAGTGCAATGCTTTGACGGAATGGAGGCTCTTCCAGAGTGGTTGAGAAACCTTACATCTCTTGAGTACCTGTATATACATCTTTGCAAGAATATGATGTATCTACCTACACTAGAAGCTATGCAATGTCTCACCAAATTAAAACGCATATTCATTTTGGATTGTCCCCTTCTAAAAGAGAGATGCAACAAGGAGAGCGGCTCAGAGTGGCCCAAGATTTCTCATATTCCACAAATATATGTTGACTGGGTACGGTGGCAGCTGCCAAATTCAATATAGTCTGAGAAAGTATCATCTTGAAATGAGAAATAGTTGAAAGTGGGCGAATTGTGGTCGAGAAAATGATTAAACTCAATTGCGTTTTTCCTTGAGACTGGTGTTGGTGTGGAGAGTTGATTGAAGCTATATATGCTACACATCATCACCATTGAAGAAAAGGTGTCC
ATTCCCTACAGCCTACAGCCTACAGCCTACAGCCTACAGGGTCTGTTGTTATTTGGGCATAATTTGGAGGTGGGTGGCTTTGCCTTACCTGAAGGAACATTTTTTGTAATGGGAGCAAACAGAGTCCAGGTATTCAAAAGCACTCCAATTTCTACAGTGACTGATGGGGGTAAATCCAACACAAGCCACCAACTCAAATGATCACAAAATCAAGACAGAAGTCACAGGCTGCTCAAATTTTGTGTGCCGATCCGAAGCGATTGTAGTTGGAATATTTTGGTAATATCCTTCTATTGATGTCCAGAGAAAACTATAAATTTATTCAAATTTTAGCATGGGTGTCCAAAGATGGATTTTGGGTGCAAGCGTGAGCTCACCAACATTTGAAGCACGAAGCCCAACAGCCCAAGAACCAGCAACTAAGTCCAACTTAGCCTATTGCTCCACTCTACCCCAACACCCCACTTTCTCTTTCCTTTTTTTTTTTTTATAATTTTTTTTAACTGTTGTAAAAGTGGAGTCCCCAAAATGCCCCCAAAATGCCTATAAATAAGGCTCCCTCCCATACTTGTAAATACACAATGAGATTGAGAAAACACACAGAAATAATGTGAAGAACAAACTCTCAATGAATGAGAAATCAGTTTTCTCCAATTTCTCTCTATCCCAATTCTCTCTCCATTTTCTTACTAGATTTATAACACATTATCAGCATGATTTCTCTATCTCTAAATTCAGAGACCCAACCCATCTCACCTTCCTCTGCTCTCTCATCCACACCGCAGCAGAGCTTTTCTTGAAAACCCAGAAACAACATAAATCCTGTCCGTACAGCAACCGAGCCATCTATGGGACACGGTGCTCCAGCTCACCAAGTCCGCTTAGGACAAGAACAGCGACCCGCTCCTCTGGGCGGTTCAGCACAGCAACAGCCTCAACTCGGCCGGCGTGGCCTTGCCCTCCGTCGAGCTCGCGCACCTCCTCGTCTCTCACATCTGCTGGGCCAATCACGTGCCCATCACATGGAAGTTCCTCGAGAAGGCCTTGACCGTCAAGATCGTATTGTGAACCAGCAAAAGAAAATCTTGAGAACCCAGTAAAGTGCGATGGGGGAGCTGGCAAGTCAGAAACATGTTCAGTTCATTGTATTAGTCGAAAAGAAGAAGGATTCTTTTGAGTCCGTGGTGATGGAGCATATAAGAATGAATGGGGCATATTGGGGTTTGACTGCTCTTGATCTTCTTGGGAAGCTGCACGTCAAGATGACTCAGGTGGGTTTGGTGGTAACATTGGGCATGACCCACATGTACTATATACCTTAAGTGCTGTGCAGGTTTTGGCCTTGTTCGACAAGCTTGATGTTCTGGATATTGAAAAGGTTGCGAGTTATACCACACACCAGCCTTCACATGTTTTGGATCAGCGGATGATGATGAGGTTTTCTCCAGTCGGCAAGGACAGAGAATAAAACAGTGTAAATGCAGAGGCAACTTTGACAGACCCCTGATGACGGCCACAATGATGAGCAGCACCCACCGATAAAGAAAAGCAAACCCACCGAAAAAAAAAAAAAATGCTAAAGTGCTGAAGCATCTTTCAATAAGAAAAGCAAACCCACCGAAAGAAAGAATAATAAATAAATATATTTTTAAAATTAAAAAAAAAAAAAAAAAAAAGATCACTCAGCCAAGGGCACTGACCCTAAAGTAAGCGATAAGGTCTCTGCTCCCTTATCTTCTC\n>AY964845.1 Eptatretus stoutii clone Es2VLRA.33 variable lymphocyte receptor A (VLRA) mRNA, complete cds 
\nTGGTGATAACCTCAAGGTGCTCTTTCAGAGATGATGGGTCCGGTCTTGGCCGCGTGTCTGCTCATCATTTTGTCCACTGCATGGATTTCCCAAGCGAACGGGGCAACCTGCAAAAAAGATGGTGGTGTTTGTACCTGCAACGACCAAACGAAGAACGTTGACTGCTCCAGCAAAGGGCTCACAGCCATTCCCAGCAATATCCCCTTGGAAACTACGCAACTGCATCTAAACCTCAACTCCCTGAGCAAGCTCTCACCCAAGGCGTTTCACAGCCTGAGCAGTTTAACATTCCTCGATTTGAGTTATAATCAACTGCAAGCTCTCCCTGCTGGGGTGTTTGACCAATTGAAGAATCTTGAAACACTATACCTGCTTCAAAACCAGCTCAAGTCTCTCCCACAAGGGATATTTGATAAACTCACCAAGATCACCTACTTGGACCTGGAAGGCAACAAGCTGCAGAGCCTATCACATGGAGTGTTTGACCACCTCACCAAACTCACAATTTTATGGCTGAATACCAACCAGCTGAAGAGTGTTCCTGAAGGAGCTTTTAACTTTCTGGAGAAACTGACACGGCTACAGCTGCAAAGCAACCCCTGGGACTGCACGTGCAACGACATTCTCTACATGGCCAAATGGCTAAAGAAAAAGCAAGACGGGGGTCTTGGGGGTGTCGACACGGCAGGCTGTGAGGAAGGAGGCAAAGCCGTCTTAGAAATCACGGAAGAGGAAGCGGCAGAAGATTGCGTCTATCCAAATACCACAACAGCGATACCGACAACAATTATTACGACACTGGCATCAAGTAATGACGATGATATACCCGAGCTGCCAGTGCCGCAAGAAAACTTTCAGAAATTCTTGGGATACCAAGAGCCAGACCATCTGCCCACCCAACCACAGTGCTTGATGTCCATTTCTGGATACCTCGGCCTCATGATGTTTTTCGTGCTCATTTCTGCTGCCATTTTGTACGTCATCCACTTTCTCAAGAAGGCCTGAACCAGTGTCTCACTTGCC\n>XM_028621987.1 Apiotrichum porosum hypothetical protein (EHS24_006566), partial mRNA 
\nATGGCGACCGCTGCCCCGCTTGTCAAGCATGCAGCCTCGCTGCTTCGCCCTGGCCACTCAAACTGTGTGGCCTTTCCTGACATTCACCAACCGGGACTGTCTTTCAGCCTTGTGCCGAGGGCCGCGACTCAGTGGCACGACGAGGACTGGTTCATGGGCGGGCTGAACTACCACCTTGCTGTCACTTTTGATGATGGGGTTTGCTGGCTCGCTCGAATTCGCCAGAAGAATGGCAACCCGCGCAAGCTCCAGTCCCTCGTCTCAGAGTTTGTCACCCTCAAAGCCTTGAACCGCGCCTGCCCCGAGTTTGTTCCCAATGTCTGGATGCCACAGGCGTCACCCTTGGGTCCCCCATTCTTCTTCATGGAGCACTTCAAGGGGTCCAACAGTCGCCACCTGTTCCCCCGATCCGGTGCTCGCCCTGTCGAGTCCCAGACCATCGTTTCCGACATGGCCACCTTTCTCATCCAGCTGAGCTCGCTGGAAATCCGCGGCGACATTGGATCTCTTACTGCCAGCAGCGCGGTCGTCGACGCCGCAACCGACCTCGAGCCAGAGCCAGTTGTTGGGCCCTTTGAACATTGGGACTATTGCATTTCGAACGGACTGACGACGTTGGGGCCGTTCCGCACCAGCCGTGATGCGTGGGTGGCAAAGATCGACGCCGTCGTGCTTGCACTCGAAAGGGGGCTGTTTGCGATCAATGGCGGGCACCTACTGCATGTGTATCTCGTCCATCTGGAAATGCGTGCTCTGGTCAACGCGTGCGAGGAGATGGCTGTGCCGTGCGGTCCCGGCGACGGCGAGCAGCCGACGTTCATCACACATGCCGATTCCAAAAACCACCTGCTTGTCACAGACGACGGCCATCTGCGCGCAGTCATTGATTGGGAAGGTGCGTACACCGCTCCATTTGCCGAGGCGTTCGCTGCTCCGATGGGGTTTTACGATCAGCGCGGCTTCGTTCGGGGCAGTAACGAGCTCTCCACCGAAGAAGTCCTCCTCGCCGACATATTCCAGTCTCGCGGACGCAAAGACATGGCGCAGGCGGTACGCGGTGGGCGCAAGTACCACCGACTTGCGTTTCACCTCGGAACCCTTCAGCCGACTCTGGAGATGGTCAACGCACTCTATGACGCCTTTCTGGGTGAAGAATCGGCAAGTTGTATCAGGTTTGACTCGCTCTTCGAGTGGGAGGCCGCGGCGTTGCACAAGTTCTCACATGTCCCGGGCCTTGAACAGTTGGCAATTCCGCCGGGAGAGGGGGATGTCGCCTACTTGCGCTTCGCAGAGGTCGAGCCAGACGCAAATTGGTGCAAGGTCGTCACTGTGAAGGACGCCTCGTAG\n>XM_035908051.1 PREDICTED: Neolamprologus brichardi nuclear GTPase SLIP-GC-like (LOC102787354), mRNA 
\nTCTGTGCTAGAGTCCGCTCGTTCACCTCGACAGGATCAGCAATTAAAATTTATCTTTCAGTTTCTATTCTTGGTCATGGATGATTTTGTGCGAAACAAACTGACTGAATGGAAACTAAGTGACTGGATTGATGCATTTGAAGCTCAAGAAATTGATGAGGAAAGTCTGTATCATCTCAATGATCAGGAAATTGATCAATTGATCACAAAAGCTGGACCTAGAGTAAAATTCAAGGAAAAACTAAAGATGTTAAAGGAAGAGCAAAATACAACCCAACCACAAAAAGAAGCAGTCAATACTTCTGGTCAAGATTTTCCATCCATAAGTGAAAGAGGAAAGAGAAAGTCAGATCATCTTCAGAGTGAGACCAGAAAATGGCAACCACCTCTTAAAAAACAATACAACTGTGCAGCAAGATCACAGTCAGAAACAGAAATACTGTCTGATGTCAAAAACATAATGAGATGTGTCAGTGAAGGACTACATGGCCGTGACAAGCTCAGTGCTTTCCTAAAAGATAAAATCAAGAATTTAGAGACAGAAAGGAGACACCTGGTTGGTGTCTTTGGTAAAACTGGGGCTGGAAAGAGCTCTTTAATCAATGCCATCATAAATAAGGAGGGCCTGTTGCCTTCTGGAAGTGTCAGTGCATGTACCTCAGTGATGATAAAGGTGGAGGCTACCAATGGATCAAAGTATGAGGCACACATCGAGTTCATTACAAAAGAGGATTGGGAAGATGAGGTGCAGTCACTAAAACAGGCTCTTGAAGACAATGACGACAACGATGATGATGATGGTGGTAATGATGATTTACTTGATCCTGACGGAAAGTTATCAGCGCTGTATGGAGAAGAGTGGAAAGAAAGATCCACTCACAGCCTCATGGACAACAAATATTTCATAGATATTCCAGAGTTTCGAACATCCAAGATAAAAATTTTGAAAAGTGACTCAGTGGGAGAGGTAGAGGTGAAGTGCAGTGAAAAGAGCATCCTTGGTCGTTCTGTTCGGCCAGTATGCAAACTGCAGTGGGTCCAAAAGAAAATCAAGAATGCAGTGAAGAATGAATTCAAAAAGCGGAAAACGATTACGAATCACTTCAGTGAGCATTGTTTCAAAGTCTTCACAGTGAGCTCCAAAGAGTTCCTCAAAGGGGAGAATGTAAATTCAGATGTCAATGAAATACTGAAACTCAAGGAAATTTTGAAAAATCTGAATGATGCTCATTCAGAGACATTAAACTATGTGTCTGGAGCTCACGGGATTCTGTCTTTGATTCAAGGGGCCAGAAGTGGAGAAGTGGTTGAACAAAAAAATGATGTGTTTGCAATCCTTGAGGGAAACTTGAGCATCCAACTTAATCAAGTCAAAAAAGCAATTGAAGACATTATAAAAGCTTTTGAACAATGCCTAAGTGAGGGAGTTGAAAAATCCAAAAAAGCATGTGAAAAAAAACTGAAGTCCTTCTTATACCCTAGTAAAAAAACAAACAGAGCTTTTCACATGACACTAAAGTCTGCAGTTAGGAATGATGGCATCCAGAAACCAAAAAAAGGAAAACCTAAAAACCTCAACATGATATTAGCGTCTTATTTGACTGAAAGCATTGATGAAAAATTCAGAGATACCTTCCCAAACAACATAAAATGTGGACATTTCAATGGAGCCATCGATGCGTTTTCACTCAGCACTGATTCACTGATTGAAAAGTACAAAGATGTCAAACTGCAACTGACATTTCTCCAGACAGAGGGGGAAAAAATGAAGACAAAGCTCAACAAAACCATCCTCACACAAAAGAAATTAATCTACAACAGTTTGACAGAGACAATCAAGGACAACATGAAAGAATGCTATAAAGAAGCAGCAGCATTTACAGGAAAAGGCACCCTGAAGAACATGAGGGACACTATTGAGAGACATGTGCACTCAAAGATGGACATGTTTGAGGAAGCAAAAAATGTCATGTTGGAGCTCTTGAACGATTTGAAGGAA
ACTGTCCTGAGGACACTGGAGAAAACCATGAAGGATTCCATTGAACACTCACTTAAGTCGGAGGCCTGCTCACTGCCAGGTAAACAGAATATATAA\n>XR_005829514.1 PREDICTED: Falco naumanni ATP binding cassette subfamily B member 11 (ABCB11), transcript variant X13, misc_RNA \nATGAAAACATGATGGGAGATGGTTGGGTACTTCACTGCCTAATTGAATAGATCCTTACAATTTGTTCTATAATACATAATTTTTCGCAGCGCAGCCACGGGACTTCCGATTTAAGTAACTAAACATCATGTCTGACCCTGTTGTTCTGCGTAGCATCAAGAGATTGGGAGAGGATAACAATGCTTTTGACTTGGATGGCAAATGTAACAGCTTCAAGAAATCAGAGAATTTCTATACGTATGAAGAACCTTTTGTAGAGAAGAAAACTGAAAAGTCACCAGAAAAGAAAGAAAATACTATTCGTATTGGCTTCTTTCAGCTGTTTCGATTTTCTTCATCTATGGAAATTTTAATGATGGCTGTTGGCAGTTTCTGTGCTATTGTTCATGGAGCAGCCCAGCCAGCTGTGCTACTTGTGTTTGGTGCAATGGCAGACACATTCATTGAATATGACATTGAAATGCAAGAGCTTAAAGACCCACTCAAGATATGTGTAAATAACACCATAGTGTGGATTAATGGTACTATTCATCAGAATGAAAAGAATGCCACAATAAGATGTGGGCTGCTGGACATTGAGCAAGAAATGACCAAGTTTGCAGGTTACTATGCAGGAATTGGTTGTGCTGTACTGGTGTTAGGATACATCCAAATCTGCTTTTGGGTTATGGCTGCAGCTCGTCAGATACAGAAAATGAGGAAAGCTTATTTCAGGAAAGTAATGCGAATGGATATAGGCTGGTTTGACTGTACATCTGTAGGAGAACTGAACACCCGCATTTCTGATGATGTTAACAAAATTAATGAGGCTATTGCTGACCAAGTAGCAATCTTTATCCAGCGCTTAACCACTTTTGTGTGTGGATTCTTACTGGGATTTGTCAGTGGCTGGAAATTGACCTTGGTTATCATTGCAGTCAGCCCTCTGCTTGGGGTTGGAGCAGCTGTCTATGGCTTGGCTGTGGCAAAACTAACAGGCCGAGAACTAAAGGCTTATGCAAAAGCTGGAGCTGTGGCTGATGAAGTGCTCTCATCCATCAGAACAGTGGCTGCTTTTGGTGGGGAGAAGAAAGAAGCTGAAAGATACGATAAGAATCTGGTGTTTGCTCAGCACTGGGGAATTCGAAAAGGAATAATAATGGGATTGTTCACAGGTTATATGTGGCTTATAATTTTCCTGTGTTATGCATTAGCCTTTTGGTATGGTTCTAAACTTGTCCTTGAAGAAGAAGAGTATTCACCTGGAACTCTTCTGCAGGTTTTCTTTGGTGTTTTAGTAGGAGCTTTAAATCTTGGCCAGGCATCTCCCTGTCTGGAAGCCTTTGCCACTGGCCGTGGGGCTGCAGCAAACATATTTGAGACAATAGATAAAAAACCCGCCATTGATTGCATGTCAGAAGATGGCTACAAACTGGATAAAGTACGAGGTGAAATTCAATTTCATAATGTAACATTTCATTACCCCTCCAGACCAGACGTAAAGATTTTGGATAACCTTAATATGGTTATTAAAGCAGGGGAAACAACAGCTTTTGTTGGAGCTAGCGGAGCTGGAAAAAGTACAACAATGCAGCTCATCCAGCGTTTCTATGACCCCACTGATGGCATGATTACCCTGGATGGCCATGACATTCGTTCCCTTAATATCCAGTGGCTACGCTCACAGATTGGTATTGTTGAACAAGAGCCAGTCCTGTTTGCCACCACGATTGCAGAGAACATTCGCTATGGTCGGGATGAGGCTACCATGGAAGACATAATCAAAGCAGCCA
AACAGGCCAATGCTTACAATTTCATCATGGACTTGCCACAGCAATTTGACACTCACGTTGGAGAGGGTGGAAGCCAGATGAGTGGAGGTCAAAAACAGAGGATAGCTATTGCTCGAGCTCTTGTACGAAACCCGAAAATCCTGCTGCTGGATATGGCTACATCAGCACTTGATAATGAAAGTGAAGCTACTGTCCAGGAAGCACTTCATAAGGCTCGCCTTGACCGCACCGTAATCTCAATAGCTCACCGCCTGTCAGCCATCAAAGCTGCTGATGTCATCATTGGGTTTGAGCATGGAAGGGCTGTGGAGAGAGGAACTCATGAGGAACTCTTGCAGAGGAAAGGGGTTTATTTCATGTTGGTGACCTTGCAAAGCAAAGGAGACAAAGCACTTAACAGGGAAGACACAGAAACAGCAGAAAATAACATCGTTGAGCCAAATCTTGAGAAAGTCCAGTCATTCGTCAGAGGAAGCTATCGGGCCAGTTTGCGAGCTTCACTTCGACAGCGCTCCAGATCTCAGCTCTCTAACATGGTCCCTGACCCTCCATTATCCATTGCAAGAGATCATGCAGAGTCTATGTATGTTGTGCCTTCTTATGGAGAAGATGATGGACAAGCAAAAAAGGAATCTGTTGCAGTGGAGGAAGATGTCAAACCTGTACCATTTACCAGAATTTTGAAATACAATGCCTCGGAATGGCCGTACATGGTGCTGGGATCTCTGGCGGCAGCTGTGAATGGAGCAGTCAGTCCACTCTATGCTTTGTTATTCAGTCAGATTCTTGGGGAGCTGTTGGGTGTGGGTTTCTGTATTCGCATACAGTGTATTTTAGATGAGACAAGAGGTACCTCACGTGCAGACCTTCTCCATTCTTGACGAGGAAGAACGAAGAACCCAGATCAATGGTGTCTGCCTGCTCTTTGTCTTTGTCGGAATTCTTTCATTTTTCACACAGTTCCTACAGGGATACACCTTTGCCAAGTCTGGAGAGCTGCTTACAAGACGGTTAAGGAAAATTGGTTTCCAGGCTATGCTAGGGCAAGACATTGGTTGGTT\n>XM_001628387.3 PREDICTED: Nematostella vectensis peptidyl-prolyl cis-trans isomerase NIMA-interacting 4 (LOC5507809), mRNA 
\nGGGGAGTGGAGATTGCCAGCCGTTGCCTGTTGTGTGTGGAACAAGTAAAAGGGTCGTGTGAGGGAAAAGAAACGATGCCCAAAGGCAAGAAATCTGGCGGAGCTGATGGCGGAGGAGGAGGGAAGCAGGATAACAAAGGGAAAGGTGCCAAGGGAGGCAAAGATGATGATGGTGCTAGTAAGGCAAAAAAAGGAGGAACTTCAGTCAAGGTGCGCCATATCCTTTGTGAGAAGCACTCAAAGGCAATGGAAGCCATGGAAAAACTGAAAGCAGGGCAGAAATTCAATGAAGTGGCCACAGCTTATAGTGAAGATAAAGCTCGACAAGGGGGTGACCTCGGTTGGATGACACGCGGTTCCATGGTAGGTCCATTTCAAGAGGCTGCATTTGAGCTACAGACCAGCACTGTTGACAGGCCTGTCTACACAGATCCCCCAGTCAAAACTAAGTTTGGCTATCATATTATTATGGTAGAGGGGAAAAAGTGACCCATGTTGATGGTAATCCCTTTTTTCAAGAAAAGCCAGTTTAACAGAATGCATTGCATTTTTTTATGAAAGTGGTATAGGATGATACTGTTTCTGCGTGCAAGCAATTAATAGCTGTGTCATTTATGCAAATGCAATACACTATGGGGTAGGTCAATGCCTTATGGGGAAGGTTGAGATAGACCAAGTTACCTTACACATTTTCCATTCATTTTGCATTTAGTCTGTGATTGTTTGGAATGAGGACTGTGGGGTTTTTCTTGAACAAAACACAGCTCTTAAAAAGCACTATAATACGCACTGGGAATCAACATAATTCAACACACAGTTTTGGCAACTAACATAAGATTTTAAATCTCATGTTTTCAAATTGATTTTTGATTATTGTTGACAAATGATTTCCATCATCGCATATCTTCCCTATTCTTTAAACACTTTTAGTTGTGCTGAAATATTTTGTGTATATTTAGAACTACGAAACAAAAGAAGGAAATGTAGCACAAACAGCAATGTGTATTTGAATTGCATTATGATTTAATAATAATTTATTGTTAGATAATAATTAATAATAATTTTTTTGTGTAGAAATTCCTTCGTTATAACATTTCTGGAAGTCTGTGCCCTCTGGTGCTTGCACTTCCTACAAAAAACAGGAGGGCAACTGTGATTATTAACTTTCTCTAAAATAGTGTCTGAGTATTTACAGACTCAAAAAAGGGTCCAAGTTCACCATAGTTCTCGCAAAAAACGGGGCATTTTCCCTCTCCCCCCCGGGTTCCTCCCCCTCCGCTTCCCCTACTGCTATCTCAGCTATATCTACAGTTTGCCAACGATTCGCCGCAGGATTTTCCAGCACCTGCGGGTTGTTCAGATGATGTTTGCACGGGCTTGTTAGCCGCAAATGTCACCAGTTCACTTCCGGAGGTACGACGGAAACCTCAACCGTTAAGACAAAAGAATCTACTAGAATCCGATATATTTGACAGGCCATCCGCTCTAAATTACCAATCACACCCTCAAAGAAACTTCCAATAGACACACTGCTTCCAATATTTTGAAATAATTTTCGAGTGTTCCGTTAAAAATCATCGGATATTGTTAGGTAATCGACCGGAAGTAAACTGGTGACAATGCGGCTTTAATACGCACCCTCGCGCGCCAGGGTCCAACTCTCATAACCCGAGGCCAAGGAGGGTCTTATGGTATCAGAGGGGTAGAGCATGGTGCGCAAAATGGTGAATAAGTTCGCCAATAGTTCCTTTATCTTGTTGTCAACCGAAAGATGCCAGCTAAAGTCTGATGTTGGCGCTTTGTGCAAGGGGCTTGGTATAGCAATGATTGTCGTAATAATAGATTAACAAAAGACTTAAATAAAAAAAGAAGAACATCCCAA\n>XM_031545768.1 PREDICTED: Punica granatum exocyst complex component EXO84C (LOC116211402), mRNA 
\nGCCCTGTCTCCGCCCTTCTTCGCCGGCTCCTGCTCTTCTCGGCCTCCTGGCCGTCGCCGCCTCCTGGCTGAGACCGGCTCCTGCCCCTCTCCTACTCCTCTGCCCATTTGGGTACGGGTCCTCTTTCTTCTTCCCTCTGTGGTTTCGTGATAATTCCCGCCGAGCAAGAAAATTGAGTGAAAAAAAGGCCATCTACTGGGTTTTGAGCTATTAGATGTTCTGCGAGTTGAGCTTTCGCAATCTGGGCTGAGCTGAAATCCATAAATGGGTCCTCTGATCTGAGCAATCAGTAATTGTTGAGTTGAGATTCAGTAGAAACTGACTATACTGAGATCAACTCAGGTTCCCTTCCTCAATGTAGAAGTCAGTCTGTGAAGAAGAAGAAGAAGAAGAAGAAGAAGAAGGAGATTTGAATTGGGAAGTAAAGAAGGGGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAAGATGGAGAGCAGTGAAGAAGACGAGGAGTTCCCTTCAATTGAAACCATCACTCCCCAGCCGAAAGTCAATTCCCTGTTCCAATCTCACACCGAAAAGGGGATTAGGCAGCTTTGTTGTGAGCTATTGGATCTGAAAGATGCAGTGGAAAATTTATGTGGCAACACACAAACTAAGTACTTAGCTTTTTTAAGAATATCAGAAGAAGTGGCGGAGACGAAGCACGAGCTAAGCGAGCTGCAGAAACATATTTCCTCCCAAGGGATACTCGTGCAGGATCTGATGATTGGTGTGTGCTCCCAATTGGACGAATGGAACAAATGCAATCGCAGGGAGCATGAAGGTGAGAAAAAACAGGAGAGCTCTGAAGATAGAGATTCTGTACCTAATGAAACTGAAGACAGCAAGATGATGGTATTAGAGACCATCGATATTCTTTTAGCGGAGCACAGAGTTGAGGAAGCCGTGGAGGCTATAATTGCTGAAGAGAAAAACTCATCAGAACTAAAAGGTTCTTCTGAAGCTTTATCTGCTGAAGCAAATTCATACAGATCGATGTTTCTGGAGAGGAAAGCCATGGTTGAGGAGCAGTTGGTAGAGATTGCAAAGCAACCTCTGATTAGCATGGTGGAACTGAAGAAGGCATTATTGGGTTTGATTAAGATTGGGAAAGGCTCTCCTGCTCATCAATACTTGCTTAAGTGGTATGGGTCCCGCCTCCAGAAGAGCATTGAGGTTTTCCTTCCTTCGTGCTCTCTTTGGCCGAGGACATTTGCCGCCACACTAGCTAAACTCATGTTTTCTGCTATCTTAACGACAACCAGAGAATCTGGTTTGATTTTCGGGGATAATCCGGTTTATACAAACAGAGTTGTTCAGTGGGCAGAGTGGGAGATTGAGTATTTTGTTAGATTGGTTAAGGAAAATGCTCCATCTTCTGAGACTATAAGTGCTTTACATGCAGCAGGCATCTGTGTCCAGGCGAGTCTTAGTTACTGTTCAATGTTGGAATCACAAGGGCTAAAATTGTCCAAGTTGCTTCTTGTGCTCTTAAGGCCTTATATTGAGGAAGTTTTGGAATTGAACTTTAGAAGGGCTCGAAGAACAGTTCTTGATTTGGAAGAAGGCGATGATAACTTGTCTGTGGCACCCCGATTTGTCTCCCCATTGTCTGCTTTTGCTACATCTGACAATGCTCTTATTGACAGTGGACTGAAATTCATGTACATTATCGATGAGATATTGGAACAGCTAACTCCTCTTGCCATTTTTCATTTTGGAGGGAATGTATTGAGTAGAATCTCACAGCTGTTTGATAAGTATGTGGATGCTCTTATCAAGGCCCTTCCGGGTCCCTCTGACGATGACAATCTCACAGAGCTTAAAGAAGTTTTACCCTTCAGAGCTGAAACAGACTCTGAGCAACTTGCATTGTTGGGAATGGCTTATACCATTGCCGATGAACTCTTGCCTGATGCCATTTGGAGCCTGTGGAATACGCACAATGAAACCCAAGA
ACCAAGAAGTGAACCCAGTGAGAGTACTCCTACTCAAGCTAAGCCGGCAGAGCTAAAAGAGTGGAAGCGCCATCTTCATCACTCATTTGATAAGCTCCGAGATCACTTTTGCCGGCAGTATGTCTTGAGTTTCATCTACTCGAGAGAAGGCAAGACACGACTGAATGCACAGATTTATTTAAGCGGAAACAGGGAGGATTGGGATCCTGATCCCTTGCCATCGCTTCCATTCCAGGCATTGTTTGCAAAGCTACAGCAATTCATGACTGTAGCTGGAGATGTCTTACTAGGCAAAGAAAAAATACAGAAAAATCTGCTTGCAAGGCTGACAGAAACAGTCGTGATGTGGTTGTCTGATGAACAAGAGTTTTGGGGTGTCTTCGAGGATGAATCTTCGGCTATTCAAGCGATGGGTTTGCAGCAGTTGATTCTTGACATGCACTTCACTGTTGAAATAGCCCGGTATGCAGGCTATCCATCCCGGCATGTGCACCAGATTGCATCTGCTATTATTGCTCGTGCTATTAGGACCTTCTCTGCCCGAGGGATAGACCCTCAGAGTTCGCTTCCTGCGGACGAGTGGTTTGTTGAAACTGCAAAATCGGCGATACACATCCTTCTGGGGCCTGGGTCAGATACATCTGAGATAGATGAAGGGCATATCATGCACGATGAGATTCTATCTGATTCAGAAGACTCTGCTTCGTCCCTCTCAACTGAAGAATCCGTCGAATCTTTTGCTTCTGCTAGCATGGGAGAACTTGAGAGTCCAATGTTCACCGATCCCGAGAACTGAGGTACTAATTCGAGTCTTCTGTTATGGTGAGGCCCTTTGGCTGCGGATTGCATTGGGTTCTCTTTTCGGAACGTCGGATGGGCATTTTGTTGGTAGGGAATCTTATTAGCTTCGGCAGAACAGATGATGGATAGCTTAGGTTTTAATGTGCGATGATGGATATGGAAATCAAGAAAGTGTATTTGATTATGAAAACTAGTGTAATTTATGATGTTAAATAAATTAGATAATACTTTCTAACAGGCAGTACACAATTTTTTA\n>XM_006508279.3 PREDICTED: Mus musculus anaphase promoting complex C subunit 15 (Anapc15), transcript variant X2, mRNA 
\nAGTATATAAAATCTGTCAGTGCTTTCGGGATCGTGGTGGACGCGCCTTTTTTTTTTTCCCCCATCACACGGACCTGGGGGGGCTTTGGTCTAGGGAATGACAGCGTCTAGTTCTGCTGCTGGGCCAGGATCCCTGCCTTGCGTAGGATTTAAGCCCCCATCGAGTGTGTGGCCAAAGTCAAGCTCTACATGTCACTGGGTTTGTGAGCCAGGGCGTTTTAGTTCAGCTTCTTGGTGACCTTCCTGGTCAGCAGCTTCAGCCCACAGAGTTGATTTTGTTCTCTTCCATATGAGGAAACTGAGGCCCAGAGAGGTTAAGTGTATTGGCCAAAATCAAAGAGCTAGTAAGTGATGGAGCCAGGACTCAAACTCAGCTTAGGAGCCATGTCCACCTTGTTCCCGTCACTCTTCCCTCGTGTGACTGAGACACTGTGGTTTAATCTGGACCGACCCTGTGTGGAGGAGACAGAGCTGCAGCAGCAGGAGCAGCAGCATCAGGCCTGGCTCCAAAGCATCGCAGAGAAAGACAACAACCTGGTACCAATTGGCAAGCCGGCCTCAGAGCACTACGATGATGAGGAAGAAGAGGATGATGAAGATGATGAGGACAGTGAAGAGGATTCCGAAGATGATGAGGACATGCAAGACATGGATGAGATGAATGACTATAATGAGTCACCTGATGATGGAGAGGTCAATGAGGAAGTAAGTGCAAAAGACTCGGGATTGTGGGTAGGAGCAGCATGCCCTCCAGGATGCCAGCTGCCTGAGTGGAGCTGCTTCCTTGAATGGGAGTCCCTCATGAAAGAGGCCTGGTCTGAGCAATTCCTGGGATAGCTGAAGAGATCAGCGTTGGGGCGATAGGGGCTGACCATTTGCTCATCGAAGCCTGCCAGCCGGATGACTTTTTCAGCCACTGCTGCTGTACGTGAGTCCCGCTCCACAGTGAGAAGGCGACTTCCAGGGGGCAAGGCTCGCGCAATAAGCAGTGTAGAGTATCCACAGTATGTGCCCAGCTCCAGCACACAAGCAGGGGCCTTCTCTTCCACCAGCCGCATCAGAATCTGACCTATGGGTCAAGATGGCTATTTTAGAAGACATTGAAAACAGGTGTGCCCAGAATCAAACCTGCTGTGCTTTTCTGAATGTGGTGTTTATGTGTGAGGCTGACAGGCTGCTTTCCCCTTTCCCACACCTGTCTCCATCCACCTGGCCAACTTGAAGAGAAGCCTTCCAGTCTCAGTTTAGATGTTTCTTCCTCCAGGAGGACCCAGGCGAAATATCCACCCTACCTTCCAGGTTCCCGAGACATTTTCAGTTTCATGCTCAAATGCACTTCCCCATTGCTGATTGTCTTTGATTTTGGAATTGAATAAATCTCTTAATACTTAGAAGTACTTGTGCTATCTCAGCAGACAGCTATCCTGAGTTGGTTGTGGAAGCCTCTTTGGTAGGGAAGAAAGTCTAGAACAGATAATTACAAACCTCTGAGTTATGGCTATTCCCCTATGTTATGATCTCTTTGAGGCCAGCATTTGTGGCTGGTTACCCTCTGTGATCTCTGCCTCCCTCAGCACCTGGCACAAAAGAGTGGCAATAAATGTCTGCTGGATAACTGAA\n>XR_006907879.1 PREDICTED: Neodiprion virginiana uncharacterized LOC124303282 (LOC124303282), transcript variant X1, ncRNA 
\nCGATGATTGATAGGAAAATAACCGGAGTGGCCAACCAGCGCAGTAATATTATGTAGATCAGACTTATGGCGGCACTGATACCAAGGATCGATGCAATGGTCCATCTATAAATGACAAAGTCAGCTACAGTCATTGTATAATTGACAAACAGTTCCGGAATTCCGTTTGGAATACAACGACCAGTTACAGAAGTACTGGTCAGATACCACTGAGCACACACGTCGTTTGAAACGTAGGTAGCAAGCTGGTCTGCCGTCGCTGTATCCACTTCAATTCCAGTCTTGCATATCATTGCGGTTCTTAATGCGGTCAAGTTATTTGCCAAAATTGACGAATTCAACTGCCACACAAAATTATCTGTCGGACACTCCGGCACGCATACCTGCGGCGTATCGCATCCTTGGGTCACAGACGTGACCGCTACACATTTTGTCAGATCAAAAAATACCAAATATGGTCTGTCCTCGACATCTTTATGCCTACCGCATATCCTTCCTTCACTATCAGTTGGGTATACTAACGTATCTATATCTCCATAAGTATAAGCTGAAATTATAAAGAATTTTATCAGTGTGTTTCAAAGCTGTCTTTAAACATATATGATCAGGGTGATGTAAAAAAGATGTACTGGTTCCTTGTAGTATACTCGTATTCAAAATTGCGTACCGTAATATCCAATTACCGCCCATCCTACCACAAATGCTGAGAAGATAATCAAGCAAAAGCAATCTGTACATGATCTGCCCTTTAGAGGTCCTCGATATTTTGGATCGAACTGCATCCTATCACCTAAAATTGGTAATTTACATACTTAAATCAATAATAGGCCTTTTATAGTTTAAACATTTATCCAGTTCACAAATTCATTTCAATAGTTTTGGCACTAAGCCATTTTGACAATGTGTTGTGACATTCAAATAATCTTATCAACCACTTATCTCAATAACGAAGTATACATATTATATTGGTAGTGATCTATATTGATCTCTTACCTGGAATGGGAAAGTATCGATAGAGACGGTACTGCTTACATTTTACAATAGAAATTAAAGAAGTTTTTGAGTTACAAGCATAGTGCTCAAAACTATCGCAGAAGTTGCTTGTTGAAAAATTTGAAAACAGTTGTGGATCGTTCGGTTTGGCATAATCCTTTTTTGGTAACTCACACAAAACTCTCTACAGGTACAAGACATTTTTGACACGAGAATTCAAAGCAGTCTGTGACGTGACTCACGTTTCTATACAATGAGACAATAAGCATACGTACCATGTTTGTCGACCATTGTTTGCACTTTGGTTCTTTAAATAGACGTTATCACTCTGACTTTAAGTACTTATATAAAGCCAGTCAACGTTCTAAGAATTTTTTTTACTTGTCCAGTGTTACTTATTAACTTGTTAGGTCTGCATATTATTTTGCCCACTCCGGTTTCATGCTCTTGGTTCAAATTATTAACGAATACTTGGATAGCATATGCTTTCAGTAACACTTCTACTGATAACACATTAATCTGATAAGATGAGATTTGGCAGCGAAGTATGAATCACCGGAAGTAAACAATCTTATCAATTTTTAATTGAGTCTGATAAATTGCAAATTCTTTACAGGATATGCTAACCATATATTGATTGAAAATATGCACAGCAGTAACTTGAATCATACGAAATCTCAGAATTATGTGAGTCGTCGAAATTCTCATTATTTGCACGTTATCGGTTCTAGCTATCCCGAGTTTATAGTTTCCAACTCTGGTCAAGAAACATTTATTTACTGAAAAAGTAGCGCTCGGTGATTTGGAATAGAGTATAAAATAACAAAATAATGGAATCGTTGTTAAGACTATTGAACAGTTCGTTGCGAAATCCAAACATATCAACATCTACACTATCTAGAAGAGTTAATTCATATTTCATGAAACAGGGAATGGGTCGTTTTTTGTTAGACTTATGTACACCTTCAGTGCCGACAGATTTGTTAATTGATTAAAGAAAGATACG
CAAACAAAAACAATATGATTGATAGCACTATATGACTTGATAAGAATCAATTTATGTGTACAAGATATGAAGCATAAAAAAAATTCTCCCAAGAGAACATTTCGTGTAATGGCTGTGCCGGAATATCGGTAAGGTCGTCTTAAACTACCGGGTTATTGAATTGATGCAATGACAATATTGCTCTTGCCTGGTATTCATCCCAGATCAAAAACCATTGTGTTTCTAGGATAAAATAAGAATTTACTTGATATCATAACATAGAAACTAAAATCACTAAATATCGAATGATTGGATTTGTAGGGTGGTTCATGGTGTGTTGGCATTCATAAAATAAGGTAAAAACCTGTCCAGAACTCCATGGCTTTTTCCTGGCAATAGCTTATTTGCTGTGCACCTAACTGCTCGATCTTCGTGCATCGTCTTGATTGTCTCCTAAGGGGAAGGAGAGTGAGTAAATTATTAATGAAGTTTCTTCTTTGCTTCGAACTGGTCTCTCATAGTAGGAAGATCAACCTCAGCAACTGCGGATGGCTCAAGGGTGATCAATTCAGGTTGAATTTTGTCCAGAAGTGCTTTCACTTCAGCCTCGCGGCGTTGGCTCTTTGTCTGGAATGGATTACTCTCAAGAGCATCAAAATTGGCTTCGGCACTCCCAGGAACAAGTAGAGATTGAAATCCTTTGGCTGTTGCGATGCCCAACACATCTT\n>XM_023859745.2 PREDICTED: Cryptotermes secundus sodium/potassium/calcium exchanger 4 (LOC111868780), transcript variant X2, mRNA \nTCATCCCTTCCAAAAGTGAAGACACTAAACGGGTTTGACATTGAAGTTGAATTACGAGTTGTCACACCAACAATTTTAATTGTTTGGTTTTGTAATTACTACTGGTTTATGTTGAACGGTTAGATAGACTGCCTGCGCTCTATTATTTAAATTACATGTTGTTTATATATATATATTGTAAGCAATACACGATTACTCCATAAAGTACTTAAAATATCAGCTGATGTGTAAGTTTTAGATAAGGGCTGACTGTATTTACTTCGATTTTCTGATAGCACGTGTGAGTAGTTCTCATGTAGCATCAGGCCGAATAGGATCCCTGAAGGCCTTTCCTCTTGCTAGGCTGCCTATACCAGTTGCCACGATAACCTGCTTGTGTATATAAATAATTATTTCTTCCAGTCAGAGTATGTAGTGGCAAAGTACGTTTAGAGAAGTTGAACGCAGCAAATATAACTATCATTAAAGTTAAAGGAACGAGCTCTAAAGCAAGAAATCGTAACTACTACGTGAAACAGTTTTGTTACTTCTTCGTAAGTGTGATACTAATTTATTCATTTAGGATACGTCACTTTTTAAGTCTGAGTTTTTTTTTTTGTGAATGTTTTAATTTTCTAAAATAGTGACAGTCAGTTCAGTTCCATAAACAGTTTGACAGAATTGTAAGTTCAGAAACAGCATACAGTGTCCTGATGCCAACAAGAATGACAGAACTGAGGTTGATTATAATAGTTGTGTCCATAATTTTGACTGTACAATTTGTGTCAGTGAAATGTACGAATAATACAACCGCTGAAGATGACAGGTCCCATGTGCAAGATTGCATGAACAGTTCTGTCTCAGATTTCCCTGATGATTTGTTTGATTTCAAAGAGAGGAAAAATGGAGCAATCATCGTTCATTTCTTCTTAGCACTCTACTGTTTCACAATAATTGCAGTAGTTTGCAATGACTATTTTCTGCCATCTGTGGACTGCATCTGTACAGAGCTGAACCTTACACAGGATGTGGCTGGAGCAACTTTCATGGCAGTTGCTACATCATCACCAGAACTTTTTGTCAATATCATTGGAACTTTCATTACGGAATCAGATCTTGGAGTGGGGACAGTGGTGGGTTCAGCAGTGTTTAATACACTGGGGGTTGCAGCATGTATTGG
TCTTGCAGCTTCTAAGACTATTATTCTTGAATGGTGGCCACTGACACGTGACTGTAGCCTCTACATTGTTACCATTGGAGTTCTGACTGCAGTGACTCTTGATGAGAAAGTAGAGTGGTATGAAGCTCTCATACTATTCCTTATGTATATTACATACTTCCTCATAATGTGGGGAAATGGACACCTTATGAAGTTGGCTAAGAAAATTGAAGTCAAAATTATTGGCAGTAAAACTGTTCTAAATGATCCAGAGAGCTCTACATCAGAGGTTTATTCAAATGTTGGCCCTGGAATATACCGCTGGTATCTTCATGGTGATTTTACTGTCAGTAACAAGATGACTTCAGATGATACAGAAAAATCTCCCAAAAAAGGAAGTCGTCTGATGTGCCCACCAGTAGGGGGCCTACTGGACAAAGTGTGGAATATATTCTTATGGCCAATTTCACTCTTGGTCTTCATCAGTATACCAGACTGTCGAAAAAATCACTTTCGCCATTTATATCCTCTCACATTCATTATGTGCATCGTATGGATAGCTACAGCATCATACTTGAATGCTTGGATGATGACAATTATAGGTAATACATTGGGAGTTCCTGATTCTGTCATGGGCCTTACTATGCTTGCAGCAGGTGGAAGTTTACCTGAAGCATTTTCATCTATCATCATGGCACGGAAGGGTGTGGGAGCCATGGGGATCAGTTCCTCTGTTGGAGCCAATACTCTCAACATTCTTCTCTGTCTTGGTACGCCTTGGTTTATCAAATGCATTGTACAAATCATCCAAACTGGTAATACAAACAGTAGTGCAGTCAACATCATTTCAGAAGGTGTCACCTACAATTGTTTTGCTCTCCTCTCCAGTGTCCTGCTACTTTATGTTGTCATAGCTGTTTTCAAATTCCATCTTGGAAAGCTTCTTGGATTCACATGTCTCGTCACATATTTCATTTTCATCACAGTTTCTGTTCTCATTGAAATGAATGTATTCTTTTATGTTAATAGGCCTTTATGTGCTGAAATATGAAAATAATTACTTTCACA\n>XM_002627964.2 Blastomyces gilchristii SLH14081 U3 small nucleolar ribonucleoprotein IMP4 (BDBG_00918), partial mRNA 
\nATGGTCCTTCAGTCAGCAGCCTTGCGTCCTTCAGCAACTAAACCACGGGTCAAAATGATTCGCCGTCAAGCTCGTGAACGGAGAGACTATCTCTACCGAAAAGCTCTCCTCCTCCGCGATGCTTCTATAGCAGAGAAGCGCGCGAAGCTGAAAGCTGCCCTTGCGTCAGGGAAACCGTTAGATCCCTCTGTGGCCAATGATAAAATATTGCGAGAAGATTTCAAATACGATGAATCCTTACCCACATCCTCGAAACCGGGAGACCCTAACTCCAAAGATTCTGACATGCTTGACCTCGATGACGAGTATGCTCTCACATCCGGCATCGTTGACCCTCGACCCCTCATTACAACGTCCCGTTCTCCCTCTGCGCGCCTTAGTACTTTCGCCAAAGAGATGCGTTTACTCATCCCAACTTCGATTCGGATAAATCGGGGAAATCTAGTCATTCCTGATCTTCTAGCAAGCGCCAAGGCGTCCGCACTCTCTGATATGATCCTGCTACACGAGCATCGCGGTACACCCACTGCGATAACCGTGTCTCACCTCCCCTATGGCCCAACGGCCAGTTTCTCGCTACATAATGTCATGCTACGAGCAGATATTCCGAACTCTGCACGAGGAACCGTCTCGGAAAGCTATCCTCACCTAATATTTGAAGGGTTTACCACCAAGCTGGGTGCTCGTGTCGTCCAAATCCTAAAACATATTTTCCCGCCGCGGGAAGCAAATGGGAAGCTCGGGAGTAGGGTTGTCACCTTTAAAAATATAGAAGACAGTATAGAAGTGCGACATCATGTATTCGTTAAGACTGGATACCAATCAGTTGAACTAGCTGAAGTCGGGCCGCGGATGACGATGAGACTATTCCAAATCCGAGGAGGAACGTTGGAGAAGGACTCCGGAGGCGAGGTTGAATGGGCACTCAGTCAATATACCAGGACGAGTAGGAAGAAGGACTATTTGTGA\n>XM_031798635.1 PREDICTED: Oncorhynchus kisutch protein FAM180A-like (LOC109879465), transcript variant X1, mRNA 
\nCAGACAGAGAGAGAGGGGGGAGGCAGAGATAGGGAAGGGGAGGAGAGAGAAACAGACAGACAGAGTGGTGGAGAGGAAAGGATGAAGCAGTTGCATGTGAAGTGGTTTAGCAGTGCTCCAGTCAGCGTTCTTACCTCATTCTCCTGAGGGTTGTTTGTACACAGCTCTCTCCAGCTGGGGCCTGGCCGGTGACTGATCCACATTCAGATCCCATTGAGACAGACAGACGACAGGGCAGTGTCAGTGTGTGTGCGCTGGGCCGAGAGTCAGCATGATGCATCGGTGGGGTCTACTCATCACTGTGTTCTACTGCCAGCTGTTCCTGGCTGCTGCTCAACACTGGAGGAAAGCCCTTTACCCATCAGCCTTTAGAGTGAAGCGTGGCACACACTCATTGGTCAACCCCACCTTCCAGAACTCTGTGGAAGATGTTAACCTGCTGTTTGAGATCCTGCTGGCAGGCCTGCAGATCGAGGGTGAGGACAAGCCCTTCGTGATCCCAGACAAGGAGCTGGCGTCTCTGAGGAGGGTCCAAAAGCTGGAGGTTATCTGTGAGGACGTCCTGCCCAAGAGACTATCCGAGATCAGACGTCTGACCTCCCACCTGTCCCAGCGCAGAGGTGCCCTAAGCAGGGAGGAATTTGAGCGCACAGTGCTCACTATGGTGTACACTGCCCAGACTCTGGCTCATACCACCTCCCAACACCAGAAGGCGCTGTGGGGAGACGCCCTACTGCAGCTGTTCAGGGCCATTCAAGAAGATCTGACGCCCCTACCCAGAACACCTCAGCACAACTAGTGTTATGGACACGTGGACACATTTTTTTAGATACTGTAATATACTGAACATTTTATACTGTAACACAAGTCACTTTTTGGCAGAAAATTTAAAGGATGTTTTCTATTGAGTTGTATTGTATAATCAAAATGACTGTTCTAATAATGTAATGTGTTTGGTTATGATCAAATGATGATATGATCTAATCATATTGAAAGGAGGATGTGGGAAAAGGAGGGATGTGAACAATATCCTGTTCATGTTCTATCTATCGGATTCCGCCTTGTTCCAAGACTTCAGATGTAAACAAACAAATATTTTATCAGTCACTCTGTCATGATTCATTACAGGTCTTTATCAAATCTTCTGTCATAATCTTCTCAGCTGTTTATCACAATTACATAATCTTTTCCCAGCACAGTCCTGTTGCGAAAAGGTGCTTCATGAAAAAAAGAGTCCCATGAGGTGCAGAAATATTGTATTGAACTGTAACATTGAAGACAGGGGTATCAATTTGCTCAGCTTATTTCTCTGCAATTGATATTATAATAAAATAATGATCAATATATATATATATATATATATAGGTTATGGCCATGTTATGAACCAAGCTAAACACTGAAGAAGATGGTTCAGCTGAAAAGTATGTGTATGCTATCCTGATGCAGTAAAAACATGATTTATATATAATGAAGTAAGCTTTATGCAGCATCTTTTAGACTGCAGACCCATTACAATTTTTTGAGGGCTTATCTGGATTCACAGGTTTTACGCACCAACAATACTTTTTGGAGAGCACTATGGTCCTCTTTTGATATGGCCTTGTTATGATTATGTGCAAATGATTGATATGACTTGAGGATGTTCATTCACATTTGCAAAAACGTGGGTAGGGTTTTGCCTCAGTCCCAAACTGTTTTCATTTTGGAATTAGAGGATTTTAGCTGCTCTAGCCTGCAGGGAGGATGTCAGACTAGATGTGAGACATGGGGCCTCAGGCTTTCTACACATCCCCCAGGTCTACACATTCCCCAGCTCTTCAATGGCTACAAAGAAAGACGAGTGCCTAATGTGTGTCCTGTTGGCGACATAGTCCACCGCTGCTAGAACAGACTTTCCATTGACATACTGTTGCCTACAATGTTTCTCCCTCATCTACAGATGACAGGTTCAGGGTGGCGGCCATTTTGCATGGAAAACTCCTCTCCTTCTCTGTGTCC
AGTTGCTATTGTTTCCGGATGGTGATAGAACTGGTCTAGCTCTCCTGGTGGTCACACATCAAGGCACGGGTGAGTCCATGCCCCATGCTCCCGGTAGAGCCCACTAGAGCCCTCATTGATGAGGAACTGCAGATTGTGGTGAAGAACGTTTTTCCCCAAAAAAGAAGATCACCCTTCGTTCACCCTTCGTTCCTGGGAGGCGTTCGGCCATTATGCCAGTGATAAAACGGGGATGGTCAAAGAGTCCAATGGGCTTACTGTGGATCATGAGGCCTGTGTATGGCAGTGAAACATGACCCAGGTTGAGGAAGAAGGATATCCGTACTCCACTGCTGGTTCAGATCTCTGTGTACAGTGGCCACATCAGCCAGGACTACAGTGAGCAGGCTGCTGTAGCCTGTACAGTCGTAGAGCGCTGGTGTTTGGCCCCCGTAGTCCAAAAGATAGACATCTACAAGAACGGAATCCAGGGAACCCTTTTTATACCAGCAGGTCCTGGACCTTTCCCTGCTGAGCTGGAGCTATCTGGGGGAGGAGGGGGTCTGTTTGAGCATCGCTCCTACCTGTTAGCATCCCAAAGCTACGTCTCCTTAGTGCTGCAGTACCCCACGGACGTCTCTACAATGGTTGCCATAGGATGCAAGTACTTTGAGGAATTTGCACAGTTCATTGTGGAAACAGATGCAAGAGGCCTGAAGTGTGTGTGCTCTGGAGTTTGTTGTGAACCTGCCGCCCCTACTTCAGACAGCCTTCACTATGCTGAGACCATCCTCAGGTGGCCAGTGATAGAGGCTATGTTTGGCTTCTCACTGGGATTCCTTATCCCTGACCGTTTACACTGATGTCATTAACATGATTATTCCACACCTTCCTCTTTGAAATTGACTTGTTTGATTGATAACCAGTTAATTAGTGAACGCAAATACTGTAAACAATTATTTTACAGGTGCTCTGTAGGCACACCTCTCTCCTATTTCCCAACATATTTGTTGATAATCCCCCTCTCTTCCAGCCCAGATGTATGGTGAGTATACGTGGCAGCCATGTTTTCCCTTTCAGATTGTCGCTTGTGTCAATAGCTGACAGGTACAACACGTGAGTGTGTTTTAACCTATTCTAAAGCAATGGGAAATGACCTCATTTGGAATGCACTGAAATTATAGTTGTATTTTGCTCAAATTTCTAGAAATATGCACTTTGATGAGAACAATCATTTGATCTGGAGAGACACAATCCAGCCCATCACTGAGAGTGGCCCTAAAGTAGAGGTGATGGTATCTTTCAGACTGCATTGTATGCACACTATACTGTATGTATTTGTACAGTGAGGAACTGACATGTGTGTGAACCTATTTTTTGGCACCATAGGTCAGGAGGTTAAAGTGTCCATTACTGATGGTCATTGGAGAAGCTTACCAGAACTGTGCCACTACAGAATCTGTCCAGGATATGCGCAGTACAGTATGTTGGAGAGGGCAGGGAACCTGTGTCTTACCCTGGGGCTGGTCACCTAATCAAACCTTTCTACACTCCTCACTTCCGCTCCAGCACCTCCAGGGGCAAAGTGATCATGTTGTGGGGAGGGGAGTCCAAATGGAGGAGGATCCTGGAGTTCCTTCAGAAGAACCTGTACCAAAGACAGGACCCCTCTGTCCCCTCAGAGCTGTCAGATCCTCCTGGACTATCTCCATTATTATAGTCATCGCTTCTCCAGCTTCATTATCTGTCAGGGCCCTATTCTTGAAATTAAGTAGAGACAATATTGGTTGGATTTTTTTTTACTCACCAGGTGGCAGCATTGCACAGTCTCTTAAATGACTGGTCTGCTGCTTGTAGTTGTCATAGTAGTCAATGTCCTGACAATTACAAGGAGGAAGAAGAGGAGATGGTCGACATCGGCCTTTCATCAAAGTCCTTATAGGGAAGCCTTTCTGTTTAAAGACCATGGATCAGACCTTGGCTGCTCGGTCACGGTTGAGTTGCGGTCTTCTAGCCAACCT
GGTTTGGATTCCAAACTCCTGTGAGGTGACATGAAGTGTTATTGATCTCAGAGTTGAAGAGAATGAACACCGCTGCCTTTAACTCTCATCAACTGCATACTTTTTTCTTTTTTACATGTCACCCATATATTCTCACTCCAGATTCCATTCTGGCAAAGGGGACCGATGGCCTAAACATCTCCATGTGTTGCACATATATTAAACCAATAGCCTGGTCTGGA\n>XM_017410869.3 PREDICTED: Kryptolebias marmoratus Yip1 domain family, member 1 (yipf1), mRNA \nGAAAATATACAGAAACAGGAACGTGGCTTGTTTACATGCTGTCACTTCCTGCTCAAAGCTAACGTAGCTAACTGCAATTATTATAGGTTTTCTCGAAGAATTTGAGCTTGAACTGTTCCCTTTATTTGGCATTAAATTGCCTGCAAGTTTCCTAAAGATCAGTAACATTGTCGTGAGAGTGAATGGCGTCAAACAATGATCCATTTCAGTTTCAAGAATTTGAAGAAGCTGAAAATCTTTTGGAGACCAACAGAGATGCAGTCACCGTAAGCATTGAGGAAGAAGATCAGAAGTCCAAGAGCCAAAGATCTGCTGGTGGCTTTTCTCCAGATTTCACTGATGAGGATCCACTCCGCACCGATGACAAGGCAGAGCTTCTTGGTGGCCAAAAGAAAAGTGCCCCTTTCTGGACGTTTGAATACTACCAAACATTCTTTGATGTTGAGACACACCATGTAAAAGAGAGGATCATCGGGTCGATGCTGCCATGGCCTGGAAAGAACTTCATTCAAGTTTACCTTCGTAAAAATCCTGATCTTTATGGACCATTTTGGATTTGCACCACTCTTGTGTTTGCCATTGCCATCAGTGGAAACTTATCCAGATTCCTCCAGTACTCTGGCAGTTCAAACTACAAATATACCCCAGAGTTTGGAAAAGTGACCATAGCTGCTACAGTAATCTTCAGCTATGCCTGGCTCGTGCCTCTTGGCCTTTGGGGGTTCCTGCTGTGGAGAAACAATAAGATTTTGAACCTGGTCTCATATTCCTTCATGGAAATCGTCTGTGTGTACGGATATTCTCTGTCAATTTACATACCAGCTGTGGTCCTGTGTATTATCTCATACGAGTGGCTCAGGTGGTGCTCCATCGTGGTGGCCCTCTGCCTCTCTGGCTCAGTCTTGGTGATGACTTTCTGGCCCGCGCTCAGAGACGACCACCCCAGAGTCGTCATGGCTGTCGTTTCAGCCATCGTGTTGCTCAATGTGCTGCTGGCTGTTGGTTGCAAGACCTACTTCTTCAGCAGTCCAGAGATTGACTCACAAGTAAAAAGTTCTCCTAAAACAGAGGTTGTCAAACCAACGTCATCGACATGAACGCCTCCTGTTTGAAGCTTCTCCTGTTGCCTTATTGGAGAGAATCGGGTTCCTGTACCAATGAAGTCATGGGCTGACTGGATTTCACCGCACTTGGACATTCCAGCTCGATGCCTCTGAAAAGCCAAGACTGTAAACTTGGTGCGGCAGCATGACGATGAAAATGAAAACTGGTTGCAAGTATGTTACTTCTAACGGGATGGGTTCTAAACAAACTTAAAGTTAATTGGGGTATAGTATTACACAACGCACAATATCTGTTGTGGTGTTGTAGTTTTCAGCTTTCTGTCGCTCATGTAAAATGTTTGGAAAAAAACAACTTTGTGCAATAATAATAGCAGCACCAATGCTTTTTATATGCACATTTGTTTTGCAGTATATTTCTTTAATAGGTAATGGTAAGTCGATTTTATTTACAAACTTAATGTATGATCAATTATAGGCATTGGTAAGAATTTCCAGGATTATTTATCAAGCACCCTGTAAAGGTGATGTGGTGGTATTTTCTTATAGTTAAGTTGCCTCAACTAATGCCAAGAGCTGGTTTAAATAATTTTTCGAATGACTTTGTAAATATTTCATAA
ATAATTTGTTGTCATTATAACAAACATCTTTAAATAAAGTCTACTGAATTTCATCTCTA\n>XM_007381610.1 Punctularia strigosozonata HHB-11173 SS5 hypothetical protein (PUNSTDRAFT_132265), partial mRNA \nATGGCTGACGACTCGAAATCGGAGCCTTGCCACTGCATCGAAAAACCCAGACAACGTGGACCTGATGGACGTAAGCTCGGCTTGGATCAGATGATCTTGCTGATGGATCCATGCTTGGGGGCGCACTGGCAAGCAATCAAGGACCGCATTCGCAAGCTGGCGTTCGAAAGGTTGGCTATCGGCCGCGTTTACAATGACCAGCCGTCATTTGCCCATTCGTTATTGGTCTGCCAGGTTGCCGACCAATGGCAATTCCTGTGGGACTACGTGGACCTCTGGCCGCTTCGTCTATACCTTCGGTTTCTTCTCTCTGCGTACGCGGATCCTGATACGCCTACCGGCATCGCCTTGAGGCTCAGGAAAAGTCTTGACGATCATTCTGTGAAGCATGAGACTGCCTCTGCATCTACTGCCTCCACACAAAGTATCAACGATGATGATACTCTTGAGTGGGATGACCCGGAAGAACAACTTAACGATACAACTACACGAACCTCTTCGTAA\n>XM_032672596.1 PREDICTED: Danaus plexippus plexippus SAP30-binding protein (LOC116778559), mRNA \nGTGCAGCGATACATAGTTTCACAGTTGTTGTATTTACACCAAAAACATTAAACAAGAATAACCTTAAATAAGTTATTCTTGTGAGTGAAACATTACAAAAACTGTGCTAGAAAAGTGTAATTTATTCTTATAGTGCGTAAAATAAGCAACATGACTTCGCAAGCGTTAGCCACATTGACCGCGACGTACACAGACTCCGAAGGTGAGGAGGAAATGGAAGATGGAGATCCTACACCTGAGAAATCGGTCACTCATCACACACAGTCAGCTCCAACCAGTCCCAAGAACATCGACGACACCAAACAATCTGCTTCCGCACCAGTTTCTCCAAAACGAAGTTTGGTCTCGTACGTAGACGACACTATCGTATCCGATGACGAACAATTGTCTCCTAACGCGGAAACTCAGGACGATATGAGAAGATTATCGATGGAAACCGACACAGATGAAGCTGTCCCACGATCAGATCCCGACGACTCAGAGGATAGTGTCCTTATACCTCCGGAACCAACAGCCAAATGTCCCAAGGAATTACAAGACAAAATAACAAAATTCTACACAAGAATGGTCAACGAAGGTTACGACATGAACAAAATAATTCAGGATAAAAAGAATTTCAGAAATCCAAGCATATACGAGAAGTTGATACAATTCTGCGACATCAACGAGCTAGACACGAACTACCCACCAGAAATATACGATCCTCTAAAATGGGGCAAGGAATCCTACTACGATGAGCTCGCTAAAGTCCAAAAACTAGAGATGGAGAAACGGGAAAAGGATCGCAAAGAGAAGTCCAAAATAGATTTCATCACCGGAGTGGCAAAGAAGTCGGACAGCGACGATGACAAGAAACGGAAGTCCAAGTGGGACCAAGCGGCGCCCAACGTAGCCAACAAACCCAGCATCAAACAACCGGGGCTCCTCCAGCAACCGCTGACGAGCAACGTCACCGGCACCAAGGGCACTGTGATATCAGCATTCGGTTCCATTGCCAAGAAGCCAAAACTATGAGTTACAGCACAGACGGACATGTTAGTGATGCAAAGAACGACAACAATATAAAGTGTACAATATTAGTTGCAGACATTTTAATACAAAGTTTTGGCTTTTTATAAGTTGTTAAGACTGGTAGATAGTGTATGACAAAGTTAGACTAAAGCATCCATATCATCCTCAACGTGCTCCTCTCCGAACTCTCCCACACTTATGTATATATT
AAAACCGTTAAATAATTCTTGTAAAATAAATTATTTGC\n>XM_030796770.1 PREDICTED: Nomascus leucogenys intraflagellar transport 22 (IFT22), transcript variant X3, mRNA \nCAGGCCAACCCTGCAGAACCGCGTCTGCAGCCCGGGCTTTGTGGCTTCTCTCCGACCCCCTCCCAGTAGCAAACGCGCCCGCTTTCCGCCCTGCGCGCCGGAAGTGGCCGAGTCCCGTCGGCCCCTGCGGGCCGCTCGCCGTCGCCATGGAAACGAAAGTGGCCAAGTAGCGCTCCGCCCTGACACGCTGGCTCTGGTGGGCTGCGGCCGGCTACGCCGCGGCGGACAACGATGCTGAAGGCCAAGATCCTCTTCGTGGGGCCTTGCGAGGATCCTAGAATTTGAGAACCCGCACGTTACCAGCAACAACAAAGGCACGAGCTGTGAATTCGAGCTGTGGGACTGTGGTGGCGATGCTAAGTTCGAGTCCTGCTGGCCGGCCCTGATGAAGGATGCTCATGGAGTGGTGATCGTCTTCAATGCTGACATCCCAAGCCACCAGAAGGAAATGGAGATGTGGTATTCCTGCTTTGTCCAACAGCAGTCCTTACAGGACACACAGTGTATGCTAATTGCACACCACAAACCAGGCTCTGGAGATGACAAAGGAAGCCTGTCTTTGTTGCCACCCTTGAACAAGCTGAAGCTGGTGCACTCGAACCTGGAAGATGACCCTGAGGAGATCCGGATGGAATTCATAAAGTATTTAAAAAGCATAATCAACTCCATGTCTGAGAGCAGAGACAGGGAGGAGATGTCAATTATGACCTAGACAGCCTTCACGTGGGACTGCCACAGCCCCAGTGAAATCAGCATGTTTCTCAGTGCAGATCTGAAATCACATCCAGCTCCTGATGTTTTCTTCTCCCTGTGACTGCAGAGGAAGTGTTCCTACGTGCAGGAAGGCACCTGTCACACAGGGCGTTCACTCAGACCATCTGTGCTCTGTCCTGAGTTCAGCTGAGAAAATCCGATTATCGAATTTGGATTTCCTGGCCCCAGAACTTCCCAAAGACCTGTAAAATGGAGGGATTTACCACCTCACATATGTCCAGTTATACAATTTGTGGAGTTGTAACTGTTGCAGCCCAATGATACAACAGTAGTTTAATCCTGTGTATTGGCTTGAATGTGATTTTCATTCCTTGATTCACCCAACGAATACCGACTGGCTGAGCACCTGCTGTGTGTGCACTGCTGTTCTAGCTGCTGACCGTAGACAGCATAAATGAAAAAGACAGAA\n>XM_046808004.1 PREDICTED: Homalodisca vitripennis neuropeptide F receptor-like (LOC124356796), mRNA 
\nCTACAAGTTGCGCGTCCCGCTCCACCTTCCCGCAGTCGTCCCGCACCCACATCGCGCGTGAACTTTATACTGCTGGAGTATGTGATGTTGTGTATGTGCTGACGTGTCGATCAAACATACTGTGTCCTGAATTGAATGCCTCAAGTTGGTAAAGTATATTCTGAACGCACTAAACCTTCTCGACTCCAGAGTGACGGTGAAACTCCTACGTGGCCGTACAATCTGATGACGCCCTCTGTACATGAGCTGTCCCATGTTCGAATCATGTCTGATGATGGAACTGAACGCCTCAGGCACATTTAACTTCAGCATCCACGAGGCGTTCCAGATCCTGCAAGAACACAAGAGTCGTGACCGCAATGTTGACGGACTTACGGAGGTGATCCTGATCTGCATCTACGGGTTCCTGATGGTATCCGGACTGTCAGCCAACCTGATTGTCAGTTTCGTGGTGGCGCGTCGACCGCAGATGCACACACCGAGGAATCTCTACATCGTGAATTTGACTGTCTCGGATATGACTTTGTGCCTCATCTGCATGCCTTTCACCTTGGTCTCCATCTTGAGCCGCCAGTGGACTCTTGGACTCGCATTGTGCAAGCTGGTGCCGGTCATTCAGGGCACCAACATCATGGTCTCCGTTGGCACCATTACCGTCATAGCCTTGGACAGGTACTTGACGATAGTGCGTGGACAAGAAGGTACCAACAGTAGACGACGGGTAATCACATCCATAGTGATGGTTTGGTTGGTGTCAGCACTAGCCACCCTCCCTGTTGCCTTTTATCAGGTGGTGGAGCCTCTGATGTTCCACCGGGTGGTGCTGTACGAGACGTGTCTGGAGCGATGGCCCTCTCAGCAACTAAAGATATCGTACGCTGCAGCTGTGCTGCTCGTACAGGCCGTCATCCCAGCCCTCGTAGTGTGCGTGGTGCACGCGCGGATTGCATCCTACCTGCACGCACACGCACGCACACAGAAGGATAGGCGGAGAGCCCTGCGGGAAATAAAGAGGAACCGAAGAACTACGCTTCTCCTCTCAGGTGTTGCGATCTTGTTCGCCCTGAGCTGGCTGCCTCTAGGTATCTTCTCTCTGACGGCCGACGTCCTCTACTCAGAGGAGTCCTTCAGCCGTGTGTCCTCACAGGACCTGTACGTGACCTTGGCCGTATGTCACGTGACCGCCATGACCTCCGCTGTGTCCAACCCCGTGGTGTACGGCTGGCTGAACTCCAACATACGCCAGGAGTTGCTGCAGCTGCTGCCCTCGAAGTGTGCCACTGTGTCCGGGATAGAGGAAGCCACCACCAAGACCGCTCTGCCAACCACCACCCACCGGCGGGAAAGTTTCACCATCCTGCTGCAGAACGGGGACCGGCCAGTGCTCACTCAATCGCCCCACACATTGGTCACTGTCTTATAACGGTCCGTGAGGTCCTCATCGCGACTCTGAGATACATCTTCTAAACACCATTCTCTAGATAAACACTATTTTATGTGACAAGGTATGAATGCAATGGGTAGAAAATTGTAAAACAATTACATATCACATAGTAAGACGGATAAATTCCTGGTTTAAATAATATAAGTTTCTTGACCCGTTCCTTACTTCCTAAAATTGTTTACCAGGATTACGATTGTAGATTGTCAATACAATAAATATCCAATTTTTTATACTAAACTCTCGAACACATAGCCTCTAATCGCCCTCAGTATATAAAGCTTCTGGCTTTGGAGATGAGGTCAGTCTTTCTGTCAATAAAAATAAAATTCATAAAACATGGTTTACTAATATTATTATATTCAATTTTATAATGAAAGGAATTTTTCATCGCAACATATATAACTTTTCAAATAAGCTAGATCTAAGTAGAGATACTTTCACACTTTCTGTTTATGGTGGTGTTGACAAACACATGATGAGCGAGTGCCAAGAGAAGATAGGTAACTACTGTCTGTGTTATGTTTGCTTTGCTTAGTGTCAACCTTGACGTATGC
TGCATAAATATCTCTTGTGACAGATACCATATAACTAGTTTTAGAAAAGTCTATTTAAACGATTTAATTTTGTAGTAAGAAATGAATTGTTGAAATTATTTGTTGTTTTGATTGGTTTTAAAAATACAAATTGACAAAAATTATTCAAAACCTTGAAGATTTATAATGCTTGTAATATTTATGATCCGGTTTTATTTAATTTGAAAAGTAAGACACCTGTATTGTTTGGTTTTTCGAGAACATACTTAAAGTCCGTTCCTAACGATAAATATTTAAATTCTTGCTCAAACACATTTACAACAGAATTTTGAAGTTCAACTGACTCACATTCAAATGTTATTCCACCCCAAGTACTACGTTATCATAGACATGATACGCGCTTCTTTCCTTATAGAAGTATTGAAAAAAGAGTTTGTTTGGAAGAGTAACATAAACTTTCAAATATAAGTAAGAGTAAAGAGTAGCATGGACATAACTTGATGCTAGATTTACTTGGCGTATTTATAATAAATACGTATAAAGACATAACATCATGATCAGTATCAGTAAGTTCAGCTCTTTGTTTACTTTACTATAATTTTACAAGTATGGGTATGCCACAACACGTGTTGCATAACAAGCTTGACTGAGGTTGTGTGCAAAACTAAGTTTATAACACATGTTCTTCTGGTAGTTATAAAATACGTTAAAATTTATTATGATTTGATCCATTTTGTTTACAAGTTGATTTAGTCTTTGATTTTCTCGTTACTATCACGGTGAGACATAAAACCAATGTATAAGTAATTTTAGTAAGTACCGCTGTGGATTGAAATGCAGCCTCCTTAAAATCGATGTTGCATTTATAAAAATGAAGCTGCTTGCAAAATTCCAAGTTTATAGATTAATTCGTTTTTGAGGCATCGTGCGGACAGAAGGGCCTACATAGATGAAATTTTTCCAGTCCCTCGAGGGATGGTCTTCTCTAACGCTCAGCCATCAACGGACGATTGAAAATATGTATAGACAAACTTGTACGTACGAAAGGACAAAATACTTAAACACACACAAAATCTGTGATTGGATCTACGAGTTAAGAGTATCGAGAGTTATCGAGAACGATGAAACATATCAACACGAATGAGAGAGAACGATGAAATGTATCGATTTGTGGCACATCACGAACATCTCTCTGTATGCTGCAGTACCAAAGTGGGCGTCGAGTTTACTTATCGGTTTGGCAAAATCGTTTAGTTTAGTCAACAACGATGTATTTTCGTAGACTCTGATCACCCACCAAACCGTTCATAGGTTACAAACTGGATGTGATATTTAAAACCTTTTTAAATCTCTTAATATAAACCACTACCGAATTGGGTCACATTATTGGTGCTCAAATATGATTCCTTTGAACTGTGACTATAAAGTAAATGTGGGCGTAGTAGGTGGTTACATATTAGGGCGGTTCTATAGTATTTGTTTTATAAAGCCAGCATTAATACAATTATTTTTTTAGTCTCAGAGATAAAAACTGTAATACATTTTAAAAGTTTTTTCTTATTCCATATATTCCGAAAGTAGCATAAAAATTATATTTAACTACATACCATTGTATAACTATTTAAAGTTCTACTTTCATTACCATTGAGATTTGAAGATGCAACTATATGATCTTACTTAAAATGTGGCAAAATGTGTTATATGACAAGTAAGTATTATTTCATTATTTGTTTATCATTTCAAAAAACGAATGGTCGTTATCTTGTATCGTTTTCTTCAATCGCCTATCGAGCTGGAATCGCCTATCTTACCAGAATTACTATACAGCCGCTTTTATACCTTGAGGGGCATAAATGTTTAGTGCTGTGAGACAAGGGTCAATAAAAGATAATAGCGATATCGTGTTCCTTTTAAGTTCAGTATCATTAAGTAGTTCTTTCGCTAAAAATATCACAATCTGCTCTATCTAGCTTAAATTAAGGAATTAAAAAAATAATTCAGGATAATGCAATAGTATAGTT
TTCTTTGTAATAGAATCAAATAATTCGTATAATGACGTCAAAAATAAACAGTTTGGATTCCTGTGATTAAAATTAAATTCTAGTTTTTTCGGTTAAATAATTTCAAAATGTTATTTTTATTTACAGTGGCATTATTTAAAAAAGTATAATTGGTAAAATTCATAATGTAATTTAATAAACAAATTGTATAATGTGTTAATTACTAGTATTAACAATTCGGAGTTTAATAAAGAAAGACTGTTTTAAAGAATAATTGTAAACTTTTTCAAGAAATATTCGTAATACATTTTATTTACATAGTTTCTCGTAGTTCTAGAGTAATATAAATTTTATCCGATGACATCTTAGAGTGGAATTCAGGACTTGGTACGCTACATAAGTTAACAGAGATTGTTACGGATAACTCCTACAGGTGAAATGTAAATGTCACTACCCACTTCTCAAGCAACACCTCTTTGCATCTCATTACTTCTCCGTACACATCTATTTTCGTATGGAATATTAGTATTTTCTGAATAATATTTTCCTGTTCTAATATTCGCTCTTGTTGTTGGCGTGACAGTGCACCCAACCACATTTAAAATTTGATATTTTTATATGTACATTTTATGACTGTACCACTACTTGAGTGTATTGTTAATATGATAAATTAATATAACAATTATAACTTAATATAATGTGCGTATTTATCTTGTAATTTGTTGTAAATACTAAACAACATAAGTGTAATTTAGTTTTAGTGTTGTTCTATGGTTCCTATACAGATTGATTACAAATTGTAACTAACATAATTGTCAAAGGTAAATTATTTCACAGGATAAATGTTTTTTTTACAATGGGTTCGCCAATATAATACTTGTAACGTGAAGCTCTTTTTTACTAATGCTAGCTGTAATCTCATATATTTACATCACAAATTGTATATATATTTAAATATATATATATATATATATATATATATATATATATATATATATAATATATTTTAAATATATGAACATTAATGTAAAATTAGATACAATATAAGTAATACAAAAGATACTTTAACGTATATTTTACAACACATTTTTTAAATAATAACAAACAAAATGAATAAGTCTAGATAGGTTTCCTAAAGGATTTTAACTGGTATCTCATGAATACTGGAACTATTACTACAGACAAAAATTGAAAAACTGTCATATATATACAATTTCACTTATTTGTTAATTTGAAATTATTGCTTGCAAATGTCAGAAATTGTATCTAAAACCATTTATATAAATTGCCAAAATAACAAAACGTTTCTATCATTATAACATAATTTTCTCTTTAAATTGGCAATTATTGAACAGCAACGCCACCTGCTTTTTTGTGATGAATACCAATTGGAATTTACAATTTTAAATTATTGATACAATTTCCCAGTATCTTGTAAATCTTAAAATTCCTTAAGGAAAACTCAATGTTTTCTTTTAATGTTGATTGTAGTATAAGATGATTTTATAATTTATAAACTTTTATTTACTCACTCGCTTAAGAGCTATAGCATATTAATGCTTTAAAAATTGCATATTTTTCCAGATGTAAGCACTATTGTGTAATTAATTTCAAATGAAGCAATAAGGAACACTGCTTTTAGTGAATTAGTAGTGTTGAACGAAAAAAATACACAGCATGACATGCGTATGGTGGATATGAGTATAAATATTAAAAATACAATAAAAATGTGCAATTGTTCGTCGTCTATGACGATAATCAATTATCCTTGGTGTTCCACTAATTTTGGCGATGTATTGATTACACTAAAGTTTTATAACTGATCTTGGCATCATACAGTGATTTAAATTAAGGTGTTAAAATTAGTGAATTTAATTAATAGTTTCTTCCATCGCATATATGCAAAATGTTTTACTCATAATACCAATAAAAAGTGTATTTATTTTTTTAAACTAGTATTGAAGGATCTAATTTAAATAATATATCAATTGAAAATAATTTTATTACGTATGGGGGGCTTC
ACGCTTTACATGTGTACGTTACCTATGTTTCTTGTGTTGTTTATGGTGATCTATGAATAACCACAACTATTGAGTTATAGCAATCCAAATGTTTGTACACGTGCTGTTGTGAGTAGTGAGCCCAACTCCAACACATGATTACAAACATGATCATGTATACATCAACATTATGCAGCCTCTGTGATTTGTTTGTACGCTTATTGATTAAACTATACCTTTGACACAA\n>XM_021555190.2 PREDICTED: Lonchura striata domestica interferon regulatory factor 7 (IRF7), mRNA \nATAAAGGATCGGGAAGGAGACGGCCGCCCCCGCGCCAAGGGACGGCACGGCACGGCACGGCACGGCACGGCACGGCACGGCACGGCACGGCACGGCGCGGCGGCTCTGCGGACCGGCACCATGGCAGCACCGGAGAAGGAGGGGGAAGCGCAGAGGCTGCGGTTCGGACAGTGGCTGCTGGACGCCATCAACAGCGGGAGCTACCGGGGGCTGCGCTGGATGGACGCTGCCCACACCACCTTCCGCGTCCCCTGGAAGCACAACGCCAGGAAGGACATCACCAGCACTGACCTGGAGGTCTTCAAGGCCTGGGCAAAGGTCAGTGGGCGGTACGAGGAAGGCTCCGAGGATCCAGCCAAGTGGAAGACCAACTTCCGCTGTGCCCTGAGCAGCACCCACTTGTTCAAGCTGGAACAGGACCATTCCAAGCGTGGTGATGACCCCCACAAGGTTTTCTCCATTGTCTCAGCCACCCTCCAGGACAGCAAGGAGGGACATTCCTGCATCCCCAACCCTGTGGTGGACCAGCAGGCAGCACAACAGCAGCTGCAGCCGGAGATCCACCCCCAAGACATGGCCTCAGCCATTGCTGTCCCAGGAAACACCGACCCCACAGAGCTTCTGGAGCAGCTGCTGCAGCAGTGTGACATCTCTCCCAGCGACCTTGACTCGCTGGCCCCATCCTGGGTGCCTGCAGGTGGTTTCCCTGCCAGAGACACTCCCCACCAGGACATCGTACAACAGCCTCACCAGGACACCCTGCTCCAGCCTCACCAGGACACCCTGCTCCAGCCTTACTCAGACACCAGCCAAAACAGCTGCTTCCCTCCCACATTTCCACAATGGGTGCCCTCGGTGGAGCAGCCCACCTTGGGCACCTACCAACCAATCGGCCTCATGCCACCAGAGGAGACAGGGGCCATGCCACCGCCGTGCCAGCTGACGGAGGGCACGGTCCCCATGCAGTATGTGCCGGGTCGGACGTTGTTCGTGCCCGCCGCCAGCCCCGTGCCACAGCCACGGCTGCTGCTGGATCACACAGATGGCATTGTCTCCATCCTGGATGTCACCATCTACTACCGGGGGAAGGAGTTCCACCACGAGGTGGTTGGGGGCAGCCACTGCCTGCTGACGTACCAGCGCCCCAGCCTGCCGGGGGCCCCGTGCCCCGGGCACGTGGTGAGCTTCCCCAGCCCCGCCAGCCTGGCCGACGGCAAGCAGCGGCGCATCACCGAGGATCTGCTGGGCATCGCGAGGCTGCGGCTGGAGCAACGCGCCTACAAGGTCTTTGCCACCCGCCAGGAGAAGTGCAAGGTGTTCTGGGCCTTGTCCCAGCAGCTCGAGGGGGTTGAGGAGCCCCCATCCAACCTGCTCTGCCGAGACCAGGAAACACCCATCTTTGACTTCCATGAGTTTTGCACAGAGCTGAGGGACTTCCGCAACGGCCAAAGGCGGCGATCTCCCGACTTCACCATCTATCTCTGCTTTGGGCAGGCCTTCTCCAAGGCCAAGCCTAAGGAGTCCAAGCTCATCTTGGTGAAGCTGGTGCCCAAGTTCTGTGAGTACTACTACGAGCAGGTGCTGCAGGAGGGAGCCTCCTCCCTGGACAGCCGCACCATCAGCCTGCAGCTCTCCAACTCCTTCGACCTCATGGAGCTCATTGAGCAGTACA
ACATGCAGCTGGGCTGAGCCCACCTGCCCCGCTCCCCATGGCCCTGGCACAGGCAGCAGCACCAGTGGGCATCCAGGCTCTGCAAACCAGCACCCCCCAACCCAAGGACAACTTCAGTGACCAGTCCTGGAGCTCACACATTGCTTTTCCTCTCTGTCAGCTTCTAGTGTTGTGTTTTTGTGGAGGGTGGTAATTTACAGATTTATTTTCTTAACTTTTTCAAGCTAAAATACATATATATATGGGATCGTAGTTCTCTCTTGCCTGGAGATGTGCCTCTTCTATCAGTCTGAAATCTTCACCACCCCTTTCTACCCCCAAAACCACGGGGGTCCATGCCCAGCCTTGTCTCAGCAAAGTCCCTGCTGGCAGGGGTGGGCTGGTATCAGAGAGCTTTATTAGCACCTTCTTCTCCTTAAATTTGAGTGGATGAGGTGACTTCCCAGTGTGAAGGGATACATTTATCCATGCATTTATTTCCATGCATTAAGGCTGCAAACATGACTCGCAAGCAGAATGTGTTGAGGACAGCTTGGCTTGGGCTAAACAAAAGTAATTCTTCATTGAGCACTGCCCAGAGTTACTCACTGGAGATGTTCTGGAAAAATAAGGCAGTAAGTACAACACGAAACACCCAGACCACCAGCTCAGAGGTGCAGAGGGGGGTGGTATCTCAGGGAGGAGTGTGGAGACCAGAGGGCTGACTGAAGATGGGGTGTGCCCTCCCCAGGCTGCAAGCAACTGCACCCCCTCCTTTCAGGAGCCTGACCATCACTGTTGGTCCCTGGGCAAGGGGAGGAAGCAGTGTCCTTACCTGCCGAGTGACCTGGATGCTGCTGGGCCCAAAGGTGGTGGTCCCGTAGCTTGTCACGTAATAGTGAGCAGAGGGCTGTGCTGGGGGCTCCTCCAGTGGCCTGGGTACTGTGGGAATGGGACACCCTTAACCCCTCTGCTCCATGAAACCCTCAGCCCTCCTTCCTCTGAGCACAGCTGTGGCACAGACTCGGGACACCGGGCTCACCTTTGGGCAGGAGCAGCTCTGCACCAAAACAATGCCCACACGTCCCGCAAGTTTTAACGTCTTCCTTTGTCCTGTGGAGGAAAAAGCCCAGGAAAGAAGGAGCAGGAGCTGCTCTCAGCGCTCCCCATGGAATATGATGCCGAGGCCATGGAAGAGGCTTGCTCTTCCCACCCTGACCTGAGGGGCAGCTGTTGGTGGACAGCCGCTGCCCTCCCAGGTGCCTGAGCACCTTCAGCTCTTCATGAAACAGGGACATGTGGGCACATGTCCAGAGTGAACATTCTGTGCCTGAGCCCCAGAGTCTCAGCTTCTTCACTTTTCCCTCCATGCTCCAGTTTCCCACACCAGTAAGTGTTAACACCACTTGGGACAAGAGCTGCTATGGTTGGGAGAAGGGCACCGTAGTGCCTGGTGAGTTTCACAACTGATTTCACATGGCTTTTAAAAGCTAACCAGCTGCACCAGCATTGCAGTAGTGGCCACCCAGGTCCCACCCTCACTTGGAGGGCACAGTGTACGTACGTGGCACCTGTGCCATCCATGTCTGGCCAGAGGAACTCTGCGGGACAGCCGGACGTTCGGCAGGGAGCCTTCACACACACATGCAGCCCCGGCCACTCCTCAGCGAGCTTCTGGATGATGAGCACAACTGCCACAAGGAAGTCCCAGGCAAACTGGAACCCTTCCAGGCAAAAGGAGAATGTCTCTTTCTTACAGCCTCCAGCCACAGCAGCCCAGGAGATTCTGTTGTGACCCACACATAATTTCCAGCCCACAGCCTCAGCTGTCAGACCAGCTCCATCCCCAGTTAACCAAACTTCCATACGGAATTTAATGGTATGTTGGAAGAGCTCCCCAATTTGGGTGGCCCTTTTACTTATCAGTGGAAGACCCAGCCTTAGACTGTTCTCTGCTGGAGCCTTCTGGGGAAGGACGACCCATTTGCTTCATGACGAGAATGAAAACTTGGCTTTCCACT
TTCATGTGATACCTCTAGAGGAGTCCTGACCAGAATTCGATGGAGAAAGGGAAAACCTTTAAGTGGACTGCTGGTGGACCCAGGCCAGACTAGGACATGTGGCAAAGGCTTCCTGGGACACTTCCCATAGGGCTGGAAGTGGCAGGAGCAGAGCTAAGGCAAGACATGGGGTTGGGAGTAATGAAATATGGATCAGGGATCTTACCTGTCCTTTCTGATGGCTTTCTGCTGCGGAGCTCCAGGTAGCTGTAGGCCCTCTGGTTATTCTCTTTGATCAGCAGGGGTTTGCCATTGCATACAAGCAGGCAGGTCACCTTGGCCACCCAGTGCGTGGAATAGAAGGAGCAAGCTTTCACCAGCAACCTGCAAGGAGATTGTCCATGGCTTTCATCACTTTTCTCCTAGCTTATCCCTAATGCTGGAGAAACTGGATGGACTTGAAAATATGAACCAAGTTGCAGTAAGAACAGACACAAAATGAGGACCTTCCCCTGCTGAAAGCTCAAGTAGCAGGAGCAGCCTCTTAAACCAAGAGATCTTTCCAGAGTTGGCCATTTTGTCCTGGTTTTGTCTGGGATGGAGTTAATTTTCTTCCTAGTAGCTGGTACAATGCTGTGCTTTGGATTTAGGATGCGAATGATGTGGATAACACATCACTGATGTGTTAATTGCTGCTGAGCAGGGCTTACCTCAAGTCAAGGATTTTTCAGGTTCTTAGGCTGCCCTGCCAGTGAGGGGAATGGGAAGGGACAGCTGACCCCAAATGACCAAAGTGTTATCCCATACACAGTAGCATCATGCTCAGCACATAAACCTTGGGGACCATTGCTTGGGAACAGGCTGGGCATGAGTTGGTTAGTGCTGAGCAATTGGTTTTTATTTGTATCACCTGTTCTTCGGTTGTATTTCTCTCTTTGCTGATTTCCTTTTCATTACAATATTATTATTGCTATTACTGTTATTATTATAATTTATTTCAACTATTAAACTGTCCTTATCTCAACCCA\n>XM_037981260.1 PREDICTED: Kryptolebias marmoratus origin recognition complex, subunit 1 (orc1), transcript variant X4, mRNA 
\nCCCCCACACACACACACACACTGTCTGGTTTTGTTATTTCCTGCTTTGTTGGCGTTCCTGTTTGGTTCTCGATACGTAACACGTCAGAAAGAGCACAGGAACTGATGAAGAGACCCTGGTAGATTTTTCAATCTTTTATTATTAATTTTAAATTAGTGCAAATTCTTTACTCTGACTTTGAAAACAAGCTCCTTTTGTGACTTTATTTTGATTCCTGTTGACTTCAAAACACTTTTTGTTTCACCTTTAATCACTTGCACCATGTTCCCTGAAAGTTTAATAAAGACAGACAGACGGATAAAGAACTACTAACCTGGTTAAAAACCTGTTTTGCTGTGACGCTGTTGCGCTTCACCTTCCGGCCTGCAGGTGGCGCCAGACGCACCAATTAGCAAACCGGAAGTAATCAGCACAAGCAGAAGAAGAAATTTTCCCGCGAAACGCCGTCCCTCTGCCGTCTTCAAACGGCTCCAGTTAGTTTTCTGCGGGTTCTGGTTTGGAAATAAACGCGGATTTTCGATCAGAAGAAGACATTTTTTTTTTAATTTTCCGGGTCAGGTTAGCGAGGACCGGGATGAAATCTTTCGGCAGATTGAGAGTCAGGAGGTTTTATACATGGAGAGGAAATCCTCTGAGTTCCAACAGGAAGCTGCGGACACACGAATATGAGTCTTTGGCCATCAGGGTGGACGGGCTCCCGAGGACCACGGTCATCAGAACGGGTCAGCACATCCTCATTGAGGGCGACGACGACGACAACCCGTTCGCGGCCAAAGTCGTCCGGCTGTTTGGAGACGAGAGCGGGCAGCAGAAGAAGGCCGTGGTTCAGTGGTACGTTCGAGTTTCTGAAGTTCCTCCGAGCAAACTGAAGCTGCTGGGCAGAGACCCTCACCCCCGGGAGATCTTCTTCTACCAGGGAGGCAACTGCGACGACGAGGTCAACGCCGAGTCCATCATCAGACCCGTGCAGGTGAAACACCTGGATGCTGACGCTTCATTCCCCCCCTCTGATGATGGTGATGATGATGAGACGCTCTATGTGAAACTCGCCTGGGACTCGAAGGTCTTCAGGATCCTGGACTCGGCTCTGGTGGCGTCTCCTCCTCGCCATCCCAACCCCTCCCTCCCCCCGTCCCCCCCACGCTCCCCGCCTGCTGCCACCCCGGCCTCCAGGACCTCGAGTCGATGCACCCTGCCCACGCCAGACCCCACTGTGCTGCGCCGAGCCGCGCTGGGGGAAGTGAGACGCAGCCGAGCCGCAGCAAGCGCCGGTAAAAACCCCGCCGCCATGGAGGCGCTTCACTCAGAGACCAAACTGTCTGCGTCAAAATGCCTCAGCGCCAAGAGGAGGCATGGCACGGAGAGGACGCCAGGCGTCCGCAAGAAGCTGCAGCTCTGCAGTCCTGAGAAGACGGTGATGGTCAGAGAGGACGCCCTGACCCAGCTGCTGGACGAGGAGCTGGAGAAGGAGAGGACACTGGCTAAAAGGGTGCCATCCTCCCCCGCTCGGTCCCCCACCCTCACCCACAGACTCACCCCCCTCAGGAGGACCAACAAGAGCCTTGCCGCTCAGGACGCCGTGTCCCTGAAACCGTTCGTCATCACCTGCCGCAAAGTGCCCCTGAGTGAGGTGGAGTCTCCAACACCGACCAGAGACAACTCGAGCAGAGCTGCGACAACTCCTTGCACGAAAGAACCAAAACCTGTCAGAGAACCAGCTCTGGGTGATCTAGCTGAGGAAGAGGCCAAGAACTCCTCGCCGCCCAGGAGCTCCAAGAGGAAGTCGGCTCTGAAGGTGTCGTATCGCATCAGGAAGCAGCTGAACCTCATGGACGGCCAGCAGGACCTGAACTCTGACGAAGATGATGAAGACGAGTTTGTTCCGTCAAAGGAGCTGCAGAGCAGCAGCGAGGAAGAGGAGGCAGAGGTGGTGGTGAAGAAGAGCCGGGTGTCCTCAGCGGGGTCCCGCACGCCTCGTTCCTCGACCCGAACGCCGAG
GAAGACTCCGAGGAAGAACGCACCAGGAACGCCGCGGACCCCCCGGAATGCCACGCCCAGCATCCCCAGCAGGTCCCTGCCGGCCAGACGGCCTGCCAACGTTCTGGAAGAGGCCAGAACCAGGCTCCACGTGTCCTCGGTGCCCGAGTCTCTGCCCTGCAGGGAGCAGGAGTTCCAGGACATCTACAGCTTCGTGGAGAGCAAGATCACCGACGGCACCGGGGGGTGCATGTACATCTCAGGTGTGCCGGGAACAGGTAAGACGGCCACGGTGCACGAGGTGATGCGCTGCCTGCAGCACGCCGCCGACACGGACGAGATCCCGCCGTTCCACTTCATAGAGATCAACGGGATGAAGATGACGGATCCTCATCAGGCCTACGTTCAGATCCTGCAGAAACTGACGGGTCAGAAAGCGACGGCCGATCACGCCGCGGCGCTGCTGGAGAAACGATTCAGTAACCCGGCACCAAGGAAGGAAACCACCGTGCTGCTGGTGGACGAACTGGACCTGCTGTGGACGAGGAAGCAGAACGTGATGTACAACCTGTTCAACTGGCCCACATGCCGCCACGCCCGCCTGGTGGTTCTGACCATCGCCAACACCATGGACCTGCCCGAGAGGGTCATGATCAACAGGGTGGCCAGCAGGCTGGGTCTGACCCGGATGTCCTTCCAGCCCTACACCTTCAGGCAGCTGCAGCAGATCATCACGTCACGGCTGAACAAGGTGAAGGCCTTCGAGGAGGACGCGCTACAGCTAGTGTCCAGAAAGGTGAAGCCCGCCCCCTCACCCGTCCCACAGCTCTTGCCCTGTGTCGGATCGCTCAGTTCTCTCCTCCGACAGGTGGCGGCTCTGTCGGGCGACGCTCGGCGGTGTTTGGACATCTGTCGGCGAGCGACAGAGATCTGCGAGCTGTCTGCTGCAGGGCTGGTGGGGATGAGTCACGTGATGGAGGCGCTGGATGAGATGTTCTCCTCAGCTTACATCACTGCCATCAAGTGTGCGTCGACGCAGGAGCAGCTCTTCCTGCGAGCCGTCATCGCTGAGTTTAGACGGCTGGGGTTGGAGGAGGCCACCTTCCAGCAGGTGTTTGTGCAGCACCAGGCTCTGTGTCGGGTGGAGGGTCTGCAGCCCGTCGGCGTGTCGGAGGGCCTGGCCATGTGTCAGCGTCTGGGAGGCTGCAGGCTGCTGCTGCTGGAGTCCAGCCGCCTGGGAGTCCTGCAGAGAGTCCGGCTCAACGTCAGCCAGGACGACGTCCTGTACGCCCTGAAGGCCGACTGACGAAGGAGAGTCAGCTCGGGTCCTGACGGAGGCAGAACACTTTACATACTGAGACCTAATGTGTTTACTGCAGATTTTCTTTTTTTGTTTTGTTTTGTGGGAGACTCTGTGACGTCCCCGGTTTTACCTGGACTGTCAGGTTTTACTGCTCTCATGGTTCTTTTATTGTTGACTTTTATATTTTTATGTTTCACTATTTGAATATAGAATAAAACAGTTTTAATATAAAGAAAATTCCTTTTCCCTCATCCATAAGCTGTGAAGCATTCACACGTTCCTAAGA\n>XM_018492714.1 PREDICTED: Trachymyrmex septentrionalis FAD synthase-like (LOC108752090), transcript variant X3, mRNA 
\nTGATATTGTCACGAAATTTGAAGATATTACTGAGGATGATAGAAAACTACTAGTAGATCAATATGAATATTTTAGTACAATGGACATTACACTAAAGTATGATAATTGGCGTCGTGATGTGATATTAAAATCAATTCTCCCAGAAGATATTGAAGTTCCTACAGCGTACAGTTTAGTAGGACATATTGTACAGTTGAATTTACGTGATGTACATTTGCCATACAAATCTATTATTGGTCAGATATTTCTCGATAAGACTGCGAATGCACGAACAGTAGTAAATAAAATAGATACAATTAATACATCGTTTCGATATTTTGCTATGGAAATCCTAGCAGGTGAAAGAAATACAATAACATCTGCAAAAGAACATGGTTGTACATATCAGTTTGACTTTGCGCAAGTGTACTGGAATCCACGTTTATCTACTGAACATTCACGAATTATAACATTTATGACCGAAGGTGATATTCTATATGATGTATTTGCAGGAGTAGGACCCTTTGCAATTCCTGCCGCACGTAAAAAAGTCCAAGTATTTGCTAATGACTTAAATCCTGAATCTTACAAATGGCTTCAAAAAAACGCTCTTATTAACAAGAACAATATGTCGCAACAAATACGTCATTTTTATACAGCAAGTTTGATAGTTGTAGGAGATGAAATTTTACGTGGACAAATAATTGATACCAATACATCATATCTGGCACAAAATTTAACTGCTGCTGGAATAAAACTACAGAAAGTTATAATGGTCTCTGATATCGTGGATGATATTGCTAAAGAAATACGCAATACATCAAAGGAGTATTCTGTTGTATTTACATCTGGTGGTGTTGGACCTACTCATGATGATGTAACTTATGAGGCTGTAGCAAAGGCTTTTGAACTAAAACTTGAATTAAATCAGAAATTATTTGATATATACACTCGAATGATTCCTAATCAGGCCGAAATAAAACGACTTGCTATTGTTCCCAATGCATGCAAGATTATCAACATTGATTCAGAGGCTTTTCCAATAATAAATATAAAAAATGTTTACGTGTTACCTGGTTCCCCAAAGTACTTTAAGCCTGCTGCAGATACAATAATTTCTCGTTTGAAAGGAAGCACGCCATTTCACTTTGAACATATAGATATTGCATTGAATGAACTATCAATAGTAAACATTTTAGATAAACAAGCAAAACGATGGGATGGTAAAATAAAAATTGGTAGTTATCCTCAATATGAATTGCAAACATCTTTTACGAGAATCACTTTAGAAGGACCTGAAGAAACAATTGCAGAACGATTGCTAGGATGGAACGTCCCTACTGAGGAACTGATTCATATACCAGAACATTGGCTGATCTATCCTGAACCCAATCCTTCTCTTCACTATTTACTAGCCATTCTATACATAATTTTCACCTTTGTAGCGTTACTCGGAAATGGACTTGTTATCTGGATATTTTGCTCAGCCAAATCGTTAAGAACATCTTCAAATTTGTTTGTGGTGAATTTGGCATTTTGCGATTTCTTCATGATGCTCAAGGCACCGATATTTATATATAATTCCTTTAATACCGGATTTGCTACTGGTCATTTAGGATGTCAAATCTTTGCCTTTATGGGTTCGCTTAGTGGAATTGGAGCTGGTATGACAAATGCTGCTATAGCGTATGACAGATACAGTGTTATAGCTCGACCACTTGATGGGAAACTATCTCGCGGTCAAGTGATACTCTTTATTGTACTTATCTGGGCGTACACAATTCCATGGGCCTTGATGCCAATAATGCATGTCTGGGGTCGATTTGTGCCTGAAGGTTTCTTGACAAGCTGCACTTTCGATTATTTGACAGATAGTCCAGAAATAAAATATTTTGTGGCCACGATATTTACCTTCTCTTATTGTATACCAATGTTACTCATCATATATTATTATAGTCACATTGTCAGCCACGTTATTGATCACGAGAAAGCTCTTCGTGAACAAGCAAAGAAGATGAA
TGTCGAAAGTTTGAGAAGCAATGTCGGTGCAAATACTCAAACTATGGAAATACGTATAGCTAAGGCTGCAATAACAGTATGCTTCCTCTTTGTTCTCTCGTGGACTCCATACGGAGTTCTCGCGATGATCGGTGCTTTTGGAGATAAGACATTATTAACTCCTGGTATCACAATGATACCGGCATGCACATGTAAATTTGTGGCCTGTTTGGATCCATATGTATATGCCATAAGTCACCCAAGATACAGACTAGAACTGCAAAAACGATTACCATGGTTAGAATTGCAAGAAAAATCTGTGGACACGCAGGGTTCTACATCCGAAGTAGTGAATATGCCATCATCTTAAATCTTGTTTAATTTTATCTTAAACAGTAACTATTTAATTATGAATGATCAATTGCTATAGTCATCATTAAGATTATGTTCTTTATTACTGCAGTAATAAAATGATTGCGTAGTCTATATCAATGTAGTTACAAGTAATTGTAAATATATAAATGTGAATAATGTAAGCTCTTAATAAATACAATATTGTTCAATCTTCCTATTCTTTGTTACGATCATGTTTATTGCTAATGTGTGATACTTCTTATCTGTTACATAAAAGACAATATTGACATCAGGCGTGTAATTGTA\n>XR_002250031.1 PREDICTED: Pseudomyrmex gracilis uncharacterized LOC109852741 (LOC109852741), ncRNA \nCAAAAACATTTTGAACTATTTCGATTTATCCGCGTCGAAAAGTTCGTTCCACGTCGCGACACGACGTATCTCGTGATAAACTTTCGATCGTAAAGTGTATTTTCGCGAAATCGTGCCTCGGATTGTGTAAATTGTATATTTTGTGCTAGTGATATCGTAGTGACAATTCAGAAATATTGGGCAAAATTTTTATCTTTATCACACAGGTCCTCGTTAGAAAACGGTCAACCGTCGATGCAAGAATATAGAACGAGAATGCCCGCATGGAATTCCCTGAATCTCGCAACTATGCACGCGCAATACTGTGAGTGTCACCTATATGCCGGAGAATGCGATTACATTTGTGAAAAAGGAAAACCTCTATTTTCGAGGCCAATACACGCGAGGGGCGTGTAATTCGTCGTGTAAGCACGTC\n>XM_050446992.1 PREDICTED: Anthonomus grandis grandis uncharacterized LOC126740808 (LOC126740808), mRNA 
\nACTATTGTTGCTATAAGGGGATTCTACAAAGAATTGTTTATTGTTATAAGATTTAAAAAAAAGCGCACTCTTGCGGCGCGAACTTGTAGTACATTAAAACTGTTGACAGCTGTCAATTAATATTGACAGTTTGTTTTTTCAGTAAAATTTAAAAGCAGTTTCACAATTTCTGTGATTAAAAGTGACGTGTTTTGATCAATTATAAGCCGGGACAATGAGTAAGAGCCACAAAACGAAGCATCACGAAGATCCCAGTCTGATCCCCACTTTTATGAGCGATGAAATGCACGCGGGGGCCAGGAAAATGAAAGCGGGTCCTTCGGCTGTAGCTTCGATGTTATATCCACATGCCGCGACTTCTATTACTACCACAACCGGTGTAAGGAAGAAAGAAGAAGATTTAGCGAATAACGACGAGTTGACCGATGACGACATGGAACGTAAAATGGATGGTACATTACGCAAGGGACCCCCGAAAGAAAACATTCAGGTGGATGGGAAAATTAGCATCCTTACAAAAATTGAAGGTAGGAGAGAAGCCCTCTGTTGCAAATACAACGAGGAGTACGACTATATCGCAGTGGGTTACGCTGACGGGGTGATCGTCATGTACCAAAGTTCCACGGGCGAACCAGTTTTCACTTTAACAGACGCGGACGTGAGGGAGAACAGGGCGCCAGTTACCTCGATCAAGCATCGACCTGTATCGAAAATTTACCCCATTACCAACTGTTACACCGGGACCTATGCGAACGGTTGCGTTAAATGCTGGTCCTACAATTTCAACCAGTGCCTCTATACCATCAGGGAGAAGCGACAAACTTTCGGGATCGCGTATCATCCGCGATTCCCGAAATTCGTTACGTTTGGGGACGATATGAAGGTTTATTTTTATGACGAGGAAACGAAGACGCAGGAGAGGGTGCTATCGTCCAGTGATAATCCTGATACGCACGACGGTCACATGTCCAGGGTATTCGCCGCGTGTTTCCACCCGAAAAACAATTACGAACTTTTAACGGGTGGTTGGGACGATGTCGTTCAGTTTTGGGATCTGAGACAACCGCATGCGGCCAGGCACATTTCGGGGGTTCACATGTGCGGAGAGGGCCTCGATATTAGTCAGAAAGGGACTGAGGTGTTGACTTGCTCCTGGCAAAAAGAGGATCCTTTGCAAGTGTTTGATTATAATACGACCAAAAGGATGTACTGTTTAGAACCGGACATTTATAACACTAAGCTGTATTGCGGTAAATATGCCACCAAAGATTTTGTGGTGTGTGCAGGATCCGATCCGAACCTTATACGTGTGGTGGACTTGCAAACGACTGCAACTTCGGCATTTATAAACCAATTACCGGGAGCCATTTACAGTTTGGATATCGGTCCGACGAAAGCGAAAAAAGAAGCAAAGTTGGAAAAGTACAGCGTTAAAAACGACATAACGAACGTACCGAAAATGGTCTTCGTATCTGGTAAGAGACTTTACCAGATCGATTTTTGTTAATTTAACAACGAATAAAACGCATGTGTTGAAACAAGAAAA\n>XM_028067949.1 PREDICTED: Vigna unguiculata protein IQ-DOMAIN 14-like (LOC114181480), transcript variant X1, mRNA 
\nCTTATTTATTCATTAAATTTCTTGAAGTTTCGTTGTTCCCTCCTTGCATGTTCCATGGACAAGGTTTTTGTCATATATAGCAGATTTTCACGAGCTTTTGACAGAGTATTTTCTTTTGTTTTGTCTCCTTTCAGATAAAATCATCACATAGTAACATAGTTGAACTGTTTCTTGCAGTGAGGGCAGCAATGGGGAGAGCCACAAGGTGGATGAAGAGTTTGTTTGGGATTTCAAGAGAGAGAGAGAAGAAACAAAACATCATAGAATCTGGTTTTTCTGAGAGTACTAATAATTCAAGAGTTTTGTGTCACAACCCAGGAACTATACCTCCCAACATTTCTCAAGCTGAGGCAGCTTGGTTACAGTCATTCTACACAGAGAAGGACAAAAACAAGCACGCCATTGCGGTTGCTGCGGCCACCGCAGCTGCGGCTGATGCTGCCGTGGCGGCAGCACAGGCCGCCGTGGCAGTTGTTAGACTCACAAGCCAAGGAAGGGGTGGCACCATGTTTGGCGTTGGACCTGAGATATGGGCTGCTATCAAGATTCAAGCAGTGTTCAGAGGATACCTGGCAAGGAAGGCACTGAGGGCATTAAAAGGATTGGTGAAGTTGCAGGCACTTGTCAGAGGGTATTTAGTGAGGAAGCAAGCAACAGCAACACTGCATAGTATGCAGGCTCTTATTAGAGCTCAAGCTAGAGTACGGTCCCACCAATCTCGCAGGCTCATGAGTACGAAGAATGAAGCATTTAGATCTCAAAATAGAGCAAGAAGATCCATGGAGAGGTTTGATGATACTAGGAGTGAGTATGCAGTTCCAATCCACAGTAGACGAGCATCATCGTCTTTTGATGCTACACTTAACATCAACAACAGTGTTGATGGGAGCCCCAAAATAGTGGAAGTAGACACTTTCAGGCCTAAGTCAAGATCAAGAAGGACAATATCAGATTTTGGTGACGAGCCATCACTTCAGGCACTTTCATCTCCCTTCTTTGCAATTTCATATAGAGGTACCCCTACCCCTACCCCTACCCCTACACGTTGGTCCATACCAGATCAAAGGAATTTTCAGGACTCTGAATGGGGGTTAACAGGGGAAGAATGTCGGTTCTCTACAGCACAAAGCACTCCACGCTTCACAAATCCTTGTAGTTGTGACTCAGTTGCACCTATGACACCACAAAGTGGGTGTCCTGATGATAACTTGTTTCTAAGGCAATATGGGAAATTTCCAAACTACATGGCTAGTACTCAGTCTTTTAAGGCCAAGTTGAGGTCTCATAGTGCTCCAAAGCAACGACCTGAACCTAGTCCAAGGAAAAGGCTCTCCCTCAATGAAATGATGGAGTCTAGGAGCAGCTTGAGTGGTGTTAGAATGCAGAGGTCTTGCTCAAAGGCTCAAGAAGTCATTAGTTTCAAGAATGCTGTGATGGGAAAGCTTCAGAAATCCACAGAATCTGTTAGGGAAACAGACAGAAACTATTTCCATCAGAGAGGGTGGTGACATGCTGAACTTGTTAGGACAGATATCTAGCTATCTTTGTTCTTTAAACTGTTAAAGTGTTAATAAAATATATTTCTCCCCCAGTTTGGTAATTTGCAGATACATATAGGTGGTGAGTGTGGGAATGTGAAGACAAAATAGAAGGCAAAGATAGAGAGAGAGAGAGATGCCTCTCATTGTTTTGTGAAAAGTTTGGCTTTGGAATTTTGATATATCATCTCTCTGTAGTCTATTCAAATGCAAGGATTTTAACTT\n>XM_043209237.1 PREDICTED: Drosophila ficusphila oxysterol-binding protein-related protein 8 (LOC108093331), transcript variant X2, mRNA 
\nAAAAACAGAAAATAACACGAAAGCTTGTTTCGCCTTTTCACTTCCAGCGTCTTCGGCCGCGTCATGAAAATAATACTCGCCGCCTGTTCGATGGGTGGACGGTCGGTTGGGGGAGGGTGGTGACGTCGCCAGCGCTGGTGGATGAGCTCATACGAAAGCGAAAAGAAACAAGTTTAGCTTTTTGGAATACGGACGACTGCAGCCTCAGTTCATTCGAACGCCGAACGCCAGCGACGCCGGACCGTTAAAACGAGAGAGCAAGAGAGCCGCGAAACAAAAAACGAAAACCGAAAAAAGCTATCTATAAAGTCTTTGCAAAAAGCCCAAAATTGTTGTGCAAAAAAGCGAGGAAGGCTGAGACTCTTGAGCGGCTAAAACAAAATCAATAATTGGCCCTGCGTCCAGCGCTATATGTGTGTGTGTGTGCGTGTGAGAGGGGGAGTGTGTACGTGTATTTGTGAGAACGACAATTGGAGCAATGCCTGCTGATTGATACGAAAAAAAGGGGGAAACCAATTACAAAAGAACCACAGAAGCGAAGGATTATAATAACTATTTTGTGCAATAATTAAGTGATCAAAACCATGCAACCCGCAACGCCCGGAACGCCTGTTAATAATGCTCCCTCGACGACTAATTCATCGGCCACCCCTGCCGCTCCCGCCGCCCCTGCTGGCGGGGGGGTTAGCAGCACTCCAATACGCATAAACAGTGCCAAGCAGCACGGGGCGGGGGGCGGTGACTCGCTGGCCCCCTCCACCCCGCACTCCCATTCGATGCCTGGAACGCCGCAACAACAATCGAGCAGTGTGCCCACGGGAAGTCAACTGCTGCATCTCCAGGCGCCGCTGCCCTCGGCTGGGGGAGGCGGGGGAGGATCAGTGACCCCCTCTGGCCTGTCCATGGGCGCCTCGAATCAATCGCTGGGCGTTAGTGTTGGCGCCGCCAGCAGCGTCAGTGGTATCAGCATAACGCCGCCGAATAGCGCCGGATTGCGTCAGTCGACAGTATTCGATTTCAAATTCAAACGGCGACCTTCGCTAAAAGTGCTCATGACCAAACTTCCGTCCACGGACAGTTTGAGTAACAGTCCGGCGCCGTCATCGCCAGGAATCGCCAATTGGGCCTCAGACAATCGGGATGGCAATCTGGCAGATAAGTCTGCTGCTGATGCCGCCAAACTTAATAGGAAGGAGTCCTACAAGGCGCAAAGGAAAAACTACAGGCGGGAGAAAAAGCGAGTGGCCAGTGAGCTGATGAACTCGCTGCAGGATCCTGCGGTTATTGTGCTGGCCGATTGGCTGAAGGTTCGAGGAACCCTAAAATCCTGGACAAAACTCTGGTGTGTTTTGAAACCGGGCCTGTTGCTTATTTACAAGAGCCAAAAGACAAAGAGCAGTCACTGGGTGGGCACGGTGATGCTCACCTCCTGCCAGGTGATCGAGCGTCCCAGTAAAAAGGATGGCTTCTGCTTCAAGCTTTTCCATCCCCTGGAGCAGTCCATTTGGGCACCGAGGGGTCCAGACAAGGAAACCATTGGTGCCGTTGTCCAACCGCTACCAACCGCCTACCTGATCTTCCGAGCTCCCAGCCAGGCGGCCGGCAAGTGCTGGATGGACGCCTTGGAGCTGTCCCTGAGATGTTCGGCCCTCCTGTTGCGTTCCAATAGCAGCACGGGAGCTGCTCCTTCGTCCAGCTACGTGGGTGAACCGCTGCCCGTCTCCCACGAGACGCAATGGTCGGAGGCGGACTACGAGAAGCACTTCAACGATCACGATCTAGACGCAGACAGCCAGAATGAAGCACCCAATGCCGTCATGTCTGGTCTGGAATCAGAATCGGAATCGGATCCGGCTGAGCCGGCGCAGGAAGATGGCGTCGAGCAGCCTTGTGAGGAGACGTCGTATGTGCCCTTCACCGAGGAGGAGTTTGGCGAGCAAGGGGAGCAGGTAGAGGAGTTGGCAGAGGAGAACAAGAGCCTAATTTGGTGCATTGTCA
AGCAGGTGCGACCGGGAATGGATCTGAGCAAGGTAGTGCTGCCCACTTTCATCCTGGAGCCGCGTTCATTCCTGGACAAGCTATCAGACTCGTACTACCACGCGGACTTGCTCTCCAAGGCCGTGCAAGAGGATGATGCTTTTACGCGCATGAAGCTTGTCGTGCAATGGTACCTGTCCAGTTTTTACAAGAAGCCCAAGGGCCTGAAGAAGCCCTACAATCCGATTCTGGGCGAGCGATTCCGCTGCTATTGGCAGCACCCCAGCGGCAGCCGGACCTTCTACATCGCGGAACAGGTCTCGCACCATCCGCCCGTCTCGGCGTTCTACGTGACGAACCGCGAGGACGGCTTCAGTATCACCTGCTCCATCCTGGCGAAATCGAAGTTCTACGGCAACAGCACTTCGGCGGTGCTCGAGGGCGCTGCCACGATGACGTTGCTGCCGCGCGGTGAGTGCTATACGGCGACCACGCCTTATGCCCACTGCAAGGGCATACTGATGGGCACGCTCTCCATGGAGCTGGGCGGCAAGATAAACATCGAGTGCGAGAACACCGGTTACAGGACGGAGCTGGAATTCAAGCTGAAGCCGTTCCTCGGCGGCGCCGATGCCACCAATGTGGTCGTGGGCAAGATCAAGCTGGGCAAGGAGACCCTGGCCACCATCAACGGGCACTGGGACAAGGAGTGCCGCGTGAAGGACTCGAAGACGGGGGAGGAGACGTTGCTATTCAAGGTGGACGCCGAGACGCGTTCCAAGCGGCTCACCAGATACCTGGTGCCGCTGGAAGCGCAGGAGCCCAACGAATCGCAACGTATGTGGCAGCACGTCTCCGAGGCGATTGCGCGCGAGGATCAGGTGGCCGCCACCGAGGAGAAGACCGTGCTGGAGGAGCGACAGCGGGCGGAGGCCAAGACGCGGGCCAGCACCGATTCCATTCACATGCCGGAACTCTTCGAGCTGGACAGCTACGGCCAGTGGCTGTACAAGTACGCCGATCTGCGGCCCTGGGACTCGCGCAACGATGTCCGCCAGTACGAGTGCCAGTTCAAGGTGCTCACCCAGACGCGACACAAGTCGGTGCCCATTGTCCACGGCGCCGAGATGATCCATCCCCTGCGCAGCTCCTTGGAGACGCTCTCCCGCACCCAAAGACAAGCAGGACAGGCCATATCGCCGGGCGGCTCCGCGGTGCCCAAGGCCAAGAACAAGAGCCTGGTGTTGGCACCGCGCGATACCAACTCAGACTCCAGCCAGTCGCCGCAGGGAGCGGTCAAGCGCAGCTCCTCCAGCATTAAGCAACTCGCCTTGGCAGTGGACCAGGTGAACCGCGTGCTGGAGGTCCACACCCGGCAGCTGAACGAGATCAGCCAGCGCCTGGAGCGCATGCAGTATTCGCCTCCGGCTAGCAACATGAGCGTGCAATCGCATCATTTGCTGGGCGGCGGCGTTTCGCAATCGACGGTGATCAAGTCGCTGATCTACGCTCTGATCGGGCTGACCTTTAGCCTGATCCTGCGATGGCTGTTCAAGTAGACAGGCGGAGTCCGTCGTTGTTGATGTCATTTCTTTTAGGCCTAAGAAAACTTTTGGTCAACCTATAGATAACAAACATATATATAAACACCCTAGAGTACAGACAACGTATATGCTTTACTGAATTGTACATTTGGTCCTACTCAAATGCCTTCGCACGCTGCCAGAGATTCAAACCCGACCGAGGCGCGTGACCAGAACATCCGTTGTGAGAAAGTCTAATCACGAACTATGTATAAGATTAAGTGTTTGTCGTATGTAAGTCCCAACAATCCAAGTCTCTCCCGCAGACAACGTCCATGTGCAAGTCTCTTCACCATTGTATCCCTCTAAATTCTTTACTCAAGCTAGACCCGTTGGGTAGGTTAGGATGTCGGATATATATATTTAAATATACACATACGTACGAGTAGATGCACCAGATTTCGTAAAAATTCCAATTAAACCGATTATAGTTCGCTT
TTCCGTTTCCTTCTATATACTGTTATTGTTAATGACACGACTTAGGGTGGAAAATGAGGATAATATGCTCGAGAGGCTTCCTGCCCTTTAAATCACCACTTATAGACATACCTTAGAGATTTAACGCGAAAAGTGCTTATAATAACTAATTTTAGTATCTCTTATACACAAATTGTTTTTCCTTTTTTTCCCAATACCTGCAAACCTTAAAACTTAATAAACTTCCCTTTTTCAAATCTA\n>XM_007369094.1 Dichomitus squalens LYAD-421 SS1 uncharacterized protein (DICSQDRAFT_149347), partial mRNA \nATGTCGCTCCAGGTCAACCTCTCAGGCAGGGAGCTCGCCCAGGCGTACCAAGATGTCATCAATGCCCGCGGCATAGATTGGGCGATCTTCACCTACGACAAAGGATCCAACGATCTCAAGGTGCAAGCAACCGGAGATGGAGGTCTCGAGGAGCTTCAGGAGGAGTTCTCGGACGGCCGGATGCAGTACGCCTTTGCTCGCGTCAAAGATCCAAACAGTGAACTCCCTAAGTTCGTGCAGATCAACTGGTGCGGTGACGGTGTGCCCGTCGCGAGGAAGGGTCTCTTCCATACCCATTCAAGTGCTGTCGCCAACTTCCTCCGCGGTACCCATGTTGTTATCAGCGCTCGCAATGAGGCCGACGTAGAGCCATCCTTCATCATGTCCCGTGTCAAGGCTGCGTCCGGAGTCAACTATACGGCTCAGAAAGAAGCACCGCGCAAGTTCGAGCCTATCACCCCCGTTGGTACGAACTATGTCCCTGTAGGCAGACCTGACATGGCCGCCATTCGTCAAGGCCCTGCCAAACCACCACCGGCACCCGCCGCAGCGAAGCCAGCTATCCCAACTGCCGCACGTCCTGTCCCAATGGCTCCCTCGCCTGCTGCAGGATTAGGGAAAGCTCCCGTGGCTAGCAAGGCCCCTGCGGACGCATGGCCGGACGAGTCCAATAGCTTCGCGCCGCCCCCACCTCCGCCTGCTGCTTCACGCCCGACTCCTGCGGCGAGCTTCGCCAAACCTGCCCCTGCAGCTTCTCCAGCAGCAGCGCGGTTCTCTCCCACCGTTACAACTCCAGTTGCCGCTTCAAACGTCCCCACGAAGCCTGCTGAAGAGGACAAGATCGGTCCAGTGGGTACCGCGTATACCCCAATCAAGCTTCAGCCCAAGAAGCTCGTCAATCCGTTCGCCGCGATGGAGGCGAAGAACCAAACTGAAACTACTGCGCCAAGGTCTTCGCCTGCTGGTAGTGCCAAGAAGTTGACTTGGAGCGAGCGCCAGGCCCTCGCGAAAAAGCAACAGGAAGAGGAGGAAGCTCGCGCGAAATCTGCATTCGGCTCTCAGCCTACTCCTCCGCCTACCTCCGCGTTCCGTACTGGTGGGAGTATTCCAGAGCCAGAGGAGGAATTCGAGGCGCCTCCTCCGCCCCCGCCACCTCCCGCGATTGCCAGTGCGAGCCGTCCTATTCCTGTTCCGGAGCCCGAATCTCAAGCAGAGGCTCCTCCGCCACCTCCCCCGCCCCTGCCCCCGCCACCGCCACCGCCCCCTGCTCCTACGGTATATCACGAGCCAGAACCTGCGAGGGAGGCCCCTCCACCCCCACCGCCTCCGCCACCACCTCCACCGCCGCCCGGGCCTGCAGCACCAGTCGCTCCGCCGGCTCCCCCTACACCCGAGCCCCAGCCCCAGCCCCAGTCCGAACACGCTCCAGACGCAACTGCGCATTCGGGTCAAGGCATCTGCGCTATTGTGCAGTATTCATATGAGGCTCTCGAGGATAACGAGATGGACCTCGTCGAGGGCGAGCTCATCGAGCAGATCGAGCAGCTAGATGAAGGATGGTGGTCCGGCGTTGGTGCGAACGGGACGAAGCAGGGCCTCTTTCCGGCGAACTATGTCGAGATCATCGAAGCTCAGGAAGCTCAGGCTGC
TACCCCCCCTCCGCCGTCGCCTCCCCCTCCCCCGCCCGCTCCTCCTGCCCCGCCTCCACCTCCCGTTGCTGCCCAGCCGGAGCCGGAGCCCGCGCCCGAGGAAGATCTTGGGTCGTGGGCAATCGCGCTCTACGATTACGAAGCGGGCGAGGATAACGAGATTTCGTTCAAGGAGGGTGATAGAATCACGCATATTGAGGCTGTGTCGGATGACTGGTGGCAAGGTACCGAGCCTAACGGCAATGTCGGCTTGTTCCCCGCGAACTACGTCGAACTTCAAGCTTGA\n>XM_039761524.1 PREDICTED: Polypterus senegalus RAB, member of RAS oncogene family-like 2 (rabl2), mRNA \nTAGAGTGATCTGAATTACGTGCATACATTTTTATACCGCTGAAGATGTGCAATGCTTTTACTGGACATTTTTATATAATTATTTTTTCTTCCCGATTGCTAACATTGGCATATGTGAATGATAAAACAAAAAACGCCGGCTTTTGGTATGGCTATTGCCGGAAGTAGACAGCACAGTGGCGCAGGCAGACGAATAGACAACCTACATTTTCCTGTTGAGGGTCCTTTTTTAGCGTCGGTTGCGTAGAAACTGCTGTTGTAAATTTTTGAAGCACTTTCTCAATAACGAAGTATCGCTCAGGCTACATCGATAATTAACCGAGTCGTGGTTAATAGGAGTCCAGTCAAACGGCGCTGCTTTGTATTTTTGTTCAACTGAACAACTTCTAACTGATAATCTTGTATAAAGAGTCGCGACGGTGGAGCAATTTGGCGAATGATGAATGGAAGGGATTTGGTTATCTCTGATGATTAATTAAAACGGAGCAAAAAGAAAAGCCTAACCGGAGAAGTCGAAGGCGGTAGTGGATGAAGGGGCTGTGTGCCCGTATTTAGTTTACCGTAGATGTTCGCTGCTTGCTCCTAAGGTCGGGATCGCGTTTTTACCTCCGCAAAGCCAAAAGATGGCCGAGAATGCTGCTGGTTTTTCCGATCTGAATCAAGATAAGTATGACAAAGATGAGCTTAAAATCATCTGTTTGGGCGACAGCGCTGTTGGAAAATCAAAGTTGATGGAGAGATTCCTCATGCAAGTGTATCATTCCAAAGACCTGTCTACCTACGCACTCACACTTTACAAATATCCAACAACTGTGGATGGAAAAACTATCTTAGTAGATTTTTGGGATACTGCTGGACAGGAGAAATTTCAGAGTATGCATCCTTCTTACTACCACAAAGCTCATGCCTGCATTATGGTTTTTGACATTCAGAGAAAAATAACCTATAAAAATCTTGGCAACTGGTACAAGGAATTAAGGGAGTATCGCCCAGAAATCCCATGCATATTAGTTGCAAATAAAATCGATGCTGACATGAAGGTAACCCAGAAAAACTTCAGTTTTGCTAAAAAGCACGGACTTCCCTTCTATTTTGTTTCTGCTGCAGATGGCACAAATGTAGTTAAGCTGTTCAGAGATGCAATCAAACTGGCATTATCTTATAAGCTAAATTCCTGTGATTTCATGGATGAAGTCATGCGCGAATTAGAGAACTTTGACATGGACAAGAAAGATGACTACTCAGATAAAGAAGATGACAGTTTAAAGGAAGACAACATCAAAAAGACATGACCTACCCTGGTCTTCATAAAATGATTTGGGTTTTAAGCGGAATAGTATCTTATTTTATTTTCCTGACCGTCTTTGAAAGGAGAATCTGTTTGACTGCTGAAAACACACCAGTGAGAAATATACATTACCTAAAATATCTGACCATGATAAACTCTATTCAAATTCAGATTTGTCCCACCAGAAAAAAAACATTGTACTGTGCAGACTCCTATTGTTCCACTTTATGAATTTGAGTCCTGTCAATTGATTTTGTTGCTTTATTTAAAACTGTGAATATTACTGCCACAGCCAAAAGGT\n>XM_051965029.1 
PREDICTED: Antechinus flavipes proline rich and Gla domain 4 (LOC127540371), mRNA \nTGAGCCCGCCGCCAGCACCCCGCAGCCAGCGCTCGCGTCCGGTGCCGGGGCAGCCGTCGCAGCAGCAGGTTTCTCCCGGGAGCGCGGCTGAGCGGTGCCGGCTGGCTGACCCGGAATCAGGAGCCCAGGCGCTCAGCCTCCGCCGACCCCGCTGACTTAGAAAGAAGTCGGGGCAAAATCCGGGATCCACCCCGGGCCTGGGAGAGACCGGACGGCCGCTCCGGAGCATGTGCCAGCTGCTCCAGATGCCAGACTATGTTTAAACTTTTGGTTCTGCTCAGCACTTTGCCTGCTATTACTGTTGCGTTTCCTCCCTGCCTAAGAAGTCCCCAGGAGTCTACACATGCTGGAAAAGACGTCTTTACATCAAAAAAAGAAGCCAGCATCTTCATCCATAGACGTCTCCTCCACAATAGATTTGACTTGGAACTCTTCACTCCTGGAGATCTAGAAAGAGAGTGTCATGAGGAACTGTGCAACTATGAGGAAGCCAGGGAGATCTTTGGGGATGACGACAAAACGATGGCATTTTGGAAGGATTATTCAGTTCGAGGACCAAGCACAAGATCAGATGGTGAGAGAGAGAAGATCGATGTTATGGGACTTCTGACTGGATTAATTGCAGCTGGAGTGTTCTTGGTTATCACTGGATTACTTGGTTATTATTTCTGCATCACCAAGTGCACAAGAAGAAGACAGCCATGTTCCTCAGCTGTCTATGTAAGAACGGGTCGACACCATCCAACTATTATTTTTAGAAGACATGAGGAATCTGCCTTAACCCCGTCACCTCTTCCCCCAGAGGATTCAGGACTGCCTTCTTACGAACAAGCTGTGGCACTGACTGGAAAATATGATGTTCCGCCTCCTCCATATCCTGGGCCAGCAAGAGGGTTTAAGGTGTTTAAAAAGTCTATGTCACTACCTTCTCACTAAATCCAATGTCAATATGAGAAATGGATGTTTATTCAAAGAAGGAGCCATGATTCAGTTCTCCAGTAGCTTAAAAGGCTGGCCATTCCATTCCTGTAAAGGTATTAAGATGCCTGGTCTTTTGCTCCAGATAGTTGGACTTTTACTCTGACATCAGAATAATGAGGGAATCGGTTTCATTTTGTGTGGGTATGTGTATGTAGGTAGGAGGCGAGCCCTGATTTAAATTTAGGAGTATCCAGATCATTAGCCCTAATCAGCTAAATTAGGCAAAAGATTACTAATTACTGAAGGAAAAGCCACATATCCACTATAGCAGAAAGGGTTCTAGATTGATTATGTTGAGAACTGAATTAATGTTAATACAAGACTTTTTTTGTTTCGAGTCATCTTGAGTCAAGATACTATATTTTATCCCTGTTTATTTTAATTCTCCAGCAAAAGAAACCTTGTGAAAAAATTTTAAATCGCATGATGAATCAGTGGTCTTTAAAACATAAAAGGAATCCTAATGCTTATTGTATATAAAATAGCATATGATATTCCGTACAGGTATTTGTACTTAAAAGATTATGTCCAGTTGTACAATGGTGGGAAAATACCTTCATTTTTCTTTTGATTCAATGGCTGCTGCCATTAGAACTTGGGGGTCAGAGGTACAGTGAGACAAAGTTGCAGATTATAGTTCTAATTCTTTCCTATCACCAAAAGTGTTTCTAGAACCTAGAATCTCTAGATTCTGTATGAATCTGCCCGTCCCATGAGGAAATAGATGAATTCCGTCTGTATAATTATATGTTTGGTTCATATGAGATTACTCAGGTTGGAAGTTTTATTCTAGCTTATAACTAATAGTTTAATCAGGAAAGGATAATTTATTTATTCTCTTATTATCTATGTATAGTGGTTAAAGATGTATATGACCCTTTGCATCTCTGGGATATGTTTTCTCAGACATTAAAGCACACTTAAAATGATCACTC
AA\n>XM_019516974.1 PREDICTED: Gavialis gangeticus B double prime 1, subunit of RNA polymerase III transcription initiation factor IIIB (BDP1), transcript variant X7, mRNA \nACAAGTTTGTTCTACATGGTATTTCATGACACTTTTTTAATTGTTTGTAGAAATGAAAGGGTGGGTAGTGCAAGTGATGCTGGAGAAGCCATTAAACCTGCAGATGGACCCTTGCAGAGGAGAAAAAGAATATCCACTCTGCCTAACTTGGCAAAACCCAGAGTTACGGCTCTAACTGCACAACGGTTGGTATCAAAGCCTGCTCAAAAACAAGTACCTCAATCTGTCAGTGGCAACACTTCACGGAAGGAATCCTCTGCATCAGATAAGACCAATAGTGAAAGCTCTCCAAAGTCTCCCAATCTGCCTGAAAAGAAAACACCTGTCCCACAAGTGCCACAGTTTTCCCCACTTAAAAAATCAAGAAGCAAAGAGCCAAATGCCAGTATAATTGCTCATAAAAATGATGAAACTCTGCAGAAGAGCACGCTCTCCCCTCTCAAGGAGAGACCTACCCAAGGAAGATCAAAAGAAGATGAAATGTCGCATGCAAAATCTACTCCAGCAAAAGAAAAAAAAAGGTGCTCAGATCGTGAAAGGATCCTTAAAGCCCAGAAGCTGAGAGAGATGCTCAAAGAAGAGCTGAGGAAAGAAAAACTGAAACATGGGAAATCCAGACAGAAGGTGGCTGAAGGTTTCACTGCAGCAGATCGTTCCAAAATGACCATGAGAGACTTGATATACTTCCTGCCACAAAACAATCCCATGAAGTCTTCACTAATAGACGAAAAAACTTCTGCATCAAGCCAAATGAAAGAATCAGAAGAGAAGAGTGCTCCTGTTCATGAAGATGAAGAGGAAGTTGCTCAGGCAGAGGATGAGGAGGAGAATCACGATGATAAGCTTCTAGTTCCTCGAGTGAAAGTGGCAGAAGATGGCTCAATTATTCTGGATGAAGAAAGTTTAACAGTGGAAGTTTTAAGGACTAAAGGGCCAAGTGTTGTAGAAGACAATGATCCTATTTTTGAGCGTGGCTCTACAACTACCTATTCTAGTTTTAGGAAAAGCTTTTACACCAAGCCATGGTCAAATAAAGAAACTGATATGTTCTTCCTGGCCATCAGCATGGTAGGAACAGACTTCTCCCTGATTGGTCAGCTGTTTCCTCACAGAGCAAGATCAGAAATTAAGAACAAGTTTAAACGTGAGGAAAAAACAAATGGATGGAGGATAGACAAAGCCTTCAAGGAAAAGCGGCCATTTGACTTTGAATTCTTTGCACAGCTGCTTGGGAAAGTTCTAGCAGATGAGGAAAAGAGGAAACAAAAGGTGATTAGAAGTCAAAGATCAAAAGAAAAGAAGCCACAAAAAGCTCGGAAAAAGCAAAAAGTAGCTCACGCTGAGAATGAAAAAGCTGCTAATGAACAAGATCAAGAGGATGTCGGAATTTCTGATGCAGAAACTGAAGTGGATGCTGTGACAGCTGAGAAGGAGAATGAAGAATCTTTGAATGTTTCTGAACCAGCAGAAGGGCAGCTCCTGTCAGAGCCAGGGGTAACCAAAAAGAAAAGAAAACAGAAGAAAAGAAATTCTGAAAAGGAACTTCAGAAACTTGCTGATGCAGAAACAGGAGTTGATGCTGTGACAGCTGAGAGAGACAATGAAGAAACTGTAAATATTTCTGAACCAGTGGACGAACAGATTGCATCTGAGCTAGTGGTACCAAAAAAGAAAAGAAAGCAGAAGAAGAAAAATCTTGAAAAGGAACTTGAAAATCTTTCTGATGTGGAAACAGGAGTTAATACTTTGATAGCTGAAAAAGAGAACGAGGATTCTTTGAATCCTTCTGAGCTGACAGAAGAACAGATCACATCGGAGCCTATGGT
AAAAAGGAAAAGAAAAGAAAAGAAGAAGAATTCTGATCAGGGCATGGAGACTCTTGCGAAAGAGACAGCAGTTATTTTGAAACCAGCTAAGGGAGAAAAATCCAGCAGGAAACAAAAAAATACATCTGGCACAAACAGTGATGATTCTACTGAATGCAGGGAGGAACTGGGTATTCATAATGAAGAAATGTTTTGTGAGACTCCTGTTCAAGTGGAGCAAGTCTTCGATTCCTCCTTACAACTGAATGATGAAAATGAGGAAGATAGTGATTTTGATTTACACAGCTTTCAAGATAGTAATAATGTAACAGAAGCAGAACCTGTTGAACCAGAAATCACCAGTGAGTCTCAGGAATGGCAGCTTTCAAAATCTCAAGTTTTGGTTAACAGAAACCAAGGAAGTAGTGATCAAACCACTGAATCAAAGAACAATGAAGTATTTGACTTATGTGAGCCAGGTGACAAGGAGAGTGCAGCAGGAAGAGGCTGTGATACAAAGTCCGAAACAATGGAATCTGAAAAAGCTGTTGCTGGGAAATCAGGAGTGAGAGGACGTTTGCAGAGACCTAAGCCCAACTTAGCAAGAGGATCTGGAAAGAGAGAAGGAGCAGTGCAAGAAAAATCAGAGGTCAGGGCTCCCCCTCCAGAGCTTATGGAAGGAGCAGAAAAGGATTCTGTGGACGATAGTGAAGGCAAGATGTTGGAAGTTGCCAGAGATGAAACCACAGGAAGAGAGAACAAAGACTCGGAGACTGAAGCTCAAGAGACTGAGAAAGTTGTTACTGGAAGGACAGCAGTGAGAGGGCGTCAGCAGAGATTTAAACCTAACCTGGTAGGAGCTTCTGGAAAGAAGAATGAGCCTCTTCAGGCAGAAAGAGAAGATAAAACTCTTCATTCAGAGACTGATGGAAAAACAGAAGAAAAGAATAGTAACCAAGGTAACAAATCTGATGTTCCCAGAGTGGAAACAACAAAAAAAGATGGTAGAGTCTCAGGGACTGAATCTCAGTCTGAAGAAACTGCTCAGTCACAAGAAGATGGCAAACAGAGTGTACTCAAACCAGCACCACTAATGAGGAGTCGAATGCAGAGGCCAAAACCAAATGTGGAGAGGGCAGCTGTGAGACAGGGAACACTGATACTGCAGACAGATCTTGGAAAGGCAAAAACTGATTGTGGTGAAGCAGTGGAGAAAGATTTGATACACTGTGAAGACAAAACAGGCGGTTCACTTCTCACTGCATCTGATGCCATCCAGGCACACTTGGAAGTATTAGAGAAGGAAGCTGCTGCAAATCCTGAGAAGTTGGCTTCCACACATGAAAACCCGCATTCCCTGAAAGAGTCCTTAGAATCTGAGAGCTGTGAACAAGTAAAAACAATTCCTGGAGGTGATTTGAAAACTGGTTCCGATTCTGATACAGGAGATTCAGGTTCTCAAAAACAAGAAAGAAAAGATAAGCCAGCACAACTATTAAGGGGTCAATTTCAAAGGCCAAAGCCTAATTTAGGAAGGTCAGCTGGAAAAAGGGAAGTGTCAGGAGCAGATAAAGATGTATCTGATGACAACACTGATAAAGAAGAAAAAAGTTTGCAGTCTGACTGTGAATGCAGCTTGCTTCCTGACCTAGACAAAACAGCGAAATGTGATGTCCTGCCTTTAGGAAAGAACGACCTTGCTGACTCTCGGGAGGTATCTGTAATACCATTAGTTAATCAGTCCCCAAAGAAGCTGTCAGGATCTGAGAGTGATGAACCCAGCAGATCTTCTCCACCTGCAGATAACGAGGAAATTGCTGCACCTGTTGCTGTAGGGCTTTACAATAAAAATATCCCTCAAGAACAAAGTAAACCAAGCTCTCTTCAACCAGCCCAGTTAGTGAGAGGCAGATTCCAGAGGCCCAGGCCAAATATAGGAAGAGGAGTTGGGAGGAAAGAAACACGACCAATGGAAAAAAATGAATCTGAAGTTGAGCAATCAATACAGCATAAACATGAAT
CTTCCAGTAGCTCATTGACCACAGTAAAGGGTGAAAATGAAGTCATATGTTCTGAACCTTCAGAAAAATTGTTGGATTGTGAAAAACAGACAGAACAAGAAGAATCTCAAGTGCCCAGTATTTTACAAAATGTGTCAAATGAACAAAGCAGCATTAAAAAATCCAGTTCTCTAGAAAATAAACCAGGTGCCATCAGACCAGCACAGCTTATGAGGCATCGGTTCCGGGGGACTAGACCAAGCATAAGAAGGCTGTCTAGCAAGACAGGAGAACTATCAGCAGAAAAGAATACTGCTCCAGTTGAGAGAGAAGCAGGACAAATGGAAGCGAGTCTTCTGGAACATGAAGATTGTAGTGTTAGTTTTTCTACCAAAGCTGAAGTGGAGACACTGACTGTCCTGGAGGATTTGTCCAGAAAAGATGATCCGGATTTCAGTGCTGTCACGTCTTCTCCGAAAAAAATCATTCGATCAGAAGAAGTTTCTTCCTCTGAGAAATCATTGAAATGCAATAGTCAGAGAAATGAAGTGGGCTGTGTGTCAACAGAAGTTGTGGAAAGCCTTCCAGATAATTCTGAAGGGTCGAGTGATAAATTTACTTCTGAAGAAGAAAGCAAGCCAAGTAAGAGAGAACCTTCACAGTTACGGAAAGGCCATCTACAGAGGCCTAAGCCAAATCTAGTGAAAGCAACTAGAAGGAGAGAAGTGCCAGATGAGGGAGAAAGCACAACTGAGGATAAGTGTGATGCCGGAAATGCAGATGAGGATCTCATTCTGTGTGGGAGTAGCAAATCAGAAAAATTAAATGTTTTAGTGCATGGCTCTGCTAAGTTAGCAGATGCAGCGTCACCTTCAGAGGTTTCAAGAAAAAATATTTCTGAGGAATTGACCCATAAAAGAAGCAGGCAATTCAGAAAATTCCAATCTCTGGAGAGATCGTCAGAGAGTGAAAGTCAAATAGAACAAGATGATTCTCAGCCCTCTGCTGCTGAAGAGAAGACTTCAGACAAGCTGACAAGAAGGCGGCGGAGAAGATCATCCAAACAAATAGCCCTGCCGAAACGAATCTCTGAGCTAAGAGCAGCTACTTCATTTTCATCTGAATTTGAGGCGGATCATTCTGAAAAGGGGAAATGGTGTCGGAAGTTCAAACCAAATGTCACCAGAGGCAGAGGCTCAAAACCTGCTCGCAGCAAGAAATCTGGGAAAGACCATAGGAGTTCCAAGGTAACCTTGGTGACTCTCAGGGCTTCACAGGAAGAGGATGAAGATGAGGCAGATGACTTTGAACCGGATGATGAAGATGAGTGTTTTGCTCCAGAAGAAGTAAATAAAGCTCCAGTGTTTGTTCCTGTAGGTCTTCGATCTCCAAAACCTGTTCCTGTCCAGATTGAGGAAACCATGGAAGAGCTTGAAATTTCTGTGAATGTTCCAGATGTGCCATGTGTCACAACTGCTGAATCTGTGTCTCCTGATTTAAATGTACCTGTCCAAGCTGGGATACAAAGTAGTGAAAATTCGAATATCATACAAATTGTGGGAGTGACTACATATGAAAATCCAGAGACAGACACAGGGGCTAATGATGGAAGTACAGAAGCTGCCATGACCTTACTTGCAATGGGAGATCCAATGTTCCAGTTAAAAATAAGCGCTCAAGGACGGACACAAGTATTGCCTGAGCAAGATGAGCGGGATGTGGCTGATAGCTTTGTAAATCAACCTTATGCAGAGCACAGTGCAGTTCTTAGCGAGCATTCACTTCCTTCACCTGCTGCTAATAACAAACTGGTTCCACTGGAGGATGGAAATAAAATCATTCTAGAGGACCAAAGCACTGGAACGGGAATAGGTGGAGAAGACTATGCCAATGAAAATGCTGGACACAGCAGTGATCATTCTGTCCCTAAAGCTTGTAACACAAGATTGACAAGATGCCTTTTGCCAAGGCCTAAACCAAATGTTGGAATATTGGAAAGAAATGGGGATGCTTGTCAGAAA
TCTTACAGTCCAGAAATAGTTGTGGAACAATTGGTGCAAGTTGAAAGTGAGGACAAAACTCTAAGTGACAGTGCAGAAGAGGAGGTGGTGGAACAGAAGATCCGATCAAGTGAGAATAGTCCTTCCAGTCCAGATGATACTGCAGCCAGAAGCACAGACCTTGTCAAACAAGGAGACAAAGACGAGAGAACAGAAAAAGAGATGAGAGAAACTTGGGAAGCTCTGGGAGAGGTAAAAGCTCTCATCACATCTCCAGAGACAGAGTCTTGTCAACCTGGGCTGGGGAATGATCCTGGTCAAAGTTTTACATTTGGGTTTCGTGAAGGAACTTCCTGTGATGCTGAGAACAACTTATATGCAGTTGAATTACTTCAGACTGAGGCAAGTGCTCACAAACTTGATCATCAGTCCTTAACCAGCTCAAAGGAGACTTCAGCAGTAAGTGGTTGCGACAATGAATATCAACCAGACCTGGAAGAACAAACATTTATTTTAACTCTGGTGGAAATCCCAACTGACTCTAAAGAATACAGTGATGGGTCTGTTTCACTTGGACATACCTCAGAACCATTGCTGCCAGCCCCAATAATACTCAGTCCAGTCAATACAGATGGGGCAAAAACGGTGGGAAAGCAGAGCATTGGATCCCTGACACCCATAGTTGGTGAAGTTCTTGCTCCATCCTTAGACAACTGTACAGAAATTGAAGGACCACAAAGAACTTTAACAGAGCCATTTCTTAATTTGGAGTCAACGCCTCGGAAAAGGCGTGCTACTGATACTGAAGATAGCAATGTTCCTCCTGCCAAGAGGAGTCCAGCAACTTCAACAGAAGATAAGCTGGAATCTTCAGTTAAATCGATACACGCTCCAACAGAAGTTGCTGGAAAACTTTTGGAAAACTTGAGGTCTTTGAAGAAGAAAAATGTATCTACCTCAGCGTCTTTGTCTACATCTGCAGATTGGCAACTAGAACAAGGAGGCCAACATAAATCTTTGCAGAATGTAGAAACTTTACCACTTGAAGATAAATCAGCATGCAAATATTTAAATGAAGGGGGATCTGGAATATGCCCTGAGATAAAAATAGGAGCCAGTGAGCAAGGACTATCTGTGGAGGTTCATGAACCTGAACAGTCAGGACATGCTGGAACTATAGCAGCCCCATCAAAAACCCTATTAGTCAGGCCTGGGCGAAAACCTCTGGGATTTTTATCCTTAATTTGCAAAAAGAGTAGCCCTGATGTTGGAGAAGACAGTAAAGGGAACAAAGAGAAATTCCAAAAACCTCAAATACCTGCCTCAAAGCGAAGCCTGAAAAGGTCTGCTCCATCCACAGAGGACAAGAGGCAGACTCTAGAGCCATGTTCCCTTCCTTCTACAAGCACATCATTTGCTGAAGGAGAGAATACAGCAGCTACTGTAGTAAAGTTCAGTGCATCTTCAAGGGTTTTAGACTTCAGATCCTAGGTTTGATATCTGGGCTGTGGTTTGGCAGTTGTCTGCAAAGATGTGGACCTGATAGACCCTCTGTCTTGCTGCACAGAAGCAGAGAACTACATCCATGCATCACACCCTCAGAATCTCAGC\n>XM_006020837.2 PREDICTED: Alligator sinensis neuronal differentiation 6 (NEUROD6), transcript variant X5, mRNA 
\nAGGTTGACAACCCTTAGGACCTTTCATAATATAAATCTTAATACATAAATTCCTATGGAGAGTAATGGGGTTTTAACCTTTGTTCTATTATACGGATTATACTATTCCATATAGAATGTAATAAATGTAATGAATAGTGCAGAACTTGCTCTCTCTAGCATTAGCCTCTTAACTTTTAAAATCTTGGCCACTTCAAAAACGTTTATCTTTAAAAAGAGGCCCAACCTAGATAAAGTACTAATGACCTTCAGCTTCTCATTGCAATAAGAAAATAAAGGTTGTGTGTTAATTGAGCTAAAGTGTCTAAAGTTCATGTACACCTAGACACACACCTGCCCACATGCACACACATGTGCACACACACATGCAATTTTGCTGTCTCCTCCTCTACAAAAAAAAGCCCAACCCGGATTTAAACAAAACTTTGAGAAAACAAAAATAATTGGATTGGGGACGAGAATATTAATGCCAAGCTTGGGCCCAATGTGAATTAAAGCAGATGAGTTATAAACCCTTCAAAAACAGGATTTATAATGGAAATGCTGACAAAGACCCATAACAATAGCAGCTCTGCCAGGGATTACTTTAATACTAAAACCGTATTCAATCTCACTTTTTAAAACAGAGATTACGGAGTCACTAAAAAGCTACAATACGTGACAATAGTAAAAGAAAACTTTAAATATTTTTCTATCTTTGACACTGCATTCTCACTTTAACTCTTGCTAATATATTGCTTGCGCCTGACATTTCACTCCTAAATAAAATAAAAAAGCACAAGGTGGAGTTTACCACAGGCTCCAAAGCAAGGCTTAGCTGAAAGGCTTTGTCAGCTTCATTTAACAGTTTCTTGTCTTGTTGATGAGAGAGACAAAAGGGTTAAGGCAGAAAGAACAGATAGTGCAAGAGAGACAGCTGACCGGGGAAGAGAAAATGACACTAGAAAAACAGAATGAAGAAAGGAGAAGAAAAAGAAGCAGTTGGAAAATGGATATGCAGCTAAATATTTCAAATCTCATCTACATTTTTAAAACAGAAAAGACCTTTTAATTTTTAAGGAAAAGGTTTAAGAGAAGGCAAGACACCTAGAAAGAAAAGTAAGGGGAAATTTTTCCGATTCTCACAAGTTATTAAGAAGGGCTGCACAGGAAGCAATGGGTGAAAAGTGAGTGTATACATCTATCTTGCAAAGCACTCGTTTCTAATGTCAGAACACGTTTATATTCTTGAAGCCTTCTAGTTTTCATCTAATGTCTTTTCTTTTTTTTTCCAGGGATATTACAAAAAGTCACTGATGAAAAGAATTTGAGTTTTTCTTCTATAGACTCCAGCAGGATGCTTTCTTCTATTATTTTGAGATCTGGAATAGCACACAACCCTTTAAACACATGCACACACAAAGATTGCTCACGAAAGTATCACCCAAGTATTATGCCCTCTTACACATAAAGCTAACCCTGTGTAGGTGTGCCCTAGTGCCTTCATTACTTTCTGATTTCTGGTTTCCTTTCACGGCTTTTTTTCTGGGTACCCAGATGCACAGATTGGGACCCTGTTCAATGCAACACAACACTTTAAATAAAGACTGCAATATTAACAACTACGGAGCAGTTGTACCTGCAGGTAGGGATAAAACTGAATGTTGGCATGTCTGACAATATAGACTGACTGCTAAACAGAAGCAGCTCCAGTAGAAATGTACCTACTGTATGTGAAATGCTGGTGCAGATTTTTTTTCTCTCTATCACTCTAACCTTCTGTGTTGATACATGAATGCTGGTACCCACTTACAGGGATGCCAGATGATCAGTGCAGAATGTAGGTCCCAGGAGAAAGGATCACATGGTTTTCTCTGCCTTGTGACGTCACTAGCAGATGGCATGGGTACCAGCTCTGGCAGTTGGCATCAATGTCACTTTTTAGAGATCAATGAGATAGTGCAGATATACACAGATCTAGACTCCAGGAGACGATGCGACATTCAGACTGAAAAGATTT
GGAAGGCAAAAAATGAAAACTGATTGTTGAATGAAATAAAAAGCTAAGGTAACGTAAGATTATAGAACCATGTTAACACTACCGTTTGATGAGTCTGTTGTAATGCCAGAATCCCAGATGTGCAGAAAGTTTTCCAGAGAAAGTGAGGACCAAAAGCAAATTAAAAATCCAGAAAGCTTTTCAAAGCAGATTGTACTCCGAGGAAAGAATATCAAAAGGGCCGCTGGTGAAGACACAGAAAAAGAAGAGGAGGAAGAAGACAGAGAGGAGGAGGATGAGAATGGTTTACCTAGAAGGAGGGGCCTTAGGAAAAAAAAGACAAGCAAGATAAGAATGGAGAGGATCAAATTCAGGCGACAAGAAGCCAATGCTAGAGAAAGGAACAGGATGCATGGCCTTAATGATGCTCTGGACAATTTAAGGAAAGTGGTCCCTTGTTATTCTAAAACACAAAAACTGTCTAAAATAGAAACATTGAGATTAGCCAAAAACTATATTTGGGCTCTTTCTGAAATCCTGCGAATTGGCAAGAGACCTGACTTACTCACATTCGTCCAAAACCTGTGCAAAGGTCTGTCCCAGCCAACTACAAACTTGGTGGCGGGGTGCCTGCAGCTGAATGCTAGAAGTTTCTTGATGGGTCAAACCGGTGAAACTGCCCATCACACAAGGTCACCATATTCCAGCTTCTATCCTCCCTACCACAGCCCTGAGCTCAGCACTCCCCCAGGGCATGGAACTCTGGACAACTCCAAGTCTATGAAACCCTACAATTACTGCAGTGCTTATGAGTCCTTCTATGAAAGCACTTCCCCTGAGTGTGCCAGCCCACAGTTTGAAGGTCCCTTAAGTCCTCCCCCAATTAACTATAATGGGATATTTTCCCTGAAGCAAGAAGAAGGCTTGGACTATGGCAAAAATTACAATTATGGCATGCATTACTGTGCAGTGCCACCCAGGGGTCCCCTTGGGCAGAGCTCCATGTTCAGGTTGCCTACAGAGAGTCACTTCCCTTACGACTTACATCTGCGCAGCCAGTCTCTCACCATGCAAGATGAATTAAATGCAGTTTTTCATAATTAATGAGGAAAATGAAAATAAACAGTGGTCATTCACCTCCCCATCTAATTAAGATAAAGCAGATGCTTGTGCACTACGTAATTGGCACAACTCTAGTTAGCGTGTTTACTAGTTTCTAAAGTGTGATTCAACTATTGTGGGAATTTTCTATGTACTAATAAATCTTTTTTCCTATAAGTATTTTTCCTTTTTTTTTTTTGTCTGTAAACACTGTGAGATTCTGTTTCTTACCAGAGAATTTCCCCCACCCCCTGCCTTTTTTTCCCTATTCGCTTGATTTGTTGAACAGTGTGTCTAAACAATATCATTGAAATAAAGGCATACACACTGTATAAAGTCAATGTCTATTTTGATTGTACAATTTGTAATTATACAAATGCATGTTATTACATTCAGATGAATAAAAATAATGTATTTATAATGAGTAGAAATTATATATTATGTATTTAAGAAATGGATTTTAAAAATTCTGAAGAATTTTAAAAATCTATCCCTGAATTGAGATGGGCTTGTGGGTGTAGGGGTTGGGGGACAGCAATATTTAAAGCTATGCAAAAATAAAAAAAATTTTGGAGGATGGGAGGCCTGTAAGATTAAAAAAGAGGTGATCACCACTGACTGTTTGCTGACAGGGGCTAAATAATGTTAGACAATGTTGTCAAAATTTCACATCAGTTATTCTAAACCTAATCATACAACAGTATCAGCACCTTTTTGTATTATTCTGATTTCAGATGTAAAGGTTTGTTATAACAATGTATAACTGTGGTTTCGCACTACATATTTTAAATGCAATTAAACAGAGATGTTTCCACTTTTAAAGTATATCTCTTAGCTGTGA\n>KM473888.1 Uncultured bacterium clone 2010ECS-StA#2600 16S ribosomal RNA 
gene, partial sequence \nGGACCCGCACAAGTAGTGGAGCATGTGGTTTAATTCGAAGATACGCGCAGAACCTTACCAACACTTGACATGTTCGTCGCGACTTTAAGAGATTAAAGTTTTCGGTTCGGCCGGACGAAACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGTTAAGTCCCGCAACGAGCGCAACCCCTATTACTAGTTGCCAGCACGTTATGGTGGGGACTCTAGTGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTATGTGTAGGGCTACACACGTGCTACAATGGACGGTACAGAGGGTCGCCAACCCGCGAGGGGGAG\n>XR_005569779.1 PREDICTED: Styela clava uncharacterized LOC120344705 (LOC120344705), ncRNA \nGCAAAAGCACTCTTAAAATAGCCCCGAAAATTTTGTAATGGTAAAGTATAGGAAGAATTTTCTGGGGGTTAAAGGCGGGGAAAGGTCCATAGAGAAATTCTCATTCGGCAAGATAGGCAGGAGCCCAAGGGACCCAAGCCTTATGGGACACGGTAATGGACATAACGATCATTTCAATATTATTTTGTTGAACACGGAGTGGACAAAGCGATGGTTTTGGCGTTATTGGACACGTAGTGGACATAACAATCGTTTTGTTGTTCTTTGACACGTTTTGAAGAAATCGCTTTTCTTTTTGATTACTGGATCAATTGCTTCGGTTGCCAATTTTCAGTGGTTAAAGATAGAATTTTTCTCCAGAAGGCTATTATTTTTATTCATTTCAAAATTTTCTGTGGACTTCAAGAGATTCGTTTTTTTTAAGTAATGGCATACTGCCCCTTGCAGTGCCGATACATGGATGCGCCAGCGAGGTGGATCTTCGTCTTTGGGCTTCTACACTTCATCCGAATTCTGAATCTGATAACGGACAAGACAACAACGACTGGAAGGTTAGATTTATAACAACAACTAACTTCACTGGAAGAATCTTGGAGGAGGTGAAGTGGAGGCTTCGTCCGAGCGCTGAGCATCGGCGGGAGTGAAGGAAGATCCTACTTCGTCTACATGTCACAACCAGATCTGCCTAGTTTCACAGCGATCTATGCTTGGACACCGGACCTCGCGGCTCGTGCGAATTGGTGATCACAAGAAAAATAGCGGCACACGTTTTTTATTTCGAACATTTCAGGAAGGCTTTGCTACGCTTGAGCGCCGAAGGATTCGTCATGGTTTTGCTATTGAAGCAAGGGAACAAGCTTCATTCTTGTGTTTTGGTATAATTTGTGAAGGATTTTATTATCATGAACAATTAAAAAGTCCGTTGAGTTAGGAATTTACCACTTTTAAATTCATTTTGGAATTCAAATATGGAGAATTTGAAGAGCTTTATTTCTACGTAGGAAACATCAAGCAAACAGCAAGAATTGGATTGGATTACTTCGTCATTGCAAAACGTTCCACAACATCACAATAAAACATCTTACATCATTCAATTGTTTTACTTGGGCATAACACAAGTGCATCCTGTAGAATTCATCACCGTCTCTCTAATCCAGCGTCTCTTTTTCCGAAAATATACTTGAACCGGGGCCTTAACTTGGACACTTGCTAGACTTAAATTTTCTTGGCGAGTTGCCGGATCTATGCATCCCTTGCAGAGACATTTTGCGCTTAAAATTACCCTCGGGCGTCTGTAAAATGTAATTTGTTTTAAATAAAATAACATTTGATTGTGACTCCTGTATTTGCTATCGGTGATGTTTCACTAATTTAATAAA\n>XM_047271736.1 PREDICTED: Hydra vulgaris uncharacterized LOC124808573 (LOC124808573), mRNA 
\nATGTTAAAGTTCCAAACTGAAGATGAAGATGATGACCTACCTATAGTTTCGCAAAAGATTGAAGTTAAAGAAAAAGAGATAGTTCCTAGTTTAACACTGAAGTTAAGCAGAGTAAAAAAACCATTTGAATATGATGATGAGGATGACATACCAAAGTTATGCAAATCCTCAAGTAAACTAAAAAGTTTAAACTTAGATTCTGTGGCATTAAATTCAAGTAAAGTAGTTGATGATGACAATAGGGAAAAGTGTAAATGCATTGATAAGTTAAGGAAAATTGGTGATGATGGAGTTTCGTTTCGAGAGATGACAAATAAACAATTTCAATATGCTTTGTTTATGGACTTGCAGAAAAATTTTCGGCAAATCCAAGAATCACAAGCACAAATCCTTGATAAGCTTAAAATAATTAAACAAAGTGGAGATATTGATTTTGATGTGAATGTTGATGATATTGGTAGAGACCCTATTAATTCGATTGAGCAATTTGATGTAATGGAAAATATTTTAAATACAAGTTCTAATGCAAGAAAACGCAAGGTAAACCATAAAATATAGTAACAAGGTCAGTAATCTTTGCAAACCT\n>XR_769696.1 PREDICTED: Tarenaya hassleriana uncharacterized LOC104800274 (LOC104800274), ncRNA \nGCGGGCGGCGCCTCCTTCTCCTCGCCTTTGCGTCGCCTCGTGGATACCGGAGAATTCAAAGTCCCAGAGAATTTCCGTGTTCCTGGAAAGCCATTGTTGTTTCTCGAGCTTGCGAATCTGATGAATAGAAAAAAGTTCATGTGGATTCGGAATTTCACGGCTCATTCCGAATGTGTTGCACCGAGTGATGGAGGATGTCCCTTGTCCAATTCACCAACTATAATCTACTTGAACTGGACATGTTCATGAAGTGGACTTCGCTGCTGGAGATAGCACGATACCAAGCCCTCTGTTATTGTAATGGATGCTTTAAAATGAATCAAGCACTGAGTGTTTGTGTTTCTGCTCTTTCATCAGATATCCATCTGGTATTGTTGATTTGTTGTTCTTGCAGATTCTTATTTGGACCAGTGTTGTCAAATGGCGGCCATGGCCCCGCCATGGCGGGATGGCCTGGCGGATTTCAAGGTAGACGCCATGGTATTTGTATAGCGTGGCGTGTATGGCGTTTTCGCCATTGCGTGCGCCACATGGGGTTTTCCATTGTGGGTTATGGCGGCCATAGCCCCGCCATGGCGGAATTGCGTATTAAAAGGGAAAGTAAAGTCCAGAAAAAAAAAAAGGAAAACACAAAAATGGGAGATATCGAAGCGTCGGTCGAATAGTTTAAGATTTTGGAAATAGAAAAA\n>XM_033481735.1 PREDICTED: Megalopta genalis pericentrin-like (LOC117226934), transcript variant X11, mRNA 
\nGGCCTATAGATACAATACCACACTGTACATAGCTATTCGTATTTTTATAAATCGACAACGGTCAAACGTTTATCGAATCGGTGGACGGTTTGAGACACATGCTTTGAAATGTAATGGATGACGATTCTGCCACTGGATGTTATACAATTAATTATTAACATCGTCTATTGTTGGTCGATTATTAAACGATCGTCGATTTGATTTTATTAATGAAATGAGCAAAGTAACGGACGATGATGAACGTAGAAGACGCTCTTTGGAAGCAGGCAGAGAAATGCTGGAGAAATACAAGGCGGAAAGAATTAATAAAGCCAAAGGCCCGGGTCATAGTCAAACAGACGATGCATCGGACGAGGAATCTTTTCGTATCGACAAATCCATTGGACGCAGAGAATCTTACATGCACGAGGGTGTATCGTCGAGGGATGTCACCCAAAGCAGCGTCAGTATGAGCGAAGGAGAAGCCGACGGCGATTTGGAAGGACTCGCCGGGAGGGTAGCTCAATTGGAAGAGATGCTACAAGGAAAAGAAGCCATAGTCGAAGCTTTGCACGCCGAGATAGACCACTTAAGAGCAGAGGCTTCGTCCCCTAATTCTTCGCAGAGTCAAAACAGTAGCATTCATGGCAAAGATATTATATCGTTGTATCATACGAAGTTGCAGGAATTTGAGAAAGCTATAAATAAACGTGATAATTTGATAGAGGAGTTGACATGGTCCCTGCAACAAGCACTATCTGCCAGAGATAATCTTGTTACTCAGTTAAGTTCTTTAAATGCTGTACAAATTCCGGATAAAGGTCGGGCTGGTACTGTAAATAGCGCAAACATGCAGGACAAGATCGACGCCTTGGAAGCTACTCTAAGCAATCAGAGATCGATAATAGAAAAATTGAACGGTCAGCTGATACAGTCTCAAGAACGTGAACGTACATTGGAAATGGAGAGAGAGACTCGAAATGCCGAGATCAGCGACTACAAACTGCAAATAAACAATCTGAATGAACAGATTCGTTTGGGTGCAACTGACAAGAATTTGAATATCGCTGAGACTTTGGAACAGCAAAAGAAATACGAGGCGCGCGTCGATAAAATCAAGCAGGACATGCAACATATTTTAGAAAAATTCACGACCGAGACAAACATAAATACCGCACGACATCAACAGGAATTAAAAGAGGTGGCTGCGAAACACGAAACGGAAATCATGAATATTCAAGAGATGTACGAGGAACGATTGAAACAGTTTAAAGATGAAAATAAAGTACTAGCCGATCGTTTGAACAAAGACTTGCCCGATCTCGAAACCAGGCACGCCAAAGAACTTTCCATATTCCAAGCACAAATGGGCCATTATAAAAAGACCGTTGAGGCTTTGAAGCTCGAATTAGTAAACAGATCGGAGTCACAGCAAACCGCGCAAACCGAACTGAGCCAGTGCAAAGCAAAAGTGAACGAGCTGAAGGTTCAATATGAGAACGCGCATCAAATACAAGAGTTGGAGCATCAAAAAGAAAGAGAAATGCTAGGTGAACAGATCAAGCTGCACAAGTTACAATTGGAAGATATCACGTCGAAATATGTTGCCGCGACCGCGATTCTGGAATCGAAAGAGAGCATCGAACGTTCGTTGGAACAGGCTCTAACGAATGCCGCGACACTAAAAGATGAGAACGATAGTTTGAAGTTCAAATTGGACGACTTGTCGTCGAGATACACCGCGGCTCAGTCGTTGATTGAAAATACTCAAGTGCACGAGCGAACTTTGAGCAATCGAATTTTCGACCTAGAGAAATCGTTGTCCAGACTCAGCGGTATCAACCTTAGCACGTTCAGTGGCCTAAATGAAACAGCTTATCAAAGTTTGGACGAAGTTGCGATTCAATTTCACCTGACGAAACAGAAACTCGAAGAGAAAGCGGAACTAGAAAAGCTTCTGATCGATAAAATTGAGAATCTCGAGGGCGAGGTTCGGAAAACGACGGAGGAGCTCGAGCA
AGCAAATCTGGCTAGAAAATCGTACGAGAAGCAACTGAAGGACACAAGGAACATGTGCGACAAGTACAAGTCCGAGCTTAACTCGTTGAAAACTCTTGATACCGATGGCCAGAGTTGCTCGAGAGATTTGTTCGAAAAGACCGAGAAAGACCAACAGGAGATTAAGCAACTGAAAATAAATTTGGAGCAAAAGGAAGCAGAACTCGCGGATTCTCTGAGGCAGGTACAAGACTTGTCGCAGAAATTTCAAAAATCCGATGAGGAATGTCAGCAGCTGAAAAACGGATTGGCCACTGCGTGGGCCCAATGCGCGGAGGTAGAAGAGAAGTTGAATCAAACGTTGGCGTTGAACGAAAGCAAACTCGACTCGTCTGTCCCGATGTCTAGTCACGATAATACTTCGACGATGCGAATAAAATTCAATAGAACCGTAAACGATACTACGACGTTGTCCATCGATGATACGCACGATCAAAGCAGAGACGACAACAGGCTTTTCTACGGCAGGGACGACGACTCGTCGGACACGACCGGTGTCGTGGCATCGTTGCAGGCAAAGCTGGCATCGACTTTGCAGGAAAACGAAAGATTGGCCAAAGAACTGGAACGCTCGCTAGAGGCACAGCTCGATTACAATCGAGTTAAAGAAAAACCGGAACACTACTCGACATCGATGGACAACTCGATCATGGAGAAACATCGTGTCGAGGAGGAGGAGGAGGAGGAGGAGGATGAGGCTCCGTGGCAAGAGCTAAGGACCGCGCATTCGCTGAAAGAATCTGTGAATCAACTCCGAGCGGAGAAAGAATTGTTGAGAAAGGAGATCGATGCGTTGATTTGTGTTCACGATAAGCAAATAAACGCGATAAAAGTCGAAACTGCCTCGGAAATTAGGAAAGTTCAATCGTTGGTATCGGGCGTGAAAGATGGCACAGCGGAGCTACGTGATCTAAAAACGGAATTGGAGATGCGACACGCCAAGGAGATGGAGGAATTGCGGACCTATTTCGAACAGAAATGTCTGCTGATGGAAAAGCAATATTCGGAGGAAATCTTTAGTCAGCAGTCGAAAAAGATGTCCGACAACGACAGCGAGATAGCAGACTTGACGGAAAGCTTGTATTTCGGCGGTGCCGGGGATTGCATGAACGTTTCGAACAATCTCTCCGAACGTAGCTCCAGGGTTGCTTCGCCGTTGGCGTTGGCGTTGGCGGACGAACAATCGAAACACAATACCAACGGTTTGAATAAGTACGAGCTCGAGACAACCGTTAAAGCGTTGCAACAGGAACTGCAAAATAAAATAATAGAAGTGCAGGAAGTAAAACTGCATTATGAAAAGAAGTTGGAGGAACAAAAGATGACATACGAAGGAGAATTGTATGGCAACAGAAGGGAACCAGAGAAACTGGAATTCTTGCGGAACATGGTGACTCGTCATTGTCAAACAGAGTGGGATGCGGGTGCGTTGGAAAACGGTGAATTAACTCAACTGCGAGCGGCCTACCACCATCAGTTGGAAGAACAGATTGCGCTAGCTAAATTGGACATTGTCAATGCGCTTCAAGAACAAATTCAGGCCCTCCTGTCGGTCGAATCGGAGGTCGATGATATTTGGTCGCCAGAGTTGCTAGAGTTACGCGACAAACTGACCGGCAATGCGAAACGCGAGATGCAGTTGCTGAAAGATGCTCATGCAGCGGAAGTGCAACGGCTCAAGGAGGAATACTCGCGCAACGTAGCCAGAATGATAGACCGTCATCAAGAGGAGCTGAATAAGATTCGAGATGGCGTGCCCGTCACCGATTCGAAGAAAGTCTTGGCCCAGCTTGGAAATTCAAATGTTCTTGAAGAGAGGAATAGTTTGTACAAAATCTGTGCTACCCTGAGAACCTTGGTCGAAGAGCTACTAAAATATTTTCTCGTGTGCGAAGAGGAAGTCAACGATACTCTGATCGGCGAAATTTTCAAGAGACAACCGCGCGACGGTGTCGGTAACG
AGAGAACGTTGGAGAACACCGAGGACGTTAAAAAGTTGAAGAACGAAGAACATGCTAGTCCAAGTTCGTCGAGATTAAATTCATCCGGTTCGAGGATTCGACGAGTTCACTTTGCACCGCAAACGACAGAAATAATATCCATAATGAACAGCGATAGCGAGACTTGGCAAACAATATTGGGAGAGAAGAACGACATCGTCGAAAAATTGAAAGAGGAATTGAACAGCTGCGTGCAACGTTTGAAGTCCGAAAACGCCGAGATTCTCGCGATTACGAACAGAAAGGACGGGGATTGTGGTCAAGGTGGTCCTTTCCCGAAAGAGGTCGCCTGGATGAATCAAATGAACGAACAGCTCGCTTCCAAGCTGCAGGAAACGGAATCCATGATTTTGAACTACGAACAGGAAACGGAGCAGCTGAAACTTACTGTTCTTGATCTCCAAAGGAAATTGATCAACGTAGAAAACAAGAAAGAGATCATTACCGAAGGTTACGGAGAGAACGACGACGTCGGCGTAGAAATTACCTTGCAAGATTTCACGCATCTACAGGAGAAAGCGAGGCACGTATTGTCGAACGGAGGAGAAGACTGTACGGTCCTGTTGCAACTGATAGAGGAATTGTGTAGACAGAGCGACAAATTGATGGAGGATGCCAGGAGAGAGAAAGAAGACTTGCAGCAACAGGTGGAGGCTCTCGAGTCACAAATGAGGGAAATGTCATCCCTTATGTCCGACACAGAAGCCAGGAAGATCGAGACCGAGAGCGAACTGAAAGCAGCCATCGACAAGATCTGGGTGTTACGAGACATTATTACAGACTTGGAGCAACAGCTACAATCCAAATCGGAAAAAGAGGAGTCTTTGCAGCTTCAAATCGGTCAACTGGAAACTGTGATCGCCGCACAAACCAAGAACCAGCAAGAGTTGGTACAGGAGCTGGACACGGTTAAAATGGGTAGCGAAAGTAAGCAGCTTAACGAGCACATCAATCACTTACAGGAGGAGTTGAGGAAACACAAACTAAGTTCCGAACAGTTTAACGCGAATTCTACCGCTCTGAAACAAATGAAGTCGGAGCTTCGCGAAATGCAGATTCAGTTGGACAAGAGGATCAAAGAATTGGAATCGATACATATGTGTAGCTCCAATTTAAGTCTGAGTCAACCTAGCGAGGACGTGTCGATCAGAGAGCAAATCGACGCGGCACGTTGCCCTACTCCGGACGATCCCAATTCACCGCCAATGTTGCCGTTGGACCAGTTACTCAAGCTCAAGGAGAAGATGTCGAAACACGCGAGAGCCGAGGAGGTTGCGTTCAAGAGAATCAAGGATCTAGAGATGCAGGTGGCTGCATTGAAGAACCAGAACGAAGAGTTGCAAGCGGAGCAGGAGATCTTGCAACAGACCACCTCCGAACAATTGTATCAAATCGAAGCGATGCGCGGCCGTCTGGAACAGCACAAGCAGAATGCGCCCTTCGCGCAGAGGCAAGCGACGTCGCGGCTCGAGTTGCAGCTTCACGAAGCAAATACCAAATTCCAATCGTTGGAGTCCGCCGTAGCGGAGAAGGACTTGGAATTGAGGGACACGCTGAATCAGTTGGACAGAGTCAGCCAACTGTTGCAGGAGAAAGAATCGGAGATCGCGAATGTCGTGCAGGTGGAAAGGTCTACCATCCAGAAGCTGCGCGAACACTTGGAGATCGTCGAGGAGGAGAATAGAATTTTACAAGCGAAAGTCGGCGTTCAAGAACACTCTCAACTCGAACTGCCGCGGCTGATCGACAGCATGCTGGCCGACAAAAACGAGGAAATCGACCACATGAAGGACCAGTTGTCGAAAAAGGACAAACAACTGCAACTCTATTCCTCGTTGAACCTGGACGAGACGCAACTGAGAGAACTGATTCGACAGACCGAACCAAAGAACAGTGCCCGTACGTTGAGCGACATTCTGTCGATTCACTCGGAATGCGAGGAAACGTCGGAGGCCGTTCGT
GGAACGAATTTCACTCAAACGTTGCCAAGCGTATCCACTTTGAGAATTCCCACAGCATTCGTTTCGGCCAAAATCATGGACGACACCGCGGCGCTTTCACCTTTGGACAGCACCGCCACCAGTAACACCGGCAAGATCGGACTGCGTGTACCACCGTTGGACCTGGGCTCTCGTTCTCAGAGTTTATCGGCCGCGTCGAACCAACAGTCCTCGGAAATGGATTTGTTGCAGCCCGCTGAACCGACCTCTAGGAACTCGGAGGAGAACGACGGCACACCGATGAACGACAGCGAGAAGAAGAACGAGTATGTAATCGTCGACGATAAAGTCGACGGCAAAGTCGACGACGAGTCGCTTGTTCGTTCGGTGTGCGTCACTCCGCACGTGAAACATGTGGAAACTTCGATCAACGAGTACATCGAGGAAATGGAAAAGTTGGAACATCAGTTGGAGATCGTTCGAGAAGAGTTGCGAACGAAATCCGAAATTTTGGCGAAACGCGAGGCAGATTTGCTGTCGCTGCAAAAACTGTACAACGAGTTGCAGACGGAAGTTAAAGAAGTCGTGGAGACGCTTACCACGGACAAGTGTTTCTATCAGAATCAGTACGAGTTGTCGAAAACGTCCGAAAATAAAATCAAAAAGGATCTTCTGGAGGTGGAGAACGTTTTGAAATTGAAAACCGCAGAGGTCCAAGAGCAAAAATGTAAAATTCAGGTCAACGAGAAGATCATCATGGAGTTGAGTTCGGAGAATGGTAAGCTGAAGGCGGATATCAAGGAGAAGGAGCAACAACACGCGAACAAGTGTGCCTCGTTGTTGCGAGAGAACGCCCACGAGTTGGAGACTATGAGGGGCAGGGTTCTCCGGCAGGACAAACAATTGAACGAACTCAAGACCAAGAACGAGTTGCTCAAACAAGAAATCGTCGAGTGTCAACGAGAGATGACCGAAGGTTTGAACAACAGAGATCAGACTATCAGGCGACTCGAGGAAATGGTACGACGCGTTAGCTTTTCGGAAGCATCCTCGCCTTCGAACGAAAAGGACGAGGAGATCCATCATCTACAGGAATATTTGAAGGAGAAGGACAAAGTTATACGGCAAATGAACGACGACAGCAAGAGTTTGCACAGAGCTTTGGAGACTATACAGAATAAGATGAAGGAGTCCGGTAACGTGGTCGAGCTCAGAAGGAAGCTGAGAGAAGAGCAAAAACTGAATGCCGAGCTGAGGAACGCGATGGATAAGCTGAACAAGGAATTGTCGGATTTAAAGTTGGCCACGCAGCGGTCACAGGAGGACACCGACATCGAGGACATGGTGCAGAGGGAGCTGAATTTGTCGGCGCATCTCGACAGACGGCTGATGAATGCGATCGAAACCGACCAGGAAGATGGTATCTGTAAAGTGGAGAATCAAGTTCAAACCAGAGGGCCTCGTCGGGAGGGCGTTCAAAGGAGCAGCGAATTAAAGCTACAACTGAGTCAGGCGAATAGGATCAACGACGAATTGAAAAAGTTGAAAGACGACTTGGAAATCGAAAGGGGAATGTTAAAGTGTCAGATCGCTGAGTACGAGGGCCGGATCTTCCAACTTAAGTCTGATCTAGCGATGGAGCGCGAACAGGTTGCGAAGCTCAACGAAGAATTATTCGCCGAGAAAAGCTTGATTCGGAGCTTGAAGATCCAAATCGAGAAGGAGCATAGATCGATGGAGTCCGGTCACGTGCAGGACTCGGAGTTGATCGAGTTTCTTCAGAATAAGCTGAAGACATCTCTGGACAACGAGGCGAGGCTGCGCAACGATCTTTCCTTGTTACGACAAGAACACAAAAGCCTAGAGATACAGCTGAGTTTGATGAAGGAACACGTACAGTCCCAACAGTCCCAGAAGTCCGACGAATTGCCGAAACTAGCGGACCTTTTGGAAACTGAGAGGAAAAAGTATTTGTCGGTGATGGAAAGCTTGGAAAAGGAAGAACGTAATAGCGCGGAACT
AAAGGATACTTTGAGGAAGCTACAATCGGAGAAGAATCGATTCGAGAAACAGCTGGAGGTGGAAGTGGAGGAGAAAGAGAAATTGATAAGCAGCCTTGCTCTGGTCGAGGGAATCAGGGACCATTTGCAAACAGATCTCGGTCGCACCAAAGAGGAGTTGAAAGCGCGGGAGGAGGAGTGCGAATGGCTCCAGAAGAGAATCAAGACAACGTCCGACGCGGAAATCAAAAGGCAAGAGCAAAGGACCAGTGAACAGAATCAGCTGAAGGGATTGAGGAGGGAGATCAACAATGCCAGAGAGGTGATGGTGGACTTGGAAGCCGACATGAAACAGTTGCGTGAACGCGAGATGAAACTGACCGAAACGGTGGAGAGTCTTCGGGAGAAAGAAACGTATCTGCTTAAGGAATTGTCCGCTGCCAAAGACGAAGAGACAAAGTTGAGGGACACGATCGCCGAGTTGCAACAGGAATTGAGATCGTTCGCAGAAAGGGAACTGGAGTTAGCTAGAGAATTGAAAAACAGGTACGGTGGCGACAAGACCGCCACGCCTACCAAATTGCTGCAGAAGATCAAGGAACTCGGCGACATCAACAAAAAGTATCTAAACGAGAAAAGCATGCTTCAAGAGAAGCTTGTGAAAGCGCTGGAGGATAAGGAGCAACTCGGTCAACGAGTCAAATCGCTCGAATCTCGTTTGAAGAGAGGCATCGAGTCTCGCGATGCGAACGCGGCGATCGGTGGAGATTGCGCGGACAAGTTGCAACACTTCTATGGGAAATATATACGAGCCGATAGCAGACGCAAGGCTTTGACTTACCAGAAACGTTACCTGCTAACCATCGTAAGTGGTTATCAGATCTCCGAGGAGAACACATTGTCCATTCTGGCGCAATTGACTAGCGAACAACGATCCTATACCACAGCAGGCCGTCATAAAAAGTCTCCGCGAGTACGCTTCAAGAGCGCTGCTCTGGTACTCATCAGTATCCATAGAATGAAGTGGCTGATCGTTAGGTGGAGCATCGGCAGAAGAATAGGTGCCCAGACGTTGCTGTGGAACGTGGACCAGTCGTACGTGCCGGTACAGAAACTTGCCATGGATCATTCTCCCCCTGTTCGAGAAAGACCTGTCGCAAACGAGGATGGTAATTTCGACGGATTCGCGCTTGCACAGTATTATCAACGGTTAAAAAACATTCAACAGACATTAGGTTTAGCGATGGCTGAATCTGTAAATTGTCAGATTCATCCCGAATAGTATTATATATTATAAGAGCGTTCGAGTCTTCGACACGCGGGGTAAGGCAAGCATGATAAACGTACCACGAAATCAAGTTGTGTATAATCGCGCGTGGAATTGATTGTCAAACGGGTATTTCAATCTAGGAATATTTTGTTCGGATTTCATCGTTCGCGGGCATGTATTTTTCTTATGGCATGTAAATAGGATTGCAGCATAGTAACTGCAATTGTTGGACACGCGTCAAGCCTTCTCACCGATTACCGCGTTGTGTGCTTTTTAAAGAGTTGCCACTGCAACATTCGACAACCCGAAAAAGAGACTAGAACGTTTAGTGCTAAATAATTGTGCTCATATACCAAGTTTTACCAAAGGTACGATAGACTTTAGTTATAATTGTACTTTGTTAATCCTTTCAAGAGGATGTGAACCAGTGCCTTGTCAACTATGCTACAATATAATAAGTGTCTAGTATTTATTTATTATCGATTATCGAACTGTAAGTTTTTATAATGTGAATAAACTCTATGCAATGGCTTTTTATGAAA\n>XR_006348224.1 PREDICTED: Manihot esculenta vacuolar sorting protein 18 (LOC110629926), transcript variant X10, misc_RNA 
\nAATGAATATAAGATAGGTTTTTATGGTTTGTATAGAGAAGTTCTAGAATCTCCTAAAATAATAGAAAAATACAAAGAAATAGAAGCCATATGAAATATGAGACAACTCTGGAAAGCTGTGGTCCCCACCAAACTTCTCCTCCAGAAGCTGCTTTCGCACCTCCAGCTTTGGCGCTAGACTCCCCCAACAGCTTCTAGATAATCCTCGCAAAGTCCAGCTTTTACTCGGGCTAGCCGCGCGCTGATTTGCTTTCCTCTCGTGCGCTCCGCAGACCAGCCCGACCAAAATACTCATCCAACGCTTGGCTAAGTTTGCTCTCAAAGACTCGGGCGACAGTACCATCCTGGAGGGTTTCCGAGTGTTTCTAGCCTTCCGAGTTTAGGGGCGTTCACCAGCCCTTCCAAGTGTCTGGGTGTTCACCGGCCCTTCCGAGCTCCTGGGCATTCACCAGCCCTCCCGAGCATCTGGGCTTTTACTAGCCTTGCGACCATCCGGGCATCCTCTGGCCCCACCTAGCTCTGCCGAAGTTCCGAGTGTTTCCTCGCAGACTTCGCTCGCTTGCTCAGCAGGTTGCCTCACCAGCGTCAATTGCTAAAAGTCTCAGTCATCCTACCATCTCTCAAATTCACCCGTAGGCCTGTTGGCTCCCGTTAATACTCCGTAGGCCTATCAAAATATCACTCGATAGCTAGTTTCTCCGAGATGACTTAGCCCATCCTTATGCCGCCTACTCGGCACCAAGATTAGCGCCAACTCCTTCCAAAAGAATATGGATATTTCCGGGGAAAACTGTGGGGGTTTGTAAGTGCAAAATCTTAATTGTGGGTATGGACTACCACATCTCATGCCTGTACTTAAGAGGACCAATGGGCTCCCTTCTATGTATTTCCATGTGGCATGCCTTCCATGAACAATGCTTGATTGCCCATTTGACAAGTCATACCAACAAAACTCAGAGAGATTTTTCTGACAAACTGCCAGTATGGTGAAGTTCAATAACATTGCTTTTCTGTGAAGATGGATGAAAAACAAAAACAGTATGCCTATGATAGTTCGGGGCCCAAACATCTAAGACAAATTTCTTCAGCTCTACGGGATTCGAATATGTAATTGGGCAATAATTGTTGAGCAAAACTAAATACAGTTTATTGGCCCAACCAAGTACAGTTCATATTTGAACTGACTAATTTCTGCAATTCTTTATGAGAAAAAAACAGCATGAAATATGCAGCAGCCTGCTGCAGTCAACATTGTACTTCAATTATTGTACGACTATGCTCTCATGTTCTGCAATCTTCTGGTATATGCACCATAAGAAATCCCATGAAGGGCATAACTAAATAATGAAACAATAAATTGAACTGCAAGCTTAGTACAAGCACATTTGCGTGGCCTAAGATTTACGATGACTTTTGTTTAAGTTTTTTTTATTGTCATCTCTAACTGAGTTGGGTTTTGTATTTAGCTTATCATAAAACTATCCTGCACAGCTTCTTACTCTGCTTTATATCAATGAAACATATCTCTGCGCCATCTTTTAGAATGAACTCCAATTCTGGAAACTCTTACCACCAATCAAATTTTCTTCCTTCGGGTATTTGAATGGATGATGCAGGCTGATTATATACTGGATCTGCAGAAGCAACTTACTTTACTGGGTGAGGGAACTAGGAAAGACTTGAATGGTGGAATAACGTAAGATTCCATTGCTAGCAAAACCCCTGTAGATAAGGTCAGTTCTATGTTCTTCTGAAGCAAAATCTATTATGGTAATATGGAGTAGTTTGTTATAACTCGAGGAAAAAATTTCCTGCATTGCTGTACATTAACTACAGTGGCAGTTTATTACGTCTTTTGTAGTTTGTCTGAGCCTCATCTCTTCTCTGGTGTGTATTTTAAATCCCGTTGGAATTTGCAGCTCGGCTCACAGTTGATGATGCAAATAGCCAGCAATTGCCCATTTCACGGTGAGTTGATGATCAAAATGTTCTCCTTGCC
ACTACTCTCCCTGGGGAAGCACGGTTGGTAGGTTCATGGGATAAAACCACATAACCTGGGAAACCAGAGGACGCCCTATTTATAGGTGTAATAATATTACCTGTGTGTGATTTCAAAAGCCAGTGTGCGTGTGGGGAGCTTCGATGCCTGTAATGTGGCTCTCTCACCGTCTCGTTTTGAATTGGGTTATGAAGGAGAGCATCCCCATTTCCTTGTAAACCTTTTAAGTTCTTCTTAGGCAGCACCATTAGTTCTCAATAATCATGATTTATCCCTTCTGATTGTTCAAGATTTCTGAAAGCACAAGCAAATATATGAACTTTTATCACT\n>XM_029702302.1 PREDICTED: Salmo trutta DNA-binding protein SATB2-like (LOC115155576), transcript variant X3, mRNA \nTACTCGCTTAGCCTAAGTTGTTTATTTTGCCTAACGTTCTGATCTCCCTCCCCCAGGTCTGATGATCCCAGTATTCTGTGTGGTGGAGCAGGCAGGGCCGGATGGGGGGATGCAGCGTGAGGAGGTGGAGAGGAGCGAGGGCCACAGAGAGGAGCATGCTGAGTTTGTCCTGGTCAGGAAAGACATCCTCTTCAACCAGCTGGTAGAGACGGCCCTGCAGGCCCTGGGGTACTCCCACAACTCTGCTGCTCAGGCCCAGGGCATCATCAAGGTGGGTCATTGGAACCCTCTGCCCATCCACTTCCTATCAGACGCTCCTGAAGCCACGGTGGCTGACATGCTGCTGGACGTCTATCACATGGTCACTCTCCACATACAGCTACAGAGCTTTGCCAAGCTGGAGGATCTTCCGTCAGAGCAGTGGAACCACGCCACGGTGAGGAACGCTCTTAAGGAGCTTCTCAAGGAGATGAACCAAAGCACACTGGCTAAGGAGTGTCCTCTGTCACAGAGTATGATTTCCTCGATAGTAAACAGCTCCTACTATGCCAATGTCTCCACTGCCAAATGCCAGGAGTTTGGACGCTGGTACAAGAAGTATAAGAAAATCAAAGGAGACTATCAGGAGAAGATGTGGCCAGGAAGAGAACATTCTGAAATCAAAGTGGAGAGAGACAGCCTGGCAGACTTCTATGTCCTGGGCCAGCGTCCCCCTCCCCACCTGGCCAGCCTGGTCCAGCTCAGCCACCTCGGAGGGGGTGGAGGTGCTCTCCTCAAGGGTGGGTCCGGGGACCCCCAAAACCCCTCCCAACCCCCCCAACAACAACAACAATCCCAACAACAACACCCCCCCTCGCCCCATGGCCAGCACCACAACAGCCCCCCTCTACGTGGCCAGGTCCCCCCTCCCGGCCCTCCAACCTCCCTCCAACCTCTCCTCGGCCCAGGCGGGCTTCTCTCCCCCCAGCTCAGCCCTCAGCTGGTCCGACAGCAGCTAGCCATGGCTCACCTCATCAACCAGCAGCTAGCTGTTAGCCGCCTGCTAGCCCACCAGCACCCACAGGCCCTCAACCAGCACTTCCTCAACCACCCTCCCATCCCTCGCCCCTCCAAGGCAGGGGCCCCTGGGGACCCTGGGAGCAACCCGTCTGCTGCGGAGGTCTCCATTGATATCTACCAGCACGTCAGGGACGAACTGAAGAGGGCCAGCGTCTCACAGGCTGTGTTCGCCCGCGTGGCCTTCAACAGAACACAGGGCCTGCTGTCGGAGATTCTGCGGAAGGAGGAGGACCCTCGCTCTGCCTCTCAGTCCCTACTGGTCAACCTCAAAGCCATGCAGAACTTCCTCATCCTCCCTGAGGGGGAGAGAGACCGTATTTACCAGGAGGAGCGTGAGCGCAGCATCAACCCCTCTGTCGGCCTGCCCCCTACCCCTACCTCCAGCCCCGGGGGCCCGCGCCTCTCACAGAAGGTGTGGGAGAGAGGTATGGACGAGCAGCTCACTCCTGACGCCTGGGCTGCTATCTGGAAGAACAAGACCAAAGCCACCTC
TGTGCCCAAGCCACCAGGCCCCAACCCAGACCTGCCCCTGAAGCTGGAGTCTCTGGTCAACATCACGTCAGGTATCTATGATGAGATCCAGCAGGAGATGAAGAGGGCCAAAGTGTCTCAGGCGCTGTTCGCCAAGGTGGCTGCCAACAAGAGCCAGGGCTGGTTGTGTGAGTTGCTGCGGTGGAAGGAGAACCCTAGCCCAGAGAACCGTACTCTGTGGGAGAACCTGTGTACCATCCGGAGGTTCCTGACCCTGTCCCAGACAGAGAGGGACATGGTGTATGAAGAGGAGTCAAGGCACCACCACAGTGACAGGGTCCACACTGTACTACACCTGCCCCAAGACCCACAGATGTACTGTTTTTCTCACCAGGCGCTGCACAGGCAACCCCCACAGCCCCTGAAGCACCACTCCCCCATGCGCGAGGACCCCGTGCCCGCTCAGGGTAACGACGAAGGGTCACAGAACGTTGAAAGAGGTGGTGGTGGCGGTGGCTGCACGGGCGGTCCAGGAGTCGGTGGTTGCACGGTCGTTAAGAAGCCTCGGTCGCGCACTAAGATCTCTCTAGAAGCCCTGGGCATCCTACAGAGCTTCATCCAGGACGTGGGTCTGTACCCGGACCAGGAAGCCATCCATACCCTGTCAGCCCAGCTGGACCTGCCCAAACACACCATCATCAAGTTCTTCCAGAACCAGCGCTACCATGTCAAGCACCACGGCCGGCTGAAGGAGCTGGGGGAGGGGGCTGGCGGCGTGGACGTCAGCGAATACAGAGACGAGGAGCTCCTCTCCAGCTCAGAGGACCCTGAGTCCAGTGAGGATGGTCACGAGGAGATGTACCCCACTACTGAGAGGGAAGGAGGGGAGAGAGAGGGCAGCACAGCAGGGTCAGCCCCTTCCCTGGCCCTAGCCCCAGGCCAGTCTTCAGGGACCAGCATGGGAGCCATGGAGGAGAGCAAGGACAAGGGGCATTCTCATGGTCTGGGTGAGGGCCGAGCCAGCTCCCTGCCCCCTAGTAGCTCCTCATCCAGTCCCAGAGAACAAGCTGACTTCCAGAGATAGAGACCCAGAGACTAGATGAGACACTGGAAGAGACGGGCGGAGATAGAGAGACACGAGAGACAAAGAGACACGAGAGAGAGAGAGAGAGAGAGACGAGGGGAAGCGAATGGGAACAAGACACTGGGAGAGGGGAAGAGAGGCATAGATGAGACTCACTGACACACAAATATACAGACAGAAGGGATCTTAAGGAGGGCTCGTCAAAGAGGGATTTCAGTGAAAATACAATTTGTTACCTCAGCAACAGGGATATGCCATGAAACAGCAGCCATGTGGAACAGTTAGTATAGTATGTTCACTGAACCAATAGACAGAGAGATAACCAAACATACACATCTCACCCCTGTCCACAAGAAGAACTCGCCACATCAACACCACTCTTGAATTGAGCCAATCCCAAAATTCAGCTTCACTCTGTCCAATGACTACTCTCCCTAATGTCTCAACCGCACCCACATGCTGAGCACTTGTCCTTATTTCGATGCTGGGTCTTGAGTCAGGAACCTAACTGACAGTCATAGACTGAATACTGGGGGCCTGCTCAGACCTCCACCATCCTGTGGTCCCTCAGCTCCAGATCTACAGAACTGGCTGCTGTAGCTGTCCTCCAACTCGTCCCCCTCTCCGCCCCTCCATGACAGGACCATTCTAGTCTTTGGTCTTTGACAGTGTTGGCAGTTTGAGTGGGAGGTTGGATAGTGGATGGGTGTTGGTTGGAGGTAGGAACAGTGGTATGGGGGGAATTCACCAATGATAAACAAATATGGTGTAAGTCCAGAATGGAAGCTTATGGTATTTTTTTGAAGTTGGAATCGCCCCTCCCATCCAGCTCCCGTTGCCAACCCTCAATGGTGCAACAACATCCCTATGCGATGGACCAGACCATCCCTCTAACGCCCTGCCCCCTAACCCCCACTCTAAAGATGGTTCATTCTCT
CTGTCACTGTACAGCAGTTATTACACACTAACCTAGTGTGTATGGCCACTGTGGTTTATGAGGACACTGCTAGCTGAACGTATCGTGGTTTAGGACATAAGAGAGGACAGCCTTGTGAGGACAATGAGGACCCAGTGGTGTACAAGGACCCTCAGGATAACAGTTACTCTGGTCTGTCCTCTGTCCCCCCTGCATACCCAACCTCTCCCTGTGTGGAAAGAAACAGGGAGGGGCACAACAGAACGGAGATTCAGCAACCAATCGGGTATCTGCAATCAATCAGTCACTTTATGTGCACTAGCCCACCCCTTCACTCTTCCTCTCTCTGTCCCCATCCCTCGTTCTCTCTCTCTATAATTGGTGCCCACAGTGTCCCCTTCCACCACACCTACCCACATGTAACTTCACCATATTTATTGCTATCTTTATCCATGATTATCATTATCATTATTGTTATGGTTGTTATTGTTGTTATTGCTGTCATAGCTGTTTATTTTTTACTTCTATTTTCATGCTTGTAATATTGGCTTTCCGAGCACCATGGTTGTTTTGGTAACGAGAGACGTTTTTGAGACATGAGGAACACACATTGCCGAACAAAGAGCAGAAGAAAACCAGAAAAGAAGCAGTTACTGTAACGTTTAGCGAGTAGAAATCCTGTCATGCTGTGCTAAGCAACTCACGTGTTCTTCCAAAGAGAGACGGACATTGGCTGAAACGGGAGTGGAATCCAAAAAGTAATGGAAACACAACGAATAAACTGAGCTTTTGCTACAGCTGTTAACAATCTGACATGTTTGGAGCCTTTGGAAAACACAGCAGGCTTGACCTCTGTGTGTTATGTACAAGTGTGTGTACAGTTCAGTACAAATCCTTATCTGAGAGCGGGTACTTATGTCGAAGGATGCATCCCAAAGAGAGCCCTATGAGCCCTGGTCAAAAGAAGTGGACTGTATAAGGTATAGGGTGGCATTTGGGACACAGACAAAGTAACAGAGTAACCATTATTTACCCGTCTGACTCTAGGCAGCTGCTACGTGAATGACCTGTCTTGTACTGTAATTCATGAATTAATCAATCATACAATACATTGTGTTATATCGCTC\n>XM_009901592.1 PREDICTED: Picoides pubescens prodynorphin (PDYN), mRNA \nATGGCTCGGCAGGCGCTGGCACTGGCACTTTGCCTCTCTCTGGCCGTGATGGCATCCACTGACTGCGTGACCCAGTGCTCCCTCTGCGTGGCACAGACACCCACCCCCGAGACCAGCAGCTGGCCCCTGATGTGCCTGCGGGAATGCCAGGGCTCCTCACCGCCCGGGCCCGAGTGGGAGACCTGCAGGAAGGCACTGGCGCTGCTGGCCCCGCTGGTGGCCCTGGCCGAAGGGACAGAGCCGGCCCCTCGGGAGGCGGAGGAGGAGAAGGCAGAGCCGGAGCTGGGCGCCGGAGGGCGGGGGGAGGCGGCAGCCCCCGAGGACTCCCCGGGGCCGGAGCCGGCAGGAGATGGAGCCGAGGAGCCCACGGGTGGCGGGGCCGGGGGGCAGGAGCTGGCCGAGCTGCACAAGCGCTACGGGGGCTTCATGCGCCGCATCCGGCCCAAGCTCAAGTGGGACAATCAGAAGCGCTACGGAGGCTTCCTGCGGCGCCAGTTCAAGGTGACCACACGCTCGGACGAGGACCCCAGCGCCTACTCAGGGGAGGTCTTGGACCTATAG\n>XR_007834401.1 PREDICTED: Phodopus roborovskii U6 spliceosomal RNA (LOC127220836), ncRNA \nGTGCTTACTTCAGTAGCACATATACTAAAATTAGAATTATACAAAGAAGATTAACTTGGTACATTATCAAGGATTACAGGCAAGTTTGAGAATTGTTCCATATTTTT\n>XM_029382818.1 Trypanosoma rangeli nuclear RNA 
export factor 1/2 (TraAM80_05959), partial mRNA \nATGTCGGCACCCTACAAGAAGACGAACACCCACAATGTGCCCTGCTTCTACTTCAAGAGGGGCGCTTGCACGAATCAGCGCTGCCCGTACCTGCATGTGCGTGGGAAGGAGTCAGGCGGTAACGCAGGCGCGGTGAAATTGTCAAGCGTTACCTTGGGCTTACCGGATGCAGCGACAAATTTGCTCTCAACAATGCTGAAGCTGGTCTTTGAGAAACAGCAGCAACGGGTGTATGACGCGTCGTCTGGGATGTTGGACCTGAGCGAGTTGAGGAAGTTTCCAGACCTAAAGGACGTCTCAAACTCCATTAACTTTAATACGCAGAACTTCTGCCGCGCTCTCTGTTCGACGATAAAGTCACTTATTGTCCCACCACCCTCTGCTATGCAGTTAAAGGGAAATGATATCACTTCCCTTTTTCACCTGGCAGGCCAGATGGAAAAGGCGGATTTGCACATGTCGCTTCGGGCTCTTTCGCTAGAGGCAAATAATATTAGGACGATGGATGCACTACAGGAACTTAAAAAGTTCATGAATTTACAGGAGTTGGTGCTTGTGGGTAACCCTGTGGCAAAGCGTGATGACTACCGCATGGAAGTGAAGAAGGCATTGCCGTTTCTCCTTGGACTGGATGGGGAAGGCATCGCGGTTCCGCCACTGTTATTGCCATGGCCACGATTTGCGACTTCCGAGTACACCGACGCGCAGCGGCATGTGCTTCAGTTTGTCCAATGCTCATTGCTGAATCCACTTGAGGCGGGTGAGGTGGAGCGGGTTTCACAGGGCGTGGATGCAGTATCAGATATTTATGCGCAGAAGGCCATTCTCACCATTTCCCTTTCGTCACCGGAGGCTGCAGTAAGTTCGCCGGCGCGAAGCGTAAATGGCTTTTCATTGGCGTCTACGCAGCGCAACGTCATTCGCGAAATTGTTGGTCTCCGGCTAAAACAGACAGAGAGCAATCACAACTTGTTGCATGGCGTGAAGTCAAGTGTTGTGGCGTGCGGGCGTACAAAGGTCTGCTCACAGCTGGAACACTGGTTGTATCCCAAAAATTTTGCGGTTCAACACTTCGTGCACAGCAGTGCAAGCGCCTCGTTTCTGGATAACACGTACCTGTCTGGCCCCGCACCTGTGGCGATGAAGGTGCCGGTGACTGTGGTGACGTTGCATGGCGTGATGACGTGGACCCACCTCAGTCCGCAAAGTCAGAATAACTCTGATCGTGTGGTCATTTATCGCAACTTCACACGAGTACTTACTGTTCAGCAAAACGAGGCGGGCCGTTGGTTGGTGACGAACGATATGGTGTCACTGTACCTATTTTCGGGGAAGACAGCGGGTCTATCCAAGAAGGGAGAAGCTAACGCCGATATTTCAGCTGACGTGAGTGAGTGCCGTATCCTGTTTAGTCCCAGAACCGATCGCAGTCGCGCTGAGTTGCTTGGCAGGAAAAAAGATGTACCAGTGGAAGTGGTTTTAGCACTAAGCCAACATGTGAGCAATGATGCAGAGCTGATGGCGGTGCTCGGCGACATTGGAGGGGTGCCACTGAGCATGTATGAGCACTGCGCTGCACTAACAGGTGAGAATATACTAGAAAGTATTCAAGTTTGCCGCATAGGTAACCGGTTTGGATTGGCCCCACAGGAAGGTTTGGAACTGCTGCGCAGGGTGGGTGGTAATTGGTGTGCTGTAGAGGAGGCAATGGGCACCGCCGTAGGAGTAACAACATCACAGGTAGCATAG\n>XM_017771362.2 PREDICTED: Gossypium arboreum uncharacterized LOC108470132 (LOC108470132), transcript variant X1, mRNA 
\nCGTTTTCTTCATCGAGACTATTCGTGTATTAACATCAATCAAAGATTTAAAATCATTTCTAGAGTCTTATCTTGGCGCTCTCTCTCACATCACTTTTGCCTTGCTCCGCAGCACGTAGGAAAACTAGAAATTAAGAGAAATTAATACTAAAAACTAATGAAAAAAAATAGCAAATAGCTCTCAATTCAAACCAACAATTTGGACTTTAGATTAATAGAATCAAGATGGAGGATTCTGGAGCAATTCTTTACCAAATTTCATGCCTCAAGGAAATGCTTGATCAGGTTAATGAAGAAATCGAATCCAATATTGAAGTATCGCGGGAGATTGAATCAGAGATGGTCAAGTGTACGGAGTTCGAAGCTGCTCTTACTACTAGAGAATCCCTGCTTACCAAATCGCTATACATTTCTCACTTCGAAATCGATGGCTTGCTCTCCGTCATCGCCGATTCAAGAAATTCGCTTAAATTTTTGGAGGAGGAGTTGAGTTGTCTAACCACGAAACGAGATGAGATGTTAAAGAGGATTGACGATAAACGAGACGGATTTACCAAACAGTGCTTAGAATTTCAAAGGGAGATTGACAAGGGGGATAACAACGAGCTGGTGAATTTGCTGTCAGAGAAAGAGCTTCTTGAGAATGAAATTCATCTCTTGCATAAGAAAAACAATGCTTTGAGAAATTCAATGTCCGCTTTTGTGGAAGAAATTCTTGAAGACCTTTATTCTTCAAATGCAGATTTTGGGTTCACATTACAAGCTCGGGGATCGTCAGCAAAGTTCTTCACACTATCTACGATTTCGGCATTTAAATATTTGAACTCGAACTATGGCATGTATAGGCTAGAAAGTGTTTTTGAAATGTTTGATTTTGGTTTGTATAATAGCCATGGGAAAATGGCTTGATGTTAAATTCAGTCTTGTTAAATTTGGTTGGTGTTCACCTTGGTTATGTAGTTATGAGCCTGGTATGTGTGATGTTGTGCTAGGTACCATGTGATACACAATTGGTTTGCTTATTATGGTAAAATTTAGTTTTATATGATCTTGATTAAAA\n>XM_003676498.1 Naumovozyma castellii CBS 4309 hypothetical protein (NCAS0E01160), partial mRNA 
\nATGCCATCTTTTGAAAGTGGTTCAGGTGCTGAAGAAGAAGAAGAAGAAGATTATTTTAATGACTTAGAGGTTGATCTTGGAAGTGAATTAGAGGAGAATGAAGAGGAGTACGAAGCTCTGGACATAACTCCTCAAAGTGGATATGACGATGCCTTCAATGATCTAACTAACGACACAGCTTTTCTAAATGAATTAGTTAAAACTTTTAAACCTTCTACTATGCTAAGTTCTGTCGATATGAACATGGAACCAAAGAAACTTTCGATAGTATATAGAGCGATCGAAAAACTTAAGGCAATGTTTCATTCCCAGTCAACATCATTCATTGAAGTTTTGCCTCATCTGAACGAACTTAGCCATCAGATAAGAAGAGAAATAGACATCCTTTATCAATATTCGAAAAACATATATTCGACAAGATTTACTGAACTTGATACCATAGCAGCTACCCCATATCAGTATGCAAAAGTTACATCATTGATAGAGGGAACTTCTGATGATAAGGCCGGCCAACTTCCGATCAACATCGAAATTGAAGCTAAACTTTCAAAAGAACAAGTCTTGGTGCTACGAATGTCCATGCAAACTTCATTCCTTAAGAATAAACCTTTAGAGAAGAAGGTAAAACATTTGCTTTTAGAGGCGTGTTCTATGATCATACAACTTACGGACTTGCAAAATGTTATCCTGCAATACATTTCTTCTAACGTATCTGATATTGCCCCAAATTTGTGCGTCCTAGTGGGTCCAGAGGTTGCATCACTTTTAATCGCACACACAGGAGGAATACTTCAATTAGCAGAAATACCTAGCTGTAATCTAGCGTCTATTGGGAAAAATAGACATTTATCACACGAACTTCATACCACTCTAAGTGGGGTAAGACAAGAAGGTTACATTTATAGTAGCGAACTAGTTCAAAATCAACCGATTCAAAATCACAAACAAATGTTAAGGATGGTCTGCGCCAAAGTGGCCTTAGCAGCCAGGGTTGATGCGGGTCAAAGGGGTGCTGCTAAAAACGATTTATTGGGACAACGGTGGCGAGAAGAATTAGAGACTAAGATTCAAAAAGTTACAGAGTCGCCCAATATTTCCAATGTGAAACCATTACCTATCCCAGAAGATAAGCCAAAGAAGAAAAGGGCTGGGAGAAAATTTAGAAAGTATAAGCAACAGTTCCAATTATCTCACCTCAGACAATTACAAAATCGAATGGAATTTGGGAAACAGGAACAATCTACAATGGATGCTTTTGGTGAAGAAATTGGCATGGGTATGACGAGTTCATCCATTCAACAATCGATAGGAGGTATCAGAGCTAGCTCACAACGTGTAGATAATTCGGCCAAGATTACCAAAGTGATGAAACGTAGACTTAAAGAGGCAGATTCACAATCAAAAGAATTTGCATCGTCTCTGAATTCAAGAGAATTTTAA\n>XM_026930086.3 PREDICTED: Pangasianodon hypophthalmus carbohydrate (chondroitin 4) sulfotransferase 12a (chst12a), mRNA 
\nGTGTGTGTGTTGCAGCTTAGATTTTGACGTGTAACTACTATTTAGGACAGCAGACAGGGTTATATATGAATTTAGGACAGTACTTAAACTTCATGGTTATCTGAAGCCGTGTAATGATTACAGCAGTTGCTGAAATCTCGCGAGGTTTCGGAGATCTCGCCTGATCGTGCGAAGAGCGGTCGCACATCATTCCGGAGGAGACGACGACGACGTCTGGGTGGAGGGTCTCGAGATGACTGATGGTGATATGGAGCTTCGGTGAGAATGGAACTCTCCCTGTCCAAACCAGACAAAATGGGCAAGACGAGGCTGTTTCGCATCTTTCTCATTTTAGGCTCTGTCTTCATGATCCTGCTGATCATCATCTACTGGGATGATGTTGGAGCCACCCATTTTTACCTGCACACAACCATATCCGGACCTCATTCTTCCCGCCTCCCACCCGAGAGTCATGCAGCTTCCAAAAACAAAGTTGAGGAGGACAAGGATGGCTCGTTCCTGGCCGACATTGACGCTTTTGTCAACCAGTTCCTGGAAGGCACCTCCGACCCTACGGAGCAAGTGAGAGCTGAAACGCCGCCCGGTGAGACTCACAACCAGTCCTCAGAAAAACCCGAGGAAAGATTCGTCCCCAGGCGCGAGTGGAAGATCCACCTGACCCCGATCGCCACAGAGAAGAAGCAAAGGCAGGACAGCAGGAAGCAGCTGATCCACGATCTTTGCAGCAGCAACAGCAGCTTCGACTTCCCAGGCAAGAACAGGACGTTCGATGACATCCCCAACAAGGAGCTGGACCACTTGATTGTGGACGACCGACACGGGATCATCTACTGCTACGTTCCCAAGGTGGCGTGCACCAACTGGAAGCGCATCATGATCGTGCTGAGCGAGAGCCTGCTGGTGAACGGCGCACCCTACCAGGATCCTCTGGACATCCCCGTCGAGCTCATCCACAACAGCAGCGTGCACTTCACCTTCAACAAGTTCTGGAAGCGCTACGGCAAGTTTTCTCGTCACTTGATGAAAATCAAACTCAAGAAGTATACCAAGTTCCTGTTCATCCGAGACCCTTTCGTGCGGCTCATCTCGGCTTACCGCAACAAGTTTGAGCTGGAGAACGAGGACTTCTACAAAAGATTCGCTGTGATAATGCTGAAAAGATACAGCAACTATGTCGACCCGCCGGCGTCGGTGGTGGACGCTTTCGCTGCTGGAATCCGACCGACTTTTTCAAACTTTATTCAGTATCTGTTAGATCCGAACACCGAGAAAGAAATGCCATTCAACGAGCACTGGAGGCAGATGTACCGCTTGTGCCACCCTTGCCAGATAAATTACGACTTTGTGGGAAAACTGGAGACCTTGGACGAGGACGCTGAGCATTTGTTGCGCATCCTGCGCGTGGACAATGTCGTCCAGTTCCCACCGAGTCGTCACAACAGGACGGTCAGCAGTTGGGAGCAGGACTGGTTCGCCGACATACCTTACGAATCACGCAGACAGTTGTACAAGCTCTACGAGGCTGACTTCAGACTGTTTGGGTATCCTAAACCTGAGAAGCTTTTAAACGAGTGAAATGGGTTTCTGAGTATTTTCTTGCTGTGGGTTATTTAACTGTAGTTCATTTGGTTAATGAGTAAATTTTTTTTTTTTTTGTGGGTCCCCTTTTCTCTGTGAGCATCGCTCCCGTTTGCTTATCACACAAGCATTAGAAAGGGTTGATTAGAGTGAAAACCGATATTACATTCAAATTTTTAAAAGTTTCCTGTATACAGATTTATACTTTTTATCTTCTTTTGAGAACACATCCGTCTGGCACGCAGTACTGTACTGTAAAGTCGGGCGAAGATGTAGGTTTTAATTATTATAGAATATCACAACAACAGTAATAATAATAATAATAATAATAATAATGGCTTATGCCTTTAGTTTTTCATAAAGTATTCTTTTTACTGTCCTCAATTAACCATCATTCATAGTTTCTTTCAATTTGATTTT
AAAGAAGTATGCAGCTTGAACATACAACTGCTATGTTCTGCACATTTAGGGCAGTGCACATAGAATATGTAGAATATTTTTGTATATTTGCTATTTTGGAAGAGCGAACTTTTAGCTTTATAAAGGAAAGGATTCACTGCACTCCTGTAGCATTGCAAGATCAAACCATTTTGCTGGCACTCATTAAGCGTAGCTTGTGTGTAGACATCACCTCATTTTTTATTTTTTTTTTCCATAGCATTTGCATTTTTATCACCCACCTCAGGATGCAAACACTTTTTTCAGACCTCATTTAAAATGTATTGAGTGCAAATGGATTTTCAGACGTTTACTTAGGAAAAAAAAGAAGAAAAAACCCGAGCAGTATTGGCTCTAATATGCACTCCACACAAGGTATTTCTGTTATTGCTGTGTGATGAAACAGTGTTTCTGAACATCTTCTGTTTTTTATGAATGTTTAATGTTTAACAGGCGTCAAAAAGACATTTCTTTAAAGCAGGGCAGTGCGGTTGACAGATTGGAGCTCCTGTTAGTTTTCATGGCATCTTTCCTTTCATCATTTGCATTCGTTTCTGCTTTGATTTGAACATCGGTTCCCCTGGCAGCAAGCCGCTCTCGCTTCATTGCTACATCTCTCTTATTGTCAGTGTGCCATGTGTGCCCTTTTTTAAATTTTTATTTATTTTTTTTTTATAAATGTCCATCTCTCAAGAGCTGGTCATGGATTGTGGACAAGTTTTACTTGTTCTGGTAGACTTAGCATTTAGCAAATGATGCCTGGTTTGAGTATTGTTTTGTCTAAATGCAGACTCAGCAGACGTGGAGCGGTCTTAAAGCACAAATATTTGTCCAAGGCCCTTAAACAGTAAACAGTTCACTTTAGGCGCCTGATTTGCTCTCCAGCGTTTCCCAGAATTCTCCATACGTAGTGGACTGTGTTTGCCAGCATCACGTCAGTTGTGCCTTCGTCAGCGGATGTTCGTGGACGTCCGCTTCTCCGTTGGTCCACAACACTTCCAGTCTTTTTGAATTTGTTAATAATGTGCTCGCCGTGTTTCCTTTTAAAGTCCATCTCAACCTTGCGACAGCTTCTGATCCAGCCATGAGAATGATTTCAATACGAGAATGATTTCTCAAGAAGACAATAGTTCTTCTTTTGTCAAAGGCATCTGTAAAGGATATCTGAAAAAAAAAATAATAATATAAACTAAGTATGAAACATTTTGGAAGATATTTTGCAAAAAAAAAACAAAAAAACCTTAATGTACATCCTATGTATGGAGACTTTTGGGATACCATGCAGAGTAAAGTAAGCGTGTCACAAGGACTTGCGAGGGATTTTACGTGGGAAGTTTTCGGTTTTCGGTTGCCGTCACGGTGTTTTTGCGTGTTGCATTTTGCACATGGAACAGTTCTTGTCCTGGATGAGAACGCCGTTTCTGAGAAACAGGAATGTGTTACGGTGAAATGGTGTACAGAGAGCAGGAGCGTTATGAAGCACAGTGTGACTGTAGTAGGTCAGAGGAGGAAGGTTTTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGGAAGCCTAAACCACCATCAGCAGCTGTACTAGAGGAGGCACTGCACCGGGTGCTAGCAGTGCCTTTCTTAAGATAAGATTTAAAAAGTTTACACAAACAAAAATAAATATGTATAATGTACAGGTATTTTTGTAAATGGGTCAAATTTGAGATTTTCTTTCTCACTTGCTAGTTAGATGATGGGAAAACATTTAAAAGTATTAAATTCTGTGTCGTGTAATTTTAATCCTAGGGGTTTTGTTTTAGTTCTGGCTGTATTGGCGAGATCTGTTTAGTTATTTTTCCATCATTTTCACTGTTGTTTATTTTTTTGTCACTCGATTCCCATAGTTTACAAAAAAAAACCAACGTCAATGCAGTTAAATGTCCGCACAGTATTTCCTGATGTTCTTGTGCCACAGTATTCACTGAAACGTTGACA
TAAATGACAGACACATGCTCGTTCGCTGGCTGATGTGAGATTTATATTAAAAAAAAAATATTCTGAGATGATTCTCCAACATGAAGGTTTTGTGTTTGCATGGAATATGTTCATTTCAAGGGAAATTGCTGTGTTTGCGATTCAAAAGGCGATGTGTATTTCTTAATGTTGCATCAACTGAAAAACATTCTCCAGTGTGCTGATCTGGAATACAGTTTTGTATTTGGCTGGTGTTTTTTGTTTGTTTTTGTTTTTTTAATTTATTACACTTTAAGGACCTTTGTTATGCAACGTCAAAAGAACAAATAAAGCTTAATGCATGGTGCAAAA\n>MF557355.1 Uncultured bacterium clone 1686 16S ribosomal RNA gene, partial sequence \nGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTCTCTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGGGACTTGAGTACTGGAGAGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAGGAACACCAGTGGCGAAGGCGGCTCTCTGGCCAGTAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCC\n>XM_012605072.2 PREDICTED: Gossypium raimondii heat stress transcription factor A-4b (LOC105780637), mRNA \nTGTTGTTACTAAGTCATAAGACTCGTATAATTAATAAACCCACTGTTTCCTATCTCTCTCATCTTCTTCTTCCTCTTGCTTTTTCCCCAAGTTTTTATTTTGGATTGGATTAGAAACTTCCACCCACGTGTTTGGTTTTTTTATTTAACTTCATATTTTTTCCTCAATACCCTTTCTAGATTATTTTCCTGGAAAATTTCCCTTTTTTCTTTTCATAATCCAACCCTGTTTGACAATTTTACATGGGATAAAGGAATATCTACTTTCCTCTGGATTGTTCTTCAAAGGTTTTTAGGGTTTAAAGGTTTACGTGCTTTCAGTGGAAGTGATCCTGGTTTCGATTTAGCTTCTGAAAATATCAATTGTTTTGACTTTTTTGATTTAAAAAGAAAAAGGAAAACGCAGGCATATGCTTGAGTTTGAATGAAATGGAAGGATCGCAGGGAAGTTGTAATGGGCCGCCGCCTTTTCTTACAAAGACATACGAGATGGTGGACGATCCAGTGACTGATTCGTTGGTGTCTTGGAGTGAAACTGGTTATAGTTTCGTTGTATGGAACCCCCCAGATTTCTCAAGAGATTTGCTCCCTAGATATTTCAAGCACAACAACTTCTCAAGCTTTGTCCGTCAGCTCAACACCTATGGGTTCAGAAAGATAGATCCTGATCAATGGGAGTTTGCAAACGAGGAGTTCATAAGAGGGCAGAAACATCTTTTAAAGAACATTTATCGACGCAAGCCAATCCATAGCCATTCCTTGAACCGGCAAGGAAGCTCTAGTGTGCCATTGACTGAGAAAGAGAAGAAGGAATTTGAGCAAGTGATCAAGATGTTGAGTGACGATAAGAACCGGCTTCAGTTACAGTTGCAGGGTCATCAAAAAGAGAACGAGGAATATCGGTGTCAAGTAAGGCTGTTATCGGAGCGTTTTCGGAACATGGAAGATCGACAACGACGAGTGATGGTCTCATTGGCTAGGATTATAGACAAACCCCATGTTCTGTCCCAATTTCATGGCAAAAAGAGAAAGTTATTGAACTGTAACGACTTCAATGATGAATGCAACATACAAGATCTTCACAGTTTGGCTTCTCTGAATGCAAACATGGGATTGGACTTGAAACAGATTGAAGAATTGGAATCATCTATAAGATGTTGGGAAACATTGTTTCTCGAAA
TCGGAGAAACTATAGGTGAAGAAGTGCGCGATTTCGGGACATCCTTACGGCCTTCTCCGGTTGTTGTTACCGAAATACAGACATCTTCAGGGGACTATGACATGGATGGTGAACTTTACTCACCTTCATCACACCATTGCTCCCCTTATTCAACCGATATTAACTCATCACCTGAGCTGGTAGCCCCTGCTTATCGTCCTATCCATACACCATCATTTCACCATGTCGTAAATCTCAACCCAAAGCCTCCTGGAATTGGCCTAAACTCCCAACATGCTAGTCCACTGGAGACCGATCAGGCCTCAAAGAACCAGGCAGAAGCAGTGGCGACCGGTTATACCGTGCCAGGTAGTGTAAACGATGGCTTCTGGGAAAGGTTTCTAACCGAAGTTCCGGATACATCATCGTATGCACAAGAGATCCAGTCAGTTTAGATTACCTGGCATAGCAGCTTTCTCCAGATTAAAGAATTTAGAGTAGGTTAAGTGATAGAAGTGAGCTATGCTATTAACCATGTATTACTTCTGCCACATACTATGATGTAAGGATATTAGGTTAGAGGACTCTGTATTTTTTGGTTTACGTTTATCTATCTTCTTTCTCTTAGTTATTTTAGCAACAATTTTCACTTTGAATTGAAGGTTATTTTTTTA\n>XR_002390227.1 PREDICTED: Heterocephalus glaber uncharacterized LOC110346290 (LOC110346290), ncRNA \nTTTCAGCTTTCTCCTGCCAGTTACCTCTATCTCAGGCAATATGTTTACACTATTTCTTGGTTTTTTCCATGACTGTTACACTAGGAAATTAGAATTTTCCTCTCTTATGCCCTCTGTACACTCAGCCCCCCCAGGCAGATGTATGATAAGTTGTGGTAAGATCAATATTCAACAGTCACTGTTTCATCTGTGTAAATGTTACTCCATGAGCTGTATTTATCTTCTTGTGCAACTGGGTTGCTGTATGTTAATAATTTTCCTGTGTTTGTTTTGTTTTGAGACAGGGTCTCACTATGTAGTCCTGGCTGGCCTTGAACTCATTATGCTGCTTAGGCTGGCCTTGAACCCTCCGAGATCCTCGTGCCTCGGCCTCCTGAGTGTTGGGATTGCAGGTGTGCACCACCATGTCCGGCCGTCTTGGTTTTCTAAGCATCTCTCTGCTTCATCACTGAGCGCCCATGAGTTGCTTCTCTACTGCTCCAACCCATGCGGGTGTTTCTAAGTCATAAGCCTGAGCTGGAACTTGGGATCCTCCTGCCTCAGCCTCCTAGAGCTGGGATTATAGACCTGCACTACCATGCTAAGCTTTTGGTGCCCTCCCCACCACCACCACCATGGGTCCAACTCAGGACCTTGCACTTGTGAGGTATATCCTGGAAGACTGAAATCACAGAAAATGGGCTGACATTTGCTCTAGGAGCCACGAGTCAGTCTTTCCTGGCGAACAGTTCAGGTGCATTCCACAGCTGGCTGAGTGCAATGTCCGTGTCCACGAGGCTAAGGCAGTTGGCAGTCACTGACACCATCTCATCTCCAAGTCTACTCCATCCTTAGTACAGTTAGTGTTTGCTGTCTCCTCCTGTCCTTTCACTTTGTTTTTAATGTGAATTTAGTATTTCTTTGCTGTTCTTCCTTGAACTGGGGTGTGTGGTGCACTTACCATTAAGTTAATTCAGTGAATATCTTTGGTTTATTCCTGGGAGGGAAAGTGGCTTTTGTTTATATTTGCTCTTGCCATTTGTTCCTACTTCACTTGAGTTTATTAGTTATTCCTTTCTGCCTTCCTTGAGTTAATCAAATATTTTTCACAGTTCCATTTTGATTTTTCTAGCAGCTTGAGCTATACCTCTGCATTATTGCTTCTGGTTACTCTGGGGCATTGGTGGCAACCCTGTGGTATGAGTGCAACAGCGGGCTGTATCATTGAAAGCTCTAAAAGGTTTGTCATCGCTGTTCTAGGGAT
TACAATATGTATCTTTTTCAAAATCTAATTAGTATTATGCTACTTTACACCAAAATTAGTAACTTTTAACAGTGTAATCCCATTTTCCCAGTCCATATAAAACACAACCCTGGATAGCATGTAGAGTCTCACAGCTAATTAAAAACTAGTTAGTATGCAGATATGGCTGTTTTTAAGTCAGTATGAAACAGTCTGGGACCTCGAGCAAACCCCACCAGTTAGCAATGAAAGAGATTTGGCCAAAGCACCCAGCAGTATTCATTTAAAAGCTTCATTTGGAGACATTCTACATGCAGTCATTCGGTGATGCATCCAGCACAGGGAGGCTGCTAACAGTGCATCCTGCAAACCTTTCAATCCTTTCAGAGTAAGAAAAGCCCAAAGGATGGATGGAACATCTGAATGGTCCCTGAGGTCTGTTTTGTTTCCCTGCTGGCTTAGCAGTCAGTCATCATGGAGACCTCAGTGTTAAATGTCACCCAAACGCCCTCACCCCAGAGACAGGAGGAGGCATACCACATGTCCTCAGGCAGTCACAGCATCCTCCTCCAGTCCATTCTTTAGGACAGCTGAGCTCCCTGACAAGGTGAAAGGAACAAAGTACTAAGATGATGAAAGCTGTATCACCAAGTCCTCCTGAGTGTGAGCATCATGCCCTGGTTCCCGTGCACTTGGTGAGGCTGCAACCAGGAGGCTAGGTACGATGCCCACTTCTGAGCTGAGCAGACAGGAAGGGTGAATTCCCAGAACCTGCTGTCAGGAACAAGCATCAGAGCAAAGACTCTAGCTCCTGGGAGAAACTCTCCAACCTAGTTGTGTGGCTGAAATTAGTAGGGAAAGGTGAGGAAGTTACGTCTATCTAAGAGCAGGAGGATTAAAAGCTGCCAACTAGGAAGGAAACTGAAATGCTTAAAAAGTTAAAAAAAAATTTTCATTGTAGTCTGATGAATATTTCGAAGTATATAGTAAGGTATTTAACAAGGACTGGTTACCTGTGTGTAGGTTAGAGATACTAAAGTGATATGGTGCGCTGTCAGCCATATGGGGTGCAGACTTCCTCCAAAGCAGATCAATAGACTTATTGTTAAAGACAACATGTGTATTGAAAGTAGCAATTTTATTTGAGTTAAAATTATTTACAAAAACCCAAAGACATACTTCATGAAACTGGTACAAACTATTTTTTTCCTGCCGTTGGCTTTTGCTCCAAAGATCACAGCTGAGAAATACTGTATAAAATAAAAATAGGATTGGATTCAGAAAAGTACTCTACTGTTCTAATTTCCAATTGGTAGTATTTACAGAAATATTTACAGTGG\n>XM_028898326.1 PREDICTED: Prosopis alba vestitone reductase-like (LOC114713661), transcript variant X1, mRNA 
\nATGGAAGACAGCAAAGGAAGAGTATGTGTTACTGGTGGTACTGGCTTCATAGGTTCTTGGATCATTAAGAGACTTCTTGAAGATGGCTACTCAGTTAATACTACCGTTAGATCCAACCCAGAACACAAGAAAGATGTGAGCTTCCTCACAGATTTGCCAGGAGCATCTCGGAGGCTACGAATTCTGAAGGCAGACCTAAGCGAGCCAGAAAGTTTCAAGGAAGCCATTGAAGGGTGCATTGGAGTATTCCATGTGGCTACTCCAGTGGATTTTGAGGAAGGGGAACCTGAAGAGATTGTGACCCAAAGATCCATTGATGGGGCATTGGGAATTCTGACGGCATGCCTCACTTCAAAAACTGTGAAGAGAGTCATTTACACTTCCAGTGCCTTTGCTGTTAATTATAGTGCCAAAGAAGAGGAAGTGAAGGATGAGAGCTCATGGACTGACGTGGATTCTCTTAGAACTTCAAAACCATTTGGATGGTCTTATGCAGTTTCTAAGACATTGACAGAGAAAGCAGTGCTTGAATATGGACAACAAAATGGATTAGATGTTGTCACTGTGCTTCCCAGTATTGTTGTTGGATCCTTCATTTGTCCTAAGCTTCCTGGTTCTGTTGGTTCGGCACTCTATTTTTTATTAAGTAAGAACGACCCATTTGCTTATCTGCAGCTACCTATGGTGCATGTGGATGACGTGGCAAGAGCACATGTATTTCTGCTTGAACATCCTAAGCCAAGGGGAAGATATAATTGTTCTTCATGTCTGGCTACTGTTGAAAAACCACTTGAAATTGTGTCTGCTAAATTTCCAGAACTTCAAATTCCAACCATAGAAGAAAGAGCTAGCCTGAAAGTTTCAGATCTGCCATCTAAGAAGCTTATAGATGCTGGATTTGAGTTCAAGTATGGACTTGAGGAAATGTTGGTGGATGCTATTGGATGCTGCAAAGAAAAGGGTTTTTTATAG\n>XM_044451096.1 PREDICTED: Varanus komodoensis leucine rich single-pass membrane protein 2 (LSMEM2), mRNA 
\nCCTGAGCAGCTGATGTGACAGGCAGAAGCCTGTGTTTACTTCCCCAACCGCTCCCAAGGGATCTGCATAGGCCCCTCATAACTTCTTCCAGACAGATTTTTTTCCCCTTGAGTTGCCTCCGGAACAGCCCAAGGAAGCGGAGTCTGGCTATTGGGATGTCCAGCGAGATTGCAGAAGGCGCTATGGTGAAGGAGGCCACTTCCTCGGATAGGGAGCTTGTTGAGCCCTGCGACACTGACAGGGCAGAAATCAACCTGCATGCAGTGGAATCCATTAGCGACTTGCACTACGCATCCGGCAGACCGGAGGGCTTCAAGGCTTCGGAAGGGAGCAGCCAATCTCAGCCTAACACCCCCTGGACTCCGCACAGTGCTTCCTCCAAGCATTTCTTCTTCCCGAATGAAGAGGACCCCTCCTTCCTGCCAGTCCAGAATTTGCACATTGCCCCCGATTTCTTCTGCTGCCCCTGCTTCAGCCCCACGTGCTGCCCCACAGGCTTCTTCGCTCTCCTCGGCGTGCTGGTAGTGGCCAGCCTTGGCCTGGCCACGCTGGCGGTCTATCTGAGCGTCCTGCAGCGCGAGTCACTCCGTGTCCTCAGCCAGTGGCTGGAGTCCCAAGAAGAGGCCATCCGGCAGATGAGAGCTGTGAGCGTACAGCTCTGGAGGCAGCTCAACGCCAGCGAGCCCGGGGCTCAAACCTGAGTTGCACTGCTCACCCACAGCCTCCTTTTGGGGGCGCTCAATTCCAGTGCGACAGAAGAGGGGACACCAACTCACTGCTTGGCACCTTTTGGACACTGACCTGTGCTGGTTTGGACTGTGTGATCCCAGAAGCTTAAAAAAAAAGCTCTTTTGAATCACGGGTGGGTCTTGTGAGGTTCGTGTGTCTTATTGGAAGCAAAAGCTGGAGACCTTGAGGCTGCCTCAGGCGGAGAGGGGGCAGGCAGGCAGGCAGATGTCCTACCGAGGAGTAAAGCAATTGGGGGTGGGGGGGGGTCTGCTCAGCAGCCTCCCACCAAGGGCAGCATCTCAGCCACTCTTCCTTTCCTTCCTCCACAGCATTTTAAAAGACATCACCTCCATCTTCTCTGTTTTTTCGCTCTGCTTCACTCTATGATTATTTAATGGTTTGCCAATGGAGCACCTATGCAGAAGTGCCTGACAGCACAAAATAAAACCCTCAAGTTTCTGCTGCCA\n>XM_004069731.4 PREDICTED: Oryzias latipes pyruvate dehydrogenase complex component X (pdhx), mRNA 
\nCAAAGCCAGAATTTACGGACTGGACGAGGGAGGACAGCAACATGGCGGTCTCCTTGCGCCTGGGTCGTCAGGGAGCTCTGCTTGGGCTCAGATTCAACCAATTTAAAAAATCAATATGTCCCACACATTATTTCCAGGACCGAGTTCGACAGTTTTTTCATTCACCATGGGCGCTTGGTGTCACTCCACTCAAAGTGCAAATGCCAGCTCTCTCCCCCACCATGGAGGAAGGGAACATTGTTAAATGGCTTAAAAAAGAAGGTGAGACCGTGGAAGCAGGTGATGCTCTCTGTGAGATCGAGACTGATAAGGCTGTGGTTACCATGGAATCCAGCGACGATGGGATCCTGGCAAAGATACTGATGGAAGAGGGCAGTCGCAATGTGCCCCTTGGCACTCTCATTGCCCTTCTGGTGGAGGAAGGACAAGACTGGAAGCAGGTTGAGGTCCCCTCACCAGATTCTCCATCTGCAGCTCCCACGATTCCCCATGAACCCACTGGCTCCTCTGTGACCCCCGCATCTCCTCCTCTTTTACCCAAACCTGCGACGTCAGGGCCGTTACGTTTAAGTCCAGCAGCACGACACATTCTCAACACCCATGGTATTAACCCAAAACTGGCCACACCCTCTGGACCAAGAGGACTCATTACAAAAGAAGATGCATTGAATCTTTTAAAGGCGTCCCCTCCACCCAAAGCAACACCAGTTGTTGCCACGGCAACTGTCCCAACTCCTGTTCAGAGACCCACCCACACCCCCACAGGTCCCCCACCACCTCCAGGCAGCAGACCGAACATCCCCCCTCTGTCTGTACCAGGGAAGCCCGGAGCACCAGGAACCTTCACAGAAGTCCCAGCCACAAACGTGCGGCGTGTGATCGCTCAAAGACTGACCCAATCAAAGACCACCATCCCACATGCATACGCCTCCATAGACTGTGACATGGCTGCCGTCATTAAGCTCCGTAAAGATCTGGCCAAAGAGCAAATCAAAGTGTCTGTCAATGATTTTATTATCAAAGCAGCCGCTGTTACTCTAAAACAAATGCCAGAGGTGAATGTGACTTGGTCTGGTGATGGACCCCATGCGCTCGATTCAGTCCACATCTCGATTGCTGTGGCGACGGACCGAGGCCTCATCACTCCTATTATCAGGGATGCAGCTAACAAAGGGGTGCAGGAGATCTCAGCTCAAGCTAAGGCACTGGCTCAAAAAGCTCGAGATGGCAAACTTCTTCCTGAGGAATACCAAGGAGGCTCGTTCAGCATATCTAACCTGGGCATGTTTGGAATCAGCGGCTTCAGTGCCGTCATCAACCCTCCTCAGGCTTGCATCCTGGCTGTCGGGACCTCCCGGGCTGAGCTGCAGCTGAAGGAAGAGGATCAGACCGTGCACACGCGGCAGCTCATGACAGTAACCATGTCCAGCGACGGACGACTTGTGGATGACGAGTTAGCGTCTCGGTTTCTTGATCAATTTCGTGCCAATCTAGAACAACCACAGCGTATGGCCCTCGCTTAAAAAAAAAACAAAAAAAAACAAAGATGAGGGGAAAGATAAGAGAAAATTTGAAAAGGTCTCAAGCTATGTCTTTTGACAAGCAAGGAGCTGAAACAGTTTGTGTCTGTCCTTTCTTTAAGGCTTTAAATAAGGTTGTGTACATACTGTGAACTTAAGTTTGTGGCCTCTCTGCTTATTGTCCGCAAGTTTTTGGAGTGGAAATGGATTTCTCCCTAAATTTAAAGGGCTTGTGCAGTGGTTCCACATTCTACCATGAAAGATAAGACGGCAAATGTGATCCATCACACGGGTGTTGTGTATATAAAGAAGTAATTCTTCAATTTCCAGGTCAGACTTCATGAAAGTTGTTTCACTAAACGTAAACGTGAAATTGGTGAAGTCTCCTCATGTAAATTTGTGAGATATTTATTATTTAACATAAGTGACACTGCAGGTAAAATCCATGTAAAGCAGCATTTATTGTTGCTCATTATAA
AAGTAAACTTAGTATGTGAACAAATTTATAAATTTATTCAGAATCACACATAAAGAAACATCTCCTTCTGGTCCACATGTATACATCAGGTTTGGTTTTGTTGTCTTAAACTCTGTCCAAGCAATAAAAGTCCTGTTCAACCATCTGA\n>XR_004159256.1 PREDICTED: Meleagris gallopavo uncharacterized LOC116216471 (LOC116216471), ncRNA \nACCACTGAACAGAGCCTGGCTCTGTCCTCTTTGCATCTCCCATTTTATATATGTTAATGGGACCTCCTTGGGCATTCTCTTTTCTAGCTGATCAGTCTCAGCTCCCTCAGCCTCTCCTCATGGAAGTGCTTGGTATACCCAGGCTAATTTGGAATGACTACCTATTGCTGTCAAAATAGATACCCTACTAACAATTCATTCAATAGGAGCTTACTGCTGTGGAGAAGCTGCCTGCTGCAGTAACAGCATGACATGTTCAGACTTGTTATGTTGCCTGACAGCCTTGACATATTTGCTCTGTTTCCTCTATTTGTATAATGGTCTCTGGCTACAACACACATCCCTGGACATGAATTTTCATTTTAAAGTTCCCAAATGGCCTTCATGAAACTTGTGTGCATATAACCCCAGTATTGCAGAAATAAGTACATCAATCGCAAACTTCAGAAGGGGAGCATGTTTTACACCTGACTGCTCTTCCTAACCCAGAATCCATTTGTTTATTGTATTTTAGTTTGGATTTACACACTAGCGATATGTCTTCTTACTTTATGCAACATTGCAATATTACTGCTTTACATAGAAAAAACATTGGCTGCACTGAGTCTCTGTTTAAAAACTGTTTGGATGTGGTGCTCAGGGACGTGATTTAGCAGAGGGTTGTTGGAGTTAGGGTAGTATGGCTAGGTTGTGGTTGGAATTGATGATCTTTAAGGTTTTTGCAATCTGTAATTCAATGATTTTTGTGATTCTGCAGTGAAAATGCTAAGTCTCGGCTTGGAACAGTGATTGAGCAGCTGGTGGGAAGGCAGGGCCAGCCCAGGAGAACTCAGGTGGATGCACTGTGCTCATTTAAGGGCTGGCAGTGGAGGAAGGTGCATATAAAATGAGAGTTTTCCCTTAAATGAAATATAAGAAATTTCCTAGACTTCTGCTGTGTAACCTACGCTGCTTCCAGCTTCTCCTGATGAGCAACTTGGTAACTGTGCTTTTTGCTCTTTCCTGATGAAGAACTGCTGCCTTCACTGCTCCATTTCCTGCATTGCTCACTCCACCATCCGACACCTTCAGAAAATATTGCCACCTGTTGAGAAATTTTACAATCTTCCTGCCTCTTGATGATGTGTGGGATTTGGAGGAGAGTGGATAAATAGAAGAAGACCTGTAGCCTCTTCATTTGCATCCTTGACCTGCTCAAGGCTTGGGCAGTACCTTGGTGAAGGACTGTTGGTGGTGGTCTCAGAGGAACAACCAGTTAAGAAGTATACTGGAGTTTTGAAAGAACTACATGGACTGAAGTGAAGATCATGTTCCCAAACTTCTGATTCAATGGAAAGCATCCTTTAGCTTGATACAGAGCTATACACTGTCAAAAGGCTTTTTCACATCTCTTTGGGAGACAGATTCAGCCACATGCTCTCGTCATTCACAGTGGAACTTCATGGGTAGGCAGAGGACCTCTCCCTCCGGGCTGATCTGGATGGGGAATGCCCACGGTACCTGGCACCTG\n>XM_041282614.1 Brettanomyces bruxellensis uncharacterized protein (BRETT_004118), partial mRNA 
\nATGCCACCGAGAAAAAGAAGAGGCAGAAAGAAAGCCACTTCTGTATCGAAGAAAGCAACCAGAACTAATTCTTCACATGGTACAAGTGATGCCACGCAAGATACCTTGAAAGATGGTGAGAAGAAGATTGAAGAAGCAGCTAAAACTCCCAAAATCACAAAAGATCTCAAAGAGTTGGAGGAAGAACGGAAAGACGCGAAAAGTGAAAAGCATGGCCAAAGTTTACCTGTTACGACTGATGCAACAATTGAAAGCAATGTTAAATCAATAGATTTGAAAAAAGCAGAGCCCAGTAATGTGCTGTCTAAAGAGAAAGAAAAGGATGCATTTGCAGAAACAGAAGCTGATGACATAATGAAGATAGTGAATGAGACGAACGATAAGAAAAGGAGTATAATGAGTCCAATTAAGAGTTTGCAAATAAGCCCTTTAAAGAATATAATAAAAGGCGATACAAAAGATCTAAAACCTGATGCAGGAAGTCCGATCAAACGCAGAAAACTTGATCCTTCTCCAGAACGAAATGTTGATAGAGACACAAGATCTATGGAAATGCACGTTGGTTTATTGTTTCAGAAGAAAGACTTAAAGGGTCTCACTGCCATTTCTCAGAAGACTTCCAGGAGGTCTGCCCAGACATTTGAAAATTACAAAAAGCTAGTTGATCGACGCGCAAAAACTGCAGAGATTATTATTGCGAACCTTACAAAAGAGAATAAGACTTTAAAGAACACAATCAAGGGACTCAGAACTGAGAATCGACATTCAACGAATGCAGTGGATAGCAAAGAGATAAACAAATGGAAAACAAAGGAAGTAGAAACTAGAAAGAAACTAGACAAGTTGGAAGAAGCCAAGAATAGCATAGAATCAAAACTTTCCGATGCGAACAACGAATTAGTGCTATCAGATTCAAAACAGGAAATGATCGAACTGCTATGTGGAACAGCATGTCTTGATTACGAGGAAAATGAAAAAAGCATTATATTTGCGCTTAGACAAAGTGGTACACTGTGTACATTATACTATCAACTCATCATAAATAAGTCCGAGCCATCAGATTTAATATACTCCCCAGTTCAAAAGAAACCGCAGGAATGGCCTACGGATAGTGCAATTTCATGGAAGGTGAATATGGATCGGTTGCACTCACTTCTTCCAGAATACTTGTTGGACAATCTTACTTTCCCTTCAAGCAACTTGAGAAACTTTTATCGAAAAATATCAAAAGCCGTGAATGGAATGGGAAAGCAGAAAGAGGCAGCATGA\n>XM_013019345.1 PREDICTED: Dipodomys ordii tumor protein p63 (Tp63), transcript variant X7, mRNA 
\nAAAACTTTTTTTTATCCCCAGAAGAGTGGACAGATACCATCAAATCAACTCAGTATCCAAACCCAAGGAAATGTAATTTAGCTGGAGGGAGATGGCCATTCCTCAGACTTGTTATAAAAGTCCAGGCTGCTGAAATTAAACTCTGATGCCATTCAAGCCAACATCCAATCAGGAGAGAGATCAGAAGTTCAGAGATGCCTCCAAGTTGCCAGCAAGTGTGGCCACTGTATGTCAAGGACTCTAAAGCCGTGGAAGAAAGGGAAGAACAACTTTAGTGAGGATGCCCAGCTGGTAAGAATCAACTGTTTGTGATGTTTTAGTCACTTGAGGAATCTCATTGGCTAACTTGAAGAAAGGCTCCACCTCTTTGCAAATATGTGGAATGGGAGAGAGGGGGTGAGGAAGGGGAAGTGTCTGAACTTCTATATCTGATGGCATCTGACCCTAATGCTTTAAGCCTCCTGGCCATATATCTACATATACACAGGTATATGTGTATGTTTTATATAATTGCTCTCCATTTGTTGATATCAAAGAGAGTTGAAGGAAATGAATTTTGAAACGTCACGGTGTGCTCCCCTACAGTACTGCCCCGACCCTTACATCCAGCGTTTCATAGAAACCCCAGCGCATTTCTCTTGGAAAGAAAGTTATTACCGATCCACCATGTCCCAGAGCACACAAACAAGTGAATTCCTCAGTCCAGAGGTTTTCCAGCATATCTGGGATTTTCTGGAACAGCCTATATGTTCAGTTCAACCCATTGACTTGAACTTTGTGGATGAGCCATCAGAAAATGGAGCAACAAACAAGATTGAAATTAGCATGGACTGTATCCGCATGCAAGACTCAGACCTCAGTGACCCCATGTGGCCACAGTACACGAACCTGGGGCTCCTGAACAGCATGGACCAGCAGATCCAGAATGGCTCCTCGTCCACCAGCCCCTACAACACAGACCATGCACAGAACAGCGTCACGGCGCCCTCGCCCTATGCGCAGCCCAGCTCCACCTTTGACGCCCTCTCTCCATCACCTGCCATTCCCTCCAACACAGACTACCCAGGCCCGCACAGCTTCGATGTGTCTTTCCAGCAGTCGAGTACCGCCAAGTCGGCCACCTGGACGTATTCCACAGAGCTGAAGAAGCTATACTGCCAAATCGCAAAGACATGCCCCATCCAGATCAAGGTGATGACCCCTCCACCCCAGGGTGCTGTTATCCGTGCCATGCCTGTCTACAAGAAAGCTGAGCATGTCACTGAGGTGGTGAAGCGGTGCCCCAACCATGAGCTGAGCCGAGAATTCAATGAGGGACAGATGGCTCCTCCTAGTCATTTGATCCGAGTAGAAGGGAACAGCCACGCCCAATATGTAGAAGACCCTATCACAGGAAGGCAGAGTGTACTGGTACCTTATGAGCCACCTCAGGTTGGCACGGAATTTACCACTGTCCTGTATAATTTCATGTGCAACAGCAGCTGTGTCGGAGGGATGAACCGTCGTCCAATTTTAATCATCGTTACTCTGGAAACCAGAGATGGGCAAGTCCTGGGCCGCCGTTGCTTTGAGGCCCGGATCTGCGCTTGTCCTGGAAGAGACAGGAAGGCGGATGAAGACAGCATCCGCAAGCAGCAAGTTTCAGACAGTACAAAGAATGGTGATGCTTTTCGTCAGAACACACATGGCATCCAGATGACATCTATCAAGAAACGAAGATCCCCAGATGATGAGCTTCTATACTTACCAGTGAGAGGCCGTGAGACTTATGAGATGCTGTTGAAGATCAAAGAATCCCTGGAGCTCATGCAGTATCTTCCTCAGCACACAATTGAAACCTACAGGCAGCAGCAACAGCAGCAGCACCAGCACTTACTTCAGAAACATCTCCTTTCAGCCTGCTTCAGGAATGAGCTTGTGGAGCCCCGGAGAGAAACTCCGAAACAATCTGACATCTTCTTTAGACATTCCAACCCCCCAAACCAGTCAGTGTACCCA
TAGAACCCCATTTCTGTATTTGAGTGTGTGAGGTCATTATGTTTCCGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGAGTGTGTTTATACCCAGCTCTCATAAATAGAACTTGAAGACATTTTGGCTCAGAGACCCAACTGCTCAAAGGCACACAGCCACTAGTGAGAAAGAATCTTTTGAAGGGACTCAAAACTTTACAAGAAAGTATGCTTGCTGCAGATTTTGTACCCTTAGATCCAGCATTGGTTGGACAGGAACCACTGTTGTGTATGTTTGTGAGCTTTTTGTTGTTTCCTGGGAGGGAGGGGATCAGGTGGGGAAAGGGTATTACAATGTTTATAAGACTCCTCTTCTGTTGCTTTCTGTTGTATTTCTAAAACTCATAATGAAGCTTTTGAGCAGGTCTCAAA\n>XM_044435426.1 PREDICTED: Varanus komodoensis meiosis initiator (MEIOSIN), mRNA \nATGTGGGACCAAATTGGCCGTGTTTGCCCTGAGGAATTACAGCTGAACAGCAAAAAAATCAAACAGAATTCTGATCGAAGAAAACACAGTAACTATACCAGCACTCTTAAAGAACTGGCTCAGATGTTGCCCATCCCTTTGCGGACAAGCTGCAAAAGGTTAACAAAGAAAGAAATGCTTCTCCGAGTCCTCCGTTACATCGAACACCTGCAGGCAAGCATTGATACAGCAAGATCTCTGCTCCAGGTCCACTCTGGGGAGCAAAAAGCAGGAGAATCTGAGCAGATGGTGACAACTGCCCTAAAGAGCGGGCGAAGAGAAACTACACCACGAGTAAAGAAAACGAAGCCACTGGCTGTCTGCAAGAAACCCAGGAAGAGGAGACGCACCCATAAATCAGAGCAACAAGGGGTGAACAAGAAAGTGTGCAAGAGCCTTGCTCTGGAGACCGGAAAGAGCCCTTCCCAAGCCGACGAACAACAGGAGGAGAACCCATCTGCATTGGGAGTTTGGAACTTGAGTGGCAACCATGAAGAAAGCAAGGATTATGCCAATGTGTTTTCTGCGTGTGAAGCTTATGAAGAGCCGCATCGATACACCGAAGTGCCTACGCATTCATTGATGGGGCAGGAGCTGGTGTACTACTATTCCTCTTGTGAGGAAGATGAGGAGGAAGGACCTGAAGCCAGCCCTTGGCTCTCAACCTGGTCCCCTGTGGGCATTTCACATGGTGACCTGCAGCTCTGTTCGCCTGCGATCATCACCCAAAGCAACCGTTGCACAGATCTGGGGTTGAGCCCTTCGCTTTTTTCCTCTCCAGCTCGGTTGCTGCCTACACACATCCTGCAAGGTGGCCAGGAGGAGTTTTCCCCAGTGCTGTTCGAAGATGTATGCCTGTCCCCACAGCCTGGTAGTTTTTCTCAGTCCCTCTCAGGCACCCTGTTAAGAAAGTCAGCATTCACGCTGGATCACTGCTACCTTTCCAACAGCGAAACAGGTAAAAGCAGTTCCAGTCCTGTGTCAAGAGAAAATGAGATCAAGTCATCATGGAACAAGCAGTTCCTTCAAGAGGAAGTTCACACTGCCAGGCCCGAATGCCCTCTGTCCTCCAGTGATGAGAACAGTGACAGCACTTGGACCCCATGCAAGAGGACGAAGCCATCCAGGGCGGCCCGTCGGAAGAAGAAGAAGAAGAAGAAGAGGAAGAAGAAGAAGCGAGCAGGCAGAAGGCAGAGGTGCCGGCCAGTAGCCCGCGAGAAGGGCAGCAACGCCTCCCCTTTGCAGCTGAAGAAGAAGTGTGTGAATGGCTTTATCATGTTTTGCCGCCTGAACCGCAAGCACTTCATCCGCGCTTGTCCAGGCATGGCCTCCACAGCTGCCACAAGAGAGCTGGCCCAGCTGTGGCGTGTGATGACGAAGCAGGAGCGCCACCCATATTGCTTGAAAGCACGGAGATTCAGCCGTCTGAACAATCGCATTGTGAGAGATGACTTCTCTA
GCGGGGAAGAGGAACCAGAGCCACCCAAACCTTTCCATCTGCTACTCGCTGAGAAATCCCTCCCTGGCACTGAGAATTTTGGTGACTTCTCTTTACTATAG\n>XM_031628525.2 PREDICTED: Nymphaea colorata UPF0548 protein At2g17695 (LOC116253610), transcript variant X2, mRNA \nATCTTATTTTTAAGAAGAATTGAAGATGAGAGAGGGAGAGAGATCTGGCAGCAGGTCTGTCTCCCACAAAATGGTGTTCCTGTTCTGGAATCGACCGTCGCCTCATCAACAGTCCGCCTGCCTCAAGCAGGCGGGAGACTTTAACTACGACTCAAAATATCGTTGCTTGACTTCTTCCCCTTCGGATTGCAACCCAAATTCAGCGTCATCTTCGCCGCCACTACCGTCTTCATCTTTGTCTGAGCTCCGACATGGCTCCAACCGCGATGGTTTCGTCGTTAACCGCGCCCGCGTCCTTCTTGGCTCCGGACTCCAGACATACCAACAAGGAAAGCGAGCTCTTCAAGCTTGGAAGCACTTCGGCTTGGATTGGGCGTTTGTGGATCCCAGCAGTCCCGTCGAGGTTGGGGAGAGGTTCTGCGTGTGCGTGAAAGAGCTTGTCCCTTGGGCTGTTCTGCCTCTTCAGATCGTCTACGTTAACGACCATGATGCTGTCAAAGATGGTTCCCTTAAAAGGGGTTTGACGGCCTCCTTCGCTTTCGGGAGCGGAACCCTTCGAGGCCATTTATTGGCTGGAGAAGAGCGGTTCTCGGTTGAGCTGGACGAGGACAACAAAGTGTGGTACGAAATATTCTCAATTTCCAAGCCCGCCCACCTACTTTCCTTTGTCGGTTATCCTTATGTCCGTTTTCGGCAGAAGTACTTCGCCCAACAATCAATGGATGCACTTGTACGACATGTCCACTCTCAAGAGCGTGCTTAATGCAAAGTTCATATCGAAGTCCTCTTGCTCCTGTTATGGCACCAAGAAATTGTTATGGCACCAAGAAATATTGCACACTTCAAAATACATGAGTACTTAGTATTTTCACTCA\n>JN440548.1 Uncultured organism clone SBYB_3744 16S ribosomal RNA gene, partial sequence \nAAAGCAGCTAACTACGATAAACTGGACGGTAAGGGACGAAAGCTTGGGTAGCGAACGGGATTTAGATACCCCGGTAGTCCAAGCCGTAAATGATGCTTGCTAGATGTTTTGGACCCTTGTGGTCTGGAGTGTCGTAATCTAACGAGTTAAGCAAGCCGCCTGGGTAGTATATTCGCAAGAATGATACTCAAAGGGATAGGCGGGGGTACACACAAGCAGTGGATTGTCTAGATTAATTGGACAATAAGCCAAGAATCTTACCTAGATTTGACATGTACTATGTCCTATGTGAAAGCATAGTAGTCCGAGCAATCGGACATGGTATACAGGTGGTGCATGGTCGTCGTCAGCTCGTGCCGTAAGGTGTCTAGTTAAGTCTGGAAACGAGCGCAACCCTCATCTTTAGTTAGAATGTCTAAAGAGACTGCTCTGGTAACGGAGAGGAAGGAGAGGATGACCGTCAGATCCTCATGCCCCTTACATCTAGGGCTTCATAGACAATACAATGGGTGATACAACGAGAAGCTAACACGTGAGGTGGAGCAAACCTCTAAAGTTATCCCAAGTTCGGATGCTAGTCTGGNACTCGACTACATGAAGTTGGNATTGCTAGTAATGNCGGGTCAGCTACACCGCCGTGNATATGTNCCTGTCCATGCACTCACCGCCCGTCANACCATGGGAGCTG\n>XM_036157752.1 PREDICTED: Mus musculus predicted gene, 38699 (Gm38699), transcript variant X8, mRNA 
\nCGATTGGTGGTCAGGCCTGCGCCCGGCACCGCCGGGCGGTCCTCCGCGCCATCCCCAGCCGGGCCCTCCCCTTTCCGCGGGAGGCTTCCGGGACAGCGGGTTGGTGGCGCGCAGTTCCCCTTGACTGTGCGCGCCCGCGTCTGGGCTCCTTTGCAGAGGACTCGGTAGCTGCAGCTCCCGGAGCACAGCAGACAGAGCTGCAGGCTGCGTGCGCCCCTGCTGCCACCGGACCTGCCGCGGTGGCTCCCGCGCCCCGCGGCGACTTCCGCACCCGCGCTTATCTTTGCTTAAGTCCCCGAGCGGCGGCGGGGTCGGAGCCCGCGCCTTGGGCGACTGAGGCGGCCGCAGTTCGCGGCCCGGCGCCCTGGCGATGCCAGACCAGATCTCCGTGTCGGAATTCGTGGCCGAGACCCTTGAGGACTACAAGGCGCCCACGGCCTCTAGCTTCACCATGCGCACGGCCCAGTGCCGGGACACCGTGGCGGCCATCGAGGAGGCTACACTTGGGAAACCCATCATATTGAAGGACATTGTCAAAGTTCGAGAAGAAATGAAAGCTGCGGGTGGTGTTGGTGTTGGGCTGTGTGTGTGCCTTCCCTTCTTTTGTAGACAGTAAGAGATTATTTACTACCTGTGTTTTCATGTGTATCCTTAACTTCCTCGGTTAGATTCTACCTCTATCTCTTTGTGTTGGTCAGTATGTTTAGAGAGAGGTTGTTTAAATTTGAGTTTATCGTGGACTATCTTAATTTTTTCCATTAACGGTGTAGTCCTTTTTTTACATATTAAAATCCAGGCATCTGTTGTTTTTGCAGCACATGTGTGCAAACCCTTCTGGCGTCTACAAACTCCAAGAAGACATCTGTGATCTTTTTTTTTTTGTTTGGTTTGGTTTGGTTTTTTTTTTTTGTTGTTTGTTTGTTTGTTTGTTTGTTTGTTTTTGAGACAGGGTTTCTCTGTATAGCTCTGGCTATCCTGGAATTCACTTTATAGACCAGGCTGGCCTCGAACTCAGAAATCCGCCTGCCTCTGCCTCCTGAGTGCTGGGATTAAAGGTGTGCGCCACCACGCCCGGCCTGAAGACATCTGTGATCTTAATAGATCTTCCTTTATGTTTTTCCTGGCTTTTTACCTTTGCAGCTTTTAGTATTCTTTCCTTGAACTGTATGTTTTGATTATTACACAGGAAAGAGACTTTATTTTATAGTCCCTTCTGTTTGGTGTTTTGATGATTCTTGTGTTTTCTTTATGTTAGGAAGTTTTTCTTCTAGGATTTGGTTGTCAATACTTTCTGAGACTTTGAGGGAGGATTCTCCTTCCTCTCTTCCTAAGTATTCTTATGTTTAGTCCTTTTACAGTGTCCTGGATTTCCGTGATATTTTATATCAGGAAGATTTAGACTTACCATTTTTTTTTGTTTTTTTTTTTTTTGTCTGATTTACCCATTCCTTCTATTGCTTATTCAATGATTGAGATTTTTCTCCGTATCTCTGTTCTCTGGGTGAACTTTGCCTCTGTAGTTCCTTTTTGCAGTCCTAAATTTTTATTTCCACTATTTCCTAAGATTTAGTTTTCTTTTTTTGCTTCTATTTCCACTTTTATGTATTGAATAGTTTTGTTTACTTCACCCATTGGTGTGTTCTTTCTACGCTTTGTTTATAGGAATTTTGGCTTCCTCTACTTTTTGGTTTGTGTGTTCCTGGCCTTCTTTATGGAATTTATTGATTTCCTCTAATTTTGTTCTGTTTTCCTGGATTTCTCTAAGTGATTTGATCATTTCCTCTTTAAGGAACTCTGTCATCTCCATACATTTGGGGTTAGAGTGTTTTTCTTGTAATTTAGCTTTGTTGGAATATTTAAGACCTTCTTTGACAATATAAATGAGATCAGAGTCATTAGCCAGAGAGTGATAAATGCTGGTCCTTATTACATTATCGAGTACCAATGTCATGGAATGGAATGGCGCTATCTAACCTAAGTATTCAGCTTAGATTTAAC
CCAATGTTTGATTAATCCCAAGGCTGTCCTTTCCCTTTACACTGGACAGGTAGCCAAGTGAGGCACTTTTTGAAACAGTTACTTTTTGTGAGACACCTGTTTTTAATCACTAACCTTGGGTTAACCATTTAAAAAAAAAAAGACCTGATGTTTACAGGGTGAGTGACTTTGTAATTTTCCAAAATGTATTTATTCATGTCTTGTGAATGAAGACAGACCAGATTGATAGATATGTAAATTGGGGACTTTAGCTTGATTCAAGCAATATTGAATTTCTGACTTTGGAAATATGTCCAATGCACTTTCAGGCTTTATTCAGCTCAGATGATTGTGACACAGGCCATTGGCTGTAGTTATGTGTCATGTTACAGATCACAGCAACTGATATTGCACACAGGAGCCAGGTCAAAGAGTATTGTATTAATGCCATTGTTTTCTGCCAGATAACTTCTCTCTCTCTCTCTCTGTATATATATATATGTATATGCATATATATGTATATATATATAATTATGTTTCATTTTTCCTTTTTTAATTAATTAATTAATTTATGTACATCCTGTTCCTGTTCCACTGTGGATAGAGAGACAAGGCAGTCCTCTGGTACATATGTGCCTGAGGCAATGAGCCAATCCCTGGATGCTCCTTGGTTTTTGCTTGGAGGTCTGAAGTGTCCAGGTCAGCTCAAAGTTTTGTTCTTATCGGGTTGCCATCTTCTTCACCCCCTTAAGTCAGTACAGTGACCTGCCCTTATGTAACATTTCAACCTACAACAATATATCGATATATCGATCTACATATTTCTATATCTATCTATCTATTCATCTATATATCTATATAGCTTTAATCTATACATCTATATATCTATATATCACCTATTAATCTATATATCTACATATCTATATGTATATATCTATACACCTATACATCTATATATCTATCCATATATCAATAAATATATATAATCTCTATATATTATCTATAAATCTACATATCTATAAATCTATATATAAAATCTATATATCTAAAATATATATATACACATATATGTATATTTTTAAATCTATCTATCTATCCATCCATCTATGTATCTATAAGTCTATCCATATGTTTAGCTTGATGTAGCTTTTTTCTTTTTCTGCCAGATAACATATACATATATATTCAATTATGTTTCAATTTTTATTTTTTTAATTAATTTTTTTATTTATTTAAGTACATCCTGTTCCTGTCCCATTGTGGACAGAGAGACAAGGCAGTCCTCTGCTACACATGTGCCTGGGGCAATGAGCCAGCCCCTGGATGCTCCTTGGTTTTTGGCTGGGAGGTCTGAAGTGTTCAGATTGGCTCACGGTTTTGTTTTTCCTATCAGGTTGCCATCCTCTTCACCCCCTGAAGTCAGTACACTGACCTGTCCTTATATAACATTTCAACCTACAACAATATATCAGTATATTGACCTACATATTTCTATATCTACTATCTATTCTTCTATATATCTATTTATCATCTATATATCTTCAATCTATACATATATATATCACCTATAAATCTATATATCTACATATCTATACATATATATTTATATATCTATACATCTATATATCTGTCCATATATCAGTAAATCTAGATAGATAGATATCATCTATCTATCTATCTATCTATCTATCTATCTATCTATCTATATAAATCTATATAAAATCTATATATCTATAAATTCTATCTCTATCCATCTGTCTATCTATATGTTTAGCTTGATGTAGCCTTGTCTTAAAGGACTGTTATGTTCTAGGTTTCAGACGTTCAGGCTGAGAGGAAACAGTATGAGTAACATTTGATCTAATACCAGATCCTCGACTCTGGACCCATATTTTATGATAATTTTGGGATTATGATTACATCATTCCTACCTCCTGTGATCAATCAGTAAACACATCTAATGCCAGCAGCTGGCAAGAAGAAAGGTTGATGGCATTTCAGTTCTCGGCCTCGGTGTCTTT
GGAAGAGACCATGACGGAGAGGGAAGAAGAAGCAGGAAAAAGGTCCCATGGGTGGATGGATTGGGAGAGCATGTCCAGGAGGGCGAGCCTGAGAGTATGAGCAGCCTGGGCAGAATATGGCAAGTGAGCCGGGCATGGTGGCACTCGCCTTTAATCCCAGCACTTGGGAGGCAGAGGCAGGCAGATTTCTGAGTTCTAAACCAGCTTGGTCTACAAAGTGAGTTCCAGGACAGCCAGGACTATACAGAGAAACCCTGTCTCGAAAAAAATTTTAAAAAAAAGAATATGGCGAGTGATATCTCACAGTTCTTAGTAAAGAAGTAAAGAAATTAGCATAGGGGAATGGTATCTGCCCCATGCTGGTGCTTTAATGCTTATAATTATAATTATTATTATTATTTCTTATTTTATTTTTTCACATTATCATTTACTGCATTATTATATCATATTATTTAATATTATTTCTTTTTATTATTTCATATTATTTATTATTTTATTATTTGATAGCATTGTTTCTTATTCTTATTATTTCTTATTAGTTTATTATCATTTCTTTTTCTCTTCTTCGTATTATTATTATTTCATACCTCTATAATTTATGTGGTGGTAAGAGATCCACAAGTAATATTTACCACAACAAGTTGGATGCAAAAACAGCTTGTACCCAATGAGAAATATGGCCAAAAGTTATTTTCTTGGGATACAGGAAGAAAGTCCTCTGGGGTCTCTGCTAATAAGGTCACACACACACATACCCCATACACATACCCCCACACAAACATGCACACACACACATACTACATACATACA\n>XM_012367441.1 PREDICTED: Linepithema humile MAP kinase-activating death domain protein (LOC105672481), transcript variant X6, mRNA \nATTTTTAATTTTCTCGGATAATTATACTTACTACGAATATAAAAATCATGTAACGTTAAAGATTGCATCATGCCAGTATTAGGATTAAAATAATAAATTGTATATTCGAGGCTCTTTGGTCTTCAATATAAATTAGTATAGATTTTTATATATTCAATCTAAACTAAACCTTAGATTTTGCGTCAGTTTTGTATCAGAATCTAAAGAAGTAACTGTAGATTTTTTTAAAGGTATTTTAAAGGTATTAAAGGTATAGATATTTAAAGATACGATATAAAGATTATATGATCGATCTAATCAAATCTATAAATATATAGAATAATATTTACAATATAGTTTACGTTTTACGCACTCTTTAAAGCAAACGTTGTATATTTTATATCCTGCGTAAAAAATCAATATCATCTAATACGGTCTAAAATCATATTTTATTACAAAGAAGCGCAATGTTGAAAACTCTTTGGAACTACAGCGTTCGGTTGTTTTCCACTCATTATTCAACCGCGCTTCAACGAGCGAGAAAACGGAAGGATATCGAGCCGACGACAGGGTGTCCCAATAACGGGAGCGGAAATTCACTTTCGGAAGCGGAATCGGGATTCTAGCGCCGGTACTGGAGGCGCGTCCGTCCAGACGTGCGCCTGCCTGGTTCCGGCGAACGATCAGCGGCGCGACGGCGTCGCGACGACCGCGAAGCTCCGGGGCGCGTCGGCGGATCGCCAGTGTGATATCGCCACTTGGCTGATACGGAATACGGCCTGGCCGTCATTCGTATGGCAGTCGGACGAGAACGCGCGGCAGTCACTCGCGTTAACGCGCATTGCAAAACGTGGAATTAATAAGCGAGATAATGGTACAATCATGATTCAAGCTGGAAACGATCTTGAGGAGAGTTCAGAGGCTTGGCTGTCCTGTATATACTGCATACAACGGTGACACAGCTGTATATACATAAATCACAATTATGGATATACAGAAGAAATTCCTGTGCCCCCGATTGGTGGACTACCTCGCCATCGTTGGAGCCAGGATGCCCGCTGTCTCTCGTCAGCC
CGTACAGGTCCCAGAGTTGCTACGCAGATATCCGGTAGAGGATCACAAGGATTTTCCTCTGCCTTTGGATATGGTGTACTTCTGCCAACCAGAAGGTTGCAGTAGCGTGGGACCAAAGCGCACGGCCTTACGAGAGGCAACATCCTTCACTTTTACACTCACCGATAAAGATTCAGGAAGAACGCGTTATGGGATTTGCGTGAATTTTTACCGATCTATGGAAAGGGCGGGGCTTGTGGCTGGCGGGGGAATTGCGCTCAAGAGGGAAAAATACAACACCACGTTTCGAAGGGAAAGCTGGAGGAAGAGTATGGAGAGAAGCACGGATTCCGCTTTTTCTAGCGACTATAGGAGCAGTGCAGTAGGTCCTAGTGATTCTGAGAAAGATTGCTCCAGCAGCAGGCGGGATTCGGACACCCCGCAGGTCAGCTCGGTCACCCCGAGATTGGAATTCATCGCAGCGAGCGGAGACAGCGAGAGCGGCGGCAGTCATTCCCCATCGCCACGCGCTTCTCGAAGACGCCAGAGGGTTCGCAATCATTCCTTGACTTCCCTATGCATCATTTCGCACCATCCGTTCTTCTCAATGTTCCGGGAATGTCTTTTCGTCCTGAAGAAAATCATCGACGCGTGCAACGAGAGTTTCTCGCCGCAGAAGGTGGGAGCCTCTCGGCAGACCAACAGAGACACGGTGTGGAGCGTATTAACGGGTCAGGCTCTAGGGGACACGCCGTCCATCGTGCTTCACGACGTTCGCGAGATCGAGACATGGATACTTCGTTTGCTCAGCAGCCCCGTGCCCGTCCCGACAAAGACGCGCGTCGAAGTCGAGATAATATCGCCCAGTATGCAACCACCGCTATGCTTCGCCCTACCGGATCACACTAGATTCTCCCTGGTCGACTTTCCATTGCATTTACCGTTGGAGCTCCTCGGCGTCGACATATGTCTGAAGGTTCTCACGCTGATTCTCTTGGAGAATAAGATTGTACTTCAATCCCGTGATTACAACGCCTTGTCTATGTCGGTCATGGCGTTTGTCACGATGATCTATCCATTGGAGTACATGTTCCCCGCGATACCCTTGCTGCCCACCTGCATGAGTTGCGCGGAGCAACTGCTGCTCGCGCCGACGCCCTTCGTGATCGGGATCCCCGCGTCCTTCCTTATGTACAAGAAGAACTTCAGAATGCCCGACGATATCTGGCTGGTGGACTTGGATAGCAATAAAATAACTGCGCCGAGCGCTCTGAACGATGACGGTTTGCCGCCGCTACCGGAACCGGAGGGCACCATCCTGAAGAATCACCTGAGGCAGGCAATGCAACTGATGGATCAAGTTGGCTCTAGTGCGATGGCTAGCATGACGGGACCGCCATTGCCGTCGCAAGAAATCTCGCAACGTCTCTCTTTTCAAACACCGAGTAGGAGAGAAAGCATGGCGTCGCATCATTCCACCTTAAGCGTAGCTTCAACGAAGCACAGGCCGAGCATCGACCAGTGCGCGCACATTCAGCACTCCCCGCTTAATTCGCCAAGCGTGAGCTCGTCAGCGAGTCCACCTCGTCGGCCGTCGATGCCACAAACGGTTGGAGGAGCCGGGCTGACCGGTCCGCCAAGAGCGCCCGGACAGAGCCCGGCGCCTTTCAATCCCTTCATCTACGGAAATGACGTGGACTCGGTAGACATAGCCACGCGGGTCGCCATGGTGCGCTTCTTCAACTCGCAGAATCTGCTGGCCAACTTCACCGAGCACACGCGCACCCTGCGGCTGTATCCCCGGCCGGTGGTGGCTTTCCAGATCAATTCGTTCCTCCGTTCGCGGCCACGGAAGAGCAGCTTCCTCAACAGATTCGCGCGCACGCAGGCGGTCGAGTTCCTGGCCGAGTGGTCGCTCACGCCGAGCAACGTGGCCTTTCTCCGGGTGCAGACGGGAGTCTTCGATCCTGCACAGATCGGCGACAAGTCGCGCTGGTACGCGACCAACCTCGAGCCGATCT
ACTTTCCCGTCTGGGACTCCGGTAGTTCGTTGGCGAACGCCCTGAAGGCGATGAAGGAGCACGAGAGTCAGCCCACGGATGAGAGTGGATCGGATTCCGAGGGTGCCGAGAGCACCAGCTCTTCATATTCCTCTCTGAGCGACTTCGTCTCCGAAATGGCGTCGTCCGATTTGTCACCGGGTTACAATCCTCAAGTGAGCCAGCCCCAACAAACGCTCTCAGTGGATCCGAAGAACGTCTACAATCCGCCGAGCTCCTTGCAATATCCGGGAGTGGAAGAGGATTTACCAGCACGACCCGAGAGCCCACCAAGTACTTCTTCCAGTCACAGCGATCTCAGTAGCCCAAGCTTTAACAGGGACTCCGAGCTCGAATTGAACCCAAGAGTTCAAGAGGGTTCGCAGTCCGCTAACGATAAAGAGGAGGGTGGTAGCTTTGAGTCAGACTCCGCGTCGACAATAACACCGCGCACAATCCTGAGCGCACAAAGTTCGGTAGGACAGTTCACAGGGATAAGCATGGGCGCTTTAGGCACTCAATCTTCGCTCAACGACACTGAACGTCCTACCACCCCTCACAGGATCTCGCGCGTCAGTAGATATGTCACTCCTGTGCCACCCACCGGACCAGGTCTGCAACGTCAGCCGAGCGTAGGCAACGTTCTAGCGAGGGCCTCCAGCTTCAGCACCACCGGCGGGCCTCTTCTGCCGCGGCAGATAAGCGCGGTCACCGCTGCTGATCATCATCACGAAGCGACGCAGCTTCAGCGTCAAGCATCCGCGGGAGCGACGGTCGCGCAAAAGCAGAACGACGGCACGGTGCAACGACAGAACAGCGGCGGTTCCACCGGCGCCGCCACCGGGAACGGCGTTCTTCGACAAGGCTCTCAGGGTTCTCTGTTCGAGCAGATCGCCAGCCAGGCGAAGGATTTGGTGCGCGAAACGACCAGACAGAGCAGTCAGGACGGGCTGCTCGCGCACATGGACAAGCTCAAGCATCAGGCGAAGGAAAGAATTACGGAGGCAGGCGAGGATAGTCTGTTCGCGCCGCTGGAACAATTTACGCAACAAACTAAGAAAGCGGTAGGTGAGGCCACCAAGTCGGTGCAAGAGGTATCAAAGAACGCGTTGGAGGCGAGCAAAACGGCGGCGGGTGTAAGCAAGAATACGCTGGACGATTTGACGTACGTCGGCAAAAGCACATTTGGAGATCTGACAAAAAGTGCCAAAGAAGCTGCTGCGAAAAAAGGCTTCATCAAGAGTCTAGAATCACAATCGCCGGTACACTCTCCCTCCTCTTCTAATATGATGCAGCAGCGAAAGGATTCGATTAGCAATCAGTTAGTCGCATCGGACACACGAAGTGGTGTTGGCCGGGATTTCTTCAGCAATATTAGCAGCGATTTGAATGGCTTCGCTGCGCAAACCAGCAGTATGTTCAGCGATTTATTCGGTGGTAAAAATAATTCTAAAGGCAGTAGCTTCTTCCCGCAGAATCAGAAGTCGAAAGAAAAGACCAATCCGATTCTTCCACCATTTCCCAAAGTTGCAGGCAAAACAGGATTAGTAGAGCGTTCCTCGTTGATAAAACATTCCTCGCACAAAATTAATCAGGAAGATGCGCAGAGAATGCAAAACGCGGAACGTTCTAGTACAAATAGCGACAATCAAGCCTTTTTGAACGACGTGATAACGCAAGTGTTGGCCGGTGAAGGTGTTGGTTGGCTGAAATTGAATAGATTGAAAAAATTAATGGAAGATGAGAATTATCGTGATTTGGTCGTGAGAAAATTGAATAAAGGTCTCAATAGGAAGATTAGTCCTGATGATCACATTGACGATGTGGCCATATCAAAACCCGTGTATAAGGGAATGTTAAAGTGCCTTCAAGCAGTAACGCATGGTCTCGCACACACGTATAATAATTTCGGACTAGGCGGGATGGCTTCTGTCTTCCAACTGATGGAAATCGCTCACACGCATTATTGGAGCAAAGATCTG
TCGGCGGAGGGTGGTTTCGACAGCTCTTTGATGTCGCAGGCGTCTAGCCCGTTCGGTAGTAGAGAAAACTTGAAGTCCCCACAATCTCCGAATCAGTCTGAATTTACAGAAAGCGCGCAGAAATCAGAACTGCCGCAAGTGCATTTGGAAATGCCGCAAGCACCGTCAGCGGCGGAAACGACCCAGTCAACAACGGACATGTTCCTGGACATGTTTACGAAGAAAGGAAAATTTCTGAGCAAGCTTACCTCATTCGATTCGGAGAGTGGGCGGGGTGGTGGAACGGGGAGCAGCGAAGCTTTATCCACAGACGGAGGTAGCATTATCACTAATCCTGCTTTTCGGCAAGCGCACCAAGCTTCCTTCCGAAGCACCGTATCTGATAGCGAGGTCGAGCAAGGCAATTTTCCACGGCAAGGCAAGCAGCGCTCCGGCAGCGTTTGGTCCAGCAAGTCGTCCTTGAGTACGGGATTCCGTTATCACGGCGGAAGTTTGATACCCACCACGACGCTACCGAGTCCGGACGCTGCGAGAACATATCTCTTCGAAGGTTTACTGGGGAAGGAGAGATCGGGACTGTGGGACGAAATGCAATTCTGGGAGGACGCTTTCTTGGACGCTGTTTCGCAGGAACGCGATATGATGGGCATGGATCAGGGACCTGGCGAAATGGTGGAGAGATACAAAAGTTTAAGCGACAGCGAAAGGCGGCGGTTGGAGCACGAGGAGGACAGACTGCTGTGCACTTTGCTGCACAATCTCACCGCCATCCTGGTAATGTTGAACGTCGACAAGAACGAATTGAAGCGGAAGGTGCGCAGGTTGCTCGGCAAGAGTCACATCGGCCTCATCTACAGCCAAGAATTGAATCTACTTCTCGACCAGATAAACAATCTCCACGGAAACGACATCGATCTGAAGCCGCTGACGTCACGGCAAATGCACCGGCAGTCGTTCACTGTGCATTCGGGGGTCGACGCTGAGGGTGATCTACGATTTCTCGAAGTTCGCCACGACGGTCTCGTCCTGAGGTCGGTGAACGGCGTGATAGTCGAACGTTGGTGGTACGAGCGCGTAGTCAATATGACGTATAGCCCGAAGAATAAGGTTCTGTGCCTGTGGAGGAGGAGCGGCAGCGATACCGAGTTACATAAATATTACACCAAGAAGTGTAAAGATGTGTATTACTGCATAAAGGAAGCGATGGAGAAGGCGGCGGCTCGCGGGCGAGGCGCCAACGTGGGCTACGAGCTCGGCGGCGAGTTTCCGGTGCAGGACATGCGAACGGGCGAGGGCGGGCTCCTGCAGGTTTGCATGGAGGGCGTCGGTCTTCTCTTCGCGAATAGCAAGATCCTAAAACTAGACAAGTAATTCAACGTAAATATAAGTCACAAATGGCTGAAGAGGCGGTTCGTTGCTTGCATAGAATATTTTCCGTCGCATTTACTCTTCATAAGCTTCCATCGGAGACACAGAATAAACATAAGTGC\n>XM_001504059.5 PREDICTED: Equus caballus ALG2, alpha-1,3/1,6-mannosyltransferase (ALG2), mRNA 
\nTGCGCAGAATCCCCTGAGGGGATGGGGCGCAGGCGTGGCTTCCGGGCCATGGCGGAGAAGCAGGATCGGGACGAGGAGCCGGGTCCCAGCCCGTCGGTGCTGTTCCTGCACCCAGACCTGGGCGTGGGCGGCGCCGAGCGGCTGGTGCTCGACGCGGCGCTGGCGCTGCAGGCGCGCGGATGTAGCGTGAGGATCTGGACCGCGCACTACGACCCAGGCCACTGCTTCGCCGAGAGCCGCGAGCTGCCGGTGCGCTGCGCCGGGGACTGGCTGCCGCGCAGCCTGGGCTGGGGCGGCCGCGGCGCCGCCGTCTGTGCCTACGTGCGCATGATCTTCCTGGCGCTCTACGTGCTGTTCCTCGCCGACGAGGAGTTCGACGTGGTCGTGTGCGACCAGGTTTCTGCCTGTATCCCAGTGTTCAAACTGGCCAGACGGCGTAAGAAGATCCTCTTCTACTGTCACTTCCCGGATCTGCTTCTCACCAGAAGAGACTCTTTTCTTAAACGCCTGTACAGGGCCCCGATTGACTGGGTGGAGGAATACACCACAGGTATGGCAGACTGCGTCTTGGTCAATAGCCAGTTCACAGCTGCCGTTTTTAAGCAAACGTTCAAGTCCCTGTCTCACATAAAGCCCGATATCCTCTACCCATCTCTGAATGTCACCAGCTTTGACTCAGCTGTTCCTGAAAAACTTGATGACCTAGTGCCCGAGGGGAAAAAATTCCTGTTCCTCTCCATCAACAGATACGAAAGGAAGAAAAATCTGACTTTGGCACTGGAAGCCCTGGTAAAGCTGCGTGCGAGATTGACGTCCCGAGACTGGGACAAGGTCCATCTGATCGTGGCAGGTGGCTACGACGAGAGAGTCCTGGAGAACGTGGAACACTACCAGGAATTGAAGAAAATGGTCCAGCAGTCTGACCTTGGCCAGTCTGTGACCTTCCTGCGGTCTTTCTCAGACAAACAGAAGATCTCCCTCCTCCACGGCTGCACGTGTGTGCTTTACACACCAAGCAACGAGCACTTTGGCATCGTCCCTTTGGAGGCCATGTACATGCGGTGCCCGGTCATTGCTGTTAATTCCGGCGGGCCCTTGGAGTCCGTTGTCCACAGCGTCACAGGGTTTCTGTGTGAGCCCGACCCAGTGTGCTTCTCGGAAGCAATAGAAAGGTTCATCCGGGAACCTTCCTTAAAAGCCACCATGGGACTGGCTGGGAGAGCCAGGGTGAAGGAGAAATTCTCCTCTGAAGCGTTTACGGAACAGCTCTACCAATGTGTCACCAGGCTGCTGGTGTAATGGGATGTTTTTTAAGGTCTTTATGCTACATTCATTAATACCATCTTTGTAGATCGTGACTCAGTTTTGAAACCAAAAAGAGAAAAAACCTAGAATCTAATGCAGAAGGGATTAAAAAATATGCACTTGAATCTTGAACCTGAGCCACCTTCCTATATACCACAACTCCCTGTCTGCTTTTTCAGAAAAATAGTATCTTTTATGCTGTAATAATCCTGAGTCTCACCAGTGTTGATTAAGATATAAATATGGTACAGTTCCACGTTCAGCAGAATATTTTAATTATATTTTCTCTAGATTATTGTTGCTCTGCCTATGAATTTTGAGTCATATTGTGCCTTAATTGTTTTAATAATTTAAGTATATCATCATCAAAGTTGATTGTTTGGCTTCGTAATGAGAATAGGGTCCCTGTAGTTCCCAGAATCAATCCACCTGGGTGTTGACTGTCCTCTGTTAGGAATTTTGCTTAGTCATACCTTTGCCTGGATCCGTGGCAAGAGTGATCTTTATTTTTTTACAAATGTGATTTATTGTGTTTTCCCACACTAAGACAATAAAAGATGTTTATCATAGGAAGAGACAAAATTTTA\n>XM_004371625.3 PREDICTED: Trichechus manatus latirostris chromosome unknown C19orf12 homolog 
(LOC101348405), mRNA \nGTGAGCACAGACTCTGCCAGGCCCGTGTGTCCGGGGATTGCCCAAGCCAGCCAGCAGGCCACGGATGCCAGAGAGGCTAGACTTGCCTCATTTGTGAGGAAGTGTGGACATGTAGCCGGCTCCTCCTTAATCTGGTCAGAAATCAGAAGTGAATCTGAGAGCAAAGAAGACCTTGAATCTCTCTGCTGTTTCTGTTTGCTTGTTAACTAAATGCTGCCCCGGTTTCTCGGTGATAAAGGACTTTCCATAGGATGGAGGCTTTCTGACGTGGCCGTGGCAGGGCTGCTGCTCTCTGCAGAAAATGGGACCCCTCAGAACTTGAGGATGAGTCACATTTGGGTGGAAGGTCTTAAATCCATTAACACTTGCTCTTTGAACTTCTTCCTTTGAGGCCAGCCAAGATGCCTGTCGTGGTAGAGGACATCATGAAGCTGCTCTGCTCCATCTCCGGGGAGAGGAAGATGAGGGCAGCCGTGAAGCACTCTGGGAGGGGCGCCCTGGTCACAGGGGCTGTGGCCTTCGTTGGTGGTTTGGTTGGCGGCCCACCGGGACTAGCCGTCGGAGGGGCCGTCGGGGGCCTGTTAGGTGCCTGGATGACGAGTGGACAGTTTAAGCCAGTTCCTCAGATCATAATGGAGCTGCCCCCTGCCGAGCAGCAGAAGCTCTTCAACGAGGCGGCTGCCATCCTCAGGCACCTGGAGTGGACGGACGCCGTGCAGCTGACCGCGCTGGTCATGGGCAGTGAGGCCCTGCAGCGGCAGCTGCTGGCGATGCTGGTGAGCTACATCAGCAAGGAGCTGCGGGCAGAGATTCAGTACGACGACTAGGCCGCTCCTCCCAGGAAGCGGGGTTCACTCAGAGGATGCGGTAACTCGTCTAGAAGGAGGCCGGCGGCTTGGGGGCAGCTGAGCAGACCCCCCTGAGAATCCTCCACGTCGTCAGTGTATTCCCTTCACCTGGAGCTCAGTTTTCTGTTGGGGGGACTACGGTTGTGCCGTCTCCTGTTCTGGAAGTTACTCCGGAAGAAGATGTGTTCTGTGCTGTCCTGCACGGCATGCACTGATTATCCTGGGACTGGGAGGCTGGCGAGCGGCGGCGGTCAGCAGTGGGCATTGGGGCAGTTTTCCGAATGCTCTGCTGTCGGC\n>EU641276.1 Uncultured Burkholderiales bacterium clone GC1m-1-48 16S ribosomal RNA gene, partial sequence 
\nTGCAAGTCGAACGGTAGAGGGGGCAACCCCTTGAGAGTGGCGAACGGGTGAGTAATATATCGGAACGTGCCCAGTCGTGGGGGATAACGTAGTGAAAATTACGCTAATACCGCTTACGATCTAAGGATGAAAGCGGGGGATCGCAAGACCTCGCGCGACTGGAGCGGCCGATATCAGATTAGGTAGTTGGTAGGGTAAAGGCCTACCAAGCCAACGATCTGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGAAAGCCTGATCCAGCCATTCCGCGTGCAGGATGAAGGCCCTCGGGTTGTAAACTGCTTTTGTACAGAACGAAAAGGTTTCTATTAATACTAGGAGCTCATGACGGTACTGTAAGAATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTATATAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTTGAGACTGTATAGCTAGAGTACGGTAGAGGGGGATGGAATTCCGCGTGTAGCAGTGAAATGCGTAGATATGCGGAGGAACACCGATGGCGAAGGCAATCCCCTGGACCTGTACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCAACTGGTTGTTGGGTCTTAACTGACTCAGTAACGAAGCTAACGCGTGAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCG\n>XM_029869421.1 PREDICTED: Aedes albopictus transcription factor BYE1-like (LOC115265160), mRNA \nCGGCATCACTGGTTCACGAACAGGTAGTGAACTCGCCGATACAAAGAAACTAGCTGTCAACGCATAACGACAGAAGGTGTAGGTAGCAAACGTGAAACGTGGTGAAATGACGATTGATCTAATGTTTTGAGATGCTGCAAATGATTATATAATTTGTTATTGGGTGAAGGGAAATTCTTAAAAGTAAGTTTCGTATGTAATACCACAATTGTGAAACCAATTTAGTGTATTTTTCCTCAGAACTTGTAAATTACGCCGTACATATTCCTGCAAGTGAACTGTAGCAGTCTGAATTGTCAGAGTTCGATAGGTAACCTCAACTTAACCCTTATTGGAATACCCATTTGCTAATTCTATATTTATCTAAAAGGACGATAAATCCTCATAAGGGTTTGCTCAGGATAGACCGCGAATTTGAAGATTGTGAGAAGACTATCTTTTGAGCTTCGTTAGACAAAAAAGCTGCAAGGTGCTTCTACAATCCGAACACTCTCAAAAGATACCACTCGAATCGACTCTGATGGCTACAGTGAATCCACCTCACGGAGGCGCCGGTGACCACGACTGCGGGGCGTGCAACCTGCCTAACGATGCCGATCCGCAGATGGTACAGTGTGACGCCTGTCAAGTCTGGTACCATCTGAAGTGCGTCGGAGAGACTCCTGGTGTTGAAAACAGATCGTTCAACTGTCGTGCGTGTCAACCGCCTTCCAATGTCGGTAAGTCGAAGCCTAAGAAGACCAGATCGCAGAAGGGCGTAAGTGAAGGTCAACTGAAGGTTCCCGTCGCGTCTACATCTGGAGTGACACCGATAAAACACCCGGAAGTTCCCAAATGTGTTACGAACAAAGCGACAACAATCAAAACCACTTCGTCGACTTCGCGTTCTCGAGCTCTGACTCTGCAGAGGAGGATTGAAGCGGAGCAGCTTCTGGCGGAAATGAAGCTGGCTGAAGCAGAAAAGCAGCTTGAAGAAGATCGTCTAATGCAGGAAAGACAGCGAGCTCTGCGCGAAGAAAAGAT
TAGGCTGCAGGAAGATCTATTGCGGAAAATGCAGGAACTAGACGAGGTCGCCGACGCTGAGAGAGCTTCCGAATACACCAGCACCAGTGGAATGCGGAAAGCACGGGAATGGTTAGCGAAGCAACGACAGGAGAACCAACAGCAAGACGACAATGGTTCACACCGGTCAATACCACCGTTTCTACCTTCTAAGAAGTCGGAACGTAGCTCTCAAAAGTCGGTGGGACGCGAAGGATTCAATGCGCAAGGTGGGTCAGATCCCGATACATCCGATGATCCGGAAGGCCCTTCAGAAGAGCCGAATCCGCCGAATATGGACAGAAGAATGTCGTTGGAGAGGTCACCAGCGATGCAGATTACTGGAGAAATGCCGGTCAAGAATACGCTGCAACATCGGAAATTGCCGGGAACGTCATAA\n>XM_002072634.3 PREDICTED: Drosophila willistoni nuclear pore complex protein Nup88 (LOC6651485), mRNA \nGCAAATATTTGCACTGAGAAATATAAGGTAAATAATTTAAACTAAATTGTGTAAAACAATTTGCTACATATTCAGGTGGCAAGCCAGGTTTTCAGTCATTTTATCACATATATAAAAGGAAAAAGTTCTGAAAATAAACAAAGCTACCCGGTCTGCTTGAATATATTATCAGGCAAAATGGCAACTACTGATGTTTTGGGTCTAAATAAAACTGAGATATTTGCAAAAATCCGGGATGGCTTGCCCATTGTGCAAGAATCACAGAATCTCCTGGACTGCAAGGACGATCTTCTTTTCGCGTGGAACTCCAATGACTGCTCATTGCTGGTGAAAAATTGGCGCGCATCTTTGATGGAAGCAGACACAGTACCTGAATCAACTGCAACAAAGCAGAAGAAAATTACTTACCAGACGTTGATACCTTCTAGTACGCTTAGTCTGGACGTGGATCGTGTAGTGGCTTCCAATGAGTGCTCACTGGTGGCTTTGAGTGCGCCACGTGGTGTTTGTATCCTGGACTTGCCTCGTCGCTGGGGACCAGAAGGTTACTTTGATGGTGGAAAGGCGATTATCACCTGTCGCACATATAATCTGGACGGTCAGCTGTTTCAGAGTAATCCTCACTTGGAGGTGCGTCAGATTCGCTGGCATCCTAACTCCGTCTCCGACTCCATGCTGCTGATTCTGTTTAACAACAACACCATCCGGCTCTACAATCATTACAAGCTGATGCATGTGTGGCAAGTTGGTCCCACCATCGTGAGATCCGGGCTGAGAACCTCCGCCTTGGATTTTGGTGAGGCAGCAGTTGACTTTGATATAGCACCGCCTGTGAAATCCAAAAGAGATTTGACAGAAGAACTAGAAGAAAGTGTAAATTTAACAGATAATTCTCTTAAGCAGGACAAGATTGAGTGGCCTCTTGTACTTTTGCGGGAAAATGGAAACATTTATATACTCATGACTGAAATGAGTTCGGACAGAACCCGCCTCCAGGGACCCATTACGATAACCCCTCAGAAAAGGGACAACTATGGACTGGAGTCGTCGTCAATTATGGTCATCCCCTCTTTGCCACCCACTTTGGTTATTGGCGAGTCGAGTGGCAAACTGCATCATGCTCTTTTGCTAGAAGCAGCCACTCCCGAGCATTCGCTCAATGAAGTTGATGATTTTATCGTCATTGAGCCCTCCGAATATGTGATCCATGTGAGAGAGACTGTGGAATTAGAGTTGGGAATAAAATCCGGTACTTCGAAATCGAATTACAAGTCCCCTGTCTACTTAAAACGAGATGTTATCAATGAACTGCGGTACTTTGCATATCACAATGCTGGTCTTCATGTTGTCACCGTGAACTTCATATCCGAATTGCAGCGTTATCTGGAGAGTGAGGCAGAGGAGGACCAGCTGAATTTTACAACGCCCTCACGAGCTGAGTACATACTGTGCACTAAATTTGATTCTAGCGACCA
CATCAATGCAGTTTTTGGTATTGCTCTACTCCAAACTCCGGCTGGAGTTGTTGTTTTGCTGGGGAGTGGACAGGTAATTAGCCTCAAGCTGGTCGTCGATGCCCAACTGTTAGTTTCACCAAGTGAGCAAACTCTAACGACATCTTCTGTCGAGCAAGGAGAGGCTGGACAAACATTTCAGGACAAGATTAAAAGTATTTTGCAGCGTAGCGTCAATCAGCCCATATTAGCTGATAAGCCCTCCTCCAACGCCAACGAGGGTTACGAGTTGCTTAGCCAAGCCATTGTCGTGCTGCGTTCACAGTACCTCAAACGTCATGAACTGGTGCTTGTCGAGTTTGCTAAGCACATTAATCAAATTCGCATAAAAAGAGATCAACAATTGCAAGAGATTCAGGACCTAGAGGACGAGCGGGAGGTGATTAGTGAGCGTGCTCACAAACTTGCTGAACGTTTTGAGGAAATAAGCGATAATCAGGATTGGCTTGTCCGCAAATGCCATAGACTCCTACAAAATGCCAATACTGCTCTGCCAAACAGCGTTGTGGCTGAACGTGAATTCGCTCAACAGGTGGCAAACATTAATAAGGCTAACAAAAAAATTGCTGCTGCCTTGGAAGATGCCAAGAAGACCATGAACAAACAGCGTTATTTCATAGCCAAAAACCAAGACGAGGTCCGTCAAAATGCATTCGAGTTGCCGGAGAAACAAAATCGGACCATAACCGAGATTCTAATGCAATTGGCCAGTGAAATAGATCGACAGGTCACTGATGTGAAGCGTATAAATAAGATTATTGGTATTTAAATAAATGGCTCTTGCTCATCTTAATTAGAA\n>HQ071684.1 Uncultured Leptolinea sp. clone F5OHPNU07IB2R6 16S ribosomal RNA gene, partial sequence \nGCACAAGCAGCGGAGCGTGTGGTTTAATTCGATGCTACACGAAGAACCTTACCAGGGTTTGACATGCAAGTGGTAGGAACCGAAAGGCGACGACCTTCGGGGAGCTTGCACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTCGGTTAAGTCCGCTAACGAGCGCAACCCTCGCTGTGTGTTACAAGTGTCACACGGTACTGCCGGTCTTAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCAGCATGGCCTTTATGTCCTGGGCTACACACACGCTACAATGGCCAACACAATAGGTTGCTAAGCCGCGAGGTGGAGCCAATCCTCAAAGTTGGTCCCAGTTCAGATTGCAGGCTGCAACCCGCCTGCATGAAGTCGGAATCGCTAGTAATCGCAGGTCAGCATACTGCGGTGAATACGTTCCCGGGCCTT\n>XM_022591717.2 PREDICTED: Delphinapterus leucas TATA-box binding protein associated factor 6 like (TAF6L), transcript variant X3, mRNA 
\nGTAGAGGGCGGAGTCTGAGCGCCGAGAGAGGGAATTAGTGCGAGCTGAGTGAGAGGGCGCCAGCGCCGCCGCCACCACCGTCGCCGTCACAGATACCGCCGTCCCGGTAACCGCCTTCGCCGTGCCGGAGCCCTCAGGTGGAGAAAGAAGCTTGACAATTATCCGTTGGCGGCTTTCCAACGCCTCGTTTCCTGGCTGGGAATCCAGGCCTTGTTCCCCACACAGCCCGTCGCTCCTCATGATTAGAACGATAGTTGAGTTCTTGCTCCCTACCCAGCAAGTGTTTATTGAGGGCGTGTTATGTGCAGACGCAGTGCCTGACGCGGGGGATGCAAAGTTCCATCGGGGCCATGTCGGAGCGAGAAGAGCGGCGGTTCGTGGAGATCCCTCGGGAGTCTGTCCGGCTCATGGCAGAGAGCACAGGCCTGGAGCTGAGTGATGAGGTGGCGGCCCTGCTCGCAGAGGACGTGTGCTACCGTCTCAGAGAGGCCACCCAGAATAGCTCTCAATTCATGAAACATACCAAACGGCGGAAGCTGACTGTCGAGGATTTCAACCGGGCCCTCAGATGGAGCAGTGTGGAGGCTGTGTGTGGTTATGGGTCCCAGGAGGTGCTGCCCCTGCGCCCTGCCAGGGAGGGTGAGCTCTACTTCCCCGAGGACCGAGAGGTGAACCTGGTGGAGCTGGCCCTGGCCACCAACATCCCCAAAGGCTGCGCCGAGACAGCTGTGAGAGTTCATGTCTCCTACCTAGATGGCAAAGGGAACCTGGCCCCTCAAGGATCGGTGCCCAGTGCTGTGTCTTCACTGACTGATGACCTTCTCAAGTACTACCAGCAAGTGACTCGGGCTGTGCTGGGGGATGATCCACAGCTGATGAAGGTCGCCCTCCAGGACTTGCAGACCAACTCGAAGATTGCAGCGCTCCTGCCGTACTTTGTTTATGTGGTCAGTGGGGTGAAATCTGTAAGCCACGACCTGGAGCAGCTACACCGGCTCTTGCAAGTGGCACGGAGCCTAGTTCGGAACCCACACCTCTGCCTGGGGCCCTATGTCCGCTCCCTGGTAGGCAGTGTCCTCTACTGTGTCCTGGAGCCACTGGCTGCCTCCATCAACCCGCTGAATGACCACTGGACTCTGCGGGATGGAGCTGCCCTCCTGCTCAGTCACATCTTCTGGACTCATGGGGACCTTGTAAGTGGCCTCTATCAGCAGATCCTGCTCTCCCTGCAGAAGGTCTTGGCAGATCCTGTGAGGCCTCTCTGCTCTCACTACGGGGCTGTGGTGGGGCTGCACGCCCTTGGCTGGAAGGCAGTAGAGCGAGTCCTGTACCCACACCTGTCCACTTACTGGACAAATTTGCAGGCTGTGCTAGATGATTATTCAGTATCGAATGCCCAGGTTAAAGCAGATGGGCACAAAGTCTATGGAGCCATTCTGGTGGCCGTAGAACGACTGCTGAAGAGGAAGGCCCAGGCAGCAGAGCCCAACAAGGGTGGGCCAGGCAGCAGGGGCTGCCGCCGCTCAGACGACCTGCCCTGGGACAGCCTTCTCCTGCAGGAGTCTCCCTCCGGGGGCAGCGCAGAGCCCGGCTTTGGGTCTGGTCTCCCGCTGCCGCCAGGAGGCGCGGGGCCGGAGGCTCCTTCCCCTTCGGTGACCCTGGCGGACATCTACCGGGAGCTCTACGCCTTCTTCGGTGACAGCTTGGCCACCCGCTTTGGCACGGGTCAGCCCGCGCCCACGGCCCCGCGGCCGCCTGGGGACAAGAAGGAGCCGGCGGCCGCCCCGGACTCGGTGCGGAAGATGCCGCAGCTGACCGCCAACGCCATGGTCAGCCCGCAGGGCGACGAGAGCCCCCGGGGCGGAGGCCCCCCGTCGGCCTCTGCCCCCACCGCCTCTGAGAGCAGGCCGCTGCCGCGCGTGCACCGGGCGCGGGGGGCGCCCCGGCAGCAGGGCCCGGGCGCCGGCACCCGCGACGTCTTCCAGAAGAGCCGTTTCG
CCCCGCGCGGTGCCCCTCACTTCCGTTTCATCATCGCCGGGCGGCAAGCAGGGAGGCGATGCCGCGGGCGCCTCTTCCAGACTGCCTTCCCCGCGCCGTACGGGCCCAGCCCGGCCTCCCGTTACGTGCAGAAGCTGCCCATGATCGGCCGCACCGGCCGCCCGGCCCGCCGCTGGGCGCTCTCGGACTACTCGCTGTACCTGCCGCTGTGAGGCGGCACTGGCCTCTGTGAATAAATCCCGCGCCCGGAAGTGA\n>HQ278360.1 Uncultured bacterium clone CB6AA43 16S ribosomal RNA gene, partial sequence\u0001HQ278363.1 Uncultured bacterium clone CB6AA69 16S ribosomal RNA gene, partial sequence \nAAGACCTCACGTTATTGGAGTGGCCTACGGCTGATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCGACGATCAGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGGGCAACCCTGATCCAGCCATTCCGCGTGAGTGAAGAAGGCCTTCGGGTTGTAAAGCTCTTTCAGCAGGGAAGAAACGGTTACGGCTAATACCTGTGACTAATGACGGTACCTGCAGAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTTTGTAAGTCAGATGTGAAAGCCCCGGGCTCAACCTGGGAATT\n>XM_798046.1 Trypanosoma cruzi uncharacterized protein (Tc00.1047053503983.29), partial mRNA \nATGTACGCAGGTCTCTTTAAGAAGCGGCCACGTGAAGCCGATGCAGCTTCCCACGGGAACGCACCGGAAGACAGTGGGGATGCATCGAGCAGGGCCGCCGGCATCTCGTCACCCACGCTGTCTCCCCGCACTGTGTACCACTATCCCTCGATGCTGCCATTCCCAACGGTGATAGATTCTGAATTTCCCGCTGAGTCGTATCGTTCCCGCAGCAAAGACGTAAAGGCGGCTATTCATTGGGGCCAGCGGAAACTCTTACTTTCTGAGATTCAGCTCCTCTCCATATATGCTCGGCCGAATGTGTCTTATCACATTGTCTACGCAGGGTCAGCCCCCGGAACTCATCTTGCATTTCTTGACGAACTGTTTCAGAGTCGACACACCTGGGAACTTGTGGATCCGGGAAGATTTGATCGGCCCGTGCTGGAGTCACGACCGAATTTTTCTCTTCGTAACGAATTTTTTACAAACGTGACAGCCTATGGCATTAATGCGCGCCGTCTTTTGGAGGTGCTTCCTGGGCTGGGAACCGTTTACCGTTGTGTTGCCCTGGACGGTGCGTGGTCAACAAAGAAGGAAATCCACCAAAAGCTTCAGAGCATCGTTGGAACGATTGATGTGGCCCGTGGCACGGAAGATATCCCATCCATGTACGAACCGCGGTTGGATCTTCCCTTTGGCTTTGAGCTTCTTTGCTACGTTGGTATGGAGCGAAGCAAGCC\n>XM_038047407.1 PREDICTED: Hermetia illucens small conductance calcium-activated potassium channel protein (LOC119646808), transcript variant X7, mRNA 
\nGTTGTTGTTCCTGCTTTTGGAAGGGTATTGTACGTATAGATACTATCAATGCGGCGTCGTCGTCGTAGTTGCCGAAATATCTAAAAGAATGCTTACGGACAACAGTCGGACGTCGGACTCGGATATCGTGTGTGAGTTTCGCTTAGGATAGGACTTCAGAGGAGTGTTGCTTTGGGTCCTTTCACTACTTTCTAGTGTGTTTTCGACCAGAAAGGAACGTATGTGTCGTGTGCGTGGTGATTGCTGTGGCCCTGCTGTTGACTATATATACTTCCTGTCGATTTGCAAGTTCTTACGCCTTTAGTCTATGTCGGGATACCCACCTTGGAGGAAACGTTGTGCTTATTTTTCCTCTCGGTTTCTATAAAAATATATTATTATGTTCACACACGCTACACATGCCAGATCATTATAGCGCACGCAATTTTCTTGATTCAAGTTTCGATTTTGTTTGTCGTTTCGTTTATACCGATGCTCCGACTTTTCATTCTCAAACTGTAACAGAGCTTATCGCGACGTCGTGACATCCATAGGGAACAGCTATTTTCTGAATAGTTTCTTCTTTGATTTTGCCATCATTCCGGTAGAGGCAGAATCGCAATTTAAATAGCTTTCGTTTGGATCCCTTCTATCTTTCAGTGTATTATGCGCGAAACTAAAATTTTCGGTTCGCTTTCTTGATACAGATCCATTCAATTGGGGAGCAGAATTTGAGAGCATCTCCTCGGAGGAGATAGTGATTGAATTATTCGATTCGATTTCGAGACTCGTGTGAGAGGGATAATAAATAGAAAATCTTTAGATATTGTCGTTGCTAAGAAATTGGTATCTGTCGTCGTTACTGTGAATGTGTCGTCGATTTTGGTCTCTTCAAAAGACACAAACTTTGGGGATGTTGTCCGGCAAGTGAATATAAACGAATAACATGCAGTGTGTGGTTTTTCGAAAGATTTTCGAAGTCGTATCCGAAACGTCGGATTCGTAGTCAGCAAATCTTGAGAATACGAAGCAATCAAATCCTTGCCCAAGTCGGTGCCGGATTTTCAGATGGATTTTCGTGCGGTTTGATTTTTCGGGGTGGTTGCTTGGGACTTTTAACCTTTTTATTCCGTACCCAAGTGTCGAGTGTCTTATCAGTGTCCAAACAAAATCTCTTAGTCCTCATTTATTGTGATTTCCCATTCATTTTGTTACATATATATTATATAGGAAGAAAAAGTAATTTTAGGGTGTGTGCGATTACGACGTGTAAAATTTTCAGAAATATACAGTGTTCGTATAATAGCTAGAAATAAAGAAGTCAAAGCAGCGCAGACGGATAAAAACTAAAGTTGAAAATTAAAAATATACCCCCAAAAAGTGTCACGTATCTGTGCCGTATCAGATCGCTACTGTAGTGCGCTTTTAGCAGCCGATTTCTAAAATTATTCGGCAAGAATAAATGCAAAGCAGATTGAATCCTAATCCATCCTTTCATTCCCTTTCCGTGCCGCTTTCAATTCCACTCCGATTCGCACGTATTTGCCGCTCCTAACGCCTTGCTCTTTCCCTGTATCCAACCCTCATCAGTGGTTTGGAATGTGGAGAAGTGCTCTTTTGATTAATTAGCAAGCAAAACTACTCTACGCGCCGTATTCATGACATCCATGATATCCCGCCGTCGACGAGTCAAAAGCCCATGTCCTCTTCATCGTTACCAGGACAAGAAACTATTAGACGAGGGTGTGTTCCATAGAATCACGACACGGCAAGCAAAGGGCATACCCTCAGGATTTCATAGTTGTGAATAAACAAATCGACGTCATAGAAATCACAGATGCGAAAAATATCAAGCCAAATGATAGATTTTGTGCAAAGACGCGAAAGCGTAGCCACAGCAGAAGTACTTCCAAAAAGGAATTCTAGATGAACGGGCGTGCCGAGAAAACAAGGAAAAGTCAGAATGACAGCGGAAGAAAAATCAGCAGCTGCGTCTTTCTAAATGCTTCTTTTGTGTTG
TGTGTCCTACACCATAATTTTTCGGTCGTGCATCATTAAAACCCAAGAATACAAATGCCATCTTCGTCAATAAGACTTGGCTTAAATAATTGAGCAGCGTTTACTCAATGAATGACGGCAAAAATGCATTTAGCTTAGCGACTTTCCGTTCACTTTTCCAACTCAGTTCGATTGTACATACTTACGAGTATGAACAGATGGATACAGATAGATACGCAAACTGACAGCCACATAGACTGATTGAAAACATCATGTGAGAGCTTTGTGCCTTCTCTGTGCGAGTCCTGTTCACCCGTATCCGTATATGTACGTATACACGCAATTCAAGCGGACAAATAACGTGGATCAATCGATTTTCTATTCCTTCCGAACAGATATCCTTTTGTCTTTGGCAAAATAAAAATATCAAGGAAAGGAAACCGAAGGGCAGTCAAGGAAAAAATAAGAAGAAAACAGTACCTCGCTTTTCCTTCAACGACAGAAAACCCAACACGCGGTTATAACGGAACTAAGCATACATTGCGTATGTACTATCTTGCTGATAACCCTTCTCAATGCCACAAAAAAATTCTACTTAAAGTTAATCGCCAGCGGGCCTGCATAATACTCAACTTCTATATACATAGTCTGTTCAATTAGTGATAAATCCCGCGATTTGTATTTCTGAATTTCGGTGTTGATACCAAGTAGTATGTGAGTATGAAATCCTCAGAATGAACGCTTAACGACTGACTGGCTTCAACCAGCGTGACTAAGGACATGAAGACGAAGGTCGTCTGCCTTTTTTGTGATATCAGCTAATCCCCCGCAATTCAAACCCAACAAAAACCATTAAAAACGACAACGCGACCAAATCTTAATTTGATTTAATAAAATTGCTTTAATTTCGAGTATTAAATAAAGACCTAATTCGTAAAATTATGGAGTTGACGTCAATAACGAACTATTCAAAATATGACGGGAAAAATGAAATGCGGCAATATCTCAATATAAATACCAAGCAAAGGTTTGGATTTGCTGCCGTGTCTGCTGCTAGTTGTTCCGGACTACGATTCAAAATTCAAATCTCAACGGTCAATGAGCTGACGTAGAGATTGTGAGCGTGAGTGTTTCAATCGCCATCAATCTGTATGTGCAGCTCCGAAAACCGGTGTCCACGTTGTCGATTCCTGGCTCGATGAAAACACCCTGCGCTGGAAATCGAGAACAAATTTCGTCTGCATGCAACGAAGAAGCTGGCGTTGCACTCGTGGGTGTTCACTCAGAATATCCCAGGTACATGGAGGAGCGAGGATTGACCGGCGTCAAAGCACCTGGAGCTGGTTCAACACCGGGAACTCAGAAACATAAGCCGAATGTTGGCTATCGATTAGGTCGAAGAAAAGCTTTATTTGAGAAAAGAAAACGAATAAGTGATTACGCTCTTGTAATGGGTATGTTTGGAATTATCGTAATGGTTATAGAAAACGAATTAAGTAGCGCTGGAGTTTATTTAAAGTCTTCGTTTCATTCGACAGCCTTGAAAACATTAATATCCGTGTCGACTGTGATCCTTTTAGGTCTTATTGTTGCTTACCATGCTCTGGAAGTTCAGTTATTTATGATCGACAATTGTGCAGATGATTGGCGAATCGCTATGACGTGGCAACGAATTAGTCAAATAGGTCTAGAACTTTTAATATGTGCTGTGCATCCAATACCAGGCGAATATTACTTCCTCTGGACAACAAAACTTGCTAATAAAAATAAATCAATGGGCACGGAGTTGGTGCCGTATGATGTTGCATTATCATTGCCAATGTTCCTTCGATTATATCTAATATGTCGTGTTATGTTGCTACATTCAAAATTATTCACAGACGCCTCATCACGTAGCATAGGTGCACTAAATCGTATAAATTTTAATACCAGATTTGTCCTTAAAACACTAATGACAATATGTCCGGGAACAGTTTTATTAGTTTTTATGGTATCTCTATGGATTATCGCCTCATGGACGC
TGCGACAGTGTGAAAGGTTTCACGATGAAGAACATGCAAACCTTTTGAATGCCATGTGGCTTATAGCCATAACATTTTTAAGTGTTGGGTTTGGTGATATTGTACCAAATACTTATTGTGGTCGTGGTATTGCGGTCAGCACAGGAATTATGGGAGCTGGATGCACTGCTTTGCTGGTAGCTGTTGTGTCTCGGAAGTTAGAGCTATCCCGGGCTGAAAAACATGTTCATAACTTTATGATGGATACCCAGCTAACAAAAAGGCTAAAAAATGCGGCAGCGAATGTGTTGCGAGAAACATGGCTGATATATAAACACACAAGGCTGGTGAAAAGAGTTAACCCTGGACGAGTGCGGACGCATCAGAGGAAATTCCTTCTAGCAATTTATGCATTACGAAAAGTAAAAATGGATCAACGAAAACTTATGGATAATGCAAATACAATAACCGATATGGCCAAAACACAAAATACGGTGTACGAGATTATCTCGGATATGTCAACAAGGCAGGATGCGATTGAGGAAAGACTATCAAGTTTAGAGGACAAAATGCAGGCGTTGCAGGATCATATGGAGTCATTACCGGAGATAGTCACACGGTGTCTCACTCAACATCAAGAACGGTTGGAACAGCGGAGAAATTTTCTGCATCCGGATGCTGCAGTAACAGCGTCTGCACAACCGTCGCAGCCGCCACCTCTAGTTTCACCTTTACTCTTTCCACATTCCAGGAGTGTACCATCTACAAACAATGCAATTTTCCAATGGCCAACAAGTCCAATTCTGCCACCGGTATCGAGTAGAACGCCTCATTTGGTGCCTGACACATATATTCCATCGACTTTAGCTGCGACGGCGACACCAGCTGCAGCCACAAGTTCAACCTCTCTAACAAATAATAATAACGTTAACACATCTTCCAGTAAATTAAACAGCTGAATCGAACCTGCACAAACTCAACAAACGCATTCTATGGTGTGTCCGGCGTCAACCTCAATCACGACGGCCAGCAACAAATACACGAGACGGAGGGAACGACAACGAAAAGCCCAGTTCAGAGCAATGGCAACAACATCAACAGAAGCAACAGCAACATCAACAGAAACATCAAAATCACATAGTAACTCATTAGAAGACATTTTTACGCAACAAGGCAACTCGTGAGAAAATAATGATAGTAGAAAAATTGAATAGTGACGATTTTACTATGTAATGGGAATAAATTATTATTACTATTATATAAAGACTAGGAAATGAAGCAACTAAGAAATAAGTAAGCAAAAAGACATAGGCCAATTTCTAAGGTTCTAGAAAAGTAATAATCAATTGAGACGGGGGAGAAAATATGAATAAAATTCGTGAATTTAGGGTGTAAATCATTGGAATAAATTTTGATAAGAAGGAACTCGTTTTGTTGTTTGAGTATTACGGTTATTTAGTTTTTAATTATGTCACATTTTCCAGTCCCTTAGAAACTACAGAAAAATTCTCATCTGATATACCAAGTGAAAGAAAATATTGAGTCAAATTCTCCCTTAGAGAACTGACCCGTTGATCAGGGCTGCATGTGCACTTCTTGGCAAACACATTTGACCAAATAAAAGTTTTTCCTCTAGCAAATTGTTTAGTATCCAAGTCACACATCAATAGGAAAAAAGTGATATTTTGCCGTTTTAGTGATTTTAAAATTCAGCCCTTATAATGCGGAGGACCCAACGGAATTTACTTAGTATTTTCTGTTACTGGTCATTCAGTAATATTACTCAAAGTAGAAACGAACCACAAAAGTACGCAAATTAGTAACATAGAGACTAGATTTTAAAAAAACGTACTTTTAATTTTCTTTAAAAATATTCGAAACTATGGGGCCCACTTTAATAGTCATTCGAGCGAATAACGGAAGACAAATAATCGAAATTAAAAACAACCTGATTGCTTGGATTTAGATCTTAACCGGTTTCAATATCATCAAAAAAACAACCACTCAAGAAATCCTCTTCA
ACCTCCGGATGAAATGAGCAACTGAACATTATGTTGAACAATAAAAGAAAGCTTTACGACAAAATAGAAACATCAATAACTTCATAGACTTCATACCTAAGACGAAACAAGCTTACGATATTAAAGCCACAAATTATAAATGATAAGAAAATCTCGAAACGAAAAAGTGAACCACTACCAAAGTGAAGTTATGTAACGAAGATAGGAAATGACAAAACCCTATAGAAATGTAGAAACAATTATTTCATCTTTAGTATCTCTTAGACCATTCATTTTCTACGAAGTCAAGGACGAAATTGTTTTAAGTGAATTAAGAACCCTTTTAGTGTATTCATTTCGTTCTATGTAATTACTAAAAAGCGTGTTTCGCGAAAAAGCTTTAAGATTTAGGGTGCCTGCATTTGCTAAGAAAAAACTTAGATTTAAAGAGAATATTACTTATTATTATTAAAATTATTATTATCACATGATGGTAGTAAGAACAAGTAACATTAGTAGAAAAATAAACCCTTGCGGAAGTAGGTCATGCATATTATGTAACATATGTTTTGTTTATGTTTGAATCGGTACATTCAAACTCAATTTGTCCAAAAATATAAAAGTTTCGACAGATCGTTTTTACTTTTGTTAGAAAAGGTTTTACGTGTGTTGCTGAATAAAATTGAATAGAATATACGGAAAAGTCTATTGTACAAATTTAGTTTATATAAAGTTGTTGCAATTATACATAAAAGAGCAAGAAAGATAAAAGTCTAAACCAAAATTGATTTTCAAAGTTAAGGACAATTTAAAAGTATTCGCATATTTACCTATATACAAAACATATTACAACAACTATTAAGAAATTATACAAAAACAACAAAAACCTAAAAAACCATCCCTCAAAGAAATTAAAAGGAATTTAAAAAGGATCAAAACGGTATCTAAGCGTAAAATAATTGAAGAAAATCCATACTAGTCTGTTTTATTATGAATTACATAAAATACGGATGAATAATTATGAACATTCTTTGAAATGTATAAATTTCGATCTTAAAAGTAACAAACGAACACACCAATTTGAACGTATCTTGCAATAGTCGTCCATTTCATTCAGCCATTGTATTATATATTTAAAGATATATATATATGTCTAAAACAAATTTATAGATAAAAAAGTGAATTGATAAAACTCAACTAAAATTAAATTTAAACCTGTGAATCATAGAAAACCCGAAAGTATGTGGATTAAATTATGGTCTTATAAAAAATATTTAAAGCAAATATATAAAAATTAAACTTTAAAGAAAATCTGCTCACATGCGCTAAGTACTAATATGATAAAGTTTAAATCTAAAAAATTAATAAATTTTAAATTATCTCAACATTCAATACAGTAAATTTATGGGTACGACATAAGGCTGAAGTGTAGGAATAAATAAAATCGAGAATGGAAGACTATTGCAACTGTATTGTCACCTTGTTATATTTTGGCTCTCCTGATAAAGAAAATAAAAAAGAAATTACGAAATCACTAAAAAGAGAAAGATAAAAACCCTAATCTAGTTATTATTATTATATAGAGAGAGAATCGTTATTTCGCAACATTAATATAAAAATATTTATTGTAAATTGTTCTGTTTTGTATGATATAATCATGTATATTTAGTTTACAATTAAATACGTTTTCTGCA\n>XR_007117108.1 PREDICTED: Pieris napi uncharacterized LOC125050190 (LOC125050190), ncRNA 
\nCCCAACCAACATTTTGGCGCTAATTTTCACCACTCTAATCGTTTGTATTGTTTTAACGGGTATATAAAAGTGTCTAGTAAAACTTTTGTTGGTTTAATGGTCATGAATATAACTAAATAACTCATTAAGATGAGTAACAGTAACAATAATTCATAATATAACTTAAGAAGTTATAAAAGAGTTAAGCTGAACCACAGTAACGCTAGGTGTTGTAACCTCAAGTAACAATAAGTACCTCAAGTAGTAATAAGGTTTCTAGTAAGTCTTACTATTCCCAAGTGTTGTTTAAGAGTGCTAAGTAAATGTTTTTTACCACTTAGCTTGCCTAAAAACGTAATATTACTTAAGAAGGTATGAAGGTTATAGTCACAACCATCATAGAACTTACTCTTATATAAATTCAAGTAACGCGAAACACTTAAAGTAATATTATAGTTTCTAATAACTCTTTCTACCGACAAAAGCTCTTGAAAATAGTTGACAAAATATTTTTATCACCTAAATTGCTACAAAAGAAGTAATTGGAACTTATTTACAGCAATTTAATTTAGAAATTAGAAACCACTATATATGATATTAGTTGGTATTATGGAGTTATTTTTAGAGCCCTGTTCTTTACAACGGTGTTCGAATTTACCTTTATGTTATTCTAAGAAATATGAAAATACAATTTAAACGTTGTAACTTTTATTTTCACTTGAAGTTATAAAATATTACCTACTTTATAGCTGTATAATGTCTCTAACCTCAAAATTGTGTATAGTCTGATTTGCTCTGAAGTCTGTTTGCTCTTGCTTGCTTAATTTTTGCTATGAGTTCGTGGAAAAAACGAAAAAGATGTGGAGGAGTCAAAAGAAAAATATCAAACGAATACAAATTAATAATCAGATCAAATCAATCAGTGTCATCCTGCGATAAAACCACCAAACTGCAAACAGTGACCAGTATCAGTGATGCAGTTCAGCATCATAGTTCTTCGTTGAAGAGAAGTATTGATGACGCTAGTCTGGGTTGTAGTAGTTTTTGCAACGAATATTTTCATCCAGCGCAGCTTAAATGTCAACGAAAATGTTCGTACTGTCGTAGAAACTCCATCGAAAATGTCGGTCAAGTGCGGGAATTTCAACAAGGACTAGAAAATCATAATATGTATGTGAGCAGTAAACATGGTGAAACGCAAGATATTGAACAGGGTTCTGTAAGTGAGCATTTTATAATTTCTTGTAAAGAGAGGAATAAATATTTTCTATCATCAACTGATGATATTATTGAAGTCCTAAATATATCAATTATATCGACAATGACAAATAGAGAAACTATTATGATACAAATAGGAGGAGATGCTATCGAATATGTAGATCACTACGTATATTTAGGGCAAATAATATAATTTCATGACCAAAGGGATCTTGAGATAGAAAGAAGAGTGTCTAGCGCCTGGAAGAGATTTTGGTCACTCAAGGAAGTACTTAAAAGTAAAGACTTCCCAATAGTAGCTAAGAAAAAGGTGTTCAATCTATGTATACTACCATGTGTTACATACGGCTGCGAGACTTGGGCTTTATCTCAGAAACATCTTCTAAAGTTGAGAACATGCCAAAGAGGAATGGAAAGAAGCATGGTGGGTGTAACACTGAGACATCGAAAAAGAGCAGAAGAGATCAGATCAACGACCAAAGTAGAAGACATTATAAAGAAAATAAGGCAGTTGAAATGGCGCTGGACTGGGTACATGACGAGAGATAGCAGGTTGAAATGGACAAAAATAATTACAGAATGGCAACCACGTGATG\n>XM_017443506.2 PREDICTED: Diaphorina citri phospholipase A2-like (LOC103507865), mRNA 
\nTTTTACTCGTCACCATGAAGTCTATCCGGGCTCTCCCTGTGAGTGTTTTACTCATCTTTGTATTCATCTCCTCTGTTCGTAGCTTTGATCAGTCCTACTATAAAAACGCGTATAATCACAACAAGTACAATTACTTGAAGGGAAATAACAATAACAAGTATAGTAACTTCAATTCCAACCAGGACAGTTACCGATCCGACAAGAGTGACTTGATCTTCCCTGGAACCAAATGGTGCGGTGCAGGAGACATTGCCACCGACTACAATGACCTAGGAACCAATGTAGAGACAGACAAGTGCTGTCGAGACCATGACCATTGCTCGGAATACATCTTGGCGAAGAGTTCTCTCCATGGACTGCGAAACAACGCACCCTTTACCCGAGTTCACTGCAGATGTGACAAGAAGTTCTACGACTGTTTAAAGACGGCGGCTGACACGGGAGATCAACCTTCCCAGATGGTGGGATACATGTATTTCAATTTACTAGAGACCCAGTGCTTCCAGGAAGTGTCACTGCTGTTATTTTAA\n>XM_002502056.1 Micromonas commoda predicted protein partial mRNA \nATCCCGGGCCAGGCGGACACCGAGGCCATCACCGCCGTCGCCTTCAGCCAGTGCAAGAGCTACGTGGCCGTCGCGGAACGCGCGGAGAGGGGTGTCATCACCGTTTACGATCTCACCACGACGACGGGCTCGCCCAGGAAGCGCGTGCTCGCGTCCACCGACGTCGGGTCCAAGGAGTACGTGAGCGTCGCCTTCTCCCCCGACGGCAAGTGGGTCATCGCGCAGGGCGGCGCCCCCGAATGGAACGTGACGCTGTGGAACTGGGAGCGGTGCAAGCAGCTCGCGTGCGTGCCTGCCAAGCCGCTCGGATCGGACGCGGGCGCCGTTCGCCAGGTGAGATTCGCCGCGCACGACCCCGGTCTGGCGTCGTGCGCGGGCGAGGGCCTCTTCCGCACGTTCAAGTGCGCGGAATCCGGGGTCAGGGCGCTTCCGGATGTTAAGCTCCCGCCCGCCAAGTCGGGCGCGATTAAGAATTACACGGCGCACTGTTGGCTTCCCGACGACGCCGAGGTGACGGACGGCGGGGAGGAGGGAGCCGAGCGCCGCGAGCGGTGCATCCTGGCGACGGACGGCGGGGAGTTGCTGGTCGTCGAGCTCAACGAGGTCAAGGCGACGATACCGGCTTTGAGCGACTGGAAGGGTGTCGACTGCGTGATTCCCTACGGCGCCGGCGGGTTTGTGTGCGGCGGCGCGGACGGGACCGTGAGCGTCTACGAAAAGACGGACGAGAAGGAGCTCTACAAGCGCGTGAAGCACTTCGTGATCAAGCAGTCGCCCGGCGCGAGGGTGACGGCGCTCGCGCTATCCCCGACGGACGAGACTTTGCTGTGCTCCACCGACGATAACCAGATGTACGAGGTTGACATGTCCAACGTCGACGTCGTGAAGAGCGAGGACATCGAGTGCCAACTGTTCACGCAGGGGCACCACACGCAGGGCGTGACGGGCGTGGATCTGTGCGTGCGTAAGCCGCTGGCGGTGACGTGCTCGAGCGATAAGTCCGTGCGCGTGTGGAATTACTTGGACAAGGCTGACGAGATTTGCAAGTACTTCGCGGAGGAGGCGCACAGCGTCGCGTTCCACCCCAGCGGGCTGCACGTTCTGGTGGGGTTCAGCGACAAGCTCCGGCTGTGTAACCTGCTCATGGACGACATCAGGCCGTACCGCGAGTTCAGCATCAAGGGCTGCCGCGAGTGCTCCTTCAGCAACGGCGGCAAGTATTTCGCCGCCGTGAACGGGCCCGTGATCCAGGTGTATAACATGTACACGTGCGAGAACGTGGGCAACTGCCGCGGCCACGGCGGCAAGGTGACCGGCATCGCCTTCTCCGCCGACGATAAGCGCCTGTTATCTACCGGCCTGGACGGCGCCGTGTACGAGTGGTCCCTGTCCACGTTC
CAGCGCGAGAAGGAGAACGTCATCAAGTCCAACGAGTACGCCTCCGTCGCGATCGCTCCCGACGATACTTACGTCTTCGCCGTCGGCTCGGACGCGACGCTCAAGCAGCTCGACGGCGAGGACCTCATGCTCAACGAGGAGTTCGCCCTCACGGGGACCGGCGGTGATGGCGGCCAAACCCAAACCCAAACCTTCACGCGCGTCCGGCTCACCAACGGCGGCAGACGGCTCTTCGCCGCGACGTCCACGGGGGCTGTGAGGGCGTACGAGTTGGACGGCGGCCGGATCGCTGGCGAGGGCAAGGAGTTCAAGGAGCTTCGGTGCCACACGGGTCCAGTGACGGGGATGCGGGTCAACTTCGACGATACCCTGCTCTTCTGCGTCGGCGAGGACGGGGTGTTGTCCGTCTTTGACGTCAAGGAGCGCGCGATGGAGGGCGCGACGAAGGCTGGCGAGGGGATGGTGTTTGCTCAGGAGGTGCTCATGACGAAGGCTGACCTCGAGGATATTCGCAGCAGGATGCACGAGCTCGAGGTTCAGGTCAACGAGCTCACCCTTCAGGGCGAGTACCAGCTTCGCCTTAAGGACCTAAACATGAACGAGAAGATCAAGGATCTCACCGACAAGTTCCAGGGCGAACTCGAAGGCGAGCGGTCCAAGTACGACGCGCTGCTCCAGGAGAAGAACGAGCTCGAGATGGATTTCGCGGACCAGATGAAAACCACCGAGAACAAGCACGCGCAGGCCACGGCCGCAACCGAGTCTTCGTTCCAGAACAAGATCCTGAACGAGATCGAGCGGTACCAAGCGCTCGTGGAGGAGAAGGAGGAGCTCAACCGCGGATGGGACGAGCAGAACACCGCACTCGCCGAGTCGCATGATCGCCTCGTGGCGGATCTCACCGAGGAGTTTGCCGGTAAACTTCAGGAAGAGCAGATGCACTCGGAGACTCTTCGGCTGCAGCTGGAGGAGGCCCGCGCGGCTGCGAATGAGCGCGAGAACCAGCTCGAGGAGGACGCCGACCTCGAGATTGACGAGCTCAAGGAAAAGTACGAATTAAGGCTCAAGGAACAGCGCGACGTGTCGCTGAGGTTGAAGGGCGAGAACGGCATCATGAAGAAGAAGTTCACCACCATGCAGAAGAGCATCGCGGAGCAGAAGGACGAGATTGCCGGTCTCTTCACCGATAAGAAGAACCTGTACGCCACGATCGCAGATCTGGAGAAGGACGTCGCGGGCCTTAAGCGCGAGATCCGGGACAGGGACGAGACGATCGGGGACAAGGAGAAGCGAATCTACGACTTGAAGAAGAAGAACCAGGAGCTGGAGAAGTTCAAGTTTGTCCTCGACTTCAAGATCAAGGAGCTCAAGCGGACTATCGAACCCCGCGAGCAGGACATCTCGGATATGAAGAATCAGATCACTGAGATGGACAAGGAGCTGGAGAGGTACAACAAGAGCAACACCCACCTCGACCTCACCATCAAGGACCTTCGCAACAAGCTCCTCGGGATGGGCCAGGACGTCAAGCGCAAGCAGAAGGCGATTGAGGACCGGGACTCTGCAATTCATTCGTTCCAGAAGGATCTCCACGAGGCCACGAAACACGTCCAGACGCCCAAGCGACTCGCCGAGGAGGTCAAGTCCCTGTACGCGAAGCACATGACGCAGAAGATCGACGACAAGCCCCCCGACAAGGACATCCAGCGCGAGTACAATCGCCAGCGAGAGTACCTGGAGAAGACCATCGATCAGTTCAAGCGCAAGCTCGCGAAGGACGTCGAGACGCACAAGAAGGACAACATGGCGCTGATGA\n>EF225152.1 Uncultured bacterium clone Br_008751_0450_0145 16S ribosomal RNA gene, partial sequence 
\nCACCGCCCGTCACATCACGAAAGACCACGTTGTACTAGAAGCCGGCAATTCAACCGCAAGGAGATAGCCGTCCAAGGTATGACTGGTGATTGGGGTG\n>XR_004539126.1 PREDICTED: Geotrypetes seraphini TIA1 cytotoxic granule associated RNA binding protein like 1 (TIAL1), transcript variant X6, misc_RNA \nCCTCTCCTCTCGCGTAGGGTCCGAGGAGAGCGGAGGTCGGCGCCTGCGCGTTGCGGGGATTCCTGCCTGACTGACTGGCGGCCGCCATTTTGTTATCCCGGATCTGCAGCGGATGAGCCGTGCTGTAGGAGACGTAGTTGTCTGCTCGCTCCCTCCCCGCCCGTCCATCTCTCCCTCGCCCCGGCAGCCATGATGATGATGATGATGGAAGACGACGGGCAGCCACGGACCCTCTATGTCGGTAACCTTTCCAGAGATGTCACAGAAGTTCTTATTCTCCAGTTATTCAGTCAGATTGGCCCCTGCAAAAGCTGTAAAATGATAACTGAGCAACCTGATAGCAGAAGGGTCGGCTCTTCTGTTGGATTTTCTGTTTTGCAGCATCCAAGCAATGACCCGTATTGCTTTGTGGAATTCTATGAACACAGAGATGCAGCTGCTGCATTAGCTGCCATGAATGGGCGAAAAATATTGGGAAAGGAAGTCAAAGTAAACTGGGCAACTACCCCAAGTAGCCAGAAAAAAGACACTTCCAATCATTTCCATGTGTTCGTTGGAGATTTAAGTCCAGAAATCACAACAGAAGACATAAAGTCAGCATTTGCTCCTTTTGGTAAAATCTCGGATGCACGTGTGGTCAAAGACATGGCAACAGGCAAATCAAAAGGCTATGGTTTTGTTTCATTTTATAACAAATTGGATGCAGAAAATGCAATTGTGCACATGGGAGGCCAGTGGTTAGGAGGTCGTCAGATCAGAACCAATTGGGCGACACGCAAACCACCTGCTCCAAAAAGTACACAAGAAAATAACACAAAACAGCTAAGGTTTGACGATGTAGTGAACCAGTCAAGTCCCAAAAATTGTACTGTGTATTGTGGAGGAATTGCTTCCGGACTTACAGATCAACTTATGCGACAAACGTTTTCTCTGTTTGGGCAGATCATGGAAATACGAGTTTTTCCAGAAAAGGGCTATTCCTTTGTCAGGTTTTCAACTCATGAAAGTGCTGCTCATGCTATTGTTTCAGTGAATGGAACTACGATTGAGGGGCATGTTGTTAAATGCTATTGGGGTAAAGAATCCCCTGACATGTCTAAAAACGTACAGCAGGTCTGTGAGATGCCTCTTATGTGTGTATTTCATTGATTGCCATACACACTATCTCTTCAATTTTAATTTTTGGACTTGTGGCATTTGTATATAGACACCTAAAGATGGAGTATGGGCAGTGGGGACAGTGGAGTCAGGTGTATGGAAATCCACAGCAGTATGGACAGTATGTGACCAATGGATGGCAAGTACCTTCATACGGGATGTATGGTCAAGCATGGAATCAGCAAGGATT\n>XM_013369717.2 PREDICTED: Columba livia parathyroid hormone like hormone (PTHLH), transcript variant X6, mRNA 
\nGAATCGTTTCACCCGGTTAGAAGATTACACCAGGTCAGACGTGGCTAAGGATTTTCTTATTCCTGACAGCAGCAGGAAGGAGAGGAAGGCAACCTTGATGGGAGCTGGGAACAGAGTGCAACAGGGAGGAAGATTTCGCTTCTGAGCAACTTTTGGGGAGCCTGGTCGCCCACCCATCTGCAGCCCCTGGCTCTATTCACCGCTCAGGAATTACGTGCCAAACCTGGAACAGGGACTTACCTTCCTAGCCAAGCTCTCAGGATAAAATATAGTTTTGGAAGCAATTGCTGAGAAGATCAACCACTGTTGGCCAGGGTGATCTCTGAGAAGCACAGAGGGCTGTAACTCAAGGAAAAGGTTTTAAGACCCGGAGGATACAATGTTCACTAAACTCTTCCAGCAGTGGAGTTTCGCAGTGTTTCTGCTGAGTTATTCCGTGCCTTCTTACGGGAGATCAGTAGAGGGGATCAGCCGCAGACTCAAACGAGCTGTATCAGAGCACCAGCTATTGCATGACAAGGGCAAGTCAATCCAAGACTTACGAAGAAGAATATTCCTTCAAAATTTAATTGAAGGTGTCAACACTGCAGAAATTCGTGCAACTTCAGAGGTTTCACCTAACCCTAAGCCTGCTACCAACACGAAGAACTACCCTGTCCGATTTGGTAGCGAAGATGAGGGCAGATACCTAACTCAGGAGACAAACAAATCACAGACCTACAAGGAGCAACCCCTGAAGGCATCAGGGAAGAAAAAGAAAGCAAAGCCTGGAAAACGTAAGGAACAGGAGAAGAAAAAGAGGCGAGCTCGCTCAGCTTGGCTAAATTCTGACATGTATGGAAGCAGTGTGACCGTGAGCCCACTCTTGGACAACTCCGTTACTACACATAATCACAATTTAAGGAGGCGCTGACATTTTCAGCAAGAAATTTTTGGAAGACATATTGCAGTATTCTGTAATAGTGAACATATGGGAAGTATTAAAATATTTATTACCTGTAAATATTGTAAATGCTCAGAATAAAACTTTTTCCCCCATTGCTCTCTGAAACTGCACATTTGGTTATTGTGAATTTTCTTTGTTTCTTTTTTTTTTTTCCCCTAAGGCTAAGACAATTATTATTATCACATTTAACATAATTTATTTTGTTGACTGGTGTATTTATTTTGTGAACGTATCTTGGTGCTGCTGACTTTCTATATTTTTTGTAACATAATGCACTTTAGATATACATATCGAGTACATTGATAAGTGACATAAAATGTTCCCATTTCGTGGTTGACTTCAATGAATGCCTACATACAATTGTTCAAACTGATTTTCCTTTGTGCATGTATAATAGCAGTATTTTAAAATTTGTAAAGAATGTCTAATAAAATATAATCTAATTAAATCA\n>XM_027670495.1 PREDICTED: Neopelma chrysocephalum smoothelin (SMTN), transcript variant X3, mRNA 
\nGGGAGCGCAGCCGAGCCAAGCGCGGGGCCGCGCTGCCCCGGACGCCCTTTGTTGTCTCGGTCGCCGCTGAGCCCCGGCCGCAGCAGCGCGGGCCCGGCGGGCGGGATGTCCCAGGAGAGCCTCCTCGGGATGGACGAGGGAGCGCTGCGGAAGCTGCTCGAGGCCACGCTGGACCTGGCTGAGCGGCGCCGCATCCGTTCGGCCATCCGGGAGCTGCAGCGGCAGGAGCTGGAGCGGGACGAGGAGGCGCTGGCATCCAAGCGCTTCCGCCCAGAGCGCGGCAGCCACAGACAGGACGACAAGGAGAACTGGCCACGGTCTCAGCACCTGGAGGAGGAGCAGCAGGCAGCCCTGGCCGCCTTGTCCCAGGAGCTCGAAACAATCACCAGCGTGGAGGAGCTGACAAAACTGCTGCGGGCAGCGGGTGAGTATGAGGAGCGCAAGGTGATCCGAGCTGCCATCCGTAAGCTGCGGGCTGAGGAGATCAAAGCTGCGACACTGGCTGGGAATGTGCAGAGCAGCCGGAGGGATGGCAACGAGCCCCGCACTGTGCCTGGGGATGCGAAAAGTATCCAGAGGGACAATGCTGAAACACCAGCCCTTACTGGGAGTGGGGAAAGCCTTGGTGAGGGCAGCACCAAGCCCCTGGGCACAGCCAGGAGAGGGGAGAGCAGCCGTCAGGACGATGCAGAACTGCCGGCACTGGCTGAGCTAGAGGAGAGTGGGCACAGGGGGGCTGCGGAGCAGCCCCCTGCCCAGGAGCCTGAAGTTTCGGCGGACCATGAGCGAGAGGACATGGTGGAGCAGGAGCATGTCCCAGCCAGGATGCAGGAGCTGTGCAGCCAGCAGGCGGGAGACCCCCAGAAACCCAGTGTCCAGGAAGTGGTGTCGGGGACCCTTGTGCTTCTGGAGCTGCAGCCGGCCCCAGAGCCCAATCCGGAGCCTGAGGATGGTGTTGAGGAGCTGGAGCAGGGCCAGCCCCAGGGGCAGCAACAGGCAGCCTGGAAGGCAGGGAGCCTGGACAGCCCAGCCACTGCTGCGGAGCCCAGCAGGAGGCAAAGCCCTAGAGGGGAGCAGCCACCCCTGGGCCAGCCTGGTGCTGCCAGCCAGCTCCATGTTGGGGTGCGCTGCCAGGCACTGGGGCCAGATGGGAGACACGGGAGGCCACCAGTGGCGCCAGTGTCCACCCAAGATCTCGTAGGGACCCCAGCTCGCCTGAACACTCACCAGTGGGAGCAGGTGCCCTCCTCTTCGTGCCCAGCTGGCCCCACGGAGGTGACCCTGGGGCTGCGGAGCACCCCCATCCGCATCACCACCATTCCCAGCAGTGTCAGCAGTATCTGCAACATCAGCAGTGTCAGCAGCAATGTCACCAAGATGGAGCCGGAGGTGGTGGAGCAGCCCCAGGTTCTGAGGCTGGAGCCAGAGCTGCCCAACGGCATGGAGAAGGTGCAAGTGAGGGAGGTAGAGAGAAGGAGCAAGCTGAATGTCGAGGAGCTGAGCAGGATTGAGGATGAGGATGTTCTGGATAAGATGCTGGATCGGACAACAGACTTTGAGGAGCGACGGCTGATCCGAAATGCCATGCGGGAGCTGCGCCAGCGCAAGCGAGACCAGCGGGAGAAGGAGCGAGACCAGCGGCTGCAGGAGGCTAGGAGCCAGGCTATGGCAGGAAGGGCTGGCCACGCCACCGAGACCACCACCACGCAGAGCACTCAGTCAGCTGACGGCTCAGCTCGCAGCACCGTCACCAAGACTGAGCGTCTCGTCCAGTCTAGTGATGGCACCAAGACCTCCCGTACCACAACCATGGAGTCAAGTTATGTGAAGAGATCAGACAGTGGCAACAGCACGTTTGTTCAAACCAAATCATCCTACAGCTCCTCGTCCAAGAAGACCGGCAGCGTCTTTGACCGTGAAGATGAGAGTGCCTCCAGGCAGAGCAGCCTGGCTGCACTGGAGCGACGTCAGGCAGAGAAGAAGAAGGAGCTAATGAAG
GCTCAGAGCCTGCCCAAGACCTCAACCTCACAGGCACGCAAGGCCATGATGGAGAAGCTGCAGAAGGAAGGCGGGAGCTCACCAAACCCCGCAGCATCACAGACCACTGTGCAGCGCTCCTCCAGCTTCGGCGTGCCCAATGCCAACAGTATCAAGCAGATGTTGCTGGACTGGTGCAGAGCCAAGACCCGGGGCTACGAGCATGTGGACATCCAGAACTTCTCGTCCAGCTGGAGTGACGGCATGGCCTTCTGTGCCTTGGTCCACAACTTCTTCCCTGATGCGTTTGACTACAGTAAGCTGACACCCCAGAACCGCCGCCACAACTTTGAGGTGGCCTTCTCTTCTGCAGAGACGCTGGTGGACTGCGTGCCGCTGGTGGAGGTCGAAGACATGATGATCATGGGGAAGAAGCCAGACGCCAAGTGCGTCTTCACCTACGTGCAGTCCCTCTACAACCACCTGCGTCGCCACGAGTTGCGCATGCGGCAGAAAGAGTGCTAGAGCCTGCCCTGCCCACCCCCCCACTGTCCTTGCTGCCAGGGCTGCCAGTGGGCAGGGGAGCTGTCTGCCCCAGGAGGGTCTGGCAGGGCCACAGGTCTGGCACTGAGGACAGGGGGAACTCTGACACCCAGGCAGTCCCCTGCCTCTGCCTTGCCAGAGCTGCCTCTGCCCCGGCCAGCTGCGGGCTGACCCCATGAGCAGGGCCAGGCAGGCACTGCTGGGGATGCTCCTGGCTTGGCTTGCCCCCTGCGCTCCAGCCTGTTAAGTTATTTGTTCTCCAGGAATTGTGTACCCTGCGGGCAGCACTCCTGTGTCCCTGGGTGGCACAGCTGCGCCCTCAGGCCTGGGGCACAGTGTGGGTCAGTGGCTGAGCAGGACCGTGTAGCCCAGCCAGGCATCCCACAGGCAGCATCTGTCAGTGGTTCCCATGGCTCCCTGTGAGGAAGCCCCTCTGCCCACCGCAGGCCCTGCTTGGTGTCACCTCCCTGGGGACAGCTCCACAGCTGTGCCGACACCCTGCTTCCCACCTTCACGTGCACCTGGGGCACTTCCGCACTAGGGGCTGCAGCACCTGTGGGCTGGGGAGCGGGCAGGGGTGAGAGGTCCCAGGGGAGCACGAGGCTGAAGGAGCCAGCCAGGATGGCAGCCCCTTCTCCCCTCTCCTGCTCAGGGCACCACGCGCTCAGCGCCGCTCGCCCCTCCGTCACGTCTCTACACCTGTAACGACACGTGTACCAACACCAGCCAGATAATAAAGGTTTACCTAGGGTGA\n>XM_032185005.1 PREDICTED: Aythya fuligula latent transforming growth factor beta binding protein 1 (LTBP1), transcript variant X5, mRNA 
\nAGGAAATCAATGGATACCAAAGTGTTCTGTTTATTTTTCTTTTTTTCTTTGCCTCCGCTGACAGTGGGAAATCACACTGGTCGCATCAAGGTGGTCTTTACACCCAGCATCTGCAAAGTGACTTGCACCAAGGGCAACTGTCAGAACAACTGTGAGAAGGGAAATACCACCACCCTCATCAGTGAGAATGGCCATGCTGCTGACACTCTGACAGCCACTAACTTCCGAGTAGTTATTTGCCACCTTCCATGCATGAATGGAGGCCAGTGCAGTTCTAGAGATAAATGCCAGTGCCCTCCTAATTACACTGGTAAACTTTGTCAGATCCCTGTGCAGACTGCCAATACTCCAAAACTGTATCATCACCCACAACAGGTGAACAAAGCTGTAGGATCTCAAATTATCCACTCGACTCATACTTTACCACTGACAATGTCTGGACAACAAGGTGTAAAAGTGAAGTTCCCTCCTAACATAGTGAATATCCATGTGAAACATCCCCCTGAAGCCTCAGTTCAGATACATCAAGTTTCAAGAATTGACAGCGCATCAACAGGACAAAAACCGAAAGTACCTCAGCCAGGACATCCACAGGTCTCTTACCAAGGTCTTCCATATCAGAAGACCCAGAAAGGACATACTGCTTACACAAATCAACAACCCATTCCTCATGTGTTTCCTGTTTCAGTTAAAACTCAGCTTGGACGTTGCTTCCAGGAGACTATTGGAACACAGTGTGGCAAAGCACTTCCTGGCCTTTCCAAGCAAGAAGACTGCTGTGGAACCGTGGGTACTTCCTGGGGTTTTAACAAATGCCAGAAATGTCCTAAGAAGCCATCATACCATGGATACAGTCCTATGATGGAATGCCCCCAAGGCTACAAGAGAATCAATGCTACATTTTGTCAAGATATTAATGAATGTCAGTTACAAGGAGTATGCCCTAATGGTGAGTGTTTGAATACCATGGGCAGCTACAGATGTACCTGCAAAATGGGATTTGTGCCAGATCCTACCCTCTCAAGATGCATAGCTGATAGTCCTATGGTTGCTGAAGAGAAAGGACCCTGCTACCGGTTTGTTAGTGCAGGAAAACAATGCATGCATCCTCTTTCTGTTCAGCTCAGCAAGCAGCTTTGCTGTTGCAGTGTTGGCAAAGCCTGGGGCCCACACTGTGAGAAGTGTCCCCTCCCAGGAACAGCAAAGGAAGAGCCAGTGGAGGCACTGACCTTCTCACAGAAAAGTGAGCCTGAGATGGCTGTGCAAGAAGTGGCAACTGCAGCCCCTGATCAGGAATTAGTTTCACTCGATCAAGAAAAGCAAATCGTAGAGCCTGGACAGCCCCAGCTCTCTCCTGGAATTTCAACAATTAACCTGCATCCACAGTTTCCAGTAGTGATTGAGAAAACATCTCCTCCTCTGCCTGTTGAAGTTGCTCCTGAAGTCTCTACTTCAAGTGCAAGTCAAGTAATTGCACCTACTCAAGTTACAGAAATCAACGAGTGCACAGTTAATCCTGATATCTGTGGAGCAGGACACTGCGTTAATTTGCCTGTGGGATACACATGCATCTGCTACGAGGGATACAAACTTAATGATCAGCAGACAAAATGCTCTGATATTAATGAGTGTAATCAGACACCTCATCTCTGTTCCCTTGGACGCTGTGAAAATACAGAAGGAAGTTTCCTATGTATTTGCCAAGCTGGATTCATGGCCAGTGAAGATGGAACTGACTGCGTTGATTTTGATGAATGTTCAAGACCTCATACTTGTGGGGAAGGCTTCTGTATAAATACTGTTGGCTCGTATAGGTGTGAATATTGTGATAATGGCTACCAAATGAACAGGAGAGGGGAATGTGAAGACATTGATGAATGCATGACCCCAACGACTTGTCCAGATGCACAGTGTGTTAATGCTCCTGGCTCTTACCAGTGCATTCCTTGCAGAGTGGGATTCAGAGGCTGGAATGGACAGTGCCATGATATAAATGAA
TGTCAGTATGGCAATCTCTGTACACATGGACGTTGTGAAAATACTGAGGGGTCTTTCAGATGTATTTGTGGCCAAGGTTTCAAACTCTCTGCATCAGAGGATCAGTGTGAAGATATAGATGAATGCCAGCACAGATCACTTTGTGTGAATGGGCACTGCAGGAACACAGAAGGGTCTTTTAGATGTGTTTGTAACCAAGGTTACACATTATCTTCTACTGGAGATCAGTGTGAAGATATTGATGAATGCCTTCAAGACAGTGATGTATGCCTTCGAGGAAACTGCATGAATACTGATGGGTCTTACAAATGCACTTGTCCAGATGGCTTCCAGCAGATAGCAAATAGGGGATGTCAAGATATCAATGAATGTGAGAGATCTGACCTCTGTTCACCTCACGGGGAGTGTCTGAACACAGATGGGTCCTACCAGTGCATATGTGAGCAGGGCTTTTCTGTGTCTGCAGATGGCCGAACATGTGAAGATGTTGATGAATGTGTGAACGGCACACTGTGCGGCAGTCATGGGTTCTGTGAAAATATGGATGGCTCCTATCGCTGTCTCTGTTACCAAGGGTATCAGGATGCACAAGATGGGCAAGGTTGTACAGATGTGAATGAATGTGAAATGCTGAGTGGGGTATGTGGTGAAGCCCTCTGTGAAAACGTCGATGGTTCTTTCCTCTGCCTGTGTTCTGATGAAAACCAGGAGTATGATCCGATGACCGGACAGTGTCGCTTCCGTACCTCACCAGAATTGCCAATAGAGGCCGATCAACATGAAGATGGAAAGAAGGAGTGCTACTACAATCTGAATGATGCTAATTTCTGTGACAACGTGCTTACATCTAATGTAACCAAACAGGAATGCTGCTGTACTTTGGGTGCTGGCTGGGGTGACAACTGTGAAATCTTCCCATGCCCTGTCTTTGGAACTGCTGAATTTACTGATTTGTGTCCTGAAGGGAAAGGTTTCATTCCCTCTGGAGAATCATCTTACGGGCTTCTTGCTGAGAATTACAAAGATGCTGATGAATGCCAGCTCTTTGGAGAAGAAATCTGTAAAAATGGCTTCTGTTTGAATACGCAGCCAGGTTATGAGTGCTACTGCAAACAGGGCACGTACTATGACCCTGTTAAGCTCCAGTGCTTTGACACGGATGAATGTCAGGACCCAAACAGCTGTATTGATGGCCAGTGCATTAACACAGAAGGATCTTACAACTGTTTCTGTACACACCCAATGATTTTGGACGCAACAGAAAAGCGGTGCATCAGACCAGCAGATTCAAGTGAACAAACTGAAGAAACTGAGGTCTACCAGGATCTTTGCTGGCAGCATCTAAGCGATGATTTTGTTTGTAGTCGACCTCTGGTTGGAAAGCAGACTACGTACACTGAGTGCTGTTGCTTGTATGGTGAAGCCTGGGGCATGCAGTGCGCCTTGTGTCCTATGAAGGAGTCAGAGGATTATGCCCAGCTGTGCAACATTCCTGTTCCAGGATCTCGACGTCCATATGGACAAGATGCTTTGGTTGACTTCGAGGAGCACTACACTCCAGAAACTAATCCATACTTTGTTGAAGACCGTTTCCTGAACAGCTTTGAGGAGTTACAAGCAGAGGAATGTGGTATTCTGAATGGATGTGAAAATGGCCGATGTGTAAGAGTCCAGGAAGGCTACACCTGTGACTGCTTTGATGGTTATCACCTGGACATGGCCAAAATGACTTGTGTTGATGTGAATGAGTGCAATGAGCTGAACAACAGGATGTCTCTCTGCAAGAATGCCAAATGCATTAACACAGAAGGTTCGTACAAGTGTTTGTGTCTCCCCGGGTACGTACCTTCAGACAAGCCAAACTACTGCACACCACTGAACTCAGAACTAGACAGTGAACTGGAGTAGAGGAAAATCTCCATATCCTAAGCCCATATACTCTGCACTGTATAAAGAAAAGGAAGAAAAGTATTTAACTTGAGAAGAGAAGGCACCAGAGT
AGTGAACATAAGGGGAAAAACACATTAAAATGTGTCAAAGGTGAGACATGATGGGCTGATTGTATGTCAGCTTCACTGAAGTGACAGACCAAATGGACACATTACTCTGTATGAAAGAAACAATCAAGTATATAGTGTGTTCATAAGAAAAAAAAAAAAA\n>XM_038354470.1 Zerene cesonia endocuticle structural glycoprotein SgAbd-5-like (LOC119831184), mRNA \nAACACATTGCAAGTGAAGACGATACGGTCACAAAGCTGCGAAGCAAATCCAATCATGAAATTTTTGGTGGTAATTGGTTTCTTGGCATTAGTGTCGGCTGCTCCCGCACCGCAACGTCAGCCAGGTGCCCCAAATCCACAAGAAGTTCAAATTCTTCGCCTCGAAACTGAAAACGACGGCCTCGGCTCGTACAGATATGCTTTGGAACAAAGCGATGGCACGAAGAAGGAAGAGCAAGGGGAACTGAAGAACGCTGGTAAAGATGACGAGGCGATCTCGGTCAGGGGATCTTACGCCTGGGTTGGACCTGACGGTGTGACATACATTGTTACTTATCTTGCTGATGAAAACGGTTTTCAACCAACGATAGAACAGGGCCCAGGTGGTGCTGTGCCTTCTGCTGTCATCGCGTCCCTCGTCGGCTGATCAACAAATAACCCAAAACCTAGTCGCCAAATAAATTACCATATTTTTTTAA\n>XM_035478915.1 Colletotrichum scovillei oxidoreductase (HER10_EVM0009428), partial mRNA \nATGGCTTCCGTACCCACGCTTCGAGAGCTTGCAAAGCAAGTCTCTGAATCCATCTCAGACGAACATCTCGCCGGTAGTACGTTTGCTATTGGCGGTGAGATCCCAATTGAGCAGCCCAAAGACGAATCTAGCCCTACGACTCAGGTTGTGTCTTCTTCGGTCGTTCTTCGGTGGGACAATCCGGGGGAACATCCTGGCCCCCAGCGAGTCTCCTTCCCAGTCGCTTCAGATGACGACGCTGTCGCCTTCAATCACCTCCTCAAAGCCTCTGAAAAGGCTACATTCGGTCTCAACGGACGGCACGAATTCGATGAAACGTACCGCAAGGCTCAGAAGCTCGGTGCGGGTGATTTCTGCACCACCTTCTGCCCATATGAAACAGGCATCATCGACGCTGTTTGCCAGGTTCTTCTCCCTAGCTACGATACGGACGAAGACACGCGGGCAATCCGGGCGGAGCTGTACAATATGAATATCTACTCTGGTCCTTCGGGCAAGTTCAAGGCGCACGTCGATACTCCTCGTTCGCCCTACCAGATTGGCTCTTTGGTTGTCTGTCTTCCGATGAAGCATGAGGGTGGCGAGCTGGCAGTGAGACATTTTGGACAGACTCACACCTTTGACTGGGCCAAGAACTCCAACAACTCCGTCATTCAGTGGGCGGCCTTCTACAGCGACTGCGAACATGAAGTGCTCGAGGTCAAGTCCGGTCACAGAGTTACACTCACATACAACTTATATGCCACAGCAGGAAACGGAGAACTCGCAGGTGAAACGTCTGCTTTCAGCCCTACTTCGCTGCCACTCTATAGCCAGATCGTAGACTTGCTCGGCTCCAAGAAATTCCAGTCCAAGGACAGACTTCTGGGAGTCTACAGCACGCACGCGTATCCTCACACCGAAAAGGAACACGGCCTTCCGTTCTGCCTCAAGGGTCTTGACATGGTGCTCTACAACACCTTCAAGAGCCTAGGCTTGAAAGTCAACTTGTGTGCCATTCTCGAAAACCCGAAAGGCTTTTGCAGACGTAAGCTTTACAATGGAGAGTTTTCCGATGAGGATTCAGATACCGAGCCAACGCAGAAGGTGACATTGGCGAAGAACGATAGCGGGGACAAATTTGACTCGGACGGCGACGATAGCGGGGACCAATCTGACTCGGAC
GACGACGATAGTAATAAGTACTACACCAGAACCGTCGGATACATCAATCAAGCATTCTCCACTGACGAGCTGGTTGAGGACGACGATGATCTGAAAAGCATCATCAGCCGGGCCATGAGAACCAACAAGGTCAAGTTCGACGCCAGCAAGATCATCTGGCTGAACAAGAACAATGGCGAGTCGAATATGCAGGTGTCATATATGGCATACGGCAATGAGCCATCCTCCGAGGAAATCTACTCATACTTTGCGATGGTCATTGAGATCCCTGGTGTTGGAGTGAATGCAAGCGATAACGCGGAAGCGTAG\n>XM_041571208.1 PREDICTED: Xenopus laevis lysine-specific demethylase 2A (LOC108697539), transcript variant X12, mRNA \nATGTATAAGTCCATATGGGCAGCACTCCACTCTTGATGTTTAAACTCGGGTGCAAGGTAAAAGAATCAGTTATGTAGACAAATGACCAGCAACACCGAGATATTTCGTGAATAGTTCAAGTGTATTCAGTAAAAGACACCTGGTTACAGAGACCACTAAAAGATGGTTGCTATAAATGCACCAATTGCCTAACGTGCAGGGGAATGTTACAGGGCACACATTTCACCCATCCTAGGACTGGAACTAAATTTCGGATCAACCATAGGGTCACTTGTACCACAGATCACGTCGTATATATGGCCTGGTGTCCGTGTGGATTACACTACATTGGGAAGGCATCCACCACATACCGCGAACGGATGAACAACCATCGTTGTGCCATCAGAAGTGCCCTGACTACTGGGAAAGCAGATCAACCCATTACGAAACATTGGCTGAATAGCAAGCACACCCTCCCACAGTTCCGGCACATGATCATAGACTATGTGCCTGTTCCTAGGAGAGGTGGCAACAGAGGCCTCCTACTACTACAGAAGGAATCCATGTGGATTTACAAACTAGATACCTTGTCACGAGACACTTCCTATGTCCCCCTTTTATTGAGATCGGAACACTGGGTCATAAACTATCCACAGTATAATTACCTCAAATGAAGACTTTGACAGTTGGGTTTGACTAATCTTTATTTTGTTGGTTTTTATTACCGTTTGCATTTTTTGACTCTTTGGCTTCTGGATGTGAATGTCACAACAGTAATAGTATAGAATTGCAAATATGGGCTCTGGCGGCTGAGAGTTGGACTCATCGAGTGTATGAGTCGATATCTCTTTTGCTTTTGGGGTTGATCGTTTCCTCGCATTCCAAGGTGCTGGTGCCGTTCTGATCCAGCTATATAACAATATGTATAAGATTATTCTTGATTGTTGACAGGTGACTTATCAGAGTTTATCACAGGCAACTAATGACATATGTATTGCATATATGATATTTTTACAACAGGCTAGCTTCCATGAGGACGAGGGGGACAACAACAGAACATTTCGGTCGGCCTTTTGGCAGGATGATGGACCAACCAGTCATATGTGACCGTGGACCTCGCTTAGGTTAGCAGTGAGGCGCTGTGCTAAGGAGTCCTACGAGAACATGCTCCCAAACAAACACATCACACTGCACCAGGACTGATAAGAAATGTGGTTTGGCCGTCAGGTACACACAGCCTAAATATGCCCTGAGGGGAGTGAGCGTGGGGCAGGCCTTTCACTTACGTCTAGCTGACACTCCAGGGCATCGCTGTCTGGACGGTGTAACGAATCCACAAACACTTCGGTTCGATCAAGGGACTGCAATATCCCTCTTAGGGATTCCCTTACTGGGCGGTGCGCTAAGAGGTGTGGCTGACAAATACTAACTGTGATAGGAAGGAGCCTCTCGAGACGGACTGAAGGACAGCACGCGCCTCCAGCTTTTGTACGCTGGCGGCGCTTTTACAATACCTGAGAAGGGATTGACCACGTACTCACTTGTGACACAGATGGTTGGCCCGCTGTCTGCAGTATGGGCGAAATCGCT
ATGATACTTCTCTGTGGAATTGATCCCTCTCGTCGGGCTAGCTGGGTCCTGCTGGTATTGTCTCATGAGTGTTCGTGGATGTTATACAGATTTTCATGTGGACTTTGGTGGCACATCTGTGTGGTACCACATACTAAGGGGAGGCAAGGTGTTTTGGCTAATACCTCCTACAGATCAAAATCTGGAACTCTATGAGAATTGGCTGCTCTCGGGCAAACAAGGTGACGTTTTTCTTGGGGACAGAGCAACAGAGTGTCAGCGAATTGAACTAAAACAAGGCTACACATTTGTTATTCCCTCAGGATGGATTCATGCTGTGTACACACCTCAGGACACACTGGTGTTTGGGGGAAATTTTCTGCACAGCTTCAACATTCCAATGCAACTTCGTATATATAGCATCGAGGACAGGACGAGGGTACCTACAAAATTCCGATATCCTTTTTACTATGAAATGTGTTGGTATGTGCTTGAAAGATATGTCTATTGCATGACTCAACGCTCTCATCTCACAAAGGAGTTCCAAAGGGAGTCTCTGAGTATTGATTTAGAGCTTAACGGTCGCCAGAGACCAGACACTCCATCCTTATCCTCATCCGCTTCATCTGAATTATCGTCTTCCTCTGATAATGATGATTCCTCTGATCAAGATTGGGAGGAAGAAGGAAGTCTTAAGAAGAGGGAAAGAGATAGACTTAGAGTGGAGCATGAACTTCAGAGGAGAAGGAACAGGGATAGGCAACAAAGAGACCAAGAAAGAGATCATCAACATGCTGAGAGAATAATTATCCATACTCTACCTGCGTCACTACGTCCTTTAACTCCACCACCTTCCCTTCCTCTGCCAACACCAGATTCACCTCCCAGCACTTCTCCTTACTTGACATGGTTTGAGATTGAAGGATTACACTGTCTTGTGCTGAAACTTGAATCCTTGCCACCTCATAAAAAGTGCCTACCAGATGGTATCCATGACCCAGAAGCTCTTATCTCTGATATCAAGAGTCTTCTTGAGGACCACTCTCATGATCCACCTGAGCTTGCACTCACTGGCGTTCCAATAGTTCAGTGGCCCAAGAGAAATCAGTATAAGGTCCACCTTCGGCCCAAGATTCAGTTTACAAAACCTCACACTATGCGTCCAGCTTCCCGTCACTCCACAGCTCCTCCTAGGACATTAGGCACTCCATCTGGTACTACAGCTTCTTCGGGTGCTCGAAGGCGTCGTGTCAGGTGTCGCAAATGTCAAGCTTGTGTCCAGCGAGAGTGTGGGACTTGCCACTACTGTAAGGATATGAAGAAGTTTGGAGGGCCAGGCCGTATGAAACAATCTTGTGTACTAAGGCAGTGCCTTGCTCCCAGACTGCCCCATTCTGTAACCTGTGCTTTGTGTGGGGAGGTGGATCAAACAAATGACACACAGGATTTTGAAAGAAAACTCATGGAGTGTTCAGTTTGCAATGAAATTGTTCACCCAGGATGTCTAGAGATGGATGGTGAAGGACTTCTAAGTGATGAACTTCCAAACTACTGGGAGTGCCCCAAATGTTATGAGGGGCAGAAGCACACGATGCAACCAAATCATGATCACATCGAACTGCACAGTAAACGTAAAGCTGCTGACTATGAGAGCAGCCATTTCTACCCTGCCAAAGTTCTGCGGCCTCCACTGGGGCAGAGCCCCCCATCCCCACCTCTTTTGCTCCCACCTTCTCCTTCATCTGCTCCACCTACACCACCCTCTTCGCAGACACAAGTCCCACCTGCAAGCCGAGAAGAGCGAGCAAAGAGGCGCCAACTTACTAGAGAGAAAGAGAACCACCCGACTGGATGTGATCAGTCTGAGGGAGATCGCTTGCGGCTTAGGGGGCCCTACCTCGCGGTCACTCTTCAGCGTTCACCAAAAGAATTAAGCTTCACTTCCATTGTCCCCAAGTTACAAGCCATCACACCAAATCCCCGTCAGCCTATGCATGCAGCTCCACCACAGCATCCTGATG
AGGAAGAAGAGGAGGAAGAGACAGAGAACAGTCTCATACTGGGTCAAAGAAAAAACAACATATCAATGCAGAAAGTTGTTTGGCTCTCTGTTTTCCATTACCTCACACATGAAGAGCTTTGCATCTGTATGACAGTGTGCAAATCCTGGTACAAATGGGGCTGTGACAAACGTCTCTGGTCCAAGATTGATGTTAGCCGCTGCAAGTCTCTAGTACCACAGGCTCTCAGTGGCATTAATAAACGTCAACCTGTATATCTTGACTTGAGCTGGACAAATGCATCAAAGAAGCAACTTATATGGCTTATCAACCGGTTGCCAGGTCTGAAGGATTTAATCCTTGCTGGGTGCACTTGGTCTGCTGTCTCTGCCCTTGCTAGCTGCAGATGTCCCCTCCTGCGTACTCTGGACCTGCGCTGGACTGTTGGAATCAAAGATACTCAGATTAGAGAGTTGCTTACACCAGCCTCAGACAAAACAGGACATGACTCTCGCAGCAAGCTACGTCTGCTAACAGATCTGCGCCTTTCTGGCCTTGATATTTCTGATGTTACTTTAAGGTTAATCATGCGCCATTGCCCACTTCTGTCTAAGCTTGACCTCAGCCACTGTCCCCTGCTTTCCGATCAGTCTGTAAACCTCCTTACAGCTGTGGGCTCTTCTACAAGAGGAATACTCACTCACATACACTTAGCAGGTTGTAAAGGGGTGACAGATGAGTCTCTTCTATATCTACGACGTGCCACCAACCTGTCCCTTATTGACTTGCGTGGTTGCAAGCAGGTTACTCGGGGAGCTTGTGAGGGATTTATTTCAGACCTCTCTGTAAGCATCTTGTATTGTCTATCAGATGATAACCTTATCCAGAGGATCACCTAGAGTGGAAGGACCTGTTAATTGTACTGGAAGAGGTTAGAGGAGGAATGTGGAAGAACATAATCTCCCCTGCCTCTCATCTGCTCTCTCCTGCCACTCCATAAGATACAAAGAAGGAGCAATAATTGGAATCTCTGCCTACATCCTCCAGTGAAACCATTGTTTGATCCAAGGAAATGTGCCATTAAAACGTGTATATAACCAACTGTGGTTGGCATAGTGCCCTAATGGTTTATGGGGCCCCTCAACTCATTAGGGCACCCTGCCAACTCTTACTCATTTTTTTGCTTAACTCACTCTATTCTTCAGGCTGGTCAGTGTGCATAGCAAGGGTGAAGGAAGGTTTTGTTTTAAGGGTTTTTTTCTGTTGTTGTTTTGCCTTTTAGGGATTTGAGAGATATGAGAGAGAATGCTCCGCTAAAGTTATATAGGTGTCTGATGAGTTGTGTGTTTAATTATATGTTTGAGAGGGAACAGGCAGGTTTTGTGATAAATAGTTTTTTTTTTTTTTTAATTGGATTGTAGCTGTTTGCCCATTACCTCTCATACAGAGTACAGACATTCATTTACACTTAATAGTACATTTATTTTATGCACCAGTGCAGCCATTTGTGGATATATACATATATAGATATATATTAAATGCCGGTAGGTACACAGAGTGTTATGTATGTCAGTGCCAGTGGCACAATCGGCTGTCCTCGCCTTTGACCTGGCATTAGATTGTATAAAAAAAAGAGCCTGGATAATATTTTTCTCTGTGGAGCGATCTTGCTTTCCCTTTATTTCTTTTGCAATAAAAAAAAGTTTATGATACAA\n>KF978784.1 Uncultured bacterium clone 16SOTU48 16S ribosomal RNA gene, partial sequence 
\nTCCTACGGGGGGCAGCAGTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCAACGCCGCGTGCGGGATGAAGGCCTTCGGGTTGTAAACCGCTTTCAGCAGGGAAGAAGCGAAAGTGACGGTACCTGCAGAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGTTAGTCACGTCGGATGTGAAAACCCGGAGCTTAACTCCGGGCCTGCATTCGATACGGGCTGACTCGAGTGTTGTAGGGGAGACTGGAACTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCGGTGGCGAAGGCGGGTCTCTGGGCAACTACTGACGCTGAGGAGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGGTGGGCGCTAGGTGTGGGGAACATTCCACGTTCTCCGTGCCGCAGCTAACGCATTAAGCGCCCCGCCTGGGGAG\n>XR_005054034.1 PREDICTED: Manis javanica uncharacterized LOC118967152 (LOC118967152), ncRNA \nGGGTTGAAAAAAAATATGAGTGCTCTCTTTTGTGTGCGGACAAACAGCCGAGCGCGGGGAGGTCGGGGCCGGGGTCAGGCGCTCCGGGCTGCAGCTGCCGCCGTGGGGAGGGGGGCCCCGGGCGGCCCCCCGGAGTCGCGGCCACGGCGGCATCAGCCTTCCGGCGGCGCGGGCGGCCACTGTCCTCGCGCGACCCCGGCCTGTCGGGAGCGAGACCCGCTCCGCCCCTGGGGCGCCCAGCCCCGAGCAAGGAAGTCACAGTAAAAGAATCAAAGCTCATGACGCCCATCCAGAGTACTCCTGGTGACACTTCCTGACATAAAGTCATAAATGCAGCTGGAAAGAAAATGTGGAGGACACAGAAAAGTGGAAATGAAAACTGAAAGGCCCCAGCGGGCCCGCCGGCCCCTCTCCAGGGGAGCCCGAGTCCCTGCCAGCAGCAGTGGCCCAGGAGCCTTCAGATTCTGTGCCCTGTCCCTTCGCTGTTACCCACATGTGGACACCAGGAAGTTAGATTCCTAGAAGCATCAATTCCAACCCAACCCATGTATGCATTTTCAGTCTGGCTGGATTTACACTTCCTTCCACAAGGATGAGGTTCGTCTCCACAGCCCCTGCCAGCCCTGGGCATCACCACGTCTGGGTAGTTTCCATGCGAGGCACGTGCTCAGGGACAGCCTTGTGAGGCCCCACAGGCCACAGTGATGAGGCAGAGAGGCAGAGATGAGAAGTGGGCTCAGGGACTCTCTGGGACCTGGGAGGATGGGCCAGAGCCACAGCCCATGGCCACACCCTCAGGGCCTGGCAGGCCCACCCTGCATTCACCTCCCATGACATCTTACAGAGTGAAGGGCCTGCCTTTGGGCCAAAAAAGGTGACTGGGATGTTACGGGCCAGCTTGCTCCAGGCCGTTTGTGAGACAGCCCTCTGCAGGGGCTGCGGCTGAGACACCTGCCCCGGGGCACTTAACCATCCACCTGCCTCTGCTGTGGTCTCCTTGGCAGATTCAGCTCTGCCCTCAGAGAGCTGGCGACTTGTGGAAACAGTCAGATGCCATTCTGAGCCAAGCCCAGCGGGGCTGCTGCCGGGAGAGACCCAGGCCACTCGGGCAAGAGACCTCCAAACAGTGAAGCCCATGTGCCCCAAACCACCACTGCTTGGATAAAGTTCTGAGAGAGAGGGTGCAAACTTGTTTCCATGGGTGGTGGTGTCGCCAGGTCAGGAGGCAGCCTCCAAGGTGACAAGGGAACTCACAGGGAGAGAGTGAGTTCAGCACGTCAGTTAAAATCTCCATTTGCTGGGCCCATCACCTGCCTCCACGGGGGTCGGGCACCGTCTGCTGAGCTTGGCCACACAGTGCTCTTCCCC
CGGCCGCCGCCTCGCCCCCCAGGCCCCCCGGAGCCCCTTGCTCCTCCCACAGCCTACTGAGCTTCCATCTCATTGTGCAGCCACTTCTTGTCACCTTGACCACCCTCCCCATCCCAACACCCAGTCCCTGGAGGCCAAAGATCATGTCTTTCCCCAGCTGTGTCTCCACAGCTCAAAACAGCACATGCTGCATGGTAGGGATGTGGTACATCAGGGGTGGAAGAAGAGAGGCCCTGGGGCAGGGCATCCAGAGACCTGGGACTGGGTCCTGGGCTGGCCGCTGGCACCGGGATCTTGTTCCTCAGTTTCTTCATCTGGGCGAAGGGTAGTTGGGATAACAGGTGCCAGAGGCCTTTCCAATTCCATTGTGTGAGGGCTCTTCAGGCCAGGGCTTGATGGGAGAGGCCAGGGCAAGCTGAGGCGGCCCCACCTCTGCCCCGTGCGTGATGAGGGGCAGCCTCCTCCACGGCCTCCCTCTGTGTGCTCAGTGCCTCCAGGCCAGCTCCAGGCCCGTCGGCATCCCAGGAAGGCAGCAGAGGTGGACGGAGGGCACGAAAGGACACGCTTTCACTGACCACCCAGCCCAGCAAAGCTAGAATCTGTCAAAAAGTAAAAATTCCATTTGTAAACAAGATCAAATTATTTGATTGTGAAACCAGGGTCCATGGAATTTAAAACAATTTAATGTGAAACAATATAATTTGAAATGCTGACCAGCCAAGACCTGGGGGTGGAGGGGCTCAGCCTCCTGTGGCCAGACACATGGAACCCAGCCTCAAGGAATAATAAGTCACTGTTCGACAAGGGTGAATGGGCATCAGCTGCGTGGCAACCCCAGGCCAGACCTGGGGCAGCAGGCCCGGCTCCCGTCCTCCTGGGGCTGGCAGTCCTGATGGGCAAGCAGGACTCTCACAATCAGAAAAGCAGTGCCAGAGAGCGGGAAGGGCTCCGTGGAGTGGCATATGATCCAAGTGACAAGGGAGGCTCAGAGAGAGCCCCGAGGGGCACCCGGTGGGCAGGACAGCAGAGAAGCATATTCAGGGTGGAAAGGGCGGTCAGGTCCCTCCCAGCTGCGGGTGTGCTGCCCTGCGTGATTCTGGGCCAGCAAATCACTCGTTAGCCTCAGTGTTGTTATCCACAGAATGGGAAACATCTCAGTCCCGCTCCCCACCTGCAGTGAGGATGAGAAATCGTTTCCGGGCATCCCACCCCACCAAGCTGACGTCACCAGTGGACAAACAAGCAAGCATGAGTGATGCAGTGGCCTGGTGAGCAGCTGCTGCGGGCATGTGGCAGGCAGGTGCCCGGAGGCGCTGCAGTGCGTTCTGTGTCCAGCACCTGCGGGTGCTTTCCAGAGGGACGGCGGAGGCAGGGCCCGGCAGGTCCTGGTGCAGCAGAGCTCTGCTTCCACGTACCCTGCCTCAACGTAAACACAGCTGGTAATGTTTCAGTACTGTAGGAGCAGGAATAACAGACCCAGAGAAGCCAGACCAAGAGCTCGCGAATGCTGACTTTCATGTCGCACCCAGGCATCGCATGTGCATCTTGGCGCCTGCGGGCCTGTTGCTCGGTGGGGAGGTGGGGGGCTAGTGTGTTTAGGAAACCGAACTACGGGCACAGCAGCGGGAGGATGTCAGGCCTCACCTCCCTTCATCCTCCCAAACGCAGCTCCCACCACAGCAAACCTGGAGGCTACCTGGGATGTGGGGGGGCACCAGGGCCTCTAGGTTTTAAGTGACCTAGGAGACAGTGGGGCAGGGTGGGGACTTCTCATCAGTGAGGTGCCACCTTAGGCACATCCCCTAACCTCTGCATGCAAACAGGCCCTGGAATACACCCAAGGTCAACTGGCCAGTGAGAAGCTGACCTAGAACTCAAGCCAGGCCCCAGTCTCCCCATGTCCCTGCTGCCCGCTGCGGAACCTGACCCACTGCCAGACCCGAACCTGCAAACCAACCACCTGTGGGTTCTGGGTAGCACAGAGCCCTTGGAGACCGTGA
TGCTGAGAAGCAGTGTTTTTGTTCGCCCCTGAGTCTTGCCAGGTCACATTGTCAAGGCCAGCACTTTGGAGA\n>XM_053291376.1 PREDICTED: Hemicordylus capensis complement C4-like (LOC128343033), transcript variant X1, mRNA \nGAGAAGGCATCTGCCCTGCACAGACGCAGCCCAGAGATGTTCTCTCAAAAGCTGCTGCTGCTCTGGCTAGCATGGATGGGGACTCTGGTAGCCCTGAGCCACCAAACTCCAAGGTTGCTAATGGTTGCCCCAAGTGTGATACCAGTGGGGGCCGAGGTGGGGATCGTGCTTCAGGTCGAGGGGGCCACATCCAGGTTCTCAGGCACAATCTATTTCCAGAATGAGAATAACATGAAAAAATGTTCCAATGAGGAGTCATTCAACTTTTTGCCCAACACCTTTGTGCAAAAGGTTACTCTGAAGGTGACCCACGAACTCTTTACCGAATGTGTTCTGGCTCGCCAGCGACGGAACCGCTACATCCAACTTGTTGCCCGCAACTCCCTGCTCCCCAATGGCGGCGTTCAAACCCTCAACCTGCGCTGGAGTGCCCGGCAAGGGTACCTGCTGGTGCAGACGGACAAGCCAATTTACACCCCACAGCAAAAGGTGAATTTCCGAGTCTTTGCCCTGGATCACAAATTGCGGCCAAGCACTGAGCCAGTTGTCATCACTGTGCAGAACTCACGAGGTCTTCAGATCCGGAAAGTTGAGCGTGTGCCAGTGAATTTTGTGATAAACGATCACCTGTCTATCCCTGATATCTCTGAGCCAGGCATTTGGCGTATCACAGCCCAGTTTGTCAACACACTGAATTTCAACACAACAACAGAGTTCGAGGTGAAAAAATATGTGCTCCCTCATTTTGATGTGACAATTGTTCCAGAACGTAAATACATCCTCCTTTCAGGACAGCAGGACTCTGAATTGCGAATTGACCTCCAGGCTAAATTTTTCTATGGGAAGGGGGTCAATGGCACAGCCTACGTGCGGTTTGGTGTGAGTGATGACAATAAGGAGAAAGTTTATATCCCAGGACTCGAGCAACAAGTCTCCATAACCGATGGCCGTGGCTCACTAATGCTGAAACGCAGCCTCCTCGCAGAGAAACTGGGGCGCCCTCTGGAGAACCTAATTGGAACAGCACTCTACATTGCAGCCACTGTCATAGAGGCAGCAAGTGGCGAGCTGGAGGAGCAGGAGCTTGCTTCAGTGAAATTTTTGGCATCTCCATATTCAGTTGATCTGTCCAAAACCAAGCGCCATTTTGTCCCTGGTGCACCCTTTGAAGTGCTGGCTACTGTTTCACTCTCAGATGGCACTCCTGCCTCCAACCTCCCAGTCCGTTTCTCAACCCAGATAAGAGGGGGCTCATCCCCCAATGATGAGCGAGTGGACAGCAGTGAGCAAGGGGCTGTGATATACAGGATGAATGTTCCCTCTGGAGCTACCTCCATCACTTTCACGATAACAGCAGGGACAGAGTCTCCAACAGAAGTCACTCTGACTGCCAAAGCAATGAACTCTCCAAGAGGCAACTACTTGATCATTGAAAGCCCAAAATACCAAGGCTTGAACCCCGGAGAAACTCTCTCGCTGGGGCTGAAACACGTTGGATCGGCTGCCTTCTCCCACTTCTACTACCTGGTTTTGAACAAAGGCGACATTGTCTCTGCCAACAGTATCAACCGTGGAACCTTTACGGTCATCTCTATCCCCATCACACCCAGCCTGATGCCAACGTTCCGCTTTGTGGCCTTCTACCGTGTTGGGGATGAAGTTGTGGCAAACTCCATCTGGGTTGACGTCGTGGACCGCTGTGACGGAAGACTGGAGCTCCGCACATTAGGAAACCCTGACCAGCTGCAACCTCAGGACCTCCTGAAACTCGCCATAACCACTGATGTGAAATCCTTTGTGTCGCTTGCTGCT
GTTGATACTGCGGTTTACGCCCTCAACCGGAAGAATCGCCTCACACAGGGCAAGGTTTTCCAGGCTATGGGAAGCTATGACCTTGGCTGCACAGCTGGCAGTGGGGAAGATACCCTTGGCGTTTTCACTGATGCTGGACTCTCTCTGCGTACTGGTTCTCTACAGAGTGAGCTCCGGAAAGCACATGGGTGCAGTGAGAGTGTTTCCCGGAAGAAGCGTTCGCCGCAGTTCCAGTTCCAACTCCAAAGCATGCGTTCCAAGTACTCAACCCCTGAATCGCGGAAATGCTGCCAGGATGGCATGGTGCTCCTTCGAAGAGCCATAACATGTGAGGACCGTGCCAGGCGGATATCAACGCGAGAGTCTGAGGAATGTCATCGTGCCTTCCTTGAATGCTGCAAATATGCTGCCCGTCTACGACGCAAATCCTGGGGATCCCACAATCTTGGGCGAACTCTAGATGAGGAAGATGAGGATTTCATTGATGACGATTCCATTCAACTCCGGAGCGTCTTCCCTGAGAGCTGGCTCTGGAAAACTTTCTCCGTAGAAGGAACCCGCACGGAAAACTTGATTCTCCCCGATTCCATCACCACCTGGGAGATCCAGGCTGTTAGCATGTCCTCTGCAAAAGGGATCTGCGTCTCAGAACCTCTTCGAGTTAGAGTCTTCCAAGATTTCCACATCTCTCTCAGGCTGCCGTACTCAGTGAAACGGTTCGAACAGATAGAGCTTCGCCCTGTTCTGTACAACTACCATTCACAACCAGTCAGTGCCTTGGTGTATCTGGAGCCTGCTGAGGGCATCTGCTCTCCAGCAACCGTCGGCCCGGCTCGGAAGCAGAGGGTTGTTGTGCCTGGGAATTCAGCGGTGCCCCTGCCCTTTGTTTTGGTTCCCATGGGAGCAAACGACATTCCCATCACCGTTGTTGCCATTGGCGGCTGGGGGGTGGGCGACAAAGTTTCCAAGAACCTACGGATTGAGAGAGAGGGTGCTGTTCGGGTGGAAGAATACACCATCCCCATATCAAGTGAAGCTGGACAATCCAGATCTGTGGAGATTTTAGGAGATATACCCTCCAACTCCATTCCTGATGGCGACTTCAAGATGAGTGTCCGGTTGACAGGATCGCTGCCAGCTGACACTCTGGAGAGTTCTCTGACACCAGAAGGTCTGTCAACTCTCTTGCGGGTTCCACATGGATGTGGGGAGCAAACCATGTTATTGATGGCCCCTGGGGTCTATGCCATGCGCTACCTGGACAGCACTGAGCAGTGGCTACACCTGAAACCGGAGAGCAAGGAGAAGGCACTGGATAACCTCCGTACAGGCTATGAGCGAATCCTCACTTTTCGGAAGCGTGATGGGTCGTATGGAGCTTGGCTCACCCACCCTAGCAGTACTTGGCTGACGGCTTTTGTGGTGAAAGTTTTATCTCTGGCCCGTGAGTACCAGGGTGTGGATGAGACTAAGGTCCGTGAGTCAGTGCAGTGGCTTCTGGCAAAGCAACAGTCAGATGGTTCCTTCCAAGACCCAGCCCCTGTCTATCACCGGGAAATGCAGGGTGGTGTTGGCGGCCTTCACGCAGGAGTCTCACTCACAGCGTTTGTCACCATCGCACTTCAAGAGGCCTTGGTCATGTATGAAGGAGAGAACCTTGAACCAGAGAAGCAGCAACAGCTGAGCCAAGTGAAACACCGCCTGGCTCAGGCTACCTCCTTCCTTGCCCTCTCCTTGGAAGAGCGATCTCTGGGTGCCTATCCTGTCGCCATTGCTGCTTACGCCCTCTCGATTGCTTCTGCCAACCTGTCGGCCATCACTACTGCTGATTCTCACCTGAGGAGGCTGGCTACAGAGGACAAAAACAACACGATGTTTTGGGCGGTGGAAGAGCGGGACCGACTGAGAGGGGAGAAGAGATCTGGGCAGGTTCCCTCTGCCTCAGCCATCTCGGTGGAGGCCACAAGCTACGCTCTCCTCTACTTGGTGAAAAAAAAGGA
CATCACAATGGCCCACAAGGTTTATAAGTGGCTGACAGAACAGAGGAACTATGGAGGAGGCTTCAAATCCACCCAGGACACAGTGGTGGCCCTGGAAGCTCTGTCGCAGTACTGGATCAGCACCTACCAGGAGGAAGACAATGAACTGAAAGTGACCCTCAGCGTTGCTGGGAAAAGCTGGCCGATCTCCCTCTCACCTGGGAGATCAAACCATCCAGTCCAGGAAGAACTGCAGTTTTCTTTGGGGAGTAACATCAATGTAAAGGTGGAGGGGAAAGGAAAAGGGACTTTGACAGTCCTGAAGCAATATCTGGTCTTGGCTATGCAAAACACTACCTGCCAAACCCTTGGGTTAGAGGTGAAGGTGAGCGGCTCCATTCAGCGTTCACGTGAAATGCTTGACTACTACTACGAATATGAAGATGAGGATGAGGTTGAGGTTGCCGGTGAAAGAAAGGCACGGTCTCTACCTGCTGACCAGCCATTGTCTCCTATCCACTTGTTTGATGCCCGGCAACGCCGCAGGAGGGAAGTCAAAGCCCCCGGCCAGCCGCAACGGGTTGTCACCTATGAAGTCTGTTTTTGGAGGCAACCTGGAGCACATGTCTCAGGCATGGTCATCGTTGACATCACTATGCTTAGCGGCTTCCAACCCGACAAGGACGACCTTGACAAGCTCAAAGATCTTGCTGATAAGTACATCAGCCACTGGGAGCTCCAAGGACCACGGCTGTTGCTGTACATTGACTCGGTTCCAGCAACAGAACGTGAATGTATAGAATTTGCAGCAAAGCAGTTAGTAGCTGTGGGGAAACTCCAGCCAGCAAGTGCCACTCTGTATGACTTCTATGAACCAGACAAGCGCTGCAGCATCTTCTACGGTGCCCCCAACAAGGACCAGTATGTGTCAGCCTTGTGCTCGGATGATGTCTGCCAATGCGCTGAAGGGGCCTGCCCACGGTTGAAGCGTACCCTGGATGAGGCCATTACAGAAGAAGACCGCATGCAGTTTGCGTGTTACGAACCTCGTGTGCACTATGCATTCCAGGTTCGAGTGGAACGTGAGAGCAAAGAAAGTGCCTTTCGTGTCTACGAAGCTACGATCTTGGAACCCTTGCAATTTACTGCAGACATTGGCATCTCCCAGAACCAGACCCGGCGCTTTGTGGTCCGTGCAGCGTGCCGGACCCGCTTGGCCGCAGGCAGCAAATATCTGCTGATGGGACGTGATGGAGAAACCCGTGACTCTGAAGACCGCCCCCAGTATCTGCTGGATAGGAACTCTTGGGTGGAGGAAATACCAAAGGCCCAGCGCTGCCGAGCCACCCAGCACCGTAACACCTGCCTCCAGTTCAAGTCTTTCACCACTGCTTTTGCTGAGAATGGCTGCCGTGTCTGAGCCAGAGAACTGGACCAGAATGATCACCTGCACTTTCTCCCATCTTCCTGCACCAGAAGGTTCTCTCGGAATGGAATGGAAGATGCCAAAAGGCCTATTCTCTGATCACTGTCTTTTCCCCTTGATGCTTTGTATTTGGACAATTTAAGAATGTAAGAAGAGCCCTGCTTGCTCAAGCCAAAGGCCCATCTGGTCCAGTATTCAGATTCCAACAGGGGCTACCCAGAAGCCTCTTCCACAAGCCCTTCCCTGTTTTTTGTCCCCAGTCCATGGTACTCAGGCTTATTTTAAGCCAAATTTTGGGTTACAGCCCATTTGACCCACGAGTATACCCCCTAGGTTCTGGCATCACTTGGTGATCGTCATTGATGGACCTATCTTCCATGGACAGGTCTAGAAAGTCTACAAGCCTGGTCTTTCAGCCATCTCTCTGGGCACACTAACCAGAGGGAAATTGTGATTCAGAGGTTCTTAAACTCGAGTCCCCAGCTGTTGTTGGACTACAACTTCCATTATCCCCCTCTTATAAGGACAATATTGGACAATATTGTCCCCTTGTTAAGTCTCTTTTTTGTAATTCCTGCACATTGGCTACTATGTT
GCAACTACCATTTTTTAGTGCCACTTGGGTTCTCTGATACTTTTTCTTTGTACTGGTCCCCAAAAATGCACATCTTTAAAACTGCATATGATCATAGCAACAGACAAATGCATGACCACAGCCATATTCACACTTTAAACAACAACTTTGGTCTATGAATAAGGACTGTTTGGCTGTGATAATGATCACACTTCAGTGAGCAGCTTTAGCATAATTCTGTAAAGATTTTTTTTTAATGAGGTGTTTGTTTTGTGCCTCTGTCACTAGCTAACATGCCTCACAAAGCTATTTTGTTGAATAAAGAGTATCATTCTATA\n>XM_022636737.1 Penicillium arizonense hypothetical protein (PENARI_c034G09255), partial mRNA \nATGAACCCAACCCCCATCAGCATGTCAGTCCGTACAGCGATAACCTTCAGCCGACTGAACCCCGCGGCGCCCTCGCTCGCCGGCGCCCTCCGTCCGCTCAACCAACGCACCTCCGGAACAGTCTCCAAGCAGCTCACACGCCTCAGCTCGACAACAGCTCGCCCAGCCATGGCGGCACCCGTGACCCTGGACACCCGCCCACAGACCCAGACCATCTCCACCCGCCCCATTGGCCTGCGCGCACAGTCGACTGCTTCTGGTAACGGTACCGGCAACGAGGAAGTCAAGCTCGACTGGGACTCCTTCTTCAAGCTCCGCGCTTCCCGTCGCCGTTATTCTCTTGCTTCATCCATTACCACTGCGGCTCTTTCGACTACGGCTGGTGTGCAGATTCTGTCCGCTCAGGATTTGGAGTCCCTTGGCGCGCAGGTTATGGGCCTGGACCCATTCGTTGTTCTCGGATTGGCGACCGCTGCGTGTGGTGCTATTGGATGGTTGCTTGGGCCGATGGTTGGAAACGGTCTCTGGGGATTGGTATACAGGAAATATAAGCCTTCCGTTGCGACGAAAGAGAAAGAGTTCTTCGATCGCATTCGTCGCTTCCGTGTTGACCCATCGACCAACTCGATTGCCAACCCCGTTCCCGATTACTACGGCGAGAAGATTGGTAGTGTGCAGGGATACCGACAGTGGCTGAAGGACCAACGGGCTTACAACCGCAAGCGCCGCAACTTCATTGCTTGA\n>XM_039112273.1 PREDICTED: Rattus norvegicus zinc finger and BTB domain containing 1 (Zbtb1), transcript variant X5, mRNA 
\nTCTGGGGTATAGGGTATTTGTATTTGTGTTCGATCATGTTCCTAAATCGAGTGTCGCTGTGACGGTACACGTAGATTCTCCACTGGTTAGAATGTATTTCCGTACAGTATCTATCGCTGCGGCAACATTTTCCCCTTTGACACTGGAATCCACGAAGCGTTCCAAGCATTTTTTTTCCCCTTTTTTGAGACAAGGTCTGACTAGATAGCCCAAGATCGTTTGGATAGAATTCTCCTGCCTCAGGAAATCCTAAATTCTGGGGTGATAGGCATGTTCTGAGACTTTCCAAGACCACTTAGAATTAATTTCTTGAGCCAAAGTTTGAGGCACCACCAAGTCAATTGGTGAGAACGATGTAGTTCTTATGAGAACTTTAAAGCAACCACGGTTTTTTAAAAGGTATAAACTAGATTTTCTGGAATTTTGTCACTTTAAATGGGGAGAATGAAGGTACAAGAGACTGAAGTCCCAGTGATGGATGGCTGGTCATTTGCCCAGAACTGTAAAACTTCCCTTTTGAATCACTGGCTGTTGTTATCTCCCTAAGTCTCAGTAATATTGAGTGGCAGCCACATGGGCTTTCTTCCTCTTAAAGAAATAGACAGACTTAAAGTAGACACGAAGTGAAATGCCTTTCCAAAGGTTAATACTTAGAGTTTTGTAGTGTAATGTTGTGTTATAGCCACTTGCACTCATTTTAACGCCAGGATTTCTTCTCGGACAGCAGAGTTTTACAGGGTGTGGTTGTGCACGCCTGTGATCCCAGCACTTCAAGAGGTTGGATCAGAAGCCTGAGGCCAGCCTGGATCTGGCATACAGAGCAAGACCCTTTACAAAGCTCAGGGCTGGAGAGATGGCTCAATGGTTAAGGGCACTTGCCTTTCTTCCAGAGGGACTAAGTTTGACTCCCAGCACCCCCACACCAGGCAGCTCACAACTACCTGTAACTTCATTTCCAGGGAACTCCACACTCTTCTTCTGGACTCTAGGACATCTGTATTCATGTGCGCACCCCTCCCCCCCCCACTACACATAATCAGAAATTAACATGAAAAACCCCAAAGCCTCATTTTCATGATTCGGAGTAAACCCTGGTTGAGCAGTCCTTCCAGCTGGCTGTGTTCTTCCAGTTCCTAACGTTATGCCTGCTGGTTTCACCACTGTGGCTGCATCCTTGTGAGGAAAGAGAAGCCACTTTTGACCAGGGCATGAGCACAGCTTCCTCACCTTGTTATGTTGGTTTTTGGTGTTTTGAGACAAGTGTTTCTCAGTGTATCCCTGGCTGTCCTGGAACTCACTCAAGACCAGGCTGACCTCAAAGGCTGAAGAAATCCACCTGCCTCTGCCTCCTGGGTGTCAGGATTGAAAGTGTGGACCACTGAAACTGCTGTTTTATGTTTTGTTTTGTTTTGTTTTTTAAAGCTAGGTTCTCACTGTTTGGTCCATGGCCAGCCATAGCTTTCCGTCCTCTGGCTTCGACCTCTCACCTAGTGGTGGGATAACAGGTCTGCACCGCCATACAGGATTCTGACATGGGTTTTTTGTCTTTGTGAAGCAGGGTCTCACTGTGCAGCCCTGGATGACCTCAGACTCTAAGAGATAGGCCTGCCTCTGCACCCACAGTGCTAGCATCAAAGACTCGTGCTGCTACGCCTGCTCATGACCTTGTGTTTTTATTTCATGATAGCTGCCAACTGTTTGTACCTTCTGCTTCCTCATTCCTCCACATTCCCCCACTTTTGTCAGTTTCTGGTACAGTTAGGGCCTTTTCAAAGTGCCCAGTGTCCCTTGCAACACCATTCAGGAGAAAATGTTGCTGCTTTTTTTTTTTTTTAAAGGCCTATTTTTCTCTATACAGGACACAGACTGTCTAGAGAAAAGAGGGGAAAAAAAAACCTTTGTGTTAGAATACAGAAAAAAATAGAGGCTGCAGTCTGATGTCTCGGAGGAGGGTTAAATGTGTAAAACATCTGCTTGACGTTCACTTAGGTCTCTGTA
ATATTTTTCATAGTTTCTTGTGTTATAAAATAATGAAAATGCTTTGCTATTCATGTTTTTATGTTAGCCTAATTAAGTTATTTATGCCTATTTTTTCTCAAAGTGGAATACCTTTTCAATGATAAAAGCAGATGCCCTTTATAAAAGTTCCAACTATACTAAAGTACATAAAATACAAAACTGAAAGTCGCTCTGACTCCCACTCCCCAGAGATAATCACTGTGAACAATCAATCCCTTGTTTAAAAACATGAAGGCAGCATCAGAGCGTCTTGCTGTGTGTGCCTCACCCCAGCCTGTTCCTGTTCACAGGCTGGTGCTTTCTGCTCCTACCTCAGATTGTTGAGAATTCCCAGGTTGAGGCGGGTGGGGGGTTGCATTGAGCTGATGTCAAATTCTATAACCTAGTGACGTGTGAAAGTTTTCATGTTTAATAGGGCTGCTGTTTTAGGTTAGTCCTCGTTCATTCTCCTTGGTGGGCTTCTTCTCACCCTTAGCAAATGTTGCAATCTGTTATCTGATTGATTTGTGCAGACTACACTCGTTAAAACAAACCCTTCGAGTGGAGAGAGCTTCTTAGCTTATCATTGGGAATGAGTAGGGACACTTGCCACAAAGACCACCGCCAAGATATCCCTGTGCCTTTTGTGATGGTGTGGGTTCCTCATGGTCAGCATCCAAGAAAATCGTGATAGAAAGGAAATTAGAGTAACGGTGGGCATTAATTACTGTTGTTTTAAGTTATGGGAAGGAATGGGAGGGGGTGTGTGCAAAGACTAGCCTGAATTCTACCCACATTAGACATCTTACATATTTAAGGTAATTTCTAAGTATACTGATATTTTGTCCTGCATAGTCATTACAAAGCTACTTAGGCCGGTGTGTTCAAGAAGGATGAGCTGTGGGGTTGATTTCCTAGTAAAGCTCCAAAATAGCAGGCTCAGATTTAATCACAGTAATTCCTGGAAGGTGTTGAGGACATGCTGCTTTTTTGAGAAGGGGGTCTCTGTAGCATTGGCTGTCCTGGAACTCACAGAGATCCATCTGTCACCAACTGCTTTTTTTGGGGGGGGAGTGGGGTGGTAAAAACACTACTATGTGAATATACATTGTTTTCAGAATCACATCTGAAGGCATGGAGGTGTATAACCTAGTATAAGAGTGCTTGCCTATCACACCTGAGGCCCTAGGTTCAGTCCCCAGCACTACAAAATAATGAGTATTAAAACATAAAGAATAGCAGTGTGTAGGGTGCATGACTTTAATCCCAGCATTTGGAAGGTAGAGGCAAGTAGATTTCTGTGGGTTCAAGGCCAGCTTAGTATACATAGTTCCAGCCAGCTACATAGTGAGACCCTGTCACCAAAAATAAATAAATAAATAAATAAATAAATAAATAAAATAAAAAATAAAAAATAATAAATTGCTAATTATATTTTCTATTAGTTTGTTCTGTGAGGTGCATGTTGTCTTTTTAAAAGCTAACTCCTTCCCACTTGAAATTGACAGCAGTGGGGGTGGCCATGGTGGTCAGCAGATGGAAAAGGAGGTGGGGAGAGGGGTGCGTTCTGCTTGCCTATTAGATAAGACAGCAAGAATGATAGGAGCTTTTACAGCGATGGAAAATGTGACTGTGGGAGGCTTAGAATGTTCCAGAGGGGCACTTCACTTAATAATCATACCCAGAAAGTGTTGTCTGGATTACAGAAACTGAAACTGTGCATCTTGAATCAAGAGTTAGGGTTTCAGCCCCAGCTTCTGTTTACAAGATGGGTAGTTAACTACTGCACGTGTTTTCTTCATTCACAAAAAACATAGATAATTAAAGGCCTGTCTCAGTGCACTGATGTGTGAAAGAGGCCCTATAAATCGACAACAGTGTTTCAGTGACGGCCATAAGTAAGAACTGATGAGCAAAACAAGACTTGCCCAGTTCAGCATTTGTTCCTGGAAAAACTCGTTATCATTTAAATGCCAAGCAACTACTAGAATCCAGGGTTG
TAATGATGCCTGACACAACACCTTCGTCTTGAGGTACATACAGCCTCCAGTTTAGATGGCCCATCTCCTGTCTCCCTGCGGCTCCCACCATAAAGAGGTGCCTGCCTCATGCTAAGTCAGGAAAGGGTCCCCAAAGATGGCTCTAAGCAAAGGAATGGTGTTTATGAAGTAAGGAAGACTTCCACTTTTCCCGTGTTTGGGGATGGGGGAAGTCTTAAGAGATGTAAGGCTTAGGGATGGAATTGTGTTTAGAATGGATCTTTTTTACTGGTACTTTTAATTGGTTTTATTTCATTTATTTTAATTAGATAAAATTTTGGAGTTTGAATAGCTGTGATAGCTTCCAGCACTCAAGGCAGAGGCAGGCTGACCTCTAGAGGCCAGCCTAATATAGGGAGAGACCCTTTCTCCAAAAAGAAAAGAAGTTTTCTCAGCCTTGGTTAGAACTGACAGGAAGCCCTGGAGCTGCAGAGCTGGAAACGGATACTTCATTCAGCTTACAGGCTCTGCGAGCAGAGGAAGCAAATAATCACGGGGGGAGCTCCCTGGCAGGCCACACAGCAGATTTTACTGAACACTTAAGTTCTAAAACGGCCTGCCTTCAAGTTGTTAACAGTTGTAGCAGACAGTGTGAGCTCACAGAGCCAATACTTTGGAATAAGTAAAAATACTACAAAATAGGGTGGAGGGATGGCTCAGCGGTTAAGAGCACCCGACTGCTCTTCCAGAGGTCATGAGTTCAATTCCCAGCAACCACATGGTGGCTCACAACCATCTGTAAAGAGATCCAATGCCCTCTTCTGGTGTATCAGAAGACAGCTACAGTGTACTTAAATATAATAAATAAATCTTTAAAAAAAAATACTACAAAATAAACTCCAGCAATACAGATGCCATGTGCTGGGAACCAACTTGGTGTAGCTGCTTTTAAAGGTCACAGGTGCACACACCGCCCTCTGGTGTTCAGAACATGGCTGTACAGCCTCTAGTTTAGAGGGTTAAAAATGGATGTGTAAAATACCTTTCCTCTTATACCAGAGAGAAAGCAGAGGCCAGCACTCCATTCTCTTCCCTCTGCCTTCTGTGTGGATGGACTCCATGTGGAGTCCAGTTGAACTACAGAAATGGCTCGTTCCTGTTACTTGGTAACATTTATTATCCGCTGACCTGCCATGAAGCCAAAAGATAATTTGGTTACCTTCTACATAGTACAAAACAAAGGACCTCAAAGAAGTAAATTATGTACTTGTTTCACGGCCTATAGGAGATTAAAATGGTGGACAGCAGATCAGCGTGCCTTTTAGAAGTGACAACTGTTGGCTTGACGAGGGGAAGAACAGAAACAGACAGGCCAAAGAGCAGCAGTCTCGTTTTGAATAGGTGCAAACAGGCTCACCGGCAGGAGATGGCCAAGCCCAGCCACAGCAGCTACGTCCTGCAGCAGCTAAACAACCAGAGAGAGTGGGGCTTTCTGTGCGACTGCTGCATCGCCATTGACGACACTTACTTCCAAGCACACAAGGCCGTGCTAGCTGCCTGTAGCTCCTACTTCAGGATGTTCTTCATGAACCATCAGCATAGCACTGCCCAGCTGAACCTCAGCAACATGAAGATCAGCGCCGAGTGCTTCGATCTCATTTTGCAGTTCATGTATTTAGGGAAGATTCTGACCGCTCCTTCCAGTTTTGAGCAGTTCAAAGTGGCTATGAACTACCTCCAGCTCTACAATGTTCCTGACTGCTTAGAAGATATACAGGACTCAGACTGTTCCAGCTCGAAGTGCTCGTCTTCCGCCTCCAGCAAACACAACAGCAAGATGATCTTTGGGGTGAGGATGTATGAAGACACAGTGGCTAGAAACGGCAGTGAAGCCAACCGGTGGAGTGCGGAGCCCAGTTCAACGGTGAATACGCCACATAACAGAGAGCCTGAGGAGGAGTCTTTACCGTTGGCCAACTTTCCTGAGCCACTGTTTGACGTGTGTAAAAAAAGTTCCGTGT
CCAAGTTATCTACTCCAAAAGAACGTGTGTCGCGACGCTTTGGACGGAGTTTTACCTGTGACAGTTGTGGGTTTGGCTTTAGCTGTGAAAAGCTGCTGGACGAACACGTGCTGACCTGCACCAACAGGCACTCCTACCAGAGCACGGCGAGAGCCTACCACCGAGTGGTGGATGCTAGAGATGGGAAAGACAGTGCCATCAAAGCTGAACTCGGTGACAAGGGCTCTCCTACAGCGTTTTCTGCACACACAGACAAATACAGAGAAGACGCCAGCCAGGCGCCCGATGACTCAGCCTCGCCCACTGGGAGCAGAAAAAGCACTGTGGAGTCCGGCACAGCTGGTGAAGAGAAGAGCAGAGCTGCGGAGACAAAAAGAGTTGTCATCAAGATGGAGCCAGAGGACGTCCCTGCAGACGACATGAAGGACTTCACCATCGTCAAGGTCACCGAGAAAGACTGCAACGAGTCCACCGACAACGATGAGCTAGAGGACGAGCCCGAGGAGCCGTTCTACAGATACTACGTCGAGGAAGATGTTGGCATTAAAAAAAGTGGTAGGAAAACCCTAAAACCTCGGATGTCCGTCGGCGTGGATGAAAGGGGTGGTTTGGAGAACATGAGACCCCCAAACAACAGCAGCCCCAGACAGGAGGACGCCGAGAATGCGTCTTGTGAGTTGTGTGGGCTCACGATAACGGAGGAGGACCTGTCCTCTCATTACTTAGCCAAGCACATTGAAAATATCTGCGCATGTGGTAAATGTGGGCAGATACTTGTCAAGGGCAGACAGCTTCAGGAACACGCTCAGAGGTGTGGCGAACCTCAGGACCTGACGATGAACGGGCTGGGGAACACTGACGAGAAGATGGACATGGAAGAGAACCCAGATGAGCAGTCTGAGATAAGAGACATGTTTGTTGAGATGCTGGATGATTTCAGAGACAATCATTACCAAATAAACAGTATCCAGAAAAAACAGTTATTTAAACATTCTGCCTGTCCTTTTCGATGTCCTAATTGTGGCCAGCGTTTTGAAACTGAAAATCTAGTGGTGGAGCATATGTCTAGCTGCCTAGACCAAGACATGTTTAAGGGCGCCGTCATGGAGGAGAATGAACGAGATCACAGACGGAAACATTTCTGTAACCTGTGTGGAAAAGGCTTCTATCAGCGCTGTCATTTGAGAGAGCACTATACTGTTCATACTAAAGAAAAGCAGTTTGTTTGTCAGACATGTGGGAAGCAGTTTTTAAGAGAGCGCCAGTTGCGTCTGCACAATGATATGCACAAAGGCATGGCCAGTCTCTGGCTCATACTGGCCTGGAACTCACTATGCAGTGATCATCCCGCCTCTTGGTCCCGACTGTGGAGATTAGGTATGTGCCACCACTCCCACCTGGGCTGAGCTTTTAATGTGTTCTGAATTATAATTATCAAAAGAAAAAGAGCCTGTTTTAAAACATAATACACAGGAAACATAAAAGGTATTGACACAATGAGTATGTGTTTTTTTGTGTGTGTGTGTGTGTGTGTTTTTTTTTTTTTTTTTTGTTCTTTTTTT\n>OL802220.1 Portunus trituberculatus vitellogenin receptor mRNA, partial cds 
\nATGACCTTCTGCGACTTCCTTCAGCGTCTATTTTTGCTGACGCTTGTGCTAGCGGCCGTAGTTTCTGTTGGCTGCGGTTATCGTGATGGCAATAATATTAAAGATGCTTTGAAACATCTGGAACAGCATCGCAACAAGTCCACTGATGCTGACGCAGTGAATCGTCGGGAAGTGAGGGGACAGGACGTAACTCCCACCACTACCACATCTAGTACCACTAGACGCTCCTTTACTTATAAAGGTATATGCAATACGATGTTCCTGTTCCGCTGTGACAACGGTGAATGTATATCGAGGAATTTCCTTTGTGACGGAGGCAATGATTGCTCAGATGGATCTGATGAGAAAAACTGCCAGAAATCTACAGAAGGAAAATGCAATTCAAACCAATTTACGTGCAAGAACGGGAGGTGCATTCGTCCTGAGGAACGGTGCGACGGATTGGATGACTGCAAGGATAATTCCGATGAAGTTGACTGTAAGAATTGTCACGGAGACGAGTTCCTATGCAAAAGTGGGAAGTGTATAGCCAATGACACTTTATGTGATGGTGACAAGAACTGCGAAGACGGCGACGACGAAGCAAACTGTGAAAAGGCACACTGCCTCTCTATACCAGGCCACTACCAGTGCCAATCAGGGGAGTGCGTGCCGCCCATTAAGGTGTGTGACAATAGGACGGATTGCTTGGACGAATCGGATGAAGGGCAGGCTTGTGCTACAACATGTGCAGCCAGTAACTGCACGCAGGGATGCTTCCGAACGCCAAAAGGTCCTCATTGTTTATGTAGACGAGGGTATTACCTAGAACGTGATCAAGTAACCTGCTCTGATATAAACGAGTGTGCTTGGAGCGACAAATTAGTGTGCGACCATTACTGTGAGAACACCAAGGGCGGGTTTCAGTGCTCCTGTCACCACAAGTATATACTGCAGAGTGATAACGTTACCTGCAAGCACCAGCAGTCCGGAAGTGCATTTCTTTTAATAGCACAGGACGATGGAATCAGGCAGCTGTTCCTGGATGGCTCTCGCAACGTGCAAATTGTTCACTCGGGGAATGCATCGGTCATAGGATTGGGTTATGACCCTGTAACTCGCACGATGTTCTGGAGTACCTTTGGTAATGTGTTAAAAGCGGAAGTGGTACCTAATGCAGTGACTCACAAACTGTTGCGTGATGGCTTCATTGTGGCTGAGGGTTTGGCCGTGGACTGGACTGGTAGGAACCTGTACCTCACAGATCCCAAAATGAAACATATCATGGTGTGTAAAATGGACGGCTCCTCCTGCTACTCGCTATTGAGTGGTCTTGGTCATCCAAGAGCCATCCAGTTGGATATGGTTAATAGGTATATGTATTGGACTGACGTGAAGGACGGCACAATTCGCAAGGCTGGAATGGATGGTACTAATCATGATGTGGTGGCAATGAATGGAGTACTGTGGCCCAACGCCATGGCACTTGACCTGCCTGCTGGTCGTCTCTACTGGCTGGATGCTAACAAGGACCATGCCTTCAGCATCAAGTTGGATGGTACAGACCAGAAGTCGCTCCAACATGCTGTGATCCACCATCCCTTCGCCATGGCACAGTGGGAGGACCGTCTGTATTGGACTGACTGGAGCAAAAAAGTAATCTTCTCCTGCATCAAAAGGGATGGCAGACATGGGAGGACGGTGCTGAAAGGAGGCTACACGATGTACTTTGGCCTCATTCTTTATCACCCAGCCATGATGGAAGACATATCCAACCCATGCCGATATTCAAACTGCAGCCATATGTGTCTTCTGTCTCCTCACTCCCCTGGGTATACCTGTGCCTGTCCCAGTGGCATCATGGAGCTCAGCCGTGACAGTCATACATGTGTTGATACATCGGCTAGAGTTTACTTGATAGTCAGCAGCCTCAAGAAATTGTACATGCTGTCACCACACAAGTTTGGCCGTGCCGACCAGCATGTCTTGGAGCCACAACCAGATATCAAAGGCATAGGT
GATATGGAGTATTCCCCAGAGCAAGGC\n>XM_036181832.1 PREDICTED: Onychomys torridus olfactory receptor 13-like (LOC118579991), mRNA \nATGGGAAATCAGACCTGGGTTACACAGTTCATTCTCTTGGGATTTCCACTCAGCCCAAGGATGCAGATGTTCCTCTTTGCTCTCTTCTCCCTGTGCTATGCCTTCACCCTGCTGGGGAATGGGATCATCGTGGGGCTTATCTGCCTGGACTCCAGACTCCACACTCCCATGTACTTCTTCCTATCCCACCTGGCCATTGTTGACATTGCCTATGCCTGCAACACAGTGCCTCAGATGCTGGTGAACCTTCTAGATTCAACCAAGCCCATCTCCTTTGCTGGATGCATGATGCAGACCTTTCTCTTTTTGACATTTGCACACACAGAATGTCTGCTCCTAGTGGTGATGTCCTATGATAGGTATGTGGCCATCTGCCACCCTCTCCGATACACTGCCATCATGAGCTGGAGAGTTTGTATTACCCTAGTGGCGACTTCCTGGATTTTAGGAGTCCTCTTGGCCCTGGTCCATCTAGTATTACTATTACCATTGCCCTTCTGTGGATCTCAAAAAGTAAATCACTTTTTCTGTGAAATTATAGCTGTTCTCAAACTTGCCTGTTCAGACACCCATGTCAATGAGATTATGGTTTTGGCTGGGGCTGTGTCTGTGCTTGTGGGACCATTTTCTTCGATTGTGGTCTCTTATGCTCATATTCTGTGTGCCATCCTGAAGATCCAGTCACGCCAGGGGCGCCAGAAAGCCTTCTCCACCTGTTCCTCCCATCTCTGTGTTGTTGGACTCTTTTATGGTACAGCCATTGCCATGTACATTGGGCCTCAACAGGAGAATTCCAATGAGCAGAAGAAATACCTCTTGCTATTCCATAGCCTTTTCAATCCTATGCTCAACCCACTGATCTATAGCTTGAGAAACAAAGATGTCAAAAGTGCTCTGAAGAGGATGCTCATAAAGAAGGATACCTCTCAGGAGCATTAA\n>KC494783.1 Ornebius sp. 10 BHW-2013 isolate REU1901 12S ribosomal RNA gene, partial sequence; mitochondrial\u0001KC494784.1 Ornebius sp. 
10 BHW-2013 isolate REU1902 12S ribosomal RNA gene, partial sequence; mitochondrial \nAATAAGTGTAAATATAAAAGGTTTAGGTAGTAGGAGTTAAGATCTTGAAACTTAAAGAATTTGGCGGTGTTTTATTCTGTTCAGAGGAATCTGTTTTGTAATCGATAGAACACGATTGAATAAACTTGAATTTATAATTTGTATATCGCCGTCATCAGATTATTTTGAATGGAGGAATTTAAATATTAAAATATTTATTAGGATAAAATGTCAGGTCAAGGTGCAGTTTATATTTAAGTATATAATGGATTACAATAAATGAAAATTTATTTGGATTATAAATATGATTATTTATACGAAATTGGATTTGAAAGTAAATTGGTTGAAATTAATAAATTGAATAAGCGCTGAAGCATGC\n>XM_015123435.2 PREDICTED: Macaca mulatta zinc finger protein 493 (LOC693611), transcript variant X2, mRNA \nTGTCCTCAGCGTGTGTGGCTTCATGACCCGAAGGTATTGGGAGATCCATAGCTAAGATGCCAGGACCCCCTGAAAGCCTAGAAATGGGAACTGATTTTCTGCTGTATTTTTCACCTGTGTCCCAAGCAGCGTCTTGGAACCCATCCCCCATTTCTCCAGCCTCACTCTGGCTTGCAGGGCCGTTGACATTTAGGGATGTGGCCATAGAATTCTCTCTGGAGGAGTGGCAATGCCTGGACACTGCTCAGCAAGATTTGTATAGGAAAGTGATGTTAGAGAACTACAGAAACCTGGTCTTGGGTATTGATGTCTCTAAGCCAAATCTGATCACCTGTCTGGAGCAAGGAAAATATCCCTGGAATATGAAGAGACACAGTATGGTAGTGAAACCCCCAGTTATATGTTCTCATTTTGCTGAAGACCTTTGCCCAGGGCCAGGCATTAAAGATTCTTTTCAAAAAGTGATACTGAGAGAATATGTAAAATGTGGACACAAGGATTTACAGTTAAGAAAAGGCTGTAAAAGTGTGAATGAGTGTAATGTGCACAAAGAAGGTTATAATGAACTAAACCTGTGTTTGACAACTACCCAGAGAAAAATACTTCAATGTGATAAATATGTGAAAGTCTTCCACAAATTTTTAAATTCAAATAGACATAACACAAAACATACTAGAAAGAAACCTTTCAAATGTAAAAAATGTGGCAAATCATTTTGCCTGCTTTTACACCTACATCAGCATAAAAGAATTCATATTAGAGAGAATTCTTACCAATGTGAAGAATGTGGCAAAGCGTTTATCTGGTTCTCAACCCTTACTAGACACAGGCGGGTTCATACTGGAAAGAAATCCTACAAATACGAAGAATGTGGCAAAGCTTTTAACCAGGACTCAAACCTTTCTACACATAAGAGAATTCATACTGGACAGAAATCCTACAAATGTGAAGAATGTGGCACAGCTTTCTACCAATTCTCACACCTTACTAGGCATAAGTTAATTCATACTGGAGAGAAACCCTACAAATGTGAAGAATGTGGCAAAGCTTTTAACCGATCTTCAACCCTTACTAGACATAAGATAATTCATACTGGAGAAAAACCCTATAAATGTGAAGAATGTGGCAAAGCCTTTAGTGTTTTCTCAACCCTTACTAAACATAAGATAATTCACACTGGAGAGAAACCCCACAGATGTGAAGAATATGGCAAAGCTTATAAGGAGTCCTCACACCTTACTACACATAAAAGAATTAATACTGGAGAGAAACCATACAAATGTGAAGAATGTGGCAAAACCTTTAGTATATTCTCAATCCTTACTAAACATAAGATAATTCATACAGAAGAGAAACCCTACAAATGTGAAGAATGTGGCAAAGCTTTTAAACGATCTTCAACCCTTACTAACCATAAGATAATTCATACTGAAGAGAAACCCTAC
AAATGTGAAGAATGTGGTAAAGCTTTTAAACAATCTTCAACCCTTACTATACATAAAATAATTCATACTGGAGAAAAACCCTACAAATGTGAAGAATGTGGCAAAGCTTTTAAGCGATCTTCAACCTTTACTATACATAAAATAATTCATACTGGAGAAAAACCCTACAAATGTGAAGAATGTGGCAAAGCTTTTAATCGGTCCTCACACCTTACTACACATAAGAGAATTCATACTGGACAGAAACCCTACAAATGTAAAGAATGTGGCAAATCCTTTAGTGAATTCTCAACACTTACTAAACATAAGATAATTCATACTGAAGAGAAACCCTACAAATGTGAAGAATGTGGCAAAGCTTTTAACCGATCTTCAATCCTTAGTATACATAAGAAAACTCATACTGGAGAAAAACCCTACAAATGTGAAGAATGTGGCAAAGCTTTTAAGCAGTCCTCACACCTCGCTGGGCATAAGCATGTTCATGGTGGACAGAAACCCTACAAATGTGAATTATGTGGCAAAGCCTTTAGTATATTCTCAACCCTTACTAAACATAAGATAATTCATACTGAAGAGAAACCCTACAAATGTGAAGAATGTGGCAAAACTTTCTACCGATTCTCAAACCTTAATACGCATAAGATAATTCATACTGGAAAGAAACCCTGCAAATGTGAAGAATGTGGCAAAGCTTTCAACCATTCCTCAAACCTTACTAAACATAAGCTAATTCATACTGGAGACAAACCCTACAAATGTGAACAATGTGGCAAAGCTTTTAGGCGGTCTTCACATCTTAGTAGACATAAGATAATTCATATTGGAATTCATACTGAAGAGATTCTACAAATGTGAAGAATGTGGCAAAAGCCTCTTCCCTTACTAAAGAATGTGGCAAAGCTTTTAATCAGAACTTCACCCTTACTACACATAAGATAATTCATGCTGGAGAGAAACCCTACAAATGTGAAGAATGTGGCAAAGATTTCTATT\n>XM_036871986.1 PREDICTED: Balaenoptera musculus vestigial like family member 2 (VGLL2), transcript variant X3, mRNA 
\nCTTCTATCTCGGAGCGCGGTGGCAGCTGGAATTGCAGGGGTGGGAAGGGAGCGTGCGAGCGGGATCCCGAGCCGCGGAGCACGCTGCCCCTCGCTCCGCCGCGGATGACTTGGGAGCTCGGGTCCAAGTGCCGCCCATGCAGCATCCCTGCCCTCCGCCGCCCGAGAGTTGATGATAAAACACTTAACCGTCTCCGCTGCGGGAAGCCATGAGCTGTCTGGATGTTATGTACCAAGTCTACGGTCCTCCCCAGCCTTACTTCGCAGCCGCCTACACCCCTTACCACCAGGGTCTGTCGGACTCCAGATTTCTTCCGAGCCCGGTGCTGGCGCGGGAAGATGCGAGCAAAGCTCACGCAGGGAAAACCAAAATTTGGTCCCAAAGAAACTAGCCTATTACTCCAAAATGCAGGAAGCCCAGGAGTGCAACGCCAGCCCCAGCAACAGCAGCGGCAGTGGCAGCTCCTTCTCCAGCCAAACTCCGGCTAGTATAAAAGAAGAAGAAGGCAGCCCGGAGAAAGAGCGCCCACCAGAGGCGGAGTACATCAACTCCCGCTGCGTCCTTTTCACCTATTTCCAGGGAGACATCAGCTCTGTGGTGGACGAGCACTTCAGCCGGGCCCTGAGCCAGCCTAGCAGCTATTCCCCAAGCTGTACAAGCAGCAAAGCCCCGCGGAGCTCTGGGCCCTGGCGGGACGGCTCCTTCCCGATGAGCCAGCGCAGCTTCCCCGCCTCCTTCTGGAACAGCGCTTACCAGACGCCGGTGCCCGCGCCACTGGGCAGCCCTCTGGCCGCCGCTCACTCGGAGCTGCCCTTCGCCGCTGCCGACCCCTACTCGCCGGCCGCGCTGCACGGCCACCTGCACCAGGGCGCGGCAGAGCCCTGGCACCACGCGCATCCCCACCACGCGCATCCGCACCACCCCTACGCGCTGGGCGGCGCCCTCGGCGCCCAGGCCGCCGCCTACCCGCGGCCCGCCGCCGTGCACGAGGTCTACGCGCCGCACTTCGACCCGCGCTACGGGCCGCTGCTGATGCCCGCCGCCTCGGGGCGCCCGGCCCGCCTCGCTCCCGCGCCGGCCCCCGCGCCAGGCAGCCCGCCCTGTGAGCTCTCGGCCAAGGGCGAGCCGGCCGGCGCCACGTGGGCCGCGCCCGGGGGACCTTTCGCGAGCCCCACGGGGGACGTGGCCGGGGGTCTGGGCCTCAGCGTGGACTCAGCTCGTCGTTATTCCCTCTGTGGTGCATCCCTCCTGAGCTGATCTGCTGACCCAGGGTTTCCCCTTCCCTTTCCCTTCTGACCAGCCATGGAGGCTGGCATCTGTGCCTCTCACTTCATGGATGAGGACATGGGGGAATGCAGAGACTTCAAACTTCTCCGTGTATTGGGAAAACCAGAACACACATCGACAGAATTTTCATCTAAAAATAATTCCTTCTGCCAAAAGAGGAAATCCAAAGACTCTGAATGATGCTTAATGACTTTTGGGCAAATCACTGGAAATATCCATGGTGATCACTTAGGTGACATGATTCATAGTTTTCTCGGAAAGAGGGAAAGAAAAAGAGATGTTTTGGTGTGAATATTTTTTATGCTGATGTGAATTATTTCATTAAGTAGTGTGATCATAGCACTGCAATGTCAATATCCTCAGACTGAAATGTATTTGTATTTGCATCAAAGACTGTGGTAGAGAAGTCAAAAGAAGCCAATTCCTTCTTCCTCACCTGTAGCCTCCAGCTCCTTTCCTGCCCACTCCCTCCCTACAACACCCACTCCAGACACAAAGACACACTTTCTTCTTCGGACTGTGAACGTGGAAGCCTCAGCCCGAATGTGAGCGGCAAGTGGCGAATCTGGAGCCACCTGCCCGAGTCTTACTGAAATGCAGCTGTTGTAGGACAACTGTTTAAAACTCCAGAAATACATCGACCAAAGGGGGCACTTCCCAGTGTTTGGCACAGCAATTGCAGTTGCACTGGATATGTTTTATACGTGTGTG
TGTGTGTATATATCATATTTTTTACAAAGAACATTTTATGATGAAAGAAGAAGCTCTCTCTGCCTTCTCTCCCACGAATTCTGTCCCTCCCTCTATCCTTCTTTGGGTGAAAAAAAGTAAGCATCAAGAGGCCCCAGTTGTCTCCAAGAAGAAGAACTAGGAGTCACCACAAGGGGAAGAGATGCCCATGGAGTCTCTGGTACCTCGAATATTCTTCTCAGTCTCTGTGGTCATGATTTGGTCACTTTAGTGTTGGGACAGGGGAAGGGGTACACATGTGGGCAAAACTGAAGGGGATGAGGAAGAAGAAACGAACATTAAAGATGTTTGTTTACCACTA\n>OV289143.1 uncultured Bacterium partial 16S rRNA gene \nGGACTACTGGGGTATCTAATCCTGTTTGCTCCCCACGCTTTCGCGCCTCAGCGTCAGTATCGATCCAGAAAGCCGCCTTCGCCTCTGGTGTTCTTCCTAATATCTACGAATTTCACCTCTACACTAGGAATTCCGCTTTCCTCTATCGATCTCTAGCCACCCAGTATTAAACGCAATTCCTAGGTTGAGCCTAGGGCTTTCACGTCTAACTTAAGTGGCCGCCTACGCGCCCTTTACGCCCAGTAATTCCGAACAACGCTAGCTCCATCCGTCTTACCGCGGCTGCTGGCAC\n>KT295441.1 Uncultured Klebsiella sp. clone M01598_122_000000000-ADV8A_1_1102_4097_6649 16S ribosomal RNA gene, partial sequence \nCCTACGGGCGGCTGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGCGGGGAGGAAGGCGTTAAGGTTAATAACCTTGTCGATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTCTGTCAAGTCGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTCGAAACTGGCAGGCTAAAGTCTTGTAGAGGGGGGTAGAATTCCGGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTAGTAGTC\n>XM_053381890.1 PREDICTED: Podarcis raffonei L3MBTL histone methyl-lysine binding protein 3 (LOC128410530), transcript variant X3, mRNA 
\nGCACAGCCTCTCGCCCAGGGGATGGGACCCGAGGTGGTGGGGGAAAGTGGCCCGGCGCCTGCGAAGTGGCTGGGGAGTGTGGGTCGGCCACGGGGGGTTCCTTCCCTAAAAAAGCCCCTAAGTGCGTGAGAGTGAAAGAGGAACAAAAGAGTGGGCGAGGGAGAGCCAGAGAGAGGTGCCTTCGGCGTCCGCGCCCCCCACCCCGCTCGCTTCTTCCCCAACATATGACGGTATATGCACCATGAATGAACCAACTTCTAGTGGAAGTGGGCAAGACTTTGATGTATTTAGTGTAATGGACTGGAAGGACGGAATTGGTACCTTGCCTGGAAGTGATCTGAAGTTTCGTGTGAATGAGTTTGGTGCCCTAGAAGTAATCACCGATGAAACAGAGATGGAAAGTGTTAAGAAGGCTACAGCTACCACAACCTGGATGGTGCCTACTGCTCAAGAAGCCTTCTCAGAAAATACAGAAGTACCACAAAAACTGAAGGAAGCTAGCAAGGTTGACGGGCCTCATTTCTGTGAACGTTGTTTTCATTCTGGAACCACAGTGGACTTTGTAGCTGGAGAAAGATCTTGCAGCCAAAAATGTGCACATCAGATTAAAAACAAAGAGCAAAGGGAGGACAACGATGTCTCGGAAGTCAATGATGAGGACTGTTCCAAGGGCACTCAAAAAAGAAAAACCAAATCGCCCTCAAAAGGAGAATGTATGGAAGACAATGTCAAGAAGTATGAGGCAATGGAGGAGAAACCTGAAGGGAGGATACTAAGAGTCTCTCAGAGAGCCACACGGAAAAGGAAAAGAGAGATGGCAGTTCTAAAACAGACTTTGATGTCAAAGGCAAAGAAAACATGGAGTTGGTCTTCGTATTTGGAAGAAGAAAAGGCTATAGCAGCACCACCTAAGATTTTTAAAGAGTATCAATCCTTCCCGTACAACAAAAATGGATTCAAAGTTGGAATGAAACTAGAAGGGGTGGACCCTGAGCACCAGTCAATGTATTGTGTGCTTACAGTAGCTGAGACTTGTGGTTACAGAATTAGACTTCACTTTGATGAATACCCAGAGTGTTACGATTTTTGGCGGAATGCTGATTCTTCTGATATTCACCCAGTTGGTTGGTGCGAGAAAACAGGACACAAACTTCATCCACCAAAAGGATATAAAGAAGATGAATTTAATTGGTCCTCGTATCTGAAGAAATGTAAGGCTCAAGCTGCTCCTAAATCCTTGTTTGAAAACCAAAACTCAACGGTGATTCCATCAGGGTTTCGAGTGGGGATGAAGCTTGAAGCAGTAGACAAAAAGAACCCTGCATTCATATGTGTTGCTACAGTAACTGACATTGTGGACAGTCGTTTTCTGGTTCATTTTGACAACTGGGATGAGAGTTATGACTACTGGTGTGAAGCGGCTAGTCCACATATTCATCCAGTTGGCTGGTGTAAAGAGCACAGAAAGACCCTTGTAACCCCTCGAGACTATCCACATGCCAAGCATTTTTCTTGGGAGAAATATTTGGAAGAAACTAGTTCTTTACCAGCACCTGCCAGGGCTTTTAAAGTGAAGTCTCAGCTGGACCAAAGAGCTTTTCAGCAGTGGAAGGACACAATTGCATACAACACAAAGTCATTAACAAAGAAACCTTCTCATGGATTCCAGAAGAATATGAAACTTGAAGTAGTTGACAAGAGAAATCCTGTACTAATCAGGGTCGCAACCGTGGTAGATACTGATGACCACAGAATTAAAGTCCACTTCGATGGCTGGGATAGTATTTATGATTATTGGATCGATGCAGATAGCCCTGATATCCATCCTGCTGGCTGGTGTGGGAAAACTGGACATCCTCTTCAGCCCCCACTTAGTCCTTTGGAATTGGTAGAAGCTTTAGAACAAGGAGGATGTCCTACAGTGGGCTGCAAAGGAGTTGGACACATAAAAAGAGCCAGACATACGGGCCACCACAGTGCTCTCAGCTGCCCATATTC
TGAGATAAATCTGAGCAAAGAACATATCCTTTCAGACCGCTTAAGTGGAGAGATGCCTCAGAGTATTCCGCCTCTGCATTGGAACCGGAAGCCAGAAGCAAATGAAAGATCTGCATCTCCTGTAATCAGTAATAGAAAATGTCCCAGTCCCATTGTCCTAAAATCTTCAGCTCATCTCCATTCATCAAAGCAGGAAGACACAGAGGTGAAACCTCTTTGCAAAAAGCCTCTAATGTTTGATGTCAAAGAAAAGAACTACAGGGGATGCCAGGCAACTAAGGATTTTGCAAAGAAAGATGGCTGTGCAGGCAGGAAGATGGAAAATGAAGAGTCATCTCTAAATGAATCCAAAGACACCAAGGAATCCAGTAACAGGAGTTCCCATCCTCAGCCAGTTATTTTGACCTCGAAGTTGACAATCCCAGCCTTTCCATTGCGATGGGAACAGCAGAGTAAACTCCTTCCTACTGTGGCTGGAATCCCTGCCAGTAAAGTTTCCAAGTGGAGCACAGATGAGGTGTCAGAATTCATACGGAGTTTGCCAGGCTGTGAGGAACATGGCAAGGTGTTCAAAGACGAACAAATTGATGGAGAAGCTTTCCTTCTAATGACCCAAACAGATATAGTAAAAATAATGAGCATTAAGCTAGGACCAGCCCTAAAGATCTTCAACTCAATCCTGATGTTCAAGGCTGCCGATAAGAACTCGCACAATGAACTCTGATGGAAAAGTGACTACAGGGCAGCTCTCTCCATTGCAGCTCATGTTTTATTCAAAGCACAAAGACTCCAAAGGATCATCAAGGAGGAACTCTATAAGGCGAAAAATCAGAGTGGATGGAGTGTTGATTTTCTCCAAGAGCCTGAGCAAACTAACACTTCTGGGAAGTGCTTAAGCTTTTTAGTAAGATGCTCTTACAAAAGAGTGGGTACTTGATGTTTACTGGCTGATGGCTCTAATTTTCCCACAACTAGCCATCCTTAATTTTATCGGGGATCCATTAACTAAGTTAACATACTAAAATTATGGAAATAATATCCTTTTCTAAGGATACACAAAATACACACTTCATGAATTTACTTCTTCACCAATGAATTCCTTTGTATCGTTTCATCATTTTCATTAAAAAAAAAATTGTTCGCAGTTTAAAATAAGTGGACTACAGTTAATGAAGACTGTTAACAAGTCGTCTTAGTTTCACACAGCAGCTCAAATTTAACACTTTGCTGTGTACAATGAAGCTGATCGATTTATTCTGTTGTATGAAAACATTGCTGGAGACCAATGCTATGTTTTTTTGTTTTTGTTTTTTTGCATGATTAAAGAAGTTTAATGAATATTTCCACCAGCATA\n>XM_027574246.1 PREDICTED: Zalophus californianus family with sequence similarity 71 member F1 (FAM71F1), transcript variant X2, mRNA 
\nGGCAAACTTGCAGCAGGCCCCTGAGCATGTGCGGAAATGTTGTCATCAGTTCCACAGAGAAAGACTCGGTGGAAATCAAAGAAGACAGTAAAAGTCACAAGATCTTTTCCAACCTTCCCTTCCCTGAATGCCTGGGAAGAAGTCAGGGGCCTCTTGCCTGTGGATGGGGAGCCAAACCCTGGAGTGGGCCTGGGTGTGGAGGAGGGACTGCTCTGCCAGATTCTTCATTCTCCAGAATTCAACCTATTTCCTGACTCAGTGGTGTTTGAAAGCAACTTTGTCCAGGTCAGAAAGGGCAGGGACTGGATAGACATCTACAAGGCCTCCAACACCATGGCCCTTGGGGTAACCTCCTCCGTGCCCTGCCTGCCCCTTCCCAATATCCTCCTCATGGCTAATGTCAAATGGCACCAGGGACAGAGCCAGACATGGAACAGACCATCTATGGCCCCAAACATCAAGCTGAAGAGGATCCTCCCATTGAAGTTTGTGGAGTTCCAGGTCTGTGACCGGCTTCAACGCATCCTGCGTTTGAGGACAGTCACTGAGAAGATCTACTACCTAAGGCTCCACCCTGACCATCCTAGGACTGTCTTCCACTTCTGGATCCGACTGGTTCAAATTCTGCATAAGGGCCTGTCCATCACCACCAAGGACCCTAGGATTCTTGTCACTCACTGTCTGGTACCCAAGAACAGCTGCAGCCCCTCGGGAGACTCTAACTCGGTAGAGAAGAAACCCCAAGCCTCCCAGCCCAGCGAGAGCCTCATGCAGCTGATGGCCAAGGGGGAGAGTGAGGCGCTCTCTCAGATTTTTGCCGACCTGCACCAGCACAATGAGTTCAGGAGCAGCAAAAAGACACAGACCAAAAGGGACAGCTCAGAGAAAGATACTCACAGTGAAGACGGCATCCCTTGCACCCGCGACCTCAGTTGGAGAGATTCGCTCACTTATGGAGAGTGGGAAAGAGAGAACCCCTCTGGGCCACAGCCCCTTTCACTCCTCAGCACCCTGGCAGCCTCCACGGGGCCACAGCTGGCCCCACTCATATAGGAAATTCTATTTAAACTACCTTTTCGCACTGGGGAGAATCTATGCAGCCCTCGCCAACGCCACTCTGCAGCATGCAGCTTTCTGAGGGACTCTGTCTGGATGTAGGGGAGAAGAAAGCTACAACTAAGGAAAAACTAGACTCATCTCATGCTGATAGCATAGCCTTTCCTTGGAGAACCACCTGGGAGCATGGCTCCGGGTAAGAGCATTATTCCAGCATCATGCCAGTACGTAACTCCGGATCCGTGCCACTACCCATCACACCTTGCCTCCGTTAACCACCACCAGGGCAGGCACAAGAAGATGTGCTCTCAGAAGGGCCACGGACAAGAGATGGAGAGAAGGAAGGAAAGGGAAGCAGGACCGGAGGAGAGGGGGACGAGAACAAAATGGCGGTGAAGAGCAGGTGGAGGGAGAAAGTCAGAGAAGAAGGGGGATCTTACAGAGAGGTGGTAAGAAAACAGAAGGGACCTGAATGAGAAGCTGAAAAGGACAAGAGAAGAAATACACCACTGAGAGATGCCTCACGAAGCTTCTATTTATCTAATTTAAAACTTGAAAGTAAGGCCATATACCCAAACAAATGTGTTTTCTTCTCTGTGCCAATTATTCTGGATAACTATGAGGGGCTAAAAACTAATTCCAGCCAAGGGCCTCTCCTGAAGT\n>KM481143.1 Uncultured bacterium clone 2010ECS-StD#1958 16S ribosomal RNA gene, partial sequence 
\nGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCAGGGCTTAAATGTAAGTTGCATGGATCAGAGATGGTCCTTTCTTCGGACTACTTACAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCAGGTTAAGTCCTATAACGAGCGCAACCCCTATTGTTAGTTGCCAGCGGGTCAAGCCGGGTACTCTAGCGAGACTGCCGGTGCAAACCGAGAGGAAGGTGGGGACGACGTCAAATCATCACGGCCCTTACGTCCTGGCTACACACGTGCTACAATGGCCGGTACAGAGAGCAGCCACCCCGCGAGGGGGCGCG\n>KP968504.1 Sarocladium sp. strain LA-MB10 18S ribosomal RNA gene, partial sequence \nTCTTTGTTTGTGTGTGTCTGTCCTACTCCAGGTTTCCTCTCTAATTGGGACCACGTGTGTGTCTCCGGGTTATATCTGGGCAAAACCCCCCCCTCCACCAGGGGTTGGGAGGTGGTTATCTATCCAACCCAATCCGGGGCCGTTCGGGGTTGTTTGTGATTCATGAAACTAATAGAATCGCCCGCCCTGGCCCTGCGGTGGATCATTCCACTTACTACCTTATCAACTTTCGATGTTGGCTATTGCCAATCATGGTGCAACGGGTAACGGAGGGTTAGGGCTCGACCCCGGAGAAGGAGCCTGAGAAACGGCTACTACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCCGACTCGGGGAGGTAGTGACAATAAATACTGATACAGGGCCCTTTCGGGCCTTGTAATTGGAATGAGTACAATTTAAATCCCTTAACGAGGAACAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGAACCTTGGGCCTGGCTGGCCGGTCCGCCTCACCGCGTGCACTGGTCCGGCCGGGCCTTTCCCTCTGTGGAACCCCATACCCTTCACTGGGCGTGGCGGGGAAACAGGACATTTACTTTGAAAAAATTAGAGTGCTCCAGGCAGGCCTATGCTCGAATACATTAGCATGGAATAATAAAATAGGACGCGCGGTTCTATTTTGTTGGTTTATAGGACCGCCGTAATGATTAATAGGGACAGTCGGGGGCATCAGTATTCAACTGTCAGAGGTGAAATTCTTGGATCAGTTGAAGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAGGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGGGATCGGACGGTGTTATTCATGACCCGTTCGGCACCTTACGAGAAATCAAAGTGCTTGGGCTCCAGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGAAATTGAC\n>JF420835.1 Centroptilum triangulifer heat shock protein 70 mRNA, partial cds 
\nTCGAGGCAGACAGATCCTCTTGAGCACATTTCCTCTTTTTCATCTGCAATCATCCGCTAAAGAAATGGCAAAGCCGGGCCCCGCAGTCGGTATCGATCTTGGAACCACCTACTCCTGCGTTGGAGTTTTCCAGCACGGAAAGGTGGAAATTATTGCCAATGACCAGGGCAACAGAACAACCCCTAGCTACGTGGCTTTCACTGACACCGAGCGTCTCATTGGAGATGCCGCCAAGAACCAAGTGGCCATGAATCCTAGCAACACCATCTTTGATGCTAAGCGTTTGATCGGGCGCAAGTTTGAAGATGCTACAGTGCAAGCCGACATGAAGCACTGGCCATTCACAGTCATTAGCGAGGATGGCAAGCCCAAACTGCAGGTGGAATATAAGGGAGAGACCAAGGCCTTTTTCCCTGAGGAAGTCAGTTCGATGGTGCTCATCAAGATGAAAGAGACCGCCGAGGCCTACCTGGGCAAGACTGTCAACAATGCCGTCATCACCGTGCCGGCTTACTTCAACGATAGCCAGCGCCAGGCCACCAAGGACTCGGGCACCATCGCTGGACTGAACGTGCTCAGGATCATCAACGAGCCCACTGCGGCTGCCATCGCCTATGGTCTAGACAAGAAAGGCCAGGGTGAGAGGCATGTCCTCATCTTTGACTTGGGTGGCGGCACCTTTGATGTGTCCATCCTGACCATTGAGGATGGAATCTTCGAGGTCAAGTCCACTGCTGGAGACACCCATCTTGGAGGTGAGGACTTTGACAACCGCATGGTCAACCACTTTGTGCAGGAGTTCAAGCGCAAGTACAAGAAGGACCTGACCACCAACAAGCGTGCCTTGAGGCGTCTCAGGACGGCGTGCGAGAGGGCAAAGAGGACCCTCTCTTCGTCCACTCAGGCCTCCATAGAGATTGACTCTCTCTTTGAGGGCATCGATTTCTACACTTCCATCACCAGGGCTCGTTTTGAGGAGCTCTGCGCTGATCTCTTCAGGTCCACCCTTGAGCCCGTTGAGAAGTCCCTGAGGGATGCTAAGATGGACAAGGCCCAGATCAATGATATTGTTCTTGTCGGAGGTTCTACCCGTATTCCCAAGATCCAGAAGCTCCTGCAGGACTTCTTCAATGGCAAGGAGCTCAACAAGTCCATCAACCCTGATGAGGCTGTTGCCTATGGAGCAGCTGTCCAGGCTGCTATCTTGGCTGGAGACAAGTCTGAGGCTGTCCAGGACCTTCTCCTGTTGGACGTCACTCCCCTTAGCTTGGGTATCGAGACTGCTGGTGGTGTGATGACCACCCTTATCAAGAGAAACACCACCATTCCCACCAAGCAGACCCAGACCTTCACCACCTACTCAGACAATCAACCTGGAGTGCTCATTCAGGTCTATGAGGGCGAGCGTGCCATGACCAAGGACAACAACATTTTGGGCAAGTTCGAGCTTGCGGGCATCCCTCCTGCTCCCCGTGGTGTGCCCCAGATTGAGGTCACCTTTGACATTGACGCCAACGGCATCTTGAACGTCTCTGCAATTGAAAAGTCTACCAACAAAGAAAACAAGATCACCATCACCAATGACAAGGGTCGCTTGTCTAAGGAGGAGATTGAGCGTATGGTCAACGACGCAGAGAAGTACAAGGCCGAGGATGAGAAGCAGCGCACCGTCATTGCTTCCAAGAACAGCCTCGAGTCCTATTGCTTCAACATGAAGTCAACCATGGAAGGTGAGAAGCTGAAGGACAAGATCCCCGAGGAAGACAAGAAAATTATCATGGACAAGTGTAACGAGGTGATCCGTTGGATGGACTCGAACCAGCTGGCTGACAAGGAGGAGTTCGAACATAAGCAAAAGGAGCTTGAAGGCGTCTGCAACCCCATCATCACCAAGCTGTACCAGAGCGGT\n>MF207496.1 Uncultured bacterium clone denovo1205_590_10496 16S ribosomal RNA gene, 
partial sequence \nGTTCCTACGGGGCGCAGCAGTGGGGGATATTGGACAATGGGGGGAACCCTGATCCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAAGCTCTGTCAGCAGGGAAGAAAGCAATGACGGTACCTGACCAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGGAGGATGCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGTAGGCGGACAGTCAAGTCAGCGGTAAAAATGCGGTGCTCAACGCCGTACAGCCGTTGAAACTGGCAGTCTTGGGTGGGCGAGA\n>XM_015122060.2 PREDICTED: Macaca mulatta SMG7 nonsense mediated mRNA decay factor (SMG7), transcript variant X2, mRNA \nAACTTGGAGGTCTGCCTTTAATAATCAAGCAGGATCCCCACTGCGGGTGCCTATCAGAGTTATGGCGATAGTCAGCCTTCCGGTTAGTCCCCGACTTAAATGATAGAAAACACGTGTTACCCTTCTAGGATGCATTCCTACCCTCACCCTGGCCTCGCAGCAGGATCGCGACAGCTAGGTCAGGAGGGAGTACGCGGGTGGGGTGGATTTGGGGGAGGGGTTGACTCGCCAAAAGTCGGCTATCCCCGTCGGCAGGGGAGGCATCACGGCTGTCGTGTGCCGCTCTCCTCCCTCAGGGACCCCGTTCAGGCGGGATCCCGCCTCCCAGAGCCCAAGGCAGTTGTGGGGAAACCCCTTGCCCTTCCTCGCCGCTTGGCACTGCCGCCTCGCTCTCCCGACTCCAGCCCGCCGCCCGCCAGCCTCCAGGCCATGCATCTTCTTCGCAGGCCCAGCCCTCTCCACGCCCGGCTCTGAGAGGAAACTATGGAGGTGGTTCCCGCCTGCAGGCGGGTGGAAAAGCCCATGGTGAATGTCTCGGGGTGTCCCCCCAGTTGCTGTGAGAAGTGGGAAGGGAGGAGGAAGTGGACTTCACCACCGGGGAGAACTACCTCTATTCCTAACTTGGGGGAGGCCTTTAGATGGAAGGGATGCCAACGGGGAACCCTGGGCGGTTTCCAGGGAATCCATTGGCCAAGGGGAGGGTCACCCTGTCTGCACACACTGGTTACTATGACAATACAACCACAGCCTCCAGTTGCCATGGCAGCTGTCTATCCAATCCGATTCTTTTCTTTTCTCTTCCTCTCCGGGCCCCACCTTATCCCCTCCAAGAGTCTCCCAGCGTGCATGGGGAGGGGCTGCAGAGAAGAGGAAAGGGGGTCCTTCGAGTCACTCTCTACGCGCGAGAGAAGACAAGAGTCGAGGGACTGCTGGGAGGAACTGTAGGAGGAAGGGGCGGCGTTTCCGGTGGGGAAGAGTGGAGGCGTGCAAAAAGGAAGAGAGAAATCCGCTGGAGTGATAAGAAGGGGGAAGACTTTGAGTGTAACTCCCGGTTCTTTGGGCCTCGGTGTTCTTGGTGGGGTTGGGATTGCCCCCTTGCGCGGGAGGAGAAGGGTGGATTGGCAGGAAGCCTCCAAGCGCCACCAGCCGGTAGCTCAGAAGCCGCACACGCGCCACACAGCTTGTTGATCCCAAAAGGGAGCGCTACAGAGAAGCGGAAATCACCGGGAGAGACAGGCGCTGCTGAAATCTCGCGAGAGGGAGCCCCCCTCGTAGCCGACTTCCTTCCTCTGCTTCTCCTCTTTCCCCCGCCCCTCCTCCCTCCTCCTCCCCCCCTGGGTCGGAGTGTCCCTGCGCCCCACGGGCCGGAGCAGCAGCGAAAGCAGCTTTCCCCGCTCCCTCCCCCTCGCCTCATTCACCCCCACCCCCTTGCCGAGCGAGGAGGAGCCGGAGGAGAGGAAGATGGCGGCGGCCGCCAGCACCCGCGGTGCCGCGGGGCCGCTCCGAGGAGCCTGAGAGACCCACGGAGGCTTCGCGGGAAGACGCGGCGGCGG
AGGATGAGCCTGCAGAGCGCGCAGTACCTCCGGCAGGCAGAAGTCCTGAAGGCTGACATGACAGATTCTAAGCTGGGTCCAGCTGAAGTCTGGACATCCAGGCAGGCTCTGCAGGACCTGTACCAGAAAATGCTAGTTACTGATTTGGAATACGCTTTAGACAAGAAAGTAGAACAGGATCTCTGGAATCACGCCTTTAAGAATCAGATCACAACACTACAAGGCCAGGCAAAGAATCGAGCAAATCCGAATCGAAGTGAAGTTCAGGCAAACCTTTCTCTGTTCCTAGAGGCAGCTAGTGGCTTCTATACCCAGTTATTACAAGAACTGTGTACAGTATTTAATGTAGATTTACCATGCCGTGTGAAGTCTTCCCAGTTGGGAATTATCAGCAATAAACAGACGCATACCAGCGCCATAGTGAAGCCACAGTCTAGCTCCTGTTCCTATATCTGCCAGCACTGCCTCGTCCACCTTGGAGACATTGCTCGATACAGAAACCAGACCAGCCAGGCAGAGTCCTACTATAGGCATGCAGCTCAGCTTGTCCCCTCCAATGGTCAGCCTTATAATCAGTTGGCTATCTTAGCTTCTTCCAAAGGAGACCATCTGACCACAATTTTCTACTACTGCAGAAGCATTGCTGTGAAGTTCCCTTTCCCAGCTGCCTCCACTAATCTGCAAAAAGCACTTTCTAAAGCACTGGAAAGCCGAGATGAGGTGAAAACCAAGTGGGGTGTTTCTGACTTCATCAAGGCCTTTATTAAATTCCACGGTCATGTGTACCTGAGTAAGAGCTTGGAAAAGTTGAGCCCTCTTCGAGAAAAATTGGAAGAACAGTTTAAGAGGCTGCTATTCCAAAAAGCTTTCAACTCTCAGCAGTTAGTTCATGTCACTGTCATTAACCTGTTTCAACTTCATCACCTTCGTGACTTTAGCAATGAAACTGAGCAGCACAGTTATAGCCAAGATGAGCAGCTATGTTGGACACAGTTGCTGGCCCTCTTTATGTCTTTTCTTGGCATCCTGTGCAAGTGTCCTCTACAGAATGAGTCTCAGGAGGAGTCCTACAATGCCTATCCTCTTCCAGCAGTCAAGGTCTCCATGGACTGGCTAAGACTCAGACCCAGGGTCTTTCAGGAGGCAGTGGTGGATGAAAGACAGTACATTTGGCCCTGGTTGATTTCTCTTCTGAATAGTTTCCATCCCCATGAAGAGGACCTCTCAAGTACTAGTGCAACACCACTTCCAGAGGAGTTTGAATTACAAGGATTCTTGGCATTGAGACCTTCTTTCAGGAACTTGGATTTTTCCAAAGGTCACCAGGGTATTACAGGAGACAAAGAAGGCCAGCAACGACGATTACGACAGCAGCGCTTGATTGCTATAGGCAAATGGATTGCTGATAATCAGCCAAGGCTGATTCAGTGTGAAAATGAGGTAGGGAAATTGTTGTTTATCACAGAAATCCCAGAATTAATACTGGAAGACCCCAGTGAAGCCAAAGAGAACCTCATTCTGCAAGAAACATCTGTAATAGAGTCGCTGGCTGCAGATGGGAGCCCAGGGCTAAAATCAGTGCTATCTACAAGCCGAAATTTAAGCAACAACTGTGACACAGGAGAGAAGCCAGTGGTTACCTTCAAAGAAAACATTAAGCCACGAGAAGTGAACAGAGACCAAGGAAGAAGTTTTCCTCCCAAAGAGGTAAAATCCCAGACAGAACTAAGAAAGACTCCAGTGTCTGAAGCCAGAAAAACACCTGTAACTCAAACCCCAACTCAAGCAAGTAACTCCCAGTTCATCCCCATTCATCACCCTGGAGCCTTCCCTCCTCTTCCCAGCAGGCCAGGGTTTCCACCACCAACATATGTTATCCCCCCTCCTGTGGCATTTTCTATGGGCTCAGGTTACACCTTCCCAGCTGGTGTTTCTGTCCCAGGAACCTTTCTTCAGCCTACAGCTCACTCTCCAGCAGGAAACCAGGTGCAAGCTGGGAA
ACAGTCCCACATTCCTTACAGCCAGCAACGGCCCTCTGGACCAGGGCCAATGAACCAGGGACCTCAACAATCACAGCCACCTTCCCAGCAACCCCTTACATCTTTACCAGCTCAGCCAACAGCACAGTCTACAAGCCAGTTGCAGGTTCAAGCTCTAACTCAGCAACAACAGTCCCCTACAAAAGCTGTGCCGGCTTTGGGGAAAAGCCCGCCTCACCACTCTGGATTCCAGCAGTATCAACAGGCAGATGCCTCCAAACAGCTGTGGAATCCCCCTCAGGTTCAAGGCCCATTAGGGAAAATTATGCCTGTGAAACAGCCCTACTACCTTCAGACCCAAGACCCCATAAAACTGTTTGAGCCGTCATTGCAACCTCCTGTAATGCAGCAGCAGCCTCTAGAAAAAAAAATGAAGCCTTTTCCCATGGAGCCATATAACCATAATCCCTCAGAAGTCAAGGTCCCAGAATTCTACTGGGATTCTTCCTACAGCATGGCTGATAACAGATCTGTAATGGCACAGCAAGCAAATATAGACCGCAGGGGCAAACGGTCACCAGGAGTCTTCCGTCCAGAGCAGGATCCTGTACCCAGGATGCCATTTGAGGACCCCAAGAGCTCCCCTCTGCTTCCTCCGGACCTGTTAAAGAGTCTGGCTGCCTTGGAGGAAGAGGAAGAGCTGATTTTTTCTAACCCTCCTGATCTTTACCCGGCTCTGCTGGGGCCTCTCGCCTCTCTTCCTGGACGAAGCCTTTTTAAATCCTTATTGGAGAAGCCCTCAGAGCTCATGTCACATTCATCCTCTTTCCTGTCCCTCACCGGATTCTCTCTCAATCAGGAAAGATACCCAAATAATAGTATGTTCAATGAGGTATATGGGAAAAACCTGACATCCAGCTCCAAAGCAGAACTCAATCCCTCAATGGCCCCCCAGGAAACATCTCTGTATTCCCTTTTTGAAGGGACTCCGTGGTCTCCATCACTTCCTGCCAGTTCAGATCATTCAACACCAGCCAGCCAGTCTCCTCATTCCTCTAACCCAAGCAGCCTGCCCAGTTCTCCTCCAACACACAACCATAATTCTGTTCCATTCTCCAATTTTGGACCCATTGGGACTCCAGATAACAGGGATAGAAGGACTGCAGATCGGTGGAAAACTGATAAGCCAGCCATGGGTGGGTTTGGCATTGATTACCTCTCAGCGACGTCATCCTCTGAGAGCAGTTGGCATCAGGCCAGCACTCCGAGTGGCACCTGGACAGGCCATGGCCCCTCCATGGAGGATTCCTCTGCTGTCCTCATGGAAAGCCTAAAGTCTATCTGGTCCAGTTCCATGATGCATCCTGGACCTTCCGCTCTGGAGCAGCTGTTAATGCAGCAGAAGCAGAAACAGCAACGGGGACAAGGCACCATGAACCCTCCACACTGAGGCCAAAGTGACAACCTGGGAATGAAGGCTCCATAAACCATGGCATGTTGGGTTTGCAGGACTGGCCCACACAGTCCCCTGCAGGTGGCAGCCCTCTTTTCTGTTTCTTGCTGTCAAGAGGGTGTAAGTATTCCACCAGCCCGCTGAGTGTGCACGAAATGTTCGCAGTGCAACAAAAAGAAAAATCCATCAGGAACTCTCCATCCCCCCGGGGCCTTCCGGAGGGAGAGAGAGAGGAACTGCTGTTTATCTCACTCAGTTACTTGGTATCACCGCCTCTCACCTTCTCCATCGTGCATGTCCCCAGCCACATGGGAAGTGAAAGCTGAGAAGGGAAGGCAGATGGGAGAAGCCAATGGGAACTTCTCAGTCCTTTTTCCCTCTTTGGGGAATAAAATAGGAATCCATTAATGGTTGCTTTGCTGACTGA\n>XM_048567351.1 PREDICTED: Pyrus x bretschneideri alcohol dehydrogenase 1-like (LOC125469685), mRNA 
\nATACGATTCACTTTCAAGATGCCTTAATTCATCAAAGTGTTCTAGAGAGAGAGAGAGAGACTCATCTTCTCTCTCCTAAGAATAAGTTAACAGAGAGTCCCGTGGAGTAGTTATTGGAGGCCATTTTTTCTCAACATCCTCCCAAAAATAGGCAAAGAATTGCTCTTGACCTTTGATATTATATTTCACCATCTGTGTTTGCCAATTGGCATTTTCATCTTTCTTTTTTCTTTCTAAGTAGAACACTGTGAATTACACACCATGCACAAAATGCATAAGAGTTTTAGAACATTGGTGCACAATGACCATTTCTTGAAGCTCCTAAATAACCAAAAATCTAGGTTCCTCAGACCGGAACTTTACAGCACTTCGGCTCATGCTGGCCGTGCGATCACCAGCAAAGCGGCTGTTGCTTGGGAAGCAGGGAAGCCCTTGGTGATAGAGAAGGTGGATGTTGCTCCACCGCAAGCCAATGAAGTTAGGGTCCAAATCAAATACACCTCTCTTTGTCACACTGATATCTACTTCTGGGAAGCTAAGGGCCAGACACCATTGTTCCCTAGGATTTTCGGACACGAAGCAGCTGGCGTCGTTGAGAGTGTTGGTGAAGGCGTTAAGAACCTCAAGCCGGGGGATCATGTGCTTCCAGTTTTCACTGGGGAATGTGGGGATTGTCCACATTGCAAGTCTGAGGAAAGCAACATGTGTGAGCTGCTGAGAATCAATTGCGATAGAGGAGTCATGATTGGTGACGGGAAAGCAAGGTTTTCGCAGAATGGGACTCCGATTAATCACTTTCTCGGCACATCCACGTTTAGCGAGTACACAGTTATCCACGAAGGCTGCCTTGCCAAGATCGACCCAAAGGCACCATTGGATAAAGTCTGCATCCTCAGTTGTGGTGTGTCGACTGGCTTAGGTGCCACTCTGAAAGTAGCAAAACCAAAGAAGGGTTCTTCAGTTGCTATCTTTGGACTTGGAGCTGTTGGCCTCGCTGCTGCAGAAGGTGCAAGGATTTCTGGGGCATCAAGGATTATTGGGGTAGACTTGAATCCCCATAGATTTGAGCAAGCCAAGAACTTCGGAGTAAACGAGTTTGTGAACCCGAAAGACCATAACAAGCCAGTGCAGGAGGTTATCGCTGAGATGACGGATGGTGGAGTTGACAGAAGCTTAGAGTGCACCGGGAACATTAATTCGATGATCTCCGCTTTCGAATGTGTTCATGATGGGTGGGGTGTAGCGGTGCTTGTAGGAGTGCCAACCAAAGATGCAATCTTCAAGACAAACCCCATGAAAGTACTTGATGAAAGAACCCTCAAAGGAACATTTTTCGGCAACTACAAGCCTCGGAGCGACCTTCCCTCTCTCGTGGACATGTACATGAACAAGAAACTGGAAGTAGAGAAGTTTATAACGCATCGACTTCCTTTCTCGGAGATCAACAGAGCTTTTGACCTAATGTTGAAGGGGGAAGGCTTGCGGTGCGTCATTAGCATGGAAGAGTAGGATTAATGTCCAAATTCATATACGA\n>XM_039052777.1 Cantharellus anzutake uncharacterized protein (EI90DRAFT_2259046), mRNA 
\nGAAGTGGGTATAATGTACTTGACCCATGGTTTGAGAGAACCATGAACTGTCGGAAGTGATGTCCAACAGTGTTCAGTACCCCATAACTGCGTGCAGAGAGACCGAAAACGACTCGGGAGAAGCGCTTAAGCAACAAAGCGGTAATCGAAGTGTTGCAGGCACCAAGAAGGGCATGTAACTTAGGTATTTCAGGGCCTAGAGTCCACATATTCGTAACCGGAATGACACCGCTAAGGTATGATATCCCCATCACATTCGCGTCTGCTGGAGTGCTCCATTGACGAGATAGACAACGTGTCTCCAGTATCGCTCAGGTCCGTCTATCCATGCCGTCGCCCCAACACCCCACCAGGAAGGGGAAGAGGAAACACAACGGTTTGGAGGCCGTGGAAATTACCAACGGGCCTGCATGAAGCACGAAGTAGCCCAATGTGCGATTCCAAGCATTTCTCAGTTGGTGTATTCCCAGATCCATGTGATCTTGCCGAACAGGCTGACGAAAAGAGCGCAGTTAGAGCGCACTACCACCGCGGTCCCTCGCCTCTTGAGCCCAAGGAGGAGGCGATTTGTAAAGTCCGTGCACGGCATATGATCTCACCCCGGATGCTCGCAGGCATTGTAACATCCCAAGGTAAAGAAGACTCCCGACCCCGGACATCCGGCACTGACCAGGGAAGCCTGCAAGATGTAGCCCTGATCGCCAGCAGGGGGGTTTTATAACCTCCAGAGTTCGGTCCCACCCCCAATCGACGC\n>XM_046171703.1 Alternaria rosae uncharacterized protein (BKA58DRAFT_402161), partial mRNA \nATGAATCAGAAACACGTTCCAGTCACTTCAACGCAACTACACACTTTCAACTGCGAGGTCTCAGGTGCGGCTCAGAAAGACATTTACCAAAACGACAGCAAACATCCCATCGGCTTCAACACTCAACATTCAAAACGCCATGGCAGCCTTCCATGGACCCTCAACCACTCCATTAAGCGAGCTGAACTCCTCAGAGTCTGGCAAAGTCGTTTCATCGAGCGATTCGAGAGCGTGAAGCAGCTGACCGTGGGGAACCTCGCTGCACTGCAGGCTGGTTACAATGACGTACAATCTCAGCCTACATCACCTCTAGACGGCGAGTTGCACCTCAGACCGTCTCCCGGTGCAACGGCATCTCTCATCAAACGTAAGCCGCTGCCAGATACAGCGCAAAAAGCAATCATAGAGATGAGAAATGAGACCGATGTAGAGTCGTTTGGAAACAGCGGAGATGAAGCTTCCCATCAAAACCACACACTTGCGCATCCAACGCACGGCCGCAGGCCGTCTTTCCATCGCACGAATACCGTGTTCACGGATTTCTTGCCTTACAACCAGGTGCGAACCTGGCAACAGGTTGATAATGAGGAATATCAAGACCGTTGTAGGCATTCCTTATCAGCTATTGCGTTGGATAGAATGAAAAAGCTCAATCTAGACCGCGATACACTATCGGCTCAAAGGAAGAAGACTGCAAATCAGTTGAAGAAAGTGATCGAACAGCACATACTTGACAAGGAGAAGTCAATTTCATAG\n>XM_004366041.1 Dictyostelium fasciculatum hypothetical protein (DFA_12355) mRNA, complete cds 
\nATGGAGGATCAGAGCAGTCCATTTCTTGTCGATACAAAAGATACAACAACGACAGATACAACTCAACAACAACAACAACAACAAGAACATGTTCAACAACAAACAGCAGGTCAACTTGACGATAGAGTTGATCAAGAAGAATCGATAACTATGGGTGATGATCAAAATATATCAAGACAACAACGACAAAGAAGACTACTGTTGGTGAGCAAACCAAGTGCATTCTCGGTTGGTTATGAAAGAATAATGAAAAGATACTTTAAAGATTATGAATCATTGATGAAAGAGCATTTCAAACAACTAGAAGATCCATTAAAAAAGGTTAACTTGATTGATAGAAGAATAGAGAAACAAAAAGCTTGTATACCTAGAAATGTGGCATTGTTACAATGGATTATTCAAGGTCAAACAAATCAAGATCAAAGATTAAAGGTGATATCACCACCAAATTCATTAGAGTCATCACCATCTGCGTCACCTTCATCAAAAGATGGTGCTCTTTCATATCAAGAACAACAACAACAACAATTGTATGATGAAGAGAATGATGATATTGATAGAGATGATCAATTCCCAAATGAATTCACATCAGAGGATATAAAACAAAAATTGGAAACTTGTTTAACAAATATTGTTAGAGATTGGAGTTTTGATGGTAAAAGAGAAAGAGATCAAACCTATTTACCAATTTTAAATGATTTACAATCAATTTATCCATTGGAAAATAATAATAATAATAATAATAATAATAATAATAATAATAATAATAATAATAATAATAATAATAATAATAATGGAAATAATAATAGAAATTCAATTAAAGTTTTATGTCCTGGATGTGGTCTTGGTAGATTAGCATATGAAATAGCATCACTTGGTTTTGATACAGAATTAAATGAACAATCTATATTTTTTATTATACCTCTAAAGAAAATATTAACAACAGAATTTGAAAATATTGAATCAAAGACTGTATATCCATACATTTCAATTTTAAAGAATACTAAAAGTATAGATTCAATTACTAAACAAATCAAGATACCGGATATCATTCCAGACAGAACGGTGATTGATAGAATGACATTGGCAGAAGGTGATATTTTCGAGTTTTATGAAAGCACTACGCAGTGCTACCAATACTTTGATGTTGTTACAACTTGTTTCTTTATCGATGTAGTTTTGGATATTTTACAACTTTTCAAAACCATTTCATCGGTCATCAAACCCGGAGGCTATTGGATCAACAATGGTCCATTATTTTATCATTTCAATGAAACTTTAAATCTTTCATACGATGAAATTATTATATTGGTTGAATCGTATGGTTTTACAATTCTTAAAAAAGATATTTTACTAGGTTTATCATATACCAATAACAAAGATTCATTATATCATCCAAATTTTGATAGTGTATACTTTGTTGCAAAGAAAAATACAATCAACAACAACTAA\n>XM_023231809.3 PREDICTED: Piliocolobus tephrosceles aminomethyltransferase (AMT), transcript variant X2, mRNA 
\nGAACCTGGGAGGCGGAGTTTGCAGTGAGCTGAGATCCGGCCACTGCACTCCAGCCTGGGTGACAGAGCCAGACTCCGTCTCAAAAAAAAAAAAAAAAGAACTGGGACCCTTCTGCCATCTGACATAGTCCAAAGCACATCCCTATCCTTTCTCCCAGTTGTCTCGCTCCTTTTTTTTTTTTTTTTTTTTTTGTTGGAGTTCTGCTTTTGTTGCCCAGGCTGGAGTGCAATGGTGCAATCTCGGCTCACTGCAACCTCCACTTCCCAGGTTCAAGCGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTACAGGCATGTGCTGCCACACCCGGCCTGCCCCTTTCCAAGAGAGATGCTCAGCATGATGAGAGATCAGCCAGGGTAGGGAATGGGTCCGAGTAAGGGTTTGCATTGTTGCCTTTTAAGAGGCCTAGGTCCTCCATTAACTCAGGCCAACCATTAAGTGATGCAGGCTGCTCTTCCTTCATGTGAGAAAAACCTGTTTCCCTCTGGTTCTTCCTGACTTTGCACCTGGTGGCTATTATGAAGCAGTACTGCAGTATGTCTTGGACCTGGAAAGTTGGACATGCGTGCGGCTCAACAGTTTTCTCGGAAGAGTTCAGTGACCTTTTGGTGGCCACCCTCTGCTCTTACCTATGAGTTCTTCCAGGTGGCGACTTTACCTGCAAGGTCACTTACATAGCCCCACTCAGCTGCTTTGGAAAGCATGATGGAGCAGTAGTCCTCAATGTGTGTGTGAGTGAAGAGGACCTTGTGGTAGCAGGGACCATGCTTCATTTGTGGCTGCATCCCCGTCCGAGGGCCTGGTATGCAGTAAGATCAATACATACTTGTGGAATGCATGACTCTGTTGGCTGCCTGTGTCTGCCTGGTGGGAGAGCTGTGGACCTAGGGGTCCACATGAGGCCAGACTACTGTGGTGCTGCCTACCTGCAAGGCTGGCTCCACCCTGCTGTGACCTCTCCACCTTCCCCACCCCTACTTGACCTTACTCCCTTGAGGTCCTAAAGGTACGATTCAGACCTTTCCGCCCTTTCTGGAACTTTGACTGTTTGGAGACAGGGCGGTTCGGAGACAGGGCAGTTCGGAGACAGGGCGGTTCTGCAGGGGGCAGTCTAGCCCCTAGCTCGCTTCTGGGCAGCCCAATCAGCTCTGGATTGCCCAAGCTGCCCTGAAAAGCCAGCCGAAAGAGCCGGAGGCTGCTTCCCTATGGTTGGGAGTTCCTGCATTCTCTGCTCTAAATCCCAGCCTGCCCTCGGGGCTGCCCACGCCCCCTTCAGATCCTTTGCTCCGGAGAGAGACCTGTCCGAGCAGAGGCCTGGACTACATCTCCCGGCGTGCCTGGCAGTGTGGTGTCCTCTGTGCGCCATCTGTACTTGTTGCAGGCGACGATGCAGAGGGTTGTAAGTGTGGTGGCCCATCTGGGCTTTCGCTTGCAGGCATTGCCCCCGGCCTTGTGTCGTCCACTCAGTTGCGCACAGGACGTGCTCCGCAGGACACCGCTCTATGACTTCCACCTGGCCCACGGCGGGAAAATGGTGGCGTTTGCGGGTTGGAGTCTGCCAGTGCAGTACCGGGACAGTCACACTGACTCGCACCTGCACACACGCCAGCACTGCTCGCTCTTTGACGTGTCTCATATGCTGCAGACCAAGATATTTGGTAGTGACCGGGTGAAGCTGATGGAGAGTCTAGTGGTTGGAGACATTGCAGAGCTAAGACCAAACCAGGGGACACTGTCGTTGTTTACCAACGAGGCTGGAGGCATCTTAGATGACTTGATTGTAACTAATACTTCTGAGGGGCACCTGTATGTGGTGTCCAACGCTGGCTGCTGGGAGAAAGATTTGGCCCTCATGCAGGACAAGGTCAGGGAGCTTCAGAACCAGGGCAGAGATGTGGGCCTGGAGGTGCTGGATAATGCCCTGCTAGCTCTGCAAGGCCCCACTGCAGCCCAGGTACTACAGGCCAGCG
TGGCAGATGATCTGAAGAAACTGCCCTTCATGACTAGTGCTGTGATGGAGGTGTTTGGCGTGTCTGGCTGCCGTGTGACCCGCTGTGGCTACACAGGAGAAGACGGTGTGGAGATCTCGGTGCCAGCAGCGGGGGCAGTTCACCTGGCAACAGCTCTTCTGAAAAACCCAGAGGTGAGGCTGGCAGGGCTGGCAGCCAGGGACAGTCTGCGCCTGGAGGCAGGCCTCTGCCTGTATGGGAATGACATTGATGAACACACTACACCTGTGGAGGGCAGCCTCAGCTGGACACTGGGGAAGCGCCGCCGAGCTGCTATGGATTTCCCTGGAGCCAAGGTCATTGTTCCCCAACTGAAGGGCAAGGTGCAGCGGAGGCGTGTGGGGTTGATGTGTGAGGGGGCCCCAATGCGGGCACACAGTCCCATCCTGAACATGGAGGGTACCAAGATTGGTGCTGTGACTAGTGGCTGCCCCTCGCCCTCTCTGAAGAAGAATGTGGCAATGGGTTATGTGCCCTGCGAGTACAGTCGTCCAGGGACAATGCTGCTGGTAGAGGGTTCCTGAAATGCCGACCCAGTGCCTGCCTTCCTGGCCTCCAAGACAAGCTTGGAATAGGTTCTCCTTGAAAGGGGCCAGTCTATAAGAATGGAGATATTGCCCATTGGGCACCCCATCCCTGCTCCTCCAGGGAGCTGGCATCACCTCTCCCCTCCCTGCAAGTTGTTGCATCTGGGTCCCAAGGGGCAACAGCTTCCAGGATGTTCTCTCTCTCACTGCCCTTGTGCATGCATACCCTTGTTCTGTCTGAATAACCACAACAACTGATGCACTTCCGTGTTTAATAAGCCACATCCTCAGTTGAGCCTGAGGTGAAATGTGA\n>XM_035095448.1 PREDICTED: Chelonus insularis structural maintenance of chromosomes protein 5 (LOC118074325), mRNA \nAAAAATAGAAGACAATAGCGGTATGACAAAGAAAGATCGGAAAGGAAATGCGCAGTTATTCAGTTTCCCTCTAAAAAAGTAACGTAGAGGGTTAAAACAATTCGTTCGTGAACTTTACTTGTTTATTCGTGATGTAATTAAACTTTTCAAAATGACAAATACGGACATCATAAGCCAAGGAATCATTAAAAAAATTTTCCTGAAAGATTTTATTACATATGATGAGATAGTTTTCTTGCCTGGAAGATACTTCAATGTTGTCATAGGACCAAATGGTACCGGTAAGTCTACACTCGTAGCAGGAATAGCCTTAGGGCTAGGAGGATGTCCTAAAGATCTTGGTAGAATTGGTGAAATTTCTCAATACATAAAAGGTCAATGTGAAAAAGCATTGATTGAAATTGAACTTGAAAATGGACCGAACGAAACTGTCAAAATCAGTCGCATGTTCAATACAAGGAACAGGTCTACATGGATGATTAATGGAAAAACTGTTACTGAAGCTGAAGCTCAAGATTTGATTGCAAAATTCAATATTCAGGTGAACAATCTTTGTCAATTTATACCGCAAGAAAAAATTAATGATTTCGCAAAAATGAGCCCACAGGAGCTGCTATTAAATACAGAAAAGTCTGTAGGAGATCCAAAAGTATATGATTACCACATGCAATTAATAAGAAATAAGCAAAAACAAGAAGAAATATCTAACGAAATTGGTCAGAAAAAAACTGTGCTTGAATCTGATACTCAAAAATATCAACAATTAGATGAAATTGCTTCACAATATAGAGAAAGAAAAGCAATTATGAAAAAAATAAAAAATTTGGGACAAAAAAAAGCTTGGGTACTGTATGATATGACAAGAACAGAACTGATTAATTTGAAACATCAAAGCAATGGTCTTAAGAGTCAAATATCTGATCTAAAATCGACTTTGGATCCCATTTTAAGTCAAATGAATGAAAAAGGCAAAAAAATAAAAGAATTAGAAACTTCTGTTCA
ATCTTACAATCTACAAATTAAAAATTGTGAAACTAAATTATTAAAAAATATTGAAACTATTGAGAGTCTTCATCTTAATGTAATAAATATAAAGAAAAATTGCAAAGAAGAACTAAAAATGGAAGAAAGTCGAGATAAATCTATTAAACTTGAAGAAACACATAAAAGTAAATTAGAAAATGACATGCAGCTATTGATGGAAGAAATCGGTACTGAAGAATCAGTTCATAAAAAATTACAAGTAATCAATGATAAAATAAACAACGAAAGAAAAAAAATGGATGAAATTAATAACGAAGCTGTATTTTATAGAGAAAAGTTGAATCTTGTAGCACGTAAAATACATCAACTAGAAGGAGAATTAAAGCAGCTTAGCGATGTTCAGTCGAAACGTTTAGATTTACTTCGTTCTATGAATTCACATGCTTATGAAGCAGTTATGTGGCTTCGAAATAATAGAGATAAATTTCGAAGTGTCATTTATGAACCTATGATTTTACATATCGATATTAAAGAACTTAAATATGGTAAATTTTTTGAAAAGATAATTCCTAGACGAGATTTGGAAGCTTTCGTTTGTGAAGATAAACAAGATATGAATCTTTTATTAAGATATTTACGCGATCAGCAAAATCTAGTAGTCAATGTAGTCCATTCTGATTCAACTGAATCATTAAGTACTGTACCCAGGATACCACTCAATAATCTTACACGATACGGATTCTATTCTTATGCAATTTCTTTTATTTCTGCTCCTGACTTAATTATGAAGTATCTAATAAAAACATACCATATTCACAATATTCCATTTGGTACAGCTGCTGTAGACGATAACATTGATGCAGTGCCTACTGAGTTATTCTCTTTTTTCAGTCCTAATTATCATTATAATGTTCGAGTATCTAGGTATACTAAAGACAAATCCACACAAATTAATCCTTTGCCAAATCATGTACGAATGTTTTCTATTGTTGTGGATCATAACAAAATTGCGGAAAATACTCAATTATTAGAACAAAGACGAAATGAGCATGCACAACATGAATCGAAATTAAGAGAGACTGAAACAAAGTTGATGGAATATAACGATAAAATGGAATCGCTTCGTAAGTCAAGAAAAGATTTAGATACTAAGAGTAAACAAATTCAGATGCTTAATAGTCAAATCAAAAGGAAAACTAATGAAATTATACAGCTTCAAAATCAACGAAGGAGTTTTGAAGATATTAAAAATGCTGCAAATAATGCAATACTAAGTGTTTTGAAAAAACAAACAGAACTGTATAAAGAATGTGCTGGAGAGCATAAAAAAGCGATTGACATTATTAAACAATCGAAAACTAACAATTTTTTATTGAAATTAGCAGAACGTGAGTTAAAAAAAATTTCTGATAGTTCGAGACAATATAAAGACCAACTACAGGAAGTGGAGAATGAATTCAGAACATTGGCCAGGCAAATAGAACCAATGCAAGTTGAGATTAAAAGATTGCTTGGTGAAGCTATACGTTCCACAGACAATGTCAGTTCTAGCGATAGAGCAGCATTTGCTAAATATGAAAGAATCTTTGCTAAATTACCTCCGACAATTGAGGAGATAGACGAAGCTATTCAGTCAGCTAAAGCTCGACTTTTCTGTGCAGGTGACACTCATCACGGCGAAGAAATCCTTGAAGAATGTGAATTAGTTAAACGAAAAATTGAATCACTTAAAGTAGAGATAGAAAAATTAGAAGAAACATTAGCGAAAAATAAAAGAGATACAGAGGAGTTACGTGATCAGTGGTTACCACTAATTGAAAAGCTTACTCGTACGATTAATGGCAAGTTTTCAAATGGTTTCCAATCAATTGGATGTGTCGGTGAAATACAACTCAAACATAATGGAAATCCGATGGATTTTGATCAATATGAATATAAAATTTACGTTAAATTTCGAGATGTTGATGATTTACAAGAGTTCAATATAAACCGTCAAAGTGGTGGTGAACGAGCTTTTA
CAACTGCTGTTTACATGCTGTCTCTTCAAGAGATGTGTCGAGTGCCATTTAGAGTTGCTGATGAAATAAATCAGGGTATGGATGCTATTTATGAAAGGAAAATATTTGATAAACTTGTTGAGCTTACGTCAACAGCACATGGATCACAATATTTTTTGATTACTCCCAAGTTACTTCCTAATTTACAATACAACGAAAATGTAAGAGTTCATGTTGTTCACAATGGGCCATATATTATTCCATATGATAGATTCAATCTACAAGATTATTGTGCGAAATTGGAAAGGAATTAATTATCTTTAACTATATATTGTATTATATTTTTGTTCTTTATCATTTTTATTTGATTGTTTTTAATTATGATCTCGTTAAAACTGACAAAGTCAGTGTACGCATTTCCAATACATGCAATATAATTTATCTTTGAGTATTGCATTGACTATTATCTTACTTTCGATTTATTATTATTAAAAAAAATTTCTCAAGTATTATTCTATGAAAATAGCTTTGCTTGATTCTGTTTATTTTATGAGCCAGACAAAAATATTGTAGAAAAAATAAGCAAAATAATTACTATCAAGAGTTTTAATCA\n>XM_013003374.1 PREDICTED: Erythranthe guttatus uncharacterized LOC105977970 (LOC105977970), mRNA \nCAAAAACCTCACCAAATTTCCCCAAAATTGATTCTTTCGTTCTTCACTCAAATCAATGGCGTTGTCGATAATCCAATGCCCTAAACACTCAAAGTTTCCGCCCAGCAATTATTTTCTGAAAGCAAATTCACTCCCACTTCACCCCACATTTGTCAGGTTTTCCAGATTACAGCCAATCAGCAGCAATCGGGTGGTTTGCGCCGCATTTTCTGCCGCCGGTGGTTCCGGTGCAAACGGCGATGTAAACCCTTACGAGGTTCTTGGTGTAAATCCTCTAGAGGGATTCGACATGGTGAAGGCGGCTTACACGAAAAGGCGCAAGGATGCTGAGAGGAGAGGCGATGAAGCTGCTGCAGCACAATTGGAAAAAGCATACGACACTATAATGATGTCTCAATTGAAGAAACGGAAGAAGGGCGAAACTTTCGGTCCGTTTCGGGTTTCGAAAGATATAAAATATGCCGATAAGCAGCCAATTGTTCCGTGGGGCCCAAGGTTTGCCAAATCGGAGGTCAAAGATATTCGAATCAACATGGCAATATCAGCTGTATTTACGGCTTGGATTCTTATCAAGGGCAGTGCCGAATACAAACCTTTGCAATTCTTGGCCTTTGTTTTCGTTTATCGGATATTTGAGAAGTTAAAGTCGTTCGAATCACCTGCACCTACCACATTTACAGAAGAAGGTGGTGAGGATGAAGGGAGAATGTTGAAAATGGGCAAAAGACTGCTTCGATCACTTGCATTGGGTTTTGGATGCGTCGCTTTTGCCTCTTTGGGGTACACTGCAGTGTTGAATTGTATTGAATTTGCAGCTGGCTATATACCTATTTTCTTGTACAACAACCAGGAGTTGTTTGTAACTGCGTCAACGGCACTAATGCTTTATGTTCTAGCTTCGTACTACAAATGAAAATTCTGCATCTATCAAGGGAGGATTGAAGATCGATTTATTTTATTTGGAATTAATTAGACGAATAATTCCGTGTTTCAAGATTTAAATTTTGTATATGAGTTCAAATTTTGGGACTTGATTGTAATGTGTTTAACTTGTTAGTGATATTGTTTGCGACTCCGAGTCGAAATCGAGAAAGTAAGGAACAAAATAGTTGCGGGTTGTGTGCTAAAAAAATTGCATTTTATA\n>MW016101.1 Clionaida sp. 
1 JV-2020 voucher UF 3823 large subunit ribosomal RNA gene, partial sequence \nGAGCATGAAATCCCTGGCAGGTGCTGTCAGAGAATTGTGGCCGGGAGAGGCGGTGGAGCTCCGACTGTTGCTGTCGAAGTTGACCTGGAAAGGCACGTCAGAGAGGGTGAGAGCCCCGTGGTCGACACCGACGGGAAGGGCCGTAGCCGTCTTCGGAGAGTCGGGTTGTTTGGGAATGCAGCCCAAAGTGGGTGGTAAACTCCATCTAAAGCTAAATACTGGCACGAGACCGATAGCGAACAAGTACCATGAGGGAAAGGTGAAAAGTACTTTGAAAAGAGAGTCAAAAAGACCGCGAAACCGTTAGGAGGGAAACGAATGCAGCTGAAGTGGCTCCGTATCAGGTTCAGGGGATGTCGGTGGACGTTCCGGCTGCGGACAGCTAACGCGTCCTCGGTCGGAGAGGCTGCCGACTTCCTTGCACTCCTGTTGGGAGCCGGCCAACAGCGGTTGTTCCTGGCCCAGAAGGCCGGTCGGGAGGTACCTCCGCACTCGTGCAGAGAACGTATAGCCGTCCGGTTCGGCGGTCTGGGAGCGACCKAGGAGAGTCGTGAACTTTCACGCTTGCAGCGCAGGCCCCTCGGGGCCGGGTCGCCTCTGTTCGTTTGGGCCCCGCGGTTGGGACTGCTTGCAGTGTCTGCCGACGGTCAGCCTGCTCGGTCGGGGGATTGGCCACGCCTTGCGCTCTAGTTGTTGGTGCTCGAATGGCTGCATCCGACCCGTCTTGAAACACGGACCAAGGAGTGCAACATGCGTGCGAGTCTTTGGGTGGCAAACCCGTCGGCGCAATGAAGGTGAAGGCAGGCGTTGGTCTGCTTAGGCGAGAGCTTCCTCGGGAGCGCATCGTCGACCGATCCCAGGCTACGCTGTGGCGGGATTTGAGTAAGAGCGTGCCTGTTGCGACCCGAAAGATGGTGAACTATGCCTGAATAGGGTGAAGCCAGAGGAAACTCTGGTGGAAGCTCGTAGCGATTCTGACGTGCAAATCGATCGTCAAATTTGGGTATAGGGGCGAAAGACTAATCGAACC\n>JQ151355.1 Uncultured bacterium clone J2_5_82 16S ribosomal RNA gene, partial sequence \nAGTGAACGCTGGCGGCATGCTTAACACATGCAAGTCGCGCGGTCAGCAATGGCAGCGGCGGACGGGTGAGTAACGCGTAGGAATGTATCCAGAGGTGGGGGACAACCCCGGGAAACTGGGGCTAATACCGCATATGTCCTGAGGGACAAAGCAGTAATGCGCCTTTGGAGCAGCCTGCGTCCGATTAGGTAGTTGGTGGGGTAATGGCCTACCAAGCCTGCGATCGGTAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCAATGCCGCGTGTGTGAAGAAGGTCTTCGGATCGTAAAGCACTTTCGACAGGGACGATGATGACGGTACCTGTAGAAGAAGCCCCGGTAACTTCGTGCCAGCAGCCGCGGTAAGCATACTCGTA\n>AY190253.1 Dothideomycete sp. 
G11-R40 18S ribosomal RNA gene, partial sequence \nGATTAAGCCATGCATGTCTAAGTATAAGCAACTATACGGTGAAACTGCGAATGGCTCATTAAATCAGTTATCGTTTATTTGATAGTACCTTACTACTTGGATAACCGTGGTAATTCTAGAGCTAATACATGCTAAAAACCTCGACTTCGGAAGGGGTGTATTTATTAGATAAAAAACCAGCGCCCTTCGGGGCTCCTTGGTGATTCATAATAACTAAACGAATCGCATGGCCTTGCGCCGGCGATGGTTCATTCAAATTTCTGCCCTATCAACTTTCGATGGTAGGATAGTGGCCTACCATGGTATCAACGGGTAACGGGGAATTAGGGTTCTATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCCGACACGGGGAGGTAGTGACAATAAATACTGATACAGGGCTCTTTTGGGTCTTGTAATTGGAATGAGTACAATTTAAATCCCTTAACGAGGAACAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAACCTTGGGCCTGGCTGGCCGGTCCGCCTCACCGCGTGTACTGGTCCGGCCGGGCCTTTCCTTCTGGGGAGCCGCATGCCCTTCACTGGGCGTGTCGGGGAACCAGGACTTTTACTTTGAAAAAATTAGAGTGTTCAAAGCAGGCCTTTGCTCGAATACATTAGCATGGAATAATAGAATAGGACGTGCGGTTCTATTTTGTTGGTTTCTAGGACCGCCGTAATGATTAATAGGGATAGTCGGGGGCATCAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAGTGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGGGATCGGGCGATGTTATCATTTTGACTCGCTCGGCACCTTACGAGAAATCAAAGTCTTTGGGTTCTGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGAAATTGACGGAAGGGCACCACCAGGCGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTCACCAGGTCCAGACACAATAAGGATTGACAGATTGAGAGCTCTTTCTTGATTTTGTGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGCTTAATTGCGATAACGAACGAGACCTTAACCTGCTAAATAGCCCGGCCCGCTTTGGCGGGTCGCCGGCTTCTTAGAGGGACTATCGGCTCAAGCCGATGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGACAGAGCCAACGAGTTCATCACCTTGGCCGAAAGGTCTGGGTAATCTTGTTAAACTCTGTCGTGCTGGGGATAGAGCATTGCAATTATTGCTCTTCAACGAGGAATGCCTAGTAAGCGTACGTCATCAGCGTGCGTTGATTACGTCCCTG\n>XM_019758284.1 PREDICTED: Branchiostoma belcheri mitochondrial dicarboxylate carrier-like (LOC109461823), mRNA 
\nTCGCGCGGGAAACGCCCCTCGTGGGGTCACCAGAGTTCATCCGCCATCTTGTTTACGAAGTTGTTTGTCTCTCACAACCTGCACGTCAGCTGGGTACGTCACGTAGGTCACGTGCGGCTTCGCTCAAAGGTCGTTTTTGTTGCAGACATTGCATGTTCAGCTTTTCGGCGTCTGCAGGCGCGCCTGGCTGCTCAGTGCTGCCCAGTTTGTACCCGATGGTAGGACGCTTGCTTTTGGCCACGCCACGTCACAGGTCACCGCCCCCCTCCCCACCATTCAAATCATCAGCCAGCTTCCTGCCAGGATTTGTACGTAATGATGGCCATGTGACATGTGATCGTGCGTGAACAGATGATTATACCCTCGGGACGTCTTTGTTTAGCTGTACTGAAGTCGATCGGATCCATGGAAACGTAGCAGCCCGGTGTACCTTATTGTTTGCTGACTCACAATGATTGCAGCTTTTTTGTCAAAAATCACAAGTTGAACGGAGCTCTTACACGTACGTCACCACGCCACGCCAGGGAGGTCGTGACTTTTCCAGCGCCCGCTTGCTTGAACTGGACTGGATGTGCTGTCAGCCTGACTTGTAAGACTATTTATTCAAACGTTGAAACAAACAAGAGACTTGTGTACAGTTTGCTCATCTGTTTACCTTAGTCTCCACCATGACGTTCCTGGGATTTGCGGACAGTGAAGAACTGAAAGCTAAGAAGATCGGAAGATGGTATTTTGGGGGCGTGGCATCAGCCATGGCCGCCTGCTGTACCCACCCACTAGACCTGCTCAAAGTCCACCTGCAAACTCAACAGAAGAAAGAGTTTGGGTTGTTGCAAATGGGTGTGAAGGTTGTGAAGGCGGATGGCATTGTAGGGTTGTACAACGGGATCACAGCGTCGGTCATGCGACAGCTGACCTACTCCATGACCAGGTTTGCCATCTACGAGACGGCGAAGAAGAAGCTAGCAGAACATTCGGGTGGCGCGAATCTGCCCTTCCACCAGAAGGTGATGCTGGCCTCGCTGGGAGGGTTCTGTGGCGGGATTGTGGGTACGCCGGCGGACATGGTGAACGTGAGGATGCAGAACGATATGAAGCTGCCGGCGGAGTTGAGGCGGAACTACCGGCACGTGTTCCACGGGTGGAGGTGCGTGGTGGCGGAGGAGGGCGTGAAGGGTTTGTTCTCGGGCGTGACGATGGCGTCGTCCAGGGCGATTCTGGTGACGGTGGGACAGATCGCGTTCTACGACCAGTTCAAACAGACGCTCCTGTCCACGAGCTTTTTTAACGACAACATCGTCACCCACTTCACCGCAAGCTTCCTCGCTGGTGGCGTAGCGACGGCCATGACACAACCGGCGGACGTGATGAAGACACGATTGATGAACGCAGCACCGGGGCAGTACTCGAGTATTTTGTCCTGCGCAATAGACATCGGAAAAGTTGGTCCATTTGGGTTCTTCAAGGGGTTTGTTCCAGCGTTCGTGCGTCTCGGCCCTCACACCATCCTCACCTTTATCTTCTTTGAGCAGCTCAGGAAGAACATGGGTGTGCTGCCTGCCTACACGGTATAAGCGCCATCTAGCCAACTGTACTGGCACTGCAGGACTTCTAATTCATGGCAATGAAAATCTCAAGGATCAAGTGGAAAAATGGACTCTGTTGCAAAACCATAGCAGTGATGGGTTGATGGTTTCAGTGTAGGGAGATAGTAGGGTATACATCAGTCTTTTGAAGAGGTAAATAGCAAAAGAGCATAACTGGCCTGCATGAAGGTTGTTTGCATCCCCATATGCTATGCATTCCCGTAGGCCTGCTTAATTGTGTTAACTGTGGCAGTATTAATTTTGGATATGTCAGACAAACAAATGTAATTTCCATGTCAGTGTTGCTATGTAATTGAACAAACATATAAATGGATGGTTTTCAAATATTCTAGCTCATCTCGGAACATATCAGCACCTTCAAGATCGGGACAATTACTAGTATACCTCCTCA
ATGTTGCATGATTTACCGGTAACCATAAAGAGCCAATTATTTCATGGACTTGTAGTAAAGAAAAATACAGCTGCCTTCATCCAGATGAGTTATATTGACCAACATGTCTATTCATATGAAGAAATAACTTGTAAACTAAATGTGATACAGCTCTAAAGGATACAAATGTGAATCAATATGCTTTTAGCAATTGAATATACAAACCAGTAGTTACTGTTAGTAAACACACCTATGGAACAACAAGATACCTTCTGAAAACTAGCTGTACATATAGATTTACTGAACAATCAGGAGATCAAAGAGGTGTGAGTGAGTTAAGCTTTGTTTTGTTTTGTTTTGTTTCTTCTCTTTATTTAATGCTTAGTAAAGATATCTGATCATAGATATTATTATAGCAAGGTGTATATTTGTGACCAAACTAGTTTGTACCAAATAACTACTAAAGTAATAATGTAGATCTTTTTTCATTTTTAGGTGATCAGTCATTTTAAGTAGAGTCTAAGCAAATTTGTTTTAACTTTGCTGTTAGATGTTTTCTTTTTATGGTTGTCAGATGTTCAATGTGTAATAAAATGCATCTGGGACCCAG\n>XR_004573716.1 PREDICTED: Drosophila guanche uncharacterized LOC117582427 (LOC117582427), transcript variant X2, ncRNA \nGTACACTCTCACTCACTCTCGCGCTGTCGCCCACGATACATGCAGCTTGCAAGCTCGGCGTCTAATCATTAGTAATGTGCCTATAACCGAAAGCAACTGCAGTGCAAATTACAAATATACAGTGTCAGGCCCGATGCCTCTGCAGCCCTCTGTCCTTTGCCCCAGAATGAAAAACGGAGGCAATCGGCATGGGATCGCCTCCTCATCGCCTCTACTGAAAATATGGGATCGAAGATCACTTGAGATGAAGAATTTCATCTAGCTTTCACTCACCATCAAACGCGGAAGACCAGCAGTCT\n>XM_043480802.1 PREDICTED: Cervus canadensis olfactory receptor 56A4-like (LOC122449258), mRNA \nATGCTGCCTTATAGGAACACCTCCCTCTCTACTGAAGTCTCTGAGTTCCTCCTGAACTGTTTTGTCAGGTCACCCACCTGGCAGCTCTGGCTGTCCCTGCCCCTCAGTCTCCTCTTCCTCCTGGCCATGGGGGCCAACGCCACCCTCCTGCTCACCATCCGGCTGGAGGCCTCTCTGCACGAGCCCATGTACTACCTGCTCAGCCTGCTCTCCCTGCTGGACATGGCGCTCTGCCTCACTGTCATCCCCAAGGTCCTGGCCATCTCTGCACAGCTCCATTATTGTGGAAAAAATATAATTGAAAACTGTATCTGTGCCAACCTCTCCGTGTCCAAGCTCTCTTGTGGTAACATCACCCTTAACAAAATCTACCAATTAATTTTAGCCTGGACTCTGCTGGGCTCTGACCTCATCCTCATCTTCCTCTCCTACATCTTCATCCTCCGAGCTGTCCTTCGACTCCATACAAAAGGAGCAGCTGCTAAAGCTCTGAGCACCTGTGGCTCTCACTTCATCCTTATCCTCTTCTTCAGCACCATCCTGCTGGTTTTTGTTTTTACCCATTTGGCCAAGAAAAAGCTTTCACCTGATATTCCTGTCTTACTTAATGTCCTCCACCATGTCATTCCTGCAGCTCTCAACCCAATTGTCTATGGTGTTCGAACTCAGGAAATTAAGCAGGGGATTTGGAAATTATTGAGGAAGGGTAGTGACAGCAGAAAGTAA\n>XM_014024072.1 PREDICTED: Austrofundulus limnaeus gelsolin-like (LOC106528817), mRNA 
\nCCCAGGGCAGCACCAACAGGATGTGCAGAAAACAGGAAGGGCTGTGGCACGGCTTCTTCTTCTTCTCCTTCTTCACACTCAACATCTGACTTCTGTCTTCAGCAGACCCGGAGCAACATGGCCCACAAAGAGTTCGAGAACGCAGGGAAGAAGCCCGGCCTGCAGGTGTGGCGGGTGGAGAAAATGGATTTAAAACCCGTTCCAACTCAGCTCTACGGAGACTTCTTCACCGGAGATGCCTACATTGTGCTCTTCACCACCCCGGCACCTTCTTACGCTCTGCATTCGTGGACCGGAAATGAAGCTTCCCAAGATGAAGCCGGAGCCGTTGCCATTTTCCTGACTCAGATGGATGACTACATGAAGGGACTCCCGGTGCAGTTCAACGAGTTTCAAGGTGAAGAGTCGACCTGTTTTCAAGGCTACTTCAAGTCTGGAATGAAGTACAAGAAGGGTGGCGTGGCCTCAGGCTTCCATCATGTGGTGACCAACGACATGAACGTGAAGCGTCTGCTGCACGTTAAAGGTCGTCGTCTGATCAAAGGCACTGAGGTGGACCTGAGCTGGTCCAGCTTCAACAAGGGAGACTGCTTCATCATTGACCTGGGAAAGGACATCTACCACTGGTCCGGCAGTGAAAGCAATCGCTACGAACGCCTCAAAACCACTCAGATGGCCAACGACATCCGCGACAACGAGCGAAAAGGCCGCGCTAAAGTGCACATGATTGAAGAAGGTTCTGAGCCAGAGGCTGTCATTCAAGAACTTGGACCAAAGCCGGAGCTCCCTCCTGGGGAATGTGATACGGCAGAAGAAAAAACCCAGAAGACCAAGACATCTCTGTATCAGATTTCTGACGCCACTGGTAAAATGACCACAACGTTTGTGTCCAACGGTCCCTTCAAACAAAGCATGCTCTCCCAGAAGGAATGCTACATCCTGGACGATGGAGGAAACAACATATTTGTCTGGAAGGGAAAAGATGCAAATCCAGATGAGCGCAAAGCTGCAATGACTGCTGCAAAGACGTATATTACAGAAAAAAAATACCCCACAAAAACAAAGGTGCAGGTAATTCCTGCAGGAAGTGAGACCACGATGTTCAAACAGTTCTTCTTTAAATGGCTGGAGGGCGAGGCCACAGGAAAGACCTACACTGTGGGTCGCATCGCGAAGGTGGAGCAGATTCCCTTCGACTCCTCCAAACTCCACAGCAACAAGGCAATGGCTGCCCAGCACGGCATGGTGGACGACGGCTCCGGGAAAGTCCAGATCTGGCGTGTGGAGGGAAAGGATAAAGCAGCCGTGGACCCCTCCAGTTATGGACACTTCTTTGGTGGTGACTGTTACCTGGTGCTTTACTCCTACAATGATGGTGGCAGAACGAAGCATATCATCTACACCTGGCAAGGTCAGAAGTGTACTCAGGATGAGCTGGCTGCTTCAGCTTTCCTCACCGTCAAACTGGATGACTCCATGGGCGGAGTGGCCACACAGGTCAGGGTCAGTCAGGGCCAGGAGCCCCCTCATCTCGTCAGCTTGTTTAAAAACAAGCCTTTGGTCATCCACCTGGGTGGGACGTCCCGTAAGGGTGGTGACAGCACCCCTGGCAGCACGCGGCTCTTCCACATCCGTCAGAGCTCCACCAAAGCTACACGAGCTGTTGAGGTGGAACCCAAAGCCTCCTCTCTGAACACCAACGACGCGTTTGTGCTAAAGACACCATCTTCCCTGTTTGTGTGGAAGGGAAAAGGAGCGAGTTCAGATGAGACGTCGGCAGCTGAGTATGTCGCCAAGTTTCTGGGAGGAGCTGTCACCAAGCTGGATGAGACAAAAGAGCCAGATGGTTTCTGGTCAGCGCTGGGTGGGAAGGGCAACTATCAGACCTCCAAGGCCCTGCAGAACGTGATCAGACCTCCTCGACTCTTCGGTTGTTCAAACAAGACTGGCAGGCTCATTGCAGAAGAGGTTCCTGGTGACTTTACTCAGATCGATCTG
GCCACAGATGATGTCATGATCCTGGACAGCTGGGATCAGATCTTTGTTTGGATCGGAAATGAAGCCAATGAAACTGAGAAATTAGGAGCTCCAAAAATTGCCCAAGAATATGTGGATTCTGACCCCGCCGGACGTCGTGGTGTCCCCATCACCACCATCAAGCAGGGCCAGGAGCCACCGTCATTCACGGGCTGGTTTCAAGCTTGGGACCCCCACATGTGGGACTAAGCTCATCATTAGAGCAGAAAGCATCGACTTACTAAACATCAGTAGTTGGATAAAATGCATAATCTTCACACAATGAGCTTAAGATTTTTATAGATGTAGATCAGATTTTAGACAAAATCTTATATGTCTGTGCTTTCAGTGTAACAGAAATACTCACCAAAGCTGAAAACTTACATATTTTGTGGCAATAAGCTGTTTTTCTTTTAATGAGGAACTGGCAAATAAAAATAATATGTGCTAATTTAAATGTCATATCCGTATTCTGGTTTAAATTTTAAAGAAAAATTAAGTTGACTCTAAAACAAATCATTAAAAGTTCTGAACCCCA\n>KM104095.1 Uncultured fungus clone rcw_159 internal transcribed spacer 1, partial sequence; 5.8S ribosomal RNA gene, complete sequence; and internal transcribed spacer 2, partial sequence \nCGGAAGGATCATTATCGTGCTTTGGGGCATGGCTCCGGCCGTGCTCCTCCAGCCCCACCCGTGTTTACCACACCTGTTGCTTCGGCGGGCCCGGCGGCCCTGGCCGCTGCCCCGGGGGGGGATGTTTTCTCCCTCCGGGTGTCCGCGCCCGCCGAAGACCCTCTGAACTCTAGTGACCTGTGTCGTCTGAGCTTCATGATCAAATCATTAAAAAACTTTCAACAACGGATCTCTTGGTTCCGACATCGATGAAGAACGCAGCGAAATGCGATAAGTAATGTGAATTGCAGAGTTCCGTGAATCATCGAATCTTTGAACGCATATTGCGCCCCCTGGTATTCCGGGGGGCATGTCTGTTCGAGCGTCATTGCAACCCTCAAGCACGGCTTGTGTGTTGGGCCCGGATGTCCCGGTGTGGACAGGCCCGAAAAGCAGTGGCTGGGATGTGTCTCGGCGCCCAAGCGTATGGGGACTCTTGTCACCCGCTTGCATGGCCCGGGCGGTCCCCGTCGACCTCTTTCTCTCCGGAAGGGCGCCCCCCTTTCGTCGGTTGACCTC\n>XM_019782364.1 PREDICTED: Branchiostoma belcheri tryptophan 5-hydroxylase 2-like (LOC109480215), mRNA 
\nATCCATGTTCGTCAGAAGTTGTCTGAGAATCAGTTCCAAGATGTCGTCGGGAAGAAAACTGTTAGGGCGGCGGTTTTCTGACGTCTTCCCTTTAAACAACGGCAGCCGAGGCCCCCTTCTTACCAAGGACGGGACTGCAGGGGCAAGAACCCGTAGGCGCATCTCGTCTTTCCCTTGTGAGGAGACGTTTGCACCTGTTCGCACTCCGGTCATCCTGTCTATGAGGAAGGACGTTGGGGGCCTTGCTGCCGTGCTACAGTTATTTCAGGAAGAACAGGTCAGCGTTCTGCATATCGAGTCCCGACGCTCTCTTCGGCGGAAATCGGTGGTTGAAATCTACATGGACTGTGAGGCCGACAAGACCCGAATGAACGAACTGATCTCCCGGATTCAGAGGGAGACCAAGATGGTCAAGGTGGACACACCAGACAGCATCGGCAAGGGCAATGCACAAGATGAGGAGGGGTTTGAGGTTCCCTGGTTCCCGCGCAAAATCAGCGAGCTGGACAAGACGGCGTGCCGAGTCCTGATGTACGGAAACGACCTGGATGCCGACCACCCGGGTTTTAAGGACAATGTCTACCGGGAGAGAAGAAAGCTGTTCGCTGAAATCGCTCTGAACTACAAATACGGTCAACCTATACCCAGAATAAAGTATACCGAAGAAGAAGTGAACACATGGGGTGCAGTGTACCGTGAGCTGACGTCACTCTACCCGACACACGCCTGTCAACAGCACCTCAACAACCTGCCGCTACTGCGCATGTACTGCGGATATAGAGAAGACAACATCCCTCAGTTGGAAGATGTGTCCGCATTTCTTAAAGAACGAACAGGTTTCCAGTTGCGGCCGGTGGCGGGGTACCTGACACCACGTGACTTCCTGGCAGGACTTGCCTTCCGCGTGTTCCACTGTACCCAGTACATCCGCCACAGCACCGACCCCTTCTACACACCGGAACCGGACTGTTGTCACGAGTTGCTGGGTCACGTGCCCATGCTGGCCGACCCGAGTTTTGCCGAGTTCTCCCACGAGATCGGACTGGCTTCGCTCGGCGCCTCGGATGAGGAGGTACAAAAGTTAGCCACGTGCTACTTCTTCTCGGTAGAGTTCGGCCTGTGTAAAGAGGACGGGAAGATCAGGGCATACGGAGCAGGACTGCTGTCATCTGCCGGCGAGCTAAAGCATGCACTGACACAAGAGGATAAAGTTCTGCCCTTTGACCCGGAAGCTGTTGTACAACAGGAGTGTCTCATCACCACCTATCAGGACGTCTATTTCATGTCCGACAGTTTTGAGGAGGCTAAACAGCAGATGAGGTAATTTTCTCATTATTGTGCTTAG\n>XR_008187289.1 PREDICTED: Carassius gibelio uncharacterized LOC128029018 (LOC128029018), ncRNA \nCCATTACAGCAACAAACATTTTTAATGCAATTTTCTTTTTCAAAATTCACATCTGAGGTATGACAGTGTGTAATTTATATTGTAGGTTTAATAGGGAACATCTCTTGAATTCATGTTAATCACGTATCTTACTTTGCTTAAAGCTGAGCTAAACAGAACTAATTTGATTATTTTACCTTTTCAGCTGAATTGTGCCCAACCAGGGTAACAGTTGTCTGATTTCACAAGTGATTTTGCTCTTCCTGAAGTCCAGCTTTAAATTCAGAGCTTGATGTTGCAGCAGGTAATGAATCACTTCCCAGGTCAGTGAACAGGAAGTCAGATCTTTAGGCACCTTCTTCAGGAAAAAGCATGTCAGTTCATCATCCTGTGCTTCATACACCACTGAAACCAGCTGCTGAAGAGTTTCTTTAGAGAACCTGA\n>XM_005997745.2 PREDICTED: Latimeria chalumnae BTB/POZ domain-containing protein KCTD6 (LOC102358416), transcript variant X1, 
mRNA \nTCTCTATGGTTGGTCCTGTAGATATGATGCTGATTCCATGTTTTGGGTTGGCACGGCGCTGTTTTGAAACGAGCTTCGGGGTTTCGGGTTCAGTACGAGGGTTAAAAAAAAAAAAATGTTTGCTTATTTTTAAAGTGAAATCATTTCGAATGAGTGAATTTTGAGACAGTCAGAAGTCCTAGTTGGAATAAACTTTAGGTTTATGACGGAGAACCTTTCCAGATTATCATTGGAACACACAATTGAAAAATAAGAGCCACACTGGAGAACGGGAGGTGATTATTGCTTCTACCCTGCAATCTTTCATTGTTGAATCCTAAGAGAATTACTCGAGCATTGAAGCAGATGGATAATGGAGACTGGGGACATATGATGACTGATCCAGTCACGTTAAATGTAGGTGGCCACCTCTATGCAACCTCAATCTCCACTCTGACCCGTTACCCTGATTCCATGCTGGGAGCCATGTTTAGGGGAGGTTTTCCCACTGCCAGAGACTCCCAGGGTAACTACTTTATTGACAGAGATGGACCTCTATTCAGGTACATCTTGAATTTCTTAAGAACTTCTGAACTGACTCTTCCTCAAGACTTCAAAGAAATTGATTTGCTTCGAAAAGAGGCAGACTTTTACCAAATTGAGCCCCTGATCCAAAGTCTTAATGACCCCAAACCACTCTACCCCTTGGACACGTTTGAGGAAGTGGTGGAACTGTCAAGCACACGTAAACTTTCCAAATATTCTAATCCTGTAGCGGTCATTATAACTCAACTTACTATAACAACAAAGGTTCATTCTTTACTTGAAGGCATTTCCAACCATTTTACCAAGTGGAATAAGCATATGATGGACACGAGGGACTGCCAGGCTTCTTTTACGTTTGGGCCATGTGACCACCACCAAGAGGTCTCCCTTCGAGTTCACCTGATGGAGTATATTACAAAGCAAGGATTCACTATCCGAAATACAAGAATGCACCATATGAGTGAGAGGGCCAATGAGAATACAGTAGAGCATAACTGGACATTTTGCAGATTGGCACGAAAAATAGAAGACTGAAGCTGAATAGATCTTTTTTTGCTGTTGTTTTTTTTCAGTTGAAGACAGCATTAGTATCTCTTTGGAGCTGCATGAAGACCACTGTAAATACAGAGAAGAAAACAAAAATGATATGGGCTGTTCTTACAGCTACTTTTTGTTAATCGCCCTTAACAATGATTCTTTTGAAGATTGTATAGAAATTCCTCATAACTATGCATGTGCCTATTAAAGCTGCTATAGAACTAGAAAGTGACTTTCTCATTAACTTTTGAACAGATATCCTCTGTTTCTTTGAGAATATTAAAAACCACTTTAAGCTA\n>XR_002182326.1 PREDICTED: Bos indicus uncharacterized LOC109569253 (LOC109569253), ncRNA 
\nTTTTAGGACTGAAGCCCCCCCAGCTACCTCTGGCTCCTTGGGTGACCTAAAGATAATAGRCTACTCTGTGCACATGGGTCAGTGCCCCARAAAGGAGCAGCAGCCAGGACTGGTGTGGACCAGGCTGAGACATTTTAACCATACCCCTGCGTCCATTCCCAAAGCGCAAAGGTCAAAAGTACTCTGAGAACGTCCAAGGGGTCACATGCCACTGTCTGGTGGCTGGCATGGCTCTGATTGGTGAGAAAAGAGCACAACAGGGGAAAGGTGGGKGGGGCTCTCTCCTCTTGAAACCACAGGGCGTAGCTGCTGTTGAGGGCTGGCTGGGCTGRTCAAAAGCAGCTCCCACATRRGGACACATTGTCCTCCAGGCATCATCATRGGACATGCTGTGCTCTGGGAGGAGGGACACAGACRGTGACAGATTCTGCGGACAGAAACAACAAGCGTGGGGTKATCTGGGAACTTTTGTATCTGGGAGCCCAAGGGTGGGACCCTGGTTATCTTGCTGTGTAGTGACAAGCARCTAATAATGGAGACCTCAGAGCTGCCCATGTCAGAGGCATGAGGACATGGACTGCTGGTTCTGAGAYGGTTGCCTAGTGATACAGTGAGGAAAGGAYTAAGACCTAGAAGAACAAARTCACAGGATGTTAAGATTGAAGGAATCCACCTCTCAGTCTAGTTCCTTTGACATCATCTAYAACAAGTATCCTAACTCTACACTAACAGTCTCTTGAGGTTAGGCACCCCACTTGTTCATTCGTTATTGTGTCTACAGTGTGGTAGCCAGCCTCTGAGATTGATCCTCATCTCTGRYACTCATAACCTCATGTGGTCCCTCTCATATTAAAGAGGGCTGACCAACGTGATCAACAGGTTATTGYGAAAGTCATGGTACGTAACTCCCAAATGTGGAGCATAAAGGCCACAGCRGCTTCCATCCTGCTTTCTCTTGGACTCTGAGGGGAGGCAGTCACCACGTTGTAATGTTGTGATGAGGGACATCATAGGAAGCCCCATGGAGGGTCCRCATAGGAAGGTACTACCGCCYCTCCTCAACAGCCAGCACCGACTTGCCAGCTGTGTGGGTGAGCCTCCTTGGAAGAGATCCTCCAGCCTTGGTGGAGCCTTCAGATGACCACAGACCCAGRCAACGTCCTGCCTGCAACYTCATGACGCATCCTGAGTCAGAACCACACAGTCAAGCCACTGGCTTGCAGAAATCGCAGACTCCCAACCATTGGACCACCAGGGAAGTCCCTGCTGCTTAGCACCAAACACCTCCACTGATAGCCARCTTACCACCTCGYGAAACAATTGATTCTATCTTYGGACAACTCTGTTCAAGACTACCAAAATTAAATTGGTTCTTCCTAAA\n>XM_001444626.1 Paramecium tetraurelia uncharacterized protein (GSPATT00012774001), partial mRNA 
\nATGTTAAAAAGTAATTCTTATCATCTAAAAACCAATAAGAAACATAAATCATCTCCATTAGCTTCCATAGAGCTACTACAAAAGTTATTGGATTTTAAATAAACGTAAACTTCCATGAATTGTTCCTAAGAAAACAAAACTCTAGTCATGAATGGGAATTTAGCAAAACAAATCTCGAAATCAATTTCAATTGGCAGTCAAAGTTGGAAGGATATAGCACCTCCAATTCATGAATCTGATAATTTGCTTAGAAAAAAGGAGGAAATCCTCAATACATTGAAGAAATCAAAGCATGTCAGACATATAAGTTAGATTTGGTCAATGAGAAATAGAACTGATAGTAATGTCCATACTCCAAGAAAAGAAGGGGTAAACGATTTTATTTAAAATGCAAGAATCTTTTTGAAAGAGAAACTATTAGAAAATAAGTTAGATAAGCTCTGCTATTAGGTTTAATAATTAAAAAATAAATCCGATATTTTGGAAATCTAAAATAAATTGCTTTTCGAGAACCTTAAGCAACATCATAATGACCATAATAACGTGCACGAAAGAAAGGTTTTGATGGGAAAGCTCGATTAAATGATAACGATGCAAAAGAAATAAGAATAAAGCTTAAATTATTTTAAGCAATTATTCCAAGAGAATGACGAAGGAAGGAGAGTGAAAACCTAAACCTCCTATCCCAAGCTGAGACCTGCCCTATACTCTGGCTACGTCGGATTAAAAATGTGA\n>XM_047096667.1 PREDICTED: Lynx rufus CUGBP Elav-like family member 5 (LOC124524401), transcript variant X11, mRNA \nATGAAGGACCTGGACGCCATCAAGCTCTTCGTGGGCCAGATCCCGCGCAACCTGGACGAGAAGGACCTCAAGCCGCTCTTCGAGCAGTTCGGCCGCATCTACGAGCTCACGGTGCTCAAAGACCCCTACACGGGCATGCACAAAGGCTGTGCCTTTCTCACCTACTGTGCCAGGGACTCCGCCATCAAAGCTCAGACTGCCCTGCACGAACAGAAGACCTTGCCCGGGATGGCGCGGCCGATCCAGGTGAAGCCTGCGGACAGTGAAAGCCGCGGAGGGGACCGGAAGCTGTTTGTGGGGATGCTGAACAAGCAGCAGTCGGAAGAGGACGTGCTGCGGCTGTTCCAGCCCTTTGGGGTCATCGACGAATGCACCGTGCTCCGCGGGCCTGACGGCAGCAGCAAAGGCTGTGCCTTTGTGAAGTTCTCCTCCCACACGGAGGCCCAAGCGGCCATCCACGCGCTGCACGGCAGCCAAACCATGCCGGGTGCCTCCTCCAGCCTGGTGGTCAAGTTTGCCGACACGGACAAGGAGCGGACGCTCCGGCGCATGCAGCAGATGGTGGGCCAGCTGGGCATCCTGACGCCATCCCTCACCCTGCCCTTCAGCCCCTACAGTGCCTACGCCCAGGCCCTCATGCAGCAGCAGACAACGGTCCTGTCCACGTCGGGCAGCTACCTGAGCCCTGGCGTGGCCTTCTCACCCTGCCACATCCAGCAGATCGGCGCCGTCAGCCTTAACGGGCTGCCTGCCACACCCATCGCCCCTGCCTCTGGACTGCACTCGCCCCCGCTGCTTGGTTCCACTGCCGTGCCCGGGCTCGTGGCTCCCATCACCAATGGCTTCGCAGGTGTCGTGCCCTTCCCTGGGGGGCACCCTGCCCTAGAGACCGTGTATGCCAATGGCCTCGTGCCCTACCCAGCTCAGAGCCCGACCGTGGCCGAGACCCTCCATCCTGCCTTCTCCGGAGTCCAGCAGTACACAGGTACGGACGGCACCATGTACCCCACCGCGGCCATCACGCCCATCGCGCACAGCGTCCCCCAGCCGCCGCCCCTCCTGCAGCAGCAGCAGCGAGAAGGCTTCGTGAGCTTTGACAACCCGGCCAGCGCGCAGACCGCCATCCAGGCCATGAACGGCTTTC
AGATCGGCATGAAGAGACTCAAAGTGCAGCTGAAGCGGCCCAAAGACCCGGGACACCCCTACTGACCGCGCCCACAGCCGCCCGGAGGCTGCGGGCCTGGCCCAGGTGAGCCGCCAGGCGGCCCCACCCGCCCCCACCCCCGCCCCCCACCCCCCCGTCTTGGCCAAACACCCCCTCGTTCTCCATGCCCTCCCCACCCCCCAGGGGGGATGCCGCTGGAGACCACAAGGAGCCCCCAGGTTGGGATGGTGGGGACAGAGCTAGAGAGTCACCCTCCAATCCCCCCTTTGATCAGGGCTGGGACAGAGGGTGGAACCGGGGTAGAAGGGGGTTGGGGAATCCTTCCAGAAGGTTTTGAAGGATGAATAGAAGTTCACTTGAGAGGCCAGGTTTGGTCTGGGGTGGGGCATGCTGCGAGGGAGGGGCTTCTGTCCTGTCCTGTGACTCTCCCAGCTGGGCCCCTGTCCAAGTTCCTCATTTGGTGTCACCCGCGTTCAGTGAACTGGCGAAAAAGTGGAATGTTTGCCCTGCTCACCAGCATGCCCCCCCCAAAGAGACCCCCCCCCCAACAAATCCCCAAGAGTGTATTTTGCCACCAGAGAGAACAACTTTATCAACAACTAAGCACCTTCTTTGGGGGAATGAACAGTGAGCCTAAGGGGCCAGTAGGGAAACATAACTGACCACAGCCTTGATGAGCCTCATCTGTGAAATGGGTTCACGAAAGTCGCCTCCCCAGAAGCAGCAGGGAGGATCCGCTCGGGGACGCGGTGTTTTCCCAGCTGAGCCCAGGACCCGCCACCTGGAAAGCTCTTGATCATTTGTTTTGATTTTGTTTTTGTTTTGTTTTTAATCATGAGCGCCGTCGTCATCAAAGCGCCGCGCCTGGGGTCTGGCGCGAAGTAGATGCTCAGTTAGGGGCTGCGCATGCTTTTCAGACCCTGCCAAATCAGCACCCGCAGAGTCGAAGGTCACGGGATCAGACAACTAACAGGCGACCCATGCACTTTAACACCCTGGGACAGCAAATCCTTTCTGAGCACCTACTATGCGCTAGGCACTGTTTGGGGACAGCGCTCGGGGACACAGCTGTGAATGACGAGAAACGGGGCGGGGGTTGGGAGAGAACTGCCTTCGTGGCAGGGAGCAGGGGAGACAAGATGAGACAAGAATAAACGCAACTGTTTGCCCCCGGGGGTTGCCAGATGAGGAAACAGCCTCGGTGGCCAGTCCTTTTCCAAGGCGGACCGCTGGCCTCTGAACCTGGAAATGGACTCTCTCTGAGCAGACAGGGGCCCTTGGGTTCCTGGAACCCAGCCTGGCCAGGGCAAGGGGGCGGGCGGGGGGCGATGTCGTCGGCCTGCATGCCCCCCATCACCGCACCCTAACGCCCCTCCCTTCTCCGCCAGGTGAGGGGCCTTCCCACCCCAGGAGGGCCTCCCGCTTCCAACCGACCCCGGACTTTTCCGTAAATTACAACCAAGTTTGGACACCAGCCCCACCCCCTCCCGTCTCCCCTTGCCCCCCCGCCCGCTTCCTAATGTGAAACACTACTGCGGGCCACACGGAGTGGGAAGGGGGCTTCGTGGTCCGCCCCAGCTGGGGAGGGGGGCTCCTGAGTTGGGGGCCGAGGGCTTCACTGCCCCCACCCTTGGTGGCTTCCCCAAATTAAATCACAACTTTTCCTATATATATATATATGCATATATATATAGAGCTATAGACAGTATATATATTTTTTGAGTATAGATCATGGGACCAAACTTTTCCGACTTCCTTCCATCCAAGAGAAGGTGACCCTGGCCCGGTCACTCAGCAGGGACATAAGAAGGGCTGAGGATGACCGGGCAGCCCAGTGTGTCCCCACCTCCCGCTGTCATGTCAGACCAGGGCACGGAGAAGCACTGGGAATCATCAGCCAACGCGATATACCTCCAGGACATTGGGCCCCTGCCACCGACGTTCTCGCAGGCCCTTGGGCTCGGCCAGCTCGAGTGTCC
CTGGTCTTAGCTGCAGCTTCTGGAACCCCTACCCCCTCCCTCACCCCAGGGCCCTGCCTTCCCCGACATAGGCAAAGAAGAGACCCCCCCCCTGGCCTCCCACCCCCACCCCCGTCATAGCCTTACTCATGTGACCAATAGCCCTTAGCTTTCCGTCAGGGGCAGACAGGGTCGGGGGAGCCCCCCTGCCCCTCGCGCCCCCTCCCAAGGGCAGGCAGCCGCCCTCCCTGCCTTCGGATCACCAGCCTGGAGTTCACGATCTCATGACCAAGATCGCCACGCGCGTTGGACAAACCCAACCCGCTCTGGCCCAGCACCCCTTTACCAGAGATACCTCTACAAATAATTTTTTTTTTTGAATTTTGGTCTTTCTGAGAAGATACAAAGAAGAAAAGAGAAAAAAAAATGGGGAAAAAAAATCAGACAACAGTGGATTTTTGTTTCCTAGTTGGGGCGGGGAGGGAGGTCTTGTGGGGCGCCTCTGTATAGCTACTCAAACCGCGAAAACCCATCTTGAAGCACAGAGTCAAGTTCGTTGGACGTCCAGTGGGGCCTCTTGCCAAATGAGGCACCAGAGAACTTCATAAGCTCAAGAAAAAAAAAAAAAATTTGTAAAGAAAAAACAGCCTTCCCTTTTGTTTCTACCAAAATGTGTTGACCCAGAAAAAAAAAAAAAAAAAAAAGAAAAAAAAAACCACATAGCAAAAAAAAAAAAAAAAAAGGAAAAGAAAAAAAAAATCTTATGACCAACTTGTTTCGATATTCCAGAGTTTGATAATTGTTCCGAGACACTCTAGCGTGCCTGTGTCCTGTGCGTCTGCGTGTGCAAGCGTGTGCTCAGGGGCCACGAGGGGGCCTCGTCCGCGTCCCCGGCACCTGCCCAGCCCCGGCCAGGCCTGCTTGGGAGAGCGTGCTGGCGTGCAGTGGCGTTGTGTCCTTCTGGTCCATGTTTACTGGCTGTAAATACCATTTTTATACTCCACATCGAAGACCTACGTGATTTGTACGATGTACTTTATTTCTGCTACGAGTAATTTCATGAAGTTTCAACTTGCAAACCGACTTTTGGAGACAAATCGCCACACACACACACACACACACACACACACACAGAAAAGGAAGACAAGAAAGGAACTTACAGGGAACTTTGGGTGGACTGGGTTTGCATTTCTGGCTGGAGAGGTCCTTGGCACTGTGGTGTGTTTCAGGTGAGAAGCTGCAACCATCATCTTAATGTCCAAACGCCTCTCTTTGGTCTGGAGAAACTGAAAGTTTATTTAATAAAAGTTTTACTTGCTAAA\n>XM_016552280.1 PREDICTED: Sinocyclocheilus rhinocerous general transcription factor IIH subunit 3-like (LOC107740007), mRNA 
\nAAACCCTTCAGTGAATCCACAGAAGAAGAGCTCATTATGAGTCGGAACACAACTTTTAACAATATTGGAGGAAATACTAACTGAAATACCTTTACATAGCGATTTAGAGATAAAAGAATCGCAATAATGGCCTCTGACGACGAAATTAATATTCTGGTCATTGTGTTAGATGTCAACCCTATTTGGTGGGGCCAGCAAGCTCAGCGGGAACCTCAGTTCACTCTTTCAACATGCCTGGATTCTTTGATGGTCATGGCAAATGCCCATTTAGTGATGTCAAGAACCAACAAACTAGCCGTCATTGCAAACCTGTATCAAAAGAGCCACTTTCTATATCCAAGTAAGCAGTGGAAATCAGGGGATGAAATATCTGTAAGTAGCGATGGCAAATATGAACTTCTGTCAGTTACCAATGAACTCTTTGCGGAAGAGATCAGGAATCTCATGGACAGAACAGAGGTCAATGGCAGTCAAACAGACAGCCTGTTGGCCGTATCACTCGCCAAAGCTCTGTGCTATATTCATCGAGTCTCAAAGGATGTGCAAGCTGGACAGGACATGAAATCAAGGATTTTGGTAATAAAAGCTGCTGAGGATTCTACATTACAGTATATGAACTTCATGAATGTGATCTTTGCAGCACAGAAGAAGAATATCCTGATTGATGCCTGTGTGTTGGACGCTGACTCAGGACTGCTGCAGCAGGCTTGTGACATAACTGGAGGCTTGTATCTCAGAATTCCCCAGAAGATCGCACTCACACAGTATTTGTTGTGGGTATTTTTCCCAGACACAGACCAGAGATCCCAGCTGTTATTGCCTCCTCCGACATTCCTGCTTGTGACATAA\n>XM_045728814.1 PREDICTED: Procambarus clarkii trans-1,2-dihydrobenzene-1,2-diol dehydrogenase-like (LOC123746912), mRNA \nAATTTGTATCTGGCAACCCTGAGTCGCCCCGGCCGCTCGAGATTTGACTTGACATTTCAGCAGCAACATGGCAACACGGTGGGGCATAGTAAGTGCCGGTCTGATCTCCAATGACTTTGTAAATGCATTGAAGGCCTTACCCCCAGGGGAGCACCGCCTGGTGGCTGTAGCTGCACGCTCACTTGACAGTGCAAAAAGCTTTGCATCAAGAAATGGAGTGGAAAAGGCATATGGGTCATATGCAGAGCTTGCTCAGGATCCTGATGTAGAGGTGGTGTATATTGGCACAATCCAGACACAGCACCTCGCTGCTGCTTCCCTCATGATCCAGTCTGGGAAACATGTCCTTTGTGAGAAACCCCTTTGTTTAAATGTGAAGGAGACTAAGCAGCTTATTCAACTTGCTGAGGAAAAGAAGGTTTTCCTGATGGAGGCAGTATGGTCAAGGTTCTTCCCTGTGTACCAGGAGATGACAAGAAGAATCAAGTCAGGAGAGATTGGAGACGTGGTGCAAGTTATCTGTTCCTTTGGCAAATCAGTGGAGAATGTAGAGAGGCTGCTGAAGAAAGAAACTGGCGGAGGAGTCACCCTGGAAATAGGAATTTACCCAGTGCAGTTTACCACACTAGTAATGGGAGGAAAGAAGCCACAGAAAGTGCTTGCTGGTGGACACCTGAATGCCAATGGTGTAGAAGAATCAACAAGTGTCTCGCTTGTCTACTCTGGACGACGCTTGGCTTCTCTGAGTGCCACCATCAGGGCATGTTTGCCTTCAGAGGCCTTTGTTATTGGCACTAAGGGCACTATCAAGGTGAACTATCCCATGTGGTGTCCTGAAAGCCTGGAGTCACCATCAGGAAAATTTGAGTCACCACTTCCCAAAACAGGTCACACTTTCAACTTTGATAATAGCCAAGGATTAATGTATGAGGCAATTGAAGTGAGACGCTGTCTTAAAGAAGGTTTGCTGGAGAGTCCAGGGATGAGCCACAAAGAGAGTCTCACTATTGCTGAAGTCATGGAG
CAAATAAGACGACAGGTTGGAGTAGAATTTGACTAGAACATCAAGGCAATCTAACAGTGTTAAGCTTTCATATAAAGTCGTAAACTAATTGCTGTTATTGAAGACTGGAGCCCAACTATATACTGTATAGTGATAGCAATAAGATAATCAGTGGTATAGTATTAGAGTTCTTTTAGAATATTGTATTAATCTTTACTTTCATGACATCAGTAGTTTGCAGTATGGAACTGTACTTGTGTTTTCTAACATTTATACTCAATGATACAATCAAAGTTAGAAGATTCTTAATTCATTAATTAAGTTTTATTACCATCTCGGTTATTACAGAACAAAATTGTAATTTTGTCGTGGAAGTCAAAATCCTCATTAGTATGTAATTCATGTAATTATGGTTATTCACTTGTTTATGGAATACACGAAGTTTCAATTTGTTATGTAGCTTAATTCTGTTAATTTGTATTTCAACAAGTCCTTCATTATATCTTGAGATATATCTTGAGATGATTTCGGGGCTTTAGTGTCCCCGCGGCCCGGTCCTTGACCAGGCCTCCAGTAAGTCCAGTATAGCAGCTTTATAGTAAGAACTAACTGGTAGCATATTCAACTGTACCATGGAAATATGTACAGGAATTTGAGAAATGCAGACCATAATAAAATTATAAAATAATTGTAAGTTAATGGTCTGAAATGCTCAATTACTATGCAGTACATTTTTTTTCTCAACAATAGTAATGTTTTTATATTAAAAGGATTTTCTATTTCAGAATTCAGTTTTCTTAGTAGTACAAAAGATGGTGATATTGTTGACAGCAGCTTAAATTTTACTTGGCTTTACCTGTTGCAACATTTGTTTAAATTAATGGTTGTTAGAAAACTTCAGTTTGGTTAATTTTTCTATAAGTGAATGCCTGTTTTGCTCATTTAAAATTATTTAATAAAAATCAAATGTTCACACAATAACATAAATAGCCTTAGAAAATTTTAAGTAAATAACTTAACAAATGCTAATCTGCAGTAGCAACTAGACTGAACCAGAAATGAGTTACTTTACAAACTGCTCATAGAGCACATAATTCTTCTAGAAAATTTAATGAAACATTTTAGCTAATTAATAAGGCATGTGAAGTATCAAGAAAATTGTACTTTAACAAATATTAATGCAAAATCACTAGAACTCCTAGCCTGACCCTATGACTAAATGTATGTCAAATTACTTTCTTACAGTACAGTACTCTTACTTTGTCCATCATGCATAAATATATATAACTAGCACAATAA\n>XM_028373142.1 PREDICTED: Glycine soja putative GPI-anchor transamidase (LOC114409625), transcript variant X2, mRNA 
\nAAAAATACTCGAAGAAAGAGTTGGTTGTGAAAAACTAGAACTAGAAGAACTGCCACCAGAAGACGCCGATCTCGTTCGCCCGAAGAACTACCTAATTTATTTACACTCCCGCTGACGCCGACACCAAACTCATTTAATTCAGTGTTTGATTTGACCTACATGATCCTTAAACTACCCGAATCATCAGCTGTTTTGCGATTGCGGGATTGATTTGTGGTTGCAGTGAATGTGATGGAACACTTATTTGGTACCGGAAGAAAAGAAGGACAAGTTAGCATACTCCTCATCTGCGTTTGAGTCTACAATGCACACTAATAATTGGGCTGTTTTGGTCTGCACGTCTCGCTTCTGGTTTAATTATCGGCATATGGCCAATACCCTGTCATTGTATAGGACAGTTAAACGGCTAGGAATACCGGATGAGAGGATTATACTCATGCTAGCAGATGACATGGCATGTAATGCTAGAAACAAGTACCCTGCCCAAGTTTTTAATAATGAAAACCATATACTTAATCTGTATGGGGATAATGTTGAGGTAGACTATCGTGGCTATGAAGTGACAGTGGAAAACTTTTTACGGGTACTTACTGGACGTCATGAGACATCTGTTCCAAGGTCCAAACGACTTCTTAGTGATGAGGGAAGTCATATTCTTCTGTATATGACAGGGCATGGAGGTGATGAGTTTTTGAAGTTTCAGGATTCGGAAGAGCTTCAAAGTCACGATTTAGCTGATGCTGTGAAGCAAATGAAAGAGAAGCGCAGGTTTAAGGAGCTTCTGATAATGGTGGACACCTGCCAAGCCTCTACTCTTTTTTCCCAGCTTCATTCACCAGGTGTTTTGGCAATTGGAAGTAGTATGAAAGGAGAAAATTCATATTCACATCATTTGGATTCAGATGTTGGCGTTTCAGTTGTTGATCGTTTTACATTTTACACTCTTGCTTTCTTTGAGAGGCTGAATATGTATGACAATGCTTCGTTGAGCAGCCTTTTCAATTCATATAATCCAAATTTGTTGATGTCGACTGCATATTACAGAATGGATATATACCAACGCTATTTAAAGGAGGTACCTGTGACAAACTTCTTTGGTTCTGTAATGAAAACGATACATACTGATTCAGCCTACAGATCCCGGTCAAATAAAAAAATTGAGGAAGCTAAAAGCAATATGTCTTTGGATGAATCAATCTCTGACAGTGACTCGGATGACGAGGATCAATTTAATAATTTAACTGCTGAGAAATATCTCTGGTATAGTGTTGGACCACTATGGAGTGCTATTCTCAGCAATGCCAATACTTCTGAAAGCATCGATACTTTGGTGTGCTATGGACTGCTTTTAATGCTTCCTTTGCTGATATTTTCCACATGGCTGTCAAAGTAAAGATTGGGGAAATATTCCGTAAGTTTGTTAGCAGAGCAGACACATTTCTTTGATGCTGCTAGATGGCACCGTTGCTTGAAATGCAATTTCACCCGAAAAAGCAGATTATTTGGCTGCATAATATGTGGGACGCAAACTACTGGTAGAGCAGCTTCATAGTTGTTGCCTATCAGCTGTATTCTGTTAGCTATTGCTTTTGCCTTGGTGCAGTTTATTCTGGTAGCCATTGGTGATGTTGGCTTGCTGCTGCTGTCATGTTTCGCCTTGTATTTTGATGATGATTATGATTATGATTGCAAACTGTAAAATTTTTGTAAAACCTCGCTCTATTTTTAGATATTATGTTGATGTCCAACATTAGAACACTGCTCTTTTAAGAACTCGGAAATGAAAATGCTTGATCATTTTATCTACTTGTA\n>JF971034.1 Uncultured archaeon clone E09_A-C5_0239GSNP001F_P1 16S ribosomal RNA gene, partial sequence 
\nAGGGCCCCCCCTGGGCAAAGGGGTAACCCCAGGGGCCGCCGGAAAAAGGCGGCTTTTCCTTGGTCTAAAACCCCTAGGGAATAAGAGGGGGGCAAGACTGGTGTCAGCCGCCCCGGTAACACCAGCCCCTCGAGTGGTGGGGATGATTATTTGGCCTAAAGCGTCCGTAGCCGGGCCGGGTAAGTCTCCCGTTAAATCCAGCGTCTCAAGCGTTGACTGCGGGAGATACTGTCTGGCTAGAGAGTGGGGAGAGGTGTACGGTATTCTGGGGGTAGGGGCGAAATCACACTAGAACACGTCTGACGGTCAGGGACGAAAGCTGGGGTAGCGAACCGGATTAGATACCCGGGTAGTCCCAGCCGTAAACGATGCACGCTAGGTGTTGGGGCGGGGCTCCGAGCCCCGATTAGTGTCGGAGAGAAGTTGTTAAGCAAGCTGCCTGGGAAGTACGATCGCAAGATTGAAACTTAAAGGAATTGGCGGGGGGAGCACAGCAACGGGTGGAGCGTGCGGTTTAATT\n>XM_046691669.1 PREDICTED: Haliotis rubra tolloid-like protein 1 (LOC124257572), mRNA \nAAAACCATACTCACTTACCCTGACCATACCGGTATATGCGACCAGTGAACTAACGCAGTAAGGACAGCCACACGCTTGACATTGTGCACCTGGCAACTGGCTCAATTTACCGAGTCATTCATATGCCTCCGCACCTGCACCGCTTCAGTGAGCACAAGTGTGGTTCACAACATGCAATAGTGTTTCGTTACCTGGGACATGCTGTTACTCTTTACTGGACATTTGACATGGAAACAGCTACAAGCGTGTTCAAAATGTCCAAACGGCGACCACAACAGCTGGCTATTTTGATAACAGTAACGTCGTTGTGGACGCGGATACTAGGTCAACCTTGGGCAGATGATGAATGCAACAACGTCATCGTGCCAGACCTATCGAGACAAGAAGTGAGGTCAGAAGGCTACCCGTCCGGATATGAACTGAATCAAGAGTGCAGATGGGAGTTTGATGCAACGAAGTGGTTTAACCAGAACAAAACACTTAGTGTGCAATTTGTCGTGGACATTGAAAAGACTACAGATTGTTCAAGAGAATCTGTTTCAGTGTATGCTTTCACATCGTCCAGCAATACACAGCTAGCGGTTATGTGTGGTCAGACTGTAAGACAGTATACGTTCTTCATCAAGTCCCTCCTGGTTGTACTGAAGACTGGATCTAGTCCTACACAGGGCCGGCGTGGTCTTAAGATGACACACCAGATGATTGATGACGAATCCTGCCGTGAGTGGTTGTATTCAGATACACACAAGACAGGTGCCATTCATTCACCCAGATATCCTGATCCGTATCCGAGCTTTCAGAGATGCACGTACCACATACGGAGTCGGACTCCCAACCGTAACGCCGAACTTAAAGTCATCCTTTCCGAGCTGAGCAGTGACTGTCACAAGGAATATGTCCTGGTCTATGACGGGAATTCAGAAAAAGGGTCCTTACTTGGAAAATGGTGCGGTTCAGAACGACCGACGTTCAACAGCCTGAGACAACAACTCTATGTAGTGTTTGTGAGCCATGACAACATCAGCGGACGAAGGGGGTTCAGGGCAGATTTCAAAGACGTCATATGTGGAGGCGCGGCATCAGCTGGACAGTACTATGGAAACGACATCGTATTTCCTGGGCAAGAGAGAGCATTTCACCATTACATCACGTGTCGCTGGTACATCAGACCTTCCCGCGGATTTACAGGCTTGATGGTGGAGTTCAGAAACCTTCAGGTCGACTGTGACAAAAGCAGGATTTCAGTGTATGACGGGCCAAGCGCTACAGACTACACAAGGACCTGGAAGATCTGCGGTAAAATGGATTATTCCTACCTGATTTCCGGGGCGGGCGTGTTCATCGAGTTCAGTAGCCAAGGCAACACAGCAGAGCCGGTCTCCTTCAAA
ATCAAATACAGGGGGAGCCGCGTTACAGGTTGCAGACTGAAAGGAAAGGAGGGCGACAAGGCTTACCTTGTGGCTTACTCTTACGAACAGATACTCCTGTCCCCGGGATATCCCGATCTATATCCAGATCGGATACAGTGTATGTGGCAAGTGAAGACTGGCCTTCTCGTGGACATTGTCATGATTGATGTTGTACGGCTGAATCTCCACTCACAGCCTGCATGTGACGACAGCATCAGTTTATATCATGGTCCAATATCTGATATCAGCAAGACACCGGCCATGGTGTTGTGTGGCACCACGACCGATGTTTTCTACAGCACTGGTCGGTACGCTACCATTGTGTTTTCAACCAATGACGTTGGAGTAGGAAGCGGCTTCACCATCAGTTACAAGTCTGTACCAAAGAAGAGCGCCGATACTGGAACCGCAGCTTCAGTTTCATCCAGTGCGTCAACGATAGTGATTGTTTGTTGTGTAATCTTCATCATCATCACCATAGTGGTTATCGTAACTTGTTTCGTTTGGAGAAAAAGACGCAGTGATCGCAATCGACAGCCACCGATTGTCCAAACATCTCCGGATCCAAACCCCCAGACTAGCGGCCAGGCAACCCCATTTTTGCCGCCCAATACCACCGGTACCACCAATCCTACCAATACCCCCGCTACCACCAACACCAGTGCGTCGCCCCCTGAATACCAGGATGTAAACTTCCTGCCCGTCACAGAACCATCAGCGCCAGAGATGCCGCCTCCCAGTTATGAAGATGCTGTGTCGAAGGGAATGATAGACACGGAAACTAGGTTTTGAGGCGTTTTGACAAGGTGTCTTCAAATTATAAACAGACGCTTTGACATGCATCACAAGGCAGTGGTCAGAATGTGAGTGAGTGAGTTGTTTTTAAGCCGCTTTGAACAGTACTCGATCGTAGAGTGTCTGCATAGCGTGGACGTAAGGTCATCAGAAAGTAGTTTCCTGATATCTAGTGTAGCTGTCTCATTGTCAGAAATATTATCCACGCATTTAGTACATGGTATTTGTCAGGAAGATACTCTAGGACATGGTATTGGTCAGAAAGAGACACTGGAACATGGTATTGATCAGGAAGATACTCTAGGACAAGGTATTGGTCAGAAAGAGACACTGAAACATGGTATTGATCAGGAAGAGACACTAGGACATGGTATTGGTCAGAACGAGACCAGTGGTGATTCCAGGTTAGATGAAGTCACAAGCAGCCTTTGCTGGTCGTAAGGGGTGACTAAATGAATCAGATGGTCAGACTTGGATGACGTCACGTAAACGTCGCTCATAATGTCAATCACTGAAATGTCTGGCGCAGTTATTTGAAGACCCCGTTACAGAGCTAGAAAGTCGCTACGTTATAACAAACAACAAAGACGCCCATCTACAAAAAGTTGATTCCGAAAAGACAAATCTGCAGAAGCCTACGATGACTTGTGGAGTATTTGTGTGGAGTAATGATGCTCAGTTTAAAAAACCTCTCAGTGGTATTTCCCAAAAGGAATCTGTTAACACCCAGGACTATCTCAGACACAAGTGGAGGCGTTGCACTCATATATTGTAGGAGTGGGTTCTTTCTCATCTGATTGGATGAATGGGTAGGGCAGATGGCCGAATCGTTTTAACGGGTGCGGCCAGGTTTCCCCGCTCATAAAACTGCTCCCCGGAAGACAATTCCCCACTGGTTGCAGAAATGTCAAGAACGTCTGGGGGTGGGGCGGAGAACATGACCTGGGGAGAATTTTCTTAGTAGGGGCAGTTGATCTGACGCCATATTAACACATCTTAGGTGTGGCGTGCAAAAGCTTTAGAAACTAAGCGGCCGGAGTGAGGGTTCAGATGCTACGAGCTTGGTGAAGCATCTCAGCATCTTTGATTATAGGTTCTTGAATATGTAACAATATGTGAGCCTGCTTTTAGCATTACCAGCATCTCCACCGAAACATCCCACTGAAGGTGAAATTGAACAGAAG
TTGAACTTTATACTTGTATTCCGACTCTGTGTTCTGTTATGAATTCCTTTAAAAGAACATTCCAGTTTTAATGACATCATATATTGACGGGTTTCAGAGGGCAAAGGAAACGATTTCTGCTCAGGAACACTCAGCCCTGAAAATACCTTTGTATTTTGAATACAACAGAAATAGGGGGTCAACCGACAGTGTTGGATCCAAGTGGATTAAATATGTATTTGAATATATGCAAGTGCATTATTGTTTATATTATATATGTTTTATATAACATTTTGTATGATTTTATTGCGAGATACACGAGTCATAACACCATCGTGAGCGTGTTTGTTTTATTTGTTTATACACGTTTTATACATGATGACAGAACATTACACAGTAACATCTCACTTGTAGGACATGTTACTGAAGTAC\n>XM_048419471.1 PREDICTED: Myodes glareolus docking protein 6 (Dok6), mRNA \nGAGGGGGGCACAGCTGGGGGCGGCGCTAGCCGCGGTGCTCCCCTCGTGGTCGGGGGCGAAGGTGAAGACCGCTCTCAAGGTGCTGGTGCTGCTGAGCAGATTCGGGCCCGGTTCCCTGGTCCGGGTGCTTGGCGGCCCTGCTATCGACTCAGCGTCCGCGCCGGCAGGAGCCTGGGGAAGAACTGGCGGTGGCGCGACTGCCGGCGACGGCCGGCTGGATGCGAGACCTGCGTGGACCGGGCGGTGGACAGCGGTTGACGACTCCAAGAAGCGGATCACCTAGCAGAGGAGCCCGACCGCGCTGGCCATGGCCTCCAACTTTAACGACATAGTCAAGCAGGGCTACGTGAAAATCCGCAGCAGGAAGCTAGGGATTTTCAGACGATGTTGGTTGGTTTTTAAGAAGGCTTCTAGCAAGGGACCCAGAAGGCTAGAAAAATTTCCAGATGAAAAGGCAGCTTATTTCAGAAACTTTCACAAGGTAACTGAACTGCACAACATCAAAAATATTACCAGACTGCCTCGAGAGACCAAGAAGCATGCCGTGGCCATTATCTTTCATGACGAAACGTCAAAGACATTTGCTTGTGAGTCAGAGCTGGAGGCTGAGGAGTGGTGCAAACACCTTTGCATGGAATGCCTGGGGACAAGGCTGAATGACATCAGCCTTGGGGAGCCTGACCTACTGGCAGCTGGGGTGCAGCGGGAACAGAATGAACGATTCAATGTTTATCTTATGCCTACACCCAACCTGGATATTTATGGTGAATGCACAATGCAGATCACTCATGAGAATATCTATCTCTGGGATATCCACAATGCCAAGGTCAAGCTGGTGATGTGGCCTCTTAGCTCACTAAGAAGATATGGTCGGGATTCAACGTGGTTCACCTTTGAGTCAGGAAGAATGTGTGACACGGGAGAAGGACTATTCACTTTTCAAACAAGGGAAGGAGAAATGATCTATCAGAAGGTCCACTCTGCAACACTGGCCATAGCTGAGCAACATGAAAGATTAATGCTAGAAATGGAGCAGAAGGCCCGGCTTCAGACAAGCTTGACTGAACCAATGACATTATCGAAATCCATCTCTCTTCCTCGTAGTGCATACTGGCATCACATTACGCGTCAGAACAGCGTTGGAGAAATCTACAGCTTGCAAGGTCATGGGTTTGGCTCATCAAAGATGTCCAGGGCACAGACATTTCCAAGTTATGCTGCAGAACAGAGTGAAGAGGCTCAGCCACCATTGTCTCGGTCCAGCAGTTATGGATTCAGCTATAGCTCCAGCCTCATTCAGTGACATACAGAGGCCACCACTGACCAGCAAAACAGTCTGCCCTGGACCTGCCATGGGGTCATTTCGCCCTGTGTATCCTGGAAGATCAATTGCTGTACAAATTAACATTGGTAGGGCGTAGTCCCAACTGAAAGGTTAAAAACTGAAGTTCTGCTTCCTTGATTCAGTGGTTAAGTCCTTTATTTATTGAATTTCTATGGGGGAAATCTA
TGTTTTACAAAAAAATCCAATAATATGAACACTCATTTCAATACAACAAATTCTTTGTGTCTGACAGTAGCAGAAGCCTTGGCACTGGGAAATTTGCCCACTCTAGTTTGTGCCTGGTTGGGGTCACCAAAATTTGTCTTTCAGACTGTTTGCTCCTGTTTCGACACAGGGCCTGTCTTTAAACATAATAATGACCCACTCTAAGCTCTGTGGCTTTTTCAATTTTGACAGAAACAAATCATGTAATCTTTACTCATGGTATCATAACTCTCCATGTAAAGAAGTCCAGTGACAATTAAGGGGGTGTTAAATTAGAATATTCTATTCAGAAGGACCCTGTAGCTCGAGTGTGTGTGGATGTGGGGGGTTGTATGTCTGTGTCTCTATGTATGTAGGAAATTACTATAACCATCTACAGATTAGGGTATATCAAATGTGCTAAATGTGACAGGATATGCTCACTTAAATTATTTAAAACTAATTTGTCACATTAAAATTAAAACTATGTTGAATAACTATTTTTAAATTAGTGCTGTTAGAATATGAAAAAGGTCCCCTGTTAGAAAATGAAAAAGGTTCCCTACTAACAACAGTATCTCTGAAGCCCACTCTGGTCTTATGAGGATTATGATCAGAAACACAAGAAGGAAGCACTTTGGAAACAAGATTACCATCCCAGCTGCCCTGCATGTCCATTACACTGTCTGTCTGGTTGATGTTGCCTTGTTGTTGACTGTTTCTTCCATCTGAGCTACTTGAGAAATTGGTGTAATCTCCAACTCTAAAATGTTTGAGAAAGACACAAAGCTACACTGAAAATGAACTCAGCTGTTTGTAGTTAAAAGAAGAACAAATGATACATGAAAGTAGATGTTTTAAGTTTCACAGAGGAATTTTTGCATGGGTCGTTGGGGTCTTGGCATCTGCTATGGAAACAGAACTTACATGACTTGAATTTTTTTTGCCCTGAACTTGATTGGTTGGGATGAAAAGAGAAAATGTTTGGCTTGCAAATTTTTTTCAGTTCTACCACCTGACAATGTCCAAGTTTAAAGGGAAATGGAAAATTCCTCTCTAAAAGAGAAAGTTTGGCTTGTTCAGGTCAACATAGACATATTTTGAGCATAATTTAGTGAGTGAAAATATAAATTACTCTGTGAGACTCACCTGGTGTCACTTGCCTAAACCAGATATCAATTAAGGAATCCAGATCATATTCCTGAACACAAGGTCAAGGTCAAGCAAGAGGAAAACCTGTTTTTTTCTTTGATAGCAAAATGTTCTACCAAACTTAGTCTACTGAAAGGGTACCTTTTTGCTGATCCTTGTTAAGATTTCATTCATCCTGAGTCAGGCAGTAGTGGTTCATGCCTTTAATCCCTGTACTTGGGAGGCAAAGGCAGGAGAATACAAGAGCTAA\n>XM_045791904.1 PREDICTED: Ursus americanus glycerol kinase 5 (GK5), transcript variant X2, mRNA 
\nCCGGATCTCGCGGAGGGGCGGGCCGGGGGCGGCGGCCCCGCGGGGCGCGCTCGGCTCCTGAGGTGCGGGCCTTTATAGACGCGCCCTCTCGGCAGGCGGTTGTTGCGGAGAGGCTTGCGGGCTCGGAATGTCGGGGGTGCGCGCGGTCCAGGAGCAGAGCACGGCGGGCGCGTCTCCCGCGGGCTTCGTGTTGGGGCTGGACGTGGGCAGCTCAGTGATCCGCTGCCACGTCTATGACCACGCGACGCGGATCTGCGGCTCCAGCGCGCAGAAGCTGGAAAGTCTTTATCCTCAAGCTGGCCGGGTTGAAATTGATCCCGATGTTCTCTGGCTTCAGTTTGTGACTGTAATAAAAGAATCTGTTAAAGCTGCAGGAATAGAGATGAATCAAGTTGTTGGTCTTGGCATTTCAACACAGAGAGCAACTTTTATTACGTGGAACAAGAAAACAGGAAATCATTTTCACAACTTCATTAGTTGGCAAGACCTAAGAGCTGTTGAACTTGTAAAATCTTGGAATAATTCTCTCACAATGAAGGTGCAAAAGGCAGTTGAAGAAGATAATTGCTGCTTTGGGACTATTGACACCTGGTTGTTACATAAGCTCACAAAAGGTTCTGAATTTGCCACGGATTTTTCAAATGCTAGTACAACTGGACTATTTGACCCTTTTAAGATGCGTTGGAGCAGGCTCCTTACTTCCCTGCTTTCGATACCACTGTCTATCCTGCCTCCTGTGAGGGATACGAGCCACAATTTTGGATCAGCGGATGAAGAGATATTTGGGGTGCCTATACCAATAGTGGCCTTGGTCGCTGATCAGCAATCAGCCATGTTTGGAGAATGCTGCTTCCACACAGGAGATGTGAAACTAACCATGGGAACTGGGACATTTTTGGATATAAATACTGGAAATGATCTTCAACACACCGTTAGAGGCTTTTATCCACTAATTGGGTGGAAGATTGGCCAAGAAGTTGTATGCTTAGCTGAAAGCAATGCAGGAGACACTGGTACTATCATAAGATGGGCTCAAGAATTAGATCTTTTCACAGATGCTGCTGAGACTGAAAAAATGGCCAAAAGTTTAGAAGATTCTGAAGGAGTCTGTTTTGTTCCATCTTTTAGTGGATTGCAGGCTCCATTAAATGACCCCTGTGCATGTGCCTCTTTTATGGGTTTGAAGCCTTCCACCAATAAATACCATCTCGTACGAGCAATATTGGAGTCAATAGCTTTCAGAAACAAACAGTTATATGAGTTGATGCAGAAAGAGATCCATATCCCTGTGACAAAAGTCCGGGCAGATGGAGGAGTTTGTAGGAACAATTTTGTTATGCAGATGACTTCAGACCTGATTAATGCAAATATAGAGAGACCTGTCAACATAGACGTGTCCTGCCTGGGTGCTGCTTCTCTAGCTGGCCTTGCTGTTGGGTTTTGGACTGATAAGGAGGAACTAAAGAAACTGAGGCAAAGTGAAGTGGTTTTCAAGCCACAGAAGAAATGGCAAGAATATGAAATGAGTATGGAAAACTGGGTCAAAGCAGTGAAACGCTCCATGAATTGGTATAACAAGATGTAGCGCTAACTGGAACGACTGCAACCATATACGGCTGGCTGATACGACATGCAGATGAGACACAGCTCAGGGATAAAAACCCAATACGACGATGACTGAGAGCATTTCAGATGAGCTTTGCAACCTGAGAGAAAAAACATTGCTTTTTTGAATACAAAACAAAATCCCTCATTTTTAAATCTAAACCTTGGTAAGATTGTAAGGCAACAGTACCTCAAAACTTTATATCTTCTGTTTTGTAGCAAATTCCAAAGGACGTTAGCCATTTCTAGCCATATTTTGACAGCTGTGGGTCCTCCCCGTTTTTATACTGGGTCAGCGATACATACAAACATAATGGTTTACTATCTGAGTTAGTAGTTCTGGGTCAAGCACCATTCATGTTTTGTTCCAAAATTAAGTGACAAGTGTTCCTT
TAATTATTTAAGATTAAGTAGGCTATATGAAGTTCACATAGCTATAAAGAAAGAATAACTGAGGAAATGTGGAGTTTTGCAACATTAATATTTTATATTTAAAACCATAATTGTTCAATACTCTATCCAAATATGAGCTCGATACGCCCCTCTCGGATACGCTTATTGTTAGTCAATTCTTTCTTTTATTGGGCTTAAAGACACTCACTGCCTTAATTTTTCCTTGGTTAACCAAAATCTGAGCATTCTTTTTGTATTGAAAAAATAACTTTAGTGAATGAAACTACAAAGGATAATGATTCATAAAGAACAAGAAAATATTTTCTTTCTCAAATGGGATTTCTTTCGAAAACTTCTGGCTAAAGTGTAACATCCCATTTTTTACAAAATGCAGGTAGTGGATAGAAATCTTGCTTTTCTCTTCCCGTTCTTCATCTTTGTTGTTGAGATGCTTGCATAAATGTCTTTTGTTTTAAATTAAGTGCCTAACTGACAACTTAATTTGAAGACAGTGCCCTAATTCATTGGTGACGTGGGAATTGCCTTCATTGGGGTACTTTACTTCCGCAGGTATCTTTTACTTCAGTTCAATCTACTCATCTCTGTGAGACAGGAGCAGTAGGTAGCTGCCAGAGGTAATGGGGGCGTGTTCATGCAAACGATTGCCTTGCAGTTACGGGGCGGAGCTCCGCAGAGAGGGACAGGGACAGTTCCACATTTTCAAACTTTTGTGATAGAAACAAACGTAAAGGAATCAGAGTTGTGAGTAGCTCTGGGCTGGTGTAAAACTGTCCTATGGCACCAGACTGCCCTCCAACTTGTTCTCATGTAATTTGCCCCTCCCTCCACTTGGGCTAGGTTCCATTTCGATTTGTATTAATAATGAATTTATTTCCCTCTTGGTCAGGCTTTGTGACATAAAGATCTACTGTTATAGAGCTAGTTGTTAAATACTAATGTACTTTAAAAAGTGACTGTTAGAGGGATTTTTGTTGTTGCCATCATATATGTCCATTTCAGGGACAGATAGCTAGAACTAGGGGTCACACTGCATTTCTGCAAATTCCATTTCAGTGAAGTTTGTCTTCTTGAAGTATTAACATTTTTGATAGAATCATAATAGCCAATATATAGTATCATTAACTCCATTAATTAAGATTTGGAATTTTTTTTGTGAAGTGGAGGTATTTTGTTTACGGTAACAAGTCAGATTACATTATGTAGATAATATTCTTCTTTTTAATTCTTTTCATTTTTCTTACGTCCCTTTTACAAAGCTTAGTGACCAATTGTAGGCCCTTTTATCAAAATCAGATCACGTGCAAGCTGCTCTGTTGTTTTACTGTTTCTTATAGATTCTGCTTCTCAGAGGGTATGATTTCATAGGAAAGAATTGTCTCTTTGTGTTAGGATATACTGAATTGTAATATTATTAATACTTAAAATTTGTTGGCTCATTTCTTTTTCACATTCTTCTTTCTCATCATCAAACACAAAATAAAGGATAAATACCTTTTAGATAATGTGAAAAAGTAACTGTGAACATGTTTTCATCGGAATTGAGCATCTCCTCAAAAATCAGTGGCTAGTTTTTTCTTCTGTTAGTCTAGAATTAATCTTTTATTTTTACTACTTCTGGCTTTTTTAGTGACACAGTTTAGTAAATCTTTTGCCAGATTTGACCTAAATCAGAAACGTGACCACATTTGCTTTTGTGGTTGTAGAAACAGTTGATATTCAAAATCAGTTGAGCAAAAAAATTGTGCTACGATTTCTCAGCATGTTCTATTTTCCCATTATGGATCAACCAGATATTTTTAGCAGGTCTGTAGCTATCTTATCAAGGAGGAGAATGTTTCTGTACAATCCTTCTTGAAGTGGTACTAATTTCTTTCATACCTAGACTTACCGATTTTAAATTTTTTTATATCCTACCATAATACGGTTTCTCAGTCTCAGCATTATTGACATTTGGGACAGGTAGTTCTTTGTTTTGGGAC
GTTGTGCTATGCAAGATAGGGTATTTGGCAGCTCAACCTGCTAGCTACCAGCAGCATCCCCTAGTTGTTGTGGTCAAAAATGTCTCGTAACACTGCCAAATGGCCCCCAGGAGGCAGTATCACCTCCAGTTGAGAACCACTAATTTGGACTATTAGAAGAAAGTTAAAGGCTCAGCAAATGTAGTGTGTCTATCATGCTCCTTTTCTCTCTGCCTCATTTTACCTTAGGAAATCGTTGTTAGCAAAAAGAGGTGGTTGTATCTTAAAACAAATAGGGTTTCTACTTTCCCAGTTAATGAGGGAAAAAAAAAATCTGATTTTACCCACTCAC\n>XM_020802708.1 PREDICTED: Pogona vitticeps SH2B adaptor protein 3 (SH2B3), transcript variant X4, mRNA \nAAGCTGTTCTATTTTAGAGCGCGCGCAGGGCGGCCTTTGGCGTACGACGTCAAAACCATCCGGTCCCCCTGTTTTGGCAGGAAATCGCAAGGCGCTGCCGGTGGGCATGTCGTTCTGTCTGGAGGTGGGCTTCCCTCATGGACTGGCCTCCCTTTTTTGGCCTGCGTGCAGTCAGTGGCCGGTCTAGCTTCTGCAAAGGACATCTGAGTGTTTCAAGTTCCTACCATGAATGGACACGCTGGGCCACCCATAGATCCTGCGCACGCCGGGGGCTGGAGCGAGTTCTGCGAACAGCATGCCGTCACCACCGCTCGAGAGCTGGCCCGGAAGTACCTCCTGTTTGTCAGCGAAAACCCCGAGCACGAAATCTTGGCGGCCGACAACTTCTCCCTCCAGTTTGCTGACCTCTTCCAGCAGTATTTCCGCAATGAGGTGAAGGACCATTCCGCCATGAACCAGTTCCGCGTTCTGCCCTTTAGCAAGGTGCGGGACTACAGGGAGACTGGCCGAACTCATGCCGGCGCCTCCCCCACTGGGACGTTAGGGGCCAAGAGTGAAATGGAACTGGGTGGACCAGTTGACCGGGGACCACCTGAGGCCCGTCCCGCCGGCCTCCCCAAATCGTGGAGTTCTGAGGAACTTACTGGAACGCCTCCTTCCTTGGCCGTCAGGAGACACTTTTCCCTCACCCGCCTGAGGAGGAGTTGGCGTAACTTTTTCCGCAGGAGGTCCTCAGAGCCGCCCCCTCCCGATGGGGAAATGTCGGATTCTGTGCTGAAGTCTAACCTGGCGCGGAAGATCTTCCCGTGGGCCCTTTCGCGAGACCCACCGCCTCAGGTCCGGAAAGAAGGCGGTCTCAAATACTGGATGGTGACCGAGGCCAACGTGGACAACGGGACGCGCTGGCAGAGGTGCCGGCTCGTTTTACGGAAAGAAGGGCCTTCAGAGAGTGAAAATTACGTCCTGGCGCTGTTTGACCCCCCCAAGAGCTCAAAGCCCAGACTCCAAGCCGCCTGTTCATCAATCCAAGAAATCAGACGGTGCACCAGCCTGGAGATGCCAGACAACGCGCACACCTTTGTGCTGAAGGTAAATGCCTCCACCGACATTATATTCGAGGCTGGGGATGACCAGCAGCTGTCTTCCTGGATGTCTGAAATTAAAGAATGCCTCCCTCAAGGGTCCACAGGAGCCGACCCGGACCTGGCCCCCGACTCCCTCTCGGAGGTCACGACGGCCAGCCCCACCACCACCACCAGCAGCAGCAGCGTGGATTCCCGGAACCAAGGCGCGACGCCCCCGAACGCCCCCGACCAGCCCTGCCAAAAGACGGACCGCTACCTTTCCGCTTTCCCCTGGTTCCACGGACCCATTTCTCGCTTCAAGGCCGCCCAGCTGGTCCAGTTCCAGGGCCCCGAAGGGCACGGAGTCTTCCTCATCCGACAGAGCGAGACCCGGAGGGGAGAATATGTCCTCACGTTCAATTTCCAAGGAGTAGCTAAGCACCTGCGGCTTTCGCTGACCGAGAGGGGCCAGTGTCGGATCCAGCATTTGCACTTCT
CCTCGATCCTGGATATGCTACACCATTTCCAGCGCTGCCCGATTCCCCTGGAGTGTGGCGCTGCCTGCAACGTGCAGCTGTCCAGCTACGTGGTGGTTGTCCCAAACGCCCAAGGCTCGACCAACACGGCACCTTTCCCCCCCGCCATCCACCGCTACAACCCGGAGTTCGGCCTCCTCCAGCTCACGCCCTCCAGCTTCGCCCGGATCCGCCTCCCGGACCATCCTCACCGCCACCACAACTCCTCCGTGGAGCAGATCTTCCACTTGGTGCCCCCTCCGGAAGAGCTGGCCGGCAGCCTGTGGCCCCACAGAGGCCGGCCCGCCTCCCACCACCCCTTGCCGGCCCCCCGGCCCTGGGACGGCGATTACGAGACGGACTCCCACGGGAGGGGGCACCTGCGGGCGGTCAACAACCAGTACCTGTCCCTTTGACCCAGTGCGGCGGGGGCCCCCCCACCCTGCTTTTGCCCGAGACTCTTCCTCAAAGGACATCTTCCTCTCTCTTGGCAACGTTGAATATTTGGTTTGTAAGATAAGACGGATCGCTCCCGTCGCTGCGGCTGCAGCTCTTGATTTAGGCCTGTTGAAGGGCCCGTTTGTTCCTTTTTATTATTATTTTTTTCTCAGTCAAAACATTCTTTTCTCTCTTATCGGTTTTGCACACGACCTTCCTTTTGTGTTGAGGGTTTTACGAGTACATGCAGTACTTTGCAGCGGGTTAGCGCTGGTCCCCCTTTCTCTAGCCCCGTCCTCCTTGGAGAAGACGGGCTGGGTGGGGGAATAAGAGGACAGGTCAGCCAAGCAGCGTTCGTGGCCCGTCCAGAGTTATACGGGGGCTTCCTTAGGGTTGTGTTCTACGAAATCCCTGTCGTGAAGGCTAAGGCAAACAGGCATCAGGCAGCGGCTGAAAGGGCGCCCAACAGACGCGAGCAGGAGAAAAACATCTCCAGACACTCCCGTGGGAGTTGCAGTGTGACGGCACCCGCAGGGCGCTGTGCTGGTAGCGTGGCACAGTCTGAGACGCTACGCTCGATGGACGGCCACTCTCTGGCAGGGACAGCCCTCTTCCCCCCCATCCCCAGTAGCCAGTTCCCTTGCGCCGGAAAGTGCGGGAAGCGTTCATGGAGGGCCCAAATGGGTGCAAACACCGTAGCCTGCTTTTGGTGTAAGTCCCCCTCTTACAGCCAGCTGCCTGAGGGCCACCAGCCACGCAAGGAGCAGGTCCCTGATGAACTGTTTTCTGCTTCCAGTCTTGGCAGCCTAAGTCTGGATCACTCCCGTTTACACATTTGCACCACTTATGTGCCTTAGCTGGAAAAAGGGTGGGCGAGTCCCCAAACCCTAAGCTGTTGGCTTCTCTTTTCACTCTGAAGGTAGTCGCTTGGTTTAAAATAAAGAAGGCGCCCGTT\n>XM_030133558.1 PREDICTED: Sphaeramia orbicularis signal peptidase complex subunit 3 (spcs3), mRNA 
\nGTATAGTCGACATTTCCGGTTTGAACATTAGCTAAACTAGCTAGTACAACATAGCATTGTAGTCGAACGGTTATTTGTTCTCATTGTTTTTCGGTTTTGGCAGTTTTTCACGATGAATACGGTTTTATCAAGGGCCAACTCTTTGTTTGCCTTTTCTCTGAGTGTCATGGCGGCGTTAACTTTCGGCTGTTTCATCACTACGGCTTTTAAAGACAGAAGAGTTCCTGTGGACATCCACGTCTCTAAAGTCATGCTGAAGAATGTGGATGACTTCACAGGACCCAGAGAGCGCAGTGATCTGGGTTTCATCACATTTGACCTCTCAGCTGATTTGCAGCCAATTTTTGACTGGAATGTCAAACAGCTGTTCCTCTATCTGTCTGCAGAATATGCCACAAAGAGCAATGCTCTGAACCAGGTGGTCCTGTGGGATAAGATTGTCCTACGAGGGGAAAACACCAAACTGAACCTCAGAGACATGAAATCTAAATACTTCTTTTTCGATGATGGGAATGGACTCAGGGCCAATAAGAACATCACGTTGATGCTGTCGTGGAATGTGGTCCCTAACGCTGGAATCCTGCCCCTTGTGGCTGGAAGTGGACAAATCAGCCTGCCTTTCCCTGACACATACGAGAGCACCAAGAGCTACTAGACCCAACCAGATGTCCATGCTTTCATTACACACTGTACACGCCAGAAAAACAGAAACAAGCACAGACGCCAACAGATGACTCACACATTCTGTATATTATTGTTTCTTCATAGATGTACATCAATTTTTGGTTTATAAAAAAAAAAAAATTCGGA\n>KP159845.1 Uncultured fungus clone OTU_86F_4_49 5.8S ribosomal RNA gene and internal transcribed spacer 2, partial sequence \nCGCACATTGTGCCCTCTGGTATTCCGGGGGGGCATGCCTGTTCGAGCGTCATTATAACCACTCAAGCTCTCGCTTGGTATTGGGGTTCGCGGTTTCGCGGCCCCTAAAATCAGTGGCGGTGCCTGTCGGCTCTACGCGTAGTAATACTCCTCGCGATTGAGTCCGGCAGGTCTACTTGCCAGCAACCCCTTAATTTTTTT\n>XM_014413384.2 PREDICTED: Maylandia zebra KN motif and ankyrin repeat domains 4 (kank4), transcript variant X2, mRNA 
\nTATTAAGAGAGACAGGGTCAGTAGCATTCACAGAAACAGGAAGGACAGGAGGTAAGAAGAGCTATATGGCAGGCTGTTAGCTCCTACTCTAGCAAACACAAGTAGATGACTGAGAACTCGGCCTCCCATGATGGACAAGAAAAGTGCCAATGGCTTTCAGTCCAAGGCCAGTGAGGGTGGTGTTCAAAGGAAGCAGCTGCCCTACTCAGTGGAGACTCCCTATGGCTTCCACCTGGATCTTGATTTCCTCAAGTATGTTGATGATATTGAAAAAGGCAACACAATCAAAAGGGTCCACATTCAGCGCAGGGTAAAGGGCCCACCTAAATTCAGCACTCTGCCCAGAAATTTTAGTCTTCCTGGGCATGGAGTAAGGCCTCCCCCAAAGGAAAAGGACAGTACTTGGTCTGGGACGTCTACCCTGGGTCCCAAGCCTAAATCACGAGTGACAGAGGTTCAACAGATCTTTGACTTTCGAGCAAATGAAGGCGTGATTTCCAGCCAGAGCTGCAGGGGGACCACAAGTCAAGGAACTGGCTATGTTTCAACTAAACCCAAAGATGAAGTAGGCGCGGGGGCTCGCGGTGCTGAAGACAAAACTGGGGGGATTCAGATTCAGAGTCGTCCAAATCTGCTCAGAGCATCGAGCATGCCCATCACGCTACAGCAGCGTAAGAGTTCAGATTCAAGCAGTCCTGACCGTACCGTGGGAACACCAGAAAACGGCTCAACAGAGAACATGTTCCGGGCTTCACCAGACGTAACAGAAAGACGCTGTGTTCCCCAAGATCGAGCAGGTCTTCACCAGCAGATTACTGTTGCACTGAAGCGGGTCAGAGAGCTCGAGGAACAGGTCAAAACCATCCCAGAACTGAAAGCTCAGATCTGCTCTTTGAGGGAGGAGCGGGAGCAGCTGCTTCTTCAGCTACAAGCACAAGCCAAGGCCCAGGCTTCCAAATTATCTGCTACAGTACCAACAGGTTACGATTCTAGGACAAATAATCAATCGCAAGGACAGAGACCTTCACAGGAGATGAAGTTAGTCCTAAAGACTCAACCCACTGGACGTTTAGAAGACACAAGTCTTGGGCCATCAAACCAAGCTGCAGGGAAGGAGAAACAAGGTGAGACAGAGAAAACTAACGTGTTACTATCTGAAGTGGAGAGCTCGGCACAAGGAAAAAGTAGCATGTCCTCAGCACAAGAAGTGGAGAGACAATCACTGCAGCTGGACATACTTGAAAAACAAAAAGAAACAGAGAGTCCACTGGGACAGACAGTGCAAAAACTGCCACGAGACATTTCAGGGGAGGAATTACTATCTATCACAGTGGCTTTAAAAGAAACAGAGACTGCAGCAAAAGAAGGAAAACCAAAGGATCCAGATGATATGCAGAAGTTGCAGGAGAAGCTAACAGTACTAGAGACTAAACTTATTCAGGCTAGCCAGGAGCTAGAGAGCACTAATGCTCTTTTGAAACAGCAAATAGAGGAGAACAAGCTAAAAGAGGAGAGAATACTACAACTGAGTGAGGGAACGAGAGTGGAGGTTTGCACCGCACATGAACGTCCAAGAAGAGAGAGCATTGACACAGGGACAGTGACAGAAAGGATAGATTTTACCCACCAAGAAACAGAGACAGAATCGCCTGGTACTGTAGATCAGGGGACAGACACTGAAAAAATCTGCATTGAAGTGTGCATACCAAAACAAGAGACTAAAAGTACAGATCAAGGACCAGTGACGGGAAAAGCTGACACGCATGACCAGGAGACAGAGATGGAGGCGGCGATAACAGCGACAAGTCCACCGAGGCCCAGAGCCAACAGCATGGAACGAGGCACACTAACCGAGAGCATCATCACCCTGGATCAGATGACCGAGACCCCCGTGGCCGAAAGGGTAAACCAAGTCACAGAAACAGAAGGCGAGATGGTGACGGACCATCCTCACAGACCGAGGGCCAGCAGTGTTGACAGAGGGACAGAGACAGAAAG
GGTGGGCACTGTGGACAGAGTGACAGAGACAGAGGTAGCCCAGAGAGCAGACCAGCAGACTGAGACAGAGATGGAGAGACGTCATGACAACAACCCAGCCAGAGGTGTAGAAGCAGAGAGTCAAGTGAGTGAGAACACAGGCAGCCAAAGAGACGAAGTCGTGGTGAGTGAAAGAACAGAAGACAGGGAAACATACGAAAGAATTCAAAGAGAGAGTGAACGTTTAGTTGCTGAGGTTTTATCAGAAAGCTCAGCGGCAGCTGTAGAAAGCATAAAAACTTTAGATGTTGTTAGGAAGAATGAAGAGTGCGCCAGTTCGGCTGCTAAAGCAGAAGAAAATAAGATTAAAGTGAGTTCCGAACAAGATGACTCAGAAACAAAAGAAATTACAGAAGTGGTTGAAACAAGACCAGCTGCCCTACAGAGAAGAGACCAGCTGCCCTACAGAGAAGAGACTACAGAGAAGAAAGAAACAGGAGCCGGGGAGGTTATGTCTGCAGCAGTCAAAGAAACTGTAGCCGCTGACACTGTTGCAGTAACTGAGGGGAATTCAGCTGTGAAGACAGCAGCTCCTGTAAGACCACAAAGAGGCAGGAAACCCTCAGTGGAGCAAACTCAGCCGTCACCTCCTCAACTTCAGGTGGTGCCTGTGCGTCCTCGTAGGGGATCCAGTGAAACTCAGACCCAGCCGCAGACGAAAACCCAGCCCCAGGTGCAGGAACAGAGTGCAGCTCAGCTTGAAGCTCGGTCCCCAGAACAGCTCTCTGAAACACAGGTAAAACATCAAACACCGTCTGTGCCTCAGGTTGAGGACCACACTATAGCAAAGAAACCTCCTGGAGGGTCTGGAGAGAAGCAGTCTGAATCTCGACTTCAGTCTGAGACTCAGGCCTTGTCTCCGGGCTCTAGTGAAGTCCAAGTCAGGCCTAAATCAATACAAGCGCAATCTCAAACTTCTGTACCTCGGCGGGACTCAAAAGAGCTGAAAGCACCGCAGAGGGTGTCTGGTGCATCACACACTCCTAGACGGGGATCGGGAGAAGCCCAGACCCAACCACCTCGCCAAGCGTCAAGCGATGCTCAAACTCAACCTCAGGGTTCACGTAGAAGCTCCAGTGAGGCTCAGGCCTCTCCGAAAGATGCCAGTGAGACACAGTCACTGCGCAGAGGCTCCAGTGAAGCAGCTCAGCGCCGTGGCTCCAGTGAAGCAGCTCAGCGCCGTGGCTCAAGCGAAGCCCAGGGTTCACGTCGCGACACCGGGGAGGCCCAGCCTCCTCGAAGAGGCTCCAGCGAATCACCAACATCGCCTGCAGCTTTGGGTCAAGTTGTAACTCGGATAACGGGGCTGCTAGGAGAGCAGTGGGCACATCTCGGAAGCAGCTCTGGCACTCAGCAAACAGCCAGCCAGCAGGAGAGCGCGAGCACACAGAAAAAGACGACAGGGAAAAGAGCAGAGGCTGGAAAGGCAACGTCAGCCAAGCCAGCGGGGAAAGCAGCCCCATCAGCAGCAGCGACAGGGAAACCAGCGGGGAAACCTGGTACTTCCAAAATGAGCTCCATTCAGAGCCAACTGGTCAGCTCCCTCAGTGTCCTCTCTGCCTTCTACTCCCCAAGCCAGAAAGCGGCTGCTGCCAGCAAACAGCAAGAACAAGGTCTCAAATCCATCATGAAGAAAAATGGTGGAGCAGGCAAGCAGGGGAACAAGGGAGCCAAGAAAAACCTGAAGTTTGTGGGGGTGAATGGAGGATATGAGACGACATCCAGTGAAGAGTCCAGTGGAGATGAGAAGTCAAAGGTGGAGGTAGAAGAGGAAGATAGCTCAGAACCAGAAGTGGAGAAGGAGCCTGAGAAGGAGCCTGAGAAGGAGCCTGAGAAGCAGCCAGAGGAGGGAGCAGAAGCCCAGAGAAAAGATGCAGAGGTCCCAACTGAGGGAGGAGGTGCTGTGGCTAAAGAGAAGGAGACTGAAAGAGGTCTGCTGGATCCAGAAAGTAGCCAGGAGC
TCCTGGAAGAGCAGGCTGGAGGGGGAAGAGTCGACAAGGGGTTTATAGATGCATGCCTTTATGTAAAGGACCGCATGGAGGAGGTTTCATCCCCAGATAAAGAAATGCGCCAGGTTTTAGTGGTGCTCTACCAGGAGTGGTTCAGAGTCTCCAGTCAAAAGGACTCGCAGGCAGATACTGTCAGATTATACCTGCGACAAGTGGGGATGACCACACCCACTCTCCTGCCATATGTTGTTAACTTGACAGACGGCAATGGGAATATGGCTCTTCACTACAGCGTGTCACACTCCAACTTCCCTGTGGTCAAACTGCTGCTGGATACCGGCCTGTGCGAAACAGACAATCTCAATAAGGCAGGCTATACTCCAGTGATGCTGGCTGCTCTGACGGCTGCTGAGAGCCCCGATGATCTTGAAGTGGCACAGCAACTGTTGAAAGTGGGAGATGTCAACGCACGCTCCAGACAGGCGGGCCAGACAGCACTCATGCTTGCGGTGAGCCATGGCCGCGTTGCCATGGTGAAGCTGCTCCTGAGCTGCGGCGCGGATGTAAATGCCCAGGACCGCGAGGGCTCGACGGCCCTGATGTGTGCCAGCGAGCACGGGCACACGCACATCGCTCGCCTGCTGCTGGAGACAGGTCGCTGTGATACCAGCCTCAAAGATAAGAACAGTTCTCCACAGTCGCTGTCCACATGGGTCAGTGGGACCAAGAAGCACTCTGCTAATGTGTGGACTCTGACCAGCAACATCCAGCAGGACCCAGACAGCGTTTTCTATCTCCCAGCTGGAGTTTTTGTTTGTCTGTGACTGGAGAGTCAGATTTTTGTTGAGCTTCACACTTGCAGACCTAAGTCAGTTTGCAGAG\n>XM_013897292.1 Thecamonas trahens ATCC 50062 hypothetical protein partial mRNA \nATGGCCGACGAACCTTCACCAAATCAGCCCGTGCCGCCCTGGGCCGATGCCGATCTCTCGCGATGCCTGCCGACGCTCGCCGCCGGCGGTGAGCGTCAGGATATGGAGTTCAAGGAACGCTTTCCCGGCCAGGCACGCGATCTCGCCAAGGAGATTGCGGCCTTCGCCACCTCCAATTTCGGCACGATCCTGCTCGGCGTCTCCAAGGCGGGCGGGGTGATCGGCCTCGCGGATTGCGAAAGCGCGTCCGAGCGGGAACGCCTGCTCGACCGCGTCGCGGGCATCTGTGCGAACAGCATCAAACCGTCGGTGACGCCGGCGCTCGCGTTCGCCGTGGTCGAAGACCGCACCGTGCTCGCCATCGCCGTGCCGAAGGGCGATGCGCCGCTCTACTACGTCGCCGGAGTGCCGTACCTCCGCCAGATGGCTACCTCGCGGCCGGCTGAGCCGCACGAGGTGATCGACCGGGTTCTCGATTGGGACCGGGCGAGAAACGGCAGCGGCCGGCCGAGCCCGGAATCCGAGTTCTTGAGCCAGACCGCGTCGCTCGTCGTCGATGTCGTCGTATACGCCGACGAACTCGAAGAACGTCGCGTCAAGCCGTGGCTCAACGAGACACGCCACGGACTCGCATGGGCGGCCGAAACGGCGCGCGACCTCGCGGCCCGGACGCCGGGAGACTTCGCGGAGATGGTCGAGCCGTTGGAGGAGATGGCGAGCAATCTCGACCGTGCTGCACACGAACGTCTCTCCATGGGCGGCGGCTGGGACGAGATGGACGCGGCGGCGCGGGCGGCAAGGGAGACGGCACGGAGCATCTGGACACGCTGGATCGAGCCGCACGGCTTCCATGCTGACTCGGTCGCCGGCGTGCGGGAGACGGTCTCGGAAAACGCGCGAAAGCTCGCGAGCCTCGCGGCGCGGCTCCAGGAAATGGACGATCAGGGACGGCTCGACGGCATCCAGTCGTCGGCCGGAGAGATCGGACTGGTGCTGCTCAAGGCCGCAACCTTCGGCGTCGGGCTCGGGGACGATCAGCGGATCGA
GGAGTTGACAGCGATCGGCCGCGCCTTGCGCGACGTGGAGACCCGGACGATCTACGCCGACGGCGGCCAGTCAGCCCGGAGAATACTCGACGACGTCCGTGACGCGAGCGCGAGGCTGAACGCTTGGCTCGCCGGCCTTCCGTCTGAAGCGGAAGCGGGAGCATGA\n>LN881636.1 Terribacillus sp. 1011TES3C6,21 partial 16S rRNA gene, isolate 1011TES3C6,21 \nGGGAAATGGCGCGTGTCTATACATGCAAGTCGAGCGCAGGAAACAGATGACCCCTTCGGGGTGATTCTGGTGGAATGAGCGGCGGACGGGTGAGTAACACGTGGGCAACCTGCCTGTAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAGTATTTCCTTTCTCCTGATTGGAAATGGAAAGACGGTTTCGGCTGTCACTTACAGATGGGCCCGCGGTGCATTAGCTAGTTGGTGGGGTAATGGCCCACCAAGGCGACGATGCATAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGCGATGAAGGCCTTCGGGTCGTAAAGCTCTGTTGTTAGGGAAGAACAAGTACGAGAGTAACTGCTCGTACCTTGACGGTACCTAACCAGAAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCACAGCTCAACTGTGGAGGGTCATTGGAAACTGGGGAACTTGAGTGCAGAAGAGGAGAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGATATGTGGAGGAACACCAGTGGCGAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAGGTGTTAGGGGGTTTCCGCCCCTTAGTGCTGAAGTTAACGCATTAAGCACTCCGCCTGGGGAGTACGGCCGCAAGGCTGAAACTCAAAAGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCGCTGACAATCTTGGAGACAAGACGTTCCCTTCGGGGACAGCGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGATTCTAGTTGCCAGCATTAAGTTGGGCACTCTAAAGTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGGATGACGTCAAATCATCATGGCCCCTTAT\n>XM_022540745.1 Aspergillus glaucus CBS 516.65 hypothetical protein (ASPGLDRAFT_127844), partial mRNA 
\nATGATTCCAACTCTGCTGTTCTCAGGTTTCTTTTTCGCCAATGCCTTTGCCATTCCCCTTGCAGGCCACGAGCAGCAGCAGCAGCAGCAGCAGCCATTGGGTAATGGGGTCTCTTCCTCCACGGCGCATAGCGCTGGAGGGGCGCAGAGGCTGACTGGGCGATTCCTGCATATCACTGATCCTCATCCTGATTCGCACTATAAACAAGGAGCGTCGGCCGACAATAATTGCCATCGAGGCCATGGATCTGCTGGATACTTTGGAGCGGACGGAACCGATTGCGATGCCCCGATCACCCTGATGAATGCGACTTTCCGATGGATCGAGCGAAATTTAAAGGGGAATATCGACTTCGTGCTCTGGACCGGCGACTCCGCCCGCCACGACAGGGATGAAAAGATGCCGCGGAAAATGGAAGAAATCATCCACCTGAATGAAATCTTGTCCCAGCAATTCATCGATGTTTTCCAGGACTCCATCCCCGTCGTTCCGACATTTGGCAACAACGATATCATGCCGCATAACACCATGAAAGAGGGACCGAACCGCTGGACGAAGACTTTTGTGGATGTTTGGGGCAAATTTATCCCGGAGGCTGAGCGCCATAGTTTTGTGGAGGGTGGCTGGTTCACGAGCGAAGTGATTCCTGGCAAATTATCAGCCATCAGTCTCAACACCATGTACTTCTACAGCTCCAACTCCGCCGTGGATGGATGCGACGACAAGGATGAGCCGGGATACGAGCATATGGAGTGGCTCAGAGTTCAACTGAAACTGCTTCGCCAGCGCAATATGAAGGCCATCCTGATTGGACATGTACCTCCGGCCCGGGCAGGCCCGAAACAAGGATGGGATGAAACGTGCTGGCAGAAATACACCCTGTGGTTGCATCAATATCGAGATGTCATCGTTGGGAGCGTCTATGGACATATGAATATCGACCACTTTATGTTCCAGGACAGCCACGATATCGACATCGTCGATTTGGAAGGTGACAACACGGGATCTAATGATTTCTCTGTCCAATCCATGGAAGACTATCTCGAGGCCCTTCGGGGCCAATGGTCCGATATGCCATCCCCGCCATCTGGTCTTTCAATTGAGGAATGCTTGGATGAAGACTTTGCGGAGACTGATGGCAATGCGCCTTGGACGGACATATCCAAGAAGAGAAAGAAGAAGAAGTTCCTGAGAAAGATCGGTGGCCCTCTGGCCGAAAGATATAGTGTCTCTTTGGTGTCGCCCAGTTTGGTGCCAGAATACTTTCCTACGCTCCGGGTGATTGAGTACAACATTACTGGCTTGGAAGATATGCCAACTTGGTCTGATATTCAAGAAAACACACAGATCTCATATCCCAACGACGATGACACACCGTCCGTTTTGGAATCCGAAGACTCTCCGATGATGAACAATGACAAGAAAAACAAGAAGAAGCCAAAATTCAAAGTACCAGAACCCCCACCGTCTTCTGCTCTTCCGGGCCCTGGCTACTCGAACCAGCAGTTGTCCTGGCTCGGATATACGCAGTACTACGCCAACCTAACGAGGATCAACGAGGAAGTGGCTTTGCACGAATCGACGCACCAAGACGGAACCGGGAATAACGTCAATGCTACCAGCGTTGATGATGTATTTGGCTTTGAGGTCGAGTACGATACTCGTAACGACCATATCTACAAAATGAAGGATCTTACAGTCCGCAGCTACTTCGATCTAGCCAGTCGGATTGCGAACAACATTCCGAATACCCTGGAATCACCTGATGACACGAACGACGACGGTTATGATAGCCAGAAGAAGAAGAAAAAGAAGAAGGGGAAAAAGAAGAAGGGGAAAAAGAAGAAGAATAAGAACAGGACATGGAAGACCTTTTTTGATCGGGCGTTCGTCGGGTACCTGGACATCAATGATCTTGAAGAGACAGAATCATGA\n>KX654414.1 Uncultured bacterium clone OTU 2009 16S 
ribosomal RNA gene, partial sequence \nGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGAATGATGAAGGCCTTAGGGTTGTAAAGTTCTTTTGTCAGGGAAGATGATGACGGTACCTGAAGAATAAGCACCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGTGCTAGCGTTGTTCGGAATCACTGGGCGTAAAGCGCGCGTAGGCGGCTTTCCAAGTCAGAGGTGAAATCCCTGGGCTCAACCCAGGAACTGCCTTTGAAACTGTAAAGCTGGAGTGTCGGAGGGGATGGCGGAATTGCTAATGTAGAGGTGAAATTCGTAGATATTAGCAGGAACACCGGTGGCGAAGGCGGCCATCCGGACGACAACTGACGCTGAGGCGCGAAAGCGTGGGGATCAAAC\n>XR_002806955.1 PREDICTED: Equus caballus NK6 homeobox 1 (NKX6-1), transcript variant X2, misc_RNA \nACAAAGGCTTTGGGGTCTCCCGGGCCTGCAAACTGTTGATGAACAAAAGGAATCAAGCCCCCGCCTTTGAAATTAGGTTAATCTAGATAGTAGAATGTGCTGGGGGAACTCGCCATTATTAGAGAATAAAAGCCTTACCAAAATATCAGCCCTGAGGATAGATCAGGCCAGTTAGATAGCTTCCATTTATTCTATTTGTAAAGATATTCAAGCTTTTGTTTATCAATTCAGGCCCCACTAGTTATATAAGTTCCTAATGTGTATCAGCATTATAGTGCTACTATATTAACTTGCAGGGTAAAAAAAAAAAAAAAAAAATCCAAGGATCTAAACACTTAGCACGGACGAATCTATCTGCTTTTAGCTTAGCAGAAAGCAGTCACTTTGGAATAGTAATTTTCCAAATGAATTGACAAGATTATTACTATATTATGAAATTGAATTCTGTTTAAAATAAGTTTATCCACAGATGTAAGATATTTTACTGTTTGTGACAATTTATAATTAAAATGTCACTTAGCTTATAATTGACTTGTACAGTGTATTTCCAGGGAATCAAATTTGAGAAATCTTTCCTTGGAAAATAAAGGGATTGAGCCAGCTAGGCAAATTAAATCCACAGTTTCCTGTATTTCCAGTATTCCCTTTTGTTCCTCTTCTTCAGTTTATTATATTTGGGGGTTTTTTTGGGGGGAGGCAAGTGTATTTTCATTAGTTATATTGTTGCTCTTTAAATTAAGTAGGAATAACATTAGCCATGTCTGCTGGTTAGAGTGTATTTCTCCCTGGACAAGCATCATAAAATGCATTTCAGGAGTGATTTTGTATGTGACCATTAGAATACCATCACAGTTAAAATTATTTTTGCAGTGGTTGGTACAGAGCCTACCACAGTAATCTAGAGGTCTTCATTTGTCACCATAAATATGTCTGCATGGCTAGAAGTGAATTATTATAGCTGTATAAAGAAAATAAAAATCACTTTCTTAATTCCGATTCTCTAGGTAAAATACATAACGGATGAGAAAATGGATGAGAAGCATAAAGACAAGATAATTCAATATATTTGGGAAATTGCTTGCTTATTCCTGATGCTTTAGGTTGCAATATGTGTATCAAACACAGTGTCAAACATCGTGAATAGGCCTAAAGTATTTGTATATAAAAAGATTGTCTTGGGGAGAAACAATATTAAAATAATATTTGAAAGACCTGGCATGTTAATAGTGGGAAATAATGTAATGGTAATAATGGGGAAAAATGTAATTGGCAAAATTACGCTTTTAAAAAATAACTGATGAAAATTTTAGCCTTGACTTTGATTTTATGAAAATCATTAAACCCGAGAGACAGAGATTGAGAGAGAGAAAGAGAAACCACTGTGATGATTTTGACTGAGCTATTAAATATTTTCATGCGTTTATGTTGGTTAGCATTAGTGATTTGAGGTTTCTGTTC
AGCAGATTTTTTTAACTTTACATCATACACTGCAAGTGTAAATAGGGTGGGGAGTGTTTTCCTACCATGTTTGTGTGTATTCAGACCGGGAGAAGTGTAACAGGCAAATATCCAAAAGCGAAAAGGAGAGCAGAGGTAATTGGGGGAAATGCTGTGCCTTCTCCCACAAATCACACAAAACAGCAAGTACGCTTCAGGTTGTTTGAAATATCTTAATCTGAGAAAGAAAATAACGAATACAGTCACAGTCATCATGGGGCAACTTTACGAAGGGGAAAAGTTTTCTACTTCAAACTGGAAAGTAGGAAAGCGGACTCATTTTTAGGGAGACTCATTTTAAGTTTCCAAGTTTTTTCTCTTCTGAGAAATCGCTCTCTGACAACCTCAATACTCTTGTGTTACCATCGCTATGGCAACGGCAGTTTGTTGGTGCCTGTTACTCGGAGGAACCTGGGGCGACGGAGACTGACTTTGACGGCCCAGACAAGGAGGTCTGGTTCCAGAACCGCCGGACCAAGTGGAGGAAGAAGCACGCGGCCGAGATGGCCACCGCCAAGAAGAAGCAGGACTCGGAGACCGAGCGGCTCAAGGGGGCCTCGGAGAACGAGGAGGAGGACGACGACTACAACAAGC\n>XM_006965968.1 Trichoderma reesei QM6a uncharacterized protein (TRIREDRAFT_108278), partial mRNA \nATGGACGAGCAAGAACAAGACAACCTCATCCAAACCCTCACAACCCAAAACGCCTCCCAAAACAAATCCACAGCACGCACCCTCCTCCTCCTCCCCCTTCTCTCAACAATAGCCTACATCCGCCCGCTCTTCGACCCCGCGACCGCTTCCTTTGCGATATTCTGTCTCACGTCCCTCCTCGCTACCGCGTTCCTCTTGTACCGCCTTCCGCCGACCGAGACGGGTATAATCATCGTCGATGACTGGGCGCACAGACGAACTGCTTCTTCTTCTTCTTCTTCGTCGTCGTCTGTCAATGCTTCTCTACGACAGCATAATCAGTCGCTGAGGGGCCTTTTGGGAAGGGCGCAGGTGGAATGGCGGTCTCCCTTGGAGAGGACGCTGCCGTATCTGAATCTCGGTTTGGTTGTGCTCTTGAGTCTCATGGGGCTGGTAAGGGGCGACCATCGAGCAGGTGGCTTTGGGTGGGTGAGCATGGGCAACGTACCAGGCCTGGTTTACTCTGTCGCCATCACGGCAAAAGTCGTCATGGCGGGCGTTGACCCCGAAAGGGAGCTGTCGGGCCTCAAGTACGGCTACAAAGGCGCTTGA\n>XM_008866548.1 Aphanomyces invadans hypothetical protein mRNA 
\nCGTCCATTCCGCGTGAAGTCGGTTGCCGCCCGCGCGAAGGAACAACTGGCGACGCATCCCCCAAACAGGAACAGGTGATGAGGAAGCAGCAACGTGGAGGTGGAGACGGTGACTACGGATCCAGTCGCGGCCTGGAGCGTCAGAAGCAGCTCTGCGATGAAGGCATGGCGCTGGTGAACGAAAGCGTCGGCATTCAAAACTCGGGGGGAGACACGGACCTGGCTGAGCGCAATTTGAACCGCGCTGTCGAGATATTTGAGACGGCTCTGGCAATTCAATACAGCACACAAGAAGAACAGGAAGCGGCCACTCGTCTGAACAACAAGATGCTTCGCTATGTCAAAATGATCAAGACTCAAAAAGCCAAGAACCCCGCGATCGGCGGCAACAAGCGCACCGCGTCCAAGTATAACATTCTCGAACTCGACAATCTCCCGCAGATTTATCATTCCATTGCGGGCAAACTGTTCAACTCGCAAGTTGGTGACGTGTTTGAATCGCTCAAAACGACTTTTGGTTTCCAGGACAACAACGTGCTCAACCAAAAAGAGCATGTCCTCTTGCTCTTGACAAACTACAAAGAGCAGCTGGACGTTCCAGACCCCAAGGCACCGGCGAACCAGCCCGTCCCCGCTCGCGACCAGCAAAGGGAGATGCAGTTGGCAGACAAAGCTGTCACCAAGTTCCATGCCAAATTGTTTGACAATTACAAAAAGTGGTGCAAGTATATTGGCCAAAAGCCCAAATTTACTCGGGACAACTTGACTGATATCGTGCTCTTCTTCCTCATTTGGGGGGAAGCTGGCAACTTTCGACAGACACCGGAATTGCTTTGCTTTTTGTTTCACAATCTCGCTCCGGCGTCGCAATCGGGCGGTTCGAAGGAGTCAGGAGACTTTTTGGCATCGGTGATCCGCCCCATGTACAACGAACTGAAAAAGGACAACGACAAGAAGACTTCCAAGGGCCAGCGCGCCCCGCACAATGAAATTCGCAACTACGACGACTTTAATGAGTTCTTTTGGACGAAAAAGTGCCTCAAGTACAACGCGTACACGATCGGGGAAGCGTTTGCAAGCGCCGACAAGAAGGGCAATCCGAAGGTCGTGAAGAAGACGTTCATCGAGAAGCGAACTTGGTTCCGTGCCCTAACGTCATTCCGCCGTATTTTCCTCTTCAACTTTGCACTGTTTTTGGCCACGGTTGGGTTTGCTATCAACATGATCACGCTGTGCCCGGACAGTCCGATCATGTATGGCCCTGACCTGGGCAAGATTGAAGTGTTCGGGAAAAAGTACTACGACAGCGTCACCTACACCACGCCGTTGACGGACACCGAAACTACCGCCCTGACGGCAGTCGAAGTTGACAGCACTCAAAAACTTTGCAACCCCGCGAAGTTGGCGACTTGCTTGGGAGTTGGAACCTATGTCCGAGGCGAGACGTTTGCGCACTATCCCCGCGACTTCAAGGAATTGATGAGTCAAATTCCTTTTCAGGACTGCATTGAAAGGCAAAGCGGCCGTTGCACGTGCTACATTGATCTGATCGAGAAGTGCTTTTCTCAAACTGGAAATGCAACCGTATACCCTGATGGCGGTTTGAAGAGCATTCCGGTCCAGTACGATCAAAAGTTGTGCGATCTGGTGTACAAGAAGACTGCCTTGGCCATCTTGAACAACAACACAGACGGAAGACTCAACTGCGACATGTGTCGTTTGGAGCCGCAGAGTTTGTTAAAGTCGTTGCCCAAACTGATCGGTTCATTTATCGATTTCAACCGATTCACCAAGAAACGCGACTTTGGTCCGCTGTTTTTCTTGGGTGGGGTGGGGTGTTTGGTCCTGGTGTTTGCGTGCGAGCTCCTCGGTCGAATGATATCGGGTGTCGGCGTCGGATATGTCGGTCGGTCGCTGCCAGTCCCATTTGGCGCGTATTGCCGGTACACGTGCTTTTGGCTCTTTTTGTTTGCTTGCAAACTCACGTTTGACTACCAAT
TCATGGTCAAGAACTTGGTGGAAACGACCGTGTTCATTTGGTCGACGGACGCAAAGTTGCACCACCCGACGACCCAGTTCCTCATCAGCTTCAGCTTCCACAACATTTTGTACATTGCTTTCTTGTGGATTCCGGCCATCACGGTGTTCCTGTACGACGCCCAGATCTTTTACGCACTCTTGTCGGTCATCTTTGGGTCGGTCCGCGGGTTCAACTTGCGCATTGGCGAGCTCCGATCGTTTCGCATTCTTCGGTTGACGTTTAAGTCGATCCCAAAAGTCTTCAACAAGAAGCTCGTGTCCAACTTGATTGAACGTGGCGGCAAGAAGAAAGGCAAGAAGGACAAATCGAAGAAGGGGTCCAAGGACGATCCTGCTCCGGAACGTCGATTCCAGCGCGTCTCGTACTCGGAAGGGAGCAAGCCATTGACCGGCACGGCCAAAGGTTTCAGTTCACTGTTGGAAAACGACGGATACAACGAGCTGCGAACCCCCGGTGGTGTCGATGCGGACTCGAGTACTGGACGCAATTCCAACATCACGTCCATCACCGGTGTTTCTGGGGCTGAATTTGAGCGCACGATTCCATTCGCCATGGCTTGGAACCGCTGTCTCGCTAGTATGCGCGAAGCGGATGTGTTGAGCGACCGCGAACTGAACGTACTAAGCTACTTGATCGACTCGAAAGACGTGGCGGAGCGACGTCTGTACCCGCCAGCTTTTTTGACGGCTGGCAAGTTAGACGAGTCCATCGACATCATTATTGAAAGCTACACGTTGCACGACAAGCTCAAGTCGGACAAAAAGAAGGACAAGACTCTGCAAAAGGTTGAAGTGTCGATGCGCGAACGATTGACCAAGGACGATCTGCGCGTGGAAGCCATTTTGGGCTCGTACAAGTTTTCGTCACAAGTGATTAAGTTATTGCTTGGCGACGAACACAAAGAGTTGGAAGCGTGTTTCAGCTTCATGGAGGAGATGGCAACCAACAAGACGACGTTGAAAGGTCTCAACTTCAGCAACTTGTACCAGGCTCGTTCGTCGTGTGCGGATTTGATGAAGTCGATTTTGGAAGTGCCCAAAGGCGCCCAGGAAGGCAGCATCAAGTTTTTGCGCTCGTTGTACCACGTTATCGACAACGTCGAAGCTGTCATGGGGTGCCTGAAGAAGGTCCTCTCGAAGCAAGAACACTTGGTCAAAATTTTGAACGACACGCCATTGAAGCCCAACTCATTCTTTTTCCCTGGCGACGCACAACACTATGCGAGTTCGCAACTCCAGCGCATCGTGAACGATCAAACGGCGATTGACATTGTGTCTCGGGCGTACCAGCTCCTTACGGTGGACAACTTCGATGCCGAGCCTCGATCTGAGGAAGGGCAGCGCCGTCTACGCTTTTTCACCAACTCGCTGTTCATGGAAATGCCTGAAGCCAAACCTGTGAGTCAGATGCACTCGTTTTCGATTTCGACGCCGTATTTCAACGAAATCGTGTTGTACTCGGTGAAAGAGCTGACTGCTGAAAATGACGACTCGATCAAGCTGCTGTACTACTTGCAAACAATCGATCCGTTCGAGTGGGAGAACTTTTTGGAACGCATCAACGTCAAGGATATGAACGAAGCCTTGAAAAAGTACCCGGAAGAAGTGCAGCTATGGGCGTCCTACCGCGGCCAAACGCTAGCCCGTACAGTTCGGGGAATGATGTACAACGAAGAAGCCATTCGGTTCTTGTACTGGTTGGAAATCGGCGAAAACGAACCCATGCATTTGCACGGATGCTCATGCAATCGGTGTATCAAGTTGGACGAAATGGTCGCGCTCAAGTTCAACTATATCTGCTCGTGCCAGATCTATGGCAAACACAAGGACGAACAGCGCCAACAAGCGCAAGACATTGACTACCTGCTCATGAAGCATCCTGGTCTTCGTGTTGCATACGTTGATGGCCCCAAGAAGGTCAAGGATGGGCCACCCAAGTACTTTTCCGTGCTCATTCGC
GGAATCGGCGACAAGATCGTCGAGGTATACCGCGTCGAGTTACCGGGGGATCCCATCATCGGTGAAGGGAAGCCCGAGAACCAGAATCACGCGATCATTTTCACACGGGGGGAAATGCTCCAGTGTATTGATATGAACCAAGACGGGTACCTAGAAGAGTGTTTGAAGATGCCCAACTTGCTCGCTACGGTGGACCGCAAGGAGCACTCGAAGAACCCGTTGACGATTATTGGTTTTCGGGAATACGTGTTCACTGGTGCCGTGTCCAACTTGGCGAGTTTCATGCAAATCCAAGAACTGTCGTTTGTGTCGCTGGGTCAACGCATGCTCGCCCTGTTCCACGTCCGACAACACTATGGCCATCCAGACGTGTTTGACAAGATGTTTGCCATGACAACGGGGGGAACTGCCAAGCCTTCGAAAGGCATCAACTTGTCGGAAGATATTTTCGCCGGGTTCAACACGACGCTGCGCGGTGGTCGTGTGTCCCACGAAGAGTTCATTCAAGTGGGCAAAGGTCGTGATGTCGGCATGCAACAATTGGCGTTGTTTGAGGCCAAGTTGTCGTCTGGTGCCGGGGAGTGTGTCATTTCTCGCGATGCGTCCCGAATGGGCAGCCGCCTCGACTTTTGGCGCCTCAACTCTTGGTTTTATGGCAACCTGGGGTGGTACTTCACGCAAACGATGACCGTGTTCGGCATTTACGCGTTTATCTACGGCAAGATCTACTTTGCGTTGAGTGGCCTTGACTCATTTTTCCTCAAATCCGGTCGTCTTGGGATCAGTGGAGTCCTCAACACGTCATGGGCATTGCAGTTTGGTTTCCTCCTCGTCGTGCCTGTCATTGCCGTCGTGGGTGTCGAGCGCGGTTTCCGTCACGGGTTCTCGTACTTGGTGTGGAACGTGTTGACGCTTGGCCCGCTCTTCTTTACGTTCCAAATGGGCAACCGCATGAACTATTTTGATCGGACGTTGATCCATGGCGGCGCCAAGTACCGCGCAACCGGGCGTGGGTTTACCATCAAGCACGAAAAGTTTGCCGAACTGTTTCGATTTTACGCGTTCAGCCACTTTTACCGCGGCGTCGAGTTGGTGTTTTTGCTCATCCTGTTTTCAGCATACGGGACGTTTTCATGGTGCAACTGCTCTTGGCGTGTCGACCAGCTCTTTTACAACAACATTGAGCCACTGCAGTATGAATGGGACAAGCGATGTTATGCCAACTTTTACCAGATCTGCGTGTTGCCAACGAACCAAAACTACGGCATTATGAGTTTCTCGCTGTGGATTATTGCTGGCACTTGGCTGTGGGCGCCGTTCTTCTTCAACCCGAGCGGCCTGGATTGGGACAAGTGCATTGACGACTATAACGACTGGCAAAACTGGCTGCAGACCAAGAACGACTCGTCGGAGAGTTGGTTTGGGTGGTGGTCGAACGAACTCGAATACTTGGAGCACTCTAGCGTGAGTGCGCGCGTCGTCCAGTTTTTGCGCAAGTGCCGTTTCTTGTTTGTTGCGGTTGGCATTTATCTGCAGCTCATGTATCGCTTGTTTTACAAGGACCAGAACAAGGTGATCGTGTTCGACTTCCAAAGGAACTTCATTGAGTCCCTCAAGCCATTCATCATTGTCGGTGCATTGGTGGTGGTCATGCTGCTCTTGATTTGCTGTGGGTACTGCGCGAGTCGGTTTTCGAAGCGCAGTCAAATGAAGCAGAAGAAGTTGCGCAAGATCAAGTTCAACGTGAGCTTCTTCATCATGGTGCTCGTGCTGTTCTCGCTGCTGTACTTGACCATTTTGCAGCTCGTCGAGGTGTTTTTGATTGTTGTGCTGGCCGTGTACTGGTTTGTCCAGTTTGCCATCGTGCGCCTCAAGTCGAACCATGTCGTGATCCTTGCAATGGCCAAGAGCTTTGACCGGGCCGTGGGCTGGATCGTGTTTGGTCCAATTTTGTTTATCGCCATGTTTATGCCGTTCATTTCGTCGTTCCAGCAACGCGT
GATGTTCAACAGCGCATTTACGTCGGGACTGGAGGTGTCCAAGCTCTTTTCCCACGACGTCATGCCGTCGCACACGGTCAAGACCAAACGCTCCAAGAAGAAGAAGCGCGACGAGTAATTGCGATTTTTGTATACCAAAGAATACATTTATAAATTCGTCGCCATTTTGGCCATTGTTGCCACAGTGGTCATTCGTTTCCAGTGACGAAATTCGGGTTTCATTCGAATTAAAAAAAAAACAAATTCGATTTTTCC\n>XM_050630547.1 PREDICTED: Bombus huntii uncharacterized LOC126871580 (LOC126871580), mRNA \nTGAAGATCTTATTATATTGTACATAGAGAATGAAGTGGATAGTTTTTGGTATCACATTAGTAATACGCAATTATATAATATCCTGTCAGGATATTGTATTTCCAAATAATGAAGAGATATCTCACGTGAGCGGCAATGCGGCGATAACAGAACGTATTCCAGTGGCTGCACCAAATATATGTCCCAAAGGCATGCTTCTTTATCCTGGAGCTGGAAGTAAAAGTACATGGGTATGCGATTGTAGACCTAGATTTCTATATTTTCCATTGAATGATAGTTGTCATGAAGCATATAGACAAGGACCTTGTGCACCACAGAATTATGTTGTACTTCCTAAGGATGAAGTTATACCAAAGTGTGTGAAAAATCCTTGCCTGGAAGACGGCTTAGTACAATATAATAATACATGTTATCCTCTAAGAACTACAGGTGGTCCTTGTGCCCCTAATGGAGTAATAGGAGTGAATGAAACTACATTTGACTTAGAATGTATGTCAACAGATATTGCACCATTCATAATTATTGATCCACCTTTAAGAAAGTGTCCCGTGGGAAGCCGTAGGAATGTACTTGGAATATGTAGAGTAATTTTAACCTAATATGTTTCTATTTAACAAATTTCTGTTTTTTTAATAACCTGGTATTTATTTGTTTGGCCTCTTTCATATAATAAATATCAATATATTATTATAATTCTGATATATTACGAGAATATATATAACATTTATATTTACAAAATATAGTTCTTATTACATTTA\n>XM_020521000.2 PREDICTED: Rhincodon typus raftlin family member 2 (rftn2), transcript variant X1, mRNA 
\nGTCTACAACCATTTTGGAACTTTCTACTTCAGAGTTTCCATCTGCTGTTTGGACAGCCATCTGACTGCGCCCAGAGCACTTCTTCACATCGCAGATTCTGCCATGGGTTGTGGGCTACGAAAGCTGGAAGAGCCTGATGATAGTAGCCCTGGCAAAATATTTTCTACTCTGAAGAGACCACAAGTGGAAACAAAGATTGATATTTCATATGAATACCTTTTGCTGGATTTTACTTTAGATATTGGTTCAGCAAACCCAGATGTTATTAAGATCTCCTCTCTTCTGGATCTTAATTCCAAATTGGAAGCATACTACAAGAGAGGATATGTTGTTGTCACTATCCACCCTACAGTTCTTTCTATGGGGCAAAGAAAACGATCTCCACTGAGTTACATTTATAGAGTTATATTAACTAAAGTAAGATCAGGTATAAAGACGTCAGAACAAGGAGAACCAAGACACTTAAAGCTAGTTGTTGAAGAATGGTCTGTGAGCAATCAAACACTTACCATTGATGTTGTAAAAGGACTGTTAGAAAAGGTGAATGACTTAACTAAGAAAGGAATGAGGTTTGTCGGATTTTTAAATCCACTCAGTACCCATTCAAAGGCCTGCAATGGTACAAAATCATCAAGAGAACTAGATGCAGATTTGGGACAGGATGTTGACCTTAAATTGCCAGATCAACAAAAGCAAAACCCCGATAACCATATAAAGTGCAGTGAGGAGACTTTTACCAAAAAGCCAATGGAATTTGCAACAGAAAGAGAACACTGTTGCAGTAAAGTCACTGATGTTTTAGAGAATAGACCAGCTCCAGAGGAGGATCTTTTGCATGGAAGAGAGAAAAGGATTGGAAACGAAACCTGTCCTTGCAGTGAACCAAAGGAAGATTTCAAACTGTTTGCTGTGTTCAATGTGTCGGATGAAGACTTCAGTGAACGGTCCTACCATGAAGGCAATATATCACTCAGAGTAACAAGGAAGGGCCAAACCATTTGTACCCTGGAGGCAGATTGGTTGGAAATCACAACATCTTATTATAAAAGTGGGATGTCGTTGGTTGATTCATTCATAGTTTGGGAAACAATGAAAGGAGACTACTTGTCCAAGTCTGTGGATGGAATATTTATTTATGAGGAACATCATTTGGGGGCTTTTGAGTCAAGCAAGATACCAAATGATGCAATTGTTGTTGAACAGTGGACTGTCATTGAGGGTTGTGAAGTAAAGACTGATTATGGTCCTTTGCTGCATACACTGGCAGAGTTTGGATGGCTGGTTACTTGTGTGCTGGCCACACCTATCATTCGCCATGACAGTGAAGGAAATTTAGCAACAAAACAAGTGATATTCTTGCAGAGACCTGCCATAACCAACAATGATCTAAGTCTAAAACCATTAGAGAAAAGATCTACTCGGCAAGCAAGTGAAAGAACCAAAAATTGGAACAGAAATGTGGGTGTGACCACCGGTAAAAACAAGCATTCAGAAACAAAGTCTCCTGAAGATTCTTGCACCACTTCAGAAATCAATTCACATCAATATGGAGGCATTTCAGGCATGAGTCATATTGATAGTGTTTCCAAAGACTTGGATGATGGGCAGCTGGATCAAGAGGAAGAAACAACTCAGGTTACCTGCATATAACATTGCAGAATTCAGATCTGTATTGAAGACAACAGTTTAAAGAAAGCAGACTTTCCAGAGTATAATATGATTGATAATAGCTAATGGCTTTGCAAGATGTGATTTTTGTTTTTGTTCTGTATGAAAGTGTGCTCTTTTTTAAACATTTTCTATAATCCTACAGGGAATAAAAGTATTAACAAATATTTCAGTTCTCGGGATTTATGCAAACAGATCCAGGCTTCTTTAGCAAAGTAGAACTGTTGATTACAATTTGCTATCAGAAAGAGCTTCACCTGATGATTTAAAATTACGTTCAACAAATTTAGGAAAGCCATAGCAAAGCATATTTACAGATGTTTATATTTA
CTTTTAAATTCTCAAGTAATATTTTTGTTACTTTTTCTATTTGTATGTGCTAATTTTTAAAAATCATTTGTTACTTTTTTCCTGTCATTTTTCTTTGCATATTCTTGGGATCATGTTTTGCAATCAACTTGTTCAAGAATATGCTCATGCAAAACAGTGCTGTCTCTGCAAGATCGAAAGGAGTCATTTTTGAGGATTGTTCAGTCAAGGTAACGTTAGTTGTCCTGCTAAGTAATATATGTATGGCAATGAACTG\n>XM_047696666.1 PREDICTED: Lutra lutra methyl-CpG binding domain protein 1 (LOC125081859), transcript variant X5, mRNA \nCCAGCGGGTTTCCGGTTCCGGGAGCAACGAACGGCCGCGGCAGCGACAGCTACCGCTTCAGAGGAAGCGTCTGCGGAGGAGGAAGAAGAGCAGGGCAAGGCGGGAGTCACAGGCGGGACCCTCGCCATGGGTCCGCGGACCTAGAGCGGCGGAAGCTACCGGCCTGGTGCCGAGCTGGCCGCTGCTCCTTCCCGTGGCTTCCATGGCTGAGGACTGGCTGGAGTGCCCAGCCTTGGGCCCTGGCTGGAAACGCCGTGAGGTCTTTCGAAAGTCAGGTGCCACCTGTGGACGCTCAGACACCTATTACCAGAGCCCCACAGGAGACAGGATCCGAAGCAAAGTTGAGCTGACCCGATACCTGGGCCCTGCGTGCGACCTCACCCTCTTCGACTTCAAACAAGGCATTCTGTGTTATCCAGCCCCCAAGCCCCAGTCCTTACCTGTCCCTAGCAGGAAGCGGAAGAAACCTTCACGGCCAGCCAAGACTCGGAAACGTCAGGTTGGACCCCAGAAGGGTGAGGTCAGGAAGGAGGCCCCAGGGGATGAGACCAAGGCTGATGCTGACACAGCCCCAGCTTCACTGCCTGCTCCTGGGTGCTGTGAGAACTGTGGAATCAGCTTCTCAGGGGATGGTACCCGAAGACAGCGGCTCAAGACATTATGCAAGGACTGCAGAGCACAGAGAATTGCTTTCAACCGGGAGCAAAGGATGTTTAAGCGTGTGGGCTGCGGGGAGTGCGCAGCCTGCCGGGTAACCGAGGACTGCGGGGCCTGCTCCACATGCCTTCTGCAGTTGCCCCATGATGTGGCCTCGGGGCTGTTCTGCAAATGTGAGCGGAGACGGTGCCTCCGGATTGTGGAAAGGAGCCGAGGGTGTGGAGTGTGCAGGGGCTGTCAGACCCGCGAGGACTGTGGCCGTTGTCGAGTTTGCCTTCGCCCTCCCCGCCCTGGTCTCAGGCGCCAATGGAGGTGTGTCCAGCGGCGCTGCTTACGGCACCTTGCCCACCGTCTCCGTCGCCACCATCAGCGATGTCAACGACGCCCTCCCCTAGCTGTGGCTCCCCCTGCTGGTAAACGTAGCCGCCGCAGAGGAGGCTGTGACTCCAAGATGGCTGCCCGGCGGCGCCCCCCCCGGACCCAGCCACTGCCTCCAGTTCCCCCATCACAGCCTCCAGCGTCTCCAGAGCTGCAGCCTTACACGAACCGTCGGCAGAACCGTAAGTGTGGGGCCTGTGCAGCTTGCCTGCGCCGGATGGACTGTGGTCGCTGTGACTTCTGCTGTGACAAGCCGAAATTTGGGGGCAGCAATCAGAAGCGCCAGAAGTGTCGTTGGCGCCAGTGCCTGCAGTTTGCCATGAAGCGGCTGCTGCCTAGTGTCTGGGCAGGATCTGAGGATGGAGCAGGGCCGCCCCCACCGTACTCTCGTCGAAAGAGACCTGGCTCTACTCGACGGCCCCGTCTGGGCCAGATACTGAAGACCTTGACCACACCCACAGTCAGATCAGGCCGTGCCCAAACTCCAATGAAACAGGAAACGGGCAGTGGCTTTGTGCTACCCCCACCTGGCACTGACCTTGTGTTCTTACGGGAAGGTGCAAGCAGTCCTGTGCAGGTGCCTGGC
CCTGCTACAGCTTCCACAGAAGCCCTCTTGCAGGAGGCCCAGTGCCCAGGCCTGAGTTGGGTTGTGGCCTTACCCCAGGTGAAGCAAGAGAAGGTGGATGCCCAGGAAGAATGGACACCGGGCACAGCCATCCTGACTTCTCCTGTATTGCTGTCTGGCTGCCCCAGCAAGGCAGTAGATGCAGGCCTGCCACCTGTGAAGCAAGAGCCATTGGACCCTGAGGAGGACAAGGAGGAAGAGAGCAAGGATGACTCCGCCTCCGACTTGGCCCCAGAGGAGGAGGCAGGAGGGGCTGGCACACCCGTGATCACGGAGATTTTCAGCCTGGGTGGAACCCGCCTCCGGGACACAGCGGTCTGGTTGCCAAGTCTGCAGGGCAGGCAATCGGGAAGGGAAGATGGATGTAAAGTGTGGGAGACGGAGGACACTTTGGCGTGCACGAGCAAGAGCTGGAACCGGCGAGGATGGCCTAGAACCCATGTCAGTGTCTCACCATCTCCAACTGCGATAATGTGGGTGTCCTGCAGAAGAAGCTGGTGCCCTTCATCACAGAGTTAAATACTCATCTGGCCCAGGAGTTAGAGAAGCAGAAGGAAGATCCAGGGGAAGTGGAGCAGCTGCAGGCCTGACTGCAGGCCTGACTGCTGCCCCACACCAACGAGGTGAGCCAGCAGATAAGTGACAACATGTGTGAACTGCAACAGTGCCTGGTGCGCCTGCACCAACCTTCCGAGTGTAAAAACAGTATGCTGCTGCTTCACTTCTGTCCTCCAGTTACCATGCAAACTGTCTCTTGTGGCCCATCCTAACCGGAAGCATACAGGGAAGGGAGTTCTGGGAAACGTAGCCTAGTCAAGGTGACACATTACAAAGCCACCCTGCCATGAATCAGCTCCCAAGGGTCTCACTGCTCACCTGAGGATAACTTGATAAAGCTGCGTTGCTGGAAATGCAAAGCTGAAGACCATGGATTTCATGGTGACCCCAGCAAGTACAGAAATACTGTCAAGCCTACCCAGAAAAAAACTGGCTGGTCTCGGCTATTTTTGTGTCATTCATTCAAGTAATGAGAACCTGGCCCATGGTAGGCACTGTACTTGATACTGGGATACAGGAATGAAAAAGATACAGTCCATGCAATTTTATTAAATAACATAAGTATGTATTACAAATGGTGAATGGATATCCAACTTTATCATGGAATTTAATGGTGAAAATAGAGAATTCAGGAAACTGTCGGGAGGAAAGCTCTTGCGTGAACCTTGGGGCACAATAGGAATTGGAAATAATATAAATAGTTTCTATCTCTGAGCTGTTCTATTTTAAAATTATTTTAAAATGATTTTGATTGTCCCGTTTACTGTTTTATATATTTAGTGTTTCTTTGGGGAGTGTCTTGATGGTGTAACAGTGTTGACTCTGAGAAAGTGGGATGGTGGGTGGCAAGATCAAGGTCAGGTTCTGTCGAAGGACCTTGGGCCAACCACTTCTCTAGGCCTTGGGGCTTGGCTGAAGGTGGAGGCTCACCGCTGGTCCCGGTCCCGCCCCTCCACCGTTTTAATAGGCCCCCGCCAGGGGGCGCCGGGGCCGCGGTCATCCCACCACTGCTCTGGGAAGACGCAGCCCCTCACCCCTGGCCAGGGCGGCCCGGGGGCGTGGCCTCCACCCCGGCCGAGACA\n>XM_019948349.2 PREDICTED: Tursiops truncatus tripartite motif containing 44 (TRIM44), transcript variant X5, mRNA 
\nCCTGACGGGGACAGGGAAAGTGGAACCGGGGCGGCGCGGGGGCCGGCGGCACCGCGCTCGCCGGGGCAGCGGGGGGGCCGAGCGGGCGGCGCGGCGCAGGGGCCGACGGGGGCGCTGGGCGGCTGCGCCGGAAGTGCCCAGAACGCCGGAGGAAGCACAGCGGCCGCCAGGCTGCCGAGCCGGCGGCGAGGCCCTGTGCTCCTGGGCTGGGTGCAGACTGCTGGGAACAGGCGGCAGCGGCGCCGAGGCTGCGGGACACGGCGCGGCCAGTCTGCGGGACGGGCCCCAGGTGGGGAGGAGGACGCGAGGAGGCCGCGCCGAGGCCAGGCAGCGAGCTCTGAAGCCCGGAGACCCGGGCCGCGGCACAGCTCCCACATGGCCTCCGGAGGGGGCGCGGCCTTCGAGGAGCTGCCGCCCGACGGCACGTGTGATGAGTGCGAGCCAGACGAGGCTCCGGGAGCCGAGGAAGTGTGCCAGGAATGCGGCTTCTGCTACTGCCGCCGCCACGCGGAGGCGCACGGGCAGAAGTTCCCCAGGCACCACCTGGCCGAGTACGTCCACGAAGCCGCCCAGGCCTGGACCCCGGGAGCCCGGGGGGATGGGGCGGGAGAGGAAGAAGTCGAGGCCCAGGTAGAGAACGAGAAGGCCCTAGAAAGCGAGGCGGGGGAAGAGAGCGAGTCCGAGGAAGACTGTGAGTCCGAAGAAGAGAGTCAGACGGAGGAGGAGAGCGAAGACGAGAGTGAGGAAGACAGTGAGGAAGACAGTGAGGAAGAAATGGAGGATGAGCAAGAGAGTGAAGCAGAGGAAGACAACCAGGAGGAAGGAGAATCGGAAGCGGAGGGAGAAACTGAGGCAGAAAGCGAATTTGACCCAGAAATAGAAATGGAAGCGGAGAGAGTGGCCAAGAGGAAGTGTCCGGACCATGGGCTCGATTTGAGTACCTATTGCCAGGAAGATAAGCAGCTCATCTGTGTCCTGTGCCCAGTCATTGGGGCACATCAGGGCCACCAGCTCTCCACCCTAGACGAAGCCTTCGAAGAACTAAGAAGCAAAGATTCAGGCGGACTGAAGGCGGCTATGATAGAGTTGGTGGAAAGGTTAAAGTTCAAGAGCTCAGACCCTAAAGTAACCCGGGACCAGATGAAGGTGTTTATACAGCAGGAATTTAAGAAAGTTCAAAAAGTGATTGCTGATGAGGAGCAGAAGGCCCTTCATTTAGTGGACATCCAGGAAGCAATGGCCACAGCTCATGTGACTGAGATACTGGCAGACATCCAGTCCCATATGGATAGATTGATGACTCAGATGGCCCAAGCCAAGGAACAACTTGATACCTCTAATGAATCAGCTGAGCCAAAGGCAGAGGGCGACGAGGAAGGACCCAGTGGTGCCAGTGAAGAAGAAGACACATGAAGGCCTGCCATCCCCAGTGGAAAATCATCCCTTCCCCTTGTGTGTATGTGACGGCGTATATGTAATGGCTTCTGATTCCTGTGAAAGCTGCCCAGCAACAAACGTGCTTCCACCAGATGCCTCCCCAGATCCACAGCAGGCACATAGCTCTCCAAGGAATGACCAGTTTTACTCTTGCTGACTGTGCTTCTCATTCTCTTGTCGTGATAGGTCAAGGAAAATGCCCCTTTGATCAACCAGGAGCAATTAAAGGGTCCTTCAGGTAAATCCCTCGATGGCTGCTTTGAACTTGCTCGGGAAAGCCAGCCCCTGTCATAGTGTATACCCAAACAGTATCACTTCATTAAGAAGGATCTGGAATAATCTTGAAGGGCAGTCAGAATTTGTTTCCCTACCTGCTAATAAAACCACACTTTATTCATATTGAAGCATGGAATAAATGAGGGAAAAGTAGGGGCGAATCAACCCACATAGTTCGTCTCTAAAAGTCCATTTAATACATCTGTGAAAATGTGGTTTCATGAAATAATATGGACGGCTTGAAAACAGATAAAGAGTTAAAAGTTAGAAATATATAGAGATATT
TTTAGTACATGAGGTTATCCAGGATTTCAGATTCATAATTCAGTGCTGTGGAAATGAAAA\n>JF973483.1 Nocardia cyriacigeorgica strain DSSHB7 16S ribosomal RNA gene, partial sequence \nCTGATGCAGCGACGCCGCGTGAGGGATGACGGCCTTCGGGTTGTAAACCTCTTTCGACAGGGACGAAGCGCAAGTGACGGTACCTGTAGAAGAAGCACCGGCCAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTGTCCGGAATTACTGGGCGTAAAGAGCTTGTAGGCGGCTTGTCGCGTCGATCGTGAAAACTTGGGGCTCAACCCCAAGCTTGCGGTCGATACGGGCAGGCTTGAGTACTTCAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGAAGTAACTGACGCTGAGAAGCGAAAGCGTGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGGTGGGTACTAGGTGTGGGTTTCCTTCCACGGGATCCGTGCCGTAGCTAACGCATTAAGTACCCCGCCTGG\n>XM_004257108.1 Entamoeba invadens IP1 hypothetical protein (EIN_015440) mRNA, complete cds \nATGAGTCAATTGGATGGCTATAACATGATGATTGTTTCAAAATATTTTAAAGATATTAAAGACTTTGCCACCCTCATTTTTGTGTGCAAGAAATTTTCAGACACCGCTGTTAAGTTTCATTTCAACCCAATACCTTTAACTCGAGAAACACTCAAATTCTTCCCACATATTGAAACACTCTTTTTGTACTCAATAAAAGACCCGATACTCCGTGACGGGAATATTCAAAGATATTTTGCGAATTTCACATGTAGTGTATGGGGATACAAATTCTATTTGTCTCATGGTGTCGAGTGTCGAGACGTCGGGTTTTTTTATAAAGACTGTCTGTCAGAAGAACCGCCAGCAATTCCAAAAGTAGTGTCATCCTTCAATCCATATTGTTTTAGTCGTCACGCGATGCCAACGATTATCGTCACCAAGAACATTCGAAGAGTTGCTGAGCTGTCGTTTGCAACAGCAAATGTTCGGAATGTTGTTTTTGAAAATTTGATAACAGACCTTCCATTTGGGACATTTTTGAATTGTAATCACCTCACAAACATCACTTTACCACAGACAATCACTTCTATACAAAACTTGTGTTTTTGTGGGTGCATGTTTTCCAGTATAAAAATCCCCGATGGCGTGGTTTATATGGGAGAGCAGTGCTTTTCACATTGTATAAAATTAAGGGAAATCCATTTCCCTCCAAAAGTAACAAAAATTGAAAATTATTCTTTTATAGGAAATGACGCACTTTATTTTATTGATTTTAAAAACATTAGCGAGATCGGGGAGAGTGCCTTTTATAAGTGTAAAAGTCTTCATAATATTGAATTTGGTAAAAGTGTCAAAAAACTCGGGGAAAGTTGTTTTTCGAATTGCACAAATTTAGTTTCTGTAAGATTCCCTATAACACTCACTTCGATCGGTTCGCTTGCGTTTTCTAAATGTAAACTACAACTTGTGGATATCGATTATACACTCGAAGATAACAGGGAAGTGCGTTTTGTTCAAGAAAACGTCGTGTTTCAGCACAACAAAACGCTTTTATCATTTTATTGTAATAATCCTGATATTAAAGTGAATGGAATTAATGTCATACAAAATACGCATTTTGTAATTTCAAATGCTATTTTGTGTTTGTCCAATTATTGTTTTTCAAATTGTTTTGACATCACAGAAATGGTCATTCCAAGTTCAGTTTCAAAGATTAAAAATGATTGTTTTTACCGCTGTGCAAAATTACACAAAGTGATTTTTATGGAAAACAGACAAAGTGA
TCTTATTCTTGGCCAAAACGCATTTTATTCTTGTGCTCAATTAAGTGTTATAAATGTGCCAAAAGAACTGACACGTGTTGGACAAAAGTGCTTTTCACAGTGCAATTTTTCCATTTTTGATTTTCAGAAGAGCACAAAAATAAAATCAATTAAAGCTTTTACTTTTGAAAATGATAAAATGCTCACCTCAATCCAAATTCCGTCCACAATCACTAAAATTGGACAATACGCTTTTTGTGGGTGTGAAAAGTTACAAATTTTTTTATTTCCTACGCAATTACACAAAATAGAAAATAACTGTTTTTCTCACTGTAATTTAACAGCTCTTGACTTTGCACCACTTCACAATTTGACATCAATTGGAGCGTCTTCTTTTTCGTTTTGTTCATCTCTTCGTCAAATTTCAATGGGTTCAGTGTTAACAAAACTCCCTGACAATTGCTTTGAAAATTGCGTTTTGTTGTCCGCAATTGAAATTCCACAAAATGTGACATATTTAGGAAATAGATGTTTTTCATATTGTTACAGTTTGAAAAGTGTTGTTCTTCCAGACAACTTGCGTTTTGTTGGCCATCACTGCTTTTCGTGTTGCGCAGTTCAAAATGTGATTTGGCCATCAATTGCTTCCGTCCCAAATTTCTGTTATTACAATTGCAGAAATTTGGAATCTTTCACTTTTGCTGAACAACAAAATGCGTCAATCACAATTGGTATTGCCTCTTTCTACAATTGTATCGCGTTAAAAAGAGTTTTGTTATCAAAAAATGTCACAGAAATTTGTGATTTTGCATTTTCAAATTGTAAAAAGATTTTAACTTTTTCAATCCCACAAAGTGTGACTTACCTTTCTTCTTTCTGCTTTGAAGAGCCCAACGACATGTCCGCGCTTTTCATTGGTTTTTGA\n>XR_005782624.1 PREDICTED: Puma yagouaroundi uncharacterized LOC121013303 (LOC121013303), ncRNA 
\nTCCTGGAACTCATTTGTTTCTGACTCTTCGAAGACCTCCCAAGTGTAAGGTCTTTTCCTTGTAAGACTACTCCAAACAAATGCAGTGACCTGAAGACTCCCAGAATAGGCACCACAAATTCTCTAAGAGGAAGGCTTATTTCTCTCATGCCCAGCCTTCCCTCTGCCCACCTGTCAACATGTAAACCTCGTGGTGTTTAGCCAAATTCCGTGCTTTATATGTTAGTGTCCTTTATCACATGCTATATTTCAAGGCAAATGAGCTAAAACATGATAATAACTAGCAAAAGATGCCACTCCTTTCAAGAAGGGTACCGTTTAGGCAGAGAATTATAGGGGGATAAAATGGAACAAAAACCAATAAGGCAAATCTTAAGAATATGGCCAGAAGACCATCCTCTTAGAGTTATTCTGAAAAATGGAGCTAAACACCATGTTGTCTGACTCAGAGAAGGATTAGATTTCAAGGGGAAATGGATTTGGGTCCATTTCCTTGAGAAGAGTTGCTATGAGACTGAGAGCCAGCATTCTCTTCACTGAGTGTTTGAGGGATAAATGCACAGAGCAATTTAGCAGCATTTCAGAAATGTAAAGTTCTCAGAAGCCACATTCCAAGTGAAGCAGATCTTGCTGAAGAAGTTGGGATGTGTGAGTCTAAAAAGAACGCTTTGAGCCCTCTGCTTCTCTTAGCTTAAATCCATATATGGCTTTGTTGCTGTTGCTGTTTTCATTTTAAACATAACCAAACAACACTGGTGCCCAGGAAATGGACTTCCAAAGAGAGGAGGGAAAAGCCCAAAAAATTCTTTCAGCATAAAGAAGACCAGTCTTGTTTAAATCAAAGAAAGGGCGCTGCCATCCCTTCAACAGCCAAGACCACAGATCTTGAAATCTTCTTCATCTCAGTGCTCCATGCTATACCCACACTGGAGTAACGAGGGTTTGCTCAGGCTCTGCTCTCTTCAGAGGCTGAGGTGGATTCAGCCGTGGCCTCAACTGCTTATCCTGACCAAACCCAGAGGATGTAGGAAAAGCCCTTCTCCACTCAGGAGTATGGATATCATGCAGACCCCTGGAGACACGGTGGTACTCAATAAGTATCTATGAGTTGACTTACACTGAATCCGAACTAACACAGACTTGAAG\n>XM_053456309.1 PREDICTED: Spea bombifrons ADP ribosylation factor like GTPase 11 (LOC128474053), mRNA 
\nCTTCCTGAGCTGGACTGCATTACTTTATCCTGTAGTCACCAAACTTCTGCTTTCTGGGAAACTCTTCTTAAAGACAGGATGAAAGACAGAGCACAGAAACACTGGTCTTTCAAGGCAAAGGAGTATAGGAATTAATCAAGACGTCATCATGGGAGGTCAAAATTCAACACACAAGAAGCAAGCAAGAGTTGTGATGATGGGTCTGGACCTTTCTGGAAAATCAACTATTTTATATAAACTTAAAATGAATCGTACGATGGAGACTTTTCCTACTGTGGGGTTTAACGTGGAATCCTTAGAAATGGCTAAAAATATGTCAGTAACCATTTGGGACGTTGGTGGCCAAGACAAACTTAGATCGAATTGGAAAGAATATCTCGAAGACACAGATGCCCTGATCTTTGTGGTTGACAGTTCAGATACAAGCAGACTACCAGATGCTAGAGCAGAGCTACAGACTGTCCTGAAGGATGAGAATATGTCTGGAGTTCCATTCTTAATTCTGGCCAACAAACAGGATGTGCCTGGTGCTTTGTCTACAAATGAACTGTTACAAGGTCTCAAGCTGGGAAGCTATGAAGACAGAAGTTGGGAGATTCAAGGCTGTAGCGCATACACGGGAGAAGGTCTTGCTGAAGCCATGAGTGCAGTGTCACGTCTACTAAAAAGGGCATAAAACTCCAAATGGCTGTTTAATTTTATTTGTGGCTCTTTCATATATGTAAAATATCCATCAAAATACCGTATTCAATCATGGTTTACAAGCCGGTAGATGTTACAGGTTTGAGACTCTGGGAGTTTTACACATTTCATCGTATAATTATCTACATGGATTTTACTTGAATAAGCCATGTGTTATAAAATGATACAGAAAAAAGACGATCTAAACTCCAGTGAGTTTGTTTACACTTCTGCTATATGATGTCAACATTATGTGTCATACTGTGGTATACATAATTTTTGTTAATGAGTTAATAATGAGTAATTAAAATTGCATTTAGTTATGTTTA\n>XM_023958536.1 PREDICTED: Oryzias latipes uncharacterized LOC101166636 (LOC101166636), transcript variant X1, mRNA 
\nTGTCAAGAGTCAGCTAACATCCTTAAATCATGTTAGCGTGTTTTTATTTCCGCTCCCAAATGCTTTGTTGCACATCAAAACACTTAAAGAGAGTAATGCTCTTCCAGCTCATCTTAGGGTGTGTGTAATGTCTGTGTGGGAAACATTGTTTCCTCCCACTCGTTGCTAAATTGATGTAACTAGGCGGTTGAAACCACAATTATCTGAGTGTGCCATCGCCATGGGACGAAGGAGCCTGCTGCAAGTTTGTTTGCTTCTTCTCGCCTTTTTCAAAGATATGTCCTCCCTAAAGATTCGTAATAAATTGCTGGGTAAATGCCTACAGGTGTCAGAGGAACGTGCAGGAGGAGGAGTTTCTCTAGAGGGTTGCGATCCATTTTCACCCCTGCAGGAGTGGCTCTGGCTGCCTGAGGGCCATGCTCTGCGCAGTCACCACACCGGGGACTGCCTGACTGCACCGAATGCGGAGTACGAAGGCGTCCGCCTACAGCCCTGCATTTTTACAAGTGGAGTGGTCATAGTGGATGTGGGAGGAGAAGCTAGCAGCCAGGCATGGAGCTGCTCCAAGAAAGGACACCTGACTTTGAAGGGCAGTGAGCGACACCTGACTGCTTCTCATGAATCCAGTTTAGTCTTCTTGTCAGGGGAACATAAGAGGCCAGGTAGTAGGTGGCGATCTCTGGATAACCAGACGCTTTGCAGTGGCAAAGGCATCAAACAGGACATAAGCCAACCCCAACAGCAGCTGGGAAAGACAAAGCCAGTCATCTCTCCAAGTGATGGTTCAGACACAAAGAGACTCGCCGACACATTTTCAGAAAATATGTCTTGGGGACTTGAATTTTTTCCTTTAACAGAAATTCTAGATGCGGCTACAGTGGGTACTGCTGGGACAGATTCTTATCAAGCAGGAAATATGACTCATTTCTTCCTCAGTACCAAATCCCCTCAAGATCCAACCATGATCTTTTTCACTATAGACTACGGGATGGGCTGGAAGATCACAATGCTGGTGTTGACCTCCCTGGCTCTGGTCTTAGGAGCCGTCATCCTCATCCTCAGTGTTTACTCTAACAGAAAGAAGAAGATGGTTTGTGTCGTGAAGTCGTTCAATCCCAGACCAGACATGAGTGCTCCGGGATCCCCGCTGCTCAGTGAAAGAGCCCCACTGACGGAGCACGCCATGCATCTCTCCCACTCTTCCCCCTACTTACAGCGAGGAGATATTCTAATAGAATGGAAAGATGGCACTGTTACTCCCCTGTATGAGGCTTAAATGTCGATGAAGGCAGTGCAGATGTGATTGTTTTCTGTAAAAGCACGCCGGCAGCTTGTGTGTGATTTGGCATGTTGCCCCACCACAACCAGCATCTCTCCCAGTGTCTCCTGGAAGCAAAAAAAAACAAAATTGAGAAAGTGAGGTGAAAAGAAAACTCAGCCTCAGCATTATTAGAACTAACTTTGTGAAGCTTTCAGAGTAGAATGTTAGTTTTCAAAGAAAAGTTCTTAACTGAGTTGTGATTTGACAGACTCCAAGGAAGACAAACTTTACCACTTTAGAAGCACTTAAATAGTTCAGCAAAGCCACTACATCTGTCATCTGGTATCAACCTTTGCACCAGTAAATAGAAAATTAATATTTACTTGAACCATTATGACCAGCTGACCTAGTCTCTGTTTCATGACAAACACTGCTGTGCTAACTGTTTGGCAGTGCTATGTGTGCTTTATTTTGTGAACTTAATTTTGTTTAAAAAAAAATTAAGATCCCCTGTTACTACTAAGAATCCAGATTTCTTGTCTGATTTGTAGATTTTTTTTTTTTGCAGTCTGGTGGTGTTGAAAACTGTTTCCAATGTTTTAAAGGTAGAAAGCTAACTAAATTCATTTATTAAGTGCAAACTTTTGTAATTGTGTTGAGTCCTGCATGTACACTGACTTGTTTGTCCATTCATGAGGGCTCTTCTTTAGTTGTGACAAATTCTCAGTTGGCTTAAA
AGTATTTTCGGTAGTGCCTCAACTGCCTTTAAAGATCATCAGATTTCAGAGTGAAGAACATCACAGGCCAAATTCAGAGATCAACTGAAAGATAAACTGAACCTTTGGATTTAGTTGCTGGTGGTAAAAGTGTGAGCAAAACTCAAATTAAAGAAAGGATCAGCTGAATTTGATTTGACCACAAGGAGATTAATGGATTATTGAATTGAGAGCATTGTGACATTGCTGGTAAATATCTTAACCCTTGTGCTATCCATGGCCCGTTAACATTTGGAGTGGGGTCATCTGGACCCCACAAGACAGTGCGCTAAACTTTTATTCTTCAATAATTTGTGAGATTCACTTGTGTCCATGGAGTATATGAAATCCTCTTCACTTTTATCCACCTTTGTCCTGGTAGGGAGTCAATGTAAGGGTGGGGTCATCTGGACCCCATAAGATAACACAAAATCAGAATAGGTGGGAAACTGTGTACTTTGGACTGTTACCTAATAAGGCAGGGCCATTTCAGGATCAAACCAGAAAAGCAGGTTTTGTCATGACGTAATCTAGGAAATTGCAGAATAACATCTTAATTATCTGTAACTGTGAAAGTACTCTGGAGCTTGTTTTTGGGTAACAATAACTGGGTAACAACTGGCATCTTGTGAAAGGGGACACGCCCTCTCCTTTTATCAGTCGGGAAGCTTCTGTTATCCGCATTGCTTCACAAGTTATCCCAGGAAAAAGAGAAATAATAGTTTGTTTAAAAACAAGAAAACTAACAACAAATCACAGGAAAAGTTTTTGTTTTAATGTTTTCTAGCCTGTAAACAAGCAATAAAATGAGTTTTATACCTAA\n>XM_018291179.1 Pochonia chlamydosporia 170 vacuolar ATP synthase (VFPPC_13402), partial mRNA \nATGGTCTCCGAGCTTTGCCCCGTTTACGCGCCCTTTTTCGGCGCCATGGGTTGCACCTGTGCCATTGTCTTCACCTGCCTGGGTGCTTCTTACGGTACCGCCAAGTCTGGTGTTGGTATCGCCGCCATGGGTGTCCTCCGCCCTGACCTTATCGTGAAGAACATTGTTCCCGTCATTATGGCTGGTATCATTGGTATTTACGGTCTGGTCGTGTCCGTCCTTATTTCCGACGGTCTGAAGCAGGAGCTCCCTCTGTACACTGGTTTCATCCAGTTCGGTGCTGGTCTGGCTGTCGGCCTTGCCGGTCTTGCTGCCGGTTTCGCCATCGGTATCGTTGGTGACGCTGGTGTCCGAGGAACTGCCCAGCAACCCCGTCTCTTTGTCGGCATGATTTTGATTCTCATTTTCGCCGAAGTCCTGGGTCTGTATGGTCTCATTGTTGCTCTTCTCATGAACTCTAAGGCTACCCAAGATACTGTCTGCCAGTAG\n>MN512539.1 Penicillium crustosum strain MMS small subunit ribosomal RNA gene, partial sequence; internal transcribed spacer 1 and 5.8S ribosomal RNA gene, complete sequence; and internal transcribed spacer 2, partial sequence 
\nTTTCCTGAACTTGCGGAAGGATCATTATCGAGTGAGGGCCCTCTGGGTCCAACCTCCCACCCGTGTTTATTTTACCTTGTTGCTTCGGCGGGCCCGCCTTAACTGGCCGCCGGGGGGCTTACGCCCCCGGGCCCGCGCCCGCCGAAGACACCCTCGAACTCTGTCTGAAGATTGAAGTCTGAGTGAAAATATAAATTATTTAAAACTTTCAACAACGGATCTCTTGGTTCCGGCATCGATGAAGAACGCAGCGAAATGCGATACGTAATGTGAATTGCAAATTCAGTGAATCATCGAGTCTTTGAACGCACATTGCGCCCCCTGGTATTCCGGGGGGCATGCCTGTCCGAGCGTCATTGCTGCCCTCAAGCCCGGCTTGGGG\n>XM_002370192.2 Toxoplasma gondii ME49 ribonucleoside-diphosphate reductase large chain mRNA \nCCGTTTCTGGGTCGTTTTTTGTCTTGGCGGTTCTCTTCGTGTGACGCGTGGCGCAGAGTTTGTCCGTTTCCGTTTGTCAAAATTTCCGTTTCCGCGTCCGCGGTGTGGGTTCGAGCACCGCTGACCAGCTTGCGTTTTCCACCGACGAAACTGACACATGCGGTGAGCCTTGTTTCGTTCTTTGCGCGCCGAAGCGCTCGCTGCTGGTTTCCCGCGCCTGTCTGGAAGAAGACGCCGTTCTCTCTCTGTGGATACCAGACGCCGTTAACGCTGCTGCCAGACAACTTGAAAGTGTTTTTCCGAGAGGGCTTTTCCGCAGTTCCAAAACATTCCACCGTGTTTCTACCGTTTTGTCGGGCTTTTTCGCGTGCACGCATTTCCGTGGGACAACCATCGTGGCCCCTGCTCGTCTTCCACTCGCCACCGTAAAAGCTAGGTTTCCATCGCACCGTCAGCCACCGTCGACCGTCCACCCGCCCTCCCCCCCTGGCGTGGCCCGTCTCGCGACTCACTTTCCTCGGAACCGAGTCGCGATTGTGTGCAACGAAGAGCGAATTTTCTCCATTTCCAACAAAAAGTGTCTCAACGAAGCGGAGAAACATCGCCACACTACTGTTCTCCGCCCCATTCTTCCGCATTTCCAACCTGTATAAAGGTATCCCCTTTTCTCTGTCGCGGATGTGTGTGTGTTCTAGCCTCTGTGTATCGGTATGCGATGTCCAAAAAGTAGCTGAGTGCGTTGGCGTCTGTGTGTGCGTTTCCTGTTGTCTCCTTTGTCCTCGGAGTCCCTCCTTTTGATCGTTTCCAGATTGTTTCCTCTTGGCGCTCGCCAGCCTCCGTTCTGTCGCAGACTCAAAACCGCCGTGTCCACCCGCTGTTGGCGGCTACACACCCGCCACCTTTGTCTTCTATCGGTGTACACACCCCCCTCCCACACTTGCGTGCGTTGCAGAGAACGCATTTTTTTCTTTTTCCCCGCTTCCCCGCGTTTCTCTCCTCAGTCCCCCTTTTCCCAGTGCCCCCGGAAGTCGCTCGTGTGCCCGTCTCAACTCTGGTGTGCCTGTCGCCTTCCCGCCGAGCAAAAAAATGGAAATCCCGGCGCCCTCGAGTCCGACCGCTCTCAAGGCGGCCGTACCCGTCTCGTCTCCGACCATGGCTCTGCACACACACGGGTCTCTCAGCAGTTCTTTTTCAGAGGCCGTTTCGCCGTCCAAAAAGACAGGATCTGCTGGCGCCTCTCCCGTCCACGGCGCAGGTCGTGGCATGTACGTCGTCAACCGCCGCGGCGAAGAGGAGCCTGTTTCCTTCGACCAGATTCTGAAGAGAATAGAGAAGCTCTCTTTCGGCCTCCACCCTCTCGTCGACCCCGCTCGCGTTGCACAGGCCGTTATCAACGGCATGTACGCGGGGATTCGAACAAGCGAGTTGGATGACCTGGCTGCACAGACCAGCGCTTACATGGCCGCTTCTCACCCTGACTTCTCCAGACTGGCTGCTCGGATCGCCATCGACAACCTCC
ACAAAAACACAACAGACAACTTCTTGACTGTCATCGATCAGCTGCATGGCTACGTCGACAAACTGGGGCGCGAGGCGAAGCTCGTCAGCACTGAGGTGTACGAATTCGTGAGGGAAAATGAGCAGGCGCTGAACGAGGCTCTGAACTACTCCAGAGATTTCGACTACGACTATTTTGGATTCAAGACACTGGAACGGTCGTACCTCCTGAAGATCCACGACCGGATTGTCGAGCGTCCCCAGCACATGCTCATGAGAGTCGCATGCGGCATTCATTGTGGGGATGTGGAGAAAGCAATCGAAACCTACGAACTGATGAGTCAGAAGTTCTTCACGCATGCAACGCCGACCCTGTTCAACGCCGGCACCCCCCGCCCACAGATGAGCAGCTGTTTTCTGCTGACGATGCAAGAGGACTCGATCGATGGAATTTTCAGCACACTGAAGCAATGCGCGTTGATTTCCAAGACAGCTGGGGGCCTCGGTCTCGCCGTGACAGACATTCGAGCCACAAACAGCTACATCCGAGGAACGAATGGCTACTCGAATGGCCTTCTGCCGATGCTCAGAGTCTTCAACGACGCCGCGCGCTACGTCGACCAGGGCGGCGGCAAACGCAAAGGCAGCCTCGCCATTTACTTGGAACCTTGGCACTTTGATGTTTTTGATTTCCTCGACATCAAGAAGAACCATGGCAAGGAAGAGCGACGGGCGCGCGACCTCTTCTGCGCCCTCTGGATCCCAGATCTCTTCATGGAACGTGTGAACGACAACGCGGGGTGGACGCTGATGTGCCCTAACGAATGCCCCGGTTTGACGGAGGTGTGGGGCGACGAATTCAAAGAGTTGTACGAGCGCTACGAACGCGAAGGTCGAGGCCGGAAGACGATTCCAGCTCAGCATCTTTGGTTTGCGATTCTCCAGGCGCAGATCGAGACGGGGACGCCGTACATGCTGTACAAAGACGCATGCAATCGGAAGAGCAACCAGAAGAACTTGGGAACGATCAAGTGCAGCAACTTGTGCACAGAAGTCGTCGAATATACGAGCAAAGACGAGGTGGCTGTCTGCAACTTGGCCTCCGTCTCGCTGCCCAAGTTCGTGGACCGCGAGAGCCGAACTTTCGACTACGAACACTTGAAGCGAATCGTCAAAGTCATGACGAGAAACTTGAACCGCGTGATCGATCGAAACTACTACCCAGTCCCAGAAGCGAAGAAGAGCAACTTGCGGCACCGACCTGTCGGTTTGGGAGTCCAAGGTCTCGCAGACGCCTTCATGCTTCTTCGCTATCCGTTCGACAGCCCCGAAGCTCGCGTCTTGAACAGAAACATCTTCGAGTGTATCTACTTTGCCGCTCTCGAGGCCAGCTGCGAACTCGCCGCCGAAGAAGGCCCCTACGCGACTTACGAGGGATCGCCGGTGTCTCAGGGCATTCTCCAGTTCGACATGTGGGGTGTGACTCCGTCGAGCGGTTTGTGTGACTGGGATGGTCTGAGAGAGAAGATCAAGGCACACGGAGTGAGAAACTCGCTCCTCGTGTCTCCGATGCCTACGGCCAGTACCTCTCAGATTCTGGGGAACAACGAGGCGTTTGAGCCGTACACTTCCAACATTTACTACCGCCGAGTGTTGAGCGGAGAGTTTTTCGTAGTGAATCCACACCTGCTGCGAGACTTGCTCGAGCGGGACCTGTGGTCTGAGGACGTCAAGCAGCAGCTGATTGCGCACAACGGCAGTGTCCAGAACATGGACGTCATCCCAGACGACTTGAAGGCACTGTACAAGACCGTTTGGGAGATCAAGCAGCGCGTCGTCCTCGACCTGGCGATCGACCGGGCACCGTTCATCGACCAGTCTCACTCGCTGAACATCCACATGGTCAATCCAACCTACGCGAAGCTCTCCACTATGCACTTTTACGGCTGGAGAGGCGGCCTGAAAACTGGGCTGTACTACCTCCGGACGCAGGCGGCAGCGGACGCGATCAAGTTCACTGTC
GACTCGCAACTCGCCATGAGTGCGAAAGCGAAACTCAGCGGCGCCACTGTGGGAGCTCTCACGACGACCAGTTCCGGCGCCGACGAAGACAAGCGACAAGACGTCGCAGAGACGGAGAAAATCGAGCCTGTAGCTCCCGTCTGCAGGTGGAGACGTACAGGCGCTTCTCCAGATGAACCCTGTGAAATGTGCTCAGGCTAATCGCGTGCGTCAGCATGCAACGTACATATACACATATATATACATATATACATATATATATATATATATATTTATTTATTTATATATTTATTTATTTATATTTACATATAAAAATTTGATATAAACGAAAATGCATATGCATACACTTGTACACAGCCAAATGTGTTTCCATATGTATAAGTGTGTGAAGAGTGTACAGTTGTCTCGTAGAGGCGGACGGATGGGGATTCGATCTTTTGGGCTGCTCAAGGTTGCATGCGTCGCTTCTGAAAGCAGAGGGGGAAAAGAAGCACGGTGAGGAGAGTCCGAAACATTCTGCGCGGGCGTTTCTACAACTTGGCACTCGCGAGAAAACAGTGTTTGTCAAAAACAGAATTCTTGGGTCTTGTCTGAGTCGCGGAACCTTTTGTATTTACTCGAACGTTTGTACGAGAGAGCCCTGAGTCCTCAAATGTCGCTCCGGTGTGCCATTTTCGTGGTTTTCGAGTTTCCACAAATGCACATGCGATCGCATTTTATACATGTCGCTCTGTGCATTCACCTATATGGCTGTACAGAGAGAGGGATGATTTCCTTGCGCAGGACTCTGGGATTTGTCGACTTGTTCGTTTCTTCACCTTTGGCAAGTTTTACGCCTTCCAAGATCCGATTCACTGTTTAAAATGCGTTTTTTGTGTAAGGTGCACTTGTATGCAAAGAATCTTTCGCACTTGAGAATGGGTCTTTTCTGGCCTTCGTTTGTATCACAGTGACGCGACTCTTCTTCGCTGCAGCACTTTGTGGGGAGTCTTGCTTGTGCAGTTCTGTTTTGACAGGGAAAAGACCTTTGAACGTTTCGAGAAAGAGCGGAGAATCTGGGGACTTGGCCGTCTCTCTAGCTCCGTTTGCTTGACTTTGTGTAACTGTCTGATGCTCTCTTCGCGGCACCGTATGCGCGCCTGTGCATGCGAAGCGACTCTCACGGGCAGAACCGACAACGAAAAGGAACATCCATTGAGAAGAAAAA\n>XM_037917243.1 PREDICTED: Penaeus monodon D-dopachrome decarboxylase-A-like (LOC119568800), mRNA \nCTTGGGTCTCCCCTTTTAGTCAGCTGATAAATCCCGTCCTAGCAACGTTAGTTGGAATAGCTTCCAGTGACAGCATTTTTTTTTTCTCTCTTTCTAAAGGGATATTTCAGATATGCCTTTCGTGACGCTGACTACTAATCTGTCTTCTGAAAAAGTGGACAAGGCTTTTTCTGAGAGCTTTTCGGAAAAGTTGGCAGAAACTTTGGGGAAGCCCATAGAACGTATTTCAGTGACTGTAGTGGCTGGGCAGCAGATGTGCCGAGGAGGAAGCTGGGACCCGTTGTGTGAGGTTCACGTGTTGGCCATTGGACTCGATTCCGCCGAGAAAACCCAGAAGCCAGCTGAAGAAATAACCAAATTCTTGTCTGACCGTACTGGGATTCAGCCTGCAAGAATCTGCTTAACTTTCCGACCAGTGCTGCCTCATCAGGTTTCCGTCAATGGCGCTTTAATGGGATGATTTCAACAGCCAGTGAATGGGACTGCAACCATGAGAGAGTATGTGGAATGATCTAGCAATAAACTATTCTACAGTT\n>XM_040043500.1 PREDICTED: Simochromis diagramma methyltransferase like 3 (mettl3), mRNA 
\nACTGGTTTAGTTACCAACATGCCACTTTCGTAGACTGAGATATATATGTATTATATTTTACATCATATACCCTCAATCCTAAAACCACGACAAATCACTACGAAAGCGGAACGTTCAATCCCAATCAACCCGTGTGCTACCCGACACACGTTTTCGTGTTGCACCGTACCCGCTTCCCTCCAAGAGTGGACTGGATTCAACTTTTGTTTAGTTTCCCGGACACTCGGTGCTCGGTGAGGCCAGTATTGGTGTTTTTCCTTCAGCTGAGTCCATTTCGTCATGTCGGACACATGGAGCAACATCCAGGCGCACAAGAAGCAGCTGGACTCTCTGCGGGAGAGGCTGCAGCGACGACGGAAAGACCCGGCTCAGCTGTCCGCCGATGGTGGTGGCAGCACAGACGGCACCACAGTCAGGAGTGACAGCCCTGCCCCAGCAGCTCCGTCCACCTCGCAGGAGGAAACAGAAAAACCACCAGACCCTGAACTGGAGAAGAGGCTGCTGGGATATCTGTCTGATCTGAGTCTCACACTGCCAACAGACTCCCTTTCCATCACAAATGAACTCAACAGTTCAGAAACAGCCGTTAGTCACGGCTGCATCCAGAGCCTGCTGCTTAAATTCTCTGCTCAGGAGCTCATCGAGGTCCGAGAGCCCACCTCGGCTCCTTCTTCTTCTACAACTTCCTCCTCCACGTCAACCCCCACGGTGGTCGTAGCTGTGGACCACACAAAACTTTGGGCTATGATTGGATCTGTAGCTGGAGCCCAGAGAACTGGAGTCAAGAGAAAAGCAGAAGACCAAATGCACAGCAAAAGGGCTGCAGGCTTCTCGCCCTCGCTTCAGAGCTCTGCTTCTCCTCCTCACTCGTCAACCACATCGCTGACGCCGGCCTCCTCCTCAGAGCCGGGGCCTTCGGCGTCAGGGAGCGGGACGGAGAAGAAGGGCAGGAGCAGTAAAAGCCAGTCGTCTCATTTGGACATGGAGATCGAAAGCCTCCTGAACCAACAGTCCACCAAGGAGCAGCAGAGCAAGAAGTTAAGCCGAGAGATTCTGGAGCTGCTGAACGCCAGCACAGCCAAGGAGCAGTCCATCGTGGAAAAGTTCAGATCCCGCGGCCGAGCTCAGGTCCAAGAGTTCTGCGATCATGGGACCAAAGAAGAATGTGTTCGCGCTGGAGACACGCCTCAGCCATGCACCAAGTTACACTTTCGTCGCATCATCAACAAGCACACAGACGAGAGCCTCGGCGACTGCTCCTTCCTCAACACCTGTTTCCACATGGACACCTGTAAGTACGTCCACTATGAGATCGACAGCCCCCCGGAGACCGAGGGGAACCTGCTGGGGCCCCAGGCGGGGACCACAGAGCTTGGTCTCCACGCAGGGGACGCCGACAGCAATGTGGGCAAACTCTTCCCTTCACAGTGGATCTGCTGTGATATCCGCTACCTGGACGTGTCCATCCTGGGTAAGTTCGCCGTAGTGATGGCTGACCCTCCCTGGGACATCCACATGGAGCTGCCCTACGGTACTCTGACCGATGACGAGATGAGAAAACTGAACATCCCCATCCTGCAGGATGACGGCTTCCTCTTCCTTTGGGTCACTGGCAGGGCTATGGAGCTGGGCAGAGAGTGTCTCAGCCTTTGGGGCTATGAGCGTGTGGATGAAATCATTTGGGTGAAAACCAACCAGCTCCAGAGAATCATCCGCACCGGCAGGACGGGTCATTGGCTGAACCACGGGAAGGAGCACTGCCTGGTTGGTGTAAAAGGAAACCCGCAGGGGTTCAACAGGGGTTTGGACTGTGATGTCATCGTGGCAGAGGTCCGCTCCACGAGTCACAAGCCAGACGAGATCTACGGCATGATAGAGAGACTCTCACCCGGCACCAGGAAGATTGAGCTCTTTGGTCGACCCCACAATGTCCAGCCTAACTGGATAACTCTCGGGAACCAGCTGGACGGCATTCATCTGTTGGATCCCGAGGTCGTG
GCTCGGTTTAAGAAACGTTATCCAGACGGCGTCATCTCCAAACCCAAAAACATCCAGTCATCATAACTGCTCACAACTCTGAAGAAGTTTGTTTTCAAACTGTTTTATTTTTTTTATACCTGTAAACATTTTTTTAATAAATATTGTCCACTAGATGCCCCGTCTCCATCTTGCCTGTGTACTTTTCACGGCTTCTCTGCACATTATCCATAATGATCGCATCGCCGGGCCTCCACACGATACCATATTATTGCTATTTTTAGTATTTTGCGATAAAACATGCAACTTATCACATTTTTTCAACAACAAATTGTGTCCTCAAAGCTAAAAGTTTGTCATCTGTTTCATCCAGTAACATAAAGTTATCTCACTTTATTTTTTTCCTGCAAAATGAGACTGTCAAGCAGACCGTCACTAAAACCTGCCATAAATGTTGCTATAAGAGCGAGCACGTCTGATATCAGTCCACAAGTTGGAAGTTATTTGCAATTTGTTTCTGATAACACTCCAATTAACTGCGATAAATCATCAAAACTCACATCTGCTGTTGTCTACACAAACAGAAATTCACATTTAACTATTAGATTTGCACTCAGTAAACTTCCTGTTCCATAGTAATATAACCAGAAAACAAACAGTAGGCAGCCAGTCGAGTTGGGCTCATGTGCCTGAGCTTATTCTGAGTTAGGAAGCAGCTTCGTTAAGGTCAGTGTCCAGTGTTGAACCGCGAGTTTGCTTAGGTGATGTTTTTTGCAGATGGTCGTGCACGAGAGGAGCCCTCTTGTTTGTAGCATTCCTGGAGTATTTGAATTTAGTTTTTAGAAAATGCCAATATTTGGTATCCTTGTGTCTTTACAACATTGTCAAGCAATATATCCCCCAGCCCAAAAAAAACACACCGGAGACATTTTGTTACAACTTATTTTATATTTGCTTAGTTTAGAATGAAGATATTTTTGACGTACTCTGGATTTGAACAAGTGATCATTAGTCTTTTTTTTTTTTTTTGATCAGCATTTAACAGTCATAGCTTTTCAATTTGGGCAAATACAGAAAGGTTTTCTTACAAAAAAAAAAAAACGTGCATTTTAAAAACACAGCCAGAGCGTCTTTTTTTCTAATTAAAAATATTGATCAGAATCAAGCAAGACTAAGAAAATACCTATCAGAAATAAGCTGCTGTGTAGCTCGGCTTATTTCATACGGTTGCCCTGTGGTGCACAACACAACTGGATTTCAGCAAGCCTTTCTGAAAGTATCAGGGCCACCGTAGATCTCACAGATGAACTATTAACTATTAACAACACTGCTGTTAAACAGGCTCAGACCTGGTCAGCAGTTAATGTCTTTTATAAAACAGCAAACCATTTTCTGTTTTATTACCTCACTTTAAACTAGCAGGGTTCTGTGTCACAGAGCAGGATTAGAAAGTTAATTCACGATGATGACTTAATGATGAGGTTTAGATAGTCACACACTTCATCACACTCAATGCTATCTTCCTCCTCTCGCTTTGTGAAACAGCCTTAATTAACTCCAGCCATGATCTAATAAGCAAATTGATCTTTTTCTACAAAGGTAGTCAAAAAAAAAAGAAATATAAAAGAAACACAGTAAAAAAAAAA\n>AY653294.1 Chlamys farreri ferritin CFB mRNA, partial cds 
\nATCAACCGGCAGATTAACATGGAGTTGTATGCCAGCTACTGTTACCAGTCCATGTCCTTTTACTTCGACCGTGATGATGTCGCTCTCCCTGGCTTTTCAAAATACTTCAAGAAAGCCTCAGATGAGGAACGTGAACATGCCGAGAAGTTCATGAAGTATCAGAACAAGAGGGGAGGCAGGATTGTCCTTCAGGACATCAAGAAGCCGGACAAGGATGAGTGGGGAAGTGCCCTGGAGGCCATGCAGGTTGCTCTGGCTCTGGAGAAGAATGTAAACCAGTCTCTCCTGGACCTCCACTGTGTTGGGGACAAACATGGCGATTCTCAGTTCATGGACTTCCTTGGGGGCGAATACCTGGAGGAACAGGTGAACGCGATCAAGGAGATCTCTGACCATATCACCAACCTGAAACGCGTGGGACCTGGACTCGGGGAGTACATGTACGACAAAGAGTCCATCAATGGATCCTAGACCAGAGGCACCCCCTGTGGAAGCTTCTAGCAGTGTTGAACATTTTGCCCAGAATGTGTTGTCTACTAAAATACTATATAACCACTCAGTAACATGTGAATTATAATATTCCTGGAAGAACTTTCTAGAAAAATCAATGCATAATACACAAAAAGAAAAAGAAATAATGGGCACAAAAGAAAAGTTGAAAAAAAAAAAAAAAAAAAA\n>XM_025196037.1 PREDICTED: Alligator sinensis chromosome unknown C5orf24 homolog (CUNH5orf24), transcript variant X2, mRNA \nTTATACATGTTTGTCTCCTTTATTTTGGTAGAAAATGATGCATCCTGTTGCCAGCAGTAATACAGCTTTCTGTGGGACTGGCAAGAGTTCTTGCCTTAATGAAGACAACGTGAGAGCCACTGACCAGTTTGATTTATATTCCACACAGCAAAGCAAATACAGCCACGCAGTCAGCCACAAACCAATTGCATGCCAGAGACAAGACACGTTAAATGAATCGCACTTGCAGACCACAAGTGGCAGGAATATAGAGACAAAAGATGAACTAAAGAAAAAGAAAAACCTCAACCGGTCTGGCAAACGTGGAAGGCCTTCGGGGACCACAAAATCAGCAGGGTACCGAACCAGCACAGGTCGACCCCTTGGGACCACCAAAGCAGCTGGATTTAAGACAAGTCCAGGCAGACCCTTGGGTACAACTAAAGCTGCAGGATACAAAGTCAGCCCAGGGAGACCTCCAGGAAAAAAGCAGCAAGCCTTCAGGTGTTCCAGTGATGCCTAACACATAATGAGCTGGACTTTATGCTGTACTTTACAATAGAATACTAGCAGCACGGTTTGGCAGGAAAAAGAAAGATGGCTGCCATCAGAAGGTACCTAACTTTTAATCCTATGGTGGTATTTTTCAATATCAGCAGTTGGCTTGGTCATTTAAGCAACAGTCTTTACATGTTACATTTACTTCAAATTAATCAAAGAAAACGTCAAAACCCATTGAACAGCTCTTTTCTGAAGTGTGCTTTTGTTTTGCCAGAAAGATTTTTCTTAAGCGTTCAGTCAAGACCCTACCAAACCAAGTCATTAAGAAGTGGTGTGTCTGAGAAAAGAATCACTTTGCTCTAAAATACATAAAGTAATTCTGATCAGAACTTCACTTTTTTTCCATTTCGAAGAGCTTTAAAAGGCAGAGCAGTTTAAGGTTATTTGTCTATTGGTTTCATTAGTTATGACTCTGCTTTTTTGTTACTATATGTACAGTAATGTTTCATACTATCCCTATAGACGATTACAAATAAAACAATCGCAATTGTAAAGACTTTGAACTGCAAACATTGTTTCTGACCACAAGATAAGTTTGTTCCTCTTTTTTATTATAATGCATATATTTTAACATTGCTTAAATATATTTATGAACTCTAGTTAGAGACTAGAGCTTTTTCTTTGCAATTTTTTCCAAGTAGGTAAATCTTTTT
TATGAAAAATATGATGATGGTATGATCATTTTTTAGGAATGTTATGCTCATTGCTTGGTAATTTGGACCACTTTATGATTCTTTATCTTTTACAATTTGCTTTTCCACAGGTTCATTTTGGAGGAAACAATTATCCATTAAGTAACTAATATCAGCACCCTGCCCTCTGCTGTAAAAAGCCTGATTAGATACTGTGTATGTTTTTATGTCCATGAACTTGAGCTACTCGTGTGCAATTATGTGTATGGGAATGGAGTAGTGTTCATGATCTGTATTTACATCATCATATGGATGTATATTTATTAATAAAGTCAGTACTTTAAAACCAAA\n>XM_009169100.1 Opisthorchis viverrini hypothetical protein partial mRNA \nACTTCCGGCCGTGTGAGAGTATACAGCGTGCTCTCCAAAAGCTTCCGTACACCTAGTGGTGTCCGTCAGGGATGCTCACTCTCTCCACTCATATTCAAATTTGTTATCGATGAAATAATGCAACTAACGCTGGAATGTCTTCGGAACCCCGGTGTTCAAATAGCCTGTGACGAAAACCTTGTCGATCTGGAATATGCAGACGACATCGTTCTCATCTTCAGAGAAGAGGTGAAGGCGCATGTGTTTTTGGATGAACTCACGAAAGTCATTCCGTCCTTTGAAATGCACTTTGCACACACAAAGTGTAAAGTCATGTTCATGGACATGCAGCTACTGAACACGCCACTTACCATCCAAACCCTGCGTTTCAATATCGTTTCGGATTCTGCAATAAAACAGATGGAATTCGTGCCAATAGCAGAAAGTGCGATTGTAGGCGCACCAGATTGGTTTCTTTCCGGGGCAATTACAACGAGCAACTCACATTTGCGCGGGGATGTTCGATCTGCTCTCGTGGCCTTCTCCTCCAAACCCTACGTTCATATATTTTTGGTCAAAGTCAGGTCCGCAGAACAGCATGACGTCAGCTCAGTAGTCTACGTAGGTCAGATTCAAGCACACCACGAACGTATTTCAGGCTTGTCCTTTTGCGAATCCGTGAATTTTTCATCTTCATCGGATATTCAGATGTTCTCTTGTGGACAGGACGGACTTGTTCGACATTGGAGCTATCACAGTCATGAGTGGTTGCTCACCAAAGAATTGAATATTCGTTCATTCAATGAATCGCTGCTTCCCACATGCCTGGATACAATTGTGATCGCTGACCAAATTCTCGCTTTAGTTGGGACAAACAAAGGAACATTGCTTGTTTGGGCTGTGTTTGCACTATCCACTGAACCCGTCTGCTTGACAAAGAAATTCGAAAATGATTCAGCGACAACTTGTGCTTGGGAACCGTGCAACTTGTCGGGTTGCATACGCCTGGCGATTGGATACAAAAAGGGGATCATAGGAGTTTACCTCTATCAACATTCCTCTGTGACCGCAGCGTCTTCCTTGACTCAACTATCTCGTTTCTATGCCCACGAACGGGACATATGTCACGTTGTGTGGAATCCATCTGCACACGGATACTCAGAAGTGGCAGCGTCGGAACCAGAGTTATTATCTACTGGACGGGACCAGATGGTTAAAATATGGAACATTGCCAGTTCGTGGTGTTGTGGTTCGGTCAGAGTTCCTGGGAGTGCACGTTCAATGCCAAAAGAATCGGATTCATCCAACCTGACAAAAAACCAGTCTACAGGTGCTCCTTGGATATCTGCTTGTTGGTTCCCAGAAAAAACGGACAATCCGGGCAGAAATATAGTTGTATCCGGTCTTCGAGGTGAATTGTATAGCTGGTCCGATTCGTCACAGCTGGTTCGTTTACACACCGAGAACCATGGTCACTCAATGCTTGTTTTCGCTATTCGTTCTATCCCTGATATGGACGGATTGTTCTTCACAATTGGCCAGGATCGTCAAGTTATTCTCTGGACATATCGTTGTCCGACTGACTTGACATTCATGCTTCGTGTGCCTACTATA
GCTGCTGGTATCTCTGCTTTGGCACAGTCGGACCACGGACATGGACCAATTGCAGCAGGCGTGGCAGATGGATCAATTTTATTGTGGCGGCACTGCAGCTCTTTACAAGAAGAATCTTCTTCAACGAACCCGGTGACTTCTTACTGGCCACGTGGTGTGCACGGCAGCTGTGTGACTGCCTTAGCTTGGCATCCTTCAGTTCGCCATGAAAGTCTACTTGCCTACGGAACCGAGTCAGGATGTGTGGAACTCATTGACACATCCAAAATTCCCAAAAGTGCTACTCAGAGGTCGAAAACGCAGCCATATATTTTTGGATCAACCGTCTATCGAGTTGCTTGGGGACCTCCACTTTTCACAGATTCAGGGAAGGATCAGGTTGTTGAAACAGCTGTCTCAGAACACGATGCGAATGGTTCGACAGATAGCACAGATACGGTGGAACAAAAAGACTCAACAAACAAATCCTCGAGTACTCCCAAGTTCTCATCTTATATATACAGCGTATGCAAAGGGAAGATTTTTTGCCACGTTGGCTTCCAGCGACCACCTTTGGATGTAACTTTGAAGTTTCCCTCTGTTCCCGGAATCTCTACAGAGGACTGGGTAAATGACAAACGAACCGACATCGCGTTTTTATACCTGGAGAATTCCACCCGTTCCGTTGACAGTCCTTCTGAAGAGAATGAGATCCGCGAGTGTTTCAGCTGTTTGATCACCGTCGGCTACCGATCTGGGTCGGTGGATGTATACGGACTCGTGAAATCGAAGGAGCATGTATCGGTCGACCTTATTCGACCATTGTGTCGTATTTCTTGTCATACGAAGGGTGTCAATTGCTTGGCTTGGTCCTTTGACCGCTACTGGCTTGCAGTTGGCACTAATGAGTCCTTCATCACTGTAACTGATGTTGGGCACATTCTGAAACAAGCCACGAAACCCAATAATCCCTCTTTCCGACAAATTTCAACTTATTTGGCACATCTGGAGGGCCACGGCAACAGGATCACATGCTTGGACTGGTCTCCGCATGAAAATGGTCTCCTGCTTTCCGCTTCATTTGATGGCACTGCAAATGTCTGGAAAGTAACTCATAGTGACACCGAGTCAGGTTCCACATCTGTAGCGAATTTTCGAGCTCATCGTCTTCGCCTATTTGCCTGTCTGTGGAGTCGTCAGGAGGCGGACCTGGCTTTTAGCGGTGGTGAACTCTGTCACCTATTTAGCTGGCGTCCATCCAAACTCGCACATAAAGAGCCACCTAATTCCCGTCGTTATAGGCCTCCTTCAGTTAAACGTGTGCCCACCGATTCAAAGGATCCCTTAATGCCGTCGGGCATTCTCGAGCCTTCGGCCATTGTTGTCACCTCACAAGAAGTAAATCATACGGAATGTGTACCAGAGCCCATACATCACACTGATACGTCCGTTGGGACAAGTGTCCCACTTGAACTACCGGTGAAATCTGTGACTACGAAAAAACCTGGTTCAGGGGACAAACGCAAGCGACCGTCTTTGTGTCCACATTTTTTGCATCGCGGTTCACTTGAACCAAGTACGACGGATCTGGGATTTTGCCCTCCTTTTCGCCTAGGCTCAAGGTTTCTGCAAGTATCGCACGTACTAAATCTGTTGAAAAACGATGTTGATCTACCTGAATCGGACTGCGATCTTCTGTTCCTATTGCCAGAAACAAACAAAACACGATCAGCCTTGGTGCGATTTTTGACCAGTGAAGCAACTCATCATCTGTCAGCATATCGTGCAACTCAGCGATCTAATGGGCTTATGCATTTGGATGCTTATTGTATCATTCTTCTATGGCTTGGACGTACTCCGTTGGTTGCGCAGACAATGTGTTCTGAGAAACACATGCCCTTTTGGTTGCTTTGGGCAGTTCAATTGGCTCAAACAACCGTACCGGCCTTCTCCGCTCCCCGAAACTCATCAGGTGATCACGCGGATATAGATCTAGCTGGAGAAAAGGTCAAGGATATGAC
AAGCAACAGCCCTGATGTTTTGGTGTCTTCCACGTTACTTGTTTGTGCGGGTCGACATCAGGAGGCCGTTGATTACCTATTTGCACAAGATCGAGTGAAAGAAGCCTTGTTGCTTGCACGGCTCAGACTCAGTCCCATGGACGCGAACTCAGCAATGCAGAAGTGTATTGCTCGCATCATCGAACGGCGGTTGTGTCCGGAGGTTCCGTTCGTCAGAGTTTTACATGAACTTGGAGCTGGCGAGTGGGAGCGGGCACAGACAGTTCTACGTCAGGCAGCCGTAGTTTCCCTTTCACGCCAGGACATGGAAGTTGAGCAAGTTGCAAGTAGCTGGGTAGAACTTAATATTCTCCTCAGCTGTCCGGATGACAGTTTACCGACGAATGCGTTTGTTCGATTTGCTTTAAGCTGTCTGGCCGTTGGCTTCCAGTTGCCAGAAGCACAATCCATAGTTTACTTTCAGCGGTGTCAAGAAGCTGTGACTCTGTCAGCTGTCTTGGCTACTGGGACGGATTGCTTTCGACTGTTGTTAAATACTGGCCTTCGGTTTGCTGCTATTCTTACTGGCTCTTCTCAAACAGAACTCGAATTGGATATGGAACTACATGCAGATGTGAGAGATATTGTACACTGTCTTCGCTACGCAACGCTTGATCGTCAGCCAGCGAATCAGTGGTCTGCATGTGCTTCCCAGTTGGCACTTGATTTCACCATTTGCCTTCTTTCATCTAAAAAATTGACGTCTCAAGACCAATCCACTGAGGACCTTAATCGGCTGGAAGCGAGTTTGCGTTTGTGTTCAAAAGTCAATCCCACAAACACACAACAACTCAGTGACCTCCTGTTCCACTCCCAGACTTCTTCGGACCTTGACTCACGTTTGAAGCGGTTACAATCGACTGCGCTCCGCCCCTCAGACAATACAGATGAGCAAATCGGAAACACTTGTCCAGTGTTCTGTTCTCCTTTTAGCCAAACAACAATGCCTTCCGTCCGATCGCGGCGTAGCACATTATCTTACTCCGCCGAACTGGAGCGAGCCGGGATGGCCCCCATTGAAACCCCGATTGAACGCGTCACGGGTTCAACCGTGGTAGACGCTCGAATGTCTAGCGCTTCTAGATTTTGGAATCAGGATAATACACTTGTTAACATAAGAATGACCCCTTTCGGACACGAAAGAACCGACTACACATACGGAGATAGTGGAAGTTATCGGTCAGAGCGGGTTAAGACCAAATGGAACACACCGAATATGTCGCGCCTACCCGTTCATGGGAACCACGTTGCTGGACAACACATCGCCACTTTGGGTTCCCGTACTTTGAATGACTCAGATTTTGAAATGGATTCCGTTCTGACCGATGAAAGGTTGTCAGCGGTCATTCCGGGCCTAGGAGGCAATCGCGAGGAAGAGTTAGAAGATGATGAGCTTAGTAGTAGGGCTTCAGTTGCCTCATCTCGATCCAGCACCCGTATGTCGCGTGTCCGCTGCATACGCGTGCAAGGTGAATGGTGCGTTCATTCTGAGTGTATCGCTTCTACTCCTGGGAACCGACGTATGAACTTGGTTGCTCGTCAGCGCAATACAAACAATACTGCTGACGTCACTCACATCGTCGATGGGACTGATACAGAAACTCCCACTGGAAGATCTCGACATAAACACGAACAGCAGCAGTTGGTTTCTCGAAGATCCACTCGCGCCGGTGTGAGACCCTCGATTACGGCAACGAAAACCACTACATCTCAAAATCGCATTGAGTCGAATCCTCACACGGATCGTTCGAATCAGTTGGCTTCTGCTAGTTCCACGTATGTCTACACCTATGTAGCACCAGATGCTGACCATATGCGACCAGGAGAAGGCGGAGACAAAAGCTCGTTCGAGAGAGGAGACATTCCTGATTCGAATGGCAGAATGTGGGGTGCACAACCTCCACACGTTTCATCAAATGATCCCACTACTGAGCGATCATTCTTAGCCAATAGGTTTGTTT
GCTCCAGTGGAACGTCTTCCGCTGGAAACAAAGCCCAGAAATGGCTTGCTCGACACATTTTTGGCCTTGAGTCATCTGCCCCGGTGAGTACTTCGAACCATTTTGTACCCAGTGATACTGAAGAGTCAGATACAATCACAACTGGTCGCTCCGTTGCTCGTGGGAAATACGTACACAAACCAAGCGTCACACGAAGCCATCGACTGCACCATATAGATTCATCATCAACAACCTGGTTCTTCCGACCGTTGATGCAAGGAGCAGAGAAGCTGAAAGGAGTGATTTTCTCGAGTATAGCTTTTGTATTGGCTGGCATCTTCATCGCCTACGATGCTTTCAGTTCTTGCGTCCGTAATTTGTCATCCGCCGTTTGGACCTTTTGGTTCCGTTATTCCAGTCCTTTGCCCCACCGTTCTCGTGATAAACTGACCGTTCATCCACGGCTAACTCAATTCGACAACCACGTCACTCTTCAAATCTCATCGGTCGAGGAATCTGACTTCTTCTCTCGATCGTTCCGGGCAAGCTACGTCTGGTTTACCAGAGCTGGGACGATCTGTGTTCGTCTGGTGGGCTGTCTTTGTTTCCTAATCCCGCTCCTCTTACTTTTGGCTTTCTTATTCGCACCAGTTGCTGTCAATGACGACGAACCACCTCCAGTGTGGCCTTCTTTTCTTTCGGATACCGACTGTAAAAAGGCCCTACTCGAATCTCGCCCCAGCGATGCAACAGCTTGGCAGCTCGCCCTTTGGAGATTCCGCTGTCTGTACAATCTATACTTCCTAACTCCCGACTTTCCGTCAAATGCTACCACTTCGGAAAGCTCTTCATTGTGGCAGAAGTTTAAAAGTTGGTTGTGGCCTTCTACATCCGTTGTACCCTCCCCGGTCATCGTACCAACTGATCTACCGTCATACGTCGACAGTAAGTTGCTCGCTCAGCTGGAAGCATTCCGGGATTTTGTGAACGATCGATTGGATGGTTTGTCAAACACTATACGTCATACGGAAGAACGTGTGTCCGAGATGGAACAACGATCTGAGACACAGTTCAATGACCTCAGTATACATATTAACAATTTGAAACAACACTTTAACGAGCACACCACTGCATTGGATTCCTGGCATGTCCAGCTACAAGCACTGCAGGCTCTTGCAGGCCGCTTGGACAGTTCGGAGCCATCAAAGGTGACTCTAAACGAATACGATCGACTCTTCAATGCGGTTATCAGTGCCGCAAATCAAACCGTTTCCAAGGAGTTGAATTTACTTCGGATCGAACTGGATGAGAAGTCAAGTTCAATGTGGAACCGACACAACTCCAGTTTCACACAACTGTCCCTGTTAATTTCTCGTCTGCGTGAAGAACTGAACGACCGCTTGCTTCAAACGGAACACAGGCTTGGTGAACTACGTTCACAACTAAACTCGGGAATTCATGCACAAGTAGTCAACCATACGTCGCTCGTTATCCAAATGGACGAAATCCGCCTAACATTAGGCAATCTATCGGAGCGTGTGGCACAAGTCCGGAGCGCTAATGAGGGGCTGGATGGACTGTTCAAGAAACTACAAGAAGCCACACGAGACTGTAGTGAACGACAATTGCATCAAGTAGAAGACTGTAAGCAAGCGGCCATCGAACGAGCGGAAATTGCCGTGAATGCTTTTTCCGAACGTTTCACCGATCAAATTTCCGTTCTTGTCAAGGAGGCTTTGCTGCATTGGCTGAATGATGTGTCGGTTGAGGAAGCCCTGGATTTGAAACTATCAGAACTGGTTAAACAGTCCACACGAGAAGCCGTAGATCGAGCCATCCGTGAATCCGCGATCTCAGGGTACGCTCCGAGCGTGGACACCAGCGCAGAACAAACCGACGAATTAAAATCCCGAGTATTCATTCAGAAGCTTATTGACGCTGCCCTAGAGCGTTTTGCCGCCGATCGAGTGGGGATGGCCGACTTCGCTTTGGAATCCGCTGGTGGGTCTATCGTAGGCACA
CGCTGTACGCGGACTTACACAGAACGGGCAGCACTCTTCACCATATTCGGCATACCTTTGGCTCGTTTAAGCAACTCAGCAAGAACCATTTTGCAACCAAGCAACAATCCCGGTGATTGTTGGGCATTCCATGGAAGTACGGGACAGGCGGTAATTCGCCTCTCAGCACCTATTGTCATAACGTCCGTCACCCTGGAGCACCTACCTCGTGTTCTTTCACCAAACCAAAGGGTGGATTCGGCGCCGAAGGATTTTGTCATCAAGGGTCTATCATCGGAAACTGATGAAGGGGTCGTAATTGGAACATTTGTCTACGATATCAATGGTCCTGCCATACAAACATTTCCGATAGAAGGTCAGTCATCTACGTGGCATTTAATCGAGTTGGGAATCCTCAGCAATCACGGACATCCACTATACACATGCGTGTATCGCTTGCGTGTACATGGAAGAATACCAGACTCCTAGGCAACTTGACGACTGACTGACTGTGAATTGCCAGCATGTTTCTGTCTGCCCACATGTACATATCGACCCCGGCTGTATTTTCAGACTCGTTAACACGTCTGTTGTCCCCGGTGTTTTATAGTATTCCAACTTCCCATACAAAGTGTATACTCTCTGAAACACCTCTAACCGATGAATGTGATTTTCCTCTACTGCAGGCGACCGGTAGGCAGCCTAATCTCCTAATACCCGCTCATGTCTTAATGATTCATGTGTAACTTTGAATATCTTTTCTGCCGCCGCCGTCGCTGATCCACCACTCATTCACCTCGCTTATCTAATTACAAACGTTCTTC\n>XM_021551582.2 PREDICTED: Lonchura striata domestica carbohydrate sulfotransferase 9 (CHST9), transcript variant X2, mRNA \nATGTAGTGCTTCTTGAGGTTGGTGTCTCTGGGGAAGACACCGAAGAAGATGCAGGCATGCTGAAGACTTCAGAGAAGTGAGCAATGAGTCCTTCTGAAAGCTGAAGAAAAGCCCCCTTGTAGGGTCATGAACCTAAGACAAGTCTTCGTGTCTGTACTGCTGTTTGGAGTAGCTGGTCTACTCCTCTTCATGTATCTGCAAGCTTGGATTGAAGAACAGCATACAGAGTCTGGAAAAAAGCTGCAACAAGAGACAATTAATCAGGATTTCACACTCCAGCCTCTGGGGATGCCAAGGAAAGCAGCATGGAGAAGAATTGTTCCTGTGGGCCTCAGTAACCCTGAGATGGCTGTCTCAAGCAGCAGGCACTGGCAGGGCAGGGCTGACCCTTTTGGTGTGGTGGCTGCCTCCTCGAGGAGCTGGCTGCCTGAGCAGAAGATGAGTGAGTCCCCTCTCAGCTGGTTCAGAGGGGCGTATTTACCTCCTGCTCTGCACCCATTAAACAAGACATTTGTCAAGGGTGGTGAGTGGCAGGACATAGACAGCACCCAGGAAAAGCGCAGGGCCTTCCTGCAGGGCATCTGTAGGAAACACAATAGCAGAAGGAAGCTGCAAACCCATCTGGTGCACCTGGTGTCAAGAATTTACGTAGAGGACAGGCACAAGGTTTTGTACTGTGAAGTGCCAAAAGCAGGCTGCTCCAACTGGAAAAGGGTCCTCATGGTGCTCAGTGGACTCGCTGCTTCAGCAAACAACATCTCCCATGATGATGTGCACTATGGAAAGCATCTAAGGAAATTGGACAGTTATGACCTAAAAGGGATCTACACACGCTTGAACATGTACACCAAGTTTATATTTGTACGTGATCCTATGGAAAGATTGGTATCTGCCTTCAGGGATAAGTTTGAACATCCAAACAGCTATTACCATCCCGTATTTGGGAAGGCAATAATAAAAAAGTATAGACATAATGCAGATGAAGAAGCACTGAAAACAGGATCGGGAGTTAAGTTCAAGGAGTTTATCCAGTATTTGTTGGATTCCCACCGACCAGTAGGAATGGACAT
TCACTGGGAGCAAGTCAGTAAGCTCTGCTATCCCTGCCTCATCAACTATGATTTTATAGGAAAATTTGAAACCCTGGAAGAAGATGCCAATTACTTTCTGCAGCTGGTAGGTGCTCCAGCCAATCTGAAGTTCCCTAAATTCAAAGACAGACATTCCTCTGATGAGCGAACAAGTACAGAAGTAGTGAGGCAATATTTAAAGGAATTGTCTAAGGAGGAGAGACAGCTGACCTATGACTTCTATTACTTGGATTACTTAATGTTCAATTATACATCACCACTTGTATAGCACTAGAATAGCTTCAGGCTTCTACTAGATACTTATCATGTTGGGATTCAAAACAACTACTTTGATATTAGCCCTGAAAGGAAACAAAGTTACTGCTAAGTAGAGTTGTCTTGAATTAGTGGGGATTTTATAAGCTAGAGTGGTATCAATTGATACTAAATTATGGAGAATGCAAAGAAAAAAGACCTGCAAACAGCATAGATTGCACTAAAATGCCTGGAAAAGCTGTTTTTACCATTATGGATTATATTATGGAAGCAGTAGCTCAGACAGCTGTTGCATTAGCTTACCTAATGTTCTTTTAATGGTTTAAGAAAAAAAAATTGGAGTGGCATGATTCTTTTTTGGTATGTTTTCTTTAGAAATGGATTTTGAAAAAATTTTGAATGTATTTTTACTTTCTGTCACTTATTAATAAATGATCATAGGCTAA\n>XM_027345943.1 PREDICTED: Dermatophagoides pteronyssinus SOSS complex subunit B1-like (LOC113795734), mRNA \nTTGAATTATTTATTTACTTATATTTTTTTATTTAATTTTTTTTTGTAATTAAAATATATTTTTTTCCTATAAAAAATATTATGGGCTATTCGATTAATCAGATAAATATGACCGATAAAATTGATTCAATAAAAGATATTAAAGCACCATCGAACAAATTAAATGTTATTGCAATTGCAGTTGAAATTGTTTCACGTTTAATAACCAAAGATAATCATGAAATACGTGTAATGAGATTTGCCGATCGTACTGGTTGTATAAATATGTGTCTTTATGATGAATTAGGCGCAACGGTTCAACCAGGTGATATATGTCATATAACACGTTGCTATGCAACATTTCATAAAGGTGCATTAACATTATATATGGGTCGTCATGGTAAATTGACAAAAATTGGTGAATTTTGTATGACGTTTACTGAAACACCAAATATGAGTGATGGTGATCCATCTACATTATCATCACCATCAACTTCATCAACATCAACGTCGTCGTCGTCGTCGTCGTCATCAACGTCATCAGGTCCACCAACAAATTCATAAATATTTTTCATTTTTTTTTCTTTTCAAAAATTGTG\n>EU801997.1 Uncultured bacterium clone 3C003382 16S ribosomal RNA gene, partial sequence 
\nAGGGTTTGATCATGGCTCAGATTGAACGCTGGCGGAATGCTTTACACATGCAAGTCGAACGGCAGCACGGACTTCGGTCTGGTGGCGAGTGGCGAACGGGTGAGTAATATATCGGAACGTGCCCAGTCGTGGGGGATAACGTAGTGAAAATTACGCTAATACCGCATACGATCTAAGGATGAAAGCGGGGGATCGCAAGACCTCGCGCGATTGGAGCGGCCGATATCAGATTAGGTAGTTGGTGAGGTAAAGGCTCACCAAGCCAACGATCTGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGACGCAAGTCTGATCCAGCCATTCCGCGTGCAGGACGAAGGCCTTCGGGTTGTAAACTGCTTTTGTACAGAACGAAAAGGTCTCTATTAATACTAGGGGCTCATGACGGTACTGTAAGAATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTATATAAGACAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTTGTGACTGTATAGCTGGAGTGCGGCAGAGGGGGATGGAATTCCGCGTGTAGCAGTGAAATGCGTAGATATGCGGAGGAACACCGATGGCGAAGGCAATCCCCTGGGCCTGCACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCAACTGGTTGTTGGGTCTTCACTGACTCAGTAACGAAGCTAACGCGTGAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGATGATGTGGTTTAATTCGATGCAACGCGAAAAACCTTACCCACCTTTGACATGTACGGAATTCGCCAGAGATGGCTTAGTGCTCGAAAGAGAACCGTAACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGCCATTAATTGCCATCATTTAGTTGGGCACTTTAATGGGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGGCCAGGGCTTCACACGTAATACAATGGTCGGTACAGAGGGTTGCCAAGCCGCGAGGTGGAGCCAATCCCAGAAAGCCGATCGTAGTCCGGATTGTAGTCTGCAACTCGACTACATGAAGTCGGAATCGCTAGTAATCGCGGATCAGCATGTCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTTTACCAGAAGTAGGTAGTCTAACCTTCGGGAGGACGCTTACCACGGTAGTATTCATGACTGGGGTGAAGTCATAACAAGGTAACCGTA\n>XM_007934102.1 Pseudocercospora fijiensis CIRAD86 uncharacterized protein (MYCFIDRAFT_212712), mRNA 
\nCTTTCATGTTGTATGCTGGAGTCTGCATGTCCGCGGACACTTGCGCACGAGAGCATCAGCGCCCAGCGAGCTTGCGGAATGCGGAGCTGTCATGGTCGTACATCTGCCGAGTGTCCGTAACTGATATCGGTAGCCTCCTCAATTCTGGAAGCCTCTCAGATCCCAGCGTCCTTGTTCGCGCTGACGTTCTCTATGTCGCTTCTTTCCGCGGTGTTTCGCTTCAAATTCTCTCCCACAATCTCTTATGCAGTCTCTTCCACGCCCTCTTGCACGCCCACATCACCAGCAATGATTTCCTTCGGGTTGGCGGCTCGAGAGCTTATTGCAGCCTTGGTGAGAGGTGTAGGTCCCACGTCGTGACTTGTCCCGACGACAGGTCTCGCAGTGCATGCATCTTCGTCTTCTGGGGGTGTGAGATCGCTATCTCAACTGCCCTCGAGCTACGACTTCCATATCCCGCCTTCCTACTCCACCTTCTCCAAAGCCGGCCACATGTCGCAGACGTAGCGCTTCATGCACTGGACGGCTCTCTTGGCGGCGATTCCGAGGATAGCGACTTCACAGATGGTGCAAATTTGAACGACGTGACGGAGGAGAAGCTCTGAACCGGATCCACTGTGGTGAGAAGGTTGATTCCACAGCTCATCTCTGCATCCCTGTGGCCTTCCATCCCAGATGCGATTGAGTGAGGATCGGGTCATTTGCTGTGAGTTGAACTTGTCTTGGATGAAGCATACGATAAGTGTGATGTTGTAATAATCTCAACAGTCATGAACAATGACGG\n>XM_026366555.1 PREDICTED: Anabas testudineus cytochrome c oxidase subunit 5A, mitochondrial-like (LOC113166428), mRNA \nTCGAGTACGTGACCGGCTAAGTTAGCATTAGCTTCCTCCTGCCAGACCTCACCGGTTCGAGGAGCTAGCTGCCGCTCATCATGTTCAGAGCCGCCGTCCGACTTTCTGTCTCCGGTGTCCGGGGTTTAACCCGTACGCAACCACGGTGCCAAGCTGTTTTGGCCTCAAGATGGTACTCACATGGGAAACAAGAGACGGATGAGGAGTTTGATGCCCGTTGGGTCACTTATTTCAACAAGCCAGACATTGATGCATGGGAGCTGAGAAAAGGGATGAACACGTTGATTGGTTACGATCTGGTACCTGAGCCAAAGATTCTTGAGGCAGCACTGAGAGCCTGTCGAAGGTTAAACGACTTGGCCAGCGCTATCCGAATTTTGGAAGCTGTAAAGGAGAAAGCCGGTCCTCATAAAGACATCTACCCGTACGTGATCCAGGAGCTACGGCCAACATTAGATGAACTTGGCATCTCCACACCTGAAGATCTTGGCATTGACAAAGTGTAAATAAGTATCTGATAGTGAATAACCCCAGGACGCAGAATCATTGTACTTACATGTTTGCCTCACCTGATATGTGTGATATTTAATTTGCCCTTTATTAAGTTCTTTTGTTGTAAAATATTGATGAACCTAATAAAGGAAAACGAATCTTTATTGAGTGTCACATATTTTGAGAGATTTTAAACAGCCTGGTTACATATTGAAGCAATATTTTTGAAGTTGCTTTAACAGCAGAGCAGAGCGTCACTTGATGGTGCAAGTTGTCTCATTCTTCTGAGAGTCGCGTTTTGCCACCAGGGAGCAGCGTTTTCACATGAATGTAAAAATCATTCTTCTGTATTCAATCTATATTTCATCTGTTCAGGGAAGATATACATGCTGGTGAAATAAACTTGTTCAAATGTCAAA\n>XM_008046871.1 Trametes versicolor FP-101664 SS1 uncharacterized protein (TRAVEDRAFT_136475), partial mRNA 
\nATGAACGAGCTGCAGACTCTCACAACTTTGCAGCCTTCAGCGGTCGTCTCAACTCGCGTCTCGCACTCCCTCGACAGATGTTCCACGCGGTCCTCCATTCTTTCCCATCCGAAGCTGTCACACAAAGTCAAGGGCATCTGCAAGGTCGCGCGTAAGGCCGGCTTCCGCCTCGTCTGGAACGACGCATGCTGCATCGACAAGTCGAGCAGTGCCGAACTCTCTGAGGCGATCAACTCGATGTACGACTGGTTCCGACTCTCGGACATGTGCTACGTCTACCTCCAAGATGTTGCGGACGGCGATAGACCCCAGGAAGCCCAGTCCGATTTCCGGAAGAGCCGATGGCACACCCGCGGTTGGACGCTGCAGGAGCTCATCGCGCCCGAGTGCGTCGAGTTTCTAACGCAGACTTGGCAATTTCTGGGCACGAAGCTGGGGCTTGCCTCGACTTTGGAGGAGATAACCGGAGTCGACGTCAATATTCTCACAGGCCGAGCCACCTTGAACTCTGCTAGCGTTGCGCGGAGGATGTCATGGGCGGCGAAGCGAGAGACGACGCGCATCGAGGACCAGGCGTACTCGCTCATGGGTATTTTCGGCGTCCACATGCCGCCTATATACGGCGAGGGCAACAACGCCTTCCTGCGTCTCCAGGAGGAGATAATCCGGACTATCCCCGATCAGACCATATTTGCCTGG\n>FJ010171.1 Homo sapiens TCF7L2 isoform pFC8A_TCF7L2_B4_ex1-no4-11-14 mRNA, complete cds, alternatively spliced \nTTTTCTTCCAAAATTGCTGCTGGTGGGTGAAAAAAAAATGCCGCAGCTGAACGGCGGTGGAGGGGATGACCTAGGCGCCAACGACGAACTGATTTCCTTCAAAGACGAGGGCGAACAGGAGGAGAAGAGCTCCGAAAACTCCTCGGCAGAGAGGGATTTAGCTGATGTCAAATCGTCTCTAGTCAATGAATCAGAAACGAATCAAAACAGCTCCTCCGATTCCGAGGCGGAAAGACGGCCTCCGCCTCGCTCCGAAAGTTTCCGAGACAAATCCCGGGAAAGTTTGGAAGAAGCGGCCAAGAGGCAAGATGGAGGGCTCTTTAAGGGGCCACCGTATCCCGGCTACCCCTTCATCATGATCCCCGACCTGACGAGCCCCTACCTCCCCAACGGATCGCTCTCGCCCACCGCCCGAACCTCTAACAAAGTGCCAGTGGTGCAGCACCCTCACCATGTCCACCCCCTCACGCCTCTTATCACGTACAGCAATGAACACTTCACGCCGGGAAACCCACCTCCACACTTACCAGCCGACGTAGACCCCAAAACAGGAATCCCACGGCCTCCGCACCCTCCAGATATATCCCCGTATTACCCACTATCGCCTGGCACCGTAGGACAAATCCCCCATCCGCTAGGATGGTTAGTACCACAGCAAGGTCAACCAGTGTACCCAATCACGACAGGAGGATTCAGACACCCCTACCCCACAGCTCTGACCGTCAATGCTTCCATGTCCAGGTTCCCTCCCCATATGGTCCCACCACATCATACGCTACACACGACGGGCATTCCGCATCCGGCCATAGTCACACCAACAGTCAAACAGGAATCGTCCCAGAGTGATGTCGGCTCACTCCATAGTTCAAAGCATCAGGACTCCAAAAAGGAAGAAGAAAAGAAGAAGCCCCACATAAAGAAACCTCTTAATGCATTCATGTTGTATATGAAGGAAATGAGAGCAAAGGTCGTAGCTGAGTGCACGTTGAAAGAAAGCGCGGCCATCAACCAGATCCTTGGGCGGAGGTGGCATGCACTGTCCAGAGAAGAGCAAGCGAAATACTACGAGCTGGCCCGGAAGGAGCGACAGCTTCATATGCAACTGTACCCCGGCTGGTCCGCGCGGGATAACTATGGAAAGAAGAAGAAGAGGAAAAGGGACAAGCGGCCGGGAGAGACCAAT
GGAGAAAAAAAAAGTGCGTTCGCTACATACAAGGTGAAGGCAGCTGCCTCAGCCCACCCTCTTCAGATGGAAGCTTACTAGATTCGCCTCCCCCCTCCCCGAACCTGCTAGGCTCCCCTCCCCGAGACGCCAAGTCACAGACTGAGCAGACCCAGCCTCTGTCGCTGTCCCTGAAGCCCGACCCCCTGGCCCACCTGTCCATGATGCCTCCGCCACCCGCCCTCCTGCTCGCTGAGGCCACCCACAAGGCCTCCGCC\n>KX179358.1 Uncultured bacterium clone MA_1774 16S ribosomal RNA gene, partial sequence \nACGGGGGGCGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCGGGCAGGCGGTCCGCTAAGTCTTTTGTGAAACTCCAGAGCTCAACTCTGGACATGCATAAGATACTGGCGGACTAGAGACCGGTAGAGGCTAGTGGAATTCCTGGTGTAGCGGTGGAATGTGTAGATATCAGGAAGAACACCAGTGGCGAAGGCGACTAGCTGGGCCGGGTCTGACGCTCATCCGCGAAAGCGTGGGGAGCAAACAGG\n>XM_004415061.2 PREDICTED: Odobenus rosmarus divergens fidgetin-like 1 (FIGNL1), mRNA \nAGCATGCAGGCCTCCAGCTCCAGGTCTGTGCACCTGAGTGAATGGCAGAAGAATTACTTTGCAATTACATCTGGCACATGTACCCCAGGACAGAAGGCAGATGCGTACCGAGCACAGATATTACGCATTCAGTATGCATGGGCAAATGCTGAGCTCTCCCAAGTCTGCGCCACCAAACTGTTCAGAAAATATGCAGAGAAATACTCTGCAGTTATTGATTCTGACAGTGTCGAGACTGGCTTGAATAACTACGCAGAATGCATTTCAACTTTAGCAAGATCTCAGCAGACTGACAGTGACAAGTGGCAGTCTGGATTGTCAATAAATAATGTTTTCAAAATGAGTAATGTACAGGAGATGATGCAAGCTGGCAAAAAATCCAGAGACTCTCTGTTGGCACCTGCCAGTGCATCGGTAGTAATCCATAAAGAGGCGCTTGTCCTCGATCCTCCTAAACTTAGTGTTTGTGGGGGTTCTGGGGAGAGTGGCCCATTAACTAACGCAGCTCCTGATACAAACAGGACCCAAGATATCCCAGAGAGCAGTCCTTCGAAGTGTCCTCAGGATGCTCAGCCACCTGTGCCGACTAACACCAGAAAGACCTGTCCTTCATCCTTAACACCGTTTGGTGACTTTGCCACTGCAAAAATCCATGCCACACCATTATTTGGAAATGCCAAGAAGGAAAATAACAGCTCTCCAAAGGCCAACGTAGGACTAAATATGTTCTCATCTAATCAGTCTTGTTTGCCTTCTGGCTTTGAAAATCCACGGGAGAGAAAAACTTTTTATGGTTCTGGCACCACTGATGCCCTTTCTGCCCCAGGAGTGAATAAGGCTTTTAGTAAAACAGAGGATAATGGCCAAAGGGAAGAGAGTAGCCTGCCTACTTTTAAAACTGCAAAAGAACAGTTATGGATAGATCAGCAAAAAAAGTACCACCAACCCCAGCGTGCATCCGGGTCTTCGTACGGTGGTGTAAAGAAGTCTCTGGGAGCTAGTAGGTCCCGAGGAATATTTGGGAAGTTCATTCCTCCTATACCTAAGCCAGATGGGGGAGATCAGAATGGGGGAATGCAGTATAAGGCTTACGGCGCAGGACCTGCAGAGCCAACACATCCAATTGATGAGCGGCTGAAGAACTTGGAGCCAAAGATGATTGAACTTATCATGAATGAGATTATGGATCATGGACCGCCCATAAGCTGGGATGATATTGCAGGAGTAGAATTTGCCAAAGCCACAATAAAGGAGATAGTCGTGTGGCCCATGATGAGGCCAGACATCTTTACGGGTTTACGAGGACCCC
CTAAAGGAATTCTGCTCTTCGGGCCCCCCGGGACTGGTAAAACTCTAATTGGCAAGTGCATTGCTAGTCAGTCTGGGGCAACGTTCTTCAGTATCTCTGCTTCCTCTTTGACGTCTAAGTGGGTAGGTGAGGGGGAGAAAATGGTCCGTGCATTGTTTGCCGTGGCAAGGTGTCAGCAGCCGGCTGTGATATTCATTGATGAAATTGATTCCCTGTTATCTCAACGAGGAGATGGTGAGCATGAATCTTCTAGAAGGATAAAAACGGAATTTCTAGTGCAGTTAGATGGAGCAACCACATCTTCTGAAGATCGGATTCTAGTGGTGGGAGCAACCAATCGGCCCCAAGAAATTGATGAGGCTGCCCGGAGAAGGTTGGTCAAAAGGCTTTATATTCCACTCCCAGAAGCTGCGGCTAGGAAACAGATCGTGATTAATCTGATGTCCAAGGAGCAGTGCTGCCTCAGTGAGGAGGAAATTGCCCTGGTTGTAAGGCAGACCGATGGGTTCTCGGGAGCTGACATGACACAGCTTTGCAGAGAGGCGTCTCTCGGGCCTATTCGCAGTTTACAAACTGTTGACATCGCCACAGTAACACCCGATCAAGTTCGGCCAATAGCTTATATTGATTTTGAGAACGCCTTCAGAACCGTGCGACCTAGCGTGTCTCCTAAAGATTTAGAGGTCTATGAGAACTGGAACAGAACTTTTGGTTGTGGGAAGTGAAGGGGACACACGGGACACTTGAAATCTAAAGATGGCATCTTTGTAATGCAGCCTTCCCCACTTTTTAGCATGGGAAACTGGGAATTTATTAATTGTACTTTATAGTGTATATTTTGAATTCTATACCTCAAATAAAATAGTAACAGCTTAAAT\n>XM_018530727.1 Alternaria alternata hypothetical protein mRNA \nCCATCATGCAGTCTCAGCAAACTCCTCGGTATGTAAGCTAGAAGAGATGGCCTGTTGTTTAGGCACTTGCTGGACAGACCGATGGCTAGACCTCTATGCGATAGATGTAGAACAACACAAACAACAACTTGGACTAAACTTGCACGACGGTAGTCGGCAGTACGCCTTAAAATCAGAGAAATGTCTCGACACGTTTGGCCTTCCAATACGCTATCTACGTAGCACTTCACTCACCCTGATCATCTTAGCACATGAATACAGGCATATATGTCAGATACACGCAAAGTACAATAACTTGGCTTCACAGCGATCTTGGTGGAATCAATCACGTCTTCACGCAGAACTAGTGCTTGGAGAGTCAATTCAATACGAGTCGGAAACTCCCGAGGTCATCTTTACCGGCCGATGTGGTCTTACTGGAGAGAAGTTCGGAATTTTTCTAGTCAATATGATTATTATATTTCTCTTGCACAAGCACATACGACCACAGGATCTTGAGACCACGGCTTCCCGTTCGCTCAGCCCTAGTTAAGCAAGATACCGGCGGATTAGTAGTCAGGTGGGTGACCACTGGCGAATCCCCGCTGTTGTATGTTTTTTTGTTTCTTTCGAAAGAAGATCATTAGGCCGAAAATAGGCGTACTTGTTATTTTTTTGTCTTCCCGCAGATGCTGTTTCGCATGGTCGAACTTCTTTGACGTCGAGATAGGTAGTAAAGAGTAGGCAATAATTGTGGTTTCATCGTG\n>DQ227595.1 Uncultured bacterium clone ZFos29a01 16S ribosomal RNA gene, partial sequence 
\nGAGTTTGATCCTGGCTCAGGATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGATGACTTCTGTGCTTGCACAGAATGATTAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTCGGGATAAGCCTGGGAAACCGGGTCTAATACCGGATACGACCTCCTGGCGCATGCCATGGGGGTGGAAAGCTTTATTGCGGTTTTGGATGGACTCGCGGCCTATCAGCTTGTTGGTTGGGGTAATGGCCCACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACACTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCGACGCCGCGTGAGGGATGACGGNCTTCGGGTTGTAACCCTCTTCAGCANGNAAGAAGCGAAAGTGACGGTACCTGCAGAAGAAGCGCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAAGGGCGCAGCGTTATCCGGAATTATTGGCCGTAAAGAGCTCGTAGGCGGTTTGTCCCGTTCTGCTGTAAAACCCGGGGGCTCACCCCCGGGTTCTGANTGGGTT\n>XM_001452590.1 Paramecium tetraurelia uncharacterized protein (GSPATT00002630001), partial mRNA \nATGAAAGTGCGTAAGTAAGCACCCCAATTTACAGCATCAGCCTACTTTAATAAATAGTTTAAGAGAATATCTCTAAGTGATTATAAAAATAGATATGTTGTTCTATTCTTCTATCCATTGGATTTTACATTTGTATGTCCAACAGAAATAATCCAGTTTTCTGATCGAGTTGAGGAATTCAAAGCAAATGGTTGTGATATTTTGGGTGTCTCTGTAGACTCCTAATTTTCTCATATGAAATATTGTAAATAAACACGTAATAATGGAGGATTGGGTGAGATGCAATTTCCTCTGATTTCAGATTTAAGTTAGGAAATCTCTAAAAAATATGGAGTCATTATAGATGATTCTGAAGATCCAGATTTTGGTGTTGCTTTCAGAGGGACATTCATAATCGACGGAAAAGGAATCCTCAGACATTATTCCATTAATGATTTACCTGTGGGTAGAAATGTAGACGAAGTCTTAAGATTAGTGTAAGCATTTAAATTTACAGATGAACATGGAGAAGTTTGTCCTGCACAATGGAAACCAGGATAGCCAACTTTGGTTACGAATCATTCTGACCCAAAGACTTAGAAATATTGGAATGAAGAACATATAAAATAAGCTAAATGA\n>XM_007882153.1 Pseudozyma flocculosa PF-1 uncharacterized protein (PFL1_04627), partial mRNA 
\nATGGGCTTCTTCGACGTCGGCTCCATGCGGAGCAAAAAGTCCAACGCGGAGCTTACACAGGAAGCACGCATGCAGAGGCGCAAGAACGACGAGATCCTCGCAGCCAACCTCGGCCTCGACTACTCGCATGGCGGCAGCAGCAATCGCAGCAACGGCAAGTCGAGTCGTGACCGGCTCCACGACGACTTTGCAACGGGGCACGGCGCCGCCGCATCGACTGCGGCCAGGGACGCGACAAGACGGAGCAAGCTGGAGAGGATGATGGGTGCCGACGTGCCACTGCCCGACTCGCTCTCGGCGCCCAATGCTGACCATCGGCGAGGGCAGCATCAGGCCGACGCGGCATCCCAGATCTACGGCTCAAACGGAGGCTCGGCGCTCCACCTGCCCATGTCCAAGGGATCCTTTGACGCCATGAGCCAGCATTCGTCACACTCCTCCGGCCGCGAGCGTCAGTCGAGCGGAAGATCGTTTGATCCGCTCCCCGGCGCTTCAACGACCTTCACCGAGATGGCCGAGGTTGACTGCCCTGTCTGTCTGGAGCCGCTTTCGTACCGGCTCGCCGGCGAAAAGCCTCACGTTGTGCCCAATTGCGGCCACGCGCTGCACAACGCTTGCTTCACCGCCGTCTACGGCCCGCCGGAAGCCATCATTGCGCAGCAGAATGCGGCCTTGGGGGCAGGCAACGGTCGCACAAAGGGCGCCGGTCTGGTCCAGCGGACCCCGGCCGCAAACCCGCCAGGCATGTGCGGTGTATGCCGTCGAGCCATCGTGCTCGGCGGTGACGAGGCCACCGCCAAGTCTCAGAAGCTGGCGGGGCTGGGTCCGCACGGGTCGCAGGCCGATCGGATGACTCTGAGCTCGGACTCGGCCTCGGTTCGAGCCCTCTCTGAAGCCCACGAGGACGACCCTCTCGAGAGCCAGGCAAAAGGCCGGTCTGCCAACATCTCGGGACCCATCACGACCCCGACGATCCGGGCTAGGCCAGAGTACTCGACCATCTACAAGAAGGCCGATCGCAAGGACAACAGCAAGGTCAATGTGGTCTGCGTGCTCTCGGTCGAGGTGCCATCGAGAAGGCCGAGCTCTGACGATGCGGTCGAGTCCGGCCTTGACACGATCGAGGATCGCGGCTACGCTGAGGAAGAGTTTGACGAGGAGGACGAGCGCGACTACGAGGGCGAGGACTCGTACTCGGACGACCTCAAGCGCAGCGGCTCCGAGTACGTCCCCAACGACCGCAGGTCGAGCGGTCAGCGCAGCCCGCTGCCGACGTCGTACGCCAACGGCGCCGACGGAAAGCAGGCCGCCAGCCCGGAGCGCTGCATCTCTCCCGAAAGTCAGGCCGGGTTCTCGTACAGTGCGACGCCGGCAGCGCAGCAGCGGCTCAACGATCCCAACCTCGCTGTGGTCGAGGACCTCCGCAGTCGCGTGGCCGATTGGAAGGGTCACTCGCTCGAGCATTTCGGCGAGCTCGTGCTGCACGACCTTCTCAACGTCCGCCAGGACAGTGTCGTACGCGAGTTCCACGTCTACCTGTTCGAGGGCGCGCTGCTCTGCGTCACCGAGGAGAAGCGAAAGGGTCTCAGCCGGTTCATTCCTGCGGCACCTCCGGCCGCTCCGGGTGCCACCCCCGACGTTCCTGCCATGCCCAAACCCGCGCTCAAGCTCAAGGGCCGCATCTACCTCAAGCACATCCGCCGCGTCATCGACTCGTCGGTCGCTGGCGAGCTCAGCATCAGCATCACGATGGACGAGAGCCTGGATCAGTTTGTCCTCTGCTTCCGCGATCGCGAGACTCTGTCGGTGTGGAAAGAGCGTCTCAGCCAGAAGGTCGCCGCACAGTCCAAGTCGGCGGCGGCGGCAACTACGGCCAAGGAGGCGGCCAAGCCCGAGGAACCGGCATCAGCCTTCGACGCCGCCTCGGCCGCTCACTCGGCCGCGAGCCATGGCATGCACCCCCTCGACGACCACCAGCGCCTCCGCGGCCTTCCCGCG
GCACCCAGCCACGGAGTTTCGATCTCGCGGGCGAATAGCGGCGCCGCATCAATCATCAGCGGCAAGACGGGCTCTCACCAAGGCGCCCTCTCTCCGGCCGACTACAGGAACATGCGACGCTTGTCGAACGTCTCGAGCGTCCAGAGCCACGGCAGCCACCGCAGCCGCACCTCGACAGCTTCGGACACGGTGCCTCGCCACCAGCAGTGGTCCGCCTCGGGCGGGCTCGACCCGAGGATCCCACCGCCTCCGATGCTGCCACACACGCCGCTCGACTTGGTGCTCATGTTCGCCGTGCCTCCGGTCCTGCCCAACAACGCACAGGGCTCGATCAACTCGTCGGCCGCGCTCAAGCTTCGCCTGGTCCGATCGACGCTTGACTTTGTTGTCAGCCACATGGGACCCAAGGACCGCGTCTCGCTCGTGGCCTACTCGGTCGGCTATGAGGGCGAGGTGAAGCGCACGGCGCTCCTCAACCCGAGGCGCTCGTCGAGCCGACAGATGCTGGGCGAGTTCATCCAGTGCATCGGCAGGCCTTGGGACGGCCACGCCGAGGACCCGTTCCGCGTCGACCTGGACCGGCTGGGCGGAACGAGCGAGCGGACCGATTCGGTGACGGCGGTCAATGTCGGGCTGGACATCGTGCTGCAGCGCAAGCAGAAGAACCCGATCACGGGCATGATTCTCGTCAACGACACGGCCGACGGACCCAAGCGGCACCAGATGGACCTGGTCATGGCGCGGGCCGAGGCGGCCAACGTGCCCATCCACTGCTTCGGCTACGGCAAGACGCACGACCCGTCTTCGCTGTGGCTGATCTCGAACCACACAAAGGGCTCGTACACGTTTGTGCGCGAGTGGTACCAGCTGCGCGAGTGCCTGGCCGGCTGCATTGGATCGATGATGTCGATCGCGCTGACCGACGTCAAGCTGCACGTCAGTGTGCCCCACGACAACCAGTTCCGCGTCCGCAAGATTGCCGGCATGCCCGGAGCCATCATCTCGTCGTCTGGCAAGGACGTCGACATCGACATGGGCGACATTCGCTTTGGCGACGCGCGCGAGCTGCTGGTGGAGCTCGAGCTCGATCTCGAGAGCCTGCTGCCGCGCCTCAACGCCAGCAGCAGCAGCAGCCGCAAGCTCTCTGCGCCTCCCATCGAGCAGGGCAGCGCTACCGACGACTTCATGCAGCGACTCGGCATCCAGGGGCTGAGCCTTGCCGACTCGGACGGCGCCGAGGGGTCATTTGAGCACCTGATCGACGAGGTCCCTGTCTTTGAGGCCGATGCCGGTTTCCGCGACCCGACCAACGGCACCAGCACGTCGAGGCTGGCCAACCCGACGATCCTGACGCTCGAGATCGACTGCCAGTCGCCGGACCCCGTGTCCTCCGGGCCGCCGGGCCTGGCCGCTGCGATGGCCGATCCAACCGTGACGCGGCGGCGGCTCGAGGTGTTGGTGTCGGAGATGATTACGCGCTCGCTGCTGCTCATCTCTCGCTCCAACTACGCCCAGGCGCAGAAGGTGTTCAACGAGACGCGGAGGATCATTGAGACGGTGGTGCGGGCAATCCCGCTGCCCGCCGGCGGCAGCGGCAGCGGCTCGCGGCGGCGGGCGCCGATGGGCAACTCGCGCTCCGCGGCCAAGCGGCAGCGCGACGCGCTCAACCGCAAGACGATCGACAGCCTGATGGCCATGATGAATGACCTCGACACGCTGCTGGAAGGGCTCGAGGCGCAGAACCGGACGACGTTCGAGCGCGACGGGCGCAACTTTGGCGCGCAGCAGGCCATGATCCTGCGCGATCAAAAGGCGTGGACGACGCGGACCGACACCGAGTATCAAAACTTCCGCGACGACAACGCCGCCGCTTTCGCTGCCTACGGTGCTTCGTACGCCAGCTCGCGGTGA\n>XM_033386580.1 PREDICTED: Drosophila miranda mucin-5AC (LOC108151008), transcript 
variant X9, mRNA \nAATGTTTGTCTTTAACTCATACGCGAATTCGTTACGCTCCCCAACTGTTAAAAGACCAACGATGTCTTCGAAGGCTTCTTCACGAGATTTATTAAGATTTATAATATCACTAGTAGTGCTCAGCCAAATCATACTCAAAAAAGCAGAGAGTGCCTCGGTTGAAAAAGTGCATTTAAAAAGTGCGCAAGTGAAAAACAATCTAATTGAATATGACTCACAGTTTGGCCGAGATACAAAATTTAATCATAAAAAAACAACTATAGCAAACGATATTACATCTGCACCTGAAGAGAGAACATCAGCCGCACATTCGACTTTTGCACCTGCGGAGAGCACCACAGCTGGGGGCAATACGACTTCTGCTCCGGAAGAAAACAACACATCTGAGGACGATACTACTCGTTCTACTTCTGAAAAAAGCACAAAAGCTAATGATTCGACATCTGCAGCACCCGATATAAGCACCACAGTTCAAGATTCGACATCTGAACCTGAAGAAAGCACTACAGCTAAGGACAACTCTACTTCTGCTCCTGAAAAAAGCACCACAGCTGAAGGGGATTCTCCTGCTGCTCCTGAAGAAAGCACCACAGCTGAAGAGGATTCTTCTTCTTCTCCTGAAGAAAGCACAACAGTTGAAGATTCGACCTCCGAACCTAAAGAAAGCACGACAACTGAAGGCGATTCTACTGCTGCTCCTGAAGAAAGCACCACAGCTGAAAATTCGACATCCAAACCTGTAGAAAGCACTACAGCTGAGGAGGATACTACTTCTACTTCTGAAAAAAGCACAACAGATAAAAATTCGACGTCTGAACCTGAAGAAAGCACCGCAGCTGGGGTCGATTCTACTTCAGCTCCTGAAGAAAGCACCACAGCTGAAGAGGATTCTTCTTCTGCTCCTGAAGAAAACACAACTGTTGAAGATTCGACCTCCGAACCTGAAGAAAGCACTACAGCTGAAGACGATTCTACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGATTCGACTTCCGCTGCACCTGAGATAAGCACCACAGCTGAAGATTCAACGTCAGAACCTGAAGAAAGCACTACAGCTGAAGGCGATTCTACTTCTGCCCCTGAAGAAAGCACCACAGCTGAAGATTCGACTTCCGCGGCAACTGAGATAGGCACCACAGCTGAAGATTCGACGTCTGAACCTGAAGAAAGCACTTCAGCTGAAGGCGATTCTACTTCTGCTCCTGAAGAAAGCACCACTGGTGAAGATTCGACGTCTAAACCTAATGAAAGTACCACAACTGAGGTCGAAACTACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGATTCGAAATCAGAGCCTGAAGAAAGCACCACAGCTGAAGAGGATTCTACTTCTGCTCCTGAAGTCACCACTACAGCTGATGACTATACTACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGTTTCGACATCTGAACCTGAAGAAAACTCCACGGCAGAGGACGATTCTACTTCTACTCCTGAAGAAAGCACCACAGCTGAGCACGATTCTTCTTCTGCTCCTGAAGAAAGCACGACAGCTGAAGATTCGACTTCCGCGGCACCTGATATAAGCACCACAGCTGAAGATTCGACGTCTGAACCTGAAGAAAGCACTACAGCTGAAGGAGATTCTACTTCTGATATTGAAGAAAGCACCACAGCTGAAGATTCGACTTCCGCGGCAACTGAGATAAGCACCACAGCTGAAGATTCGACGTCTGAACCTGAAGAAAGCACTTCAGCTGAAGGCGATTCTACTTCTGCTCCTGAAGAAAGCACCACAGATGAAGATTCGACATCTGAGCCTGAAGAAAGCACCACAGCTGAAGATTCGACATCAGAGCCTGAAGAAAGCACTACAACTAAAGGCGATTCTACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGACGATACTACTTCTGCTCCCGAAGAAAGCACCACA
GCTGAAGATTCAACATCAGAGCCTGAAGAAAGCACTACAACTGAAGGCGATTCTACTTCTGCTCCAGAAAAAAGCACCACAGCTGAAGATTCGACTTCCGCGGCAACTGAGATAAGCACCACAGCTGAAGATTCGACGTCTGAACCTGAGGAAAGCACTTCAGCTGAAGGCGATTCTACTCCTGCTTCTGAAGAAAGCACCACAGCTGAAGACGATACTACTTTTGCTCCTGAAAAAAGCACCACAGCTGAAGATTCAACATCAGAGCCTGAAGAAAGCACTACAACTGAAGGCGATTCTACCTCTGCACCTGATGAAAGCACCACAGCTGAAGAGGATTCTTCTTCTGCTTCTGAAGAAAGCACAACAGTTGAAGATTCGACCCCCGAACCTGAAGAAAGCACGACAACTGAAGGCGATTCTACTTCTGCTCCTGAAGAAAGCACCACAACTGAAGATTCGACGTCTGACCCTAATGAAAGTACCACCACTGAGGTCGAAACTACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGATTCGACATCTGAGCCTGAAGAAAGCACCACTGCTGAAGATTCGACATCAGATTCTGAAGAAAGCACCACAGCTGAAGATTCGACTTCCGCGGCAACTGAGATATGCACCACAGCTGAAGATTCGACGTCTGAACCTGAAGAAAGCACTTCAGCTGATGACGATACTACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGTTTCGACATCTGAACCTGAAGAAAACTCCACTGCAGAGGACGATTCTACTTCTACTCCTGAAGAAAGCACCACAGCTGAGGACGATTCTTCTTCTGCTCCTGAAGAAAGCACCACAGCTGAAAATTCGACATCAGAGCCTGAAGAAAGCACTACAACTGAAAGTGATTCTACCTCTACCCATGAAGAAAGCACCACAGCTGAAGATTCGACTTCCGCGGCAACTGAGATAAGCACCACAGCTGAAGATTCGACGTCTGAACCTGAAGACAGTTCTACAGCTGATGACGATACTACTTCTGCTCCTGGAGAAAGCACCACAGCTGAAGTTTCGACATCTGAACCTGAAGATAACTCCACGGCAGAGGACGATTCTACTTCTACTCCTGAAGAAAGCACCACAGCTGAGGACGATTCTTCTTCTGCTCCTGAAGAAAGCACCCCAGCTGAAGATGTGACTTCCGAGGCACCTGATATAAGCACCACAGCTAAAGATTCGACGTCTGAACCTGAAGAAAGCACTACAACTGAAGGAGATTCTACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGATTCGAGTTCCGCGGCAACTGAGATAGGCACCACAGCTGAAGATTCGACGTCTGAACCTGAAAAAAGCACTTCAGCTGAAGGCGATTCCACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGACGATACTACTTTTGCTCCTGAAGAAAGCACCACAGCTAAAGATTCGACATCTGAGCCTGAAGAAAGCACCACAGCTGAAGGTTCGACATCAGAGCCTGAAGAAAGCACTACAACTGAAGGTGATTCTACTTCTGCCCCTGAAGAAAGCACCACAGCTGACGATTCGACTTCCGCGGCAACTGAGATAAGCACCACAGCTCAAGATTCGACGTCTGAACCTGAAGAAAGCACTACAGCTGATGACGATACTACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGTTTCGACATCTGAACCTGAAGAAAACTCCACGGCAGAGGACGATTCTACTTCTACTCCTGAAGAAAGCACCACAGCTGAGGACGATTCTTCTTCTGCTCCTGAAGAAAGCACGACAGCTGAAGATTCGACTTCCGCGGCACCTGATATAGGCACCACAGCTGAAGATTCGACGTCTGAACCTGAAGAAAGCACTACAGCTGAAGGAGATTCTTCTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGATTCGACTTCCGCGGAAACTGAGATAAGCACCAC
AGCTGAAGATTCGACGTCTGAACCTGAAGAAAGCACTTCAGCTGAAGGCGATTCTACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGATTCGACATCTGAGCCTGAAGAAAGCACCACAGCTAAAGATTCGACATCAGAGCCTGAAGAAAGCACTACAACTGAAGGTGATTCTACTTCTGCCCCTGAAGAAAGCACCACAGCTGACGATTCGACTTCCGCGGCAACTGAGATAAGCACCACAGCTCAAGATTCGACGTCTGAACCTGAAGAAAGCACTACAGCTGATGACGATACGACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGTTTCGACATCTGAACCTGAAGAAAACTCCACGGCAGAGGACGATTCTACTTCTGCTCCTGAAGAAAGCACCACAGCTGAAGATTCGACATCTGAACCTGAAGAAAGCACCACAGCTGAAGATTCGACTTCCGCTGCACCTGAGATAAGCACTACGGCTAAAAATTCGACATCCGAACCTGACGAAAGCACTACATCTGAGGACGATTCTACATCTGCTCCTAAAGAAAGCACCACAGCTGAGGCCGATACAACATCTGATCCTGAAGACAGCACAGTTCAGGACGATACTACTTCTGCTTCTGAGGAAAGCACCACAGAAATCACCACAGCTGAGGATGGTGCTACTTCTGCTCCTATAGAGAGCACTACTGCTAAAGTAGATTCTACCACTGGATCGACGTCTAGCCCGGCGACATCACCTTCTCCTATACCGCCTATGTCATGTGCAAGTGGCGCTCCATACTTACCGCATCCATCGGATTGCCATAAATTTATTCAGTGCAGCAACGGACATGAGTACATCATGCATTGTCCAGATGATCTCTTCTGGGACTATCAGAATTTATACTGTGGGTATGATGACAGCGGTTGCTATAACAAAGTGGATCCCGAGGAAACGGTTTGCAAGCACGGCATGGATTTTCTACCAGACCCAACTGATTGTACGAAATATATCCAGTGCAGTAATGGTCAACCAATCGTCCAGAAGTGTCCTGAGCCTTTGTATTGGAACCAAAATCTTAAAGTATGTGATTGGTTCAGTAGCTCCTGCAAAACTCTACAAAAGAATGAAATAATATCTTGTAAAATGGGTATGAGTTTTGACGTTTTTCCAACCGACTGTTCGAAATATATTAAGTGTTTTGGTGAGCGCGGTGTAATAATGAGCTGTAATTCTGGACTTTTCTGGAACTCTTTGCAGGAAGTATGCGAAAAATCCCAGCGGTTCTGCAAATAATATGTAAGCATAAACAGTTACTCGTATAATATTATTCACTCTTGGTAGATTTTCTTGTTAAATGAATTGAAGAATATTACAGAAAATATAAAGGCATTACCCATTCTTTAATC\n>XM_029689086.1 PREDICTED: Oncorhynchus nerka SWI/SNF-related matrix-associated actin-dependent regulator of chromatin subfamily B member 1-A-like (LOC115147092), mRNA 
\nATGGTGTCAGGTGTGCGGGATAATCAGCAGCCTGATGACCTAGAGGCCGGAGAAAGGGAGTATAGGGAGCAGAAGGCAAAGAGGAACAGCCAGTGGGTCCCCACGCTGCCCAACAGCTCCCACCACCTGGATGCTGTGCCCTGCTCCACCACCATCAATCGCAACCGAATGGGCCGCGACAAGAAGAGGACCTTCCCCCTGTGCTTTGGCGACCACGACCCGGCGGTGATCCACGAGAATGCGTCTCAGGCCGAGGTGTTGGTTTGTCTGGACATGGAGATTGACGGGCAGAAGCTCCGAGATGCCTTCACCTGGAACATGAATGAGAAGCTGATGACCCCAGAGATGTTTGCTGAGATCCTGTGTGACGACCTGGACCTGAACCCCCTGGCCTTTGTCCCGGCCATCGCCTCAGCTATCCGCCAGCAGATAGAGTCCTACCCCACAGACAGCATCCTGGATGAACAGACCGACCAGAGGGTCATCATCAAGCTGAACATCCACGTGGGGAACATCTCCCTGGTGGACATGTCGGAGAGGGAGAACTCTCCGGAGACGTTTGGCCTGATGCTGTGCTCCGAGCTGGGCCTGGGAGGAGAGTTTGTTACTACCATTGCCTACAGCATCCGCGGCCAGCTCAGCTGGCACCAGAGGACGTACGCCTTCAGGGCTGATTTCAGTGAGAACCCCCTGCCAAAGGTGGAGATTGCCATCCGCAACACAGGTGACGCATGGTGCCCTCTGCTGGAGACCCTGACAGATGCAGAGATGGAGAAGAAGATCAGGGACCAGGACAGGAACACCAGGCGCATGAGACGACTTGCCAACACTGCCCCCGCCTGGTAGAGAGAAGCACCAATAAGCTACTACAGAGCCTCTAGTCCAGTGGTTCCCAACCTCTTTTTGAACCGTGGCACACCTTGATGGGATATACAATTATGCCCTGCACACCAAATTCATTCATTTAGTGGTGATGACATCCATCTGATCTATATTGCATATCATCTATTTTCTGTGACAAATGTTTACTAAATAGGGTTTGTTTGAAGTATTTTCATAGTTCCTTACTCATGAAGGTTCATTTCTGTATACCCCTTTAAGAGTATCCCGCAAATAGGTATTTAGTTTTGAACAGTCTGTGTTAGAGGTACAACCACGTACACATAGCCAAGCTCCATTTGTTTTTATGGCAAGAGGCTGTGGTATAGCTAATAAATTACTCTCGCTAAGCCTAATCAAACTTACAAGTGATAATGGTTATCACAGACTAAGTAAAATAATAAAAATGACTTTGCTCGTGATGCGAGCCCCTCAAATGATACAAATGGAACAGCCTGAGTGCACTGGACTTGGAACAACGATACAGATGTAACAATGTACCATTTAATCTATTATCTGACTGGCACAGGTGCTCCCAAATCAAAATTACAGAGTGTACAAACATTTTTATCAAGATTAGGAAAGGTTTTGTGGCACACCACTGCTTCTAGTCAGCTAACAGTCAACTCCTATGGGCCCTCTGTGGAGACACACACACAAACAAACGTGACAAAAGACAGTCAACTGGTCCCTTCTTACAGCCCCCGTAATATTAAACTAGCTTTATGCTTGATTGTCATACTAATCCAGTACCAATGCCACATCTCTACTCCCATTAATAAAAATAATTACATCTGATCCCAGATCAGAGACTGTTCAAGGAGCCTTCTCCATTTCTAGCCCCTCTATTGGTTCAACCGCTACTCATTTCTGATGAGATGAGGCGACGTGGTATATAAAAGGTGCCATGGGTAGAGTGTATTTGTCCGTATGAAATGTAGCCATTGTCGATTGTACGGACTCACCATCTAAGTGAGCTCTACCTGTAATACTGCTTTGATGCACTTATATCTCTCATGATAGACAATGCTGACGGACTTGATCTGTCTGTTAATAGAAACACTCAGACTCAACTCTTGGGAATAATGTAAAGTTCTGTATTTATGCTGATACTTTTAG
TATATTTTTTAGTTTCCTTTTTTAATAAAATAACATAAACCAGA\n>XM_028986422.1 PREDICTED: Denticeps clupeoides disintegrin and metalloproteinase domain-containing protein 11-like (LOC114794095), transcript variant X1, mRNA \nGGAGCTCCCGGTCCCACGTGTCCTGCCTTCCTCCGCTGGCTCGGCGCTTCTTCCTTCCTTTCTTTTAATCGACAGCTCCCTCCTTTCGCAGGCTGGCCGCGTTTTTCATTTGATTTCATTTTTTCATTTTTTTTTTCCTTTGGAACCGCAGCGCCGCCCAGTCTCACATTCGCCCGCGACGGGGCGCGCATCTCCCCGCATCGCCGCCCGCCCGCCCCGCTCCCCCGGTTCATATTTATCGACCGCCTCGTCGTCGTGAGCACGTTCCCGTCCGGTTTTTCCTGCTCCATGTGAGCCCGCGGGGCGACGTGAACAGGATGCTGGTCCTGCGGTGCCTCGTGTTCGCTGCTGCGGGCGCCGGGCTGTCCGCGACAGGCGTGAGCGGCGGGTCTCCAGCTCAGGATGCAGGCTTGTGGGACCGGGTCCTCCCAGTCCTCCCAGAAGAGGAAGAGGAGCTGTCCCGGCCACACCGGCTGCTGCCGTGGAGGGACTCGGACAGGGAGAGCCCACACAGTCACCTGGACACCCGGTTGAGGGACAGCAGCGGGAGCGTCACGCCTGTCCATTTGGCCCAGAGCAGCTTCCAGGTGGAGGCCTTTGGGAGCGTCTTCACTCTGGACCTGGAGCTGAATCATAATCTGCTCTCGTTGGATTATGTGGAACGGCACTTTGACCGGAGCGGAAATCCTTCAGAGTCGCTGGGAGGCGAGCACTGCTATTACCATGGTAAACTGAGGGGAGTACCAGGCTCCTGGGCAGCTCTGTCAACATGCCATGGCCTATGTGGCATGTTTTCAGATGGCCTCCACTCCTATGCCATTGAGCCCATCTTCAACGGGACCAATCAGGCTGATGGCACTCATAAAATCCGTAAAATGCCTGATGTCAGACTTCCAGCCTCCTGTTCAGGTTGTGAACAAGACGGAGAAAATGACACTGGTGACAATGACAGTAGTGAAAATCTGGACCCTCAGAGAAGGCCGAAACATACGGAGGGACTGAAACGTTCCAAAAGAGCGCTCTCGCGGCCCAGGGTGCAGACCGAAACCAAGTACATTGAGCTCATGGTGATTAATGACTTTGAAATGTTCGTTCTTCTCCGGCGCTCCACTGCTCAGACCAGGAACTTTGCCAAAGCGGTGGTGAACATGGCCGATGCGATCTACAAGGAGCAGCTAAACACCCGAATTGTGCTGGTTGCCATGGAGACCTGGACATCTGGGAACCCCATTACAGTGGAGTCGGACCCCCTGATAACTCTTCAGAACTTCATGAAGTACCGCACGGAGAATGTGAAAGAACAGAGCGATGTGGTGCACCTTTTCTCGGGCAGCACGTACCAGAGCAGCCGCAGTGGGACGGCATACTCAGGCGGAGTGTGTTCCCTTGCCAGGGGAGGAGGCATCAATGAGTATGGGAATGTAGGTCCCATGGCCATCACGCTTTGCCAGAGTCTGGGTCAGAATATTGGCATGAAATGGAACAACATCCGCAACTCAGCAGGTGACTGTAAGTGTCCTGACACTTGGCTGGGATGCATCATGGAGGATACTGGCTACTACCTTCCACGGAAATTCTCCCGCTGCAGTGTGGATGAGTACACACAGTTCCTGCTCCAGGGAGGTGGGAGCTGCCTCTTCAACAAGCCCAACAAGCTGCTGGACCCACCTGAATGTGGGAATGGTTTTGTGGAGACTGGAGAGGAATGTGACTGTGGCTCGCAAGTGGAGTGTGCCCGCAGTGGAGGGGCGTGCTGTAAAAAGTGCACACTTACTCATGATGCCATGTGCAG
CAATGGACTGTGCTGCCGGGAATGCAGGTATGAGCAGAGGGGAGTGGTGTGCAGAGAGCCGGTGAATGACTGTGACATAGCTGAGACCTGCACAGGAGACTCCAGTCAGTGTCCACATAATGTACATAAGCTGGATGGGTACATGTGTGACAACAGCCAGGGTCGTTGTTATAATGGTCGTTGTCGGACACTAGATGGACAGTGCAGACGTCTCTGGGGCTTCAACGCTGCTGATCGGTTCTGTTATGAGAAGCTGAATTCTGAGGGAACAGAGAAAGGGAACTGTGGCCGCAACCCTGGTGGACAGGGCTGGATGCAGTGCAATAAACCGGACGTATTGTGTGGCTTTCTGTTCTGCTCTAACATGACTGCTAAGCCTAAATTTGGGGACCTTCAGGGTGAGGTGACCAGTCTGACCATCTACCACCAGAACAAGTATCTGGACTGCAGAGGAGGGCATGCAGTTCTAGAGGATGGTTCAGATTTGGGTTATGTGGAGGACGGGACGCCTTGTGGACCCAACATGATGTGCCTGGAGCGCCGCTGTCTTCCCATGTCTTCATTCAACCTCAGCACTTGCCCTGGGTCCAGCTATGGACGCACCTGTTTTGACCACGGAACTTGCAGTAATGAGGTCAAGTGTATATGTGACAGTGACTACACAGGGAAGGACTGCAGCGTGTATGACCCCATCCCTGACCCCACAAATCCTCCTGGCCCAGATAAAAAAGGAACATACGAAGAGGAAGATCTGGAGGGGGATAAAATCGATCTTCCTGTCTGTGTCCATGTTGCTGTGTGTCTGTGCTGTCTTCCTTACACTGTGTCCTTTCCACATCGGAGAAGAACAAGTCTTCCAACCACACCATTCCCTACAAAATATCCTCTGAATAGCTTCCAACCGAGATTCATCTCAATGTCCCTCTGTGCCGTCTAACGGCCTGCAACAGTGGAGCGTCTCCTGTCATATTCCAGCCTGCCATGTGTCTTCAGGCGAACCTCATTGACAGTATGGTCATTTCCAGATATAGGGGAGAGTGGTCCTTTGAAGATGACAGACAGCAAGGACTTGTATGTGTTTTTATGTGTGCGTTTATATATCTGTTCCCTCAATTCCATTGTTGAGTGTCCAGGAAGGGAACATGAAATGGATGGAAGGAGCACCATGTAATGATCTCACAAAGACACAGAGCAGTTTTTTTTATGACCTTTGTTCTTGGCTCTCCTGGTCACTGCTTGTCTGTTGCAGAACCTGGAGACCTTGCTCAGACCGGGTTTTTTGAACATACTTTTGAAAAACGTGACTTGAAACAAGAGAGACAATTTTCATGAGAAAACAGGCTGATTAGGAGCTGTTATATCAAAGAAGTTGGATTTCAGTCGAAGAAAGACTGGTTAGTTCTTCTCTTCCCAAAGAAAAAGGCCAGAAGAAGGAACAGATCAACATTGCAGGAGTGGAACTCCATGGACTAAGCCTGGAACTACAGCGGCGGGTCTTACATCTGCCAGTCTGAGCTCAACAGCTATAACTGTGTGCGCTTGCGTGTGTGTGTGTGTGCGCGTGTGTGTGTGTGTGTGTGAGACAGACTGTGTTTTTGGTTTTGGGATCATTGTTACTCCTGCCAGTCTTAGTGACAACCTTGTACAGGGCAGGGACCAGGTCAGTACTATAGAAAAGCAACATTCCACGTGGTTTTGTGTAGACCTTTTTCTTCCACAATATTTGTCTAAAAAACATTTTGAGAAGACCAAAAGTCCTAGAAAGTATGCCTCAAGGATAACTGTGAGCACATGCATGTGTCTGAGGATGTGAGAAATGATGCACAGGTTGACAGCTCTTAAATGTAGATATGAATGTCATCACTATGTTGTGCTGCAGATTAATGTCAGCGTTAGACCAGCAGCACACTACACGGAAAAAAAGGTTTTCATATGATGCAAACATAAGGAACACTAAAATGTGTTCACTCATATGCACTTGTACATTATGGCATTTGCAA
GAGACATGTTAATACATGTGAATACATACGTTAATAATATTCTATGAATTCCATAATGCAAATTGTTTATTTGATAAAAATAAGTAAATATCATCTATCTATCTTATCTATCTATCTATCTAACTAACTATGGGCTTGGTAGCATTTAAGTCTTCTGAATATACAGAACGCACAAGAGGTCCTACCACTCCCACTGATTCTTAATCTGTTTACCACAGTGAGATATTCCGTGTTTTTCGCTTCAGCCTGCGCCCATGCATCATCAGTTCGTAATGTTTGTGGACCTGTCCAGATATCCACCCCATTAGCTGTACTTCACTGCCCTCGTTTTCTACTGTAAATGTGTTGATAGGCCCGTAGCCATGAGTTTAACCCGTAGGCTGCATAGACTTTGTTTAGTCTTTCATCGTAAATGAGATTACTTGGTCATATGGTTCCAGTAAGTGTAGCTTCCAAATAAACATTCATGAGCACCTACCAAGTAGCGGTGTTCCTGCACAGCACCCTACGCAATGCTCACAAGTTCCTCTGTAGTGCCTCGCAGGAAAACGGTCTAATACAGCGTTCTGAAATCTGTATGCAAGTCTCGATACCGGTGCCGAATGTCTGTTAATCCAAGCTACACTTAGAAGTCCAATGTGACCAAATGAAAGGAATAAATGTGAACGCTTGTGGGGATAAAAGCATTATTGGGTTGGGTGCTTGTAAAGAAGAGCTTTTTGCACTAAGGTAGATACACATTAGTCATGTACAGTAGGGACTGGGGATTGGGGCTGGTGAATGCTGGTTTCAAATTAAGAGGACAGAGGCTTTATGAGGAAAAGACCCCCGTCCATGACTTTTTAATGTGACCTTTTTAAACAATGTTGCAGTCATTATGACTGAGTGAATGGACGTGACTGTACGAAACACCCATAAAATAAAAATTTAGACATGAAAAATAA\n>XM_008008285.2 PREDICTED: Chlorocebus sabaeus four and a half LIM domains 2 (FHL2), transcript variant X2, mRNA 
\nTAAAGAAACATCTGCAGGGTAAGAAGGAAAAAAATCCACCGTGCAAATACATCCCAGGCACATGCCTCCTGAGAAGTGGCCCCCTCCTCCCTCCGCCGCCCCCGGCACCTCCTCGGGCTTCGCCAGCTTCCTGCTCCTGGGAGCAGGCAGAGATCCCGGCGTGGGCAGACCCCTGCCACTGGCGTCCAGGCCCCGTCCGAAACTCACGCCCACGTCGGAGGAGACTCTCGGGATAACCTCGGTGCTCCCAAGACCCGGAGGGCAAGAAGAAAGAGCCCTGGCAAACAAAGGGCACGGGCCGGCAGCGCTGCAGCCCGGGGTGGGGGCACGGTGACCGCTAGGCCTGGGGGCGCCCGCCCCCAGCGCCCCACGCCCGGTGCCTGCGAGCCGAGGCGTGCATCTCCTTATATGGTCAAATGACACGGAGGGGGTTCTCGAGGGCGGGAGCCGCGCAGCGCTCCACTCGGCCGGCAGCGGAGCCGCAGCCACCAGCCGCCCGCGCCCGCCCGCCCCGTCCGGCAGTCTCCGGGCCGCTGCGGCGCGGTGAGTACCTCCAACTCCCTGCGCCCCGGAGGGAGGCCGAGGGGCTTAGCCACCAGGACTCGGAAGAGGGGGCCGAATCCGGTGCGAGACCCGGGGAGAGGGGAGCAGATCCGGAGTTGGGGAGACCGGTTGCTGAAAAGGCAGGTGTCAAAATGACCGAGCGCTTTGACTGCCACCATTGCAACGAATCTCTCTTTGGCAAGAAGTACATCCTGCGAGAGGAGAGCCCATACTGCGTGGCGTGCTTCGAGACCCTCTTTGCCAACACCTGCGAGGAGTGTGGGAAGCCCATCGGCTGTGACTGCAAGGACTTATCCTACAAGGACCGGCACTGGCATGAAGCCTGTTTCCACTGCTCGCAGTGCAGAAACTCACTGGTGGACAAGCCCTTTGCTGCCAAGGAGGACCAGCTGCTCTGTACAGACTGCTATTCCAACGAGTACTCATCCAAGTGCCAGGAATGCAAGAAGACCATCATGCCAGGTACCCGCAAGATGGAGTACAAGGGCAGCAGCTGGCATGAGACCTGCTTCATCTGCCACCGCTGCCAGCAGCCAATTGGAACCAAGAGTTTCATCCCCAAAGACAATCAGAATTTCTGTGTGCCCTGCTATGAGAAACAACATGCCATGCAGTGCGTTCAGTGCAAAAAGCCCATCACCACGGGAGGGGTCACTTACCGGGAGCAGCCCTGGCACAAGGAGTGCTTTGTGTGCACCGCCTGCAGGAAGCAGCTGTCTGGGCAGCGCTTCACGGCTCGCGATGACTTTGCCTACTGCCTGAACTGCTTCTGTGACTTGTATGCCAAGAAGTGTGCTGGGTGTACCAACCCCATCAGCGGACTTGGCGGCACAAAATACATCTCCTTTGAGGAACGGCAGTGGCATAACGACTGCTTTAACTGTAAGAAGTGCTCCCTCTCACTGGTGGGGCGTGGCTTCCTCACAGAGAGGGACGACATCCTGTGCCCCGACTGTGGGAAAGACATCTGAAGTCAACACGGAGAAGTTGCTGCTTGTGATCTCACACACAGATTTTTATGTTTTCTTTCTCACCCAGGCAATCTTGCCTTCTGGTTTCTTCCAGCCACATCGAGACTTTCTTCTAGTGCTTTTCAGTGATACTCACGTTTGCTTCAACCCTTTAGTGCTTTGTGCTAGTTCAGTCCCAGGGAAAGAGAAAACTTGCCCTAGGCCCTAGGTGGGAAGCTGGTTTGAAATTTTTGTAATCAAGTAAGGCACAACCAAATGTAAAAATCCTTTTGAATGATGTCTTTATAAATCTTTCTCTCACTGCCTATTTAAGTGCAATTAATGTATGCCACAAACTTGAAAGTTTTCTAAACTCAGTAAGGTAATGACCAATTGGTATTTACAGCTCTGTAACTTCCTGTTGTGTCAAGTCTAAACCAAGATTATGTGACTTGCAATAAAGTTATTCAGAACTAAA\n>XR_
006147264.1 PREDICTED: Dipodomys spectabilis small nucleolar RNA SNORA40 (LOC122106945), ncRNA \nAGCAATTGTATGTGTGCCTTTGTTTCATTTGTAACAAAGCCATATAGACAGGTGCAAACAGCAAATCCTCTACAACCCAGAACTCATTGTTGAATATGAGTTTGGCACATGTAAAAAGAATATG\n>XM_034342832.1 PREDICTED: Prunus dulcis ATP-dependent 6-phosphofructokinase 6 (LOC117614132), transcript variant X3, mRNA \nCCAATTTACTAACAGCCCCTCCTCCCCTGTCCGAGGACCATACACTCCGATTTCGTTTCTGCTTCAATTACTTTCAATCGCAGATTATTCTTCTGGTTTTGTTATGAGTGATCAGAAATCCGCAAAAGCAATGGGGCCTACTGGAAACTTGCAGATGAAGGTCGTGAAAGGCGATTTTGGTTATGTGCTCGAAGACGTGCCTCATCTCTGCGACTACTTGTCCGATCTTCCTACTTATCCCAATCCGTTGCAATTCAATCCGGCTTATTCAGTTGTAAAGCAGTATTTTGTTAATGTGGACGATACTGTTGCTCAAAAGATTGTTGTCCACACGGATAGTCCAAGAGGGACGCATTTTCGGCGAGCAGGACCACGCCAAAAGGTGTATTTTGACTCGGATGAAGTTCATGCTTGTATTGTAACATGTGGTGGTTTGTGCCCTGGACTCAACACGGTGATCAGGGAAATTGTGTGTGGACTTTATCACATGTATGGCGTCAACAAAGTTCTTGGGATAGATGGAGGATACAAGGGTTTCTATGCCCGAAATACCATTGACTTAACACCCAAGGTTGTCAATGACATCCACAAACGTGGTGGTACTATCCTTGGTACATCACGAGGAGGACATGATACCTCAAAGATTGTTGACAGCATTCAGGATCGTGGAATTAATCAGGTTTACATAATTGGAGGTGATGGAACTCAAAAAGGAGCAGCTGTCATCTATGAGGAAATTAGACGGCGCGGCCTCAAAGTTTCCGTTGCAGGAATTCCTAAAACCATAGACAATGACATTCCGGTTATAGACAGATCCTTTGGCTTTGATACTGCAGTTGAGGAGGCTCAACGTGCCATTAATGCAGCTCATGTTGAAGCTGAAAGTATTGAGAATGGTATTGGTGTTGTGAAGCTAATGGGACGCTACAGCGGTTTCATAGCTATGTATGCTACACTTGCCAGCCGAGATGTGGACTGCTGTTTGATTCCGGAGTCCCCCTTCTATCTTGAAGGAAGAGGTGGACTTTTCGAGTACATAGAAAAACGACTCAAAGAAAATGGGCATATGGTTATTGTGATAGCTGAGGGTGCGGGACAGGATCTTCTGTCAGAGAGCTTGCAATCCATGAACCAGCAGGATGCTTCAGGAAACAAGCTACTTAAAGATGTTGGCCTATGGATTTCTCAGAGGATAAAGAATCATTTTGGGAGACAACAAAAGATTTCCATCAATCTCAAGTATATAGCATATCACTGAGAAGCAAAACAAGGTTGTGATTACCGACAGGATGTGGGCACGACTTCTTTCTTCAACTAACCAGCCGAGCTTCTTGAACCCCAAAGACGTCATTGAAGTCCAAG\n>KU329545.1 Uncultured bacterium clone OTU_22088 16S ribosomal RNA gene, partial sequence 
\nTACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTTTGTAAGTCGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCGTTCGAAACTGCAAGGCTAGAGTATGGTAGAGGGGGGTAGAATTCCACGTGTAGCAGTGAAATGCGTAGAGATGTGGAGGAATACCAATGGCGAAGGCAGCCCCCTGGACTAATACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGG\n>XM_012378055.1 PREDICTED: Linepithema humile serine/threonine-protein phosphatase 4 regulatory subunit 2 (LOC105678582), mRNA \nTCCCTCCTGTCATATCTCTCATTGTTGCTGTTTTGTGGCCGATAATCAAGACAGTCGAGAGGAAGCAGGGAAGACTTGTCAGAGGAGGTTGTCGGCGGCGGCGGGGAAGATGGAAAATTTAGAGGAGGTGTTGCAAGCGCTCGATGAGTTCCAGAAAATGCGGCCGACGGTAATCCCGCAGGAGTTGGAGGATTATCTGTGCTGGGTCGCAAAGACGGGCGATCCCGTCTACCAGTGGCCGTTGATCAAAACGCTCTTCAGGGAGAAGCTCACGCGCGTAATGACAGATTTTTACGAGAGTTGTCCCTCTCTGGAGCTGGCGACCTGTCCCAACGTGGAGCACTTCAACTACGACACGATGAAGAGCAGCCTTCTGGAGAGATTAGAGTCATTTGCGAATGCGCCCTTCACAGTCCAGCGGATATGTGAATTACTGACGGCGCCGCGCAAAGAGTACAATCGCGTGGATAAATTTATGCGCGCCATCGAGAAAAACATTCTGGTGGTTTCGACACGTGAACCCGGGCCTATCGCCAGACGCGGCGAGACCGGCGACGGTATGGTGAACGGGTCCGTCGAGGAGGACACAGCCTCGATCATGCAGCAGCAACCACCGCCACCGCCTCTCTCATTGTCACCGTCGCCGTCATCGTCGCTATCACCGTCATCGTCGCCGTCGCCATCGTCATCGCCATCGGCATCACCGTCGCCATCACCTTCGCTCTCACCCTCGTCCTCACCTTTGCCCTCACCCTCATCGTCGTCATTACCTTCACTGTCACAGCCACCGTTGCAGTCGTCACCGCAATCACCGTCGCAACTACCACAGACAACGCAACCGGCGCAGACAGGTCAGCCAAACTCTCAGGATGTGGAGATGGAATACTGGGAAAAGGACTGCACCTCAACCGTCACCATCAGTGTGCACACCGTTGTGGAAAACGAAACGCCTCCTCTCTTGCACAGCGGCGTCATACCGGCCGCTGGCTCACCACTGGCTAAAAGCATATTCACCGCGAGTGAGGCGACGCGGGAGAAGCTGGAGCAGGTCGCCTCTAGAACGGAAATCGCGACGTCCAATTATGTCCCCGCTACTTCAGACTTTTCTACTATATCGAATTTAACCTCGCAGGAGTCGGCGCCGACCGCCGTTCCAGTTGTGCAAAGTCTACCGGCTGCTGAAACGGTCTCCGACGATTCGCCTGTCGGCAGCGCCGACGTGGCGGAGGCGATCATGAACGAGGACACGACTTCTCAACCTAATCTAGATTTGGAGAGCGAAGAGATCGAACCGGCCGCAACGGCGACCACCACGACGACAACGATGACGACAACGGCGACAACAACAGCGACATCGTCGACGACGTCGACGTCGGCGGCAACGACGACGGTGACCGTTGTAGCGACGGTGATACCGTTGACGACGGACACCACGCAGAAGCTGCAGGCCGCTTTCCAAGCGAAGCACTTTGAGCCCGACGATAATAAGTGTCTGGAAAAATCCAACGAGAAGACACCGGTCTCGTCAACGGTGGAAGAAGGAATTGAACATTCCATGAAGAATGAAGAAACGACATTGGCAAAATCGAAGCCCGAGTGTGCGGATTCCAACGA
GATGTCTCACAATGAAAGTAGGTTAACTGAAAATTTGCTAGAAACGGATATCGAGATGAGATCCGACGCTCTGGCGAATGACGCGGAAAGTGTCAGCGAGGAGAGAACTGCGAATAAACCGGAAGAGGAGGGAACATCGGTCCTCGAAGATGTGGATGAAGAACATTTACGGGTGGAGGAAGATGCGAAAGGAGAAACGGCGGTATTCGTCGAGTCGCAATCCACGGAGAAGGACAGTGCAGTCACGCCTGACGAATGCGCGGTTATTGTATCCAGCGGCGAGGCATTGTACAAAGCGGAGAAGGCCGAGACGCATCCCACGGAAACGTCGACGACAATTTCCTTGAAGGAGAGTTTTACACATGACCAATCTATAAGCCAAAAAGCTGAAATTATAGAAGTAATGGATAAGGTTCTAGAGGCCGTTCCTAAGATAGCGTCTTCTAACGGCAACGACGACGGACAGGAAATACAGGACACTGAATTCAACACGGATAATTTGAAAATGATGGAAATCATCAACGAGAAGGTGAGTCTTACCGAGTCCGCGATGTCGGATCCGATAAGCGTTATAGAGAAACCGAAAGAAGTGACATCCGTGATTGAGAAACTCGAGCTCGTCTCGCCTACTGTCGAAATGACAGAGAGCTCTGATAACGTTGGCTATCAGTCGCCAAAGGACGATAATTCAGCAGGCATCCAGGACGACGGTTTAGCGAATGCGCAAGGTAATAAAATGGCGTGCGTCATTAAAGAGAATCAGTCTTCTGTAATAGAGAGTGTGGCGTGTAGAAGAGAATCGATGGAGTTGATGGAAGTTGACGACGAGGAATCACCGTCGACATTTCAGCAAGACGAACCGATGGAGCAGGAAACAATGGACGATTTGTCGAAGAGTTAATCCCGGCTCATTTAATCGGTTGCATGTCTCTTTCCCTCTGTTTGATATCTATTTTTAAGGGTAGATGTCGCGAAATAAGAGCTAATACGTAAGATATCTTCTTGCGCGTAAGATGCTTGGTAACTGACGAACACAATTAAGCATATAATTTTTAATAGCCGTTAATTATGAATTGGAATTCAAATTATGAGCAAAAATTCTCGATATTGTTTGCTGCTTTATTTATTTCGGATACTTCGCCGTTTAGACTGAGCTCCGGTATTTACTTACAAAGAGATTTATCGAAGTGAATTTTCTAACTCTTGGAAGAAGAAAAAAAGAACACTGCCTATTCCCAAACGATTGTAATACTGAAACTGCTTGTATAGAAATCAGATTTGGTAAACATTTCAATATCGATTTATACAAATACCATAGATATCTGCTTAGAATAAGGTTGTGCCTACAACTATTGTGTATATTGCGTATTGGACAAGTATACCTGATGCATAAATTTTTAAATGATGACGTATAAGCACTACAGATTCGAGTATCTCGCGGTCGAGGTAAACGAAACAGCGTTCGTTCACGATCACAGCCTTATACTAAGTTGCGGTTGAATCTCGAAACGCTTCACGGCTACTTCTGAGAGAACGTTCGAGATTGATCGAAGATATTATTCCTTGCTAAAACTTTCTACAGTACGTAACGGCATTTGGAAATGTGTTAGAACGATGTTACTTCGAGCAGCTGTCTACTAAAACTCCGCTACAGCTAATTCAAAATTGATATTCCAGACGTATCGCTTGAAATCAGTATGTCAATTTCATTTCGTTTCTGTTATTATATCAGTGGGCAAAAATAGTTTCCTTCTTTTTTTACCGAGTGTTTACTGCATATGAAATGTAAAGAAAAAAAGAGACTAGTAACAAACTATATTTTATGAATTACACTAGCTCTTTGTATTTTCGTTCCTCCTATTTTGATATTGTATTTTCAGTAAATGAAGAATGTAGTTAAGTCGCAGATGCGTGCGAATCGGAACAGAAATCTTCAAGTGGCCCAAAACTGATAAAATCGATTCACCGCGGGGGCGCCCAGGATCCCGTTAAGATCGTTT
CGAACCGCTTACAGTTTATGTATCGGCACAAGATGTTTTCGAGCGGATTCGGATTCGATGCGGATCCACCGAACCGTTATTAGAAGAATATCGTAGGAATGGGATATTAATTTAAGAATTAATATAGATTAATGATACATGATACACGCGAATGTGGATATCTGAAAAAAAATAGCTGTACATTATTTTATAAGAAAATATATAAAAATGATTGTCAA\n>AB050083.1 Mus musculus VH2C mRNA for anti-A/dT antibody, partial cds \nGGAATTCATGAAGTTCGGGCTAAGCTTGATTTTCCTTGTCCTTATTTTAAAAGGTGTCCAGTGTGATGTGCAGCTGGTGGAGTCTGGGGGAGGCTTAGTGCAGCCTGGAGGGTCCCGGAAACTCTCCTGTGCAGCCTCTGGATTCACTTTCAGTAGCTTTGGAATGCACTGGGTTCGTCAGGCTCCAGAGAAGGGGCTGGAGTGGGTCGCATACATTAGTAGTGGCAGTAGTACCATCTACTATGCAGACACAGTGAAGGGCCGATTCACCATCTCCAGAGACAATCCCAAGAACACCCTGTTCCTGCAAATGACCAGTCTAAGGTCCGAGGACACGGCCATGTATTACTGTGCAAGAAGGGGTACTACGGCCCTTTACTATGCTATGGACTACTGGGGTCAAGGAACCTCAGTCACCGTCTCCTCAGAGAGTCAGTCCTTCCCAAATGTCTTCCCCCTCGTAAGCTTGGG\n>XM_010007313.1 PREDICTED: Chaetura pelagica leucine-rich repeat-containing protein 4B-like (LOC104397361), partial mRNA \nAGCATCCCCTCCTACGCCTTCAACCGCGTCCCCTCCCTGCGCCGCCTGGACCTGGGCGAGCTGAAGCGCCTGGAGTACATCTCGGAGGCGGCTTTCGAGGGCCTGGTCAACCTCAGGTACCTCAACCTGGGCATGTGCAACCTGAAGGAGATCCCCAACCTGACGGCCTTGGTGAGGCTGGAGGAGCTGGAGCTGTCGGGGAACCGCTTGGGCAGGGTCAGGCCCGGCTCCTTCCAGGGCCTGGGCAGCCTGAGGAAGCTGTGGCTGATGCACGCGCGGGTGGCGGCCGTGGAGAGAAACGCCTTCGACGACCTGAAGGCCCTGGAGGAGCTCAACTTGGCCCACAACGAGTTGGCCTCTTTGCCCCACGACCTCTTCGCCCCTTTGCACCGCCTGGAGCGGGTCCACCTGCACCACAACCCCTGGCGCTGCGACTGCGACGTCCTGTGGCTCAGCTGGTGGCTCCGGGAGACCGTGCCCAGTAACACCAGTTGCTGCGCCCGTTGCCACGCGCCCCCGGCTCTGCGGGGTCGGTACCTGGGGGAGCTGGAACCCGGGCACTTCACCTGCTACGCCCCGGTCATCGTGGAACCTCCCGCCGACCTGACCGTCACCGAGGGGCTGGCGGCAGACC\n>XM_053147013.1 Fusarium falciforme Sm domain-containing protein (NCS54_00138400), partial mRNA \nCCAACTCTACCACGCCCTCTATTGATTTCGCCGCCTGCGGAAATGGACTCGGAGCAGGCTCGAGAATACCTATCGGGTATTCTAAACAAGAACCTGCGTGTATACACCACAGATGGTCGCCTATTCTGGGGTGCTCTAAAATGCACCGACCCTGATAGGAACATTGTTCTTGCTCATACATACGAGTACCGGCAACCGTCATCTAGGCAGCGTGCAGAAGCAGCCGAAAAGGCCGGTGGCGAAACAATCAAGCTTGACATGAGCTCCCGCTATCTGGGACTAGTAGTGGTGCCTGGACATCACATCGTCAAGATGGAGGTTGAGGAATTTGCGAGCCAAATGCGGAACCAGATTTGA\n>XM_010271001.2 
PREDICTED: Nelumbo nucifera uncharacterized hydrolase YugF (LOC104606003), mRNA \nCACCCATCCAAATACTAATTGCAAACTGCAGCATTTATAATCGTATTCTCTCGTTTGAGCTTGAGGTCTCTCTTTCACTCTCCCCTCTTATTGGATGCCGAAATCTGCGGTTCCTTCTGTTCGTTGGTATGGTTGGGGTCGCCACTCGCCACCTGAGACCTCACCTCTAATAGGTAGGTATTGTTTGGCTACAGCTCCACCGCACCCCTTTCTCATTTCTCCTCTTCTGCTTTGGGAATCCTATAGTTCAATCGGTTCTGCATCGCCCCAGATTGATCATACTTCGGACTCGGAGGCGTATTTCGCTCAGATCTGTATAATTATCGTACCCATTTCATAGCTGGATTGAAATCGAACAACCTCCCAGTTTGTAGTGGTTCCGGTCCCTCTATTCCCTCCCAAACCTTCCATGGTGAAATCCCCAATTATCTGGTCTCCAACCGGAGAGACACCCTCCATTCGCGAGTCCCTTCCAATTTCATCAAGAAATCCGCACAAACAATAATAGTAAGGATAGAAGAACTTGGACCCCTCATCCCTCTCTCTCTCTGTAATTGATCCCTTACTCTCTCTCATGGCTAATAAATGTTTCAGCTTCACCGCATCAAGGGACTGGTGCTACCGTTACGCCTTCGCTAGCACTGGGCTTCGATCGGCCACGACCGACCTCGGCGATGGCACTGTCGTACATTGTTGGGTCCCCAAGACGCACAAACAGAACAAACCAACTCTGCTCCTACTCCATGGATTTGGAGCCAACGCAATGTGGCAATGGGGCGATATCCTCCGCAGCTTCGTCTCCCGCTTCAATATTTACGTCCCCGACCTCCTCTTCTTCGGTGACTCGTTCACCACTCGCCCCGAGCGGTCCGAGTCGTTCCAGGCCCAGTGCATGATGAGAATGATGGCGGCCCACGGGGTGCAAAAGATGATCTTGATTGGGCTAAGCTACGGCGGGTTCGTCGGGTACGGCATGGCGGCGCAGTTCCCGGAGGCGGTGGAGAAGGTGGTGATATGTTGCTCCGGGGTGTGCCTGGAGGAGAAGGATATGTCGGAGGGCTTGTTCATCGTCTCCAACTTGGACGATGTCTTCAGCGTTTTGCTGCCGCAGACGCCGGAGAAGCTTAGAGAGCTCATGCGGTTATCGTTCGTCAAGCCGGCCAAGATCGTTCCTTCTTGCTTCCTTCGCGATTTCATCGACGTTATGTGTACAGAATATGTTGAAGAGAAAAAGGAGTTGATCCATGCTTTACTCAAAGACAGGAAGCTTTCTGATCTTCCCAAAATCTCTCAGCCAACGTTAATAATCTGGGGAGAGCAAGATCAGGTATTCCCATTGGTGTTGGGACACAGATTGAAAAGTTATCTTGGGGAGAATGCTCAGCTAGTAGTGATAAAGAATGCGGGGCATGCTGTCAACTTTGAGAAGCCCAAGGAGATATACAAGCACTTGAAACCCTTCCTTTTTGATTCTCCTCCTCCTTCTCCTCCATCACAGCATCCTCCTTCAAAGTTTCTTGAAAACAAAGTAGATTGATGAACTGGTTTAATCTGATACGTACTACATTGTTAAACTAATATCATGGCTATATGGAAGCTGCTGGTGGCCTGGTGGGACTCTTAGAAAAGGCAGGCAGAGGAAGGTTTAGTCCAAATGTGCAACAAATTAATTAAGGATCCATATTGGTGATGATGAGTATGTATAATTGATTGATAACATAAATGCATATTGTACAATAGATCGATTGATTCATTGATTGA\n>KP859945.1 Uncultured bacterium clone OTU_340 16S ribosomal RNA gene, partial sequence 
\nCACGTAGGGGGCGAGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGTGTAGGCGGCTAAGTAAGTCAGGTGTGAAATCCCTCGGCTCAACCGAGGAATAGCACATGAAACTATCTAGCTTGAGTGCAGGAGAGGGGAGCGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGGGAAGAACACCGGTGGCGAAGGCGGCTCTCTGGACTGTAACTGACGCTGAGGCGCGAAAGCTGGGGTAGCGAACGGGATTAGATACCCCGGTAGTCCCAGCCGTAAACTATGGGTACTAGGTGTTGGCAGTTAACCTGTCAGTGCCGCAGCAAACGCATTAAGTATCCCGCCTGGGGAGTACGGCCGCAAGGCTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCAGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCGGGGATTGACATCTTGTCGAACTTGGTAGAGATACCGAGGTGCCTTCGGGAACGTCAAGACAGGTGGTGCATGGTT\n>XM_014748744.1 PREDICTED: Polistes canadensis E3 SUMO-protein ligase NSE2-like (LOC106786730), transcript variant X4, mRNA \nTTTAATAACAAAAAACAAATAAAAATGACTCAATCAAAAGAAGTAGCCGAAGAATTGTTCGAATGTTATACAAAAACTGCTGAGAATATAGTTATATACTTTCAAGATAAAGAAAAGATAATAGCTGATTTGAAAGATGTTGTACAAAAGAACTGTGAAATAGATACTAAATTAAGTATGATTCAAGAGATAAAGGATGAAATATTAGAGAAATATGGTGATAAGAAAATAACGGAAAAAAATATACCTAAAATTATTAAGGATTATGAGAAATCTATATCTACAATGAATGTTGATGTATCTACAAATAAAAGATTACTGGAATTTAATAGACAATTGGAAGCATTATTGAACGATGCGAACAAAAATCAGAATATTGAGGAAAGTAACAGTGACGAAGAATTACAATTACAAACAGATTCTATGAATGTGATAGATCCTATTTCAAAAATGAGGATAAAAGATCCGATTAAAAATATTGCATGTGGACATACTTATGATCGTCAAAATATTATGGCATTGTTAAAAGTAAATAAAAAAACAAGGTGTCCCATGGTTGGATGCAAGAATACAAAATACATAGAAATCACAAATCTTCAAACGGATGTTGCAATGAAAGTATTTCTTCAAAGAAATCCTGTTTAATATTGTGACATTAAATGATTTTGTTCAGACATGCTAAAAATGTGATTATTTACTAATGTAAACAAATCACAAAATATTTCTATATATATTTAGATTTATATATATTATATAAATACAATTAGTATACCTACACAGAGATAAAG\n>XM_023661946.1 PREDICTED: Cucurbita pepo subsp. 
pepo vacuolar protein sorting-associated protein 54, chloroplastic-like (LOC111781387), mRNA \nGAGGCGGAGGTGGAGGTGGATTCCACTTCATAGAGGCGAGAGGCTTGAGGCTTGAGGCGAGAGGCTTGAGGCTTGAGGCGAGGCGCGCACGGAATTCTTGAACGAGATCTACCGCGGCACCGGACTTGCATTGCCAACTCTTATTTTCTCTCTCTTTCCTTCACCCAGCGGCGTCCACAACCTCTGTTTTCTTCATCATTCCTTTTCCATCTGGTGATTGAGATCCATCCGAAGCACTTCTTCATCTCGATCTCTCTCGCGATTGGAATTCATCTACTGAATGCCATCTTTGGAACCCGCCATTAGTTCATGATTCTAAGACTTTGAGCATGGACTCCCAGCCTTCCCAATCGGGAAGGTCCCCGACCGAGTATTCCAGCCTTCTCAGTAGAGAAACGACTCTTGGTCGAACTACTTCATCCTCCTCGCCTAAATCCAACCCCGATGCCAGCAGCCAGAGCTTGTCTTCAATTCTCAACAACCCTCACGCTGGCAAGTCCGATGCGTCCTGGGTTGGCTGGTGGTCCTCTTCCTCCACCGTCACCCCACCTGAGTTTATTCCCCTCACATCCTCCACAGCCTCATCGGAAGTTACTCGATTCGATTTTAACAACTACACGGCCTTGATCTCCGATTCTTATAACCGATTCGAGGACATACGAAACCATTCCAGCAAAGAGAACGGTGGCTTGGATAGCATTGGGGGCCAGGGGGAAGCCCTTGTGGCATGTTTGAGAGAGGTTCCGGCGCTTTACTTTAAGGAAGATTTCGCATTGGAGGACGGGGCGACATTCCGTGCAGCGTGCCCCTTCTTGAATGTATCGCAGAATTTAGTGCTGCAAGAGAAGCTTTCGCATTATTTAGATGTCGTGGAGTTGCATTTGGTCAAGGAAATTTCACTGCGTTCCAATTCTTTCTTCGAGGCTCAGGGGCAGCTACAAGACTTAAATGTGAAGATTGTGGAGGGATGTAGCCGGCTACGGCAATTAAAGGAGACCATACGGCTCTTGGATGTTGATTTAGTGGACTCTGCCAGGCAAATTCAGGAGCAGAATGCGACCAGGAACAATTTGTTGGCTCTTCAGCAGAAATTGAAGCTTATTTTATACGTTAATCAGGCCATTTCAGCTCTTAAATTGCTTGTAGCATCGGCAGATTGTGCTGGAGCCTTGGATGTGACCGATGATTTATTACATCTTCTGGAGGGTGATGAACTTGCCGGTCTACATTGCTTTCGCCACCTCCGTGATCATGTGGCAGCATCACTCGAATCCATAACCAGCATTCTTTCAGCAGAATTTATGCGTGCCTCAATTCATGATGCTGGAGATGTTGATCTCGTAATTATATCTGAAACAAAAGCAAGCATTTCAAATTTAATGAATGGAAAGGATGAAGTCAAGTTAACATGTATCTTGGATGAGGAAGAAACCTCCAACTTCCGTGATCGTCTTCTTCCTATTATCATTGGATTGCTTAGGACCGCCAAGCTTCCCTCTGTGTTGAGGTTATATCGTGATGCAGTTACAGTTGATATGAAAACTGCTATTAAGAATGCAGTGGCAGAATTACTTCCCGTTCTTCTAGTCAGACCTCTAGACTCAGATTTTGCACCGGGAGAGAGAACGAAGGATACAGATGGTGGAGCATCACTCGCAAGCAAGCTGAGGGGCCTGTCATCTGAAGGTTTTGTTCAACTTTTAAATGCCATTTTCAAGATTGTACAGGTACATTTGGTGCGTGCTGCAGAAGTGAAAAAGTCTATCGAATGGATTATGTGCAACCTTGATGGCCATTATGCTGCGGATTCAGTTGCTGCTGCAATTGCTACAGGTGCTGCAGCTTCTGGTACAGCTCAAGATAGTGATAACCAAGGTGGTTTGCCTCTTCCTCATGTACCTCAGG
GTGCTGCCAAGGTTACTTCCTTACAGGGAAAAGCAAATGATGCGGCAAACCCTTCAAACATGTCTAGAAATTTCAGGGCTGATGTACTGCGAGAAAATACGGAAGCTGTTTTTGCAGCTTGTGATGCTGCTCATGGAAGATGGGCTAAACTCCTTGGTGTTCGCATTCTAGTTCACCCAAAGCTGAGGTTGCAGGAGTTTTTAAGCATATACAACATTACACAAGATTTTATAATGGCCACTGAAAAGATTGGTGGAAGGTTGGGATATAGCATTCGTGGAACTTTGCAGTCCCAGGCCAAAGCTTTCGTTGATTTTCAGCATGAATTTCGTATGACAAAAATAAAAGCAGTGCTTGATGTTGAAACATGGGTTGAAGTGGATGTTCCCGATGAATTTCAAACCATAGCTGAATCACTATGTTTTCATGAGCTGCTTTCTGCAAAACTTGATGATTCTCAGGGTAATATGGATCAAAGCTACAGTGATGTAGCTACAAATAATGAAGATGCACGCATTATAGGTGGTGTCAATGCTCAACAGCACTCTGAACAGGTTGATTCAAGTGACATTTCTGGGAGGAATACTGAACATGTGAAGCCTACTCCTGCAGATACAATTGAAAACAGTAAAGCTGATGTTGCAATTCCTGCGACACAAAATAACAATACTAATGTGAAGGAACGTGGAAAATCAAGTTCTCTGACTTTGCAATACAAAGGCGTTGGTTATCACATGGTTAACTGTGGGTTGATCTTGCTCAAGATGTTGTCTGAGTACGTTGACATGAATGATTCTTTGCCAGCACTATCTTCTGAAATCGTTCATCGTGTTGTGGAAATTCTCAAGTTTTTCAATACAAGGACTTGTCAACTTGTTCTTGGAGCTGGTGCTATGCAGGTGTCTGGTTTGAAGTCCATCACATCCAAACACTTGGCTCTTGCCAGTCAAGTTATCAGTTTCACCTTCGCCATTATTCCTGAAATGAGAAGAATCCTTTTTCTCAAGGTACCTGAGGCACGAAAGACACTATTGCTCTCAGAGATTGATCGAGTGGCTCAAGATTACAAAGTTCACCGAGATGAAATTCATACTAAGCTGGTCCAGATAATGAGGGAAAGGTTGTTAGTACATCTACGTGGCCTGCCGCAAATTGTTGAAAGTTGGAATAGACTAGAGGATGCTGACCCTCAGCCCAGTCAGTTTGCTCGATCCCTTACCAAGGAAGTTGGGTACCTTCAGCGTGTTTTATCTCGAACCTTACATGAGGCTGATGTTAAGGCAATATTTAGGCAAGTGGTCAAAATCTTCCATTTACAAATTTCTGAGGCATTTTCACGGTTAGACATAAGCACCCCTCAAGCAAAGGACAGGTTGCTTCGGGATGTTAAGCACATTCTTGGCTGCATAAGATCTTTGCCTTGTGATGATTCGAGTAAACCTGACATCCCAAACTGGGGGCAACTTGATGAATTCTTGGACCAGAGACTCGGATCTGAAGCTGGATAATGATGTGAATGTGTATTTTCCATTGTTTGCTTTTTTGATGAAGGGGGTCATATTTGAGGAGTAAATAACAGGATATCAGAAGTCAATTTTCAACCTATGTCATCTCCCTTGTACACCTAAAAATCAAGGTTTTGCGATTCTCATGGACAGGCGTGAAGTACAGTTTGGGATTCAGATATTTCAACGAAGTTGGGCCTTGCCCTTTTTGCTGAAACACATAACATATTATATGTTGTATTGGCTAGGCCAACACTTTTTGCTGCCCTAATTGTAGTTATGTTTAGAGAAAGAACAGATCAATTTGTTTACTCGAATAGATTTTAGTTCCTTGCTTTCTTTTCTTTCCCCCCCTTCAATTTTTATGGGCTTTCGTACAGTTACGCATGTTTGTACTTTGTAGAGCTAAATTTGTCATTATTGCCTATAAATAATTTTGCTTA\n>XR_005523613.1 PREDICTED: Hibiscus syriacus 
uncharacterized LOC120200931 (LOC120200931), ncRNA \nAAGTAAAATCAAAAGATTCAAACATTGGAATATACACTTGATCAAAAACACACTAACCCTTTTTTACAAATCTTTCTTCTTTTCATCATCTGACCCTTACCTCTTTGTCCCAGTGTCTCCTACGGTGAAACTTCGGTATCTGGGTTTTACCTTTTTTCTTTTACCAGAGATAAAATTTCACTGCTTTGGATCCGCCCCATACCCCTACTTTTTACCCTACCTTCCTTTCACCCTTTAAATTGCTAGACGATCCAAGCTCGCCTAAAGAAAGAAACAAGTGAAAGAAGAAACAAAATTTTCTAACTCTTTGAAAAGTTGGGTCAATCGCCAGTACATTCCAACACTTGTTTCTCTCTGGCAGTATGGATGATTATTACAGAAGGAACCATGTTCCAGCTTTTGGTAGCTGGGATTGGAACAATGACCTTCCTTTTACTCAGTGTTTGAATCGGCTCGGCAAACCGGATTCCTTCGTTATAGCTACGCCGAGGATCGTGATTTATACGTCGCTGGCGATCTTTATGAGAACGATGTCGTCACTCCCGCCGTGATTGTCGTTCCTCGTAAAAGGACAAAAGTAAGACAGTCGCATGTTAAAGACGGCAAAAAGCAAGAATGGGAGGTCAGTGACGTGAAACAACCGGCATCGGCAGCAAGCCCCATTCCCGTGTCCAAGCCAACTCCAAAACCCGTTGATGAAGACCTTTACAAAATCTCGCCTGACCTACTTTACACTAAAACCAAAAAGAAAAAAAGGTTGAGCTTGTTCTCATGCTGTTTGGTGCCAAGTTGATCATCTTGGAGGATTACGTAAATATAGTTCTTTTGATCCGTCCCTTCCCCTTGGTGTACTCAAGGGT\n>XM_003231613.2 Trichophyton rubrum CBS 118892 uncharacterized protein (TERG_07960), partial mRNA \nATGGCACCATACACCAAGGTACAGGAGGCGAAAAACAGCAACGGTCAGGCAACAGGGCCTCCTGGCCCTCCACCAGCCGCAGTCCCTCCTCCGCCTGCTGATCTACCACCAGGGGCCGTTCAGCAAAAGCCTGAAGCCGCTGTCGTCCCGGCTATTGTGGTCCGGGACTGGACGAACGAGGACAACGCCCAGTTGAAGAAGTTGAAGGAGGACAACATCAGCTGGCGGAAAATCGCAGAGACGATGAACTGGCCGGTCCACGAGCTAAGGGAACGATGGCGGGCCATCAAGCCTGAGCTGCCTAAGAAGTCGCAGCAAGAGCCAGAAAAGGTCAAGCAAGACGGCGTTCAGGAGAAGCAAGTCGTGTTTATGGAGTCAGTCAAGGAGAAAAAGAGTAAAGAAATCCCAAAGGTGGTATATGCAGACGAGAGTCTGAGTACAGAGGAGGCCGTCCTGCTCAGCAAGCTTGCGGACAAGTACGACAAGGAGATGTGGTTACGCATCTGCTCCAAGTTCTTTGACAAGACCGGCAAGCGACTTGATCCAGACGAGGCCAGACGGCACATCCGTCCGTCATAA\n>X84340.1 H.sapiens mRNA for Ig light chain, variable region (ID:CLL001VL) 
\nCAGTCTGTGCTGACGCAGCCGCCCTCAGTGTCTGGGGCCGCAGGGCAGGGGGTCACCATCTCCTGCACTGGGAGCAACTCCAACGTCGGGGCAGGTTATGATGTGCACTGGTACCAGCAGCTTCCAGGAAAAGCCCCCAAACTCGTCATCCATGGTAATAGCAATCGGCCCTCAGGGGTCCCTGGCCGATTCTCTGGCTCCAAGTCTGGCGCCTCAGCCTCCCTGGCCATCACTGGACTCCAGTCTGAGGATGAGGCTGATTATTACTGCCAGACCTATGACAGCAGGCTGAATATTTGCGTGTTCGGCGGGGGGACCAGGCTGACCGTCGTAG\n>XM_033723222.1 Mytilinidion resinicola uncharacterized protein (BDZ99DRAFT_493278), mRNA \nCGCGTTAGTCTGTCCACGTCGTCACTCGAAATCTCTTGCTAGGCTTGCTTGTTCGCACACTTAAGCTGCTCCTCTTCAGCGCTCTCGCAGCACCCCGAAACGCGTCAAGATGCAGCCCCTGGAACGAAGTGACATAGACCCGCATGCCGAAAGGACGCTTCATGCTCAGGGTAGAGGAGAGAAAAGAAAGCTTCTAGTGCTATCCGAAGACACCCTTGAAAGACATAACAAGTGCTATCGAAAGACGAATGAAGCCTTCGGAAAGTCCGCCATTCGCCAGGAGGGGGCGCTGGCTTACGAAGAGGAAATGTATCATCTGCACTACGGCAAAAAAGTCGTAGCATTGCACGACGGATTCGTGCCTGGGCCCGACAAGAGAAGCATGCCGCCGCCGTCGCCGCCATCCGCCAATAACATGAACATATACAGCGCAACGCCCTCGTCCGAGACTCCGATGCGTCGCTTCATGTTTCCAAGCACGGCTCATGACGCCCAGCCATGGCTGGCACGAGGGATGCTTGAAGACAGCGGAATAGGCTGCGGCGACCTAGACAGCCTCGAGTTGAGAAGGCTGGCAGGGCAGGTCATAGTTCCTGACGAGAATGGAGATGAGACAGAGGGCAGCCTGTGTCCTTCATCGCCCACTCTGTCGAATGCGCAAGCGATGCGGGTGGTGAAAGAGAAGCAGGAAAGGGGATCTAAAGAGAACCCGCGAGTCCGAAAATTGATAAAGAGACATCGGGCGCATACTTCTAGAGATGCGCAGGATTCAGGGAATACCCCCGAGTAGAACAGGCTAGAGGCGGTACACCACACCACCTGCAGGCGGCTCTATGGGCTCAAGCTGCCGGCAAATGGTGTCGAGACGAGGAAAGATGTATGTACCTACAGATGCGGTGGATATCAGAAGTTTCGGGTTTTCTAGTTCGTCTTGCTAGTATGGATAGGCAGCACAGGCAGTCAGGCATGGTATACGATTAAATGAGAGACTCCAAAACTGGTGGGAGCACGACGCTTTTGAAGACTTCTAAAGCCACAACAAAGACTGCAC\n>XM_042379977.1 PREDICTED: Homarus americanus putative transcription factor capicua (LOC121875420), transcript variant X2, mRNA 
\nCTGGCTGCCATAACTCTTCCCATGCAGCAGTTGTCTCCATCTCAACAGCTTCAACAACAACAGCAACAACAAGTACAACAACAGCAGCAGCAGCAGCAGCAGCAGCAGCAGCAGCAGCAGCAGCAGCAACAGAAAGTTAAAGCCCAGGTTGCTAGTATACCTGTAGCAGTGCCAGGAGGAAGACCTTTAGACGACGAAGAATTAGACGACAAACCAAAGTTTATTTTGGCTCCTACGCCGGCACAGCTCGGCAAGGCCCCTAGACAAAAGCGACTCAACTCTTCAGGGCAAATATCATCTATAGGAGACACTGCACCACAGTTATCTCCGGACGTAAAGATGGCTCCTCCGCACCACCCCAGCGGAGACAGTAAGGTATCTCCGGTGTTGAGTAATGCTTCAGAGGGCGACTCATCAGTACAGACGACCACCCAGCAGATGGTCTCTGTTCCACCATCACCTAGTGAGAAGAAGAGTTTCTTTAAGAAAAATATTGAGGATGGCATGGACAAGGTCCTTGAAGAGGTGAATTTCGAGCAGAAGTTCGGAGCGCTGCCCGAGTTTAACCCTGACGAGGTCCAGTCCCCCAGTGTCAACGCTAGCACTGGGCCCTCCGTACCTTCCTCCCCGCGGACCTTTATTACGTCTTACAGGAAAAAACGTAAACATTCCAGTGGTGAAGAGTCAGGCTCAGATACTCCCATGAGTGTCACCCCTCACCAGACACCCTCACTGACACCCTCCTCCACACTGCAAGGATCCAAGTTCTTTCCTCCTGATTTCAACCCAGAGACTTTCAAGGTTGGTGAGTCTCGGGCGGACAAGTGCGAGATAGAGTCACCTGCTGCAGGAGGCCGTTCACCCAAGACTCCCAGAGATGCGGACAAGAGCCATTCATCCTTGAGGCACATCCTGGATCAGAGGCGCACCCTTGTGATGCAGCTCTTTACTGAATATGGCTGGTTCCCATCTGCCCAAGCCGTCGCAGCATTCCAGTCTCGATACTCGGACATCTTCCCTACCAAGAACTGTCTGATACTCAAGATAAGAGAAGTACGTCAGAAGGTCCACCAGAACACACCCAACACACCTGGTGTACCGAGCAGTCCTAACCCGGCCACACACACTGGGTCCTCCTTACAACACCCCCACAACAACCACCACAAATTTCTGGTTAACCAAAAAGAATGTCGTGGCCGAACCATCGTACACGATCATCTCTCACTGCCGCTGTGTCAACGTCAAATCAAGCCACCACTTCCCTCCCAGTCGGCACATAATGCCACATCTCGGCTAGATTATTAATTTTACTGTGTTGTTTTTTTATTTTTATTTATATTTTAACCAATGGCTACCCAGCATTACTACATAATAATAACATTGGCATTTTACTACTGTTAAGAGTTGAATGTGTACTTTGTATAAATTAGCGACAGTTA\n>XM_004341098.1 Acanthamoeba castellanii str. 
Neff uncharacterized protein (ACA1_236710), partial mRNA \nATGCCGCTGCCGCCGCCGGCCGTGGTTGCTGGGATTGAGGGCGCCGACGCGGCTCGCGGGACGCCGCCGTGGGGACCGCGCTCGATAACCGTTCCAGCCTTGACCGTCTCGCGCGGGTGCGGCTCCGACGTCGTCGTCGACCCCGGGGCGTCGCCGCCGCTCTCCTTCCTGCGCTTGCGCTCCTCCTCGATGAGGCGCATCTCCTCTTCCTTCTTGCGCGCCGCCTCGCTGTCGGCCCGCTCCTTCTCGCGCTCCTCCTCCTCGATCTTCTTCTTCCAGTCCTCCTCAGTGATCTTCACGCTGCGACGGTTGGCCAGCTTCTGCTGCTTCTCGCGCTCCTCCTTCTCGCGCTTCTCCTTCTCCTCCTGCTCGACCTTCTTGCGCCACTCCTCCTCGACGTTCTTGCGTGGCGTCTTGGCCAGCGCCTCCTCGCGCTCGATCTCCTTCTGGATCTTGTCGTCCTTGGGCTCCTCGCCGCTCAGGAACGCGCTCTCCTGCTTGCGCTCCTTGACGGCCTCGGCGATGCGGCGCATCTCCTCTTCCTTCTCGCGCGCCTTGTCGCTCTCCCTCTTCTCGCGCTCCTCCTCCTCGATCTTCTTCTTCCAGTCCTCCTCAGTGATCTTCACGCTGCGACGGTTGGCCAGCTTCTGCTGCTTCTCGCGCTCCTCCTTTTCGCGCTTCTCCTTTTCCTCCTGCTCGACCTTCTTCTTCCACTCCTCTTCAACGTTCTTGCGTGGCGTCTTGGGGAGGGCCTCCTCGCGCTCGACCTCCTTCTGGTGCCTGTCGTCCTTGGGCTCCTCGCCGCTCAGGAACGCGCTCTCCTGCTTGCGCTCCTTGACTGCTTCGGCGATGCGGCGCATCTCCTCTTCCTTCTCGCGCGCCTTGTCGCTCTCCTTCTTCTCGCGCTCCTCCTCCTCGATCTTCTTCTTCCAGTCCTCCTCAGTGATCTTCACGCTGCGACGGTTGGCCAGCTTCTGCTGCTTCTCGCGCTCCTCCTTCTCGCGCTTCTCCTTCTCCTCCTGCTCGACCTTCTTCTTCCACTCCTCTTCAACGTTCTTGCGCGGCGTCTTGGGGAGAGCCTCCTCGCGCTCGACCTCCTTCTGGTGCCTGTCGGCGCTGTCGTCGTCGGGACCCTTGAGGAACGCGCTCTCCTGCTTGCGCTCCTTGACGGCCTCGGCGATGCGGCGCATCTCCTCCTCCTTCTCGCGCGCCTCCTCGGCCCTGTCGCGCTCCTTGACCTCGCCCGTGAACATGGAGGCGATGCGACCCACCTTGGCGTTGCGCGCCAGCTGCTGTCGCTCCTCCTCCTTCTTGCGGCGGATCTCCTCCTCCTTGGCCTTCGATCCGCCCTCGTCGTCGCCCGACCCGATCTTGTTGCGCCACGCCTCCTCCTTCTCCTTCTGCGTCTTGGGCTT\n>NM_001302118.2 Gallus gallus CDC28 protein kinase regulatory subunit 2 (CKS2), mRNA 
\nAGTCGTTAGGGGGTTTGCGGGCAGATAGTATTGTGCCTAGAGTTCCGCCACTTTTTGCCATGGCTCACAAGGATATCTACTACTCCGATAAGTACTTTGATGAGCAATACGAGTACCGGCATGTAATGCTACCAAGAGAACTCTTGAAACGAATGCCAAAAGCTCATCTTCTGTCTGAAGAGGAATGGAGAAGCCTTGGTGTTCAGCAAAGTCTTGGATGGGTTCATTATATGATCCATGAACCAGAGCCACACATTCTTCTCTTTAGAAGACCTCTTCCAAAAGATGATCAGAAATGAACTACTGTCTAGAAATATTCTTAATCTTCTGGAACTTTGTGTATGCATGTATATATGTTGGTAGTATTCAGTGAATACTTTATGTACAAAACATACAACTGTACCTGTGCATGAGCTGTATTATTCACAGCAACAAAGCTCAGTCAAATGCAATTTCTAGTAGGCTGCTATTCTTTCAAAGAGAAGTGGAACTTCTAATAGTTCCTCTTAGTCTGAAATGAGTTCTCTAATAAAGTTTACTATTGTG\n>XM_032261620.1 PREDICTED: Sapajus apella otolin 1 (OTOL1), transcript variant X1, mRNA \nGGTCTTTTCATCTATTCTGGGTATACTGATGATCTCTTAGGAGTTAGACAGAAGTAAGAGAAGTGTATTGTTTTATAATCTAGTAATAGCCTCTGGTTGCAGATCTTTCCTAGGAAATTTGAAAATGTTTTTACTCCTTTATGAAATAAAAATTTTAGTTTTATTATATAAGGCTTTGTAGTTTGGGTTTATCTGAAGTAAGCCACCCATTCACTGGCATTGAGAAAGACTGTGGAATGGTTTTTGTGGTCACATGTCTTTTGAATCCAGGTTCGCTGGGCATATATCCTGGCTCTGCTAAACTGTATACATGACCTTGGGAACTTCCTTTACATTTCTTGGTCAGTTTCTTCATTTGTAAAATCAGTCTGGCAATAATGACTACTTCTTAGCTGTTTAAAGCATTTAGTGAGTTATTGAATGTTAAGTGCCTGACTCTTGCTTAGGACTCAATAAATGTTAGATATTACTATTAGTGACTACTGTACAATGAAATAAGATTACCTACAACTGTGAAGATAACTAATTAAAACAATAATCAAGACTGGAAAACATATATTTATTGTGTACTATATAAAAACATTCCATCAAGATAGAATAAAGCTATGAAGTCAGACAGATACAGGCTTGAAAATTTGGTATGTGTCATACTGCAGGTAACTTAGCTGTTCCTGAGCCTTGGTTTTATCTTCAAAATGGAGACAATTCTGCTTTGGAGGACTGTTGTGAGCAGAAACAAGAACATTTGGAAGAGGCTGGTGTACTCAATACAAATGGCTATTATACTTTTTATTGCTACTTGCTTTTCTTGAACTAAATTTTAAATAGCAACTCCTCTTTTTTATGGAAATCTAGGGAGTCTGATTTAGAGGAAGTGAGTACATGCTGTAGAATGGCCCATATGCCATTTTGCTATTAGAATATGAGTCATTATTTCTAAACTTAGTATTGCTTTATTTGTATGTTCCTTGCTTTTCTCAGAATCCCTAAGTCAGATCCAACCATAAACTTTGGATCATAAAAGAAAGCAACTTCAATTAAGTGGATTTTTGGAGTCACTGCAAGTCACTCATATGAGGCTGTCTGACCAAGCAGTGATGTAAAGAGGGCTAATAGTATTTCAGTGAGCAGCTCTGGCATTTTATGTTTGTACAGAGTGCTTCTACTTAACGAAAGTTTTAAATTTGTATTATCTTTTGTATTGAGGTACAATTTACATATGTTGAAATGTGTAGATCTTAATTGTGCATTCCCTCAGTCCTGACAGATACATACACTTCTATTAAGATACAGAATATTTCCAGAAAGTGTCCTCGTGTCCCTTCTCAGTCAATCCTTTCTCTTTTCCCATGCAACCACT
ATTCTGATTCCTATTGCCTTTGGTCAGCTTTTCTTGCTGTGGAACTTCACATAAATGGAATCCTGCAGCCTTTTGTGTCTGTACTTTTTTCCTTACCATAATGCTTTTGAGATTCAGCTGTATTATTATATGCATCAGTATAGTTTATTGTTGTTGGTGAGTAGTATTCCATTGTATGGATATACCAAAGTTTGTTTATCCATTTTCCGATTAAGAGACATTTGGGAAATTTCTGTTACTTCTTTTGATCATTATTGTAATGTTGTTGGAAGGTCAGAAGATTCTACTATCTTATTCTCTAGATTAGGAAGCTGGGATTCAGAGAAGTGAGACAACTCAAGGTAAATGGGGAACTCGAGAAGAGAACCTGATTATCTGGGCCCAGATCCTCTGCTTCCTTTACTTTCTATTTTCTGAGCCCAGGTTATTTTTGGCCCTGACTAGGAGTTCTGCCCTGTCTGACACCAGGATTTGACCTGACCTGTCTTATCTTTGATGGAGAAAGACCTAGAATATCAAAATTTAGGAATGTAGCCCTAATCTGGGCTAACCCTTGCCTAAGCCTTAGTTTCTTTCAGGTGCAGTGAATAGACTTCTTAGGCTGGCTCAAAAGTTGAGCAAGTAGAGGATCTGGATTACACCGGTTTAGATTACAGAATGCCTGAAGATATTCTAGGAGAGCTTTGTCTTTCATAGTGGCAAAGGGGAAATAGGATGAACATGGAATAAGATAAGCGTCTCTTAAATCCTAGCTCTGCCACCTATTAGTTGTGTGAGGTTGGGTAACTCAACTCTCTGGGTCTCTTTCTCCGTCTGTAGAAGAGGTAGTACAATGCTTCCCTCTCAAGTCTCGGCAAGGAAGTTCCTGACACAACCTGTCCTTTCTGTGCTCGATCAAGGTTGGAATTAAGAGAGCATTATAATATGATATTGATATTGCTGTGGGATTTTCATTGTATGGAAGAATGAATTCTTCCCTTTATCTCAGAAGACAATTCATTATTTATAGAATCTGAATAAAAATAGAAAAGTTAATTTGTCAGTAAAGTCCTCATAAAAATAAAGCAAGAGAGGGGCAAAGAGGAATGTGTTTACTTTAAGACAGCTGGAAAAATGAATATAGGTAAATAGGTCCTTTGAAGACACTCTCTTCCTTCTCAGGAAAAAGGCAAACATATTTAGAAGGTTAATCCTTGTTCAGGATGCTGATTAGGCTGTGTGGTTAAATAAGGTCTGTAGGAGAACCAAAAGGAAAAAGGATCTTAAGGGAACCCCATTCCTGCCCTATTATGGATTTAATGAGGTCTCTGGGTCACAGTTTCTCCATCTGTAATCCCTAAATAGCACTTTTTAATCACATATCTCAGGATTTGATGTGAAATTTGATGTGTTCAATTTTCTCATAATTTATATAGTTGCAAAAATTTTGCATAAAAAGAATAGTATTTATGTGTATTTTATGTAATTTAAGGCAAAGTATGCTGTCCAAGAAAATCTTACAGTTTATGAGAAGATTGACATGTGAATGACTTAACAGCAGAATACATTAAATGCTTGTCATAACAAAAATTGGCAGGAGTCTTAGAAGAACCTAGAGTTAGATGATTAGCTTGGTTCATAAAAGCTTCTAAAGGAAATTTCAAAGACTTAATGACATCACTGAACTTTTCCAACCAATATTGAGAGAAGCTGGTATGAAATGATTCAAGGAGTATTTACTGCTCTGCAAAACAGCTTTGCCTTTAATGTTTCCCAAGAAAAGGACATACTTGTAAAGACTTAATGCTTGTCCTAGAGAGGAAAAACAATTTCAACAGTCAGGACATCAGAGTGGTGGAAAGTATTCATGCAGGAAACTGAATGATGTACTTTATTTGTGAATTTTCATAATTAGCATTGAAACACCGCTACTTTGCTGGCTCAGCTTTTTAATGTATCAGATCCTTTGTGTGTAGGAAGAAAGAAGAATAAATGTGTCTCTGAATGTGGGGTGCTCTCTT
TTAATAAAGAAACTTGAGAGAAAAGAGACGACAATAGGCAAATATGAAATAAGTTAAAAGAAGTAGGCAGAAAATAGAGAAAACTGCATCTCATGCAGTTGACGTTTATGTGGCAATTGCTTGGTTTGGACTTTTTGTCGGAGAACTTTTTTTTCAGAATTTATTTTGTGTATCACTAGTAAGTGTTGCATAATTTCCATATTTATTTATACTATGGGTCTGTCTCTCCTTCCAGACATAAAGGACACTTTGAATTTCAGGTGATAATGGAGCATACAATCACAGCAATCATATGATGAAAGTATGATTATTATTTTTATTGTCCCTGTGTTACAGGTGAGGAAACCGAAGGCAAGAAGTTGCCAAGTTTAGACAATTACTACTCACTCTGTCTCATGACAGCTGGATCAGAAGTGGGCAACTGATGGAGTCTGGATCCATGAGGAGTTCACGTTGCTAGAAAGGGTGGTGACCATGACTCCCTATTCTTAGGGGTGGCAGTGATTGCAATGCTTCAAAATTCAAAGGAGGTGTCAAAATGGAGGGTAGGGAAAAGGCGTGAGCTCTGCCTTCCCCTTGGCAGTGGCGAAGTGATATGGAGTGTGGGCAGGGAGGTGGCGCATTATAGGACTCAACACCACGCTCGTTTATACATAAGATTCCTACCCATTGGATCACTTGAGGAAAGGAGTTCAAGACCAGCCTGGCCAATATGAGTTCAGGCAGAGGACAATATGCAAAGATTGGGAACTAGAAAGAAAACAACATGCCTGTTTATTAAATGATTATAATTACCAATGTACCAGTTATTGTCTGGGAGTACTCAGGCCTATACCTGTCTTGTACCAATGGGGTAGAACTCCTGAGAACTACCTTCCCAAGATCCCCTTGACAGCTGGTTTCCAGCCTGGTTCTTCTAATGGGCTGGACTCCTATGTAATGAGAGGGAGATGGCAGAAGTAACTTGAAGGTCCTAGACTTCTGGTCCCAGCTGCAGAGCTGACATGCACCTGTGAATGCTTGCAAGGTTCCAGTGGCAGCAGCAGTGAATGTGTGCTCTGTGATGGATGCCCATTGTTTAGGGCAGACCAGTGTGGCCTCCTGCAGGTCCTGGTCCCTGAGAGACATTACTTTCCCCTCATGTCTCCTCTAGGCCTTCCCCTCGTGTCTCCAACAGTGTTGTAGGTTAACTCTCTGGATTAGATTCTTTTCTGTTTTGAATAATTAGAGTGCTTTCTATTTTGCTGATTGAATTCTTGACTGTTATCCCCCTATAATATGGCTGTTCTGGCAAGCTAAATTAGAGGACAGGAGAGCTATAAGGCCAGAGGCTTGAATAGGCTTTTTCAAAACTAAGATGACTGGAACTGAAGAGAAGATTTTGAGCAGACTTACCTTCCCTGTCTAGGGAGGAGCTGCTGGAATGCAGAAAATGTTATGAACTTGCTCCAAAGAACCAGAACCACATATACGTGCTAATTAGACTGAAAAACAGAATAGGAGAGAAACACCAGAACATGGCTGCAAGCCCTTAAGAAAAAGCAGTCTTATCTGTTCATAAAATGCAGGATAATGACCAATCCATTGATCATCATCTCCTTCTTACAGGAGGAAGAGTAAGGGGAATGGGTGGAAGTACCCAACATGCATGGGGAGAGCTGGAAACGTCTGCCTCTGAGCTGTGTTGGAAACCTGAGAAGCCTCAATTATGTGGATGTTTACTTGGCTTTGTGCTATTTTAATTATTTTGGCTATTGCTGGTATGAACACAATAGCAAAGACCACACCGTATACCAAATTTACGAAGAAATCTGAGGAAAGAGAGATGCCAAAGGGTCTAAAGCCATCCAGTGGCCCACCTCCACAAGAAGAAGAAACCCTCTTCACAGAAATGGCTGAAATGGCAGAACCAATCACCAAACCCTCAGCCTTGGATTCTGTGTTTGGCACTGCCACTCTCTTTCCCTTTGAAAACTTCACTCTTGACACAGCTGATTTCT
TTTTGAATTGTTGTGATTGTTGTTCACCTGTACCTGGGCAGAAAGGAGAACGTGGAGAGACTGGAAAGCCAGGCCCTAAAGGAGAGACTGGGAATTTGGGGATCCCAGGGCCACCAGGAGTTGTTGGGCCCCAAGGCCCTAAAGGCTACAAAGGAGAGAAAGGGCTCAAAGGAGAACGTGGGGACCAAGGAATTCCAGGATACCCAGGAAAACCTGGAGCACAAGGTGAACTTGGCCCTAAGGGAGATAAAGGAAACACTGGTTTGGCAGGAGTGAAAGGACAAAAAGGCTCCAAGGGAGACACATGTGGGAATTGTACCAAAGGCGAAAAAGGAGACCAAGGGGCTATGGGCTCACCGGGCCTGCACGGAGGGCCTGGCACCAAGGGAGAGAAGGGGGAGATGGGGGAGAAAGGCTACTGCAGAGATTCTGGGGAGAAAGGAGGAAAAGGACAGAAAGGTGAGGCAGGTATAAAAGGAGAAAAAGGTTACAAAGGGGATAGTGGAATGGAAGGCAAAAGTGGTCACAGTGGTCTGCCTGGGGCCAAAGGTGATCCAGGGGTTAAAGGAGAAAAGGGAGAGTTAGGTCCTCCTGGTCTCCTGGGACCTACTGGGCCAAAGGGTGACATTGGCAGTAAAGGGGTCCGAGGCCCCATTGGGAAGAAGGGCTCTCGGGGCTTTAAAGGCTCCAAGGGTGAGGTGGCTAGAGTGCCACAGTCAGCTTTCAGTGCTGCTTTGTCAAAGCCTTTCCCTCCTCCAAACATCCCCATCAAATTTGACAAGGTTCTCTATAATGACCAAGGGAGTTATAGTCCTGTCACTGGGAAGTTTAACTGCTCTATTCCTGGGACATATGTTTTTTCCTACCATGTAACTGTGAGGGGCCGACCTGCTCGAATCAGTCTGGTGGCCCAGAATAAGAGGCAGTTCAAGTCCAGAGAAACTCTGTATGGTCAGGAAATAGACCAGGCATCTCTCCTCATTATCTTGAAATTAAGTGCAGGAGACCAAGTCTGGCTTGAAGTGTCAAAAGATTGGAATGGGGTGTATGTCAGTGCTGAGGATGACAGCATTTTTACTGGGTTTCTTTTGTACCCAAAGGAAACTTCTGGAATTTCACCATAAGTTTATGTCTTCAATCTCGTAGTTTAGATTTAGTGGAATAGGTCAATTAACATAGACTAGTGCTATTAAAAAAAAACTTCAATTTTTTCAAGACTATAAAAATAATGCAGAAATTTTTTTAAAAAATGTCTCTTGGAGTCAATTGTTATTTCTATTTTAAGGCACCTCCTTTAAAAATACTTATATATATTTCAGAACATATGTCAGTAACTTTGTAGCTAGGCTTTAAAATTTAGCATTATAATATCAGCATTATTCATGCCATTTAAGTATAATAATAATATCTGTATACAAAATATGAATGAGATTTATAGTTAATAAATATGTTCTTACTAAATATCTTCTATATCTCAGATAAATGTATGTCACTTCTTTTTGTGTAAATTGCATAGTATGACAGCAAGGTTTTGACTCTCTTGGATGGGTTGCCTTCTGACAAAATGGAACTCCTCTCATGTTGGTTTAATTCATGGAGATGACAGAAAGAGTGGCAAAGACTAGCTAAAGGATATTTAACATTTATCAGTGTCTAAAGGTTTGCTCACAAAACTTGTATTATATGGACTTGTGTGTTGGGTAAAATGTAAGAAAAAGTTGATAATCATAGTGAAGATGAAATCATTAATCAAATTATTGTGCTTAGAAGAACTGAATGTCCCCAAAAGAATAAAATGAAATCATTATTGATTTG\n>XM_007480608.2 PREDICTED: Monodelphis domestica spermatogenesis associated 1 (SPATA1), transcript variant X3, mRNA 
\nGGCGGACGGTGGAGGACGGGCGCGCCTCGGGGGCGCGCGCACGTGCGCGCGCGGCTGGCTCGACGCCCCAACCCCCCTCCTCTTCCTCCTCTACGCCTTCCTTGAGAGAGCGAGCGAGCGAGCGACCGGGAGGGAGGGGAGCGCTGGCATTTACATGACTTGAAGACAAAAGATGAATGGAATGCTATCATTAAGTCACCTAGAGGATTTAGTGACCCTTATCATTAAGTAATGCTTAAATGAAAAAGAAGACCACCAAGAAGCAATTAAAAGCAATTGTTACTTACTCAGGCATCAATGACTACGTCATTCAATAGAAGTCGACCTTCTTCATCAGAGTTGGTGGAACTTCATGTTTTTTATGTCCCTGAAGGATCATGGAACTATAAGCTAAATACTATTTCAGTAGAAGTTGTCAGTAAATTTATTTCAGCTGGATTTATAAGGGTGTCACCTCATCTTACTTTGCAAGCCCTGAGAGAGCAGCTGGGTGAGTTCCTTGGTGAAGAGGCTGTTGCAGAAAAATTCTTGTTTTTGAAATGCATAGGGAACAATTTAGCTGTGGTGAAGACAAAGCAAGAAAAAGAACTAAAGCTTAAGTCATTTGCTCCACCATATGCTCTTCAACCAGAATTATATTTGCTTCCCATAGTGGACCACTTAGGAAATATTTATTCATCATCATCATCCTCTGCTATGGGAGATACACAGCAGAATAATACTGATGTTTTTGAGAATGATAAAACTACTCAGAAACCAGATAGTTGTGCAGCATCTTCAAACAAGGAACATGAAAAAGATCCAAGCCCTATAGAAAATACTGATAAAGTTCCTCCCCTCAAGAATCAGGAAGAAGTCAGCCTAAAAGACAACAAGATTAAAAAATATCCAGCAAGAAAGTATGGATTTCTAGAAGCAATTGATGATAAGCGTCTTTTTCTTGCACAAAACAAAAAAAGCCAATTCCAATGGGAAAACGGAGACAAGATAACTGATACCAGTAGAAGAAAAGAAGATGGGTTAGGTGATGAAGATTTTGACAAGCCACCAGGTCCTTCTGCTCCTCCTTCATTACCACTCCTTGCTTTTGCTCCAGGAATGCTTGAAAATTCTGGTTTACAAAATGAGAAACCTGAGATGGAACCTTTGCCATGGAGGCAAATACTGTACAGCCACAAAGAAAGTAACAGTCAAGGACTCAAGATTATGCAACAAATGAAGCAAGTAAAGGAAGAAAGATGTCAGTTGGAAGAGACTAGAGAAGAACTGTTAAAAAGAGTTAAAAGTTTATTTGAACAAAGCAAAATGAAAAGATATCGTGTCCAGGAAGCTTGGAAGAAAAAATATTTTGAAACCAAGAAAATCACAGCTTCTTTGGAGGAAGTTTTAACCAAACTTCAAGAAGATTTAGAACTTTATTATAAAAAATTGCTCATGCAGCTAGAAGCTAGGGAGATCAAGATGCGGCCCAAAAATCTGGCAAATATGGAAGATTCAAAGAATAATCTAATAATCCAAATCACGGAGGTACAGCATGCAATTGACCAACTAAAGAGAAAACTGGACACTGACAAAATGAAACTCATGATAGAAATTAAGATGAGAAAACAAGCAATTTCAGACATACGAACATTAAAAATGGAACTGGAACAGAAGAAAATGAAGACACCTTTAAGCTCCTAGTCAAATGTATTTACTTAGAAGTGTCTTAGTTTTCAAAATGTTTAGACTTATTGGAAGACTGTCCATCCATTGTTCTTGCTGATGTTTCTTTATAAGCCTTGTATTTCTATTCCTTTATTTTTCATGCTGAGTTTATGAAGTGACTCACAAAATGTTAAGCACAGTATACTTCTCCAGTACCTGGAGGATCTGTGATTTTATCAGAGTGGGTGGTACCTCCACTGAAACAGATCATACCTCCTCCACAAGTTGGGAGATGGATTTTGAGAATAGCTTTAGTTTAAAAAAAAAAGGTAGGAAGGAAGGAAAAAAGAA
AGAGAGAAAGAAAGAGCAAAGTGGAAAGCTAAGTAATTTGTTCAGGGCATTATTTAGTTATTTTTGAGTACTTCAAGAAAACTGGATTTCATTTTACAGTAAAGTATTGCATTATTAAATTGCTGGGTTTAAAGATAATTCATCTAAGAATTAAGAATAAAGGCCTATTATTAGTCTTAGCAAACCACCATGTCTTGGTACAAAAGGCTACATTGATTTTTTTTCAATGTAACCTTGATAATTAAAAGAATAATCCTTTTATTTCATTTTAACTAAACAGACTAAGAATCTAAGACTCAGGAAATTGAGATTACCATTTGGAGCACTCAGAGGAAACTCCTGGGATTAGTATCCAAGAACTGACTTATTAACATATTTTAGAAGCATAGAATCCATCAGTAATTCAAAATAAGTTATGAAACATCATCCTTTTGAATGGATGTTCCAGGGCCTCTGCCATAAGCAACCTTGTAAATTGGGAGCAGAGATCTTAAATATGAACTAGACCCAGCAAGGATGGTCAAATTTTTACTTGCTTTTATTCTGATTTATGGGAAAAACCACTAAGGAAGCCTAGATTTCTATTAGCCCAGGGTTCACAGGAATAGGTTTGTGATGCCCCTAGACAGTTATACAGCCAGTGCCATCAAAATGGAAATAATAAATTTGACATTTTCCCGATGCCTATAATGTACCATATGAAAAAGCAGATAGTTCTGAAGTGAAACCTGGCTAAAGGTTTAGAAAAGTTATAAACATTAAACTACTGTGTTTTAGAAATAGAAACATCAGTTCATAAACTAATGTCATGAGGTTAAAATTAGATTCCAATGTGGGAAAATATTGTAAAATTTTTTTTAAAAAAACTAAGCAATAAGGTTGCCAATGAATAAATTACAGATGCACAGAAAAGGATCTTAGGAGAATTGTTTCATCAAGAATAGCATAAGAATAATATCAGATTATCCGCTAAGTTATCCCTATAGTAAATTTAATAATAATAAAATTCTTCTTGAAAATATCTGTCTCAAAAGCATAATTTAGCTAAAAATGTAGGCAACACCACCATACTAGTTTAAAAGATTATCTTTTAAATTCTCTAGGCCAACTCTGTATCTTTTATCTTAGAGTTACTTGTCTGAAGGTTTGGGATGAAGCAAAAAGCAAGTATCACAGGGCACTGAGGTGCTACTTGGAAATAAGAATCATTGACCCAACAGCCCATCCTTCTTTTAACAATACATTGGTCCTAAGGAGAAGACACTATATATCAACCAACTTTAATATTAGGCTTATTGGACAAATAAAATTACAGAGTGAATTGCTTCTCAGAGAATGGGTATTTAAAAAAAAAATCTGTCCTAAGCAAACTAGGCTTTCCTTTACAAGTCTTAGAGCATTTTGCATAGTTTATAAATATGTAAGCATACATGTTAATATCATGTACAAAAGACATGAACATAATAAAATTATGAAAATACCGGTTTATTAAGTGACAGATAAAACATCTTATAAAATAAAGAAGATTATTTCATACT\n>JN080695.1 Uncultured bacterium clone HI04_FZZ71GH04EJVXU 16S ribosomal RNA gene, partial sequence \nGATCCTGGCTCAGGACGAGCGCTGGCGGCGTGCTTAACGCATGCAAGTCGAACGAGAATCTGTGGAAAGAGGATTCGTCCAATTGAAGCAGAGGACAGTGGCGGACGGGTGAGTAACGCGTGAGGAACCTGCCTTTCAGAGGGGGACGAACAGTTGGAAACGACTGCTAATACCGCATAACACATTGAGGTCGCATGGCCTTAATGTCAAAGATTTATCG\n>XR_008021246.1 PREDICTED: Diospyros lotus uncharacterized LOC127792942 (LOC127792942), transcript variant X2, ncRNA 
\nATGGATTGGAGGGAGTGCTCCGAAATCAAAATATCTAAAAACAATTATATGAAACGAACGAGAATTTCGATACGATTATTATGACATCGAAAAAAATCTGATCAGAAACAGTTTTTTGGGCAGCTAAAAATCAGGCAGAAAATCGAATCGTCGTAATTCGTTCACAAAAAGTCAATTGAACACAAAATACAGTTTAATTTAGTTATTGGAACAACCTTTTGGTTGTTTAATGTTGAAACAAAAGTACTAGCGATCTTATCGAACAATAGGACGTAAGCGTAATTTCTTCATTTTTCCCGACTTTGCTCGAAAAAAGAAATTTCCTTTTTTTTTTTTTTGTCAATTTTCAATGGTGGAATGAAGATAATTTCATATGGTTTTAAGTGTAGTTTTATTTGGAAGTGTAATTGAAATATTCAAAAGATTAGGGGTTTAACTTGATTTTCGGTACAATTATGAGTAACCGAATGGATTGGAGGGAGTGCTCCGAAATCAAGATATCTAAAAACAATTATATGAAACGAACCAGAATTTCGATACGATTATTATGACATCGAAAAAAATCTGATCGGAAACAGTTTTTTGTGCAGCTAAAAATCAGGCCGAAAAGACGAATCGTCGTAATTCGTTCACAAAAAGTCAATTGAACTCAAAATACACTTTAATTTAGTTATTAGAACAACCTTTTGATTGTTTAATGTTGAAACAAAAGTACTAGCGATCAAATCGAACAATAGGACGTAAGCGTAATTTCTTCATTTTTCCCGACTTTGGTCGAAAAAAGAAATTTCTTTTTTTTTTTGTCAATTTTCAATGGTGGAATGAAGATAATT\n>XM_038964517.1 PREDICTED: Salvelinus namaycush extensin-1-like (LOC120020894), mRNA \nATGTCCAAACCCTTCCCCAGAGGCCTGCCCAACCCCTTTCTCAGAAGCCTGACCAACCCCTTCCTCAGAAGCCTGCCCAACCCCTTCCTCAGTGGCATGTCCAACCCCTTCCCCAGAGGCCTGCCCAACCCCTTCCTCAGAAGCCTGACCAACCCCTTCTTCAGAGGCCCGCCCAACCCCTTCTTCAGAGGCCCGCCCAACCCCTTCCCCAGAGGCCTGCCCAACCCCTTTCTCAGAAGCCTGACCAACCCCTTCCTCAGAAGCCTGCCCAACCCCTTCCTCAGTGGCATGTCCAACCCCTTCCCCAGAGGCCTGCCCAACCCCTTCCTCAGAAGCCTGCCCAACCCCTTCTTCAGAGGCCCGCCCAACCCCTTCTTCAGAGGCCCGCCCAACCCCTTCTTCAGAGGCCCGCCCAACCCCTTCCTCAGATGCCTACCCAACCCCTTCCTCGGTGGACTACCCAACCCCTTCCTCGGTGGACTACCCAACCCCTTCCTCAGACGCCTGCCCAACCCCTTCCTCAGACGCCTGCCCAACCCCTTCCTCAGATGCCTGCCCAACCCCTTCCTCAGTGGACTGCCCAACCCCTTCCTCAGCGGACTGCCCAACCCCTTCCTCAGATGCCTGCCCAACCCATTCCTCAGCGGACTGGCCAACCCCTTACTCAGATGCCTGGCCAACCCCTTACTCAGTGGCCTGCCCAACCCCTTTCTCAGTGGCCTGCCCAACCCCTTCCCCAGAGGCCAGCCCAACCCCTGA\n>XM_033401886.2 PREDICTED: Orcinus orca KAT8 regulatory NSL complex subunit 3 (LOC101288842), transcript variant X6, mRNA 
\nTATATTTTTAAAACTCCAGAACATTATGAAGTCGTTGCAAAACTTTTGTTTAACACAAACGAGACGTCAAGGGCTTCCGTGAGGCCCACGTTAAGCAGCTGTTCCTGGGATGCTCACGCTACTGCTGGAGACGGCTCTGGGAAGCTTTCGAGAATGGTGACTAGCATGCAGGTACCCGTTCTCTGACTTGCTGCCCCTCTTCTGACATGGCCCACCGCGGTGGGGAGAGGGACTTCCAGACGTCAGCGCGGCGCATGGGCACCTCGCTGCTCTTCCAGCTTTCGGTGCATGAGCGGGAGCTGGACCTGGTGTTTCTGGATCATAGCTATGCCAAGCCGTGGAGCGCCCACCCAGATGCCAGTAGTGCCCGCCCCACCCGCATGCTCTTTGTTACTCCCCGGAGGCAGCACGAAAGTACCATCGAGTCAGATGTCCCACTAGATGTGGAGACAGTCACGTCAACCCCTGTGCCACTTTATGACAATCAGAAGGCACGCAGCGTGATGAATGAGTGTGAACGGCATGTCATCTTCGCCAGGACCGATGCGGATGCACCTCCCCCTCCAGAGGACTGGGAGGAGCACGTCAACAGGACTGGCTGGACAATGGCCCAGAACAAGCTATTCAACAAGATCCTCAAAGCCCTGCAGTCTGATCGGCTTGCCCGCTTGGCCAACGAAGGGGCTTGTAACGAGCCAGTGCTGCGCCGTGTTGCCGTGGACAAGTGTGCGAGGAGAGTGCGGCAAGCTCTGGCGAGTGTGAGCTGGGACACCAAGCTGGTCCAGTGGCTGCACACCACGCTGGTGGAGACCTTGAGTCTGCCCATGCTGGCCGCCTACCTGGATGCTTTGCAGACACTGAAAGGGAAGATCCCTACCTTGATTGACCGGATGCTCGTGTCGTCCAACACGAAGACCGGGGCTGCTGGAGCTGAGGCCTTGTCCCTCCTACTGAAGAGGCCCTGGGACCCCGCTGTGGGAGTGCTCTCTCATAACAAACCAAGCAAACTCCCCGGCTCTCCTCTCATTCTCATTGCCTCCTCCGGGCCCTCCAGCTCCGTGTTCCCCACCTCGCGCCGCCACCGCTTCTGGCAGTCTCAGCTGTCCTGCTTAGGCAAGGTCATCCCTGTTGCCACGCATCTGCTGAACAATGGTAGTGGAGTAGGAGTTCTGCAGTGTCTGGAGCACATGATTGGGGCAGTGCGAAGCAAAGTGCTAGAGATTCACAGCCATTTCCCGCACAAACCCATTATCTTGATTGGCTGGAATACAGGAGCCTTGGTGGCCTGTCACGTGTCGGTGATGGAATACGTCACTGCAGTTGTCTGCCTTGGGTTTCCTCTGCTTACCGTGGATGGCCCCAGAGGGGATGTGGATGATCCCCTCTTGGATATGAAGACTCCAGTCCTCTTTGTCATTGGTCAGAATTCCCTGCAGTGTCACCCTGAAGCCATGGAAGACTTCCGGGAGAAGATTCGGGCTGAGAACAGCTTGGTGGTGGTTGGGGGAGCTGATGATAATCTCAGAATAAGCAAAGCAAAGAAGAAATCGGAAGGGTTGACTCAGAGCATGGTGGACAGATGTATTCAGGATGAGATTGTGGACTTCCTGACTGGAGTGCTCACTCACGCGGAGGGGCACGTGGGCTCTGAGCCTCGGGATCAAGATGCTGAGAAGAAGAAGAAGCCCCGGGACGTGGCCCGCAGAGACCTGGCCTTTGAGGTCTCTGAGCGGGGCAGTCGACCTGCGTCACCAGCTGCCAAGCTACCTGCCTCACCCTCAGGCTCGGAGGATCTCTCCAGTGTGTCCAGTAGCCCCACCTCCAGTCCCAAGACCAAGGTGACCACAGTGGCCTCTGCCCAGAAGTCCAGTCAGATCGGAAGCACTCAGCTGCTGAAGAGACACGTGCAGCGGACAGAGGCTGTGCTGACCCACAAACAGGCTCAAGTTCCTGTTTCATCAGAACAAACGGAGGAAGCCGAGAAAGAGGATCTCAGGG
TCCAGCTGAAGCGGCACCATCCCTCCAGTCCTCTTCCTGGCAGTAAGACCTCCAAGCGACCGAAGATCAAGGTGTCCCTTATCTCCCAAGGGGACACAGCTGGAGGGCCTTGTACTCCTTCCCAAGGAGGAGCTCCAGAAGCCGCAGGAGGGAAGCCCATCACCATGACACTGGGGCAAGCTTCCACAGGGGCCAAGGAGCTCACAGGACTCCTCACCACAACCAAGTCAAGTGCTGCTGAAGGGGGAGTCTCAGCCAGCCCAGCGTCCTCAGTGGTCTCTAGCAGCACTGCTCCCAGTGCCTTGCACACACTCCAGAGCCGCCTGGTGGCCACCTCTCCTGGCAGCTCCCTCCCAGGGGCCGCATCAGCCAGCAGCCTCCTCCAAGGCCTCAGCTTCAGCTTGCAGGATATCAGCAGCAAGACCTCTGGCCTCCCAGCAAACCCCTCTCCCGGGCCAGCCCCACAGGCCACCAGTGTGAAGTTGCCCACCCCCATGCAGAGCCTGGGTGCCATCACCACGGGCACCAGCACCATTGTCCGTACCATTCCTGTGGCCACCACTCTCTCCTCCTTGGGTGCCACTCCTGGTGGGAAGCCCACAGCCATCCACCAGCTGCTGACCAATGGGGGCCTCGCCAAGTTGGCAAGCAGCCTCCCTGGCCTGGCTCAGATCTCTAACCAAGCTTCAGGCTTGAAGGTCCCCACCACCATCACTCTGACACTACGTGGCCAGCCCAGCCGAATCACCACACTGAGCCCCATGGGCTCAGGAGCAGCCCAGTCAGAAGAGCCCACCTCCCAGGCGCTGCCCTCCAGCTCACAGCGCCTGCCTCCAGCGCCCTGAAGATGCCATGCGATATGTCCTCCTTTACCAGGTTGGTGACGGCTGCTGCACGGTGAGGCCTGGCACATGTGCTGTCCTGCTGAGCTGTACACTTGTCTGAAGACCTCTTTAAGACAGTCATTTTTGCCTCTCTGCCAACTGTCTTCAGGGCTGGGCCTCTGGGTCTTACGTAACCATTAGACAAGGTGATATGGCGCCAGCAGGGGGGGCCTTGTCCTTTAGCATCTGCAGGTCTGGTTCCCAGAATCTCCAGGTCCTCAGCAGATCTGGCCGTGTATGGATTGGAGGCACTTCTTCCCCAGCATTAGCTGTAACTTGACCCAAGTAGCAGTGTGGGACTGCTCACTGCATTTTAATAAAGGAGCTCCCCTTCGAAGTCTGTACTGCCCCGTGCCAAGTTGGGAGGAGACGTCCGTGTGGTCTGGGACTGAGAGCCCTGTGCTGAGGACCGGGATCATCCTGGCCCACTGGCCAGTGGTTCAGTGCCAGAAGGGCTTGTTTTGCACATCACTGTTGCCTTCACCAAGCAGCCATGGGAGAGTGCTCCCCGTGCAGCTCCCTCCTTACGAGCCACACTGGATACTGAGTACCTGCTGAGACCTGGGAACTCTTCATTTCAAACCCACGATAGGGCACAGAGAACTGGGCTGTCATCTTTCAGTCCCTTTGGTCACCTGTAGATGTTGGGACCAGCAGTCGCCAGGAGGTGAAAGCTGGCTTCTTTCTTTTTTCCATCATGCTTTGGGCAGTTCTTGTATCCAGAAAGCCTGCAGGTCCAGAAAGGCTGAAGAAGAGGAAGGGAACAGCAGATGAAGTGGCTTGAAGGACACGTCAGTGGTGAAAACGATTTGGGCTTGAGGCTTAGCATCTGGTACCTAAGGAGCCGTTGATTCAACTGGAGATGAGAAGAATTTGCCAAGCCAGAGGAGAGAAACTTCAGCCCCTGAAATTTCTGTCTCCAGTGCTTGGAAGTGGAACAGGGGTAACTGCTAAGTTAACGTCTTGGCCGTCCCATGAAGCTCAGGCATCAGGATGATGAAGGCCATGCTTCAGTGTTTCTGTTTCAGCTCTGTGCAACTTTTTGTCTTCTTGCTTAGAAGTGGGAAAATTATTGGTATTGACTCTGCTGTGCAGGGCTCTTGGTACCAGCCTGAG
CCCTGGAGGTGGAGGTCTCTGGAGAAGTGATCACTGAAGATGGAGCTCTGAGCCCCTCCTTACCTCCTCACAATACTTGTGTGCAAAAAGTATTTTAGATTTGGCTGACAACCTATCCTCCAGAGCAGGCTCCTTTCCCTTCCATACTCTAGAATGTTTCCAGCCAAGGCGATGAATAAGGCAACCCAGATATAACTCTTCAGTATCTGTACTGAAGGCAGGGAGGGCCCACAGCGTGCCGTGGCTGGACTTGTGGTCCAGGGTCCTGACCCGTATAGTGCATCCATCGTATATCCAAACCAGGCCACCTGCATTCAATCCAGGAGCCTCACCTCCAGTATGAGTGGCAGCCAGGAGGGAGTACACAGTGTGCAGGATTCTCAGACAAGGCCATTTGGGGTGGTACAGGCAGGGCCAGGGACTGTGTATGATAGGAGTGGAGTGGGCAGATTATACACCATACGCTTCCTCCCCGACCTCCTGCAGAGCTGGTCTCAGCAGTGACTCACACAGAATTAGGCTGCATCCCTGTACTAGCTGGCAGGTAGCTGCTTTCTGAAATTCAGGAGGCGTTTAGTAAGTTGGAGGAAGATACGAAATCTGAAAGAGACATCCAGTGTCAGGGGTTTAATAACTTTACAGGTAGGATAGTAACACACCAATAGGAATTGAGGATGGTGAAACTGAGACTATGTGAAGTTTTAGGAATCATTCAGGACAGAGGTTCCTGAACAACCCATTCATGACTTAAGAGTGCAGTCTAGACAGCACTGGAGGGGCTGCTCCTGAAAGATGCTGGCCCTGTGTGTGCTGGGGCCAAAGGAGAAACTAACGCATCGTCCTGCATTTGCGTAAATCCTAGTATGCTTCTCATGGATGATTTCCTGAGGCTTGTGTTGTACACCTTAAAGAATGCCAAAAGGAGAAGGGAAGTTGTAAGGACATTGATTCTTCTGCACCCTGGAGGGACAGGCCTAAGGAGGAAGTGGTTGAAGTCTATACAGTCATGTTCCCCAATTCCATACTTCTCCAGCCCTTGAAGTGTAAAAGGAAGCTTTCCTCCGCCTATCATGTAGCAAACCTGGAGTCCATAACCTCAGAAGGTGATAACTACTGGCCGAAAGTGTAGAAGGATCAAGAGGGCTTTAGCTGATTTCTTGGATGACAGATACATGTTGATGCTCTATGGAAGATGTCCTTGTTTTGAGAAGAGGTCACTGATGGAGGAAGACCTGTCTGCCCTTGGCTCTACCACTAGAACAGTCTTGGGCTGGATGGGTTATAGAGCTGAGCTGCTGTGACGGTTCTGTTCTTCCATTAGCCAAAACAATTAAAAATAAAAACAAATTTGGATTGCTTCAATG\n>XR_003982306.1 PREDICTED: Sparus aurata uncharacterized LOC115573581 (LOC115573581), ncRNA \nCACCACTTTGTACCTCAAGAGGCGATAGTACAGAAGTGGGCTGCTGCAGAAACATGGCGGTGTAACATGGCAGACTCCGCGACAGAGGACCTGCTTCTTTTAAGGTAATCCCAGGAAAGTCTGGCTGGAGGCTGGAGACACGTTTGTCAGGAAAGTACGTGCCTGATCTGATGTGACCCCTCCAATCATCAAACTGTCAGATATGATTGAGAGGGTAGAGTCCACTGCTCTGACTGTATGGTATATCACTACGTTGGTGATATGAACTGTGAAGGTATTAA\n>XM_040635235.1 PREDICTED: Ursus maritimus RNA polymerase III subunit E (POLR3E), transcript variant X3, mRNA 
\nCACGTGTCCGCTGGAGTTTCTCCACCAGCAACATGGCCGCTGCCTAACAGAAGAGCCGGGCCGCCGCCACCTCTGCAGCCCGCGGGTACCTGGGCCGTTGCCGCCGCCCGCGCGCGGCCCCCGCGGAGAGATTGAGTCCAACGATCGTGCGGCTGGCTCCCCCCTAGTATGGCCAATGAAGAGGATGATCCAGTCGTACAGGAGATCGACGTGTACTTGGCCAAAAGTCTGGCAGAGAAGCTGTATTTGTTTCAGTACCCTGTGCGCCCAGCCTCGATGACCTACGATGACATTCCACACCTCTCAGCCAAGATCAAGCCCAAGCAGCAGAAGGTAGAGCTTGAGATGGCCATCGACACCCTGAACCCCAACTATTGCCACAGCAAAGGGGAGCAGATTGCACTCAACGTGGACGGCGCCTGCGCGGATGAGAGCAGCACTTACTCCTCGAAGCTGATGGACAAGCAGACATTCTGTTCCTCCCAGAGCACCAGTAACACAGCCCGTTACGCTGCCGCACTCTACAGGCAAGGTGAGCTGCACCTGACGCCTCTCCACGGCATCCTGCAGCTGCGGCCCAGCTTCTCCTACCTGGATAAGGCGGACGCCAAGCACCGGGAGAGGGAGGCGGCCAACGAAGCAGGAGACTCTTCACAGGATGAGGCGGAAGAAGACGTGAAGCAGATCACGGTGCGGTTCTCCCGTCCTGAGTCAGAGCAGGCCCGCCAGCGCCGCGTGCAGTCCTACGAGTTCCTGCAGAAGAAGCACGCCGAGGAGCCCTGGGTGCACCTGCACTACTACGGCCTGAGGGATAGCCGCTCTGAGCATGAGCGCCAGTACCTGCTGTGCCAGGGTTCCAGCGGGGTTGAGAACACAGAGCTCGTCAAGTCACCCAGTGAGTACCTCATGATGCTGATGCCGCCCAGCCCGGAGGAGGAGAAAGACAAACCCGTGGCCCCCAGCAACGTCCTGTCTATGGCCCAGCTGCGCACGTTGCCCCTGGCCGATCAGATCAAGATCCTGATGAAGAATGTGAAGGTCATGCCTTTTGCCAACCTGATGAGCCTCCTCGGCCCCTCCATCGACTCTGTGGCTGTTCTGCGTGGCATCCAGAAGGTGGCGATGTTGGTCCAAGGAAACTGGGTTGTGAAGAGCGACATCCTGTACCCCAAGGACTCCTCCAGCCCTCACAGCGGCGTCCCTGCCGAGGTGCTCTGCCGGGGTCGTGACTTCGTTATGTGGAAGTTCACGCAGAGCCGGTGGGTGGTGAGGAAAGAGGTGGCGGCAGTGACTAAACTGTGCACGGAGGATGTGAAGGACTTCCTAGAGCACATGGCCGTGGTGCGGATCAATAAGGGCTGGGAGTTCATACTGCCTTACGATGGGGAGTTCATCAGGAAGCATCCAGATGTGGTCCAGCGGCAGCATATGCTGTGGACGGGCATCCAGGCCAAATTAGAAAAAGTGTATAATCTTGTGAAGGAAAGCTTGCCAAAGAAGCCAGATGGACAATCAGGGCCTGCTGCTCTGCTCTCTGGGGACCAGCGGGTCCAAGTGGCCAAAAGCAAGGCCCAGCAGAACCACGCACTGCTGGAACGGGAGCTGCAGCGGAGGAAAGAGCAGATGCAGGCGTCCTCGGTCCTGCCTGGCGTGCGGATCAAGGAGGAGCCCATGAGTGAGGAGGGAGAGGAAGAAGAAGATCGAGATGCAGAGGAAGACGAGGAGCCCATGGACACCTCTCTTGGTGGCAGCCTCCACAACAGGCTGGCCAATGGGTTGCCTAGCGGGCGGGCGACAGGCGGGGACAGCTTCAATGGGCACCCGCCCCCAGGCTGTGCCAGCACCCCCGTGGCCCGGGAACTGAGGGCCTTCGTGGAGGCCACCTTTCAGAGACAGTTTGTGCTCACGCTGAGTGAACTCAAGCGCCTCTTCAACCTGCATCTGGCCAGCCTGCCACCTGGCCACACACTGTTCAGTGGCATCTCGGACCGCATGCTG
CAGGACACGGTGCTGGCCGCCGGTTGCAAGCAGATATTGGTGCCTTTTCCCCCCCAGACTGCTGCGTCCCCAGATGAGCAGAAGGTGTTCGCCCTCTGGGAGTCTGGAGACATGAGCGATCAGTTATCATGAAACACCAAGTCTAAACTGCTTGTCCTCGGCTGGCGCGTCCCTGGCTTTGTTGTCTTCTTCCTGGGGTCTCGGG\n>XR_001152071.1 PREDICTED: Microcebus murinus uncharacterized LOC105866893 (LOC105866893), ncRNA \nTGCTAGCTCCTCGTTAAGGAAGTGACAAGGTTGTAGACACTGGAGGTGGCTCAGTTACAACTGCCTTTACCGTGTGGCTGAGAATTCACTCCCTTCCAGGTCTGGACCTCATGGTTCTGTCACCAAATCGGCTGCCCCTGGATAGAACAAAAAGGCAGAGGCCCTTCTCTTCTGAGCTGGGACACCCATCGTCTCCTGCCCTTGGACATGAGAACTGCACATTCTCCGGCTTTCAGACTCTGAGACTTACATCACTGGCTCCCAGGTTTTGACAACTTTGGACTTGAACTGAGCTATGCAACTGGCTTCCCGGGTGCTCCAACTTGCAGTGGGACTTCTTCCTCAGCCTCCATAATTGATGAACAGAGCAAACCTTATCACCAGAGATGGAGAATCAGAACCAAGATGAGTCTGCACAAATGAAGCTTACTAAAATTATACTTATCTTCCATTCATTTCCCCCACATCCA\n>XM_037676314.1 PREDICTED: Nematolebias whitei ALG2 alpha-1,3/1,6-mannosyltransferase (alg2), mRNA \nTCTCACTAAAATCGTGTGCTTTAAAGTGAGAAGGAAATAGGCGCCATTGTGGTCCAAACACGAAGCTCGTGTAGCTTAACTCTAACGGGCAATTAGAGCCAAAATGGCGTTTAACTGTTAGAGATTCTTGAAATCGGCTGACAAGTAGGCGAGTTTAATCAATGGTTTCTAAACCTTGACTGGATAGAGGAGAGATTCAAAGGATGGCCCGGGTGGTGTTTCTCCATCCGGATCTTGGTATCGGAGGAGCAGAGAGGCTAGTGGTTGATGCCGCTGTTGCCCTGAAGTCCCAGGGGTGTAGTGTTCAGATATGGACGGCCCATTATGATCCAACTCACTGCTTCTCAGAGACCCTGGACCCAGACCTGCCTGTGGTTTGTGTGGGTGACTGGTTACCTACCAGTGTGTATGGCTACCTTCATGCTCTCTGTGCATATATAAGAATGATCTATGTGGCTCTGTACCTGGTCTTCCTCAGTGGTGTTGAGTATGACGTCATCTTCTGTGATCAGGTGTCTGTGTGTATACCTGCACTGCGGTTGTCCCGTCACAGAAAGAAAGTTCTGTTTTACTGCCACTTCCCAGACCAACTGCTGACCCAGAGAACGTCGGCCCTAAAGAAATTTTACAGAGCTCCCATTGACTGGTTGGAGGAACGCACCACTGGCATGGCTGATATGATTCTGGTAAACAGCCAGTTCACCGCAGGCATCTTCAGGGAGACATTTCAGAGTCTGAGCAGGGTCCAGATAGACGTCCTGTATCCCTCCCTGAACACACAGACCTTTGACCAGGGGTCCACTGAGGCTCAGGGCCTGCAAGGTCTGCTTCCTGAGGGAACTTCTCACATGTTTCTGTCTCTGAACCGATACGAGAGAAAGAAGAACCTGGGTCTGGCTCTGGAGGCTCTGGCAGTCCTGAGGTGCAGCCTTACACCTGCTCAGAACGCAGGTGTTCACCTGGTGGTCGCGGGAGGCTACGATGATCGCGTTACTGAGAACGTTCAGCACTACAGTGAGCTGAAAGAATTAGCCGAGCAGCTCTACCTGATGGACTGTGTCACGTTTCTGCGCTCCCCCTCCGATTCCCTGAAGGTGGCGCTGCTGCGGGGCAGCACCGCA
GTTCTTTACACCCCCAGCAGGGAACATTTTGGGATAGTTCCTGTGGAGGCCATGTATTGCTGCTGTCCTGTTATCGCTGTGAACTCTGGGGGGCCCCTGGAAAGCATAGCAGACGGGGAGACAGGCTTCCTGTGCGAGCCCACCGCTGACGCCTTCTCCAAGGCCATGGAGAGGCTTATCAAGGAGCAGCAGCTCTGCAGGGACATGGGGCAGGCTGGGAGGAGGAGGGTGCAGGAGAAGTTCTCTCTTCAGGCCTTCTCAGACCAGCTCTATGGGTACATTGTCCGGCTGAACCAGTGATGGGAAGGCAGGTGAAACCTATGACTGCACAGAGGATTTAAGTGTAAATGTGAAGGGAGGTGGGGGTGTATTAAGAAGACAATTAATCAGCATTCCACTGGAGGGGTTGCTGA\n>XM_034454558.1 PREDICTED: Crassostrea gigas ankyrin and armadillo repeat-containing protein-like (LOC105340499), transcript variant X6, mRNA \nTCGAGAATTAACGAAAGTGACCAATCAAACTTTCGCTTCTATTTGTACATCGTCGTCGACACCAACAGGTTGTGGAAACGACTGCAGTAGGGCAAAATACAAAATGCACACAGGATCTATAAATAGCTGACATGGCCACTATGAATGCTGGGACCCCCCAGCCGGGGGAACCCACGGACGAGGCCCAGCTCCAGGCCAAACTGGAACGCTTGGCCAGTACGTACTTCGAGAAGTTCTCCACCCCTGTGTTCAGAATGCAGGAGCTGATTGGCTTCCACAAAAACCACTGGCTGCTCTCTGACGATTTCAAGATGGCGTACGATCAACCGGACGGCCTCATTAAAGGTTTGAACCCGCTTAACTCCAACAGCTGTGTTCTGATGGTGCCGGAGGACCCAGTCCTAGCAGAGAATAAGCTTGGCCTGGACTACCGCGAGGTTCACCAGGTGATCCGGGAGCTGACCTACGGGATCTACGTCCTGAATCAGACCCCCAGCATCTCCCTGGAGGCACTGTATGATCAGGGCACATGGTGTAACCTACCCCCGGGCTTCAACGACACTCACATCGGTCAGCTGTTGATCAGCGTTGACTACATGATGAAGTCCCTGTGGCATGGAGCTTACTTTCCCAAAGAGAAGAGGACCAAATTCAACGACAAATGGAGGGAGCACTTCCAAGTGTCCAAACAGAATGGAAAACCAGAGAAAGAGAAATCCTTCCTCTCCGATTTCCTCAGTCATGGCATGGTAGATATGGGAAAAGATCCGGATTACTGTGACGCGTACAATGACCTTCAGTTCGATAACGAGGACGACCCAGACATGATAAAAGAGCGAATTCACTTTATGAAGCACATAGAGGACATTTGTATGCAGATGACGCTGTACCAGAAAAAAGTGATGCATGAAAAAGACATCTACATGATGGAGGCCGATATGACCATATCCAGTATCGTTCGACTGCTGGACGATCGGATAAATCACGACGACTACGAGCGTGTGAATACGAGACTTCAAATGCATGAAAACATGCTGAGGGAAAACCTTATGAAGAAGATGGACATCAGGCGACAGTTGTTCATTCTGAAGTTTGTGAGTTTTCTGACGCCGTTTTTGATCGGAATGAGGAAGAGAATGAAGATTCCCGACACTACACGATTTCTGCCAGATCTCTCAGAATCAGAAACAGAGGACCAATGTAAGACAGAAGAAGAGCTGCCACCATTAATGCTGGGAGACGACTTTAAGTGTAAAAACTTCTACCCCGACAAAAACAAGTACTTTCACCTACACGGGGGAATAAACATCGACTTTGAGACAGACGATCTAGAAGCGACTCCAAAGGAAGTGACCAACAGATACTCGGATATCCTAGCAATGGCTGAGCAAGGTTTTATAAAAGCCATTTCCATGGAAACTATCAAAGAGCATTATGAGGT
GCCAAAAATTACAGTGGACGGAAAAGAGTATTACCTGATCTTCCTGGAGTTTGAGACGTTCTTTAACCCCCAACAGCCCGCCTGGATAAAGGCCTTCAACACAAAGCTGACCATTGACCTAGAAAGAAAGTACCTCCCCCTACAGGACACGCCCATGTGGGACATCTTTGTCAAACATTTTGGCAAGAAAAAGACAGGAAAGTTAAAGGCTCAGATGACGGGACCGCGAGCGGCGGCCATTAGAGGACTGGTCATCATATTTGTCCATATGTGTCGCAAAACTCTGGGACAGCAGATGTCAAGGTTGACAAAGCAAGACGAACACGGTCTATCGCTTTTGCATCATGCTGCGATGAACAATCGGCCGCAGATAATTGTCAGTCTGCTGCGACAAACTGTGGATATCAACTCTAGACGCAACAACATCTTGTCCACAGGTCCGACCGGGCTCCATATAGCTGCCCGTTGTGGGGCCTTGGATGCTGCTGCCTGTCTGTTGGCCTGTTGTGCGGGACAGACATTGTACGATCAGGACGGATGGGCCCCGATCCACCACGCTGCTTTTTTCGACCACGAGTCTATCATCAAGTTGATGGCCAGGAGGAACAATCCAGTCATAGAGCTGCTGACTAGGAATGATGTTCGGTCGACACCTCTGTTGCTAGCCGCGAGTTCTGGAGGACTCTCTGCCGTGAAATGTTTGATCAAACTCGGAGCGGACATTTCCCGGCTGGACGGGGAAGGGAACGGAATGGTCAATCTCGCTGCCATGAGATTCCACACTAACGTCTTGGAGTATCTCATTGAGTGGGGCCACCAAAAAGCCCCTGTGTGGAAGATTCTTGTCAAAATGCTGACTGATCCAGAAGTGGAAAAGAAAGACAGTGCTGTCAAATGTCTGGAGGTCTTGTCTACGTCAAAACCGGAGCACTGGAAATCCATTCTGGAAGCAGGGGGTATCCCAGCCTTGGTGACCTTGCTGAGTTCAGACAATGAAGTCCTCCAATCAGTGGCCGCCTCCGTCATCGTCAACATCTCGGAACACGCGGAGGTTCGTCACGCTCTGACGGCTGCCAAAGCCGCCCCAATTCTGATCCAGCTGCTCAACTCTCCAGACGATAACATTCAGTCTCGTGTGGCCATAATCCTGTCGGACATTGCCAGTGTCCAAGGAAACCAGTCGCTTATTGCGGACGAAGGCGGGATTCCCCCGCTGATTCATCTCATGGACTCTGAGCTGGAGGAAGTCCTGATAAACACTGTCAATGCCGTCCGTGTTCTCTGTGCAGGAAATCCCCCCAATCAGGACGCGGTGGCGGAAAACGGAGGAATCGCATTTCTTCGCGAGTTTCTGACATTGGATTCAGAGAAATTAAAAGCGGCAACAGCAGCATGTATTGCGGCGATCTCTTCAGGAAATAAAAAGAACCAGGACGCTCTGTTAGAGGCGGGAGCTTTAGAGCCCTTGGTGGATATAATTAATGGAACAGCTAATGAGACGGTGCGGGTGAAGTGTGCTAATGCCATCGAGGCGCTGGCCCAGGATAACCTTGCCTGCCAACAGACCTTTCTCCGAATTAAGGCCCCCACTGCCCTCAAAAAACTCCTCAAGAACTTTAATGTGTCGGTGAAGGAACATGGGGCCAAGGCACTCTGGGCGCTGGCGGGCAGCACCACGTCCCAGCAGAAGTACATCGCAGAGAAAACCAGCATCCCCGACATCTGTAGCATGCTACTGGAGGACACTGAGAAACTGCTGCAAGTCGGCTGCATGATGTCGATAGCCTTGGGGAGAGAGAATATCGAGAACCAGATCAAACTAGCTCAGACAGAGGCTTTCAATCAACTCGTCCGTCTGCTGCGGACTCACAAAGACTCGCCTCAAGTCATACTCATGGTCATCCAGGTGCTTGGAATTCTGTGTGTGGGTGTTGCATATTGTAACAACAAAGTAACACAGAGAAAAATAGCGGAAGAAGGGGCTATTCCGACCCTGGTGA
CCTACTTAAATCAGCCTCCTTCAGAAGAGGTCCAGGTGGAAGTTGCCATAGCGCTGGGGTGCATCGTCCTTAGCAACACTCGTAACCAGGAACTACTTCAAGAAGAACCAGGATTTAACTTTGATGTGCTACTGGATTTGTTGAAGTCAAAGAGTGAAGCTATTCGACTCCGAGCAGGCATGGCCCTGACCATCTTCGCATTTAACAATACTCCGCAACAGTACGCCATCCGAGAGGCAGGCGGCATAAAATACTCTGTCTTCGAACCTTTCCTCAACTCCAGCATAGAATATGATGTCTGTTACGCTGCGTTTCAGATCGTGGTGCTTGCGCGGGTGATTGTCGACCAAGACCAGGTGATGTTGACGGCTCGCGGTGTCACGCTGCTCGTAGAGAAGCTCCACTCCACAGAGGACAATGTGATCGTACTCGCCGCGAGTCTCCTATCGAGTCTCGCTCACACGCGGGCAGGAATCCCTGATGCCATGGTAACCACAGGCGCCATCGATGTGCTAGTGGAAAAACTCTCCTCACGGAATGACCAAGTTCGGAGTGCATGTGCGGTTGCCCTCGGTTACTTGACTTTCAACAGGACTGCTGCGAGGATTTTGTTCAGTGCTTGTCGAAACACTCCTGGATTGTACAAAAAGCTCGACGAAAACATTGGGAAAAATGCCAAAATTAGTCAGGAGTTTGTGCAGGATTTCAAACGAGCAAAGATTGTTGGATTGCCGTCTCAATGCCTTGAGATTAATGGTGGACCTCCAGTAATTCCTCCCAGCAGAAACAGTATGAGACCGATGACTGGTACGACAAGTCGAGCTACCACCGCCCAAGCTACAAGCCGAGCGAAATCAGCTCCGGGGAAGAGACCGCCGCCGAGATCATCCCCTAACCCCAGCGTGGTTGTTGTAAGTACCCCCGACAACAGTCGCCCCTCAACGGCCTCACCCCTCAGGATCCACCCCAGCTCTCTGTTCCGACCTGCCTCCTCCCCCCACACCAGAAAAGGGGCGCGGTCACCCCCAGATGCAACCTTCAAAACGCGGTTATCTTCGTGGAAAGAAGAAATCTGATGAAAATGTTTCTCTCTGAGTTTTTTGTATCAAATGAAATGTAATTCACTTCTGTGTGTTAAATACCCCCAAATTGTATAAGTCTATAAAATTATTATTTT\n>HM490822.1 Uncultured Thermovirga sp. 
clone GE7GXPU01D8TM1 16S ribosomal RNA gene, partial sequence \nGTACGTGTTACTGATCTGAGAGGACGAGGGACCCATGCTTCGGTATGGGAGCGTACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTGCATCCAGTTGCCATCGGGCGAGCCGGGCACTCTGGAGGGACTGCCGGCGACAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTATGTCCAGGGCGACACACGTGCTACAATGGCCGGCACAGCGGGAAGCGGAGGGGCGACCCTGAAGCGGATCCCTTGAAAGCCGGTCCCAGTTCGGATTGCAGTCTGCAACTCGACTGCATGAAGTTGGAATCGCTAGTAATCGCGGATCAGCCAAGCCGCGGTGAATACGTTCCCGGGCCTT\n>XR_005682382.1 PREDICTED: Panicum virgatum uncharacterized LOC120691804 (LOC120691804), transcript variant X1, ncRNA \nTCCCTCTTGCCGGCGGCCTCGCCGACGTTTGCCGGCACGCTCGAGGTCGATCCGCTCATGGTTGCGGGCTCCTCTGTTGCCGCTAGGCGTACTCGTTCCTACCTTCGTTGCTGCAACCACGCCCTCCCAGTTGGACCTACGGAACCTTTGTTGCGGCATCCATCCCCTCCTAGATACAGTCCTCGGATTCTGATGCTCCCGCTAGCAAGGTTGCTCTTGCTTCTGTTGGTCAATCGTGCAACTGGTGGAAGGAGGACCACGGTTCTCCATGCTGTGGTGTAGATTAGGCGCTAGGTGCTTGATGTCACTGAAGAGAAAGAAGTAGAGGAGCTTATGTTCTTATGTTCGCTTTGGTGGCCAGTTGCTTATAATTTATTTGATACGGCGGCTTAGGATTATAGTCTTATGTAACCGTGAAAATTGTCTTTGGCAAATTTACTAAGTAGTTCAGAAGACTCACTTTGTATTGTATTGTATTTTAATAATTTATTGTTGTTGTGATCAATCAATATAAATTTGCAATGATATATATA\n>JN143486.1 Uncultured eukaryote clone KYD009 18S ribosomal RNA gene, partial sequence \nAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGAAAACTCACCCGGCCCGGACACTGTAAGGATTGACAGACTGAGAGCTCTTTCTTAATTCGGTGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGATAACGAACGAGACTCTGGCCTATTAAATAGACGGTGTATCTTGAAGTATACCGCGCTTCTTAGAGGGACAAGCGGCGTCTAGCCGCATGAAATAGAGCAATAACAGGTCTGTGATGCCCTTAGATGTCCGGGGCTGCACGCGCGCTACACTGAAAGAATCAGCGTGCGATTAGCCTGGTTCGGAAGAATCGGGTAACCCAAGTAAATTCTTTCGTGCTTGGGATAGGGAATTGCAATTATTTCCCTTAAACGAGGAATTCCCAGTAAATGCGGGTCATAAGCTCGCGTTGATTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTACTACCGATTGGATGACTCAGTGT\n>XM_052629031.1 PREDICTED: Gossypium raimondii plasmodesmata-located protein 6 (LOC105780626), transcript variant X2, mRNA 
\nTCTCTCATTTACACTCTTCTTTTCTATATATTCTCTTTTAAACCTTTTTTTGTTTTCTCAATATCTTCACTTATGGCTTTAGCGGCGAAACAATTATCGTCACCTTTTGTTATTTTTCTCATATTATCAATTTTCTTAGTTGGGCCATCGTTTTCCGGCACCGATACTTTCGTTTTCGGCGGCTGTTCGCAGCTGAAATTCACTTCAGGCTCACAGTACGAGTACAACGTCAACTCGATACTCACTTCCCTAGTCAACTCAGCCATGTTCACTTCTTACGACAACTTCACCATGTCAGCTTCCGGTGGTTGCAGTGCCGTTTACGGGCTGTTCCAATGCCGTGGTGACCTAAACAACCGTGACTGTAACCGTTGTGTAGCTAAAGCGGTGAGTCAAATTGGAACTCTTTGCTTTTACTCAACGGGTGGTGTGTTGCAACTCGAAGGGTGTTTAGTTAAATACGATAATGTAACTTTTTTGGGTGTGGAAGATAAGACCGTGGTAGTGAAGAAATGTGGACCGTCGTTCTCGTCTTACTCGGACGCTTTGACTCGGCGTGACTCGGTGCTGAGTTACTTGGAAGCGAGTGATGGGACGTATAAGCCGTTTCGGATCAGCGAGTCGGGGAATTTACAGGGTGTGGCTCAGTGTGTTGGTGATTTGAGTCCGAGTGAGTGCCAAGATTGCCTATCGGAGGCAATCGGACAGCTGAAAACTGAGTGTGGGGCAGCAAAATGGGGTGATTTGTATTTGGCTAAGTGCTACGTGCGGTTCTCGGAAGGTGGATACCACTCGCATGCCGGAAAGAGTAGCTAAATAAACAAAGGAAACTGACAATTGTTGTGAGGAATCCAAAAGAAAACCCTTTGCATTTGGTCTTCATTTCTTTTATCTGTTTATATTTAGACAACTATTGTACTGTCCGGGCGAGAAAATTTA\n>HQ761033.1 Uncultured organism clone ELU0047-T268-S-NIPCRAMgANa_000215 small subunit ribosomal RNA gene, partial sequence 
\nAGNGAAAGGCGCTTTCGGGTGTCGCTGATGGATGGACCCGCGGTGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCCACGATGCATAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGAAAGTCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAACTCTGTTGTTAGAGAAGAACAAGGACGTTAGTAACTGAACGTCCCCTGACGGTATCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCCCGGCTCAACCGGGGAGGGTCATTGGAAACTGGGAGACTTGAGTGCAGAAGAGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAGGAACACCAGTGGCGAAGGCGGCTCTCTGGTCTGTAACTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTGGAGGGTTTCCGCCCTTCAGTGCTGCAGCAAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTTTGACCACTCTAGAGATAGAGCTTTCCCTTCGGGGACAAAGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATTGTTAGTTGCCATCATTTAGTTGGGCACTCTAGCGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGGAAGTACAACGAGTCGCTAGACCGCGAGGTCATGCAAATCTCTTAAAGCTTCTCTCAGTTCGGATTGCAGGCTGCAACTCGCCTGCATGAAGCCGGAATCGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGTCGGTGAGGTAACCTTTTTGGAGCCAGCCGCCTAAGGTGGGATAGATGATTGG\n>XM_033535937.1 Aplosporella prunicola CBS 121167 uncharacterized protein (K452DRAFT_19523), mRNA 
\nCTGGGGCGGCGGAAGAGGGCAGAACTCCGAAACACTCACTACACCCACGTCGGGTAGCTCGTCGCCAAGGTGGTACTCTACTCTAGCTGTGTTCCGCCATCCGGAGGCCTACACGTAAGGTCCATGTCGTGCAATTGGACTAGAGACGCACTCGTCTCCCACGCAATTCTGTCGTGCAGATGTACGGTTACTTCGTACTTTTGACAGATGCCTCGTCCGTCGTCCATCGTCCATCTGCATTTATGGTCGACGTTTCTCTCCAACCATGAATGCATGCTCGTATCTACTTCCCTAAGTAACATCGAGCGCATACAACCAAGACAACAAGGCCGACTGTGGGCTGCAATCCTCAGGGGACCAAAAAATTTCTGGTGCCACTACTGCACATACACGCGTTCTACGGTTAGCGTCAAGTATGCAAGCCACGAGAGTACAACAAGGGATGGGCTACAGCTTGGAACGGCCAGCCATTGGTCGCACACGCTAGCATACACTTTTATCTGGCTCCTCTGCTGGATAATCGCATTCCGCCGCCGTTTCGTGCTTCGCAGGCATGCCCATGCTCTGTCTCCATGCTGCATCTCAAATCCAGCGTATCGTGCATGTTTTGGTGCTTTGATGCAGGTCCATGACGTCACCGGCAAGGCATCGACAACGCATTGTCTGCACCGGGCAGATCAGAGTCCCTCTCATGCCCCATAATCCGTAGCGGTGCATTTATCCATGGATTCCTTGTCTTATACCGACCCGGCGTTAGCAGACGTTAACTCGTTCTGACTCGATCTC\n>XM_008727620.1 Cladophialophora carrionii CBS 160.54 hypothetical protein partial mRNA \nATGTCTGAACAGTCCAGCGAACCGCGAATAAAGTCGCACAAGAGGAACGTCGCCCACCGTCGACGCCGGGATGACGACGATTTCGAGGACCGGTGGGGCGATGAAGAGGTTGCCGAGGACGACGACGCAGATGGACACGCGCAGGCTGAATTCCCAGAGTCGTCGTCCAAACGGGTGAAATTGTCTGATGGCTCGGCATCGCATCGGGCGAAGAATTCCACACCCACCCCTCCACCAGAAACGGAAGAGGAGAAAGCACAAAGGGACCGAAAGGAGCGAGACGAATTCGCGAAGCGGTTGGCAAAGAAGGACGAAGAGCGGGCGAAGAAGATCGTGGAAGACAGGTCCGCTGCAAAGGACAGTGCGACGGCGCAGCGGCGGGCATTGGCAGACGATGCGTCCGCGAGAGACGCTGCGATGCCGGATTTGAGGCTTCGGTCCCGTCAGGACTACCTTAAGAAGCGGGAAGCCGAGAGGTTGGCTCTGCTGCGCAAACAGGTCGCTGAGGAGCAGCAGGAGTTGAGGGACAACCCGGACCTGACGCGGCGGGAGAAGGAGGAATTCGCGCGCAACAAGGAGATCCTGCGCATCGCGGAGGAGAGGCTGGCCATTGACGATCACTTGGACGGCTATGCCTTGCCGGAAGACTACATTACCGAGAAAGGGAAAATCGACAAGCGGAAGAAGGAACAAGCACTCTACCAACGTTATGTCGATCGCGACGAGGCCGGCCGAGAACGCTATGTCACCGAGCACGAAGAGTGGGAGAGAGAGCAAACCAAGCGAGCCGAGGCCCAGATCAAGAAGTCCGAATTCGTAGACGAAGGCGACTACGGCTACGTGTTCGACGAAAGCCAGCAAATGAAGTTCATCCTGGCGGACAAGCTGGAGGGGGACAAGGGGATGACCAAGGAGCGCAGAGAAATGGAACAGCGGCTCAACGCGGCAGAAGCAAAAGCCAAGAGCATCGAGGAGACGAGGAAGAGTCTACCCATTTACCAATTCCGAGACGAGATCATCCAAGCCGTGAAAGACCATCAGGTCTTGATCATCGTAGGCGAAACTGGCAGCGGGAAGACCACTCAATTGCCACAGTACTTGCACGAAGCGGGTTTCACAA
AAGGTGGCATGAAGATCGGATGTACTCAACCGCGAAGGGTTGCTGCCATGTCCGTTGCAGCCAGAGTAGCAGAAGAGATGGGCAAGCGGCTAGGGAACGAAGTGGGCTACGCCATCCGCTTCGAAGACAACACCAGCGAGAAGACGGTCCTCAAGTACATGACCGACGGCATGCTGCTGCGAGAACTGCTCACCGACCCGGAACTCTCTCAATATTCGGCCCTCATGATCGATGAGGCTCACGAACGCACCGTCTCCACCGACATCGCGTGCGGCCTGCTCAAGGACATCGCCCGCGCCAGACCAGACCTCAAGCTCCTGATATCCTCTGCAACCATGGATGCCCGCAAATTCCAGAAGTACTTTGACGACGCACCCATCTTCAACATCCCGGGAAGAAGATACGCGGTCGACGTGCATTACACGGCCCAACCGGAGGCGAATTACCTGGCCGCGGCGATCACGACGGTGTTCCAGATCCACATCACGCAAGGACCAGGCGACATCCTCGTGTTCCTGACGGGCCAAGAGGAGATCGAAGCCATGGAAGCAAGCCTGCAAGAGACGGCGCGCAAACTAGGCAGCAAGGTCAAAGAGATGATCATCTGTCCCATTTACGCCAACCTCCCAACCGACCTGCAGGCCAAGATCTTCGAGCCGACGCCCGCCGGCGCCAGGAAGGTCGTCCTCGCCACCAACATTGCAGAGACGTCCCTGACCATCGACGGCATCGTCTACGTCATCGACCCCGGCTTTGTCAAGGAGAACCAGTACAACCCACGCACAGGGATGGAATCCCTCGTCGTGGTGCCGTGCTCACGCGCCTCGGCGGGCCAACGAGCGGGGCGCGCGGGTCGCGTCGGCCCAGGCAAGTGCTTCCGCCTGTACACGTCGCAGGCGTACAAGAACGAACTGGACGAGAACACGACGCCGGAGATCCAGCGGACCAACCTGTCGGGGGTGATCCTACTGCTCAAGTCGCTGGGCATCAACGACCTGCTCGACTTTGACTTTATGGACCCGCCGTCGACGGACACGATCGTGCGCGCCGTGGAACAGCTGTACGCGCTCGGCGCGCTCAACAACGCCGGGGAACTGACCAAGATCGGGCGGCAGATGGCCGAGTTCCCGACGGACCCGATGCTGGCGCGCGCCATCCTCGCGGCGGACAAGTACGGGTGCGTGGACGAGGTGCTGTCCATCATCGCCATGCTGGGCGAGGCGTCGGCGCTGTTCTTCCGGCCCAAGGACAAGAAGATCCACGCCGACAGCGCGCGCGCGCGCTTCACCAACAAGGACGGCGGCGACCACCTGTCGCTGCTGAACATCTTCCACGAGTGGGTCGACAGCGACTACAGCTTCGTGTGGGCCAAGGAGAACTTCCTGCAGCAGCGCAGCCTGACGCGCGCGCGCGACGTGCGCGACCAACTCGCCCGGCTGTGCGACCGCGTCGAGGTCGACGCTGCCAAGTCGTGCGGCGGGGCCAGCAACATCGAGCCCATCCAGAAGGCCATCACGGCCGGGTTCTTCCCTCACTCGGCGCGGCTCCAGCGCGACGGGCAGAGCTATCGCACCGTCAAGAACGGGCAGGTCGTCTACATCCACCCGTCGGGCGTGCTGATCGAGACGCGGCCGAAATGGGTCATCTACCACGAATTGGTGCTCACGAGCAAAGAGTACATGCGCAGTTGCATGCCGTTGAAGCCCGAGTGGCTCATCGAGGTGGCACCGCATTACTACAAAAAGAAGGATCTGGAGAGCCTGGGCGTGGAGCGGAAGGTGCCGAGAGGAGAGGGTAAAGGGCAGAGTAAGATTTGA\n>HF913007.1 Uncultured Anaerolineaceae bacterium partial 16S rRNA gene, clone 4_45 
\nGATGAACGCTGGCGGCGTGCTTAATACATGCAAGTCGAACGAAGATGTTCTTGAGTTTACTCGAGAGCTCTTAGTGGCGGACGGGTGAGTAACGCGTTGGTGACCTGCCCTAAAGAAGGGAACAACCTCGGGAAACTGAGGCTAATACCCTATGTGCTTATTTAGATTAGATGCTTTATAAGTAAAGGTTCTGTGGACGAAAGGCCACGGTGCCACTTTAGGAGGGGCCTGCGTACCATCAGCTAGTTGGTAGGGTAATGGCCTACCAAGGCAAAGACGGGTAGGGGACCTGAGAGGGTGGCCCCCCACAATGGAACTGAAACACGGTCCATACACCTACGGGTGGCAGCAGTAGGGAATATTGCACCATGGGCGAAAGCCTGATGCAGCAACGCCGCGTGAGTGATGAAGGCCTTCGGGTCGTAAAACTCTTTTCAAGGGGAAGAGGAAGGACG\n>XM_035019610.1 PREDICTED: Mirounga leonina family with sequence similarity 43 member B (FAM43B), mRNA \nCCTACTCCTTAACTGCCCCTCCATCCCCACCCCTCCAATAAGAATGATTAATCCCGTTCCACCGCGCCTGTGCCGGGTCCCGGGCGAAGAGCAGCGCTAGCCGGCGCGGGGGAGGAGAGAGAGGAGAGCGAGGGGAGGGGACAAGAGAGCTAGCGGTCCCGCCCGGTGATGTAGGCAGCCCGGGGAGGTGGAGCCGCGACGCCTGAAGGAGTCCCCACCGCAGTCTCGCGCTCTCGGTCTACCCCTCCGAGCGGCCAGCCGCCAACCCCAGCTCCGGCGACCTCCCTGCCGCCGCAATTTGGGCGGCGGGGACTGCGGGATCCCCCCCCCCAGTTCGGGCCCGGGGGGCCCCTCCACCACGCCCAGCCCCCCTCCCCTCCTCGCTTCCCGGACGGCTGGAGCTACTCCCGGGGGAAGCTGTTCCCGGACGCTCGGCCGCCGCCCCGGCATCTCGGCTGCCAGCCCGGCCGGGCACCGGGCATCTCCGGGCACCGACTGGCTCCGGCGCCGCCCAGCTGCTCGCGACCCCGGGGCCGCGGGCTTCTGCTCGCCCTCCCCTCCCCCGGCCGCCGGCCAGGACGCCCGTGAGCTCCCGGTGCCCCCAGCCCCTCTGGCCGCCGCCGCCGCGATGCTGCCCTGGAGACGCAACAAATTCGTGCTGGTGGAGGACGAGGCCAAGTGCAAGGCGAAGAGCCTGAGTCCGGGACTCGCCTACACGTCGCTACTCTCCAGCTTCCTGCGCTCCTGTCCGGACCTGCTGCCCGACTGGCCGCTGGAGCGCCTGGGCCGCGTGTTTCGCAGCCGGCGCCAGAAAGTGGAGCTCAACAAGGAGGACCCGACCTACACCGTGTGGTACCTGGGCAACGCCGTCACCCTGCACGCCAAGGGCGACGGCTGCACCGACGACGCCGTGGGCAAGATCTGGGCGCGCTGCGGGCCGGGCGGGGGCACCAAGATGAAGCTGACGCTGGGGCCGCACGGCATCCGCATGCAGCCGTGCGAGCGCGGCGCCTCGGGGGGCTCGGGGGGCTCGGGGGGCCGCCGGCCGGCGCACGCCTACCTGCTGCCGCGCATCACCTACTGCACCGCGGACGGGCGCCACCCGCGCGTCTTCGCCTGGGTCTACCGCCACCAGGCGCGCCACAAGGCCGTGGTGCTGCGCTGCCACGCCGTGCTGCTGGCGCGGGCGCACAAGGCGCGCGCCCTGGCCCGCCTGCTCCGCCAGACCGCGCTGGCGGCCTTCAGCGACTTCAAGCGCCTGCAGCGCCAGAGCGACGCTCGCCACGTGCGCCAGCAGCACCTCCGCGCCGGGGGCGCCGCCGCCTCGGTGCCCCGCGCCCCGCTGCGCCGGCTGCTCAACGCCAAGTGCGCCTACCGGCCGCCGGCCGCCGAGCGCGGCCGTGGGGCGCCGCGCCTCAGCAGCATCCAGGAGGAGG
ACGAGGAGGAGGACGCGGACGCGGAGGAGCGCGAGCGGCCCGAGGTGCTCAGCCTGGCCCGGGAGCTGAGGACGTGCAGCCTGCGGGGCGCCCCGGCGCCGCCGCCGCCCGCGCAGCCCCGCCGCTGGAAGGCCGGCCCCAGGGAGCGGGCGGGCCAGGCGCGCTGAGAGCGCGGCGGGGGGGGGGTGCGGGGGGAGGGGCGCGGGCCTCGCGGCCCCAGCCCCCCGCCGGCCTGACTTCCAGCCTCCAACCCTGGCCCTGCCCGCTTCGGCTCCCCTCTGGTCCCCCGGCCCTTGCCTCCCTCGTGGTCTCTGTTGTTGTCTGCCCCGCGTCTCATCCTGGCTCAGGGTGACGCCTGATACGCCCTTGATTATTGGGGGACAAAGGGGAGGAGAGCAGCAGAAGTACTCGATGTTCGCCTCTCCCCCACATCCGGAGTTGCTGAGCGCCCTCCATCGTGGAATTGCTCGTAAGCTTTACAACAGGTCTTTGCCCATAGACCACCCTCTCCCTCCCAGAACAACCCCTCCAAAGAAGGGGGAAGAAGTTTCCAGAAATCCAGGAGGGTGGCCCTGGACGTTGGCCAGGTGGAAGCCGTGGTCCTGCCCTTGGCCAGTCAAGCCTTCCTCCCTGGGATGGGACCAGTTCTGGGCAGGCATGCTTGCAGAGAAAGAATAGTGGCCCGGGAGACCGGAGGCCAGGTCCAAGGTGGGAAGTGAGTCGGCTGCCATATACACAAGGAAGGATTCTCAGGCCCTGTGCCTGGCCTCTCTACCCCTTGGAGGATTTCTGGACTTCACTGCTCCATCTCCGGAGAAGACTGGGCTGGTCCTACCAACCCAAACAACAGGTTAGAGCAGGTAACAGCCCTCTGCTCTGGGCAGCTGCCCAAGAGTATGCCCTGGCACCTGGCACCCCCACAAGACTCCACCCACCCCACATCTCTGCAGACAGATGTGTGGGGTTCCCCACTAGGTGCCTCCAACTAGGACCAAGATGGGGTCTCCAAAGGAGGTAAGGAGAACCTTTGGCAGGTGCTTGAGGACACTGACCACCCAGAAAGTGGACACAGGAGGGATGCCCTCCCGTCCCCTCCCGCCCCCTGAGTCGGGGCTTGTCAGAGCAGGAGGGTCCTGACAGCAGTTGGGTTCTCATAGCCGGCTGAGGAAGGAGAGTGTGTTCACCCAGCAGAGGGAGTGGGCCCCCTGCCCAGGTGTCCCAACAAGGCCACAAAAAGCCCAAAGATCTATGTGTCACCAACTGATCGTTGTAAATAAAGTGGACCTGCTTTTTCA\n>MN887529.1 Glyphodes pyloalis putative family 31 glucosidase KIAA1161 protein mRNA, complete cds 
\nGGGGGGGGGGGCAGTAGGTGTGTGAGACAAGATGAAGCTGATACTTCTGTTGGCAGGCGTGTCGGTCGCGCTGGGCGGTATTGCGCGCGCGCCGACCAAGCGTGACTTCTTCGTCGACCAGCGGGAAGATGGCGGCCTCGACTTCATCGTGGTGTCCAGCGAGAAGGGTACACTGACCCTCGGGCACATCGGCCGCAAGGTGGCCGCAGACGACCCTGAGGTGACCTTCGACATGGATGCGCAGCTCGATGAGGCCAGCGGCGGCTGGAAGGTCACCATCAGCTGGGAAGGGCCCAGCGACAGAGTCTTCGAGGACTGCTTTGGCTTCAGAGGCAAAGAATGGTACGGAGGTCCCGAGCAGAAGGAGCAGTACTGGCCGATTCAGCACGGGAAGCTGGAGAAGTACTCCATCATCTCTAAGGAGGACGACAACGCCGCCGTCTCCGAGAGATACTGGCTCAACTCCGCCGGCTACTACTTCTACGTACACCCAGAGGCTCCCCTCTTCGTCGACTACCACAACACCAAGAACGATAACATCTGCTTCATCGCTGAAGTCGCCGCACCTTACTCCACCAAGCGTACACACAACGTTCTCAAATACGACATCTGGTTCTTTGACAACGCCAAGGTCGCCCACCAGCACGCCGTTGACACTTACCTGGGAAAGCCATCTGGCATTCCAGACTACAGAATGATCCAATACCCAATCTGGAACACTTGGGCGAGGTACTCCCGCGGAATCGACGAGGATCTTCTATGGGAATTCGCGAATGAAATCGCGGACAGTGGATTCCCTAACTCTCACTTTGAAATCGATGACCAATGGGAGGTGTGCTATGGATCTCTGACCGTCGATGAGGGCAAGCTCCCCAACTTGAAGCAGTTGGTTCAGAAAATCAAAGGACTTGGATTTAGAGTCGGCATGTGGGTGCATCCCTTCATTAACCAGGATTGTGAGCCTTGGTATTCTGAAGCTTTAGAAAATGGTTACTTGGTACTGAATGAAGAAGGAAATCCAGAAACCAGCTGGTGGAACAACAATGGCTCCATCCCTGCCTACGTTGACTTTACCAACCCTGAAGCCAAGAACTGGTACACCTCGCGAATCCAGAACCTCATTGACACTTACGCTTTGGACACTCTCAAGTTTGACGCTGGAGAATCGAGCTGGTCTCCTCAGATCCCAGTCCAGAATGGTGACATCGACCTTCATCCGGGACACATCGTGCAGGAATACGTGCGCGCAGTTGTCCAGTTTGGAGACATGATCGAAATTAGGTCTGGAATAAGAACCCAGGATCTGCCTGTGTTCATCCGTATGGTCGACAAAGACACCTACTGGGGCTTCAACAACGGCCTGGCGACATTGGTCACTACTCTGCTCGCAATGAACCTGAACGGCTACACGCTGGTCCTGCCCGACATGATCGGCGGCAACGGGTACAACGACAAACCAGAAAAGGAGCTGTTCATCCGCTGGCTTCAGGCCAACGTGTTCATGCCTAGCCTGCAGTACTCCTTCGTGCCGTGGGATCATGATGATGAGACCGTTGAGATCAGTCGCAAATACACGACTTTGCACGCGGAGTACGCCGACACCATCGTGGCTGCCATGGAAGCCTCCGTGAGGGACGGCACTCCTGTCAACCCTCCCATCTGGTGGTTGGACCCAACCGACGAAGACGCTCTAGCAGTTTGGGATGAATTCCTCCTCGGTGAGAAGATCCTAGCAGCGCCGGTGCTCGAAGAAGGCGCGGTGTCCAGGGACATCTACCTACCCACAGGCTCTTGGCGCGACGGCGTGACAGGCGAGTTGGTGCAGGGCCCAGTCTGGCTCATCGACTACTCCGCCCCCCTCGACACGCTGCCCTACTTCACCCTGGAAGATTAAGTCGAGACCTTCAGAAGGGTCTTGGGAGTTCCTAATTGATAAGTTTTAAAATAAAGTTGTTGTTTTCAAAAAAAAAAAAAAAAAAAA\n>JX367473.1 
Uncultured fungus clone 035A13021 18S ribosomal RNA gene, partial sequence; internal transcribed spacer 1, complete sequence; and 5.8S ribosomal RNA gene, partial sequence \nAAAAAACGCTTGGTCATTTAGAGGAAGTAAGAGTCGTAACAAGGTCTCCGTAGGTGAACCTGCGGAGGGATCATTACACAATAAAATATGAAGGCCTGGCTTCGCGGCCGGCTGAAATATTTTTTCACCCATGTCTTTTGCGCACTTGTTGTTTCCTGGGCGGGTTCGCCCGCCACCAGGACCAAACCATAAACCTTTTTCTTATGCAGTTTCCATCAGCGTCAGTAAAAACAATGTAATAATTACAACTTTCAACAACGGATCTCTTGGTTCTGGCATCGATGAAGAACGCAGCGAAATGCGATACGTAGTGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACNCACATTGCGCCCTTTGGTATTCCAAAGGGCATGCCTGTTCGAGCGTCATTTGTACCTTCAAGTCTTTTGCTTTGGTGTTTGGGTCGTTTTTTGT\n>XR_006640209.1 PREDICTED: Bubalus bubalis uncharacterized LOC123465122 (LOC123465122), ncRNA \nGCCGAGAGAGTAGGTCGTCAGGCGGCCCTTGAGTTTTTTTCTCTTAGTGTAAACGTGTGCTGCGCGCTTAGCCGTCCAACCGGCTCTCGCCACGCCCATCTTCAGGGTCCCGCTGGTTCGGTCGACAGCCCGGTTTCCGGAGAAGCCGCGTCCTCTCCCCGGTCCTGGGATTCTGGAGAGCCCGGCCGGCCCCCGAGACCCCCTTTCTCCCACCCTCTGCCCTCGCGTCTCCTCAGGCCAATCGTTCTGTCCCGCAGGCCTCCCTTCCTGGGATGGTTAACCTTCAAGGATGTGGTGATCGAATTCTCTCAGGAGAAGTGGGAATGCCTGGACCCTGTTCAGAGGGCCTTGTACAGGGACATGATGCTGGAGACCTAGAAGAACCTGCTCTCCCTGGATCTATCTATCTGATACATGTGGTCAACCAATTACAACCCAAAGCAGACAGTGATACAGGAGAAGTATTCCAAACAGCAATCTTGGGAAGACCTAAAAGTCATGAAATCAAACATTTTTACCTCAGAGAACTCCAGGAAGACATGTATGACTTTGAGTATCATTGGAGAAGTGGTGGAAGAAATAACAAAGGAACGCGTATAACTCATGACAGAAATCTCACTGATGGCAGAGGTCAACAATGTAGAAAGGATGTGGAAATCAAGCCCTTTGTAAATAGGCTTGGATTTAACATGCAGGATAAACTTCAGATATTTCAAACTGACGGGATAATTTCTGAATGTAATAAAGTTACAAGGTAGTCAACAGTAGTTT\n>XM_023049778.1 PREDICTED: Onthophagus taurus uncharacterized LOC111417487 (LOC111417487), mRNA 
\nTTTAAGTTTTTTAATAAATAATTTTTAATAACAACTTTTTAGCAACAAAAATTAAAAAATGTGTACACCCGAACCGCTTCAACTAAATACAACAAAAGGAAAATGTTCAATCTCACCTTTCACATGCATTTTAAAGTTTTTGATACGTTCGTTGGAATGTCCGGAAAGTGAAAAGTTTATTTCACGTTTTGAGGATCAATTAAATCAATTGATTGCTGTTGGAGGTGTTAATGTTTCCGTTCGCGAATTAGCTGATTTAATAAAACTAATTTCTTTAACGTTTCAAAGAATCGATGAAAAACCTGCTTATTTAGAAGCTTTTTATAAATTATTAAATTTTAGTTCGCAAAATTTGGTATTTTTGATAACCAGCGACATGATAAGTTATGCTGAAATTATACAAGATTTTTTCAACATGCTGGGTTATTTACTGGGTAGTACAGAAAATCTGGATTGCATTCAACACATTTTAAACAGCATATTAAAAATGATTGCAATGGCAAAGAAAAAACCTTATTTACAATCAAAAGTACTTTTAGACGCTTTTGCAAATAGTCAAATACCACCGATTTTTAGCGAATTACTATACATATCTGAATTCGACGTTTACATCAAGTATTTAACAGTTTTAGAAAAATTCTTTGTATCGGAAAGCATCTGTCAAGCCTTTTTAAAATGTAAAGTTTTCGACACTGTCGTTCAAAGGGTTTGTTTAAAATGGAGAGATGAAATTAATTACCCAGATGAAGTTCTTCCAACTTTAGATTTACCACCACATTTAAATGTAACCCAAAGGATTCTTTGGACATTAACAATGATTTATAACGATAGCTCGACAACTTTTAAAAATAGTATTGGGTATTTAGTTGAAGGATCTTCTTTGAGAGGTCCTCGCAATGTTTTAATAACATTAATAACATCAAATAAAGATAAACACATGAGAAATATGTTTTATCTGCTTTTAAGAGCGATTGCTGGTACTGTGCCTTTTCGTCATTATAGAAGTTTAAATAATGAATTGCATATTTTAACGTTTACAACTGAAGTGGAACAATCTCATCCTTGGGCAAAAAGAATGGTGTTACGTGCAGATGATCTTGATTTTGAGTTTAAAATGATGCTGGTTTCAATGTTATGCATTAATAGAGTTTACCCACAAAGCTTAGATCTTTTTAGAAAAATGAATGCCGTTCAAGGAATTTTTACGTTAATCGATACAGATATACAATTAATTTGGTCGACTTATCAACGGTTAGAATTAATGAAAGGGGCATTAATTGGAATGGAAAATATGATTTTTCATGTCATCGATGATTATATTCACTACGGGGGACCTGGTAAATTATTAAAAGTTCTTACAAAAGTTGTTGAAGGTGAACTACATTCAACCCTTTTATTACCAATATTAAGATGTATTAATACATCCTTAAACGTTCCGAGTAATGTGCAAGAAAAGGTCGCTAAACTTTACAGAATGAAACATATCATTGAAATTTTAACAACTACAATTGAAAATGTAATTAATGCTGAATTCATAACAAAATTAAACTTAAGCTGTTTAGCTGTAAGTTATTGTATTTTGGAGAAAGTTGCGAAACCCAACGAACCAAAATTAACAGACGTAACAAAAACGGGAATTGCAATTTTAAAAAAATACTTAAATCCAGATCCTAGTATTTCTTTCTTAGCACCGAAAGTTCTCATTGCTGTGATGAGTTTTATATGGGAAAATGTAGTTTATTGTGAAAACGGGATACACGAATTCAGTTCTACAGGTGGCGTTTACGTCATCTTAGACATAATTGAGAAATTTCCTCTTGCCATTAAAGTTTTAGGTTTAAGCATGATAGCTGATTTTTGTCAAATTCAAGAATTTCTTTCATGCATTTTAACTTGGAAAGGTAAATCTGAACAAACGATTGTTCCATTTTTATTGGATATTTATAAAGATCAAGCTCGTTTTGATAAAGATCACACTGATATAAAATCAACACTTCA
AGATTTAGAAAATCCAATTTTTGGTGATAAATACAACGAAATGAAAAAGAACTACATCAACAACGAATATGCAAGTTTCGCAACTTTGGATTTTTTAGGAAATTGTAAACCATCAATCTACGCAATTTTAACACTTTTAAGATGCGACGAAGACAAAGAGTTAATTAATAACACGTATAAAATATCAAAAGAAAATTTAACAAACAAAGAAAAAATTGTTGCTGCGTTAGCTGAAAATTATCTTCCATTATCGATAGGTGAATCTTGGATAGAAGTTAATCAACATTTTCAAACGAAAGGAGTACGCCCGTTAGTTTTCGATCAAATACTAATCGCTGCAAAGCTACAAGAACATCGTGAAAGAGCCAAATTAATTCAAATTGATCAATTGACATGTGAAATTTCTGAAAATAATCGCGAAATTTGTGTTGAACGGCAATTTTACGAACGTCTCCGAGAAGAAGTTCTCAACGAGTCTTTAGATGCATTAAACGAACTTCGATATTATACAAGATGCGTTGATACAATGGCTCGTTTAGAACAATGTACTCAACTTACTTTTGAAACTGAAAATGTGACCGCTGGTCGGCTTGATAAATCGATGTTGGTCGACTATCATAAAACTTTACCCGAATATATTAATATTACACCACATTTTAATCAACATGTCAGCATTCAAAGTAACGTCATTATTGATCCTAACAAAGAAAAAACTCCAGATGCAGTTTCTTTAGATAGCACCGAGCAAGGAATTATAGCTGCAAAAAAATTTGCTGATTTAATGCGTAAACGTGCTCCTAATCCTAATCCAACTTCTTATGATGTTACACGTTCGAAATATGCACGTTATTACAGTGTTGATTTTCATTAAT\n>XM_020844603.2 PREDICTED: Dendrobium catenatum transcription termination factor MTEF1, chloroplastic (LOC110112391), mRNA \nTATGCGGACAATGCTCAATGCCACTCACACTCACTATGCTCAGTTTCCACTCCCCTCTCGGTTCTCTCACTCACCCCAAACCTCTCCAAACGCTAAACCCTAATCCAGCCCTCCGATTTTTACCTCCGGTCGCTGGCACCACTTACATCTCCGGCAACGACGCGGGCTTGCGCTTCCGCGAAAAGCTTCTCTTCCTCGAACACGACCTTGGCGTCAATTCACTCCGCGCCCTTTCCCTCAACCCTAGCCTCCGCTCCGCTCCTCTCTCCTCTCTCAAATCGCTATCGTCCCTCCTCTCCTCCTTCGGCCTACTTCAATCCGATTCCTCTCGGGTCCTCTCCCTCCACCCCTCCCTCCTCACCGCCGATCCATCCGCCTCAATCCTCCCCGCCATCCACTTCCTTCTCGACACCGTATCCATCCCCTTCTTGGACCTTCGCCTCTCCATCAACCGCTGCCCTAGACTTCTCCTCTCCAGTGTCCCCGATCGCCTCCTGCCTTCCTTTAATTTCCTCCGTGGCCTCGGCTTTGTCGGTCGCCACCGCATCACCGCTCGTACTACTGTCCTTCTCATATCTGATGTTGAGGAGACGCTCATTCCCAAGCTTGATTTTGTCCAGAGCCTTGGGTTTTCTTATACGGATACTGTGAAATTGGTTTTGAGGATGCCTAGTCTGCTCACTTTTAGCGTTGAGAAGAATTTTCGGCCTAAGGTGGAGTTTTTAGTGGGGGAAATGGGGAGGGAAATTGTGGACTTGAAGGAGTTTCCGCAGTACTTTGCTTATAGTCTTGAGGGAAGGATTAAACCGCGACATACAATGATGGTAGAGAGAGGCTTTGGCTCCTCATCTATTTCACTTGGGGAGATGCTCAAGGCCAGTGATGGAGAGTTTCGAGAACGGCTACTAGAGATGCGGCTTAGTTCCGTGGGTGAGAAATTGTAGCTTGGTATGATGTGGGTTTCTTTTCCCCTTTCCAATTTTTTGAAGAAGTTGCATGCC
TCCTAGATGCATACTTAGATTTGTAAATGTAAAATATTTGATGGGCCTGCCACATTAGTATTGTTGTAATAAGTACAATTCCCTGTATGTTATTATATTTTTAATTTTTGCTTATTTGGCTACCCAATA\n>XM_026866306.1 PREDICTED: Athene cunicularia multiple EGF like domains 10 (MEGF10), transcript variant X1, mRNA \nCAGGACTCTTTTGGGGCCTTTGGTGAATTTAAAGGATTTACACAGCAAGTAATAACATTATCACCTGCCATCTTTTTTTTGGAAAGATGTTTCTTCATTTGAATTTCTTTTTTGGCTTCCCTGTCATATTCCTGTACAACTGGATGGGGACAACTTTATCTTTGAATCTGGAAGATCCCAATGTGTGTAGCCATTGGGAAAGTTACTCAGTTACAGTGCAAGAGTCATATCCTCATCCTTTTGATCAAATTTACTACACCAGTTGTACTGACATCCTGAACTGGTTTAAGTGCACACGACACAGGATCAGTTACCGTACTGCCTACAGACATGGTGAAAAAACAATGTACAGACGTAAATCCCAGTGCTGCCCTGGTTTTTATGAAAGCAGGGAAATGTGTATCCCTCATTGTGCTGATAAATGTGTCCACGGTCGGTGTATTGCTCCAAACACCTGTCAGTGTGAGCCTGGCTGGGGAGGACCCAACTGCTCCAGTGCTTGTGACAGTGACCACTGGGGACCTCACTGCAGCAGCCGCTGCCAGTGCAAAAATGGAGCCTTGTGCAACCCCATCACTGGAGCCTGCCACTGTGCATCAGGTTTCAAAGGTTGGCGCTGTGAGGAGCACTGCGGTCAGGGGACGTATGGAAACGATTGCCATCAAAAATGCCAGTGTCAAAATGGAGCCACCTGCGACCATGTGACTGGAGAGTGTACATGTCCTCCTGGATACACTGGTGCCTTCTGCGAGGACCTTTGTCCCCCTGGGAAGCATGGGCCGCAGTGCGAGGAGAGATGCCCGTGCCAGAATGGAGGCGTCTGTCACCATGTCACCGGGGAGTGTGCCTGCCCACCAGGATGGATGGGCATGGTCTGTGGTCAGCCTTGTCCTGAGGGTCGTTATGGAAAAAACTGTTCCCAGGAGTGCCAGTGCCACAATGGAGGGACCTGTGACTCAGCGACAGGTCAATGCTATTGCAGCCCAGGTTACACAGGAGAACGATGCCAAGATGAATGTCCAGTGGGAACTTATGGAGTGCAGTGTGCTGAGACCTGCAAGTGTATGAATAGGGGGAAATGTTACCATATTAGTGGTGCCTGTCTCTGTGAACCAGGATACACTGGAGAGCACTGTGAAACAAGGCTTTGCCCTGAGGGAATTTATGGTCTCAAGTGTGATAAAAAGTGTCCCTGCCACATGCCCAATACCTGGAGCTGTCACCCTATGTCTGGGGAATGCTCCTGCAAGCCCGGCTGGTCTGGACTCTACTGCAATGAGACATGTTCTCCGGGATTCTACGGCAAGTCATGTCAGCAGATCTGCAGCTGCCAAAATGGTGCTGACTGTGATAGTGTGACTGGAAAATGCACCTGTGCCCCTGGATTTAAGGGTGCTGCTTGTGGTACCCCTTGTCTTCCGGGGACATACGGAGTAAACTGTTCGTCTGTGTGCAATTGCAAAAATGAAGCTATCTGTTCACCAGTAGATGGTTCTTGTGCCTGCAAAGCAGGTTGGCATGGTGTAGATTGCTCAGTAAATTGTCCCAGTGGTACCTGGGGACTTGGCTGTAACTTAACTTGCCAGTGTCTTAACGGAGGGGCTTGCAGTGCTCTGGATGGAACCTGTACCTGTGCCCCGGGCTGGAGAGGAGAAAAATGTGAACTCCCTTGCCAGGACGGCACTTATGGTATGGATTGTGCTGAGCGCTGTGACTGCAGCCATGCAGATGGTTGTCATCCCACCACAGGTTAC
TGTCGCTGTCTACCGGGATGGTCAGGCATTCACTGTGACAGTGTGTGTGCTGAGGGACAGTGGGGTCCAAATTGCTCATTGTCCTGTTACTGCAAAAATGGAGCATCCTGCTCTCCAGATGATGGAATCTGTGAGTGTGCACCAGGATACAGAGGCACCACTTGTCAGAGAATTTGTTCTCCTGGGTTTTATGGACACCGCTGCAGCCAGACATGCCCCCAGTGTGTACACAGTAGTGGTCCCTGCCACCATATTACTGGCTTATGTGACTGCTTACCTGGATTTACAGGAGCCCTCTGTAATGAAGTATGTCCCAGTGGCAGATTCGGCAAGAACTGCATTGGAATATGCACCTGCACCAATAATGGAACATGTAATCCTATTGATAGATCCTGTCAGTGTTACCCTGGCTGGATTGGTAGTGACTGCTCTCAGCCTTGCCCACCTTCCCACTGGGGACCAAACTGCATCCACACGTGCAACTGCCATAATGGAGCTTACTGCAGTGCCTATGATGGGGAGTGCAAATGTACCCCAGGATGGACTGGCCTGTATTGTACACAAAGATGTCCTCTAGGGTTTTATGGGAAGGACTGTGCATTGGTATGCCAATGTCAGAACGGAGCTGACTGCGACCACATCAGTGGGCAGTGCACGTGCCGCACAGGGTTCATGGGGAAGCACTGCCAGCAGAAGTGTCCTCAAGGTACGTATGGGTATGGATGTCGGCAGATATGTGACTGTCTGAACAACTCAACCTGTGACCACATCACGGGAACATGTTACTGCAGCCCAGGCTGGAAAGGTGCCAGGTGTGATCAAGCTGGTGTAATTATAGTGGGAAACTTGAACAGTTTAAGTCGTACCAGTACTGTCATCCCTGCTGACTCTTACCAGATAGGAGCTATAGCAGGCATCATCATTCTTGTCCTGGTTGTCCTTTTCCTGCTAGTGCTGTTCATCATTTACAGACATAAGCAGAAAGGAAAAGAAACAAATATGCCCTCAGTGACCTATACCCCCGCTATGAGGGTCATCAATGCAGATTATACCATTTCAGAAACCATCCCTCACAGTAATGGTGGAAATGCTAACAGTCACTATTTCTCTAACCCTAGTTATCATACTCTAACTCAATGTACTACCCCACCTCACGTCAACAACATCGACAGACTGACCCTAGCAAAGGCAAAAAACAATCAGCTGTTTGTGAACCTTAAAAATGTGCAATCTGGAAAACGAGGAACTGTCATGGACTACACAGGAACACTGCCTGCAGACTGGAAACATGGTGGCTACCTCAATGAGCTTGGTGCTTTTGGACTTGACAGGGGATATTTGGGAAAGTCCCTGAAAGATCTAGTGAAGAACTCTGAATACAATTTAAGTAATTGCTCATTAAGTAGTTCTGAGAACCCATACGCTACTATAAAAGACCCACCAACTCTTGTACCAAAAAGTTCTGAATGTGGATATGTTGAAATGAAGTCACCAGCACGCAGGGACTCTCCATATGCTGAGATTGCCAGCTCTTCTTCAGCCAGTAAAAATGTTTATGAAGTTGAACCTACAGTCAGCATTGTGCAGGGAGCATTCAGCAGCAGCGGACGTTTCAGCCAGGATCCTTATGATCTTCCAAAAAACAGCCATATTCCATGTCATTATGACTTGCTACCGGTTCGAGATAGCCCCACATCCTCTACAAAGGAGTTCAGCAGCGAATGACCCCAAAAGCTGATGTGTAGGACTCTGAAGGGGCAGAGTGGCATGGTTGTGCTCCTTCTTCTAATTCAGCATAATTTTTGGCTCTTAATCTGTCCAGCAAACAATTGCTGTACATTAAATAGAATCTCAACATGAGGTTTGTATTGTGTATACAAGTGACAGATGGGCAAATGCCACACTCTGGGGATCCTGATCATTCTTTTTTTCATGGCAGTAAATGTTACAGAAACAGGTATGCAACTCATTTATTCTATAATATACTGGCTTAAAAATAC
ATTTGCAGATTAGTTTTGATAACATCCCATTTCATCTACTTTAAATATAGACTTCATATTTGTCATGTTTCAGCGTAGAAATACTCCCAGGACAGTGCAGTTTACCAAATACCACTTTGTACAGGTGATCTGATTCACTAGTTACGTAGAAGAAAAACTGCTTTGCCAAATTTTACCTTCCATTGTGATCTTTAGTCAAGACATACTAAGAAACAAGATTGGATGGGGATAAGTAAGCACAATACTGCAGTTGTTTGGGAAATCCATCAGGCTTTTTCGTCTACTACTGGCAGTGGGGTATCTTGCTTGAGTAGTTTTGGAGATAAAAGCATTGCATACATCAATATTATATGATGCCTCAAGATCTATTAGTACTCCAGACCCAGCACCAGTCTTCAGCAAATCTTTTGCTATGATTCAGCTCCATATGTTGCAGTTCTGACCACTATGTCTGCCATACGCAAGTAAAAATACATATCAGTAATTCAGAAATTATGTAAATGAAATCAGTCTTACTTTTATCACCATGGACTGATTATGTAAGGAGTGGACAAAGGTGATGACTGCTGTAAATCTTAACTGCAAGGAAAGGTTTACGTTTTATAAACAGATAGTAATAATGACTGTAATATAGAATAAAAATAGTAAAGTGTTCTGTTTTTTTTTCTTAGAAATAACTAATCAATCTCTGTGCATACTTGCTAAAAAGGCACCTTTTTTTATAATTGATGTCATGCTTAAGCTGGTCTTTTGCATTGCTAATAATGTGACACGTACTCCCCATTCTTCATTAACTTGTGTCTCCTTGTTGTGTCTGTGTTTCTAGTGATCTAGCTTGTAATTGCAAAAGTGTTCTACTTTGTGTCCATTTATTTTGCATTTTTGTCAGCTGGACTTTATTTATCTGGTTAAAGGGACCTCTGGGCAGAGGGAGAGGATTAAGATGTTTATCCAGAGGTAGTTAGCTAATCCATAATAGTTTAACTTAATGAATTGGTGAAAAAAATCAAGGTGTTTTTCTCAAGGATAATTAAAAGAATGCTGAAGGAAAGTGAAAAGCAGTCCCTCTTGAAAGTTTAGCTTATTCTGATGACTATATGGATGGACATCATCTTTCCAAAAGGCTCCCTTCTCTCCCTCCAAAAGAATCTGTTATGAACTGCATAATTCAGAGAAAATTAAATTTGCCAAGGTATCCATCTGTTGAAGCAAAATTGTCCCCCAAACACATCATCCTAA\n>XM_053267654.1 PREDICTED: Hemicordylus capensis uncharacterized LOC128332879 (LOC128332879), mRNA 
\nAAGGCTGGCTCTCACGTAGGCGCAAACAGCGGGGAAGGCCGAGCGGCGGGAAGGAGGAAGCGAGGCAAAGCATAAGCCCCAGGATGGGGAGAGAGGGGCAGCATCTGAGCCGCACCTGGGGACTTCCAGTAGGGAAGAACAAGAGGCGCCCCTGGCAGGCAGCAGCCCTCGCAGCCTCAATCCTGAGTTCTTGCTTTCTCCTGACTCAAGCCAAGAAGAGAGTGATCTCCAACATTCCTATCACATTGAGCCCATTAAATCCAGTTAGTGGGCAGAGGGTTGTCTTTGCACTTGGAGAGCTTGTGAGACGGAAGTCCATTTGCGAGTGGTACCGAGGGTCCAGTGACAAGGAGAACAAGATATTGGAATATGACTTTGGGTTGACCCAGTCCTCCTTTTCTGCCATACACAACACCCTCAAAGGCATTGACAGTTACATCAAGGGTGATGCTCATACTGGGCGGGAGAAGGTGTCCTCAAACTGCTCCCTTTATTTGGATCAATTACTGTTAAGTGACACTGGAACATACACAGTAGAAATGAAAAGATCTGGACAAGTTAAACAAAGAGGGCGTGTTTTCCTAGAAGTCTCAGATGTTCCTCCTGATTTGGGAGCGATTCTCCCCGATTCTCCCAAGGATGATGGTGACTATGATTATTTGCCGACTCCATCTTCCATGCTAGTTCCTGCTCTTGATATACAAGATCCTTCTCATTTAAAGCTACCTCTGGAGATCATTTGGAGGATCATTATTGGGTCTTTGGCTGTGACCACAGTCCTGGAGTTCCTACTTTACTTCCTTCTTCGTTCCTGTTATTGGAGGAACAGAAATTCTAACCGAATTATCTCAGCTACTCCAGGGTGTGGGATGATTCCCTCTTCTGCAAAGATGCTGAATCAACATGGAGACCCCGCTGTGCAGAGCAAGCTGTGA\n>XM_046173440.1 Alternaria rosae uncharacterized protein (BKA58DRAFT_436843), partial mRNA \nATGCACGCTACTGCAGGCTCAATCTTAGGACCCACTAGCGCACACGGCCTGCCAATCACGCCAGCACTTGGCGGCCTCTCATCAGCGCACAAGCTCCAGCCCCGGGCGCCCCTTCCCTTCGACGCGATTGACGGCTCTTCTGACAACTCTCCCAAAAAGCAGTGCCACAACGGGAAGCCGGCTCCCAGACACCTCCAAGCACGCGCAACCCTCACCTCAGTCATTCGTTTCAGACAACAAACCAGCAAAGACAGCACACAGCAGCAACCTGCACCTAATACACCCCCCCGTACCATCACCGTCACATTCACCGTGCGCCAAGCAACGCTTCTCCCGGCACTTCCTCATCCGCAAACGCCTGCATCGCAAGAGCGACCGACTCTCGCCCACCTCGTTTCTGCCGTCCGTAATCGATTCCGGAGACCATTGCGCGCCCTTGCGAGGCTAATTGGCAGCTTCACTGGAACCAGCCTACCGGATCCAGCGATCGCGACGACGCTGAGCAAACCGCACCTGCCTCCCCGCCCACCGACATCCGCTCTCATGCCTATCGTGGCCACCCCTTCTTCATAA\n>XM_010558636.1 PREDICTED: Tarenaya hassleriana carboxyl-terminal-processing peptidase 2, chloroplastic (LOC104826103), transcript variant X2, mRNA 
\nAGAAAAACACAGCTGGAAATTTCTGGGGACGCGCTTTCATGGATGTCTCAGCGAGCTCCTCACTATCCCCAATTTTCACCAAGCATAATGACAATAGCAGGAGCCCTAATTTCTCTTCGAAGAACCCGGCATTCCAGGTGAAATCGTTTATTACATGCCAACCTCCAAAGTTTTTGGAAGTTGGCTTTACAAAACATGCAAGAAATGTCAGTATCAAGCCCAGGAGCCATGGAATCCTGAGAATCGTGGTCTTGCCCGAGTTTGCTCCAACCACAAGAAGCGAAAATCTGCGGAACAAATTTCTGCGTCTCGTCAAATGCAATTACCATAAGAACAGGCCTGGGGAAGTGGTCATGAATTGTTCCAACAAGTTCAGACAGAATGTCTCCCTTGCATTAGTTCGGCTTGTTTCTGTTCTGCTTGTCTCTTCCATCTCCGTTGTTCTCACTGAATCTCCATCCTGGGCTCTTACCGAAGAAAACCTTCTCTTCCTCGAGGCATGGAGAACGATTGATCGCGCTTATATCGACAAAACCTTCAACGGGCAGAGCTGGTTTCGTTACAGAGAGAATGCTCTGCGAAATGAACCAATGAACACGAGACAAGAGACATACATGGCTATTAAGAAGATGCTTGCCACATTGAACGATCCTTTCACCCGGTTTCTGGAGCCTGAAAAGTTCAAGAGTTTGCGGTCTGGAACACAAGGGGCGCTCACCGGTGTAGGGCTGTCGATAGGGTACCCTCCTGGATCGGGTGGATCACCAGCTGGCATTGTCGTTATATCAGCTGCTCCAGGAGGTCCTGCAAACAGAGCAGGGATTTCTCCCGGGGATGTTATCCTATCAATAGATAAGACTACAACAGAAAGCCTAACTATATACGACGCTGCAGGGATGTTGCAGGGACCTGACGGGAGCACGGTGGAGTTAACGATTCAGAGTGGACCCGAAACAAAAGTCTTGTCTTTGACGCGAGAGAAAGTATCAATGAATCCAGTGAAGTCAAGATTATGTGAAATTCCTGGTTCTGAGAAGAATGCCCCCAAGATCGGGTATATCAAACTAACATCATTCAACCAGAACGCTTCTGGTGCCATCAAGGAAGCAATTGAGACTCTAAGAAGCAACCACGTTAACGCATTCATATTGGATCTCCGAGACAATAGCGGTGGGCTTTTCCCAGAAGGAATCGAGATCGCCAAGATTTGGTTAGATAAGGGAGTGATCGTATACATTTGCGACAGTAGAGGCGTACGAGATATATACGACACAGATGGAAGCAATGCCTTAGCGGCTTCCGAGCCTTTAGCCGTCCTCGTTAACAAGGGAACGGCTAGTGCCAGCGAGATATTAGCCGGCGCCTTGAAGGATAACAAACGTGCCGTCGTGTTTGGGGAGCCGACCTACGGGAAAGGTAAGATACAGTCAGTGTTTCAGCTGTCAGATGGTTCTGGCCTGGCTGTGACTGTTGCTCGTTACGAAACCCCGGCCCACACTGATATCGACAAGGTCGGCGTAATTCCCGACCATCCGCTTCCTCGGTCTTTCCCGAAGGACGAGGATGCTTTCTGTGGCTGCCTCAAGGATCCCGGAGCTGAGTGTTATCTCAACCAAGGCCAGCTGTTTTCTAGATGATCATTCTTACTTCTCAAGGATGAGCATTCTTTGTTGAAGATTTTTCCTTACCTGTAATCCTTCAAAGATGTAGAGTTTAAGATACATGTATAAATATAAGAACCCATGACAATGGGAACCAGTTCAAGTCATTAAGACAGAACAGACCATGGATGGATTTCTAACTTCCTCTGTACTGTCTTGTTGTTTCAAGAAACAATTTCTCAAGTCTCAAA\n>EF527335.1 Lepiotaceae sp. 
PA501 internal transcribed spacer 1, partial sequence; 5.8S ribosomal RNA gene, complete sequence; and internal transcribed spacer 2, partial sequence \nGTAGGTGAACCTGCGGAAGGATCATTATTGAATACCACTCGATGGGTTGTAGCTGGCTCTTTGGAGTATGTGCACACCTGTCTTGATTCTATTCATCCACCTGTGCATTTTTTGTAGTCTTCTGAGGGTTGGATCAGTCGAAAGACTGGATAAGAAGAGGATTGCAAGCACGCAAGTGCAAGCTCTCTTCAGTAAACCAGCCTTTAGAGTCTATGTCTTTTTCATAAACGATGTATAAGAATGTGATCAAATGGGTCTTTGTACCTATATAAAATGTCATACAACTTTCAGCAACGGATCTCTTGGCTCTCGCATCGATGAAGAACGCAGCGAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACCTTGCGCTCCTTGGTATTCCGAGGAGCATGCCTGTTTGAGTGTCAGTAATTTCTCAAACCCTTCTGGCTTTTTGTAGTCGGCTTGGGCTTGGATAGTGGAGGTTTTGCAGGCCCCCCCCCCCTGTGTCTGCTCCTCTGAAATGCATTAGCGGAACCTTGTTTGCGATCCGTCACTGGTGTGATAATTATCTACACCAAGTGGGTTGCTCTCTAGATGTTCAGCTTCCAATGGTCCCTCTGTGTGGGACAACTTTCTGACTTCTTGACCTCAAATCAGGTAGGACTACCCGCTGAACT\n>XM_002141234.1 Cryptosporidium muris RN66 flavodoxin-like fold family protein, mRNA \nATGACTAGGAATGGGGTAACTGGTCCAGATGGTGCACATATATTGGTAATCTTGTCACATCCAGGGAAATCAATAGCAAATCAAGCAATAATTGATACTCTAGTTGAGAAGTTTGGCCAAAATATTCAGGTCAGACACTTGAATCAACTTTATCCAGACCAGAAGATAGATATAGAAGCTGAACAAAGAGCCTTAATTAGTGCAGAGCTTGTTATCTTGCAATTCCCAATGTATTGGTATAATATGCCTCCCTCATTAAAGAACTGGCTAGATTTGGTTCTCTCCTATGGATTTGCATATGGAACCTCGTATAAACTTGAGGATAAACTTCTCCTTGTATCTATTACCACAGGGGGTGAGGATAAAAAGTATGAAAAAAATACAGTAAATGACTATCTAATGTCTTTAGAATCAACATCAGAATTTATTAAGATGAAGTTTGCCGGTATACTAGCAGTTCATTCAATGCTATTAGTGCCAGGATTAGTGGGAGAGGAATCTGATATTAGGAAGAGAGCAAGTAACCATGCAAAACAAGTCGTCATCCCGAAAATTGAGAGTTTATTATCTAGATAG\n>JN440197.1 Uncultured organism clone SBYB_3348 16S ribosomal RNA gene, partial sequence 
\nAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATGCAGGCGTTATCCGGATTTATTAGGTTTAAAGGGTGTTCAGGCTGTCTGGTAAGTCAGAGGTGAAAGTCGGTTGCTTAACGATCGAATTGCGCTTTGAAACTGTCAGACTTGAGTATGGATGTGGTAGNCGGAATGTGTAGTGTANCGGTGAAATGCATAGATATTACACAGAACTCCAATTGCGAAAGCAGCTTACCAAACCAGCACTGACGCTGAAGCACGAAAGCGTGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCACGCAGTAAACGATGCTCACTCGCTGTTGGCAATACACCGTCAGCGGCTAAGGGAAACCGATAAGTGAGCCACCTGGGGAGTACGATCGCAAGATTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAACATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCTGGGCTTAAATGTGAAGTGCATTGTTTGGAAACAGACATTTCCTTCGGGACTCTTTACAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCGGGTTAAGTCCCATAACGAGCGCAACCCCTATTGTTAGTTACCAGCGCGTCAAGGCGGGGACTCTAACGAGACTGCCGGTGTAAACCGCGAGGAAGGTGGGGATGACGTCAAATCAGCACGGCCCTTATGTCCAGGGCTACACACGTGTTACAATGGTCGGTACAGAGGGCAGCTAGGCAGCGATGTCAAGCGAATCTCGAAAGCCGATCCCAGTTCGGATTGGAGTCTGCAACCCGACTCCATGAAGGTGGAATCGCTAGTAATCGCGCATCAGCCATGGCGCGGTGAATACGTTCCCGGGCATTGTACACACCGCCCGTCAAGCCATGGAAGTCTGGGGTGCATGAAGGCCGTAACCGCAAGGAGCGGTCTAGGGTAAACAGATGACTG\n>HQ302012.1 Uncultured bacterium clone E416QYJ01EWDEE 16S ribosomal RNA gene, partial sequence \nACGCTCGACACCTACGGGAGGAAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGGAGGAAGAAGGTCTTCGGATTGTAAACTCCTGTTGTTGGGGAAAAAGAGGATGGTACCCAACAAGGAAGTGACGGCTAACTACGTGCCAGTAGCCGCGGTAATCTGAGCGGGCTGGCAAGGC\n>XR_004686820.1 PREDICTED: Populus alba membrane-anchored ubiquitin-fold protein 3 (LOC118044643), transcript variant X2, misc_RNA 
\nTGTGTTTCAGTTCACCAACAAAATAACAAACAAAACACCTACTCCCCCTCCTCCTCCACCTTCTTCACTACCAATCCAAGCCCGTCTCCTTTTTATCTTTTTCCCAAAAAAAAAAGGCAGACTGTTAATTATTTTGTCATCAAAATTTAAAGAAAAGAAAAAGGTGTCTTTTTTGATTGGGGAAACCGAGAGTGGAATATTAAACACGTTGTGGTAATTGGTTGGAGGAGGAGAAGGAAACAGGTCAAAAGTCAAATAGAAATGCCGGAGGAGGATTTGGTGGATATAAAGTTCAGGCTTTATGACGGGTCGGATATCGGACCGTTCCGGTACTCATCAACGTCTACTGTTGATATGCTTAAGCAGCGGATTGTTTCTGATTGGCCCAGAGGCAAAACAATAACTCCCAAGGCAGTGAATGAAATCAAGCTGATAAGCTCTGGTAAAGTCTTGGATAACAACAAGACTGTGGGTCAATGTAGAACACCTTTCGGAGAAGCGGCCGGGGGAGTTATCATAATGCATGTTGTTGTACAGCCATCTCTAGCAAAAACCAAAACAGAAAAGAAGATTGATAAATCTCCGAAGAAAATCGTGTGTTCGTGTTCCATAATGTGAAGGCAAAGTACGTAGAAATCTCGGGAATTGCACCCATGGTACCAACACTTTAGGTTACAGAAATACGGATTC\n>XR_004968528.1 PREDICTED: Myotis myotis U6 spliceosomal RNA (LOC118659394), ncRNA \nGTGCCCGCTTCGGCAGCACATAGACTAAAATTGGAACGATACAGAGATTAGCGTGGCCCCTGCGCAAGGATGACATGAAAATTCCTGAAGTGTTCCATATTTTT\n>XM_034024519.2 PREDICTED: Acipenser ruthenus methionine aminopeptidase 2-like (LOC117414742), mRNA \nGCGCTTCCTCTCTCGTTGTGTTTCCATCATGGCGGACATGGTGCGGCAACAGGAGCAAGAGAAAAAATCTGAGCAAGAGAAACACTTGAACGGGGAGATGGAACCCGAAGACAAGGAAGAGGCGGATACGACAGAGGAAGCAGCAAAGAAGAAGAAGAAAAAGAAGAAGAAAAACAAGTCTGCAGGAAATAATGAAAATGAGAGTAATGCCAATGCTGCTGGTGTTGACAAAGTGACAGATCAACTGGAGAAACAAGCCCTGGAAGACAAAGAGAAGGATGAGGAAGGAGAGGAAGATGGAGAGGAAGGAGAAAATTCAGCTGGGAAGAAAAAGAAGAAGAAAAAAAAGAAAAAGGGATCAAAGGTTCAAACTGATCCACCTTCAGTTCCAATCTGTGACCTCTACCCAAGTGGAGTCTTCACAAAGGGACAAGAATGCGAATATCCATCTACGCAAGACGGACGAAGTGCTGCCTGGCGCATGACCAATGAGGAAAAGAAAGTATTGGATAAAGCCAATGAAGAGGTTTGGAGTGATTTCAGACAAGCAGCTGAGGCTCATAGACAAGTCAGGAAGTACGTCTCAAGCTGGATCAAACCTGGAATGACCATGATTGAGATCTGTGAAAAGCTGGAAGACTGTTCCAGAAAACTGATCAAAGAGAATGGTTTACATGCAGGCCTGGCATTTCCAACTGGCTGTTCTCTGAATAACTGTGCTGCTCACTATACGCCCAATGCTGGAGACCCGACAGTTTTGCAGTATGATGATGTCTGTAAAATAGACTTCGGAACGCACATCAATGGTCGCATCATTGATTGTGCTTTTACTGTAACGTTCAATCCAAAGTATGATAAGCTTCTTGAAGCTGTGAAAGATGCCACCAATACTGGAATCAAGTGCGCTGGGATAGATGTCCGCCTTTGTGATGTTGGTGAAGCTATACAGGAAGTCATGGAATCCTATGAGGTTGAACTTGATGGCAAAACATATCAAGTGAAGCCAATACGTA
ACTTAAATGGGCACTCCATTGGACAGTACAGGATACATGCTGGCAAAACTGTTCCCATTGTCAAAGGAGGAGAAGCAACACGAATGGAGGAAGGAGAAGTGTATGCCATAGAGACTTTTGGCAGCACAGGAAAGGGGGTCGTTCATGATGACATGGAGTGTTCGCATTATATGAAGAATTTTGATGTTGGACATGTGCCAATCAGGCTACCCAGGGCTAAACACATGCTGAATGTAGTCAATGAACATTTTGGCACGCTGGCTTTTTGCCGCAGGTGGTTGGATCGCCTGGGTGAGACAAAATATTTAATGGCTCTGAAGAACCTTTGTGACTTGGGTATAGTGGATCCCTACCCTCCACTCTGTGATACTAAAGGCTCCTATACAGCACAGTTTGAGCACACCATTCTGTTACGCCCCACTTGCAAAGAAGTTGTGAGCCGTGGAGATGATTATTAAGCTCTGCAATTTATTTTCTTTCTTACATTATTTTTCCTGACAAGCTTTATCCTTTCTCACTTTGCTTTGGCAGAAATCAGCATGAACTAATTAATCTGAAGCTCGGTGTCTGTCTAAGCAGGGGACTTGTATATCTGCCATGTTTTGACAGGGATGGGAAATAGGTGACAAACTAATGTTTTCAGTTTTTTGTATATTTCTTTCTTGATCTAGAAATGATGAATGTATGCACATCCTATTGCTGATTTATAACACCTATGCCCAGTGTAGGATTGCCTTTTGAATTTTCCTGAAAGTTTTTTTTTTTTGTAAAAATAAAGATTAAACTCAAATCTGATTATTGGTTTCAATATTAATTCAATGTGTTAATTCTTCTGATTTGTCTATTCATCTTCTTTCCCCTGCCTCACTTACTTTTAGAACAGAGCATTGTAATTTATGGTCTTTCTGATTTTAATTGGGCAAGCTACACTTTTTAAATGATTTAATTGTGATTTTATTTATCAGTAATTCCACAATCCTTGCCACAACTTCCATCCATGATTCAGTACACACTGGGAAAGCATCCACAAACACCAGAAAGTAAGGATATTTATGTAGGTAGTATGTTCTGAACTGTACTTGCCTTCATACACGCTTGATTATTTTTTTATTTGTTTAGTGTTTTTACTCCCAATATAATTAATTTGGTACTGAAACTACTTTTGGGAGCAGCAGCCAGAATTACATGAAGTCTTTTTACTAATTTCCTCTTAAGTGTGAAGATAAACAGACGTGATTCTGGCCCAGGTGATCTCTCGTGCAAGTTTTAACTTAGTGTGAAAACAGTATTAGGTTTCTAGGTAGCCTCACTACTGCATAACTGATTTGAGTTTGAAAACTAAAGATGGTAATGAAC\n>XM_046102345.1 Truncatella angustata uncharacterized protein (BKA67DRAFT_558781), mRNA 
\nGCCGCCGCAGCCCTTTCCACGCCCGGCGCCGCCTACTCATCCTACGACCAGGTCATTACATCCGATGACTCGGACCGCATTTTCCACTACTACCCCGACGTGATGAATGCCTTCGGCGTTTCACGTCTCCGTCTGAGCAGCATTGACGAGATTCCTAAGGGCGCCGATATCATCACCTTGTTGCCCGTGAACTATGATGAATCGGACTCTACCCCTGGAATATACATGGCAGTCGATACCAAGGGCAACTACTTCTACATCATGGCCTGTGACATCGAGGGTGACGCTGCCAAGATCTTCATTGCGTCTGATCCGGATGCTGGTGCTGCCAAACTTGCCGAGGCGGATCTGCGCTACATCGTTACTGGTGGTGTTGTTCAGGATTGTTCCTTCATGCCATTTGTCTCGACTGGTGCCGGTTTGTCTTAAATGAATTTGGTGGCGTAGTGCTGTGAGTCGTACATTTGGCAAAAGGCACCTTGGTTTCTTATTACCTTAATTTGGGGCTTTCTTTGAGTACTACCGTACAACCCAATTTTTCATTGTCACAGCCATGTACCAACCATCATATGAGTAATACTTAACTGGCCCACAGAAAGTATGCACTGGAAAGAGGCCTTCTATTTCCAGTGCAACAACAATATAAGCAGTTACCTCAAA\n>XM_052329315.1 PREDICTED: Diospyros lotus uncharacterized LOC127796910 (LOC127796910), mRNA \nATGGTCGCCGACGAAGCTTCGTCGTCGGCGACCATGGAGATCGACCGGGCTTCGTCGCGAACGAAGCCCCACGGTCGGGCTTCGTTCGCGACGAAGCCCGCTGGGGAGAGGAAGCGCCCGATCGGGCTTCAATTACAGACGAAGCCCGATCGGGCTTCGATTGAAGACCCAAGGAAGCCCGATCGGGCTTCGATTGCAGACAAAGCCCGATCGGGCGCGACTAAGCCCCACACCCAATTGGGCTCCCCCGACTGTTGGGCTATGACACAGCCCGATTATCGTTGCCCAACAAAGCCCAATCAAATGGCTGAACAACAAACTACAAAATTTGCTTATGTTCATGCTCACCGAATATTACCCCCCGGAATGCGAGTTACTACTCATTGTGGGATTAAACACCTTGAGGCGATGCGTCGTGCTCTAGACCGATACAAGTTATTGGATAGATTCCTACAGGGCCCATTAGGACATTTCTTGAAGATGCCTTTGTCCCTCCATTTGACTGCACCACAGTTGATATATCATGTTCTACTTAGGGAGGTGACATTTTCGAGTGCCCGCCACGATGAGATGTGGTTCGAGATTGGCGGCACACCATACAGATACGGGAGGCAGGAGTTCATACTTATTAGTGGACTCCGATTTGGGGCTATTGATAGGGAAAGCCTTGAACCGAAACCTATTGAGCCGGAGAGTTTACGTGCTCGACTATTTCCACAACATAAGAAAGGGGTGACTGGAGACGACCTTGAATTACTTATTAGTACCAAAGAGGATATGGTTTCAGAGGATGCCCTGAAACTGATTTACATTGCTGTGGTCGACATGTTTTTGTTGGGCCAGGATGAGCGTGGGCATGTGGATGATTTCTTGTGGACTATGGCCGAGGATTTACAAGCATTTGAGATGTTCCCTTGGGGTACATATGTCTACAGTAAGAGTCAACATTACATCCGGTTGGCCACGAAAGAAAGAAAATTGACTGGTGAAGGTGGGAAGAAAATCAACCTTTATGGTTTTGTATGGGCGTTTCAGTGGTGGTTGATCGAAACGTTCCCATGGATTCAGAATAAATGGGCCGTCAGACCGTCCGAAGCAGACATTCCAAGATGCAGAAAATGA\n>XM_019061330.1 PREDICTED: Bemisia tabaci neutral ceramidase (LOC109043949), mRNA 
\nATCATTGAAACCCCGTTTAGGTCAAGCTCGCAGTTAAAAATGGATTTCGTCCAGTGCGCTTGAGTACAGCAGGAGCTGAAGCTTTGTATTACTATAATGCGAGAACACTTTTTACTCTGAAAGGCTGGATAACTGAGAAGACCAAAGTCGTAGTTCGAAATGCCGGGTGTATCGCGACAAGTCTGTTTGATATTGGCCAGCTTTGTAGCTTTCTGCGAATCGGCTTACAAGATTGGAGTGGGGATAGGGGATGTGACTGGTCCAGCGGTTGGAATCCCATTCATGGGCTACGCAAACCTCAGGCAGAGGGGTGAGGGATTGCATTTGCGACAATTTGCAAGAGCTTTCATCATAGGTGACTCCTACGAGAAACTCGTTTTCGTGAGTGTAGACGTGGGAATGGGCGCACACGGAGTCCGAATGAAGGTGCTGAAGCGGCTGAGGGAAAAATTCGGCGAGGAGTTCTCGGAGAGGAACTTGATGATAAGCGGGACGCATACCCACTCGGCGCCAGGCGGGTTCCTCATGCATTTCATGTTCGACATTAGCACCATGGGCTTCGTCCCTGAGACTTATGACGCCCTTGTTTCCGGCATTGTTACGAGCATAACCCGGGCGAGGAGTAACATGCGGAAAGGAAGTATATTTTTCTCGACAGGAGAAGTTTTGGACGCCAATACGAACAGGAGTCCATCCGCTTATGACAACAATCCAGAGAGCGAAAAAGCCAGATTCGAGTACAACGTGGATAAAAGGCTGATTCAGATGAAATTCGTGGCGGAAACGGGTCAACCGATGGGCGTGCTTAACTGGTTCCCGGTGCACCCAACCAGCATGAACAACACCAACACCCTCATCTCCAGCGACAACGTCGGTCTCGCCTCTGTCCTCTTCGAACAGCAGATGAATCCGGGACGTTCTATCGGCAAAGGCCCTTTTGTTGCAGCGTTCGCCTCGAGCAACTTGGGGGACGTGTCGCCGAACCTACGATCGCCGGTCTGCCTGAAAACCGGGGAGCCCTGCGACATGCTAACGAGCTCCTGCCCGGACGAACATGACATGTGCGTCGCCCTCGGACCCGGCGAGGACATGTTCCAGAGCACAAAAATCATCGCTCAACGGATCCTCGCCACCGCTATATCTCTTTGGAATGATCCTAACTCATGGGAGATCAAAGGACCCGTCCGGATGGTTCATCAATTTGTGAACATGGCTAAGCGGGAGGCAACATATCAAGATCCAAATACTGGCCAGATCCGACAGGTGCACGGTTGCAAGCCAGCTATGGGCCATAGTTTTGCTGCAGGGACAACCGATGGGCCTGGTCTTTTTGCGTTCAAGCAAGGAACCAAAAGTCCGGACAATCCACTCTGGAACTCTGTTTCCAGGATACTGCCCAACGCTTCAGCAGAGAGTGTTTCCTGCCATGGAGGAAAACCAATCTTGTTATCCACAGGCGAGATGAACTTCCCTTTCCAATGGCAACCGGAGATCGTGCCGACGCACCTGGCGACGATTGGGCAGCTGGCGGTGGCCTGCGTGCCGGGGGAGTTCACGACGATGGCCGGCCGCCGACTCAGAACCGCCCTCCGCAATCGCCTCGGCCTCGCCGACGACACCCACGTTATCATCGCCGGCCTTTGCAACGAGTACAGCGACTACATCACCACGCCCGAGGAATACGAGGTGCAGCGTTATGAAGGTGCGTCAACAATTTATGGCCCAGAAACACTACCACTCTACATCAGGCAGTACGAGGACCTGGCTGATCATATTCTTCGGAAAATGGACCCAGAGCGGGGCCCAGTTCCTCCTGAGTTTCTAAACAAATTAATTGTTCTCACACCACCTGTTTTATACGATGCTCCACCCTACGACCAAGACTTCGGAGCTTGTTTACAACATCCACCACTGAACGTCACCAGAGGCGAAACTGTCAACACTACGTTCGTCTCGGGGCACTTGCGCAACAACATGATGCGCGGCTCCAGCTTCCTC
CTCGTCGAGCACCTTCCGATTAACGGGAACAAGTGGGAGGTCGTCGCCACCGACGCCAACTGGGAGACCATCATCACGTGGAAGCGGCAATCACTGCTACTGGGTACTAGTGCGGTGGTGATCAAGTGGACGGTGCCTGAGGACGCGCCGTTTGGGAAGTACAGGATCAAACACCAAGGCTACAGCAAACCCGTCATCGGGGCCCTGCACCAGTATCAAGGGCTCAGCAGAGTCTTCCAAGTTGTACCCAAAGATCTACCCTATTCATACGATGTCCCGCAAATACACGAGTGATCCTCTCAA\n>XM_034027490.2 PREDICTED: Acipenser ruthenus phospholipid scramblase family member 5 (LOC117416435), mRNA \nGAGGGATCGGAGACAGAGAGAGCAGCGACTTGAGAACAGAAGGCAAGCTTCATCCTCTGTGATCTACCGTACAGGACACAGTTCACTTGTGGCTGGGTGGAAGGATTTAAAGAGGATGCCGGTGATCACGGCCCAGCCGCCCCCCTTCGGCAGGCTGCAGAGGGAGAAGCACATCGAACAGCTCTTCAGGTCCTTACGCCAAGGGAGTAGGGGGTCCCAGGAGCCACGGCACAGTCTGGGAGAGGAGGCAGGACAGGGGGACTCTGAGACACTGGAGCTGCGTTGCACGACGGAGCCGGAGGCCCAGTCCAGCATCCCCAGAGTCCTCAAGCCAGCGGGCGCCACGGAGAGCAGCGAGCAGAGCCTGGCTCTCTTAGCGGACGTGGAGCAGCTGTGCATCATAGCCAGGCCGGGGCTCCAAGGACTGGCCTGTGAGCCTGGGAGGACCTACAGCATCTCCACAGCTTCCGGGAGTCAGCTCTACGTGGTGGTCGAAGACACGTCATGCCTGTGTCTGCTCTCCTGCGGTCCCGCTCGCTCCTGCTCTCTCCGAGGGTATGACAGAATGGCGCAGGAGGTCTTCCTGTTTGAGAGGCCCCTGAGGGCTGATGCGTGCTGTCTGGGCTGCTGCCTGATGGAAATGCAAGTGTTCACACCTGACCACCAGCTCATCGGGACTGTGCGTCAGAAGTGGAGCATGTTTACCCCCCTCATGGAGCTCAGCGACTCGGACGGGACGTCCTATATCAGGATTCAGGGCCCCTGCTGCCCCTGTCGTTGCTACTCCAGCCAGGAGTTTCAGGTGGTGTCCAAGATTGGAGACAAATTGGGAAAGATTTGGAAAAAATGGCCTGGCTTCAATGAAGAGTACAACATGGACCACGAATACTTCGGGCTGGATGTCCCAGCTGAAATGAGCCCGGAAACCAAAGTGCTGTTACTGGCTGCTGCGTTCTTACTGAACTACATGTTCTTTGAGATGAGCTGAACATACTGGAAGAGTACAGAGCGCCAGCCCTGACCAATGGGAGCACAGAGAGATCATGATGTCACAATGAAAGGTGTCACAGTGGCTGCACAAGGAGTAACGTTAAGAATCACATGTTTGTATCGGAAAACATTATTGCAGCAGTTTGAATGCCAGGGCATGGATAGGATTATTAACAGAGGCATTCACAGTGCAAGAGCCCCATTCAGACAATGCGCAGAAGGGTTAGATCACCCACAGCATATTCAACTAATGTAAAGCACTCAACTTTAATCCAATACCAGACACATACCTGCTCACCCTGAGATCGAAATCCTATGGATCATTCCAGCTGAAATCTGTGTCATAAAAAGTGCCCTGAAAAAATCTACCTTTAAAGAGCAAAGGAGCCCCCTTCAGGACATCATAAGCATGTAATGGCACCGGACTTTATACAATGACAGCATGTTGATGTAAGCAGGTACAGTATGTTAACATGAGCAGCACACTGTGCTCCTCAATGTGGTGAGGCTCACATTACTAATCTTGTGTTGTACTACAGTATATCCTGATCTGTGCTCCTCAATGTGGTGAGGCTCACATTACTAATCTTGTGTTG
TACTACAGTATATCCTGATCTGTGCTCCTCAATGTGGTGAGGCTCACATTACTAATCATGTGTTGTACTACAGTATATCCTGATCTGTGCTCCTCAATGTGGTGAGGCTCACATTACTAATCTTGTGTTGTACTACAGTATATCCTGATCTGTGCTCCTCAATGTGGTGAGGCTCACATTACTAATCATGTGTTGTACTACAGTATATACTGATCTGCAACATGTACCTGCATGTGACTGACTGATTGCAGGAGCTACATGTTTACAGCCACCTCTGAATCAAGACTCAGAATAGCCTTCTTTTCATGCTTTTTCTTTTTTAATTTGATAAATAAAAACGATTTTGTAAAATA\n>XM_048518335.1 PREDICTED: Sphaerodactylus townsendi coiled-coil domain containing 88A (CCDC88A), transcript variant X5, mRNA \nGAAGGGAGAGGCTGAAGCAGCTGTTTTTTTTGGGGGGGGGGGATGAAGGAATAGGCAACGGGTGGGGTCCTGCTAGCAGTAGTTGACCTACCATTTTTGAAAAGGCAAGTCGGGGAGGCACCTCCAGATATCTGGTGGTGGTGGCAGAGAGAGAGCGCGCCCCTGTTTCCTGGGAAAGTGGGCGAGGTTGCCCGGGCGCCTCTTGTCTGCAGAAAAGGAAGATCAGTGCTAGTTCGGTGGAAAGAGGAGTGGTTTTTCTCTCTGAGCTGGCCTTGGGTGAATGGTTGTTCCTGCAAGGAAGAGAGACTTGTTGGGGGCTGATGAGGGAGGAGGTCGCTGCTGCCCTCCCCGCGGCTGGCACGCTCTTGGTGGGTCAGGGGTAATTAGCTGAGAGGAGTTTCACTGGCGTGTCTCCCCCTGGAGCACGCCGGCTGCTGGCTCGCTGGTGCTGCAGCCCGAGGCGGAGTGGGGGGGAATGCATGCTTGCTTGCGCGGCTGATGTAGGATCTTAGTAAGGTCCTTCCTTTCTTTCTCTTCTTGCTTCCTCTTCGGCACGGAGAGAGGAGGAAGAAGGAGTCATTTGGTGGAAATAAAGAAAAACAACCAGAAATGAACGTGGACTGCCTCTTGATTGTTCCCTTTCTGGACGAGGAAGAGAAAGCTCTTTTGACCGATAGCCTGACTACTTTTTAAATTGTATTGGGGGAACTGCCTTGGATATATATTTTTTCTTGAAATCGTGGAGCATTTCACGGAATTACTGCAACGAAAGGCACCGAATCTCTCCGTTTTTTTAGTCCTGGTTTAATAAAAACCCTCTTAATTATAAAGCATGGAAAACGAAATATTCACGCCTCTGTTGGAGCTCTTCATGACCAGCCCTCTTGTTACCTGGGTTAAGACATTTGGACCGTTAGCTGGAGGAAATGGAACCAACTTGGAGGAATATGTTGCGCTTGTGGACGGAGTTTTCCTGAATGAAGTCATGCTGCAAATCAACCCCAAAGCTACCAGTCAGAGAGTAAATAAGAAAGTCAACAATGATGCATCCCTGAGAATTCAAAATTTGTCTGTTTTGGTGAGGCAGGTTAAATCGTACTATCAGGAGACTTTACAGCAGTTGATTATGATGCCTTTGCCAAATGTCTTAATAATTGGCAAAAACCCCTTTTCAGAACAAGGTACTGAAGAAGTAAAAAAGCTACTTCTACTCCTGCTTGGCTGTGCAGTTCAGTGTCAGAAGAAAGAAGAATTCATTGAAAGAATCCAGAGTTTAGACTTTGATATAAGAGCAGCTGTTGCAGCCCACATACAAGAGGTGACACACAACCAGGAAAATGTTTTTGATCTGCAGTGGATGGAAGATGGTGCTCTCTCACAAGAGTATATTGAACCCCTCCTAAAAAATATGGCATTGCATTTAAAAAAACTTATAGATGAACGAGATGAGCATTCTGAGACTATTATAGAGCTCTCTGAAGAACGAGACTCTCTCCATTTTCTACCTCATGCTTCAG
TGGCACAATCGCCTTGTGGATCTCCAGGCATGAAACGTACTGAAAGCAGACAGCATTTATCAGTAGAGCTAGCAGATGCCAAAGCAAAGATCAGAAGACTTAGACAAGAGCTTGAGGAAAAGACAGAACAGTTGCTGGATTGTAAACAAGAACTGGAGCAGATGGAAGTTGAGTTGAAGAGACTACAGCAAGAGAATATGAATTTGCTTTCGGATGCACGCTCTGCTAGAGTGTACCGTGATGAACTAGATGCTCTCAGGGAGAAGGCAATCCGTGTCGACAAGCTTGAAAGTGAAGTCAGCAGATATAAAGAGAGGCTACATGACATTGAATTCTACAGAGCTAGAGTGGAGGAACTCAAAGAAGATAATCAAGTATTGCTGGAAACAAAAACAATGTTGGAAGATCAACTGGAGGGGACCCGGGCTCGTTCAGATAAATTACATGAATTGGAGAAGGAGAATCTACAGTTAAAAGCTAAACTGCATGATATGGAGATGGAACGTGACATGGATCGGAAGAAAATTGAGGAACTTATGGAAGAAAACATGACTCTAGAAATGGCTCAGAAGCAAAGTATGGATGAGTCACTGCATCTTGGATGGGAACTTGAACAAATAAACAGATCCACTGAACTATCTGAAGTGCCACGAAAATCACTGGGGCATGAAGTGAATGAACTGGCATCGAGTAGGTTACTGAAACTGGAAATGGAAAACCAAAGTTTGATAAAGACTGTGGAAAAGCTACAAAGTACAATGGGATCTGCAGAAGGCAGTAATTCAAAACTTCTGAAAATGGAAAAGGAAAACCTGAGACTTAGTAAAAAGCTGCAAGGACTTGAGAATGAATTTAGCGAAGAGAAGCAAAGTCTTCAGAATAGTCAAAATCTAAGCAAAGATCTGATGAAAGAGAAAGCACAGCTTGAAAAGACAATTGAAACTCTGCGAGAAAACTCAGAGAGACAGATTAAAACATTGGAACAGGAGAATGAGCATTTGAATCAAACAGTGGCTTCCCTCAGACAGCGCTCTCAAATCAGTGCTGAAGCAAGAGTCAAAGATATTGAAAAGGAGAATAAAATTCTTCATGAATCTATCAAAGAAACAAGCAGTAAATTAAATAAGTTAGAATTTGAAAAGAAGCAAATTAAAAAAGAATTGGAACACTATAAAGAGAAGGGAGAGAGGGCAGATGAGCTGGAAAAAGAAGTACAACATCTTGAAAAAGAAAACGAGCTGCTACAGAAAAAGGTTACTAACTTAAAGATCACTTGTGAAAAAATAGATACTTTAGAGCAAGAAAACTCCAATCTGGATATGGAAAACAGAAAGCTGAAAAAGACCTTAGATAGCCGGAAAAACCTCAGCTTTCAGCTAGAATCTTTAGAGAAAGAGAATACACAACTTGATGAAGAAAATTTAGAACTCAGAAGAACAGTTGAATCTTTGAAGAGCATAAACATCAAAATGGCTCAGTTACAATTAGAAAACAAAGAATTGGAAAGTGAGAAAGAGCAGCTTCAGAAGAGCTTGGAGCTTATGAAAACATCTTTTAAGAAGACTGAACGTTTAGAAGTCAGTTACCAAGGTCTGGATACGGAAAACCAAAGGCTGCAGAAAGCCCTAGAAAACAGCAACAAAAAGATTCAGCATTTAGAAAGCGAACTACAAGATCTAGAGACAGAAAATCAAACCTTGCAAAAAAATTTAGAAGAACTCAAAATTTCTAGTAAACGCTTGGAACAGTTGGAGAAAGAAAACAAACTTTTGGAGCAAGAAACCTCTCAATTGGAGAAAGATAAAAAGCAACTGGAGAAAGAGAACAAGAGACTGCGGCAACAAGCAGATATTAAAGACAGCACTTTAGAAGAAAACAACGCAAAAATCTGTAACTTGGAAAAAGAGAACAAGTCTCTCATTAAGGAAATTGGTCTATGTAAAGAAGCTTCTATTCGACTAAAAGAAGCTGAAAAAGAGAATAAAGAACTTGTAAAGCGA
GCCACCATTGACAAGAAAACGCTTGTCACATTGCGAGAGGATTTGGTGAATGAAAAGCTGAAGACGCAGCAGATGAATAATGATTTAGAGAAGCTTACACACGAACTTGAAAAGATTGGTTTGAATAAGGAGCGCCTTTTGCATGATGAGCAGAGTAGTGATGACAGTAAATACAAACTGTTAGAGTCAAGGTTGGAATCCACATTGAAGAAATCGCTTGAAATAAAAGAAGAAAAAATTGCTGCTTTGGAAGCTCGACTAGAAGAATCAACAAATTTAAACCAACAGCTGCGCCAGGAACTTAAAACAGTTAAAAAGAACTATGAAGCACTCAAACAGAGACAAGAGGAGGAGAAAATGGTACAGAACTGTTCCCCAAGAACTGGAGAAGAATCTCAGTCGGTTAATAAGTGGGAGAGAGAAAGTCAGGAAACTACTAGAGAACTTTTGAAGATTAAAGATAGATTAATTGAAATTGAGAGAAATAATGCAACACTGCAGGCAGAGAAGCAAGCTCTGAAAACACAACTAAAGCAACTTGAGACACAGAACAATAATCTGCAGGCTCAGATTTTGGCTCTTCAGAGACAAACAGTTTCCTTACAAGAACAAAATACAACTTTACAAACTCAGAATGCCAAGCTTCAGGTAGAAAATTCAGCTATTAATTCACAAAGTACATCTCTTATGAATCAAAATGCACAGCTGCTGATCCAACAGTCTGCCTTAGAAAATGAAAATGAATCTATAATCAAAGAACGGGAGGAACTGAAATCACTGTATGATTCACTAGTCAGAGATCATGAAAAACTGGAACAGCTTCATGAACGGCAGGCTGCAGAATATGAATTATTAATTTCCAAGCATGGAAACCTTAAGTCAATGCACAAAAATCTTGAAATGGAACATAAGGACTTAGAAGACAGATATAATCAGCTGCTGAAACAAAAAGTGCAATTAGAAGAATTTGAGAAAGTTCTCAAAGCAGAACAAGAGAAGATGGTACAGCAGAACAAAATGCATGAAACTGTAGCTGCAGAATACAAAAAGCTTTGTGAGGAAAATGGCAGGTTAAATCATACATATACCCAACTTTTGAGAGAGAATGAAGGTCTCCAAGTGGATCATAAGAATTTGAAAACACTTCTGAACAGTTCTAAACTGGAACAAACAAGATTAGAAGCTGACTTTTCCAAGCTCAAAGAACAGTACCAACAACTGGACATTAAGCATACAAAATTGAATAATCAGTGTGAGTTGCTTAGCCAATTAAAAGGAAACTTGGAGGAAGAAAACAGGCATTTGTTGGATCAAATCCAAACATTAATGCTGCAAAATAGAACACTATTGGAGCAGAATATGGAAAGTAAAGATCTCTTCCATGTTGAACAGAGACAGTATATAGACAAGCTAAATGAATTAAGAAGACAAAAAGAGAAACTGGAAGAAAAGATTATGGATCAGTATAAGTTTTATGAACCGTCACCACCAAGAAGGAGGGGTAATTGGATTACTCTGAAAATGAGGAAGTTGATAAAATCTAAGAAGGATGTTAACCGAGAACGACTCAAGTCTCTTACTCTGACACCCACCCGCTCCGAGTCAAGTGAAGGATTTCTTCAGCTGCCCCATCAGGACAGTCAAGATAGCTCTTCGGTGGGCTCAAACTCACTTGAGGATGGTCAGACTGTGGGGGCCAAAAAAAGCAGCACCATGAATGACCTGGTGCAGTCCATGGTCCTAGCAGGAGGACAATGGCCAGGTAGTTCTGAGCACCTGGAGGGTCCTGATGATATATCTACGGGTAAAAGGAGAAAAGAATTGGGATCTATGGCCTTCTCTACTACATCCATCAACTTTGCAACTGCCAACTCTGCTGCAGGCTTGAGATCCAAGCAGTTGCTTAATAATAAAGATGCTACATCTTTTGAAGATGTAAGTCCACAAGGAATTAGTGATGATTCTAGTACTGGATCAAGAATTCATGCTTCCAGACCAGC
CAGCCTTGATAGTGGCAGAACATCCACTAGCAATAGCAATAATAATGCCTCACTCCATGAAATCAAAGCAGGTGCAGTTAATAATCAAAGCAGGCCACAAAGCCACAGCAGTGGAGAATTTAGCCTTCTTCATGATCACGAAGCATGGTCCAGCAGCAGCAGCAGTCCTGTCCAGTATCTGAAAAGCCACACCAAGTCTAGTCCGATACTCCATCATAGACTGTCAGAAACCCTGGACAGACAAGGAACGTGGAAAATTAAGACCGACTCTCCTGGCAGTGAAGTGGTTTCCCTGCAGCAGTTTTTAGAAGAAAGTAATAAGGTTATTTCAACTGAGATCAAATCCTCAAGCCAAGAGAATCTTCTGGATGAAGTAATGAAAATTTTCTCTGAAAATGCTGAATTAGCTGGAAGAGATAAACCAAGAAAACACTCAACAGTCAGCAGTGGTATCGCCAGATCACAGAGTGTAAAAAACACATATGAATTCTCTGATGGAAAATTAGCTAGCCAAGATCACCTTGCAAGGTCCAGTACATATAGAGTGGAAGAGCCCAACTTCTTGAACTCTTCAAAAACACTTACAACAGGGACTAGAGGCAAGACCAAGTCTGTTAAGGAAAATATACAAATGAGCCAATCACGACAATCAAAAGATTGTAATCCTTATGCTACTTTACCTCGTGCAAGCAGTGTGATTTCTACAGCTGAAGGAACTACTCGGAGAACAAGCATCCATGACTTTTTATCTAAAGACCCTAGACAGCCAGTATCCATTGATCCATCTCCACCTACAGTTGACAGAAGCGTCCCATCAGCTTCTAGTGAGTACGGTCCTCCAGAACAGTCCTCTTGTGTTTTTCATTATAAACCTTTTACTGCAGTTACCCTGTCAGAAAATGATTTAGGCAGTATAGCTATGTTAGGTTATTCTGCTCATAAATCAGAAGAGCAGAATGTAAAGACTAGTGAGACAAATTTTAATGCTAAAACACTTTCTTATAGTGACATGTACAGTGAAAAGGTAGGCCCATCAATAAGCAGTGTAGGGAAATTCTCTCTCGCCTGTTTATCCATGCCATTTTTGACACTTAATACTGAATTAGTCAGTAGTGTAAGTGGATTGCCTCAAAGGCCTGTATCAAAAGCAACCAGCACAACTTCTGGATCATCAGTGAAAGCTGCACAGAAGGATCATAAGCTACCTTCTGAGAATCAGAGATCTGATGACAGAAATTTAGAAGTGACTCAGAACAGGAGTGAATATACTGTTGTTGCACATGTAAACATTAATGAGAGTAAATCCCCATTACCAGTTTCTGACGATACCCAAACTATTTGGTATGAATATGGCTGTGTGTGACTAAATAAAGATTAAATATATTCTCCCA\n>XM_002842962.1 Microsporum canis CBS 113480 conserved hypothetical protein (MCYG_08091), partial mRNA 
\nATGTCGGCGCCAAATCGACGTGGTGATGGGCAGACACCGCTAAACTCAGCTGGACCCAGCTCCAGTCCAGCCAAAACACCCTACAATGCGCTATTCAGATTATCGAGACTAGTGGCAGCGCCTTCGACTCCGGCACAGCAGAATGCTACCTCGTTCAACTCAAACAGACCGTCAGCGTCTCGGGCTGGCCGCCGGAAATCAGGGATGACGCCGTCACGGACAAGAGGCGGAGGTGAACATATACCAGTGACTCCGCATACGATAAGGGCATTCCAGAGACGTGCAGCAACATATACTCCGGGGCGGGATAGACGGAAGAGTCAGCGCTTCAAGCGGGAGACGCCAATGGATATTTTGAAAAACCTGGGGAAAGCTCTTGCGCCAATATCAAAACCGGTATCGTCTTCTCCGCAGACCGAACTAGAGGACGAGCCGGAGCCCCCAGTGGACGAAATTGAAGAATTAGACAGGGAGCCTCCCATTCCACCACCGAGACTTTCACTCCCGCTTAATGAGATGACTGTGGTCCAGGAGGACGATAACAGTCCCGAGATACCCCCTCCAAAACTGTCTCTCCTCCCAGAGGATGAGGACATTACGAGAGGGTCGATTGAATTGCCCCGGAGAGAGCGGTCAGGTCGAGATCTGGCCAGGCTGTCGAGAGTAAGCTTCGCCAGTAATCGTTTCAGTGATCATTTTGGGGACACCACGAACCTTGAAGATCCGGCAGAGGCATTGGACTTTCGTGTTGGACCAGAAGAGGACTTTGATGAGGATGTTGACAATACGACCGGACAACCGATGTTGGATGCAGGGGGAGAAACCGAGGATTTGGGCCGATTTAACCTCGATTTTGCCTTCCCAACGCCTGAAGCGCCTCATACTATGCCAATAGAGAATGATAATGAGCAGGACACCTTCGAGTTAGATGCAGTGCCACCCGAATTCGGTGGACCAGACAGTCCTTCATCAGGAAGCGATTTCGGGACAGCAGGATTCGAACCAGCCATGACCGATAGGTCGTCTAATCGGGGAGTCGTAGAGGAAGAAGAGGAGGAGGAGCAGGAGCAGCAACAGGAAGACCAGCCTGAGCCACCGCAGAAGAAACAAAAGCTGTCTAAACATGGGATACCGGTCCCAAGTCTGCCTTCTGGAGTCGTAAAGAAGCTGGCCATGCGGTTTGCAAGGTCCGGGAATAAAAAGACGAGAATCAACAAGGATACGATGGCGGCCATCCAGCAGGCAACGGATTGGTTCTTCGAACAAGCGAGCGGGGATTTGTCGACATATTCCAAACACTCTGGCCGAAAAACAATTGATGAAACAGATGTCATCGCACTGATGAGAAGGTAG\n>JX319470.1 Uncultured fungus clone 034A1751 18S ribosomal RNA gene, partial sequence; internal transcribed spacer 1, complete sequence; and 5.8S ribosomal RNA gene, partial sequence \nAAAAAAAGCTTGGTCATTTAGAGGAAGTAAAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTACAGAGTTCATGCCCTTACGGGTAGACCTCCCACCCTTGAATACTATACCTCTTGTTGCTTTGGCGGGCCGCTCCGGCTACCGGCTCCGGCTGGTGAGTGCCCGCCAAGGGACCTAAACTCTTGAATTATTGTGTCGTCTGAGTACTATATAATAGTTAAAACTTTCAACAACGGATCTCTTGGTTCTGGCATCGATGAAGAACGCAGCGAAATGCGATAAGTAATGTGAATTGCAGAATTTAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCCTTGGTATTCCGAGGGGCATGCCTGTTCGAGCGTCATTAT\n>XM_040766144.1 Sporothrix brasiliensis 5110 uncharacterized 
protein (SPBR_07890), partial mRNA \nATGGTCATTGAGACCAGCGGCAAGCTGCTGAAGGGGTATGATGACAAAGGGTACAGCCGAGCCTTCAACCGATTGTTTACAAAGGCCCCGGCAAACGCCGGGTACAACGACGGCTTGTCGGCCCCGCAGCCCGACTTCGTAGAGGGCCTCGAGAAACAAGAGTTCCGCCCGTTCCAGGCCGCCGACTATATCCCTGGAGCCACTCTTTATAAGGACGACCCCCGTTCCATAACCCTACCGATGATTGCTGGAGAATGGAAGGGCCCTGCTGGGGACATGAGAGAAACGAGAGTGCAGAGTGCCTACGACGGAGCAGCTCTTGTCCACGCAAGAAACCAAGCACTCGCCTACATGGGAGGGTCTGATCCCCCAGGCCACGCAGAAGTCACAACATTCACCGCAGACGGCACCAATCTCAACCTGACGGACGGAGACGTCTCAGGAACGCCCAAGACTATGCGAAGACTCAGTCCGAAGAACTAA\n>L38765.1 Pisolithus tinctorius (F00031) mRNA, EST0038 \nCGGCTAGCTGCTTTTAACTGAAGTATTGCAGCATGTAAGTTGTGGTTTATAAAGTCTTTCGCCATGCGAGGAACAAGTCGACAAATTTGATGAGCTTATTCATCTTATTTGTGTATGTTACCACACAATGATTCCCTTCTTTAATTGAAGTATTTGAG\n>XM_018671993.2 PREDICTED: Lates calcarifer inhibitor of growth family, member 1 (LOC108880464), transcript variant X1, mRNA \nTCAATACACAGTCAGTGAGATGAAGGAACAAACCCGTCAGTGCCAAAGCAATGGGGACTCTGTAAATGGTGCAAGTGACTGGGTGTCCTGTGATAAAGACGAATTCGCAATGTTGAACCCCACCAATGGTGATCCAGGACATGTTGTCGTCAATTATGTGGAGGAGTATTTGGACCTCGTGGAATCACTACCTTTTGACCTACAGAGGAGTGTGTCTCTCATGAAGGAAATTGATGCCAAGTATCAAGATATTCTGAAGGAGCTTGATGACGCTTATGAACGTTATCGGCGGGAATCTGACTCACTTCAGAGGCGCAAGCTTCAGTCATCGATTCAGAGGGCGCTGATCCGCAGTCAAGAGCTTGGTGATGAAAAGATCCAGATAGCTGGTCAAATGGTGGAGTTGGTTGAGAACCGAACACGACAGTTAGACTGGCATTCTGAACTTCTCCTCTCCTCTCAAGAAGTCCCTGAGAGCCACGTTCCTACAGCAGCATCCATGACCACCACTGCAGCATCCTTGATGTCCTCATCATCAGCCACAATCACTCCAGGGAAACCTGGCCACCATGACAAGAAGCGTGATGAGGTAACCCCAGGCTCAGGTGGTGCAGACAAGGCTGGAGGGAAACGCTCAAGACGTCAGAAAAATGGAGAAAATCGGGAAAGTTATGGGGGTCTGGATCACACAGAGGAAGTGGGAGTGGGGGCGTCGCGGGAAAAACGTGCCAAAACATCTTCCAAGAAGAAGAAACGGTCAAAAGGAAAGTCTGAGAGAGAAGTGTCACCTCCAGACCTGCCCATTGATCCAGATGAGCCAACGTACTGCCTGTGTGAGCAGGTGTCCTATGGCGAAATGATAGGCTGTGATAACGATGAGTGTCCCATTGAGTGGTTTCATTTCTCCTGTGTTGGCCTCCATCATAAGCCAAAGGGAAAATGGTACTGCCCTAAGTGCAGAGGTGAGAATGAGAAGACCATGGACAAGGCCTTAGAAAGGGCCAAGAAGGAGAGGGCATACAACAGGTAGCTCGCGCTGCCTGGCCAAACGAACACTACTGCAGAGAAATTTAATTTTCTGTCTTGTCTTTGTTTCCATTTACTATTAACAGTGTTCAAAAAGAGTAATGAGTT
GATGAGAGGGATCTTGTACATAGTTATTTTTGTAACTGCTGCATAGCCGAGAAACAAGATCACTCCCTCCCCCATTGGGATTATTTGTAATTGACACAGTACAGCACAGTACAACCTGCATGTTTGTAACCAGCTGTCCTCCACTCACATCCCCCATGTTTTCATCATGCATGCAACATCACCCACTCCACTATATATGCTCAATTAACAAATAAAATATTTCTAAACAAGGAAGAA\n>XM_046503406.2 PREDICTED: Haliotis rufescens thymidine kinase, cytosolic-like (LOC124137211), transcript variant X3, mRNA \nGTCTAGTCCCTGAAGTGGTGTGAAAACCCGTAAACCATTTATGTGTACCTTATTTAATTAACCTCGGGCGACAAGCGAACTCGTGCACATTTCTGTGTTCCGTGTTGCTGCCAGTCGCATGTTCGCCTAATTTAGAACCTCAGTGGGCGTGATCCGGGGCGGAGCATAGCGATGTCAGTGGATCACACTTGTTAGAGCTTTAGACTAACTGTGATTATTATGGAACAAGCACGTTTCGCTACATCTATAACATATATCAATATGATGTCTACAAATCACCTGATCCCTTCACCAACGGCAGTTACCAGCCACAGAGGGCATATTCAGATAATCTTTGGACCCATGTTCTCCGGCAAAACCACAGAATTAATGAGATTAATGAAGAGATACCAGGTAGCTAACCACTCCTGTCTCATAGTGAAGTACGCCAAAGACACCCGCTACGACAATCATGGCATCGCTACACACGACAGAACAGTGTTGTCTGCCACTGCTGCCCATGAGCTGATGTCTCTCATACCTGAGGCGCTGAAGTATGACGTCATAGGCATTGACGAGGGACAGTTCTTTCCTGACGTGGTGGTTTTTGCTGATACAATGGCAGAGAAGGGGAAAGTTGTCATAGTAGCAGCACTAGACGCGACATTCCAGAAGAAGGTGGAGGTGATCGGGGGCAAAGACAAATATCTAGCGGTGTGTCGTGCATGCTTCCGAGGGAACAGTTTTCACCAACAAACCAACACCACGACTGAGTAGTCCACGCCTCTATCGATCAGCCGTGTCTGTGTGGTGGAAGAAAAGGTGTCTGTGATTTTTGTCTGAGACAAAACAGTTATTTTAATGTCTTCCTTTTAGTATTCATCATACAGCTCAGCAGACATATATTTCACAAAGAACATTGTCCGGGCAAGCATGCCACTGTGATGTAGTCAAAGGGCATATTATGTATTACACAGAATAATATTCATATTTTTTAATATTTAAACAAGACTTGTATACATACAGACCTAGAAACTATTTGTTATTAAAGTATGTCAGTAAATTGCATTGACCATTTCTTCTCAAACTTTGCAACAACAGATATTAAGTAGTTTAGGAACGGCCATAATATATTCTAGGTTAGGCTGTTGTTTTAGTTTAAGTTATTTTATAGCGCTTCAAAACGTTATCCGAGCATTCAGAAGTCATGCTGGATTCTACACACTAAAAACCCCACTGTACTCAGTGATCTGTGATCTGTTTGAAGCTCGCGTACAACCAAAATATTTTTCTTCTCAAGATGTTGTTATGTTTGCTGCTATGTTACACTGCACGAACTTGTTCCTTTGACATTAATCGACTTGGGTGCCATTTAGCTGTTATTGCTATGGTTATATGCTAGGAATCTTCATCATGAGATAACAGGTTTATTATATACTTCAGTGTGAAAGACTGAGTTTTCTGAAGTTGAAAAAAGTGATATTTTCATTGCAGTGAACATAACACTTGATATTTCACTGCGGTGAACATAACACCTGATATTTCACTGCAGTGAACATAACATGTTGACGGAACTATGTTGGCCTACACGAGACAGCTCGTACACAAACTGTTGATTTACGTCAGTTCAACGTTGACAAGTCATATAATGACAGAT
GGTCATTTATGTAGTTAATACCGATTCTTATCGTTTGTTTATTTTGTTGAAAATGAATTGTATTAAACTGTGAATTTCTCTTCTGA\n>XM_040439057.1 PREDICTED: Bufo bufo zinc finger MYND-type containing 8 (ZMYND8), transcript variant X7, mRNA \nTCAAAAGATCTGACAGCCCCCGTGCTCCTCCTGTGTCCCGGGAAGGCCCTCTCTGGTTCCTAGTGTCACCGTTCTCATTGCTCCTTGCACTTTACCTGGATTCTCTGCTCCACAGCTCAGGGACAGGTCTCACAGGATGGCTCCTGCCTGCAAGAGCTGTACAAAGATAATCACTCAGGAAGTGGCTCAGCCAATGGCCTGAAGCATTACATGTGGATTCCCGAAAGCCTCCAATCCTGCCCCAGCTTGCAACAGGGGAGTCTGATCATCAGGCTGAAGTGCCAAGCCCTTTCTGTCTGAGAACTGAGAGTCTGTCCTCCATGTTTTATAAGTATTGACATATAACACTGTAACAATGCATCCACACAGGTAAGCCAGAGCTTGTCTTTTTTTGTAGTTTATTCCCATCTCTTGGACACTGTGCTTTTGCAGGTTGCATTTCCGCGACTTCTCGGGCCAAATTCGCTAAACCAGCAAGTGTTTTGAATTTTGACTTTCTGGAGAGATCACATGGTTGGGTGCCATTAGCCAGTGACTGCTGCTGGGGGTTCCAGGGGTACACTGCACAATTAACTTTTTTGTTTTGTAAAGAGTGGTGGGTTTCTGCACAGCCCCCTTCACTCCCCTGTTCACCAAGGAAGATCTCTGCATTATTGTGTATTCCTGTGTCACATGCTGCTCAGAGGAACATGGAGGCTGCCTCAGCACAAGGCTTCAGCTGACGTACAGGCCACCAAGCAAAGCACACTTTATTCACCCTCTATCTAAAGGACAAGAGCCAGACTAACCCAGGACTGTTACTTTTGATACCGACCACAGAGACTCTCAGCATTTATGCCTGACATACGTCTGGGGCCTAGCTTTGGATTTTTCAAATACCACCATATCTGAAGCCTTTCTCCGGTTTACTTGGTGCCCTGTGGACCCGGCACAGTGTGCGTGTACATGATTTTTCTTGCTTTTTACCCATATATTGTTTTTTGAGATTTTTTTATTTTTTATGTTCTGGATATATGATTTCCTGAGGCTGGGAGCTAACCAATATGGATGTCAAACATTTGGCAGAGGAGGAAGTGAAGATTGAGCCGGAGCTGGTGGAGGGGATGGATGTCACCACTCGATCCAAAGGTCCTGCTGTTGCATATCCAGAGGGATTATCGCAAGAACATGGAGACAGTCAGCAGTCCAACCCAGGCTCAGGGCAGAAAAGGAAGATTTCCAGCCCTCAGCACTCATCCAATGGGCACTCTCCTCAAGATGTATCCGGCAGCCCAAGTAAAAAGAAGAAGAAACCAGGAATGTTGAACAGTCACAACAAAGACCAGTCAGAGCTAAGACATGGTCCGTTTTACTATATGAAGCAGCCACTCACCACAGACCCTGTTGATGTTGTACCGCAGGACGGCCGCAATGACTTCTACTGCTGGGTTTGTCACCGGGAAGGTCAAGTCCTATGCTGTGAGCTCTGCCCCAGAGTTTATCATGCTAAGTGTCTGAAACTGACTGCTGAGCCTGAGGGTGACTGGTTTTGTCCTGAGTGTGAGAAAATCACAGTTGCAGAATGCATAGAGACACAGAGTAAAGCAATGACTATGTTGACCATAGAGCAGCTTTCGTACCTGCTGAAATTTGCTCTCCAGAAGATGAAACAGCCGGGGACAGAACCCTTCCAGAAGCCGGTGTCATTGGAGCAGCATCCTGATTATGCAGAATATATATTTAATCCTATGGATCTCAGTACGCTAGAAAAGAATGTTAAAAAGAAAATGTATGGTTGCACAGAAGCCTTCTTGGCAGATG
CCAAATGGATATTGCATAACTGCATTATATACAATGGGGGAAATCACAAATTAACACAAACTGCAAAAGTAATAATCAAGATATGTGAACATGAGATGAATGAAATTGAAGTCTGCCCTGAATGTTATTTAGCTGCTTGCCAAAAAAGAGATAATTGGTTTTGTGAACCGTGTAGCAATCCGCACCCTCTGGTCTGGGCTAAATTAAAAGGATTTCCCTTCTGGCCTGCTAAAGCTCTGAGAGATAAAGATGGACAGGTGGACGCCCGCTTCTTTGGACAGCATGACAGGGCATGGGTTCCAATGAACAATTGCTACCTCATGTCAAAAGAAATCCCTTTTTCTGTAAAGAAGACGAAGAGCATCTTCAACAGTGCCATGCAGGAGATGGAGGTGTATGTGGAAAACATTCGCAAAAGGTTTGGTGTATTTAATTACGCTCCCTTTCGGACACCTTACACACCCAACAACCAGTACCAAATGCTGCTTGACACTACCAATCCAAGTGCTGGTACTGCCAAGACAGACAAACAGGAAAAGATCAAGCTGAACTTTGACATGACTGCATCTCCGAAGATCCTGATGAGCAAACCCATATTAAGCAGCAGTGGAGGCCGACGGATTTCATTAACAGACATGCCACGGTCCCCAATGAGCACAAACTCCTCTGTGCACACAGGCTCAGATGTAGAACCAGACGCTGAGAAGAAAGCAGTGTCCAGCCACTACAGTGCAAGTGAAGAGTCCATGGACTTTATAGATAAGAGTACAGCTTCTCCTGTATCCATAAAGACCGGACATGGTGGCAGTATATCAGGCAGCCCCAAACCTTTCTCACCACAATCCTCTACACCAGTAAAATGTAAGACGGAGAGGAACACAAGCACAGGCAGCATCCTCAACCTCAATCTTGACCGCAGTAAAGCGGAAATGGACTTGAAGGAGCTGAGTGAGTCTGTGCTTCAGCAGTCCACGGCAACCCCACTCATCTCTCCCAAAAGGCAGATCCGCAGCCGATTCCAGCTCAATCTGGACAAAACCATTGAGAGCTGCAAAGCCCAATTAGGAATTAACGAGATTCCGGATGATCCTGATGCCACAGTGGAACACAGTGATTCTGAGGAGTCAGAGAAGACAGATTCTAGTGACAGTGAGTATGGGAGCGACGATGAGCCGAAGTCAAAAAATGATGAGGAAGAAAAGGAAAGTGTGAAGGAAAAGGAACTCCCTCCATCTTCAGTAAAGAAAAAATCCAAGCCCTCAATCCAAATAGAGGCAAAGGATGAATCCAAGAGTGCAACAGCGACAACAGATAAAGCGGATGCAGGGGGTAAGGATAAGCTGGCATCCACTGTAGAGAAGGATGTTCCTGACAAAGGTAAACCCCTGACGCACTCTGCAAAGGAAAAAGTGAAGGGAAAGGATGATACAGACTCTCCTACTGTACACCTTGGACTGGACTCTGACTCTGAGAGCGAACTGGTCATTGACTTGGGTGAAGATCATTCGGGGCGAGAAGGACGTAAAGCCAAAAAGGATGCTAAAATAACAGCAACAAAACACCCAGAAATAAAATCCCCAACCACAGCCAGTGTCAGCAGTCTGCCAGCAGTTGACACCCCTATCATGACCCGCTCTGCATCCCAGGCTGCCCCTGCTGTAGGGGTAACAGTGACTACAAGTTCAGCATCAGCTGCAAGCACTCCGACGGCAGCTACTGGCAGCCCAGTGAAGAAGCAGAGACCTCTGCTCCCCAAGGAGACAGTTCCCACCGTGCAGAGAGTGGTGTGGAATTCTTCCAGTAAGTTTCAGACCTCATCCCAGAAATGGCACATGCAGAAAGTTCAAAGGCAACAGCAGCAGCAACAACAGCAGCAGCAACAGCCGAGCACGCCTGCGCCGTCACAGTCTCCACAAGGGACGAGATACCAGACACGGCAGGCTGTGAAAGCGGTGCAGCAAAAAGAAGTCACACAAGCCACATCCACCTCCACCATAACC
CTTGTGACCACCGCCCCACCACTAGCCATGGTGACCAGCCCAGGACAGCCACTGACCACATCAATCACCAGTGACCTGCCCATCGCTACCGCCTCAGCTGATGTTGCTGCTGACATTGCCAAATACACCAGCAAGATGATGGAGGCAATTAAAGGCACAATGACTGAGATATACAACGACTTGTCTAAGAATACCACGGGGAATACCATAGCGGAGATTCGACGCTTACGAATAGAGATTGAAAAACTGCAGTGGCTTCATCAGCAGGAGCTGTCTGAAATGAAGCATAATTTAGAACTAACCATGGCAGAGATGAGGCAGAGTCTGGAGCAGGAGAGGGACCGGCTGATTGCAGAGGTGAAGAAACAAACTGAGCTGGAAAAGCAGCAAGCAGTGGATGAGACCAAGAAGAAGCAGTGGTGTGCCAATTGCAAGAAGGAGGCCATTTTCTACTGTTGCTGGAACACCAGCTACTGTGATTACCCGTGCCAGCAGGCGCACTGGCCCGAGCACATGAAGTCCTGCACGCAGTCAGCCTCTGCTACACAGCAGGAAGCTGACCCTGACCTCAGCACGGATAAAACGGCACAAGCAACAACAGGTACCCAGCCACAGCCTGCTGAAACCACCACAACGCCGAAAGAGAAGGATGGCACAGCTGATAAGAGCAAAGAGAGTGTCACTACCATCCCTGTGGTTGTAAGCCCCAGTGCCGGAGCGGTGGCGATGAGAGCCGGTGTTCAGTATGTGCAGACCACCATGCCGGTCCAGGTGAGAAGAGTGTGACCTGTAAGCATTAAAAACAGCAAGACAATACAGAAACACTACATTGTGCGTGTCCGGAGCCAGCGCCTCGTCCTGTATGTAAATAATGTACAATCTGTGGATGTGATTAAGAGTAGAACCATCTTTTTATATTTGTATTCACTTTAACTTATGAACGTTTATCCGGAGCCACGACATTAAAACACCGATTATGACAGATACTGCTGAAATCCTGCTATCTCGCAGAACGGATGGATGCCAAGGTGTAGATAAAGCAGATTACTCTTGTATCAGTATAATCAGTGTACAAAGGAGCAGTGAATGATACAAGCGTCTATGTGAATAATCACAGCTAATGCCGCATTCATGGCAAGAGGCAGCGGCATTCAATCAAACATTAACCCTAGTGTGGGATCGTCCCGCAGGAACAACCCTAATAACCGGAGAGGAAAACGAAGCACCATATTTATCTGTGGACAACGTTGCAAAAAATATATGGTGGCGCCTTCAGTCTGTTACATTGCCACCACAGATTCACTTTGTATCTTATGTAAAATCACTGCTGATGTCTGTATATGAGGACCCTCTGTATAAAATCATTCCAGTGCCACGCGTTGTACATTTATCACACTGTTGATTTTTCACCATTGTTAATAACGGAGATAGTGTGTACAGTAACCAATGGCGAATACAAGATGGAAGCAAGGCGCCATCAACCCTGAGCGAGAGGCAATATCAGTGGCAAGCGGTTTGAAATGCGGGACTGGCCAGCTTTCCCTTGTGAAACATAATTGCTTTTAGCATATGGAAGTATTTTTTCACATTTTCTTTGTATAAAATTTGTATTAAATTCAAACATTTCTTTTT\n>XM_027968038.2 PREDICTED: Ovis aries RAD52 homolog, DNA repair protein (RAD52), transcript variant X6, mRNA 
\nAGCGAGTTTCTGCGCGTTCAGTCTGAACAGAGCCCTGTCCGCTCTGCGCGGCTGAGGCGCTACCAGTACACAGTGGAAGAACACCAGGCCATCCAGAACGCCCTGAGGCAGAGGCTGGGCCCAGAGTACATCAGTAGCCGCATGGCTGGAGGAGGCCAGAAGGTGTGTTACATCGAGGGTCACAGGGTCATTAATCTGGCCAATGAGATGTTTGGCTACAATGGCTGGGCGCACTCCATCACTCAGCAGAACGTGGATTTTGTTGACCTTAACAATGGCAAGTTCTACGTGGGCGTCTGTGCGTTTGTGCGAGTCCAGCTGAAGGATGGCTCGTATCATGAAGATGTGGGCTATGGTGTCAGCGAAGGCCTTAAGTCAAAAGCCTTGTCCTTGGAAAAGGCCAGGAAGGAGGCAGTAACAGATGGGCTGAAGCGGGCGCTGAGAAGTTTTGGGAACGCACTCGGAAACTGTATTCTGGACAAAGACTATCTGAGGTCACTGAACAAGCTTCCACACCAGCCGCCTCTTGAAGTGGATTTAACTAACGCAAAGAGACAAGATTTTGAACCATCTGTTGAACAAGCCAGATACAGCAGCTGCCAGCAGAATGCGACCCTGGAGCCCCCTAAAACCCAGGAGGCGACCTCTCCATGCAGACGGAGCCACTTGGCTGGACCCCACACCGTGACGCAGGGGGCCACGGAGAGCAGCTCCCGAAGCCTGGCCCCCGGCACCGCGGAGAGTGAAGCCACGCTCCAGCGGAAGCTCCGGCAGCAGCAGCTGCAGCAGCAGTTCCGGAAACAGATGGAGAGACAGCAGCAGGCTGCCACCTCTGCTCTGTCCTCTGGAAGGACGGACCAGGCACAGCCGCCACCGGTGCCTCCTACCAAGCCCAGCCTCCCCAGGACCCGCTCACCTTCAGAGCCACTCACCCAGACAGACCTGCTCCCAGACAGTCTTGAAATGTGGGACATGGCTATGGATGCAGAGGACAGCGTGCTCAAGACCTTTTCGAAACCAGAACCACCGGAGACCCCTGCCATCTCGGTCCTGAAGAACCACATGGAGACCCAGAACAGGATCCCACCAAGCCTTTGCCACCAGAATCCACAGGCACAATCTGGACCCTGGCACCTCCAAACTTCCAGCCTTAACCAAGACACCACAGGGAATTGTGACTCCTCTAGGAAGAATCAGGACATGAAGAAAAGGAAACTGGACCCACCTTAACCACGGCTCAGGGCACCTCCTGAACTGTCCTGATGGGACTTCATTTTGGTCATGAAATGACTGGTCCTGCCTGAGGAGTGCACTCTGCCTCAGGGCTCTACCTGCTTCATCCTGAACTCTGCTGGGGGACTCAGCACCTGCTCACATCAAGTCGGGCATTTGGGAAGCTCTGTAGAGACTCGGTGCCTTTTCTTGGGCTCCTCACTCTTTATTCCTAAGCTATTGTGTTAATGAAGACAGAAATCACCTCAGCCTGTGGTGCGTTCCTGAGTGACCGCTGACCTCTTGCTGTGGGGGCCCCCCGTTATCTAACGCTGCCATGCAAGATTGCAGTCTTCATCACTATTGTTCATCGGCTCATGAAACTACTTCCCTTTTCTCCTAAGACCAAAGAAAAGGTATTTTTAAGAAAGCAAAATTAAATCCTACCCTGTAACAATGTAA\n>XM_028824534.2 PREDICTED: Erpetoichthys calabaricus F-box and WD repeat domain containing 8 (LOC114668659), mRNA 
\nCGCTTTTGGTGACGGAAAAGGCGGTGCATCACTTCTTGACTCCCCATCTGTTATGGATGTGCTGTAAATAAATATTTGCGGCGCCGTGCGCAATGGAGTTGGAACAATTCAGAGAGCAGTGGAAGAAAGAACTAGCGGTGCAGCGGAGTGCTATCGGTATCGGCCGGAAAGAGGCACGACGGTTTCAAGAAAGTACTCGTCCTGAGGTGTTGAAAACAAACAGAAAATTTAAACATGAGTCGGAGCTCGTTAATGAACAAACTACAGACGCAAAGACGGGAACGGTCTCGTTGCCCGACAGACCCCCGAAAAAGAGGTGGTACCCACACGGAGATCGACCGCAACATCTGCGGAAAGCGCCGCGGGAAGAGCGTTTGCTGGATCGGTTAATCCAAGACTTGAATGAAATTAATGAGATACCATTTTTTGACATGGATTTGCCATATGAATTAGCCCTGAAAATATTTCAGCATTTGAACACAACTGAGCTTGGAAGGTGTGCCCAGGTGAGTAAGGCTTGGAAGATACTTGCTGAAGATGAGCTGCTTTGGTACAGACACTGCCTGAAGGAAGGACATTTGATTGGGTCAAGTATATCAGACTCGCCCTGCTGGAAAAGTACCTTGCGTGATTGTCGGCAGATGGAACACACGATGCGGACTAATTGGAAGAACCGTGTCGGGGCCATCAGCCAGCTGCAGTATGAACTGGGAAAGGTGCTGTGTGATGTCAACTCATGTGCTGGACATGTTATAGCTGGGTACACTTCCGGAGATGTGAGGCTGTGGGACACTCAGAATTTGGATATTGGTTCGCCTTACCTGAGACCTAGCCATGTGTCCAGAGAAAGTGCCTTACGGCCACATGTCAGTCATGTCTGTGTGAATGAAAATGTGGCTGTGGCTGCCTATGAAGATGGCATCATAGATGTCTGGAGCATTGAAGCTGGCCGGGAACCCATCCACCATTATCAGCACCTGCAGCGGGTGCAGGCTTTGGCTTTGGGGGCTGAGGGGACCACTGTAGCCTCTGCCTCTGGTAAGCAGGTGCGAGTGGAACAGCCAGATGAGCAGGGCTACTGGCAGACAACAGCCCAGTTTGAGCTGGAGAAGTTGGTGGACTTTGCTCAAATCATTCCAGGAGTGCGTCCTCGGACACTGGCTGTTGTTGCTGCCTCTGACACAGTCTATCTCCTAGAGCCTGGCAAAGACCCCAGCATCCTTCACTGTGTGTACAGTCACCCAATAACCTGCCTTGACACCTCCTCCTCACAGGCTGCTGTGGGTGTGAAGAGCTTTGGGTGGGCAATGAATATGGGAAACAAGATTGATGTGTACAGCTGGGAGACTGGCCAGGCAGTTGTATCCTTGGGGTCATCCAGTGGAGATTTTACTTGTGTCAACTTGAAGGACAGTCCTCCAAATCTGCTGGTGTCTGGCAACAAAGACCGAAGAGTGCGGGTGTTTGATCTGAGGACAGCAAAGTCTGTCACATCTCTGTACGGCCATCACATGGGGGTTTCTGCGGTGCAGGCAGATGACTGGAAGATTGTAAGCGGTGGGGAGGAGGGTCTGCTCTGCGTCTGGGAAATGAGGATGGCAGCCAAGCTCTGGGAAATGCACAACAGGCACCCTGTTCGACATATCCACTTCCACACCCAGACCTTAGTAACAGCTAATATTCCAGACGAGAAGACTCCCAGGGGAGCATGCATCACCGATGATGACCTCACTGCACATCGACGGCACAGAGGGACCATCTACCTGTACGACTTTTCTGTGGACATGTCCAGCACCGATCACATCCTTCCTATCTGCCGCTCAAGTTACGCCGAGTCCCATGGTTATAACTACAACATTGGGCTGGCCGTTCCATATGATAACATCCTCGCCGCTTCTGTGGCGACCAGGCCACACGTGTCTTGAGCAAGACTAAAGACTGTCATGGAGGAGGAGGACGACATTTCTAATGGATCTGAGCACACATTTGAACACCTCT
TGTCATTTTCCAGAAGTGTTCCTTTTAATATTTATTTTTCAATATGTTAGTATGTTAACATTTTTAAAATCTTAAAAGACAGTTCACTGCACAGTGCAGATGTGTCATACACAGGGGACTTGGCACAGTTCAGGTTAAAGTGAAAGCTTCAGTGTGGAGTTGTGCAAGCAGGACGACGGGCTCTGTGATTCATTGATGGCTCTTGTCTTGCACGTCGATCATTTTCTCTTTAATTATTCCTGCAAGTTGAGGAGCTGAGAATCAGTTCTCACGTTAACTTACCCGTCAGCCTTGCTCTTGCACAGAGATTTGTGTATATTGTATATAAATTGTATCATACTCCAGTATTTTGCAATGTCCCTAATGATTTATTTATTTCTTGTAAACACGTAGTTCTGATGT\n>XM_045577126.1 PREDICTED: Pipistrellus kuhlii transient receptor potential cation channel subfamily M member 4 (TRPM4), transcript variant X6, mRNA \nTCCGGGCCGGCGGCCAGCCGGGAAGCGGCAGATCCGGTTTGTCCGGGGCGGACCTGAGGTCGGGGTGGCGGAGGGAATGCGGGGAGCCGGATAGGCGGCGGCGGCATGGCGGGCCCGAAAGAGCAGAGCTGGATCCCCAAAATCTTCAAGAAGAAGACATGCACCGCCTTCATCGTGGACCCCGCAGACCCGGGAGGGACCCTGTGCCAGTGCGGGCGCCCCCGGAGCGCACACCTGGCTGTGGCCGTGGAGGACGCGTTCGGGGCGGCCGTGGTGACCGAGTGGGACCGGGACCTGCACACCACGGAGAAGCCCACCGACGCCTTCGGGGACCTGGACTTCCTGGGCGCCGGCCGCAAGGCCAGCAACTTCCTCCGGCTCTCGGACCGCACGGACCCGGCCACGGTGTATAACCTGGTCACACGCACCTGGGGCTTCCGGGCCCCGAACCTGGTGGTGTCGGTGCTGGGGGGCTCGGGGGGCCCCGTGCTCCAGACCTGGCTGCAGGACCTGCTGCGCAGCGGGCTGGTGCGGGCCGCGCAGAGCACAGGGGCCTGGATCGTCACCGGGGGGCTGCACACGGGCATCGGCCGGCACGTCGGCGTCGCCGTGCGGGACCACCAGACGGCCAGCACCGGCGGCACCAAGGTGGTGGCCATGGGCGTGGCCCCCTGGGGCGTGGTCCGCAACCGGGAGGCCCTCACCAACCCCAAGGGCTCCTTCCCCGCCAGCTACCGGTGGCGCGGGGACCCCCAGGACGGGGTGCAGTTCCCCCTGGACTACAACTACTCGGCCTTCCTGCTGGTGGACGACGGCACGCACGGCCGCGTGGGCGGCGAGAACCGCTTCCGCCTGCGCTTCGAGTCCTACATCGCGCAGCAGAAGACGGGCCTGGGGGGGACTGGCATCGACATCCCGGTCCTCCTCCTCCTGATTGATGGGAACCAGGAGATGTTGAAGCGGATAGAGAATGCCACTCAGGCTCAGCTCCCCTGCCTCCTGGTGGCGGGTTCGGGGGGCGCCGCGGACTGCCTGGCGGAGATCCTGGAGGACTCTCTGGCTCCGGGGAGCGGAGGGGGCCGGCGAGGGGATGCCCGAGACCGGATCAGGCGTTTCTTCCCCAAAGGGGACCCCGACGTCCTGCAGGCCCAGGTGGAGCGGATCATGACCCGGAAGGAGTTGCTGACAGTCTACTCTTCGGAGGACGGCCCCGAGGAGTTCGAGACCATCGTTCTGAGGGCTCTCGTCAAGGCCTGCGGGAGCTCCGAGGCCTCAGCCTACCTGGACGAGCTGCGCCTGGCTGTGGCTTGGAACCGCGTGGACATCGCCCAGAGCGAGCTCTTCCGGGGTGACATCCAGTGGCGGTCCGTCCACCTGGAGGCCTCCCTCATGGACGCCCTCCTGAACGACCGGCCGGAGTTCGTGCGCCTGCTCATCTCGCACGG
CCTCAGCCTGGGCCACTTCCTGACGCCGGCGCGCCTGGCCCAGCTCTACAGCGCGGCGCCCCCCAGCTCGCTCATCCGCAGCCTGCTGGACCAGGCGTCCCCCGGCGCCGGCGCCAAAGGCCCGGCCCTGAAGCCCTCCGCCGAGCCCCGGCTCCCCGACGTGGGGCGGGTGCTGCGGCTGCTGCTGGGCGAGATGTGCGCGCCCAGGTATCGCGCCTGGGCCGCGGGGGACCCCCACCGCGACCACGGCTGCAGGGACGGCGGCGGCGGCGGCCTGGAGAGCGCCCAGCTGCTGTGCGTCAGGACCCCCTCGGAGCTCATGCTGGACGCGGTGCTGGGGCAGACCCCGTGGAGCGACCTGTTTCTCTGGGCGCTGCTGCTGAACAGGGCGCAGATGGCCCTGTACTTCTGGGAGATAGGCTCCAACGCCGTGGCCTCGGCTCTGGGCGCCTGCCTGCTGCTCCGGGTGCTGGCGCGCATGGAGTCTGAGGCCGAGGAGGCAGCTCGGAGGAAGGAGCTGGCAGCCAAGTTCGAGGGGCTCGGTGTTGACCTCTTCGGCGAGTGCCACCGCAGCAGCGAGGAGCGTGCCGCCCACCTGCTGCTCCGGCGCTGCCCGTTCTGGGGGGACGCCACCTGCCTGCAGCTCGCCATGCAGGCCGACGCCCGCGCCTTCTTTGCCCAGGATGGGGTGCAGTCTCTGCTGACCCAGAAGTGGTGGGGGGAGATGGACAGCTCCATGCCCATCTGGGCCCTGGTTCTCGCCTTCTTTTGCCCCCCACTCATCTACACCAACCTCATCACCTTCAGGAAGTCAGCGGAGGAGTCCACACAGAAGGACCTGGGGTTTGACATGGACGGGAGCCTCAATGGGGAAGGGCCTGTCAGGCTGACCCCGGGCCTGTATGACCTGGGCCGCACAGTCCTCTGCCTGGACTTCATGGTCTTCACGCTGCGCCTGCTGCACATCTTCACGGTCAATAAACAGCTGGGGCCCAAGATCGTCATCGTGAACAAGATGATGAAGGACGTGTTCTTCTTCCTCTTCTTCCTCGGAGTGTGGCTGGTGGCCTACGGGGTGGCCACGGAGGGTCTCCTCAGGCCCAAGGACCAGGACCTCCCACAAATCCTGCGCCGCGTCTTCTACCGGCCCTACCTGCAGATCTTCGGGCAGGTCCCGCAGGAGGAGATGGACGTGGCCCTCATGGAGCTCGCCAACTGCTCCTCGGAGGCGGGCCAGTGGGCGCGCCCGGTGGGGGCCCAGGCCGGCTCCTGCGTCTCCCTCTACGCCAACTGGCTGGTGGTGCTGCTCCTCGTCATCTTCCTGCTCGTGGCCAACATCCTGCTGGTCAACCTCCTCATCGCCATGTTCAGCTACACCTTTGGCAAAGTACAGGGCAACAGCGACCTCTATTGGAAGGCGCAGCGCTATAGCCTCATCCGGGAATTTCACTCTCGGCCCGCGCTGGCCCCGCCCTTCATCATCATCTCGCACGTGCGCCTCCTCTTCCGTCGATTGCGCAGGCACAGGGCCAGACTGCCGGCCTCCCCCAACCTCCAGCATTTCCGGGTCCACCTCCCTAAGGAAGCCGAGAGGAAGCTGCTGACCTGGGAATCGGTGCGGAAGGAGAATTTCCTGTTGGCGCGCGCTAGGGACAAGCGGGAGAGTGACTCAGAGCGTCTCAAGCGCACGTCTCAGAAGGTGGACATGGCCTTGAAGCAGCTGAGACAGATCCGCGAGTACGAGCAGCGCCTGAAAGGGGTGGAACAGGAGGTCCAGCACTGCAGCCGCGTCCTGGGCTGGGTGGCCGAGGCCCTGAGCCGCTCTACGTTGCTTCCCCCAGGGGGGCCTCCACCCCCGACCCCGCCTGGGCCCAAAGACTGAGCCCTGACGGCGGACTTCAAGGAGTAGCACCATGGGCGGTTTTTGCCCCCTGGACCCCAGTAGGTGGTGGCCCTGTCTTGAGGTGGGCCCTGTGCCATGGACTGGATCGCCGTGGGGA
CCACTGCAGGAGTCTCACCCGTTCGGACCACAGCAGGCCGGGCCCCGCCCAGAGCCAGCCCCACTGTGGGAGGTGCCGCCTCTGGAGGCCAGGCTGGCCCCTCCGCAGGCCCTGCCCCGGCCCGCGGGGCTGGAGAAGGCGTCAGGTCCTGGGGGCACAGGGACCACAGACCGCACTCAGCTCCCCACACTGGGGAAATAAAGCCACGTGAGCGTC\n>MT775861.1 Lolium arundinaceum CDF1 (CDF1) mRNA, complete cds \nATGGGGCAGTACAGGTCGGCGGCCGGAGGAGGAGGAGACTGCCAGATCAAGCTGTTCGGGAAGACCATCCCCGTGCCGGACGCCAGCGCCGGTGCCGACGACAAGCAGAACCTTCAGCACAGCAGCAGCAGCATGATAGAACCAAGAGTAAAAGAAATCGTCCCTCAGGACTCCACGGATTCGCCTCCACAGCCCGAGGTTGTGGACATGGAGGACCCATCTGCTGTCAAGAACTCGTCAGAAGATCAGCAGGAGGAACAGGGTGACACGGCCAATCAGAAGGAGAAGCTCAAGAAGCCTGACAAGATCCTGCCCTGCCCCCGGTGTAGCAGCATGGACACCAAGTTCTGCTACTACAACAACTACAATATCAACCAGCCGCGGCACTTCTGCAAGAATTGCCAGAGGTACTGGACGGCAGGTGGTGCCATGCGCAACGTGCCCGTGGGTGCAGGCCGTCGCAAGAGCAAGAGTATAACGGCCGCTTCCCACTTCCTTCAGAGGATCAGGGCCGCTATGCCCGGTGATCCTCTCTGCACCCCAGTCAAGACCAACGGCACGGTGCTCAGCTTCGGGTCCAGCACATCCACCTTAGACCACACAGAACAAATGAAGCACATCAAGGAGCTCATCCCAATAACCCGGATCGAGAACACCGATGACCCATCGGTTGGGTCTTGTGCTGATGGATGGGCCAAGGCAGAAGAGTCAAACCAAATGAATTCAAGGGAGAGAGTTGCAGCAGATGAACCCGCAAACGTTGTGCAGCATCCATGCATGAACGGGGGAACCATGTGGCCATTCGGTTACGCACCATCACCTGCCTATTTCACCTCAAACGTAGCAATTCCATTCTATCCAGCACCTGCTGCTTACTGGGGCTGCATGGTTCCGGGAGCCTGGAACACTCCATGGCAGCCACAGTCTCAATCTCAATCTGGCTCATCACCTAGTGCTGCTTCTCCAGTATCAACAGTGTCGAGCTGCTTCCAGTCACGAAAGCACCCTAGAGATGGAGATGAGGAAAGAAATGCCAACGGTAATGGCAAGGTGTGGGTGCCGAAGACGATCCGGATTGATGACGTAGACGAGGTGGCCAGGAGTTCTATCTGGTCGCTTATTGGGATCAAGGGCGACAAGGTGGGGACAGATGATTCCAGAGGGTGTAAGCTTGCAAGGGTTTTTGATCCAAAGGATGCGGCAAAGACGACAACTCACAGAGTTATCAATAGCTCGCCGTTCTTGAAGGGGAACCCAGCTGCACTATCGCGATCAGTGACCTTTCAAGAGAGATCTTGA\n>XM_033534398.1 Aaosphaeria arxii CBS 175.79 glycoside hydrolase family 5 protein (BU24DRAFT_56693), mRNA 
\nATATACACTACGCTATTACACTACGAGCCGCCGCCGCCGTTATGGTTTGTTCGCTCGCCACAGCTCCCTCCGTGTCGAAAAGGGTAATGGTTTGATTTACTTCGAGATGGAATTGAATTTCGAGGACTTTATATTCGAGGCTTTTGCCTGCAATTTTCGAGTTTGATTTCTGTAGCAATCTCAATTGTCAATTACTGAGGTCGAAGAATCATGCTGTTTGATCTGCCAACTTTCATCTCTTTGGCCCTTGTGGCAAGCCAGGGTACGTCGGCTGCTGCTGTCATCGGCAAGAGACAGCAATCGTCAAGTGGATTCGTCACTACGGATGGAAACAAGTTCTTGCTTGATGGGAAGGACTTCTACTTCGCCGGTAGCAATGCCTACTATTTCCCTTTCAACGACAAGGCAGAAGACGTTGAAGCCGGCCTCACTGCCGCAAAGGAAGCAGGTCTGAGTGTATTCAGAACTTGGGGATTCAACGATAAGAACAAGACTTATGTCCCAGGTGGTTTGCCCCAGTATGGAGGCGAAGGTGCGGGAGATACCTCGAATGTGTTGCAGCTGTGGGAGAATGGCACTTCGACTATCAACCTCAAGCCATTTGACAAAGTTGTTGCTGCAGCCGAGAAGACTGGCATCAAGCTTGTCGTTGCTCTGACCAACAACTGGGCGGACTACGGTGGTATGGATGTTTACACCGTACAACTAGGTGGCAGATATCACGATGATTTCTACCGCCTACCGGCGATCAAGACCGCATTCAAGAGATACGTCAAGGAGATCGTAACCCGCTACTCCAACTCCAGCGCGATCATGGCCTGGGAACTCGGCAACGAGCCCCGCTGCGGCGCCGACGGCACGCGCAACCTCCCGCGCTCCGACGACTGCAAGCCCGAGCTCCTGACCGCCTGGACGGACGAAATGAGCACGTACATCAAGAGCCTCGACAAGAACCACCTCGTGACCTGGGGCGGCGAGGGCGGCTTCAACATCCAAGGCCACGAGGACGGGTTCTACAACGGCTGGGACGGCGGCGACTTCGACGTCGAGCTCGCGCTCGAGAACATCGACTTCGGCACTTTCCATTCGTATCCGGATTGGTGGTCGAAGACGGTGGAGTGGACGGATCAGTGGATCAAGGACCACGCTGCGTCGGGTCGAAAGGTCGGAAAGCCTGTCGTTCACGAAGAATACGGATGGCTCACCGACGACAAGCGCCAGGAATACCTCGGCAAGACGTCCAACATCACTCGCATCGAGGCGCTCGGCCTCTGGCAAGCAACCTCCATCGCCGAGAAGATGCCAGACATGTACTGGCAGTTCGGCTTCTCCAACTACTCGTACGGAAGGAATCACGACGATGGGTTCACCATCTTCCTTGACGACGCGGAGGCTCAGACTTTGATCTACGACCATGCTAAGAAGGTTAATGCTTTGAATGGGAACTCGACGCTGCGTAGGTAGGACGTT\n>XM_050200589.1 PREDICTED: Aphis gossypii uncharacterized LOC114125601 (LOC114125601), transcript variant X2, mRNA 
\nTACATTTTAGTGTTATTATCTATATCATTTTACATAATACTTATAACAATTATATTTATATAATAGGTATGATTATATTATACATATTATTTTATGTTAATCTATGATTCATCAGCAGAATAGTTAAAATAAACACTAAATGGCCACGATAAGACAACAAATCAAACGGAACACGAGAATACACAAGAACGTCAAGAGCCTAAACTCGAAGGCTAACAGTTTGGTTCTTATTATGTAATGATTTATAGGTAGTTGTTCATATTATAATTCGCATCATTTGCCATTTGTATAAAAAACGATTCGTTGTAACCCTTACATTATGGATTTCGAAAGTGAATTTTTGAAGACTTATAGAATTTTGAAATGGGATGAGTTCACTGTGCTGAATAATGACCGTATATCAATCAACGAGAAAATCACTAACAAGGTGATAACTAAACATGAGTTGTTACTGCAGTTTAAAGCAGAGCTGAGTTTGCTTAATGCGTGTAAACACAAAATCAAAGACGAGTTGGAACAAGGTTTAGATGTTATTGATACTCAAGTACTTGTCCTCCTAAGCAAACGTGTTATTGAATTGTTTGATCATATGCATGTTCTGTTTTCTATTGATGAGAAGCTGTTATTTTATTTTATCAACTTTTGTCAAGACAATGTAAGCTACATACATGTAGACCAGCTAGATATTTTATTAGATGCTGTTTTGTGTACAGAAAATAATCAAAAGATTTGGATACGATTATTAAAGCTTTATTTGGAATTAAATAGTTTTGATAAATTGATGACTGTTTTTCAAGAAGGTGTTCGTTCATTAAAAAAAAATTCACTACCTTTATGGAAGATTATAATTCGATTTATGCAAATTAGGCGTCCTGATATGTACAAAGACATAGATGCAACTCGTAACCTGTTCAATGAACTAAAAAAGTTAAAGCCACCATGTTATAAATTGTATTTAATAATGATGGCTATTGAATCAGAGACATCAGATTTTGAATTACTGACTGTTAGAAAATTGTATGATGAAGCTTGCATTTTATTTGGCACAGATAACATTGAAGTATGGCTTGATTATATTCGTTTTGAACAGACTGATGGCTCCCCAAAATTAATGGAAAGTATTTATACTAGAGGTTTATGGAAACTGGAACCGAATTTAAAAAATACTTTCATAGAAGAGTATAATAATATTAAACGTGAATTTATGAATAGTTTAGGAAAAGAAGTTATAGTCATTGATGATTGAAATATATATTATATATTATAAACAAAAAATGGCGAATTTATTTAGAGATCTCCTTATTTATTTAATTTTTAAATTAATATTATAAGTGGGTCACTTAATAATATTAATACATTTGTATACTTTGGTTTTATTTGGTCATATAAAACAGTTTATTGTATTAGGCAAACAGTGTAGTACAGTGAAACTTCTGTTAATAGTTTACTTTGAAAGACTTCTAAATAAATAAATATGTATAATATGTATGTACAACATCACTTCTGCAAAGTTGCATTTTTTTCTGTTTTCTATAGTTGAACAGTACAAAAGTCTCACTGTACCATTTAGACGTCACAGTTAATGACACAATCTTAAATTTAACAATAGAAGGTTAATGGTATTTTTTTCTTTTATAATGTGTGTAATTGAATAATGTTTTATGTTACTTAATATTTTAAGCACTATTATATTTATAAATATATCATTTTATTTTATTTACATTGTCATAATTGTAATTTGTGCAATACCTATTAAAATAGACGGTTTGATGATAATAAATTATAATTTTTTACCTAA\n>XM_026522476.1 PREDICTED: Papaver somniferum putative F-box protein At1g52490 (LOC113272669), mRNA 
\nATGGAGAAGAAGTTTCCTAGTGACATAATGCTAGATATAGTATCTCCCTTACGGCACGAAACCATAATACATTGCAAACTAGTTTGCAAACCCTGGCGAGATATACTAAACAATATCAAGGTAGGTGTCCTTTTTAGGTTTGGGAAACCTGCTTTCAATTTCTGTTATAGAGGAGAGCAATACGATGATATTGATATGCATGAGAATTACTCTTACACGACACTGGTGGAAATCGATAAGCATCGGCCTGTCGAGCTAGAACCCTTGTCTGACATGGTTGGTTCATGTAATGGTTTGGTTTGTTTTTCTGTAAGGCGCAAGTTCACTGTTGCGTATGATCCCATCTACATCTGTAATCCCGTCACAGAGGAATATGTATATCTTCCAACATTCAACTATGATGAACCATATGATGATCTCCGGGTAGCTGGTTCTTTTGATTGTGGTTTTGGTTATCATCGTTTCATGGATGAGTACAAAGTCGTTAGAATCCACGGGGCTCTGAGAGATTTTAGTAAACGCTCGCAGAGCCGGAAAGTTGAAGTATACACTTTGGGTAGTGGTCATGGGTGGAGAGATAAAGGAAGCATCGATCACTTATTAGTTTGGGACCATGGAGTTTGTGCAAATGGAGCCATTCATTGGGTAGAGTATCGGAAAAATAAAATTGTGGCTTTCGATTGTAGCAAATGA\n>XR_001996655.2 PREDICTED: Juglans regia pentatricopeptide repeat-containing protein At5g61990, mitochondrial (LOC108994206), transcript variant X3, misc_RNA \nACCATCTCTGCTCTGCCTCTCGAGTCCGAGTCCCCGCAGCCGTCTCTCACGCCGAGCCCCTCTCTCACGCCGTCAACAGCCCCTCGCCGTCGACACTGTTATTCCGTTCTGTTCTCCTCCGCTTCCAGTTGTTCCCGAGGCTACAGAATCACAGATATTGTTTTCCCCTCTCTCGGCGAGCTAATCGGTCAGGAATAAAATGGGTCTACTTTCTCAGAGAAACCTCCTTGCATTTGCACTCCGAAATCGAAATGTTGTCGCAGAAGCACAACCATCAAGACTTCTTTTTGTTTATGCCAAATCCTTCAGCTTTTGCACCTCGCAGACTTCAAAACAGAATGAAGAGCTCACAATCGAAGAAATCTCCGCCTTTCTCAAGCAAAGCAACTGGCAGTACCTCATGGAATCGTCAAATATACCCAAGAAGCTGAACCCAGAGGTGGTTCGGTCTGTTCTTCAACATAACTGGGTGAGTGACCCCAAACGCCTCCTTCATTTTTTTGATTGGTCCGCTTCTTTGATGGGCGTTCCTCAAAATCAGTATTCTTTCTCGATTCTTGCAATTGCTCTATGTAATTCGAGGCTTTTCGCCCATGCTAATGGCGTCTTAGAGCGAATGGTGGGAACCCGGAAGCCGCCGTTGGAAATTCTTGATTCCATTGTTACTTTCTTTGTAGAATGTGGTGGGTCTAATGTGGTAGTTTTTGAGATTTTGGTGAATGCTTATAGGAAAGTGGGGATGTTGAATGAGGCTGCTAGCGTGTTTTTGGGAATTAAAAATGATGGGTTTTTGCCTACTTTGGTGTTTTGTAATTCTTTGTTGAAGGACTTGGCAAAGTGTAATAGGATGGAGTTGTTTTGGAAGGTTTATGATCGGATGTTAGAGGCTAAGATGAGTCCGGATGTTTATACTTATTCTACTGTGATAAATGCGCATTGTAAGGTTGGGAATGTTGAAGAGGGTAGGAGGGTGCTATTTGGTATGGAGGAGAAGGGCTGTAGTCCTAATTTGGTTACCTACAATGTGGTGATTGGCGGATTGTGCAAACATGGGGCTGTTGATGAGGCTCTTGAGTTGAAGAAGTTCATGGCTGGGAAGGGGTTGATCCCAGATGCCTATACTTACTCTATGCTTGTTGATGG
GTTTTGCAAACAGAAAAGGTCAGAAGAAGCAAAGTCGATATTGGAAGAGATGTTTGGTATGGGTTTACGTCCTGATCACATTACCTACACTGCTTTGGTTGATGGGTTCATGAAACAAGGTAAGGTAGAAGATGCCTTGAGAATCAAAGATGAGATGGTTGCCCGTGGAGTAAGCTTAACTTTGGTAACATATAATGTACTTGTCGGTGGGTTTTGTAAGGTTGGTGAGATGACGAAGGCCAAAGCTCTCATCAATGAGATGAGTGTGATGGGAATAAAACCAGATAGTTATACTTTTAACTCTTTAATTAGTGGTTATTACAAAAAGAAAAATATGGTTGAGGCTTATCAACTTCTTCTTGAGATGAAGAAGTGGAACTTGGCACCCACAATATTCACTTATGGTGTGATAATAAATGGCCTATGCCATTGTGGAGATCTGCAAGCAGCTAATGGTGTTTTGGAGCAGATGATTGCAGGGGGTTTGAAACCAAATGCTGTTCTATTCTCAACTCTAATCAAAGGTCATGTACAACAAAGTAGATTTGACGAGGCAATAACGATATTAAAAGGAATGGAGGAAAAGGGCGTTCTGCCTGACATGTTTTGTTATAATTCTCTTATAATTGGCCTCTGCAAGGCCAAAAAAATGAAAGATGCTGAGAATTTCTTGGTTGAAATGATCGAGAGGGGTCTTAAACCTAATGAATATACATATGGGACTTTCATCGATGGATATGCTAAGGCGGGGAATATGCAATTAGCATACGGTTATTTCATAGAAATGCTAGGTTGGGGTATAGCGCCCAATGGTTTGATCTGCACGGCCTTGATTGATGGGCACTTTAAAGATGGTAACGTAACTGGAGCTCTTTCTGCATTTCAATTATTACTTGGACAAAGGGTCATCCCAGATATCCAGACTTATAGTGTTCTCATCCATGGTCTTTCTATGAATGGAAAAATTGAGGAAGCAATGGAGGTTTTATCTGAAGTCCTTGACAAGGGTCTGGTGCCAGATGTTTTTACCTACACCTCTCTCATTTCTGGATCCTGTAAGCAAGGTGATTTAGACAGAGCTTTTCAACTCTATGATGAGATGTGCCAGAAAGGCATCACTCCAAACATTGTTACTTATAACTCCTTGATCAATGGACTTTGCAAGTCGGGTGACATTGAGAGAGCTAGGGAACTGTTTGATGGAATCTCAAGAAAGGGTTTGGCTAAGAATGGTGTGACCTATGCTACGATTATAGATGGATACTGCAAATCTGGAAATTTAGTTGAGGCATTTCAATTAATGGATGAGATGCCATCTATGGGGGTTCCACCTGATTGTTTCATCTATTGTGCCCTTGTTGATGGGTGCTGCAAAGCAGGAAACATGGAGAAGGCCCTTTCCTTATTTCATGAGATGGTGCAGAAGGGCTTTGCTTCCACACCTTCTTTTAATGCTTTGATTGATGGCTTCTCCAAGTCCGGGAAATTGGATGAAGCTAACCAATTGTTTGAAGACATTGTTGATAAGCATGTGACCCCAGATGATGTGACCTACACAATTCTGATCAATTCGCACTGCAAGGCTGGATTAATGAAGGAAGCTGAGAAGCTCTTTCTGGAGATCAAAAAAAGAAATCTCAAGCCAAATATTTTAACTTACACTGCACTCCTGCATGGGTACAACAACATAGGGAGCAGAGATAAGATGTGTGCTCTTTTCGATGAAATGGTGGCAGCGGGGATTGACCCTGATGAAGAAACATATGGCATGCTCGAGAGAATTCCGTTGATATCTGAGGCTGCAAATACAGAGAGGCCATCTTCAATCACAACTAGCCTTTTCATTGGTGGGGCGCTGGCTGCAAGATCTGATATCTGACAATGAAGATACAAATATTAGTAGTATCTTTGAAGAAGCTTCTGATTCTATTGATCATGTTGAACAAATAGGTAGAAGTGCCACCTTGGTGATGGCGTACTTAATGCTCAGGAAGAACCTA
ACTCTACTAAAACGAGTTCACCACTGAGCCCAGCGCAATGATGGCTTTGCTAGGATCCTTTTGGATCTGGATAGGAAATTACATGGGACACAGCATCCATGGAATGGCGACAACGAAAGCCAATGATGAAAGTTTGCCCCATTTGTGGGAAGAAGGCCGGTCTGAGCAGCAGTTCACTTAAGCTTCATTCGCAGAAATCACACAAGAATCTTTAATCAGGAAGTGTGGACAGTGGCATGACCATGGAAATACAAAAGTCTTTGACAGCACTCAAACGGGGTCTGCCCGAGTCGAAACTGCTCCCTCGCCTGCGTCGATTGTGCTCTGCCCACCGCCTCCAGCGACACCATCTCTTTCCAGCGACACCGAGGCCGTCTGCACAGCTTCGCCACACCCCTTGTCGCCCAGCTTTCCTCCCTCCCCATTGCCAGCCCATCTCCTTTTCTTCCTCTCCCCACCCCTCGCATCTCCCCCCACCCGCGCCAGTGTACCGGATTCACTAAACGCCCAGCCCTCGTCCCACAGCTCTCCTCCCTCCCTGTTGCCCTCATCGTCCCAGAATTGATATCAACGATCCCTAGAGTCCCTGCTTCAGAATCGACATCAATGAATCTACATCTTGGCAGCCAGGTCCGCTTTATCTGAAACTCCTCACAAAGCATCACCAGCAACTCCAAGAGTTGCTAGACCAAGCAGGGGAGTAGCTAAATCATAATCTGATTCACCCTCTCCTTTGCAAAGTTCACGCCTTTCAGTTGATCGGTCTCCACGATCAGTTCCCTTGAAGCCCACCATAAGATCACCAAAACTTGCTACCCCACCTGAAGTCACTGCAATTGAAATTAATAACCTTTTTCGCGAAGACCTCTTCCTTGCCAAGGTTGGGATGGAGTGCGGCATCGGGATTTTGCAACGTCATTTTCAAGATTGTAAGGGAATCACAACATGAAGCTTTTGCAGCTCTTCATCACAGCATCAATTCCAGTCTTGAAACTGCTCTTGATTTCTGGACTTAGGGTTTATGCCAATCAGAAGAAGATAAACTAATAGAAAGAGAGAATGATCTTCACAAGCTTGAGGACGAACTTTGAAAGCGGATAGTAGAGAATAAATGTGCACATATATTATTGTGTTTGTACTAAGTTTTATTTATTGTAATGGTTTCTAGTTGGTTCAGACTATTTCTGGTTGGTTTTATCATCAATGTGTACTTTATCTATTGCTGAAGATGAATTTAGTTCCTTTTTTTCTCTC\n>HQ320065.1 Uncultured bacterium clone RMAM1139 16S ribosomal RNA gene, partial sequence 
\nCAGTCGAGGGGCAGCGGGGGTAGCAATACCCGCCGGCGACCGGCGCACGGGTGAGTAACGCGTATGCAACTTACCTATCAGAGGGGGATAACCCGGCGAAAGTCGGACTAATACCGCATGAAGCAGGGGCCCCGCATGGGGATATTTGCTAAAGATTCATCGCTGATAGATAGGCATGCGTTCCATTAGGCAGTTGGCGGGGTAACGGCCCACCAAACCGACGATGGATAGGGGTTCTGAGAGGAAGGTCCCCCACATTGGTACTGAGACACGGACCAAACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGGCGCGAGCCTGAACCAGCCAAGTCGCGTGAGGGATGAAGGTTCTATGGATCGTAAACCTCTTTTATAAGGGAATAAAGTGCGGGACGTGTCCTGTTTTGTATGTACCTTATGAATAAGGATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATCCGAGCGTTATCTGGATTTATTGGGTTTAAAGGGTGCGTAGGCGGCCTTTTAAGTCAGCGGTGAAAGTCTGTGGCTCAACCATAGAATTGCCGTTGAAACTGGGGGGCTTGAGTATGTTTGAGGCAGGCGGAATGCGTGGTGTAGCGGTGAAATGCTTAGATATCACGCAGAACCCCGATTGCGAAGGCAGCCTGCCAAGCCATGACTGACGCTGATGCACGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCAGTAAACGATGATCACTAGCTGTTTGCGATACACTGTAAGCGGCACAGCGAAAGCGTTAAGTGA\n>XM_048817709.1 PREDICTED: Caretta caretta kinesin family member 19 (KIF19), transcript variant X2, mRNA \nGTGCTACTGTGTCAACAGGAGCCTGCTGCGCTGCGGTTGTTGTGTACAGTTTAAAGATCTCCAGGGGAGCCGGCGAGATCCCGCAGGCAGCAAAAGCAGCTGGGCAGAGCTGGGCTGGCCCTCCTGAGTACAGCCCGGTCAGCTGGCGTGAGAGGCAGCCGGGGCTAGAGCTCCCCGAAGGGAGCAGGAATGCTGCACCCCAGCCCTTTGTGGCTCTGTAGCCTCCTGGGGGGCCGAGAGGACAAAAGGCCCTGAGCCCGTGGATGGGAAAGGAGCAGGCAGGGCTGGCGTCGTCCCTGCAGCCCGCCTCCCCCTTTTGTCTCTGGGAGGATTAGCCTAAGTCTCAGGTTGTTTAGGAAACAGCGGATGCAAGTGACAGGTCTGTGGAGGGGGGAGTGGCGGTTGCAGGGTCCTGAGAGCCATGCCTGTGGCAGCTGCTGCTGGCCCTCCCCTCTAGACCCTCTGTGCACCTGCCAGGATCATGAAGGAGGTGAAGGAGTCCAGAGACCAGCAACTCACGGTGGCCCTTCGGATCCGGCCGATCAGCATGGTGGAGCTGGAGGAAGGAGCTACTCTCATAGCTCATAAAGTGGATGAACAGGTAGCGGTGCTCATGGACCCCATGGAGGACCCCGAGGACATCCTGCGAGCCAACCGCTCCCGCGAGAAATCCTATGTCTTCGACGTGGCCTTTGACTTCACGGCAACTCAGGAGATGGTCTATCGCGCCACCACCAAGGGCCTGATCGAAGGTGTCATCTCTGGGTACAACGCAACCGTCTTCGCCTACGGCCCCACCGGCTGCGGGAAGACGTACACCATGCTGGGCACAGACCGTGAGCCCGGCATCTACGCACGCACCCTCCATGACCTCTTCAGAGCCATTGAGGAGACCAGCGATGACATGGAGTATGAGGTGTCGATGTCCTACCTCGAGATCTACAACGAGATGATCCGGGACCTGCTCAACCCGTCGCTGGGCTTCCTGGAGCTGCGGGAGGACGCCAAGGGAGTGATCCAGGTGGCGGGGATCACGGAAGTCTCCACCATCAACGCCAAGGAGGTCATGCAGCTGCTG
CTGAAGGGGAACAAGCAGAGGATGCAGGAGCCCACGGCCGCCAACCAGACGTCGTCGCGGTCCCACGCTGTGCTGCAGGTCACCGTCCGCCAGAAGCCCCGCATCAGGAACATCATGCAGGAGGTGCGGGTGGGGCGGCTCTTCATGATCGACCTGGCTGGCTCCGAGAGGGCATCTCAGACCCAGAACCGTGGGCAGAGGATGAAGGAGGGAGCCCACATCAACCGCTCGCTGCTGGCCCTGGGGAACTGCATCAATGCCCTGAGCGACAAGGGGGCCCCCAAGTACGTCAACTACCGTGACAGCAAGCTCACCCGCCTCCTGAAGGACTCCCTCGGGGGCAACAGCCGCACAGTCATGATCGCCCACATCAGCCCTGCCAGCAGCGCCTTCGAGGAGTCCCGCAGCACCCTCACCTACGCCGACCGCGCCAAGAGCATCAAAACCACGGTGAAGCGGAACCTGCTCAATGTCTCATACCACATTGCCCAGTACACCAGCATCATCTCGGACCTGCGCAGCGAGATCCAACGCCTCAAGTGCAAGATCGACGCGCCGGGGCCGCGCCCGGCCCGGGGCGAGCGGGGTGACATCCGCCACATCCAAGCCGAGGTGCAGCTCCTCAGCTCCCTCTGCGACCGGCAGGAGATGGACCAGCTGCGGGAACAGCTGATCGGTGCCTTCCAGGAGCAGATGGACCTGCGGCGCCAGCTGATGGAGCTGGAGAACAGCTACATGGAGATCCAGATCGAGAGCACCCGGCACCTGCTGACCATTGCGGACTGGGACCAGGAGAAGAGGCACCGGGCGCAGAAGTGCAGGGAGGAGCTGAGGAAGGAAGAGAGCGAGAAGGATTCGGACACCGGGGATGAGCAGCCGGACGCGCCGGAGCCACAGGAAGTGAGCTCGGCCAGGGAGAACATCGCCGCCCTCATGGGGGAGCAGAAGAAGCTGCGCAAGCAAAAGGCGGAGCTGGAGAAGCGGTTCAAGGAGATCCGCCAGCGGGGGCGGCGGCTGGAGGAGGTCCTGCCTCGGCGCATCAGCTCGGAGGAGCAGCGCGAGGTGCTGAGCCTGCTCTGCAAGGTGCACGAGCTGGAGCTGGAGAACACAGAGATGCAGTCCAGCGCCCTGCTGAAGGACGGCGTCATCCGCCACAAGAACTACGTGGTCCGGCGCTTCGAGCAGCACCGCAGCCTCTGTGGCCGCATCATCCAGCAGCAGAGGCAGATCATCCACGAATATCACCTCTCAGTCCCGCACCACCTGGAGGAGCTGTATGAGATCTACCTGCGGGAGCTGGAGGAGGGCAGCCTGGACCGGGTTGCCAGCCTGGACCGCGTGGCCGCCAAAGCCCTGAAGGATACGTCTCTGCCCAAGATCCCCCACCTCCCGGCTGCTGAGAGCGCCCTGGACTCCGACCAGGAGAGCGTGAGGACGCTGGGCTCAGAGCACCAGCCACTGCTGCGGCGTGACTCCCGCAGGCAGGCCCTGCCGCCCCTCGTGCTGGATGCAGAGAGCGACCCGGCCCAGGTGTTCAGGACCAGCCCTCGGGTGCGGCAGATCAAGAGTTCGGCTGTGCTGACCCCGCCCCCCATCCACATGAACGGCATGGTGACCCAAGAGTACCTGCACCGGGGGAGCCTGGCCAGCCTGGAGAGCCCCCCCAACTCCTCCCCGGACAGCAGCGAGAACTGCTCGGACGTCGCTCTGACGCGCAGAGAGCGCAGGGAGATCCTGAGCAGCACCAAGAACATCGCGGTGAAGGCTGCCCGGCGCCGCTCCAGGGTGCTGGAGTCCGACCGGCTGCAGCTGCTGGAGCCCATGAAGGAGCGGAGCAGCCTGTCGCTGCACTCCCTGAGCGAGAGCGAAGACCCCCTCTCCCCAGAGACCCCCGCCTCCCGGGGCCCGCCGTGCCCCGGCCTGCAGCATGCCGCCAGCGAGGACAACCTGTCCAGCAGCACCGGGGAGACGGCCTCGCGGGCCGAGGGCCCCTGCCCCAG
CCACTCCCCCGGGCCCTGGCTCCGGGGGCACAAGGAGGCTGGCAAGAAGCTGGAGAAGAGGGAGGAGTCGCTGGACGGCAGAAGGCGGAAACGACGGTCCAGGTCCTTCGAAGTCACCGGCCACGGGGTCTGGGGGACCCGGCATCTCTCCCGCTCCCCCTCCCTCCTCCCGGCAACTTGAAGAAAGGCCCCCAGCCCAGCCAGCACCCCCGCCTGAGCTACATCACGCTGAACGGCACCAACGCTTACGCCAAGGACGGCAGGAGCCGGC\n>BC147860.1 Bos taurus hypothetical protein LOC785621, mRNA (cDNA clone IMAGE:8182959), partial cds \nGAGTGAGAGGTAAAGCATCTCAGACACCAGAGTTAGGCATTTTGTTAAGACAGCTTCTCTTCCTAACAACCTCCATCAGAAGAAATATAAGTCCTTTGTCATTCTTATTCAGAGAAACCTGGGTTCAAGTCAGCCAGTCTTCAGACTTACTTGTGGGGAACCTGTTAGAAAGGAGCTCACTGCCGCTTCACTGCTCTACTATGTCCTTGGTGTTCACCTTGATGCTTGAGATGCTCCTGTTTCTGACAGGAGCTGGAGCCCAGTCAGTGACCCAGCCTGATGACCACATTGCTGTCTCTGAAGGAGCCCGTCTGGAGCTGAAGTGCAACTACTCATCTTCTGTTTCACCGTATCTCTTCTGGTACATACAGTACCCCAACCAAGGACTCCAGCTTCTCCTGAAGTACGTGTCTGGAGACAATCTTGTTTCAGGCATCAAAGGTTTTGAGGCTGAATTTAGGAACAGTGAGACGTCTTTCCACCTGAGGAAAATACCAGCTCATTGGAAAGACTCGGCCAAGTACTTCTGTGCTCTGAGCCCGATGGATGGCAACTATCAGTGGATCTGGGGCTCTGGGACCAAACTAATTATAAAGCCAGAAGTCAAGGACCCCAACCCCACTGTGTACCAGCTGAGAAGCCCCCAATCCAGTGACACTTCTGTCTGCCTATTCACCGATTTTGATTCAAATCAAGTCAACATGGAAAAAATCATGGGGTCCGAGGGGAGCACGGTGCACAAAACAAACAGCACCGTGCTCAACATGGAGATCCTGGGATCCAAGAGCAACGGGATAGTGACTTGGGGAAACACCAGCGATGCTGGATGCGAATACACCTTCAACGAGACCATTCCCTTCGCCTCCAGCTTGGAAATCTCCTGTAATGCCAAGCTGGTAGAGAAAAGCTTTGAAACAGATATAAACCTAAACTCCCAAAACCTGTCAGTGATAGTGTTCCGCATCCTCCTCCTGAAGGTGGTCGGGTTTAATCTGCTCATGACGCTGCGGCTCTGGTCCAGTTGAGGTCACCGACAACCTGAGAGCCCCGTGCTCCCTCGCCCCTTGCTCCTCGTCGCCCTTCCTCTCCCTCTTCAAGCAGAGAGGCGCACTCTCTGCCCCCATGGATGAGAAGGCTCCCTCCTCCTCTCTGGCCTGGCTGGCCATAACACCAACTGGATCCTCCAGATACTGGTGATCAAGATGCTGACAAGCTGCCCAGCACGGCTGCCACCCACTCTCTTCCTCACTGCTGCTTGTCACTGCCTGGCATTCTTGGCAAAGTCGGGGGGCTGCTGCAGCCTCTCCTGGCTGTGGGGACACTCCCTCCCCACCCCCACCCCCCAGAGACTGCCTCTGATGTCCCACTGGATGGTGGATCCCCAGTGGGTTCTCCTGGGCTCTAGCTCCTGGAGAATGTTGTGTGTTGTTTATATTTTTTACATAGTGTTCATAAAAAAATATATATCACCCTTTTCCCCAACATGTGGGGAAAAATTATCTTTTCACGATCTAGGCCCTGCTCTTCTGTGTATCCGAGCCACATTGTATATTCTGCTGCCACGGCTTCAATAAAAGCGATTTGGAAGAGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA\n>XR_006744459.1 PREDICTED: Melitaea cinxia uncharacterized LOC123662241 (LOC123662241), ncRNA \nTTTTTGTATGACGCGAACTATAACGGTCGACTTTTACCTATACACAAGTATTAAGTTGCTTACCGTAGGAAGAGACGACCGAGTGTGTAT\n>XM_022921984.1 PREDICTED: Stylophora pistillata protein ZINC INDUCED FACILITATOR-LIKE 1-like (LOC111319159), mRNA \nTGTACCTAGTTGTTTTTATTTTGCATCGGCAGCAGTTGTGATTAATCTTAGGAAGGAAGTTGTTGTTGTACCCACAATGAATTTCTTAATGTCTTTCTTGCGTGGAATATTTTATCCTCCGGGAACAAATTCTTTGAATTGGAAGCTCTTCTTCATCGTTTTCCTCTCTACATTGTGTTCTGCAATGTCCATCACGATATTGTTTCCATTTTTACCAGCTATGGTGAAGAGTTTTGGGATCTCAGATGAAGACACAGGATATTTTGCGGGTCTTATAGCATCTTCAATGTTTATTGGACGCACAGCAGCTTGGTAAGTGTGGAGTGAATCTCTATTTCAATCAA\n>XR_008133656.1 PREDICTED: Oncorhynchus keta uncharacterized LOC118373694 (LOC118373694), ncRNA \nTGCCCCTGAACTAGACAGACTGGAACAACCTCCGTGATTTACAAGAAATCACCCGACTGTCTAGAAATGGAAAACCTTCAAACTAAGGCTGACCTATCACTTCATGAAGTACAACTTGGCCCCACATCACTTTAAAACATCAGCTGTCAATCCTCCCGCAGACATACAACTCCAGATACCCAACTCAACAGGCAGTATACATCAATGATGTCGCTCTTGCTGCTGGTGATTCTCTGATCCACCTCTACGCAGACGACACCATTCTGTATACTTCTGGCCTGATGCTGAATGAAGAGCTCTTCACTAGATACCAACACACTCAAAGGCGATTTTCTGAAAACCGCCGGAAAACGTGTGGCGAGACCCCATTTGCTCCAGTACTTTTTGATCTGCTGCAGCGCTGCTACACCACTTTCAGAGCAGCAGCACCAACCAAGACACTTCTCAGCACATTTTTGCATTCCAGTTCAACATTTACCTGCTCTGTTGCAGTCTATCGTTCTACTTCTGTGGGTTTTATGGCGGACTACAACCCCAAAATGTGTGTTCCCGCCACCAACTTGATGGGGTTGAAAAAACAAGTACATGTTCAAAGGTGGAAGAGACCCTCCAGAGTTGCTGCAGTGTGTGTTCTACTGGCTGTGATCATAGGCCTGTGGGATTCCTATGCAACTGCAGAGAGAGACCAGCTACAAAAAAGTCTAAATACCTCAACCAGAGAGAGAGACCAGCTACAGAATAGTCTGAATACCATGACCACAGAGAGAGACCAGCTACAGAATAGTCTGAATACCATGACCACAGAGAGAGACCAGCTACAGAATAGGCTAAATACCATGACCACAGAGAGAGACCAGCTACGTAATAGTCTATTTTCCACGAACACAAAGAAAGACCAGCCACAAAATAGTCTAATTTCCACAACCACAGAGAGAGACCAGCTACAGAATAGTCTGAAAACCATG\n>HM666087.1 Uncultured bacterium clone GB7N87003F9F57 small subunit ribosomal RNA gene, partial sequence 
\nAGAGCGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGCCCGTAGCAATACGGGAGCGGCAGACGGGATAGTAACACGTGGGAACGCGCCCTTCGGTTCGGAATAACTCAGGGAAACTTGAGCTAATACCGGATACGCCCTTACGGGGAAAGATTTATTGCCGAAGGAACGGCCCGCGTCCGATTAGCTAGTTGGTGAGGTAATGGCTCACCAAGGCGACGATCGGTAGCTGGTCTGAGAGGATGACCAGCATCACTGGGACTGAGGCACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGGATGATGAAGGCCTTAGGGTTGTAAAGTCCTTTTAACGGGGAAGATAAGTGACGGTACCCGTAGAATAAGCCCCGGCTAACTTCGCGCCAGCAGCCGC\n>XM_042080615.1 PREDICTED: Alosa sapidissima tensin 1a (tns1a), transcript variant X8, mRNA \nTTCTTTCTTTCTTTCTGTCTGTCTCTCTCTCTCTCTCTCGCTCTCCCTCCCTCCTCTCCCTCTCCCCCTGTGAGTCGTGTCATGGATTTGCCTTGCCTGGAGAGGCAGCCTTTCGAAATACCAGGCGTTTTTGGGAATACTGCATCCGATGCGGAGATCCGCTGACTCCCTGGAGATGCCCTCCGTGTCCCTCGGACTTCCGGCAGCTTTGGCCGGCCGGGCCAGGACCTGGGTCTGTCTCTCCTGCATGTTCTGGCCAGATGAGTTTGAAGGGGTCCACTCCCATACCTTCCGTGTGAAGGCATTCAAGAAAGCCAAGTGCTGTGCAGTATGCAAGCAGGCTGTCACCAAGGAAGGCCTGGTCTGCAAAGCTTGCCGGTTATCATGTCATAAGAAGTGTGAAGTGAAGGTCTCCACTGCCTGCACGACTGCTGCCAACTATGAGCTGCCTCCCACTGCTGAACTTCCCCTGAAACATGTAGAGACTCCGGGATCCACCAAATCCACCAGAAGTATGGACTCTCGTCAGAGACCCTCACGGAGCCTGAGTATGATCCAGAACCTGGATGACACGGAGGTGGACCTGGTCTACATCACAGAGCGGATCATCTCACTGTCCTTCCCCACGGGCTCCGACGAGCACAGCTACACCTCCCACCTCAAGGACGTGGCCGCCATGATGAGGTCCAAGCACGGAGAGCACTACCTGGTTCTTAACTTGAGTGAACACCGAAATGACATCGTCAAGCTGAACCCAAAGGTCATGGACTTTGGCTGGCCCGATCAACATGCACCTGCCCTGGACAAGATCTGTAGCATCTGCAAGGCCATGGACACCTGGCTCAATGCAGACATACACAATGTAGTTGTCCTACACAACAAGGGCAATCGGGGTCGGACAGGGGTTGTGATCGCGGCCTACATGCACTACAGCAACATCTCTGCCAGTGCTGACCAGGCCCTGGACAGGTTCGCCATGAAGCGCTTTTATGAAGACAAAGCCCTGCCAGTGGGCCAGCCGTCCCAGAGGAGATATGTACAGTATTTCAGCGGACTTCTCTCTGGTCATATCAAGATCAACAACAAGCCTCTGTTCCTGCACCACGTCATCATGCACGGCATCCCCAACTTCGAGTCCAAAGGAGGTTGCAGGCCGTTTCTAAAGATCTATCAGGGGATGCAGCCAATTTATATGTCTGGGATATACAATGTTCAAGGTGACAGCTCCACAAGTATCTGCATAACCATAGAGCCTGGCCTTCTCTTGAAGGGAGACATCCTGCTGAAGTGCTACCACAAGCGCTTCAGGAGCCCGAGCAGGGACGTGATCTTCAGGGTGCAGTTCCACACGTGTGCTGTCCACGACCTCGCCGTGGTCTTCACCAAGAATGAGCTCGACGAGACATTCAAAGATGACAGATTTCCTGAGTATGGGAAGGTTGAGTTTATCTTCT
CATTTGGACCAGAAAAGATAAAAGGGCTTGATCATCTGGAGAACGGTCCGAGTGTGTCAGTAGACTACAATACCCAGGACCCCCTGATCCGTTGGGACTCCTATGACAACTTCCACAAGCGCTGTGAAGATGCACCAGACGACGTAGTGCACACGCAGGGTCCAGTCGACGGCAGTCTCTACGCTAAGATCCGAAAGAAGGACTCCAACGAGGGCATTGTTTCCGTTAACGGCCTTCCGCCCTCCGAGCGTGCTCATCCTCCCCTCCAGCAGGCAGTCGGAGTAGCCAACCACGCGCTTCCTCTCCCTGTCGCCAACCACGCCCTCCCGGTCGCTGACCACGCGCTCTCTGTGAGCAGCGACTCGGGCAACTCCACCGCCTCCGTCAAGACCGACCGCACCGATGACCCGCAGTCCCAGCAGGGCGGCGCCGCCGGCGGAGGAAGTGGCAGCGGGGGGGCCTGCGTGAGCCAGCCGCCCGGCGCCGAACCGTCCCTGAGTCCGCGGGAGAAGCGCGAGCTCGAGCAGCTGCTCAGCGGTCTCGAGGGAGGAGGAGGAGCCCAGGGGGGCCGACAGGGGAGCCCAGCGGCCGTCGGGGGTATCCTCCACCTGGTGCCCGCGCAGGTGCACGTGAACGGGCGTGGCTTGATCCGCGCCAACACCGTCCCGGCAGCAGCATCCGCGCGCGCCGCAGACAGCCGGAGCGAAACCGAACGCGAGACTGATATCCTTGACGACGAGCTCCCAGAGGCTCCCAACAGCGCCGACAGCCTCGGGACGATCTCGTCTCTGGACGGACACGAGACGCCAGCCGCCGACAGCCAGGGACACAGCGACTACCAGACTCCCCAGCAGCAGCAGCAGCAGCAGCAGCAGCAACCGCCGTCTGACTCGACCACCGTGGACATCGAGGGACCGTCGGCTCTCCCAGATCTCCGGTCCAGCAGGAGAGACATGCCGGTGCACCAGGTGCACGGCTCGGCCTCCGCGCAGGAGCGTCTGATCGACTACAGCGACCAGAACGGGGCCATGTACCGCTCACAGTCCTACGGGGCTGCCCCAGCCATGGACCCAGGGGCAGCTGCCAGGCTTCTGCCCCAAGCGCCCGAAAGGAGCACGAGCAGCCGCGAGGCCGTCCAGCGCGGCCTCAACGCCTGGCACCAGTACGGCCTGGTGGACGACCCGTTCTTCGGGCCCATGTCGGGCCTGTCGCGCTTCCCCACGTCGCCGAGCGGCGCCTCGCAGAACGACGTGGAGCAGTCCATCGAGGCCCTCAACATGCTCATGATGGACCTTGAGCCCACGCAGACGCCTGTACCCAAGTCCCAGAGCGCCCCCCCGGGCGACAACCCGGCTACCTACCAGACGCCCTTCGCCCAGAACTACCCGAGGCCCTCGTACCAGGCGGACCAGGCCATCCACAGCTACTCGACGGGCTACCCGCCCTCCACCTCGGCCAGCTACGGCCAGTCCTCTCAGAGGTCCTCCCCGGCCTACCCGCCCATGTCGCCCTCCATGGAGCCCCACAGGGGGGCTTTCCACTCCCCCACCCACCCACAGGAGGCGTACATCCACCGGGGAGGTCCCGGGTCCCCGTCCCCCACCCTGCACCACCCGCAACCCCTGAAGCCCCAGAGCGCCTTCACCCCAGGGGGAGGCAGCTCGGTGTGCTACACCCCGGAGCTCCAGGGCATCTCCCCGTACCCCACCACCCAGATGAGCTACAGTGCCTCCTCCTCTCCCCTCCCGTCGGTTACCCCCGCCAGGGAGGCTGACCCCGAGGAGGAGAGCCTGAACCTGGAGGGGCTGGTGGCCCACCGCATAGCTGAGTACAACGCTCGCATCCGGGGCATCTCGGCGAGTATGAGCCCCCAGCCCCAGCCCCGCGAACGCCATCGCTCCTATTCTTTTTCTGGGTCAAGGTCACACACAGCAACCCCAGATGAGTCCGGTTCATCCATGCGTCGCCGCACGACCAGCGAGGGTCAGTACCACAACGGT
CACGAGGATCGTCCAGCTCACGGGAATGCCTCCCGCACCCCTGTCTCGCCAGAGTTTGTTACTGTTATCGCCTCGAATCCAGGAGGCCGACCAAGGGAGGTTCACATGCACAGCTATCGGGAGGCGTTTGACGACACCCCAGACGGCAGCGGTGGCGCCCCCACCAGCCCAACCCCCAGCGCCGGTGGTCGCTCCCCGCCAGGCTTGGCCAAGACGCCTCTGTCAGCCCTGGGGCTGAAGGCGCAGAGCCCCAACGATGTTCACATGCAGCAGAGCAGCTCCGAGCCGCGAGGCTACATTGGGCCCGTGGCACACGTTGGAGGGAGGGGTCTCGGCATGTCCCCTAGCCACCAGCACCCCCTGTACCCGTCTGAAGCTATGGAGAGGGCGGCACCCCCTGCCCACGGCATCAACCCCCCGCTCTCACCCCTTGGCACCAGCCACCACCCTGAGGGACACTTCTCACATCCTGACGGCTCCATGCGAGTGGCCAGTCCCCCTGTCCCTGTGTCCAACGTGGGCTACCCGCCCAACACCACCGAGCTCACGCACCCCCACTTTTACCCCGACCCGCTGGGCTACCTGGATCCTGAAACGGCCACGGTCAACATCATGGGCGTCCATCGTGTGCCGGGCAGCCCCAACACGCTCCACCGCACCGTTGCCACCAACACCGCCCCCAGCCCCGTCCTCCAGCGCCGGCTAGCCAATCAGAGCCCAGTCACCGGGCACCGGGTCCCCCCAGCCAATGGCGGCGACCCCAACAGCCCTGTGCCCGCGCGCCACATGGGTGCCACCAAAGCGGTGCCCCAGAGCCCCACGATGGGCCGCCACACTCAGAGCCCGGGCAGCGCCGGAAGCCTGAGTCCGGAGAGGAGGCCCAGCAGGCAGGCCAGCCCCGACGAGAGGCCCGGCGGGCGCCAGTCCGGCGCCTCTGGAGGTCACCTGTATGGCGCGGAGCCAGGCTCCCAGCCCCTGCTGCCCGATAAGAGGCCCAGTGCCACCCCAACTGAGGGCTCCATGAACAGGAAGATGTCCTCGCCAGGGCCCAGCGGTGCCAGCACGCCCGTCATGCCCCCGCACGCAACGTCTGAACCTGCCATTGTCTCCATCTATGCTGATGGACCACCAGACATCAAGCTCAACGTAAAGTTTGTGCAGGACACATCCAAGTTCTGGTACAAGCCAGAGATCTCCCGGGAGCAAGCTATCTGCGTGCTGAAGGACAGAGAGCCTGGGGCGTTTGTTATCCGAGACAGCCACTCCTTCAAGGGGGCCTACGGCCTGGCCATGAAGGTGGCCTCACCTCCACCCACTGTGCAACAGAACAAGAAAGTGGGAGACATCACTAACGAGCTGGTTCGTCACTTCCTGATTGAGACTAGTGCTAAGGGTGTGAGGCTGAAGGGCTGTCCCAACGAGCCCTACTTTGGCTGTCTCTCTGCATTGGTGTACCAGCACTCCATGACACCCCTGGCTCTCCCATGCAAGCTAATGATCCCAACCCGAGACCCGAATGAGGAAGCCATTGAGTTAGCCACCCCAACAAGCTCCACCATTGACCTACTGAAGCAGGGTGCAGCCCCTGTCGGTCCCCTGACAGTTTGTCCCTCTTATGTCACCGTAGGGCCGAAGGTTCCTGATGAGTCACAGGCATGCAATGTTCTGTATATTAACTCGGTGGAGATGGAGTCCCTGACAGGCCCCCAGGCCATTGCCAAAGCCATCAGCGAGACGCTGGCGGCCCAGCCACTGCCCAGTGCCACTGTCGTCCACTTCAAGGTGTCCACCCAGGGCATCACCCTCACCGACAATCAGAGGAAAATCTTCTTCCGGCGCCACTATCCCATCAACACCGTCACCTACTGTAACCTTGACCCGCAGGACAGAAAGTGGAACAAGACAGAGGGTGGAGCGGCTAAGTTGTTTGGATTTGTGGCCCGGAAACAAGGAAGCACAACAGACAACGTCAGTCACCTGTTTGCCGAATTGGAGCCAGA
CCAGCCGGCCAGTGCCATTGTCAGTTTTGTCTCCAAGGTCATGCTCGGCAACCCCAAACAGTGAAGACTGCCCTGGCAGACATTTTGTTTTTTCTCTAAACTGCGTGTGTTCTTTTTTTCCTCCCACAAAGACACGTTTTTTCATGCCCTTTTTGTGTGGATATATTTTTTCATAAAGGTCTCCCCGCCCCCGTCCTTCTTTCGAAGAGATGGGAAGGAGGAGTTGAGTAAAACTGTTGACTTTATTTTATTTTTTTTTTCTTTAAGTTTTCAAGGTGTTGATTTTTCCTTCAGTGAAGTAGGAGAACATTCAGGATGGAGTCTATGCACGTGCAGGAGAGCTCAGAGGTTTTTCTGGAAGAGGAAGGGGAGAATACTTCTCCCAGTGGTTCATCCAGACTTGAAGAGAATTTAGGAATTAATGAGTTTTAAAAGAAAGACAAGTGAAGAAACAAAAAAGCAACAAAGAATCATTTTTCAGATAGAACAACCAAAGGTAGTGTTCAGAACAAGTATGCCATTATTGGACAATGTATTCCATTTTGTTTTGTAAAGGAATTTTACTTTTAACCAGACTGTCAAAAAAGTACAAAATCCCTCTGGACAAAAAAAAAAGATTTTTTTGTCTGTCTCTGTGACTTCTTCTTTCAAAAAGAACATTGAAAAAAAAAGAAAAAGTATTCAGTGACGATATGCATGTTCGCTTGCAAATGGTCCTTAGCTGCTTCTCTAACCCTTCGTTGTTGGTCAAGACTGCTCTCTTTGTAGACACTGGTGGACTCGAGATTGTAGGATGCTACCAGGTCTACCGATCACAACACCTACACACACAGACACCAGTTCAGTTGACCAAACTGCATATCAGGAAAAAAATTGAAAAACACTGTGGTCCAACATCAGCAATAATGTCACCCAGGCCCCAGGCTCAACTAGTCAAACTCAGAAAGAGGGGGAACTGTTGGGGTGGAGAGGATTGTGGATCGGCTGCTCTGGCCTGTAGATGCAAAATGTGTGTGACTGCACTGTATCAGGATGCAGGTGAGGATACAAGTCTCAGCTCATGCACAGAGCCTGTAAAGCAGGAGAGAGATGTTCTACAGGTCACCTCATACACACACAGACACACACACAGACACACACACACACACACACACACACACACACACTCACACACATACACACAATTACTGTACACACACAGAAATGTGCACATCTCCCTATAATGACCCACACTGGACACTGGAGGGGTGAACAATTCATCGCCTGGATGGACCAACAGCGATGCCCCCGCATGCCGTAGTGCAAAAGTAGCTCCTTTAACCTTTAACCTTTACCCTTCAACCTGACTCAATGAACTTTACCCCCCAGCCCCCCACTATCCTCTGAACGCAGATCACCCCTTTCCCCTGCTGTAGGAAAGAAACAAAAAAAGAAGAAAAATTGCTATGGCGACACTGATCGCTAGAGACTTCAACTGCATGTGATGCTACCTTCAGGTTTTTCTTTTCTTTTCTTTTTTACTTCAAAAAAAGGGTCTTACATCTTGTTGAAGTTCGCTATGCTCTGTCTTTATCTTTGTCACACACACACACACATACTAACACACACACACACACACACACACACACATACTAACACACACACACATCATTTCCTCTCCCGAGTGGAGTTTTATTTCAGCCAAATACACATTAGGCAATGTCTACCTTTTCTTTCAAGAAAAAACAGAGTTGCTTTCTGTTCACACTGCCCATTACCACACTTCTTTTATTCACTGTGTGAGAGCGTGGCTTAAAAAAAGAAGACAACATAAAGAAAAAACAATACACAAAGCCCAATCTTCATAAGCTATTGAAAAAAGATAAACATGACTATAAATAATGATGACTACATATGTATTACTATAAAAAGGTGACTTTAATGAAAATATTTATTTTTGTTGCTCTCTCTTGCTTTTGGGTTATTCATGCAGTATATTGAAATGACAAGATATTGTATAG
TCAACATTCAAAACATCTGAGACTACATGGGGGGGAAATTATTTTGGTTAAGAGTTAAAAGTCATGAGTGAAAAAAGACATCTTGTGTGTCCAGCTGAGAGTCACTTTGTTTTGCGTGTGGCCACTGCTCCATTTTGTCTCATGTTGAGGTGTTTGAGGTGTGTGAGGGGAAGACATTCATGTATAAAAAAAAACACAATGTTTTTATTTTTGTTTTTATGCATTTTTTTATTTGTAATCCATCAGTTTGTGCCGTTGCAGGATGATAACGCTGTCTGTCAGTTGTGTGTGTGATGGAGATGGAACTAGAAGTCTGCCAGCTACAGACACTAATTTGCCCATCAAGAATGTCAAGAGGAAGGCACACAAATGTGTTTGCCAAAGAGGCAAACTCAGAAGATCCACAGCGTAGGCTACCCCATCTTTATAATTGTATAGCACTTACAGACTGCCAGTGCCACCCTAGTTAAGTTAAACCAGAATCTAAACATGTCCTCATGACTTTTCTAAGGACAAGCTACAACAGATGTCGGTGCAGTTCTTACATAGCTTCTGTTGTTGGGATTCAGTATTGGAAACGGTTGAATAATATCTCGTTATTATTAGGGGAAGAGCAGGTGTCATGGCTGCCAAGAACCTTTGTTGTAGATCATGCCGCTATTAAGCACCATACTCCATTCAAAACCACTATAGCTGTACACATATATGCAGTTTCTTCGCCTTTTTCATGTAACAAGACCTCAAAGCGAACACAAGATAACAAATGATACTGACTGTCCTTTGTGTAACATAAAAGTATGTATTTATTTCTGTTTTTAAATTATGTTTTGTTTGTGTTTTTTTCACTCACCGGTTGGTCTTCCCCATAGTCAGGCCCAGTGCTTTGGTGTCATCAGTGTTACCCAGAATGCTCTAGACTCGCAGGCGACCCGGCGGACATTTTCCTCGGATGTTTGCCTGAAGTCAGTGAGTTGGCTTTGCGAAGATGAAGTCTGGGGTTTGAATGTGTGAATGTACTACTAAGGCTGTACAGAGCTTCTGTGGGATTTATGTGTTTTTATTTTATTTTATGTTTATTTGTGTTATAATGCAATGGCTTTGTTCCTGAGGAGAAAAAAAAAAAAACATTAAAGCAATACAAACCAGTTA\n>XM_031525737.1 PREDICTED: Punica granatum senescence/dehydration-associated protein At4g35985, chloroplastic-like (LOC116196154), mRNA 
\nCTTTCGAATCAAACACAGCACAACTTCCTCTGTAAGCCATTCCTATTCCCTTGCCAGCCAATCACAATGTTCTTCTATTCCATGTCCTGACAAAACCAAACACAGCTCTCTCCAAGAACAGGTCCACTTCATCTGCGGGAGAGACAGAGAGGAAGAGGAAGATGGGCTGTTTCAGCTGTGGAAGCAGCAGAAGCAACAGCAGCAGCAGAGGAGGTTCAAATTCTACGTACTTTGATCCTTATGAGACAACCCAGCAAAACTCGGAACCCAGAACGACCAAGCAGCAAGTTCTGCTCCAAATCCCGTCATGCACCGTCCACTTAATGGACCAAGGAGAAGCTTTGGAGCTCTCCAGTGGCAGAGAGTTCACCCTTCTCACCATCTCGGACGAGAACATCTCCCTGGCAACCATCATAAAGGTCGGTGATGACCTCCAGTGGCCGCTCACCAAGGACGAGCCGGTCGTGAAGTTAGACTCCCTTCACTACCTCTTCTCCCTGCCCGTGAAAGATGGTGACCCGCTCAGCTATGGAGTCACTTTCATGGAACAGTATGTAAGCTATTTGGGGTACTTGGACAAGTTCCTTGAAGAACATTCGTGCTTCTCTTCTTCGGCTCCTGCTTCTTCATCTTCATATTCTGCACCGAACCGGAACCTTAACTGGAAGGAGTTTGCCCCGAAAATCAATGACTATAACAATGTCTTGGCTAAGGCCATTGCCGGAGGGACTGGTCAGATTGTTAAAGGCATCTTTATGTGTAGCAATGGCTACACCAATCAGGTCCACAAGGGAGGAGAAATGATCATGACTAGTGTTGTGGAGCAGAGGAATGGTTCGAGTTACCATGAAAGCTATGGAGGCAGCAATGGGGGTGCCCAGAAGAAGAGCGCAGTCAATATAAGCCTGAAACGTGTAAGAAAGGTGTCTAAAATGACTGACAAGATCAGCAAGAAACTGCTAGATGGAGTTCAATTTGCCACTGGATCGGTAATGGCGCCGATGGTGAAGTCCCAAGCAGGGAAGTCCTTCCTAGCAATGGTTCCAGGAGAGGTTCTGCTGGCTTCACTTGATGCTGTCGATAAGGTGTTAGATGCAGCTGAAGCGGCTGAGAAGCAAGCTTACTCGGCTACCTCAAAAGCTGCTACGAGAATGGTCAGCAGAAGGTTTGGAGAGAGTGCAGGGGAGGCAACAGAAGATGCGCTTGCAACAGCAGGTCACTGTGCAAGCACTGCTTGGAACGTCTTCAAGATCAGGAAGGCCGTCAATCCGGCATCTTCCGTCTCCACTGGGGTGCTAAAAAATGCGGGCAAGGCCAAGAATTCATACTCTTGAATTCAGTCCGATTCAACTCTATTAGTTAAAGTCTAGATGGACTAGAAACAGCATGCTCGGGTTTGTAATGGAGTCTGGAATATCTGTCTAGAACTAACTGAGAATGATTTGGTATATCATTTGCATATTGCCATTGCTGCTTCTTTCCTCAGATAGATCTTCCAATGTATGTCTGCACAATTTGTACGTAAGACATTTTTAATGCGTTTGAATTCAGAGTTAAAAAGTAACTTTAATTTTGATTTA\n>LC139547.1 Uncultured bacterium gene for 16S rRNA, partial sequence, clone: SdRy21_50 
\nGTGCCAGCAGCCGCGGTAATACGGAGGGGGCAAGCGTTGCTCGGATTTACTGGGCGTAAAGGGTCCGCAGGCGGTTAAGTAAGTTAGATGTGAAAGCTCAAGGCTTAACCTTGAAACTGCATCTAAAACTGCTCGACTAGAGTCCAAGAGGGGTCGGCGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGGCCGACTGGCTTGGAACTGACGCTCAGGGACGAAAGCGTGGGTAGCGAACCGGATTAGATACCCGGGTAGTCCACGCCCTAAACGATGGATGCTAGGTGTGGGGATTTTATCTCCTTGCCGAAGCTAACGCATTAAGCATCCCGCCTGGGGAGTACGGTCGCAAGGCTGAAACTCAAAGGAATTGGCGGGGGCCCGCACAAGCGGTGGAGCACGTGGTTTAATTCGATGATAAGCGAAGAACCTTACCAGGACTTGACATGTTTACCTAAGCCGATGCGAAAGCATTTGGTGGTTTTGAGCTTGCTTAGAACGGTATTCACAGGTGCTGCATGGCTGTCGTCAGCTCGTGCCGTGAGGTGTCCGGTTAAGTCCGGTAACGAGCGCAACCCCTATTTTTAGTTGCCAGCATTTCGGATGGGCACTCTAAAGGGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAAGTCAGCATGGCCCTTATGTCCTGGGCTACACACATGCTACAATGGCTAGTACAATGGGTTGCCAAATCGCAAGATGGAGCTAATCCCATCAAAGCTAGTCTCAGTTCGGATTGCAGGCTGCAACTCGCCTGCATGAAGCTGGAATCGCTAGTAATCGTGGATCAGCATTGCCACGGTGAATACGTTCCCGGGCCTTGCACACACCGCCCGTC\n>XM_007532958.2 PREDICTED: Erinaceus europaeus C1q and tumor necrosis factor related protein 1 (C1QTNF1), transcript variant X1, mRNA 
\nCCCCCCCCCCCAGGACTTTTCATTTGTCCCACTGGTTCTCCTTCCACAAGTCTGTTTGGACCTAGAAAAAGCTCAGCTGCTGGGAGATGATCTAACCAGTGTCCCAAGAGCCCGTGGCAGTGGGCGCTCCCACTCAGGAGTCAGAGGCTTGGAGGGAAAATGGGCTGCCAGGCACTGGGATTCTCTCTGACCAGCTGCCTGCTCCTGGCCTTTACCTGCAGCCTGGTGCTGAGCCGTGTGCCACATGGACAGCCAGACCCTCAGGAGCAAGAGGGAACTGGGGAGCCACCATTGGATCACACTGAAAGGATTGAAGAAAATCATGAAAAATACAGCCCCAAGCAAGATGAGGAGCCCTCAGCAACCCAGTGTTTGCGCTGCTGTGACCCCAGCACCCCCATGTACCAAGCCATCCCAGTGCCCCAGATCAACATCACCATTCTGAAAGGTGAGAAGGGAGACCGAGGGGACAGGGGCTTGCAGGGCAAATATGGCAAGACAGGCTCTGCAGGTGCCCGGGGCCACATGGGCCCCAAGGGACAGAAGGGGTCCATCGGAGCCCCTGGGGACCGCTGCAAGAATCACTATGCAGCCTTCTCAGTGGGCCGCAAGAAGCCACTGCACAGCAATGACTACTACCAGACTGTCATCTTCGACACGGAGTTTGTGAACCTCTACGGCCACTTCAACATGTTCACAGGCCGGTTCTACTGCTATGTACCTGGCATCTACTTCTTCAACCTCAACGTGCACACTTGGAACCAGAAGGAGACCTACCTGCATATCATGAGGAATGAGGAGGTGGCAGTGATCCTGTACGCCCAGGTGAGCGACCGCAGCATCATGCAGAGCCAGAGCCTGCTGCTGGAGCTGCAGGAGCAGGACGAGGTTTGGGTGAGGCTCTTCCGGGGGGAGCGCGAGAACGCCATCTTCAGCGATGAGTTTGACACCTACATCACCTTCAGTGGCTACCTGGTCAAGCACTCCACAGAGCCCTAACCCATGGCACCTCCTCATCTCCAGCTTGCCTGTTCTCCCACCCCACTGGGTTCCAATGGTCCAGCATCAAAAGGCCCCCTGGCCCTTCACCTCCCCCACTACCCTGCTCCCTGCTCCCCAGCTCTGGCGTTCTACCCCACATTTTTCTTTAGCAGGGACAGGAAGTGAATGTTGCTGTGTGTTCTGGCCCTCTGTGGATGAAATCACAGGGGCAAATGCCCCCTCTGGAATCACATCCTTAAGTGGCCCATGGCCCAGGCAAAACATGTCTGGATATGGCAAAGAGTCTTCTTTCCTTTTCTTTTTAAA\n>XM_032266396.1 PREDICTED: Sapajus apella transmembrane protein 108 (TMEM108), transcript variant X7, mRNA 
\nTGTGTTTATGTAAATATTATGTCAGATTGTCTTTATTTTAGCTGTTAAAGGTACTAATTAAATATTTGTTAATGAATTATAGTGCTGTATTTATCAAGTTCTGATTTACAGGGTAAAAGCACAGTTGACCAAATTGTGTGAAACCTTGAACCTCAGACCCTCTGACGTGGGCTTACTGCTGCATTAACACCCTGTGCATCTGGTGGTAGCTTCCAAAATGATAGCTGAGGGTCTGAGTCGAAATAAATGGCTTTTAGCAAGTGTTGAACTTTGAATGTGCTATTTAACCTCTGATTAATTGATTACTCAGCTCTGAATATGAGAGGTGTATAGCTATCCCTTATCTCACTTAAGTGATTTGAGCATGGATGCTCCTCTCATTTGAATACAGTTTTTGGGGTGGGTGGGGGTGATATCAGATCCCAGGGTACATGCTATGATAATGACAGGCTTAATTATCACTCAGTATGGTTTAGGACAAAGGTTTTCTTTTGATCACAATATTAAGAAACCTTTCTTTAACAGATAGTTTTACTTGTACGTATGAAGTATATATATAAATTTATCATTTCCTATATATTTGATTCACATTCAGAGGGTATTTAAAATAGTATCTTCTTCAGAATGTATATGTTGGGATTATATATTACTGTTTCTTTCCTTTTTATGTAGTTTCTTTTTGTGGTCAGGTAAAAGAAGACTAAAGGGATGTGATATTTAGTCTCAAATATTTGAAGTATAGTCACTGTTCTGTTTCAGGGCTGTTTCCCTCTATCAATTCCTTTGATATGGAACTCCAATGTCATTTTTACTTTACAATTGATCACATGCTGGCTCACTGACATCAATTAACTAATTTGAGGCAAATTTTTAAACCAAATGCCAAATTTTAATTTACTGAGAGAATATAATCTAATAAGAAAGACTACCCTTGGGCTCTTCACATGGTGAACCCTAGTGTGGTTTTGATAAAGAAGCCCAAGTATATACTAACTATAATCTTTTCTTAAAAAAAAGTGGTGTTCTTATCTAGACCCTCCAGAATCTAGAGTAGCATCGTCCAATAAAAATGTAATATAAACCTCAAGTATGAGCTTTATATGTAATTTTAAATGTTCTAATAGCCACTTTAAAAATGAAATGTGAAATTAATTTTAGCTCTATATTTTATGTTGCTTAATATATGCAGCATATTATTTCAACATGTACAGTTGACCCTTGGTATCCATGGAGAATTGGTTCCAGGACTGCCCACAGATACCGAAATCTGTGGATGCCCAAGTCCCTTGTATAAAATGATGAGGTATTTGCATATAACATGTGCATATCCTCCCATATATTTTAAATCATCTTTAGATAACTTAAAATACCTAATACAATGTAAATGCTATGTAAATAATTGTTGTACTATATTATCTATATTGTTTTTTGTTTTTTATTAATTTACTTTTTAAAAATATTTTTACTGGGCAGTTGGTTGCATATGCAGAACCCATGGATATCGAGGGTTGACTGTAACTAATATAATGAATTATTAATGAGATATTTTGTATTTTTAAAATACAAAGTCTTGAAAGTCCAATTGAGATGTGCTGTAAGCATATTTTACACTTATAGCACATCTCAACTGGGACACTGAGGTTTCATGTACAGTACTTGATCTGTACTTAAATTAAAACTTACAGTAGAAAAAATAGATTCACATACCCAAGTCATTCCAAACATGCAAATCAGTTGTCCAGTAACTGAATCGGTGTCCATTTCTAAATTTAAATTTAACTTTAATTAAAATTAAATAAAATTTAAAGTAAAATTCAATTCCTGATTGACACTAGCAATGTTTAAAGCACTCAGTAACCACCTGTGGAGTGGCTGCCATGTTGTGTTGGACAGCACAGAAAGGACTGCTTTCTCTAGCCTTTTCCTTCACTCCTGCATGTCTCAGATGGGAAGACTTGTGTGAGACCTCTGATGGGAAGAGAATCTCATTTTGAAAGT
GTGGAACCACAGACAAAGAGTTGACTTTCTTAAAAAGAAGTTTCCATTCAGGCTATATTAGAACCTGCCTGGCAAGGAGTTATCTGTCTAATATACCACATTATCTCCACCCTTGTTCCTAAATACACCCCTCATTGTCTCCCCAACAGATAAAAATATGCCAACCTTGTGTCAAGGTTGCCTCCCTGATCCCCTTGTCCTCCACTGCAGGCTGGCTCATTTCCATTACGTCAGTGTATTTCCTGGTTATAGTCCTCCTTTCTCATTGTTTCAGTTTCCACATTTGGCCTTAATTTCTATGATACCTCAGTGAAGCATTCAAATGTTTAAATTCCAATTTAGTTCTTAATTAAGGTCATGTATATCAAGGTCAATGTTATGTTAATTTGGATAACAGACATTTCCTTTGTCCCTTGCTCCAGATTTCTAGAGTGGCTGGGCTGAGAAACTTTACTTCCTGTTCACCTAGACAGAATCATGAATAAACTGGAGGATAAGCAGGACCAGATGATACCATGAAGAGAAGTTTACAGGCCCTCTATTGCCAACTGTTAAGTTTCCTGCTGATCTTGGCACTGACCGAAGCGCTGGCATTTGCCATCCAGGAACCATCTCCCAGGGAATCTCTTCAGGTCCTCCCTTCAGGCAGTCCCCCAGGAACCATGATGACAGCACCCCACAGCTCTACCAGACACGCTTCTGTGGTGACACTGACCCCCAATCCCAATGGACCCCCCTCACAGGCTTCAGCTCCCATGGCAACACCGACACCCCATACAGAGGGGCACCCTCCTACGCACACCATCTCCACCATCGCTGCGACAGTAACCACCCCCCATTCTAAAAGCTCCCTACCCACAGGGCCCTCTCCAGTGGCCACAGCAACCACATCCTCCCACCCAGAGGGCCGCCCCCCGGGGCAGGCTACTCCCACCATCCTGCTGACAAAGCCACCGAGGGCCACCGGTCGCCCCACTGCAGCGCCCCCACGCGCTACCACACGCAGGCCCCCCAGGCCCCCAGGCTCCTCCCGAAAAGGGGCTGGCAATTCATCACGCCCTGTCCCACCTGCACCTGGTGGCCACTCCAGGAGTAAGGAAGGACAGCGGGGACGAAACCCAAGCTCCACACCTCTAGGGCAGAAGCGGCCCCTGGGGAAAATCTTCCAGATCTACAAGGGCAACTTCACTGGGTCTGTGGAGCTGGACCCTTCTGCCCTCACCCCCAGGACCCGGCTCTGGGGCTACTCCTCTTCACCACAGCCCCAGACAATGGCTGTCACTACAGCGCCCAGCAATACCTCGTGGGCACCTCCCACCACCTCCCTGGGGCCTGCAGAGGACAAGCCAGGCCTTCGCAGAGTGGCCCAGGGAGGTGGTTCGACCTTCACCAGCCAAGGAGGGACGCCAGATGCCACAGCAGCCTCAGGTGCCCCTGCCAGTCCACAACCTGCCCCAGTGCCTTCTCAGCGCCCCCACCGCGGTGACCCACAGGACGGCCCCAGCCATAGTGACTCTTGGCTTACTGTCACCCCTGGCACCAACAGACCTCCATCTGCCAGCTCTGGGGTCTTCACGGCCGCCACGGGGCCCACCCCAACTGCCTTCGATGCCAGTGTCTCAGCCCCTTCCCAGGGGATTCCTCAGGGAGCATCCACAACCACGCAGGCTCCAACCCATCTCCCCAGGGTCTCAGAAAGCACTATTTCTGGAGCCAAGGAAGAGACTGCAGCCACCTACACCATGACCGACAGGGTGCCCAGTCCTTTCTCCACAGTGGTATCCACAGCCACAGGCAACTTCCTCAACCGCCTGGTTCCTGCCGGGACCTGGAAGCCTGGGACAGCAGGGAACATATCCCACGTGGCCGAAGGGGACAAACCCCAGCACAGAGCCACCATCTGCCTGAGCAAGATGGATATCGCCTGGGTGATCCTGGCCATCAGCGTGCCCATCTCCTCCTGCTCTGTCCTGCTGACAGTGTGCTGCATGAAGAGGAAG
AAGAAGACTGCCAACCCAGAGAACAACCTGAGCTACTGGAACAATGCCATCACCATGGACTACTTCAACAGGCATGCTGTGGAGCTGCCCAGGGAGATCCAGTCCCTGGAAACCTCTGAGGACCAGCTTTCAGAGCCCCGTTCCCCAGCCAATGGCGACTACAGAGACACTGGGATGGTCCTTGTTAACCCCTTCTGTCAAGAAACACTGTTTGTGGGAAACGATCAAGTATCTGAGATCTAACTGCAGCAGGCTTCGCTTTGCTATTCCCTATTTTTCGTCTCTAAATTATAAATATACAAATATATATATTATAAATATAACCTTTGTGTAACCCTGACTTAATGAGAAACATTTTCAGCTTTCTTTTCCTATGAATTGTCAACATCTTTTTTACAAGTGTGGTTTAAAAAAAAATTTACAGAATGATCTGTGGCTTTATAAAATAAAGGTATTTCTAAGCAAAGCAGTTGCATTGATTGCTTCTCTTAATAACTATTTTTGAGCACCTGGGGATCCCAGGAACCCTAGTCAGGTGAGGTAAGAGACTGACCTCCTGTAGAAGCTCAGTGTTACAGTGGTCAAGTGCACAGTTCTTTGAGTGATTCTTAAAGCTCTGGTTCCTCTTGATTTGGCGTGGCCCATTTCCTCCCTCTCATACGCACACCTGTAAAGGGAACTGGGCCACCTGGGGGAAGATGGCAGACTCATGCACAGGGCAGGAAAAGGGAACACCTCATCACCCCCAAGGATGGGGGCCCTGGAGCCTCACGACACCACCATTGGATGTCATGTTTAAAAGTTGTAGACAGCAGACAGAAGCATGGAGTCCTTGGGAATCCATGGAGGACATCAAGGCATCCCAAGGCCACATCCCCCTAACATTGCTTCCACTGCTAACAACAAGACTGCCTTTCCCTGGTGGGAAAATGCTCCCTTCATGCCCGTTCCTGCATCCCCTCCAACGCTCAATCTGCATTAAACACCCGTGCCTTTCTCTTGGAGAGGGTTTAGATGCAGATCCCAGCCTTGGAGCTTTAAAATGCTTGCCCTTCTTCAAGGATCAAATGTTTATTGGGGTTTAGCTTTGTTTTCTCAAAAGGCCACGGTATTGTGCCCCTAAGGAACACGTTTATCTAAGAAGCTTTGAGGTAGCAGAGCTATGATTTTTGAAACCTTCCTCCTGCAATCTTTAAAAAAAAAAAAAAAAAAGATTGCCAAGCAAGTCATTTCCGAGAAGACATCATTACACTCCTACTTGCCCCTGCAAACCTGCTCGAAGCACCAGCCGGTGGACTTGCCACGCAGCTCGCAGCTTCCACTGCTCGCCTCGTTCCCCACTGGCTGGCTGCCTCACCGTGCCGTGTCCAGCGTGGCCAACAGGGTCAGACCCTCAGAGATGCCCAAGAGGCTGCCAGAGGTGGCTGCTTCTCTATTTTTTCCTGATCGTGGCTGAGAGAGATGATTACTGCTTTGACACTTTCTTTCTCTAAAATAAAGCTAGTTTGATAGTATATTTTGAATATAGATGCTCTTATAGTTGGATTGGGAATTGAACTCGAATGTTGATTCATATGTTTGTGTTGTTGCTGTGGTCTTTTTATCATGACTTTTTTCTTTCTGCGTTTTCCTTAAAAAAAAAGATGGCCTTCAAAAGTGTGTTCTTAGTGTTGTATAAACCTACTTCATATGAGTTCAGTTGTTGTCTCTCTTCAAAGACTCTTCAACCCACAAAGAAGCAGGTTAAATGTTTCTCTAAGTTTAATTTTCTAGCGTGTTGTTGTCTGACCTTTTTAACCTTACCATAATATTTCTGTTAACTGTTACATTTAATATACCAATGTGTGTGAGTATACATAGAGAAAAATCTGTAAAGTAAAATTTATATATAATATATGTAATCCAAGATACATATGTTATATATACACGTACGTGGATGTATGACTTATTTTTCCGTATCCACAGATTTCGGCTACCATGGATATATAAATAAACTTATT
TTGTTAGCCAGAGGA\n>XR_006349495.1 PREDICTED: Manihot esculenta small nucleolar RNA SNORD34 (LOC122722555), ncRNA \nGGAGGCCTAGGATGATCTTAAATTTGCCTACATTGTCAGAGTGTTTAAATCATGACAGATTATTGAATGATTCTGAGGCCACT\n>XM_008548960.2 PREDICTED: Microplitis demolitor basic salivary proline-rich protein 2 (LOC103571010), mRNA \nTATTGTTATGATTATTGGCGGCCATATTTGAAATTTATTCGAGTTTCCAATGTAAAAAACGCCCGAGCTTTAGTTTGGTTTTCATACCCAAGCAAATGTTTGGTCACTAAAAAAAAAGGACTCAACTACGTAATTGTCAGATTATTGTCATAAATCTCATTGTAATAAATTACTTGAAACGTGTGGGTGTGCGGTATTGTATTGGTGATAAAAGAGTAAGAAAAAAAGTAAAACGTGGTATTGTTTTATTAAAATATATCACCAGCCACTAAATTGTGGTATATATATTTAGTTTAGCTTTAAGTAACTAAAAATGTCAGCTACTTTTGCACAACGCGGTCGTGTACCGCCAACTCCAGCTCAAATTCAGAAGATGCTGGACGAGAATAGTCATTTGATACAGACGATACAGGAGTACCAGAATAAAGGAAAACCTCAGGAATGTTTACAATATCAACAGATATTACATCGGAATTTAGTTTATCTCGCTTCTATTGCTGATGCGAATCAAAATATCCAGGCACTGCTACCGCCGCCACAGGGTTTGCCGCCGATGACAAATGGTCCGCAGCATGGAATGATGGGTCCGCAAGGGCCACCGAATGTCGCTCCGGGAACTCCAGGGCCTGGAGGTGAAATGCCACCGAATCCTCCGCAGCCTATGCCAATGCAGGGATTTAATCAGGGACAGCCGATGCCTCAGGGTGGCTACCGTGGTCCAGTGATGGCTGGACAGGGTCCTCCGATGAATAGAGCGAACCCTGGACCTGGGCCTCAGCAGTATCGAGGTGGGCCACAGGCTTATCCGCAGCAACCTGGACAGCAGGGGTATCCTGCTGGTTATGGGGGACAGAATCCTGGTGGGAATTATCCACAAGGTCCTCAGGGAAGTGGTTATGGAGCTGGACAGCCTAATCAGTACCCGCCTAATGCACCGCAGCAAGGCTACCCGGCGTCAGGACAGCAGAATTATGGGCCTCCGGGTTCTGTTAATAGTTATGGAGGTCAACCGGGTGCTTATCCGCCACCGGGAGGTAATCAGCCCTCTGGTGGCTACGGTCCTCCGCCGCCGAATCAGCAAGGATATCCCCCGCCTACTACGCAGCAAAACTTCTCGCCTAATCCTCAGCAGCAGCAGCAACAACAGCAGCAACAACAACAACAGCAACAGCAGCAGCAACAACAACCTGGACAGTATGGTAGTCCTAGTCCTCAGCCAAACTATCAGCCTCCTTCCCAAGCTCCTAATCAGAATGCTTATGGTCCAGGTCAGACTCCCGGTAATTATCCTCCTCAATCCTCTCAAGCTTATCCTAATAATGTTCCTCCACAGAATTATCCTCCTCCACCTCCGACGTCTAATAATGTTGCCCAGCCTAGCCAAGGACCACCACAGCAGAGTCAAGGTGGGCCGCCGCAGAATTACTCAAGTCAGCCAAGTCCTGGTGGTGGACCACCAACTCCATATGGACCTTCATCTACATCACCGCCATTTAGCACCAGTAATGTGAGTGGAGTTAATACGTATGCTCCTAGTAATCAACCTACGAGTACACCTTCTGCTTCGACTCAGACTTACCCACCATCCAGTGGACCTCCACCAGCAACTTCGCAAGCTGGTAGTTATGTTCCTGGGCCTACTCCTTCCGGGTATCCGGTGCATCAGCCGTCGCATCAAGCTCATGGTCCAC
ATGGGCCTCATCCTGGCTCTCATCAGATTCCTCATCCTCCGCCATCACAGTCGCAACCTGGACCGCCACCTCAGTCGCAGCCACCTGGTCAATCGCAGCAACCTTCTCAACAACCGTCTCAGCAGCAGCAGTCTCAGCAACAACCACCAGCCCAATCACCACAGCAGCAACAACAACAAGGACCTCCACCTCAAGGACCCCCTCAGCAGCAACAATCTCAGCAGGGAGCGCCACAGTCTCAACATCAACAATCCCCGAGTCCAGTTCCGAGTAATTTCCCACCAACTTCCGGACCAATATCACAGGGTCCACCCTCTGGGCCTCCAGGTCCACCGGGTCCACCTCAACAACCTCCTGGTGGATATGGACCTCCACAATCTCACCCAGCGACGACGCAGACTTACGTACCCCCGGGTTCTGGTCAACCACCACAAGGCTATCCGACTCACCCCCCATCTCAAGGAGGCCAACCGCATTATGGTCATCCACAGTATCCTCCTCAAAATTATCCGCCTCATCCTCCACCGCCTTCTGCTGGTCAAGGTTATCCTCAGTATCCTCCTCGAGGTCCCCCTGGTGGTCATATGCCACCACCACCGGGTCCTCAAGGTCCTCCGCCACCGAATCAGTATGCAGGGTATGGTTACCAACAACCTCCGCAGTAAATAAAAAAATAACGAGACTTTTTTTAAATAATTCGACTATAGGATTTGTGCTATTTAATGATGTGTAATGTAATGGTTTTTTGCATTGTAATTTTTATATTTTATATATGTAATAATTTGATGATATTGATAATTAAATAAACTGATTTTTTTGTTGTACTTGTGGGATCGTTTGTGGAATAAAAAATGATTTTTGAAATCTTATTAATTATTTTATTATTTTAATTTTAATGCTCACACTTCAGCTGCCCAATTTCAAAACACAGTAAGGGACAAATTTTTCAAAGTTGATTTTTTAGAATTTATAGTTCCAGTGGAGTCTTATGGACATAATTTATTTCATATTTCAAAAATTTTCTTTTTGTCAGTTACTGTGTTTTGAAATTGAGCAGCCGATTTACTCGTACATATTTCCTTTGATATTATTAAGGTAAGAGACCTAGTACCCGATCAGGGAACTAGGATTCGATCGTTTTATAAATTTGTATGTCTATATTTAGTAAATATAGATATACAAATATATGAGTGATCAAGTACTGGGTCTTTTACCTTATATTTATTATTTAATACTTGGTAA\n>JN883616.1 Uncultured bacterium clone 254_InIs3-B9 16S ribosomal RNA gene, partial sequence 
\nAGAGTTTGATCCTGGCTCAGGATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGAAGCACTTTATCACGATTTCTTCGGAATGACGATTTGGTGACTGAGTGGCGGACGGGTGAGTAACGCGTGGGTAACCTGCCTTATACAGGGGGATAACAGTTGGAAACGGCTGCTAATACCGCATAAGCGCACAGGGTCGCATGACCTGGTGTGAAAAACTCCGGTGGTATGAGATGGACCCGCGTTGGATTAGCTGGTTGGTGAGGTAACGGCCCACCAAGGCGACGATCCATAGCCGACCTGAGAGGGTGACCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCGACGCCGCGTGAGCGAAGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGAAGATAATGACGGTACCTGACTAAGAAGCACCGGCTAAATACGTGCCAGCAGCCGCGGTAATACGTATGGTGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGCAGGCGGTACGGCAAGTCTGATGTGAAAGCCCGGGGCTCAACCCCGGTACTGCATTGGAAACTGTCGAACTAGAGTGTCGGAGGGGTAAGTGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTACTGGACGATAACTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAATACTAGGTGTCGGGGAGCAAAGCTCTTCGGTGCCGTCGC\n>MZ592923.1 Lysinibacillus sp. strain KEI8 16S ribosomal RNA gene, partial sequence \nCTTGCTCCTTTTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGGCAACCTACCCTATAGTTTGGGATAACTCCGGGAAACCGGGGCTAATACCGAATAATCTCTTTTGCTTCATGGTGAAAAATTGAAAGACGGTTTCGGCTGTCGCTTTAGGATGGGCCCGCGGCGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCGACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGGCGAAAGCCTGATGGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAACTCTGTTGTAAGGGAAGAACAAGT\n>XR_004099807.1 PREDICTED: Ipomoea triloba uncharacterized LOC116026275 (LOC116026275), ncRNA \nTTTTTCCCATTAATCTGCAAAAATGAAGGCATTTTGATTAATAATTCAGGAGTGCTATGAAGGTTAGAGCCATACTTCGGTTGTGGAAAGGGAAGGCTCTTCCGAAAAAAAAGAGCAAAGAAATCATCTTCCACGACGAACAGGAATCGAGCTACATAACAGAGTAGTATGTACCAGTTGATATGTTGAAGGTTATCTCTATATTCCACAATAAAAAAGAGTATCCAGTAAAGGTCCATTGTATGTATCAGTTTCTTTGTTGAATTAAGTTCATTGTTCATATTAAATGAACTATTGAAAATATGAATATGTTCGTGATTTTTTTCTTTATGTTTTTTTTTTCTTTATGTTATGTCCATTGTTCATATAACAAAGTAGCATGTACCAGGTTTTGTTTCTTTAACTGTGTAGTTTAAGAAAAAGTTGTGGTTCTTCTCCTTTT\n>XM_029121761.2 PREDICTED: Esox lucius contactin 5 (cntn5), mRNA 
\nCCCCGCGCACCAGCACGCCGCAGAACAGAAGCTGCTGAGACCAACCGCCAGTCTGACGTGCAGAGTCAACCACCGAATTGTCATCTCCGCGGCTTTTATCCATTTCAAACGGCGTTCGGTAACTGGAAGGTTCCCGAAGTGTTGGCCAAGGAAGTCCAGAAAGCAACCGTCGGTGGAGAAATCGACACAAGATTACAGCGAAAGGAGGGAGGGATGTAGCTACTATTCACGTCGTCGTCTTATTCAGTAAAGACAGAGGAAAGGACCGGTTTGGAATCAGGCTGCTTTGGCATTCTGTGGTTCGGGGCGACGGAGACTGGTTGGTTACCGTTAGATTATCTGGGACTGGCAGTTGAAACAACTTGACGTTACGAAGGGAAAACCTGCATGTTCCCAGCTTTTGGCGGCACAGCTTTAATGAAGGATCACACCTGTTAACAACACTTGTGAAGGGGGCACCCACCTGAACGAGCATGGGGTCGCCGTGGAAACCACTTCTCCTGCTGTCCATCATCAGTGGCCTTTCAGACTTCGCCAAAGCTGTAGGAGGGAGGCAAGTGTCCTACGCAGCTGTTCTGAGAATGAAAGGGGACAGCTCATCATCACTGCTCAGTTCACGGAGCCGACATGCCTACAGCAGAGGACTGGTGACTCCTGATTGGCCGACGTCCTTTTCCAGCCAGCACCCGTCGCCTCTCAATCTGCTCAGCTATCAGGAGGAATACAGGAGTCAAGAGAGTGAGGAGTTCGGGCCAACATTTTCCCAGGAGCCAGATGACTCTATCTTTGCACTGGACTCTGAGGAGAAGAAAGTGATGATGAGCTGTGAAGCCAGAGGCAACCCAACACCTGCCTACAGTTGGTTCATTAATGGGACTAAGCTGGATGTAGAGGCAGATTACCGATACAGCTTGATGGACGGCAACTTGATAATAACCAACGCCAGCGAGACGGCAGATTACGGCAGATACCAGTGCATGGCGGAGAACAGCTACGGGATGATTCTGAGCAGGGATGCGCTCCTACAATTCGCCTATCTCAGGGCCTTCAGCGGCAGGACGCGAGGAGCCGTGTCTGTAAGGGAAGGACAAGGAGTGGTGCTCATGTGCAGCCCTCCACCTCATTCACCAGAGATTATCTACAGCTGGGTCTTCAATGAGTTCCCGTCATTCGTTGCCGAGGACAGCCGGCGGTTTATCTCCCAGGTAACGGGCAACCTGTATGTCTCCAAGGTGCAGCCTAGCGATGTGGGCAGCTACATCTGTCTGGTGAAGAACACTGTGACCAACGCCAAGGTCCTCAGCCCGCCCACGCCCCTTACACTCAGAACAGATGGTGTAATGGGAGAATATGAACCTAAAATCGAGGTGCATTTTTCCCCGTCTGTATTAGCAGCTAATGGAGTCACCGTGAGACTGGAGTGTTTTGCCCTGGGGAATCCTGTTCCAACCATCACATGGAGAAAGATGAACGGTAACATTCCTAAGAAGGCTCGTCTGAGGAAGTCCCAGGCAGTGCTGGAGATCCCAAATGTTCAGCTAGAGGACTCAGGCACCTACGAGTGTAAAGCAGAGAATCCCAGGGGAGGAACGGCCTTCAAGGGACACCTCCAAGTTTACACCCTGCCCCAGTGGAGCAGCAGGATAAATGACACCCAGCTGGACAGTGGGGAGCAGCTCCAGTGGGAGTGCAGAGCCACCGGGAGGCCTAGACCCTCCTATCGCTGGCTCCGTAATGGACAGCCAATTACACAACAGAGCAGGTTGGAGATGGTGAGTGGGGAGCTTATCATTCACAAGGTCCAGCAAGATGACTCAGGGATGTACCAGTGTGTGGCTGAAAACAAGTATGGAGCAATCTACTCCAGTGCAGAACTCAAGATCTTAGCTTCAGCCCCGGTCTTCAACCCCAACCCTATACGCCTGATCGCTACTTTGGGGAAGGACGTGTCGCTGGAGTGTAAACCTAAAGCATCTCCCAAGCCCAGAGTAACATGGA
GGAGAGGGGACCGTAGAATACAGCCCAACAGAAGAATAATGCTGTTACGAAACAACACGCTGAGGCTCGTCAACGCCAGCCGCTCTGATGAGGGAAACTACGTCTGTCGGGCTGAGAATCAGTTTGGCTCAGCCGAGATGACGGCCACACTGTGGGTAAAAGAGGCCATGCGTGTGGACCTGAGCCCCAGCAGGGTGGAGGTGACGGTGGGGGAGAGTGTGGTGCTCAGCTGCAAAGCATCACATGACCCTTCTCTGGACGTGTCCTTCCAGTGGCTCCTCAACCAGCAACCCCTCGACTTCCAACAGGAGGGTGGCCATTTTGAATACATCCAAACACAGTCCTCCACGGTGGACCTGATGATCAGAAGCATCTTGCTGAAGCATGCTGGGAAATACGGCTGCCGAGCTCAGACCAGCGCAGACACAGTGTTTGCTGAGGCTGAACTTCTGGTCAGAGGCCCCCCAGGACCTCCTGGGGTGGTGATTGTGGAAGAGATCACAGACACCACAGCCACCCTGTCATGGAGTGCAGGTCTGGACAACCACAGCCCCATCAGCACCTACCACCTCCAGGCCCGGAGCCCTTTCTCCCTGGGCTGGCAGACTGTACGCACAGACCCCGATCCAGTGACAGGGGTTATGGAGTCGGCCATGGCTGTTGAGCTGAACCCCTGGGTGGAGTATGAGTTCAGGGTGGTGGCCAGCAACGCCATTGGGACGGGAGACCCCAGCGTTCCATCCAGAGGAGTGAGGACGAAAGAAGCAGTACCTTCAGTGGCTCCGGCTAACGTCAGTGGAGGGAACGGTCGAAGGCATGAACTGGTCATCTCTTGGGAGCCTGTGTCAGAAGAGTTCCAGAATGGGGAGGGTTTTGGCTACATCGTGGCATTCCGAGCCAATGGGACGAGAGGCTGGAAGGAGAAGATGGTGACATCAGCAGATTCCACTACATACAAGTACAGGGATGAGACATTCCCTCCCCTCACCCCCTTTGAAGTGAAGGTGGGCGTGTACAACAACAAAGGAGATGGGCCCTTCAGTGGAGTGGTCACGGTGTACTCTGCAGAGGGTGAGCCCAGAGAGGCCCCATCTGAGGTAAAAACTTCCAGCACTTCCTCTTCGGAAATTAAGATCACATGGCGACCGCCGAACCCTGGCCCAGGAAGGCCTGCAGGATACGAGGTGAGCTACTGGAGGGAGGGAGAACAGGAGGAATCTGGGAAGAAGAAGAAGACGATAGGGAACGAGACGTCTATGATGCTGACCGGCCTGGGCGGGAATAGTGTGTACCTCATTACAGTCCGAGGCTTCAACAGCATTGGCCAGGGCCCTGCAAGCATACCAAGCGCTGCCAAGACCAGGAAGGACCCTCCTGTCCAGCCTCCAGCCAACCTCATGTGGATTCAGGAAGGGAACAATGTGTCATTAAACTGGGACCCGGTCAAGTCTCAACCAAATGAGTCAGATGTCATTGGATACAAGGTCTTGTTGAGTCAGGAGGGGCGTGTCCACCACCAGGTGATGAGAACCATCAATCCCTCTGCCATCCTAACCCTACCAGAGGGGGGCACCTACATCATTGAAGTGCGGGCAGTTAGTGAGGGAGGAGAGGGAGCAGCCAGCTCCCTGGTCCGTGTACTCACCTCTTCAGGAGTGCGGGCAAAGAGCAGCCAGTGTTCAGTCCACTGTGTTCGACCCTGGGCTCTGCCATGGACATGGACTGCTCTGCTCCTTACTGTTCCTCTGGTGCCTTCAGCTTCCTGGTGAGGCCTACAGAGACCTCCTGCTCCTCTTTTACATGGAGGGACTGGGCCTCTCCTTTGTCCCCTCGCCCTCCTTCCATTCATCTCCTCCTGAAACTGTTTGCTTGCTCTGGCCTTGCCCATCAGCCAGACAGATCTGGGGCCTGCTGAGCGGATCCACTTCTAAAACCAACAAACAGATGGTCAAAAAATAACTCATTTCTGTCTTTTTTTTTCTTCACCTATCAACTTCCTG
AGAGCTAAACAAAACTCTTCCTTTTTTTCTTTGGCGGGGGGGGGG\n>XM_016506093.1 PREDICTED: Sinocyclocheilus anshuiensis guanylyl cyclase-activating protein 1-like (LOC107703476), mRNA \nTGTCATTATCCCATTAGCAGTAGTTATTTTAAGGTGCCACCTCTTTTTATTGGTACTTGGATCTAATAGTTTCAGACATTCAGTATCCTGTGCTGTCACTGTGTGCGGAGGCCAGTCTGCACCTCGTTGTCAGAGCTCACAGGCCTGCAACCGTCTGGTCCAGCCATGGGGAACACACACGCAAGTCTGGACGACATACTCGCTGAGGACATGCACCACTGGTATAACAAGTTCATGAGGGAGTCTCCATCAGGCCTGATCACACTTTTTGAACTCAAATCCATCCTGGGACTGCAGGGCATGAATGAGGATGCTAACAGTTATGTGAACCAGGTGTTCTTCACTTTCGACATGGATGGGGATGGATACATAGATTTTGTGGAATATATCGCTGCTATTAGCTTAATGCTGAAGGGGGAAATCAATCAGAAACTGAAATGGTACTTCAAACTTTTTGACCAGGATGGCAATGGAAAAATTGACAAGGATGAATTGGAAACAATATTTACTGCTATACAACACATTACAAGAAATCATGACATTGTGCCAGAGGAAGTAGTGGCTCTTATATTTGAAAAGATTGATGTTAACGGAGAAGGTGAACTGACGCTGGAGGAGTTCATTGAAGGAGCCAAAGATCATCCTGACATTATGGATATGCTGAAGAAACTGATGGACCTCACTCCAGTCCTGGTCATTATTGTGGAAGGGCGACAGAAACCAATCAATACAAGTTAGGCTGACTAAACTCCAACTTAAGGACAGAGAAAACAGAAAATTCTCCGCCTGAAAGCAAAATGAAAGTGGAGTTTGGTAGTCCCACTCTTGAGGAACAGATGTAGCTTCCCACAGCACCTGTGAGAAAATTCTCGGGGGAACTTTTGCCCAAGCATGGTCCTGTCTGACCCCAGTGGAGATACCAAGCCTTGCATCTGAGCTGTCCTCAGCTAAACATTGATCTTCTAATGCTATAAGGGGGATTCAGGAAACTAAGGAACTGCTGGCAAGGCTTAGGAGTGAGCAGTGTGGTGCTTTTTAAGGAAAGGCTCAGTAGAGAACACTGTGCACACATCTAGTGACTTTCATTGGATGAGCACATCATATAATCCATGTACTTGTGCTTGAACTATTTATGGCATGACTATATTGCTCTGAGAGTGAACTCTGAGACAGTACATTGCCGATGTGGCCTGAATTGCCCTAAGAACTGGGAAATGTAGAGCAATGGTTCTCAGCTGGTTTTTGCCTACATTTTAAATTGGACATCAAATGGCAACCCAACACAGAACAAAAATAGTTTATTGTACAAAATGTACCTGTAAATCAAACATTTCTATAGAATGTTGTAATCAACATAATATTACAATGAACTGCATAGACCCAACAATTTACTACATTAGCAACCTGACCAGGCTGAGTGAGAAATATAACAATTTGATAAATTCATAAATGCAATAGTTGGCCACAATATGTTGACATCAATATCTTTGGCGTTATTAACAATGGGAAGTTGTGCCTGTTTATTTTGTTGTCCGTGACCCAGAACAGACCTAAAACCAATTTCTTGTCTGTGGCCCACCAGTTGTGACCACTGATATAATATCACAAATATTATAGCACTTTATCAAAGGAAAGCATCAAATTTTCCTGATACAGTTACCTTATGCAGTAGGTGCAAAAGAAATTCATTAAATGCATTTCCACCTGTCTTTTAGCTGATCTAAACTTGTCAAAACATTAAAACTAAAAGTTTTCAAAATTAGTACCTGCATTTTTTAGACTTATATCCTTTACCATTCAAAGGTTTGGGTT\n>XR_004899828.1 
PREDICTED: Phyllostomus discolor uncharacterized LOC118497304 (LOC118497304), ncRNA \nCTGAACACACCTGCTTCATAGCATAACTGTGGGGCTGGCCAAAGTCTGTTTGTTTTTTTCTGTAAAATAAAAGACCCATTTTTCATTTTCACCAATGACATTATTGACTTGGACATTTGGACTATGGCCGCTCTCTCCCGTATGGTAGAACATTGACCGTTCTCCTTCAAAGTCTCAGTGTGATCGCTGTCGATTTCATCTGGTCTGCCCGACTGTGGGGCATCGTCCAGAGAGGAGTCTCCAGCACAGAACTTCGCAAACCACTCCTGACACGTTCCACCAGTCACGGCACCTTCTCCACACACTGCACACATCTTTTTTTGCATTTCAGTTGCATATTTACCTTTCTTGAAATAATAAAGCACAATACACAAAAATGTCTATATACCAGCCCTGG\n>MG876669.1 Uncultured bacterium clone 7H_2119_4993_17823 16S ribosomal RNA gene, partial sequence \nTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCAACGCCGCGTGAGGGATGAAGGATTTTGGTTCGTAAACCTCTGTCAAGTGGGAAGAATAATGACGGTACCACTAAAGGAAGCCCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGGGCAAGCGTTGTTCGGAATTATTGGGCGTAAAGAGTATGTAGGCGGCTAGATAAGTCAGACGTGTAAGCCCATGGCTCAACCATGGAATTGCGTTTGAAACTATTTAGCTTGAGTGCAGGAGAGGAAAGCGGAATTCCCAGTGTAGCGGTGAAATGCATTGATATTGGGAAGAACACCGGTGGCGAAGGCGGCTTTCTGGTCTGTTACTGACGCTGAGATACGAAAGCCAGGGGAGCAAAGGGG\n>JF603243.1 Uncultured bacterium clone GDIC2IK01C8G26 16S ribosomal RNA gene, partial sequence \nTCAGGATGAACGCTAGCGACAGGCCTAACACATGCAAGTCAGGGGCAGCACAAGGAGCAATCTGAGGTGGCGACCGGCGCACGGGTGAGTAACACGTATGCAACCTGCCTGTAAGCGGGGAATAACCCGTTGAAAGACGGACTAATACCGCATAATACTAAATTACTGCATGGTAATTTATTTAAACATTTATGGCTTACAGATGGGCATGCGCATGATTAGCTAGTTGGAGAGGTAACGGCTCCCCAAGGCAACGATCATTAGGGGTTCTGAGAGGAGGGTCCCCCCACACTGGTACTGAGACACGGACCAGACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGACGAGAGTCTGAACCAGCCAAGTCGCGTGCAGGAAGAATTGTCCTATGGATTGTAAACTGCTTTTGCAGGGGAATAAAGTGCATCACGTGTGATGTTTTGTATGTACTCTGCGAATAAGGATCGGCTAACTCCGTGCCAGCCGCGGC\n>XM_029711062.1 PREDICTED: Salmo trutta sodium channel protein type 2 subunit alpha-like (LOC115160726), transcript variant X3, mRNA 
\nACCCTGCATCTCTGCAGTCATTTGTACCCGGTAACAACCGGAAGCGCAACAGAATGCTCTGAACAAGGCGACTGTGGTGGCAGCAATTTCATAACGCTCTCCTGTGTGATTTTTTTGGGGGGGGTCCATCTCTGGGAAATACTACATTACAGAGAGGAGAACCTTTTGACTTAATCAAGTATCCACATGTGTCCTCGAATCACCTTTTTACTCGGGAGAAAGCAACATCAAGGCGTGCCTGGCGATTTTTGGCGGATTCTTCCCCTTCTTGGATGAAAAACTAATGCCCTTTCTAATGCAGGAGGCTAGCCGTTCACTCTGAAAGTGCAGGATGAAAAGATGGCACAGCTGCTTGTACCGCCAGGACCAGACAGCTTCCGCCCGTTTTGTCGTGAGTCCCTCGATGCCATCGAGAGGCGGATCGCTGACGAGAACGCCAAAAAGTCCAAGGCGAAGCCCAACAACAATGACGACGACGGGCCTAAGCCCAGCAGTGACCTGGAGGCGGGAAAATCACTGCCACTCATATATGGGGACATTCCCAAAGGATTGGTGTCCACACCACTGGAGGATTTGGACACCTTCTACAGCAACCAGAAAACCTTTATAGTGTTGAACCGAGGGAAGGCCATCTTCCGCTTCAACGCCACTCCTGCCTTGTATGTCTTAAACCCCTTCAACCCTCTTAGAAGAATATCAATTAAGGTTTTGGTACACTCATTGTTCAGCATGGTAATCATGTTGACTATCCTTACCAACTGTGCGTTTATGACCCTGAGTCAGCCCCCGGACTGGGCAAAGAATGTAGAGTACACATTCACTGGAATCTACACATTTGAATCTCTTATAAAAATTCTGGCAAGGGGCTTCTGTGTAGGGAAGTTTACCTTTCTCCGAGACCCATGGAACTGGTTGGATTTCTGTGTTATTGTCATGGCATATGTCACAGAGTTTGTGGACCTGGGCAATGTCTCAGCACTGAGAACTTTCAGGGTTCTCCGAGCTTTGAAAACTATATCGGTCATCCCAGGCCTCAAGACCATTGTGGGAGCGCTGATCCAGTCAGTGAAGAAACTATCAGATGTGATGATCCTCACTGTATTCTGCCTAAGTGTCTTTGCCCTGGTAGGGCTGCAGTTGTTCATGGGGAATTTAAGAAACAAATGTTTAAGGATCCCTCTTAACTCAACCGACCTCTTCGATGATTCATTCGACTTTAATGGGACGGACCTCAACAAGACCAAGTCGTTCAACTGGACCTATTACATGAACGATCCCAAAAATTATTACTACCTCCCAGGTAAAAAAGATGCTTTGCTTTGTGGAAATGGCAGTGGTGCTGGGCTGTGCCCAGAGGGATTCTGGTGCATCAAAGCGGGCCGGAACCCAGATTACGGCTACACCAGCTTTGACACGTTCAGCTGGGCCTTCCTGTCTCTGTTCAGACTGATGACTCAGGACTACTGGGAGAACCTCTACCAGCAGACCCTGAGGGCTGCTGGGAAGCCATACATGATCTTCTTTGTGTTGGTCATCTTCCTGGGCTCCTTCTACCTTATCAACCTAATCCTGGCTGTGGTTGCCATGGCCTACGACGAGCAGAACCAGGCCACCATTGAGGAGGCTCAGCAGAAGGAGGAGGAGTTTCAGAAGCTGAAGAAACAGCAGGAGGACGCACAGGCAGCGGCAGCGGTGACAGCGGCTGAGAGCGGGGAGTTCAGTGAGAGAGGGGAGCTCACTGACACCTCCTCAGAGGCCTCCAAACTCAGTTCCAAGAGCGCCAAAGAGAGACGCAACAGGCGCAAGAAGAAAAAGCAGAGAGAGGAGGAGGAGAGAGGGGACAATGACAAGTTTCACAGGTCTGAGTCTGAGGGCAGTGTGCAAAAGAGTCGTTTCCGCTTCTCCATAGATGCCTCCAACCTGCTCAACTACGACATGAGATGTTCCACACCACACCAGTCCTTCCTGAGTATCCGTGGACCCCTGTTCTCATCCAGA
CGAAACAGCCAGGCAAGCCTCTTCAGCTTCCGGGAACGAGCGCAAGATATGGGCTCGGAGAACGACTTTGCCGACGACGAGAACAGTACTTTCGAGGACAACGACAGTCGCCGGGGATCTCTGTTTGTTCCCCGGCGGAGCGACCGGCGCTCCAGCAACCTCAGCCAGAACAGCATGTCGTCACATGTCCTGTTGCCGGCCAATGGGAAGAAGCACAGCTCCGTGGACTGCAATGGGGTGGTGTCCCTGGTGGGCGGGGCTTCACTTCCCACATCACCTGAGGGACTCCTTCTGCCAGAGGGCAACACTACGGAGACAGAGTACAGAAAGGCCCAATGTGAATCGTACCAGGCCTCTATGAACTTCCTGGAGGACCCAGGGGCCAGGCAGAGGGCCTTCAGTGTAGCTAGTGTTATAACTAATACTATGGAAGAACTTGAAGAGTCGAGACAGGAGTGCCCTCCTTGCTGGTACAAGTTCTCCAACACTTTCCTCATCTGGGACTGTTGTCCGGCATGGCTGAGGATCAAGAAGACAGTCAAGATGATCGTGATGGACCCTTTTGTAGACCTGACTATTACCATATGTATTGTTCTGAACACAGTGTTCATGGCTATGGAGCACCACCCAATGTCTGGGGATTTCAAAAAAATGCTTTCTGTGGGAAACCTGGTGTTTACAGGTATCTTCACAGCTGAGATGTGTTTCAAGATTATTGCTTTGGATCCGTACTGTTATTTTAAGGAAGGCTGGAATATATTTGATGGTATCATTGTCAGTTTGAGCTTGATGGAGATTGGCTTGGCCAACGTGTCTGGAATGTCTGTCCTCAGATCATTCCGATTGCTGAGAGTATTCAAACTGGCCAAGTCTTGGCCCACACTGAACATGCTGATCAAGATCATTGGTAACTCAGTGGGGGCTCTGGGTAACCTCACCCTGGTCCTGGCCATCATTGTCTTCATCTTCGCGGTGGTGGGCATGCAGCTGTTTGGGAAGAACTACAGAGACTGTGTGTGTAAGATCTCTACAGACTGCACACTGCCCCGCTGGCACATGCATGACTTCTTCCACTCCTTCCTGATTGTGTTCCGGGTGCTGTGTGGGGAGTGGATCGAGACCATGTGGGACTGTATGGAGGTGGCTGGCCAGAGCATGTGTCTCATCGTCTTCATGATGGTCATGGTCATCGGGAACCTGGTGGTCCTGAATCTGTTCCTGGCCCTGCTGCTGAGCTCGTTCAGTGCTGATAACCTGGCGGCCACGGATGATGACAGCGAGATGAACAATCTGACGGTGGCCATAGGCCGCATCCACCAGGGCATCGCCTTTGTCAAGGCCTTGGTGTGCCGCTCCTTCCACAGCATCTGTCTGAGGAAAAAGAAGGGGAGCCTGGATGACCTCCACAGAACCAACTACAACTCCAACCACACCACTGTGGAGATCATGAAAGACCCTGAATACGTGAAGGATGACAATGGCACCACCGGTGGGGTAGGCATGGGAGTGGGTAGCAATGCAGCAGGGAAATACATAGTCAACGACAACACTGACTACATGCAGTTCATCCACAACCCCAGTCTGACCGTCACGGTGCCCATCGCTGTGGGGGAGTCGGACTTTGAAAATCTCAACACTGAGGACTTCAGCAGCGATTCCTCGGACATAGAGGGAAGCAAAGAGCAGCTAGCTAAAGACCGTCCACTGAGCTCATCAGAGGGCAGTACAGTGGACATCAGGGCCCCAGGAGAGAGAGAGGGCTCGGTGGACATGGAGCCTGAGGAGTCCATGGAAGCTGAAGGATGCTTCACTGATGGCTGTGTCCGTAGATTCCAATGCTGCCAAGTGAACGTTGAGGAGGGCAAGTGGAAGATGTGGTGGACATTGAGGAAGACCTGCTTCAGGATAGTGGAGCACAACTGGTTTGAGAGCTTTATCATCTTCATGATCCTGCTCAGCAGTGGAGCACTGGCATTTGAGGACATCTACATCGAACAGAG
GAAGACCATTAAGACATTGTTGGAGTTTGCGGACAAAATCTTCACCTACATCTTCATCCTGGAGATGTTGCTGAAATGGGTGGCCTATGGATTCGCCAAATACTTCACCAACGCCTGGTGCTGGTTGGACTTTCTTATTGTTGACGTCTCTTTGGTCAGCCTTGTGGCCAACGCCCTGGGCTACGCTGAGCTGAGTGCCATCAAGTCCCTGAGGACGCTGCGAGCGCTGAGGCCCCTGAGAGCGCTGTCCCGCTTCGAGGGCATGAGGGTGGTCATAAACGCTCTGCTTGGAGCCATCCCCTCCATCTTCAATGTGCTGCTGGTCTGCCTCATCTTCTGGCTCATCTTCAGCATCATGGGTGTCAACCTGTTTGCAGGGAAATACTACCATTGTATCAACATGACCACGAGTGATCGCTTCGAAGTCAGAGACGTGGCTAACAAGACAGAATGTTTGGCTTTGACAGGTACCCACTGGAAGAATGTCAAGATCAACTTTGATAACGTGGGAGCAGGCTATCTGGCACTGTTACAAGTGGCTACATTCAAAGGCTGGATGGACATCATGTATGCAGCTGTGGACTCTCGCAATTTGGATGATCAACCCGACTACGAAGTGAATCTGTACATGTATCTGTACTTTGTGGTATTCATCATATTTGGATCCTTCTTCACACTCAATCTCTTCATTGGTGTCATTATAGACAACTTCAATCAGCAAAAGAAAAAGTTTGGAGGTCAAGACATCTTCATGACAGAGGAACAGAAGAAATACTACAATGCTATGAAGAAGCTTGGCTCAAAGAAACCCCAAAAGCCTATCCCTAGGCCAGTGAACAAGTTTCAAGGGTTTGTCTTTGATTTCATTACAAAGCAAGCCTTCGACATTGTCATCATGATTCTTATATGCCTTAATATGGTCACCATGATGGTGGAGACGGAAGACCAGACAGACGACATTCGTAAAATTCTCTACAAGATCAACCTGGTGTTTATTGTCATGTTCACCGGGGAGTGTATTCTGAAGATGATCTCACTCCGACAATACTATTTTACCATTGGTTGGAATGTATTTGACTTTATCGTTGTTATCCTGTCGATAATTGGTATGTTTCTCTCGGAACTGATAGAGAAGTACTTGGTTTCACCAACCTTATTCCGAGTCATTCGACTGGCCCGAATTGGTCGCATCCTTCGCCTCATCAAGAGTGCCAAGGGAATCCGTACACTCTTGTTTGCGTTGATGATGTCACTTCCTGCATTGTTCAACATTGGTCTTCTGCTCTTCTTAGTGATGTTTATCTATGCAATCTTTGGCATGTCAAACTTTGCATACGTCAAGAAGGAGTCTGGGATTGACGACATGTTCAACTTTGAGACGTTCGGCAACAGCATGATCTGCCTGTTCCAGATCACCACGTCTGGGGGCTGGGATCTCCTGCTGGCCCCCATCCTCAACAAGGGAGAGCCAGACTGCGACAGCCGGAAAGAGCACCCAGGAAGCACGTACAAGGGGGGAGACTGTGGAAACCCCCCTGTGGCCATTATCTTCTTTGTGAGCTACATAATCATCTGTTTCCTTGTTGTGGTCAACATGTACATTGCTGTCATTCTAGAGAACTTCAGTGTGGCCACTGAGGAGAGCGCTGAGCCCCTGAGCGAGGATGACTTTGAGATGTTCTATGAGGTCTGGGAGAAGTTTGATGCGCGAGCCACCCAGTTCATGGAGTATGACAAGCTGTCAGACTTTGCTGATGCCCTAGACCCCCCGCTACGCATCTCTAAGCCCAACAAGATCCAGTTGATCTCAATGGATTTACCCATGGTGAGTGGGGAGCGCATCCACTGCCTGGACATCCTGTTTGCCTTCACCAAACGTGTCCTTGGCGAGGGGGAAGGCTTGGACATCCTCAGGGGTCAAATGGAGGAGCGATTTATGGCCTCCAACCCCTCCAAGGTGTCCTACGAACCAATCACCACCACACTGCGCCGCAAGCTAG
AGGACATGTCTGCCCTGGTCATCCAGAGAGCTTTCAGACGATATCTTCTCAAGCGTATTGTTAAGCGGGCCTCTGCCATGTACAAGGAGAAAATGCAAAGTGGAGGCACGCTCCTTGATAAAGAGCTTCTCGTCATAGACAAATTTAACGAGATCTCTACTTCAGACAGAACTGACATGACACCCTCCACAGCTTCTCCCCCATCATATGACAGTGTCACAAAACCTGAAAAAAACAAATATGAAAAAGACAAGAGAAAGAAGGAGGTGAAGGAGAAAAAAAAGTACATGGATGTTGGGAAGATTTAGCATAGAATTCATTCTGCTACAAATTGTTTACAGCCTTTGAAGGTGACCAATGCGTCAAGTGAAGTGTCTTTGGTGTGAATATCTATGCCAAACTGACAATGCTTACTTGAGTCTAAATGTAAGGTTGGTGCCTAACATGAGGCAGTGACTCACATTCTTAGGCTGTAAGAATTGTTTGGATGTTAATGGGGACTAAAACAAATGTTTGCCAGCTTTATAGGGACAGGTAAAACATTTTGTTGTGTGTTGTTACAATCAGAAACGTTTAGTTATACTGTAACTTCTCTTGCAGCTAGTACTTCCAGGGTTGCATCCAGTGTCTTGCATTATAACTGCCATATGATTTACTAACTTATTTTTCTTACAGAATCTTGTTTTTAAAACTCATAGGTTGATTGTGTGACTATTTTTGTAAACATATGTTTTACTGTAAAAAGAGGGGTTTCATGTATTGCTTTAAAGGTAGTCTTGTTCACTTTAAATGTTCATACAACTTGACTTGTCAAGTGTGATCAAACACACATCCTTGTGGGGTGCAGGGCCCAAAAAAAAGTTGGTATAAAAGAAATTGTGCCCGCACACTCATAAACCGTTTTTAAATGAAGGTACATGGTGGAGCTTATGCATGTGCGGGCTCTGTTTCGAGCATAAGACATGACTACTCATGACAACCATTATTGCTGCAGTGCAGTTAGGGGGATTGCTGCAGTTCAATCGACGTGTAGACTTGCATGAATGCTTACCCATGATTACAGTGTCGCATTACGCACCATCACCAAAATGAGCTTGATTTCTCCGTGATGTCTGAGGGACTCATACTTTGATGAATCTGTAACATTATGTTACTCTCACTATTACAAATCAACAGAAAAGATTTCTCCTGAGCATACAGTCCAAATACCATTACCAACAACTGTTGTCTATAATCAGTTTCCGAACAATAACACGCTCTAGAAAAACATAGTTTTCCTCCTTTCATTCATCAGAAACTACAGTACAATGCAGAATACATTCATCTTTAGTGCTGGTTGACAGAGTTGATACACATAGTATTCGTAGTCCAGCTCTTCTCTCCAGCTTGAACCTAAATGGCCTCAAAGACATGTCTATACTGTATTTTCTCTTCATAGTGGTGAATGATAAAATGAGGCAATTTCCTCTGCACAGTATAGTTGTGACCATCAGGTGTAAATCGCCTGAAATAATCTCCAAGCCTAGTCTGACAGGTGAAACACTGTATTCTGTGTCATATATGCTCACTTAAGAGGCATTCCGACAGCATGTATCTTGTGTACTCTGTGGTTTTGGTACTGCAACATCATTAGTAAGTGCTATAAAACTTGTCATTTACCAAATCTAAATTGCTTTGAGTTTACCTTTCCTACCCACTTCCCAAATATTTTTCCATTGTTGTTGATGTATCTGTATGTACATATTCTATAATATATGAAATATACAAATATATTTGATATATTATGTGATGTTTCATGTATAATGGAATATATGAAGTTGTTAATGTTATTTAATACATATATCTATTATATTCTGCATTCTCTGCTCTATATGGCAGACAGACCAGAGTATGAAGCATCCAGTTGAGGCTGTGGGAAGATTTTGTAGTTAGATTACACTCAATGTCTATATAAATATTGTAATATAATCATTTTTCTTTGTACTGTACAACTGTTTTGT
AAATAGTTTGCTATACAATATAGCCACACTGTCTGCGCTATAGCCACTTTAGTTATTTTAAGTTTCACTGCACCCTTTCATTTGGAAATGCCTCATGTGATCTAGTGAAGGGGATGTGGACATCTCATTTTGATTCTTACATCTTTTATTTTGTGTCATTTGTAAACTGTTGTCACATTTTACCTCACATGCTTTATCATAATAAATATCTAAGATGGAACATCAGGTTCAGAGAATTCTGAATATGATTGTCTCAAGGCTAGTGTGACAGCACAAGTCTTCGATTGTTTCCTACATTTGTTTACATAGTAATCCAATTCCTCAGGATGTTACTTTTGTCAGCTGTTCCCTTTGTATAAAGTGTCACAAGTATCTGTAATTAAAATGTTATAAAGTATGTTATAAAGAGCATATGTTGCATGTAATAAAAACGTTCAGAATATGTATATACTATATATGTATACACAATGAATGTTTTGATTACATAACATTTAATAGATCACATCTTTATATGCATTATGCTTGTAGTGTATGAGTAAACTGCATGCAAGATATTGCTATAACCCATCTCATTGAAAAGCCAAAAGAATAAAGAATACATGTACCTCA\n>XR_989699.2 PREDICTED: Macaca nemestrina uncharacterized LOC105485591 (LOC105485591), transcript variant X1, ncRNA \nTGGTTTGCTGCAGGTCCGCTCCAGACCTTATTCCACTGAATCTTTCCTGCTCTTGGAGATAACACCAGTGGAGTCTGCAGAACGGCAAAGGCGGCTTTCTGCTTCTTCCTCTGAAACCTTTGTGGCAAAGGAGCACTGACATGATGGCAGCCGGAACTCTCCTGTGAAATAGGAAGATGAAGGCTGGAGTTGCATAATGATCCTTCTATTATGAGCTTTGGTAACGTCATTTTCCAGAGGGATAGTCATAAATCTTATTAGTAAAACTCAATTGCACATTTTCATCAAAAATGAGGCAGTTCCTCTAATTCAAATGAACATACACGTTTAAATACAGTCGCTGCTCTTGAGAACGTGTGTCAGTGCGCTCAGTAATTCACCATTGGTGAAGACTGACCTCTACTAAAAAAAAAAAAAAAAGAAAAAGAAAAACTGAGCATCCAAATTCAGAGAGCCTATCAAGAAATTCAGAAAGCCTATCAACAAGAATAATGCACATACCATTCCAACACTGTGTGAAGTGAGAGGACATGAGACAAGGTCATTCTTAAGCAACAAATTCTGAAGACAGACCAAAGTGTTCTGCATATCAAGCAGGTTGTGAGGTCAACGTGCAGAAAATATCACAACATAAGTTAATGCCTGCGAATGACACCCTAAAAACAACTTTTAAAAGCAGTCCTGACAGCTAGAGCATCTGCAGAAATTACCTCCACATGAAACGTTGCTTGGTGCTGCAGAAGGGGCCTCCTGTTAAGGAATACATTTGACAGTGATATCAAGAAGTGCTAGGGCGATTTAGTGGCAAGATGGCCGAATAGGAACAGCTCCAGTTTCCA\n>XR_003517074.1 PREDICTED: Zalophus californianus uncharacterized LOC113913036 (LOC113913036), transcript variant X2, ncRNA 
\nCCCCGACGTGCACACCCGAGGACCTAAGACACGGCTCCTACACCTGCCGCGTGCGACACCCCCGCACGGAAATCCCGCTCCTCGGCTGACCTGGTGACACAGGCCGTCACCCCTACCCCCACTTCCCCCCCTCCACCCCACTCTCTGCGTTGCTTCCGTGAGGTCAGCACTCACCTTCCCTGCAGGGATGAAAAGGGCAATTCGCGCCTCCCGCCAGCCAAGGAGTCTGCCCTTTCTTCCCCCACGCCGGGCGCTTAGAGAAGAGGAAGGACAGCAAGCTTGCTTTTGCTTTACCCTTACCTTATAAAGCACCGCTCTCGTGGTTCTGACTCAGAAGACCCCGGGGGCCCAATAAGCCAGGCCTGAGCAGCAAGCAAGCGAGGCCCGAGCAACAAGCGAGTGAACGACCAACTTGGAGTGGGAAGAGACCAGACTTAAAGCACTGAACAGGAATTCTGAAACCTAAGAAGTCAATGTTAAGGCTAGTTTCCCTAACTTACAAGGCTGGACAATACTCTTCACCATTTCATGTGGCCCAGATAGCTGGAACAGCTCCAGTCACCAGACCTCACACCAATGTCGCAAGCAAGAAGGAAAAGCAGAGACCAAGAAACTACTTGTAATTCTCAAATCGGTACCAGCAGCTGCCATGGGCCCGCTTCACTTTCACACAAAACAAAACAAACGAGAAAGCACGTATCTTTCCTTTGGCTTTGTGTAAGCTCCTTGACAAAAGATAATGACAAGATGGCCGAGAATTCGGCATCTGACCAGCACCGCATGT\n>XM_028148513.1 PREDICTED: Eptesicus fuscus transcription factor 7 (TCF7), transcript variant X4, mRNA \nCAGCTTTTCCCGCGCCCCTCACGGCCCCTCTGGATTTCCCCGCAGGCTCTCGGGCGGGAACACACTTCGCAGAGACTTTTCCCCGACAAACTTCCAGAATCTCTGGAGGACGGCCTGAAGGCCCCGGAGTGCGCCAGCAGCATGTACAAAGACACCGTCTACTCCGCCTTCAATCTGCTCATGCACTACCCGCCCCCCTCGGGAGCAGGGCAGCACCCCCAGCCGCAGCCCCCACTGCACAACAAGGCCAGTCAGCCTGCCCATGGCGTCACCCAACTCTCTCCTCTCTATGAACATTTCAGCAGCCCACACCCCACACCTGCACCGGCCGAAATCAACCAGAAGCAAGTTCACAGGCCTCTGCAGACCTCTGACATCTCTGGCTTCTACTCTCTGACCTCAGGCAGCATGGGACAGCTCCCCCACACTGTGAGCTGGCCCAGCCCTCCTCTCTATCCCCTGTCCCCTTCCTGCGGATATAGACAGCACTTCCCTGCCCCCACTGCAGCCCCTGGCGCCCCCTATCCCAGGTTCACCCACCCATCCCTGATGCTAGGTTCCAGCGTACCTGGTCACCCAGCAGCCATTCCCCACCCGGCCATTGTGCCCCCCTCAGGGAAGCAGGAACTACAGCCTTATGATCGAAGCCTGAAGACGCAGGCAGAATCCAAGGCAGAGAAGGAGGCCAAGAAACCAACCATCAAGAAGCCACTCAATGCTTTCATGCTGTACATGAAGGAGATGAGAGCCAAGGTTATTGCAGAATGCACACTCAAGGAGAGTGCTGCCATCAACCAGATCCTGGGCCGCAGGTGGCACGCACTGTCACGGGAGGAACAGGCCAAGTATTACGAGCTGGCCCGCAAGGAGAGGCAGCTGCACATGCAGCTATACCCAGGCTGGTCAGCGCGGGACAATTACGGGAAGAAGAAGAGGCGGTCCAGAGAAAAGCACCAAGAATCCAACACAGGAGGAAAAAGAAATGCATTCGGTACTTACCCGGAGAAGGCCGCTGCCCCAGCCCCTTTCCTTCCGATGACAGTTCTCTAGGTTGCTCCGGGTCCCCAGTCCCCCAGGACTCACCCTCATACCTCCTGCTGCCTCACT
TCCCTACTGCACTACTTGCTAGCCCTGCAGAACCGGCGCCTACATCACCAGGTCTCTCTGCGGCACTCAGCCTCCCAGC\n>XM_032234808.1 PREDICTED: Thamnophis elegans microtubule affinity regulating kinase 3 (MARK3), transcript variant X2, mRNA \nAGGAAGCCGGGCGGCCATCTTGGATCATCCGGGAGCGGCGGCGTTGTTGCCGCCGCCGCTGCTGCTGCTAGTACTGTGGCTACTGGTTGAGAGAGCCGAGGGAGCTGGTTTGACGGCGGCAGCAGCAGCGCCAGAGGGGTTGTCTTCCTTCAGTGTTTCCAACCCAGGCTGTGACGGAAGCGTCTTTCTCCTTGGGTCTGAGCCTTCCCCCTTTGGGATAGGGGGTTGGTAGGCAGCGAAGGACTTGGGAGTTCTGGAGAAGAAGGAAGAGGAGGGGGCGCAATTAAGTCATGAGAGCCCGAGGCCCGGCGAAGCAATCCGTGTAGAGTTAGAAAACGGCTGAGGGCTTGGCCCGCTTCCCTTTGACCAGCTCTGGGGGGTTGGGGGGGTTGGTTGTTCTTTCGCAGCCGACAGTGGTTGCGCGGAAAGCGGCGGCTGCTTCCCCACTTTTCCTTCCTCAGCAGCCTGCTAGTTGGGCTGTACCGTAATTGCTGCAGCGCCTGCCCTCTCCCGGCTCCCCGCTTTTTTCTTTCGTCTTTTAACGGCACCGGACCATTTTTTGCCCCGTTTTTCTTTTGGTGCTCCATGAGAATCTCCTCTAATCTGTCCGTCCCCACCTTCTAAAGACCCTAATCTGTCTATAAGATGATTCCTGAAGATTCCCAGAGGAATCTAATGCTGCATTATCAGACTGGAAGATAGATGAGAAAAAGGGTGGTGGAGAAAATAATCACCCCAAATTTCTCTTCCCCCGTACTACCTTTTCCTTTGATGGTGGCACTTGATAACTGCTATCATGCTGTAAAATCACATTTTTTTGTAAATATATATATGTATATGTGCTCGGAGGGAGGGAGGTGTTAGGATTTTTTTATTTTTATATAATAAATAGTTGGATTTTGCCATTGCAAACGGTGCTTCAGCTAAGTGAATGAAAATGTCTACTAGAACTCCATTGCCCACGGTGAATGAACGGGACACTGAAAACCATATCTCTCACAGTGAAGGACGACAGGAAATTTCCTCCCGAACTGGTCGGTCTGGGGCTCGCTGTAGGAATTCTATAGCTTCCTGTGCAGATGAGCAGCCTCATATTGGGAATTACAGACTCCTTAAGACAATTGGAAAGGGAAATTTTGCAAAAGTGAAACTGGCCAGACATATCCTTACTGGCAGAGAGGTTGCAATAAAAATAATTGACAAAACTCAATTGAATCCAACTAGTCTACAAAAGCTGTTTAGGGAAGTAAGAATAATGAAGATTTTAAATCATCCTAACATAGTTAAATTATTTGAAGTAATTGAGACTGAAAAAACACTCTACTTAATCATGGAATATGCAAGTGGAGGGGAGGTATTTGATTATTTAGTTGCACATGGAAGAATGAAGGAAAAAGAAGCAAGAGCGAAATTTAGACAGATAGTATCTGCAGTGCAGTATTGTCACCAAAAGCATATTGTTCACAGAGATCTCAAGGCTGAAAATCTATTACTTGATGCAGACATGAACATTAAAATAGCCGATTTTGGTTTTAGTAACGAGTTTACAGTTGGTAATAAACTGGACACATTTTGTGGCAGCCCTCCCTATGCTGCTCCAGAACTCTTCCAAGGCAAGAAATATGATGGACCAGAAGTAGACGTTTGGAGCTTAGGTGTCATTCTTTATACCCTTGTGAGTGGATCTCTGCCTTTTGATGGGCAGAATCTAAAGGAACTCAGAGAGAGAGTGTTAAGAGGAAAATACAGGATTCCTTTCTACATGTCAACAGATTGTGAAAACCTGCTAAAAC
GTTTCCTGGTGCTAAACCCAACTAAAAGAGGCACTCTTGAGCAAATAATGAAGGACAGATGGATCAATGCAGGACATGAGGATGATGAACTTAAACCATTTGTGGAACCAGAATTAGACATCGCAGACCAAAAGAGAATAGATATTATGATTGGAATGGGATATTCTCAAGAAGAAATTCAGGAATCTCTCAGTAAAATGAAATATGATGAAATCACTGCTACATACTTACTACTCGGGAGGAAATCATCAGAGTTGGATGCTAGTGACTCAAGCTCTAGCAGCAACCTTTCTCTTGCTAAAGTCAGGCCAAGTAGTGATCTCAATAATAGCACTGGACAGTCTCCACATCACAAAGTTCAAAGAAGTATATCTTCTAGCCAGAAGCAGCGAAGGTACAGCGACCATGCTGGTCCATCTATTCCTCCAGTAGCAGCATATCCTAAAAGGAGCCAGACGAGTACTACTGACAATGACCTCAAGGAAGAAGGGATTCCATCAAGGAAATCCAACAGCAATGCAGCTGGAGGAAAAGGAATTGCTCCTGCTAGTCCTATGCTTGGGAATGCAAACAATCCAAATAAAGCTGACATACCTGAGCGTAAAAGAAGTTCTGTTACACCCAATAGCAACACTACACCTGGAGCAGCCATGACACGGCGAAACACTTATGTTTGTAGTGAACGAACTGCTGCAGACAGACACTCGGTAATTCAAAATGGCAAGGAAAGCAGTACCATTCCTGACCAGAGAACACCAGTTGCTTCAACTCACAGTATCAGCAGTGCAACAACACCCGATCGTATCCGATTCCCAAGAGGAACTGCCAGTCGTAGTACTTTCCATGGTCAGCTTAGAGAAAGGCGCACTGCCACCTATAATGGACCTCCTGCGTCACCTAGTTTATCCCATGAGGCAACACCACTTTCACAGACACGAAGTAGGGGCTCCACTAATTTGTTCAGTAAATTGACTTCAAAGCTGACTAGAAGAAACATGTCATTCAGGTTTATCAAAAGTCGTAACGTAGCCGTTGATCAGAAGGATGACAGCAAGGAAGCCAAACCCCGTTCACTACGATTTACTTGGAGCATGAAAACTACCAGTTCAATGGATCCTAATGATATGATGAGGGAAATTCGCAAGGTCCTGGATGCCAATAATTGTGACTATGAACAGAGGGAACGTTTCTTGCTTTTCTGTGTCCATGGGGATGGCCATGCAGAAAACCTCGTGCAATGGGAGATGGAAGTGTGTAAGCTTCCCAGACTGTCTCTGAACGGAGTTCGCTTTAAACGGATATCGGGAACATCCATAGCTTTTAAAAACATTGCTTCCAAAATTGCCAATGAATTAAAGCTGTAATGAGAAGAGCAATCGAGTTTGTAAATTAAGTAGCAAATTCAAGTGTTTTTGTTTTGTTTTTGAGGACACCAATGGTCATGTATAGAATACTTAGGGCAATAACTTCTGCATCTTCTGGATCGTGATATTAAAACAAAACAGTTCAGACAAGCTGCTGAGCTGGGAGGGAAGTTGGACTTTTTTTTATAAGTGCACTACAGCATTAAAGTTGCCTATGTAAAATATTCCCTTCTGCTTTATTTCCATTGCTTTGAGTCTTGACAAACAATCTAAAACACACCATGTATACATTTGGATATTCCTCCTGTTGTGTGGATGTGTGAATGTACAGTATGTGTGTATAATTATAATATAAAAGTATTATATGTAAACAATTCATTTATAGCATCAGAACTGTACCAGTACCTCTTCCGGGTTAATTTTGGTGCTAAAATGGAAATGGCCAAGGTGAAAGCCCTTAAGAATACTAAATAATCGGTAAACACAAGCTTCACAGTTCACTGTTGTGTTTAAGATTATGGAGGTTTGGGTTTATGGGTGTGAACATTATTCCTGTATTTTTTAAAATTAATTTTCATAACATGATTTAAATCCCCCCAAATAATTCTTTCTTTTCTTTTGCCTATTTATTATTAT
TTAAGTCTGAAATCAATTTAAATTACTTAATTATGATAATGAAAATTGTGGGGGAAATGCTTCAAGGTTACATGTTTTTTTCCTTTGCTAAGCTGATTGAGCATTTTATCCTCACCTTTTTTTGCTAGTACATATTATAATTTTAAAAATTTTACTTGAAAAGTTTGTTCTCAACTCCCATTCATTTCAGTGGAGCTGGTGCAGAGAAAACTTGTTACTAATGAAATACTGTAGAAACAGCCTGAACAATTGATATAAATTTTACATTTAGGCTACCTTATAATAATGTATTTTGAAGTTTAAAAAAACCATATTCAGACATTTCTAGTGTGAAAGAAATTCCTATGGCAAAATAATTGTGCCAGATCAGCAAAAAATGATCAGGAGAGAGAACTTTTGAATTCTAGTAATTTAATATTCTTGTACGTACTATACAATGACTGATAATGTTAATCATAATCAAAACACTATCAGCAAAGTTTATAAAAGTGAGAAAGTATGACCTGTCCAGCCAGGATTTGTGTTTTATTTGGTCTTTCCCAATTGTTTGCTGCCCAGATTTTAAAATTGGTTATGCAGGCTGGGAATTATGGGAATGGTAAAAATAAATATATTAAGGGAGATTAGAGGATTGAGAAAAGCTATTCTAAGTCTATGTCATGTGTTTCAATTTTGTCAGAGGCTTAAACTTCTTAAAAGCCTTGTTGCTGGCCAAGTCTTCCTTCATCATCAATTGCATCTCTCTAGCAAATTCTGCCCTTAGAGACAAAAAGCTATTGAAAACAGGGTGGGTAGGTAGGTGGAGAGGATTGCCTGCCAGTGACATGATAGCTCATAATTTCCATTTGGAAATGCTTCTGTAAATCTGAACAGGTTTATATGCTTTCTTGCACAGCTTCATATTTAAAAATATTTTAGTCACAATGCACTGGAGTTTAGAAGGGGGTTGTAAATGACTTAAATCTTTGTTTTTATGCTGGGTAAACAAATCCAATCCCTGGACCTTTATCTAAACTTCTATTTTCTAAGCTTGTGACAAAGCTTCAGACATTCAACATAATTATGATGACTAAAACACTTTTTAAGAAGGCTTGCTGGTCCTGCATTGCAGGTGATACGAAGCAATTTTAGGGTGTACTCTACATGAATTGGCTGTAACTATCTGCCTTTTTCAAACTGCTATCTCCTCTGCTGGTCCTTACTAAATTGGGTATGATTTGTCTAAATCAAGTCATAGGATGATATAATCTTTTCTGCTGCCTTAATCAATGCCTTTTGATTCAAACTTGTTAGGAGCTTAAAGTATCATGTATTAGATATATGGTCTGGCAGAAAAAACCTTCATTTAAAATGTAGTGAATTGAATTATAATATTTCATTTGGAGGCACCCAACTAAAATTCAATCCAGAGTGGTAATACAGAATACTGAATGTTCTAGACATTTTTCATTTATGTGTAATTCTCCCTTGAAACTTTGTAAAGATGTTATATTAATCCTGCATTGCGGTACTATAGCACAAAGTGACTGACTTCTGGTTTGTTTTTGATTTTTCTTAATGAAAAGAACAGTATTCTGTATAGAGATTTAATTATAACAATTGTTCAACAGTGGCTGTAGCAAGTACTGATTCTCCATTTT\n>XM_019789640.1 PREDICTED: Branchiostoma belcheri mucin-5AC-like (LOC109485937), mRNA 
\nAGGTGTGTACATGTGAAGTCTATTGATCCCCAACCGCCGTCCTGTGAGACACTTGCCTTCACCATGGAGCCGGGGAAACACATCTGCGCCGCGGTAGTCCTGTTGGGGTACGTTATTTCAATAATATCGACTTCAACAAGCCCGATATATCATGTAAGCTACCAACGTCTTGCCGATGCAACACAAGTGCCACCAACGTCTCAGCAGGAACATACCATTTCGACTGACAAAGAAGCCCCCACAGACAATGTGCAGACCACGGTAGAACAGGATACAGCAACTTCATCCGGTGGGAATGGAGTGACAGCCTTGGGAACAGCAATATCTACAATAACAAGGTTGGTAACAACGTCATTAGTTGACTCTAGTACTGAGTCTGACACTGTTCAGAACACAAACACGACAGCAACAGACGCGTTTACAATTGTGGATGCCCAAAGTACTGCAAACAGTGCCACGGGCGTTGTAACGGCAGCTGTTACAACTGAAAAGTCTTTCGTTACTACCGATACTGTTACAACAACTGATACAGTAACCCCGGTCATTACTACTGATGTTGGCATAAATGACGCAACTGGGTCCACCACCACTGACACCTTCATCACTCCAGTTACAACTGATCCTGTCATTACAACGAAAGCTGGTACAGCATCTGTAAAAACCGAGTCTGGCCTTTCCACACATGCTATCACGCCGTCTATCACAACGGAACCTGTTCAAACAACATATGTTTCTACACCTGCAACAACAGAGAATGTCATTACCGACAATGGCATAACAACACCCGTTACCACAGATTCTGCCCTTACCACTGATGCAATTGCAACATCTAGTAGAACAGAAGATGTCATTACAACTGATGCTGGTACAACGTACGTCAATACACAACCTGCGATAACCACGTATGTTGTAGCAACAGCAGCCACTTCACAGCCAACCGTCATCACTAATGCAGCCACAGCACCTGTTACACCACAACCTGGCCTTATAATAATTACCACTAACGCGGTTACAGCATCAGTTATAACACAGTATGACCTTCCCAGTGGCGCGGTTACAACGCCGGTTACAACACATCCTGGCATTACCACTGGTGCTAACACAATATCGATTACAACAGATCCTATTTCTACCACCAACGCGAATACAACATCACTTACACCACAGCCTACCCCCACCACCATCGCTGATACAACATCTGTCACAACAGATCCTATTTCTACCACGAACGCCGTTACAACATCAGTAACAATAGAACCTATCTCTATCACTAACGTCGATACAACATCTGTTACAGCAGAAACTATTTCTACCACCAACGCTGATACAACACCAGTCACAACAAATCCTATTTCCACCACCAACGCTGTTACATCAGTTACAACAGAACCTATTCCCACTACCAACGCTGAAACAACATCAGTCACAACACAACTCATTCCCACGACGAACGCCGAAACAACATCAGTTAAAACAGATCCTATTCTCACCACCAACGCCAATACAACGGTATTTACAACACAACCTATCCCAACCACCATTGGCTTTACAACATCAGATGTCACATATCCTATTTCTACTACCAACGCTGTCACATCAGTGACACACTGCCTACCCCCACCATCAACTCTGATACAACATCGGTCACAGCAGATTCAATCTCTACCACCAACACTGGTACAACATCAGTCACAACAGATCCCATTTCTACAACCAACGCTGTTACATCAGTCACAACACAGCCTACCCCCGCCACCAACGCTGTAACAACATCTGTCACAA\n>XM_034695841.1 PREDICTED: Notolabrus celidotus SPO11 initiator of meiotic double stranded breaks (spo11), transcript variant X5, mRNA 
\nGAAGTAAACAACGGCCAAGCTGATAGCGAACCTGCTTCTTTTGCATCACTTAAGAAGTAGTTTGTATGGAATTCAACAACATTCACAGCACCTAAAAACTGAGATCCCTGTCAAACGCGAAGAAAAAAGGAAAGCGGATACGAGCGCTGTGCATTATGGGAAACAGTACGCGAGGTAGACTGGTCCTATGAAAACTTCCCAGATCAGTACGACATCGAGCTGTATTCTGAAATTGACAAGCTCCGTGCTCAGCTGCTGCACAATGTCGAATTAATGTCGGACCGCCAGTGGATGATAGAAGAAATCAGCGACAGAGAAATTCTGACCCGCATCGAAAATGTAATCCTTGGAATAGTGACAAGTCTGTCCAAAGATGAGGCCCCTGTCCTGGCACTGCCCAACAGATCCAGCTGGGCCAACATCAGTTTTGACAGTGCTGTTGGGCTTCAAATGAGTTCAGGAAGTTCTGTCACAACCATAAGGAGCGACTGTAGCTCATCCATCACGAAATTTGCTCAAATTCTCAAGATCCTGGCGGCCATCTACAGACTGGTGCAGAGCAACTCTTATTCTACCAAGAGAGACATCTACTACAACAACCCACAGCTGTTTGTTTCACAAAGGACTGTTGATAGTATAGTAGATGACATCTCCTGTATGCTAAAGGTTCCTCGCAGATCTCTACATGTGTTGGCCTCGTCCAAAGGATTGATCTCAGGTGATCTGTCTTATCTTGAAGAGGACGGCACAAGAGTTGACTGCCGCTCAAGCTCTGCTGCTGTTGCTGTATCGTCAAACATTGGTGGGATTAAGAATATTGTATCATCTGCAAAGTTTGTCATGATAGTGGAGAAGGATGCGACGTTTCAGCGACTGCTCGACAACGACTTCTGCACAAAGCTCGCTCCCTGCATCATCATCACAGGAAAAGGCATGCCAGATGTGAACAGCAGGTTGATGGTGAGAAAGCTTTGGGACACGCTACACATCCCCATCTTCGCTCTGGTGGACGCCGACCCTCACGGGATGGAGATCATGTGTGTCTACAAGTATGGATCAGTGGCCATGTCGTTTGAGGCCCACAGCCTGACCGTCCCCAGCGTTATGTGGCTGGGCCTCCTCCCCTCTGACCTCCAGAGGTTGCGGGTTCCTGAGGATGCCCTGATCCCTCTTACAAAGAGAGACCAAAGCAAACTCAACAGCCTCCTGGAGAGACCGTACTTAAGCAGCCAGTCAGACTGGCAGAAAGAGATGGAGCTGATGCAGCAGAGTAAAGTCAAGGCTGAAATACAGTCCCTGGATGCTATTGCACCTGATTTCCTGACCAGCATCTACCTGCCCAATAAGCTGCGTTATGGTGGCTGGGTATGAGTGCAATGCTGCCACCTAGTGGGGATCTAAGACTACTGAGATCCCTCACCCTTTTATTAAAACCCTGTGAATATGGTGAAAACTCGCACCATGTTTTTTGTGTTTATGTTCCCAAGATGTTTGGACATGCTGTTGAAGTCTCATCAAACACACTATGTTAGTTTAAGTAAAGTCCAGCCTGTTTTACAACCACTCAACACCCCTAAGTATGCTCATTAAAAGACTTCAAGTCAACAGA\n>XR_007695918.1 PREDICTED: Diabrotica virgifera virgifera uncharacterized LOC126878978 (LOC126878978), ncRNA 
\nTCGGAAAGGAGGTGTTCTCTTCACCAGTTGGTGGTTTTAAAGGCCGTAGCATACCTAGAAGGGCGGTGAATGTGGTTGGACCAAACCCTTTTTCAATTATTTGGACCAAAAGAGACCAATTATAGAAAAAACTCGAGATAATCTGAATTGCGGCATTATTTTGAGTTAGTGTTTTCTATTACGTTTCGCCATGGTTTGACCATGTGATCGTGGTACCTTTTTGTAACATCGGCTATTTATTTTAGGGTTTTTATTTTGGGGGAAAACAGATTTCCTGTATACTTTTATCTTTGATGGGAGATGTTTGCATTTTGATTAAACATATTGCATATTTTGCTGTAGTACTGTACTGGAGTTTTGGTGAATGGTAGTTTCCTGGATTCGCTTGCACGTGGTTTCATTGAGGTTCTGGGGGAACCATGCGGCGTAGCTGAACCTTTTCAGTGGAACGGGTGGATTGGTAACCTATTCAGTTATTTCTATAGGATTTATAGGAGTCCCGTGGGGACGTGATGACCTTAGTTGGGGACAATTGGAGAAGTGTAAATAACTATTTTTATTTATATTGTTTATTGACCTGGGAGGTGCTGCTTGTAAAGAGAAATGGCGAAATTTGCGTGTTGTGTTTATGAGACACTTGAAACCTTTGCCAAGTGGTTCTAAAAAAAAAGACCGTACTATTTACTTGATTATATCCAATTTTTGTCGCCATATGTAAAACCAATTAATCTGCCCGAAGTAGGGGACCTCCCGTCCACTTCAACAGAGGATACCGAAATACATGCTACCATTGATGTGTCAAACGATGTTCCAGAAGATTTGGCTACAGAGTCCGAGCAATCTAAAAAGCCTACCTCTCCCAGTATACATAATAGTACAATAATTCAACATTCTTCCAACTCAAAGCAAATGAAGTTTTCATTTCACGAGACAGATAAGTTTTTCCTCAATTATTTAAAAGAAAAAGCTACTAAATCTTCTACGGAGACTTCCACGGACTCTGTTATGTCATTTTTAAACACTCTTGCACCCGAATTAAGAGAAATGAATATGCACTAGGTCAAAATATTCAAAAGACGTGCACTAAGCCTAGTTGATGATATATTGAATCCATCTTCTACTGCGCCTGAAAGTCAAACAATGAGTGCATTAACTAAATTAAGTAGTGAAACGTCCCGGGACACAATATATTCTCCGCAGCCGTATGGTAGTCCTTCATTTGTGCAGCCACTGCAGTAAGTACCAACAACTAATCCTCTGGACTTCAGCGGGGTACGAACACAAAACTTTATGCAGGCAGTATCAACAACTAATCCTTTGGACTTAAGCGGAGTATCGACAGAAATCTCATTAAATTGTACAGAATACCCTTCTGTCAGCCAGAACATGTCGTTATAACTCATTTTATGTTTAAATATAAGTAATAATAATTAGATACCTACTGATAAAAATTAGATTTCGTCATTTCAATATTATTTTAATCATTGATTTAAATAAATATTTTAAAATACTTA\n>AB291824.1 Bradyrhizobium sp. 
Pd-E-(r)-e-D-6(2) gene for 16S rRNA, partial sequence \nTTTATCGCCGAAAAGATCGGCCCCGCGTTCTGATTAGCTAGTTGGTGAGGTAATGGCTCACCAAGGCGACGATCAGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGAGTGATGAAGGCCCTAGGGTTGTAAAGCTCTTTTGTGCGGGAAGATAATGACGGTACCGCAAGAATAAGCCCCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGGGCTAGCGTTGCTCGGAATCACTGGGCGTAAAGGGTGCGTAGGCGGGTCTTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGAAGATCTTGAGTTCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGATACTGACGCTGAGGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAATGCCAGCCGTTGG\n>XM_037164408.2 PREDICTED: Artibeus jamaicensis staufen double-stranded RNA binding protein 1 (LOC119063191), transcript variant X6, mRNA \nGTTTCTTCCTTCTTTCCTTCTTCCTTCCTTCCTTCTCGCCGCCGCCGCCCAGGACCGCCGGTCAGGAGACGAGCTCCGGGCAGCAGCCAGGAGTTTTCTAACCACATAACCACTCAGATCTGAACCAAAACAACATTGTTCCCGGAGCACCTCTTTTTAAGGTAGAACTTTAGACTTCATAGCACTGAATTAACCTGCACTGAAAGCTGTTTACCTGCAGTTATTCACTTTTGTTGAAAGTGACCATGTCTCAAGTTCAAGTGCAAGTTCAGAACCCATCTGCTGCTCTCTCAGGGAGCCAAATACTGAACAAGAACCAGTCTCTTCTCTCACAGCCTTTGATGAGTATTCCTTCTACTACTAGCTCTCTACCCTCTGAAAATGCAGGTAGACCTATTCAAAACTCTGCTTTACCCTCTGCATCTATTACATCCACCAGTGCAGCTGCAGTTCCTTCTAGCATGGCACACCCCAAAGAGAAAACCCCAATGTGTCTTGTGAATGAGTTAGCCCGTTTCAACAAGATTCAGCCTGAGTATAAGCTTTTGCGTGAGCAAGGTCCGGCTCACTGTAAGGTGTTTACAGTACAGCTAACACTTGGAGATCAGCACTGGGAAGCTGAAGGAAGTAGTATTAAAAAAGCCCAACACACAGCTGCTGCCAAAGCTTTGGAAGGAACAAAATTTCCTAGACCCATAGTCCGCCCTTTTCGTAGCGAAGGAAGGAATCCAGAAAGCATAACCCCTACTGTAGAGCTAAATGCACTGTGCATGAAACTTGGAAAAAAACCAATGTACAAACCCGTTGACCCTTACTCTCGGATGCAGTCCACCTATAACTACAATATGAGAGGAGGTGCTTATCCCCCAAGGTACTTTTACCCATTTCCAGTACCACCCTTACTTTATCAAGTTGAACTTTCTGTGGGAGGACAGCAATTTAACGGGAAAGGAAAAACGAGACAGGCTGCGAAACACGATGCTGCTGCGAAAGCTTTGAGGATCCTGCAGAACGAGCCCCCGCCCGAGAGGCTGGAGGTGAACGGAAGAGAATCAGAAGAAGAAAATCTCAATAAATCTGAAATAAGTCAAGTGTTCGAGATTGCACTTAGACGGAACTTGCCTGTGAATTTTGAGGTCGCCCGGGAAAGTGGCCCACCTCACATGAAGAGCTTTGTGACCAAGGTGTCGGTTGGGGAGTT
TGTGGGGGAAGGTGAAGGGAAGAGCAAGAAGATTTCAAAGAAAAATGCTGCTATAGCTGTTCTTGAGGAGCTGAAGAAGTTACCACCCCTGCCTGCAGTCGAGCGGGTGAAGCCCCGAATCAAAAAGAAAACAAAGCCCATAGTCAGGGTACAGAGTGGCCCAGAGCATGGCCAGGCGATGAACCCCATCAGCAGACTCGCCCAGATCCAGCAGGCGAAGAAGGACAAGGAGCCGGAGTACATGCTCCTCACAGAGCGAGGCCTCCCACGTCGCAGAGAGTTTGTGATGCAGGTGAAAGTGGGAAAGCACACTGCAGAGGGAACGGGCACCAACAAGAAGGTAGCCAAGCGCAATGCGGCCGAGAACATGCTGGAGATTCTTGGTTTCAAAGTCCCACAAGCTCAGCCCACCAAACCAGCCCTCAAGTCAGAGGATAAGACACCCATAAAGAAACCAGGGGATGGAAGAAAAGTAACCTTTTTTGAACCTGGCTCTGGGGATGAAAATGGGACTAGCAATAAGGAGGATGAATTTAGGATGCCTTATCTTAGTCATCAGCAACTGCCTGCTGGAATTCTTCCCATGGTGCCCGAGGTTGCCCAAGCCGTAGGAGTCAGTCAAGGACATCACACCAAAGATTTTACCAGGGCAGCTCCGAATCCCGCGAAGGCCACGGTAACTGCCATGATAGCCCGTGAATTGTTGTATGGGGGCACGTCGCCCACAGCCGAGACCATTTTAAAGAATAACATCTCTTCAGGCCACGCACCCCATGGACCTCTCACGAGACCCTCTGAGCAGTTGGACTATCTTTCCAGAGTCCAGGGATTCCAGGTCGAATACAAAGACTTCCCCAAAAACAACAAGAACGAATTTGTATCTCTTATCAATTGCTCCTCTCAGCCACCTCTGATCAGCCACGGTATTGGAAAGGATTTGGAGTCCTGCCATGACATGGCTGCACTGAACATTTTAAAGTTGCTGTCTGAGCTGGACCAACAAAGCACAGAGATGCCAAGACCAGGAAATGGACCAATGTCTGTGTGTGGGAGGTGCTGAACCTCTTCTGGTCATGAACCGTTATATAAACTTCCCAACAGATACTGAAAATCCTGAGACTGCTTTTGAAAATTTGGAATTTCTGATACCTCGAGTGGGCCGAGAGACGCGATGGGTAAAGAACTGGAGACAGCAGTGGTGACAGAGGCTGAGGCTGCTCGCATGTGCTGTGGTTTGTCCCCACACGGCAGCAGCTGCTGTGGGGGAGGTTGGGACCTGCCAAGCAGCCCTTAATTGCAAAACCAGCAGGTCCCTGCCCCTGGCACTTCAGTGCTTGGGTTTTTTTTTTTTTTTTTTTTTTT\n>XM_035643150.2 PREDICTED: Scophthalmus maximus uncharacterized LOC118315681 (LOC118315681), transcript variant X2, mRNA 
\nGCTCCGGGTCCACGTTCAGTTCATCTGGTTTCCTTGTTGCACCCAGCCAGAGGACAGGACTTTAGAAACCTCACACTTTACTTTCAAAGAAGACAATTTGTTGCCTCTGCAGAACTAGAGCCGACTTAAAACATGGTTGATAGAAGGATTGCACTGGAGGCGTTGGGTGTGCTCTGCAATGCCAATGTGACGTCTGTTCAGCAACAGAGATCACAACCTGGTGTGTGCATCCTTCAAGGACGACAGGAGCAGCTGTTCATCAAGCAGCTCATCCCCTCTGTCTTGGATGCAGATGAAACCTGCCAGGTGTCCAGATCCAGCTTCTACCGCATCCAAGCCATCTTGGAGAGCAGTGAACCGGCAGATGGCTTCCCCAGGCTGGCCGTGGTGGCTGTTCCAAAGAAGGACCACATCATCGATGAGGAAGAATTCTTTGCGCCGCAGTTTGACTATGATTTCACCAAGCTGACCGACAGCGAGACTTATTGGAGGGGCGGAGAGAAGTACGAGCGCCCGTGTGGTTGGTACCGCTTTGGCCTCAAGGTCCTGGACAAGTACTGTGGAAACACCTGGCTGGGAACCACATACCGGAGCACCCAGTCCTGTCCAGGGGAGTGGCCCGTGTCCTACCACGGGACATCAAAGAAAGGTGCTGAGGGCATCATCGGAGACCACTACAAGCCAGGCTGTTTTAAAGGAATTTGGTATCAACGTCTCTGCCACACCAAGGGGACACAGAAGGCTGAACAGTATATCACAACTGTGCCCGTATCATTTTCTATTTCGCAAAACTGGGCTTGTATTTGCAATGCAGAGTTGGAGAAAAGAGTCCCAGGAGAGGTTTGGCTGCCGTGATTATTTGAAATCAGATTTTGAGACGACTTCTAGTAAAGAATGTGTGTCTGGGCCGACCGATGAAGTTTTTCCACTTTCATTGGAACTCACTAGCCACAACAGGGAGTCGTGACCTTGAGGTTATATAGAATAAATAAGTGAAACTGCCTAA\n>XM_038305068.1 Cyprinodon tularosa uncharacterized protein LOC119796484 transcript variant X1 (LOC119796484), mRNA 
\nTTCAATCCTCCAGCTGCACTTGATCAAGCAGTTTGACTAGAAGAGAATCAAGCAGAGCTCTGACAGCACAGAGACCATCATGAGACAGAAACCTCTAGAGATGGAGTTTAAAGACTCCCATGTTCCAGTTCTCAGTGTGTCTCACTGCTCCTCTCTTTCCCTCTCTGTCTCCTCAGCAGCAACATTTGTAGTGAATGTGACACAGAGCTCCTATCAGGCAGAGGAGAACCACAACATCACTCTGGAGTGGACCTTCACCACAAGACCCAACAGAACCTGGATCATCTACTGTTGCGTGTTGACTCTTCCCAGAGAAATAGTCCTCTATTCAGTCTATGAAGATGTTGAAGAGACAGAGTTTACAGATGAACACTTTAAAGGACGAGTCCAGATGGACAAAGACGTCCTCAGAGAAGGACGGATCAGATTCCATCTGTCCAGACTGAGGACTGAAGACTCTGGACTGTATGTGTGTAACATCAGGACTGACTATGGGGAAGGTTCTGCAGACTGCAACGTTACAATCACTGAGACGGTTCCTGAGAGAAACCTCATCACTCCGACTCTACAGGATAAAACCATCAGTAACGGAGGTCGGTCCAGGCTCTTCCTTTTATTTCCTTTTATTTTCTTCATCATTTCTCCGTGTTTGGTTTTACTCTTCATTTCTAAAAATAAGAACTCTAGGAAGAGTCCTTCTAGGTCAACCATCTACATTACAGAATGGAAACCTTGCATAAGGGCAAACTTGTGTTAATGTAGCTGAGATCAGAGCAAAGTCTTCTCTCCTTCATCTTTCTGAGGTCTCCAACTGTTCAATAAATTGCAGGAGACCCTGGAGATAGAAGGAGTCTTAATGATACCTTAGAAGCTGTTGATGAAACCAGGAGTCTTTTCAATGTTTAAAGTCAGTCTCTGCAGGAACCCAACAAACTTCACATCAAAACACAATCAGATGCTGTGGATTTATCTCCAGGAAGAGGAAAATCAGACATTTCGGAAATTGTGCATTGTTTTCTCACAGCAGTGATTTTTTTTTTCTCCCTCAATGCATTTTATCAAAGTACAGATAAAAAAAATGCTAACCCTCGGTTGGGGGGAATCTTCAAATTTCATGTATATATGTTATTTATTATTATTATTTTTTTATTATTGTTTTTTACTCTGTTGTAATTAAAGAAAGGCTACATATGTAAAGTGTTTCATAAATATTGATTTTTGTAATTATTCATTATTAAATAATAGTTATCATTATTACCTCCAACTACATGGCTAAGAACCTCATCTTTTCCTTTTCTACAACTCTCAACTGCCTGTAGGACACATT\n>HQ018492.1 Uncultured Candidatus Microthrix sp. 
clone R4CP1R1E11 16S ribosomal RNA gene, partial sequence \nTCGCGTAACACGTAGGCAACCTGCCTCGAAGTGGGGGACAACAGCCCGAAAGGGTTGCTAATACCGCATGTGGATGTTTGGTGGCATCACCGATCATCTAAAGCCTTGTGCGCTTCGAGATGGGCTTGCGGCCTATCAGGTAGTTGGTGGGGTAATGGCCTACCAAGCCGACGACGGGTAGCTGGTCTGAGAGGACGATCAGCCGGATTGGGACTGAGATACGGCCCAGACTCCTACGGGGGGCAGCAATTAGGAATCTTGCGCAATGGGGGAAACCCTGACGCAGCGACAGCCGCGTGCGGGATGACG\n>XM_013285616.1 PREDICTED: Papilio polytes antichymotrypsin-2-like (LOC106105325), mRNA \nATGTTTAAATCAGCTAAACCAAGGTACGATACTGCCGTTGAATCATTATGGCAAGGAAATACGGAGTTCACACTAAACTTTTTAAATTTAAAACTAAATGAAAGTCCTTATAACAGTTTTATAGTATCTCCGTTTTCTGTTCTAATACCCCTGGCAGAACTTGCACTGTACGCCAATGGAACAACACACGATCAACTAACAAATATCCTTCATGTCGACAATAGAATAGAGGTTGGGGGTGGTTTCCGTGAAATTTTGAAGTCTTTTTCATCTTCTGATGATGTACAGATTTCATTAGCTCAAAGAATCTACTCCAATGTAAATACAGAATTATCTGAAGACTTTAAAAATGACACTAAGGATTATTTTAATGCCGAAGCTCAAAATGTAGACTTTGAAAAGAATCAAGAAGTAGCGAAAATGATCAACGAGTGGGTGCAAGAACAAACCCATGGTCTCATTTCACGAATTGTTGAACCCAATATGTTGGACCAATCAACAAATATGGTTTTAGTTAATGCCATTTATTTCAAGGGTGATTGGGACTATGCTTTCAATCCAAATGACACAAAACATAAAGACTTTTACTTATCGATAGGCGAGCAGGTTGAAGTAAAAATGATGTATCAAAAGAATACGTTTAAATACATGGAAAATCCAGCTCTTCAAATAAAGGCATTGCAACTACCATACACGAAGCAGCATTATAGCCTTTTAGTTATACTACCCACGTCACGAGTTGATTATGGTTTGCAAAAAGTGGCTAAGAGGATTAGAAATCCCCAAGTGTTTACAGAAATTATCGATGATTTGAGAAACGCAGAAGTTGAAGTATCATTACCGTCTATAGAAACTTCCAGTACAACAGATTTACAGGGAATCCTAAAAGGCGTAAATGTCACTGAAATGTTCGTGTCTGGCAATTCGGATCTTAATGGGTTACTGAAAAATAATCAATCAATACATATCTCTGTTGCTGTTCAAAAAGCCGTTGTGGTTATCAATGAGTTGGGTACAAAAGCAGCTGCATCAAATAATATAGAATTTTTACCATCGGCGCCACTGGTCAAACCGCCCCCAATAACTTTCAACGCTAACCGGCCTTTCCTTTATTTCATTCTATATAAGAAGAACGTTTTGTTCTGTGGATCATACTATGGAGAATACTTAAAAACCAGAGAAAATCCTGGACAAGGTTTCATAGCATCGCCATTCTCTGTGTTGCTGCCTTTAGCGGAACTTACGCTATATGCCACTAGAATAGCGTACGAACAACTTTCTAATGTTTTGAATATTGATGAAAGAGATGAGGTTCGACTGGGATTCAGAAAACTTTTGGATAACTTTGCGTTGCCACAAAAAGTATCAATTACTTTTGCTCAAAAAGTATACGGCAGTCTCGATTTCGATTTCATTGACGACTTTAAATATGATACCAAAGAATATTTTGATGCAGAAGCACAAAATTTAGATTTCAGTCAAAACCAACAAGCTGCAGAAATAATCAACGATTGGGCTAAATGGAAAGATCCATTTGAC
CCAGATGATACTAAACCAGAAGACTTTTATATAACAAAAGATGAAAAAATAACCGTTAACATGATGTTTCAAGAAGGATATTTCTTATACGCTGAAAACCCTGAACTACAAATACAGGCATTGGAACTAAAGTATGAAGACGAAGATTATAGTCTCTTGATTATTTTGCCAACGTCTGAAGATGATTACAGCGTAGAAGGTGTAGTACAAAAAATTCAAGAACCACATGTTTTTGAAGGAATAATTAACGATTTATCAATTGATGAAGTTGAAGTACATTTACCTTCAATATTAACTACTACAACAACAGATCTAAAACCAATTCTAGAAGGAGTTAATGTTACTGAAATATTTAACCCAGATACAACTGACATAAGTGGGATGCTAGAATACATTCAGCCAATGCACGTTTCCGTAGCTATCCAAAAAGCAGTCTGTAATAACCAGCCTGAGAATGGCAATTATAAAGTCAGCAATTTTTAA\n>FQ672044.1 16S rRNA amplicon fragment from a soil sample (ferralsol, Madagascar) resulting from a 16 days laboratory incubation experiment \nTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGGGTGATGAAGGCCCTAGGGTTGTAAAGCCCTTTCGGCGGGGAAGATAATGACGGTACCCGCAGAAGAAGCCCCGGCTAATTTCGTGCCAGCAGCCGCGGTAATACGAAGGGGGCTAGCGTTGCTCGGAATCACTGGGCGTAAAGCGCACGTAGGCGGATTGTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGGCGATCTTGAGTCCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAAGAACACCAGTG\n>XM_030518924.1 PREDICTED: Scaptodrosophila lebanonensis dynein beta chain, ciliary (LOC115624302), transcript variant X1, mRNA 
\nATGGAGCCATCCACGAGCGCCGAAGCAGCTGCAGCCGCTGCCGGCGGTGGGCCGGATCCACGTTTGGAGCTGATGGGTTCCTTTGTCATCAAGTCCCTCAAACTGAAGCCGGAGAAATGGACGCGTGTCATCACCGTGGAGGAGCACAAGGGCATTATTAAGGAGTTCTTGGATCGAAATACACCGGTAGTGCTCATCATTATATTGACAACCGCTGCCCAATTGGTGCCCTCCACCACCTTTCCGCTGTCGCAGCTCAAGAGCAAGGGGGTGTACTTCATAAAGAAGTACGCCAAGCCGATACCACGCGAGCTCTGTGAGAATTTCATTATTTTCGGCGACTTGGCAACGCGCACCATCGACCAACTGTCCGCCCTGGTGGAGGAGGTGGTTGTGCCTCTGCTCTCCAACGAGGACAATTACAGGGCCTGGCCCACTATGGTGGCGCAGGATGTGCAGAAGCATGTGCATAGCCTAAAGAGTACGGTGCACCAGGTGAAGGGTCAGGTGAGCGGTGAAACTATTCTGGCCATGCCTGTGGGCGTCGAGAAAATTGTCAAGGCCGCCAAGGAGTTGGTCGAAACCGAACAATGCCAGTTCGATCTGTATCTGAAGAGCGCCATCGAGGGTGTGGTCATCAAGTGGGCGACACAGATCCATGAGGTCATCAAGGAGAGTCCGTCGAATGCCTTCGCCAATGGCCAGAATCCCACGCCCCACACAGAATTTACATTTTGGAATAATCGCCTTAAGAACCTATCTTTTATCTACGACCAATTGCGCAACGAACGTATCCGTGCCATGGCAATAATACTTGAATACTCGCTAAGTGCCTACCATCCGTGCTTTCAAACGCTCTTCAAGAACGTCGTTACGGCACTCGCCGAAGCAAAGGACATAACACTCTATTTAAATCCATTGAAACGTCCATTGCAACAGCTGGAGGAAATAGATTTTGCGGAAAGCAAGCCACTGCTCATCCCCTTCATGAATATCGTCTGTATTCTGTGGGGAAACTCGCGCTATTATTGTCAGTCATCGAAAATAACGATTCTGTTGCAAGAGATATGCAATCTGATTATCCATCAGGCCAAACGCTATTTGGATCCCTCGTCAATTTTTCACAGCGACATCGATGAGGCCATGCAACGCCTCACTCTCTCCATACAGATACTGAAGTTCTTTCGGGAGCTTTTCGATTATTATAAGGAACGTTTGGCCGATTTCTTTACAGAGCCCGAGGAGCGGCCACCGATTTTCTGGACTTTTCATCCAAATTCAGTTTTCAAGCGCTTTAATGCATTCCTAGAGCGTTTAACAACCATACAATGGTTCTTCTTTACTGTGATTGAATTCCTGAAATTAGAGAAAGTCGAAATCGGTGGCTTGCGTGGTCGTCAGCTCAGCACACGCATTACAGATGTCTATGTCGAGTTCAATCAATATTTTACAGCCTTTGCGTCCAAAAGCTACGATGTGCTGGACCCAGACGATCATGACTTTGACGATGACTTTAAGGGCTTTCAAACCCGTATACTTGAACTAGATATGAAGTTGGCCGCCATATTGTGCCAGGCCTTTGATGATTGCCACAATTTGGAGAGCATTTTTAAGCTCATTAGCATTGTGGGTAGCGTTTTAGATAGACCCAAAATTAGAGAAGAATTCACACAACGCTATGCCGAAATTCTTGAGATGCTGAACGATGAGATGACGATGTGTGAGGCCATCTACGAGAAGCAAATGGAACTGAGAAAGATTGGCGAGAATCTCTATCCGGACTATAACTGTCCACCTGTGGCTGCCTTCATACGTTGGTGCAATCAGCTGGAGACTCGTATTACAGGGCCTGTGAAGAACTTCAAGGCGCTTCAGCATGAAATATCAAAGTGTGAGAAGGCTCTAGAGATAATGGAACGCTACGATCGCTTGATCGAAAAGTTGGGTGCCTGTAAGACACAGTGTTTTGAGGAATGGAGCTCCCAGCTAGCCGAACAA
ATCGAGGAGAATCTAAAGAAGTCGCTTATTGCGCGCGGTCCCCAAGGCAACTCGTTAATTTTAAACTTTAGCGCTGCCCTATTCTCAATACTGCGTGAGGTTCATTATATGCAGCAAATGAAAATCGAAGGCATACCCGATATAGCTATAGAGTTCGCTGAGAAGAGCGATGTCTTTCGTGGATATACGTTGAATTTGGAGAAGACTATCGATTGGTATAACAGCATACAGGAGGCTAGCTCGCCGGTTGAGTTGCAATTGATTGGACCCGAAATAAAAATGATTGATGACCTTGTGGAGATCGGTGTGGATAACTTAGTCTGGAATTCAGAAGACATCTTGACGTATTTGGAAAAGTTACGTAAGCCCGTTGCTGCTCTCCAATATCGCATGGATCATACGCAGGGAAATTTGCGGCAAATACGCAAAATTATGAGTGTGTGGGCCAAGCAGCCGTTGTTTGAGCGTCGGGACTGCAAAAAGGATTCGGTGTTGTCTATTGACGAGCGACCTGATCGCACCTCCAAGCGTTATGCTGAGATACAAGCGGCCTCCGTTGAGATACACAAACTACTGCACGACAATATGCTGCAGTTCGACATGGAGGATAAACAGCAGGATGAGGTCTGGCTCAGCTATGTGAACTTTGTCGATAACATCGTCTACGAGAACCTGCTGCGCACTGTGGGCGTAAGTGTTGGGTATTTAGCCGAGAACATGGATCCGGAGAACAATTATGCACCACTTTTTGAGTCCCGTCTGGAGCTAGTCGAACCCGATCTTGTGTTTGTGCCCTCCCTTGAGCCGGAAGACCCGATGGGCTTTAACAACATGCTGATTGAATTAATGCGCGATATTATGAAAATGGGTTCGCTAATCAAGCGTCTGACTCACGAGAAGCGCAGCTATGCTGAGATTATTAAAGAGAACCAGGACATAATTGATATGCGACGTGAAATTCTGAACGGTGTGGACTTGGTAATGGAGGAGGCATCCCGTTTTTGTCGCCAGTTTGAACGCTACTCGTACCTATGGCTGGATGATCGCGAGGAATGCATGGAATACTTTTTGGAATATGGTCATATTTTGGATCCCGACGAAATCGAATTAGTTTTGATGAACGATCCGAATGCACCGAAGCCCTGTTTGCCAACCATTGAGGCATTCCGAGAGCAGATCGATAACTATGAGTCGCTATTCAATGAGATTGAGGATATATCGCCATTTCAAGTGTTTAGCTCGTGGTTTCAAGTGGATGTGCGACCCTTTCGTCAAGCGCTGCTCAATACAGTGTGCAAATGGGGAAATATGTTCAAGGAGCATTTGGTTACAACCGTCACAACCAATCTAATGGACTTAAGTCACTTCATACACAAGGCCGACGAGGGTTTGCTGCAAACAGTGAAGGAGGGCGACTACGAGGGCTTGGTTAATCTAATGGCCTATCTTATGCAGGTTAAGGAGCGGGCCATCAAGACAGATGATATGTTCGAGCCGATGCAGGAAACCATACAGCTGCTAAAATACTATGACATGGATATACCTGAGGAGGTGAATGTGTTGCTTCAAGAATTGCCCGAACAATGGGCCAACACCAAGAAGATTGCTTCAACGGTTAAGCAACAGGTATCGCCACTCCAAGCCACTGAGGTGGTCAGCATACGGAACAAGATAGCGTTATTTGAGGCCCACATACAGCTCTTCCGGGAGGTCTTCAAGAATTACGACTTCTTTCGCTTTGATTGTCATAAGCCATACCAACTTATGGATCGCATTAACGATGACATGTTTCTGTGCGAGAGCGAAATGCGCGACATACAAGAGTCGGGCAGTCTCTTCGAGGTCAATATACCAGAGTTCAAAGTGCTGAGGCAATGTCGCAAGGAATTACGCATGCTTAAGCAACTCTGGGATTATGTTAATATTGTGCAGACCAGCATCGAAGATTGGAAGACTACGCCATGGCGTAAAGTCGATGTGGAGAATATGGATATAGAGTG
CAAGAAGTTTGCCAAGGATATACGCTTGTTGGATAAGGAAATGCGTGCCTGGGACACTTTCATAAATCTCGAGTCGACGGTGAAAAATATGTTAACCTCATTGCGCGCTGTGGGAGAGCTACAGAATCCTGCCATACGTGAGAGACACTGGAATCAGCTGATGAACTCGACAAAGAGCCTTGCCGCCTTGCCCAAGGAAGTGACCGTGAAATTTATAATGGATCATGAGACAACGTTGGCAGAGCTTCTGGGCTTGAACCTGCACGAGTGCGAGGAGGAGGTGAAAAACATTGTTGATAAGGCTGTTAAGGAAATGTCTATGGAGAAAATATTGCGTGATTTAAACACAACATGGTCTGCGATGGAATTCGATCATGAACTCCATCCACGCACTGGCTGTAATCTCCTTAAAGCATCGGAAGAACTCATAGAGACGCTCGAAGATAATCAGGTTTGCCTACAAAATTTAATAACATCCAAGTACATCGCCCATTTTCTCGAAGAAGTTTCAACTTGGCAAAATAAATTAATGATCGCCGATCAAGTGATAACCGTTTGGTTCGAGGTGCAACGCACTTGGACCCATCTTGAGAGTATCTTCATGAGTTCGGAAGACATACGCAAACAGCTGCCCGTCGACTCGGATCGTTTCGATAATATCGACGCCGAATTTCGTATACTCATGGATGAGATGTGCGTCTCATCGAATGTTGTGGCCTCGACTAATCGATCTGGGCTAATCGAACGTTTGGAGCATTTGCAGAAGGAGCTTACACTTTGCGAAAAGGCACTGGCAGAGTACTTGGAAACGAAGCGTTTGGCTTTTCCTCGTTTCTACTTTGTATCATCGGCCGATCTTCTCGATGTCCTAAGCAATGGCATCCAACCGGAAATGGTGACCAAACATCTAACAAAATTATTCGATTCGATCGCACGCTTAAAATTCAATCGCGATACGGCCAATGAGATAGAGACAGCTTCGGGCATGTATGCCAAAGATGGCGAATACGTTGAGTTCAACGAGCTGGCCAGCATACGCGGGCCGGTTGAGGTGTGGCTGAATCGTATACAAGCGGCCATGCGAGCCACCCTGCGACACTATGTCACAGAAGCTGTGGTCGCTTATGAGGAAAAGCAACGCGAACAGTGGTTATTCGATTATCCTGCACAGGTGTCGCTCTGTGGATCACAAATCTGGTGGTCGACAGAGGTGAACATTGCCTTCAGCCGTTTAGAGGAAGGTTACGATAATGCCATCAAGGACTACTATAAGAAACAGATCTCACAACTCAGTTTACTCATAACACTGCTGCTGGGCGAGCTGACCAAGGGTGATCGTCAAAAAATAATGACGATTTGCACAATTGATGTGCACTCACGAGACGTGGTCGCTAAGATGATTCAGGCCAAATTGGATTCAGGTTCGGCTTTTATGTGGCAATCGCAGCTAAGGCATCGCTTCGACGATGTAGAGAAGGATTGCTTTGCCAATATTTGCGACGCTGAGTTCCAGTATTGTCACGAATACTTAGGCAATACGCCACGACTGGTCATCACGCCTCTGACAGATCGCTGCTACATTACACTAACACAGAGTCTACACTTAATTTTGGGCGGTGCGCCTGCAGGTCCAGCTGGAACAGGGAAAACAGAGACTACAAAGGATCTGGGACGTGCCATTGGAATAATGGTGTACGTGTTCAATTGCTCAGAGCAAATGGACTATCAGTCGTGTGGTAATATTTACAAGGGTCTAGCCCAGACAGGGGCCTGGGGCTGCTTCGATGAGTTCAACCGCATTACTGTCGAGGTGTTGTCTGTGGTGGCAGTGCAGGTGAAGTCTGTGCAGGATGCGATACGTGACAAAAAGGACAAGTTTAATTTTATGGGCGAGATTATAACCTGTGTGCCCACAGTTGGCATATTTATAACCATGAATCCCGGCTACGCGGGTCGCACAGAGCTGCCGGAGAATTTGAAGGCACTTTTTAGGCCGTGCG
CCATGGTGGTGCCAGACTTTGAGCTGATCTGCGAGATTATGTTGGTCGCCGAGGGCTTTCAAGATGCACGAATATTGGCGCGTAAGTTCATCACACTCTATACACTCTGCAAGGAGCTGCTTTCCAAACAGGATCACTATGATTGGGGATTGCGCGCAATTAAATCTGTATTGGTCGTTGCTGGATCGCTGAAGCGTGGTGATCCTGGCCGTCCTGAGGAGGAGGTCCTTATGCGTGCCTTGCGCGATTTCAATATACCAAAAATAGTTACCGATGATATGCCCGTGTTCATGGGGCTCATCAGCGATTTATTTCCCGCTTTGGATGTGCCGCGCAAACGTGATCAGGACTTTGAACGCACCGTAAAACAAGCTGCCTCCGATTTGCTACTACAACCCGAAGATAATTTTATATTGAAAGTGGTGCAACTGGAGGAACTGTTGGAGGTACGTCACTCTGTGTTCATCGTTGGCAATGCTGGCACTGGAAAGACACAAGTGTGGAAAACGCTGCTGCGCACCTATCAGAACATCAAGCGCAAGCCCATTTTCAATGACTTGAACCCGAAAGCCGTGACCAATGACGAACTTTTCGGCATTATAAACCCAGCTACGCGTGAATGGAAAGACGGCCTCTTCTCGGTACTGATGCGGGATCAGGCAAATATCGCGGGTGATCAACCAAAATGGATAGTCCTAGATGGTGATATTGATCCCATGTGGATCGAGAGCTTAAATACCGTCATGGATGATAATAAGGTCTTGACTTTGGCGAGCAATGAACGTATTGCTTTGACGCCTTCAATGCGCTTGCTTTTCGAAATCTCCAATCTGAGAACAGCAACACCGGCAACTGTATCCAGAGCCGGCATATTGTATATCAATCCGCAGGACTTGGGTTGGAATCCCTATGTAACCAGTTGGGTTGAGACGCGCAAAATTCCAGCCGAAAAGTCCAATTTGGTCATGTTATTCGATAAGTACATACCATCATCATTGGAGACGATACGCGTGCGTTTTAAAAAGATCACGCCTATCGCCGAAATGGCCCACATACAAATGTTGTGCCATCTATTGGACTGTTTTCTAATACCAGCGAACACACCGGCCGATTGTCCAAAGGAATGGCATGAGCTCTACTTCGTGTTTGCCTGCATTTGGGCCTTCGGATCGGCTATGTTCCAGGATCAAGCCATTGATTATCGTGTGGAGTTCAGCAAATGGTGGGTAAATGAGTTCAAAACAGTTAAGTTCCCAGCAGGTGGCACTGTTTTCGATTATTTTTTGGATAGCGAGACTAAGACATTTCTGCCCTGGATCGAGAAGACACCCAAATTCGAGCTGGACTCTGATCTGCCATTGCAAGCTGTACTCGTGCACACCTCCGAGTCCATTCGCTTGCGTTTCTTTTTGGACTTACTTATGGATAAGAAGCACCCGGTGATGCTAGTCGGCAATGCCGGTTGCGGCAAAAGTGTTTTGGTCAACGAGAAGCTTCAATCGCTTTCTGAGAATTTCGCTGTCACCACAATACCATTCAATTACTACACAACGTCCGAAATGTTGCAAAAGATATTGGAGAAGCCGCTGGAGAAGAAAGCGGGACGCAACTTTGGACCGCCCGGCAATAAAACCTTGATATACTTCATCGACGACATCAATATGTCGGAGGTAGACTGCTACGGCACCGTACAACCCCACACTCTAATGCGCCAGCATCTTGATTATGGCCATTGGTACGATAGGAACAAACTAACTCTCAAGGATATACACAATTGTCAGTATGTGGCGTGCATGAACCCAACTTCGGGCAGCTTTACCATCAATCCGCGACTCCAACGCCACTTCTGCGTATTAGCTGTCAGTTTTCCGGGACCCGATTCGATAACCGTCATGTACTCGGCCATCTTGTCTCAACATTTTGCGAATGCCGAGCAGAAATTCATTCCGATCGTAACACGCATGACGCCAAATATTGTGGCCGCAACCATAGCGTTGCAC
AACAAATGCCTCCAGATATTCCTGCCCACGGCCATAAAGTCACACTATATATTCAATTTGCGCGACATCAGCAATGTATTTCAAGGTTTACTCTTCAGTTCAACAGAATGCCTAACGGGCTCTACAGATCTTATACGTTTGTGGCAACATGAGACACAGCGTGTCTACGCCGATAAGCTAACCGATGATAAGGATATTGATAGCTTTACTAAAATGCAGCATGACATTGTTAAGAAATCGTTCGAGGAAATTGACGAATCCGTAATATTCGACAAACCGAATATCTATTGTCATTTCGCTGGAGGAATTGGTGATCCTAAGTACATGCCCATCAAGGGCTGGCCTGAGCTTCACAAACTCCTTCAGGAAGCAATGTCATCGTATAATGATCTGGTCGCTGCCATGAATCTGGTGTTATTCGAAGATGCGATGATGCATGTGTGCAGAATCAATCGCATATTAGAATCACCGCGTGGCAGCGCTTTATTGGTTGGTGTTGGTGGCAGTGGTAAACAATCTCTAGCGCGCTTGGCAGCATTCATATCCAGCTTGGAGGTCGTGCAGATACAGCTTAAGAAGGGCTATGGTGTCAACGACTTGAAGATTGAGTTTTCCGGTTTGTATCTGAAAGCGGGACTTAAAAACGTCAGCATCATGTTCCTAATGACGGATGCGCAAATTCCCAGTGAGGATTTTCTTGTCTTAATCAACGATATGTTAGCCACTGGCGAGATTCCAGATCTATTTCCGGACGACGAAATCGAGAACATAATCGCTGGCGTGCGTAATGAGGTCAAAGGTGCGGGGCTGGTTGATACGCGAGAAAACTGCTGGAAATTCTTCATCGATCGTGTACGCAAGCAACTGAAGATAGTTCTGTGTTTTTCACCAGTGGGCTCAACATTGCGTGTTCGGTCGAGAAAATTCCCTGCCATCATCAATGCAACGTCCATCAATTGGTTCCACGAATGGCCTCAAGAGGCACTCATATCGGTTGCCATGAACTTTTTGGCACAGAACAAAGTACTGCCTGACAATCATCGGGACTCTGTTGCTAAATTCATGGCATATGTCCACACAGCTGTAAATTCCACATCCAAAGTTTATTTGCAGAACGAGCGCCGTTACAACTACACAACTCCCAAGAGCTATCTCGAGCAAATAAATCTCTATTTAAAGCTACTGAATCACAAAAACCAGGATTTGCAGAGCAAAATCGAGCGTCTGGAAAATGGATTGGAGAAGCTTCGTTCCACGGCCGTCCAGGTGGCCGATTTAAAAGTTAAGCTAGCCGTTCAGGAGGTCGAGCTTAAAGAGAAGAACGAGGCGGCCGATGCTTTAATTGAAATTGTGGGTATTGAAACGGAGAAAGTGCAGACGGAGAAAGCGGTGGCGGATGAGGAGGAAATGAAGGTTGCTTTGATAGCGGACGAAGTCAGCAAGAAACAACGTGATTGTGAAGAGGATCTATTAAAGGCCGAACCGGCGCTTCTCGCAGCCCAGGAAGCCTTGAACACGTTGAACAAAGCGAATCTAACGGAATTAAAGAGTTTTGGTTCGCCCCCGGGTGCGGTCACAAACGTAACAGCCGCCGTTATGGTATTGCTGGCTCCAGGTGGAAAACTGCCCAAGGACCGCTCCTGGAAAGCTGCAAAAATTTCGATGGCAAAAGTCGACGCCTTTCTAGACGCATTGATCAATTATGACAAAGAAAACATACATCCTGAAATCATTAAGGCTATACAACCATATCTAAAGGATCCAGAATTTGAGCCCGAATTCGTGCGCTCCAAGTCAGGTGCAGCGGCCGGTTTGTGTGCTTGGGTTATCAACATTATCAAGTTTTATGAAGTCTATTGCGACGTGGAGCCCAAACGTAAGGCGTTAGCAGCCGCCAATGCAGAGTTGGCTGCTGCTCAGGATAAGCTTGCGGGCATTAAACGCAAAGTGGCGAGTCTGGAGGAACAACTAGCTAAGCTAACAGCCGATTTTGAGAAGGC
CACGGCGGACAAATTGCGTTGCCAGCAGGAAGCTGATGCCACGCAAGCAACCATAGCATTGGCTAATCGTCTTGTAGGTGGTCTAGCCAGCGAGAATGTGCGCTGGGCAGAGGCTGTCAATAACTTTGTCAAGCAGGGCATTACGCTTCCCGGCGACATTCTACTGATTACCGCCTTCATTTCCTATGTTGGCTGTTTCACGAAAGGATTTCGCATCGATTTGCTGCAAAAGATGTGGACACCCTTCCTGAAGGGCATCGATCCTCCCATACCCACAACCGAAAATCTCGATCCACTCTCGCTGCTGACAGATGACACAACCATCGCCGTTTGGACAAACGAGGGCCTGCCGAGTGATCGCATGTCCATTGAGAATGCAACCATTCTTTCCAACTCTGATCGCTGGCCACTGATGATAGATCCCCAGCTGCAGGGTGTGAAATGGATTAAACAGAAATATGGCGATGAACTTAAGGTTATCCGTTTGGGTCAGCGCAGCTATTTGGACATCATAGAGAAGGCCATAAACACGGGTAGCACTGTCTTGATTGAGAACATAGATGAGAACTTGGATCCTGTTTTGGATTCATTGCTTGGTCGTAATCTCATCAAAAAGGGAAAAGCTATTAAAATCGGCGACAAAGAGGTCGAGTATAACTCCAACTTCCGTTTGATCCTGCACACGAAACTAGCAAATCCACATTATAAGCCCGAGATGCAAGCACAAACCACACTTATTAATTTCACTGTTACCCGCGATGGGTTAGAAGATCAATTGCTGGCGGAAGTTGTGAAGGCCGAACGTCCCGATCTGGAGGATCTCAAGGCCGAATTAACCAAACAACAGAATGACTTCAAAATCATGCTAAAGAAACTGGAGGACGATTTGCTGTCGCGCTTATCGTCTGCTGGTGAGAATATTTTAGGTGACACCGCTTTGGTGGAAAATCTAGAGACCACAAAGAGTACAGCATCGGAGATTGAGGAGAAAGTGGCTGAGGCCAAGATCACATCGAAGGAGATTGACAAGGCGCGTGAATACTACAGACCAGCGGCGACCAGAGCCAGCTTGCTTTACTTCATCTTAAATGAACTAAACACTATAAATCCGATCTATCAGTTTTCCCTGAAGGCTTTTAGTGTAGTTTTCCAAAAGGCCATAGCTAAGGCTGAACCAGGCGAATCCTTGGATTTGCGTGTCTCCAATCTGATCGATTGCATAACGTACTCGGTCTTTCAGTATACTTCGCGTGGTCTTTTTGAATGCGACAAACTGATATTCGCATCTCAAATGACTTTTCAGATACTGCTTATGAACGAGGAAGTAACATCTGTGGAACTGGACTTCCTACTCCGCTTCCCGATCAAACCGCATGTGACAAGTCCTGTTGACTTTTTGTCAAACCAATCGTGGGGCGGAATATGCAGTCTAGCGTCCAAGGATGAGTTTAGGAATTTGGACCGTGACATAGAGACCTCATCGAAGCGTTGGAAGAAACTGGTGGAATCGGAACTGCCGGAGAAGGAGAAGTTCCCACAGGAGTGGAAGAATAAAACGGCTCTGCAACGTCTTTGCATGATTAGAGCTTTGCGACCTGATCGCATGACTTATGCTCTAGGGGATTTTATTGAGGAGAAACTGGGCTCCAAATATGTGGAAAGTCGAGCAATGGAATTTGCAAAATCTTTCGAAGAGGCTAGTCCTTCAACACCCATCTTCTTCATATTATCGCCTGGCGTCAATCCTCTGAAGGATGTGGAAGCGTTGGGAAAACAGCTGGGCTTTTCCATGGATCTGGGCAATTTTCACAATGTATCACTGGGTCAGGGTCAGGAGGCAATTGCTGAAGCGGCCATGGATATAGCAGCAAAGAATGGACACTGGGTCATACTACAGAACATACATCTGGTACGCAAATGGCTGCCTGCCCTGGAGAAGAAGCTGGAATATTATGCTGAGGGCTCACATAAAGATTATCGCATGTTTCTGAGTGCAGAGC
CCGCATCTACGCCCTCGGCGCATATTATACCACAGGGAATTTTGGAGTCATCGATTAAGATCACAAATGAACCCCCCACGGGCATGCTGGCGAATCTGCACAAGGCCCTCGATAATTTTACACAAGAAACACTGGAAATGTCCGGCAAGGAGGCCGAATTCAAGGCAATACTTTTTTCGCTTTGCTACTTCCATGCTGTGGTGGCTGAGCGCCGTAAATTTGGTCCACAAGGTTGGAATAAGATATATCCGTTTAATGTGGGTGACTTGAACATAAGCGTATCGGTTCTCTACAACTATCTGGAGGCCAACGCAAAGGTGCCGTGGGAGGACCTGCGCTATCTGTTTGGAGAAATTATGTACGGTGGACATATAACTGACGATTGGGATCGACGCTTATGCATCACCTATCTAGAGGAGTATATGCAACCTGATTTGGTGGACGGTGAACTTTTTCTGGCGCCATCATTTCCCGCCCCACCAAATACCGATTATCTCGGCTATCACACATATGTCGACGAAATGATGCCCGCCGAGTCGCCTTATCTCTATGGCTTACACCCGAATGCCGAGATAGGTTTTTTGACCACACGTGCCGAGAACATTTTCCGCACCGTCTTCGAAATGCAACCTCGGGAGGCTGGCGCTGGAGGCGGCGCCACTGTGACGCGTGAGGACAAGGTCAAACAAATCGTGGATGAAATACTGGAAAAGTTGCCCGAGGAATTTAACATGGTGGAGATAATGAACAAAGTGGAGGAGCGCACGCCATATGTAATTGTGGCTTTTCAGGAATGCGAGCGCATGAATTACCTAACAAGCGAAATGAAGCGTAGCTTGAAGGAGCTAGACCTCGGCCTTAAGGGCGAATTAACCATAACTTCGGATATGGAAGTGCTGGAAAACTCTTTATTTTTGGATCAAGTGCCGCCGATTTGGACATCGCGCGCCTATCCATCCCTCTTAGGTCTAAACAATTGGTTCATTGACTTATGTTTGCGTTTGCGGGAGTTGGAGACTTGGTCAACGGATTTTGTGCTTCCGTCTTGCGTCTGGTTAGCCGGATTCTTTAATCCCCAATCACTGCTAACGGCCATTATGCAGAGTACGGCGCGTCGCAACGAATTGCCGCTGGACAAGATGTGTTTGCAATGCGATGTCACTAAGAAGCAGAAGGAGGACTTTACAACGGCACCGCGCGAGGGCGCCTACGTTCATGGCATATTTATGGAAGGCGCCAGATGGGACATACAGCAGGGTATTATAATGGAGTCGCGTCTTAAAGAGCTCTATCCATCAATGCCAGTCATCAATATTCGGGCCATTACCCAAGATAAGCAGGATTTGCGTAATATGTACGAGTGCCCCGTCTATAAGACACGCACACGTGGACCAACCTATGTTTGGACATTTAATTTGAAGACCAAAGATAAGCCCGGCAAATGGACGTTGGCCGGCGTGGCATTATTGCTACAAACTTAGCTGGAATATACCTATATCGACATTTTTCCAATTCATTTTTCTCGAATTAAATT\n>XR_002553663.2 PREDICTED: Helianthus annuus DNA-binding protein HEXBP-like (LOC110871340), transcript variant X4, misc_RNA \nTTGGGATCGATCGAACAAGGGCAGGGAGAGGGTGAATAACCCTAAACTCAAGAAATCAAGAATTGAAGCTAAAATCTCAAGGAAAATTCGATGCATGAGCCCTTCTTTGCGAAAATCTAACCCTAATTATTGAAGTGGCGTGAAAGAAGAAGGTACAAGCACTAAGCAAGCGGAAGGAGCACGAGATCGAGGTAAAGCACCTCTATAGGCGATATGGAGATATGGAACGAGCACATGTTTAAGCCTTATAATACCAAGCGCTTTCGC\n>XM_033245137.1 PREDICTED: Anneissia japonica ataxin-2-like protein 
(LOC117104323), mRNA \nATTGGCCTTTAGCATAATTATTTTCTGGTCTCTGTCGAAGGCCAAAGCATTGTCGATTTATCAAAAACATTGCCTTTGAAATCATCCTCTGGTGGTAGTGGGAAGCAGTTGCGAATATTAAAGACAAGCATTTTTATCGATATGCTTTGTTGATTGTTATAAAATACAAATTAATTGATTTTGCAAGGCTCGTGCTTCTGAGAAGCAGCTCACCGGCGATCCGAAGGCATGATGAGTACACAGCAAGCACCACAAAACAAACGTAAAGGGGGGAGAACCGGGAACAGTGGTCATGGAAGAAATCGAAACTCAACTCGATCAAGTAATCTTACAGCTAACTCGCAATCACACTCAACGCCGGTCATTCCACCTAGATTATACGCAAATGCTCACTTTGTACACGCTACAGCTGTTCTCAAGGGATTAAAAGTTCAAGTTGTGGTTGTATCAGGCAAAAAGTATGAGGGAATATTCAGCACAATAAGTAATAATGGTGAGATTGTAATAGAATTGGCACACATGGTAGAAGGCAATACAAATGCTGTACCAAGCAAGGAAAGGACAATTGATAAGCTGGTTGTTAAGTTCAAAGATGTAGTCTCGCTTACAGCATTAGATGTTGATCTCGAATACGCTGTTAAAAGCGATGTTCAGCCTGGATTTCAGACAGATTCAGATATCAGCGGGAAGAAATCGAATGGTCAAGCAGGAGAGAGAGAATTACAGCAGTGGACTCCAAGCAATGAGACCCCAGCAGATTTATCATTAGATGGTGATACTAATGGATGGAGTGTGGAAGATATGTTTAAAGCTAATGAAAAACAATTTGGTTATGAATCCTCATACGACACAACTCTAAAAGATTACACGACGCTCTTACGCAAAGAGGATACAGAGGAGTTCCGTCAGAAATCAGAAAGGGCGAATAGACTAGCAATGGAAATTGAAGAAAGTGCAGGCTACAAACAAAGAGCAGCTCTTGAATTAGATGATGGGCAAACAGAGGAGGATAGATTCAGTGCTGTGCAACGGCCGAAGGCCAGAATGAGCCCATCGGGATCACAGCAGGGAAGATCCGCTAGCCCAAAAGGAAACCCACAGTTTGATGGTAATGCATCAACTAATAAGTATGTACCCCCTCATTTAAGAAATAACAAGCCGGCTCAAAGGAATTATAATCAACCCTCACATAGGCCTCACACTCCAACACAGGGGGGCCAAAGAGGACCGACACACGCACAGAACATGGCTAGGCCACCTAGACATGCTGTGCCTGATGAACGTCTGACAATGCAAGATGTACGAATGTCACCAGAATCTAGGCAATCCCAAGATGTTAGGTTGTCACAGGATGCAAGGCTTGCGTATGAACCTCGACCTCAAAGGTCTGCTGCACAAGTTGTTGCAGGAAGCAATCCCCAACGTGGCATGGTTCCACAGCAACAAAATGTTATGAAGCAACGAGAAGTCAAGCCGGAGTCCATAGGAATATCGCCCAGCCCAGGCCCTCCAGCAAACATGGCCAAGCAGCCTACAAAAGATATACCTAGGGTACCAAGCCCAATGGTTGGAAGCTTACCACCAACAGGTGAAACCAATCCTCAACACCCAGTTGCATCAGAGGATAAGAAGCCACAGAAATCACAGAAATCTCAAAAAATTAGTGAATTGAATGAATTTAGCAACAACTTCAGGTTACAAGAGAATCAAACTACACCTAGCAACAACCATGTTGCTACCCAGGCCCATGAAGCCAAACCAGTTCAGTCCTTAAATCCAGCTCCAACACCACAGCAAGGAAACCAGCAACCTGTACCCCAACAGGCAGCACAACAGGTAGCTCAGCCATCTTCTCAGTCGCCTCAAACACGACCAGTACCACCACCTGCGCAGGCTCAACCGCAGGCACTTATTACACAAATTATACAACAGCAACCTTTACCGGCTCAGAAGCTAGGCCAGGCACCATCTCAAGTA
TCAATTCTTCAGCACCAGGCTCATTCCCAAGCTCAACCTATCTCCACAGCTCAGCCACCAAGGCCAGTGGATGAAAAGAAACCAGAATTTAAGCTGAACCCAAATGCTAAGGAATTTACCTTGAACCCATCAGCTAAGCCTTTCACACCGAACTCACTACGTAAGGGGGTGAGTGTGAGTAAAACACCGACACCTCCCCGACCGCATTCACGACAGAGTCAGAGTCCAACACTCCATCCACCATCAATGCCAATGACCCAAATAATGACTGGTGGACCCCCTCCACCGCACACCTTTATCCCTCAAATGCCCTCAGTTGTCTATGCACACCAAATTCCTCTTCAGAAAAAATATCCTAAAAGTCCGGCAACCAATCTACCACAGCCCCCAAGGCAGCAGCAACCAGGGGATATATCTGGACAAATGATGTCGGCATCAACAGCAACCGGGCAACCACTGCTAGCCCCTTCTCATTTTGTACCGCCGTATCATCAGCATCCAGGGGCACATCCTGGTCAGATGATCCCAGGTCAGCCTATAATGCAACCTCAACCCATGCCATTTGTGCAGATGCAACAACAAAAGCTGCCTTATCGTCACGCCAGTTCGATGTCCAATGTACAACAATCACAAGCTCAACTCCATCCACTGCCAGAGGTCTCTCCAAATACCCCTCTCTTTGTTACACCCCAAGGTTCCAGTCAAGTCTATCCAGGTCAGCAACAGCCATCAGTGTACCCTCATCACCCCTCATCTGCTCAACAAGGAGGCCAACAACATCCCCAGGGCCAAGCAGGTCACCATCAAATGGTCCAGTCAGCCCATCCTCACTCCCATGGAGCTCAACAAGGACAAAACCAGCACCATCAAGGCCAGCCTCAGGGTCATAGACCAACGCCTAGCCCAGTTCAACATTCTATACAGTCACCCTCACAATCTACTCAGCAAAATATACCGTTACCGATATATTACAACATGCCACAGCACAGCCAACCAATTCAAGGTCACACACCTCAATCTCAGCAGACGTTTACAACTGTTTTAATGCATCAACAACAGCAGCAGCCTCAACCCCAGCCATACTCTGCTACCTCCCACAGCATAACAAATATGACGACAGTTCACACTAGCCCTCACCCGCACCCTCATGCACAACCTGGCAATGTGATGTATGTAGGAGGGGGACAGCCAGTCCCCCAACATTCACACACAGTCATGCTACCAAGTGGAAGCATATCATATCTGCCCCCACAAGGAGGTCAAGGTCAACACCCTCCTATTCAAGCCTACCAGCAGACTAACTAGAGCAATGTGTAGTGCATAAAATTCAAAAATATATATAGAACTGATCAAGGCCTTCATAATTTATTATATTATAGAGACCTGATGTCTAAGAGCTGGAGGAATTTCTTATTGAAAAGGATATATGCTGCTTATGTGTGACAGCTGAGCCTTGTATTGAATGTACAAGATGTGTTTTACCTGATGGGAAATAATGTTGTTTCCTCCTGATGGATCGGCTCTTAGGAAAATCCTACCAAGGGCCTAGGATTTAAATTGAAGCAAGCAGAAGAATCCTACAGAATTATCTAATCGTACTCCAAGAATCATATTGTGCAAGTTACCAACATGTTTGGTTTTCTTTTAATGCACCTTATAATTAAAAACTACCGGGGGCTTGTGTCTGCTCCTGGCCCTCTATGTGGAGTACAAACAGGGTTTCTGTCTGCTCTGAATATTTATAGAGTACCACCAGCCAGGCTGCAGTAGTTTACTGTCTGATCCAGCCTTTTAAAATGGATTTGCCAATTGGCCTAGTGTGCTGTTTGCTCTTTACTCTCTAAATGGAGTGCCAACAAGGCTCCTGGTCCGCAGATATTATTGAGATTTTAACAATGAGGATATAAGTCAGAATCGTAGGCTAATTATTGCTGACTAAACTCTAGATGAATTAAATTAAGGTTTTAAGATGTTTCTGCAACAGATTTATCCTATCTAAA
GATTTCAAAATTCGCCCCATAAATTGGTAAATTATTCTTATTTAAATATTGTTTAAATGACCTTGACTTCAGATTCTTTATATGCAAATGTATTTTCCCTGATATTAAATTCTAAATTCCATTTAAATGTGATAATTTACATCACAAAATTAAAGAAAACAAATACGATATATATATTATGAAATTTGAAAACCATGTCATTTAATTGAAAACTCTGGTGACTGAATAGTGCTTACATTGAATATGTAATTTCACATTCATTGCATATTCCTATGAATCTAAGTAAAAAATAATATGCATGAATGAGCACAGAAATAATTGTTAAAGTTGCTTACCTTTGCTTTATTCATCCTGATAACACTAATTGTATTCTAATATTTTATTATGTAGCTTATGTTTTCTCGGTCCCCCACATGTGGACAATGTTCACACGTTTTCTGGTCCCTATGTATAAATATTAGGGTATGCTTACTGATAGTCCCTCAGGTTAGTTATTCAAATATATTGGTAATATTTTCACCCCGTAAGGATTAACACGAAACAACTGTTTTATAAAATGATTATTGTTGATTTCATGTTTTAGTTAAAATGATTAAGTTGATCAGTGAAGTAATGCAAATTGGATGTTAAGCTATTATTTTGAAATAGTTTCTACTTAATAATTTAACAATCTGTCATCAAATGCCATTGCATAAATGAATGTCGGCTTTTTTTTTACTGATCTGTGGTGTTGACTTATGACACCTAATTATAGTTCTTTGTGACAGGAGTTCCTGCTTCACTTCAGATTTCTTTGAGTGAGCCAATTACATGGTGTGAACAGCTCCACAGTTAATTAGATATGAGTAAGGTATTCTTGAAATCACTCCATTTAAGATGCATATCACTTTACAGTATAAGGCATAGTTGTTTATTTCATTAATCATTAAGATAACACATATCATCAGTGACATCTAATGTCATAAATACATGGCTAAGCCTGGTATAGTCTGCAAATGCAAAATGGGGTGTAAATGTTTTGGTTGTTTCAGATTTAATTTCAACACAGTTATTTATTCAGGATGTGAAATGGAAATAGTTTGACTGTTTTTATCGACAATTTCTTAACCAGTGCATCAAAGTATATAAATATTTATTTTATTAATGCAGTATTATATTATTATTATTATTATTATTATTATTATTATTATTATTATTATTCATATATTGATTTTAGTGTTTATTTTTAAAATAAAATAATGCTGATGTGTAATGAACTACTGTATTAAAATGAACATTTTACATTATATACATGTACATGCATGTTGGTGACACATGCATACATACATACATACATACATACATACACACACACACGCACACAAGGATGAGCAAAGCAAAAGTTTAAACTTACAGATCTTTATGACCTGTTTGCTGCCCTCTATAGTTAAGTTATTTTGGCAGCTACTGTAGTTTAAAGAATCTGATATTTGAATTAGTTCTATCATGTCTATGTTTTTATGACAACAATATAAGGGGGTTATTTTCAAGGATATAGCAAGGGAGGGCACTGCTCAAGGGAAGTGTATGAAAACGGTGAACATCGTTCTTTGTGTTACAAACGAGTTCTATTGTTCTTCCGTTTTTTGTCTTGATGTGAAATGAAATAAAAAATGACATGATTGCATTTTATCCAAATAAGAA\n>LN587638.1 Uncultured eukaryote partial 18S rRNA gene, clone SIGW489_N9D4_16S_A 
\nAGTCGGCTCAGCGCCTGGTCATCCGTATGGGAAACTAGCTCGACCTTCACTGGTCGGCTAGTGGATCATACACTTTACTTTGAAAAAATTAGAGTGTTTCAGGCAGGCAATTGCTTGGATACTGTAGCATGGAATATGGAATAGGACTTTGACCTTATTTGTTGGTTTCTCGAGGTCAAAGTAATGATTAATAGGGACAGTTGGGGGCATTCGTATTTAATTGTCAGAGGTGAAATTCTTGGATTTTTTAAAGACGAACTTATGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCAAAGACGATCAGATACCGTCCTAGTCTTAACCATAAACTATACCGACTAGGGATTGGTGAGGTCTTTTAAGCCTCATCAGCACCTTATGAGAAATCAAAGTCTTTGGGTTCTGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTTACCAGGTCCAGACATAGTTAGGATTGACAGATTGAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGGTTAATTCCGTTAACGAACGAGACCTTAACCTGCTAACTAGTCACCTTTATGTCAATAGGGGTCTGACTTCTTAGAGGGACTTTATG\n>XR_004845356.1 PREDICTED: Anopheles albimanus uncharacterized LOC118464036 (LOC118464036), transcript variant X5, ncRNA \nCTCTCTCTCTCTCTCTCTGAATTGCTCTCTCCCTGACAGTCTCTATCTCTGTTTTACTTCATGCCCATCGCCTGCTTGTCCAGGTTCCGTGTGGCACGTACAGGATACGAAATTCTTCCTATTTCTTCTGAATGGCAAACTGACATGCCTTGCATTCGAAATTTCGAGTATTGTACAGAGAACGACGGCATGTGCTGCATAACCAATGAAACCGGTGCGTTACAGCCGATGAGTCGCTGCGGAGTGTGATTTCGAAAGTGCCGACAGTCGGAAGTGGTGGCCGCTCCTAGGAGGACGTTCGCTTATCTCTGTAGCAGTGTTCTTGAAAAATATTCTAGAATTAAGCGTGAGAAACATGCGTTTAGCTAGGTGGAATACTATTTTACGAACCTGAGGAAGTTCCCCGGAACAGTGTGAGACTCACACTCACTAAACCTCACTAGCTTGGTTTTCCGTTACCACCCTGCAGCTGTGTGCCTCTTTCGAGATGACTTGCAGCGAGGGTGGCAACGCCGAACCACTTGCTGCGCGAAAACATGGGTCTGAAGCGACTATATTTTTTGGAGTAACGTTGTTAAAACCACCTTACACGCTCGTTACTGCTAAAAAACGGTCCTCGCAAATGCGCGGGTGGCCGAATGGAAGGTACTCTCTGAAGTACCCATGTCCCGATAGGAACGGGGCCAAGCAGGGGTTAATCTCGCCGTATCTACGAGACAACCATCTCTCAAGATTGGGAAGTAGACGATAAGTCCATCGGCCGTTCTGGTCATTTTCCCATTATCGTTGCCAGCGCTGCAGCGACCTCGCCCGCCTCGCCACGACCAGCGTAGCGTTCCCTGTTCTCTTCGATGAGAATGCCAACCGGGATCATGCCGGTGATCACACTGATGGCCGCTGGTGATACGGTTGGGAAGGCACCCGCAACCCCAATCCCAGTAAGCCTGTGAACGCGGTTCAGCTCGACCAGGTTCCGTCCGGTCGACAGAGCCGAATACCGAGGTGACTACGCTGGATAGTAACCTCGTCCTCGAGCAACTGAGGCCGTCTGCTCCACGCATAATGGCCGAAAGGGCGTTAAGAGCCATCAGTGCGTTAAGAGGTGGTAGCATAATCAACATGGTCTCCGAAGGCAAGCGTGCGATCTACTATCA
CCCCGAGGTACTTAATCGCCTCCTGGGACCGATCCACTAGATCGCCGATTTCAATCGATATCTCTTGGACAGGCTGCAGGCTGCTAACAAGCATTGCCTTGGTTTTGTGCACGCTTCCACTGATTCGATCAACCGTTCCGCGTTAACTTTCACCTCGCTCAGGCTCTGACCATTAACCGCTAGGACCATATCGACGACCAATGACATAACAGGGAGTTTCGGCCGCAGAACCCCGTCAAACATCATTTTTCAGAATGTTGGCCCTAGAACGGATCCTTGGAGAACGTCAGCCGTAAGCGGCATTACCTCTGGTCATGAGTCGGTGTCGTACAGCAGAACGCGTCGATCGAAGTGCCTACCCAGGATGCGCCCGAGGGATCGCCACCCCAATTGGCGTTGTTGAAGGCGTTCTTCGCGTCGATCCGCGTGACAACCGCGCAGAGACGGTCGGCTCCCCGCTTTTGGCGAACACCACTAGCAGTTTCGAGTACCATCTTTATCGCGTCCAAATATAATTCAGCTGGTGTAGCTAGAAATGTTGTATAATACCTAAAGGCAGTTGGGTATTGTTTAGTTAATGCTCAACATTTTTGTGCACTTAGTAGATTAGATATGGTTGGTCGTAGTGGTTAAGTGGCCCAACCGTACCCGATCAGAATGAAAATGGAATACTCCAATACTGTCCTAGTCTAACATTGCGACAAGAGACGGTTCAGATACTCTCATTTCTTCCTCCTTACACATCCGCTGAAGTTACTCTACTGGAATATTTGGGGCGATGGTTTTCCAGTTTCCAAACCAGTTTGGACTGTATCTCAGGTGAGAGAACATGGTCACAATGCATCTTCTGAGACCCAAGAGAATGGGCGCTGGGTTTTGTATCCCTTTCTCGCGAGGACAGCACTGATTATAAAACATGAAACTAAAGTTTCTATTGTAGAAGGTTTGTAGTACCAGATGAAAAGCCCGTTAACTTGCAGATTTCAGACCAGGTCATGGGTAATACTGCCTCCAATCATAATTGCAATAATTAAAATGTGTAAAATTTCGGACGATGTAACTCAGTAATTAATTTGCACCACCAAAGTGAATGAAACCCCCTATTTTATTGCTAGAAACTCGATATAACGGATATGATATGTGTGAAAAAATCGGATATCGCAGCATATAATCGGTCCATTAAGCTACTGACCTGCAAGCCACAATGGGACTCGCAAACCCGTACTGCACTTGCCACATGCGACAGGATGAAATCGCCCGTAGGTACAATGGTTCACTGTTTGATTATCGTCAGAAAACAACGGCTAATCAAATGATGCAACAAAACGGGCATCAATGGTGGTTTAGGCCATTACAGGATGTGTTGGGGTTAAGGGTGACATGACTCTTTGGAAAACCAGAAAGGTGGGGCAAACAGCCATCAATGGTAGTATGTTGGAGTGACTACCTATTAGGAAAGCGAGTAGGAAAAGGTTCACCTTTCCGGTATGGTAATTCACCGAAAAAAATGAACTGATATACATAATACAACTGATACACTAATATACCAAAGCATTAATGCTTGCGATCGAACTTCGCAAACCTCAATTGTTGCAGATCTGCTCTTTGATGTGCTTGGTTCGCCAATCGATCTGATCGAGGACTTTTAGCGGCCGCAGGCAGGTAACGCTAAATCGTGGAAGCATTGGATCAGGACAGTCGCTTACGTCTGAATCGCGCATCGCCATTGATCCAAAGGGTGTTGAAAACATACGTCAGTATGTTGTACAGCCTGCCCTAAACATAGTGCAACAATCGAATTGCTTGTGTCTTTGCACTCATCGTTTGCGAACTTGCCGAGAGAGATAAGTGGGCAAATGATGCATATTCAATGAAGTTGGCTTTGGCAGCTATTGCATATGTTGCAGCCAACATACACATTCCAAAGGCACCAAACACATATAATGTTGAATATCTTCTGATTTGGCTATTATCTATTCGAACTTTCTCATGATAAAGCA
TTCTGTAAATTTTTCAAGGTTTTAACGAGACATGTTGCTCTTGAAGCATGGACACGCGAATGTTCGATCGGTAATGCACCGCTTCCTCTCATGCATTGGTCACTGTTATCAGCATATCCGAACTGCCACCGATCGAATTGTCCTGTCACTAAAGGAACATGAACATTACCGCCATTAGTTGCAGAAGTGGCCACCCTAGAGCACCAATCTATCCAGGCAGTGCAATGGTTCCATATCGGACACAATTAATCATCCGTGCAAAAGAAGTATGCGGATGACGATCAACATGGTACATGTCCCTCAAAGTGCATGACCACGATCTAACGTTATGTGACTCTTACACGTGGAAAATCGCAAGCAAACGTAATGGCGCTGATCTTGGACTCAATAGTAAAAAATATGTATCGGTTTGGAATGGAAGATTTTGAGGACTGAGTACTCACGTCTGGCGAAACTGATGCGTTCGTGCTCTACGTATGGTATCAATGGCCCCTATTATGAAACAAGTCGATAACGCTATCGATCGACAAGAGTAAATTTTTGAATGAACTTTTCTTGCAAACGAACATAAAAATGAACACTTGTCGACTTTTTTGTCGATCGATAACGTTATCGACTTTTTCATAATAGGGGCCACTGTCCGTCTGCAATTGTTTCTATGCTATCCGCTGCCGATGGTCCTGTGTTTGCCACTTATAGGCTACGGTAGATCCTTGCAACAAAAGCTCTTCTAGTCAATGCAATCAATAAACTTACAGTGTTTTTTCTAAGATGTTCGCAGCGTTCAAATGGCACTCCTGGAAACAGCTGAACAAACATCAATAATCTGTTGAATGGAGAAAATAAGCCTGCCTCGGATAGAACAATCAGAATGAATAGAAAATAACAGCAATTTACACCTAGAAGAAGCCTCTCATCTTTGTAATGTATGCGTACCCTGAATTCTAGCTCCATGGATGATAAACTATTCTTAGATGATGAGCTAGACTGTTAAAGTAATGTTATTAGTTCATCAAGTGTCAGTTGCACAGCTGATTATAAAAACAAGACAAAGTGCGTTGTTAAAGGGAAAACACATCGCGATAGTCATTTGGAATACTCAGCTTTTACAGTTATTGTGGTGAGCATTTAATGTGTTTGAGTATAGAATTGAAAAAGAACCAAAATGAGTTTTGTCTAAAATACACTAATATAAAACCAGCTTATCATATAGACTATTTGTTGTATTTTGATAATTTCTGTTTTTCCAAAAAGCGTTGTATTGGCAGACAGGCGTCAGTTCCGTTCCTCTTCCTAAAAGCAGAGGATCGCCAGATGCGGCGCAATCACGATCACTATAATTGAAAGTAAAATGAAGACCCTCCACTCCCATTCCTTTCAATGGCAATTCAATGGCCCGTACGCGCCATTCTCCTACTCCCGAGACCAGCGCTTCAACGCCTTTTAACTTACCGTAAATGCCATCGAATTGCACTCTTTCTCACTCAATGGGTATTCTGATGCGGATCCTATCTCCAATTACACATACGGTCCTCAAACATCCAATGCACAAATGATAAACCCACCCTTCGGTGAGTAGAATGAATTGAGTTTTTGCAGGTGACGCTTTGGTTAGACAGTCGGTCGACCGATTCCCATATATCACAGTTAATCATCACGCCGAGATACCTGACAGCATGATTCAACGAAAAACCACGCAACTTTAGTTTTGTGATTCGCGAAGAGTAAACTTTCTCTCGTTTATTTTGCCCCTTTTCCAGGATTTGGCCACAGATTCTATAGATCACTGATACATGCGATAATCAAAACCCCTAAAGAAAGCGCTTGAGATCAGCGCCCGACATGTACGTATTTATAGATGTCAATTCCTCAAAACGCCGGTTATTTATTGGTTTTTATCATAATAACTGCGTGTTTTCATACACATAGTGTTGATAGTTGGTTGGTCGTTACTATTTCTTCCTTCATTTAACTGTCATTTTAAGATTGCCTTAGAAACT
TGCCATAAGGAATTCAAAAACGAGCATTTTCAACGGACATCTGTCAGCCAGAATGAAAGTTAAAAGTCATTGAACAAAATGTAATATATATTATTAGTAAACCATTATCTTAAGTATTTGAAGAATTGAATTTAAGAATTTCTTTTGTAAAATTTAATGTATAAGTAAAATTGAAGCACTGTTGTAAAGTTTAAGTAGCTTTTAAACTATGCTATTCTGTAAAACGAGAATGCAAACCCAAGAGATTGGACACGCATTTAAAATCCTAGCAAAGCATTTTCTAGCATCGTCGAATGGTGCCAATTGTTTCATCTTTTTCGTATTGGTTAGTTTAAAAAGGAATATGAAGAATGGATTTTAATTTGATTATATAAATTCATAGAAAACACATTTCCTAGAGCATTGCCATTATCGACATCGATTGACACCATTCACGAAGCCTGATTGTTAAAATGAAGAAACACCTCCGCTCCTCTATTCAACACTACCGGGATCTACTCAATAAATATGCAAATCATGTAGCTACTACGCTCTTACTGTTAAAAGATCCTATTCATGGTATTCTCCAAAAATATTCAAGATTTATGAATATATTTACATCAATTGTGTCAAACGAAGGACTCTTCGTTTCACCTTTATTCTGTAGCTATTTATGAAGACGCGTGCCGCGTTGTGTGTTGTTGGGGCAATTTTAATGTCATCATCGTGCCGTGAGGGAATGGTAACTGAAAGGCTTTAAGATGCAAAAAGTTTAAAATTCCAGTAGCAGAATTACTTGAAGGATAATTCTTCTGAAGAAATGAAACCCATAAAATATGAATATTAGACTGTGTACCTGCATTAGTCTAACACCAAAATGTATGACCTTCCACAAATCATCCTACCACCCACGACACATGGATCAAACATCAGCTGTATATTGTAATATATTTTATCAAGATTGTTCTAATATCGATGAAATCTTAGTTTGTAAATGAAGATATCCATCTTTATTTTGCCTCGGTTCTCATCAGTGCTCAATGAAGTTGAAACTGTTTAGAATTGACTGACTCTGTTTTTTTTTTTTTTATTGAAAACATCTAGCGATTTGTGAAGAAAGAAACTTAATAAAACTGATAATATTTGATAATAAAAAATCAATAAAAAGATAGCCATTTGAAATAATCAGGCTATACAGGTGCGTAACCAACATGCCTCCAAACTCATTCCGGAACCATTCCGGAAACTTCTCTGACGTCTACCATAAAGCAAATAAACTTAATTGACCATATCTCAATTCAGTCAAACAACCGGTCAAAAAGCAATAATCTTTTGCCCAGGGATGTGGCTGCATGCAAACGTTTACCATGGGATAAGGCAGCAAGTGCCCCGGCTCGTGCCCTTGGACGCTGTGACTGGGCTAAATCATTGGGGAATTGGTCAACGGTCACCTAATGGATAGGCACAAGGAATGAAATCAATTATTACTACTCATGTGGAAAATGCCGTCAACATTGCTTACAAGGGGGTGCAAACTATTCAAATACTCTCACTATTAGAAGTAATACAGTTCGTAAGCAAACGTGTGCAGCAGGTTTTTTTTATTGAAAAAAAAAACACAAAATTGTAATAAAACTGCTACTTGCACCTTTTTCACCTTGCATATTTTTTCTGAGTGGTGAAACTTCCAACAGTATTGCGTAATCGTTTTAGAGCAATCGAATTAATTTGCGCATGGTAGCTTTTGTTTTAATAAAGTTACTTTTACTTTATTTTAAGAAGATCCCGAACCCCCCTACAAATTCTGAGCAGTGCCTTTTGAAGCGGATATCTCAAAACTATGGTTTTCAATCTCGATGGTCATTACAGTACTTCCTTTCGTTTTGAAATTTTGAACACATCATTTACCCTTTAAATGTTTACTTGTCAAGCTCGAACATTTTTTAAATTTTTCGATACTTTTTATACCCCAAAGGAAAAATCGATTATCGATTGTATTGATTGGTAGTAATCGTTCTAAA
TGCACAAACAATTATTTCTGCAGCTTAGGAGAATCATACCCGTATGCCTTTATCGAACAGTAATTGACGGACGTAGTGAATCGTTTAGAGCAATCGAATCGTTTTAGAGCAATCGAAT\n>XM_009271859.1 Wallemia ichthyophaga EXF-994 Phenol 2-monooxygenase partial mRNA \nATGGCGTCAGATCCGCAAATCAAAAACTCAAACGTAGACGTACTAATCATCGGAGCTGGTCCTGCTGGTGTCATTGCCGCTGACTGGCTCGCGAGATTCACCAAATACGGTGTTAAGACAAGGGTGGTGGACAAGCGCTCGCACAAAGTCTTCACCGGACAAGCAGACGGACTCAACCCGCGCTCTATTGAAATGTTCCAGTCTTTCAACATTGCAAACAAGATCGTCAGTGAAGCGAACCCGATGAATGAGGTTTGTTTCTGGGCCCCAAATGAGAGCCATGGTGGTATTGAGCGTGGTAGACGTATTCCAGATACCATCCCTGGTATATCAAGATACGTCCAGTCTGTCCTCCACCAAGGTAGAATCGAGAGACACATCCTCGACGACATGAACGAAAAGAGCAATGGTACAATGAAGATCGAGCGTGGTGTGCTTCCCGAGACGTTGGAAGTCAATGAAGAACTCTGCCAAGACGACAACGCGTACCCAGTCAAAGTCGGTATTCGCCAACTCTCAGAAGAGGAATCACGTCCAAAGCTAGGCTCAAAGAACGGTGAAGTAGAATCTGGTCTCTACAAGTCAAACCTCGTCAAGGATGAAGACGATGACGTCGAATTCAAACCAGATGTTCCGGTCGGCGACAGAGAAATTATCAACGCAAAGTATGTTATTGGTGCAGATGGTGCGCACTCGTGGGTGCGTCGTCAATTAGGATTCAAGATGCAAGGTGAAGGATCTGATTTCGTTTGGGGTGTTGTCGATGGTGTTCCAATCACAAACTTCCCTGATATCCGCTGCCGTGCTGCTATCCACTCAAACGCTGGTAGCATGATGATCATTCCACGCGAAGGTAGCCTCGTTCGTCTGTACATTCAGCTCAACTTGCAAGTGGACGAGGGTGGACATGTCGACCGTAGCTTGATCACACCAAAGATGCTGATGGACCAAGCTAAGGCTGTGTTCCATCCATACTCGATCGAGATTCCTGATATCATGTGGTACACCGGTTACCAAGTCGGACAACGTCTCACCTCGGAGTATGCAAAGAATGACCGTGTTTTCATCGCCGGTGACGCTTGCCACACGCACTCTCCTAAGGCCGGTCAGGGTATGAATGCATCCATGGCTGACACATACAACCTGTGTTGGAAAATTGGTCATGTCTTAGCTGGACACGCTCCACGCTCCATTCTCAAAACATACGAGAGCGAGAGACGTCCATTCGCGGAGCACTTGATTATGAACGATGCCCAACTCGCCAAGCTCTTTTCAGGAAAGCCATTGTCATCAGCTGAGCTTAATGAACTTGGTGTCGACATGAAGGACTTTGAAAACATTCTCGAGAGAGGAATTTCATTCTTTTTGGGTACTTCTATTGAGTACTTCAACTCCACTGCCACCGCCAACGGAAGAGACGGTAGACTTTCATCGAAGCAGGAGCTGGCGAAGAATATACCAGTCGGACAACGTTTCCCCTCTCACCAAGTCGTCTCGCAGTTCGACGGCAGACACTACCACTTAGTCGACACCATGTTTGCTGATGGACAGTTTACTATTGTGTTATTCGCAGGCAATATGGACAAACAAGTAAACCGTCAACGTTTGCAAACCATTGCTCAACGTCTCGACAGCGATGATGGCGTAGTGAGCAAGTATACACCTAAGGACAGACAAAGAGATGGCGTGATTGACGTCAAGACAGTCCACTGTGGAGGCAGAACGAACATTGAAGTGCATGAGTTCCCACAACCAACTATTTACCCACCAGGCACATACAACAAGCTCTACGTCGA
CGACGTTTCCTACCACGCAGGTCACGGAGAGGCTTACAAGAACTACGACATCAGCAAGGAAGATGGTGCTGTTGTTGTTGTGCGTCCAGACCACTTTGTCGGATTAGTTACCTCGCTCGACGGTGCTGGTATGGATGATGTCGACAAATACTTTAGCGGATTGCTCAAGACTGTTCCGGCAGAGCAACGCAACTCGGCAAAGGATATCAAGGTTATTCCACAACCTAAAGTTTAA\n>XM_041320268.1 Suillus paluster uncharacterized protein (EDB91DRAFT_1172848), partial mRNA \nATAACCCTCCTTGGGCACGCTATCCTTTATTGCTCTCTTTCCCCACAACTCCATTGCATGTGCTGCCACACCTCCTTCACCTCCCTCCGATGATAACAGCACACTTGTTGATCTTACAGTTCATGAGACACTGTTGGACTGCTGCATGGGAAGCATCGAGGAGAAAGCATATATAGCTCCTCCTACCAGTGACAGATATCAACCTCACACACTTCTGTGCAGCTTCGGTTATCGACGATGACAAGCTCATTGCATATTAATAAAGTGGCGTATTCATCGTGGGCGCTGGCAAGTTGGTCTGGAGCGTCGTGTGGTAGACATACAGTGCAGCAGTTCAACTCATCAGTGTCAGAAAGACAGGCGTACACGACCTGCTCAGATAGCATTATGAGTATTTTGACTTCATTCTGCGCTACATATTCAAGGCGACAGACACCCGTCCCCACACCTCAGTCTCGTTAACCGTTGACTGAGGCTCGTGCACTAGCTCTTACCTTTGATACTCTGCTACTTCTCCAGCTACCTTAAAAGCCCGCCTATCAACAATTGCTCGTTCATCCAGGTCATGCATT\n>XM_025612137.1 Aspergillus sclerotioniger CBS 115572 methyltransferase (BO94DRAFT_536881), mRNA 
\nGAACTATGCGCATTGCACACCGAATTTCCTGTTCCTTAGTGAAGTCTAGAAATGTGACAGCCATGCATCGCCCTGATATACGAGGCATTTCAAGCGCATATAAAAGGCGAAGACGCCCCAGCTGTACGAGAGGTGATGTCGCCATCAACGTAATTTTACAGAGCAAAATGCCGACCACTATCGCTCAGACCATCCAATCTTACGCCCTTCGCTTGGTACAAGACACTCTGCGGCAGATTGCAGCCCCTGTGAAACTGATCTATGTTGTTGATGGAGTGAAGAGTGTCTTGTACAACGACCCAGCGATACAGGATGCCGATAAAGCGGTGATCTATGTCACCCATGTGAATTTCTGGAGAAAAGTCCTCCTAGACTTCGATCTGGGATTTGCAGAAGCCTTCATGCTTCAGGAAGTGGAATGCGACCAACTAAGTAAAGTCTTCGACTTATATATCAAAAACCGCGCGACCCTCGACTCCGGTGACTCACTGTTTCATCTCGCTCAGCGATTAGCCCAGTGGTGGAGACCAGCGAACAACATCGACAATGCGCGCATCAACATCGCATCCCATTATGACACCTCAAATGGATTATTTACCAACTTTCTCTCTGCAGATATGAACTATTCCTGTGCGCACTGGTCCAACGATACTGCGGAATCCCTACAGACAGCACAGCGACGCAAGGTTCACTATATGATCAGAAAGGCCCGCGTGCAACACGACCACCACTTATTAGACGTCGGTTGCGGATGGGGAGATTTGATTATCGAAGCGGCGCAACTAACCGGCTGTCGAGCGACAGGTTTGACACTCTCAGAAGAGCAAAAGAATTTGACGGATGAGCGCATCCGTGACGCGGGCCTGCAGGACCGCGTTCGTGTACTGTTGTGCGACTATCGCAACGCCCCGCGGCCAGGCAACGGATATGATTGCATTATCTCAATCGGCATGTTTGAACACGTCGGACCTGAGTATATGGATCAATATTTCGAAGTGATATCTCAATTACTAAAGTCTCAAAACGGCGTGATGGTCATTGACGGCATAACTAAAATACACCCATTTCACGAGACCAATCCTCGCGTGGGTGATTACATCAATCGCTACGTCTTCCCAGGCGGATACTTGCCCACACCAAGTATACTCTTCGAGGCACTCCATCGGGGCAGCAAAGGGACATTGGAAGTGTCCTCTGTTCTCAACACCGGTCCTCACTACGGCAAAACCTTACTAGCTTGGAGGAACAACTTCATTTCCAACTGGGAACATATCCGATCTGATTTTTCCCCCCGATATCCCGATGCGTCGGAAAAGGAAATCGAGACCTACCGGCGGCGCTGGCTATACTACTTTGAGTATTGCGAGGCTGGGTTCCGTAATCGTATCTTGGGAAATTACACCATTTGCGCGGTCCGCACCCCCGAGGTGACCATTGACTACAAGAGCCTGGACATTGATGATGCGCAGAGTATCAAATTATATGAATGAATCATTGTTCTTATTGGGGTCTGGGTCTTCAAATACGTCTTGACTTCATGATGAGCTGCAGAACAAAGATAAGTCATGCTTTATGTTCGGC\n>XM_041003117.1 PREDICTED: Ochotona curzoniae negative regulator of reactive oxygen species (NRROS), transcript variant X3, mRNA 
\nTCCTTCCGCAAGTGCGAAAATAACCCGATGCCCTAGAGAGCAGGCAGCCCAGCCCTGCGTTTGGTTGCTCTCAGGGAGGCAGGAGCCCTGGGAGAGGATGCACCCCGCCGAGCCGCCTGGGCCTGCGGGAGGAGCCGGCTGCCCTTGAAATGGAGTTGCTGCCCCTCTGGCTCTGCCTGGGTTGTCACTTCTTAGCCGTGGGATGGACAAAGAGCAGTGGAGCGGACATTGCTGTGTCCCAAGGGAGCTGCAAGTGGGACGACGGAACCGGAACCGCTGACTGCCGTGCTCAGGGCCTGGCCTCGGTGCCCAGCAGCCTCTCTCCGCGCTCTCGGACGCTCCTCCTGGAGGCCAACCCGCTTGAGAAGCTAGAGAATCACTCCCTGCAGCGTTACCGTCTCCTGGAGAGCCTCGGCCTGCGCGGCTGCCACCTGCACCGTCTGGACCGCAACGCCTTCCGCCAGCAGCAAGGCCACCTCCGCAGCCTGGACCTGGCTGACAACCGACTGGCCGAGGACTACCACGAGGCAGCCGCCGCCCTGCACACTCTGCCGCACCTGCAGACGCTCGACCTGTCCGGGAACTCCCTGACGGAAGACATGGCGGCCGTCCTGCTGCACAACCTGTCGTCGCTGGAGGCCGTGTCTCTGGCCAGGAACACGCTCATGAGGCTGGACGAGTCGGTCTTCGAGGGCCTGGAGCGTCTCCGGGAACTGGATCTACAGAGAAACTACATCTTCGAGATCGAAGGCGCCGCCTTTGACGGCCTGCCGGGGCTCCAGCGTCTCCACCTGGCCTACAACAACCTGCCGTGCATCGTGGACTTCCGCCTCACGCAGCTGCGCTTCCTCAACGTCAGTTACAACGGCCTTGAGTGGTTCCTGGCGTCGAGGACCGAGGCCACCTTCGAGCTGGAGACGCTGGACCTGTCCCACAACCAGCTGCTCTTCTTCCCGCTGCTGCCCCAGTGCCCCAAGCTGCGCACACTGCTGCTGCGGGACAACAACATGGGCTTCTACCGGGACCTATATAACACCTCATCACCTCAGGAGATGGTGGCCCAGTTCCTCCTGGTGGACGGCAACGTGACCAACGTGACCACCGTCAGCCTCTGGGACGAGTTCTCTGCCAACAGCCTCCCGGACCTCCGTCTCCTGGACCTGAGCCAGAATCAGTTCCAGTACCTGCCCGAAGGCTTCCTGAGGCAAATGCCTGCCCTCGCCCACCTCAACCTCAACCGGAACTGCCTGACCACGCTCCACATCCAGGAGCAGGAGCCCCCCGGGGCGCTCACCGAGCTGGATCTGAGCCACAACCAGCTGTCGCAGCTGCACCTGACGCCCGGGCCCAGTGGCTGCCTGAGAAACCTCCGCTCCTTCAATTTGAGCTCCAATCAGCTCCTGGACGTGCCCTCCGGCCTTTTTGCCAATGCCAGCAGCATCACTACAATCGACATGAGCCACAATCGAATCTCACTGTGTCCCGGGGCTGGCCCATCCAGCTGTGTGGATTTCAGGAATCTCACCTCTCTGAGGAGCCTCTCTCTGGAGGACTGCGGGCTGGACACGTTGCGGGACTGCCCATTCCAAGGGACACCCCTTACGCACTTGGACCTGTCCAGCAACTGGGGTGTTCTAAACGGGGGTATCAGCCCACTGCGGGATGTTGCCCCCATGCTGCAGGTCCTGGCCCTCAGGGATGTGGGCCTCAGTTCCAGTTTGACCCAGTTGGACTTCTCCGGGTTTGGGCACTTGCAGAACCTGGATTTGGCAGGAAACGCCTTGACCAGCTTCCCGAGGCTAGGGGGCAGCCTGCCCCTGCAGACCCTGGATCTGCGCAGGAACCGACTCACAGCCCTGCCCCACAAGGCTGTGTCTGAGCAGCTCCCTCAGAGTCTGCGGATCATCTACCTCAGTCACAATCCCTATGACTGCTGCCTGGTGGAGGGCTGGGACGCCCTGCAGCACCTGGGCGTCGTGGCTGACGCAGCCTCCATCA
CCTGCAACCTGTCCTCCAGGGTCATTCGTGTGCTGGAGCTGCCCGGTAGTGTGTGGCATGACTGTAAGTGGGAGCAGGTGGACACGGGCCTCCTCTACCTTGTGCTCATCCTGCCCAGCTGCCTCACCCTGCTGGTGGCCTGCACTGTCATCTTCCTCACCTTTAAGAAACCTCTGTTCCTACTGATCAAGACCCGCTGCCGCTGGTCCTCTGTGTACTGACTCAGGGGCAAGCCTGGGTTTGCTACTGGGCCTGGGCAGCTGAGGACATCTCTGGGCTGGACTGGGGGCTCTCCATGCAGAGGCTAGTGTGATAAGCCAGGGTTTAAATTAAACTGGAAAATGGTTCCATCCCTTAGCCTCTGCCTCCCCCTCCACCTATAAGTTTTTATCTCATTTTGATGGTTCAGCCTCATCATTCTGGTCAAATATTTATTAAATGACACTGTATAAAAATAAAAGACAATGGTCTCATATA\n>XM_043331653.1 Rhizoctonia solani uncharacterized protein (RhiXN_11838), partial mRNA \nATGTCTCGCCTCGCCGCTGTGGCCTTTATTCTTCTTTCACTCAGCTTCCTTGCTCATGCCTCGCCCATCGCCGCCCCTGCTCCAGAGCCCGAGCCTGGGAAGAAAATTGTTGCGATTGAGGAGCGCGCTGGAAGCCATTGCTACGGGGGATATTGCTACGGTGGTCTAGACCTTGTGACTCTACTCTTGCAACTCCAGGCTGCGATTGAAATCAAGCTTGGGTTGCTTGATGGATGTCTACACGGCGGAGATTACAAGGCGATTATCCTTGAGATTGAAGCGCTGTTGTATGCTGCTATTGGTGCTGTCCGAGGCTACAAAATTGGTCTTCTTGGGCTTCTCACTGGCAAGATTCTGGTCATCGCTAAAATCTGGTTTGCTATCGTGATTTCTATTGCTACTCACTGTGGAAAATGGGCAGGCCACGCAGATTTTGAGATCTTCCTGGTTCTTATCGTCAAACTTGATCTTGCCCTTAAGCTCTTGCTCCTTGCCATCATTAATCTCGGCGGTATTCTCAGTGGCTTGCTTAGCATCATTATCGGCTTGTTTGCGAAGGTTCATATTGCTCTACTAATCAAAGTCAAGTTCTTCCTGTGCCTTGGCGCTCTGAGACTCGGCGGCTACTAA\n>XM_039822988.1 PREDICTED: Perca fluviatilis glucosidase 2 subunit beta-like (LOC120573318), transcript variant X6, mRNA 
\nTTTCAGGAAGTCAGGACATGGCCAGTTTAAATGTTGGATGTCATGAGTTTGAAACACCTTTGAGCGGGTTTTTGCGAGGCAGGAGGCAGACAATTTACAATTATGTCATCTGACATGCATTTCCATATTATTATCGCCGCTGTCTTTTGGTGTGGTTTCGTAGACTCGCGGAAAATAAGAGGGATATCTTCGTCCTGTCCTTATCTTCAACACAGACAACATGTTGCAAGTTCCTATCAAGTTGCCATCGCTGCAGATGACAAGCGGTTCTACAGGGAGAGGAAGTCTTTTCTGTGCATTGATGGGTCGAAGATCATCCCATTTGAGCAGGTGAACGATGACTACTGCGACTGTGAAGATGGCTCTGATGAACCTGGCACCTCAGCCTGTCCTCGTGGCCGATTCTACTGCACCAATCTGGGTTTCCGCCCACACTACATCCCATCATCGCGAGTCAATGATGGCATCTGTGATTGCTGCGATGCCTCCGATGAATACAACAGCCACGCTCACTGCCAGAACACTTGCTGGAATCTGGGACAGAGAGAGAGAGCATACGTGGAGGGCCAGATGAGGACCTTGGACGAGGGTTTGCAACTCAAGCAGCAACTGATTGAGGAAGGAGTACTGCTCTGGAGGGAGAAACAGGCCCAGCTCAGAGAGCTTCAGCAAGTAGCTGAGGACCTACAGATCAAATTAGAGGAACACAGAAGGAAGAAACATGAGGCCGACCGACTCAAAGAGCAAACTATAAAGGCGCTGGAAGCAGGGGGCAGCAGTCTCAGACGTCAAAACAGGACAGTATCAAGTACTTTCAAGCTACTGGACAGCAATAAAGATGGCAGTATAACAGTGGATGAAGTCCAGGCAAAAGTGGCACTCGTCCATGATGAAGAGCAGGTTCTCTCTGAGGATGAAGCAGTGGCTTTGTTGGGCGGAGGCCATCAGATGGATCTCACCAAGTTTCAGTACACTCTCTGGGACATCCTGACAAAAGGAGACCATGTCAAGATCAAAGACACCCGTGGTGCACCAGGCAGTCTTGTGGGTGAAGATCCTCACTTAAAGGCAGCTGATACAGATATCATGACCCGGTTACTCAAGATAATCCACAGACCTGGTTGTGGGCAGATTAATTTAGGAAACTATTTTCTTTCTACCGAACTCCACCCGCCAAACGTACCACGGTGCAGAAGGAAGCATACTTATGGACTAGCGGCTACTCCTCTTTGGCTGAGCTGTAACGTTGCTTACTGATAATGCTAGCTGACGTGAGCTAGCTTACGCTACAGCTCTGCAGGGAAGGACGCCATAGATGTTTACATCTCGCGCTTTCACAAGCACAAGCCTCTCGTCCATTAGTACTCTTCCTTGTCGAAAAATTAATCTAAAACATTTAGAAGATAACTTATGATGGACACTATTTTTAAACAAGTGTAAAGTTTATGTGATTATTGCATGTTTTAAAGAAGAAAATGAGACAGTCCTGTTAAAATTTTGGTGGAGGGGGTGGTGGTGGTTGCAGTCTTTTTTAATACCACCACTAGACGGTGCCAAAGTCAGAAATGTACACATCCTAAATAGTAGCTTTAACTTATTATTAAATACTTACTTATTTACACACAATTTGTTTAGCTTTTTGTATTAAGTGGATTTTGGAAATATATATATATATATAAAAAAAAGGTGCAGACCCAGAGGGGACTGAAATGTTAGTTTTCATAATAAATGGTGATGCTAGAGCAAGAGTAGAGTGTGAGATTTTTCTTTTCTTTGTTCAAGTTTGTGAT\n>XM_017639444.1 PREDICTED: Rhagoletis zephyria uncharacterized LOC108383066 (LOC108383066), partial mRNA 
\nATGGAGCAATTGGAGAAGGAATTTGCTGACTTCTTCGGCGAATGTAAGCAGCAAGGATTTACCTCCAAAGAAATGCGTGCCATATGTCAGCCGCTGTTGCATCGTCGCAACAACAGATGTTACGTGTTACTGGGCGTCTTGTTGGCTATGATGGCCGCCTTTTATTTACTCTATAACTGGTCCGAAGAATTTAGTTGGTTTGTTAGCGCCATTGGACGTTTGGTGTTGCTACAGCTGTTGCCCTACTGGAATTGGACGCCTCTATATAGTAGCCGGTGTCTAATTGAGCGTGCGGTAGATAAAAACGGTGCGCAGAGTGCAACTTCAACAACGAAAGCCTTGGGCCGTTATGAGACTGAAGCTGAAAATTGCGTACTTTGCGAGACGCTTG\n>XM_047907316.1 Fulvia fulva Putative ariadne-like RING finger protein (CLAFUR5_08168), partial mRNA \nATGGCCAACAGCTCGGAAAAAGAGGTTGTGGACCTCCTCATACTGGTTGACGCCACGGCGTCTATGACCAGCTATCTCCAAGCACTGAAGCAATCACTACCACAAATCATCTCTATTTCAGCCCTGACGAACTGCTTTGATCGCATCGGCATACTAGCGTATCGCGACTATGCCCACCGCGACCTCCTCGACTGGTCAGGCTGGACTTCTTGCGCTCAAATGCAGCAAGACGGCGGAGCCACCCTAATCGCCAAAGCAAACGCTCTGCACGCCGTTCGCGGGGAATCCGACGACCACCCTGAAGCCGCGAAGACTGGCCTTGCTCAGGCATATGAGTACATGCGCACCGATGCAAAGACCCTCATGCTAGTCTACGCCGATGCGCCACCTCATATCGAAGGCCTTAAGACCCGTGCTCACAACGGAGACAAGGAGTTACAAGCCCTCTCTGATCCGCAGAGTTATGGCGGATACGGGCCACTCTTCGCGGATTGGGTCTCTGCTGCGAAGACCATGCGCGAGGGAGAGAAGAGGGTACAAGTCATGTCGATTCTACACTTCCCGTACCATCCACAGGATTCTGCCTATTTCGACTACCTAGCCACCATGACGCGAGGCGCTGCTATTCACTTGAACAACTCCCAGGCACGTACCATTTCTGAGGTCACGGTTGAGGTCTTGCTAGCTTGGATGGGTGTGAAGAAGGAGGGAGCTGGATCGGTCGCACTTCCTGCGAAGCTCTCCTGGTACGTGGACACAGATATCGGAAAAGTGAAAGCAGAAGGCGAGCTCGCTGCTTTCCTCCCGTTTGGAGATGTGATTGCATCTCAACGGCTAGCTCTCACATCCGAGCTTCTCGAACAACGACTGCCAAAGAAGGCGACTCCGCTAAAGGACTTTGCACGGTCTTATAAGGAAGATGCAGCGTATCGAGACATCGTTACCACGCATCTCCGCGCTATTATTGAGAGCGATGTGGCTGCTATGAGCTTGAATCCTGTCTTTGGTTCTCTTTGGCGGACCTTCTGTAATGATAAGGAAAACCCTCATGGGCAAGACCTCCTGGATCTGTTCGGGCTGAAAGTCAACGGTCTCGCGTACGCGGATGACCGAGCGAAGATGAAGACCTGGCTGGAAGAGTCTTACGACTATACTGCAGAGGTTCTCGAGGCTATCGCTAAGGTGCCAAAGGGGTTGCAGTATCCATGCGTATGCTTGGATCCAACGCTGTCGTATGAGTTGGCGCCTCAAGCCGAGGACGAGGACAGCGAAGACAACCGCCCCATCACTTCCTTCCGGCGGGATGAGCTCCTAGAGCTGGGACGATCTTGTGATTACCGTATCCTGCGACGCTTAGGACGAGTGCTTACCCGACTGACATTTGTCGAGTCTGCTGATGCGATGCCAGGTCACATTGCTGCCGCTGGACAGGAGACTGTGACCAGGATCCCTATGGCATTGGTCCGAAAGGAGTATGGCCGCAAGTTCTGGCGGATTCTCCT
ACATATCGTGGTCCCGGGTACTATGCTCTCCGGTCGCGCTGCTGCATTGCTTGGAGCTCTCACTATCCGGATGGGAGTACAGCCCCTGAGACGTGCTGCTGAGGAAATTCCTGAGACGTGGAATGTCAGCTGTCTGTCCCTGATTCTTGATGCTGATAAGGCTTATACTGAGCACTATAATGACGGCTTCATGGGAAGTGAGGCTGGCTTGCTCTGGGACCAGGATCGGGAGCTGTTCAGGCGCCTCGTGGATTACAAGATGTTGGAGCTTAATCTTGATACAACGCTGCACGCTCAAGTAGCCTGGACGCCTCACAAGACGACTATGTCTCTCGGTCCTACCATCATGTGCAAGCTATGCCAGTACCATCGATCAGTGACTGGCATGGGACCAGAAAACATTTGTGGACTGTGCTGCTACAATCGTGACAATCCCAATGCCACTGATCAAGCCAATATCCATTGCCACACTGCAGACGCTGATGGCGAAGCGGAGAACATATACTGGTACGAATGCAGCGCTAAGCACTGTCGAGCCCAGTACATCGTCCACGAAGCCGACAGGCTGAACGTGCGACCAAAGTGTCATTACTGCCGCATGGGAGAAACCGCTCCGATACTAGAATGCTCCAAGTGTCTCAACGGAATGATCAGGCCGCTGGAGTATCGACACGGCCTGGACGAAGCAACCTTTACTTGTGTAGGCTGCTCACAGGGACGCCAGACAATCATCGATATTTATGAGCATATGAACGAGGCGCATGGAGGGTACTATGGTGATTTGGAGGATGATGAGGACGGGGAATAG\n>LN871451.1 Bacillus licheniformis partial 16S rRNA gene, strain IRQBAS20 \nTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTTTTCGGATCGTAAAACTCTGTTGGTAGGGAAGAACAAGTACCGTTCGAATAGGGCGGTACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCCCGGCTCAACCGGGGAGGGTCATTGGAAACTGGGGAACTTGAGTGCAGAAGAGGAGAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGAGGGTTTCCGCCCTTTAGTGCTGCAGCAAACGCATTAAGCACTCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTCTGACAACCCTAGAGATAGGGCTTCCCCTTCGGGGGCAGAGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGATCTTAGTTGCCAGCATTCAGTTGGGCACTCTAAGGTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGGCAGAACAAAGGGCAGCGAAGCCGCGAGGCTAAGCCAATCCCACAAATCTGTTCTCAGTTCGGATCGCAGTCTGCAACTCGACTGCGTGAAGCTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGTCGGTGAGGTAACCTTTGGAGCCAGCCGCCGAATGATGATATGAA
ATC\n>OP114738.1 Raoultella ornithinolytica strain X13 16S ribosomal RNA gene, partial sequence \nTGCAAGTCGAGCGGTAGCACAGAGAGCTTGCTCTCGGGTGACGAGCGGCGGACGGGTGAGTAATGTCTGGGAAACTGCCTGATGGAGGGGGATAACTACTGGAAACGGTAGCTAATACCGCATAACGTCGCAAGACCAAAGTGGGGGACCTTCGGGCCTCATGCCATCAGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAATGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGAGGAGGAAGGCGTTAAGGTTAATAACCTTAGCGATTGACGTTACTCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTCTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTTGAAACTGGCAGGCTTGAGTCTTGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGTCGACTTGGAGGTTGTTCCCTTGAGGAGTGGCTTCCGGAGCTAACGCGTTAAGTCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACTCTTGACATCCAGAGAACTTAGCAGAGATGCTTTGGTGCCTTCGGGAACTCTGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGATTCGGTCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGAGTAGGGCTACACACGTGCTACAATGGCATATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGACCTCATAAAGTATGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTAGATCAGAATGCTACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTAGCTTAACCTTCGGGAGGGCGCTACCAC\n>XM_021864905.1 PREDICTED: Chenopodium quinoa outer envelope protein 61-like (LOC110688195), transcript variant X2, mRNA 
\nTAAGAGTCCTAGTCCTAATTCAAGTGTGGTTGGCGTCTTGGCGACCCACCTTATTTATTTCCAACAAAATTAAAATTATAAATTCTAATTCTTCACCTCTTTCCTCTATTTAACTTCACAATTATCACCGAATTTCCCTAACTGTTTAATTCTCTCTCTTCAATTTTGCATCCATCGCAATTAATCAATCCCTAGATTCTACGAATTTCTGCTTCGATTTGATCTCAATTGTAACTTATTGATTTTGAAACCCTAATCAATCGAAGGATTTTGCCAGATGTTTAACGGTATGATGGATCCTGAGTTGTTTCGGATTGCGCAAGAACAGATGAGTCGCATGTCTCCTGCTGAGATGGCTAAGATCCAACAGCAGATGATGTCTAATCCGGAATTGCTTAAGATGGCTTCGGAAGGTATGAAGAATATGAGACCTGAGGATCTAAAGATGGCTGCAGAGCAAATGAAGAATGTACGTCCTGAAGAAATGGCTCAGATTGGTGAGAAGATGGCTAATTCATCCCCGGAAGAAATTGCATCAATGCGTGCACGTGCTGATGCTCAATTAGTCTACGAGTTAGATGCAGCTGAATTACTAAAGAAACAGGGAAATGACCTTCACAAACAGGGGAAGTATCATGACGCTGCACAGAAATACTTGCGGGCAAAGAACAACCTACAAGGGGCTCCAGTTGCCAGAAGTAGAGCATTGCAGTTGGCATGCTCACTTAATCTGATGACATGTTATTTGAAAACAAGACAATTTCATGACTGTGTCAAAGAAGGCAGTGAGGTTTTGGCCTATGATGAAAAGAATGTCAAGGCCTTGTACCGTAGGGGTCAAGCATACAAAGAATTAGGTCAATTAGAGGTTGCTGCTTCTGACCTGACAAGGGCACTTGAAGTTACCCCTGGTGATGACACAATTGCTGAAGTTTTAAGGGAGGTCAAAGAAAGTCTAGGAAAAGAAGGTGTCACACGAACTTCGACAGTTGCAAATGGTAAGAGAACGTCTCAAGATTGTTCAGTTACTCAACCTGAGGAAAGCAGTGGGCATTCTAAATATCAATCAGAAACTGTTAGTAAGAGACCAACGACAGAATCAGAATGTTTGCAGGCAATGAAGGATGATCCAGACACAATCAGATCTTTCCAGAATTTCATTTCCGAAACTGATCCTGAGGTTCTAGCCAGAATGAATATTGGAAACAACAGAGAGGTTCCTGCTGACATGCTGAAGACAGCATCAAATATGATTGGACGAATGTCTCCTGAGGAGCTCCAAAATATGGTGAAAATGGCCTCCTCATTTAAGGGTGATAATTCACCCTTTAATGGTAACTTTGGACCGGGCTCAGTTCCTCCAAATTTGTCACCTGAAATGCTGAAAACAGCTAGTGATATGATGGGTAAAATGTCACCTGAGGAAGTTCAAAGGATGTTTGAGATGGCTTCCTCTTTGAAGCAGGACTCAGTTCCTAGCTCATCAGGTTCGTCAAGTGGCAGATCGAGTTTGGAGTCTGGTTCAAAGTTCACTGCAACTCGGGGTGTACCTGTTGATAGAAATAATGTTATTGGTGAGAGGAGCAGTATTTCTGGCTCATATTCTAATCCTGGAAGTACTTCCCAATCAAGTTTTCCTACATCAATGGGTGATATGCAAGAACAGATGAGAAATCAAATGAAGGATCCTGCCATGCGACAAATGTTTTCGTCGATGATGAAAAATATGAGCCCCGATATGATGGCCAGCATGAGTGAGCAATTTGGACTCAAGCTTTCTAAAGAAGACGCTGCAAAAGCTCAAGAAGCCATGTCGTCATTGTCACCTGAAGACCTAGATAAAATGATGCGTTGGGCAGATAGAATTCAAAGAGGAGTAGAAGGTGCGAAGAAGACAAAGAACTGGCTACTGGGAAGACCGGGGATGATTATAGCCGTATGCATGCTTCTTCTGGCTGTTATCCTTCACTTTTTCGGCTTCATTGGTAGGTGATTTTT
CAGGACAGTAAGATAAATCTCCTGTTATAACAGCTTGTACTTGCTGATATCAGCAAATCCAGGGCCGAACTTATGGTGTTCAAGGGGTGTGTAAATC\n>XM_028853279.1 PREDICTED: Macaca mulatta estrogen related receptor gamma (ESRRG), transcript variant X13, mRNA \nGGAAGCTTGTACTGAAATATATACAAATAATTAAGAATACTTTTAGTGCACTGTTTAGTAATGCTCTCCCTACAAAAAAAAAAAAAAAATGCTCTCTTTATTTTGTCAAAATGCATTGAGAGAGATTTAATTCGCTATTTACCCCCACAACCCTCAGTCTCCCCACCCCTAAAACTGAAGAAGCCAATTTGTCCTGCGGTTGTTTACCTTTGTTTTGAAAAGCTATGCGTTGTATCTACACGTAAAGAGACAGTCGCAGGTATAGAAAGGTTTACACATATAATTTACTTAGGCATTCTCTCAAATTGTATTGTCACTGTTTCCTCTTCTGTAGTTGTGTAAAACTGCATTCCACCTCAGAGATGACGATCCCAGTTCACATGCTCAAACAATTTAGAAGAATGTCTTTATTATTATTATTTTTAATGCCCAGCATACATCAGGAAAACAGGAAAAGACATGATTAGGAATACATGAGAAAGTACAGCACCAAATAAACAGCAGCCCCCGGTGTAATCAAAACACAGACAACGGCAGGACAAACTTAATTCTCTACCTTCCGCAGAATCCTTTCCCAAATTAACTGAGAGTCTGCGTGAGTTCTCCTTTTCAAGGCAAAAGAGATCTTAGGTTAGAAATCAAAGGCAAATCCCTCCAGTGCTTAGAGAGTTAAGTTAGTTATGTTTCTTTTGTAGCTTCCCAGAAGAAAAAAAAAAAGAGAGAGAGAGAGAGAAGGGAGGAAAAAAAAAAAATCAAACCCGAGAGTGTGTATTGGGAGCGTTTCAACCGCTCCCTTCTCCGCTCCCTTTTTCTCTGCCCACTCTCAGTTTCCAGCCCCCTTCGGCTCTCTGCACCCTGCCTACCTGCCTGGCTCCTCTCGCTCCGTGCAGCCTCCCGTCGCCTCCCTCCTGATTGGGCAGAGGCCCCCCAATCGGCTGCGCGGCTGGGCCGGTGGGACTGCATATGTAAAGCCCTACTTCATATTAATAAGCTCCAATCGGGGCTTTAAGTCCTTGATTAGGAGAGTGTGAGAGCTTTGGTCCCAACTGGCTGTGCCTATAGGCTTGTCACTAGGAGAACATTTGTGTTAATTGCACTGTGCTCTGTCAAGGAAACTTTGATTTATAGCTGGGGTGCACAAATAATGGTTGCCGGTCGCACATGGATTCGGTAGAACTTTGCCTTCCTGAATCTTTTCCCCTGCACTACGAGGAAGAGCTTCTCTGCAGAATGTCAAACAAAGATCGACACATTGATTCCAGCTGTTCGTCCTTCATCAAGACGGAACCTTCCAGCCCGGCCTCCCTGACGGACAGCGTCAACCACCACAGCCCTGGTGGCTCATCAGACGCCAGTGGGAGCTACAGTTCAACCATGAATGGCCATCAGAACGGACTTGACTCGCCACCTCTCTACCCTTCTGCTCCTATCCTGGGAGGTAGTGGTCCTGTCAGGAAACTGTATGATGACTGCTCCAGCACTATCGTTGAAGATCCCCAGACCAAGTGTGAATACATGCTCAACTCGATGCCCAAGAGACTGTGTTTAGTGTGTGGTGACATCGCTTCTGGGTACCACTATGGGGTAGCGTCATGTGAAGCCTGCAAGGCGTTCTTCAAGAGGACAATTCAAGGGGTGCGTCTTGACAGAGTACGTGGAGGTCGGCAGAAGTACAAGCGCAGAATAGATGCGGAGAACAGCCCATACCTGAACCCTCAGCTGGTTCAGCCAGCCAAAAAGCCATTGCTCTGGTCTGATCCTGCAGATAACAAGATTGTCTCACATTT
GTTGGTGGCTGAACCGGAGAAGATCTATGCCATGCCTGACCCTACTGTCCCCGACAGTGACATCAAAGCCCTCACTACACTGTGTGACTTGGCCGACCGAGAGTTGGTGGTTATCATTGGATGGGCGAAGCATATTCCAGGCTTCTCCACGCTGTCCCTGGCAGACCAGATGAGCCTTCTGCAGAGTGCTTGGATGGAAATTTTGATCCTTGGTGTCGTATACCGGTCTCTTTCGTTTGAGGATGAACTTGTCTATGCAGACGATTATATAATGGACGAAGACCAGTCCAAATTAGCAGGCCTTCTTGATCTAAATAATGCTATCCTGCAGCTGGTAAAGAAATACAAGAGCATGAAGCTGGAGAAAGAAGAATTTGTCACCCTCAAAGCTATAGCTCTTGCTAATTCAGACTCCATGCACATAGAAGATGTTGAAGCCGTTCAGAAGCTTCAGGATGTCTTACATGAGGCGCTGCAGGATTATGAAGCTGGCCAGCACATGGAAGACCCTCGTCGAGCTGGCAAGATGCTGATGACACTGCCACTGCTGAGGCAGACCTCTACCAAGGCCGTGCAGCATTTCTACAACATCAAACTAGAAGGCAAAGTCCCCATGCACAAACTTTTTTTGGAAATGCTGGAGGCCAAGGTCTGACTAAAAGCTCCCTGGGCCTTCCCATCCTTCATGCTGAAAAAGGGAAAATAAACCCAAGAGTGACGTCAAAGAAACTTAGAGTTTAGTTAACAACATCAAAAATCAACAGACTGCACTGACAATTTAGCAGCAAGACTATGAAGCAGCTTTCAGATTCCTCCATAGCTTCCTGATGAGTTTCTTTCTACTTTCTCCATCATCTTCTTTCCTCTTCCTTCCCACATTTCTCTTCCTGTTTATTTTTTCTCCCTTTCTTCTTTCCCCCTCCCTTATTTCTTTGCTTCTTTCATTCCTAGTTCCCATTCTCCTTTATTTTCTTCCCATCTGCCTGCCTGCCTTCTTTCTTTTCTTTGCTGCTCTCGTTCCTCTCTTTACTCATCTTCCTCCTGTTTTCTAAATTTTAAATAGCTTTAGTTGTAAAAAAAAAAAAAAAATCCTTCCTTCCCCCTTTCCTTTCTCTTTCTTCCCTTTTTTCCTTTTTCCCTTTCCCCTTTGCCCTTTCCCCTTTCCTTTCCTTCTGATCTTCTTTCCATCTTTCTTTTTCTTCCTTCTGCTGCTGAACTTTTAAAAGAGGTCTCTAACTGAAAAGAGATGGAAGCCAGCCCTGCCAAAGGATGGAGATCCATAATATGGATGCCAGTGAACTTATTGTGAACCATACCGTCCCCAGTGACTAAGGAATCAAAGAGAGAGAACCAACGTACCTAAAAGTACAGTGCAACATATACGAATTGACTGAGTGCAGTATTAGATTTCATGGGAGCAGCCTCTAATTAGACAACTTAAGCAACGTTGCATCGGCTGCTTCTTATCATTGCTTTTCCATCTAGATCAGTTACAGCCATTTGATTCCTTAATTGTTTTTTCAAGTCTTCCAGGTATTTGTTAGTTTAGCTACTATGTAACTTTTTCAGGGAATAGTTTAAGCTTTATTCATTCATGCAATACTAAAGAGAAATAAGAATACTGCAATTTTGTGCTGGCTTTGAACAATTATGAACAATAATGAAGGACAAATGAATCCTGAAGGAAGATTTTTAAAAATGTTTTGTTTCTTCTTACAAATGGAGATTTTTTTGTACCAGCTTTACCACTTTTCAGCCATTTATTAATATGGGAATTTAACTTACTCAAGCAATAGTTGAAGGGAAGGTGCATATTATCACGGATGCAATTTATGTTGTGTGCCAGTCTGGTCCCAAACATCAGTTTCTTAACATGAGCTCCAGTTTACCTAAATGTTCACTGACACAAAGGATTAGATTACACCTACAGTGACTCTGAGTAGTCACACATATAAGCACTGCACATGAGATATAGATCCGTAGAATTATCAGGAGTGCAC
CTCTCTACTTGGGAGGTACAGTTGCCATATGATTTCTAGCTGCCACGGTGGTTAGGAATGTGATACTGCCTGTTTGCAAAGTTACAGACCTTGTCTCAGAAGGAGCTGTGAGCCAGTATTCATTTAAGAGGCAATAAGGCAAATGCCAGAATTTAAAAAAAAAAAAAAAATCATCAAAGACAGAAAACGCCTGACCAAATTCTAAAACCTAATCCATATAAGTTTATTCATTTAGGAATGTTTGTTTAAATTAATCTGCAGTTTTTACCAAGAGCTAAGCCAATATATGTGCTTTTCAACCAGTATTGTCACAGCATGAAAGTCAGTCAGGTTCCAGACTGTTAAGAGGTGTAATCTAATGAAGAAATCAATTAGATGCCCCAAAATCTACAGTCGCTGAATAACCAATAAACAGTAACCTCCATCAAATGCTATACCAATGGACCAGTGTTAGTAGCTGCTCCCTGTACTATGTGAACAGTCTTATTCTATGTACACAGATGTAATTAAAATTGTAATCCTAACAAACAAAAGAAATGTAGTTCAGCTTTTCAATGTTTCATGTTTGCTGTGCTTTTCTGAATTTTATGTTGCATTCAAAGACTGTTGTCTTGTTCTTGTGGTGTTTGGATTCTTGTGGTGTGTGCTTTTAGACACAGGGTAGAATTAGAGACAATATTGGATGTACAATTCCTCAGGAGACTACAGTAGTATATTCTATTCCTTACCAGTAATAAGGTTCTTCCTAATAATTAATTAAGAGATTGAAACTCCAAACAAGTATTCATTATGAACAGATACACATCAAAATCATAATAATATTTTCAAAACAAGGAATAATTTCTCTAATGGTTTATTATAGAATACCAATGTATAGCTTAGAAATAAAACTTTGAATATTTCAAGAATATAGATAAGTCTAATTTTTAAATGCTGTATATATGGCTTTTGCTCAATCATCTCTCAGATGTTGTTATTAACTCGCTCTGTGTTGTTGCAAAACTTTTTGGTGCAGATTCGTTTCCAAAACTATTGCTACTTTGTGTGCTTTAAACAAAATACCTTGGGTTGATGAAACATCAACCCAGTGCTAGGAATACTGTGTATCTATCATTAGCTATATGGGACTATATTGTAGATTGTGGTTTCTCAGTAGAGAAGTGACTGTAGTGTGATTCTAGATAAATCATCATTAGCAATTCATTCAGATGGTCAATAACTTGAAATTTATAGCTGTGATAGGAGTTCAGAAATTGGCACATCCCTTTAAAAATAACAACAGAAAATACAACTCCTGGGAAAAAAGGTGCTGATTCTATAAGATTATTTATATATGTAAGTGTTTAAAAAGATTATTTTCCAGAAAGTTTGTGCAGGGTTTAAGTTGCTACTATTCAACTACACTATATATAAATAAAATATATACAATATATACATTGTTTTCACTGTATCACATTGAAGTACTTGGGCTTCAGAAGTAAGAGCCAACCAACTGAAAACCTGAGATGGAGATATGTTCAAAGAATGAGATACAATTTTGTAGTTTTCAGTGTAACTCTCGGCATTTCAAAAGAGTAAGTATCTCACAAATAGGAAATACAACTAAAACGTAGATTTAAAAAGAACTGCACGGGCTTTAGGGTAATTGCTCATCTTAAACCTCACTAGAGGGAAGTCTTTTCAAGTTTCAAGCAAGACCATTTACTTAATGTGAAGTTTTGGAAAGTTATAAAGGTGTATGTTTTAGCCATATGATTTTAATTTTAATTTTGCTTCTTTTAGGTTCGTTCTTATTTAAAGCAATATGATTGTGTGACTCCTTGTAGTTGCACTTGTGTTTCAATCAGATCAGATTGTTGTATTTATTCCACTATTTTGCATTTAAATGATAACATAAAAGATATAAAAAATTTAAAACTGCTATTTTTCTTATAGAAGAGAAAATGGGTGTTGGTGATTGTATTTTAATTATTTAAGCGTCTCTGTTTACCTGCCTAGGA
AAACATTTTATGGCAGTCTTATGTGCAAAGATCGTAAAAGGACAAAAAATTTAAACTGCTTCTAATAATCCAGGAGTTGCATTATAGCCAGTAGTAAAAATAATAATAATAATAATAATAATAATAAAACCATGTCTATAGCTGTAGATGGGCTCCACATCTGTAAAGCAATCAATTGTATATTTTTGTGATGTGTACCATACTGTGTGCTCCAGCAAATGTCCATTTGTGTAAATGTATTTATTTTATATTGTATATATTGTTAAATGCAAAAAGGAGATATGATTCTGTAACTCCAATCAGTTCAGATGTGTAACTCAAATTATTATGCCTTTCAGGATGATGGTAGAGCAATATTAAACAAGCTTCCACTTTTGACTGCT\n>AF377161.1 Rhizopogon sp. AHF133 internal transcribed spacer 1, partial sequence; 5.8S ribosomal RNA gene, complete sequence; and internal transcribed spacer 2, partial sequence \nTCCGTAGGTGAACCTGCGGAAGGATCATTAACGAATATAATTCGAGGGGTTGTCGCTGGCCTCGCTCGCGCGAGGCATGTGCACGCTTCTCGTTTTTCTCTCAACTCACCTGTGCACCTAATGTAGGATGCCTCTCCTCCGGGAGGGGGGACCTATGTCTTCGTAACATCTTCGTGTAGAAAGTCTTTGAATGTTTACTATCATCGAGTCGCGACTTCTAGGAGACGCGATTCTTTGAGATAAAAGTTATTACAACTTTCAGCAACGGATCTCTTGGCTCTCGCATCGATGAAGAACGCAGCGAAAAGCGATATGTAATGTGAATTGCAGATCTACAGTGAATCATCGAATCTTTGAACGCACCTTGCGCTCCTCGGTGTTCCGAGGAGCATGCCTGTTTGAGTGTCAGTAAATTCTCAACCCCTCTCGATTAGCTTCGAGAGGGAGCTTGGATAGTGGAGGTTGCCGGAGACTTGGATTCGTCCGAGACTCGGGCTCTTCTGAAATGCATCGGCTTGCGGTCGACTTTTGACTATGTGCGACAAGGCTTTCGGCGTGATAATGATCGCCGTTCGCTGAAGCGCATGACTGAACGTCCCGTGCCTCTAATACGTCGACCGCTTATTATCTCTCCGGAGAGAACAGGGTCTTCCTTATTGACTTTGACCTCAAATCAGGTAGGACTACCC\n>XM_023987877.2 PREDICTED: Salvelinus alpinus transmembrane protein 88-like (LOC111964137), mRNA 
\nAGACAGACAGGAGACAGACAGGAGACAGAGGGGAGACAGACAGGAGACAGACAGGAGACAGAGGGGAGACTCAGTGACTAACCAAACTGGAATGAAAGTGAGGAAACAGCACGGCAGGAAAGGAAGAGTCAGAGCCAAACAGAAAAGCAATATTTGCCTTAACTGTGCAGAGCGTAGAATTTAACACAAAGCAAAGGGGAAAGAGAGTGACACCGACTGAGACCTTTGCAGACACAAAGCATCTGCTGAATACCTGGAGTTTCAGAAACACCAGGATATATCAGAGAATGACAAAGGTCTAAACTCTCATCATCAGGGTATAAACCTCCACCTGGTCAATGTCATCAGTCTGACCTCAGGATCTGGATGTTCATGTCGTGGAGACCTACCTCTTCTTCTCTCGACGCGCATTCTCAGAGAAGGAAGACAGGTTAAAGAATAGAGTGTATTCACATCTTCTCTTACTGCTACTGTGAGAGGCGAGAGACAGAGAGACAAATCCTCAGAACTGCTCCACCAATCACAAAGCCTAGGGAGGATGAGTCTGCCGAGGAACCAGACCCTGGAGAACGGCATCACCAAGCTGCATCACATTAACAATGGGGAACCTCTGTCTTCACTGCAGTTCCACCTCCAGCACACAGGCTCTGTGACCTCTGTGCCWGGGTCGCCCACGGGGGGGTCAGGGGTGGTGGTGCCACCCCCGTACTCAGTAGCGGGCAGCGTGGCGGGGGCTACGGACGCCACTCTGGAGCTAAGAGGCTCTCTGGACTGCTGGGCGTGCTCAGTACTGGTGACGGCTCAGAACCTGATCATTGCCCTGGTCAACAGTACGCTGGTCAGTATTGTGTTCGGCACCATCATGACCCCAGCGCTGGTCATGGTCGTGTTTGGCTTCCTATGTCACTCTACGGTGCAACCCAATGGCACGTCCCTGTACTGTTCAGACCTGCTGGATGACGGTGGCTGTGTGGCCCTGCTGGTGGTGGGCTTCATCCTGGTCACCCCTCTCCTGGTCCTGGCTCTGGCTGCTTACTGCCGCCTGGCCCGCCACCTCCAACTGGGCCTCTGTTTCATCCCCTACAGCAGGGCCGTCTACAAGAACCTGCCTGCCTCGCGCCAACGTGGAGGAGGCTGCTGTGGCCAGCAGGGGGCCTCAGAGGGGGAGGGCAAAGGCAGTGTGTGGGTGTGAGGGGAGGGATATGTTGACCCTAACCACTGATGCAGGGTCAGATAACATTTTCTTGCCTCTTAAGGTTAAGGTTAGGATTGGGGATCAAGTAATCTGATCCTAGATCTGTAGATAGAGGCAACTTCTACCTTGAGCAGGGAGGGAAGGAATGTGAAGGAAGGGAGAAAACAGGGCATGAGGGTAGTAGGGAAAGTTGAGGTGTGGACACGTGGAGATGATGTTTATGGACACAGTTATAATATGCCTATGAGTCTTTTGGTGGGGGTGGTGTGGAGGTGGATCTTACAATACACTGGTTTGTAGATTGCAGAGAGCAAAGGTGAAGCTGTAAAAACACAAGTATGCTACATGAAGTACTATCAAATACCACTGTAACTACACTGCAATTATTTGTTATTATGTTTGTTTTTTATGTTGAATTATCCTGTACTATTATTAAATTATGTTTGTTTAGAATAAAATATTTCCATTA\n>XR_003517021.2 PREDICTED: Zalophus californianus uncharacterized LOC113912871 (LOC113912871), transcript variant X2, ncRNA 
\nTAATGCTCCCCTCCTCCTCCCCTCTCCTCCTGGGCTCCTAGCCCGCCCGCTTGCCAGCCCGGGCGGCGGCGGGACCGCAGGGCCCCGTGCCTCGGCCTCTCCCCCGACGCCTGGCCCCCCCTCGCCGCCCAGTGGGACCGGGCGGGGGCGGGGTGGGGGGAGAGGGAGAAGGGTGCAGTTACGGAGGGGACCCGGGCAGACGCCGCGGCCACGCCTGGCACCCTGTGCCGGGCGGGTGGGGGTGGCGAGGGTGGCGGGGCCGGGGTCACCCGGAGGGGACGCGTCGGAGAGGGCCAGGCGGAACCAGCGCCCTGCCTAACCTGAGGGGGTGGCCCGGGGGTGTGCACCGCTGGACCTGATGTGGTCCTGAAGGCGTCCTTAAATTGTTAAAAATAGTCTCGCTGTATAGAGAAGAACACTGGAACCTTTTAAGTCCCCATCCCCTCGCCTGAGTCCGGAGTGAAACTCCAAACATACTTATTAAGAAACTGTTGCTTTATTTTGACTCGTTTACATAAATTTTCCACTTTGGGGGGATGGTGGTGGGCTTGTGGAATTCCTAAAATAACTTTTAATGGAGCGAAGCCTTCCATTATGGGAAGCGCCTAGACGCGAGAGGCGTCTGGAGGCCTAGGTTCCCGTCACAGCCCTGCCACCAACTGGCTGAGCGACTGAGGCACATCGCCGCCCCTCTCGGCCGGGGTTAGGAGAGTGGACGCCCCCTCCACCCCGAAAGGGGAGACCGGAGAGCTGTCTCAACCATTAATAATGAGACTGGGTTTTCCTTCCTTAAAATGTTCTGATAGTATGGAGAGGCAACTTGGAGATGAGAATAAAAATAAAAGAGGGAGCCATAACAGGTTTATGGCCCTGACCCGGGGAGGCCCTGCCCACCTTACCACCGAGGATCCGAGAAGCTGAGTACTGTGGACACCTGGGTGAAACAGCCATGAAGCTTTACTAACTGCTCTGCAGCCTGACTCACTTGGGGCGGGTCTACACCACAGTCTAAGTACAGCGAAGGAGGAAAGTGACTTCAAGCAAACTGAAAACCATTTGGAAGAAGAGACAGTAGGCACACAGTGTGACGAAGTCTGCGCTGGAGCTAGAAGGACGAGTATGCCCGCAGCTCTGTCCCGAACTGACCTCAAAGGGCCATCAGAGGACTGCCGTGAGGTGCAGCGAAGGGGACGCGGAGCCGCACGGGGATAAAACCACTCGCCCAGGGTCACCAGGCTAATGCTCCTTAAAGGTTCTTGTCTCAGTCATGTCCTCTAACCGGCTGGCTCACCAAGCTGCCGCTGTGACCAGGAGTTGTATTGTTTCCTTAA\n>AJ288639.1 Centruroides exilicauda mitochondrial partial 16S rRNA gene, haplotype CexTE \nCCCCTCCTCTTGCGGAGTGGAGGAAATCTAATCCAACATCGAGGTCGCAAACATGTTTGTCAATTTGAGCTTTCAAAACACATTACGCTGTTATCCCTAAAGTAACTTATTTAACTTTCAAAAATTTTGGGTATTAAAATAATGTCATTTATATATTTTAAAAGTGTTTTTCTTCTTACCGCCCCAGTAAAACATATTTTTAATTTATTAAATTATTTTATGTAAAGCTTTATAGGGTCTTCTTGTCTAAAAGAAACATTTTAGCCTTTTTACTAAAAAGTAAATTTCAAAAGAAAAAGTCAAGAAAGAAACTTTCTAGTTTATCCTTTCATTCCAGTCTTAAATTACAAGACTA\n>XM_012291159.1 PREDICTED: Megachile rotundata mucin-17-like (LOC100879044), transcript variant X1, mRNA 
\nGACCAGTGCACGCGACAAGAAGGAAGAAGCCGCGTGGCCCCAGGTGTTTTGAAATGAAACATTGGATCGGACTCTAAGAAGCTGCAAGAATGGCGCGGAGATTTTCGTGGTGCACGGCGGTGGCATTGGTGGTGCTGCTTTTCGTCACGACCGAAGGTCTTCGTGAACGTGGCACTCAGGTCGACGATCAGAAAACCGCAGGTCGAGGTACTCTGAGGTTCAACTCAAGATCGCTAGAGGAATCCACAACCGCTTCGCTCTCAAGATCCAGATCTCAAGACAGATCGCAGTCAAGAAAATCGAACTTCGAACGAAACGACAGAACAACCTCATCGAACTTCGAACGAAACGACAGAACAACCTCTCCGACCGACTCGGAGTCCACAACCAAACGTCCAAGCCCCACAGCGAGCGATGTGACCGAAATCCCCGCAAGAAGGACCACGGACCCGAACAGAAGAAACGGTAAAAGGTTCTCTCCAGAGAGGACGAGGTCGAAGGATGAAAACGCGATAGATTCCAAGGTCATATCTCGAAGGGTGTCGAACGGGAGATCCGACGGAGTCACGGAGAGGCTGGACAACACAGGGCCGTCGGTCTTCGCGTTGACGACGGAGTCCTCGAGGTCGAGGACCGGCAGGAAGATCCAGACGACGTTCTCCACGAAGGACCTGAAGACGCAGATACCCGCGTCGAGGAGGTATAATAAAAAATCGGAGAACGTAGAGGCGACTACAGTTTCCTTCAAAAGAGGCAGACCCACAACGGAGCGCAGTAGGTCCGGCAGGTCGAAGGTGAACAGGGAGAACTCTGTTGCTCGCAAAGGTCAAGAAGCCCTTTTGTACGAGTCTGAAAGCGTCAGAGTCGACATTCCTCTCGCAGTCGACGGAACAGAGAGTCCTTCCAGTGATCCAACGACCGTCGGCTTCGGTATCGTTTCCCAAAGAAGGTCGGACACCAAGGAGACTCTCAGGGGCAGGTCAGGAGCCGAGAGGAAGAGCAGAGGACGATCGAGCGACTCCGAAGCTGCCGGCTCCTCCAGAAACGGCTCCCGAAGAGGATCGTCCAGGTTCAACGACTTCTCCACCACGGAAGCTAACGAGGTTGGTTCGAGGAAAAGCTCTTCCAGGGATCGTTTGAAGGAAACTAGGAAGAGCGCTAGTGAATCGAGATCGAGATCTAGAGGTAGAGAACAGACGAAGAGTGCAGATGTGGATGTCAAACGAAAATCGGGAGACAGGAATTCTTTGGATAGGAGGTCCAGACTTTCCGAGGGAACTACGAGGTCGGTGGAAAGTCGCGGACAGGATCAGGATGCCAGGAGATCCAGGAGCAGAGCGAGGACGGAAACGACGCCTCTGGCTACGGATGTCACCACAACCGTCGCGCCAGAGACAACAGTCTTCACCGACTCGACGAGCACCGAGCCCGAAGTCTCCAGCACCACCCTTAAACCAACGACAACTTCAACCACAACCCGAAGCACGTCGCGATCATCTTCTACAACCGAAAGAAACCGAGGAAGAGGCAGAGGCAATCAAGGAAGAAAACTAAAGGAAGATTTCTTCAACCACGGACTCGGATTTCGAGGACGAAAGCCATCTCTGGATGCATCAAGCACCGGGGAGTCCAGAAGACCCACCCCCAAAAACGATTCCTACATAAACCCCGGTTGGACCCTCAGAAGACGACCACCTAACTTGAACTACTCCGACAACCTTCCACAAACGATCCCTTCGTCGAGAGACCAAACGAACGAAGTGATTCCTCAGAACGAGGTATCGACGAGCACCGAAATCGTAACTACGGTGGAAACCTCTACATCCACCGCGAGAAGAGGTTCTAAAAAGCTGCAGTCCACGGAGGAGAGCACTACGGAGATGGATGTTACTACGAAGAGTTTCAGAAGGGGTAATAAAACGTTCGAGAAGAATAGGAACGTTGCACCTGGGAAGCAGGAGCATGAAGAGAGCGACAACTATCCGCCGGAGTTTAAGG
CCAGGTTGTCTCTGTTGAAGAGTACGAACACGAAAATACCAGCCCCGAAAACTACCTCTAGAACGCCATTGGAGGTGAAGAGATCGTCGGCCGCTCTGTTCGCCGAACGATCGAGGATGAAGCTGGAGCTGGCTAGGAGGTTAGTGAAGCCAGAGTTGAACATCGAGGAGAATGATCTCGACGCAACCACGGCCTCCTCTTTCAGCAAACCGAGGCCGACCGTGGCGTCGACGGTCGATGAGACGGCCAAGGTCGCCAAGTTCGTTAAACCGTCTGCGGGTCGCAGAACGTCCACGGAAAAGAGGTCTCGAGAAGACGAGAAGTCGAAAGTTTCCGCGAGGACAGGCGACGACTCCTCTAGGTTCGCTAGACCGAATTCGAAGAAAGGACGAATCATCTCCGAGAGAATGGTCACCTCGATCTCGGTGGAGGAAAGGGCTGCCGAACAAACCACCAAGCCATACTCGTCGAGTCAGTCGGTGGTCACCTTGTCCTCCGCTGAAGAGGGATCGGCGACCACCATAGACACCACGCGGATTCGCCTGTCCAGCGCTCGGAACGGAAAGAAATCCAAGGAGGAGACCTCGAAGAGACGCGAACACGACGACACCATTACCACTTTCAAACCGAAGAAGCCCTACGCGTATCAATCGCGCGTCACCAAATCGCAGGAACAATCTACGACCCCCGAAGAGAATCTAGTAACGTCCAAAAAGACCTACGCCTCGTCCAAACAGAACGGAGGGCAACGGAAGTTCCAAAGCTCCCGCGAAGAGGATGCGAGAAGAACCAAGTCCACGACAGTTACCAAACCCACCTTCAGACCCCGATACAGCAAACGAACGAAACCGAAATCGATCGACGACAAGTTGACAGACTACGAAGCGACGATCACCACGAAGGTACCTGTTGCTACCAGCAGGTACTCCAGGAAGAAGTCCGTGGTAAAGGCTACAGAGGGTAAATCGAAGACCACCACGGAAGGAGTAGCAACGCAGACGAAGAAGCTGGAGTTTCGTCCTAGAACCGCGACCTACAGAAGACACTCCGAGGTGCCGACGACCTTGGTGGAATCGAGTACCAAGGTTGAGGGTGCAGGAGTCGCCATCACTCCCAGATCGACCAAGTATTCCGCGACTCTGAAGACCTCGACAGAAAGCGCTCGATCGGTAGCGCAGGAACCGCAGGTTAACCTGAGGATCAGCAACGACACCGCGCAGGAAGCGGCTGGCATTACCGGCAGCAGTAACGGAGACACCGGCAGCAATATCTTCAATCCGACCAGAAGCACCATTCTCGCTGGAAATGGAACCCTGTTGGAACAACTGCGAAGCACCGTCGCGCCGCTGCTCAACTCGCTCGGTAACAAGACTCCGGTGTTCTCTGGATCCTACAGCAACGTTAATGTGAATTCAGCTCCCAGAATCACACCAAACGGATCACCGCCCCGATTTAGCGCGAGATACAAAGGTGCAGAATTATTTGTCAGAAAACAAAATAACATTTATCAACCCACTGTGCCATCGATCACTAGCTCGTCTACAACACCAGCTACAACCGTAGAGAACTCTGGTTCGGCACCACCGATCGATGTCTCGAGTCCTGGCGAGCCAAGGTTCTTGACCCTTTATCACGCGTTGGAGTCGGCAGACATCAGGAACGAATTAGAAGCGAACACGAGCGTACAGGCCGACAGGGTTCTCCAGGTAGACTCTAACGCCACTGTCGCTAACGACAACAGCAGTAATTCTAACAATGACACCACAAGCCCCTCCGTAGCGACCACCGGCCCACAGACCCCAGACACCACCGCGAACACTACTCTGACCTCGAGATTATCCGAGGATACGGAGAACACCACCCCCGCGGTTACCACGGGAGTCCCTGAAACCCCTGCGACCACCGAACAACCCTCTAACGCCGAACAACAAGCCTCCAGCACGGAATCACCCTCTACCGAGCAACCTTCCACCAACGCAGTTTCCATGTCGCCACCTGAA
CAAAGTAGCACGGATGCGCCGACTACGACCGTCGGAAACTCAGAAAGTAGTCAGATACTCTCGACGACTACCACGGAAGTTCCTACCACGACAGGGTCCAGTACCGAAGCAAATGTGCCTAGTACGACCGAGGCCGCGTCGACCACTCAAGGTGCGCAAGGTCTGACGGAGAGTACCACGATGGCTGCCGTCAGCGACGCCGCGAGTATGTCCGAAAGTCCGGAGAGCAATACTATACCGTTCTCCGAGACGCCAGCCACTCAGTCGACCGATTCGAGTTCGACCGATGCCCCCACGACCGAGGCCATATCGAGCAATATGGTGGATGCGGAGACAACTACCGTGATACCTACCACCACGTCGCGACCTAGACTGATCGATTTAGCGCAGGATATTCTGTCCCGTTTGCAAGCGTCTCTGAACGTTACCACGCAGCCGAGTGTAGACTCCACGACTATACCTCCAACGACCGAGATATCGAACGCGATATTAGATATTAGATTCGACGCGAACAATACCCTGCAGAGTCTGTCGCAGTTGAACGAAACGGGAACAGCTGAACCGGCAACCACCGATGAAACCACTACCCAGAGCGCAGTAGGCTCAGTCCCTACTACGACACCTGCGACCACGAATGACCCGTCCAGCTCAATGGTATCTACCCAAGAAGCCAACACGCTGGACGAATCGAGTCCAGTTACAACCACCACACCAGTAACACCACAAGACTCTCAAACAGTTCCGAACACAGAATCGACCACCGTAGGCGACCCCAACAGTTCCTCCAGCCCTCCGTTAGACGTTGATGCGACCACTGCGTCGACGGTTACCACCACGAACGATACTTTACTGACAGAATTAATGTCCATCGCCAAGACCCTCTTTTCGGAAGAGATGAACGACACCGAAACATCGGTACCTGTTCAAACGACGACCGATGTTTCTGGCGTGTCAGGCACGATTCAAGCCACGGAATCGTCGTCGATTTCGCCGGATGTCACGACAGAAACCGTAGAAGCAACTCCGACCACTGTAACTATGTCTGACGTTACCACATTTTCGGTCGATCCCTCGCAGAACGAGGTGGACTCCACAGACCCCACCGTGACCGTTTCGTCTACGGAGAGTTCGACAGACACGCCCAGTACAACTCTAGTGAATAACATGCTCGACAACCTGGTGGATGTCGCGCGAACGAACGACACCGCAACGTTAGGAACACCCCTCGCCGAGAACGTAGAGTCGACCACCCCCTCGTTAACGACCGAAAACGAACAAACGACCCTCTCGATTAACGTATTGTCCAGGCTCGAAAGTGGCCCGGACACCACGACTCAGTTGTCGACAACCACACAAAACACGGAAACGACAGTCGCATCCACCGCCATTAATTTTGAACTAACCACTAACACGTTCGATTTGATATCGACCGACTCGACGACGACGACGACGGGGCCGCAAGCGGCTCCCGAACTTACAGAAACCACCACACCATTAACCGATCTCACGACCGTAACACCAGAGCTTTCGCCAAACACTAGCACTAATCAACCCGAAGTAACCACGATTCCTGAAACAACTCAGTCCACTGTAAATACGATGAGCACGCCGTTGCCCGAAATGATAGTCGAGCAAACCACGGTGGTGTCCACTACAGAGTCGATCCAAAGCGTAACAACCGACGTGACAACCACGTCGCCGATCACGAGCACTCCGCGATTGGACGTTAACCCGATGGACGACGCTGAGGTCACCACCAGCCAGACCCCGCTAACGTCCAGCCTAGAGTCCATTGTGGAAACCACTACTAATACGCCCAGCGAAACAACAAACCTCCCCCAAACAACCCCGACCCTCGAGAACGAAACTCCAACTGTTGTTGCCCGTTTCCAGGATACGACATCAGCAACCGCCCAAGGGACGGCAGGTTCAGGAATCGGCCAAACGACCGAGAACACCACTCCCATGACCATGATACCTTCCACACCTTCTCCCATGCA
ATCCACCACCCAGTCTCTCGTTTCAACCACTTCATCTTCGGTCGAGACTACGACTACGACGCCGACGATGACTACGACGACGCAGACAACGACGAAAATCGGACGCGTTCCCGAGCTCGCAACGACACAGTCGAGCATGGGTGTCGTCACCGTCACGCCGATGCCCGACACGACGGTTCCTACGACGGTCACGGGTGCCGTAGAGGACAATCTCGTTTCCACCGAAGCTGGGACAACGATGCAACCTATGGGACCCATGAACGCAACGATGATGACCATGAACGCAACCGCCGCGAACACAACCGCCGAAACGACGACCCCGTCGATGCAAACCACTCCTGCGACTTCGACGATGGCTCCGTCTTCTCAGGCTCCCACGACGGCGTACATGGGTCGATTCGGGGGCTCCAGGTTGACGCCTGCCCCCAGGTTCAGCCTCAGCTCCACCACCAGAGCTCCTCTGCGGGACTATCTGGTCTACGGGATATATCCTAACAAAACGATCGTTAGGAAACGACCGGAGGACAACCTGATCGACGCTAGGAACGTGGACAGCCCGTACGTGATATTCGGTATCTTCCCGGATGGCAGGCTGGTCCGGAAATTCCCGAACGGAACGATAATACCGGACCCACCTAGGAGCCCCGTCGAGGTTGTGTTCTCACTTAGCACTACCACTACCACTAACAGGCCACCACCCAGACCGTATTATAACCAGGCTAACCAAGGCGTTTACAATCAGTATCAAGGCCCGGTGTACAGTAATATTCGTAGACCTGAGCCGATGAGAATCGTCCAAAGTCCCGGCACCGTTGACCTCGGCCTTACTGGTAACGCGATCGTCGGCCCCAATGGAGGTGGACCCGGTTTCACGGGGCCACTTGGTACCCCTGCTAGCCTCCCGAGCACCAACGAAATGAGCAATGCCCTGGTAAATACGCAAATGGGGACAGCATCGGTGACGCCGACAGTAAGTACCGGTCGACCGCCGACCGTTTCGCAGGGCGGTCGTATCGTACAGGATCGAGAGAGGGACGAGGCCACCAGGACGAAAGAGGTCGGAGGTCAACGCAGCTCCGTGTACATCGGACAGGACAAGTTCGTCAATTATTGGACCGATGGGGCCTCCACCACCAACCCGCGTGTCCTCGGTGTCAAAATAAACTCGGTGGCTACCGGATCAAATTTGGGACCGTCGCCATCCGTGCCGTCTTTCGCAAATCTTTTGAACAATGAACCAGGAGGTCAAGTTACAGCTCCACCAGGATTCCCATGGAGGGATCCATTGGATCAAATTTTCGGTATTACTACCTCCTCGCCGATAATAACAGCTTCAGTTGCATCGAACTCGCTGGATGATTCTTCGGAATCGAGCAATCCGACTGCAGCAAGGCCGGTGAACCCATTCGTGGAAATTTTCACTCCACTTTCGAACGCGATTGGTATGCCAAGGGGAAATGGCGTGCTTAGTGTCACAGGAGCTGTTCCTAGTACGACGATGCAAACTACTCCTATTACTACTACTATGGCACCAACACCACCAGCTGCACCATCAACACCACCAGCAACACCACCACCACCTCCATCAACACCACCAACTACTACCGCAGCTCCAACTACAACTACACCACCTACAACTACACCACAGCCTACAACTCCTCAAACTAATGCTGCATCGCAAGCACCTCAGTCAACTCCTGGATCCACAGGACCTCCTTCGACAACACCGACTAATTTGCCTGCAAACTTGTTGAATAATATGCAACAGCAGAACGCATTTGGAACGTCGTTTAATGACCTGGTGTTCCTGAATTCGTTGTTGCAGGATAATTCTCGAGGATCTAAAACAAAGACGCTGACCCAAGTCGAGCAGCTGTTAGCCAACAAGATTTTGTCCCTGGCACTGAACGGCCCCGACCCAGGCCCAACCCGCGCCCCAAAGGCCATCAGCTTCGAGAACGCCTCTCCGAATTCCGTCTACCAGTCTCCAAAGTCCTACG
AGCCGATAGTGATCGATTTATCCCCATCATCGACCGCCACGTCGCCAACGTGGAAACCGACCCAGCAAACTAGTCAGAAAGCGCCCATTAGTTCAACGACGGAACAAGTCACTCAGACCTCGATTTCGACCACGACCGCGAAGAGAGACATCATCACGAGCGCTCCTTCGACGACTGACAAAACCACCCTAATAAGCACCACAAAAGTCCCAGTCTCCCCTAAAACAGTGACTCGGCCCAGAACCACCACTGAGGCTCCCGTGGGTTTAGCGGGACTCTTGTGGCAAACTCTTCTGGGCGGAGGACTTTTTGGGCCATCGACTACTGAGAGACCTTTGAGGACTAAGCAGGTGAAGACTGTTACGAAGTCTGTGAACATCACTCCGAAGCCGATACCAACTACGCAAAGACCGACGACGACTAGTACCACTACCACAACTACCACCACGACTACCACAGCTCGTACTACAACAGTCAACACGATTGATATCTCGAAGATTCATGTGAGCACTCCGAATTCGATCGGAGTAGAAAAGAAGGCTGCTACGCCGGTTCCACTGTTGTCGACGACGAAGAAGTCGTTGCTGAATAATCCGAACCCCAGGTTGTCTGTTCCTACTTCCACTTTCTCTCCTGAAGAGGAGACCAGGTTCTTGCTGTCGATACTGAGAGCCGCTCAACAGGATGAGAAAGCTGGCGGTTCGAAAAATTCTCTGGACGATGAAGCCTTCTTGAGAGCAATTTTAAGCGGACAGGCTTCCCCGACAAGTACTCCTCCTCCGCAAACGGAAATCAGCAACGCTGCTCTGTTGGCAGCGTTGTTGAAGGCTCAAGGCATCGAACCCGAAACGCCTGCTACTAACATCAGGGAGCAATTGCAGTTGGCTAGCCTCGGCCAGAGCGTCACCTCTGCTCCGAGCTTATCCCCGGCTAGCAGCGGGTCTACGACAATTACAACAAGGCCGACTTCGACTGCGACTCGAGCCACGGATACGACGAAAAACACGGTGACACCGAGACCAACCTCAAGACCAAGGGTACGCACAACAACGTGGTCGCCGAGCTCCACGTATCCACCTCCTCTCTTCAGCTCCTTCTCCAATTACGCTACACCGGGACAGTCGGCTGCCGCTGGCAATTCGGATAATGGCGCGATATTTGGTGCTACCAGGGCGTTCAGTCAATTCCTCGGTGCTGCATTAAGCGGAGCGGCACAACAGTTGCAGTCGTTAGTGAGAAATGGTACTAGGATCGTGTCCGAAGTAGTGGGATAAAATTAGCAAGAAAATAATAAAAATTTTTCGCGTAATCCATAGAATAAGAGAAGCGATTCGCGAGCATGAAAATCTGGAATGAACAAGCTGGTGGTAGCGATGCTTCGAAATAAGTATTCTTTTAGATATTCATTAAAAGTCAATCTGTTTGCTCGATGTTGAAGAGAAACTTCTCGAAATTTCCTCCTCCTTTTTTTATGTATAGATCGTAGCGTTACGCGCAGATAGTTGTTGGGTGATTATGTATTTTATTTTTATTGTACGTAGCTGATAACGGGACGTGACGTGACTCGATCGTTCATTCTTAAAACATGAAGAACGTATTTTATAATAATTCATTTTCAACTTTTCCGAAATATAATTTAGTAACTTTTAATTTTCAAGTTTGTTACATTTTGAGGAAGAGAGATGTAAAAGTATTAACAGTTGAAAATTTAGAAATATTGTAATTTTAATTTTCTATATTGTTTACTTATAAGTTTTTATGAATGTAATTCAGAGCTTCAGAACTTTATAAATTTATAAATTGAGAAATGTAATAATTTAGTGAGTGATTTAGTTTTAATTGAGTGATTTAATCTTCATGTTTTAAGAGTTGAGCGATGCCCGTCGACAGCGATGACGAAACAATTCGGAAAGTGTGGAGTTTCGTTCCGATTCGCGACAGGAGTAACGACTGGACGCCTTGCAAACGTTTCTGGGGTAGGAGCGACCGATGGCTCGTAC
CACTTTGAAACATTTGTAACGTTGGTCGCAATTAAGGTAATTAATCGAGGGCGATGCGGCTCGTCACGACTCTCTGGACAGTGACGATCCGCGGTGTCTTCGCGTGAAAGAGGGCGTTCCGACTTCTGATGCCCACCCACAAAGATCGATTTAAGGGTCCAGTATCGTGGACCTCTTCCGGGAAAATCGAAAAGCCGACTTCATTTCTTCTGCGATAAAAGCAATTTAACTAATGTATGATTATCAAGCGAAACACCTCGTACTGTCATTCTCAAAATATTC\n>OQ027676.1 Uncultured bacterium clone 703 16S ribosomal RNA gene, partial sequence \nTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCGACGCCGCGTGCGGGATGAAGGCCTTCGGGTTGTAAACCGCTTTCAGCAGGGACGAGGCCGCAAGGTGACGGTACCTGCAGAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCGAGCGTTATCCGGATTCATTGGGCGTAAAGCGCGCGTAGGCGGCTTGTTAGGTCGGAGGTTAAAGACCGAGGCTCAACCTCGGCACGCCTCCGATACCGGCAGGCTTGAGTGTGGTAGAGGAAGGTGGAATTCCCAGTGTAGCGGTGGAATGCGCAGATATTGGGAAGAACACCAGCGGCGAAGGCGGCCTTCTGGGCCATTACTGACGCTGAGGCGCGAAAGCTAGGGGAGCAAACAGG\n>XM_035742444.2 PREDICTED: Oncorhynchus keta protein phosphatase 2, regulatory subunit B', gamma a (LOC118362247), transcript variant X2, mRNA \nCGCTTCATTTTCTCATCTGCTTTTGTGCTAAAATGGAGGCTGGCCCCTTACCTTAAGTGGATTGCCTTCCTGGTCGAGTTTAGATGTTGACATGCAATAAAGCTGGAATCAGGATGGTTGTGGATGCACCTAATTCCAATGGGCCTTTCCAGCCGGTGGCTCTTATGCACTTCAGAGACTGTGCTCCGGCAGAGCAGGAGAAGCTGTTTGTGCAGAAGCTGCGCCAGTGCTGCGTGCTCTTTGACTTCCTGTCGGACCCACTAAGTGACCTGAAATGGAAGGAGGTGAAGCGGGCGGCGCTGAGCGAGATGGTGGAGTACATCACGCACAACCGGAATGTCATCACAGAGCCCATCTACCCAGAGGTGGTGCATGTGTTTGCGGTGAACATGTTCCGAACGTTGCCTCCGTCGTCCAACCCCACAGGAGCAGAGTTCGACCCCGAGGAGGACGAGCCTACACTTGAGGCTGCATGGCCACATCTCCAGCTCGTCTACGAATTTTTCCTTCGGTTTTTAGAATCCCCTGATTTTCAACCGAACATAGCGAAGAAGTACATCGACCAGAAGTTTGTGATGCAGCTTTTAGACCTGTTTGACAGTGAAGACCCACGGGAGAGGGACTTCCTCAAAACAACTCTCCACAGGATATATGGGAAGTTCCTGGGACTACGGGCCTACATCAGAAAACACATCAATAATATATTTTATAGGTTTATCTATGAGACTGAGCACCATAATGGAATTGCAGAATTACTGGAGATACTTGGAAGTATAATCAATGGGTTTGCCTTACCACTAAAAGAGGAGCACAAGATATTCCTTTTAAAGGTCCTGTTGCCTTTGCACAAAGTCAAATCACTTAGTGTCTACCATCCGCAGTTGGCATACTGTGTGGTGCAGTTTCTAGAGAAGGACAGCACTCTCACTGAACCAGTGGTCATGGCCCTTCTGAAATACTGGCCCAAGACTCACTCCCCCAAAGAGGTGATGTTCCTTAACGAGCTGGAGGAGATTCTAGACGTCATCGAGCCATCCGAGTTCGTCAAGGTCATGGAGCCACTGTTCAGGCAG
CTGGCCAAGTGTGTGTCCAGCCCACACTTCCAGGTAGCAGAGAGAGCTCTGTACTACTGGAACAACGAGTACATCATGAGTCTGATCAGTGACAACGCAGCCAAGATCCTGCCCATCATGTTCCCGGCGCTCTACCGCAACTCCAAGACCCACTGGAACAAGACCATCCATGGCCTCATCTACAACGCTCTCAAGCTCTTCATGGAGATGAACCAGAAGTTGTTTGATGACTGCACACAGCAGTTCAGAGCAGAGAAAAACAAAGAGAAGGCCAAGTCAAAAGACCGGGAAGAGGCTTGGATAAAGATTGAGAACCTTGCCAAATCCAACCCACAGGTAGTCTTCTAGGGTGGATGTTGAACAGTCCTAGCATAAGTTACGAACGAGAGACCAGAGGAAAGACCGGCCTATGAAGCGGCGTAAGTCTGATCTCCCTCAGGACATCTACACCGCAAAAGCCTTGGAGACCCGTCGCCGAGCCGACGTCATGATCACTACCCGCGATGGGCTCTAGGTCTGCCCCTCTCTCTCTCTAGTTTCCAGTCCCATCTTCTCTCTTTCCTCTAGTGTCCAGTCCCCTCTTCTCTCCACCCTCATCCACACAGCACATTCAGATTACTGGCCCAGTTTCCTCATCGTCGCCAGTACACAACCCCCTGGATTTCTGCTTTCTCAGGTGTTTCTTTTTGGGAGGGGTGGGGCCGCAACTTTCTTTTTTAGTCTTGCCGTCAATTTTTTATTTTTTTTTGCTTAATCGTGCATAACAGTATCGGCTCATCCCTCCAGGCTCTTACTGTACAAATGAAAATGGGGGAAGTTCCGTTCCACTAGCAACATGACAAGCTCCTATGTTCCCCCATTGAGCGCAGTTGGTAGAGAGCAGAAACAGAATGGGGGAGGCTCCTCTCGTTTCCTCTCATGTCAGTTTCTGTTAAGGGGAAACAAAACTAAGAACAGCCATTGTTGGATGGTGGGGGGTGATTGGATCGACTTTTCTGAAGTTTTGTTTCTTCTCTTTTTTTGTAATCCCAGGGACATTTGCCAGTGCCAAGACTGTTTGTTCTTTCTGTGTCTGTGTTTTTCTGTGTGAGAGAAACCAGGATGACTGACTATCTAGGTAGACAGCCTGTGTCGTTTGCCTTCGTTTTTTTTTTTGGAGCCTCAGATGATTCAAATGTTGTTTTTTTAATAAGCTGAAGAGCAACAGGACTTTCTGAAGTGACTGATCCATCTGTTCTGATGAAGTCACTTTATGACTAGGATGGGTGGCAGGACGGGAGGTTCTCTGTGGACACTGGACTCTTTACACCCTACACTTTGTGCCATGCACATTCTTTCGTTGGATTGATTTCCTTTCTGTTGAAGTCCATTGGCAATATGTGAGCCAGATCACAATGAAATATTGACAGTTCAAACAATGGTACTTATTTCATACGCAGAAACACATTGGGTGGTTGTTAGTCTGCACCCACTTTGTCATATTCAAAAGCCCTTCTTAGACATTTCAGTCTCCTTAATTCATACATAATGCATGTCCCCAGTTCTTACTGCTATTGGGAAGCTTCATTTAAATCTCAATGGCCAGCTAGGAAGTGTTTGGTTTGACACAGAGTCCATCAAGACACCTGTAGCCACACACACTGTAATGCTACGTTATGCAGAACATTCCACAAACGTTCCAACTGAAATTACATTATGACACTTTACCTGGGGGTGTCAGTTTGAGGAAGGCGAGGTGCAGAATTACTCATCTCGATCACATAATACGTTATGTGGGATGTAGGGTGATGTTGTAGAACTGTGATTCTGCACAGCCTGACTGTAATGAAGTCCTTCTCAAAAGCACACCTTGTCCTCAGATGCAGGCTTTTCAGAATCCCCGGCGCTGCTTGCTAGTCAAGCATGTTCCAGAAGTACACATGGTATCACATGCCCTGAAGCCCCCCCACACAGCGGTCTCACGTTTCCCCATGTTGGTTTTTACCAGTGCCCTCCTACCC
AGAGGTGCTTTGCTGTGGAGCTGAAAGGACTGTTACGTGTCTTGTTGTGAAGTACTGAACAAATGGGGATCAGAGAGCCGTTTATGGAATGGCGGAATGCTACAGGATGAGAACATCAACACTGTTTGGATGACAACCGTTTCATGTGACAGTTGAATGAGCATTGGAAGAGGTGATTTCAAACCTGAATACCTCTTTGGATGATATCTGTAACCGTTGAGAATACGTCTATTGAAAAAGCACTTCCTGAAACTTGAAAGATGTGACATGTTTGTGTATCTTCATTGAAGCGCTCTTCAGTGTCCCGTTGAGTCTATATGTACAGTCTGCTCTGCTTTGTCAAGTTCAGGAAGCTGTCCATTTCCTGGACTGGACAAGGAAACGACCCATAAGTAAGCATTTCAGTGTTAGTCCACGCCTGTTGTTTACGAAGCATGTGACGAATACAATTTTATTTGATTGGGGCCCCATTGTAAATGTTAGTCTTTCTCTGGTACCATTGTTTGAACTTGCAAATCTAGTACGTGTATCCAATCTGTATTGTCTTTTCTGTTTCTAGTCTGGCAACTGGTAGCCTGGATGCTCATTTTAGCATTGTAGCTGCCAATGGAAAGGGCCAATGTTGAAAGACTGGCATCCAGGCTTGGCTTGGTAACTACATTATTAATACTTAAATGCAAAAAGGTGTTCATTTAACTACCATGTATCTTTTGTCCTGGACGAATGGCACTCGCCGAAACAATTTGACCCCCCCCAAAAAAAAAAAAAAAAATCTTCACTTTTATATAACAGTATCATTTGGAAAGATGTTTGATCAGTTTGCTTTTTATTTGTGTTCAAACTTTTTTTTTTTTTTAGACACATCAATTACTCGTATGACAAGTTAGACAACAAATGTTTTGGATTGTTTTCCAGAATTGTTTGCTTGGCCTCTGCAGGTTTTTAGTTAGAACATGTACTTTCCAGAATATAATAACTTGACAAGTGTCCTTTTGTCTGTGATCTGTACTATGTGGCTTCATTTAATATTGTACATATGATTTACTTTGTTTTATGTAGTGTTATATCTAGATTAATTTTGTATAAAATTGTCCTCTGTACAGAATAAAACATCAATAGCAATGACAAAGAAGTCAATGTGGCACATAACTTCTCTCTCCCCTGTAACTTTCTGCATTATTAGAAATAACACATCTAATATTTTCTTTAATTCCCAATTATCTGTGACCAGATTTCAGTCCGTAGCCTTTTGTGTGCTTTTATCACAATCTCAACTGGTGTTCATCTGTAATAGAATGAATAAAGAGAATATTTGAATTTTATATTTTCAACCATA\n>XM_023493610.1 PREDICTED: Eurytemora affinis uncharacterized LOC111718108 (LOC111718108), mRNA 
\nGGCTCGTAAACTAGGGTTTAAAAAAGATTACTACCTGGAATCAGAGAACTGGTTTGGAAACACAACAAACATGACTTCAGATCAGATCCTTCAGGAGATAGTTCTGAAGAGGAATGAAGTGTTTGCTGACAACGATGCGATCAGAATCAAGACAGGGCAAGAGTATTGGAAGTTTTATATAGAGAAAGGGTATTACAGGTCACCAGGACCTGATTTTAGGTACTACTACTACGAGAGGCCGGATAGTAACATCAGTTCTCCTCTGTTTACGGAGAAGAATAAAAACTCTGGTGTCTGTTATAAGTTCCAGGTTCCAGAGTTTCTCTGGAAGAAAGGAGTTTCACAAATTTATATAAATACAAAGGTTAACACATTGATCGGATTCAGCCACTATGGCCAGAGGAGTGGAATTGACAATCAGGACAGGGTGTTCCTAAATACAGATGAGAAGATATATCTAATATTAACCCAACAGCACTTTGAGAGGATCCGGGTTCATGGAAAGCTCTGCAATTCAGAACTAAATACCGGGTTTGACAGTTGCAATGAGCAATGGCTTCATGATTACTCTGTGGCAGAGTATGGATGTATAAGTCCATGGAACAATGTTCCCTCCAACTACTCTGTGTGTAAGAATAAAACGTGTACTAGCGGAGTAAATGATATTGTTTTGAACTGGGTTAATGGATTCAATGATAGTATGTGTGGATCCCCGTGTGAGAGCTCGGAGGTGATGTTTGCCTCGCAGTTCTCCTACAAGGTGGAGGGGATGGGGTATGGATACCTAGCCATCACATTCAAACAATCTGTCAAGGTTACGAGGTCTTCTATACCCTACGGGTTTCTAGAGATGCTGGCTGAAGTAGGAGGATATGTTGGACTATTCCTAGGAGTCTCTATTCAACAACTTGTAGCCATGCCAGAGACCTTTATTGATAAAATATACAAAATACAGTTTTAAATATATCACCATCATCATACACTACACTAGTTAAACAATGATCAGTTTTTGGTAAGAAATATTTGT\n>XM_035042612.1 PREDICTED: Populus alba uncharacterized LOC118036784 (LOC118036784), transcript variant X6, mRNA 
\nAATCAGCTCGCCCATGATTCCTCACAACCACATCTCACCAACAAACCCTCAATATGCATTCAGCAGTCCAGTTCAGATGCTATTCATCAGAAACTATGAATATTTCTGCTGGTGCTAACAACTGTTCTGGTCTTGACATTATTATGGGAAGGGGAAGAAAAGAGGAGTACAAAATATTGAGGATGTTTACATCAAGCAGCTTTATGGGAGCCGAATCAAGTTCATATATCAGAGATGGCTTGAAGCTGCATTGATGAGAGTATTGACTTTGCAAATCGCTATTTAGAATGACATGATACATGCAGCACAGTAAAGACAACGTTTGGTTTGGACGAGTGGGTGATTTTAGAAAAAGAAAACAGGATGCTCGGACAGACAAAACATGCATGCTTTTCTGTCAGATTATATGCAAATCTGAACGACACCCTGTAAGATTAAAAAAAGAAAAAGCAAAGAGAAACTCGATCGAGAGTACTGACGAGCTGCCAGCAAGAGTACTAGTTTGAAAGGTCATGGATTGAATTTTTATTTTATTTTATCTACTGACTTGGAAAATTATGCCCAAGTGTCCAAGTCCTTTTGACCAAAAGACTCGCCTTTGAGTAAGTGGGCCATTGTCAAATTCGGACACCAAAAGGGAAGGGCTGAACTGTTAGATATGATGCCTCAGCTTCATAGAAGTAAGTTGATTCCCAAGTATTAATTATGCCGACTAGGAGAAAACCAAAGGAGTACTGCATGCATGTGAACTCTGGAAGAAACACATCTACACACGATAAAACCGCCGACGGCTATGGAGTGAACCCATTTCCAATCGGGCAGTGCCTATCACCTCTACCTGGAGAGTCTCCTACTGCCCATACTAAGCCGAAAAGAAAAGCTCCTAAAACTGCCAAGGATCTTGAAAAGAAAAGAGAGTACGACAGGGCATATCGGCGACGATGCAGGGAAAATAAAAGGAAAACTGAGCAAGAATTGTTTGTGCTCACAGAAGAGAATAAGAAATTAAATAGAGAGAATGACTACTTCAAAAGGGAAGAAGTTCAGCTGCAAGAGATGGTGCAATCTCAGAAAGACGAAATGACACTGCTACAGAATAAACTTCGCCAACAGAAGGCCCAGCTTCAGGGGCAAAATGTAGTCGTGGATGTGCTTTCGAAGAAAGTAGCTAGTATCGAAGATAATATGGATCCTCAGCGCGAAAATAAACGGCTGAAATTAGAAATGGATTTGCTGATTAAGAAGATTAACAACGATGACTATTTAAACCTCATTCAACCTCGAGAAAAAAACATGAAACTAGAAAAAGAGAAGAATGATCTCCAGTTGATTATTGATGCCTTATGTGCAAAGATAAACAAGGATAATGACCTCGAACCAAAGCAAGCATCCTAATTAATGTACTGAGCTACAAAGTAAATGGACAGAGGAGGTGTTCTGACAGGAGAATTAAGAGGCTACACGAATTTAAATACCCAAGGATGTGACCTAATGTGTTCTTAGAATTGCATGACCTATTATATTGACCTAATCATCATGTATGAAGGGTGTTCTTAGATTTTAGCAGCAAAAGTATCAAGAAGTAAATAAATAAATTGGTACTTGGAGGTTTTGATTTGCCTTTTAAATTGGTAATCTCTCTTGTACTTAGTGTATGTAAATCTCACTGGTTAAGGCCATCTTATAAGCCTACTAATATCGCTCATGAGCACCGGTCTCCCCCATTTGATGGAGGAATAAAATTGACAGTGGTGGAACCAGCAAGATGAATGATCCGTATAGGGATATTTCCTTGGGGTATTTCATGGCAGGATTTGCAGCTGGATTGGCTATGGAATTTGGGAATCAGATGTTTGCATCTTGAAGTAGCTTCCAAGTGGTTAAACATGTTTTGGCAGATGATCAAGGACAGGGCAGGCCCTTATGCTATTTTTCCAAGATGGGTATAAATCTTCCACGCAGCGACTGGAGGGCAGAAACCTCTCCAGTGTAGGGGGG
GTCTAGCTCATGTTCTTATAG\n>XM_011946569.1 PREDICTED: Colobus angolensis palliatus RIB43A domain with coiled-coils 1 (RIBC1), transcript variant X2, mRNA \nGGAGTTGGTGCTGGGCGGAGTCAGAGCAGCTCTTGAGGGTCAAGGAGGCGGGGGAGACCTGAGTTCACGCTTGCTGAGACAGAAGTCACAGCAGGATTATGCCCCTCAGGGCAAGAGGAAGGTGGGAGCTCGGCTGTGGCTTTAGCCTGGCCAACCTTCAAGGCTAGGACAAGGACAGGGGCGGGAATTGGAAAGACCCGGGGGGAGCGGAGGGCTGGACGAGAATGAGGGGCCAACGGGAGGATTCAGTGTTAGAGTTCAGAAACTGCCGCTGTAACCCAAGAACAAGGTTGCATGCAGAGCCAACCTAAGAGCTTCAAAATCGGGATTCCTTACTGAGAAAGATGTATAACATAAACCAGTCAACAGATACCAAGGAAGCAGCAGCCATCGAGGCCAGAAGAAATCGAGAAAAAGAGCGACAAAACCGATTCTTCAATGTGCGGAACCGAGTCATGGGGGTGGATGTCCAGGCCCTGAACAACCAGGTAGGAGACCGAAAGCATCAGGAAGCAGCAGAAAGAAGCAAGGAGGCAGCTTATGGTACCAGCCAGGTGCAGTATGATGTGGTAGTCCAGATGTTAGAGAAGGAAGAGGCAGATCGAACACGTCGGCTGGCCAAGAAAGTCCAGGAGTTTCGGGAGCAGAAGCAGCAGCTCAAGAACGGGCGTGAATTTAGTCTTTGGGATCCAGACCAAGTCTGGAAGGGGCTTCCAACCTATCTTAGTTACAGTAATACCTATCCTGGTCCAGCCAGCCTGCAGTACTTCTCTGGGGAAGACCTAGACAGGGCCACACGGCTGAGAATGCAGCAGAGGCAGTTCAGGTACAACTTGGAAAGGCAGCAGCAGGAGCAACAGCAAGCCAAGGTTGATGAGAATTGTGCAGATGCGCTCAGTAACCAGCTGCGCCTCGCCATGGACGCGCAGGCCACCCATCTGGCCAGGCTGGAGGAGTCTTGTCGTGCGGCCATGATGTGTGCCATGGCCAATGCCAACAAAGCGCAGGCAGCTGTGCAGGCTGGGCGTCAGCGCTGTGAGCGTCAGCGTGAAAAGAAGGCCAACCTTGCAGAGATCCGGCACCAGAGCACAAGTGACCTACTGACTGAAAACCCCCAGGTCGCCCAACACCGTACAGCTCCCCACCGGGTCCTGCCCTATTGCTGGAAGGGCATGACTCCAGAGCAGCGAGCTGCCATCAGGAAAGAGCAGGAAGTACAACGCTCTAAGAAGGAAGCTCACCGTCAGGCTGAGAAAACACTGGATACTGAATGGAAAAGCCAGACCATGAGTTCAGCCCAGGCATTGCTGGAGCTAGAAGAGCAGGAGAGGGAATTGTGTGCTGTATTTCAAAGGGGTCTAGGCTCTTTCAACCAGCAGCTGGCTAATGAGCAAAAAGCCCAGCAGGATTACCTGAATTCAGTAATCTATACCAATCAACCTACAGCCCAGTATCACCGGCAGTTTAACACCAGCAGCCGCTAAGTTCAGGATGTTTATCTCTTCCTTCTCCTCCATCAAGCTCACAGGCAGTTAGGAGTCAAAGAGAAAAATGCTGCATACTCCCACCTTCTAACCTAGGTAATAAAGTTCTTCACTCAAAATCAA\n>HM954641.1 Uncultured Sphingobacteriales bacterium clone GG5QJA201E0Q5R 16S ribosomal RNA gene, partial sequence 
\nTAAAGGGATACTTCTTCGGACAATATACAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCGGGTTAAGTCCCATAACGAGCGCAACCCCTATCATTAGTGCCATCAGGTCAAGCTGGGGACTCTAATGAAACTGCCTACGCAAGTAGTGAGGAAGGTGGGGATGACGTCAAATCAGCACGGCCCTTACGTCCAGGGCTACACACGTGCTACAATGGCCGGTACAAAGGGCAGCTACCTGGTGACAGGATGCTAATCTCAAAAGCCGGTCTCAGTTCGGATCGGAGTCTGCAACCCGACTCCGTGAAGCTGGAATCGCTAGTAATCGCGCATCAGCCATGGCGCGGTGAATACGTTCCCGGGCCTT\n>JN110382.1 Trichosporon asahii strain f2fp12 26S ribosomal RNA gene, partial sequence \nACGGCGAGTGAAGCGGGAAGAGCTCAAATTTGAAATCTGGCAGTCTTCGATTGTCCGAGTTGTAATCTATAGAGGCGTTTTCCGTGCCGGACCGTGTCCAAGTCTCCTGGAAAGGAGTATCAAAGAGGGTGATAATCCCGTACTTAACACGACCACCGGTGCTCTGTGATACGTCTTCTACGAGTCGAGTTGTTTGGGAATGCAGCTCAAAATGGGTGGTGAATTCCATCTAAAGCTAAATATTGGCGAGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGATGAAAAGCACTTTGGAAAGAGAGTTAAACAGTACGTGAAATTGTTGAAAGGGAAACGATTGAAGTCAGTCGTGTTCTTTGGATTCAGCCAGTTCTGCTGGTCTACTTCCTTGGAACGGGTCAACATCAGTTTTGTCCGGTGGATAAAGGTAGTAGGAATGTGACTTCTCCGGAAGTGTTATAGCCTATTATCACATACACTGGGTGAGACTGAGGACTGCAGCTCGCCTTTATGGCCGGCCTTCGGGCA\n>XM_022629730.1 Penicillium arizonense hypothetical protein (PENARI_c005G05025), partial mRNA 
\nATGGCCCCCGTGGAAACACAGCAGTATGATTACATTGTCCTTGGCGGTGGTAGCGGTGGCAGTGGAAGCGCTCGCCGTGCAGCCGGTTGGTATGGTAAAAAGACCTTGATTGTGGAAAGTGGACGGTCAGGAGGTACCTGTGTCAACGTTGGTTGTGTGCCTAAGAAAATGACCTGGAACTTCGCAACCATTAACGAGATGCTGCATGTTGGCAAGAGCTATGGCTATGACATTCCTGATAACATCGCTATGGACTACACCCACTTCAAGAACACCCGTGACGCCGTTATTAAGCGGCTCAATGGCGCATACGAGCGCAACTGGAACCGGGAAGGAATTGATCTCGTGCAGGGTCGTGCAGGCTTCGTTGAGCCTCAAACCATTGAGGTCAAGCTAGCCGACGGCTCCGGTTCTGCCCGCTACACTGCGCCGCACATCCTCTTGGCCACCGGCGGCCGGCCCAACATCCCCTCCGTGCCCGGTGCCGAGCACGGTATCACTAGCGACGGATTCTTTGAGATGGAGGATCTTCCCCCGAAGGTTGCAGTCGTGGGTGCTGGCTACATTGCTGTCGAGCTTGCTGGCGTCATGAACGCTGTCAATGTCGAGACCCACATGTTCATTCGCGGGGAAACCTTCCTCCGCAAGTTTGACCCTATGATCCAGAAGACCATGACCGATCGGTATGAGGCTTCCGGTGTCAAGCTTCACCGTAACCACTCCGGATTCAAGGAAGTGCAACTCATCCGTGACGGCAAAGGCAAGGATAAATTGCTCAAGCTCATTGGCCATGACGGCTCTGAGCTTGAGGTGAACGAGCTGCTCTGGGCCGTGGGTCGTGCCCCCGAGGTCGAGGACCTGAACCTCAATATCCCCGGAGTCAAGCTGAATGCCGGCGGTCACGTTGTGGTTGACGAGTACCAGAACACCTCGGTCGAAGGTGTCTATGCTCTTGGTGACGTGACAGGTCAAGCCGAGCTGACCCCAGTCGCCATCGCCGCCGGTCGTCAACTCGGCAGCCGTCTGTTCGGTCCCCCGGAGCTCAAGTCATCCAAGCTTTCATACGAGAACATCCCTACGGTCGTCTTCTCCCACCCCGAAGTCGGCTGTGTTGGTCTCACGGAGCCCGAGGCCCGCGAGCGCTACGGTGATGACAAGATCAAGATCTACCACACCAAGTTCACGGCCATGTTCTACGACGTCATGCCCGCCGAGGAGAAGGCTAAGAATCCGACTGAGATGAAGATAATCTGCGCCGGTCCCCAGGAGAAGGTTGTCGGTCTCCACATCTTGGGCCTCGGTGTCGGTGAGATGCTTCAGGGCTTCGGTGTCGCTGTCAAGATGGGCGCCACAAAGCAGGACTTTGATAGCTGTGTTGCTATCCACCCTACTAGCGCCGAGGAGCTGGTGACGATGCGGTGA\n>AF339527.1 Harposporium helicoides strain Arsef 5354 large subunit ribosomal RNA gene, partial sequence 
\nAAATTTGAAATCTGGCCCCCCCCGGGGGGCCCGAGTTGTAATTTGCAGAGGATGCTTCTGGCGCGGCGCCTTCCGAGTTCCCTGGAAAGGGACGCCACAGAGGGTGAGAGCCCCGTCTGGTCGGACGCCAAGCCTGTGTGAAGCCCCTTCGACGAGTCGAGTAGTTTGGGAATGCTGCTCAAAACGGGAGGTATATGTCTTCTAAAGCTAAATACCGGCCAGAGACCGATAGCGCACAAGTAGAGTGATCGAAAGATGAAAAGCACTTTGAAAAGAGGGTTAAACAGTACGTGAAATTGTTGAAAGGGAAGCGCTTGTGACCAGACTCGGACCCGGCGAATCACCCAGCGTTCTCGCTGGTGCACTTCGCCGGGCCCGGGCCAGCATCAGTTCGCCGCGGGGGACAAAGGCGGCGGGAACGTGGCTCCCCCGGGAGTGTTATAGCCCGCCGCGCAATGCCCTGGGGCGGACTGAGGTTCGCGCTCCGCAAGGATGCTGGCGTAATGGTCACCAGCGACCCGTCTTGAAACACGGACCAAGGAGTCGTCTTCGTATGCGAGTGTTCGGGTGTGAAACCCTTGCGCGTAATGAAAGTGAACGCAGGTGAGAGCTTCGGCGCATCATCGACCGATCCTGATGTTCTCGGATGGATTTGAGTAAGAGCATACGGGGCCGGACCCGAAAGAAGGTGAACTATGCCTGTGTAGGGTGAAGCCAGAGGAAACTCTGGTGGAGGCTCGCAGCGGTTCTGACGTGCAAATCGATCGTCA\n>XM_024173345.1 PREDICTED: Morus notabilis allantoinase (LOC21397670), transcript variant X1, mRNA \nGTTCATGAACCTCTCCACGACACGAGCGAGATTCTTCTCTCTCTTTCTCTCTCTTATTGGTCAGTGTAACGCATAATATTAGAAGTAGATGAAGAAGAGAGAGAATATGGAGAATAGGCTTCAATGGAGGCTCTTTCCCCTGCTTGCGATACTCGCTTCATATTTGGTCTTCTTCTACGTCCAAAACCATTCCGAGCTCTCACATAATAGATGTAGTCTGCTGCCTCACCAACACTATTGGATAGCTAGCAAGCGGATTGTGATACCACAAGGGATTATATCTGGAGCAGTTGAGGTGAAGAATGGGAAGATTGTATCGATTGTCAAAGAAGAAGAAAGGTTGTGGAGTTCCAAGTTGGGGCAAGTAATTGACTATGGAGATGCGGTTGTCATGCCTGGCTTGATTGACGTGCATGCACATCTTGATGATCCCGGAAGAACTGAATGGGAAGGATTTCCTTCAGGAACTAAAGCGGCTGCTGCTGGAGGTATAACGACATTGGTTGACATGCCTCTGAATAGTTTCCCCTCAACTGTGTCTAGGGACACATTGAAACTTAAGATTAAGTCGGCAGAGAACAGAATTCATGTCGATGTTGGTTTTTGGGGAGGTCTTGTTCCTGAAAATGCGTTCAACCATTCCGCTCTTGAAGACCTCTTAAATGCTGGTGCTCTTGGTCTAAAGTCGTTTATGTGTCCTTCAGGGATCGATGATTTTCCCATGACAAACATTAGTCATATTAAGGAGGGCCTGTCAATACTTGCAAAATTTAGAAGACCTTTACTTGTGCATTCAGAGATTCAAAAAGATCTTGAAAGCCCTTTGGGACTCGAAGAAGATGGTGCCAATGACCCTCGTTCTTATTCAACATATCTCAAGACTAGGCCGCCTTCAATGTTGCTGAAACTTTCCAACTCTGTTTTTTTAACTTTTTGGTTCAAACACAGGGAGGAAGCAGCTATTAGGGAGCTCTTGACAGTGTCAAAAGACACGAGGATTGGTGGCCCTTTAGTTGGAGCTCATCTTCACATTGTTCACTTGTCTGATTCAAGTTCTTCCTTGAATCTTATCAAGGAAGCAAAACGTGGCGGTGACAGTTTGACTGTTGAGACTTGCCCACACTA
CTTGGCTTTCTCAGCGGAAGAAATTAAGGACGGAGACACTCGTTTTAAGTGTGCGCCACCCATTCGCGACGCAGTCAATAGAGAAAAACTGTGGGAGGCAGTAATGGAAGGACATATCGACATGTTAAGTTCCGATCATTCGCCAACAGAGCCAAAACTCAAGCTTCTTGAGGAGGGTAACTTCTTAAAGGCATGGGGAGGAATATCATCTTTGCAGTTTGTGCTTCCTGTGACATGGTCATATGGGAGAAAATATGGTGTAACATTGGAACAATTAGCTTTATGGTGGAGTGAGAGGCCCGCAAAGCTTGCTGGACAAGAATTAAAGGGGTCCATTGCAGTTGGTAATTATGCAGATATAGTTGTATGGGAACCTGAAGTAGAGTTCAACCTCAATGATGAATATCCTGTATACCTTAAACATCCTGGTATTTCTGCCTACATGGGAAGCAAGCTATATGGAAGAGTTTCGGCAACCTTTGTGAGGGGAAACCTTGTCTACAAAGAGAAGAACCATGCCACTGCTGCTTGTGGTGTCCCAATCCTCGCAATATAGAAGTTGCTGCACCATTGAACTCCTTTTGTTTTCCTCTTCTTTTTTTTTTTTGGTTTATGTTATGTAATTAAACATCGAGTTTGTTGTTTCTTTCTTAACATCATGTGAATATTATGTACATCTGTATAGTACACCACTTTTAAGTACTTTTTCTGTTTTTTCTTTTTTTTCAATACAATACGGAATCAAACCCGCACTCTCAATTGAAGCTC\n>XM_016927369.2 PREDICTED: Pan troglodytes S100 calcium binding protein A8 (S100A8), transcript variant X2, mRNA \nGAGAAACCAGAGACTGTAGCAACACTGGCAGGGAGAAGCTGTCTCTGATGGCCTGAAGCTGTGGGCAGCTGGCCAAGCCTAACCGCTATAAAAAGGAGCTGCCTCTCAGCCCTGCATGTCTCTTGTCAGCTGTCTTTCAGAAGACCTGGTTCTGTTTTTCAGGTGGGGCAAGTCCGTGGGCATCATGTTGACCGAGCTGGAGAAAGCCTTGAACTCTATCATCGATGTCTACCACAAGTACTCCCTGATAAAGGGGAATTTCCATGCCGTCTACAGGGATGACCTGAAGAAATTGCTAGAGACTGAGTGTCCTCAGTATATCAGGAAAAAGGGTGCAGACGTCTGGTTCAAAGAGTTGGATATCAACACTGATGGTGCAGTTAACTTCCAGGAGTTTCTCATTCTGGTGATAAAGATGGGCGTGGCAGCCCACAAAAAAAGCCACGAAGAAAGCCACAAAGAGTAGCTGAGTTACTGGGCCCAGAGGCTGGGCCCCTGGACATGTACCTGCAGAATAATAAAGTCATCAATACCTCA\n>XM_050595833.1 PREDICTED: Cataglyphis hispanica C1GALT1-specific chaperone 1-like (LOC126851659), transcript variant X2, mRNA 
\nTCGCGTTGCGAGAGTGGACAAGCGGCAGCATGCATATAGCATCTCCGGATGTCCACTCAACGCAGATAGTGCGGCCACCGTGAGGCTTTAGTGGGTAAAAATCTCACATAATCCTCGACTCTCCCCGAAGTCGAGGATATCTTTGGAAGATTTCCTCACGTAAAAAAAAAAAAGAATGCATTTATATACCAATCATACACATATATGATTGGTGGTGGAAGGGGAAGAGGGTTATGTGAGTTAGGTTAAGCAAACAGATGACTTGTTTATGTCACCTGTTGAATATTGTGATCACTAGCAAACACTACCGATTGATCGTCGCAGATGTATATAGGTGTGTTTATAATGTAAAAATGTCAGATATAGAATTTTACACAATTATGTAAACGCTTCAAAATATAATCTTCATGTTAATTCGTCGAATAATATTATAAATGATTTTGCGATGATTTCATCGCATATTTTTATCGATAATACAAGCGCAAAATGCATACTACAGACTATATACATCAACTTTACAAATAAGAGGATACATATAAATTTAAAGTATGCATAAGAAAAGATCTTAATGAGATAATTGAGTTTAACGAAGGTCAAATATAATGATAGTCAAAGAAACTTGTGATTGGCATTACTTGACTACTTGGCATTAGTGTTGAGAGAACTGGATTGTTATTATGTATTTATCGAATTCAATTTTTACTGTGATGACAAGATGCGATTTCGATTTTTAAAACAGAGATCTATATTTCTGATTGGTTTGACAATTGGCTTTGTTTTTCCATTATTGTTATCTTTATTAAGGAATATATTTGTGATTGATTCGATGTGTAAACAAGATCAACCATTGTGGCAACCTGAATATTATCTGAGTAAGGAACCTCACCACGAAGAAATTATTTTACAGCATTGGGAAAAAGTGAAGAGATCTGGAAATTTTAATATCGTTACATACAACACTTGGTTGGCAGCACAAAACTTGAAACCATACAAACTTGATTTGGATAGATATCTATATCTCCAAAAAGGATACAATACAAGAAAAATTGAAAGCGAATGGAACTGGTTAAAAGAACGAGTATCTGTCACATGTATAGTTTTTGTAGAAAAACTCAAATTGGGGAAATCAATCCAGAATACATGGGGTAAACGCTGTAACAATATTTATTTCTTTGGACACCGTTTGAAAGACGATGAATTGCCTATTATAAATATAAATACAAAGATTGTGTCATCTTGGCAATTGCTGTGTGAAGCTATGAACTACATTTGGAAAAAAGAAGCAGACAAATTGGAGTGGATTATTTTCGTAAAAGATAATACTATAGTCATACCGGAAAATCTGCGCTATATGATTGCTCCGTTAGACCACAGAGATGATTACTATCTGGGTCATCCAATAGTTCTGTGGGGTCAGATTTATAACGTTGCTCAATCTGGATATGTTCTTAGTAAAGGAGCACTTGTTAAAGTATTACAAATGTTCAATACTACAGAAAAATGCATTGAAGGTGGAAAATATTGGAAGAAGGAAGATTATTATCTTGGAAAACACTTATCGTTTTTGGGTATACGTCCATCTGATACCAGAGATCAGTATTTGAGAGGTACTTTTCATGGTCATTCTTTACAAAATCTTCTATGGGGTATTATCAGACCAGATAGCTACTTTACACATGCTGTGTATCCGACGAAAGGAGAATGCTGTTCACCGATATCTGTGACTTTCAGTGTCAGTGAACCCGACAAAATGCATATGTTAAATTATTTGCTATATCACTTGCATGTATTTAACAGTGAAAGCAAATTTGGCAATATATCCATCAAAATTCAAGTACCTGAAGACAATGTATGGAAGATTGCACTGCAGGAGGAATTCAACATCACACATTTGAACGATATATCGAGTGACGCTTATTACGAAATATGGCACTCGAAATATTCGGAACCTGGACAGCTAAGAATTGCTAAAAATTATCGAATGACGTCGGATGTACT
AAACTGTTTATTGACGAACTACAAAACAGGAAACACGTCTGCGTATAATTGTAGAAGTAAAACAGTCGTCGACAGTACAAAAACCTAAGCCATTAAAACAGCTATTAAAACATTATTTAACAGCTTTATATTATTATTATCAAGACAGAAGATTTACAAAAAACCAATAGACGGTGAATATCTCCAGTCTTGTAATATGCGATTTTCTATACATAAAAATCACGTTATAAACTTTAACAGATAAGTACATTAATAAAGTTAATATTATTTGACCTAA\n>XM_030571406.1 PREDICTED: Gopherus evgoodei complement factor H-related protein 2-like (LOC115655701), mRNA \nATGACGCAGCTTGGATATACTGCCATTCTGATATTATGGGCGTGCTCCACTGCATTAGCTATTTCATGTGGTAACATAGAAAATGGGAGGGTAAAGCCAAGTTTCTTCTTCCAGAGAAGAAAAAGAACATTTGAATGTAATGCCGGGTATATAGCAGAAAATGACAACAACAGAATTGAGTGTACTTCTTCAGGATGGGCTCCTGTACCCAGATGCATTCCAATACAATGTGGAAGGATAGAAAATGGGAAAATAGTGGACAAAGTTGAAGAAAAAACCACCTTTCGATGTGATCATGGATATAAATCTGAAAATGGAATTAATGAAACTACCTGTACCGCTGAAGGCTGGTCTCCAGTACCTATATGTATTGTTCAAGAGTGTTCGCATCCACCTGACATCGATTTGGCAGAAATTGTCAGTGGGGAGAAAGCAGAATATCAGGAGGGTGATGTTGTTCAGTACAGGTGCTACCCAGGATATACTTTGGCAGGATCTGAAAGGATAACATGCAATGGAGAAAAATGGACACCTCCACCAAAGTGCTTCGCTCCATGTATTATCACAAGGCAGCAATTAGAAACAAAAAAATTGCTTCTGTCTAATGGCCGAAGACGTACAGTATTGATTCAAAGTGACCAAACAATGGAATTTCTTTGTGGTGAACATTCTGACCTTAAAATCCCCTACTTCATCAAGTGTGTAGATGGGCACATGGATTTACCAACTTGTGTATCAGGAACTGGGGAAAAGTGTGGCCGGCCACCTACTATTGAGAACGGAGACATAACTACTTTATCCCTAAAAGAGTATGCATTTGGATCTTCGGTAGAATACAGATGCCAGCATTATTACATAATAGAAGGAGACCGGAAATCATACTGTTACAATGGAATCTGGACAAAAGTACCAGTTTGTTTGGAGCCATGTGTTATCACGCAAGAAGATATGAGATCACGCAACATAGATCTAAAGGGGGAGTCAGCTCAAAAACGCTATGTGTCACATGGAGATTTTGTAGAGTTTAAGTGTAGATCCAGTTGGTTTCAAAACTCTTCAAATAATTATAGAGTGCAGTGCAATGCGGGCCAAATACCTTATCCCCAATGCACTTAG\n>XM_045878377.1 PREDICTED: Mirounga angustirostris ret proto-oncogene (RET), transcript variant X2, mRNA 
\nCCAGACCCAGGCGCGCAGCAGCGGAGGGCAGCTGGAGTCCGCGCCCCGACGCTCTGCGCCCCCCGTGTCTCCCGCGTCCGCCGCGCCCCGGGCGGGCATGGGGCGGCCAGGCTGAGCGCCGCACCCCGCCGCCGACACCCCGGGCCCCAGCCAGCAGCCCTCTTGCCGCGGCCCCGGCGCGCACGGGCCATGGCGAAGGCGACGGCGACGGCCGGCGCCGCGGGGCTGCGGCTGCTGCTGCTGCTGCCGCTGCTCAGCGAAGCTCCGCTAGGACTCTACTTCTCTAGGGATGCTTACTGGGAGAAACTGTATGTGGACCAGCCAGCTGGCATGCCCCTGCTCTATGTCCATGCCCTGCGGGACGTCCCCGAGGAGGTGCCCAGCTTCCGCCTGGGTCAGCATCTCTACGGCATCGCCTACCGTGCGAGGCTGCATGAGAACGACTGGATCCGCATCGAGGAGGACACAGGCCTTCTCTACCTTAACCGGAGCCTAGATCGCAGCGCCTGGGAGAAGCTCAGCATCCAAAATGGCGGCTTCCCTGTGCTCACCATCTACCTCCAGGTCTTCCTGTTGTCTACGTCCCTGCGTGAGGGCGAGTGCCAGTGGCCAGGCTGTGCCCGGGTGTACTTCTCCTTCATCAACACTTCCTTCCCGGCTTGTGGTTCCCTCAAACCCCGGGAGCTCTGCTTTCCCGAAACAAGCGTCTCCTTCCGCATCAGAGAGAACAGGCCTCCTGGCACCTTCCACCAATTCCGGCTGCTGCCTGTGCAGTTCCTGTGCCCCAACATCAGTGTGTCCTACAGGCTCCTAGAAGGTGAGAATCTGCCCTTCCGTTGCGCCCCGGACAGCCTGGAGGTGAGCACACGCTGGGCCCTGGACCGCGAGCTGCGGGAGAAGTATGAGCTGGTGGCCGCGTGCACGGTGCGCGTCGGCGCGCGCAAAGAGGAGGTGGTGATGGTGCCCTTCCCCGTGACCGTGTATGATGAGGACGACTCGGCGCCCACCTTCCTCGGGGGCTTCGACACCGCCAGCGCTGTGGTGGAGTTCAAGAGGAAGGAGGGCACTGTGGTGGCCACGATACGTGTCTTCGATGCAGATGTGGTGCCAGCATCTGGGGAGCTGCTGAGGCGATACACAAGCACACTACTCCCTGGGGATGCCTGGGCCCTCCAGACTTTCCGTGTCGAGCACTCACCCAACGAGACCTTGACCCAGGCCAACGGCAGCTTTGTGCGGGCAACTGTGCATGACTACAGGCTGGTTCTCAACCGGAGCCTCCCCATCTCGGAGTGCCGCTCGCTGCAGCTGGCCGTGCTGGTCAATGACTCGGACTTCCAGGGCCCGGGGGAGGGCGTCCTCCGCCTCCACTTCAACGTGAGCGTGCTGCCCGTCAGCCTGCACTTACCCAGCGCCTACTCCTTCACTGTGAGCAGGCGAGCCCGCCGCTTTGCCCAGATTGGGAAAGTCTGTGTGGACAACTGCCAGGAGTTCAGCGGCATCCACGTGCAGTACAAGCTGCAGCTGTCCAGCACCAACTGCAGTGTCCTGGGGGTGGTCACCTCAGCCGAGGACACCACGGGGACCCTGTTCGTGAATGACACGGAAGCCCTGCAGCGGCTCGATTGTTCTCAACTCCAGTACACGGTGGTGGCCACCAACCGGCCAACCCGCAGGCAGACCCAGGCCCCGCTGGTCGTCACCGTGGAGGGGACGTATGTGGCTGAGGAGCCAGGCTGCCCCCTGTCCTGTGCAGTCAGCAAGAGGCGGCCTGAGTGTGAGGAGTGCGGCGGCCTGGGCTCTCTGACGGGCAGGTGCGAGTGGAGACAGGGAGATGGCAAAGGGATCACCAGGAACTTCTCCACCTGCTCCCCCAGCATCAAGACCTGCCCCGATGGCCACTGTGATGCTGTGGAGAGCAGAAATGTCAACATCTGCCCCCAGGACTGCCTCCGGGGCGGCAGCATCATTGGTGGGCACGAGCCAGGGGACCGCTGG
GGGATAAAAGCTGGCTTCGGTATCTGCAACTGTTTCCCTGAAGAGAAGAAGTGCTTCTGTGAGCCTGAAGACAGCCAGGACCCGCTGTGCGATGAGCTCTGCCGCACAGTGATCGCGGCGGCCGTGCTCTTCTCCTTCATCGTCTCCATGCTGCTCTCCACCTTCTGCATTCACCGCTACCACAAGAATGCCCACAAGCCGCCCGTCGCCTCCGCCGAGATGACTTTCCGCCGGCCGGCCCAGGCCTTCCCAGTCAGCTACTCCTCGTCGGGCGCCCGCCGGCCCTCCTTGGACTCCATGGAGAACCAGGTTTCTGTGGACGCCTTCAAGATCCCGGAGGATCCGAAGTGGGAATTCCCTCGGAAGAACTTGGTTCTTGGAAAAACTCTGGGAGAAGGCGAATTTGGAAAAGTGGTTAAGGCAACAGCCTTCCGGCTTAAAGGCAAAGCAGGATACACGACCGTGGCCGTGAAGATGCTGAAAGAGAACGCCTCCCCAAGCGAGCTGCGGGACCTGCTGTCAGAGTTCAACCTCCTGAAGCAGGTCAACCACCCGCACGTCATCAAGCTGTACGGGGCCTGCAGCCAGGATGGGCCACTCTTCCTCATTGTGGAGTATGCCAAGTACGGCTCCCTGCGGGGCTTCCTCCGAGAGAGCCGCAAGGCGGGGCCGGGCTACGTGGGCAGTGGAGGCAGCCGCAGCTCCAGCTACCTGGACAACCCCGAGGAGCGGGCCCTGACCATGGGCGACCTAATCTCCTTCGCCTGGCAGATCTCTCGGGGGATGCGGTACCTGGCGGAGATGAAGCTTGTCCATCGGGACTTGGCCGCCAGAAACGTCCTGGTAGCCGAGGGGCGGAAGATGAAGATTTCGGACTTTGGCCTATCCCGAGATGTTTATGAAGAGGATTCCTACGTGAAGAGGAGCAAGGGTCGGATTCCAGTCAAATGGATGGCAATTGAGTCTCTTTTCGATCATATCTACACCACCCAAAGTGATGTGTGGTCCTTCGGTGTCCTGCTGTGGGAGATTGTGACTCTGGGGGGCAACCCCTACCCCGGGATTCCTCCGGAGCGGCTCTTCAACCTTCTGAAGACAGGCTACCGGATGGAGAGGCCCGACAACTGCAGTGAGGAGATGTACGGTCTAATGCTGCAGTGTTGGAAGCAGGAACCAGACAAGAGGCCAGTGTTTGCTGACATCAGCAAAGACCTGGAGAAGATGATGGTTAAGAACAGAGACTACTTGGACCTGGCCGCGTCCACCCCATCTGACTCCCTGCTTTATGACGACGGCCTCTCGGAGGAGGAGACGCCCCTGGTGGACTGTAATAATGCTCCCCTCCCTCGAGCCCTCCCCTCCACGTGGATTGAAAACAAACTCTATGGTAGAATTTCACATGCATTTACTAGATTCTAGCAACATCGTTCCTCTCTGCACTATCCTTACTCTCTGTAATGCTTTTTAAGAGTGTTTCTGATCTGAATGAAACCAAAGTTCTCCCTGAACCTTTTTATTTGTAAATGTCTGACTTTGCATCCGTTTACATTCGGGCATTTTTGAAACTATGTTTTTTTAAAAGGATGTGAAAATAAGTATAATTACCACACTGCCCGGCTACTTATGATTATGGAGAAGAAAGGGAGCTGGGCAGAACTCTCAGGGGATATTGAGAAGATGATAAATAAGTCGTCTCTGGGGTGGGTATGTATCAAGTCATAGTACTTCTAATTTAACTACTGGGATAAATTTACCCAATCTGGGGAGGCAGTTAATTGAGACAGGAGGAGCCAGCACCACCCTGCCTGCACTGAGGGCACAGCCTGTGGTCACTCCCAGACCCCATCTGGGCGGGCAGGTGGCTCTCAGAGGCCACTTGGTACTAGGGAGCATTGGCCCGCCCGGCCTGAGCCCCGCCCACATGCCCACTATCAGGGAGGACACCTGCAGACTGCTGTTTTCACATCCTTTGCATTACACACTGTCATGACAGTTGTCAC
TCATGAAGTCAGTGCTAAAAGCTGAAGCAAATGCTTTTGAAAGAACATAGTCTGTGGTGCTGTGGTCTTGCAATGGACAGTAAATATGGTTCTTGCCAAAACTCCTTCTTTTGTCTTTGATTAAATACTTGAAAATTT\n>XM_028244121.1 PREDICTED: Camellia sinensis uncharacterized LOC114299398 (LOC114299398), mRNA \nACACCGACGACACGAGTCGTCGTCGCGAGTCGTGACTCATCTCATCTGCACTTCACAAGAAGTTAGTCACCAGACCCCCCCGTATGCACCATCATCAATCAATGTCTTTCCATGTATGAAACCCTAGCTTTGCAAAGCATTTTTCCTATTCAGGAACTAGGGTTTCTCTCTCTCTCTCTCTCTCTCTAAATTAGGGTTTCTATTTTTCTTCAGTCACTCTTGCGCGCTTTCTCTCAAACCCTCCATCGAATCAATTTTTTTTGTCTTTTCTTTTAATTTTATCGTTGTCAGGTAGTTTCCAGGAAAAAAAAATTGTAAATGCGAGAAATCGTAAGAAAGACGTTTTGACACAGCAGGTGCTTTCTTGGAAACCCCATCAAAGATTCCATCTATTTCCTTTCAATATCTTTGATGACAGTGAGGAGGAAGAGGAAAACACATGAAAGATTCGAGAATTTGTGCGAAAATTGTTGAAAAACCTAGGCACTAGTGTGAACTTCGATGGAGTCGACGCATGTGGTACTCGATATAAGCTCGGACGAAGATTATGATTATGATTGGATATCGGAGTTTTTGGACGATGCGGATGACTCTGATGAAGTGGTGGTGGTGAGTGAAGTTGTGGCGAATCACAAGCAGAGGTCGTCAAAGTCTTCTAGTGTTGCTGCTGCGAAGCCGAAAGATTTGGATGATGATTGTGTGGTATTGGAGGGTGATCCAGATAAACCGGTTGCGATCGAGATCGAGAACAATACGGAAGGTGATTCGGATGATTTGTCCATTGTTGGCGAGAAGGGGCAGATTGCTTGCAGAGATTACCCTCACGCTCGCCACCTCTGTGCTAAGTTTCCTTTCACTTCCTCTCTGCATGAGAGGCATTGTCCTCAGTGCCACTGCTATGTATGTGACTCACTTGCACCATGTGTCAATTGGGGCAATGGCACTTCCAGAAATGACCATTGTCACGCTACCGATAAAGATGAGTTCTGGAAATCTCAGAGGCAGAGTTTCAAGCAAGGGAATAAAGCCCCACTACCAGGTCCTAAATTTCCTGACACTTCTCGCTCAATTCGACCACCGCCAACAATCACACAGCTGCAACCAAAGAATCAGATCTCCAGGTCAGCCACAATCCGTGCTTGCTCTATGCCTACCAGTTTTGGCGTCCCAAATATCACAGATCAAGGCAGAAGCCAACAGTCTGTATATGTAAGAAACAAATTCCACCCAGATTTGGTCTCTCGGCAGTTGCTTAGTACCCGTAATAATATCATTCAAAGGGACAGAAGGTTTGGTAATTTAGGGCCTCCATATATCAATTCCCACACAATTTTCAAAAGGGCAGCAGGATCAACTAGAGTTGCTTTGGCAACAAATCGAACTAGATATGGCTCATCTGACAACAATTATGCAACTCAATTCTCCAGAAATCCCTCTCCTGTGGCAGCTTCAAATGATAACAATCCCACTAGGTGGCGAGACCTTTCAAGTGGAATGATTTCAGACTCAGAAGCATATCAGAACCTCTCCCAGCAAAACACTGGCAGCAGCTTGGAGAATTCAGTGCCTTCTCAACCCCTGTTATCCTCACATCCAAACATGGGCAGTGTCTTTCTGAATTCAGTGCCTTCTGGACCCCGACTGTCCTCCCAGCCAAACATAGGCTGCAGCTTTGTCGATTCAGTGCCTTCACCGCAAGTCTCTTCCCAGCCAAGCATGGGAAGCAATTTCGAAAATCCTTTGTCTTGTCAACCGCAAGTGTC
CTCACGGCCAAACATGGGCAGCAGCTTTGTCTATCCTGTGCCTTCGCAACCCCAAGTGTATAGTAGTCAGCCTATTCCTGCAGCAAATGATGGCCAATATGGCTTCCAGCAAGGAAACGAGACTCAAAGTGCTGTGGATCCAAGTTTTTCAGATTTTGACTCAAGTTGGGTTGCCCCAACTGGCTGCCAGAGCAACCAACCTTTGGCAGATAATTCCCTATTTCAAATTCCAGGGCTGACTTATCATCATCCTCCTCTTGTCACAGGGTTTGATCCCCAGATTCCTGTAAACACAAATCCAGGCTTACCGGACTTCCAATTTGATTGGATGTTGGAGAATCAATCTTTTTCTGGGGCCCTAGAAGTTCCTGTTCCTTCTGGATGCAATGTATACTCTCCGGAAACTGCCCCTGTTGATGATGTTGCGTTCTTTGATTTCTAAACCTCCTGGGAGTAACCAACCCATGTAAAAAGCCCTCAACCCTGCAAAGAATGAAAATGGCATTCCATTCTTTGGATGATATAATAGGGATTATTAGTAATTGGGTTAAAACATCAACAGTAGAACAGTTGTACTGTACAGTATTTTTTTGTTTTTAATTTTAATATGAGGTACATACTCAAGTAGCCTTGTTTTTACGGTTGCTTTAGGGATGTAGGGTGCCGGTGATGTAACATTATATATGAAATTCTCAGATTGTCATTTTTCTATCCAATCATTTTAGGCTCTACTCAAA\n>HM725485.1 Uncultured bacterium clone GB7N87003GN9MT small subunit ribosomal RNA gene, partial sequence \nAGGACGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAGCGGGGTCCATCCAGTGGCAACACTGGTGAAGACCTAGCGGCGAACGGGTGAGTAACACGTGAGAAACCTGCCCTGAAGTCTGGGATAACCCGAGGAAACTCGAGCTAATACCGGATGTCCCCACCGAGCCGCATGGTTTGGTGAGGAAAGATTTATCGCTTCAGGAGGGTCTCGCGGCCTATCAGCTAGTTGGCGGGGTAACGGCCCACCAAGGCATCGACGGGTAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCAACGCCGCGTGCGGGATGAAGGCCTTCGGGTTGTAAACCGCTTTCAGTGGGACGAAAACGAGACGGTACCCACAGAAGAACGCCCGGCCAACTACGTGCCAGCAGCCGCGGT\n>EF082344.1 Picea sitchensis clone WS0277_P22 unknown mRNA \nCCCCCAAAAATGAAAGAAGCAGAGGAGAGGAGAAAGCAAGAGGAAGAAGAGAAGCAAAGAAGAGAGGAGGAAGAACGGCTCAGATTAGAAGAACTAGAAAGAGAGAAAGAGGAAGCAAAACGCCGGAAGAAAGAACGGGAAAAGGAAAAGATCCTGAAGAAGAAGCAGGAAGGCAAATTGTTGACTGGCAAAAAGAAGGAAGAAGCTCGTAGGTTGGCTATAATGAGAGAACAATTTCTTGCTCAAAGTGGGGTTTCATCCGATATCTCAAAGGAGGAAAATCATGCTATGCCCAAGAAACCAAAGTATGAAACAAAGAAGAAGAGGCATGGTCCAATTATTTCTGATGCTGTGGCAGTTGAGCCTGTTGAGATTCAGCCAGATGTGGAAATGAAAGAAGCAGAGGAGAGGAGAAAGCAAGAGGAAGAAGAGAAGCAAAGAAGAGAGGAGGAAGAACGGCTCAGATTAGAAGAACTAGAAAGAGAGAAAGAGGAAGCAAAACGCCGGAAGAAAGAACGGGAAAAGGAAAAGATCCTGAAAAAAAAAAAAAAAA\n>KJ417285.1 Leucopaxillus eucalyptorum strain 
REH9110 voucher NYBG:01115433 18S small subunit ribosomal RNA gene, partial sequence; internal transcribed spacer 1 and 5.8S ribosomal RNA gene, complete sequence; and internal transcribed spacer 2, partial sequence \nGAAGGATCATTATTGAATAAATTGAGTTGGGTTGTTGCTGGCTCTTAGGAGTAATGTGCACACTTGACATTAATTTTATTTTACCACCTGTGCACTTTGTGTAGATTTGGGGGAAACTGTATTATTGAGTTGTCATGTGTATATTTGCATTTGGCTCTCGTTGATATATTATTTTCCAAGTCTATGTATTTTATATACCCCTATAGTATGTCAAAGAATGTAGTGAAGGGCATGAATGGCCCTATAAACTTAATACAACTTTCAACAACGGATCTCTTGGCTCTCGCATCGATGAAGAACGCAGCAAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACCTTGCGCTCCTTGGTATTCCGAGGAGCATGCCTGTTTGAGTGTCATGAAATTCTCAACCCTACAAAGTTATTTACTTTGTCTGGCTTGGATTGTGGGATCTGCTGGCTTGTTCAGCTCTCCTTAAATGTATTAGCAGAATCTTATATGGGTCAGCTTTTAGTGTGATAATTATCTACGCTATAAAGTGACTTGTTTGTAATTCAGCTTCTAATTGTCTGATTTTTGAAGACACCCTATGA\n>XR_007078499.1 PREDICTED: Homo sapiens uncharacterized LOC124906680 (LOC124906680), ncRNA \nCTCATGGCGGCCTCTGCAGGCCCAGCTGTTCCTCCTGGCTGCATCTCTCGGCCCAGCTCCTGCCTCCCAGCAGGCAAGCTCTTTTGGCTCAGCTCCCTCCAGCGTTTGTAGACCCCGAAGTTTCTGCAGCCAAGCTCTTCAGGCCCACATCCTGCCTCCCGGCGGGCGCGAAGAGCTTGGCTCGAGAAAGTTCGGGGCCTACAAAGGCGGTTTTGAGCTGGGCAGGAGTTGAGCCCAAAGAGCTTGCTTACTTGCTGGGAGGCAGGGCCGGGAGACGCTGACTTCAGGACGACTTGGGCCTGCAGAGGTCGCCAGGAGGCCCAAGCTGGGCGCGGAGGAGCCCACCGACCGGAGACCGTTTGGGGCCTGGAGACGCCATCGGAGGGCAGGAGCTGATCCTGGAGAGGCCACCGTGAGGCCTGACCTGGGCCTGGGGAGCTTGGCTTGAGGAAGCTGTGGGCCGACCAAGGCCGCCAGGAGATGGGCAGGCGCTGAGTCCAAAGAGGTTGTTGGGAGGCAGCAGTCGGGCCTGGAGACGCAGCCGGGAGGAAGAGCTGGGCCCGGAGAGGACGCCGGGAGGCCGCATGTGGGTCTGGAGAGGCCGACTTGAGGAGGCCCGGCCTCTGCCTCCCTCAGGGCGGCCTCTGCAGGCCCAGCTGTTCCTCCTGGCTGCATCTCTCGGCCCAGCTCCTGCCTCCCAGCAGGCAAGCTCTTTTGGCTCAGCTCCCTCCAGCGTTTGTAGACCCCGAAGTTTCTGCAGCCAAGCTCTTCAGGCCCACATCCTGCCTCCCGGCGGGCGCGAAGAGCTTGGCTCGAGAAAGTTCGGGGCCTACAAAGGCGGTTTTGAGCTGGGCAGGAGTTGAGCCCAAAGAGCTTGCTTACTTGCTGGGAGGCAGGGCCGGGAGACGCTGACTTCAGGACGACTTGGGCCTGCAGAGGTCGCCAGGAGGCCCAAGCTGGGCGCGGAGGAGCCCACCGACCGGAGACCGTTTGGGGCCTGGAGACGCCATCGGAGGGCAGGAGCTGATCCTGGAGAGGCCACCGTGAGGCCTGACCTGGGCCTGGGGAGCTTGGCTTGAGGA
AGCTGTGGGCCGACCAAGGCCGCCAGGAGATGGGCAGGCGCTGAGTCCAAAGAGGTTGTTGGGAGGCAGCAGTCGGGCCTGGAGACGCAGCCGGGAGGAAGAGCTGGGCCCGGAGAGGACGCCGGGAGGCTGCATGTGGGTCTGGAGAGGCCGACTTGAGGAGGCCCGGCCTCTGCCTCCCTCATGGCGGCCTCTGCAGGCCCAGCTGTTCCTCCTGGCTGCATCTCTCGGCCCAGCTCCTGCCTCCCAGCAGGCAAGCTCTTTTGGCTCAGCTCCCTCCAGCGTTTGTAGACCCCGAAGTTTCTGCAGCCAAGCTCTTCAGGCCCACATCCTGCCTCCCGGTGGCCTGTACAGTCCCAGCTCTGGCAGCAGAAGAGCGTCAGCAGGCCCCGCTGTTGCCTCCCAGGGGCGTCTCCAGGCCCAGCTCTCGCCCCACCACGGCCTCCCGCGGCCAAGTCCCTGCCTGCTCCCGGCAGCCTGCGTACGGCCCTGCTCCTCCCTCACGGTGGCCTGTTGAGGCAGGGGCTCACGCTGACCTCTCTCGGCGTGGGAGGGGCCGGTGTGAGGCAAGGGCTCACGCTGACCTCTCTCGGCG\n>XM_014708519.1 Ordospora colligata OC4 valyl-tRNA synthetase partial mRNA \nATGGAATCTGAGAAAGATGAAAAGAAAAGGATTAAAGAGGAGAAGAAAAGACAGAAGCTTGAGAAGTTTCTACAGAAGAAAACACAGGAAGTGAGTGTGACAAAACCCAGAGGAGAGTACAAATCAGGAGGATACGACCCTATGGAGATTGAAAGTAAATGGTATAAGTACTGGGAGAGCAATGGTCTTTTTAAGCCAATGCGCAGTGAGAAGAAGTATGTTATTCCCATTCCACCGCCAAATGTGACTGGAAATCTGCATATTGGGCATGCTATGATGGTTTCTATACAGGATGCGATATGCAGGTATAAAAGGATGTGTGGATATGAAGTTCTGTATATTCCCGGGACCGATCATGCAGGAATAGCAACACAAAGTGTTGTTTCTAAGCAATTGGCCAAGGAAGGAGTGGTTGATGTTGATCGAGGAAGGTTTTTGAAGAGAGCATGGGAATGGAAGAATACGCATGGAAGTAAGATATATGAGCAGTTTAAGAGACTGGGTACCAGTGTTGATTTTTCAAGGGAAAGATTTACTCTTGATCCTGGGATGAGTGATGCAGTTAGTGAGGCTTTTGTGAGATTGTATGAGAAAGGACTGATATACAGGGAGCCAAAGATAGTGAATTGGTGTGGGAAGTTGTGTACGACTATAAGTGATCTTGAGGTGAATCATGAAGAGATTGAACCGAATACTGTTATTCAGGTTGATGGAGGTATGTATGAGTTTGGAGTCATTTATCATGTGAAGTATCCATTAACTACATGTGCAGAATATAAAGGATGTGTTAGTGAACTACCAAGTGTTGAGATAGCAACCACAAGACCTGAAACGATTCTTGGAGACACAGCTATATGTGCGAATGCAAATGACGAACGATTTGGCAGTGATGGGATAAGGAAGATGTTTGGAGATGTATCTCGAGATACAAAGGTGTATGGAGTGAATCCATTGACAAAGAGAGTGATTCCTGTGATATTTGATGATTATGCAGACATGAGTTTTGGAACGGGCGTACTGAAGGTGACACCTGCACATGATGCAAATGATTTTGAGTTGTCTAAGAGACATGGGCTTGAATGTATTGTTGTATTTGATGAAAATAATAAAGTGAGTGTTGAGGGAGAGTTTAAAGGGCTTGGAAGGTTTGAAGCTAGGAAGGCGGTTATATGCGATCTTAAGTCTATGGGACTGTATGTGGGTAAGAAAGGACATCCTCAAGTGATTCCAAGATGCTCTAGATCGAATGATGTTATTGAGCCTATGATCAAAAGTCAGTGGTGGATGGATTGTAAGGAGATGGCAAGAAAAGCAATTGATGTGGTT
AGGAATGGTGAGATGGATATTCTACCACCAGGTGCTGAGAAGCAATGGTATAAGTGGCTTGAGAATATAAGAGATTGGTGTTTATCAAGGCAGTTGTGGTGGGGACATAGGATACCAGCGTATAGAGTATCTGATGGACAGTGGGTAGTTGGAAGAACGAAGGAAGAGGCGTATGAGAAGATGAGAAAAGAGTATCCTGAGTGCAAGTGTACAATTGATGAAATGGAGCAGGACGAGGATGTATTAGACACCTGGTTTTCATCTGGGCTATGGCCATTTGCAGTGCTTGGATGGCCTAATATAGCAGATGATTATGCGCGATATTATCCAACTACGCTTCTTGAGACTGGTAGTGATATTCTTTTTTTCTGGGTTGCCAGGATGGCAATGCTAGGGATAGAACTTACGAGAAAGATCCCGTTTGATCAGGTTCTTCTGCATGGGATAGTTAGGGATGCACATGGAAGAAAGATGAGCAAAAGTCTTGGGAACGTGATAGACCCGATATTTGTGATAGATGGATGCAGCTTGAATGAACTTATTGCAACGATGAAGAGTGGAAACCTTGATGAGAAGGAAGTGAAAGTTGCTGAAGCAGCTTTGCGTAAAGACTTTCCGAACGGAATACCTAGATGTGGTGCAGATGCACTTCGTTTTACGTTACTCTCTTACACTTCAGGAATGAAAGACATTAATTTAGATGTGCTTAGGGTTGAAGGATACAGAAGGTTCTGCAATAAGATTTGGAATGCACAAAAGTTTGTTAAGATGATGGTTGATGAAGCAAAGGATTGCCTGAGCTCTGAATGTGGATATGCAGAGTATACTTTAAATGTCTCTGACCTTACTAATGGATTTGATTCTGGGCCGATTGAATGGATCCTTATGAAAAGAAACGAAACAATAGAGTATGTCAAAGAGATGATGGAGATGTATAAGTTTATGGAGGCAACACAGGCAATTCATCAGTTTTTTATGTATGACATTTGCGATGTTTTTATTGAGATTGTGAAAGGAAACAAGGAAAAGATGTATGTCAGTGTCTTACTGACAGTGTTTATTGACTCTATGAAGATATTTCATCCGTTCATGCCTTTTATTACTGAAGAAGTGTTTTCAAGCTACTTTGATACATCAATTTCAACATCGGAATATCCAGTAAGTGATGGTAATGCTCACAACAATAATTTTGGTGCAACATTACAACTGGTGAAGCATCTGAGAGGTTTATTGGAGACGAATGGGCCTGGAGGAATGAATGTGCTTGAGATTGTCCCTGGACCTGAGATTAACCACCATGATTTGAAATTTATCCATCTGCTTTGTAGAAGGATATGCAGTGTTGAAATATTATGCGATTATGACGAGAGGTTCTTGGACTTCGGAGGCACAAAAGCATATCTTCGGAAAATTGAATAA\n>XM_039636903.2 PREDICTED: Drosophila santomea uncharacterized LOC120452602 (LOC120452602), mRNA 
\nTCCAGTATTCTATCAGTATAGAAAACAACACACACACACTTTGTAGACACGCGTAAATAATTTTTCGAAATTTGTACTTTTATGCGTGCTATTCTTTTTCGACTTTTATCTTAAATATATTACCATTTTCAAACTATAAAGAACATATTTACAATCACCGAACCTCAAAATGCCGCCCGTTTTAAAACGGAGTCTACGGAAAAGATCAAAACCAGTTCAAGAAACTCCAGCCGAAATCAAGAAGACGAGTACGCTTTCGAAAATAATCATTCAAGGCACTGAACAGCTGTTATTGGATTCTGAAAATAATCCAAATATTCGAGTTATTGAAAAACCCAGAAAAATGCGGTATTCAAAATCATCGATTCCCACTGCGGAACCGGATTTCCAGCTGCATTCCACACCGAAAATTGGTAATCTGGCAAATAAAAGCAACGCACGCGGGATGTTTGGTCCGATCAAAAATAAACAGACATCCATAGAAGCTATTTCTGAAATTAGTGATATGTCCATTGCTTCAGTGTCGGTGAGGAATCAGCCGTTTGTGAACTTTCTCCAGGATTTCTGCATGACTCGTGGTTCCGATCCCAGAGAAAGTGTTCAAGAGGCCATCGCCAAATGGGATAAAATGACACCCAAACAAAAAGCAGAATTCAGTCCAGAAAACTACGTTCTAAAATTGTGTAATCAAGTGCAGAATCGTAATGAAATTTTAAATGCGGTTGCACTGCAGCCGGTTTATGAAACTACAAAAAAAAATCAAAATGGATTTAATAAAGCCAGCAAGGTCAAGAGATTGTCTCCAAAGCTACGTAAGTTGACAAAGCGATTAAACCCAAGACCACGAGGTGTGGTGAGTCCCAGAAAATCAATTAAAAATGCGGCCAAAAAGGAGGTGCCTCCAATGGTGTCGGTGCGTCTAACTAATAGTGCTTCGGCTTACAAAAACTTTCTGCGCAAAGTCCGTCAAGCAAATCCTGGTCTGATGTCCGTAGAAAAGACCTCCCTGTGGCGCAAAATGACTCCTGCCGAAAAGGATCTCTATCGGGTAGTCAGCAAGCGAAGCCAAGAGAAAACCAATGTCAAGAAAACCAAGTTAAGAGCTCTAGCTGCCAAACGCGTAAGGAAGCAAAGAACCTCACGATCAACCCAGATGCCTGAAAATGCTTTACATTATTTGCAAAGCAGTTTCGATATTCAGCGAGATGGCCAACTAGAAATTTGGAACGAGAGCAACACTTTGCTACGGGATAGTCAACGCTCCTGGGTCACACTTGACTACATTTCAAAAGCCTTTGAAAAAGTGAAGAATATATTTAGTTAACTACTTGTTGTCCAAATTTTATACAAAACATATGTAATTGCTATAAAAAAAACTGCGTAGAAACATA\n>XM_045247888.1 PREDICTED: Portunus trituberculatus adhesive plaque matrix protein-like (LOC123499604), transcript variant X2, mRNA 
\nGGCAGGATGAGGGTGGTCACTTGTAGGAAGAACACGAGAGGAGGAGGAGGTCATGACGAGGTTCACAGGACGGTCGCTGGTGGTGGTGGTGGTGGTGGCGGTGGTGGTGGTGGTGGGAGTGGCAGGGGAGAAGCTGGAACACGGTCTGGAGCTCATCACACGGGGGGAGCTGACGGGGGAGACAGACTTTGCGCCCCAGGGGAGGGAAGATGAGCGGACCAGCGCCCACCGAAGCTTTCCCGCGGCGCCCATAGCCCTCACCTACCTGCCGCCCATACAGAGCCCCTTACCCATAGAGGAAACACAGGGGACCACCACAGGCACCAGCGCTACCCCGGGGGAGGTCTTCGTGGCTCCTGACCATGGGGGAGAGATACTTAGACCATTCAACCAAGCAGGGTCACACCTCGAGCAGACCAGCCAACAGCACCACCACCACCATCACCACCTTGGCCCCTTTGAGTCCTCCCAAGAGAACACGCCCTTCCATACAGAGTTCCAGCCCTCAACAAGTGACCAGGACCCAGACGCCCTCCCAGCTGTGGTCCCAGGCCTGAAGAGCGCAGTAACAGCCAAGACAGAAGCATTTGGTACCCTCACGAAAGCTGCACCGTTTGAACACACCCCCCAAACTGCACCAGCCCCCGTGGTACCGTACCCGATCTACCCGCCGTACCCCAAGCCCCAGCAGACGTACCCCCAGCCTTCCTACGTGTACCACAAAGCCTCGTATCCTCAGCCAGTGTACCATAAACCAGTGTACCATAAGCAAATGTACCCTGTAGTGGTGTACCCTGGATATCATCAGTACCACGCCAAGCCGAGCCCCCTGGAGGCGTTGAAGGCTAAGGTGGAGGGCTACGTGGAGACTAAGAGAGCGGCTGTGAGTGGAGCGCTGGCCAAGGTGGAGGAGGCTAAGGCGAAGCTGGACGCAAAAATCAAAGGTCTTTTTAAACCCACTTCCTTGAAAAAAACACCTATTCCATACCCTTCCAAGCCCCTTCCAGCCCCGTCTGCACCCTTCTACCCCTTCAGACCCTATCTCAATGTGCCCCTGACGCCTCACAAGGGGTACTCCATCAAGGCCACCCCTGCCAAGCCCCTGCCAGCCCCTGTACACCACGTCAAAGGCCCGGTACCAAAACCTTACCCTGTGAATGTATACCCAGCCATACCACAGCCTTCCCTTGCTACTACCCCTGCTCCTACCCCTGTCCCGATCCCTGCCACGCTTCCTGCCGCTTCTACAGGCCCCCAGATACCCCAGGAGACCTACCCCATGGCCACAGCACCCCAGTATCAGCCTGTGTATGCAATTTACCCCGTGGCAGCCTCGCCTGACGTGGGACTCAAGGAAAAGCTGGAGGCGAAGAAGAAGCAAGTGATGGGAGCGATTACAGGCGCGTTTGCAAAGTTGAAGGCGCCATTCCAGTACCTGCACCCTTCCTACTCCTACTACTACGCCCCCCAGCATTGGTAGAGGCGCGGCAGGGGCTGGGAAGGCGGCAGGGGGTAAAAAGCTAAGGAGGTATTGGATTAAGCACGTGGTAAGCAGACGCCTTTCAGCCGCCCTGCTCGTGACGTCATCTTAGAGACCGCGGGTGTAAACTAAAATTAAATACATTGGGTTAAAAATATTAGTAATCTGAGCCTATGTTAGTTTATAGTGTGTAATATTTTGTTTATTAGTTAATCTTCTATATAATGTTAATTTGTAGGGTTATGATTGTTATTCTTAAGAGTTTTGAGATTAAGTTTATATTTTATTTTTGGGGTTTTGTATGTAAGGAAGGTACTGGCTAATGGAAGACAAAAAAATGAAATATATAAAAAAAAATGAGTTTAAATGCCAGACCTAACATGAAAAGCACCAAAAGGATTATGAAATTTGGAGAAGTGTTCGATAATAAGGAACAAAGGTACGATGCAGCGAGGAGAGCGCGGCATTTTCAAAACACTGCTAGCGCGCTCCTTTTTAGCCAAGTAGAAGTGAAAAAA
AAAGTGCTAAATATTTTTCTAACTCTTGTTATATGTTAATAAAAAAATAAAATAGTTGTTTTT\n>MH123473.1 Homo sapiens isolate NUB087 cytochrome b (CYTB) gene, partial cds; tRNA-Thr and tRNA-Pro genes, complete sequence; and D-loop, partial sequence; mitochondrial \nGGGCCTGTCCTTGTAGTATAAACTAATACACCAGTCTTGTAAACCGGAGATGAAAACCTTTTTCCAAGGACAAATCAGAGAAAAAGTCTTTAACTCCACCATTAGCACCCAAAGCTAAGATTCTAATTTAAACTATTCTCTGTTCTTTCATGGGGAAGCAGATTTGGGTACCACCCAAGTATTGACTCACCCATCAACAACCGCTATGTATTTCGTACATTACTGCCAGCCACCATGAATATTGTACGGTACCATAAATACTTGATCACCTGTAGTACATAAAAACCCAATCCACATCAAAATGCTTACAAGCAAGTACAGCAATCAACCTTCAACTATCACACATCAACTGCAACTCCAAAGCCACCCCTCACCCACTAGGATACCAACAAACCTACCCTCCCTTAACAGTACATAGCACATAAAGCCATTTACCGTACATAGCACATTACAGTCAAATCCTTTCTCGCCCCCATGGATGACCCCCCTCAGATAGGGGTCCCTTGGCCACCATCCTCCGTGAAATCAATATCCCGCACAAGAGTGCTACTCTCCTCGCTCCGGGCCCATAACACTTGGGGGTAGCTAAAGTGAACTGTATCCGACATCTGGTTCCTACTTCAGGGCCATAAAGCCTAAATAGCCCACACGTTCCCCTTAAATAAGACATCACGATGGATCACAGGTCTATCACCCTATTAACCACTCACGGGAGCTCTCCATGCATTTGGTATTTTCGTCTGGGGGGTGTGCACGCGATAGCATTGCGAGACGCTGGAGCCGGAGCACCCTATGTCGCAGTATCTGTCTTTGATTCCTGCCCCATCCTATTATTTATCGCACCTACGTTCAATATTACAGGCGAACATACTTACTAAAGTGTGTTAATTAATTAATGCTTGTAGGACATAATAATAACAATTGAATGTCTGCGCAGCCGCTTTCCACACAGACATCATAACAAAAAATTTCCACCAAAGCTTCTGGCCACAGCACTTAAACACATCTCTGCCAAACCCCAAAAACAAAGAACCCTAACACCAGCCTAACCAGATTTCAAATTTTATCTTTTGGCGGTATGCACTTTTAACAGTCACCCCCCAACTAACACATTATTTTCCCCTCCCACTCCCATACTACTAATCTCATCAATACAACCCCCGCCCATCCTACCCAGCCGCTGCTAACCCCATACCCCGAACCAACCAAACCCCAAAGACACCCCCC\n>XM_026551140.1 PREDICTED: Papaver somniferum ketol-acid reductoisomerase, chloroplastic-like (LOC113302251), mRNA 
\nGAGTCAGTTGGCTCCCTGCAATCGTTCTGGCGGGATGGAGTTGAACAGTGAGTCGAAGTTAAAAGTTTGAATCTTTTACTACCTCGTATAGAAGAGTCCAAGGGAGGTAAAAATATAGAAGAGGAGGAGTTATGGATTAAGTAACCGCTGTATCCGCACTGAACTGCAGGAGAAACTTATCCAGATGAAATTCGTGTGATTATGGATTCGTTTGGGTTTCATTTCCGCTGATTTGAATTCCTATGATATACTTGCTGTATTTGGTTAATTCTCAAGTAGAATTTGTTACTCATGGGAACTTCCACTCCGTCCATAGCTTCTTCTTGTTCATTTAAAACCCTAAAACTACTTCACTCAACATCCTCCTCTTCTTCTTTGGGTTTTAAAGTAGGGTTTCTTTCTTCATCTTCTAAAACCTTAAAATTTCTTCTTATTCGTGTTTCTAACAACAGTGTCTCGTTCCCTATTGGATCATCTCTTCTTGCATCTCGTATGATGGTTTCAGTTCCCGATACTAAACCTTTGACTGCTCTTGATTTTGAAACCTCTGTGTTTTACAAGGAGAAGGTCACTCTTGCTGGAAATGACGAGTATGTTGTGAGAGGAGGAAGGGATTTATTCCATTTGTTGCCTGAAGCATTCAAAGGAATTAAGCAGATTGGTGTTCTTGGTTGGGGTTCTCAGGCTTGTGCACAAGCTCAGAACTTGAGGGATTCACTTGCAGAAGCCAGATCTAACATTGTTGTCAAGATCGGATTGAGGAAGGGATCCCGTTCTTTTGCTAAAGCACGTGCTGTTGGTTTTACCGAGGAGACTGGAACTCTGGGTGATATATATGAAACAGTAGCAGAGAGTGATCTTGTGCTGCTATTAATTTCTGATTCTGCACAGGCAGATAATTATGAGAAAATATGCTCCCACATGAAACCTAACAGCATTCTTGGACTCTCTCATGGATTCCTCCTTGGACACCTACAGTCCCTAGGGCTCGACTTCCCTGAAAGTGTGAGTGTGATAGCTGTGTGCCCCAAGGGCCTGGGTCCGTCTATCAGAAGACTTTATGTTCAAGGGAAAGGGATAAATGGTCCTGGAGTTAATGCAAGTTTTGCCGTCCACCAGGATGTTGATGGTAGAGCAACAGATGTCGCCTTAGCATGGTCTGTTGCTCTTGGTTCTCCTTTAACATTCTCCACTACTCTGGAACAAGAATACAAGAGAGACACTTTCGGAAACCAGGATAGCCAGGAAACTGAAAGACGGAGAAAGATAGGGTTTGCAAACAAAGGGAGAACACCATGGAACAAAGGAAAGAAACACAGTGCCGAGACTCGTAAGAAGATCAAACAAAGAACCATAGAGGCACTGAGTGATCCCAAGGTCAGAAAGAAGATGTCTGAGTGTCCCCGTGCTCATAGTGAGGAGAACAAGATAAAAATAAGCATTGCTCAGAAGAAAATGTGGAGAAAACGCTTGCAGATGAAAAGACTGAAGGATGAGTTTTATCTGAAGTGGGCAGAAAGAATTGCAGAGGCAGCTAGGTTAGGCGGCTGTGACCAACAGGAACTAAATTGGGATAGCCATGAAAAGATCACAGAGGAATTGGTTCTTAAACAGCTTCAGTTGACTGCAGATAAAGCAAGGGAAAAAGAAATTGCAAAATTAAGAAGAGCTAGAGCAGCGAAGGAAAGAGAGGAGAAAATGGCTAGAATTGCCCAGAGGAGAAAAGAGAGGATAGAAAAGGAGAGGGAAGAAAAATCAAAACCCAGAGTAGAAATAAAGAGAAAGACACGTAGAAAATCAGAAAAAGAGAAGCAACTACTGGCTCTTTCCAAGGGCTCAAAACTCAAGGAAAAATTGACGAAGATTCGCCGTAAGAAGACTGTTGATGGTCAAGGAGTAGTGGCAACCGGCAATCAACCAGCGATTGAGAAATTGGATTTAGAGTTTATAGAAAGAGAGAAACTGCGGAAGGAAGTGTCTCTTGCGGATCAGATTCGA
GCTGTAAAAAAGATGAGAGAGGAGTTAAACAAGGAACCTCTTGCCAGAGCCATCTTATAGATTAAGCCAGCTAGATCATTTTCCTAGTCGAAGTGTTTAGGCTTGGGCTGCTATACATGTCAAAGTTGATAGGCTGAAAACTAAATTAGAAATAAGAACATGAGTTGATCTAGGCTTAGATTTGTTTTTGTTTTTTTTTCCCTCATTCTCCTTGTAAGAACAAATAAGAGCACCAACATCGTCTACCTTCTTTTATCAATCAGTTTTGAAATTGTTGAAGGAAAATGTTATGTCGTTGGGTAATAGATTTGTCCAAAACTTACACTTGGGCACCAACGTATGTCCAGGTGGTTATTATTGACCAATTGAATTTGAAAAAGATATT\n>OK585766.1 Setaria viridis SvmiRp606 miRNA gene, partial sequence \nTCGGACCAGGCTTCAATCCC\n>XM_008174878.2 PREDICTED: Chrysemys picta bellii olfactory receptor 52R1-like (LOC101936597), transcript variant X1, mRNA \nATGTCAGATTCCAACACAACCGAATTCACCAACCCCTCCACTTTCATCCTGCTGGGCATTCCTGGCCTGGAGGCAGCCCATGTCTGGATCTCCATCCCCTTCTGCACCATGTACACCATAGCCATCTTGGGGAACTTCACCATCCTATTCATTGTGAAGATGGAGCCGAGTCTCCATGGGCCCATGTACTATTTCCTTTGCATGCTGGCCGTCACTGACCTGGTGGAATCTACGTCCATTGTGCCCAAAATGCTGAGCATCTTCTGGTTCAATTCGAGAGAGATAGATTTCAATTCTTGCCTCACCCAGTTGTACTTCATTCACTGCTTCTCAGTGATGGAGTCTGGGATCTTCTCAGGCATCTTTGTGGCTATGGCTTTGGATCGCTACGTGGCCATCTGCAATCCCCTGAGACATTTCACCATCCTGACAAACTCCATCGTGGCCAAGATTGGCCTGGCCATGATGCTGCGCAGCGGCTTGCTTGCATTGCCCTATCCCTTCCTGGTAAGACAATGGCCATATTGCAGAACCAACATCATCCCCCAGTCGTACTGCGCACACATTGCCGTGGTGAAGCTGGCCTGCACCGACATCCGCGTCAGTAGTTACTATGGCCTCTTTGTGGTATTCTGTGTGATGGGTCTGGATGCGATTTTTATTGCCCTGTCCTACTCCCAGATCCTCAGGGTCATCTTCAGCCTCCCCACAAAGGATGCCCGGATAAAGACTTTTGGGACCTGCATCTCCCACCTTTGTGCCATCTTAGCCTTTTACATCCCAAGTCTCTTCTTCTCCCTCATGTATCGGTTTGGCCAGAATGTGCCCCTGCATTTCCACGTTCTCATTGCCAACGTTTACCTCTTGATGCCCCCCATGCTAAATCCCATCATCTACGGGGTGAGGACCAAACAGATCCGGGACAGGCTGCTCCGACTCTTTACTCATAAAGGGACCTAA\n>XM_013231282.1 PREDICTED: Biomphalaria glabrata lipoxygenase homology domain-containing protein 1-like (LOC106071234), partial mRNA 
\nGATGACATTGCCACAGATTGGAAAGTTGATAATCTTGTCATGGAAAATCCTAGCACTGGTGAGAAGCACAGCTTTGAGGTGAACAGATGGCTGTCCCATAAAGAAATTGATGGAGACATTGTATTTGAAGGTGCAGTCAAACAGCACAACCAACCAGTTGCTTCTACTTGTAAATACATTGTTAAGACCATTACTGAAAGTGAAGAAAATGCAGGAACTGAGGCTAATGTGTATATAAATCTTATAGGAAATCTAGGGGATTCTGGAAAAAGATTTCTAGTGAACAGCAGTAATGGAGGTGAAAAGTTTTCAGCAGGAAAAACAAACTATTTCACTATTGAAGCAGTGGATCTTGGTGATCTAGAAAAAATAGTCATTGGTCATGATGGAACAACACCTGAAGATGCTTGGAAACTTCTGTGCGTTATGGTTCGCAAAGCTGACTCTGCCAACAGAGATACTTCTGTGTTTCCTTGTGGAAA\n>XM_017243286.2 PREDICTED: Drosophila bipectinata nuclear transcription factor Y subunit gamma (LOC108126631), mRNA \nTTTCACCCCTAACTGGAGGCTGCCACACTGTTCGCGTGTATGTGTGCATTGCGCATTTCGTTGATTTTAACAAAATTTTAGCCTTCCAGCCGGCTGTGATAGCCAAACCGTTGCCGTCACCGCACCGCAGATCACGTGAGTCAACCGGGACATGTACGCCACCAACAACGGTGGCACAAACAAGGCGCCAAACAGCAATGCCAGCACGCTGTTCGAGAACACCATAACCGTGACGCCAATTAAGGTGGAGTTGGGCACAACGTATGGCGCCGGAAAGCCACCCACACCGGCGCTACAACGAAGGACGCCCAATGCCGTGGTGGTGACCACTAGTAATCCGCAACAACAGCAGCAGCAGCAGCAGCAACAACAGCATCAAACTGGTGCCGGAACCACCACTCTGAACCTGCCCATGCAAGCCACCCTGGTCTCGAATGCCTGCACCATAATGAATCCCAGCCTGAGTGTGACTGTGAATACCACCACCACTGGAGCCCTGGCCAAGGAACCGAAGGGTAAAGCAGCGCGGGCGCAGGTGGTACGGAAACCGCCGCCTACCATCGACAACTTCTGGCCGAATATCGTGAACGAGGTGCATGCAATCGGGCAAGTGGACGCCAAGCATCAAGTCTTGCCACTGGCGCGGATCAAGAAGATAATGAAGCTGGACGAGAATGCCAAGATGATAGCGGGCGAGGCGCCGCTGCTGTTTGCCAAGGCGTGCGAATACTTCATCCAGGAGCTGACGATGCACGCGTGGGTGCACACCGAGGAGAGCAGACGTCGCACGCTCCAGAGATCGGACATTGCCCAGGCGATCGCCAATTATGATCAGTTCGACTTCCTTATTGACATTGTGCCGCGCGAGGAGATCAAGCCGTCGTCGGCGCAGAAGAGCAAGGATGCGGGTGGATCGAGTACGTCGAGCGGGAGTGCCACAGGAGTTACCTCATCCACGTCGTCCGGCACCAGTGCCGGCGGTGTCGTCAGTTCTTCCGTCAATGCATCTGCAGCTTCGGTCACGGGATCGGCTGGAGCCGCTGGGAATTTCGTGGTCGGAGCCACTGCTGTACCTGCTGCCAAGATGGATACGGGTGGAGGAGCCACCGCTACAGAGGTACTAGGCTTTAGCACGGTCACGCCGGACCTGTTCGCCACGCAACTGCAGCAGCAGCAGCAGCAGCACGTCGCCCAGCAGCAACAGCAGCAACAACAACAGCAGCAGGCGCATCCACAACAAGTGCAAATAATCCAGCAGGCCGGACACGGCGGCGCCCAGCAATTGCAGTACTTTATTGCGCTGCCGGGCCAGCAGACGGCACAGCCGGCCCAGAATCATCTGGCCAATAGTCTGGGCCTCAACATTGTGGCCGCCCAACAGCCCGCCCAGCAGCTG
ATCCTCACCGCGGGCCCCAACGGCCAGCTAACTGCCACCCCAGCCCCCGCGGCCACGGTGCAGCAACAACAGACGGCCCTGCTCCAGAATCTCGCCCAGCAGCAGCAACAGCAACAGCAGGCCCAGCAGCAACAGCAGCAGATCCAATTGCTCCAGCAGGTGGTCACTCCCACGGGGGAACTGACCAATGTCCCGATTGCAATCAATGCCAACCACTTGCATCTGCTCCGGTTGCAGATGCAGCAACAACAACAGCAGCAACAGCAACAACAGCAGCAGCAACAACAACAGCAGGTGATAATACCGACACAGTTGCTGACGGCACAACAGATACTCCAATTGGGCGGAGCACCCGCTACCGTTGGACAGCAGCAGGCGCAGGTTCAAGTCCAGCAGCAGCAGCCACAGGTGCAAGTTCAAGTCCAACAGCAGCATCCAAATCTCAGTCAGGGCAATGCCAGTGCCACGCCCATTTTTATAAATTCAACAGCGACACAGCAAGTGGCGCAACAGCAGGCGCAGCAACAGCAACAACAACAACAACAGGCGCAACAGCAACAACAACAACAACAACAACAGCAGCAGCAACAACAACAACAACAGAGCAACATGGCCGGGGAAAGGACACTAACCGGAGGATTTCGGTAAAAGGAGCTCGCGCTGAGCGTGCACTGGTCGTGCAATGGTAACCATATCGAGGCATGGGTGGGAAAGGTCCAGCACAATTTGTATAATATATAGTTTACGTTTGTATATCGGAAAGAAGATTATATATATAGTTAGTGCTGTAAGTGTAGAAACGA\n>XM_002365330.1 Toxoplasma gondii ME49 Ctr copper transporter family protein mRNA \nAGAATTGAGTTGGTGGTTGTTTTCGATGGAAGGAAGCGAGAGTTTCGGAAGAATTCTCGGAAAAGTGGATGTCAACCTGGCAATTCTGTCCCGTTCGCGGGGGGCTCTCCTTTTCCGTGCAAGCACGCGTCCACCTTGATCTCGCGTTCTGCGCTGTGGATTGCAGGAGACGTGTAAGGCAGGCGCCTCTGTTTCCCCGCGGGAGGCACAGGCGATGCAGGAAGCGTCTCCTTTCACGACACCTTGGCAATTCACGAAGGAAATTCCCGTCTGCCTTGTCTGACTCAGGTGGCAAAACTCTTCCTGCGTTCTTGCTGCCTCTGAGTCGAGGGTTTAGGGACTTTTAGGGTTTAAGCCTTCAACTGCCGAGGGCCCCCCCGCGAGTCAAAGACACACGCCGCGTGTCTCTCCTGTGGCGACTCTCCGCGAGAGAGGAAAGAAAACTTCACAAGAATCATAGGCTGAAGCGAACCTCCGATTAACAAGTGTGTGCGCTCCGTGGGGAGAGAGAACGCGTTCGAGAAAGACCTACAGAGGGCAGACCAAGAGAGTCAAGATGGCAACGCACGCTCAGTCAGGTGCTTCCTGCTCTCTGAGCACTTCTCCGAGATCTGGACGCGAAGGAGGACAGAGAAAGACGGAAGCCTACCTTCTGTCCCTCCGCAAAATCCCCAGTTCCAGACGGCGAGGTCTTCCGACCGGTCCTCAATCAAAGGCCTCTCTTCTGCGAGTGTCCACGTTCTTCCTTGTTTGCGCGCTTCACTGCGTGTCTTCTCTCCCCGGCGCTCTGTCCTCCGCCTCGAACTCTCCCGTCTCTTCTGACAACGAGGTGCCCGACCCTCAGCGAAACCGTGACAGCTCAAAACCTTCCAGTTCCGATGCTACGCCAGATAAGACGCATGACAAGCAGCGGCCGAGAAACAGGTATGAAGATGTCGAGGACTGCTGCAAGGGACAGAAGAAGCGCGCTGCCGACGACGCTTCTGCTGCGAGAGAGGCGGACGGAAAAGAGGAGTCTTGCTGCGACAAGAAAGGCGCTGCCGGAGGGTCGGGCGGAGAGGGACCTTCCAGTGAAGGAAAACAGTCCTGCTGTAAAAAGAAGAAAGCAGTG
GCTGCGGAAGGAACCGCCCACGTCGCTGCGGAGGGACATAAGTCCTCTTGCTGTGGGGTCATGCCCATGTCTTTTCAAAACTCGCTGCACACCGTGATTCTCTTCCACTCATGGGAGACACTCGAGCGGTGGCAGTACGTGCTGTCGCTGCTGACGTGCGTGGTTCTGGGGATGCTCTCCGTGGTTCTGAAAGTCCTTCGCCTGCGACTCGAGTTCTTCCTCGCCAAGCGCGACCGCGCCGCGGAGGACGCCCAACGAGTCGAGAAATTGAAGGAAAAGGAAGGACAGAGTTCGGCGGCTTCTCCGTCTTCAGCAATTGTCGAACGCCTTTGCGGGAATTTCCCTCTGAAGCAAAACTCCTGGCGGATGCTGGAGGCGTTCGTCATCTACGGGTACGACTACCTTCTCATGCTGATCGTGATGACCTACAACGTAGGGCTCTTCTTCGCTGTCACGGGAGGCCTCGCTCTGGGCTTCTTCTGCTTCGGGCACCTCCTCAGAATCCAGGCAGAAAAAGAAGAGAACTCGCTGGAAGAAGACTACCGCGGGGACCCCTGCTGCTGCGGAACATAAGAACTGGAGACAAAAAGAGAAGACGAAAGGTGTTGGAGACCGAGAATGAAGGAAGAGGAGACAGAGAAAGAAGGAAAGGGAGACAGAGAAAGAAGAAACTGAAGAGTGGAACTAGGAGAGACCACAGGAAGGCGTGGAGCTGGAAATTATTCCTTTGAAACTGGTAGCAGAGCAGGGAGGTCCCTTGAACTTTTGGATTTAAAACATCCTTTTTTTAAAAGCCTCCCTGAGGGAAGAAGCTGGAACGCAGGGTCAAGAGACTAAGGTTGCCGCGTGGAATCGGTTGATCCGCCGTTTTTGTGTAGAACTGCATTCTTTACCGACGCGTTTCAGCGCGTTTTTTGCCGTCGGGGAAGAGTCGAGAAGGGCGCACACATGCGTGTACAAGATGCACACAGACTGTGGCCCTCGTCTGTTCTCCAACAGACCGCGTTTCAGAACGAACATGTAGAATACGCACAGAGACGCGTTCAAGCCTCTGCGCCGGTG\n>XM_037418793.1 PREDICTED: Rhipicephalus microplus uncharacterized LOC119167324 (LOC119167324), mRNA 
\nTGCAAGAAACTACGTACATCATGGTCTCGAGAACTTCCTCCGTATAAAGGTCCAATCGTAGCGCTGATATATGTTTATTTTCGCCTTTTACGACGTGCATCAACAGGAGCACCATGCAAACAGGGAATGGCGTCGTACTGCTCTTGGTTATTTTATCTTATTTGACAGGATTTGGCCAGTCAATATTCATAAAGGAAAATGATTTCAAAGTGTTCTTAAACACAACGCAACCCATATGGACCTTCAACACGACAAACAAATACAACAAGAATTACTGCATTGTGGACGTTACAAAAAAACTGCTGGGAGAAACTGTCATGTATACTCACTCCTTCTATGTCGACCCCACGAGAAAACAGAGGGTTTCTGTTCATATGGAAGGTGCCTTGAAATATAGCAATAAAATGGTTGCCACGCAAAAAGGTTCGAAAGTGACTTTTAAGCACAAGCTCGTGTATCTTGACTTCGACAACATGTGCGCTGTGGTGAAAGTTACTCCAAAGCTTCCTATCCCTGGGCAGCCTTGGCATGACCTGCGAATGTGGAATTCCTCGCTTGTGAGACATCGCCACCCTTCGATAACCTGTTTACACTATTTCAATCTTGAAGCAAAGCATGGACGCCTAACTTATAAGCCTATATGCCAAAAACTCCTTTATCAAGTGAATCCGTATCAAAAGAAAATTCTTCAAGGGCAGAAGACGCCGCAGACATACAGGAGCACGAGCGTGTGAACTGTCGAGCATACTTCGGAAGTATGTAGCACATCAAAGCTTTCTCTAGTGGTTCACGAGAACCACTGGAGGCAGAGATGAATAACTTGTCTAGCCTGTGCTATAAATTTCCATGGGTAAAATGAACAAATCGTTGTCTGATTTCATATGTGTGGTATAATGCGCGCAGCGCTTACATAGATTGCCACAGCTTTCAAGCAGCAACACAACGTGCAACATAAATATGCTGAACCTTACAGATACGCAACCAATAAGTTTTAAATAATGTAAAAATCCACAGACAATGAAA\n>XM_027137582.2 PREDICTED: Tachysurus fulvidraco probable endonuclease 4 (si:ch211-141o9.10), transcript variant X3, mRNA 
\nGACGCAGCTAATTATGAAAACGAGTCCTCCACAGTGCTGTTTGTAACTATGCAATGGGGATAATGTAAACGAAGAAAAGACCACACTGGTTTTAAAGCGTTGAAAAGTCAGTTGGTTGACGGTCGGCCATTTTACTGCTCGGATTATACACTTAAAGTGAGCGAATCCCTTCTCACTGACAACAGTACATAAATTAAAGGCACATTGACCACGCCCCCATACCAAAGTATATGTGGAGATGGGCGGGGCTACAACACACACCTACATACCTACCTACACCTACCTCTCGATGATACAGATTGTGATCTTTTAAGGTGACTAAACTGAAAAAGAGATGGCTTCGTGCAAAAAAGGAGAGAAGAGAAGAAAAGAGAGAAATGTGAAAACGTTAGAGGAATTTGAAGACTCGGCTGAAAGGAAAGGAAGGACAAGAGAACAAAAAAAGTACATTGGTGCTCATGTGTCCATAGTAGGAGGGATATGGAAAGCAGTTGAAGCAAGTGTAGAAATGGGGGGCCACAGTTTTGGATTATTTTTGGGTTCCCAACGCTCTTGGCAAAGACCTGCTCTTGATCAGAAAGCTGCAGTGAAATTTCAGCAGGCTTGTGCTCAACACAGCTTTGACGCAAGACACATTCTGCCACATGGATCTTACCTGATGAATTGTGGCTCTCCCAAAGAAGATGTGTTTAGTAAGAGCCAGGTCATGCTGGTTGATGAACTCAGTCGCTGTAGTCTTTTGGGCCTTACTCAGTTCAACTTTCACCCCGGGGCCTCCCTTGACTCCAGCAAAGAGCAATGTATCGAGAGGATTGCCGAAGCTATAAACAATGCTCACCAGCAAATACCTGCAGTCTGTACCGTTCTTGAAAATATGAGTGGACAGGGAAGTACAGTTGGTGGAGATTTTAATGAACTGAAGTCCATAATTGACCGTGTTCGAGATAAGACACGTGTTGGAGTATGTCTAGACACGTGCCATGCATTTGCAGCAGGTTATGACATTTCTTCAGAGGGAGGAGTGAAGTCTGTGCTTGATGAATTTGACCAAGTGGTTGGACTGCACTACCTGAGAGCAGTTCATCTAAATGACTCAAAAGGTAAATTGGGCTGCCATCTGGATCGCCATGAGGACATTGGCCGTGGACAGATTGGCATCTCTGCTTTCCGAAACATTGTGAATGAACCTCGATTTGACAACATCCCTCTTATTCTCGAGACACCTGGCCGCCCAGGTTTTGAATATGCTGAACAAATACAGCTCCTGTATTCTTTATGTGAGGACTAGAATGCAAGAGGACCTCTTCATTAGACAGTTATAAAGATTTTGTGTTCTATTTTATTCTGTTCACGCATTGTATATTTCATACAGGCATACAATAAACATAAATTGGATTCATATAATCTGTTATCTGTAAAGTATAAAGTACTGTAAAGTGTAGTTGATTGCACAACTACAATTTAGTTGTTTAGTCAGCAGAGGGAGCTGGAAACAAGGAAAACATGATAGAGTAGGTTGAAATCCCATCAGTAAATCTTAAACTAGGTCTGCTAAAGCAATTCTGCTTCCATATTGTACTTTCATATGTATTAAAGAATTTACTCAATCA\n>BT130104.1 Oryza sativa clone RRlibC00934 mRNA sequence 
\nCCCTTTCATCCATCCATCCATCCATCCATCCACATAGCAACGACCTCTCACAATTCACGAATCACCACTGCACACTACACTAGCGGCAGCAAGGATGAAGCTTATTGGCAGCGGCAGCGGCAGCGGCGGGCAGAGGAGAGGGATCGCGAGGGCACTCAAGGAGCACAAGGCGAGGCTCTACATCATCCGCCGATGCGTCGTCATGCTCCTCCGCTGCTGATGATCGAGCTGAGGATGGCGTGCACACGCCTTAATTTCTTCTCGGTGGAATATCTTTCGCAGTTTTTCTCTCACCAATTCACCATGGATCGGTGGGGGCGAATGTTTGTCCCTTGTTTGGGTAGATCTGTTTGGATCTGTCTCTCTTAAATTTGTACATACTGATGAGCTAGTGTAGACCATATCAATATAGGATGCAGATGGAAGTAGTATTAGTTAGTATGAGAGGTAAATTAGTTAGTTGGGGCTGAAGAATTGGGGGTTGTCCTCTACCCAGGACCAATTTTGCCTTGTATGATGATCAGAAGTGGGAATGCAAGAGAAATCTACATGATTTACAAAACAAAAAAAAAAAAAAA\n>XM_020061516.1 Plasmodium coatneyi Cleavage and polyadenylation specifity protein partial mRNA \nATGAACAACATTAATATTGTGTGCCTGGGTGGGGCGAGCGAAGTGGGTCGTTCGTGCGTAATTATAGAAAGTGCGAACAGGTCAATTATGTTGGATTGTGGAATTCACCCTGCCTTTATGGGGATTGGCTGTTTACCCATCTATGACGCGTACGACATTTCGAAGGTGGACTTGTGTTTAATAACACATTTCCATATGGATCACAGTGGTGCCTTACCGTACTTGGTTAACAGAACCCGTTTTAAAGGAAAGGTATACATGACCGAGGCGACGAAAAGTATCTGCTATTTATTATGGAACGACTATGCAAGAATTGAAAAATGTATGCACATGATGAATAAGATGAAAGGAGGTAGGAGTAAAAATGAAGCGGGTGAAAATGAAACAGACGAATATGGAAACAAGGTTAAAAGAGGAGGACTATACTCCAGTGATGAATACGCAAGTGAAGACAATGAAGACGATGATTATTACCAAAGTTACATTTGCGAAATGGGAGATGGAGATATAAAGCATAATGTACTGTATGACGAAAATGATATAAACGCAGCGATGAAAAGGATAGAAACTTTAAATTTTCACGAACACATAGAATTTGAGGATGTAAAATTTACAGCATATAGAGCAGGACACGTGATCGGTGCGTGTATGTTCCTAGTCGAAATAAATAATATACGTTTTTTGTACACAGGAGATTATAGCAGGGAGGTGGATAGGCACATTCCCATAGCGGAGATCCCCACTATTGATGTCCACGTGTTAATTTGCGAAGGAACCTATGGAATAAAAGTGCATGACGATAGAAAAAAAAGGGAAATTCGCTTCCTTAACATGATTACCAGTATATTAAATAATAAAGGGAAAGTGTTACTCCCTGTGTTTGCTTTAGGAAGGGCTCAAGAATTGCTGCTAATTATGGAAGAACATTGGGAAAGAAACACACAGTTGCAGAAAATCCCCATTTTTTACATATCCTCTATGGCTACAAAATCGTTATGTATATATGAGACCTTCATAAATTTGTGTGGAGATTTTGTAAGGCATGTATTAAATGAAGGAAAGAATCCTTTTAACTTTAAGTTTGTAAAGTATGCGAAATCTTTGGACTCCATTTTGAATTATTTATACCAGGATAATTATCCGTGTGTTGTTATGGCTTCGCCTGGTATGCTACAGAATGGAATTTCGAAAAATATTTTTAACATCATTGCACCTGATAAGAAGAGTGGAGTTATCCTTACTGGGTATACAGTCAAGGGAACTTTGGCCCATGAGTTAAAAACTGAACCGGAATATGTCCTCATTAACGACAAACCGGTT
AAGAGGAGGTGCCGCTTCGAGGAAATTTCCTTCAGTGCTCATTCTGATTTTAATCAAACTAAAACGTTTATTGAAAAGTTGAAGTGCCCAAATGTGGTTCTTGTGCATGGCGATAGGAATGAATTGAACAGACTGAAAAATAAGCTAACGGAGGAGAAAAAATATTTGTCCGTTTTTACGCCCGAGTTGCTGCAGAGGCTGACTTTTCGCTTTGAGCACAGTGACCACGTGGTGTCCCTAGGTCGGCTTTCCCAACATATTAGAGGGAAGCACCAACCGGGGGATGAAAAACTGAGTGACAGAAATGGAGAGGAAAAAACAATTCCCAACGGGGTGGATGCCATAATAATATCGGAGCCGAAAGCCATCCCGATTATGATTTACGCCAAGGATATTTATGAGTATACAAATTTGAAGACTGCGCTGATCGACCAGACGATTAGCATAAAATTCCCCTACAAGTTCGAGCTGCTGTATCATATGTTGAAGGGTGTGTACGAGGAAACGCATATGGAGGGTGAAGGCAGCGAAAGTGGGAATAGTAACAATGGTGATAATGGTGTCAATGGTGACAACGGCGGAGCGGTCATCTTCGTGCAGGACGTAAAAATCCACCACTGCAGGAAAGAGAAGGTTATTAGTATTAATTGGCTTTCAAGCCCAGTGAACGACCTAGTAGCTGACAGCGTCAATTTTCTAATTCTAGAATTTCTCGACACCATGAAGAATAACAACAACCACCTGCCCATCTGCGACGAAGTAACAGATGATGAGATTTATGAAATGATCATTTCGTATGTGCGGGAAAATTATACCAATGTGGAGAGATTTTCCAAAGTGGAGTTGAAAAGGTTTCTTTTGCAAAATGGCTGTGACAGTCCCGAGGGGGGAAAAAACGAAAAAGCAAATGCTTCATACACAGATGGGTTGACCCATTTGAAGAATGCCCAATCGTATTCATCTGGCAGGGTGAACCAAATCGATCATAACAGAATGGAAGAAGGGGTTACTTTACACGAGGAACATGATGAACAAAGCGGGGATGGAGACAAAATGAAGAAATTCCGCGCCCTTGATAAAATCTTATTCGACTATATCGCGGCAGATGCTAGTTTAGCCATGTCCACTGATGAGGAGGAACCCGTTGTACCGGTTCTTAATGGCGGGATGCTTTATGAAATACTAAAGTTTGAGGTGAAGGATAATAACAACAACGACGTTAATGTGTACGTCGATATAGACAACCGGGAAGTCATCTGTGAGGAAGTTACAATTTTGTCAAAAATTAGAGAAATTCTAAAAAATATAGAGGAGTCGCTATTGCCCATGTGCTTCTAA\n>XR_001369330.2 PREDICTED: Pelodiscus sinensis uncharacterized LOC102457183 (LOC102457183), transcript variant X2, ncRNA 
\nTTTCTCTAGTGCTCAGTCATTGCCTAGTGCCAAGGCTCAAGATCTTTCTCTGCCCTGAGCTGAAACCGTTGCATTTGTTACATTTGTTCTAGAGCCACTGGAGCATTTCAGGCCATTCATCTCATGAGACACGTGAACTAAAGACACTTTGCTGGCATGGAGATGGCCAGTTCCTGGCACAGGACCTTTCCAATCAGTACTGCTCTGCATTGCAAGGTGCAGAAGGAAGCAGAATTGCAGGAGTTTGGTCAAATCTCCAGGAGATCATAACAAGTCCATAAGAGTAAGTCACCACTACTTGCAGGGATCTCGTGTGGGGCTGGCATATGCTTCCATTACTTTGTCACGTCTGCTTCTAGTCGGGTGCGTGACTGCAAACATACGAGAAATCTCTCAGAGTACCTCGCCTGCATTTTCTCCTGTTCCCAGACTTCCTTCTTGTGAAGCAACTGGCCCAACAGCTACTTGGCTTCTTTGTGATCTTGAAGACACTTTACACTTAGATTTGATCATCACCTGCTGGGTTATTTCCCCAATCCTCTCGTTTATGCCTTCACAATGGTGATTGTGTTTCTAGAAGCTCTATGTGCAACATCTGGCAAGACACAGGCATCCAAGATGGCTCCGCCTGACTCTATTCTTCATGCCACGGTGCCTTTGCCTGGCTTTGCCTTAATAGTTTAAAACAGCTGGTCACAGATGATTCAGGAAAACATGAAGAGGAAGCGTTATCTGTGTGTGTAGAGTACAGGCGCTACGGTTTTTGCTTCATTCTTCTTTAAAGAACCAGTGCGAGACTCATGTTAGACATGGGGAACAATACCTCCTACGCTACAGCATAGGGAGAGAAAAACACTTTTGGGGTTCTTGCCTTTATGTTCTAGTCCATAAATTCTACTTTGCTATATATAATCCTTAGCTAGAGGTACAGGCAGTCCCTGGGTTATGTACAAGA\n>XM_048564862.1 PREDICTED: Pyrus x bretschneideri LIM domain-containing protein WLIM2b (LOC103942600), transcript variant X2, mRNA 
\nGCTTTTTATTTATATTTTATAACGCCTTTAAAATCTCTCCCATCGGATTTGGAGGGGTCTCTCTCACGCTCTAATCTCTGTAATTTCATCGTCGTCGTCTTCCTCCACTACGCCGCATCCGCTCCCTGCAAAAAGCCTTCGCCATTCACCGTCCGCCATCTCATTCCTTCTGTACGGAAAAGGACCCATTTGCGCTCCTCACTTTTTTTCGCTCTTTCCATTTTTCAAAATCTTTTCTCTTTTATTCTACCCTTTTTATTTGTCGAGATTTTTTAGCTTCACTCAGTCAGCCTTAAAGCTTTTAAGGGTACGCTTTTCTGACTCTGAAGAATGTTTATTGACTTCAATTTATAATCTCTGCTGCCAGATCTCCATTCATTTGTTCTTGCATTTGTGTGCTTTGAAGGTGGAAGCTTAAGAGGTGGTGGTCTGGGTTGGGAGAGAAGAATCAGATCTAGAAGGAGAAAGAATTATGTCTTTCATTGGCACCCAGCAGAAATGCAAGGCTTGTGAAAAGACAGTTTACCCAGTGGAGGAGCTTTCTGCTGATGGGATTTCCTACCACAAGTCTTGCTTCAAATGCACCCACTGCAAAGGGACTTTGAAGCTGAGCAATTATTCCTCAATGGAAGGTGTCCTGTACTGTAAGCCTCACTTTGAGCAACTGTTCAAGGAGACTGGCAATTTCAACAAGAACTTTCAGTCGCCTGCAAAGTCAGCTGAGAAGTTAACTCCAGAGCTGACTAGATCACCTAGCAAAGCTGCTAGCATGTTTTCTGGAACACAAGACAAATGTGCTACTTGTGGTAAAACAGCTTACCCATTGGAGAAGGTGACAGTGGAGAGCCAGGCCTACCACAAGTCGTGTTTCAAGTGTTCTCACGGCGGCTGTCCTATTACTCCCTCAAACTACGCCGCCCTGGAGGGCATTTTATACTGCAAACACCATTTCTCCCAGCTTTTCAAGGAGAAGGGGAGCTACAACCATCTTATTAAGTCTGCATCAATCAAGCGCACAGCAGCTGCAGCAGCAGCGGCAGCAGCAACAGTAGCCTCCATTCCAGAAGCATAAATTCCATATTTAAATGTTCGATTACATGGCTTTCGTTTGTTTGAGAGTGTTGCATCCCTCTTCAACCTCACGCTTTTCCATGGCGGAGTGAGAAAACTTGGTTCTTCTCTTTTGTATTTGGCTCATCAATCTTGGGCACATTGTTGTGTTTTGCTTCATGTATGTGATTCTGGGTCCGGCAGTTAGTAAAATGACCTTCTTCGGGA\n>MG270501.1 Uncultured bacterium clone OTU7751 16S ribosomal RNA gene, partial sequence \nGTGAGGAATATTGGTCAATGGGCGGGAGCCTGAACCAGCCAAGTCGCGTGAGGGAAGACGGTCCTATGGATTGTAAACCTCTTTAGGCGGGGAGCAATGCCGGGCACGCGTGCCCGGAGGGAGAGTACCCGCAGAATAAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATGCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGTAGGCGGATTTTTAAGTCAGCGGTAAAATGTCCGGGCTCAACCCGGGCCGGCCGTTGAAACTGGGGATCTTGAGTGGGCGAGAAGTATGCGGAATGCGTGGTGTAGCGGTGAAATGCATAGATATCACGCAGAACTCCGATTGCGAAGGCAGCATACCGGCGCCCGACTGACGCTGAGGCACGAAAGCGTGGGGATCGAACAGG\n>MT590786.1 Dendriscosticta praetextata isolate 16_52820 small subunit ribosomal RNA gene, partial sequence; internal transcribed spacer 1, 5.8S ribosomal RNA gene, and internal transcribed spacer 2, 
complete sequence; and large subunit ribosomal RNA gene, partial sequence \nAAGTAAAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTATCGAGAGAGGCGTCCCGCCTCGGGGGGGGCTTCCGGCCCCCCGACTCTTCACCCGATGGGTACTCAGCAGCGTTTCTTTGGCGGCGGCTCTTCCGCCGTCCGAGGACCCCCTCCACCACTCCAGTGATTGATGTCGTCGGAGCGCGAAACGAATGAACGCAAAACTTTCAACAACGGATCTCTTGGTTCTGGCATCGATGAAGAACGCAGCGAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCCTTGGTATTCCGAGGGGCATGCCTGTTCGAGCGTCATTACACCCGTCAAGCCGTGCTTGGTGTTGGGCCGACGTCCCGTTCCGGGACGGGCTCGAATGGCAGTGGCGGCCCGGCGTGGCTTCGAGCGGAGTAGACGTATGCCGTGTCGCTCGGGAGACGCGTCCGGGTCCGGCCAGTCAACCCTTTTTTTTTCTATGTTTGACCTCGGATCAGGTAGGGATACCCGCTGAACTTAAGCATATCA\n>CR627091.1 Homo sapiens mRNA; cDNA DKFZp779E152 (from clone DKFZp779E152) \nTGTGCAAAACCCAGGAGCCACCCCTGCCAAGTGCTGGGCGTGTCTGTGGAGCAGATGAGGCCACAGGCACTGGCCACAGGACTGCGCTGTCTGGAGAGGGATTCGCACACATTTGCAGGGGTGCAGGGCTGGTGTTCTCAGGATTTTGCCTGGCTTCTCTGGATCCGGAGGTCCTGGGAAGGTGGCTTGGACCCTGGTGGGCGGAGTCTTTGAAGTGCAGTCTGGAATCTTCCATGCACAGTTGGGCGACCTGGACAGTGCCCACTGTGTTCTCTAGAGAGTTCCTCAAGGATGCAGCCCCTTTGTCCAGACACTGTTGCAGGAGGCAGGGAGGGAGGCCTGCCCCATGTCCCCTGGATGGCAGGATGGGCTCCCACCTTGTGTCTGGCTGGGCTGTAGTGTGCGGGGCAGCCAAAAGGCACCCTCCGGGTAATCAAGGCCTACCCCACATGGGGACTCTGGTGAGAACCGGGCCTCCACCGACCCCCTGTCCAGGGTGCAGGAGCCAGGCCCGTGCTGTCAGCTGTGTCTGTTTGTCTGTGGTTTCCCTGTGGCTTCATGGCACATGCAGGTCTCTCTTCATGCTTTGGGTGTGGAAGCCGTCGTCAGCTGAGAGTGTTCTGTGGGTGGGTAGCTCTCCTTCCTCCTGAATTTGGGGTGACCTTCTGTGTGGAGGCCCATGACGGTTTCCCATGCATTCTGGGGCTCTGGGATGCTGTGGGCACGAGTTCTGGAGGGGTCTGCACACCTAGGTTCATCTCACGGGCCTCGGGGTGGGCAGAGGGTCCTGGACTGCAGGGACTTGCCCTTCTTTGCAGCTTTGTGCTTTGGTGGTAAAGAAAGGGCTGTGTCCTCAGCCACACTGGGAGCTGCTGCCCTTGCGTGGAACAGGAGCAGCTGTTTGTGGGCAGTCCAGGTGTGGGCTGCAGGCGGGTCGGGGTGGGCTGCAGGCAGGCATTTAAGGAAGTCACAGCTCCAGGCACCAAGGAGGCAGTGGCTGCTGGCCCTGTCCTTTGCTGCATTTCTGTGGACTCCTAGCCCAGGGAATGGAGCCCTGGAGGGTCCCAGGGTAGTCGGTGTCACCTGAAGTGTCCCAGGGACACCTGGTCCTCTGGCTGATGGGGCCGCCCTGTGGGGTAGGCCAGGCCCTGGCTCTCTGGCCCTCAGGGCAGGGTGCGGGTTCCCCACTTCCCCGGCCCTCACACACACCCTTCCAGCCACCCGCGTGAGCATGCTCCAAACACGGCCTTCTGCCCTTGCCTTTTCTTC
TCCTTTTGCGTTTTAAAAATCAAATCAGCGGTTCGGAAGGCCTGGAGCTTGGAGGACTCACGCAGAGGCGGCCTTCTGCCTGCCCTCAGGGGCTCCTGAACTTCCCAGAAGCAGCCCTCCCTCCCAGGCTGAACTTTCTGTCTCAGTCCCCGCACTTTCCCAGCTAGGCGGGCTCCTTGTTCCTGCCCATTTTACTCCAGAAGCGAAGCAGGCAGGCCCGGGTTATCCTGCAGGTGCCAGGAGCCCCCTTGGCCAAGCTCCATCTGTGCATAATGGGGGCTCCAGTGGTTTGGGGGGTTGGTCCATGGGAGAACTGGATGTTCACCAGGGGTCAGCATTGGCCTTGAAGTGTGGAGAAGGGTCATCTTGGCAGAGGTGGCAAGGTGGTGAGCCCCTGGGGCTGAGCACAGGTGCGTCTGGTGAGAGGGGCCTGGCCATGACCGCAGTGACTGCTCTTCACTGTCACCTCCTTTGCTCCTCAGGCCACCTGCGCAGAGGGTGTGATCCTTGCATGACTTTGCCATTGAGGAAATGCAAGGGTAGAAAGTGCAGTCTCGTCGGCCGCCTCGGCCTCTAGAATGCCCAAGCAGTGGTATCAACGCAGAGTCGCCATTATGGCCGGGACCACAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA\n>JN907114.1 Uncultured microorganism clone GF13U7304JJ6AB 16S ribosomal RNA gene, partial sequence \nGAGTTTGATCATGGCTCAGAACGAACGCTGGCGGCGTGGATAAGACATGCAAGTCGAACGGGAGAATTGCTAGCTTGCTAATAATTCTCTAGCGGCGCACGGGTGAGTAACACGTGAGTAACCTGCCCCGAGAGCGGGATAGCCCTGGGAAACTGGGATTAATACCGCATAGTATCGAAAGATTAAAGCAGCAATGCGCTTGGGGATGGGCTCGCGGCCTATTAGTTAGTTGGTGAGGTAACGGCTCACCAAGGCGATGACGGGTAGCCGGTCTGAGAGGATGTCCGGCCACACTGGAACTGAGACACGGTCCAGACACCTACGGGTGGCAGCAGTCGAGAATCATTCACAATGGGGGAAACCCTGATGGTGCGACGCCGCGTGGGGGAATGAAGGTCTTCGGATTGTAAACCCCTGTCATGTGGGAGCAAATTAAAAAGATAGTACCACAAGAGGAAGAGACGGCTAACTCTGTGCCAGCCGCCGCAGT\n>XM_019753900.1 PREDICTED: Rhinolophus sinicus cytochrome c oxidase assembly factor 5 (LOC109459430), mRNA 
\nTTCCGGTTCTTTCCTCCGGACGTTGTTCGCTCGCAGCCGGGTCGCCGCGGTTGCGGACGGAAGCGGTGGGGACGGCGGCGGCCGAGAGGCGCGGCCATGCCCCGGTATTACGAGGACAAGCCGGAGGGCGGCGCGTGCGCGGGCGTGAAGGAGGACCTGGGCTCCTGCCTGCTGCAGTCGGACTGTGTGCTCCAGGAAGGAAAATCCCCTCGGCAGTGTCTGAAGGAGGGAAACTGCAAAGCTTTGAAATATTCATTTTTTGAATGTAAAAGATCAATGTTGGATGCCAGATCAAGATTCAGAGGAAGAAAAGGATATTGACACTACTATGTTGAAACTGAGCTGAAAACAACAAGGGATTTTTTCTGGTCATTAAAACAGAGAAGCCAAAATAGGAAACATACTTTTTCTCACATCCGTTTGGTTAGACCAGTTTTTCCCTCCGTGGGACACTGGAGAAATGCATGAGTTCTAGTTTTGAATATGTATAAATGATCCTCTTGCTCTAAGTTATTTTTAGAAGAAAAATGTAATGGATGAGTTACGAGCTCGGAGTATGAGAATTGTTCTGAAGCACAAAGAATGGAAAGGTTGTTATTTTCAAACCTGACTCCTCAAATGACAATTAGTACATCCTTTGTGAATGTTATCAAGGCCACTGATGGGACTGTTAAAATGAGGAACATGGAGCCTGGGGAGAAGGTATCTATTGGGAAAGTTTAGGATACAACTTTCTGTTATTCATTCTGTCCTGTTTACTTCTAAAATAAACTGTGTTTGATTCCTGGGA\n>XM_052447470.1 PREDICTED: Populus trichocarpa kinesin-like protein KIN-10C (LOC7454519), transcript variant X5, mRNA \nTTTGAAAAAAAAAAACAGAAAAGAAACAGCAGAGCCCTTCCTTCTTTCGACGTCTCTCTTTCCTTCTTTCCTTTTTTATTATCATCAAATTAATTACTACAAAATATCATCCATTTCAATCTCTCTCTCTATATCTCTATCTACGAATTCAAACACTCTCTCTCTCTCTCTCTCTCTCTCTCTCAATCAACCAGGTAAAGAAGAAGAAGAAGCAGAAGCAGAAGCAGAAGAAGAAGAAGAGTAAAGATGAGTGGCGTACCAAGAAAGCAAAACCTCAACCCCAAGGTTCGCGTCATTGCCAAAATCAGAGGTTCCTCACATCTTGACGGTCTTTCAACTTCTTGGATTTCCGTTCACAATAACATACGTGACGGCATTTTTTCTCACTCTCTCACTTTTTCTCTTGGAGACCGACCAGTTGCTACCAGTGGTGGTGGTGGTAGGAAGGAGGCTTATGTGGTGGATTATTGCTACGAACAAAACGAGAAAAATGATTTGGTTTTTGAAAGAGAAGTTAAGCCTTTTATTAATGAAGTTTTTGATGGCCGTAATGCCACGATTATTGCTTGTGGAGCAAGGGGCACTGGAAAATCCTACCTCTTTCAGGGTACGGATGATGAACCGGGTCTGACAGTGTTGGCTGTGGATGAAATGCTTCGATTGGCTGCGGATAACGGGAAGTCCATTGCCGTTTCCTTTTATGAGGTTGATCAAGATCATCATGTCAAAGACTTGTTGGATCCCAATCGACAACAAGTTTTTGTATTGAAGGATGCTCATGGAAAAACACAATTAAAAGGACTTTCTCAGGTTTCGGTGACATCCGTGTCTCAATTTCACAATTTCTATGGTGGTGGGACTAATCCACGTAAATCGATTCAGAAAGCAGTGACTGAACTTCCCAAGAGAAGTCATAAAGGGTTGATAGTATATGTATCGTCTCATGGTGGAGAAAAGTTGGACGTTTCTGTCAGCAAATTGAATTTTGTTGACTTGGCAGGTTATCAGGATGCTAGAAGGAAGAGTATTGATGGACATAATTTGGTTGAGAGTACAAGGAATATTAATAAGTCCATTCATGCCATT
CATAATGTTGTTTACTCTTTGAAAGCTAATGAAACTCATGTGCCATACCGGGAAAGTAAGATCACTACCATGTTGCAAGATTCACTAGGAGGGGCTGGCAGAATTTTGATGGTCACTTGCTTAAACCCATCTTTTTGCCAAGAATCTATTTACATGGTGAAATTAGCATCTCGTTCTTGTCAAGGAAGTAGTTGGGCTATCACAGACTCCACAAAGAAAGCCAACAGCTCAGCAAGACCAATGGTGCCTTCTTCACATAATAGCCGGATGCTTGGTAGTGTTTCCACATCTGTGAAGAAACAAATTGTGTCTCGAGGGCACATTTCTGGAAAAAAAGCACACTGTTCAACTTCCACACTGAAAGCTAGGAAACTGTTTGATGAGTCAAGTGATTTGATATCTCAGAAGATTACTGTGCAGCCAAGTTCCTCAAACAATGTTCCAACAGTTGAATCTGTTATGCATGAAGCGGACCAGCTCACTTCAAATGTTGCCAAAGAAGCATCATCTTTGGAAGAAGGTGTATCATTGTTCACTCATGAGGATTCAAACTCTGTTTCTGTGGATGTTTCTCCTGTAGCAGCAATTTCTAGTACTTGTGAAACTACAATACTTGATAAGGAAGTTTCTCCTGTAGCAGCAGTTTCTGTTACTTGTGAAGCTACAATACTTGATAAGGAAGCTTCTCCACTAGCTATTTCCAGTACTTGTGAAATTACCGTACTTGATAAGGCTGACGAGGACCAAAACAAAACTGTGCTTTACACTGGAGAGTTATCTATGTTCAATGAAGGTAAAAAAATAGACAAGGAAAACAACAGTTCAATTGTCAATCAAGGTGGATCGCCACCCATTAGCGCACAATTGCAAGAACTATCAAACAGTTTGAAGTTACTATGTTCCTCAACCCCATCGTGCATGGATATAACACTAAAAAATGATGCATTTCACAATCAAACTTCAACTGATATCGGGGAACCAACAACTCCCAGTTCAAGTATGAGAGTAACAAATAGGGAAATTACAAGCTTTTGTAGTCCATGGGAAAAATTCAACGCCCGCAGCACTGGGATGAAGAACTCACTTGTTCAAGATTATCTTAGATTGTTGAACACAGCTGACAAGGAAGAATTGAGGAAATTGAAGGGTATTGGAGAAAAGAGAGCTACTTCCATCCTTGAACTTCGAGAAGATTGTCCAGAGCCATTTAAGAATCTTGATGATTTGAAAGACATCGGACTCTCAGCCAAGCAGGTAAAAGGATGGCTTAAAAAGGAAGTTGGGGGACTCTTTGATTAGCATGGCAGCTATGATTAATATGTTGGTTTGGAAGATAATTTACTTTGGGCAACCGAAAGTTGCTTTGAAACTTAATTAGAATTGATTGTAAAGTGGTTACTATATATATATAAATTTGGCATGCATTATTATTCA\n>XM_013532536.1 PREDICTED: Lingula anatina FMRFamide receptor (LOC106157047), mRNA 
\nTACTTATGAACTCCGCTGTGACCAAAAAAAGGAGAAATAAAACACAAAGAGAAAACTGATATTTAAAAAAACTGTAGGTAGAATTGACCTCTGGAAGTGAAAAAACCAGCACCAATATAAACTTTTGTACCTGGACTACCTTATCTGAAGTACTGCTCTGAGGAAAAAGAGTCACCTGTCAAGAATGGACCACTCGGCATTGATATTGGGAACCTTGATTCCAACGGCTGCTGCTGAGCCACAGGGAAATCTCACTGCTGAACTTTACATGGCAGGAGGTGGCGAAAACCAGTTTCCATCCCATGACTTGAGCTACCAGGACAAGCAGCAATGCTTTAATTATGCCAATGGCTCTTTTAAGGATGATGAGCGACTTGAGCAGATACAGTTTGTGATGTTTGGAATAATCTTGCACATCATTTGCATATTTGGAGTTGTTGGCAACCTTGTTTCGTTCTTTGTCCTCAGCAGAAAAGAAATGCGCTCCTCTTCCTCCTGCTATCTTATGGCTTTAATGATATTCAATACAGTTGTCCTACTGACTGCATATTCCAATGATGTTATGACAGGTATTGGAGTGGGAAGCATGTATGGCGCTGTTTCCAACTATATCCTGACATTTGGTTCAGCTGTTGGTCAGTGGTGTTCCGACTGCAGCACTTGGTTGACCATTGCCCTCACTGTAGAACGCTACATATTTGTCTGTCACACTTTTCAAGCTTCAACAATGTGTACCATGCGCCGAGCCATCATAGTTATTGTGTTTTTGTCTATTGGGATGTTTCTTTATGATATCCCATGGTTTCTGCGGCAAGAAGTGAGAAGTGTCACTTGTCCATTTAACGATGAGCCTATCACATACATTGTGATGCGTTCTGAAAAGCATCGCCCTTCAGATATGTACTATAATATACAGCTTTTGTATATTATGCCTGCCTTATTTCTCATTGTGCCCATATTTGTTTTGACAGCGTTCACAGTAATCTTGTTACTTGAGGTGCGAAAGTCAAATAAGCTACGCCAACAGATGTCTACCACACAGACTGCTGAGATCAATGTCACAGTTGTTCTCATCAGTGTTGTTGTGGTTTTTCTTATTTGCACCCTACCAAATTGTATTTTTGCCATTACTCGCACTGTTAAAAAAATTGAAAAAGCAGACGACCCATATTTCGACATTTACTTCACTTTCACTGGAAGAGTCTGTTTTATTGTAGCAAATGTGTTCTTTTATTCAAATTCAGCTCTAAATTTCTTGATTTTTTGTACAGTTGGTCAAAAATTTAGAAAAACATTCAAGCGTATATTTCTTCGACGCTGCAAGTTCTTGACAACGGAAGTGGTTCGTTACAGCAGTGTGAGTGTTGGCTCGAGAACTGGTTCAACCAGGGCAAGCTTTTATCAGACTGAGACAAACATATAGTCAGGTGACAAGTTCTATAGTTATTGGAAATGCAAGAGAGACTGATTTTTTAAATGAAAGTACTATCATTTCAATATTTATAAACATGATTTATAAGTTGCATTGATACTATCATTTTGATTTTGACAACATATATGACCTGATTCTTTTAGAGTTAAAAAGGGTCATTTGCCCATGAATTGATGTGTTTTAATCAGTTTATAAAAGTACAATTAATGAGATTTGATCTATATTCAGGTAGCAGAATATCTGTGGATTTTTTGTTTCAAGGCAACAGTTTCTGAACATGAAAAGGTTAAATTAACCAAAGCAGAGCAGGAAATGTAACTTTTGATGCTATTGATTTTGCAGCTCATGCAAAAATGGACAAAAAATTCAAATTTCTTTAAAACTAACATCAGTTGTGGTAAATCGATTTCCCAGGACGTCACAGTTGGTAGAATGATCCAACAAAAACGTCATATTACAGGAAAGACAAGGTACTAGAAACTAGATTACAGAATGGAGTTCAGGTTCTATTAAGATCTATATTTGTTACTGAATATAGCAGAATTCTAAATTTAAAGGTGCTTCAG
AATTTTTTGTAACATGTTGATGGTGTTATCACCCATTTACTACGTTGTGGGTAATTTTTACGGTAATCGTTATTTCGATTAGAGCAAAATGCTTAATGTACTTTGTATACATGTAACATAATTTATACCACTGCTCAAGCAAGAAACAATGGGTCACACCATGACCTGTTCCAAGCAGAGTCGTGGCACACATGGTTGAGTATTGATTCCATTTCTAATTGGTTTTAAATCTGATAAAGCTCTCGTGCTGAAGCTTAGATTTATGTAAAATGGAGGAGTATCCAATTATTTCCACTATTTTACTTAAAACTTTGCGATCTTTATCTTTCATGTTATTGTCACTGCAGAAGTGGTCAAAATATCACAGCTGTTCATTAATGACATGTTTCAAATATGTATCACGAGGCACTTGTGCTTTTTTTTAATGTGCAAGTGACGTGAAATTGAATTTTAATTTAAATATTTATTAGGTAGGTCTGTATTTTACATGATTTGCCAGTGTAACGGTTGTATTTTAAGCTACTTTGGCTGAATGTACTTTTTATGTAAGACTATAGTAAAATAATTAAGTCTGATATTGTTTGATAAGTTGGTGTGGCAGTAGATTGTAATTTTTGTCGATCTATTTAGTTTCTATGTTTGCTTGTTTGAACTTTTCACCTAAAAAATAAATAGTTATGTTTATCATGATCCTACCTGTTTATTGTGATTCTCACAATAAGTA\n>XM_030059219.1 PREDICTED: Myripristis murdjan zinc finger and BTB domain containing 5 (zbtb5), transcript variant X2, mRNA \nAGGTCATGGATGCGAAGAATAGCGTCACCTTGTGAGTCTGGCTGTAAAACACAGTCTGGGAGAGGAAATTCTTAGGGAATATTATACATACATATTCATACCTGAGCGGTGGGGATTGTTAGCTAGTAGGCTCCCTCGTACAGTTTTTGGTGAACATCTGTTTTAAACACAACTTAGCGTGTAAACAGATGTGTGTGTGTGTGTGCTGAAGCTGCTCCAGCCCGTGGATGTAACGGCAGCTCCAGCCAGACAACCGTCGCGGACGCACAGCCACGGCAGTGCCCCCGCCCCTGCCCTGACCATGCACCCTACATACACCGGATAGAGGATAACGGTGGGACACGGAAAAGATTTGGATAAACTTTTGGGGTTTTATCGGAAGAAAGTAGCCTTGCGATACACAAACATTAATCCTGGTGGCCGCATGTGAGTGCTGCTTGAAAGCGACAACTCAGCGAGCTAACGGGCTAGCCTGCTAATCGCTAGCCAGCTAGCTTTGTTAGTTGGTGGTCGGGGGCCCTGTTGTACTTCGCCTTACACTTTTACCTTCACCTGTTCCGGACAATTCAAGGAACATGGATTTCCCAGGTCACTTTGAGCAGATCTTTCAGCAGCTGAATTACCAGCGTGTCCATGGCCAGCTGTGCGACTGTGTTATAGTCGTGGGCAGCCGTCACTTCAAGGCCCACCGCTCAGTGCTGGCAGCCTGCAGCACCCACTTCAGAGCCCTGTTCACTGTTGCAGAGGGAGATGCTAGCATGAACATGATCCAGCTGGACAGTGAGGTGGTGACAGCTGAGGCTTTTGCCGCCCTGGTGGACATGATGTACACCTCAACACTGATGCTGGGAGAGAGCAATGTAATGGACATCCTCCTTGCAGCCTCACACCTGCACCTCAACAATGTAGTCAAAGCCTGCAAACACTATTTGACCACCCGCACCCTGCCCATGTCCCCATCATCTGACAGACCCACCCATCGCCACCCTCAACAGGACCAGCCGAGACACAGGCAGCAGCAACAGCAGCAACAAGTAGCAGATTTAGCAGTGAATCCTAATCTAGCAGCTAATGCCAATCTTGCAGCTAATGCTGCTACATCCAGGTTGCAGCGCTCCTTCCTTCTGCAGCAGCTGGGGCTGAGTTTG
GTGAGCTCTGCCCTAGGGGGGATGGAGGAAGATGGGGTGGGCAACGTAGTTGGCAATGGAGTAGTTGAACAGAGAGCTTCCTTTCCAATCAGACGCTTCCACAAGCGTAAGCCCTCTCATGCCCTGGCCATATCAGATGACAGACCTCGGCAGAGGGCGCGTCCCTCTGCCCCTCCTCGGGGTTTGCTGGGAGAGGAAGGGGTTAATGTTGAGCGGGAGGAAGGAGCACTGCTCTCTCCGGATTCCCATAAAATGGGAGATGAATCGAAATTGGATGCTGCAATTGCGGGCCTAGTGGGGGTGTCCCCAGATGATCCTCAAATGCCTAGCCAGTCAGACAGTGGTCACTGTGAAGGAGAGGACTCAGGGAGGATGCAGGGAGGAGTGGGGAAGGAGGAGTACATGGAAGACGGGGATCACCAGGACAATAGAGTTGGGACTAAGATTAAGTCTGGGACGGAGGAAGAGGAAGAGGTGGAAGCACAGGAACAGAAGGTGGTGGTAAAACGAGAACCACTGAGCTCCCCTGAGCCAACAGATGAAACCAGTGATGTAACATCACAGGCAGAAGGCAGCGACACAGCTGCGCCCGGAGGCCAGGAGGAGGAGGAGAAGGTGGAGCTGAGCCCAGAGAGCAGCGACCGCAGCTTTACCTCTGACCCCCAGTCCAGTTCTGACCCTCTGCTTAAGCCCAGCTCCCAGCTCCTCCTCAAGACCAGTATGGGTGGAGGCGCTGGGGCTGAAGGAGGTGGAGGAGGTTTTGGGTGTAGCAATGGATTGAATGGCAAATCTGGTTTCAGCATTTCCAGTTTTCTCAGCCCTAAGGGTTTCAGGGGTGGCGAGGCAGGCTTGGTTGCTGGGGACGATGACCTCCCCAACACAACAACTGGTGATGCAGCCACACATCACTTCCTGCTTGGACAGGAAGCTGCTGGGACATCTGCCTCTGCTTCTAGCTCTCTCCTGCAATCCAGTTCACTGAACTGTGAGAATCATAGCAGTTTTGGAGACAGCCTCCAGGCTGATTCTCTTTTCCTTCGACCCCTGCATGACGGGTTGGGAAGCCCCAGAGGAAGTGGAGGAAGTGGTGGAGGAGGAGGGGTAGACCCCTTTGGTTTGGACTACCAGCGCTCCAGTCTGGGGCTGCACTCCCTGGCACGAGCCACAAGAGGGGCTGGAGGAGCCGCTGCTGCTTCTCTGGGCTACCCAGGCTACCGTCGCATAGCTCCCAAAATGGCCAATGGCATGGGAGGAGAAGGAGATGTGGGTGCTGTGCTCCAGGATGCTGCCTCCTCCTCCTCAAGTCTAGGAGGGCCCCTGCTTCTCAATGAGAGCGGTGGTTATGAGATGAACAGCGGCAGGCCCACTTCCCTTCCCCCTCAGCTGACACGAGCCTCTGCCGATGTGCTGTCCAAGTGTAAGAAGGCTCTGTCAGAGCACAATGTCTTAGTTGTGGAGGGAGCCCGAAAATATGCCTGCAAAATCTGTTGCAAAACCTTCCTCACCCTGACTGATTGCAAGAAGCACATTCGGGTCCACACAGGAGAGAAACCCTATGCTTGTCTCAAGTGTGGAAAGCGCTTCAGTCAGTCCTCCCATCTATACAAGCATTCCAAGACAACCTGTCTACGCTGGCAGAACAGCAACACGCCCAATGCCCTGCTATAGAACTGAGACAGCTGCATCAAAACACCATCTATTCCCCCGCTCCTTAGAGCAAATCATGGTATGGAACTAATCAGGCAAGCTCTCAGTCACAGTGGTGCCTCCCCTGCCTGTTCATGTGGCCTGTCATTTGTTTTGTTACCCACTCCCCTCTCCCGACACACACACGCACACACATACAAGGAATTATCCAGCAGCTGTCATTACCAGCTGTGATGTATACAGTATATGGAAGCCCCGCTTCCCCAGCAAGTTTGCCATCATTACTCTTCTGCTGCCTCTGGACCTCGCATCTTGGAAACTTCTGGGCTCTTCTTTTGGATGCGGTAAACCCC
AGTTGTATGTATCCTTGATTCAGATATGGATTCCAGATATATTGCTTCTAAAAAGGAAGTATTAATCCAGAAACTGTTAAGCATCTAAACTTGTGTAAGAACTGGTGGTAGTTTTGTGCGTTCTTGATGTTTCTGTGTACTGTAGAAAGAGAGAGGGTCAAGCTCTATCCTGTGTGCTTGTTGCTACCTCCATTCCCTTAAGAAAGGGTGGAAAGCCGAAGATGTTAATGAGGAGGAGTTAGACCATTCCTCTTCTCGTACTAAATCAGTTCAAATCCATGTGAGATGTTTGACATCTGAAGTTGCCTTTGCGTACAAGCACCTTTTTAATCACCAGTGGTTTTGTTTAGGTTACAGAAGGGGAGAGCTAATTTGTCCCGGCTGGCTTTCTTTACTTGTAGTATCAGTGACTCAGAGCTCTTGCATGCAAAAATAAGGTTTGCACTGACAGGGCATTGGGTCTGTAAGTGACTTAGCTGACGAGTCACTGCTGTGGCCCATCGTGGATGGTGTAAGAGACTCAGATTGTGTTTATGTAATAGTCTGCAGCTGCAAAGATTTAAACAGACAAATCAGGTTTTTGCTCCTGAAAAGTTTTAACATGTTAACATAGCTAGCTTGCAAGCGTAAACTAGGTAGCACTGAGTGAAAACATACAGAAAAAAAACTCTTGTCGACATATTAATTATCTAATGTTTATTCCGGCTGTTGACCACTGGGAAGTTTTGAATGACTGTAACCAACTTCTTAACCATTTTGCAATTGCCTGTTGGAACTATTTATAATACAATGAAGGCACATCAGTCGAGCAACAAACAAGCATGAAAATCTGAGCATCTGTTCCCCCGTCCCAATTCGGCCCTTAAACGCTGACGCCCAGGAAATATACTGTGCGGCTGTAAACTACAAAAAGAACATTCCAGTGCTGCATCCTTTACACAGACATGTTGAGAAACATGTCTTTTCTTAGTAGTATGGTATATTTATATCAGAGTCCTATGGATGGAACTGGATTAAAAAACAACATAAAAGTTAAATTAAAGAAATAATGAGAATCAGCCACACATAATTTAAATAAATGGCGAAATTGTAAAATGTGTTGTTTGAGTGTTTACTCAGATTTTCAATGTCAGCTGTGAACTTTACATGTTTTCAGGGGGAAAACATTAATTGTTTGTCCCGTGGTTTAACCATGTTTCCCCATTTGATCATTTCATATTTGTGAAACAGTCCAATGAAATTTGTACAGTTCCAAATTGTTCAGATAAAAAGTGGCACATTCATTAATTAAGGTACTTAATTTAAAGCCGTATTTGTAGGAAGTTGGCTTCTCCTTTGCCACGCTCTCCGCTGTGGGTAATTTTGGTATCCAAGTGCCTGCTGGGGGCAGCTCTTGCTTACCAGCACTTTTAATTCCTTCAGTTTCAGTGGAACGCAGGTGGCTTTAACAGCCACTACCGCTCGCTTCAGTTGGCTCACTTGGTAATGGGACCTGGTTGAACTTAGTGGTGGTGAGTGAGCAAATCTATGATTGGTACCTAGGTTTAGTGTTGAGGGGTGGAATTGGAACAAGGGTTATCAAGTGTCCTGCAGTAAGCAAACCCAAACAAAAGTAGTACTTTGTCCATTTCTGATTTAAGTTTGAACTTGCAATAGAACAGTATAAAGTGAATATATACTCCTGTAAAAGCTCGTGAAGTTGCTCTCAAATGCTGACATGGTTTGATGTCTGTTGCTGGTAACACTGAACAGTTGCATCAGCAAAGCTAGACATTTACATCACCCTAATTTCTTAATCAGTTTAAGTTTATGTATCATGTTCATGTTTTCATCTAGTCAGCGATATAGTTATCCCCTCACAGCTAAATGAACTTCAGCTCGACTTGGCTCCCAGCCAGGCACAAAGGACTAAGGGTTGCAGATTGCAGGAGGCCCCCTAGTTGCTCCTGATTGGCTCTTTACAGTCAACAACCGCCAAATGTCCAGCCATGGCCAACTTT
CTTAGCTGACAAGCTTGTTGACCGTCCAAACACCAGCTGAGTGTCTCTGGTCGCTCAGCTGTGTGGTGAATGAATGAACTCCTCGTGAGCTGTTGAGTGTGTTGCTGGTAATCTGAATGCATGGTAAGATTAAAAATGTGCCGACAAAGGCATCGTTAAGAGAAGGTCTTCGAATAGGTGGCTTTGAGCTGATGTGACTTCTGTTTGTTTTCATTTGCACTTTGTGTGTCTATGCGCGCAAGATTGTGTTTGTGTTTGAAAAGGGCAGTGATGTTGAGTCCAGCATTTTGTACTGAGAGGCAGAGTCAACCGAACTTAGCTGGTTGCAGACTTTTTTTTTTTTTTTTTTTTTTTTTGGTGTACAGCACTTGTTGAACAGTGCTTTCAAAGTGTAAATATGACACATTTGTGATGTCTGTCATTTTCACTTGGAACAGAAATATAAAAAACAACACATAATGAACTAAATGTTGTGTAAAAGTTTGCTACTCTACTTGGTATCAGTGCTTTCTACATATCTCTTATATGTCAAATGTTTCATCCATAACAAAACAAAGGCACTTAGAGACAAATCTTTGTTTTTTAGGATAGTCCAAAAATGTTTACTGGAATGTTGAACTATGTGAAAATATTGCTGTTTTTCAATTATCCAACTCTACATCTCTGATGTCTATTACAATAGGTGTCCAAGCCAAAGCGAGTTTGTTGCATTGTGGTCTTCTAACTAGGTGATTTTTTTATTTATGTCATTGAAGGAAAACCCAAAAGGAAAGACTTCTAAAGAATGGAAATCTAACTGGAAGTGTGGGAGTGTTTGTTCTGTTTATTTGTTTGTTCATTTGATTTACAATTTGTGCTTGTTTCTGAATGCAGGATGGTAACACTCCCCTCAGCCCCATTTTAACTCTCATAGAAACCAAACAATATATAATTTAATAAGAAATTATATATATAAGAAATTCCCCATAGAGCAAAACACCACCATGTGGGGAAGGAATCTTAATTTGCCTTTTATAAGAATAAGCATAATTAAAGTCATCAAACAATCATCAATCTCAGTTTTAGAGTCCTGATTTCCAACTGGTTGGAAACAAGAGAGGCTCCATGGGTAGAAAGTTGGGTAATTGAGATCAGCATTCATGCAGTGCTGTAGACTTCTGCTTTAGTGAAGTGGAGGAAAAAATGAAGAAGAAAGAAAACACCTTAATTACACGTTTGCCTTTTTGTATACTTTATTTCGTGTCATATTGTGTCACCTGCACTGTCACTGAGAATTACAAGGTCCTTGCTTCCATTCCTAGTTGGCACCTTATTGTACAGTCGTTACACTGTTAGTCTGTACAAAACGATCTGACAGTTTTATTTGAGGCAAGTAAATGGATAATTCTGCCTTTTTATTTTGCTAGAAAAATAACTGCCTTGCAGGATGTTCTTACTGTAAACATAAGCTAGTATACTGTTTCTTTGAGTAAGTCTTGAATATACAGAACCAATAGTATTTCAGTCACACTGAGGATATTTTCTAGCTTGTCTTGAGTGTTTAAAACAACCACTGATGGTTAAATCTTGAATCTGACTTCTGTTCCTTAGTGTTCATATTCAAGAGAAAGGAGGCTGTGATAGACCCAATAGCATAAATATTGTTATTATTATTATTTTTTTGTTTGTTTTAAAGACATGGAGGGGAGGGGATATACAGAACCAATGAGAGATTAAGTCATCCAAAATGGCTTCCATGTCTCACACAGTGGCCTGAACAGATCTGTTATGGTGCTGTCTTCTGAAACTGTTGCATGGACAGTTTACAGTATGTGAATCTATGAAAAATGCACTGAAATATTGTTAATTTATTACCCCTGTATAAATATGCCAAAACTAAAATGTGTACAAGGCCTAAATTGACCATCAAATTCACTGCCTTATGTGCTCTAGCTTGAAAAGCTGAGCTTTTATTGATATGCCAAAATTGAAGGATTTTGTTCTTTCTGTATACCTAACAT
AGTGTAACCATGAGAGAACTAAATGTTTGTCTCTTTACTGTTGAAGGTTATGAAGGATGTACAGTATTTTCAGTTGTTGTATAGACTGAATTAAAAAAATGAAATTTTA\n>XM_043813081.1 PREDICTED: Vespula pensylvanica cytochrome P450 9e2-like (LOC122629547), mRNA \nGTTAGTAGTATTGAACCTCTCGCTAGCATAACGTTGAGTAGTTTTCCACTCAGGATCTTTTAATTAATCGAGCACACGATGGAGACTTGGGCAATGATCTTGGCCTTGGTAGCAGTGATAGTCAGCATTTATTACTACGTCTTTAAGGACTTGAGTTACTTCAAAAAAATTGGTATACCGTATTTAGAACCATGGCCGATTGTGGGCAACATGGGCCCAGCAATTTTACGTCTGAAATCGCTGATTAATATAATTAAAGACATTTACAATCTAAATCCGGAAGCCAAATACGTAGGCTTCTTCGATATGGGTAAACCAGTTTTCTTTATTCGCGATCCAGAATTAATCAAAATGATCGCGGTTAAGAGTTTCGATAATTTCCCGGATCACAGAGGTTTCGTCGACGAGGTACAAGAGCCACTGTTCGGAAAGAATTTGTTTTCCTTGAAAGGCAATCGATGGAGAGAAACTAGAACGATGTTGAGTCCGGCGTTTACTTTGCGCAAGCTAAAGGGTATGTTCAAATTGATGAACGAATGCGGAGCAGATTTTACCGATTATCTATCGAAAATGCCGAAGGATAAGAAAACTATAGAAATGAAGGACGTCTTCGCGAGATATACCAACGACGTAATAGCCACTTGTGCATTTGGTATCAGTATTAATTCTATGAAAGATCGGAACAACGATTTCTACGTTCTCGGTAGAAAAGCAACCAATTTCGAAGGTATTCAATTTCTGAAATTCTTCCTTATTCGTTCTTTCCCAAATATTGTAAAATTTTTCAACGTCAAGCTCATATCCGGTAATATCGACAATTTCTTCACGAACGTTGTCAAGGAAGTAATCGACACTAGAGATCAAAATAAGATCGTACGATCAGACATGATACAATTGATGATGGAAGCTAGAGACAAGAGAGTCGAAATGGGACAAGAATTACCTCTGATAGACATAGTAGCTCAAGCGTTTATATTTTTCTTTGGTGGCTTTGACACCGTCTCCACGGCCATGTGCTTCACCTGTCACGAAATTGGTATCAATCTGGATATACAAAAGAGATTGCAGCAAGAGATCGACGAGGTCATTGAGAAGACCAATGGAAATCTAACTTATGATATTATCAACACCATGCAATATTTAGACGCCGTGATACAAGAATCCCTACGGAGATATCCGATCGTTGTCTTTCTTGATAGAGTATGCATCGAAGATTTCGAACTGCCACCAAGTTTACCTGGAAAGAAACCTTTGTTAATAAAAAAAGGCACGAATGTTTGGTTCCCAGTTAGTGCACTCCACTTGGACCTCAAATATTTCGAGGATCCGTACAAATTCGATCCAGAAAGATTTATAAAAAATGGAAAGGAGATCAACAATTCCGGTGTCTATTTGCCCTTCGGATTAGGACCTAGAATGTGCATTGGTAATAGATTCGCTTTGCTGGAGATAAAAGTTTTGATATTTAATTTATTGGCAAGATGTAGTCTGAAGCCATCCATCAAAACCCAAAATCCAATTCGATTATCCAAGAGTGGAATCAACTTGTCGGCTGAAAAAGGTTTTTGGATGGATTTAGAAGAAAGAAGCGATGTTCATCCTGCTCTTAAAAATATTGTCTGTAATAATAATTCTGATACTATTAAACTATGTAGCCATTAATGGAGTTACTATTGATCGTACTGTTAAAACTTAAGATATAGAAATGAAATAATGAAAATAATTTTATGAAGATAAACTTATGTAATGGATATATATATATTTTTTTTTCGTGATCGAAATGATAAAACATC
GAATTTGGATTAAACGTTTACGTATCGTAGTCGGTGCTATTAGGAATTATCCTCTTTTAAATTTCACACAACTATAAAAGCATAACCTCTTGTCATTGAATTACGTATCGTTTTAGAGATTAATACAACTGAAGCTGTTATTTTATTATTATCTTACGATATAAATAACGTATAATTACTA\n>XM_001591429.1 Sclerotinia sclerotiorum 1980 UF-70 predicted protein partial mRNA \nATGGCTAAAGGGCTAAAGCTTATCACAAATGGCGACGATGCAACCACCCTAACTCAAGCACAGCAGGAACAAGCCGCTGAAGAAAGAATTACTTGGCCGGAGATTGGTTGTATTGGGACATCTTAG\n>XM_006974024.3 PREDICTED: Peromyscus maniculatus bairdii hook microtubule tethering protein 1 (Hook1), transcript variant X1, mRNA \nGGTGCCGTGGCACGGGACGGACGCGGTGGGCGAGGGGGGCGGTCGCGCCGCGGCGACGTCGGCGGCGTGAGGCTTCGCGCGTGAGCGGCGCGGGCGCCAGGCCTGACGGCCGAGCTCCGGGTGGCGGGCGCGTAGGTCGTTGACGCGGGCCCGGGCCGGAGGTGCGTCCGTCGCCGAGAGCGCGGCGTCGAGGTTCCCGGACCATGGAGGACCCGCAGCCGCTGCCCCAGCCCGAGCTGCCGCTGTGTGACAGCCTCATCATCTGGCTGCAGACATTCAAGACTGCCTCACCCTGTCAAGATGTCAAACAGCTGACTAATGGAGTGACCATGGCACAAGTTCTTCATCAAATTGACGTAGCCTGGTTCAACGATTCTTGGTTAAGCCGAATTAAAGATGATGTTGGAGACAACTGGAGAATAAAGGCTAGTAACTTAAAGAAGGTCCTCCATGGAATTACAAGTTATTATCATGAGTTTTTGGGGCAGCAGATTTCTGAAGAACTTATCCCTGATTTAAACCAAATAACTGAGTGTTCAGACCCTGTGGAGCTTGGAAGGTTGCTTCAGCTTATTCTAGGCTGTGCAGTCAACTGTGAAAGGAAGCAAGAGCATATTAAAAATATAATGACCCTTGAAGAATCTGTTCAGCATGTGGTCATGACTGCAATTCAGGAGTTGATGAGTAAAGAAATCGTGAGCTCTCCTGCAAGTGACACCATTGGAGAATTAGAGCAGCAGCTTAAAAGGGCATTAGAAGAGCTTCAGGAAGCCACAGCAGAGAAGGAAGAGCTGAAGCAAAGGTGCCAGGAACTGGATATGCAGGTGACTGCACTTCAAGATGAGAAGAACTCACTGGTTTCTGAGAATGAGATGATGAATGAAAAGCTTGACCAGTTGGATGGCTCTTTTGATGATCCAAATACAATGGTTGCGAAAAAGTATTTTCATGCACAGTTACAACTAGAACAATTACAAGAAGAAAACTACAGGCTTGAAGCTGCAAAAGATGATTACCGTGTTCACTGTGAGGAACTTGAAAAGCAGCTGATTGAATTTCAGCACAGAAACGATGAGCTGACGAGCCTTGCTGAGGAAACCAGAGCCCTGAAAGATGAGATAGATGTTCTTAGGGCTACCTCAGACAAAGCAAATAAACTGGAGTCGGCAGTGGAAGTGTATCGTCAGAAGCTACAGGATCTAAATGACCTCCGTAAGCAGGTGAAATCTTTACAGGAGACAAATATGATGTATATGCACAACACCGTGAGCTTGGAAGAGGAGCTGAAGAAGGCCAACGCAGCACGTGCGCAGCTGGAGACCTATAAGCGCCAGGTTCAAGACCTTCACACTAAGCTTTCCTCTGAGTCTAAAAGGGCAGATACACTAGCATTTGAGATGAAACGGCTTGAAGAAAAACATGAAGCTTTACTCAAGGAAAAAGAGAGACTGATAGAACAGCGTGACACTC
TGAAAGAGACGAATGAGGAGCTACGGTGCTCACAGGCACAGCAAGATCACCTAAATCAAGCTGATGCATCTACTACAAAAAGTTATGAGAACCTCGCTGCTGAGATCATGCCAGTGGAATACAGAGAGGTGTTCATTCGACTGCAGCATGAAAACAAAATGCTTCGCCTGCAGCAGGAAGGGACGGAGAATGAACGCATTGAGCAGCTGCAGGAGCAGCTGGAGCAGAAGCACCGCAAGATGAACGAGTTGGAAACTGAACAAAGATTGAGCAAGGAGCGCATTGGAGAATTGCAGCAGCAAATTGAGGACCTCCAGAAATCGTTACAAGAACAGGGCTCCAAGACTGAAGGCGAAAGTTCCAGCAAACTAAAGCAGAAGTTGGAAGCTCATATGGAAAAACTAACAGAAGTCCATGAAGAATTACAGAAGAAACAGGAGCTCATTGAAGACCTTCAGCCAGATATAAGTCAGAACGTCCAAAAGATCAGTGAGCTTGAAGCTGCTCTTCAGAAGAAGGATGAAGACATGAAAGCAATGGAGGAGAGATATAAAATGTACTTAGAGAAAGCCAGAAATGTAATAAAAACTTTAGATCCCAAATTAAATCCAGCATCAGCAGAAATAATGTTACTTAGAAAGCAGCTGGCGGAGAAAGAAAGAAGAATTGAGATTCTAGAGAGTGAATGTAAAGTAGCAAAATTCCGTGATTATGAGGAAAAACTCATTGTTTCTGCCTGGTATAACAAGAGCCTGGCGTTTCAGAAACTGGGCATGGAGTCTCGGCTTGTGAGCGGCACTGGTGCTTGCAAAGACGCTGGTGCGGGGGCGCCTGCACGGTCCTTCTTAGCACAGCAGCGGCACATCACCAGCACCCGGAGAAATCTCTCTGTTAAAGTCCCAGCCGCGGCATCTGACTAGTCCGCAAAGCAAACACGAACAGAAGTGCCTCAAAATGTTTTGTACCCCAAGAAACTACCAGATGGAAAACAAAGGTTAAGATGCTTGGTAGCAGCTAGTTTTGTTTGGATTTTGTTTTGAGATAGGGTCTCCCATCCCCCAAACTGGCACTGAATTGACAGCGTATTCAAGGATGACCTTGCCATCTGATCAGTCCTTCCCTCACTTCCTGCATGCTGGGATTAATAGTTGTGTACCACCATATTGGGTGGATACAGTGCTGGGGATCAAAACTTGCACTTAGGTCAAGCCAGCTACCAACTAGCTACATTCCTAACCTGGGTATCAACTATTTTTATGTCAAAATATATCAAGTTAACATTTAAGTTTACTCTGAAAACAAAATGCAAAATCAGCTCTGTCCCTGGGCAGCACTTTTGAGTAGTTGGAAGTGTGATAAAACAAATATTTGTCTTGAGATGGCATCATGTGTGGGAAAGCAACTGCATATTCCAGCTTTATGCTTTCAGTTGTAACAGCGAGTCAGTTAAGGTAGAAAAGTAATAGTTTGTCATTTAGTAATATATCTAGATTTGCTTTATGGGAAGCAGCCTCCAGTAAGGCATGTAGATAAGAACTGTGCAAAGTAATTTCTTTGACCTGGTGTGTACAAAGCTTTCCTCTACTTGCTAGTTCTGTCCTCAAGAGGATCCTTTGTCATGCTGTGGAATCGATAATGCATGGAAGACTTTACTGTTGGAGTGACTTTGTCCTATAAAAGCGACTGATTGGACATTTGCAGTTTCTCTGAGCTGTATCTCAGTTTGTACATGTACTGCTGTGAATGAAGACTTTGGAGGGCTTGACTGAAATGGTAAGGTGGGAAATAAACTGGTATTTCTAAGAGGTACCTTTCTGTTGGAAAGCAAACTAGAAGAATACATGTTGAAATATCCATATGCTTTTGAGCATGAAATTGTTGTGGCCTTTGTTTTCAAAGAAGGGTATAATTTTGCTTTATTACCTGTAAAGAAACAATGATGAAACAGCTTAGGACCAGTTTGGTTTCTGCTTACCTCTTACGGAGTTTCTGGAGCTGGA
TTTGTGGCATTCAGTTCATTTCTGCCCAGGGTTGTTCTTTTCAGAGATGTTACTTTCTAATTTGGGGTCACTTTTTAAAGTCACACTTTGGAATATTAGTTGTTAAATCAGTATTGATTGATGTAGCCACAAGTGGTTCATTCTTGTGTCAGACACATTTCCAACACTTAGCAGCCACGTTTCCATCATTGTTGAGAGTTCTGGTGTGATGCAGTGTCACGGTAGATCTTGGTTTTGGTAACTTGGGAAAATTCTTTGATCCTTAGACTACAGAAGTGGGAATAATTCATCTCATATCTAGAGAAGAATCAGATGGTGACAAGAATGCAGCAACACAAATGTCGCAGCATTGTGTATACACTGAACGTTAGCAGGCATTCTGTGAGGGAGTGAGCTTGTGGGCTGCATGATCCTTGATTGGTCAGCTCCTCACCACTCCCCTCAGCATGAAAGGAGGGATGCTAATATGTAAACAAAATGGGTGTGAGCCAGATTAAGCTGGCAGGCTGTAGAGCTGTGGTCTACACTTTATTCTTAGTCCTTCATAAATATGAGTATTGTTCTATTTGAAGTGTTAACTCATGTAGATAACTGCCTTTAAATCCTTGCCCAGTAATTTTTTTAACCACTTAACAACACAAGAATTTCACAGTGATTTGGGGTTTTGAGATTAGTGGCATCTGCCAGGATATTTTGTTTTATCAGGGTTCCTTCTGTTGACTACCTCTTAGATTTTTATGCTTTGTGCATTTAAACTGTTGGTTTGCATTTTGGTATGTTCTTATGGTGTCTGCTTGCCTATGTCTTTTAGTGAAATAGGACTTTGGAAAATACTTTAGCATGCTATTTAAAATTTTCTAAAAATTGTGGCATTTGGGTATATTTTTGTTAATGAAGATATTGATGTTAGTGTTTGTATTTGCTTATAATTGAGATTTTACAAGTTCTCTTTTAATGGAACTTACTGTAAAAGATGAACTTCAATAAATTAATGTTTCTAGTGTAATTGCTCATAAATTTCTAAATAACTAATGTAGCATAGATAAGGACATAAGGATAAGTTTTCTTTTCTTAAAGAAAAGGCAGATTTTCTGATTTTTCTAGTTTTAAGTAGAATTTCAAACGTTTGATACATGTTTATACAAAACTATGTAAAGTTCTATATAATTGAGACTAATCACAGAAATTGAGGCAGTGATCAGGGTGATTCTTTCCCTATGTGGTTCATGCAGTGAGATCGGTGCCTGCCACATATAAAGTATACATGTTTCATCTGGAACCATAATTCTACAAATGTGTTACAAGGGAGGACTGAATGTATAAACATGGAATTGACAAAAAAAATTTATGTCCCAGTGATTATAAAGTTAGAAACAATTTTGAATTTCAAGTGGTTGTCCTTGGATTGATATTCCTTTCTCTTTTTGGATATAATTATGACCAATTGTTTATCTTGGAAATTAACTTAATGTATTGAAAAATATTTGAAGTTTATTCTATTTTTTCCCGTGATTAAAACTAATGATTTAATGTAAGTTAAAAATACCTTGCCTAGCATCCTTTAGCAGAGTATCCCTTAGTAAGATCTGGTAGATTGTTGATGACTAGATGTTAAACACTTCAAAAACACACCTACTTTTGTGTAATGTACATCTGGCCTTTGGGAATGATGGTGATTTAGGCCAGAGTAGTGTCACTTTGTGTAAAAATAAATGTATATGGCTCGTTATACATACAGTCTTATTGTGATCTTGTTTATTGCACAGAAATTGGACACTTATAAAGCACAAATCATCAGAGGAAATAGTGTGTAGTTTATTGAATTTGAGGAAGTCTCAGTACAGTGTTTAGTTTATAAAAAGGTCCTTTCTATTTTCTATGACAAATACTGTCACACTTGAAAAATAGATGCAATACTTGATTTATTTTTGTAAGTATTTAGAATATTATTTTAAATAAATGATTGTCAATATAATTGTGAAATGTTTTGAGTAAATAAA
CTTCTGCTTCTGTA\n>XR_008312440.1 PREDICTED: Hemicordylus capensis uncharacterized LOC128337805 (LOC128337805), ncRNA \nCGGAGGGTGGCGGACCGCCAGAAGGGTGGCAGAGGCCGAAGGAGATGCAAGAGAAATGGATTGGGAAGGGCAGGATCATCAGAGGACCAACATCTCCCCAGCATAAAGACACTATCGTGGAAATGCAGAATGCATCGGACAAGTACCTAGGCATGCTGCTGACCACCTGTTGGATGCTCACCATGTCCAGCGAAGGGCCATCACACGCCAGACCATTGCGCCAGCTCCCTGCGCTGGTTGGAGCCGCTTCTGGGAGTTCAACGGCCTCCTTCCTCCCACTTCTGGCTGGAGATTCTTCTGGCTGGCAGCAGCACCCTGAAGCCAACACGAGGCTTCTTCCCATCTTGCACTTTGTCCAGGTGGCACCAGCAGCAGCAGCAGCAGCAGCAGCAGCACCAATATTTATATACCGCTTTTCAACAAAAGAGAACAAAGCGGTTTACTATCTATCTATCTATCTATCTATCTATCTATCTATCTATCATATTTCTATGCCGCCTAATATGTACATCTCTAGGCTGTTTACACAGAGAAATAATAAATAAATGAATGAATAATTGA\n>XM_024685516.1 PREDICTED: Selaginella moellendorffii transcription factor TCP20-like (LOC112350051), mRNA \nATGGGATCTAGTAGCGAGGTCTCGGAGGACATCGAGTGGCACTCCCCGGGAGGAGTGCCAGCGGCGGCTGCGCCATCGCCAGCCCCGCCGGAGGAGGCGAAATTGATCGCGCCCATCAAAGGCAAGCGGAGCTGCGGGATCAGGAAGAGGAATTCGAGCGTGAAAAATCGCAAGGCTGAAGTGGTGGAGGAGGAGCCGGAGGAGAAGAAGTTGAAGAAGGCGGCGCCAAAGCGGAGCTCGACCAGGGATCGCCACACCAAGGTGGAGGGGCGGGGGCGGAGAATCAGGATGCCGGCGGCGTGCGCCGCCAGGATCTTCCAGCTCACGCGGGAGCTGGGCAATAAGTCTGAGGGCGAGACCATCGAGTGGCTGCTCAAGCAGGCGGAACCTTCGATCATCAAGGCCACGGGCACAGGTACCATCCCGGCGCTCGCCTTCTCAGTGGCGGCGCCGCTGGCCCTCCGCCAGGCCGCCGCCAATTACGTCTCGCCGATCGCCGTCGCCACCCGCTCCAGCCTGCCGCTGGATTTCGCGGCGCCGCGAGTGGACAACGCTAACGCCACCACCACCACCACCACCACCACCACCACTATCACCACCGAGGGTGGCGGCGGTGGTGGCGGTGGCGGCGATGAGAACTCCAACGAGAGCCATCGAAGGTACGAGTTCCAAGAGAATGGGGACAGTGGATCCATCGGAGACGATCATGGAGAGGGGAACGCCAAGAACTTGCTCACTAGCTTGAAAGATGATCCACGATCTCTCCAATCCAAGCAACAGCAAGCTCTCGACGACCACCACCAGCATGACCAAGAAGAACTCGCGATCCATCACCAGCAGCAGCAAATCTCTTGGCCCGTGCCAAACCTGTGGATGCTGCCAGTTCCATCTATGGGTGATCACTCGTGGGCATACACCACTTCGACTTCGTGTCCCTCGAGCTTCTCATCGTCGGCGGCGATGATCCAGCAGCAGCTCCAGCGGATGAATGCGAGCAGCCTGATCGAGCTGGGGCCTCTGGGATCGATGCTGGCGATGCAGCATCACCCGGATCTTTGCGCCCCTGGCAGCGATAACTTCAACCTCTTTGCCGCGACGTACCACCACCATCTCCAACGCCAAACATATGATCCTCACGTTACTTCACGAGACGATAGCGGCTAG\n>XM_053129038.1 Zychaea mexicana 
uncharacterized protein (BDB00DRAFT_931432), partial mRNA \nTGCCACGATGGCCCTGGTATCCTCACAGGCTGTTACCAGAAGTGTCATCGCCATGTTAGTCCAGCCATCGAGGAAACCATCCACCCAGATATCCGGACTGCACCTCATCGACTGACTCCCACGAGCACCGTGACCGCACCATCAGCAGAGCCTGCAGATGTTTTTCCGTTTGGTTATGATATTGGGAATAGCCGCCGTGCGCAACGAGAGCGCACCCAGAACGCAAGCAAACGAAACGCAAAGGCGCAACGCACACCACAGAGGAATACCAAAGATGGCGGAAGAAAAGAAAGGGGGGCCGGAACGGAAGGCAGATACGGAACATACTGAATAGATCTTGGTGAAACACCGATCAGCTATGCTCAGGAAGAAGTTGTCATTATTGGGATCACGTAATTCAC\n>XM_050140454.1 PREDICTED: Microtus fortis uncharacterized LOC126500504 (LOC126500504), mRNA \nCTCGGATCCCCCGCACTCCCGGAAGAGAATGTCCACCGCTCCTGCGGGAGAGGAAGGCGAGTTTTGCAGCCATGCTCCGCAGAGTGGCCCGGACCGTGGTCCCAGGGCTCAAGGTGCCCTGGGCGCGGTGGTCTAGGAACTGGGCGGGGGTCCCAGACCAGGTGGTAGACCTGCGCAGCGACACGGTGACCCGGCCAGGGCCGGCCATGAGGCGCGCCATGGCCGAGGCGGTCGTGGGAGACGACGATTACGGCGAAGACCCTACGGTCCTCGAACTGCAGGAGAAGGCTGCAAAGCTGCTTGGGGTGGAGCAGACCCTGTTTGTGCCAACCAACACCATGGCCAACCTCATCTCTGTGATGGGTCACTGCCGGCGCCGGGGTTCCCAGGTCCTCCTTGGGCAGGAATGCCACCTCCACATCTATGAGCAGGGCGGGGTGGCTCAGATCGCCGGGGTGCATTCCCAGCCCCTCCCAGACATGCCCCATGGCACCTTGGACCTGAACGAGCTGGAGAGGGCACTCTCTCGGGGTTTCAGGAACTCCTACCATCCTGTCTGTGAGCTTGTGTGTCTGGAGAACACACACAGCAGCGCAGGGGGCCGGGTCCTTCCCATCCACTACCTCCGCCAGGTGCGCCTCCTGGCCCACGCCTACGGAGCACGGGTCCACCTGGATGGGGCGCGGCTGATGAATGCAGCTGTGGCTCTGCGTGTGCCTCCCGCCCACCTCGTGGAGCACTGTGACTCCGTATCCTTCTGCTTCTCTAAGGGTCTTGGTGCACCAGTCGGGGCGCTGGTCGGTGGAGCCAAAGGCTTCATTGAGGAAGCCTGGCGCCTCCGCAAAGCCCTGGGTGGAGGCATGCGCCAGGCTGGAGTACTGGCTGCGGCTGCCATGGTGGGACTGGCTGAGGCAGAGGAGGTGCTGCCAAGAGATCATGAGAATGCCCGGAGATTCGCTAAAGGACTCCGGGACCTGGCATCACCCATTTGCTCCGTGGATCCCGACACTGTGGAGACCAACATGGTGCTGGTGCAGGTGGCGGGGCGGCCTCCTGCAGAACTGTGCCAGCGCCTACAGGCTGTGAGCGCCGAGGAGGTGGCTCAGACTGGCCGCGCTGTGAGCGTGCTGCTCTTTCCCTGGACAGAACACTCCGTGCGGGCCGTGTGGCACCGGGATGTGTCTGCTCAGGACACGGAACTGGCGCTGAGGAAATGGGAATTTGTGCTGAGGCAGTTGAGGCCCTGAGATCAGGGGACCAGGAGCCCTGTGCCCTGGCTAGGATTGAAGTGTAGAGTAAGCTGGTCCAAGCCATTAGCCTAGTGGAGGCCCGCCCTTCTGGGGGATGACGACACCATTCCGGCCTCTGAATTCCTCCACTGACACTCATGTGATGGCCTCATTCAATCAGGAACAACCAGGCACGGGCTGGGATAAGAAGGG
GCTGAATATCAAGAGAAGGGAATGAATTCAGGAAGCAGACCTGGGGCTGGGACGTGCAGCGTGACTGCCTGGTGTGTGTAAGCCCCGGGTCTAGTCCCAGCACTGTATAAACAGGTGTGTTGACTCACACCTGTAATCTTAGCAAGCTGAGAAATTAGAAGTTCAAGGTTGGGCTGGAGAGATGGCTCAGGGGTTGAGAGCACTGGCTGCTCTTCCAGAGTTCGATTCCCAGCAACCACATGGTGGCTCACCACCATTTGTAATGAGATCTGGTGCCCTCTTCTGGCCTGCAGCCATACATGCAGGCAGAGCACTGTATAGATAATAAATATTTTTTTTTAAAAAGTTCAGTCATTCTCAGATACAGAGTTTGATTCAACCCTGGGCTACATGAGACCCTATCTGCAAACAAACAGATCCTGTGTGACTGGCATAGTTATTAGAGATGGACTGTAAAATAATAATGTGGGATTTCCTTCTGTGTGCTGTGATTACCATTAATGAATAAACTGCTTTGGGCCTGTTGATAGAGCAGAACTTAGATAGGCGGGGAAAACTAAATGGAATGCTGGGAGGAAGAAGGCGGAGTCAGGGAGCCGCCATGGAGCAGCCAGAGTCAGACATGCCAAAACTGCTGATAAGCCACTGCCACGTGGTGATACACAGATTAATAGAAATGGGTTAAATGAAGAGGTAAGAGTTAGCCAGTAAGAAGCTAGAGCTAATGGGCCAAGCAGTGTTATAATTAATATAGTTTCTGTGTGGTTATTTTGGTTCTGGGCAGCCAGGATGAACAAGTGACCCTTCCCCCAATAAAGTATTGAAGGAGCTGTATTTGTACTTTTAT\n>XM_025755560.1 PREDICTED: Arachis hypogaea protein LURP-one-related 10 (LOC112703951), mRNA \nTGCATGAAAAATATGAGAACCAACTACTTCATCTCCTATATATGATAGTGTTCTTACTTCTTACAACTGAAAAAGGAAACTCTTATCAATTAATTTGTGAAGTAATGGAGGCAAGTGCACCTGATTTTGCATTGGCACATGGGTTCCCCATGAATATGATAAGTGTAGTAGATGATAAGTTCTATGTTGCAAACCCAACAGAAATGATTGTGAAGAAGAAATACAATGGATTGTTGTTGAAGCAACGTTACAAAGTGAAAGATGTTAATGGGAAACTCTTGCTTCAAGTTGATGGGCCAAGCTTAAGCATCCACAAAAAGAGGGTTATGCGTGATGCTCAAGGTTCACCAATCCTCATAATGCAAGAGAAGGTTAAAATGGTATCGCTCCGGCACAGGTGGACGGTTCATAGAGGGAAAAGCTCAGATGATAAGAATGTGATATTTGGGGTGAAAAGGTCACACCCAATGGACATGAAACCACGGCTTGATGTGTTCATGCCTGGTAATACTGATGAAGATGTAAGCAACTTTCAAGTTGTTGGTAGCCACATTCAAAAATCTTGCACTATTTACAAAGGTGACACCATCATTGCTCAGGTAAGTGATGTGTTCCCAAGCAGAAACTTCAGCAAATGGAAAGAAAGCTATAAAGTGAAGATTAATGAAGGGGTGGATTATGCTTTCGTCATGGCATTACTTGTAATATTAACCGTAAATGACTACATTTGAATTTGGTTTCCCTCAACATTAAATCAATAATAATAATAAGAAGTAGGAGTGGGAATATGTACCTTACCTGCAGGTACCCAATCCGATCTTACCTGATCGGGTAGGGTTGTCAACCCAATCCGCAGCGGGTAGGGTAGAGTGCGGGTAGGATTTTCATGTAGGTCGGATAGAGTGCGGGTTGAACTTCAATCCTACCCGACCAACCCGCACCCTATATATGTATATGTTATATACTTATATAAAAATATGTTCTAAGTGGATGTTGAA\n>XR_004838883.1 PREDICTED: Vespa mandarinia 
uncharacterized LOC118444101 (LOC118444101), transcript variant X2, misc_RNA \nGATTTATATTTAATTTAAAAAATTTTTTTTCTTCAATAGTTCCTAAATAAAAAATTATTTCTTATTTTCAAAATCAAAAATGATAGTTCCTAAATATCTATTTTAATAGTAATAAAGTACTTCAATGGCAAAAGTTCGTAAGTCCATATTCTAAATTATATCAATCTTTAAATTAATTTTATGAAGAATTAATATTAATAGTACAATATGAATATTATAACAGAGGATGATAAATTTGTCCCATTACATTTTGTATTTTGTAATTTTTATGGTGAAGATACATGTTTTTGTTGGAACGATGATAAATTTGTTATGTTTCCATACATACAAGAAAAATATACATCTTTGCTGCCAGTTTTGATTGCACCGAGGCAAATAAAAACTATACAATGTTTTTCCAATAGAGTTTTCTTTACATGTTTACCCCATGGTGTATATAAACTTTCAAGAGATAGAAGATTCAGTGTATTAAGTAAAAGTGCTATAAGTGTTGGTTCCATATTTTTTGAGATACTTAAGACAAAGGATGATCACTTATATTTGGAAAATAAACAGAACAAATCGAGTAAGATATTACTCCATTTGCCACTCATGTCAAAACAACTAGAAGAATTATGTACTTTTCCTTTGAACATGGAAAATTCAGAACATGAATTTAGAAACATATTACTAGATGAAATTGATATGGTAGATAATTTATGTTTGATTGGTAATGGTAAAAAGTTATTTACTTTAACAAAAGAAGTAATTCATTTAATTCATAGTTTTGATAATAAAATAATAAACATTGTACCTATACAAAATGACAAAAAGATTAATGGATTAGTACTTATAACAAATACAGATGCAATTATCATTGTGCATTCAAAAAATAATATATTACGCTATAAAAAACTTTATCTAGGAGTAAATGTTAAAACCCTTTGCGCAGGACTTAATCATCAATGTAGCGATAAAATATGGATTGTTTATTCCGATGAATCCAAATTGTATTACATGATAATGACACTTTCTACCGAAATATATAAGAAAGTAAAAATAGAAGAAAAAAATTTTATTTGCCTGCAATATTATGAAAAAGATAAATTTGTAGGTCTAACTAAAACAAAAGAACTTCATGAATTATCCATTAATACAATAGAAAATTGTGTAAATGAAGAAATTTCCAAAGATGATTTTATAAATCTTCATAAAGATATGTTAAAAGGTACAGATTTAATTGTTGAACAAATCTATGAAAGAGCAAAAGAATTAGAATTGTGGAATAAAATACTTCTTACTGAAGAAGATAAACTTTATAGAATAAATCTTTATGCTTGCAGAAAGAAAATACAAATGTATCCTAAAATGACAGTATATAGAATAGCAAAACAATTATTTCTTAATATAGATTTTCAAGAAAATTTACCAAAAAATGTTTATATTGTTTGTTTCTTAGTATCCAATCATGAAACAACTTTCTCTATCAAAGAAATAGTAAATAATGAAACTTCAATCGATTTACCTATAGTAACAAAAAAATTATTTAATTCTTTACAAATCAGAATGGATTTAGTAACAATCATAAACGTAGAACAACCATGGTTTCTTATAAAAGATTTTGTAACAGATCCAGTTATAGAGAAGAAAAAGAAACAAAAAGAAATGCAAATTAAGAGAGATAAAACAAATTTTATAAATGCTAAAATAAATCTTATAAGGAATTTAATGTTGACAAAAAACTTAACTATGAAGAAATTATCAGAGATGAAAAAGAAGATAAGAAAAGAAATATGTGACTTTTAATTTAATAATGTAAGCAATCATTTCATAACATAAAATGTCTTATGTTATTACTATCACAATTTTTTAAAAAAGTTTATAAAATCGTTTATGTAATTAAGAACTGGGCATTTCTATTATACTTCCAATACTGCAACTG
GAACTCTTTGGTTGTTTCACAGAATTTCTAAAACTATTTTGTATTCTGGGACCACCAAGTCGATCTTGAAGTGTATCTAATGATTTAGCACTTTTCTTCGAACCATTAGCACTACGATCTTCTTGTTCATCGTTTTTATTGGAACGACGTTGTAGAATTTTGGTAACACAGACTTTAAAGTTTTCTGAGAATATACCATAAAGAATAGGATTGACCACTGTATTCAATTGAGCTGTAATAAGTGCCCAAATGAAATGATGCGATCTCATGAAAAAATCAGTTTGTTTAGGTGGTCTCTGAGCATCAATGAAAAGCAAGAGAGCGATGATCGTTATTGGCAACCACATGACTAAAACGGCAACTACGTTTAATAATAAAATCCGCATGACACGTATATGCTTGTGAAGACGGACTTCCTCGTGTTGTGACATACTACCAGTTCTACCAGTACGTTCTATAACTGATGATGTAGATAATTTTCTTCCAACCCATGGTATTAATGATCCTACCACCGATAATTCCGAATCTCTTCTGTTTCCTTTACCAGTTGTTAAGTCCTATAAGATATAAAATTTATCAAATTAAATTAAAAAGATTTAGCAA\n>XM_033905725.1 PREDICTED: Pecten maximus uncharacterized LOC117343383 (LOC117343383), mRNA \nTACCGCCAGAGGGCAGTATGTCTCGCATTACTTCCGGATAGTTCAGTAAACAATGGCGGACCGTAGCAACAGTATAAACAAAGAGAATGAAGACGTGAACCTGCAGACAATTGATCGGCTTACTGTTCAAGAATTGAAGAGTTTTTTGCGCCAGCATGACCAGCCAGTTAGTGGACGATCAACTGAATTAAAGGAACGTGCGAAAGGTGTGTTGAAACTTGGTATCAGACGGAAAGATATACTACAGCGGGAAGATGAAAGACAATCCACTCTCTACCAAGCCCGTAAGTTCGTGTCCCCTCTTGGCGAAATTTTACCCCACCCATCCACATTGAAGAACTGGACCGACAATGCTAGGCAGATACCTGTGTTTCTAGAAGATGCCTTATATAATTACCTTGTTCTGAACAGACAGCGGACGTTTGATAATGCTCCAATGGGTGCTGTTAAACAACTTAAAGCAAAGGTCTTCTATGAAGATAGTCATGTTCACCATATACGATACAGCCCTATCACAGACCTCTGTTCTCACTGTTATGTATCATGTAAAGTGGTACCATCCATGCCAACGGCAGATGTGAACAAGTCTCCTGACTACAGTGTTTGGATATGTATATCGAAGCAGACTGGACAAGTGCATGCAGCTGATTGTAACTGTCCTGCAGGAAATGGAGAATCGTGCAACCATGTGGCAAGTCTTCTGTATGGCCTTGTTGACATCACAGAGAAGAAGCAGTCTGGGGAATTAGCGCCAACCGCTGAACCCTGTAAATGGAGCCAGCCAAGAAAGAGGAAATTGTCCCCCAAAAAGGCAGAACAGATGAAATTTCGAAAATACACAAATACTGGTAATGCTGATAAATCAGACTACACATTATTCCGACCATCTGGAGTTCAGCCACCATTGGATAGGAATTCGTTCCTAGCAGAGATGAAGGAAGTCTTGCCAAATGCAGGGTACATGAAGCTGTTTCCAAAACAGAAAGCTCCAGAACATGTCTTACAAGAGTGTTGTTTACCAGAACCAAAATTTAATTTTCATAATAGTGTAGACTTGTCTTCAAGTGCTTGTCAGATTGAGTTTGATAACTATGTACAGGATTTGATAGACAATAGTGCATGTACAGATACTATTGAGGGATTGACCAAAGGACAGAGTACAAATGATGTCTGGCTGAAAGCAAGAATAGGGCGGATCACAGCATCGCGTTTCGGGGTAGTGTGTCGCAGGAAACAAGATGTAAATCCAAACAGTCTGGTAAAATCTGTAATGGGTTATTACTCTGATAAAACCAACGATG
GAATGGAATGGGGGATTAATCATGAAAGAACAGCCAATCTGGAATATATTCAGAAGATGAGAAGCAATGGTCATAGCTCAATAACTGTGCAAGAGAGTGGACTGTGTGTTATGGTAGATCATCCATATATAGGTGCTAGTCCTGATGGTTTTGTTTCATGTGGTGACTGTGAAGACAGTAAAGGACTGGAAATCAAATGTCCTTTCAAATATCGAGACTTTTTCTCCAAAACATGCTGCTACACATAA\n>XM_034976728.1 PREDICTED: Maniola hyperantus cytochrome c oxidase assembly factor 6 homolog (LOC117989378), mRNA \nAGACATTTGTCAAATACGAAATATCCGTCCTACAATTTTCTGCGAGGTTATATTTTGCTCTCAAGATAAAAAATCGCTAATTTCATTATCTAAATCGAAAGCTTCATCAAGATTTGATCTTTGAAACAAGTACATAGGCTCAAAGATGTCATTTCCTGATAAACAACAACGAAAGATTTGTTGGGATTCTAGAGACCGTTACTGGGAATGTTTAGACGATCAAAGTATAAAAGACAATTCGCTAAAGCCTAAAGTATGCGCGGAGCTTAGGAGAATATTTGAAAAGTCGTGCCCCCCCAAATGGGTGACCCATTTCGATAGGAAGCGAGACTATGAAATATTTAAACAAAAAATGCAAAAAGAGGGTTTTGACCCTATTAAAGACAGTAAATAATTACTCTAAGTAATTTATTTAATTGTGATTGTAAATATAGTTTATTTATTTAGTGAAGTAAATTGTTTTTATTT\n>XM_046179821.1 Filobasidium floriforme uncharacterized protein (HD553DRAFT_310221), mRNA \nGCGAGCTACGTATACATCAACCGGTAAACGTAGCTGTCGAACAGGCCACGTTAAGGACTTCCATTAGGACCGAGAAATGCAACTGACCGACGACCGACCTACCCGGGTCAACCGATATTCGGCTCCCCCCTTCTTCCCTGTACCGGCACTCCTGCTCGTCCTCATACCTTTCCAACTCTTCGTACACTTCTCTTCGCACTCGATAGCCGCCTACGTCAAGGATACAGTCGAGGGTCTTCTCGGGAAGGGGTTCGTTGCTGCGAGTTTCAAGTTTCTGCTCGGAGCCGTAAGCACCTCTTGCCCGTCGTCCACCGCATTTCGCCGTCTTTACAACTTACCGGACTCGACCTTGTTTATCGAAGCACGGAGCGGAAGCCTCGTACATGCTATCCCAATGCATCAAGTATCACTGCCCAGCGGATGTTGGTGCCAAGTACGTCGTGACCACCCTCTTGTTCGGGTTTGTGGGGATACAACAGTTCAATCGGCAAGCGAGGATAGCGGAGAAGGGGAAATCCAAGGGTCTTTGATGAGGGAGACGCTTCTATACCGGGCTTGTGGCCGTACAAGAGATGTCGAGATTAGGATGATCAGAGATGGACGAGATGATAGTCCAGCTGGCGATCGCGATAGCTGTTCAGCTAGCTAAAGGCGACCTGGGTAGTCTTGACCATAACCGTGCGTTTTGCGGGTATGCGAGCCGACAGTATCAGCGGGAGGGATCGGAGACCATGACAACAGATGACGGAGAAGTTGGGCATGGTCATCGGGCTTCTCTTCATGTTGTCATACTTTTACATCTACTCTAGGCGAAATACAACTCGTGACA\n>XM_009314119.1 Trypanosoma grayi hypothetical protein partial mRNA 
\nATGCCCTCAACGGGTTCCGGCTACACCTTTGAGGACTTCCTCAAGCGGATGGAGCGCAGCCCCACGTCACATATGTCGCCACTCTACCACGAGCATCGGGAACTATTCGTTGGCCGCCCCGACATGTTCACTCGCGCTATTAGCTCCGTTTCGTGGGAGAAGGGGTGTGCGTTGGTCGACGCCGCCTACCACTCGCAGCCCATCGCAGTCGACACGTACCGTGCCCTGCTGGCCCGCATGTTGCTGCACAATCGCCATGTACAGCGCAGCGGTGCCGGTAGCCTTGTTATGTGGAAGGCGGCCTTCCGCACATACTCGGAGGCCATCCTTTCCCACGGAAATGCTGTTCCCACACGCATGACTTTATCCACGCTGCGCTTGCTTGCTCCGCACCGCCAGTGGGAAGCCGCCGTGTCTTTACTGAAGCTCAGCCAGGCGAACGAGAAGCTGACACTTCCGATGCTTGTTGACGCCGCTCGTTGCTCAGCGACGCCAGCGACGTGGCCTATGGCATTGGACTTTCTCAGCATGGTGCATGCGCAGGCACCCAACATGCTCGCTGATAGCATACAGAGTCTGCGGCCGCTTGGTACAAGCGCCGCAACAGTATCTGCTGCTGCGAATGCGATGCTGGTGGACAACAGCAAGGGGCCGACGGCAGAACAGAGACACGTTTTGTCGGTGCTTAACGATGTGGTAGCGGCTGTGCCATGGAAAACGGCACTGTCGAACGAGATGTGTGTGTCCTACCTCACGTATCTTGCCGCGAGTACGACGTACCCATCGCAGGAAAAGACTGTTGCGCTCACAGCCGTGTTGCGGCAGTACCCGTGGGAGGCATTCAAGCAGCTGATGATGAGGCAGAGTGTTGTGCTGCCGGCGGTCTCTGGTGAGGCCACTTCGCCGCCAATCCCGGAGGACAAGAAACTGCTGCATCAGCAACAGGAGTATAAACTGGAGGCTTCACCACTGAACTACCCCGCAGTTCAAGAAAGCCTGCTGCTGCTTAAAAGTGAACCCGAGACAGCGGTGCCATTTATTGCAGCTATCGTTGAGAAACTTCCTTCCGCCGAGGTCTCCGCCTCGTTTCTTCACGAGACGGCCGACATACATCGCGACACTAGGGTTGCCGCTGCGCTGCGCCACCCCTTGGTGGTGAGTGCCCTGCTGCGAAAATGCGCGGAACATAATGAATGGCGTCTCGCGTCCTCGGTAATGCTGTCGATGTCCCCAAGCACGATTCCATGCGACGTAGCCAGCACGCTCGTGCTGCAGATGCGGGCTGCTAAACAGGCATCCCTGGTGGTGGAGATACTACAAAAGTGCATTGTGCCCTCAAGGACCATGCTGACGCAAGAAGCAATGGAGGCGGTGCTCCTGTGTGTGCTCGCACATAATCGCGCCATAACCGAAACCGCATCACTCACATTCCCCAAGACGCGAAATACGAACACCACGGCAGTGATACACTGGCGCTCTGCGTTGAGTTGGGCGGTGGACTTGCTGCAGGACGACACGGAGGGACGCATTGTGGAGACAGGCTCCGCTCCCTCCAAGGGCGCCGTGAGACACACGCATACCAAGGTGATTCCACGCCTAAAGCCCATGTCTTCTCGCATACTCAGTCTTCTTATTCACATTTGTGTGAACGCCGGTAGTCCGCAAGGAGCATTGCAGGCAATGGGATATGCTCGCACTGTCAACAAGACGGAGTTGGCCATGTCAGATGAGATCCAAGCGCTTCTGTACTGCATGCTGTACGACCG\n>XM_020925385.1 PREDICTED: Boleophthalmus pectinirostris protocadherin beta-15-like (LOC110160707), mRNA 
\nATGATGGAGATTAAAAGGCCATTTGCAGTGGGAATCAGCGCGTGGATCGTTTTGTGTTCGGCTCTACTGCTGCTTTTTGGACAGTCCGTTTTGGCTCAGATCAGATACTCTGTTCCGGAGGAGGTGAAGGACGGGACTGTGGTTGGAAATGTGGCAAAGGATCTTGGTCTTGATGTTGCCTCTTTGGGTGAGAGACGGTTCCGTATTTCTGAAACAAAGGACACTATATTTGCTGTAAACTCTGATAATGGCGCTTTGTACGTCCACGGGCGCATTGACAGAGAGCAGCTGTGTCAGGGCAGCGGTACGTGTCTGATGGAGCTGAAGGTTCTGGTGGAAAACCCTTTGGAAGTTCACTATGTTGTTGTAGAAATCACCGATGTAAACGACCACGCGCCCACCTTTCCCAAAAGAAATGAAACCATAGAAATAGCGGAACATACCTTATCTGGAAAACGATTTCAGCTGCACTCTGCTCATGATCCTGACGCAGGGATGAACTCAGTCCGCACGTACAGTTTGTCTGCTAATGAACATTTTGACATTAATATTCGCGAAACTAATGGTGAAAAAATACCATTTCTAGTTTTGAAAAAAATGCTGGACAGAGAAAAAAGCAGTGAACATTCTTTAGTGGTCACAGCGGTTGATGGAGGTAAACCCCAGAGGTCAGGCACACTTAATGTTACCATTATTGTTCTTGATACTAATGATAATAGACCAGTTTTTAGTCAAGAGATTTATGAAATTACAGCGAAAGAAAATCTACAAACAGGCACGTCAATTTTTAAGCTCACAGCTACAGACCCAGACGAAGGAACAAACGGAGAAATTGATTATAGTCTGGCAAAAATATTAAAGCAAAGAATCTATGATATTTTTGAATTAGACACGAAAACAGGAGACATTGTTGTAAAGGGGCACATCGATTACGAAGAAAATGATTTCTATGAATTGGAAGTGCAAGCGTCAGATAAAGGCACACCTCCATTAACAGGTGAATGTAGAGTTATTATAAAAATCATAGATGTAAATGATAATTCTCCAGAAATAGACGTGACTTCTCTGTCAAACACAGTGTCTGAAGACTCCAAACCAGGGACAGTAGTTTCTCTCATTCGCGTCAAAGACAAAGACTCTGGTGTCAATGGTAAAATCATCGCTCACATAACAAACAACGTGCCTTTTGAACTCAAACCCTCGTATAAAGAAAACACATATTCAGTTGTCACTAAGGATTTCCTGGACAGGGAGGAGGTGTCACATTATGACATAACTATAAAAGCCACTGACTGTGGGGAGCCTCCTTTATCCACCACTAAAACTCTGAGTATTCAGATATTAGATGTAAACGACAACAGTCCACAGTTTGAACAAAATCCTCTGTACTTTTATATTGTAGAAAATAACGTGGCAGGGACGTCACTGTTCTCTGTAACTGCATCAGACAAAGACAAGAATGAAAACGCAGATATTTCCTACAGCATTGCGCGTGCAGGACAGGAGAAGGACGTGACGCTCTTTTTAAACGTGAACGCGGAAAATGGTCAAATCACTGCTCTGAAAAGCTTTGACTTTGAGACATTAAAGTCTTTCCAGTTTCAAGTCGTGGCCTCAGACTCTGGGACTCCGTCACTGAGCAGCAACGCGACAGTGCACGTGTTCATCCTGGATCAGAACGACAACGCTCCAGTCATTCTGTATCCAGTCAGGTCTAATGGTTCTGCTGAAGGAGTGGAGGAGATCCCCCGCAATGTGAACGCGGGACACTTGGTGACTAAAGTCAGGGCCTATGACTCTGATATCGGATATAACGGCTGGCTGCTGTTTTCACTGCAGGAAGTGACTGACCACAGTCTGTTTGGGTTGGACCGCTACACAGGACAGATCAGGACACTTCGCTCGTTCACAGAGACAGACGAGGCCGAGCACAAACTCGTCATACTGGTCAAAGACAATGGCAACGTGTCCCTGTCAGCTACAGCTACTGTGCTCGTG
AAAGTGGTGGAGCCCAGAGAGGCTTTTGCAGCTTCTGACGTTAAGAGCTCCTCTAAAGACTCTGAGGACACTAACGTGACTTTTTACCTGATGATAACTCTGGCCTCGGTCTCAGCTCTGTTCATTCTCAGTATCATTGTGCTGATTGCAATGCAGTGCTCCAAGTCCAGCACTGACTACACCTCCAAGTACTTACAGGACACAAACTATGACGGGACTCTGTGCCACAGCATCCAGTACAGATCTGGAGACAAGCGCTACATGTTAGTTGGACCCAGAATGAGCGTAGGATCCACTATAGTCCCAGGGAGCCAAGCCAACACACTGGTGCTGCCTGACAGGAGGAGGCCCTCTGAGGAGGACACAAACTATGACGGGACTCTGTGCCACAGCATCCAGTACAGATCTGGAGACAAGCGCTACATGTTAGTTGGACCCAGAATGAGCGTAGGATCCACTATAGTCCCAGGGAGCCAAGCCAACACACTGGTGCTGCCTGACAGGAGGAGGCCCTCTGAAGAGGTAAAGAGACAAGCGCTACATGTTAGTTGGACCCAGAATGAGCGTAGGATCCACTATAGTCCCAGGGAGCCAAGCCAACACACTGGTGCTGCCTGA\n>XM_042877628.1 PREDICTED: Lagopus leucura von Willebrand factor D and EGF domain-containing protein-like (LOC122183568), transcript variant X25, mRNA \nTTGCTCAGTCCAAATGCCAGGAGGCAGTGCTAAGATACAAATTTTTAACTTATTTAACTGTTGGAAGAGTTGGGTATCACCTACATGGCTAATGTGATATCCCTAGCTAGGGATGGTGAAGTCCAGGTTCACTGGGAAGATAGTAGTAAGCCCTTAAGTAGCAAACTGTTGCTGGGCTTCAATACAATCACATCTGATAGGAAAATCAGAGCAAAGATACAGGCCCTCCCCATGTTTTGCTGGAGCAAGACTCTGCAGTGGCTTTCTGCCTGTATTTCTGAGGACTTCTTGATAAACTAATGATGATTTTCACCGTGTTACCACAGTGGTCAGCGTTGCATTGTGTCTGACAACAGTATGCTGATAGCTCAGCTGGCAGGAGTTTTGCAAGAGATCAAGGTGCAAGGTAACAACCAGGCACTCCACATAGGAAGCAACCCAGCTGGAAATGTAAGATAATATCCAAAATAATTAAAAGCTCCTCACACTATATTTCCTGCTCGCATTCTGTCTCCAAGACATCTTCCACGGGAGCAATTCAGCTCTATGTATACACTGGGACCAATTCTGCCCTACTGAAAATATGTGGAATTTCATGGCTGACTTCTCCAGGATCAGGATCAGTCCACAGAGAAAATATAGTGTGTTGTGTGTGTTCGGACCATCAAACCCCAAAGCTGACCCTACACCCTATGCACAGAACCTCACCCTGCCCAGCAGAGATGTGTAGGTCGAGACTCATCATGGAACTGTCTGCACTGCCTGGAGCACAAGTTCAGTGTTTAGTGCCTGAATGCAAACTTGGTTCCACCCATGAAGACTCTGGTGCCGCAGCCCCAGAAGTTTCTTCTCCCTCTCTCCTTATGCATACGTATATGGAAATGTGTCTGAGGGCTGCTGATCCAAAGGGGCTCCTTGGCAGCAGGGAGGGAGAGATGCATGGATGATTGTCCTGCACATTACAAACAACAGGGTAGCCTCCCCGTAGCCATGATTCCCACCTGGGAGGAGCTGACAGCCTGAGGGAGGACTTGTCCACATTTACACTGTGTCTCCAATGTGCTCTCCTACAGTCACCTAACAGTCAGGTGTGTGCAGCGTGGACAAATGGTAAAACCTTCTTACACTCCTTACTGGACATCCCTCTCTCCTTGTCCCATGGAAAGCAATACAGATAGCACCAGCAACGAGCAATTTCAAGCCCCAATTATTGAATTTACTGACAGC
TCATGTGTTTCCATGGAATTACCATGCCAGCAGGATCAGGCAGGACATTTCTTTAGCTACACCTTTGCATTTTTGAGGGTTTGAAAAGGAGCTGAAATGCTGTTTCAGGATGACAGGGAGAAGAGAGGCAAAGTCTGAAGAGCACAGAAACACACTGCAAGCACAACATAATTTGGACAAATAGAAGTGCTTAGTTCTGTTTAATGTGAATTAGCTTTCAGAAGTGTTGCTGGTTCTCAATACACACGTGCATTGGTGTCTCAGAGGCCGGAGGGGAGGACCAGTAGTACTGCAGGATCCTTGCTCAGTGTCTGCCATCAGTGAACCATACTGCTGTGCGATGCACATCTGACCCCAAAACAATGGAAGAAGAGTGATAACAGAAATGAACACTGCTGACAAGGTAAACAGAGAGACATGGCAGCCTGCTTGTTAGAGACAGCTAATGCTTGAGGGAACTCTGCATTCAACTCCATTGCAAGAAAAAAATCTAAAGACGAGTTCCACCCATTGAAGTGAATTGGCTTCTCAATGTTTTTCAGTGAGGTATCATTCGAATTTGGCTAGGAATCTTAATATATTTTTGACTCTCCATTATTACATTAATTTGAGTTAATTGCATTTATGCGGCTTGTTCTTTTTGATAGGCTTCAGAGCAAATGCTGGGTGTAAAAATCACCAGTCATGATACAGTGGTTTCCTAACACTTAAGACAGTTTCATAACAGAAGAAAAATTCTACAAACAGATGCTCTCGCTTCTCTGTAGATGGAGAATATAAATGTGTTATTACTGTGGAACTTCATAGTGCAATTTATGTATTTGGTTTATTCATAAGTTATGTTCACATTTTAAGAATAAACATATTCAGTTTTCCACTGCAGATAAAATTATTCTCAGATTTTAAATGCTGCTTTTCATCAGATTAGTCTTGTTTGTAAGATTGTGTAAAGTAATAAAGGTACATTTTCCTGCTAAACGCATTTGGGGATGGAAAACACCTAGCAATAACAATAACAGCAATTCTTGGCATTACTGTAGCAACTTTCATCCAAAGATCTCCAAATGCTTTCCAATAAGTAATTAATTAGGCCTCACAGCACCCTGGAGAGTTAATTACAAATTATCAAGCATACTCTCAAACCATTTCCATTGAAATTATACTTGTTCCCTTTCCAGAAGAAAACAAAATACGCTGGCTATCATACCATGACCTTTCAATACCATGATTCATTTTGAAAATGTAATTAGATGAGAATTTGAACGTATCCAGTTTTAGGAAAAGCTAATATAATTATACCTGACCACAAAACTCATTAGAATTTTTGGTTTCTTCAGTGAGATGATACTTTTTAATCTAACTCTTTAATAAAACTGCAACATCTATAGGAAAAAAAAAAATGAAATGCAGCTGGATATCCCAGTAAAATTCCAGAGAGATTTTAAATTGTGGACATCCATCTGTTCTTCCGTCACAAGAGTGTTTGGTTTTGAGGATGTTTGATCCAGACTTTGCTTCTGACACAGTCAGAAGGCAGAAGGACAAATCAGTGTTGCCTCCAGACTGAGCATCCCTCCAGAAATGTAGTGAGCTCCACTAATTCAAGTGCTGCAATCTGGGCCAGAGGAGGTATTTGTTAGAGAATGTTGTTTGCCACAGAATGTAGGAGGCAGAGAAAGGCAAGAAAAGGCTGAAATCTCAAATCCATTTATAATGGAAACATCCTGCATTTCCTGAAGCACTGAGTAGATGCTACAAGATATAATTCCTTCCTACCAAAAATCTGAAGCTGTAATTTTACCTTCATCACATAGAATCATGGGAGTAATTAAAAACACTTTTACTATGTCTTTTGCTGCAACATAGTGATTGTCTTGTTTTGATGTAAGATGAAAGTAGTTTTCTTGCATAATTTTCTGAAGGCAAAGAATTTTCTTCTTTTACATCCTAGTTTTGTAGGAAAGCAAAATAATGCTTGTTTGCATGGACAGAACTTGCAT
ATAATTTGAAAAAAAAACCTAGTATTTTATCGATGAAAATATGGTACAAATGAAAATATATCCGCATCTCATAGATTTCAAAGGCTGCATTAAATTAACAGTGAAGATCTATTTTTCCTTATTGTATGGGAACTGCTGAGTTACGGCCTGAACCTCTGATTGATCACCTGAGGGAATCCACCTCTCTTTGAGAAGAAAGAACTGTCTACGGCTTGTTCAGAGCACACAGGGTCTGGACAAGAGGAATGCAGAGGACTCTGGGCAGTCCCATTGCTGAAGAAAAACTCTAAACAGGCATTCTTCAGGATTCAGTTATAGAGTAAAGCAATATCTGGACAAGGTGACTGACAGACCCTGGTCCCCCACTGGGGCAGGACTGACCTACATGGATATTTCTCTGAGCAAGGAAGGAGACATTTCCTAAAAAACTGTGTTCAAGATCTGCTTTCATTTGAACCTATCCTGAAGTCAAAGAAGTTAATGTGGCTTCATCTGAGAGCAGAATTTTGTCTAAAATCTTCATTACATGCCAATTCCACGAGGATAATTCATAGTTAAGGCCTCTGAACACCTTTAAAATAATCCTCTTTTGCTTCATATAATGAATAGAATAGATAGGGAATTGCTTTCCCAGACTTTCTGAGGAAACTGAAGCAATGTGTTAAAGTTTTAACAGCTTTTATTTCTCTTTTCAGATCTTAACCCAGTATCAAATATTAAAGTCCTAATATATTTAAGGAAAGCAGAAGTTGCTGTTATAATTAATTTCCTATCTGAGGGGAAAAATAAATGTATTGCTAGCCCTTTTGGAAAGAATCTCAGTTGCAGACTTGTAGTGATCACCTGGAAGAGCATGCAGTGATTTCATGAAATCATACTGGAAGAGGAAAAGGATGATTTCACAGGAATTCTGTTGGGAGGATTTTAGATGCTGCAAATGAACTGGAAAAAGAGGCTGAGAAAATGCTAAAGCAGCATAATTTTTGTCTTCTTCCAGTGGAGGAAAATACCGACAGATTTATTATACCCAGACTTTTGCTGAGAAACAAGCATTTGGGATCTATTTTAAATTAATTTTGCAAGAATTTTATTTTTTTTTTTAATGAGAAATAATTTATTTTCCTTCTGGTTAAATCTTGAAATACTAGAAGCAGTATGAAAGAAACACTTGTAGATAAGCTTAAAAATTCCAGTATTTTAATTTGCTTATGCATTCACATCTTGGTTTATTATTTGCAGTCTAACAGTCTTCATGCTTAGTCTAAAACCTTTAATTTCCTCTATAATATGTATCGCCGTGAAAGTGAACATATCAGAAGACTTAGGCACTACAGACATGACAGCAGACAACCCTTTGAAAATGTTTTTAAGGTTTCACTTGAAAAGGAAATTATGCCAATGGGCATTAATCATTTTGGAGGCTTCATATTGCTTCACAGATATTTATAATGTTAATGAAAACAGTGACGCTGTTATGAGCTACTGAATCAAGAAGTTCATTTGCCCCAATAACAGCAGGGGCTTGAAATGAGAAAAAAAATCTTTCAGACAGGGATGCTGCAAAGTTCTGAGTATGGAAAATCTTAGGAGTGTTGTGACATTCAAAAATGTCTCCAAAGATGTGTTATGCCAAAAAGCCTGAAAATAGGCACATGCATATCTTACCTTTCTGCATTTCTTTGCATTGTAAACTACACAACAACATTTTTTTTTTCTGTCTACATCACTTTACTTAATAATATAGGGCAGTGATAGAGTTTTAAAAGTTCCTTGTGATTTTTTCATTACAGCATTTTGATTGGTTTTAAGGTTAACATAAACTGATCTTTTCTGCCTAATTGGCTTTTTTTTTTCTCTTTTATATAAGCAATTTAATTCCCAGTTGTGATATATCATGCAGGAGAAATATATATCAGAGAAAGAAGAAGATATGTCATGTGGAAAGGAGGAAGGAAGGAACTGCAAGAGGGATAGGCTATAACCTTAAAAAAAAAGATTGA
AAGTTATCCAGAGTTTTTTTCTGTGGGGCCATACAATCTGTGTGTGATCTTGAAATGATTGGTTTTGGTCACAGCGGGCAAGATGTTGAATGTGGTCTTATTTGTGTTATTAGACATCTTCCATTTAATGCCATGGCTGTAAAGGGTGATACAAGTGTTGGCTTCATTTCAGAGTCAGTAGTACCAGCAAACATAGCCCAGCTAAAAATAATGAATTTTCAACTACTTATTTTCCTATTTTGCCTTGAGGTTAAGGCACTTTAGCATGCAAGCCTTCTGCAAGACATATTTGAGTCTACCAAATGTAGTTTAGCAGGTAATGAGATGCATTTTTTCATCAGGGTCATGCTACCTAATCAGACGCTAAATGTAATTATTCACGATCGAACCTCAAATGCAATTTTAGAAAGTGTCTGTATTACAAACTAAGAAATCAACAGGAGGACTGCTTTAAACATGTTTTCAGTATGCCAACATTGCCTTTAATTATTTTTTGATGTTTTATATGAAGTCAAAAGACAAAAAGAACAAGCTCTGAAAAAGTTGTGAAAAAGAGATAGCATGTGCGTGTCAGAAGAAACACAGGGAGAGAGAACATGAAAGAAAGTATAGAAAAAGAAAGGAAGTACTAAAAAGATGAAGAAACAGAGAAAGAAAGAAAGAGAGATAGAGAATAGAACTCACATATAGCATTTGATAGCCGTAATTGCTCTGCTCTTTTATAAAGGCTTCCTTTTTCTGATTAGAGACTTTAAGATAGTTACTACCGAAAACAGTATTTAAAATTCATTCTTTTCCTCCTTTTTCTTTGAATTCTTCATTATGTAAAACATGTACTTCAGTGCTCTTGAAATGTTTTGTTCTCTTCATTAAATTGCTCCATTTTTATTTTAATGTCCCTGTAGTCTGGATTTTTCTCTAAAAATGTCTGTATATCTGTTAAGAACACTTGTTCTTTCAGAACCTGTTTTCCCTTTTATTTTTTTAATTCTATTTCTGAGTGAAAATGTGATTTTGTTTCTTTTTTCTTTTTTTTTTTAACACCTATTTGTCTTTTTTCTTTTTCTTTCAACAATTCTTTTGCACCAGCAAAGGGCCCATCATTCCAGACCACATTCATTTTGTTTAAATCTGGCCAAAGAAGGACTGTGCACGATTAGTATATACAATAGATGAGTAATGATGATTTTTATTCCATCAGTATTAATTTTATGCCCTTGCCTAAAGATTACTTGTAAATGCTTAGATTTTAAGTATTAAAGTAAACATCACCCCTATTGATATTTTGGAAATGTCAGGTTAGTTAATTGGGGTAATATACAGGTACAAGTTTCCAAACCATTATATCAAACTTTGCCCACCATTGGGCTCATGCTCTGTCAGCTAGCAGAGGAAAGAAAGCCAGAGGAGCAGCTCAGGCCACCATAACCCATTCTTGCCTGCTCCTCTCTACTCTTTTTTTGCTCCCCAAAGTGAGTTCAGCAAATGCCTATTTAGTTGGACCAGTTCTTTTGATATAGGCTTATACGTCTTCACTTAAGGAAACGTTTTTATTGAGGGAGAAAAGCCTCATGACGGTATTTGTTTTTACTGTGGGTTTCAGCACTTCAAGAGTTATGGACACCATCTAACCTGCACTAATGTGCAGAAGCAGTATCAGGCTGATATACTGAGCATCATTACTTACCGTGGTCTTTTTAAGAAGTTGGGAATTGAAGGCTGAAATCTCAAGACAGTCCTCTCAGCAGTCCAAGGACTTGAGTTTAGAGTTATCTGTAAATTCTGTTTATGTTTATCCAATAAGAACTCAGCCAGTGAGTGCTGCAAATAATCGTTTACTTAAACATAAATGGGAATTAATTAGTCTATCAAATGAAAGGAAAGAAGATTCTGAGCCAGGAATGCACTCATAGTCACAGTAGCACATCATAACTTTGCTCGATGTACCTAAAATTTCTTTTAAGTGTGGCTGCCAAATCATCATGATTCTTTTGTTTATT
AGCCAAAAATCCTACCCAAAATGGGAAAACTTCCAGTCTTTTCTATGATACTTATGACAGCCTTTTTTAGTAGCTGATTTCTTATTAGAATATATTCCTCTAAAAAAATACATTTGGCTATTTATTGATTAATGCTCATTTTTTAATGGAGCTGTTTTGCTAAGATTCAGTGTCAGGTGCATTTCTAACACCCCAGCTCCTCTGTTCTGTGCATCAATTGGCACACTCATCAGTTAGCCAGTTCTGCAATAAAATAAATTAATGGACTATCCTATTTCATTTCATGGCATCCGGCCGATGGAGTACAGAAACTGCTATAAACCCTAGGACTCAGTGGGACTGCTGGTATGAGGAAGGAGTGCAGCATTTGGCCCACATTTTGCATTGATCAAGCAGAATTAAAATTAGCACAGCAGTTTGCCTTGAATGAAGCAGAAAAGCGTGGTGCAGGCTATGCAGCCTCCCAACTACTAAATTGACCCCTTTTCCCTTTTATTTTCTCTTAGCTTAATTTTTGCCCTACTGAAATAAATGAGGCTACTTATACTGTGAAAGGAAGGACTGGATAATCTGACCAGTATAGCATATTAAAATTATATGTATTCTATGGTTCATAATCAAATATGATTCTCTTCCTGAAATAAGCACTATATGGCTGTAGTGATAATCACTAATGGGTCAGTTGGGTACCAGAGCACTGTAAATTCTGGTGATGAATACACGGGGATGCTGTAGACTTCTGCCTTGTATTATTTTAATAGAGAGCAGAGGAAAACAAGGGAAGATTTCCTCGGAGGTATACTGATAAAATCTCACTTAATTATGTTATAGATCTCACATTGCTTAATTTTTTTTCTTAAAACTTCAGCTCTTTGAATCGCATTATTTAAAAATGGATTTCCCTGGATGGGAAAAAAAAAAAAAAGAAGAGAGAATTCTTCATAGCTGGGAAGAAAATCTTTACACTGGAAGCTTAAAAAGCAGAGAGTAAACACAAACAAAGAAGAAAAATGGAGGACCAGCGGTGAAATCATAGGCTGAGTGATGTCATGGAAATAATGTCCTTAGAGGAGGACTTCATGCCAAAACCCAGGAGCAGACAGATTTCTGAGAAAGATCTTGATCATCAATAACTCCTGCTAATTCAGTGGAAATCACAGTCAGGTTGGCAAGCACTATGAATCATCTCTTCTGATCCCTGCATGCTTTTGTAGAAGAAATTGGAAAGGCAACATCCACGAGGAAATACATGAAGATCTAACCTGGCCTGTGTGAAAATATTCATGTCATAACCCAGACAAGAAACAAATGTGCCATCTCAGACGAATCCACCTTTCTCTCTTTGCATCTCATGGAAGACTTTGAAATTTCGGGACAAAATTGCATTCTCTTATTCAAAACTGAACAAAGCAGGGCGAGTCCTGCCGTTTTGCTGAAAATGCTCTGTATAGAAAGTATATGTACATTAAATTGCCTCTGTGACCATGTTTGACTCTTACTCTACAAATAAATGGGAGTAGATAGCTCCCTTCCCTCAGGAACTTCTGTCTGCGAAAACTGTGGATTGCTGGGATATGCAGATGAAACATCTCTTTCTCTCCACCAAGATATGAAAGCAAAGAGCTCCTTCCCCTTCTGAGCTTCAGGCCAAGGGGCTCCGACACACACCGAGCAAATGGGAAGATGTGTGATTAGGTAACTTCCAAACTTCAGAAACATTTCCATTTCAAATTCTGACTTCCTGCCATGCACATACTCTTCTGCAGCCAGCTCCGAGGCAATTTATTAACAACTCCAGTGGAGTGATATCTGCAGAATCTGTTTTTCAGCTTTTGACAGCTGAGCTGGGCTAATGTTCCTGTTCCAGAGTGCCGTCGTGGAAGCAGTGCATATTCTATATATTCAATGAAGAAGTGTCCTTTGAAAGTGTAAATGAAATCGCTTATCTGAAGTAAAGAGATAAAAAATCAATTTAAAACATTTTAGATTGTTTATCAGCA
TGTAAGAAAAAAATACAAGATTGACCAGGTTTTACAAAGAAAGTTTTAAACCACAAACTACCAGTACTTTTAGGTTGTATTTCCTGTTCACTAAATTAAACGTTTCAATGGATAGCAATGCATTTCAGAAAAATAAATTAAAAACAAATCAATAAACAATAGAATAAAACCTACTAAATGCTTTCAGTATTTTAACTTCTTAAATACAAAAGCCTATTGAAGTTGTTTCTGCAACCTTAAAATATAACAGAACCCATTGAGATCAGCACTACATCCAAGATCTGAAATGAGGGGTTTTAAAAAATACCTGAAATACTCTAAATATTAGATAAAGAAAAGTTAGAGAGGTGTTCAGGGAAAGAAAAAGGGCAATTTTTTCACATCAGGGATTTAAACGAATGTGAAATCATGAAAGTCTTAACACTGTTCTTGAACTTTCACAGAACATAGGTCTTACTTGGATGAATGTTACAAGGAGAGTGGAAGAAGGACTTAGACTAAAAACAGGATTGACATGCATGATGAATTACAGTTCATTAATCCAATTAATGAGTAATTTCAGAGGCTTTAATCCCAGATAAAGCTCCTTATTGCAGCTCTGTTGGCTAGTGATGCACAAACTAAGAGCCTGTCAGCAAATCAATTGTAAAATTCTATTAAATAAAGCCTGCCATACACTTCTGTAGCTTATGTGACAATATTTTGTCCAAAAAAACCCCAAAAACATATATATATATATGTACATATGTAAGAGAAGGAGAGGAGGGAGCAATCTCTAACCTTATTCACCCTGATTTGTAATATAAGAGTTCAAGATATATTTAAAATGATGCAAGCCAGCTGAATGCAACTTCAGATATTTATAAGCACTCTTGATTTAGAAGGTAAACATATGCCCCAGTTTCTGAAGTCATCTGTATGTATGATTTCCTCATACACATTCTGTTGACTAATGGGAGTCAATAAAGTACATCAGGCTGCTTTGGGAATAGTCTCTGTTCTGTTCTTAGTTTATTTTATTTGTGGTGCCACTGCATCCAAGTGATTCTTTCTGAGCGCTTCAGAAATAGACTCTGTCCTCCAAAAGTCTCACAAGCAGAGAGCAAAGAAAGGAGATAAAGAGAGGAAAAATTGTGAGAGTTGTCTTCATTGACTGTAGAATCATAGCACAACAGCTGACAGAGCAGTAAGTATGAAGCAAGCATTTGAAATTTCAGCTAAAAAGTCAAAACCTAAAAACCTAAAACCTAAAAACCTAAAGAGTCAAAACATGATTTAAAGCAGAAACAACAGTGTTTCACGGCTTCTCAGAAAACCAGGAGGACTCCCCTCCCAAAAAACCATTCCCCTCTGACTGAACCAGGCTTTGTATCCCTGTTATAACAACCCTCTCCCCCTGACAATCAAGCACTTCAAATATTCCCTTGCCCACCATAATGGAATGAAGAGTGGACCTTCACTAAGACGCCTCTGAAAACAGGCAGGCTGGCAACTTGCAGTGACAGCCATGTACTGACTTCTATGTAGCGACTTTGATTTGTTGAGTACTGGGCTACCCTGCACAAAAAACATAAATGCATTCCATTTTAACAATGAAGAAGGCTTGCAGTACTGTGAGAGGCTGTGCAACACACACAAATATTGATCCTGATCTCTTTGAACAGCTATGTCAATTACCTTCCGCATTCTCAGTTTGTAAAAGCTGTGTTACCAAAGAGACAAGATCCTGCTATGACGACTATTTAAGTAAAAGTGCATCCTTTCTGATATTGCCGAAGAGTATGCTGTGGGAGGATGGCAGTTCACACCCAATTACACACCATGATGGATTCATATTTCTTGATCTTTGAAGCCTTCTGAAACAACATTGCACAATGACCCTCAGTCTTAAAGACCAAATAAGATGATTAGTGACATGCAGAAAAAAGGCTCAGAATTTCATGCATGTCAGAAAAACTCTTAAGCACTTTCTGTTTGTGGCAGTGCTCCTGAACTGGAAG
AAACTTCAGTCACTCCAGCACAGAGAAAGCTGTTTGATGGAAACAAACAACTGCAGAGACTATAAGATCGGTAACACCATTGTCCCTAAAAGGCTCCCATTTAACAAAAGATATATCACAATTTGAAACCAAAAGCAAAATACTTGTGTGCCTATTGCTAGAATTTTGGATTTCTGCAGTTTGAAAATACAATGGAAATCACAAATGTTAATGAAGATTCAGTGCACATCAGCGTGATGATGCATATTACTATAGCTGACAGATTTTGAAAATGAAGGTCATAAGAAATTGTGGCATTGAGAAAATCTTTTATGCTACTAGTGCTAAAAGTTTGTTCTATACCACGCAAAGCAAACGCTGTGTACTTCAGAAAATGCAGCTGTTGAAGGAAAATGAATCTGATCCACAGCTTAATCCCATTGTATGAATACAATCCTGAAAGTATGATGTCTATCCAGGAGAAACAATGCATGAATCAGTACTTAACTAATGGAAACAATAATTCCTGTAGTTGTTTCAATAACAACCATGGCTGAGAGTGTCCTAAAGGATCAACCAGGCTGAGGGTAAGACTGCTCAGCAGATTAGAAATCAAATCAAAATGAAAATGGGAGTGGAGAAAGAAAGTTCTCACCCTTGCAAAGTCCCAAGGAATATCAGAGCCACTCTGGGAGCATCTCCATGTGGGGATGTCAGATGCCATCCTTCACCTTCTCTCTGCACTGACCCACATGGGGGCACCTAGGAGGGTGGGCCAGTTCTGCCACCATCAAAATCTTTGATGACTGCAGCTTTTGGCCTCCCACCACAGCAGGCGTGTTAGCAGCCAGGTCACCAGAGGAACTGCCAAACATATGACAAGTGACAGGAATTGAAACACTTTGACCTTGAGCCATGCATAGGCTTGAAGCAGTGCATTTAGTGCCTCGAGAGGAGCAGGAGGTGTGAGACGTGCGTTTTGAAGAGAAAACTAAAACTGATAAAAGCACAAGATTAAGAAACGAATGAAAGTTACCAAAAAATGACCAGGCTGTTTAATGTGAGGAGAAAATGATCATGCTATAGTCCTCCAAATGCTTTTAAAGACAGAAAGGTATCCATATATCTTTTCTTCCGCCTTTGAAGCTTCAACTGTGAAAGTTAATCTAAAGGAAGCAAAATGCAGCCACTCTCTTCAGACCATTTGATATGCTATTGCTTGCAAACTTCCTTTAAAAATATCTTTCATAACTAAGAAAATTGCCATATGCTCACTGGCTTATAAATGGGAAATTAAAGATAAGAAAGTCTGAATAAAATAAGACTACTCGATATTAGCATTCCGAGCACTTGGCCAGTATCGGTCAATTACTTCACTGCTCTTCTTTGCCATCCCCAATCTCACTGAAAAATACAAGCCCACAACTTCCCCACGAGATGGATGTTATTAACCCATTTTTCACAGCTGAGAGCTGAGACACAGGGGAGATGGGTGACTCCCTCTGGGTCACCGTGCTGCTATTGAGAAAGCTGGAAATAGGCCTTGAATCTCGTTTATAAGACAAGACACGGGGCAGTTCATTTCAACCAGAGTGGTTTCCACATTGGGATTTTACAAGCTTACATTATATGGATGAATTAATAATTTGACGTCTCAAAAGCCTCCTGCTATTCACAGAACTCGTTTTAATTCTTACGTTACTTTTTTTTTGGCAAGACTGTGACGAGCAGTGTGAGGGCAGAGGTGTGGTCTGATGGCATTTATCAGTGTCAGTTGTCACCTTACAAAGCGTTATGGGGATGTACGTGTCCAGCTTTCACTGTTTGCACTGCTGGCAGATTGTGTGATCCCACTTTATTGCCTTTTGGCTTTTTCCCTTAAAAACAAACAAACAGTATACTGTTCCCTGGAGAAGGACAGGTAGTGCTTTTTACATCTAATAACGAGCCAAGAAGAAATCTATTCTGGAACACTCATTTTCACTCTGTTGCTGATTGTAACATCAGTACTTCTTTTCTAC
GAGCACTCATTCAGTCTGCTGTTCCTACTAACACATTATACATGACATTTGCTATGTATAGTTAAATCAAATTTTATTTATGATATTCTCCATAGTGATAATGCACTTTGTGTCCAGGCCAAAACATTGAGAATTCAGTTGTTTTGCATTCATTATATGCTTCTTCCTCCCCAACCATACAAGGAATAGCATCCAAGCGATGTTTGGATCCCCTGTCCCAATGCCAGGCAAGTCTCTGCCAAAGACAGTTCTGATAAGAGGTGTTAAATAGTTAAACACAATGGATTTTGATTTTTTTTTTCATTTTATTTTCAGTCATTAGGGTAATTTCTTATATATGGAACATCACTTGTTCTTGAATACTGTGATAATGCGAGTCTCCAGTTAAAGACTGAAGATGAAATAATTAAAAATGGCTTATTGACCTTGAAAGCCATGTCCTTCTGAGCATCAATATGAGATATGCACATTAATTAGTGTTTTTCAAATTCAATCCTTAACATTTACCAAAGGAGAACAGTTTTCTCAGTAAGTCAAAGACAGGCCTGGTTAGCCAGTAACTTATTACATATTTGTCCACATCACAATTTTCTTCATCCTTGATTTAATCTGCAAAAATATTTAATAAGGAAAGCTCTGTTGAAAATAACATGTTTATTAGAGCTTCATTTTTGAAAAAAAATTCTTTTGAATAGCAGACTGAATTGCTAGCATTATAGAGTAACCACTTCTTAATGAATAATAGAAATTTGAGATAAAGGACATCAAATTATTATGACTTATTAGAAGATACAAAGGACCAAATTTGCAAATGAAACTGGCTAAATTTTAACAAATATGTCCATAATAAATCTTAATTTCAGTATGACTTTCTAAAACTCCATTTCTATAGTATTTAACAAAAAGCTCTGCAAAGAAGAGCTTAAGCTTTATATTTTTTCACTTATTAGAGCGAGGAGTGGAATTTCTGACAAACACCAATAAAGAGTAAAATTTATATCTTGTCAATAGGACCTATTTTGTTGCTAAATTATCTCAGAAGTCTCACAGTCAGGAACACAGTAGTCTAAAGCAGTCAGGACATAGAAGAAACAATGGGCAGACAATCTTGTGCTAACTGAAAAGTGAGCACTGTAAGGGAACAGCTGAATTGGGGCCTGAACCTCTGATTGACCACCTGAGGTGAGTAATGAGCCAGCTGTGGGAGCACAGGTGAAGGCAATTCATGTGTGCTGCTGGAAGGGGTGGAGCCTGGCTGCACCTCTCCTGGACCCATTTAAGAGCTGACTACTGGGGTGGAAAGATCTTTTTGTGGAGATCCCTCCTTTGGAGTTTTACAGTGTGCCCAGGATAAGGTGAAGAAAGTAAGTTCAAGTGACTGGTCCAAAATTACACAACCACACTGATGCTCAGCTAGCAACGGGGACTTCCTTCATCCAGTGCGGCACACCATCGCTTTACATCACTCAGCTTGCAGAGAGAGAAGATTGAAGTTATTTGTGGGCAAATTTATGCTGATAAGAGAGAGCACAGAGAGCCCCAGAGATGGAAAGGTTTCAGAAGACACTTCTGCTGGAAAGCCAGCTCCTGAGTGCTCCCCAGCTGGACATCGCATCCTCCGCAGCCCATACCGCAGCACCAGGTTTGACTCGCTGGAGCTGCAGCGAACGTCTGCTCAGGTCCTGGTGTGTGACCACTCATTGCCACCAGCATGGTATCGGTTCATGATCAACAACACGCCTGCGGAAATGCCAACGAGATGCATTGAAATGAACAAATGTGGGACACAAGCTCCGGTGTGGCTGTCACTGAGGTCTGAATCCCTGCCTGCTCCAGGTGAAAGCAAGCACCTGATGGCCTGTGGTACCTGGCAGGTCTTTGGGGGCACCAAGGACTGCTGCTTGTTCCGGATACCCATCACTGTCAGGAACTGCATCAAGTTCTTTGTTTATCTCTTGCAGCCGACTCAAGGATGCATGGGCTACTGTGCAGAAGAAAAA
CTCCCAAGCCTGACTTTACAGCCAGTGATAACTTCTGAGCTCGTGCGAGGTCGCGCCCACCTGAAATGCGCCTACAGCTCACCCAGCTGGGGGCTGAGCTACACGGTGCTCTGGTCACGTCTGGTCGCCCCGGGCAAACAGGAGCAGATCCATCAGGACACCACCCTGCAGACGTGTTCCTACCTGGAGATAAGCAGCAGACATCTCCAGCTGGGAGACACAGTCTTCTGCACTGTGACTGCATTTGCAAGGGACACTTCTGAGCAGCGGTCATTGCCTGAGCAGAGCAAAGGTTTCTACGCTGGGATTAAGTTTTTACCAGAATCATTACAAATTGCAGAAGATGGCAAGGAGCACATTTTGACCATCCTGAGCACTGTGCCCATTACCTGTGCTGGGCATAACGATTCATGTAAAATCACATTACGGCTCAGTACTGAGGATCTGGACAGCCAATTACTGGGGCCCCCAAACACTGTCCTCTCAGCGTGCCAGGTGGATCTGGTGCCGGCGCCCTGCTCACAAGGCAGCTGTGCAGCAGCTGTACTAACAGTGACAGCCGTCACCGACTTCGCTCAGGATGGGAACCGCGTCAGCTACATCAGAGCCGAGCCAGTTGGACACAGAGATGTACTTTGGAGGGCTCACGCCTCGAAGGATGTAAAGGTCACAGTTCAGGACCTCCCAACAGGGAACTGCTACTCTTTCACTGATCCACACATTATCACGTTTGATGGATGGCGTTACGATAACTATAAAATCGGCACCTTCCTTTTGTGCCAGAGCACGTCACGGGCATTCGAAGTGCACGTCCGTCAGTGGGACTGTGGGGGACACCACTCTGCCACTGCCTGCAACTGTGGGGTGGCTGCATGGGAAGGGAGCGACGTCGTCCGCCTGGATGCCTGCAATGGGCACTTTCGGGACAGCAGGCCGCAGCTCAGCATCCAAAGTACTGAGGCATCACCACAGGTCAAAATCCTAACGTCCTACGGAGGGAGAAAGATAACAATCCTATTCCCTTCAGGAGCGTTCATTCGAGCCGATGTGAGTGAGTGGGGAATGGGCTTGACAGTGAGGATACCAAGCAGTGACTTCAACAGCACCAGAGGTTTGTGTGGCCTCTTTGATGGGATCAGTCACAACGACTTGAACAATGTGCCTGAGGAAGACTTCATAGAGGAGTGGAGAATACCTCCAGGGAAGAGTTTATTTGACAAAACTCCAGCATCTTCAGAGGGGAAGCAGAGGAAAAACTACTGCAGATGCCAGAAGGAGAGCACAAAGTCCATGCCCTTGCTAAAGACGCTGAATGCCTTTCAGATGCAATCTCCTGGTTGTCATTATGATAATGTGGATTACACTTTTGCAATTCCATATCTGGATGTTACATCAGAGTTTGTCACTCACTCAGGCAAAGAGTTTGCTTCAAGAGATGATGAGGAACGGTCGCCCAAGTCTTTTGATCAAAGATCTCTCCCTAAATCAGCCAAGAAGCGAGGTAGCCGTGAGGAGCGATTAAAACCCTTCTCACATCATGCTTCCATGAAAAACAACAGTTCCCTTAACTTTACCAAGCCAACAGAAGAACTACAGAGACCAAAAAGACAAGAAAACTACTTTGAATACTCAGCCCTTCACCCGTTGCATAGCCCAAGCCAGACAGACACGGAAAGCTTTGCCTATTTTTTCCCAGAGGATTATTTTGAAGGGATTCGGATAAAACTCCCACTGGGATGGCCCACTCCCAGCGGCCTAACCTCTGCCAAAGCTCAGGAGATTTGCCACCAAATTCTTGCAAATTCCACCATTGGCTTAGCGTGTAAGTCTCTGCTGGGAAAACTGATAGATGAGGCCATCAATATATGCATGTTAGATCTGCAGCTCAAGGATGATGTGGCCTGGGTAAGGGCACTGATAGCGCTTTTGGAAAATGAGTGTGAAAGACGAGTGCTGAGGCACAGAGGTGAAGTGTTTCGTGTTGGAAGCCAGCCAACTTC
TAACCAGGAGGAAATCCTTACCATTCTCCGCTGTCCTGCTTTCTGTAATGGCAATGGACAATGTACAGACATGGGCTGCCAATGCTTTGAAGACCACAGCTCTTATGATTGTAGCACTGCCAGAAAGCAAACTCTGGAAATCACAAGCTTGGAGAACAGGGGCCTATGTGACATTCGCACCTCTGACTGCAGTCGTGTCCGAGTGTTTGGCGTTGGCTTCAAGGATTCTCCCCATCTGCACTGTGAAGTCACCAGATTAATTCATCTCAACGGCGAATGGATATCAAGAGAGCAAGAAACCACACAAGCAGATTTTCTCAGCTCTAAGGCTGTTGACTGCCAGATTCCTCTCCTGAACATTGCAGAGACGGAGGCTGTGCACTTTGTAGCTGGCGATGAGCCGTTCGCAAGATGGCAAGTAAAAATCACTGATGATGGCTTCCAGTACAGTAATTCCAGAGTGCTGACCCTGTACGACGCAGTCTGCCAGGCCTGCGAATCCCATCCAACTGGACTTTGTAAATTAAAGGACAATACTTGTAATATAGATGGACTTTGCTATGGGGAAGGAGAGTCAAACCCTGCCAGTCCTTGTCTTCTCTGTGAACCTGATATCTCTAAGTTCACCTGGTCTATTAATGAAAACAACCTGCCTCCTGTGTTCCAGGCCCCCTCCAGCCAGCTGCTGACATTTATTGGTGAGAATTTTGTTTACCAGTTAACAGCGGTGGATCCGGAAGGGTCAGCTGTGCTATTCATCTTAGAGGCTGGGCCACAGGATGCCAGGCTCTCTCCCGCTGGCCTTCTTATCTGGAAAGTTGATTCAGAAGAAATGCAGACCTTTGAATTCACTGTGTCGGATGAATGCAACGCGCAGAGCAGATACGCTGTTGAGGTTCGAGTGAAGCCCTGCAGCTGTCTCAATGGCGGAACGTGTGTTACCAATATTAAATTCCCCCCGGGCCTTGGTGAATATCTGTGTTTATGTCCAAATGGATTTGATGGAGGGCTTTGCCAGGAAGATATTAATGAGTGCAAATCAAACCCGTGCAAAAGCGGAACTTGTGTGGATGGTGTGGACAGCTATGCTTGTCAATGTCCCCCTGGTTTAGGAGGGCTTACTTGTCAGGAAGACAAGAATGAGTGTGAAGAAGGTCTGTGTTTTCCAGGAGTGTCCTGCATGAACACCTTTGGATCATACGTGTGTGGAATTTGTCCAAGTGGGATGGAGGGAAATGGTAAAACTTGCAAATCTGTGCTTGCTGGTGACTTTACAAAAGCTTTAATCGTTGACAACAACAATGGCAAAGGTGATTTGAACAAAACTGAAGTTGAGTGGCCACTGCACCCCTTAGAAGCAAATAATTCTCCTGTAATTAGGAATTTTAACATAAGCACTAATCATGTCCACACAGCACATCAGCCCCGTGTTACCACCTGTGCCAATAGGCCATGCTTTCCTGGAGTGCTGTGTTTCAATAGGAAACCCCCTTACGTTGGCTATGTCTGTGGCCGATGTCCAATAGGGTTTTTTGGAAATGGCCGAACCTGCAGCAAAGCCTCCAGACCAGTTTCAAGATCTTCCCAAAGCCATACAGATGTTGCTGAAAGAAATAGTGAAGATGCCAGAGGCTCTCATCAGGAAGGCAAGACATCAAGAAACATCTATTCGTTCCTATCCCAAACCCAAATTCCAAGGCAAGAAACTACATACTTTGTGGAAAGAAACCACACAGTTATTAATGCAGCATCCTTTACAACGAAAAGGAAGATTTCCCAGCCTCAGATGCTGTCAGCAAAAATACCTGATACAGAGTCCACTGTATCTGAGAAACAGACTTTTACTGAAAAAAGAAGTCATACACACACTTTCCTTCTGCATGAGGAGCCAGATCCCAAAGCAGCAGCTGTCAATGTGACTACTCCTACCCCTGTGCATTTTAAACAGTACAAGCCAGGAACAAGACAGACCATTCCTTCTCATCTCAACACAAACGCAA
GCTCACTCTTCGCACGGCTGCATGCTGTACAGCAAGCTCGTTCCAGATACAGCTTATCTTCCAGGAAATGGCCCAGTCAAGTGACAGGCTCAAAGACTGAACTCTCCAAAAATCTCCCAACAAAGCAGCAGAGAGTTTCTTCTTTGGAAACATCCCTCACATCCCCTTTGCATGAAATAGGTTTTTCCCTTGACACAGCTCCACAGAGTGCCAGTGTCCTGCCTGGACCTGCTCCCCCAGCAAGGCTTCCAGCACATACCACAACCTTCAGAAGAGCATCCAGTGTAGCAATGGACCATGCAGAACTGCCAAAACCCATCAGTGGGTCCTATGAGAAAGCTCTCTGTGGTTCAACACCATGCTTTAGTGGTGTGCAGTGTGAGCTAGCCAAAGATGGAGAATTTAAATGTGGGTCTTGTCCCAGTGGATACAGCGGTAATGGAATTACATGTGAAGTGCAGTGTGACCCACCGTGTGAGCATGGAGGAACCTGTGTAGCTCAGAACACTTGTTCTTGTGCCTATGGATTTGTTGGTCCTCGATGTGAAACAATGGTGTGTAACAGGCACTGCCATAATGGCGGGGTCTGTGTGTCGCCAGACGAGTGCAAATGCAGAAGCGGATGGAGCAGCCCTTCCTGTGAAATAGCTGTGTGCAACCCTGTGTGCTTAAATGGAGGAATCTGCGTGCGACCAAACACTTGCACGTGTCCTTACGGTTTCTATGGGCCCCAGTGCCAGAGAGCTGTCTGCATTCCTCCTTGTAAGAATGGCGGCCACTGTGTTCGAACCAACGTGTGCTCCTGTACTGAGGGCTACACTGGAAGAAGATGTCAGAAGAGTGTCTGTGATCCTGCGTGCATGAATGGAGGGAAATGTGTAAGCCCAAATGTTTGTGACTGCCCATCTGGTTGGAGAGGAAAGCACTGTAATAAACCTGTTTGCCTGCAGAAATGCCTGAATGGTGGAGAATGTATAGGTCCAAACATCTGCGAGTGCCCTGAAGGATGGGTGGGAATGCTGTGCCAAACCCCAATTTGTGAGCAAAAATGTCTGTTTGGAAGCAGATGCATAAAACCAAATGTCTGTGCTTGCAGAAGTGGCTATACTGGGTCAGCATGTGAAAAGAAGGAGTACTCAAAGCTAATGACTGCTCATTTAGAAACCATATCTTTAACTACCCACAGGATGAAGATAACATAACAGCAGGACAATGAAGACAATCATTTGGGTATCGATAAGCCCAAACTGAGTTCGTTTTTCATTTGGGAAGACACGGTGTGAAAACATTACTACTTCTCTCCCTTCTACTCTCCTATAATCACAAAGAAAAACTAAAACAAAACACCAAGGCATATGTCAATAAACAGACCTCTATTTTCAAAA\n>XM_038827982.1 PREDICTED: Tripterygium wilfordii uncharacterized LOC119984160 (LOC119984160), mRNA 
\nCCTACTTCTCACCGCCATTATTAACCTCCTAAACCTTCTCTTCTCTGCAAAAATTGTTAAAAAAATACAAATTATATATAAACCAAACAACAAATCCTGTATTATACAGAAACCTTGATAACTGATCGTCCGCAATCATTCACATCCTCTCTCTCGAGTCGCAACGAATCCAAATCTTCATCGTTGGATCAGAGGGCCAGACCAAACACCACCACTAGCAGAAAACATGGTTGAAACCAGACGCAGCTCTTCGTCTAAGCGCCCTCTCGCCTCGTCTGCTAACCCCGTGCCTTCACCATCGGCCAAGCGATCCAAGGCTGGTGAGGCATCCTCGAAGGCAAACGATGCGGCGGCGGTTGAGTTATCGACGGATACCAATGGTTCGGTCAAAGAATCTGGGTCTGGAAGTCTTGAACCGGAGCTGCAATCCCCTGATCTGCAGGCCGACGATGCTGCCAAGCCCGCCGATGGGGAGAAATCGCCAGATGCTGAGGTGGAAGAGGAGGCCTTGGCGTCTCCGCGCTCCATAGGTGAAGCTGCAGTGGATGCTGCGGGTAATCGGCAGAAGAAGCGGCCTGTGAAAGCGGCAAAACTGAATACGAAGGCTGCGTGGGGAAAGCTTCTTTCGCAGTTCTCCCAGAATCCTCACCTTAACATGTGTGGTGCTACTTTCACTGTTGGCCAAAGTCGTACTTGCAATTTGTGTCTTAATGATCCATCCGTCAGTTCTACTTTATGTAAACTGAGGCATGTTGAGCGTGGAGGTTCATCTGTTGCCCTATTGGAGATATCTGGGGGCAAAGGATTTGTCCAAGTGAATGGGAAAATTTACTACAAGAATTCCAGTAAGACATTAACTAGTGGTGATGAACTGGTTTTCAGTTCTTCTGGAAAACATGCTTACATTTTTCAGCAGCTCACTCATGATACTGTAGCTGCTACCGGTCTATCTTCATCATTAAGCATTCTGGAAGCACAAAGTGCTCCATTAAAGGAAATACATATTGAGGCAAGGGCAGGGGACTCCTCTGCTGTTGCTGGAGCGTCAATATTAGCCTCTTTGTGCCAGAAGGACATATCCCTTCTTCCTCCACCCCCCAAGACTAGTGGTGATGTGCAGCAAAGCACTGAGATGCCTCAACTTCCGTCTGGATGTGGAGAATCTGATGATCGCACTCCAGACATTGATATGAAGGATGGTCCGAGTACTAATGAGCCTGCTGATGCTTCTTTGAGGGGAAAAACTGGTTGTCCATCATCTTGTGCTGCTCATGAAAACCACAATATTGATAGCCTTGGATTGGATTCATGTCCACATGCCGCCTCCAAAAAGATTAGTGGGACAACGTACGAGTTGACGCCTCTACTGAGGATGCTTACGGGAACGTCATCATCTAATTATGATTCAAGAGGCGGCATTCCTAAAATACCTGATGAGCATAGGGAAATCAGGGACCTGCTGAAGGAGTTTGGTTCTCGTGCAAATTTGATTAAACGACAAGCACTTAAGGATAGTTTGCAGCAAGGAATCCTAAATCCTGGCAGCATTGGTATTTCATTTGCAAGTTTTCCATATTACCTCAGCGACACTACGAAGAATGTTTTGATAGCTTCTACATACATCCAGCTGAAGTGTGACAAGTTTTCAAAATTGGCCTCAGATCTTCCTACTGTGTCTCCCCGAATATTATTATCTGGTCCAGCAGGTTCTGAGATATACCAGGAGACATTGGTGAAGGCACTTGCCACACATTTTGGGGCTAGACTTCTAATTGTTGATTCCCTTCTCTTGGCCGGTGGATCAGGGGCCAAAGATTCTGATTTGGTGAAGGAAAGTTCAAGGCCTGAGAGAGTCTCTGCATTTGCAAAACGAGCTTCACATGCTGCTGCATTGCAGCATAAAAAACCGACATCTACTGTTGAGGCTGATATTACGGGTGGCTCAATGATAAATTCTCAGACGCCGACAAAGCAGGAGACGTCAACTGCTTCATCCAA
AAACTATACATTTAAACAAGGTGACAGAGTGAAGTTTGTGGGCAGCTGTCATACAGTTGCTTCCATACAACCTCCTTTGAGGGGACCGACAGTTGGTTTTCGAGGCAAAGTAGTCCTTGCTTTTGAAGACAATAGTTCCTCAAAAATTGGGGTTAGATTTGATAAATCAATCCCTGAAGGAAATGACCTTGGGGGTCTCTGCGAAGAAGATCACGGTTTCTTCTGCTCTGCTAATTCCCTTCGGTTAGAGAGTTCTGCTGGGGATGATGTTGACAAATTTGCTATTAATGAACTTTTTGAGGTTGCTTCAAATGAAAGTAAAAGTGGTTCCTTGATACTGTTTATGAAAGACATAGAGAAGTCTATGGTGGGGAATCAGGATGCATATGTGGCCTTCAAGAGTAAGTTCGACAATTTACCAGGGAATGTTGTTGTAATTGGCTCCCATACACAGGCGGACAGCCGTAAAGAGAAGTCTCATCCTGGAGGTCTTCTATTTACGAAATTTGGAAGCAATCACACAGCTTTACTTGATCTTGCTTTCCCGGATAGCTTTGGTAGGCTGCATGAGCGGGGGAAAGAGACGCCCAAAACGATGAAGCAACTTTCTCGACTTTTCCCTAACAAAGTGGGAATACAGCTGCCCCAGGATGAAGCTTTACTTTTGGACTGGAAGCAGCAGTTGGAGCGTGATATTGAAACTTTAAAAGCACAGGCCAACATTGTTAGCTTTCGCTCGGTGCTCGGTCGGATTGGCCTGGAATGCCCTGATCTTGAAAGTCTTTGCATCAATGATCAGGCTCTTACAACTGAAAATGTGGAGAAAATAGTAGGCTGGGCTTTAAGTCACCACTTGATGCATTATTCAGAAGGTTTGGCCAGAGATGCTAAGCTTGCGATTTCTACTGAAAGTATAAGGTATGGTTTGAACATTTTACTAGGCGTTCAAAACGAAAGCAAGAGCTTGAAGAAATCACTCAAGGATGTCGTAACGGAGAATGAATTTGAGAAGAAACTTCTTGCGGATGTTATTCCTCCAAATGACATCGGGGTCACATTTGATGACATAGGAGCCTTAGAAAATGTCAAGGATACCTTGAAGGAGCTGGTGATGCTTCCTCTTCAGAGGCCGGAATTGTTTTTGAAAGGACAGCTGACTAAGCCATGCAAGGGAATTTTACTGTTTGGGCCTCCTGGCACTGGAAAAACAATGTTAGCCAAGGCTGTCGCGACTGAGGCGGGTGCAAATTTTATCAATATATCAATGTCAAGCATCACTTCAAAGTGGTTTGGTGAAGGCGAGAAATATGTTAAAGCAGTGTTCTCTTTAGCTAGTAAAATTGCTCCTAGTGTTGTTTTTGTTGACGAGGTTGATAGCATGTTGGGTAGACGTGAAAATCCAGGAGAACATGAAGCTATGCGCAAAATGAAGAATGAATTTATGGTGAATTGGGATGGTCTTCGTACAAAGGATAAAGAGCGGGTATTGGTACTTGCTGCCACCAATAGGCCTTTTGATCTTGACGAGGCTGTTATAAGAAGGTTACCCCGGAGGTTGATGGTTAATTTGCCTGATGCCTCCAACAGAGAGAAAATCCTTAAAGTTATCTTAGCCAAAGAAGAATTGTCACCCGATGTGGAGTTAGAGGCAATTGCAAATATGACTGATGGGTATTCTGGAAGTGACCTTAAGAATCTGTGTGTGACTGCAGCTCATTTTCCGATACGCGAAATACTTGAGAGAGAAAAGAAGGAGAGAGCTTCAGCATTGGCGGAAAACAGACCATTGCCTGGACTTCATAACAGCACTGATGTACGCTCTCTGAAGATGGATGATTTTAAGTGTGCGCATGAACAAGTATGTGCAAGCGTTTCATCGGAGTCTACAAATATGAATGAGCTCCTCCAGTGGAATGATTTATATGGAGAAGGTGGCTCCAGGAAAAAGACGTCTCTCAGCTACTTCATGTAGAGAACGTATGTTTGTGTACAGCGATCCA
TGTTACAGATGTTTATTCACCTCTCTCTACCTGGCAGAGTCGGGAGTCGGGACACCATTGATTATGGAATTCTATCGCAGGTACTGAGCTCGGTGTACCATATTATCATAGGTTTTGGAATCATTTACCATTTTAGGGAGGTTTTACAATATTTATCAAGCAGGTTTTGTTTGACGGAAGCCGTCTTCTTGTTAATCTATCTAGTTTTGAATTCCTTCTCTTTCCCCTTTTCTTGTCTCGTCTGTAGCATGTAAATTCTCATTTTGATCAATTGAATAAGCATTCCCCTCTTTTTCTCCC\n>XR_004155863.1 PREDICTED: Punica granatum putative leucine-rich repeat receptor-like protein kinase At2g19210 (LOC116201365), transcript variant X2, misc_RNA \nGAACTAAACTTCTATAAGTGCCCATATTATTTGTATCAAATCTCTGTTGTGTATTATAATTAGCATGAAGATGTTATTCGTGATACTTGTATGTATCAGTCTCAATGCTATCGCTCAAGCACAAGAAAATCCAGGTTTCATAAGCATCGACTGTGGAGCACCTAATGGTTATCACGATGACAACCTTGACATTTACTACACGATAGACACGGGATTTGTTGAGTCAGGGAAAAACATGCAGATTTCTTCGAAGTACATCGATCGAGTTCCTATGCAACAGCTAATGAACTTGAGATGCTTTCCTAATGGAACAAGGAACTGTTACACGCTAAGGCCAACGCAAGGGAAGAGCAAGAGATATCTAATCCGGGCATCTTTCTTTTACGGAAATTATGATACTCTCTCCCAAACCCCAACATTCGACCTCTATATCGATGTAAACTACTGGATCACCGTGAAAGATCCATCAAACTACACGTACGAAGAGATTATATACACTACCTCAAGAGATTATATACAAGTGTGTCTTGTGAATCGGGGCTCGGGGGTTCCCTTCATTTCAGCACTAGAGCTACGAACCCTCGACAATTCCACTTATGATACTTCAGCTGGAGCACTACAGACCTCATGGCGATATAATATTGGGTCCAAAACCACATACAGGCATCCGCAAGATGACTATGACCGGATTTGGGAAGGCCAGAGTTTCAATTGGACTACAATCACAAACAAGACGAATGTTGACAGCTTAAGAAGCACAAACAATGCGTATAAAGTTCCACTGGAAGTCCTAATGACTGGCCAACAATCCCTGGATAATATTTCAAGCAGCCTGAAATTATTCTGGATTTCTTCTGAACCCACATATAAATGGTACTTGTTCTTTCACTTCGCCGAGTTTCAGGTATTGCGATCCGGACAGCTGAGGCGATTCAGAGTTTACGTCAATGATAACAAACTGATAACAACCGTTACACCTGAGTACCTCAAACCTGTGACCGTGTCCACGTTTCCCTTTGATGGGACCGTCCTGAACTTCTCAATCACCTCTGTGACTTCTCAATCAAGCCTCCCGCCGTTCCTCAATGCTGTCGAGTGGTTTCGTTCCATTGACCTTCCACATTCTACCACGGACTTAAATGATGTTACCGGTATTAACAGCATCAAGACGATTTACGGAGTGGCTATAGATGACTGGCAGGGCGATCCATGTGTTCCAGTGTCTTTTATTTGGAGTTTTTTGAACTGCAGCGAAGACGATATTCCGAGGATCATCTCCTTGAACTTGAGCTCTAGCAATTTGAAGGGGAGCATTGCTACCTCATTCTCCAGTCTCACGGCATTAGTCTCCCTGGATCTATCGTTCAATGAACTAAGTGGACAGATACCTGATTTTTTTGCTGACATGCCGAATTTGAGGATCTTAAACTTAAGTGGAAACAACCTCAACGGTTCAATTCCTGCAGTTCTTGAAAAGAAGATGGCGGATAAGACATTGCAATTAAGCTTGGATGGTAATCCGAATCTTTGTCGACAA
GACTCTAATTGCAATCAAGACGGCCGCAAGAAGAAAAATACCGTTGTCCCAGCTGTTGCTGCTACTGTGGGCTCATTGGCTCTGGTATTCTTTCTCATTTGTGCCATCGTTGTCATTCGCAGACGTAGGAAGAAGATAGAAGAAATTAATACTGGATCAATGGAAGTCACTGCATCGAAGGAACATAGACCTAAGGAGGTATCCGAGCCTAGTACTGGTACCGGATTTAACGAGGGGCGACTAGTAGTTGGAAAGAACCGACCATTTACATCTGCTGAAGTTTTGAGTATCACCGGGAACTTCAGAACAGTTATCGGGGAAGGTGGATTCGGAAACGTGTACCTTGGAACTCTCGATGATGGTTGGAAAGTCGCAGTGAAAGTGCTCTCTCAGTCATCAAAGCAGGGCTACAAGGAATTCCAAGCAGAGGCACAGCTTCTGATGATTGTTCATCACAAAAATCTTGTTTCTCTCATCGGGTATTGCGAAGATTTCGATAACATGGCCCTGATTTATGAATTTATGCCCAATGGAAACTTAAGGCAGCATCTGGCAGGAAACACATCTAATGTCATAAGTTGGAGTCAGAGACTGCAAATTGCAATAGACGCAGCACAGGTTTTGGTCAATCTTTTGATGCAGGGCTGGAGTATTTGCATAATGGTTGCCGACCTTCGATCATTCACAGAGATCTCAAGACTTCAAATATCCTTCTAAATGAGAACATGCAAGCCAAAATAGCTGATTTTGGTCTCTCTCGGGTTTTCATGATGGAAGATGGCTGTCAAATTTCGACTCAACCTGCCGGCACACCCGGTTACCTTGACCCGGTGTTCAACACGGGTGGAAACTTGAACAAGAAAAGTGATGTGTACAGCTTCGGGATCATTCTGTTCGAGCTGATTACCGGACAGCCTGCTATTCTAAGAAGTCCGACGGGCAGTATTCACATCGTTAAATGGGTGACTCCACTC\n>XM_030225762.1 PREDICTED: Drosophila hydei latent-transforming growth factor beta-binding protein 2 (LOC111599265), partial mRNA 
\nCAATCGCGTAACGATCAGTGCACAGCAAACGAGATCCAGCTCGATCCCCACGACTGTGCTGCCTATTTCCTATGTGTGAAGGGAGAATTTGTGAGTCAGAAATGTGTTCGTGGCTTTTACTTCGATGCCGCAATCCAGGCGTGTGTGGGCGACACCAAAGAGTCGTCTAACAAGCGGACTGCGAAAATGGCTCACAATAGAAACCTCAAATTTGTGTATCTCCTTTCCATTGCTGTGACCCTGGTCTTTGGAGCTGCAGCCGATGATGATTGCTGTCAACCCGGCGATACCAAGCCCGTCGAAGGCGATTGCACCCAGTACTACGGCTGCTGTACGGGAAAGTTCGTTCTGAAGTCGTGCCCTAGCGGACAATACTGGAATTCAAACAACCAACAATGTGAACCTGACAACGGCCAATGCGTTCCTGTTGAGCCCGGTGCGCCCGGTGCGCCCTGTGCGCCCGGTGAGCCCGGTGCGCCCGGTGCATGCACAGAAGGAGATACCAAAGTGGATGCCTCCGATTGTACCAAATATCAAGTCTGCAAGAACGGAGAGTATGTCTCGGCCTCCTGTAACTCTGGTTACTACTGGAACTCGGCTAACAGCCAGTGCGAGCAGGATAACGGCCAGTGCGTTTCAGTAACATGTAAGGACGGAGAGCTTAGTGCAGACTCATCTGACTGCGCAGGCTACTTCATATGTCTGGATAATAAGTTAGTCAAGAGGAAGTGCGCTAGTCAAACCTATTTCGATGCCAGTCTGGAGACTTGCGTTATCGACACTGAGGGTGTTTGCATACCCAAGGTTTGCGATTCCGAATGCTGCGATAAGCCCAACAATTGGATTGGACCCGTCGATAAGAACTGCTCCGCATTCATTCACTGCCTTTACGGCCAACTGATTCAACAGACCTGTCCCAACAATCTGCAGTTCAACAACATTACCAAGCAGTGCGACTTCCCCGATGTTGTCCAATGCGATGACGGCAGCCCACCGCCAAGCGGACCCACAGCCGGTCCCTCGGGCACCTACTGTGAGAGCAAGGGTCGCTGCGTCGGACAACGTGATGGCGCCATGTTCGCCGATGCCAAGTCTGCCTCCAGTGGTGGCTACATCGTATGCCAATGTGAATGTGAGATTAACTTCAACTGTGTCGCCGGCTTAGTTTTCAACGAGAAGATTCGCACCTGCGATTGGCCATAA\n>XM_035486762.1 Talaromyces rugulosus uncharacterized protein (TRUGW13939_03582), partial mRNA 
\nATGACACCCAAGCGAGTGAGAACTGTCGAGGGCTCATGCTGGCTATGCAAAGATCGCCGGGTTCTATGCGACTTGCAGCAGCCTCGTTGCTCCCGATGCGTGTCCAAAGGTGAACCATGTGAATACGGTGAGGTACGCTTGCGCTGGTGCAATGGCGTAGCGGCTCGAGGCCGATATGCTGGTCAGAATGTACCTGTGTCAATACCATCAGCCAGGAGGGATTCTTCTAGAGGGTCGTTAGGAAAGACACCGCCGTTGCAATCAACCGAAAACGATCAAGGTGATGGGGAAGTCCCTAAAGTCGAAACATTGTCGCCAGTAAGCTCCAATGCACTACAGATATCGGGGCTTTCATCACAAGTGACAGCAGAGCAGCTATTGCTCTATTTTTCCAACGTCGTGGTCGACCGTTTCAGCCTTTCCACGGATCGGATATCGATTAATCTCCCATCAGTATGCGAAGAGCCTGCTCTTCGTGACTCGATGAGCGCCGTTGCAAATGCACATCATGTTCTTTCCCTGTATCCTGGTCGTCCAGGTGTAGGGCTCGCCAAGAAGAGGGCACGTTGGAGCGCTATTCACAATTTCCGAGCTCGGCTGGAATGCCCGAGCATGGAGTCGAGGACACCGGGCCTCGATCTGTTCATGGCCAACGTCCTGCTCTGTATACTAGACGGAGTCATTGACCCGCATGACGAAAGCGCAGCTACTCATATGCATTATCGCGGCGGACGAGCAATCCTCAGTCAATGGAAGCTTCAGAAACAGTTATATCAGGAAAAACGCGGCTTGCCGGCTTTGATGTTGTCTGTTTTTGCAACCATGGATTTGACATACTCGATGCTTAGCGGTGAAGAACAGTATTTTCAGCATACTATCTGGAATGGCTTTGCTGAGAGTGATGGCTGGTGGGGGACTCTTCCTCAAGATGATCCCTTTTTGGAAGTTATGTGTACTCTATCGCGTCTGACTCGACTGGGGTCTCTCGTAAGCAAGGGCCTTGATTTTCCTGATGAGGCCCTCAACGAGGAAGTGAGTACTCTCCTGACGACTCTGCAGGGCCCTCCCCAGATTCCGTATGATATTTCTTGTCCCGAAAGAATGGACTTGGAAGACCAACCGGCTCCTCTATTGCTTTTTACCTCGCCAGGCCACCACGATTTAGATCACAACCAGTCATGGATTGTCTTCTGCAATGCATACCGGATTGCCGGTCTAATATACGCGTACCGCGTCTTTTATCGGCTAAATTTCGGCGATCCCTTGATACAACAGGCCGTGAACCTGGGTATACAAGCCGTCTGCAAAACACGACTAACAGGCAAACTATCACACTGCTTGCTCTTCCCAGCGCTCGTAATCGGAAGCCATTGCCAATCCAACGAAGACCAGGCAGCGATACTCGCGACGATCCAATCAACCGCGGCATTCTTGCATTTTGGGTCGCTTCGAGTTATGGAGAGCTTTTTGCATCGAGTGTGGGAGCGAGCTCCAGCGGCGGAGACTTGGTGGCAGTTTTTTGAGCCGATTTCCAAGAAGGCCTTTTTATTTTGA\n>XM_012357333.1 Saprolegnia parasitica CBS 223.65 hypothetical protein partial mRNA \nATGGGCATCAAGATCCGCAACGACACGCGCCACGACGTCCTCGTCATTGTCTTCACGTACTTCACGACGCCGTTCCCGACGCTGTACTACCGCAAGACACTGCTCATCCCGGCCGGCGAGCGCTACAACTGCCCGACGTGGCAGAGCGCTGTCAAGATCTACGCGTGGGAAGCCGACAGTAGCAACGG\n>XM_021677838.1 PREDICTED: Neomonachus schauinslandi translation initiation factor IF-2-like (LOC110569879), mRNA 
\nATGGCGTCGCCGCGGAGTCCGGCACACGCATCCATTTTATCAGGAGCCCGGCGCGGCGGCGCTCAGGAACGAAGGCTGCGGTGTGGAAGGCCGGGCCGGCTCCGCGCTCAGCGAGCGGAGACCCCGCGGCCGCCGCAGGTGCAAGCGCCGCAAGCCCCGCCCCGCCCGCCGCCCCAGCCAACCGCGGGCGGCGGGGGCGGGGCCTGGACCCGCCACACCTGGGGCGGCCGCCCGGCCGTGTCCCAACCACGCTGCCCACAGCCCGCGGCCCGCCGCTCAAGCCCGCCGCCCCGCCCCACCCGCGTCCCCGGCCCCTGCCTGCCCCGCGACCGGTGCGAGGCCCGCCCTGCCCACCCGGCCGGAGTCGTCCCCTCAGTCCCGCCGCCGCGCCGCCCCAGCCGTTTCCACAACGGCTCCGCCTCAACCGTCGGGAGGCTGGCCGTCCGCCCGCTCGCCCACCCGCCGCTGCTGGAGACCGGCCCGGCGTCACGGCCCCCCTCCACGCAGCCCCGCTGTCAGGGAGGCCCGGCCCGGCGCCCGGCTCTACCTGCGGCTGGAGGAAGCCTCCCCGTCCGGGCCCGGGAGCCGCCGCCACGGCCGCCGACTCGAGTCGCGTCTCTGCTCTCCGCGACCGCCGCGGCTCTTCAGGCGGCCGACGGTGGGCGGGAAGCGCCCGCCCAATCAGCGCCGCGTGCGTTCGGAATCGCGTCCAATCAGCGCAGCTCGCAGTCCAGGCTCCGCCCCTCGTGCTCGCCGGCGACGCAGGGGTCGCCAGAGGCCGAAGCCAGGGGCGCCGCGGTGGGCGCGGCTCGGGGCCGGGCCGGGTAG\n>MF950468.1 Uncultured bacterium clone OTU1501_Control_T4.8037 16S ribosomal RNA gene, partial sequence \nATACGGGAGGCAGCAGTGGGGAATCTTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAGCGATGAAGCCCTTCGGGGTGTAAAGCTCTTTCGGCGGGGACGATAATGACGGTACCCGCAGAAGCAGCTGCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGCAGCGAGCGTTGTTCGGAGTTACTGGGCGTAAAGGGTGTGTAGGCGGTTCCTTAAGTTTGGTGTGAAATCTCCCGGCTCAACTGGGAGGGTGCGCCGGATACTGAGGAGCTAGAGTGCGGGAGAGGAAAGTGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCTGTGGTGTAGACGGCTTTCTGGACCGTGACTGACGCTGAGACACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGT\n>XM_038920781.1 Brettanomyces nanus uncharacterized protein (FOA43_000450), partial mRNA 
\nATGATGAAAGCTTTAACATATGTCAGACCAGGAGTTATCAAGTACCAGGATGTGGAGAAACCAAAATTACTTCAGCCTACAGATGTGATCGGAAAGACCGTTGTAACAACTATTTGCGGATCGGATCTTCATATCCTTTCAGGTGCTTTCCCAGAGTTCAACAAGTTGGCCGAGAAAAAGGCTGGCCGAGGATTTATCTTGGGTCATGAGGGTATCATCAAGGTGGAGCAAATAGGTTCTGAAGTAAAGAACTTTAAAGTCGGTGATGTGTGCATCGTCTCTTGCATCACTCCTTGTGGTGAATGCTTTTACTGTAAAGAAGGTTGCGAAGCTCATTGTACACAGAACGAGGGAACCTGTGGATGCATCTTGGGTAGTGAGATTGATGGAACTCAAGCTGATTATGTTAGAGTTCCTCTTGCTGACAATTCTTTAATCAAATGCCCGGATAACGTGAAGTTGGAGTCTTTATTAATGCTTAGTGACATTTTACCAACCTCCTACGAACTTGGTGTTCTGGATGGAGGTGTCAAAGAAGGAAGTACCGTTGCCATTGTCGGTATGGGACCTGTTGGGTTGGCTGCTTTGATCAGTGCTAAGGCATTGAATCCAGATTATATTGTTGCTATCGACTTGAACGAATCCAGATTGAAGACTGCCAAAAAATTGGGTGCCGACTACACCTTTAATCCAAGCAAGGATGATGTTGTTAAACTTGTTATGGGGCTTCCTGTGAAACAGGGTAAGCTACCCGGTGTCGATGTGGCCATCGAATGCTGTGGTATTCCGGCAACTTTCGAGATGTGCCAGGATATTGTTGGTATGAACGGTAGAATTGCCAATGTCGGTGTTCACTCTAAGTCATGCAAACTTGCTATGGAAAAGTTATGGGTCATGAATATCAACATAAGTACCGGATTGGTCTGCGGCCATTCTACAAAAGATTTACTCAGGAAAGTTGTATCCGGAGAATTGGATCCTTCGTCTTTGATTACTCATCGCTTCAAACTAAATGAGATCGAAAAGGCTTACGATGTCTTCAGCAATGCTTCTGAGACTGATGCCATTAAGATGCTTCTTATCAACGATTGA\n>MW263500.1 Cortinarius sp. 
PDD 112391 isolate JAC15241 large subunit ribosomal RNA gene, partial sequence \nCATATCAATAAGCGGAGGAAAAGAAACTAACAAGGGATTCCCCCTAGTAACTGCGAGTGAAGCGGGAAAAGCTCAAATTTAAAATCTGGCGGTCTTTGGCTGTCCGAGTTGTAATCTAGAGAAGTGTTATCCGCGCCGGACCGTGTACAAGTCTCCTGGAATGGAGCGTCATAGAGGGTGAGAATCCCGTCTTTGACACGGACTACCGGGGCTTTGTGATGCGCTCTCAAAGAGTCGAGTTGTTTGGGAATGCAGCTCAAAATGGGTGGTAAATTCCATCTAAAGCTAAATATTGGCGAGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGATGAAAAGAACTTTGGAAAGAGAGTTAAACAGTACGTGAAATTGCTGAAAGGGAAACGCTTGAAGTCAGTCGCGTTGTCCAGGGATCAACCTTGCTTTTGCTTGGTGCACTTTCTGGTTGACGGGTCAGCATCAATTTTGACTATTGGAAAAAGATTAGGGGAATGTGGCATCTTTGGATGTGTTATAGCCCTTGGTTGCATACAATGGTTGGGATTGAGGAACTCAGCACGCCGCAAGGCCGGGTTTTTAACCACGTACGTGCTTAGGATGCTGGCATAATGGCTTTAATCGACCCGTCTTGAAACACGGACCAAGGAGTCTAACATGCCTGCGAGTGTTTGGGTGGAAAACTCGAGCGCGTAATGAAAGTGAAAGTTGAGATCCCTGTCGTGGGGAGCATCGACGCCCGGACCAGACCTTTTGTGACGGTTCCGCGGTAGAGCATGTATGTTGGGACCCGAAAGATGGTGAACTATGCCTGAATAGGGTGAAGCCAGAGGAAACTCTGGTGGAGGCTCGTAGCGATTCTGACGTGCAAATCGATCGTCAAATTTGGGTAT\n>MN640403.1 Mycobacterium simiae strain a18 16S-23S ribosomal RNA intergenic spacer and 23S ribosomal RNA gene, partial sequence \nGAATCTTGACTGGGGTGTGAGCCGTGAGGGGTTCTCGTCTGTAGTGGACGAGGGCCGGGTGCACAACAACAGGCAATCGCCAGACACACTATTGGGCCCTGAGACAACACTCGGCCGACTTCGGTTGAAGTGGTGTCCCTCCATCTTGGTGGTGGGGTGTGGTGTTTGAGTATTGAATAGTGGTTGCGAGCATCAGGAGGTACCTCCGTTCTGTTTGAGTATTGGATAGTGGTTGCGAGCATCAGGGTGGTGGGGTGTGGGGTTTGACATCAGAATGGTGAAGGCAATTATCAGGTACCGCCTC\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/pdb_mmcif/5y2e.cif",
    "content": "data_5Y2E\n#\n_entry.id 5Y2E\n#\nloop_\n_chem_comp.formula\n_chem_comp.formula_weight\n_chem_comp.id\n_chem_comp.mon_nstd_flag\n_chem_comp.name\n_chem_comp.pdbx_synonyms\n_chem_comp.type\n\"C3 H7 N O2\"     89.093  ALA y ALANINE         ? \"L-peptide linking\" \n\"C6 H15 N4 O2 1\" 175.209 ARG y ARGININE        ? \"L-peptide linking\" \n\"C4 H7 N O4\"     133.103 ASP y \"ASPARTIC ACID\" ? \"L-peptide linking\" \n\"C5 H10 N2 O3\"   146.144 GLN y GLUTAMINE       ? \"L-peptide linking\" \n\"C5 H9 N O4\"     147.129 GLU y \"GLUTAMIC ACID\" ? \"L-peptide linking\" \n\"C2 H5 N O2\"     75.067  GLY y GLYCINE         ? \"peptide linking\"   \n\"C6 H10 N3 O2 1\" 156.162 HIS y HISTIDINE       ? \"L-peptide linking\" \n\"H2 O\"           18.015  HOH . WATER           ? non-polymer         \n\"C6 H13 N O2\"    131.173 ILE y ISOLEUCINE      ? \"L-peptide linking\" \n\"C6 H13 N O2\"    131.173 LEU y LEUCINE         ? \"L-peptide linking\" \n\"C6 H15 N2 O2 1\" 147.195 LYS y LYSINE          ? \"L-peptide linking\" \n\"C5 H11 N O2 S\"  149.211 MET y METHIONINE      ? \"L-peptide linking\" \n\"C4 H9 N O3\"     119.119 THR y THREONINE       ? \"L-peptide linking\" \n\"C5 H11 N O2\"    117.146 VAL y VALINE          ? 
\"L-peptide linking\" \n#\n_entity.id               1\n_entity.pdbx_description \"Non-structural glycoprotein 4\"\n_entity.type             polymer\n#\n_entity_poly.entity_id      1\n_entity_poly.pdbx_strand_id A\n_entity_poly.type           polypeptide(L)\n#\nloop_\n_entity_poly_seq.entity_id\n_entity_poly_seq.hetero\n_entity_poly_seq.mon_id\n_entity_poly_seq.num\n1 n MET 1  \n1 n ILE 2  \n1 n GLU 3  \n1 n LYS 4  \n1 n GLN 5  \n1 n MET 6  \n1 n ASP 7  \n1 n ARG 8  \n1 n VAL 9  \n1 n VAL 10 \n1 n LYS 11 \n1 n GLU 12 \n1 n MET 13 \n1 n ARG 14 \n1 n ARG 15 \n1 n GLN 16 \n1 n LEU 17 \n1 n GLU 18 \n1 n MET 19 \n1 n ILE 20 \n1 n ASP 21 \n1 n LYS 22 \n1 n LEU 23 \n1 n THR 24 \n1 n THR 25 \n1 n ARG 26 \n1 n GLY 27 \n1 n ILE 28 \n1 n GLU 29 \n1 n GLN 30 \n1 n VAL 31 \n1 n GLU 32 \n1 n LEU 33 \n1 n LEU 34 \n1 n LYS 35 \n1 n ARG 36 \n1 n ILE 37 \n1 n HIS 38 \n1 n ASP 39 \n1 n LYS 40 \n1 n LEU 41 \n1 n MET 42 \n1 n ILE 43 \n1 n ARG 44 \n1 n ALA 45 \n1 n VAL 46 \n1 n ASP 47 \n#\n_exptl.method \"X-RAY DIFFRACTION\"\n#\n_pdbx_audit_revision_history.revision_date 2018-03-14\n#\n_pdbx_database_status.recvd_initial_deposition_date 2018-03-14\n#\nloop_\n_pdbx_poly_seq_scheme.asym_id\n_pdbx_poly_seq_scheme.auth_seq_num\n_pdbx_poly_seq_scheme.entity_id\n_pdbx_poly_seq_scheme.hetero\n_pdbx_poly_seq_scheme.mon_id\n_pdbx_poly_seq_scheme.pdb_ins_code\n_pdbx_poly_seq_scheme.pdb_seq_num\n_pdbx_poly_seq_scheme.pdb_strand_id\n_pdbx_poly_seq_scheme.seq_id\nB 94  1 n MET . 94  A 1  \nB 95  1 n ILE . 95  A 2  \nB 96  1 n GLU . 96  A 3  \nB 97  1 n LYS . 97  A 4  \nB 98  1 n GLN . 98  A 5  \nB 99  1 n MET . 99  A 6  \nB 100 1 n ASP . 100 A 7  \nB 101 1 n ARG . 101 A 8  \nB 102 1 n VAL . 102 A 9  \nB 103 1 n VAL . 103 A 10 \nB 104 1 n LYS . 104 A 11 \nB 105 1 n GLU . 105 A 12 \nB 106 1 n MET . 106 A 13 \nB 107 1 n ARG . 107 A 14 \nB 108 1 n ARG . 108 A 15 \nB 109 1 n GLN . 109 A 16 \nB 110 1 n LEU . 110 A 17 \nB 111 1 n GLU . 111 A 18 \nB 112 1 n MET . 112 A 19 \nB 113 1 n ILE . 
113 A 20 \nB 114 1 n ASP . 114 A 21 \nB 115 1 n LYS . 115 A 22 \nB 116 1 n LEU . 116 A 23 \nB 117 1 n THR . 117 A 24 \nB 118 1 n THR . 118 A 25 \nB 119 1 n ARG . 119 A 26 \nB 120 1 n GLY . 120 A 27 \nB 121 1 n ILE . 121 A 28 \nB 122 1 n GLU . 122 A 29 \nB 123 1 n GLN . 123 A 30 \nB 124 1 n VAL . 124 A 31 \nB 125 1 n GLU . 125 A 32 \nB 126 1 n LEU . 126 A 33 \nB 127 1 n LEU . 127 A 34 \nB 128 1 n LYS . 128 A 35 \nB 129 1 n ARG . 129 A 36 \nB 130 1 n ILE . 130 A 37 \nB 131 1 n HIS . 131 A 38 \nB 132 1 n ASP . 132 A 39 \nB 133 1 n LYS . 133 A 40 \nB 134 1 n LEU . 134 A 41 \nB 135 1 n MET . 135 A 42 \nB 136 1 n ILE . 136 A 43 \nB 137 1 n ARG . 137 A 44 \nB 138 1 n ALA . 138 A 45 \nB ?   1 n VAL . 139 A 46 \nB ?   1 n ASP . 140 A 47 \n#\n_pdbx_struct_assembly.details            author_and_software_defined_assembly\n_pdbx_struct_assembly.id                 1\n_pdbx_struct_assembly.method_details     PISA\n_pdbx_struct_assembly.oligomeric_count   4\n_pdbx_struct_assembly.oligomeric_details tetrameric\n#\n_pdbx_struct_assembly_gen.assembly_id     1\n_pdbx_struct_assembly_gen.asym_id_list    A,B,C,D,E,F,G\n_pdbx_struct_assembly_gen.oper_expression 1\n#\n_pdbx_struct_oper_list.id                 1\n_pdbx_struct_oper_list.matrix[1][1]       1.0000000000\n_pdbx_struct_oper_list.matrix[1][2]       0.0000000000\n_pdbx_struct_oper_list.matrix[1][3]       0.0000000000\n_pdbx_struct_oper_list.matrix[2][1]       0.0000000000\n_pdbx_struct_oper_list.matrix[2][2]       1.0000000000\n_pdbx_struct_oper_list.matrix[2][3]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][1]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][2]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][3]       1.0000000000\n_pdbx_struct_oper_list.name               1_555\n_pdbx_struct_oper_list.symmetry_operation x,y,z\n_pdbx_struct_oper_list.type               \"identity operation\"\n_pdbx_struct_oper_list.vector[1]          0.0000000000\n_pdbx_struct_oper_list.vector[2]          
0.0000000000\n_pdbx_struct_oper_list.vector[3]          0.0000000000\n#\n_refine.ls_d_res_high 2.70\n#\n_software.classification other\n_software.name           \"DeepMind Structure Class\"\n_software.pdbx_ordinal   1\n_software.version        2.0.0\n#\n_struct_asym.entity_id 1\n_struct_asym.id        B\n#\nloop_\n_atom_site.group_PDB\n_atom_site.id\n_atom_site.type_symbol\n_atom_site.label_atom_id\n_atom_site.label_alt_id\n_atom_site.label_comp_id\n_atom_site.label_asym_id\n_atom_site.label_entity_id\n_atom_site.label_seq_id\n_atom_site.pdbx_PDB_ins_code\n_atom_site.Cartn_x\n_atom_site.Cartn_y\n_atom_site.Cartn_z\n_atom_site.occupancy\n_atom_site.B_iso_or_equiv\n_atom_site.auth_seq_id\n_atom_site.auth_asym_id\n_atom_site.pdbx_PDB_model_num\nATOM 1   N N   . MET B 1 1  ? 2.644   6.839  -46.028 1.00 83.71  94  A 1 \nATOM 2   C CA  . MET B 1 1  ? 1.400   7.612  -45.825 1.00 86.32  94  A 1 \nATOM 3   C C   . MET B 1 1  ? 1.210   7.971  -44.344 1.00 87.15  94  A 1 \nATOM 4   O O   . MET B 1 1  ? 1.479   7.188  -43.421 1.00 80.48  94  A 1 \nATOM 5   C CB  . MET B 1 1  ? 0.170   6.890  -46.382 1.00 88.07  94  A 1 \nATOM 6   C CG  . MET B 1 1  ? -0.124  7.275  -47.840 1.00 91.84  94  A 1 \nATOM 7   S SD  . MET B 1 1  ? -1.789  6.807  -48.325 1.00 103.69 94  A 1 \nATOM 8   C CE  . MET B 1 1  ? -2.264  8.027  -49.569 1.00 97.89  94  A 1 \nATOM 9   N N   . ILE B 1 2  ? 0.696   9.166  -44.185 1.00 87.93  95  A 1 \nATOM 10  C CA  . ILE B 1 2  ? 0.364   9.779  -42.948 1.00 84.67  95  A 1 \nATOM 11  C C   . ILE B 1 2  ? -0.678  8.946  -42.258 1.00 75.98  95  A 1 \nATOM 12  O O   . ILE B 1 2  ? -0.634  8.714  -41.080 1.00 67.98  95  A 1 \nATOM 13  C CB  . ILE B 1 2  ? -0.321  11.082 -43.309 1.00 89.99  95  A 1 \nATOM 14  C CG1 . ILE B 1 2  ? 0.696   12.146 -43.577 1.00 94.59  95  A 1 \nATOM 15  C CG2 . ILE B 1 2  ? -1.197  11.546 -42.182 1.00 92.79  95  A 1 \nATOM 16  C CD1 . ILE B 1 2  ? 1.132   12.780 -42.294 1.00 93.36  95  A 1 \nATOM 17  N N   . GLU B 1 3  ? 
-1.625  8.499  -43.046 1.00 71.66  96  A 1 \nATOM 18  C CA  . GLU B 1 3  ? -2.745  7.716  -42.585 1.00 68.44  96  A 1 \nATOM 19  C C   . GLU B 1 3  ? -2.273  6.463  -41.883 1.00 69.98  96  A 1 \nATOM 20  O O   . GLU B 1 3  ? -2.890  6.024  -40.946 1.00 67.88  96  A 1 \nATOM 21  C CB  . GLU B 1 3  ? -3.613  7.332  -43.745 1.00 73.44  96  A 1 \nATOM 22  C CG  . GLU B 1 3  ? -4.382  8.485  -44.320 1.00 87.42  96  A 1 \nATOM 23  C CD  . GLU B 1 3  ? -3.735  9.039  -45.551 1.00 89.38  96  A 1 \nATOM 24  O OE1 . GLU B 1 3  ? -4.454  9.413  -46.477 1.00 97.81  96  A 1 \nATOM 25  O OE2 . GLU B 1 3  ? -2.511  9.105  -45.593 1.00 88.14  96  A 1 \nATOM 26  N N   . LYS B 1 4  ? -1.212  5.844  -42.364 1.00 71.45  97  A 1 \nATOM 27  C CA  . LYS B 1 4  ? -0.676  4.669  -41.671 1.00 72.76  97  A 1 \nATOM 28  C C   . LYS B 1 4  ? 0.097   5.062  -40.408 1.00 74.11  97  A 1 \nATOM 29  O O   . LYS B 1 4  ? 0.209   4.268  -39.462 1.00 77.84  97  A 1 \nATOM 30  C CB  . LYS B 1 4  ? 0.197   3.807  -42.578 1.00 66.63  97  A 1 \nATOM 31  N N   . GLN B 1 5  ? 0.624   6.270  -40.364 1.00 72.03  98  A 1 \nATOM 32  C CA  . GLN B 1 5  ? 1.295   6.749  -39.158 1.00 65.60  98  A 1 \nATOM 33  C C   . GLN B 1 5  ? 0.255   7.097  -38.099 1.00 58.64  98  A 1 \nATOM 34  O O   . GLN B 1 5  ? 0.462   6.888  -36.942 1.00 52.26  98  A 1 \nATOM 35  C CB  . GLN B 1 5  ? 2.143   7.976  -39.487 1.00 63.76  98  A 1 \nATOM 36  N N   . MET B 1 6  ? -0.861  7.648  -38.542 1.00 49.04  99  A 1 \nATOM 37  C CA  . MET B 1 6  ? -1.953  7.954  -37.679 1.00 45.66  99  A 1 \nATOM 38  C C   . MET B 1 6  ? -2.486  6.679  -37.100 1.00 50.63  99  A 1 \nATOM 39  O O   . MET B 1 6  ? -2.882  6.643  -35.948 1.00 50.11  99  A 1 \nATOM 40  C CB  . MET B 1 6  ? -3.050  8.640  -38.449 1.00 42.97  99  A 1 \nATOM 41  C CG  . MET B 1 6  ? -4.395  8.703  -37.753 1.00 42.67  99  A 1 \nATOM 42  S SD  . MET B 1 6  ? -5.430  9.916  -38.524 1.00 47.21  99  A 1 \nATOM 43  C CE  . MET B 1 6  ? 
-6.803  9.938  -37.397 1.00 48.85  99  A 1 \nATOM 44  N N   . ASP B 1 7  ? -2.531  5.622  -37.894 1.00 56.67  100 A 1 \nATOM 45  C CA  . ASP B 1 7  ? -3.070  4.383  -37.401 1.00 55.17  100 A 1 \nATOM 46  C C   . ASP B 1 7  ? -2.223  3.846  -36.257 1.00 53.54  100 A 1 \nATOM 47  O O   . ASP B 1 7  ? -2.785  3.365  -35.256 1.00 47.69  100 A 1 \nATOM 48  C CB  . ASP B 1 7  ? -3.067  3.354  -38.520 1.00 57.94  100 A 1 \nATOM 49  C CG  . ASP B 1 7  ? -3.936  2.164  -38.236 1.00 62.42  100 A 1 \nATOM 50  O OD1 . ASP B 1 7  ? -5.111  2.416  -37.949 1.00 67.59  100 A 1 \nATOM 51  O OD2 . ASP B 1 7  ? -3.401  1.020  -38.206 1.00 61.64  100 A 1 \nATOM 52  N N   . ARG B 1 8  ? -0.900  3.909  -36.428 1.00 54.78  101 A 1 \nATOM 53  C CA  . ARG B 1 8  ? -0.002  3.384  -35.432 1.00 61.23  101 A 1 \nATOM 54  C C   . ARG B 1 8  ? -0.168  4.177  -34.127 1.00 63.20  101 A 1 \nATOM 55  O O   . ARG B 1 8  ? -0.017  3.620  -33.077 1.00 67.94  101 A 1 \nATOM 56  C CB  . ARG B 1 8  ? 1.484   3.327  -35.943 1.00 64.73  101 A 1 \nATOM 57  C CG  . ARG B 1 8  ? 2.403   4.541  -35.635 1.00 73.16  101 A 1 \nATOM 58  N N   . VAL B 1 9  ? -0.406  5.483  -34.222 1.00 63.14  102 A 1 \nATOM 59  C CA  . VAL B 1 9  ? -0.546  6.334  -33.061 1.00 59.81  102 A 1 \nATOM 60  C C   . VAL B 1 9  ? -1.853  6.121  -32.347 1.00 55.82  102 A 1 \nATOM 61  O O   . VAL B 1 9  ? -1.880  6.066  -31.150 1.00 48.46  102 A 1 \nATOM 62  C CB  . VAL B 1 9  ? -0.421  7.813  -33.454 1.00 60.39  102 A 1 \nATOM 63  C CG1 . VAL B 1 9  ? -0.731  8.703  -32.272 1.00 60.03  102 A 1 \nATOM 64  C CG2 . VAL B 1 9  ? 0.994   8.091  -33.943 1.00 61.68  102 A 1 \nATOM 65  N N   . VAL B 1 10 ? -2.941  6.014  -33.079 1.00 56.18  103 A 1 \nATOM 66  C CA  . VAL B 1 10 ? -4.231  5.743  -32.481 1.00 53.53  103 A 1 \nATOM 67  C C   . VAL B 1 10 ? -4.236  4.419  -31.704 1.00 52.90  103 A 1 \nATOM 68  O O   . VAL B 1 10 ? -4.772  4.355  -30.607 1.00 49.99  103 A 1 \nATOM 69  C CB  . VAL B 1 10 ? 
-5.317  5.742  -33.553 1.00 51.75  103 A 1 \nATOM 70  C CG1 . VAL B 1 10 ? -6.606  5.137  -33.045 1.00 52.18  103 A 1 \nATOM 71  C CG2 . VAL B 1 10 ? -5.610  7.153  -33.983 1.00 52.67  103 A 1 \nATOM 72  N N   . LYS B 1 11 ? -3.601  3.402  -32.243 1.00 55.55  104 A 1 \nATOM 73  C CA  . LYS B 1 11 ? -3.521  2.104  -31.626 1.00 56.87  104 A 1 \nATOM 74  C C   . LYS B 1 11 ? -2.709  2.164  -30.350 1.00 60.76  104 A 1 \nATOM 75  O O   . LYS B 1 11 ? -2.986  1.464  -29.399 1.00 58.80  104 A 1 \nATOM 76  C CB  . LYS B 1 11 ? -2.837  1.155  -32.582 1.00 60.72  104 A 1 \nATOM 77  C CG  . LYS B 1 11 ? -3.729  0.487  -33.601 1.00 72.80  104 A 1 \nATOM 78  C CD  . LYS B 1 11 ? -2.915  -0.472 -34.451 1.00 79.85  104 A 1 \nATOM 79  C CE  . LYS B 1 11 ? -3.664  -0.963 -35.666 1.00 84.90  104 A 1 \nATOM 80  N NZ  . LYS B 1 11 ? -5.110  -0.693 -35.513 1.00 94.50  104 A 1 \nATOM 81  N N   . GLU B 1 12 ? -1.674  2.982  -30.369 1.00 56.70  105 A 1 \nATOM 82  C CA  . GLU B 1 12 ? -0.798  3.204  -29.249 1.00 54.71  105 A 1 \nATOM 83  C C   . GLU B 1 12 ? -1.507  3.946  -28.155 1.00 52.45  105 A 1 \nATOM 84  O O   . GLU B 1 12 ? -1.387  3.608  -27.007 1.00 51.88  105 A 1 \nATOM 85  C CB  . GLU B 1 12 ? 0.404   4.036  -29.667 1.00 60.63  105 A 1 \nATOM 86  C CG  . GLU B 1 12 ? 1.418   4.261  -28.569 1.00 71.75  105 A 1 \nATOM 87  C CD  . GLU B 1 12 ? 2.100   2.985  -28.105 1.00 83.66  105 A 1 \nATOM 88  O OE1 . GLU B 1 12 ? 1.973   1.951  -28.793 1.00 97.71  105 A 1 \nATOM 89  O OE2 . GLU B 1 12 ? 2.729   3.008  -27.039 1.00 91.62  105 A 1 \nATOM 90  N N   . MET B 1 13 ? -2.250  4.972  -28.495 1.00 50.99  106 A 1 \nATOM 91  C CA  . MET B 1 13 ? -2.993  5.703  -27.508 1.00 53.07  106 A 1 \nATOM 92  C C   . MET B 1 13 ? -4.045  4.874  -26.849 1.00 51.54  106 A 1 \nATOM 93  O O   . MET B 1 13 ? -4.220  4.974  -25.651 1.00 48.88  106 A 1 \nATOM 94  C CB  . MET B 1 13 ? -3.640  6.915  -28.107 1.00 61.60  106 A 1 \nATOM 95  C CG  . MET B 1 13 ? 
-2.651  8.032  -28.402 1.00 65.35  106 A 1 \nATOM 96  S SD  . MET B 1 13 ? -3.551  9.590  -28.498 1.00 76.88  106 A 1 \nATOM 97  C CE  . MET B 1 13 ? -3.620  9.931  -26.737 1.00 76.03  106 A 1 \nATOM 98  N N   . ARG B 1 14 ? -4.714  4.016  -27.571 1.00 53.52  107 A 1 \nATOM 99  C CA  . ARG B 1 14 ? -5.703  3.187  -26.952 1.00 50.53  107 A 1 \nATOM 100 C C   . ARG B 1 14 ? -5.040  2.268  -25.975 1.00 51.01  107 A 1 \nATOM 101 O O   . ARG B 1 14 ? -5.527  2.040  -24.903 1.00 48.89  107 A 1 \nATOM 102 C CB  . ARG B 1 14 ? -6.358  2.367  -28.011 1.00 54.79  107 A 1 \nATOM 103 C CG  . ARG B 1 14 ? -7.580  1.648  -27.566 1.00 60.71  107 A 1 \nATOM 104 C CD  . ARG B 1 14 ? -7.895  0.586  -28.570 1.00 70.83  107 A 1 \nATOM 105 N NE  . ARG B 1 14 ? -8.689  1.116  -29.658 1.00 78.79  107 A 1 \nATOM 106 C CZ  . ARG B 1 14 ? -8.278  1.182  -30.911 1.00 81.77  107 A 1 \nATOM 107 N NH1 . ARG B 1 14 ? -7.086  0.746  -31.233 1.00 91.09  107 A 1 \nATOM 108 N NH2 . ARG B 1 14 ? -9.071  1.675  -31.832 1.00 79.36  107 A 1 \nATOM 109 N N   . ARG B 1 15 ? -3.896  1.754  -26.355 1.00 46.73  108 A 1 \nATOM 110 C CA  . ARG B 1 15 ? -3.174  0.827  -25.534 1.00 45.05  108 A 1 \nATOM 111 C C   . ARG B 1 15 ? -2.681  1.503  -24.248 1.00 47.85  108 A 1 \nATOM 112 O O   . ARG B 1 15 ? -2.752  0.930  -23.189 1.00 50.40  108 A 1 \nATOM 113 C CB  . ARG B 1 15 ? -2.063  0.286  -26.404 1.00 50.23  108 A 1 \nATOM 114 C CG  . ARG B 1 15 ? -1.165  -0.750 -25.876 1.00 59.06  108 A 1 \nATOM 115 C CD  . ARG B 1 15 ? -0.358  -1.317 -27.046 1.00 59.59  108 A 1 \nATOM 116 N NE  . ARG B 1 15 ? 0.861   -1.991 -26.583 1.00 65.92  108 A 1 \nATOM 117 N N   . GLN B 1 16 ? -2.221  2.739  -24.349 1.00 49.74  109 A 1 \nATOM 118 C CA  . GLN B 1 16 ? -1.810  3.511  -23.193 1.00 47.85  109 A 1 \nATOM 119 C C   . GLN B 1 16 ? -2.993  3.774  -22.279 1.00 48.41  109 A 1 \nATOM 120 O O   . GLN B 1 16 ? -2.898  3.560  -21.091 1.00 46.33  109 A 1 \nATOM 121 C CB  . GLN B 1 16 ? 
-1.209  4.809  -23.611 1.00 49.18  109 A 1 \nATOM 122 C CG  . GLN B 1 16 ? 0.208   4.681  -24.112 1.00 53.75  109 A 1 \nATOM 123 C CD  . GLN B 1 16 ? 0.618   5.857  -24.974 1.00 61.24  109 A 1 \nATOM 124 O OE1 . GLN B 1 16 ? -0.145  6.791  -25.159 1.00 69.70  109 A 1 \nATOM 125 N NE2 . GLN B 1 16 ? 1.786   5.782  -25.546 1.00 63.00  109 A 1 \nATOM 126 N N   . LEU B 1 17 ? -4.098  4.266  -22.817 1.00 45.61  110 A 1 \nATOM 127 C CA  . LEU B 1 17 ? -5.278  4.506  -22.010 1.00 41.80  110 A 1 \nATOM 128 C C   . LEU B 1 17 ? -5.848  3.244  -21.329 1.00 44.01  110 A 1 \nATOM 129 O O   . LEU B 1 17 ? -6.378  3.314  -20.232 1.00 49.63  110 A 1 \nATOM 130 C CB  . LEU B 1 17 ? -6.380  5.133  -22.818 1.00 41.83  110 A 1 \nATOM 131 C CG  . LEU B 1 17 ? -6.545  6.610  -23.075 1.00 44.57  110 A 1 \nATOM 132 C CD1 . LEU B 1 17 ? -6.481  7.448  -21.815 1.00 46.53  110 A 1 \nATOM 133 C CD2 . LEU B 1 17 ? -5.534  7.076  -24.054 1.00 46.70  110 A 1 \nATOM 134 N N   . GLU B 1 18 ? -5.724  2.085  -21.974 1.00 48.92  111 A 1 \nATOM 135 C CA  . GLU B 1 18 ? -6.176  0.854  -21.354 1.00 50.45  111 A 1 \nATOM 136 C C   . GLU B 1 18 ? -5.278  0.446  -20.173 1.00 50.00  111 A 1 \nATOM 137 O O   . GLU B 1 18 ? -5.748  -0.088 -19.155 1.00 52.97  111 A 1 \nATOM 138 C CB  . GLU B 1 18 ? -6.361  -0.236 -22.405 1.00 54.05  111 A 1 \nATOM 139 C CG  . GLU B 1 18 ? -7.693  -0.095 -23.112 1.00 59.57  111 A 1 \nATOM 140 C CD  . GLU B 1 18 ? -7.804  -0.858 -24.438 1.00 68.03  111 A 1 \nATOM 141 O OE1 . GLU B 1 18 ? -6.834  -1.521 -24.893 1.00 73.96  111 A 1 \nATOM 142 O OE2 . GLU B 1 18 ? -8.896  -0.808 -25.069 1.00 73.24  111 A 1 \nATOM 143 N N   . MET B 1 19 ? -4.000  0.760  -20.284 1.00 48.79  112 A 1 \nATOM 144 C CA  . MET B 1 19 ? -3.094  0.512  -19.186 1.00 52.15  112 A 1 \nATOM 145 C C   . MET B 1 19 ? -3.371  1.430  -18.007 1.00 47.91  112 A 1 \nATOM 146 O O   . MET B 1 19 ? -3.429  0.986  -16.872 1.00 45.58  112 A 1 \nATOM 147 C CB  . MET B 1 19 ? 
-1.653  0.667  -19.617 1.00 54.11  112 A 1 \nATOM 148 C CG  . MET B 1 19 ? -1.053  -0.654 -20.052 1.00 58.96  112 A 1 \nATOM 149 S SD  . MET B 1 19 ? 0.471   -0.323 -20.923 1.00 65.09  112 A 1 \nATOM 150 C CE  . MET B 1 19 ? 1.501   -0.237 -19.466 1.00 67.56  112 A 1 \nATOM 151 N N   . ILE B 1 20 ? -3.541  2.711  -18.297 1.00 43.25  113 A 1 \nATOM 152 C CA  . ILE B 1 20 ? -3.900  3.677  -17.287 1.00 40.09  113 A 1 \nATOM 153 C C   . ILE B 1 20 ? -5.165  3.240  -16.596 1.00 40.28  113 A 1 \nATOM 154 O O   . ILE B 1 20 ? -5.297  3.383  -15.395 1.00 41.67  113 A 1 \nATOM 155 C CB  . ILE B 1 20 ? -4.079  5.077  -17.885 1.00 41.26  113 A 1 \nATOM 156 C CG1 . ILE B 1 20 ? -2.700  5.633  -18.275 1.00 39.56  113 A 1 \nATOM 157 C CG2 . ILE B 1 20 ? -4.715  6.029  -16.880 1.00 44.72  113 A 1 \nATOM 158 C CD1 . ILE B 1 20 ? -2.722  6.963  -19.009 1.00 37.40  113 A 1 \nATOM 159 N N   . ASP B 1 21 ? -6.096  2.680  -17.346 1.00 41.39  114 A 1 \nATOM 160 C CA  . ASP B 1 21 ? -7.302  2.201  -16.728 1.00 46.35  114 A 1 \nATOM 161 C C   . ASP B 1 21 ? -7.074  1.044  -15.762 1.00 45.76  114 A 1 \nATOM 162 O O   . ASP B 1 21 ? -7.662  1.035  -14.682 1.00 43.56  114 A 1 \nATOM 163 C CB  . ASP B 1 21 ? -8.272  1.734  -17.759 1.00 51.71  114 A 1 \nATOM 164 C CG  . ASP B 1 21 ? -9.647  1.640  -17.208 1.00 60.74  114 A 1 \nATOM 165 O OD1 . ASP B 1 21 ? -10.153 2.682  -16.742 1.00 68.50  114 A 1 \nATOM 166 O OD2 . ASP B 1 21 ? -10.199 0.528  -17.210 1.00 73.36  114 A 1 \nATOM 167 N N   . LYS B 1 22 ? -6.258  0.070  -16.178 1.00 47.51  115 A 1 \nATOM 168 C CA  . LYS B 1 22 ? -5.942  -1.062 -15.321 1.00 50.59  115 A 1 \nATOM 169 C C   . LYS B 1 22 ? -5.255  -0.563 -14.028 1.00 52.11  115 A 1 \nATOM 170 O O   . LYS B 1 22 ? -5.648  -0.941 -12.919 1.00 55.27  115 A 1 \nATOM 171 C CB  . LYS B 1 22 ? -5.085  -2.111 -16.025 1.00 52.86  115 A 1 \nATOM 172 C CG  . LYS B 1 22 ? -5.829  -3.010 -17.008 1.00 57.80  115 A 1 \nATOM 173 N N   . LEU B 1 23 ? 
-4.266  0.312  -14.176 1.00 48.62  116 A 1 \nATOM 174 C CA  . LEU B 1 23 ? -3.594  0.880  -13.039 1.00 44.80  116 A 1 \nATOM 175 C C   . LEU B 1 23 ? -4.511  1.665  -12.106 1.00 44.04  116 A 1 \nATOM 176 O O   . LEU B 1 23 ? -4.412  1.565  -10.897 1.00 41.22  116 A 1 \nATOM 177 C CB  . LEU B 1 23 ? -2.492  1.781  -13.511 1.00 43.26  116 A 1 \nATOM 178 C CG  . LEU B 1 23 ? -1.353  1.039  -14.177 1.00 45.18  116 A 1 \nATOM 179 C CD1 . LEU B 1 23 ? -0.449  2.064  -14.839 1.00 45.01  116 A 1 \nATOM 180 C CD2 . LEU B 1 23 ? -0.582  0.210  -13.156 1.00 45.90  116 A 1 \nATOM 181 N N   . THR B 1 24 ? -5.402  2.445  -12.674 1.00 49.17  117 A 1 \nATOM 182 C CA  . THR B 1 24 ? -6.382  3.155  -11.886 1.00 49.60  117 A 1 \nATOM 183 C C   . THR B 1 24 ? -7.250  2.198  -11.085 1.00 51.60  117 A 1 \nATOM 184 O O   . THR B 1 24 ? -7.503  2.441  -9.918  1.00 50.82  117 A 1 \nATOM 185 C CB  . THR B 1 24 ? -7.248  4.024  -12.811 1.00 54.67  117 A 1 \nATOM 186 O OG1 . THR B 1 24 ? -6.463  5.126  -13.253 1.00 58.01  117 A 1 \nATOM 187 C CG2 . THR B 1 24 ? -8.464  4.559  -12.141 1.00 57.77  117 A 1 \nATOM 188 N N   . THR B 1 25 ? -7.718  1.116  -11.704 1.00 53.09  118 A 1 \nATOM 189 C CA  . THR B 1 25 ? -8.495  0.117  -10.981 1.00 50.55  118 A 1 \nATOM 190 C C   . THR B 1 25 ? -7.709  -0.503 -9.820  1.00 49.50  118 A 1 \nATOM 191 O O   . THR B 1 25 ? -8.267  -0.695 -8.720  1.00 50.25  118 A 1 \nATOM 192 C CB  . THR B 1 25 ? -8.933  -0.983 -11.947 1.00 53.52  118 A 1 \nATOM 193 O OG1 . THR B 1 25 ? -9.796  -0.396 -12.916 1.00 60.17  118 A 1 \nATOM 194 C CG2 . THR B 1 25 ? -9.619  -2.127 -11.260 1.00 58.18  118 A 1 \nATOM 195 N N   . ARG B 1 26 ? -6.447  -0.762 -10.054 1.00 48.62  119 A 1 \nATOM 196 C CA  . ARG B 1 26 ? -5.575  -1.319 -9.076  1.00 52.29  119 A 1 \nATOM 197 C C   . ARG B 1 26 ? -5.362  -0.349 -7.936  1.00 56.15  119 A 1 \nATOM 198 O O   . ARG B 1 26 ? -5.203  -0.758 -6.818  1.00 60.08  119 A 1 \nATOM 199 C CB  . ARG B 1 26 ? 
-4.262  -1.609 -9.738  1.00 57.25  119 A 1 \nATOM 200 C CG  . ARG B 1 26 ? -4.341  -2.608 -10.845 1.00 67.09  119 A 1 \nATOM 201 C CD  . ARG B 1 26 ? -4.671  -3.974 -10.307 1.00 78.77  119 A 1 \nATOM 202 N NE  . ARG B 1 26 ? -4.743  -4.923 -11.390 1.00 95.96  119 A 1 \nATOM 203 C CZ  . ARG B 1 26 ? -3.703  -5.558 -11.900 1.00 111.57 119 A 1 \nATOM 204 N NH1 . ARG B 1 26 ? -3.881  -6.412 -12.892 1.00 120.54 119 A 1 \nATOM 205 N NH2 . ARG B 1 26 ? -2.494  -5.350 -11.417 1.00 114.95 119 A 1 \nATOM 206 N N   . GLY B 1 27 ? -5.312  0.940  -8.241  1.00 57.29  120 A 1 \nATOM 207 C CA  . GLY B 1 27 ? -5.176  2.005  -7.265  1.00 55.03  120 A 1 \nATOM 208 C C   . GLY B 1 27 ? -6.391  2.105  -6.381  1.00 51.16  120 A 1 \nATOM 209 O O   . GLY B 1 27 ? -6.273  2.252  -5.174  1.00 48.31  120 A 1 \nATOM 210 N N   . ILE B 1 28 ? -7.570  1.983  -6.973  1.00 48.29  121 A 1 \nATOM 211 C CA  . ILE B 1 28 ? -8.807  2.040  -6.198  1.00 51.59  121 A 1 \nATOM 212 C C   . ILE B 1 28 ? -8.893  0.889  -5.227  1.00 54.18  121 A 1 \nATOM 213 O O   . ILE B 1 28 ? -9.376  1.068  -4.118  1.00 53.53  121 A 1 \nATOM 214 C CB  . ILE B 1 28 ? -10.053 2.141  -7.095  1.00 55.27  121 A 1 \nATOM 215 C CG1 . ILE B 1 28 ? -10.187 3.601  -7.621  1.00 55.95  121 A 1 \nATOM 216 C CG2 . ILE B 1 28 ? -11.306 1.807  -6.320  1.00 61.76  121 A 1 \nATOM 217 C CD1 . ILE B 1 28 ? -11.126 3.822  -8.793  1.00 55.74  121 A 1 \nATOM 218 N N   . GLU B 1 29 ? -8.420  -0.273 -5.627  1.00 61.84  122 A 1 \nATOM 219 C CA  . GLU B 1 29 ? -8.319  -1.378 -4.700  1.00 67.68  122 A 1 \nATOM 220 C C   . GLU B 1 29 ? -7.415  -1.069 -3.537  1.00 65.03  122 A 1 \nATOM 221 O O   . GLU B 1 29 ? -7.791  -1.331 -2.393  1.00 64.70  122 A 1 \nATOM 222 C CB  . GLU B 1 29 ? -7.868  -2.634 -5.431  1.00 78.78  122 A 1 \nATOM 223 C CG  . GLU B 1 29 ? -9.069  -3.428 -5.962  1.00 86.76  122 A 1 \nATOM 224 C CD  . GLU B 1 29 ? -8.878  -4.019 -7.353  1.00 87.49  122 A 1 \nATOM 225 O OE1 . GLU B 1 29 ? 
-7.768  -4.558 -7.636  1.00 84.73  122 A 1 \nATOM 226 O OE2 . GLU B 1 29 ? -9.870  -3.959 -8.121  1.00 77.87  122 A 1 \nATOM 227 N N   . GLN B 1 30 ? -6.256  -0.484 -3.829  1.00 59.57  123 A 1 \nATOM 228 C CA  . GLN B 1 30 ? -5.315  -0.084 -2.773  1.00 55.23  123 A 1 \nATOM 229 C C   . GLN B 1 30 ? -5.910  0.955  -1.841  1.00 51.86  123 A 1 \nATOM 230 O O   . GLN B 1 30 ? -5.662  0.942  -0.653  1.00 44.12  123 A 1 \nATOM 231 C CB  . GLN B 1 30 ? -4.037  0.514  -3.362  1.00 55.92  123 A 1 \nATOM 232 C CG  . GLN B 1 30 ? -3.221  -0.371 -4.262  1.00 61.37  123 A 1 \nATOM 233 C CD  . GLN B 1 30 ? -2.863  -1.664 -3.614  1.00 62.35  123 A 1 \nATOM 234 O OE1 . GLN B 1 30 ? -2.326  -1.663 -2.512  1.00 63.09  123 A 1 \nATOM 235 N NE2 . GLN B 1 30 ? -3.188  -2.787 -4.276  1.00 70.63  123 A 1 \nATOM 236 N N   . VAL B 1 31 ? -6.703  1.858  -2.386  1.00 57.05  124 A 1 \nATOM 237 C CA  . VAL B 1 31 ? -7.323  2.883  -1.569  1.00 56.37  124 A 1 \nATOM 238 C C   . VAL B 1 31 ? -8.333  2.246  -0.629  1.00 61.68  124 A 1 \nATOM 239 O O   . VAL B 1 31 ? -8.461  2.699  0.470   1.00 58.51  124 A 1 \nATOM 240 C CB  . VAL B 1 31 ? -7.969  3.950  -2.456  1.00 57.06  124 A 1 \nATOM 241 C CG1 . VAL B 1 31 ? -9.007  4.756  -1.702  1.00 58.79  124 A 1 \nATOM 242 C CG2 . VAL B 1 31 ? -6.871  4.864  -2.974  1.00 58.78  124 A 1 \nATOM 243 N N   . GLU B 1 32 ? -9.044  1.205  -1.068  1.00 67.95  125 A 1 \nATOM 244 C CA  . GLU B 1 32 ? -9.940  0.481  -0.175  1.00 64.07  125 A 1 \nATOM 245 C C   . GLU B 1 32 ? -9.140  -0.246 0.887   1.00 61.43  125 A 1 \nATOM 246 O O   . GLU B 1 32 ? -9.521  -0.248 2.049   1.00 58.85  125 A 1 \nATOM 247 C CB  . GLU B 1 32 ? -10.821 -0.511 -0.911  1.00 70.57  125 A 1 \nATOM 248 C CG  . GLU B 1 32 ? -11.844 0.047  -1.875  1.00 81.60  125 A 1 \nATOM 249 C CD  . GLU B 1 32 ? -12.772 1.105  -1.306  1.00 92.01  125 A 1 \nATOM 250 O OE1 . GLU B 1 32 ? -13.833 0.773  -0.713  1.00 101.96 125 A 1 \nATOM 251 O OE2 . GLU B 1 32 ? 
-12.392 2.286  -1.482  1.00 95.64  125 A 1 \nATOM 252 N N   . LEU B 1 33 ? -8.042  -0.849 0.489   1.00 55.72  126 A 1 \nATOM 253 C CA  . LEU B 1 33 ? -7.201  -1.483 1.447   1.00 58.91  126 A 1 \nATOM 254 C C   . LEU B 1 33 ? -6.628  -0.487 2.476   1.00 56.58  126 A 1 \nATOM 255 O O   . LEU B 1 33 ? -6.271  -0.829 3.592   1.00 59.20  126 A 1 \nATOM 256 C CB  . LEU B 1 33 ? -6.089  -2.149 0.676   1.00 63.68  126 A 1 \nATOM 257 C CG  . LEU B 1 33 ? -5.181  -3.155 1.283   1.00 71.88  126 A 1 \nATOM 258 C CD1 . LEU B 1 33 ? -4.453  -3.972 0.195   1.00 73.91  126 A 1 \nATOM 259 C CD2 . LEU B 1 33 ? -4.179  -2.480 2.169   1.00 75.78  126 A 1 \nATOM 260 N N   . LEU B 1 34 ? -6.482  0.743  2.064   1.00 51.59  127 A 1 \nATOM 261 C CA  . LEU B 1 34 ? -6.054  1.821  2.952   1.00 47.43  127 A 1 \nATOM 262 C C   . LEU B 1 34 ? -7.162  2.293  3.867   1.00 49.18  127 A 1 \nATOM 263 O O   . LEU B 1 34 ? -6.917  2.748  4.956   1.00 48.29  127 A 1 \nATOM 264 C CB  . LEU B 1 34 ? -5.537  2.996  2.165   1.00 43.17  127 A 1 \nATOM 265 C CG  . LEU B 1 34 ? -4.031  2.968  1.890   1.00 42.73  127 A 1 \nATOM 266 C CD1 . LEU B 1 34 ? -3.630  4.313  1.305   1.00 42.46  127 A 1 \nATOM 267 C CD2 . LEU B 1 34 ? -3.088  2.610  3.005   1.00 43.31  127 A 1 \nATOM 268 N N   . LYS B 1 35 ? -8.399  2.214  3.408   1.00 52.51  128 A 1 \nATOM 269 C CA  . LYS B 1 35 ? -9.553  2.535  4.233   1.00 52.46  128 A 1 \nATOM 270 C C   . LYS B 1 35 ? -9.710  1.492  5.330   1.00 53.78  128 A 1 \nATOM 271 O O   . LYS B 1 35 ? -10.040 1.823  6.442   1.00 47.30  128 A 1 \nATOM 272 C CB  . LYS B 1 35 ? -10.830 2.641  3.381   1.00 54.62  128 A 1 \nATOM 273 C CG  . LYS B 1 35 ? -12.138 2.251  4.078   1.00 59.22  128 A 1 \nATOM 274 N N   . ARG B 1 36 ? -9.454  0.236  4.997   1.00 56.56  129 A 1 \nATOM 275 C CA  . ARG B 1 36 ? -9.471  -0.853 5.953   1.00 60.75  129 A 1 \nATOM 276 C C   . ARG B 1 36 ? -8.392  -0.650 7.014   1.00 59.48  129 A 1 \nATOM 277 O O   . ARG B 1 36 ? 
-8.620  -0.927 8.185   1.00 63.52  129 A 1 \nATOM 278 C CB  . ARG B 1 36 ? -9.292  -2.210 5.247   1.00 65.76  129 A 1 \nATOM 279 C CG  . ARG B 1 36 ? -10.535 -2.769 4.547   1.00 68.71  129 A 1 \nATOM 280 C CD  . ARG B 1 36 ? -10.167 -3.835 3.488   1.00 67.67  129 A 1 \nATOM 281 N N   . ILE B 1 37 ? -7.221  -0.161 6.611   1.00 54.56  130 A 1 \nATOM 282 C CA  . ILE B 1 37 ? -6.140  0.129  7.539   1.00 49.62  130 A 1 \nATOM 283 C C   . ILE B 1 37 ? -6.541  1.250  8.466   1.00 49.00  130 A 1 \nATOM 284 O O   . ILE B 1 37 ? -6.319  1.155  9.647   1.00 47.20  130 A 1 \nATOM 285 C CB  . ILE B 1 37 ? -4.839  0.472  6.806   1.00 51.01  130 A 1 \nATOM 286 C CG1 . ILE B 1 37 ? -4.243  -0.830 6.231   1.00 57.41  130 A 1 \nATOM 287 C CG2 . ILE B 1 37 ? -3.851  1.181  7.755   1.00 49.06  130 A 1 \nATOM 288 C CD1 . ILE B 1 37 ? -2.922  -0.695 5.533   1.00 59.59  130 A 1 \nATOM 289 N N   . HIS B 1 38 ? -7.179  2.276  7.957   1.00 50.21  131 A 1 \nATOM 290 C CA  . HIS B 1 38 ? -7.618  3.356  8.797   1.00 53.53  131 A 1 \nATOM 291 C C   . HIS B 1 38 ? -8.670  2.891  9.780   1.00 62.35  131 A 1 \nATOM 292 O O   . HIS B 1 38 ? -8.744  3.378  10.880  1.00 61.76  131 A 1 \nATOM 293 C CB  . HIS B 1 38 ? -8.175  4.452  7.947   1.00 51.42  131 A 1 \nATOM 294 C CG  . HIS B 1 38 ? -9.034  5.412  8.688   1.00 54.14  131 A 1 \nATOM 295 N ND1 . HIS B 1 38 ? -10.380 5.221  8.850   1.00 59.92  131 A 1 \nATOM 296 C CD2 . HIS B 1 38 ? -8.749  6.586  9.283   1.00 55.36  131 A 1 \nATOM 297 C CE1 . HIS B 1 38 ? -10.887 6.229  9.522   1.00 62.46  131 A 1 \nATOM 298 N NE2 . HIS B 1 38 ? -9.918  7.073  9.795   1.00 61.48  131 A 1 \nATOM 299 N N   . ASP B 1 39 ? -9.476  1.928  9.394   1.00 63.84  132 A 1 \nATOM 300 C CA  . ASP B 1 39 ? -10.480 1.421  10.286  1.00 65.95  132 A 1 \nATOM 301 C C   . ASP B 1 39 ? -9.837  0.648  11.420  1.00 61.61  132 A 1 \nATOM 302 O O   . ASP B 1 39 ? -10.164 0.840  12.551  1.00 56.16  132 A 1 \nATOM 303 C CB  . ASP B 1 39 ? 
-11.456 0.577  9.509   1.00 73.60  132 A 1 \nATOM 304 C CG  . ASP B 1 39 ? -12.373 1.404  8.658   1.00 76.60  132 A 1 \nATOM 305 O OD1 . ASP B 1 39 ? -12.277 2.631  8.703   1.00 70.60  132 A 1 \nATOM 306 O OD2 . ASP B 1 39 ? -13.195 0.833  7.937   1.00 81.44  132 A 1 \nATOM 307 N N   . LYS B 1 40 ? -8.926  -0.245 11.106  1.00 59.87  133 A 1 \nATOM 308 C CA  . LYS B 1 40 ? -8.191  -0.985 12.129  1.00 59.13  133 A 1 \nATOM 309 C C   . LYS B 1 40 ? -7.573  -0.021 13.157  1.00 58.88  133 A 1 \nATOM 310 O O   . LYS B 1 40 ? -7.579  -0.267 14.361  1.00 63.83  133 A 1 \nATOM 311 C CB  . LYS B 1 40 ? -7.093  -1.864 11.503  1.00 58.69  133 A 1 \nATOM 312 C CG  . LYS B 1 40 ? -7.577  -3.018 10.646  1.00 62.42  133 A 1 \nATOM 313 C CD  . LYS B 1 40 ? -6.463  -3.844 9.987   1.00 62.93  133 A 1 \nATOM 314 N N   . LEU B 1 41 ? -7.038  1.086  12.674  1.00 60.19  134 A 1 \nATOM 315 C CA  . LEU B 1 41 ? -6.454  2.092  13.561  1.00 62.93  134 A 1 \nATOM 316 C C   . LEU B 1 41 ? -7.487  2.707  14.452  1.00 63.64  134 A 1 \nATOM 317 O O   . LEU B 1 41 ? -7.205  2.982  15.605  1.00 73.06  134 A 1 \nATOM 318 C CB  . LEU B 1 41 ? -5.765  3.197  12.764  1.00 64.98  134 A 1 \nATOM 319 C CG  . LEU B 1 41 ? -4.531  2.611  12.036  1.00 68.88  134 A 1 \nATOM 320 C CD1 . LEU B 1 41 ? -4.332  3.201  10.638  1.00 78.49  134 A 1 \nATOM 321 C CD2 . LEU B 1 41 ? -3.301  2.685  12.900  1.00 67.40  134 A 1 \nATOM 322 N N   . MET B 1 42 ? -8.669  2.955  13.913  1.00 63.76  135 A 1 \nATOM 323 C CA  . MET B 1 42 ? -9.752  3.512  14.704  1.00 67.57  135 A 1 \nATOM 324 C C   . MET B 1 42 ? -10.186 2.561  15.817  1.00 72.44  135 A 1 \nATOM 325 O O   . MET B 1 42 ? -10.413 2.985  16.975  1.00 66.48  135 A 1 \nATOM 326 C CB  . MET B 1 42 ? -10.932 3.853  13.816  1.00 69.82  135 A 1 \nATOM 327 C CG  . MET B 1 42 ? -10.710 5.112  13.020  1.00 74.54  135 A 1 \nATOM 328 S SD  . MET B 1 42 ? -10.062 6.547  13.958  1.00 82.27  135 A 1 \nATOM 329 C CE  . MET B 1 42 ? 
-11.073 6.663  15.446  1.00 83.33  135 A 1 \nATOM 330 N N   . ILE B 1 43 ? -10.271 1.274  15.477  1.00 81.93  136 A 1 \nATOM 331 C CA  . ILE B 1 43 ? -10.594 0.243  16.446  1.00 79.15  136 A 1 \nATOM 332 C C   . ILE B 1 43 ? -9.526  0.183  17.546  1.00 79.65  136 A 1 \nATOM 333 O O   . ILE B 1 43 ? -9.854  0.128  18.719  1.00 82.01  136 A 1 \nATOM 334 C CB  . ILE B 1 43 ? -10.781 -1.129 15.738  1.00 80.39  136 A 1 \nATOM 335 C CG1 . ILE B 1 43 ? -12.176 -1.237 15.090  1.00 78.84  136 A 1 \nATOM 336 C CG2 . ILE B 1 43 ? -10.586 -2.294 16.708  1.00 84.53  136 A 1 \nATOM 337 C CD1 . ILE B 1 43 ? -12.480 -0.642 13.720  1.00 74.74  136 A 1 \nATOM 338 N N   . ARG B 1 44 ? -8.250  0.200  17.158  1.00 85.15  137 A 1 \nATOM 339 C CA  . ARG B 1 44 ? -7.131  0.216  18.111  1.00 90.78  137 A 1 \nATOM 340 C C   . ARG B 1 44 ? -7.103  1.498  18.957  1.00 91.00  137 A 1 \nATOM 341 O O   . ARG B 1 44 ? -6.632  1.453  20.068  1.00 96.79  137 A 1 \nATOM 342 C CB  . ARG B 1 44 ? -5.803  0.033  17.373  1.00 95.82  137 A 1 \nATOM 343 C CG  . ARG B 1 44 ? -4.883  -1.005 17.902  1.00 101.09 137 A 1 \nATOM 344 C CD  . ARG B 1 44 ? -3.772  -1.099 16.880  1.00 107.64 137 A 1 \nATOM 345 N NE  . ARG B 1 44 ? -2.978  -2.299 17.060  1.00 124.71 137 A 1 \nATOM 346 C CZ  . ARG B 1 44 ? -2.237  -2.882 16.112  1.00 137.30 137 A 1 \nATOM 347 N NH1 . ARG B 1 44 ? -2.186  -2.387 14.871  1.00 128.35 137 A 1 \nATOM 348 N NH2 . ARG B 1 44 ? -1.533  -3.990 16.400  1.00 147.87 137 A 1 \nATOM 349 N N   . ALA B 1 45 ? -7.688  2.601  18.506  1.00 92.41  138 A 1 \nATOM 350 C CA  . ALA B 1 45 ? -7.783  3.810  19.381  1.00 96.29  138 A 1 \nATOM 351 C C   . ALA B 1 45 ? -8.773  4.837  18.851  1.00 95.46  138 A 1 \nATOM 352 O O   . ALA B 1 45 ? -8.386  5.847  18.235  1.00 81.53  138 A 1 \nATOM 353 C CB  . ALA B 1 45 ? -6.408  4.475  19.603  1.00 97.91  138 A 1 \n#\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/pdb_mmcif/6s61.cif",
    "content": "data_6S61\n#\n_entry.id 6S61\n#\nloop_\n_chem_comp.formula\n_chem_comp.formula_weight\n_chem_comp.id\n_chem_comp.mon_nstd_flag\n_chem_comp.name\n_chem_comp.pdbx_synonyms\n_chem_comp.type\n\"C3 H7 N O2\"     89.093  ALA y ALANINE         ? \"L-peptide linking\" \n\"C6 H15 N4 O2 1\" 175.209 ARG y ARGININE        ? \"L-peptide linking\" \n\"C4 H8 N2 O3\"    132.118 ASN y ASPARAGINE      ? \"L-peptide linking\" \n\"C4 H7 N O4\"     133.103 ASP y \"ASPARTIC ACID\" ? \"L-peptide linking\" \n\"C3 H7 N O2 S\"   121.158 CYS y CYSTEINE        ? \"L-peptide linking\" \n\"Fe 3\"           55.845  FE  . \"FE (III) ION\"  ? non-polymer         \n\"C5 H10 N2 O3\"   146.144 GLN y GLUTAMINE       ? \"L-peptide linking\" \n\"C5 H9 N O4\"     147.129 GLU y \"GLUTAMIC ACID\" ? \"L-peptide linking\" \n\"C2 H5 N O2\"     75.067  GLY y GLYCINE         ? \"peptide linking\"   \n\"C6 H10 N3 O2 1\" 156.162 HIS y HISTIDINE       ? \"L-peptide linking\" \n\"H2 O\"           18.015  HOH . WATER           ? non-polymer         \n\"C6 H13 N O2\"    131.173 ILE y ISOLEUCINE      ? \"L-peptide linking\" \n\"C6 H13 N O2\"    131.173 LEU y LEUCINE         ? \"L-peptide linking\" \n\"C6 H15 N2 O2 1\" 147.195 LYS y LYSINE          ? \"L-peptide linking\" \n\"C5 H11 N O2 S\"  149.211 MET y METHIONINE      ? \"L-peptide linking\" \n\"C9 H11 N O2\"    165.189 PHE y PHENYLALANINE   ? \"L-peptide linking\" \n\"C5 H9 N O2\"     115.130 PRO y PROLINE         ? \"L-peptide linking\" \n\"C3 H7 N O3\"     105.093 SER y SERINE          ? \"L-peptide linking\" \n\"C4 H9 N O3\"     119.119 THR y THREONINE       ? \"L-peptide linking\" \n\"C11 H12 N2 O2\"  204.225 TRP y TRYPTOPHAN      ? \"L-peptide linking\" \n\"C9 H11 N O3\"    181.189 TYR y TYROSINE        ? \"L-peptide linking\" \n\"C5 H11 N O2\"    117.146 VAL y VALINE          ? \"L-peptide linking\" \n\"Zn 2\"           65.409  ZN  . \"ZINC ION\"      ? 
non-polymer         \n#\nloop_\n_entity.id\n_entity.pdbx_description\n_entity.type\n1 \"Ferritin heavy chain\" polymer     \n3 \"ZINC ION\"             non-polymer \n#\n_entity_poly.entity_id      1\n_entity_poly.pdbx_strand_id M\n_entity_poly.type           polypeptide(L)\n#\nloop_\n_entity_poly_seq.entity_id\n_entity_poly_seq.hetero\n_entity_poly_seq.mon_id\n_entity_poly_seq.num\n1 n MET 1   \n1 n THR 2   \n1 n THR 3   \n1 n ALA 4   \n1 n SER 5   \n1 n PRO 6   \n1 n SER 7   \n1 n GLN 8   \n1 n VAL 9   \n1 n ARG 10  \n1 n GLN 11  \n1 n ASN 12  \n1 n TYR 13  \n1 n HIS 14  \n1 n GLN 15  \n1 n ASP 16  \n1 n ALA 17  \n1 n GLU 18  \n1 n ALA 19  \n1 n ALA 20  \n1 n ILE 21  \n1 n ASN 22  \n1 n ARG 23  \n1 n GLN 24  \n1 n ILE 25  \n1 n ASN 26  \n1 n LEU 27  \n1 n GLU 28  \n1 n LEU 29  \n1 n TYR 30  \n1 n ALA 31  \n1 n SER 32  \n1 n TYR 33  \n1 n VAL 34  \n1 n TYR 35  \n1 n LEU 36  \n1 n SER 37  \n1 n MET 38  \n1 n SER 39  \n1 n CYS 40  \n1 n TYR 41  \n1 n PHE 42  \n1 n ASP 43  \n1 n ARG 44  \n1 n ASP 45  \n1 n ASP 46  \n1 n VAL 47  \n1 n ALA 48  \n1 n LEU 49  \n1 n LYS 50  \n1 n ASN 51  \n1 n PHE 52  \n1 n ALA 53  \n1 n LYS 54  \n1 n TYR 55  \n1 n PHE 56  \n1 n LEU 57  \n1 n HIS 58  \n1 n GLN 59  \n1 n SER 60  \n1 n HIS 61  \n1 n GLU 62  \n1 n GLU 63  \n1 n ARG 64  \n1 n GLU 65  \n1 n HIS 66  \n1 n ALA 67  \n1 n GLU 68  \n1 n LYS 69  \n1 n LEU 70  \n1 n MET 71  \n1 n LYS 72  \n1 n LEU 73  \n1 n GLN 74  \n1 n ASN 75  \n1 n GLN 76  \n1 n ARG 77  \n1 n GLY 78  \n1 n GLY 79  \n1 n ARG 80  \n1 n ILE 81  \n1 n PHE 82  \n1 n LEU 83  \n1 n GLN 84  \n1 n ASP 85  \n1 n ILE 86  \n1 n LYS 87  \n1 n LYS 88  \n1 n PRO 89  \n1 n ASP 90  \n1 n ARG 91  \n1 n ASP 92  \n1 n ASP 93  \n1 n TRP 94  \n1 n GLU 95  \n1 n SER 96  \n1 n GLY 97  \n1 n LEU 98  \n1 n ASN 99  \n1 n ALA 100 \n1 n MET 101 \n1 n GLU 102 \n1 n CYS 103 \n1 n ALA 104 \n1 n LEU 105 \n1 n HIS 106 \n1 n LEU 107 \n1 n GLU 108 \n1 n LYS 109 \n1 n SER 110 \n1 n VAL 111 \n1 n ASN 112 \n1 n GLN 113 \n1 n SER 114 \n1 n LEU 115 \n1 n 
LEU 116 \n1 n GLU 117 \n1 n LEU 118 \n1 n HIS 119 \n1 n LYS 120 \n1 n LEU 121 \n1 n ALA 122 \n1 n THR 123 \n1 n ASP 124 \n1 n LYS 125 \n1 n ASN 126 \n1 n ASP 127 \n1 n PRO 128 \n1 n HIS 129 \n1 n LEU 130 \n1 n CYS 131 \n1 n ASP 132 \n1 n PHE 133 \n1 n ILE 134 \n1 n GLU 135 \n1 n THR 136 \n1 n TYR 137 \n1 n TYR 138 \n1 n LEU 139 \n1 n SER 140 \n1 n GLU 141 \n1 n GLN 142 \n1 n VAL 143 \n1 n LYS 144 \n1 n SER 145 \n1 n ILE 146 \n1 n LYS 147 \n1 n GLU 148 \n1 n LEU 149 \n1 n GLY 150 \n1 n ASP 151 \n1 n HIS 152 \n1 n VAL 153 \n1 n THR 154 \n1 n ASN 155 \n1 n LEU 156 \n1 n ARG 157 \n1 n LYS 158 \n1 n MET 159 \n1 n GLY 160 \n1 n ALA 161 \n1 n PRO 162 \n1 n GLU 163 \n1 n ALA 164 \n1 n GLY 165 \n1 n MET 166 \n1 n ALA 167 \n1 n GLU 168 \n1 n TYR 169 \n1 n LEU 170 \n1 n PHE 171 \n1 n ASP 172 \n1 n LYS 173 \n1 n HIS 174 \n1 n THR 175 \n1 n LEU 176 \n1 n GLY 177 \n1 n HIS 178 \n1 n GLY 179 \n1 n ASP 180 \n1 n GLU 181 \n1 n SER 182 \n#\n_exptl.method \"ELECTRON MICROSCOPY\"\n#\n_pdbx_audit_revision_history.revision_date 2019-07-10\n#\n_pdbx_database_status.recvd_initial_deposition_date 2019-07-10\n#\n_pdbx_nonpoly_scheme.asym_id       PA\n_pdbx_nonpoly_scheme.auth_seq_num  201\n_pdbx_nonpoly_scheme.entity_id     3\n_pdbx_nonpoly_scheme.mon_id        ZN\n_pdbx_nonpoly_scheme.pdb_ins_code  .\n_pdbx_nonpoly_scheme.pdb_seq_num   201\n_pdbx_nonpoly_scheme.pdb_strand_id M\n#\nloop_\n_pdbx_poly_seq_scheme.asym_id\n_pdbx_poly_seq_scheme.auth_seq_num\n_pdbx_poly_seq_scheme.entity_id\n_pdbx_poly_seq_scheme.hetero\n_pdbx_poly_seq_scheme.mon_id\n_pdbx_poly_seq_scheme.pdb_ins_code\n_pdbx_poly_seq_scheme.pdb_seq_num\n_pdbx_poly_seq_scheme.pdb_strand_id\n_pdbx_poly_seq_scheme.seq_id\nM ?   1 n MET . 0   M 1   \nM ?   1 n THR . 1   M 2   \nM ?   1 n THR . 2   M 3   \nM ?   1 n ALA . 3   M 4   \nM ?   1 n SER . 4   M 5   \nM 5   1 n PRO . 5   M 6   \nM 6   1 n SER . 6   M 7   \nM 7   1 n GLN . 7   M 8   \nM 8   1 n VAL . 8   M 9   \nM 9   1 n ARG . 9   M 10  \nM 10  1 n GLN . 
10  M 11  \nM 11  1 n ASN . 11  M 12  \nM 12  1 n TYR . 12  M 13  \nM 13  1 n HIS . 13  M 14  \nM 14  1 n GLN . 14  M 15  \nM 15  1 n ASP . 15  M 16  \nM 16  1 n ALA . 16  M 17  \nM 17  1 n GLU . 17  M 18  \nM 18  1 n ALA . 18  M 19  \nM 19  1 n ALA . 19  M 20  \nM 20  1 n ILE . 20  M 21  \nM 21  1 n ASN . 21  M 22  \nM 22  1 n ARG . 22  M 23  \nM 23  1 n GLN . 23  M 24  \nM 24  1 n ILE . 24  M 25  \nM 25  1 n ASN . 25  M 26  \nM 26  1 n LEU . 26  M 27  \nM 27  1 n GLU . 27  M 28  \nM 28  1 n LEU . 28  M 29  \nM 29  1 n TYR . 29  M 30  \nM 30  1 n ALA . 30  M 31  \nM 31  1 n SER . 31  M 32  \nM 32  1 n TYR . 32  M 33  \nM 33  1 n VAL . 33  M 34  \nM 34  1 n TYR . 34  M 35  \nM 35  1 n LEU . 35  M 36  \nM 36  1 n SER . 36  M 37  \nM 37  1 n MET . 37  M 38  \nM 38  1 n SER . 38  M 39  \nM 39  1 n CYS . 39  M 40  \nM 40  1 n TYR . 40  M 41  \nM 41  1 n PHE . 41  M 42  \nM 42  1 n ASP . 42  M 43  \nM 43  1 n ARG . 43  M 44  \nM 44  1 n ASP . 44  M 45  \nM 45  1 n ASP . 45  M 46  \nM 46  1 n VAL . 46  M 47  \nM 47  1 n ALA . 47  M 48  \nM 48  1 n LEU . 48  M 49  \nM 49  1 n LYS . 49  M 50  \nM 50  1 n ASN . 50  M 51  \nM 51  1 n PHE . 51  M 52  \nM 52  1 n ALA . 52  M 53  \nM 53  1 n LYS . 53  M 54  \nM 54  1 n TYR . 54  M 55  \nM 55  1 n PHE . 55  M 56  \nM 56  1 n LEU . 56  M 57  \nM 57  1 n HIS . 57  M 58  \nM 58  1 n GLN . 58  M 59  \nM 59  1 n SER . 59  M 60  \nM 60  1 n HIS . 60  M 61  \nM 61  1 n GLU . 61  M 62  \nM 62  1 n GLU . 62  M 63  \nM 63  1 n ARG . 63  M 64  \nM 64  1 n GLU . 64  M 65  \nM 65  1 n HIS . 65  M 66  \nM 66  1 n ALA . 66  M 67  \nM 67  1 n GLU . 67  M 68  \nM 68  1 n LYS . 68  M 69  \nM 69  1 n LEU . 69  M 70  \nM 70  1 n MET . 70  M 71  \nM 71  1 n LYS . 71  M 72  \nM 72  1 n LEU . 72  M 73  \nM 73  1 n GLN . 73  M 74  \nM 74  1 n ASN . 74  M 75  \nM 75  1 n GLN . 75  M 76  \nM 76  1 n ARG . 76  M 77  \nM 77  1 n GLY . 77  M 78  \nM 78  1 n GLY . 78  M 79  \nM 79  1 n ARG . 79  M 80  \nM 80  1 n ILE . 80  M 81  \nM 81  1 n PHE . 
81  M 82  \nM 82  1 n LEU . 82  M 83  \nM 83  1 n GLN . 83  M 84  \nM 84  1 n ASP . 84  M 85  \nM 85  1 n ILE . 85  M 86  \nM 86  1 n LYS . 86  M 87  \nM 87  1 n LYS . 87  M 88  \nM 88  1 n PRO . 88  M 89  \nM 89  1 n ASP . 89  M 90  \nM 90  1 n ARG . 90  M 91  \nM 91  1 n ASP . 91  M 92  \nM 92  1 n ASP . 92  M 93  \nM 93  1 n TRP . 93  M 94  \nM 94  1 n GLU . 94  M 95  \nM 95  1 n SER . 95  M 96  \nM 96  1 n GLY . 96  M 97  \nM 97  1 n LEU . 97  M 98  \nM 98  1 n ASN . 98  M 99  \nM 99  1 n ALA . 99  M 100 \nM 100 1 n MET . 100 M 101 \nM 101 1 n GLU . 101 M 102 \nM 102 1 n CYS . 102 M 103 \nM 103 1 n ALA . 103 M 104 \nM 104 1 n LEU . 104 M 105 \nM 105 1 n HIS . 105 M 106 \nM 106 1 n LEU . 106 M 107 \nM 107 1 n GLU . 107 M 108 \nM 108 1 n LYS . 108 M 109 \nM 109 1 n SER . 109 M 110 \nM 110 1 n VAL . 110 M 111 \nM 111 1 n ASN . 111 M 112 \nM 112 1 n GLN . 112 M 113 \nM 113 1 n SER . 113 M 114 \nM 114 1 n LEU . 114 M 115 \nM 115 1 n LEU . 115 M 116 \nM 116 1 n GLU . 116 M 117 \nM 117 1 n LEU . 117 M 118 \nM 118 1 n HIS . 118 M 119 \nM 119 1 n LYS . 119 M 120 \nM 120 1 n LEU . 120 M 121 \nM 121 1 n ALA . 121 M 122 \nM 122 1 n THR . 122 M 123 \nM 123 1 n ASP . 123 M 124 \nM 124 1 n LYS . 124 M 125 \nM 125 1 n ASN . 125 M 126 \nM 126 1 n ASP . 126 M 127 \nM 127 1 n PRO . 127 M 128 \nM 128 1 n HIS . 128 M 129 \nM 129 1 n LEU . 129 M 130 \nM 130 1 n CYS . 130 M 131 \nM 131 1 n ASP . 131 M 132 \nM 132 1 n PHE . 132 M 133 \nM 133 1 n ILE . 133 M 134 \nM 134 1 n GLU . 134 M 135 \nM 135 1 n THR . 135 M 136 \nM 136 1 n TYR . 136 M 137 \nM 137 1 n TYR . 137 M 138 \nM 138 1 n LEU . 138 M 139 \nM 139 1 n SER . 139 M 140 \nM 140 1 n GLU . 140 M 141 \nM 141 1 n GLN . 141 M 142 \nM 142 1 n VAL . 142 M 143 \nM 143 1 n LYS . 143 M 144 \nM 144 1 n SER . 144 M 145 \nM 145 1 n ILE . 145 M 146 \nM 146 1 n LYS . 146 M 147 \nM 147 1 n GLU . 147 M 148 \nM 148 1 n LEU . 148 M 149 \nM 149 1 n GLY . 149 M 150 \nM 150 1 n ASP . 150 M 151 \nM 151 1 n HIS . 151 M 152 \nM 152 1 n VAL . 
152 M 153 \nM 153 1 n THR . 153 M 154 \nM 154 1 n ASN . 154 M 155 \nM 155 1 n LEU . 155 M 156 \nM 156 1 n ARG . 156 M 157 \nM 157 1 n LYS . 157 M 158 \nM 158 1 n MET . 158 M 159 \nM 159 1 n GLY . 159 M 160 \nM 160 1 n ALA . 160 M 161 \nM 161 1 n PRO . 161 M 162 \nM 162 1 n GLU . 162 M 163 \nM 163 1 n ALA . 163 M 164 \nM 164 1 n GLY . 164 M 165 \nM 165 1 n MET . 165 M 166 \nM 166 1 n ALA . 166 M 167 \nM 167 1 n GLU . 167 M 168 \nM 168 1 n TYR . 168 M 169 \nM 169 1 n LEU . 169 M 170 \nM 170 1 n PHE . 170 M 171 \nM 171 1 n ASP . 171 M 172 \nM 172 1 n LYS . 172 M 173 \nM 173 1 n HIS . 173 M 174 \nM 174 1 n THR . 174 M 175 \nM 175 1 n LEU . 175 M 176 \nM 176 1 n GLY . 176 M 177 \nM ?   1 n HIS . 177 M 178 \nM ?   1 n GLY . 178 M 179 \nM ?   1 n ASP . 179 M 180 \nM ?   1 n GLU . 180 M 181 \nM ?   1 n SER . 181 M 182 \n#\n_pdbx_struct_assembly.details            author_and_software_defined_assembly\n_pdbx_struct_assembly.id                 1\n_pdbx_struct_assembly.method_details     PISA\n_pdbx_struct_assembly.oligomeric_count   24\n_pdbx_struct_assembly.oligomeric_details 24-meric\n#\n_pdbx_struct_assembly_gen.assembly_id     1\n_pdbx_struct_assembly_gen.asym_id_list    A,B,C,D,E,F,G,H,I,J,K,L,M,N,O,P,Q,R,S,T,U,V,W,X,Y,Z,AA,BA,CA,DA,EA,FA,GA,HA,IA,JA,KA,LA,MA,NA,OA,PA,QA,RA,SA,TA,UA,VA,WA,XA,YA,ZA,AB,BB,CB,DB,EB,FB,GB,HB,IB,JB,KB,LB,MB,NB,OB,PB,QB,RB,SB,TB,UB,VB,WB,XB,YB,ZB\n_pdbx_struct_assembly_gen.oper_expression 1\n#\n_pdbx_struct_oper_list.id                 1\n_pdbx_struct_oper_list.matrix[1][1]       1.0000000000\n_pdbx_struct_oper_list.matrix[1][2]       0.0000000000\n_pdbx_struct_oper_list.matrix[1][3]       0.0000000000\n_pdbx_struct_oper_list.matrix[2][1]       0.0000000000\n_pdbx_struct_oper_list.matrix[2][2]       1.0000000000\n_pdbx_struct_oper_list.matrix[2][3]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][1]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][2]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][3]       
1.0000000000\n_pdbx_struct_oper_list.name               1_555\n_pdbx_struct_oper_list.symmetry_operation ?\n_pdbx_struct_oper_list.type               \"identity operation\"\n_pdbx_struct_oper_list.vector[1]          0.0000000000\n_pdbx_struct_oper_list.vector[2]          0.0000000000\n_pdbx_struct_oper_list.vector[3]          0.0000000000\n#\n_refine.ls_d_res_high 1.84\n#\n_software.classification other\n_software.name           \"DeepMind Structure Class\"\n_software.pdbx_ordinal   1\n_software.version        2.0.0\n#\nloop_\n_struct_asym.entity_id\n_struct_asym.id\n1 M  \n3 PA \n#\nloop_\n_struct_conn.conn_type_id\n_struct_conn.id\n_struct_conn.pdbx_ptnr1_PDB_ins_code\n_struct_conn.pdbx_ptnr1_label_alt_id\n_struct_conn.pdbx_ptnr2_PDB_ins_code\n_struct_conn.pdbx_ptnr2_label_alt_id\n_struct_conn.pdbx_role\n_struct_conn.pdbx_value_order\n_struct_conn.ptnr1_auth_asym_id\n_struct_conn.ptnr1_auth_seq_id\n_struct_conn.ptnr1_label_asym_id\n_struct_conn.ptnr1_label_atom_id\n_struct_conn.ptnr1_label_comp_id\n_struct_conn.ptnr1_label_seq_id\n_struct_conn.ptnr1_symmetry\n_struct_conn.ptnr2_auth_asym_id\n_struct_conn.ptnr2_auth_seq_id\n_struct_conn.ptnr2_label_asym_id\n_struct_conn.ptnr2_label_atom_id\n_struct_conn.ptnr2_label_comp_id\n_struct_conn.ptnr2_label_seq_id\n_struct_conn.ptnr2_symmetry\nmetalc metalc1 ? ? ? ? ? ? M 27 M OE2 GLU 28 1_555 M 201 PA ZN ZN . 1_555 \nmetalc metalc2 ? ? ? ? ? ? M 62 M OE1 GLU 63 1_555 M 201 PA ZN ZN . 1_555 \nmetalc metalc3 ? ? ? ? ? ? M 65 M ND1 HIS 66 1_555 M 201 PA ZN ZN . 
1_555 \n#\n_struct_conn_type.criteria  ?\n_struct_conn_type.id        metalc\n_struct_conn_type.reference ?\n#\nloop_\n_atom_site.group_PDB\n_atom_site.id\n_atom_site.type_symbol\n_atom_site.label_atom_id\n_atom_site.label_alt_id\n_atom_site.label_comp_id\n_atom_site.label_asym_id\n_atom_site.label_entity_id\n_atom_site.label_seq_id\n_atom_site.pdbx_PDB_ins_code\n_atom_site.Cartn_x\n_atom_site.Cartn_y\n_atom_site.Cartn_z\n_atom_site.occupancy\n_atom_site.B_iso_or_equiv\n_atom_site.auth_seq_id\n_atom_site.auth_asym_id\n_atom_site.pdbx_PDB_model_num\nATOM   1    N  N    . PRO M  1 6   ? 122.212 117.597 42.494 1.00 9.28  5   M 1 \nATOM   2    C  CA   . PRO M  1 6   ? 122.084 118.174 43.835 1.00 9.28  5   M 1 \nATOM   3    C  C    . PRO M  1 6   ? 120.908 117.581 44.601 1.00 9.28  5   M 1 \nATOM   4    O  O    . PRO M  1 6   ? 119.808 117.491 44.064 1.00 9.28  5   M 1 \nATOM   5    C  CB   . PRO M  1 6   ? 121.864 119.662 43.555 1.00 9.28  5   M 1 \nATOM   6    C  CG   . PRO M  1 6   ? 121.230 119.694 42.219 1.00 9.28  5   M 1 \nATOM   7    C  CD   . PRO M  1 6   ? 121.846 118.564 41.447 1.00 9.28  5   M 1 \nATOM   8    H  HA   . PRO M  1 6   ? 122.903 118.063 44.342 1.00 9.28  5   M 1 \nATOM   9    H  HB2  . PRO M  1 6   ? 121.285 120.040 44.235 1.00 9.28  5   M 1 \nATOM   10   H  HB3  . PRO M  1 6   ? 122.714 120.128 43.534 1.00 9.28  5   M 1 \nATOM   11   H  HG2  . PRO M  1 6   ? 120.274 119.558 42.308 1.00 9.28  5   M 1 \nATOM   12   H  HG3  . PRO M  1 6   ? 121.419 120.545 41.793 1.00 9.28  5   M 1 \nATOM   13   H  HD2  . PRO M  1 6   ? 121.199 118.179 40.836 1.00 9.28  5   M 1 \nATOM   14   H  HD3  . PRO M  1 6   ? 122.642 118.866 40.982 1.00 9.28  5   M 1 \nATOM   15   N  N    . SER M  1 7   ? 121.145 117.181 45.845 1.00 7.08  6   M 1 \nATOM   16   C  CA   . SER M  1 7   ? 120.080 116.612 46.653 1.00 7.08  6   M 1 \nATOM   17   C  C    . SER M  1 7   ? 119.029 117.671 46.964 1.00 7.08  6   M 1 \nATOM   18   O  O    . SER M  1 7   ? 
119.342 118.844 47.176 1.00 7.08  6   M 1 \nATOM   19   C  CB   . SER M  1 7   ? 120.641 116.033 47.949 1.00 7.08  6   M 1 \nATOM   20   O  OG   . SER M  1 7   ? 119.605 115.511 48.745 1.00 7.08  6   M 1 \nATOM   21   H  H    . SER M  1 7   ? 121.906 117.238 46.241 1.00 7.08  6   M 1 \nATOM   22   H  HA   . SER M  1 7   ? 119.655 115.894 46.159 1.00 7.08  6   M 1 \nATOM   23   H  HB2  . SER M  1 7   ? 121.264 115.319 47.741 1.00 7.08  6   M 1 \nATOM   24   H  HB3  . SER M  1 7   ? 121.098 116.727 48.450 1.00 7.08  6   M 1 \nATOM   25   H  HG   . SER M  1 7   ? 119.939 115.148 49.425 1.00 7.08  6   M 1 \nATOM   26   N  N    . GLN M  1 8   ? 117.777 117.226 47.005 1.00 6.97  7   M 1 \nATOM   27   C  CA   . GLN M  1 8   ? 116.610 118.112 47.218 1.00 6.97  7   M 1 \nATOM   28   C  C    . GLN M  1 8   ? 116.732 118.800 48.583 1.00 6.97  7   M 1 \nATOM   29   O  O    . GLN M  1 8   ? 116.136 119.848 48.758 1.00 6.97  7   M 1 \nATOM   30   C  CB   . GLN M  1 8   ? 115.306 117.326 47.078 1.00 6.97  7   M 1 \nATOM   31   C  CG   . GLN M  1 8   ? 115.074 116.345 48.214 1.00 6.97  7   M 1 \nATOM   32   C  CD   . GLN M  1 8   ? 113.835 115.494 48.045 1.00 6.97  7   M 1 \nATOM   33   O  OE1  . GLN M  1 8   ? 112.862 115.903 47.422 1.00 6.97  7   M 1 \nATOM   34   N  NE2  . GLN M  1 8   ? 113.875 114.298 48.614 1.00 6.97  7   M 1 \nATOM   35   H  H    . GLN M  1 8   ? 117.574 116.339 47.027 1.00 6.97  7   M 1 \nATOM   36   H  HA   . GLN M  1 8   ? 116.628 118.808 46.520 1.00 6.97  7   M 1 \nATOM   37   H  HB2  . GLN M  1 8   ? 114.560 117.960 47.043 1.00 6.97  7   M 1 \nATOM   38   H  HB3  . GLN M  1 8   ? 115.326 116.836 46.229 1.00 6.97  7   M 1 \nATOM   39   H  HG2  . GLN M  1 8   ? 115.854 115.755 48.288 1.00 6.97  7   M 1 \nATOM   40   H  HG3  . GLN M  1 8   ? 115.001 116.846 49.054 1.00 6.97  7   M 1 \nATOM   41   H  HE21 . GLN M  1 8   ? 114.576 114.063 49.098 1.00 6.97  7   M 1 \nATOM   42   H  HE22 . GLN M  1 8   ? 
113.201 113.736 48.510 1.00 6.97  7   M 1 \nATOM   43   N  N    . VAL M  1 9   ? 117.388 118.172 49.551 1.00 6.25  8   M 1 \nATOM   44   C  CA   . VAL M  1 9   ? 117.529 118.728 50.894 1.00 6.25  8   M 1 \nATOM   45   C  C    . VAL M  1 9   ? 118.772 119.591 51.047 1.00 6.25  8   M 1 \nATOM   46   O  O    . VAL M  1 9   ? 118.891 120.310 52.048 1.00 6.25  8   M 1 \nATOM   47   C  CB   . VAL M  1 9   ? 117.547 117.608 51.957 1.00 6.25  8   M 1 \nATOM   48   C  CG1  . VAL M  1 9   ? 116.257 116.809 51.898 1.00 6.25  8   M 1 \nATOM   49   C  CG2  . VAL M  1 9   ? 118.761 116.689 51.824 1.00 6.25  8   M 1 \nATOM   50   H  H    . VAL M  1 9   ? 117.757 117.402 49.445 1.00 6.25  8   M 1 \nATOM   51   H  HA   . VAL M  1 9   ? 116.763 119.289 51.092 1.00 6.25  8   M 1 \nATOM   52   H  HB   . VAL M  1 9   ? 117.602 118.020 52.833 1.00 6.25  8   M 1 \nATOM   53   H  HG11 . VAL M  1 9   ? 116.190 116.261 52.696 1.00 6.25  8   M 1 \nATOM   54   H  HG12 . VAL M  1 9   ? 115.507 117.422 51.853 1.00 6.25  8   M 1 \nATOM   55   H  HG13 . VAL M  1 9   ? 116.261 116.241 51.112 1.00 6.25  8   M 1 \nATOM   56   H  HG21 . VAL M  1 9   ? 118.720 116.025 52.530 1.00 6.25  8   M 1 \nATOM   57   H  HG22 . VAL M  1 9   ? 118.732 116.240 50.965 1.00 6.25  8   M 1 \nATOM   58   H  HG23 . VAL M  1 9   ? 119.588 117.186 51.922 1.00 6.25  8   M 1 \nATOM   59   N  N    . ARG M  1 10  ? 119.714 119.469 50.120 1.00 6.80  9   M 1 \nATOM   60   C  CA   . ARG M  1 10  ? 121.028 120.137 50.287 1.00 6.80  9   M 1 \nATOM   61   C  C    . ARG M  1 10  ? 120.873 121.657 50.283 1.00 6.80  9   M 1 \nATOM   62   O  O    . ARG M  1 10  ? 120.265 122.177 49.352 1.00 6.80  9   M 1 \nATOM   63   C  CB   . ARG M  1 10  ? 122.014 119.698 49.205 1.00 6.80  9   M 1 \nATOM   64   C  CG   . ARG M  1 10  ? 123.450 120.070 49.528 1.00 6.80  9   M 1 \nATOM   65   C  CD   . ARG M  1 10  ? 124.419 119.495 48.512 1.00 6.80  9   M 1 \nATOM   66   N  NE   . ARG M  1 10  ? 
125.813 119.611 48.924 1.00 6.80  9   M 1 \nATOM   67   C  CZ   . ARG M  1 10  ? 126.705 118.641 48.816 1.00 6.80  9   M 1 \nATOM   68   N  NH1  . ARG M  1 10  ? 126.346 117.466 48.336 1.00 6.80  9   M 1 \nATOM   69   N  NH2  . ARG M  1 10  ? 127.944 118.830 49.223 1.00 6.80  9   M 1 \nATOM   70   H  H    . ARG M  1 10  ? 119.572 119.093 49.304 1.00 6.80  9   M 1 \nATOM   71   H  HA   . ARG M  1 10  ? 121.392 119.870 51.162 1.00 6.80  9   M 1 \nATOM   72   H  HB2  . ARG M  1 10  ? 121.952 118.726 49.097 1.00 6.80  9   M 1 \nATOM   73   H  HB3  . ARG M  1 10  ? 121.758 120.115 48.356 1.00 6.80  9   M 1 \nATOM   74   H  HG2  . ARG M  1 10  ? 123.539 121.047 49.539 1.00 6.80  9   M 1 \nATOM   75   H  HG3  . ARG M  1 10  ? 123.681 119.732 50.419 1.00 6.80  9   M 1 \nATOM   76   H  HD2  . ARG M  1 10  ? 124.207 118.548 48.368 1.00 6.80  9   M 1 \nATOM   77   H  HD3  . ARG M  1 10  ? 124.299 119.960 47.657 1.00 6.80  9   M 1 \nATOM   78   H  HE   . ARG M  1 10  ? 126.081 120.373 49.252 1.00 6.80  9   M 1 \nATOM   79   H  HH11 . ARG M  1 10  ? 125.518 117.337 48.069 1.00 6.80  9   M 1 \nATOM   80   H  HH12 . ARG M  1 10  ? 126.939 116.820 48.270 1.00 6.80  9   M 1 \nATOM   81   H  HH21 . ARG M  1 10  ? 128.184 119.612 49.550 1.00 6.80  9   M 1 \nATOM   82   H  HH22 . ARG M  1 10  ? 128.532 118.178 49.155 1.00 6.80  9   M 1 \nATOM   83   N  N    . GLN M  1 11  ? 121.516 122.324 51.239 1.00 6.12  10  M 1 \nATOM   84   C  CA   . GLN M  1 11  ? 121.478 123.774 51.352 1.00 6.12  10  M 1 \nATOM   85   C  C    . GLN M  1 11  ? 122.621 124.235 52.245 1.00 6.12  10  M 1 \nATOM   86   O  O    . GLN M  1 11  ? 122.708 123.833 53.406 1.00 6.12  10  M 1 \nATOM   87   C  CB   . GLN M  1 11  ? 120.137 124.237 51.920 1.00 6.12  10  M 1 \nATOM   88   C  CG   . GLN M  1 11  ? 119.911 125.721 51.902 1.00 6.12  10  M 1 \nATOM   89   C  CD   . GLN M  1 11  ? 118.537 126.076 52.435 1.00 6.12  10  M 1 \nATOM   90   O  OE1  . GLN M  1 11  ? 
117.830 125.223 52.962 1.00 6.12  10  M 1 \nATOM   91   N  NE2  . GLN M  1 11  ? 118.126 127.312 52.236 1.00 6.12  10  M 1 \nATOM   92   H  H    . GLN M  1 11  ? 121.988 121.938 51.846 1.00 6.12  10  M 1 \nATOM   93   H  HA   . GLN M  1 11  ? 121.591 124.163 50.470 1.00 6.12  10  M 1 \nATOM   94   H  HB2  . GLN M  1 11  ? 119.423 123.835 51.401 1.00 6.12  10  M 1 \nATOM   95   H  HB3  . GLN M  1 11  ? 120.071 123.946 52.843 1.00 6.12  10  M 1 \nATOM   96   H  HG2  . GLN M  1 11  ? 120.572 126.146 52.470 1.00 6.12  10  M 1 \nATOM   97   H  HG3  . GLN M  1 11  ? 119.997 126.048 50.993 1.00 6.12  10  M 1 \nATOM   98   H  HE21 . GLN M  1 11  ? 118.637 127.884 51.847 1.00 6.12  10  M 1 \nATOM   99   H  HE22 . GLN M  1 11  ? 117.347 127.547 52.514 1.00 6.12  10  M 1 \nATOM   100  N  N    . ASN M  1 12  ? 123.445 125.121 51.688 1.00 6.65  11  M 1 \nATOM   101  C  CA   . ASN M  1 12  ? 124.619 125.702 52.391 1.00 6.65  11  M 1 \nATOM   102  C  C    . ASN M  1 12  ? 125.569 124.588 52.872 1.00 6.65  11  M 1 \nATOM   103  O  O    . ASN M  1 12  ? 126.059 124.697 53.982 1.00 6.65  11  M 1 \nATOM   104  C  CB   . ASN M  1 12  ? 124.137 126.571 53.556 1.00 6.65  11  M 1 \nATOM   105  C  CG   . ASN M  1 12  ? 125.258 127.385 54.163 1.00 6.65  11  M 1 \nATOM   106  O  OD1  . ASN M  1 12  ? 126.071 127.935 53.440 1.00 6.65  11  M 1 \nATOM   107  N  ND2  . ASN M  1 12  ? 125.302 127.463 55.473 1.00 6.65  11  M 1 \nATOM   108  H  H    . ASN M  1 12  ? 123.269 125.513 50.886 1.00 6.65  11  M 1 \nATOM   109  H  HA   . ASN M  1 12  ? 125.105 126.283 51.760 1.00 6.65  11  M 1 \nATOM   110  H  HB2  . ASN M  1 12  ? 123.438 127.176 53.235 1.00 6.65  11  M 1 \nATOM   111  H  HB3  . ASN M  1 12  ? 123.749 125.994 54.246 1.00 6.65  11  M 1 \nATOM   112  H  HD21 . ASN M  1 12  ? 124.657 127.104 55.959 1.00 6.65  11  M 1 \nATOM   113  H  HD22 . ASN M  1 12  ? 125.976 127.875 55.869 1.00 6.65  11  M 1 \nATOM   114  N  N    . TYR M  1 13  ? 
125.844 123.567 52.055 1.00 5.90  12  M 1 \nATOM   115  C  CA   . TYR M  1 13  ? 126.657 122.414 52.440 1.00 5.90  12  M 1 \nATOM   116  C  C    . TYR M  1 13  ? 127.687 122.174 51.341 1.00 5.90  12  M 1 \nATOM   117  O  O    . TYR M  1 13  ? 127.385 121.578 50.305 1.00 5.90  12  M 1 \nATOM   118  C  CB   . TYR M  1 13  ? 125.780 121.196 52.694 1.00 5.90  12  M 1 \nATOM   119  C  CG   . TYR M  1 13  ? 126.505 120.044 53.350 1.00 5.90  12  M 1 \nATOM   120  C  CD1  . TYR M  1 13  ? 126.937 120.148 54.661 1.00 5.90  12  M 1 \nATOM   121  C  CD2  . TYR M  1 13  ? 126.681 118.836 52.705 1.00 5.90  12  M 1 \nATOM   122  C  CE1  . TYR M  1 13  ? 127.578 119.120 55.287 1.00 5.90  12  M 1 \nATOM   123  C  CE2  . TYR M  1 13  ? 127.319 117.786 53.335 1.00 5.90  12  M 1 \nATOM   124  C  CZ   . TYR M  1 13  ? 127.766 117.935 54.631 1.00 5.90  12  M 1 \nATOM   125  O  OH   . TYR M  1 13  ? 128.404 116.916 55.298 1.00 5.90  12  M 1 \nATOM   126  H  H    . TYR M  1 13  ? 125.574 123.542 51.239 1.00 5.90  12  M 1 \nATOM   127  H  HA   . TYR M  1 13  ? 127.152 122.600 53.253 1.00 5.90  12  M 1 \nATOM   128  H  HB2  . TYR M  1 13  ? 125.041 121.450 53.268 1.00 5.90  12  M 1 \nATOM   129  H  HB3  . TYR M  1 13  ? 125.430 120.884 51.845 1.00 5.90  12  M 1 \nATOM   130  H  HD1  . TYR M  1 13  ? 126.822 120.949 55.119 1.00 5.90  12  M 1 \nATOM   131  H  HD2  . TYR M  1 13  ? 126.385 118.735 51.829 1.00 5.90  12  M 1 \nATOM   132  H  HE1  . TYR M  1 13  ? 127.875 119.221 56.163 1.00 5.90  12  M 1 \nATOM   133  H  HE2  . TYR M  1 13  ? 127.445 116.981 52.887 1.00 5.90  12  M 1 \nATOM   134  H  HH   . TYR M  1 13  ? 128.383 116.208 54.846 1.00 5.90  12  M 1 \nATOM   135  N  N    . HIS M  1 14  ? 128.905 122.635 51.599 1.00 7.28  13  M 1 \nATOM   136  C  CA   . HIS M  1 14  ? 129.958 122.673 50.597 1.00 7.28  13  M 1 \nATOM   137  C  C    . HIS M  1 14  ? 130.572 121.284 50.442 1.00 7.28  13  M 1 \nATOM   138  O  O    . HIS M  1 14  ? 
130.617 120.503 51.393 1.00 7.28  13  M 1 \nATOM   139  C  CB   . HIS M  1 14  ? 131.006 123.701 51.029 1.00 7.28  13  M 1 \nATOM   140  C  CG   . HIS M  1 14  ? 131.952 124.116 49.949 1.00 7.28  13  M 1 \nATOM   141  N  ND1  . HIS M  1 14  ? 133.111 123.432 49.663 1.00 7.28  13  M 1 \nATOM   142  C  CD2  . HIS M  1 14  ? 131.927 125.178 49.112 1.00 7.28  13  M 1 \nATOM   143  C  CE1  . HIS M  1 14  ? 133.748 124.039 48.678 1.00 7.28  13  M 1 \nATOM   144  N  NE2  . HIS M  1 14  ? 133.051 125.103 48.327 1.00 7.28  13  M 1 \nATOM   145  H  H    . HIS M  1 14  ? 129.149 122.936 52.367 1.00 7.28  13  M 1 \nATOM   146  H  HA   . HIS M  1 14  ? 129.593 122.954 49.743 1.00 7.28  13  M 1 \nATOM   147  H  HB2  . HIS M  1 14  ? 130.552 124.500 51.338 1.00 7.28  13  M 1 \nATOM   148  H  HB3  . HIS M  1 14  ? 131.532 123.326 51.753 1.00 7.28  13  M 1 \nATOM   149  H  HD2  . HIS M  1 14  ? 131.267 125.832 49.071 1.00 7.28  13  M 1 \nATOM   150  H  HE1  . HIS M  1 14  ? 134.552 123.767 48.298 1.00 7.28  13  M 1 \nATOM   151  H  HE2  . HIS M  1 14  ? 133.267 125.657 47.706 1.00 7.28  13  M 1 \nATOM   152  N  N    . GLN M  1 15  ? 131.037 120.970 49.229 1.00 7.51  14  M 1 \nATOM   153  C  CA   . GLN M  1 15  ? 131.561 119.634 48.946 1.00 7.51  14  M 1 \nATOM   154  C  C    . GLN M  1 15  ? 132.800 119.311 49.780 1.00 7.51  14  M 1 \nATOM   155  O  O    . GLN M  1 15  ? 133.039 118.148 50.120 1.00 7.51  14  M 1 \nATOM   156  C  CB   . GLN M  1 15  ? 131.867 119.500 47.450 1.00 7.51  14  M 1 \nATOM   157  C  CG   . GLN M  1 15  ? 132.933 120.431 46.917 1.00 7.51  14  M 1 \nATOM   158  C  CD   . GLN M  1 15  ? 133.162 120.248 45.425 1.00 7.51  14  M 1 \nATOM   159  O  OE1  . GLN M  1 15  ? 132.551 119.386 44.791 1.00 7.51  14  M 1 \nATOM   160  N  NE2  . GLN M  1 15  ? 134.052 121.052 44.861 1.00 7.51  14  M 1 \nATOM   161  H  H    . GLN M  1 15  ? 131.058 121.511 48.561 1.00 7.51  14  M 1 \nATOM   162  H  HA   . GLN M  1 15  ? 
130.879 118.977 49.157 1.00 7.51  14  M 1 \nATOM   163  H  HB2  . GLN M  1 15  ? 132.164 118.595 47.269 1.00 7.51  14  M 1 \nATOM   164  H  HB3  . GLN M  1 15  ? 131.057 119.680 46.948 1.00 7.51  14  M 1 \nATOM   165  H  HG2  . GLN M  1 15  ? 132.652 121.347 47.070 1.00 7.51  14  M 1 \nATOM   166  H  HG3  . GLN M  1 15  ? 133.774 120.264 47.370 1.00 7.51  14  M 1 \nATOM   167  H  HE21 . GLN M  1 15  ? 134.462 121.642 45.333 1.00 7.51  14  M 1 \nATOM   168  H  HE22 . GLN M  1 15  ? 134.218 120.981 44.020 1.00 7.51  14  M 1 \nATOM   169  N  N    . ASP M  1 16  ? 133.599 120.324 50.111 1.00 7.21  15  M 1 \nATOM   170  C  CA   . ASP M  1 16  ? 134.771 120.116 50.956 1.00 7.21  15  M 1 \nATOM   171  C  C    . ASP M  1 16  ? 134.371 119.680 52.361 1.00 7.21  15  M 1 \nATOM   172  O  O    . ASP M  1 16  ? 135.026 118.818 52.953 1.00 7.21  15  M 1 \nATOM   173  C  CB   . ASP M  1 16  ? 135.610 121.393 51.009 1.00 7.21  15  M 1 \nATOM   174  C  CG   . ASP M  1 16  ? 136.321 121.680 49.696 1.00 7.21  15  M 1 \nATOM   175  O  OD1  . ASP M  1 16  ? 136.404 120.772 48.845 1.00 7.21  15  M 1 \nATOM   176  O  OD2  . ASP M  1 16  ? 136.805 122.815 49.519 1.00 7.21  15  M 1 \nATOM   177  H  H    . ASP M  1 16  ? 133.476 121.137 49.858 1.00 7.21  15  M 1 \nATOM   178  H  HA   . ASP M  1 16  ? 135.320 119.415 50.571 1.00 7.21  15  M 1 \nATOM   179  H  HB2  . ASP M  1 16  ? 135.034 122.148 51.207 1.00 7.21  15  M 1 \nATOM   180  H  HB3  . ASP M  1 16  ? 136.282 121.306 51.703 1.00 7.21  15  M 1 \nATOM   181  N  N    . ALA M  1 17  ? 133.297 120.259 52.899 1.00 6.09  16  M 1 \nATOM   182  C  CA   . ALA M  1 17  ? 132.760 119.819 54.182 1.00 6.09  16  M 1 \nATOM   183  C  C    . ALA M  1 17  ? 132.287 118.373 54.109 1.00 6.09  16  M 1 \nATOM   184  O  O    . ALA M  1 17  ? 132.504 117.591 55.040 1.00 6.09  16  M 1 \nATOM   185  C  CB   . ALA M  1 17  ? 131.615 120.738 54.603 1.00 6.09  16  M 1 \nATOM   186  H  H    . ALA M  1 17  ? 
132.865 120.907 52.533 1.00 6.09  16  M 1 \nATOM   187  H  HA   . ALA M  1 17  ? 133.452 119.884 54.859 1.00 6.09  16  M 1 \nATOM   188  H  HB1  . ALA M  1 17  ? 131.308 120.487 55.488 1.00 6.09  16  M 1 \nATOM   189  H  HB2  . ALA M  1 17  ? 131.935 121.654 54.614 1.00 6.09  16  M 1 \nATOM   190  H  HB3  . ALA M  1 17  ? 130.887 120.656 53.967 1.00 6.09  16  M 1 \nATOM   191  N  N    . GLU M  1 18  ? 131.621 118.014 53.012 1.00 5.83  17  M 1 \nATOM   192  C  CA   . GLU M  1 18  ? 131.183 116.639 52.793 1.00 5.83  17  M 1 \nATOM   193  C  C    . GLU M  1 18  ? 132.369 115.677 52.836 1.00 5.83  17  M 1 \nATOM   194  O  O    . GLU M  1 18  ? 132.351 114.658 53.547 1.00 5.83  17  M 1 \nATOM   195  C  CB   . GLU M  1 18  ? 130.451 116.566 51.447 1.00 5.83  17  M 1 \nATOM   196  C  CG   . GLU M  1 18  ? 129.838 115.239 51.109 1.00 5.83  17  M 1 \nATOM   197  C  CD   . GLU M  1 18  ? 129.069 115.276 49.797 1.00 5.83  17  M 1 \nATOM   198  O  OE1  . GLU M  1 18  ? 129.047 116.341 49.148 1.00 5.83  17  M 1 \nATOM   199  O  OE2  . GLU M  1 18  ? 128.489 114.242 49.415 1.00 5.83  17  M 1 \nATOM   200  H  H    . GLU M  1 18  ? 131.409 118.555 52.378 1.00 5.83  17  M 1 \nATOM   201  H  HA   . GLU M  1 18  ? 130.552 116.395 53.488 1.00 5.83  17  M 1 \nATOM   202  H  HB2  . GLU M  1 18  ? 129.737 117.223 51.446 1.00 5.83  17  M 1 \nATOM   203  H  HB3  . GLU M  1 18  ? 131.070 116.780 50.732 1.00 5.83  17  M 1 \nATOM   204  H  HG2  . GLU M  1 18  ? 130.539 114.574 51.031 1.00 5.83  17  M 1 \nATOM   205  H  HG3  . GLU M  1 18  ? 129.220 114.990 51.814 1.00 5.83  17  M 1 \nATOM   206  N  N    . ALA M  1 19  ? 133.426 116.014 52.101 1.00 5.64  18  M 1 \nATOM   207  C  CA   . ALA M  1 19  ? 134.627 115.186 52.077 1.00 5.64  18  M 1 \nATOM   208  C  C    . ALA M  1 19  ? 135.261 115.089 53.461 1.00 5.64  18  M 1 \nATOM   209  O  O    . ALA M  1 19  ? 135.695 114.008 53.887 1.00 5.64  18  M 1 \nATOM   210  C  CB   . ALA M  1 19  ? 
135.619 115.756 51.068 1.00 5.64  18  M 1 \nATOM   211  H  H    . ALA M  1 19  ? 133.469 116.730 51.627 1.00 5.64  18  M 1 \nATOM   212  H  HA   . ALA M  1 19  ? 134.387 114.294 51.780 1.00 5.64  18  M 1 \nATOM   213  H  HB1  . ALA M  1 19  ? 136.445 115.249 51.108 1.00 5.64  18  M 1 \nATOM   214  H  HB2  . ALA M  1 19  ? 135.231 115.688 50.181 1.00 5.64  18  M 1 \nATOM   215  H  HB3  . ALA M  1 19  ? 135.792 116.686 51.281 1.00 5.64  18  M 1 \nATOM   216  N  N    . ALA M  1 20  ? 135.309 116.209 54.182 1.00 5.19  19  M 1 \nATOM   217  C  CA   . ALA M  1 20  ? 135.912 116.226 55.509 1.00 5.19  19  M 1 \nATOM   218  C  C    . ALA M  1 20  ? 135.118 115.366 56.484 1.00 5.19  19  M 1 \nATOM   219  O  O    . ALA M  1 20  ? 135.694 114.687 57.340 1.00 5.19  19  M 1 \nATOM   220  C  CB   . ALA M  1 20  ? 136.010 117.663 56.015 1.00 5.19  19  M 1 \nATOM   221  H  H    . ALA M  1 20  ? 134.988 116.964 53.924 1.00 5.19  19  M 1 \nATOM   222  H  HA   . ALA M  1 20  ? 136.813 115.873 55.449 1.00 5.19  19  M 1 \nATOM   223  H  HB1  . ALA M  1 20  ? 136.318 117.661 56.935 1.00 5.19  19  M 1 \nATOM   224  H  HB2  . ALA M  1 20  ? 136.643 118.153 55.468 1.00 5.19  19  M 1 \nATOM   225  H  HB3  . ALA M  1 20  ? 135.136 118.080 55.963 1.00 5.19  19  M 1 \nATOM   226  N  N    . ILE M  1 21  ? 133.794 115.373 56.355 1.00 4.65  20  M 1 \nATOM   227  C  CA   . ILE M  1 21  ? 132.950 114.537 57.205 1.00 4.65  20  M 1 \nATOM   228  C  C    . ILE M  1 21  ? 133.187 113.062 56.918 1.00 4.65  20  M 1 \nATOM   229  O  O    . ILE M  1 21  ? 133.212 112.237 57.837 1.00 4.65  20  M 1 \nATOM   230  C  CB   . ILE M  1 21  ? 131.466 114.924 57.036 1.00 4.65  20  M 1 \nATOM   231  C  CG1  . ILE M  1 21  ? 131.165 116.301 57.642 1.00 4.65  20  M 1 \nATOM   232  C  CG2  . ILE M  1 21  ? 130.563 113.897 57.679 1.00 4.65  20  M 1 \nATOM   233  C  CD1  . ILE M  1 21  ? 131.182 116.337 59.164 1.00 4.65  20  M 1 \nATOM   234  H  H    . ILE M  1 21  ? 
133.365 115.839 55.774 1.00 4.65  20  M 1 \nATOM   235  H  HA   . ILE M  1 21  ? 133.213 114.693 58.125 1.00 4.65  20  M 1 \nATOM   236  H  HB   . ILE M  1 21  ? 131.263 114.954 56.088 1.00 4.65  20  M 1 \nATOM   237  H  HG12 . ILE M  1 21  ? 131.845 116.927 57.348 1.00 4.65  20  M 1 \nATOM   238  H  HG13 . ILE M  1 21  ? 130.297 116.611 57.340 1.00 4.65  20  M 1 \nATOM   239  H  HG21 . ILE M  1 21  ? 129.700 114.308 57.842 1.00 4.65  20  M 1 \nATOM   240  H  HG22 . ILE M  1 21  ? 130.447 113.140 57.083 1.00 4.65  20  M 1 \nATOM   241  H  HG23 . ILE M  1 21  ? 130.944 113.601 58.521 1.00 4.65  20  M 1 \nATOM   242  H  HD11 . ILE M  1 21  ? 131.445 117.226 59.450 1.00 4.65  20  M 1 \nATOM   243  H  HD12 . ILE M  1 21  ? 130.292 116.138 59.495 1.00 4.65  20  M 1 \nATOM   244  H  HD13 . ILE M  1 21  ? 131.804 115.688 59.529 1.00 4.65  20  M 1 \nATOM   245  N  N    . ASN M  1 22  ? 133.341 112.698 55.646 1.00 4.76  21  M 1 \nATOM   246  C  CA   . ASN M  1 22  ? 133.649 111.301 55.339 1.00 4.76  21  M 1 \nATOM   247  C  C    . ASN M  1 22  ? 134.999 110.889 55.925 1.00 4.76  21  M 1 \nATOM   248  O  O    . ASN M  1 22  ? 135.141 109.784 56.475 1.00 4.76  21  M 1 \nATOM   249  C  CB   . ASN M  1 22  ? 133.598 111.055 53.832 1.00 4.76  21  M 1 \nATOM   250  C  CG   . ASN M  1 22  ? 132.178 111.044 53.293 1.00 4.76  21  M 1 \nATOM   251  O  OD1  . ASN M  1 22  ? 131.264 110.549 53.941 1.00 4.76  21  M 1 \nATOM   252  N  ND2  . ASN M  1 22  ? 132.000 111.547 52.086 1.00 4.76  21  M 1 \nATOM   253  H  H    . ASN M  1 22  ? 133.277 113.220 54.965 1.00 4.76  21  M 1 \nATOM   254  H  HA   . ASN M  1 22  ? 132.976 110.740 55.755 1.00 4.76  21  M 1 \nATOM   255  H  HB2  . ASN M  1 22  ? 134.078 111.762 53.373 1.00 4.76  21  M 1 \nATOM   256  H  HB3  . ASN M  1 22  ? 134.006 110.200 53.626 1.00 4.76  21  M 1 \nATOM   257  H  HD21 . ASN M  1 22  ? 132.665 111.877 51.652 1.00 4.76  21  M 1 \nATOM   258  H  HD22 . ASN M  1 22  ? 
131.214 111.556 51.737 1.00 4.76  21  M 1 \nATOM   259  N  N    . ARG M  1 23  ? 135.968 111.799 55.858 1.00 5.20  22  M 1 \nATOM   260  C  CA   . ARG M  1 23  ? 137.304 111.552 56.459 1.00 5.20  22  M 1 \nATOM   261  C  C    . ARG M  1 23  ? 137.134 111.402 57.973 1.00 5.20  22  M 1 \nATOM   262  O  O    . ARG M  1 23  ? 137.736 110.506 58.538 1.00 5.20  22  M 1 \nATOM   263  C  CB   . ARG M  1 23  ? 138.287 112.670 56.112 1.00 5.20  22  M 1 \nATOM   264  C  CG   . ARG M  1 23  ? 138.602 112.743 54.626 1.00 5.20  22  M 1 \nATOM   265  C  CD   . ARG M  1 23  ? 139.855 113.564 54.401 1.00 5.20  22  M 1 \nATOM   266  N  NE   . ARG M  1 23  ? 139.739 114.892 54.977 1.00 5.20  22  M 1 \nATOM   267  C  CZ   . ARG M  1 23  ? 139.293 115.956 54.319 1.00 5.20  22  M 1 \nATOM   268  N  NH1  . ARG M  1 23  ? 138.919 115.844 53.060 1.00 5.20  22  M 1 \nATOM   269  N  NH2  . ARG M  1 23  ? 139.230 117.132 54.915 1.00 5.20  22  M 1 \nATOM   270  H  H    . ARG M  1 23  ? 135.834 112.649 55.562 1.00 5.20  22  M 1 \nATOM   271  H  HA   . ARG M  1 23  ? 137.651 110.704 56.097 1.00 5.20  22  M 1 \nATOM   272  H  HB2  . ARG M  1 23  ? 137.907 113.526 56.400 1.00 5.20  22  M 1 \nATOM   273  H  HB3  . ARG M  1 23  ? 139.120 112.524 56.609 1.00 5.20  22  M 1 \nATOM   274  H  HG2  . ARG M  1 23  ? 138.737 111.838 54.272 1.00 5.20  22  M 1 \nATOM   275  H  HG3  . ARG M  1 23  ? 137.852 113.155 54.148 1.00 5.20  22  M 1 \nATOM   276  H  HD2  . ARG M  1 23  ? 140.622 113.103 54.803 1.00 5.20  22  M 1 \nATOM   277  H  HD3  . ARG M  1 23  ? 140.021 113.643 53.437 1.00 5.20  22  M 1 \nATOM   278  H  HE   . ARG M  1 23  ? 139.984 115.002 55.807 1.00 5.20  22  M 1 \nATOM   279  H  HH11 . ARG M  1 23  ? 138.963 115.063 52.658 1.00 5.20  22  M 1 \nATOM   280  H  HH12 . ARG M  1 23  ? 138.624 116.549 52.626 1.00 5.20  22  M 1 \nATOM   281  H  HH21 . ARG M  1 23  ? 139.480 117.211 55.756 1.00 5.20  22  M 1 \nATOM   282  H  HH22 . ARG M  1 23  ? 
138.932 117.833 54.473 1.00 5.20  22  M 1 \nATOM   283  N  N    . GLN M  1 24  ? 136.303 112.230 58.589 1.00 4.27  23  M 1 \nATOM   284  C  CA   . GLN M  1 24  ? 136.057 112.163 60.050 1.00 4.27  23  M 1 \nATOM   285  C  C    . GLN M  1 24  ? 135.381 110.826 60.366 1.00 4.27  23  M 1 \nATOM   286  O  O    . GLN M  1 24  ? 135.792 110.182 61.304 1.00 4.27  23  M 1 \nATOM   287  C  CB   . GLN M  1 24  ? 135.231 113.334 60.583 1.00 4.27  23  M 1 \nATOM   288  C  CG   . GLN M  1 24  ? 135.188 113.347 62.108 1.00 4.27  23  M 1 \nATOM   289  C  CD   . GLN M  1 24  ? 136.537 113.649 62.722 1.00 4.27  23  M 1 \nATOM   290  O  OE1  . GLN M  1 24  ? 137.398 114.230 62.085 1.00 4.27  23  M 1 \nATOM   291  N  NE2  . GLN M  1 24  ? 136.731 113.278 63.973 1.00 4.27  23  M 1 \nATOM   292  H  H    . GLN M  1 24  ? 135.752 112.801 58.143 1.00 4.27  23  M 1 \nATOM   293  H  HA   . GLN M  1 24  ? 136.933 112.175 60.501 1.00 4.27  23  M 1 \nATOM   294  H  HB2  . GLN M  1 24  ? 135.623 114.172 60.260 1.00 4.27  23  M 1 \nATOM   295  H  HB3  . GLN M  1 24  ? 134.319 113.266 60.231 1.00 4.27  23  M 1 \nATOM   296  H  HG2  . GLN M  1 24  ? 134.542 114.023 62.406 1.00 4.27  23  M 1 \nATOM   297  H  HG3  . GLN M  1 24  ? 134.878 112.473 62.429 1.00 4.27  23  M 1 \nATOM   298  H  HE21 . GLN M  1 24  ? 136.087 112.865 64.417 1.00 4.27  23  M 1 \nATOM   299  H  HE22 . GLN M  1 24  ? 137.504 113.442 64.368 1.00 4.27  23  M 1 \nATOM   300  N  N    . ILE M  1 25  ? 134.455 110.366 59.533 1.00 4.04  24  M 1 \nATOM   301  C  CA   . ILE M  1 25  ? 133.757 109.072 59.780 1.00 4.04  24  M 1 \nATOM   302  C  C    . ILE M  1 25  ? 134.814 107.969 59.775 1.00 4.04  24  M 1 \nATOM   303  O  O    . ILE M  1 25  ? 134.825 107.162 60.686 1.00 4.04  24  M 1 \nATOM   304  C  CB   . ILE M  1 25  ? 132.669 108.811 58.722 1.00 4.04  24  M 1 \nATOM   305  C  CG1  . ILE M  1 25  ? 131.463 109.726 58.927 1.00 4.04  24  M 1 \nATOM   306  C  CG2  . ILE M  1 25  ? 
132.268 107.346 58.704 1.00 4.04  24  M 1 \nATOM   307  C  CD1  . ILE M  1 25  ? 130.542 109.790 57.732 1.00 4.04  24  M 1 \nATOM   308  H  H    . ILE M  1 25  ? 134.294 110.730 58.714 1.00 4.04  24  M 1 \nATOM   309  H  HA   . ILE M  1 25  ? 133.339 109.104 60.659 1.00 4.04  24  M 1 \nATOM   310  H  HB   . ILE M  1 25  ? 133.057 109.027 57.838 1.00 4.04  24  M 1 \nATOM   311  H  HG12 . ILE M  1 25  ? 130.953 109.407 59.703 1.00 4.04  24  M 1 \nATOM   312  H  HG13 . ILE M  1 25  ? 131.783 110.631 59.129 1.00 4.04  24  M 1 \nATOM   313  H  HG21 . ILE M  1 25  ? 131.520 107.219 58.094 1.00 4.04  24  M 1 \nATOM   314  H  HG22 . ILE M  1 25  ? 133.020 106.805 58.408 1.00 4.04  24  M 1 \nATOM   315  H  HG23 . ILE M  1 25  ? 132.004 107.068 59.598 1.00 4.04  24  M 1 \nATOM   316  H  HD11 . ILE M  1 25  ? 129.788 110.372 57.933 1.00 4.04  24  M 1 \nATOM   317  H  HD12 . ILE M  1 25  ? 131.027 110.141 56.966 1.00 4.04  24  M 1 \nATOM   318  H  HD13 . ILE M  1 25  ? 130.213 108.898 57.525 1.00 4.04  24  M 1 \nATOM   319  N  N    . ASN M  1 26  ? 135.739 107.997 58.831 1.00 4.23  25  M 1 \nATOM   320  C  CA   . ASN M  1 26  ? 136.770 106.935 58.766 1.00 4.23  25  M 1 \nATOM   321  C  C    . ASN M  1 26  ? 137.629 107.000 60.033 1.00 4.23  25  M 1 \nATOM   322  O  O    . ASN M  1 26  ? 137.870 105.966 60.618 1.00 4.23  25  M 1 \nATOM   323  C  CB   . ASN M  1 26  ? 137.632 107.025 57.513 1.00 4.23  25  M 1 \nATOM   324  C  CG   . ASN M  1 26  ? 138.457 105.768 57.372 1.00 4.23  25  M 1 \nATOM   325  O  OD1  . ASN M  1 26  ? 139.615 105.766 57.731 1.00 4.23  25  M 1 \nATOM   326  N  ND2  . ASN M  1 26  ? 137.836 104.688 56.940 1.00 4.23  25  M 1 \nATOM   327  H  H    . ASN M  1 26  ? 135.874 108.705 58.276 1.00 4.23  25  M 1 \nATOM   328  H  HA   . ASN M  1 26  ? 136.310 106.063 58.747 1.00 4.23  25  M 1 \nATOM   329  H  HB2  . ASN M  1 26  ? 137.058 107.133 56.728 1.00 4.23  25  M 1 \nATOM   330  H  HB3  . ASN M  1 26  ? 
138.224 107.802 57.579 1.00 4.23  25  M 1 \nATOM   331  H  HD21 . ASN M  1 26  ? 136.953 104.669 56.909 1.00 4.23  25  M 1 \nATOM   332  H  HD22 . ASN M  1 26  ? 138.302 103.982 56.685 1.00 4.23  25  M 1 \nATOM   333  N  N    . LEU M  1 27  ? 137.977 108.199 60.481 1.00 4.02  26  M 1 \nATOM   334  C  CA   . LEU M  1 27  ? 138.840 108.382 61.679 1.00 4.02  26  M 1 \nATOM   335  C  C    . LEU M  1 27  ? 138.126 107.816 62.917 1.00 4.02  26  M 1 \nATOM   336  O  O    . LEU M  1 27  ? 138.760 107.121 63.684 1.00 4.02  26  M 1 \nATOM   337  C  CB   . LEU M  1 27  ? 139.149 109.873 61.835 1.00 4.02  26  M 1 \nATOM   338  C  CG   . LEU M  1 27  ? 140.085 110.228 62.989 1.00 4.02  26  M 1 \nATOM   339  C  CD1  . LEU M  1 27  ? 141.294 109.307 63.013 1.00 4.02  26  M 1 \nATOM   340  C  CD2  . LEU M  1 27  ? 140.521 111.687 62.919 1.00 4.02  26  M 1 \nATOM   341  H  H    . LEU M  1 27  ? 137.610 108.970 60.164 1.00 4.02  26  M 1 \nATOM   342  H  HA   . LEU M  1 27  ? 139.678 107.884 61.539 1.00 4.02  26  M 1 \nATOM   343  H  HB2  . LEU M  1 27  ? 139.548 110.193 61.001 1.00 4.02  26  M 1 \nATOM   344  H  HB3  . LEU M  1 27  ? 138.305 110.351 61.961 1.00 4.02  26  M 1 \nATOM   345  H  HG   . LEU M  1 27  ? 139.588 110.099 63.834 1.00 4.02  26  M 1 \nATOM   346  H  HD11 . LEU M  1 27  ? 141.901 109.586 63.720 1.00 4.02  26  M 1 \nATOM   347  H  HD12 . LEU M  1 27  ? 141.003 108.393 63.178 1.00 4.02  26  M 1 \nATOM   348  H  HD13 . LEU M  1 27  ? 141.753 109.351 62.156 1.00 4.02  26  M 1 \nATOM   349  H  HD21 . LEU M  1 27  ? 141.103 111.888 63.672 1.00 4.02  26  M 1 \nATOM   350  H  HD22 . LEU M  1 27  ? 141.001 111.843 62.087 1.00 4.02  26  M 1 \nATOM   351  H  HD23 . LEU M  1 27  ? 139.737 112.262 62.953 1.00 4.02  26  M 1 \nATOM   352  N  N    . GLU M  1 28  ? 136.831 108.071 63.062 1.00 4.01  27  M 1 \nATOM   353  C  CA   . GLU M  1 28  ? 136.023 107.567 64.213 1.00 4.01  27  M 1 \nATOM   354  C  C    . GLU M  1 28  ? 
135.968 106.029 64.180 1.00 4.01  27  M 1 \nATOM   355  O  O    . GLU M  1 28  ? 136.192 105.431 65.200 1.00 4.01  27  M 1 \nATOM   356  C  CB   . GLU M  1 28  ? 134.646 108.231 64.224 1.00 4.01  27  M 1 \nATOM   357  C  CG   . GLU M  1 28  ? 134.708 109.746 64.330 1.00 4.01  27  M 1 \nATOM   358  C  CD   . GLU M  1 28  ? 135.022 110.278 65.717 1.00 4.01  27  M 1 \nATOM   359  O  OE1  . GLU M  1 28  ? 135.132 111.477 65.845 1.00 4.01  27  M 1 \nATOM   360  O  OE2  . GLU M  1 28  ? 135.180 109.480 66.654 1.00 4.01  27  M 1 \nATOM   361  H  H    . GLU M  1 28  ? 136.336 108.472 62.412 1.00 4.01  27  M 1 \nATOM   362  H  HA   . GLU M  1 28  ? 136.491 107.832 65.039 1.00 4.01  27  M 1 \nATOM   363  H  HB2  . GLU M  1 28  ? 134.174 107.988 63.400 1.00 4.01  27  M 1 \nATOM   364  H  HB3  . GLU M  1 28  ? 134.133 107.879 64.981 1.00 4.01  27  M 1 \nATOM   365  H  HG2  . GLU M  1 28  ? 135.391 110.078 63.709 1.00 4.01  27  M 1 \nATOM   366  H  HG3  . GLU M  1 28  ? 133.846 110.118 64.045 1.00 4.01  27  M 1 \nATOM   367  N  N    . LEU M  1 29  ? 135.785 105.403 63.026 1.00 3.51  28  M 1 \nATOM   368  C  CA   . LEU M  1 29  ? 135.765 103.946 62.933 1.00 3.51  28  M 1 \nATOM   369  C  C    . LEU M  1 29  ? 137.136 103.360 63.258 1.00 3.51  28  M 1 \nATOM   370  O  O    . LEU M  1 29  ? 137.245 102.337 63.952 1.00 3.51  28  M 1 \nATOM   371  C  CB   . LEU M  1 29  ? 135.301 103.527 61.538 1.00 3.51  28  M 1 \nATOM   372  C  CG   . LEU M  1 29  ? 133.853 103.850 61.150 1.00 3.51  28  M 1 \nATOM   373  C  CD1  . LEU M  1 29  ? 133.595 103.571 59.675 1.00 3.51  28  M 1 \nATOM   374  C  CD2  . LEU M  1 29  ? 132.868 103.099 62.048 1.00 3.51  28  M 1 \nATOM   375  H  H    . LEU M  1 29  ? 135.653 105.809 62.280 1.00 3.51  28  M 1 \nATOM   376  H  HA   . LEU M  1 29  ? 135.135 103.595 63.582 1.00 3.51  28  M 1 \nATOM   377  H  HB2  . LEU M  1 29  ? 135.875 103.956 60.885 1.00 3.51  28  M 1 \nATOM   378  H  HB3  . LEU M  1 29  ? 
135.409 102.566 61.462 1.00 3.51  28  M 1 \nATOM   379  H  HG   . LEU M  1 29  ? 133.694 104.797 61.289 1.00 3.51  28  M 1 \nATOM   380  H  HD11 . LEU M  1 29  ? 132.643 103.636 59.502 1.00 3.51  28  M 1 \nATOM   381  H  HD12 . LEU M  1 29  ? 134.053 104.234 59.135 1.00 3.51  28  M 1 \nATOM   382  H  HD13 . LEU M  1 29  ? 133.912 102.684 59.442 1.00 3.51  28  M 1 \nATOM   383  H  HD21 . LEU M  1 29  ? 132.022 102.980 61.589 1.00 3.51  28  M 1 \nATOM   384  H  HD22 . LEU M  1 29  ? 133.233 102.231 62.281 1.00 3.51  28  M 1 \nATOM   385  H  HD23 . LEU M  1 29  ? 132.726 103.616 62.856 1.00 3.51  28  M 1 \nATOM   386  N  N    . TYR M  1 30  ? 138.197 104.018 62.789 1.00 3.71  29  M 1 \nATOM   387  C  CA   . TYR M  1 30  ? 139.553 103.601 63.125 1.00 3.71  29  M 1 \nATOM   388  C  C    . TYR M  1 30  ? 139.788 103.627 64.630 1.00 3.71  29  M 1 \nATOM   389  O  O    . TYR M  1 30  ? 140.367 102.694 65.193 1.00 3.71  29  M 1 \nATOM   390  C  CB   . TYR M  1 30  ? 140.558 104.494 62.407 1.00 3.71  29  M 1 \nATOM   391  C  CG   . TYR M  1 30  ? 141.983 104.208 62.780 1.00 3.71  29  M 1 \nATOM   392  C  CD1  . TYR M  1 30  ? 142.637 103.095 62.294 1.00 3.71  29  M 1 \nATOM   393  C  CD2  . TYR M  1 30  ? 142.674 105.050 63.634 1.00 3.71  29  M 1 \nATOM   394  C  CE1  . TYR M  1 30  ? 143.934 102.835 62.635 1.00 3.71  29  M 1 \nATOM   395  C  CE2  . TYR M  1 30  ? 143.977 104.793 63.983 1.00 3.71  29  M 1 \nATOM   396  C  CZ   . TYR M  1 30  ? 144.601 103.678 63.482 1.00 3.71  29  M 1 \nATOM   397  O  OH   . TYR M  1 30  ? 145.902 103.394 63.809 1.00 3.71  29  M 1 \nATOM   398  H  H    . TYR M  1 30  ? 138.158 104.711 62.281 1.00 3.71  29  M 1 \nATOM   399  H  HA   . TYR M  1 30  ? 139.690 102.691 62.818 1.00 3.71  29  M 1 \nATOM   400  H  HB2  . TYR M  1 30  ? 140.472 104.349 61.452 1.00 3.71  29  M 1 \nATOM   401  H  HB3  . TYR M  1 30  ? 140.372 105.424 62.613 1.00 3.71  29  M 1 \nATOM   402  H  HD1  . TYR M  1 30  ? 
142.192 102.514 61.720 1.00 3.71  29  M 1 \nATOM   403  H  HD2  . TYR M  1 30  ? 142.251 105.805 63.975 1.00 3.71  29  M 1 \nATOM   404  H  HE1  . TYR M  1 30  ? 144.359 102.079 62.298 1.00 3.71  29  M 1 \nATOM   405  H  HE2  . TYR M  1 30  ? 144.429 105.369 64.556 1.00 3.71  29  M 1 \nATOM   406  H  HH   . TYR M  1 30  ? 146.373 103.345 63.115 1.00 3.71  29  M 1 \nATOM   407  N  N    . ALA M  1 31  ? 139.356 104.699 65.292 1.00 3.35  30  M 1 \nATOM   408  C  CA   . ALA M  1 31  ? 139.528 104.812 66.738 1.00 3.35  30  M 1 \nATOM   409  C  C    . ALA M  1 31  ? 138.774 103.707 67.462 1.00 3.35  30  M 1 \nATOM   410  O  O    . ALA M  1 31  ? 139.276 103.129 68.437 1.00 3.35  30  M 1 \nATOM   411  C  CB   . ALA M  1 31  ? 139.056 106.184 67.214 1.00 3.35  30  M 1 \nATOM   412  H  H    . ALA M  1 31  ? 138.946 105.361 64.927 1.00 3.35  30  M 1 \nATOM   413  H  HA   . ALA M  1 31  ? 140.472 104.735 66.949 1.00 3.35  30  M 1 \nATOM   414  H  HB1  . ALA M  1 31  ? 139.116 106.235 68.181 1.00 3.35  30  M 1 \nATOM   415  H  HB2  . ALA M  1 31  ? 139.622 106.867 66.821 1.00 3.35  30  M 1 \nATOM   416  H  HB3  . ALA M  1 31  ? 138.134 106.318 66.945 1.00 3.35  30  M 1 \nATOM   417  N  N    . SER M  1 32  ? 137.564 103.400 66.993 1.00 3.18  31  M 1 \nATOM   418  C  CA   . SER M  1 32  ? 136.811 102.293 67.567 1.00 3.18  31  M 1 \nATOM   419  C  C    . SER M  1 32  ? 137.603 100.999 67.464 1.00 3.18  31  M 1 \nATOM   420  O  O    . SER M  1 32  ? 137.641 100.201 68.404 1.00 3.18  31  M 1 \nATOM   421  C  CB   . SER M  1 32  ? 135.466 102.139 66.865 1.00 3.18  31  M 1 \nATOM   422  O  OG   . SER M  1 32  ? 134.752 101.051 67.407 1.00 3.18  31  M 1 \nATOM   423  H  H    . SER M  1 32  ? 137.174 103.793 66.335 1.00 3.18  31  M 1 \nATOM   424  H  HA   . SER M  1 32  ? 136.630 102.476 68.502 1.00 3.18  31  M 1 \nATOM   425  H  HB2  . SER M  1 32  ? 134.939 102.946 66.973 1.00 3.18  31  M 1 \nATOM   426  H  HB3  . SER M  1 32  ? 
135.620 101.974 65.922 1.00 3.18  31  M 1 \nATOM   427  H  HG   . SER M  1 32  ? 135.094 100.829 68.141 1.00 3.18  31  M 1 \nATOM   428  N  N    . TYR M  1 33  ? 138.275 100.799 66.337 1.00 3.03  32  M 1 \nATOM   429  C  CA   . TYR M  1 33  ? 138.957 99.533  66.105 1.00 3.03  32  M 1 \nATOM   430  C  C    . TYR M  1 33  ? 140.246 99.446  66.928 1.00 3.03  32  M 1 \nATOM   431  O  O    . TYR M  1 33  ? 140.590 98.384  67.463 1.00 3.03  32  M 1 \nATOM   432  C  CB   . TYR M  1 33  ? 139.148 99.386  64.594 1.00 3.03  32  M 1 \nATOM   433  C  CG   . TYR M  1 33  ? 139.641 98.067  64.082 1.00 3.03  32  M 1 \nATOM   434  C  CD1  . TYR M  1 33  ? 139.026 96.900  64.464 1.00 3.03  32  M 1 \nATOM   435  C  CD2  . TYR M  1 33  ? 140.504 98.008  63.005 1.00 3.03  32  M 1 \nATOM   436  C  CE1  . TYR M  1 33  ? 139.409 95.696  63.962 1.00 3.03  32  M 1 \nATOM   437  C  CE2  . TYR M  1 33  ? 140.878 96.805  62.460 1.00 3.03  32  M 1 \nATOM   438  C  CZ   . TYR M  1 33  ? 140.315 95.642  62.942 1.00 3.03  32  M 1 \nATOM   439  O  OH   . TYR M  1 33  ? 140.653 94.414  62.435 1.00 3.03  32  M 1 \nATOM   440  H  H    . TYR M  1 33  ? 138.348 101.369 65.698 1.00 3.03  32  M 1 \nATOM   441  H  HA   . TYR M  1 33  ? 138.370 98.818  66.396 1.00 3.03  32  M 1 \nATOM   442  H  HB2  . TYR M  1 33  ? 138.302 99.563  64.154 1.00 3.03  32  M 1 \nATOM   443  H  HB3  . TYR M  1 33  ? 139.791 100.056 64.312 1.00 3.03  32  M 1 \nATOM   444  H  HD1  . TYR M  1 33  ? 138.426 96.924  65.175 1.00 3.03  32  M 1 \nATOM   445  H  HD2  . TYR M  1 33  ? 140.889 98.792  62.686 1.00 3.03  32  M 1 \nATOM   446  H  HE1  . TYR M  1 33  ? 139.016 94.918  64.286 1.00 3.03  32  M 1 \nATOM   447  H  HE2  . TYR M  1 33  ? 141.500 96.784  61.769 1.00 3.03  32  M 1 \nATOM   448  H  HH   . TYR M  1 33  ? 141.157 94.498  61.768 1.00 3.03  32  M 1 \nATOM   449  N  N    . VAL M  1 34  ? 140.915 100.585 67.121 1.00 3.46  33  M 1 \nATOM   450  C  CA   . VAL M  1 34  ? 
142.055 100.663 68.039 1.00 3.46  33  M 1 \nATOM   451  C  C    . VAL M  1 34  ? 141.629 100.281 69.455 1.00 3.46  33  M 1 \nATOM   452  O  O    . VAL M  1 34  ? 142.290 99.482  70.134 1.00 3.46  33  M 1 \nATOM   453  C  CB   . VAL M  1 34  ? 142.683 102.071 68.007 1.00 3.46  33  M 1 \nATOM   454  C  CG1  . VAL M  1 34  ? 143.748 102.219 69.088 1.00 3.46  33  M 1 \nATOM   455  C  CG2  . VAL M  1 34  ? 143.311 102.347 66.654 1.00 3.46  33  M 1 \nATOM   456  H  H    . VAL M  1 34  ? 140.716 101.332 66.744 1.00 3.46  33  M 1 \nATOM   457  H  HA   . VAL M  1 34  ? 142.735 100.036 67.747 1.00 3.46  33  M 1 \nATOM   458  H  HB   . VAL M  1 34  ? 141.995 102.736 68.165 1.00 3.46  33  M 1 \nATOM   459  H  HG11 . VAL M  1 34  ? 144.305 102.986 68.882 1.00 3.46  33  M 1 \nATOM   460  H  HG12 . VAL M  1 34  ? 143.331 102.360 69.952 1.00 3.46  33  M 1 \nATOM   461  H  HG13 . VAL M  1 34  ? 144.301 101.423 69.110 1.00 3.46  33  M 1 \nATOM   462  H  HG21 . VAL M  1 34  ? 143.667 103.249 66.651 1.00 3.46  33  M 1 \nATOM   463  H  HG22 . VAL M  1 34  ? 144.029 101.713 66.500 1.00 3.46  33  M 1 \nATOM   464  H  HG23 . VAL M  1 34  ? 142.654 102.259 65.946 1.00 3.46  33  M 1 \nATOM   465  N  N    . TYR M  1 35  ? 140.530 100.866 69.919 1.00 3.20  34  M 1 \nATOM   466  C  CA   . TYR M  1 35  ? 140.001 100.604 71.283 1.00 3.20  34  M 1 \nATOM   467  C  C    . TYR M  1 35  ? 139.639 99.114  71.378 1.00 3.20  34  M 1 \nATOM   468  O  O    . TYR M  1 35  ? 139.849 98.500  72.402 1.00 3.20  34  M 1 \nATOM   469  C  CB   . TYR M  1 35  ? 138.841 101.546 71.587 1.00 3.20  34  M 1 \nATOM   470  C  CG   . TYR M  1 35  ? 139.250 102.931 72.020 1.00 3.20  34  M 1 \nATOM   471  C  CD1  . TYR M  1 35  ? 140.196 103.117 73.010 1.00 3.20  34  M 1 \nATOM   472  C  CD2  . TYR M  1 35  ? 138.646 104.058 71.485 1.00 3.20  34  M 1 \nATOM   473  C  CE1  . TYR M  1 35  ? 140.544 104.389 73.448 1.00 3.20  34  M 1 \nATOM   474  C  CE2  . TYR M  1 35  ? 
138.992 105.335 71.899 1.00 3.20  34  M 1 \nATOM   475  C  CZ   . TYR M  1 35  ? 139.942 105.505 72.889 1.00 3.20  34  M 1 \nATOM   476  O  OH   . TYR M  1 35  ? 140.290 106.755 73.319 1.00 3.20  34  M 1 \nATOM   477  H  H    . TYR M  1 35  ? 139.962 101.356 69.405 1.00 3.20  34  M 1 \nATOM   478  H  HA   . TYR M  1 35  ? 140.725 100.784 71.935 1.00 3.20  34  M 1 \nATOM   479  H  HB2  . TYR M  1 35  ? 138.284 101.619 70.784 1.00 3.20  34  M 1 \nATOM   480  H  HB3  . TYR M  1 35  ? 138.294 101.144 72.294 1.00 3.20  34  M 1 \nATOM   481  H  HD1  . TYR M  1 35  ? 140.606 102.366 73.404 1.00 3.20  34  M 1 \nATOM   482  H  HD2  . TYR M  1 35  ? 137.992 103.955 70.813 1.00 3.20  34  M 1 \nATOM   483  H  HE1  . TYR M  1 35  ? 141.198 104.495 74.119 1.00 3.20  34  M 1 \nATOM   484  H  HE2  . TYR M  1 35  ? 138.571 106.086 71.515 1.00 3.20  34  M 1 \nATOM   485  H  HH   . TYR M  1 35  ? 139.593 107.177 73.589 1.00 3.20  34  M 1 \nATOM   486  N  N    . LEU M  1 36  ? 139.084 98.533  70.325 1.00 3.08  35  M 1 \nATOM   487  C  CA   . LEU M  1 36  ? 138.744 97.115  70.332 1.00 3.08  35  M 1 \nATOM   488  C  C    . LEU M  1 36  ? 139.990 96.254  70.508 1.00 3.08  35  M 1 \nATOM   489  O  O    . LEU M  1 36  ? 139.984 95.281  71.274 1.00 3.08  35  M 1 \nATOM   490  C  CB   . LEU M  1 36  ? 138.005 96.750  69.045 1.00 3.08  35  M 1 \nATOM   491  C  CG   . LEU M  1 36  ? 137.534 95.304  68.916 1.00 3.08  35  M 1 \nATOM   492  C  CD1  . LEU M  1 36  ? 136.553 94.968  70.028 1.00 3.08  35  M 1 \nATOM   493  C  CD2  . LEU M  1 36  ? 136.903 95.067  67.564 1.00 3.08  35  M 1 \nATOM   494  H  H    . LEU M  1 36  ? 138.894 98.952  69.598 1.00 3.08  35  M 1 \nATOM   495  H  HA   . LEU M  1 36  ? 138.158 96.956  71.088 1.00 3.08  35  M 1 \nATOM   496  H  HB2  . LEU M  1 36  ? 137.216 97.310  68.970 1.00 3.08  35  M 1 \nATOM   497  H  HB3  . LEU M  1 36  ? 138.587 96.937  68.292 1.00 3.08  35  M 1 \nATOM   498  H  HG   . LEU M  1 36  ? 
138.295 94.706  68.982 1.00 3.08  35  M 1 \nATOM   499  H  HD11 . LEU M  1 36  ? 136.178 94.088  69.867 1.00 3.08  35  M 1 \nATOM   500  H  HD12 . LEU M  1 36  ? 137.019 94.970  70.879 1.00 3.08  35  M 1 \nATOM   501  H  HD13 . LEU M  1 36  ? 135.843 95.629  70.043 1.00 3.08  35  M 1 \nATOM   502  H  HD21 . LEU M  1 36  ? 136.535 94.170  67.543 1.00 3.08  35  M 1 \nATOM   503  H  HD22 . LEU M  1 36  ? 136.197 95.717  67.423 1.00 3.08  35  M 1 \nATOM   504  H  HD23 . LEU M  1 36  ? 137.580 95.162  66.875 1.00 3.08  35  M 1 \nATOM   505  N  N    . SER M  1 37  ? 141.069 96.611  69.816 1.00 3.69  36  M 1 \nATOM   506  C  CA   . SER M  1 37  ? 142.323 95.872  69.937 1.00 3.69  36  M 1 \nATOM   507  C  C    . SER M  1 37  ? 142.871 95.954  71.360 1.00 3.69  36  M 1 \nATOM   508  O  O    . SER M  1 37  ? 143.339 94.957  71.924 1.00 3.69  36  M 1 \nATOM   509  C  CB   . SER M  1 37  ? 143.339 96.419  68.940 1.00 3.69  36  M 1 \nATOM   510  O  OG   . SER M  1 37  ? 144.559 95.726  69.033 1.00 3.69  36  M 1 \nATOM   511  H  H    . SER M  1 37  ? 141.104 97.291  69.290 1.00 3.69  36  M 1 \nATOM   512  H  HA   . SER M  1 37  ? 142.174 94.940  69.715 1.00 3.69  36  M 1 \nATOM   513  H  HB2  . SER M  1 37  ? 142.982 96.331  68.042 1.00 3.69  36  M 1 \nATOM   514  H  HB3  . SER M  1 37  ? 143.507 97.356  69.128 1.00 3.69  36  M 1 \nATOM   515  H  HG   . SER M  1 37  ? 144.931 95.734  68.280 1.00 3.69  36  M 1 \nATOM   516  N  N    . MET M  1 38  ? 142.811 97.145  71.956 1.00 3.57  37  M 1 \nATOM   517  C  CA   . MET M  1 38  ? 143.243 97.312  73.342 1.00 3.57  37  M 1 \nATOM   518  C  C    . MET M  1 38  ? 142.431 96.421  74.277 1.00 3.57  37  M 1 \nATOM   519  O  O    . MET M  1 38  ? 142.984 95.719  75.141 1.00 3.57  37  M 1 \nATOM   520  C  CB   . MET M  1 38  ? 143.122 98.784  73.749 1.00 3.57  37  M 1 \nATOM   521  C  CG   . MET M  1 38  ? 144.133 99.719  73.108 1.00 3.57  37  M 1 \nATOM   522  S  SD   . MET M  1 38  ? 
143.865 101.435 73.612 1.00 3.57  37  M 1 \nATOM   523  C  CE   . MET M  1 38  ? 145.135 102.271 72.672 1.00 3.57  37  M 1 \nATOM   524  H  H    . MET M  1 38  ? 142.498 97.857  71.588 1.00 3.57  37  M 1 \nATOM   525  H  HA   . MET M  1 38  ? 144.179 97.066  73.411 1.00 3.57  37  M 1 \nATOM   526  H  HB2  . MET M  1 38  ? 142.236 99.102  73.516 1.00 3.57  37  M 1 \nATOM   527  H  HB3  . MET M  1 38  ? 143.231 98.858  74.710 1.00 3.57  37  M 1 \nATOM   528  H  HG2  . MET M  1 38  ? 145.022 99.457  73.394 1.00 3.57  37  M 1 \nATOM   529  H  HG3  . MET M  1 38  ? 144.086 99.664  72.141 1.00 3.57  37  M 1 \nATOM   530  H  HE1  . MET M  1 38  ? 145.182 103.200 72.947 1.00 3.57  37  M 1 \nATOM   531  H  HE2  . MET M  1 38  ? 145.984 101.832 72.837 1.00 3.57  37  M 1 \nATOM   532  H  HE3  . MET M  1 38  ? 144.920 102.220 71.728 1.00 3.57  37  M 1 \nATOM   533  N  N    . SER M  1 39  ? 141.125 96.439  74.059 1.00 3.57  38  M 1 \nATOM   534  C  CA   . SER M  1 39  ? 140.177 95.667  74.882 1.00 3.57  38  M 1 \nATOM   535  C  C    . SER M  1 39  ? 140.572 94.195  74.781 1.00 3.57  38  M 1 \nATOM   536  O  O    . SER M  1 39  ? 140.725 93.591  75.818 1.00 3.57  38  M 1 \nATOM   537  C  CB   . SER M  1 39  ? 138.755 95.858  74.453 1.00 3.57  38  M 1 \nATOM   538  O  OG   . SER M  1 39  ? 137.885 95.283  75.403 1.00 3.57  38  M 1 \nATOM   539  H  H    . SER M  1 39  ? 140.739 96.797  73.317 1.00 3.57  38  M 1 \nATOM   540  H  HA   . SER M  1 39  ? 140.271 95.958  75.829 1.00 3.57  38  M 1 \nATOM   541  H  HB2  . SER M  1 39  ? 138.563 96.819  74.367 1.00 3.57  38  M 1 \nATOM   542  H  HB3  . SER M  1 39  ? 138.616 95.434  73.576 1.00 3.57  38  M 1 \nATOM   543  H  HG   . SER M  1 39  ? 138.336 95.071  76.086 1.00 3.57  38  M 1 \nATOM   544  N  N    . CYS M  1 40  ? 140.888 93.717  73.583 1.00 4.32  39  M 1 \nATOM   545  C  CA   . CYS M  1 40  ? 141.264 92.302  73.348 1.00 4.32  39  M 1 \nATOM   546  C  C    . CYS M  1 40  ? 
142.555 92.007  74.115 1.00 4.32  39  M 1 \nATOM   547  O  O    . CYS M  1 40  ? 142.598 91.009  74.795 1.00 4.32  39  M 1 \nATOM   548  C  CB   . CYS M  1 40  ? 141.449 92.000  71.865 1.00 4.32  39  M 1 \nATOM   549  S  SG   . CYS M  1 40  ? 139.891 91.997  70.941 1.00 4.32  39  M 1 \nATOM   550  H  H    . CYS M  1 40  ? 141.025 94.242  72.853 1.00 4.32  39  M 1 \nATOM   551  H  HA   . CYS M  1 40  ? 140.545 91.729  73.700 1.00 4.32  39  M 1 \nATOM   552  H  HB2  . CYS M  1 40  ? 142.044 92.671  71.472 1.00 4.32  39  M 1 \nATOM   553  H  HB3  . CYS M  1 40  ? 141.874 91.124  71.765 1.00 4.32  39  M 1 \nATOM   554  H  HG   . CYS M  1 40  ? 140.354 91.741  69.861 1.00 4.32  39  M 1 \nATOM   555  N  N    . TYR M  1 41  ? 143.500 92.935  74.109 1.00 4.38  40  M 1 \nATOM   556  C  CA   . TYR M  1 41  ? 144.808 92.747  74.775 1.00 4.38  40  M 1 \nATOM   557  C  C    . TYR M  1 41  ? 144.627 92.543  76.279 1.00 4.38  40  M 1 \nATOM   558  O  O    . TYR M  1 41  ? 145.227 91.640  76.793 1.00 4.38  40  M 1 \nATOM   559  C  CB   . TYR M  1 41  ? 145.702 93.952  74.532 1.00 4.38  40  M 1 \nATOM   560  C  CG   . TYR M  1 41  ? 147.002 93.889  75.275 1.00 4.38  40  M 1 \nATOM   561  C  CD1  . TYR M  1 41  ? 148.056 93.128  74.805 1.00 4.38  40  M 1 \nATOM   562  C  CD2  . TYR M  1 41  ? 147.181 94.611  76.438 1.00 4.38  40  M 1 \nATOM   563  C  CE1  . TYR M  1 41  ? 149.266 93.079  75.479 1.00 4.38  40  M 1 \nATOM   564  C  CE2  . TYR M  1 41  ? 148.382 94.574  77.123 1.00 4.38  40  M 1 \nATOM   565  C  CZ   . TYR M  1 41  ? 149.423 93.798  76.649 1.00 4.38  40  M 1 \nATOM   566  O  OH   . TYR M  1 41  ? 150.601 93.766  77.329 1.00 4.38  40  M 1 \nATOM   567  H  H    . TYR M  1 41  ? 143.368 93.789  73.825 1.00 4.38  40  M 1 \nATOM   568  H  HA   . TYR M  1 41  ? 145.245 91.942  74.397 1.00 4.38  40  M 1 \nATOM   569  H  HB2  . TYR M  1 41  ? 145.886 94.017  73.571 1.00 4.38  40  M 1 \nATOM   570  H  HB3  . TYR M  1 41  ? 
145.218 94.761  74.802 1.00 4.38  40  M 1 \nATOM   571  H  HD1  . TYR M  1 41  ? 147.951 92.633  74.009 1.00 4.38  40  M 1 \nATOM   572  H  HD2  . TYR M  1 41  ? 146.475 95.140  76.771 1.00 4.38  40  M 1 \nATOM   573  H  HE1  . TYR M  1 41  ? 149.973 92.549  75.150 1.00 4.38  40  M 1 \nATOM   574  H  HE2  . TYR M  1 41  ? 148.487 95.066  77.920 1.00 4.38  40  M 1 \nATOM   575  H  HH   . TYR M  1 41  ? 150.480 93.440  78.113 1.00 4.38  40  M 1 \nATOM   576  N  N    . PHE M  1 42  ? 143.784 93.325  76.942 1.00 3.75  41  M 1 \nATOM   577  C  CA   . PHE M  1 42  ? 143.626 93.250  78.424 1.00 3.75  41  M 1 \nATOM   578  C  C    . PHE M  1 42  ? 142.893 91.962  78.827 1.00 3.75  41  M 1 \nATOM   579  O  O    . PHE M  1 42  ? 142.921 91.650  79.995 1.00 3.75  41  M 1 \nATOM   580  C  CB   . PHE M  1 42  ? 143.056 94.559  78.978 1.00 3.75  41  M 1 \nATOM   581  C  CG   . PHE M  1 42  ? 144.075 95.668  78.885 1.00 3.75  41  M 1 \nATOM   582  C  CD1  . PHE M  1 42  ? 145.167 95.702  79.740 1.00 3.75  41  M 1 \nATOM   583  C  CD2  . PHE M  1 42  ? 144.003 96.615  77.879 1.00 3.75  41  M 1 \nATOM   584  C  CE1  . PHE M  1 42  ? 146.147 96.675  79.609 1.00 3.75  41  M 1 \nATOM   585  C  CE2  . PHE M  1 42  ? 144.963 97.613  77.774 1.00 3.75  41  M 1 \nATOM   586  C  CZ   . PHE M  1 42  ? 146.039 97.634  78.626 1.00 3.75  41  M 1 \nATOM   587  H  H    . PHE M  1 42  ? 143.184 93.883  76.545 1.00 3.75  41  M 1 \nATOM   588  H  HA   . PHE M  1 42  ? 144.541 93.169  78.795 1.00 3.75  41  M 1 \nATOM   589  H  HB2  . PHE M  1 42  ? 142.257 94.803  78.468 1.00 3.75  41  M 1 \nATOM   590  H  HB3  . PHE M  1 42  ? 142.799 94.426  79.914 1.00 3.75  41  M 1 \nATOM   591  H  HD1  . PHE M  1 42  ? 145.254 95.040  80.407 1.00 3.75  41  M 1 \nATOM   592  H  HD2  . PHE M  1 42  ? 143.271 96.606  77.284 1.00 3.75  41  M 1 \nATOM   593  H  HE1  . PHE M  1 42  ? 146.871 96.699  80.214 1.00 3.75  41  M 1 \nATOM   594  H  HE2  . PHE M  1 42  ? 
144.890 98.263  77.093 1.00 3.75  41  M 1 \nATOM   595  H  HZ   . PHE M  1 42  ? 146.689 98.314  78.553 1.00 3.75  41  M 1 \nATOM   596  N  N    . ASP M  1 43  ? 142.191 91.322  77.898 1.00 4.58  42  M 1 \nATOM   597  C  CA   . ASP M  1 43  ? 141.473 90.038  78.080 1.00 4.58  42  M 1 \nATOM   598  C  C    . ASP M  1 43  ? 142.425 88.840  77.923 1.00 4.58  42  M 1 \nATOM   599  O  O    . ASP M  1 43  ? 142.006 87.752  78.194 1.00 4.58  42  M 1 \nATOM   600  C  CB   . ASP M  1 43  ? 140.329 89.942  77.072 1.00 4.58  42  M 1 \nATOM   601  C  CG   . ASP M  1 43  ? 139.568 88.639  77.147 1.00 4.58  42  M 1 \nATOM   602  O  OD1  . ASP M  1 43  ? 139.070 88.323  78.243 1.00 4.58  42  M 1 \nATOM   603  O  OD2  . ASP M  1 43  ? 139.491 87.950  76.115 1.00 4.58  42  M 1 \nATOM   604  H  H    . ASP M  1 43  ? 142.065 91.654  77.065 1.00 4.58  42  M 1 \nATOM   605  H  HA   . ASP M  1 43  ? 141.091 90.021  78.989 1.00 4.58  42  M 1 \nATOM   606  H  HB2  . ASP M  1 43  ? 139.701 90.677  77.231 1.00 4.58  42  M 1 \nATOM   607  H  HB3  . ASP M  1 43  ? 140.690 90.039  76.168 1.00 4.58  42  M 1 \nATOM   608  N  N    . ARG M  1 44  ? 143.669 89.028  77.488 1.00 4.59  43  M 1 \nATOM   609  C  CA   . ARG M  1 44  ? 144.629 87.906  77.341 1.00 4.59  43  M 1 \nATOM   610  C  C    . ARG M  1 44  ? 144.872 87.264  78.707 1.00 4.59  43  M 1 \nATOM   611  O  O    . ARG M  1 44  ? 144.960 87.979  79.676 1.00 4.59  43  M 1 \nATOM   612  C  CB   . ARG M  1 44  ? 145.945 88.407  76.749 1.00 4.59  43  M 1 \nATOM   613  C  CG   . ARG M  1 44  ? 145.842 88.780  75.285 1.00 4.59  43  M 1 \nATOM   614  C  CD   . ARG M  1 44  ? 147.064 89.496  74.784 1.00 4.59  43  M 1 \nATOM   615  N  NE   . ARG M  1 44  ? 148.304 88.846  75.136 1.00 4.59  43  M 1 \nATOM   616  C  CZ   . ARG M  1 44  ? 149.445 89.019  74.482 1.00 4.59  43  M 1 \nATOM   617  N  NH1  . ARG M  1 44  ? 149.498 89.823  73.439 1.00 4.59  43  M 1 \nATOM   618  N  NH2  . ARG M  1 44  ? 
150.530 88.386  74.877 1.00 4.59  43  M 1 \nATOM   619  H  H    . ARG M  1 44  ? 144.027 89.832  77.290 1.00 4.59  43  M 1 \nATOM   620  H  HA   . ARG M  1 44  ? 144.238 87.234  76.736 1.00 4.59  43  M 1 \nATOM   621  H  HB2  . ARG M  1 44  ? 146.239 89.192  77.257 1.00 4.59  43  M 1 \nATOM   622  H  HB3  . ARG M  1 44  ? 146.623 87.708  76.852 1.00 4.59  43  M 1 \nATOM   623  H  HG2  . ARG M  1 44  ? 145.710 87.966  74.753 1.00 4.59  43  M 1 \nATOM   624  H  HG3  . ARG M  1 44  ? 145.059 89.356  75.152 1.00 4.59  43  M 1 \nATOM   625  H  HD2  . ARG M  1 44  ? 147.011 89.569  73.807 1.00 4.59  43  M 1 \nATOM   626  H  HD3  . ARG M  1 44  ? 147.069 90.407  75.149 1.00 4.59  43  M 1 \nATOM   627  H  HE   . ARG M  1 44  ? 148.305 88.305  75.821 1.00 4.59  43  M 1 \nATOM   628  H  HH11 . ARG M  1 44  ? 148.775 90.249  73.178 1.00 4.59  43  M 1 \nATOM   629  H  HH12 . ARG M  1 44  ? 150.258 89.935  73.012 1.00 4.59  43  M 1 \nATOM   630  H  HH21 . ARG M  1 44  ? 150.499 87.850  75.555 1.00 4.59  43  M 1 \nATOM   631  H  HH22 . ARG M  1 44  ? 151.285 88.501  74.438 1.00 4.59  43  M 1 \nATOM   632  N  N    . ASP M  1 45  ? 145.103 85.958  78.766 1.00 4.97  44  M 1 \nATOM   633  C  CA   . ASP M  1 45  ? 145.355 85.256  80.057 1.00 4.97  44  M 1 \nATOM   634  C  C    . ASP M  1 45  ? 146.668 85.742  80.712 1.00 4.97  44  M 1 \nATOM   635  O  O    . ASP M  1 45  ? 146.819 85.489  81.891 1.00 4.97  44  M 1 \nATOM   636  C  CB   . ASP M  1 45  ? 145.349 83.739  79.894 1.00 4.97  44  M 1 \nATOM   637  C  CG   . ASP M  1 45  ? 146.620 83.284  79.220 1.00 4.97  44  M 1 \nATOM   638  O  OD1  . ASP M  1 45  ? 147.606 83.093  79.940 1.00 4.97  44  M 1 \nATOM   639  O  OD2  . ASP M  1 45  ? 146.633 83.234  77.997 1.00 4.97  44  M 1 \nATOM   640  H  H    . ASP M  1 45  ? 145.234 85.444  78.027 1.00 4.97  44  M 1 \nATOM   641  H  HA   . ASP M  1 45  ? 144.615 85.487  80.666 1.00 4.97  44  M 1 \nATOM   642  H  HB2  . ASP M  1 45  ? 
145.279 83.310  80.771 1.00 4.97  44  M 1 \nATOM   643  H  HB3  . ASP M  1 45  ? 144.582 83.466  79.350 1.00 4.97  44  M 1 \nATOM   644  N  N    . ASP M  1 46  ? 147.649 86.258  79.969 1.00 4.81  45  M 1 \nATOM   645  C  CA   . ASP M  1 46  ? 148.928 86.748  80.536 1.00 4.81  45  M 1 \nATOM   646  C  C    . ASP M  1 46  ? 148.867 88.257  80.847 1.00 4.81  45  M 1 \nATOM   647  O  O    . ASP M  1 46  ? 149.900 88.769  81.216 1.00 4.81  45  M 1 \nATOM   648  C  CB   . ASP M  1 46  ? 150.117 86.389  79.649 1.00 4.81  45  M 1 \nATOM   649  C  CG   . ASP M  1 46  ? 149.985 86.864  78.215 1.00 4.81  45  M 1 \nATOM   650  O  OD1  . ASP M  1 46  ? 148.921 87.352  77.865 1.00 4.81  45  M 1 \nATOM   651  O  OD2  . ASP M  1 46  ? 150.959 86.728  77.462 1.00 4.81  45  M 1 \nATOM   652  H  H    . ASP M  1 46  ? 147.592 86.348  79.066 1.00 4.81  45  M 1 \nATOM   653  H  HA   . ASP M  1 46  ? 149.061 86.277  81.392 1.00 4.81  45  M 1 \nATOM   654  H  HB2  . ASP M  1 46  ? 150.928 86.785  80.029 1.00 4.81  45  M 1 \nATOM   655  H  HB3  . ASP M  1 46  ? 150.227 85.417  79.642 1.00 4.81  45  M 1 \nATOM   656  N  N    . VAL M  1 47  ? 147.711 88.919  80.748 1.00 4.20  46  M 1 \nATOM   657  C  CA   . VAL M  1 47  ? 147.532 90.321  81.107 1.00 4.20  46  M 1 \nATOM   658  C  C    . VAL M  1 47  ? 146.468 90.377  82.200 1.00 4.20  46  M 1 \nATOM   659  O  O    . VAL M  1 47  ? 146.740 90.802  83.326 1.00 4.20  46  M 1 \nATOM   660  C  CB   . VAL M  1 47  ? 147.159 91.167  79.874 1.00 4.20  46  M 1 \nATOM   661  C  CG1  . VAL M  1 47  ? 146.894 92.607  80.267 1.00 4.20  46  M 1 \nATOM   662  C  CG2  . VAL M  1 47  ? 148.260 91.084  78.816 1.00 4.20  46  M 1 \nATOM   663  H  H    . VAL M  1 47  ? 146.975 88.546  80.505 1.00 4.20  46  M 1 \nATOM   664  H  HA   . VAL M  1 47  ? 148.355 90.681  81.473 1.00 4.20  46  M 1 \nATOM   665  H  HB   . VAL M  1 47  ? 146.348 90.817  79.473 1.00 4.20  46  M 1 \nATOM   666  H  HG11 . VAL M  1 47  ? 
146.844 93.141  79.459 1.00 4.20  46  M 1 \nATOM   667  H  HG12 . VAL M  1 47  ? 146.053 92.662  80.747 1.00 4.20  46  M 1 \nATOM   668  H  HG13 . VAL M  1 47  ? 147.615 92.937  80.825 1.00 4.20  46  M 1 \nATOM   669  H  HG21 . VAL M  1 47  ? 148.056 91.680  78.078 1.00 4.20  46  M 1 \nATOM   670  H  HG22 . VAL M  1 47  ? 149.110 91.329  79.214 1.00 4.20  46  M 1 \nATOM   671  H  HG23 . VAL M  1 47  ? 148.314 90.176  78.480 1.00 4.20  46  M 1 \nATOM   672  N  N    . ALA M  1 48  ? 145.252 89.939  81.871 1.00 4.09  47  M 1 \nATOM   673  C  CA   . ALA M  1 48  ? 144.226 89.581  82.848 1.00 4.09  47  M 1 \nATOM   674  C  C    . ALA M  1 48  ? 143.784 90.780  83.690 1.00 4.09  47  M 1 \nATOM   675  O  O    . ALA M  1 48  ? 143.736 90.720  84.918 1.00 4.09  47  M 1 \nATOM   676  C  CB   . ALA M  1 48  ? 144.712 88.431  83.733 1.00 4.09  47  M 1 \nATOM   677  H  H    . ALA M  1 48  ? 144.982 89.848  81.060 1.00 4.09  47  M 1 \nATOM   678  H  HA   . ALA M  1 48  ? 143.445 89.262  82.369 1.00 4.09  47  M 1 \nATOM   679  H  HB1  . ALA M  1 48  ? 143.981 88.111  84.285 1.00 4.09  47  M 1 \nATOM   680  H  HB2  . ALA M  1 48  ? 145.014 87.713  83.155 1.00 4.09  47  M 1 \nATOM   681  H  HB3  . ALA M  1 48  ? 145.456 88.731  84.279 1.00 4.09  47  M 1 \nATOM   682  N  N    . LEU M  1 49  ? 143.443 91.870  83.008 1.00 3.91  48  M 1 \nATOM   683  C  CA   . LEU M  1 49  ? 142.931 93.101  83.616 1.00 3.91  48  M 1 \nATOM   684  C  C    . LEU M  1 49  ? 141.549 93.386  83.022 1.00 3.91  48  M 1 \nATOM   685  O  O    . LEU M  1 49  ? 141.416 94.075  82.011 1.00 3.91  48  M 1 \nATOM   686  C  CB   . LEU M  1 49  ? 143.918 94.244  83.389 1.00 3.91  48  M 1 \nATOM   687  C  CG   . LEU M  1 49  ? 145.258 94.024  84.111 1.00 3.91  48  M 1 \nATOM   688  C  CD1  . LEU M  1 49  ? 146.322 95.005  83.680 1.00 3.91  48  M 1 \nATOM   689  C  CD2  . LEU M  1 49  ? 145.071 94.083  85.631 1.00 3.91  48  M 1 \nATOM   690  H  H    . LEU M  1 49  ? 
143.516 91.927  82.153 1.00 3.91  48  M 1 \nATOM   691  H  HA   . LEU M  1 49  ? 142.808 92.984  84.571 1.00 3.91  48  M 1 \nATOM   692  H  HB2  . LEU M  1 49  ? 144.095 94.342  82.440 1.00 3.91  48  M 1 \nATOM   693  H  HB3  . LEU M  1 49  ? 143.525 95.066  83.722 1.00 3.91  48  M 1 \nATOM   694  H  HG   . LEU M  1 49  ? 145.595 93.140  83.896 1.00 3.91  48  M 1 \nATOM   695  H  HD11 . LEU M  1 49  ? 147.187 94.570  83.732 1.00 3.91  48  M 1 \nATOM   696  H  HD12 . LEU M  1 49  ? 146.165 95.292  82.767 1.00 3.91  48  M 1 \nATOM   697  H  HD13 . LEU M  1 49  ? 146.309 95.769  84.278 1.00 3.91  48  M 1 \nATOM   698  H  HD21 . LEU M  1 49  ? 145.899 94.367  86.048 1.00 3.91  48  M 1 \nATOM   699  H  HD22 . LEU M  1 49  ? 144.367 94.712  85.853 1.00 3.91  48  M 1 \nATOM   700  H  HD23 . LEU M  1 49  ? 144.830 93.201  85.954 1.00 3.91  48  M 1 \nATOM   701  N  N    . LYS M  1 50  ? 140.522 92.794  83.640 1.00 4.48  49  M 1 \nATOM   702  C  CA   . LYS M  1 50  ? 139.116 92.801  83.147 1.00 4.48  49  M 1 \nATOM   703  C  C    . LYS M  1 50  ? 138.529 94.213  83.070 1.00 4.48  49  M 1 \nATOM   704  O  O    . LYS M  1 50  ? 137.806 94.487  82.119 1.00 4.48  49  M 1 \nATOM   705  C  CB   . LYS M  1 50  ? 138.251 91.891  84.020 1.00 4.48  49  M 1 \nATOM   706  C  CG   . LYS M  1 50  ? 138.716 90.445  84.052 1.00 4.48  49  M 1 \nATOM   707  C  CD   . LYS M  1 50  ? 137.781 89.541  84.839 1.00 4.48  49  M 1 \nATOM   708  C  CE   . LYS M  1 50  ? 138.133 88.076  84.693 1.00 4.48  49  M 1 \nATOM   709  N  NZ   . LYS M  1 50  ? 136.916 87.233  84.702 1.00 4.48  49  M 1 \nATOM   710  H  H    . LYS M  1 50  ? 140.604 92.440  84.474 1.00 4.48  49  M 1 \nATOM   711  H  HA   . LYS M  1 50  ? 139.122 92.429  82.235 1.00 4.48  49  M 1 \nATOM   712  H  HB2  . LYS M  1 50  ? 138.251 92.242  84.935 1.00 4.48  49  M 1 \nATOM   713  H  HB3  . LYS M  1 50  ? 137.331 91.918  83.686 1.00 4.48  49  M 1 \nATOM   714  H  HG2  . LYS M  1 50  ? 
138.785 90.113  83.132 1.00 4.48  49  M 1 \nATOM   715  H  HG3  . LYS M  1 50  ? 139.611 90.408  84.454 1.00 4.48  49  M 1 \nATOM   716  H  HD2  . LYS M  1 50  ? 137.820 89.785  85.789 1.00 4.48  49  M 1 \nATOM   717  H  HD3  . LYS M  1 50  ? 136.861 89.680  84.528 1.00 4.48  49  M 1 \nATOM   718  H  HE2  . LYS M  1 50  ? 138.613 87.935  83.854 1.00 4.48  49  M 1 \nATOM   719  H  HE3  . LYS M  1 50  ? 138.716 87.803  85.427 1.00 4.48  49  M 1 \nATOM   720  H  HZ1  . LYS M  1 50  ? 137.138 86.370  84.536 1.00 4.48  49  M 1 \nATOM   721  H  HZ2  . LYS M  1 50  ? 136.512 87.285  85.513 1.00 4.48  49  M 1 \nATOM   722  H  HZ3  . LYS M  1 50  ? 136.338 87.519  84.064 1.00 4.48  49  M 1 \nATOM   723  N  N    . ASN M  1 51  ? 138.832 95.061  84.037 1.00 4.04  50  M 1 \nATOM   724  C  CA   . ASN M  1 51  ? 138.313 96.445  84.094 1.00 4.04  50  M 1 \nATOM   725  C  C    . ASN M  1 51  ? 138.979 97.259  82.986 1.00 4.04  50  M 1 \nATOM   726  O  O    . ASN M  1 51  ? 138.313 98.120  82.470 1.00 4.04  50  M 1 \nATOM   727  C  CB   . ASN M  1 51  ? 138.358 97.030  85.502 1.00 4.04  50  M 1 \nATOM   728  C  CG   . ASN M  1 51  ? 137.360 96.332  86.403 1.00 4.04  50  M 1 \nATOM   729  O  OD1  . ASN M  1 51  ? 136.337 95.857  85.933 1.00 4.04  50  M 1 \nATOM   730  N  ND2  . ASN M  1 51  ? 137.675 96.201  87.674 1.00 4.04  50  M 1 \nATOM   731  H  H    . ASN M  1 51  ? 139.425 94.854  84.696 1.00 4.04  50  M 1 \nATOM   732  H  HA   . ASN M  1 51  ? 137.356 96.389  83.863 1.00 4.04  50  M 1 \nATOM   733  H  HB2  . ASN M  1 51  ? 139.259 96.924  85.868 1.00 4.04  50  M 1 \nATOM   734  H  HB3  . ASN M  1 51  ? 138.149 97.986  85.462 1.00 4.04  50  M 1 \nATOM   735  H  HD21 . ASN M  1 51  ? 138.442 96.521  87.975 1.00 4.04  50  M 1 \nATOM   736  H  HD22 . ASN M  1 51  ? 137.119 95.793  88.228 1.00 4.04  50  M 1 \nATOM   737  N  N    . PHE M  1 52  ? 140.264 97.074  82.697 1.00 3.78  51  M 1 \nATOM   738  C  CA   . PHE M  1 52  ? 
140.889 97.787  81.553 1.00 3.78  51  M 1 \nATOM   739  C  C    . PHE M  1 52  ? 140.179 97.325  80.269 1.00 3.78  51  M 1 \nATOM   740  O  O    . PHE M  1 52  ? 139.787 98.165  79.473 1.00 3.78  51  M 1 \nATOM   741  C  CB   . PHE M  1 52  ? 142.386 97.523  81.457 1.00 3.78  51  M 1 \nATOM   742  C  CG   . PHE M  1 52  ? 143.231 98.417  82.334 1.00 3.78  51  M 1 \nATOM   743  C  CD1  . PHE M  1 52  ? 143.460 98.114  83.666 1.00 3.78  51  M 1 \nATOM   744  C  CD2  . PHE M  1 52  ? 143.836 99.549  81.815 1.00 3.78  51  M 1 \nATOM   745  C  CE1  . PHE M  1 52  ? 144.276 98.921  84.452 1.00 3.78  51  M 1 \nATOM   746  C  CE2  . PHE M  1 52  ? 144.649 100.353 82.597 1.00 3.78  51  M 1 \nATOM   747  C  CZ   . PHE M  1 52  ? 144.872 100.031 83.914 1.00 3.78  51  M 1 \nATOM   748  H  H    . PHE M  1 52  ? 140.864 96.663  83.243 1.00 3.78  51  M 1 \nATOM   749  H  HA   . PHE M  1 52  ? 140.741 98.761  81.665 1.00 3.78  51  M 1 \nATOM   750  H  HB2  . PHE M  1 52  ? 142.552 96.589  81.703 1.00 3.78  51  M 1 \nATOM   751  H  HB3  . PHE M  1 52  ? 142.662 97.640  80.524 1.00 3.78  51  M 1 \nATOM   752  H  HD1  . PHE M  1 52  ? 143.069 97.340  84.040 1.00 3.78  51  M 1 \nATOM   753  H  HD2  . PHE M  1 52  ? 143.705 99.767  80.906 1.00 3.78  51  M 1 \nATOM   754  H  HE1  . PHE M  1 52  ? 144.419 98.703  85.359 1.00 3.78  51  M 1 \nATOM   755  H  HE2  . PHE M  1 52  ? 145.049 101.123 82.225 1.00 3.78  51  M 1 \nATOM   756  H  HZ   . PHE M  1 52  ? 145.407 100.591 84.454 1.00 3.78  51  M 1 \nATOM   757  N  N    . ALA M  1 53  ? 139.908 96.025  80.142 1.00 3.65  52  M 1 \nATOM   758  C  CA   . ALA M  1 53  ? 139.238 95.471  78.940 1.00 3.65  52  M 1 \nATOM   759  C  C    . ALA M  1 53  ? 137.855 96.116  78.772 1.00 3.65  52  M 1 \nATOM   760  O  O    . ALA M  1 53  ? 137.594 96.572  77.712 1.00 3.65  52  M 1 \nATOM   761  C  CB   . ALA M  1 53  ? 139.126 93.973  79.054 1.00 3.65  52  M 1 \nATOM   762  H  H    . ALA M  1 53  ? 
139.978 95.422  80.819 1.00 3.65  52  M 1 \nATOM   763  H  HA   . ALA M  1 53  ? 139.784 95.690  78.148 1.00 3.65  52  M 1 \nATOM   764  H  HB1  . ALA M  1 53  ? 138.698 93.617  78.257 1.00 3.65  52  M 1 \nATOM   765  H  HB2  . ALA M  1 53  ? 140.013 93.587  79.145 1.00 3.65  52  M 1 \nATOM   766  H  HB3  . ALA M  1 53  ? 138.593 93.746  79.835 1.00 3.65  52  M 1 \nATOM   767  N  N    . LYS M  1 54  ? 137.059 96.217  79.827 1.00 4.07  53  M 1 \nATOM   768  C  CA   . LYS M  1 54  ? 135.720 96.798  79.806 1.00 4.07  53  M 1 \nATOM   769  C  C    . LYS M  1 54  ? 135.766 98.273  79.442 1.00 4.07  53  M 1 \nATOM   770  O  O    . LYS M  1 54  ? 134.953 98.751  78.641 1.00 4.07  53  M 1 \nATOM   771  C  CB   . LYS M  1 54  ? 135.038 96.601  81.160 1.00 4.07  53  M 1 \nATOM   772  C  CG   . LYS M  1 54  ? 134.600 95.184  81.418 1.00 4.07  53  M 1 \nATOM   773  C  CD   . LYS M  1 54  ? 133.912 95.041  82.759 1.00 4.07  53  M 1 \nATOM   774  C  CE   . LYS M  1 54  ? 133.444 93.611  82.976 1.00 4.07  53  M 1 \nATOM   775  N  NZ   . LYS M  1 54  ? 132.778 93.456  84.294 1.00 4.07  53  M 1 \nATOM   776  H  H    . LYS M  1 54  ? 137.302 95.910  80.593 1.00 4.07  53  M 1 \nATOM   777  H  HA   . LYS M  1 54  ? 135.183 96.335  79.144 1.00 4.07  53  M 1 \nATOM   778  H  HB2  . LYS M  1 54  ? 135.659 96.855  81.860 1.00 4.07  53  M 1 \nATOM   779  H  HB3  . LYS M  1 54  ? 134.249 97.163  81.211 1.00 4.07  53  M 1 \nATOM   780  H  HG2  . LYS M  1 54  ? 133.980 94.913  80.723 1.00 4.07  53  M 1 \nATOM   781  H  HG3  . LYS M  1 54  ? 135.371 94.596  81.413 1.00 4.07  53  M 1 \nATOM   782  H  HD2  . LYS M  1 54  ? 134.544 95.254  83.463 1.00 4.07  53  M 1 \nATOM   783  H  HD3  . LYS M  1 54  ? 133.151 95.641  82.799 1.00 4.07  53  M 1 \nATOM   784  H  HE2  . LYS M  1 54  ? 132.810 93.380  82.279 1.00 4.07  53  M 1 \nATOM   785  H  HE3  . LYS M  1 54  ? 134.202 93.006  82.939 1.00 4.07  53  M 1 \nATOM   786  H  HZ1  . LYS M  1 54  ? 
132.343 92.681  84.331 1.00 4.07  53  M 1 \nATOM   787  H  HZ2  . LYS M  1 54  ? 133.386 93.475  84.944 1.00 4.07  53  M 1 \nATOM   788  H  HZ3  . LYS M  1 54  ? 132.201 94.122  84.421 1.00 4.07  53  M 1 \nATOM   789  N  N    . TYR M  1 55  ? 136.721 99.003  80.017 1.00 3.64  54  M 1 \nATOM   790  C  CA   . TYR M  1 55  ? 136.889 100.416 79.716 1.00 3.64  54  M 1 \nATOM   791  C  C    . TYR M  1 55  ? 137.089 100.630 78.223 1.00 3.64  54  M 1 \nATOM   792  O  O    . TYR M  1 55  ? 136.367 101.408 77.587 1.00 3.64  54  M 1 \nATOM   793  C  CB   . TYR M  1 55  ? 138.079 100.968 80.500 1.00 3.64  54  M 1 \nATOM   794  C  CG   . TYR M  1 55  ? 138.327 102.435 80.293 1.00 3.64  54  M 1 \nATOM   795  C  CD1  . TYR M  1 55  ? 137.546 103.371 80.930 1.00 3.64  54  M 1 \nATOM   796  C  CD2  . TYR M  1 55  ? 139.335 102.885 79.461 1.00 3.64  54  M 1 \nATOM   797  C  CE1  . TYR M  1 55  ? 137.758 104.712 80.757 1.00 3.64  54  M 1 \nATOM   798  C  CE2  . TYR M  1 55  ? 139.557 104.229 79.278 1.00 3.64  54  M 1 \nATOM   799  C  CZ   . TYR M  1 55  ? 138.761 105.141 79.932 1.00 3.64  54  M 1 \nATOM   800  O  OH   . TYR M  1 55  ? 138.958 106.493 79.769 1.00 3.64  54  M 1 \nATOM   801  H  H    . TYR M  1 55  ? 137.298 98.689  80.572 1.00 3.64  54  M 1 \nATOM   802  H  HA   . TYR M  1 55  ? 136.094 100.896 79.997 1.00 3.64  54  M 1 \nATOM   803  H  HB2  . TYR M  1 55  ? 137.905 100.843 81.446 1.00 3.64  54  M 1 \nATOM   804  H  HB3  . TYR M  1 55  ? 138.884 100.486 80.254 1.00 3.64  54  M 1 \nATOM   805  H  HD1  . TYR M  1 55  ? 136.866 103.082 81.495 1.00 3.64  54  M 1 \nATOM   806  H  HD2  . TYR M  1 55  ? 139.873 102.270 79.017 1.00 3.64  54  M 1 \nATOM   807  H  HE1  . TYR M  1 55  ? 137.219 105.326 81.201 1.00 3.64  54  M 1 \nATOM   808  H  HE2  . TYR M  1 55  ? 140.238 104.516 78.714 1.00 3.64  54  M 1 \nATOM   809  H  HH   . TYR M  1 55  ? 139.605 106.634 79.252 1.00 3.64  54  M 1 \nATOM   810  N  N    . PHE M  1 56  ? 
138.045 99.916  77.638 1.00 3.26  55  M 1 \nATOM   811  C  CA   . PHE M  1 56  ? 138.361 100.183 76.241 1.00 3.26  55  M 1 \nATOM   812  C  C    . PHE M  1 56  ? 137.272 99.657  75.307 1.00 3.26  55  M 1 \nATOM   813  O  O    . PHE M  1 56  ? 137.034 100.239 74.247 1.00 3.26  55  M 1 \nATOM   814  C  CB   . PHE M  1 56  ? 139.732 99.626  75.871 1.00 3.26  55  M 1 \nATOM   815  C  CG   . PHE M  1 56  ? 140.876 100.339 76.545 1.00 3.26  55  M 1 \nATOM   816  C  CD1  . PHE M  1 56  ? 141.155 101.654 76.234 1.00 3.26  55  M 1 \nATOM   817  C  CD2  . PHE M  1 56  ? 141.736 99.677  77.390 1.00 3.26  55  M 1 \nATOM   818  C  CE1  . PHE M  1 56  ? 142.198 102.309 76.825 1.00 3.26  55  M 1 \nATOM   819  C  CE2  . PHE M  1 56  ? 142.796 100.338 77.966 1.00 3.26  55  M 1 \nATOM   820  C  CZ   . PHE M  1 56  ? 143.023 101.646 77.678 1.00 3.26  55  M 1 \nATOM   821  H  H    . PHE M  1 56  ? 138.498 99.287  78.010 1.00 3.26  55  M 1 \nATOM   822  H  HA   . PHE M  1 56  ? 138.401 101.145 76.120 1.00 3.26  55  M 1 \nATOM   823  H  HB2  . PHE M  1 56  ? 139.762 98.690  76.124 1.00 3.26  55  M 1 \nATOM   824  H  HB3  . PHE M  1 56  ? 139.856 99.697  74.912 1.00 3.26  55  M 1 \nATOM   825  H  HD1  . PHE M  1 56  ? 140.589 102.126 75.666 1.00 3.26  55  M 1 \nATOM   826  H  HD2  . PHE M  1 56  ? 141.590 98.782  77.595 1.00 3.26  55  M 1 \nATOM   827  H  HE1  . PHE M  1 56  ? 142.360 103.203 76.628 1.00 3.26  55  M 1 \nATOM   828  H  HE2  . PHE M  1 56  ? 143.367 99.891  78.548 1.00 3.26  55  M 1 \nATOM   829  H  HZ   . PHE M  1 56  ? 143.739 102.093 78.069 1.00 3.26  55  M 1 \nATOM   830  N  N    . LEU M  1 57  ? 136.563 98.594  75.692 1.00 3.56  56  M 1 \nATOM   831  C  CA   . LEU M  1 57  ? 135.447 98.132  74.871 1.00 3.56  56  M 1 \nATOM   832  C  C    . LEU M  1 57  ? 134.337 99.173  74.852 1.00 3.56  56  M 1 \nATOM   833  O  O    . LEU M  1 57  ? 133.737 99.449  73.801 1.00 3.56  56  M 1 \nATOM   834  C  CB   . LEU M  1 57  ? 
134.908 96.802  75.395 1.00 3.56  56  M 1 \nATOM   835  C  CG   . LEU M  1 57  ? 133.841 96.119  74.535 1.00 3.56  56  M 1 \nATOM   836  C  CD1  . LEU M  1 57  ? 134.418 95.725  73.192 1.00 3.56  56  M 1 \nATOM   837  C  CD2  . LEU M  1 57  ? 133.244 94.918  75.242 1.00 3.56  56  M 1 \nATOM   838  H  H    . LEU M  1 57  ? 136.694 98.147  76.415 1.00 3.56  56  M 1 \nATOM   839  H  HA   . LEU M  1 57  ? 135.769 97.997  73.966 1.00 3.56  56  M 1 \nATOM   840  H  HB2  . LEU M  1 57  ? 135.644 96.179  75.496 1.00 3.56  56  M 1 \nATOM   841  H  HB3  . LEU M  1 57  ? 134.506 96.958  76.264 1.00 3.56  56  M 1 \nATOM   842  H  HG   . LEU M  1 57  ? 133.119 96.743  74.361 1.00 3.56  56  M 1 \nATOM   843  H  HD11 . LEU M  1 57  ? 133.810 95.111  72.751 1.00 3.56  56  M 1 \nATOM   844  H  HD12 . LEU M  1 57  ? 134.521 96.524  72.652 1.00 3.56  56  M 1 \nATOM   845  H  HD13 . LEU M  1 57  ? 135.280 95.300  73.323 1.00 3.56  56  M 1 \nATOM   846  H  HD21 . LEU M  1 57  ? 132.555 94.538  74.675 1.00 3.56  56  M 1 \nATOM   847  H  HD22 . LEU M  1 57  ? 133.937 94.258  75.403 1.00 3.56  56  M 1 \nATOM   848  H  HD23 . LEU M  1 57  ? 132.855 95.206  76.083 1.00 3.56  56  M 1 \nATOM   849  N  N    . HIS M  1 58  ? 134.052 99.759  76.015 1.00 3.86  57  M 1 \nATOM   850  C  CA   . HIS M  1 58  ? 133.085 100.842 76.095 1.00 3.86  57  M 1 \nATOM   851  C  C    . HIS M  1 58  ? 133.498 102.006 75.206 1.00 3.86  57  M 1 \nATOM   852  O  O    . HIS M  1 58  ? 132.668 102.593 74.502 1.00 3.86  57  M 1 \nATOM   853  C  CB   . HIS M  1 58  ? 132.940 101.305 77.539 1.00 3.86  57  M 1 \nATOM   854  C  CG   . HIS M  1 58  ? 131.986 102.439 77.703 1.00 3.86  57  M 1 \nATOM   855  N  ND1  . HIS M  1 58  ? 130.619 102.276 77.663 1.00 3.86  57  M 1 \nATOM   856  C  CD2  . HIS M  1 58  ? 132.202 103.764 77.863 1.00 3.86  57  M 1 \nATOM   857  C  CE1  . HIS M  1 58  ? 130.035 103.449 77.821 1.00 3.86  57  M 1 \nATOM   858  N  NE2  . HIS M  1 58  ? 
130.974 104.369 77.942 1.00 3.86  57  M 1 \nATOM   859  H  H    . HIS M  1 58  ? 134.418 99.555  76.766 1.00 3.86  57  M 1 \nATOM   860  H  HA   . HIS M  1 58  ? 132.222 100.514 75.798 1.00 3.86  57  M 1 \nATOM   861  H  HB2  . HIS M  1 58  ? 132.604 100.567 78.072 1.00 3.86  57  M 1 \nATOM   862  H  HB3  . HIS M  1 58  ? 133.803 101.589 77.879 1.00 3.86  57  M 1 \nATOM   863  H  HD2  . HIS M  1 58  ? 133.029 104.185 77.920 1.00 3.86  57  M 1 \nATOM   864  H  HE1  . HIS M  1 58  ? 129.118 103.603 77.835 1.00 3.86  57  M 1 \nATOM   865  H  HE2  . HIS M  1 58  ? 130.840 105.212 78.049 1.00 3.86  57  M 1 \nATOM   866  N  N    . GLN M  1 59  ? 134.786 102.339 75.238 1.00 3.55  58  M 1 \nATOM   867  C  CA   . GLN M  1 59  ? 135.333 103.431 74.394 1.00 3.55  58  M 1 \nATOM   868  C  C    . GLN M  1 59  ? 135.113 103.056 72.914 1.00 3.55  58  M 1 \nATOM   869  O  O    . GLN M  1 59  ? 134.716 103.896 72.159 1.00 3.55  58  M 1 \nATOM   870  C  CB   . GLN M  1 59  ? 136.821 103.672 74.668 1.00 3.55  58  M 1 \nATOM   871  C  CG   . GLN M  1 59  ? 137.147 104.192 76.061 1.00 3.55  58  M 1 \nATOM   872  C  CD   . GLN M  1 59  ? 136.194 105.252 76.544 1.00 3.55  58  M 1 \nATOM   873  O  OE1  . GLN M  1 59  ? 135.612 105.142 77.613 1.00 3.55  58  M 1 \nATOM   874  N  NE2  . GLN M  1 59  ? 136.019 106.291 75.759 1.00 3.55  58  M 1 \nATOM   875  H  H    . GLN M  1 59  ? 135.416 101.843 75.668 1.00 3.55  58  M 1 \nATOM   876  H  HA   . GLN M  1 59  ? 134.834 104.257 74.591 1.00 3.55  58  M 1 \nATOM   877  H  HB2  . GLN M  1 59  ? 137.298 102.828 74.527 1.00 3.55  58  M 1 \nATOM   878  H  HB3  . GLN M  1 59  ? 137.153 104.314 74.006 1.00 3.55  58  M 1 \nATOM   879  H  HG2  . GLN M  1 59  ? 137.133 103.442 76.693 1.00 3.55  58  M 1 \nATOM   880  H  HG3  . GLN M  1 59  ? 138.056 104.561 76.058 1.00 3.55  58  M 1 \nATOM   881  H  HE21 . GLN M  1 59  ? 135.434 106.916 75.978 1.00 3.55  58  M 1 \nATOM   882  H  HE22 . GLN M  1 59  ? 
136.486 106.365 75.013 1.00 3.55  58  M 1 \nATOM   883  N  N    . SER M  1 60  ? 135.331 101.813 72.512 1.00 3.24  59  M 1 \nATOM   884  C  CA   . SER M  1 60  ? 135.143 101.390 71.126 1.00 3.24  59  M 1 \nATOM   885  C  C    . SER M  1 60  ? 133.699 101.592 70.690 1.00 3.24  59  M 1 \nATOM   886  O  O    . SER M  1 60  ? 133.420 102.123 69.604 1.00 3.24  59  M 1 \nATOM   887  C  CB   . SER M  1 60  ? 135.541 99.924  70.959 1.00 3.24  59  M 1 \nATOM   888  O  OG   . SER M  1 60  ? 135.301 99.505  69.637 1.00 3.24  59  M 1 \nATOM   889  H  H    . SER M  1 60  ? 135.602 101.192 73.042 1.00 3.24  59  M 1 \nATOM   890  H  HA   . SER M  1 60  ? 135.722 101.916 70.552 1.00 3.24  59  M 1 \nATOM   891  H  HB2  . SER M  1 60  ? 136.482 99.810  71.163 1.00 3.24  59  M 1 \nATOM   892  H  HB3  . SER M  1 60  ? 135.013 99.373  71.558 1.00 3.24  59  M 1 \nATOM   893  H  HG   . SER M  1 60  ? 136.017 99.537  69.199 1.00 3.24  59  M 1 \nATOM   894  N  N    . HIS M  1 61  ? 132.766 101.182 71.545 1.00 3.61  60  M 1 \nATOM   895  C  CA   . HIS M  1 61  ? 131.351 101.333 71.224 1.00 3.61  60  M 1 \nATOM   896  C  C    . HIS M  1 61  ? 130.969 102.807 71.111 1.00 3.61  60  M 1 \nATOM   897  O  O    . HIS M  1 61  ? 130.209 103.194 70.212 1.00 3.61  60  M 1 \nATOM   898  C  CB   . HIS M  1 61  ? 130.503 100.619 72.274 1.00 3.61  60  M 1 \nATOM   899  C  CG   . HIS M  1 61  ? 130.658 99.131  72.259 1.00 3.61  60  M 1 \nATOM   900  N  ND1  . HIS M  1 61  ? 130.123 98.316  73.233 1.00 3.61  60  M 1 \nATOM   901  C  CD2  . HIS M  1 61  ? 131.295 98.310  71.392 1.00 3.61  60  M 1 \nATOM   902  C  CE1  . HIS M  1 61  ? 130.422 97.058  72.962 1.00 3.61  60  M 1 \nATOM   903  N  NE2  . HIS M  1 61  ? 131.131 97.028  71.850 1.00 3.61  60  M 1 \nATOM   904  H  H    . HIS M  1 61  ? 132.932 100.839 72.316 1.00 3.61  60  M 1 \nATOM   905  H  HA   . HIS M  1 61  ? 131.177 100.924 70.362 1.00 3.61  60  M 1 \nATOM   906  H  HB2  . HIS M  1 61  ? 
130.749 100.941 73.155 1.00 3.61  60  M 1 \nATOM   907  H  HB3  . HIS M  1 61  ? 129.567 100.820 72.116 1.00 3.61  60  M 1 \nATOM   908  H  HD2  . HIS M  1 61  ? 131.758 98.559  70.625 1.00 3.61  60  M 1 \nATOM   909  H  HE1  . HIS M  1 61  ? 130.179 96.315  73.466 1.00 3.61  60  M 1 \nATOM   910  H  HE2  . HIS M  1 61  ? 131.444 96.322  71.471 1.00 3.61  60  M 1 \nATOM   911  N  N    . GLU M  1 62  ? 131.505 103.647 71.997 1.00 3.84  61  M 1 \nATOM   912  C  CA   . GLU M  1 62  ? 131.212 105.075 71.925 1.00 3.84  61  M 1 \nATOM   913  C  C    . GLU M  1 62  ? 131.729 105.689 70.628 1.00 3.84  61  M 1 \nATOM   914  O  O    . GLU M  1 62  ? 131.069 106.546 70.032 1.00 3.84  61  M 1 \nATOM   915  C  CB   . GLU M  1 62  ? 131.806 105.801 73.132 1.00 3.84  61  M 1 \nATOM   916  C  CG   . GLU M  1 62  ? 131.117 105.507 74.458 1.00 3.84  61  M 1 \nATOM   917  C  CD   . GLU M  1 62  ? 129.702 106.056 74.531 1.00 3.84  61  M 1 \nATOM   918  O  OE1  . GLU M  1 62  ? 129.434 107.105 73.910 1.00 3.84  61  M 1 \nATOM   919  O  OE2  . GLU M  1 62  ? 128.856 105.440 75.213 1.00 3.84  61  M 1 \nATOM   920  H  H    . GLU M  1 62  ? 132.043 103.424 72.630 1.00 3.84  61  M 1 \nATOM   921  H  HA   . GLU M  1 62  ? 130.249 105.187 71.946 1.00 3.84  61  M 1 \nATOM   922  H  HB2  . GLU M  1 62  ? 132.737 105.543 73.223 1.00 3.84  61  M 1 \nATOM   923  H  HB3  . GLU M  1 62  ? 131.758 106.757 72.975 1.00 3.84  61  M 1 \nATOM   924  H  HG2  . GLU M  1 62  ? 131.068 104.548 74.594 1.00 3.84  61  M 1 \nATOM   925  H  HG3  . GLU M  1 62  ? 131.631 105.913 75.173 1.00 3.84  61  M 1 \nATOM   926  N  N    . GLU M  1 63  ? 132.904 105.264 70.167 1.00 3.87  62  M 1 \nATOM   927  C  CA   . GLU M  1 63  ? 133.445 105.837 68.937 1.00 3.87  62  M 1 \nATOM   928  C  C    . GLU M  1 63  ? 132.639 105.379 67.724 1.00 3.87  62  M 1 \nATOM   929  O  O    . GLU M  1 63  ? 132.447 106.143 66.768 1.00 3.87  62  M 1 \nATOM   930  C  CB   . GLU M  1 63  ? 
134.923 105.479 68.779 1.00 3.87  62  M 1 \nATOM   931  C  CG   . GLU M  1 63  ? 135.854 106.022 69.867 1.00 3.87  62  M 1 \nATOM   932  C  CD   . GLU M  1 63  ? 135.896 107.537 69.978 1.00 3.87  62  M 1 \nATOM   933  O  OE1  . GLU M  1 63  ? 135.774 108.240 68.963 1.00 3.87  62  M 1 \nATOM   934  O  OE2  . GLU M  1 63  ? 136.035 108.032 71.115 1.00 3.87  62  M 1 \nATOM   935  H  H    . GLU M  1 63  ? 133.388 104.654 70.533 1.00 3.87  62  M 1 \nATOM   936  H  HA   . GLU M  1 63  ? 133.379 106.804 68.981 1.00 3.87  62  M 1 \nATOM   937  H  HB2  . GLU M  1 63  ? 135.006 104.513 68.804 1.00 3.87  62  M 1 \nATOM   938  H  HB3  . GLU M  1 63  ? 135.238 105.797 67.919 1.00 3.87  62  M 1 \nATOM   939  H  HG2  . GLU M  1 63  ? 135.596 105.675 70.735 1.00 3.87  62  M 1 \nATOM   940  H  HG3  . GLU M  1 63  ? 136.753 105.720 69.663 1.00 3.87  62  M 1 \nATOM   941  N  N    . ARG M  1 64  ? 132.101 104.161 67.796 1.00 3.76  63  M 1 \nATOM   942  C  CA   . ARG M  1 64  ? 131.222 103.585 66.708 1.00 3.76  63  M 1 \nATOM   943  C  C    . ARG M  1 64  ? 129.982 104.548 66.721 1.00 3.76  63  M 1 \nATOM   944  O  O    . ARG M  1 64  ? 129.586 104.978 65.656 1.00 3.76  63  M 1 \nATOM   945  C  CB   . ARG M  1 64  ? 130.958 102.003 66.808 0.50 3.76  63  M 1 \nATOM   946  C  CG   . ARG M  1 64  ? 129.868 101.512 65.865 0.50 3.76  63  M 1 \nATOM   947  C  CD   . ARG M  1 64  ? 130.261 101.575 64.397 0.50 3.76  63  M 1 \nATOM   948  N  NE   . ARG M  1 64  ? 130.583 100.261 63.843 0.50 3.76  63  M 1 \nATOM   949  C  CZ   . ARG M  1 64  ? 129.698 99.402  63.345 0.50 3.76  63  M 1 \nATOM   950  N  NH1  . ARG M  1 64  ? 130.106 98.233  62.883 0.50 3.76  63  M 1 \nATOM   951  N  NH2  . ARG M  1 64  ? 128.413 99.701  63.309 0.50 3.76  63  M 1 \nATOM   952  H  H    . ARG M  1 64  ? 132.146 103.647 68.546 1.00 3.76  63  M 1 \nATOM   953  H  HA   . ARG M  1 64  ? 131.743 103.924 65.813 1.00 3.76  63  M 1 \nATOM   954  H  HB2  . ARG M  1 64  ? 
131.792 101.531 66.603 0.50 3.76  63  M 1 \nATOM   955  H  HB3  . ARG M  1 64  ? 130.704 101.784 67.729 0.50 3.76  63  M 1 \nATOM   956  H  HG2  . ARG M  1 64  ? 129.643 100.585 66.092 0.50 3.76  63  M 1 \nATOM   957  H  HG3  . ARG M  1 64  ? 129.062 102.055 65.999 0.50 3.76  63  M 1 \nATOM   958  H  HD2  . ARG M  1 64  ? 129.523 101.967 63.883 0.50 3.76  63  M 1 \nATOM   959  H  HD3  . ARG M  1 64  ? 131.040 102.163 64.298 0.50 3.76  63  M 1 \nATOM   960  H  HE   . ARG M  1 64  ? 131.419 100.014 63.850 0.50 3.76  63  M 1 \nATOM   961  H  HH11 . ARG M  1 64  ? 130.961 98.028  62.902 0.50 3.76  63  M 1 \nATOM   962  H  HH12 . ARG M  1 64  ? 129.522 97.667  62.549 0.50 3.76  63  M 1 \nATOM   963  H  HH21 . ARG M  1 64  ? 128.135 100.477 63.619 0.50 3.76  63  M 1 \nATOM   964  H  HH22 . ARG M  1 64  ? 127.838 99.124  62.975 0.50 3.76  63  M 1 \nATOM   965  N  N    . GLU M  1 65  ? 129.447 104.893 67.887 1.00 4.14  64  M 1 \nATOM   966  C  CA   . GLU M  1 65  ? 128.292 105.783 67.961 1.00 4.14  64  M 1 \nATOM   967  C  C    . GLU M  1 65  ? 128.612 107.153 67.371 1.00 4.14  64  M 1 \nATOM   968  O  O    . GLU M  1 65  ? 127.777 107.746 66.678 1.00 4.14  64  M 1 \nATOM   969  C  CB   . GLU M  1 65  ? 127.806 105.917 69.404 1.00 4.14  64  M 1 \nATOM   970  C  CG   . GLU M  1 65  ? 127.215 104.648 70.011 1.00 4.14  64  M 1 \nATOM   971  C  CD   . GLU M  1 65  ? 126.815 104.819 71.470 1.00 4.14  64  M 1 \nATOM   972  O  OE1  . GLU M  1 65  ? 127.167 105.858 72.067 1.00 4.14  64  M 1 \nATOM   973  O  OE2  . GLU M  1 65  ? 126.168 103.907 72.026 1.00 4.14  64  M 1 \nATOM   974  H  H    . GLU M  1 65  ? 129.750 104.624 68.646 1.00 4.14  64  M 1 \nATOM   975  H  HA   . GLU M  1 65  ? 127.573 105.393 67.440 1.00 4.14  64  M 1 \nATOM   976  H  HB2  . GLU M  1 65  ? 128.554 106.187 69.959 1.00 4.14  64  M 1 \nATOM   977  H  HB3  . GLU M  1 65  ? 127.121 106.603 69.441 1.00 4.14  64  M 1 \nATOM   978  H  HG2  . GLU M  1 65  ? 
126.423 104.393 69.514 1.00 4.14  64  M 1 \nATOM   979  H  HG3  . GLU M  1 65  ? 127.878 103.941 69.968 1.00 4.14  64  M 1 \nATOM   980  N  N    . HIS M  1 66  ? 129.829 107.640 67.616 1.00 4.22  65  M 1 \nATOM   981  C  CA   . HIS M  1 66  ? 130.308 108.938 67.079 1.00 4.22  65  M 1 \nATOM   982  C  C    . HIS M  1 66  ? 130.290 108.866 65.548 1.00 4.22  65  M 1 \nATOM   983  O  O    . HIS M  1 66  ? 129.822 109.783 64.939 1.00 4.22  65  M 1 \nATOM   984  C  CB   . HIS M  1 66  ? 131.713 109.301 67.587 1.00 4.22  65  M 1 \nATOM   985  C  CG   . HIS M  1 66  ? 131.792 109.546 69.053 1.00 4.22  65  M 1 \nATOM   986  N  ND1  . HIS M  1 66  ? 133.003 109.665 69.722 1.00 4.22  65  M 1 \nATOM   987  C  CD2  . HIS M  1 66  ? 130.831 109.635 69.993 1.00 4.22  65  M 1 \nATOM   988  C  CE1  . HIS M  1 66  ? 132.776 109.838 71.000 1.00 4.22  65  M 1 \nATOM   989  N  NE2  . HIS M  1 66  ? 131.461 109.838 71.198 1.00 4.22  65  M 1 \nATOM   990  H  H    . HIS M  1 66  ? 130.452 107.215 68.128 1.00 4.22  65  M 1 \nATOM   991  H  HA   . HIS M  1 66  ? 129.676 109.640 67.364 1.00 4.22  65  M 1 \nATOM   992  H  HB2  . HIS M  1 66  ? 132.330 108.571 67.356 1.00 4.22  65  M 1 \nATOM   993  H  HB3  . HIS M  1 66  ? 132.020 110.107 67.116 1.00 4.22  65  M 1 \nATOM   994  H  HD2  . HIS M  1 66  ? 129.904 109.592 69.854 1.00 4.22  65  M 1 \nATOM   995  H  HE1  . HIS M  1 66  ? 133.434 109.962 71.662 1.00 4.22  65  M 1 \nATOM   996  H  HE2  . HIS M  1 66  ? 131.063 109.939 71.973 1.00 4.22  65  M 1 \nATOM   997  N  N    . ALA M  1 67  ? 130.747 107.775 64.950 1.00 3.84  66  M 1 \nATOM   998  C  CA   . ALA M  1 67  ? 130.771 107.598 63.501 1.00 3.84  66  M 1 \nATOM   999  C  C    . ALA M  1 67  ? 129.362 107.575 62.928 1.00 3.84  66  M 1 \nATOM   1000 O  O    . ALA M  1 67  ? 129.078 108.216 61.908 1.00 3.84  66  M 1 \nATOM   1001 C  CB   . ALA M  1 67  ? 131.504 106.307 63.143 1.00 3.84  66  M 1 \nATOM   1002 H  H    . ALA M  1 67  ? 
131.105 107.131 65.393 1.00 3.84  66  M 1 \nATOM   1003 H  HA   . ALA M  1 67  ? 131.257 108.336 63.100 1.00 3.84  66  M 1 \nATOM   1004 H  HB1  . ALA M  1 67  ? 131.443 106.159 62.186 1.00 3.84  66  M 1 \nATOM   1005 H  HB2  . ALA M  1 67  ? 132.433 106.374 63.413 1.00 3.84  66  M 1 \nATOM   1006 H  HB3  . ALA M  1 67  ? 131.087 105.565 63.608 1.00 3.84  66  M 1 \nATOM   1007 N  N    . GLU M  1 68  ? 128.465 106.843 63.583 1.00 4.02  67  M 1 \nATOM   1008 C  CA   . GLU M  1 68  ? 127.104 106.708 63.080 1.00 4.02  67  M 1 \nATOM   1009 C  C    . GLU M  1 68  ? 126.361 108.039 63.154 1.00 4.02  67  M 1 \nATOM   1010 O  O    . GLU M  1 68  ? 125.551 108.363 62.274 1.00 4.02  67  M 1 \nATOM   1011 C  CB   . GLU M  1 68  ? 126.385 105.614 63.868 1.00 4.02  67  M 1 \nATOM   1012 C  CG   . GLU M  1 68  ? 126.941 104.210 63.617 1.00 4.02  67  M 1 \nATOM   1013 C  CD   . GLU M  1 68  ? 126.280 103.138 64.473 1.00 4.02  67  M 1 \nATOM   1014 O  OE1  . GLU M  1 68  ? 125.463 103.483 65.352 1.00 4.02  67  M 1 \nATOM   1015 O  OE2  . GLU M  1 68  ? 126.596 101.946 64.273 1.00 4.02  67  M 1 \nATOM   1016 H  H    . GLU M  1 68  ? 128.615 106.433 64.324 1.00 4.02  67  M 1 \nATOM   1017 H  HA   . GLU M  1 68  ? 127.136 106.429 62.152 1.00 4.02  67  M 1 \nATOM   1018 H  HB2  . GLU M  1 68  ? 126.479 105.804 64.815 1.00 4.02  67  M 1 \nATOM   1019 H  HB3  . GLU M  1 68  ? 125.445 105.608 63.630 1.00 4.02  67  M 1 \nATOM   1020 H  HG2  . GLU M  1 68  ? 126.785 103.976 62.689 1.00 4.02  67  M 1 \nATOM   1021 H  HG3  . GLU M  1 68  ? 127.896 104.193 63.787 1.00 4.02  67  M 1 \nATOM   1022 N  N    . LYS M  1 69  ? 126.644 108.836 64.186 1.00 4.51  68  M 1 \nATOM   1023 C  CA   . LYS M  1 69  ? 126.058 110.167 64.286 1.00 4.51  68  M 1 \nATOM   1024 C  C    . LYS M  1 69  ? 126.543 111.060 63.145 1.00 4.51  68  M 1 \nATOM   1025 O  O    . LYS M  1 69  ? 125.765 111.831 62.573 1.00 4.51  68  M 1 \nATOM   1026 C  CB   . LYS M  1 69  ? 
126.392 110.761 65.656 1.00 4.51  68  M 1 \nATOM   1027 C  CG   . LYS M  1 69  ? 125.744 112.081 65.984 1.00 4.51  68  M 1 \nATOM   1028 C  CD   . LYS M  1 69  ? 126.140 112.584 67.379 1.00 4.51  68  M 1 \nATOM   1029 C  CE   . LYS M  1 69  ? 125.446 111.817 68.486 1.00 4.51  68  M 1 \nATOM   1030 N  NZ   . LYS M  1 69  ? 125.760 112.374 69.836 1.00 4.51  68  M 1 \nATOM   1031 H  H    . LYS M  1 69  ? 127.178 108.638 64.831 1.00 4.51  68  M 1 \nATOM   1032 H  HA   . LYS M  1 69  ? 125.092 110.102 64.227 1.00 4.51  68  M 1 \nATOM   1033 H  HB2  . LYS M  1 69  ? 126.106 110.132 66.337 1.00 4.51  68  M 1 \nATOM   1034 H  HB3  . LYS M  1 69  ? 127.353 110.884 65.706 1.00 4.51  68  M 1 \nATOM   1035 H  HG2  . LYS M  1 69  ? 126.054 112.738 65.342 1.00 4.51  68  M 1 \nATOM   1036 H  HG3  . LYS M  1 69  ? 124.779 111.993 65.944 1.00 4.51  68  M 1 \nATOM   1037 H  HD2  . LYS M  1 69  ? 127.097 112.483 67.503 1.00 4.51  68  M 1 \nATOM   1038 H  HD3  . LYS M  1 69  ? 125.887 113.517 67.465 1.00 4.51  68  M 1 \nATOM   1039 H  HE2  . LYS M  1 69  ? 124.487 111.865 68.351 1.00 4.51  68  M 1 \nATOM   1040 H  HE3  . LYS M  1 69  ? 125.737 110.892 68.471 1.00 4.51  68  M 1 \nATOM   1041 H  HZ1  . LYS M  1 69  ? 126.614 112.223 70.038 1.00 4.51  68  M 1 \nATOM   1042 H  HZ2  . LYS M  1 69  ? 125.615 113.252 69.847 1.00 4.51  68  M 1 \nATOM   1043 H  HZ3  . LYS M  1 69  ? 125.247 111.989 70.453 1.00 4.51  68  M 1 \nATOM   1044 N  N    . LEU M  1 70  ? 127.821 110.946 62.778 1.00 4.14  69  M 1 \nATOM   1045 C  CA   . LEU M  1 70  ? 128.312 111.688 61.615 1.00 4.14  69  M 1 \nATOM   1046 C  C    . LEU M  1 70  ? 127.628 111.240 60.328 1.00 4.14  69  M 1 \nATOM   1047 O  O    . LEU M  1 70  ? 127.352 112.060 59.446 1.00 4.14  69  M 1 \nATOM   1048 C  CB   . LEU M  1 70  ? 129.824 111.540 61.473 1.00 4.14  69  M 1 \nATOM   1049 C  CG   . LEU M  1 70  ? 130.714 112.224 62.508 1.00 4.14  69  M 1 \nATOM   1050 C  CD1  . LEU M  1 70  ? 
132.178 111.871 62.320 1.00 4.14  69  M 1 \nATOM   1051 C  CD2  . LEU M  1 70  ? 130.530 113.726 62.481 1.00 4.14  69  M 1 \nATOM   1052 H  H    . LEU M  1 70  ? 128.408 110.456 63.170 1.00 4.14  69  M 1 \nATOM   1053 H  HA   . LEU M  1 70  ? 128.095 112.626 61.732 1.00 4.14  69  M 1 \nATOM   1054 H  HB2  . LEU M  1 70  ? 130.029 110.592 61.501 1.00 4.14  69  M 1 \nATOM   1055 H  HB3  . LEU M  1 70  ? 130.074 111.883 60.601 1.00 4.14  69  M 1 \nATOM   1056 H  HG   . LEU M  1 70  ? 130.458 111.911 63.390 1.00 4.14  69  M 1 \nATOM   1057 H  HD11 . LEU M  1 70  ? 132.659 112.176 63.105 1.00 4.14  69  M 1 \nATOM   1058 H  HD12 . LEU M  1 70  ? 132.281 110.911 62.229 1.00 4.14  69  M 1 \nATOM   1059 H  HD13 . LEU M  1 70  ? 132.517 112.314 61.527 1.00 4.14  69  M 1 \nATOM   1060 H  HD21 . LEU M  1 70  ? 131.231 114.137 63.010 1.00 4.14  69  M 1 \nATOM   1061 H  HD22 . LEU M  1 70  ? 130.577 114.045 61.566 1.00 4.14  69  M 1 \nATOM   1062 H  HD23 . LEU M  1 70  ? 129.667 113.945 62.865 1.00 4.14  69  M 1 \nATOM   1063 N  N    . MET M  1 71  ? 127.364 109.948 60.208 1.00 4.44  70  M 1 \nATOM   1064 C  CA   . MET M  1 71  ? 126.697 109.405 59.001 1.00 4.44  70  M 1 \nATOM   1065 C  C    . MET M  1 71  ? 125.291 110.001 58.920 1.00 4.44  70  M 1 \nATOM   1066 O  O    . MET M  1 71  ? 124.905 110.440 57.849 1.00 4.44  70  M 1 \nATOM   1067 C  CB   . MET M  1 71  ? 126.674 107.880 59.051 1.00 4.44  70  M 1 \nATOM   1068 C  CG   . MET M  1 71  ? 128.068 107.310 58.992 1.00 4.44  70  M 1 \nATOM   1069 S  SD   . MET M  1 71  ? 128.013 105.515 59.092 1.00 4.44  70  M 1 \nATOM   1070 C  CE   . MET M  1 71  ? 129.764 105.161 59.006 1.00 4.44  70  M 1 \nATOM   1071 H  H    . MET M  1 71  ? 127.457 109.354 60.890 1.00 4.44  70  M 1 \nATOM   1072 H  HA   . MET M  1 71  ? 127.206 109.698 58.210 1.00 4.44  70  M 1 \nATOM   1073 H  HB2  . MET M  1 71  ? 126.238 107.593 59.878 1.00 4.44  70  M 1 \nATOM   1074 H  HB3  . MET M  1 71  ? 
126.151 107.542 58.297 1.00 4.44  70  M 1 \nATOM   1075 H  HG2  . MET M  1 71  ? 128.499 107.576 58.152 1.00 4.44  70  M 1 \nATOM   1076 H  HG3  . MET M  1 71  ? 128.600 107.661 59.738 1.00 4.44  70  M 1 \nATOM   1077 H  HE1  . MET M  1 71  ? 129.900 104.207 59.039 1.00 4.44  70  M 1 \nATOM   1078 H  HE2  . MET M  1 71  ? 130.121 105.509 58.180 1.00 4.44  70  M 1 \nATOM   1079 H  HE3  . MET M  1 71  ? 130.213 105.578 59.752 1.00 4.44  70  M 1 \nATOM   1080 N  N    . LYS M  1 72  ? 124.578 110.039 60.037 1.00 5.09  71  M 1 \nATOM   1081 C  CA   . LYS M  1 72  ? 123.268 110.672 60.109 1.00 5.09  71  M 1 \nATOM   1082 C  C    . LYS M  1 72  ? 123.349 112.134 59.697 1.00 5.09  71  M 1 \nATOM   1083 O  O    . LYS M  1 72  ? 122.508 112.617 58.933 1.00 5.09  71  M 1 \nATOM   1084 C  CB   . LYS M  1 72  ? 122.703 110.527 61.522 1.00 5.09  71  M 1 \nATOM   1085 C  CG   . LYS M  1 72  ? 121.325 111.109 61.739 1.00 5.09  71  M 1 \nATOM   1086 C  CD   . LYS M  1 72  ? 120.796 110.746 63.129 1.00 5.09  71  M 1 \nATOM   1087 C  CE   . LYS M  1 72  ? 119.462 111.406 63.437 1.00 5.09  71  M 1 \nATOM   1088 N  NZ   . LYS M  1 72  ? 118.368 110.935 62.544 1.00 5.09  71  M 1 \nATOM   1089 H  H    . LYS M  1 72  ? 124.846 109.694 60.777 1.00 5.09  71  M 1 \nATOM   1090 H  HA   . LYS M  1 72  ? 122.666 110.214 59.501 1.00 5.09  71  M 1 \nATOM   1091 H  HB2  . LYS M  1 72  ? 122.640 109.582 61.732 1.00 5.09  71  M 1 \nATOM   1092 H  HB3  . LYS M  1 72  ? 123.310 110.959 62.144 1.00 5.09  71  M 1 \nATOM   1093 H  HG2  . LYS M  1 72  ? 121.371 112.076 61.677 1.00 5.09  71  M 1 \nATOM   1094 H  HG3  . LYS M  1 72  ? 120.720 110.757 61.068 1.00 5.09  71  M 1 \nATOM   1095 H  HD2  . LYS M  1 72  ? 120.682 109.785 63.191 1.00 5.09  71  M 1 \nATOM   1096 H  HD3  . LYS M  1 72  ? 121.431 111.046 63.798 1.00 5.09  71  M 1 \nATOM   1097 H  HE2  . LYS M  1 72  ? 119.208 111.187 64.347 1.00 5.09  71  M 1 \nATOM   1098 H  HE3  . LYS M  1 72  ? 
119.546 112.368 63.342 1.00 5.09  71  M 1 \nATOM   1099 H  HZ1  . LYS M  1 72  ? 117.580 111.187 62.871 1.00 5.09  71  M 1 \nATOM   1100 H  HZ2  . LYS M  1 72  ? 118.464 111.284 61.731 1.00 5.09  71  M 1 \nATOM   1101 H  HZ3  . LYS M  1 72  ? 118.388 110.047 62.481 1.00 5.09  71  M 1 \nATOM   1102 N  N    . LEU M  1 73  ? 124.372 112.846 60.176 1.00 4.70  72  M 1 \nATOM   1103 C  CA   . LEU M  1 73  ? 124.575 114.232 59.765 1.00 4.70  72  M 1 \nATOM   1104 C  C    . LEU M  1 73  ? 124.735 114.343 58.257 1.00 4.70  72  M 1 \nATOM   1105 O  O    . LEU M  1 73  ? 124.121 115.210 57.626 1.00 4.70  72  M 1 \nATOM   1106 C  CB   . LEU M  1 73  ? 125.792 114.820 60.486 1.00 4.70  72  M 1 \nATOM   1107 C  CG   . LEU M  1 73  ? 126.197 116.293 60.314 1.00 4.70  72  M 1 \nATOM   1108 C  CD1  . LEU M  1 73  ? 126.895 116.563 58.993 1.00 4.70  72  M 1 \nATOM   1109 C  CD2  . LEU M  1 73  ? 125.020 117.220 60.465 1.00 4.70  72  M 1 \nATOM   1110 H  H    . LEU M  1 73  ? 124.966 112.543 60.719 1.00 4.70  72  M 1 \nATOM   1111 H  HA   . LEU M  1 73  ? 123.795 114.747 60.024 1.00 4.70  72  M 1 \nATOM   1112 H  HB2  . LEU M  1 73  ? 125.621 114.717 61.435 1.00 4.70  72  M 1 \nATOM   1113 H  HB3  . LEU M  1 73  ? 126.570 114.287 60.259 1.00 4.70  72  M 1 \nATOM   1114 H  HG   . LEU M  1 73  ? 126.833 116.516 61.011 1.00 4.70  72  M 1 \nATOM   1115 H  HD11 . LEU M  1 73  ? 127.419 117.376 59.068 1.00 4.70  72  M 1 \nATOM   1116 H  HD12 . LEU M  1 73  ? 127.480 115.818 58.782 1.00 4.70  72  M 1 \nATOM   1117 H  HD13 . LEU M  1 73  ? 126.229 116.668 58.295 1.00 4.70  72  M 1 \nATOM   1118 H  HD21 . LEU M  1 73  ? 125.345 118.132 60.408 1.00 4.70  72  M 1 \nATOM   1119 H  HD22 . LEU M  1 73  ? 124.387 117.048 59.750 1.00 4.70  72  M 1 \nATOM   1120 H  HD23 . LEU M  1 73  ? 124.600 117.070 61.327 1.00 4.70  72  M 1 \nATOM   1121 N  N    . GLN M  1 74  ? 125.569 113.483 57.671 1.00 4.76  73  M 1 \nATOM   1122 C  CA   . GLN M  1 74  ? 
125.839 113.540 56.238 1.00 4.76  73  M 1 \nATOM   1123 C  C    . GLN M  1 74  ? 124.544 113.406 55.449 1.00 4.76  73  M 1 \nATOM   1124 O  O    . GLN M  1 74  ? 124.287 114.173 54.515 1.00 4.76  73  M 1 \nATOM   1125 C  CB   . GLN M  1 74  ? 126.819 112.433 55.835 1.00 4.76  73  M 1 \nATOM   1126 C  CG   . GLN M  1 74  ? 127.295 112.530 54.401 1.00 4.76  73  M 1 \nATOM   1127 C  CD   . GLN M  1 74  ? 128.249 113.676 54.194 1.00 4.76  73  M 1 \nATOM   1128 O  OE1  . GLN M  1 74  ? 127.849 114.775 53.838 1.00 4.76  73  M 1 \nATOM   1129 N  NE2  . GLN M  1 74  ? 129.532 113.391 54.310 1.00 4.76  73  M 1 \nATOM   1130 H  H    . GLN M  1 74  ? 125.987 112.851 58.078 1.00 4.76  73  M 1 \nATOM   1131 H  HA   . GLN M  1 74  ? 126.241 114.394 56.014 1.00 4.76  73  M 1 \nATOM   1132 H  HB2  . GLN M  1 74  ? 127.609 112.511 56.392 1.00 4.76  73  M 1 \nATOM   1133 H  HB3  . GLN M  1 74  ? 126.415 111.560 55.961 1.00 4.76  73  M 1 \nATOM   1134 H  HG2  . GLN M  1 74  ? 127.762 111.711 54.171 1.00 4.76  73  M 1 \nATOM   1135 H  HG3  . GLN M  1 74  ? 126.548 112.649 53.793 1.00 4.76  73  M 1 \nATOM   1136 H  HE21 . GLN M  1 74  ? 129.777 112.597 54.532 1.00 4.76  73  M 1 \nATOM   1137 H  HE22 . GLN M  1 74  ? 130.123 114.002 54.182 1.00 4.76  73  M 1 \nATOM   1138 N  N    . ASN M  1 75  ? 123.737 112.412 55.802 1.00 4.47  74  M 1 \nATOM   1139 C  CA   . ASN M  1 75  ? 122.429 112.141 55.138 1.00 4.47  74  M 1 \nATOM   1140 C  C    . ASN M  1 75  ? 121.453 113.301 55.386 1.00 4.47  74  M 1 \nATOM   1141 O  O    . ASN M  1 75  ? 120.756 113.695 54.470 1.00 4.47  74  M 1 \nATOM   1142 C  CB   . ASN M  1 75  ? 121.854 110.804 55.586 1.00 4.47  74  M 1 \nATOM   1143 C  CG   . ASN M  1 75  ? 122.406 109.660 54.764 1.00 4.47  74  M 1 \nATOM   1144 O  OD1  . ASN M  1 75  ? 122.981 109.885 53.713 1.00 4.47  74  M 1 \nATOM   1145 N  ND2  . ASN M  1 75  ? 122.233 108.443 55.235 1.00 4.47  74  M 1 \nATOM   1146 H  H    . ASN M  1 75  ? 
123.885 111.904 56.543 1.00 4.47  74  M 1 \nATOM   1147 H  HA   . ASN M  1 75  ? 122.592 112.080 54.168 1.00 4.47  74  M 1 \nATOM   1148 H  HB2  . ASN M  1 75  ? 122.072 110.660 56.529 1.00 4.47  74  M 1 \nATOM   1149 H  HB3  . ASN M  1 75  ? 120.879 110.827 55.495 1.00 4.47  74  M 1 \nATOM   1150 H  HD21 . ASN M  1 75  ? 121.801 108.321 55.996 1.00 4.47  74  M 1 \nATOM   1151 H  HD22 . ASN M  1 75  ? 122.549 107.747 54.790 1.00 4.47  74  M 1 \nATOM   1152 N  N    . GLN M  1 76  ? 121.463 113.847 56.588 1.00 5.04  75  M 1 \nATOM   1153 C  CA   . GLN M  1 76  ? 120.581 114.983 56.952 1.00 5.04  75  M 1 \nATOM   1154 C  C    . GLN M  1 76  ? 120.881 116.181 56.044 1.00 5.04  75  M 1 \nATOM   1155 O  O    . GLN M  1 76  ? 119.961 116.839 55.678 1.00 5.04  75  M 1 \nATOM   1156 C  CB   . GLN M  1 76  ? 120.835 115.462 58.374 1.00 5.04  75  M 1 \nATOM   1157 C  CG   . GLN M  1 76  ? 119.945 114.854 59.435 1.00 5.04  75  M 1 \nATOM   1158 C  CD   . GLN M  1 76  ? 119.808 115.830 60.585 1.00 5.04  75  M 1 \nATOM   1159 O  OE1  . GLN M  1 76  ? 118.777 115.913 61.234 1.00 5.04  75  M 1 \nATOM   1160 N  NE2  . GLN M  1 76  ? 120.836 116.632 60.800 1.00 5.04  75  M 1 \nATOM   1161 H  H    . GLN M  1 76  ? 122.100 113.657 57.209 1.00 5.04  75  M 1 \nATOM   1162 H  HA   . GLN M  1 76  ? 119.639 114.714 56.850 1.00 5.04  75  M 1 \nATOM   1163 H  HB2  . GLN M  1 76  ? 121.769 115.267 58.599 1.00 5.04  75  M 1 \nATOM   1164 H  HB3  . GLN M  1 76  ? 120.725 116.436 58.392 1.00 5.04  75  M 1 \nATOM   1165 H  HG2  . GLN M  1 76  ? 119.060 114.661 59.057 1.00 5.04  75  M 1 \nATOM   1166 H  HG3  . GLN M  1 76  ? 120.336 114.015 59.757 1.00 5.04  75  M 1 \nATOM   1167 H  HE21 . GLN M  1 76  ? 121.177 117.105 60.136 1.00 5.04  75  M 1 \nATOM   1168 H  HE22 . GLN M  1 76  ? 121.175 116.708 61.613 1.00 5.04  75  M 1 \nATOM   1169 N  N    . ARG M  1 77  ? 122.137 116.447 55.723 1.00 5.21  76  M 1 \nATOM   1170 C  CA   . ARG M  1 77  ? 
122.556 117.638 54.929 1.00 5.21  76  M 1 \nATOM   1171 C  C    . ARG M  1 77  ? 122.537 117.372 53.405 1.00 5.21  76  M 1 \nATOM   1172 O  O    . ARG M  1 77  ? 122.838 118.277 52.658 1.00 5.21  76  M 1 \nATOM   1173 C  CB   . ARG M  1 77  ? 123.908 118.130 55.452 1.00 5.21  76  M 1 \nATOM   1174 C  CG   . ARG M  1 77  ? 123.873 118.631 56.893 1.00 5.21  76  M 1 \nATOM   1175 C  CD   . ARG M  1 77  ? 122.925 119.810 57.098 1.00 5.21  76  M 1 \nATOM   1176 N  NE   . ARG M  1 77  ? 123.250 120.925 56.224 1.00 5.21  76  M 1 \nATOM   1177 C  CZ   . ARG M  1 77  ? 124.148 121.866 56.492 1.00 5.21  76  M 1 \nATOM   1178 N  NH1  . ARG M  1 77  ? 124.811 121.845 57.631 1.00 5.21  76  M 1 \nATOM   1179 N  NH2  . ARG M  1 77  ? 124.387 122.830 55.625 1.00 5.21  76  M 1 \nATOM   1180 H  H    . ARG M  1 77  ? 122.822 115.881 55.924 1.00 5.21  76  M 1 \nATOM   1181 H  HA   . ARG M  1 77  ? 121.896 118.347 55.108 1.00 5.21  76  M 1 \nATOM   1182 H  HB2  . ARG M  1 77  ? 124.554 117.395 55.388 1.00 5.21  76  M 1 \nATOM   1183 H  HB3  . ARG M  1 77  ? 124.221 118.856 54.873 1.00 5.21  76  M 1 \nATOM   1184 H  HG2  . ARG M  1 77  ? 123.594 117.896 57.481 1.00 5.21  76  M 1 \nATOM   1185 H  HG3  . ARG M  1 77  ? 124.776 118.902 57.161 1.00 5.21  76  M 1 \nATOM   1186 H  HD2  . ARG M  1 77  ? 122.005 119.519 56.922 1.00 5.21  76  M 1 \nATOM   1187 H  HD3  . ARG M  1 77  ? 122.974 120.106 58.032 1.00 5.21  76  M 1 \nATOM   1188 H  HE   . ARG M  1 77  ? 122.839 120.970 55.456 1.00 5.21  76  M 1 \nATOM   1189 H  HH11 . ARG M  1 77  ? 124.661 121.204 58.213 1.00 5.21  76  M 1 \nATOM   1190 H  HH12 . ARG M  1 77  ? 125.402 122.472 57.804 1.00 5.21  76  M 1 \nATOM   1191 H  HH21 . ARG M  1 77  ? 123.947 122.853 54.863 1.00 5.21  76  M 1 \nATOM   1192 H  HH22 . ARG M  1 77  ? 124.980 123.453 55.815 1.00 5.21  76  M 1 \nATOM   1193 N  N    . GLY M  1 78  ? 122.159 116.191 52.933 1.00 5.50  77  M 1 \nATOM   1194 C  CA   . GLY M  1 78  ? 
122.140 115.887 51.522 1.00 5.50  77  M 1 \nATOM   1195 C  C    . GLY M  1 78  ? 123.459 115.443 50.939 1.00 5.50  77  M 1 \nATOM   1196 O  O    . GLY M  1 78  ? 123.541 115.249 49.723 1.00 5.50  77  M 1 \nATOM   1197 H  H    . GLY M  1 78  ? 121.916 115.531 53.428 1.00 5.50  77  M 1 \nATOM   1198 H  HA2  . GLY M  1 78  ? 121.495 115.178 51.372 1.00 5.50  77  M 1 \nATOM   1199 H  HA3  . GLY M  1 78  ? 121.836 116.659 51.020 1.00 5.50  77  M 1 \nATOM   1200 N  N    . GLY M  1 79  ? 124.495 115.290 51.756 1.00 5.18  78  M 1 \nATOM   1201 C  CA   . GLY M  1 79  ? 125.727 114.712 51.279 1.00 5.18  78  M 1 \nATOM   1202 C  C    . GLY M  1 79  ? 125.645 113.205 51.198 1.00 5.18  78  M 1 \nATOM   1203 O  O    . GLY M  1 79  ? 124.682 112.590 51.648 1.00 5.18  78  M 1 \nATOM   1204 H  H    . GLY M  1 79  ? 124.512 115.509 52.587 1.00 5.18  78  M 1 \nATOM   1205 H  HA2  . GLY M  1 79  ? 125.940 115.050 50.395 1.00 5.18  78  M 1 \nATOM   1206 H  HA3  . GLY M  1 79  ? 126.453 114.957 51.874 1.00 5.18  78  M 1 \nATOM   1207 N  N    . ARG M  1 80  ? 126.638 112.620 50.533 1.00 5.31  79  M 1 \nATOM   1208 C  CA   . ARG M  1 80  ? 126.688 111.162 50.279 1.00 5.31  79  M 1 \nATOM   1209 C  C    . ARG M  1 80  ? 127.898 110.553 51.001 1.00 5.31  79  M 1 \nATOM   1210 O  O    . ARG M  1 80  ? 129.032 110.956 50.759 1.00 5.31  79  M 1 \nATOM   1211 C  CB   . ARG M  1 80  ? 126.670 110.918 48.767 1.00 5.31  79  M 1 \nATOM   1212 C  CG   . ARG M  1 80  ? 125.405 111.442 48.090 1.00 5.31  79  M 1 \nATOM   1213 C  CD   . ARG M  1 80  ? 124.176 110.697 48.584 1.00 5.31  79  M 1 \nATOM   1214 N  NE   . ARG M  1 80  ? 122.876 111.198 48.135 1.00 5.31  79  M 1 \nATOM   1215 C  CZ   . ARG M  1 80  ? 121.961 111.743 48.932 1.00 5.31  79  M 1 \nATOM   1216 N  NH1  . ARG M  1 80  ? 122.198 111.880 50.220 1.00 5.31  79  M 1 \nATOM   1217 N  NH2  . ARG M  1 80  ? 120.804 112.149 48.440 1.00 5.31  79  M 1 \nATOM   1218 H  H    . ARG M  1 80  ? 
127.344 113.082 50.191 1.00 5.31  79  M 1 \nATOM   1219 H  HA   . ARG M  1 80  ? 125.874 110.763 50.663 1.00 5.31  79  M 1 \nATOM   1220 H  HB2  . ARG M  1 80  ? 127.450 111.355 48.367 1.00 5.31  79  M 1 \nATOM   1221 H  HB3  . ARG M  1 80  ? 126.744 109.954 48.602 1.00 5.31  79  M 1 \nATOM   1222 H  HG2  . ARG M  1 80  ? 125.303 112.399 48.282 1.00 5.31  79  M 1 \nATOM   1223 H  HG3  . ARG M  1 80  ? 125.482 111.330 47.118 1.00 5.31  79  M 1 \nATOM   1224 H  HD2  . ARG M  1 80  ? 124.254 109.759 48.308 1.00 5.31  79  M 1 \nATOM   1225 H  HD3  . ARG M  1 80  ? 124.185 110.708 49.565 1.00 5.31  79  M 1 \nATOM   1226 H  HE   . ARG M  1 80  ? 122.678 111.115 47.290 1.00 5.31  79  M 1 \nATOM   1227 H  HH11 . ARG M  1 80  ? 122.964 111.608 50.556 1.00 5.31  79  M 1 \nATOM   1228 H  HH12 . ARG M  1 80  ? 121.590 112.243 50.741 1.00 5.31  79  M 1 \nATOM   1229 H  HH21 . ARG M  1 80  ? 120.638 112.062 47.579 1.00 5.31  79  M 1 \nATOM   1230 H  HH22 . ARG M  1 80  ? 120.205 112.515 48.973 1.00 5.31  79  M 1 \nATOM   1231 N  N    . ILE M  1 81  ? 127.627 109.572 51.839 1.00 4.71  80  M 1 \nATOM   1232 C  CA   . ILE M  1 81  ? 128.644 108.852 52.587 1.00 4.71  80  M 1 \nATOM   1233 C  C    . ILE M  1 81  ? 129.483 108.029 51.621 1.00 4.71  80  M 1 \nATOM   1234 O  O    . ILE M  1 81  ? 128.948 107.277 50.797 1.00 4.71  80  M 1 \nATOM   1235 C  CB   . ILE M  1 81  ? 127.982 107.961 53.650 1.00 4.71  80  M 1 \nATOM   1236 C  CG1  . ILE M  1 81  ? 127.205 108.806 54.675 1.00 4.71  80  M 1 \nATOM   1237 C  CG2  . ILE M  1 81  ? 129.034 107.088 54.347 1.00 4.71  80  M 1 \nATOM   1238 C  CD1  . ILE M  1 81  ? 126.224 108.031 55.531 1.00 4.71  80  M 1 \nATOM   1239 H  H    . ILE M  1 81  ? 126.825 109.314 52.012 1.00 4.71  80  M 1 \nATOM   1240 H  HA   . ILE M  1 81  ? 129.217 109.490 53.040 1.00 4.71  80  M 1 \nATOM   1241 H  HB   . ILE M  1 81  ? 127.353 107.381 53.193 1.00 4.71  80  M 1 \nATOM   1242 H  HG12 . ILE M  1 81  ? 
127.845 109.217 55.277 1.00 4.71  80  M 1 \nATOM   1243 H  HG13 . ILE M  1 81  ? 126.688 109.497 54.232 1.00 4.71  80  M 1 \nATOM   1244 H  HG21 . ILE M  1 81  ? 128.684 106.748 55.185 1.00 4.71  80  M 1 \nATOM   1245 H  HG22 . ILE M  1 81  ? 129.264 106.336 53.780 1.00 4.71  80  M 1 \nATOM   1246 H  HG23 . ILE M  1 81  ? 129.820 107.628 54.525 1.00 4.71  80  M 1 \nATOM   1247 H  HD11 . ILE M  1 81  ? 125.755 108.653 56.109 1.00 4.71  80  M 1 \nATOM   1248 H  HD12 . ILE M  1 81  ? 125.587 107.584 54.952 1.00 4.71  80  M 1 \nATOM   1249 H  HD13 . ILE M  1 81  ? 126.695 107.375 56.068 1.00 4.71  80  M 1 \nATOM   1250 N  N    . PHE M  1 82  ? 130.802 108.170 51.715 1.00 5.36  81  M 1 \nATOM   1251 C  CA   . PHE M  1 82  ? 131.748 107.327 50.988 1.00 5.36  81  M 1 \nATOM   1252 C  C    . PHE M  1 82  ? 132.688 106.692 51.999 1.00 5.36  81  M 1 \nATOM   1253 O  O    . PHE M  1 82  ? 133.540 107.371 52.577 1.00 5.36  81  M 1 \nATOM   1254 C  CB   . PHE M  1 82  ? 132.521 108.111 49.933 1.00 5.36  81  M 1 \nATOM   1255 C  CG   . PHE M  1 82  ? 131.690 108.495 48.747 1.00 5.36  81  M 1 \nATOM   1256 C  CD1  . PHE M  1 82  ? 131.427 107.575 47.748 1.00 5.36  81  M 1 \nATOM   1257 C  CD2  . PHE M  1 82  ? 131.162 109.762 48.634 1.00 5.36  81  M 1 \nATOM   1258 C  CE1  . PHE M  1 82  ? 130.659 107.920 46.658 1.00 5.36  81  M 1 \nATOM   1259 C  CE2  . PHE M  1 82  ? 130.395 110.107 47.545 1.00 5.36  81  M 1 \nATOM   1260 C  CZ   . PHE M  1 82  ? 130.144 109.187 46.560 1.00 5.36  81  M 1 \nATOM   1261 H  H    . PHE M  1 82  ? 131.185 108.757 52.213 1.00 5.36  81  M 1 \nATOM   1262 H  HA   . PHE M  1 82  ? 131.278 106.615 50.526 1.00 5.36  81  M 1 \nATOM   1263 H  HB2  . PHE M  1 82  ? 132.867 108.921 50.338 1.00 5.36  81  M 1 \nATOM   1264 H  HB3  . PHE M  1 82  ? 133.258 107.563 49.620 1.00 5.36  81  M 1 \nATOM   1265 H  HD1  . PHE M  1 82  ? 131.775 106.715 47.806 1.00 5.36  81  M 1 \nATOM   1266 H  HD2  . PHE M  1 82  ? 
131.328 110.393 49.297 1.00 5.36  81  M 1 \nATOM   1267 H  HE1  . PHE M  1 82  ? 130.491 107.296 45.990 1.00 5.36  81  M 1 \nATOM   1268 H  HE2  . PHE M  1 82  ? 130.045 110.966 47.479 1.00 5.36  81  M 1 \nATOM   1269 H  HZ   . PHE M  1 82  ? 129.627 109.423 45.824 1.00 5.36  81  M 1 \nATOM   1270 N  N    . LEU M  1 83  ? 132.516 105.396 52.207 1.00 4.68  82  M 1 \nATOM   1271 C  CA   . LEU M  1 83  ? 133.289 104.642 53.174 1.00 4.68  82  M 1 \nATOM   1272 C  C    . LEU M  1 83  ? 134.622 104.239 52.562 1.00 4.68  82  M 1 \nATOM   1273 O  O    . LEU M  1 83  ? 134.746 104.069 51.348 1.00 4.68  82  M 1 \nATOM   1274 C  CB   . LEU M  1 83  ? 132.521 103.401 53.623 1.00 4.68  82  M 1 \nATOM   1275 C  CG   . LEU M  1 83  ? 131.190 103.642 54.335 1.00 4.68  82  M 1 \nATOM   1276 C  CD1  . LEU M  1 83  ? 130.481 102.327 54.590 1.00 4.68  82  M 1 \nATOM   1277 C  CD2  . LEU M  1 83  ? 131.353 104.418 55.627 1.00 4.68  82  M 1 \nATOM   1278 H  H    . LEU M  1 83  ? 131.943 104.919 51.778 1.00 4.68  82  M 1 \nATOM   1279 H  HA   . LEU M  1 83  ? 133.461 105.184 53.960 1.00 4.68  82  M 1 \nATOM   1280 H  HB2  . LEU M  1 83  ? 132.339 102.858 52.840 1.00 4.68  82  M 1 \nATOM   1281 H  HB3  . LEU M  1 83  ? 133.082 102.899 54.235 1.00 4.68  82  M 1 \nATOM   1282 H  HG   . LEU M  1 83  ? 130.625 104.170 53.750 1.00 4.68  82  M 1 \nATOM   1283 H  HD11 . LEU M  1 83  ? 129.639 102.499 55.040 1.00 4.68  82  M 1 \nATOM   1284 H  HD12 . LEU M  1 83  ? 130.314 101.894 53.738 1.00 4.68  82  M 1 \nATOM   1285 H  HD13 . LEU M  1 83  ? 131.041 101.763 55.146 1.00 4.68  82  M 1 \nATOM   1286 H  HD21 . LEU M  1 83  ? 130.496 104.434 56.082 1.00 4.68  82  M 1 \nATOM   1287 H  HD22 . LEU M  1 83  ? 132.017 103.986 56.187 1.00 4.68  82  M 1 \nATOM   1288 H  HD23 . LEU M  1 83  ? 131.630 105.324 55.420 1.00 4.68  82  M 1 \nATOM   1289 N  N    . GLN M  1 84  ? 135.620 104.103 53.420 1.00 4.98  83  M 1 \nATOM   1290 C  CA   . GLN M  1 84  ? 
136.983 103.695 53.032 1.00 4.98  83  M 1 \nATOM   1291 C  C    . GLN M  1 84  ? 137.424 102.574 53.977 1.00 4.98  83  M 1 \nATOM   1292 O  O    . GLN M  1 84  ? 136.776 102.330 54.991 1.00 4.98  83  M 1 \nATOM   1293 C  CB   . GLN M  1 84  ? 137.940 104.889 53.070 1.00 4.98  83  M 1 \nATOM   1294 C  CG   . GLN M  1 84  ? 137.481 106.057 52.206 1.00 4.98  83  M 1 \nATOM   1295 C  CD   . GLN M  1 84  ? 137.435 105.714 50.736 1.00 4.98  83  M 1 \nATOM   1296 O  OE1  . GLN M  1 84  ? 136.691 106.307 49.957 1.00 4.98  83  M 1 \nATOM   1297 N  NE2  . GLN M  1 84  ? 138.254 104.763 50.333 1.00 4.98  83  M 1 \nATOM   1298 H  H    . GLN M  1 84  ? 135.530 104.287 54.308 1.00 4.98  83  M 1 \nATOM   1299 H  HA   . GLN M  1 84  ? 136.952 103.340 52.113 1.00 4.98  83  M 1 \nATOM   1300 H  HB2  . GLN M  1 84  ? 138.027 105.190 53.998 1.00 4.98  83  M 1 \nATOM   1301 H  HB3  . GLN M  1 84  ? 138.823 104.592 52.766 1.00 4.98  83  M 1 \nATOM   1302 H  HG2  . GLN M  1 84  ? 136.587 106.339 52.496 1.00 4.98  83  M 1 \nATOM   1303 H  HG3  . GLN M  1 84  ? 138.091 106.814 52.338 1.00 4.98  83  M 1 \nATOM   1304 H  HE21 . GLN M  1 84  ? 138.896 104.475 50.869 1.00 4.98  83  M 1 \nATOM   1305 H  HE22 . GLN M  1 84  ? 138.164 104.414 49.526 1.00 4.98  83  M 1 \nATOM   1306 N  N    . ASP M  1 85  ? 138.495 101.908 53.612 1.00 4.69  84  M 1 \nATOM   1307 C  CA   . ASP M  1 85  ? 139.059 100.852 54.433 1.00 4.69  84  M 1 \nATOM   1308 C  C    . ASP M  1 85  ? 139.338 101.384 55.830 1.00 4.69  84  M 1 \nATOM   1309 O  O    . ASP M  1 85  ? 139.747 102.533 56.005 1.00 4.69  84  M 1 \nATOM   1310 C  CB   . ASP M  1 85  ? 140.360 100.325 53.827 1.00 4.69  84  M 1 \nATOM   1311 C  CG   . ASP M  1 85  ? 140.159 99.642  52.493 1.00 4.69  84  M 1 \nATOM   1312 O  OD1  . ASP M  1 85  ? 139.068 99.089  52.247 1.00 4.69  84  M 1 \nATOM   1313 O  OD2  . ASP M  1 85  ? 141.111 99.651  51.689 1.00 4.69  84  M 1 \nATOM   1314 H  H    . ASP M  1 85  ? 
138.954 102.090 52.908 1.00 4.69  84  M 1 \nATOM   1315 H  HA   . ASP M  1 85  ? 138.430 100.116 54.494 1.00 4.69  84  M 1 \nATOM   1316 H  HB2  . ASP M  1 85  ? 140.983 101.059 53.707 1.00 4.69  84  M 1 \nATOM   1317 H  HB3  . ASP M  1 85  ? 140.739 99.671  54.435 1.00 4.69  84  M 1 \nATOM   1318 N  N    . ILE M  1 86  ? 139.106 100.539 56.825 1.00 3.70  85  M 1 \nATOM   1319 C  CA   . ILE M  1 86  ? 139.459 100.834 58.207 1.00 3.70  85  M 1 \nATOM   1320 C  C    . ILE M  1 86  ? 140.807 100.167 58.441 1.00 3.70  85  M 1 \nATOM   1321 O  O    . ILE M  1 86  ? 140.902 98.937  58.481 1.00 3.70  85  M 1 \nATOM   1322 C  CB   . ILE M  1 86  ? 138.405 100.331 59.202 1.00 3.70  85  M 1 \nATOM   1323 C  CG1  . ILE M  1 86  ? 137.025 100.939 58.911 1.00 3.70  85  M 1 \nATOM   1324 C  CG2  . ILE M  1 86  ? 138.841 100.699 60.622 1.00 3.70  85  M 1 \nATOM   1325 C  CD1  . ILE M  1 86  ? 135.886 100.255 59.630 1.00 3.70  85  M 1 \nATOM   1326 H  H    . ILE M  1 86  ? 138.741 99.767  56.719 1.00 3.70  85  M 1 \nATOM   1327 H  HA   . ILE M  1 86  ? 139.559 101.790 58.338 1.00 3.70  85  M 1 \nATOM   1328 H  HB   . ILE M  1 86  ? 138.343 99.365  59.135 1.00 3.70  85  M 1 \nATOM   1329 H  HG12 . ILE M  1 86  ? 137.028 101.876 59.163 1.00 3.70  85  M 1 \nATOM   1330 H  HG13 . ILE M  1 86  ? 136.822 100.870 57.965 1.00 3.70  85  M 1 \nATOM   1331 H  HG21 . ILE M  1 86  ? 138.100 100.616 61.243 1.00 3.70  85  M 1 \nATOM   1332 H  HG22 . ILE M  1 86  ? 139.559 100.111 60.906 1.00 3.70  85  M 1 \nATOM   1333 H  HG23 . ILE M  1 86  ? 139.154 101.617 60.629 1.00 3.70  85  M 1 \nATOM   1334 H  HD11 . ILE M  1 86  ? 135.049 100.509 59.210 1.00 3.70  85  M 1 \nATOM   1335 H  HD12 . ILE M  1 86  ? 136.000 99.294  59.564 1.00 3.70  85  M 1 \nATOM   1336 H  HD13 . ILE M  1 86  ? 135.882 100.509 60.566 1.00 3.70  85  M 1 \nATOM   1337 N  N    . LYS M  1 87  ? 141.853 100.969 58.576 1.00 4.77  86  M 1 \nATOM   1338 C  CA   . LYS M  1 87  ? 
143.193 100.423 58.707 1.00 4.77  86  M 1 \nATOM   1339 C  C    . LYS M  1 87  ? 143.363 99.744  60.060 1.00 4.77  86  M 1 \nATOM   1340 O  O    . LYS M  1 87  ? 142.782 100.155 61.065 1.00 4.77  86  M 1 \nATOM   1341 C  CB   . LYS M  1 87  ? 144.243 101.521 58.530 1.00 30.00 86  M 1 \nATOM   1342 C  CG   . LYS M  1 87  ? 144.208 102.201 57.170 1.00 30.00 86  M 1 \nATOM   1343 C  CD   . LYS M  1 87  ? 144.545 101.226 56.055 1.00 30.00 86  M 1 \nATOM   1344 C  CE   . LYS M  1 87  ? 144.582 101.921 54.704 1.00 30.00 86  M 1 \nATOM   1345 N  NZ   . LYS M  1 87  ? 144.888 100.972 53.599 1.00 30.00 86  M 1 \nATOM   1346 H  H    . LYS M  1 87  ? 141.807 101.827 58.599 1.00 4.77  86  M 1 \nATOM   1347 H  HA   . LYS M  1 87  ? 143.330 99.755  58.017 1.00 4.77  86  M 1 \nATOM   1348 N  N    . LYS M  1 88  ? 144.175 98.693  60.077 1.00 4.97  87  M 1 \nATOM   1349 C  CA   . LYS M  1 88  ? 144.415 97.973  61.311 1.00 4.97  87  M 1 \nATOM   1350 C  C    . LYS M  1 88  ? 145.153 98.877  62.302 1.00 4.97  87  M 1 \nATOM   1351 O  O    . LYS M  1 88  ? 145.866 99.795  61.895 1.00 4.97  87  M 1 \nATOM   1352 C  CB   . LYS M  1 88  ? 145.223 96.704  61.055 1.00 4.97  87  M 1 \nATOM   1353 C  CG   . LYS M  1 88  ? 146.628 96.926  60.549 1.00 4.97  87  M 1 \nATOM   1354 C  CD   . LYS M  1 88  ? 147.328 95.606  60.302 1.00 4.97  87  M 1 \nATOM   1355 C  CE   . LYS M  1 88  ? 148.741 95.814  59.822 1.00 4.97  87  M 1 \nATOM   1356 N  NZ   . LYS M  1 88  ? 149.425 94.518  59.579 1.00 4.97  87  M 1 \nATOM   1357 H  H    . LYS M  1 88  ? 144.595 98.383  59.393 1.00 4.97  87  M 1 \nATOM   1358 H  HA   . LYS M  1 88  ? 143.546 97.705  61.648 1.00 4.97  87  M 1 \nATOM   1359 H  HB2  . LYS M  1 88  ? 145.284 96.205  61.885 1.00 4.97  87  M 1 \nATOM   1360 H  HB3  . LYS M  1 88  ? 144.759 96.168  60.393 1.00 4.97  87  M 1 \nATOM   1361 H  HG2  . LYS M  1 88  ? 146.599 97.427  59.719 1.00 4.97  87  M 1 \nATOM   1362 H  HG3  . LYS M  1 88  ? 
147.152 97.407  61.209 1.00 4.97  87  M 1 \nATOM   1363 H  HD2  . LYS M  1 88  ? 147.360 95.100  61.129 1.00 4.97  87  M 1 \nATOM   1364 H  HD3  . LYS M  1 88  ? 146.855 95.105  59.619 1.00 4.97  87  M 1 \nATOM   1365 H  HE2  . LYS M  1 88  ? 148.727 96.320  58.995 1.00 4.97  87  M 1 \nATOM   1366 H  HE3  . LYS M  1 88  ? 149.236 96.296  60.503 1.00 4.97  87  M 1 \nATOM   1367 H  HZ1  . LYS M  1 88  ? 150.258 94.655  59.296 1.00 4.97  87  M 1 \nATOM   1368 H  HZ2  . LYS M  1 88  ? 149.448 94.051  60.337 1.00 4.97  87  M 1 \nATOM   1369 H  HZ3  . LYS M  1 88  ? 148.985 94.051  58.963 1.00 4.97  87  M 1 \nATOM   1370 N  N    . PRO M  1 89  ? 145.005 98.637  63.607 1.00 4.65  88  M 1 \nATOM   1371 C  CA   . PRO M  1 89  ? 145.751 99.442  64.578 1.00 4.65  88  M 1 \nATOM   1372 C  C    . PRO M  1 89  ? 147.253 99.252  64.431 1.00 4.65  88  M 1 \nATOM   1373 O  O    . PRO M  1 89  ? 147.727 98.300  63.811 1.00 4.65  88  M 1 \nATOM   1374 C  CB   . PRO M  1 89  ? 145.249 98.925  65.928 1.00 4.65  88  M 1 \nATOM   1375 C  CG   . PRO M  1 89  ? 143.930 98.331  65.641 1.00 4.65  88  M 1 \nATOM   1376 C  CD   . PRO M  1 89  ? 144.058 97.737  64.286 1.00 4.65  88  M 1 \nATOM   1377 H  HA   . PRO M  1 89  ? 145.536 100.384 64.490 1.00 4.65  88  M 1 \nATOM   1378 H  HB2  . PRO M  1 89  ? 145.858 98.253  66.272 1.00 4.65  88  M 1 \nATOM   1379 H  HB3  . PRO M  1 89  ? 145.173 99.666  66.549 1.00 4.65  88  M 1 \nATOM   1380 H  HG2  . PRO M  1 89  ? 143.743 97.634  66.289 1.00 4.65  88  M 1 \nATOM   1381 H  HG3  . PRO M  1 89  ? 143.239 99.011  65.663 1.00 4.65  88  M 1 \nATOM   1382 H  HD2  . PRO M  1 89  ? 144.416 96.837  64.330 1.00 4.65  88  M 1 \nATOM   1383 H  HD3  . PRO M  1 89  ? 143.192 97.751  63.850 1.00 4.65  88  M 1 \nATOM   1384 N  N    . ASP M  1 90  ? 148.000 100.181 65.028 1.00 6.42  89  M 1 \nATOM   1385 C  CA   . ASP M  1 90  ? 149.444 100.220 64.829 1.00 6.42  89  M 1 \nATOM   1386 C  C    . ASP M  1 90  ? 
150.160 99.064  65.521 1.00 6.42  89  M 1 \nATOM   1387 O  O    . ASP M  1 90  ? 151.321 98.786  65.205 1.00 6.42  89  M 1 \nATOM   1388 C  CB   . ASP M  1 90  ? 150.000 101.563 65.307 1.00 6.42  89  M 1 \nATOM   1389 C  CG   . ASP M  1 90  ? 149.765 101.813 66.789 1.00 6.42  89  M 1 \nATOM   1390 O  OD1  . ASP M  1 90  ? 149.098 100.993 67.452 1.00 6.42  89  M 1 \nATOM   1391 O  OD2  . ASP M  1 90  ? 150.256 102.842 67.298 1.00 6.42  89  M 1 \nATOM   1392 H  H    . ASP M  1 90  ? 147.692 100.794 65.546 1.00 6.42  89  M 1 \nATOM   1393 H  HA   . ASP M  1 90  ? 149.632 100.154 63.880 1.00 6.42  89  M 1 \nATOM   1394 H  HB2  . ASP M  1 90  ? 150.954 101.594 65.135 1.00 6.42  89  M 1 \nATOM   1395 H  HB3  . ASP M  1 90  ? 149.555 102.273 64.818 1.00 6.42  89  M 1 \nATOM   1396 N  N    . ARG M  1 91  ? 149.525 98.437  66.501 1.00 6.46  90  M 1 \nATOM   1397 C  CA   . ARG M  1 91  ? 150.159 97.302  67.210 1.00 6.46  90  M 1 \nATOM   1398 C  C    . ARG M  1 91  ? 149.116 96.345  67.771 1.00 6.46  90  M 1 \nATOM   1399 O  O    . ARG M  1 91  ? 147.959 96.741  67.965 1.00 6.46  90  M 1 \nATOM   1400 C  CB   . ARG M  1 91  ? 151.033 97.810  68.360 1.00 6.46  90  M 1 \nATOM   1401 C  CG   . ARG M  1 91  ? 150.288 98.636  69.392 1.00 6.46  90  M 1 \nATOM   1402 C  CD   . ARG M  1 91  ? 151.196 99.661  70.045 1.00 6.46  90  M 1 \nATOM   1403 N  NE   . ARG M  1 91  ? 152.000 99.066  71.096 1.00 6.46  90  M 1 \nATOM   1404 C  CZ   . ARG M  1 91  ? 152.762 99.746  71.952 1.00 6.46  90  M 1 \nATOM   1405 N  NH1  . ARG M  1 91  ? 152.826 101.065 71.888 1.00 6.46  90  M 1 \nATOM   1406 N  NH2  . ARG M  1 91  ? 153.443 99.097  72.877 1.00 6.46  90  M 1 \nATOM   1407 H  H    . ARG M  1 91  ? 148.725 98.709  66.841 1.00 6.46  90  M 1 \nATOM   1408 H  HA   . ARG M  1 91  ? 150.726 96.813  66.571 1.00 6.46  90  M 1 \nATOM   1409 H  HB2  . ARG M  1 91  ? 151.438 97.038  68.808 1.00 6.46  90  M 1 \nATOM   1410 H  HB3  . ARG M  1 91  ? 
151.757 98.353  67.985 1.00 6.46  90  M 1 \nATOM   1411 H  HG2  . ARG M  1 91  ? 149.539 99.099  68.960 1.00 6.46  90  M 1 \nATOM   1412 H  HG3  . ARG M  1 91  ? 149.923 98.043  70.083 1.00 6.46  90  M 1 \nATOM   1413 H  HD2  . ARG M  1 91  ? 151.787 100.051 69.366 1.00 6.46  90  M 1 \nATOM   1414 H  HD3  . ARG M  1 91  ? 150.651 100.384 70.423 1.00 6.46  90  M 1 \nATOM   1415 H  HE   . ARG M  1 91  ? 151.982 98.198  71.177 1.00 6.46  90  M 1 \nATOM   1416 H  HH11 . ARG M  1 91  ? 152.368 101.496 71.274 1.00 6.46  90  M 1 \nATOM   1417 H  HH12 . ARG M  1 91  ? 153.329 101.507 72.457 1.00 6.46  90  M 1 \nATOM   1418 H  HH21 . ARG M  1 91  ? 153.398 98.218  72.919 1.00 6.46  90  M 1 \nATOM   1419 H  HH22 . ARG M  1 91  ? 153.948 99.544  73.444 1.00 6.46  90  M 1 \nATOM   1420 N  N    . ASP M  1 92  ? 149.508 95.111  68.064 1.00 7.52  91  M 1 \nATOM   1421 C  CA   . ASP M  1 92  ? 148.594 94.135  68.707 1.00 7.52  91  M 1 \nATOM   1422 C  C    . ASP M  1 92  ? 149.003 94.016  70.176 1.00 7.52  91  M 1 \nATOM   1423 O  O    . ASP M  1 92  ? 148.133 93.680  70.973 1.00 7.52  91  M 1 \nATOM   1424 C  CB   . ASP M  1 92  ? 148.599 92.781  68.004 1.00 7.52  91  M 1 \nATOM   1425 C  CG   . ASP M  1 92  ? 149.977 92.479  67.459 1.00 7.52  91  M 1 \nATOM   1426 O  OD1  . ASP M  1 92  ? 150.923 92.558  68.246 1.00 7.52  91  M 1 \nATOM   1427 O  OD2  . ASP M  1 92  ? 150.093 92.229  66.240 1.00 7.52  91  M 1 \nATOM   1428 H  H    . ASP M  1 92  ? 150.363 94.825  67.949 1.00 7.52  91  M 1 \nATOM   1429 H  HA   . ASP M  1 92  ? 147.678 94.499  68.666 1.00 7.52  91  M 1 \nATOM   1430 H  HB2  . ASP M  1 92  ? 148.342 92.079  68.636 1.00 7.52  91  M 1 \nATOM   1431 H  HB3  . ASP M  1 92  ? 147.956 92.789  67.266 1.00 7.52  91  M 1 \nATOM   1432 N  N    . ASP M  1 93  ? 150.256 94.338  70.525 1.00 6.76  92  M 1 \nATOM   1433 C  CA   . ASP M  1 93  ? 150.729 94.272  71.901 1.00 6.76  92  M 1 \nATOM   1434 C  C    . ASP M  1 93  ? 
150.848 95.690  72.446 1.00 6.76  92  M 1 \nATOM   1435 O  O    . ASP M  1 93  ? 151.701 96.460  71.996 1.00 6.76  92  M 1 \nATOM   1436 C  CB   . ASP M  1 93  ? 152.072 93.541  71.962 1.00 6.76  92  M 1 \nATOM   1437 C  CG   . ASP M  1 93  ? 152.556 93.294  73.379 1.00 6.76  92  M 1 \nATOM   1438 O  OD1  . ASP M  1 93  ? 151.901 93.735  74.341 1.00 6.76  92  M 1 \nATOM   1439 O  OD2  . ASP M  1 93  ? 153.612 92.646  73.529 1.00 6.76  92  M 1 \nATOM   1440 H  H    . ASP M  1 93  ? 150.867 94.598  69.979 1.00 6.76  92  M 1 \nATOM   1441 H  HA   . ASP M  1 93  ? 150.095 93.777  72.443 1.00 6.76  92  M 1 \nATOM   1442 H  HB2  . ASP M  1 93  ? 151.972 92.679  71.528 1.00 6.76  92  M 1 \nATOM   1443 H  HB3  . ASP M  1 93  ? 152.743 94.066  71.499 1.00 6.76  92  M 1 \nATOM   1444 N  N    . TRP M  1 94  ? 149.999 96.024  73.413 1.00 4.79  93  M 1 \nATOM   1445 C  CA   . TRP M  1 94  ? 149.951 97.357  74.005 1.00 4.79  93  M 1 \nATOM   1446 C  C    . TRP M  1 94  ? 150.818 97.490  75.257 1.00 4.79  93  M 1 \nATOM   1447 O  O    . TRP M  1 94  ? 150.931 98.589  75.800 1.00 4.79  93  M 1 \nATOM   1448 C  CB   . TRP M  1 94  ? 148.495 97.714  74.308 1.00 4.79  93  M 1 \nATOM   1449 C  CG   . TRP M  1 94  ? 147.719 97.784  73.062 1.00 4.79  93  M 1 \nATOM   1450 C  CD1  . TRP M  1 94  ? 146.925 96.817  72.544 1.00 4.79  93  M 1 \nATOM   1451 C  CD2  . TRP M  1 94  ? 147.702 98.862  72.130 1.00 4.79  93  M 1 \nATOM   1452 N  NE1  . TRP M  1 94  ? 146.394 97.228  71.353 1.00 4.79  93  M 1 \nATOM   1453 C  CE2  . TRP M  1 94  ? 146.862 98.483  71.073 1.00 4.79  93  M 1 \nATOM   1454 C  CE3  . TRP M  1 94  ? 148.312 100.113 72.090 1.00 4.79  93  M 1 \nATOM   1455 C  CZ2  . TRP M  1 94  ? 146.612 99.311  69.994 1.00 4.79  93  M 1 \nATOM   1456 C  CZ3  . TRP M  1 94  ? 148.066 100.930 71.015 1.00 4.79  93  M 1 \nATOM   1457 C  CH2  . TRP M  1 94  ? 147.222 100.529 69.984 1.00 4.79  93  M 1 \nATOM   1458 H  H    . TRP M  1 94  ? 
149.420 95.479  73.741 1.00 4.79  93  M 1 \nATOM   1459 H  HA   . TRP M  1 94  ? 150.269 98.003  73.356 1.00 4.79  93  M 1 \nATOM   1460 H  HB2  . TRP M  1 94  ? 148.102 97.033  74.876 1.00 4.79  93  M 1 \nATOM   1461 H  HB3  . TRP M  1 94  ? 148.451 98.582  74.739 1.00 4.79  93  M 1 \nATOM   1462 H  HD1  . TRP M  1 94  ? 146.766 95.992  72.944 1.00 4.79  93  M 1 \nATOM   1463 H  HE1  . TRP M  1 94  ? 145.858 96.772  70.859 1.00 4.79  93  M 1 \nATOM   1464 H  HE3  . TRP M  1 94  ? 148.878 100.387 72.775 1.00 4.79  93  M 1 \nATOM   1465 H  HZ2  . TRP M  1 94  ? 146.050 99.045  69.303 1.00 4.79  93  M 1 \nATOM   1466 H  HZ3  . TRP M  1 94  ? 148.466 101.769 70.978 1.00 4.79  93  M 1 \nATOM   1467 H  HH2  . TRP M  1 94  ? 147.074 101.107 69.270 1.00 4.79  93  M 1 \nATOM   1468 N  N    . GLU M  1 95  ? 151.384 96.385  75.738 1.00 6.28  94  M 1 \nATOM   1469 C  CA   . GLU M  1 95  ? 152.486 96.279  76.696 1.00 6.28  94  M 1 \nATOM   1470 C  C    . GLU M  1 95  ? 152.172 96.600  78.151 1.00 6.28  94  M 1 \nATOM   1471 O  O    . GLU M  1 95  ? 152.860 96.079  79.032 1.00 6.28  94  M 1 \nATOM   1472 C  CB   . GLU M  1 95  ? 153.654 97.191  76.296 1.00 6.28  94  M 1 \nATOM   1473 C  CG   . GLU M  1 95  ? 154.410 96.800  75.049 1.00 6.28  94  M 1 \nATOM   1474 C  CD   . GLU M  1 95  ? 155.561 97.748  74.768 1.00 6.28  94  M 1 \nATOM   1475 O  OE1  . GLU M  1 95  ? 155.686 98.769  75.478 1.00 6.28  94  M 1 \nATOM   1476 O  OE2  . GLU M  1 95  ? 156.334 97.480  73.823 1.00 6.28  94  M 1 \nATOM   1477 H  H    . GLU M  1 95  ? 151.108 95.601  75.516 1.00 6.28  94  M 1 \nATOM   1478 H  HA   . GLU M  1 95  ? 152.814 95.366  76.679 1.00 6.28  94  M 1 \nATOM   1479 H  HB2  . GLU M  1 95  ? 153.340 98.102  76.181 1.00 6.28  94  M 1 \nATOM   1480 H  HB3  . GLU M  1 95  ? 154.302 97.181  77.018 1.00 6.28  94  M 1 \nATOM   1481 H  HG2  . GLU M  1 95  ? 154.776 95.909  75.164 1.00 6.28  94  M 1 \nATOM   1482 H  HG3  . GLU M  1 95  ? 
153.808 96.816  74.289 1.00 6.28  94  M 1 \nATOM   1483 N  N    . SER M  1 96  ? 151.102 97.336  78.433 1.00 4.95  95  M 1 \nATOM   1484 C  CA   . SER M  1 96  ? 150.767 97.707  79.804 1.00 4.95  95  M 1 \nATOM   1485 C  C    . SER M  1 96  ? 149.509 98.565  79.794 1.00 4.95  95  M 1 \nATOM   1486 O  O    . SER M  1 96  ? 149.121 99.130  78.771 1.00 4.95  95  M 1 \nATOM   1487 C  CB   . SER M  1 96  ? 151.907 98.467  80.503 1.00 4.95  95  M 1 \nATOM   1488 O  OG   . SER M  1 96  ? 152.134 99.722  79.901 1.00 4.95  95  M 1 \nATOM   1489 H  H    . SER M  1 96  ? 150.553 97.645  77.848 1.00 4.95  95  M 1 \nATOM   1490 H  HA   . SER M  1 96  ? 150.583 96.900  80.310 1.00 4.95  95  M 1 \nATOM   1491 H  HB2  . SER M  1 96  ? 151.648 98.620  81.425 1.00 4.95  95  M 1 \nATOM   1492 H  HB3  . SER M  1 96  ? 152.735 97.962  80.503 1.00 4.95  95  M 1 \nATOM   1493 H  HG   . SER M  1 96  ? 152.947 99.803  79.704 1.00 4.95  95  M 1 \nATOM   1494 N  N    . GLY M  1 97  ? 148.886 98.664  80.967 1.00 4.08  96  M 1 \nATOM   1495 C  CA   . GLY M  1 97  ? 147.786 99.597  81.142 1.00 4.08  96  M 1 \nATOM   1496 C  C    . GLY M  1 97  ? 148.198 101.035 80.900 1.00 4.08  96  M 1 \nATOM   1497 O  O    . GLY M  1 97  ? 147.507 101.781 80.204 1.00 4.08  96  M 1 \nATOM   1498 H  H    . GLY M  1 97  ? 149.080 98.206  81.669 1.00 4.08  96  M 1 \nATOM   1499 H  HA2  . GLY M  1 97  ? 147.044 99.362  80.564 1.00 4.08  96  M 1 \nATOM   1500 H  HA3  . GLY M  1 97  ? 147.481 99.547  82.062 1.00 4.08  96  M 1 \nATOM   1501 N  N    . LEU M  1 98  ? 149.324 101.444 81.487 1.00 4.35  97  M 1 \nATOM   1502 C  CA   . LEU M  1 98  ? 149.821 102.805 81.323 1.00 4.35  97  M 1 \nATOM   1503 C  C    . LEU M  1 98  ? 150.076 103.129 79.861 1.00 4.35  97  M 1 \nATOM   1504 O  O    . LEU M  1 98  ? 149.678 104.190 79.371 1.00 4.35  97  M 1 \nATOM   1505 C  CB   . LEU M  1 98  ? 151.098 102.993 82.141 1.00 4.35  97  M 1 \nATOM   1506 C  CG   . LEU M  1 98  ? 
151.816 104.337 82.014 1.00 4.35  97  M 1 \nATOM   1507 C  CD1  . LEU M  1 98  ? 150.932 105.487 82.425 1.00 4.35  97  M 1 \nATOM   1508 C  CD2  . LEU M  1 98  ? 153.073 104.329 82.842 1.00 4.35  97  M 1 \nATOM   1509 H  H    . LEU M  1 98  ? 149.820 100.947 81.983 1.00 4.35  97  M 1 \nATOM   1510 H  HA   . LEU M  1 98  ? 149.157 103.427 81.660 1.00 4.35  97  M 1 \nATOM   1511 H  HB2  . LEU M  1 98  ? 150.874 102.876 83.078 1.00 4.35  97  M 1 \nATOM   1512 H  HB3  . LEU M  1 98  ? 151.731 102.304 81.884 1.00 4.35  97  M 1 \nATOM   1513 H  HG   . LEU M  1 98  ? 152.095 104.478 81.096 1.00 4.35  97  M 1 \nATOM   1514 H  HD11 . LEU M  1 98  ? 151.461 106.299 82.385 1.00 4.35  97  M 1 \nATOM   1515 H  HD12 . LEU M  1 98  ? 150.183 105.557 81.812 1.00 4.35  97  M 1 \nATOM   1516 H  HD13 . LEU M  1 98  ? 150.611 105.342 83.329 1.00 4.35  97  M 1 \nATOM   1517 H  HD21 . LEU M  1 98  ? 153.583 105.131 82.647 1.00 4.35  97  M 1 \nATOM   1518 H  HD22 . LEU M  1 98  ? 152.832 104.310 83.781 1.00 4.35  97  M 1 \nATOM   1519 H  HD23 . LEU M  1 98  ? 153.598 103.545 82.616 1.00 4.35  97  M 1 \nATOM   1520 N  N    . ASN M  1 99  ? 150.760 102.206 79.194 1.00 4.75  98  M 1 \nATOM   1521 C  CA   . ASN M  1 99  ? 151.113 102.418 77.769 1.00 4.75  98  M 1 \nATOM   1522 C  C    . ASN M  1 99  ? 149.818 102.556 76.966 1.00 4.75  98  M 1 \nATOM   1523 O  O    . ASN M  1 99  ? 149.706 103.465 76.165 1.00 4.75  98  M 1 \nATOM   1524 C  CB   . ASN M  1 99  ? 151.972 101.305 77.182 1.00 4.75  98  M 1 \nATOM   1525 C  CG   . ASN M  1 99  ? 152.324 101.638 75.750 1.00 4.75  98  M 1 \nATOM   1526 O  OD1  . ASN M  1 99  ? 152.887 102.690 75.506 1.00 4.75  98  M 1 \nATOM   1527 N  ND2  . ASN M  1 99  ? 152.012 100.765 74.813 1.00 4.75  98  M 1 \nATOM   1528 H  H    . ASN M  1 99  ? 150.924 101.371 79.514 1.00 4.75  98  M 1 \nATOM   1529 H  HA   . ASN M  1 99  ? 151.621 103.260 77.698 1.00 4.75  98  M 1 \nATOM   1530 H  HB2  . ASN M  1 99  ? 
152.791 101.209 77.709 1.00 4.75  98  M 1 \nATOM   1531 H  HB3  . ASN M  1 99  ? 151.479 100.460 77.212 1.00 4.75  98  M 1 \nATOM   1532 H  HD21 . ASN M  1 99  ? 152.223 100.926 73.970 1.00 4.75  98  M 1 \nATOM   1533 H  HD22 . ASN M  1 99  ? 151.592 100.017 75.028 1.00 4.75  98  M 1 \nATOM   1534 N  N    . ALA M  1 100 ? 148.838 101.713 77.239 1.00 3.93  99  M 1 \nATOM   1535 C  CA   . ALA M  1 100 ? 147.559 101.755 76.541 1.00 3.93  99  M 1 \nATOM   1536 C  C    . ALA M  1 100 ? 146.852 103.084 76.778 1.00 3.93  99  M 1 \nATOM   1537 O  O    . ALA M  1 100 ? 146.297 103.679 75.850 1.00 3.93  99  M 1 \nATOM   1538 C  CB   . ALA M  1 100 ? 146.675 100.583 76.973 1.00 3.93  99  M 1 \nATOM   1539 H  H    . ALA M  1 100 ? 148.889 101.110 77.850 1.00 3.93  99  M 1 \nATOM   1540 H  HA   . ALA M  1 100 ? 147.721 101.661 75.589 1.00 3.93  99  M 1 \nATOM   1541 H  HB1  . ALA M  1 100 ? 145.808 100.671 76.547 1.00 3.93  99  M 1 \nATOM   1542 H  HB2  . ALA M  1 100 ? 147.087 99.751  76.692 1.00 3.93  99  M 1 \nATOM   1543 H  HB3  . ALA M  1 100 ? 146.559 100.585 77.936 1.00 3.93  99  M 1 \nATOM   1544 N  N    . MET M  1 101 ? 146.875 103.575 78.018 1.00 3.66  100 M 1 \nATOM   1545 C  CA   . MET M  1 101 ? 146.250 104.859 78.321 1.00 3.66  100 M 1 \nATOM   1546 C  C    . MET M  1 101 ? 146.962 106.005 77.611 1.00 3.66  100 M 1 \nATOM   1547 O  O    . MET M  1 101 ? 146.317 106.935 77.120 1.00 3.66  100 M 1 \nATOM   1548 C  CB   . MET M  1 101 ? 146.231 105.092 79.833 1.00 3.66  100 M 1 \nATOM   1549 C  CG   . MET M  1 101 ? 145.292 104.199 80.617 1.00 3.66  100 M 1 \nATOM   1550 S  SD   . MET M  1 101 ? 143.559 104.519 80.234 1.00 3.66  100 M 1 \nATOM   1551 C  CE   . MET M  1 101 ? 142.752 103.227 81.176 1.00 3.66  100 M 1 \nATOM   1552 H  H    . MET M  1 101 ? 147.250 103.190 78.690 1.00 3.66  100 M 1 \nATOM   1553 H  HA   . MET M  1 101 ? 145.330 104.834 78.013 1.00 3.66  100 M 1 \nATOM   1554 H  HB2  . MET M  1 101 ? 
147.126 104.958 80.182 1.00 3.66  100 M 1 \nATOM   1555 H  HB3  . MET M  1 101 ? 145.954 106.006 80.000 1.00 3.66  100 M 1 \nATOM   1556 H  HG2  . MET M  1 101 ? 145.479 103.273 80.397 1.00 3.66  100 M 1 \nATOM   1557 H  HG3  . MET M  1 101 ? 145.427 104.340 81.567 1.00 3.66  100 M 1 \nATOM   1558 H  HE1  . MET M  1 101 ? 141.803 103.421 81.221 1.00 3.66  100 M 1 \nATOM   1559 H  HE2  . MET M  1 101 ? 142.900 102.372 80.743 1.00 3.66  100 M 1 \nATOM   1560 H  HE3  . MET M  1 101 ? 143.121 103.207 82.073 1.00 3.66  100 M 1 \nATOM   1561 N  N    . GLU M  1 102 ? 148.293 105.953 77.550 1.00 4.25  101 M 1 \nATOM   1562 C  CA   . GLU M  1 102 ? 149.059 106.982 76.855 1.00 4.25  101 M 1 \nATOM   1563 C  C    . GLU M  1 102 ? 148.734 106.993 75.366 1.00 4.25  101 M 1 \nATOM   1564 O  O    . GLU M  1 102 ? 148.533 108.059 74.766 1.00 4.25  101 M 1 \nATOM   1565 C  CB   . GLU M  1 102 ? 150.554 106.754 77.092 1.00 4.25  101 M 1 \nATOM   1566 C  CG   . GLU M  1 102 ? 151.008 107.015 78.528 1.00 4.25  101 M 1 \nATOM   1567 C  CD   . GLU M  1 102 ? 152.467 106.671 78.766 1.00 4.25  101 M 1 \nATOM   1568 O  OE1  . GLU M  1 102 ? 153.102 106.091 77.863 1.00 4.25  101 M 1 \nATOM   1569 O  OE2  . GLU M  1 102 ? 152.977 106.981 79.862 1.00 4.25  101 M 1 \nATOM   1570 H  H    . GLU M  1 102 ? 148.774 105.332 77.901 1.00 4.25  101 M 1 \nATOM   1571 H  HA   . GLU M  1 102 ? 148.837 107.850 77.227 1.00 4.25  101 M 1 \nATOM   1572 H  HB2  . GLU M  1 102 ? 150.781 105.839 76.862 1.00 4.25  101 M 1 \nATOM   1573 H  HB3  . GLU M  1 102 ? 151.049 107.359 76.518 1.00 4.25  101 M 1 \nATOM   1574 H  HG2  . GLU M  1 102 ? 150.901 107.961 78.712 1.00 4.25  101 M 1 \nATOM   1575 H  HG3  . GLU M  1 102 ? 150.471 106.507 79.156 1.00 4.25  101 M 1 \nATOM   1576 N  N    . CYS M  1 103 ? 148.657 105.810 74.757 1.00 4.27  102 M 1 \nATOM   1577 C  CA   . CYS M  1 103 ? 148.305 105.715 73.345 1.00 4.27  102 M 1 \nATOM   1578 C  C    . CYS M  1 103 ? 
146.880 106.192 73.098 1.00 4.27  102 M 1 \nATOM   1579 O  O    . CYS M  1 103 ? 146.597 106.836 72.083 1.00 4.27  102 M 1 \nATOM   1580 C  CB   . CYS M  1 103 ? 148.489 104.281 72.869 1.00 4.27  102 M 1 \nATOM   1581 S  SG   . CYS M  1 103 ? 150.209 103.771 72.899 1.00 4.27  102 M 1 \nATOM   1582 H  H    . CYS M  1 103 ? 148.795 105.055 75.144 1.00 4.27  102 M 1 \nATOM   1583 H  HA   . CYS M  1 103 ? 148.905 106.272 72.824 1.00 4.27  102 M 1 \nATOM   1584 H  HB2  . CYS M  1 103 ? 147.991 103.688 73.453 1.00 4.27  102 M 1 \nATOM   1585 H  HB3  . CYS M  1 103 ? 148.161 104.199 71.960 1.00 4.27  102 M 1 \nATOM   1586 H  HG   . CYS M  1 103 ? 150.444 103.312 73.983 1.00 4.27  102 M 1 \nATOM   1587 N  N    . ALA M  1 104 ? 145.972 105.900 74.029 1.00 3.59  103 M 1 \nATOM   1588 C  CA   . ALA M  1 104 ? 144.597 106.367 73.899 1.00 3.59  103 M 1 \nATOM   1589 C  C    . ALA M  1 104 ? 144.523 107.884 74.011 1.00 3.59  103 M 1 \nATOM   1590 O  O    . ALA M  1 104 ? 143.741 108.529 73.307 1.00 3.59  103 M 1 \nATOM   1591 C  CB   . ALA M  1 104 ? 143.717 105.700 74.952 1.00 3.59  103 M 1 \nATOM   1592 H  H    . ALA M  1 104 ? 146.139 105.455 74.746 1.00 3.59  103 M 1 \nATOM   1593 H  HA   . ALA M  1 104 ? 144.259 106.114 73.026 1.00 3.59  103 M 1 \nATOM   1594 H  HB1  . ALA M  1 104 ? 142.844 106.122 74.943 1.00 3.59  103 M 1 \nATOM   1595 H  HB2  . ALA M  1 104 ? 143.625 104.758 74.741 1.00 3.59  103 M 1 \nATOM   1596 H  HB3  . ALA M  1 104 ? 144.128 105.802 75.825 1.00 3.59  103 M 1 \nATOM   1597 N  N    . LEU M  1 105 ? 145.337 108.468 74.889 1.00 3.78  104 M 1 \nATOM   1598 C  CA   . LEU M  1 105 ? 145.427 109.922 74.991 1.00 3.78  104 M 1 \nATOM   1599 C  C    . LEU M  1 105 ? 145.897 110.530 73.678 1.00 3.78  104 M 1 \nATOM   1600 O  O    . LEU M  1 105 ? 145.317 111.505 73.182 1.00 3.78  104 M 1 \nATOM   1601 C  CB   . LEU M  1 105 ? 146.367 110.302 76.139 1.00 3.78  104 M 1 \nATOM   1602 C  CG   . LEU M  1 105 ? 
146.670 111.778 76.392 1.00 3.78  104 M 1 \nATOM   1603 C  CD1  . LEU M  1 105 ? 145.424 112.550 76.719 1.00 3.78  104 M 1 \nATOM   1604 C  CD2  . LEU M  1 105 ? 147.682 111.933 77.520 1.00 3.78  104 M 1 \nATOM   1605 H  H    . LEU M  1 105 ? 145.854 108.045 75.430 1.00 3.78  104 M 1 \nATOM   1606 H  HA   . LEU M  1 105 ? 144.547 110.272 75.200 1.00 3.78  104 M 1 \nATOM   1607 H  HB2  . LEU M  1 105 ? 145.973 109.969 76.960 1.00 3.78  104 M 1 \nATOM   1608 H  HB3  . LEU M  1 105 ? 147.217 109.853 76.006 1.00 3.78  104 M 1 \nATOM   1609 H  HG   . LEU M  1 105 ? 147.066 112.161 75.594 1.00 3.78  104 M 1 \nATOM   1610 H  HD11 . LEU M  1 105 ? 145.649 113.493 76.738 1.00 3.78  104 M 1 \nATOM   1611 H  HD12 . LEU M  1 105 ? 144.751 112.394 76.038 1.00 3.78  104 M 1 \nATOM   1612 H  HD13 . LEU M  1 105 ? 145.089 112.268 77.584 1.00 3.78  104 M 1 \nATOM   1613 H  HD21 . LEU M  1 105 ? 147.677 112.852 77.830 1.00 3.78  104 M 1 \nATOM   1614 H  HD22 . LEU M  1 105 ? 147.440 111.344 78.251 1.00 3.78  104 M 1 \nATOM   1615 H  HD23 . LEU M  1 105 ? 148.565 111.701 77.193 1.00 3.78  104 M 1 \nATOM   1616 N  N    . HIS M  1 106 ? 146.934 109.922 73.114 1.00 4.28  105 M 1 \nATOM   1617 C  CA   . HIS M  1 106 ? 147.520 110.383 71.834 1.00 4.28  105 M 1 \nATOM   1618 C  C    . HIS M  1 106 ? 146.438 110.299 70.751 1.00 4.28  105 M 1 \nATOM   1619 O  O    . HIS M  1 106 ? 146.286 111.244 70.023 1.00 4.28  105 M 1 \nATOM   1620 C  CB   . HIS M  1 106 ? 148.773 109.591 71.459 1.00 4.28  105 M 1 \nATOM   1621 C  CG   . HIS M  1 106 ? 149.411 110.133 70.226 1.00 4.28  105 M 1 \nATOM   1622 N  ND1  . HIS M  1 106 ? 150.540 110.923 70.253 1.00 4.28  105 M 1 \nATOM   1623 C  CD2  . HIS M  1 106 ? 149.036 110.055 68.935 1.00 4.28  105 M 1 \nATOM   1624 C  CE1  . HIS M  1 106 ? 150.858 111.276 69.023 1.00 4.28  105 M 1 \nATOM   1625 N  NE2  . HIS M  1 106 ? 149.945 110.764 68.197 1.00 4.28  105 M 1 \nATOM   1626 H  H    . HIS M  1 106 ? 
147.356 109.193 73.463 1.00 4.28  105 M 1 \nATOM   1627 H  HA   . HIS M  1 106 ? 147.772 111.331 71.941 1.00 4.28  105 M 1 \nATOM   1628 H  HB2  . HIS M  1 106 ? 149.416 109.629 72.202 1.00 4.28  105 M 1 \nATOM   1629 H  HB3  . HIS M  1 106 ? 148.531 108.650 71.313 1.00 4.28  105 M 1 \nATOM   1630 H  HD2  . HIS M  1 106 ? 148.293 109.590 68.597 1.00 4.28  105 M 1 \nATOM   1631 H  HE1  . HIS M  1 106 ? 151.595 111.806 68.774 1.00 4.28  105 M 1 \nATOM   1632 H  HE2  . HIS M  1 106 ? 149.939 110.854 67.325 1.00 4.28  105 M 1 \nATOM   1633 N  N    . LEU M  1 107 ? 145.669 109.220 70.709 1.00 3.81  106 M 1 \nATOM   1634 C  CA   . LEU M  1 107 ? 144.621 109.008 69.718 1.00 3.81  106 M 1 \nATOM   1635 C  C    . LEU M  1 107 ? 143.511 110.042 69.856 1.00 3.81  106 M 1 \nATOM   1636 O  O    . LEU M  1 107 ? 143.052 110.622 68.865 1.00 3.81  106 M 1 \nATOM   1637 C  CB   . LEU M  1 107 ? 144.061 107.593 69.870 1.00 3.81  106 M 1 \nATOM   1638 C  CG   . LEU M  1 107 ? 142.912 107.169 68.954 1.00 3.81  106 M 1 \nATOM   1639 C  CD1  . LEU M  1 107 ? 143.350 107.247 67.519 1.00 3.81  106 M 1 \nATOM   1640 C  CD2  . LEU M  1 107 ? 142.426 105.770 69.294 1.00 3.81  106 M 1 \nATOM   1641 H  H    . LEU M  1 107 ? 145.758 108.572 71.268 1.00 3.81  106 M 1 \nATOM   1642 H  HA   . LEU M  1 107 ? 145.012 109.084 68.834 1.00 3.81  106 M 1 \nATOM   1643 H  HB2  . LEU M  1 107 ? 144.787 106.968 69.716 1.00 3.81  106 M 1 \nATOM   1644 H  HB3  . LEU M  1 107 ? 143.748 107.493 70.783 1.00 3.81  106 M 1 \nATOM   1645 H  HG   . LEU M  1 107 ? 142.159 107.768 69.075 1.00 3.81  106 M 1 \nATOM   1646 H  HD11 . LEU M  1 107 ? 142.668 106.841 66.962 1.00 3.81  106 M 1 \nATOM   1647 H  HD12 . LEU M  1 107 ? 143.463 108.179 67.276 1.00 3.81  106 M 1 \nATOM   1648 H  HD13 . LEU M  1 107 ? 144.193 106.777 67.423 1.00 3.81  106 M 1 \nATOM   1649 H  HD21 . LEU M  1 107 ? 141.544 105.640 68.911 1.00 3.81  106 M 1 \nATOM   1650 H  HD22 . LEU M  1 107 ? 
143.047 105.123 68.923 1.00 3.81  106 M 1 \nATOM   1651 H  HD23 . LEU M  1 107 ? 142.374 105.669 70.257 1.00 3.81  106 M 1 \nATOM   1652 N  N    . GLU M  1 108 ? 143.069 110.235 71.091 1.00 4.12  107 M 1 \nATOM   1653 C  CA   . GLU M  1 108 ? 141.969 111.176 71.413 1.00 4.12  107 M 1 \nATOM   1654 C  C    . GLU M  1 108 ? 142.399 112.588 70.991 1.00 4.12  107 M 1 \nATOM   1655 O  O    . GLU M  1 108 ? 141.596 113.279 70.406 1.00 4.12  107 M 1 \nATOM   1656 C  CB   . GLU M  1 108 ? 141.587 111.054 72.884 1.00 4.12  107 M 1 \nATOM   1657 C  CG   . GLU M  1 108 ? 140.923 109.727 73.206 1.00 4.12  107 M 1 \nATOM   1658 C  CD   . GLU M  1 108 ? 139.792 109.399 72.241 1.00 4.12  107 M 1 \nATOM   1659 O  OE1  . GLU M  1 108 ? 138.811 110.143 72.219 1.00 4.12  107 M 1 \nATOM   1660 O  OE2  . GLU M  1 108 ? 139.909 108.409 71.485 1.00 4.12  107 M 1 \nATOM   1661 H  H    . GLU M  1 108 ? 143.492 109.895 71.822 1.00 4.12  107 M 1 \nATOM   1662 H  HA   . GLU M  1 108 ? 141.187 110.921 70.871 1.00 4.12  107 M 1 \nATOM   1663 H  HB2  . GLU M  1 108 ? 142.395 111.150 73.430 1.00 4.12  107 M 1 \nATOM   1664 H  HB3  . GLU M  1 108 ? 140.975 111.784 73.114 1.00 4.12  107 M 1 \nATOM   1665 H  HG2  . GLU M  1 108 ? 141.592 109.010 73.166 1.00 4.12  107 M 1 \nATOM   1666 H  HG3  . GLU M  1 108 ? 140.564 109.755 74.118 1.00 4.12  107 M 1 \nATOM   1667 N  N    . LYS M  1 109 ? 143.643 112.984 71.226 1.00 4.42  108 M 1 \nATOM   1668 C  CA   . LYS M  1 109 ? 144.089 114.320 70.843 1.00 4.42  108 M 1 \nATOM   1669 C  C    . LYS M  1 109 ? 144.176 114.453 69.325 1.00 4.42  108 M 1 \nATOM   1670 O  O    . LYS M  1 109 ? 143.880 115.518 68.773 1.00 4.42  108 M 1 \nATOM   1671 C  CB   . LYS M  1 109 ? 145.424 114.669 71.504 1.00 4.42  108 M 1 \nATOM   1672 C  CG   . LYS M  1 109 ? 145.316 114.840 73.017 1.00 4.42  108 M 1 \nATOM   1673 C  CD   . LYS M  1 109 ? 146.618 115.261 73.686 1.00 4.42  108 M 1 \nATOM   1674 C  CE   . LYS M  1 109 ? 
146.896 116.730 73.440 1.00 4.42  108 M 1 \nATOM   1675 N  NZ   . LYS M  1 109 ? 148.084 117.253 74.164 1.00 4.42  108 M 1 \nATOM   1676 H  H    . LYS M  1 109 ? 144.242 112.493 71.600 1.00 4.42  108 M 1 \nATOM   1677 H  HA   . LYS M  1 109 ? 143.439 114.968 71.158 1.00 4.42  108 M 1 \nATOM   1678 H  HB2  . LYS M  1 109 ? 146.060 113.958 71.328 1.00 4.42  108 M 1 \nATOM   1679 H  HB3  . LYS M  1 109 ? 145.752 115.499 71.124 1.00 4.42  108 M 1 \nATOM   1680 H  HG2  . LYS M  1 109 ? 144.645 115.513 73.209 1.00 4.42  108 M 1 \nATOM   1681 H  HG3  . LYS M  1 109 ? 145.041 114.001 73.418 1.00 4.42  108 M 1 \nATOM   1682 H  HD2  . LYS M  1 109 ? 146.543 115.125 74.644 1.00 4.42  108 M 1 \nATOM   1683 H  HD3  . LYS M  1 109 ? 147.358 114.745 73.330 1.00 4.42  108 M 1 \nATOM   1684 H  HE2  . LYS M  1 109 ? 147.028 116.881 72.491 1.00 4.42  108 M 1 \nATOM   1685 H  HE3  . LYS M  1 109 ? 146.130 117.236 73.754 1.00 4.42  108 M 1 \nATOM   1686 H  HZ1  . LYS M  1 109 ? 147.963 118.112 74.361 1.00 4.42  108 M 1 \nATOM   1687 H  HZ2  . LYS M  1 109 ? 148.197 116.799 74.921 1.00 4.42  108 M 1 \nATOM   1688 H  HZ3  . LYS M  1 109 ? 148.814 117.172 73.661 1.00 4.42  108 M 1 \nATOM   1689 N  N    . SER M  1 110 ? 144.542 113.374 68.629 1.00 4.37  109 M 1 \nATOM   1690 C  CA   . SER M  1 110 ? 144.545 113.402 67.165 1.00 4.37  109 M 1 \nATOM   1691 C  C    . SER M  1 110 ? 143.136 113.581 66.609 1.00 4.37  109 M 1 \nATOM   1692 O  O    . SER M  1 110 ? 142.915 114.377 65.684 1.00 4.37  109 M 1 \nATOM   1693 C  CB   . SER M  1 110 ? 145.161 112.117 66.620 1.00 4.37  109 M 1 \nATOM   1694 O  OG   . SER M  1 110 ? 144.341 111.009 66.927 1.00 4.37  109 M 1 \nATOM   1695 H  H    . SER M  1 110 ? 144.787 112.625 68.973 1.00 4.37  109 M 1 \nATOM   1696 H  HA   . SER M  1 110 ? 145.089 114.145 66.862 1.00 4.37  109 M 1 \nATOM   1697 H  HB2  . SER M  1 110 ? 145.240 112.181 65.655 1.00 4.37  109 M 1 \nATOM   1698 H  HB3  . SER M  1 110 ? 
146.039 111.988 67.011 1.00 4.37  109 M 1 \nATOM   1699 H  HG   . SER M  1 110 ? 144.057 111.077 67.715 1.00 4.37  109 M 1 \nATOM   1700 N  N    . VAL M  1 111 ? 142.176 112.838 67.158 1.00 4.23  110 M 1 \nATOM   1701 C  CA   . VAL M  1 111 ? 140.783 112.978 66.746 1.00 4.23  110 M 1 \nATOM   1702 C  C    . VAL M  1 111 ? 140.298 114.398 67.013 1.00 4.23  110 M 1 \nATOM   1703 O  O    . VAL M  1 111 ? 139.589 114.998 66.193 1.00 4.23  110 M 1 \nATOM   1704 C  CB   . VAL M  1 111 ? 139.905 111.926 67.453 1.00 4.23  110 M 1 \nATOM   1705 C  CG1  . VAL M  1 111 ? 138.430 112.153 67.153 1.00 4.23  110 M 1 \nATOM   1706 C  CG2  . VAL M  1 111 ? 140.296 110.511 67.023 1.00 4.23  110 M 1 \nATOM   1707 H  H    . VAL M  1 111 ? 142.302 112.255 67.777 1.00 4.23  110 M 1 \nATOM   1708 H  HA   . VAL M  1 111 ? 140.727 112.817 65.791 1.00 4.23  110 M 1 \nATOM   1709 H  HB   . VAL M  1 111 ? 140.028 111.997 68.412 1.00 4.23  110 M 1 \nATOM   1710 H  HG11 . VAL M  1 111 ? 137.929 111.367 67.422 1.00 4.23  110 M 1 \nATOM   1711 H  HG12 . VAL M  1 111 ? 138.098 112.918 67.649 1.00 4.23  110 M 1 \nATOM   1712 H  HG13 . VAL M  1 111 ? 138.322 112.290 66.199 1.00 4.23  110 M 1 \nATOM   1713 H  HG21 . VAL M  1 111 ? 139.830 109.881 67.595 1.00 4.23  110 M 1 \nATOM   1714 H  HG22 . VAL M  1 111 ? 140.028 110.373 66.101 1.00 4.23  110 M 1 \nATOM   1715 H  HG23 . VAL M  1 111 ? 141.253 110.372 67.097 1.00 4.23  110 M 1 \nATOM   1716 N  N    . ASN M  1 112 ? 140.717 114.929 68.153 1.00 4.52  111 M 1 \nATOM   1717 C  CA   . ASN M  1 112 ? 140.342 116.303 68.560 1.00 4.52  111 M 1 \nATOM   1718 C  C    . ASN M  1 112 ? 140.887 117.288 67.517 1.00 4.52  111 M 1 \nATOM   1719 O  O    . ASN M  1 112 ? 140.143 118.121 67.037 1.00 4.52  111 M 1 \nATOM   1720 C  CB   . ASN M  1 112 ? 140.871 116.639 69.955 1.00 4.52  111 M 1 \nATOM   1721 C  CG   . ASN M  1 112 ? 140.253 117.911 70.489 1.00 4.52  111 M 1 \nATOM   1722 O  OD1  . ASN M  1 112 ? 
139.121 118.212 70.161 1.00 4.52  111 M 1 \nATOM   1723 N  ND2  . ASN M  1 112 ? 140.984 118.639 71.313 1.00 4.52  111 M 1 \nATOM   1724 H  H    . ASN M  1 112 ? 141.351 114.540 68.678 1.00 4.52  111 M 1 \nATOM   1725 H  HA   . ASN M  1 112 ? 139.358 116.369 68.580 1.00 4.52  111 M 1 \nATOM   1726 H  HB2  . ASN M  1 112 ? 140.666 115.899 70.563 1.00 4.52  111 M 1 \nATOM   1727 H  HB3  . ASN M  1 112 ? 141.843 116.744 69.913 1.00 4.52  111 M 1 \nATOM   1728 H  HD21 . ASN M  1 112 ? 141.775 118.347 71.578 1.00 4.52  111 M 1 \nATOM   1729 H  HD22 . ASN M  1 112 ? 140.683 119.419 71.599 1.00 4.52  111 M 1 \nATOM   1730 N  N    . GLN M  1 113 ? 142.141 117.072 67.128 1.00 5.11  112 M 1 \nATOM   1731 C  CA   . GLN M  1 113 ? 142.834 117.940 66.147 1.00 5.11  112 M 1 \nATOM   1732 C  C    . GLN M  1 113 ? 142.073 117.860 64.820 1.00 5.11  112 M 1 \nATOM   1733 O  O    . GLN M  1 113 ? 141.691 118.896 64.332 1.00 5.11  112 M 1 \nATOM   1734 C  CB   . GLN M  1 113 ? 144.297 117.557 65.966 1.00 5.11  112 M 1 \nATOM   1735 C  CG   . GLN M  1 113 ? 145.022 118.572 65.094 1.00 5.11  112 M 1 \nATOM   1736 C  CD   . GLN M  1 113 ? 144.785 119.967 65.611 1.00 5.11  112 M 1 \nATOM   1737 O  OE1  . GLN M  1 113 ? 145.184 120.306 66.717 1.00 5.11  112 M 1 \nATOM   1738 N  NE2  . GLN M  1 113 ? 144.062 120.770 64.847 1.00 5.11  112 M 1 \nATOM   1739 H  H    . GLN M  1 113 ? 142.599 116.316 67.344 1.00 5.11  112 M 1 \nATOM   1740 H  HA   . GLN M  1 113 ? 142.790 118.868 66.475 1.00 5.11  112 M 1 \nATOM   1741 H  HB2  . GLN M  1 113 ? 144.728 117.512 66.845 1.00 5.11  112 M 1 \nATOM   1742 H  HB3  . GLN M  1 113 ? 144.348 116.671 65.551 1.00 5.11  112 M 1 \nATOM   1743 H  HG2  . GLN M  1 113 ? 145.984 118.380 65.094 1.00 5.11  112 M 1 \nATOM   1744 H  HG3  . GLN M  1 113 ? 144.696 118.505 64.171 1.00 5.11  112 M 1 \nATOM   1745 H  HE21 . GLN M  1 113 ? 143.722 120.470 64.088 1.00 5.11  112 M 1 \nATOM   1746 H  HE22 . GLN M  1 113 ? 
143.918 121.606 65.096 1.00 5.11  112 M 1 \nATOM   1747 N  N    . SER M  1 114 ? 141.629 116.668 64.416 0.55 4.90  113 M 1 \nATOM   1748 C  CA   . SER M  1 114 ? 140.863 116.555 63.144 0.55 4.90  113 M 1 \nATOM   1749 C  C    . SER M  1 114 ? 139.536 117.326 63.248 0.55 4.90  113 M 1 \nATOM   1750 O  O    . SER M  1 114 ? 139.168 118.017 62.297 0.55 4.90  113 M 1 \nATOM   1751 C  CB   . SER M  1 114 ? 140.631 115.110 62.773 0.55 4.90  113 M 1 \nATOM   1752 O  OG   . SER M  1 114 ? 139.747 114.492 63.686 0.55 4.90  113 M 1 \nATOM   1753 H  H    . SER M  1 114 ? 141.266 116.108 65.036 0.55 4.90  113 M 1 \nATOM   1754 H  HA   . SER M  1 114 ? 141.406 116.977 62.424 0.55 4.90  113 M 1 \nATOM   1755 H  HB2  . SER M  1 114 ? 140.252 115.063 61.866 0.55 4.90  113 M 1 \nATOM   1756 H  HB3  . SER M  1 114 ? 141.490 114.631 62.771 0.55 4.90  113 M 1 \nATOM   1757 H  HG   . SER M  1 114 ? 139.464 115.080 64.225 0.55 4.90  113 M 1 \nATOM   1758 N  N    . LEU M  1 115 ? 138.859 117.253 64.392 1.00 4.69  114 M 1 \nATOM   1759 C  CA   . LEU M  1 115 ? 137.594 117.954 64.591 1.00 4.69  114 M 1 \nATOM   1760 C  C    . LEU M  1 115 ? 137.776 119.467 64.575 1.00 4.69  114 M 1 \nATOM   1761 O  O    . LEU M  1 115 ? 136.914 120.196 64.076 1.00 4.69  114 M 1 \nATOM   1762 C  CB   . LEU M  1 115 ? 136.965 117.506 65.904 1.00 4.69  114 M 1 \nATOM   1763 C  CG   . LEU M  1 115 ? 136.436 116.074 65.961 1.00 4.69  114 M 1 \nATOM   1764 C  CD1  . LEU M  1 115 ? 136.142 115.718 67.392 1.00 4.69  114 M 1 \nATOM   1765 C  CD2  . LEU M  1 115 ? 135.185 115.889 65.113 1.00 4.69  114 M 1 \nATOM   1766 H  H    . LEU M  1 115 ? 139.121 116.786 65.065 1.00 4.69  114 M 1 \nATOM   1767 H  HA   . LEU M  1 115 ? 136.991 117.729 63.865 1.00 4.69  114 M 1 \nATOM   1768 H  HB2  . LEU M  1 115 ? 137.632 117.597 66.602 1.00 4.69  114 M 1 \nATOM   1769 H  HB3  . LEU M  1 115 ? 136.223 118.099 66.102 1.00 4.69  114 M 1 \nATOM   1770 H  HG   . LEU M  1 115 ? 
137.112 115.463 65.628 1.00 4.69  114 M 1 \nATOM   1771 H  HD11 . LEU M  1 115 ? 135.645 114.886 67.426 1.00 4.69  114 M 1 \nATOM   1772 H  HD12 . LEU M  1 115 ? 136.992 115.614 67.847 1.00 4.69  114 M 1 \nATOM   1773 H  HD13 . LEU M  1 115 ? 135.636 116.432 67.811 1.00 4.69  114 M 1 \nATOM   1774 H  HD21 . LEU M  1 115 ? 135.004 114.939 65.032 1.00 4.69  114 M 1 \nATOM   1775 H  HD22 . LEU M  1 115 ? 134.437 116.323 65.552 1.00 4.69  114 M 1 \nATOM   1776 H  HD23 . LEU M  1 115 ? 135.315 116.259 64.226 1.00 4.69  114 M 1 \nATOM   1777 N  N    . LEU M  1 116 ? 138.878 119.960 65.131 1.00 5.05  115 M 1 \nATOM   1778 C  CA   . LEU M  1 116 ? 139.138 121.397 65.104 1.00 5.05  115 M 1 \nATOM   1779 C  C    . LEU M  1 116 ? 139.387 121.874 63.680 1.00 5.05  115 M 1 \nATOM   1780 O  O    . LEU M  1 116 ? 138.920 122.949 63.282 1.00 5.05  115 M 1 \nATOM   1781 C  CB   . LEU M  1 116 ? 140.322 121.733 66.011 1.00 5.05  115 M 1 \nATOM   1782 C  CG   . LEU M  1 116 ? 140.104 121.561 67.520 1.00 5.05  115 M 1 \nATOM   1783 C  CD1  . LEU M  1 116 ? 141.408 121.733 68.279 1.00 5.05  115 M 1 \nATOM   1784 C  CD2  . LEU M  1 116 ? 139.056 122.534 68.048 1.00 5.05  115 M 1 \nATOM   1785 H  H    . LEU M  1 116 ? 139.484 119.491 65.522 1.00 5.05  115 M 1 \nATOM   1786 H  HA   . LEU M  1 116 ? 138.360 121.870 65.437 1.00 5.05  115 M 1 \nATOM   1787 H  HB2  . LEU M  1 116 ? 141.064 121.161 65.761 1.00 5.05  115 M 1 \nATOM   1788 H  HB3  . LEU M  1 116 ? 140.578 122.655 65.850 1.00 5.05  115 M 1 \nATOM   1789 H  HG   . LEU M  1 116 ? 139.769 120.669 67.702 1.00 5.05  115 M 1 \nATOM   1790 H  HD11 . LEU M  1 116 ? 141.268 121.446 69.195 1.00 5.05  115 M 1 \nATOM   1791 H  HD12 . LEU M  1 116 ? 142.101 121.192 67.870 1.00 5.05  115 M 1 \nATOM   1792 H  HD13 . LEU M  1 116 ? 141.673 122.666 68.255 1.00 5.05  115 M 1 \nATOM   1793 H  HD21 . LEU M  1 116 ? 139.130 122.592 69.013 1.00 5.05  115 M 1 \nATOM   1794 H  HD22 . LEU M  1 116 ? 
139.204 123.408 67.653 1.00 5.05  115 M 1 \nATOM   1795 H  HD23 . LEU M  1 116 ? 138.172 122.210 67.813 1.00 5.05  115 M 1 \nATOM   1796 N  N    . GLU M  1 117 ? 140.102 121.074 62.890 1.00 6.09  116 M 1 \nATOM   1797 C  CA   . GLU M  1 117 ? 140.283 121.391 61.476 1.00 6.09  116 M 1 \nATOM   1798 C  C    . GLU M  1 117 ? 138.942 121.417 60.745 1.00 6.09  116 M 1 \nATOM   1799 O  O    . GLU M  1 117 ? 138.692 122.295 59.908 1.00 6.09  116 M 1 \nATOM   1800 C  CB   . GLU M  1 117 ? 141.244 120.379 60.849 1.00 6.09  116 M 1 \nATOM   1801 C  CG   . GLU M  1 117 ? 142.676 120.511 61.372 1.00 6.09  116 M 1 \nATOM   1802 C  CD   . GLU M  1 117 ? 143.615 119.439 60.848 1.00 6.09  116 M 1 \nATOM   1803 O  OE1  . GLU M  1 117 ? 143.145 118.498 60.174 1.00 6.09  116 M 1 \nATOM   1804 O  OE2  . GLU M  1 117 ? 144.829 119.532 61.124 1.00 6.09  116 M 1 \nATOM   1805 H  H    . GLU M  1 117 ? 140.479 120.343 63.141 1.00 6.09  116 M 1 \nATOM   1806 H  HA   . GLU M  1 117 ? 140.686 122.270 61.398 1.00 6.09  116 M 1 \nATOM   1807 H  HB2  . GLU M  1 117 ? 140.938 119.480 61.047 1.00 6.09  116 M 1 \nATOM   1808 H  HB3  . GLU M  1 117 ? 141.261 120.514 59.889 1.00 6.09  116 M 1 \nATOM   1809 H  HG2  . GLU M  1 117 ? 143.029 121.370 61.094 1.00 6.09  116 M 1 \nATOM   1810 H  HG3  . GLU M  1 117 ? 142.679 120.468 62.341 1.00 6.09  116 M 1 \nATOM   1811 N  N    . LEU M  1 118 ? 138.050 120.493 61.095 1.00 5.44  117 M 1 \nATOM   1812 C  CA   . LEU M  1 118 ? 136.683 120.381 60.513 1.00 5.44  117 M 1 \nATOM   1813 C  C    . LEU M  1 118 ? 135.896 121.645 60.854 1.00 5.44  117 M 1 \nATOM   1814 O  O    . LEU M  1 118 ? 135.268 122.209 59.984 1.00 5.44  117 M 1 \nATOM   1815 C  CB   . LEU M  1 118 ? 136.001 119.162 61.135 1.00 5.44  117 M 1 \nATOM   1816 C  CG   . LEU M  1 118 ? 135.154 118.291 60.216 1.00 5.44  117 M 1 \nATOM   1817 C  CD1  . LEU M  1 118 ? 134.146 117.487 61.035 1.00 5.44  117 M 1 \nATOM   1818 C  CD2  . LEU M  1 118 ? 
134.466 119.108 59.137 1.00 5.44  117 M 1 \nATOM   1819 H  H    . LEU M  1 118 ? 138.182 119.944 61.808 1.00 5.44  117 M 1 \nATOM   1820 H  HA   . LEU M  1 118 ? 136.748 120.280 59.536 1.00 5.44  117 M 1 \nATOM   1821 H  HB2  . LEU M  1 118 ? 136.695 118.598 61.532 1.00 5.44  117 M 1 \nATOM   1822 H  HB3  . LEU M  1 118 ? 135.431 119.476 61.865 1.00 5.44  117 M 1 \nATOM   1823 H  HG   . LEU M  1 118 ? 135.758 117.649 59.768 1.00 5.44  117 M 1 \nATOM   1824 H  HD11 . LEU M  1 118 ? 134.618 116.943 61.689 1.00 5.44  117 M 1 \nATOM   1825 H  HD12 . LEU M  1 118 ? 133.634 116.908 60.443 1.00 5.44  117 M 1 \nATOM   1826 H  HD13 . LEU M  1 118 ? 133.542 118.095 61.495 1.00 5.44  117 M 1 \nATOM   1827 H  HD21 . LEU M  1 118 ? 133.946 118.518 58.565 1.00 5.44  117 M 1 \nATOM   1828 H  HD22 . LEU M  1 118 ? 133.876 119.761 59.551 1.00 5.44  117 M 1 \nATOM   1829 H  HD23 . LEU M  1 118 ? 135.136 119.569 58.602 1.00 5.44  117 M 1 \nATOM   1830 N  N    . HIS M  1 119 ? 135.947 122.064 62.122 1.00 5.74  118 M 1 \nATOM   1831 C  CA   . HIS M  1 119 ? 135.252 123.284 62.608 1.00 5.74  118 M 1 \nATOM   1832 C  C    . HIS M  1 119 ? 135.812 124.508 61.869 1.00 5.74  118 M 1 \nATOM   1833 O  O    . HIS M  1 119 ? 135.030 125.369 61.545 1.00 5.74  118 M 1 \nATOM   1834 C  CB   . HIS M  1 119 ? 135.357 123.419 64.135 1.00 5.74  118 M 1 \nATOM   1835 C  CG   . HIS M  1 119 ? 134.535 124.536 64.685 1.00 5.74  118 M 1 \nATOM   1836 N  ND1  . HIS M  1 119 ? 134.975 125.837 64.658 1.00 5.74  118 M 1 \nATOM   1837 C  CD2  . HIS M  1 119 ? 133.302 124.564 65.235 1.00 5.74  118 M 1 \nATOM   1838 C  CE1  . HIS M  1 119 ? 134.060 126.618 65.183 1.00 5.74  118 M 1 \nATOM   1839 N  NE2  . HIS M  1 119 ? 133.035 125.861 65.563 1.00 5.74  118 M 1 \nATOM   1840 H  H    . HIS M  1 119 ? 136.410 121.635 62.778 1.00 5.74  118 M 1 \nATOM   1841 H  HA   . HIS M  1 119 ? 134.298 123.198 62.373 1.00 5.74  118 M 1 \nATOM   1842 H  HB2  . HIS M  1 119 ? 
135.068 122.576 64.550 1.00 5.74  118 M 1 \nATOM   1843 H  HB3  . HIS M  1 119 ? 136.298 123.565 64.378 1.00 5.74  118 M 1 \nATOM   1844 H  HD1  . HIS M  1 119 ? 135.747 126.104 64.341 1.00 5.74  118 M 1 \nATOM   1845 H  HD2  . HIS M  1 119 ? 132.745 123.826 65.397 1.00 5.74  118 M 1 \nATOM   1846 H  HE1  . HIS M  1 119 ? 134.129 127.551 65.291 1.00 5.74  118 M 1 \nATOM   1847 H  HE2  . HIS M  1 119 ? 132.296 126.153 65.935 1.00 5.74  118 M 1 \nATOM   1848 N  N    . LYS M  1 120 ? 137.117 124.588 61.642 1.00 6.94  119 M 1 \nATOM   1849 C  CA   . LYS M  1 120 ? 137.704 125.731 60.953 1.00 6.94  119 M 1 \nATOM   1850 C  C    . LYS M  1 120 ? 137.252 125.769 59.501 1.00 6.94  119 M 1 \nATOM   1851 O  O    . LYS M  1 120 ? 136.968 126.841 58.957 1.00 6.94  119 M 1 \nATOM   1852 C  CB   . LYS M  1 120 ? 139.226 125.668 61.063 1.00 6.94  119 M 1 \nATOM   1853 C  CG   . LYS M  1 120 ? 139.965 126.875 60.528 1.00 6.94  119 M 1 \nATOM   1854 C  CD   . LYS M  1 120 ? 141.474 126.717 60.664 1.00 6.94  119 M 1 \nATOM   1855 C  CE   . LYS M  1 120 ? 141.924 126.836 62.124 1.00 6.94  119 M 1 \nATOM   1856 N  NZ   . LYS M  1 120 ? 143.405 126.855 62.278 1.00 6.94  119 M 1 \nATOM   1857 H  H    . LYS M  1 120 ? 137.682 123.981 61.870 1.00 6.94  119 M 1 \nATOM   1858 H  HA   . LYS M  1 120 ? 137.406 126.548 61.382 1.00 6.94  119 M 1 \nATOM   1859 H  HB2  . LYS M  1 120 ? 139.445 125.586 62.004 1.00 6.94  119 M 1 \nATOM   1860 H  HB3  . LYS M  1 120 ? 139.553 124.888 60.587 1.00 6.94  119 M 1 \nATOM   1861 H  HG2  . LYS M  1 120 ? 139.763 126.981 59.585 1.00 6.94  119 M 1 \nATOM   1862 H  HG3  . LYS M  1 120 ? 139.697 127.666 61.021 1.00 6.94  119 M 1 \nATOM   1863 H  HD2  . LYS M  1 120 ? 141.736 125.844 60.333 1.00 6.94  119 M 1 \nATOM   1864 H  HD3  . LYS M  1 120 ? 141.916 127.413 60.152 1.00 6.94  119 M 1 \nATOM   1865 H  HE2  . LYS M  1 120 ? 141.562 127.647 62.515 1.00 6.94  119 M 1 \nATOM   1866 H  HE3  . LYS M  1 120 ? 
141.600 126.065 62.615 1.00 6.94  119 M 1 \nATOM   1867 H  HZ1  . LYS M  1 120 ? 143.619 127.107 63.104 1.00 6.94  119 M 1 \nATOM   1868 H  HZ2  . LYS M  1 120 ? 143.740 126.045 62.127 1.00 6.94  119 M 1 \nATOM   1869 H  HZ3  . LYS M  1 120 ? 143.762 127.429 61.699 1.00 6.94  119 M 1 \nATOM   1870 N  N    . LEU M  1 121 ? 137.154 124.601 58.866 1.00 6.89  120 M 1 \nATOM   1871 C  CA   . LEU M  1 121 ? 136.638 124.530 57.503 1.00 6.89  120 M 1 \nATOM   1872 C  C    . LEU M  1 121 ? 135.186 124.986 57.441 1.00 6.89  120 M 1 \nATOM   1873 O  O    . LEU M  1 121 ? 134.803 125.757 56.555 1.00 6.89  120 M 1 \nATOM   1874 C  CB   . LEU M  1 121 ? 136.786 123.102 56.978 1.00 6.89  120 M 1 \nATOM   1875 C  CG   . LEU M  1 121 ? 136.318 122.766 55.565 1.00 6.89  120 M 1 \nATOM   1876 C  CD1  . LEU M  1 121 ? 137.080 123.577 54.538 1.00 6.89  120 M 1 \nATOM   1877 C  CD2  . LEU M  1 121 ? 136.493 121.280 55.308 1.00 6.89  120 M 1 \nATOM   1878 H  H    . LEU M  1 121 ? 137.359 123.837 59.205 1.00 6.89  120 M 1 \nATOM   1879 H  HA   . LEU M  1 121 ? 137.162 125.118 56.936 1.00 6.89  120 M 1 \nATOM   1880 H  HB2  . LEU M  1 121 ? 137.730 122.882 57.011 1.00 6.89  120 M 1 \nATOM   1881 H  HB3  . LEU M  1 121 ? 136.308 122.511 57.580 1.00 6.89  120 M 1 \nATOM   1882 H  HG   . LEU M  1 121 ? 135.373 122.969 55.487 1.00 6.89  120 M 1 \nATOM   1883 H  HD11 . LEU M  1 121 ? 136.899 123.221 53.654 1.00 6.89  120 M 1 \nATOM   1884 H  HD12 . LEU M  1 121 ? 136.791 124.502 54.586 1.00 6.89  120 M 1 \nATOM   1885 H  HD13 . LEU M  1 121 ? 138.029 123.518 54.730 1.00 6.89  120 M 1 \nATOM   1886 H  HD21 . LEU M  1 121 ? 136.305 121.089 54.376 1.00 6.89  120 M 1 \nATOM   1887 H  HD22 . LEU M  1 121 ? 137.408 121.035 55.519 1.00 6.89  120 M 1 \nATOM   1888 H  HD23 . LEU M  1 121 ? 135.882 120.783 55.875 1.00 6.89  120 M 1 \nATOM   1889 N  N    . ALA M  1 122 ? 134.366 124.518 58.380 1.00 6.56  121 M 1 \nATOM   1890 C  CA   . ALA M  1 122 ? 
132.956 124.884 58.403 1.00 6.56  121 M 1 \nATOM   1891 C  C    . ALA M  1 122 ? 132.772 126.373 58.681 1.00 6.56  121 M 1 \nATOM   1892 O  O    . ALA M  1 122 ? 131.834 126.996 58.172 1.00 6.56  121 M 1 \nATOM   1893 C  CB   . ALA M  1 122 ? 132.228 124.038 59.443 1.00 6.56  121 M 1 \nATOM   1894 H  H    . ALA M  1 122 ? 134.599 123.980 59.009 1.00 6.56  121 M 1 \nATOM   1895 H  HA   . ALA M  1 122 ? 132.566 124.688 57.537 1.00 6.56  121 M 1 \nATOM   1896 H  HB1  . ALA M  1 122 ? 131.302 124.321 59.497 1.00 6.56  121 M 1 \nATOM   1897 H  HB2  . ALA M  1 122 ? 132.279 123.107 59.175 1.00 6.56  121 M 1 \nATOM   1898 H  HB3  . ALA M  1 122 ? 132.657 124.155 60.305 1.00 6.56  121 M 1 \nATOM   1899 N  N    . THR M  1 123 ? 133.659 126.961 59.484 1.00 7.31  122 M 1 \nATOM   1900 C  CA   . THR M  1 123 ? 133.606 128.398 59.721 1.00 7.31  122 M 1 \nATOM   1901 C  C    . THR M  1 123 ? 134.046 129.166 58.482 1.00 7.31  122 M 1 \nATOM   1902 O  O    . THR M  1 123 ? 133.495 130.227 58.173 1.00 7.31  122 M 1 \nATOM   1903 C  CB   . THR M  1 123 ? 134.470 128.769 60.928 1.00 7.31  122 M 1 \nATOM   1904 O  OG1  . THR M  1 123 ? 133.960 128.120 62.097 1.00 7.31  122 M 1 \nATOM   1905 C  CG2  . THR M  1 123 ? 134.483 130.277 61.145 1.00 7.31  122 M 1 \nATOM   1906 H  H    . THR M  1 123 ? 134.302 126.556 59.886 1.00 7.31  122 M 1 \nATOM   1907 H  HA   . THR M  1 123 ? 132.694 128.650 59.934 1.00 7.31  122 M 1 \nATOM   1908 H  HB   . THR M  1 123 ? 135.385 128.481 60.782 1.00 7.31  122 M 1 \nATOM   1909 H  HG1  . THR M  1 123 ? 133.261 127.701 61.895 1.00 7.31  122 M 1 \nATOM   1910 H  HG21 . THR M  1 123 ? 134.748 130.484 62.055 1.00 7.31  122 M 1 \nATOM   1911 H  HG22 . THR M  1 123 ? 135.113 130.697 60.539 1.00 7.31  122 M 1 \nATOM   1912 H  HG23 . THR M  1 123 ? 133.599 130.644 60.988 1.00 7.31  122 M 1 \nATOM   1913 N  N    . ASP M  1 124 ? 135.030 128.636 57.753 1.00 8.30  123 M 1 \nATOM   1914 C  CA   . ASP M  1 124 ? 
135.501 129.298 56.541 1.00 8.30  123 M 1 \nATOM   1915 C  C    . ASP M  1 124 ? 134.428 129.291 55.460 1.00 8.30  123 M 1 \nATOM   1916 O  O    . ASP M  1 124 ? 134.339 130.227 54.657 1.00 8.30  123 M 1 \nATOM   1917 C  CB   . ASP M  1 124 ? 136.770 128.620 56.028 1.00 8.30  123 M 1 \nATOM   1918 C  CG   . ASP M  1 124 ? 137.366 129.322 54.822 1.00 8.30  123 M 1 \nATOM   1919 O  OD1  . ASP M  1 124 ? 136.811 130.351 54.385 1.00 8.30  123 M 1 \nATOM   1920 O  OD2  . ASP M  1 124 ? 138.392 128.834 54.304 1.00 8.30  123 M 1 \nATOM   1921 H  H    . ASP M  1 124 ? 135.429 127.895 57.930 1.00 8.30  123 M 1 \nATOM   1922 H  HA   . ASP M  1 124 ? 135.715 130.220 56.753 1.00 8.30  123 M 1 \nATOM   1923 H  HB2  . ASP M  1 124 ? 137.433 128.611 56.737 1.00 8.30  123 M 1 \nATOM   1924 H  HB3  . ASP M  1 124 ? 136.561 127.710 55.765 1.00 8.30  123 M 1 \nATOM   1925 N  N    . LYS M  1 125 ? 133.639 128.218 55.448 1.00 7.98  124 M 1 \nATOM   1926 C  CA   . LYS M  1 125 ? 132.537 127.992 54.479 1.00 7.98  124 M 1 \nATOM   1927 C  C    . LYS M  1 125 ? 131.232 128.616 54.993 1.00 7.98  124 M 1 \nATOM   1928 O  O    . LYS M  1 125 ? 130.244 128.495 54.287 1.00 7.98  124 M 1 \nATOM   1929 C  CB   . LYS M  1 125 ? 132.390 126.495 54.199 1.00 7.98  124 M 1 \nATOM   1930 C  CG   . LYS M  1 125 ? 133.616 125.856 53.570 1.00 7.98  124 M 1 \nATOM   1931 C  CD   . LYS M  1 125 ? 134.148 126.682 52.423 1.00 7.98  124 M 1 \nATOM   1932 C  CE   . LYS M  1 125 ? 135.243 126.000 51.635 1.00 7.98  124 M 1 \nATOM   1933 N  NZ   . LYS M  1 125 ? 135.481 126.687 50.345 1.00 7.98  124 M 1 \nATOM   1934 H  H    . LYS M  1 125 ? 133.694 127.571 56.087 1.00 7.98  124 M 1 \nATOM   1935 H  HA   . LYS M  1 125 ? 132.780 128.441 53.637 1.00 7.98  124 M 1 \nATOM   1936 H  HB2  . LYS M  1 125 ? 132.195 126.037 55.044 1.00 7.98  124 M 1 \nATOM   1937 H  HB3  . LYS M  1 125 ? 131.625 126.363 53.602 1.00 7.98  124 M 1 \nATOM   1938 H  HG2  . LYS M  1 125 ? 
134.314 125.758 54.252 1.00 7.98  124 M 1 \nATOM   1939 H  HG3  . LYS M  1 125 ? 133.380 124.961 53.244 1.00 7.98  124 M 1 \nATOM   1940 H  HD2  . LYS M  1 125 ? 133.408 126.894 51.815 1.00 7.98  124 M 1 \nATOM   1941 H  HD3  . LYS M  1 125 ? 134.496 127.528 52.777 1.00 7.98  124 M 1 \nATOM   1942 H  HE2  . LYS M  1 125 ? 136.069 126.000 52.154 1.00 7.98  124 M 1 \nATOM   1943 H  HE3  . LYS M  1 125 ? 134.993 125.073 51.461 1.00 7.98  124 M 1 \nATOM   1944 H  HZ1  . LYS M  1 125 ? 136.152 126.274 49.896 1.00 7.98  124 M 1 \nATOM   1945 H  HZ2  . LYS M  1 125 ? 134.728 126.664 49.841 1.00 7.98  124 M 1 \nATOM   1946 H  HZ3  . LYS M  1 125 ? 135.712 127.551 50.495 1.00 7.98  124 M 1 \nATOM   1947 N  N    . ASN M  1 126 ? 131.229 129.276 56.154 1.00 8.52  125 M 1 \nATOM   1948 C  CA   . ASN M  1 126 ? 130.015 129.901 56.741 1.00 8.52  125 M 1 \nATOM   1949 C  C    . ASN M  1 126 ? 128.888 128.867 56.820 1.00 8.52  125 M 1 \nATOM   1950 O  O    . ASN M  1 126 ? 127.810 129.160 56.312 1.00 8.52  125 M 1 \nATOM   1951 C  CB   . ASN M  1 126 ? 129.529 131.135 55.978 1.00 8.52  125 M 1 \nATOM   1952 C  CG   . ASN M  1 126 ? 130.525 132.269 56.008 1.00 8.52  125 M 1 \nATOM   1953 O  OD1  . ASN M  1 126 ? 130.814 132.840 54.977 1.00 8.52  125 M 1 \nATOM   1954 N  ND2  . ASN M  1 126 ? 131.085 132.562 57.168 1.00 8.52  125 M 1 \nATOM   1955 H  H    . ASN M  1 126 ? 131.987 129.495 56.603 1.00 8.52  125 M 1 \nATOM   1956 H  HA   . ASN M  1 126 ? 130.235 130.189 57.658 1.00 8.52  125 M 1 \nATOM   1957 H  HB2  . ASN M  1 126 ? 129.357 130.885 55.047 1.00 8.52  125 M 1 \nATOM   1958 H  HB3  . ASN M  1 126 ? 128.685 131.439 56.371 1.00 8.52  125 M 1 \nATOM   1959 H  HD21 . ASN M  1 126 ? 130.925 132.059 57.876 1.00 8.52  125 M 1 \nATOM   1960 H  HD22 . ASN M  1 126 ? 131.621 133.262 57.235 1.00 8.52  125 M 1 \nATOM   1961 N  N    . ASP M  1 127 ? 129.169 127.682 57.357 1.00 6.70  126 M 1 \nATOM   1962 C  CA   . ASP M  1 127 ? 
128.151 126.617 57.571 1.00 6.70  126 M 1 \nATOM   1963 C  C    . ASP M  1 127 ? 127.847 126.621 59.071 1.00 6.70  126 M 1 \nATOM   1964 O  O    . ASP M  1 127 ? 128.430 125.802 59.748 1.00 6.70  126 M 1 \nATOM   1965 C  CB   . ASP M  1 127 ? 128.649 125.263 57.062 1.00 6.70  126 M 1 \nATOM   1966 C  CG   . ASP M  1 127 ? 127.592 124.162 57.047 1.00 6.70  126 M 1 \nATOM   1967 O  OD1  . ASP M  1 127 ? 126.669 124.198 57.869 1.00 6.70  126 M 1 \nATOM   1968 O  OD2  . ASP M  1 127 ? 127.711 123.274 56.207 1.00 6.70  126 M 1 \nATOM   1969 H  H    . ASP M  1 127 ? 130.003 127.458 57.645 1.00 6.70  126 M 1 \nATOM   1970 H  HA   . ASP M  1 127 ? 127.350 126.846 57.064 1.00 6.70  126 M 1 \nATOM   1971 H  HB2  . ASP M  1 127 ? 128.987 125.374 56.150 1.00 6.70  126 M 1 \nATOM   1972 H  HB3  . ASP M  1 127 ? 129.391 124.967 57.628 1.00 6.70  126 M 1 \nATOM   1973 N  N    . PRO M  1 128 ? 126.965 127.479 59.619 1.00 5.77  127 M 1 \nATOM   1974 C  CA   . PRO M  1 128 ? 126.741 127.524 61.065 1.00 5.77  127 M 1 \nATOM   1975 C  C    . PRO M  1 128 ? 126.225 126.213 61.679 1.00 5.77  127 M 1 \nATOM   1976 O  O    . PRO M  1 128 ? 126.600 125.891 62.754 1.00 5.77  127 M 1 \nATOM   1977 C  CB   . PRO M  1 128 ? 125.692 128.634 61.255 1.00 5.77  127 M 1 \nATOM   1978 C  CG   . PRO M  1 128 ? 125.083 128.814 59.877 1.00 5.77  127 M 1 \nATOM   1979 C  CD   . PRO M  1 128 ? 126.196 128.501 58.906 1.00 5.77  127 M 1 \nATOM   1980 H  HA   . PRO M  1 128 ? 127.581 127.794 61.513 1.00 5.77  127 M 1 \nATOM   1981 H  HB2  . PRO M  1 128 ? 125.010 128.365 61.906 1.00 5.77  127 M 1 \nATOM   1982 H  HB3  . PRO M  1 128 ? 126.113 129.466 61.561 1.00 5.77  127 M 1 \nATOM   1983 H  HG2  . PRO M  1 128 ? 124.330 128.202 59.749 1.00 5.77  127 M 1 \nATOM   1984 H  HG3  . PRO M  1 128 ? 124.766 129.732 59.755 1.00 5.77  127 M 1 \nATOM   1985 H  HD2  . PRO M  1 128 ? 125.845 128.154 58.065 1.00 5.77  127 M 1 \nATOM   1986 H  HD3  . PRO M  1 128 ? 
126.741 129.289 58.725 1.00 5.77  127 M 1 \nATOM   1987 N  N    . HIS M  1 129 ? 125.348 125.514 60.982 1.00 5.02  128 M 1 \nATOM   1988 C  CA   . HIS M  1 129 ? 124.765 124.273 61.476 1.00 5.02  128 M 1 \nATOM   1989 C  C    . HIS M  1 129 ? 125.834 123.227 61.751 1.00 5.02  128 M 1 \nATOM   1990 O  O    . HIS M  1 129 ? 125.834 122.585 62.805 1.00 5.02  128 M 1 \nATOM   1991 C  CB   . HIS M  1 129 ? 123.744 123.740 60.480 1.00 5.02  128 M 1 \nATOM   1992 C  CG   . HIS M  1 129 ? 123.184 122.415 60.872 1.00 5.02  128 M 1 \nATOM   1993 N  ND1  . HIS M  1 129 ? 123.741 121.229 60.452 1.00 5.02  128 M 1 \nATOM   1994 C  CD2  . HIS M  1 129 ? 122.173 122.082 61.706 1.00 5.02  128 M 1 \nATOM   1995 C  CE1  . HIS M  1 129 ? 123.067 120.221 60.972 1.00 5.02  128 M 1 \nATOM   1996 N  NE2  . HIS M  1 129 ? 122.113 120.712 61.739 1.00 5.02  128 M 1 \nATOM   1997 H  H    . HIS M  1 129 ? 125.099 125.746 60.192 1.00 5.02  128 M 1 \nATOM   1998 H  HA   . HIS M  1 129 ? 124.296 124.455 62.305 1.00 5.02  128 M 1 \nATOM   1999 H  HB2  . HIS M  1 129 ? 123.005 124.365 60.417 1.00 5.02  128 M 1 \nATOM   2000 H  HB3  . HIS M  1 129 ? 124.156 123.652 59.606 1.00 5.02  128 M 1 \nATOM   2001 H  HD2  . HIS M  1 129 ? 121.611 122.670 62.158 1.00 5.02  128 M 1 \nATOM   2002 H  HE1  . HIS M  1 129 ? 123.240 119.319 60.828 1.00 5.02  128 M 1 \nATOM   2003 H  HE2  . HIS M  1 129 ? 121.547 120.247 62.189 1.00 5.02  128 M 1 \nATOM   2004 N  N    . LEU M  1 130 ? 126.756 123.052 60.813 1.00 5.28  129 M 1 \nATOM   2005 C  CA   . LEU M  1 130 ? 127.830 122.084 60.980 1.00 5.28  129 M 1 \nATOM   2006 C  C    . LEU M  1 130 ? 128.739 122.462 62.142 1.00 5.28  129 M 1 \nATOM   2007 O  O    . LEU M  1 130 ? 129.133 121.600 62.940 1.00 5.28  129 M 1 \nATOM   2008 C  CB   . LEU M  1 130 ? 128.616 121.985 59.676 1.00 5.28  129 M 1 \nATOM   2009 C  CG   . LEU M  1 130 ? 129.788 121.014 59.622 1.00 5.28  129 M 1 \nATOM   2010 C  CD1  . LEU M  1 130 ? 
129.324 119.615 59.936 1.00 5.28  129 M 1 \nATOM   2011 C  CD2  . LEU M  1 130 ? 130.428 121.058 58.252 1.00 5.28  129 M 1 \nATOM   2012 H  H    . LEU M  1 130 ? 126.778 123.490 60.073 1.00 5.28  129 M 1 \nATOM   2013 H  HA   . LEU M  1 130 ? 127.435 121.218 61.169 1.00 5.28  129 M 1 \nATOM   2014 H  HB2  . LEU M  1 130 ? 128.001 121.743 58.966 1.00 5.28  129 M 1 \nATOM   2015 H  HB3  . LEU M  1 130 ? 128.971 122.866 59.479 1.00 5.28  129 M 1 \nATOM   2016 H  HG   . LEU M  1 130 ? 130.459 121.278 60.271 1.00 5.28  129 M 1 \nATOM   2017 H  HD11 . LEU M  1 130 ? 129.948 118.980 59.550 1.00 5.28  129 M 1 \nATOM   2018 H  HD12 . LEU M  1 130 ? 129.297 119.505 60.899 1.00 5.28  129 M 1 \nATOM   2019 H  HD13 . LEU M  1 130 ? 128.439 119.477 59.562 1.00 5.28  129 M 1 \nATOM   2020 H  HD21 . LEU M  1 130 ? 131.261 120.562 58.278 1.00 5.28  129 M 1 \nATOM   2021 H  HD22 . LEU M  1 130 ? 129.823 120.652 57.612 1.00 5.28  129 M 1 \nATOM   2022 H  HD23 . LEU M  1 130 ? 130.597 121.979 57.999 1.00 5.28  129 M 1 \nATOM   2023 N  N    . CYS M  1 131 ? 129.088 123.745 62.240 1.00 5.91  130 M 1 \nATOM   2024 C  CA   . CYS M  1 131 ? 129.904 124.227 63.347 1.00 5.91  130 M 1 \nATOM   2025 C  C    . CYS M  1 131 ? 129.253 123.901 64.682 1.00 5.91  130 M 1 \nATOM   2026 O  O    . CYS M  1 131 ? 129.891 123.335 65.574 1.00 5.91  130 M 1 \nATOM   2027 C  CB   . CYS M  1 131 ? 130.131 125.729 63.203 1.00 5.91  130 M 1 \nATOM   2028 S  SG   . CYS M  1 131 ? 131.134 126.159 61.782 1.00 5.91  130 M 1 \nATOM   2029 H  H    . CYS M  1 131 ? 128.856 124.353 61.678 1.00 5.91  130 M 1 \nATOM   2030 H  HA   . CYS M  1 131 ? 130.777 123.805 63.314 1.00 5.91  130 M 1 \nATOM   2031 H  HB2  . CYS M  1 131 ? 129.273 126.171 63.104 1.00 5.91  130 M 1 \nATOM   2032 H  HB3  . CYS M  1 131 ? 130.578 126.060 63.998 1.00 5.91  130 M 1 \nATOM   2033 H  HG   . CYS M  1 131 ? 130.449 126.104 60.798 1.00 5.91  130 M 1 \nATOM   2034 N  N    . ASP M  1 132 ? 
127.967 124.217 64.820 1.00 5.48  131 M 1 \nATOM   2035 C  CA   . ASP M  1 132 ? 127.281 123.991 66.084 1.00 5.48  131 M 1 \nATOM   2036 C  C    . ASP M  1 132 ? 127.145 122.505 66.376 1.00 5.48  131 M 1 \nATOM   2037 O  O    . ASP M  1 132 ? 127.222 122.085 67.531 1.00 5.48  131 M 1 \nATOM   2038 C  CB   . ASP M  1 132 ? 125.909 124.656 66.064 1.00 5.48  131 M 1 \nATOM   2039 C  CG   . ASP M  1 132 ? 125.215 124.578 67.402 1.00 5.48  131 M 1 \nATOM   2040 O  OD1  . ASP M  1 132 ? 125.634 125.300 68.328 1.00 5.48  131 M 1 \nATOM   2041 O  OD2  . ASP M  1 132 ? 124.254 123.795 67.528 1.00 5.48  131 M 1 \nATOM   2042 H  H    . ASP M  1 132 ? 127.475 124.553 64.200 1.00 5.48  131 M 1 \nATOM   2043 H  HA   . ASP M  1 132 ? 127.803 124.396 66.794 1.00 5.48  131 M 1 \nATOM   2044 H  HB2  . ASP M  1 132 ? 126.005 125.590 65.820 1.00 5.48  131 M 1 \nATOM   2045 H  HB3  . ASP M  1 132 ? 125.348 124.203 65.415 1.00 5.48  131 M 1 \nATOM   2046 N  N    . PHE M  1 133 ? 126.935 121.698 65.339 1.00 4.96  132 M 1 \nATOM   2047 C  CA   . PHE M  1 133 ? 126.879 120.250 65.500 1.00 4.96  132 M 1 \nATOM   2048 C  C    . PHE M  1 133 ? 128.176 119.716 66.096 1.00 4.96  132 M 1 \nATOM   2049 O  O    . PHE M  1 133 ? 128.164 118.980 67.093 1.00 4.96  132 M 1 \nATOM   2050 C  CB   . PHE M  1 133 ? 126.616 119.617 64.138 1.00 4.96  132 M 1 \nATOM   2051 C  CG   . PHE M  1 133 ? 126.460 118.140 64.172 1.00 4.96  132 M 1 \nATOM   2052 C  CD1  . PHE M  1 133 ? 125.267 117.579 64.563 1.00 4.96  132 M 1 \nATOM   2053 C  CD2  . PHE M  1 133 ? 127.501 117.309 63.819 1.00 4.96  132 M 1 \nATOM   2054 C  CE1  . PHE M  1 133 ? 125.111 116.227 64.590 1.00 4.96  132 M 1 \nATOM   2055 C  CE2  . PHE M  1 133 ? 127.340 115.952 63.850 1.00 4.96  132 M 1 \nATOM   2056 C  CZ   . PHE M  1 133 ? 126.146 115.419 64.239 1.00 4.96  132 M 1 \nATOM   2057 H  H    . PHE M  1 133 ? 126.826 121.970 64.531 1.00 4.96  132 M 1 \nATOM   2058 H  HA   . PHE M  1 133 ? 
126.144 120.020 66.090 1.00 4.96  132 M 1 \nATOM   2059 H  HB2  . PHE M  1 133 ? 125.790 119.981 63.782 1.00 4.96  132 M 1 \nATOM   2060 H  HB3  . PHE M  1 133 ? 127.343 119.833 63.533 1.00 4.96  132 M 1 \nATOM   2061 H  HD1  . PHE M  1 133 ? 124.556 118.129 64.802 1.00 4.96  132 M 1 \nATOM   2062 H  HD2  . PHE M  1 133 ? 128.317 117.667 63.553 1.00 4.96  132 M 1 \nATOM   2063 H  HE1  . PHE M  1 133 ? 124.299 115.859 64.854 1.00 4.96  132 M 1 \nATOM   2064 H  HE2  . PHE M  1 133 ? 128.043 115.393 63.610 1.00 4.96  132 M 1 \nATOM   2065 H  HZ   . PHE M  1 133 ? 126.034 114.496 64.259 1.00 4.96  132 M 1 \nATOM   2066 N  N    . ILE M  1 134 ? 129.305 120.104 65.501 1.00 5.03  133 M 1 \nATOM   2067 C  CA   . ILE M  1 134 ? 130.616 119.674 65.982 1.00 5.03  133 M 1 \nATOM   2068 C  C    . ILE M  1 134 ? 130.840 120.153 67.413 1.00 5.03  133 M 1 \nATOM   2069 O  O    . ILE M  1 134 ? 131.305 119.397 68.272 1.00 5.03  133 M 1 \nATOM   2070 C  CB   . ILE M  1 134 ? 131.719 120.176 65.028 1.00 5.03  133 M 1 \nATOM   2071 C  CG1  . ILE M  1 134 ? 131.577 119.558 63.624 1.00 5.03  133 M 1 \nATOM   2072 C  CG2  . ILE M  1 134 ? 133.105 119.929 65.596 1.00 5.03  133 M 1 \nATOM   2073 C  CD1  . ILE M  1 134 ? 131.748 118.039 63.534 1.00 5.03  133 M 1 \nATOM   2074 H  H    . ILE M  1 134 ? 129.335 120.630 64.821 1.00 5.03  133 M 1 \nATOM   2075 H  HA   . ILE M  1 134 ? 130.642 118.704 65.994 1.00 5.03  133 M 1 \nATOM   2076 H  HB   . ILE M  1 134 ? 131.619 121.137 64.938 1.00 5.03  133 M 1 \nATOM   2077 H  HG12 . ILE M  1 134 ? 130.691 119.745 63.277 1.00 5.03  133 M 1 \nATOM   2078 H  HG13 . ILE M  1 134 ? 132.226 119.978 63.038 1.00 5.03  133 M 1 \nATOM   2079 H  HG21 . ILE M  1 134 ? 133.751 120.040 64.881 1.00 5.03  133 M 1 \nATOM   2080 H  HG22 . ILE M  1 134 ? 133.296 120.575 66.294 1.00 5.03  133 M 1 \nATOM   2081 H  HG23 . ILE M  1 134 ? 133.155 119.026 65.946 1.00 5.03  133 M 1 \nATOM   2082 H  HD11 . ILE M  1 134 ? 
131.674 117.779 62.602 1.00 5.03  133 M 1 \nATOM   2083 H  HD12 . ILE M  1 134 ? 132.622 117.784 63.869 1.00 5.03  133 M 1 \nATOM   2084 H  HD13 . ILE M  1 134 ? 131.051 117.593 64.041 1.00 5.03  133 M 1 \nATOM   2085 N  N    . GLU M  1 135 ? 130.489 121.403 67.667 1.00 5.70  134 M 1 \nATOM   2086 C  CA   . GLU M  1 135 ? 130.686 122.013 69.003 1.00 5.70  134 M 1 \nATOM   2087 C  C    . GLU M  1 135 ? 129.853 121.255 70.039 1.00 5.70  134 M 1 \nATOM   2088 O  O    . GLU M  1 135 ? 130.444 120.817 71.036 1.00 5.70  134 M 1 \nATOM   2089 C  CB   . GLU M  1 135 ? 130.277 123.487 68.999 1.00 5.70  134 M 1 \nATOM   2090 C  CG   . GLU M  1 135 ? 131.234 124.397 68.267 1.00 5.70  134 M 1 \nATOM   2091 C  CD   . GLU M  1 135 ? 130.626 125.767 68.005 1.00 5.70  134 M 1 \nATOM   2092 O  OE1  . GLU M  1 135 ? 129.620 126.068 68.646 1.00 5.70  134 M 1 \nATOM   2093 O  OE2  . GLU M  1 135 ? 131.138 126.504 67.151 1.00 5.70  134 M 1 \nATOM   2094 H  H    . GLU M  1 135 ? 129.997 121.908 67.091 1.00 5.70  134 M 1 \nATOM   2095 H  HA   . GLU M  1 135 ? 131.639 121.943 69.245 1.00 5.70  134 M 1 \nATOM   2096 H  HB2  . GLU M  1 135 ? 129.391 123.562 68.586 1.00 5.70  134 M 1 \nATOM   2097 H  HB3  . GLU M  1 135 ? 130.200 123.790 69.927 1.00 5.70  134 M 1 \nATOM   2098 H  HG2  . GLU M  1 135 ? 132.051 124.508 68.798 1.00 5.70  134 M 1 \nATOM   2099 H  HG3  . GLU M  1 135 ? 131.482 123.989 67.409 1.00 5.70  134 M 1 \nATOM   2100 N  N    . THR M  1 136 ? 128.607 120.926 69.710 1.00 5.69  135 M 1 \nATOM   2101 C  CA   . THR M  1 136 ? 127.648 120.409 70.673 1.00 5.69  135 M 1 \nATOM   2102 C  C    . THR M  1 136 ? 127.901 118.943 70.981 1.00 5.69  135 M 1 \nATOM   2103 O  O    . THR M  1 136 ? 127.792 118.527 72.139 1.00 5.69  135 M 1 \nATOM   2104 C  CB   . THR M  1 136 ? 126.231 120.615 70.132 1.00 5.69  135 M 1 \nATOM   2105 O  OG1  . THR M  1 136 ? 125.987 122.016 69.958 1.00 5.69  135 M 1 \nATOM   2106 C  CG2  . THR M  1 136 ? 
125.180 120.022 71.054 1.00 5.69  135 M 1 \nATOM   2107 H  H    . THR M  1 136 ? 128.290 121.021 68.916 1.00 5.69  135 M 1 \nATOM   2108 H  HA   . THR M  1 136 ? 127.735 120.908 71.500 1.00 5.69  135 M 1 \nATOM   2109 H  HB   . THR M  1 136 ? 126.146 120.171 69.274 1.00 5.69  135 M 1 \nATOM   2110 H  HG1  . THR M  1 136 ? 126.306 122.271 69.224 1.00 5.69  135 M 1 \nATOM   2111 H  HG21 . THR M  1 136 ? 124.308 120.381 70.826 1.00 5.69  135 M 1 \nATOM   2112 H  HG22 . THR M  1 136 ? 125.137 119.058 70.952 1.00 5.69  135 M 1 \nATOM   2113 H  HG23 . THR M  1 136 ? 125.382 120.243 71.977 1.00 5.69  135 M 1 \nATOM   2114 N  N    . TYR M  1 137 ? 128.255 118.148 69.967 1.00 5.32  136 M 1 \nATOM   2115 C  CA   . TYR M  1 137 ? 128.285 116.699 70.109 1.00 5.32  136 M 1 \nATOM   2116 C  C    . TYR M  1 137 ? 129.681 116.086 70.112 1.00 5.32  136 M 1 \nATOM   2117 O  O    . TYR M  1 137 ? 129.812 114.924 70.507 1.00 5.32  136 M 1 \nATOM   2118 C  CB   . TYR M  1 137 ? 127.446 116.053 68.996 1.00 5.32  136 M 1 \nATOM   2119 C  CG   . TYR M  1 137 ? 125.993 116.445 69.078 1.00 5.32  136 M 1 \nATOM   2120 C  CD1  . TYR M  1 137 ? 125.173 115.917 70.061 1.00 5.32  136 M 1 \nATOM   2121 C  CD2  . TYR M  1 137 ? 125.435 117.320 68.164 1.00 5.32  136 M 1 \nATOM   2122 C  CE1  . TYR M  1 137 ? 123.854 116.266 70.149 1.00 5.32  136 M 1 \nATOM   2123 C  CE2  . TYR M  1 137 ? 124.109 117.674 68.238 1.00 5.32  136 M 1 \nATOM   2124 C  CZ   . TYR M  1 137 ? 123.318 117.142 69.235 1.00 5.32  136 M 1 \nATOM   2125 O  OH   . TYR M  1 137 ? 121.991 117.479 69.329 1.00 5.32  136 M 1 \nATOM   2126 H  H    . TYR M  1 137 ? 128.481 118.435 69.189 1.00 5.32  136 M 1 \nATOM   2127 H  HA   . TYR M  1 137 ? 127.872 116.438 70.947 1.00 5.32  136 M 1 \nATOM   2128 H  HB2  . TYR M  1 137 ? 127.794 116.325 68.132 1.00 5.32  136 M 1 \nATOM   2129 H  HB3  . TYR M  1 137 ? 127.491 115.087 69.065 1.00 5.32  136 M 1 \nATOM   2130 H  HD1  . TYR M  1 137 ? 
125.528 115.329 70.687 1.00 5.32  136 M 1 \nATOM   2131 H  HD2  . TYR M  1 137 ? 125.965 117.681 67.491 1.00 5.32  136 M 1 \nATOM   2132 H  HE1  . TYR M  1 137 ? 123.322 115.905 70.821 1.00 5.32  136 M 1 \nATOM   2133 H  HE2  . TYR M  1 137 ? 123.756 118.269 67.616 1.00 5.32  136 M 1 \nATOM   2134 H  HH   . TYR M  1 137 ? 121.786 118.019 68.719 1.00 5.32  136 M 1 \nATOM   2135 N  N    . TYR M  1 138 ? 130.715 116.820 69.695 1.00 4.75  137 M 1 \nATOM   2136 C  CA   . TYR M  1 138 ? 132.058 116.267 69.521 1.00 4.75  137 M 1 \nATOM   2137 C  C    . TYR M  1 138 ? 133.140 116.945 70.353 1.00 4.75  137 M 1 \nATOM   2138 O  O    . TYR M  1 138 ? 133.898 116.247 71.032 1.00 4.75  137 M 1 \nATOM   2139 C  CB   . TYR M  1 138 ? 132.409 116.289 68.026 1.00 4.75  137 M 1 \nATOM   2140 C  CG   . TYR M  1 138 ? 131.612 115.244 67.293 1.00 4.75  137 M 1 \nATOM   2141 C  CD1  . TYR M  1 138 ? 132.096 113.958 67.141 1.00 4.75  137 M 1 \nATOM   2142 C  CD2  . TYR M  1 138 ? 130.320 115.500 66.879 1.00 4.75  137 M 1 \nATOM   2143 C  CE1  . TYR M  1 138 ? 131.360 112.991 66.518 1.00 4.75  137 M 1 \nATOM   2144 C  CE2  . TYR M  1 138 ? 129.567 114.535 66.263 1.00 4.75  137 M 1 \nATOM   2145 C  CZ   . TYR M  1 138 ? 130.093 113.277 66.087 1.00 4.75  137 M 1 \nATOM   2146 O  OH   . TYR M  1 138 ? 129.368 112.286 65.485 1.00 4.75  137 M 1 \nATOM   2147 H  H    . TYR M  1 138 ? 130.649 117.652 69.486 1.00 4.75  137 M 1 \nATOM   2148 H  HA   . TYR M  1 138 ? 132.058 115.331 69.774 1.00 4.75  137 M 1 \nATOM   2149 H  HB2  . TYR M  1 138 ? 132.226 117.161 67.643 1.00 4.75  137 M 1 \nATOM   2150 H  HB3  . TYR M  1 138 ? 133.350 116.078 67.917 1.00 4.75  137 M 1 \nATOM   2151 H  HD1  . TYR M  1 138 ? 132.959 113.757 67.423 1.00 4.75  137 M 1 \nATOM   2152 H  HD2  . TYR M  1 138 ? 129.963 116.350 66.999 1.00 4.75  137 M 1 \nATOM   2153 H  HE1  . TYR M  1 138 ? 131.714 112.139 66.400 1.00 4.75  137 M 1 \nATOM   2154 H  HE2  . TYR M  1 138 ? 
128.706 114.734 65.975 1.00 4.75  137 M 1 \nATOM   2155 H  HH   . TYR M  1 138 ? 129.810 111.572 65.461 1.00 4.75  137 M 1 \nATOM   2156 N  N    . LEU M  1 139 ? 133.243 118.277 70.343 1.00 5.15  138 M 1 \nATOM   2157 C  CA   . LEU M  1 139 ? 134.409 118.924 70.952 1.00 5.15  138 M 1 \nATOM   2158 C  C    . LEU M  1 139 ? 134.414 118.788 72.475 1.00 5.15  138 M 1 \nATOM   2159 O  O    . LEU M  1 139 ? 135.460 118.504 73.074 1.00 5.15  138 M 1 \nATOM   2160 C  CB   . LEU M  1 139 ? 134.485 120.398 70.541 1.00 5.15  138 M 1 \nATOM   2161 C  CG   . LEU M  1 139 ? 134.810 120.765 69.087 1.00 5.15  138 M 1 \nATOM   2162 C  CD1  . LEU M  1 139 ? 134.728 122.282 68.909 1.00 5.15  138 M 1 \nATOM   2163 C  CD2  . LEU M  1 139 ? 136.168 120.241 68.631 1.00 5.15  138 M 1 \nATOM   2164 H  H    . LEU M  1 139 ? 132.663 118.816 70.008 1.00 5.15  138 M 1 \nATOM   2165 H  HA   . LEU M  1 139 ? 135.217 118.493 70.633 1.00 5.15  138 M 1 \nATOM   2166 H  HB2  . LEU M  1 139 ? 133.626 120.801 70.744 1.00 5.15  138 M 1 \nATOM   2167 H  HB3  . LEU M  1 139 ? 135.163 120.828 71.085 1.00 5.15  138 M 1 \nATOM   2168 H  HG   . LEU M  1 139 ? 134.147 120.368 68.501 1.00 5.15  138 M 1 \nATOM   2169 H  HD11 . LEU M  1 139 ? 134.996 122.514 68.006 1.00 5.15  138 M 1 \nATOM   2170 H  HD12 . LEU M  1 139 ? 133.819 122.579 69.071 1.00 5.15  138 M 1 \nATOM   2171 H  HD13 . LEU M  1 139 ? 135.323 122.712 69.543 1.00 5.15  138 M 1 \nATOM   2172 H  HD21 . LEU M  1 139 ? 136.264 120.441 67.687 1.00 5.15  138 M 1 \nATOM   2173 H  HD22 . LEU M  1 139 ? 136.878 120.678 69.128 1.00 5.15  138 M 1 \nATOM   2174 H  HD23 . LEU M  1 139 ? 136.219 119.282 68.765 1.00 5.15  138 M 1 \nATOM   2175 N  N    . SER M  1 140 ? 133.263 118.984 73.122 1.00 5.52  139 M 1 \nATOM   2176 C  CA   . SER M  1 140 ? 133.212 118.887 74.580 1.00 5.52  139 M 1 \nATOM   2177 C  C    . SER M  1 140 ? 133.454 117.457 75.050 1.00 5.52  139 M 1 \nATOM   2178 O  O    . SER M  1 140 ? 
134.145 117.230 76.053 1.00 5.52  139 M 1 \nATOM   2179 C  CB   . SER M  1 140 ? 131.870 119.403 75.101 1.00 5.52  139 M 1 \nATOM   2180 O  OG   . SER M  1 140 ? 131.723 120.784 74.840 1.00 5.52  139 M 1 \nATOM   2181 H  H    . SER M  1 140 ? 132.513 119.176 72.748 1.00 5.52  139 M 1 \nATOM   2182 H  HA   . SER M  1 140 ? 133.909 119.450 74.952 1.00 5.52  139 M 1 \nATOM   2183 H  HB2  . SER M  1 140 ? 131.153 118.933 74.647 1.00 5.52  139 M 1 \nATOM   2184 H  HB3  . SER M  1 140 ? 131.806 119.255 76.058 1.00 5.52  139 M 1 \nATOM   2185 H  HG   . SER M  1 140 ? 130.981 121.049 75.132 1.00 5.52  139 M 1 \nATOM   2186 N  N    . GLU M  1 141 ? 132.881 116.482 74.341 1.00 5.44  140 M 1 \nATOM   2187 C  CA   . GLU M  1 141 ? 133.127 115.075 74.648 1.00 5.44  140 M 1 \nATOM   2188 C  C    . GLU M  1 141 ? 134.614 114.753 74.571 1.00 5.44  140 M 1 \nATOM   2189 O  O    . GLU M  1 141 ? 135.157 114.061 75.441 1.00 5.44  140 M 1 \nATOM   2190 C  CB   . GLU M  1 141 ? 132.330 114.187 73.684 1.00 5.44  140 M 1 \nATOM   2191 C  CG   . GLU M  1 141 ? 132.429 112.681 73.926 1.00 5.44  140 M 1 \nATOM   2192 C  CD   . GLU M  1 141 ? 133.700 112.071 73.369 1.00 5.44  140 M 1 \nATOM   2193 O  OE1  . GLU M  1 141 ? 134.274 112.642 72.421 1.00 5.44  140 M 1 \nATOM   2194 O  OE2  . GLU M  1 141 ? 134.137 111.025 73.895 1.00 5.44  140 M 1 \nATOM   2195 H  H    . GLU M  1 141 ? 132.350 116.619 73.678 1.00 5.44  140 M 1 \nATOM   2196 H  HA   . GLU M  1 141 ? 132.818 114.891 75.549 1.00 5.44  140 M 1 \nATOM   2197 H  HB2  . GLU M  1 141 ? 131.391 114.422 73.750 1.00 5.44  140 M 1 \nATOM   2198 H  HB3  . GLU M  1 141 ? 132.635 114.353 72.778 1.00 5.44  140 M 1 \nATOM   2199 H  HG2  . GLU M  1 141 ? 132.425 112.522 74.882 1.00 5.44  140 M 1 \nATOM   2200 H  HG3  . GLU M  1 141 ? 131.671 112.224 73.528 1.00 5.44  140 M 1 \nATOM   2201 N  N    . GLN M  1 142 ? 135.292 115.259 73.542 1.00 4.79  141 M 1 \nATOM   2202 C  CA   . GLN M  1 142 ? 
136.713 114.986 73.383 1.00 4.79  141 M 1 \nATOM   2203 C  C    . GLN M  1 142 ? 137.530 115.642 74.486 1.00 4.79  141 M 1 \nATOM   2204 O  O    . GLN M  1 142 ? 138.505 115.063 74.971 1.00 4.79  141 M 1 \nATOM   2205 C  CB   . GLN M  1 142 ? 137.196 115.455 72.011 1.00 4.79  141 M 1 \nATOM   2206 C  CG   . GLN M  1 142 ? 136.700 114.641 70.837 1.00 4.79  141 M 1 \nATOM   2207 C  CD   . GLN M  1 142 ? 137.195 113.215 70.874 1.00 4.79  141 M 1 \nATOM   2208 O  OE1  . GLN M  1 142 ? 136.418 112.283 71.061 1.00 4.79  141 M 1 \nATOM   2209 N  NE2  . GLN M  1 142 ? 138.501 113.044 70.749 1.00 4.79  141 M 1 \nATOM   2210 H  H    . GLN M  1 142 ? 134.959 115.766 72.933 1.00 4.79  141 M 1 \nATOM   2211 H  HA   . GLN M  1 142 ? 136.847 114.028 73.454 1.00 4.79  141 M 1 \nATOM   2212 H  HB2  . GLN M  1 142 ? 136.902 116.370 71.877 1.00 4.79  141 M 1 \nATOM   2213 H  HB3  . GLN M  1 142 ? 138.165 115.421 71.989 1.00 4.79  141 M 1 \nATOM   2214 H  HG2  . GLN M  1 142 ? 135.730 114.621 70.832 1.00 4.79  141 M 1 \nATOM   2215 H  HG3  . GLN M  1 142 ? 137.031 115.050 70.022 1.00 4.79  141 M 1 \nATOM   2216 H  HE21 . GLN M  1 142 ? 139.007 113.729 70.633 1.00 4.79  141 M 1 \nATOM   2217 H  HE22 . GLN M  1 142 ? 138.848 112.257 70.771 1.00 4.79  141 M 1 \nATOM   2218 N  N    . VAL M  1 143 ? 137.154 116.857 74.890 1.00 4.49  142 M 1 \nATOM   2219 C  CA   . VAL M  1 143 ? 137.859 117.519 75.985 1.00 4.49  142 M 1 \nATOM   2220 C  C    . VAL M  1 143 ? 137.719 116.709 77.269 1.00 4.49  142 M 1 \nATOM   2221 O  O    . VAL M  1 143 ? 138.703 116.478 77.990 1.00 4.49  142 M 1 \nATOM   2222 C  CB   . VAL M  1 143 ? 137.350 118.966 76.144 1.00 4.49  142 M 1 \nATOM   2223 C  CG1  . VAL M  1 143 ? 137.845 119.590 77.428 1.00 4.49  142 M 1 \nATOM   2224 C  CG2  . VAL M  1 143 ? 137.827 119.821 74.969 1.00 4.49  142 M 1 \nATOM   2225 H  H    . VAL M  1 143 ? 136.490 117.304 74.577 1.00 4.49  142 M 1 \nATOM   2226 H  HA   . VAL M  1 143 ? 
138.802 117.565 75.764 1.00 4.49  142 M 1 \nATOM   2227 H  HB   . VAL M  1 143 ? 136.380 118.968 76.157 1.00 4.49  142 M 1 \nATOM   2228 H  HG11 . VAL M  1 143 ? 137.733 120.551 77.358 1.00 4.49  142 M 1 \nATOM   2229 H  HG12 . VAL M  1 143 ? 137.317 119.266 78.174 1.00 4.49  142 M 1 \nATOM   2230 H  HG13 . VAL M  1 143 ? 138.783 119.383 77.559 1.00 4.49  142 M 1 \nATOM   2231 H  HG21 . VAL M  1 143 ? 137.236 120.583 74.866 1.00 4.49  142 M 1 \nATOM   2232 H  HG22 . VAL M  1 143 ? 138.728 120.131 75.150 1.00 4.49  142 M 1 \nATOM   2233 H  HG23 . VAL M  1 143 ? 137.831 119.297 74.152 1.00 4.49  142 M 1 \nATOM   2234 N  N    . LYS M  1 144 ? 136.507 116.220 77.544 1.00 4.83  143 M 1 \nATOM   2235 C  CA   . LYS M  1 144 ? 136.288 115.404 78.735 1.00 4.83  143 M 1 \nATOM   2236 C  C    . LYS M  1 144 ? 137.105 114.119 78.678 1.00 4.83  143 M 1 \nATOM   2237 O  O    . LYS M  1 144 ? 137.698 113.704 79.680 1.00 4.83  143 M 1 \nATOM   2238 C  CB   . LYS M  1 144 ? 134.801 115.079 78.899 1.00 4.83  143 M 1 \nATOM   2239 C  CG   . LYS M  1 144 ? 133.922 116.256 79.272 1.00 4.83  143 M 1 \nATOM   2240 C  CD   . LYS M  1 144 ? 132.501 115.808 79.620 1.00 4.83  143 M 1 \nATOM   2241 C  CE   . LYS M  1 144 ? 131.707 115.401 78.389 1.00 4.83  143 M 1 \nATOM   2242 N  NZ   . LYS M  1 144 ? 130.284 115.092 78.707 1.00 4.83  143 M 1 \nATOM   2243 H  H    . LYS M  1 144 ? 135.811 116.327 77.050 1.00 4.83  143 M 1 \nATOM   2244 H  HA   . LYS M  1 144 ? 136.569 115.910 79.514 1.00 4.83  143 M 1 \nATOM   2245 H  HB2  . LYS M  1 144 ? 134.473 114.724 78.058 1.00 4.83  143 M 1 \nATOM   2246 H  HB3  . LYS M  1 144 ? 134.693 114.412 79.595 1.00 4.83  143 M 1 \nATOM   2247 H  HG2  . LYS M  1 144 ? 134.301 116.702 80.045 1.00 4.83  143 M 1 \nATOM   2248 H  HG3  . LYS M  1 144 ? 133.865 116.875 78.527 1.00 4.83  143 M 1 \nATOM   2249 H  HD2  . LYS M  1 144 ? 132.542 115.043 80.215 1.00 4.83  143 M 1 \nATOM   2250 H  HD3  . LYS M  1 144 ? 
132.032 116.540 80.050 1.00 4.83  143 M 1 \nATOM   2251 H  HE2  . LYS M  1 144 ? 131.724 116.123 77.741 1.00 4.83  143 M 1 \nATOM   2252 H  HE3  . LYS M  1 144 ? 132.098 114.597 78.012 1.00 4.83  143 M 1 \nATOM   2253 H  HZ1  . LYS M  1 144 ? 129.888 114.729 77.997 1.00 4.83  143 M 1 \nATOM   2254 H  HZ2  . LYS M  1 144 ? 130.240 114.522 79.389 1.00 4.83  143 M 1 \nATOM   2255 H  HZ3  . LYS M  1 144 ? 129.853 115.839 78.925 1.00 4.83  143 M 1 \nATOM   2256 N  N    . SER M  1 145 ? 137.167 113.489 77.507 1.00 4.26  144 M 1 \nATOM   2257 C  CA   . SER M  1 145 ? 137.864 112.212 77.389 1.00 4.26  144 M 1 \nATOM   2258 C  C    . SER M  1 145 ? 139.374 112.391 77.507 1.00 4.26  144 M 1 \nATOM   2259 O  O    . SER M  1 145 ? 140.058 111.572 78.133 1.00 4.26  144 M 1 \nATOM   2260 C  CB   . SER M  1 145 ? 137.494 111.546 76.069 1.00 4.26  144 M 1 \nATOM   2261 O  OG   . SER M  1 145 ? 136.114 111.241 76.049 1.00 4.26  144 M 1 \nATOM   2262 H  H    . SER M  1 145 ? 136.834 113.784 76.771 1.00 4.26  144 M 1 \nATOM   2263 H  HA   . SER M  1 145 ? 137.575 111.628 78.108 1.00 4.26  144 M 1 \nATOM   2264 H  HB2  . SER M  1 145 ? 137.692 112.151 75.337 1.00 4.26  144 M 1 \nATOM   2265 H  HB3  . SER M  1 145 ? 138.006 110.728 75.968 1.00 4.26  144 M 1 \nATOM   2266 H  HG   . SER M  1 145 ? 135.685 111.835 76.460 1.00 4.26  144 M 1 \nATOM   2267 N  N    . ILE M  1 146 ? 139.906 113.464 76.921 1.00 3.93  145 M 1 \nATOM   2268 C  CA   . ILE M  1 146 ? 141.327 113.772 77.054 1.00 3.93  145 M 1 \nATOM   2269 C  C    . ILE M  1 146 ? 141.676 114.000 78.517 1.00 3.93  145 M 1 \nATOM   2270 O  O    . ILE M  1 146 ? 142.687 113.494 79.012 1.00 3.93  145 M 1 \nATOM   2271 C  CB   . ILE M  1 146 ? 141.700 114.985 76.176 1.00 3.93  145 M 1 \nATOM   2272 C  CG1  . ILE M  1 146 ? 141.605 114.623 74.688 1.00 3.93  145 M 1 \nATOM   2273 C  CG2  . ILE M  1 146 ? 143.080 115.516 76.549 1.00 3.93  145 M 1 \nATOM   2274 C  CD1  . ILE M  1 146 ? 
141.639 115.802 73.726 1.00 3.93  145 M 1 \nATOM   2275 H  H    . ILE M  1 146 ? 139.459 114.044 76.469 1.00 3.93  145 M 1 \nATOM   2276 H  HA   . ILE M  1 146 ? 141.845 113.016 76.736 1.00 3.93  145 M 1 \nATOM   2277 H  HB   . ILE M  1 146 ? 141.057 115.690 76.348 1.00 3.93  145 M 1 \nATOM   2278 H  HG12 . ILE M  1 146 ? 142.348 114.041 74.462 1.00 3.93  145 M 1 \nATOM   2279 H  HG13 . ILE M  1 146 ? 140.779 114.139 74.530 1.00 3.93  145 M 1 \nATOM   2280 H  HG21 . ILE M  1 146 ? 143.453 116.028 75.814 1.00 3.93  145 M 1 \nATOM   2281 H  HG22 . ILE M  1 146 ? 143.004 116.096 77.322 1.00 3.93  145 M 1 \nATOM   2282 H  HG23 . ILE M  1 146 ? 143.670 114.772 76.744 1.00 3.93  145 M 1 \nATOM   2283 H  HD11 . ILE M  1 146 ? 141.513 115.471 72.823 1.00 3.93  145 M 1 \nATOM   2284 H  HD12 . ILE M  1 146 ? 140.926 116.419 73.952 1.00 3.93  145 M 1 \nATOM   2285 H  HD13 . ILE M  1 146 ? 142.493 116.259 73.778 1.00 3.93  145 M 1 \nATOM   2286 N  N    . LYS M  1 147 ? 140.838 114.750 79.232 1.00 3.89  146 M 1 \nATOM   2287 C  CA   . LYS M  1 147 ? 141.100 115.021 80.643 1.00 3.89  146 M 1 \nATOM   2288 C  C    . LYS M  1 147 ? 141.039 113.741 81.475 1.00 3.89  146 M 1 \nATOM   2289 O  O    . LYS M  1 147 ? 141.881 113.521 82.354 1.00 3.89  146 M 1 \nATOM   2290 C  CB   . LYS M  1 147 ? 140.111 116.076 81.137 1.00 3.89  146 M 1 \nATOM   2291 C  CG   . LYS M  1 147 ? 140.203 116.479 82.594 1.00 3.89  146 M 1 \nATOM   2292 C  CD   . LYS M  1 147 ? 141.543 117.081 82.931 1.00 3.89  146 M 1 \nATOM   2293 C  CE   . LYS M  1 147 ? 141.512 117.806 84.271 1.00 3.89  146 M 1 \nATOM   2294 N  NZ   . LYS M  1 147 ? 141.164 116.952 85.399 1.00 3.89  146 M 1 \nATOM   2295 H  H    . LYS M  1 147 ? 140.115 115.097 78.920 1.00 3.89  146 M 1 \nATOM   2296 H  HA   . LYS M  1 147 ? 141.991 115.394 80.726 1.00 3.89  146 M 1 \nATOM   2297 H  HB2  . LYS M  1 147 ? 140.260 116.884 80.621 1.00 3.89  146 M 1 \nATOM   2298 H  HB3  . LYS M  1 147 ? 
139.208 115.763 80.971 1.00 3.89  146 M 1 \nATOM   2299 H  HG2  . LYS M  1 147 ? 139.522 117.145 82.774 1.00 3.89  146 M 1 \nATOM   2300 H  HG3  . LYS M  1 147 ? 140.052 115.711 83.167 1.00 3.89  146 M 1 \nATOM   2301 H  HD2  . LYS M  1 147 ? 142.200 116.369 82.982 1.00 3.89  146 M 1 \nATOM   2302 H  HD3  . LYS M  1 147 ? 141.797 117.719 82.246 1.00 3.89  146 M 1 \nATOM   2303 H  HE2  . LYS M  1 147 ? 142.398 118.159 84.450 1.00 3.89  146 M 1 \nATOM   2304 H  HE3  . LYS M  1 147 ? 140.870 118.533 84.241 1.00 3.89  146 M 1 \nATOM   2305 H  HZ1  . LYS M  1 147 ? 140.321 116.682 85.309 1.00 3.89  146 M 1 \nATOM   2306 H  HZ2  . LYS M  1 147 ? 141.684 116.230 85.411 1.00 3.89  146 M 1 \nATOM   2307 H  HZ3  . LYS M  1 147 ? 141.256 117.398 86.164 1.00 3.89  146 M 1 \nATOM   2308 N  N    . GLU M  1 148 ? 140.069 112.873 81.186 1.00 3.93  147 M 1 \nATOM   2309 C  CA   . GLU M  1 148 ? 139.953 111.593 81.882 1.00 3.93  147 M 1 \nATOM   2310 C  C    . GLU M  1 148 ? 141.201 110.738 81.676 1.00 3.93  147 M 1 \nATOM   2311 O  O    . GLU M  1 148 ? 141.770 110.195 82.632 1.00 3.93  147 M 1 \nATOM   2312 C  CB   . GLU M  1 148 ? 138.707 110.863 81.379 1.00 3.93  147 M 1 \nATOM   2313 C  CG   . GLU M  1 148 ? 138.412 109.544 82.057 1.00 3.93  147 M 1 \nATOM   2314 C  CD   . GLU M  1 148 ? 137.135 108.897 81.547 1.00 3.93  147 M 1 \nATOM   2315 O  OE1  . GLU M  1 148 ? 136.491 109.475 80.647 1.00 3.93  147 M 1 \nATOM   2316 O  OE2  . GLU M  1 148 ? 136.772 107.813 82.046 1.00 3.93  147 M 1 \nATOM   2317 H  H    . GLU M  1 148 ? 139.476 112.996 80.575 1.00 3.93  147 M 1 \nATOM   2318 H  HA   . GLU M  1 148 ? 139.842 111.748 82.833 1.00 3.93  147 M 1 \nATOM   2319 H  HB2  . GLU M  1 148 ? 137.937 111.438 81.511 1.00 3.93  147 M 1 \nATOM   2320 H  HB3  . GLU M  1 148 ? 138.820 110.688 80.432 1.00 3.93  147 M 1 \nATOM   2321 H  HG2  . GLU M  1 148 ? 139.142 108.926 81.893 1.00 3.93  147 M 1 \nATOM   2322 H  HG3  . GLU M  1 148 ? 
138.316 109.694 83.011 1.00 3.93  147 M 1 \nATOM   2323 N  N    . LEU M  1 149 ? 141.633 110.603 80.423 1.00 3.53  148 M 1 \nATOM   2324 C  CA   . LEU M  1 149 ? 142.801 109.782 80.110 1.00 3.53  148 M 1 \nATOM   2325 C  C    . LEU M  1 149 ? 144.070 110.354 80.727 1.00 3.53  148 M 1 \nATOM   2326 O  O    . LEU M  1 149 ? 144.912 109.604 81.235 1.00 3.53  148 M 1 \nATOM   2327 C  CB   . LEU M  1 149 ? 142.940 109.646 78.594 1.00 3.53  148 M 1 \nATOM   2328 C  CG   . LEU M  1 149 ? 141.908 108.748 77.901 1.00 3.53  148 M 1 \nATOM   2329 C  CD1  . LEU M  1 149 ? 141.939 108.934 76.394 1.00 3.53  148 M 1 \nATOM   2330 C  CD2  . LEU M  1 149 ? 142.163 107.282 78.252 1.00 3.53  148 M 1 \nATOM   2331 H  H    . LEU M  1 149 ? 141.264 110.980 79.743 1.00 3.53  148 M 1 \nATOM   2332 H  HA   . LEU M  1 149 ? 142.663 108.899 80.487 1.00 3.53  148 M 1 \nATOM   2333 H  HB2  . LEU M  1 149 ? 142.866 110.527 78.196 1.00 3.53  148 M 1 \nATOM   2334 H  HB3  . LEU M  1 149 ? 143.824 109.298 78.397 1.00 3.53  148 M 1 \nATOM   2335 H  HG   . LEU M  1 149 ? 141.017 108.970 78.215 1.00 3.53  148 M 1 \nATOM   2336 H  HD11 . LEU M  1 149 ? 141.323 108.313 75.976 1.00 3.53  148 M 1 \nATOM   2337 H  HD12 . LEU M  1 149 ? 141.662 109.840 76.186 1.00 3.53  148 M 1 \nATOM   2338 H  HD13 . LEU M  1 149 ? 142.840 108.782 76.068 1.00 3.53  148 M 1 \nATOM   2339 H  HD21 . LEU M  1 149 ? 141.692 106.719 77.618 1.00 3.53  148 M 1 \nATOM   2340 H  HD22 . LEU M  1 149 ? 143.113 107.090 78.213 1.00 3.53  148 M 1 \nATOM   2341 H  HD23 . LEU M  1 149 ? 141.832 107.102 79.146 1.00 3.53  148 M 1 \nATOM   2342 N  N    . GLY M  1 150 ? 144.227 111.677 80.690 1.00 3.59  149 M 1 \nATOM   2343 C  CA   . GLY M  1 150 ? 145.373 112.298 81.331 1.00 3.59  149 M 1 \nATOM   2344 C  C    . GLY M  1 150 ? 145.401 112.034 82.822 1.00 3.59  149 M 1 \nATOM   2345 O  O    . GLY M  1 150 ? 146.454 111.747 83.394 1.00 3.59  149 M 1 \nATOM   2346 H  H    . GLY M  1 150 ? 
143.677 112.226 80.321 1.00 3.59  149 M 1 \nATOM   2347 H  HA2  . GLY M  1 150 ? 146.196 111.985 80.925 1.00 3.59  149 M 1 \nATOM   2348 H  HA3  . GLY M  1 150 ? 145.322 113.257 81.197 1.00 3.59  149 M 1 \nATOM   2349 N  N    . ASP M  1 151 ? 144.233 112.095 83.464 1.00 3.83  150 M 1 \nATOM   2350 C  CA   . ASP M  1 151 ? 144.141 111.783 84.884 1.00 3.83  150 M 1 \nATOM   2351 C  C    . ASP M  1 151 ? 144.541 110.337 85.159 1.00 3.83  150 M 1 \nATOM   2352 O  O    . ASP M  1 151 ? 145.269 110.058 86.121 1.00 3.83  150 M 1 \nATOM   2353 C  CB   . ASP M  1 151 ? 142.722 112.049 85.382 1.00 3.83  150 M 1 \nATOM   2354 C  CG   . ASP M  1 151 ? 142.356 113.522 85.358 1.00 3.83  150 M 1 \nATOM   2355 O  OD1  . ASP M  1 151 ? 143.268 114.366 85.450 1.00 3.83  150 M 1 \nATOM   2356 O  OD2  . ASP M  1 151 ? 141.152 113.836 85.264 1.00 3.83  150 M 1 \nATOM   2357 H  H    . ASP M  1 151 ? 143.483 112.301 83.098 1.00 3.83  150 M 1 \nATOM   2358 H  HA   . ASP M  1 151 ? 144.747 112.358 85.377 1.00 3.83  150 M 1 \nATOM   2359 H  HB2  . ASP M  1 151 ? 142.097 111.579 84.809 1.00 3.83  150 M 1 \nATOM   2360 H  HB3  . ASP M  1 151 ? 142.633 111.725 86.292 1.00 3.83  150 M 1 \nATOM   2361 N  N    . HIS M  1 152 ? 144.078 109.425 84.300 1.00 3.63  151 M 1 \nATOM   2362 C  CA   . HIS M  1 152 ? 144.374 107.967 84.419 1.00 3.63  151 M 1 \nATOM   2363 C  C    . HIS M  1 152 ? 145.893 107.773 84.328 1.00 3.63  151 M 1 \nATOM   2364 O  O    . HIS M  1 152 ? 146.470 107.176 85.208 1.00 3.63  151 M 1 \nATOM   2365 C  CB   . HIS M  1 152 ? 143.627 107.139 83.350 1.00 3.63  151 M 1 \nATOM   2366 C  CG   . HIS M  1 152 ? 142.152 107.067 83.552 1.00 3.63  151 M 1 \nATOM   2367 N  ND1  . HIS M  1 152 ? 141.562 107.495 84.711 1.00 3.63  151 M 1 \nATOM   2368 C  CD2  . HIS M  1 152 ? 141.148 106.653 82.753 1.00 3.63  151 M 1 \nATOM   2369 C  CE1  . HIS M  1 152 ? 140.263 107.300 84.645 1.00 3.63  151 M 1 \nATOM   2370 N  NE2  . HIS M  1 152 ? 
139.980 106.801 83.453 1.00 3.63  151 M 1 \nATOM   2371 H  H    . HIS M  1 152 ? 143.551 109.623 83.584 1.00 3.63  151 M 1 \nATOM   2372 H  HA   . HIS M  1 152 ? 144.079 107.668 85.311 1.00 3.63  151 M 1 \nATOM   2373 H  HB2  . HIS M  1 152 ? 143.806 107.531 82.466 1.00 3.63  151 M 1 \nATOM   2374 H  HB3  . HIS M  1 152 ? 143.990 106.226 83.347 1.00 3.63  151 M 1 \nATOM   2375 H  HD1  . HIS M  1 152 ? 141.990 107.805 85.410 1.00 3.63  151 M 1 \nATOM   2376 H  HD2  . HIS M  1 152 ? 141.232 106.303 81.885 1.00 3.63  151 M 1 \nATOM   2377 H  HE1  . HIS M  1 152 ? 139.639 107.518 85.316 1.00 3.63  151 M 1 \nATOM   2378 N  N    . VAL M  1 153 ? 146.528 108.396 83.356 1.00 3.75  152 M 1 \nATOM   2379 C  CA   . VAL M  1 153 ? 147.971 108.297 83.143 1.00 3.75  152 M 1 \nATOM   2380 C  C    . VAL M  1 153 ? 148.724 108.840 84.351 1.00 3.75  152 M 1 \nATOM   2381 O  O    . VAL M  1 153 ? 149.692 108.237 84.822 1.00 3.75  152 M 1 \nATOM   2382 C  CB   . VAL M  1 153 ? 148.374 109.028 81.848 1.00 3.75  152 M 1 \nATOM   2383 C  CG1  . VAL M  1 153 ? 149.883 109.083 81.695 1.00 3.75  152 M 1 \nATOM   2384 C  CG2  . VAL M  1 153 ? 147.762 108.349 80.624 1.00 3.75  152 M 1 \nATOM   2385 H  H    . VAL M  1 153 ? 146.125 108.884 82.774 1.00 3.75  152 M 1 \nATOM   2386 H  HA   . VAL M  1 153 ? 148.214 107.364 83.040 1.00 3.75  152 M 1 \nATOM   2387 H  HB   . VAL M  1 153 ? 148.054 109.943 81.879 1.00 3.75  152 M 1 \nATOM   2388 H  HG11 . VAL M  1 153 ? 150.096 109.335 80.783 1.00 3.75  152 M 1 \nATOM   2389 H  HG12 . VAL M  1 153 ? 150.253 109.751 82.293 1.00 3.75  152 M 1 \nATOM   2390 H  HG13 . VAL M  1 153 ? 150.261 108.211 81.886 1.00 3.75  152 M 1 \nATOM   2391 H  HG21 . VAL M  1 153 ? 147.770 108.976 79.884 1.00 3.75  152 M 1 \nATOM   2392 H  HG22 . VAL M  1 153 ? 148.296 107.572 80.397 1.00 3.75  152 M 1 \nATOM   2393 H  HG23 . VAL M  1 153 ? 146.848 108.071 80.793 1.00 3.75  152 M 1 \nATOM   2394 N  N    . THR M  1 154 ? 
148.291 109.995 84.858 1.00 3.85  153 M 1 \nATOM   2395 C  CA   . THR M  1 154 ? 148.932 110.603 86.022 1.00 3.85  153 M 1 \nATOM   2396 C  C    . THR M  1 154 ? 148.898 109.660 87.218 1.00 3.85  153 M 1 \nATOM   2397 O  O    . THR M  1 154 ? 149.918 109.443 87.885 1.00 3.85  153 M 1 \nATOM   2398 C  CB   . THR M  1 154 ? 148.248 111.938 86.336 1.00 3.85  153 M 1 \nATOM   2399 O  OG1  . THR M  1 154 ? 148.471 112.832 85.239 1.00 3.85  153 M 1 \nATOM   2400 C  CG2  . THR M  1 154 ? 148.742 112.558 87.655 1.00 3.85  153 M 1 \nATOM   2401 H  H    . THR M  1 154 ? 147.608 110.423 84.559 1.00 3.85  153 M 1 \nATOM   2402 H  HA   . THR M  1 154 ? 149.860 110.796 85.817 1.00 3.85  153 M 1 \nATOM   2403 H  HB   . THR M  1 154 ? 147.293 111.795 86.429 1.00 3.85  153 M 1 \nATOM   2404 H  HG1  . THR M  1 154 ? 147.948 112.664 84.604 1.00 3.85  153 M 1 \nATOM   2405 H  HG21 . THR M  1 154 ? 148.362 113.444 87.759 1.00 3.85  153 M 1 \nATOM   2406 H  HG22 . THR M  1 154 ? 148.441 112.039 88.417 1.00 3.85  153 M 1 \nATOM   2407 H  HG23 . THR M  1 154 ? 149.709 112.627 87.668 1.00 3.85  153 M 1 \nATOM   2408 N  N    . ASN M  1 155 ? 147.717 109.104 87.452 1.00 3.90  154 M 1 \nATOM   2409 C  CA   . ASN M  1 155 ? 147.514 108.206 88.617 1.00 3.90  154 M 1 \nATOM   2410 C  C    . ASN M  1 155 ? 148.382 106.953 88.457 1.00 3.90  154 M 1 \nATOM   2411 O  O    . ASN M  1 155 ? 149.095 106.632 89.362 1.00 3.90  154 M 1 \nATOM   2412 C  CB   . ASN M  1 155 ? 146.035 107.938 88.833 1.00 3.90  154 M 1 \nATOM   2413 C  CG   . ASN M  1 155 ? 145.392 109.062 89.613 1.00 3.90  154 M 1 \nATOM   2414 O  OD1  . ASN M  1 155 ? 145.664 109.232 90.787 1.00 3.90  154 M 1 \nATOM   2415 N  ND2  . ASN M  1 155 ? 144.564 109.846 88.966 1.00 3.90  154 M 1 \nATOM   2416 H  H    . ASN M  1 155 ? 147.019 109.144 86.870 1.00 3.90  154 M 1 \nATOM   2417 H  HA   . ASN M  1 155 ? 147.833 108.687 89.416 1.00 3.90  154 M 1 \nATOM   2418 H  HB2  . ASN M  1 155 ? 
145.592 107.849 87.964 1.00 3.90  154 M 1 \nATOM   2419 H  HB3  . ASN M  1 155 ? 145.926 107.097 89.323 1.00 3.90  154 M 1 \nATOM   2420 H  HD21 . ASN M  1 155 ? 144.376 109.687 88.117 1.00 3.90  154 M 1 \nATOM   2421 H  HD22 . ASN M  1 155 ? 144.194 110.535 89.378 1.00 3.90  154 M 1 \nATOM   2422 N  N    . LEU M  1 156 ? 148.402 106.337 87.289 1.00 4.14  155 M 1 \nATOM   2423 C  CA   . LEU M  1 156 ? 149.191 105.131 87.050 1.00 4.14  155 M 1 \nATOM   2424 C  C    . LEU M  1 156 ? 150.684 105.404 87.191 1.00 4.14  155 M 1 \nATOM   2425 O  O    . LEU M  1 156 ? 151.413 104.605 87.787 1.00 4.14  155 M 1 \nATOM   2426 C  CB   . LEU M  1 156 ? 148.864 104.560 85.670 1.00 4.14  155 M 1 \nATOM   2427 C  CG   . LEU M  1 156 ? 147.513 103.856 85.526 1.00 4.14  155 M 1 \nATOM   2428 C  CD1  . LEU M  1 156 ? 147.157 103.593 84.075 1.00 4.14  155 M 1 \nATOM   2429 C  CD2  . LEU M  1 156 ? 147.544 102.535 86.278 1.00 4.14  155 M 1 \nATOM   2430 H  H    . LEU M  1 156 ? 147.967 106.623 86.605 1.00 4.14  155 M 1 \nATOM   2431 H  HA   . LEU M  1 156 ? 148.956 104.473 87.722 1.00 4.14  155 M 1 \nATOM   2432 H  HB2  . LEU M  1 156 ? 148.864 105.293 85.035 1.00 4.14  155 M 1 \nATOM   2433 H  HB3  . LEU M  1 156 ? 149.564 103.938 85.417 1.00 4.14  155 M 1 \nATOM   2434 H  HG   . LEU M  1 156 ? 146.815 104.402 85.921 1.00 4.14  155 M 1 \nATOM   2435 H  HD11 . LEU M  1 156 ? 146.301 103.139 84.044 1.00 4.14  155 M 1 \nATOM   2436 H  HD12 . LEU M  1 156 ? 147.092 104.435 83.598 1.00 4.14  155 M 1 \nATOM   2437 H  HD13 . LEU M  1 156 ? 147.842 103.039 83.669 1.00 4.14  155 M 1 \nATOM   2438 H  HD21 . LEU M  1 156 ? 146.739 102.033 86.079 1.00 4.14  155 M 1 \nATOM   2439 H  HD22 . LEU M  1 156 ? 148.323 102.036 85.987 1.00 4.14  155 M 1 \nATOM   2440 H  HD23 . LEU M  1 156 ? 147.597 102.688 87.234 1.00 4.14  155 M 1 \nATOM   2441 N  N    . ARG M  1 157 ? 151.130 106.511 86.611 1.00 4.62  156 M 1 \nATOM   2442 C  CA   . ARG M  1 157 ? 
152.566 106.885 86.712 1.00 4.62  156 M 1 \nATOM   2443 C  C    . ARG M  1 157 ? 152.921 107.087 88.185 1.00 4.62  156 M 1 \nATOM   2444 O  O    . ARG M  1 157 ? 153.909 106.536 88.619 1.00 4.62  156 M 1 \nATOM   2445 C  CB   . ARG M  1 157 ? 152.855 108.202 85.999 1.00 4.62  156 M 1 \nATOM   2446 C  CG   . ARG M  1 157 ? 152.830 108.083 84.492 1.00 4.62  156 M 1 \nATOM   2447 C  CD   . ARG M  1 157 ? 153.154 109.409 83.844 1.00 4.62  156 M 1 \nATOM   2448 N  NE   . ARG M  1 157 ? 153.240 109.244 82.412 1.00 4.62  156 M 1 \nATOM   2449 C  CZ   . ARG M  1 157 ? 152.921 110.186 81.543 1.00 4.62  156 M 1 \nATOM   2450 N  NH1  . ARG M  1 157 ? 152.486 111.355 81.979 1.00 4.62  156 M 1 \nATOM   2451 N  NH2  . ARG M  1 157 ? 153.027 109.953 80.247 1.00 4.62  156 M 1 \nATOM   2452 H  H    . ARG M  1 157 ? 150.642 107.005 86.024 1.00 4.62  156 M 1 \nATOM   2453 H  HA   . ARG M  1 157 ? 153.121 106.166 86.331 1.00 4.62  156 M 1 \nATOM   2454 H  HB2  . ARG M  1 157 ? 152.188 108.864 86.277 1.00 4.62  156 M 1 \nATOM   2455 H  HB3  . ARG M  1 157 ? 153.737 108.524 86.279 1.00 4.62  156 M 1 \nATOM   2456 H  HG2  . ARG M  1 157 ? 153.485 107.412 84.204 1.00 4.62  156 M 1 \nATOM   2457 H  HG3  . ARG M  1 157 ? 151.940 107.789 84.201 1.00 4.62  156 M 1 \nATOM   2458 H  HD2  . ARG M  1 157 ? 152.455 110.063 84.060 1.00 4.62  156 M 1 \nATOM   2459 H  HD3  . ARG M  1 157 ? 154.009 109.746 84.189 1.00 4.62  156 M 1 \nATOM   2460 H  HE   . ARG M  1 157 ? 153.523 108.480 82.102 1.00 4.62  156 M 1 \nATOM   2461 H  HH11 . ARG M  1 157 ? 152.417 111.503 82.842 1.00 4.62  156 M 1 \nATOM   2462 H  HH12 . ARG M  1 157 ? 152.272 111.983 81.403 1.00 4.62  156 M 1 \nATOM   2463 H  HH21 . ARG M  1 157 ? 153.315 109.170 79.965 1.00 4.62  156 M 1 \nATOM   2464 H  HH22 . ARG M  1 157 ? 152.811 110.582 79.670 1.00 4.62  156 M 1 \nATOM   2465 N  N    . LYS M  1 158 ? 152.072 107.791 88.925 1.00 5.18  157 M 1 \nATOM   2466 C  CA   . LYS M  1 158 ? 
152.305 108.139 90.355 1.00 5.18  157 M 1 \nATOM   2467 C  C    . LYS M  1 158 ? 152.363 106.858 91.193 1.00 5.18  157 M 1 \nATOM   2468 O  O    . LYS M  1 158 ? 153.242 106.774 92.033 1.00 5.18  157 M 1 \nATOM   2469 C  CB   . LYS M  1 158 ? 151.255 109.143 90.834 1.00 5.18  157 M 1 \nATOM   2470 C  CG   . LYS M  1 158 ? 151.459 110.545 90.277 1.00 5.18  157 M 1 \nATOM   2471 C  CD   . LYS M  1 158 ? 150.766 111.657 91.039 1.00 5.18  157 M 1 \nATOM   2472 C  CE   . LYS M  1 158 ? 151.182 113.041 90.582 1.00 5.18  157 M 1 \nATOM   2473 N  NZ   . LYS M  1 158 ? 152.590 113.343 90.962 1.00 5.18  157 M 1 \nATOM   2474 H  H    . LYS M  1 158 ? 151.240 108.010 88.630 1.00 5.18  157 M 1 \nATOM   2475 H  HA   . LYS M  1 158 ? 153.187 108.574 90.412 1.00 5.18  157 M 1 \nATOM   2476 H  HB2  . LYS M  1 158 ? 150.368 108.823 90.568 1.00 5.18  157 M 1 \nATOM   2477 H  HB3  . LYS M  1 158 ? 151.282 109.184 91.812 1.00 5.18  157 M 1 \nATOM   2478 H  HG2  . LYS M  1 158 ? 152.422 110.733 90.258 1.00 5.18  157 M 1 \nATOM   2479 H  HG3  . LYS M  1 158 ? 151.140 110.558 89.349 1.00 5.18  157 M 1 \nATOM   2480 H  HD2  . LYS M  1 158 ? 149.796 111.565 90.928 1.00 5.18  157 M 1 \nATOM   2481 H  HD3  . LYS M  1 158 ? 150.970 111.564 91.995 1.00 5.18  157 M 1 \nATOM   2482 H  HE2  . LYS M  1 158 ? 151.094 113.105 89.612 1.00 5.18  157 M 1 \nATOM   2483 H  HE3  . LYS M  1 158 ? 150.594 113.708 90.984 1.00 5.18  157 M 1 \nATOM   2484 H  HZ1  . LYS M  1 158 ? 152.792 114.199 90.737 1.00 5.18  157 M 1 \nATOM   2485 H  HZ2  . LYS M  1 158 ? 152.696 113.238 91.856 1.00 5.18  157 M 1 \nATOM   2486 H  HZ3  . LYS M  1 158 ? 153.153 112.781 90.528 1.00 5.18  157 M 1 \nATOM   2487 N  N    . MET M  1 159 ? 151.514 105.879 90.895 1.00 5.22  158 M 1 \nATOM   2488 C  CA   . MET M  1 159 ? 151.432 104.578 91.613 1.00 5.22  158 M 1 \nATOM   2489 C  C    . MET M  1 159 ? 152.658 103.713 91.315 1.00 5.22  158 M 1 \nATOM   2490 O  O    . MET M  1 159 ? 
152.825 102.725 91.997 1.00 5.22  158 M 1 \nATOM   2491 C  CB   . MET M  1 159 ? 150.172 103.809 91.228 1.00 5.22  158 M 1 \nATOM   2492 C  CG   . MET M  1 159 ? 148.916 104.469 91.735 1.00 5.22  158 M 1 \nATOM   2493 S  SD   . MET M  1 159 ? 147.452 103.782 90.930 1.00 5.22  158 M 1 \nATOM   2494 C  CE   . MET M  1 159 ? 147.174 102.347 91.968 1.00 5.22  158 M 1 \nATOM   2495 H  H    . MET M  1 159 ? 150.989 105.909 90.152 1.00 5.22  158 M 1 \nATOM   2496 H  HA   . MET M  1 159 ? 151.413 104.766 92.580 1.00 5.22  158 M 1 \nATOM   2497 H  HB2  . MET M  1 159 ? 150.128 103.739 90.254 1.00 5.22  158 M 1 \nATOM   2498 H  HB3  . MET M  1 159 ? 150.229 102.903 91.593 1.00 5.22  158 M 1 \nATOM   2499 H  HG2  . MET M  1 159 ? 148.843 104.335 92.704 1.00 5.22  158 M 1 \nATOM   2500 H  HG3  . MET M  1 159 ? 148.958 105.433 91.559 1.00 5.22  158 M 1 \nATOM   2501 H  HE1  . MET M  1 159 ? 146.343 101.926 91.717 1.00 5.22  158 M 1 \nATOM   2502 H  HE2  . MET M  1 159 ? 147.900 101.722 91.853 1.00 5.22  158 M 1 \nATOM   2503 H  HE3  . MET M  1 159 ? 147.129 102.623 92.891 1.00 5.22  158 M 1 \nATOM   2504 N  N    . GLY M  1 160 ? 153.447 104.059 90.305 1.00 6.11  159 M 1 \nATOM   2505 C  CA   . GLY M  1 160 ? 154.641 103.293 89.915 1.00 6.11  159 M 1 \nATOM   2506 C  C    . GLY M  1 160 ? 154.401 102.326 88.772 1.00 6.11  159 M 1 \nATOM   2507 O  O    . GLY M  1 160 ? 155.296 101.539 88.514 1.00 6.11  159 M 1 \nATOM   2508 H  H    . GLY M  1 160 ? 153.270 104.785 89.785 1.00 6.11  159 M 1 \nATOM   2509 H  HA2  . GLY M  1 160 ? 155.354 103.929 89.655 1.00 6.11  159 M 1 \nATOM   2510 H  HA3  . GLY M  1 160 ? 154.964 102.788 90.703 1.00 6.11  159 M 1 \nATOM   2511 N  N    . ALA M  1 161 ? 153.295 102.429 88.028 1.00 5.68  160 M 1 \nATOM   2512 C  CA   . ALA M  1 161 ? 153.010 101.513 86.900 1.00 5.68  160 M 1 \nATOM   2513 C  C    . ALA M  1 161 ? 154.054 101.713 85.779 1.00 5.68  160 M 1 \nATOM   2514 O  O    . ALA M  1 161 ? 
154.506 102.844 85.635 1.00 5.68  160 M 1 \nATOM   2515 C  CB   . ALA M  1 161 ? 151.618 101.684 86.356 1.00 5.68  160 M 1 \nATOM   2516 H  H    . ALA M  1 161 ? 152.714 103.128 88.073 1.00 5.68  160 M 1 \nATOM   2517 H  HA   . ALA M  1 161 ? 153.078 100.613 87.280 1.00 5.68  160 M 1 \nATOM   2518 H  HB1  . ALA M  1 161 ? 151.477 101.064 85.620 1.00 5.68  160 M 1 \nATOM   2519 H  HB2  . ALA M  1 161 ? 150.970 101.504 87.058 1.00 5.68  160 M 1 \nATOM   2520 H  HB3  . ALA M  1 161 ? 151.503 102.595 86.037 1.00 5.68  160 M 1 \nATOM   2521 N  N    . PRO M  1 162 ? 154.409 100.749 84.886 1.00 7.28  161 M 1 \nATOM   2522 C  CA   . PRO M  1 162 ? 154.085 99.312  84.954 1.00 7.28  161 M 1 \nATOM   2523 C  C    . PRO M  1 162 ? 154.971 98.516  85.926 1.00 7.28  161 M 1 \nATOM   2524 O  O    . PRO M  1 162 ? 154.581 97.457  86.342 1.00 7.28  161 M 1 \nATOM   2525 C  CB   . PRO M  1 162 ? 154.330 98.822  83.521 1.00 7.28  161 M 1 \nATOM   2526 C  CG   . PRO M  1 162 ? 155.490 99.653  83.076 1.00 7.28  161 M 1 \nATOM   2527 C  CD   . PRO M  1 162 ? 155.248 101.006 83.709 1.00 7.28  161 M 1 \nATOM   2528 H  HA   . PRO M  1 162 ? 153.129 99.190  85.181 1.00 7.28  161 M 1 \nATOM   2529 H  HB2  . PRO M  1 162 ? 154.554 97.867  83.506 1.00 7.28  161 M 1 \nATOM   2530 H  HB3  . PRO M  1 162 ? 153.546 98.977  82.953 1.00 7.28  161 M 1 \nATOM   2531 H  HG2  . PRO M  1 162 ? 156.335 99.269  83.388 1.00 7.28  161 M 1 \nATOM   2532 H  HG3  . PRO M  1 162 ? 155.514 99.725  82.100 1.00 7.28  161 M 1 \nATOM   2533 H  HD2  . PRO M  1 162 ? 156.091 101.420 83.972 1.00 7.28  161 M 1 \nATOM   2534 H  HD3  . PRO M  1 162 ? 154.791 101.601 83.086 1.00 7.28  161 M 1 \nATOM   2535 N  N    . GLU M  1 163 ? 156.116 99.069  86.313 1.00 9.11  162 M 1 \nATOM   2536 C  CA   . GLU M  1 163 ? 157.116 98.359  87.156 1.00 9.11  162 M 1 \nATOM   2537 C  C    . GLU M  1 163 ? 156.554 97.984  88.534 1.00 9.11  162 M 1 \nATOM   2538 O  O    . GLU M  1 163 ? 
156.810 96.847  88.932 1.00 9.11  162 M 1 \nATOM   2539 C  CB   . GLU M  1 163 ? 158.407 99.172  87.161 1.00 9.11  162 M 1 \nATOM   2540 C  CG   . GLU M  1 163 ? 158.962 99.335  85.753 1.00 9.11  162 M 1 \nATOM   2541 C  CD   . GLU M  1 163 ? 159.605 98.072  85.199 1.00 9.11  162 M 1 \nATOM   2542 O  OE1  . GLU M  1 163 ? 160.214 97.338  85.995 1.00 9.11  162 M 1 \nATOM   2543 O  OE2  . GLU M  1 163 ? 159.535 97.834  83.968 1.00 9.11  162 M 1 \nATOM   2544 H  H    . GLU M  1 163 ? 156.311 99.945  86.185 1.00 9.11  162 M 1 \nATOM   2545 H  HA   . GLU M  1 163 ? 157.316 97.512  86.695 1.00 9.11  162 M 1 \nATOM   2546 H  HB2  . GLU M  1 163 ? 158.228 100.055 87.545 1.00 9.11  162 M 1 \nATOM   2547 H  HB3  . GLU M  1 163 ? 159.070 98.718  87.722 1.00 9.11  162 M 1 \nATOM   2548 H  HG2  . GLU M  1 163 ? 158.236 99.605  85.151 1.00 9.11  162 M 1 \nATOM   2549 H  HG3  . GLU M  1 163 ? 159.631 100.052 85.753 1.00 9.11  162 M 1 \nATOM   2550 N  N    . ALA M  1 164 ? 155.776 98.815  89.227 1.00 7.30  163 M 1 \nATOM   2551 C  CA   . ALA M  1 164 ? 155.234 98.411  90.546 1.00 7.30  163 M 1 \nATOM   2552 C  C    . ALA M  1 164 ? 154.122 97.408  90.223 1.00 7.30  163 M 1 \nATOM   2553 O  O    . ALA M  1 164 ? 153.116 97.838  89.664 1.00 7.30  163 M 1 \nATOM   2554 C  CB   . ALA M  1 164 ? 154.740 99.593  91.340 1.00 7.30  163 M 1 \nATOM   2555 H  H    . ALA M  1 164 ? 155.409 99.570  88.902 1.00 7.30  163 M 1 \nATOM   2556 H  HA   . ALA M  1 164 ? 155.952 97.964  91.051 1.00 7.30  163 M 1 \nATOM   2557 H  HB1  . ALA M  1 164 ? 154.393 99.288  92.195 1.00 7.30  163 M 1 \nATOM   2558 H  HB2  . ALA M  1 164 ? 155.473 100.212 91.492 1.00 7.30  163 M 1 \nATOM   2559 H  HB3  . ALA M  1 164 ? 154.034 100.043 90.847 1.00 7.30  163 M 1 \nATOM   2560 N  N    . GLY M  1 165 ? 154.236 96.151  90.658 1.00 6.92  164 M 1 \nATOM   2561 C  CA   . GLY M  1 165 ? 153.314 95.083  90.241 1.00 6.92  164 M 1 \nATOM   2562 C  C    . GLY M  1 165 ? 
151.868 95.338  90.628 1.00 6.92  164 M 1 \nATOM   2563 O  O    . GLY M  1 165 ? 151.010 95.167  89.782 1.00 6.92  164 M 1 \nATOM   2564 H  H    . GLY M  1 165 ? 154.779 95.909  91.347 1.00 6.92  164 M 1 \nATOM   2565 H  HA2  . GLY M  1 165 ? 153.372 94.981  89.258 1.00 6.92  164 M 1 \nATOM   2566 H  HA3  . GLY M  1 165 ? 153.612 94.231  90.648 1.00 6.92  164 M 1 \nATOM   2567 N  N    . MET M  1 166 ? 151.605 95.837  91.826 1.00 5.59  165 M 1 \nATOM   2568 C  CA   . MET M  1 166 ? 150.221 96.059  92.311 1.00 5.59  165 M 1 \nATOM   2569 C  C    . MET M  1 166 ? 149.565 97.323  91.718 1.00 5.59  165 M 1 \nATOM   2570 O  O    . MET M  1 166 ? 148.351 97.431  91.853 1.00 5.59  165 M 1 \nATOM   2571 C  CB   . MET M  1 166 ? 150.183 96.094  93.844 1.00 5.59  165 M 1 \nATOM   2572 C  CG   . MET M  1 166 ? 149.711 94.770  94.463 1.00 5.59  165 M 1 \nATOM   2573 S  SD   . MET M  1 166 ? 150.210 94.519  96.182 1.00 5.59  165 M 1 \nATOM   2574 C  CE   . MET M  1 166 ? 150.247 96.218  96.745 1.00 5.59  165 M 1 \nATOM   2575 H  H    . MET M  1 166 ? 152.252 96.152  92.384 1.00 5.59  165 M 1 \nATOM   2576 H  HA   . MET M  1 166 ? 149.687 95.288  92.011 1.00 5.59  165 M 1 \nATOM   2577 H  HB2  . MET M  1 166 ? 151.079 96.301  94.177 1.00 5.59  165 M 1 \nATOM   2578 H  HB3  . MET M  1 166 ? 149.584 96.812  94.130 1.00 5.59  165 M 1 \nATOM   2579 H  HG2  . MET M  1 166 ? 148.732 94.732  94.416 1.00 5.59  165 M 1 \nATOM   2580 H  HG3  . MET M  1 166 ? 150.062 94.028  93.926 1.00 5.59  165 M 1 \nATOM   2581 H  HE1  . MET M  1 166 ? 149.345 96.557  96.802 1.00 5.59  165 M 1 \nATOM   2582 H  HE2  . MET M  1 166 ? 150.662 96.258  97.616 1.00 5.59  165 M 1 \nATOM   2583 H  HE3  . MET M  1 166 ? 150.754 96.752  96.122 1.00 5.59  165 M 1 \nATOM   2584 N  N    . ALA M  1 167 ? 150.296 98.233  91.066 1.00 5.07  166 M 1 \nATOM   2585 C  CA   . ALA M  1 167 ? 149.727 99.509  90.580 1.00 5.07  166 M 1 \nATOM   2586 C  C    . ALA M  1 167 ? 
148.602 99.286  89.562 1.00 5.07  166 M 1 \nATOM   2587 O  O    . ALA M  1 167 ? 147.510 99.735  89.842 1.00 5.07  166 M 1 \nATOM   2588 C  CB   . ALA M  1 167 ? 150.817 100.366 89.972 1.00 5.07  166 M 1 \nATOM   2589 H  H    . ALA M  1 167 ? 151.155 98.122  90.809 1.00 5.07  166 M 1 \nATOM   2590 H  HA   . ALA M  1 167 ? 149.348 99.989  91.353 1.00 5.07  166 M 1 \nATOM   2591 H  HB1  . ALA M  1 167 ? 150.435 101.202 89.655 1.00 5.07  166 M 1 \nATOM   2592 H  HB2  . ALA M  1 167 ? 151.494 100.556 90.643 1.00 5.07  166 M 1 \nATOM   2593 H  HB3  . ALA M  1 167 ? 151.224 99.894  89.227 1.00 5.07  166 M 1 \nATOM   2594 N  N    . GLU M  1 168 ? 148.815 98.511  88.504 1.00 4.44  167 M 1 \nATOM   2595 C  CA   . GLU M  1 168 ? 147.748 98.325  87.474 1.00 4.44  167 M 1 \nATOM   2596 C  C    . GLU M  1 168 ? 146.605 97.530  88.114 1.00 4.44  167 M 1 \nATOM   2597 O  O    . GLU M  1 168 ? 145.468 97.850  87.878 1.00 4.44  167 M 1 \nATOM   2598 C  CB   . GLU M  1 168 ? 148.344 97.782  86.175 1.00 4.44  167 M 1 \nATOM   2599 C  CG   . GLU M  1 168 ? 149.229 98.839  85.535 1.00 4.44  167 M 1 \nATOM   2600 C  CD   . GLU M  1 168 ? 149.720 98.632  84.117 1.00 4.44  167 M 1 \nATOM   2601 O  OE1  . GLU M  1 168 ? 149.618 97.495  83.616 1.00 4.44  167 M 1 \nATOM   2602 O  OE2  . GLU M  1 168 ? 150.234 99.621  83.538 1.00 4.44  167 M 1 \nATOM   2603 H  H    . GLU M  1 168 ? 149.551 97.986  88.400 1.00 4.44  167 M 1 \nATOM   2604 H  HA   . GLU M  1 168 ? 147.392 99.221  87.272 1.00 4.44  167 M 1 \nATOM   2605 H  HB2  . GLU M  1 168 ? 148.872 96.980  86.369 1.00 4.44  167 M 1 \nATOM   2606 H  HB3  . GLU M  1 168 ? 147.619 97.540  85.561 1.00 4.44  167 M 1 \nATOM   2607 H  HG2  . GLU M  1 168 ? 148.743 99.691  85.554 1.00 4.44  167 M 1 \nATOM   2608 H  HG3  . GLU M  1 168 ? 150.020 98.955  86.104 1.00 4.44  167 M 1 \nATOM   2609 N  N    . TYR M  1 169 ? 146.921 96.577  88.980 1.00 4.01  168 M 1 \nATOM   2610 C  CA   . TYR M  1 169 ? 
145.892 95.728  89.630 1.00 4.01  168 M 1 \nATOM   2611 C  C    . TYR M  1 169 ? 144.938 96.568  90.492 1.00 4.01  168 M 1 \nATOM   2612 O  O    . TYR M  1 169 ? 143.761 96.423  90.331 1.00 4.01  168 M 1 \nATOM   2613 C  CB   . TYR M  1 169 ? 146.555 94.628  90.464 1.00 4.01  168 M 1 \nATOM   2614 C  CG   . TYR M  1 169 ? 145.550 93.777  91.191 1.00 4.01  168 M 1 \nATOM   2615 C  CD1  . TYR M  1 169 ? 144.937 92.700  90.566 1.00 4.01  168 M 1 \nATOM   2616 C  CD2  . TYR M  1 169 ? 145.160 94.088  92.479 1.00 4.01  168 M 1 \nATOM   2617 C  CE1  . TYR M  1 169 ? 143.997 91.924  91.224 1.00 4.01  168 M 1 \nATOM   2618 C  CE2  . TYR M  1 169 ? 144.243 93.310  93.161 1.00 4.01  168 M 1 \nATOM   2619 C  CZ   . TYR M  1 169 ? 143.646 92.236  92.524 1.00 4.01  168 M 1 \nATOM   2620 O  OH   . TYR M  1 169 ? 142.716 91.496  93.177 1.00 4.01  168 M 1 \nATOM   2621 H  H    . TYR M  1 169 ? 147.751 96.468  89.336 1.00 4.01  168 M 1 \nATOM   2622 H  HA   . TYR M  1 169 ? 145.357 95.295  88.917 1.00 4.01  168 M 1 \nATOM   2623 H  HB2  . TYR M  1 169 ? 147.091 94.061  89.871 1.00 4.01  168 M 1 \nATOM   2624 H  HB3  . TYR M  1 169 ? 147.158 95.045  91.115 1.00 4.01  168 M 1 \nATOM   2625 H  HD1  . TYR M  1 169 ? 145.176 92.483  89.680 1.00 4.01  168 M 1 \nATOM   2626 H  HD2  . TYR M  1 169 ? 145.567 94.814  92.922 1.00 4.01  168 M 1 \nATOM   2627 H  HE1  . TYR M  1 169 ? 143.597 91.189  90.788 1.00 4.01  168 M 1 \nATOM   2628 H  HE2  . TYR M  1 169 ? 143.994 93.534  94.042 1.00 4.01  168 M 1 \nATOM   2629 H  HH   . TYR M  1 169 ? 142.054 91.991  93.406 1.00 4.01  168 M 1 \nATOM   2630 N  N    . LEU M  1 170 ? 145.441 97.487  91.311 1.00 4.13  169 M 1 \nATOM   2631 C  CA   . LEU M  1 170 ? 144.616 98.274  92.218 1.00 4.13  169 M 1 \nATOM   2632 C  C    . LEU M  1 170 ? 143.909 99.399  91.476 1.00 4.13  169 M 1 \nATOM   2633 O  O    . LEU M  1 170 ? 142.798 99.792  91.845 1.00 4.13  169 M 1 \nATOM   2634 C  CB   . LEU M  1 170 ? 
145.469 98.813  93.366 1.00 4.13  169 M 1 \nATOM   2635 C  CG   . LEU M  1 170 ? 146.030 97.767  94.341 1.00 4.13  169 M 1 \nATOM   2636 C  CD1  . LEU M  1 170 ? 146.951 98.399  95.361 1.00 4.13  169 M 1 \nATOM   2637 C  CD2  . LEU M  1 170 ? 144.904 97.009  95.034 1.00 4.13  169 M 1 \nATOM   2638 H  H    . LEU M  1 170 ? 146.286 97.642  91.355 1.00 4.13  169 M 1 \nATOM   2639 H  HA   . LEU M  1 170 ? 143.922 97.699  92.576 1.00 4.13  169 M 1 \nATOM   2640 H  HB2  . LEU M  1 170 ? 146.226 99.287  92.988 1.00 4.13  169 M 1 \nATOM   2641 H  HB3  . LEU M  1 170 ? 144.932 99.435  93.881 1.00 4.13  169 M 1 \nATOM   2642 H  HG   . LEU M  1 170 ? 146.553 97.119  93.843 1.00 4.13  169 M 1 \nATOM   2643 H  HD11 . LEU M  1 170 ? 147.356 97.694  95.890 1.00 4.13  169 M 1 \nATOM   2644 H  HD12 . LEU M  1 170 ? 147.644 98.911  94.915 1.00 4.13  169 M 1 \nATOM   2645 H  HD13 . LEU M  1 170 ? 146.426 98.981  95.933 1.00 4.13  169 M 1 \nATOM   2646 H  HD21 . LEU M  1 170 ? 145.268 96.464  95.749 1.00 4.13  169 M 1 \nATOM   2647 H  HD22 . LEU M  1 170 ? 144.268 97.648  95.391 1.00 4.13  169 M 1 \nATOM   2648 H  HD23 . LEU M  1 170 ? 144.460 96.432  94.393 1.00 4.13  169 M 1 \nATOM   2649 N  N    . PHE M  1 171 ? 144.530 99.912  90.419 1.00 3.79  170 M 1 \nATOM   2650 C  CA   . PHE M  1 171 ? 143.872 100.895 89.568 1.00 3.79  170 M 1 \nATOM   2651 C  C    . PHE M  1 171 ? 142.682 100.273 88.847 1.00 3.79  170 M 1 \nATOM   2652 O  O    . PHE M  1 171 ? 141.621 100.894 88.730 1.00 3.79  170 M 1 \nATOM   2653 C  CB   . PHE M  1 171 ? 144.874 101.442 88.562 1.00 3.79  170 M 1 \nATOM   2654 C  CG   . PHE M  1 171 ? 144.340 102.550 87.735 1.00 3.79  170 M 1 \nATOM   2655 C  CD1  . PHE M  1 171 ? 144.342 103.846 88.205 1.00 3.79  170 M 1 \nATOM   2656 C  CD2  . PHE M  1 171 ? 143.774 102.294 86.510 1.00 3.79  170 M 1 \nATOM   2657 C  CE1  . PHE M  1 171 ? 143.840 104.856 87.442 1.00 3.79  170 M 1 \nATOM   2658 C  CE2  . PHE M  1 171 ? 
143.267 103.300 85.759 1.00 3.79  170 M 1 \nATOM   2659 C  CZ   . PHE M  1 171 ? 143.300 104.576 86.223 1.00 3.79  170 M 1 \nATOM   2660 H  H    . PHE M  1 171 ? 145.328 99.706  90.173 1.00 3.79  170 M 1 \nATOM   2661 H  HA   . PHE M  1 171 ? 143.555 101.638 90.105 1.00 3.79  170 M 1 \nATOM   2662 H  HB2  . PHE M  1 171 ? 145.651 101.772 89.040 1.00 3.79  170 M 1 \nATOM   2663 H  HB3  . PHE M  1 171 ? 145.148 100.727 87.967 1.00 3.79  170 M 1 \nATOM   2664 H  HD1  . PHE M  1 171 ? 144.718 104.044 89.032 1.00 3.79  170 M 1 \nATOM   2665 H  HD2  . PHE M  1 171 ? 143.749 101.423 86.186 1.00 3.79  170 M 1 \nATOM   2666 H  HE1  . PHE M  1 171 ? 143.856 105.730 87.758 1.00 3.79  170 M 1 \nATOM   2667 H  HE2  . PHE M  1 171 ? 142.897 103.113 84.927 1.00 3.79  170 M 1 \nATOM   2668 H  HZ   . PHE M  1 171 ? 142.954 105.265 85.703 1.00 3.79  170 M 1 \nATOM   2669 N  N    . ASP M  1 172 ? 142.886 99.054  88.392 1.00 4.02  171 M 1 \nATOM   2670 C  CA   . ASP M  1 172 ? 141.806 98.292  87.727 1.00 4.02  171 M 1 \nATOM   2671 C  C    . ASP M  1 172 ? 140.659 98.138  88.738 1.00 4.02  171 M 1 \nATOM   2672 O  O    . ASP M  1 172 ? 139.533 98.351  88.327 1.00 4.02  171 M 1 \nATOM   2673 C  CB   . ASP M  1 172 ? 142.330 96.951  87.193 1.00 4.02  171 M 1 \nATOM   2674 C  CG   . ASP M  1 172 ? 141.273 96.045  86.572 1.00 4.02  171 M 1 \nATOM   2675 O  OD1  . ASP M  1 172 ? 140.506 95.464  87.323 1.00 4.02  171 M 1 \nATOM   2676 O  OD2  . ASP M  1 172 ? 141.246 95.911  85.334 1.00 4.02  171 M 1 \nATOM   2677 H  H    . ASP M  1 172 ? 143.713 98.680  88.321 1.00 4.02  171 M 1 \nATOM   2678 H  HA   . ASP M  1 172 ? 141.480 98.822  86.962 1.00 4.02  171 M 1 \nATOM   2679 H  HB2  . ASP M  1 172 ? 143.014 97.129  86.515 1.00 4.02  171 M 1 \nATOM   2680 H  HB3  . ASP M  1 172 ? 142.753 96.464  87.929 1.00 4.02  171 M 1 \nATOM   2681 N  N    . LYS M  1 173 ? 140.916 97.846  90.025 1.00 4.18  172 M 1 \nATOM   2682 C  CA   . LYS M  1 173 ? 
139.818 97.616  90.960 1.00 4.18  172 M 1 \nATOM   2683 C  C    . LYS M  1 173 ? 139.128 98.913  91.381 1.00 4.18  172 M 1 \nATOM   2684 O  O    . LYS M  1 173 ? 137.897 98.991  91.389 1.00 4.18  172 M 1 \nATOM   2685 C  CB   . LYS M  1 173 ? 140.325 96.848  92.179 1.00 4.18  172 M 1 \nATOM   2686 C  CG   . LYS M  1 173 ? 140.865 95.460  91.866 1.00 4.18  172 M 1 \nATOM   2687 C  CD   . LYS M  1 173 ? 139.777 94.534  91.328 1.00 4.18  172 M 1 \nATOM   2688 C  CE   . LYS M  1 173 ? 140.229 93.101  91.153 1.00 4.18  172 M 1 \nATOM   2689 N  NZ   . LYS M  1 173 ? 139.141 92.269  90.574 1.00 4.18  172 M 1 \nATOM   2690 H  H    . LYS M  1 173 ? 141.708 97.794  90.356 1.00 4.18  172 M 1 \nATOM   2691 H  HA   . LYS M  1 173 ? 139.134 97.087  90.521 1.00 4.18  172 M 1 \nATOM   2692 H  HB2  . LYS M  1 173 ? 141.048 97.352  92.584 1.00 4.18  172 M 1 \nATOM   2693 H  HB3  . LYS M  1 173 ? 139.597 96.747  92.812 1.00 4.18  172 M 1 \nATOM   2694 H  HG2  . LYS M  1 173 ? 141.556 95.531  91.189 1.00 4.18  172 M 1 \nATOM   2695 H  HG3  . LYS M  1 173 ? 141.237 95.075  92.675 1.00 4.18  172 M 1 \nATOM   2696 H  HD2  . LYS M  1 173 ? 139.010 94.546  91.921 1.00 4.18  172 M 1 \nATOM   2697 H  HD3  . LYS M  1 173 ? 139.524 94.850  90.446 1.00 4.18  172 M 1 \nATOM   2698 H  HE2  . LYS M  1 173 ? 140.984 93.064  90.545 1.00 4.18  172 M 1 \nATOM   2699 H  HE3  . LYS M  1 173 ? 140.476 92.729  92.014 1.00 4.18  172 M 1 \nATOM   2700 H  HZ1  . LYS M  1 173 ? 139.354 91.406  90.625 1.00 4.18  172 M 1 \nATOM   2701 H  HZ2  . LYS M  1 173 ? 138.377 92.403  91.010 1.00 4.18  172 M 1 \nATOM   2702 H  HZ3  . LYS M  1 173 ? 139.022 92.484  89.719 1.00 4.18  172 M 1 \nATOM   2703 N  N    . HIS M  1 174 ? 139.898 99.937  91.734 1.00 4.28  173 M 1 \nATOM   2704 C  CA   . HIS M  1 174 ? 139.326 101.141 92.340 1.00 4.28  173 M 1 \nATOM   2705 C  C    . HIS M  1 174 ? 138.808 102.130 91.299 1.00 4.28  173 M 1 \nATOM   2706 O  O    . HIS M  1 174 ? 
137.635 102.510 91.318 1.00 4.28  173 M 1 \nATOM   2707 C  CB   . HIS M  1 174 ? 140.365 101.793 93.254 1.00 4.28  173 M 1 \nATOM   2708 C  CG   . HIS M  1 174 ? 140.680 100.984 94.467 1.00 4.28  173 M 1 \nATOM   2709 N  ND1  . HIS M  1 174 ? 139.808 100.871 95.527 1.00 4.28  173 M 1 \nATOM   2710 C  CD2  . HIS M  1 174 ? 141.767 100.251 94.792 1.00 4.28  173 M 1 \nATOM   2711 C  CE1  . HIS M  1 174 ? 140.345 100.097 96.451 1.00 4.28  173 M 1 \nATOM   2712 N  NE2  . HIS M  1 174 ? 141.533 99.709  96.031 1.00 4.28  173 M 1 \nATOM   2713 H  H    . HIS M  1 174 ? 140.752 99.957  91.635 1.00 4.28  173 M 1 \nATOM   2714 H  HA   . HIS M  1 174 ? 138.576 100.895 92.904 1.00 4.28  173 M 1 \nATOM   2715 H  HB2  . HIS M  1 174 ? 141.193 101.898 92.761 1.00 4.28  173 M 1 \nATOM   2716 H  HB3  . HIS M  1 174 ? 140.046 102.661 93.547 1.00 4.28  173 M 1 \nATOM   2717 H  HD2  . HIS M  1 174 ? 142.533 100.137 94.277 1.00 4.28  173 M 1 \nATOM   2718 H  HE1  . HIS M  1 174 ? 139.951 99.866  97.261 1.00 4.28  173 M 1 \nATOM   2719 H  HE2  . HIS M  1 174 ? 142.076 99.200  96.462 1.00 4.28  173 M 1 \nATOM   2720 N  N    . THR M  1 175 ? 139.668 102.559 90.381 1.00 3.92  174 M 1 \nATOM   2721 C  CA   . THR M  1 175 ? 139.281 103.609 89.443 1.00 3.92  174 M 1 \nATOM   2722 C  C    . THR M  1 175 ? 138.388 103.072 88.331 1.00 3.92  174 M 1 \nATOM   2723 O  O    . THR M  1 175 ? 137.333 103.648 88.043 1.00 3.92  174 M 1 \nATOM   2724 C  CB   . THR M  1 175 ? 140.529 104.288 88.884 1.00 3.92  174 M 1 \nATOM   2725 O  OG1  . THR M  1 175 ? 141.222 104.932 89.958 1.00 3.92  174 M 1 \nATOM   2726 C  CG2  . THR M  1 175 ? 140.176 105.309 87.815 1.00 3.92  174 M 1 \nATOM   2727 H  H    . THR M  1 175 ? 140.472 102.269 90.290 1.00 3.92  174 M 1 \nATOM   2728 H  HA   . THR M  1 175 ? 138.774 104.287 89.917 1.00 3.92  174 M 1 \nATOM   2729 H  HB   . THR M  1 175 ? 141.117 103.628 88.485 1.00 3.92  174 M 1 \nATOM   2730 H  HG1  . THR M  1 175 ? 
141.349 105.742 89.774 1.00 3.92  174 M 1 \nATOM   2731 H  HG21 . THR M  1 175 ? 140.922 105.911 87.670 1.00 3.92  174 M 1 \nATOM   2732 H  HG22 . THR M  1 175 ? 139.977 104.866 86.975 1.00 3.92  174 M 1 \nATOM   2733 H  HG23 . THR M  1 175 ? 139.402 105.826 88.086 1.00 3.92  174 M 1 \nATOM   2734 N  N    . LEU M  1 176 ? 138.787 101.981 87.690 1.00 3.89  175 M 1 \nATOM   2735 C  CA   . LEU M  1 176 ? 138.029 101.435 86.571 1.00 3.89  175 M 1 \nATOM   2736 C  C    . LEU M  1 176 ? 137.001 100.390 86.986 1.00 3.89  175 M 1 \nATOM   2737 O  O    . LEU M  1 176 ? 136.269 99.897  86.125 1.00 3.89  175 M 1 \nATOM   2738 C  CB   . LEU M  1 176 ? 138.981 100.835 85.536 1.00 3.89  175 M 1 \nATOM   2739 C  CG   . LEU M  1 176 ? 139.949 101.826 84.877 1.00 3.89  175 M 1 \nATOM   2740 C  CD1  . LEU M  1 176 ? 140.858 101.121 83.920 1.00 3.89  175 M 1 \nATOM   2741 C  CD2  . LEU M  1 176 ? 139.256 102.990 84.197 1.00 3.89  175 M 1 \nATOM   2742 H  H    . LEU M  1 176 ? 139.499 101.538 87.883 1.00 3.89  175 M 1 \nATOM   2743 H  HA   . LEU M  1 176 ? 137.528 102.142 86.135 1.00 3.89  175 M 1 \nATOM   2744 H  HB2  . LEU M  1 176 ? 139.518 100.161 85.981 1.00 3.89  175 M 1 \nATOM   2745 H  HB3  . LEU M  1 176 ? 138.456 100.406 84.843 1.00 3.89  175 M 1 \nATOM   2746 H  HG   . LEU M  1 176 ? 140.518 102.192 85.573 1.00 3.89  175 M 1 \nATOM   2747 H  HD11 . LEU M  1 176 ? 140.996 101.648 83.117 1.00 3.89  175 M 1 \nATOM   2748 H  HD12 . LEU M  1 176 ? 141.711 100.998 84.365 1.00 3.89  175 M 1 \nATOM   2749 H  HD13 . LEU M  1 176 ? 140.472 100.264 83.679 1.00 3.89  175 M 1 \nATOM   2750 H  HD21 . LEU M  1 176 ? 139.918 103.538 83.747 1.00 3.89  175 M 1 \nATOM   2751 H  HD22 . LEU M  1 176 ? 138.608 102.648 83.562 1.00 3.89  175 M 1 \nATOM   2752 H  HD23 . LEU M  1 176 ? 138.811 103.528 84.870 1.00 3.89  175 M 1 \nATOM   2753 N  N    . GLY M  1 177 ? 136.922 100.050 88.265 1.00 4.79  176 M 1 \nATOM   2754 C  CA   . GLY M  1 177 ? 
135.933 99.110  88.758 1.00 4.79  176 M 1 \nATOM   2755 C  C    . GLY M  1 177 ? 134.724 99.796  89.358 1.00 4.79  176 M 1 \nATOM   2756 O  O    . GLY M  1 177 ? 134.403 100.926 88.999 1.00 4.79  176 M 1 \nATOM   2757 H  H    . GLY M  1 177 ? 137.440 100.352 88.881 1.00 4.79  176 M 1 \nATOM   2758 H  HA2  . GLY M  1 177 ? 135.628 98.522  88.049 1.00 4.79  176 M 1 \nATOM   2759 H  HA3  . GLY M  1 177 ? 136.344 98.561  89.444 1.00 4.79  176 M 1 \nHETATM 2760 ZN ZN   . ZN  PA 3 .   ? 134.712 110.111 68.601 1.00 16.76 201 M 1 \n#\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/pdb_mmcif/6ydw.cif",
    "content": "data_6YDW\n#\n_entry.id 6YDW\n#\nloop_\n_chem_comp.formula\n_chem_comp.formula_weight\n_chem_comp.id\n_chem_comp.mon_nstd_flag\n_chem_comp.name\n_chem_comp.pdbx_synonyms\n_chem_comp.type\n\"C10 H14 N5 O8 P\"   363.221 5GP . \"GUANOSINE-5'-MONOPHOSPHATE\"                  ? non-polymer         \n\"C10 H14 N5 O7 P\"   347.221 A   y \"ADENOSINE-5'-MONOPHOSPHATE\"                  ? \"RNA linking\"       \n\"C3 H7 N O2\"        89.093  ALA y ALANINE                                       ? \"L-peptide linking\" \n\"C6 H15 N4 O2 1\"    175.209 ARG y ARGININE                                      ? \"L-peptide linking\" \n\"C4 H8 N2 O3\"       132.118 ASN y ASPARAGINE                                    ? \"L-peptide linking\" \n\"C4 H7 N O4\"        133.103 ASP y \"ASPARTIC ACID\"                               ? \"L-peptide linking\" \n\"C9 H14 N3 O8 P\"    323.197 C   y \"CYTIDINE-5'-MONOPHOSPHATE\"                   ? \"RNA linking\"       \n\"C3 H7 N O2 S\"      121.158 CYS y CYSTEINE                                      ? \"L-peptide linking\" \n\"C6 H11 N O3 S\"     177.221 FME n N-FORMYLMETHIONINE                            ? \"L-peptide linking\" \n\"C10 H14 N5 O8 P\"   363.221 G   y \"GUANOSINE-5'-MONOPHOSPHATE\"                  ? \"RNA linking\"       \n\"C5 H10 N2 O3\"      146.144 GLN y GLUTAMINE                                     ? \"L-peptide linking\" \n\"C5 H9 N O4\"        147.129 GLU y \"GLUTAMIC ACID\"                               ? \"L-peptide linking\" \n\"C2 H5 N O2\"        75.067  GLY y GLYCINE                                       ? \"peptide linking\"   \n\"C10 H17 N6 O13 P3\" 522.196 GNP . \"PHOSPHOAMINOPHOSPHONIC ACID-GUANYLATE ESTER\" ? non-polymer         \n\"C10 H16 N5 O14 P3\" 523.180 GTP n \"GUANOSINE-5'-TRIPHOSPHATE\"                   ? non-polymer         \n\"C6 H10 N3 O2 1\"    156.162 HIS y HISTIDINE                                     ? \"L-peptide linking\" \n\"H2 O\"              18.015  HOH . 
WATER                                         ? non-polymer         \n\"C6 H13 N O2\"       131.173 ILE y ISOLEUCINE                                    ? \"L-peptide linking\" \n\"C6 H13 N O2\"       131.173 LEU y LEUCINE                                       ? \"L-peptide linking\" \n\"C6 H15 N2 O2 1\"    147.195 LYS y LYSINE                                        ? \"L-peptide linking\" \n\"C5 H11 N O2 S\"     149.211 MET y METHIONINE                                    ? \"L-peptide linking\" \n\"Mg 2\"              24.305  MG  . \"MAGNESIUM ION\"                               ? non-polymer         \n\"C9 H11 N O2\"       165.189 PHE y PHENYLALANINE                                 ? \"L-peptide linking\" \n\"C5 H9 N O2\"        115.130 PRO y PROLINE                                       ? \"L-peptide linking\" \n\"C3 H7 N O3\"        105.093 SER y SERINE                                        ? \"L-peptide linking\" \n\"C10 H26 N4\"        202.340 SPM . SPERMINE                                      ? non-polymer         \n\"C4 H9 N O3\"        119.119 THR y THREONINE                                     ? \"L-peptide linking\" \n\"C11 H12 N2 O2\"     204.225 TRP y TRYPTOPHAN                                    ? \"L-peptide linking\" \n\"C9 H11 N O3\"       181.189 TYR y TYROSINE                                      ? \"L-peptide linking\" \n\"C9 H13 N2 O9 P\"    324.181 U   y \"URIDINE-5'-MONOPHOSPHATE\"                    ? \"RNA linking\"       \n\"C4 H9 N O2\"        103.120 UNK . UNKNOWN                                       ? \"L-peptide linking\" \n\"C5 H11 N O2\"       117.146 VAL y VALINE                                        ? \"L-peptide linking\" \n\"Zn 2\"              65.409  ZN  . \"ZINC ION\"                                    ? 
non-polymer         \n#\n_entity.id               17\n_entity.pdbx_description \"Mitochondrial ribosomal protein L46\"\n_entity.type             polymer\n#\n_entity_poly.entity_id      17\n_entity_poly.pdbx_strand_id Bj\n_entity_poly.type           polypeptide(L)\n#\nloop_\n_entity_poly_seq.entity_id\n_entity_poly_seq.hetero\n_entity_poly_seq.mon_id\n_entity_poly_seq.num\n17 n MET 1   \n17 n ALA 2   \n17 n ALA 3   \n17 n PRO 4   \n17 n VAL 5   \n17 n ARG 6   \n17 n ARG 7   \n17 n THR 8   \n17 n MET 9   \n17 n LEU 10  \n17 n ARG 11  \n17 n VAL 12  \n17 n VAL 13  \n17 n ARG 14  \n17 n GLY 15  \n17 n TRP 16  \n17 n ARG 17  \n17 n ARG 18  \n17 n PHE 19  \n17 n GLU 20  \n17 n GLY 21  \n17 n PRO 22  \n17 n TRP 23  \n17 n ALA 24  \n17 n HIS 25  \n17 n SER 26  \n17 n LEU 27  \n17 n GLY 28  \n17 n SER 29  \n17 n ARG 30  \n17 n ASN 31  \n17 n LEU 32  \n17 n ALA 33  \n17 n LEU 34  \n17 n ALA 35  \n17 n VAL 36  \n17 n ALA 37  \n17 n PRO 38  \n17 n SER 39  \n17 n SER 40  \n17 n SER 41  \n17 n SER 42  \n17 n SER 43  \n17 n PRO 44  \n17 n TRP 45  \n17 n ARG 46  \n17 n LEU 47  \n17 n LEU 48  \n17 n GLY 49  \n17 n ALA 50  \n17 n LEU 51  \n17 n CYS 52  \n17 n LEU 53  \n17 n GLN 54  \n17 n ARG 55  \n17 n PRO 56  \n17 n PRO 57  \n17 n LEU 58  \n17 n VAL 59  \n17 n THR 60  \n17 n LYS 61  \n17 n PRO 62  \n17 n LEU 63  \n17 n THR 64  \n17 n PRO 65  \n17 n LEU 66  \n17 n GLN 67  \n17 n GLU 68  \n17 n GLU 69  \n17 n MET 70  \n17 n ALA 71  \n17 n ASP 72  \n17 n LEU 73  \n17 n LEU 74  \n17 n GLN 75  \n17 n GLN 76  \n17 n ILE 77  \n17 n GLU 78  \n17 n ILE 79  \n17 n GLU 80  \n17 n ARG 81  \n17 n SER 82  \n17 n LEU 83  \n17 n TYR 84  \n17 n SER 85  \n17 n ASP 86  \n17 n HIS 87  \n17 n GLU 88  \n17 n LEU 89  \n17 n ARG 90  \n17 n ALA 91  \n17 n LEU 92  \n17 n ASP 93  \n17 n GLU 94  \n17 n ALA 95  \n17 n GLN 96  \n17 n GLN 97  \n17 n LEU 98  \n17 n ALA 99  \n17 n LYS 100 \n17 n LYS 101 \n17 n LYS 102 \n17 n SER 103 \n17 n ASP 104 \n17 n LEU 105 \n17 n TYR 106 \n17 n GLU 107 \n17 n GLU 108 \n17 n 
GLU 109 \n17 n ASP 110 \n17 n GLU 111 \n17 n GLN 112 \n17 n ASN 113 \n17 n ILE 114 \n17 n LEU 115 \n17 n LEU 116 \n17 n ALA 117 \n17 n GLN 118 \n17 n ASP 119 \n17 n LEU 120 \n17 n GLU 121 \n17 n ASP 122 \n17 n MET 123 \n17 n TRP 124 \n17 n GLU 125 \n17 n GLN 126 \n17 n LYS 127 \n17 n PHE 128 \n17 n LEU 129 \n17 n HIS 130 \n17 n PHE 131 \n17 n LYS 132 \n17 n LEU 133 \n17 n GLY 134 \n17 n ALA 135 \n17 n ARG 136 \n17 n LEU 137 \n17 n THR 138 \n17 n GLU 139 \n17 n ALA 140 \n17 n ASP 141 \n17 n LYS 142 \n17 n LYS 143 \n17 n ASP 144 \n17 n ASP 145 \n17 n ARG 146 \n17 n THR 147 \n17 n SER 148 \n17 n LEU 149 \n17 n HIS 150 \n17 n ARG 151 \n17 n LYS 152 \n17 n LEU 153 \n17 n ASP 154 \n17 n ARG 155 \n17 n ASN 156 \n17 n LEU 157 \n17 n ILE 158 \n17 n LEU 159 \n17 n LEU 160 \n17 n VAL 161 \n17 n ARG 162 \n17 n GLU 163 \n17 n LYS 164 \n17 n LEU 165 \n17 n GLY 166 \n17 n ASP 167 \n17 n GLN 168 \n17 n ASP 169 \n17 n ILE 170 \n17 n TRP 171 \n17 n MET 172 \n17 n LEU 173 \n17 n PRO 174 \n17 n GLN 175 \n17 n SER 176 \n17 n ASP 177 \n17 n TRP 178 \n17 n GLN 179 \n17 n PRO 180 \n17 n GLY 181 \n17 n GLU 182 \n17 n THR 183 \n17 n LEU 184 \n17 n ARG 185 \n17 n GLN 186 \n17 n THR 187 \n17 n ALA 188 \n17 n GLU 189 \n17 n ARG 190 \n17 n THR 191 \n17 n LEU 192 \n17 n ALA 193 \n17 n THR 194 \n17 n LEU 195 \n17 n SER 196 \n17 n GLU 197 \n17 n ASN 198 \n17 n ASN 199 \n17 n MET 200 \n17 n GLU 201 \n17 n ALA 202 \n17 n LYS 203 \n17 n PHE 204 \n17 n LEU 205 \n17 n GLY 206 \n17 n ASN 207 \n17 n ALA 208 \n17 n PRO 209 \n17 n CYS 210 \n17 n GLY 211 \n17 n HIS 212 \n17 n TYR 213 \n17 n LYS 214 \n17 n PHE 215 \n17 n LYS 216 \n17 n PHE 217 \n17 n PRO 218 \n17 n GLN 219 \n17 n ALA 220 \n17 n MET 221 \n17 n ARG 222 \n17 n THR 223 \n17 n GLU 224 \n17 n THR 225 \n17 n SER 226 \n17 n LEU 227 \n17 n GLY 228 \n17 n ALA 229 \n17 n LYS 230 \n17 n VAL 231 \n17 n PHE 232 \n17 n PHE 233 \n17 n PHE 234 \n17 n LYS 235 \n17 n ALA 236 \n17 n LEU 237 \n17 n LEU 238 \n17 n LEU 239 \n17 n THR 240 \n17 n GLY 241 \n17 n ASP 
242 \n17 n PHE 243 \n17 n SER 244 \n17 n GLN 245 \n17 n ALA 246 \n17 n GLY 247 \n17 n LYS 248 \n17 n LYS 249 \n17 n GLY 250 \n17 n HIS 251 \n17 n HIS 252 \n17 n VAL 253 \n17 n TRP 254 \n17 n VAL 255 \n17 n SER 256 \n17 n LYS 257 \n17 n GLU 258 \n17 n GLU 259 \n17 n LEU 260 \n17 n GLY 261 \n17 n ASP 262 \n17 n TYR 263 \n17 n LEU 264 \n17 n LYS 265 \n17 n PRO 266 \n17 n LYS 267 \n17 n TYR 268 \n17 n LEU 269 \n17 n ALA 270 \n17 n GLN 271 \n17 n VAL 272 \n17 n ARG 273 \n17 n ARG 274 \n17 n PHE 275 \n17 n LEU 276 \n17 n LEU 277 \n17 n ASP 278 \n17 n LEU 279 \n#\n_exptl.method \"ELECTRON MICROSCOPY\"\n#\n_pdbx_audit_revision_history.revision_date 2020-07-15\n#\n_pdbx_database_status.recvd_initial_deposition_date 2020-07-15\n#\nloop_\n_pdbx_poly_seq_scheme.asym_id\n_pdbx_poly_seq_scheme.auth_seq_num\n_pdbx_poly_seq_scheme.entity_id\n_pdbx_poly_seq_scheme.hetero\n_pdbx_poly_seq_scheme.mon_id\n_pdbx_poly_seq_scheme.pdb_ins_code\n_pdbx_poly_seq_scheme.pdb_seq_num\n_pdbx_poly_seq_scheme.pdb_strand_id\n_pdbx_poly_seq_scheme.seq_id\nQ ?   17 n MET . 1   Bj 1   \nQ ?   17 n ALA . 2   Bj 2   \nQ ?   17 n ALA . 3   Bj 3   \nQ ?   17 n PRO . 4   Bj 4   \nQ ?   17 n VAL . 5   Bj 5   \nQ ?   17 n ARG . 6   Bj 6   \nQ ?   17 n ARG . 7   Bj 7   \nQ ?   17 n THR . 8   Bj 8   \nQ ?   17 n MET . 9   Bj 9   \nQ ?   17 n LEU . 10  Bj 10  \nQ ?   17 n ARG . 11  Bj 11  \nQ ?   17 n VAL . 12  Bj 12  \nQ ?   17 n VAL . 13  Bj 13  \nQ ?   17 n ARG . 14  Bj 14  \nQ ?   17 n GLY . 15  Bj 15  \nQ ?   17 n TRP . 16  Bj 16  \nQ ?   17 n ARG . 17  Bj 17  \nQ ?   17 n ARG . 18  Bj 18  \nQ ?   17 n PHE . 19  Bj 19  \nQ ?   17 n GLU . 20  Bj 20  \nQ ?   17 n GLY . 21  Bj 21  \nQ ?   17 n PRO . 22  Bj 22  \nQ ?   17 n TRP . 23  Bj 23  \nQ ?   17 n ALA . 24  Bj 24  \nQ ?   17 n HIS . 25  Bj 25  \nQ ?   17 n SER . 26  Bj 26  \nQ ?   17 n LEU . 27  Bj 27  \nQ ?   17 n GLY . 28  Bj 28  \nQ ?   17 n SER . 29  Bj 29  \nQ ?   17 n ARG . 30  Bj 30  \nQ ?   17 n ASN . 31  Bj 31  \nQ ?   17 n LEU . 32  Bj 32  \nQ ? 
  17 n ALA . 33  Bj 33  \nQ ?   17 n LEU . 34  Bj 34  \nQ ?   17 n ALA . 35  Bj 35  \nQ ?   17 n VAL . 36  Bj 36  \nQ ?   17 n ALA . 37  Bj 37  \nQ ?   17 n PRO . 38  Bj 38  \nQ ?   17 n SER . 39  Bj 39  \nQ ?   17 n SER . 40  Bj 40  \nQ ?   17 n SER . 41  Bj 41  \nQ ?   17 n SER . 42  Bj 42  \nQ 43  17 n SER . 43  Bj 43  \nQ 44  17 n PRO . 44  Bj 44  \nQ 45  17 n TRP . 45  Bj 45  \nQ 46  17 n ARG . 46  Bj 46  \nQ 47  17 n LEU . 47  Bj 47  \nQ 48  17 n LEU . 48  Bj 48  \nQ 49  17 n GLY . 49  Bj 49  \nQ 50  17 n ALA . 50  Bj 50  \nQ 51  17 n LEU . 51  Bj 51  \nQ 52  17 n CYS . 52  Bj 52  \nQ 53  17 n LEU . 53  Bj 53  \nQ 54  17 n GLN . 54  Bj 54  \nQ 55  17 n ARG . 55  Bj 55  \nQ 56  17 n PRO . 56  Bj 56  \nQ 57  17 n PRO . 57  Bj 57  \nQ 58  17 n LEU . 58  Bj 58  \nQ 59  17 n VAL . 59  Bj 59  \nQ 60  17 n THR . 60  Bj 60  \nQ 61  17 n LYS . 61  Bj 61  \nQ 62  17 n PRO . 62  Bj 62  \nQ 63  17 n LEU . 63  Bj 63  \nQ 64  17 n THR . 64  Bj 64  \nQ 65  17 n PRO . 65  Bj 65  \nQ 66  17 n LEU . 66  Bj 66  \nQ 67  17 n GLN . 67  Bj 67  \nQ 68  17 n GLU . 68  Bj 68  \nQ 69  17 n GLU . 69  Bj 69  \nQ 70  17 n MET . 70  Bj 70  \nQ 71  17 n ALA . 71  Bj 71  \nQ 72  17 n ASP . 72  Bj 72  \nQ 73  17 n LEU . 73  Bj 73  \nQ 74  17 n LEU . 74  Bj 74  \nQ 75  17 n GLN . 75  Bj 75  \nQ 76  17 n GLN . 76  Bj 76  \nQ 77  17 n ILE . 77  Bj 77  \nQ 78  17 n GLU . 78  Bj 78  \nQ 79  17 n ILE . 79  Bj 79  \nQ 80  17 n GLU . 80  Bj 80  \nQ 81  17 n ARG . 81  Bj 81  \nQ 82  17 n SER . 82  Bj 82  \nQ 83  17 n LEU . 83  Bj 83  \nQ 84  17 n TYR . 84  Bj 84  \nQ 85  17 n SER . 85  Bj 85  \nQ 86  17 n ASP . 86  Bj 86  \nQ 87  17 n HIS . 87  Bj 87  \nQ 88  17 n GLU . 88  Bj 88  \nQ 89  17 n LEU . 89  Bj 89  \nQ 90  17 n ARG . 90  Bj 90  \nQ 91  17 n ALA . 91  Bj 91  \nQ 92  17 n LEU . 92  Bj 92  \nQ 93  17 n ASP . 93  Bj 93  \nQ 94  17 n GLU . 94  Bj 94  \nQ 95  17 n ALA . 95  Bj 95  \nQ 96  17 n GLN . 96  Bj 96  \nQ 97  17 n GLN . 97  Bj 97  \nQ 98  17 n LEU . 98  Bj 98  \nQ 99  17 n ALA . 
99  Bj 99  \nQ 100 17 n LYS . 100 Bj 100 \nQ 101 17 n LYS . 101 Bj 101 \nQ 102 17 n LYS . 102 Bj 102 \nQ 103 17 n SER . 103 Bj 103 \nQ 104 17 n ASP . 104 Bj 104 \nQ ?   17 n LEU . 105 Bj 105 \nQ ?   17 n TYR . 106 Bj 106 \nQ ?   17 n GLU . 107 Bj 107 \nQ ?   17 n GLU . 108 Bj 108 \nQ ?   17 n GLU . 109 Bj 109 \nQ ?   17 n ASP . 110 Bj 110 \nQ ?   17 n GLU . 111 Bj 111 \nQ ?   17 n GLN . 112 Bj 112 \nQ ?   17 n ASN . 113 Bj 113 \nQ ?   17 n ILE . 114 Bj 114 \nQ ?   17 n LEU . 115 Bj 115 \nQ 116 17 n LEU . 116 Bj 116 \nQ 117 17 n ALA . 117 Bj 117 \nQ 118 17 n GLN . 118 Bj 118 \nQ 119 17 n ASP . 119 Bj 119 \nQ 120 17 n LEU . 120 Bj 120 \nQ 121 17 n GLU . 121 Bj 121 \nQ 122 17 n ASP . 122 Bj 122 \nQ 123 17 n MET . 123 Bj 123 \nQ 124 17 n TRP . 124 Bj 124 \nQ 125 17 n GLU . 125 Bj 125 \nQ 126 17 n GLN . 126 Bj 126 \nQ 127 17 n LYS . 127 Bj 127 \nQ 128 17 n PHE . 128 Bj 128 \nQ 129 17 n LEU . 129 Bj 129 \nQ 130 17 n HIS . 130 Bj 130 \nQ 131 17 n PHE . 131 Bj 131 \nQ 132 17 n LYS . 132 Bj 132 \nQ 133 17 n LEU . 133 Bj 133 \nQ 134 17 n GLY . 134 Bj 134 \nQ 135 17 n ALA . 135 Bj 135 \nQ 136 17 n ARG . 136 Bj 136 \nQ 137 17 n LEU . 137 Bj 137 \nQ 138 17 n THR . 138 Bj 138 \nQ 139 17 n GLU . 139 Bj 139 \nQ 140 17 n ALA . 140 Bj 140 \nQ 141 17 n ASP . 141 Bj 141 \nQ 142 17 n LYS . 142 Bj 142 \nQ 143 17 n LYS . 143 Bj 143 \nQ 144 17 n ASP . 144 Bj 144 \nQ 145 17 n ASP . 145 Bj 145 \nQ 146 17 n ARG . 146 Bj 146 \nQ 147 17 n THR . 147 Bj 147 \nQ 148 17 n SER . 148 Bj 148 \nQ 149 17 n LEU . 149 Bj 149 \nQ 150 17 n HIS . 150 Bj 150 \nQ 151 17 n ARG . 151 Bj 151 \nQ 152 17 n LYS . 152 Bj 152 \nQ 153 17 n LEU . 153 Bj 153 \nQ 154 17 n ASP . 154 Bj 154 \nQ 155 17 n ARG . 155 Bj 155 \nQ 156 17 n ASN . 156 Bj 156 \nQ 157 17 n LEU . 157 Bj 157 \nQ 158 17 n ILE . 158 Bj 158 \nQ 159 17 n LEU . 159 Bj 159 \nQ 160 17 n LEU . 160 Bj 160 \nQ 161 17 n VAL . 161 Bj 161 \nQ 162 17 n ARG . 162 Bj 162 \nQ 163 17 n GLU . 163 Bj 163 \nQ 164 17 n LYS . 164 Bj 164 \nQ 165 17 n LEU . 
165 Bj 165 \nQ 166 17 n GLY . 166 Bj 166 \nQ 167 17 n ASP . 167 Bj 167 \nQ 168 17 n GLN . 168 Bj 168 \nQ 169 17 n ASP . 169 Bj 169 \nQ 170 17 n ILE . 170 Bj 170 \nQ 171 17 n TRP . 171 Bj 171 \nQ 172 17 n MET . 172 Bj 172 \nQ 173 17 n LEU . 173 Bj 173 \nQ 174 17 n PRO . 174 Bj 174 \nQ 175 17 n GLN . 175 Bj 175 \nQ 176 17 n SER . 176 Bj 176 \nQ 177 17 n ASP . 177 Bj 177 \nQ 178 17 n TRP . 178 Bj 178 \nQ 179 17 n GLN . 179 Bj 179 \nQ 180 17 n PRO . 180 Bj 180 \nQ 181 17 n GLY . 181 Bj 181 \nQ 182 17 n GLU . 182 Bj 182 \nQ 183 17 n THR . 183 Bj 183 \nQ 184 17 n LEU . 184 Bj 184 \nQ 185 17 n ARG . 185 Bj 185 \nQ 186 17 n GLN . 186 Bj 186 \nQ 187 17 n THR . 187 Bj 187 \nQ 188 17 n ALA . 188 Bj 188 \nQ 189 17 n GLU . 189 Bj 189 \nQ 190 17 n ARG . 190 Bj 190 \nQ 191 17 n THR . 191 Bj 191 \nQ 192 17 n LEU . 192 Bj 192 \nQ 193 17 n ALA . 193 Bj 193 \nQ 194 17 n THR . 194 Bj 194 \nQ 195 17 n LEU . 195 Bj 195 \nQ 196 17 n SER . 196 Bj 196 \nQ 197 17 n GLU . 197 Bj 197 \nQ 198 17 n ASN . 198 Bj 198 \nQ 199 17 n ASN . 199 Bj 199 \nQ 200 17 n MET . 200 Bj 200 \nQ 201 17 n GLU . 201 Bj 201 \nQ 202 17 n ALA . 202 Bj 202 \nQ 203 17 n LYS . 203 Bj 203 \nQ 204 17 n PHE . 204 Bj 204 \nQ 205 17 n LEU . 205 Bj 205 \nQ 206 17 n GLY . 206 Bj 206 \nQ 207 17 n ASN . 207 Bj 207 \nQ 208 17 n ALA . 208 Bj 208 \nQ 209 17 n PRO . 209 Bj 209 \nQ 210 17 n CYS . 210 Bj 210 \nQ 211 17 n GLY . 211 Bj 211 \nQ 212 17 n HIS . 212 Bj 212 \nQ 213 17 n TYR . 213 Bj 213 \nQ 214 17 n LYS . 214 Bj 214 \nQ 215 17 n PHE . 215 Bj 215 \nQ 216 17 n LYS . 216 Bj 216 \nQ 217 17 n PHE . 217 Bj 217 \nQ ?   17 n PRO . 218 Bj 218 \nQ ?   17 n GLN . 219 Bj 219 \nQ ?   17 n ALA . 220 Bj 220 \nQ ?   17 n MET . 221 Bj 221 \nQ ?   17 n ARG . 222 Bj 222 \nQ ?   17 n THR . 223 Bj 223 \nQ ?   17 n GLU . 224 Bj 224 \nQ ?   17 n THR . 225 Bj 225 \nQ ?   17 n SER . 226 Bj 226 \nQ 227 17 n LEU . 227 Bj 227 \nQ 228 17 n GLY . 228 Bj 228 \nQ 229 17 n ALA . 229 Bj 229 \nQ 230 17 n LYS . 230 Bj 230 \nQ 231 17 n VAL . 
231 Bj 231 \nQ 232 17 n PHE . 232 Bj 232 \nQ 233 17 n PHE . 233 Bj 233 \nQ 234 17 n PHE . 234 Bj 234 \nQ 235 17 n LYS . 235 Bj 235 \nQ 236 17 n ALA . 236 Bj 236 \nQ 237 17 n LEU . 237 Bj 237 \nQ 238 17 n LEU . 238 Bj 238 \nQ 239 17 n LEU . 239 Bj 239 \nQ 240 17 n THR . 240 Bj 240 \nQ 241 17 n GLY . 241 Bj 241 \nQ 242 17 n ASP . 242 Bj 242 \nQ 243 17 n PHE . 243 Bj 243 \nQ 244 17 n SER . 244 Bj 244 \nQ 245 17 n GLN . 245 Bj 245 \nQ 246 17 n ALA . 246 Bj 246 \nQ 247 17 n GLY . 247 Bj 247 \nQ 248 17 n LYS . 248 Bj 248 \nQ 249 17 n LYS . 249 Bj 249 \nQ 250 17 n GLY . 250 Bj 250 \nQ 251 17 n HIS . 251 Bj 251 \nQ 252 17 n HIS . 252 Bj 252 \nQ 253 17 n VAL . 253 Bj 253 \nQ 254 17 n TRP . 254 Bj 254 \nQ 255 17 n VAL . 255 Bj 255 \nQ 256 17 n SER . 256 Bj 256 \nQ 257 17 n LYS . 257 Bj 257 \nQ 258 17 n GLU . 258 Bj 258 \nQ 259 17 n GLU . 259 Bj 259 \nQ 260 17 n LEU . 260 Bj 260 \nQ 261 17 n GLY . 261 Bj 261 \nQ 262 17 n ASP . 262 Bj 262 \nQ 263 17 n TYR . 263 Bj 263 \nQ 264 17 n LEU . 264 Bj 264 \nQ 265 17 n LYS . 265 Bj 265 \nQ 266 17 n PRO . 266 Bj 266 \nQ 267 17 n LYS . 267 Bj 267 \nQ 268 17 n TYR . 268 Bj 268 \nQ 269 17 n LEU . 269 Bj 269 \nQ 270 17 n ALA . 270 Bj 270 \nQ 271 17 n GLN . 271 Bj 271 \nQ 272 17 n VAL . 272 Bj 272 \nQ 273 17 n ARG . 273 Bj 273 \nQ 274 17 n ARG . 274 Bj 274 \nQ 275 17 n PHE . 275 Bj 275 \nQ 276 17 n LEU . 276 Bj 276 \nQ 277 17 n LEU . 277 Bj 277 \nQ 278 17 n ASP . 278 Bj 278 \nQ 279 17 n LEU . 
279 Bj 279 \n#\n_pdbx_struct_assembly.details            author_defined_assembly\n_pdbx_struct_assembly.id                 1\n_pdbx_struct_assembly.method_details     ?\n_pdbx_struct_assembly.oligomeric_count   95\n_pdbx_struct_assembly.oligomeric_details 95-meric\n#\n_pdbx_struct_assembly_gen.assembly_id     1\n_pdbx_struct_assembly_gen.asym_id_list    A,B,C,D,E,F,G,H,I,J,K,L,M,N,O,P,Q,R,S,T,U,V,W,X,Y,Z,AA,BA,CA,DA,EA,FA,GA,HA,IA,JA,KA,LA,MA,NA,OA,PA,QA,RA,SA,TA,UA,VA,WA,XA,YA,ZA,AB,BB,CB,DB,EB,FB,GB,HB,IB,JB,KB,LB,MB,NB,OB,PB,QB,RB,SB,TB,UB,VB,WB,XB,YB,ZB,AC,BC,CC,DC,EC,FC,GC,HC,IC,JC,KC,LC,MC,NC,OC,PC,QC,RC,SC,TC,UC,VC,WC,XC,YC,ZC,AD,BD,CD,DD,ED,FD,GD,HD,ID,JD,KD,LD,MD,ND,OD,PD,QD,RD,SD,TD,UD,VD,WD,XD,YD,ZD,AE,BE,CE,DE,EE,FE,GE,HE,IE,JE,KE,LE,ME,NE,OE,PE,QE,RE,SE,TE,UE,VE,WE,XE,YE,ZE,AF,BF,CF,DF,EF,FF,GF,HF,IF,JF,KF,LF,MF,NF,OF,PF,QF,RF,SF,TF,UF,VF,WF,XF,YF,ZF,AG,BG,CG,DG,EG,FG,GG,HG,IG,JG,KG,LG,MG,NG,OG,PG,QG,RG,SG,TG,UG,VG,WG,XG,YG,ZG,AH,BH,CH,DH,EH,FH,GH,HH,IH,JH,KH,LH,MH,NH,OH,PH,QH,RH,SH,TH,UH,VH,WH,XH,YH,ZH,AI,BI,CI,DI,EI,FI,GI,HI,II,JI,KI,LI,MI,NI,OI,PI,QI,RI,SI,TI,UI,VI,WI,XI,YI,ZI,AJ,BJ,CJ,DJ,EJ,FJ,GJ,HJ,IJ,JJ,KJ,LJ,MJ,NJ,OJ,PJ,QJ,RJ,SJ,TJ,UJ,VJ,WJ,XJ,YJ,ZJ,AK,BK,CK,DK,EK,FK,GK,HK,IK,JK,KK,LK,MK,NK,OK,PK,QK,RK,SK,TK,UK,VK,WK,XK,YK,ZK,AL,BL,CL,DL,EL,FL,GL,HL,IL,JL,KL,LL,ML,NL,OL,PL,QL,RL,SL,TL,UL,VL,WL,XL,YL,ZL,AM,BM,CM,DM,EM,FM,GM,HM,IM,JM,KM,LM,MM,NM,OM,PM,QM,RM,SM,TM,UM,VM,WM,XM,YM,ZM,AN,BN,CN,DN,EN,FN,GN,HN,IN,JN,KN,LN,MN,NN,ON,PN,QN,RN,SN,TN,UN,VN,WN,XN,YN,ZN,AO,BO,CO,DO,EO,FO,GO,HO,IO,JO,KO,LO,MO,NO,OO,PO,QO,RO,SO,TO,UO,VO,WO,XO,YO,ZO,AP,BP,CP,DP,EP,FP,GP,HP,IP,JP,KP,LP,MP,NP,OP,PP,QP,RP,SP\n_pdbx_struct_assembly_gen.oper_expression 1\n#\n_pdbx_struct_oper_list.id                 1\n_pdbx_struct_oper_list.matrix[1][1]       1.0000000000\n_pdbx_struct_oper_list.matrix[1][2]       0.0000000000\n_pdbx_struct_oper_list.matrix[1][3]       0.0000000000\n_pdbx_struct_oper_list.matrix[2][1]       0.0000000000\n_pdbx_struct_oper_list.matrix[2][2]       
1.0000000000\n_pdbx_struct_oper_list.matrix[2][3]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][1]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][2]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][3]       1.0000000000\n_pdbx_struct_oper_list.name               1_555\n_pdbx_struct_oper_list.symmetry_operation ?\n_pdbx_struct_oper_list.type               \"identity operation\"\n_pdbx_struct_oper_list.vector[1]          0.0000000000\n_pdbx_struct_oper_list.vector[2]          0.0000000000\n_pdbx_struct_oper_list.vector[3]          0.0000000000\n#\n_refine.ls_d_res_high 4.20\n#\n_software.classification other\n_software.name           \"DeepMind Structure Class\"\n_software.pdbx_ordinal   1\n_software.version        2.0.0\n#\n_struct_asym.entity_id 17\n_struct_asym.id        Q\n#\nloop_\n_atom_site.group_PDB\n_atom_site.id\n_atom_site.type_symbol\n_atom_site.label_atom_id\n_atom_site.label_alt_id\n_atom_site.label_comp_id\n_atom_site.label_asym_id\n_atom_site.label_entity_id\n_atom_site.label_seq_id\n_atom_site.pdbx_PDB_ins_code\n_atom_site.Cartn_x\n_atom_site.Cartn_y\n_atom_site.Cartn_z\n_atom_site.occupancy\n_atom_site.B_iso_or_equiv\n_atom_site.auth_seq_id\n_atom_site.auth_asym_id\n_atom_site.pdbx_PDB_model_num\nATOM 1    N N   . SER Q 17 43  ? 162.672 264.147 303.911 1.00 104.46 43  Bj 1 \nATOM 2    C CA  . SER Q 17 43  ? 161.478 264.930 303.620 1.00 104.46 43  Bj 1 \nATOM 3    C C   . SER Q 17 43  ? 160.551 264.181 302.669 1.00 104.46 43  Bj 1 \nATOM 4    O O   . SER Q 17 43  ? 160.970 263.766 301.589 1.00 104.46 43  Bj 1 \nATOM 5    C CB  . SER Q 17 43  ? 161.857 266.287 303.024 1.00 104.46 43  Bj 1 \nATOM 6    O OG  . SER Q 17 43  ? 162.640 267.043 303.931 1.00 104.46 43  Bj 1 \nATOM 7    N N   . PRO Q 17 44  ? 159.295 264.000 303.074 1.00 115.21 44  Bj 1 \nATOM 8    C CA  . PRO Q 17 44  ? 158.333 263.328 302.193 1.00 115.21 44  Bj 1 \nATOM 9    C C   . PRO Q 17 44  ? 157.997 264.188 300.984 1.00 115.21 44  Bj 1 \nATOM 10   O O   . 
PRO Q 17 44  ? 157.754 265.392 301.099 1.00 115.21 44  Bj 1 \nATOM 11   C CB  . PRO Q 17 44  ? 157.110 263.118 303.093 1.00 115.21 44  Bj 1 \nATOM 12   C CG  . PRO Q 17 44  ? 157.236 264.161 304.150 1.00 115.21 44  Bj 1 \nATOM 13   C CD  . PRO Q 17 44  ? 158.707 264.346 304.379 1.00 115.21 44  Bj 1 \nATOM 14   N N   . TRP Q 17 45  ? 157.996 263.551 299.814 1.00 124.11 45  Bj 1 \nATOM 15   C CA  . TRP Q 17 45  ? 157.732 264.221 298.549 1.00 124.11 45  Bj 1 \nATOM 16   C C   . TRP Q 17 45  ? 156.706 263.430 297.755 1.00 124.11 45  Bj 1 \nATOM 17   O O   . TRP Q 17 45  ? 156.918 262.249 297.460 1.00 124.11 45  Bj 1 \nATOM 18   C CB  . TRP Q 17 45  ? 159.014 264.384 297.726 1.00 124.11 45  Bj 1 \nATOM 19   C CG  . TRP Q 17 45  ? 159.872 265.522 298.174 1.00 124.11 45  Bj 1 \nATOM 20   C CD1 . TRP Q 17 45  ? 160.962 265.456 298.990 1.00 124.11 45  Bj 1 \nATOM 21   C CD2 . TRP Q 17 45  ? 159.709 266.903 297.831 1.00 124.11 45  Bj 1 \nATOM 22   N NE1 . TRP Q 17 45  ? 161.490 266.710 299.176 1.00 124.11 45  Bj 1 \nATOM 23   C CE2 . TRP Q 17 45  ? 160.738 267.616 298.475 1.00 124.11 45  Bj 1 \nATOM 24   C CE3 . TRP Q 17 45  ? 158.793 267.605 297.042 1.00 124.11 45  Bj 1 \nATOM 25   C CZ2 . TRP Q 17 45  ? 160.877 268.997 298.355 1.00 124.11 45  Bj 1 \nATOM 26   C CZ3 . TRP Q 17 45  ? 158.932 268.975 296.925 1.00 124.11 45  Bj 1 \nATOM 27   C CH2 . TRP Q 17 45  ? 159.966 269.656 297.577 1.00 124.11 45  Bj 1 \nATOM 28   N N   . ARG Q 17 46  ? 155.602 264.083 297.413 1.00 135.34 46  Bj 1 \nATOM 29   C CA  . ARG Q 17 46  ? 154.591 263.520 296.531 1.00 135.34 46  Bj 1 \nATOM 30   C C   . ARG Q 17 46  ? 154.887 263.943 295.098 1.00 135.34 46  Bj 1 \nATOM 31   O O   . ARG Q 17 46  ? 155.343 265.063 294.855 1.00 135.34 46  Bj 1 \nATOM 32   C CB  . ARG Q 17 46  ? 153.191 263.983 296.943 1.00 135.34 46  Bj 1 \nATOM 33   C CG  . ARG Q 17 46  ? 152.052 263.259 296.243 1.00 135.34 46  Bj 1 \nATOM 34   C CD  . ARG Q 17 46  ? 150.703 263.776 296.723 1.00 135.34 46  Bj 1 \nATOM 35   N NE  . 
ARG Q 17 46  ? 149.585 263.097 296.074 1.00 135.34 46  Bj 1 \nATOM 36   C CZ  . ARG Q 17 46  ? 148.306 263.372 296.309 1.00 135.34 46  Bj 1 \nATOM 37   N NH1 . ARG Q 17 46  ? 147.977 264.316 297.180 1.00 135.34 46  Bj 1 \nATOM 38   N NH2 . ARG Q 17 46  ? 147.353 262.704 295.673 1.00 135.34 46  Bj 1 \nATOM 39   N N   . LEU Q 17 47  ? 154.641 263.040 294.152 1.00 137.26 47  Bj 1 \nATOM 40   C CA  . LEU Q 17 47  ? 154.910 263.296 292.743 1.00 137.26 47  Bj 1 \nATOM 41   C C   . LEU Q 17 47  ? 153.644 263.057 291.937 1.00 137.26 47  Bj 1 \nATOM 42   O O   . LEU Q 17 47  ? 152.955 262.053 292.143 1.00 137.26 47  Bj 1 \nATOM 43   C CB  . LEU Q 17 47  ? 156.056 262.414 292.233 1.00 137.26 47  Bj 1 \nATOM 44   C CG  . LEU Q 17 47  ? 156.329 261.107 292.986 1.00 137.26 47  Bj 1 \nATOM 45   C CD1 . LEU Q 17 47  ? 155.350 260.012 292.587 1.00 137.26 47  Bj 1 \nATOM 46   C CD2 . LEU Q 17 47  ? 157.766 260.652 292.776 1.00 137.26 47  Bj 1 \nATOM 47   N N   . LEU Q 17 48  ? 153.331 263.982 291.030 1.00 138.18 48  Bj 1 \nATOM 48   C CA  . LEU Q 17 48  ? 152.120 263.883 290.230 1.00 138.18 48  Bj 1 \nATOM 49   C C   . LEU Q 17 48  ? 152.394 264.339 288.806 1.00 138.18 48  Bj 1 \nATOM 50   O O   . LEU Q 17 48  ? 153.199 265.246 288.575 1.00 138.18 48  Bj 1 \nATOM 51   C CB  . LEU Q 17 48  ? 150.977 264.725 290.818 1.00 138.18 48  Bj 1 \nATOM 52   C CG  . LEU Q 17 48  ? 150.485 264.427 292.237 1.00 138.18 48  Bj 1 \nATOM 53   C CD1 . LEU Q 17 48  ? 151.283 265.210 293.269 1.00 138.18 48  Bj 1 \nATOM 54   C CD2 . LEU Q 17 48  ? 149.000 264.730 292.359 1.00 138.18 48  Bj 1 \nATOM 55   N N   . GLY Q 17 49  ? 151.716 263.701 287.855 1.00 135.43 49  Bj 1 \nATOM 56   C CA  . GLY Q 17 49  ? 151.707 264.149 286.482 1.00 135.43 49  Bj 1 \nATOM 57   C C   . GLY Q 17 49  ? 150.384 264.812 286.131 1.00 135.43 49  Bj 1 \nATOM 58   O O   . GLY Q 17 49  ? 149.360 264.601 286.775 1.00 135.43 49  Bj 1 \nATOM 59   N N   . ALA Q 17 50  ? 150.428 265.639 285.090 1.00 130.02 50  Bj 1 \nATOM 60   C CA  . 
ALA Q 17 50  ? 149.244 266.346 284.629 1.00 130.02 50  Bj 1 \nATOM 61   C C   . ALA Q 17 50  ? 149.304 266.468 283.116 1.00 130.02 50  Bj 1 \nATOM 62   O O   . ALA Q 17 50  ? 150.384 266.588 282.529 1.00 130.02 50  Bj 1 \nATOM 63   C CB  . ALA Q 17 50  ? 149.121 267.730 285.275 1.00 130.02 50  Bj 1 \nATOM 64   N N   . LEU Q 17 51  ? 148.131 266.439 282.491 1.00 127.85 51  Bj 1 \nATOM 65   C CA  . LEU Q 17 51  ? 148.013 266.429 281.039 1.00 127.85 51  Bj 1 \nATOM 66   C C   . LEU Q 17 51  ? 147.458 267.759 280.549 1.00 127.85 51  Bj 1 \nATOM 67   O O   . LEU Q 17 51  ? 146.498 268.285 281.121 1.00 127.85 51  Bj 1 \nATOM 68   C CB  . LEU Q 17 51  ? 147.117 265.280 280.572 1.00 127.85 51  Bj 1 \nATOM 69   C CG  . LEU Q 17 51  ? 146.876 265.173 279.065 1.00 127.85 51  Bj 1 \nATOM 70   C CD1 . LEU Q 17 51  ? 148.194 265.030 278.321 1.00 127.85 51  Bj 1 \nATOM 71   C CD2 . LEU Q 17 51  ? 145.949 264.010 278.748 1.00 127.85 51  Bj 1 \nATOM 72   N N   . CYS Q 17 52  ? 148.064 268.295 279.492 1.00 126.27 52  Bj 1 \nATOM 73   C CA  . CYS Q 17 52  ? 147.580 269.488 278.806 1.00 126.27 52  Bj 1 \nATOM 74   C C   . CYS Q 17 52  ? 147.282 269.077 277.369 1.00 126.27 52  Bj 1 \nATOM 75   O O   . CYS Q 17 52  ? 148.176 269.073 276.517 1.00 126.27 52  Bj 1 \nATOM 76   C CB  . CYS Q 17 52  ? 148.607 270.615 278.866 1.00 126.27 52  Bj 1 \nATOM 77   S SG  . CYS Q 17 52  ? 149.201 271.004 280.527 1.00 126.27 52  Bj 1 \nATOM 78   N N   . LEU Q 17 53  ? 146.033 268.707 277.107 1.00 117.88 53  Bj 1 \nATOM 79   C CA  . LEU Q 17 53  ? 145.621 268.248 275.787 1.00 117.88 53  Bj 1 \nATOM 80   C C   . LEU Q 17 53  ? 145.134 269.436 274.969 1.00 117.88 53  Bj 1 \nATOM 81   O O   . LEU Q 17 53  ? 144.159 270.096 275.343 1.00 117.88 53  Bj 1 \nATOM 82   C CB  . LEU Q 17 53  ? 144.526 267.191 275.898 1.00 117.88 53  Bj 1 \nATOM 83   C CG  . LEU Q 17 53  ? 143.910 266.774 274.563 1.00 117.88 53  Bj 1 \nATOM 84   C CD1 . LEU Q 17 53  ? 144.958 266.142 273.659 1.00 117.88 53  Bj 1 \nATOM 85   C CD2 . 
LEU Q 17 53  ? 142.749 265.828 274.792 1.00 117.88 53  Bj 1 \nATOM 86   N N   . GLN Q 17 54  ? 145.803 269.698 273.851 1.00 118.52 54  Bj 1 \nATOM 87   C CA  . GLN Q 17 54  ? 145.488 270.830 272.992 1.00 118.52 54  Bj 1 \nATOM 88   C C   . GLN Q 17 54  ? 144.817 270.326 271.723 1.00 118.52 54  Bj 1 \nATOM 89   O O   . GLN Q 17 54  ? 145.391 269.510 270.993 1.00 118.52 54  Bj 1 \nATOM 90   C CB  . GLN Q 17 54  ? 146.748 271.626 272.652 1.00 118.52 54  Bj 1 \nATOM 91   C CG  . GLN Q 17 54  ? 147.464 272.202 273.860 1.00 118.52 54  Bj 1 \nATOM 92   C CD  . GLN Q 17 54  ? 148.683 273.016 273.478 1.00 118.52 54  Bj 1 \nATOM 93   O OE1 . GLN Q 17 54  ? 148.961 273.222 272.297 1.00 118.52 54  Bj 1 \nATOM 94   N NE2 . GLN Q 17 54  ? 149.419 273.484 274.478 1.00 118.52 54  Bj 1 \nATOM 95   N N   . ARG Q 17 55  ? 143.598 270.796 271.480 1.00 113.62 55  Bj 1 \nATOM 96   C CA  . ARG Q 17 55  ? 142.952 270.625 270.189 1.00 113.62 55  Bj 1 \nATOM 97   C C   . ARG Q 17 55  ? 143.238 271.852 269.337 1.00 113.62 55  Bj 1 \nATOM 98   O O   . ARG Q 17 55  ? 142.879 272.968 269.740 1.00 113.62 55  Bj 1 \nATOM 99   C CB  . ARG Q 17 55  ? 141.455 270.444 270.349 1.00 113.62 55  Bj 1 \nATOM 100  C CG  . ARG Q 17 55  ? 140.733 270.185 269.037 1.00 113.62 55  Bj 1 \nATOM 101  C CD  . ARG Q 17 55  ? 139.290 270.650 269.102 1.00 113.62 55  Bj 1 \nATOM 102  N NE  . ARG Q 17 55  ? 139.013 271.693 268.119 1.00 113.62 55  Bj 1 \nATOM 103  C CZ  . ARG Q 17 55  ? 139.321 272.974 268.284 1.00 113.62 55  Bj 1 \nATOM 104  N NH1 . ARG Q 17 55  ? 139.923 273.375 269.395 1.00 113.62 55  Bj 1 \nATOM 105  N NH2 . ARG Q 17 55  ? 139.032 273.855 267.337 1.00 113.62 55  Bj 1 \nATOM 106  N N   . PRO Q 17 56  ? 143.874 271.703 268.180 1.00 114.98 56  Bj 1 \nATOM 107  C CA  . PRO Q 17 56  ? 144.258 272.868 267.384 1.00 114.98 56  Bj 1 \nATOM 108  C C   . PRO Q 17 56  ? 143.057 273.471 266.683 1.00 114.98 56  Bj 1 \nATOM 109  O O   . PRO Q 17 56  ? 142.018 272.811 266.528 1.00 114.98 56  Bj 1 \nATOM 110  C CB  . 
PRO Q 17 56  ? 145.255 272.283 266.375 1.00 114.98 56  Bj 1 \nATOM 111  C CG  . PRO Q 17 56  ? 144.800 270.875 266.201 1.00 114.98 56  Bj 1 \nATOM 112  C CD  . PRO Q 17 56  ? 144.288 270.438 267.549 1.00 114.98 56  Bj 1 \nATOM 113  N N   . PRO Q 17 57  ? 143.156 274.726 266.247 1.00 116.15 57  Bj 1 \nATOM 114  C CA  . PRO Q 17 57  ? 142.053 275.331 265.494 1.00 116.15 57  Bj 1 \nATOM 115  C C   . PRO Q 17 57  ? 141.864 274.658 264.144 1.00 116.15 57  Bj 1 \nATOM 116  O O   . PRO Q 17 57  ? 142.830 274.337 263.446 1.00 116.15 57  Bj 1 \nATOM 117  C CB  . PRO Q 17 57  ? 142.492 276.791 265.334 1.00 116.15 57  Bj 1 \nATOM 118  C CG  . PRO Q 17 57  ? 143.977 276.762 265.492 1.00 116.15 57  Bj 1 \nATOM 119  C CD  . PRO Q 17 57  ? 144.251 275.681 266.490 1.00 116.15 57  Bj 1 \nATOM 120  N N   . LEU Q 17 58  ? 140.600 274.449 263.778 1.00 116.27 58  Bj 1 \nATOM 121  C CA  . LEU Q 17 58  ? 140.270 273.823 262.504 1.00 116.27 58  Bj 1 \nATOM 122  C C   . LEU Q 17 58  ? 140.215 274.830 261.361 1.00 116.27 58  Bj 1 \nATOM 123  O O   . LEU Q 17 58  ? 140.604 274.507 260.234 1.00 116.27 58  Bj 1 \nATOM 124  C CB  . LEU Q 17 58  ? 138.934 273.084 262.609 1.00 116.27 58  Bj 1 \nATOM 125  C CG  . LEU Q 17 58  ? 138.884 271.888 263.562 1.00 116.27 58  Bj 1 \nATOM 126  C CD1 . LEU Q 17 58  ? 137.503 271.254 263.554 1.00 116.27 58  Bj 1 \nATOM 127  C CD2 . LEU Q 17 58  ? 139.946 270.864 263.194 1.00 116.27 58  Bj 1 \nATOM 128  N N   . VAL Q 17 59  ? 139.743 276.044 261.628 1.00 110.63 59  Bj 1 \nATOM 129  C CA  . VAL Q 17 59  ? 139.613 277.074 260.606 1.00 110.63 59  Bj 1 \nATOM 130  C C   . VAL Q 17 59  ? 140.674 278.138 260.846 1.00 110.63 59  Bj 1 \nATOM 131  O O   . VAL Q 17 59  ? 141.190 278.295 261.959 1.00 110.63 59  Bj 1 \nATOM 132  C CB  . VAL Q 17 59  ? 138.197 277.692 260.596 1.00 110.63 59  Bj 1 \nATOM 133  C CG1 . VAL Q 17 59  ? 138.060 278.749 261.681 1.00 110.63 59  Bj 1 \nATOM 134  C CG2 . VAL Q 17 59  ? 137.873 278.271 259.228 1.00 110.63 59  Bj 1 \nATOM 135  N N   . 
THR Q 17 60  ? 141.010 278.864 259.784 1.00 105.54 60  Bj 1 \nATOM 136  C CA  . THR Q 17 60  ? 142.011 279.914 259.869 1.00 105.54 60  Bj 1 \nATOM 137  C C   . THR Q 17 60  ? 141.427 281.168 260.510 1.00 105.54 60  Bj 1 \nATOM 138  O O   . THR Q 17 60  ? 140.245 281.483 260.349 1.00 105.54 60  Bj 1 \nATOM 139  C CB  . THR Q 17 60  ? 142.562 280.246 258.481 1.00 105.54 60  Bj 1 \nATOM 140  O OG1 . THR Q 17 60  ? 143.384 281.417 258.558 1.00 105.54 60  Bj 1 \nATOM 141  C CG2 . THR Q 17 60  ? 141.426 280.489 257.498 1.00 105.54 60  Bj 1 \nATOM 142  N N   . LYS Q 17 61  ? 142.275 281.882 261.244 1.00 98.53  61  Bj 1 \nATOM 143  C CA  . LYS Q 17 61  ? 141.844 283.097 261.913 1.00 98.53  61  Bj 1 \nATOM 144  C C   . LYS Q 17 61  ? 141.540 284.190 260.890 1.00 98.53  61  Bj 1 \nATOM 145  O O   . LYS Q 17 61  ? 142.039 284.151 259.762 1.00 98.53  61  Bj 1 \nATOM 146  C CB  . LYS Q 17 61  ? 142.918 283.578 262.886 1.00 98.53  61  Bj 1 \nATOM 147  C CG  . LYS Q 17 61  ? 143.171 282.633 264.046 1.00 98.53  61  Bj 1 \nATOM 148  C CD  . LYS Q 17 61  ? 144.091 283.258 265.081 1.00 98.53  61  Bj 1 \nATOM 149  C CE  . LYS Q 17 61  ? 144.264 282.348 266.288 1.00 98.53  61  Bj 1 \nATOM 150  N NZ  . LYS Q 17 61  ? 145.130 282.959 267.333 1.00 98.53  61  Bj 1 \nATOM 151  N N   . PRO Q 17 62  ? 140.716 285.171 261.253 1.00 97.74  62  Bj 1 \nATOM 152  C CA  . PRO Q 17 62  ? 140.458 286.288 260.340 1.00 97.74  62  Bj 1 \nATOM 153  C C   . PRO Q 17 62  ? 141.703 287.136 260.133 1.00 97.74  62  Bj 1 \nATOM 154  O O   . PRO Q 17 62  ? 142.668 287.080 260.898 1.00 97.74  62  Bj 1 \nATOM 155  C CB  . PRO Q 17 62  ? 139.357 287.083 261.049 1.00 97.74  62  Bj 1 \nATOM 156  C CG  . PRO Q 17 62  ? 139.506 286.725 262.488 1.00 97.74  62  Bj 1 \nATOM 157  C CD  . PRO Q 17 62  ? 139.933 285.287 262.495 1.00 97.74  62  Bj 1 \nATOM 158  N N   . LEU Q 17 63  ? 141.667 287.934 259.071 1.00 100.40 63  Bj 1 \nATOM 159  C CA  . LEU Q 17 63  ? 142.797 288.761 258.672 1.00 100.40 63  Bj 1 \nATOM 160  C C   . 
LEU Q 17 63  ? 142.618 290.179 259.198 1.00 100.40 63  Bj 1 \nATOM 161  O O   . LEU Q 17 63  ? 141.553 290.781 259.027 1.00 100.40 63  Bj 1 \nATOM 162  C CB  . LEU Q 17 63  ? 142.946 288.779 257.150 1.00 100.40 63  Bj 1 \nATOM 163  C CG  . LEU Q 17 63  ? 143.056 287.411 256.475 1.00 100.40 63  Bj 1 \nATOM 164  C CD1 . LEU Q 17 63  ? 143.238 287.556 254.972 1.00 100.40 63  Bj 1 \nATOM 165  C CD2 . LEU Q 17 63  ? 144.195 286.614 257.080 1.00 100.40 63  Bj 1 \nATOM 166  N N   . THR Q 17 64  ? 143.657 290.697 259.845 1.00 107.97 64  Bj 1 \nATOM 167  C CA  . THR Q 17 64  ? 143.667 292.093 260.253 1.00 107.97 64  Bj 1 \nATOM 168  C C   . THR Q 17 64  ? 143.516 292.982 259.019 1.00 107.97 64  Bj 1 \nATOM 169  O O   . THR Q 17 64  ? 144.073 292.666 257.964 1.00 107.97 64  Bj 1 \nATOM 170  C CB  . THR Q 17 64  ? 144.974 292.410 260.987 1.00 107.97 64  Bj 1 \nATOM 171  O OG1 . THR Q 17 64  ? 145.120 291.524 262.105 1.00 107.97 64  Bj 1 \nATOM 172  C CG2 . THR Q 17 64  ? 145.005 293.848 261.485 1.00 107.97 64  Bj 1 \nATOM 173  N N   . PRO Q 17 65  ? 142.750 294.076 259.102 1.00 107.81 65  Bj 1 \nATOM 174  C CA  . PRO Q 17 65  ? 142.603 294.962 257.932 1.00 107.81 65  Bj 1 \nATOM 175  C C   . PRO Q 17 65  ? 143.921 295.427 257.333 1.00 107.81 65  Bj 1 \nATOM 176  O O   . PRO Q 17 65  ? 144.005 295.621 256.112 1.00 107.81 65  Bj 1 \nATOM 177  C CB  . PRO Q 17 65  ? 141.785 296.141 258.486 1.00 107.81 65  Bj 1 \nATOM 178  C CG  . PRO Q 17 65  ? 141.775 295.966 259.988 1.00 107.81 65  Bj 1 \nATOM 179  C CD  . PRO Q 17 65  ? 141.881 294.498 260.212 1.00 107.81 65  Bj 1 \nATOM 180  N N   . LEU Q 17 66  ? 144.958 295.608 258.152 1.00 108.37 66  Bj 1 \nATOM 181  C CA  . LEU Q 17 66  ? 146.280 295.907 257.613 1.00 108.37 66  Bj 1 \nATOM 182  C C   . LEU Q 17 66  ? 146.764 294.776 256.714 1.00 108.37 66  Bj 1 \nATOM 183  O O   . LEU Q 17 66  ? 147.264 295.010 255.605 1.00 108.37 66  Bj 1 \nATOM 184  C CB  . LEU Q 17 66  ? 147.261 296.150 258.760 1.00 108.37 66  Bj 1 \nATOM 185  C CG  . 
LEU Q 17 66  ? 148.674 296.601 258.394 1.00 108.37 66  Bj 1 \nATOM 186  C CD1 . LEU Q 17 66  ? 148.637 297.948 257.693 1.00 108.37 66  Bj 1 \nATOM 187  C CD2 . LEU Q 17 66  ? 149.550 296.661 259.635 1.00 108.37 66  Bj 1 \nATOM 188  N N   . GLN Q 17 67  ? 146.602 293.533 257.172 1.00 108.81 67  Bj 1 \nATOM 189  C CA  . GLN Q 17 67  ? 146.992 292.387 256.360 1.00 108.81 67  Bj 1 \nATOM 190  C C   . GLN Q 17 67  ? 146.109 292.247 255.126 1.00 108.81 67  Bj 1 \nATOM 191  O O   . GLN Q 17 67  ? 146.569 291.758 254.091 1.00 108.81 67  Bj 1 \nATOM 192  C CB  . GLN Q 17 67  ? 146.951 291.114 257.204 1.00 108.81 67  Bj 1 \nATOM 193  C CG  . GLN Q 17 67  ? 147.901 291.140 258.391 1.00 108.81 67  Bj 1 \nATOM 194  C CD  . GLN Q 17 67  ? 148.113 289.770 259.002 1.00 108.81 67  Bj 1 \nATOM 195  O OE1 . GLN Q 17 67  ? 147.728 288.754 258.424 1.00 108.81 67  Bj 1 \nATOM 196  N NE2 . GLN Q 17 67  ? 148.730 289.735 260.177 1.00 108.81 67  Bj 1 \nATOM 197  N N   . GLU Q 17 68  ? 144.851 292.683 255.209 1.00 110.89 68  Bj 1 \nATOM 198  C CA  . GLU Q 17 68  ? 143.985 292.678 254.034 1.00 110.89 68  Bj 1 \nATOM 199  C C   . GLU Q 17 68  ? 144.476 293.670 252.987 1.00 110.89 68  Bj 1 \nATOM 200  O O   . GLU Q 17 68  ? 144.512 293.356 251.791 1.00 110.89 68  Bj 1 \nATOM 201  C CB  . GLU Q 17 68  ? 142.545 292.997 254.438 1.00 110.89 68  Bj 1 \nATOM 202  C CG  . GLU Q 17 68  ? 141.839 291.878 255.186 1.00 110.89 68  Bj 1 \nATOM 203  C CD  . GLU Q 17 68  ? 141.367 290.766 254.268 1.00 110.89 68  Bj 1 \nATOM 204  O OE1 . GLU Q 17 68  ? 141.481 290.917 253.034 1.00 110.89 68  Bj 1 \nATOM 205  O OE2 . GLU Q 17 68  ? 140.877 289.740 254.783 1.00 110.89 68  Bj 1 \nATOM 206  N N   . GLU Q 17 69  ? 144.845 294.877 253.421 1.00 119.08 69  Bj 1 \nATOM 207  C CA  . GLU Q 17 69  ? 145.448 295.841 252.506 1.00 119.08 69  Bj 1 \nATOM 208  C C   . GLU Q 17 69  ? 146.723 295.281 251.888 1.00 119.08 69  Bj 1 \nATOM 209  O O   . GLU Q 17 69  ? 146.964 295.440 250.684 1.00 119.08 69  Bj 1 \nATOM 210  C CB  . 
GLU Q 17 69  ? 145.744 297.150 253.237 1.00 119.08 69  Bj 1 \nATOM 211  C CG  . GLU Q 17 69  ? 144.526 297.820 253.844 1.00 119.08 69  Bj 1 \nATOM 212  C CD  . GLU Q 17 69  ? 144.878 299.094 254.586 1.00 119.08 69  Bj 1 \nATOM 213  O OE1 . GLU Q 17 69  ? 146.016 299.584 254.422 1.00 119.08 69  Bj 1 \nATOM 214  O OE2 . GLU Q 17 69  ? 144.018 299.605 255.334 1.00 119.08 69  Bj 1 \nATOM 215  N N   . MET Q 17 70  ? 147.551 294.620 252.702 1.00 119.12 70  Bj 1 \nATOM 216  C CA  . MET Q 17 70  ? 148.786 294.039 252.184 1.00 119.12 70  Bj 1 \nATOM 217  C C   . MET Q 17 70  ? 148.499 292.952 251.153 1.00 119.12 70  Bj 1 \nATOM 218  O O   . MET Q 17 70  ? 149.177 292.872 250.123 1.00 119.12 70  Bj 1 \nATOM 219  C CB  . MET Q 17 70  ? 149.628 293.487 253.335 1.00 119.12 70  Bj 1 \nATOM 220  C CG  . MET Q 17 70  ? 150.879 292.746 252.892 1.00 119.12 70  Bj 1 \nATOM 221  S SD  . MET Q 17 70  ? 151.859 293.670 251.693 1.00 119.12 70  Bj 1 \nATOM 222  C CE  . MET Q 17 70  ? 152.198 295.174 252.604 1.00 119.12 70  Bj 1 \nATOM 223  N N   . ALA Q 17 71  ? 147.494 292.112 251.408 1.00 117.23 71  Bj 1 \nATOM 224  C CA  . ALA Q 17 71  ? 147.151 291.056 250.461 1.00 117.23 71  Bj 1 \nATOM 225  C C   . ALA Q 17 71  ? 146.601 291.635 249.164 1.00 117.23 71  Bj 1 \nATOM 226  O O   . ALA Q 17 71  ? 146.901 291.130 248.075 1.00 117.23 71  Bj 1 \nATOM 227  C CB  . ALA Q 17 71  ? 146.146 290.093 251.089 1.00 117.23 71  Bj 1 \nATOM 228  N N   . ASP Q 17 72  ? 145.790 292.690 249.260 1.00 117.37 72  Bj 1 \nATOM 229  C CA  . ASP Q 17 72  ? 145.300 293.360 248.060 1.00 117.37 72  Bj 1 \nATOM 230  C C   . ASP Q 17 72  ? 146.459 293.920 247.245 1.00 117.37 72  Bj 1 \nATOM 231  O O   . ASP Q 17 72  ? 146.511 293.759 246.020 1.00 117.37 72  Bj 1 \nATOM 232  C CB  . ASP Q 17 72  ? 144.317 294.468 248.446 1.00 117.37 72  Bj 1 \nATOM 233  C CG  . ASP Q 17 72  ? 143.468 294.941 247.276 1.00 117.37 72  Bj 1 \nATOM 234  O OD1 . ASP Q 17 72  ? 143.969 294.974 246.132 1.00 117.37 72  Bj 1 \nATOM 235  O OD2 . 
ASP Q 17 72  ? 142.289 295.283 247.504 1.00 117.37 72  Bj 1 \nATOM 236  N N   . LEU Q 17 73  ? 147.405 294.580 247.919 1.00 119.96 73  Bj 1 \nATOM 237  C CA  . LEU Q 17 73  ? 148.572 295.115 247.226 1.00 119.96 73  Bj 1 \nATOM 238  C C   . LEU Q 17 73  ? 149.385 294.005 246.571 1.00 119.96 73  Bj 1 \nATOM 239  O O   . LEU Q 17 73  ? 149.873 294.161 245.443 1.00 119.96 73  Bj 1 \nATOM 240  C CB  . LEU Q 17 73  ? 149.436 295.910 248.205 1.00 119.96 73  Bj 1 \nATOM 241  C CG  . LEU Q 17 73  ? 150.798 296.368 247.685 1.00 119.96 73  Bj 1 \nATOM 242  C CD1 . LEU Q 17 73  ? 150.633 297.215 246.438 1.00 119.96 73  Bj 1 \nATOM 243  C CD2 . LEU Q 17 73  ? 151.550 297.134 248.760 1.00 119.96 73  Bj 1 \nATOM 244  N N   . LEU Q 17 74  ? 149.546 292.877 247.266 1.00 118.44 74  Bj 1 \nATOM 245  C CA  . LEU Q 17 74  ? 150.309 291.766 246.709 1.00 118.44 74  Bj 1 \nATOM 246  C C   . LEU Q 17 74  ? 149.627 291.192 245.476 1.00 118.44 74  Bj 1 \nATOM 247  O O   . LEU Q 17 74  ? 150.288 290.911 244.472 1.00 118.44 74  Bj 1 \nATOM 248  C CB  . LEU Q 17 74  ? 150.513 290.683 247.766 1.00 118.44 74  Bj 1 \nATOM 249  C CG  . LEU Q 17 74  ? 151.495 291.024 248.888 1.00 118.44 74  Bj 1 \nATOM 250  C CD1 . LEU Q 17 74  ? 151.535 289.909 249.915 1.00 118.44 74  Bj 1 \nATOM 251  C CD2 . LEU Q 17 74  ? 152.883 291.289 248.326 1.00 118.44 74  Bj 1 \nATOM 252  N N   . GLN Q 17 75  ? 148.305 291.017 245.529 1.00 121.57 75  Bj 1 \nATOM 253  C CA  . GLN Q 17 75  ? 147.584 290.533 244.356 1.00 121.57 75  Bj 1 \nATOM 254  C C   . GLN Q 17 75  ? 147.705 291.512 243.195 1.00 121.57 75  Bj 1 \nATOM 255  O O   . GLN Q 17 75  ? 147.891 291.101 242.042 1.00 121.57 75  Bj 1 \nATOM 256  C CB  . GLN Q 17 75  ? 146.116 290.286 244.704 1.00 121.57 75  Bj 1 \nATOM 257  C CG  . GLN Q 17 75  ? 145.881 289.058 245.568 1.00 121.57 75  Bj 1 \nATOM 258  C CD  . GLN Q 17 75  ? 146.176 287.763 244.836 1.00 121.57 75  Bj 1 \nATOM 259  O OE1 . GLN Q 17 75  ? 146.161 287.713 243.606 1.00 121.57 75  Bj 1 \nATOM 260  N NE2 . 
GLN Q 17 75  ? 146.449 286.705 245.592 1.00 121.57 75  Bj 1 \nATOM 261  N N   . GLN Q 17 76  ? 147.617 292.813 243.483 1.00 121.41 76  Bj 1 \nATOM 262  C CA  . GLN Q 17 76  ? 147.734 293.811 242.425 1.00 121.41 76  Bj 1 \nATOM 263  C C   . GLN Q 17 76  ? 149.103 293.751 241.760 1.00 121.41 76  Bj 1 \nATOM 264  O O   . GLN Q 17 76  ? 149.204 293.703 240.529 1.00 121.41 76  Bj 1 \nATOM 265  C CB  . GLN Q 17 76  ? 147.468 295.209 242.984 1.00 121.41 76  Bj 1 \nATOM 266  C CG  . GLN Q 17 76  ? 146.016 295.474 243.336 1.00 121.41 76  Bj 1 \nATOM 267  C CD  . GLN Q 17 76  ? 145.782 296.899 243.795 1.00 121.41 76  Bj 1 \nATOM 268  O OE1 . GLN Q 17 76  ? 146.644 297.764 243.637 1.00 121.41 76  Bj 1 \nATOM 269  N NE2 . GLN Q 17 76  ? 144.612 297.151 244.370 1.00 121.41 76  Bj 1 \nATOM 270  N N   . ILE Q 17 77  ? 150.173 293.743 242.560 1.00 121.50 77  Bj 1 \nATOM 271  C CA  . ILE Q 17 77  ? 151.509 293.737 241.969 1.00 121.50 77  Bj 1 \nATOM 272  C C   . ILE Q 17 77  ? 151.794 292.406 241.283 1.00 121.50 77  Bj 1 \nATOM 273  O O   . ILE Q 17 77  ? 152.530 292.360 240.289 1.00 121.50 77  Bj 1 \nATOM 274  C CB  . ILE Q 17 77  ? 152.579 294.076 243.026 1.00 121.50 77  Bj 1 \nATOM 275  C CG1 . ILE Q 17 77  ? 152.598 293.031 244.141 1.00 121.50 77  Bj 1 \nATOM 276  C CG2 . ILE Q 17 77  ? 152.341 295.466 243.594 1.00 121.50 77  Bj 1 \nATOM 277  C CD1 . ILE Q 17 77  ? 153.596 293.329 245.239 1.00 121.50 77  Bj 1 \nATOM 278  N N   . GLU Q 17 78  ? 151.203 291.311 241.770 1.00 127.63 78  Bj 1 \nATOM 279  C CA  . GLU Q 17 78  ? 151.360 290.022 241.105 1.00 127.63 78  Bj 1 \nATOM 280  C C   . GLU Q 17 78  ? 150.720 290.042 239.724 1.00 127.63 78  Bj 1 \nATOM 281  O O   . GLU Q 17 78  ? 151.334 289.616 238.738 1.00 127.63 78  Bj 1 \nATOM 282  C CB  . GLU Q 17 78  ? 150.751 288.916 241.968 1.00 127.63 78  Bj 1 \nATOM 283  C CG  . GLU Q 17 78  ? 150.750 287.538 241.324 1.00 127.63 78  Bj 1 \nATOM 284  C CD  . GLU Q 17 78  ? 149.964 286.520 242.129 1.00 127.63 78  Bj 1 \nATOM 285  O OE1 . 
GLU Q 17 78  ? 149.341 286.910 243.139 1.00 127.63 78  Bj 1 \nATOM 286  O OE2 . GLU Q 17 78  ? 149.967 285.329 241.753 1.00 127.63 78  Bj 1 \nATOM 287  N N   . ILE Q 17 79  ? 149.483 290.539 239.634 1.00 128.89 79  Bj 1 \nATOM 288  C CA  . ILE Q 17 79  ? 148.823 290.642 238.336 1.00 128.89 79  Bj 1 \nATOM 289  C C   . ILE Q 17 79  ? 149.572 291.607 237.426 1.00 128.89 79  Bj 1 \nATOM 290  O O   . ILE Q 17 79  ? 149.639 291.400 236.208 1.00 128.89 79  Bj 1 \nATOM 291  C CB  . ILE Q 17 79  ? 147.349 291.057 238.519 1.00 128.89 79  Bj 1 \nATOM 292  C CG1 . ILE Q 17 79  ? 146.601 290.011 239.349 1.00 128.89 79  Bj 1 \nATOM 293  C CG2 . ILE Q 17 79  ? 146.667 291.245 237.171 1.00 128.89 79  Bj 1 \nATOM 294  C CD1 . ILE Q 17 79  ? 145.159 290.370 239.635 1.00 128.89 79  Bj 1 \nATOM 295  N N   . GLU Q 17 80  ? 150.159 292.661 237.996 1.00 120.51 80  Bj 1 \nATOM 296  C CA  . GLU Q 17 80  ? 150.899 293.625 237.187 1.00 120.51 80  Bj 1 \nATOM 297  C C   . GLU Q 17 80  ? 152.154 292.998 236.589 1.00 120.51 80  Bj 1 \nATOM 298  O O   . GLU Q 17 80  ? 152.403 293.116 235.384 1.00 120.51 80  Bj 1 \nATOM 299  C CB  . GLU Q 17 80  ? 151.254 294.849 238.029 1.00 120.51 80  Bj 1 \nATOM 300  C CG  . GLU Q 17 80  ? 150.076 295.764 238.317 1.00 120.51 80  Bj 1 \nATOM 301  C CD  . GLU Q 17 80  ? 150.361 296.745 239.436 1.00 120.51 80  Bj 1 \nATOM 302  O OE1 . GLU Q 17 80  ? 151.384 296.573 240.132 1.00 120.51 80  Bj 1 \nATOM 303  O OE2 . GLU Q 17 80  ? 149.562 297.686 239.621 1.00 120.51 80  Bj 1 \nATOM 304  N N   . ARG Q 17 81  ? 152.958 292.327 237.415 1.00 127.65 81  Bj 1 \nATOM 305  C CA  . ARG Q 17 81  ? 154.175 291.694 236.924 1.00 127.65 81  Bj 1 \nATOM 306  C C   . ARG Q 17 81  ? 153.910 290.416 236.139 1.00 127.65 81  Bj 1 \nATOM 307  O O   . ARG Q 17 81  ? 154.830 289.913 235.485 1.00 127.65 81  Bj 1 \nATOM 308  C CB  . ARG Q 17 81  ? 155.125 291.390 238.086 1.00 127.65 81  Bj 1 \nATOM 309  C CG  . ARG Q 17 81  ? 155.793 292.620 238.677 1.00 127.65 81  Bj 1 \nATOM 310  C CD  . 
ARG Q 17 81  ? 156.934 292.237 239.606 1.00 127.65 81  Bj 1 \nATOM 311  N NE  . ARG Q 17 81  ? 157.606 293.409 240.160 1.00 127.65 81  Bj 1 \nATOM 312  C CZ  . ARG Q 17 81  ? 158.686 293.357 240.933 1.00 127.65 81  Bj 1 \nATOM 313  N NH1 . ARG Q 17 81  ? 159.223 292.186 241.246 1.00 127.65 81  Bj 1 \nATOM 314  N NH2 . ARG Q 17 81  ? 159.230 294.475 241.393 1.00 127.65 81  Bj 1 \nATOM 315  N N   . SER Q 17 82  ? 152.693 289.881 236.188 1.00 132.55 82  Bj 1 \nATOM 316  C CA  . SER Q 17 82  ? 152.370 288.695 235.409 1.00 132.55 82  Bj 1 \nATOM 317  C C   . SER Q 17 82  ? 152.400 289.006 233.917 1.00 132.55 82  Bj 1 \nATOM 318  O O   . SER Q 17 82  ? 152.138 290.132 233.487 1.00 132.55 82  Bj 1 \nATOM 319  C CB  . SER Q 17 82  ? 150.995 288.155 235.799 1.00 132.55 82  Bj 1 \nATOM 320  O OG  . SER Q 17 82  ? 150.618 287.084 234.953 1.00 132.55 82  Bj 1 \nATOM 321  N N   . LEU Q 17 83  ? 152.726 287.986 233.123 1.00 141.40 83  Bj 1 \nATOM 322  C CA  . LEU Q 17 83  ? 152.784 288.167 231.677 1.00 141.40 83  Bj 1 \nATOM 323  C C   . LEU Q 17 83  ? 151.391 288.102 231.062 1.00 141.40 83  Bj 1 \nATOM 324  O O   . LEU Q 17 83  ? 150.906 289.086 230.495 1.00 141.40 83  Bj 1 \nATOM 325  C CB  . LEU Q 17 83  ? 153.703 287.117 231.046 1.00 141.40 83  Bj 1 \nATOM 326  C CG  . LEU Q 17 83  ? 155.217 287.359 231.080 1.00 141.40 83  Bj 1 \nATOM 327  C CD1 . LEU Q 17 83  ? 155.777 287.271 232.494 1.00 141.40 83  Bj 1 \nATOM 328  C CD2 . LEU Q 17 83  ? 155.934 286.382 230.159 1.00 141.40 83  Bj 1 \nATOM 329  N N   . TYR Q 17 84  ? 150.729 286.953 231.185 1.00 138.40 84  Bj 1 \nATOM 330  C CA  . TYR Q 17 84  ? 149.374 286.749 230.687 1.00 138.40 84  Bj 1 \nATOM 331  C C   . TYR Q 17 84  ? 148.911 285.361 231.099 1.00 138.40 84  Bj 1 \nATOM 332  O O   . TYR Q 17 84  ? 149.722 284.476 231.384 1.00 138.40 84  Bj 1 \nATOM 333  C CB  . TYR Q 17 84  ? 149.286 286.904 229.164 1.00 138.40 84  Bj 1 \nATOM 334  C CG  . TYR Q 17 84  ? 148.728 288.236 228.722 1.00 138.40 84  Bj 1 \nATOM 335  C CD1 . 
TYR Q 17 84  ? 147.825 288.929 229.517 1.00 138.40 84  Bj 1 \nATOM 336  C CD2 . TYR Q 17 84  ? 149.110 288.805 227.515 1.00 138.40 84  Bj 1 \nATOM 337  C CE1 . TYR Q 17 84  ? 147.313 290.147 229.120 1.00 138.40 84  Bj 1 \nATOM 338  C CE2 . TYR Q 17 84  ? 148.604 290.023 227.109 1.00 138.40 84  Bj 1 \nATOM 339  C CZ  . TYR Q 17 84  ? 147.706 290.690 227.916 1.00 138.40 84  Bj 1 \nATOM 340  O OH  . TYR Q 17 84  ? 147.198 291.905 227.517 1.00 138.40 84  Bj 1 \nATOM 341  N N   . SER Q 17 85  ? 147.594 285.185 231.119 1.00 142.26 85  Bj 1 \nATOM 342  C CA  . SER Q 17 85  ? 146.972 283.899 231.385 1.00 142.26 85  Bj 1 \nATOM 343  C C   . SER Q 17 85  ? 146.297 283.383 230.122 1.00 142.26 85  Bj 1 \nATOM 344  O O   . SER Q 17 85  ? 145.916 284.154 229.237 1.00 142.26 85  Bj 1 \nATOM 345  C CB  . SER Q 17 85  ? 145.951 284.005 232.523 1.00 142.26 85  Bj 1 \nATOM 346  O OG  . SER Q 17 85  ? 145.350 282.749 232.786 1.00 142.26 85  Bj 1 \nATOM 347  N N   . ASP Q 17 86  ? 146.159 282.058 230.045 1.00 146.76 86  Bj 1 \nATOM 348  C CA  . ASP Q 17 86  ? 145.513 281.453 228.884 1.00 146.76 86  Bj 1 \nATOM 349  C C   . ASP Q 17 86  ? 144.067 281.911 228.760 1.00 146.76 86  Bj 1 \nATOM 350  O O   . ASP Q 17 86  ? 143.592 282.202 227.656 1.00 146.76 86  Bj 1 \nATOM 351  C CB  . ASP Q 17 86  ? 145.586 279.929 228.976 1.00 146.76 86  Bj 1 \nATOM 352  C CG  . ASP Q 17 86  ? 147.009 279.410 228.939 1.00 146.76 86  Bj 1 \nATOM 353  O OD1 . ASP Q 17 86  ? 147.939 280.227 228.775 1.00 146.76 86  Bj 1 \nATOM 354  O OD2 . ASP Q 17 86  ? 147.198 278.182 229.073 1.00 146.76 86  Bj 1 \nATOM 355  N N   . HIS Q 17 87  ? 143.355 281.991 229.886 1.00 143.58 87  Bj 1 \nATOM 356  C CA  . HIS Q 17 87  ? 141.955 282.403 229.864 1.00 143.58 87  Bj 1 \nATOM 357  C C   . HIS Q 17 87  ? 141.808 283.826 229.339 1.00 143.58 87  Bj 1 \nATOM 358  O O   . HIS Q 17 87  ? 141.013 284.086 228.428 1.00 143.58 87  Bj 1 \nATOM 359  C CB  . HIS Q 17 87  ? 141.361 282.274 231.266 1.00 143.58 87  Bj 1 \nATOM 360  C CG  . 
HIS Q 17 87  ? 139.966 282.801 231.387 1.00 143.58 87  Bj 1 \nATOM 361  N ND1 . HIS Q 17 87  ? 138.892 282.220 230.748 1.00 143.58 87  Bj 1 \nATOM 362  C CD2 . HIS Q 17 87  ? 139.468 283.854 232.078 1.00 143.58 87  Bj 1 \nATOM 363  C CE1 . HIS Q 17 87  ? 137.793 282.893 231.039 1.00 143.58 87  Bj 1 \nATOM 364  N NE2 . HIS Q 17 87  ? 138.115 283.889 231.844 1.00 143.58 87  Bj 1 \nATOM 365  N N   . GLU Q 17 88  ? 142.573 284.764 229.906 1.00 144.20 88  Bj 1 \nATOM 366  C CA  . GLU Q 17 88  ? 142.496 286.152 229.463 1.00 144.20 88  Bj 1 \nATOM 367  C C   . GLU Q 17 88  ? 142.938 286.295 228.013 1.00 144.20 88  Bj 1 \nATOM 368  O O   . GLU Q 17 88  ? 142.350 287.073 227.251 1.00 144.20 88  Bj 1 \nATOM 369  C CB  . GLU Q 17 88  ? 143.348 287.040 230.370 1.00 144.20 88  Bj 1 \nATOM 370  C CG  . GLU Q 17 88  ? 142.916 287.043 231.827 1.00 144.20 88  Bj 1 \nATOM 371  C CD  . GLU Q 17 88  ? 141.589 287.744 232.044 1.00 144.20 88  Bj 1 \nATOM 372  O OE1 . GLU Q 17 88  ? 141.201 288.571 231.193 1.00 144.20 88  Bj 1 \nATOM 373  O OE2 . GLU Q 17 88  ? 140.932 287.466 233.070 1.00 144.20 88  Bj 1 \nATOM 374  N N   . LEU Q 17 89  ? 143.972 285.551 227.614 1.00 150.45 89  Bj 1 \nATOM 375  C CA  . LEU Q 17 89  ? 144.455 285.625 226.240 1.00 150.45 89  Bj 1 \nATOM 376  C C   . LEU Q 17 89  ? 143.384 285.161 225.263 1.00 150.45 89  Bj 1 \nATOM 377  O O   . LEU Q 17 89  ? 143.108 285.834 224.263 1.00 150.45 89  Bj 1 \nATOM 378  C CB  . LEU Q 17 89  ? 145.732 284.795 226.090 1.00 150.45 89  Bj 1 \nATOM 379  C CG  . LEU Q 17 89  ? 146.537 284.942 224.794 1.00 150.45 89  Bj 1 \nATOM 380  C CD1 . LEU Q 17 89  ? 148.022 284.792 225.081 1.00 150.45 89  Bj 1 \nATOM 381  C CD2 . LEU Q 17 89  ? 146.100 283.926 223.748 1.00 150.45 89  Bj 1 \nATOM 382  N N   . ARG Q 17 90  ? 142.765 284.008 225.537 1.00 152.73 90  Bj 1 \nATOM 383  C CA  . ARG Q 17 90  ? 141.701 283.518 224.667 1.00 152.73 90  Bj 1 \nATOM 384  C C   . ARG Q 17 90  ? 140.519 284.478 224.647 1.00 152.73 90  Bj 1 \nATOM 385  O O   . 
ARG Q 17 90  ? 139.922 284.715 223.590 1.00 152.73 90  Bj 1 \nATOM 386  C CB  . ARG Q 17 90  ? 141.249 282.128 225.114 1.00 152.73 90  Bj 1 \nATOM 387  C CG  . ARG Q 17 90  ? 142.304 281.042 224.985 1.00 152.73 90  Bj 1 \nATOM 388  C CD  . ARG Q 17 90  ? 141.785 279.721 225.532 1.00 152.73 90  Bj 1 \nATOM 389  N NE  . ARG Q 17 90  ? 142.813 278.685 225.563 1.00 152.73 90  Bj 1 \nATOM 390  C CZ  . ARG Q 17 90  ? 142.621 277.456 226.032 1.00 152.73 90  Bj 1 \nATOM 391  N NH1 . ARG Q 17 90  ? 141.435 277.105 226.511 1.00 152.73 90  Bj 1 \nATOM 392  N NH2 . ARG Q 17 90  ? 143.613 276.577 226.022 1.00 152.73 90  Bj 1 \nATOM 393  N N   . ALA Q 17 91  ? 140.174 285.051 225.804 1.00 151.16 91  Bj 1 \nATOM 394  C CA  . ALA Q 17 91  ? 139.046 285.974 225.863 1.00 151.16 91  Bj 1 \nATOM 395  C C   . ALA Q 17 91  ? 139.295 287.204 225.000 1.00 151.16 91  Bj 1 \nATOM 396  O O   . ALA Q 17 91  ? 138.448 287.586 224.184 1.00 151.16 91  Bj 1 \nATOM 397  C CB  . ALA Q 17 91  ? 138.774 286.377 227.313 1.00 151.16 91  Bj 1 \nATOM 398  N N   . LEU Q 17 92  ? 140.462 287.836 225.160 1.00 153.35 92  Bj 1 \nATOM 399  C CA  . LEU Q 17 92  ? 140.757 289.032 224.378 1.00 153.35 92  Bj 1 \nATOM 400  C C   . LEU Q 17 92  ? 140.911 288.700 222.898 1.00 153.35 92  Bj 1 \nATOM 401  O O   . LEU Q 17 92  ? 140.504 289.488 222.035 1.00 153.35 92  Bj 1 \nATOM 402  C CB  . LEU Q 17 92  ? 142.008 289.729 224.920 1.00 153.35 92  Bj 1 \nATOM 403  C CG  . LEU Q 17 92  ? 143.367 289.021 224.908 1.00 153.35 92  Bj 1 \nATOM 404  C CD1 . LEU Q 17 92  ? 144.128 289.267 223.608 1.00 153.35 92  Bj 1 \nATOM 405  C CD2 . LEU Q 17 92  ? 144.198 289.456 226.107 1.00 153.35 92  Bj 1 \nATOM 406  N N   . ASP Q 17 93  ? 141.477 287.531 222.583 1.00 158.04 93  Bj 1 \nATOM 407  C CA  . ASP Q 17 93  ? 141.618 287.134 221.188 1.00 158.04 93  Bj 1 \nATOM 408  C C   . ASP Q 17 93  ? 140.259 286.958 220.528 1.00 158.04 93  Bj 1 \nATOM 409  O O   . ASP Q 17 93  ? 140.031 287.459 219.422 1.00 158.04 93  Bj 1 \nATOM 410  C CB  . 
ASP Q 17 93  ? 142.435 285.845 221.091 1.00 158.04 93  Bj 1 \nATOM 411  C CG  . ASP Q 17 93  ? 142.537 285.325 219.671 1.00 158.04 93  Bj 1 \nATOM 412  O OD1 . ASP Q 17 93  ? 143.236 285.958 218.852 1.00 158.04 93  Bj 1 \nATOM 413  O OD2 . ASP Q 17 93  ? 141.915 284.283 219.372 1.00 158.04 93  Bj 1 \nATOM 414  N N   . GLU Q 17 94  ? 139.338 286.257 221.195 1.00 152.75 94  Bj 1 \nATOM 415  C CA  . GLU Q 17 94  ? 138.009 286.061 220.624 1.00 152.75 94  Bj 1 \nATOM 416  C C   . GLU Q 17 94  ? 137.242 287.374 220.544 1.00 152.75 94  Bj 1 \nATOM 417  O O   . GLU Q 17 94  ? 136.508 287.609 219.576 1.00 152.75 94  Bj 1 \nATOM 418  C CB  . GLU Q 17 94  ? 137.232 285.028 221.439 1.00 152.75 94  Bj 1 \nATOM 419  C CG  . GLU Q 17 94  ? 137.821 283.622 221.404 1.00 152.75 94  Bj 1 \nATOM 420  C CD  . GLU Q 17 94  ? 137.812 283.008 220.014 1.00 152.75 94  Bj 1 \nATOM 421  O OE1 . GLU Q 17 94  ? 138.701 283.342 219.202 1.00 152.75 94  Bj 1 \nATOM 422  O OE2 . GLU Q 17 94  ? 136.913 282.189 219.734 1.00 152.75 94  Bj 1 \nATOM 423  N N   . ALA Q 17 95  ? 137.404 288.249 221.541 1.00 149.73 95  Bj 1 \nATOM 424  C CA  . ALA Q 17 95  ? 136.744 289.549 221.485 1.00 149.73 95  Bj 1 \nATOM 425  C C   . ALA Q 17 95  ? 137.228 290.374 220.300 1.00 149.73 95  Bj 1 \nATOM 426  O O   . ALA Q 17 95  ? 136.409 290.925 219.556 1.00 149.73 95  Bj 1 \nATOM 427  C CB  . ALA Q 17 95  ? 136.966 290.311 222.791 1.00 149.73 95  Bj 1 \nATOM 428  N N   . GLN Q 17 96  ? 138.545 290.458 220.098 1.00 150.30 96  Bj 1 \nATOM 429  C CA  . GLN Q 17 96  ? 139.069 291.205 218.961 1.00 150.30 96  Bj 1 \nATOM 430  C C   . GLN Q 17 96  ? 138.693 290.549 217.637 1.00 150.30 96  Bj 1 \nATOM 431  O O   . GLN Q 17 96  ? 138.419 291.247 216.653 1.00 150.30 96  Bj 1 \nATOM 432  C CB  . GLN Q 17 96  ? 140.587 291.346 219.080 1.00 150.30 96  Bj 1 \nATOM 433  C CG  . GLN Q 17 96  ? 141.037 292.145 220.293 1.00 150.30 96  Bj 1 \nATOM 434  C CD  . GLN Q 17 96  ? 142.543 292.301 220.364 1.00 150.30 96  Bj 1 \nATOM 435  O OE1 . 
GLN Q 17 96  ? 143.262 291.925 219.438 1.00 150.30 96  Bj 1 \nATOM 436  N NE2 . GLN Q 17 96  ? 143.029 292.859 221.467 1.00 150.30 96  Bj 1 \nATOM 437  N N   . GLN Q 17 97  ? 138.657 289.214 217.595 1.00 151.44 97  Bj 1 \nATOM 438  C CA  . GLN Q 17 97  ? 138.274 288.528 216.367 1.00 151.44 97  Bj 1 \nATOM 439  C C   . GLN Q 17 97  ? 136.824 288.819 216.005 1.00 151.44 97  Bj 1 \nATOM 440  O O   . GLN Q 17 97  ? 136.511 289.077 214.838 1.00 151.44 97  Bj 1 \nATOM 441  C CB  . GLN Q 17 97  ? 138.504 287.024 216.512 1.00 151.44 97  Bj 1 \nATOM 442  C CG  . GLN Q 17 97  ? 138.299 286.242 215.225 1.00 151.44 97  Bj 1 \nATOM 443  C CD  . GLN Q 17 97  ? 138.665 284.777 215.367 1.00 151.44 97  Bj 1 \nATOM 444  O OE1 . GLN Q 17 97  ? 138.752 284.049 214.377 1.00 151.44 97  Bj 1 \nATOM 445  N NE2 . GLN Q 17 97  ? 138.881 284.336 216.601 1.00 151.44 97  Bj 1 \nATOM 446  N N   . LEU Q 17 98  ? 135.926 288.798 216.992 1.00 148.86 98  Bj 1 \nATOM 447  C CA  . LEU Q 17 98  ? 134.535 289.147 216.723 1.00 148.86 98  Bj 1 \nATOM 448  C C   . LEU Q 17 98  ? 134.399 290.617 216.343 1.00 148.86 98  Bj 1 \nATOM 449  O O   . LEU Q 17 98  ? 133.602 290.963 215.462 1.00 148.86 98  Bj 1 \nATOM 450  C CB  . LEU Q 17 98  ? 133.663 288.821 217.936 1.00 148.86 98  Bj 1 \nATOM 451  C CG  . LEU Q 17 98  ? 132.970 287.455 217.941 1.00 148.86 98  Bj 1 \nATOM 452  C CD1 . LEU Q 17 98  ? 133.982 286.318 217.938 1.00 148.86 98  Bj 1 \nATOM 453  C CD2 . LEU Q 17 98  ? 132.028 287.335 219.129 1.00 148.86 98  Bj 1 \nATOM 454  N N   . ALA Q 17 99  ? 135.174 291.494 216.988 1.00 145.68 99  Bj 1 \nATOM 455  C CA  . ALA Q 17 99  ? 135.111 292.915 216.661 1.00 145.68 99  Bj 1 \nATOM 456  C C   . ALA Q 17 99  ? 135.546 293.172 215.225 1.00 145.68 99  Bj 1 \nATOM 457  O O   . ALA Q 17 99  ? 134.966 294.018 214.534 1.00 145.68 99  Bj 1 \nATOM 458  C CB  . ALA Q 17 99  ? 135.974 293.716 217.636 1.00 145.68 99  Bj 1 \nATOM 459  N N   . LYS Q 17 100 ? 136.567 292.452 214.755 1.00 146.95 100 Bj 1 \nATOM 460  C CA  . 
LYS Q 17 100 ? 137.039 292.630 213.387 1.00 146.95 100 Bj 1 \nATOM 461  C C   . LYS Q 17 100 ? 136.219 291.845 212.371 1.00 146.95 100 Bj 1 \nATOM 462  O O   . LYS Q 17 100 ? 136.274 292.159 211.177 1.00 146.95 100 Bj 1 \nATOM 463  C CB  . LYS Q 17 100 ? 138.514 292.233 213.279 1.00 146.95 100 Bj 1 \nATOM 464  C CG  . LYS Q 17 100 ? 139.442 293.056 214.160 1.00 146.95 100 Bj 1 \nATOM 465  C CD  . LYS Q 17 100 ? 139.237 294.550 213.946 1.00 146.95 100 Bj 1 \nATOM 466  C CE  . LYS Q 17 100 ? 139.610 294.973 212.533 1.00 146.95 100 Bj 1 \nATOM 467  N NZ  . LYS Q 17 100 ? 139.301 296.408 212.288 1.00 146.95 100 Bj 1 \nATOM 468  N N   . LYS Q 17 101 ? 135.468 290.833 212.812 1.00 146.63 101 Bj 1 \nATOM 469  C CA  . LYS Q 17 101 ? 134.598 290.100 211.900 1.00 146.63 101 Bj 1 \nATOM 470  C C   . LYS Q 17 101 ? 133.263 290.804 211.699 1.00 146.63 101 Bj 1 \nATOM 471  O O   . LYS Q 17 101 ? 132.679 290.714 210.613 1.00 146.63 101 Bj 1 \nATOM 472  C CB  . LYS Q 17 101 ? 134.377 288.677 212.420 1.00 146.63 101 Bj 1 \nATOM 473  C CG  . LYS Q 17 101 ? 133.447 287.827 211.565 1.00 146.63 101 Bj 1 \nATOM 474  C CD  . LYS Q 17 101 ? 133.953 287.708 210.137 1.00 146.63 101 Bj 1 \nATOM 475  C CE  . LYS Q 17 101 ? 132.991 286.903 209.277 1.00 146.63 101 Bj 1 \nATOM 476  N NZ  . LYS Q 17 101 ? 133.449 286.811 207.864 1.00 146.63 101 Bj 1 \nATOM 477  N N   . LYS Q 17 102 ? 132.768 291.510 212.721 1.00 149.37 102 Bj 1 \nATOM 478  C CA  . LYS Q 17 102 ? 131.516 292.243 212.568 1.00 149.37 102 Bj 1 \nATOM 479  C C   . LYS Q 17 102 ? 131.629 293.337 211.515 1.00 149.37 102 Bj 1 \nATOM 480  O O   . LYS Q 17 102 ? 130.622 293.722 210.910 1.00 149.37 102 Bj 1 \nATOM 481  C CB  . LYS Q 17 102 ? 131.084 292.839 213.908 1.00 149.37 102 Bj 1 \nATOM 482  C CG  . LYS Q 17 102 ? 130.550 291.819 214.900 1.00 149.37 102 Bj 1 \nATOM 483  C CD  . LYS Q 17 102 ? 130.124 292.485 216.198 1.00 149.37 102 Bj 1 \nATOM 484  C CE  . LYS Q 17 102 ? 129.052 293.533 215.952 1.00 149.37 102 Bj 1 \nATOM 485  N NZ  . 
LYS Q 17 102 ? 127.840 292.944 215.321 1.00 149.37 102 Bj 1 \nATOM 486  N N   . SER Q 17 103 ? 132.836 293.849 211.283 1.00 153.12 103 Bj 1 \nATOM 487  C CA  . SER Q 17 103 ? 133.065 294.846 210.248 1.00 153.12 103 Bj 1 \nATOM 488  C C   . SER Q 17 103 ? 133.347 294.232 208.883 1.00 153.12 103 Bj 1 \nATOM 489  O O   . SER Q 17 103 ? 133.244 294.935 207.872 1.00 153.12 103 Bj 1 \nATOM 490  C CB  . SER Q 17 103 ? 134.228 295.762 210.645 1.00 153.12 103 Bj 1 \nATOM 491  O OG  . SER Q 17 103 ? 135.428 295.024 210.805 1.00 153.12 103 Bj 1 \nATOM 492  N N   . ASP Q 17 104 ? 133.696 292.950 208.828 1.00 150.06 104 Bj 1 \nATOM 493  C CA  . ASP Q 17 104 ? 133.990 292.286 207.564 1.00 150.06 104 Bj 1 \nATOM 494  C C   . ASP Q 17 104 ? 133.253 290.954 207.461 1.00 150.06 104 Bj 1 \nATOM 495  O O   . ASP Q 17 104 ? 132.042 290.886 207.671 1.00 150.06 104 Bj 1 \nATOM 496  C CB  . ASP Q 17 104 ? 135.497 292.067 207.412 1.00 150.06 104 Bj 1 \nATOM 497  C CG  . ASP Q 17 104 ? 135.859 291.377 206.111 1.00 150.06 104 Bj 1 \nATOM 498  O OD1 . ASP Q 17 104 ? 135.698 292.000 205.040 1.00 150.06 104 Bj 1 \nATOM 499  O OD2 . ASP Q 17 104 ? 136.307 290.212 206.158 1.00 150.06 104 Bj 1 \nATOM 500  N N   . LEU Q 17 116 ? 133.163 280.213 224.046 1.00 145.92 116 Bj 1 \nATOM 501  C CA  . LEU Q 17 116 ? 133.824 281.452 224.439 1.00 145.92 116 Bj 1 \nATOM 502  C C   . LEU Q 17 116 ? 134.248 281.400 225.904 1.00 145.92 116 Bj 1 \nATOM 503  O O   . LEU Q 17 116 ? 134.010 280.409 226.594 1.00 145.92 116 Bj 1 \nATOM 504  C CB  . LEU Q 17 116 ? 132.909 282.657 224.197 1.00 145.92 116 Bj 1 \nATOM 505  C CG  . LEU Q 17 116 ? 132.645 283.081 222.748 1.00 145.92 116 Bj 1 \nATOM 506  C CD1 . LEU Q 17 116 ? 133.940 283.098 221.947 1.00 145.92 116 Bj 1 \nATOM 507  C CD2 . LEU Q 17 116 ? 131.596 282.203 222.072 1.00 145.92 116 Bj 1 \nATOM 508  N N   . ALA Q 17 117 ? 134.878 282.476 226.373 1.00 150.38 117 Bj 1 \nATOM 509  C CA  . ALA Q 17 117 ? 135.358 282.543 227.748 1.00 150.38 117 Bj 1 \nATOM 510  C C   . 
ALA Q 17 117 ? 134.316 283.114 228.702 1.00 150.38 117 Bj 1 \nATOM 511  O O   . ALA Q 17 117 ? 134.259 282.710 229.870 1.00 150.38 117 Bj 1 \nATOM 512  C CB  . ALA Q 17 117 ? 136.638 283.378 227.815 1.00 150.38 117 Bj 1 \nATOM 513  N N   . GLN Q 17 118 ? 133.490 284.050 228.229 1.00 142.89 118 Bj 1 \nATOM 514  C CA  . GLN Q 17 118 ? 132.488 284.656 229.099 1.00 142.89 118 Bj 1 \nATOM 515  C C   . GLN Q 17 118 ? 131.425 283.644 229.507 1.00 142.89 118 Bj 1 \nATOM 516  O O   . GLN Q 17 118 ? 130.930 283.680 230.639 1.00 142.89 118 Bj 1 \nATOM 517  C CB  . GLN Q 17 118 ? 131.852 285.861 228.409 1.00 142.89 118 Bj 1 \nATOM 518  C CG  . GLN Q 17 118 ? 132.831 286.982 228.103 1.00 142.89 118 Bj 1 \nATOM 519  C CD  . GLN Q 17 118 ? 132.150 288.215 227.546 1.00 142.89 118 Bj 1 \nATOM 520  O OE1 . GLN Q 17 118 ? 130.942 288.218 227.309 1.00 142.89 118 Bj 1 \nATOM 521  N NE2 . GLN Q 17 118 ? 132.924 289.274 227.337 1.00 142.89 118 Bj 1 \nATOM 522  N N   . ASP Q 17 119 ? 131.065 282.731 228.601 1.00 146.82 119 Bj 1 \nATOM 523  C CA  . ASP Q 17 119 ? 130.108 281.686 228.951 1.00 146.82 119 Bj 1 \nATOM 524  C C   . ASP Q 17 119 ? 130.655 280.792 230.056 1.00 146.82 119 Bj 1 \nATOM 525  O O   . ASP Q 17 119 ? 129.943 280.472 231.016 1.00 146.82 119 Bj 1 \nATOM 526  C CB  . ASP Q 17 119 ? 129.759 280.857 227.715 1.00 146.82 119 Bj 1 \nATOM 527  C CG  . ASP Q 17 119 ? 129.136 281.688 226.613 1.00 146.82 119 Bj 1 \nATOM 528  O OD1 . ASP Q 17 119 ? 128.456 282.687 226.932 1.00 146.82 119 Bj 1 \nATOM 529  O OD2 . ASP Q 17 119 ? 129.325 281.343 225.428 1.00 146.82 119 Bj 1 \nATOM 530  N N   . LEU Q 17 120 ? 131.922 280.388 229.941 1.00 143.97 120 Bj 1 \nATOM 531  C CA  . LEU Q 17 120 ? 132.531 279.559 230.976 1.00 143.97 120 Bj 1 \nATOM 532  C C   . LEU Q 17 120 ? 132.639 280.316 232.294 1.00 143.97 120 Bj 1 \nATOM 533  O O   . LEU Q 17 120 ? 132.434 279.736 233.367 1.00 143.97 120 Bj 1 \nATOM 534  C CB  . LEU Q 17 120 ? 133.907 279.077 230.517 1.00 143.97 120 Bj 1 \nATOM 535  C CG  . 
LEU Q 17 120 ? 133.963 278.376 229.157 1.00 143.97 120 Bj 1 \nATOM 536  C CD1 . LEU Q 17 120 ? 135.379 277.917 228.843 1.00 143.97 120 Bj 1 \nATOM 537  C CD2 . LEU Q 17 120 ? 132.992 277.205 229.107 1.00 143.97 120 Bj 1 \nATOM 538  N N   . GLU Q 17 121 ? 132.949 281.613 232.235 1.00 138.39 121 Bj 1 \nATOM 539  C CA  . GLU Q 17 121 ? 133.032 282.405 233.459 1.00 138.39 121 Bj 1 \nATOM 540  C C   . GLU Q 17 121 ? 131.674 282.510 234.141 1.00 138.39 121 Bj 1 \nATOM 541  O O   . GLU Q 17 121 ? 131.573 282.370 235.366 1.00 138.39 121 Bj 1 \nATOM 542  C CB  . GLU Q 17 121 ? 133.586 283.796 233.152 1.00 138.39 121 Bj 1 \nATOM 543  C CG  . GLU Q 17 121 ? 133.560 284.751 234.337 1.00 138.39 121 Bj 1 \nATOM 544  C CD  . GLU Q 17 121 ? 134.430 284.285 235.491 1.00 138.39 121 Bj 1 \nATOM 545  O OE1 . GLU Q 17 121 ? 135.428 283.575 235.242 1.00 138.39 121 Bj 1 \nATOM 546  O OE2 . GLU Q 17 121 ? 134.114 284.628 236.650 1.00 138.39 121 Bj 1 \nATOM 547  N N   . ASP Q 17 122 ? 130.617 282.755 233.364 1.00 136.27 122 Bj 1 \nATOM 548  C CA  . ASP Q 17 122 ? 129.278 282.822 233.938 1.00 136.27 122 Bj 1 \nATOM 549  C C   . ASP Q 17 122 ? 128.853 281.471 234.501 1.00 136.27 122 Bj 1 \nATOM 550  O O   . ASP Q 17 122 ? 128.190 281.408 235.543 1.00 136.27 122 Bj 1 \nATOM 551  C CB  . ASP Q 17 122 ? 128.281 283.308 232.888 1.00 136.27 122 Bj 1 \nATOM 552  C CG  . ASP Q 17 122 ? 128.626 284.682 232.352 1.00 136.27 122 Bj 1 \nATOM 553  O OD1 . ASP Q 17 122 ? 129.645 285.254 232.793 1.00 136.27 122 Bj 1 \nATOM 554  O OD2 . ASP Q 17 122 ? 127.881 285.189 231.488 1.00 136.27 122 Bj 1 \nATOM 555  N N   . MET Q 17 123 ? 129.232 280.381 233.829 1.00 138.10 123 Bj 1 \nATOM 556  C CA  . MET Q 17 123 ? 128.929 279.051 234.345 1.00 138.10 123 Bj 1 \nATOM 557  C C   . MET Q 17 123 ? 129.632 278.806 235.675 1.00 138.10 123 Bj 1 \nATOM 558  O O   . MET Q 17 123 ? 129.032 278.278 236.618 1.00 138.10 123 Bj 1 \nATOM 559  C CB  . MET Q 17 123 ? 129.329 277.991 233.319 1.00 138.10 123 Bj 1 \nATOM 560  C CG  . 
MET Q 17 123 ? 128.950 276.572 233.702 1.00 138.10 123 Bj 1 \nATOM 561  S SD  . MET Q 17 123 ? 129.525 275.362 232.494 1.00 138.10 123 Bj 1 \nATOM 562  C CE  . MET Q 17 123 ? 128.763 275.986 230.998 1.00 138.10 123 Bj 1 \nATOM 563  N N   . TRP Q 17 124 ? 130.906 279.192 235.770 1.00 136.46 124 Bj 1 \nATOM 564  C CA  . TRP Q 17 124 ? 131.634 279.040 237.027 1.00 136.46 124 Bj 1 \nATOM 565  C C   . TRP Q 17 124 ? 131.008 279.885 238.129 1.00 136.46 124 Bj 1 \nATOM 566  O O   . TRP Q 17 124 ? 130.875 279.430 239.272 1.00 136.46 124 Bj 1 \nATOM 567  C CB  . TRP Q 17 124 ? 133.102 279.416 236.828 1.00 136.46 124 Bj 1 \nATOM 568  C CG  . TRP Q 17 124 ? 133.795 278.588 235.791 1.00 136.46 124 Bj 1 \nATOM 569  C CD1 . TRP Q 17 124 ? 133.472 277.320 235.405 1.00 136.46 124 Bj 1 \nATOM 570  C CD2 . TRP Q 17 124 ? 134.920 278.975 234.994 1.00 136.46 124 Bj 1 \nATOM 571  N NE1 . TRP Q 17 124 ? 134.331 276.891 234.423 1.00 136.46 124 Bj 1 \nATOM 572  C CE2 . TRP Q 17 124 ? 135.229 277.889 234.152 1.00 136.46 124 Bj 1 \nATOM 573  C CE3 . TRP Q 17 124 ? 135.698 280.134 234.913 1.00 136.46 124 Bj 1 \nATOM 574  C CZ2 . TRP Q 17 124 ? 136.283 277.927 233.242 1.00 136.46 124 Bj 1 \nATOM 575  C CZ3 . TRP Q 17 124 ? 136.743 280.169 234.009 1.00 136.46 124 Bj 1 \nATOM 576  C CH2 . TRP Q 17 124 ? 137.026 279.073 233.186 1.00 136.46 124 Bj 1 \nATOM 577  N N   . GLU Q 17 125 ? 130.604 281.116 237.802 1.00 133.02 125 Bj 1 \nATOM 578  C CA  . GLU Q 17 125 ? 129.992 281.984 238.803 1.00 133.02 125 Bj 1 \nATOM 579  C C   . GLU Q 17 125 ? 128.671 281.413 239.299 1.00 133.02 125 Bj 1 \nATOM 580  O O   . GLU Q 17 125 ? 128.403 281.405 240.507 1.00 133.02 125 Bj 1 \nATOM 581  C CB  . GLU Q 17 125 ? 129.785 283.386 238.231 1.00 133.02 125 Bj 1 \nATOM 582  C CG  . GLU Q 17 125 ? 131.071 284.154 237.985 1.00 133.02 125 Bj 1 \nATOM 583  C CD  . GLU Q 17 125 ? 130.819 285.533 237.408 1.00 133.02 125 Bj 1 \nATOM 584  O OE1 . GLU Q 17 125 ? 129.640 285.874 237.179 1.00 133.02 125 Bj 1 \nATOM 585  O OE2 . 
GLU Q 17 125 ? 131.799 286.274 237.184 1.00 133.02 125 Bj 1 \nATOM 586  N N   . GLN Q 17 126 ? 127.828 280.928 238.383 1.00 132.06 126 Bj 1 \nATOM 587  C CA  . GLN Q 17 126 ? 126.550 280.374 238.808 1.00 132.06 126 Bj 1 \nATOM 588  C C   . GLN Q 17 126 ? 126.735 279.073 239.580 1.00 132.06 126 Bj 1 \nATOM 589  O O   . GLN Q 17 126 ? 125.981 278.808 240.520 1.00 132.06 126 Bj 1 \nATOM 590  C CB  . GLN Q 17 126 ? 125.624 280.176 237.605 1.00 132.06 126 Bj 1 \nATOM 591  C CG  . GLN Q 17 126 ? 126.097 279.164 236.583 1.00 132.06 126 Bj 1 \nATOM 592  C CD  . GLN Q 17 126 ? 125.303 279.223 235.293 1.00 132.06 126 Bj 1 \nATOM 593  O OE1 . GLN Q 17 126 ? 124.412 280.057 235.137 1.00 132.06 126 Bj 1 \nATOM 594  N NE2 . GLN Q 17 126 ? 125.624 278.335 234.359 1.00 132.06 126 Bj 1 \nATOM 595  N N   . LYS Q 17 127 ? 127.748 278.271 239.234 1.00 128.96 127 Bj 1 \nATOM 596  C CA  . LYS Q 17 127 ? 128.037 277.081 240.029 1.00 128.96 127 Bj 1 \nATOM 597  C C   . LYS Q 17 127 ? 128.495 277.455 241.433 1.00 128.96 127 Bj 1 \nATOM 598  O O   . LYS Q 17 127 ? 128.100 276.813 242.414 1.00 128.96 127 Bj 1 \nATOM 599  C CB  . LYS Q 17 127 ? 129.093 276.223 239.332 1.00 128.96 127 Bj 1 \nATOM 600  C CG  . LYS Q 17 127 ? 128.593 275.496 238.093 1.00 128.96 127 Bj 1 \nATOM 601  C CD  . LYS Q 17 127 ? 129.699 274.667 237.457 1.00 128.96 127 Bj 1 \nATOM 602  C CE  . LYS Q 17 127 ? 129.191 273.901 236.246 1.00 128.96 127 Bj 1 \nATOM 603  N NZ  . LYS Q 17 127 ? 130.253 273.047 235.645 1.00 128.96 127 Bj 1 \nATOM 604  N N   . PHE Q 17 128 ? 129.328 278.493 241.547 1.00 124.78 128 Bj 1 \nATOM 605  C CA  . PHE Q 17 128 ? 129.778 278.943 242.861 1.00 124.78 128 Bj 1 \nATOM 606  C C   . PHE Q 17 128 ? 128.613 279.459 243.694 1.00 124.78 128 Bj 1 \nATOM 607  O O   . PHE Q 17 128 ? 128.543 279.208 244.903 1.00 124.78 128 Bj 1 \nATOM 608  C CB  . PHE Q 17 128 ? 130.845 280.026 242.703 1.00 124.78 128 Bj 1 \nATOM 609  C CG  . PHE Q 17 128 ? 131.325 280.607 244.004 1.00 124.78 128 Bj 1 \nATOM 610  C CD1 . 
PHE Q 17 128 ? 132.290 279.956 244.754 1.00 124.78 128 Bj 1 \nATOM 611  C CD2 . PHE Q 17 128 ? 130.821 281.810 244.470 1.00 124.78 128 Bj 1 \nATOM 612  C CE1 . PHE Q 17 128 ? 132.737 280.489 245.948 1.00 124.78 128 Bj 1 \nATOM 613  C CE2 . PHE Q 17 128 ? 131.264 282.348 245.663 1.00 124.78 128 Bj 1 \nATOM 614  C CZ  . PHE Q 17 128 ? 132.223 281.687 246.403 1.00 124.78 128 Bj 1 \nATOM 615  N N   . LEU Q 17 129 ? 127.688 280.186 243.064 1.00 122.50 129 Bj 1 \nATOM 616  C CA  . LEU Q 17 129 ? 126.535 280.696 243.799 1.00 122.50 129 Bj 1 \nATOM 617  C C   . LEU Q 17 129 ? 125.558 279.583 244.162 1.00 122.50 129 Bj 1 \nATOM 618  O O   . LEU Q 17 129 ? 124.879 279.670 245.192 1.00 122.50 129 Bj 1 \nATOM 619  C CB  . LEU Q 17 129 ? 125.829 281.784 242.989 1.00 122.50 129 Bj 1 \nATOM 620  C CG  . LEU Q 17 129 ? 126.260 283.226 243.273 1.00 122.50 129 Bj 1 \nATOM 621  C CD1 . LEU Q 17 129 ? 126.103 283.546 244.752 1.00 122.50 129 Bj 1 \nATOM 622  C CD2 . LEU Q 17 129 ? 127.688 283.484 242.817 1.00 122.50 129 Bj 1 \nATOM 623  N N   . HIS Q 17 130 ? 125.472 278.535 243.339 1.00 124.27 130 Bj 1 \nATOM 624  C CA  . HIS Q 17 130 ? 124.581 277.424 243.653 1.00 124.27 130 Bj 1 \nATOM 625  C C   . HIS Q 17 130 ? 125.137 276.570 244.785 1.00 124.27 130 Bj 1 \nATOM 626  O O   . HIS Q 17 130 ? 124.395 276.174 245.691 1.00 124.27 130 Bj 1 \nATOM 627  C CB  . HIS Q 17 130 ? 124.343 276.571 242.407 1.00 124.27 130 Bj 1 \nATOM 628  C CG  . HIS Q 17 130 ? 123.598 277.281 241.320 1.00 124.27 130 Bj 1 \nATOM 629  N ND1 . HIS Q 17 130 ? 122.957 278.485 241.521 1.00 124.27 130 Bj 1 \nATOM 630  C CD2 . HIS Q 17 130 ? 123.400 276.962 240.019 1.00 124.27 130 Bj 1 \nATOM 631  C CE1 . HIS Q 17 130 ? 122.391 278.873 240.392 1.00 124.27 130 Bj 1 \nATOM 632  N NE2 . HIS Q 17 130 ? 122.645 277.967 239.465 1.00 124.27 130 Bj 1 \nATOM 633  N N   . PHE Q 17 131 ? 126.434 276.275 244.753 1.00 123.12 131 Bj 1 \nATOM 634  C CA  . PHE Q 17 131 ? 127.041 275.459 245.795 1.00 123.12 131 Bj 1 \nATOM 635  C C   . 
PHE Q 17 131 ? 127.241 276.280 247.061 1.00 123.12 131 Bj 1 \nATOM 636  O O   . PHE Q 17 131 ? 127.634 277.449 247.007 1.00 123.12 131 Bj 1 \nATOM 637  C CB  . PHE Q 17 131 ? 128.378 274.890 245.322 1.00 123.12 131 Bj 1 \nATOM 638  C CG  . PHE Q 17 131 ? 128.932 273.819 246.221 1.00 123.12 131 Bj 1 \nATOM 639  C CD1 . PHE Q 17 131 ? 128.636 272.485 245.993 1.00 123.12 131 Bj 1 \nATOM 640  C CD2 . PHE Q 17 131 ? 129.747 274.145 247.292 1.00 123.12 131 Bj 1 \nATOM 641  C CE1 . PHE Q 17 131 ? 129.144 271.497 246.816 1.00 123.12 131 Bj 1 \nATOM 642  C CE2 . PHE Q 17 131 ? 130.257 273.162 248.118 1.00 123.12 131 Bj 1 \nATOM 643  C CZ  . PHE Q 17 131 ? 129.955 271.837 247.880 1.00 123.12 131 Bj 1 \nATOM 644  N N   . LYS Q 17 132 ? 126.965 275.659 248.206 1.00 116.35 132 Bj 1 \nATOM 645  C CA  . LYS Q 17 132 ? 127.090 276.303 249.505 1.00 116.35 132 Bj 1 \nATOM 646  C C   . LYS Q 17 132 ? 128.171 275.612 250.323 1.00 116.35 132 Bj 1 \nATOM 647  O O   . LYS Q 17 132 ? 128.289 274.383 250.305 1.00 116.35 132 Bj 1 \nATOM 648  C CB  . LYS Q 17 132 ? 125.759 276.283 250.264 1.00 116.35 132 Bj 1 \nATOM 649  C CG  . LYS Q 17 132 ? 125.018 277.611 250.239 1.00 116.35 132 Bj 1 \nATOM 650  C CD  . LYS Q 17 132 ? 124.841 278.121 248.819 1.00 116.35 132 Bj 1 \nATOM 651  C CE  . LYS Q 17 132 ? 124.220 279.507 248.803 1.00 116.35 132 Bj 1 \nATOM 652  N NZ  . LYS Q 17 132 ? 124.099 280.040 247.419 1.00 116.35 132 Bj 1 \nATOM 653  N N   . LEU Q 17 133 ? 128.955 276.411 251.041 1.00 122.76 133 Bj 1 \nATOM 654  C CA  . LEU Q 17 133 ? 130.066 275.909 251.829 1.00 122.76 133 Bj 1 \nATOM 655  C C   . LEU Q 17 133 ? 129.629 275.679 253.274 1.00 122.76 133 Bj 1 \nATOM 656  O O   . LEU Q 17 133 ? 128.461 275.844 253.634 1.00 122.76 133 Bj 1 \nATOM 657  C CB  . LEU Q 17 133 ? 131.244 276.879 251.757 1.00 122.76 133 Bj 1 \nATOM 658  C CG  . LEU Q 17 133 ? 131.666 277.326 250.356 1.00 122.76 133 Bj 1 \nATOM 659  C CD1 . LEU Q 17 133 ? 132.813 278.319 250.434 1.00 122.76 133 Bj 1 \nATOM 660  C CD2 . 
LEU Q 17 133 ? 132.045 276.128 249.501 1.00 122.76 133 Bj 1 \nATOM 661  N N   . GLY Q 17 134 ? 130.584 275.293 254.118 1.00 129.65 134 Bj 1 \nATOM 662  C CA  . GLY Q 17 134 ? 130.282 275.055 255.514 1.00 129.65 134 Bj 1 \nATOM 663  C C   . GLY Q 17 134 ? 130.327 276.328 256.339 1.00 129.65 134 Bj 1 \nATOM 664  O O   . GLY Q 17 134 ? 131.088 277.255 256.064 1.00 129.65 134 Bj 1 \nATOM 665  N N   . ALA Q 17 135 ? 129.488 276.366 257.371 1.00 138.35 135 Bj 1 \nATOM 666  C CA  . ALA Q 17 135 ? 129.408 277.524 258.252 1.00 138.35 135 Bj 1 \nATOM 667  C C   . ALA Q 17 135 ? 130.539 277.469 259.271 1.00 138.35 135 Bj 1 \nATOM 668  O O   . ALA Q 17 135 ? 130.677 276.482 260.002 1.00 138.35 135 Bj 1 \nATOM 669  C CB  . ALA Q 17 135 ? 128.051 277.571 258.950 1.00 138.35 135 Bj 1 \nATOM 670  N N   . ARG Q 17 136 ? 131.347 278.530 259.322 1.00 130.79 136 Bj 1 \nATOM 671  C CA  . ARG Q 17 136 ? 132.483 278.568 260.234 1.00 130.79 136 Bj 1 \nATOM 672  C C   . ARG Q 17 136 ? 132.087 278.942 261.655 1.00 130.79 136 Bj 1 \nATOM 673  O O   . ARG Q 17 136 ? 132.785 278.556 262.599 1.00 130.79 136 Bj 1 \nATOM 674  C CB  . ARG Q 17 136 ? 133.536 279.556 259.727 1.00 130.79 136 Bj 1 \nATOM 675  C CG  . ARG Q 17 136 ? 133.810 279.469 258.237 1.00 130.79 136 Bj 1 \nATOM 676  C CD  . ARG Q 17 136 ? 135.032 280.286 257.861 1.00 130.79 136 Bj 1 \nATOM 677  N NE  . ARG Q 17 136 ? 134.968 281.647 258.384 1.00 130.79 136 Bj 1 \nATOM 678  C CZ  . ARG Q 17 136 ? 135.943 282.541 258.256 1.00 130.79 136 Bj 1 \nATOM 679  N NH1 . ARG Q 17 136 ? 137.061 282.218 257.620 1.00 130.79 136 Bj 1 \nATOM 680  N NH2 . ARG Q 17 136 ? 135.801 283.757 258.764 1.00 130.79 136 Bj 1 \nATOM 681  N N   . LEU Q 17 137 ? 130.992 279.683 261.830 1.00 133.57 137 Bj 1 \nATOM 682  C CA  . LEU Q 17 137 ? 130.559 280.141 263.149 1.00 133.57 137 Bj 1 \nATOM 683  C C   . LEU Q 17 137 ? 129.570 279.126 263.717 1.00 133.57 137 Bj 1 \nATOM 684  O O   . LEU Q 17 137 ? 128.360 279.345 263.762 1.00 133.57 137 Bj 1 \nATOM 685  C CB  . 
LEU Q 17 137 ? 129.956 281.539 263.059 1.00 133.57 137 Bj 1 \nATOM 686  C CG  . LEU Q 17 137 ? 130.891 282.628 262.527 1.00 133.57 137 Bj 1 \nATOM 687  C CD1 . LEU Q 17 137 ? 130.188 283.977 262.488 1.00 133.57 137 Bj 1 \nATOM 688  C CD2 . LEU Q 17 137 ? 132.159 282.703 263.364 1.00 133.57 137 Bj 1 \nATOM 689  N N   . THR Q 17 138 ? 130.111 277.993 264.160 1.00 133.35 138 Bj 1 \nATOM 690  C CA  . THR Q 17 138 ? 129.322 276.936 264.778 1.00 133.35 138 Bj 1 \nATOM 691  C C   . THR Q 17 138 ? 129.133 277.144 266.275 1.00 133.35 138 Bj 1 \nATOM 692  O O   . THR Q 17 138 ? 128.651 276.236 266.959 1.00 133.35 138 Bj 1 \nATOM 693  C CB  . THR Q 17 138 ? 129.970 275.573 264.522 1.00 133.35 138 Bj 1 \nATOM 694  O OG1 . THR Q 17 138 ? 131.309 275.575 265.032 1.00 133.35 138 Bj 1 \nATOM 695  C CG2 . THR Q 17 138 ? 129.999 275.269 263.033 1.00 133.35 138 Bj 1 \nATOM 696  N N   . GLU Q 17 139 ? 129.508 278.309 266.795 1.00 134.95 139 Bj 1 \nATOM 697  C CA  . GLU Q 17 139 ? 129.306 278.647 268.196 1.00 134.95 139 Bj 1 \nATOM 698  C C   . GLU Q 17 139 ? 128.457 279.891 268.396 1.00 134.95 139 Bj 1 \nATOM 699  O O   . GLU Q 17 139 ? 127.841 280.034 269.453 1.00 134.95 139 Bj 1 \nATOM 700  C CB  . GLU Q 17 139 ? 130.659 278.842 268.900 1.00 134.95 139 Bj 1 \nATOM 701  C CG  . GLU Q 17 139 ? 130.604 278.798 270.422 1.00 134.95 139 Bj 1 \nATOM 702  C CD  . GLU Q 17 139 ? 130.428 280.169 271.046 1.00 134.95 139 Bj 1 \nATOM 703  O OE1 . GLU Q 17 139 ? 130.488 281.174 270.307 1.00 134.95 139 Bj 1 \nATOM 704  O OE2 . GLU Q 17 139 ? 130.231 280.241 272.277 1.00 134.95 139 Bj 1 \nATOM 705  N N   . ALA Q 17 140 ? 128.404 280.792 267.412 1.00 139.06 140 Bj 1 \nATOM 706  C CA  . ALA Q 17 140 ? 127.569 281.980 267.543 1.00 139.06 140 Bj 1 \nATOM 707  C C   . ALA Q 17 140 ? 126.090 281.623 267.616 1.00 139.06 140 Bj 1 \nATOM 708  O O   . ALA Q 17 140 ? 125.316 282.326 268.275 1.00 139.06 140 Bj 1 \nATOM 709  C CB  . ALA Q 17 140 ? 127.829 282.937 266.380 1.00 139.06 140 Bj 1 \nATOM 710  N N   . 
ASP Q 17 141 ? 125.681 280.539 266.954 1.00 140.48 141 Bj 1 \nATOM 711  C CA  . ASP Q 17 141 ? 124.289 280.111 267.023 1.00 140.48 141 Bj 1 \nATOM 712  C C   . ASP Q 17 141 ? 124.001 279.307 268.283 1.00 140.48 141 Bj 1 \nATOM 713  O O   . ASP Q 17 141 ? 122.859 279.293 268.754 1.00 140.48 141 Bj 1 \nATOM 714  C CB  . ASP Q 17 141 ? 123.924 279.291 265.784 1.00 140.48 141 Bj 1 \nATOM 715  C CG  . ASP Q 17 141 ? 124.675 277.976 265.714 1.00 140.48 141 Bj 1 \nATOM 716  O OD1 . ASP Q 17 141 ? 125.822 277.916 266.203 1.00 140.48 141 Bj 1 \nATOM 717  O OD2 . ASP Q 17 141 ? 124.116 277.002 265.168 1.00 140.48 141 Bj 1 \nATOM 718  N N   . LYS Q 17 142 ? 125.010 278.635 268.840 1.00 134.61 142 Bj 1 \nATOM 719  C CA  . LYS Q 17 142 ? 124.797 277.853 270.053 1.00 134.61 142 Bj 1 \nATOM 720  C C   . LYS Q 17 142 ? 124.838 278.740 271.293 1.00 134.61 142 Bj 1 \nATOM 721  O O   . LYS Q 17 142 ? 123.839 278.877 272.005 1.00 134.61 142 Bj 1 \nATOM 722  C CB  . LYS Q 17 142 ? 125.847 276.744 270.155 1.00 134.61 142 Bj 1 \nATOM 723  C CG  . LYS Q 17 142 ? 126.107 276.000 268.857 1.00 134.61 142 Bj 1 \nATOM 724  C CD  . LYS Q 17 142 ? 124.858 275.311 268.339 1.00 134.61 142 Bj 1 \nATOM 725  C CE  . LYS Q 17 142 ? 125.153 274.532 267.067 1.00 134.61 142 Bj 1 \nATOM 726  N NZ  . LYS Q 17 142 ? 123.939 273.858 266.530 1.00 134.61 142 Bj 1 \nATOM 727  N N   . LYS Q 17 143 ? 125.993 279.349 271.561 1.00 130.78 143 Bj 1 \nATOM 728  C CA  . LYS Q 17 143 ? 126.225 280.262 272.679 1.00 130.78 143 Bj 1 \nATOM 729  C C   . LYS Q 17 143 ? 125.934 279.638 274.039 1.00 130.78 143 Bj 1 \nATOM 730  O O   . LYS Q 17 143 ? 125.924 280.350 275.050 1.00 130.78 143 Bj 1 \nATOM 731  C CB  . LYS Q 17 143 ? 125.421 281.559 272.519 1.00 130.78 143 Bj 1 \nATOM 732  C CG  . LYS Q 17 143 ? 125.982 282.503 271.471 1.00 130.78 143 Bj 1 \nATOM 733  C CD  . LYS Q 17 143 ? 127.408 282.899 271.812 1.00 130.78 143 Bj 1 \nATOM 734  C CE  . LYS Q 17 143 ? 127.980 283.857 270.782 1.00 130.78 143 Bj 1 \nATOM 735  N NZ  . 
LYS Q 17 143 ? 129.382 284.238 271.109 1.00 130.78 143 Bj 1 \nATOM 736  N N   . ASP Q 17 144 ? 125.698 278.330 274.099 1.00 131.40 144 Bj 1 \nATOM 737  C CA  . ASP Q 17 144 ? 125.447 277.643 275.360 1.00 131.40 144 Bj 1 \nATOM 738  C C   . ASP Q 17 144 ? 126.492 276.583 275.666 1.00 131.40 144 Bj 1 \nATOM 739  O O   . ASP Q 17 144 ? 127.062 276.578 276.763 1.00 131.40 144 Bj 1 \nATOM 740  C CB  . ASP Q 17 144 ? 124.048 277.003 275.351 1.00 131.40 144 Bj 1 \nATOM 741  C CG  . ASP Q 17 144 ? 122.935 278.027 275.449 1.00 131.40 144 Bj 1 \nATOM 742  O OD1 . ASP Q 17 144 ? 122.551 278.595 274.407 1.00 131.40 144 Bj 1 \nATOM 743  O OD2 . ASP Q 17 144 ? 122.442 278.263 276.571 1.00 131.40 144 Bj 1 \nATOM 744  N N   . ASP Q 17 145 ? 126.762 275.685 274.723 1.00 125.63 145 Bj 1 \nATOM 745  C CA  . ASP Q 17 145 ? 127.651 274.554 274.962 1.00 125.63 145 Bj 1 \nATOM 746  C C   . ASP Q 17 145 ? 129.095 275.042 274.977 1.00 125.63 145 Bj 1 \nATOM 747  O O   . ASP Q 17 145 ? 129.719 275.197 273.922 1.00 125.63 145 Bj 1 \nATOM 748  C CB  . ASP Q 17 145 ? 127.441 273.482 273.897 1.00 125.63 145 Bj 1 \nATOM 749  C CG  . ASP Q 17 145 ? 128.031 272.142 274.292 1.00 125.63 145 Bj 1 \nATOM 750  O OD1 . ASP Q 17 145 ? 128.682 272.064 275.355 1.00 125.63 145 Bj 1 \nATOM 751  O OD2 . ASP Q 17 145 ? 127.837 271.162 273.542 1.00 125.63 145 Bj 1 \nATOM 752  N N   . ARG Q 17 146 ? 129.624 275.289 276.173 1.00 123.19 146 Bj 1 \nATOM 753  C CA  . ARG Q 17 146 ? 131.031 275.617 276.354 1.00 123.19 146 Bj 1 \nATOM 754  C C   . ARG Q 17 146 ? 131.912 274.378 276.423 1.00 123.19 146 Bj 1 \nATOM 755  O O   . ARG Q 17 146 ? 133.141 274.505 276.438 1.00 123.19 146 Bj 1 \nATOM 756  C CB  . ARG Q 17 146 ? 131.221 276.448 277.628 1.00 123.19 146 Bj 1 \nATOM 757  C CG  . ARG Q 17 146 ? 130.339 277.684 277.717 1.00 123.19 146 Bj 1 \nATOM 758  C CD  . ARG Q 17 146 ? 130.774 278.756 276.734 1.00 123.19 146 Bj 1 \nATOM 759  N NE  . ARG Q 17 146 ? 130.058 280.011 276.945 1.00 123.19 146 Bj 1 \nATOM 760  C CZ  . 
ARG Q 17 146 ? 130.291 281.128 276.265 1.00 123.19 146 Bj 1 \nATOM 761  N NH1 . ARG Q 17 146 ? 131.225 281.151 275.325 1.00 123.19 146 Bj 1 \nATOM 762  N NH2 . ARG Q 17 146 ? 129.590 282.224 276.524 1.00 123.19 146 Bj 1 \nATOM 763  N N   . THR Q 17 147 ? 131.314 273.189 276.464 1.00 120.18 147 Bj 1 \nATOM 764  C CA  . THR Q 17 147 ? 132.038 271.936 276.619 1.00 120.18 147 Bj 1 \nATOM 765  C C   . THR Q 17 147 ? 132.125 271.136 275.328 1.00 120.18 147 Bj 1 \nATOM 766  O O   . THR Q 17 147 ? 132.651 270.018 275.343 1.00 120.18 147 Bj 1 \nATOM 767  C CB  . THR Q 17 147 ? 131.373 271.081 277.702 1.00 120.18 147 Bj 1 \nATOM 768  O OG1 . THR Q 17 147 ? 130.082 270.655 277.249 1.00 120.18 147 Bj 1 \nATOM 769  C CG2 . THR Q 17 147 ? 131.209 271.884 278.982 1.00 120.18 147 Bj 1 \nATOM 770  N N   . SER Q 17 148 ? 131.625 271.672 274.219 1.00 118.54 148 Bj 1 \nATOM 771  C CA  . SER Q 17 148 ? 131.618 270.943 272.961 1.00 118.54 148 Bj 1 \nATOM 772  C C   . SER Q 17 148 ? 133.006 270.928 272.336 1.00 118.54 148 Bj 1 \nATOM 773  O O   . SER Q 17 148 ? 133.743 271.916 272.398 1.00 118.54 148 Bj 1 \nATOM 774  C CB  . SER Q 17 148 ? 130.617 271.567 271.988 1.00 118.54 148 Bj 1 \nATOM 775  O OG  . SER Q 17 148 ? 130.928 272.926 271.735 1.00 118.54 148 Bj 1 \nATOM 776  N N   . LEU Q 17 149 ? 133.361 269.790 271.735 1.00 117.15 149 Bj 1 \nATOM 777  C CA  . LEU Q 17 149 ? 134.619 269.711 271.001 1.00 117.15 149 Bj 1 \nATOM 778  C C   . LEU Q 17 149 ? 134.608 270.627 269.785 1.00 117.15 149 Bj 1 \nATOM 779  O O   . LEU Q 17 149 ? 135.662 271.129 269.377 1.00 117.15 149 Bj 1 \nATOM 780  C CB  . LEU Q 17 149 ? 134.891 268.267 270.579 1.00 117.15 149 Bj 1 \nATOM 781  C CG  . LEU Q 17 149 ? 136.256 267.992 269.944 1.00 117.15 149 Bj 1 \nATOM 782  C CD1 . LEU Q 17 149 ? 137.367 268.200 270.960 1.00 117.15 149 Bj 1 \nATOM 783  C CD2 . LEU Q 17 149 ? 136.314 266.588 269.358 1.00 117.15 149 Bj 1 \nATOM 784  N N   . HIS Q 17 150 ? 133.431 270.864 269.203 1.00 119.46 150 Bj 1 \nATOM 785  C CA  . 
HIS Q 17 150 ? 133.275 271.750 268.056 1.00 119.46 150 Bj 1 \nATOM 786  C C   . HIS Q 17 150 ? 132.939 273.179 268.467 1.00 119.46 150 Bj 1 \nATOM 787  O O   . HIS Q 17 150 ? 132.307 273.912 267.695 1.00 119.46 150 Bj 1 \nATOM 788  C CB  . HIS Q 17 150 ? 132.203 271.196 267.115 1.00 119.46 150 Bj 1 \nATOM 789  C CG  . HIS Q 17 150 ? 132.333 271.667 265.700 1.00 119.46 150 Bj 1 \nATOM 790  N ND1 . HIS Q 17 150 ? 133.406 271.334 264.901 1.00 119.46 150 Bj 1 \nATOM 791  C CD2 . HIS Q 17 150 ? 131.523 272.440 264.939 1.00 119.46 150 Bj 1 \nATOM 792  C CE1 . HIS Q 17 150 ? 133.252 271.884 263.709 1.00 119.46 150 Bj 1 \nATOM 793  N NE2 . HIS Q 17 150 ? 132.118 272.561 263.706 1.00 119.46 150 Bj 1 \nATOM 794  N N   . ARG Q 17 151 ? 133.334 273.589 269.675 1.00 116.45 151 Bj 1 \nATOM 795  C CA  . ARG Q 17 151 ? 133.014 274.930 270.155 1.00 116.45 151 Bj 1 \nATOM 796  C C   . ARG Q 17 151 ? 133.683 276.000 269.299 1.00 116.45 151 Bj 1 \nATOM 797  O O   . ARG Q 17 151 ? 133.011 276.780 268.616 1.00 116.45 151 Bj 1 \nATOM 798  C CB  . ARG Q 17 151 ? 133.432 275.069 271.620 1.00 116.45 151 Bj 1 \nATOM 799  C CG  . ARG Q 17 151 ? 133.285 276.474 272.176 1.00 116.45 151 Bj 1 \nATOM 800  C CD  . ARG Q 17 151 ? 133.694 276.533 273.637 1.00 116.45 151 Bj 1 \nATOM 801  N NE  . ARG Q 17 151 ? 133.681 277.899 274.151 1.00 116.45 151 Bj 1 \nATOM 802  C CZ  . ARG Q 17 151 ? 133.957 278.225 275.408 1.00 116.45 151 Bj 1 \nATOM 803  N NH1 . ARG Q 17 151 ? 134.267 277.282 276.287 1.00 116.45 151 Bj 1 \nATOM 804  N NH2 . ARG Q 17 151 ? 133.923 279.495 275.788 1.00 116.45 151 Bj 1 \nATOM 805  N N   . LYS Q 17 152 ? 135.011 276.043 269.313 1.00 117.42 152 Bj 1 \nATOM 806  C CA  . LYS Q 17 152 ? 135.770 277.054 268.591 1.00 117.42 152 Bj 1 \nATOM 807  C C   . LYS Q 17 152 ? 136.622 276.389 267.521 1.00 117.42 152 Bj 1 \nATOM 808  O O   . LYS Q 17 152 ? 137.171 275.304 267.735 1.00 117.42 152 Bj 1 \nATOM 809  C CB  . LYS Q 17 152 ? 136.655 277.866 269.542 1.00 117.42 152 Bj 1 \nATOM 810  C CG  . 
LYS Q 17 152 ? 135.879 278.626 270.605 1.00 117.42 152 Bj 1 \nATOM 811  C CD  . LYS Q 17 152 ? 136.809 279.386 271.538 1.00 117.42 152 Bj 1 \nATOM 812  C CE  . LYS Q 17 152 ? 136.029 280.083 272.644 1.00 117.42 152 Bj 1 \nATOM 813  N NZ  . LYS Q 17 152 ? 136.923 280.801 273.593 1.00 117.42 152 Bj 1 \nATOM 814  N N   . LEU Q 17 153 ? 136.727 277.048 266.368 1.00 116.24 153 Bj 1 \nATOM 815  C CA  . LEU Q 17 153 ? 137.460 276.511 265.234 1.00 116.24 153 Bj 1 \nATOM 816  C C   . LEU Q 17 153 ? 138.638 277.371 264.802 1.00 116.24 153 Bj 1 \nATOM 817  O O   . LEU Q 17 153 ? 139.490 276.883 264.051 1.00 116.24 153 Bj 1 \nATOM 818  C CB  . LEU Q 17 153 ? 136.518 276.317 264.036 1.00 116.24 153 Bj 1 \nATOM 819  C CG  . LEU Q 17 153 ? 135.239 275.539 264.342 1.00 116.24 153 Bj 1 \nATOM 820  C CD1 . LEU Q 17 153 ? 134.370 275.417 263.102 1.00 116.24 153 Bj 1 \nATOM 821  C CD2 . LEU Q 17 153 ? 135.573 274.168 264.908 1.00 116.24 153 Bj 1 \nATOM 822  N N   . ASP Q 17 154 ? 138.712 278.626 265.242 1.00 114.21 154 Bj 1 \nATOM 823  C CA  . ASP Q 17 154 ? 139.819 279.499 264.880 1.00 114.21 154 Bj 1 \nATOM 824  C C   . ASP Q 17 154 ? 140.864 279.628 265.977 1.00 114.21 154 Bj 1 \nATOM 825  O O   . ASP Q 17 154 ? 141.912 280.237 265.742 1.00 114.21 154 Bj 1 \nATOM 826  C CB  . ASP Q 17 154 ? 139.301 280.893 264.510 1.00 114.21 154 Bj 1 \nATOM 827  C CG  . ASP Q 17 154 ? 138.591 281.574 265.661 1.00 114.21 154 Bj 1 \nATOM 828  O OD1 . ASP Q 17 154 ? 138.041 280.861 266.526 1.00 114.21 154 Bj 1 \nATOM 829  O OD2 . ASP Q 17 154 ? 138.580 282.823 265.698 1.00 114.21 154 Bj 1 \nATOM 830  N N   . ARG Q 17 155 ? 140.614 279.065 267.154 1.00 117.24 155 Bj 1 \nATOM 831  C CA  . ARG Q 17 155 ? 141.560 279.082 268.258 1.00 117.24 155 Bj 1 \nATOM 832  C C   . ARG Q 17 155 ? 141.854 277.656 268.702 1.00 117.24 155 Bj 1 \nATOM 833  O O   . ARG Q 17 155 ? 141.141 276.711 268.356 1.00 117.24 155 Bj 1 \nATOM 834  C CB  . ARG Q 17 155 ? 141.020 279.897 269.441 1.00 117.24 155 Bj 1 \nATOM 835  C CG  . 
ARG Q 17 155 ? 140.581 281.306 269.091 1.00 117.24 155 Bj 1 \nATOM 836  C CD  . ARG Q 17 155 ? 140.132 282.057 270.334 1.00 117.24 155 Bj 1 \nATOM 837  N NE  . ARG Q 17 155 ? 139.613 283.382 270.013 1.00 117.24 155 Bj 1 \nATOM 838  C CZ  . ARG Q 17 155 ? 139.268 284.288 270.921 1.00 117.24 155 Bj 1 \nATOM 839  N NH1 . ARG Q 17 155 ? 139.392 284.015 272.212 1.00 117.24 155 Bj 1 \nATOM 840  N NH2 . ARG Q 17 155 ? 138.803 285.469 270.538 1.00 117.24 155 Bj 1 \nATOM 841  N N   . ASN Q 17 156 ? 142.922 277.508 269.478 1.00 113.83 156 Bj 1 \nATOM 842  C CA  . ASN Q 17 156 ? 143.233 276.233 270.102 1.00 113.83 156 Bj 1 \nATOM 843  C C   . ASN Q 17 156 ? 142.516 276.132 271.441 1.00 113.83 156 Bj 1 \nATOM 844  O O   . ASN Q 17 156 ? 142.286 277.135 272.123 1.00 113.83 156 Bj 1 \nATOM 845  C CB  . ASN Q 17 156 ? 144.741 276.067 270.300 1.00 113.83 156 Bj 1 \nATOM 846  C CG  . ASN Q 17 156 ? 145.277 276.908 271.442 1.00 113.83 156 Bj 1 \nATOM 847  O OD1 . ASN Q 17 156 ? 144.906 278.071 271.601 1.00 113.83 156 Bj 1 \nATOM 848  N ND2 . ASN Q 17 156 ? 146.154 276.320 272.247 1.00 113.83 156 Bj 1 \nATOM 849  N N   . LEU Q 17 157 ? 142.156 274.908 271.811 1.00 117.97 157 Bj 1 \nATOM 850  C CA  . LEU Q 17 157 ? 141.427 274.665 273.045 1.00 117.97 157 Bj 1 \nATOM 851  C C   . LEU Q 17 157 ? 142.163 273.643 273.900 1.00 117.97 157 Bj 1 \nATOM 852  O O   . LEU Q 17 157 ? 142.908 272.801 273.397 1.00 117.97 157 Bj 1 \nATOM 853  C CB  . LEU Q 17 157 ? 139.997 274.188 272.760 1.00 117.97 157 Bj 1 \nATOM 854  C CG  . LEU Q 17 157 ? 139.112 275.189 272.013 1.00 117.97 157 Bj 1 \nATOM 855  C CD1 . LEU Q 17 157 ? 137.703 274.642 271.833 1.00 117.97 157 Bj 1 \nATOM 856  C CD2 . LEU Q 17 157 ? 139.084 276.528 272.733 1.00 117.97 157 Bj 1 \nATOM 857  N N   . ILE Q 17 158 ? 141.952 273.734 275.213 1.00 113.83 158 Bj 1 \nATOM 858  C CA  . ILE Q 17 158 ? 142.549 272.815 276.169 1.00 113.83 158 Bj 1 \nATOM 859  C C   . ILE Q 17 158 ? 141.443 272.284 277.071 1.00 113.83 158 Bj 1 \nATOM 860  O O   . 
ILE Q 17 158 ? 140.365 272.871 277.184 1.00 113.83 158 Bj 1 \nATOM 861  C CB  . ILE Q 17 158 ? 143.669 273.481 276.999 1.00 113.83 158 Bj 1 \nATOM 862  C CG1 . ILE Q 17 158 ? 144.690 272.440 277.466 1.00 113.83 158 Bj 1 \nATOM 863  C CG2 . ILE Q 17 158 ? 143.086 274.213 278.188 1.00 113.83 158 Bj 1 \nATOM 864  C CD1 . ILE Q 17 158 ? 145.859 273.029 278.223 1.00 113.83 158 Bj 1 \nATOM 865  N N   . LEU Q 17 159 ? 141.723 271.155 277.716 1.00 117.96 159 Bj 1 \nATOM 866  C CA  . LEU Q 17 159 ? 140.729 270.429 278.495 1.00 117.96 159 Bj 1 \nATOM 867  C C   . LEU Q 17 159 ? 140.864 270.768 279.973 1.00 117.96 159 Bj 1 \nATOM 868  O O   . LEU Q 17 159 ? 141.962 270.695 280.535 1.00 117.96 159 Bj 1 \nATOM 869  C CB  . LEU Q 17 159 ? 140.876 268.922 278.285 1.00 117.96 159 Bj 1 \nATOM 870  C CG  . LEU Q 17 159 ? 139.756 268.048 278.849 1.00 117.96 159 Bj 1 \nATOM 871  C CD1 . LEU Q 17 159 ? 138.420 268.435 278.235 1.00 117.96 159 Bj 1 \nATOM 872  C CD2 . LEU Q 17 159 ? 140.053 266.577 278.608 1.00 117.96 159 Bj 1 \nATOM 873  N N   . LEU Q 17 160 ? 139.745 271.135 280.597 1.00 129.48 160 Bj 1 \nATOM 874  C CA  . LEU Q 17 160 ? 139.681 271.396 282.030 1.00 129.48 160 Bj 1 \nATOM 875  C C   . LEU Q 17 160 ? 138.594 270.526 282.642 1.00 129.48 160 Bj 1 \nATOM 876  O O   . LEU Q 17 160 ? 137.483 270.456 282.110 1.00 129.48 160 Bj 1 \nATOM 877  C CB  . LEU Q 17 160 ? 139.396 272.874 282.319 1.00 129.48 160 Bj 1 \nATOM 878  C CG  . LEU Q 17 160 ? 140.586 273.780 282.641 1.00 129.48 160 Bj 1 \nATOM 879  C CD1 . LEU Q 17 160 ? 141.302 273.297 283.894 1.00 129.48 160 Bj 1 \nATOM 880  C CD2 . LEU Q 17 160 ? 141.543 273.865 281.466 1.00 129.48 160 Bj 1 \nATOM 881  N N   . VAL Q 17 161 ? 138.908 269.869 283.754 1.00 136.87 161 Bj 1 \nATOM 882  C CA  . VAL Q 17 161 ? 137.973 268.976 284.427 1.00 136.87 161 Bj 1 \nATOM 883  C C   . VAL Q 17 161 ? 137.583 269.581 285.768 1.00 136.87 161 Bj 1 \nATOM 884  O O   . VAL Q 17 161 ? 138.402 270.219 286.438 1.00 136.87 161 Bj 1 \nATOM 885  C CB  . 
VAL Q 17 161 ? 138.566 267.564 284.611 1.00 136.87 161 Bj 1 \nATOM 886  C CG1 . VAL Q 17 161 ? 138.693 266.867 283.267 1.00 136.87 161 Bj 1 \nATOM 887  C CG2 . VAL Q 17 161 ? 139.917 267.637 285.303 1.00 136.87 161 Bj 1 \nATOM 888  N N   . ARG Q 17 162 ? 136.323 269.392 286.149 1.00 151.13 162 Bj 1 \nATOM 889  C CA  . ARG Q 17 162 ? 135.837 269.829 287.450 1.00 151.13 162 Bj 1 \nATOM 890  C C   . ARG Q 17 162 ? 135.852 268.656 288.420 1.00 151.13 162 Bj 1 \nATOM 891  O O   . ARG Q 17 162 ? 135.243 267.615 288.155 1.00 151.13 162 Bj 1 \nATOM 892  C CB  . ARG Q 17 162 ? 134.425 270.405 287.339 1.00 151.13 162 Bj 1 \nATOM 893  C CG  . ARG Q 17 162 ? 133.794 270.771 288.675 1.00 151.13 162 Bj 1 \nATOM 894  C CD  . ARG Q 17 162 ? 134.649 271.772 289.435 1.00 151.13 162 Bj 1 \nATOM 895  N NE  . ARG Q 17 162 ? 134.041 272.166 290.702 1.00 151.13 162 Bj 1 \nATOM 896  C CZ  . ARG Q 17 162 ? 134.595 273.012 291.565 1.00 151.13 162 Bj 1 \nATOM 897  N NH1 . ARG Q 17 162 ? 135.775 273.556 291.298 1.00 151.13 162 Bj 1 \nATOM 898  N NH2 . ARG Q 17 162 ? 133.971 273.316 292.694 1.00 151.13 162 Bj 1 \nATOM 899  N N   . GLU Q 17 163 ? 136.552 268.826 289.540 1.00 162.19 163 Bj 1 \nATOM 900  C CA  . GLU Q 17 163 ? 136.655 267.786 290.555 1.00 162.19 163 Bj 1 \nATOM 901  C C   . GLU Q 17 163 ? 136.528 268.410 291.935 1.00 162.19 163 Bj 1 \nATOM 902  O O   . GLU Q 17 163 ? 137.204 269.398 292.237 1.00 162.19 163 Bj 1 \nATOM 903  C CB  . GLU Q 17 163 ? 137.981 267.024 290.442 1.00 162.19 163 Bj 1 \nATOM 904  C CG  . GLU Q 17 163 ? 138.128 266.212 289.165 1.00 162.19 163 Bj 1 \nATOM 905  C CD  . GLU Q 17 163 ? 139.362 265.332 289.175 1.00 162.19 163 Bj 1 \nATOM 906  O OE1 . GLU Q 17 163 ? 140.126 265.387 290.161 1.00 162.19 163 Bj 1 \nATOM 907  O OE2 . GLU Q 17 163 ? 139.566 264.582 288.197 1.00 162.19 163 Bj 1 \nATOM 908  N N   . LYS Q 17 164 ? 135.663 267.833 292.764 1.00 165.97 164 Bj 1 \nATOM 909  C CA  . LYS Q 17 164 ? 135.477 268.256 294.149 1.00 165.97 164 Bj 1 \nATOM 910  C C   . 
LYS Q 17 164 ? 136.057 267.171 295.050 1.00 165.97 164 Bj 1 \nATOM 911  O O   . LYS Q 17 164 ? 135.463 266.101 295.210 1.00 165.97 164 Bj 1 \nATOM 912  C CB  . LYS Q 17 164 ? 134.004 268.509 294.456 1.00 165.97 164 Bj 1 \nATOM 913  C CG  . LYS Q 17 164 ? 133.424 269.735 293.773 1.00 165.97 164 Bj 1 \nATOM 914  C CD  . LYS Q 17 164 ? 132.024 270.035 294.284 1.00 165.97 164 Bj 1 \nATOM 915  C CE  . LYS Q 17 164 ? 131.472 271.312 293.673 1.00 165.97 164 Bj 1 \nATOM 916  N NZ  . LYS Q 17 164 ? 130.115 271.638 294.195 1.00 165.97 164 Bj 1 \nATOM 917  N N   . LEU Q 17 165 ? 137.217 267.450 295.636 1.00 168.90 165 Bj 1 \nATOM 918  C CA  . LEU Q 17 165 ? 137.880 266.496 296.515 1.00 168.90 165 Bj 1 \nATOM 919  C C   . LEU Q 17 165 ? 137.275 266.587 297.915 1.00 168.90 165 Bj 1 \nATOM 920  O O   . LEU Q 17 165 ? 136.251 267.238 298.138 1.00 168.90 165 Bj 1 \nATOM 921  C CB  . LEU Q 17 165 ? 139.386 266.743 296.518 1.00 168.90 165 Bj 1 \nATOM 922  C CG  . LEU Q 17 165 ? 140.073 266.659 295.154 1.00 168.90 165 Bj 1 \nATOM 923  C CD1 . LEU Q 17 165 ? 141.578 266.829 295.293 1.00 168.90 165 Bj 1 \nATOM 924  C CD2 . LEU Q 17 165 ? 139.738 265.346 294.462 1.00 168.90 165 Bj 1 \nATOM 925  N N   . GLY Q 17 166 ? 137.912 265.927 298.884 1.00 171.61 166 Bj 1 \nATOM 926  C CA  . GLY Q 17 166 ? 137.369 265.914 300.232 1.00 171.61 166 Bj 1 \nATOM 927  C C   . GLY Q 17 166 ? 137.561 267.231 300.961 1.00 171.61 166 Bj 1 \nATOM 928  O O   . GLY Q 17 166 ? 136.656 267.703 301.656 1.00 171.61 166 Bj 1 \nATOM 929  N N   . ASP Q 17 167 ? 138.736 267.843 300.815 1.00 174.91 167 Bj 1 \nATOM 930  C CA  . ASP Q 17 167 ? 139.046 269.091 301.495 1.00 174.91 167 Bj 1 \nATOM 931  C C   . ASP Q 17 167 ? 139.291 270.254 300.545 1.00 174.91 167 Bj 1 \nATOM 932  O O   . ASP Q 17 167 ? 139.620 271.352 301.010 1.00 174.91 167 Bj 1 \nATOM 933  C CB  . ASP Q 17 167 ? 140.268 268.910 302.408 1.00 174.91 167 Bj 1 \nATOM 934  C CG  . ASP Q 17 167 ? 141.477 268.372 301.667 1.00 174.91 167 Bj 1 \nATOM 935  O OD1 . 
ASP Q 17 167 ? 142.126 269.149 300.937 1.00 174.91 167 Bj 1 \nATOM 936  O OD2 . ASP Q 17 167 ? 141.778 267.169 301.815 1.00 174.91 167 Bj 1 \nATOM 937  N N   . GLN Q 17 168 ? 139.144 270.054 299.236 1.00 175.00 168 Bj 1 \nATOM 938  C CA  . GLN Q 17 168 ? 139.378 271.108 298.261 1.00 175.00 168 Bj 1 \nATOM 939  C C   . GLN Q 17 168 ? 138.382 270.985 297.119 1.00 175.00 168 Bj 1 \nATOM 940  O O   . GLN Q 17 168 ? 138.082 269.879 296.661 1.00 175.00 168 Bj 1 \nATOM 941  C CB  . GLN Q 17 168 ? 140.810 271.056 297.710 1.00 175.00 168 Bj 1 \nATOM 942  C CG  . GLN Q 17 168 ? 141.878 271.477 298.705 1.00 175.00 168 Bj 1 \nATOM 943  C CD  . GLN Q 17 168 ? 143.281 271.320 298.157 1.00 175.00 168 Bj 1 \nATOM 944  O OE1 . GLN Q 17 168 ? 143.477 270.789 297.063 1.00 175.00 168 Bj 1 \nATOM 945  N NE2 . GLN Q 17 168 ? 144.267 271.783 298.916 1.00 175.00 168 Bj 1 \nATOM 946  N N   . ASP Q 17 169 ? 137.876 272.129 296.665 1.00 168.27 169 Bj 1 \nATOM 947  C CA  . ASP Q 17 169 ? 136.985 272.221 295.510 1.00 168.27 169 Bj 1 \nATOM 948  C C   . ASP Q 17 169 ? 137.646 273.173 294.517 1.00 168.27 169 Bj 1 \nATOM 949  O O   . ASP Q 17 169 ? 137.390 274.379 294.534 1.00 168.27 169 Bj 1 \nATOM 950  C CB  . ASP Q 17 169 ? 135.589 272.706 295.915 1.00 168.27 169 Bj 1 \nATOM 951  C CG  . ASP Q 17 169 ? 134.950 271.832 296.978 1.00 168.27 169 Bj 1 \nATOM 952  O OD1 . ASP Q 17 169 ? 135.285 270.631 297.048 1.00 168.27 169 Bj 1 \nATOM 953  O OD2 . ASP Q 17 169 ? 134.109 272.348 297.743 1.00 168.27 169 Bj 1 \nATOM 954  N N   . ILE Q 17 170 ? 138.499 272.629 293.653 1.00 159.42 170 Bj 1 \nATOM 955  C CA  . ILE Q 17 170 ? 139.305 273.423 292.734 1.00 159.42 170 Bj 1 \nATOM 956  C C   . ILE Q 17 170 ? 138.930 273.073 291.301 1.00 159.42 170 Bj 1 \nATOM 957  O O   . ILE Q 17 170 ? 138.527 271.941 291.010 1.00 159.42 170 Bj 1 \nATOM 958  C CB  . ILE Q 17 170 ? 140.815 273.204 292.968 1.00 159.42 170 Bj 1 \nATOM 959  C CG1 . ILE Q 17 170 ? 141.172 271.723 292.823 1.00 159.42 170 Bj 1 \nATOM 960  C CG2 . 
ILE Q 17 170 ? 141.225 273.726 294.336 1.00 159.42 170 Bj 1 \nATOM 961  C CD1 . ILE Q 17 170 ? 142.645 271.427 293.007 1.00 159.42 170 Bj 1 \nATOM 962  N N   . TRP Q 17 171 ? 139.059 274.056 290.411 1.00 144.42 171 Bj 1 \nATOM 963  C CA  . TRP Q 17 171 ? 138.893 273.855 288.972 1.00 144.42 171 Bj 1 \nATOM 964  C C   . TRP Q 17 171 ? 140.241 273.390 288.437 1.00 144.42 171 Bj 1 \nATOM 965  O O   . TRP Q 17 171 ? 141.054 274.182 287.960 1.00 144.42 171 Bj 1 \nATOM 966  C CB  . TRP Q 17 171 ? 138.414 275.138 288.303 1.00 144.42 171 Bj 1 \nATOM 967  C CG  . TRP Q 17 171 ? 138.043 274.985 286.860 1.00 144.42 171 Bj 1 \nATOM 968  C CD1 . TRP Q 17 171 ? 138.831 275.252 285.779 1.00 144.42 171 Bj 1 \nATOM 969  C CD2 . TRP Q 17 171 ? 136.785 274.539 286.340 1.00 144.42 171 Bj 1 \nATOM 970  N NE1 . TRP Q 17 171 ? 138.144 274.997 284.618 1.00 144.42 171 Bj 1 \nATOM 971  C CE2 . TRP Q 17 171 ? 136.885 274.557 284.935 1.00 144.42 171 Bj 1 \nATOM 972  C CE3 . TRP Q 17 171 ? 135.586 274.124 286.925 1.00 144.42 171 Bj 1 \nATOM 973  C CZ2 . TRP Q 17 171 ? 135.832 274.177 284.106 1.00 144.42 171 Bj 1 \nATOM 974  C CZ3 . TRP Q 17 171 ? 134.541 273.747 286.101 1.00 144.42 171 Bj 1 \nATOM 975  C CH2 . TRP Q 17 171 ? 134.672 273.775 284.707 1.00 144.42 171 Bj 1 \nATOM 976  N N   . MET Q 17 172 ? 140.479 272.086 288.520 1.00 147.69 172 Bj 1 \nATOM 977  C CA  . MET Q 17 172 ? 141.806 271.514 288.352 1.00 147.69 172 Bj 1 \nATOM 978  C C   . MET Q 17 172 ? 142.015 270.976 286.940 1.00 147.69 172 Bj 1 \nATOM 979  O O   . MET Q 17 172 ? 141.082 270.507 286.285 1.00 147.69 172 Bj 1 \nATOM 980  C CB  . MET Q 17 172 ? 142.030 270.391 289.368 1.00 147.69 172 Bj 1 \nATOM 981  C CG  . MET Q 17 172 ? 143.468 269.917 289.488 1.00 147.69 172 Bj 1 \nATOM 982  S SD  . MET Q 17 172 ? 143.610 268.411 290.466 1.00 147.69 172 Bj 1 \nATOM 983  C CE  . MET Q 17 172 ? 142.770 267.241 289.402 1.00 147.69 172 Bj 1 \nATOM 984  N N   . LEU Q 17 173 ? 143.260 271.057 286.478 1.00 139.16 173 Bj 1 \nATOM 985  C CA  . 
LEU Q 17 173 ? 143.650 270.404 285.241 1.00 139.16 173 Bj 1 \nATOM 986  C C   . LEU Q 17 173 ? 143.738 268.894 285.468 1.00 139.16 173 Bj 1 \nATOM 987  O O   . LEU Q 17 173 ? 143.996 268.445 286.588 1.00 139.16 173 Bj 1 \nATOM 988  C CB  . LEU Q 17 173 ? 144.996 270.950 284.764 1.00 139.16 173 Bj 1 \nATOM 989  C CG  . LEU Q 17 173 ? 145.334 270.960 283.270 1.00 139.16 173 Bj 1 \nATOM 990  C CD1 . LEU Q 17 173 ? 144.311 271.766 282.496 1.00 139.16 173 Bj 1 \nATOM 991  C CD2 . LEU Q 17 173 ? 146.725 271.512 283.037 1.00 139.16 173 Bj 1 \nATOM 992  N N   . PRO Q 17 174 ? 143.500 268.080 284.423 1.00 136.31 174 Bj 1 \nATOM 993  C CA  . PRO Q 17 174 ? 143.610 266.621 284.586 1.00 136.31 174 Bj 1 \nATOM 994  C C   . PRO Q 17 174 ? 144.959 266.176 285.134 1.00 136.31 174 Bj 1 \nATOM 995  O O   . PRO Q 17 174 ? 146.003 266.377 284.503 1.00 136.31 174 Bj 1 \nATOM 996  C CB  . PRO Q 17 174 ? 143.377 266.087 283.164 1.00 136.31 174 Bj 1 \nATOM 997  C CG  . PRO Q 17 174 ? 143.447 267.291 282.257 1.00 136.31 174 Bj 1 \nATOM 998  C CD  . PRO Q 17 174 ? 142.983 268.434 283.092 1.00 136.31 174 Bj 1 \nATOM 999  N N   . GLN Q 17 175 ? 144.935 265.578 286.323 1.00 135.35 175 Bj 1 \nATOM 1000 C CA  . GLN Q 17 175 ? 146.121 265.112 287.030 1.00 135.35 175 Bj 1 \nATOM 1001 C C   . GLN Q 17 175 ? 146.040 263.602 287.238 1.00 135.35 175 Bj 1 \nATOM 1002 O O   . GLN Q 17 175 ? 145.028 262.962 286.944 1.00 135.35 175 Bj 1 \nATOM 1003 C CB  . GLN Q 17 175 ? 146.278 265.834 288.372 1.00 135.35 175 Bj 1 \nATOM 1004 C CG  . GLN Q 17 175 ? 146.579 267.318 288.255 1.00 135.35 175 Bj 1 \nATOM 1005 C CD  . GLN Q 17 175 ? 146.837 267.965 289.602 1.00 135.35 175 Bj 1 \nATOM 1006 O OE1 . GLN Q 17 175 ? 146.707 267.325 290.646 1.00 135.35 175 Bj 1 \nATOM 1007 N NE2 . GLN Q 17 175 ? 147.204 269.241 289.585 1.00 135.35 175 Bj 1 \nATOM 1008 N N   . SER Q 17 176 ? 147.130 263.036 287.754 1.00 133.75 176 Bj 1 \nATOM 1009 C CA  . SER Q 17 176 ? 147.220 261.598 287.965 1.00 133.75 176 Bj 1 \nATOM 1010 C C   . 
SER Q 17 176 ? 148.177 261.315 289.116 1.00 133.75 176 Bj 1 \nATOM 1011 O O   . SER Q 17 176 ? 148.730 262.227 289.736 1.00 133.75 176 Bj 1 \nATOM 1012 C CB  . SER Q 17 176 ? 147.683 260.882 286.694 1.00 133.75 176 Bj 1 \nATOM 1013 O OG  . SER Q 17 176 ? 146.894 261.256 285.582 1.00 133.75 176 Bj 1 \nATOM 1014 N N   . ASP Q 17 177 ? 148.364 260.026 289.395 1.00 134.79 177 Bj 1 \nATOM 1015 C CA  . ASP Q 17 177 ? 149.341 259.551 290.362 1.00 134.79 177 Bj 1 \nATOM 1016 C C   . ASP Q 17 177 ? 149.995 258.296 289.806 1.00 134.79 177 Bj 1 \nATOM 1017 O O   . ASP Q 17 177 ? 149.390 257.559 289.023 1.00 134.79 177 Bj 1 \nATOM 1018 C CB  . ASP Q 17 177 ? 148.706 259.260 291.728 1.00 134.79 177 Bj 1 \nATOM 1019 C CG  . ASP Q 17 177 ? 148.221 260.516 292.424 1.00 134.79 177 Bj 1 \nATOM 1020 O OD1 . ASP Q 17 177 ? 147.166 261.051 292.025 1.00 134.79 177 Bj 1 \nATOM 1021 O OD2 . ASP Q 17 177 ? 148.898 260.969 293.370 1.00 134.79 177 Bj 1 \nATOM 1022 N N   . TRP Q 17 178 ? 151.238 258.056 290.216 1.00 142.13 178 Bj 1 \nATOM 1023 C CA  . TRP Q 17 178 ? 152.031 256.996 289.615 1.00 142.13 178 Bj 1 \nATOM 1024 C C   . TRP Q 17 178 ? 153.041 256.465 290.620 1.00 142.13 178 Bj 1 \nATOM 1025 O O   . TRP Q 17 178 ? 153.592 257.217 291.429 1.00 142.13 178 Bj 1 \nATOM 1026 C CB  . TRP Q 17 178 ? 152.752 257.500 288.360 1.00 142.13 178 Bj 1 \nATOM 1027 C CG  . TRP Q 17 178 ? 153.556 258.740 288.606 1.00 142.13 178 Bj 1 \nATOM 1028 C CD1 . TRP Q 17 178 ? 153.092 260.023 288.654 1.00 142.13 178 Bj 1 \nATOM 1029 C CD2 . TRP Q 17 178 ? 154.966 258.815 288.843 1.00 142.13 178 Bj 1 \nATOM 1030 N NE1 . TRP Q 17 178 ? 154.126 260.891 288.906 1.00 142.13 178 Bj 1 \nATOM 1031 C CE2 . TRP Q 17 178 ? 155.287 260.173 289.026 1.00 142.13 178 Bj 1 \nATOM 1032 C CE3 . TRP Q 17 178 ? 155.987 257.865 288.916 1.00 142.13 178 Bj 1 \nATOM 1033 C CZ2 . TRP Q 17 178 ? 156.588 260.604 289.277 1.00 142.13 178 Bj 1 \nATOM 1034 C CZ3 . TRP Q 17 178 ? 157.276 258.293 289.166 1.00 142.13 178 Bj 1 \nATOM 1035 C CH2 . 
TRP Q 17 178 ? 157.565 259.650 289.344 1.00 142.13 178 Bj 1 \nATOM 1036 N N   . GLN Q 17 179 ? 153.282 255.155 290.554 1.00 140.75 179 Bj 1 \nATOM 1037 C CA  . GLN Q 17 179 ? 154.303 254.528 291.375 1.00 140.75 179 Bj 1 \nATOM 1038 C C   . GLN Q 17 179 ? 155.685 254.777 290.770 1.00 140.75 179 Bj 1 \nATOM 1039 O O   . GLN Q 17 179 ? 155.812 254.956 289.556 1.00 140.75 179 Bj 1 \nATOM 1040 C CB  . GLN Q 17 179 ? 154.047 253.026 291.496 1.00 140.75 179 Bj 1 \nATOM 1041 C CG  . GLN Q 17 179 ? 154.330 252.219 290.233 1.00 140.75 179 Bj 1 \nATOM 1042 C CD  . GLN Q 17 179 ? 153.239 252.345 289.187 1.00 140.75 179 Bj 1 \nATOM 1043 O OE1 . GLN Q 17 179 ? 152.254 253.059 289.380 1.00 140.75 179 Bj 1 \nATOM 1044 N NE2 . GLN Q 17 179 ? 153.408 251.645 288.072 1.00 140.75 179 Bj 1 \nATOM 1045 N N   . PRO Q 17 180 ? 156.741 254.792 291.602 1.00 139.20 180 Bj 1 \nATOM 1046 C CA  . PRO Q 17 180 ? 158.082 255.138 291.101 1.00 139.20 180 Bj 1 \nATOM 1047 C C   . PRO Q 17 180 ? 158.545 254.295 289.922 1.00 139.20 180 Bj 1 \nATOM 1048 O O   . PRO Q 17 180 ? 159.406 254.726 289.148 1.00 139.20 180 Bj 1 \nATOM 1049 C CB  . PRO Q 17 180 ? 158.976 254.914 292.327 1.00 139.20 180 Bj 1 \nATOM 1050 C CG  . PRO Q 17 180 ? 158.072 255.131 293.486 1.00 139.20 180 Bj 1 \nATOM 1051 C CD  . PRO Q 17 180 ? 156.734 254.597 293.063 1.00 139.20 180 Bj 1 \nATOM 1052 N N   . GLY Q 17 181 ? 157.983 253.098 289.770 1.00 135.25 181 Bj 1 \nATOM 1053 C CA  . GLY Q 17 181 ? 158.324 252.240 288.655 1.00 135.25 181 Bj 1 \nATOM 1054 C C   . GLY Q 17 181 ? 157.674 252.589 287.337 1.00 135.25 181 Bj 1 \nATOM 1055 O O   . GLY Q 17 181 ? 157.880 251.875 286.352 1.00 135.25 181 Bj 1 \nATOM 1056 N N   . GLU Q 17 182 ? 156.897 253.667 287.282 1.00 137.08 182 Bj 1 \nATOM 1057 C CA  . GLU Q 17 182 ? 156.183 254.062 286.078 1.00 137.08 182 Bj 1 \nATOM 1058 C C   . GLU Q 17 182 ? 156.697 255.404 285.572 1.00 137.08 182 Bj 1 \nATOM 1059 O O   . GLU Q 17 182 ? 157.089 256.276 286.354 1.00 137.08 182 Bj 1 \nATOM 1060 C CB  . 
GLU Q 17 182 ? 154.675 254.141 286.339 1.00 137.08 182 Bj 1 \nATOM 1061 C CG  . GLU Q 17 182 ? 153.829 254.307 285.086 1.00 137.08 182 Bj 1 \nATOM 1062 C CD  . GLU Q 17 182 ? 152.344 254.191 285.367 1.00 137.08 182 Bj 1 \nATOM 1063 O OE1 . GLU Q 17 182 ? 151.980 253.776 286.487 1.00 137.08 182 Bj 1 \nATOM 1064 O OE2 . GLU Q 17 182 ? 151.541 254.515 284.466 1.00 137.08 182 Bj 1 \nATOM 1065 N N   . THR Q 17 183 ? 156.690 255.560 284.252 1.00 130.92 183 Bj 1 \nATOM 1066 C CA  . THR Q 17 183 ? 157.170 256.770 283.603 1.00 130.92 183 Bj 1 \nATOM 1067 C C   . THR Q 17 183 ? 156.071 257.827 283.567 1.00 130.92 183 Bj 1 \nATOM 1068 O O   . THR Q 17 183 ? 154.878 257.512 283.596 1.00 130.92 183 Bj 1 \nATOM 1069 C CB  . THR Q 17 183 ? 157.647 256.460 282.182 1.00 130.92 183 Bj 1 \nATOM 1070 O OG1 . THR Q 17 183 ? 158.349 255.210 282.177 1.00 130.92 183 Bj 1 \nATOM 1071 C CG2 . THR Q 17 183 ? 158.582 257.550 281.671 1.00 130.92 183 Bj 1 \nATOM 1072 N N   . LEU Q 17 184 ? 156.490 259.094 283.506 1.00 129.02 184 Bj 1 \nATOM 1073 C CA  . LEU Q 17 184 ? 155.532 260.194 283.444 1.00 129.02 184 Bj 1 \nATOM 1074 C C   . LEU Q 17 184 ? 154.716 260.147 282.159 1.00 129.02 184 Bj 1 \nATOM 1075 O O   . LEU Q 17 184 ? 153.502 260.384 282.173 1.00 129.02 184 Bj 1 \nATOM 1076 C CB  . LEU Q 17 184 ? 156.266 261.528 283.563 1.00 129.02 184 Bj 1 \nATOM 1077 C CG  . LEU Q 17 184 ? 157.066 261.730 284.849 1.00 129.02 184 Bj 1 \nATOM 1078 C CD1 . LEU Q 17 184 ? 157.941 262.967 284.754 1.00 129.02 184 Bj 1 \nATOM 1079 C CD2 . LEU Q 17 184 ? 156.125 261.830 286.034 1.00 129.02 184 Bj 1 \nATOM 1080 N N   . ARG Q 17 185 ? 155.367 259.842 281.035 1.00 125.72 185 Bj 1 \nATOM 1081 C CA  . ARG Q 17 185 ? 154.653 259.763 279.767 1.00 125.72 185 Bj 1 \nATOM 1082 C C   . ARG Q 17 185 ? 153.671 258.598 279.760 1.00 125.72 185 Bj 1 \nATOM 1083 O O   . ARG Q 17 185 ? 152.540 258.735 279.279 1.00 125.72 185 Bj 1 \nATOM 1084 C CB  . ARG Q 17 185 ? 155.652 259.644 278.618 1.00 125.72 185 Bj 1 \nATOM 1085 C CG  . 
ARG Q 17 185 ? 155.034 259.681 277.235 1.00 125.72 185 Bj 1 \nATOM 1086 C CD  . ARG Q 17 185 ? 156.064 260.119 276.211 1.00 125.72 185 Bj 1 \nATOM 1087 N NE  . ARG Q 17 185 ? 155.563 260.025 274.845 1.00 125.72 185 Bj 1 \nATOM 1088 C CZ  . ARG Q 17 185 ? 156.149 260.598 273.800 1.00 125.72 185 Bj 1 \nATOM 1089 N NH1 . ARG Q 17 185 ? 157.250 261.316 273.971 1.00 125.72 185 Bj 1 \nATOM 1090 N NH2 . ARG Q 17 185 ? 155.631 260.462 272.587 1.00 125.72 185 Bj 1 \nATOM 1091 N N   . GLN Q 17 186 ? 154.083 257.448 280.298 1.00 132.51 186 Bj 1 \nATOM 1092 C CA  . GLN Q 17 186 ? 153.167 256.318 280.411 1.00 132.51 186 Bj 1 \nATOM 1093 C C   . GLN Q 17 186 ? 151.994 256.642 281.326 1.00 132.51 186 Bj 1 \nATOM 1094 O O   . GLN Q 17 186 ? 150.860 256.229 281.055 1.00 132.51 186 Bj 1 \nATOM 1095 C CB  . GLN Q 17 186 ? 153.914 255.087 280.925 1.00 132.51 186 Bj 1 \nATOM 1096 C CG  . GLN Q 17 186 ? 155.119 254.696 280.089 1.00 132.51 186 Bj 1 \nATOM 1097 C CD  . GLN Q 17 186 ? 155.882 253.529 280.683 1.00 132.51 186 Bj 1 \nATOM 1098 O OE1 . GLN Q 17 186 ? 155.493 252.978 281.713 1.00 132.51 186 Bj 1 \nATOM 1099 N NE2 . GLN Q 17 186 ? 156.978 253.147 280.037 1.00 132.51 186 Bj 1 \nATOM 1100 N N   . THR Q 17 187 ? 152.245 257.383 282.408 1.00 131.91 187 Bj 1 \nATOM 1101 C CA  . THR Q 17 187 ? 151.163 257.778 283.304 1.00 131.91 187 Bj 1 \nATOM 1102 C C   . THR Q 17 187 ? 150.188 258.718 282.606 1.00 131.91 187 Bj 1 \nATOM 1103 O O   . THR Q 17 187 ? 148.971 258.593 282.773 1.00 131.91 187 Bj 1 \nATOM 1104 C CB  . THR Q 17 187 ? 151.737 258.432 284.560 1.00 131.91 187 Bj 1 \nATOM 1105 O OG1 . THR Q 17 187 ? 152.712 257.561 285.147 1.00 131.91 187 Bj 1 \nATOM 1106 C CG2 . THR Q 17 187 ? 150.634 258.703 285.570 1.00 131.91 187 Bj 1 \nATOM 1107 N N   . ALA Q 17 188 ? 150.705 259.659 281.814 1.00 133.19 188 Bj 1 \nATOM 1108 C CA  . ALA Q 17 188 ? 149.827 260.556 281.066 1.00 133.19 188 Bj 1 \nATOM 1109 C C   . ALA Q 17 188 ? 149.020 259.794 280.020 1.00 133.19 188 Bj 1 \nATOM 1110 O O   . 
ALA Q 17 188 ? 147.848 260.110 279.775 1.00 133.19 188 Bj 1 \nATOM 1111 C CB  . ALA Q 17 188 ? 150.647 261.666 280.409 1.00 133.19 188 Bj 1 \nATOM 1112 N N   . GLU Q 17 189 ? 149.632 258.789 279.390 1.00 135.20 189 Bj 1 \nATOM 1113 C CA  . GLU Q 17 189 ? 148.905 257.958 278.433 1.00 135.20 189 Bj 1 \nATOM 1114 C C   . GLU Q 17 189 ? 147.783 257.190 279.121 1.00 135.20 189 Bj 1 \nATOM 1115 O O   . GLU Q 17 189 ? 146.649 257.145 278.628 1.00 135.20 189 Bj 1 \nATOM 1116 C CB  . GLU Q 17 189 ? 149.869 257.000 277.732 1.00 135.20 189 Bj 1 \nATOM 1117 C CG  . GLU Q 17 189 ? 150.860 257.688 276.807 1.00 135.20 189 Bj 1 \nATOM 1118 C CD  . GLU Q 17 189 ? 151.898 256.735 276.247 1.00 135.20 189 Bj 1 \nATOM 1119 O OE1 . GLU Q 17 189 ? 151.856 255.537 276.598 1.00 135.20 189 Bj 1 \nATOM 1120 O OE2 . GLU Q 17 189 ? 152.755 257.183 275.457 1.00 135.20 189 Bj 1 \nATOM 1121 N N   . ARG Q 17 190 ? 148.085 256.576 280.268 1.00 137.16 190 Bj 1 \nATOM 1122 C CA  . ARG Q 17 190 ? 147.053 255.885 281.035 1.00 137.16 190 Bj 1 \nATOM 1123 C C   . ARG Q 17 190 ? 145.950 256.847 281.459 1.00 137.16 190 Bj 1 \nATOM 1124 O O   . ARG Q 17 190 ? 144.768 256.483 281.473 1.00 137.16 190 Bj 1 \nATOM 1125 C CB  . ARG Q 17 190 ? 147.674 255.206 282.256 1.00 137.16 190 Bj 1 \nATOM 1126 C CG  . ARG Q 17 190 ? 146.670 254.507 283.159 1.00 137.16 190 Bj 1 \nATOM 1127 C CD  . ARG Q 17 190 ? 147.358 253.841 284.338 1.00 137.16 190 Bj 1 \nATOM 1128 N NE  . ARG Q 17 190 ? 148.133 254.792 285.129 1.00 137.16 190 Bj 1 \nATOM 1129 C CZ  . ARG Q 17 190 ? 147.632 255.522 286.120 1.00 137.16 190 Bj 1 \nATOM 1130 N NH1 . ARG Q 17 190 ? 146.352 255.413 286.445 1.00 137.16 190 Bj 1 \nATOM 1131 N NH2 . ARG Q 17 190 ? 148.412 256.362 286.786 1.00 137.16 190 Bj 1 \nATOM 1132 N N   . THR Q 17 191 ? 146.318 258.084 281.795 1.00 139.17 191 Bj 1 \nATOM 1133 C CA  . THR Q 17 191 ? 145.327 259.090 282.158 1.00 139.17 191 Bj 1 \nATOM 1134 C C   . THR Q 17 191 ? 144.388 259.378 280.996 1.00 139.17 191 Bj 1 \nATOM 1135 O O   . 
THR Q 17 191 ? 143.164 259.268 281.131 1.00 139.17 191 Bj 1 \nATOM 1136 C CB  . THR Q 17 191 ? 146.024 260.373 282.606 1.00 139.17 191 Bj 1 \nATOM 1137 O OG1 . THR Q 17 191 ? 146.894 260.085 283.707 1.00 139.17 191 Bj 1 \nATOM 1138 C CG2 . THR Q 17 191 ? 144.999 261.416 283.027 1.00 139.17 191 Bj 1 \nATOM 1139 N N   . LEU Q 17 192 ? 144.945 259.747 279.841 1.00 141.63 192 Bj 1 \nATOM 1140 C CA  . LEU Q 17 192 ? 144.109 260.056 278.687 1.00 141.63 192 Bj 1 \nATOM 1141 C C   . LEU Q 17 192 ? 143.341 258.840 278.185 1.00 141.63 192 Bj 1 \nATOM 1142 O O   . LEU Q 17 192 ? 142.352 259.004 277.463 1.00 141.63 192 Bj 1 \nATOM 1143 C CB  . LEU Q 17 192 ? 144.956 260.651 277.557 1.00 141.63 192 Bj 1 \nATOM 1144 C CG  . LEU Q 17 192 ? 146.099 259.830 276.954 1.00 141.63 192 Bj 1 \nATOM 1145 C CD1 . LEU Q 17 192 ? 145.628 258.957 275.794 1.00 141.63 192 Bj 1 \nATOM 1146 C CD2 . LEU Q 17 192 ? 147.225 260.747 276.511 1.00 141.63 192 Bj 1 \nATOM 1147 N N   . ALA Q 17 193 ? 143.770 257.628 278.546 1.00 143.93 193 Bj 1 \nATOM 1148 C CA  . ALA Q 17 193 ? 143.045 256.438 278.119 1.00 143.93 193 Bj 1 \nATOM 1149 C C   . ALA Q 17 193 ? 141.916 256.066 279.074 1.00 143.93 193 Bj 1 \nATOM 1150 O O   . ALA Q 17 193 ? 140.870 255.584 278.626 1.00 143.93 193 Bj 1 \nATOM 1151 C CB  . ALA Q 17 193 ? 144.010 255.261 277.971 1.00 143.93 193 Bj 1 \nATOM 1152 N N   . THR Q 17 194 ? 142.098 256.279 280.377 1.00 145.46 194 Bj 1 \nATOM 1153 C CA  . THR Q 17 194 ? 141.129 255.841 281.375 1.00 145.46 194 Bj 1 \nATOM 1154 C C   . THR Q 17 194 ? 140.242 256.970 281.888 1.00 145.46 194 Bj 1 \nATOM 1155 O O   . THR Q 17 194 ? 139.014 256.846 281.870 1.00 145.46 194 Bj 1 \nATOM 1156 C CB  . THR Q 17 194 ? 141.855 255.179 282.553 1.00 145.46 194 Bj 1 \nATOM 1157 O OG1 . THR Q 17 194 ? 142.819 256.090 283.094 1.00 145.46 194 Bj 1 \nATOM 1158 C CG2 . THR Q 17 194 ? 142.563 253.912 282.096 1.00 145.46 194 Bj 1 \nATOM 1159 N N   . LEU Q 17 195 ? 140.840 258.069 282.358 1.00 142.21 195 Bj 1 \nATOM 1160 C CA  . 
LEU Q 17 195 ? 140.050 259.165 282.911 1.00 142.21 195 Bj 1 \nATOM 1161 C C   . LEU Q 17 195 ? 139.145 259.793 281.860 1.00 142.21 195 Bj 1 \nATOM 1162 O O   . LEU Q 17 195 ? 138.038 260.239 282.181 1.00 142.21 195 Bj 1 \nATOM 1163 C CB  . LEU Q 17 195 ? 140.968 260.229 283.517 1.00 142.21 195 Bj 1 \nATOM 1164 C CG  . LEU Q 17 195 ? 141.597 259.972 284.891 1.00 142.21 195 Bj 1 \nATOM 1165 C CD1 . LEU Q 17 195 ? 142.698 258.923 284.829 1.00 142.21 195 Bj 1 \nATOM 1166 C CD2 . LEU Q 17 195 ? 142.128 261.271 285.480 1.00 142.21 195 Bj 1 \nATOM 1167 N N   . SER Q 17 196 ? 139.594 259.839 280.604 1.00 140.98 196 Bj 1 \nATOM 1168 C CA  . SER Q 17 196 ? 138.776 260.410 279.541 1.00 140.98 196 Bj 1 \nATOM 1169 C C   . SER Q 17 196 ? 137.616 259.503 279.154 1.00 140.98 196 Bj 1 \nATOM 1170 O O   . SER Q 17 196 ? 136.610 259.998 278.635 1.00 140.98 196 Bj 1 \nATOM 1171 C CB  . SER Q 17 196 ? 139.642 260.710 278.317 1.00 140.98 196 Bj 1 \nATOM 1172 O OG  . SER Q 17 196 ? 138.870 261.273 277.272 1.00 140.98 196 Bj 1 \nATOM 1173 N N   . GLU Q 17 197 ? 137.739 258.194 279.389 1.00 135.62 197 Bj 1 \nATOM 1174 C CA  . GLU Q 17 197 ? 136.656 257.236 279.156 1.00 135.62 197 Bj 1 \nATOM 1175 C C   . GLU Q 17 197 ? 136.208 257.234 277.696 1.00 135.62 197 Bj 1 \nATOM 1176 O O   . GLU Q 17 197 ? 135.013 257.193 277.396 1.00 135.62 197 Bj 1 \nATOM 1177 C CB  . GLU Q 17 197 ? 135.470 257.510 280.085 1.00 135.62 197 Bj 1 \nATOM 1178 C CG  . GLU Q 17 197 ? 135.840 257.617 281.554 1.00 135.62 197 Bj 1 \nATOM 1179 C CD  . GLU Q 17 197 ? 134.680 258.079 282.413 1.00 135.62 197 Bj 1 \nATOM 1180 O OE1 . GLU Q 17 197 ? 133.581 258.302 281.863 1.00 135.62 197 Bj 1 \nATOM 1181 O OE2 . GLU Q 17 197 ? 134.868 258.222 283.639 1.00 135.62 197 Bj 1 \nATOM 1182 N N   . ASN Q 17 198 ? 137.171 257.276 276.779 1.00 129.66 198 Bj 1 \nATOM 1183 C CA  . ASN Q 17 198 ? 136.857 257.290 275.358 1.00 129.66 198 Bj 1 \nATOM 1184 C C   . ASN Q 17 198 ? 138.089 256.875 274.568 1.00 129.66 198 Bj 1 \nATOM 1185 O O   . 
ASN Q 17 198 ? 139.210 256.881 275.082 1.00 129.66 198 Bj 1 \nATOM 1186 C CB  . ASN Q 17 198 ? 136.372 258.671 274.903 1.00 129.66 198 Bj 1 \nATOM 1187 C CG  . ASN Q 17 198 ? 137.500 259.681 274.800 1.00 129.66 198 Bj 1 \nATOM 1188 O OD1 . ASN Q 17 198 ? 138.430 259.675 275.605 1.00 129.66 198 Bj 1 \nATOM 1189 N ND2 . ASN Q 17 198 ? 137.425 260.552 273.801 1.00 129.66 198 Bj 1 \nATOM 1190 N N   . ASN Q 17 199 ? 137.862 256.515 273.307 1.00 121.02 199 Bj 1 \nATOM 1191 C CA  . ASN Q 17 199 ? 138.944 256.208 272.374 1.00 121.02 199 Bj 1 \nATOM 1192 C C   . ASN Q 17 199 ? 139.384 257.519 271.734 1.00 121.02 199 Bj 1 \nATOM 1193 O O   . ASN Q 17 199 ? 138.711 258.055 270.850 1.00 121.02 199 Bj 1 \nATOM 1194 C CB  . ASN Q 17 199 ? 138.496 255.185 271.335 1.00 121.02 199 Bj 1 \nATOM 1195 C CG  . ASN Q 17 199 ? 137.204 255.577 270.646 1.00 121.02 199 Bj 1 \nATOM 1196 O OD1 . ASN Q 17 199 ? 136.405 256.339 271.189 1.00 121.02 199 Bj 1 \nATOM 1197 N ND2 . ASN Q 17 199 ? 136.993 255.057 269.443 1.00 121.02 199 Bj 1 \nATOM 1198 N N   . MET Q 17 200 ? 140.516 258.044 272.190 1.00 123.96 200 Bj 1 \nATOM 1199 C CA  . MET Q 17 200 ? 141.014 259.341 271.760 1.00 123.96 200 Bj 1 \nATOM 1200 C C   . MET Q 17 200 ? 142.451 259.205 271.279 1.00 123.96 200 Bj 1 \nATOM 1201 O O   . MET Q 17 200 ? 143.258 258.501 271.895 1.00 123.96 200 Bj 1 \nATOM 1202 C CB  . MET Q 17 200 ? 140.927 260.358 272.901 1.00 123.96 200 Bj 1 \nATOM 1203 C CG  . MET Q 17 200 ? 141.315 261.768 272.517 1.00 123.96 200 Bj 1 \nATOM 1204 S SD  . MET Q 17 200 ? 141.001 262.928 273.857 1.00 123.96 200 Bj 1 \nATOM 1205 C CE  . MET Q 17 200 ? 141.986 262.202 275.165 1.00 123.96 200 Bj 1 \nATOM 1206 N N   . GLU Q 17 201 ? 142.767 259.880 270.176 1.00 115.66 201 Bj 1 \nATOM 1207 C CA  . GLU Q 17 201 ? 144.092 259.821 269.570 1.00 115.66 201 Bj 1 \nATOM 1208 C C   . GLU Q 17 201 ? 144.889 261.040 270.022 1.00 115.66 201 Bj 1 \nATOM 1209 O O   . GLU Q 17 201 ? 144.619 262.164 269.586 1.00 115.66 201 Bj 1 \nATOM 1210 C CB  . 
GLU Q 17 201 ? 143.988 259.759 268.048 1.00 115.66 201 Bj 1 \nATOM 1211 C CG  . GLU Q 17 201 ? 143.149 258.601 267.531 1.00 115.66 201 Bj 1 \nATOM 1212 C CD  . GLU Q 17 201 ? 143.120 258.531 266.017 1.00 115.66 201 Bj 1 \nATOM 1213 O OE1 . GLU Q 17 201 ? 143.950 259.207 265.373 1.00 115.66 201 Bj 1 \nATOM 1214 O OE2 . GLU Q 17 201 ? 142.265 257.803 265.470 1.00 115.66 201 Bj 1 \nATOM 1215 N N   . ALA Q 17 202 ? 145.869 260.814 270.892 1.00 117.10 202 Bj 1 \nATOM 1216 C CA  . ALA Q 17 202 ? 146.717 261.870 271.422 1.00 117.10 202 Bj 1 \nATOM 1217 C C   . ALA Q 17 202 ? 148.131 261.723 270.876 1.00 117.10 202 Bj 1 \nATOM 1218 O O   . ALA Q 17 202 ? 148.651 260.609 270.767 1.00 117.10 202 Bj 1 \nATOM 1219 C CB  . ALA Q 17 202 ? 146.744 261.840 272.952 1.00 117.10 202 Bj 1 \nATOM 1220 N N   . LYS Q 17 203 ? 148.748 262.853 270.539 1.00 120.82 203 Bj 1 \nATOM 1221 C CA  . LYS Q 17 203 ? 150.096 262.887 269.981 1.00 120.82 203 Bj 1 \nATOM 1222 C C   . LYS Q 17 203 ? 150.986 263.704 270.910 1.00 120.82 203 Bj 1 \nATOM 1223 O O   . LYS Q 17 203 ? 150.846 264.929 270.994 1.00 120.82 203 Bj 1 \nATOM 1224 C CB  . LYS Q 17 203 ? 150.087 263.476 268.572 1.00 120.82 203 Bj 1 \nATOM 1225 C CG  . LYS Q 17 203 ? 151.408 263.346 267.834 1.00 120.82 203 Bj 1 \nATOM 1226 C CD  . LYS Q 17 203 ? 151.757 261.888 267.591 1.00 120.82 203 Bj 1 \nATOM 1227 C CE  . LYS Q 17 203 ? 153.066 261.752 266.833 1.00 120.82 203 Bj 1 \nATOM 1228 N NZ  . LYS Q 17 203 ? 153.409 260.327 266.571 1.00 120.82 203 Bj 1 \nATOM 1229 N N   . PHE Q 17 204 ? 151.897 263.028 271.606 1.00 125.72 204 Bj 1 \nATOM 1230 C CA  . PHE Q 17 204 ? 152.832 263.707 272.490 1.00 125.72 204 Bj 1 \nATOM 1231 C C   . PHE Q 17 204 ? 153.972 264.322 271.689 1.00 125.72 204 Bj 1 \nATOM 1232 O O   . PHE Q 17 204 ? 154.445 263.744 270.707 1.00 125.72 204 Bj 1 \nATOM 1233 C CB  . PHE Q 17 204 ? 153.391 262.739 273.531 1.00 125.72 204 Bj 1 \nATOM 1234 C CG  . PHE Q 17 204 ? 152.415 262.383 274.614 1.00 125.72 204 Bj 1 \nATOM 1235 C CD1 . 
PHE Q 17 204 ? 151.538 261.325 274.454 1.00 125.72 204 Bj 1 \nATOM 1236 C CD2 . PHE Q 17 204 ? 152.379 263.106 275.795 1.00 125.72 204 Bj 1 \nATOM 1237 C CE1 . PHE Q 17 204 ? 150.641 260.996 275.451 1.00 125.72 204 Bj 1 \nATOM 1238 C CE2 . PHE Q 17 204 ? 151.484 262.782 276.795 1.00 125.72 204 Bj 1 \nATOM 1239 C CZ  . PHE Q 17 204 ? 150.615 261.725 276.624 1.00 125.72 204 Bj 1 \nATOM 1240 N N   . LEU Q 17 205 ? 154.414 265.504 272.120 1.00 121.24 205 Bj 1 \nATOM 1241 C CA  . LEU Q 17 205 ? 155.467 266.215 271.402 1.00 121.24 205 Bj 1 \nATOM 1242 C C   . LEU Q 17 205 ? 156.851 265.713 271.799 1.00 121.24 205 Bj 1 \nATOM 1243 O O   . LEU Q 17 205 ? 157.602 265.202 270.961 1.00 121.24 205 Bj 1 \nATOM 1244 C CB  . LEU Q 17 205 ? 155.344 267.719 271.658 1.00 121.24 205 Bj 1 \nATOM 1245 C CG  . LEU Q 17 205 ? 153.967 268.330 271.399 1.00 121.24 205 Bj 1 \nATOM 1246 C CD1 . LEU Q 17 205 ? 153.973 269.814 271.724 1.00 121.24 205 Bj 1 \nATOM 1247 C CD2 . LEU Q 17 205 ? 153.536 268.092 269.962 1.00 121.24 205 Bj 1 \nATOM 1248 N N   . GLY Q 17 206 ? 157.202 265.847 273.070 1.00 130.10 206 Bj 1 \nATOM 1249 C CA  . GLY Q 17 206 ? 158.515 265.444 273.539 1.00 130.10 206 Bj 1 \nATOM 1250 C C   . GLY Q 17 206 ? 158.419 264.700 274.853 1.00 130.10 206 Bj 1 \nATOM 1251 O O   . GLY Q 17 206 ? 157.446 264.831 275.598 1.00 130.10 206 Bj 1 \nATOM 1252 N N   . ASN Q 17 207 ? 159.458 263.909 275.133 1.00 132.28 207 Bj 1 \nATOM 1253 C CA  . ASN Q 17 207 ? 159.476 263.119 276.359 1.00 132.28 207 Bj 1 \nATOM 1254 C C   . ASN Q 17 207 ? 159.764 263.982 277.581 1.00 132.28 207 Bj 1 \nATOM 1255 O O   . ASN Q 17 207 ? 159.380 263.618 278.699 1.00 132.28 207 Bj 1 \nATOM 1256 C CB  . ASN Q 17 207 ? 160.510 261.999 276.242 1.00 132.28 207 Bj 1 \nATOM 1257 C CG  . ASN Q 17 207 ? 160.456 261.029 277.405 1.00 132.28 207 Bj 1 \nATOM 1258 O OD1 . ASN Q 17 207 ? 159.414 260.859 278.039 1.00 132.28 207 Bj 1 \nATOM 1259 N ND2 . ASN Q 17 207 ? 161.581 260.384 277.690 1.00 132.28 207 Bj 1 \nATOM 1260 N N   . 
ALA Q 17 208 ? 160.429 265.117 277.395 1.00 129.27 208 Bj 1 \nATOM 1261 C CA  . ALA Q 17 208 ? 160.739 265.987 278.515 1.00 129.27 208 Bj 1 \nATOM 1262 C C   . ALA Q 17 208 ? 159.476 266.692 279.008 1.00 129.27 208 Bj 1 \nATOM 1263 O O   . ALA Q 17 208 ? 158.549 266.940 278.230 1.00 129.27 208 Bj 1 \nATOM 1264 C CB  . ALA Q 17 208 ? 161.789 267.020 278.115 1.00 129.27 208 Bj 1 \nATOM 1265 N N   . PRO Q 17 209 ? 159.410 267.019 280.299 1.00 132.17 209 Bj 1 \nATOM 1266 C CA  . PRO Q 17 209 ? 158.236 267.726 280.821 1.00 132.17 209 Bj 1 \nATOM 1267 C C   . PRO Q 17 209 ? 158.110 269.117 280.221 1.00 132.17 209 Bj 1 \nATOM 1268 O O   . PRO Q 17 209 ? 159.065 269.686 279.688 1.00 132.17 209 Bj 1 \nATOM 1269 C CB  . PRO Q 17 209 ? 158.499 267.795 282.331 1.00 132.17 209 Bj 1 \nATOM 1270 C CG  . PRO Q 17 209 ? 159.515 266.734 282.598 1.00 132.17 209 Bj 1 \nATOM 1271 C CD  . PRO Q 17 209 ? 160.359 266.661 281.366 1.00 132.17 209 Bj 1 \nATOM 1272 N N   . CYS Q 17 210 ? 156.902 269.668 280.318 1.00 129.55 210 Bj 1 \nATOM 1273 C CA  . CYS Q 17 210 ? 156.616 271.006 279.817 1.00 129.55 210 Bj 1 \nATOM 1274 C C   . CYS Q 17 210 ? 156.563 272.051 280.922 1.00 129.55 210 Bj 1 \nATOM 1275 O O   . CYS Q 17 210 ? 156.967 273.196 280.703 1.00 129.55 210 Bj 1 \nATOM 1276 C CB  . CYS Q 17 210 ? 155.294 271.012 279.044 1.00 129.55 210 Bj 1 \nATOM 1277 S SG  . CYS Q 17 210 ? 155.139 269.674 277.842 1.00 129.55 210 Bj 1 \nATOM 1278 N N   . GLY Q 17 211 ? 156.076 271.687 282.100 1.00 136.75 211 Bj 1 \nATOM 1279 C CA  . GLY Q 17 211 ? 156.066 272.608 283.225 1.00 136.75 211 Bj 1 \nATOM 1280 C C   . GLY Q 17 211 ? 156.247 271.868 284.528 1.00 136.75 211 Bj 1 \nATOM 1281 O O   . GLY Q 17 211 ? 155.885 270.695 284.650 1.00 136.75 211 Bj 1 \nATOM 1282 N N   . HIS Q 17 212 ? 156.808 272.561 285.516 1.00 134.65 212 Bj 1 \nATOM 1283 C CA  . HIS Q 17 212 ? 157.023 272.000 286.842 1.00 134.65 212 Bj 1 \nATOM 1284 C C   . HIS Q 17 212 ? 156.523 272.973 287.897 1.00 134.65 212 Bj 1 \nATOM 1285 O O   . 
HIS Q 17 212 ? 156.786 274.177 287.812 1.00 134.65 212 Bj 1 \nATOM 1286 C CB  . HIS Q 17 212 ? 158.502 271.694 287.090 1.00 134.65 212 Bj 1 \nATOM 1287 C CG  . HIS Q 17 212 ? 158.933 270.348 286.601 1.00 134.65 212 Bj 1 \nATOM 1288 N ND1 . HIS Q 17 212 ? 159.905 269.605 287.236 1.00 134.65 212 Bj 1 \nATOM 1289 C CD2 . HIS Q 17 212 ? 158.530 269.612 285.539 1.00 134.65 212 Bj 1 \nATOM 1290 C CE1 . HIS Q 17 212 ? 160.079 268.468 286.587 1.00 134.65 212 Bj 1 \nATOM 1291 N NE2 . HIS Q 17 212 ? 159.258 268.447 285.553 1.00 134.65 212 Bj 1 \nATOM 1292 N N   . TYR Q 17 213 ? 155.805 272.454 288.892 1.00 135.25 213 Bj 1 \nATOM 1293 C CA  . TYR Q 17 213 ? 155.323 273.300 289.979 1.00 135.25 213 Bj 1 \nATOM 1294 C C   . TYR Q 17 213 ? 155.377 272.542 291.296 1.00 135.25 213 Bj 1 \nATOM 1295 O O   . TYR Q 17 213 ? 154.938 271.392 291.372 1.00 135.25 213 Bj 1 \nATOM 1296 C CB  . TYR Q 17 213 ? 153.896 273.793 289.707 1.00 135.25 213 Bj 1 \nATOM 1297 C CG  . TYR Q 17 213 ? 153.785 274.683 288.490 1.00 135.25 213 Bj 1 \nATOM 1298 C CD1 . TYR Q 17 213 ? 153.974 276.055 288.588 1.00 135.25 213 Bj 1 \nATOM 1299 C CD2 . TYR Q 17 213 ? 153.497 274.151 287.241 1.00 135.25 213 Bj 1 \nATOM 1300 C CE1 . TYR Q 17 213 ? 153.875 276.870 287.476 1.00 135.25 213 Bj 1 \nATOM 1301 C CE2 . TYR Q 17 213 ? 153.395 274.957 286.125 1.00 135.25 213 Bj 1 \nATOM 1302 C CZ  . TYR Q 17 213 ? 153.585 276.315 286.248 1.00 135.25 213 Bj 1 \nATOM 1303 O OH  . TYR Q 17 213 ? 153.485 277.120 285.137 1.00 135.25 213 Bj 1 \nATOM 1304 N N   . LYS Q 17 214 ? 155.902 273.189 292.333 1.00 138.67 214 Bj 1 \nATOM 1305 C CA  . LYS Q 17 214 ? 156.024 272.582 293.650 1.00 138.67 214 Bj 1 \nATOM 1306 C C   . LYS Q 17 214 ? 155.177 273.334 294.667 1.00 138.67 214 Bj 1 \nATOM 1307 O O   . LYS Q 17 214 ? 154.975 274.547 294.559 1.00 138.67 214 Bj 1 \nATOM 1308 C CB  . LYS Q 17 214 ? 157.483 272.554 294.123 1.00 138.67 214 Bj 1 \nATOM 1309 C CG  . LYS Q 17 214 ? 158.319 271.446 293.510 1.00 138.67 214 Bj 1 \nATOM 1310 C CD  . 
LYS Q 17 214 ? 159.715 271.422 294.112 1.00 138.67 214 Bj 1 \nATOM 1311 C CE  . LYS Q 17 214 ? 160.537 270.265 293.567 1.00 138.67 214 Bj 1 \nATOM 1312 N NZ  . LYS Q 17 214 ? 159.905 268.949 293.855 1.00 138.67 214 Bj 1 \nATOM 1313 N N   . PHE Q 17 215 ? 154.684 272.594 295.658 1.00 143.45 215 Bj 1 \nATOM 1314 C CA  . PHE Q 17 215 ? 153.944 273.179 296.769 1.00 143.45 215 Bj 1 \nATOM 1315 C C   . PHE Q 17 215 ? 154.171 272.332 298.012 1.00 143.45 215 Bj 1 \nATOM 1316 O O   . PHE Q 17 215 ? 154.077 271.103 297.954 1.00 143.45 215 Bj 1 \nATOM 1317 C CB  . PHE Q 17 215 ? 152.446 273.293 296.456 1.00 143.45 215 Bj 1 \nATOM 1318 C CG  . PHE Q 17 215 ? 151.816 272.015 295.975 1.00 143.45 215 Bj 1 \nATOM 1319 C CD1 . PHE Q 17 215 ? 151.873 271.659 294.637 1.00 143.45 215 Bj 1 \nATOM 1320 C CD2 . PHE Q 17 215 ? 151.143 271.185 296.855 1.00 143.45 215 Bj 1 \nATOM 1321 C CE1 . PHE Q 17 215 ? 151.287 270.489 294.190 1.00 143.45 215 Bj 1 \nATOM 1322 C CE2 . PHE Q 17 215 ? 150.553 270.015 296.414 1.00 143.45 215 Bj 1 \nATOM 1323 C CZ  . PHE Q 17 215 ? 150.626 269.667 295.079 1.00 143.45 215 Bj 1 \nATOM 1324 N N   . LYS Q 17 216 ? 154.477 272.988 299.126 1.00 149.62 216 Bj 1 \nATOM 1325 C CA  . LYS Q 17 216 ? 154.790 272.310 300.375 1.00 149.62 216 Bj 1 \nATOM 1326 C C   . LYS Q 17 216 ? 153.709 272.593 301.408 1.00 149.62 216 Bj 1 \nATOM 1327 O O   . LYS Q 17 216 ? 153.137 273.687 301.440 1.00 149.62 216 Bj 1 \nATOM 1328 C CB  . LYS Q 17 216 ? 156.158 272.749 300.906 1.00 149.62 216 Bj 1 \nATOM 1329 C CG  . LYS Q 17 216 ? 157.300 272.479 299.940 1.00 149.62 216 Bj 1 \nATOM 1330 C CD  . LYS Q 17 216 ? 158.639 272.904 300.519 1.00 149.62 216 Bj 1 \nATOM 1331 C CE  . LYS Q 17 216 ? 159.771 272.621 299.544 1.00 149.62 216 Bj 1 \nATOM 1332 N NZ  . LYS Q 17 216 ? 161.098 272.996 300.105 1.00 149.62 216 Bj 1 \nATOM 1333 N N   . PHE Q 17 217 ? 153.435 271.602 302.250 1.00 143.58 217 Bj 1 \nATOM 1334 C CA  . PHE Q 17 217 ? 152.407 271.732 303.275 1.00 143.58 217 Bj 1 \nATOM 1335 C C   . 
PHE Q 17 217 ? 153.018 272.091 304.624 1.00 143.58 217 Bj 1 \nATOM 1336 O O   . PHE Q 17 217 ? 152.899 271.339 305.590 1.00 143.58 217 Bj 1 \nATOM 1337 C CB  . PHE Q 17 217 ? 151.599 270.437 303.392 1.00 143.58 217 Bj 1 \nATOM 1338 C CG  . PHE Q 17 217 ? 150.831 270.087 302.150 1.00 143.58 217 Bj 1 \nATOM 1339 C CD1 . PHE Q 17 217 ? 150.463 271.069 301.245 1.00 143.58 217 Bj 1 \nATOM 1340 C CD2 . PHE Q 17 217 ? 150.477 268.774 301.886 1.00 143.58 217 Bj 1 \nATOM 1341 C CE1 . PHE Q 17 217 ? 149.756 270.748 300.101 1.00 143.58 217 Bj 1 \nATOM 1342 C CE2 . PHE Q 17 217 ? 149.771 268.447 300.744 1.00 143.58 217 Bj 1 \nATOM 1343 C CZ  . PHE Q 17 217 ? 149.410 269.435 299.851 1.00 143.58 217 Bj 1 \nATOM 1344 N N   . LEU Q 17 227 ? 157.135 268.148 304.312 1.00 125.05 227 Bj 1 \nATOM 1345 C CA  . LEU Q 17 227 ? 156.195 267.564 303.362 1.00 125.05 227 Bj 1 \nATOM 1346 C C   . LEU Q 17 227 ? 156.009 268.470 302.151 1.00 125.05 227 Bj 1 \nATOM 1347 O O   . LEU Q 17 227 ? 155.534 269.599 302.277 1.00 125.05 227 Bj 1 \nATOM 1348 C CB  . LEU Q 17 227 ? 154.846 267.299 304.034 1.00 125.05 227 Bj 1 \nATOM 1349 C CG  . LEU Q 17 227 ? 153.726 266.761 303.141 1.00 125.05 227 Bj 1 \nATOM 1350 C CD1 . LEU Q 17 227 ? 154.132 265.448 302.492 1.00 125.05 227 Bj 1 \nATOM 1351 C CD2 . LEU Q 17 227 ? 152.443 266.591 303.938 1.00 125.05 227 Bj 1 \nATOM 1352 N N   . GLY Q 17 228 ? 156.388 267.969 300.971 1.00 128.22 228 Bj 1 \nATOM 1353 C CA  . GLY Q 17 228 ? 156.244 268.718 299.745 1.00 128.22 228 Bj 1 \nATOM 1354 C C   . GLY Q 17 228 ? 155.646 267.856 298.647 1.00 128.22 228 Bj 1 \nATOM 1355 O O   . GLY Q 17 228 ? 155.531 266.635 298.775 1.00 128.22 228 Bj 1 \nATOM 1356 N N   . ALA Q 17 229 ? 155.272 268.518 297.555 1.00 135.59 229 Bj 1 \nATOM 1357 C CA  . ALA Q 17 229 ? 154.709 267.825 296.410 1.00 135.59 229 Bj 1 \nATOM 1358 C C   . ALA Q 17 229 ? 155.086 268.574 295.142 1.00 135.59 229 Bj 1 \nATOM 1359 O O   . ALA Q 17 229 ? 155.273 269.793 295.151 1.00 135.59 229 Bj 1 \nATOM 1360 C CB  . 
ALA Q 17 229 ? 153.186 267.691 296.522 1.00 135.59 229 Bj 1 \nATOM 1361 N N   . LYS Q 17 230 ? 155.195 267.821 294.052 1.00 134.09 230 Bj 1 \nATOM 1362 C CA  . LYS Q 17 230 ? 155.610 268.330 292.755 1.00 134.09 230 Bj 1 \nATOM 1363 C C   . LYS Q 17 230 ? 154.658 267.812 291.689 1.00 134.09 230 Bj 1 \nATOM 1364 O O   . LYS Q 17 230 ? 154.215 266.660 291.748 1.00 134.09 230 Bj 1 \nATOM 1365 C CB  . LYS Q 17 230 ? 157.044 267.900 292.437 1.00 134.09 230 Bj 1 \nATOM 1366 C CG  . LYS Q 17 230 ? 157.266 266.407 292.605 1.00 134.09 230 Bj 1 \nATOM 1367 C CD  . LYS Q 17 230 ? 158.738 266.053 292.685 1.00 134.09 230 Bj 1 \nATOM 1368 C CE  . LYS Q 17 230 ? 158.919 264.566 292.931 1.00 134.09 230 Bj 1 \nATOM 1369 N NZ  . LYS Q 17 230 ? 158.240 264.126 294.181 1.00 134.09 230 Bj 1 \nATOM 1370 N N   . VAL Q 17 231 ? 154.339 268.668 290.723 1.00 135.01 231 Bj 1 \nATOM 1371 C CA  . VAL Q 17 231 ? 153.447 268.325 289.624 1.00 135.01 231 Bj 1 \nATOM 1372 C C   . VAL Q 17 231 ? 154.143 268.676 288.317 1.00 135.01 231 Bj 1 \nATOM 1373 O O   . VAL Q 17 231 ? 154.717 269.766 288.179 1.00 135.01 231 Bj 1 \nATOM 1374 C CB  . VAL Q 17 231 ? 152.083 269.037 289.740 1.00 135.01 231 Bj 1 \nATOM 1375 C CG1 . VAL Q 17 231 ? 152.256 270.540 289.888 1.00 135.01 231 Bj 1 \nATOM 1376 C CG2 . VAL Q 17 231 ? 151.200 268.706 288.544 1.00 135.01 231 Bj 1 \nATOM 1377 N N   . PHE Q 17 232 ? 154.109 267.736 287.371 1.00 135.12 232 Bj 1 \nATOM 1378 C CA  . PHE Q 17 232 ? 154.776 267.856 286.079 1.00 135.12 232 Bj 1 \nATOM 1379 C C   . PHE Q 17 232 ? 153.708 267.897 284.994 1.00 135.12 232 Bj 1 \nATOM 1380 O O   . PHE Q 17 232 ? 152.998 266.910 284.777 1.00 135.12 232 Bj 1 \nATOM 1381 C CB  . PHE Q 17 232 ? 155.736 266.691 285.848 1.00 135.12 232 Bj 1 \nATOM 1382 C CG  . PHE Q 17 232 ? 156.600 266.370 287.032 1.00 135.12 232 Bj 1 \nATOM 1383 C CD1 . PHE Q 17 232 ? 157.175 267.378 287.786 1.00 135.12 232 Bj 1 \nATOM 1384 C CD2 . PHE Q 17 232 ? 156.831 265.055 287.394 1.00 135.12 232 Bj 1 \nATOM 1385 C CE1 . 
PHE Q 17 232 ? 157.968 267.079 288.875 1.00 135.12 232 Bj 1 \nATOM 1386 C CE2 . PHE Q 17 232 ? 157.623 264.749 288.481 1.00 135.12 232 Bj 1 \nATOM 1387 C CZ  . PHE Q 17 232 ? 158.192 265.763 289.223 1.00 135.12 232 Bj 1 \nATOM 1388 N N   . PHE Q 17 233 ? 153.597 269.034 284.318 1.00 138.91 233 Bj 1 \nATOM 1389 C CA  . PHE Q 17 233 ? 152.629 269.220 283.246 1.00 138.91 233 Bj 1 \nATOM 1390 C C   . PHE Q 17 233 ? 153.266 268.835 281.917 1.00 138.91 233 Bj 1 \nATOM 1391 O O   . PHE Q 17 233 ? 154.289 269.410 281.525 1.00 138.91 233 Bj 1 \nATOM 1392 C CB  . PHE Q 17 233 ? 152.141 270.667 283.211 1.00 138.91 233 Bj 1 \nATOM 1393 C CG  . PHE Q 17 233 ? 151.342 271.064 284.416 1.00 138.91 233 Bj 1 \nATOM 1394 C CD1 . PHE Q 17 233 ? 151.971 271.457 285.584 1.00 138.91 233 Bj 1 \nATOM 1395 C CD2 . PHE Q 17 233 ? 149.959 271.042 284.380 1.00 138.91 233 Bj 1 \nATOM 1396 C CE1 . PHE Q 17 233 ? 151.233 271.818 286.695 1.00 138.91 233 Bj 1 \nATOM 1397 C CE2 . PHE Q 17 233 ? 149.218 271.404 285.489 1.00 138.91 233 Bj 1 \nATOM 1398 C CZ  . PHE Q 17 233 ? 149.856 271.793 286.646 1.00 138.91 233 Bj 1 \nATOM 1399 N N   . PHE Q 17 234 ? 152.663 267.863 281.235 1.00 134.22 234 Bj 1 \nATOM 1400 C CA  . PHE Q 17 234 ? 153.088 267.418 279.917 1.00 134.22 234 Bj 1 \nATOM 1401 C C   . PHE Q 17 234 ? 152.037 267.799 278.884 1.00 134.22 234 Bj 1 \nATOM 1402 O O   . PHE Q 17 234 ? 150.840 267.584 279.098 1.00 134.22 234 Bj 1 \nATOM 1403 C CB  . PHE Q 17 234 ? 153.301 265.902 279.885 1.00 134.22 234 Bj 1 \nATOM 1404 C CG  . PHE Q 17 234 ? 154.564 265.447 280.554 1.00 134.22 234 Bj 1 \nATOM 1405 C CD1 . PHE Q 17 234 ? 154.684 265.473 281.933 1.00 134.22 234 Bj 1 \nATOM 1406 C CD2 . PHE Q 17 234 ? 155.625 264.972 279.802 1.00 134.22 234 Bj 1 \nATOM 1407 C CE1 . PHE Q 17 234 ? 155.845 265.047 282.547 1.00 134.22 234 Bj 1 \nATOM 1408 C CE2 . PHE Q 17 234 ? 156.786 264.542 280.410 1.00 134.22 234 Bj 1 \nATOM 1409 C CZ  . PHE Q 17 234 ? 156.896 264.580 281.784 1.00 134.22 234 Bj 1 \nATOM 1410 N N   . 
LYS Q 17 235 ? 152.488 268.350 277.760 1.00 127.98 235 Bj 1 \nATOM 1411 C CA  . LYS Q 17 235 ? 151.591 268.748 276.685 1.00 127.98 235 Bj 1 \nATOM 1412 C C   . LYS Q 17 235 ? 151.407 267.614 275.685 1.00 127.98 235 Bj 1 \nATOM 1413 O O   . LYS Q 17 235 ? 152.342 266.861 275.399 1.00 127.98 235 Bj 1 \nATOM 1414 C CB  . LYS Q 17 235 ? 152.120 269.988 275.962 1.00 127.98 235 Bj 1 \nATOM 1415 C CG  . LYS Q 17 235 ? 151.913 271.288 276.717 1.00 127.98 235 Bj 1 \nATOM 1416 C CD  . LYS Q 17 235 ? 152.321 272.477 275.865 1.00 127.98 235 Bj 1 \nATOM 1417 C CE  . LYS Q 17 235 ? 151.978 273.788 276.547 1.00 127.98 235 Bj 1 \nATOM 1418 N NZ  . LYS Q 17 235 ? 152.378 274.957 275.719 1.00 127.98 235 Bj 1 \nATOM 1419 N N   . ALA Q 17 236 ? 150.191 267.503 275.155 1.00 124.65 236 Bj 1 \nATOM 1420 C CA  . ALA Q 17 236 ? 149.871 266.534 274.120 1.00 124.65 236 Bj 1 \nATOM 1421 C C   . ALA Q 17 236 ? 148.912 267.176 273.129 1.00 124.65 236 Bj 1 \nATOM 1422 O O   . ALA Q 17 236 ? 148.201 268.130 273.453 1.00 124.65 236 Bj 1 \nATOM 1423 C CB  . ALA Q 17 236 ? 149.260 265.254 274.706 1.00 124.65 236 Bj 1 \nATOM 1424 N N   . LEU Q 17 237 ? 148.905 266.645 271.911 1.00 117.02 237 Bj 1 \nATOM 1425 C CA  . LEU Q 17 237 ? 148.078 267.159 270.829 1.00 117.02 237 Bj 1 \nATOM 1426 C C   . LEU Q 17 237 ? 146.925 266.201 270.561 1.00 117.02 237 Bj 1 \nATOM 1427 O O   . LEU Q 17 237 ? 147.072 264.984 270.709 1.00 117.02 237 Bj 1 \nATOM 1428 C CB  . LEU Q 17 237 ? 148.906 267.358 269.556 1.00 117.02 237 Bj 1 \nATOM 1429 C CG  . LEU Q 17 237 ? 148.232 268.081 268.388 1.00 117.02 237 Bj 1 \nATOM 1430 C CD1 . LEU Q 17 237 ? 147.874 269.508 268.773 1.00 117.02 237 Bj 1 \nATOM 1431 C CD2 . LEU Q 17 237 ? 149.124 268.062 267.157 1.00 117.02 237 Bj 1 \nATOM 1432 N N   . LEU Q 17 238 ? 145.780 266.752 270.167 1.00 111.74 238 Bj 1 \nATOM 1433 C CA  . LEU Q 17 238 ? 144.598 265.953 269.875 1.00 111.74 238 Bj 1 \nATOM 1434 C C   . LEU Q 17 238 ? 144.550 265.637 268.385 1.00 111.74 238 Bj 1 \nATOM 1435 O O   . 
LEU Q 17 238 ? 144.436 266.545 267.555 1.00 111.74 238 Bj 1 \nATOM 1436 C CB  . LEU Q 17 238 ? 143.330 266.688 270.308 1.00 111.74 238 Bj 1 \nATOM 1437 C CG  . LEU Q 17 238 ? 142.006 266.022 269.930 1.00 111.74 238 Bj 1 \nATOM 1438 C CD1 . LEU Q 17 238 ? 141.964 264.588 270.427 1.00 111.74 238 Bj 1 \nATOM 1439 C CD2 . LEU Q 17 238 ? 140.831 266.812 270.482 1.00 111.74 238 Bj 1 \nATOM 1440 N N   . LEU Q 17 239 ? 144.634 264.350 268.050 1.00 112.02 239 Bj 1 \nATOM 1441 C CA  . LEU Q 17 239 ? 144.528 263.909 266.665 1.00 112.02 239 Bj 1 \nATOM 1442 C C   . LEU Q 17 239 ? 143.084 263.603 266.282 1.00 112.02 239 Bj 1 \nATOM 1443 O O   . LEU Q 17 239 ? 142.601 264.068 265.245 1.00 112.02 239 Bj 1 \nATOM 1444 C CB  . LEU Q 17 239 ? 145.409 262.678 266.433 1.00 112.02 239 Bj 1 \nATOM 1445 C CG  . LEU Q 17 239 ? 146.918 262.867 266.591 1.00 112.02 239 Bj 1 \nATOM 1446 C CD1 . LEU Q 17 239 ? 147.642 261.536 266.459 1.00 112.02 239 Bj 1 \nATOM 1447 C CD2 . LEU Q 17 239 ? 147.442 263.866 265.571 1.00 112.02 239 Bj 1 \nATOM 1448 N N   . THR Q 17 240 ? 142.387 262.825 267.107 1.00 112.72 240 Bj 1 \nATOM 1449 C CA  . THR Q 17 240 ? 140.988 262.492 266.862 1.00 112.72 240 Bj 1 \nATOM 1450 C C   . THR Q 17 240 ? 140.284 262.360 268.201 1.00 112.72 240 Bj 1 \nATOM 1451 O O   . THR Q 17 240 ? 140.656 261.510 269.017 1.00 112.72 240 Bj 1 \nATOM 1452 C CB  . THR Q 17 240 ? 140.855 261.198 266.056 1.00 112.72 240 Bj 1 \nATOM 1453 O OG1 . THR Q 17 240 ? 141.478 261.363 264.776 1.00 112.72 240 Bj 1 \nATOM 1454 C CG2 . THR Q 17 240 ? 139.389 260.842 265.860 1.00 112.72 240 Bj 1 \nATOM 1455 N N   . GLY Q 17 241 ? 139.281 263.204 268.427 1.00 112.39 241 Bj 1 \nATOM 1456 C CA  . GLY Q 17 241 ? 138.518 263.163 269.658 1.00 112.39 241 Bj 1 \nATOM 1457 C C   . GLY Q 17 241 ? 137.166 262.503 269.490 1.00 112.39 241 Bj 1 \nATOM 1458 O O   . GLY Q 17 241 ? 136.235 263.106 268.948 1.00 112.39 241 Bj 1 \nATOM 1459 N N   . ASP Q 17 242 ? 137.047 261.262 269.950 1.00 120.39 242 Bj 1 \nATOM 1460 C CA  . 
ASP Q 17 242 ? 135.806 260.495 269.875 1.00 120.39 242 Bj 1 \nATOM 1461 C C   . ASP Q 17 242 ? 135.359 260.229 271.309 1.00 120.39 242 Bj 1 \nATOM 1462 O O   . ASP Q 17 242 ? 135.683 259.189 271.887 1.00 120.39 242 Bj 1 \nATOM 1463 C CB  . ASP Q 17 242 ? 136.006 259.200 269.088 1.00 120.39 242 Bj 1 \nATOM 1464 C CG  . ASP Q 17 242 ? 134.704 258.479 268.811 1.00 120.39 242 Bj 1 \nATOM 1465 O OD1 . ASP Q 17 242 ? 133.900 258.990 268.004 1.00 120.39 242 Bj 1 \nATOM 1466 O OD2 . ASP Q 17 242 ? 134.484 257.400 269.399 1.00 120.39 242 Bj 1 \nATOM 1467 N N   . PHE Q 17 243 ? 134.612 261.172 271.876 1.00 125.10 243 Bj 1 \nATOM 1468 C CA  . PHE Q 17 243 ? 134.205 261.109 273.274 1.00 125.10 243 Bj 1 \nATOM 1469 C C   . PHE Q 17 243 ? 132.791 260.548 273.376 1.00 125.10 243 Bj 1 \nATOM 1470 O O   . PHE Q 17 243 ? 131.858 261.086 272.771 1.00 125.10 243 Bj 1 \nATOM 1471 C CB  . PHE Q 17 243 ? 134.284 262.493 273.916 1.00 125.10 243 Bj 1 \nATOM 1472 C CG  . PHE Q 17 243 ? 133.967 262.500 275.384 1.00 125.10 243 Bj 1 \nATOM 1473 C CD1 . PHE Q 17 243 ? 134.948 262.216 276.319 1.00 125.10 243 Bj 1 \nATOM 1474 C CD2 . PHE Q 17 243 ? 132.690 262.797 275.830 1.00 125.10 243 Bj 1 \nATOM 1475 C CE1 . PHE Q 17 243 ? 134.661 262.224 277.670 1.00 125.10 243 Bj 1 \nATOM 1476 C CE2 . PHE Q 17 243 ? 132.398 262.805 277.179 1.00 125.10 243 Bj 1 \nATOM 1477 C CZ  . PHE Q 17 243 ? 133.384 262.518 278.100 1.00 125.10 243 Bj 1 \nATOM 1478 N N   . SER Q 17 244 ? 132.637 259.471 274.141 1.00 130.58 244 Bj 1 \nATOM 1479 C CA  . SER Q 17 244 ? 131.334 258.873 274.383 1.00 130.58 244 Bj 1 \nATOM 1480 C C   . SER Q 17 244 ? 130.729 259.423 275.668 1.00 130.58 244 Bj 1 \nATOM 1481 O O   . SER Q 17 244 ? 131.444 259.824 276.591 1.00 130.58 244 Bj 1 \nATOM 1482 C CB  . SER Q 17 244 ? 131.443 257.349 274.467 1.00 130.58 244 Bj 1 \nATOM 1483 O OG  . SER Q 17 244 ? 130.182 256.759 274.733 1.00 130.58 244 Bj 1 \nATOM 1484 N N   . GLN Q 17 245 ? 129.395 259.434 275.717 1.00 128.80 245 Bj 1 \nATOM 1485 C CA  . 
GLN Q 17 245 ? 128.640 259.945 276.861 1.00 128.80 245 Bj 1 \nATOM 1486 C C   . GLN Q 17 245 ? 129.024 261.398 277.157 1.00 128.80 245 Bj 1 \nATOM 1487 O O   . GLN Q 17 245 ? 129.573 261.730 278.209 1.00 128.80 245 Bj 1 \nATOM 1488 C CB  . GLN Q 17 245 ? 128.834 259.050 278.092 1.00 128.80 245 Bj 1 \nATOM 1489 C CG  . GLN Q 17 245 ? 127.890 259.349 279.253 1.00 128.80 245 Bj 1 \nATOM 1490 C CD  . GLN Q 17 245 ? 126.435 259.074 278.920 1.00 128.80 245 Bj 1 \nATOM 1491 O OE1 . GLN Q 17 245 ? 126.126 258.253 278.055 1.00 128.80 245 Bj 1 \nATOM 1492 N NE2 . GLN Q 17 245 ? 125.531 259.762 279.608 1.00 128.80 245 Bj 1 \nATOM 1493 N N   . ALA Q 17 246 ? 128.731 262.266 276.186 1.00 127.68 246 Bj 1 \nATOM 1494 C CA  . ALA Q 17 246 ? 129.038 263.683 276.337 1.00 127.68 246 Bj 1 \nATOM 1495 C C   . ALA Q 17 246 ? 128.140 264.366 277.359 1.00 127.68 246 Bj 1 \nATOM 1496 O O   . ALA Q 17 246 ? 128.472 265.463 277.821 1.00 127.68 246 Bj 1 \nATOM 1497 C CB  . ALA Q 17 246 ? 128.926 264.394 274.987 1.00 127.68 246 Bj 1 \nATOM 1498 N N   . GLY Q 17 247 ? 127.018 263.748 277.720 1.00 128.61 247 Bj 1 \nATOM 1499 C CA  . GLY Q 17 247 ? 126.115 264.325 278.695 1.00 128.61 247 Bj 1 \nATOM 1500 C C   . GLY Q 17 247 ? 126.252 263.710 280.072 1.00 128.61 247 Bj 1 \nATOM 1501 O O   . GLY Q 17 247 ? 125.267 263.595 280.808 1.00 128.61 247 Bj 1 \nATOM 1502 N N   . LYS Q 17 248 ? 127.468 263.311 280.433 1.00 125.96 248 Bj 1 \nATOM 1503 C CA  . LYS Q 17 248 ? 127.713 262.724 281.739 1.00 125.96 248 Bj 1 \nATOM 1504 C C   . LYS Q 17 248 ? 127.891 263.817 282.791 1.00 125.96 248 Bj 1 \nATOM 1505 O O   . LYS Q 17 248 ? 127.941 265.012 282.488 1.00 125.96 248 Bj 1 \nATOM 1506 C CB  . LYS Q 17 248 ? 128.946 261.822 281.702 1.00 125.96 248 Bj 1 \nATOM 1507 C CG  . LYS Q 17 248 ? 130.258 262.572 281.540 1.00 125.96 248 Bj 1 \nATOM 1508 C CD  . LYS Q 17 248 ? 131.448 261.630 281.626 1.00 125.96 248 Bj 1 \nATOM 1509 C CE  . LYS Q 17 248 ? 132.761 262.393 281.596 1.00 125.96 248 Bj 1 \nATOM 1510 N NZ  . 
LYS Q 17 248 ? 133.934 261.479 281.668 1.00 125.96 248 Bj 1 \nATOM 1511 N N   . LYS Q 17 249 ? 127.991 263.389 284.050 1.00 120.94 249 Bj 1 \nATOM 1512 C CA  . LYS Q 17 249 ? 128.204 264.319 285.150 1.00 120.94 249 Bj 1 \nATOM 1513 C C   . LYS Q 17 249 ? 129.630 264.849 285.213 1.00 120.94 249 Bj 1 \nATOM 1514 O O   . LYS Q 17 249 ? 129.879 265.823 285.932 1.00 120.94 249 Bj 1 \nATOM 1515 C CB  . LYS Q 17 249 ? 127.843 263.653 286.481 1.00 120.94 249 Bj 1 \nATOM 1516 C CG  . LYS Q 17 249 ? 126.360 263.355 286.649 1.00 120.94 249 Bj 1 \nATOM 1517 C CD  . LYS Q 17 249 ? 125.530 264.631 286.660 1.00 120.94 249 Bj 1 \nATOM 1518 C CE  . LYS Q 17 249 ? 124.617 264.713 285.447 1.00 120.94 249 Bj 1 \nATOM 1519 N NZ  . LYS Q 17 249 ? 123.811 265.964 285.445 1.00 120.94 249 Bj 1 \nATOM 1520 N N   . GLY Q 17 250 ? 130.565 264.239 284.488 1.00 123.18 250 Bj 1 \nATOM 1521 C CA  . GLY Q 17 250 ? 131.923 264.742 284.431 1.00 123.18 250 Bj 1 \nATOM 1522 C C   . GLY Q 17 250 ? 132.013 266.047 283.669 1.00 123.18 250 Bj 1 \nATOM 1523 O O   . GLY Q 17 250 ? 131.833 266.074 282.448 1.00 123.18 250 Bj 1 \nATOM 1524 N N   . HIS Q 17 251 ? 132.289 267.138 284.379 1.00 125.29 251 Bj 1 \nATOM 1525 C CA  . HIS Q 17 251 ? 132.322 268.470 283.778 1.00 125.29 251 Bj 1 \nATOM 1526 C C   . HIS Q 17 251 ? 133.687 268.686 283.137 1.00 125.29 251 Bj 1 \nATOM 1527 O O   . HIS Q 17 251 ? 134.647 269.104 283.786 1.00 125.29 251 Bj 1 \nATOM 1528 C CB  . HIS Q 17 251 ? 132.019 269.538 284.821 1.00 125.29 251 Bj 1 \nATOM 1529 C CG  . HIS Q 17 251 ? 130.737 269.315 285.560 1.00 125.29 251 Bj 1 \nATOM 1530 N ND1 . HIS Q 17 251 ? 129.511 269.688 285.053 1.00 125.29 251 Bj 1 \nATOM 1531 C CD2 . HIS Q 17 251 ? 130.489 268.757 286.769 1.00 125.29 251 Bj 1 \nATOM 1532 C CE1 . HIS Q 17 251 ? 128.563 269.370 285.917 1.00 125.29 251 Bj 1 \nATOM 1533 N NE2 . HIS Q 17 251 ? 129.131 268.803 286.966 1.00 125.29 251 Bj 1 \nATOM 1534 N N   . HIS Q 17 252 ? 133.771 268.392 281.842 1.00 117.65 252 Bj 1 \nATOM 1535 C CA  . 
HIS Q 17 252 ? 134.965 268.633 281.044 1.00 117.65 252 Bj 1 \nATOM 1536 C C   . HIS Q 17 252 ? 134.674 269.751 280.053 1.00 117.65 252 Bj 1 \nATOM 1537 O O   . HIS Q 17 252 ? 133.661 269.713 279.348 1.00 117.65 252 Bj 1 \nATOM 1538 C CB  . HIS Q 17 252 ? 135.405 267.363 280.309 1.00 117.65 252 Bj 1 \nATOM 1539 C CG  . HIS Q 17 252 ? 134.422 266.883 279.289 1.00 117.65 252 Bj 1 \nATOM 1540 N ND1 . HIS Q 17 252 ? 133.315 266.131 279.617 1.00 117.65 252 Bj 1 \nATOM 1541 C CD2 . HIS Q 17 252 ? 134.377 267.051 277.946 1.00 117.65 252 Bj 1 \nATOM 1542 C CE1 . HIS Q 17 252 ? 132.631 265.856 278.521 1.00 117.65 252 Bj 1 \nATOM 1543 N NE2 . HIS Q 17 252 ? 133.254 266.403 277.493 1.00 117.65 252 Bj 1 \nATOM 1544 N N   . VAL Q 17 253 ? 135.556 270.746 280.008 1.00 119.25 253 Bj 1 \nATOM 1545 C CA  . VAL Q 17 253 ? 135.344 271.959 279.228 1.00 119.25 253 Bj 1 \nATOM 1546 C C   . VAL Q 17 253 ? 136.541 272.173 278.314 1.00 119.25 253 Bj 1 \nATOM 1547 O O   . VAL Q 17 253 ? 137.691 272.100 278.762 1.00 119.25 253 Bj 1 \nATOM 1548 C CB  . VAL Q 17 253 ? 135.137 273.190 280.131 1.00 119.25 253 Bj 1 \nATOM 1549 C CG1 . VAL Q 17 253 ? 134.861 274.428 279.291 1.00 119.25 253 Bj 1 \nATOM 1550 C CG2 . VAL Q 17 253 ? 134.007 272.948 281.121 1.00 119.25 253 Bj 1 \nATOM 1551 N N   . TRP Q 17 254 ? 136.269 272.431 277.036 1.00 115.00 254 Bj 1 \nATOM 1552 C CA  . TRP Q 17 254 ? 137.283 272.897 276.101 1.00 115.00 254 Bj 1 \nATOM 1553 C C   . TRP Q 17 254 ? 137.325 274.418 276.147 1.00 115.00 254 Bj 1 \nATOM 1554 O O   . TRP Q 17 254 ? 136.330 275.082 275.836 1.00 115.00 254 Bj 1 \nATOM 1555 C CB  . TRP Q 17 254 ? 136.987 272.415 274.681 1.00 115.00 254 Bj 1 \nATOM 1556 C CG  . TRP Q 17 254 ? 136.967 270.928 274.547 1.00 115.00 254 Bj 1 \nATOM 1557 C CD1 . TRP Q 17 254 ? 135.876 270.139 274.334 1.00 115.00 254 Bj 1 \nATOM 1558 C CD2 . TRP Q 17 254 ? 138.092 270.046 274.625 1.00 115.00 254 Bj 1 \nATOM 1559 N NE1 . TRP Q 17 254 ? 136.251 268.819 274.269 1.00 115.00 254 Bj 1 \nATOM 1560 C CE2 . 
TRP Q 17 254 ? 137.607 268.735 274.446 1.00 115.00 254 Bj 1 \nATOM 1561 C CE3 . TRP Q 17 254 ? 139.461 270.236 274.827 1.00 115.00 254 Bj 1 \nATOM 1562 C CZ2 . TRP Q 17 254 ? 138.443 267.622 274.463 1.00 115.00 254 Bj 1 \nATOM 1563 C CZ3 . TRP Q 17 254 ? 140.289 269.130 274.842 1.00 115.00 254 Bj 1 \nATOM 1564 C CH2 . TRP Q 17 254 ? 139.778 267.840 274.662 1.00 115.00 254 Bj 1 \nATOM 1565 N N   . VAL Q 17 255 ? 138.473 274.965 276.535 1.00 119.35 255 Bj 1 \nATOM 1566 C CA  . VAL Q 17 255 ? 138.586 276.379 276.870 1.00 119.35 255 Bj 1 \nATOM 1567 C C   . VAL Q 17 255 ? 139.797 276.969 276.160 1.00 119.35 255 Bj 1 \nATOM 1568 O O   . VAL Q 17 255 ? 140.791 276.276 275.919 1.00 119.35 255 Bj 1 \nATOM 1569 C CB  . VAL Q 17 255 ? 138.678 276.575 278.400 1.00 119.35 255 Bj 1 \nATOM 1570 C CG1 . VAL Q 17 255 ? 139.988 276.026 278.940 1.00 119.35 255 Bj 1 \nATOM 1571 C CG2 . VAL Q 17 255 ? 138.506 278.030 278.766 1.00 119.35 255 Bj 1 \nATOM 1572 N N   . SER Q 17 256 ? 139.702 278.248 275.804 1.00 122.61 256 Bj 1 \nATOM 1573 C CA  . SER Q 17 256 ? 140.792 278.967 275.164 1.00 122.61 256 Bj 1 \nATOM 1574 C C   . SER Q 17 256 ? 141.580 279.743 276.219 1.00 122.61 256 Bj 1 \nATOM 1575 O O   . SER Q 17 256 ? 141.375 279.576 277.423 1.00 122.61 256 Bj 1 \nATOM 1576 C CB  . SER Q 17 256 ? 140.249 279.877 274.066 1.00 122.61 256 Bj 1 \nATOM 1577 O OG  . SER Q 17 256 ? 141.298 280.548 273.390 1.00 122.61 256 Bj 1 \nATOM 1578 N N   . LYS Q 17 257 ? 142.489 280.613 275.772 1.00 127.00 257 Bj 1 \nATOM 1579 C CA  . LYS Q 17 257 ? 143.375 281.318 276.695 1.00 127.00 257 Bj 1 \nATOM 1580 C C   . LYS Q 17 257 ? 142.610 282.285 277.595 1.00 127.00 257 Bj 1 \nATOM 1581 O O   . LYS Q 17 257 ? 142.840 282.324 278.811 1.00 127.00 257 Bj 1 \nATOM 1582 C CB  . LYS Q 17 257 ? 144.455 282.054 275.899 1.00 127.00 257 Bj 1 \nATOM 1583 C CG  . LYS Q 17 257 ? 144.923 283.367 276.506 1.00 127.00 257 Bj 1 \nATOM 1584 C CD  . LYS Q 17 257 ? 146.041 283.168 277.511 1.00 127.00 257 Bj 1 \nATOM 1585 C CE  . 
LYS Q 17 257 ? 146.569 284.511 277.993 1.00 127.00 257 Bj 1 \nATOM 1586 N NZ  . LYS Q 17 257 ? 147.753 284.372 278.882 1.00 127.00 257 Bj 1 \nATOM 1587 N N   . GLU Q 17 258 ? 141.695 283.069 277.021 1.00 126.69 258 Bj 1 \nATOM 1588 C CA  . GLU Q 17 258 ? 141.007 284.103 277.788 1.00 126.69 258 Bj 1 \nATOM 1589 C C   . GLU Q 17 258 ? 140.134 283.494 278.880 1.00 126.69 258 Bj 1 \nATOM 1590 O O   . GLU Q 17 258 ? 140.313 283.776 280.071 1.00 126.69 258 Bj 1 \nATOM 1591 C CB  . GLU Q 17 258 ? 140.173 284.979 276.851 1.00 126.69 258 Bj 1 \nATOM 1592 C CG  . GLU Q 17 258 ? 140.982 285.777 275.834 1.00 126.69 258 Bj 1 \nATOM 1593 C CD  . GLU Q 17 258 ? 141.362 284.971 274.602 1.00 126.69 258 Bj 1 \nATOM 1594 O OE1 . GLU Q 17 258 ? 141.635 283.760 274.732 1.00 126.69 258 Bj 1 \nATOM 1595 O OE2 . GLU Q 17 258 ? 141.381 285.553 273.498 1.00 126.69 258 Bj 1 \nATOM 1596 N N   . GLU Q 17 259 ? 139.174 282.652 278.490 1.00 129.80 259 Bj 1 \nATOM 1597 C CA  . GLU Q 17 259 ? 138.332 281.997 279.482 1.00 129.80 259 Bj 1 \nATOM 1598 C C   . GLU Q 17 259 ? 139.126 281.043 280.365 1.00 129.80 259 Bj 1 \nATOM 1599 O O   . GLU Q 17 259 ? 138.712 280.779 281.498 1.00 129.80 259 Bj 1 \nATOM 1600 C CB  . GLU Q 17 259 ? 137.179 281.259 278.797 1.00 129.80 259 Bj 1 \nATOM 1601 C CG  . GLU Q 17 259 ? 136.278 282.148 277.950 1.00 129.80 259 Bj 1 \nATOM 1602 C CD  . GLU Q 17 259 ? 136.700 282.197 276.494 1.00 129.80 259 Bj 1 \nATOM 1603 O OE1 . GLU Q 17 259 ? 137.140 281.154 275.965 1.00 129.80 259 Bj 1 \nATOM 1604 O OE2 . GLU Q 17 259 ? 136.592 283.278 275.878 1.00 129.80 259 Bj 1 \nATOM 1605 N N   . LEU Q 17 260 ? 140.270 280.549 279.888 1.00 130.83 260 Bj 1 \nATOM 1606 C CA  . LEU Q 17 260 ? 141.148 279.742 280.729 1.00 130.83 260 Bj 1 \nATOM 1607 C C   . LEU Q 17 260 ? 141.669 280.562 281.901 1.00 130.83 260 Bj 1 \nATOM 1608 O O   . LEU Q 17 260 ? 141.580 280.142 283.062 1.00 130.83 260 Bj 1 \nATOM 1609 C CB  . LEU Q 17 260 ? 142.301 279.197 279.882 1.00 130.83 260 Bj 1 \nATOM 1610 C CG  . 
LEU Q 17 260 ? 143.280 278.143 280.407 1.00 130.83 260 Bj 1 \nATOM 1611 C CD1 . LEU Q 17 260 ? 143.986 277.497 279.232 1.00 130.83 260 Bj 1 \nATOM 1612 C CD2 . LEU Q 17 260 ? 144.307 278.740 281.346 1.00 130.83 260 Bj 1 \nATOM 1613 N N   . GLY Q 17 261 ? 142.232 281.735 281.610 1.00 132.72 261 Bj 1 \nATOM 1614 C CA  . GLY Q 17 261 ? 142.661 282.625 282.674 1.00 132.72 261 Bj 1 \nATOM 1615 C C   . GLY Q 17 261 ? 141.510 283.111 283.530 1.00 132.72 261 Bj 1 \nATOM 1616 O O   . GLY Q 17 261 ? 141.689 283.389 284.720 1.00 132.72 261 Bj 1 \nATOM 1617 N N   . ASP Q 17 262 ? 140.317 283.220 282.943 1.00 135.25 262 Bj 1 \nATOM 1618 C CA  . ASP Q 17 262 ? 139.148 283.630 283.717 1.00 135.25 262 Bj 1 \nATOM 1619 C C   . ASP Q 17 262 ? 138.742 282.558 284.722 1.00 135.25 262 Bj 1 \nATOM 1620 O O   . ASP Q 17 262 ? 138.354 282.874 285.853 1.00 135.25 262 Bj 1 \nATOM 1621 C CB  . ASP Q 17 262 ? 137.986 283.951 282.778 1.00 135.25 262 Bj 1 \nATOM 1622 C CG  . ASP Q 17 262 ? 136.680 284.169 283.519 1.00 135.25 262 Bj 1 \nATOM 1623 O OD1 . ASP Q 17 262 ? 136.568 285.178 284.246 1.00 135.25 262 Bj 1 \nATOM 1624 O OD2 . ASP Q 17 262 ? 135.764 283.332 283.373 1.00 135.25 262 Bj 1 \nATOM 1625 N N   . TYR Q 17 263 ? 138.823 281.286 284.330 1.00 135.63 263 Bj 1 \nATOM 1626 C CA  . TYR Q 17 263 ? 138.387 280.204 285.207 1.00 135.63 263 Bj 1 \nATOM 1627 C C   . TYR Q 17 263 ? 139.450 279.853 286.242 1.00 135.63 263 Bj 1 \nATOM 1628 O O   . TYR Q 17 263 ? 139.148 279.738 287.435 1.00 135.63 263 Bj 1 \nATOM 1629 C CB  . TYR Q 17 263 ? 138.020 278.968 284.383 1.00 135.63 263 Bj 1 \nATOM 1630 C CG  . TYR Q 17 263 ? 136.748 279.113 283.580 1.00 135.63 263 Bj 1 \nATOM 1631 C CD1 . TYR Q 17 263 ? 136.444 278.220 282.560 1.00 135.63 263 Bj 1 \nATOM 1632 C CD2 . TYR Q 17 263 ? 135.849 280.139 283.842 1.00 135.63 263 Bj 1 \nATOM 1633 C CE1 . TYR Q 17 263 ? 135.282 278.346 281.823 1.00 135.63 263 Bj 1 \nATOM 1634 C CE2 . TYR Q 17 263 ? 134.685 280.272 283.109 1.00 135.63 263 Bj 1 \nATOM 1635 C CZ  . 
TYR Q 17 263 ? 134.407 279.373 282.101 1.00 135.63 263 Bj 1 \nATOM 1636 O OH  . TYR Q 17 263 ? 133.250 279.500 281.367 1.00 135.63 263 Bj 1 \nATOM 1637 N N   . LEU Q 17 264 ? 140.698 279.676 285.808 1.00 134.80 264 Bj 1 \nATOM 1638 C CA  . LEU Q 17 264 ? 141.750 279.206 286.706 1.00 134.80 264 Bj 1 \nATOM 1639 C C   . LEU Q 17 264 ? 142.092 280.291 287.720 1.00 134.80 264 Bj 1 \nATOM 1640 O O   . LEU Q 17 264 ? 142.757 281.278 287.390 1.00 134.80 264 Bj 1 \nATOM 1641 C CB  . LEU Q 17 264 ? 142.981 278.790 285.908 1.00 134.80 264 Bj 1 \nATOM 1642 C CG  . LEU Q 17 264 ? 142.804 277.524 285.068 1.00 134.80 264 Bj 1 \nATOM 1643 C CD1 . LEU Q 17 264 ? 144.129 277.063 284.492 1.00 134.80 264 Bj 1 \nATOM 1644 C CD2 . LEU Q 17 264 ? 142.169 276.422 285.898 1.00 134.80 264 Bj 1 \nATOM 1645 N N   . LYS Q 17 265 ? 141.633 280.107 288.955 1.00 137.65 265 Bj 1 \nATOM 1646 C CA  . LYS Q 17 265 ? 141.877 281.041 290.049 1.00 137.65 265 Bj 1 \nATOM 1647 C C   . LYS Q 17 265 ? 143.260 280.904 290.689 1.00 137.65 265 Bj 1 \nATOM 1648 O O   . LYS Q 17 265 ? 143.947 281.921 290.850 1.00 137.65 265 Bj 1 \nATOM 1649 C CB  . LYS Q 17 265 ? 140.794 280.889 291.122 1.00 137.65 265 Bj 1 \nATOM 1650 C CG  . LYS Q 17 265 ? 140.067 279.555 291.107 1.00 137.65 265 Bj 1 \nATOM 1651 C CD  . LYS Q 17 265 ? 139.195 279.392 292.339 1.00 137.65 265 Bj 1 \nATOM 1652 C CE  . LYS Q 17 265 ? 140.022 279.484 293.612 1.00 137.65 265 Bj 1 \nATOM 1653 N NZ  . LYS Q 17 265 ? 141.088 278.445 293.660 1.00 137.65 265 Bj 1 \nATOM 1654 N N   . PRO Q 17 266 ? 143.720 279.709 291.071 1.00 140.01 266 Bj 1 \nATOM 1655 C CA  . PRO Q 17 266 ? 144.940 279.634 291.881 1.00 140.01 266 Bj 1 \nATOM 1656 C C   . PRO Q 17 266 ? 146.183 279.907 291.050 1.00 140.01 266 Bj 1 \nATOM 1657 O O   . PRO Q 17 266 ? 146.185 279.801 289.822 1.00 140.01 266 Bj 1 \nATOM 1658 C CB  . PRO Q 17 266 ? 144.937 278.195 292.416 1.00 140.01 266 Bj 1 \nATOM 1659 C CG  . PRO Q 17 266 ? 143.732 277.520 291.808 1.00 140.01 266 Bj 1 \nATOM 1660 C CD  . 
PRO Q 17 266 ? 143.299 278.360 290.659 1.00 140.01 266 Bj 1 \nATOM 1661 N N   . LYS Q 17 267 ? 147.260 280.264 291.753 1.00 148.42 267 Bj 1 \nATOM 1662 C CA  . LYS Q 17 267 ? 148.508 280.602 291.080 1.00 148.42 267 Bj 1 \nATOM 1663 C C   . LYS Q 17 267 ? 149.209 279.379 290.506 1.00 148.42 267 Bj 1 \nATOM 1664 O O   . LYS Q 17 267 ? 150.039 279.526 289.603 1.00 148.42 267 Bj 1 \nATOM 1665 C CB  . LYS Q 17 267 ? 149.447 281.333 292.041 1.00 148.42 267 Bj 1 \nATOM 1666 C CG  . LYS Q 17 267 ? 149.947 280.481 293.195 1.00 148.42 267 Bj 1 \nATOM 1667 C CD  . LYS Q 17 267 ? 150.971 281.233 294.030 1.00 148.42 267 Bj 1 \nATOM 1668 C CE  . LYS Q 17 267 ? 151.539 280.354 295.132 1.00 148.42 267 Bj 1 \nATOM 1669 N NZ  . LYS Q 17 267 ? 152.570 281.070 295.935 1.00 148.42 267 Bj 1 \nATOM 1670 N N   . TYR Q 17 268 ? 148.900 278.181 291.005 1.00 155.87 268 Bj 1 \nATOM 1671 C CA  . TYR Q 17 268 ? 149.550 276.982 290.487 1.00 155.87 268 Bj 1 \nATOM 1672 C C   . TYR Q 17 268 ? 149.064 276.652 289.082 1.00 155.87 268 Bj 1 \nATOM 1673 O O   . TYR Q 17 268 ? 149.833 276.147 288.255 1.00 155.87 268 Bj 1 \nATOM 1674 C CB  . TYR Q 17 268 ? 149.315 275.807 291.434 1.00 155.87 268 Bj 1 \nATOM 1675 C CG  . TYR Q 17 268 ? 149.991 275.984 292.771 1.00 155.87 268 Bj 1 \nATOM 1676 C CD1 . TYR Q 17 268 ? 151.334 275.678 292.934 1.00 155.87 268 Bj 1 \nATOM 1677 C CD2 . TYR Q 17 268 ? 149.290 276.466 293.867 1.00 155.87 268 Bj 1 \nATOM 1678 C CE1 . TYR Q 17 268 ? 151.960 275.843 294.150 1.00 155.87 268 Bj 1 \nATOM 1679 C CE2 . TYR Q 17 268 ? 149.907 276.633 295.090 1.00 155.87 268 Bj 1 \nATOM 1680 C CZ  . TYR Q 17 268 ? 151.242 276.319 295.225 1.00 155.87 268 Bj 1 \nATOM 1681 O OH  . TYR Q 17 268 ? 151.863 276.483 296.440 1.00 155.87 268 Bj 1 \nATOM 1682 N N   . LEU Q 17 269 ? 147.796 276.926 288.793 1.00 143.98 269 Bj 1 \nATOM 1683 C CA  . LEU Q 17 269 ? 147.256 276.720 287.458 1.00 143.98 269 Bj 1 \nATOM 1684 C C   . LEU Q 17 269 ? 147.228 277.995 286.627 1.00 143.98 269 Bj 1 \nATOM 1685 O O   . 
LEU Q 17 269 ? 147.115 277.912 285.399 1.00 143.98 269 Bj 1 \nATOM 1686 C CB  . LEU Q 17 269 ? 145.845 276.130 287.545 1.00 143.98 269 Bj 1 \nATOM 1687 C CG  . LEU Q 17 269 ? 145.752 274.727 288.149 1.00 143.98 269 Bj 1 \nATOM 1688 C CD1 . LEU Q 17 269 ? 144.310 274.253 288.179 1.00 143.98 269 Bj 1 \nATOM 1689 C CD2 . LEU Q 17 269 ? 146.624 273.751 287.375 1.00 143.98 269 Bj 1 \nATOM 1690 N N   . ALA Q 17 270 ? 147.339 279.164 287.255 1.00 137.42 270 Bj 1 \nATOM 1691 C CA  . ALA Q 17 270 ? 147.361 280.426 286.528 1.00 137.42 270 Bj 1 \nATOM 1692 C C   . ALA Q 17 270 ? 148.680 280.671 285.810 1.00 137.42 270 Bj 1 \nATOM 1693 O O   . ALA Q 17 270 ? 148.785 281.646 285.059 1.00 137.42 270 Bj 1 \nATOM 1694 C CB  . ALA Q 17 270 ? 147.068 281.588 287.482 1.00 137.42 270 Bj 1 \nATOM 1695 N N   . GLN Q 17 271 ? 149.681 279.820 286.021 1.00 132.72 271 Bj 1 \nATOM 1696 C CA  . GLN Q 17 271 ? 150.970 279.944 285.357 1.00 132.72 271 Bj 1 \nATOM 1697 C C   . GLN Q 17 271 ? 151.126 278.967 284.199 1.00 132.72 271 Bj 1 \nATOM 1698 O O   . GLN Q 17 271 ? 152.241 278.789 283.699 1.00 132.72 271 Bj 1 \nATOM 1699 C CB  . GLN Q 17 271 ? 152.102 279.749 286.366 1.00 132.72 271 Bj 1 \nATOM 1700 C CG  . GLN Q 17 271 ? 152.097 280.762 287.495 1.00 132.72 271 Bj 1 \nATOM 1701 C CD  . GLN Q 17 271 ? 153.182 280.502 288.519 1.00 132.72 271 Bj 1 \nATOM 1702 O OE1 . GLN Q 17 271 ? 154.178 279.838 288.232 1.00 132.72 271 Bj 1 \nATOM 1703 N NE2 . GLN Q 17 271 ? 152.994 281.024 289.725 1.00 132.72 271 Bj 1 \nATOM 1704 N N   . VAL Q 17 272 ? 150.038 278.325 283.767 1.00 127.77 272 Bj 1 \nATOM 1705 C CA  . VAL Q 17 272 ? 150.113 277.466 282.590 1.00 127.77 272 Bj 1 \nATOM 1706 C C   . VAL Q 17 272 ? 150.313 278.305 281.335 1.00 127.77 272 Bj 1 \nATOM 1707 O O   . VAL Q 17 272 ? 150.913 277.842 280.356 1.00 127.77 272 Bj 1 \nATOM 1708 C CB  . VAL Q 17 272 ? 148.858 276.577 282.494 1.00 127.77 272 Bj 1 \nATOM 1709 C CG1 . VAL Q 17 272 ? 147.619 277.418 282.237 1.00 127.77 272 Bj 1 \nATOM 1710 C CG2 . 
VAL Q 17 272 ? 149.029 275.519 281.414 1.00 127.77 272 Bj 1 \nATOM 1711 N N   . ARG Q 17 273 ? 149.836 279.552 281.344 1.00 126.48 273 Bj 1 \nATOM 1712 C CA  . ARG Q 17 273 ? 150.044 280.452 280.218 1.00 126.48 273 Bj 1 \nATOM 1713 C C   . ARG Q 17 273 ? 151.496 280.886 280.074 1.00 126.48 273 Bj 1 \nATOM 1714 O O   . ARG Q 17 273 ? 151.838 281.516 279.067 1.00 126.48 273 Bj 1 \nATOM 1715 C CB  . ARG Q 17 273 ? 149.146 281.684 280.353 1.00 126.48 273 Bj 1 \nATOM 1716 C CG  . ARG Q 17 273 ? 147.662 281.390 280.204 1.00 126.48 273 Bj 1 \nATOM 1717 C CD  . ARG Q 17 273 ? 146.993 281.126 281.543 1.00 126.48 273 Bj 1 \nATOM 1718 N NE  . ARG Q 17 273 ? 146.890 282.333 282.357 1.00 126.48 273 Bj 1 \nATOM 1719 C CZ  . ARG Q 17 273 ? 146.190 282.414 283.484 1.00 126.48 273 Bj 1 \nATOM 1720 N NH1 . ARG Q 17 273 ? 145.525 281.357 283.930 1.00 126.48 273 Bj 1 \nATOM 1721 N NH2 . ARG Q 17 273 ? 146.150 283.552 284.163 1.00 126.48 273 Bj 1 \nATOM 1722 N N   . ARG Q 17 274 ? 152.349 280.573 281.051 1.00 119.98 274 Bj 1 \nATOM 1723 C CA  . ARG Q 17 274 ? 153.770 280.876 280.920 1.00 119.98 274 Bj 1 \nATOM 1724 C C   . ARG Q 17 274 ? 154.394 280.073 279.786 1.00 119.98 274 Bj 1 \nATOM 1725 O O   . ARG Q 17 274 ? 155.151 280.611 278.970 1.00 119.98 274 Bj 1 \nATOM 1726 C CB  . ARG Q 17 274 ? 154.489 280.596 282.239 1.00 119.98 274 Bj 1 \nATOM 1727 C CG  . ARG Q 17 274 ? 155.996 280.753 282.164 1.00 119.98 274 Bj 1 \nATOM 1728 C CD  . ARG Q 17 274 ? 156.653 280.440 283.497 1.00 119.98 274 Bj 1 \nATOM 1729 N NE  . ARG Q 17 274 ? 158.106 280.552 283.422 1.00 119.98 274 Bj 1 \nATOM 1730 C CZ  . ARG Q 17 274 ? 158.925 280.351 284.449 1.00 119.98 274 Bj 1 \nATOM 1731 N NH1 . ARG Q 17 274 ? 158.434 280.026 285.638 1.00 119.98 274 Bj 1 \nATOM 1732 N NH2 . ARG Q 17 274 ? 160.236 280.475 284.288 1.00 119.98 274 Bj 1 \nATOM 1733 N N   . PHE Q 17 275 ? 154.086 278.781 279.719 1.00 124.86 275 Bj 1 \nATOM 1734 C CA  . PHE Q 17 275 ? 154.571 277.923 278.649 1.00 124.86 275 Bj 1 \nATOM 1735 C C   . 
PHE Q 17 275 ? 153.499 277.598 277.619 1.00 124.86 275 Bj 1 \nATOM 1736 O O   . PHE Q 17 275 ? 153.784 276.886 276.652 1.00 124.86 275 Bj 1 \nATOM 1737 C CB  . PHE Q 17 275 ? 155.151 276.626 279.226 1.00 124.86 275 Bj 1 \nATOM 1738 C CG  . PHE Q 17 275 ? 154.189 275.853 280.081 1.00 124.86 275 Bj 1 \nATOM 1739 C CD1 . PHE Q 17 275 ? 153.410 274.846 279.535 1.00 124.86 275 Bj 1 \nATOM 1740 C CD2 . PHE Q 17 275 ? 154.073 276.123 281.434 1.00 124.86 275 Bj 1 \nATOM 1741 C CE1 . PHE Q 17 275 ? 152.527 274.130 280.320 1.00 124.86 275 Bj 1 \nATOM 1742 C CE2 . PHE Q 17 275 ? 153.191 275.411 282.224 1.00 124.86 275 Bj 1 \nATOM 1743 C CZ  . PHE Q 17 275 ? 152.418 274.412 281.666 1.00 124.86 275 Bj 1 \nATOM 1744 N N   . LEU Q 17 276 ? 152.279 278.098 277.799 1.00 117.83 276 Bj 1 \nATOM 1745 C CA  . LEU Q 17 276 ? 151.240 277.932 276.795 1.00 117.83 276 Bj 1 \nATOM 1746 C C   . LEU Q 17 276 ? 151.359 279.017 275.733 1.00 117.83 276 Bj 1 \nATOM 1747 O O   . LEU Q 17 276 ? 151.592 280.188 276.045 1.00 117.83 276 Bj 1 \nATOM 1748 C CB  . LEU Q 17 276 ? 149.857 277.977 277.444 1.00 117.83 276 Bj 1 \nATOM 1749 C CG  . LEU Q 17 276 ? 148.658 277.885 276.498 1.00 117.83 276 Bj 1 \nATOM 1750 C CD1 . LEU Q 17 276 ? 148.689 276.585 275.710 1.00 117.83 276 Bj 1 \nATOM 1751 C CD2 . LEU Q 17 276 ? 147.359 278.018 277.275 1.00 117.83 276 Bj 1 \nATOM 1752 N N   . LEU Q 17 277 ? 151.203 278.619 274.472 1.00 108.03 277 Bj 1 \nATOM 1753 C CA  . LEU Q 17 277 ? 151.313 279.567 273.372 1.00 108.03 277 Bj 1 \nATOM 1754 C C   . LEU Q 17 277 ? 150.175 280.577 273.422 1.00 108.03 277 Bj 1 \nATOM 1755 O O   . LEU Q 17 277 ? 149.048 280.245 273.802 1.00 108.03 277 Bj 1 \nATOM 1756 C CB  . LEU Q 17 277 ? 151.306 278.836 272.032 1.00 108.03 277 Bj 1 \nATOM 1757 C CG  . LEU Q 17 277 ? 152.569 278.060 271.666 1.00 108.03 277 Bj 1 \nATOM 1758 C CD1 . LEU Q 17 277 ? 152.537 277.695 270.195 1.00 108.03 277 Bj 1 \nATOM 1759 C CD2 . LEU Q 17 277 ? 153.805 278.877 271.992 1.00 108.03 277 Bj 1 \nATOM 1760 N N   . 
ASP Q 17 278 ? 150.474 281.816 273.030 1.00 106.80 278 Bj 1 \nATOM 1761 C CA  . ASP Q 17 278 ? 149.461 282.864 273.029 1.00 106.80 278 Bj 1 \nATOM 1762 C C   . ASP Q 17 278 ? 148.629 282.835 271.754 1.00 106.80 278 Bj 1 \nATOM 1763 O O   . ASP Q 17 278 ? 147.422 283.101 271.794 1.00 106.80 278 Bj 1 \nATOM 1764 C CB  . ASP Q 17 278 ? 150.123 284.231 273.199 1.00 106.80 278 Bj 1 \nATOM 1765 C CG  . ASP Q 17 278 ? 151.058 284.283 274.390 1.00 106.80 278 Bj 1 \nATOM 1766 O OD1 . ASP Q 17 278 ? 150.918 283.436 275.297 1.00 106.80 278 Bj 1 \nATOM 1767 O OD2 . ASP Q 17 278 ? 151.932 285.174 274.420 1.00 106.80 278 Bj 1 \nATOM 1768 N N   . LEU Q 17 279 ? 149.259 282.519 270.625 1.00 104.98 279 Bj 1 \nATOM 1769 C CA  . LEU Q 17 279 ? 148.601 282.483 269.320 1.00 104.98 279 Bj 1 \nATOM 1770 C C   . LEU Q 17 279 ? 147.938 283.817 268.987 1.00 104.98 279 Bj 1 \nATOM 1771 O O   . LEU Q 17 279 ? 148.618 284.810 268.729 1.00 104.98 279 Bj 1 \nATOM 1772 C CB  . LEU Q 17 279 ? 147.567 281.354 269.263 1.00 104.98 279 Bj 1 \nATOM 1773 C CG  . LEU Q 17 279 ? 148.068 279.941 269.566 1.00 104.98 279 Bj 1 \nATOM 1774 C CD1 . LEU Q 17 279 ? 147.007 278.919 269.200 1.00 104.98 279 Bj 1 \nATOM 1775 C CD2 . LEU Q 17 279 ? 149.365 279.652 268.834 1.00 104.98 279 Bj 1 \n#\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/pdb_mmcif/7rye.cif",
    "content": "data_7RYE\n#\n_entry.id 7RYE\n#\nloop_\n_chem_comp.formula\n_chem_comp.formula_weight\n_chem_comp.id\n_chem_comp.mon_nstd_flag\n_chem_comp.name\n_chem_comp.pdbx_synonyms\n_chem_comp.type\n\"C3 H7 N O2\"     89.093  ALA y ALANINE         ? \"L-peptide linking\" \n\"C6 H15 N4 O2 1\" 175.209 ARG y ARGININE        ? \"L-peptide linking\" \n\"C4 H8 N2 O3\"    132.118 ASN y ASPARAGINE      ? \"L-peptide linking\" \n\"C4 H7 N O4\"     133.103 ASP y \"ASPARTIC ACID\" ? \"L-peptide linking\" \n\"C3 H7 N O2 S\"   121.158 CYS y CYSTEINE        ? \"L-peptide linking\" \n\"C5 H10 N2 O3\"   146.144 GLN y GLUTAMINE       ? \"L-peptide linking\" \n\"C5 H9 N O4\"     147.129 GLU y \"GLUTAMIC ACID\" ? \"L-peptide linking\" \n\"C2 H5 N O2\"     75.067  GLY y GLYCINE         ? \"peptide linking\"   \n\"C6 H10 N3 O2 1\" 156.162 HIS y HISTIDINE       ? \"L-peptide linking\" \n\"C6 H13 N O2\"    131.173 ILE y ISOLEUCINE      ? \"L-peptide linking\" \n\"C6 H13 N O2\"    131.173 LEU y LEUCINE         ? \"L-peptide linking\" \n\"C6 H15 N2 O2 1\" 147.195 LYS y LYSINE          ? \"L-peptide linking\" \n\"C5 H11 N O2 S\"  149.211 MET y METHIONINE      ? \"L-peptide linking\" \n\"C9 H11 N O2\"    165.189 PHE y PHENYLALANINE   ? \"L-peptide linking\" \n\"C5 H9 N O2\"     115.130 PRO y PROLINE         ? \"L-peptide linking\" \n\"C3 H7 N O3\"     105.093 SER y SERINE          ? \"L-peptide linking\" \n\"C4 H9 N O3\"     119.119 THR y THREONINE       ? \"L-peptide linking\" \n\"C11 H12 N2 O2\"  204.225 TRP y TRYPTOPHAN      ? \"L-peptide linking\" \n\"C9 H11 N O3\"    181.189 TYR y TYROSINE        ? \"L-peptide linking\" \n\"C5 H11 N O2\"    117.146 VAL y VALINE          ? 
\"L-peptide linking\" \n#\n_entity.id               1\n_entity.pdbx_description \"Protein PrgI\"\n_entity.type             polymer\n#\n_entity_poly.entity_id      1\n_entity_poly.pdbx_strand_id J\n_entity_poly.type           polypeptide(L)\n#\nloop_\n_entity_poly_seq.entity_id\n_entity_poly_seq.hetero\n_entity_poly_seq.mon_id\n_entity_poly_seq.num\n1 n MET 1  \n1 n ALA 2  \n1 n THR 3  \n1 n PRO 4  \n1 n TRP 5  \n1 n SER 6  \n1 n GLY 7  \n1 n TYR 8  \n1 n LEU 9  \n1 n ASP 10 \n1 n ASP 11 \n1 n VAL 12 \n1 n SER 13 \n1 n ALA 14 \n1 n LYS 15 \n1 n PHE 16 \n1 n ASP 17 \n1 n THR 18 \n1 n GLY 19 \n1 n VAL 20 \n1 n ASP 21 \n1 n ASN 22 \n1 n LEU 23 \n1 n GLN 24 \n1 n THR 25 \n1 n GLN 26 \n1 n VAL 27 \n1 n THR 28 \n1 n GLU 29 \n1 n ALA 30 \n1 n LEU 31 \n1 n ASP 32 \n1 n LYS 33 \n1 n LEU 34 \n1 n ALA 35 \n1 n ALA 36 \n1 n LYS 37 \n1 n PRO 38 \n1 n SER 39 \n1 n ASP 40 \n1 n PRO 41 \n1 n ALA 42 \n1 n LEU 43 \n1 n LEU 44 \n1 n ALA 45 \n1 n ALA 46 \n1 n TYR 47 \n1 n GLN 48 \n1 n SER 49 \n1 n LYS 50 \n1 n LEU 51 \n1 n SER 52 \n1 n GLU 53 \n1 n TYR 54 \n1 n ASN 55 \n1 n LEU 56 \n1 n TYR 57 \n1 n ARG 58 \n1 n ASN 59 \n1 n ALA 60 \n1 n GLN 61 \n1 n SER 62 \n1 n ASN 63 \n1 n THR 64 \n1 n VAL 65 \n1 n LYS 66 \n1 n VAL 67 \n1 n PHE 68 \n1 n LYS 69 \n1 n ASP 70 \n1 n ILE 71 \n1 n ASP 72 \n1 n ALA 73 \n1 n ALA 74 \n1 n ILE 75 \n1 n ILE 76 \n1 n GLN 77 \n1 n ASN 78 \n1 n PHE 79 \n1 n ARG 80 \n#\n_exptl.method \"ELECTRON MICROSCOPY\"\n#\n_pdbx_audit_revision_history.revision_date 2021-11-10\n#\n_pdbx_database_status.recvd_initial_deposition_date 2021-11-10\n#\nloop_\n_pdbx_poly_seq_scheme.asym_id\n_pdbx_poly_seq_scheme.auth_seq_num\n_pdbx_poly_seq_scheme.entity_id\n_pdbx_poly_seq_scheme.hetero\n_pdbx_poly_seq_scheme.mon_id\n_pdbx_poly_seq_scheme.pdb_ins_code\n_pdbx_poly_seq_scheme.pdb_seq_num\n_pdbx_poly_seq_scheme.pdb_strand_id\n_pdbx_poly_seq_scheme.seq_id\nJ ?  1 n MET . 1  J 1  \nJ ?  1 n ALA . 2  J 2  \nJ 3  1 n THR . 3  J 3  \nJ 4  1 n PRO . 4  J 4  \nJ 5  1 n TRP . 
5  J 5  \nJ 6  1 n SER . 6  J 6  \nJ 7  1 n GLY . 7  J 7  \nJ 8  1 n TYR . 8  J 8  \nJ 9  1 n LEU . 9  J 9  \nJ 10 1 n ASP . 10 J 10 \nJ 11 1 n ASP . 11 J 11 \nJ 12 1 n VAL . 12 J 12 \nJ 13 1 n SER . 13 J 13 \nJ 14 1 n ALA . 14 J 14 \nJ 15 1 n LYS . 15 J 15 \nJ 16 1 n PHE . 16 J 16 \nJ 17 1 n ASP . 17 J 17 \nJ 18 1 n THR . 18 J 18 \nJ 19 1 n GLY . 19 J 19 \nJ 20 1 n VAL . 20 J 20 \nJ 21 1 n ASP . 21 J 21 \nJ 22 1 n ASN . 22 J 22 \nJ 23 1 n LEU . 23 J 23 \nJ 24 1 n GLN . 24 J 24 \nJ 25 1 n THR . 25 J 25 \nJ 26 1 n GLN . 26 J 26 \nJ 27 1 n VAL . 27 J 27 \nJ 28 1 n THR . 28 J 28 \nJ 29 1 n GLU . 29 J 29 \nJ 30 1 n ALA . 30 J 30 \nJ 31 1 n LEU . 31 J 31 \nJ 32 1 n ASP . 32 J 32 \nJ 33 1 n LYS . 33 J 33 \nJ 34 1 n LEU . 34 J 34 \nJ 35 1 n ALA . 35 J 35 \nJ 36 1 n ALA . 36 J 36 \nJ 37 1 n LYS . 37 J 37 \nJ 38 1 n PRO . 38 J 38 \nJ 39 1 n SER . 39 J 39 \nJ 40 1 n ASP . 40 J 40 \nJ 41 1 n PRO . 41 J 41 \nJ 42 1 n ALA . 42 J 42 \nJ 43 1 n LEU . 43 J 43 \nJ 44 1 n LEU . 44 J 44 \nJ 45 1 n ALA . 45 J 45 \nJ 46 1 n ALA . 46 J 46 \nJ 47 1 n TYR . 47 J 47 \nJ 48 1 n GLN . 48 J 48 \nJ 49 1 n SER . 49 J 49 \nJ 50 1 n LYS . 50 J 50 \nJ 51 1 n LEU . 51 J 51 \nJ 52 1 n SER . 52 J 52 \nJ 53 1 n GLU . 53 J 53 \nJ 54 1 n TYR . 54 J 54 \nJ 55 1 n ASN . 55 J 55 \nJ 56 1 n LEU . 56 J 56 \nJ 57 1 n TYR . 57 J 57 \nJ 58 1 n ARG . 58 J 58 \nJ 59 1 n ASN . 59 J 59 \nJ 60 1 n ALA . 60 J 60 \nJ 61 1 n GLN . 61 J 61 \nJ 62 1 n SER . 62 J 62 \nJ 63 1 n ASN . 63 J 63 \nJ 64 1 n THR . 64 J 64 \nJ 65 1 n VAL . 65 J 65 \nJ 66 1 n LYS . 66 J 66 \nJ 67 1 n VAL . 67 J 67 \nJ 68 1 n PHE . 68 J 68 \nJ 69 1 n LYS . 69 J 69 \nJ 70 1 n ASP . 70 J 70 \nJ 71 1 n ILE . 71 J 71 \nJ 72 1 n ASP . 72 J 72 \nJ 73 1 n ALA . 73 J 73 \nJ 74 1 n ALA . 74 J 74 \nJ 75 1 n ILE . 75 J 75 \nJ 76 1 n ILE . 76 J 76 \nJ 77 1 n GLN . 77 J 77 \nJ 78 1 n ASN . 78 J 78 \nJ 79 1 n PHE . 79 J 79 \nJ 80 1 n ARG . 
80 J 80 \n#\n_pdbx_struct_assembly.details            author_defined_assembly\n_pdbx_struct_assembly.id                 1\n_pdbx_struct_assembly.method_details     ?\n_pdbx_struct_assembly.oligomeric_count   24\n_pdbx_struct_assembly.oligomeric_details 24-meric\n#\n_pdbx_struct_assembly_gen.assembly_id     1\n_pdbx_struct_assembly_gen.asym_id_list    A,B,C,D,E,F,G,H,I,J,K,L,M,N,O,P,Q,R,S,T,U,V,W,X\n_pdbx_struct_assembly_gen.oper_expression 1\n#\n_pdbx_struct_oper_list.id                 1\n_pdbx_struct_oper_list.matrix[1][1]       1.0000000000\n_pdbx_struct_oper_list.matrix[1][2]       0.0000000000\n_pdbx_struct_oper_list.matrix[1][3]       0.0000000000\n_pdbx_struct_oper_list.matrix[2][1]       0.0000000000\n_pdbx_struct_oper_list.matrix[2][2]       1.0000000000\n_pdbx_struct_oper_list.matrix[2][3]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][1]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][2]       0.0000000000\n_pdbx_struct_oper_list.matrix[3][3]       1.0000000000\n_pdbx_struct_oper_list.name               1_555\n_pdbx_struct_oper_list.symmetry_operation ?\n_pdbx_struct_oper_list.type               \"identity operation\"\n_pdbx_struct_oper_list.vector[1]          0.0000000000\n_pdbx_struct_oper_list.vector[2]          0.0000000000\n_pdbx_struct_oper_list.vector[3]          0.0000000000\n#\n_refine.ls_d_res_high 3.90\n#\n_software.classification other\n_software.name           \"DeepMind Structure Class\"\n_software.pdbx_ordinal   1\n_software.version        2.0.0\n#\n_struct_asym.entity_id 1\n_struct_asym.id        
J\n#\nloop_\n_atom_site.group_PDB\n_atom_site.id\n_atom_site.type_symbol\n_atom_site.label_atom_id\n_atom_site.label_alt_id\n_atom_site.label_comp_id\n_atom_site.label_asym_id\n_atom_site.label_entity_id\n_atom_site.label_seq_id\n_atom_site.pdbx_PDB_ins_code\n_atom_site.Cartn_x\n_atom_site.Cartn_y\n_atom_site.Cartn_z\n_atom_site.occupancy\n_atom_site.B_iso_or_equiv\n_atom_site.auth_seq_id\n_atom_site.auth_asym_id\n_atom_site.pdbx_PDB_model_num\nATOM 1   N N   . THR J 1 3  ? 180.798 156.981 49.506 1.00 100.87 3  J 1 \nATOM 2   C CA  . THR J 1 3  ? 180.336 158.053 50.380 1.00 100.87 3  J 1 \nATOM 3   C C   . THR J 1 3  ? 178.888 157.811 50.811 1.00 100.87 3  J 1 \nATOM 4   O O   . THR J 1 3  ? 178.076 157.312 50.030 1.00 100.87 3  J 1 \nATOM 5   C CB  . THR J 1 3  ? 180.468 159.436 49.691 1.00 100.87 3  J 1 \nATOM 6   O OG1 . THR J 1 3  ? 180.169 160.478 50.627 1.00 100.87 3  J 1 \nATOM 7   C CG2 . THR J 1 3  ? 179.541 159.546 48.488 1.00 100.87 3  J 1 \nATOM 8   N N   . PRO J 1 4  ? 178.569 158.139 52.065 1.00 96.05  4  J 1 \nATOM 9   C CA  . PRO J 1 4  ? 177.201 157.918 52.554 1.00 96.05  4  J 1 \nATOM 10  C C   . PRO J 1 4  ? 176.203 158.873 51.924 1.00 96.05  4  J 1 \nATOM 11  O O   . PRO J 1 4  ? 176.293 160.090 52.112 1.00 96.05  4  J 1 \nATOM 12  C CB  . PRO J 1 4  ? 177.326 158.152 54.065 1.00 96.05  4  J 1 \nATOM 13  C CG  . PRO J 1 4  ? 178.504 159.047 54.212 1.00 96.05  4  J 1 \nATOM 14  C CD  . PRO J 1 4  ? 179.457 158.664 53.117 1.00 96.05  4  J 1 \nATOM 15  N N   . TRP J 1 5  ? 175.251 158.334 51.169 1.00 82.05  5  J 1 \nATOM 16  C CA  . TRP J 1 5  ? 174.242 159.172 50.543 1.00 82.05  5  J 1 \nATOM 17  C C   . TRP J 1 5  ? 173.275 159.710 51.591 1.00 82.05  5  J 1 \nATOM 18  O O   . TRP J 1 5  ? 173.068 159.105 52.647 1.00 82.05  5  J 1 \nATOM 19  C CB  . TRP J 1 5  ? 173.467 158.390 49.486 1.00 82.05  5  J 1 \nATOM 20  C CG  . TRP J 1 5  ? 172.575 159.261 48.675 1.00 82.05  5  J 1 \nATOM 21  C CD1 . TRP J 1 5  ? 
172.953 160.130 47.697 1.00 82.05  5  J 1 \nATOM 22  C CD2 . TRP J 1 5  ? 171.158 159.402 48.811 1.00 82.05  5  J 1 \nATOM 23  N NE1 . TRP J 1 5  ? 171.856 160.778 47.189 1.00 82.05  5  J 1 \nATOM 24  C CE2 . TRP J 1 5  ? 170.741 160.351 47.859 1.00 82.05  5  J 1 \nATOM 25  C CE3 . TRP J 1 5  ? 170.199 158.807 49.634 1.00 82.05  5  J 1 \nATOM 26  C CZ2 . TRP J 1 5  ? 169.408 160.720 47.709 1.00 82.05  5  J 1 \nATOM 27  C CZ3 . TRP J 1 5  ? 168.877 159.176 49.482 1.00 82.05  5  J 1 \nATOM 28  C CH2 . TRP J 1 5  ? 168.493 160.120 48.527 1.00 82.05  5  J 1 \nATOM 29  N N   . SER J 1 6  ? 172.676 160.860 51.291 1.00 78.94  6  J 1 \nATOM 30  C CA  . SER J 1 6  ? 171.730 161.484 52.213 1.00 78.94  6  J 1 \nATOM 31  C C   . SER J 1 6  ? 170.799 162.391 51.422 1.00 78.94  6  J 1 \nATOM 32  O O   . SER J 1 6  ? 171.235 163.417 50.892 1.00 78.94  6  J 1 \nATOM 33  C CB  . SER J 1 6  ? 172.462 162.265 53.300 1.00 78.94  6  J 1 \nATOM 34  O OG  . SER J 1 6  ? 173.149 161.389 54.176 1.00 78.94  6  J 1 \nATOM 35  N N   . GLY J 1 7  ? 169.526 162.014 51.347 1.00 80.09  7  J 1 \nATOM 36  C CA  . GLY J 1 7  ? 168.512 162.855 50.750 1.00 80.09  7  J 1 \nATOM 37  C C   . GLY J 1 7  ? 168.082 163.958 51.698 1.00 80.09  7  J 1 \nATOM 38  O O   . GLY J 1 7  ? 168.539 164.059 52.838 1.00 80.09  7  J 1 \nATOM 39  N N   . TYR J 1 8  ? 167.174 164.804 51.207 1.00 78.37  8  J 1 \nATOM 40  C CA  . TYR J 1 8  ? 166.760 165.964 51.991 1.00 78.37  8  J 1 \nATOM 41  C C   . TYR J 1 8  ? 166.084 165.523 53.284 1.00 78.37  8  J 1 \nATOM 42  O O   . TYR J 1 8  ? 166.332 166.093 54.351 1.00 78.37  8  J 1 \nATOM 43  C CB  . TYR J 1 8  ? 165.830 166.858 51.167 1.00 78.37  8  J 1 \nATOM 44  C CG  . TYR J 1 8  ? 165.412 168.151 51.846 1.00 78.37  8  J 1 \nATOM 45  C CD1 . TYR J 1 8  ? 164.409 168.939 51.311 1.00 78.37  8  J 1 \nATOM 46  C CD2 . TYR J 1 8  ? 166.073 168.622 52.974 1.00 78.37  8  J 1 \nATOM 47  C CE1 . TYR J 1 8  ? 164.036 170.122 51.913 1.00 78.37  8  J 1 \nATOM 48  C CE2 . TYR J 1 8  ? 
165.705 169.801 53.581 1.00 78.37  8  J 1 \nATOM 49  C CZ  . TYR J 1 8  ? 164.688 170.550 53.044 1.00 78.37  8  J 1 \nATOM 50  O OH  . TYR J 1 8  ? 164.318 171.735 53.638 1.00 78.37  8  J 1 \nATOM 51  N N   . LEU J 1 9  ? 165.226 164.506 53.213 1.00 73.64  9  J 1 \nATOM 52  C CA  . LEU J 1 9  ? 164.645 163.967 54.439 1.00 73.64  9  J 1 \nATOM 53  C C   . LEU J 1 9  ? 165.730 163.390 55.340 1.00 73.64  9  J 1 \nATOM 54  O O   . LEU J 1 9  ? 165.719 163.604 56.560 1.00 73.64  9  J 1 \nATOM 55  C CB  . LEU J 1 9  ? 163.595 162.906 54.109 1.00 73.64  9  J 1 \nATOM 56  C CG  . LEU J 1 9  ? 162.192 163.335 53.661 1.00 73.64  9  J 1 \nATOM 57  C CD1 . LEU J 1 9  ? 162.211 164.303 52.488 1.00 73.64  9  J 1 \nATOM 58  C CD2 . LEU J 1 9  ? 161.355 162.112 53.321 1.00 73.64  9  J 1 \nATOM 59  N N   . ASP J 1 10 ? 166.683 162.668 54.750 1.00 75.23  10 J 1 \nATOM 60  C CA  . ASP J 1 10 ? 167.828 162.189 55.511 1.00 75.23  10 J 1 \nATOM 61  C C   . ASP J 1 10 ? 168.631 163.360 56.062 1.00 75.23  10 J 1 \nATOM 62  O O   . ASP J 1 10 ? 169.140 163.297 57.186 1.00 75.23  10 J 1 \nATOM 63  C CB  . ASP J 1 10 ? 168.695 161.293 54.624 1.00 75.23  10 J 1 \nATOM 64  C CG  . ASP J 1 10 ? 169.793 160.577 55.393 1.00 75.23  10 J 1 \nATOM 65  O OD1 . ASP J 1 10 ? 169.921 160.785 56.617 1.00 75.23  10 J 1 \nATOM 66  O OD2 . ASP J 1 10 ? 170.537 159.796 54.764 1.00 75.23  10 J 1 \nATOM 67  N N   . ASP J 1 11 ? 168.742 164.442 55.289 1.00 76.21  11 J 1 \nATOM 68  C CA  . ASP J 1 11 ? 169.449 165.624 55.770 1.00 76.21  11 J 1 \nATOM 69  C C   . ASP J 1 11 ? 168.755 166.229 56.984 1.00 76.21  11 J 1 \nATOM 70  O O   . ASP J 1 11 ? 169.416 166.658 57.932 1.00 76.21  11 J 1 \nATOM 71  C CB  . ASP J 1 11 ? 169.573 166.658 54.651 1.00 76.21  11 J 1 \nATOM 72  C CG  . ASP J 1 11 ? 170.510 166.210 53.546 1.00 76.21  11 J 1 \nATOM 73  O OD1 . ASP J 1 11 ? 171.452 165.444 53.836 1.00 76.21  11 J 1 \nATOM 74  O OD2 . ASP J 1 11 ? 170.303 166.623 52.386 1.00 76.21  11 J 1 \nATOM 75  N N   . VAL J 1 12 ? 
167.423 166.274 56.973 1.00 71.19  12 J 1 \nATOM 76  C CA  . VAL J 1 12 ? 166.679 166.814 58.107 1.00 71.19  12 J 1 \nATOM 77  C C   . VAL J 1 12 ? 166.846 165.921 59.330 1.00 71.19  12 J 1 \nATOM 78  O O   . VAL J 1 12 ? 167.032 166.405 60.457 1.00 71.19  12 J 1 \nATOM 79  C CB  . VAL J 1 12 ? 165.197 166.989 57.729 1.00 71.19  12 J 1 \nATOM 80  C CG1 . VAL J 1 12 ? 164.358 167.240 58.967 1.00 71.19  12 J 1 \nATOM 81  C CG2 . VAL J 1 12 ? 165.039 168.124 56.733 1.00 71.19  12 J 1 \nATOM 82  N N   . SER J 1 13 ? 166.779 164.604 59.130 1.00 71.31  13 J 1 \nATOM 83  C CA  . SER J 1 13 ? 167.004 163.691 60.244 1.00 71.31  13 J 1 \nATOM 84  C C   . SER J 1 13 ? 168.397 163.882 60.831 1.00 71.31  13 J 1 \nATOM 85  O O   . SER J 1 13 ? 168.555 163.965 62.054 1.00 71.31  13 J 1 \nATOM 86  C CB  . SER J 1 13 ? 166.801 162.246 59.794 1.00 71.31  13 J 1 \nATOM 87  O OG  . SER J 1 13 ? 165.459 162.023 59.402 1.00 71.31  13 J 1 \nATOM 88  N N   . ALA J 1 14 ? 169.413 163.985 59.972 1.00 73.94  14 J 1 \nATOM 89  C CA  . ALA J 1 14 ? 170.773 164.209 60.451 1.00 73.94  14 J 1 \nATOM 90  C C   . ALA J 1 14 ? 170.904 165.566 61.130 1.00 73.94  14 J 1 \nATOM 91  O O   . ALA J 1 14 ? 171.700 165.728 62.061 1.00 73.94  14 J 1 \nATOM 92  C CB  . ALA J 1 14 ? 171.765 164.087 59.295 1.00 73.94  14 J 1 \nATOM 93  N N   . LYS J 1 15 ? 170.140 166.557 60.668 1.00 71.21  15 J 1 \nATOM 94  C CA  . LYS J 1 15 ? 170.140 167.860 61.321 1.00 71.21  15 J 1 \nATOM 95  C C   . LYS J 1 15 ? 169.612 167.753 62.742 1.00 71.21  15 J 1 \nATOM 96  O O   . LYS J 1 15 ? 170.146 168.383 63.660 1.00 71.21  15 J 1 \nATOM 97  C CB  . LYS J 1 15 ? 169.311 168.855 60.511 1.00 71.21  15 J 1 \nATOM 98  C CG  . LYS J 1 15 ? 170.142 169.773 59.635 1.00 71.21  15 J 1 \nATOM 99  C CD  . LYS J 1 15 ? 169.313 170.920 59.089 1.00 71.21  15 J 1 \nATOM 100 C CE  . LYS J 1 15 ? 170.176 171.888 58.300 1.00 71.21  15 J 1 \nATOM 101 N NZ  . LYS J 1 15 ? 169.369 172.970 57.676 1.00 71.21  15 J 1 \nATOM 102 N N   . PHE J 1 16 ? 
168.559 166.963 62.943 1.00 68.61  16 J 1 \nATOM 103 C CA  . PHE J 1 16 ? 168.102 166.713 64.308 1.00 68.61  16 J 1 \nATOM 104 C C   . PHE J 1 16 ? 169.128 165.927 65.120 1.00 68.61  16 J 1 \nATOM 105 O O   . PHE J 1 16 ? 169.342 166.226 66.300 1.00 68.61  16 J 1 \nATOM 106 C CB  . PHE J 1 16 ? 166.749 166.005 64.309 1.00 68.61  16 J 1 \nATOM 107 C CG  . PHE J 1 16 ? 165.587 166.929 64.088 1.00 68.61  16 J 1 \nATOM 108 C CD1 . PHE J 1 16 ? 165.736 168.293 64.256 1.00 68.61  16 J 1 \nATOM 109 C CD2 . PHE J 1 16 ? 164.345 166.437 63.736 1.00 68.61  16 J 1 \nATOM 110 C CE1 . PHE J 1 16 ? 164.670 169.147 64.068 1.00 68.61  16 J 1 \nATOM 111 C CE2 . PHE J 1 16 ? 163.277 167.286 63.544 1.00 68.61  16 J 1 \nATOM 112 C CZ  . PHE J 1 16 ? 163.439 168.643 63.710 1.00 68.61  16 J 1 \nATOM 113 N N   . ASP J 1 17 ? 169.768 164.918 64.521 1.00 77.06  17 J 1 \nATOM 114 C CA  . ASP J 1 17 ? 170.752 164.149 65.286 1.00 77.06  17 J 1 \nATOM 115 C C   . ASP J 1 17 ? 171.927 165.017 65.719 1.00 77.06  17 J 1 \nATOM 116 O O   . ASP J 1 17 ? 172.413 164.888 66.848 1.00 77.06  17 J 1 \nATOM 117 C CB  . ASP J 1 17 ? 171.254 162.929 64.509 1.00 77.06  17 J 1 \nATOM 118 C CG  . ASP J 1 17 ? 170.136 162.119 63.888 1.00 77.06  17 J 1 \nATOM 119 O OD1 . ASP J 1 17 ? 170.103 162.001 62.647 1.00 77.06  17 J 1 \nATOM 120 O OD2 . ASP J 1 17 ? 169.286 161.602 64.642 1.00 77.06  17 J 1 \nATOM 121 N N   . THR J 1 18 ? 172.399 165.901 64.845 1.00 76.90  18 J 1 \nATOM 122 C CA  . THR J 1 18 ? 173.485 166.801 65.205 1.00 76.90  18 J 1 \nATOM 123 C C   . THR J 1 18 ? 173.016 167.991 66.028 1.00 76.90  18 J 1 \nATOM 124 O O   . THR J 1 18 ? 173.851 168.678 66.626 1.00 76.90  18 J 1 \nATOM 125 C CB  . THR J 1 18 ? 174.203 167.303 63.949 1.00 76.90  18 J 1 \nATOM 126 O OG1 . THR J 1 18 ? 175.476 167.849 64.314 1.00 76.90  18 J 1 \nATOM 127 C CG2 . THR J 1 18 ? 173.381 168.373 63.253 1.00 76.90  18 J 1 \nATOM 128 N N   . GLY J 1 19 ? 171.709 168.255 66.067 1.00 78.19  19 J 1 \nATOM 129 C CA  . GLY J 1 19 ? 
171.207 169.320 66.916 1.00 78.19  19 J 1 \nATOM 130 C C   . GLY J 1 19 ? 171.381 169.012 68.389 1.00 78.19  19 J 1 \nATOM 131 O O   . GLY J 1 19 ? 171.777 169.879 69.172 1.00 78.19  19 J 1 \nATOM 132 N N   . VAL J 1 20 ? 171.089 167.780 68.785 1.00 76.12  20 J 1 \nATOM 133 C CA  . VAL J 1 20 ? 171.317 167.329 70.150 1.00 76.12  20 J 1 \nATOM 134 C C   . VAL J 1 20 ? 172.694 166.684 70.220 1.00 76.12  20 J 1 \nATOM 135 O O   . VAL J 1 20 ? 173.054 165.862 69.368 1.00 76.12  20 J 1 \nATOM 136 C CB  . VAL J 1 20 ? 170.212 166.362 70.606 1.00 76.12  20 J 1 \nATOM 137 C CG1 . VAL J 1 20 ? 168.869 167.069 70.596 1.00 76.12  20 J 1 \nATOM 138 C CG2 . VAL J 1 20 ? 170.158 165.132 69.713 1.00 76.12  20 J 1 \nATOM 139 N N   . ASP J 1 21 ? 173.487 167.090 71.210 1.00 78.41  21 J 1 \nATOM 140 C CA  . ASP J 1 21 ? 174.863 166.617 71.290 1.00 78.41  21 J 1 \nATOM 141 C C   . ASP J 1 21 ? 174.916 165.113 71.524 1.00 78.41  21 J 1 \nATOM 142 O O   . ASP J 1 21 ? 175.347 164.349 70.653 1.00 78.41  21 J 1 \nATOM 143 C CB  . ASP J 1 21 ? 175.608 167.363 72.396 1.00 78.41  21 J 1 \nATOM 144 C CG  . ASP J 1 21 ? 175.835 168.824 72.061 1.00 78.41  21 J 1 \nATOM 145 O OD1 . ASP J 1 21 ? 175.946 169.149 70.861 1.00 78.41  21 J 1 \nATOM 146 O OD2 . ASP J 1 21 ? 175.903 169.647 72.998 1.00 78.41  21 J 1 \nATOM 147 N N   . ASN J 1 22 ? 174.471 164.668 72.693 1.00 74.91  22 J 1 \nATOM 148 C CA  . ASN J 1 22 ? 174.565 163.267 73.084 1.00 74.91  22 J 1 \nATOM 149 C C   . ASN J 1 22 ? 173.277 162.819 73.765 1.00 74.91  22 J 1 \nATOM 150 O O   . ASN J 1 22 ? 173.294 162.151 74.799 1.00 74.91  22 J 1 \nATOM 151 C CB  . ASN J 1 22 ? 175.777 163.050 73.987 1.00 74.91  22 J 1 \nATOM 152 C CG  . ASN J 1 22 ? 175.825 164.032 75.138 1.00 74.91  22 J 1 \nATOM 153 O OD1 . ASN J 1 22 ? 174.925 164.855 75.304 1.00 74.91  22 J 1 \nATOM 154 N ND2 . ASN J 1 22 ? 176.881 163.956 75.938 1.00 74.91  22 J 1 \nATOM 155 N N   . LEU J 1 23 ? 172.134 163.193 73.182 1.00 72.21  23 J 1 \nATOM 156 C CA  . LEU J 1 23 ? 
170.852 162.915 73.824 1.00 72.21  23 J 1 \nATOM 157 C C   . LEU J 1 23 ? 170.648 161.425 74.053 1.00 72.21  23 J 1 \nATOM 158 O O   . LEU J 1 23 ? 170.248 161.010 75.146 1.00 72.21  23 J 1 \nATOM 159 C CB  . LEU J 1 23 ? 169.708 163.483 72.989 1.00 72.21  23 J 1 \nATOM 160 C CG  . LEU J 1 23 ? 168.328 163.271 73.612 1.00 72.21  23 J 1 \nATOM 161 C CD1 . LEU J 1 23 ? 168.229 163.983 74.946 1.00 72.21  23 J 1 \nATOM 162 C CD2 . LEU J 1 23 ? 167.237 163.743 72.669 1.00 72.21  23 J 1 \nATOM 163 N N   . GLN J 1 24 ? 170.920 160.601 73.039 1.00 70.63  24 J 1 \nATOM 164 C CA  . GLN J 1 24 ? 170.840 159.157 73.230 1.00 70.63  24 J 1 \nATOM 165 C C   . GLN J 1 24 ? 171.802 158.707 74.320 1.00 70.63  24 J 1 \nATOM 166 O O   . GLN J 1 24 ? 171.425 157.974 75.242 1.00 70.63  24 J 1 \nATOM 167 C CB  . GLN J 1 24 ? 171.143 158.435 71.917 1.00 70.63  24 J 1 \nATOM 168 C CG  . GLN J 1 24 ? 170.834 156.949 71.947 1.00 70.63  24 J 1 \nATOM 169 C CD  . GLN J 1 24 ? 169.405 156.644 71.556 1.00 70.63  24 J 1 \nATOM 170 O OE1 . GLN J 1 24 ? 168.697 157.505 71.042 1.00 70.63  24 J 1 \nATOM 171 N NE2 . GLN J 1 24 ? 168.972 155.412 71.801 1.00 70.63  24 J 1 \nATOM 172 N N   . THR J 1 25 ? 173.052 159.167 74.242 1.00 72.05  25 J 1 \nATOM 173 C CA  . THR J 1 25 ? 174.029 158.829 75.267 1.00 72.05  25 J 1 \nATOM 174 C C   . THR J 1 25 ? 173.628 159.382 76.627 1.00 72.05  25 J 1 \nATOM 175 O O   . THR J 1 25 ? 173.752 158.681 77.636 1.00 72.05  25 J 1 \nATOM 176 C CB  . THR J 1 25 ? 175.407 159.349 74.865 1.00 72.05  25 J 1 \nATOM 177 O OG1 . THR J 1 25 ? 175.777 158.785 73.601 1.00 72.05  25 J 1 \nATOM 178 C CG2 . THR J 1 25 ? 176.447 158.961 75.898 1.00 72.05  25 J 1 \nATOM 179 N N   . GLN J 1 26 ? 173.147 160.627 76.676 1.00 73.20  26 J 1 \nATOM 180 C CA  . GLN J 1 26 ? 172.756 161.219 77.951 1.00 73.20  26 J 1 \nATOM 181 C C   . GLN J 1 26 ? 171.656 160.400 78.610 1.00 73.20  26 J 1 \nATOM 182 O O   . GLN J 1 26 ? 171.709 160.118 79.814 1.00 73.20  26 J 1 \nATOM 183 C CB  . GLN J 1 26 ? 
172.301 162.663 77.739 1.00 73.20  26 J 1 \nATOM 184 C CG  . GLN J 1 26 ? 173.397 163.693 77.939 1.00 73.20  26 J 1 \nATOM 185 C CD  . GLN J 1 26 ? 172.920 165.105 77.674 1.00 73.20  26 J 1 \nATOM 186 O OE1 . GLN J 1 26 ? 171.782 165.454 77.979 1.00 73.20  26 J 1 \nATOM 187 N NE2 . GLN J 1 26 ? 173.791 165.926 77.101 1.00 73.20  26 J 1 \nATOM 188 N N   . VAL J 1 27 ? 170.660 159.989 77.824 1.00 70.38  27 J 1 \nATOM 189 C CA  . VAL J 1 27 ? 169.615 159.113 78.339 1.00 70.38  27 J 1 \nATOM 190 C C   . VAL J 1 27 ? 170.211 157.789 78.796 1.00 70.38  27 J 1 \nATOM 191 O O   . VAL J 1 27 ? 169.787 157.217 79.808 1.00 70.38  27 J 1 \nATOM 192 C CB  . VAL J 1 27 ? 168.521 158.911 77.274 1.00 70.38  27 J 1 \nATOM 193 C CG1 . VAL J 1 27 ? 167.570 157.803 77.685 1.00 70.38  27 J 1 \nATOM 194 C CG2 . VAL J 1 27 ? 167.761 160.204 77.059 1.00 70.38  27 J 1 \nATOM 195 N N   . THR J 1 28 ? 171.208 157.285 78.067 1.00 66.97  28 J 1 \nATOM 196 C CA  . THR J 1 28 ? 171.814 156.011 78.437 1.00 66.97  28 J 1 \nATOM 197 C C   . THR J 1 28 ? 172.453 156.080 79.821 1.00 66.97  28 J 1 \nATOM 198 O O   . THR J 1 28 ? 172.163 155.246 80.688 1.00 66.97  28 J 1 \nATOM 199 C CB  . THR J 1 28 ? 172.841 155.591 77.388 1.00 66.97  28 J 1 \nATOM 200 O OG1 . THR J 1 28 ? 172.192 155.449 76.118 1.00 66.97  28 J 1 \nATOM 201 C CG2 . THR J 1 28 ? 173.475 154.265 77.774 1.00 66.97  28 J 1 \nATOM 202 N N   . GLU J 1 29 ? 173.322 157.072 80.055 1.00 72.66  29 J 1 \nATOM 203 C CA  . GLU J 1 29 ? 173.906 157.156 81.396 1.00 72.66  29 J 1 \nATOM 204 C C   . GLU J 1 29 ? 172.874 157.531 82.451 1.00 72.66  29 J 1 \nATOM 205 O O   . GLU J 1 29 ? 172.996 157.088 83.594 1.00 72.66  29 J 1 \nATOM 206 C CB  . GLU J 1 29 ? 175.107 158.111 81.526 1.00 72.66  29 J 1 \nATOM 207 C CG  . GLU J 1 29 ? 176.428 157.677 80.874 1.00 72.66  29 J 1 \nATOM 208 C CD  . GLU J 1 29 ? 176.594 158.116 79.452 1.00 72.66  29 J 1 \nATOM 209 O OE1 . GLU J 1 29 ? 175.740 158.874 78.981 1.00 72.66  29 J 1 \nATOM 210 O OE2 . GLU J 1 29 ? 
177.582 157.707 78.806 1.00 72.66  29 J 1 \nATOM 211 N N   . ALA J 1 30 ? 171.858 158.331 82.113 1.00 71.55  30 J 1 \nATOM 212 C CA  . ALA J 1 30 ? 170.840 158.641 83.113 1.00 71.55  30 J 1 \nATOM 213 C C   . ALA J 1 30 ? 170.124 157.377 83.571 1.00 71.55  30 J 1 \nATOM 214 O O   . ALA J 1 30 ? 169.974 157.134 84.776 1.00 71.55  30 J 1 \nATOM 215 C CB  . ALA J 1 30 ? 169.842 159.654 82.555 1.00 71.55  30 J 1 \nATOM 216 N N   . LEU J 1 31 ? 169.710 156.541 82.619 1.00 67.57  31 J 1 \nATOM 217 C CA  . LEU J 1 31 ? 169.026 155.299 82.949 1.00 67.57  31 J 1 \nATOM 218 C C   . LEU J 1 31 ? 169.947 154.332 83.681 1.00 67.57  31 J 1 \nATOM 219 O O   . LEU J 1 31 ? 169.513 153.645 84.613 1.00 67.57  31 J 1 \nATOM 220 C CB  . LEU J 1 31 ? 168.470 154.664 81.675 1.00 67.57  31 J 1 \nATOM 221 C CG  . LEU J 1 31 ? 167.565 153.444 81.827 1.00 67.57  31 J 1 \nATOM 222 C CD1 . LEU J 1 31 ? 166.434 153.521 80.822 1.00 67.57  31 J 1 \nATOM 223 C CD2 . LEU J 1 31 ? 168.355 152.161 81.641 1.00 67.57  31 J 1 \nATOM 224 N N   . ASP J 1 32 ? 171.217 154.256 83.275 1.00 72.67  32 J 1 \nATOM 225 C CA  . ASP J 1 32 ? 172.149 153.367 83.960 1.00 72.67  32 J 1 \nATOM 226 C C   . ASP J 1 32 ? 172.379 153.821 85.398 1.00 72.67  32 J 1 \nATOM 227 O O   . ASP J 1 32 ? 172.414 152.997 86.319 1.00 72.67  32 J 1 \nATOM 228 C CB  . ASP J 1 32 ? 173.467 153.305 83.188 1.00 72.67  32 J 1 \nATOM 229 C CG  . ASP J 1 32 ? 174.413 152.240 83.718 1.00 72.67  32 J 1 \nATOM 230 O OD1 . ASP J 1 32 ? 174.073 151.558 84.706 1.00 72.67  32 J 1 \nATOM 231 O OD2 . ASP J 1 32 ? 175.507 152.083 83.137 1.00 72.67  32 J 1 \nATOM 232 N N   . LYS J 1 33 ? 172.532 155.130 85.610 1.00 71.55  33 J 1 \nATOM 233 C CA  . LYS J 1 33 ? 172.715 155.655 86.958 1.00 71.55  33 J 1 \nATOM 234 C C   . LYS J 1 33 ? 171.496 155.382 87.824 1.00 71.55  33 J 1 \nATOM 235 O O   . LYS J 1 33 ? 171.628 155.006 88.994 1.00 71.55  33 J 1 \nATOM 236 C CB  . LYS J 1 33 ? 173.001 157.155 86.900 1.00 71.55  33 J 1 \nATOM 237 C CG  . LYS J 1 33 ? 
174.385 157.517 86.392 1.00 71.55  33 J 1 \nATOM 238 C CD  . LYS J 1 33 ? 174.482 159.007 86.104 1.00 71.55  33 J 1 \nATOM 239 C CE  . LYS J 1 33 ? 174.396 159.829 87.379 1.00 71.55  33 J 1 \nATOM 240 N NZ  . LYS J 1 33 ? 174.607 161.279 87.119 1.00 71.55  33 J 1 \nATOM 241 N N   . LEU J 1 34 ? 170.296 155.566 87.269 1.00 70.34  34 J 1 \nATOM 242 C CA  . LEU J 1 34 ? 169.095 155.291 88.045 1.00 70.34  34 J 1 \nATOM 243 C C   . LEU J 1 34 ? 168.944 153.807 88.358 1.00 70.34  34 J 1 \nATOM 244 O O   . LEU J 1 34 ? 168.263 153.458 89.327 1.00 70.34  34 J 1 \nATOM 245 C CB  . LEU J 1 34 ? 167.865 155.824 87.305 1.00 70.34  34 J 1 \nATOM 246 C CG  . LEU J 1 34 ? 166.493 155.819 87.987 1.00 70.34  34 J 1 \nATOM 247 C CD1 . LEU J 1 34 ? 165.645 156.923 87.403 1.00 70.34  34 J 1 \nATOM 248 C CD2 . LEU J 1 34 ? 165.773 154.496 87.808 1.00 70.34  34 J 1 \nATOM 249 N N   . ALA J 1 35 ? 169.587 152.930 87.582 1.00 66.69  35 J 1 \nATOM 250 C CA  . ALA J 1 35 ? 169.434 151.494 87.785 1.00 66.69  35 J 1 \nATOM 251 C C   . ALA J 1 35 ? 169.942 151.034 89.144 1.00 66.69  35 J 1 \nATOM 252 O O   . ALA J 1 35 ? 169.492 149.995 89.640 1.00 66.69  35 J 1 \nATOM 253 C CB  . ALA J 1 35 ? 170.153 150.726 86.678 1.00 66.69  35 J 1 \nATOM 254 N N   . ALA J 1 36 ? 170.865 151.775 89.759 1.00 67.09  36 J 1 \nATOM 255 C CA  . ALA J 1 36 ? 171.402 151.403 91.059 1.00 67.09  36 J 1 \nATOM 256 C C   . ALA J 1 36 ? 171.016 152.357 92.179 1.00 67.09  36 J 1 \nATOM 257 O O   . ALA J 1 36 ? 171.066 151.959 93.347 1.00 67.09  36 J 1 \nATOM 258 C CB  . ALA J 1 36 ? 172.933 151.307 90.996 1.00 67.09  36 J 1 \nATOM 259 N N   . LYS J 1 37 ? 170.632 153.590 91.860 1.00 66.94  37 J 1 \nATOM 260 C CA  . LYS J 1 37 ? 170.209 154.579 92.850 1.00 66.94  37 J 1 \nATOM 261 C C   . LYS J 1 37 ? 168.843 155.099 92.431 1.00 66.94  37 J 1 \nATOM 262 O O   . LYS J 1 37 ? 168.736 156.111 91.726 1.00 66.94  37 J 1 \nATOM 263 C CB  . LYS J 1 37 ? 171.229 155.709 92.979 1.00 66.94  37 J 1 \nATOM 264 C CG  . LYS J 1 37 ? 
172.582 155.242 93.477 1.00 66.94  37 J 1 \nATOM 265 C CD  . LYS J 1 37 ? 172.450 154.552 94.823 1.00 66.94  37 J 1 \nATOM 266 C CE  . LYS J 1 37 ? 173.808 154.194 95.400 1.00 66.94  37 J 1 \nATOM 267 N NZ  . LYS J 1 37 ? 173.680 153.478 96.700 1.00 66.94  37 J 1 \nATOM 268 N N   . PRO J 1 38 ? 167.768 154.426 92.850 1.00 68.68  38 J 1 \nATOM 269 C CA  . PRO J 1 38 ? 166.442 154.759 92.315 1.00 68.68  38 J 1 \nATOM 270 C C   . PRO J 1 38 ? 165.804 155.974 92.952 1.00 68.68  38 J 1 \nATOM 271 O O   . PRO J 1 38 ? 165.061 156.684 92.265 1.00 68.68  38 J 1 \nATOM 272 C CB  . PRO J 1 38 ? 165.630 153.501 92.616 1.00 68.68  38 J 1 \nATOM 273 C CG  . PRO J 1 38 ? 166.222 153.021 93.902 1.00 68.68  38 J 1 \nATOM 274 C CD  . PRO J 1 38 ? 167.701 153.332 93.834 1.00 68.68  38 J 1 \nATOM 275 N N   . SER J 1 39 ? 166.056 156.240 94.230 1.00 70.54  39 J 1 \nATOM 276 C CA  . SER J 1 39 ? 165.383 157.320 94.933 1.00 70.54  39 J 1 \nATOM 277 C C   . SER J 1 39 ? 166.204 158.596 94.992 1.00 70.54  39 J 1 \nATOM 278 O O   . SER J 1 39 ? 165.705 159.612 95.488 1.00 70.54  39 J 1 \nATOM 279 C CB  . SER J 1 39 ? 165.027 156.887 96.360 1.00 70.54  39 J 1 \nATOM 280 O OG  . SER J 1 39 ? 166.196 156.601 97.104 1.00 70.54  39 J 1 \nATOM 281 N N   . ASP J 1 40 ? 167.425 158.579 94.500 1.00 71.51  40 J 1 \nATOM 282 C CA  . ASP J 1 40 ? 168.310 159.702 94.730 1.00 71.51  40 J 1 \nATOM 283 C C   . ASP J 1 40 ? 167.868 160.912 93.909 1.00 71.51  40 J 1 \nATOM 284 O O   . ASP J 1 40 ? 167.348 160.766 92.800 1.00 71.51  40 J 1 \nATOM 285 C CB  . ASP J 1 40 ? 169.741 159.324 94.374 1.00 71.51  40 J 1 \nATOM 286 C CG  . ASP J 1 40 ? 170.519 158.829 95.569 1.00 71.51  40 J 1 \nATOM 287 O OD1 . ASP J 1 40 ? 170.038 159.024 96.701 1.00 71.51  40 J 1 \nATOM 288 O OD2 . ASP J 1 40 ? 171.606 158.245 95.379 1.00 71.51  40 J 1 \nATOM 289 N N   . PRO J 1 41 ? 168.040 162.115 94.445 1.00 72.15  41 J 1 \nATOM 290 C CA  . PRO J 1 41 ? 167.725 163.323 93.677 1.00 72.15  41 J 1 \nATOM 291 C C   . PRO J 1 41 ? 
168.792 163.594 92.630 1.00 72.15  41 J 1 \nATOM 292 O O   . PRO J 1 41 ? 169.806 162.902 92.531 1.00 72.15  41 J 1 \nATOM 293 C CB  . PRO J 1 41 ? 167.709 164.427 94.737 1.00 72.15  41 J 1 \nATOM 294 C CG  . PRO J 1 41 ? 167.558 163.713 96.031 1.00 72.15  41 J 1 \nATOM 295 C CD  . PRO J 1 41 ? 168.278 162.420 95.862 1.00 72.15  41 J 1 \nATOM 296 N N   . ALA J 1 42 ? 168.537 164.627 91.831 1.00 68.90  42 J 1 \nATOM 297 C CA  . ALA J 1 42 ? 169.449 165.183 90.837 1.00 68.90  42 J 1 \nATOM 298 C C   . ALA J 1 42 ? 169.710 164.237 89.674 1.00 68.90  42 J 1 \nATOM 299 O O   . ALA J 1 42 ? 170.388 164.632 88.718 1.00 68.90  42 J 1 \nATOM 300 C CB  . ALA J 1 42 ? 170.795 165.605 91.445 1.00 68.90  42 J 1 \nATOM 301 N N   . LEU J 1 43 ? 169.199 163.008 89.712 1.00 66.88  43 J 1 \nATOM 302 C CA  . LEU J 1 43 ? 169.214 162.168 88.523 1.00 66.88  43 J 1 \nATOM 303 C C   . LEU J 1 43 ? 167.793 161.722 88.216 1.00 66.88  43 J 1 \nATOM 304 O O   . LEU J 1 43 ? 167.436 161.561 87.048 1.00 66.88  43 J 1 \nATOM 305 C CB  . LEU J 1 43 ? 170.136 160.956 88.678 1.00 66.88  43 J 1 \nATOM 306 C CG  . LEU J 1 43 ? 169.723 159.783 89.565 1.00 66.88  43 J 1 \nATOM 307 C CD1 . LEU J 1 43 ? 170.578 158.575 89.251 1.00 66.88  43 J 1 \nATOM 308 C CD2 . LEU J 1 43 ? 169.875 160.147 91.011 1.00 66.88  43 J 1 \nATOM 309 N N   . LEU J 1 44 ? 166.976 161.526 89.255 1.00 62.81  44 J 1 \nATOM 310 C CA  . LEU J 1 44 ? 165.564 161.231 89.034 1.00 62.81  44 J 1 \nATOM 311 C C   . LEU J 1 44 ? 164.891 162.349 88.255 1.00 62.81  44 J 1 \nATOM 312 O O   . LEU J 1 44 ? 164.229 162.103 87.240 1.00 62.81  44 J 1 \nATOM 313 C CB  . LEU J 1 44 ? 164.850 161.025 90.366 1.00 62.81  44 J 1 \nATOM 314 C CG  . LEU J 1 44 ? 164.662 159.603 90.876 1.00 62.81  44 J 1 \nATOM 315 C CD1 . LEU J 1 44 ? 164.144 159.655 92.300 1.00 62.81  44 J 1 \nATOM 316 C CD2 . LEU J 1 44 ? 163.706 158.844 89.980 1.00 62.81  44 J 1 \nATOM 317 N N   . ALA J 1 45 ? 165.051 163.589 88.717 1.00 63.51  45 J 1 \nATOM 318 C CA  . ALA J 1 45 ? 
164.565 164.727 87.951 1.00 63.51  45 J 1 \nATOM 319 C C   . ALA J 1 45 ? 165.278 164.805 86.611 1.00 63.51  45 J 1 \nATOM 320 O O   . ALA J 1 45 ? 164.660 165.085 85.577 1.00 63.51  45 J 1 \nATOM 321 C CB  . ALA J 1 45 ? 164.759 166.015 88.748 1.00 63.51  45 J 1 \nATOM 322 N N   . ALA J 1 46 ? 166.587 164.547 86.611 1.00 63.88  46 J 1 \nATOM 323 C CA  . ALA J 1 46 ? 167.322 164.470 85.356 1.00 63.88  46 J 1 \nATOM 324 C C   . ALA J 1 46 ? 166.799 163.335 84.489 1.00 63.88  46 J 1 \nATOM 325 O O   . ALA J 1 46 ? 166.675 163.486 83.270 1.00 63.88  46 J 1 \nATOM 326 C CB  . ALA J 1 46 ? 168.815 164.297 85.627 1.00 63.88  46 J 1 \nATOM 327 N N   . TYR J 1 47 ? 166.483 162.190 85.100 1.00 60.60  47 J 1 \nATOM 328 C CA  . TYR J 1 47 ? 165.886 161.089 84.350 1.00 60.60  47 J 1 \nATOM 329 C C   . TYR J 1 47 ? 164.618 161.528 83.639 1.00 60.60  47 J 1 \nATOM 330 O O   . TYR J 1 47 ? 164.476 161.336 82.427 1.00 60.60  47 J 1 \nATOM 331 C CB  . TYR J 1 47 ? 165.579 159.921 85.282 1.00 60.60  47 J 1 \nATOM 332 C CG  . TYR J 1 47 ? 164.985 158.730 84.578 1.00 60.60  47 J 1 \nATOM 333 C CD1 . TYR J 1 47 ? 165.771 157.885 83.811 1.00 60.60  47 J 1 \nATOM 334 C CD2 . TYR J 1 47 ? 163.629 158.457 84.675 1.00 60.60  47 J 1 \nATOM 335 C CE1 . TYR J 1 47 ? 165.223 156.798 83.168 1.00 60.60  47 J 1 \nATOM 336 C CE2 . TYR J 1 47 ? 163.073 157.376 84.037 1.00 60.60  47 J 1 \nATOM 337 C CZ  . TYR J 1 47 ? 163.872 156.550 83.285 1.00 60.60  47 J 1 \nATOM 338 O OH  . TYR J 1 47 ? 163.317 155.471 82.646 1.00 60.60  47 J 1 \nATOM 339 N N   . GLN J 1 48 ? 163.681 162.118 84.380 1.00 61.22  48 J 1 \nATOM 340 C CA  . GLN J 1 48 ? 162.418 162.506 83.769 1.00 61.22  48 J 1 \nATOM 341 C C   . GLN J 1 48 ? 162.618 163.572 82.703 1.00 61.22  48 J 1 \nATOM 342 O O   . GLN J 1 48 ? 162.021 163.485 81.623 1.00 61.22  48 J 1 \nATOM 343 C CB  . GLN J 1 48 ? 161.441 163.000 84.832 1.00 61.22  48 J 1 \nATOM 344 C CG  . GLN J 1 48 ? 160.073 163.333 84.276 1.00 61.22  48 J 1 \nATOM 345 C CD  . GLN J 1 48 ? 
159.096 163.765 85.344 1.00 61.22  48 J 1 \nATOM 346 O OE1 . GLN J 1 48 ? 159.445 163.860 86.519 1.00 61.22  48 J 1 \nATOM 347 N NE2 . GLN J 1 48 ? 157.858 164.028 84.941 1.00 61.22  48 J 1 \nATOM 348 N N   . SER J 1 49 ? 163.461 164.571 82.975 1.00 66.01  49 J 1 \nATOM 349 C CA  . SER J 1 49 ? 163.666 165.643 82.010 1.00 66.01  49 J 1 \nATOM 350 C C   . SER J 1 49 ? 164.298 165.117 80.729 1.00 66.01  49 J 1 \nATOM 351 O O   . SER J 1 49 ? 163.843 165.437 79.628 1.00 66.01  49 J 1 \nATOM 352 C CB  . SER J 1 49 ? 164.529 166.744 82.623 1.00 66.01  49 J 1 \nATOM 353 O OG  . SER J 1 49 ? 164.839 167.732 81.658 1.00 66.01  49 J 1 \nATOM 354 N N   . LYS J 1 50 ? 165.348 164.301 80.851 1.00 62.23  50 J 1 \nATOM 355 C CA  . LYS J 1 50 ? 165.992 163.755 79.662 1.00 62.23  50 J 1 \nATOM 356 C C   . LYS J 1 50 ? 165.074 162.806 78.908 1.00 62.23  50 J 1 \nATOM 357 O O   . LYS J 1 50 ? 165.080 162.796 77.674 1.00 62.23  50 J 1 \nATOM 358 C CB  . LYS J 1 50 ? 167.292 163.045 80.036 1.00 62.23  50 J 1 \nATOM 359 C CG  . LYS J 1 50 ? 168.320 163.948 80.688 1.00 62.23  50 J 1 \nATOM 360 C CD  . LYS J 1 50 ? 168.804 165.014 79.725 1.00 62.23  50 J 1 \nATOM 361 C CE  . LYS J 1 50 ? 169.815 165.927 80.391 1.00 62.23  50 J 1 \nATOM 362 N NZ  . LYS J 1 50 ? 171.093 165.218 80.672 1.00 62.23  50 J 1 \nATOM 363 N N   . LEU J 1 51 ? 164.282 162.004 79.620 1.00 55.13  51 J 1 \nATOM 364 C CA  . LEU J 1 51 ? 163.386 161.078 78.942 1.00 55.13  51 J 1 \nATOM 365 C C   . LEU J 1 51 ? 162.306 161.830 78.175 1.00 55.13  51 J 1 \nATOM 366 O O   . LEU J 1 51 ? 161.984 161.482 77.034 1.00 55.13  51 J 1 \nATOM 367 C CB  . LEU J 1 51 ? 162.773 160.118 79.955 1.00 55.13  51 J 1 \nATOM 368 C CG  . LEU J 1 51 ? 161.865 159.044 79.373 1.00 55.13  51 J 1 \nATOM 369 C CD1 . LEU J 1 51 ? 162.675 158.158 78.450 1.00 55.13  51 J 1 \nATOM 370 C CD2 . LEU J 1 51 ? 161.246 158.227 80.487 1.00 55.13  51 J 1 \nATOM 371 N N   . SER J 1 52 ? 161.739 162.876 78.783 1.00 58.66  52 J 1 \nATOM 372 C CA  . SER J 1 52 ? 
160.769 163.700 78.069 1.00 58.66  52 J 1 \nATOM 373 C C   . SER J 1 52 ? 161.418 164.423 76.896 1.00 58.66  52 J 1 \nATOM 374 O O   . SER J 1 52 ? 160.815 164.553 75.825 1.00 58.66  52 J 1 \nATOM 375 C CB  . SER J 1 52 ? 160.119 164.699 79.023 1.00 58.66  52 J 1 \nATOM 376 O OG  . SER J 1 52 ? 159.266 164.041 79.940 1.00 58.66  52 J 1 \nATOM 377 N N   . GLU J 1 53 ? 162.646 164.910 77.081 1.00 65.81  53 J 1 \nATOM 378 C CA  . GLU J 1 53 ? 163.360 165.549 75.985 1.00 65.81  53 J 1 \nATOM 379 C C   . GLU J 1 53 ? 163.519 164.593 74.816 1.00 65.81  53 J 1 \nATOM 380 O O   . GLU J 1 53 ? 163.285 164.966 73.663 1.00 65.81  53 J 1 \nATOM 381 C CB  . GLU J 1 53 ? 164.729 166.027 76.468 1.00 65.81  53 J 1 \nATOM 382 C CG  . GLU J 1 53 ? 164.823 167.501 76.834 1.00 65.81  53 J 1 \nATOM 383 C CD  . GLU J 1 53 ? 164.613 168.437 75.659 1.00 65.81  53 J 1 \nATOM 384 O OE1 . GLU J 1 53 ? 164.395 167.965 74.524 1.00 65.81  53 J 1 \nATOM 385 O OE2 . GLU J 1 53 ? 164.659 169.667 75.875 1.00 65.81  53 J 1 \nATOM 386 N N   . TYR J 1 54 ? 163.901 163.351 75.104 1.00 59.32  54 J 1 \nATOM 387 C CA  . TYR J 1 54 ? 164.070 162.346 74.065 1.00 59.32  54 J 1 \nATOM 388 C C   . TYR J 1 54 ? 162.742 162.013 73.396 1.00 59.32  54 J 1 \nATOM 389 O O   . TYR J 1 54 ? 162.683 161.828 72.175 1.00 59.32  54 J 1 \nATOM 390 C CB  . TYR J 1 54 ? 164.710 161.104 74.676 1.00 59.32  54 J 1 \nATOM 391 C CG  . TYR J 1 54 ? 164.986 159.991 73.707 1.00 59.32  54 J 1 \nATOM 392 C CD1 . TYR J 1 54 ? 166.049 160.070 72.828 1.00 59.32  54 J 1 \nATOM 393 C CD2 . TYR J 1 54 ? 164.208 158.845 73.697 1.00 59.32  54 J 1 \nATOM 394 C CE1 . TYR J 1 54 ? 166.316 159.055 71.945 1.00 59.32  54 J 1 \nATOM 395 C CE2 . TYR J 1 54 ? 164.470 157.819 72.819 1.00 59.32  54 J 1 \nATOM 396 C CZ  . TYR J 1 54 ? 165.527 157.929 71.944 1.00 59.32  54 J 1 \nATOM 397 O OH  . TYR J 1 54 ? 165.800 156.912 71.061 1.00 59.32  54 J 1 \nATOM 398 N N   . ASN J 1 55 ? 161.668 161.931 74.183 1.00 55.92  55 J 1 \nATOM 399 C CA  . ASN J 1 55 ? 
160.344 161.659 73.629 1.00 55.92  55 J 1 \nATOM 400 C C   . ASN J 1 55 ? 159.925 162.748 72.647 1.00 55.92  55 J 1 \nATOM 401 O O   . ASN J 1 55 ? 159.524 162.458 71.511 1.00 55.92  55 J 1 \nATOM 402 C CB  . ASN J 1 55 ? 159.340 161.529 74.777 1.00 55.92  55 J 1 \nATOM 403 C CG  . ASN J 1 55 ? 157.922 161.278 74.306 1.00 55.92  55 J 1 \nATOM 404 O OD1 . ASN J 1 55 ? 157.659 161.123 73.117 1.00 55.92  55 J 1 \nATOM 405 N ND2 . ASN J 1 55 ? 156.998 161.213 75.253 1.00 55.92  55 J 1 \nATOM 406 N N   . LEU J 1 56 ? 160.012 164.010 73.071 1.00 57.85  56 J 1 \nATOM 407 C CA  . LEU J 1 56 ? 159.659 165.115 72.183 1.00 57.85  56 J 1 \nATOM 408 C C   . LEU J 1 56 ? 160.587 165.185 70.980 1.00 57.85  56 J 1 \nATOM 409 O O   . LEU J 1 56 ? 160.148 165.503 69.871 1.00 57.85  56 J 1 \nATOM 410 C CB  . LEU J 1 56 ? 159.665 166.437 72.945 1.00 57.85  56 J 1 \nATOM 411 C CG  . LEU J 1 56 ? 158.428 166.781 73.772 1.00 57.85  56 J 1 \nATOM 412 C CD1 . LEU J 1 56 ? 158.257 165.920 74.998 1.00 57.85  56 J 1 \nATOM 413 C CD2 . LEU J 1 56 ? 158.539 168.224 74.179 1.00 57.85  56 J 1 \nATOM 414 N N   . TYR J 1 57 ? 161.872 164.895 71.176 1.00 60.05  57 J 1 \nATOM 415 C CA  . TYR J 1 57 ? 162.800 164.844 70.054 1.00 60.05  57 J 1 \nATOM 416 C C   . TYR J 1 57 ? 162.362 163.824 69.013 1.00 60.05  57 J 1 \nATOM 417 O O   . TYR J 1 57 ? 162.299 164.134 67.817 1.00 60.05  57 J 1 \nATOM 418 C CB  . TYR J 1 57 ? 164.203 164.534 70.578 1.00 60.05  57 J 1 \nATOM 419 C CG  . TYR J 1 57 ? 165.239 164.289 69.513 1.00 60.05  57 J 1 \nATOM 420 C CD1 . TYR J 1 57 ? 165.328 163.058 68.881 1.00 60.05  57 J 1 \nATOM 421 C CD2 . TYR J 1 57 ? 166.114 165.288 69.127 1.00 60.05  57 J 1 \nATOM 422 C CE1 . TYR J 1 57 ? 166.257 162.825 67.909 1.00 60.05  57 J 1 \nATOM 423 C CE2 . TYR J 1 57 ? 167.052 165.063 68.149 1.00 60.05  57 J 1 \nATOM 424 C CZ  . TYR J 1 57 ? 167.118 163.828 67.545 1.00 60.05  57 J 1 \nATOM 425 O OH  . TYR J 1 57 ? 168.044 163.579 66.567 1.00 60.05  57 J 1 \nATOM 426 N N   . ARG J 1 58 ? 
162.069 162.598 69.446 1.00 58.38  58 J 1 \nATOM 427 C CA  . ARG J 1 58 ? 161.680 161.562 68.498 1.00 58.38  58 J 1 \nATOM 428 C C   . ARG J 1 58 ? 160.373 161.916 67.804 1.00 58.38  58 J 1 \nATOM 429 O O   . ARG J 1 58 ? 160.238 161.726 66.587 1.00 58.38  58 J 1 \nATOM 430 C CB  . ARG J 1 58 ? 161.566 160.217 69.208 1.00 58.38  58 J 1 \nATOM 431 C CG  . ARG J 1 58 ? 162.900 159.553 69.491 1.00 58.38  58 J 1 \nATOM 432 C CD  . ARG J 1 58 ? 163.871 159.707 68.335 1.00 58.38  58 J 1 \nATOM 433 N NE  . ARG J 1 58 ? 165.241 159.437 68.753 1.00 58.38  58 J 1 \nATOM 434 C CZ  . ARG J 1 58 ? 166.293 159.472 67.948 1.00 58.38  58 J 1 \nATOM 435 N NH1 . ARG J 1 58 ? 166.171 159.760 66.663 1.00 58.38  58 J 1 \nATOM 436 N NH2 . ARG J 1 58 ? 167.498 159.214 68.445 1.00 58.38  58 J 1 \nATOM 437 N N   . ASN J 1 59 ? 159.399 162.432 68.558 1.00 58.16  59 J 1 \nATOM 438 C CA  . ASN J 1 59 ? 158.133 162.817 67.945 1.00 58.16  59 J 1 \nATOM 439 C C   . ASN J 1 59 ? 158.327 163.928 66.924 1.00 58.16  59 J 1 \nATOM 440 O O   . ASN J 1 59 ? 157.735 163.893 65.839 1.00 58.16  59 J 1 \nATOM 441 C CB  . ASN J 1 59 ? 157.133 163.240 69.017 1.00 58.16  59 J 1 \nATOM 442 C CG  . ASN J 1 59 ? 156.401 162.065 69.619 1.00 58.16  59 J 1 \nATOM 443 O OD1 . ASN J 1 59 ? 156.905 161.403 70.521 1.00 58.16  59 J 1 \nATOM 444 N ND2 . ASN J 1 59 ? 155.203 161.796 69.117 1.00 58.16  59 J 1 \nATOM 445 N N   . ALA J 1 60 ? 159.154 164.925 67.250 1.00 62.06  60 J 1 \nATOM 446 C CA  . ALA J 1 60 ? 159.407 166.012 66.314 1.00 62.06  60 J 1 \nATOM 447 C C   . ALA J 1 60 ? 160.081 165.504 65.052 1.00 62.06  60 J 1 \nATOM 448 O O   . ALA J 1 60 ? 159.709 165.896 63.940 1.00 62.06  60 J 1 \nATOM 449 C CB  . ALA J 1 60 ? 160.257 167.092 66.980 1.00 62.06  60 J 1 \nATOM 450 N N   . GLN J 1 61 ? 161.067 164.621 65.203 1.00 65.39  61 J 1 \nATOM 451 C CA  . GLN J 1 61 ? 161.748 164.072 64.037 1.00 65.39  61 J 1 \nATOM 452 C C   . GLN J 1 61 ? 160.774 163.310 63.148 1.00 65.39  61 J 1 \nATOM 453 O O   . GLN J 1 61 ? 
160.735 163.512 61.925 1.00 65.39  61 J 1 \nATOM 454 C CB  . GLN J 1 61 ? 162.895 163.171 64.494 1.00 65.39  61 J 1 \nATOM 455 C CG  . GLN J 1 61 ? 164.044 163.067 63.519 1.00 65.39  61 J 1 \nATOM 456 C CD  . GLN J 1 61 ? 165.192 162.262 64.080 1.00 65.39  61 J 1 \nATOM 457 O OE1 . GLN J 1 61 ? 166.240 162.807 64.420 1.00 65.39  61 J 1 \nATOM 458 N NE2 . GLN J 1 61 ? 164.998 160.957 64.189 1.00 65.39  61 J 1 \nATOM 459 N N   . SER J 1 62 ? 159.959 162.442 63.753 1.00 64.39  62 J 1 \nATOM 460 C CA  . SER J 1 62 ? 159.025 161.644 62.969 1.00 64.39  62 J 1 \nATOM 461 C C   . SER J 1 62 ? 157.998 162.522 62.267 1.00 64.39  62 J 1 \nATOM 462 O O   . SER J 1 62 ? 157.716 162.331 61.078 1.00 64.39  62 J 1 \nATOM 463 C CB  . SER J 1 62 ? 158.333 160.619 63.865 1.00 64.39  62 J 1 \nATOM 464 O OG  . SER J 1 62 ? 157.410 159.843 63.125 1.00 64.39  62 J 1 \nATOM 465 N N   . ASN J 1 63 ? 157.438 163.504 62.976 1.00 65.16  63 J 1 \nATOM 466 C CA  . ASN J 1 63 ? 156.437 164.361 62.357 1.00 65.16  63 J 1 \nATOM 467 C C   . ASN J 1 63 ? 157.033 165.219 61.252 1.00 65.16  63 J 1 \nATOM 468 O O   . ASN J 1 63 ? 156.389 165.421 60.216 1.00 65.16  63 J 1 \nATOM 469 C CB  . ASN J 1 63 ? 155.767 165.233 63.413 1.00 65.16  63 J 1 \nATOM 470 C CG  . ASN J 1 63 ? 154.853 164.439 64.316 1.00 65.16  63 J 1 \nATOM 471 O OD1 . ASN J 1 63 ? 154.525 163.290 64.026 1.00 65.16  63 J 1 \nATOM 472 N ND2 . ASN J 1 63 ? 154.434 165.045 65.416 1.00 65.16  63 J 1 \nATOM 473 N N   . THR J 1 64 ? 158.252 165.729 61.444 1.00 66.60  64 J 1 \nATOM 474 C CA  . THR J 1 64 ? 158.875 166.543 60.408 1.00 66.60  64 J 1 \nATOM 475 C C   . THR J 1 64 ? 159.147 165.725 59.153 1.00 66.60  64 J 1 \nATOM 476 O O   . THR J 1 64 ? 158.846 166.169 58.035 1.00 66.60  64 J 1 \nATOM 477 C CB  . THR J 1 64 ? 160.169 167.158 60.935 1.00 66.60  64 J 1 \nATOM 478 O OG1 . THR J 1 64 ? 159.877 167.977 62.072 1.00 66.60  64 J 1 \nATOM 479 C CG2 . THR J 1 64 ? 160.819 168.011 59.865 1.00 66.60  64 J 1 \nATOM 480 N N   . VAL J 1 65 ? 
159.707 164.523 59.310 1.00 64.00  65 J 1 \nATOM 481 C CA  . VAL J 1 65 ? 159.978 163.718 58.124 1.00 64.00  65 J 1 \nATOM 482 C C   . VAL J 1 65 ? 158.671 163.316 57.452 1.00 64.00  65 J 1 \nATOM 483 O O   . VAL J 1 65 ? 158.580 163.285 56.220 1.00 64.00  65 J 1 \nATOM 484 C CB  . VAL J 1 65 ? 160.858 162.499 58.464 1.00 64.00  65 J 1 \nATOM 485 C CG1 . VAL J 1 65 ? 162.203 162.957 58.999 1.00 64.00  65 J 1 \nATOM 486 C CG2 . VAL J 1 65 ? 160.176 161.571 59.442 1.00 64.00  65 J 1 \nATOM 487 N N   . LYS J 1 66 ? 157.626 163.047 58.241 1.00 65.12  66 J 1 \nATOM 488 C CA  . LYS J 1 66 ? 156.341 162.691 57.649 1.00 65.12  66 J 1 \nATOM 489 C C   . LYS J 1 66 ? 155.745 163.847 56.855 1.00 65.12  66 J 1 \nATOM 490 O O   . LYS J 1 66 ? 155.240 163.645 55.745 1.00 65.12  66 J 1 \nATOM 491 C CB  . LYS J 1 66 ? 155.366 162.235 58.733 1.00 65.12  66 J 1 \nATOM 492 C CG  . LYS J 1 66 ? 153.992 161.855 58.202 1.00 65.12  66 J 1 \nATOM 493 C CD  . LYS J 1 66 ? 154.088 160.891 57.032 1.00 65.12  66 J 1 \nATOM 494 C CE  . LYS J 1 66 ? 152.711 160.542 56.496 1.00 65.12  66 J 1 \nATOM 495 N NZ  . LYS J 1 66 ? 151.754 160.214 57.587 1.00 65.12  66 J 1 \nATOM 496 N N   . VAL J 1 67 ? 155.779 165.064 57.402 1.00 65.92  67 J 1 \nATOM 497 C CA  . VAL J 1 67 ? 155.163 166.185 56.696 1.00 65.92  67 J 1 \nATOM 498 C C   . VAL J 1 67 ? 155.958 166.528 55.442 1.00 65.92  67 J 1 \nATOM 499 O O   . VAL J 1 67 ? 155.381 166.863 54.397 1.00 65.92  67 J 1 \nATOM 500 C CB  . VAL J 1 67 ? 154.993 167.401 57.629 1.00 65.92  67 J 1 \nATOM 501 C CG1 . VAL J 1 67 ? 156.328 167.937 58.097 1.00 65.92  67 J 1 \nATOM 502 C CG2 . VAL J 1 67 ? 154.200 168.492 56.929 1.00 65.92  67 J 1 \nATOM 503 N N   . PHE J 1 68 ? 157.288 166.435 55.509 1.00 66.56  68 J 1 \nATOM 504 C CA  . PHE J 1 68 ? 158.076 166.682 54.308 1.00 66.56  68 J 1 \nATOM 505 C C   . PHE J 1 68 ? 157.826 165.606 53.260 1.00 66.56  68 J 1 \nATOM 506 O O   . PHE J 1 68 ? 157.772 165.899 52.059 1.00 66.56  68 J 1 \nATOM 507 C CB  . PHE J 1 68 ? 
159.558 166.785 54.657 1.00 66.56  68 J 1 \nATOM 508 C CG  . PHE J 1 68 ? 159.991 168.177 55.012 1.00 66.56  68 J 1 \nATOM 509 C CD1 . PHE J 1 68 ? 160.099 168.568 56.333 1.00 66.56  68 J 1 \nATOM 510 C CD2 . PHE J 1 68 ? 160.268 169.101 54.022 1.00 66.56  68 J 1 \nATOM 511 C CE1 . PHE J 1 68 ? 160.490 169.850 56.660 1.00 66.56  68 J 1 \nATOM 512 C CE2 . PHE J 1 68 ? 160.658 170.384 54.343 1.00 66.56  68 J 1 \nATOM 513 C CZ  . PHE J 1 68 ? 160.769 170.758 55.664 1.00 66.56  68 J 1 \nATOM 514 N N   . LYS J 1 69 ? 157.646 164.356 53.694 1.00 70.04  69 J 1 \nATOM 515 C CA  . LYS J 1 69 ? 157.283 163.302 52.755 1.00 70.04  69 J 1 \nATOM 516 C C   . LYS J 1 69 ? 155.929 163.584 52.123 1.00 70.04  69 J 1 \nATOM 517 O O   . LYS J 1 69 ? 155.731 163.326 50.934 1.00 70.04  69 J 1 \nATOM 518 C CB  . LYS J 1 69 ? 157.291 161.944 53.465 1.00 70.04  69 J 1 \nATOM 519 C CG  . LYS J 1 69 ? 157.067 160.718 52.570 1.00 70.04  69 J 1 \nATOM 520 C CD  . LYS J 1 69 ? 155.593 160.436 52.289 1.00 70.04  69 J 1 \nATOM 521 C CE  . LYS J 1 69 ? 155.424 159.353 51.239 1.00 70.04  69 J 1 \nATOM 522 N NZ  . LYS J 1 69 ? 153.999 158.953 51.085 1.00 70.04  69 J 1 \nATOM 523 N N   . ASP J 1 70 ? 154.979 164.093 52.908 1.00 70.15  70 J 1 \nATOM 524 C CA  . ASP J 1 70 ? 153.667 164.418 52.356 1.00 70.15  70 J 1 \nATOM 525 C C   . ASP J 1 70 ? 153.770 165.503 51.293 1.00 70.15  70 J 1 \nATOM 526 O O   . ASP J 1 70 ? 153.172 165.386 50.216 1.00 70.15  70 J 1 \nATOM 527 C CB  . ASP J 1 70 ? 152.719 164.850 53.472 1.00 70.15  70 J 1 \nATOM 528 C CG  . ASP J 1 70 ? 152.353 163.710 54.396 1.00 70.15  70 J 1 \nATOM 529 O OD1 . ASP J 1 70 ? 152.337 162.552 53.930 1.00 70.15  70 J 1 \nATOM 530 O OD2 . ASP J 1 70 ? 152.082 163.970 55.587 1.00 70.15  70 J 1 \nATOM 531 N N   . ILE J 1 71 ? 154.538 166.558 51.574 1.00 64.31  71 J 1 \nATOM 532 C CA  . ILE J 1 71 ? 154.721 167.619 50.588 1.00 64.31  71 J 1 \nATOM 533 C C   . ILE J 1 71 ? 155.375 167.070 49.326 1.00 64.31  71 J 1 \nATOM 534 O O   . ILE J 1 71 ? 
154.941 167.362 48.203 1.00 64.31  71 J 1 \nATOM 535 C CB  . ILE J 1 71 ? 155.545 168.772 51.188 1.00 64.31  71 J 1 \nATOM 536 C CG1 . ILE J 1 71 ? 154.860 169.327 52.435 1.00 64.31  71 J 1 \nATOM 537 C CG2 . ILE J 1 71 ? 155.751 169.866 50.159 1.00 64.31  71 J 1 \nATOM 538 C CD1 . ILE J 1 71 ? 155.778 170.127 53.325 1.00 64.31  71 J 1 \nATOM 539 N N   . ASP J 1 72 ? 156.423 166.261 49.492 1.00 68.85  72 J 1 \nATOM 540 C CA  . ASP J 1 72 ? 157.144 165.727 48.343 1.00 68.85  72 J 1 \nATOM 541 C C   . ASP J 1 72 ? 156.266 164.795 47.517 1.00 68.85  72 J 1 \nATOM 542 O O   . ASP J 1 72 ? 156.316 164.814 46.282 1.00 68.85  72 J 1 \nATOM 543 C CB  . ASP J 1 72 ? 158.398 165.005 48.825 1.00 68.85  72 J 1 \nATOM 544 C CG  . ASP J 1 72 ? 159.551 165.947 49.062 1.00 68.85  72 J 1 \nATOM 545 O OD1 . ASP J 1 72 ? 160.691 165.462 49.183 1.00 68.85  72 J 1 \nATOM 546 O OD2 . ASP J 1 72 ? 159.318 167.171 49.125 1.00 68.85  72 J 1 \nATOM 547 N N   . ALA J 1 73 ? 155.464 163.963 48.181 1.00 65.97  73 J 1 \nATOM 548 C CA  . ALA J 1 73 ? 154.553 163.081 47.466 1.00 65.97  73 J 1 \nATOM 549 C C   . ALA J 1 73 ? 153.501 163.878 46.715 1.00 65.97  73 J 1 \nATOM 550 O O   . ALA J 1 73 ? 153.128 163.520 45.593 1.00 65.97  73 J 1 \nATOM 551 C CB  . ALA J 1 73 ? 153.894 162.103 48.437 1.00 65.97  73 J 1 \nATOM 552 N N   . ALA J 1 74 ? 153.004 164.960 47.319 1.00 64.99  74 J 1 \nATOM 553 C CA  . ALA J 1 74 ? 152.063 165.819 46.610 1.00 64.99  74 J 1 \nATOM 554 C C   . ALA J 1 74 ? 152.700 166.405 45.358 1.00 64.99  74 J 1 \nATOM 555 O O   . ALA J 1 74 ? 152.080 166.428 44.288 1.00 64.99  74 J 1 \nATOM 556 C CB  . ALA J 1 74 ? 151.567 166.931 47.533 1.00 64.99  74 J 1 \nATOM 557 N N   . ILE J 1 75 ? 153.947 166.864 45.469 1.00 67.26  75 J 1 \nATOM 558 C CA  . ILE J 1 75 ? 154.634 167.425 44.307 1.00 67.26  75 J 1 \nATOM 559 C C   . ILE J 1 75 ? 154.797 166.367 43.222 1.00 67.26  75 J 1 \nATOM 560 O O   . ILE J 1 75 ? 154.522 166.615 42.042 1.00 67.26  75 J 1 \nATOM 561 C CB  . ILE J 1 75 ? 
155.993 168.017 44.717 1.00 67.26  75 J 1 \nATOM 562 C CG1 . ILE J 1 75 ? 155.807 169.113 45.765 1.00 67.26  75 J 1 \nATOM 563 C CG2 . ILE J 1 75 ? 156.721 168.564 43.502 1.00 67.26  75 J 1 \nATOM 564 C CD1 . ILE J 1 75 ? 154.983 170.274 45.286 1.00 67.26  75 J 1 \nATOM 565 N N   . ILE J 1 76 ? 155.244 165.170 43.607 1.00 71.16  76 J 1 \nATOM 566 C CA  . ILE J 1 76 ? 155.503 164.119 42.627 1.00 71.16  76 J 1 \nATOM 567 C C   . ILE J 1 76 ? 154.216 163.694 41.935 1.00 71.16  76 J 1 \nATOM 568 O O   . ILE J 1 76 ? 154.164 163.579 40.705 1.00 71.16  76 J 1 \nATOM 569 C CB  . ILE J 1 76 ? 156.205 162.925 43.299 1.00 71.16  76 J 1 \nATOM 570 C CG1 . ILE J 1 76 ? 157.602 163.325 43.761 1.00 71.16  76 J 1 \nATOM 571 C CG2 . ILE J 1 76 ? 156.302 161.755 42.342 1.00 71.16  76 J 1 \nATOM 572 C CD1 . ILE J 1 76 ? 158.489 163.764 42.631 1.00 71.16  76 J 1 \nATOM 573 N N   . GLN J 1 77 ? 153.158 163.457 42.708 1.00 74.01  77 J 1 \nATOM 574 C CA  . GLN J 1 77 ? 151.870 163.093 42.139 1.00 74.01  77 J 1 \nATOM 575 C C   . GLN J 1 77 ? 151.276 164.203 41.291 1.00 74.01  77 J 1 \nATOM 576 O O   . GLN J 1 77 ? 150.522 163.917 40.355 1.00 74.01  77 J 1 \nATOM 577 C CB  . GLN J 1 77 ? 150.903 162.718 43.266 1.00 74.01  77 J 1 \nATOM 578 C CG  . GLN J 1 77 ? 149.608 162.063 42.818 1.00 74.01  77 J 1 \nATOM 579 C CD  . GLN J 1 77 ? 148.547 163.075 42.436 1.00 74.01  77 J 1 \nATOM 580 O OE1 . GLN J 1 77 ? 148.119 163.881 43.261 1.00 74.01  77 J 1 \nATOM 581 N NE2 . GLN J 1 77 ? 148.126 163.046 41.178 1.00 74.01  77 J 1 \nATOM 582 N N   . ASN J 1 78 ? 151.610 165.453 41.583 1.00 75.47  78 J 1 \nATOM 583 C CA  . ASN J 1 78 ? 151.007 166.584 40.903 1.00 75.47  78 J 1 \nATOM 584 C C   . ASN J 1 78 ? 151.656 166.793 39.532 1.00 75.47  78 J 1 \nATOM 585 O O   . ASN J 1 78 ? 151.100 167.503 38.692 1.00 75.47  78 J 1 \nATOM 586 C CB  . ASN J 1 78 ? 151.109 167.797 41.862 1.00 75.47  78 J 1 \nATOM 587 C CG  . ASN J 1 78 ? 150.672 169.138 41.268 1.00 75.47  78 J 1 \nATOM 588 O OD1 . ASN J 1 78 ? 
150.393 169.290 40.093 1.00 75.47  78 J 1 \nATOM 589 N ND2 . ASN J 1 78 ? 150.555 170.120 42.149 1.00 75.47  78 J 1 \nATOM 590 N N   . PHE J 1 79 ? 152.755 166.084 39.244 1.00 76.77  79 J 1 \nATOM 591 C CA  . PHE J 1 79 ? 153.341 166.125 37.905 1.00 76.77  79 J 1 \nATOM 592 C C   . PHE J 1 79 ? 152.308 165.775 36.843 1.00 76.77  79 J 1 \nATOM 593 O O   . PHE J 1 79 ? 152.188 166.465 35.824 1.00 76.77  79 J 1 \nATOM 594 C CB  . PHE J 1 79 ? 154.513 165.146 37.794 1.00 76.77  79 J 1 \nATOM 595 C CG  . PHE J 1 79 ? 155.770 165.599 38.471 1.00 76.77  79 J 1 \nATOM 596 C CD1 . PHE J 1 79 ? 155.885 166.866 39.000 1.00 76.77  79 J 1 \nATOM 597 C CD2 . PHE J 1 79 ? 156.855 164.744 38.553 1.00 76.77  79 J 1 \nATOM 598 C CE1 . PHE J 1 79 ? 157.054 167.261 39.614 1.00 76.77  79 J 1 \nATOM 599 C CE2 . PHE J 1 79 ? 158.021 165.138 39.162 1.00 76.77  79 J 1 \nATOM 600 C CZ  . PHE J 1 79 ? 158.121 166.398 39.692 1.00 76.77  79 J 1 \nATOM 601 N N   . ARG J 1 80 ? 151.557 164.702 37.066 1.00 84.01  80 J 1 \nATOM 602 C CA  . ARG J 1 80 ? 150.552 164.246 36.118 1.00 84.01  80 J 1 \nATOM 603 C C   . ARG J 1 80 ? 149.236 164.973 36.361 1.00 84.01  80 J 1 \nATOM 604 O O   . ARG J 1 80 ? 148.856 165.220 37.506 1.00 84.01  80 J 1 \nATOM 605 C CB  . ARG J 1 80 ? 150.365 162.730 36.232 1.00 84.01  80 J 1 \nATOM 606 C CG  . ARG J 1 80 ? 149.526 162.108 35.127 1.00 84.01  80 J 1 \nATOM 607 C CD  . ARG J 1 80 ? 148.094 161.873 35.581 1.00 84.01  80 J 1 \nATOM 608 N NE  . ARG J 1 80 ? 148.029 160.982 36.733 1.00 84.01  80 J 1 \nATOM 609 C CZ  . ARG J 1 80 ? 146.964 160.838 37.510 1.00 84.01  80 J 1 \nATOM 610 N NH1 . ARG J 1 80 ? 145.848 161.512 37.286 1.00 84.01  80 J 1 \nATOM 611 N NH2 . ARG J 1 80 ? 147.022 159.999 38.541 1.00 84.01  80 J 1 \nATOM 612 O OXT . ARG J 1 80 ? 148.527 165.332 35.421 1.00 84.01  80 J 1 \n#\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/pdb_seqres_2022_09_28__subsampled_1000.fasta",
    "content": ">4ffz_X mol:protein length:111  Envelope protein E\nMASMTLKGMSYVMCTGSFKLEKEVAETQHGTVLVQVKYEGTDAPCKIPFSSQDEKGVTQNGRLITANPIVTDKEKPVNIEAEPPFGESYIVVGAGEKALKLSWFKKGSSIG\n>2y3e_A mol:protein length:134  STREPTAVIDIN\nMAEAGITGTWYNQLGSTFIVTAGADGALTGTYESAVGNAEGDYVLTGRYDSAPATDGSGTALGWTVAWKNNYRNAHSATTWSGQYVGGAEARINTQWLLTSGTTEANAWKSTLVGHDTFTKVKPSAASHHHHHH\n>7rye_J mol:protein length:80  Protein PrgI\nMATPWSGYLDDVSAKFDTGVDNLQTQVTEALDKLAAKPSDPALLAAYQSKLSEYNLYRNAQSNTVKVFKDIDAAIIQNFR\n>5eq0_B mol:protein length:6  unc3866\nXFALXX\n>5thk_C mol:protein length:266  Putative dehydrogenase\nMAHHHHHHMVATHTLADKVVLIAGGAKNLGGLIARDLAGHGAKAVAIHYNSAASQAQAEETAAAVRAAGAEAATFQADLTTAAAVEKLFDDAKQRFGKIDIAINTVGKVLKKPFTEISEAEYDEMFAVNSKSAFFFIKEAGRHLEDHGKLVTLVTSLLGAFTPFYAAYEGSKAPVEHFTRAASKEYGARGISVTAVGPGPMDTPFFYPAEGADAVAYHKTAAALSPFSKTGLTDIEDVVPFIRHLVTDGWWITGQTILINGGYTTK\n>1svu_B mol:protein length:327  Modification methylase HhaI\nMIEIKDKQLTGLRFIDLFAGLGGFRLALESCGAECVYSNEWDKYAQEVYEMNFGEKPEGDITQVNEKTIPDHDILCAGFPCQAFSISGKQKGFEDSRGTLFFDIARIVREKKPKVVFMENVKNFASHDNGNTLEVVKNTMNELDYSFHAKVLNALDYGIPQKRERIYMICFRNDLNIQNFQFPKPFELNTFVKDLLLPDSEVEHLVIDRKDLVMTNQEIEQTTPKTVRLGIVGKGGWGERIYSTRGIAITLSAYGGGIFAKTGGYLVNGKTRKLHPRECARVMGYPDSYKVHPSTSQAYKQFGNSVVINVLQYIAYNIGSSLNFKPY\n>3c0r_B mol:protein length:75  Ubiquitin\nMQIFVKTLTGKTITLEVEPSDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRG\n>3dnn_H mol:protein length:170  HIV-1 envelope glycoprotein gp120\nTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTGAGHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWF\n>4igl_D mol:protein length:690  
YenC2\nMDIQLFSKTPSVTVFDNRGLSVRDIAYRRHPDTPKVTEECITYHQFDFRGFLAQSLDPRLNHKEVTNFSYLTDLNGNIIYTQSVDAGNTLVLNDTEGRSVIAMTNISRGENGKDDLSLAVTRTFQYENAPLPGRPLSVTEQVNGENARITEHFVYAGNTPQEKNLNLAGQCVSYYDAAGLIQTDSVSLTGKPLSVSRKLLKNLDDTNILADWQGNDTSAWNSLLATEIYTTVTRTDAAGAVLTTIDAVGNQQRVAFDIAGQLSASWLTLKGGQEQVIIKVLTYSAAGQKLREEGGNGVVTTYTYEAETQRLIGIKTERPNGHAAGAKVLQDLRYEYDPVGNVLSITNDAEETRFWRNQKVVPENAYRYDSLYQLVSASGREVAGAGQQGSDLPSPLVPLPSDSSVYTNYTRTYTYDSAGNLMRIRHSAPATNNNYTLNITVSERSNRGVMSSLTENPADVDALFTASGSQKCLQQGQSLIWTPRGELRTVLLVARGETADDSESYRYDGSSQRILKISSQQTNHSARVQRALYLPGLEWRTMTGGVAEAENLQVICIGEAGRAQVRVLHWESGKPDGIINDQIRWSYDNLTCSSGLEVDGDGLVISMEEYYPYGGTAVWAARSHIETAYKTVRYSGKERDATGLYYYGFRYYQPWAGRWLSADPAGTVDGLNLYRMVRNNPLRLTDPDGM\n>2y1z_B mol:protein length:94  ALPHA-CRYSTALLIN B CHAIN\nGAMEMRLEKDRFSVNLDVKHFSPEELKVKVLGDVIEVHGKHEERQDEHGFISREFHGKYRIPADVDPLTITSSMSSDGVLTVNGPRKQVSGPER\n>7vy3_V mol:protein length:54  Antenna pigment protein alpha chain\nMSKFYKIWMIFDPRRVFVAQGVFLFLLAVMIHLILLSTPSYNWLEISAAKYNRV\n>7v2c_P mol:protein length:208  NADH dehydrogenase [ubiquinone] iron-sulfur protein 3, mitochondrial\nTRPTIRPRNDVVHKQLSAFGQYVAEILPKYVQQVQVSCFNELEIFIHPDGVIPVLTFLRDHTNAQFKSLADLTAVDVPTRQNRFEIVYNLLSLRFNSRIRVKTYTDELTPIESSVTVYKAANWYEREIWDMFGVFFANHPDLRRILTDYGFEGHPFRKDFPLSGYVELRYDDEVKRVVAEPVELAQEFRKFDLNSPWEAFPAYRQPPE\n>7eca_A mol:protein length:333  Kelch-like ECH-associated protein 1\nMGHHHHHHENLYFQGHMTLHKPTQAVPCRAPKVGRLIYTAGGYFRQSLSYLEAYNPSNGSWLRLADLQVPRSGLAGCVVGGLLYAVGGRNNSPDGNTDSSALDCYNPMTNQWSPCASMSVPRNRIGVGVIDGHIYAVGGSHGCIHHSSVERYEPERDEWHLVAPMLTRRIGVGVAVLNRLLYAVGGFDGTNRLNSAECYYPERNEWRMITPMNTIRSGAGVCVLHNCIYAAGGYDGQDQLNSVERYDVETETWTFVAPMRHHRSALGITVHQGKIYVLGGYDGHTFLDSVECYDPDSDTWSEVTRMTSGRSGVGVAVTMEPCRKQIDQQNCTC\n>2maa_A mol:protein length:13  Temporin-A\nFLPLIGRVLSGIL\n>7xi7_A mol:protein length:187  Dihydrofolate 
reductase\nMVGSLNCIVAVSQNMGIGKNGDLPWPPLRNEFRYFQRMTTTSSVEGKQNLVIMGKKTWFSIPEKNRPLKGRINLVLSRELKEPPQGAHFLSRSLDDALKLTEQPELANKVDMVWIVGGSSVYKEAMNHPGHLKLFVTRIMQDFESDTFFPEIDLEKYKLLPEYPGVLSDVQEEKGIKYKFEVYEKND\n>6zmn_A mol:protein length:125  Mothers against decapentaplegic homolog 3\nGPAVKRLLGWKQGDEEEKWCEKAVKSLVKKLKKTGQLDELEKAITTQNVNTKCITIPRSLDGRLQVSHRKGLPHVIYCRLWRWPDLHSHHELRAMELCEFAFNMKKDEVCVNPYHYQRVETPVLP\n>7vbn_G mol:protein length:88  Acyl carrier protein, mitochondrial\nSDAPPLTLEAIKDRVLYVLKLYDKIDPEKLSVNSHFMKDLGLDSLDQVEIIMAMEDEFGFEIPDIDAEKLMCPQEIVDYIADKKDVYE\n>7vaq_J mol:protein length:188  V-type ATP synthase subunit E\nMSKLEAILSQEVEAEIQALLQEAEAKAEAVKREAEEKAKALLQARERALEAQYRAALRRAESAGELLVATARTQARGEVLEEVRRRVREALEALPQKPEWPEVVRKLALEALEALPGAKALVANPEDLPHLEALARERGVELQAEPALRLGVRAVGAEGKTQVENSLLARLDRAWDALSSKVAQALWG\n>7osz_B mol:protein length:512  Bifunctional glutamate/proline--tRNA ligase\nGAGEGQGPKKQTRLGLEAKKEENLADWYSQVITKSEMIEYHDISGCYILRPWAYAIWEAIKDFFDAEIKKLGVENCYFPMFVSQSALEKEKTHVADFAPEVAWVTRSGKTELAEPIAIRPTSETVMYPAYAKWVQSHRDLPIKLNQWCNVVRWEFKHPQPFLRTREFLWQEGHSAFATMEEAAEEVLQILDLYAQVYEELLAIPVVKGRKTEKEKFAGGDYTTTIEAFISASGRAIQGGTSHHLGQNFSKMFEIVFEDPKIPGEKQFAYQNSWGLTTRTIGVMTMVHGDNMGLVLPPRVACVQVVIIPCGITNALSEEDKEALIAKCNDYRRRLLSVNIRVRADLRDNYSPGWKFNHWELKGVPIRLEVGPRDMKSCQFVAVRRDTGEKLTVAENEAETKLQAILEDIQVTLFTRASEDLKTHMVVANTMEDFQKILDSGKIVQIPFCGEIDCEDWIKKTTARDQDLEPGAPSMGAKSLCIPFKPLCELQPGAKCVCGKNPAKYYTLFGRSY\n>6y0u_A mol:protein length:115  Fucose-binding lectin\nMATQGVFTLPANTRFGVTAFANSSGTQTVNVLVNNETAATFSGQSTNNAVIGTQVLNSGSSGKVQVQVSVNGRPSDLVSAQVILTNELNFALVGSEDGTDNDYNDAVVVINWPLG\n>3j3y_5T mol:protein length:231  capsid protein\nPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIEPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVL\n>7pmz_D mol:protein length:504  Inosine-5'-monophosphate 
dehydrogenase\nGSHMTANVDGVPEKFATLGLTYDDVLLLPGASAVLPNAVDTSSRISRNVRVNIPLLSAAMDKVTESRMAISMARQGGVGVLHRNLSIEDQANQVDLVKRSESGMVANPITIHPDATLGEADALCAKFRISGVPVTDGAGKLLGIVTNRDMAFETDRSRQVREVMTPMPLVTGQVGISGVDAMELLRRHKIEKLPLVDGDGILKGLITVKDFVKAEQYPHAAKDAKGRLLVGAAVGASPEALDRAQALAEAGVDFLVVDTSHGHNSNALSWMSKIKSSVGIDVVGGNVATRDGAQALIDAGVDGIKVGVGPGSICTTRVVAGIGVPQVTAIYEASLAARAAGVPLIGDGGLQYSGDIGKALAAGADTVMLGSLLAGCEESPGELQFINGKQFKSYRGMGSLGAMQSRGQGRSYSKDRYFQAEVASDDKLVPEGIEGQVPYRGPLANVLHQLVGGLRQTMGYVGAATIEEMESKGRFVRITSAGLKESHPHDIQMTVEAPNYSRSK\n>3ccr_F mol:protein length:120  50S ribosomal protein L7Ae\nMPVYVDFDVPADLEDDALEALEVARDTGAVKKGTNETTKSIERGSAELVFVAEDVQPEEIVMHIPELADEKGVPFIFVEQQDDLGHAAGLEVGSAAAAVTDAGEADADVEDIADKVEELR\n>5omf_A mol:protein length:774  DNA polymerase,DNA polymerase,DNA polymerase\nMILDTDYITEDGKPVIRIFKKENGEFKIEYDRTFEPYFYALLKDDSAIEEVKKITAERHGTVVTVKRVEKVQKKFLGRPVEVWKLYFTHPQDVPAIRDKIREHPAVIDIYEYDIPFAKRYLIDKGLVPMEGDEELKMLAFAIATLYHEGEEFAEGPILMISYADEEGARVITWKNVDLPYVDVVSTEREMIKRFLRVVKEKDPDVLITYNGDNFDFAYLKKRCEKLGINFALGRDGSEPKIQRMGDRFAVEVKGRIHFDLYPVIRRTINLPTYTLEAVYEAVFGQPKEKVYAEEITTAWETGENLERVARYSMEDAKVTYELGKEFLPMEAQLSRLIGQSLWDVSRSSTGNLVEWFLLRKAYERNELAPNKPDEKELARRRQSYEGGYVKEPERGLWENIVYLDFRSLYPSIIITHNVSPDTLNREGCKEYDVAPQVGHRFCKDFPGFIPSLLGDLLEERQKIKKKMKATIDPIERKLLDYRQRAIKILANSYYGYYGYARARWYCKECAESVTAWGREYITMTIKEIEEKYGFKVIYSDTDGFFATIPGADAETVKKKAMEFLKYINAKLPGALELEYEGFYKRGFFVTKKKYAVIDEEGKITTRGLEIVRRDWSEIAKETQARVLEALLKDGDVEKAVRIVKEVTEKLSKYEVPPEKLVIHEQITRDLKDYKATGPHVAVAKRLAARGVKIRPGTVISYIVLKGSGRIGDRAIPFDEFDPTKHKYDAEYYIENQVLPAVERILRAFGYRKEDLRYQKTRQVGLSAWLKPKGT\n>4chk_E mol:protein length:127  AUXIN RESPONSE FACTOR 5\nGAMSKGSSWQKIATPRVRTYTKVQKTGSVGRSIDVTSFKDYEELKSAIECMFGLEGLLTHPQSSGWKLVYVDYESDVLLVGDDPWEEFVGCVRCIRILSPTEVQQMSEEGMKLLNSAGINDLKTSVS\n>5yfm_A mol:protein length:414  Isocitrate dehydrogenase [NADP] 
cytoplasmic\nMSKKISGGSVVEMQGDEMTRIIWELIKEKLIFPYVELDLHSYDLGIENRDATNDQVTKDAAEAIKKHNVGVKCATITPDEKRVEEFKLKQMWKSPNGTIRNILGGTVFREAIICKNIPRLVSGWVKPIIIGRHAYGDQYRATDFVVPGPGKVEITYTPSDGTQKVTYLVHNFEEGGGVAMGMYNQDKSIEDFAHSSFQMALSKGWPLYLSTKNTILKKYDGRFKDIFQEIYDKQYKSQFEAQKIWYEHRLIDDMVAQAMKSEGGFIWACKNYDGDVQSDSVAQGYGSLGMMTSVLVCPDGKTVEAEAAHGTVTRHYRMYQKGQETSTNPIASIFAWTRGLAHRAKLDNNKELAFFANALEEVSIETIEAGFMTKDLAACIKGLPNVQRSDYLNTFEFMDKLGENLKIKLAQAKL\n>1h0k_B mol:protein length:364  2,4-DIENOYL-COA REDUCTASE\nMITAQAVLYTQHGEPKDVLFTQSFEIDDDNLAPNEVIVKTLGSPINPSDINQIQGVYPSKPAKTTGFGTAEPAAPCGNEGLFEVIKVGSNVSSLEAGDWVIPSHVNFGTWRTHALGNDDDFIKLPNPAQSKANGKPNGLTINQGATISVNPLTAYLMLTHYVKLTPGKDWFIQNGGTSAVGKYASQIGKLLNFNSISVIRDRPNLDEVVASLKELGATQVITEDQNNSKEFGPTIKEWIKQSGGEAKLALNCVGGKSSTGIARKLNNNGLMLTYGGMSFQPVTIPTSLYIFKNFTSAGFWVTELLKNNKELKTSTLNQIIAWYEEGKLTDAKSIETLYDGTKPLHELYQDGVANSKDGKQLITY\n>1b4n_B mol:protein length:619  FORMALDEHYDE FERREDOXIN OXIDOREDUCTASE\nMYGWWGRILRVNLTTGEVKVQEYPEEVAKKFIGGRGLAAWILWNEARGVEPLSPENKLIFAAGPFNGLPTPSGGKLVVAAKSPLTGGYGDGNLGTMASVHLRRAGYDALVVEGKAKKPVYIYIEDDNVSILSAEGLWGKTTFETERELKEIHGKNVGVLTIGPAGENLVKYAVVISQEGRAAGRPGMGAVMGSKKLKAVVIRGTKEIPVADKEELKKLSQEAYNEILNSPGYPFWKRQGTMAAVEWCNTNYALPTRNFSDGYFEFARSIDGYTMEGMKVQQRGCPYCNMPCGNVVLDAEGQESELDYENVALLGSNLGIGKLNEVSVLNRIADEMGMDTISLGVSIAHVMEAVERGILKEGPTFGDFKGAKQLALDIAYRKGELGNLAAEGVKAMAEKLGTHDFAMHVKGLEVSGYNCYIYPAMALAYGTSAIGAHHKEAWVIAWEIGTAPIEGEKAEKVEYKISYDPIKAQKVVELQRLRGGLFEMLTACRLPWVEVGLSLDYYPKLLKAITGVTYTWDDLYKAADRVYSLIRAYWVREFNGKWDRKMDYPPKRWFTEGLKSGPHKGEHLDEKKYDELLSEYYRIRGWDERGIPKKETLKELDLDFVIPELEKVTNLE\n>5b66_c mol:protein length:455  Photosystem II CP43 reaction center 
protein\nNSIFATNRDQESSGFAWWAGNARLINLSGKLLGAHVAHAGLIVFWAGAMTLFELAHFIPEKPMYEQGLILIPHIATLGWGVGPGGEVVDTFPFFVVGVVHLISSAVLGFGGVYHAIRGPETLEEYSSFFGYDWKDKNKMTTILGFHLIVLGIGALLLVAKAMFFGGLYDTWAPGGGDVRVITNPTLDPRVIFGYLLKSPFGGEGWIVSVNNLEDVVGGHIWIGLICIAGGIWHILTTPFGWARRAFIWSGEAYLSYSLGALSMMGFIATCFVWFNNTVYPSEFYGPTGPEASQAQAMTFLIRDQKLGANVGSAQGPTGLGKYLMRSPTGEIIFGGETMRFWDFRGPWLEPLRGPNGLDLNKIKNDIQPWQERRAAEYMTHAPLGSLNSVGGVATEINSVNFVSPRSWLATSHFVLAFFFLVGHLWHAGRARAAAAGFEKGIDRESEPVLSMPSLD\n>6ujv_A mol:protein length:129  Envelope glycoprotein GP41\nLLELDKWASLWNWFDITNWLWYIRIFIIIVGSLIGLRIVFAVLSLVNRVRQGYSPLSFQTHLPTPRGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLSLFSYHRLRDLLLIVTRIVELLGRR\n>5lzf_d mol:protein length:205  30S ribosomal protein S4\nARYLGPKLKLSRREGTDLFLKSGVRAIDTKCKIEQAPGQHGARKPRLSDYGVQLREKQKVRRIYGVLERQFRNYYKEAARLKGNTGENLLALLEGRLDNVVYRMGFGATRAEARQLVSHKAIMVNGRVVNIASYQVSPNDVVSIREKAKKQSRVKAALELAEQREKPTWLEVDAGKMEGTFKRKPERSDLSADINEHLIVELYSK\n>3j92_l mol:protein length:51  eL39\nMSSHKTFRIKRFLAKKQKQNRPIPQWIRMKTGNKIRYNSKRRHWRRTKLGL\n>4ato_A mol:protein length:194  TOXN\nMTNKDNPKFHTISTEYIDYLREADSKVPFNKDEQHSRPYVGVLEKINGHDYFVPLTSRNDKNFNSQVSVKLFDNDEKRIGVLLVNNMIPVPEKECKEIDIAEKTAADPQYGNLMLKQYLFLKENMDRVTNKVEKVYKDVTVQGKPSHKQKFLKGVCCDFPKLEEKCQEYKERDQAKERDKARRIAYMRQMGRER\n>6sh8_N mol:protein length:174  CRISPR-associated protein Cmrx\nMSTQREYVFIPITNSITIDVKITIGGSDHITNIDERGIHNVLVITGYAVDEKNGRLVPTLDPCDYVKGILVAGTPQQAQSNDFLTLKLPANKLYLIRKKGNISDDLKIYIPYSSPDARNSMKTKPVSISDDTIVNNIIKEVFDKIYNITQKEKVKIEKVKEDIKELFSYYALEQ\n>4v86_S mol:protein length:520  Capsid protein 
VP1\nGADGVGNASGNWHCDSTWLGDRVITTSTRTWALPTYNNHLYKQISSASTGASNDNHYFGYSTPWGYFDFNRFHCHFSPRDWQRLINNNWGFRPKRLNFKLFNIQVKEVTTNDGVTTIANNLTSTVQVFSDSEYQLPYVLGSAHQGCLPPFPADVFMIPQYGYLTLNNGSQAVGRSSFYCLEYFPSQMLRTGNNFTFSYTFEDVPFHSSYAHSQSLDRLMNPLIDQYLYYLNRTQNQSGSAQNKDLLFSRGSPAGMSVQPKNWLPGPCYRQQRVSKTKTDNNNSNFTWTGASKYNLNGRESIINPGTAMASHKDDKDKFFPMSGVMIFGKESAGASNTALDNVMITDEEEIKATNPVATERFGTVAVNLQSSSTDPATGDVHVMGALPGMVWQDRDVYLQGPIWAKIPHTDGHFHPSPLMGGFGLKHPPPQILIKNTPVPANPPAEFSATKFASFITQYSTGQVSVEIEWELQKENSKRWNPEVQYTSNYAKSANVDFTVDNNGLYTEPRPIGTRYLTRPL\n>4kis_B mol:protein length:328  Putative integrase [Bacteriophage A118]\nRDRMVMGKIKRIEAGLPLTTAKGRTFGYDVIDTKLYINEEEAKQLRLIYDIFEEEQSITFLQKRLKKLGFKVRTYNRYNNWLTNDLYCGYVSYKDKVHVKGIHEPIISEEQFYRVQEIFSRMGKNPNMNKESASLLNNLVVCSKCGLGFVHRRKDTVSRGKKYHYRYYSCKTYKHTHELEKCGNKIWRADKLEELIIDRVNNYSFASRNIDKEDELDSLNEKLKIEHAKKKRLFDLYINGSYEVSELDSMMNDIDAQINYYEAQIEANEELKKNKKIQENLADLATVDFNSLEFREKQLYLKSLINKIYIDGEQVTIEWLLEHHHHHH\n>3vap_A mol:protein length:272  Aurora kinase A\nGAMGSKRQWALEDFEIGRPLGKGKFGNVYLAREKQSKFILALKVLFKAQLEKAGVEHQLRREVEIQSHLRHPNILRLYGYFHDATRVYLILEYAPLGTVYRELQKLSKFDEQRTATYITELANALSYCHSKRVIHRDIKPENLLLGSAGELKIADFGWSVHAPSSRRTTLCGTLDYLPPEMIEGRMHDEKVDLWSLGVLCYEFLVGKPPFEANTYQETYKRISRVEFTFPDFVTEGARDLISRLLKHNPSQRPMLREVLEHPWITANSSKPS\n>2ybu_F mol:protein length:381  ACIDIC MAMMALIAN CHITINASE\nEAEAYQLTCYFTNWAQYRPGLGRFMPDDINPCLCTHLIYAFAGMQNNEITTIEWNDVTLYQAFNGLKNKNSQLKTLLAIGGWNFGTAPFTAMVSTPENRQTFITSVIKFLRQYEFDGLDFDWEYPGSRGSPPQDKHLFTVLVQEMREAFEQEAKQINKPRLMVTAAVAAGISNIQSGYEIPQLSQYLDYIHVMTYDLHGSWEGYTGENSPLYKYPTDTGSNAYLNVDYVMNYWKDNGAPAEKLIVGFPTYGHNFILSNPSNTGIGAPTSGAGPAGPYAKESGIWAYYEICTFLKNGATQGWDAPQEVPYAYQGNVWVGYDNIKSFDIKAQWLKHNKFGGAMVWAIDLDDFTGTFCNQGKFPLISTLKKALGLQSASCTAPA\n>7ebk_A mol:protein length:187  Tripartite motif-containing protein 66\nSPIENEDFCAVCINGGELLCCDRCPKVYHLSCHVPALLSFPGGEWVCTLCRSLTQPEMEYDCENARYGVRVLPGLSMYDQKKCEKLVLSLCCNSLSLPFHEPVSPLARHYYQIIKRPMDLSIIRRKLQKKDPAHYTTPEEVVSDVRLMFWNCAKFNYPDSEVAEAGRCLEVFFEGWLKEIYPDKCFA\n>4pcf_B mol:protein length:239  
Ma18-TIM\nMSKPQPIAAANWKSGSPDSLSGLIDLFNSTSINHDVQCVVASTFVHLAMTKERLSHPKFVIAAQNAGNTDALASLKDFGVNWIVLGHFERRWYYGETNEIVADKVAAAVASGFMVIACIGETLQERESGRTAVVVLTQIAAIAKKLKKADWAKVVIAYEPVWAIGTGKVVTPQQAQEAHALIRSWVSSKIGADVAGELRILYGGSVNGKNARTLYQQRDVNGFLAGLKPEFVDIIKATQ\n>3txx_F mol:protein length:359  Putrescine carbamoyltransferase\nMGSSHHHHHHSSGLVPRGSHMKRDYVTTETYTKEEMHYLVDLSLKIKEAIKNGYYPQLLKNKSLGMIFQQSSTRTRVSFETAMEQLGGHGEYLAPGQIQLGGHETIEDTSRVLSRLVDILMARVERHHSIVDLANCATIPVINGMSDYNHPTQELGDLCTMVEHLPEGKKLEDCKVVFVGDATQVCFSLGLITTKMGMNFVHFGPEGFQLNEEHQAKLAKNCEVSGGSFLVTDDASSVEGADFLYTDVWYGLYEAELSEEERMKVFYPKYQVNQEMMDRAGANCKFMHCLPATRGEEVTDEVIDGKNSICFDEAENRLTSIRGLLVYLMNDYEAKNPYDLIKQAEAKKELEVFLDTQSI\n>6oro_A mol:protein length:153  RC1 variant of HIV-1 Env glycoprotein gp41\nAVGIGAVSLGFLGAAGSTMGAASMTLTVQARNLLSGIVQQQSNLLRAPEPQQHLLKDTHWGIKQLQARVLAVEHYLRDQQLLGIWGCSGKLICCTNVPWNSSWSNRNLSEIWDNMTWLQWDKEISNYTQIIYGLLEESQNQQEKNEQDLLALD\n>2yso_A mol:protein length:46  Zinc finger protein 95 homolog\nGSSGSSGSREKSHQCRECGEIFFQYVSLIEHQVLHMGQKNSGPSSG\n>7nal_H mol:protein length:697  NAD(+) hydrolase SARM1\nLAVPGPDGGGGTGPWWAAGGRGPREVSPGAGTEVQDALERALPELQQALSALKQAGGARAVGAGLAEVFQLVEEAWLLPAVGREVAQGLCDAIRLDGGLDLLLRLLQAPELETRVQAARLLEQILVAENRDRVARIGLGVILNLAKEREPVELARSVAGILEHMFKHSEETCQRLVAAGGLDAVLYWCRRTDPALLRHCALALGNCALHGGQAVQRRMVEKRAAEWLFPLAFSKEDELLRLHACLAVAVLATNKEVEREVERSGTLALVEPLVASLDPGRFARCLVDASDTSQGRGPDDLQRLVPLLDSNRLEAQCIGAFYLCAEAAIKSLQGKTKVFSDIGAIQSLKRLVSYSTNGTKSALAKRALRLLGEEVPRPILPSVPSWKEAEVQTWLQQIGFSKYCESFREQQVDGDLLLRLTEEELQTDLGMKSGITRKRFFRELTELKTFANYSTCDRSNLADWLGSLDPRFRQYTYGLVSCGLDRSLLHRVSEQQLLEDCGIHLGVHRARILTAAREMLHSPLPCTGGKPSGDTPDVFISYRRNSGSQLASLLKVHLQLHGFSVFIDVEKLEAGKFEDKLIQSVMGARNFVLVLSPGALDKCMQDHDCKDWVHKEIVTALSCGKNIVPIIDGFEWPEPQVLPEDMQAVLTFNGIKWSHEYQEATIEKIIRFLQGRSSRDSSAGSDTSLEGAAPMGPT\n>3dv5_C mol:protein length:402  Beta-secretase 
1\nGPDEEPEEPGRRGSFVEMVDNLRGKSGQGYYVEMTVGSPPQTLNILVDTGSSNFAVGAAPHPFLHRYYQRQLSSTYRDLRKGVYVPYTQGKWEGELGTDLVSIPHGPNVTVRANIAAITESDKFFINGSNWEGILGLAYAEIARPDDSLEPFFDSLVKQTHVPNLFSLQLCGAGFPLNQSEVLASVGGSMIIGGIDHSLYTGSLWYTPIRREWYYEVIIVRVEINGQDLKMDCKEYNYDKSIVDSGTTNLRLPKKVFEAAVKSIKAASSTEKFPDGFWLGEQLVCWQAGTTPWNIFPVISLYLMGEVTNQSFRITILPQQYLRPVEDVATSQDDCYKFAISQSSTGTVMGAVIMEGFYVVFDRARKRIGFAVSACHVHDEFRTAAVEGPFVTLDMEDCGYNI\n>5lky_C mol:protein length:300  N-acetylneuraminate lyase\nMEHHHHHHNKDLKGLYAALLVPFDENGQVNEQGLKQIAQNAIETEELDGLYVNGSSGENFLLNTEQKKQVFKVAKEAVGDKVKLIAQVGSLDLNEAIELGKYATELGYDALSAVTPFYYPFTFEEIRDYYFDIIEATQNNMIIYAIPDLTGVNISIEQFSELFNHEKIVGVKYTAPNFFLLERIRKAFPDKLILSGCDEMLVQATISGVDGAIGSTYNVNGRRARKIFDLARQGQIQEAYQLQHDSNDIIETVLSMGIYPTLKEILRHRGIDAGLPKRPFKPFNEAHRQTLDQLIAKYDL\n>5lzz_OO mol:protein length:168  uS11\nMKARALSGSGVRRRRAAMAPRKGKEKKEEQVISLGPQVAEGENVFGVCHIFASFNDTFVHVTDLSGKETICRVTGGMKVKADRDESSPYAAMLAAQDVAQRCKELGITALHIKLRATGGNRTKTPGPGAQSALRALARSGMKIGRIEDVTPIPSDSTRRKGGRRGRRL\n>6swb_A mol:protein length:135  Two-component response regulator\nHHHHHHWKVLIADDEAIIREGIRESIDWNEFNMEVVAEAEDGEEALELALRHRVDVLFVDLSMPIMDGLTLMKYAREKLPNCHMIVITGYDEFSYAQEAIRLQVDDYLLKPTDPQRLREVVAKVKEKLEQEQKEK\n>1z7h_A mol:protein length:447  Tetanus toxin light chain\nGSHMMPITINNFRYSDPVNNDTIIMMEPPYCKGLDIYYKAFKITDRIWIVPERYEFGTKPEDFNPPSSLIEGASEYYDPNYLRTDSDKDRFLQTMVKLFNRIKNNVAGEALLDKIINAIPYLGNSYSLLDKFDTNSNSVSFNLLEQDPSGATTKSAMLTNLIIFGPGPVLNKNEVRGIVLRVDNKNYFPCRDGFGSIMQMAFCPEYVPTFDNVIENITSLTIGKSKYFQDPALLLMHELIHVLHGLYGMQVSSHEIIPSKQEIYMQHTYPISAEELFTFGGQDANLISIDIKNDLYEKTLNDYKAIANKLSQVTSCNDPNIDIDSYKQIYQQKYQFDKDSNGQYIVNEDKFQILYNSIMYGFTEVELGKKFNIKTRLSYFSMNHDPVKIPNLLDDTIYNDTEGFNIESKDLKSEYKGQNMRVNTNAFRNVDGSGLVSKLIGLCKKII\n>6sic_o mol:protein length:174  CRISPR-associated protein Cmrx\nMSTQREYVFIPITNSITIDVKITIGGSDHITNIDERGIHNVLVITGYAVDEKNGRLVPTLDPCDYVKGILVAGTPQQAQSNDFLTLKLPANKLYLIRKKGNISDDLKIYIPYSSPDARNSMKTKPVSISDDTIVNNIIKEVFDKIYNITQKEKVKIEKVKEDIKELFSYYALEQ\n>1nlq_C mol:protein length:108  Nucleoplasmin-like 
protein\nMAEESFYGVTLTAESDSVTWDVDEDYARGQKLVIKQILLGAEAKENEFNVVEVNTPKDSVQIPIAVLKAGETRAVNPDVEFYESKVTFKLIKGSGPVYIHGHNIKDDV\n>3gtc_A mol:protein length:358  Beta-lactamase\nAPQQINDIVHRTITPLIEQQKIPGMAVAVIYQGKPYYFTWGYADIAKKQPVTQQTLFELGSVSKTFTGVLGGDAIARGEIKLSDPTTKYWPELTAKQWNGITLLHLATYTAGGLPLQVPDEVKSSSDLLRFYQNWQPAWAPGTQRLYANSSIGLFGALAVKPSGLSFEQAMQTRVFQPLKLNHTWINVPPAEEKNYAWGYREGKAVHVSPGALDAEAYGVKSTIEDMARWVQSNLKPLDINEKTLQQGIQLAQSRYWQTGDMYQGLGWEMLDWPVNPDSIINGSDNKIALAARPVKAITPPTPAVRASWVHKTGATGGFGSYVAFIPEKELGIVMLANKNYPNPARVDAAWQILNALQ\n>7av1_A mol:protein length:613  Leukotriene A-4 hydrolase\nGPGPEIVDTCSLASPASVCRTKHLHLRCSVDFTRRTLTGTAALTVQSQEDNLRSLVLDTKDLTIEKVVINGQEVKYALGERQSYKGSPMEISLPIALSKNQEIVIEISFETSPKSSALQWLTPEQTSGKEHPYLFSQCQAIHCRAILPCQDTPSVKLTYTAEVSVPKELVALMSAIRDGETPDPEDPSRKIYKFIQKVPIPCYLIALVVGALESRQIGPRTLVWSEKEQVEKSAYEFSETESMLKIAEDLGGPYVWGQYDLLVLPPSFPYGGMENPCLTFVTPTLLAGDKSLSNVIAHEISHSWTGNLVTNKTWDHFWLNEGHTVYLERHICGRLFGEKFRHFNALGGWGELQNSVKTFGETHPFTKLVVDLTDIDPDVAYSSVPYEKGFALLFYLEQLLGGPEIFLGFLKAYVEKFSYKSITTDDWKDFLYSYFKDKVDVLNQVDWNAWLYSPGLPPIKPNYDMTLTNACIALSQRWITAKEDDLNSFNATDLKDLSSHQLNEFLAQTLQRAPLPLGHIKRMQEVYNFNAINNSEIRFRWLRLCIQSKWEDAIPLALKMATEQGRMKFTRPLFKDLAAFDKSHDQAVRTYQEHKASMHPVTAMLVGKDLKVD\n>3wkm_B mol:protein length:180  Putative zinc metalloprotease aq_1964\nGSEVPKYLKEPVVVGYVQRDSIAQKIGIKPGDKIIKINGYEVRTWEDLRDALIRLSLDGVKETTLFLERNGEVLHLTIKVPNVQKGEELGIAPLVKPVVGGVKKGSPADQVGIKPGDLILEVNGKKINTWYELVEEVRKSQGKAIKLKILRNGKMIEKELIPAKDPKTGTYFIGLFPKTE\n>7mei_e mol:protein length:215  DNA-directed RNA polymerases I, II, and III subunit RPABC1\nMDQENERNISRLWRAFRTVKEMVKDRGYFITQEEVELPLEDFKAKYCDSMGRPQRKMMSFQANPTEESISKFPDMGSLWVEFCDEPSVGVKTMKTFVIHIQEKNFQTGIFVYQNNITPSAMKLVPSIPPATIETFNEAALVVNITHHELVPKHIRLSSDEKRELLKRYRLKESQLPRIQRADPVALYLGLKRGEVVKIIRKSETSGRYASYRICM\n>1e67_D mol:protein length:128  AZURIN\nAECSVDIQGNDQMQFNTNAITVDKSCKQFTVNLSHPGNLPKNVMGHNWVLSTAADMQGVVTDGMASGLDKDYLKPDDSRVIAHTKLIGSGEKDSVTFDVSKLKEGEQYMFFCTFPGHSALMKGTLTLK\n>5dzn_F mol:protein length:114  T-cell immunoglobulin and mucin 
domain-containing protein 4\nMVTSETVVTEVLGHRVTLPCLYSSWSHNSNSMCWGKDQCPYSGCKEALIRTDGMRVTSRKSAKYRLQGTIPRGDVSLTILNPSESDSGVYCCRIEVPGWFNDVKINVRLNLQRA\n>3s34_L mol:protein length:214  1121B Fab light chain\nDIQMTQSPSSVSASIGDRVTITCRASQGIDNWLGWYQQKPGKAPKLLIYDASNLDTGVPSRFSGSGSGTYFTLTISSLQAEDFAVYFCQQAKAFPPTFGGGTKVDIKRTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC\n>6wz5_A mol:protein length:135  Histone H3.2\nARTKQTARKSTGGKAPRKQLATKAARKSAPATGGVKKPHRYRPGTVALREIRRYQKSTELLIRKLPFQRLVREIAQDFKTDLRFQSSAVMALQEASEAYLVALFEDTNLCAIHAKRVTIMPKDIQLARRIRGERA\n>6r1u_A mol:protein length:135  Histone H3.2\nARTKQTARKSTGGKAPRKQLATKAARKSAPATGGVKKPHRYRPGTVALREIRRYQKSTELLIRKLPFQRLVREIAQDFKTDLRFQSSAVMALQEASEAYLVALFEDTNLCAIHAKRVTIMPKDIQLARRIRGERA\n>1ht6_A mol:protein length:405  ALPHA-AMYLASE ISOZYME 1\nHQVLFQGFNWESWKQSGGWYNMMMGKVDDIAAAGVTHVWLPPPSHSVSNEGYMPGRLYDIDASKYGNAAELKSLIGALHGKGVQAIADIVINHRCADYKDSRGIYCIFEGGTSDGRLDWGPHMICRDDTKYSDGTANLDTGADFAAAPDIDHLNDRVQRELKEWLLWLKSDLGFDAWRLDFARGYSPEMAKVYIDGTSPSLAVAEVWDNMATGGDGKPNYDQDAHRQNLVNWVDKVGGAASAGMVFDFTTKGILNAAVEGELWRLIDPQGKAPGVMGWWPAKAVTFVDNHDTGSTQAMWPFPSDKVMQGYAYILTHPGIPCIFYDHFFNWGFKDQIAALVAIRKRNGITATSALKILMHEGDAYVAEIDGKVVVKIGSRYDVGAVIPAGFVTSAHGNDYAVWEKN\n>2av7_E mol:protein length:100  Beta-2-microglobulin\nMIQRTPKIQVYSRHPAENGKSNFLNCYVSGFHPSDIEVDLLKNGERIEKVEHSDLSFSKDWSFYLLYYTEFTPTEKDEYACRVNHVTLSQPKIVKWDRDM\n>5pcd_A mol:protein length:138  Bromodomain adjacent to zinc finger domain protein 2B\nMHHHHHHSSGVDLGTENLYFQSMSVKKPKRDDSKDLALCSMILTEMETHEDAWPFLLPVNLKLVPGYKKVIKKPMDFSTIREKLSSGQYPNLETFALDVRLVFDNCETFNEDDSDIGRAGHNMRKYFEKKWTDTFKVS\n>5cx1_L mol:protein length:523  Nitrogenase molybdenum-iron protein beta 
chain\nMSQQVDKIKASYPLFLDQDYKDMLAKKRDGFEEKYPQDKIDEVFQWTTTKEYQELNFQREALTVNPAKACQPLGAVLCALGFEKTMPYVHGSQGCVAYFRSYFNRHFREPVSCVSDSMTEDAAVFGGQQNMKDGLQNCKATYKPDMIAVSTTCMAEVIGDDLNAFINNSKKEGFIPDEFPVPFAHTPSFVGSHVTGWDNMFEGIARYFTLKSMDDKVVGSNKKINIVPGFETYLGNFRVIKRMLSEMGVGYSLLSDPEEVLDTPADGQFRMYAGGTTQEEMKDAPNALNTVLLQPWHLEKTKKFVEGTWKHEVPKLNIPMGLDWTDEFLMKVSEISGQPIPASLTKERGRLVDMMTDSHTWLHGKRFALWGDPDFVMGLVKFLLELGCEPVHILCHNGNERWKKAVDAILAASPYGKNATVYIGKDLWHLRSLVFTDKPDFMIGNSYGKFIQRDTLHKGKEFEVPLIRIGFPIFDRHHLHRSTTLGYEGAMQILTTLVNSILERLDEETRGMQATDYNHDLVR\n>3cw1_1 mol:protein length:86  Small nuclear ribonucleoprotein F\nMSLPLNPKPFLNGLTGKPVMVKLKWGMEYKGYLVSVDGYMNMQLANTEEYIDGALSGHLGEVLIRCNNVLYIRGVEEEEEDGEMRE\n>7toc_A mol:protein length:363  Ketol-acid reductoisomerase, mitochondrial\nSNAPVVSAAPLATRGLKTINFGGTEEVVHERADWPREKLLEYFKNDTMALIGYGSQGYGQGLNLRDNGLNVIIGVRKNGASWKAAIEDGWVPGENLFDVKEAITKGTIIMNLLSDAAQSETWPDLKPLITEGKTLYFSHGFSPVFKDLTKVEPPSNVDVILAAPKGSGRTVRSLFLEGRGINSSYAVWNDVTGKAEEKAIAMAVAIGSGYVYQTTFEREVNSDLYGERGCLMGGIHGMFLAQYEVLRENGHTPSEAFNETVEEATQSLYPLIGKYGMDYMYDACSTTARRGALDWYPRFKDALKPVFVELYESVKNGTETQRSLDFNGAPDYRERLEEELETIRNMEIWKVGKEVRKLRPENQ\n>6yfg_IG mol:protein length:130  coat protein\nSKPIAIFKLRELSSDSTLFTLPGHSVTLPNTLGIVSHLPTPRKGNPGTVKTMRNLRKTILLGAGTASERAVPIVIKTETSFPVGTTEEDRAEVLKQMASFLIEEVKNNQELAYSGYVQDKYFIEDLVITE\n>4ac5_H mol:protein length:258  REACTION CENTER PROTEIN H CHAIN\nMYHGALAQHLDIAQLVWYAQWLVIWTVVLLYLRREDRREGYPLVEPLGLVKLAPEDGQVYELPYPKTFVLPHGGTVTVPRRRPETRELKLAQTDGFEGAPLQPTGNPLVDAVGPASYAERAEVVDATVDGKAKIVPLRVATDFSIAEGDVDPRGLPVVAADGVEAGTVTDLWVDRSEHYFRYLELSVAGSARTALIPLGFCDVKKDKIVVTSILSEQFANVPRLQSRDQITLREEDKVSAYYAGGLLYATPERAESLL\n>5m9e_B mol:protein length:77  Microtubule integrity protein mal3\nSGSAKQAQQQITSLETQLYEVNETMFGLERERDFYFNKLREIEILVQTHLTTSPMSMENMLERIQAILYSTEDGFEL\n>5o61_BH mol:protein length:132  30S ribosomal protein S8\nMTMTDPIADFLTRLRNANSAYHDEVTLPHSKLKANIAEILKREGYISDYRTEDARVGKSLVVQLKYGPSRERSIAGLRRVSKPGLRVYAKSTNLPRVLGGLGVAIISTSSGLLTDRQAARQGVGGEVLAYVW\n>6owg_CF mol:protein 
length:105  Ethanolamine utilization protein EutN/carboxysome structural protein Ccml\nMQMAKVCGTVVGTQKLPSMTGVKLLLLQFIDANGELLPKYEVAADPVGAGLGEWVLVNRGSAARQTEYHQNRPLDAMVVAIIDTVTVNNRRLYGEGSWSHPQFEK\n>6ywv_K mol:protein length:249  60S ribosomal protein L16\nMKHNASSALLSAFQGLRISSSATPFRAASLATSAVRRPIAPTPVSVASHVRLFSATAIQAGSWLEPNLNRKKKMMKGRPRVPTGGSTKGTTVVWGDYGLRMRDHHRRISAQQLKLAEDTIKQRLRGQKYRLYKRVACNVGVYVSGNEMRMGKGKGSFDHWATRVAVNQIIFEIRGQLHEQVIRDAFRLAGHKLPGLYEFVKKGDPPVVGITKLEDGLTVEDLKNPRKKLLMPEITQSAASTSSTAAPPS\n>2f0x_F mol:protein length:148  Thioesterase superfamily member 2\nMTSMTQSLREVIKAMTKARNFERVLGKITLVSAAPGKVICEMKVEEEHTNAIGTLHGGLTATLVDNISTMALLCTERGAPGVSVDMNITYMSPAKLGEDIVITAHVLKQGKTLAFTSVDLTNKATGKLIAQGRHTKHLGNLEHHHHHH\n>2q28_B mol:protein length:564  oxalyl-CoA decarboxylase\nMSDQLQMTDGMHIIVEALKQNNIDTIYGVVGIPVTDMARHAQAEGIRYIGFRHEQSAGYAAAASGFLTQKPGICLTVSAPGFLNGLTALANATVNGFPMIMISGSSDRAIVDLQQGDYEELDQMNAAKPYAKAAFRVNQPQDLGIALARAIRVSVSGRPGGVYLDLPANVLAATMEKDEALTTIVKVENPSPALLPCPKSVTSAISLLAKAERPLIILGKGAAYSQADEQLREFIESAQIPFLPMSMAKGILEDTHPLSAAAARSFALANADVVMLVGARLNWLLAHGKKGWAADTQFIQLDIEPQEIDSNRPIAVPVVGDIASSMQGMLAELKQNTFTTPLVWRDILNIHKQQNAQKMHEKLSTDTQPLNYFNALSAVRDVLRENQDIYLVNEGANTLDNARNIIDMYKPRRRLDCGTWGVMGIGMGYAIGASVTSGSPVVAIEGDSAFGFSGMEIETICRYNLPVTIVIFNNGGIYRGDGVDLSGAGAPSPTDLLHHARYDKLMDAFRGVGYNVTTTDELRHALTTGIQSRKPTIINVVIDPAAGTESGHITKLNPKQVAGN\n>3n7k_A mol:protein length:426  Botulinum neurotoxin type C1\nNNINDSKILSLQNRKNTLVDTSGYNAEVSEEGDVQLNPIFPFDFKLGSSGEDRGKVIVTQNENIVYNSMYESFSISFWIRINKWVSNLPGYTIIDSVKNNSGWSIGIISNFLVFTLKQNEDSEQSINFSYDISNNAPGYNKWFFVTVTNNMMGNMKIYINGKLIDTIKVKELTGINFSKTITFEINKIPDTGLITSDSDNINMWIRDFYIFAKELDGKDINILFNSLQYTNVVKDYWGNDLRYNKEYYMVNIDYLNRYMYANSRQIVFNTRRNNNDFNEGYKIIIKRIRGNTNDTRVRGGDILYFDMTINNKAYNLFMKNETMYADNHSTEDIYAIGLREQTKDINDNIIFQIQPMNNTYYYASQIFKSNFNGENISGICSIGTYRFRLGGDWYRHNYLVPTVKQGNYASLLESTSTHWGFVPVSE\n>6q6g_A mol:protein length:1855  Anaphase-promoting complex subunit 1,Anaphase-promoting complex subunit 
1\nMSNFYEERTTMIAARDLQEFVPFGRDHCKHHPNALNLQLRQLQPASELWSSDGAAGLVGSLQEVTIHEKQKESWQLRKGVSEIGEDVDYDEELYVAGNMVIWSKGSKSQALAVYKAFTVDSPVQQALWCDFIISQDKSEKAYSSNEVEKCICILQSSCINMHSIEGKDYIASLPFQVANVWPTKYGLLFERSASSHEVPPGSPREPLPTMFSMLHPLDEITPLVCKSGSLFGSSRVQYVVDHAMKIVFLNTDPSIVMTYDAVQNVHSVWTLRRVKSEEENVVLKFSEQGGTPQNVATSSSLTAHLRLAPETEPIVPELCIDHLWTETITNIREKNSQASKVFITSDLCGQKFLCFLVESQLQLRCVKFQESNDKTQLIFGSVTNIPAKDAAPVEKIDTMLVLEGSGNLVLYTGVVRVGKVFIPGLPAPSLTMSNTMPRPSTPLDGVSTPKPLSKLLGSLDEVVLLSPVPELRDSSKLHDSLYNEDCTFQQLGTYIHSIRDPVHNRVTLELSNGSMVRITIPEIATSELVQTCLQAIKFILPKEIAVQMLVKWYNVHSAPGGPSYHSEWNLFVTCLMNMMGYNTDRLAWTRNFDFEGSLSPVIAPKKARPSETGSDDDWEYLLNSDYHQNVESHLLNRSLCLSPSEASQMKDEDFSQNLSLDSSTLLFTHIPAIFFVLHLVYEELKLNTLMGEGICSLVELLVQLARDLKLGPYVDHYYRDYPTLVRTTGQVCTIDPGQTGFMHHPSFFTSEPPSIYQWVSSCLKGEGMPPYPYLPGICERSRLVVLSIALYILGDESLVSDESSQYLTRITIAPQKLQVEQEENRFSFRHSTSVSSLAERLVVWMTNVGFTLRDLETLPFGIALPIRDAIYHCREQPASDWPEAVCLLIGRQDLSKQACEGNLPKGKSVLSSDVPSGTETEEEDDGMNDMNHEVMSLIWSEDLRVQDVRRLLQSAHPVRVNVVQYPELSDHEFIEEKENRLLQLCQRTMALPVGRGMFTLFSYHPVPTEPLPIPKLNLTGRAPPRNTTVDLNSGNIDVPPNMTSWASFHNGVAAGLKIAPASQIDSAWIVYNKPKHAELANEYAGFLMALGLNGHLTKLATLNIHDYLTKGHEMTSIGLLLGVSAAKLGTMDMSITRLLSIHIPALLPPTSTELDVPHNVQVAAVVGIGLVYQGTAHRHTAEVLLAEIGRPPGPEMEYCTDRESYSLAAGLALGMVCLGHGSNLIGMSDLNVPEQLYQYMVGGHRRFQTGMHREKHKSPSYQIKEGDTINVDVTCPGATLALAMIYLKTNNRSIADWLRAPDTMYLLDFVKPEFLLLRTLARCLILWDDILPNSKWVDSNVPQIIRENSISLSEIELPCSEDLNLETLSQAHVYIIAGACLSLGFRFAGSENLSAFNCLHKFAKDFMTYLSAPNASVTGPHNLETCLSVVLLSLAMVMAGSGNLKVLQLCRFLHMKTGGEMNYGFHLAHHMALGLLFLGGGRYSLSTSNSSIAALLCALYPHFPAHSTDNRYHLQALRHLYVLAAEPRLLVPVDVDTNTPCYALLEVTYKGTQWYEQTKEELMAPTLLPELHLLKQIKVKGPRYWELLIDLSKGTQHLKSILSKDGVLYVKLRAGQLSYKEDPMGWQSLLAQTVANRNSEARAFKPETISAFTSDPALLSFAEYFCKPTVNMGQKQEILDLFSSVLYECVTQETPEMLPAYIAMDQAIRRLGRREMSETSELWQIKLVLEFFSSRSHQERLQNHPKRGLFMNSEFLPVVKCTIDNTLDQWLQVGGDMCVHAYLSGQPLEESQLSMLACFLVYHSVPAPQHLPPIGLEGSTSFAELLFKFKQLKMPVRALLRLAPLLLGNPQPMVM\n>6riq_F mol:protein length:144  
MinC\nKDSAPRKPAEEPSPSVGEARPEPAKAEEKPAEPVSRPTKVVKTPVRGGMQIYAAGGDLIVLAAVSPGAELLADGNIHVYGPMRGRALAGVKGDATARIFCQQLAAELVSIAGNYKVAEDLRRSPQWGKAVHVSLSGDVLNITRL\n>7ohr_v mol:protein length:231  Nucleolar protein 16\nMTSVRKRKMNRSSVGKATRRNKDKQRKINIQSNPIIAANWDYSLTMAQNYKKLGLRAKLQTPAGGKEADLSKVVKRIPLTKPVLDEDEDEDEGEDEQNDYNAATVELDENEIPEGGARIQRDKNGDVVRVVYGKKKNFDADEDVNEIKARDTTEETEVVKKLEELASRPVIRKERSQSEREEEWLEKLYKKHGDDYKKMFFDKKLNIYQQSEGDLKRRLLRWKKRNGIASK\n>4v89_B7 mol:protein length:65  50S ribosomal protein L35\nMPKIKTVRGAAKRFKKTGKGGFKHKHANLRHILTKKATKRKRHLRPKAMVSKGDLGLVIACLPYA\n>3gdv_D mol:protein length:3  YQF peptide\nYQF\n>7du2_M mol:protein length:708  DNA-directed RNA polymerase III subunit RPC5\nMANEEDDPVVQEIDVYLAKSLAEKLYLFQYPVRPASMTYDDIPHLSAKIKPKQQKVELEMAIDTLNPNYCRSKGEQIALNVDGACADETSTYSSKLMDKQTFCSSQTTSNTSRYAAALYRQGELHLTPLHGILQLRPSFSYLDKADAKHREREAANEAGDSSQDEAEDDVKQITVRFSRPESEQARQRRVQSYEFLQKKHAEEPWVHLHYYGLRDSRSEHERQYLLCPGSSGVENTELVKSPSEYLMMLMPPSQEEEKDKPVAPSNVLSMAQLRTLPLADQIKILMKNVKVMPFANLMSLLGPSIDSVAVLRGIQKVAMLVQGNWVVKSDILYPKDSSSPHSGVPAEVLCRGRDFVMWKFTQSRWVVRKEVATVTKLCAEDVKDFLEHMAVVRINKGWEFILPYDGEFIKKHPDVVQRQHMLWTGIQAKLEKVYNLVKETMPKKPDAQSGPAGLVCGDQRIQVAKTKAQQNHALLERELQRRKEQLRVPAVPPGVRIKEEPVSEEGEEDEEQEAEEEPMDTSPSGLHSKLANGLPLGRAAGTDSFNGHPPQGCASTPVARELKAFVEATFQRQFVLTLSELKRLFNLHLASLPPGHTLFSGISDRMLQDTVLAAGCKQILVPFPPQTAASPDEQKVFALWESGDMSDQHRQVLLEIFSKNYRVRRNMIQSRLTQECGEDLSKQEVDKVLKDCCVSYGGMWYLKGTVQS\n>6qiu_P mol:protein length:10  Ataxin-1 phosphopeptide\nKRRWSAPESR\n>7dbc_D mol:protein length:445  Tubulin beta chain\nMREIVHIQAGQCGNQIGAKFWEVISDEHGIDPTGSYHGDSDLQLERINVYYNEATGNKYVPRAILVDLEPGTMDSVRSGPFGQIFRPDNFVFGQSGAGNNWAKGHYTEGAELVDSVLDVVRKESESCDCLQGFQLTHSLGGGTGSGMGTLLISKIREEYPDRIMNTFSVMPSPKVSDTVVEPYNATLSVHQLVENTDETYCIDNEALYDICFRTLKLTTPTYGDLNHLVSATMSGVTTCLRFPGQLNADLRKLAVNMVPFPRLHFFMPGFAPLTSRGSQQYRALTVPELTQQMFDSKNMMAACDPRHGRYLTVAAIFRGRMSMKEVDEQMLNVQNKNSSYFVEWIPNNVKTAVCDIPPRGLKMSATFIGNSTAIQELFKRISEQFTAMFRRKAFLHWYTGEGMDEMEFTEAESNMNDLVSEYQQYQDATADEQGEFEEEEGEDEA\n>2kd3_A mol:protein length:113  
Sclerostin\nGSHMNGGRPPHHPYDAKDVSEYSCRELHYTRFLTDGPCRSAKPVTELVCSGQCGPARLLPNAIGRVKWWRPNGPDFRCIPDRYRAQRVQLLCPGGAAPRSRKVRLVASCKCKR\n>3e15_D mol:protein length:312  Glucose-6-phosphate 1-dehydrogenase\nMAHHHHHHMDCQALAKSLEQMNHLHNVKYLEAKDLTDFNQKSAYYICHQIAEKQLSKEGGHVVIGLSGGKTPIDVYKNIALVKDIKIDTSKLIFFIIDERYKRDDHKFSNYNNIKFLFESLKINEKEQLYRPDTSKNIVECVRDYNEKIKNMVKKYTKVDIAILGMGSDFHIASLFPNIFFNIYMNNYQNSYIYDESSIKVANSNDTSDNDNLDLLKEYVYFTTTNNFDVRKRITVSLDLLGNASSKIFLLNSTDKLDLWKNMLLKSYVDVNYCLYPAVYLIDSMNTTVVTCGYTNYPQMLEDIYVSNSSLS\n>6xhv_1S mol:protein length:112  50S ribosomal protein L18\nMARLTAYERRKFRVRNRIKRTGRLRLSVFRSLKHIYAQIIDDEKGVTLVSASSLALKLKGNKTEVARQVGRALAEKALALGIKQVAFDRGPYKYHGRVKALAEGAREGGLEF\n>4l1u_E mol:protein length:138  RNA polymerase-associated protein RTF1 homolog\nGDITHMVSLPEELNRVRLSRHKLERWCHMPFFAKTVTGCFVRIGIGNHNSKPVYRVAEITGVVETAKVYQLGGTRTNKGLQLRHGNDQRVFRLEFVSNQEFTESEFMKWKEAMFSAGMQLPTLDEINKKELSIKEALN\n>4v3p_LX mol:protein length:122  60S ribosomal protein L23a\nRKSKKIRTSVTFHRPKTLKKARDPKYPRVSAPGRNKLDQYQILKYPLTTESAMKKIEDNNTLVFIVDLKADKKKIKAAVKKMYDIQAKKVNTLIRPDGKKKAYVKLTPDYDALDVANKIGII\n>6vwr_A mol:protein length:346  Clavaminate synthase 3\nMGSSHHHHHHSSGLVPRGSHMMMTVVDCSEYSADLLALASRLPRIPRQDLYGFLDAAHEAAGDLPEGLGTALDRFNADGSHDGYLMLRGLPVEDDDDLPATPTSTPAPVDRPLQNMEAMLAVIGRRLGLHTGYRELRSGTVYHDVYPSPGAHHLSSETSETLLEFHTEMAYHVLQPNYVMLACSRADHERKAATLVGSIRKALPLIPEEVRARLFDRPMPCCVDVAFRGGVENPGAIANVKPLYGDPRDPFLGYDRELLAPREPDDVEAVAVLSKALDEVSEAVRLTPGDLLVVDNFRTTHARTPFSPRWDGKDRWLHRVYIRTDRNDQLSGGERAGDVVDFSPRR\n>6hsv_A mol:protein length:124  Toxin B subunit\nTPQNITDLCAEYHNTQIYTLNDKIFSYTESLAGKREMAIITFKNGAIFQVEVPGSQHIDSQKKAIERMKDTLRIAYLTEAKVEKLCVWNNKTPHAIAAISMANGVSALEKEVSALKEKVSALEF\n>4u1v_DW mol:protein length:76  50S ribosomal protein L27\nTRNGRDSEAKRLGVKRFGGESVLAGSIIVRQRGTKFHAGANVGCGRDHTLFAKADGKVKFEVKGPKNRKFISIEAE\n>5s53_D mol:protein length:445  Tubulin beta-2B 
chain\nMREIVHIQAGQCGNQIGAKFWEVISDEHGIDPTGSYHGDSDLQLERINVYYNEATGNKYVPRAILVDLEPGTMDSVRSGPFGQIFRPDNFVFGQSGAGNNWAKGHYTEGAELVDSVLDVVRKESESCDCLQGFQLTHSLGGGTGSGMGTLLISKIREEYPDRIMNTFSVMPSPKVSDTVVEPYNATLSVHQLVENTDETYCIDNEALYDICFRTLKLTTPTYGDLNHLVSATMSGVTTCLRFPGQLNADLRKLAVNMVPFPRLHFFMPGFAPLTSRGSQQYRALTVPELTQQMFDSKNMMAACDPRHGRYLTVAAIFRGRMSMKEVDEQMLNVQNKNSSYFVEWIPNNVKTAVCDIPPRGLKMSATFIGNSTAIQELFKRISEQFTAMFRRKAFLHWYTGEGMDEMEFTEAESNMNDLVSEYQQYQDATADEQGEFEEEEGEDEA\n>3tbt_I mol:protein length:9  GLYCOPROTEIN G1\nKAPSNFATM\n>6yfg_LM mol:protein length:130  coat protein\nSKPIAIFKLRELSSDSTLFTLPGHSVTLPNTLGIVSHLPTPRKGNPGTVKTMRNLRKTILLGAGTASERAVPIVIKTETSFPVGTTEEDRAEVLKQMASFLIEEVKNNQELAYSGYVQDKYFIEDLVITE\n>2b9v_H mol:protein length:652  alpha-amino acid ester hydrolase\nAPAADAAQAHDPLSVQTGSDIPASVHMPTDQQRDYIKREVMVPMRDGVKLYTVIVIPKNARNAPILLTRTPYNAKGRANRVPNALTMREVLPQGDDVFVEGGYIRVFQDIRGKYGSQGDYVMTRPPHGPLNPTKTDETTDAWDTVDWLVHNVPESNGRVGMTGSSYEGFTVVMALLDPHPALKVAAPESPMVDGWMGDDWFHYGAFRQGAFDYFVSQMTARGGGNDIPRRDADDYTNFLKAGSAGSFATQAGLDQYPFWQRMHAHPAYDAFWQGQALDKILAQRKPTVPMLWEQGLWDQEDMWGAIHAWQALKDADVKAPNTLVMGPWRHSGVNYNGSTLGPLEFEGDTAHQYRRDVFRPFFDEYLKPGSASVHLPDAIIYNTGDQKWDYYRSWPSVCESNCTGGLTPLYLADGHGLSFTHPAADGADSYVSDPAHPVPFISRPFAFAQSSRWKPWLVQDQREAESRPDVVTYETEVLDEPVRVSGVPVADLFAATSGTDSDWVVKLIDVQPAMTPDDPKMGGYELPVSMDIFRGRYRKDFAKPEALQPDATLHYHFTLPAVNHVFAKGHRIMVQIQSSWFPLYDRNPQKFVPNIFDAKPADYTVATQSIHHGGKEATSILLPVVKQKLGPEQKLISEEDLNSAVDHHHHHH\n>7z1z_G mol:protein length:281  Pol polyprotein\nWIENIPLAEEEHNKWHQDAVSLHLEFGIPRTAAEDIVQQCDVCQENKMPSTLRGSNKRGIDHWQVDYTHYEDKIILVWVETNSGLIYAERVKGETGQEFRVQTMKWYAMFAPKSLQSDNGPAFVAESTQLLMKYLGIEHTTGIPWNPQSQALVERTHQTLKNTLEKLIPMFNAFESALAGTLITLNIKRKGGLGTSPMDIFIFNKEQQRIQQQSKSKQEKIRFCYYRTRKRGHPGEWQGPTQVLWGGDGAIVVKDRGTDRYLVIANKDVKFIPPPKEIQKE\n>5lj5_O mol:protein length:590  Pre-mRNA-splicing factor 
CEF1\nMPPVPIYVKGGVWTNVEDQILKAAVQKYGTHQWSKVASLLQKKTARQSELRWNEYLNPKLNFTEFSKEEDAQLLDLARELPNQWRTIADMMARPAQVCVERYNRLLESEDSGGAALSTGVTDLKAGDINPNAETQMARPDNGDLEDEEKEMLAEARARLLNTQGKKATRKIRERMLEESKRIAELQKRRELKQAGINVAIKKPKKKYGTDIDYNEDIVYEQAPMPGIYDTSTEDRQIKKKFEQFERKVNRKGLDGNKDKPSKKNKDKKRKHDENEHVEKAALGESTTLTDEYKKPKLILSAPGTKQGKVTYKKKLESKRQKLIEAQATGTVLTPKELLPHDSGQEDNERSNIKSGKQLKSRIRKFLVQMFASLPSPKNDFEIVLSEDEKEEDAEIAEYEKEFENERAMNEEDNFIEPPSQNDAPRVSLVAVPLAYSTLPIPEFKNNPQSAIDNKYNLLVANAINKEPHMVPEDTVDFLKEVESRMQHITQGRTSMKIQFKTAMPPTEVLLESIQSKVESIEQLQRKLQHVQPLEQQNNEMCSTLCHHSLPALIEGQRKYYADYYAYRQEIRSLEGRRKRLQAMLNSSSSI\n>6j8m_D mol:protein length:147  Cytochrome c oxidase subunit 4 isoform 1\nAHGSVVKSEDYALPSYVDRRDYPLPDVAHVKNLSASQKALKEKEKASWSSLSIDEKVELYRLKFKESFAEMNRSTNEWKTVVGAAMFFIGFTALLLIWEKHYVYGPIPHTFEEEWVAKQTKRMLDMKVAPIQGFSAKWDYDKNEWKK\n>6vw1_F mol:protein length:217  SARS-CoV-2 chimeric RBD\nRVVPSGDVVRFPNITNLCPFGEVFNATKFPSVYAWERKKISNCVADYSVLYNSTFFSTFKCYGVSATKLNDLCFSNVYADSFVVKGDDVRQIAPGQTGVIADYNYKLPDDFMGCVLAWNTRNIDATSTGNYNYKYRLFRKSNLKPFERDISTEIYQAGSTPCNGVEGFNCYFPLQSYGFQPTNGVGYQPYRVVVLSFELLNAPATVCGPKLSTDLIK\n>3n99_b mol:protein length:290  uncharacterized protein TM1086\nHHHHHHGHMRTNKDRLVRISVVGEIAPAKMRSPYSVTTEGTVRVIPVLGGITYNVKVGDSAYGWAGDHVEPGVSVMARRKEEEIPLMTLSCIGNEVIVMSGDAKGSRGFVTGKHGGVNHVLVHFEEEVLGKLMVGDKILIKAWGQGLKLLDHPDVKVMNIDPDLFEKLGIQEKNGKIHVPVVAKIPAHMMGSGIGASSSASTDYDIMASNPEDLGVADLKLGDIVAIQDHDNSYGVGKYRKGAVSIGVVVHSACVSAGHGPGVVVIMTGDESKILPEEVERANISDYLVR\n>2j1k_M mol:protein length:197  FIBER PROTEIN\nMRGSHHHHHHGSPPAAPITLWTGPGPSINGFINDTPVIRCFICLTRDSNLVTVNASFVGEGGYRIVSPTQSQFSLIMEFDQFGQLMSTGNINSTTTWGEKPWGNNTVQPRPSHTWKLCMPNREVYSTPAATISRCGLDSIAVDGAPSRSIDCMLIINKPKGVATYTLTFRFLNFNRLSGGTLFKTDVLTFTYVGENQ\n>5dc3_D1 mol:protein length:87  40S ribosomal protein S21-A\nMENDKGQLVELYVPRKCSATNRIIKADDHASVQINVAKVDEEGRAIPGEYVTYALSGYVRSRGESDDSLNRLAQNDGLLKNVWSYSR\n>1nun_A mol:protein length:145  Fibroblast growth 
factor-10\nGRHVRSYNHLQGDVRWRKLFSFTKYFLKIEKNGKVSGTKKENCPYSILEITSVEIGVVAVKAINSNYYLAMNKKGKLYGSKEFNNDCKLKERIEENGYNTYASFNWQHNGRQMYVALNGKGAPRRGQKTRRKNTSAHFLPMVVHS\n>2w58_A mol:protein length:202  PRIMOSOME COMPONENT (HELICASE LOADER)\nDERKRQESLIQSMFMPREILRASLSDVDLNDDGRIKAIRFAERFVAEYEPGKKMKGLYLHGSFGVGKTYLLAAIANELAKRNVSSLIVYVPELFRELKHSLQDQTMNEKLDYIKKVPVLMLDDLGAEAMSSWVRDDVFGPILQYRMFENLPTFFTSNFDMQQLAHHLTYSQRGEEEKVKAARIMERIRYLAYPIEITGPNRR\n>4bp7_CY mol:protein length:129  COAT PROTEIN\nASNFTQFVLVDNGGTGDVTVAPSNFANGVAEWISSNSRSQAYKVTCSVRQSSAQNRKYTIKVEVPKVATQTVGGVELPVAAWRSYLNMELTIPIFATNSDCELIVKAMQGLLKDGNPIPSAIAANSGIY\n>6kbp_A mol:protein length:338  D-amino-acid oxidase\nMRVVVIGAGVIGLSTALCIHERYHSVLQPLDIKVYADRFTPLTTTDVAAGLWQPYLSDPNNPQEADWSQQTFDYLLSHVHSPNAENLGLFLISGYNLFHEAIPDPSWKDTVLGFRKLTPRELDMFPDYGYGWFHTSLILEGKNYLQWLTERLTERGVKFFQRKVESFEEVAREGADVIVNCTGVWAGALQRDPLLQPGRGQIMKVDAPWMKHFILTHDLERGIYNSPYIIPGTQTVTLGGIFQLGNWSELNNIQDHNTIWEGCCRLEPTLKNARIIGERTGFRPVRPQIRLEREQLRTGPSNTEVIHNYGHGGYGLTIHWGCALEAAKLFGRILEEKK\n>6yfg_HY mol:protein length:130  coat protein\nSKPIAIFKLRELSSDSTLFTLPGHSVTLPNTLGIVSHLPTPRKGNPGTVKTMRNLRKTILLGAGTASERAVPIVIKTETSFPVGTTEEDRAEVLKQMASFLIEEVKNNQELAYSGYVQDKYFIEDLVITE\n>2wqj_K mol:protein length:35  TUMOR PROTEIN P73\nGSDEDTYYLQVRGRENFEILMKLKESLELMELVPQ\n>3lyc_F mol:protein length:241  Putative pectinase\nGGDGNITTENIPVSEYDCLELEGGGMVVNYTQSDAPEGLEIKTDRNIFEKYEFNVENHKLKIRPKKEFRKHTNFRPTEFMVTANSRNLKKLAAAGSTHVNINSPLQAEEFEAGLAGSGIIQFHDTASFTNLKIEIAGSGDFVGHKVYCEELNGDMAGSNTIVLGGTVGIAEFSIAGSGTVRAFDCTMDELECKIAGSGDIEAFVVNKIKAEIAGSGSVKYKGDPQDIQKKVMGSGKIEKVE\n>6oj2_QQ mol:protein length:105  30S ribosomal protein S17\nMPKKVLTGVVVSDKMQKTVTVLVERQFPHPLYGKVIKRSKKYLAHDPEEKYKLGDVVEIIESRPISKRKRFRVLRLVESGRMDLVEKYLIRRQNYESLSKRGGKA\n>3sln_J mol:protein length:311  
Capsid\nESRTKPFTVPILTVEEMTNSRFPIPLEKLFTGPSSAFVVQPQNGRCTTDGALLGTTQLSPVDICTFRGDVTHIAGTQNYTMNLASQNWNNYDPTEEIPAPLGTPDFVGKIQGVLTQTTRRDGSTRGHKATVSTGSVHFTPKLGSVQFSTDTSNDFETGQNTRFTPVGVVQDGSTTHQNEPQQWVLPDYSGRDSHNVHLAPAVAPTFPGEQLLFFRSTMPGCSGYPNMNLDCLLPQEWVQHFYQESAPAQSDVALLRFVNPDTGRVLFECKLHKSGYVTVAHTGQHDLVIPPNGYFRFDSWVNQFYTLAPMG\n>6yfh_AK mol:protein length:156  coat protein\nPAMTNIVLRDDQTSVATKTLIPIVSDGNMSVWRENAANVPIDGQIKLTGQWERMKDGTYRLNAKLEVPVMETAGAGGAYVAPPKVAYKVTASLTLYAPSRSTIADRANAMKMLSAVLCGADATAGTTLSPQSVTGDAWKNSALPFVFGFINQAFPT\n>4qe8_D mol:protein length:13  Nuclear receptor coactivator 2\nKENALLRYLLDKD\n>5gaq_I mol:protein length:310  Lysenin\nMSAKAAEGYEQIEVDVVAVWKEGYVYENRGSTSVDQKITITKGMKNVNSETRTVTATHSIGSTISTGDAFEIGSVEVSYSHSHEESQVSMTETEVYESKVIEHTITIPPTSKFTRWQLNADVGGADIEYMYLIDEVTPIGGTQSIPQVITSRAKIIVGRQIILGKTEIRIKHAERKEYMTVVSRKSWPAATLGHSKLFKFVLYEDWGGFRIKTLNTMYSGYEYAYSSDQGGIYFDQGTDNPKQRWAINKSLPLRHGDVVTFMNKYFTRSGLCYDDGPATNVYCLDKREDKWILEVVGLVPRGSGHHHHHH\n>4c5q_B mol:protein length:79  PHOSPHOPROTEIN\nMGDHYDDELFSDVQDIKTALAKIHEDNQKIISKLESLLLLKGEVESIKKQINRQNISISTLEGHLSSIMIAIPHHHHHH\n>6f2n_A mol:protein length:227  Metallo-beta-lactamase type 2\nSQKVEKTVIKNETGTISISQLNKNVWVHTELGSFNGEAVPSNGLVLNTSKGLVLVDSSWDDKLTKELIEMVEKKFQKRVTDVIITHAHADRIGGIKTLKERGIKAHSTALTAELAKKNGYEEPLGDLQTVTNLKFGNMKVETFYPGKGHTEDNIVVWLPQYNILVGGCLVKSTSAKDLGNVADAYVNEWSTSIENVLKRYRNINAVVPGHGEVGDKGLLLHTLDLLK\n>5ef0_F mol:protein length:74  Transcription attenuation protein MtrB\nMYTNSDFVVIKALEDGVNVIGLTRGADTRFHHSEKLDKGEVLIAQFTEHTSAIKVRGKAYIQTRHGVIESEGKK\n>3tsz_A mol:protein length:391  Tight junction protein ZO-1\nGSHMILRPSMKLVKFRKGDSVGLRLAGGNDVGIFVAGVLEDSPAAKEGLEEGDQILRVNNVDFTNIIREEAVLFLLDLPKGEEVTILAQKKKDVYRRIVESDVGDSFYIRTHFEYEKESPYGLSFNKGEVFRVVDTLYNGKLGSWLAIRIGKNHKEVERGIIPNKNRAEQLASVQYTLPKTAGGDRADFWRFRGLRSSKRNLRKSREDLSAQPVQTKFPAYERVVLREAGFLRPVTIFGPIADVAREKLAREEPDIYQIAKSEPRDAGTDQRSSGIIRLHTIKQIIDQDKHALLDVTPNAVDRLNYAQWYPIVVFLNPDSKQGVKTMRMRLCPESRKSARKLYERSHKLRKNNHHLFTTTINLNSMNDGWYGALKEAIQQQQNQLVWVSEG\n>3jaj_d mol:protein 
length:107  Ribosomal protein eL31\nNEVVTREYTINIHKRIHGVGFKKRAPRALKEIRKFAMKEMGTPDVRIDTRLNKAVWAKGIRNVPYRIRVRLSRKRNEDEDSPNKLYTLVTYVPVTTFKNLQTVNVDE\n>5a1v_E mol:protein length:874  COATOMER SUBUNIT GAMMA-1\nMLKKFDKKDEESGGGSNPLQHLEKSAVLQEARVFNETPINPRKCAHILTKILYLINQGEHLGTTEATEAFFAMTKLFQSNDPTLRRMCYLTIKEMSCIAEDVIIVTSSLTKDMTGKEDNYRGPAVRALCQITDSTMLQAVERYMKQAIVDKVPSVSSSALVSSLHLLKCSFDVVKRWVNEAQEAASSDNIMVQYHALGLLYHVRKNDRLAVSKMISKFTRHGLKSPFAYCMMIRVASKQLEEEDGSRDSPLFDFIESCLRNKHEMVVYEAASAIVNLPGCSAKELAPAVSVLQLFCSSPKAALRYAAVRTLNKVAMKHPSAVTACNLDLENLVTDSNRSIATLAITTLLKTGSESSIDRLMKQISSFMSEISDEFKVVVVQAISALCQKYPRKHAVLMNFLFTMLREEGGFEYKRAIVDCIISIIEENSESKETGLSHLCEFIEDCEFTVLATRILHLLGQEGPKTNNPSKYIRFIYNRVVLEHEEVRAGAVSALAKFGAQNEEMLPSILVLLKRCVMDDDNEVRDRATFYLNVLEQKQKALNAGYILNGLTVSIPGLEKALQQYTLEPSEKPFDLKSVPLATTPMAEQRPESTATAAVKQPEKVAATRQEIFQEQLAAVPEFQGLGPLFKSSPEPVALTESETEYVIRCTKHTFSDHLVFQFDCTNTLNDQTLENVTVQMEPTEAYEVLSYVPARSLPYNQPGTCYTLVALPTEDPTAVACTFSCVMKFTVKDCDPNTGEIDEEGYEDEYVLEDLEVTVADHIQKVMKVNFEAAWDEVGDEFEKEETFTLSTIKTLEEAVGNIVKFLGMHPCERSDKVPENKNTHTLLLAGVFRGGHDILVRSRLLLLDTVTMQVTARSSEELPVDIILASVG\n>1b12_C mol:protein length:248  SIGNAL PEPTIDASE I\nVRSFIYEPFQIPSGSMMPTLLIGDFILVEKFAYGIKDPIYQKTLIETGHPKRGDIVVFKYPEDPKLDYIKRAVGLPGDKVTYDPVSKELTIQPGCSSGQACENALPVTYSNVEPSDFVQTFSRRNGGEATSGFFEVPKNETKENGIRLSERKETLGDVTHRILTVPIAQDQVGMYYQQPGQQLATWIVPPGQYFMMGDNRDNSADSRYWGFVPEANLVGRATAIWMSFDKQEGEWPTGLRLSRIGGIH\n>1ev4_D mol:protein length:221  GLUTATHIONE S-TRANSFERASE A1-1\nSGKPVLHYFNARGRMECIRFLLAAAGVEFDEKFIQSPEDLEKLKKDGNLMFDQVPMVEIDGMKLAQTRAILNYIATKYDLYGKDMKERALIDMYSEGILDLTEMIMQLVICPPDQKEAKTALAKDRTKNRYLPAFEKVLKSHGQDYLVGNKLTRVDIHLLELLLYVEEFDASLLTSFPLLKAFKSRISSLPNVKKFLQPGSQRKLPMDAKQIEEARKIYKF\n>7eyd_V4 mol:protein length:173  C-phycocyanin beta subunit\nMTLDVFTKVVSQADSRGEFLSNEQLDALANVVKEGNKRLDVVNRITSNASAIVTNAARALFEEQPQLIAPGGNAYTNRRMAACLRDMEIILRYVTYAILAGDASVLDDRCLNGLRETYQALGTPGSSVAVGVQKMKDAAVGIANDPNGITKGDCSQLISEVASYFDRAAAAVG\n>2cvk_A mol:protein length:110  
Thioredoxin\nMAKPIEVTDQNFDETLGQHPLVLVDFWAEWCAPCRMIAPILEEIAKEYEGKLLVAKLDVDENPKTAMRYRVMSIPTVILFKDGQPVEVLVGAQPKRNYQAKIEKHLPATA\n>4ctf_D3 mol:protein length:226  P1\nAPIRVVSVPESDSFMSSVPDNSTPLYPKVVVPPRQVPGRFTNFIDVAKQTYSFCSISGKPYFEVTNTSGDEPLFQMDVSLSAAELHGTYVASLSSFFAQYRGSLNFNFIFTGAAATKAKFLVAFVPPHSAAPKTRDEAMACIHAVWDVGLNSAFSFNVPYSSPADFMAVYSAEATVVNVSGWLQVYALTALTSTDIAVNSKGRVLVAVSAGPDFSLRHPVDLPDKQ\n>6vgn_G mol:protein length:200  ATP-dependent Clp protease proteolytic subunit\nILPSFIEHSSFGVKESNPYNKLFEERIIFLGVQVDDASANDIMAQLLVLESLDPDRDITMYINSPGGGFTSLMAIYDTMQYVRADIQTVCLGQAASAAAVLLAAGTPGKRMALPNARVLIHQPSLSGVIQGQFSDLEIQAAEIERMRTLMETTLARHTGKDAGVIRKDTDRDKILTAEEAKDYGIIDTVLEYRKLSAQTA\n>6ase_A mol:protein length:170  GTPase KRas\nGMTEYKLVVVGAGGVGKSALTIQLIQNHFVDEYDPTIEDSYRKQVVIDGETCLLDILDTGGQEEYSAMRDQYMRTGEGFLCVFAINNTKSFEDIHHYREQIKRVKDSEDVPMVLVGNKCDLPSRTVDTKQAQDLARSYGIPFIETSAKTRQGVDDAFYTLVREIRKHKEK\n>1nno_B mol:protein length:543  NITRITE REDUCTASE\nKDDMKAAEQYQGAASAVDPAHVVRTNGAPDMSESEFNEAKQIYFQRCAGCHGVLRKGATGKPLTPDITQQRGQQYLEALITYGTPLGMPNWGSSGELSKEQITLMAKYIQHTPPQPPEWGMPEMRESWKVLVKPEDRPKKQLNDLDLPNLFSVTLRDAGQIALVDGDSKKIVKVIDTGYAVHISRMSASGRYLLVIGRDARIDMIDLWAKEPTKVAEIKIGIEARSVESSKFKGYEDRYTIAGAYWPPQFAIMDGETLEPKQIVSTRGMTVDTQTYHPEPRVAAIIASHEHPEFIVNVKETGKVLLVNYKDIDNLTVTSIGAAPFLHDGGWDSSHRYFMTAANNSNKVAVIDSKDRRLSALVDVGKTPHPGRGANFVHPKYGPVWSTSHLGDGSISLIGTDPKNHPQYAWKKVAELQGQGGGSLFIKTHPKSSHLYVDTTFNPDARISQSVAVFDLKNLDAKYQVLPIAEWADLGEGAKRVVQPEYNKRGDEVWFSVWNGKNDSSALVVVDDKTLKLKAVVKDPRLITPTGKFNVYNTQHDVY\n>6u3m_C mol:protein length:191  HLA class II histocompatibility antigen, DQ alpha 1 chain\nEDIVADHVASYGVNLYQSYGPSGQYTHEFDGDEQFYVDLGRKETVWSLPVLRQFRFDPQFALTNIAVLKHNLNSLIKRSNSTAATNEVPEVTVFSKSPVTLGQPNILICLVDNIFPPVVNITWLSNGHSVTEGVSETSFLSKSDHSFFKISYLTLLPSAEESYDCKVEHWGLDKPLLKHWEPETSGDDDDK\n>6wdh_z mol:protein length:58  50S ribosomal protein L30\nAKTIKITQTRSAIGRLPKHKATLLGLGLRRIGHTVEREDTPAIRGMINAVSFMVKVEE\n>4nrl_D mol:protein length:182  Hemagglutinin HA2 
chain\nGFFGAIAGFLEGGWEGMIAGWHGYTSHGAHGVAVAADLKSTQEAINKITKNLNSLSELEVKNLQRLSGAMNELHDEILELDEKVDDLRADTISSQIELAVLLSNEGIINSEDEHLLALERKLKKMLGPSAVEIGNGCFETKHKCNQTCLDRIAAGTFNAGDFSLPTFDSLNITAASGALVPR\n>43ca_H mol:protein length:117  PROTEIN (IMMUNOGLOBULIN (HEAVY CHAIN))\nQVQLVESGPGLVAPSQSLSITCTVSGISLSRYNVHWVRQSPGKGLEWLGMIWGGGSIEYNPALKSRLSISKDNSKSQIFLKMNSLQTDDSAMYYCVSYGYGGDRFSYWGQGTLVTVS\n>5us9_c mol:protein length:541  Capsid protein VP2\nMSENEIQDQQPSDSMDGQRGGGGGATGSVGGGKGSGVGISTGGWVGGSYFTDSYVITKNTRQFLVKIQNNHQYKTELISPSTSQGKSQRCVSTPWSYFNFNQYSSHFSPQDWQRLTNEYKRFRPKGMHVKIYNLQIKQILSNGADTTYNNDLTAGVHIFCDGEHAYPNATHPWDEDVMPELPYQTWYLFQYGYIPVIHELAEMEDSNAVEKAICLQIPFFMLENSDHEVLRTGESTEFTFNFDCEWINNERAYIPPGLMFNPLVPTRRAQYIRRNNNPQTAESTSRIAPYAKPTSWMTGPGLLSAQRVGPATSDTGAWMVAVKPENASIDTGMSGIGSGFDPPQGSLAPTNLEYKIQWYQTPQGTNNNGNIISNQPLSMLRDQALFRGNQTTYNLCSDVWMFPNQIWDRYPITRENPIWCKKPRSDKHTTIDPFDGSLAMDHPPGTIFIKMAKIPVPSNNNADSYLNIYCTGQVSCEIVWEVERYATKNWRPERRHTTFGLGIGGADNLNPTYHVDKNGTYIQPTTWDMCFPVKTNINKVL\n>8dja_G mol:protein length:123  Major prion protein\nGSKKRPKPGGWNTGGSRYPGQGSPGGNRYPPQGGTWGQPHGGGWGQPHGGSWGQPHGGSWGQPHGGGWGQGGGTHNQWNKPSKPKTNLKHVAGAAAAGAVVGGLGGYMLGSAMSRPMIHFGND\n>4z96_A mol:protein length:530  Ubiquitin carboxyl-terminal hydrolase 7\nSGPLGSEAHLYMQVQIVAEDQFCGHQGNDMYDEEKVKYTVFKVLKNSSLAEFVQSLSQTMGFPQDQIRLWPMQARSNGTKRPAMLDNEADGNKTMIELSDNENPWTIFLETVDPELAASGATLPKFDKDHDVMLFLKMYDPKTRSLNYCGHIYTPISCKIRDLLPVMCDRAGFIQDTSLILYEEVKPNLTERIQDYDVSLDKALDELMDGDIIVFQKDDPENDNSELPTAKEYFRDLYHRVDVIFCDKTIPNDPGFVVTLSNRMNYFQVAKTVAQRLNTDPMLLQFFKSQGYRDGPGNPLRHNYEGTLRDLLQFFKPRQPKKLYYQQLKMKITDFENRRSFKCIWLNSQFREEEITLYPDKHGCVRDLLEECKKAVELGEKASGKLRLLEIVSYKIIGVHQEDELLECLSPATSRTFRIEEIPLDQVDIDKENEMLVTVAHFHKEVFGTFGIPFLLRIHQGEHFREVMKRIQSLLDIQEKEFEKFKFAIVMMGRHQYINEDEYEVNLKDFEPQPGNMSHPRPWLGLDHFN\n>3d2c_A mol:protein length:181  Lipase\nAEHNPVVMVHGIGGSSSNFEGIKSYLVSQGWSRDKLYAVDFWDKTGTNYNNGPVLSRFVQKVLDETGAKKVDIVAHSMGGANTLYYIKYLDGGNKVANVVTLGGANRLTTDKAPPGTDPNQKILYTSIYSSDDMIVMNYLSRLDGARNVQIHGVGHMGLLYSSQVYSLIKEGLNGGGQNTN\n>6yxl_HHH 
mol:protein length:221  ACPA F3 Fab fragment - heavy chain\nQVQLVQSGAEVKKPGASVRVSCKASGFVTDYFIQWVRQAPGQGPEWMAWINPHNGETDYAPKLQDRVTVTCDTSTNTAFMELSRLTSDDTALYYCGRSGRTDARRAPVSYWGQGALVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKRVEP\n>2jdt_I mol:protein length:20  CAMP-DEPENDENT PROTEIN KINASE INHIBITOR ALPHA\nTTYADFIASGRTGRRNAIHD\n>4qua_D mol:protein length:6  ACE-ASP-GLU-VAL-ASP-CHLOROMETHYLKETONE INHIBITOR\nXDEVDX\n>3daq_C mol:protein length:292  Dihydrodipicolinate synthase\nTHLFEGVGVALTTPFTNNKVNLEALKAHVNFLLENNAQAIIVNGTTAESPTLTTDEKELILKTVIDLVDKRVPVIAGTGTNDTEKSIQASIQAKALGADAIMLITPYYNKTNQRGLVKHFEAIADAVKLPVVLYNVPSRTNMTIEPETVEILSQHPYIVALKDATNDFEYLEEVKKRIDTNSFALYSGNDDNVVEYYQRGGQGVISVIANVIPKEFQALYDAQQSGLDIQDQFKPIGTLLSALSVDINPIPIKALTSYLGFGNYELRLPLVSLEDTDTKVLREAYDTFKAGE\n>2ddw_B mol:protein length:283  Pyridoxine kinase\nMSSLLLFNDKSRALQADIVAVQSQVVYGSVGNSIAVPAIKQNGLNVFAVPTVLLSNTPHYDTFYGGAIPDEWFSGYLRALQERDALRQLRAVTTGYMGTASQIKILAEWLTALRKDHPDLLIMVDPVIGDIDSGIYVKPDLPEAYRQYLLPLAQGITPNIFELEILTGKNCRDLDSAIAAAKSLLSDTLKWVVVTSASGNEENQEMQVVVVTADSVNVISHSRVKTDLKGTGDLFCAQLISGLLKGKALTDAVHRAGLRVLEVMRYTQQHESDELILPPLAEA\n>6xt5_A mol:protein length:451  Legumain\nRGSHHHHHHGSEVGTRWAVLVAGSNGYGNYRHQADVCHAYQLLIKGGVKEENIVVFMYDDIAYNAMNPRPGVIINHPQGPDVYAGVPKDYTGEDVTPENLYAVILGDKSKVKGGSGKVINSNPEDRIFIFYSNHGGPGVLGMPNAPFVYAMDFIDVLKKKHASGGYKEMVIYIEACESGSIFEGIMPKDLNIYVTTASNAQENSFGTYCPGMNPPPPEEYVTCLGDLYSVSWMEDSETHNLKRETVQQQYQSVRKRTSNSNSYRFGSHVMQYGDTNITAEKLYLYHGFDPATVNFPPHNGNLEAKMEVVNQRDAELLFMWQMYQRSNHQPEKKTHILEQITETVKHRNHLDGSVELIGVLLYGPGKSSSVLHSVRAPGLPLVDDWTCLKSMVRVFETHCGSLTQYGMKHMRAFGNVCNSGVSKASMEEACKAACGGYDAGLLYPSNTGYSA\n>6l3t_E mol:protein length:279  Gap junction gamma-3 
protein\nMCGRFLRRLLAEESRRSTPVGRLLLPVLLGFRLVLLAASGPGVYGDEQSEFVCHTQQPGCKAACFDAFHPLSPLRFWVFQVILVAVPSALYMGFTLYHVIWHWELSGKGKEEETLIQGREGNTDVPGAGSLRLLWAYVAQLGARLVLEGAALGLQYHLYGFQMPSSFACRREPCLGSITCNLSRPSEKTIFLKTMFGVSGFCLLFTFLELVLLGLGRWWRTWKHKSSSSKYFLTSESTRRHKKATDSLPVVETKEQFQEAVPGRSLAQEKQRPVGPRDA\n>3uk4_B mol:protein length:6  C-terminal peptide from Lactotransferrin\nLEACAF\n>1ztg_A mol:protein length:74  POLY(RC)-BINDING PROTEIN 1\nGILTIRLLMHGKEVGSIIGKKGESVKRIREESGARINISEGNCPERIITLTGPTNAIFKAFAMIIDKLEEDINS\n>1usv_H mol:protein length:170  AHA1\nMRGSHHHHHHGMASMVVNNPNNWHWVDKNCIGWAKEYFKQKLVGVEAGSVKDKKYAKIKSVSSIEGDCEVNQRKGKVISLFDLKITVLIEGHVDSKDGSALPFEGSINVPEVAFDSEASSYQFDISIFKETSELSEAKPLIRSELLPKLRQIFQQFGKDLLATHGNDIQV\n>5mfc_B mol:protein length:257  (KR)4-Green fluorescent protein,Green fluorescent protein\nGPGSGSPKRKRKRKREGKLMSKGEELFTGVVPILVELDGDVNGHKFSVRGEGEGDATNGKLTLKFICTTGKLPVPWPTLVTTLTYGVQCFSRYPDHMKRHDFFKSAMPEGYVQERTISFKDDGTYKTRAEVKFEGDTLVNRIELKGIDFKEDGNILGHKLEYNFNSHNVYITADKQKNGIKANFKIRHNVEDGSVQLADHYQQNTPIGDGPVLLPDNHYLSTQSVLSKDPNEKRDHMVLLEFVTAAGITHGMDELYK\n>4v7s_CF mol:protein length:100  30S ribosomal protein S6\nMRHYEIVFMVHPDQSEQVPGMIERYTAAITGAEGKIHRLEDWGRRQLAYPINKLHKAHYVLMNVEAPQEVIDELETTFRFNDAVIRSMVMRTKHAVTEAS\n>6zvt_ZA mol:protein length:258  Vipp1\nMGLFDRIKRVVSSNLNDLVNKAEDPEKMLEQAILEMQEDLVQLRQGVAQAIAAQKRSEKQYNDAQNEINKWQRNAQLALQKGDENLARQALERKKTYTDTSAALKASLDTQSTQVETLKRNLIQLESKISEAKTKKEMLKARITTAKAQEQLQGMVRGMNTSSAMSAFERMEEKVLMQESRAQALGELAGADLETQFAQLEGGSDVDDELAALKAQMLPPATPVTQAQLPPQQETTPAKSNEVVDAELDSLRKQLDQL\n>6pg2_A mol:protein length:189  Thiol:disulfide interchange protein DsbA\nAQYEDGKQYTTLEKPVAGAPQVLEFFSFFCPHCYQFEEVLHISDNVKKKLPEGVKMTKYHVNFMGGDLGKDLTQAWAVAMALGVEDKVTVPLFEGVQKTQTIRSASDIRDVFINAGIKGEEYDAAWNSFVVKSLVAQQEKAAADVQLRGVPAMFVNGKYQLNPQGMDTSNMDVFVQQYADTVKYLSEKK\n>6pm2_B mol:protein length:458  Glycine receptor subunit 
alphaZ1\nMFALGIYLWETIVFFSLAASQQAAARKAASPMPPSEFLDKLMGKVSGYDARIRPNFKGPPVNVTCNIFINSFGSIAETTMDYRVNIFLRQQWNDPRLAYSEYPDDSLDLDPSMLDSIWKPDLFFANEKGANFHEVTTDNKLLRISKNGNVLYSIRITLVLACPMDLKNFPMDVQTCIMQLESFGYTMNDLIFEWDEKGAVQVADGLTLPQFILKEEKDLRYCTKHYNTGKFTCIEARFHLERQMGYYLIQMYIPSLLIVILSWVSFWINMDAAPARVGLGITTVLTMTTQSSGSRASLPKVSYVKAIDIWMAVCLLFVFSALLEYAAVNFIARQHKELLRFQRRRRHLKEDEAGDGRFSFAAYGMGPACLQAKDGMAIKGNNNNAPTSTNPPEKTVEEMRKLFISRAKRIDTVSRVAFPLVFLIFNIFYWITYKIIRSEDIHKQLVPRGSHHHHHHHH\n>5nc7_J mol:protein length:12  ActA-derived 10-mer Ac-FPPPPTEDEL-NH2 with acetylated (Ac) and amidated (NH2) termini. Phe is substitued by Trp to increase affinity for crystallization\nXWPPPPTEDELX\n>7cwl_B mol:protein length:1273  Spike glycoprotein\nMFVFLVLLPLVSSQCVNLTTRTQLPPAYTNSFTRGVYYPDKVFRSSVLHSTQDLFLPFFSNVTWFHAIHVSGTNGTKRFDNPVLPFNDGVYFASTEKSNIIRGWIFGTTLDSKTQSLLIVNNATNVVIKVCEFQFCNDPFLGVYYHKNNKSWMESEFRVYSSANNCTFEYVSQPFLMDLEGKQGNFKNLREFVFKNIDGYFKIYSKHTPINLVRDLPQGFSALEPLVDLPIGINITRFQTLLALHRSYLTPGDSSSGWTAGAAAYYVGYLQPRTFLLKYNENGTITDAVDCALDPLSETKCTLKSFTVEKGIYQTSNFRVQPTESIVRFPNITNLCPFGEVFNATRFASVYAWNRKRISNCVADYSVLYNSASFSTFKCYGVSPTKLNDLCFTNVYADSFVIRGDEVRQIAPGQTGKIADYNYKLPDDFTGCVIAWNSNNLDSKVGGNYNYLYRLFRKSNLKPFERDISTEIYQAGSTPCNGVEGFNCYFPLQSYGFQPTNGVGYQPYRVVVLSFELLHAPATVCGPKKSTNLVKNKCVNFNFNGLTGTGVLTESNKKFLPFQQFGRDIADTTDAVRDPQTLEILDITPCSFGGVSVITPGTNTSNQVAVLYQDVNCTEVPVAIHADQLTPTWRVYSTGSNVFQTRAGCLIGAEHVNNSYECDIPIGAGICASYQTQTNSPRRARSVASQSIIAYTMSLGAENSVAYSNNSIAIPTNFTISVTTEILPVSMTKTSVDCTMYICGDSTECSNLLLQYGSFCTQLNRALTGIAVEQDKNTQEVFAQVKQIYKTPPIKDFGGFNFSQILPDPSKPSKRSFIEDLLFNKVTLADAGFIKQYGDCLGDIAARDLICAQKFNGLTVLPPLLTDEMIAQYTSALLAGTITSGWTFGAGAALQIPFAMQMAYRFNGIGVTQNVLYENQKLIANQFNSAIGKIQDSLSSTASALGKLQDVVNQNAQALNTLVKQLSSNFGAISSVLNDILSRLDKVEAEVQIDRLITGRLQSLQTYVTQQLIRAAEIRASANLAATKMSECVLGQSKRVDFCGKGYHLMSFPQSAPHGVVFLHVTYVPAQEKNFTTAPAICHDGKAHFPREGVFVSNGTHWFVTQRNFYEPQIITTDNTFVSGNCDVVIGIVNNTVYDPLQPELDSFKEELDKYFKNHTSPDVDLGDISGINASVVNIQKEIDRLNEVAKNLNESLIDLQELGKYEQYIKWPWYIWLGFIAGLIAIVMVTIMLCCMTSCCSCLKGCCSCGSCCKFDEDDSEPVLKGVKLHYT\n>7oo
2_B mol:protein length:214  anti-MenX Fab light chain\nETTVTQSPASLSVATGEKVTIRCITSTDIDDDMTWYQQKPGEPPKLLISEATTLRPGVPSRFSASGYGTDFVFTIENTLSEDVADYYCLQSDNMPYTFGGGTKLEIKRADAAPTVSIFPPSSEQLTSGGASVVCFLNNFYPKDINVKWKIDGSERQNGVLNSWTDQDSKDSTYSMSSTLTLTKDEYERHNSYTCEATHKTSTSPIVKSFNRNEC\n>1h4l_D mol:protein length:147  CYCLIN-DEPENDENT KINASE 5 ACTIVATOR\nSTSELLRCLGEFLCRRCYRLKHLSPTDPVLWLRSVDRSLLLQGWQDQGFITPANVVFLYMLCRDVISSEVGSDHELQAVLLTCLYLSYSYMGNEISYPLKPFLVESCKEAFWDRCLSVINLMSSKMLQINADPHYFTQVFSDLKNES\n>3b07_A mol:protein length:309  Gamma-hemolysin component B\nMGHHHHHHAMEGKITPVSVKKVDDKVTLYKTTATADSDKFKISQILTFNFIKDKSYDKDTLVLKATGNINSGFVKPNPNDYDFSKLYWGAKYNVSISSQSNDSVNVVDYAPKNQNEEFQVQNTLGYTFGGDISISNGLSGGLNGNTAFSETINYKQESYRTTLSRNTNYKNVGWGVEAHKIMNNGWGPYGRDSFHPTYGNELFLAGRQSSAYAGQNFIAQHQMPLLSRSNFNPEFLSVLSHRQDGAKKSKITVTYQREMDLYQICWNGFYWAGANYKNFKTRTFKSTYEIDWENHKVKLLDTKETENNK\n>6zqn_B mol:protein length:510  ATP synthase subunit alpha, mitochondrial\nEKTGTAEVSSILEERILGADTSVDLEETGRVLSIGDGIARVHGLRNVQAEEMVEFSSGLKGMSLNLEPDNVGVVVFGNDKLIKEGDIVKRTGAIVDVPVGEELLGRVVDALGNAIDGKGPIGSKARRRVGLKAPGIIPRISVREPMQTGIKAVDSLVPIGRGQRELIIGDRQTGKTSIAIDTIINQKRFNDGTDEKKKLYCIYVAIGQKRSTVAQLVKRLTDADAMKYTIVVSATASDAAPLQYLAPYSGCSMGEYFRDNGKHALIIYDDLSKQAVAYRQMSLLLRRPPGREAYPGDVFYLHSRLLERAAKMNDAFGGGSLTALPVIETQAGDVSAYIPTNVISITDGQIFLETELFYKGIRPAINVGLSVSRVGSAAQTRAMKQVAGTMKLELAQYREVAAFAQFGSDLDAATQQLLSRGVRLTELLKQGQYSPMAIEEQVAVIYAGVRGYLDKLEPSKITKFENAFLSHVISQHQALLGKIRTDGKISEESDAKLKEIVTNFLAGFEA\n>7oue_C mol:protein length:242  N-glycosylase/DNA lyase\nGSHMIARIIGEIGIEGARFIEENIDEQFKALRYLSKGIDSETFVKLVIANSLVSYQLTGKGEQWWWEFAKYFYGRDVKSIYLAYKEFLPNSRFNRRLIPQKLSRIRRVETFLSTLTEERIEEYYGDMSSLWGSIARALGVDKESKTVVFSVKMFGYAARIVLSTFNPYPMEIPIPEDSRIVKLTKKLTNEKPRKFWMKIARESGVPPLHIDSILWPLLGGASIDSAPPELRDKLAELIKIIR\n>6vyy_h mol:protein length:273  50S ribosomal protein 
L2\nMAVVKCKPTSPGRRHVVKVVNPELHKGKPFAPLLEKNSKSGGRNNNGRITTRHIGGGHKQAYRIVDFKRNKDGIPAVVERLEYDPNRSANIALVLYKDGERRYILAPKGLKAGDQIQSGVDAAIKPGNTLPMRNIPVGSTVHNVEMKPGKGGQLARSAGTYVQIVARDGAYVTLRLRSGEMRKVEADCRATLGEVGNAEHMLRVLGKAGAARWRGVRPTVRGTAMNPVDHPHGGGEGRNFGKHPVTPWGVQTKGKKTRSNKRTDKFIVRRRSK\n>6hgh_B mol:protein length:40  Alpha-1-antichymotrypsin\nSALVETRTIVRFNRPFLMIIVDHFTWSIFFMSKVTNPKQA\n>4g7g_B mol:protein length:448  sterol 14-alpha-demethylase\nGKLPPVYPVTVPILGHIIQFGKSPLGFMQECKRQLKSGIFTINIVGKRVTIVGDPHEHSRFFLPRNEVLSPREVYSFMVPVFGEGVAYAAPYPRMREQLNFLAEELTIAKFQNFVPAIQHEVRKFMAANWDKDEGEINLLEDCSTMIINTACQCLFGEDLRKRLDARRFAQLLAKMESSLIPAAVFLPILLKLPLPQSARCHEARTELQKILSEIIIARKEEEVNKDSSTSDLLSGLLSAVYRDGTPMSLHEVCGMIVAAMFAGQHTSSITTTWSMLHLMHPANVKHLEALRKEIEEFPAQLNYNNVMDEMPFAERCARESIRRDPPLLMLMRKVMADVKVGSYVVPKGDIIACSPLLSHHDEEAFPEPRRWDPERDEKVEGAFIGFGAGVHKCIGQKFGLLQVKTILATAFRSYDFQLLRDEVPDPDYHTMVVGPTASQCRVKYIRR\n>4glm_A mol:protein length:72  Dynamin-binding protein\nGGAAQPAMAQGALTYGVALYRFQALEPNELDFEVGDKIRILATLEDGWLEGSLKGRTGIFPYRFVKLCPAAA\n>7eyd_V5 mol:protein length:173  C-phycocyanin beta subunit\nMTLDVFTKVVSQADSRGEFLSNEQLDALANVVKEGNKRLDVVNRITSNASAIVTNAARALFEEQPQLIAPGGNAYTNRRMAACLRDMEIILRYVTYAILAGDASVLDDRCLNGLRETYQALGTPGSSVAVGVQKMKDAAVGIANDPNGITKGDCSQLISEVASYFDRAAAAVG\n>1mfr_K mol:protein length:176  M FERRITIN\nMVSQVRQNYHSDCEAAVNRMLNLELYASYTYSSMYAFFDRDDVALHNVAEFFKEHSHEEREHAEKFMKYQNKRGGRVVLQDIKKPERDEWGNTLEAMQAALQLEKTVNQALLDLHKLATDKVDPHLCDFLESEYLEEQVKDIKRIGDFITNLKRLGLPENGMGEYLFDKHSVKESS\n>7nvm_Q mol:protein length:548  T-complex protein 1 subunit 
theta\nMALHVPKAPGFAQMLKEGAKHFSGLEEAVYRNIQACKELAQTTRTAYGPNGMNKMVINHLEKLFVTNDAATILRELEVQHPAAKMIVMASHMQEQEVGDGTNFVLVFAGALLELAEELLRIGLSVSEVIEGYEIACRKAHEILPNLVCCSAKNLRDIDEVSSLLRTSIMSKQYGNEVFLAKLIAQACVSIFPDSGHFNVDNIRVCKILGSGISSSSVLHGMVFKKETEGDVTSVKDAKIAVYSCPFDGMITETKGTVLIKTAEELMNFSKGEENLMDAQVKAIADTGANVVVTGGKVADMALHYANKYNIMLVRLNSKWDLRRLCKTVGATALPRLTPPVLEEMGHCDSVYLSEVGDTQVVVFKHEKEDGAISTIVLRGSTDNLMDDIERAVDDGVNTFKVLTRDKRLVPGGGATEIELAKQITSYGETCPGLEQYAIKKFAEAFEAIPRALAENSGVKANEVISKLYAVHQEGNKNVGLDIEAEVPAVKDMLEAGILDTYLGKYWAIKLATNAAVTVLRVDQIIMAKPAGGPKPPSGKKDWDDDQND\n>6s61_M mol:protein length:182  Ferritin heavy chain\nMTTASPSQVRQNYHQDAEAAINRQINLELYASYVYLSMSCYFDRDDVALKNFAKYFLHQSHEEREHAEKLMKLQNQRGGRIFLQDIKKPDRDDWESGLNAMECALHLEKSVNQSLLELHKLATDKNDPHLCDFIETYYLSEQVKSIKELGDHVTNLRKMGAPEAGMAEYLFDKHTLGHGDES\n>5j8k_F mol:protein length:429  COMPLEX I 51KDA/NDUFV1\nXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXCXXCXXCXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXCXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX\n>4wuz_B mol:protein length:229  Exonuclease\nGSHMTPDIILQRTGIDVRAVEQGDDAWHKLRLGVITASEVHNVIAKPRSGKKWPDMKMSYFHTLLAEVCTGVAPEVNAKALAWGKQYENDARTLFEFTSGVNVTESPIIYRDESMRTACSPDGLCSDGNGLELKCPFTSRDFMKFRLGGFEAIKSAYMAQVQYSMWVTRKNAWYFANYDPRMKREGLHYVVIERDEKYMASFDEIVPEFIEKMDEALAEIGFVFGEQWR\n>7xve_C mol:protein length:215  Sodium channel subunit beta-2\nMHRDAWLPRPAFSLTGLSLFFSLVPPGRSMEVTVPATLNVLNGSDARLPCTFNSCYTVNHKQFSLNWTYQECNNCSEEMFLQFRMKIINLKLERFQDRVEFSGNPSKYDVSVMLRNVQPEDEGIYNCYIMNPPDRHRGHGKIHLQVLMEEPPERDSTVAVIVGASVGGFLAVVILVLMVVKCVRRKKEQKLSTDDLKTEEEGKTDGEGNPDDGAK\n>5nd8_G mol:protein length:179  50S ribosomal protein 
L5\nMNRLKEKFNTEVTENLMKKFNYSSVMEVPKIDKIVVNMGVGDAVQNSKVLDNAVEELELITGQKPLVTKAKKSIATFRLREGMPIGAKVTLRGERMYEFLDKLISVSLPRVRDFQGVSKKAFDGRGNYTLGVKEQLIFPEIDYDKVSKVRGMDIVIVTTANTDEEARELLANFGMPFRK\n>7pr0_E mol:protein length:205  Spike protein S1\nETGHHHHHHTNLCPFGEVFNATRFASVYAWNRKRISNCVADYSVLYNSASFSTFKCYGVSPTKLNDLCFTNVYADSFVIRGDEVRQIAPGQTGKIADYNYKLPDDFTGCVIAWNSNNLDSKVGGNYNYLYRLFRKSNLKPFERDISTEIYQAGSTPCNGVEGFNCYFPLQSYGFQPTNGVGYQPYRVVVLSFELLHAPATVCGKK\n>2af7_A mol:protein length:125  gamma-carboxymuconolactone decarboxylase\nMERYRRGMEILNRMNRKSYTAIRDELEDVAPDLARFVAEFAYGDVYSRGVLDLKTRELLTLAALTVLRADDQLKSHVRGALNAGCSKDEIIEVMIQMAVYAGFPAAINAVLAAKEVFTENDPAEV\n>7ukn_A mol:protein length:1142  DNA damage-binding protein 1\nGAMSYNYVVTAQKPTAVNGCVTGHFTSAEDLNLLIAKNTRLEIYVVTAEGLRPVKEVGMYGKIAVMELFRPKGESKDLLFILTAKYNACILEYKQSGESIDIITRAHGNVQDRIGRPSETGIIGIIDPECRMIGLRLYDGLFKVIPLDRDNKELKAFNIRLEELHVIDVKFLYGCQAPTICFVYQDPQGRHVKTYEVSLREKEFNKGPWKQENVEAEASMVIAVPEPFGGAIIIGQESITYHNGDKYLAIAPPIIKQSTIVCHNRVDPNGSRYLLGDMEGRLFMLLLEKEEQMDGTVTLKDLRVELLGETSIAECLTYLDNGVVFVGSRLGDSQLVKLNVDSNEQGSYVVAMETFTNLGPIVDMCVVDLERQGQGQLVTCSGAFKEGSLRIIRNGIGIHEHASIDLPGIKGLWPLRSDPNRETDDTLVLSFVGQTRVLMLNGEEVEETELMGFVDDQQTFFCGNVAHQQLIQITSASVRLVSQEPKALVSEWKEPQAKNISVASCNSSQVVVAVGRALYYLQIHPQELRQISHTEMEHEVACLDITPLGDSNGLSPLCAIGLWTDISARILKLPSFELLHKEMLGGEIIPRSILMTTFESSHYLLCALGDGALFYFGLNIETGLLSDRKKVTLGTQPTVLRTFRSLSTTNVFACSDRPTVIYSSNHKLVFSNVNLKEVNYMCPLNSDGYPDSLALANNSTLTIGTIDEIQKLHIRTVPLYESPRKICYQEVSQCFGVLSSRIEVQDTSGGTTALRPSASTQALSSSVSSSKLFSSSTAPHETSFGEEVEVHNLLIIDQHTFEVLHAHQFLQNEYALSLVSCKLGKDPNTYFIVGTAMVYPEEAEPKQGRIVVFQYSDGKLQTVAEKEVKGAVYSMVEFNGKLLASINSTVRLYEWTTEKELRTECNHYNNIMALYLKTKGDFILVGDLMRSVLLLAYKPMEGNFEEIARDFNPNWMSAVEILDDDNFLGAENAFNLFVCQKDSAATTDEERQHLQEVGLFHLGEFVNVFCHGSLVMQNLGETSTPTQGSVLFGTVNGMIGLVTSLSESWYNLLLDMQNRLNKVIKSVGKIEHSFWRSFHTERKTEPATGFIDGDLIESFLDISRPKMQEVVANLQYDDGSGMKREATADDLIKVVEELTRIH\n>4i10_A mol:protein length:406  Beta-secretase 
1\nMRGSFVEMVDNLRGKSGQGYYVEMTVGSPPQTLNILVDTGSSNFAVGAAPHPFLHRYYQRQLSSTYRDLRKGVYVPYTQGKWEGELGTDLVSIPHGPNVTVRANIAAITESDKFFINGSNWEGILGLAYAEIARPDDSLEPFFDSLVKQTHVPNLFSLQLCGAGFPLNQSEVLASVGGSMIIGGIDHSLYTGSLWYTPIRREWYYEVIIVRVEINGQDLKMDCKEYNYDKSIVDSGTTNLRLPKKVFEAAVKSIKAASSTEKFPDGFWLGEQLVCWQAGTTPWNIFPVISLYLMGEVTNQSFRITILPQQYLRPVEDVATSQDDCYKFAISQSSTGTVMGAVIMEGFYVVFDRARKRIGFAVSACHVHDEFRTAAVEGPFVTLDMEDCGYNIPQTDESRSHHHHHH\n>5j88_D1 mol:protein length:56  50S ribosomal protein L32\nAVQQNKPTRSKRGMRRSHDALTAVTSLSVDKTSGEKHLRHHITADGYYRGRKVIAK\n>6wl8_oA mol:protein length:29  Form 2 peptide\nQAKILEADAEILKAYAKILEAHAEILKAQ\n>4z3s_1q mol:protein length:105  30S ribosomal protein S17\nMPKKVLTGVVVSDKMQKTVTVLVERQFPHPLYGKVIKRSKKYLAHDPEEKYKLGDVVEIIESRPISKRKRFRVLRLVESGRMDLVEKYLIRRQNYESLSKRGGKA\n>1tyq_D mol:protein length:300  Arp2/3 complex 34kDa subunit\nMILLEVNNRIIEETLALKFENAAAGNKPEAVEVTFADFDGVLYHISNPNGDKTKVMVSISLKFYKELQAHGADELLKRVYGSYLVNPESGYNVSLLYDLENLPASKDSIVHQAGMLKRNCFASVFEKYFQFQEEGKEGENRAVIHYRDDETMYVESKKDRVTVVFSTVFKDDDDVVIGKVFMQEFKEGRRASHTAPQVLFSHREPPLELKDTDAAVGDNIGYITFVLFPRHTNASARDNTINLIHTFRDYLHYHIKCSKAYIHTRMRAKTSDFLKVLNRARPDAEKKEMKTITGKTFSSR\n>7jxs_F mol:protein length:137  Matrix protein\nGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGRLQPSLQTGSEELRSLYNTIAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQVSQNYHHHHHH\n>1ww4_D mol:protein length:160  galectin\nTTSAVNIYNISAGASVDLAAPVTTGDIVTFFSSALNLSAGAGSPNNTALNLLSENGAYLLHIAFRLQENVIVFNSRQPNAPWLVEQRVSNVANQFIGSGGKAMVTVFDHGDKYQVVINEKTVIQYTKQISGTTSSLSYNSTEGTSIFSTVVEAVTYTGLA\n>3waa_G mol:protein length:131  Histone H2A.V\nGSHMAGGKAGKDSGKAKAKAVSRSQRAGLQFPVGRIHRHLKTRTTSHGRVGATAAVYSAAILEYLTAEVLELAGNASKDLKVKRITPRHLQLAIRGDEELDSLIKATIAGGGVIPHIHKSLIGKKGQQKTA\n>6ryr_H mol:protein length:123  Histone H2B 1.1\nMAKSAPAPKKGSKKAVTKTQKKDGKKRRKTRKESYAIYVYKVLKQVHPDTGISSKAMSIMNSFVNDVFERIAGEASRLAHYNKRSTITSREIQTAVRLLLPGELAKHAVSEGTKAVTKYTSAK\n>6umr_A mol:protein length:441  Damage-control phosphatase 
DUF89\nMAVVPASLSGQDVGSFAYLTIKDRIPQILTKVIDTLHRHKSEFFEKHGEEGVEAEKKAISLLSKLRNELQTDKPFIPLVEKFVDTDIWNQYLEYQQSLLNESDGKSRWFYSPWLLVECYMYRRIHEAIIQSPPIDYFDVFKESKEQNFYGSQESIIALCTHLQQLIRTIEDLDENQLKDEFFKLLQISLWGNKCDLSLSGGESSSQNTNVLNSLEDLKPFILLNDMEHLWSLLSNCKKTREKASATRVYIVLDNSGFELVTDLILADFLLSSELATEVHFYGKTIPWFVSATTIHDFNWLIEQVKHSNHKWMSKCGADWEEYIKMGKWVYHNHIFWTLPHEYCAMPQVAPDLYAELQKAHLILFKGDLNYRKLTGDRKWEFSVPFHQALNGFHPAPLCTIRTLKAEIQVGLQPGQGEQLLASEPSWWTTGKYGIFQYDGPL\n>1m64_A mol:protein length:571  flavocytochrome c3\nADNLAEFHVQNQECDSCHTPDGELSNDSLTYENTQCVSCHGTLAEVAETTKHEHYNAHASHFPGEVACTSCHSAHEKSMVYCDSCHSFDFNMPYAKKWLRDEPTIAELAKDKSERQAALASAPHDTVDVVVVGSGGAGFSAAISATDSGAKVILIEKEPVIGGNAKLAAGGMNAAWTDQQKAKKITDSPELMFEDTMKGGQNINDPALVKVLSSHSKDSVDWMTAMGADLTDVGMMGGASVNRAHRPTGGAGVGAHVVQVLYDNAVKRNIDLRMNTRGIEVLKDDKGTVKGILVKGMYKGYYWVKADAVILATGGFAKNNERVAKLDPSLKGFISTNQPGAVGDGLDVAENAGGALKDMQYIFAHPTLSVKGGVMVTEAVRGNGAILVNREGKRFVNEITTRDKASAAILAQTGKSAYLIFDDSVRKSLSKIDKYIGLGVAPTADSLVKLGKMEGIDGKALTETVARYNSLVSSGKDTDFERPNLPRALNEGNYYAIEVTPGVHHTMGGVMIDTKAEVMNAKKQVIPGLYGAGEVTGGVHGANRLGGNAISDIITFGRLAGEEAAKYSKKN\n>5kwy_D mol:protein length:133  Epididymal secretory protein E1\nEPVQFKDCGSVDGVIKEVNVSPCPTQPCQLSKGQSYSVNVTFTSNIQSKSSKAVVHGILMGVPVPFPIPEPDGCKSGINCPIQKDKTYSYLNKLPVKSEYPSIKLVVEWQLQDDKNQSLFCWEIPVQIVSHLA\n>5jc9_AU mol:protein length:56  30S ribosomal protein S21\nPVIKVRENEPFDVALRRFKRSCEKAGVLAEVRRREFYEKPTTERKRAKASAVKRHA\n>2jd7_C mol:protein length:174  FERRITIN HOMOLOG\nMLSERMLKALNDQLNRELYSAYLYFAMAAYFEDLGLEGFANWMKAQAEEEIGHALRFYNYIYDRNGRVELDEIPKPPKEWESPLKAFEAAYEHEKFISKSIYELAALAEEEKDYSTRAFLEWFINEQVEEEASVKKILDKLKFAKDSPQILFMLDKELSARAPKLPGLLMQGGE\n>4r6o_H mol:protein length:19  Agglutinin beta-3 chain\nEQSGISQTVIVGPWGAKVS\n>2hzi_B mol:protein length:277  Proto-oncogene tyrosine-protein kinase 
ABL1\nGAMDPSPNYDKWEMERTDITMKHKLGGGQYGEVYEGVWKKYSLTVAVKTLKEDTMEVEEFLKEAAVMKEIKHPNLVQLLGVCTREPPFYIITEFMTYGNLLDYLRECNRQEVNAVVLLYMATQISSAMEYLEKKNFIHRDLAARNCLVGENHLVKVADFGLSRLMTGDTYTAHAGAKFPIKWTAPESLAYNKFSIKSDVWAFGVLLWEIATYGMSPYPGIDLSQVYELLEKDYRMERPEGCPEKVYELMRACWQWNPSDRPSFAEIHQAFETMFQES\n>6wyd_E mol:protein length:467  Myeloperoxidase heavy chain\nVNCETSCVQQPPCFPLKIPPNDPRIKNQADCIPFFRSCPACPGSNITIRNQINALTSFVDASMVYGSEEPLARNLRNMSNQLGLLAVNQRFQDNGRALLPFDNLHDDPCLLTNRSARIPCFLAGDTRSSEMPELTSMHTLLLREHNRLATELKSLNPRWDGERLYQEARKIVGAMVQIITYRDYLPLVLGPTAMRKYLPTYRSYNDSVDPRIANVFTNAFRYGHTLIQPFMFRLDNRYQPMEPNPRVPLSRVFFASWRVVLEGGIDPILRGLMATPAKLNRQNQIAVDEIRERLFEQVMRIGLDLPALNMQRSRDHGLPGYNAWRRFCGLPQPETVGQLGTVLRNLKLARKLMEQYGTPNNIDIWMGGVSEPLKRKGRVGPLLACIIGTQFRKLRDGDRFWWENEGVFSMQQRQALAQISLPRIICDNTGITTVSKNNIFMSNSYPRDFVNCSTLPALNLASWREAS\n>3cgx_A mol:protein length:242  Putative nucleotide-diphospho-sugar transferase\nGMSESCILFFVKYPEPGKVKTRLGEVVGNDKAAMLYRHFVQDMLQGLARLHADLHICYVPGDADLPEKFKAWLGPQHMFAAQQGLDLGERMKHAMQKAFDDGYDRVVLMGSDIPDYPCELVQKALNDLQHYDAAIGPAFDGGYYLIGFRKDSFCPDVFDGIRWGEADVYQPTVEKMRRARLEVLQLPDWNDVDTVWDLNVLYRTNKNSSFRRSSTYALLRENDALIRQYDIDLPGMAPVEKE\n>3dke_X mol:protein length:164  Lysozyme\nMNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAAAINLVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL\n>6jxq_A mol:protein length:147  Lysozyme C\nMRSLLILVLCFLPLAALGKVFGRCELAAAMKRHGLDNYRGYSLGNWVCAAKFESNFNTQATNRNTDGSTDYGILQINSRWWCNDGRTPGSRNLCNIPCSALLSSDITASVNCAKKIVSDGNGMNAWVAWRNRCKGTDVQAWIRGCRL\n>1ju2_A mol:protein length:536  hydroxynitrile 
lyase\nLATTSDHDFSYLSFAYDATDLELEGSYDYVIVGGGTSGCPLAATLSEKYKVLVLERGSLPTAYPNVLTADGFVYNLQQEDDGKTPVERFVSEDGIDNVRGRVLGGTSIINAGVYARANTSIYSASGVDWDMDLVNQTYEWVEDTIVYKPNSQSWQSVTKTAFLEAGVHPNHGFSLDHEEGTRITGSTFDNKGTRHAADELLNKGNSNNLRVGVHASVEKIIFSNAPGLTATGVIYRDSNGTPHQAFVRSKGEVIVSAGTIGTPQLLLLSGVGPESYLSSLNIPVVLSHPYVGQFLHDNPRNFINILPPNPIEPTIVTVLGISNDFYQCSFSSLPFTTPPFGFFPSSSYPLPNSTFAHFASKVAGPLSYGSLTLKSSSNVRVSPNVKFNYYSNLTDLSHCVSGMKKIGELLSTDALKPYKVEDLPGVEGFNILGIPLPKDQTDDAAFETFCRESVASYWHYHGGCLVGKVLDGDFRVTGINALRVVDGSTFPYTPASHPQGFYLMLGRYVGIKILQERSASDLKILDSLKSAASLVL\n>3oi9_A mol:protein length:164  Molybdenum cofactor synthesis domain\nGPGSMTTRSARVIIASTRASSGEYEDRCGPIITEWLAQQGFSSAQPEVVADGSPVGEALRKAIDDDVDVILTSGGTGIAPTDSTPDQTVAVVDYLIPGLAEAIRQSGLPKVPTSVLSRGVCGVAGQTLIVNLPGSPGGVRDGLGVLAGVLDHALDQLAGKDHPR\n>5zf0_C1 mol:protein length:80  Photosystem I iron-sulfur center\nAHTVKIYDTCIGCTQCVRACPTDVLEMVPWDGCKAGQIASSPRTEDCVGCKRCETACPTDFLSIRVYLGAETTRSMGLAY\n>3fq3_H mol:protein length:197  Inorganic pyrophosphatase:Bacterial/Archaeal inorganic pyrophosphatase\nMAHHHHHHMGTLEAQTQGPGSMNIDAISIGSNPPEDVNVIIEVPVGGQPIKYEMDKKAGALIVDRFLYTPMTYPGNYGFVPHTLSEDGDPIDVLVCNTRPLIPGCVINVRPIGVLVMEDNSGKDEKIIAVPSPHLTRRYEKIHDYTDMPEITLKQIAHFFEHYKDLEPGKWVKIGDWGDEDYARKFIVEAIERAKGK\n>7s5z_A mol:protein length:390  ATP-sensitive inward rectifier potassium channel 11\nMLSRKGIIPEEYVLTRLAEDPAKPRYRARQRRARFVSKKGNCNVAHKNIREQGRFLQDVFTTLVDLKWPHTLLIFTMSFLCSWLLFAMAWWLIAFAHGDLAPSEGTAEPCVTSIHSFSSAFLFSIEVQVTIGFGGRMVTEECPLAILILIVQNIVGLMINAIMLGSIFMKTAQAHRRAETLIFSKHAVIALRHGRLCFMLRVGDLRKSMIISATIHMQVVRKTTSPEGEVVPLHQVDIPMENGVGGNSIFLVAPLIIYHVIDANSPLYDLAPSDLHHHQDLEIIVILEGVVETTGITTQARTSYLADEILWGQRFVPIVAEEDGRYSVDYSKFDNTVKVPTPLCTARQLDEDHSLLEALTLASARGPLRKRSVPMAKAKPKFSISPDSLS\n>6zsb_g mol:protein length:166  39S ribosomal protein L49, mitochondrial\nMAATMFRATLRGWRTGVQRGCGLRLLSQTQGPPDYPRFVESVDEYQFVERLLPATRIPDPPKHEHYPTPSGWQPPRDPPPNLPYFVRRSRMHNIPVYKDITHGNRQMTVIRKVEGDIWALQKDVEDFLSPLLGKTPVTQVNEVTGTLRIKGYFDQELKAWLLEKGF\n>7xoa_C mol:protein length:1270  Spike 
glycoprotein\nMFVFLVLLPLVSSQCVNLITRTQSYTNSFTRGVYYPDKVFRSSVLHSTQDLFLPFFSNVTWFHAIHVSGTNGTKRFDNPVLPFNDGVYFASTEKSNIIRGWIFGTTLDSKTQSLLIVNNATNVVIKVCEFQFCNDPFLDVYYHKNNKSWMESEFRVYSSANNCTFEYVSQPFLMDLEGKQGNFKNLREFVFKNIDGYFKIYSKHTPINLGRDLPQGFSALEPLVDLPIGINITRFQTLLALHRSYLTPGDSSSGWTAGAAAYYVGYLQPRTFLLKYNENGTITDAVDCALDPLSETKCTLKSFTVEKGIYQTSNFRVQPTESIVRFPNITNLCPFDEVFNATRFASVYAWNRKRISNCVADYSVLYNFAPFFAFKCYGVSPTKLNDLCFTNVYADSFVIRGNEVSQIAPGQTGNIADYNYKLPDDFTGCVIAWNSNKLDSKVGGNYNYLYRLFRKSNLKPFERDISTEIYQAGNKPCNGVAGFNCYFPLRSYGFRPTYGVGHQPYRVVVLSFELLHAPATVCGPKKSTNLVKNKCVNFNFNGLTGTGVLTESNKKFLPFQQFGRDIADTTDAVRDPQTLEILDITPCSFGGVSVITPGTNTSNQVAVLYQGVNCTEVPVAIHADQLTPTWRVYSTGSNVFQTRAGCLIGAEYVNNSYECDIPIGAGICASYQTQTKSHGSASSVASQSIIAYTMSLGAENSVAYSNNSIAIPTNFTISVTTEILPVSMTKTSVDCTMYICGDSTECSNLLLQYGSFCTQLKRALTGIAVEQDKNTQEVFAQVKQIYKTPPIKYFGGFNFSQILPDPSKPSKRSPIEDLLFNKVTLADAGFIKQYGDCLGDIAARDLICAQKFNGLTVLPPLLTDEMIAQYTSALLAGTITSGWTFGAGPALQIPFPMQMAYRFNGIGVTQNVLYENQKLIANQFNSAIGKIQDSLSSTPSALGKLQDVVNHNAQALNTLVKQLSSKFGAISSVLNDILSRLDPPEAEVQIDRLITGRLQSLQTYVTQQLIRAAEIRASANLAATKMSECVLGQSKRVDFCGKGYHLMSFPQSAPHGVVFLHVTYVPAQEKNFTTAPAICHDGKAHFPREGVFVSNGTHWFVTQRNFYEPQIITTDNTFVSGNCDVVIGIVNNTVYDPLQPELDSFKEELDKYFKNHTSPDVDLGDISGINASVVNIQKEIDRLNEVAKNLNESLIDLQELGKYEQYIKWPWYIWLGFIAGLIAIVMVTIMLCCMTSCCSCLKGCCSCGSCCKFDEDDSEPVLKGVKLHYT\n>5dgf_M9 mol:protein length:188  60S ribosomal protein L19-A\nANLRTQKRLAASVVGVGKRKVWLDPNETSEIAQANSRNAIRKLVKNGTIVKKAVTVHSKSRTRAHAQSKREGRHSGYGKRKGTREARLPSQVVWIRRLRVLRRLLAKYRDAGKIDKHLYHVLYKESKGNAFKHKRALVEHIIQAKADAQREKALNEEAEARRLKNRAARDRRAQRVAEKRDALLKEDA\n>4otz_A mol:protein length:395  Amino acid/amide ABC transporter substrate-binding protein, HAAT 
family\nSNATNTDTNSTNNSPNNTTNTTTNVTTTSDKNTIPIGIALAQTSNVALLGQEQVAGAKIAEKYFNDKGGVNGTPIKLIFQDTAGDEAGTINAFQTLINKDKVVGIVGPTLSQQAFSANPIAERAKVPVVGPSNTAKGIPEIGDYVARVSAPVSVVAPNSVKAALKQNPNIKKVAVFFAQNDAFSKSETEIFQQTVKDQGLELVTVQKFQTTDTDFQSQATNAINLKPDLVIISGLAADGGNLVRQLRELGYQGAIIGGDGLNTSNVFAVCKALCDGVLIAQAYSPEYTGEINKAFRQAYVDQYKKEPPQFSAQAFAAVQVYVESLKALDTKNKVSKIQLPELRTELNKQLLTGKYNTPLGEISFTPIGEVVQKDFYVAQIKMEKDGSQGKFTFLK\n>1dps_L mol:protein length:167  DPS\nMSTAKLVKSKATNLLYTRNDVSDSEKKATVELLNRQVIQFIDLSLITKQAHWNMRGANFIAVHEMLDGFRTALIDHLDTMAERAVQLGGVALGTTQVINSKTPLKSYPLDIHNVQDHLKELADRYAIVANDVRKAIGEAKDDDTADILTAASRDLDKFLWFIECNIE\n>7wxi_A mol:protein length:776  Delta-1-pyrroline-5-carboxylate synthase\nMLQNSFKLAQSLRNGFYRNAWRAFSSHGPRQPLVSPERRLEKAHPTFTERSQLKYARRLVVKLGSAVITREDNHGLALGRLASIVEQVAECHLEGREVMMVTSGAVAFGKQKLAQELLMSLSMRETLNPKDSKEFDGATLEPRAAAAVGQSGLMSLYDAMFAQYGVKIAQVLVTKPDFYNEETRNNLFCTLSELISLNIVPIINTNDAVSPPMFIRDDEPAGGARRGIPIKDNDSLSAMLAAEVQADLLILMSDVDGIYNKPPWEDGAKLMHTYTSDDSNSIEFGKKSKVGTGGMDSKVKAATWALDRGVSVVICNGMQEKAIKTIIGGRKVGTFFTEATESANAVPVEVMAENARTGSRQMQALTPAQRASAVNTLADLLVSREKFILDANAKDLAEAQKSGLAKPLLSRLSLNPAKLKNLSVGLKQIAEDSHKNVGRVLRRTRLADQLELKQVTVPIGVLLVIFESRPDSLPQVAALAMASANGLLLKGGKEAAHSNKALMELVKEALATVGAEHAVSLVSTREEISDLLSMENHIDLIIPRGSSDLVRSIQQQSLHIPVLGHAEGVCHVYIDRDADLEKALRIARDAKCDYPAACNAMETLLIHEDLMSGAIFGDVCNMLKREGVKIYAGPRLNQQLTFGPPAAKSLKHEYGALECCIEVVPSLDEAINHIHTYGSSHTDVIVTENDAAARQFLGSVDSACVFHNASSRFADGFRFGLGAEVGISTARIHARGPVGVEGLLTTKWILEGQDHAAADFAEGGGRTWLHETLPLD\n>4u1v_B3 mol:protein length:64  50S ribosomal protein L35\nPKIKTVRGAAKRFKKTGKGGFKHKHANLRHILTKKATKRKRHLRPKAMVSKGDLGLVIACLPYA\n>5l5h_J mol:protein length:198  Proteasome subunit beta type-4\nMDIILGIRVQDSVILASSKAVTRGISVLKDSDDKTRQLSPHTLMSFAGEAGDTVQFAEYIQANIQLYSIREDYELSPQAVSSFVRQELAKSIRSRRPYQVNVLIGGYDKKKNKPELYQIDYLGTKVELPYGAHGYSGFYTFSLLDHHYRPDMTTEEGLDLLKLCVQELEKRMPMDFKGVIVKIVDKDGIRQVDDFQAQ\n>6mu3_M mol:protein length:225  Fab 2G12, heavy 
chain\nEVQLVESGGGLVKAGGSLILSCGVSNFRISAHTMNWVRRVPGGGLEWVASISTSSTYRDYADAVKGRFTVSRDDLEDFVYLQMHKMRVEDTAIYYCARKGSDRLSDNDPFDAWGPGTVVTVSPASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKS\n>3sud_B mol:protein length:203  NS3 protease, NS4A protein\nGSHMASMKKKGSVVIVGRINLSGDTAYAQQTRGEEGCQETSQTGRDKNQVEGEVQIVSTATQTFLATSINGVLWTVYHGAGTRTIASPKGPVTQMYTNVDKDLVGWQAPQGSRSLTPCTCGSSDLYLVTRHADVIPVRRRGDSRGSLLSPRPISYLKGSAGGPLLCPAGHAVGIFRAAVSTRGVAKAVDFIPVESLETTMRSP\n>6bfq_I mol:protein length:127  Granulocyte-macrophage colony-stimulating factor\nAPARSPSPSTQPWEHVNAIQEARRLLNLSRDTAAEMNETVEVISEMFDLQEPTCLQTRLELYKQGLRGSLTKLKGPLTMMASHYKQHCPPTPETSCATQIITFESFKENLKDFLLVIPFDCWEPVQE\n>5fl8_R mol:protein length:189  60S ribosomal protein L19-A\nMANLRTQKRLAASVVGVGKRKVWLDPNETSEIAQANSRNAIRKLVKNGTIVKKAVTVHSKSRTRAHAQSKREGRHSGYGKRKGTREARLPSQVVWIRRLRVLRRLLAKYRDAGKIDKHLYHVLYKESKGNAFKHKRALVEHIIQAKADAQREKALNEEAEARRLKNRAARDRRAQRVAEKRDALLKEDA\n>6hiv_BJ mol:protein length:333  mL76\nMLRLSSWNLKSQHHNVLRRSRPHIHKYRELNRWQRQAQGISKWDQSHSHRPLPYVERFNPESVGLTRGTSAFAWKWWHTQYPWLPNVPPEAAQIDEAQKQERRSHRPPAWDDEFAKVVLNMNDAEIREYLMSKLTDVIFLETQRDGYELRRLDFEGKPLTSLPEPRIIENFVLEEETIRERVIYQVVEGVFRLSPTSADRRELRSVANIIDYVLTHVRAARPTDRERRQERPITSAALAVMQKCPIQPQLGFVHALPHDTRDALLQEWERMHHLDWQFGKAVYTPRSKENVRGNLTWLREDRHYDQRMKFMQEVESGEARAKHMKLIAEAAGN\n>7kf1_B mol:protein length:218  anti-VEGF-A Fab bH1 light chain\nDIQMTQSPSSLSASVGDRVTITCRASQDIPRSISGYVAWYQQKPGKAPKLLIYWGSYLYSGVPSRFSGSGSGTDFTLTISSLQPEDFATYYCQQHYTTPPTFGQGTKVEIKRTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC\n>2v7n_B mol:protein length:229  IMMUNOGLOBULIN HEAVY CHAIN\nQVQLVESGGGLVQPGGSLRLSCAASGFTFRNSAMHWVRQAPGKGLEWVSSIWYSGSNTYYADSVKGRFTISRDNSKNTLYLQMNSLRAEDTAVYYCARFAGGWGAYDVWGQGTLVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSEFHHHHHH\n>4ium_A mol:protein length:142  papain-like protease 
2\nGYNPPGDGACGYRCLAFMNGATVVSAGCSSDLWCDDELAYRVFQLSPTFTVTIPGGRVCPNAKYAMICDKQHWRVKRAKGVGLCLDESCFRGICNCQRMSGPPPAPVSAAVLDHILEAATFGNVRVVTPEGQGSSGHHHHHH\n>5qob_B mol:protein length:189  Thiol:disulfide interchange protein\nAQYEDGKQYTTLEKPVAGAPQVLEFFSFFCPHCYQFEEVLHISDNVKKKLPEGVKMTKYHVNFMGGDLGKDLTQAWAVAMALGVEDKVTVPLFEGVQKTQTIRSASDIRDVFINAGIKGEEYDAAWNSFVVKSLVAQQEKAAADVQLRGVPAMFVNGKYQLNPQGMDTSNMDVFVQQYADTVKYLSEKK\n>7odk_AAA mol:protein length:617  Receptor-like protein kinase HSL1\nGSSMDNQDGFILQQVKLSLDDPDSYLSSWNSNDASPCRWSGVSCAGDFSSVTSVDLSSANLAGPFPSVICRLSNLAHLSLYNNSINSTLPLNIAACKSLQTLDLSQNLLTGELPQTLADIPTLVHLDLTGNNFSGDIPASFGKFENLEVLSLVYNLLDGTIPPFLGNISTLKMLNLSYNPFSPSRIPPEFGNLTNLEVMWLTECHLVGQIPDSLGQLSKLVDLDLALNDLVGHIPPSLGGLTNVVQIELYNNSLTGEIPPELGNLKSLRLLDASMNQLTGKIPDELCRVPLESLNLYENNLEGELPASIALSPNLYEIRIFGNRLTGGLPKDLGLNSPLRWLDVSENEFSGDLPADLCAKGELEELLIIHNSFSGVIPESLADCRSLTRIRLAYNRFSGSVPTGFWGLPHVNLLELVNNSFSGEISKSIGGASNLSLLILSNNEFTGSLPEEIGSLDNLNQLSASGNKFSGSLPDSLMSLGELGTLDLHGNQFSGELTSGIKSWKKLNELNLADNEFTGKIPDEIGSLSVLNYLDLSGNMFSGKIPVSLQSLKLNQLNLSYNRLSGDLPPSLAKDMYKNSFIGNPGLCGDIKGLCGSENEAKKRGYVLEGSENLYFQ\n>1ixm_B mol:protein length:192  PROTEIN (SPORULATION RESPONSE REGULATORY PROTEIN)\nMKDVSKNQEENISDTALTNELIHLLGHSRHDWMNKLQLIKGNLSLQKYDRVFEMIEEMVIDAKHESKLSNLKTPHLAFDFLTFNWKTHYMTLEYEVLGEIKDLSAYDQKLAKLMRKLFHLFDQAVSRESENHLTVSLQTDHPDRQLILYLDFHGAFADPSAFDDIRQNGYEDVDIMRFEITSHECLIEIGLD\n>7c0w_A mol:protein length:406  Sugar ABC transporter, periplasmic sugar-binding protein\nMMKPEDVIKEQCARAKVVAELWHGFTGGAPKAALENLVVEFNKAQQGRCVRPVPQGGYRDLSTKIKAAFAAGKVPTMAQAFENNIALYLEAKALLPIESLGVKLQGVNLTFLNAVRFGGVVYGVPFNKSIQVLYYNKDLLKKHGVPVPATLEEFVAAAKKLSRAEGGPVYWFQPDASTFAYFFFNLGGSYLKDGKLVLNSKEAVEALTLLQNGVKEGWAKPITSGAINQNLGSGPYAFSVDTSAGYTYYLRAAKFDLGVATLPGRTKGQPGYGLVQGTNLVVFRQASKEEQAVAKDFLEFVLSPRAQAVFATATGYVPVTEGALKDPVYQAYAAENPDYATIVRQSRYAKFEPALAEWEQIRFDILGQAIKEAILNKADPKAALDRAQKLAEDLLSSRTRHHHHHH\n>5pln_A mol:protein length:364  Lysine-specific demethylase 
4D\nMHHHHHHSSGVDLGTENLYFQSMETMKSKANCAQNPNCNIMIFHPTKEEFNDFDKYIAYMESQGAHRAGLAKIIPPKEWKARETYDNISEILIATPLQQVASGRAGVFTQYHKKKKAMTVGEYRHLANSKKYQTPPHQNFEDLERKYWKNRIYNSPIYGADISGSLFDENTKQWNLGHLGTIQDLLEKECGVVIEGVNTPYLYFGMWKTTFAWHTEDMDLYSINYLHLGEPKTWYVVPPEHGQRLERLARELFPGSSRGCGAFLRHKVALISPTVLKENGIPFNRITQEAGEFMVTFPYGYHAGFNHGFNCAEAINFATPRWIDYGKMASQCSCGEARVTFSMDAFVRILQPERYDLWKRGQDR\n>7xxg_A mol:protein length:277  VP1\nGDNQDRTVANTQPSGPSNSKEIPALTAVETGHTSQVDPSDTLQTRHVVNFHSRSESTVENFMGRAACVFMDQYKLNGEETSTDNFAVWTINVREMAQLRRKCELFTYMRFDIEMTMVITSCQDQGTQLEQDMPVLTHQIMYVPPGGPIPAKVDSYEWQTSTNPSVFWTEGNAPARMSIPFISVGNAYSLFYDGWSHFTQDGTYGYTTLNAMGKLFVRHVNKSSPHQITSTIRVYFKPKHIKAWVPRPPRLCPYINKGDVNFVVTEVTDARKSITDTP\n>6ynl_A mol:protein length:183  YTHDC1\nMHHHHHHSSGRENLYFQGTSKLKYVLQDARFFLIKSNNHENVSLAKAKGVWSTLPVNEKKLNLAFRSARSVILIFSVRESGKFQGFARLSSESHHGGSPIHWVLPAGMSAKMLGGVFKIDWICRRELPFTKSAHLTNPWNEHKPVKIGRDGQEIELECGTQLCLLFPPDESIDLYQVIHKMRH\n>7xat_A mol:protein length:563  Somatostatin receptor type 2,LargeBit\nMKTIIALSYIFCLVFADYKDDDDKGSGSHHHHHHHHHHLEVLFQGPMDMADEPLNGSHTWLSIPFDLNGSVVSTNTSNQTEPYYDLTSNAVLTFIYFVVCIIGLCGNTLVIYVILRYAKMKTITNIYILNLAIADELFMLGLPFLAMQVALVHWPFGKAICRVVMTVDGINQFTSIFCLTVMSIDRYLAVVHPIKSAKWRRPRTAKMITMAVWGVSLLVILPIMIYAGLRSNQWGRSSCTINWPGESGAWYTGFIIYTFILGFLVPLTIICLCYLFIIIKVKSSGIRVGSSKRKKSEKKVTRMVSIVVAVFIFCWLPFYIFNVSSVSMAISPTPALKGMFDFVVVLTYANSCANPILYAFLSDNFKKSFQNVLCLVKVSGTDDGERSDSKQDKSRLNETTETQRTVFTLEDFVGDWEQTAAYNLDQVLEQGGVSSLLQNLAVSVTPIQRIVRSGENALKIDIHVIIPYEGLSADQMAQIEEVFKVVYPVDDHHFKVILPYGTLVIDGVTPNMLNYFGRPYEGIAVFDGKKITVTGTLWNGNKIIDERLITPDGSMLFRVTINS\n>3k7z_A mol:protein length:33  General control protein GCN4\nRMKQLEDKVEELLSKAYHLENEVARLKKLVGER\n>1uld_C mol:protein length:150  galectin-2\nMLYHLFVNNQVKLQNDFKPESVAAIRSSAFNSKGGTTVFNFLSAGENILLHISIRPGENVIVFNSRLKNGAWGPEERIPYAEKFRPPNPSITVIDHGDRFQIRFDYGTSIYYNKRIKENAAAIAYNAENSLFSSPVTVDVHGLLPPLPPA\n>1nz0_A mol:protein length:118  Ribonuclease P protein 
component\nGSTESFTRRERLRLRRDFLLIFKEGKSLQNEYFVVLFRKNGMDYSRLGIVVKRKFGKATRRNKLKRWVREIFRRNKGVIPKGFDIVVIPRKKLSEEFERVDFWTVREKLLNLLKRIEG\n>7wt2_B mol:protein length:184  Lactoylglutathione lyase\nMAEPQPPSGGLTDEAALSCCSDADPSTKDFLLQQTMLRVKDPKKSLDFYTRVLGMTLIQKCDFPIMKFSLYFLAYEDKNDIPKEKDEKIAWALSRKATLELTHNWGTEDDETQSYHNGNSDPRGFGHIGIAVPDVYSACKRFEELGVKFVKKPDDGKMKGLAFIQDPDGYWIEILNPNKMATLM\n>4v79_AS mol:protein length:81  30S ribosomal protein S19\nXRSLKKGPFIDLHLLKKVEKAVESGDKKPLRTWSRRSTIFPNMIGLTIAVHNGRQHVPVFVTDEMVGHKLGEFAPTRTYRX\n>4prp_B mol:protein length:99  Beta-2-microglobulin\nIQRTPKIQVYSRHPAENGKSNFLNCYVSGFHPSDIEVDLLKNGERIEKVEHSDLSFSKDWSFYLLYYTEFTPTEKDEYACRVNHVTLSQPKIVKWDRDM\n>6zpo_H mol:protein length:146  ATP synthase subunit delta, mitochondrial\nAEAAAAQAPAAGPGQMSFTFASPTQVFFNSANVRQVDVPTQTGAFGILAAHVPTLQVLRPGLVVVHAEDGTTSKYFVSSGSVTVNADSSVQLLAEEAVTLDMLDLGAAKANLEKAQSELLGAADEATRAEIQIRIEANEALVKALE\n>1yxo_B mol:protein length:328  4-hydroxythreonine-4-phosphate dehydrogenase 1\nMSLRFALTPGEPAGIGPDLCLLLARSAQPHPLIAIASRTLLQERAGQLGLAIDLKDVSPAAWPERPAKAGQLYVWDTPLAAPVRPGQLDRANAAYVLETLTRAGQGCLDGHFAGMITAPVHKGVINEAGIPFSGHTEFLADLTHTAQVVMMLATRGLRVALATTHLPLREVADAISDERLTRVARILHADLRDKFGIAHPRILVCGLNPHAGEGGHLGREEIEVIEPCLERLRGEGLDLIGPLPADTLFTPKHLEHCDAVLAMYHDQGLPVLKYKGFGAAVNVTLGLPIIRTSVDHGTALDLAGSGRIDSGSLQVALETAYQMAASRC\n>7n2u_Pp mol:protein length:3  Nascent peptide\nMFK\n>4ui8_C mol:protein length:48  TANKYRASE-2\nMAHSPPGHHSVTGRPSVNGLALAEYVIYRGEQAYPEYLITYQIMRPEG\n>4v8d_DT mol:protein length:96  50S ribosomal protein L23\nMKTAYDVILAPVLSEKAYAGFAEGKYTFWVHPKATKTEIKNAVETAFKVKVVKVNTLHVRGKKKRLGRYLGKRPDRKKAIVQVAPGQKIEALEGLI\n>5dcm_B mol:protein length:243  PhoB family transcriptional regulator\nMSQEQGKIYIVEDDMTIVSLLKDHLSASYHVSSVSNFRDVKQEIIAFQPDLILMDITLPYFNGFYWTAELRKFLTIPIIFISSSNDEMDMVMALNMGGDDFISKPFSLAVLDAKLTAILRRSQQFIQQELTFGGFTLTREGLLSSQDKEVILSPTENKILSILLMHPKQVVSKESLLEKLWENDSFIDQNTLNVNMTRLRKKIVPIGFDYIHTVRGVGYLLQNDPSSSVDKLAAALEHHHHHH\n>6v1q_A mol:protein length:773  Two pore channel 
3\nMSEGKTEKTSHTLTKDEGFTNGGNHVPSNVTDQMTEKFDLATVYVSDAKYNRNIFFDTSPQAVKLYLLYNHWFMQTLVYVFIIINLALALFEDPAVVPLPIWATSTIETICLSAFTVRIIHYAKVIPKDKFWKDPKNICIIIIVTLSFIDMVIYGALKATGHYGIRWSRVLRPLLLVNVTEGRQLRRAFRSIRNALPQISYVFFLFMFSVLVFSLMALKLFGKRGLLTINGSPYFTDYMDIVFDLYVLVTTANSPDVMMPAYNSSVYFTIFFILYIVINTYTFMSFFLAVVYNNYKKYLKEEVRQLVKAKRIKMCRAFSLLQENRGEGGEPVVTQANWNHLVKLVKPKISTAHRELLWSVLDDQNKGHIGKFAFVQLADLLSIQVITVKSQAHPIQICFPSLYNSLPSRFIRQMVHHRVFVYAYDLIILVNAVFIGLDEENPVVSNAEWGFLALYMLEILLKLYATEPRAFFARHQFWNWFDTIIVVSALFGTIINSALKHSGGYTSRQVLDIVFILRVLRLIRVVDSIKRFRAIINTLIKIGPTILTFGQLILVVYYIFAMVGMELFKGKIQFFEPNSTSPDREYCGNPLLKSTSFAKLNYCKNNFNDVISSFILLLELTVVNQWHVLTSGFTAVTHVSARLFFVIFHIVVVIIIINIFVAFILEAFLVEYTVDKSELQTSLEKKIEELELNVQQDGVDTGLVDAMETNDSDLGSSEDGKRKPSLMFKIASRRSRTVDGLLQRMFETDLRPEDFNEEELDNTNFSNPVFDSV\n>6xza_O2 mol:protein length:117  50S ribosomal protein L18\nMDKKSARIRRATRARRKLQELGATRLVVHRTPRHIYAQVIAPNGSEVLVAASTVEKAIAEQLKYTGNKDAAAAVGKAVAERALEKGIKDVSFDRSGFQYHGRVQALADAAREAGLQF\n>7of6_J mol:protein length:192  39S ribosomal protein L11, mitochondrial\nMSKLGRAARGLRKPEVGGVIRAIVRAGLAMPGPPLGPVLGQRGVSINQFCKEFNERTKDIKEGIPLPTKILVKPDRTFEIKIGQPTVSYFLKAAAGIEKGARQTGKEVAGLVTLKHVYEIARIKAQDEAFALQDVPLSSVVRSIIGSARSLGIRVVKDLSSEELAAFQKERAIFLAAQKEADLAAQEEAAKK\n>5ltq_M mol:protein length:269  Green fluorescent protein blFP-Y3\nMRGSHHHHHHGMASMTGGQQMGRDLYDDDDKDPMVSKGEEDNMASLPATHELHIFGSFNGVDFDMVGRGTGNPNDGYEELNLKSTKGALQFSPWILVPQIGYGFHQYLPFPDGMSPFQAAMKDGSGYQVHRTMQFEDGASLTSNYRYTYEGSHIKGEFQVIGTGFPADGPVMTNSLTAADWCVTKMLYPNDKTIISTFDWTYTTGSGKRYQSTARTTYTFAKPMAANILKNQPMFVFRKTELKHSKTELNFKEWQKAFTDVMGMDELYK\n>1rx0_B mol:protein length:393  Acyl-CoA dehydrogenase family member 8, 
mitochondrial\nMVQTGHRSLTSCIDPSMGLNEEQKEFQKVAFDFAAREMAPNMAEWDQKELFPVDVMRKAAQLGFGGVYIQTDVGGSGLSRLDTSVIFEALATGCTSTTAYISIHNMCAWMIDSFGNEEQRHKFCPPLCTMEKFASYCLTEPGSGSDAASLLTSAKKQGDHYILNGSKAFISGAGESDIYVVMCRTGGPGPKGISCIVVEKGTPGLSFGKKEKKVGWNSQPTRAVIFEDCAVPVANRIGSEGQGFLIAVRGLNGGRINIASCSLGAAHASVILTRDHLNVRKQFGEPLASNQYLQFTLADMATRLVAARLMVRNAAVALQEERKDAVALCSMAKLFATDECFAICNQALQMHGGYGYLKDYAVQQYVRDSRVHQILEGSNEVMRILISRSLLQE\n>1c4y_1 mol:protein length:36  THROMBIN:SHORT CHAIN\nTFGSGEADCGLRPLFEKKSLEDKTERELLESYIDGR\n>7tab_A mol:protein length:130  Isoform 4 of Transcription activator BRG1\nGSAEKLSPNPPNLTKKMKKIVDAVIKYKDSSSGRQLSEVFIQLPSRKELPEYYELIRKPVDFKKIKERIRNHKYRSLNDLEKDVMLLCQNAQTFNLEGSLIYEDSIVLQSVFTSVRQKIEKEDDSEGEES\n>6p4h_E mol:protein length:281  uS3\nMSARRRRRRAAFRRRAEPFIPISVREPLPFLSAARGGKMAVQISKKRKFVADGIFKAELNEFLTRELAEDGYSGVEVRVTPTRTEIIILATRTQNVLGEKGRRIRELTAVVQKRFGFPEGSVELYAEKVATRGLCAIAQAESLRYKLLGGLAVRRACYGVLRFIMESGAKGCEVVVSGKLRGQRAKSMKFVDGLMIHSGDPVNYYVDTAVRHVLLRQGVLGIKVKIMLPWDPSGKIGPKKPLPDHVSIVEPKDEILPTTPISEQKGGKPEPPAMPQPVPTA\n>6zzy_7 mol:protein length:221  Chlorophyll a-b binding protein, chloroplastic\nVRELWFPGNKEVVPDYLDGSLVGDHGFDPLGLGSSPEQLSWNVHAEIFHGRLAMTGVAGILLTSLLHKGGADVPEWFEAGRVYLDRNPNVDFGALLFSTIVMSGFVEFKRLNDIRNPGSQGSGILPEDFKGVGGPQGRTVGGPYVGGRYFDPMGLCRGSPEQTLKYKWNEIRNGRLAMMAFLGFAAQYAATGKGPIDNLVDHVADPFHTTFVHNGVSVPFI\n>5ai4_A mol:protein length:549  BIFUNCTIONAL EPOXIDE HYDROLASE 2\nGMTLRAAVFDLDGVLALPAVFGVLGRTEEALALPRGLLNDAFQKGGPEGATTRLMKGEITLSQWIPLMEENCRKCSETAKVCLPKNFSIKEIFDKAISARKINRPMLQAALMLRKKGFTTAILTNTWLDDRAERDGLAQLMCELKMHFDFLIESCQVGMVKPEPQIYKFLLDTLKASPSEVVFLDDIGANLKPARDLGMVTILVQDTDTALKELEKVTGIQLLNTPAPLPTSCNPSDMSHGYVTVKPRVRLHFVELGSGPAVCLCHGFPESWYSWRYQIPALAQAGYRVLAMDMKGYGESSAPPEIEEYCMEVLCKEMVTFLDKLGLSQAVFIGHDWGGMLVWYMALFYPERVRAVASLNTPFIPANPNMSPLESIKANPVFDYQLYFQEPGVAEAELEQNLSRTFKSLFRASDESVLSMHKVCEAGGLFVNSPEEPSLSRMVTEEEIQFYVQQFKKSGFRGPLNWYRNMERNWKWACKSLGRKILIPALMVTAEKDFVLVPQMSQHMEDWIPHLKRGHIEDCGHWTQMDKPTEVNQILIKWLDSDARN\n>6vlz_A0 mol:protein length:218  28S ribosomal 
protein S34, mitochondrial\nMARKKVRPRLIAELARRVRALREQLNRPRDSQLYAVDYETLTRPFSGRRLPVRAWADVRRESRLLQLLGRLPLFGLGRLVTRKSWLWQHDEPCYWRLTRVRPDYTAQNLDHGKAWGILTFKGKTESEAREIEHVMYHDWRLVPKHEEEAFTAFTPAPEDSLASVPYPPLLRAMIIAERQKNGDTSTEEPMLNVQRIRMEPWDYPAKQEDKGRAKGTPV\n>3j3q_eB mol:protein length:231  capsid protein\nPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIEPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVL\n>1c2y_H mol:protein length:156  PROTEIN (LUMAZINE SYNTHASE)\nMNELEGYVTKAQSFRFAIVVARFNEFVTRRLMEGALDTFKKYSVNEDIDVVWVPGAYELGVTAQALGKSGKYHAIVCLGAVVKGDTSHYDAVVNSASSGVLSAGLNSGVPCVFGVLTCDNMDQAINRAGGKAGNKGAESALTAIEMASLFEHHLKA\n>7vfk_B mol:protein length:505  Glycosyl transferase, group 1 family protein\nSMNYFVGNSLGVNLTGIEKAIINRLNLFKEMGRPAQCVFLSWNRYLYRNAQNYITSSDYINMYDFFQEATYLERNEPFDWLSYWTDECHYTLKHVENSHDFRIYDQERFLMYAHFQDPKYRILDYVNHFDSQRRKVKRDFYDVRGFLSCSRILVDKQQTLCEFFYNPEGDTKLEKYFSYKDGKPEVQKIIVYYANKQYFFNNETELGAFFIKQLYQHGDLFFSDRNVYTAPIFNLTPESIPVVAVLHSTHIKNIDALDSSPFKNVYKAMFENLSRYRAIIVSTEQQKLDVEKRINHTIPVVNIPVGYSETIDTPVQTLDQRSVKLISVARYSPEKQLHQQIELIKRLVSYVPKIELHMYGFGSESKKLNELIQKYGLENHVYLRGFLSNLDQEYSDAYLSLITSNMEGFSLALLESLAHGVPVISYDIKYGPNELITSDFNGYLITKNDEDALFDKVKYVIDHPEVQQRLSKGSLAKAQQYSKASLIKQWDQFVRLILEHHHHHH\n>5wns_L mol:protein length:124  30S ribosomal protein S12\nPTINQLVRKGREKVRKKSKVPALKGAPFRRGVCTVVRTVTPKKPNSALRKVAKVRLTSGYEVTAYIPGEGHNLQEHSVVLIRGGRVKXLPGVRYHIVRGVYDAAGVKDRKKSRSKYGTKKPKEA\n>4wss_B mol:protein length:514  
Hemagglutinin\nADPGDKICIGYHANNSTTQVDTILEKNVTVTHSVELLETQKESRFCRVLNKAPLDLGDCTTEGWILGNPRCDKLLGDRSWSYIVERPDAQNGICYPGVLKEAEELKALIGSIDTIQRFEMFPKSTWTGVDTNSGVTSACTYNGGSSFYRNLLWIIKIRSDPYSLIKGTYTNTGSQSILYFWGVHHPPDDVEQANLYGLGTRYVRMGTESMNFAKGPEIADRPPANGQRGRIDYYWSVLKPGETLNVESNGNLIAPWYAYKFTSSRHKGAIFRSDLPIENCDAVCQTLTGAINTNKTFQNVSPIWIGECPKYVKSKSLKLATGLRNVPQVKTRGLFGAIAGFIEGGWTGMVDGWYGYHHENSQGSGYAADKESTQKAIDGITNKVNSIIDKMNTQFEAVEHEFSNLEKRISNLNKRMEDGFLDVWTYNAELLVLLENERTLDMHDANVKNLHEKVKSQLRDNAKDLGNGCFEFWHKCDNECINSVKNGTYNYPKYQEESRLNREEIKSGRLVPRG\n>6ip5_2X mol:protein length:125  60S ribosomal protein L31\nMAPAKKGGEKKKGRSAINEVVTREYTINIHKRIHGVGFKKRAPRALKEIRKFAMKEMGTPDVRIDTRLNKAVWAKGIRNVPYRIRVRLSRKRNEDEDSPNKLYTLVTYVPVTTFKNLQTVNVDEN\n>5lng_C mol:protein length:164  Putative Fml fimbrial adhesin FmlD\nFSCNVDGGSSIGAGTTSVYVNLDPVIQPGQNLVVDLSQHISCWNDYGGWYDTDHINLVQGSAFAGSLQSYKGSLYWNNVTYPFPLTTNTNVLDIGDKTPMPLPLKLYITPVGAAGGVVIKAGEVIARIHMYKIATLGSGNPRNFTWNIISNNSVVMPTHHHHHH\n>6u42_Z0 mol:protein length:443  Tubulin beta\nMREIVHIQGGQCGNQIGAKFWEVVSDEHGIDPTGTYHGDSDLQLERINVYFNEATGGRYVPRAILMDLEPGTMDSVRSGPYGQIFRPDNFVFGQTGAGNNWAKGHYTEGAELIDSVLDVVRKEAESCDCLQGFQVCHSLGGGTGSGMGTLLISKIREEYPDRMMLTFSVVPSPKVSDTVVEPYNATLSVHQLVENADECMVLDNEALYDICFRTLKLTTPTFGDLNHLISAVMSGITCCLRFPGQLNADLRKLAVNLIPFPRLHFFMVGFTPLTSRGSQQYRALTVPELTQQMWDAKNMMCAADPRHGRYLTASALFRGRMSTKEVDEQMLNVQNKNSSYFVEWIPNNVKSSVCDIPPKGLKMSATFIGNSTAIQEMFKRVSEQFTAMFRRKAFLHWYTGEGMDEMEFTEAESNMNDLVSEYQQYQDASAEEEGEFEGEEEEA\n>6htr_b mol:protein length:196  PROTEASOME SUBUNIT BETA TYPE-1\nTSIMAVTFKDGVILGADSRTTTGAYIANRVTDKLTRVHDKIWCCRSGSAADTQAIADIVQYHLELYTSQYGTPSTETAASVFKELCYENKDNLTAGIIVAGYDDKNKGEVYTIPLGGSVHKLPYAIAGSGSTFIYGYCDKNFRENMSKEETVDFIKHSLSQAIKWDGSSGGVIRMVVLTAAGVERLIFYPDEYEQL\n>3loe_A mol:protein length:30  Neutrophil defensin 1\nACYCRIPACIAGERRYGTCIYQGRLWAACC\n>7o5h_K mol:protein length:117  30S ribosomal protein S11\nRKQVSDGVAHIHASFNNTIVTITDRQGNALGWATAGGSGFRGSRKSTPFAAQVAAERCADAVKEYGIKNLEVMVKGPGPGRESTIRALNAAGFRITNITDVTPIPHNGCRPPKKRRV\n>4dsq_D mol:protein 
length:184  Peroxiredoxin type-2\nMGHHHHHHMSDLVNKKFPAGDYKFQYIAISQSDADSESCKMPQTVEWSKLISENKKVIITGAPAAFSPTCTVSHIPGYINYLDELVKEKEVDQVIVVTVDNPFANQAWAKSLGVKDTTHIKFASDPGCAFTKSIGFELAVGDGVYWSGRWAMVVENGIVTYAAKETNPGTDVTVSSVESVLAHL\n>5nhk_B mol:protein length:140  Ferric uptake regulation protein\nMNSKNLDLKEFGFKVTQPRVEILKLFEKNKDKHLSPDDVFSKLKAQGSTTGIATVYRVLNQFESAGIINRLKLDNEQVMYELNQGEHHDHIICVKCNMIQEFYSPGIEALQKQIVESFGAEMIDYSLNIYVKCKSCREKI\n>4gkf_A mol:protein length:169  CRISPR system Cmr subunit Cmr5\nMEVHMLSKDNKKSIRKTLEQRRGEYAYYVIKEVADLNDKQLEEKYASLVKKAPVMILSNGLLQTLAFLLAKAETSPEKANQILSRVNEYPPRFIEKLGNDKDEHLLLYLHIVYWLRENVDRNIDVKTLLSQDYSKVLWATKEAIALLNWMRRFAVAMLKEEGKENEGSS\n>3sdj_B mol:protein length:448  Serine/threonine-protein kinase/endoribonuclease IRE1\nPEKKKRKRGSRGGKKGRKSRIANIPNFEQSLKNLVVSEKILGYGSSGTVVFQGSFQGRPVAVKRMLIDFCDIALMEIKLLTESDDHPNVIRYYCSETTDRFLYIALELCNLNLQDLVESKNVSDENLKLQKEYNPISLLRQIASGVAHLHSLKIIHRDLKPQNILVSTSSRFTADQQTGAENLRILISDFGLCKKLDSGQSSFRTNLNNPSGTSGWRAPELLEESTKRRLTRSIDIFSMGCVFYYILSKGKHPFGDKYSRESNIIRGIFSLDEMKCLHDRSLIAEATDLISQMIDHDPLKRPTAMKVLRHPLFWPKSKKLEFLLKVSDRLEIENRDPPSALLMKFDAGSDFVIPSGDWTVKFDKTFMDNLERYRKYHSSKLMDLLRALRNKYHNFMDLPEDIAELMGPVPDGFYDYFTKRFPNLLIGVYMIVKENLSDDQILREFLYS\n>3oeb_A mol:protein length:144  S-layer associated multidomain endoglucanase\nMVNMVSNPGFEDGLDSWQDWQQDMSAVPEAAHNGALGLKIGGGKAAGGGQDIPLKPNTTYILGAWAKFDSKPAGTFDVVVQYHLKDANNTYVQHILNFNETDWTYKQLLFTTPDVFGSTPELALWKGDTSKANLYVDDVYLVEV\n>6y5l_E mol:protein length:70  X-31 Influenza Haemagglutinin HA1,X-31 Influenza Haemagglutinin HA1\nAVPNGTLVKTITDDQIEVTNATELVCITPNGSIPNDKPFQNVNKITYGACPKYVKQNTLKLATGMRNVPE\n>5den_A mol:protein length:453  
Phenylalanine-4-hydroxylase\nMAAVVLENGVLSRKLSDFGQETSYIEDNSNQNGAISLIFSLKEEVGALAKVLRLFEENDINLTHIESRPSRLNKDEYEFFTYLDKRSKPVLGSIIKSLRNDIGATVHELSRDKEKNTVPWFPRTIQELDRFANQILSYGAELDADHPGFKDPVYRARRKQFADIAYNYRHGQPIPRVEYTEEEKQTWGTVFRTLKALYKTHACYEHNHIFPLLEKYCGFREDNIPQLEDVSQFLQTCTGFRLRPVAGLLSSRDFLGGLAFRVFHCTQYIRHGSKPMYTPEPDICHELLGHVPLFSDRSFAQFSQEIGLASLGAPDEYIEKLATIYWFTVEFGLCKEGDSIKAYGAGLLSSFGELQYCLSDKPKLLPLELEKTACQEYSVTEFQPLYYVAESFSDAKEKVRTFAATIPRPFSVRYDPYTQRVEVLDNTQQLKILADSINSEVGILCNALQKIKS\n>7jsd_A mol:protein length:263  Lysine hydroxylase\nGPHMDVHEIDETLEKFLAENYTPERVQQLADRFQRTGFVKFDSHMRIVPEELITAVRAEADRLVREHKERRDLVLGTTGGTPRNLSVVKSQDVEQSDLIRAVTRSEVLLTFLAGITRERIIPEVSDDERYLITHQEFASDTHGWHWDDYSFAFNWALRMPPIASGGMVQAVPHTHWDKNAPRINETLCERQIDTYGLVSGDLYLLRSDTTMHRTVPLTEDGAVRTMLVVSWSAERDLGKVLTGNDRWWENPEAGAAQPVHRAG\n>3hzo_B mol:protein length:293  protein Rv0554, putative Bromoperoxidase\nMSYYHHHHHHDYDIPTTENLYFQGAMDPEFRVINLAYDDNGTGDPVVFIAGRGGAGRTWHPHQVPAFLAAGYRCITFDNRGIGATENAEGFTTQTMVADTAALIETLDIAPARVVGVSMGAFIAQELMVVAPELVSSAVLMATRGRLDRARQFFNKAEAELYDSGVQLPPTYDARARLLENFSRKTLNDDVAVGDWIAMFSMWPIKSTPGLRCQLDCAPQTNRLPAYRNIAAPVLVIGFADDVVTPPYLGREVADALPNGRYLQIPDAGHLGFFERPEAVNTAMLKFFASVKA\n>4whv_G mol:protein length:83  Polyubiquitin-B\nGPGYQDPMQIFVKTLTGKTITLEVEPSDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGG\n>4ng3_D mol:protein length:335  5-carboxyvanillate decarboxylase\nSLRLIATEEAVTFQPVVDALRAHSRTDDASLDMILVRDVYGDEPARPAMIGRLSDVTGERLAEMDSNGVDMHLLSLTAPGVQMFDAETGTRLARIANDLMAQTVAANPTRFAGLGTFAPQDPASAAREIERVATQLRLNGLVINSHTNDLYYDDPFFHPVFEAIEASGLALYIHPRAPSKQIDRAFRDYGMNSAIWGYGIETSTNAVRMILSGLFDRFPRLKIVLGHMGEAIPFWLWRLDYMHGNATTFGGAPKLKLKPSEYFRRNFAITTSGVESHAALRYSIEVLGPENVMWAIDYPYQPMAPAVQFIRTAPIPEDVKAMVAGGNAARIFRIT\n>7og4_0 mol:protein length:188  39S ribosomal protein L32, mitochondrial\nMALAMLVLVVSPWSAARGVLRNYWERLLRKLPQSRPGFPSPPWGPALAVQGPAMFTEPANDTSGSKENSSLLDSIFWMAAPKNRRTIEVNRCRRRNPQKLIKVKNNIDVCPECGHLKQKHVLCAYCYEKVCKETAEIRRQIGKQEGGPFKAPTIETVVLYTGETPSEQDQGKRIIERDRKRPSWFTQN\n>7kbl_B mol:protein 
length:481  2-oxoglutarate carboxylase small subunit\nMKHHHHHHAMFKKVLVANRGEIACRVIRACKELGIQTVAIYNEIESTARHVKMADEAYMIGVNPLDTYLNAERIVDLALEVGAEAIHPGYGFLAENEHFARLCEEKGITFIGPHWKVIELMGDKARSKEVMKRAGVPTVPGSDGILKDVEEAKRIAKEIGYPVLLKASAGGGGRGIRICRNEEELVRNYENAYNEAVKAFGRGDLLLEKYIENPKHIEFQVLGDKYGNVIHLGERDCSIQRRNQKLVEIAPSLLLTPEQREYYGSLVVKAAKEIGYYSAGTMEFIADEKGNLYFIEMNTRIQVEHPVTEMITGVDIVKWQIRIAAGERLRYSQEDIRFNGYSIECRINAEDPKKGFAPSIGTIERYYVPGGFGIRVEHASSKGYEITPYYDSLIAKLIVWAPLWEVAVDRMRSALETYEISGVKTTIPLLINIMKDKDFRDGKFTTRYLEEHPHVFDYAEHRDKEDFVAFISAVIASYHGL\n>3itu_D mol:protein length:345  cGMP-dependent 3',5'-cyclic phosphodiesterase\nGSAMDDEYTKLLHDGIQPVAAIDSNFASFTYTPRSLPEDDTSMAILSMLQDMNFINNYKIDCPTLARFCLMVKKGYRDPPYHNWMHAFSVSHFCYLLYKNLELTNYLEDIEIFALFISCMCHDLDHRGTNNSFQVASKSVLAALYSSEGSVMERHHFAQAIAILNTHGCNIFDHFSRKDYQRMLDLMRDIILATDLAHHLRIFKDLQKMAEVGYDRNNKQHHRLLLCLLMTSCDLSDQTKGWKTTRKIAELIYKEFFSQGDLEKAMGNRPMEMMDREKAYIPELQISFMEHIAMPIYKLLQDLFPKAAELYERVASNREHWTKVSHKFTIRGLPSNNSLDFLDEE\n>7mt7_n mol:protein length:61  30S ribosomal protein S14 type Z\nMAKKALVNKAAGKPRFAVRAYTRCSKCGRPRAVYRKFGLCRICLREMAHAGELPGVQKSSW\n>5xnl_2 mol:protein length:232  Chlorophyll a-b binding protein 8, chloroplastic\nRKSATTKKVASSGSPWYGPDRVKYLGPFSGESPSYLTGEFPGDYGWDTAGLSADPETFSKNRELEVIHSRWAMLGALGCVFPELLSRNGVKFGEAVWFKAGSQIFSEGGLDYLGNPSLVHAQSILAIWATQVILMGAVEGYRIAGGPLGEVVDPLYPGGSFDPLGLADDPEAFAELKVKELKNGRLAMFSMFGFFVQAIVTGKGPLENLADHLSDPVNNNAWSYATNFVPGK\n>6cjn_B mol:protein length:225  Chalcone--flavonone isomerase 1\nGSHMAASITAITVENLEYPAVVTSPVTGKSYFLGGAGERGLTIEGNFIKFTAIGVYLEDIAVASLAAKWKGKSSEELLETLDFYRDIISGPFEKLIRTSKIRELSGPEYSRKVMENCVAHLKSVGTYGDAEAEAMQKFAEAFKPVNFPPGASVFYRQSPDGILGLSFSPDTSIPEKEAALIENKAVSSAVLETMIGEHAVSPDLKRCLAARLPALLNEGAFKIGN\n>2d10_F mol:protein length:28  Ezrin-radixin-moesin binding phosphoprotein 50\nKERAHQKRSSKRAPQMDWSKKNELFSNL\n>1xbp_D mol:protein length:180  50S ribosomal protein 
L5\nMQQLKTKYNDQVRPALMQQFGYSSVMAVPRIEKIVVNEGLGSSKEDSKAIDKAAKELALITLQKPIITKAKKSISNFKLRQGMPVGIKVTLRGERMYVFLEKLINIGLPRIRDFRGINPNAFDGRGNYNLGIKEQLIFPEITYDMVDKTRGMDITIVTTAKTDEEARALLQSMGLPFRKQ\n>4y8m_R mol:protein length:260  Proteasome subunit alpha type-5\nMFLTRSEYDRGVSTFSPEGRLFQVEYSLEAIKLGSTAIGIATKEGVVLGVEKRATSPLLESDSIEKIVEIDRHIGCAMSGLTADARSMIEHARTAAVTHNLYYDEDINVESLTQSVCDLALRFGEGASGEERLMSRPFGVALLIAGHDADDGYQLFHAEPSGTFYRYNAKAIGSGSEGAQAELLNEWHSSLTLKEAELLVLKILKQVMEEKLDENNAQLSCITKQDGFKIYDNEKTAELIKELKEKEAAESPEEADVEMS\n>6jvb_B mol:protein length:540  Dihydropyrimidinase-related protein 2\nMHHHHHHHMSYQGKKNIPRITSDRLLIKGGKIVNDDQSFYADIYMEDGLIKQIGENLIVPGGVKTIEAHSRMVIPGGIDVHTRFQMPDQGMTSADDFFQGTKAALAGGTTMIIDHVVPEPGTSLLAAFDQWREWADSKSCCDYSLHVDISEWHKGIQEEMEALVKDHGVNSFLVYMAFKDRFQLTDCQIYEVLSVIRDIGAIAQVHAENGDIIAEEQQRILDLGITGPEGHVLSRPEEVEAEAVNRAITIANQTNCPLYITKVMSKSSAEVIAQARKKGTVVYGEPITASLGTDGSHYWSKNWAKAAAFVTSPPLSPDPTTPDFLNSLLSCGDLQVTGSAHCTFNTAQKAVGKDNFTLIPEGTNGTEERMSVIWDKAVVTGKMDENQFVAVTSTNAAKVFNLYPRKGRIAVGSDADLVIWDPDSVKTISAKTHNSSLEYNIFEGMECRGSPLVVISQGKIVLEDGTLHVTEGSGRYIPRKPFPDFVYKRIKARSRLAELRGVPRGLYDGPVCEVSVTPKTVTPASSAKTSPAKQQAPPVR\n>2pmp_A mol:protein length:160  2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase\nTLPFRIGHGFDLHRLEPGYPLIIGGIVIPHDRGCEAHSDGDVLLHCVVDAILGALGLPDIGQIFPDSDPKWKGAASSVFIKEAVRLMDEAGYEIGNLDATLILQRPKISPHKETIRSNLSKLLGADPSVVNLKAKTHEKVDSLGENRSIAAHTVILLMKK\n>4lbp_A mol:protein length:100  5-chloro-2-hydroxyhydroquinone dehydrochlorinase (TftG)\nMLFLIYRKDRPGSLQVRIDNYAAHLAYLEPLKAKIQVGGPTLGAGTGTDDKDMTGSFLIMEAESWDEVHSFVENDPFTKAGLFAATIVERWKHGKHNDSK\n>6jmq_D mol:protein length:219  Antibody\nDIVMSQSPSSLVVSVGEKVTMSCXXXXXXXXXXXXXXXXXWYQQKPGQSPKLLIYXXXXXXXGVPDRFTGSGSGTDFTLTISSVKAEDLAVYYCXXXXXXXXXFGGGTKLEIKRADAAPTVSIFPPSSEQLTSGGASVVCFLNNFYPKDINVKWKIDGSERQNGVLNSWTDQDSKDSTYSMSSTLTLTKDEYERHNSYTCEATHKTSTSPIVKSFNRNE\n>5j46_A mol:protein length:189  Peptide 
deformylase\nMAHHHHHHMANAAHRFTEYRKTMALLNILHYPDKRLHKVAKPVDKVDDRIRKLVADMAETMYAAPGIGLAATQVDVHERVIVIDVSEDKNELRAFINPEIIWSSDGKQVYEEGCLSVPGIYDEVERPDRVRVRALNEQGETFELDCEGLLAVCIQHEMDHLMGRVFVEYLSPLKQSRIKTKMKKLERAM\n>5pf4_A mol:protein length:138  Bromodomain adjacent to zinc finger domain protein 2B\nMHHHHHHSSGVDLGTENLYFQSMSVKKPKRDDSKDLALCSMILTEMETHEDAWPFLLPVNLKLVPGYKKVIKKPMDFSTIREKLSSGQYPNLETFALDVRLVFDNCETFNEDDSDIGRAGHNMRKYFEKKWTDTFKVS\n>6zcd_V mol:protein length:95  Vascular endothelial growth factor A\nEVVKFMDVYQRSYCHPIETLVDIFQEYPDEIEYIFKPSCVPLMRCGGCCNDEGLECVPTEESNITMQIMRIKPHQGQHIGEMSFLQHNKCECRPK\n>4zzc_B mol:protein length:317  Proton-gated ion channel\nGQDMVSPPPPIADEPLTVNTGIYLIECYSLDDKAETFKVNAFLSLSWKDRRLAFDPVRSGVRVKTYEPEAIWIPEIRFVNVENARDADVVDISVSPDGTVQYLERFSARVLSPLDFRRYPFDSQTLHIYLIVRSVDTRNIVLAVDLEKVGKNDDVFLTGWDIESFTAVVKPANFALEDRLESKLDYQLRISRQYFSYIPNIILPMLFILFISWTAFWSTSYEANVTLVVSTLIAHIAFNILVETNLPKTPYMTYTGAIIFMIYLFYFVAVIEVTVQHYLKVESQPARAASITRASRIAFPVVFLLANIILAFLFFGF\n>5t0x_C mol:protein length:19  Estrogen receptor peptide\nRAANLWPSPLMIKRSKKNS\n>6msb_d mol:protein length:349  26S proteasome non-ATPase regulatory subunit 8\nFIKGRAPRAPPRERRRATRGGLRQVVAPPRALGSTSRPHFRRASVCRRRCRKSGGLLAASRKMAAAAVNGAAGFSSSGPAATSGAVLQAATGMYEQLKGEWNRKSPNLSKCGEELGRLKLVLLELNFLPTTGTKLTKQQLILARDILEIGAQWSILRKDIPSFERYMAQLKCYYFDYKEQLPESAYMHQLLGLNLLFLLSQNRVAEFHTELERLPAKDIQTNVYIKHPVSLEQYLMEGSYNKVFLAKGNIPAESYTFFIDILLDTIRDEIAGCIEKAYEKILFTEATRILFFNTPKKMTDYAKKRGWVLGPNNYYSFASQQQKPEDTTIPSTELAKQVIEYARQLEMIV\n>7o7y_Aq mol:protein length:135  40S ribosomal protein eS17\nMGRVRTKTVKKAARVIIEKYYTRLGNDFHTNKRVCEEIAIIPSKKLRNKIAGYVTHLMKRIQRGPVRGISIKLQEEERERRDNYVPEVSALDQEIIEVDPDTKEMLKLLDFGSLSNLQVTQPTVGMNFKTPRGAV\n>1trs_A mol:protein length:105  THIOREDOXIN\nMVKQIESKTAFQEALDAAGDKLVVVDFSATWCGPCKMIKPFFHSLSEKYSNVIFLEVDVDDAQDVASEAEVKATPTFQFFKKGQKVGEFSGANKEKLEATINELV\n>6zv6_I mol:protein length:208  40S ribosomal protein 
S8\nMGISRDNWHKRRKTGGKRKPYHKKRKYELGRPAANTKIGPRRIHTVRVRGGNKKYRALRLDVGNFSWGSECCTRKTRIIDVVYNASNNELVRTKTLVKNCIVLIDSTPYRQWYESHYALPLGRKKGAKLTPEEEEILNKKRSKKIQKKYDERKKNAKISSLLEEQFQQGKLLACIASRPGQCGRADGYVLEGKELEFYLRKIKARKGK\n>3nff_D mol:protein length:121  RNA polymerase I subunit A34.5\nMGYQPPSDYKQCKHLKSFPVSELKGDNKELWLMKVPANIDISQLKSLPLDTDATVSTVELGSKNFNVLQNTSTQEGSDNTNLSLLIPSEKKKETLKVATSKDNKSVYFDRVFTISETARIP\n>7lus_B mol:protein length:207  Immunoglobulin heavy constant gamma 2\nGPSVFLFPPKPKDTLMISRTPEVTCVVVDVSHEDPEVQFNWYVDGVEVHNAKTKPREEQFNSTFRVVSVLTVVHQDWLNGKEYKCKVSNKGLPAPIEKTISKTKGQPREPQVYTLPPSREEMTKNQVSLTCLVKGFYPSDIAVEWESNGQPENNYDTTPPMLDSDGSFFLYSDLTVDKSRWQQGNVFSCSVMHEALHNHYTQKSLSL\n>5t15_E mol:protein length:4676  Ryanodine receptor 1,Ryanodine receptor 1,Ryanodine receptor 1,Ryanodine receptor 1,Ryanodine receptor 1,Ryanodine receptor 1,Ryanodine receptor 1\nQFLRTDDEVVLQCSATVLKEQLKLCLAAEGFGNRLCFLEPTSNAQNVPPDLAICCFTLEQSLSVRALQEMLANTVEAGVESSQGGGHRTLLYGHAILLRHAHSRMYLSCLTTSRSMTDKLAFDVGLQEDATGEACWWTMHPASKQRSEGEKVRVGDDLILVSVSSERYLHLSTASGELQVDASFMQTLWNMNPICSCCEEGYVTGGHVLRLFHGHMDECLTISAADSDDQRRLVYYEGGAVCTHARSLWRLEPLRISWSGSHLRWGQPLRIRHVTTGRYLALTEDQGLVVVDACKAHTKATSFCFRVSKEKLDTAPKRDVEGMGPPEIKYGESLCFVQHVASGLWLTYAAPDPKALRLGVLKKKAILHQEGHMDDALFLTRCQQEESQAARMIHSTAGLYNQFIKGLDSFSGKPRGSGPPAGPALPIEAVILSLQDLIGYFEPPSEELQHEEKQSKLRSLRNRQSLFQEEGMLSLVLNCIDRLNVYTTAAHFAEYAGEEAAESWKEIVNLLYELLASLIRGNRANCALFSTNLDWVVSKLDRLEASSGILEVLYCVLIESPEVLNIIQENHIKSIISLLDKHGRNHKVLDVLCSLCVCNGVAVRSNQDLITENLLPGRELLLQTNLINYVTSIRPNIFVGRAEGSTQYGKWYFEVMVDEVVPFLTAQATHLRVGWALTEGYSPYPGGGEGWGGNGVGDDLYSYGFDGLHLWTGHVARPVTSPGQHLLAPEDVVSCCLDLSVPSISFRINGCPVQGVFEAFNLDGLFFPVVSFSAGVKVRFLLGGRHGEFKFLPPPGYAPCHEAVLPRERLRLEPIKEYRREGPRGPHLVGPSRCLSHTDFVPCPVDTVQIVLPPHLERIREKLAENIHELWALTRIEQGWTYGPVRDDNKRLHPCLVNFHSLPEPERNYNLQMSGETLKTLLALGCHVGMADEKAEDNLKKTKLPKTYMMSNGYKPAPLDLSHVRLTPAQTTLVDRLAENGHNVWARDRVAQGWSYSAVQDIPARRNPRLVPYRLLDEATKRSNRDSLCQAVRTLLGYGYNIEPPDQEPSQVENQSRWDRVRIFRAEKSYTVQSGRWYFEFEAVTTGEMRVGWARPELRPDVELGADELAYVFNGHRGQRWHLGSEPFGRPWQSGDVV
GCMIDLTENTIIFTLNGEVLMSDSGSETAFREIEIGDGFLPVCSLGPGQVGHLNLGQDVSSLRFFAICGLQEGFEPFAINMQRPVTTWFSKSLPQFEPVPPEHPHYEVARMDGTVDTPPCLRLAHRXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXMPLSAAMFLSERKNPAPQCPPRLEVQMLMPVSWSRMPNHFLQVETRRAGERLGWAVQCQDPLTMMALHIPEENRCMDILELSERLDLQRFHSHTLRLYRAVCALGNNRVAHALCSHVDQAQLLHALEDAHLPGPLRAGYYDLLISIHLESACRSRRSMLSEYIVPLTPETRAITLFPPGRKGGNARRHGLPGVGVTTSLRPPHHFSPPCFVAALPAAGVAEAPARLSPAIPLEALRDKALRMLGEAVRDGGQHARDPVGGSVEFQFVPVLKLVSTLLVMGIFGDEDVKQILKMIEPEVFTEEEEEEEEEEEEEEEEEEDEEEKEEDEEEEEKEDAEKEEEEAPEGEKEDLEEGLLQMKLPESVKLQMCNLLEYFCDQELQHRVESLAAFAERYVDKLQANQRSRYALLMRAFTMSAAETARRTREFRSPPQEQINMLLHFKDEADEEDCPLPEDIRQDLQDFHQDLLAHCGIQLEGEEEEPEEETSLSSRLRSLLETVRLVKKKEEKPEEELPAEEKKPQSLQELVSHMVVRWAQEDYVQSPELVRAMFSLLHRQYDGLGELLRALPRAYTISPSSVEDTMSLLECLGQIRSLLIVQMGPQEENLMIQSIGNIMNNKVFYQHPNLMRALGMHETVMEVMVNVLGGGETKEIRFPKMVTSCCRFLCYFCRISRQNQRSMFDHLSYLLENSGIGLGMQGSTPLDVAAASVIDNNELALALQEQDLEKVVSYLAGCGLQSCPMLLAKGYPDIGWNPCGGERYLDFLRFAVFVNGESVEENANVVVRLLIRKPECFGPALRGEGGSGLLAAIEEAIRISEDPARDGPGVRRDRRREHFGEEPPEENRVHLGHAIMSFYAALIDLLGRCAPEMHLIQAGKGEALRIRAILRSLVPLDDLVGIISLPLQIPTLXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXNFDPRPVETLNVIIPEKLDSFINKFAEYTHEKWAFDKIQNNWSYGENVDEELKTHPMLRPYKTFSEKDKEIYRWPIKESLKAMIAWEWTIEKAREGEEERTEKKKTRKISQTAQTYDPREGYNPQPPDLSGVTLSRELQAMAEQLAENYHNTWGRKKKQELEAKGGGTHPLLVPYDTLTAKEKARDREKAQELLKFLQMNGYAVTRXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX
XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXTPLYNLPTHRACNMFLESYKAAWILTEDHSFEDRMIDDLSKAGEQEEEEEEVEEKKPDPLHQLVLHFSRTALTEKSKLDEDYLYMAYADIMAKSCHLEEGGENGEAEEEEVEVSFEEKEMEKQRLLYQQSRLHTRGAAEMVLQMISACKGETGAMVSSTLKLGISILNGGNAEVQQKMLDYLKDKKEVGFFQSIQALMQTCSVLDLNAFERQNKAEGLGMVNEDGTVINRQNGEKVMADDEFTQDLFRFLQLLCEGHNNDFQNYLRTQTGNTTTINIIICTVDYLLRLQESISDFYWYYSGKDVIEEQGKRNFSKAMSVAKQVFNSLTEYIQGPCTGNQQSLAHSRLWDAVVGFLHVFAHMMMKLAQDSSQIELLKELLDLQKDMVVMLLSLLEGNVVNGMIARQMVDMLVESSSNVEMILKFFDMFLKLKDIVGSEAFQDYVTDPRGLISKKDFQKAMDSQKQFTGPEIQFLLSCSEADENEMINFEEFANRFQEPARDIGFNVAVLLTNLSEHVPHDPRLRNFLELAESILEYFRPYLGRIEIMGASRRIERIYFEISETNRAQWEMPQVKESKRQFIFDVVNEGGEAEKMELFVSFCEDTIFEMQIAAQISEPEGEPEADEDEGMGEAAAEGAEEGAAGAEGAAGTVAAGATARLAAAAARALRGLSYRSLRRRVRRLRRLTAREAATALAALLWAVVARAGAAGAGAAAGALRLLWGSLFGGGLVEGAKKVTVTELLAGMPDPTSDEVHGEQPAGPGGDADGAGEGEGEGDAAEGDGDEEVAGHEAGPGGAEGVVAVADGGPFRPEGAGGLGDMGDTTPAEPPTPEGSPILKRKLGVDGEEEELVPEPEPEPEPEPEKADEENGEKEEVPEAPPEPPKKAPPSPPAKKEEAGGAGMEFWGELEVQRVKFLNYLSRNFYTLRFLALFLAFAINFILLFYKVSDSPPGEDDMEGSAAGDLAGAGSGGGSGWGSGAGEEAEGDEDENMVYYFLEESTGYMEPALWCLSLLHTLVAFLCIIGYNCLKVPLVIFKREKELARKLEFDGLYITEQPGDDDVKGQWDRLVLNTPSFPSNYWDKFVKRKVLDKHGDIFGRERIAELLGMDLASLEITAHNERKPDPPPGLLTWLMSIDVKYQIWKFGVIFTDNSFLYLGWYMVMSLLGHYNNFFFAAHLLDIAMGVKTLRTILSSVTHNGKQLVMTVGLLAVVVYLYTVVAFNFFRKFYNKSEDEDEPDMKCDDMMTCYLFHMYVGVRAGGGIGDEIEDPAGDEYELYRVVFDITFFFFVIVILLAIIQGLIIDAFGELRDQQEQVKEDMETKCFICGIGSDYFDTTPHGFETHTLEEHNLANYMFFLMYLINKDETEHTGQESYVWKMYQERCWDFFPAGDCFRKQYEDQLS\n>2isc_A mol:protein length:239  purine nucleoside phosphorylase\nATPHNSAQVGDFAETVLMCGDPLRAKLIAETYLENPKLVNNVRGIQGYTGTYKGKPISVMGHGMGLPSICIYAEELYSTYKVKTIIRVGTCGAIDMDIHTRDIVIFTSAGTNSKINRIRFMDHDYPATASFDVVCALVDAAKELNIPAKVGKGFSTDLFYNPQTELAQLMNKFHFLAVEMESAGLFPIADLYGARAGCICTVSDHILHHEETTAEERQNSFQNMMKIALEAAIKLHHHH\n>4kzx_b mol:protein length:84  40S ribosomal protein S27\nMPLAKDLLHPSPEEEKRKHKKKRLVQSPNSYFMDVKCPGCYKITTVFSHAQTVVLCVGCSTVLCQPTGGKARLTEGCSFRRKQH\n>1y5k_A 
mol:protein length:141  Hemoglobin alpha chain\nVLSPADKTNVKAAWGKVGAHAGEYGAEALERMFLSFPTTKTYFPHFDLSHGSAQVKGHGKKVADALTNAVAHVDDMPNALSALSDLHAHKLRVDPVNFKLLSHCLLVTLAAHLPAEFTPAVHASLDKFLASVSTVLTSKYR\n>3ddo_D mol:protein length:253  Uridine phosphorylase\nMSKSDVFHLGLTKNDLQGAQLAIVPGDPERVEKIAALMDKPVKLASHREFTSWRAELDGKAVIVCSTGIGGPSTSIAVEELAQLGIRTFLRIGTTGAIQPHINVGDVLVTTASVRLDGASLHFAPMEFPAVADFACTTALVEAAKSIGATTHVGVTASSDTFYPGQERYDTYSGRVVRRFKGSMEEWQAMGVMNYEMESATLLTMCASQGLRAGMVAGVIVNRTQQEIPNAETMKQTESHAVKIVVEAARRLL\n>2klw_C mol:protein length:32  (POG)10\nXPPGPPGPPGPPGPPGPPGPPGPPGPPGPPGX\n>6qml_B mol:protein length:76  Polyubiquitin-B\nLQIFVKTLTGKTITLEVEPSDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGG\n>6s1v_A mol:protein length:114  Gag-Pro-Pol polyprotein\nWVQPITCQKPSLTLWLDDKMFTGLINTGADVTIIKLEDWPPNWPITDTLTNLRGIGQSNNPKQSSKYLTWRDKENNSGLIKPFVIPNLPVNLWGRDLLSQMKIMMCSPNDIVTA\n>6cbe_X mol:protein length:736  Capsid protein VP1\nMAADGYLPDWLEDTLSEGIRQWWKLKPGPPPPKPAERHKDDSRGLVLPGYKYLGPFNGLDKGEPVNEADAAALEHDKAYDRQLDSGDNPYLKYNHADAEFQERLKEDTSFGGNLGRAVFQAKKRVLEPLGLVEEPVKTAPGKKRPVEHSPVEPDSSSGTGKAGQQPARKRLNFGQTGDADSVPDPQPLGQPPAAPSGLGTNTMATGSGAPMADNNEGADGVGNSSGNWHCDSTWMGDRVITTSTRTWALPTYNNHLYKQISSASTGASNDNHYFGYSTPWGYFDFNRFHCHFSPRDWQRLINNNWGFRPKRLNFKLFNIQVKEVTQNDGTTTIANNLTSTVQVFTDSEYQLPYVLGSAHQGCLPPFPADVFMVPQYGYLTLNNGSQAVGRSSFYCLEYFPSQMLRTGNNFTFSYTFEDVPFHSSYAHSQSLDRLMNPLIDQYLYYLSRTNTPSGTTTQSRLQFSQAGASDIRDQSRNWLPGPCYRQQRVSKTSADNNNSEYSWTGATKYHLNGRDSLVNPGPAMASHKDDEEKFFPQSGVLIFGKQGSEKTNVDIEKVMITDEEEIRTTNPVATEQYGSVSTNLQRGNRQAATADVNTQGVLPGMVWQDRDVYLQGPIWAKIPHTDGHFHPSPLMGGFGLKHPPPQILIKNTPVPANPSTTFSAAKFASFITQYSTGQVSVEIEWELQKENSKRWNPEIQYTSNYAKSANVDFTVDNNGVYSEPRPIGTRYLTRNL\n>2ide_E mol:protein length:157  Molybdenum cofactor biosynthesis protein C\nMDLTHFQDGRPRMVDVTEKPETFRTATAEAFVELTEEALSALEKGGVGKGDPLVVAQLAGILAAKKTADLIPLCHPLPLTGVEVRVELLKAEKRVRIEATVKTKAETGVEMEAMTACAVAALTVYDMLKAASKGLVISQVRLLHKAGGKSGEWRREQ\n>7f27_D mol:protein length:408  3-oxoacyl-(Acyl-carrier-protein) 
synthase\nMKRVVVTGMAGITSLGETADDIFARFEAGKSGIRYMPEWEQYVDLRTKLAGPVETFHIPKHFNRKVTRGMGRVALMSVVCAETALQNAGLLGHEILSSGEAGVAFGSSAGSVDAVGEFASMLLHQSMSKINATTYIRMMAHTSAVNMTVYFGLKGLTLPTSSACTSGSMAIGQAYEAIKYGKQQVMIAGGAEELSAAGAAVFDVLFATSGMNDQPEKTPRPFDAKRDGLVIGEGAGCLILEEYEHAKARGAHIYAEVIGYGSNTDGQHVTRPESEMMGRCMELALKDASVEAKDIAYVNAHGTSTDQGDVAESQATAKVLGYKPISSLKSYFGHTLGACGAIEAWLSIEMMNRGRFIPTLNLDEIDSLCGELDYIVQQPRNLDADIIMSNNFAFGGINTSLIFKRVKQ\n>3fi2_A mol:protein length:353  Mitogen-activated protein kinase 10\nMSKSKVDNQFYSVEVGDSTFTVLKRYQNLKPIGSGAQGIVCAAYDAVLDRNVAIKKLSRPFQNQTHAKRAYRELVLMKCVNHKNIISLLNVFTPQKTLEEFQDVYLVMELMDANLCQVIQMELDHERMSYLLYQMLCGIKHLHSAGIIHRDLKPSNIVVKSDCTLKILDFGLARTAGTSFMMTPYVVTRYYRAPEVILGMGYKENVDIWSVGCIMGEMVRHKILFPGRDYIDQWNKVIEQLGTPCPEFMKKLQPTVRNYVENRPKYAGLTFPKLFPDSLFPADSEHNKLKASQARDLLSKMLVIDPAKRISVDDALQHPYINVWYXXXXXXDEREHTIEEWKELIYKEVMNSE\n>4p18_G mol:protein length:176  Ferritin, middle subunit\nMVSQVRQNYHSDCEAAVNRMLNLELYASYTYSSMYAFFDRDDVALHNVAEFFKEHSHEEREHAEKFMKYQNKRGGRVVLQKIKKPERDEWGNTLEAMQAALQLEKTVNQALLDLHKLATDKVDPHLCDFLESEYLEEQVKDIKRIGDFITNLKRLGLPENGMGEYLFDKHSVKESS\n>4lb1_D mol:protein length:30  Neutrophil defensin 1\nACYCRIPACIAGERRAGTCIYQGRLWAACC\n>6unz_H mol:protein length:604  fumarate hydratase 2\nMGSSHHHHHHSSGLVPRGSHMASMTGGQQMGRGSEFMSLCDQCEIGCRRVGIKDIEDASAVNADFHFSAIFQPTDPHHHQTEFAKVEGSEKYVEEVEVFGRQALKVNPEALTILAHRAFSDVHHFFRKDHLEGWRRAIEDPEASDNDRYVATTLLKNACIAAGRVLPSCQDTGTAIVLGKRGELCWTGGEDEKYLSKGIWNAYRYHNLRYSQTAALDMFKECNTGDNLPAQLDLLAVPGSDYEFLFIAKGGGSANKAYLYQETKALLNPKSLRAFIEEKLKTLGTAACPPYHIALVIGGTSAEMTMKTVKLASCRYYDSLPTTGDKYGRAFRDPEWEKIVMEVAQKSGIGAQFGGKYFAHQARVIRLPRHGASCPVGLAVSCSADRQILAHINKSGIYIEQLEQNPAQYLPDIPEVHLSTTSVKVDLKRPIDKVRQQLSQYPVGTRVMLNGTLIVARDIAHAKIKEMMDNGEPLPEYMKTSPIYYAGPAKTPEGYASGSFGPTTAGRMDSYVDLFQSHGGSYITLAKGNRSKQVTDACKKHGGFYLGSIGGPAAILAKDSIKQVTCLAFPELGMEAVWKIEVEDFPAFIVVDDKGNDMYSKTLA\n>7emd_A mol:protein length:275  Leucocyte 
antigen\nGPHSLSYFYTAVSRPDRGDSRFIAVGYVDDTQFVRFDSDAPNPRMEPRAPWIQQEGQDYWDRETRKQRDTSQTYRVGLKNLRGYYNQSEAGSHTYQSMYGCYLGPDGLLLRGYRQYAYDGADYIALNEDLRSWTAADTAAQITKRKWETANVAERRRSYLQGLCVESLREYLEMGKDTLQRAEPPKTHVTRHPSSDLGVTLRCWALGFYPKEISLTWQREGQDQSQDMELVETRPSGDGTFQKWAALVVPPGEEQSYTCHVQHEGLQEPLTLRWD\n>7sym_K mol:protein length:194  uS4\nMPVARSWVCRKTYVTPRRPFEKSRLDQELKLIGEYGLRNKREVWRVKFTLAKIRKAARELLTLDEKDPRRLFEGNALLRRLVRIGVLDEGKMKLDYILGLKIEDFLERRLQTQVFKLGLAKSIHHARVLIRQRHIRVRKQVVNIPSFIVRLDSQKHIDFSLRSPYGGGRPGRVKRKNAKKGQGGAGAGDDEEED\n>2n8n_A mol:protein length:72  Translation initiation factor IF-1\nMAKQDVIELEGTVLDTLPNAMFKVELENGHEILAHVSGKIRMNYIRILPGDKVTVEMSPYDLTRGRITYRYK\n>6v8z_O mol:protein length:231  VRC03 Fab Heavy Chain\nQVQLVQSGAVIKTPGSSVKISCRASGYNFRDYSIHWVRLIPDKGFEWIGWIKPLWGAVSYARQLQGRVSMTRQLSQDPDDPDWGVAYMEFSGLTPADTAEYFCVRRGSCDYCGDFPWQYWCQGTVVVVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPK\n>5nqv_H mol:protein length:11  EAR motif of IAA27\nTELRLGLPGSE\n>2fzd_A mol:protein length:316  aldose reductase\nMASRILLNNGAKMPILGLGTWKSPPGQVTEAVKVAIDVGYRHIDCAHVYQNENEVGVAIQEKLREQVVKREELFIVSKLWCTYHEKGLVKGACQKTLSDLKLDYLDLYLIHWPTGFKPGKEFFPLDESGNVVPSDTNILDTWAAMEELVDEGLVKAIGISNFNHLQVEMILNKPGLKYKPAVNQIECHPYLTQEKLIQYCQSKGIVVTAYSPLGSPDRPWAKPEDPSLLEDPRIKAIAAKHNKTTAQVLIRFPMQRNLVVIPKSVTPERIAENFKVFDFELSSQDMTTLLSYNRNWRVCALLSCTSHKDYPFHEEF\n>4x0g_D mol:protein length:109  Blastoderm-specific gene 25A\nPMVTIGPNGTEVSRISLSAINWAMTGPSITRKLLCEIFDRDTLAHHTLSGKPSPAFRDCARPSKQQLDPLKVADLVYLMTNSCDMTPREVRTAITTKCADENKMLRSRM\n>6cxa_C mol:protein length:209  Chimeric T cell antigen receptor alpha chain Va14,Va24,Ja18\nMKTQVEQSPQSLVVRQGENCVLQCNYSVTPDNHLRWFKQDTGKGLVSLTVLVDQKDKTSNGRYSATLDKDAKHSTLHITATLLDDTATYICVVGDRGSALGRLHFGAGTQLIVIPDIQNPDPAVYQLRDSKSSDKSVCLFTDFDSQTNVSQSKDSDVYITDKCVLDMRSMDFKSNSAVAWSNKSDFACANAFNNSIIPEDTFFPSPESS\n>5y6p_z6 mol:protein length:177  R-phycoerythrin beta 
chain\nMLDAFSRVVVNSDSKAAYVGGSDLQSLKTFISDGNKRLDAVNCIVSNASCIVSDAISGMICENPGLIAPGGNCYTNRRMAACLRDGEIILRYVSYALLAGDSSVLDDRCLNGLKETYIALGVPTASTSRAVSIMKAASTAFIMNTASGRKIEIAAGDCQALQSEAAAYFDKVGSAVD\n>4r8o_B mol:protein length:104  Uncharacterized protein\nGGNPGDNLIYNAEEVNGVVVSETIFKMEGTMLTNYMKHNYKYDANNQRTEDEAQKWNSNKNRWENNLCIRYTYGNKSMTTEYYKWNSKKKEYILVPEMTVTMDK\n>2big_B mol:protein length:361  PHOSPHOSERINE AMINOTRANSFERASE\nMVKQVFNFNAGPSALPKPALERAQKELLNFNDTQMSVMELSHRSQSYEEVHEQAQNLLRELLQIPNDYQILFLQGGASLQFTMLPMNLLTKGTIGNYVLTGSWSEKALKEAKLLGETHIAASTKANSYQSIPDFSEFQLNENDAYLHITSNNTIYGTQYQNFPEINHAPLIADMSSDILSRPLKVNQFGMIYAGAQKNLGPSGVTVVIVKKDLLNTKVEQVPTMLQYATHIKSDSLYNTPPTFSIYMLRNVLDWIKDLGGAEAIAKQNEEKAKIIYDTIDESNGFYVGHAEKGSRSLMNVTFNLRNEELNQQFLAKAKEQGFVGLNGHRSVGGCRASIYNAVPIDACIALRELMIQFKENA\n>1dmx_A mol:protein length:248  MURINE CARBONIC ANHYDRASE V\nCATGTRQSPINIQWKDSVYDPQLAPLRVSYDAASCRYLWNTGYFFQVEFDDSCEDSGISGGPLGNHYRLKQFHFHWGATDEWGSEHAVDGHTYPAELHLVHWNSTKYENYKKASVGENGLAVIGVFLKLGAHHQALQKLVDVLPEVRHKDTQVAMGPFDPSCLMPACRDYWTYPGSLTTPPLAESVTWIVQKTPVEVSPSQLSMFRTLLFSGRGEEEDVMVNNYRPLQPLRDRKLRSSFRLDRTKMRS\n>6u42_Z7 mol:protein length:451  Tubulin alpha\nMREVISIHIGQAGIQVGNACWELYCLEHGIQPDGQMPSDKTIGGGDDAFNTFFSETGAGKHVPRCIFLDLEPTVVDEVRTGTYRQLFHPEQLISGKEDAANNFARGHYTIGKEIVDLALDRIRKLADNCTGLQGFLVFNAVGGGTGSGLGSLLLERLSVDYGKKSKLGFTVYPSPQVSTAVVEPYNSVLSTHSLLEHTDVAVMLDNEAIYDICRRSLDIERPTYTNLNRLIAQVISSLTASLRFDGALNVDITEFQTNLVPYPRIHFMLSSYAPIISAEKAYHEQLSVAEITNAAFEPASMMVKCDPRHGKYMACCLMYRGDVVPKDVNASVATIKTKRTIQFVDWCPTGFKCGINYQPPTVVPGGDLAKVQRAVCMISNSTAIGEIFSRLDHKFDLMYAKRAFVHWYVGEGMEEGEFSEAREDLAALEKDFEEVGAESAEGAGEGEGEEY\n>3oda_H mol:protein length:116  Poly [ADP-ribose] polymerase 1\nMGSSHHHHHHSSGLVPRGSHMAESSDKLYRVEYAKSGRASCKKCSESIPKDSLRMAIMVQSPMFDGKVPHWYHFSCFWKVGHSIRHPDVEVDGFSELRWDDQQKVKKTAEAGGVTG\n>3kaq_A mol:protein length:147  Flavodoxin\nSKVLILFGSSTGNTESIAQKLEELVAAGGHEVTLLNAAEASADNLADGYDAVLMGCSAWGMEDLELQDDFAPLFDEMENMGLKGKKLAAFASGDMEYEHYCGAVPAIEEKARGLGAEVICEGLKIEGDASSDPDAVSAFAEDVLKKL\n>5xxb_c mol:protein length:120  
Ribosomal protein eL31\nMKGTTRKAQNKSLQPVCRDYTIHLHKLIHGIQFKKRAPRALREIRRFAQKTMHTKDVRIDTKLNKFIWSGGIRNVPRRVRVRIARRRNDDEDSKEKFYTLVQHVPVASFENLKTEYVNEE\n>2j57_B mol:protein length:105  AMICYANIN\nDKATIPSESPFAAAEVADGAIVVDIAKMKYETPELHVKVGDTVTWINREAMPHNVHFVAGVLGEAALKGPMMKKEQAYSLTFTEAGTYDYHCTPHPFMRGKVVVE\n>6y2l_SV mol:protein length:83  40S ribosomal protein S21\nMQNDAGEFVDLYVPRKCSASNRIIGAKDHASIQMNVAEVDKVTGRFNGQFKTYAICGAIRRMGESDDSILRLAKADGIVSKNF\n>7vxc_A mol:protein length:1261  Spike glycoprotein\nMFVFLVLLPLVSSQCVNLTTRTQLPPAYTNSFTRGVYYPDKVFRSSVLHSTQDLFLPFFSNVTWFHAIHVSGTNGTKRFDNPVLPFNDGVYFASTEKSNIIRGWIFGTTLDSKTQSLLIVNNATNVVIKVCEFQFCNDPFLDVYYHKNNKSWMKSEFRVYSSANNCTFEYVSQPFLMDLEGKQGNFKNLREFVFKNIDGYFKIYSKHTPINLVRDLPQGFSALEPLVDLPIGINITRFQTLLALHRSYLTPGDSSSGWTAGAAAYYVGYLQPRTFLLKYNENGTITDAVDCALDPLSETKCTLKSFTVEKGIYQTSNFRVQPTESIVRFPNITNLCPFGEVFNATRFASVYAWNRKRISNCVADYSVLYNSASFSTFKCYGVSPTKLNDLCFTNVYADSFVIRGDEVRQIAPGQTGKIADYNYKLPDDFTGCVIAWNSNNLDSKVGGNYNYRYRLFRKSNLKPFERDISTEIYQAGSTPCNGVQGFNCYFPLQSYGFQPTNGVGYQPYRVVVLSFELLHAPATVCGPKKSTNLVKNKCVNFNFNGLTGTGVLTESNKKFLPFQQFGRDIADTTDAVRDPQTLEILDITPCSFGGVSVITPGTNTSNQVAVLYQGVNCTEVPVAIHADQLTPTWRVYSTGSNVFQTRAGCLIGAEHVNNSYECDIPIGAGICASYQTQTNSRGSASSVASQSIIAYTMSLGAENSVAYSNNSIAIPTNFTISVTTEILPVSMTKTSVDCTMYICGDSTECSNLLLQYGSFCTQLNRALTGIAVEQDKNTQEVFAQVKQIYKTPPIKDFGGFNFSQILPDPSKPSKRSFIEDLLFNKVTLADAGFIKQYGDCLGDIAARDLICAQKFNGLTVLPPLLTDEMIAQYTSALLAGTITSGWTFGAGAALQIPFAMQMAYRFNGIGVTQNVLYENQKLIANQFNSAIGKIQDSLSSTASALGKLQDVVNQNAQALNTLVKQLSSNFGAISSVLNDILSRLDPPEAEVQIDRLITGRLQSLQTYVTQQLIRAAEIRASANLAATKMSECVLGQSKRVDFCGKGYHLMSFPQSAPHGVVFLHVTYVPAQEKNFTTAPAICHDGKAHFPREGVFVSNGTHWFVTQRNFYEPQIITTDNTFVSGNCDVVIGIVNNTVYDPLQPELDSFKEELDKYFKNHTSPDVDLGDISGINASVVNIQKEIDRLNEVAKNLNESLIDLQELGKYEQGSGYIPEAPRDGQAYVRKDGEWVLLSTFLENLYFQGDYKDDDDKHHHHHHHHH\n>6yam_f mol:protein length:71  ribosomal protein eS31\nKKSYTTPKKNKHKRKKVKLAVLKYYKVDENGKISRLRRECPSDECGAGVFMASHFDRHYCGKCCLTYCFNK\n>2fvv_A mol:protein length:194  Diphosphoinositol polyphosphate phosphohydrolase 
1\nMHHHHHHSSGVDLGTENLYFQSMMKLKSNQTRTYDGDGYKKRAACLCFRSESEEEVLLVSSSRHPDRWIVPGGGMEPEEEPSVAAVREVCEEAGVKGTLGRLVGIFENQERKHRTYVYVLIVTEVLEDWEDSVNIGRKREWFKIEDAIKVLQYHKPVQASYFETLRQGYSANNGTPVVATTYSVSAQSSMSGIR\n>4fna_C mol:protein length:280  Ferric hydroxamate receptor 2\nGSNNKAETKSYKMDDGKTVDIPKDPKRIAVVAPTYAGGLKKLGANIVAVNQQVDQSKVLKDKFKGVTKIGDGDVEKVAKEKPDLIIVYSTDKDIKKYQKVAPTVVVDYNKHKYLEQQEMLGKIVGKEDKVKAWKKDWEETTAKDGKEIKKAIGQDATVSLFDEFDKKLYTYGDNWGRGGEVLYQAFGLKMQPEQQKLTAKAGWAEVKQEEIEKYAGDYIVSTSEGKPTPGYESTNMWKNLKATKEGHIVKVDAGTYWYNDPYTLDFMRKDLKEKLIKAAK\n>3zw8_A mol:protein length:742  PEROXISOMAL BIFUNCTIONAL ENZYME\nMGSSHHHHHHSSGLVPRGSHMAEYLRLPHSLAMIRLCNPPVNAVSPTVIREVRNGLQKAGSDHTVKAIVICGANGNFCAGADIHGFSAFTPGLALGSLVDEIQRYQKPVLAAIQGVALGGGLELALGCHYRIANAKARVGLPEVTLGILPGARGTQLLPRVVGVPVALDLITSGKYLSADEALRLGILDAVVKSDPVEEAIKFAQKIIDKPIEPRRIFNKPVPSLPNMDSVFAEAIAKVRKQYPGVLAPETCVRSIQASVKHPYEVGIKEEEKLFMYLRASGQAKALQYAFFAEKSANKWSTPSGASWKTASAQPVSSVGVLGLGTMGRGIAISFARVGISVVAVESDPKQLDAAKKIITFTLEKEASRAHQNGQASAKPKLRFSSSTKELSTVDLVVEAVFEDMNLKKKVFAELSALCKPGAFLCTNTSALNVDDIASSTDRPQLVIGTHFFSPAHVMRLLEVIPSRYSSPTTIATVMSLSKKIGKIGVVVGNCYGFVGNRMLAPYYNQGFFLLEEGSKPEDVDGVLEEFGFKMGPFRVSDLAGLDVGWKIRKGQGLTGPSLPPGTPVRKRGNSRYSPLGDMLCEAGRFGQKTGKGWYQYDKPLGRIHKPDPWLSTFLSQYREVHHIEQRTISKEEILERCLYSLINEAFRILEEGMAARPEHIDVIYLHGYGWPRHKGGPMFYAASVGLPTVLEKLQKYYRQNPDIPQLEPSDYLRRLVAQGSPPLKEWQSLAGPHGSKL\n>7ad0_M mol:protein length:14  Modified p53 peptide\nATSFAEYWALLXPA\n>2d0c_A mol:protein length:310  ribonuclease HIII\nMSNYVIQADQQLLDALRAHYEGALSDRLPAGALFAVKRPDVVITAYRSGKVLFQGKAAEQEAAKWISGASASNETADHQPSALAAHQLGSLSAIGSDEVGTGDYFGPIVVAAAYVDRPHIAKIAALGVKDSKQLNDEAIKRIAPAIMETVPHAVTVLDNPQYNRWQRSGMPQTKMKALLHNRTLVKLVDAIAPAEPEAIIIDEFLKRDSYFRYLSDEDRIIRERVHCLPKAESVHVSVAAASIIARYVFLEEMEQLSRAVGLLLPKGAGAIVDEAAARIIRARGEEMLETCAKLHFANTKKALAIAKRRK\n>6ba1_O mol:protein length:321  Inosine-uridine preferring nucleoside 
hydrolase\nGSHMKKLILDLDTGVDDTLAISYALGSPEMELIGITGTYGNVLMEQGVRNALAITDLLGHPEVKVYKGLSHASTKDSFEVLPISAFIHGDNGIGDVEIPDSPRKAEDESAVDFIIDSVKKYGKDLVYVPTGPMTNIAAALKKAPEIKDEIGKIVLMGGALTIHGNVNAWTEANISQDPDAADILFRSGAPVTMIGLDVTLQTLLTYKETKQWRDLNTKAGKFLADMTDFYIKAYETTAPHLGGCGLHDPLAVAVAVDPTLVTTLPINMQVDVEGPTRGRTIGDVTRLNDPVKTMQVAVGVDVPRFLNEFMTRISGLAKIAG\n>3fch_B mol:protein length:281  Carboxysome shell protein CsoS1D\nMSYYHHHHHHDYDIPTTENLTFQGAMEPTSSLNRGDRKKGSSLVTGSEVQSQSNGASCFITTDSEKSLVSRQASQVEQIELRTYVFLDSLQPQLAAYMGTVSRGFLPIPGDSCLWMEVSPGMAVHRVTDIALKASNVRLGQMIVERAFGSLALYHKDQSTVLHSGDVVLDAIGSEVRKRTKPSTSWTEVICAITPDHAVLINRQNRSGSMIQSGMSMFILETEPAGYVLKAANEAEKSANITIIDVKAVGAFGRLTLAGKEGDVEEAAAAAIRAIDQISNY\n>3r37_B mol:protein length:151  4-hydroxybenzoyl-CoA thioesterase\nMHRTSNGSHATGGNLPDVASHYPVAYEQTLDGTVGFVIDEMTPERATASVEVTDTLRQRWGLVHGGAYCALAQMLATEATVAVVHEKGMMAVGQSNHTSFFRPVKEGHVRAEAVRIHAGSTTWFWDVSLRDDAGRLCAVSSMSIAVRPRRD\n>7zpp_G mol:protein length:281  Integrase\nWIENIPLAEEEHNKWHQDAVSLHLEFGIPRTAAEDIVQQCDVCQENKMPSTLRGSNKRGIDHWQVDYTHYEDKIILVWVETNSGLIYAERVKGETGQEFRVQTMKWYAMFAPKSLQSDNGPAFVAESTQLLMKYLGIEHTTGIPWNPQSQALVERTHQTLKNTLEKLIPMFNAFESALAGTLITLNIKRKGGLGTSPMDIFIFNKEQQRIQQQSKSKQEKIRFCYYRTRKRGHPGEWQGPTQVLWGGDGAIVVKDRGTDRYLVIANKDVKFIPPPKEIQKE\n>3aty_B mol:protein length:379  Prostaglandin F2a synthase\nMATFPELLRPLKLGRYTLRNRIIMAPLTRCQATEDDHVPRTESMLKYYEDRASAGLIIAEATMVQPNYTGFLTEPGIYSDAQIEEWRKIVDAVHKKGGLIFLQLIHAGRAGIPEKILQQSKSDQDPLAGRLLAASAIPIKDHRIPAYFAASGEKETYGVPEELTDDEVRDGIIPLFVEGAKNAIFKAGFDGVEIHGANGYLLDAFFRESSNKRQSGPYAGTTIDTRCQLIYDVTKSVCDAVGSDRVGLRISPLNGVHGMIDSNPEALTKHLCKKIEPLSLAYLHYLRGDMVNQQIGDVVAWVRGSYSGVKISNLRYDFEEADQQIREGKVDAVAFGAKFIANPDLVERAQQNWPLNEPRPETYYTRTAVGYNDYPTYNK\n>3rkc_A mol:protein length:148  Capsid protein\nSRPFSVLRANDVLWLSLTAAEYDQTTYGSSTNPMYVSDTVTFVNVATGAQGVSRSLDWSKVTLDGRPLTTIQQYSKTFFVLPLRGKLSFWEAGTTKAGYPYNYNTTASDQILIENAPGHRVCISTYTTNLGSGPVSISAVGVLAPHSA\n>3gew_B mol:protein length:224  Chaperone protein 
faeE\nSLAVDQTRYIFRGDKDALTITVTNNDKERTFGGQAWVDNIVEKDTRPTFVVTPSFFKVKPNGQQTLRIIMASDHLPKDKESVYWLNLQDIPPALEGSGIAVALRTKLKLFYRPKALLEGRKGAEEGISLQSRPDGRTMLVNTTPYIFAIGSLLDGNGKKIATDNGTTQKLLMFMPGDEVQVKGNVVKVDSLNDYGELQTWTINKKKPAAPEAAKAEKADTAEQK\n>2zmv_A mol:protein length:227  Trafficking protein particle complex subunit 4\nMAIFSVYVVNKAGGLIYQLDSYAPRAEAEKTFSYPLDLLLKLHDERVLVAFGQRDGIRVGHAVLAINGMDVNGRYTADGKEVLEYLGNPANYPVSIRFGRPRLTSNEKLMLASMFHSLFAIGSQLSPEQGSSGIEMLETDTFKLHCYQTLTGIKFVVLADPRQAGIDSLLRKIYEIYSDFALKNPFYSLEMPIRCELFDQNLKLALEVAEKAGTFGPGSLEHHHHHH\n>6y7f_A mol:protein length:288  Elongation of very long chain fatty acids protein 7\nMAFSDLTSRTVHLYDNWIKDADPRVEDWLLMSSPLPQTILLGFYVYFVTSLGPKLMENRKPFELKKAMITYNFFIVLFSVYMCYEFVMSGWGIGYSFRCDIVDYSRSPTALRMARTCWLYYFSKFIELLDTIFFVLRKKNSQVTFLHVFHHTIMPWTWWFGVKFAAGGLGTFHALLNTAVHVVMYSYYGLSALGPAYQKYLWWKKYLTSLQLVQFVIVAIHISQFFFMEDCKYQFPVFACIIMSYSFMFLLLFLHFWYRAYTKGQRLPKTVKNGTCKNKDNAENLYFQ\n>3ejm_A mol:protein length:146  Nucleoside diphosphate kinase\nYKKAGLQRTLVLIKPDAFERSLVAEIMGRIEKKNFKIVSMKFWSKAPRNLIEQHYKEHSEQSYFNDNCDFMVSGPIISIVYEGTDAISKIRRLQGNTNPLASAPGTIRGDLANDIRENLIHASDSEDSAVDEISIWFPETKMETDN\n>4hem_E mol:protein length:123  Anti-baseplate TP901-1 Llama vHH 02\nQVQLVESGGGLVQAGGSLRLSCAASESTFSNYAMGWFRQAPGPEREFVATISQTGSHTYYRNSVKGRFTISRDNAKNTVYLQMNNMKPEDTAVYYCAAGDNYYYTRTYEYDYWGQGTQVTVSS\n>3njk_A mol:protein length:128  Peptidase\nSNAMFAPQGLAQFIKVNVTLENGEPVFIYTDANGQVCQGDITVTQAGTITYLLNDQTLKGLKFVGVGFVTPFDGIIDAVTISSDGMLVQLVDLDKTPGTTKFQFVLSNTANTLLVLSPAPQIINRPQN\n>2xwq_B mol:protein length:133  SIROHYDROCHLORIN COBALTOCHELATASE\nGMRRGLVIVGHGSQLNHYREVMELHRKRIEESGAFDEVKIAFAARKRRPMPDEAIREMNCDIIYVVPLFISYGLHVTEDLPDLLGFPRGRGIKEGEFEGKKVVICEPIGEDYFVTYAILNSVFRIGRDGKGEE\n>7spi_F3 mol:protein length:453  
TraB\nMANVNKVVRRRQVALLIALVLGIGAGGAGTWMVSEMNLKKAPPAKAPKGEPAPDMTGVVNQSFDNKVQRSAIAEAQRLNKETQTEIKKLRTEMGLVSRDLKGSQDRIRELEDQNQLLQTQLEAGKNFDSLSAEPLPGALASQGKPAPAGNVPPPTSFWPAGGGQAPAAPVMTPIQRPGMMDSQEFSLPDTGPKKPRFPWISSGSFVEAIVVEGADANASVTGDKNTAPMQLRLTGKVQMPNDEEFDLTGCFVTLEAWGDVSSERAIVRSRSISCKLGDDDIDQKIAGHVSFMGKNGIKGEVVMRNGQILLYAGGAGFLDGIGKGIEKASSTTVGVGATASMSAADIGQAGLGGGVSSAAKTLSDYYIKRAEQYHPVIPIGAGNEVTLVFQDGFQLETLEEARAKAAARKKQNQPSASSTPAAMPGNTPDMLKQLQDFRVGDTVDPATGQVVTQ\n>4clr_D mol:protein length:288  PTERIDINE REDUCTASE 1\nMGSSHHHHHHSSGLVPRGSHMEAPAAVVTGAAKRIGRAIAVKLHQTGYRVVIHYHNSAEAAVSLADELNKERSNTAVVCQADLTNSNVLPASCEEIINSCFRAFGRCDVLVNNASAFYPTPLVQGDHEDNSNGKTVETQVAELIGTNAIAPFLLTMSFAQRQKGTNPNCTSSNLSIVNLCDAMVDQPCMAFSLYNMGKHALVGLTQSAALELAPYGIRVNGVAPGVSLLPVAMGEEEKDKWRRKVPLGRREASAEQIADAVIFLVSGSAQYITGSIIKVDGGLSLVHA\n>4u50_C0 mol:protein length:105  40S ribosomal protein S10-A\nMLMPKEDRNKIHQYLFQEGVVVAKKDFNQAKHEEIDTKNLYVIKALQSLTSKGYVKTQFSWQYYYYTLTEEGVEYLREYLNLPEHIVPATYIQERNPTQRPQRRY\n>7ezx_G8 mol:protein length:177  B-phycoerythrin beta chain\nMLDAFSRVVVNSDAKAAYVGGSDLQALKSFIADGNKRLDAVNSIVSNASCMVSDAVSGMICENPGLISPGGNCYTNRRMAACLRDGEIILRYVSYALLAGDASVLEDRCLNGLKETYIALGVPTNSSIRAVSIMKAQAVAFITNTATERKMSFAAGDCTSLASEVASYFDRVGAAIS\n>5da5_c mol:protein length:116  Rru_A0973\nMAQSSNSTHEPLEVLKEETVNRHRAIVSVMEELEAVDWYDQRVDASTDPELTAILAHNRDEEKEHAAMTLEWLRRNDAKWAEHLRTYLFTEGPITAANSSSVDKLAAALEHHHHHH\n>2amf_A mol:protein length:259  1-Pyrroline-5-Carboxylate reductase\nSNAMKIGIIGVGKMASAIIKGLKQTPHELIISGSSLERSKEIAEQLALPYAMSHQDLIDQVDLVILGIKPQLFETVLKPLHFKQPIISMAAGISLQRLATFVGQDLPLLRIMPNMNAQILQSSTALTGNALVSQELQARVRDLTDSFGSTFDISEKDFDTFTALAGSSPAYIYLFIEALAKAGVKNGIPKAKALEIVTQTVLASASNLKTSSQSPHDFIDAICSPGGTTIAGLMELERLGLTATVSSAIDKTIDKAKSL\n>4v5r_AJ mol:protein length:105  30S RIBOSOMAL PROTEIN S10\nMPKIRIKLRGFDHKTLDASAQKIVEAARRSGAQVSGPIPLPTRVRRFTVIRGPFKHKDSREHFELRTHNRLVDIINPNRKTIEQLMTLDLPTGVEIEIKTVGGGR\n>7n02_B mol:protein length:362  Aminopeptidase P family 
protein\nMSKIERISAFLNDKEVDMTFITNPTTLNYLTGLAISPHERIAGLMIFRDSTPMLFTPALEVEKAKEHTSGLDIFGYEDSQNPWEVVKNHVKSDVKSIAVEFSDIPLAKTEGLKAQFGDINFVNLTPLIERMRLIKSADEIEKMKVAGDFADKCFEIGFATAAERNGVTESDIVAKIEYEMKRMGVPQMSFDTLVLSGARAANPHGAPENVEIQENKLLLFDLGVMSGGYASDATRTIAIGQPNDFDAEIHKIVKEAQQAAMDFIKPGVTAHEVDAVARDLITKAGYGEYFNHRLGHGIGMDVHEYPSIVAGNDLVIQEGMCFSNEPGIYIPGKVGVRIEDCLYVTENGCESFTHTDHDLLIF\n>2ivq_J mol:protein length:156  CYANATE HYDRATASE\nMIQSQINRNIRLDLADAILLSKAKKDLSFAEIADGTGLAEAFVTAALLGQQALPADAARLVGAKLDLDEDSILLLQMIPLRGCIDDRIPTDPTMYKFYEMLQVYGTTLKALVHEKFGDGIISAINFKLDVKKVADPEGGERAVITLDGKYLPTKPF\n>2p1n_D mol:protein length:160  SKP1-like protein 1A\nMSAKKIVLKSSDGESFEVEEAVALESQTIAHMVEDDCVDNGVPLPNVTSKILAKVIEYCKRHVEAAASKAEAVEGAATSDDDLKAWDADFMKIDQATLFELILAANYLNIKNLLDLTCQTVADMIKGKTPEEIRTTFNIKNDFTPEEEEEVRRENQWAFE\n>6png_A mol:protein length:421  Nitric oxide synthase, brain\nCPRFLKVKNWETEVVLTDTLHLKSTLETGCTEYICMGSIMHPSQHARRPEDVATKDQLFPLAKEFIDQYYSSIKRFGSKAHMERLEEVNKEIDTTSTYQLKDTELIYGAKHAWRNASRCVGRIQWSKLQVFDARDCTTAHGMFNYICNHVKYATNKGNLRSAITIFPQRTDGKHDFRVWNSQLIRYAGYKQPDGSTLGDPANVQFTEICIQQGWKPPRGRFDVLPLLLQANGNDPELFQIPPELVLEVPIRHPKFEWFKDLGLKWYGLPAVSNMLLEIGGLEFSACPFSGWYMGTEIGVRDYCDNSRYNILEEVAKKMNLDMRKTSSLWKDQALVEINIAVLYSFQSDKVTIVDHHSATESFIKHMENEYRCRGGCPADWVWIVPPMSGSITPVFHQEMLNYRLTPSFEYQPDPWNTHVWK\n>4v55_DR mol:protein length:103  50S ribosomal protein L21\nMYAVFQSGGKQHRVSEGQTVRLEKLDIATGETVEFAEVLMIANGEEVKIGVPFVDGGVIKAEVVAHGRGEKVKIVKFRRRKHYRKQQGHRQWFTDVKITGISA\n>5y6p_v1 mol:protein length:161  beta_APC\nMQDAITAVINTADVQGKYLDDNSLDKLRGYFETGELRVRAAATIAANAATIIKESVAKALLYSDITRPGGNMYTTRRYAACIRDLDYYLRYATYGMLAGDPSILDERVLNGLKETYNSLGVPIGATVQAIQAMKEVTASLVGTNAGQEMAVYFDYICSGLS\n>1lqo_A mol:protein length:135  PROBABLE Fosfomycin Resistance Protein\nMLTGLNHLTLAVADLPASIAFYRDLLGFRLEARWDQGAYLELGSLWLCLSREPQYGGPAADYTHYAFGIAAADFARFAAQLRAHGVREWKQNRSEGDSFYFLDPDGHRLEAHVGDLRSRLAACRQAPYAGMRFAD\n>1z5n_B mol:protein length:242  MTA/SAH 
nucleosidase\nFQGAMDPEFSMKIGIIGAMEEQVTLLRDKIENRQTISLGGCEIYTGQLNGTEVALLKSGIGKVAAALGATLLLEHCKPDVIINTGSAGGLAPTLKVGDIVVSDEARYHDADVTAFGYEYGQLPGCPAGFKADDKLIAAAEACIAELNLNAVRGLIVSGDAFINGSVGLAKIRHNFPQAIAVEMEATAIAHVCHNFNVPFVVVRAISDVADQQSHLSFDEFLAVAAKQSSLMVESLVQKLAHG\n>2xm1_A mol:protein length:716  O-GLCNACASE BT_4395\nQNVSLQPPPQQLIVQNKTIDLPAVYQLNGGEEANPHAVKVLKELLSGKQSSKKGMLISIGEKGDKSVRKYSRQIPDHKEGYYLSVNEKEIVLAGNDERGTYYALQTFAQLLKDGKLPEVEIKDYPSVRYRGVVEGFYGTPWSHQARLSQLKFYGKNKMNTYIYGPKDDPYHSAPNWRLPYPDKEAAQLQELVAVANENEVDFVWAIHPGQDIKWNKEDRDLLLAKFEKMYQLGVRSFAVFFDDISGEGTNPQKQAELLNYIDEKFAQVKPDINQLVMCPTEYNKSWSNPNGNYLTTLGDKLNPSIQIMWTGDRVISDITRDGISWINERIKRPAYIWWNFPVSDYVRDHLLLGPVYGNDTTIAKEMSGFVTNPMEHAESSKIAIYSVASYAWNPAKYDTWQTWKDAIRTILPSAAEELECFAMHNSDLGPNGHGYRREESMDIQPAAERFLKAFKEGKNYDKADFETLQYTFERMKESADILLMNTENKPLIVEITPWVHQFKLTAEMGEEVLKMVEGRNESYFLRKYNHVKALQQQMFYIDQTSNQNPYQPGVKTATRVIKPLIDRTFATVVKFFNQKFNAHLDATTDYMPHKMISNVEQIKNLPLQVKANRVLISPANEVVKWAAGNSVEIELDAIYPGENIQINFGKDAPCTWGRLEISTDGKEWKTVDLKQKESRLSAGLQKAPVKFVRFTNVSDEEQQVYLRQFVLTIEKK\n>3dll_2 mol:protein length:47  50S ribosomal protein L34\nMKRTYQPNNRKRAKTHGFRARMKTKSGRNILARRRAKGRHQLTVSDE\n>4cub_B mol:protein length:183  BETA-GALACTOSIDASE\nQTEQGANISDQWTGSELPLAFASDSNPSDPVSNVNDKLISYNNQPANRWTNWNRSNPEASVGVLFGDSGILSKRSVDNLSVGFHEDHGVGAPKSYVIEYYVGKTVPTAPKNPSFVGNEDHVFNDSANWKPVTNLKAPAQLKAGEMNHFSFDKVETYAIRIRMVKADNKRGTSITEVQIFAKQV\n>1otr_B mol:protein length:76  Ubiquitin\nMQIFVKTLTGKTITLEVESSDTIDNVKSKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGG\n>2oig_A mol:protein length:111  RS21-C6\nGPLGSRPFRFSPEPTLEDIRRLHAEFAAERDWEQFHQPRNLLLALVGEVGELAELFQWKSDTEPGPQAWPPKERAALQEELSDVLIYLVALAARCHVDLPQAVISKMDTNR\n>5vhr_E mol:protein length:262  26S proteasome regulatory subunit 10B\nGNVSYSEIGGLSEQIRELREVIELPLTNPELFQRVGIIPPKGCLLYGPPGTGKTLLARAVASQLDCNFLKVVSSSIVDKYIGESARLIREMFNYARDHQPCIIFMDEIDAIGGRRFSEGTSADREIQRTLMELLNQMDGFDTLHRVKMIMATNRPDTLDPALLRPGRLDRKIHIDLPNEQARLDILKIHAGPITKHGEIDYEAIVKLSDGFNGADLRNVCTEAGMFAIRADHDFVVQEDFMKAVRKVADSKKLESKLDYKPV\n>6zke_s 
mol:protein length:137  NADH:ubiquinone oxidoreductase subunit B7\nMGAHLARRYLGDASVEPEPLRMPTFPPDYGFPERKEREMVATQQEMNDAQLVLQQRDYCAHYLIRFLKCKRDSFPNFLACKHEQHDWDYCEHLDYVKRMKEFERERRLLQRKKRREQREADMAKGLGPGEVAPEVAL\n>7lmx_C mol:protein length:75  Integrin inhibitor\nSTKCVVRFVFRGDLATLMLRAVKDHLKKEGPHWNITSTNNGAELVVRGIHESDAKRIAKWVEKRFPGVHTETQCD\n>6qn7_L mol:protein length:216  Light chain of bovine anti-RSV B13\nQAVLTQPPSVSGSLGQRVSITCSGSSDNIGIFAVGWYQQVPGSGLRTIIYGNTKRPSGVPDRFSGSKSGNTATLTINSLQAEDEADYFCVCGESKSATPVFGGGTTLTVLGQPKSPPSVTLFPPSTEELNGNKATLVCLISDFYPGSVTVVWKADGSTITRNVETTRASKQSNSKYAASSYLSLTSSDWKSKGSYSCEVTHEGSTVTKTVKPSECS\n>5b00_A mol:protein length:294  MoeN5\nMAHHHHHHVDDDDKAASWSHPQFEKGAENLYFQSMLAAEAANRDHVTRCVAQTGGSPDLVAHTAALRLYLRVPHFLTEWTTDPDRRAAVSRALALDIVSMKLLDDLMDDDTGLDRVELACVCLRLHLRALHELESLARDPKAVTDILEQDAVHLCGGQIRTKRSRATNLREWRAHASTYGSTFLGRYGALAAACGGEGQPADSVREFAEAFAMTITMADDLTDYDRNGERDGNLAHLMRTGAVAGQDVVDLLEELRGRALAAVAAPPGAPGLVPVVHLYTDDVLVRLLPRHLGE\n>6iqt_D mol:protein length:166  Cag pathogenicity island protein (Cag10)\nGTSSMADIGSGEFKIVKRSDARQIVNSEAVVDSATSKFVSLLFGYSKNSLRDRKDQLMQYCDVSFQTQAMRMFNENIRQFVDKVRAEAIISSNIQREKVKNSPLTRLTFFITIKITPDTMENYEYITKKQVTIYYDFARGNSSQENLIINPFGFKVFDIQITDLQN\n>4o26_A mol:protein length:257  Telomerase reverse transcriptase\nGSGFLYGGRGMHGFCLNRKRRTAAGPRRLQGQDLVRLVFFEGLPYLNGQERKPKKLPLRYFNMVPVFGRLLQRHRKCRYSSVLHRMCPVVELSRAAQGELSSLIPQHCAPHRVYLFVRECLTAVVPEELWGSDHNRLQFFSRVRGFLKSGKFERISVAELMWKIKVMDCDWLKLRRTAGRFPPSELAYRTRILSQFLTWLLDGFVVGLVRACFYATESVGQKNAIRFYRQEVWSKLQDLAFRRHIAKGEMEELSPAQ\n>8d0k_B mol:protein length:374  CST complex subunit STN1\nMHHHHHHQPGSSRCEEETPSLLWGLDPVFLAFAKLYIRDILDMKESRQVPGVFLYNGHPIKQVDVLGTVIGVRERDAFYSYGVDDSTGVINCICWKKLNTESVSAAPSAARELSLTSQLKKLQETIEQKTKIEIGDTIRVRGSIRTYREEREIHATTYYKVDDPVWNIQIARMLELPTIYRKVYDQPFHSSALEKEEALSNPGALDLPSLTSLLSEKAKEFLMENRVQSFYQQELEMVESLLSLANQPVIHSASSDQVNFKKDTTSKAIHSIFKNAIQLLQEKGLVFQKDDGFDNLYYVTREDKDLHRKIHRIIQQDCQKPNHMEKGCHFLHILACARLSIRPGLSEAVLQQVLELLEDQSDIVSTMEHYYTAF\n>7mus_FD mol:protein length:163  
DotD\nMNNNKIVIMFIFSALLAGCAGTMKFKKPPINNPSDDATIKLAEAAVSVSDSMLEMAKVEKVITPPSKDNTLTIPNAYNLQARASVDWSGPIEELTARIAKAAHFRFRVLGKSPSVPVLISISTKDESLAEILRDIDYQAGKKASIHVYPNSQVVELRYAKIYS\n>2olh_A mol:protein length:361  Chitinase-3-like protein 1\nYKLICYYTSWSQYREGDGSCFPDAIDPFLCTHVIYSFANISNNEIDTWEWNDVTLYDTLNTLKNRNPKLKTLLSVGGWNFGPERFSKIASKTQSRRTFIKSVPPFLRTHGFDGLDLAWLYPGRRDKRHLTALVKEMKAEFAREAQAGTERLLLSAAVSAGKIAIDRGYDIAQISRHLDFISLLTYDFHGAWRQTVGHHSPLFRGNSDASSRFSNADYAVSYMLRLGAPANKLVMGIPTFGRSFTLASSKTDVGAPISGPGIPGRFTKEKGILAYYEICDFLHGATTHRFRDQQVPYATKGNQWVAYDDQESVKNKARYLKNRQLAGAMVWALDLDDFRGTFCGQNLTFPLTSAVKDVLARV\n>6ue6_D mol:protein length:141  Histone-lysine N-methyltransferase NSD2\nGGRDKDHLLKYNVGDLVWSKVSGYPWWPCMVSADPLLHSYTKLKGQKKSARQYHVQFFGDAPERAWIFEKSLVAFEGEGQFEKLCQESAKQAPTKAEKIKLLKPISGKLRAQWEMGIVQAEEAASMSVEERKAKFTFLYVG\n>2nvy_C mol:protein length:318  DNA-directed RNA polymerase II 45 kDa polypeptide\nMSEEGPQVKIREASKDNVDFILSNVDLAMANSLRRVMIAEIPTLAIDSVEVETNTTVLADEFIAHRLGLIPLQSMDIEQLEYSRDCFCEDHCDKCSVVLTLQAFGESESTTNVYSKDLVIVSNLMGRNIGHPIIQDKEGNGVLICKLRKGQELKLTCVAKKGIAKEHAKWGPAAAIEFEYDPWNKLKHTDYWYEQDSAKEWPQSKNCEYEDPPNEGDPFDYKAQADTFYMNVESVGSIPVDQVVVRGIDTLQKKVASILLALTQMDQDKVNFASGDNNTASNMLGSNEDVMMTGAEQDPYSNASQMGNTGSGGYDNAW\n>2vd0_D mol:protein length:199  GLUTATHIONE-REQUIRING PROSTAGLANDIN D SYNTHASE\nMPNYKLTYFNMRGRAEIIRYIFAYLDIQYEDHRIEQADWPEIKSTLPFGKIPILEVDGLTLHQSLAIARYLTKNTDLAGNTEMEQCHVDAIVDTLDDFMSCFPWAEKKQDVKEQMFNELLTYNAPHLMQDLDTYLGGREWLIGNSVTWADFYWEICSTTLLVFKPDLLDNHPRLVTLRKKVQAIPAVANWIKRRPQTKL\n>1yf1_B mol:protein length:186  Alkyl hydroperoxide reductase subunit C\nSLINTKIKPFKNQAFKNGEFIEVTEKDTEGRWSVFFFYPADFTFVCPTELGDVADHYEELQKLGVDVYSVSTDTHFVHKAWHSSSETIAKIKYAMIGDPTGALTRNFDNMREDEGLADRATFVVDPQGIIQAIEVTAEGIGRDASDLLRKIKAAQYVAAHPGEVCPAKWKEGEATLAPSLDLVGKI\n>4g4s_B mol:protein length:250  Proteasome component 
Y7\nMTDRYSFSLTTFSPSGKLGQIDYALTAVKQGVTSLGIKATNGVVIATEKKSSSPLAMSETLSKVSLLTPDIGAVYSGMGPDYRVLVDKSRKVAHTSYKRIYGEYPPTKLLVSEVAKIMQEATQSGGVRPFGVSLLIAGHDEFNGFSLYQVDPSGSYFPWKATAIGKGSVAAKTFLEKRWNDELELEDAIHIALLTLKESVEGEFNGDTIELAIIGDENPDLLGYTGIPTDKGPRFRKLTSQEINDRLEAL\n>6mjz_C mol:protein length:495  Fusion glycoprotein F0\nQIDITKLQHVGVLVNSPKGMKISQNFETRYLILSLIPKIEDSNSCGDQQIKQYKRLLDRLIIPLYDGLKLQKDVIVTNQESNENTDPRTERFFGGVIGTIALGVATSAQITAAVALVEAKQAKSDIEKLKEAIRDTNKAVQSVCSSVGNCIVAIKSVQDYVNKEIVPSIARLGCEAAGLQLGIALTQHYSELTNCFGDNIGSLQEKGIKLQCIASLYRTNITEIFTTSTVDKYDIYDLLFTESIKVRVIDVDLNDYSITLQVRLPLLTRLLNTQIYKVDSISYNIQNREWYIPLPSHIMTKGAFLGGADVKECIEAFSSYICPSDPGFVLNHEMESCLSGNISQCPRTTVTSDIVPRYAFVNGGVVANCITTTCTCNGIGNRINQPPDQGVKIITHKECNTIGINGMLFNTNKEGTLAFYTPDDITLNNSVALDPIDISIELNKVKSDLEESKEWYRRSNQKLSAIEDKIEEILSKIYHIENEIARIKKLIGEAP\n>5vbr_A mol:protein length:113  Bromodomain testis-specific protein\nGAASTNQLQYLQKVVLKDLWKHSFSWPFQRPVDAVKLQLPDYYTIIKNPMDLNTIKKRLENKYYAKASECIEDFNTMFSNCYLYNKPGDDIVLMAQALEKLFMQKLSQMPQEE\n>1wuu_B mol:protein length:399  Galactokinase\nMAHHHHHHAALRQPQVAELLAEARRAFREEFGAEPELAVSAPGRVNLIGEHTDYNQGLVLPMALELMTVLVGSPRKDGLVSLLTTSEGADEPQRLQFPLPTAQRSLEPGTPRWANYVKGVIQYYPAAPLPGFSAVVVSSVPLGGGLSSSASLEVATYTFLQQLCPDSGTIAARAQVCQQAEHSFAGMPCGIMDQFISLMGQKGHALLIDCRSLETSLVPLSDPKLAVLITNSNVRHSLASSEYPVRRRQCEEVARALGKESLREVQLEELEAARDLVSKEGFRRARHVVGEIRRTAQAAAALRRGDYRAFGRLMVESHRSLRDDYEVSCPELDQLVEAALAVPGVYGSRMTGGGFGGCTVTLLEASAAPHAMRHIQEHYGGTATFYLSQAADGAKVLCL\n>1wp9_D mol:protein length:494  ATP-dependent RNA helicase, 
putative\nMVLRRDLIQPRIYQEVIYAKCKETNCLIVLPTGLGKTLIAMMIAEYRLTKYGGKVLMLAPTKPLVLQHAESFRRLFNLPPEKIVALTGEKSPEERSKAWARAKVIVATPQTIENDLLAGRISLEDVSLIVFDEAHRAVGNYAYVFIAREYKRQAKNPLVIGLTASPGSTPEKIMEVINNLGIEHIEYRSENSPDVRPYVKGIRFEWVRVDLPEIYKEVRKLLREMLRDALKPLAETGLLESSSPDIPKKEVLRAGQIINEEMAKGNHDLRGLLLYHAMALKLHHAIELLETQGLSALRAYIKKLYEEAKAGSTKASKEIFSDKRMKKAISLLVQAKEIGLDHPKMDKLKEIIREQLQRKQNSKIIVFTNYRETAKKIVNELVKDGIKAKRFVGQASKENDRGLSQREQKLILDEFARGEFNVLVATSVGEEGLDVPEVDLVVFYEPVPSAIRSIQRRGRTGRHMPGRVIILMAKGTRDEAYYWSSRQKEKIMQE\n>6mxv_B mol:protein length:252  Rhodanese-like family protein\nMKIMQHSSGFLKLVDDAKSRIQECSVDDIQKMNETQTLDGLLIDTREESEVANGYIPNAIHLSKGIIESAIESAVPNKNQKMYFYCGGGFRSALVADKLREMGYKNVISVDGGWRAWNAKGYPTVSPNQFRPNEFLKLVNNAKTQIKECSTTELYNKINSQELDGIVFDVREDSEFNRFHIQGATHLSKGQIEVKIENLVPNKQQKIYLYCGSGFRSALAAESLQHMGYTNVVSIAGGIKDWLANNYPVSQN\n>6owg_B9 mol:protein length:113  Microcompartments protein\nMAVAVGMIETLGFPAVVEAADAMVKAARVTLVGYEKIGTGRVTVIVRGDVSEVQASVSAGTESVKRVNGGQVLSTHIIARPHENLEYVLPIRYTEEVEQFREGVGTPRNITRQ\n>6x6s_IC mol:protein length:481  Type IV secretion system apparatus protein Cag3\nMFRKLATAVSLIGLLTSNTLYAKEISEADKVIKATKETKETKKEAKRLKKEAKQRQQIPDHKKPQYVSVDDTKTQALFDIYDTLNVNDKSFGDWFGNSALKDKTYLYAMDLLDYNNYLSIENPIIKTRAMGTYADLIIITGSLEQVNGYYNILKALNKRNAKFVLKINENMPYAQATFLRVPKRSDPNAHTLDKGASIDENKLFEQQKKMYFNYANDVICRPDDEVCSPLRDEMVAMPTSDSVTQKPNIIAPYSLYRLKETNNANEAQPSPYATATAPENSKEKLIEELIANSQLVANEEEREKKLLAEKEKQEAELAKYKLKDLENQKKLKALEAELKKKNAKKPRVVEVPVSPQTSNSDETMRVVKEKENYNGLLVDKETTIKRSYEGTLISENSYSKKTPLNPNDLRSLEEEIKSYYIKSNGLCYTNGINLYVKIKNDPYKEGMLCGYESVQNLLSPLKDKLKYDKQKLQKALLKDSK\n>6th6_Al mol:protein length:135  30S ribosomal protein S9\nMRVIQTAGKRKTAVARATIREGKGRVRINHKPVEIIEPEIARFTIMEPLILAGEEIVSRVDIDVKVEGGGFMGQAEAARVAIARALVEWTNDMNLKEKFMKYDRTMLVGDSRRTEPHKPNRSTKGPRAKRQKSYR\n>6lvv_G mol:protein length:775  N,N-dimethylformamidase large 
subunit\nMKDIAIRGYCDRPSVATGETIRFYVSANETRGTFDAELVRLIHGDSNPAGPGYKEEAIKSDLEGQYPARFQRTQFGSYVEVADPDAGLQPDGAFSVHLFLWSTTPSRGRQGIASRWNDERQSGWNLAIEDGRVVFTIGDGSGATSSVVSDRPLFQQIWYSITGVYDPEKKQLRLYQKSVVNRTNSRFGLVVPLDSDCAVSADATVKAADSETSLLIAGLGEAAAQDGRTWCIAHYNGKVDAPKIYGCALGQDDAEKLSRGEIVRPISRLAHWDFSAGIGLNGIPTDHVVDASGYGHHGRCMNQPSRGSTGWNWDGHEENFIHCPEQYGALWFHEDCLDDCRWEKDFEFTVPEGLKSDFYAVKIRYEDTEDYIPFFVLPPRGTATAPILVIASTLSYLAYANEQIMHKADIGQAVAGHTPVLNENDVELHKNLSYYGLSTYDGHIDGRGVQYTSWRRPIMNLRPKHRQGFGSIWELPADLHLIDWLNHNGFEYDVATEHDLNDQGAELLRRYKVVLTGSHPEYQTWANADAWEDYLADGGRGMYLAANGMYWIVEVHPEKPWVMEVRKELGVTAWEAPPGEYHYSTNGRRGGRFRGRARATQKIWGTGMSSFGFDHSGYFVQMPDSQDERVAWIMEGIDPEERIGDGGLVGGGAGGYELDRYDLALGTPPNTLLLASSVEHSVVYTVIPDDKAFPHPGMNGGEHPFVRADITYFSTANGGGMFATSSISWLGSLSWNDYDNNVSKMTKNVLNQFIKDEPAPRVKLAAALEHHHHHH\n>1esb_A mol:protein length:240  PORCINE PANCREATIC ELASTASE\nVVGGTEAQRNSWPSQISLQYRSGSSWAHTCGGTLIRQNWVMTAAHCVDRELTFRVVVGEHNLNQNNGTEQYVGVQKIVVHPYWNTDDVAAGYDIALLRLAQSVTLNSYVQLGVLPRAGTILANNSPCYITGWGLTRTNGQLAQTLQQAYLPTVDYAICSSSSYWGSTVKNSMVCAGGDGVRSGCQGDSGGPLHCLVNGQYAVHGVTSFVSRLGCNVTRKPTVFTRVSAYISWINNVIASN\n>3wry_B mol:protein length:431  Tm-1 protein\nMATAQSNSPRVFCIGTADTKFDELRFLSEHVRSSLNSFSNKSSFKVGVTVVDVSTSWKETNSCADFDFVPSKDVLSCHTLGEETMGTFADTRGLAIAIMSKALETFLSIANDEQNLAGVIGLGGSGGTSLLSSAFRSLPIGIPKVIISTVASGQTESYIGTSDLVLFPSVVDICGINNVSKVVLSNAGAAFAGMVIGRLESSKEHSITNGKFTVGVTMFGVTTPCVNAVKERLVKEGYETLVFHATGVGGRAMEDLVRGGFIQGVLDITTTEVADYVVGGVMACDSSRFDAILEKKIPLVLSVGALDMVNFGPKTTIPPEFQQRKIHEHNEQVSLMRTTVGENKKFAAFIAEKLNKASSSVCVCLPEKGVSALDAPGKDFYDPEATSCLTRELQMLLENNERCQVKVLPYHINDAEFANALVDSFLEISPK\n>4i55_F mol:protein length:384  Tubulin tyrosine ligase, 
TTL\nMYTFVVRDENSSVYAEVSRLLLATGQWKRLRKDNPRFNLMLGERNRLPFGRLGHEPGLVQLVNYYRGADKLCRKASLVKLIKTSPELSESCTWFPESYVIYPTNLKTPVAPAQNGIRHLINNTRTDEREVFLAAYNRRREGREGNVWIAKSSAGAKGEGILISSEASELLDFIDEQGQVHVIQKYLEKPLLLEPGHRKFDIRSWVLVDHLYNIYLYREGVLRTSSEPYNSANFQDKTCHLTNHCIQKEYSKNYGRYEEGNEMFFEEFNQYLMDALNTTLENSILLQIKHIIRSCLMCIEPAISTKHLHYQSFQLFGFDFMVDEELKVWLIEVNGAPACAQKLYAELCQGIVDVAISSVFPLADTGQKTSQPTSIFIKLHHHHHH\n>3dal_B mol:protein length:196  PR domain zinc finger protein 1\nSSGLVPRGSKKMDMEDADMTLWTEAEFEEKCTYIVNDHPWDSGADGGTSVQAEASLPRNLLFKYATNSEEVIGVMSKEYIPKGTRFGPLIGEIYTNDTVPKNANRKYFWRIYSRGELHHFIDGFNEEKSNWMRYVNPAHSPREQNLAACQNGMNIYFYTIKPIPANQELLVWYCRDFAERLHYPYPGELTMMNLTQ\n>6pjj_A mol:protein length:351  Serine/threonine-protein kinase PRP4 homolog\nSMDFKENPNLRDNWTDAEGYYRVNIGEVLDKRYNVYGYTGQGVFSNVVRARDNARANQEVAVKIIRNNELMQKTGLKELEFLKKLNDADPDDKFHCLRLLRHFYHKQHLCLVFEPLSMNLREVLKKYGKDVGLHIKAVRSYSQQLFLALKLLKRCNILHADIKPDNILVNESKTILKLCDFGSASHVADNDITPYLFSRFYRAPEIIIGKSYDYGIDMWSVGCTLYELYTGKILFPGKTNNHMLKLAMDLKGKMPNKMIRKGVFKDQHFDQNLNFMYIEVDKVTEREKVTVMSTINPTKDLLADLIGCQRLPEDQRKKVHQLKDLLDQILMLDPAKRISINQALQHAFIQE\n>7ajb_AO mol:protein length:75  ATP synthase F(0) complex subunit C2, mitochondrial\nDIDTAAKFIGAGAATVGVAGSGAGIGTVFGSLIIGYARNPSLKQQLFSYAILGFALSEAMGLFCLMVAFLILFAM\n>7a4g_FI mol:protein length:197  Antitermination protein N,6,7-dimethyl-8-ribityllumazine synthase,6,7-dimethyl-8-ribityllumazine synthase\nMGNAKTRRRERRAEKQAQWKAANAGAGAGAMATPHFDYIASEVSKGLANLSLELRKPITFGVITADTLEQAIERAGTKHGNKGWEAALSAIEMANLFKSLRGTGHHHHHHGSSMEIYEGKLTAEGLRFGIVASRFNHALVDRLVEGAIDCIVRHGGREEDITLVRVPGSWEIPVAAGELARKEDIDAVIAIGVLIRG\n>6r8h_E mol:protein length:250  Triosephosphate isomerase\nASNRKFFVGGNWKMNGSKESNQKLLKTLSDAKPDANTEILVAVPFVYLKDVREHLDKRFHVAAQNCYKVASGAFTGEISPAMIRDCGCEWVILGHSERRHIFGESDELIGEKVNHALTCGLKVVPCIGEKLDEREAGKTEQVCFRQLDAIKKGIPKAEDWSRVVIAYEPVWAIGTGKTASPEQAQEVHHAVRQWLEKNVSQAVASSLRITYGGSVTAANCKELAKKPDVDGFLVGGASLKPEFVDICNAN\n>7of2_U mol:protein length:153  39S ribosomal protein L23, 
mitochondrial\nMARNVVYPLYRLGGPQLRVFRTNFFIQLVRPGVAQPEDTVQFRIPMEMTRVDLRNYLEGIYNVPVAAVRTRVQHGSNKRRDHRNVRIKKPDYKVAYVQLAHGQTFTFPDLFPEKDESPEGSAADDLYSMLEEERQQRQSSDPRRGGVPSWFGL\n>1xa6_A mol:protein length:466  Beta2-chimaerin\nMRLLSSLSGSSVSSDAEEYQPPIWKSYLYQLQQEAPRPKRIICPREVENRPKYYGREFHGIISREQADELLGGVEGAYILRESQRQPGCYTLALRFGNQTLNYRLFHDGKHFVGEKRFESIHDLVTDGLITLYIETKAAEYISKMTTNPIYEHIGYATLLREKVSRRLSRSKNEPRKTNVTHEEHTAVEKISSLVRRAALTHNDNHFNYEKTHNFKVHTFRGPHWCEYCANFMWGLIAQGVRCSDCGLNVHKQCSKHVPNDCQPDLKRIKKVYCCDLTTLVKAHNTQRPMVVDICIREIEARGLKSEGLYRVSGFTEHIEDVKMAFDRDGEKADISANVYPDINIITGALKLYFRDLPIPVITYDTYSKFIDAAKISNADERLEAVHEVLMLLPPAHYETLRYLMIHLKKVTMNEKDNFMNAENLGIVFGPTLMRPPEDSTLTTLHDMRYQKLIVQILIENEDVLF\n>6y9i_BBB mol:protein length:292  Major Capsid Protein VP1\nGSHMGGVEVLNIITGPDSTTEIELYLEPRMGINSPTGDKKEWYGYSEVIHHADGYDNNLLSIQMPQYSCARVQLPMLNTDMTSDTLMMWEAVSCKTEIVGIGSLISVHLLEAKMAAKEGGDGPSQPIEGMNYHMFAVGGEPLDLQGIESNALTKYASAIPPKTIHPNDIAKLAEEEKPQLQGLVPKAKARLDKDGFYPIEEWSPDPSRNENSRYFGSFVGGLNTPPNLQFTNAVTTVLLDENGVGPLCKGDGLFVSAADICGVMVKADNEAIRYRGLPRYFKVTLRKRAVKN\n>5hrm_B mol:protein length:504  Haloalkylphosphorus hydrolase\nQVVIGPGDRPETGLQGQTTIEDVVSGRSKLPYHAGVRLVGRTDIWNRGGNLQLSWVDQCAYVSTFKQAGPITANSRSALFLREPAGVAVIDVRDPRAPKPVRLLRDRGSIDAVETMHAIAAPGRKVLVAGAYSGGIAGRGEEDAAWLSIYDASNCLNPKLQSEFKWPANIHMVTISPNGRRVYGTEVVPGLGSGKGGLHVLDISDMKRPRYLGRFGVTRPNGLTAGFTPHEVSISHDERRIYAAVLASETGDVPVGASILASDGDVPVENGSVYILDNSDIVDGRSQPKMRLVGEAKQGGFHSVVPASINGVPHLVGAAELGACPGTWPRIINIADEKNPKIVGEFKLQMNIKENCDAIRFTPRKEDPYASFIPIPDITARLGAVGSHFNDVDDARNTRLGLFPFFAGGVRIVDLRDPTKPVEVGYYKPGANPDTPLSGNGLNWTGLNDQVTDGCMSHVRYVPESGHIWFACVTTGFHVVELNPDLRARLGFPTVKLEHHHHHH\n>1s5c_F mol:protein length:103  cholera enterotoxin B-subunit\nTPQNITDLCAEYHNTQIHTLNDKIFSYTESLAGKREMAIITFKNGATFQVEVPGSQHIDSQKKAIERMKDTLRIAYLTEAKVEKLCVWNNKTPHAIAAISMAN\n>3nvv_K mol:protein length:334  Xanthine 
dehydrogenase/oxidase\nLFNPEEFMPLDPTQEPIFPPELLRLKDVPPKQLRFEGERVTWIQASTLKELLDLKAQHPEAKLVVGNTEIGIEMKFKNQLFPMIICPAWIPELNAVEHGPEGISFGAACALSSVEKTLLEAVAKLPTQKTEVFRGVLEQLRWFAGKQVKSVASLGGNIITASPISDLNPVFMASGTKLTIVSRGTRRTVPMDHTFFPSYRKTLLGPEEILLSIEIPYSREDEFFSAFKQASRREDDIAKVTCGMRVLFQPGSMQVKELALCYGGMADRTISALKTTQKQLSKFWNEKLLQDVCAGLAEELSLSPDAPGGMIEFRRTLTLSFFFKFYLTVLKKLG\n>6lum_G mol:protein length:138  Succinate dehydrogenase subunit C\nMSTQTEVPAPQPKKTRRRTLYRGDPGMWSWVLHRITGATIFFFLFVHVLDTALVRVSPQAYNEVIETYKTPIVGLMEIGLVAAVLFHALNGIRVILIDFWAKGPRYQRQMLAVIAGLFLVIFIAAVGVIGMHMVERFL\n>1vav_B mol:protein length:222  Alginate lyase PA1167\nPDLSTWNLTIPQGRPAITISTSQLQRDYRSDYFQRTADGIRFWVPVNGSHTRNSEFPRSELRETLSSGRPYNWRYARADNWLEATLRIEAVPSTRRMIIGQIHSDGSNSGQAAPLVKLLYQLRLDQGRVQALVRERPDDGGTRAYTLMDGIPLGQPFSYRIGVSRSGLLSVSVNGSALEQQLDPQWAYQGLYFKAGLYLQDNRGPSSEGGRATFSELRVSHQ\n>3q6e_A mol:protein length:21  Insulin A chain\nGIVEQCCTSICSLYQLENYCN\n>4s17_F mol:protein length:481  Glutamine synthetase\nSNAMTALETKADAEALINKEGIEYVSVRFTDLIGVQQHFTVPASEFLKDAFTDGMPFDGSSVEGFQAINESDMKLVPDVSTAFIDPFRKHKTLDVAFSIVDPLTDEPYSRDPRQVAGKAEAYLKSTGIADTASFAPEAEFFIFDKVRFENSMQRSFYEVDSIEAPWNSGIDTEDDGTPNIAFKNRVKKGYFPVPPIDHTQDLRDDMVANLQKVGLILERSHHEVAGAGQQEINYRFNSLQHAGDDLMKYKYVVHETAALAGKAATFMPKPIAGDNGTGMHCHQSLWKDGKPLFYDEKNYGGLSDLARWYIGGLIKHSSSVLAFTNPSLNSYHRLVPGFEAPVNLVYSARNRSAAIRIPLAGTSPAAKRIEFRAPDPSCNPFLAFSAQLMAGLDGILNHIEPPAPVDKDLYELPPEEHAGIKQVPSSLAEAMDALEEDHDFLTAGDVFTDDLIDTWISIKRGEIDQARLAPTPLEYELYFHI\n>4dv4_D mol:protein length:209  ribosomal protein S4\nMGRYIGPVCRLCRREGVKLYLKGERCYSPKCAMERRPYPPGQHGQKRARRPSDYAVRLREKQKLRRIYGISERQFRNLFEEASKKKGVTGSVFLGLLESRLDNVVYRLGFAVSRRQARQLVRHGHITVNGRRVDLPSYRVRPGDEIAVAEKSRNLELIRQNLEAMKGRKVGPWLSLDVEGMKGKFLRLPDREDLALPVNEQLVIEFYSR\n>3zv2_A mol:protein length:320  Tyrosine-protein phosphatase non-receptor type 
1\nMEMEKEFEQIDKSGSWAAIYQDIRHEASDFPCRVAKLPKNKNRNRYRDVSPFDHSRIKLHQEDNDYINASLIKMEEAQRSYILTQGPLPNTCGHFWEMVWEQKSRGVVMLNRVMEKGSLKCAQYWPQKEEKEMIFEDTNLKLTLISEDIKSYYTVRQLELENLTTQETREILHFHYTTWPDFGVPESPASFLNFLFKVRESGSLSPEHGPVVVHAAAGIGRSGTFCLADTCLLLMDKRKDPSSVDIKKVLLEMRKFRMGLIQTADQLRFSYLAVIEGAKFIMGDSSVQDQWKELSHEDLEPPPEHIPPPPRPPKRILEPH\n>4lyc_A mol:protein length:129  Lysozyme C\nKVFGRCELAAAMKRHGLDNYRGYSLGNWVCAAKFESNFNTQATNRNTDGSTDYGILQINSRWWCNDGRTPGSRNLCNIPCSALLSSDITASVNCAKKIVSDGNGMNAWVAWRNRCKGTDVQAWIRGCRL\n>6gaw_Bp mol:protein length:112  mL53\nMAAALARLGLRAVKQVRVQFCPFEKNVESTRTFLQAVSSEKVRCTNLNCSVIADVRHDGSEPCVDVLFGDGHRLIMRGAHLTAQEMLTAFASHIQARGAAASGDKPSASTGR\n>3bvb_B mol:protein length:99  Protease (Retropepsin)\nPQITLWKRPLVTIKIGGQLKEALLNTGADDTVIEEMSLPGRWKPKMIGGIGGFIKVRQYDQIIIEIAGHKAIGTVLVGPTPVNIIGRNLLTQIGATLNF\n>5djb_E mol:protein length:99  Microcompartments protein\nMADALGMIEVRGFVGMVEAADAMVKAAKVELIGYEKTGGGYVTAVVRGDVAAVKAATEAGQRAAERVGEVVAVHVIPRPHVNVDAALPLGRTPGMDKSA\n>6jpa_F mol:protein length:1046  Voltage-dependent calcium channel subunit 
alpha-2/delta-1\nFPSAVTIKSWVDKMQEDLVTLAKTASGVHQLVDIYEKYQDLYTVEPNNARQLVEIAARDIEKLLSNRSKALVRLALEAEKVQAAHQWREDFASNEVVYYNAKDDLDPEKNDSEPGSQRIKPVFIDDANFRRQVSYQHAAVHIPTDIYEGSTIVLNELNWTSALDDVFKKNREEDPSLLWQVFGSATGLARYYPASPWVDNSRTPNKIDLYDVRRRPWYIQGAASPKDMLILVDVSGSVSGLTLKLIRTSVSEMLETLSDDDFVNVASFNSNAQDVSCFQHLVQANVRNKKVLKDAVNNITAKGITDYKKGFSFAFEQLLNYNVSRANCNKIIMLFTDGGEERAQEIFAKYNKDKKVRVFTFSVGQHNYDRGPIQWMACENKGYYYEIPSIGAIRINTQEYLDVLGRPMVLAGDKAKQVQWTNVYLDALELGLVITGTLPVFNITGQFENKTNLKNQLILGVMGVDVSLEDIKRLTPRFTLCPNGYYFAIDPNGYVLLHPNLQPKPIGVGIPTINLRKRRPNVQNPKSQEPVTLDFLDAELENDIKVEIRNKMIDGESGEKTFRTLVKSQDERYIDKGNRTYTWTPVNGTDYSLALVLPTYSFYYIKAKIEETITQARYSETLKPDNFEESGYTFLAPRDYCSDLKPSDNNTEFLLNFNEFIDRKTPNNPSCNTDLINRVLLDAGFTNELVQNYWSKQKNIKGVKARFVVTDGGITRVYPKEAGENWQENPETYEDSFYKRSLDNDNYVFTAPYFNKSGPGAYESGIMVSKAVEIYIQGKLLKPAVVGIKIDVNSWIENFTKTSIRDPCAGPVCDCKRNSDVMDCVILDDGGFLLMANHDDYTNQIGRFFGEIDPSLMRHLVNISVYAFNKSYDYQSVCEPGAAPKQGAGHRSAYVPSIADILQIGWWATAAAWSILQQFLLSLTFPRLLEAADMEDDDFTASMSKQSCITEQTQYFFDNDSKSFSGVLDCGNCSRIFHVEKLMNTNLIFIMVESKGTCPCDTRLLIQAEQTSDGPDPCDMVKQPRYRKGPDVCFDNNVLEDYTDCG\n>2zoq_A mol:protein length:382  Mitogen-activated protein kinase 3\nLGSMAAAAAQGGGGGEPRRTEGVGPGVPGEVEMVKGQPFDVGPRYTQLQYIGEGAYGMVSSAYDHVRKTRVAIKKISPFEHQTYCQRTLREIQILLRFRHENVIGIRDILRASTLEAMRDVYIVQDLMETDLYKLLKSQQLSNDHICYFLYQILRGLKYIHSANVLHRDLKPSNLLINTTCDLKICDFGLARIADPEHDHTGFLTEYVATRWYRAPEIMLNSKGYTKSIDIWSVGCILAEMLSNRPIFPGKHYLDQLNHILGILGSPSQEDLNCIINMKARNYLQSLPSKTKVAWAKLFPKSDSKALDLLDRMLTFNPNKRITVEEALAHPYLEQYYDPTDEPVAEEPFTFAMELDDLPKERLKELIFQETARFQPGVLEAP\n>6pee_K mol:protein length:562  Protein 
InvG\nMKTHILLARVLACAALVLVTPGYSSEKIPVTGSGFVAKDDSLRTFFDAMALQLKEPVIVSKMAARKKITGNFEFHDPNALLEKLSLQLGLIWYFDGQAIYIYDASEMRNAVVSLRNVSLNEFNNFLKRSGLYNKNYPLRGDNRKGTFYVSGPPVYVDMVVNAATMMDKQNDGIELGRQKIGVMRLNNTFVGDRTYNLRDQKMVIPGIATAIERLLQGEEQPLGNIVSSEPPAMPAFSANGEKGKAANYAGGMSLQEALKQNAAAGNIKIVAYPDTNSLLVKGTAEQVHFIEMLVKALDVAKRHVELSLWIVDLNKSDLERLGTSWSGSITIGDKLGVSLNQSSISTLDGSRFIAAVNALEEKKQATVVSRPVLLTQENVPAIFDNNRTFYTKLIGERNVALEHVTYGTMIRVLPRFSADGQIEMSLDIEDGNDKTPQSDTTTSVDALPEVGRTLISTIARVPHGKSLLVGGYTRDANTDTVQSIPFLGKLPLIGSLFRYSSKNKSNVVRVFMIEPKEIVDPLTPDASESVNNILKQSGAWSGDDKLQKWVRVYLDRGQEAIK\n>6zg6_C mol:protein length:1273  Protein transport protein SEC31\nMVKLAEFSRTATFAWSHDKIPLLVSGTVSGTVDANFSTDSSLELWSLLAADSEKPIASLQVDSKFNDLDWSHNNKIIAGALDNGSLELYSTNEANNAINSMARFSNHSSSVKTVKFNAKQDNVLASGGNNGEIFIWDMNKCTESPSNYTPLTPGQSMSSVDEVISLAWNQSLAHVFASAGSSNFASIWDLKAKKEVIHLSYTSPNSGIKQQLSVVEWHPKNSTRVATATGSDNDPSILIWDLRNANTPLQTLNQGHQKGILSLDWCHQDEHLLLSSGRDNTVLLWNPESAEQLSQFPARGNWCFKTKFAPEAPDLFACASFDNKIEVQTLQNLTNTLDEQETETKQQESETDFWNNVSREESKEKPSVFHLQAPTWYGEPSPAAHWAFGGKLVQITPDGKGVSITNPKISGLESNTTLSEALKTKDFKPLINQRLVKVIDDVNEEDWNLLEKLSMDGTEEFLKEALAFDNDESDAQDDANNEKEDDGEEFFQQIETNFQPEGDFSLSGNIEQTISKNLVSGNIKSAVKNSLENDLLMEAMVIALDSNNERLKESVKNAYFAKYGSKSSLSRILYSISKREVDDLVENLDVSQWKFISKAIQNLYPNDIAQRNEMLIKLGDRLKENGHRQDSLTLYLAAGSLDKVASIWLSEFPDLEDKLKKDNKTIYEAHSECLTEFIERFTVFSNFINGSSTINNEQLIAKFLEFINLTTSTGNFELATEFLNSLPSDNEEVKTEKARVLIASGKSLPAQNPATATTSKAKYTNAKTNKNVPVLPTPGMPSTTSIPSMQAPFYGMTPGASANALPPKPYVPATTTSAPVHTEGKYAPPSQPSMASPFVNKTNSSTRLNSFAPPPNPYATATVPATNVSTTSIPQNTFAPIQPGMPIMGDYNAQSSSIPSQPPINAVSGQTPHLNRKANDGWNDLPLKVKEKPSRAKAVSVAPPNILSTPTPLNGIPANAASTMPPPPLSRAPSSVSMVSPPPLHKNSRVPSLVATSESPRASISNPYAPPQSSQQFPIGTISTANQTSNTAQVASSNPYAPPPQQRVATPLSGGVPPAPLPKASNPYAPTATTQPNGSSYPPTGPYTNNHTMTSPPPVFNKPPTGPPPISMKKRSNKLASIEQNPSQGATYPPTLSSSASPLQPSQPPTLASQVNTSAENVSHEIPADQQPIVDFLKEELARVTPLTPKEYSKQLKDCDKRLKILFYHLEKQDLLTQPTIDCLHDLVALMKEKKYKEAMVIHANIATNHAQEGGNWLTGVKRLIGIAEATLN\n>6v00_F mol:protein length:355  MCherry fluorescent protein,Potassium voltage-gated 
channel subfamily E member 3\nGGMVSKGEEDNMAIIKEFMRFKVHMEGSVNGHEFEIEGEGEGRPYEGTQTAKLKVTKGGPLPFAWDILSPQFMYGSKAYVKHPADIPDYLKLSFPEGFNWERVMNFEDGGVVTVTQDSSLQDGEFIYKVKLRGTNFPSDGPVMQCRTMGWEASTERMYPEDGALKGEIKQRLKLKDGGHYDAEVKTTYKAKKPVQLPGAYNVDIKLDILSHNEDYTIVEQYERAEGRHSTGGMDELYKGSGENLYFQSSRATMETTNGTETWYESLHAVLKALNATLHSNLLCRPGPGLGPDNQTEERRASLPGRDDNSYMYILFVMFLFAVTVGSLILGYTRSRKVDKRSDPYHVYIKNRVSMI\n>5a15_L mol:protein length:120  BTB/POZ DOMAIN-CONTAINING PROTEIN KCTD16\nSMGSAVPNSFPEVVELNVGGQVYFTRHSTLISIPHSLLWKMFSPKRDTANDLAKDSKGRFFIDRDGFLFRYILDYLRDRQVVLPDHFPEKGRLKREAEYFQLPDLVKLLTPDEIKQSPDE\n>4k6a_B mol:protein length:279  Triosephosphate isomerase\nMHHHHHHSSGVDLGTENLYFQSNAMRHPLVMGNWKLNGSRHMVHELVSNLRKELAGVAGCAVAIAPPEMYIDMAKREAEGSHIMLGAQNVDLNLSGAFTGETSAAMLKDIGAQYIIIGHSERRTYHKESDELIAKKFAVLKEQGLTPVLCIGETEAENEAGKTEEVCARQIDAVLKTQGAAAFEGAVIAYEPVWAIGTGKSATPAQAQAVHKFIRDHIAKVDANIAEQVIIQYGGSVNASNAAELFAQPDIDGALVGGASLKADAFAVIVKAAEAAKQA\n>4yzv_QL mol:protein length:132  30S ribosomal protein S12\nMPTINQLVRKGREKVRKKSKVPALKGAPFRRGVCTVVRTVTPKKPNSALRKVAKVRLTSGYEVTAYIPGEGHNLQEHSVVLIRGGRVKDLPGVRYHIVRGVYDAAGVKDRKKSRSKYGTKKPKEAAKTAAKK\n>5iia_D mol:protein length:129  Vitelline envelope sperm lysin receptor\nAQTNAAADWDVYCSQDESIPAKFISRLVTSKDQALEKTEINCSNGLVPITQEFGINMMLIQYTRNELLDSPGMCVFWGPYSVPKNDTVVLYTVTARLKWSEGPPTNLSIQCYMPKSPVAPKLEHHHHHH\n>7br8_y mol:protein length:176  Small capsomere-interacting protein\nMARRLPKPTLQGRLEADFPDSPLLPKFQELNQNNLPNDVFREAQRSYLVFLTSQFCYEEYVQRTFGVPRRQRAIDKRQRASVAGAGAHAHLGGSSATPVQQAQAAASAGTGALASSAPSTAVAQSATPSVSSSISSLRAATSGATAAASAAAAVDTGSGGGGQPHDTAPRGARKKQ\n>1aql_A mol:protein length:532  BILE-SALT ACTIVATED 
LIPASE\nAKLGSVYTEGGFVEGVNKKLSLFGDSIDIFKGIPFAAAPKALEKPERHPGWQGTLKAKSFKKRCLQATLTQDSTYGNEDCLYLNIWVPQGRKEVSHDLPVMIWIYGGAFLMGASQGANFLSNYLYDGEEIATRGNVIVVTFNYRVGPLGFLSTGDSNLPGNYGLWDQHMAIAWVKRNIEAFGGDPDNITLFGESAGGASVSLQTLSPYNKGLIKRAISQSGVGLCPWAIQQDPLFWAKRIAEKVGCPVDDTSKMAGCLKITDPRALTLAYKLPLGSTEYPKLHYLSFVPVIDGDFIPDDPVNLYANAADVDYIAGTNDMDGHLFVGMDVPAINSNKQDVTEEDFYKLVSGLTVTKGLRGANATYEVYTEPWAQDSSQETRKKTMVDLETDILFLIPTKIAVAQHKSHAKSANTYTYLFSQPSRMPIYPKWMGADHADDLQYVFGKPFATPLGYRAQDRTVSKAMIAYWTNFARTGDPNTGHSTVPANWDPYTLEDDNYLEINKQMDSNSMKLHLRTNYLQFWTQTYQALPTV\n>2acl_C mol:protein length:238  Retinoic acid receptor RXR-alpha\nSANEDMPVERILEAELAVEPKTETYVEANMGLNPSSPNDPVTNICQAADKQLFTLVEWAKRIPHFSELPLDDQVILLRAGWNELLIASFSHRSIAVKDGILLATGLHVHRNSAHSAGVGAIFDRVLTELVSKMRDMQMDKTELGCLRAIVLFNPDSKGLSNPAEVEALREKVYASLEAYCKHKYPEQPGRFAKLLLRLPALRSIGLKCLEHLFFFKLIGDTPIDTFLMEMLEAPHQMT\n>7p1t_J mol:protein length:265  29 kDa antigen, Cfp29\nMNNLYRDLAPVTEAAWAEIELEAARTFKRHIAGRRVVDVSDPGGPVTAAVSTGRLIDVKAPTNGVIAHLRASKPLVRLRVPFTLSRNEIDDVERGSKDSDWEPVKEAAKKLAFVEDRTIFEGYSAASIEGIRSASSNPALTLPEDPREIPDVISQALSELRLAGVDGPYSVLLSADVYTKVSETSDHGYPIREHLNRLVDGDIIWAPAIDGAFVLTTRGGDFDLQLGTDVAIGYASHDTDTVRLYLQETLTFLCYTAEASVALSH\n>7pk6_K mol:protein length:758  Biodegradative arginine 
decarboxylase\nMRALIVYTELTDKDSVISHAVARLASELNDEHVETVIIRDFEDGLAYIRSNTSIDCLLYGRDMSDRDEQIQAHRLITQLHRRQEDVPVFLLSDREEALVAFDRNMMEQVDEFAWILEDSADFIAGRVLAAIQRYRSQLLPPLMKSLIKYSDVHEYSWAAPGHQGGVGFTKTPAGRIYHDFFGENLFRTDIGIERVAVGSLLDHTGAFGECEKNAARIFGADQSYSVVVGTSGSNRTIMQACMTDDDVVVIDRNCHKSIEQGLILTGAKPVYMIPSRNRYGIIGPIYPKEMTPDAIKFKIAANPLTKGKVKQKPAYSVVTNCTYDGVCYNARKVQDLLDGSLDRIHFDEAWYGYARFNPLYRNHFAMRDEERTENEPTIFATHSTHKLLNALSQASFIHVRNGRNAIDFNRFNQAYLMHSTTSPLYAICASNDIAADMMDGNSGRSLTDEVIRESIDFRQSLAYLYKEFLNDDEWFFKPWNQEMVKDPATGKRYAFEDAPVELLMREQSCWVMHPEDKWHGFNDIPDNWAMLDPIKVSILAPGMGDDGKLLDTGVPAALVTAWLNHYGIVPTRTTDFQIMFLFSMGITKGKWGTLVNTLLSFKRHYDNNTALKKVLPEVVASAPEIYGEMGLRDLGDKMFAYLQKNNPGARLNQAYSQLPQVMMTPRDAYQQIVANRVEAVPVDQLMGRVAANSIIPYPPGIPMLLSGENFGDENSPHIHYLRSLQAWDSEFPGFEHETEGTEIIDGQYYVMCVKTCDE\n>3pvg_A mol:protein length:331  Casein kinase II subunit alpha\nSKARVYADVNVLRPKEYWDYEALTVQWGEQDDYEVVRKVGRGKYSEVFEGINVNNNEKCIIKILKPVKKKKIKREIKILQNLCGGPNIVKLLDIVRDQHSKTPSLIFEYVNNTDFKVLYPTLTDYDIRYYIYELLKALDYCHSQGIMHRDVKPHNVMIDHELRKLRLIDWGLAEFYHPGKEYNVRVASRYFKGPELLVDLQDYDYSLDMWSLGCMFAGMIFRKEPFFYGHDNHDQLVKIAKVLGTDGLNVYLNKYRIELDPQLEALVGRHSRKPWLKFMNADNQHLVSPEAIDFLDKLLRYDHQERLTALEAMTHPYFQQVRAAENSRTRA\n>2bcb_A mol:protein length:75  CALBINDIN D9K\nKSPEELKGIFEKYAAKEGDPNQLSKEELKLLLQTEFPSLLKGGSTLDELFEELDKNGDGEVSFEEFQVLVKKISQ\n>6w6c_B mol:protein length:313  Probable dimethyladenosine transferase\nMPKVKSGAIGRRRGRQEQRRELKSAGGLMFNTGIGQHILKNPLIINSIIDKAALRPTDVVLEVGPGTGNMTVKLLEKAKKVVACELDPRLVAELHKRVQGTPVASKLQVLVGDVLKTDLPFFDTCVANLPYQISSPFVFKLLLHRPFFRCAILMFQREFALRLVAKPGDKLYCRLSINTQLLARVDHLMKVGKNNFRPPPKVESSVVRIEPKNPPPPINFQEWDGLVRITFVRKNKTLSAAFKSSAVQQLLEKNYRIHCSVHNIIIPEDFSIADKIQQILTSTGFSDKRARSMDIDDFIRLLHGFNAEGIHFS\n>4pbp_B mol:protein length:210  C-reactive protein\nMEFFKNLSGKVLQFKTATDNSYVKLYPEKPLSLSAFTLCMRVATELPLDREVILFAYYTPDVDELNVWRERDGRVSLYIQSSKDAAFFRLPPLSTLQTHLCVAWESATGLTAFWMDGRRSLHQVYRKGYSIRSGGTVVLGQDPDSYVGSFDVDQSFVGEIANLQMWDYVLSSAQIKAVYYNQDNRVKGNVFDWDTIEYDVTGNVLVVPDN\n>3pdg_A mol:protein length:98  Fibronectin(III)-like 
module\nMVTIDSPVAGERFEAGKDINISATVKSKTPVSKVEFYNGDTLISSDTTAPYTAKITGAAVGAYNLKAVAVLSDGRRIESPVTPVLVKVIVLEHHHHHH\n>1ttv_A mol:protein length:107  Ubiquitin-protein ligase E3 Mdm2\nNHISTSDQEKLVQPTPLLLSLLKSAGAQKETFTMKEVLYHLGQYIMAKQLYDEKQQHIVHCSNDPLGELFGVQEFSVKEHRRIYAMISRNLVSANVKESSEDIFGNV\n>6mux_Z mol:protein length:211  20S proteasome beta-5 subunit\nTTTLAFKFKDGIIVAVDSRASMGSFISSQNVEKIIEINKNILGTMAGGAADCLYWEKYLGKIIKIYELRNNEKISVRAASTILSNILYQYKGYGLCCGIILSGYDHTGFNMFYVDDSGKKVEGNLFSCGSGSTYAYSILDSAYDYNLNLDQAVELARNAIYHATFRDGGSGGKVRVFHIHKNGYDKIIEGEDVFDLHYHYTNPEQKDQYVM\n>4wiz_CB mol:protein length:338  Coat protein\nMVRKGEKKLAKPATTKAANPQPRRRANNRRRSNRTDAPVSKASTVTGFGRGTNDVHLSGMSRISQAVLPAGTGTDGYVVVDATIVPDLLPRLGHAARIFQRYAVETLEFEIQPMCPANTGGGYVAGFLPDPTDNDHTFDALQATRGAVVAKWWESRTVRPQYTRTLLWTSSGKEQRLTSPGRLILLCVGNNTDVVNVSVLCRWSVRLSVPSLENPEETTAPIMTQGSLYNDSLSTNDFKSILLGSTPLDIAPDGAVFQLDRPLSIDYSLGTGDVDRAVYWHLKKFAGNAGTPAGWFRWGIWDNFNKTFTDGVAYYSDEQPRQILLPVGTVCTRVDSEN\n>6b55_D mol:protein length:48  Flower-specific defensin\nARECKTESNTFPGICITKPPCRKACISEKFTDGHCSKILRRCLCTKPC\n>4hnp_L mol:protein length:222  Proteasome component C5\nQFNPYGDNGGTILGIAGEDFAVLAGDTRNITDYSINSRYEPKVFDCGDNIVMSANGFAADGDALVKRFKNSVKWYHFDHNDKKLSINSAARNIQHLLYGKRFFPYYVHTIIAGLDEDGKGAVYSFDPVGSYEREQCRAGGAAASLIMPFLDNQVNFKNQYEPGTNGKVKKPLKYLSVEEVIKLVRDSFTSATERHIQVGDGLEILIVTKDGVRKEFYELKRD\n>3i4e_B mol:protein length:439  Isocitrate lyase\nGPGSMSRQQQAQELQKQWETDPRWKGIKRAFTAEDVVRLRGSIQQEHTLAKRGAEKLWTLINNEPFVNALGALTGNQAMQQVKAGLKAIYLSGWQVAGDANVAGEMYPDQSLYPANSVPLVVKRINNTLTRADQIQWSEGKNPGDEGYVDFFAPIVADAEAGFGGVLNAFELMKAMIEAGASGVHFEDQLASVKKCGHMGGKVLVPTREAVAKLTAARLAADVMGTPTVLVARTDAEAADLITSDIDDNDKPYLTGERTVEGFFRTKPGLEQAISRGLAYAPYADLIWCETGKPDLEYAKKFAEAIHKQFPGKLLSYNCSPSFNWKKNLDDATIAKFQKELGAMGYKFQFITLAGFHALNYSMFNLAHGYARTQMSAFVELQQAEFAAADKGFTAVKHQREVGTGYFDAVTQTVEREASTTALHGSTEDEQFFDGQKVA\n>1s89_C mol:protein length:152  Methylglyoxal 
synthase\nMELTTRTLPARKHIALVAHDHCKQMLMSWVERHQPLLEQHVLYATGTTGNLISRATGMNVNAMLSGPMGGDQQVGALISEGKIDVLIFFWDPLNAVPNDPDVKALLRLATVWNIPVATNVATADFIIQSPHFNDAVDILIPDYQRYLADRLK\n>7az7_H mol:protein length:6  Peptide 37\nXQAXLF\n>4elf_B mol:protein length:166  Dihydrofolate reductase\nMIVSFMVAMDENRVIGKDNNLPWRLPSELQYVKKTTMGHPLIMGRKNYEAIGRPLPGRRNIIVTRNEGYHVEGCEVAHSVEEVFELCKNEEEIFIFGGAQIYDLFLPYVDKLYITKIHHAFEGDTFFPEMDMTNWKEVFVEKGLTDEKNPYTYYYHVYEKQQLVPR\n>4ji2_B mol:protein length:256  RIBOSOMAL PROTEIN S2\nMPVEITVKELLEAGVHFGHERKRWNPKFARYIYAERNGIHIIDLQKTMEELERTFRFIEDLAMRGGTILFVGTKKQAQDIVRMEAERAGMPYVNQRWLGGMLTNFKTISQRVHRLEELEALFASPEIEERPKKEQVRLKHELERLQKYLSGFRLLKRLPDAIFVVDPTKEAIAVREARKLFIPVIALADTDSDPDLVDYIIPGNDDAIRSIQLILSRAVDLIIQARGGVVEPSPSYALVQEAEATETPEGESEVEA\n>6ydp_Ak mol:protein length:325  Mitochondrial ribosomal protein S35\nMAATSLPAWLILKSRAGTFRAFSTAMSPATRSPRPALRTTERTSKPERALRRKALPPRTEKMAVDQDWPSVYPVAAPFKPSAVPLPVRMGYPVKRGVPMAKEGNLELLKIPNFLHLTPVAIKRHCEALKDFCTEWPAALDSDEKCEKHFPIEIDTADYVSAGPSIRNPKARVVTLRVKLSSLNLDDHAKKKLIKLVGDRYCKSTDVLTIKTDRCPLKRQNYDYAVYLLTVLYHESWKTEEWEKKKTEADMEEYIWENSTSEKNILETLLQIKAAEKNLELSKEELLGTKEVEDYRKSVVSLKNEGDNENTLSQYKESVKRLLNLA\n>7f5s_Ld mol:protein length:125  60S ribosomal protein L31\nMAPAKKGGEKKKGRSAINEVVTREYTINIHKRIHGVGFKKRAPRALKEIRKFAMKEMGTPDVRIDTRLNKAVWAKGIRNVPYRIRVRLSRKRNEDEDSPNKLYTLVTYVPVTTFKNLQTVNVDEN\n>1izl_L mol:protein length:472  Photosystem II: Subunit PsbB\nMGLPWYRVHTVLINDPGRLIAAHLMHTALVAGWAGSMALYELATFDPSDPVLNPMWRQGMFVLPFMARLGVTGSWSGWSITGETGIDPGFWSFEGVALAHIVLSGLLFLAACWHWVYWDLELFRDPRTGEPALDLPKMFGIHLFLAGLLCFGFGAFHLTGLFGPGMWVSDPYGLTGSVQPVAPEWGPDGFNPYNPGGVVAHHIAAGIVGIIAGLFHILVRPPQRLYKALRMGNIETVLSSSIAAVFFAAFVVAGTMWYXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXGGELNGQTFTDPPTVKSYARKAIFGEIFEFDTETLNSDGIFRTSPRGWFTFAHAVFALLFFFGHIWHGARTLFRDVFSGIDPELSPEQVEWGFYQKVGDVTTRRKEAV\n>2y0d_D mol:protein length:478  UDP-GLUCOSE 
DEHYDROGENASE\nHHHHHHGSMNLTIIGSGKVGLVTGACLADIGHDVFCLDVDQAKIDILNNGGVPIHEPGLKEVIARNRSAGRLRFSTDIEAAVAHGDVQFIAVGTPPDEDGSADLQYVLAAARNIGRYMTGFKVIVDKSTVPVGTAERVRAAVAEELAKRGGDQMFSVVSNPEFLKEGAAVDDFTRPDRIVIGCDDDVPGERARELMKKLYAPFNRNHERTLYMDVRSAEFTKYAANAMLATRISFMNELANLADRFGADIEAVRRGIGSDPRIGYHFLYAGCGYGGSCFPKDVEALIRTADEHGQSLQILKAVSSVNATQKRVLADKIVARFGEDLTGRTFAIWGLAFKPNTDDMREAPSRELIAELLSRGARIAAYDPVAQEEARRVIALDLADHPSWLERLSFVDDEAQAARDADALVIVTEWKIFKSPDFVALGRLWKTPVIFDGRNLYEPETMSEQGIEYHPIGRPGSRQAVAARVTGTAPASA\n>7pi2_J mol:protein length:343  Cysteine-rich protective antigen\nDSRHVFIRTELSFIKNNVPCIRDMFFIYKRELYNICLDDLKGEEDETHIYVQKKVKDSWITLNDLFKETDLTGRPHIFAYVDVEEIIILLCEDEEFSNRKKDMTCHRFYSNDGKEYNNAEITISDYILKDKLLSSYVSLPLKIENREYFLICGVSPYKFKDDNKKDDILCMASHDKGETWGTKIVIKYDNYKLGVQYFFLRPYISKNDLSFHFYVGDNINNVKNVNFIECTHEKDLEFVCSNRDFLKDNKVLQDVSTLNDEYIVSYGNDNNFAECYIFFNNENSILIKPEKYGNTAAGCYGGTFVKIDENRALFIYSSSQGIYNIHTIYYANYEGGGGSEPEA\n>1n2r_A mol:protein length:276  HLA class I histocompatibility antigen, BW-44(B-12) B*4403 alpha chain\nGSHSMRYFYTAMSRPGRGEPRFITVGYVDDTLFVRFDSDATSPRKEPRAPWIEQEGPEYWDRETQISKTNTQTYRENLRTALRYYNQSEAGSHIIQRMYGCDVGPDGRLLRGYDQDAYDGKDYIALNEDLSSWTAADTAAQITQRKWEAARVAEQLRAYLEGLCVESLRRYLENGKETLQRADPPKTHVTHHPISDHEVTLRCWALGFYPAEITLTWQRDGEDQTQDTELVETRPAGDRTFQKWAAVVVPSGEEQRYTCHVQHEGLPKPLTLRWEP\n>2nxx_B mol:protein length:235  Ultraspiracle (USP, NR2B4)\nMTSNLQADMPLERIIEAEKRVECNDPLVALVVNENNTTVNNICQATHKQLFQLVQWAKLVPHFTSLPLTDQVQLLRAGWNELLIAAFSHRSMQAQDAIVLATGLTVNKSTAHAVGVGNIYDRVLSELVNKMKEMKMDKTELGCLRAIILYNPDVRGIKSVQEVEMLREKIYGVLEEYTRTTHPNEPGRFAKLLLRLPALRSIGLKCLEHLFFFKLIGDVPIDTFLMEMLEGTTDS\n>4s3s_A mol:protein length:143  Thermonuclease\nATSTKKLHKEPATLIKAIDGDTAKLMYKGQPMTFRLLLVDTPEFNEKYGPEASAFTKKMVENAKKIEVEFDKGQRTDKYGRGLAYKYADGKMVNEALVRQGLAKVAYVYKGNNTHEQLLRKAEAQAKKEKLNIWSEDNADSGQ\n>4e9x_C mol:protein length:339  Multicopper 
oxidase\nMAEREFDMTIEEVTIKVAPGLDYKVFGFNGQVPGPLIHVQEGDDVIVNVTNNTSLPHTIHWHGVHQKGTWRSDGVPGVTQQPIEAGDSYTYKFKADRIGTLWYHCHVNVNEHVGVRGMWGPLIVDPKQPLPIEKRVTKDVIMMMSTWESAVADKYGEGGTPMNVADYFSVNAKSFPLTQPLRVKKGDVVKIRFFGAGGGIHAMHSHGHDMLVTHKDGLPLDSPYYADTVLVSPGERYDVIIEADNPGRFIFHDHVDTHVTAGGKHPGGPITVIEYDGVPVDDWYVWKDKDYDPNFFYSESLKQGYGMFDHDGFKGEFEQRQRRPGRKLAAALEHHHHHH\n>6tg2_A mol:protein length:351  MotA\nMGSSHHHHHHSSGLVPRGSHMDVVIASSGGGWQEAQDKALWAPAAKALNITYTQDTFQNWAEARAQVESGSVTWDIIQIGIADEPQAKAAGVLEKLDPDIVNKADFPPGSVTDSFVANSNYSTLIAWNKKTYGDNGPKSMADFFDVKKFPGKRALWNQPIGMIEAAALALGTPRDKVYEFLSTEEGRKAAIAKLTELAPSVSVWWESGAQAAQLIKDGEVDMIITWGGRVQGAINDGANFAYTFNDAQLGTDGYAIVKGAPHRDAAMRFLKEMSKAEYQKDLPNSFATAPANMKAYDLAKYTPEKMATMASAPENVAVQYSVDPNFWAKHAKWASEAYDNVRLSRHHHHHH\n>6p60_K mol:protein length:212  Antibody A12V163-a.02 light chain\nQFVLAQPPSVSGAPGQRVTLSCTGSNSNIGVNYVQWYQQLPGTAPKLLIYENNKRPSGVSDRFSGSQSGTSASLTITGLQSEDEADYYCQCYDISLGAHVFGSGTELTVLGQPKAAPSVTLFPPSSEELQANKATLVCLISDFYPGAVEVAWKADGSAVNAGVETTKPSKQSNNKYAASSYLSLTSDQWKSHKSYSCQVTHEGSTVEKTVAP\n>5pg2_A mol:protein length:138  Bromodomain adjacent to zinc finger domain protein 2B\nMHHHHHHSSGVDLGTENLYFQSMSVKKPKRDDSKDLALCSMILTEMETHEDAWPFLLPVNLKLVPGYKKVIKKPMDFSTIREKLSSGQYPNLETFALDVRLVFDNCETFNEDDSDIGRAGHNMRKYFEKKWTDTFKVS\n>2oa6_C mol:protein length:320  Aristolochene synthase\nMKKPNGTNGASSSLEPPPSTFQPLCHPLVEEVSKEVDGYFLQHWNFPNEKARKKFVAAGFSRVTCLYFPKALDDRIHFACRLLTVLFLIDDLLEYMSFEEGSAYNEKLIPISRGDVLPDRSIPVEYIIYDLWESMRAHDREMADEILEPVFLFMRAQTDRTRARPMGLGGYLEYRERDVGKELLAALMRFSMGLKLSPSELQRVREIDANCSKHLSVVNDIYSYEKELYTSKTAHSEGGILCTSVQILAQEADVTAEAAKRVLFVMCREWELRHQLLVARLSAEGLETPGLAAYVEGLEYQMSGNELWSQTTLRYSVVVD\n>6qz0_5b mol:protein length:448  Major capsid 
protein\nMRITFNDVKTSLGITESYDIVNAIRNSQGDNFKSYVPLATANNVAEVGAGILINQTVQNDFITSLVDRIGLVVIRQVSLNNPLKKFKKGQIPLGRTIEEIYTDITKEKQYDAEEAEQKVFEREMPNVKTLFHERNRQGFYHQTIQDDSLKTAFVSWGNFESFVSSIINAIYNSAEVDEYEYMKLLVDNYYSKGLFTTVKIDEPTSSTGALTEFVKKMRATARKLTLPQGSRDWNSMAVRTRSYMEDLHLIIDADLEAELDVDVLAKAFNMNRTDFLGNVTVIDGFASTGLEAVLVDKDWFMVYDNLHKMETVRNPRGLYWNYYYHVWQTLSVSRFANAVAFVSGDVPAVTQVIVSPNIAAVKQGGQQQFTAYVRATNAKDHKVVWSVEGGSTGTAITGDGLLSVSGNEDNQLTVKATVDIGTEDKPKLVVGEAVVSIRPNNASGGAQA\n>7eqd_3 mol:protein length:62  Light-harvesting protein B-870 alpha chain\nMWRIWQLFDPRQALVGLATFLFVLALLIHFILLSTERFNWLEGASTKPVQTSMVMPSSDLAV\n>5k5o_A mol:protein length:98  AspA\nGKISTDKYIFLTPRAYIIVHLLKVGKAKASEISENTQIPYQTVIQNIRWLLAEGYVVKEQKGEEIYYKLTDKGKQLATAELEKIRKLVEVVQHHHHHH\n>3dby_N mol:protein length:269  uncharacterized protein\nMSLERNYEESALFEHQFWLKVLTDHAQFLLDALAPKEKEDIKKATYFVETFTNLLNKVRNVNLMAFSKEAEQAAKEIRAFKLNIIQKQLEGKITIHFTPTFINHMVNEVEEYIAVLEFLKKGEVPPVFHELHYHLVWLTDAAGHAGSISGGLDLVEKRLKEKSEEFTKHFEQFYLKAVEMTGYLRTELHHFPALKKFTKDVSLELKLFSHFLHEVEELELSNEVLSVLSARMADHMAREECYYLLKLAQSSGLEMPKCNPLEGHHHHHH\n>1sfo_E mol:protein length:215  DNA-directed RNA polymerases I, II, and III 27 kDa polypeptide\nMDQENERNISRLWRAFRTVKEMVKDRGYFITQEEVELPLEDFKAKYCDSMGRPQRKMMSFQANPTEESISKFPDMGSLWVEFCDEPSVGVKTMKTFVIHIQEKNFQTGIFVYQNNITPSAMKLVPSIPPATIETFNEAALVVNITHHELVPKHIRLSSDEKRELLKRYRLKESQLPRIQRADPVALYLGLKRGEVVKIIRKSETSGRYASYRICM\n>2zee_B mol:protein length:329  Glutaminyl-peptide cyclotransferase\nASAWPEEKNYHQPAILNSSALRQIAEGTSISEMWQNDLQPLLIERYPGSPGSYAARQHIMQRIQRLQADWVLEIDTFLSQTPYGYRSFSNIISTLNPTAKRHLVLACHYDSKYFSHWNNRVFVGATDGAVPCAMMLELARALDKKLLSLKTVSDSKPDLSLQLIFFDGEEAFLHWSPQDSLYGSRHLAAKMASTPHPPGARGTSQLHGMDLLVLLDLIGAPNPTFPNFFPNSARWFERLQAIEHELHELGLLKDHSLEGRYFQNYSYGGVIQDDHIPFLRRGVPVLHLIPSPFPEVWHTMDDNEENLDESTIDNLNKILQVFVLEYLHL\n>6cae_1c mol:protein length:239  30S ribosomal protein 
S3\nMGNKIHPIGFRLGITRDWESRWYAGKKQYRHLLLEDQRIRGLLEKELYSAGLARVDIERAADNVAVTVHVAKPGVVIGRGGERIRVLREELAKLTGKNVALNVQEVQNPNLSAPLVAQRVAEQIERRFAVRRAIKQAVQRVMESGAKGAKVIVSGRIGGAEQARTEWAAQGRVPLHTLRANIDYGFALARTTYGVLGVKAYIFLGEVIGGQKPKARPELPKAEERPRRRRPAVRVKKEE\n>3hhq_J mol:protein length:167  Deoxyuridine 5'-triphosphate nucleotidohydrolase\nMGSSHHHHHHSSGLVPRGSHMTATSDKVLKIQLRSASATVPTKGSATAAGYDIYASQDITIPAMGQGMVSTDISFTVPVGTYGRIAPRSGLAVKNGIQTGAGVVDRDYTGEVKVVLFNHSQRDFAIKKGDRVAQLILEKIVDDAQIVVVDSLEESARGAGGFGSTGN\n>2a3s_A mol:protein length:101  Myocyte Nuclear Factor\nESKPPYSYAQLIVQAISSAQDRQLTLSGIYAHITKHYPYYRTADKGWQNSIRHNLSLNRYFIKVPRSQEEPGKGSFWRIDPASEAKLVEQAFRKRRQRGVS\n>5dcp_A mol:protein length:175  Filamin-B\nSMMNGLGFKPFDLVIPFAVRKGEITGEVHMPSGKTATPEIVDNKDGTVTVRYAPTEVGLHEMHIKYMGSHIPESPLQFYVNYPNSGSVSAYGPGLVYGVANKTATFTIVTEDAGEGGLDLAIEGPSKAEISCIDNKDGTCTVTYLPTLPGDYSILVKYNDKHIPGSPFTAKITDD\n>2qsp_B mol:protein length:145  Hemoglobin subunit beta\nMLTAEEKAAVTAFWGKVKVDEVGGEALGRLLVVYPWTQRFFESFGDLSTADAVMNNPKVKAHGKKVLDSFSNGMKHLDDLKGTFAALSELHCDKLHVDPENFKLLGNVLVVVLARNFGKEFTPVLQADFQKVVAGVANALAHRYH\n>3fp9_H mol:protein length:153  Proteasome-associated ATPase\nMPSGYGVLLATHDDDTVDVFTSGRKMRLTCSPNIDAASLKKGQTVRLNEALTVVEAGTFEAVGEISTLREILADGHRALVVGHADEERVVWLADPLIAEDLPDGLPEALNDDTRPRKLRPGDSLLVDTKAGYAFERIPKAEVEDLVLEELVPR\n>6v3o_E mol:protein length:970  Phosphoenolpyruvate 
carboxylase\nMASTKAPGPGEKHHSIDAQLRQLVPGKVSEDDKLIEYDALLVDRFLNILQDLHGPSLREFVQECYEVSADYEGKGDTTKLGELGAKLTGLAPADAILVASSILHMLNLANLAEEVQIAHRRRNSKLKKGGFADEGSATTESDIEETLKRLVSEVGKSPEEVFEALKNQTVDLVFTAHPTQSARRSLLQKNARIRNCLTQLNAKDITDDDKQELDEALQREIQAAFRTDEIRRAQPTPQDEMRYGMSYIHETVWKGVPKFLRRVDTALKNIGINERLPYNVSLIRFSSWMGGDRDGNPRVTPEVTRDVCLLARMMAANLYIDQIEELMFELSMWRCNDELRVRAEELHSSSGSKVTKYYIEFWKQIPPNEPYRVILGHVRDKLYNTRERARHLLASGVSEISAESSFTSIEEFLEPLELCYKSLCDCGDKAIADGSLLDLLRQVFTFGLSLVKLDIRQESERHTDVIDAITTHLGIGSYREWSEDKRQEWLLSELRGKRPLLPPDLPQTEEIADVIGAFHVLAELPPDSFGPYIISMATAPSDVLAVELLQRECGVRQPLPVVPLFERLADLQSAPASVERLFSVDWYMDRIKGKQQVMVGYSDSGKDAGRLSAAWQLYRAQEEMAQVAKRYGVKLTLFHGRGGTVGRGGGPTHLAILSQPPDTINGSIRVTVQGEVIEFCFGEEHLCFQTLQRFTAATLEHGMHPPVSPKPEWRKLMDEMAVVATEEYRSVVVKEARFVEYFRSATPETEYGRMNIGSRPAKRRPGGGITTLRAIPWIFSWTQTRFHLPVWLGVGAAFKFAIDKDVRNFQVLKEMYNEWPFFRVTLDLLEMVFAKGDPGIAGLYDELLVAEELKPFGKQLRDKYVETQQLLLQIAGHKDILEGDPFLKQGLVLRNPYITTLNVFQAYTLKRIRDPNFKVTPQPPLSKEFADENKPAGLVKLNPASEYPPGLEDTLILTMKGIAAGMQNTG\n>2gf0_C mol:protein length:199  GTP-binding protein Di-Ras1\nSMPEQSNDYRVVVFGAGGVGKSSLVLRFVKGTFRDTYIPTIEDTYRQVISCDKSVCTLQITDTTGSHQFPAMQRLSISKGHAFILVFSVTSKQSLEELGPIYKLIVQIKGSVEDIPVMLVGNKCDETQREVDTREAQAVAQEWKCAFMETSAKMNYNVKELFQELLTLETRRNMSLNIDGKRSGKQKRTDRVKGKCTLM\n>1p3q_Q mol:protein length:54  Vacuolar protein sorting-associated protein VPS9\nSSLIKKIEENERKDTLNTLQNMFPDMDPSLIEDVCIAAASRIGPCVDALLSLSE\n>3c91_O mol:protein length:233  Proteasome subunit alpha\nMQQGQMAYDRAITVFSPDGRLFQVEYAREAVKKGSTALGMKFANGVLLISDKKVRSRLIEQNSIEKIQLIDDYVAAVTSGLVADARVLVDFARISAQQEKVTYGSLVNIENLVKRVADQMQQYTQYGGVRPYGVSLIFAGIDQIGPRLFDCDPAGTINEYKATAIGSGKDAVVSFLEREYKENLPEKEAVTLGIKALKSSLEEGEELKAPEIASITVGNKYRIYDQEEVKKFL\n>4wra_1A mol:protein length:105  30S ribosomal protein S10\nMPKIRIKLRGFDHKTLDASAQKIVEAARRSGAQVSGPIPLPTRVRRFTVIRGPFKHKDSREHFELRTHNRLVDIINPNRKTIEQLMTLDLPTGVEIEIKTVGGGR\n>4n06_A mol:protein length:347  CRISPR-associated endonuclease Cas1 
1\nGGMRLVVDGFGKYLGIENGLIVVKEKGKALRKVRPEDLKQVLIIGKAAISSDAIKLLLKNRVDVVFLDFNGEILGRLSHPLIGTAKTRREQYLAYGDKRGVHLAKEFIKAKMANQMAILTNLAKARKDSNPEVAESLLKAKKEIDACLNELDGVEAEMIDKVRERLLGIEGKASKHYWDAISLVIPEEYRFNGRRGIEIGSPRYAKDIVNAMLNYGYSILLAECVKAVELAGLDPYAGFLHVDVSGRSSLAIDLMENFRQQVVDRVVLRLISYRQIKPEDCEKRNMVCQLSDNARRLLLASLLERLDSKTQYRGRNLAYSSIILLHARDVVAFLRGERRYEGFVQKW\n>6d6e_A mol:protein length:129  Lysozyme C\nKVFGRCELAAAMKRHGLDNYRGYSLGNWVCAAKFESNFNTQATNRNTDGSTDYGILQINSRWWCNDGRTPGSRNLCNIPCSALLSSDITASVNCAKKIVSDGNGMNAWVAWRNRCKGTDVQAWIRGCRL\n>1v1m_A mol:protein length:400  2-OXOISOVALERATE DEHYDROGENASE ALPHA SUBUNIT\nSSLDDKPQFPGASAEFIDKLEFIQPNVISGIPIYRVMDRQGQIINPSEDPHLPKEKVLKLYKSMTLLNTMDRILYESQRQGRISFYMTNYGEEGTHVGSAAALDNTDLVFGQYREAGVLMYRDYPLELFMAQCYGNISDLGKGRQMPVHYGCKERHFVTISSPLATQIPQAVGAAYAAKRANANRVVICYFGEGAASEGDAHAGFNFAATLECPIIFFCRNNGYAISTPTSEQYRGDGIAARGPGYGIMSIRVDGNDVFAVYNATKEARRRAVAENQPFLIEAMTYRIGHASTSADSSAFRSVDEVNYWDKQDHPISRLRHYLLSQGWWDEEQEKAWRKQSRRKVMEAFEQAERKPKPNPNLLFSDVYQEMPAQLRKQQESLARHLQTYGEHYPLDHFDK\n>7pak_H mol:protein length:132  30S ribosomal protein S9\nMEKQSYYGLGRRKSSSAKVYLTPTQDKGKITVNRRDPSEYFPNKLVIQDMEQPLDLTDLKKNFDINVVVKGGGFTGQAGAIRLGIVRALLQFNPELKKILKSKKLTTRDKRVKERKKFGLYGARRAPQFTKR\n>4gob_A mol:protein length:230  Kaede-type Fluorescent Protein\nMSVIKSDMKIKLRMEGTVNGHKFVIEGEGEGKPYEGTQTMNLKVKEGAPLPFAYDILTTVFHYGNRVFAKYPKHIPDYFKQSFPEGYSWERSMTFEDGGICTARNDITLEGDCFFNEIRFDGVNFPPNGPVMQKKTLKWEPSTEKMYVRDGVLTGDINMALLLEGGGHYRCDFKTTYKAKKGVQLPDYHFVDHCIEILSHDKDYNNVKLYEHAVAHSGLPRQAKHHHHHH\n>5f5k_B mol:protein length:7  Peptidic derivative of Gurken: ACE-ARG-LYS-VAL-ARG-MET-ALA-aldehyde\nXRKVRMX\n>6rkm_P mol:protein length:12  Cellular tumor antigen p53\nKLMFKTEGPDSD\n>2p1m_B mol:protein length:594  TRANSPORT INHIBITOR RESPONSE 1 
protein\nMQKRIALSFPEEVLEHVFSFIQLDKDRNSVSLVCKSWYEIERWCRRKVFIGNCYAVSPATVIRRFPKVRSVELKGKPHFADFNLVPDGWGGYVYPWIEAMSSSYTWLEEIRLKRMVVTDDCLELIAKSFKNFKVLVLSSCEGFSTDGLAAIAATCRNLKELDLRESDVDDVSGHWLSHFPDTYTSLVSLNISCLASEVSFSALERLVTRCPNLKSLKLNRAVPLEKLATLLQRAPQLEELGTGGYTAEVRPDVYSGLSVALSGCKELRCLSGFWDAVPAYLPAVYSVCSRLTTLNLSYATVQSYDLVKLLCQCPKLQRLWVLDYIEDAGLEVLASTCKDLRELRVFPSEPFVMEPNVALTEQGLVSVSMGCPKLESVLYFCRQMTNAALITIARNRPNMTRFRLCIIEPKAPDYLTLEPLDIGFGAIVEHCKDLRRLSLSGLLTDKVFEYIGTYAKKMEMLSVAFAGDSDLGMHHVLSGCDSLRKLEIRDCPFGDKALLANASKLETMRSLWMSSCSVSFGACKLLGQKMPKLNVEVIDERGAPDSRPESCPVERVFIYRTVAGPRFDMPGFVWNMDQDSTMRFSRQIITTNGL\n>1jf1_B mol:protein length:100  beta-2-microglobulin\nMIQRTPKIQVYSRHPAENGKSNFLNCYVSGFHPSDIEVDLLKNGERIEKVEHSDLSFSKDWSFYLLYYTEFTPTEKDEYACRVNHVTLSQPKIVKWDRDM\n>7vot_Y mol:protein length:53  Rsp_7571 Protein-Y PufY\nMPEVSEFAFRLMMAAVIFVGVGIMFAFAGGHWFVGLVVGGLVAAFFAATPNSN\n>7o11_C mol:protein length:308  Probable ABC transporter ATP-binding protein NosF\nMNAVEIQGVSQRYGSMTVLHDLNLNLGEGEVLGLFGHNGAGKTTSMKLILGLLSPSEGQVKVLGRAPNDPQVRRQLGYLPENVTFYPQLSGRETLRHFARLKGAALTQVDELLEQVGLAHAADRRVKTYSKGMRQRLGLAQALLGEPRLLLLDEPTVGLDPIATQDLYLLIDRLRQRGTSIILCSHVLPGVEAHINRAAILAKGCLQAVGSLSQLRAEAGLPVRIRASGISERDSWLQRWTDAGHSARGLSESSIEVVAVNGHKLVLLRQLLGEGEPEDIEIHQPSLEDLYRYYMERAGDVRAQEGRL\n>7nt9_A mol:protein length:1287  Spike 
glycoprotein\nMGILPSPGMPALLSLVSLLSVLLMGCVAETGMFVFLVLLPLVSSQCVNLTTRTQLPPAYTNSFTRGVYYPDKVFRSSVLHSTQDLFLPFFSNVTWFHAIHVSGTNGTKRFDNPVLPFNDGVYFASTEKSNIIRGWIFGTTLDSKTQSLLIVNNATNVVIKVCEFQFCNDPFLGVYYHKNNKSWMESEFRVYSSANNCTFEYVSQPFLMDLEGKQGNFKNLREFVFKNIDGYFKIYSKHTPINLVRDLPQGFSALEPLVDLPIGINITRFQTLLALHRSYLTPGDSSSGWTAGAAAYYVGYLQPRTFLLKYNENGTITDAVDCALDPLSETKCTLKSFTVEKGIYQTSNFRVQPTESIVRFPNITNLCPFGEVFNATRFASVYAWNRKRISNCVADYSVLYNSASFSTFKCYGVSPTKLNDLCFTNVYADSFVIRGDEVRQIAPGQTGKIADYNYKLPDDFTGCVIAWNSNNLDSKVGGNYNYLYRLFRKSNLKPFERDISTEIYQAGSTPCNGVEGFNCYFPLQSYGFQPTNGVGYQPYRVVVLSFELLHAPATVCGPKKSTNLVKNKCVNFNFNGLTGTGVLTESNKKFLPFQQFGRDIADTTDAVRDPQTLEILDITPCSFGGVSVITPGTNTSNQVAVLYQDVNCTEVPVAIHADQLTPTWRVYSTGSNVFQTRAGCLIGAEHVNNSYECDIPIGAGICASYQTQTNSPSRASSVASQSIIAYTMSLGAENSVAYSNNSIAIPTNFTISVTTEILPVSMTKTSVDCTMYICGDSTECSNLLLQYGSFCTQLNRALTGIAVEQDKNTQEVFAQVKQIYKTPPIKDFGGFNFSQILPDPSKPSKRSFIEDLLFNKVTLADAGFIKQYGDCLGDIAARDLICAQKFNGLTVLPPLLTDEMIAQYTSALLAGTITSGWTFGAGAALQIPFAMQMAYRFNGIGVTQNVLYENQKLIANQFNSAIGKIQDSLSSTASALGKLQDVVNQNAQALNTLVKQLSSNFGAISSVLNDILSRLDPPEAEVQIDRLITGRLQSLQTYVTQQLIRAAEIRASANLAATKMSECVLGQSKRVDFCGKGYHLMSFPQSAPHGVVFLHVTYVPAQEKNFTTAPAICHDGKAHFPREGVFVSNGTHWFVTQRNFYEPQIITTDNTFVSGNCDVVIGIVNNTVYDPLQPELDSFKEELDKYFKNHTSPDVDLGDISGINASVVNIQKEIDRLNEVAKNLNESLIDLQELGKYEQSGRENLYFQGGGGSGYIPEAPRDGQAYVRKDGEWVLLSTFLGHHHHHH\n>5euj_T mol:protein length:573  Pyruvate decarboxylase\nMYTVGMYLAERLAQIGLKHHFAVAGDYNLVLLDQLLLNKDMEQVYCCNELNCGFSAEGYARARGAAAAIVTFSVGAISAMNAIGGAYAENLPVILISGSPNTNDYGTGHILHHTIGTTDYNYQLEMVKHVTCAAESIVSAEEAPAKIDHVIRTALRERKPAYLEIACNVAGAECVRPGPINSLLRELEVDQTSVTAAVDAAVEWLQDRQNVVMLVGSKLRAAAAEKQAVALADRLGCAVTIMAAAKGFFPEDHPNFRGLYWGEVSSEGAQELVENADAILCLAPVFNDYATVGWNSWPKGDNVMVMDTDRVTFAGQSFEGLSLSTFAAALAEKAPSRPATTQGTQAPVLGIEAAEPNAPLTNDEMTRQIQSLITSDTTLTAETGDSWFNASRMPIPGGARVELEMQWGHIGWSVPSAFGNAVGSPERRHIMMVGDGSFQLTAQEVAQMIRYEIPVIIFLINNRGYVIEIAIHDGPYNYIKNWNYAGLIDVFNDEDGHGLGLKASTGAELEGAIKKALDNRRGPTLIECNIAQDDCTETLIAWGKRVAATNSRKPQALVPRGSGGGLEHHHHHH\n>5y6p_A2 mol:protein length:318  
LR_gamma4\nMDSPAFAVNGMFSAVKVGNSSFTENKVTAVSKTAPTASVRMVVDPFQRKFQSIGKIGIDYSRPKKLATYKRVGYSVGLDFPNAVSMAGHYSLTDCTRAGGAAKILMKYDEYCAKGMLQVYKRSAVSTGVYTTKCTEATQPGVAYDVRVFNRTAAFRQAQKPVNVRLGEQYAARKACVTLAHNCSREEAQFKNMPMSCATFLAGKMEAMGTCYRTVRPSSKAEDYMAGSVRMQVYQKGNASGVYPVGGCEDGHAKGDADLRRVIALASEYRAAQQGAAAVTGAQYASSKMAIQLYGHSCNHEEGQFCDYPAVAAAMCRY\n>7qgr_S mol:protein length:179  50S ribosomal protein L5\nMAKLHDYYKDEVVKKLMTEFNYNSVMQVPRVEKITLNMGVGEAIADKKLLDNAAADLAAISGQKPLITKARKSVAGFKIRQGYPIGCKVTLRGERMWEFFERLITIAVPRIRDFRGLSAKSFDGRGNYSMGVREQIIFPEIDYDKVDRVRGLDITITTTAKSDEEGRALLAAFDFPFRK\n>3q9i_A mol:protein length:10  Cyclic pseudo-peptide LV(4BF)FA(ORN)(HAO)LK(ORN)\nLVYFAAXLKA\n>4a35_A mol:protein length:441  MITOCHONDRIAL ENOLASE SUPERFAMILY MEMBER 1\nSMVRGRISRLSVRDVRFPTSLGGHGADAMHTDPDYSAAYVVIETDAEDGIKGCGITFTLGKGTEVVVCAVNALAHHVLNKDLKDIVGDFRGFYRQLTSDGQLRWIGPEKGVVHLATAAVLNAVWDLWAKQEGKPVWKLLVDMDPRMLVSCIDFRYITDVLTEEDALEILQKGQIGKKEREKQMLAQGYPAYTTSCAWLGYSDDTLKQLCAQALKDGWTRFKVKVGADLQDDMRRCQIIRDMIGPEKTLMMDANQRWDVPEAVEWMSKLAKFKPLWIEEPTSPDDILGHATISKALVPLGIGIATGEQCHNRVIFKQLLQAKALQFLQIDSCRLGSVNENLSVLLMAKKFEIPVCPHAGGVGLCELVQHLIIFDYISVSASLENRVCEYVDHLHEHFKYPVMIQRASYMPPKDPGYSTEMKEESVKKHQYPDGEVWKKLLPA\n>3zpv_S mol:protein length:62  PROTEIN PYGOPUS\nGAMAIYPCGMCHKEVNDNDEAVFCESGCNFFFHRTCVGLTEAAFQMLNKEVFAEWCCDKCVS\n>7y15_C mol:protein length:71  Guanine nucleotide-binding protein G(I)/G(S)/G(O) subunit gamma-2\nMASNNTASIAQARKLVEQLKMEANIDRIKVSKAAADLMAYCEAHAKEDPLLTPVPASENPFREKKFFCAIL\n>3glh_D mol:protein length:376  DNA polymerase III subunit tau\nGPHMSYQVLARKWRPQTFADVVGQEHVLTALANGLSLGRIHHAYLFSGTRGVGKTSIARLLAKGLNCETGITATPCGVCDNCREIEQGRFVDLIEIDAASRTKVEDTRDLLDNVQYAPARGRFKVYLIDEVHMLSRHSFNALLKTLEEPPEHVKFLLATTDPQKLPVTILSRCLQFHLKALDVEQIRHQLEHILNEEHIAHEPRALQLLARAAEGSLRDALSLTDQAIASGDGQVSTQAVSAMLGTLDDDQALSLVEAMVEANGERVMALINEAAARGIEWEALLVEMLGLLHRIAMVQLSPAALGNDMAAIELRMRELARTIPPTDIQLYYQTLLIGRKELPYAPDRRMGVEMTLLRALAFHPRMPLPEPEVPRQ\n>3k6s_C mol:protein length:1095  Integrin 
alpha-X\nFNLDTEELTAFRVDSAGFGDSVVQYANSWVVVGAPQKITAANQTGGLYQCGYSTGACEPIGLQVPPEAVNMSLGLSLASTTSPSQLLACGPTVHHECGRNMYLTGLCFLLGPTQLTQRLPVSRQECPRQEQDIVFLIDGSGSISSRNFATMMNFVRAVISQFQRPSTQFSLMQFSNKFQTHFTFEEFRRSSNPLSLLASVHQLQGFTYTATAIQNVVHRLFHASYGARRDAAKILIVITDGKKEGDSLDYKDVIPMADAAGIIRYAIGVGLAFQNRNSWKELNDIASKPSQEHIFKVEDFDALKDIQNQLKEKIFAIEGTETTSSSSFELEMAQEGFSAVFTPDGPVLGAVGSFTWSGGAFLYPPNMSPTFINMSQENVDMRDSYLGYSTELALWKGVQSLVLGAPRYQHTGKAVIFTQVSRQWRMKAEVTGTQIGSYFGASLCSVDVDSDGSTDLVLIGAPHYYEQTRGGQVSVCPLPRGWRRWWCDAVLYGEQGHPWGRFGAALTVLGDVNGDKLTDVVIGAPGEEENRGAVYLFHGVLGPSISPSHSQRIAGSQLSSRLQYFGQALSGGQDLTQDGLVDLAVGARGQVLLLRTRPVLWVGVSMQFIPAEIPRSAFECREQVVSEQTLVQSNICLYIDKRSKNLLGSRDLQSSVTLDLALDPGRLSPRATFQETKNRSLSRVRVLGLKAHCENFNLLLPSCVEDSVTPITLRLNFTLVGKPLLAFRNLRPMLAADAQRYFTASLPFEKNCGADHICQDNLGISFSFPGLKSLLVGSNLELNAEVMVWNDGEDSYGTTITFSHPAGLSYRYVAEGQKQGQLRSLHLTCDSAPVGSQGTWSTSCRINHLIFRGGAQITFLATFDVSPKAVLGDRLLLTANVSSENNTPRTSKTTFQLELPVKYAVYTVVSSHEQFTKYLNFSESEEKESHVAMHRYQVNNLGQRDLPVSINFWVPVELNQEAVWMDVEVSHPQNPSLRCSSEKIAPPASDFLAHIQKNPVLDCSIAGCLRFRCDVPSFSVQEELDFTLKGNLSFGWVRQILQKKVSVVSVAEITFDTSVYSQLPGQEAFMRAQTTTVLEKYKVHGCGGLENLYFQ\n>3tvu_C mol:protein length:769  Acetyl-CoA carboxylase\nMASGSMHLRPIATPYPVKEWLQPKRYKAHLMGTTYVYDFPELFRQASSSQWKNFSADVKLTDDFFISNELIEDENGELTEVEREPGANAIGMVAFKITVKTPEYPRGRQFVVVANDITFKIGSFGPQEDEFFNKVTEYARKRGIPRIYLAANSGARIGMAEEIVPLFQVAWNDAANPDKGFQYLYLTSEGMETLKKFDKENSVLTERTVINGEERFVIKTIIGSEDGLGVECLRGSGLIAGATSRAYHDIFTITLVTCRSVGIGAYLVRLGQRAIQVEGQPIILTGASALNKVLGREVYTSNLQLGGTQIMYNNGVSHLTAVDDLAGVEKIVEWMSYVPAKRNMPVPILETKDTWDRPVDFTPTNDETYDVRWMIEGRETESGFEYGLFDKGSFFETLSGWAKGVVVGRARLGGIPLGVIGVETRTVENLIPADPANPNSAETLIQQAGQVWFPNSAFKTAQAINDFNNGEQLPMMILANWRGFSGGQRDMFNEVLKYGSFIVDALVDYKQPIIIYIPPTGELRGGSWVVVDPTINADQMEMYADVNARAGVLEPEGTVEIKFRREKLLDTMNRLDDKYRELRSQLSNKSLAPEVHQQISKQLADRERELLPIYGQISLQFADLHDRSSRMVAKGVISKELEWTEARRFFFWRLRRRLNEEYLIKRLSHQVGEASRLEKIARIRSWYPASVDHEDDRQVATWIEENYKTLDDKLKGLKLESFAQDLAKKIRSDHDNAIDGLSEVIKMLSTDDKEKLLKTLKLEHHHHHH\n>2kj4_A mol:protein length:87  
plasminogen\nYVEFSEECMHGSGENYDGKISKTMSGLECQAWDSQSPHAHGYIPSKFPNKNLKKNYCRNPDRDLRPWCFTTDPNKRWEYCDIPRCAA\n>7s3d_G mol:protein length:782  Photosystem I P700 chlorophyll a apoprotein A1\nMTASPPKRNQASAATEQSPIPTSFERWAKPGHFDRTLARGPKTTTWIWNLHADAHDFDSHTNDLQDISRKIFSAHFGHLAVVFVWLSGMYFHGARFSNFSSWMADPTHIRPSAQVVWPLVGQDILNGDMGGGFRGIQITSGLFQMWRGEGFTNEFQLYCTAIGALVMAGLMIFAGWFHYHVRSPKLEWFQNVQSMLNHHLAGLLGLGSLGWAGHLIHVALPTNKLLDAGVAPQDIPLPHEFVLDKALMAELYPSFAQGIRPFFTLNWATYSDFLTFNGGLNPVTGGLWMTDIAHHHVAIAVLFIFAGHMYRTNWGIGHSIRTMLEDARHPKMLPFLSFIGPVGHRGLFEVLTTSWHAQLSINLAMMGSLSIIVAQHMYSMPPYPYLATDYGTVTSLFTHHMWIGGFLIVGAAAHAGIFMVRDYDPAENVNNVLDRVLRHRDAIISHLVWVCQFLGFHSFAMYCHNDTMRAFGRPQDMFSDTGIQLQPIFAQWVQHIQTMAVGSAQVAEPLGDALGGIQNIALSGVGTTAPGVASPASYAFGGGLVAVGGKVAMMPISLGTADFLIHHIHAFTIHVTVLVLLKGVLFARNSRLIPDKSELGFRFPCDGPGRGGTCQVSAWDHVFLGLFWMYNSIAMVIFHFFWKMQSDVWGAVDANGTVSHITGGNFAQSSITINGWLRDFLWAQATQVISSYGSALSAYGLMFLAGHFVFAFSLMFLFSGRGYWQELIESIVWAHNKLRITTAIQPRALSITQGRAVGAAHYLLGSIVTTWAFFLARMAAIG\n>1hqz_9 mol:protein length:141  ACTIN-BINDING PROTEIN\nMALEPIDYTTHSREIDAEYLKIVRGSDPDTTWLIISPNAKKEYEPESTGSSFHDFLQLFDETKVQYGLARVSPPGSDVEKIIIIGWCPDSAPLKTRASFAANFAAVANNLFKGYHVQVTARDEDDLDENELLMKISNAAGA\n>6fq5_H mol:protein length:95  Histone H2B\nRKTRKESYAIYVYKVLKQVHPDTGISSKAMSIMNSFVNDVFERIAGEASRLAHYNKRSTITSREIQTAVRLLLPGELAKHAVSEGTKAVTKYTSA\n>6ek5_L mol:protein length:205  Capsid protein\nAPMYRKPTMYRMYRSPDIPRGCEGPCKVQSFEQRDDVKHLGICKVISDVTRGPGLTHRVGKRFCIKSIYILGKIWLDETIKKQNHTNNVIFYLLRDRRPYGNAPQDFGQIFNMFDNEPSTATIKNDLRDRFQVLRKFHATVVGGLYCMKEQALVKRFYRLNHHVTYNHQEAGKYENHTENALLLYMACTHASNPVYATLKIRIYF\n>6f7b_A mol:protein length:361  Mitotic checkpoint serine/threonine-protein kinase 
BUB1\nGSSLGTVDAPNFIVGNPWDDKLIFKLLSGLSKPVSSYPNTFEWQCKLPAIKPKTEFQLGSKLVYVHHLLGEGAFAQVYEATQGDLNDAKNKQKFVLKVQKPANPWEFYIGTQLMERLKPSMQHMFMKFYSAHLFQNGSVLVGELYSYGTLLNAINLYKNTPEKVMPQGLVISFAMRMLYMIEQVHDCEIIHGDIKPDNFILGNGFLEQDDEDDLSAGLALIDLGQSIDMKLFPKGTIFTAKCETSGFQCVEMLSNKPWNYQIDYFGVAATVYCMLFGTYMKVKNEGGECKPEGLFRRLPHLDMWNEFFHVMLNIPDCHHLPSLDLLRQKLKKVFQQHYTNKIRALRNRLIVLLLECKRSRK\n>3cic_A mol:protein length:390  Beta-secretase 1\nGSFVEMVDNLRGKSGQGYYVEMTVGSPPQTLNILVDTGSSNFAVGAAPHPFLHRYYQRQLSSTYRDLRKGVYVPYTQGKWEGELGTDLVSIPHGPNVTVRANIAAITESDKFFINGSNWEGILGLAYAEIARPDDSLEPFFDSLVKQTHVPNLFSLQLCGAGFPLNQSEVLASVGGSMIIGGIDHSLYTGSLWYTPIRREWYYEVIIVRVEINGQDLKMDCKEYNYDKSIVDSGTTNLRLPKKVFEAAVKSIKAASSTEKFPDGFWLGEQLVCWQAGTTPWNIFPVISLYLMGEVTNQSFRITILPQQYLRPVEDVATSQDDCYKFAISQSSTGTVMGAVIMEGFYVVFDRARKRIGFAVSACHVHDEFRTAAVEGPFVTLDMEDCGYNI\n>6qea_A mol:protein length:129  Lysozyme C\nKVFGRCELAAAMKRHGLDNYRGYSLGNWVCAAKFESNFNTQATNRNTDGSTDYGILQINSRWWCNDGRTPGSRNLCNIPCSALLSSDITASVNCAKKIVSDGNGMNAWVAWRNRCKGTDVQAWIRGCRL\n>4br6_A mol:protein length:197  SUPEROXIDE DISMUTASE\nKATLPDLKYDYGALEPYISARIMELHHSKHHQTYVNGLNSALEATAEAEAKGDFTKAASLAPLLNFHGGGHLNHTLFWENLAPASREGGGEPDGALKKAIEADFGSFETFRKQMNAALTGIQGSGWAWLAKDKDSGNLAIVTRANQDPVTGQLVPLMGIDAWEHAYYLQYENRKAEYFEAIWNVINWKTVAQRFEKA\n>4hpe_B mol:protein length:308  Putative cell wall hydrolase Tn916-like,CTn1-Orf17\nGADSDDENSNFSSGITGMNLSAEVLKHQPMVEKYARENGISEYVNVLLAIIQVESGGTAEDVMQSSESLGLPPNSLDTESSIKQGCKYFASLLSSSKNQGIDDLNVAIQSYNYGGGYVGYVAGKGKKHTFNLAESFAREKSGGKKVTYTNPIAVAKNGGWRWNYGNMFYVELVNQYLTVPQVSGELAQKVMNEALKYQGWKYVYGGSNPNTSFDCSGLTQWCYGKAGISLPRTAQAQYDATQHLPLSQAKAGDLVFFHSTYNAGSYVTHVGIYVGNNQMYHAGDPIGYADLSSSYWQQHLIGAGRVKQ\n>6c7g_A mol:protein length:342  cGMP-dependent 3',5'-cyclic 
phosphodiesterase\nSAMDDEYTKLLHDGIQPVAAIDSNFASFTYTPRSLPEDDTSMAILSMLQDMNFINNYKIDCPTLARFCLMVKKGYRDPPYHNWMHAFSVSHFCYLLYKNLELTNYLEDIEIFALFISCMCHDLDHRGTNNSFQVASKSVLAALYSSEGSVMERHHFAQAIAILNTHGCNIFDHFSRKDYQRMLDLMRDIILATDLAHHLRIFKDLQKMAEVGYDRNNKQHHRLLLCLLMTSCDLSDQTKGWKTTRKIAELIYKEFFSQGDLEKAMGNRPMEMMDREKAYIPELQISFMEHIAMPIYKLLQDLFPKAAELYERVASNREHWTKVSHKFTIRGLPSNNSLDFLD\n>6a83_A mol:protein length:394  Phosphoethanolamine transferase EptC\nMGSSHHHHHHSSGLVPRGSHMYRQQLNSLTKLLNENNALPPLANFKDESGNEPRTLVLVIGESTQRGRMSLYGYPRETTPELDALHKTDPNLTVFNNVVTSRPYTIEILQQALTFANEKNPDLYLTQPSLMNMMKQAGYKTFWITNQQTMTARNTMLTVFSRQTDKQYYMNQQRTQSAREYDTNVLKPFQEVLNDPAPKKLIIVHLLGTHIKYKYRYPENQGKFDGNTDHVPPGLNAEELESYNDYDNANLYNDHVVASLIKDFKAANPNGFLVYFSDHGEEVYDTPPHKTQGRNEDNPTRHMYTIPFLLWTSEKWQATHPRDFSQDVDRKYSLAELIHTWSDLAGLSYDGYDPTRSVVNPQFKETTRWIGNPYKKNALIDYDTLPYGDQVGNQ\n>4eqh_A mol:protein length:128  Histidine triad nucleotide-binding protein 1\nSLMADEIAKAQVARPGGDTIFGKIIRKEIPAKIIFEDDRCLAFHDISPQAPTHFLVIPKKHISQISVAEDDDESLLGHLMIVGKKCAADLGLNKGYRMVVNEGSDGGQSVYHVHLHVLGGRQMHWPPG\n>7mjk_F mol:protein length:244  Fab ab1 Heavy Chain\nEVQLVESGGGLVQPGGSLRLSCAASGFTVSSNYMSWVRQAPGKGLEWVSVIYSGGSTYYADSVKGRFTISRHNSKNTLYLQMNSLRAEDTAVYYCARGYGDYYFDYWGQGTLVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDKTSGQAGHHHHHHGDYKDDDDKG\n>5p35_A mol:protein length:330  endothiapepsin\nSTGSATTTPIDSLDDAYITPVQIGTPAQTLNLDFDTGSSDLWVFSSETTASEVDGQTIYTPSKSTTAKLLSGATWSISYGDGSSSSGDVYTDTVSVGGLTVTGQAVESAKKVSSSFTEDSTIDGLLGLAFSTLNTVSPTQQKTFFDNAKASLDSPVFTADLGYHAPGTYNFGFIDTTAYTGSITYTAVSTKQGFWEWTSTGYAVGSGTFKSTSIDGIADTGTTLLYLPATVVSAYWAQVSGAKSSSSVGGYVFPCSATLPSFTFGVGSARIVIPGDYIDFGPISTGSSSCFGGIQSSAGIGINIFGDVALKAAFVVFNGATTPTLGFASK\n>3j3y_9P mol:protein length:231  capsid 
protein\nPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIEPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVL\n>2wq5_A mol:protein length:119  PHOSPHOLIPASE A2, ACIDIC\nNLYQFKNMIKCTVPSRSWWDFADYGCYCGRGGSGTPVDDLDRCCQVHDNCYNEAEKISKCWPFFKTYSYKCSQGTLTCKGGNNACAASVCDCDRLAAICFAGAPYNDNNYNIDLKARCQ\n>5ot7_H mol:protein length:127  30S ribosomal protein S9\nEQYYGTGRRKEAVARVFLRPGNGKVTVNGQDFNEYFQGLVRAVAALEPLRAVDALGHFDAYITVRGGGKSGQIDAIKLGIARALVQYNPDYRAKLKPLGFLTRDARVVERKKYGKHKARRAPQYSKR\n>3iml_D mol:protein length:399  S-adenosylmethionine synthetase\nGPGSMANDYLFTSESVSEGHPDKVADQISDAILDAILAQDKYSRVAAETLCNTGLVVLAGEITTTANIDYIQIARDTIKRIGYDNTDYGIDYRGCAVLVAYDKQSPDIAQGVDRAHDNNLDQGAGDQGLMFGYACDETPELMPLPIHLSHRLVERQANLRRDGRLPWLRPDAKSQVTVRYVDGKPHSIDTVVLSTQHAPEIDLPALREAVIEEVIKPTLPADLIKGDIKFLVNPTGRFVIGGPQGDCGLTGRKIIVDTYGGAAPHGGGAFSGKDPSKVDRSAAYAGRYVAKNIVAAGLASRALIQVSYAIGVAEPTSVMVNTFGTGRVSDETITKLVREHFDLRPKGIIQMLDLLRPIYEKTAAYGHFGREEPEFSWEAADKALALAEAAGVEPAVQVA\n>6gsl_H5 mol:protein length:60  50S ribosomal protein L30\nMPRLKVKLVKSPIGYPKDQKAALKALGLRRLQQERVLEDTPAIRGNVEKVAHLVRVEVVE\n>3j3q_4p mol:protein length:231  capsid protein\nPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIEPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVL\n>5u23_A mol:protein length:382  Putative aminotransferase\nMGSSHHHHHHSSRNLYFQGGGHMFFLNLKQINDRFNTEFITKFKEILESGWYILGKQCEKFENNFAKYCGVKHCIGVANGLDALRLIIKAYDFKENDEIIVPANTYIASILAITDNKCKPILIEPDINTYNINPDLIEEKITKKTKAIMVVHLYGQVCDMEKIQLLANKYNLKIIEDCAQAHGAIYKDKRVGNLGDAAGFSFYPGKNLGALGDAGCICTNDDNFASKIRALANYGSHKKYENLYTGLNSRLDEIQAAFLDIKLKYLDEDNNKRKNIANFYLQNIKNENIILPSNKFDHVWHLFVVKTKLRDELQHYLNNHDIQTIIHYPIPPHKQKCYKDLNHLKLPITENIHQEVLSLPISPTMKENDFKKVADILNKWKV\n>6i7v_C5 mol:protein length:45  50S ribosomal protein L36 
2\nMKVLNSLRTAKERHPDCQIVKRKGRLYVICKSNPRFKAVQGRKKK\n>6mrc_2 mol:protein length:100  10 kDa heat shock protein, mitochondrial\nGQAFRKFLPLFDRVLVERSAAETVTKGGIMLPEKSQGKVLQATVVAVGSGSKGKGGEIQPVSVKVGDKVLLPEYGGTKVVLDDKDYFLFRDGDILGKYVD\n>5jw4_B mol:protein length:162  Hemagglutinin\nGLFGAIAGFIEGGWQGMVDGWYGYHHSNEQGSGYAADKESTQKAIDGVTNKVNSIIDKMNTQFEAVGREFNNLERRIENLNKKMEDGFLDVWTYNAELLVLMENERTLDFHDSNVKNLYDKVRLQLRDNAKELGNGCFEFYHKCDNECMESVRNGTYDYPQY\n>6rjh_P mol:protein length:171  Ferritin light chain\nSQIRQNYSTEVEAAVNRLVNLYLRASYTYLSLGFYFDRDDVALEGVCHFFRELAEEKREGAERLLKMQNQRGGRALFQDLQKPSQDEWGTTLDAMKAAIVLEKSLNQALLDLHALGSAQADPHLCDFLESHFLDEEVKLIKKMGDHLTNIQRLVGSQAGLGEYLFERLTLK\n>6ch9_G mol:protein length:518  Envelope glycoprotein gp120\nMDAMKRGLCCVLLLCGAVFVSPSQEIHARFRRGARAAKKWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEIVLGNVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCNNVNTNNTNNSTNATISDWEKMETGEMKNCSFNVTTSIRDKIKKEYALFYKLDVVPLENKNNINNTNITNYRLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNSKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENITDNAKTIIVQLNEAVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGNIRQAHCNISKARWNETLGQIVAKLEEQFPNKTIIFNHSSGGDPEIVTHSFNCGGEFFYCNTTPLFNSTWNNTRTDDYPTGGEQNITLQCRIKQIINMWQGVGKAMYAPPIRGQIRCSSNITGLLLTRDGGRDQNGTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTACKRRVVQ\n>1w76_B mol:protein length:543  ACETYLCHOLINESTERASE\nDDHSELLVNTKSGKVMGTRVPVLSSHISAFLGIPFAEPPVGNMRFRRPEPKKPWSGVWNASTYPNNCQQYVDEQFPGFSGSEMWNPNREMSEDCLYLNIWVPSPRPKSTTVMVWIYGGGFYSGSSTLDVYNGKYLAYTEEVVLVSLSYRVGAFGFLALHGSQEAPGNVGLLDQRMALQWVHDNIQFFGGDPKTVTIFGESAGGASVGMHILSPGSRDLFRRAILQSGSPNCPWASVSVAEGRRRAVELGRNLNCNLNSDEELIHCLREKKPQELIDVEWNVLPFDSIFRFSFVPVIDGEFFPTSLESMLNSGNFKKTQILLGVNKDEGSFFLLYGAPGFSKDSESKISREDFMSGVKLSVPHANDLGLDAVTLQYTDWMDDNNGIKNRDGLDDIVGDHNVICPLMHFVNKYTKFGNGTYLYFFNHRASNLVWPEWMGVIHGYEIEFVFGLPLVKELNYTAEEEALSRRIMHYWATFAKTGNPNEPHSQESKWPLFTTKEQKFIDLNTEPMKVHQRLRVQMCVFWNQFLPKLLNATACDGELSS\n>7tk0_O mol:protein length:195  ATP synthase subunit 
5\nASKAAAPPPVRLFGVEGTYATALYQAAAKNSSIDAAFQSLQKVESTVKKNPKLGHLLLNPALSLKDRNSVIDAIVETHKNLDGYVVNLLKVLSENNRLGCFEKIASDFGVLNDAHNGLLKGTVTSAEPLDPKSFKRIEKALSASKLVGQGKSLKLENVVKPEIKGGLIVELGDKTVDLSISTKIQKLNKVLEDSI\n>5ap8_C mol:protein length:166  TSR3\nMKVYIIDYHKDDPKRCTGKKLVKLKIAEFTRVGKGVVLDPFAQITLSNKDKDIVRRIGITIVDTSWNNTSQSEFKNIRGEHRRIPILFAGNPIHYGIAYKLSSIEALIATLYIVDEVEEAIKLSNVVKWGHTFIELNKELLEAYKNKTEEDIKKIEREIIEKILEK\n>5qfe_A mol:protein length:321  Tyrosine-protein phosphatase non-receptor type 1\nMEMEKEFEQIDKSGSWAAIYQDIRHEASDFPSRVAKLPKNKNRNRYRDVSPFDHSRIKLHQEDNDYINASLIKMEEAQRSYILTQGPLPNTVGHFWEMVWEQKSRGVVMLNRVMEKGSLKCAQYWPQKEEKEMIFEDTNLKLTLISEDIKSYYTVRQLELENLTTQETREILHFHYTTWPDFGVPESPASFLNFLFKVRESGSLSPEHGPVVVHCSAGIGRSGTFCLADTCLLLMDKRKDPSSVDIKKVLLEMRKFRMGLIQTADQLRFSYLAVIEGAKFIMGDSSVQDQWKELSHEDLEPPPEHIPPPPRPPKRILEPHN\n>5xhz_A mol:protein length:66  SH3 domain-containing kinase-binding protein 1\nGPGSEFRRRRRCQVAFSYLPQNDDELELKVGDIIEVVGEVEEGWWEGVLNGKTGMFPSNFIKELSG\n>5ndg_C7 mol:protein length:136  40S ribosomal protein S17-A\nMGRVRTKTVKRASKALIERYYPKLTLDFQTNKRLCDEIATIQSKRLRNKIAGYTTHLMKRIQKGPVRGISFKLQEEERERKDQYVPEVSALDLSRSNGVLNVDNQTSDLVKSLGLKLPLSVINVSAQRDRRYRKRV\n>5lzd_e mol:protein length:157  30S ribosomal protein S5\nELQEKLIAVNRVSKTVKGGRIFSFTALTVVGDGNGRVGFGYGKAREVPAAIQKAMEKARRNMINVALNNGTLQHPVKGVHTGSRVFMQPASEGTGIIAGGAMRAVLEVAGVHNVLAKAYGSTNPINVVRATIDGLENMNSPEMVAAKRGKSVEEILG\n>5anb_E mol:protein length:136  60S RIBOSOMAL PROTEIN L23\nMSKAQAVGSNYRVSLGLPVGAVMNSADNSGAKNLYVIAVKGIKGRLNRLPSAGVGDMVMATVKKGKPELRKKVCTGLVVRQRKHWKRKDGVYIYFEDNAGVMCNPKGEVKGNILGPVAKECSDLWPKVATNAGTIV\n>6ydw_Bj mol:protein length:279  Mitochondrial ribosomal protein L46\nMAAPVRRTMLRVVRGWRRFEGPWAHSLGSRNLALAVAPSSSSSPWRLLGALCLQRPPLVTKPLTPLQEEMADLLQQIEIERSLYSDHELRALDEAQQLAKKKSDLYEEEDEQNILLAQDLEDMWEQKFLHFKLGARLTEADKKDDRTSLHRKLDRNLILLVREKLGDQDIWMLPQSDWQPGETLRQTAERTLATLSENNMEAKFLGNAPCGHYKFKFPQAMRTETSLGAKVFFFKALLLTGDFSQAGKKGHHVWVSKEELGDYLKPKYLAQVRRFLLDL\n>3jbt_N mol:protein length:105  Cytochrome 
c\nMGDVEKGKKIFVQKCAQCHTVEKGGKHKTGPNLHGLFGRKTGQAPGFTYTDANKNKGITWKEETLMEYLENPKKYIPGTKMIFAGIKKKTEREDLIAYLKKATNE\n>1htq_N mol:protein length:477  glutamine synthetase\nTEKTPDDVFKLAKDEKVEYVDVRFCDLPGIMQHFTIPASAFDKSVFDDGLAFDGSSIRGFQSIHESDMLLLPDPETARIDPFRAAKTLNINFFVHDPFTLEPYSRDPRNIARKAENYLISTGIADTAYFGAEAEFYIFDSVSFDSRANGSFYEVDAISGWWNTGAATEADGSPNRGYKVRHKGGYFPVAPNDQYVDLRDKMLTNLINSGFILEKGHHEVGSGGQAEINYQFNSLLHAADDMQLYKYIIKNTAWQNGKTVTFMPKPLFGDNGSGMHCHQSLWKDGAPLMYDETGYAGLSDTARHYIGGLLHHAPSLLAFTNPTVNSYKRLVPGYEAPINLVYSQRNRSACVRIPITGSNPKAKRLEFRSPDSSGNPYLAFSAMLMAGLDGIKNKIEPQAPVDKDLYELPPEEAASIPQTPTQLSDVIDRLEADHEYLTEGGVFTNDLIETWISFKRENEIEPVNIRPHPYEFALYYDV\n>1sor_A mol:protein length:235  Aquaporin-0\nRSASFWRAIFAEFFATLFYVFFGLGASLRWAPGPLHVLQVALAFGLALATLVQAVGHISGAHVNPAVTFAFLVGSQMSLLRAICYVVAQLLGAVAGAAVLYSVTPPAVRGNLALNTLHPGVSVGQATIVEIFLTLQFVLCIFATYDERRNGRLGSVALAVGFSLTLGHLFGMYYTGAGMNPARSFAPAILTRNFTNHWVYWVGPVIGAGLGSLLYDFLLFPRLKSVSERLSILKG\n>6dv5_A mol:protein length:205  Heat shock protein beta-1\nMTERRVPFSLLRGPSWDPFRDWYPHSRLFDQAFGLPRLPEEWSQWLGGSSWPGYVRPLPPAAIESPAVAAPAYSRALSRQLSSGVSEIRHTADRWRVSLDVNHFAPDELTVKTKDGVVEITGKHEERQDEHGYISRCFTRKYTLPPGVDPTQVSSSLSPEGTLTVEAPMPKLATQSNEITIPVTFESRAQLGGPEAAKSDETAAK\n>5dat_c1 mol:protein length:155  40S ribosomal protein S11-A\nSTELTVQSERAFQKQPHIFNNPKVKTSKRTKRWYKNAGLGFKTPKTAIEGSYIDKKCPFTGLVSIRGKILTGTVVSTKMHRTIVIRRAYLHYIPKYNRYEKRHKNVPVHVSPAFRVQVGDIVTVGQCRPISKTVRFNVVKVSAAAGKANKQFAKF\n>1o1e_2 mol:protein length:375  SKELETAL MUSCLE ACTIN\nDEDETTALVCDNGSGLVKAGFAGDDAPRAVFPSIVGRPRHQGVMVGMGQKDSYVGDEAQSKRGILTLKYPIEHGIITNWDDMEKIWHHTFYNELRVAPEEHPTLLTEAPLNPKANREKMTQIMFETFNVPAMYVAIQAVLSLYASGRTTGIVLDSGDGVTHNVPIYEGYALPHAIMRLDLAGRDLTDYLMKILTERGYSFVTTAEREIVRDIKEKLCYVALDFENEMATAASSSSLEKSYELPDGQVITIGNERFRCPETLFQPSFIGMESAGIHETTYNSIMKCDIDIRKDLYANNVMSGGTTMYPGIADRMQKEITALAPSTMKIKIIAPPERKYSVWIGGSILASLSTFQQMWITKQEYDEAGPSIVHRKCF\n>5b02_A mol:protein length:343  MoeN5,DNA-binding protein 
7d\nMAHHHHHHVDDDDKMLAAEAANRDHVTRCVAQTGGSPDLVAHTAALRLYLRVPHFLTEWTTDPDRRAAVSRALALDIVSMKLLDDLMDDDTGLDRVELACVCLRLHLRALHELESLARDPKAVTDILEQDAVHLCGGQIRTKRSRATNLREWRAHASTYGSTFLGRYGALAAACGGEGQPADSVREFAEAFAMTITMADDLTDYDRNGERDGNLAHLMRTGAVAGQDVVDLLEELRGRALAAVAAPPGAPGLVPVVHLYTDDVLVRLLPRHLGEAGAGAMATVKFKYKGEEKEVDISKIKKVWRVGKMISFTYDEGGGKTGRGAVSEKDAPKELLQMLEKQKK\n>6r4o_A mol:protein length:1533  Adenylate cyclase 9\nMASPPHQQLLQHHSTEVSCDSSGDSNSVRVRINPKQPSSNSHPKHCKYSISSSCSSSGDSGGVPRRMGAGGRLRRRKKLPQLFERASSRWWDPKFDSVNLEEACMERCFPQTQRRFRYALFYIGFACLLWSIYFGVHMKSKLIVMVAPALCFLVVCVGFFLFTFTKLYARHYVWTSLVLTLLVFALTLAAQFQVLTPLSGRVDNFNHTRAARPTDTCLSQVGSFSMCIEVLFLLYTVMHLPLYLSLILGVAYSVLFETFGYHFQDEACFASPGAEALHWELLSRALLHLCIHAIGIHLFIMSQVRSRSTFLKVGQSIMHGKDLEVEKALKERMIHSVMPRIIADDLMKQGDEESENSVKRHATSSPKNRKKKSSIQKAPIAFRPFKMQQIEEVSILFADIVGFTKMSANKSAHALVGLLNDLFGRFDRLCEETKCEKISTLGDCYYCVAGCPEPRADHAYCCIEMGLGMIRAIEQFCQEKKEMVNMRVGVHTGTVLCGILGMRRFKFDVWSNDVNLANLMEQLGVAGKVHISEATAKYLDDRYEMEDGKVTERLGQSVVADQLKGLKTYLIAGQRAKESHCSCSEALLSGFEVLDGSRVSSGPRGQGTASPGSVSDLAQTVKTFDNLKTCPSCGITFTPKPEAGAEGGAVQNGCQEEPKNSAKASGGPSSKTQNGLLSPPPEEKLTNSQTSLCEILQEKGRWAGVSLDQSALLPLRFKNIREKTDAHFVDVIKEDSLMKDYFFKPPINQFSLNFLDPELERAYRTSYQEEVVKSSPVRTFASATFSSLLDVLLSTTVFLILSITCFLRYGAASTPPPPAALAVFGAALLLEILSLVVSVRMVFFLEDVMTCTKRLLEWIAGWLPRHFIGAILVSLPALAVYSHVTSEFETNIHSTMFTGSAVLTAVVQYCNFCQLSSWMRSSLATVVGAGPLLLLLYVSLCPDSSTVISHLDAVQNFSSTRKLCNASLPHDGRSPASLIGQEVILVFFLLLLLVWFLNREFEVSYRLHYHGDVEADLHRTKIQSMRDQADWLLRNIIPYHVAEQLKVSQTYSKNHDSGGVIFASIVNFSEFYEENYEGGKECYRVLNELIGDFDELLSKPDYSSIEKIKTIGATYMAASGLNATQCRDGSHPQEHLQILFEFAKEMMRVVDDFNNNMLWFNFKLRVGFNHGPLTAGVIGTTKLLYDIWGDTVNIASRMDTTGVECRIQVSEESYRVLSKMGYEFDYRGTVNVKGKGQMKTYLYPKCTDSGAAALEVLFQGPGGVSKGEELFTGVVPILVELDGDVNGHKFSVSGEGEGDATYGKLTLKFICTTGKLPVPWPTLVTTFGYGLQCFARYPDHMKQHDFFKSAMPEGYVQERTIFFKDDGNYKTRAEVKFEGDTLVNRIELKGIDFKEDGNILGHKLEYNYNSHNVYIMADKQKNGIKVNFKIRHNIEDGSVQLADHYQQNTPIGDGPVLLPDNHYLSYQSALSKDPNEKRDHMVLLEFVTAAGITLGMDELYKAASAWSHPQFEKGGGSGGGSGGSAWSHPQFEK\n>7ac8_E mol:protein length:253  Imidazole glycerol phosphate 
synthase subunit HisF\nMLAKRIIACLDVKDGRVVKGTNFENLRDSGDPVELGKFYSEIGIDELVFLDITASVEKRKTMLELVEKVAEQIDIPFTVGGGIHDFETASELILRGADKVSINTAAVENPSLITQIAQTFGSQAVVVAIDAKRVDGEFMVFTYSGKKNTGILLRDWVVEVEKRGAGEILLTSIDRDGTKSGYDTEMIRFVRPLTTLPIIASGGAGKMEHFLEAFLAGADAALAASVFHFREIDVRELKEYLKKHGVNVRLEGL\n>7l88_D mol:protein length:498  BG505 SOSIP MD39 - gp120\nMGILPSPGMPALLSLVSLLMGCVAETGAENLWVTVYYGVPVWKDAETTLFCASDAKAYETKKHNVWATHCCVPTDPNPQEIHLENVTEEFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLQCTNVTNNITDDMRGELKNCSFNMTTELRDKKQKVYSLFYRLDVVQINENQGNRSNNSNKEYRLINCNTSAITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGTGPCPSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVIIRSENITNNAKNILVQLNTPVQINCTRPNNNTVKSIRIGPGQWFYYTGDIIGDIRQAHCNVSKATWNETLGKVVKQLRKHFGNNTIIRFAQSSGGDLEVTTHSFNCGGEFFYCNTSGLFNSTWISNTSVQGSNSTGSNDSITLPCRIKQIINMWQRIGQAMYAPPIQGVIRCVSNITGLILTRDGGSTNSTTETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTRCKR\n>1v9w_A mol:protein length:130  putative 42-9-9 protein\nGSEGAATMATFEEVSVLGFEEFDKAVKEHESKTIFAYFSGSKDTEGKSWCPDCVEAEPVIREGLKHVTEDCVFIYCQVGDKPYWKDPNNDFRQKLKITAVPTLLKYGTPQKLVESECCQSSLVEMIFSED\n>7uck_M mol:protein length:138  60S ribosomal protein L14\nVFRRFVEVGRVAYVSFGPHAGKLVAIVDVIDQNRALVDGPCTRVRRQAMPFKCMQLTDFILKFPHSARQKYVRKAWEKADINTKWAATRWAKKIEARERKAKMTDFDRYKVMKAKKMRNRIIKNEVKKLQRAALLKAS\n>4v9j_BU mol:protein length:117  50S ribosomal protein L20\nPRAKTGVVRRRKHKKILKLAKGYWGLRSKSFRKARETLFAAGNYAYAHRKRRKRDFRRLWIVRINAACRQHGLNYSTFIHGLKKAGIEVDRKNLADLAVREPQVFAELVERAKAAQG\n>2cvl_D mol:protein length:124  protein translation initiation inhibitor\nMEAVKTDRAPAAIGPYAQAVKAGGFVFVSGQIPLAPDGSLVEGDIRVQTERVMENLKAVLEAAGSGLSRVVQTTCFLADMEDFPGFNEVYARYFTPPYPARATVAVKALPRGVRVEVACVALAE\n>1joj_R mol:protein length:8  HEXAPEPTIDE\nXMYWYPYX\n>6w83_A mol:protein length:312  Potassium channel subfamily K member 
2\nMSFSSKPTVLASRVESDSAINVMKWKTVSTIFLVVVLYLIIGATVFKALEQPQEISQRTTIVIQREKFLRAHPCVSDQELDELIQQIVAAINAGIIPLGASSNQVSHWDLGSSFFFAGTVITTIGFGNISPRTEGGKIFCIIYALLGIPLFGFLLAGVGDQLGTIFGKGIAKVEDTFIKWNVSQTKIRIISTIIFILFGCVLFVALPAVIFKHIEGWSALDAIYFVVITLTTIGFGDYVAGGSDIEYLDFYKPVVWFWILVGLAYFAAVLSMIGDWLRVIAKKTKEAVGEFRAHAAEWTANVTSNSLEVLFQ\n>3ijj_B mol:protein length:114  Macrophage migration inhibitory factor\nPMFIVNTNVPRASVPDGFLSELTQQLAQATGKPPQYIAVHVVPDQLMAFGGSSEPCALCSLHSIGKIGGAQNRSYSKLLCGLLAERLRISPDRVYINYYDMNAANVGWNNSTFA\n>5c54_F mol:protein length:312  Dihydrodipicolinate synthase/N-acetylneuraminate lyase\nMASATFTGVIPPVMTPLHADGSVDVESLRKLVDHLINGGVDGLFALGSSGEAAFLTRAQRKLALTTIIEHTAGRVPVTAGVIETTTARVIELVEDALEAGAEGLVATAPFYTRTHDVEIEEHFRKIHAAAPELPLFAYNIPVSVHSNLNPVMLLTLAKDGVLAGTKDSSGNDGAIRSLIEARDDAGLTEQFKILTGSETTVDFAYLAGADGVVPGLGNVDPAAYAALAKLCLDGKWAEAAALQKRINHLFHIVFVGDTSHMSGSSAGLGGFKTALAHLGIIESNAMAVPHQSLSDEETARIHAIVDEFLYTA\n>6kuo_A mol:protein length:300  Poly(ethylene terephthalate) hydrolase\nMGSSHHHHHHSSGLVPRGSHMRGPNPTAASLEASAGPFTVRSFTVSRPSGYGAGTVYYPTNAGGTVGAIAIVPGYTARQSSIKWWGPRLASHGFVVITIDTNSTLDQPSSRSSQQMAALRQVASLNGTSSSPIYGKVDTARMGVMGWSMGGGGSLISAANNPSLKAAAPQAPWDSSTNFSSVTVPTLIFACENDSIAPVNSSALPIYDSMSRNAKQFLEINGGSHSCANSGNSDQALIGKKGVAWMKRFMDNDTRYSTFACENPNSTRVSDFRTANCSLEDPAANKARKEAELAAATAEQ\n>1dmh_B mol:protein length:311  CATECHOL 1,2-DIOXYGENASE\nMEVKIFNTQDVQDFLRVASGLEQEGGNPRVKQIIHRVLSDLYKAIEDLNITSDEYWAGVAYLNQLGANQEAGLLSPGLGFDHYLDMRMDAEDAALGIENATPRTIEGPLYVAGAPESVGYARMDDGSDPNGHTLILHGTIFDADGKPLPNAKVEIWHANTKGFYSHFDPTGEQQAFNMRRSIITDENGQYRVRTILPAGYGCPPEGPTQQLLNQLGRHGNRPAHIHYFVSADGHRKLTTQINVAGDPYTYDDFAYATREGLVVDAVEHTDPEAIKANDVEGPFAEMVFDLKLTRLVDGVDNQVVDRPRLAV\n>3j3q_53 mol:protein length:231  capsid protein\nPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIEPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVL\n>6q8y_BH mol:protein length:172  60S ribosomal protein 
L20-A\nMAHFKEYQVIGRRLPTESVPEPKLFRMRIFASNEVIAKSRYWYFLQKLHKVKKASGEIVSINQINEAHPTKVKNFGVWVRYDSRSGTHNMYKEIRDVSRVAAVETLYQDMAARHRARFRSIHILKVAEIEKTADVKRQYVKQFLTKDLKFPLPHRVQKSTKTFSYKRPSTFY\n>7wu9_S mol:protein length:255  scFv16\nDVQLVESGGGLVQPGGSRKLSCSASGFAFSSFGMHWVRQAPEKGLEWVAYISSGSGTIYYADTVKGRFTISRDDPKNTLFLQMTSLRSEDTAMYYCVRSIYYYGSSPFDFWGQGTTLTVSSGGGGSGGGGSGGGGSDIVMTQATSSVPVTPGESVSISCRSSKSLLHSNGNTYLYWFLQRPGQSPQLLIYRMSNLASGVPDRFSGSGSGTAFTLTISRLEAEDVGVYYCMQHLEYPLTFGAGTKLELKGENLYFQ\n>1rxo_H mol:protein length:475  RIBULOSE BISPHOSPHATE CARBOXYLASE/OXYGENASE\nMSPQTETKASVGFKAGVKDYKLTYYTPEYETLDTDILAAFRVSPQPGVPPEEAGAAVAAESSTGTWTTVWTDGLTNLDRYKGRCYHIEPVAGEENQYICYVAYPLDLFEEGSVTNMFTSIVGNVFGFKALRALRLEDLRIPVAYVKTFQGPPHGIQVERDKLNKYGRPLLGCTIKPKLGLSAKNYGRAVYECLRGGLDFTKDDENVNSQPFMRWRDRFLFCAEALYKAQAETGEIKGHYLNATAGTCEDMMKRAVFARELGVPIVMHDYLTGGFTANTTLSHYCRDNGLLLHIHRAMHAVIDRQKNHGMHFRVLAKALRLSGGDHIHSGTVVGKLEGERDITLGFVDLLRDDYTEKDRSRGIYFTQSWVSTPGVLPVASGGIHVWHMPALTEIFGDDSVLQFGGGTLGHPWGNAPGAVANRVALEACVQARNEGRDLAREGNTIIREATKWSPELAAACEVWKEIKFEFPAMDTV\n>6lkh_A mol:protein length:294  ABC transporter, solute-binding protein\nNVLTVYSPYQSNLIRPILNEFEKQEHVKIEIKHGSTQVLLSNLHNEDFSERGDVFMGGVLSETIDHPEDFVPYQDTSVTQQLEDYRSNNKYVTSFLLMPTVIVVNSDLQGDIKIRGYQDLLQPILKGKIAYSNPNTTTTGYQHMRAIYSMHHRVSDVHQFQNHAMQLSKTSKVIEDVAKGKYYAGLSYEQDARTWKNKGYPVSIVYPIEGTMLNVDGIALVKNAHPHPKRKKLVQYLTSRSVQQRLVAEFDAKSIRKDVSEQSDQSIENLKNIPLIPKSKLPDIPHHKFLEMIQ\n>2pnv_A mol:protein length:43  Small conductance calcium-activated potassium channel protein 2\nGSHMNIMYDMISDLNERSEDFEKRIVTLETKLETLIGSIHALP\n>5uyk_Q mol:protein length:80  30S ribosomal protein S17\nKIRTLQGRVVSDKMEKSIVVAIERFVKHPIYGKFIKRTTKLHVHDENNECGIGDVVEIRECRPLSKTKSWTLVRVVEKAV\n>7mtw_q mol:protein length:518  Capsid protein 
VP1\nDGVGSSSGNWHCDSQWLGDRVITTSTRTWALPTYNNHLYKQISNSTSGGSSNDNAYFGYSTPWGYFDFNRFHCHFSPRDWQRLINNNWGFRPKRLNFKLFNIQVKEVTDNNGVKTIANNLTSTVQVFTDSDYQLPYVLGSAHEGCLPPFPADVFMIPQYGYLTLNDGSQAVGRSSFYCLEYFPSQMLRTGNNFQFSYEFENVPFHSSYAHSQSLDRLMNPLIDQYLYYLSKTINGSGQNQQTLKFSVAGPSNMAVQGRNYIPGPSYRQQRVSTTVTQNNNSEFAWPGASSWALNGRNSLMNPGPAMASHKEGEDRFFPLSGSLIFGKQGTGRDNVDADKVMITNEEEIKTTNPVATESYGQVATNHQSAQAQAQTGWVQNQGILPGMVWQDRDVYLQGPIWAKIPHTDGNFHPSPLMGGFGMKHPPPQILIKNTPVPADPPTAFNKDKLNSFITQYSTGQVSVEIEWELQKENSKRWNPEIQYTSNYYKSNNVEFAVNTEGVYSEPRPIGTRYLTRNL\n>7jg2_D mol:protein length:355  Igh protein\nWGQGTLVTVSAESARNPTIYPLTLPPALSSDPVIIGCLIHDYFPSGTMNVTWGKSGKDITTVNFPPALASGGRYTMSSQLTLPAVECPEGESVKCSVQHDSNPVQELDVNCSGPTPPPPITIPSCQPSLSLQRPALEDLLLGSDASITCTLNGLRNPEGAVFTWEPSTGKDAVQKKAVQNSCGCYSVSSVLPGCAERWNSGASFKCTVTHPESGTLTGTIAKVTVNTFPPQVHLLPPPSEELALNELLSLTCLVRAFNPKEVLVRWLHGNEELSPESYLVFEPLKEPGEGATTYLVTSVLRVSAETWKQGDQYSCMVGHEALPMNFTQKTIDRLSGKPTNVSVSVIMSEGDGICY\n>6boh_DA mol:protein length:54  50S ribosomal protein L33\nMASEVRIKLLLECTECKRRNYATEKNKRNTPNKLELRKYCPWCRKHTVHREVKI\n>6j3h_D mol:protein length:264  Glutathione S-transferase\nGLVPRGSHMIQQIHFYDIPRNRDEDDRTWNPNTSKTRLTLTYKRLPYKTIWVEYPDIERVCKEIGAEPSAFGLLKEGKPYYSLPVIHDPNTGTTISDSIRIARYLDKTYPDTPAVIPAELEAFHAVFEDAFWDTIFMPLFPFLVPAACPQLNPRSEAYFRETREGKFGSILGGKMENWAPTGPVRDDRWKALQAGFTKMAGWLSADGQERPFFMGEKLCYTDIVVGAWLISVKKVFGSDHPEWLQVEKWDGGRWSRLVQVVENF\n>3tty_C mol:protein length:675  
Beta-galactosidase\nMINEKFPKIWYGGDYNPEQWDKATMEEDMRMFNLAGIDVATVNVFSWAKIQRDEVSYDFTWLDDIIERLTKENIYLCLATSTGAHPAWMAKKYPDVLRVDYEGRKRKFGGRHNSCPNSPTYRKYAKILAGKLAERYKDHPQIVMWHVSNEYGGYCYCDNCEKQFRVWLKERYGTLEALNKAWNTSFWSHTFYDWDEIVAPNALSEEWSGNRTNFQGISLDYRRFQSDSLLECFKMERDELKRWTPDIPVTTNLMGFYPELDYFKWAKEMDVVSWDNYPSMDTPFSFTAMAHNLMRGLKSGQPFMLMEQTPGVQNWQPYNSAKRPGVMRLWSYQAVAHGADTVMFFQLRRSVGACEKYHGAVIEHVGHEHTRVFRECAELGKELQQLGDTILDARSEAKVAVMYDWENRWALELSSGPSIALNYVNEVHKYYDALYKQNIQTDMISVEEDLSKYKVVIAPVMYMVKPGFAERVERFVAQGGTFVTTFFSGIVNENDLVTLGGYPGELRNVMGIWAEEIDALLPGHQNEIVLRQDWGGLRGSYSCGILCDVIHAETAEVLAEYGADYYKGTPVLTRNKFGNGQSYYVASSPDADFLQGLIANLCEEQGVKPLLNTPDGVEVAERVKNGTSYLFVMNHNAEEMTFDAGASRQRDLLTGKTISGQATIPARGVMILERA\n>4adj_C mol:protein length:473  E1 ENVELOPE GLYCOPROTEIN\nEEAFTYLCTAPGCATQTPVPVRLAGVRFESKIVDGGCFAPWDLEATGACICEIPTDVSCEGLGAWVPTAPCARIWNGTQRACTFWAVNAYSSGGYAQLASYFNPGGSYYKQYHPTACEVEPAFGHSDAACWGFPTDTVMSVFALASYVQHPHKTVRVKFHTETRTVWQLSVAGVSCNVTTEHPFCNTPHGQLEVQVPPDPGDLVEYIMNYTGNQQSRWGLGSPNCHGPDWASPVCQRHSPDCSRLVGATPERPRLRLVDADDPLLRTAPGPGEVWVTPVIGSQARKCGLHIRAGPYGHATVEMPEWIHAHTTSDPWHPPGPLGLKFKTVRPVALPRALAPPRNVRVTGCYQCGTPALVEGLAPGGGNCHLTVNGEDVGAFPPGKFVTAALLNTPPPYQVSCGGESDRASARVIDPAAQSFTGVVYGTHTTAVSETRFEDDDDKAGWSHPQFEKGGGSGGGSGGGSWSHPQFEK\n>5d80_F mol:protein length:517  V-type proton ATPase subunit B\nMVLSDKELFAINKKAVEQGFNVKPRLNYNTVSGVNGPLVILEKVKFPRYNEIVNLTLPDGTVRQGQVLEIRGDRAIVQVFEGTSGIDVKKTTVEFTGESLRIPVSEDMLGRIFDGSGRPIDNGPKVFAEDYLDINGSPINPYARIYPEEMISTGVSAIDTMNSIARGQKIPIFSASGLPHNEIAAQICRQAGLVRPTKDVHDGHEENFSIVFAAMGVNLETARFFKQDFEENGSLERTSLFLNLANDPTIERIITPRLALTTAEYLAYQTERHVLTILTDMSSYADALREVSAAREEVPGRRGYPGYMYTDLSTIYERAGRVEGRNGSITQIPILTMPNDDITHPIPDLTGYITEGQIFVDRQLHNKGIYPPINVLPSLSRLMKSAIGEGMTRKDHGDVSNQLYAKYAIGKDAAAMKAVVGEEALSIEDKLSLEFLEKFEKTFITQGAYEDRTVFESLDQAWSLLRIYPKEMLNRISPKILDEFYDRARDDADEDEEDPDTRSSGKKKDASQEESLI\n>5fxy_H mol:protein length:85  METASTASIS-ASSOCIATED PROTEIN MTA1\nGAAMKTRQAFYLHTTKLTRIARRLCREILRPWHAARHPYLPINSAAIKAECTARLPEASQSPLVLKQAVRKPLEAVLRYLETHPR\n>1gav_5 mol:protein length:129  
BACTERIOPHAGE GA PROTEIN CAPSID\nATLRSFVLVDNGGTGNVTVVPVSNANGVAEWLSNNSRSQAYRVTASYRASGADKRKYTIKLEVPKIVTQVVNGVELPVSAWKAYASIDLTIPIFAATDDVTVISKSLAGLFKVGNPIAEAISSQSGFYA\n>6zkb_k mol:protein length:355  NADH dehydrogenase [ubiquinone] 1 alpha subcomplex subunit 10, mitochondrial\nMALRFLRLVPASAASRGLAAVPPRVGGIHTSVQRKLQYGPLAYILGEKTTKKMTENSKLITVDGNICSGKSKLAKEVAEKLGLKHFPEAGIHYADSTTGDGKPLPVRFSGNCSLEKFYDDPKSNDGNSYRLQAWLYASRLLQYADALEHLLSTGQGVVLERSIYSDFVFLEAMYRQGFIRKQCVDHYNQVKKVTVCEYLPPHVVIYVDVPVSEVQSRIQKKGNPHEMKITSAYLQDIENVYKGTFLPEMSEKCEVLQYSAWEAEDAEKVVEDIQYLKYDKGPWLDQDDRKLHNLRMLVQDKLEVLNYTSIPVFLPEVTIGAHQSDRVFQEFTELPGRKYRAGYNEDVGDKWIWLK\n>3kts_A mol:protein length:192  Glycerol uptake operon antiterminator regulatory protein\nMSLELPFSNQSIIPAAHNQKDMEKILELDLTYMVMLETHVAQLKALVKYAQAGGKKVLLHADLVNGLKNDDYAIDFLCTEICPDGIISTRGNAIMKAKQHKMLAIQRLFMIDSSAYNKGVALIQKVQPDCIELLPGIIPEQVQKMTQKLHIPVIAGGLIETSEQVNQVIASGAIAVTTSNKHLWEGHHHHHH\n>1tqb_C mol:protein length:219  VRQ14 Fab light chain\nDVVMSQTPLTLSVTIGQPASISCKSSQSLLDSDGKTYLNWLLQRPGQSPKRLIYLVSRLDSGVPDRFTGSGSGTDFTLKISRVEAEDLGIYFCWQGSHFPQTFGGGTKLEIKRADAAPTVSIFPPSSEQLTSGGASVVCFLNNFYPKDINVKWKIDGSERQNGVLNSWTDQDSKDSTYSMSSTLTLTKDEYERHNSYTCEATHKTSTSPIVKSFNRNEC\n>5tbw_l mol:protein length:361  60S ribosomal protein L4-A\nSRPQVTVHSLTGEATANALPLPAVFSAPIRPDIVHTVFTSVNKNKRQAYAVSEKAGHQTSAESWGTGRAVARIPRVGGGGTGRSGQGAFGNMCRGGRMFAPTKTWRKWNVKVNHNEKRYATASAIAATAVASLVLARGHRVEKIPEIPLVVSTDLESIQKTKEAVAALKAVGAHSDLLKVLKSKKLRAGKGKYRNRRWTQRRGPLVVYAEDNGIVKALRNVPGVETANVASLNLLQLAPGAHLGRFVIWTEAAFTKLDQVWGSETVASSKVGYTLPSHIISTSDVTRIINSSEIQSAIRPAGQATQKRTHVLKKNPLKNKQVLLRLNPYAKVFAAEKLGSKKAEKTGTKPAAVFTETLKHD\n>2z6i_B mol:protein length:332  Trans-2-enoyl-ACP reductase 
II\nMKTRITELLKIDYPIFQGGMAWVADGDLAGAVSKAGGLGIIGGGNAPKEVVKANIDKIKSLTDKPFGVNIMLLSPFVEDIVDLVIEEGVKVVTTGAGNPSKYMERFHEAGIIVIPVVPSVALAKRMEKIGADAVIAEGMEAGGHIGKLTTMTLVRQVATAISIPVIAAGGIADGEGAAAGFMLGAEAVQVGTRFVVAKESNAHPNYKEKILKARDIDTTISAQHFGHAVRAIKNQLTRDFELAEKDAFKQEDPDLEIFEQMGAGALAKAVVHGDVDGGSVMAGQIAGLVSKEETAEEILKDLYYGAAKKIQEEASRWTGVVRNDLEHHHHHH\n>6o7a_B mol:protein length:554  Ion channel CASTOR\nMAKGKSEVVEQNHTLILGWSDKLGSLLNQLAIANESLGGGTIAVMAERDKEDMELDIGKMEFDFKGTSVICRSGSPLILADLKKVSVSKARTIIVLAEDGNADQSDARALRTVLSLTGVKEGLRGHIVVEMSDLDNEVLVKLVGGDLVETVVAHDVIGRLMIQCARQPGLAQIWEDILGFENCEFYIKRWPQLDGMLFEDVLISFPAAIPCGIKVASYGGKIILNPDDSYVLQEGDEVLVIAEDDDTYAPAPLPMVRRGSLPKDFVYPKSPERILFCGWRRDMEDMITVLDASLAPDSELWMFNDVPEKEREKKLIDGGLDISRLENISLVNREGNAVIRRHLESLPLESFDSILILADESVEDSAIQADSRSLATLLLIRDIQARRLPYVAMASQTQGGNFSKGSWIGEMKQASDKTVIISEILDPRTKNLLSMSKISDYVLSNELVSMALAMVAEDRQINDVLEELFAEEGNEMHIRQADIYLREGEEMSFYEIMLRARQRREILIGYRLANAERAVINPPAKTGRRKWSLKDVFVVITEKEGSRSHHHHHH\n>3j3q_6T mol:protein length:231  capsid protein\nPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIEPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVL\n>7ls9_G mol:protein length:215  1-57 Fab light chain\nEIVLTQSPGTLSLSPGERATLSCRASQSVSSSYLAWYQQKPGQAPRLLIYGASSRATGIPDRFSGSGSGTDFTLTISRLEPEDFAVYYCQQYGSSPSTFGQGTKLEIKRTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC\n>2v2z_A mol:protein length:271  4-DIPHOSPHOCYTIDYL-2C-METHYL-D-ERYTHRITOL KINASE\nGSHMIKVLSPAKINLGLWVLGRLPSGYHEILTLYQEIPFYDEIYIREGVLRVETNIGIPQEENLVYKGLREFERITGIEINYSIFIQKNIPPGAGLGGGSSNLAVVLKKVNELLGSPLSEEELRELVGSISADAPFFLLGKSAIGRGKGEVLEPVETEISGKITLVIPQVSSSTGRVYSSLREEHFVTPEYAEEKIQRIISGEVEEIENVLGDIARELYPEINEVYRFVEYLGFKPFVSGSGSTVYFFGGASEELKKAAKMRGWKVVELEL\n>2jhu_B mol:protein length:138  RHO GDP-DISSOCIATION INHIBITOR 
1\nAMVPNVVVTGLTLVCSSAPGPLELDLTGDLESFKKQSFVLKEGVEYRIKISFRVNREIVSGMKYIQHTYRKGVKIDKTDYMVGSYGPRAAAYEFLTPVEEAPKGMLARGSYSIKSRFTDDDKTDHLSWEWNLTIKKDW\n>6bet_A mol:protein length:12  H(DPR)(DVA)CIP(DPR)E(DLY)VC(DGL)\nHPVCIPPEKVCE\n>7r3v_D mol:protein length:239  Cytochrome c1, heme protein, mitochondrial\nDLELHPPSYPWSHRGLLSSLDHTSIRRGFQVYKQVCSSCHSMDYVAYRHLVGVCYTEDEAKALAEEVEVQDGPNEDGEMFMRPGKLSDYFPKPYPNPEAARAANNGALPPDLSYIVRARHGGEDYVFSLLTGYCEPPTGVSLREGLYFNPYFPGQAIGMAPPIYNEVLEFDDGTPATMSQVAKDVCTFLRWAAEPEHDHRKRMGLKMLLMMGLLLPLVYAMKRHKWSVLKSRKLAYRPP\n>3e21_A mol:protein length:45  FAS-associated factor 1\nGSMDREMILADFQACTGIENIDEAITLLEQNNWDLVAAINGVIPQ\n>6gcv_C mol:protein length:146  Chemotaxis transducer\nSGLVPAGSHMYLSMSISPETINVAGAQRMLSQKMAREALQLRLGAGDPKALAATIAQYERSAADLDAGNAERNVSRMGAPEIAAQRQKVAQIWGRYRAMLDQVAQPASQVDLRGFSQYSTELLGELNNLVSLMSARADSVQHTQMW\n>6ev1_A mol:protein length:220  Heavy chain\nEVQLQQSGAELAKPGASVKMSCKASGYTFTSYWMHWVKQRPGQGLEWIGYINPSTGYTEYNQKFKDKATLTADKSSSTAYMQLSSLTSEDSAVYYCAPLWPLGTDYWGQGTTLTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSC\n>6pbz_D mol:protein length:494  Guanosine-5'-triphosphate,3'-diphosphate pyrophosphatase\nMGSTSSLYAAIDLGSNSFHMLVVREVAGSIQTLTRIKRKVRLAAGLNSENALSNEAMERGWQCLRLFAERLQDIPPSQIRVVATATLRLAVNAGDFIAKAQEILGCPVQVISGEEEARLIYQGVAHTTGGADQRLVVDIGGASTELVTGTGAQTTSLFSLSMGCVTWLERYFADRNLGQENFDAAEKAAREVLRPVADELRYHGWKVCVGASGTVQALQEIMMAQGMDERITLEKLQQLKQRAIHCGRLEELEIDGLTLERALVFPSGLAILIAIFTELNIQCMTLAGGALREGLVYGMLHLAVEQDIRSRTLRNIQRRFMIDIDQAQRVAKVAANFFDQVENEWHLEAISRDLLISACQLHEIGLSVDFKQAPQHAAYLVRNLDLPGFTPAQKKLLATLLLNQTNPVDLSSLHQQNAVPPRVAEQLCRLLRLAIIFASRRRDDLVPEMTLQANHELLTLTLPQGWLTQHPLGKEIIAQESQWQSYVHWPLEVH\n>5k00_A mol:protein length:335  Maternal embryonic leucine zipper 
kinase\nMDYDELLKYYELHETIGTGGFAKVKLACHILTGEMVAIKIMDKNTLGSDLPRIKTEIEALKNLRHQHICQLYHVLETANKIFMVLEYCPGGELFDYIISQDRLSEEETRVVFRQIVSAVAYVHSQGYAHRDLKPENLLFDEYHKLKLIDFGLCAKPKGNKDYHLQTCCGSLAYAAPELIQGKSYLGSEADVWSMGILLYVLMCGFLPFDDDNVMALYKKIMRGKYDVPKWLSPSSILLLQQMLQVDPKKRISMKNLLNHPWIMQDYNYPVEWQSKNPFIHLDDDCVTELSVHHRNNRQTMEDLISLWQYDHLTATYLLLLAKKARGKPVHHHHHH\n>7xtb_R mol:protein length:584  Soluble cytochrome b562,5-hydroxytryptamine receptor 6\nDYKDDDDAKLQTMHHHHHHHHHHHHHHHADLEDNWETLNDNLKVIEKADNAAQVKDALTKMRAAALDAQKATPPKLEDKSPDSPEMKDFRHGFDILVGQIDDALKLANEGKVKEAQAAAEQLKTTRNAYIQKYLASENLYFQGGTVPEPGPTANSTPAWGAGPPSAPGGSGWVAAALCVVIALTAAANSLLIALICTQPALRNTSNFFLVSLFTSDLMVGLVVMPPAMLNALYGRWVLARGLCLLWTAFDVMCCSASILNLCLISLDRYLLILSPLRYKLRMTPLRALALVLGAWSLAALASFLPLLLGWHELGHARPPVPGQCRLLASLPFVLVASGLTFFLPSGAICFTYCRILLAARKQAVQVASLTTGMASQASETLQVPRTPRPGVESADSRRLATKHSRKALKASLTLGILLGMFFVTWLPFFVANIVQAVCDCISPGLFDVLTWLGYCNSTMNPIIYPLFMRDFKRALGRFLPCPRCPRERQASLASPSLRTSHSGPRPGLSLQQVLPLPLPPDSDSDSDAGSGGSSGLRLTAQLLLPGEATQDPPLPTRAAAAVNFFNIDPAEPELRPHPLGIPTN\n>6y35_C mol:protein length:119  CCAAT-binding factor complex subunit HapE\nMGTWANVNQGLQGTARDILTTYWQHIINHLESDNHDYKIHQLPLARIKKVMKADPEVKMISAEAPILFAKGCDIFITELTMRAWIHAEDNKRRTLQRSDIAAALSKSDMFDFLIDIVPR\n>1bcf_L mol:protein length:158  BACTERIOFERRITIN\nMKGDTKVINYLNKLLGNELVAINQYFLHARMFKNWGLKRLNDVEYHESIDEMKHADRYIERILFLEGLPNLQDLGKLNIGEDVEEMLRSDLALELDGAKNLREAIGYADSVHDYVSRDMMIEILRDEEGHIDWLETELDLIQKMGLQNYLQAQIREEG\n>3oqm_A mol:protein length:339  Catabolite control protein A\nMNITIYDVAREANVSMATVSRVVNGNPNVKPTTRKKVLEAIERLGYRPNAVARGLASKKTTTVGVIIPDISSIFYSELARGIEDIATMYKYNIILSNSDQNMEKELHLLNTMLGKQVDGIVFMGGNITDEHVAEFKRSPVPIVLAASVEEQEETPSVAIDYEQAIYDAVKLLVDKGHTDIAFVSGPMAEPINRSKKLQGYKRALEEANLPFNEQFVAEGDYTYDSGLEALQHLMSLDKKPTAILSATDEMALGIIHAAQDQGLSIPEDLDIIGFDNTRLSLMVRPQLSTVVQPTYDIGAVAMRLLTKLMNKEPVEEHIVELPHRIELRKSTKSHHHHHH\n>6epf_4 mol:protein length:201  Proteasome subunit beta 
type-2\nMEYLIGIQGPDYVLVASDRVAASNIVQMKDDHDKMFKMSEKILLLCVGEAGDTVQFAEYIQKNVQLYKMRNGYELSPTAAANFTRRNLADCLRSRTPYHVNLLLAGYDEHEGPALYYMDYLAALAKAPFAAHGYGAFLTLSILDRYYTPTISRERAVELLRKCLEELQKRFILNLPTFSVRVIDKDGIHNLENITFTKRSS\n>6t7g_CCC mol:protein length:674  Glyco_hydro_42M domain-containing protein\nMGSSHHHHHHSSGLEVLFQGPAERISKQSTPFVGAQIFIEPGQTQEQIEQWFKLLAESNMTTCRIRMFGKYMKTPSGTYDFTLFDRAFKLADKYHIKVYATLFPDTEFTDVGGFKFPHSREHQKEVEDYIKNVVSHFSQYKNLAAWVLINEPGTPNLPFNEPFTKERFSDWKKEHNFSEYNEKGYPVLNFEKENFIIDYHNWYLNWLANQVRLYDKQHDLHVNPHNVFKLSGLYDFPTWRTFLNSLGGSAHASWHFGYFPRKAYTVAMSANAELIRSGAGELPWLMTELQGGNNLYSGANPLCPTAEEIIQWLWINFATEAKGGIFWSFNARSTAAEAGEWAMINFKNKSSDRLIAAATIGKFITENVKMMSNIKTLNSGISILYNHESMWVEAAQTRGKLNGNGRSIGAVMCSPLSYFEALSETGLQANFKEIKEFDFSLNDYTDQVIILSHQIALDNKVIKQLESFVEKGGTLIADGLTGYYDYQAHSTVVSGFALENLFGSYPIEYKIKENLFSLDFEKDNYKLPAHLWKGTIETSKATPIMDKEGECIACINQYGKGKVFWIPSPIALGARESKDFSELSKLTVSLLPNKILNDNPHFDKHYKDVMMKSFKSNGTMYSLIINKSASVQTVDIVGGKGKAFILFANKNAHSTANKLTISPEETVIIKWKNN\n>5ysl_F mol:protein length:215  1H1 light chain\nDIILTQSPAIMSASLGERVTLTCTASSSVSSSYLHWYQQKPGSSPKLWIYSTYNLAGAVPPRFSGSGSGTSYSLTISSMEAEDAATYYCQQYHRSPWTFGGGTKLEIKRADAAPTVSIFPPSSEQLTSGGASVVCFLNNFYPKDINVKWKIDGSERQNGVLNSWTDQDSKDSTYSMSSTLTLTKDEYERHNSYTCEATHKTSTSPIVKNFNRNEC\n>5ydz_C mol:protein length:580  mammalian endo-lysosomal TRPML1 channel\nMATPAGRRASETERLLTPNPGYGTQVGTSPAPTTPTEEEDLRRRLKYFFMSPCDKFRAKGRKPCKLMLQVVKILVVTVQLILFGLSNQLVVTFREENTIAFRHLFLLGYSDGSDDTFAAYTQEQLYQAIFYAVDQYLILPEISLGRYAYVRGGGGPWANGSALALCQRYYHRGHVDPANDTFDIDPRVVTDCIQVDPPDRPPDIPSEDLDFLDGSASYKNLTLKFHKLINVTIHFQLKTINLQSLINNEIPDCYTFSILITFDNKAHSGRIPIRLETKTHIQECKHPSVSRHGDNSFRLLFDVVVILTCSLSFLLCARSLLRGFLLQNEFVVFMWRRRGREISLWERLEFVNGWYILLVTSDVLTISGTVMKIGIEAKNLASYDVCSILLGTSTLLVWVGVIRYLTFFHKYNILIATLRVALPSVMRFCCCVAVIYLGYCFCGWIVLGPYHVKFRSLSMVSECLFSLINGDDMFVTFAAMQAQQGHSSLVWLFSQLYLYSFISLFIYMVLSLFIALITGAYDTIKHPGGTGTEKSELQAYIEQCQDSPTSGKFRRGSGSACSLFCCCGRDSPEDHSLLVN\n>6gqv_AF mol:protein length:124  40S ribosomal protein 
S15\nKKRVFKTHSYRGVDLEKLLEMSTEDFVKLAPARVRRRFARGMTSKPAGFMKKLRAAKLAAPENEKPAPVRTHMRNMIIVPEMIGSVVGIYNGKAFNQVEIRPEMLGHYLGEFSITYTPVRHGRA\n>3is7_S mol:protein length:158  Bacterioferritin\nMKGDKKVIQHLNKILGNELIAINQYFLHSRMWNDWGLKRLGAHEYHESIDEMKHADKLIERILFLEGLPNLQDLGKLLIGENTQEMLQCDLNLELKATKDLREAIVHCEQVHDYVSRDLLKDILESEEEHIDYLETQLGLIQKVGLENYLQSHMHEDD\n>3g5f_A mol:protein length:396  Cytochrome P450 121\nMTATVLLEVPFSARGDRIPDAVAELRTREPIRKVRTITGAEAWLVSSYALCTQVLEDRRFSMKETAAAGAPRLNALTVPPEVVNNMGNIADAGLRKAVMKAITPKAPGLEQFLRDTANSLLDNLITEGAPADLRNDFADPLATALHCKVLGIPQEDGPKLFRSLSIAFMSSADPIPAAKINWDRDIEYMAGILENPNITTGLMGELSRLRKDPAYSHVSDELFATIGVTFFGAGVISTGSFLTTALISLIQRPQLRNLLHEKPELIPAGVEELLRINLSFADGLPRLATADIQVGDVLVRKGELVLVLLEGANFDPEHFPNPGSIELDRPNPTSHLAFGRGQHFCPGSALGRRHAQIGIEALLKKMPGVDLAVPIDQLVWRTRFQRRIPERLPVLW\n>6wdh_l mol:protein length:143  50S ribosomal protein L15\nRLNTLSPAEGSKKAGKRLGRGIGSGLGKTGGRGHKGQKSRSGGGVRRGFEGGQMPLYRRLPKFGFTSRKAAITAEIRLSDLAKVEGGVVDLNTLKAANIIGIQIEFAKVILAGEVTTPVTVRGLRVTKGARAAIEAAGGKIEE\n>3ej7_D mol:protein length:70  Beta-subunit of trans-3-chloroacrylic acid dehalogenase\nPFIECHIATGLSVARKQQLIRDVIDVTNKSIGSDPKIINVLLVEHAEANMSISGRIHGEAASTERTPAVS\n>5t5h_e mol:protein length:245  60S ribosomal protein L2\nGKTVLTCRKGNGSIYQVHGHKRLGPAKLRILDYAERHGFMRGVVKTIEHEPGRGAPLARVEFRHPYKYRRVKELMVAPEGMFTGQSVLCGVKAPLAIGNVLPLGQITEGCIVCNVEAKVGDRGTIARASGDYCIIISHNHETGRTRLKLPSGQKKTVPSNCRAMIGIIAGGGRIEKPVLKAGNSFYRFRGKRNCWPKVRGVARNPVEHPHGGGNHQHIGHPSTVSRHAPPGQKVGLIAARRTGRI\n>6nsh_XJ mol:protein length:105  30S ribosomal protein S10\nMPKIRIKLRGFDHKTLDASAQKIVEAARRSGAQVSGPIPLPTRVRRFTVIRGPFKHKDSREHFELRTHNRLVDIINPNRKTIEQLMTLDLPTGVEIEIKTVGGGR\n>5lnn_A mol:protein length:206  Histidine kinase CKI1\nGSSHHHHHHSSGLVPRGSHMASTDSESETRVKSVRTGRKPIGNPEDEQETSKPSDDEFLRGKRVLVVDDNFISRKVATGKLKKMGVSEVEQCDSGKEALRLVTEGLTQREEQGSVDKLPFDYIFMACQMPEMDGYEATREIRKVEKSYGVRTPIIAVSGHDPGSEEARETIQAGMDAFLDKSLNQLANVIREIESKRHLEHHHHHH\n>2qxu_A mol:protein length:179  
Lipase\nHNPVVMVHGIGGASFNFAGIKSYLVSQGWSRDKLYAVDFWDKTGTNYNNGPVLSRFVQKVLDETGAKKVDIVAHSMGGANTLYYIKNLDGGNKVANVVTLGGANRLTTGKALPGTDPNQKILYTSIYSSADMIVMNYLSRLDGARNVQIHGVGHIGLLYSSQVNSLIKEGLNGGGQNTN\n>1kyo_A mol:protein length:430  UBIQUINOL-CYTOCHROME C REDUCTASE COMPLEX CORE PROTEIN I\nAEVTQLSNGIVVATEHNPAHTASVGVVFGSGAANENPYNNGVSNLWKNIFLSKENSAVAAKEGLALSSNISRDFQSYIVSSLPGSTDKSLDFLNQSFIQQKANLLSSSNFEATKKSVLKQVQDFEDNDHPNRVLEHLHSTAFQNTPLSLPTRGTLESLENLVVADLESFANNHFLNSNAVVVGTGNIKHEDLVNSIESKNLSLQTGTKPVLKKKAAFLGSEVRLRDDTLPKAWISLAVEGEPVNSPNYFVAKLAAQIFGSYNAFEPASRLQGIKLLDNIQEYQLCDNFNHFSLSYKDSGLWGFSTATRNVTMIDDLIHFTLKQWNRLTISVTDTEVERAKSLLKLQLGQLYESGNPVNDANLLGAEVLIKGSKLSLGEAFKKIDAITVKDVKAWAGKRLWDQDIAIAGTGQIEGLLDYMRIRSDMSMMRW\n>7dbn_D mol:protein length:444  HIV-1 RT p51 subunit\nMAHHHHHHALEVLFQGPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKQKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLSKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMKGAHTNDVKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQ\n>7unu_Q mol:protein length:116  50S ribosomal protein L18\nMSVKKETRLRRARKARLKMRELETVRLCVYRSSQHIYAQVIAADGGKVLASASTLDKDLREGATGNIDAAKKVGQLVAERAKAAGVTQVAFDRSGFKYHGRVKALADAAREGGLEF\n>7lst_A mol:protein length:800  
Pullulanase\nMRTTKKIVSAVLAACMLASTAVVSSFAATADDSSAVSSDYARDNSYTKAAEDIDAQYAYSGNDLGVTYTKDATTFKVWSPTATGVKLNIFTKGSDDEQGASKVASYTLEKMLVDGEWNGVWTITLVGEWKDYYYTYSVTTTDTTHIGSDATKTYETQDVYSTATGVNGKRSMIVDLDETDPEGWSNDSHVLLDKSTKSSVWELHIKDFSYDKASGVSDANRGKYLAFTENGTTLNGEGKVSTCIDYLKELGVTTVQLNPFYDFQSVNEAGDDSQFNWGYDPVNYNVPEGSYSSNPYDGKVRIKECKEMIKALHDAGISVVMDVVYNHTYSTDSCFQYTVPNYYYRMKTTGAFSDGSGCGNEGATERAMYRQYVIDSLKYWVNEYHVDGFRFALMGLMDVETMNMAREALDQIDPRITMWGEGWAGGDSYHPTNTCSGTKFYPATQANASRLSDRIAIFNDGIRDGIKGSAMDISDVGFIQGSKSSAKGVSYGVRANSSGTYKWKAQAPSQCVTYDACHDNATLYDQIIASTGLADYGERNSEAVKMNRLASAIIYTSQGISFTLAGEEMARSKDGDTNSYKSAANLNMIKWQNVVDYADVVSYYKGMMQIKSAFSPLTAMDNSYADKYTFTKKVSASTNQISFTIQNDVEGEWNKMAVIYNNATTAADVTLSDTSVTDWVVIANGETAGLDSLGEVTGSTFTVPARSAIVAVDKAGYESAGIHSSKGKVKVNYVYEATGEKLEDSVILQGSVGSGYVTVPSAVIPDTYIVSRIGGNAEGKYTSDMQEVTYYYTDYIPESL\n>4z9k_B mol:protein length:116  VHH2(F5) antibody\nVQLVESGGGLVQPGGSLRLSCAASGFTLDDYAIGWFRQVPGKEREGVACVKDGSTYYADSVKGRFTISRDNGAVYLQMNSLKPEDTAVYYCASRPCFLGVPLIDFGSWGQGTQVTV\n>7vnr_G mol:protein length:1049  Potassium voltage-gated channel subfamily KQT member 4,Maltodextrin-binding 
protein\nMDYKDDDDKAEAPPRRLGLGPPPGDAPRAELVALTAVQSEQGEAGGGGSPRRLGLLGSPLPPGAPLPGPGSGSGSACGQRSSAAHKRYRRLQNWVYNVLERPRGWAFVYHVFIFLLVFSCLVLSVLSTIQEHQELANECLLILEFVMIVVFGLEYIVRVWSAGCCCRYRGWQGRFRFARKPFCVIDFIVFVASVAVIAAGTQGNIFATSALRSMRFLQILRMVRMDRRGGTWKLLGSVVYAHSKELITAWYIGFLVLIFASFLVYLAEKDANSDFSSYADSLWWGTITLTTIGYGDKTPHTWLGRVLAAGFALLGISFFALPAGILGSGFALKVQEQHRQKHFEKRRMPAANLIQAAWRLYSTDMSRAYLTATWYYYDSILPSFRELALLFEHVQRARNGGLRPLEVRRAPVPDGAPSRYPPVATCHRPGSTSFCPGESSRMGIKDRIRMGSSQRRTGPSKQHLAPPTMPTSPSSEQVGEATSPTKVQKSWSFNDRTRFRASLRLKPRTSAEDAPSEEVAEEKSYQCELTVDDIMPAVKTVIRSIRILKFLVAKRKFKETLRPYDVKDVIEQYSAGHLDMLGRIKSLQTRVDQIVGRGPGDRKAREKGDKGPSDAEVVDEISMMGRVVKVEKQVQSIEHKLDLLLGFYSRCLRSGTSALEVLFQGPMAKIEEGKLVIWINGDKGYNGLAEVGKKFEKDTGIKVTVEHPDKLEEKFPQVAATGDGPDIIFWAHDRFGGYAQSGLLAEITPDKAFQDKLYPFTWDAVRYNGKLIAYPIAVEALSLIYNKDLLPNPPKTWEEIPALDKELKAKGKSALMFNLQEPYFTWPLIAADGGYAFKYENGKYDIKDVGVDNAGAKAGLTFLVDLIKNKHMNADTDYSIAEAAFNKGETAMTINGPWAWSNIDTSKVNYGVTVLPTFKGQPSKPFVGVLSAGINAASPNKELAKEFLENYLLTDEGLEAVNKDKPLGAVALKSYEEELAKDPRIAATMENAQKGEIMPNIPQMSAFWYAVRTAVINAASGRQTVDEALKDAQTNAAAEHHHHHHHHHH\n>6mng_A mol:protein length:208  4738 TCR alpha chain\nMQQVRQSPQSLTVWEGETAILNCSYENSAFDYLPWYQQFPGEGPALLIAIRSVSDKKEDGRFTIFFNKREKKLSLHITDSQPGDSATYFCAGIDTGANTGKLTFGHGTILRVHPNIQNPDPAVYQLRDSKSSDKSVCLFTDFDSQTNVSQSKDSDVYITDKCVLDMRSMDFKSNSAVAWSNKSDFACANAFNNSIIPEDTFFPSPESS\n>4r4j_A mol:protein length:366  Aspartate-semialdehyde dehydrogenase\nMGYTVAVVGATGAVGAQMIKMLEESTLPIDKIRYLASARSAGKSLKFKDQDITIEETTETAFEGVDIALFSAGSSTSAKYAPYAVKAGVVVVDNTSYFRQNPDVPLVVPEVNAHALDAHNGIIACPNCSTIQMMVALEPVRQKWGLDRIIVSTYQAVSGAGMGAILETQRELREVLNDGVKPCDLHAEILPSGGDKKHYPIAFNALPQIDVFTDNDYTYEEMKMTKETKKIMEDDSIAVSATCVRIPVLSAHSESVYIETKEVAPIEEVKAAIAAFPGAVLEDDVAHQIYPQAINAVGSRDTFVGRIRKDLDAEKGIHMWVVSDNLLKGAAWNSVQIAETLHERGLVRPTAELKFELKLEHHHHHH\n>7p7j_B mol:protein length:220  NADH-quinone oxidoreductase subunit 
B\nMDYTLTRIDPNGENDRYPLQKQEIVTDPLEQEVNKNVFMGKLNDMVNWGRKNSIWPYNFGLSCCYVEMVTSFTAVHDVARFGAEVLRASPRQADLMVVAGTCFTKMAPVIQRLYDQMLEPKWVISMGACANSGGMYDIYSVVQGVDKFIPVDVYIPGCPPRPEAYMQALMLLQESIGKERRPLSWVVGDQGVYRANMQSERERKRGERIAVTNLRTPDEI\n>1ocz_D mol:protein length:147  CYTOCHROME C OXIDASE\nAHGSVVKSEDYALPSYVDRRDYPLPDVAHVKNLSASQKALKEKEKASWSSLSIDEKVELYRLKFKESFAEMNRSTNEWKTVVGAAMFFIGFTALLLIWEKHYVYGPIPHTFEEEWVAKQTKRMLDMKVAPIQGFSAKWDYDKNEWKK\n>7p7q_P mol:protein length:144  50S ribosomal protein L16\nMLVPKRVKHRREFRGKMRGEAKGGKEVAFGEWGLQATESHWITNRQIEAARIAMTRYMKRGGKVWIKIFPHKSYTSKAIGVRMGKGKGAPEGWVSPVKRGKIMFEIAGVPEEVAREALRLASHKLPVKTKIVKREEMGGESNEG\n>7tqa_C mol:protein length:231  Fab S9.6 heavy chain\nEVQLQQSGPELVKPGASVKMSCKASGYTFTSYVMHWVKQKPGQGLEWIGFINLYNDGTKYNEKFKGKATLTSDKSSSTAYMELSSLTSKDSAVYYCARDYYGSRWFDYWGQGTTLTVSSAKTTAPSVYPLAPVCGDTTGSSVTLGCLVKGYFPEPVTLTWNSGSLSSGVHTFPAVLQSDLYTLSSSVTVTSSTWPSQSITCNVAHPASSTKVDKKISALPETGGGHHHHHH\n>3taz_B mol:protein length:471  DNA double-strand break repair protein nurA\nMGSSHHHHHHSSGLVPRGSHMRLLSKQSIERITKILLDELENVRENEQIRNIINSWKPLPSPEKSSIYAVDGSRSVSRLSGTVIYFLSALAVGSGKQLRLSYANAIKSNYGTSDQIVRMQMETLENMLGYLAYRKLEGEKRAILMDGTLTGSLVRPPVYPEDIRSLNVMRALIGESDFENLLNEFLEKLRDHYRKVEEHLEKNGNYDSPILTDNVVEKLRKKYIDTKVIAYGSGKVKVKIPRKALGYSPRVIPIEVLESSRGKSVDELLQELDEEKVELYLGKDDIYDALHMTLSYIEYLYSIDKLLEVKNLAYIAKSFYTKTLARTLGVEIVDTALLDAVIRTLIGHEKEGYLEIEHAVVPPKWSFPDFLLSKFRNIEKLIDKGIHLAYVRFEQGDVIYMLQSTTNIEKILPLILHHKAGGYLRPLQLAHHGVKISYKEARHTLEALINALRNRDPALKIFVKYGRSPLE\n>7uwd_a mol:protein length:823  V-type proton ATPase subunit 
a\nMAELQSGGGGGCCPPMDLFRSEPMQLVQIIIPIESAHLTVSYLGELGLLQFKDLNSEKSPFQRTYAAQIKKCAEMARKLRFFKEQMLKAGILSSVKSTTRADNNTDDLEVKLGDLEAELVEINANGDKLQRAHSELVEYKLVLQKAGEFFSSALTSAAAQQREMESQQTGEMTIETPLLTDKEMSADPSKQIKLGFIAGLVPREKSMSFERMLFRATRGNVFLRQAVVDEPVVDPVSGEKMEKNVFVVFYSGERAKNKILKICDAFGANRYPFNEEFDKQAQAISEVSGRLSELKTTLDAGLLHRGNLLQTIGDQFEQWNLLVKREKSIYHTLNMLSLDVTKKCLVGEGWSPVFATKQIQDALERAAFDSNSQVGAIFQVLHTKESPPTYFRTNKFTSAFQEIVDAYGVAKYREANPGVFTIVTFPFLFAVMFGDWGHGICLLLGTLVLIVREKKLASQKLDDITDMTFGGRYVILMMALFSIYTGLIYNEFFSVPFEIFSHSAYACRDLSCSEATTVGLIKVRDTYPFGVDPVWHGSRSELPFLNSLKMKMSILLGVAQMNLGIILSYFNATFFRIGVNIWCQFIPQIIFLNSLFGYLSLLIILKWITGSQADLYHVMIYMFLSPTDELGDNQLFPGQKTAQLVLLLLAFVSVPWMLLPKPFILKMQHQDRHQGQSYEALQSTDESLQPDTNHDSHGHEEFEFSEVFVHQMIHTIEFVLGAVSNTASYLRLWALSLAHSELSSVFYEKVLLLAWGYNNILILIVGIIVFIFATVGVLLVMETLSAFLHALRLHWVEFQNKFYEGDGYKFSPFSFALLDDEDE\n>2r5b_L mol:protein length:17  HIV entry inhibitor PIE7\nXKGACDYPEWQWLCAAX\n>4zzh_A mol:protein length:356  NAD-dependent protein deacetylase sirtuin-1\nGPYTFVQQHLMIGTDPRTILKDLLPETIPPPELDDMTLWQIVINILSEPPKRKKRKDINTIEDAVKLLQECKKIIVLTGAGVSVSCGIPDFRSRDGIYARLAVDFPDLPDPQAMFDIEYFRKDPRPFFKFAKEIYPGQFQPSLCHKFIALSDKEGKLLRNYTQNIDTLEQVAGIQRIIQCHGSFATASCLICKYKVDCEAVRGDIFNQVVPRCPRCPADEPLAIMKPEIVFFGENLPEQFHRAMKYDKDEVDLLIVIGSSLKVRPVALIPSSIPHEVPQILINREPLPHLHFDVELLGDCDVIINELCHRLGGEYAKLCCNPVGGGSGGGSQYLFLPPNRYIFHGAEVYSDSEDDV\n>2i03_C mol:protein length:726  Dipeptidyl peptidase 
4\nSRKTYTLTDYLKNTYRLKLYSLRWISDHEYLYKQENNILVFNAEYGNSSVFLENSTFDEFGHSINDYSISPDGQFILLEYNYVKQWRHSYTASYDIYDLNKRQLITEERIPNNTQWVTWSPVGHKLAYVWNNDIYVKIEPNLPSYRITWTGKEDIIYNGITDWVYEEEVFSAYSALWWSPNGTFLAYAQFNDTEVPLIEYSFYSDESLQYPKTVRVPYPKAGAVNPTVKFFVVNTDSLSSVTNATSIQITAPASMLIGDHYLCDVTWATQERISLQWLRRIQNYSVMDICDYDESSGRWNCLVARQHIEMSTTGWVGRFRPSEPHFTLDGNSFYKIISNEEGYRHICYFQIDKKDCTFITKGTWEVIGIEALTSDYLYYISNEYKGMPGGRNLYKIQLSDYTKVTCLSCELNPERCQYYSVSFSKEAKYYQLRCSGPGLPLYTLHSSVNDKGLRVLEDNSALDKMLQNVQMPSKKLDFIILNETKFWYQMILPPHFDKSKKYPLLLDVYAGPCSQKADTVFRLNWATYLASTENIIVASFDGRGSGYQGDKIMHAINRRLGTFEVEDQIEAARQFSKMGFVDNKRIAIWGWSYGGYVTSMVLGSGSGVFKCGIAVAPVSRWEYYDSVYTERYMGLPTPEDNLDHYRNSTVMSRAENFKQVEYLLIHGTADDNVHFQQSAQISKALVDVGVDFQAMWYTDEDHGIASSTAHQHIYTHMSHFIKQCFS\n>4nb5_B mol:protein length:171  DNA binding protein\nVSVNDGVDQMGAEPDIMEFVEQMGGYFESRSLTRLAGRLLGWLLVCDPERQSSEELATALAASSGGISTNARMLIQFGFIERLAVAGDRRTYFRLRPNAFAAGERERIRAMAELQDLADVGLRALGDAPPQRSRRLREMRDLLAYMENVVSDALGRYSQRTGEDDHHHHHH\n>5whf_A mol:protein length:90  Vimentin\nGPHMEMRELRRQVDQLTNDKARVEVERDNLAEDIMRLREKLQEEMLQREEAENTLQSFRQDVDNASLARLDLERKVESLQEEIAFLKKLH\n>2rfz_B mol:protein length:430  Cellulose 1,4-beta-cellobiosidase\nQRAGNETPENHPPLTWQRCTAPGNCQTVNAEVVIDANWRWLHDDNMQNCYDGNQWTNACSTATDCAEKCMIEGAGDYLGTYGASTSGDALTLKFVTKHEYGTNVGSRFYLMNGPDKYQMFNLMGNELAFDVDLSTVECGINSALYFVAMEEDGGMASYPSNQAGARYGTGYCDAQCARDLKFVGGKANIEGWKSSTSDPNAGVGPYGSCCAEIDVWESNAYAFAFTPHACTTNEYHVCETTNCGGTYSEDRFAGKCDANGCDYNPYRMGNPDFYGKGKTLDTSRKFTVVSRFEENKLSQYFIQDGRKIEIPPPTWEGMPNSSEITPELCSTMFDVFNDRNRFEEVGGFEQLNNALRVPMVLVMSIWDDHYANMLWLDSIYPPEKEGQPGAARGDCPTDSGVPAEVEAQFPDAQVVWSNIRFGPIGSTYDF\n>3blw_J mol:protein length:354  Isocitrate dehydrogenase [NAD] subunit 
2\nATVKQPSIGRYTGKPNPSTGKYTVSFIEGDGIGPEISKSVKKIFSAANVPIEWESCDVSPIFVNGLTTIPDPAVQSITKNLVALKGPLATPIGKGHRSLNLTLRKTFGLFANVRPAKSIEGFKTTYENVDLVLIRENTEGEYSGIEHIVCPGVVQSIKLITRDASERVIRYAFEYARAIGRPRVIVVHKSTIQRLADGLFVNVAKELSKEYPDLTLETELIDNSVLKVVTNPSAYTDAVSVCPNLYGDILSDLNSGLSAGSLGLTPSANIGHKISIFEAVHGSAPDIAGQDKANPTALLLSSVMMLNHMGLTNHADQIQNAVLSTIASGPENRTGDLAGTATTSSFTEAVIKRL\n>7nvo_q mol:protein length:548  T-complex protein 1 subunit theta\nMALHVPKAPGFAQMLKEGAKHFSGLEEAVYRNIQACKELAQTTRTAYGPNGMNKMVINHLEKLFVTNDAATILRELEVQHPAAKMIVMASHMQEQEVGDGTNFVLVFAGALLELAEELLRIGLSVSEVIEGYEIACRKAHEILPNLVCCSAKNLRDIDEVSSLLRTSIMSKQYGNEVFLAKLIAQACVSIFPDSGHFNVDNIRVCKILGSGISSSSVLHGMVFKKETEGDVTSVKDAKIAVYSCPFDGMITETKGTVLIKTAEELMNFSKGEENLMDAQVKAIADTGANVVVTGGKVADMALHYANKYNIMLVRLNSKWDLRRLCKTVGATALPRLTPPVLEEMGHCDSVYLSEVGDTQVVVFKHEKEDGAISTIVLRGSTDNLMDDIERAVDDGVNTFKVLTRDKRLVPGGGATEIELAKQITSYGETCPGLEQYAIKKFAEAFEAIPRALAENSGVKANEVISKLYAVHQEGNKNVGLDIEAEVPAVKDMLEAGILDTYLGKYWAIKLATNAAVTVLRVDQIIMAKPAGGPKPPSGKKDWDDDQND\n>5z9m_B mol:protein length:207  DNA gyrase subunit B\nGLDAVRKRPGMYIGDTDDGTGLHHMVFEVVDNAIDEALAGHCKEIIVTIHADNSVSVQDDGRGIPTGIHPEEGVSAAEVIMTVLHAGGKFDDNSYKVSGGLHGVGVSVVNALSQKLELVIQREGKIHRQIYEHGVPQAPLAVTGETEKTGTMVRFWPSLETFTNVTEFEYEILAKRLRELSFLNSGVSIRLRDKRDGKEDHFHYEGG\n>3c74_F mol:protein length:253  Uridine phosphorylase\nKSKSDVFHLGLTKNDLQGAQLAIVPGDPERVEKIAALMDKPVKLASHREFTSWRAELDGKAVIVCSTGIGGPSTSIAVEELAQLGIRTFLRIGTTGAIQPHINVGDVLVTTASVRLDGASLHFAPMEFPAVADFACTTALVEAAKSIGATTHVGVTASSDTFYPGQERYDTYSGRVVRRFKGSMEEWQAMGVMNYEMESATLLTMCASQGLRAGMVAGVIVNRTQQEIPNAETMKQTESHAVKIVVEAARRLL\n>4unm_A mol:protein length:615  SECRETED 
PROTEIN\nGSHMSTEKYHQYKINQPEYKAANGKWEIIEFPEKYRQNTIHAALLRTGKVLMVAGSGNNQDNSDDKQYDTRIWDPVKGTIKKVPTPSDLFCTGHTQLANGNLLIAGGTKRYEKLKGDVTKAGGLMVVHNENPDKPITLPAGTKFTGKENGKTFVSKDPVLVPRAEKVFDPATGAFVRNDPGLGRIYVEAQKSGSAYETGTEDNYRVQGLSGADARNTYGIAQKLALDKKDFQGIRDAFEFDPVAEKYIKVDPMHEARWYPTLTTLGDGKILSVSGLDDIGQLVPGKNEVYDPKTKAWTYTDKVRQFPTYPALFLMQNGKIFYSGANAGYGPDDVGRTPGVWDVETNKFTKVPGMSDANMLETANTVLLPPAQDEKYMVIGGGGVGESKLSSEKTRIADLKADDPKFVDGPSLEKGTRYPQASILPDDSVLVSGGSQDYRGRGDSNILQARLYHPDTNEFERVADPLVGRNYHSGSILLPDGRLMFFGSDSLYADKANTKPGKFEQRIEIYTPPYLYRDSRPDLSGGPQTIARGGSGTFTSRAASTVKKVRLIRPSASTHVTDVDQRSIALDFKADGDKLTVTVPSGKNLVQSGWYMMFVTDGEGTPSKAEWVRVP\n>5nh3_H mol:protein length:121  anti-human ActRIIB mAb BYM338 Fv heavy-chain\nQVQLVQSGAEVKKPGASVKVSCKASGYTFTSSYINWVRQAPGQGLEWMGTINPVSGSTSYAQKFQGRVTMTRDTSISTAYMELSRLRSDDTAVYYCARGGWFDYWGQGTLVTVSSHHHHHH\n>5osi_D mol:protein length:182  Vacuolar protein sorting-associated protein 29\nMLVLVLGDLHIPHRCNSLPAKFKKLLVPGKIQHILCTGNLCTKESYDYLKTLAGDVHIVRGDFDENLNYPEQKVVTVGQFKIGLIHGHQVIPWGDMASLALLQRQFDVDILISGHTHKFEAFEHENKFYINPGSATGAYNALETNIIPSFVLMDIQASTVVTYVYQLIGDDVKVERIEYKKP\n>6ysr_T mol:protein length:100  50S ribosomal protein L23\nMIREERLLKVLRAPHVSEKASTAMEKSNTIVLKVAKDATKAEIKAAVQKLFEVEVEVVNTLVVKGKVKRHGQRIGRRSDWKKAYVTLKEGQNLDFVGGAE\n>2x6r_B mol:protein length:416  TREHALOSE-SYNTHASE TRET\nMKMYEVKEFSSGKRKLEDYKSIIGEEEVSKIQEKAEKLKGRSFVHVNSTSFGGGVAEILHSLVPLLRSIGIEARWFVIEGPTEFFNVTKTFHNALQGNESLKLTEEMKELYLNVNRENSKFIDLSSFDYVLVHDPQPAALIEFYEKKSPWLWRCHIDLSSPNREFWEFLRRFVEKYDRYIFHLPEYVQPELDRNKAVIMPPSIDPLSEKNVELKQTEILRILERFDVDPEKPIITQVSRFDPWKGIFDVIEIYRKVKEKIPGVQLLLVGVMAHDDPEGWIYFEKTLRKIGEDYDVKVLTNLIGVHAREVNAFQRASDVILQMSIREGFGLTVTEAMWKGKPVIGRAVGGIKFQIVDGETGFLVRDANEAVEVVLYLLKHPEVSKEMGAKAKERVRKNFIITKHMERYLDILNSLGG\n>6rj0_C mol:protein length:337  Coat 
protein\nVRKGNKKLAKQATTKAVNPQPRRRNNNRRRGMRADAPLAKASTITGFGRGTNDVHLTGMSRIAQAVIPAGTGTDGYIVVDETIVPELLPRLGFAARIFQRYAVETLEFEIQPMCPANTGGGYVAGFLPDPTDSDHTFDAIQATRGAVVAKWWESRTIRPQYARALLWTSVGKEQRLTSPGRLILLCVGNNTDVVNVSVLCRWSVRLSVPSLETPEDTFAPILTLGPLYNDSLAANDFKSILLGSTQLDIAPEGAVYSLDRPLSIDYNLGTGDVDRAVYWHVKKVAGNAGTPAGWFHWGLWDNFNKTFTQGTAYYSDAQPRQILLPVGTLFTRADSGN\n>5qn5_B mol:protein length:189  Thiol:disulfide interchange protein\nAQYEDGKQYTTLEKPVAGAPQVLEFFSFFCPHCYQFEEVLHISDNVKKKLPEGVKMTKYHVNFMGGDLGKDLTQAWAVAMALGVEDKVTVPLFEGVQKTQTIRSASDIRDVFINAGIKGEEYDAAWNSFVVKSLVAQQEKAAADVQLRGVPAMFVNGKYQLNPQGMDTSNMDVFVQQYADTVKYLSEKK\n>5e7k_L5 mol:protein length:49  50S ribosomal protein L34\nMKRTWQPNRRKRAKTHGFRARMRTPGGRKVLKRRRQKGRWRLTPAVRKR\n>4ru4_F mol:protein length:602  tail spike protein gp49\nGSVGQSLQFLEMGRVTPAQFGAVGDGASHPLSERYATLAEAQTVYPHAVALSDEIDWAALQAAVDSGAPVHIPSGDYQINRGISSTGSLQIAGDGATSIIRPTAAFTGTSVLSCVGSLVALPNISSVSAGSLTIDFASTPNLVAGDVFIIYNPTDSSFSGFRTSYRAGEFCEVRAVSGNTVTIRSALYAAYDGATVAIYKVVSGVVDIASIQIVGGTVPMNGLLVEAVVSPRVDDVTVTLANNAGVYFARCYDAKITNSNISNIGDGGDDYGIIFGNCHDGGADNCKVYARRHAIATGGDAEVGCVPVRNVRMRNCTLRNDITSGTHCADFHGNAEDCSYENCTIYGGATWQGKDISYRHCTITNASGGWIVISAEILGGTFLLDQCTLYTTGDPQPGNRGVIDVGGNSAVLTTNTTQPCNFLIQGGSLRAPSLSTSSYLLRARLEGSTVPVNIQYSGQAIDVGSLGKVLQLDITSGSTSPEYLIVENLAGLPSGITLASAAGGFASAPMRMPVLGGRVQVTTATNASSVTAPVTFRYIYPKAPTVQVTKTDRSYAGNRVGVAIANPTSASGATLGLFTDDGTNFSSAVTNQLNWQAGIYEV\n>4y0g_A mol:protein length:90  5'-AMP-activated protein kinase subunit beta-2\nGPLGSPNSQARPTVIRWSEGGKEVFISGSFNNWSTKIPLIKSHNDFVAILDLPEGEHQYKFFVDGQWVHDPSEPVVTSQLGTINNLIHVK\n>6pv4_D mol:protein length:653  Glycoside 
Hydrolase\nMGSSHHHHHHSSGLVPRGSHMASTDGITENFYEIYPKPQEISYSGGEFQISDEINIVYDDGIDTYTKKRVDEVLEASNLEATVSNEIVPGKTNFLVGINESGGVVDNYFNKNIPHDESFFDEKMDANIVSVKDGVIGVIAEDTDSAFYGVTTLKHVFNQLEEGNEIKNFRADDYAEVAHRGFIEGYYGNPWSNEDRAELMKFGGDYKLNQYVFAPKDDPYHNSKWRDLYPEEKLSEIKKLAQMGNETKNRYVYALHPFMNNPVRFDTEENYQNDLGVIKAKFTQLLENDVRQFAILADDASAPAQGASMYVKLLTDLTRWLEEQQSTYPDLKTDLMFCPSDYYGNGSSAQLKELNKAEDNVSIVMTGGRIWGEVDENFANNFMNNISTEGHPGRAPFFWINWPCSDNSKQHLIMGGNDTFLHPGVDPSKIDGIVLNPMQQAEANKSALFAIADYAWNIWDNKEEADENWNDSFKYMDHGTAEETNSSLALREISKHMINQNMDGRVRPLQESVELAPKLEAFKQKYDSGASIKEDALELIEEFTNLQKAAEYYKNNPGNERTRDQIIYWLNCWEDTMDAAIGYLKSAIAIEEGDDEAAWANYSEAQSAFEKSKTYGFHYVDHTEYAEVGVQHIVPFIKSMGQNLSVVIGSIVD\n>4e51_A mol:protein length:467  Histidine--tRNA ligase\nMAHHHHHHMGTLEAQTQGPGSMTEQKRKLEKLTGVKGMNDILPQDAGLWEFFEATVKSLLRAYGYQNIRTPIVEHTPLFTRGIGEVTDIVEKEMYSFVDALNGENLTLRPENTAAVVRAAIEHNMLYDGPKRLWYIGPMFRHERPQRGRYRQFHQVGVEALGFAGPDADAEIVMMCQRLWEDLGLTGIKLEINSLGLAEERAAHRVELIKYLEQHADKLDDDAQRRLYTNPLRVLDTKNPALQEIVRNAPKLIDFLGDVSRAHFEGLQRLLKANNVPFTINPRLVRGLDYYNLTVFEWVTDKLGAQGTVAAGGRYDPLIEQLGGKPTAACGWAMGIERILELLKEEHLVPEQEGVDVYVVHQGDAAREQAFIVAERLRDTGLDVILHCSADGAGASFKSQMKRADASGAAFAVIFGEDEVTNGTASVKPLRGTGDDGEKSVQQSVPVESLTEFLINAMVATAEDGDD\n>1j0n_A mol:protein length:752  XANTHAN LYASE\nSDEFDALRIKWATLLTGGPALDPADSDIAARTDKLAQDANDYWEDMDLSSSRTYIWYALRGNGTSDNVNAVYERLRTMALAATTVGSSLYGNADLKEDILDALDWLYVNSYNSTRSRSAYNWWHWQLGIPMSLNDTAVLLYDDISAARMATYMDTIDYFTPSIGLTGANRAWQAIVVGVRAVIVKDAVKLAAARNGLSGTGIFPYATGGDGFYADGSFVQHTTFAYTGGYGSSVLETTANLMYLLSGSTWSVSDPNQSNVWQWIYEAYRPLLYKGAMMDMVRGREISRSYAQDHAVGHGIVASIVRLAQFAPAPHAAAFKQIAKRVIQEDTFSSFYGDVSTDTIRLAKAIVDDPSIAPAAAPNLYKQYAAMDRAVLQRPGFALGLALYSTRISSYESINSENGRGWYTGAGATYLYNQDLAQYSEDYWPTVDAYRIPGTTVASGTPIASGTGTSSWTGGVSLAGQYGASGMDLSYGAYNLSARKSWFMFDDEIVALGSGISSTAGIPIETVVDNRKLNGAGDNAWTANGAALSTGLGVAQTLTGVNWVHLAGNTADGSDIGYYFPGGATLQTKREARTGTWKQINNRPATPSTAVTRNYETMWIDHGTNPSGASYGYVLLPNKTSAQVGAYAADPAIEIVVNTSGVQSVKEKTLGLVGANFWTDTTQTADLITSNKKASVMTREIADERLEASVSDPTQANNGTIAIELARSAEGYSADPGITVTQLAPTIKFTVNVNGAKGKSFHASFQLG\n>4qyj_D 
mol:protein length:516  Aldehyde dehydrogenase\nMGSSHHHHHHSSGLVPRGSHMNSSLSAIDGLRLPHQMLIGGQWVSAQSGKTLNVYNPATGDILTEVPDGDVEDVNAAVESAAATLRSDTWRRMPPSARERILLRLADLLEVHGDELARLETLNNGKLLIYSKLMEVGASAQWLRYMAGWATKLTGSTLDLSLPLPPEVRSRASTQRVPVGVVAAIIPWNFPLLMAVWKIAPALACGNTVVLKPAEETPLTALRLAELAMEAGLPAGALNVVTGRGETAGDALVRHPKVAKVAFTGSTEVGRIIGSACGRSLKAVSLELGGKSPVIVLADCDPQEAAEGAAAAIFFNHGQVCTAGSRLYVHESIYEDVIQRLAVIGESIVVGSGLEQGVHMGPMVSKKHHENVLRHIRNGIEDGADLICGGTEAPCAQGFFVKPTIFANREKKDIRLLSQEVFGPVLVATPFSDIAEVVNEANRSVYGLGASIWTNDLSAALRINDELEAGTVWVNTHNMVDPNLPFGGFKDSGVGREHGAAAIEHYTTTRSLVIAY\n>4b3w_B mol:protein length:190  CYTOGLOBIN\nMEKVPGEMEIERRERSEELSEAERKAVQAMWARLYANSEDVGVAILVRFFVNFPSAKQYFSQFKHMEDPLEMERSPQLRKQASRVMGALNTVVENLHDPDKVSSVLALVGKAHALKHKVEPVYFKILSGVILEVVAEEFASDFPPETQRAWAKLRGLIYSHVTAAYKEVGWVQQVPNATTPPATLPSSGP\n>6sql_A mol:protein length:270  Enoyl-[acyl-carrier-protein] reductase [NADH]\nSMTGLLDGKRILVSGIITDSSIAFHIARVAQEQGAQLVLTGFDRLRLIQRITDRLPAKAPLLELDVQNEEHLASLAGRVTEAIGAGNKLDGVVHSIGFMPQTGMGINPFFDAPYADVSKGIHISAYSYASMAKALLPIMNPGGSIVGMDFDPSRAMPAYNWMTVAKSALESVNRFVAREAGKYGVRSNLVAAGPIRTLAMSAIVGGALGEEAGAQIQLLEEGWDQRAPIGWNMKDATPVAKTVCALLSDWLPATTGDIIYADGGAHTQLL\n>2pty_A mol:protein length:432  Enolase\nGSHMTIQKVHGREVLDSRGNPTVEVEVTTEKGVFRSAVPSGASTGVYEACELRDGDKKRYVGKGCLQAVKNVNEVIGPALIGRDELKQEELDTLMLRLDGTPNKGKLGANAILGCSMAISKAAAAAKGVPLYRYLASLAGTKELRLPVPCFNVINGGKHAGNALPFQEFMIAPVKATSFSEALRMGSEVYHSLRGIIKKKYGQDAVNVGDEGGFAPPIKDINEPLPILMEAIEEAGHRGKFAICMDCAASETYDEKKQQYNLTFKSPEPTWVTAEQLRETYCKWAHDYPIVSIEDPYDQDDFAGFAGITEALKGKTQIVGDDLTVTNTERIKMAIEKKACNSLLLKINQIGTISEAIASSKLCMENGWSVMVSHRSGETEDTYIADLVVALGSGQIKTGAPCRGERTAKLNQLLRIEEELGAHAKFGFPGWS\n>3otw_D mol:protein length:163  Phosphopantetheine adenylyltransferase\nHHHHHHMQKIGIYPGTFDPVTNGHIDIIHRSSELFEKLIVAVAHSSAKNPMFSLDERLKMIQLATKSFKNVECVAFEGLLANLAKEYHCKVLVRGLRVVSDFEYELQMGYANKSLNHELETLYFMPTLQNAFISSSIVRSIIAHKGDASHLVPKEIYPLISKA\n>7ojp_J mol:protein length:261  Acyl-[acyl-carrier-protein]-UDP-N-acetylglucosamine 
O-acyltransferase\nGSHMSLIDPRAIIDPSARLAADVQVGPWSIVGAEVEIGEGTVIGPHVVLKGPTKIGKHNRIYQFSSVGEDTPDLKYKGEPTRLVIGDHNVIREGVTIHRGTVQDRAETTIGDHNLIMAYAHIGHDSVIGNHCILVNNTALAGHVHVDDWAILSGYTLVHQYCRIGAHSFSGMGSAIGKDVPAYVTVFGNPAEARSMNFEGMRRRGFSSEAIHALRRAYKVVYRQGHTVEEALAELAESAAQFPEVAVFRDSIQSATRGITR\n>6ev1_D mol:protein length:213  Light chain\nDIVLTQSPAIMSASPGEKVTMTCSASSSVSYMHWYQQKSGTSPKRWIYDTSKLASGVPARFSGSGSGTSYSLTISSMEAEDAATYYCQQWSSNPPTFGAGTKLELKRTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLRSPVTKSFNRGEC\n>1p44_B mol:protein length:269  Enoyl-[acyl-carrier-protein] reductase [NADH]\nMTGLLDGKRILVSGIITDSSIAFHIARVAQEQGAQLVLTGFDRLRLIQRITDRLPAKAPLLELDVQNEEHLASLAGRVTEAIGAGNKLDGVVHSIGFMPQTGMGINPFFDAPYADVSKGIHISAYSYASMAKALLPIMNPGGSIVGMDFDPSRAMPAYNWMTVAKSALESVNRFVAREAGKYGVRSNLVAAGPIRTLAMSAIVGGALGEEAGAQIQLLEEGWDQRAPIGWNMKDATPVAKTVCALLSDWLPATTGDIIYADGGAHTQLL\n>4v9c_DU mol:protein length:104  50S ribosomal protein L24\nMAAKIRRDDEVIVLTGKDKGKRGKVKNVLSSGKVIVEGINLVKKHQKPVPALNQPGGIVEKEAAIQVSNVAIFNAATGKADRVGFRFEDGKKVRFFKSNSETIK\n>6d3g_B mol:protein length:284  Beta-lactamase\nSAQSPLLKEQIETIVTGKKATVGVAVWGPDDLEPLLLNPFEKFPMQSVFKLHLAMLVLHQVDQGKLDLNQSVTVNRAAVLQNTWSPMMKDHQGDEFTVAVQQLLQYSVSHSDNVACDLLFELVGGPQALHAYIQSLGVKEAAVVANEAQMHADDQVQYQNWTSMKAAAQVLQKFEQKKQLSETSQALLWKWMVETTTGPQRLKGLLPAGTIVAHKTGTSGVRAGKTAATNDAGVIMLPDGRPLLVAVFVKDSAESERTNEAIIAQVAQAAYQFELKKLSAVSPD\n>7ce1_K mol:protein length:341  LacI-type transcription factor\nERPTLKTIAYMTGLGITTVSRALKDAPDIGAETKERVRLIAQQIGYQPNRAGVRLRTGKTNVIALVLSVDEELMGFTSQMVFGITEVLATTQYHLVVTPHTHAKDSMVPIRYILETGSADGVIISKIEPNDPRVRFMTERKMPFVTHGRSDMGIEHAYHDFDNEAYAYEAVERLAQCGRKRIAIIVPPSRFAFHDHARKGFTRGIRDFGVSEFPLDAITIETPLDKIRDFGKRLMQSDDRPDGIVSISGSSTIALVAGFEAAGVRIGKDIDIVSKQSAEFLNWIQPQIHTVNEDIKLAGRELAKALLARINGAPPETLQSVSRPVWSSMAPKPLEHHHHHH\n>5tzc_B mol:protein length:344  cGMP-dependent 3',5'-cyclic 
phosphodiesterase\nSAMDDEYTKLLHDGIQPVAAIDSNFASFTYTPRSLPEDDTSMAILSMLQDMNFINNYKIDCPTLARFCLMVKKGYRDPPYHNWMHAFSVSHFCYLLYKNLELTNYLEDIEIFALFISCMCHDLDHRGTNNSFQVASKSVLAALYSSEGSVMERHHFAQAIAILNTHGCNIFDHFSRKDYQRMLDLMRDIILATDLAHHLRIFKDLQKMAEVGYDRNNKQHHRLLLCLLMTSCDLSDQTKGWKTTRKIAELIYKEFFSQGDLEKAMGNRPMEMMDREKAYIPELQISFMEHIAMPIYKLLQDLFPKAAELYERVASNREHWTKVSHKFTIRGLPSNNSLDFLDEE\n>1zwu_A mol:protein length:30  AMARANTHUS CAUDATUS ANTIMICROBIAL PEPTIDE 2 (ACMP2)\nVGECVRGRCPSGMCCSQAGYCGKGPKYCGR\n>7nei_A mol:protein length:267  Polyester Hydrolase Leipzig 7 (PHL-7)\nMANPYERGPDPTESSIEAVRGPFAVAQTTVSRLQADGFGGGTIYYPTDTSQGTFGAVAISPGFTAGQESIAWLGPRIASQGFVVITIDTITRLDQPDSRGRQLQAALDHLRTNSVVRNRIDPNRMAVMGHSMGGGGALSAAANNTSLEAAIPLQGWHTRKNWSSVRTPTLVVGAQLDTIAPVSSHSEAFYNSLPSDLDKAYMELRGASHLVSNTPDTTTAKYSIAWLKRFVDDDLRYEQFLCPAPDDFAISEYRSTCPFLEHHHHHH\n>3ab4_E mol:protein length:421  Aspartokinase\nMALVVQKYGGSSLESAERIRNVAERIVATKKAGNDVVVVCSAMGDTTDELLELAAAVNPVPPAREMDMLLTAGERISNALVAMAIESLGAEAQSFTGSQAGVLTTERHGNARIVDVTPGRVREALDEGKICIVAGFQGVNKETRDVTTLGRGGSDTTAVALAAALNADVCEIYSDVDGVYTADPRIVPNAQKLEKLSFEEMLELAAVGSKILVLRSVEYARAFNVPLRVRSSYSNDPGTLIAGSMEDIPVEEAVLTGVATDKSEAKVTVLGISDKPGEAAKVFRALADAEINIDMVLQNVFSVEDGTTDITFTCPRSDGRRAMEILKKLQVQGNWTNVLYDDQVGKVSLVGAGMKSHPGVTAEFMEALRDVNVNIELISTSEIRISVLIREDDLDAAARALHEQFQLGGEDEAVVYAGTGR\n>3qjn_I mol:protein length:7  Beta-PIX\nAWDETNL\n>6yft_AD mol:protein length:113  coat protein\nSTFSSLVIGSNTFIPTAPGYYSLSTRGFSDPRNQIKISGGKFNAKTGRVTAAVSRLWETDVTVAGLPVRSAAEVAIIMTLGRGITATNADVLLSDLNTLLDPARLDQILQGGF\n>5w08_E mol:protein length:291  Hemagglutinin HA1\nTNATELVQNSSIGEICDSPHQILDGENCTLIDALLGDPQCDGFQNKKWDLFVERSKAYSNCYPYDVPDYASLRSLVASSGTLEFNNESFNWNGVTQNGTSSACIRRSNNSFFSRLNWLTHLNFKYPALNVTMPNNEQFDKLYIWGVHHPVTDKDQIFLYAQPSGRITVSTKRSQQAVIPNIGFRPRIRNIPSRISIYWTIVKPGDILLINSTGNLIAPRGYFKIRSGKSSIMRSDAPIGKCKSECITPNGSIPNDKPFQNVNRITYGACPRYVKQSTLKLATGGALEVLFQ\n>6t7m_C mol:protein length:266  3-oxoacyl-[acyl-carrier-protein] reductase 
FabG\nMHHHHHHSSGVDLGTENLYFQSMSFEGKIALVTGASRGIGRAIAETLVARGAKVIGTATSENGAKNISDYLGANGKGLMLNVTDPASIESVLENIRAEFGEVDILVNNAGITRDNLLMRMKDDEWNDIIETNLSSVFRLSKAVMRAMMKKRCGRIITIGSVVGTMGNAGQANYAAAKAGLIGFSKSLAREVASRGITVNVVAPGFIETDMTRALSDDQRAGILAQVPAGRLGGAQEIASAVAFLASDEASYITGETLHVNGGMYMV\n>4www_XU mol:protein length:51  30S ribosomal protein S21\nIKVRENEPFDVALRRFKRSCEKAGVLAEVRRREFYEKPTTERKRAKASAVK\n>3ab4_I mol:protein length:421  Aspartokinase\nMALVVQKYGGSSLESAERIRNVAERIVATKKAGNDVVVVCSAMGDTTDELLELAAAVNPVPPAREMDMLLTAGERISNALVAMAIESLGAEAQSFTGSQAGVLTTERHGNARIVDVTPGRVREALDEGKICIVAGFQGVNKETRDVTTLGRGGSDTTAVALAAALNADVCEIYSDVDGVYTADPRIVPNAQKLEKLSFEEMLELAAVGSKILVLRSVEYARAFNVPLRVRSSYSNDPGTLIAGSMEDIPVEEAVLTGVATDKSEAKVTVLGISDKPGEAAKVFRALADAEINIDMVLQNVFSVEDGTTDITFTCPRSDGRRAMEILKKLQVQGNWTNVLYDDQVGKVSLVGAGMKSHPGVTAEFMEALRDVNVNIELISTSEIRISVLIREDDLDAAARALHEQFQLGGEDEAVVYAGTGR\n>6sn9_E mol:protein length:87  Outer membrane protein assembly factor BamE\nERVVYRPDINQGNYLTANDVSKIRVGMTQQQVAYALGTPLMSDPFGTNTWFYVFRQQPGHEGVTQQTLTLTFNSSGVLTNIDNKPAL\n>5o9f_B mol:protein length:352  Alcohol dehydrogenase\nMKAVQYTEIGSEPVVVDIPTPTPGPGEILLKVTAAGLCYSDISVMDMPAAQYAYGLPLTLGHEGVGTVAELGEGVTGFGVGDAVAVYGPWGCGACHACARGRENYCTRAADLGITPPGLGSPGSMAEYMIVDSARHLVPIGDLDPVAAAPLTDAGLTPYHAISRVLPLLGPGSTAVVIGVGGLGHVGIQILRAVSAARVIAVDLDDDRLALAREVGADAAVKSGAGAADAIRELTGGQGATAVFDFVGAQSTIDTAQQVVAVDGHISVVGIHAGAHAKVGFFMIPFGASVVTPFAGTRSELMEVVALARAGRLDIHTETFTLDEGPAAYRRLREGSIRGRGVVVPTSHHHHH\n>7vec_F mol:protein length:118  Gamma-aminobutyric acid receptor-associated protein\nGPMKFVYKEEHPFEKRRSEGEKIRKKYPDRVPVIVEKAPKARIGDLDKKKYLVPSDLTVGQFYFLIRKRIHLRAEDALFFFVNNVIPPTSATMGQLYQEHHEEDFFLYIAYSDESVYG\n>6r72_C mol:protein length:599  Multidrug exporter ATP-binding 
cassette\nMSSSHHHHHHMPTKKQKSKSKLKPFFALVRRTNPSYGKLAFALALSVVTTLVSLLIPLLTKQLVDGFSMSNLSGTQIGLIALVFFVQAGLSAYATYALNYNGQKIISGLRELLWKKLIKLPVSYFDTNASGETVSRVTNDTMVVKELITTHISGFITGIISVIGSLTILFIMNWKLTLLVLVVVPLAALILVPIGRKMFSISRETQDETARFTGLLNQILPEIRLVKASNAEDVEYGRGKMGISSLFKLGVREAKVQSLVGPLISLVLMAALVAVIGYGGMQVSSGELTAGALVAFILYLFQIIMPMGQITTFFTQLQKSIGATERMIEILAEEEEDTVTGKQIENAHLPIQLDRVSFGYKPDQLILKEVSAVIEAGKVTAIVGPSGGGKTTLFKLLERFYSPTAGTIRLGDEPVDTYSLESWREHIGYVSQESPLMSGTIRENICYGLERDVTDAEIEKAAEMAYALNFIKELPNQFDTEVGERGIMLSGGQRQRIAIARALLRNPSILMLDAATSSLDSQSEKSVQQALEVLMEGRTTIVIAHRLSTVVDADQLLFVEKGEITGRGTHHELMASHGLYRDFAEQQLKMNADLENKAG\n>2w85_B mol:protein length:12  PEROXIN-19\nSQEKFFQELFDS\n>1z4v_A mol:protein length:532  Hemagglutinin-neuraminidase\nSPSESLITQKQIMSQAGSTGSNSGLGSITDLLNNILSVANQIIYNSAVALPLQLDTLESTLLTAIKSLQTSDKLEQNCSWSAALINDNRYINGINQFYFSIAEGRNLTLGPLLNMPSFIPTATTPEGCTRIPSFSLTKTHWCYTHNVILNGCQDHVSSNQFVSMGIIEPTSAGFPFFRTLKTLYLSDGVNRKSCSISTVPGGCMMYCFVSTQPERDDYFSAAPPEQRIIIMYYNDTIVERIINPPGVLDVWATLNPGTGSGVYYLGWVLFPIYGGVIKGTSLWNNQANKYFIPQMVAALCSQNQATQVQNAKSSYYSSWFGNRMIQSGILACPLRQDLTNECLVLPFSNDQVLMGAEGRLYMYGDSVYYYQRSNSWWPMTMLYKVTITFTNGQPSAISAQNVPTQQVPRPGTGDCSATNRCPGFCLTGVYADAWLLTNPSSTSTFGSEATFTGSYLNTATQRINPTMYIANNTQIISSQQFGSSGQEAAYGHTTCFRDTGSVMVYCIYIIELSSSLLGQFQIVPFIRQVTLS\n>5xf9_E mol:protein length:591  NAD-reducing hydrogenase\nMTTERQRTAPGLLAALHQARSRFGRPLDAQALAELSTAFSLPPGEIAATASFYHFFQTPPARYQIHFVDHVVDHHAGVAALCNHLCAAFAIQPGQRTADARLFVGWTACAGLSDQAPAALINGRPMPRLDAARIDALIEKIQAQIPMDQWPTEWFAVTNAIHRHGPLLTWLDTTPAEAVFEHPTAHDPDAILQAVTDAGLRGRGGAGFPTATKWRFCRENADPERFLICNADEGEPGTFKDRVLLTRYPEHLFAGMILAARAIGADKAILYLRYEYQYLLPQLEAARERIASAQATVPQAERVTLEIALGAGAYVCGEESALIESLEGKPGRPRVRPPYPVTQGYLGHPTVVNNVETLVAVAAIVGNGAAWWRALGTPDSSGPKLFCVSGDVAQPGLYEFPYGVALGDVVTAARPLGTRYAVQVSGPSGTLLPATPEQLARPLAFEALPCNGTVMVFDVRRDPVAIVHHFARFFAHESCGFCTPCRVGTQLIAKTFEKIAAGYATRFDLERLAPALEAMRLASNCGFGLSAGNPVRDLIAHFRQQLEAQLQPHDFIPAFSLDAELAATRRLTGRDDPHAHLAQFEQPEVTR\n>2zh3_A mol:protein length:437  CCA-adding 
enzyme\nMKVEEILEKALELVIPDEEEVRKGREAEEELRRRLDELGVEYVFVGSYARNTWLKGSLEIDVFLLFPEEFSKEELRERGLEIGKAVLDSYEIRYAEHPYVHGVVKGVEVDVVPCYKLKEPKNIKSAVDRTPFHHKWLEGRIKGKENEVRLLKGFLKANGIYGAEYKVRGFSGYLCELLIVFYGSFLETVKNARRWTRRTVIDVAKGEVRKGEEFFVVDPVDEKRNVAANLSLDNLARFVHLCREFMEAPSLGFFKPKHPLEIEPERLRKIVEERGTAVFAVKFRKPDIVDDNLYPQLERASRKIFEFLERENFMPLRSAFKASEEFCYLLFECQIKEISRVFRRMGPQFEDERNVKKFLSRNRAFRPFIENGRWWAFEMRKFTTPEEGVRSYASTHWHTLGKNVGESIREYFEIISGEKLFKEPVTAELCEMMGVKD\n>5md0_C mol:protein length:74  Capsid protein p24\nTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGV\n>6myg_A mol:protein length:178  Gamma-crystallin S\nMSKTGGKISFYEDRNFLGRRYDCDCDCADFRSYLSRCNSIRVEGGTWAVYERPNFSGHMYILPQGEYPEYQRWMGLNDRLGSCRAVHLSSGGQAKIQVFEKGDFNGQMYETTEDCPSIMEQFHLREIHSCKVVEGTWIFYELPNYRGRQYLLDKKEYRKPVDWGAASPAIQSFRRIVE\n>3vyt_B mol:protein length:372  Hydrogenase expression/formation protein HypD\nMEEPFEAYRSREVAMKLVEKIREEAKTLDGEIRIMHVCGTHEDTVTRHGIRSLLPENVKVVSGPGCPVCITPVEDIVAMQLIMRKAREEGEEIILTTFGDMYKIPTPMGSFADLKSEGFDVRIVYGIFDTYRIAKENPDKTVVHFSPGFETTTAPAAGMLNVAAQEELENFKIYSVHRLTPPAVEVLLKQGTVFQGLIAPGHVSTIIGVKGWEYLTEKYGIPQVVAGFEPNDVLMAILMLIRMYKEGEARIINEYERAVKYEGNVVAQKMIDKFFEVVDAKWRALGVFPKSGLELRKEWKDFEIRSFYKVEVPKNLPDLEKGCRCGAVLRGLALPTDCPLFGKTCTPRHPVGPCMVSYEGTCQIFYKYGVLF\n>4atq_L mol:protein length:456  4-AMINOBUTYRATE TRANSAMINASE\nMTTTANELSYRIEQKRNINGAFPGPKSQALAERRSAVVAAGVASGVPVYVEDADGGIIRDVDGNSFIDLGSGIAVTSVGASDPAVVAAVQEAAAHFTHTCFMVTPYEGYVAVTEQLNRLTPGDHAKRTVLFNSGAEAVENAVKVARLATGRDAVVAFDHAYHGRTNLTMALTAKAMPYKTNFGPFAPEVYRMPMSYPFREENPEITGAEAAKRAITMIEKQIGGDQVAAIIIEPIQGEGGFIVPAEGFLPALSEWAKEKGIVFIADEVQSGFCRTGEWFAVDHEGVVPDIITMAKGIAGGLPLSAITGRADLLDAVHPGGLGGTYGGNPVACAAALAAIDTMEQHDLNGRARHIEELALGKLRELAAELSAGGGSVVGDIRGRGAMLAIELVQPGSKEPNAELTKAVAAACLKEGVIILTCGTYGNVIRLLPPLVISDELLIDGLEVLAAAIKAHA\n>2cha_C mol:protein length:97  ALPHA-CHYMOTRYPSIN A\nANTPDRLQQASLPLLSNTNCKKYWGTKIKDAMICAGASGVSSCMGDSGGPLVCKKNGAWTLVGIVSWGSSTCSTSTPGVYARVTALVNWVQQTLAAN\n>1r7x_A mol:protein length:283  Glycoprotein-fucosylgalactoside 
alpha-galactosyltransferase\nMVSLPRMVYPQPKVLTPCRKDVLVVTPWLAPIVWEGTFNIDILNEQFRLQNTTIGLTVFAIKKYVAFLKLFLETAEKHFMVGHRVHYYVFTDQPAAVPRVTLGTGRQLSVLEVGAYKRWQDVSMRRMEMISDFCERRFLSEVDYLVCVDVDMEFRDHVGVEILTPLFGTLHPSFYGSSREAFTYERRPQSQAYIPKDEGDFYYMGAFFGGSVQEVQRLTRACHQAMMVDQANGIEAVWHDESHLNKYLLRHKPTKVLSPEYLWDQQLLGWPAVLRKLRFTAVP\n>6gzq_S2 mol:protein length:78  30S ribosomal protein S19\nKGVFVDDHLLEKVLELNAKGEKRLIKTWSRRSTIVPEMVGHTIAVYNGKQHVPVYITENMVGHKLGEFAPTRTYRGHG\n>4lmv_F mol:protein length:252  Glutathione transferase\nSQPIVFYDIPSNDTLKQSPWSPNTWKIRYALNIKGIKYKTEWVEYPDIEDVVKKLGGKPTGKKPDGRDHYTVPVIYDPNTKTVVEDGIKIAKYLDDAYPDTPRLFPAGTDAFQAAFDDFVWSVTLAFPLLSLLLLDVSNSLPPRSSAYFRATREQQFGKRLEEQGGEERWQQLEAGLGKFKGYLERNGAGNDLLLMGTQGGITYSDVQIASLFVWAKVVWGEGSEKWKRLMGFHGGKWAQFCAQFAEYERAD\n>1lhu_A mol:protein length:189  SEX HORMONE-BINDING GLOBULIN\nLRPVLPTQSAHDPPAVHLSNGPGQEPIAVMTFDLTKITKTSSSFEVRTWDPEGVIFYGDTNPKDDWFMLGLRDGRPEIQLHNHWAQLTVGAGPRLDDGRWHQVEVKMEGDSVLLEVDGEEVLRLRQVSGPLTSKRHPIMRIALGGLLFPASNLRLPLVPALDGCLRRDSWLDKQAEISASAPTSLRSCD\n>3fx7_A mol:protein length:94  Putative uncharacterized protein\nMSRVQMDTEEVREFVGHLERFKELLREEVNSLSNHFHNLESWRDARRDKFSEVLDNLKSTFNEFDEAAQEQIAWLKERIRVLEEDYLEHHHHHH\n>4xkj_A mol:protein length:335  D-lactate dehydrogenase\nMKIIMFSVRDDEEAAIREWEKKTGVQVDINRLELDAETAQLTKGYDGIVIQQRSHISNPAVYETLQKNGLRQLTSRTAGYDMIDLEQASERGLVVTNVPAYSPNSVAELALTQTMRLIRNLPLFDARGAEQDFRWAGLMAREIRSLTVGIIGAGRIGGTVARLFKALGATVIANDIVERVELKDIVTYVSKEELLQAADVVTLHVPLMDSTTQLIDADALALMKNDAVLINASRGPVVDTDALIAALQNKQIAGAALDTLNGEEHFFNQDLCGKELPSEQLKVLRTLPNVLITPHIGFYTNKAVQNMVEISLNDVLAILKTGTSEHQLNKVAVEN\n>6aw9_A mol:protein length:228  Catechol O-methyltransferase\nMGDTKEQRILRYVQQHAKPGDPQSVLEAIDTYCTQKEWAMNVGDAKGQIMDEVIQEHNPSLVLELGAYCGYSAVRMARLLSPGARLLTMEKNPDYAAITQQMLNFAGLQDKVTILIGASQDLIPQLKKYDVDTLDMVFLDHWKDRYLPDTILLEECGLLRKGTVLLADNVIVPGTPDFLAYVRGSSSFECTHYSSYLEYMKVVDGLEKAVYKGPSSPKQPLEHHHHHH\n>5w93_F mol:protein length:20  Paxillin\nMDDLDALLADLESTTSHISK\n>2fkb_C mol:protein length:180  Putative Nudix hydrolase 
yfcD\nMEQRRLASTEWVDIVNEENEVIAQASREQMRAQCLRHRATYIVVHDGMGKILVQRRTETKDFLPGMLDATAGGVVQADEQLLESARREAEEELGIAGVPFAEHGQFYFEDKNCRVWGALFSCVSHGPFALQEDEVSEVCWLTPEEITARCDEFTPDSLKALALWMKRNAKNEAVETETAE\n>4z2y_A mol:protein length:359  CalO6\nGSHMELTTTAARPGLRHRMQQLIYGFFTAQTLHVAVRLRIPDLLADGARDVGDLASATGADAPSLRRLLRALVFLEVLDEPAPGTFALTEQGEVLRADVTGSMRELVLLLSGPESWAAWGQLEHSVRTGEVAWEHVHGRSCFDHLMADPQRQAAFNAAMAEGSRAFVPTLLSAYDFGDLRTVVDVGGGSGALLAGVLAAHPHLRGTVFDTPDGVADAARTVAEQGVADRCGVETGDFFVSVPPGADAYVLKSVLHDWDDEQCVEVLRTVRRAVRPDSRVILVESLMPTTVTTAPSVAQVVMNDLNMMVCHGGRERTVAEFRELLRVAGFRLESVTPCPAPSVVGILEAAPAPATGPDGS\n>2prf_A mol:protein length:125  PROFILIN IA\nSWQTYVDTNLVGTGAVTQAAILGLDGNTWATSAGFAVTPAQGQTLASAFNNADPIRASGFDLAGVHYVTLRADDRSIYGKKGSAGVITVKTSKSILVGVYNEKIQPGTAANVVEKLADYLIGQGF\n>5m32_I mol:protein length:205  Proteasome subunit beta type-3\nMSIMSYNGGAVMAMKGKNCVAIAADRRFGIQAQMVTTDFQKIFPMGDRLYIGLAGLATDVQTVAQRLKFRLNLYELKEGRQIKPYTLMSMVANLLYEKRFGPYYTEPVIAGLDPKTFKPFICSLDLIGCPMVTDDFVVSGTCAEQMYGMCESLWEPNMDPDHLFETISQAMLNAVDRDAVSGMGVIVHIIEKDKITTRTLKARMD\n>1xm2_A mol:protein length:173  Tyrosine Phosphatase\nMARMNRPAPVEVTYKNMRFLITHNPTNATLNKFIEELKKYGVTTIVRVCEATYDTTLVEKEGIHVLDWPFDDGAPPSNQIVDDWLSLVKIKFREEPGCCIAVHSVAGLGRAPVLVALALIEGGMKYEDAVQFIRQKRRGAFNSKQLLYLEKYRPKMRLRFKDSNGHRNNCCIQ\n>1nez_B mol:protein length:99  Beta-2-microglobulin\nIQKTPQIQVYSRHPPENGKPNILNCYVTQFHPPHIEIQMLKNGKKIPKVEMSDMSFSKDWSFYILAHTEFTPTETDTYACRVKHDSMAEPKTVYWDRDM\n>6i50_A mol:protein length:170  SFRICE_029225\nRPFIAAHFHGNTSHLNSAIHDHYKGNGLVRVSHDAPHDVWYPAPWTVASPHPRPTLTRTGHVHVHHTGVYLVYVQIYYLDSHDTISWVLHRTNADIEGRETLLQCAQSSYSTEPIDKPNSCFSAAALFLKAGDRLAVRNTAGDRHSLMQPEKSFIGLVKLADAEDPTQEL\n>5zbo_c mol:protein length:209  Capsid protein\nMGSSHHHHHHSSGLVPRGSHFNTRLSRTFGYTIKRTTVKTPSWAVDMMRFNINDFLPPGGGSNPRSVPFEYYRIRKVKVEFWPCSPITQGDRGVGSSAVILDDNFVTKATALTYDPYVNYSSRHTITQPFSYHSRYFTPKPVLDSTIDYFQPNNKRNQLWLRLQTAGNVDHVGLGTAFENSIYDQEYNIRVTMYVQFREFNLKDPPLNP\n>5j8a_BM mol:protein length:114  30S ribosomal protein 
S13\nARIAGINIPDHKHAVIALTSIYGVGKTRSKAILAAAGIAEDVKISELSEGQIDTLRDEVAKFVVEGDLRREISMSIKRLMDLGCYRGLRHRRGLPVRGQRTKTNARTRKGPRKP\n>7ban_B mol:protein length:1932  Teneurin-4\nMETACGDSKDNDGDGLVDCMDPDCCLQPLCHINPLCLGSPNPLDIIQETQVPVSQQNLHSFYDRIKFLVGRDSTHIIPGENPFDGGHACVIRGQVMTSDGTPLVGVNISFVNNPLFGYTISRQDGSFDLVTNGGISIILRFERAPFITQEHTLWLPWDRFFVMETIIMRHEENEIPSCDLSNFARPNPVVSPSPLTSFASSCAEKGPIVPEIQALQEEISISGCKMRLSYLSSRTPGYKSVLRISLTHPTIPFNLMKVHLMVAVEGRLFRKWFAAAPDLSYYFIWDKTDVYNQKVFGLSEAFVSVGYEYESCPDLILWEKRTTVLQGYEIDASKLGGWSLDKHHALNIQSGILHKGNGENQFVSQQPPVIGSIMGNGRRRSISCPSCNGLADGNKLLAPVALTCGSDGSLYVGDFNYIRRIFPSGNVTNILELRNKDFRHSHSPAHKYYLATDPMSGAVFLSDSNSRRVFKIKSTVVVKDLVKNSEVVAGTGDQCLPFDDTRCGDGGKATEATLTNPRGITVDKFGLIYFVDGTMIRRIDQNGIISTLLGSNDLTSARPLSCDSVMDISQVHLEWPTDLAINPMDNSLYVLDNNVVLQISENHQVRIVAGRPMHCQVPGIDHFLLSKVAIHATLESATALAVSHNGVLYIAETDEKKINRIRQVTTSGEISLVAGAPSGCDCKNDANCDCFSGDDGYAKDAKLNTPSSLAVCADGELYVADLGNIRIRFIRKNKPFLNTQNMYELSSPIDQELYLFDTTGKHLYTQSLPTGDYLYNFTYTGDGDITLITDNNGNMVNVRRDSTGMPLWLVVPDGQVYWVTMGTNSALKSVTTQGHELAMMTYHGNSGLLATKSNENGWTTFYEYDSFGRLTNVTFPTGQVSSFRSDTDSSVHVQVETSSKDDVTITTNLSASGAFYTLLQDQVRNSYYIGADGSLRLLLANGMEVALQTEPHLLAGTVNPTVGKRNVTLPIDNGLNLVEWRQRKEQARGQVTVFGRRLRVHNRNLLSLDFDRVTRTEKIYDDHRKFTLRILYDQAGRPSLWSPSSRLNGVNVTYSPGGYIAGIQRGIMSERMEYDQAGRITSRIFADGKTWSYTYLEKSMVLLLHSQRQYIFEFDKNDRLSSVTMPNVARQTLETIRSVGYYRNIYQPPEGNASVIQDFTEDGHLLHTFYLGTGRRVIYKYGKLSKLAETLYDTTKVSFTYDETAGMLKTINLQNEGFTCTIRYRQIGPLIDRQIFRFTEEGMVNARFDYNYDNSFRVTSMQAVINETPLPIDLYRYDDVSGKTEQFGKFGVIYYDINQIITTAVMTHTKHFDAYGRMKEVQYEIFRSLMYWMTVQYDNMGRVVKKELKVGPYANTTRYSYEYDADGQLQTVSINDKPLWRYSYDLNGNLHLLSPGNSARLTPLRYDIRDRITRLGDVQYKMDEDGFLRQRGGDIFEYNSAGLLIKAYNRAGSWSVRYRYDGLGRRVSSKSSHSHHLQFFYADLTNPTKVTHLYNHSSSEITSLYYDLQGHLFAMELSSGDEFYIACDNIGTPLAVFSGTGLMIKQILYTAYGEIYMDTNPNFQIIIGYHGGLYDPLTKLVHMGRRDYDVLAGRWTSPDHELWKHLSSSNVMPFNLYMFKNNNPISNSQDIKCFMTDVNSWLLTFGFQLHNVIPGYPKPDMDAMEPSYELIHTQMKTQEWDNSKSILGVQCEVQKQLKAFVTLERFDQLYGSTITSCQQAPKTKKFASSGSVFGKGVKFALKDGRVTTDIICVANEDGRRVAAILNHAHYLENLHFTIDGVDTHYFVKPGPSEGDLAILGLSGGRRTLENGVNVTVSQINTVLNGRTRRYTDIQ
LQYGALCLNTRYGTTLDEEKARVLELARQRAVRQAWAREQQRLREGEEGLRAWTEGEKQQVLSTGRVQGYDGFFVISVEQYPELSDSANNIHFMRQSE\n>4o6c_D mol:protein length:377  NS1\nAEHHHHHHSSGVDLGTENLYFQSNADTGCAIDISRQELRCGSGVFIHNDVEAWMDRYKYYPETPQGLAKIIQKAHKEGVCGLRSVSRLEHQMWEAVKDELNTLLKENGVDLSVVVEKQEGMYKSAPKRLTATTEKLEIGWKAWGKSILFAPELANNTFVVDGPETKECPTQNRAWNSLEVEDFGFGLTSTRMFLKVRESNTTECDSKIIGTAVKNNLAIHSDLSYWIESRLNDTWKLERAVLGEVKSCTWPETHTLWGDGILESDLIIPVTLAGPRSNHNRRPGYKTQNQGPWDEGRVEIDFDYCPGTTVTLSESCGHRGPATRTTTESGKLITDWCCRSCTLPPLRYQTDSGCWYGMEIRPQRHDEKTLVQSQVNA\n>5wyk_AD mol:protein length:575  Utp9\nXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX\n>6grj_D mol:protein length:367  AhlB\nMTNATTITMDQGMANQASQAMQIQTYCNSVKQQVPVDFSQFPNLKDNQTQINQGLDLAKGHADLYLNTIQPQIITNISNISNYFALQNAIPAVLPPGSTKAQWLRQLSVIKEQATEYQRLSSDTRLVIVNLNNNLITDSSNFQGIVVNLNSKVQGDNGVLAQLNGDIDKVNAAIDGAIAGIVAGGLLVIGGAFVTAIGAVADFVTAGTSTPVVIGGVAMMVAGAGGITAGAIVLHNSLGARQDLYQKRSSLNSEVLIATQIGNGYKGLQVQAQNAVTAATQMSNAWDSLTSDLGSLITDLDKGITSGDDIRQLWLTAADTTVKTVLTDVTTIKAQIAGVSPLQVPQTDTIANFVARLAALEHHHHHH\n>3ria_G mol:protein length:221  Mouse monoclonal Fab fragment, heavy chain\nEVQLQQSGPELVRPGASMKISCKASGYSFTGYTMNWVKQSHGKNLEWIGLINPYNGGTSYNQKFKGKATLTVDKSSSTAYMELLSLTSEDSAVYYCARDGDYYRYGRYFDYWGQGTTLTVSSAKTTPPSVYPLAPGSAAQTNSMVTLGCLVKGYFPEPVTVTWNSGSLSSGVHTFPAVLQSDLYTLSSSVTVPSSTWPSETVTCNVAHPASSTKVDKKIVP\n>3jbv_u mol:protein length:104  50S ribosomal protein 
L24\nMAAKIRRDDEVIVLTGKDKGKRGKVKNVLSSGKVIVEGINLVKKHQKPVPALNQPGGIVEKEAAIQVSNVAIFNAATGKADRVGFRFEDGKKVRFFKSNSETIK\n>6tj2_B mol:protein length:285  Alpha/beta hydrolase\nMKSIHIKIVLALCISIFTIMGLQPLNQHSTVAAANHKSSTKQTPLTFVLIHGSWATAGFWDETASELRKLGHTVYTPEYAGHGADKNNNVTHEQITKSVVDYIKQKDLKDFILLGHSFGGSVIQTVSQQVPDRIKRIVFFDAFAPLDGQSVADQFPAESLKSFEQLRDASGNNTITLPFPLFRDTFVNTASLAQAQAFYKQAPPEPATPLFEKLDLKKFYSLQIPKSYLYLTEDTAIPQGPYGFHPTQSSHLGVFRFIEGKGDHMTTVRTEPKMMAELMVKAGRD\n>1vy7_AC mol:protein length:239  30S ribosomal protein S3\nMGNKIHPIGFRLGITRDWESRWYAGKKQYRHLLLEDQRIRGLLEKELYSAGLARVDIERAADNVAVTVHVAKPGVVIGRGGERIRVLREELAKLTGKNVALNVQEVQNPNLSAPLVAQRVAEQIERRFAVRRAIKQAVQRVMESGAKGAKVIVSGRIGGAEQARTEWAAQGRVPLHTLRANIDYGFALARTTYGVLGVKAYIFLGEVIGGQKPKARPELPKAEERPRRRRPAVRVKKEE\n>6q16_AJ mol:protein length:252  Lipoprotein PrgK\nMIRRYLYTFLLVMTLAGCKDKDLLKGLDQEQANEVIAVLQMHNIEANKIDSGKLGYSITVAEPDFTAAVYWIKTYQLPPRPRVEIAQMFPADSLVSSPRAEKARLYSAIEQRLEQSLQTMEGVLSARVHISYDIDAGENGRPPKPVHLSALAVYERGSPLAHQISDIKRFLKNSFADVDYDNISVVLSERSDAQLQAPGTPVKRNSFATSWIVLIILLSVMSAGFGVWYYKNHYARNKKGITADDKAKSSNE\n>2bo9_C mol:protein length:308  CARBOXYPEPTIDASE A4\nSSNNFNYGAYHSLEAIYHEMDNIAADFPDLARRVKIGHSFENRPMYVLKFSTGKGVRRPAVWLNAGIHSREWISQATAIWTARKIVSDYQRDPAITSILEKMDIFLLPVANPDGYVYTQTQNRLWRKTRSRNPGSSCIGADPNRNWNASFAGKGASDNPCSEVYHGPHANSEVEVKSVVDFIQKHGNFKGFIDLHSYSQLLMYPYGYSVKKAPDAEELDKVARLAAKALASVSGTEYQVGPTCTTVYPASGSSIDWAYDNGIKFAFTFELRDTGTYGFLLPANQIIPTAEETWLGLKTIMEHVRDNLY\n>7jor_A mol:protein length:137  Dehaloperoxidase B\nGFKQDIATLRGDLRTYAQDIFLAFLNKYPDEKRNFKNYVGKSDQELKSMAKFGDHTEKVFNLMMEVADRATDCVPLASDASTLVQMKQHSGLTTGNFEKLFVALVEYMRASGQSFDSQSWDRFGKNLVSALSSAGMK\n>5o09_2C mol:protein length:238  Bacterial kinesin light chain\nDTALERQIASASRSVEEARRLAYHDPIRVGALVEQISVLADLRQKEGDFRKAESLYREALFRAQELRKQDPDLLTGIYSLLAHLYDRWGRMDKAAEFYELALKISAENGLEESDKVATIKNNLAMIFKQLRKFERAEGYYCEALETFQRLDGEQSARVASVYNNLGVLYYSHMDVDRAQVMHERALAIRQNLHEGQMDPADLSQTFINLGAVYKAAGDFQKAEACVDRAKRIRAAMNG\n>6eq4_A mol:protein length:182  7,8-dihydro-8-oxoguanine 
triphosphatase\nMKHHHHHHPMSDYDIPTTENLYFQGAMGASRLYTLVLVLQPQRVLLGMKKRGFGAGRWNGFGGKVQEGETIEDGARRELQEESGLTVDALHKVGQIVFEFVGEPELMDVHVFCTDSIQGTPVESDEMRPCWFQLDQIPFKDMWPDDSYWFPLLLQKKKFHGYFKFQGQDTILDYTLREVDTV\n>7ezx_NP mol:protein length:161  Allophycocyanin alpha subunit\nMSIVTKSIVNADAEARYLSPGELDRIKSFVLSGQRRLRIAQTLTENRERIVKQGGQQLFQRRPDVVSPGGNAYGEEMTATCLRDLDYYLRLVTYGIIAGDVTPIEEIGLVGVKEMYSALGTPISGVAEGIRCMKDVACSLLSGEDAAEVGFYFDYTLAAMQ\n>5aqj_B mol:protein length:118  BAG FAMILY MOLECULAR CHAPERONE REGULATOR 1\nGPLGSNSPQEEVELKKLKHLEKSVEKIADQLEELNKELTGIQQGFLPKDLQAEALCKLDRRVKATIEQFMKILEEIDTLILPENFKDSRLKRKGLVKKVQAFLAECDTVEQNICQETE\n>6d8s_A mol:protein length:31  Potassium channel toxin alpha-KTx 5.4\nAFCNLRRCELSCRSLGLLGKCIGEECECVPY\n>1wgj_B mol:protein length:286  INORGANIC PYROPHOSPHATASE\nTYTTRQIGAKNTLEYKVYIEKDGKPVSAFHDIPLYADKENNIFNMVVEIPRWTNAKLEITKEETLNPIIQDTKKGKLRFVRNCFPHHGYIHNYGAFPQTWEDPNVSHPETKAVGDNDPIDVLEIGETIAYTGQVKQVKALGIMALLDEGETDWKVIAIDINDPLAPKLNDIEDVEKYFPGLLRATNEWFRIYKIPDGKPENQFAFSGEAKNKKYALDIIKETHDSWKQLIAGKSSDSKGIDLTNVTLPDTPTYSKAASDAIPPASLKADAPIDKSIDKWFFISGSV\n>4jfz_H mol:protein length:235  Fab heavy chain\nEISEVQLVESGGGLVQPGGSLRLSCVTSGFTFRKFGMSWVRQAPGKGLEWVASIATGGHTTYYSDSVKGRFTISRDNSKNTLYLQMNSLRAEDTAVYYCTRGYSSTSYAMDYWGQGTLVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDKSHTATGA\n>5gup_Aj mol:protein length:47  Cytochrome c oxidase subunit 7C, mitochondrial\nSHYEEGPGKNIPFSVENKWRLLAMMTLFFGSGFAAPFFIVRHQLLKK\n>4e8g_B mol:protein length:391  Mandelate racemase/muconate lactonizing enzyme, N-terminal domain protein\nMHHHHHHSSGVDLGTENLYFQSMKIAEIHVYAHDLPVKDGPYTIASSTVWSLQTTLVKIVADSGLAGWGETCPVGPTYAPSHALGARAALAEMAPGLIGANPLQPLVLRRRMDGLLCGHNYAKAAIDIAAYDLMGKHYGVRVADLLGGVAAERVPSYYATGIGQPDEIARIAAEKVAEGFPRLQIKIGGRPVEIDIETVRKVWERIRGTGTRLAVDGNRSLPSRDALRLSRECPEIPFVLEQPCNTLEEIAAIRGRVQHGIYLDESGEDLSTVIRAAGQGLCDGFGMKLTRIGGLQQMAAFRDICEARALPHSCDDAWGGDIIAAACTHIGATVQPRLNEGVWVAQPYIAQPYDEENGIRIAGGHIDLPKGPGLGITPDESLFGPPVASFS\n>4h5r_B 
mol:protein length:383  Heat shock cognate 71 kDa protein\nSKGPAVGIDLGTTYSCVGVFQHGKVEIIANDQGNRTTPSYVAFTDTERLIGDAAKNQVAMNPTNTVFDAKRLIGRRFDDAVVQSDMKHWPFMVVNDAGRPKVQVEYKGETKSFYPEEVSSMVLTKMKEIAEAYLGKTVTNAVVTVPAYFNDSQRQATKDAGTIAGLNVLRIINEPTAAAIAYGLDKKVGAERNVLIFDLGGGTFDVSILTIEDGIFEVKSTAGDTHLGGEDFDNRMVNHFIAEFKRKHKKDISENKRAVRRLRTACERAKRTLSSSTQASIEIDSLYEGIDFYTSITRARFEELNADLFRGTLDPVEKALRDAKLDKSQIHDIVLVGGSTRIPKIQKLLQDFFNGKELNKSINPDEAVAYGAAVQAAILSGDK\n>6uea_J mol:protein length:245  Immunoglobulin heavy constant alpha 2\nDYKDDDDKLVPRGSCHPRLSLHRPALEDLLLGSEANLTCTLTGLRDASGATFTWTPSSGKSAVQGPPERDLCGCYSVSSVLPGCAQPWNHGETFTCTAAHPELKTPLTANITKSGNTFRPEVHLLPPPSEELALNELVTLTCLARGFSPKDVLVRWLQGSQELPREKYLTWASRQEPSQGTTTYAVTSILRVAAEDWKKGETFSCMVGHEALPLAFTQKTIDRLAGKPTHINVSVVMAEADGTCY\n>3pi4_A mol:protein length:152  Hemoglobin II\nXTTLTNPQKAAIRSSWSKFMDNGVSNGQGFYMDLFKAHPETLTPFKSLFGGLTLAQLQDNPKMKAQSLVFCNGMSSFVDHLDDNDMLVVLIQKMAKLHNNRGIRASDLRTAYDILIHYMEDHNHMVGGAKDAWEVFVGFICKTLGDYMKELS\n>4hmj_A mol:protein length:143  Thermonuclease\nATSTKKLHKEPATLIKAIDGDTVKLMYKGQPMTFRDLLVDTPEFNEKYGPEASAFTKKMVENAKKIEVEFDKGQRTDKYGRGLAYIYADGKMVNEALVRQGLAKVAYVYKGNNTHEQLLRKAEAQAKKEKLNIWSEDNADSGQ\n>6hhq_AC mol:protein length:59  60S ribosomal protein L29\nMAKSKNHTAHNQTRKAHRNGIKKPKTYKYPSLKGVDPKFRRNHKHALHGTAKALAAAKK\n>2c37_X mol:protein length:248  PROBABLE EXOSOME COMPLEX EXONUCLEASE 1\nMREMLQVERPKLILDDGKRTDGRKPDELRSIKIELGVLKNADGSAIFEMGNTKAIAAVYGPKEMHPRHLSLPDRAVLRVRYHMTPFSTDERKNPAPSRREIELSKVIREALESAVLVELFPRTAIDVFTEILQADAGSRLVSLMAASLALADAGIPMRDLIAGVAVGKADGVIILDLNETEDMWGEADMPIAMMPSLNQVTLFQLNGSMTPDEFRQAFDLAVKGINIIYNLEREALKSKYVEFKEEGV\n>1gvd_A mol:protein length:52  MYB PROTO-ONCOGENE PROTEIN\nLIKGPWTKEEDQRLIKLVQKYGPKRWSVIAKHLKGRIGKQCRERWHNHLNPE\n>5d2q_A mol:protein length:102  Fibroin-modulator-binding protein-1\nMHHHHHHETSEERAARLAKMSAYAAQRLANESPEQRATRLKRMSEYAAKRLSSETREQRAIRLARMSAYAARRLANETPAQRQARLLRMSAYAAKRQASKKS\n>1u8t_F mol:protein length:16  Flagellar motor switch protein fliM\nMGDSILSQAEIDALLN\n>2vj0_P mol:protein length:12 
 SYNAPTOJANIN-1\nNPKGWVTFEEEE\n>6opd_A mol:protein length:275  HLA class I histocompatibility antigen, A-2 alpha chain\nGSHSMRYFFTSVSRPGRGEPRFIAVGYVDDTQFVRFDSDAASQRMEPRAPWIEQEGPEYWDGETRKVKAHSQTHRVDLGTLRGYYNQSEAGSHTVQRMYGCDVGSDWRFLRGYHQYAYDGKDYIALKEDLRSWTAADMAAQTTKHKWEAAHVAEQLRAYLEGTCVEWLRRYLENGKETLQRTDAPKTHMTHHAVSDHEATLRCWALSFYPAEITLTWQRDGEDQTQDTELVETRPAGDGTFQKWAAVVVPSGQEQRYTCHVQHEGLPKPLTLRWE\n>4jaw_B mol:protein length:644  Lacto-N-biosidase\nMGSSHHHHHHSSGLVPRGSHMGYSATAPVNLTRPATVPSMDGWTDGTGAWTLGEGTRVVSSDALAARAQSLASELTKFTDVDIKAATGSATGKDISLTLDASKKAELGDEGFKLNIGSKGLEVIGATDIGVFYGTRSVSQMLRQGQLTLPAGTVATKPKYKERGATLCACQINISTDWIDRFLSDMADLRLNYVLLEMKLKPEEDNTKKAATWSYYTRDDVKKFVKKANNYGIDVIPEINSPGHMNVWLENYPEYQLADNSGRKDPNKLDISNPEAVKFYKTLIDEYDGVFTTKYWHMGADEYMIGTSFDNYSKLKTFAEKQYGAGATPNDAFTGFINDIDKYVKAKGKQLRIWNDGIVNTKNVSLNKDIVIEYWYGAGRKPQELVQDGYTLMNATQALYWSRSAQVYKVNAARLYNNNWNVGTFDGGRQIDKNYDKLTGAKVSIWPDSSYFQTENEVEKEIFDGMRFISQMTWSDSRPWATWNDMKADIDKIGYPLDIREYDYTPVDAGIYDIPQLKSISKGPWELITTPDGYYQMKDTVSGKCLALFTGSKHLDVVTQVGARPELRNCADVSVGQDQRNTANERNTQKWQIRADKDGKYTISPALTQQRLAIATGNEQNIDLETHRPAAGTVAQFPADLVSD\n>5e7r_A mol:protein length:314  TAK1 kinase - TAB1 chimera fusion protein\nSLHMIDYKEIEVEEVVGRGAFGVVCKAKWRAKDVAIKQIESESERKAFIVELRQLSRVNHPNIVKLYGACLNPVCLVMEYAEGGSLYNVLHGAEPLPYYTAAHAMSWCLQCSQGVAYLHSMQPKALIHRDLKPPNLLLVAGGTVLKICDFGTACDIQTHMTNNKGSAAWMAPEVFEGSNYSEKCDVFSWGIILWEVITRRKPFDEIGGPAFRIMWAVHNGTRPPLIKNLPKPIESLMTRCWSKDPSQRPSMEEIVKIMTHLMRYFPGADEPLQYPCQHSLPPGEDGRVEPYVDFAEFYRLWSVDHGEQSVVTAP\n>4ndy_W mol:protein length:74  Centromere protein X\nSGFRKELVSRLLHLHFKDDKTKVSGDALQLMVELLKVFVVEAAVRGVRQAQAEDALRVDVDQLEKVLPQLLLDF\n>6u5t_G mol:protein length:2073  Fatty acid synthase subunit 
beta\nMDAYSTRPLTLSHGSLEHVLLVPTASFFIASQLQEQFNKILPEPTEGFAADDEPTTPAELVGKFLGYVSSLVEPSKVGQFDQVLNLCLTEFENCYLEGNDIHALAAKLLQENDTTLVKTKELIKNYITARIMAKRPFDKKSNSALFRAVGEGNAQLVAIFGGQGNTDDYFEELRDLYQTYHVLVGDLIKFSAETLSELIRTTLDAEKVFTQGLNILEWLENPSNTPDKDYLLSIPISCPLIGVIQLAHYVVTAKLLGFTPGELRSYLKGATGHSQGLVTAVAIAETDSWESFFVSVRKAITVLFFIGVRCYEAYPNTSLPPSILEDSLENNEGVPSPMLSISNLTQEQVQDYVNKTNSHLPAGKQVEISLVNGAKNLVVSGPPQSLYGLNLTLRKAKAPSGLDQSRIPFSERKLKFSNRFLPVASPFHSHLLVPASDLINKDLVKNNVSFNAKDIQIPVYDTFDGSDLRVLSGSISERIVDCIIRLPVKWETTTQFKATHILDFGPGGASGLGVLTHRNKDGTGVRVIVAGTLDINPDDDYGFKQEIFDVTSNGLKKNPNWLEEYHPKLIKNKSGKIFVETKFSKLIGRPPLLVPGMTPCTVSPDFVAATTNAGYTIELAGGGYFSAAGMTAAIDSVVSQIEKGSTFGINLIYVNPFMLQWGIPLIKELRSKGYPIQFLTIGAGVPSLEVASEYIETLGLKYLGLKPGSIDAISQVINIAKAHPNFPIALQWTGGRGGGHHSFEDAHTPMLQMYSKIRRHPNIMLIFGSGFGSADDTYPYLTGEWSTKFDYPPMPFDGFLFGSRVMIAKEVKTSPDAKKCIAACTGVPDDKWEQTYKKPTGGIVTVRSEMGEPIHKIATRGVMLWKEFDETIFNLPKNKLVPTLEAKRDYIISRLNADFQKPWFATVNGQARDLATMTYEEVAKRLVELMFIRSTNSWFDVTWRTFTGDFLRRVEERFTKSKTLSLIQSYSLLDKPDEAIEKVFNAYPAAREQFLNAQDIDHFLSMCQNPMQKPVPFVPVLDRRFEIFFKKDSLWQSEHLEAVVDQDVQRTCILHGPVAAQFTKVIDEPIKSIMDGIHDGHIKKLLHQYYGDDESKIPAVEYFGGESPVDVQSQVDSSSVSEDSAVFKATSSTDEESWFKALAGSEINWRHASFLCSFITQDKMFVSNPIRKVFKPSQGMVVEISNGNTSSKTVVTLSEPVQGELKPTVILKLLKENIIQMEMIENRTMDGKPVSLPLLYNFNPDNGFAPISEVMEDRNQRIKEMYWKLWIDEPFNLDFDPRDVIKGKDFEITAKEVYDFTHAVGNNCEDFVSRPDRTMLAPMDFAIVVGWRAIIKAIFPNTVDGDLLKLVHLSNGYKMIPGAKPLQVGDVVSTTAVIESVVNQPTGKIVDVVGTLSRNGKPVMEVTSSFFYRGNYTDFENTFQKTVEPVYQMHIKTSKDIAVLRSKEWFQLDDEDFDLLNKTLTFETETEVTFKNANIFSSVKCFGPIKVELPTKETVEIGIVDYEAGASHGNPVVDFLKRNGSTLEQKVNLENPIPIAVLDSYTPSTNEPYARVSGDLNPIHVSRHFASYANLPGTITHGMFSSASVRALIENWAADSVSSRVRGYTCQFVDMVLPNTALKTSIQHVGMINGRKLIKFETRNEDDVVVLTGEAEIEQPVTTFVFTGQGSQEQGMGMDLYKTSKAAQDVWNRADNHFKDTYGFSILDIVINNPVNLTIHFGGEKGKRIRENYSAMIFETIVDGKLKTEKIFKEINEHSTSYTFRSEKGLLSATQFTQPALTLMEKAAFEDLKSKGLIPADATFAGHSLGEYAALASLADVMSIESLVEVVFYRGMTMQVAVPRDELGRSNYGMIAINPGRVAASFSQEALQYVVERVGKRTGWLVEIVNYNVENQQYVAAGDLRALDTVTNVLNFIKLQKIDIIELQKSLSLEEVEGHLFEIIDEASKKSAVKPRPLKLERGFACIPLVGISVPFHSTYLMNGVKPFKSFLKK
NIIKENVKVARLAGKYIPNLTAKPFQVTKEYFQDVYDLTGSEPIKEIIDNWEKYEQSDYKDHDGDYKDHDIDYKDDDDK\n>2cbo_A mol:protein length:115  NEOCARZINOSTATIN\nAAPTATVTPSSGLSDGTVVKVAGAGLQAGTAYWVAQWARVDTGVWAYNPADNSSVTADANGSASTSLTVRRSFEGFLFDGTRWGTVDCTTAACQVGLSDAAGNGPEGVAISFNHH\n>7z46_N mol:protein length:352  Major head protein\nMANPTLFVSYDQNGKKLSFANWISVLSPQDTPFVSMTGKESINQTIFSWQTDALASVDGNNAHVEGSRAEDGEMKPTVIKSNVTQILRKVVRVSDTANTTANYGRGRELMYQLEKKGKEIKRDLEKILLSGQARTDVLADQYLTNSAADPAVAGLNDTHAARKTGAFQFLCAHGGLAGGVVDKTKNGPADPDTGAVTVKVAQNASNPTTNIGFDEADIFDMTLQLYTAGSEADIIMINPAHAKIFAGLQENTQGSRKRIFENTKQFIYEVNSITDPLGQSYKIIVNRWMPTDAVYFFRSADWTQMVLRAPKRTELAKDGSYEKWMIEMEVGLRHRNPYASGVLFTAAGKAAA\n>1hmv_D mol:protein length:440  HIV-1 REVERSE TRANSCRIPTASE (SUBUNIT P51)\nPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFKKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETF\n>6e34_AN mol:protein length:233  Capsid protein of PCV2\nMTYPRRRYRRRRHRPRSHLGQILRRRPWLVHPRHRYRWRRKNGIFNTRLSRTFGYTIKRTTVKTPSWAVDMMRFNINDFLPPGGGSNPRSVPFEYYRIRKVKVEFWPCSPITQGDRGVGSSAVILDDNFVTKATALTYDPYVNYSSRHTITQPFSYHSRYFTPKPVLDSTIDYFQPNNKRNQLWLRLQTAGNVDHVGLGTAFENSIYDQEYNIRVTMYVQFREFNLKDPPLNP\n>7z4a_X mol:protein length:352  Major head protein\nMANPTLFVSYDQNGKKLSFANWISVLSPQDTPFVSMTGKESINQTIFSWQTDALASVDGNNAHVEGSRAEDGEMKPTVIKSNVTQILRKVVRVSDTANTTANYGRGRELMYQLEKKGKEIKRDLEKILLSGQARTDVLADQYLTNSAADPAVAGLNDTHAARKTGAFQFLCAHGGLAGGVVDKTKNGPADPDTGAVTVKVAQNASNPTTNIGFDEADIFDMTLQLYTAGSEADIIMINPAHAKIFAGLQENTQGSRKRIFENTKQFIYEVNSITDPLGQSYKIIVNRWMPTDAVYFFRSADWTQMVLRAPKRTELAKDGSYEKWMIEMEVGLRHRNPYASGVLFTAAGKAAA\n>3l51_B mol:protein length:166  Structural maintenance of chromosomes protein 
4\nGKVLDAIIQEKKSGRIPGIYGRLGDLGAIDEKYDIAISSCCHALDYIVVDSIDTAQECVNFLKKHNIGIATFIGLDKMTVWAKKMSKIQTPENTPRLFDLVKVKNEEIRQAFYFALRDTLVANNLDQATRVAYQRDRRWRVVTLQGQIIEQSGTMSGGLEHHHHHH\n>5f59_A mol:protein length:154  Histone-lysine N-methyltransferase 2C\nSKSSQYRKMKTEWKSNVYLARSRIQGLGLYAARDIEKHTMVIEYIGTIIRNEVANRKEKLYESQNRGVYMFRMDNDHVIDATLTGGPARYINHSCAPNCVAEVVTFERGHKIIISSSRRIQKGEELCYDYKFDFEDDQHKIPCHCGAVNCRKWM\n>6tuv_D mol:protein length:76  Polyubiquitin-C\nMQIFVKTLTGKTITLEVEPSDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGG\n>3gfj_A mol:protein length:146  146aa long hypothetical transcriptional regulator\nMLESNENRIQIMSTIAKIYRAMSRELNRRLGELNLSYLDFLVLRATSDGPKTMAYLANRYFVTQSAITASVDKLEEMGLVVRVRDREDARKILIEITEKGLETFNKGIEIYKKLANEVTGDLSEDEVILVLDKISKILKRIEEISQ\n>4lf4_H mol:protein length:138  ribosomal protein S8\nMLTDPIADMLTRIRNATRVYKESTDVPASRFKEEILRILAREGFIKGYERVDVDGKPYLRVYLKYGPRRQGPDPRPEQVIHHIRRISKPGRRVYVGVKEIPRVRRGLGIAILSTSKGVLTDREARKLGVGGELICEVW\n>5j4d_KC mol:protein length:65  50S ribosomal protein L35\nMPKMKTHKGAKKRVKITASGKVVAMKTGKRHLNWQKSGKEIRQKGRKFVLAKPEAERIKLLLPYE\n>2hnb_A mol:protein length:147  Protein mioC\nMADITLISGSTLGGAEYVAEHLAEKLEEAGFTTETLHGPLLEDLPASGIWLVISSTHGAGDIPDNLSPFYEALQEQKPDLSAVRFGAIGIGSREYDTFCGAIDKLEAELKNSGAKQTGETLKINILDHDIPEDPAEEWLGSWVNLLK\n>7c2b_C mol:protein length:115  Thioredoxin F2, chloroplastic\nETVNVTVGQVTEVDKDTFWPIVKAAGDKIVVLDMYTQWCGPSKVIAPKYKELSEKYQDMVFLKLDCNQDNKPLAKELGIRVVPTFKILKDNKVVKEVTGAKYEDLLAAIEAARSG\n>6be2_H mol:protein length:227  Fab (F598) Heavy Chain\nQVQLQESGPGLVKPSETLSLTCTVSGGSISGYYWSWIRQPPGKGLEWIGYIHYSRSTNSNPALKSRVTISSDTSKNQLSLRLSSVTAADTAVYYCARDTYYYDSGDYEDAFDIWGQGTMVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKAEPKSC\n>6uti_E mol:protein length:227  Proteasome subunit 
alpha\nAYDRAITVFSPDGRLFQVEYAREAVKKGSTALGMKFANGVLLISDKKVRSRLIEQNSIEAIQLIDDYVAAVTSGLVADARVLVDFARISAQQEKVTYGSLVNIENLVKRVADQMQQYTQYGGVRPYGVSLIFAGIDQIGPRLFDCDPAGTINEYKATAIGSGKDAVVSFLEREYKENLPEKEAVTLGIKALKSSLEEGEELKAPEIASITVGNKYRIYDQEEVKKFL\n>6rxq_B mol:protein length:254  NAD-dependent protein deacylase\nMGSSHHHHHHSQDPKPRVLVLTGAGISAESGIRTFRAADGLWEEHRVEDVGTPEGFDRDPELVQAFYNARRRQLQQPEIQPNAAHLALAKLQDALGDRFLLVTQNCDNLHERAGNTNVIHMHGELLKVRCSQSGQALDWTGDVTPEDKCHCCQFPAPLRPHVVWFGEMPLGMDEIYMALSMADIFIAIGTSGHVYPAAGFVHEAKLHGAHTVELNLEPSQVGNEFAEKYYGPASQVVPEFVEKLLKGLKAGSIA\n>2vil_A mol:protein length:126  VILLIN 14T\nVELSKKVTGKLDKTTPGIQIWRIENMEMVPVPTKSYGNFYEGDCYVLLSTRKTGSGFSYNIHYWLGKNSSQDEQGAAAIYTTQMDEYLGSVAVQHREVQGHESETFRAYFKQGLIYKQGGVASGMK\n>5szs_C mol:protein length:1325  Spike glycoprotein\nFFTCNSNANLSMLQLGVPDNSSTIVTGLLPTHWFCANQSTSVYSANGFFYIDVGNHRSAFALHTGYYDANQYYIYVTNEIGLNASVTLKICKFSRNTTFDFLSNASSSFDCIVNLLFTEQLGAPLGITISGETVRLHLYNVTRTFYVPAAYKLTKLSVKCYFNYSCVFSVVNATVTVNVTTHNGRVVNYTVCDDCNGYTDNIFSVQQDGRIPNGFPFNNWFLLTNGSTLVDGVSRLYQPLRLTCLWPVPGLKSSTGFVYFNATGSDVNCNGYQHNSVVDVMRYNLNFSANSLDNLKSGVIVFKTLQYDVLFYCSNSSSGVLDTTIPFGPSSQPYYCFINSTINTTHVSTFVGILPPTVREIVVARTGQFYINGFKYFDLGFIEAVNFNVTTASATDFWTVAFATFVDVLVNVSATNIQNLLYCDSPFEKLQCEHLQFGLQDGFYSANFLDDNVLPETYVALPIYYQHTDINFTATASFGGSCYVCKPHQVNISLNGNTSVCVRTSHFSIRYIYNRVKSGSPGDSSWHIYLKSGTCPFSFSKLNNFQKFKTICFSTVEVPGSCNFPLEATWHYTSYTIVGALYVTWSEGNSITGVPYPVSGIREFSNLVLNNCTKYNIYDYVGTGIIRSSNQSLAGGITYVSNSGNLLGFKNVSTGNIFIVTPCNQPDQVAVYQQSIIGAMTAVNESRYGLQNLLQLPNFYYVSNGGNNCTTAVMTYSNFGICADGSLIPVRPRNSSDNGISAIITANLSIPSNWTTSVQVEYLQITSTPIVVDCATYVCNGNPRCKNLLKQYTSACKTIEDALRLSAHLETNDVSSMLTFDSNAFSLANVTSFGDYNLSSVLPQRNIRSSRIAGRSALEDLLFSKVVTSGLGTVDVDYKSCTKGLSIADLACAQYYNGIMVLPGVADAERMAMYTGSLIGGMVLGGLTSAAAIPFSLALQARLNYVALQTDVLQENQKILAASFNKAINNIVASFSSVNDAITQTAEAIHTVTIALNKIQDVVNQQGSALNHLTSQLRHNFQAISNSIQAIYDRLDSIQADQQVDRLITGRLAALNAFVSQVLNKYTEVRGSRRLAQQKINECVKSQSNRYGFCGNGTHIFSIVNSAPDGLLFLHTVLLPTDYKNVKAWSGICVDGIYGYVLRQPNLVLYSDNGVFRVTSRVMFQPRLPVLSDFVQIYNCNVTFVNISRVELHTVIPDYVDVNKTLQEFAQNLPKYVK
PNFDLTPFNLTYLNLSSELKQLEAKTASLFQTTVELQGLIDQINSTYVDLKLLNRFENLIKRMKQIEDKIEEIESKQKKIENEIARIKKIKLVPRGSLEWSHPQFEK\n>2fsy_C mol:protein length:282  major capsid protein\nSLGSDADSAGSLIQPMQIPGIIMPGLRRLTIRDLLAQGRTSSNALEYVREEVFTNNADVVAEKALKPESDITFSKQTANVKTIAHWVQASRQVMDDAPMLQSYINNRLMYGLALKEEGQLLNGDGTGDNLEGLNKVATAYDTSLNATGDTRADIIAHAIYQVTESEFSASGIVLNPRDWHNIALLKDNEGRYIFGGPQAFTSNIMWGLPVVPTKAQAAGTFTVGGFDMASQVWDRMDATVEVSREDRDNFVKNMLTILCEERLALAHYRPTAIIKGTFSSGS\n>6rxx_Cn mol:protein length:145  40S ribosomal protein s23-like protein\nMSGGKPRGLNAARKLRNNRREQRWADLQYKKRALGTAYKSSPFGGSSHAKGIVLEKVGVEAKQPNSAIRKCVRVQLIKNGKKVTAFVPNDGCLNFVDENDEVLLAGFGRKGKAKGDIPGVRFKVVKVSGVGLLALWKEKKEKPRS\n>6xqn_I mol:protein length:394  Calcium uptake protein 1, mitochondrial\nGPTAAALEPHPEEKKKKRSGFRDRKVMEYENRIRAYSTPDKIFRYFATLKVISEPGEAEVFMTPEDFVRSITPNEKQPEHLGLDQYIIKRFDGKKISQEREKFADEGSIFYTLGECGLISFSDYIFLTTVLSTPQRNFEIAFKMFDLNGDGEVDMEEFEQVQSIIRSQTSMGMRHRDRPTTGNTLKSGLCSALTTYFFGADLKGKLTIKNFLEFQRKLQHDVLKLEFERHDPVDGRITERQFGGMLLAYSGVQSKKLTAMQRQLKKHFKEGKGLTFQEVENFFTFLKNINDVDTALSFYHMAGASLDKVTMQQVARTVAKVELSDHVCDVVFALFDCDGNGELSNKEFVSIMKQRLMRGLEKPKDMGFTRLMQAMWKCAQETAWDFALPKQSNW\n>4fny_A mol:protein length:327  ALK tyrosine kinase receptor\nRTSTIMTDYNPNYSFAGKTSSISDLKEVPRKNITLIRGLGHGAFGEVYEGQVSGMPNDPSPLQVAVKTLPEVCSEQDELDFLMEALIISKFNHQNIVRCIGVSLQSLPRFILLELMAGGDLKSFLRETRPRPSQPSSLAMLDLLHVARDIACGCQYLEENHFIHRDIAARNCLLTCPGPGRVAKIGDFGMAQDIYRASYYRKGGCAMLPVKWMPPEAFMEGIFTSKTDTWSFGVLLWEIFSLGYMPYPSKSNQEVLEFVTSGGRMDPPKNCPGPVYRIMTQCWQHQPEDRPNFAIILERIEYCTQDPDVINTALPIEYGPLVEEEEK\n>7c5l_R mol:protein length:352  Glyceraldehyde-3-phosphate dehydrogenase\nHHHHHHSSGLVPRGSHMASMSKVGINGFGRIGRLVLRRLLEVKSNIDVVAINDLTSPKILAYLLKHDSNYGPFPWSVDFTEDSLIVDGKSIAVYAEKEAKNIPWKAKGAEIIVECTGFYTSAEKSQAHLDAGAKKVLISAPAGEMKTIVYNVNDDTLDGNDTIVSVASSTTNCLAPMAKALHDSFGIEVGTMTTIHAYTGTQSLVDGPRGKDLRASRAAAENIIPHTTGAAKAIGLVIPELSGKLKGHAQRVPVKTGSVTELVSILGKKVTAEEVNNALKQATTNNESFGYTDEEIVSSDIIGSHFGSVFDATQTEITAVGDLQLVKTVAWYDNEYGFVTQLIRTLEKFAKL\n>6f0v_B mol:protein length:317  Proton-gated 
ion channel\nGQDMVSPPPPIADEPLTVNTGIYLIECYSLDDKAETFKVNAFLSLSWKDRRLAFDPVRSGVRVKTYAPEAIWIPEIRFVNVENARDADVVDISVSPDGTVQYLERFSARVLSPLDFRRYPFDSQTLHIYLIVRSVDTRNIVLAVDLEKVGKNDDVFLTGWDIESFTAVVKPANFALEDRLESKLDYQLRISRQYFSYIPNIILPMLFILFISWTAFWSTSYEANVTLVVSTLIAHIAFNILVETNLPKTPYMTYTGAIIFMIYLFYFVAVIEVTVQHYLKVESQPARAASITRASRIAFPVVFLLANIILAFLFFGF\n>6yto_C mol:protein length:314  Calcium homeostasis modulator protein 4\nMCPTLNNIVSSLQRNGIFINSLIAALTIGGQQLFSSSTFSCPCQVGKNFYYGSAFLVIPALILLVAGFALRSQMWTITGEYCCSCAPPYRRISPLECKLACLRFFSITGRAVIAPLTWLAVTLLTGTYYECAASEFASVDHYPMFDNVSASKREEILAGFPCCRSAPSDVILVRDEIALLHRYQSQMLGWILITLATIAALVSCCVAKCCSPLTSLQHCYWTSHLQNERELFEQAAEQHSRLLMMHRIKKLFGFIPGSEDVKHIRIPSCQDWKDISVPTLLCMGDDLQGHYSFLGNRVDEDNEEDRSRGIELKP\n>6p4g_K mol:protein length:194  uS4\nMPVARSWVCRKTYVTPRRPFEKSRLDQELKLIGEYGLRNKREVWRVKFTLAKIRKAARELLTLDEKDPRRLFEGNALLRRLVRIGVLDEGKMKLDYILGLKIEDFLERRLQTQVFKLGLAKSIHHARVLIRQRHIRVRKQVVNIPSFIVRLDSQKHIDFSLRSPYGGGRPGRVKRKNAKKGQGGAGAGDDEEED\n>4v6w_CU mol:protein length:299  60S ribosomal protein L22\nMAPTAKTNKGDTKTAAAKPAEKKAAPAAAAAKGKVEKPKAEAAKPAAAAAKNVKKASEAAKDVKAAAAAAKPAAAKPAAAKPAAASKDAGKKAPAAAAPKKDAKAAAAPAPAKAAPAKKAASTPAAAPPAKKAAPAKAAAPAAAAPAPAAAAPAVAKPAPKPKAKAAPAPSKVVKKNVLRGKGQKKKKVSLRFTIDCTNIAEDSIMDVADFEKYIKARLKVNGKVNNLGNNVTFERSKLKLIVSSDVHFSKAYLKYLTKKYLKKNSLRDWIRVVANEKDSYELRYFRISSNDDEDDDAE\n>1oxy_A mol:protein length:628  HEMOCYANIN (SUBUNIT TYPE 
II)\nTLHDKQIRICHLFEQLSSATVIGDGDKHKHSDRLKNVGKLQPGAIFSCFHPDHLEEARHLYEVFWEAGDFNDFIEIAKEARTFVNEGLFAFAAEVAVLHRDDCKGLYVPPVQEIFPDKFIPSAAINEAFKKAHVRPEFDESPILVDVQDTGNILDPEYRLAYYREDVGINAHHWHWHLVYPSTWNPKYFGKKKDRKGELFYYMHQQMCARYDCERLSNGMHRMLPFNNFDEPLAGYAPHLTHVASGKYYSPRPDGLKLRDLGDIEISEMVRMRERILDSIHLGYVISEDGSHKTLDELHGTDILGALVESSYESVNHEYYGNLHNWGHVTMARIHDPDGRFHEEPGVMSDTSTSLRDPIFYNWHRFIDNIFHEYKNTLKPYDHDVLNFPDIQVQDVTLHARVDNVVHTFMREQELELKHGINPGNARSIKAKYYHLDHEPFSYAVNVQNNSASDKHATVRIFLAPKYDELGNEIKADELRRTAIELDKFKTDLHPGKNTVVRHSLDSSVTLSHQPTFEDLLHGVGLNEHKSEYCSCGWPSHLLVPKGNVAGMEYHLFVMLTDWDKDKVDGSESVACVDAVSYCGARDHKYPDKKPMGFPFDRPIHTEHISDFLTNNMFIKDIKIKFHE\n>7vmv_E mol:protein length:82  Core protein\nMSYYHHHHHHDYDIPTTENLYFQGAMGSADLSLEKAANVQWDEMADITGSSPIIEVKQDEDGSFSIRDIEETNMIAQVKTQR\n>5o4y_F mol:protein length:16  PHE-MAA-ASN-PRO-HIS-LEU-SER-TRP-SER-TRP-9KK-9KK-ARG-CCS-GLY-NH2\nFANPHLSWSWXXRCGX\n>4hel_B mol:protein length:525  60 kDa chaperonin 4\nAAKDVKFGNDARVKMLRGVNVLADAVKVTLGPKGRNVVLDKSFGAPTITKDGVSVAREIELEDKFENMGAQMVKEVASKANDAAGDGTTTATVLAQAIITEGLKAVAAGMNPMDLKRGIDKAVTAAVEELKALSVPCSDSKAIAQVGTISANSDETVGKLIAEAMDKVGKEGVITVEDGTGLQDELDVVEGMQFDRGYLSPYFINKPETGAVELESPFILLADKKISNIREMLPVLEAVAKAGKPLLIIAEDVEGEALATLVVNTMRGIVKVAAVKAPGFGDRRKAMLQDIATLTGGTVISEEIGMELEKATLEDLGQAKRVVINKDTTTIIDGVGEEAAIQGRVAQIRQQIEEATSDYDREKLQERVAKLAGGVAVIKVGAATEVEMKEKKARVEDALHATRAAVEEGVVAGGGVALIRVASKLADLRGQNEDQNVGIKVALRAMEAPLRQIVLNCGEEPSVVANTVKGGDGNYGYNAATEEYGNMIDMGILDPTKVTRSALQYAASVAGLMITTECMVTDLPK\n>3dmd_B mol:protein length:328  Signal recognition particle receptor\nGSHMASMFGKLREKLKSFVKRVEEEVEKEEEEVEKKGLLDRILTVEIKEKDVDKALDELEIDLLEADVALEVVDALREKIKQKLVGKKVRIGTDKGKIIEEAVKEAVSEILETSRRIDLIEEIRKAEKPYVIMFVGFNGSGKTTTIAKLANWLKNHGFSVVIAASDTFRAGAIEQLEEHAKRIGVKVIKHSYGADPAAVAYDAIQHAKARGIDVVLIDTAGRSETNRNLMDEMKKIARVTKPNLVIFVGDALAGNAIVEQARQFNEAVKIDGIILTKLDADARGGAALSISYVIDAPILFVGVGQGYDDLRPFEKEWFLERIFGEENA\n>3jcd_D mol:protein length:209  50S ribosomal protein 
L3\nMIGLVGKKVGMTRIFTEDGVSIPVTVIEVEANRVTQVKDLANDGYRAIQVTTGAKKANRVTKPEAGHFAKAGVEAGRGLWEFRLAEGEEFTVGQSISVELFADVKKVDVTGTSKGKGFAGTVKRWNFRTQDATHGNSLSHRVPGSIGQNQTPGKVFKGKKMAGQMGNERVTVQSLDVVRVDAERNLLLVKGAVPGATGSDLIVKPAVKA\n>3ccj_K mol:protein length:132  50S ribosomal protein L14P\nMEALGADVTQGLEKGSLITCADNTGARELKVISVHGYSGTKNRHPKAGLGDKITVSVTKGTPEMRRQVLEAVVVRQRKPIRRPDGTRVKFEDNAAVIVDENEDPRGTELKGPIAREVAQRFGSVASAATMIV\n>7c2o_A mol:protein length:368  R-specific carbonyl reductase\nMTKAVPDKFQGFAVSDPKNWNRPKLASYERKQINPHDVVLKNEVCGLCYSDIHTLSAGWQPLQRDNLVVGHEIIGEVIAVGDEVTEFKVGDRVGIGAASSSCRSCQRCDSDNEQYCKQGAATYNSKDVRSNNYVTQGGYSSHSIADEKFVFAIPEDLPSSYGAPLMCAGITVFSPLIRNLGLDARGKNVGIIGIGGLGHLALQFANAMGANVTAFSRSSSKKEQAMKLGAHDFVATGEDKTWYKNYDDHFDFILNCASGIDGLNLSEYLSTLKVDKKFVSVGLPPSEDKFEVSPFTFLQQGASFGSSLLGSKTEVKEMLNLAAKHNVRPMIEEVPISEENCAKALDRCHAGDVRYRFVFTDFDKAFKA\n>6iax_B mol:protein length:355  Cyclic nucleotide-gated potassium channel mll3241\nMSVLPFLRIYAPLNAVLAAPGLLAVAALTIPDMSGRSRLALAALLAVIWGAYLLQLAATLLKRRAGVVRDRTPKIAIDVLAVLVPLAAFLLDGSPDWSLYCAVWLLKPLRDSTFFPVLGRVLANEARNLIGVTTLFGVVLFAVALAAYVIERDIQPEKFGSIPQAMWWAVVTLSTTGYGDTIPQSFAGRVLAGAVMMSGIGIFGLWAGILATGFYQEVRRGDFVRNWQLVAAVPLFQKLGPAVLVEIVRALRARTVPAGAVICRIGEPGDRMFFVVEGSVSVATPNPVELGPGAFFGEMALISGEPRSATVSAATTVSLLSLHSADFQMLCSSSPEIAEIFRKTALERRGAAASA\n>5l64_F mol:protein length:288  Probable proteasome subunit alpha type-7\nMTSIGTGYDLSNSVFSPDGRNFQVEYAVKAVENGTTSIGIKCNDGVVFAVEKLITSKLLVPQKNVKIQVVDRHIGCVYSGLIPDGRHLVNRGREEAASFKKLYKTPIPIPAFADRLGQYVQAHTLYNSVRPFGVSTIFGGVDKNGAHLYMLEPSGSYWGYKGAATGKGRQSAKAELEKLVDHHPEGLSAREAVKQAAKIIYLAHEDNKEKDFELEISWCSLSETNGLHKFVKGDLLQEAIDFAQKEINGDDDEDEDDSDNVMSSDDENAPVATNANATTDQEGDIHLE\n>6zn5_a mol:protein length:72  40S ribosomal protein S25\nDKLNNLVLFDKATYDKLCKEVPNYKLITPAVVSERLKIRGSLARAALQELLSKGLIKLVSKHRAQVIYTRNT\n>3b3v_A mol:protein length:291  Bacterial leucyl 
aminopeptidase\nMPPITQQATVTAWLPQVDASQITGTISSLESFTNRFYTTTSGAQASDWIASEWQALSASLPNASVKQVSHSGYNQKSVVMTITGSEAPDEWIVIGGHLDSTIGSHTNEQSVAPGADDDASGIAAVTEVIRVLSENNFQPKRSIAFMAYAAEEVGLRGSQDLANQYKSEGKNVVSALQLDMTNYKGSAQDVVFITDYTDSNFTQYLTQLMDEYLPSLTYGFDTCGYACADHASWHNAGYPAAMPFESKFNDYNPRIHTTQDTLANSDPTGSHAKKFTQLGLAYAIEMGSATG\n>2owp_A mol:protein length:129  Hypothetical protein Bxe_B1374\nGMEVNQPDIVAQVQAAFVEYERALVENDIEAMNALFWHTPETVRYGIAEVQHGGEAIRAWRERCEPVPKSRKLHRTVVTTFGTDFATVSTEFTSDATPLLGRQMQTWARLSPADGWKIVAAHVSLIAMP\n>6dr6_A mol:protein length:16  ORT-CYS-VAL-PHE-XXX-CYS-GLU-ASP-ORT-ALA-ILE-ILE-GLY-LEU-ORA-VAL\nACVFACEDAAIIGLAV\n>7phw_F mol:protein length:209  Monoclonal antibody Cy.004 light chain\nALTQPSSVSANPGETVKITCSGSTYNYGWYQQKSPGSAPVTVIYYNDKRPSDIPSRFSGSKSGSTGTLTITGVQAEDEAVYYCGNSDSRNVAFGAGTTLTVLRTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC\n>3gvt_B mol:protein length:351  Pumilio homolog 2\nGTGRSRLLEDFRNNRFPNLQLRDLIGHIVEFSQDQHGSRFIQQKLERATPAERQIVFNEILQAAYQLMTDVFGNYVIQKFFEFGSLDQKLALATRIRGHVLPLALQMYGCRVIQKALESISSDQQSEMVKELDGHVLKCVKDQNGNHVVQKCIECVQPQSLQFIIDAFKGQVFVLSTHPYGCRVIQRILEHCTAEQTLPILEELHQHTEQLVQDQYGNYVIQHVLEHGRPEDKSKIVSEIRGKVLALSQHKFASNVVEKCVTHASRAERALLIDEVCCQNDGPHSALYTMMKDQYANYVVQKMIDMAEPAQRKIIMHKIRPHITTLRKYTYGKHILAKLEKYYLKNSPDLG\n>6z0l_B mol:protein length:50  Cys-N2 Strand\nXGLCALRSELQALRREGFSPEELAALESELQALERELAALRSELQALRGX\n>4ujc_CC mol:protein length:293  40S RIBOSOMAL PROTEIN US5\nMADDAGAAGGPGGPGGPGMGNRGGFRGGFGSGIRGRGRGRGRGRGRGRGARGGKAEDKEWMPVTKLGRLVKDMKIKSLEEIYLFSLPIKESEIIDFFLGASLKDEVLKIMPVQKQTRAGQRTRFKAFVAIGDYNGHVGLGVKCSKEVATAIRGAIILAKLSIVPVRRGYWGNKIGKPHTVPCKVTGRCGSVLVRLIPAPRGTGIVSAPVPKKLLMMAGIDDCYTSARGCTATLGNFAKATFDAISKTYSYLTPDLWKETVFTKSPYQEFTDHLVKTHTRVSVQRTQAPAVATT\n>6ywy_OO mol:protein length:320  Related to ribosomal protein S15 
(Mitochondrial)\nMPPRLPGPQGLRSLTLCLRPAVASPAQALQPLIQTANISQKEKKRKMKQDPYGWAQAQQRKAVNVKRQAELQAQRDAAWGDPVKGITTPFVESFDSAGQASVSPPKVGPDGQLVEEPKPLPTSPHLRNYLLNKDEFDSAIQYAEHILKPIKAEDRLTADPEKEDEEAREHAARHAKAVAALERIAKLEHGGAKDRKHANIRRCIETFGRHITDQSLERPTPPLARGVEPKPQPVRAGPDTGSSEVQIAILTSKIRALSKALEGHGGNRDKNNKRSLRRLCHKRQRLLRYMERKERGSGRWHHMLETLGLTPATWKGQITL\n>5vyo_D mol:protein length:200  Thiol:disulfide interchange protein\nSNAAGFAQASPSAPVAGKDFEVMKSPQPVSAPAGKVEVIEFFWYGCPHAYEFEPTIEAWVKKQGDKIAFKRVPVAFRDDFVPHSKLFYALAALGVSEKVTPAVFNAIHKEKNYLLTPQAQADFLATQGVDKKKFLDAYNSFSVQGQVKQSAELLKNYNIDGVPTIVVQGKYKTGPAYTNSLEGTAQVLDFLVKQVQDKKL\n>2i0c_A mol:protein length:259  Glutamate receptor, ionotropic kainate 2\nGSNRSLIVTTILEEPYVLFKKSDKPLYGNDRFEGYCIDLLRELSTILGFTYEIRLVEDGKYGAQDDVNGQWNGMVRELIDHKADLAVAPLAITCVREKVIDFSKPFMTLGISILYRKGTPIDSADDLAKQTKIEYGAVEDGATMTFFKKSKISTYDKMWAFMSSRRQSVLVKSNEEGIQRVLTSDYAFLMESTTIEFVTQRNCNLTQIGGLIDSKGYGVGTPMGSPYRDKITIAICQLQEEGKLHMMKEKWWRGNGCPS\n>2pod_A mol:protein length:410  Mandelate racemase / muconate lactonizing enzyme\nMSLKITEIETLRPEEFPNLLWVLVHTDEGITGLGETFYGACSAEAYIHEWAANRLIGEDPLQIDRHAKRLSGYLGFRSAGAEMRGNSALDIALWDIFGKATGQPIYQLLGGKCRDTIRTYNTCAGPHYVRTAKQQSVANWGLANSVSARYDDLNAFLHRADELALDLLDSGITAMKIWPFDPYAEASDGYYISKSDLKRALEPFEKIRRAVGDKMDVMVEFHSLWNLPPALQIAEALREYETFWHEDPIRMDSLSSLKRYAERSLAPVCASETLATRWGFRDLLETNAAGIVMLDISWCGGLSEARKIASMAEAWHLPVAPHDCTGPVVLTASTHLSLNAPNALVQESVRAFYDGWYRDLVTALPTVKDGHITVPDGPGLGLELMPDIRERLTIAVRNTSDCEGHHHHHH\n>6bsr_A mol:protein length:666  PBP4 
protein\nMGSDKIHHHHHHENLYFQGHMSQWQAKQELAEAKKTATTFLNVLSKQEFDKLPSVVQEASLKKNGYDTKSVVEKYQAIYSGIQAEGVKASDVQVKKAKDNQYTFTYKLSMSTPLGEMKDLSYQSSIAKKGDTYQIAWKPSLIFPDMSGNDKISIQVDNAKRGEIVDRNGSGLAINKVFDEVGVVPGKLGSGAEKTANIKAFSDKFGVSVDEINQKLSQGWVQADSFVPITVASEPVTELPTGAATKDTESRYYPLGEAAAQLIGYTGTITAEDIEKNPELSSTGVIGKTGLERAFDKELRGQDGGSLVILDDKENVKKALQTKEKKDGQTIKLTIDSGVQQQAFAIFDKRPGSAVITDPQKGDLLATVSSPSYDPNKMANGISQKEYDAYNNNKDLPFTARFATGYAPGSTFKTITGAIGLDAGTLKPDEELEINGLKWQKDKSWGGYFATRVKEASPVNLRTALVNSDNIYFAQQTLRMGEDKFRAGLNKFIFGEELDLPIAMTPAQISNEDKFNSEILLADTGYGQGQLLISPIQQATMYSVFQNNGTLVYPKLVLDKETKKKDNVISANAANTIATDLLGSVEDPSGYVYNMYNPNFSLAAKTGTAEIKDKQDTDGKENSFLLTLDRSNNKFLTMIMVENSGENGSATDISKPLIDYLEATIK\n>1i48_J mol:protein length:445  CYSTATHIONINE GAMMA-SYNTHASE\nMAKAVDAAAAAAAAIAPVDTTVVNEDVALVENETCNDQNVQFDSLPSMKYASFLNSDGSVAIHAGERLGRGIVTDAITTPVVNTSAYFFNKTSELIDFKEKRRASFEYGRYGNPTTVVLEEKISALEGAESTLLMASGMCASTVMLLALVPAGGHIVTTTDCYRKTRIFIETILPKMGITATVIDPADVGALELALNQKKVNLFFTESPTNPFLRCVDIELVSKLCHEKGALVCIDGTFATPLNQKALALGADLVLHSATKFLGGHNDVLAGCISGPLKLVSEIRNLHHILGGALNPNAAYLIIRGMKTLHLRVQQQNSTALRMAEILEAHPKVRHVYYPGLQSHPEHHIAKKQMTGFGGAVSFEVDGDLLTTAKFVDALKIPYIAPSFGGCESIVDQPAIMSYWDLSQSDRAKYGIMDNLVRFSFGVEDFDDLKADILQALDSI\n>3u39_C mol:protein length:319  6-phosphofructokinase\nMKRIGVLTSGGDSPGMNAAIRSVVRKAIYHGVEVYGVYHGYAGLIAGNIKKLEVGDVGDIIHRGGTILYTARCPEFKTEEGQKKGIEQLKKHGIEGLVVIGGDGSYQGAKKLTEHGFPCVGVPGTIDNDIPGTDFTIGFDTALNTVIDAIDKIRDTATSHERTYVIEVMGRHAGDIALWSGLAGGAETILIPEADYDMNDVIARLKRGHERGKKHSIIIVAEGVGSGVDFGRQIQEATGFETRVTVLGHVQRGGSPTAFDRVLASRLGARAVELLLEGKGGRCVGIQNNQLVDHDIAEALANKHTIDQRMYALSKELSI\n>5i8e_C mol:protein length:222  VRC34.01 Fab heavy chain\nQEVLVQSGAEVKKPGASVKVSCRAFGYTFTGNALHWVRQAPGQGLEWLGWINPHSGDTTTSQKFQGRVYMTRDKSINTAFLDVTRLTSDDTGIYYCARDKYYGNEAVGMDVWGQGTSVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEP\n>3mhv_C mol:protein length:117  Vacuolar protein sorting-associated protein 
4\nGSPDLAARTTMFEINVGDTPCVLTKEDYRTLGAMTEGYSGSDIAVVVKDALMQPIRKIQSATHFKDVSTEDDETRKLTPCSPGDDGAIEMSWTDIEADELKEPDLTIKDFLKAIKST\n>7opd_d mol:protein length:1143  DNA damage-binding protein 1\nSNAMSYNYVVTAQKPTAVNGCVTGHFTSAEDLNLLIAKNTRLEIYVVTAEGLRPVKEVGMYGKIAVMELFRPKGESKDLLFILTAKYNACILEYKQSGESIDIITRAHGNVQDRIGRPSETGIIGIIDPECRMIGLRLYDGLFKVIPLDRDNKELKAFNIRLEELHVIDVKFLYGCQAPTICFVYQDPQGRHVKTYEVSLREKEFNKGPWKQENVEAEASMVIAVPEPFGGAIIIGQESITYHNGDKYLAIAPPIIKQSTIVCHNRVDPNGSRYLLGDMEGRLFMLLLEKEEQMDGTVTLKDLRVELLGETSIAECLTYLDNGVVFVGSRLGDSQLVKLNVDSNEQGSYVVAMETFTNLGPIVDMCVVDLERQGQGQLVTCSGAFKEGSLRIIRNGIGIHEHASIDLPGIKGLWPLRSDPNRETDDTLVLSFVGQTRVLMLNGEEVEETELMGFVDDQQTFFCGNVAHQQLIQITSASVRLVSQEPKALVSEWKEPQAKNISVASCNSSQVVVAVGRALYYLQIHPQELRQISHTEMEHEVACLDITPLGDSNGLSPLCAIGLWTDISARILKLPSFELLHKEMLGGEIIPRSILMTTFESSHYLLCALGDGALFYFGLNIETGLLSDRKKVTLGTQPTVLRTFRSLSTTNVFACSDRPTVIYSSNHKLVFSNVNLKEVNYMCPLNSDGYPDSLALANNSTLTIGTIDEIQKLHIRTVPLYESPRKICYQEVSQCFGVLSSRIEVQDTSGGTTALRPSASTQALSSSVSSSKLFSSSTAPHETSFGEEVEVHNLLIIDQHTFEVLHAHQFLQNEYALSLVSCKLGKDPNTYFIVGTAMVYPEEAEPKQGRIVVFQYSDGKLQTVAEKEVKGAVYSMVEFNGKLLASINSTVRLYEWTTEKELRTECNHYNNIMALYLKTKGDFILVGDLMRSVLLLAYKPMEGNFEEIARDFNPNWMSAVEILDDDNFLGAENAFNLFVCQKDSAATTDEERQHLQEVGLFHLGEFVNVFCHGSLVMQNLGETSTPTQGSVLFGTVNGMIGLVTSLSESWYNLLLDMQNRLNKVIKSVGKIEHSFWRSFHTERKTEPATGFIDGDLIESFLDISRPKMQEVVANLQYDDGSGMKREATADDLIKVVEELTRIH\n>7ba7_A mol:protein length:236  14-3-3 protein sigma\nGAMGSMERASLIQKAKLAEQAERYEDMAAFMKGAVEKGEELSNEERCLLSVAYKNVVGGQRAAWRVLSSIEQKSNEEGSEEKGPEVREYREKVETELQGVCDTVLGLLDSHLIKEAGDAESRVFYLKMKGDYYRYLAEVATGDDKKRIIDSARSAYQEAMDISKKEMPPTNPIRLGLALNFSVFHYEIANSPEEAISLAKTTFDEAMADLHTLSEDSYKDSTLIMQLLRDNLTLWT\n>4v8d_CE mol:protein length:256  30S RIBOSOMAL PROTEIN S2\nMPVEITVKELLEAGVHFGHERKRWNPKFARYIYAERNGIHIIDLQKTMEELERTFRFIEDLAMRGGTILFVGTKKQAQDIVRMEAERAGMPYVNQRWLGGMLTNFKTISQRVHRLEELEALFASPEIEERPKKEQVRLKHELERLQKYLSGFRLLKRLPDAIFVVDPTKEAIAVREARKLFIPVIALADTDSDPDLVDYIIPGNDDAIRSIQLILSRAVDLIIQARGGVVEPSPSYALVQEAEATETPEGESEVEA\n>6ald_D mol:protein length:363  FRUCTOSE-1,6-BIS(PHOSPHATE) 
ALDOLASE\nPHSHPALTPEQKKELSDIAHRIVAPGKGILAADESTGSIAKRLQSIGTENTEENRRFYRQLLLTADDRVNPCIGGVILFHETLYQKADDGRPFPQVIKSKGGVVGIKVDKGVVPLAGTNGETTTQGLDGLSERCAQYKKDGADFAAWRCVLKIGEHTPSALAIMENANVLARYASICQQNGIVPIVEPEILPDGDHDLKRCQYVTEKVLAAVYKALSDHHIYLEGTLLKPNMVTPGHACTQKYSHEEIAMATVTALRRTVPPAVTGVTFLSGGQSEEEASINLNAINKCPLLKPWALTFSYGRALQASALKAWGGKKENLKAAQEEYVKRALANSLACQGKYTPSGQAGAAASESLFISNHAY\n>3eff_N mol:protein length:139  Voltage-gated potassium channel\nSALHWRAAGAATVLLVIVLLAGSYLAVLAERGAPGAQLITYPRALWWSVETATTVGYGDLYPVTLWGRLVAVVVMVAGITSFGLVTAALATWFVGREQERRGHFVRHSEKAAEEAYTRTTRALHERFDRLERMLDDNRR\n>1px6_B mol:protein length:209  Glutathione S-transferase P\nPPYTVVYFPVRGRCAALRMLLADQGQSWKEEVVTVETWQEGSLKASCLYGQLPKFQDGDLTLYQSNTILRHLGRTLGLYGKDQQEAALVDMVNDGVEDLRCKYISLIYTNYEAGKDDYVKALPGQLKPFETLLSQNQGGKTFIVGDQISFANYNLLDLLLIHEVLAPGCLDAFPLLSAYVGRLSARPKLKAFLASPEYVNLPINGNGKQ\n>6lkn_C mol:protein length:361  Cell cycle control protein 50A\nMAMNYNAKDEVDGGPPCAPGGTAKTRRPDNTAFKQQRLPAWQPILTAGTVLPIFFIIGLIFIPIGIGIFVTSNNIREIEIDYTGTEPSSPCNKCLSPDVTPCFCTINFTLEKSFEGNVFMYYGLSNFYQNHRRYVKSRDDSQLNGDSSALLNPSKECEPYRRNEDKPIAPCGAIANSMFNDTLELFLIGQDSYPIPIALKKKGIAWWTDKNVKFRNPPGGDNLEERFKGTTKPVNWLKPVYMLDSDPDNNGFINEDFIVWMRTAALPTFRKLYRLIERKSDLHPTLPAGRYWLNVTYNYPVHYFDGRKRMILSTISWMGGKNPFLGIAYIAVGSISFLLGVVLLVINHKYRNSSNTADITI\n>1ees_A mol:protein length:178  GTP-BINDING PROTEIN\nMQTIKCVVVGDGAVGKTCLLISYTTNKFPSEYVPTVFDNYAVTVMIGGEPYTLGLFDTAGQEDYDRLRPLSYPQTDVFLVCFSVVSPSSFENVKEKWVPEITHHCPKTPFLLVGTQIDLRDDPSTIEKLAKNKQKPITPETAEKLARDLKAVKYVECSALTQKGLKNVFDEAILAALE\n>3ow9_B mol:protein length:6  KLVFFA hexapeptide segment from Amyloid beta\nKLVFFA\n>7ezx_hI mol:protein length:164  Phycoerythrin alpha subunit\nMKSVITTVVSAADAAGRFPSNSDLESIQGNIQRSAARLEAAEKLAGNHEAVVKEAGDACFAKYAYLKNPGEAGENQEKINKCYRDVDHYMRLVNYCLVVGGTGPLDEWGIAGAREVYRTLNLPTSAYVASIAYTRDRLCVPRDMSAQAGVEFSAYLDYLINALS\n>7o2z_P mol:protein length:9  P/A#1 epitope peptide\nXAPAPAAPA\n>6zsk_A mol:protein length:158  Cytochrome 
c\nMNKPSFLLVGLLVVSGVLGAAETKVKYPDGFRSWYHVKSMVIQPGHPLENPFGGIHHVYANAEAIQGLRGGNYPDGAVLVFDLFDYQEDNHALVEGKRKLIGVMERDAKRFSATGGWGYEGFGEGKPDKRLVTDGGQGCFGCHAAQKESQYVFSRLRD\n>5k28_B mol:protein length:64  Mitogen-activated protein kinase kinase kinase 11\nHMPVWTALFDYEPSGQDELALRKGDRVEVLSRDAAISGDEGWWAGQVGGQVGIFPSNYVSRGGG\n>6xc7_D mol:protein length:215  CC12.3 light chain\nEIVLTQSPGTLSLSPGERATLSCRASQSVSSYLAWYQQKPGQAPRLLIYGASSRATGIPDRFSGSGSGTDFTLTISRLEPEDFAVYYCQQYGSSPRTFGQGTKLEIKRTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGECS\n>3mfe_O mol:protein length:240  Proteasome subunit alpha\nMEQAMRERSELARKGIARAKSVVALAYAGGVLFVAENPSRSLQKISELYDRVGFAAAGKFNEFDNLRRGGIQFADTRGYAYDRRDVTGRQLANVYAQTLGTIFTEQAKPYEVELCVAEVAHYGETKRPELYRITYDGSIADEPHFVVMGGTTEPIANALKESYAENASLTDALRIAVAALRAGSADTSGGDQPTLGVASLEVAVLDANRPRRAFRRITGSALQALLVDQESPQSDGESSG\n>5uuh_A mol:protein length:241  DNA-7-methylguanine glycosylase\nGPVPMHPFVKALQEHFTAHQNPEKAEPMARYMKNHFLFLGIQTPERRQLLKDIIQIHTLPDQKDFQIIIRELWDLPEREFQAAALDIMQKYKKHINETHIPFLEELIVTKSWWDSVDSIVPTFLGDIFLKHPELISAYIPKWIASDNIWLQRAAILFQLKYKQKMDEELLFWIIGQLHSSKEFFIQKAIGWVLREYAKTNPDVVWEYVQNNELAPLSKREAIKHIKQNYGINNEKIGETLS\n>4y6t_C mol:protein length:166  Coat protein\nMTAPIPVVPVSRPQAKTSLKLPNNQVWVTRKASEWSAKTIDTNDAIPFKTIVEGIPEINSETKFYRLLIGFVAVSDGTFGMVDGVTGDVIPDPPVVGRLGFKKNTYRSRDFDLGGKLLNQLDDRAIVWCLDERRRDAKRVQLAGYWIAISKPAPLMPPEDFLVNQD\n>1hx6_B mol:protein length:394  MAJOR CAPSID PROTEIN\nAQVQQLTPAQQAALRNQQAMAANLQARQIVLQQSYPVIQQVETQTFDPANRSVFDVTPANVGIVKGFLVKVTAAITNNHATEAVALTDFGPANLVQRVIYYDPDNQRHTETSGWHLHFVNTAKQGAPFLSSMVTDSPIKYGDVMNVIDAPATIAAGATGELTMYYWVPLAYSETDLTGAVLANVPQSKQRLKLEFANNNTAFAAVGANPLEAIYQGAGAADCEFEEISYTVYQSYLDQLPVGQNGYILPLIDLSTLYNLENSAQAGLTPNVDFVVQYANLYRYLSTIAVFDNGGSFNAGTDINYLSQRTANFSDTRKLDPKTWAAQTRRRIATDFPKGVYYCDNRDKPIYTLQYGNVGFVVNPKTVNQNARLLMGYEYFTSRTELVNAGTISTT\n>2hbg_A mol:protein length:147  HEMOGLOBIN 
(DEOXY)\nGLSAAQRQVIAATWKDIAGADNGAGVGKKCLIKFLSAHPQMAAVFGFSGASDPGVAALGAKVLAQIGVAVSHLGDEGKMVAQMKAVGVRHKGYGNKHIKAQYFEPLGASLLSAMEHRIGGKMNAAAKDAWAAAYADISGALISGLQS\n>3wry_D mol:protein length:451  Replicase large subunit\nSYTRSEEIESLEQFHMATASSLIHKQMCSIVYTGPLKVQQMKNFIDSLVASLSAAVSNLVKILKDTAAIDLETRQKFGVLDVASKRWLVKPSAKNHAWGVVETHARKYHVALLEHDEFGIITCDNWRRVAVSSESVVYSDMAKLRTLRRLLKDGEPHVSSAKVVLVDGVPGCGKTKEILSRVNFEEDLILVPGRQAAEMIRRRANASGIIVATKDNVRTVDSFLMNYGKGARCQFKRLFIDEGLMLHTGCVNFLVEMSLCDIAYVYGDTQQIPYINRVTGFPYPAHFAKLEVDEVETRRTTLRCPADVTHFLNQRYEGHVMCTSSEKKSVSQEMVSGAASINPVSKPLKGKILTFTQSDKEALLSRGYADVHTVHEVQGETYADVSLVRLTPTPVSIIARDSPHVLVSLSRHTKSLKYYTVVMDPLVSIIRDLERVSSYLLDMYKVDAGTQ\n>6hvt_U mol:protein length:252  Proteasome subunit alpha type-1\nMSGAAAASAAGYDRHITIFSPEGRLYQVEYAFKATNQTNINSLAVRGKDCTVVISQKKVPDKLLDPTTVSYIFCISRTIGMVVNGPIPDARNAALRAKAEAAEFRYKYGYDMPCDVLAKRMANLSQIYTQRAYMRPLGVILTFVSVDEELGPSIYKTDPAGYYVGYKATATGPKQQEITTNLENHFKKSKIDHINEESWEKVVEFAITHMIDALGTEFSKNDLEVGVATKDKFFTLSAENIEERLVAIAEQD\n>5z3u_H mol:protein length:122  Histone H2B 1.1\nAKSAPAPKKGSKKAVTKTQKKDGKKRRKTRKESYAIYVYKVLKQVHPDTGISSKAMSIMNSFVNDVFERIAGEASRLAHYNKRSTITSREIQTAVRLLLPGELAKHAVSEGTKAVTKYTSAK\n>2ex3_C mol:protein length:575  DNA polymerase\nMKHMPRKMYSCAFETTTKVEDCRVWAYGYMNIEDHSEYKIGNSLDEFMAWVLKVQADLYFHNLKFAGAFIINWLERNGFKWSADGLPNTYNTIISRMGQWYMIDICLGYKGKRKIHTVIYDSLKKLPFPVKKIAKDFKLTVLKGDIDYHKERPVGYKITPEEYAYIKNDIQIIAEALLIQFKQGLDRMTAGSDSLKGFKDIITTKKFKKVFPTLSLGLDKEVRYAYRGGFTWLNDRFKEKEIGEGMVFDVNSLYPAQMYSRLLPYGEPIVFEGKYVWDEDYPLHIQHIRCEFELKEGYIPTIQIKRSRFYKGNEYLKSSGGEIADLWLSNVDLELMKEHYDLYNVEYISGLKFKATTGLFKDFIDKWTYIKTTSEGAIKQLAKLMLNSLYGKFASNPDVTGKVPYLKENGALGFRLGEEETKDPVYTPMGVFITAWARYTTITAAQACYDRIIYCDTDSIHLTGTEIPDVIKDIVDPKKLGYWAHESTFKRAKYLRQKTYIQDIYMKEVDGKLVEGSPDDYTDIKFSVKCAGMTDKIKKEVTFENFKVGFSRKMKPKPVQVPGGVVLVDDTFTIK\n>2jo4_D mol:protein length:22  KIA7\nXAKAAAAAIKAIAAIIKAGGYX\n>7vd5_b mol:protein length:484  Photosystem II CP47 reaction center 
protein\nALPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDPVLNPMWRQGMFVMPFMTRLGITDSWGGWSITGESVSNPGIWSFEGVALSHIILSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLFLSGLLCFGFGAFHVTGLFGPGIWVSDAYGITGKVQPVAPAWGADGFNPFNPGGIAAHHIAAGIFGIFAGIFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFAAFVTSGTMWYGAAATPIELFGPTRYQWDSGYFQQEIERQVETSVSEGLSESQAWSRIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPIFRDKEGRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTVDFYGGKLNGQTFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRGWYTYGHANFALLFFFGHLWHGGRTIFRDVFTGIGAE\n>7c4w_C mol:protein length:240  Capsid protein VP3\nGIPAELRPGTNQFLTTDDDTAAPILPGFTPTPTIHIPGEVHSLLELCRVETILEVNNTTEATGLTRLLIPVSSQNKADELCAAFMVDPGRIGPWQSTLVGQICRYYTQWSGSLKVTFMFTGSFMATGKMLVAYSPPGSAQPANRETAMLGTHVIWDFGLQSSVSLVIPWISNTHFRTAKTGGNYDYYTAGVVTLWYQTNYVVPPETPGEAYIIAMGAAQDNFTLKICKDTDEVTQQAVLQ\n>4w2f_CS mol:protein length:93  30S Ribosomal Protein S19\nMPRSLKKGVFVDDHLLEKVLELNAKGEKRLIKTWSRRSTIVPEMVGHTIAVYNGKQHVPVYITENMVGHKLGEFAPTRTYRGHGKEAKATKKK\n>5s64_B mol:protein length:445  Tubulin beta-2B chain\nMREIVHIQAGQCGNQIGAKFWEVISDEHGIDPTGSYHGDSDLQLERINVYYNEATGNKYVPRAILVDLEPGTMDSVRSGPFGQIFRPDNFVFGQSGAGNNWAKGHYTEGAELVDSVLDVVRKESESCDCLQGFQLTHSLGGGTGSGMGTLLISKIREEYPDRIMNTFSVMPSPKVSDTVVEPYNATLSVHQLVENTDETYCIDNEALYDICFRTLKLTTPTYGDLNHLVSATMSGVTTCLRFPGQLNADLRKLAVNMVPFPRLHFFMPGFAPLTSRGSQQYRALTVPELTQQMFDSKNMMAACDPRHGRYLTVAAIFRGRMSMKEVDEQMLNVQNKNSSYFVEWIPNNVKTAVCDIPPRGLKMSATFIGNSTAIQELFKRISEQFTAMFRRKAFLHWYTGEGMDEMEFTEAESNMNDLVSEYQQYQDATADEQGEFEEEEGEDEA\n>3tdp_B mol:protein length:257  formate/nitrite transporter\nRAHKETLDKLTNAAINKINLLNTSKVKYLVSSAFAGLYVGIGILLIFTIGGLLTDAGSPMTKIVMGLSFAIALSLVIMTGTELFTGNNMVMSAGMLNKGVSIKDTSKIWAYSWVGNLIGALVLGIIFVGTGLVDKGPVAEFFANTAASKASMPFTALFFRGILCNILVCVSVLCSFRTNSDTAKIIMIFLCLFAFITSGFEHSVANMTIYSVSLFSPTISTVTIGGAIYNLVAVTLGNIVGGALFMGLGTYILGKEK\n>4jpj_B mol:protein length:181  Germline-targeting HIV-1 gp120 engineered outer domain, 
eOD-GT6\nDTITLPCRPAPPPHCSSNITGLILTRDGGVSNDETEIFRPSGGDMRDIARCQIAGTVVSTQLFLNGSLAEEEVVIRSVDFRDNAKSICVQLDTSVEIDCTGAGHCDISRAKWDNTLKQIASKLREQFGDRTIIFKQSSGGDPEFVTHSFNCGGEFFYCDSTQLFDSTWFDSTGTKHHHHHH\n>5ohm_F mol:protein length:116  K33-specific affimer\nMSAATGVRAVPGNENSLEIEELARFAVDEHNKKENALLEFVRVVKAKEQIWEMDASKETMYYLTLEAKDGGKKKLYEAKVWVKMTHWIGAMNNFKELQEFKPVGDAAAAHHHHHHG\n>7eqg_B mol:protein length:434  Type I-F CRISPR-associated protein Csy1\nMTSPLPTPTWQELRQFIESFIQERLQGKLDKLHPDEDDKRQTLLATHRREAWLADAARRVGQLQLVTHTLKPIHPDARGSNLHSLPQAPGQPGLAGSHELGDRLVSDVVGNAAALDVFKFLSLQYQGKNLLNWLTEDSAEAVQALSDNAEQAREWRQAFIGITAVKGAPASHSLAKQLYFPLPGSGYHLLAPLFPTSLVHHVHALLREARFGDAAKAAREARSRQESWPHGFSEYPNLAIQKFGGTKPQNISQLNSERYGENWLLPSLPPHWQRQDQRAPIRHSSVFEHDFGRSPEVSRLTRTLQRLLAKTRHNNFTIRRYRAQLVGQICDEALQYAARLRELEPGWSATPGCQLHDAEQLWLDPLRAQTDETFLQRRLRGDWPAEVGNRFANWLNRAVSSDSQILGSPEAAQWSQELSKELTMFKEILEDERD\n>4a98_F mol:protein length:307  CYS-LOOP LIGAND-GATED ION CHANNEL\nPVDVSVSIFINKIYGVNTLEQTYKVDGYIVAQWTGKPRKTPGDKPLIVENTQIERWINNGLWVPALEFINVVGSPDTGNKRLMLFPDGRVIYNARFLGSFSNDMDFRLFPFDRQQFVLELEPFSYNNQQLRFSDIQVYTENIDNEEIDEWWIRGKASTHISDIRYDHLSSVQPNQNEFSRITVRIDAVRNPSYYLWSFILPLGLIIAASWSVFWLESFSERLQTSFTLMLTVVAYAFYTSNILPRLPYTTVIDQMIIAGYGSIFAAILLIIFAHHRQANGVEDDLLIQRCRLAFPLGFLAIGCVLVI\n>6trc_z mol:protein length:36  Photosystem I 4.8K protein\nMATKSAKPTYAFRTFWAVLLLAINFLVAAYYFGILK\n>3lte_O mol:protein length:132  Response regulator\nMSLKQSKRILVVDDDQAMAAAIERVLKRDHWQVEIAHNGFDAGIKLSTFEPAIMTLDLSMPKLDGLDVIRSLRQNKVANQPKILVVSGLDKAKLQQAVTEGADDYLEKPFDNDALLDRIHDLVNEGHHHHHH\n>7jql_1D mol:protein length:276  50S ribosomal protein L2\nMAVKKFKPYTPSRRFMTVADFSEITKTEPEKSLVKPLKKTGGRNNQGRITVRFRGGGHKRLYRIIDFKRWDKVGIPAKVAAIEYDPNRSARIALLHYVDGEKRYIIAPDGLQVGQQVVAGPDAPIQVGNALPLRFIPVGTVVHAVELEPKKGAKLARAAGTSAQIQGREGDYVILRLPSGELRKVHGECYATVGAVGNADHKNIVLGKAGRSRWLGRRPHVRGAAMNPVDHPHGGGEGRAPRGRPPASPWGWQTKGLKTRKRRKPSSRFIIARRKK\n>6wvt_O mol:protein length:236  Catenin 
alpha-1\nAIMAQLPQEQKAKIAEQVASFQEEKSKLDAEVSKWDDSGNDIIVLAKQMCMIMMEMTDFTRGKGPLKNTSDVISAAKKIAEAGSRMDKLGRTIADHCPDSACKQDLLAYLQRIALYCHQLNICSKVKAEVQNLGGELVVSGVDSAMSLIQAAKNLMNAVVQTVKASYVASTKYQKSQGMASLNLPAVSWKMKAPEKKPLVKREKQDETQTKIKRASQKKHVNPVQALSEFKAMDSI\n>6oq5_F mol:protein length:142  7F\nSNSQVQLVESGGGLVEAGGSLRLSCVVTGSSFSTSTMAWYRQPPGKQREWVASFTSGGAIKYTDSVKGRFTMSRDNAKKMTYLQMENLKPEDTAVYYCALHNAVSGSSWGRGTQVTVSSEPKTPKPQTSGAPVPYPDPLEPR\n>5ekc_C mol:protein length:491  Aldehyde dehydrogenase\nMIDLNIMKVANYINGEFKEPSTGAFQVKTSPVDGSKIAEVPRSGREDAREAIDSAFEALKAWANIPAIRRAEYLYKMLEVFRQMKEDFMKILTVEGGGTYRKVWGEVVFTERLIQNAAELARHYQGRVLQSDSESTISVVFKRSKGVVGVITPWNYPLSISMKKIAHTLAVGNTVVYKPASDTPVTGWLIAQMVAKAGLPKGVFNLVIGPGPVVGEEIVTHKRVAHVTFTGESSTGREIAAKAAGTLKTVTLELGGSDPLIILDDVDVDYAARLAVFASLFHQGQICTSAKRIIVHKAVADKFIERYVHYVKMLRIDDPRKDEKVDLGPLINERQVALMKEFVDDAVSRGGRLLIGGRSWGNFFEPAIFVDVDRNFRIMREEVFGPVRPIVVVENDDQAVEVANDTDYGLSGAVLTNNVNRAFRIAEAVESGMFHINDVTFLEESHVPFGGIKASGVGREGGEWSFHETTYDRWVTVTLRTRRFPIPSALK\n>3fby_A mol:protein length:551  Cartilage oligomeric matrix protein\nRSPWPGVPTSPVWWNSAQRFCPDGSPSECHEHADCVLERDGSRSCVCAVGWAGNGILCGRDTDLDGFPDEKLRCPERQCRKDNCVTVPNSGQEDVDRDGIGDACDPDADGDGVPNEKDNCPLVRNPDQRNTDEDKWGDACDNCRSQKNDDQKDTDQDGRGDACDDDIDGDRIRNQADNCPRVPNSDQKDSDGDGIGDACDNCPQKSNPDQADVDHDFVGDACDSDQDQDGDGHQDSRDNCPTVPNSAQEDSDHDGQGDACDDDDDNDGVPDSRDNCRLVPNPGQEDADRDGVGDVCQDDFDADKVVDKIDVCPENAEVTLTDFRAFQTVVLDPEGDAQIDPNWVVLNQGREIVQTMNSDPGLAVGYTAFNGVDFEGTFHVNTVTDDDYAGFIFGYQDSSSFYVVMWKQMEQTYWQANPFRAVAEPGIQLKAVKSSTGPGEQLRNALWHTGDTESQVRLLWKDPRNVGWKDKKSYRWFLQHRPQVGYIRVRFYEGPELVADSNVVLDTTMRGGRLGVFCFSQENIIWANLRYRCNDTIPEDYETHQLRQAGT\n>6h58_h mol:protein length:129  30S ribosomal protein S8\nSMQDPIADMLTRIRNGQAANKAAVTMPSSKLKVAIANVLKEEGFIEDFKVEGDTKPELELTLKYFQGKAVVESIQRVSRPGLRIYKRKDELPKVMAGLGIAVVSTSKGVMTDRAARQAGLGGEIICYVA\n>4bts_DN mol:protein length:55  40S RIBOSOMAL PROTEIN RPS29E\nMPNKLWRTHPRNYGKDSKECRVCGARQGLITKYEMMTCRRCFREQAPHIGFVKYR\n>6qq8_A mol:protein length:239  Green fluorescent 
protein\nMVSKGEELFTGVVPILVELDGDVNGHKFSVSGEGEGDATYGKLTLKFICTTGKLPVPWPTLVTTLTWGVQCFARYPDHMKQHDFFKSAMPEGYVQERTIFFKDDGNYKTRAEVKFEGDTLVNRIELKGIDFKEDGNILGHKLEYNAISDNVYITADKQKNGIKANFKIRHNIEDGSVQLADHYQQNTPIGDGPVLLPDNHYLSTQSALSKDPNEKRDHMVLLEFVTAAGITLGMDELYK\n>1a93_B mol:protein length:34  MAX PROTEIN\nXCGGMRRKNDTHQQDIDDLKRQNALLEQQVRALX\n>2fyq_A mol:protein length:194  Chymotrypsin-like cysteine proteinase\nMAHHHHHHDDDDKAPPTLWSRVTKFGSGWGFWVSPTVFITTTHVVPTGVKEFFGEPLSSIAIHQAGEFTQFRFSKKMRPDLTGMVLEEGCPEGTVCSVLIKRDSGELLPLAVRMGAIASMRIQGRLVHGQSGMLLTGANAKGMDLGTIPGDCGAPYVHKRGNDWVVCGVHAAATKSGNTVVCAVQAGEGETALE\n>6q98_n mol:protein length:130  30S ribosomal protein S9\nMAENQYYGTGRRKSSAARVFIKPGNGKIVINQRSLEQYFGRETARMVVRQPLELVDMVEKLDLYITVKGGGISGQAGAIRHGITRALMEYDESLRSELRKAGFVTRDARQVERKKVGLRKARRRPQFSKR\n>4ujd_Cc mol:protein length:69  40S RIBOSOMAL PROTEIN ES28\nMDTSRVQPIKLARVTKVLGRTGSQGQCTQVRVEFMDDTSRSIIRNVKGPVREGDVLTLLESEREARRLR\n>4eef_G mol:protein length:74  F-HB80.4, DESIGNED HEMAGGLUTININ BINDING PROTEIN\nMDYKDDDDKGSHMASTRGSGRPWKFSENIAFEIALSFTNKDTPDRWKKVAQYVKGRTPEEVKKHYELEHHHHHH\n>4quo_A mol:protein length:868  Aminopeptidase 
N\nKTVHYLKDYQTPAYHILKTDLHFDINEPQTVVKSRLTVEPQRVGEPLVLDGSAKLLSVKINGAAADYVLEGETLTIAGVPSERFTVEVETEILPAENKSLMGLYASGGNLFTQCEPEGFRKITFYIDRPDVMSKFTTTIVADKKRYPVLLSNGNKIDGGEFSDGRHWVKWEDPFSKPSYLFALVAGDLAVTEDYFTTMSGRNVKIEFYTTEADKPKVGFAVESLKNAMKWDETRFGLEYDLDIFMVVAVGDFNMGAMENKGLNIFNTKFVLADSRTATDTDFEGIESVVGHEYFHNWTGNRVTCRDWFQLSLKEGLTVFRDQEFSGDRASRAVRRIENIRLLRQHQFPEDAGPTAHPVRPASYEEMNNFYTMTVYEKGAEVVRMYHTLLGEEGFQKGMKLYFQRHDGQAVTCDDFRAAMADANGINLDQFALWYSQAGTPVLEAEGRLKNNIFELTVKQTVPPTPDMTDKQPMMIPVKVGLLNRNGEAVAFDYQGKRATEAVLLLTEAEQTFLLEGVTEAVVPSLLRGFSAPVHLNYPYSDDDLLLLLAHDSDAFTRWEAAQTLYRRAVAANLATLSDGVELPKHEKLLAAVEKVISDDLLDNAFKALLLGVPSEAELWDGAENIDPLRYHQAREALLDTLAVHFLPKWHELNRQAAKQENQSYEYSPEAAGWRTLRNVCRAFVLRADPAHIETVAEKYGEMAQNMTHEWGILSAVNGNESDTRNRLLAQFADKFSDDALVMDKYFALVGSSRRSDTLQQVRTALQHPKFSLENPNKARSLIGSFSRNVPHFHAEDGSGYRFIADKVIEIDRFNPQVAARLVQAFNLCNKLEPHRKNLVKQALQRIRAQEGLSKDVGEIVGKILDSNA\n>6olg_BM mol:protein length:120  40S ribosomal protein S12\nVMDVNTALQEVLKTALIHDGLARGIREAAKALDKRQAHLCVLASNCDEPMYVKLVEALCAEHQINLIKVDDNKKLGEWVGLCKIDREGKPRKVVGCSCVVVKDYGKESQAKDVIEEYFKC\n>6wgc_9 mol:protein length:513  Cell division control protein 6\nMSAIPITPTKRIRRNLFDDAPATPPRPLKRKKLQFTDVTPESSPEKLQFGSQSIFLRTKALLQKSSELVNLNSSDGALPARTAEYEQVMNFLAKAISEHRSDSLYITGPPGTGKTAQLDMIIRQKFQSLPLSLSTPRSKDVLRHTNPNLQNLSWFELPDGRLESVAVTSINCISLGEPSSIFQKIFDSFQDLNGPTLQIKNMQHLQKFLEPYHKKTTFVVVLDEMDRLLHANTSETQSVRTILELFLLAKLPTVSFVLIGMANSLDMKDRFLSRLNLDRGLLPQTIVFQPYTAEQMYEIVIQKMSSLPTIIFQPMAIKFAAKKCAGNTGDLRKLFDVLRGSIEIYELEKRFLLSPTRGSLNSAQVPLTPTTSPVKKSYPEPQGKIGLNYIAKVFSKFVNNNSTRTRIAKLNIQQKLILCTIIQSLKLNSDATIDESFDHYIKAITKTDTLAPLQRNEFLEICTILETCGLVSIKKTKCKGKTKRFVDKIDVDLDMREFYDEMTKISILKPFLH\n>7nqh_BF mol:protein length:294  Mitochondrial ribosomal protein 
L4\nMLQLVRAGARTWFRPSGCRGLNTLAEEAVQQAEKPESVASLGLQPPVLRKCELPVPAHRRPVQAWIESLRGYEQERVGLTELHPDVFSTAPRLDILHQVAIWQKNFKRISYAKTKTRAEVRGGGRKPWVQKGSGRARHGSIRSPIWRGGGVAHGPRGPTSYYYMLPMKVRVQGLKVALTVKLAQDDLHIVDSLELPTADPQYLIELARYRRWGDSVLLVDLEHEDMPQNVVAATSGLKTFNLVPAVGLNVHSMLKHQTLVLTLPTVAFLEEKLLWHNSRYTPLYPFRLPYCDFP\n>1xm9_A mol:protein length:457  plakophilin 1\nGLTIPKAVQYLSSQDEKYQAIGAYYIQHTCFQDESAKQQVYQLGGICKLVDLLRSPNQNVQQAAAGALRNLVFRSTTNKLETRRQNGIREAVSLLRRTGNAEIQKQLTGLLWNLSSTDELKEELIADALPVLADRVIIPFSGWCDGNSNMSREVVDPEVFFNATGCLRNLSSADAGRQTMRNYSGLIDSLMAYVQNCVAASRCDDKSVENCMCVLHNLSYRLDAEVPTRYRQLEYNARNAYTEKSSTGCFSNKSDKMMNNNYDCPLPEEETNPKGSGWLYHSDAIRTYLNLMGKSKKDATLEACAGALQNLTASKGLMSSGMSQLIGLKEKGLPQIARLLQSGNSDVVRSGASLLSNMSRHPLLHRVMGNQVFPEVTRLLTSHTGNTSNSEDILSSACYTVRNLMASQPQLAKQYFSSSMLNNIINLCRSSASPKAAEAARLLLSDMWSSKELQGVL\n>6h06_D mol:protein length:219  HUMAN FAB ANTIBODY FRAGMENT OF HCBTAU-22.1\nDVVMTQSPLSLPVTPGEPASISCRSSQSLLHRSGHKYLHWYLQRPGQSPQVLIYLGSNRASGVPDRFSGSGSGTDFTLKISRVEAEDVGLYYCMQTLQTPWTFGQGTKVEIKRTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC\n>4xr3_A mol:protein length:316  DNA replication terminus site-binding protein\nMHHHHHHMARYDLVDRLNTTFRQMEQELAIFAAHLEQHKLLVARVFSLPEVKKEDEHNPLNRIEVKQHLGNDAQSLALRHFRHLFIQQQSENRSSKAAVRLPGVLCYQVDNLSQAALVSHIQHINKLKTTFEHIVTVESELPTAARFEWVHRHLPGLITLNAYRTLTVLHDPATLRFGWANKHIIKNLHRDEVLAQLEKSLKSPRSVAPWTREEWQRKLEREYQDIAALPQNAKLKIKRPVKVQPIARVWYKGDQKQVQHACPTPLIALINRDNGAGVPDVGELLNYDADNVQHRYKPQAQPLRLIIPRLHLYVAD\n>4wqr_5I mol:protein length:61  30S ribosomal protein S14 type Z\nMARKALIEKAKRTPKFKVRAYTRCVRCGRARSVYRFFGLCRICLRELAHKGQLPGVRKASW\n>5dkn_A mol:protein length:92  Protein S100-B\nMSELEKAVVALIDVFHQYSGREGDKHKLKKSELKELINNELSHFLEEIKEQEVVDKVMETLDSDGDGECDFQEFMAFVAMITTACHEFFEHE\n>5z0z_B mol:protein length:465  Pilus assembly 
protein\nMGRDPNSTTTVDFTLHKIEQTSDEQIQNTGHDLGLTGRKPVQGAQFKIFNVTDAFYQLLENHDKTTAASMISQNLGQYVNLQDPNAATVTTDADGLAAFKGLAAKTNGRHSVYAFHEAVTPQPYQKAADMIVSLPVRQDDGSDLTNIHLYPKDSLVTKNLTEINEQAVATKDLHDVAVGDVLTYQVQFQIPHDIGALADHSQDTFKYNQFKVLAYMTKEGLTFKALTAITVDGQDILKALTGKMAFMSSNDAAWQQTHNYPFGFELDFLGGTDPDAVRNLLTQYAGKRVTVAYTGIVNEKMIPDQKVGNTAEVSFDPDSKITVNGPEIQTGGIRFFKHEAGSSKSLANATFILQRMNGNVREYAVLEGVNGMAGTYQPTKITWTTNQDAATRLKTSGAETANLTIQGLLPGRYTLVETAAPEGYEILDPTTDFEVIAGTWGTKTIRIANTPVNQLLPLEHHHHHH\n>6bjc_D mol:protein length:445  Tubulin beta chain\nMREIVHIQAGQCGNQIGAKFWEVISDEHGIDPTGSYHGDSDLQLERINVYYNEAAGNKYVPRAILVDLEPGTMDSVRSGPFGQIFRPDNFVFGQSGAGNNWAKGHYTEGAELVDSVLDVVRKESESCDCLQGFQLTHSLGGGTGSGMGTLLISKIREEYPDRIMNTFSVVPSPKVSDTVVEPYNATLSVHQLVENTDETYCIDNEALYDICFRTLKLTTPTYGDLNHLVSATMSGVTTCLRFPGQLNADLRKLAVNMVPFPRLHFFMPGFAPLTSRGSQQYRALTVPELTQQMFDAKNMMAACDPRHGRYLTVAAVFRGRMSMKEVDEQMLNVQNKNSSYFVEWIPNNVKTAVCDIPPRGLKMSATFIGNSTAIQELFKRISEQFTAMFRRKAFLHWYTGEGMDEMEFTEAESNMNDLVSEYQQYQDATADEQGEFEEEGEEDEA\n>2v6a_M mol:protein length:140  RIBULOSE BISPHOSPHATE CARBOXYLASE SMALL CHAIN 1\nMMVWTPVNNKMFETFSYLPPLTDEQIAAQVDYIVANGWIPCLEFAEADKAYVSNESAIRFGSVSCLYYDNRYWTMWKLPMFGCRDPMQVLREIVACTKAFPDAYVRLVAFDNQKQVQIMGFLVQRPKTARDFQPANKRSV\n>3x37_A mol:protein length:123  ZYRO0C14696p\nMSSWRLVASVRTLPSSLRLELDGAQVNSYEEFVPNIISESRANKIGLRHLIHNPDKYCVLERYGNGFWIRYDVLQMDLQEVEDEFTGNEHLINWAAIKEWNLMGFKDLLPLWKEDLEHHHHHH\n>6yfc_EW mol:protein length:124  coat protein\nMRLTDVDLTVGEETREYAVSEQQGTLFRFVDKSGTVANNTGVFSLEQRFGAANSNRKVTMLLTDPVVVKDASGADMTIKANASVTFSLPKTYPNEHITKLRQTLIAWLGQQCVSDPVDSGLNNY\n>1vvj_QK mol:protein length:129  30S ribosomal protein S11\nMAKKPSKKKVKRQVASGRAYIHASYNNTIVTITDPDGNPITWSSGGVIGYKGSRKGTPYAAQLAALDAAKKAMAYGMQSVDVIVRGTGAGREQAIRALQASGLQVKSIVDDTPVPHNGCRPKKKFRKAS\n>1w4r_A mol:protein length:195  THYMIDINE KINASE\nMRGSHHHHHHLVPRGSKTRGQIQVILGPMFSGKSTELMRRVRRFQIAQYKCLVIKYAKDTRYSSSFCTHDRNTMEALPACLLRDVAQEALGVAVIGIDEGQFFPDIVEFCEAMANAGKTVIVAALDGTFQRKPFGAILNLVPLAESVVKLTAVCMECFREAAYTKRLGTEKEVEVIGGADKYHSVCRLCYFKKAS\n>5lmt_D mol:protein 
length:209  30S ribosomal protein S4\nMGRYIGPVCRLCRREGVKLYLKGERCYSPKCAMERRPYPPGQHGQKRARRPSDYAVRLREKQKLRRIYGISERQFRNLFEEASKKKGVTGSVFLGLLESRLDNVVYRLGFAVSRRQARQLVRHGHITVNGRRVDLPSYRVRPGDEIAVAEKSRNLELIRQNLEAMKGRKVGPWLSLDVEGMKGKFLRLPDREDLALPVNEQLVIEFYSR\n>7e6c_A mol:protein length:419  Cysteine desulfurase SufS\nMGHMNITDIREQFPILHQQVNGHDLVYLDSAATSQKPRAVIETLDKYYNQYNSNVHRGVHTLGTRATDGYEGAREKVRKFINAKSMAEIIFTKGTTTSLNMVALSYARANLKPGDEVVITYMEHHANIIPWQQAVKATGATLKYIPLQEDGTISLEDVRETVTSNTKIVAVSHVSNVLGTVNPIKEMAKIAHDNGAVIVVDGAQSTPHMKIDVQDLDCDFFALSSHKMCGPTGVGVLYGKKALLENMEPAEFGGEMIDFVGLYESTWKELPWKFEAGTPIIAGAIGLGAAIDFLEEIGLDEISRHEHKLAAYALERFRQLDGVTVYGPEERAGLVTFNLDDVHPHDVATVLDAEGIAVRAGHHAAQPLMKWLDVTATARASFYLYNTEEEIDKLVEALQKTKEYFTNVFVDLEHHHHHH\n>3pkj_F mol:protein length:355  NAD-dependent deacetylase sirtuin-6\nGSVNYAAGLSPYADKGKCGLPEIFDPPEELERKVWELARLVWQSSSVVFHTGAGISTASGIPDFRGPHGVWTMEERGLAPKFDTTFESARPTQTHMALVQLERVGLLRFLVSQNVDGLHVRSGFPRDKLAELHGNMFVEECAKCKTQYVRDTVVGTMGLKATGRLCTVAKARGLRACRGELRDTILDWEDSLPDRDLALADEASRNADLSITLGTSLQIRPSGNLPLATKRRGGRLVIVNLQPTKHDRHADLRIHGYVDEVMTRLMEHLGLEIPAWDGPRVLERALPPLPRPPTPKLEPKEESPTRINGSIPAGPKQEPCAQHNGSEPASPKRERPTSPAPHRPPKRVKAKAVPS\n>7mkd_K mol:protein length:91  DNA-directed RNA polymerase subunit omega\nMARVTVQDAVEKIGNRFDLVLVAARRARQMQVGGKDPLVPEENDKTTVIALREIEEGLINNQILDVRERQEQQEQEAAELQAVTAIAEGRR\n>1kz8_A mol:protein length:337  FRUCTOSE-1,6-BISPHOSPHATASE\nTDQAAFDTNIVTLTRFVMEQGRKARGTGEMTQLLNSLCTAVKAISTAVRKAGIAHLYGIAGSTNVTGDQVKKLDVLSNDLVINVLKSSFATCVLVTEEDKNAIIVEPEKRGKYVVCFDPLDGSSNIDCLVSIGTIFGIYRKNSTDEPSEKDALQPGRNLVAAGYALYGSATMLVLAMVNGVNCFMLDPAIGEFILVDRNVKIKKKGSIYSINEGYAKEFDPAITEYIQRKKFPPDNSAPYGARYVGSMVADVHRTLVYGGIFMYPANKKSPKGKLRLLYECNPMAYVMEKAGGLATTGKEAVLDIVPTDIHQRAPIILGSPEDVTELLEIYQKHAAK\n>5puo_B mol:protein length:156  Bromodomain-containing protein 1\nMHHHHHHSSGVDLGTENLYFQSMEQVAMELRLTELTRLLRSVLDQLQDKDPARIFAQPVSLKEVPDYLDHIKHPMDFATMRKRLEAQGYKNLHEFEEDFDLIIDNCMKYNARDTVFYRAAVRLRDQGGVVLRQARREVDSIGLEEASGMHLPERPA\n>6olf_F mol:protein length:294  60S ribosomal protein 
L5\nVKVVKNKAYFKRYQVKFRRRREGKTDYYARKRLVIQDKNKYNTPKYRMIVRVTNRDIICQIAYARIEGDMIVCAAYAHELPKYGVKVGLTNYAAAYCTGLLLARRLLNRFGMDKIYEGQVEVTGDEYNVESIDGQPGAFTCYLDAGLARTTTGNKVFGALKGAVDGGLSIPHSTKRFPGYDSESKEFNAEVHRKHIMGQNVADYMRYLMEEDEDAYKKQFSQYIKNSVTPDMMEEMYKKAHAAIRENPVYEKKPKKEVKKKRWNRPKMSLAQKKDRVAQKKASFLRAQERAAES\n>6x6k_AT mol:protein length:278  Cag pathogenicity island protein\nMKLRASVLIGATILCLILSACSNYAKKVVKQKNHVYTPVYNELIEKYSEIPLNDKLKDTPFMVQVKLPNYKDYLLDNKQVVLTFKLVHHSKKITLIGDANKILQYKNYFQANGARSDIDFYLQPTLNQKGVVMIASNYNDNPNSKEKPQTFDVLQGSQPMLGANTKNLHGYDVSGANNKQVINEVAREKAQLEKINQYYKTLLQDKEQEYTTRKNNQREILETLSNRAGYQMRQNVISSEIFKNGNLNMQAKEEEVREKLQEERENEYLRNQIRSLLS\n>3j78_82 mol:protein length:130  60S ribosomal protein L32\nMASLPHPKIVKKHTKKFKRHHSDRYHRVAENWRKQKGIDSVVRRRFRGNISQPKIGYGSNKKTKFLSPSGHKTFLVANVKDLETLTMHTKTYAAEIAHNISAKNRVVILARAKALGIKVTNPKGRLALEA\n>3sbp_D mol:protein length:638  Nitrous-oxide reductase\nMSDKDSKNTPQVPEKLGLSRRGFLGASAVTGAAVAATALGGAVMTRESWAQAVKESKQKIHVGPGELDDYYGFWSGGHQGEVRVLGVPSMRELMRIPVFNVDSATGWGLTNESRHIMGDSAKFLNGDCHHPHISMTDGKYDGKYLFINDKANSRVARIRLDIMKCDKMITVPNVQAIHGLRLQKVPHTKYVFANAEFIIPHPNDGKVFDLQDENSYTMYNAIDAETMEMAFQVIVDGNLDNTDADYTGRFAAATCYNSEKAFDLGGMMRNERDWVVVFDIHAVEAAVKAGDFITLGDSKTPVLDGRKKDGKDSKFTRYVPVPKNPHGCNTSSDGKYFIAAGKLSPTCSMIAIDKLPDLFAGKLADPRDVIVGEPELGLGPLHTTFDGRGNAYTTLFIDSQVVKWNMEEAVRAYKGEKVNYIKQKLDVHYQPGHLHASLCETNEADGKWLVALSKFSKDRFLPVGPLHPENDQLIDISGDEMKLVHDGPTFAEPHDCIMARRDQIKTKKIWDRNDPFFAPTVEMAKKDGINLDTDNKVIRDGNKVRVYMTSMAPAFGVQEFTVKQGDEVTVTITNIDQIEDVSHGFVVVNHGVSMEISPQQTSSITFVADKPGLHWYYCSWFCHALHMEMVGRMMVEPA\n>6yft_HF mol:protein length:113  coat protein\nSTFSSLVIGSNTFIPTAPGYYSLSTRGFSDPRNQIKISGGKFNAKTGRVTAAVSRLWETDVTVAGLPVRSAAEVAIIMTLGRGITATNADVLLSDLNTLLDPARLDQILQGGF\n>5w40_B mol:protein length:352  PopP2 
protein\nSEFELGAPAGRQAGQQATVDRLRTQVTGFLSGALGKLQALSAQNMDPELAQFRVLDVDRAIMPLLIVAENARNPGLNLVPLHMDMAEDEEVRTQPPMAGSRHIAEFVASARPGRYRAVIDDGSHTRAADIRKDASGTSVIVVDPLRKEKDESAYVDYADNVNMEFGEHAKCAFIPVDIQKSSFDCRILSLSLALKMHDKDDAFAAFHETLRNGGDPSHHVSRAQQTEELGATLVLDGAPLVDARMMKHGQAASSVSRYLGNHPEQSTVPVNKRNETLGERTTRHLVKRKVRNRADSEGRVTSGETKEITFSNSVEQKRIALLNRAASYVNSAPPPVVMRMAKLLQDSLLDTN\n>6lqt_B1 mol:protein length:923  Periodic tryptophan protein 2\nMKSDFKFSNLLGTVYRQGNITFSDDGKQLLSPVGNRVSVFDLINNKSFTFEYEHRKNIAAIDLNKQGTLLISIDEDGRAILVNFKARNVLHHFNFKEKCSAVKFSPDGRLFALASGRFLQIWKTPDVNKDRQFAPFVRHRVHAGHFQDITSLTWSQDSRFILTTSKDLSAKIWSVDSEEKNLAATTFNGHRDYVMGAFFSHDQEKIYTVSKDGAVFVWEFTKRPSDDDDNESEDDDKQEEVDISKYSWRITKKHFFYANQAKVKCVTFHPATRLLAVGFTSGEFRLYDLPDFTLIQQLSMGQNPVNTVSVNQTGEWLAFGSSKLGQLLVYEWQSESYILKQQGHFDSTNSLAYSPDGSRVVTASEDGKIKVWDITSGFCLATFEEHTSSVTAVQFAKRGQVMFSSSLDGTVRAWDLIRYRNFRTFTGTERIQFNCLAVDPSGEVVCAGSLDNFDIHVWSVQTGQLLDALSGHEGPVSCLSFSQENSVLASASWDKTIRIWSIFGRSQQVEPIEVYSDVLALSMRPDGKEVAVSTLKGQISIFNIEDAKQVGNIDCRKDIISGRFNQDRFTAKNSERSKFFTTIHYSFDGMAIVAGGNNNSICLYDVPNEVLLKRFIVSRNMALNGTLEFLNSKKMTEAGSLDLIDDAGENSDLEDRIDNSLPGSQRGGDLSTRKMRPEVRVTSVQFSPTANAFAAASTEGLLIYSTNDTILFDPFDLDVDVTPHSTVEALREKQFLNALVMAFRLNEEYLINKVYEAIPIKEIPLVASNIPAIYLPRILKFIGDFAIESQHIEFNLIWIKALLSASGGYINEHKYLFSTAMRSIQRFIVRVAKEVVNTTTDNKYTYRFLVSTDGSMEDGAADDDEVLLKDDADEDNEENEENDVVMESDDEEGWIGFNGKDNKLPLSNENDSSDEEENEKELP\n>3fi0_N mol:protein length:326  Tryptophanyl-tRNA synthetase\nMKTIFSGIQPSGVITIGNYIGALRQFVELQHEYNCYFCIVDQHAITVWQDPHELRQNIRRLAALYLAVGIDPTQATLFIQSEVPAHAQAAWMLQCIVYIGELERMTQFKEKSAGKEAVSAGLLTYPPLMAADILLYNTDIVPVGEDQKQHIELTRDLAERFNKRYGELFTIPEARIPKVGARIMSLVDPTKKMSKSDPNPKAYITLLDDAKTIEKKIKSAVTDSEGTIRYDKEAKPGISNLLNIYSTLSGQSIEELERQYEGKGYGVFKADLAQVVIETLRPIQERYHHWMESEELDRVLDEGAEKANRVASEMVRKMEQAMGLGR\n>6y67_MMM mol:protein length:293  Capsid protein 
VP1\nMGSSHHHHHHSSGENLYFQGSHMGGIEVLDVKTGPDSTTTIEAYLNPRVGQNWGFSTEITVASNGYNDAPHLTEIPCYSSARISLPLLNEDITSPTLLMWEAVSVKTEVVGISSMLNMHSYGLRAFGGYGGGYTIEGSHIHFFSVGGEPLDLQGLMQNHSTQYPSPLVGPKKPDGTTDDSAQVLNPIYKAKLDKDATYPIECWCPDPSRNENSRYFGSYTGGVETPPVLSFTNTSTTILLDENGVGPLCKGDGLYLSSADVAGTFVQQTSQKQYWRGLPRYFNITLRKRAVKN\n>1dzr_A mol:protein length:183  DTDP-4-DEHYDRORHAMNOSE 3,5-EPIMERASE\nMMIVIKTAIPDVLILEPKVFGDERGFFFESYNQQTFEELIGRKVTFVQDNHSKSKKNVLRGLHFQRGENAQGKLVRCAVGEVFDVAVDIRKESPTFGQWVGVNLSAENKRQLWIPEGFAHGFVTLSEYAEFLYKATNYYSPSSEGSILWNDEAIGIEWPFSQLPELSAKDAAAPLLDQALLTE\n>6gmt_A mol:protein length:108  Magnetosome protein MamM\nGSHMEAVQNRIVEAAERVPGVRGVIHLRARYVGQDIWADMIIGVDPENTVEQAHEICEAVQAAVCGKIRRIESLHVSAEAREIGDTTKPSFSDQPLSFDEVMLSKVDN\n>5a1w_F mol:protein length:177  COATOMER SUBUNIT ZETA-1\nMEALILEPSLYTVKAILILDNDGDRLFAKYYDDTYPSVKEQKAFEKNIFNKTHRTDSEIALLEGLTVVYKSSIDLYFYVIGSSYENELMLMAVLNCLFDSLSQMLRKNVEKRALLENMEGLFLAVDEIVDGGVILESDPQQVVHRVALRGEDVPLTEQTVSQVLQSAKEQIKWSLLR\n>5e81_3E mol:protein length:209  30S ribosomal protein S4\nMGRYIGPVCRLCRREGVKLYLKGERCYSPKCAMERRPYPPGQHGQKRARRPSDYAVRLREKQKLRRIYGISERQFRNLFEEASKKKGVTGSVFLGLLESRLDNVVYRLGFAVSRRQARQLVRHGHITVNGRRVDLPSYRVRPGDEIAVAEKSRNLELIRQNLEAMKGRKVGPWLSLDVEGMKGKFLRLPDREDLALPVNEQLVIEFYSR\n>6y5e_F mol:protein length:83  Histone H4\nKVLRDNIQGITKPAIRRLARRGGVKRISGLIYEETRGVLKVFLENVIRDAVTYTEHAKRKTVTAMDVVYALKRQGRTLYGFGG\n>5pgy_A mol:protein length:286  Corticosteroid 11-beta-dehydrogenase isozyme 1\nGSHMASMTGGQQMGRGSNEEFRPEMLQGKKVIVTGASKGIGREMAYHLAKMGAHVVVTARSKETLQKVVSHCLELGAASAHYIAGTMEDMTFAEQFVAQAGKLMGGLDMLILNHITNTSLNLFHDDIHHVRKSMEVNFLSYVVLTVAALPMLKQSNGSIVVVSSLAGKVAYPMVAAYSASKFALDGFFSSIRKEYSVSRVNVSITLCVLGLIDTETAMKAVSGIVHMQAAPKEECALEIIKGGALRQEEVYYDSSRWTTLLIRNPCRKILEELYSTSYNMDRFINK\n>7r4n_A mol:protein length:362  Hydroxyacid oxidase 
1\nMLPRLICINDYEQHAKSVLPKSIYDYYRSGANDEETLADNIAAFSRWKLYPRMLRNVAETDLSTSVLGQRVSMPICVGATAMQRMAHVDGELATVRACQSLGTGMMLSSWATSSIEEVAEAGPEALRWLQLYIYKDREVTKKLVRQAEKMGYKAIFVTVDTPYLGNRLDDVRNRFKLPPQLRMKNFETSTLSFSPEENFGDDSGLAAYVAKAIDPSISWEDIKWLRRLTSLPIVAKGILRGDDAREAVKHGLNGILVSNHGARQLDGVPATIDVLPEIVEAVEGKVEVFLDGGVRKGTDVLKALALGAKAVFVGRPIVWGLAFQGEKGVQDVLEILKEEFRLAMALSGCQNVKVIDKTLVRK\n>6dec_R mol:protein length:9  unidentified\nXXXXXXXXX\n>6j9f_C mol:protein length:1383  DNA-directed RNA polymerase subunit beta\nMTSYSFTEKKRIRKDFGKQRSILEVPFLLAIQVDSYREFLQEDVESTKRKDLGLHAALKSVFPISSYSGNAALEYVGYKLGQPVFDERECRQRGMSYGAPLRVTVRLVIYDRESSTKAIKYVKEQEVYLGEIPLMTGNGTFIVNGTERVIVSQLHRSPGVFFDHDRGKTHSSGKLLYSARIIPYRGSWLDFEFDPKDALFTRIDRRRKLPVSILLRALGYNNEEMLAEFFEINTFHINPDEGVQLELVPERLRGETLNFDLADGDKVIVEAGKRITARHVKQLEAAGVAALAVPDDYLVGRILSHDVVDGSTGELLANANDEISEDQLTAFRKAGVDAVGTLWVNDLDRGPYLSNTLRIDPTKTQLEALVEIYRMMRPGEPPTKEAAQNLFHNLFFTFERYDLSTVGRMKFNRRVGRKDVLGESVLYDKKYFAERNDEESKRLVAEHTDTSDILEVIKVLTEIRNGRGVVDDIDHLGNRRVRSVGEMAENVFRVGLVRVERAVKERLSMAESEGLTPQELINAKPVAAAIKEFFGSSQLSQFMDQNNPLSEVTHKRRVSALGPGGLTRERAGFEVRDVHPTHYGRVCTIETPEGPNIGLINSLAVFARTNQYGFLETPYRKVLDGKVSDDVEYLSAIEENEYVIAQANALTDAKNMLTEQFVPCRFQGESLLKPPSEVHFMDVSPMQTVSVAAALVPFLEHDDANRALMGANMQRQAVPTLRSQKPLVGTGIERAVARDSGVTVNALRGGVIEQIDAARIVVKVNEAEIGGGTDAGVDIYNLIKYTRSNQNTCINQRPLVNVGDVIARGDVLADGPSTDIGELALGQNMLIAFMPWNGYNFEDSILLSERVVEEDRYTTIHIEELTCVARDTKLGPEEISADIPNVSEQALNRLDESGVVYIGAEVRAGDIMVGKVTPKGESQLTPEEKLLRAIFGEKASDVKDSSLRVPPGMDGTVIDVQVFTRDGIEKDKRARQIEENEIKRVKKDFDDQFRILEAAIYARLRSQIVGKVANGGANLKKGDSVTDAYLDGLKKSDWFQLRMKDEDAADAIERAQKQIQAHEKEFEARFADKRGKITQGDDLAPGVLKMVKVFLAVKRRIQPGDKMAGRHGNKGVVSNVVPVEDMPYMATGESVDIVLNPLGVPSRMNIGQILEVHLGWAAKGLGRKIQRMLEAQAAVSELRKFLDDIYNHDNAINAQRVDLSQFSDEELLNLGKNLIDGVPMATPVFDGASEAEIKRMLELADLPQSGQTQLYDGRTGEAFDRKTTVGYMHYLKLNHLVDDKMHARSTGPYSLVTQQPLGGKAQFGGQRFGEMEVWALEAYGAAYTLQEMLTVKSDDVQGRNQMYKNIVDGEHEMVAGMPESFNVLVKEIRSLAIHMELEE\n>2e7s_E mol:protein length:135  Rab guanine nucleotide exchange factor 
SEC2\nGPLGSLEEQLNKSLKTIASQKAAIENYNQLKEDYNTLKRELSDRDDEVKRLREDIAKENELRTKAEEEADKLNKEVEDLTASLFDEANNLVADARMEKYAIEILNKRLTEQLREKDMLLDTLTLQLKNLKKVMHS\n>2wfz_A mol:protein length:537  ACETYLCHOLINESTERASE\nDDHSELLVNTKSGKVMGTRVPVLSSHISAFLGIPFAEPPVGNMRFRRPEPKKPWSGVWNASTYPNNCQQYVDEQFPGFSGSEMWNPNREMSEDCLYLNIWVPSPRPKSTTVMVWIYGGGFYSGSSTLDVYNGKYLAYTEEVVLVSLSYRVGAFGFLALHGSQEAPGNVGLLDQRMALQWVHDNIQFFGGDPKTVTIFGESAGGASVGMHILSPGSRDLFRRAILQSGSPNCPWASVSVAEGRRRAVELGRNLNCNLNSDEELIHCLREKKPQELIDVEWNVLPFDSIFRFSFVPVIDGEFFPTSLESMLNSGNFKKTQILLGVNKDEGSFFLLYGAPGFSKDSESKISREDFMSGVKLSVPHANDLGLDAVTLQYTDWMDDNNGIKNRDGLDDIVGDHNVICPLMHFVNKYTKFGNGTYLYFFNHRASNLVWPEWMGVIHGYEIEFVFGLPLVKELNYTAEEEALSRRIMHYWATFAKTGNPNEPHSQESKWPLFTTKEQKFIDLNTEPMKVHQRLRVQMCVFWNQFLPKLLNATAC\n>5cnv_D mol:protein length:761  Ribonucleoside-diphosphate reductase 1 subunit alpha\nMNQNLLVTKRDGSTERINLDKIHRVLDWAAEGLHNVSISQVELRSHIQFYDGIKTSDIHETIIKAAADLISRDAPDYQYLAARLAIFHLRKKAYGQFEPPALYDHVVKMVEMGKYDNHLLEDYTEEEFKQMDTFIDHDRDMTFSYAAVKQLEGKYLVQNRVTGEIYESAQFLYILVAACLFSNYPRETRLQYVKRFYDAVSTFKISLPTPIMSGVRTPTRQFSSCVLIECGDSLDSINATSSAIVKYVSQRAGIGINAGRIRALGSPIRGGEAFHTGCIPFYKHFQTAVKSCSQGGVRGGAATLFYPMWHLEVESLLVLKNNRGVEGNRVRHMDYGVQINKLMYTRLLKGEDITLFSPSDVPGLYDAFFADQEEFERLYTKYEKDDSIRKQRVKAVELFSLMMQERASTGRIYIQNVDHCNTHSPFDPAIAPVRQSNLCLEIALPTKPLNDVNDENGEIALCTLSAFNLGAINNLDELEELAILAVRALDALLDYQDYPIPAAKRGAMGRRTLGIGVINFAYYLAKHGKRYSDGSANNLTHKTFEAIQYYLLKASNELAKEQGACPWFNETTYAKGILPIDTYKKDLDTIANEPLHYDWEALRESIKTHGLRNSTLSALMPSETSSQISNATNGIEPPRGYVSIKASKDGILRQVVPDYEHLHDAYELLWEMPGNDGYLQLVGIMQKFIDQSISANTNYDPSRFPSGKVPMQQLLKDLLTAYKFGVKTLYYQNTRDGAEDAQDDLVPSIQDDGCESGACKI\n>6fzd_A mol:protein length:392  
Lipase\nSRANDAPIVLLHGFTGWGREEMFGFKYWGGVRGDIEQWLNDNGYRTYTLAVGPLSSNWDRACEAYAQLVGGTVDYGAAHAAKHGHARFGRTYPGLLPELKRGGRIHIIAHSQGGQTARMLVSLLENGSQEEREYAKAHNVSLSPLFEGGHHFVLSVTTIATPHDGTTLVNMVDFTDRFFDFQKFVLKAAAVASNVPYTSQVYDFKLDQWGLRRQPGESFDQYFERLKRSPVWTSTDTARYDLSVPGAEKLNQWVKASPNTYYLSFATERTYRGALTGNYYPELGMNAFSAVVCAPFLGSYRNATLGIDDRWLENDGIVNAFSMNGPKRGSTDRIVPYDGTIKKGVWNDMGTYNVDHFEVIGVDPNPLFDIRAFYLRLAEQLASLQPHHHHHH\n>6stf_C mol:protein length:178  Ras-related protein Rab-8A\nMDYLFKLLLIGDSGVGKTCVLFRFSEDAFNSTFISTIGIDFKIRTIELDGKRIKLQIWDTAGQERFRTITTAYYRGAMGIMLVYDITNEKSFDNIRNWIRNIEEHASADVEKMILGNKCDVNDKRQVSKERGEKLALDYGIKFMETSAKANINVENAFFTLARDIKAKMDKKHHHHHH\n>7pny_K mol:protein length:128  28S ribosomal protein S14, mitochondrial\nMAAFMLGSLLRTFKQMVPSSASGQVRSHYVDWRMWRDVKRRKMAYEYADERLRINSLRKNTILPKILQDVADEEIAALPRDSCPVRIRNRCVMTSRPRGVKRRWRLSRIVFRHLADHGQLSGIQRATW\n>8d5p_C mol:protein length:209  TCR-alpha\nMDSVTQTEGQVALSEEDFLTIHCNYSASGYPALFWYVQYPGEGPQFLFRASRDKEKGSSRGFEATYNKETTSFHLQKASVQESDSAVYYCALGDPTGANTGKLTFGHGTILRVHPNIQNPDPAVYQLRDSKSSDKSVCLFTDFDSQTNVSQSKDSDVYITDKCVLDMRSMDFKSNSAVAWSNKSDFACANAFNNSIIPEDTFFPSPESS\n>6o22_D mol:protein length:279  Histone chaperone ASF1\nSSIVSLLGIKVLNNPAKFTDPYEFEITFECLESLKHDLEWKLTYVGSSRSLDHDQELDSILVGPVPVGVNKFVFSADPPSAELIPASELVSVTVILLSCSYDGREFVRVGYYVNNEYDEEELRENPPAKVQVDHIVRNILAEKPRVTRFNIVWDNENEGDLYPPEQPGVDDEEEEDDEEEDDDEDDEDDEDDDQEDGEGEAEEAAEEEEEEEEKTEDNETNLEEEEEDIENSDGDEEEGEEEVGSVDKNEDGNDKKRRKIEGGSTDIESTPKDAARSTN\n>6gqb_AA mol:protein length:105  40S ribosomal protein S10-A\nMLMPKEDRNKIHQYLFQEGVVVAKKDFNQAKHEEIDTKNLYVIKALQSLTSKGYVKTQFSWQYYYYTLTEEGVEYLREYLNLPEHIVPGTYIQERNPTQRPQRRY\n>1z9x_C mol:protein length:321  Death-associated protein kinase 
2\nGMEPFKQQKVEDFYDIGEELGSGQFAIVKKCREKSTGLEYAAKFIKKRQSRASRRGVSREEIEREVSILRQVLHHNVITLHDVYENRTDVVLILELVSGGELFDFLAQKESLSEEEATSFIKQILDGVNYLHTKKIAHFDLKPENIMLLDKNIPIPHIKLIDFGLAHEIEDGVEFKNIFGTPEFVAPEIVNYEPLGLEADMWSIGVITYILLSGASPFLGDTKQETLANITSVSYDFDEEFFSHTSELAKDFIRKLLVKETRKRLTIQEALRHPWITPVDNQQAMVRRESVVNLENFRKQYVRRRSKLAFSIVSLCNHLTR\n>6qbx_S3 mol:protein length:228  NADH:ubiquinone oxidoreductase core subunit S3\nESASADTRPTVRPRNDVAHKQLSAFGEYVAEILPKYVQQVQVSCFSELEICIHPDGVIPVLTFLRDHSNAQFKSLADLTAVDIPTRQNRFEIVYNLLSLRFNSRIRVKTYTDELTPVESSVSVYKAANWYEREIWDMFGVFFANHPDLRRILTDYGFEGHPFRKDFPLSGYVELRYDDEVKRVVAEPVELAQEFRKFDLNSPWEAFPAYRQPPESLKLEAGDKKPEAK\n>3h0r_Q mol:protein length:478  Aspartyl/glutamyl-tRNA(Asn/Gln) amidotransferase subunit B\nMNEKYEAVIGLEIHVQMDTKTKMFCGCKVEFGAEPNTNVCPVCLGMPGALPIVNKRAVEYAIRASLALNCEVHEESVFARKHYFYPDLPKGYQISQYEKPLATNGWVELNLPNGEKKKVRIRRLHIEEDAGKNIHEGDKTLVDLNRAGTPLMEIVTEPDIRTPEEARLFLEKLRNIMRYAGVSKADMEKGQLRCDINVSIRPKGSKEFGTRVEIKNVNSFRFVQKALEYEIERQINVVEEGGEVVQETRTFDPQTGKTYPMRTKEEAEDYRYFPDPDLVPLKVKKEWIEEIKKNMPELPDQRFERLIKEYGLSEYEAGILVNHKEVGDFFEEAVRHFKEPKGIVNWLINDLLGLLRDKGISIEESPVKPEHLAELVKLIKEKVISTKIGKEVIKEMVETGKTPSQIVEEKGLKQITDENQIKELVKKIFEKHPKEVERLKQGEEKLIGFFVGQVMRETRGKANPQVVNKVIRELVKEV\n>4v99_Al mol:protein length:242  Capsid protein\nMNRNGATPTRGRGKRAIPNPPRRRARGKSVERGSTPLQYVTTLGPSRPRMGQGQGWQKLSHEEIILQVNSSTAADTIQTIPIIPRLSVPAGDKPIYSGSAPHLRTIGSAFAIHRWRALSFEWIPSCPTTTPGNLVLRFYPNYSTETPKTLTDLMDSESLVLVPSLSGKTYRPKIETRGNPPELRNIDATAFSALSDEDKGDYSVGRLVVGSSKQAVVIQLGLLRMRYSAEMRGATSISGVSA\n>6zsa_XS mol:protein length:205  39S ribosomal protein L21, mitochondrial\nMAASSLTVTLGRLASACSHSILRPSGPGAASLWSASRRFNSQSTSYLPGYVPKTSLSSPPWPEVVLPDPVEETRHHAEVVKKVNEMIVTGQYGRLFAVVHFASRQWKVTSEDLILIGNELDLACGERIRLEKVLLVGADNFTLLGKPLLGKDLVRVEATVIEKTESWPRIIMRFRKRKNFKKKRIVTTPQTVLRINSIEIAPCLL\n>7pe9_I mol:protein length:409  DEP domain-containing mTOR-interacting 
protein\nMEEGGSTGSAGSDSSTSGSGGAQQRELERMAEVLVTGEQLRLRLHEEKVIKDRRHHLKTYPNCFVAKELIDWLIEHKEASDRETAIKLMQKLADRGIIHHVCDEHKEFKDVKLFYRFRKDDGTFPLDNEVKAFMRGQRLYEKLMSPENTLLQPREEEGVKYERTFMASEFLDWLVQEGEATTRKEAEQLCHRLMEHGIIQHVSSKHPFVDSNLLYQFRMNFRRRRRLMELLNEKSPSSQETHDSPFCLRKQSHDNRKSTSFMSVSPSKEIKIVSAVRRSSMSSCGSSGYFSSSPTLSSSPPVLCNPKSVLKRPVTSEELLTPGAPYARKTFTIVGDAVGWGFVVRGSKPCHIQAVDPSGPAAAAGMKVCQFVVSVNGLNVLHVDYRTVNNLILTGPRTIVMEVMEELEC\n>5v3t_A mol:protein length:132  Globin\nMSKQPMTPFEAIGGEQCIEILVDTFYSYVSKHPDLSPIFPDDLTETARKQKQFLTQYLGGPNLYTEEHGHPMLRARHLPFEITPKRAEAWLSCMEQAMDDTGVHGHIREFVFERLALTAQHMVNTPNETGEI\n>4wra_E5 mol:protein length:85  50S ribosomal protein L27\nMAHKKGLGSTRNGRDSQAKRLGVKRYEGQVVRAGNILVRQRGTRFKPGKNVGMGRDFTLFALVDGVVEFQDRGRLGRYVHVRPLA\n>4waj_A mol:protein length:229  Carbonic anhydrase 2\nMDKIKQLFANNYSWAQRMKEENSTYFKELADHQTPHYLWIGCSDSRVSPEKLTNLEPGELFVHRNVANQVIHTDFNCLSVVQYAVDVLKIEHIIICGHTNCGGIHAAMADKDLGLINNWLLHIRDIWFKHGHLLGKLSPEKRADMLTKINVAEQVYNLGRTSIVKSAWERGQKLSLHGWVYDVNDGFLVDQGVMATSRETLEISYRNAIARLSILDEENILKKDHLENT\n>2c97_A mol:protein length:160  6,7-DIMETHYL-8-RIBITYLLUMAZINE SYNTHASE\nMKGGAGVPDLPSLDASGVRLAIVASSWHGKICDALLDGARKVAAGCGLDDPTVVRVLGAIEIPVVAQELARNHDAVVALGVVIRGQTPHFDYVCDAVTQGLTRVSLDSSTPIANGVLTTNTEEQALDRAGLPTSAEDKGAQATVAALATALTLRELRAHS\n>5j4b_2e mol:protein length:162  30S ribosomal protein S5\nMPETDFEEKMILIRRTARMQAGGRRFRFGALVVVGDRQGRVGLGFGKAPEVPLAVQKAGYYARRNMVEVPLQNGTIPHEIEVEFGASKIVLKPAAPGTGVIAGAVPRAILELAGVTDILTKELGSRNPINIAYATMEALRQLRTKADVERLRKGEAHAQAQG\n>7n6p_A mol:protein length:227  1C3 Fab heavy chain\nQVQLVQSGAEVKKPGSSVKVACKVSGGTFSSYTISWVRQAPGQGLEWMGGIIPSFGVGHYSQKFRDRVTLTADKSTTTAFLELSSVRSEDTALYYCAILGTFNWKSGGNYFGPWGQGTLVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSC\n>2vt5_B mol:protein length:338  FRUCTOSE-1,6-BISPHOSPHATASE 
1\nMADQAPFDTDVNTLTRFVMEEGRKARGTGELTQLLNSLCTAVKAISSAVRKAGIAHLYGIAGSTNVTGDQVKKLDVLSNDLVMNMLKSSFATCVLVSEEDKHAIIVEPEKRGKYVVCFDPLDGSSNIDCLVSVGTIFGIYRKKSTDEPSEKDALQPGRNLVAAGYALYGSATMLVLAMDCGVNCFMLDPAIGEFILVDKDVKIKKKGKIYSLNEGYAKDFDPAVTEYIQRKKFPPDNSAPYGARYVGSMVADVHRTLVYGGIFLYPANKKSPNGKLRLLYECNPMAYVMEKAGGMATTGKEAVLDVIPTDIHQRAPVILGSPDDVLEFLKVYEKHSAQ\n>6dhf_c mol:protein length:451  Photosystem II CP43 reaction center protein\nATNRDQESSGFAWWAGNARLINLSGKLLGAHVAHAGLIVFWAGAMTLFELAHFIPEKPMYEQGLILIPHIATLGWGVGPGGEVVDTFPFFVVGVVHLISSAVLGFGGVYHAIRGPETLEEYSSFFGYDWKDKNKMTTILGFHLIVLGIGALLLVAKAMFFGGLYDTWAPGGGDVRVITNPTLDPRVIFGYLLKSPFGGEGWIVSVNNLEDVVGGHIWIGLICIAGGIWHILTTPFGWARRAFIWSGEAYLSYSLGALSMMGFIATCFVWFNNTVYPSEFYGPTGPEASQAQAMTFLIRDQKLGANVGSAQGPTGLGKYLMRSPTGEIIFGGETMRFWDFRGPWLEPLRGPNGLDLNKIKNDIQPWQERRAAEYMTHAPLGSLNSVGGVATEINSVNFVSPRSWLATSHFVLAFFFLVGHLWHAGRARAAAAGFEKGIDRESEPVLSMPSLD\n>5hg0_A mol:protein length:264  Pantothenate synthetase\nSNAMIIADNIKQFHSIRNSLIKQQKIGFVPTMGALHNGHISLIKKAKSENDVVIVSIFVNPTQFNNPNDYQTYPNQLQQDIQILASLDVDVLFNPSEKDIYPDGNLLRIEPKLEIANILEGKSRPGHFSGMLTVVLKLLQITKPNNLYLGEKDYQQVMLIKQLVKDFFINTKIIVCPTQRQPSGLPLSSRNKNLTSTDIEIANKIYEILRQDDFSNLEELTNKINSTGAKLQYIQKLNNRIFLAFYIGKVRLIDNFLKETGPSC\n>2h6s_A mol:protein length:340  Candidapepsin-3\nQTVPVKLINEQVSYASDITVGSNKQKLTVVIDTGSSDLWVPDSQVSCQAGQGQDPNFCKNEGTYSPSSSSSSQNLNSPFSIEYGDGTTSQGTWYKDTIGFGGISITKQQFADVTSTSVDQGILGIGYKTHEAEGNYDNVPVTLKNQGIISKNAYSLYLNSRQATSGQIIFGGVDNAKYSGTLIALPVTSDNELRIHLNTVKVAGQSINADVDVLLDSGTTITYLQQGVADQVISAFNGQETYDANGNLFYLVDCNLSGSVDFAFDKNAKISVPASEFTAPLYTEDGQVYDQCQLLFGTSDYNILGDNFLRSAYIVYDLDDNEISLAQVKYTTASNIAALT\n>6atb_B mol:protein length:501  Nicotinamide 
phosphoribosyltransferase\nMNPAAEAEFNILLATDSYKVTHYKQYPPNTSKVYSYFECREKKTENSKLRKVKYEETVFYGLQYILNKYLKGKVVTKEKIQEAKDVYKEHFQDDVFNEKGWNYILEKYDGHLPIEIKAVPEGFVIPRGNVLFTVENTDPECYWLTNWIETILVQSWYPITVATNSREQKKILAKYLLETSGNLDGLEYKLHDFGYRGVSSQETAGIGASAHLVNFKGTDTVAGLALIKKYYGTKDPVPGYSVPAAEHSTITAWGKDHEKDAFEHIVTQFSSVPVSVVSDSYDIYNACEKIWGEDLRHLIVSRSTQAPLIIRPDSGNPLDTVLKVLEILGKKFPVTENSKGYKLLPPYLRVIQGDGVDINTLQEIVEGMKQKMWSIENIAFGSGGGLLQKLTRDLLNCSFKCSYVVTNGLGINVFKDPVADPNKRSKKGRLSLHRTPAGNFVTLEEGKGDLEEYGQDLLHTVFKNGKVTKSYSFDEIRKNAQLNIELEAAHHLEHHHHHHHH\n>1oqj_B mol:protein length:97  Glucocorticoid Modulatory Element Binding protein-1\nGAMEDMEIAYPITCGESKAILLWKKFVCPGINVKCVKFNDQLISPKHFVHLAGKSTLKDWKRAIRLGGIMLRKMMDSGQIDFYQHDKVCSNTCRSTK\n>5m7g_A mol:protein length:451  Tubulin alpha-1B chain\nMRECISIHVGQAGVQIGNACWELYCLEHGIQPDGQMPSDKTIGGGDDSFNTFFSETGAGKHVPRAVFVDLEPTVIDEVRTGTYRQLFHPEQLITGKEDAANNYARGHYTIGKEIIDLVLDRIRKLADQCTGLQGFLVFHSFGGGTGSGFTSLLMERLSVDYGKKSKLEFSIYPAPQVSTAVVEPYNSILTTHTTLEHSDCAFMVDNEAIYDICRRNLDIERPTYTNLNRLISQIVSSITASLRFDGALNVDLTEFQTNLVPYPRIHFPLATYAPVISAEKAYHEQLSVAEITNACFEPANQMVKCDPRHGKYMACCLLYRGDVVPKDVNAAIATIKTKRSIQFVDWCPTGFKVGINYQPPTVVPGGDLAKVQRAVCMLSNTTAIAEAWARLDHKFDLMYAKRAFVHWYVGEGMEEGEFSEAREDMAALEKDYEEVGVDSVEGEGEEEGEEY\n>6z6j_LW mol:protein length:155  60S ribosomal protein L24-A\nMKVEIDSFSGAKIYPGRGTLFVRGDSKIFRFQNSKSASLFKQRKNPRRIAWTVLFRKHHKKGITEEVAKKRSRKTVKAQRPITGASLDLIKERRSLKPEVRKANREEKLKANKEKKKAEKAARKAEKAKSAGTQSSKFSKQQAKGAFQKVAATSR\n>6mte_F mol:protein length:225  uL30\nNFAELKIKRLRKKFAQKMLRKARRKLIYEKAKHYHKEYRQMYRTEIRMARMARKAGNFYVPAEPKLAFVIRIRGINGVSPKVRKVLQLLRLRQIFNGTFVKLNKASINMLRIVEPYIAWGYPNLKSVNELIYKRGYGKINKKRIALTDNTLIARSLGKYNIICMEDLIHEIYTVGKHFKEANNFLWPFKLSSPRGGMKKKTTHFVEGGDAGNREDQINRLIRRMN\n>4v93_BD mol:protein length:151  EXTRACELLULAR GLOBIN-4\nADDEDCCSYEDRREIRHIWDDVWSSSFTDRRVAIVRAVFDDLFKHYPTSKALFERVKIDEPESGEFKSHLVRVANGLKLLINLLDDTLVLQSHLGHLADQHIQRKGVTKEYFRGIGEAFARVLPQVLSCFNVDAWNRCFHRLVARIAKDLP\n>7nk4_B mol:protein length:757  RNA-directed RNA polymerase catalytic 
subunit\nMDVNPTLLFLKVPAQNAISTTFPYTGDPPYSHGTGTGYTMDTVNRTHQYSEKGRWTTNTETGAPQLNPIDGPLPEDNEPSGYAQTDCVLEAMAFLEESHPGIFENSCLETMEVVQQTRVDKLTQGRQTYDWTLNRNQPAATALANTIEVFRSNGLTANESGRLIDFLKDVMESMDKEEMEITTHFQRKRRVRDNMTKKMVTQRTIGKKKQRLNKRSYLIRALTLNTMTKDAERGKLKRRAIATPGMQIRGFVYFVETLARSICEKLEQSGLPVGGNEKKAKLANVVRKMMTNSQDTELSFTITGDNTKWNENQNPRMFLAMITYITRNQPEWFRNVLSIAPIMFSNKMARLGKGYMFESKSMKLRTQIPAEMLASIDLKYFNDSTRKKIEKIRPLLIDGTASLSPGMMMGMFNMLSTVLGVSILNLGQKRYTKTTYWWDGLQSSDDFALIVNAPNHEGIQAGVDRFYRTCKLLGINMSKKKSYINRTGTFEFTSFFYRYGFVANFSMELPSFGVSGINESADMSIGVTVIKNNMINNDLGPATAQMALQLFIKDYRYTYRCHRGDTQIQTRRSFEIKKLWEQTRSKAGLLVSDGGPNLYNIRNLHIPEVCLKWELMDEDYQGRLCNPLNPFVSHKEIESVNNAVMMPAHGPAKNMEYDAVATTHSWIPKRNRSILNTSQRGILEDEQMYQKCCNLFEKFFPSSSYRRPVGISSMVEAMVSRARIDARIDFESGRIKKEEFAEIMKICSTIEELRRQK\n>2bwp_D mol:protein length:401  5-AMINOLEVULINATE SYNTHASE\nMDYNLALDKAIQKLHDEGRYRTFIDIEREKGAFPKAQWNRPDGGKQDITVWCGNDYLGMGQHPVVLAAMHEALEAVGAGSGGTRNISGTTAYHRRLEAEIAGLHQKEAALVFSSAYNANDATLSTLRVLFPGLIIYSDSLNHASMIEGIKRNAGPKRIFRHNDVAHLRELIAADDPAAPKLIAFESVYSMDGDFGPIKEICDIAEEFGALTYIDEVHAVGMYGPRGAGVAERDGLMHRIDIFNGTLAKAYGVFGGYIAASARMVDAVRSYAPGFIFSTSLPPAIAAGAQASIAFLKTAEGQKLRDAQQMHAKVLKMRLKALGMPIIDHGSHIVPVVIGDPVHTKAVSDMLLSDYGVYVQPINFPTVPRGTERLRFTPSPVHDLKQIDGLVHAMDLLWARCA\n>3nno_C mol:protein length:171  Peptidoglycan recognition protein 1\nEDPPACGSIVPRREWRALASECRERLTRPVRYVVVSHTAGSHCDTPASCAQQAQNVQSYHVRNLGWCDVGYNFLIGEDGLVYEGRGWNIKGAHAGPTWNPISIGISFMGNYMNRVPPPRALRAAQNLLACGVALGALRSNYEVKGHRDVQPTLSPGDRLYEIIQTWSHYRA\n>2feu_A mol:protein length:411  Cytochrome P450-cam\nNLAPLPPHVPEHLVFDFDMYNPSNLSAGVQEAWAVLQESNVPDLVWTRCNGGHWIATRGQLIREAYEDYRHFSSECPFIPREAGEAYDFIPTSMDPPEQRQFRALANQVVGMPVVDKLENRIQELACSLIESLRPQGQCNFTEDYAEPFPIRIFMLLAGLPEEDIPHLKYLTDQMTRPDGSMTFAEAKEALYDYLIPIIEQRRQKPGTDAISIVANGQVNGRPITSDEAKRMCGLLLVGGLDTVVNFLSFSMEFLAKSPEHRQELIERPERIPAACEELLRRFSLVADGRILTSDYEFHGVQLKKGDQILLPQMLSGLDERENACPMHVDFSRQKVSHTTFGHGSHLCLGQHLARREIIVTLKEWLTRIPDFSIAPGAQIQHKSGIVSGVQALPLVWDPATTKAVHHHHHH\n>6v3b_V mol:protein length:85  50S ribosomal protein 
L27\nMATKKAGGSTKNGRDSNPKMLGVKVYGGQTVTAGNIIVRQRGTEFHAGANVGMGRDHTLFATADGVVKFEVKGQFGRRYVKVETV\n>3qjv_C mol:protein length:34  Cytochrome c oxidase polypeptide 2A\nMEEKPKGALAVILVLTLTILVFWLGVYAVFFARG\n>6az1_b mol:protein length:112  ribosomal protein S26e\nMTTKRRNHGRSKPAHSRGRVKPIHCFNCGRLTPKDKAVGRFVVRRMLDAASARDVAEASPVYGANFPMPKLYMKQRFCIACAIHSRTVRARPVGNRKIRYTRKVPFRPAGKK\n>4v5l_AS mol:protein length:93  30S RIBOSOMAL PROTEIN S19\nMPRSLKKGVFVDDHLLEKVLELNAKGEKRLIKTWSRRSTIVPEMVGHTIAVYNGKQHVPVYITENMVGHKLGEFAPTRTYRGHGKEAKATKKK\n>3siq_F mol:protein length:136  Apoptosis 1 inhibitor\nMASVVPIAFDQVDNNTNATQLFKNNINKTRMNDLNREETRLKTFTDWPLDWLDKRQLAQTGMYFTHAGDKVKCFFCGVEIGSWEQEDQPVPEHQRWSPNCPLLRRRTTNNVPINAEALDRILPPISYDLEHHHHHH\n>7qp7_H mol:protein length:84  40S ribosomal protein S27\nMPLAKDLLHPSPEEEKRKHKKKRLVQSPNSYFMDVKCPGCYKITTVFSHAQTVVLCVGCSTVLCQPTGGKARLTEGCSFRRKQH\n>3wkn_O mol:protein length:54  AFFinger p17\nGPGISAFSPGRGVYDPETGTWYDAAWHLGELVWATYYDPETGTWEPDWQRMLGQ\n>5y2e_A mol:protein length:47  Non-structural glycoprotein 4\nMIEKQMDRVVKEMRRQLEMIDKLTTRGIEQVELLKRIHDKLMIRAVD\n>3rtf_B mol:protein length:258  Glutamate receptor 2\nKTVVVTTILESPYVMMKKNHEMLEGNERYEGYCVDLAAEIAKHCGFKYKLTIVGDGKYGARDADTKIWNGMVGELVYGKADIAIAPLTITLVREEVIDFSKPFMSLGISIMIKKGTPIESAEDLSKQTEIAYGTLDSGSTKEFFRRSKIAVFDKMWTYMRSAEPSVFVRTTAEGVARVRKSKGKYAYLLESTMNEYIEQRKPCDTMKVGGNLDSKGYGIATPKGSSLGNAVNLAVLKLNEQGLLDKLKNKWWYDKGEC\n>7cme_A mol:protein length:214  Cadherin-3\nMDWVVAPISVPENGKGPFPQRLNQLKSNKDRDTKIFYSITGPGADSPPEGVFAVEKETGWLLLNKPLDREEIAKYELFGHAVSENGASVEDPMNISIIVTDQNDHKPKFTQDTFRGSVLEGVLPGTSVMQVTATDEDDAIYTYNGVVAYSIHSQEPKDPHDLMFTIHRSTGTISVISSGLDREKVPEYTLTIQATDMDGDGSTTTAVAVVEILD\n>6vq7_h mol:protein length:155  V-type proton ATPase 16 kDa proteolipid subunit\nMADIKNNPEYSSFFGVMGASSAMVFSAMGAAYGTAKSGTGIAAMSVMRPELIMKSIIPVVMAGIIAIYGLVVAVLIANSLTDGITLYRSFLQLGAGLSVGLSGLAAGFAIGIVGDAGVRGTAQQPRLFVGMILILIFAEVLGLYGLIVALILSTK\n>5af9_I mol:protein length:12  HIRUDIN VARIANT-2\nGDFEEIPEEYLQ\n>3nhn_A mol:protein length:193  Tyrosine-protein 
kinase HCK\nGIREAGSEDIIVVALYDYEAIHHEDLSFQKGDQMVVLEESGEWWKARSLATRKEGYIPSNYVARVDSLETEEWFFKGISRKDAERQLLAPGNMLGSFMIRDSETTKGSYSLSVRDYDPRQGDTVKHYKIRTLDNGGFYISPRSTFSTLQELVDHYKKGNDGLCQKLSVPCMSSKPQKPWEKDAWELEHHHHHH\n>1gn2_H mol:protein length:207  SUPEROXIDE DISMUTASE\nMAEYTLPDLDWDYGALEPHISGQINELHHSKHHATYVKGANDAVAKLEEARAKEDHSAILLNEKNLAFNLAGHVNHTIWWKNLSPNGGDKPTGELAAAIADAFGSFDKFRAQFHAAATTVQGCGWAALGWDTLGNKLLIFQVYDHQTNFPLGIVPLLLLDMWEHAFYLQYKNVKVDFAKAFWNVVNWADVQSRYAAATSQTKGLIFG\n>2y2p_A mol:protein length:494  PENICILLIN-BINDING PROTEIN 1B\nDISSISEITYSDGTVIASIESDLLRQDFLPSGTVTGISRDYLYFTTLAEAQERMYDYLAQRDNVSAKELKNEATQKFYRDLAAKEIENGGYKITTTIDQKIHSAMQSAVADYGYLLDDGTGRVEVGNVLMDNQTGAILGFVGGRNYQENQNNHAFDTKRSPASTTKPLLAYGIAIDQGLMGSETILSNYPTNFANGNPIMYANSKGTGMMTLGEALNYSWNIPAYWTYRMLRENGVDVKGYMEKMGYEIPEYGIESLPMGGGIEVTVAQHTNGYQTLANNGVYHQKHVISKIEAADGRVVYEYQDKPVQVYSKATATIMQGLLREVLSSRVTTTFKSNLTSLNPTLANADWIGKTGTTGQDENMWLMLSTPRLTLGGWIGHDDNHSLSQQAGYSNNSNYMAHLVNAIQQASPSIWGNERFALDPSVVKSEVLKSTGQKPGKVSVEGKEVEVTGSTVTSYWANKSGAPATSYRFAIGGSDADYQNAWSSIVGSLP\n>7tpb_G mol:protein length:66  Ras GTPase-activating protein 1\nGPLGSRRRVRAILPYTKVPDTDEISFLKGDMFIVHNELEDGWMWVTNLRTDEQGLIVEDLVEEVGR\n>3dfq_A mol:protein length:363  Fructose-bisphosphate aldolase A\nPHSHPALTPEQKKELSDIAHRIVAPGKGILAASESTGSIAKRLQSIGTENTEENRRFYRQLLLTADDRVNPCIGGVILFHETLYQKADDGRPFPQVIKSKGGVVGIKVDKGVVPLAGTNGETTTQGLDGLSERCAQYKKDGADFAKWRCVLKIGEHTPSALAIMENANVLARYASICQQNGIVPIVEPEILPDGDHDLKRCQYVTEKVLAAVYKALSDHHIYLEGTLLKPNMVTPGHACTQKYSHEEIAMATVTALRRTVPPAVTGVTFLSGGQSEEEASINLNAINKCPLLKPWALTFSYGRALQASALKAWGGKKENLKAAQEEYVKRALANSLACQGKYTPSGQAGAAASESLFISNHAY\n>1anc_A mol:protein length:223  ANIONIC TRYPSIN\nIVGGYTCQENSVPYQVSLNSGYHFCGGSLINDQWVVSAAHCYKSRIQVRLGEHNINVLEGNEQFVNAAKIIKHPNFDRKTLNNDIMLIKLSSPVKLNARVATVALPSSCAPAGTQCLISGWGNTLSSGVNEPDLLQCLDAPLLPQADCEASYPGKITDNMVCVGFLEGGKDSCQGDSGGPVVCNGELQGIVKWGYGCALPDNPGVYTKVCNYVDWIQDTIAAN\n>6d0u_I mol:protein length:214  Antibody C05, light 
chain\nDIQLTQSPSSLSASVGDRVTLTCQASQDIRKFLNWYQQKPGKGPKLLIYDASNLQRGVPSRFSGGGSGTDFTLIISSLQPEDVGTYYCQQYDGLPFTFGGGTKVVIKRTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC\n>2nti_F mol:protein length:244  DNA polymerase sliding clamp A\nMKVVYDDVRVLKDIIQALARLVDEAVLKFKQDSVELVALDRAHISLISVNLPREMFKEYDVNDEFKFGFNTQYLMKILKVAKRKEAIEIASESPDSVIINIIGSTNREFNVRNLEVSEQEIPEINLQFDISATISSDGFKSAISEVSTVTDNVVVEGHEDRILIKAEGESEVEVEFSKDTGGLQDLEFSKESKNSYSAEYLDDVLSLTKLSDYVKISFGNQKPLQLFFNMEGGGKVTYLLAPKV\n>3prc_C mol:protein length:336  PHOTOSYNTHETIC REACTION CENTER\nCFEPPPATTTQTGFRGLSMGEVLHPATVKAKKERDAQYPPALAAVKAEGPPVSQVYKNVKVLGNLTEAEFLRTMTAITEWVSPQEGCTYCHDENNLASEAKYPYVVARRMLEMTRAINTNWTQHVAQTGVTCYTCHRGTPLPPYVRYLEPTLPLNNRETPTHVERVETRSGYVVRLAKYTAYSALNYDPFTMFLANDKRQVRVVPQTALPLVGVSRGKERRPLSDAYATFALMMSISDSLGTNCTFCHNAQTFESWGKKSTPQRAIAWWGIRMVRDLNMNYLAPLNASLPASRLGRQGEAPQADCRTCHQGVTKPLFGASRLKDYPELGPIKAAAK\n>7pi5_V mol:protein length:32  Photosystem II reaction center protein Ycf12\nSLTLILQLVALFAVVAAGPLVVVLLSVRGGNL\n>6s39_P mol:protein length:12  Cellular tumor antigen p53\nKLMFKTEGPDSD\n>4v1a_b mol:protein length:380  MITORIBOSOMAL PROTEIN ML38, MRPL38\nMAAPWWRAALCASRRWRGFSTSAALSRRAAPLGPMPNEDIDVSDLERLKKYRSFDRYRRRAEQEARKPHWWRTYREHFGEESGPKDRVDIGLPPPKVSRTQQLLERKQALRELRANVEEERAARLQTARIPLEAVRAEWERTCGPYHKQRLAEYCGLYRDLFHGATFVPRVPLHVAYAVGEDDLMPVYHGNEVTPTEAAQAPEVTYEADEGSLWTLLLTNLDGHLLEPDAEYVHWLVTNIPGNRVTEGQETCPYLPPFPARGSGFHRFAFLLFKQDKRIDFSGDTRPSPCYQLAQRTFHTFDFYKKHQDAMTPAGLAFFQCRWDDSVTRVFHQLLDMREPVFEFVRPPPYHPKQKRFPHRQPLRYLDRYRDSHEPTYGIY\n>1z7n_E mol:protein length:208  ATP phosphoribosyltransferase\nMIKIAITKGRIQKQVTKLLENADYDVEPILNLGRELQIKTKDDLQIIFGKPNDVITFLEHGIVDIGFVGKDTLDENDFDDYYELLYLKIGQCIFALASYPDFSNKNFQRHKRIASKYPRVTKKYFAQKQEDIEIIKLEGSVELGPVVGLADAIVDIVETGNTLSANGLEVIEKISDISTRMIVNKSSFKFKKDKIIEMVERLEDAQTN\n>1ygz_A mol:protein length:173  Inorganic 
pyrophosphatase\nMNLEKLEVSHDADSLCVVIEISKHSNIKYELDKESGALMVDRVLYGAQNYPANYGFVPNTLGSDGDPVDALVLSDVAFQAGSVVKARLVGVLNMEDESGMDEKLIALPIDKIDPTHSYVKDIDDLSKHTLDKIKHFFETYKDLEPNKWVKVKGFENKESAIKVLEKAIKAYQG\n>5rkm_A mol:protein length:149  PH-interacting protein\nMHHHHHHSSGVDLGTENLYFQSMSYDIQAWKKQCEELLNLIFQCEDSEPFRQPVDLLEYPDYRDIIDTPMDFATVRETLEAGNYESPMELCKDVRLIFSNSKAYTPSKRSRIYSMSLRLSAFFEEHISSVLSDYKSALRFHKRNTITKR\n>4dvi_B mol:protein length:217  Tankyrase-1\nQGTILLDLAPEDKEYQSVEEEMQSTIREHRDGGNAGGIFNRYNVIRIQKVVNKKLRERFCHRQKEVSEENHNHHNERMLFHGSPFINAIIHKGFDERHAYIGGMFGAGIYFAENSSKSNQYVYGIGGGTGCPTHKDRSCYICHRQMLFCRVTLGKSFLQFSTMKMAHAPPGHHSVIGRPSVNGLAYAEYVIYRGEQAYPEYLITYQIMKPEHHHHHH\n>6xu6_CD mol:protein length:290  60S ribosomal protein L5\nKNKQYFKRYQVKFRRRREGKTDYYARKRLTFQDKNKYNTPKYRLIVRLSNKDITVQIAYARIEGDRVVCAAYSHELPKYGIQVGLTNYAAAYCTGLLVARRVLNKLGLDSLYAGCTEVTGEEFNVEPVDDGPGAFRCFLDVGLARTTTGARVFGAMKGAVDGGLNIPHSVKRFPGYSAETKSFNADVHRAHIFGQHVADYMRSLEEEDEESFKRQFSRYIKLGIRADDLEDIYKKAHQAIRNDPTHKVTAKKSSAVTKKRWNAKKLTNEQRKTKIAAHKAAYVAKLQSET\n>6m0s_E mol:protein length:159  V-type proton ATPase subunit c\nMTELCPVYAPFFGAIGCASAIIFTSLGAAYGTAKSGVGICATCVLRPDLLFKNIVPVIMAGIIAIYGLVVSVLVCYSLGQKQALYTGFIQLGAGLSVGLSGLAAGFAIGIVGDAGVRGSSQQPRLFVGMILILIFAEVLGLYGLIVALLLNSRATQDVV\n>7ckb_Bj mol:protein length:98  Major carboxysome shell protein 1A\nMADVTGIALGMIETRGLVPAIEAADAMTKAAEVRLVGRQFVGGGYVTVLVRGETGAVNAAVRAGADACERVGDGLVAAHIIARVHSEVENILPKAPQA\n>7l6g_B mol:protein length:299  Metallo-mystery pair system four-Cys motif protein\nAGVKTQPVAVRFALVADGKEVGCGAPLANLGSGRLAGKLHEARLYVYGFELVDAKGKHTPIALTQNDWQYADVALLDFKDARGGNAACTPGNPAKNTTVVGAAPQGAYVGLAFSVGAPVESLVDGKPVFVNHSNVEAAPPPLDISGMAWNWQAGRRFVTIEVIPPAAVIKPDGSKSRTWMVHVGSTGCKGNPATGEIVACAHENRFPVVFDRFDPKTQRVELDLTTLFESSDISVDKGGAVGCMSALDDPDCPAVFRALGLNLADSAPGANDAGKPSRPGVSPIFSVGAAASKVAGGKQ\n>3lcb_C mol:protein length:416  Isocitrate dehydrogenase 
[NADP]\nMESKVVVPAQGKKITLQNGKLNVPENPIIPYIEGDGIGVDVTPAMLKVVDAAVEKAYKGERKISWMEIYTGEKSTQVYGQDVWLPAETLDLIREYRVAIKGPLTTPVGGGIRSLNVALRQELDLYICLRPVRYYQGTPSPVKHPELTDMVIFRENSEDIYAGIEWKADSADAEKVIKFLREEMGVKKIRFPEHCGIGIKPCSEEGTKRLVRAAIEYAIANDRDSVTLVHKGNIMKFTEGAFKDWGYQLAREEFGGELIDGGPWLKVKNPNTGKEIVIKDVIADAFLQQILLRPAEYDVIACMNLNGDYISDALAAQVGGIGIAPGANIGDECALFEATHGTAPKYAGQDKVNPGSIILSAEMMLRHMGWTEAADLIVKGMEGAINAKTVTYDFERLMDGAKLLKCSEFGDAIIENM\n>2wl6_A mol:protein length:392  ACETYL-COA ACETYLTRANSFERASE\nSTPSIVIASAARTAVGSFNGAFANTPAHELGATVISAVLERAGVAAGEVNEVILGQVLPAGEGQNPARQAAMKAGVPQEATAWGMNQLCGSGLRAVALGMQQIATGDASIIVAGGMESMSMAPHCAHLRGGVKMGDFKMIDTMIKDGLTDAFYGYHMGTTAENVAKQWQLSRDEQDAFAVASQNKAEAAQKDGRFKDEIVPFIVKGRKGDITVDADEYIRHGATLDSMAKLRPAFDKEGTVTAGNASGLNDGAAAALLMSEAEASRRGIQPLGRIVSWATVGVDPKVMGTGPIPASRKALERAGWKIGDLDLVEAHEAFAAQACAVNKDLGWDPSIVNVNGGAIAIGNPIGASGARILNTLLFEMKRRGARKGLATLCIGGGMGVAMCIESL\n>6qz0_6E mol:protein length:448  Major capsid protein\nMRITFNDVKTSLGITESYDIVNAIRNSQGDNFKSYVPLATANNVAEVGAGILINQTVQNDFITSLVDRIGLVVIRQVSLNNPLKKFKKGQIPLGRTIEEIYTDITKEKQYDAEEAEQKVFEREMPNVKTLFHERNRQGFYHQTIQDDSLKTAFVSWGNFESFVSSIINAIYNSAEVDEYEYMKLLVDNYYSKGLFTTVKIDEPTSSTGALTEFVKKMRATARKLTLPQGSRDWNSMAVRTRSYMEDLHLIIDADLEAELDVDVLAKAFNMNRTDFLGNVTVIDGFASTGLEAVLVDKDWFMVYDNLHKMETVRNPRGLYWNYYYHVWQTLSVSRFANAVAFVSGDVPAVTQVIVSPNIAAVKQGGQQQFTAYVRATNAKDHKVVWSVEGGSTGTAITGDGLLSVSGNEDNQLTVKATVDIGTEDKPKLVVGEAVVSIRPNNASGGAQA\n>5ez8_D mol:protein length:31  CC-Hept-I-C-I\nXGEIAQALKEIAKALKEIAWACKEIAQALKG\n>7jqm_2H mol:protein length:180  50S ribosomal protein L6\nMSRIGRLPIPVPKGVSVEVAPGRVKVKGPKGELEVPVSPEMRVVVEEGVVRVERPSDERRHKSLHGLTRTLIANAVKGVSEGYSKELLIKGIGYRARLVGRALELTVGFSHPVVVEPPEGITFEVPEPTRVRVSGIDKQKVGQVAANIRAIRKPSAYHEKGIYYAGEPVRLKPGKAGAKK\n>7ck8_B mol:protein length:173  Ferritin heavy chain\nSTSQVRQNYHQDSEAAINRQINLELYASYVYLSMSYYFDRDDVALKNFAKYFLHQSHEEREHAEKLMKLQNQRGGRIFLQDIKKPDSDDWESGLNAMESALHLEKNVNQSLLELHKLATDKNDPHLSDFIETHYLNEQVKAIKELGDHVTNLRKMGAPESGLAEYLFDKHTLG\n>5gaq_C mol:protein length:310  
Lysenin\nMSAKAAEGYEQIEVDVVAVWKEGYVYENRGSTSVDQKITITKGMKNVNSETRTVTATHSIGSTISTGDAFEIGSVEVSYSHSHEESQVSMTETEVYESKVIEHTITIPPTSKFTRWQLNADVGGADIEYMYLIDEVTPIGGTQSIPQVITSRAKIIVGRQIILGKTEIRIKHAERKEYMTVVSRKSWPAATLGHSKLFKFVLYEDWGGFRIKTLNTMYSGYEYAYSSDQGGIYFDQGTDNPKQRWAINKSLPLRHGDVVTFMNKYFTRSGLCYDDGPATNVYCLDKREDKWILEVVGLVPRGSGHHHHHH\n>2g2w_B mol:protein length:165  Beta-lactamase inhibitory protein\nAGVMTGAKFTQIQFGMTRQQVLDIAGAENCETGGSFGDSIHCRGHAAGDYYAYATFGFTSAAADAKVDSKSQEKLLAPSAPTLTLAKFNQVTVGMTRAQVLATVGQGSCTTWSEYYPAYPSTAGVTLSLSCFDVDGYSSTGFYRGSAHLWFTDGVLQGKRQWDLV\n>1egm_G mol:protein length:173  PROPANEDIOL DEHYDRATASE\nMNTDAIESMVRDVLSRMNSLQGEAPAAAPAAGGASRSARVSDYPLANKHPEWVKTATNKTLDDFTLENVLSNKVTAQDMRITPETLRLQASIAKDAGRDRLAMNFERAAELTAVPDDRILEIYNALRPYRSTKEELLAIADDLESRYQAKICAAFVREAATLYVERKKLKGDD\n>4oko_B mol:protein length:312  Rapid Encystment Phenotype Protein 34 KDa\nMPAQYHIGTPGKKWGSEEKSQWLAEQNKKRSYQQEAEKKILALVSDFDIDEYGQLDYPVGSYKLYALKTKNWDASKPYVLVTGGVHGYETSGVQGAISFAQTRALEFARDYNIVILPCLSPWGYETINRWNPNALDPNRSFYLESGCQEAVLAMKYVFSLGVEFLMHIDLHETTDTDDSEFRPALAAREGIAINKWGIPDGFYLVANNRNPHYDFQKYIIDAVAKVTHIAPTDPSINILGDDIIRDGIMACDSDKERLCMSFTTAEYTTTTEVYPDSPRTNPQECILAQVEAIVAGLNFLKQKNLEHHHHHH\n>4cih_B mol:protein length:150  LISTERIA NUCLEAR TARGETED PROTEIN A\nRPKLSTKDLALIKADLAEFEARELSSEKILKDTIKEESWSDLDFANDNINQMIGTMKRYQQEILSIDAIKRSSEASADTEAFKKIFKEWSEFKIERIQVTIDLLNGKKDSEAVFKKTYPNQIIFDDVRTNKLQTALNNLKVGYELLDSQK\n>6k3a_A mol:protein length:264  Proliferating cell nuclear antigen\nGPGMFEARLVQGSILKKVLEALKDLINEACWDISSSGVNLQSMDSSHVSLVQLTLRSEGFDTYRCDRNLAMGVNLTSMSKILKCAGNEDIITLRAEDNADTLALVFEAPNQEKVSDYEMKLMDLDVEQLGIPEQEYSCVVKMPSGEFARICRDLSHIGDAVVISCAKDGVKFSASGELGNGNIKLSQTSNVDKEEEAVTIEMNEPVQLTFALRYLNFFTKATPLSSTVTLSMSADVPLVVEYKIADMGHLKYYLAPKIEDEEGS\n>1myw_A mol:protein length:239  Green fluorescent 
protein\nMVSKGEELFTGVVPILVELDGDVNGHKFSVSGEGEGDATYGKLTLKLICTTGKLPVPWPTLVTTLGYGLQCFARYPDHMKQHDFFKSAMPEGYVQERTIFFKDDGNYKTRAEVKFEGDTLVNRIELKGIDFKEDGNILGHKLEYNYNSHNVYITADKQKNGIKANFKIRHNIEDGGVQLADHYQQNTPIGDGPVLLPDNHYLSYQSALSKDPNEKRDHMVLLEFVTAAGITHGMDELYK\n>5zmu_A mol:protein length:314  Cis-epoxysuccinate hydrolase\nMGSSHHHHHHSSGLVPRGSHMTRTKLILEARINEYMPRRGNPHVPWTPKEIGEAAAQAREAGASIVHFHARQADGSPSHDYETYAESIREIRARSDVLVHPTLGQITLGGRESRLAHIERLCLDPALKPDFAPVDLGSTNIDRYDDVEKRYETGDRVYLNNIDTLQHFSKRLRELGVKPAFIAWTVPFTRTLDAFMDMGLVDDPAYLLFELTDCGIRGGHPGTIRGLRAHTDFLPPGRQIQWTVCNKIGNLFGPAAAAIEEGGHVAIGLGDYLYPELGTPTNGEVVQTVANMARAMGREIATPAETKEILGISN\n>6yfb_CB mol:protein length:166  coat protein\nSYTQSFGYTIPTEKDTLEIPQYQALLAKKASYMDDSQGKNTATYMNTAAPKDQPETITFGVNKVDNVYKQSNVQNQTFYASSSKGTKIRIDGKRIWRTQSTDVNTGLPVIVDCPLWTSFTLGFADFTLVDDSARKSTIEWMISQLELLKDDGVWSKLCSGVTRIYG\n>1j0a_A mol:protein length:325  1-aminocyclopropane-1-carboxylate deaminase\nMHPKIFALLAKFPRVELIPWETPIQYLPNISREIGADVYIKRDDLTGLGIGGNKIRKLEYLLGDALSKGADVVITVGAVHSNHAFVTGLAAKKLGLDAILVLRGKEELKGNYLLDKIMGIETRVYDAKDSFELMKYAEEIAEELKREGRKPYVIPPGGASPIGTLGYVRAVGEIATQSEVKFDSIVVAAGSGGTLAGLSLGLSILNEDIRPVGIAVGRFGEVMTSKLDNLIKEAAELLGVKVEVRPELYDYSFGEYGKITGEVAQIIRKVGTREGIILDPVYTGKAFYGLVDLARKGELGEKILFIHTGGISGTFHYGDKLLSLL\n>4hgj_B mol:protein length:455  Bifunctional P-450/NADPH-P450 reductase\nTIKEMPQPKTFGELKNLPLLNTDKPVQALMKIADELGEIFKFEAPGRVTRYLSSQRLIKEACDESRFDKNLSQALKFVRDFAGDGLATSWTHEKNWKKAHNILLPSFSQQAMKGYHAMMVDIAVQLVQKWERLNADEHIEVPEDMTRLTLDTIGLCGFNYRFNSFYRDQPHPFITSMVRALDEAMNKLQRANPDDPAYDENKRQFQEDIKVMNDLVDKIIADRKASGEQSDDLLAHMLNGKDPETGEPLDDENIRYQIITFLIAGHETTSGLLSFALYFLVKNPHVLQKAAEEAARVLVDPVPSYKQVKQLKYVGMVLNEALRLWPTAPAFSLYAKEDTVLGGEYPLEKGDELMVLIPQLHRDKTIWGDDVEEFRPERFENPSAIPQHAFKPFGNGQRACIGQQFALHEATLVLGMMLKHFDFEDHTNYELDIKETLTLKPEGFVVKAKSKKIPL\n>6vmi_5 mol:protein length:423  39S ribosomal protein L37, 
mitochondrial\nMALASGPARRALAGSGQLGLGGFGAPRRGAYEWGVRSTRKSEPPPLDRVYEIPGLEPITFAGKMHFVPWLARPIFPPWDRGYKDPRFYRSPPLHEHPLYKDQACYIFHHRCRLLEGVKQALWLTKTKLIEGLPEKVLSLVDDPRNHIENQDECVLNVISHARLWQTTEEIPKRETYCPVIVDNLIQLCKSQILKHPSLARRICVQNSTFSATWNRESLLLQVRGSGGARLSTKDPLPTIASREEIEATKNHVLETFYPISPIIDLHECNIYDVKNDTGFQEGYPYPYPHTLYLLDKANLRPHRLQPDQLRAKMILFAFGSALAQARLLYGNDAKVLEQPVVVQSVGTDGRVFHFLVFQLNTTDLDCNEGVKNLAWVDSDQLLYQHFWCLPVIKKRVVVEPVGPVGFKPETFRKFLALYLHGAA\n>6uzq_C mol:protein length:9  Synthetic peptide THR-VAL-ARG-ALA-SER-GLY-HIS-SER-TYR\nTVRASGHSY\n>6wwl_A mol:protein length:451  Tubulin alpha-1B chain\nMRECISIHVGQAGVQIGNACWELYCLEHGIQPDGQMPSDKTIGGGDDSFNTFFSETGAGKHVPRAVFVDLEPTVIDEVRTGTYRQLFHPEQLITGKEDAANNYARGHYTIGKEIIDLVLDRIRKLADQCTGLQGFLVFHSFGGGTGSGFTSLLMERLSVDYGKKSKLEFSIYPAPQVSTAVVEPYNSILTTHTTLEHSDCAFMVDNEAIYDICRRNLDIERPTYTNLNRLISQIVSSITASLRFDGALNVDLTEFQTNLVPYPRIHFPLATYAPVISAEKAYHEQLSVAEITNACFEPANQMVKCDPRHGKYMACCLLYRGDVVPKDVNAAIATIKTKRSIQFVDWCPTGFKVGINYQPPTVVPGGDLAKVQRAVCMLSNTTAIAEAWARLDHKFDLMYAKRAFVHWYVGEGMEEGEFSEAREDMAALEKDYEEVGVDSVEGEGEEEGEEY\n>7l20_D mol:protein length:305  39S ribosomal protein L2, mitochondrial\nMALCALTRALRSLNLAPPTVAAPAPSLFPAAQMMNNGLLQQPSALMLLPCRPVLTSVALNANFVSWKSRTKYTITPVKMRKSGGRDHTGRIRVHGIGGGHKQRYRMIDFLRFRPEETKSGPFEEKVIQVRYDPCRSADIALVAGGSRKRWIIATENMQAGDTILNSNHIGRMAVAAREGDAHPLGALPVGTLINNVESEPGRGAQYIRAAGTCGVLLRKVNGTAIIQLPSKRQMQVLETCVATVGRVSNVDHNKRVIGKAGRNRWLGKRPNSGRWHRKGGWAGRKIRPLPPMKSYVKLPSASAQS\n>7d28_D mol:protein length:117  Endoribonuclease MazF\nMVSDYVPDAGHLVWLNFTPQAGHEQGGRRPALVLSPAAYNGVTGLMQACPVTSRAKGYPFEVTLPAHLGVSGVVLADHCRSLDWRSRRAEQLAEAPADVLAEVRGKLGSLLGMSEKA\n>6hvu_b mol:protein length:196  Proteasome subunit beta type-1\nTSIMAVTFKDGVILGADSRTTTGAYIANRVTDKLTRVHDKIWCCRSGSAADTQAIADIVQYHLELYTSQYGTPSTETAASVFKELCYENKDNLTAGIIVAGYDDKNKGEVYTIPLGGSVHKLPYAIAGSGSTFIYGYCDKNFRENMSKEETVDFIKHSLSQAIKWDGSSGGVIRMVVLTAAGVERLIFYPDEYEQL\n>2nyz_E mol:protein length:93  
Lymphotactin\nVGSEVSDKRTCVSLTTQRLPVSRIKTYTITEGSLRAVIFITKRGLKVCADPQATWVRDVVRSMDRKSNTRNNMIQTKPTGTQQSTNTAVTLTG\n>5sce_D mol:protein length:447  Pyruvate kinase\nGSMEGPAGYLRRADVAQLTQELGTAFFQQQQLPAAMADTFLEHLCLLDIDSEPVAARSTSIIATIGPASRSVERLKEMIKAGMNIARLNFSHGSHEYHAESIANVREAVESFAGSPLSYRPVAIALDTKGPGSGPGLSEQDVRDLRFGVEHGVDIVFASFVRKASDVAAVRAALGPEGHGIKIISKIENHEGVKRFDEILEVSDGIMVARGDLGIEIPAEKVFLAQKMMIGRCNLAGKPVVCATQMLESMITKPRPTRAETSDVANAVLDGADCIMLSGETAKGNFPVEAVKMQHAIAREAEAAVYHRQLFEELRRAAPLSRDPTEVTAIGAVEAAFKCCAAAIIVLTTTGRSAQLLSRYRPRAAVIAVTRSAQAARQVHLCRGVFPLLYREPPEAIWADDVDRRVQFGIESGKLRGFLRVGDLVIVVTGWRPGSGYTNIMRVLSIS\n>7qrv_B mol:protein length:281  Tripartite motif-containing protein 2\nSMNPIEDDLIFRVGTKGRNKGEFTNLQGVAASTNGKILIADSNNQCVQIFSNDGQFKSRFGIRGRSPGQLQRPTGVAVHPSGDIIIADYDNKWVSIFSSDGKFKTKIGSGKLMGPKGVSVDRNGHIIVVDNKACCVFIFQPNGKIVTRFGSRGNGDRQFAGPHFAAVNSNNEIIITDFHNHSVKVFNQEGEFMLKFGSNGEGNGQFNAPTGVAVDSNGNIIVADWGNSRIQVFDGSGSFLSYINTSADPLYGPQGLALTSDGHVVVADSGNHCFKVYRYLQ\n>6wef_L mol:protein length:159  Uncharacterized protein\nGGEVPIGDPKELNGMEIAAVYLQPIEMEPRGIDLAASLADIHLEADIHALKNNPNGFPEGFWMPYLTIAYELKNTDTGAIKRGTLMPMVADHGPHYGANIAMEKDKKGGFGVGNYELTFYISNPEKQGFGRHVDEETGVGKWFEPFKVDYKFKYTGTPK\n>1v2a_A mol:protein length:210  glutathione transferase gst1-6\nMDYYYSLISPPCQSAILLAKKLGITLNLKKTNVHDPVERDALTKLNPQHTIPTLVDNGHVVWESYAIVLYLVETYAKDDTLYPKDPKVRSVVNQRLFFDIGTLYKRIIDVIHLVMKKEQPSDEQMEKLKGALDLLEQFVTERAYAAADHLTVADICLLGTVTALNWLKHDLEPFPHIRAWLERVRAEMPDYEEFSKQVADDTLAYVASRK\n>6onk_B mol:protein length:137  Dehaloperoxidase B\nGFKQDIATLRGDLRTYAQDIFLAFLNKYPDEKRNFKNYVGKSDQELKSMAKFGDHTEKVFNLMMEVADRATDCVPLASDASTLVQMKQHSGLTTGNFEKLFVALVEYMRASGQSFDSQSWDRFGKNLVSALSSAGMK\n>4v8e_CG mol:protein length:182  50S ribosomal protein L5\nMPLDVALKRKYYEEVRPELIRRFGYQNVWEVPRLEKVVINQGLGEAKEDARILEKAAQELALITGQKPAVTRAKKSISNFKLRKGMPIGLRVTLRRDRMWIFLEKLLNVALPRIRDFRGLNPNSFDGRGNYNLGLREQLIFPEITYDMVDALRGMDIAVVTTAETDEEARALLELLGFPFRK\n>7d1t_b mol:protein length:505  Photosystem II CP47 reaction center 
protein\nGLPWYRVHTVLINDPGRLIAAHLMHTALVAGWAGSMALYELATFDPSDPVLNPMWRQGMFVLPFMARLGVTGSWSGWSITGETGIDPGFWSFEGVALAHIVLSGLLFLAACWHWVYWDLELFRDPRTGEPALDLPKMFGIHLFLAGLLCFGFGAFHLTGLFGPGMWVSDPYGLTGSVQPVAPEWGPDGFNPYNPGGVVAHHIAAGIVGIIAGLFHILVRPPQRLYKALRMGNIETVLSSSIAAVFFAAFVVAGTMWYGSATTPIELFGPTRYQWDSSYFQQEINRRVQASLASGATLEEAWSAIPEKLAFYDYIGNNPAKGGLFRTGPMNKGDGIAQAWKGHAVFRNKEGEELFVRRMPAFFESFPVILTDKNGVVKADIPFRRAESKYSFEQQGVTVSFYGGELNGQTFTDPPTVKSYARKAIFGEIFEFDTETLNSDGIFRTSPRGWFTFAHAVFALLFFFGHIWHGARTLFRDVFSGIDPELSPEQVEWGFYQKVGDVTTRK\n>1swr_B mol:protein length:127  CORE-STREPTAVIDIN\nAEAGITGTWYNQLGSTFIVTAGADGALTGTYESAVGNAESRYVLTGRYDSAPATDGSGTALGWTVAWKNNYRNAHSATTWSGQYVGGAEARINTQWLLTSGTTEANAAKSTLVGHDTFTKVKPSAAS\n>5xke_B mol:protein length:445  Tubulin beta chain\nMREIVHIQAGQCGNQIGAKFWEVISDEHGIDPTGSYHGDSDLQLERINVYYNEATGNKYVPRAILVDLEPGTMDSVRSGPFGQIFRPDNFVFGQSGAGNNWAKGHYTEGAELVDSVLDVVRKESESCDCLQGFQLTHSLGGGTGSGMGTLLISKIREEYPDRIMNTFSVMPSPKVSDTVVEPYNATLSVHQLVENTDETYCIDNEALYDICFRTLKLTTPTYGDLNHLVSATMSGVTTCLRFPGQLNADLRKLAVNMVPFPRLHFFMPGFAPLTSRGSQQYRALTVPELTQQMFDSKNMMAACDPRHGRYLTVAAIFRGRMSMKEVDEQMLNVQNKNSSYFVEWIPNNVKTAVCDIPPRGLKMSATFIGNSTAIQELFKRISEQFTAMFRRKAFLHWYTGEGMDEMEFTEAESNMNDLVSEYQQYQDATADEQGEFEEEGEEDEA\n>6nx9_A mol:protein length:333  L-asparaginase 2\nMHHHHHHLPNITILATGGTIAGGGDSATKSNYTVGKVGVENLVNAVPQLKDIANVKGEQVVNIGSQDMNDNVWLTLAKKINTDCDKTDGFVITHGTTTMEETAYFLDLTVKCDKPVVMVGAMRPSTSMSADGPFNLYNAVVTAADKASANRGVLVVMNDTVLDGRDVTTTNTTDVATFKSVNYGPLGYIHNGKIDYQRTPARKHTSDTPFDVSKLNELPKVGIVYNYANASDLPAKALVDAGYDGIVSAGVGNGNLYKSVFDTLATAAKTGTAVVRSSRVPTGATTQDAEVDDAKYGFVASGTLNPQKARVLLQLALTQTKDPQQIQQIFNQY\n>2qr0_S mol:protein length:213  Fab-Fragment Light Chain\nDIQMTQSPSSLSASVGDRVTITCRASQSVSSAVAWYQQKPGKAPKLLIYSASSLYSGVPSRFSGSRSGTDFTLTISSLQPEDFATYYCQQYSYYYYPFTFGQGTKVEIKRTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNR\n>4v7v_B2 mol:protein length:46  50S ribosomal protein L34\nMKRTFQPSVLKRNRSHGFRARMATKNGRQVLARRRAKGRARLTVSK\n>5lze_r mol:protein length:65  30S 
ribosomal protein S18\nFCRFTAEGVQEIDYKDIATLKNYITESGKIVPSRITGTRAKYQRQLARAIKRARYLSLLPYTDRH\n>7b4v_A mol:protein length:132  Broadly neutralizing DARPin bnD.2\nGPGSDLGKKLLEAARAGQDDEVRILMANGADVNASDADVGATPLHLAAWAGHLEIVEVLLKTGADVNAVDIWGLTPLHLAAAVGHLEIVEVLLKHGADVNAQDKFGKTPFDLAIDNGNEDIAEVLQKAAKLN\n>7xjh_R mol:protein length:395  Beta-3 adrenergic receptor\nDYKDDDDAMGAPWPHGNGSVASWPAAPTPTPDAANTSGLPGAPWAVALAGALLALEVLATVGGNLLVIVAIARTPRLQTMTNVFVTSLATADLVVGLLVVPPGATLALTGRWPLGATGCELWTSVDVLCVTASIETLCALAVDRYLAVTNPLRYGALVTKRRARAAVVLVWVVSAAVSFAPIMSKWWRVGADAEAQRCHSNPHCCAFASNIPYALLSSSVSFYLPLLVMLFVYARVFLVATRQLRLLRRELGRFPPAESPPAASRSRSPGPARRCASPAAVPSDRLRPARLLPLREHRALRTLGLIVGTFTLCWLPFFVANVMRALGGPSLVPSPALLALNWLGYANSAFNPLIYCRSPDFRSAFRRLLCRCRREEHRAAASPPGDPSENLYFQG\n>6bx1_z mol:protein length:540  VP2\nSGVGHSTGNYNNRTIFHYHGDEVTIICHATRHIHLNMSPTEEYKIYDTNHGPEFPNTGDQTQQGRNTVNDSYHAKVETPWYLINPNSWGIWFNPADFQQLITTCTHVTIETLTQEIDNIVIKTVSKQGSGAEETTQYNNDLTALLEVALDKSNMLPWVADNMYLNSLGYIPWRPCKLTQFCYHTNFYNTINLLEGTQQNQWSQIKEGIQYDNLQFTPIETSAEIDLLRTGDSWTSGTYHFKCKPTQLFYHWQSTRHIGAPHPTTSPEQEGQKGQIIQDTNGWQWGDRDNPISASTTVKDFHIGYSWPEWRWHYSTGGPSINPGSAFSQTPWGSEVGGTRLTQGASEKAIFDYNHGEAEPGHRDQWWQNNAQQTGQTNWAIKNAHQSELRNATASRETFWTQDYHNTFGPYTAVDDVGIQYPWGAMWGKQPDTTHKPMMSAHAPFTCQNGPPGQLLVKLAPNYTDSLNNEGLQTNRIVTFATFWWTGRCTFKAKLRTPRQFNAYQLPGIPSGTNPKKFVPDAIGRFELPFMPGRAMPNYTY\n>7lkj_D mol:protein length:423  Aminofutalosine deaminase\nMHHHHHHENLYFQGMQEIIGASLVFLCNEKCEVLEDYGVVFDEKIVEIGDYHNLTLKYPHLKAQFFENSVLLPAFINAHTHFEFSNNKASFDYGSFSGWLGSVLNNGGAILENCQGAIQNAIMAQLKSGVGSVGAISNHLIEVNLLKESPLNAVVFLEFLGSSYSLEKLKAFEAKFKELKDLEDQKLKAALAVHAPYSVQKDMALSVIQLAKDSQSLLSTHFLESLEELEWVENSKGWFENFYQRFLKESNFTSLYEGANDYIDMFKDTHTLFVHNQFASLEALKRIKSQVKNAFLITCPFSNRLLSGKALDLERVREAGLSVSVATDGLSSNISLSLLDELRAFLLSHNMPLLELAKIALLGATRHGAKALALNNGEIETNKRADLSVFGFNEKFTKEQAILQFLLHAKEVERLFLGGKRVI\n>4xuc_A mol:protein length:218  Catechol 
O-methyltransferase\nNLLAGDTKEQRILNHVLQHAEPGNAQSVLEAIDTYCEQKEWAMNVGDKKGKIVDAVIQEHQPSVLLELGAYCGYSAVRMARLLSPGARLITIEINPDCAAITQRMVDFAGVKDKVTLVVGASQDIIPQLKKKYDVDTLDMVFLDHWKDRYLPDTLLLEECGLLRKGTVLLADNVICPGAPDFLAHVRGSSCFECTHYQSFLEYREVVDGLEKAIYKGP\n>3l0s_A mol:protein length:223  Adenylate kinase\nMNILIFGPNGSGKGTQGNLVKDKYSLAHIESGGIFREHIGGGTELGKKAKEFIDRGDLVPDDITIPMVLETLESKGKDGWLLDGFPRNTVQAQKLFEALQEKGMKINFVIEILLPREVAKNRIMGRRICKNNPNHPNNIFIEAIKPNGDVCRVCGGALSARADDQDEGAINKRHDIYYNTVDGTLAAAYYYKNMAAKEGFVYIELDGEGSIDSIKDTLLAQLA\n>7rqc_2P mol:protein length:150  50S ribosomal protein L15\nMKLSDLRPNPGANKRRKRVGRGPGSGHGKTATRGHKGQKSRSGGLKDPRRFEGGRSTTLMRLPKRGMQGQVPGEIKRPRYQGVNLKDLARFEGEVTPELLVRAGLLKKGYRLKILGEGEAKPLKVVAHAFSKSALEKLKAAGGEPVLLEA\n>4yus_A mol:protein length:382  Family 3 adenylate cyclase\nMNHKVHHHHHHIEGRHMKRLTYISKFSRPLSGDEIEAIGRISSQKNQQANVTGVLLCLDGIFFQILEGEAEKIDRIYERILADERHTDILCLKSEVEVQERMFPDWSMQTINLDENTDFLIRPIKVLLQTLTESHRILEKYTQPSIFKIISQGTNPLNIRPKAVEKIVFFSDIVSFSTFAEKLPVEEVVSVVNSYFSVCTAIITRQGGEVTKFIGDCVMAYFDGDCADQAIQASLDILMELEILRNSAPEGSPLRVLYSGIGLAKGKVIEGNIGSELKRDYTILGDAVNVAARLEALTRQLSQALVFSSEVKNSATKSWNFIWLTDSELKGKSESIDIYSIDNEMTRKSSGGLEIARNIGHYLERVGDRQPSQIFGVKSLPL\n>1ziq_A mol:protein length:173  Gamma crystallin E\nGKITFYEDRGFQGRHYECSTDHSNLQPYFSRCNSVRVDSGCWMLYEQPNFTGCQYFLRRGDYPDYQQWMGFSDSVRSCRLIPHSSSHRIRIYEREDYRGQMVEITDDCPHLQDRFHFSDFHSFHVMEGYWVLYEMPNYRGRQYLLRPGEYRRYHDWGAMNARVGSLRRIMDFY\n>4qx8_D mol:protein length:68  Lysine-specific demethylase 2A\nQVHLTHFELEGLRCLVDKLESLPLHKKCVPTGIEDEDALIADVKILLEELASSDPKLALTGVPIVQWP\n>6r0z_B mol:protein length:578  V-type ATP synthase alpha 
chain\nMIQGVIQKIAGPAVIAKGMLGARMYDICKVGEEGLVGEIIRLDGDTAFVQVYEDTSGLKVGEPVVSTGLPLAVELGPGMLNGIYDGIQRPLERIREKTGIYITRGVVVHALDREKKWAWTPMVKPGDEVRGGMVLGTVPEFGFTHKILVPPDVRGRVKEVKPAGEYTVEEPVVVLEDGTELKMYHTWPVRRARPVQRKLDPNTPFLTGMRILDVLFPVAMGGTAAIPGPFGSGKTVTQQSLAKWSNADVVVYVGCGERGNEMTDVLVEFPELTDPKTGGPLMHRTVLIANTSNMPVAAREASIYVGVTIAEYFRDQGFSVALMADSTSRWAEALREISSRLEEMPAEEGYPPYLAARLAAFYERAGKVITLGGEEGAVTIVGAVSPPGGDMSEPVTQSTLRIVGAFWRLDASLAFRRHFPAINWNGSYSLFTSALDPWYRENVAEDYPELRDAISELLQREAGLQEIVQLVGPDALQDAERLVIEVGRIIREDFLQQNAYHEVDAYCSMKKAYGIMKMILAFYKEAEAAIKRGVSIDEILQLPVLERIGRARYVSEEEFPAYFEEAMKEIQGAFKALA\n>6fl9_E mol:protein length:320  Cys-loop ligand-gated ion channel\nMASLAAEPSDVFIGLKIDQITGINQKEENFSVVGSLRIDWRQPLLAFEHAPGEPKHRTYTLATFLKLLEEKQIRWPAFTYHNQQGRMDFQNRLISLSEDGTVMYLERFTSTFQAPAFDFRLFPFDNQLFFIHVDSIFPQHLFRFQEMQGFSGLGDQLGEEEWIVTEVNTHLTTHNEFTKGDASRFVLEFHAERHLNYYLMRILIPVLLIITVSWFTFFLQDYTKRIDLAGGNLLLFIAFNFTISSDLPRLGYITLMDAFLVGTFIITALVVLGNVWLRRLENHGKQALARKLDIYAITSYPLAYLLGALTLWLLFFWRSY\n>7som_CC mol:protein length:443  Tubulin beta\nMREIVHIQGGQCGNQIGAKFWEVVSDEHGIDPTGTYHGDSDLQLERINVYFNEATGGRYVPRAILMDLEPGTMDSVRSGPYGQIFRPDNFVFGQTGAGNNWAKGHYTEGAELIDSVLDVVRKEAESCDCLQGFQVCHSLGGGTGSGMGTLLISKIREEYPDRMMLTFSVVPSPKVSDTVVEPYNATLSVHQLVENADECMVLDNEALYDICFRTLKLTTPTFGDLNHLISAVMSGITCCLRFPGQLNADLRKLAVNLIPFPRLHFFMVGFTPLTSRGSQQYRALTVPELTQQMWDAKNMMCAADPRHGRYLTASALFRGRMSTKEVDEQMLNVQNKNSSYFVEWIPNNVKSSVCDIPPKGLKMSATFIGNSTAIQEMFKRVSEQFTAMFRRKAFLHWYTGEGMDEMEFTEAESNMNDLVSEYQQYQDASAEEEGEFEGEEEEA\n>4r8p_H mol:protein length:122  Histone H2B 1.1\nAKSAPAPKKGSKKAVTKTQKKDGKKRRKTRKESYAIYVYKVLKQVHPDTGISSKAMSIMNSFVNDVFERIAGEASRLAHYNKRSTITSREIQTAVRLLLPGELAKHAVSEGTKAVTKYTSAK\n>2euz_A mol:protein length:345  NDT80 
protein\nGPLGSMNEMENTDPVLQDDLVSKYERELSTEQEEDTPVILTQLNEDGTTSNYFDKRKLKIAPRSTLQFKVGPPFELVRDYCPVVESHTGRTLDLRIIPRIDRGFDHIDEEWVGYKRNYFTLVSTFETANCDLDTFLKSSFDLLVEDSSVEGRLRVQYFAIKIKAKNDDDDTEINLVQHTAKRDKGPQFCPSVCPLVPSPLPKHQTIREASNVRNITKMKKYDSTFYLHRDHVNYEEYGVDSLLFSYPEDSIQKVARYERVQFASSISVKKPSQQNKHFSLHVILGAVVDPDTFHGENPGIPYDELALKNGSKGMFVYLQEMKTPPLIIRGRSPSNYASSQRITVR\n>5e18_A mol:protein length:315  DNA-directed RNA polymerase subunit alpha\nMLDSKLKAPVFTVRTQGREYGEFVLEPLERGFGVTLGNPLRRILLSSIPGTAVTSVYIEDVLHEFSTIPGVKEDVVEIILNLKELVVRFLNPSLQTVTLLLKAEGPKEVKARDFLPVADVEIMNPDLHIATLEEGGRLNMEVRVDRGVGYVPAEKHGIKDRINAIPVDAVFSPVRRVAFQVEDTRLGQRTDLDKLTLRIWTDGSVTPLEALNQAVEILREHLTYFSNPQAAAVAAPEEAKEPEAPPEQEEELDLPLEELGLSTRVLHSLKEEGIESVRALLALNLKDLKNIPGIGERSLEEIKEALEKKGFTLKE\n>5xru_A mol:protein length:193  adenylate kinase\nMADKIKDAKIIFVVGGPGSGKGTQCEKIVAKYGYTHLSSGDLLRAEVSSGSERGKQLQAIMQKGELVPLDTVLDMIKDAMIAKADVSKGYLIDGYPREVKQGEEFEKKIGKPCLLLYIDAKGETMVKRLMKRGETSGRADDNEETIKKRLDLYYKATEPVIAFYEGRGIVRKIDSELPVDEVFKQVSTAIDAL\n>7oiz_l mol:protein length:136  50S ribosomal protein L16\nMLQPKRTKFRKMHKGRNRGLAQGTDVSFGSFGLKAVGRGRLTARQIEAARRAMTRAVKRQGKIWIRVFPDKPITEKPLAVRMGKGKGNVEYWVALIQPGKVLYEMDGVPEELAREAFKLAAAKLPIKTTFVTKTVM\n>7l08_4 mol:protein length:103  39S ribosomal protein L36, mitochondrial\nMANLFIRKMVNPLLYLSRHTVKPRALSTFLFGSIRGAAPVAVEPGAAVRSLLSPGLLPHLLPALGFKNKTVLKKRCKDCYLVKRRGRWYVYCKTHPRHKQRQM\n>5w5f_O mol:protein length:163  Tail tube protein gp19\nMFVDDVTRAFESGDFARPNLFQVEISYLGQNFTFQCKATALPAGIVEKIPVGFMNRKINVAGDRTFDDWTVTVMNDEAHDARQKFVDWQSIAAGQGNEITGGKPAEYKKSAIVRQYARDAKTVTKEIEIKGLWPTNVGELQLDWDSNNEIQTFEVTLALDYWE\n>1cah_A mol:protein length:259  CARBONIC ANHYDRASE II\nSHHWGYGKHNGPEHWHKDFPIAKGERQSPVDIDTHTAKYDPSLKPLSVSYDQATSLRILNNGHAFNVEFDDSQDKAVLKGGPLDGTYRLIQFHFHWGSLDGQGSEHTVDKKKYAAELHLVHWNTKYGDFGKAVQQPDGLAVLGIFLKVGSAKPGLQKVVDVLDSIKTKGKSADFTNFDPRGLLPESLDYWTYPGSLTTPPLLECVTWIVLKEPISVSSEQVLKFRKLNFNGEGEPEELMVDNWRPAQPLKNRQIKASFK\n>1rd4_D mol:protein length:191  Integrin 
alpha-L\nGAMSCIKGNVDLVFLFDGSMSLQPDEFQKILDFMKDVMKKLSNTSYQFAAVQFSTSYKTEFDFSDYVKRKDPDALLKHVKHMLLLTNTFGAINYVATEVFREELGARPDATKVLIIITDGEATDSGNIDAAKDIIRYIIGIGKHFQTKESQETLHKFASKPASEFVKILDTFEKLKDLFTELQKKIYVIEG\n>5tg8_A mol:protein length:332  Hemagglutinin HA1 chain\nADPGDKICLGHHAVANGTKVNTLTERGVEVVNATETVEITGIDKVCTKGKKAVDLGSCGILGTIIGPPQCDLHLEFKADLIIERRNSSDICYPGRFTNEEALRQIIRESGGIDKESMGFRYSGIRTDGATSACKRTVSSFYSEMKWLSSSMNNQVFPQLNQTYRNTRKEPALIVWGVHHSSSLDEQNKLYGTGNKLITVGSSKYQQSFSPSPGARPKVNGQAGRIDFHWMLLDPGDTVTFTFNGAFIAPDRATFLRSNAPSGIEYNGKSLGIQSDAQIDESCEGECFYSGGTINSPLPFQNIDSRAVGKCPRYVKQSSLPLALGMKNVPEKI\n>7pi2_E mol:protein length:231  Monoclonal antibody Cy.003 heavy chain\nAVTLDESGGGLQTPGGALSLVCKGSGFFSFSSYTMQWVRQAPGKGLEWVASISSGGGTNYGAAVKGRATISRDNGQSTLRLQLNNLRAEDTGTYYCAKHGVNGCDWSYSVGCVDAWGHGTEVIVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDK\n>7qyd_B mol:protein length:724  Pesticidal crystal protein Cry11Ba\nMQNNNFNTTEINNMINFPMYNGRLEPSLAPALIAVAPIAKYLATALAKWAVKQGFAKLKSEIFPGNTPATMDKVRIEVQTLLDQRLQDDRVKILEGEYKGIIDVSKVFTDYVNQSKFETGTANRLFFDTSNQLISRLPQFEIAGYEGVSISLFTQMCTFHLGLLKDGILAGSDWGFAPADKDALICQFNRFVNEYNTRLMVLYSKEFGRLLAKNLNEALNFRNMCSLYVFPFSEAWSLLRYEGTKLENTLSLWNFVGESINNISPNDWKGALYKLLMGAPNQRLNNVKFNYSYFSDTQATIHRENIHGVLPTYNGGPTITGWIGNGRFSGLSFPCSNELEITKIKQEITYNDKGGNFNSIVPAATRNEILTATVPTSADPFFKTADINWKYFSPGLYSGWNIKFDDTVTLKSRVPSIIPSNILKYDDYYIRAVSACPKGVSLAYNHDFLTLTYNKLEYDAPTTQNIIVGFSPDNTKSFYRSNSHYLSTTDDAYVIPALQFSTVSDRSFLEDTPDQATDGSIKFTDTVLGNEAKYSIRLNTGFNTATRYRLIIRFKAPARLAAGIRVRSQNSGNNKLLGGIPVEGNSGWIDYITDSFTFDDLGITTSSTNAFFSIDSDGVNASQQWYLSKLILVKESSFTTQIPLKPYVIVRCPDTFFVSNNSSSTYEQGYNNNYNQNSSSMYDQGYNNSYNPNSGCTCNQDYNNSYNQNSGCTCNQGYNNNYPK\n>2vbj_B mol:protein length:152  DNA ENDONUCLEASE I-CREI\nNTKYNKEFLLYLAGFVDADGSIIAQIEPNQSSKFKHRLKLTFQVTQKTQRRWFLDKLVDEIGVGYVRDSGSVSNYILSEIKPLHNFLTQLQPFLKLKQKQANLVLKIIEQLPSAKESPDKFLEVCTWVDQIAALNDSKTRKTTSETVRAVLD\n>6nlj_K mol:protein length:158  
Ferroxidase\nMKGDKKVIQHLNKILGNELIAINQYFLHSRMWNDWGLKRLGAHEYHESIDEMKHADKLIERILFLEGLPNLQDLGKLLIGENTQEMLQCDLNLELKATKDLREAIVHCEQVHDYVSRDLLKDILESEEEHIDYLETQLGLIQKVGLENYLQSHMHEDD\n>6zh9_FFF mol:protein length:134  Nanobody H11-H4\nQVQLVESGGGLMQAGGSLRLSCAVSGRTFSTAAMGWFRQAPGKEREFVAAIRWSGGSAYYADSVKGRFTISRDKAKNTVYLQMNSLKYEDTAVYYCAQTHYVSYLLSDYATWPYDYWGQGTQVTVSSKHHHHHH\n>6yfp_BQ mol:protein length:164  coat protein\nSYTIDINCSTGDTQANLVLTEIPAEPYVHVSGDNKSTIEYLDTGSDNSLLVRPTQQFNCVSSQYPYRNYSKIPRSQQDPLAVRREFYTRRVEYWRKADASNVDAPEYTLPQSCSIRLASTVTKETTAADIAGIVLRTLAPIFPNGSGDWIKLQQLIDGLPRIFG\n>3rap_R mol:protein length:167  PROTEIN (G protein RAP2A)\nMREYKVVVLGSGGVGKSALTVQFVTGTFIEKYDPTIEDFYRKEIEVDSSPSVLEILDTAGTEQFASMRDLYIKNGQGFILVYSLVNQQSFQDIKPMRDQIIRVKRYEKVPVILVGNKVDLESEREVSSSEGRALAEEWGCPFMETSAKSKTMVDELFAEIVRQMNYA\n>4fk2_A mol:protein length:903  DNA polymerase\nMKEFYLTVEQIGDSIFERYIDSNGRERTREVEYKPSLFAHCPESQATKYFDIYGKPCTRKLFANMRDASQWIKRMEDIGLEALGMDDFKLAYLSDTYNYEIKYDHTKIRVANFDIEVTSPDGFPEPSQAKHPIDAITHYDSIDDRFYVFDLLNSPYGNVEEWSIEIAAKLQEQGGDEVPSEIIDKIIYMPFDNEKELLMEYLNFWQQKTPVILTGWNVESFAIPYVYNRIKNIFGESTAKRLSPHRKTRVKVIENMYGSREIITLFGISVLDYIDLYKKFSFTNQPSYSLDYISEFELNVGKLKYDGPISKLRESNHQRYISYNIIAVYRVLQIDAKRQFINLSLDMGYYAKIQIQSVFSPIKTWDAIIFNSLKEQNKVIPQGRSHPVQPYPGAFVKEPIPNRYKYVMSFDLTSAYPSIIRQVNISPETIAGTFKVAPLHDYINAVAERPSDVYSCSPNGMMYYKDRDGVVPTEITKVFNQRKEHKGYMLAAQRNGEIIKEALHNPNLSVDEPLDVDYRFDFSDEIKEKIKKLSAKSLNEMLFRAQRTEVAGMTAQINRKALINGLAGALGNVWFRYYDLRNATAITTFGQMALQWIERKVNEYLNEVCGTEGEAFVLYGDTDSIYVSADKIIDKVGESKFRDTNHWVDFLDKFARERMEPAIDRGFREMCEYMNNKQHLMFMDREAIAGPPLGSKGIGGFWTGKKRYALNVWDMEGTRYAEPKLKIMGLETQKSSTPKAVQKALKECIRRMLQEGEESLQEYFKEFEKEFRQLNYISIASVSSANNIAKYDVGGFPGPKCPFHIRGILTYNRAIKGNIDAPQVVEGEKVYVLPLREGNPFGDKCIAWPSGTEITDLIKDDVLHWMDYTVLLEKTFIKPLEGFTSAAKLDYEKKASLFDMFDF\n>1yja_A mol:protein length:275  SUBTILISIN 
8397+1\nAQSVPYGVSQIKAPALHSQGYTGSNVKVAVIDSGIDSSHPDLKVAGGASFVPSETNPFQDNNSHGTHVAGTVAALDNSIGVLGVAPSASLYAVKVLGADGSGQYSWIINGIEWAIANNMDVINMSLGGPSGSAALKAAVDKAVASGVVVVAAAGNEGTSGSSSTVGYPAKYPSVIAVGAVDSSNQRASFSSVGPELDVMAPGVSICSTLPGNKYGAYSGTSMASPHVAGAAALILSKHPNWTNTQVRSSLENTTTYLGDSFYYGKGLINVQAAAQ\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/rfam_14_4_clustered_rep_seq__subsampled_1000.fasta",
    "content": ">AY587142.1/1755-1856 Arsenophonus endosymbiont of Aleurodicus dugesii 16S ribosomal RNA gene, partial sequence; tRNA-Glu gene, complete sequence; and 23S ribosomal RNA gene, partial sequence. \nCTTTAACAATCTGGAACAAGCTGAAAATTGAAACACACATTATTGAAAAATAGTGTGGGGAACTCTCAAAACTCCAAGTTGAAGTGTTATGCAAATAGGCAG\n>MTKT01000541.1/46599-46389 Punica granatum cultivar Dabenzi scaffold481, whole genome shotgun sequence. \nCTCATTACCCTAAAACCACAGGTTTCCGCAAAGTCGTAAGACCATGTATGGGGGCTGACGCTTGCCCTGTGTCGGAAGGTCAAGGAAGTTGATGACCTGATGACGAGGGAGTCGACGATCGAAGCCCCGGTGGACGAAGACTGTAACTATAACAGTCCTAAGGTAGGGAAATTTCTTGTCGGGTAAGTTCCAACCCGCACAAAAGGCGTAA\n>ABRO02008320.1/60058-60003 Dipodomys ordii contig_8320, whole genome shotgun sequence. \nGGAGATATGGCTCAAGTGGTAGAGCACCTGCCTAGAAAGCACGTGGCCTATTGCCA\n>MTKT01004810.1/4745052-4744924 Punica granatum cultivar Dabenzi scaffold70, whole genome shotgun sequence. \nTCGTTTGCAGATGCAGCTTCATCAAGATTCACATGCCGGCCTCTACGTTCGTCAGAGGTACCGTGTTTCTCGGACAGCTATAGTAGGTTCTGGTATTGGGAATCTTGATGATGCTGCATCGGCAAGAGA\n>ABRO02033548.1/61663-61950 Dipodomys ordii contig_33548, whole genome shotgun sequence. \nGTAAGGGCAATCTGGCTACAACATCTGTCACCTCATTGATCACCACGGTTGATCTGGGTATCTGGCCTGCTAGGCAGGTGTCCCCTTCCTCCCTTACCTGTGTGCCCCTCCTGAAGCTGCATGCTTGGTTGAGGACGACCATCCCAGCATCTGATCGAGGAGGACTGGTCTTTAGTCAAGGGTATATGAGTAGCTGTGTTCTGATAGAACCTCCAAACAAGCTCTCAACAGAAGGGACAGGAGGGGAAAACAGAGAGAACACTGCCCATAAAGAAATGTAATCTTTAT\n>AUSU01004475.1/2209-2114 Genlisea aurea contig_6775, whole genome shotgun sequence. \nCTTCTGCGGTGATGAAATTAATTTTCGCATGTCAGACTTCAGAGATTTTTCATTAAATCAATGAGATGAATAACTTCACTTTGACCTGAGCAGAAG\n>GL896952.1/11483861-11483692 Mustela putorius furo unplaced genomic scaffold scaffold00055, whole genome shotgun sequence. \nAGCTTTGCGCAGTGGCAGTATTGTAGCCAATGAGGTTTATCCGAGGCGTGATTATTGCTAATTGAAAACTAGTTCATCATATTGGTCACGTGAGCTTCTCTCATCCAGCCTAGGAAATGTGAGATTTTGAGTGTGAGAGAATGCTGTTACCAGTTTTGCCTGGGAGAAGA\n>KQ414408.1/749-926 Termitomyces sp. J132 unplaced genomic scaffold C248965, whole genome shotgun sequence. 
\nAACAGGCTGATCGCGGACGAGAGTACACATTGTCTCCGCGGATTGGCACCTCGATGTCGACTCATCCTATCCTCTGGGGGAAGAAGCTTGGAAGGGTTCGGCTGTTCGCCGATTAAAAGGGTACGTGAGTTGGGTTTAATACGACGTGAACTACAAAATTTTAATTAAACCCTTAAAT\n>CP000593.1/393484-393597 Ostreococcus lucimarinus CCE9901 chromosome 13, complete sequence. \nTCTTCCTTAACTCAGCTGGTAGAGTGTCAGACTGTTAGGAAAAAGTCTCCGTCGAATATGACGGCTGCTCCGATAGAGATCTGGAAGCCGCGGGATCGAAACCCGCAGGAAGAG\n>JFYO01000008.1/890-1 Microbacterium oleivorans strain RIT293 contigs6, whole genome shotgun sequence. \nGCGACTGTTTACTAAAAACACAGGTCCGTGCCAAGTCGCAAGACGATGTATACGGACTGACGCCTGCCCGGTGCTGGAAGGTTAAGAGGACCGGTTAGCCGCAAGGCGAAGCTGAGAATTTAAGCCCCAGTAAACGGCGGTGGTAACTATAACCATCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGCGTAACGACTTCCCAACTGTCTCAACCGCGAACTCGGCGAAATTGCATTACGAGTAAAGATGCTCGTTACGCGCAGCAGGACGGAAAGACCCCGTGACCTTTACTATAGCTTTGTATTGGTGTTCGGTGTGGCTTGTGTAGGATAGGTGGGAGACTTTGAAGCGGTGACGCCAGTTACCGTGGAGTCATTGTTGAAATACCACTCTGGTCACTCTGGATATCTAACTTCGAACCGTAATCCGGTTCAGGGACAGTGCATGGTGGGTAGTTTAACTGGGGCGGTTGCCTCCCAAAAAGTAACGGAGGCGCCCAAAGGTTCCCTCAACCTGGTTGGCAATCAGGTGGCGAGTGTAAGTGCACAAGGGAGCTTGACTGTGAGACTGACAGGTCGAGCAGGGACGAAAGTCGGGACTAGTGATCCGGCAGTGGCTTGTGGAAGCGCTGTCGCTCAACGGATAAAAGGTACCTCGGGGATAACAGGCTGATCTTGCCCAAGAGTCCATATCGACGGCATGGTTTGGCACCTCGATGTCGGCTCGTCGCATCCTGGGGCTGGAGTAGGTCCCAAGGGTTGGGCTGTTCGCCCATTAAAGCGGTACGCGAGCTGGGTTTAGAACGTCGTGAGACAGTTCGGTCCCTATCCGCTGCGCGCGTAGGAAATTTGAGAGGATCTGACCCTAGTAC\n>FWWT01000006.1/33934-33831 Desulfonispora thiosulfatigenes DSM 11270 genome assembly, contig: Dest_Contig00014 \nATATTTTATATCGGGAGCTTGAAAAGGCTGAGAGTATGATGTTTTCGTAGACCGATTGAACCTGTTGGGTAATGCCAGCGTAGGGAATGTGATTAAATTATTAC\n>AWHE01032144.1/18768-18530 Amborella trichopoda AMTR_V1.0_contig_32144, whole genome shotgun sequence. 
\nTAGCGAGTGGTTTGAGTTTTTCATTTATTTTTTAATTCCATGGGAAGTGGTGCATGGCCATTCATAGTTGGTGGGGTGGGGTGATTTGTTGCCTAATTCCATTAATGAATGAGACTTTCAGCCTGCTAACTAGCTTCGTGAGATATCCTCCACAACCAACTGCTTAGACAGAGCGACGAAGTATGGCTGTTTAGGTCAAGAATGTTTGAGGTGAAAACAGGTTTGTGATGCCCTTAGAT\n>CP014699.1/1893224-1893021 Streptococcus sp. TA 26, complete genome. \nAAATGTCTTCAGGGCAGGGTGCAATTCCCGACCGGCGGTGACTTTTCGTTTACTGTTCCAGCTTGATGGCCTGCAGAGTAGTTCTGCAGAGCTGATGCTTAAAAATAAGCAGCAGGAATATGAAGCGAGAAGAAGTCCGCGAGCGCAAGCTGATGCGGTGCAATTCCGCAACCGACAGTAAAGTCTGGATGGGAGAAGACGAAG\n>JRRC01354587.1/210-1 Gossypium arboreum cultivar AKA8401 contig_360664_1, whole genome shotgun sequence. \nCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTTAAGCGCGCGACCTATACCCGGCCGTCGGGGCAAGAGCTAGGCCCCGATGAGTAGGAGGGCGCGGCGGTCGCCGCAAAACCCGGGGCGCGAGCCCGGGCTGAGCGGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGGCCGAAGAGGGGAA\n>LFZV01000001.1/3925782-3925615 Bacillus sp. FJAT-27916 Scaffold1, whole genome shotgun sequence. \nTTTTCTGTATAAGCGCCAGAACTAAACCCATGTGGTGGGATTTAGTTGACGAGGTGGAGGTTATCGAAATGTTCGGCGGGAGCCTCCCAGCTTACATGTGCGGGCTGCAACTCTTTTTACCAAAACAGTTTGGCGACAAACTGGACAGAATAAAGAGAGAAGCACATA\n>JJRU01049126.1/2855-2468 Picoides pubescens contig49126, whole genome shotgun sequence. 
\nTATACTCAGTCCAAAAATTTCTTGCAATGCATTTATAGAAGCTTTCTGATGCAGGTAGTTAAAGACTTGTGGCGGTCAAGTGTTCACAGCGACGTTGCTTTTTGATCCTTCATTGTCAGTTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCTACTAATAGGGAACATGAGCTGGGATTAGACCATCATGAGACAGGTTAGTTCTACCCTACTGATGATGTGTTGTTGCAATAGTAATCCTGCTCAGTATGAGAGGTACCACAGGTTCAGATTCTTGGTACATGCGATTGGCTGAGGAATCATGGATTCATAGAATCAAAAAGGTTGGAAAAGACCTCAAAGATCACACAATCACACAGAATCACAGAATC\n>NC_009988.1/26865-27149 Bat coronavirus HKU2, complete genome \nGCATTTTTTTATTAACATTGGCAAATTTTGCAGATTTGTTTGACATACAATCCCTAGCTTTGCTTGTGGATTTAGTCTCATACACAATGGTAAGCACGTAATTATGCTAGTATGAGTAGAGTATAATTATATTGAGTCCTATAGACCAACGCAGTTAACTACATGTCCGGTGTGGCGGAGTAATCAAAGATCCGCTTGACGAGCCTATATGGAAGAGCCGTCACACCTCGTATGTATGTTGCTGCTAGTAGTTGTTAATTAGTTGATTCTTTGACAGTGATACAC\n>GG697144.2/73122-72404 Mitsuokella multacida DSM 20544 genomic scaffold Scfld3, whole genome shotgun sequence. \nTGAGTAGCGAAACGATCCGTGAGAATCGGATCCACCGAAAGCCTAAGGGATCCTGAGCAACGCTCGTCGTCTCAGGGTAAGTCGGGACCTAAGCCGAGGCATAAAGCATAGGCGATGGACAACAGGCGAAAATTCCTGTACTGCATGATGTTGTTTGAGGATGGAGTGACACAGCAAGGAGCTTGAGCGCGCGATTGGAAATGCGCGTCGAAGGCGGTAGGCTGGTACAGAGGCAAATCCCTGTACTAAGGCCGAGAACTGATAGATAGGAGCGTACTTCGGTACAATCCAAATTCAAGCGTACTACACTGTCGAGAAAAGCTTCTAACGAGACATCATGTACCCGTACCAAAACCGACACAGGTAGGCGGGGAGAGAATCCTAAGGTGCGCGGGAAAACCCTCGTTAAGGAACTCGGCAAAATGCATCCGTAACTTCGGGAGAAGGATGGCCGGAGCTGGTGAAGACCCTTGCGGTTGGAGCTGGAGCCGGCGGCAGAAGAGAAGCCCAAGCGACTGTTTACCACAAACACAGGTGCCTGCTAAAGAGAAATCTGACGGTTANNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNCCCATAGAGCTTGCCAGCCGTGCCGTTCAGAGCGATACCCTGATAGTTGGCAGCAT\n>CP000482.1/1312853-1313047 Pelobacter propionicus DSM 2379, complete genome. 
\nAATTGAATATCTGATCAAGGTGCCCGAGAGGGCTTGATAGGGAAGAGGGGTGCCGCTCTCAGTAACGAGCCATTCCCCCGCGGACCCGCCGCTGTAAGCGATGACGAAGGGCAGTATGCCACTGGTGAATAACCGGGAAGGCGCCCGGAGGATGACTCGCGAGCCAGAAGACCTGCCTTTTGATTATTGCCACAG\n>LL238006.1/6014-5950 Echinostoma caproni strain Egypt genome assembly, scaffold: ECPE_scaffold0004910 \nATTCTGTCTGTGAGGTCCCCGATCAGGTACATTGCTGATGAGACCCAGACAGGTCGAAACAGTAG\n>HF952018.1/1220924-1220795 Thermobrachium celere DSM 8682 genomic scaffold, scaffold33 \nGATGTTGTTAAAGGGGAGTAGCTGCCCATTTTGGGTTGATAAAGTCAACATGCTGGCCTTTGGCCTGGCTTTATCGGACGTTTGTCAAGTGAGACCTTTAACACAATGCTTTGCATTGTGTTAAAGGTCT\n>JH472210.1/112-1 Nannochloropsis gaditana CCMP526 unplaced genomic scaffold scaffold1650, whole genome shotgun sequence. \nGGGTTACTCCATTGCGCTACGCGCTAGTTGATAAAAGTTCGCACCTCTATCAAACTGGGTAACCCCACCTCTTGGCAAGGCCTAATTGTCAGATCAAATCGAAACTACTTCA\n>AEYP01109460.1/2187-2427 Mustela putorius furo breed Sable contig109460, whole genome shotgun sequence. \nAAAAAGACACTGTGTTCGGGGATCATTTCTACAGTTTGTTGCTAGAGAAGTTTTTCTGAACATGTAGAGTACCTCAAACCATGTGGAGGAAGAGGAGTGCTCTCTTGTGAGCCTGAAGCTGGATTTAGGTGTTCTTTCCAAACAGCCAATTATGGGTGCCTGGGTTGCTCAGTTTGTTAAACAACTGCCTTTGGCTCAGGTCATGATACTGGAGTCCTGAGATCAAGTCCCACATCAGAGT\n>ADNJ02000004.1/3715450-3715582 Metarhizium robertsii ARSEF 23 MAA_Scf_4, whole genome shotgun sequence. 
\nGACAGAGTGCCCGAGTGGTTAAGGGGAGTGACTTGAAGCGCTAGGCCTGGAGTGCGAGAAATCGTATGAAGAACCGCCTAGCAATAGATATCACTTGGTTTCGGCCTCGCAGGTTCGAATCCTGTCTCTGTCG\n>CCCW010014085.1/4006-862 Brassica napus, WGS project CCCW01000000 data, contig: 30103 \nTATTTTTAATTCTGGTCGAACCAACTCCAAAATGGTCGAGCTGAATTTTTCTCGACCAAAATTTTATCTGCTCGTGAGGGTTATTACAGTCTACGAGTCGGGTTGTTTGGGAATGCAGCCCCAATCGGGCGGTAAATTCCATCCAAGGCTAAATATGGGCGAGAGACCGATAGCGAACAAGTACCGCGAGGTAAAGATGAAAAGGACTTTGAAAAGAGAGTCAAAGAGTGCTTGAAATTGTCGGGAGGGAAGCGGAAGTGGGCTTGCGATGCATCCCGGTCGGATGCAGAATGGAGCAATCCTGTCTGCCGATCGATTCAGGGCGTGGACCGACGCGGATTAAGGTGGTGACCTAAGCCCGGCTTTTGTTACGCCGCTACCTTAATCATTGTCTGCGGCACGAGCCTCACGGCATTCCTTGGCATCTGCGTGCTCAGGGCGTCGGCCTGTGGGCTCCCCATTCGACCCCTCTTGAAACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAACGGGTGAGTAAACCCATAAGGCGCAAGGAAGCTGATTGGCTGGATCCCTCACGGGTGCACAGCCGACCGACCTTGATCTTCTGTGAAGGGTTCGAGTGTGAGCATGCCTGTCGGGACCCGAAAGATTGTGAACTATGCCTGAGTGGGGCGAAGCCAGAGGAAACTCTAGTGGAGGCCCGCAGCGATACTAACGTGCAAATCGTTCGTCTGACTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGGTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGAGCTCGGAAACGAGTTCTATCGGGTAAAGCCAATGATTAGAGGCATCGGGGACGCAACGTCCTCGACCTATTCTCAAACTTTAAATAGGTAGGACAGGTGGCTGCTTTGTTGAGCCATCCCACGGAATCGAGAGCTCCAAGTGGGCCATTTTTGGTATGCAGAACTGGCGATACGGGATGAACAAGAAGCCGGGTTACAGTGCCCAACTGCGCTAACCTAGAACCCTCAAAGGGTGTTGGTCGATTAAGATAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTAAAGCACGCGACCTATAACCGGCCGTCGGGCAAGAGCCATGCCTCGATGAGTTGGAGGACGCGGCGGTCGCTGCAAAAACTAGGGCGCGAGCCCGGGCAGAGCGGTCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGGGAACTTGGAAGGCCGAAGAGGGGAAAGGTTCCATGTGAATGGCACTTTCACATGGGTTAGTCGATCCTAAGAGTCGGGGGAAACCCATCTGATAGCGCTTATGCACGAACTTCGAAAGGGGATCCAGTTAAAATTCCTGAACCGGGACGTGGCGGTTGACGGCAACGTTAGGGAGTCCAGAGACGTCAGCGGGAATTCCGGAAAGAGTTATCATTTCTGTTTAACAGCCTGCCCACCCTGGAAACGGCTCAGGCAAAGGTAGGGTCAAGTGGCTGGAAGAGCACCGCACATCGTGTGGTGTCCGGTGCATTCCCGGCGGCCCTTGAAAACCTGGAGGACCGAGTGCCGCTCACGCCCGGTCGTACTCATAACCACATCAGGTCTCCAAGGTGAACAGCCTCTGGTCAATGGAACAATGTAGGCAAGGGAAGTCACAAAATAGATCCATAACTTTGGGAAAAGGATTGGCTCTGAGGGCTGGGATC
GGGGGTCCCAGTTCCGAACCCGTCGACTGTTGGCGGGCTACTTGAGCTGCTAACATGGCGAGAGCGGACCGCCTTGTGTCGGCCGGGGGACGGACTGGGAACGGCTCTTTCGGGAGCTTTCCCCAGGCGTCAAACAGCAAACTCAGAACCGGTACGGACAAGGAGAATCCGACTATTTAATTAAAACAAAGCACTGCGATGGTCCATGCGGATGCTAATGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCAGGAGTAACTATGACTCTCTTAAGGTAACCAAATGCCTCGTCATCTAATTAGTGACGTGCATGAATGGATTAACGAGATTCCCACTGTGCATGTCTACTATCCTGCGAAACTACAGCCAAGGGAACGGGCTTGGCAGAATCAGCGGGAAAAGAAGACCCTATTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGAATAAGTGGGAGCTCCGGCGGGGTAACAACCCCTTCTTTTAGACCCAAGACTCGCTTTGGCGTGTCGATCCAGGTGGAGGACATTATCAGGTCGGGAGTTTGGCTGGGGCGGCACATTTGTTAAAAGATAACGCAGGTTTCCTAAGATAAGCTCGACGAGAACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGCTCGTTTGATTCTGATTTTCAGTACGAATATGAACCGTGAAAGCGTGGCCTATCGAACCTTTAGACCTTTGGAATTTGAATCTAGAGGTGTCAAAAAAGTTACCACAGGGATAACTGGCTAGTGGCAGCCAAACGTTCATAGTGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAATGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTGGGTTTAGACAGTCGTGAGACAGGTTAGTTTTACCCTACTGATGCCGGCGTCGCAATAGTAATTCAACCTAGTACAAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTGCGCTGGATTATGACTGAACGCCTCTAAGTCAGAATCCGAGCTAGAAGGGACGCATGCGCCTGCCGCCCGATTACCGACCCTCAGTAAGAGCTTCGGCTCCCAAAGGAACGTGTCATTGGCTAAGTCCGTTCGGCAGAAGCGTCCTTTGGACCGCCTTGAATTATAATTACCACCGAGTGGCGGGTAGAATCCTTTGCAGACGACTTAAATACGCGACGGGGTATTGTAAGTGGCAGAGTGGCCTTGCTGCCACGATCCACTGAGATTAAGCCCTTTGTCGCTAAGATTCGA\n>CM001407.1/48474749-48475301 Lepisosteus oculatus linkage group LG4, whole genome shotgun sequence. 
\nAAACAACAACAACTTATCTCTTAATTTTTTTCAATCCCTCTCTTACTCAATGAAGTGGCAGAATGACCTCAGAGCAGGCTCATGTTACTGGCATCAGGTAGCCAGCACCTGCCAGCCACAACCTGCTCCAGGAACAGTGGTAGGTAGGAGATTTGACCGAGGAAGTACTATACCCATTAAAACATTATCGCAAGTATCCTAAAGTGAGGTCAAGGAGCACAGAAACCTCCTGTGGAGCAAAAGGCCACTATCTTAGCTTATGAAAACTCATTATGAATATAGATATTGAAAGTGGCAATCCTTTTGGCTTTTGGAAATTTAAGTAGAAAGTGTCAAAAAGTTACCACAGGTATACTGTAACTAGCTTTTGGAAGCCAAGCATTCGTAGAAGCATTACATTTTGATCCTTCAATGTCGGGTGTTTGAATTATTCTTCAACAAGACTTCACCTTCCGTTCAAACATTGGCTTGTTCAACCGCTAATAGGGGGAGTGATCTGTGCTGAGACTGTTGCAAGGCAAACAGGAGTTGAGCATGGGTCAGTTGGTATTAC\n>JQCA01000072.1/4381-4571 Lactobacillus paucivorans strain DSM 22467 NODE_100, whole genome shotgun sequence. \nTTGGTTCTAAGGTGTACGCGTTGTCTCACTACAAGTTGCCGAACAAGTAATTTATATATGGGAATGTTCTATGGTGGAGAAGATGGCAGGCCTTTTCACTTGGAAGTCAGACACTCCAACAGACATTCCCCCCTGCATTGTCATCGCGGGTCAACATGACTGGACAATTAACGGCACCACTTAGATCAACC\n>KB018237.1/393050-393252 Camelus ferus unplaced genomic scaffold scaffold2244, whole genome shotgun sequence. \nATCGCTTCTTGGCCTTTTGGCTAAGATGAAGTGTAGTATCTGTTCTTATCAGTCAGGGCACCAGCAGATTCGGTGTCTGGTGAGAGCCCACATCCCGGTTCATAGACCTTCCAGCTGTAAGCTCACTTGGCGAGAAGGACCGGGGTTTTCTCTGATCTCTTTTATAAGAGCACTCATCCCATTCATGATGGCTCTGCCCCACC\n>APMT01104059.1/10100-10194 Mesocricetus auratus contig104059, whole genome shotgun sequence. \nGATTGTATGCTGGCACTCCCCCGATCCATTGGAATGATACAGAGAAGATTAGCATGGCCCCTGCACCTACATATTGTAGGGTACCACCTATGTTT\n>URS0001A24371_12908/1-89 unclassified sequences L2-Alphaproteobacteria ribosomal protein leader \nGGGGACCUUCGGGGCCCUAUACCAACGGUGGGCUUCACCCACCCUACAUAAGACGGGGAGACCCGUCUAAGCUAAACGGAAGACAGAAA\n>LN907827.1/31808-32053 Erwinia sp. 
EM595 isolate E_g_EM595 genome assembly, chromosome: 1 \nTATTCACAGCGTCAGGTAGACGAGCTTCCTCAGGAAGCGCTCAGGGATAGCCCGGAAGGCAGCAGAGCAGGGAAAAAGGATGGGGTCTGAAGGAGAGACCGTCAGGGATAAGGAAGCGCTCGGGATGAGTGGACAGCAGACGGGATAAACCGGGATGTTGATTGCATAAAGGGATGTAAAGGATGACTGTCCTTCTACGGAAGGTACGAAAAAAGGCGACAGATTGCTCTGTCGCCTTTTTTCTTT\n>FR872580.1/1712617-1713059 Parachlamydia acanthamoebae UV-7, complete genome \nGGGGGTGTCACGGTTTCGACTGAGAAGTCAAGTATTGATTGCATGCGGAGGATGTCGGTTGGCCTCCTAAAAAAGCCGATAAAACAATAAATGCTAACACAAATAGCAAACTAATTAGTGGTGTTGATTTTGCCGCTGCTGTAGAAGCTGATTCAGTTTCTTACGCTGCTGCTGCTTAACCTGACTAATTGGTCGCTGTATAAAGCCTAACAGCTTTATCAGCACAGCAGTCTGAGACTGGACCAAGGGTCGAGGAGTCTGCTGTCATTGACTTGGTACGGAATAAAGTCCGCCGCTTCTAGGGTTTTATTCTAAGATAAATGAAGCAAGTTAATCATAGTGTGGTGGCTGCAATGTGATTGACTTATTTTCAGCACACTAAGCATGTAGATATTAATATGTAGATTTGCCCAGGACGAGAGTTCAATTCTCTCCACCTCCAA\n>JH835313.1/5567540-5567270 Erinaceus europaeus unplaced genomic scaffold scaffold00025, whole genome shotgun sequence \nGGATATGAGGGTGATCTGGCTGCGACATCTGTCATCCATTGATTCAGCTGATCTGGTTGGCTAGGCGAGTGTTCTCTTCCTCCCTCATTGCTCCATGTGAGTCCCTGCCGATGGCCTTTCCCAAATAGAGAAGGGCGGGCGAGTCTTCAGTTGAGGGTATAGGAATAGCTGCGCTCCCCTGCTAGGACCTCCAAGCAAGCTCTCAAGAGTCATCTTCAACCTTAAGGTCAGCTAGACTTTTTATGTTCTCCTTGTAGATCACCATTTTACA\n>CM007648.1/27503544-27503238 Zea mays cultivar B73 chromosome 2, whole genome shotgun sequence. 
\nCATTGGTGAGAATCCAATGCCCCGAAAACCCAAGGTTTCCTCCGCAAGGTTCGTCCACGGAGGGTGAGTCAGGGCCTAAGATCAGGCCGAAAGGCGTAGTCGATGGACAACAGGTCAATATTCCTGTACTACCCCTTGTTGGTACGGAGGGACAGAGGAGGCTAGGTTAGCCGAAAGATGGGGCTAGTTTGATAACTCCATTTTCTCAAGAAAAATGAACTAATTGTTCCTGGGGAAAATGAAAATCCTTTACATCACGTTTGGATCATTGGAATCGAATTTCATTCTAATAATAGTAATTTAGGCG\n>CCCW010011448.1/3522-244 Brassica napus, WGS project CCCW01000000 data, contig: 32740 \nCATGGTCGGATTTTGATGTTCTAGTGTGTTTTGTTGGAAACTGTTTATGAGAATCTCTTATTTGGGAGTTATCAGAGATTATCATGAATTTTAATTAGTTTTTGGGAATTTATTTGAGTATGTTGGTTTGGACAGGTTATAGATTCTAAGTAGCCGAACCATGCTTATCTAGACTTGATGTTAGGATATCGGCCTTATGAATGTGCATTGTGTCTTGTGTGGTTTCAGGATCGGACATGGACCGTGGTAAGGGAAAGGCACCGTGAAGACTCAGGCCATGAGAAGATGTGTGGTGAATGGGTCATTGTAGATAGATGTGACATACTGATAGCCTATTGTGCAACTTGTGAACTTATGTTTGACTAAGTGTGTATAACTTATTAGGACGAACCTAAGAATGATGTATGAATCTCAGTTTATATTTATACAATTGATTTGCCCCTTATGTTTCCTTGTTTAGATTTTTTGTATTGAACCTCAGTTGAATTGAATTGAATTTACAAAGATAAGAATTAAAACTTGGTTCACTCGGACTTAGATTGAAAGGATAAGGCCGCAGATCAGTTTGAGCAGCCACAAATTTCCTGTGTGTGCTGACGGACACACACGGACGTCCTGTGTTTGCTGACGGACACCCACGGACGTCCTGTGTGTACTGAACAAACAGCCCACGGGACATCACATACAACCCTTGGTAACTAGTGACCTTTGGCCACTCGTGCCTCTTGGGACATGACCAACCGTTTAGCCCAACAGCCCAGTCTATGGTGCAATTCGAACCGACCATCTAACCGACCAGCATCTAGGTTAGCGGTTTGGTTATGACCGGCCAAGTCTAGGGACGTGTTCCTTGGACTGAACCAACACAACCCTTCGTTTATAATCAGAAAGAAGAGAAAGGGCCGGATAGAAACAAGAAGAGGAGAAGCGGTTAGGTCTAATGGACCGACCAGAGCCGCGGTGCGATCACAAGGACCGTCCGTTCGGTCTGATGGAGCCATAGGCCACCACGTACGTTCTGAACCGTGTCAGGTTTCTCCATGCTCTTCTCCTGCTCTCGGTCTCCCATACTTGATCAGAGGTTGCTTCACAAACGATCAGATCGCCGGAAACCTAACCACCACACAATCGGCCTTGCTTTGGCCGGAAACTCTCTCTTTCTTTCTTTCTCTCTCTCTATGATTTTTCTGAGTATTTTACTCTGGAATTGGATGATTGAAATTGACATAGAGGACCCCATATTTAGAGAAAATTAGGGGGTAAGTCTTGCCCAAAGAACAGGCATGACTGGCAAACGGATGGGCACAATCGGCCAAGGGTTACACCCTCTCGGCCGCATACGTCCCTTCGCCAATACCACATGGGATTGGGTCGGATAGAGGGCCACGGCCTTGTCCCAAGCCCCAACGGTCCATGGCCTCATGGCCGGACCCCCATGTCCCGCCACCAGCCCGGACCCGGGCCATCGGACCGAAACCCGAACAGTCCGTCCAGCTGAGTTTAGCTGACTCCCAGCTGTCTCAGCTGAGTGGGCTAGTAGTTCAGCTAGTGGAGCTGACTTAGTAGTGGCCGAGCTGGAGTGAGCTTAACCTAACTCCGT
TGAGCTGGTCGAGCTACTTGTTCCATCCGTCCAGCTACCGTCTTACTCGTCCTAGCTGACTCTCGACTTGTATAAGATTAAGTCTAAGTTTCCTTACGTCCTTAACCTTCTTATCTGGCCATGGAACACTTGTCTTGATGTCCTAAGACTAACTAGTACGTTTCCTCGAAACATGGCCGTCCCAATGATCCTATTCAGGATCCGGGATGTTACAACGTCGGCGGGAATTTCGGAAAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCCTGGAAACGGCTCAGCCGGAGGTAGGGTCCAGCGGCTGGAAGAGCACCGCACGTCGCCTGGTGTCCGGTGCATTCCCAGCGGCCCCTGAAAATCTGGAGGACCGACTGCTGCTCACGCCCGTTCGTACTCATAACCACATCAGGTCTCCAAGGTGAACAGCCTCTGGTCGATGGAACAATGTAGGCAAGGGAAGTCGGCAAAATGGATCCGTAACTTTGGGAAAAGGATTGGCTCTGAGGGCTGGGCTCGGGGGTCCCAGTTCCGAACCCGTCGACTGTTAGTGGGCTGCTTGAGCTGCTAACTTGGCGAGAGCGGACCGCCTCGTGTCGGCCGGGTGATGGACTGGGAACGGCTCTTTTGGGATCTTTCCCCGGGCGACGAACAGCCAACTCATATTTGGTACGGATAAGGGGAATCCGTCTGTTTTATTAAAACAAAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGATGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTGTCTACTATCCAGCGAAACCACAGCCAAGGGAACGGGCTTGGAAAAATCAGCGGGGAAAGAAGACCACTAATTTTAACGTTATTTTACTTACTCCGTGAATCGGAGGCGGGGTAACAACCCCTCCTTTTAGACCCAAGACTCGCTTCGGCGGGTCGATCCGGGCGGAGGACATTGTCAGGTGGGGAGTTTTTCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCTTAAGATAAGCTCAACGAGAACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGCTCGTTTGATTCTGATTTTCAGTACGAATACGAACCGTGAAAGCGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTTGATGTCGGCTCTTCCTATCATTATGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTTGGTTTAGACCATCGTGAGACAGGTTAGTTTTACCCTACTGATGCCCGCGTCGCAATAGTAATTCAACCTAGTACGAGAGGAACTGTTGATTCGCACAATTCGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTGCGCTGGATTATGACTGAACGCCTCTAAGTCAGAATCAGGGCTAAAAGCAACGCATGCGCCCGCCGCCCGATTGCCGACCCTCAGTAGGAGCTTCGGCTCCCAAAGGCACGTGTCGTTGGCTAAGTCCGTTCGGCGAAAGCGCTGTTCGGACAGCCTTGAATTATAATTACCACCGAGCGGCGGGTAGAATCCTTTGCAGATGACTTAAATACGCGACAGGGTATTGTAAGTGGCAGAGTGGCCTTGCTGTCACGATCCACTGAGATTCAGCCCTTTGTCACTAAGATTCGA\n>MJHW01000006.1/498708-498411 Roseburia sp. 831b contig000006, whole genome shotgun sequence. 
\nGTAAACACGAGGAAAAAGAGAGTACATCCCTTAGAACTTTACAGAGAAGTTTTTGAATGAGATGCATCCGCATACATTCGCTGAGAGAAAACGGGCAAAGAGAGATGGAAGATGGCTTTGGAGTGGCAGAGCTGAACGAAAAGCACTACATTTACAAACGTAGTTGAATTTCGATAAGTTTTGACAGGACCGCCTGTTATAGCGGTAGAACGTAACAACAAATGTTGCGTCAATGAGGCTTTCTCTGCAAAGAGAAGGTAAAGAGAAGTGGTACCACGGGTAGCAGCTCGTCTTCTGG\n>JH835659.1/1480072-1479972 Erinaceus europaeus unplaced genomic scaffold scaffold00371, whole genome shotgun sequence \nAAAAAGCATTATCCAGCTTCCTTCCTACTCTGTCTCCAATATCTTTTTTGAACAAAAAAGATATTGGAGACAGAGTAGGAAGGAAGCTGGATAATGCCCAT\n>MHBM01000110.1/8313-8490 Lentisphaerae bacterium RIFOXYA12_FULL_48_11 rifixya3_full_scaffold_2456, whole genome shotgun sequence. \nAATACCCTGCCTTGTTCGCAAACAGGCTGACGTCTCTGGCCCATTAATTGTAAGTTAGGGAGTTTGAATACGGCGGCAACTGAACGCCCTTTACTGGGACTCAGGAACCGACGGATAAAGCACCCACCTCGATTTCGAGGATCAGAGATAAATGCCTCTACGACAAAGTGGGGTATTT\n>CM000379.2/41198104-41197644 Equus caballus chromosome 3, whole genome shotgun sequence. \nAACAAAAATGTCACGTTTAGTTACTTAATTTGACTCAACACAGGAGACCTCGCTTGGCCTGGCATGGACAAGACTGACAGGTTGATAGCTCTTTCTCTGTTCCATAGGTGGTAGAGTGTGGCCATTCTTAGTTGGTAGAGCCATTTGTCGGGCTAGTTCTGATAACAAACAAGACTCAGGCATGCTAACTAGTTATGGAACCTCCAAGCAGTGGTATCCTCCAACTTCTCAGAGGGACAAGTGCTGTTCAGCCACCCAAGGTTTAAGCAAATAACAGGTCTGGGCTGCCCTTAGATGTCCCGGTTTGCAGGCACTACACTAACTGGCTGAGTGTGGCCTATCCTGAGAATGCAGCTTCAGGTAACCCTTTGAACCCCATTCATGATGGGAATCTGGGATTACAATTATTCCCAAAGAACACAGAATTTCCATTAAGGGCCATAAGCTTGTGTTGATTGGTT\n>CM000028.3/22112491-22112645 Canis lupus familiaris chromosome 28, whole genome shotgun sequence. \nAGCTTTGTGCAGTGGCAGTATCGTAGCCAATGAGGTTTATCCGAGGCGCGATTATTGCTAATTGAAAAGTGAGTGCTGGCCAGGAGAACAGGTGCATGCAGATGCTCAGCAAACTTTCATTGAGCACCTATTGTGCATCACCTTCTGTTTTAGGT\n>JH594435.1/493167-492948 Eubacterium infirmum F0142 genomic scaffold supercont1.1, whole genome shotgun sequence. 
\nGAATAATAATATCATATTAATCCAGAGGAACGCATATTAGAGAGAACAGGCGCGGAACCCTGTATCGAGTGCCCTTCTTTGCAGATTCATATCAGCAGAGAAACTGTATTGTGGAGTTTTACTTATATGCCATTGGAACGAGGGACAAATTCTTCTTCCGAGAAGGCAAGTAAGACGGTGAAGCATAGCCAGGAGACTTATTAATGAGATATACACCTGA\n>LL810796.1/383-1371 Gongylonema pulchrum genome assembly, scaffold: GPUH_scaffold0038229 \nCTGTCGCATTTACGATGAAGTTATTGCACGGTAATAAAGAAATTACGCAGCAAATTACCGTAATTACAGTTAAGTGTCATAAAACCAATATAATGAACTATCCCAGTTACTATAATGATTTGCGTGTAATTTGAATTACTGTAATATTTGGTACCGTAGCATATGTTATTACTGGAATATATTACTGTAACGTAGGGCTACTGTAGTATGTATTAGTTTTTGGCATTCGATTACCGTTTGCCTCAGATCGCAGCCTAGAGTGGGTGGTAAACCTCATCTAAGGCTAAATACGGCCACGAGACAGATAGCAAACAAGTACCGTGAGGGAAAGAACTTTGAAGAAAGAGTTCAAAAAGGCGTGAAACTTTTTTTGCAGTAATGATAGTTTTCAGCAATTTTTCTTAGTTATAATTGAAAAAACAATTGAAATTTCGGCGTTCTCTTCAGGAGTAACTTAGCATTACTACATGTCTGCGATTTGTTACGATGCTCATCCACGACGGTACAGTGGTCTGATCACATCCCACTACTCCTACATATTGCTGTCCTGGGGCTGGATTCATTGCNNNNNNNNNNNNNNNNNNNNTTAGCGTTACTACATGTCTGCGATTTGTTACGATGCTCATCCACGGCGGTACAGTGGTCTGATCACATCCCACTACTCCTACATATTGCTGTCCTGGGGCTGGATTCATTGCGACCCACGATTTGCCGGCACGCTCGGCAGCTTCTCATCAATATTGTTCTTCTTCAAGCCGGTGAAGCAGTAGCCGCCTCACAGCTTTCCAATATTTTATTGAGCAATCAGGTTTGTCTTCGAGTTTTTTATGTTCGAGGTTTTTTCTAAGATCAGATTTTTGAGGTTTTTTTTTTTTTAAAAAACAGTACCTGCGATTTCTAATTTGCGCTTCCCGCGATCCTGGTTTTTTTTTCCAGTTAAAAAGTACCTTTTCACCCATTTCGGCCCTTTTTGGACCGGCCGTTTTTGG\n>ALYE01010731.1/119708-119256 Gossypium raimondii Chr08_contig_1147, whole genome shotgun sequence. \nGTCCTTATACACTGGCAACAATGTCAATGCCAATCGAGTTAATACTCAATCAGCAAAATAGCACAAAATTTCATTAATTTATTTTATGAATAGTTTAGGAACGTGGATACAAGTGGTGCATGGCTATCGTCAGCTCGTGCTGGAAGGTGTTCGGTTAAGTCCCGCAATGAGTGCAACCTTCGTGTTTAGTTGCCACCGTTGAGTTTGGAACCCTGAGTAGATTGCCGATGATAAATTGGAGGAAGGTGAGGATCAAGTCAAGTCATCATACCCCTTATGCCCTGGGTGATACACTTGCTACAATGGACAAGTCAAAGGGTCACGACCCTGCAAGAGTGGGCTAACTCCAAAAACTTACCCTCAATTCGGATTGCAAGCTACAACTCGCCTACATGAAGCTGAAATTGTTAATAATCGCCGATCAACCATACGACGGTGAATTCGTTCCTGGGC\n>JOOK01005830.1/289-4 Oesophagostomum dentatum strain OD-Hann O_dentatum-1.0_Cont11200.2, whole genome shotgun sequence. 
\nAAAGCGGATACAGGCGCAAAAGAATAATAGAATAATAGATACATAGCAGGAGATAACTGCGGCAATTCCGGAGCTAATATATGTGAATAAACCCTGATTTTCGAAAGGGTGCAATTATGAGAGCAAAACAATCATCTTCGGATGTAGTTTGCTGACTCTAAATAACGCTGCATATCGTCGGCTTGTCCAACGATATTCCGAAAAAGTGTCTGCCCTATCAATCTGATGGTAGTCTACCAGTCTACTATAGTTATTACGGGTAACCGAGAATAAGGGCTCGGTTCCA\n>KB016774.1/3281454-3281537 Camelus ferus unplaced genomic scaffold scaffold490, whole genome shotgun sequence. \nTGGAGTGGGGGGGCAGGAGGGGCTCAGGGAGAAAGTGTGTGCAGCCCCTGGCCCTCTCTGCCCTTCCGTCCCCCGTTCCTAGAC\n>CP013118.1/3064815-3064903 Salinivirga cyanobacteriivorans strain L21-Spi-D4 chromosome, complete genome. \nTGAGAACCGTAGCGAAGCGGAGCTCATGACCGTAGAGAATAACTCAGCCGAAGCCATAGTATCCCGATACTTCTAATTAGGAGAAGGGC\n>FXAH01000012.1/80855-80720 Paraburkholderia caryophylli strain Ballard 720 genome assembly, contig: Ga0139045_112 \nATGAGTTCCCGTTTATTCCGTTTCCGCTGCAGTTGCGCCTTTCGACCGAACACGCCTTTCTTTCGTTCGCCGGGCGCAGCGCTTCGCTCGAAGCCGAGCCGCCAGCTCCGATGCACGAGGAGCGGCGGCTTTTTTA\n>LZPO01018772.1/1933-2618 Neotoma lepida isolate 417 scaffold_18136, whole genome shotgun sequence. 
\nCTATGACCCTGAGATTAAGAGTCTCATGCTCTACAGACTGAACTAGCCAAGACTGTGGCAGCCAAACATTCATAGTGACATAACTTTTTGATCCTTAAATGTTGGCTCTTCTTATGATTGTGAGGCTGAATTTACCAGGCAGTGGATTGTTCATCCACTAATAAGAATGTGAGCTGAGTTTAGATTGTCATGAGACAGATTAGTTTTTCCCTACTGATGATGATGTATTGTTGCCATCATAATACTGCTCAGTACAAGAGGAACCACAGGCTCAGACATTTGGTGTATGTGCTTGGCTGAGGAGCCAATAGTGTGAAGCTACCATCTGTGGGATTATGACTGAATGCCTGTAAGTCAGAATTCTGGCAGAACAATATGGCAGTGCCAAAGGAGCCTCGGTTGGCCCCAGATAGCCAGATCCCCTTCCAGCTCCATTGGCAGTCTGTCCTGTTCTCGCACATGGCGGGTCCCCACAGTGTGTTGGGACCAGAGTCTGGTATGGACAGCCATTCATACAGAGAAACAGGGTATGGCTGAAAAGGGTGCTGCCCTCTCACCCATCACATTGAACACACATTTGTGTGGAACCTGGTGCTAAACCATCCATAGATGACCTATTTCAATGGTTATAAGTTGTAATAGGGTTGTTGGTGGAACAATGAAGTCTAGACTCAGGATCCTCTTTT\n>HF986408.1/139458-139379 Blautia hydrogenotrophica CAG:147 genomic scaffold, scf339 \nACAGGTATGAGCACGCAGGCATATGCGCCGGAGTGCGAATGCCTGTCGGGATTGCGGGAGTGCGATGCACGGGGCAATCC\n>LBYD01000004.1/63542-63156 Parcubacteria (Moranbacteria) bacterium GW2011_GWC2_40_12 UT79_C0004, whole genome shotgun sequence. \nGGGGATGCTAGGCATCGACAATTTGTTCTCTCAAAATACGCAAGCCGAGCATGACATTAGACTCGTAAAACCTTGTGTCAACGATCATAAGTGCAAACTTATTTTCAAAGGTTAAGCAAGCTTTTCAGCCTGCTTACGCCGTTGTTCCTGCCTAATTCGCGGGGACCATCAGCCTGCTGATGCCTAATAAGCAACCGCTGGTGTCATACATTGGGCTTGATTGATAGTTTTTCTCTGCGGCTATCTCTGACCATTGAGCAAAGAGGACTTTTCAAGGTTTTGTTTACTTTATACTTGAAAAGTTTCTCAAAACAAGTAAACTAAGCTTGTAGAATATTTTGGAAGATATAAATTTGGACATGGGTTCGAGTCCCATCATCTCCACCA\n>CP013023.1/5009948-5010143 Paenibacillus bovis strain BD3526, complete genome. \nCGATGAGGTAGAGGTCGCAGCATGAATCAGTACAACCGGAGCAGGCGTAGAGCCGCCGCGAATCCCGGTTGAAAAGGTCCTGCTGCCGAAGTGCAGATTCCGCTCTGGGAATCCTGTGCTGGGGCTGTACCCGAAAGGGACAGAACTGTCACAATGAAAAAATCCAAGCATTTCATTGTGTTGAGCTATCTTAAAG\n>AFEY01018855.1/2775-2892 Sarcophilus harrisii ctg7180001412063, whole genome shotgun sequence. \nGGATGTGAGGGCTATCTGGCTGCGATATCTGTCACCCCATTGATCGCCAGGATTGATTCGGCTGATCTGGCTGGCTAGGCGGGTGTCCCCTTCCTCCCTCACCGCTCCATGTGCGTCC\n>CM000246.2/64301032-64300896 Rattus norvegicus chromosome 16, whole genome shotgun sequence. 
\nTATACAAGCAGCTACTCTCTCCCTCTGGAAAGTCCAGTCAAGATTTCAGGGCCATTGCAGGAGAGTGTAGGGCAGTCAGGCGTCTAGAACTGTAGGTCCATCCAAAGGAGGTGCTTCATGGTGGTCAGCCCTTGTTT\n>LPNL01000017.1/7001-6356 Hanseniaspora opuntiae strain AWRI3578 Hanseniaspora_opuntiae_AWRI3578_scaffold228, whole genome shotgun sequence. \nTGCCAGAAGATTCGGTTAGACGATAAAAGCAAAGTTTAATTCAGAGTTTAAAACAGCTGTAGGCAATAAATTATACTTGAATGAATATTAAATAAGAGGTAAAATTCTAAGACTTTAATTAGCATTCCAAATAGTATAATGCTGAGAGCTAAAGCCATTACTTAAGGACTAGGATTAGAGACCCTACTACTGATGGTACTATCTATGATAATTATAGTAAACGAAAGTCAAGAATTATCTACTCGAAGATTAAGCCTTAACGGGTGAAAATCAAAGTTGAAGAGCGTTATATCATCAATTGAGTGGATCGTGCTGTTTAATTTGACAACCCCCAATAAACCTTACCTAATCTTGTATAATACAGGTGTTACATTATCGTCTTTAGGCATTATTGTGAAATTATTGCTGCAGGAGCTATTACTTATGGCCCCGTGACTGATCTACATGACTCTAACGATTAGGGCTACAGGCGCGATATCAAGAATTGAATTATGAAACTCTAATTCATGAATAAATAATCAGAAGTAATATGGTGTTAGAATTACCATATGAATATCAAAGATATAAGCTACTAATTGCCCATCAATCTCCTAGTGAGATAAGTTGACACAAAGTTACGCTAGATGAATTTGGCGTGGGAAATTAA\n>LMAW01002579.1/3015099-3014999 Amazona aestiva scaffold_41, whole genome shotgun sequence. \nTGCTATGATGATGTAATTTGCATCTTATCCAGTGCTCAGCGACAGTTGCCTGCTGTCAGCATGCTGGCACTGCTGAGCTGAAGACCCCTTCGTTCTGAGCA\n>GL010075.1/7513268-7513324 Loxodonta africana unplaced genomic scaffold scaffold_48, whole genome shotgun sequence. \nGATTCAGGGGTAGAATTCTCACCTTCCAAGTGAGAGAGGTTTGGGTTCAATTCCCAG\n>APLE01005677.1/5643-4894 Erythranthe guttata cultivar DUN x IM62 scaffold_74_contig_8, whole genome shotgun sequence. 
\nCAACGGTTGACCAAGCCGCCTTGAAGAACAGTGCTGTGTAGCCGTCTGGCCCCGGTGCTTTAGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACGGAAGGGCGAGAGGTACTCCATGCATATAACGAAAAGATAAGGGGATAGCAATTATTTGGGGGTCGACCGGTTTGCACGTTGACTGAGAGCTCAGAAAATTCCGGTAAAAGGACTCGAATTCTTCAAGTACCTCATCCCTTGAGGTAGTAACCGATTCCGTTAACGAACGAGACCTCAGCCTGCTAACTAGCTATGCGGAGGTATCCCTTCGTGGCCAGCTTCTTAGAGGGACTACGGCCTTTTAGGCCGCGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGATGTATTCAACGAGTTTATAGCCTTGGCCGACAGGTCCGGGTAATCTTTGAAATTTCATCGTGATGGGGATAGATCATTGCAATTGTTGGTCTTCAACGAGGAATTCCTAGTAAGCGCGAGTCATCAGCTCGCGTTGACTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTCCTACCGATTGAATGGTCCGGTGAAGTGTTTGGATCGAGGCGACGTGGGCGGTTCGCTGCCCGCGACGTCGCGAGAAGTCCACTGAACCTTATCATTTAGAGGAAGGAGAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTG\n>APMT01208959.1/14589-14458 Mesocricetus auratus contig208959, whole genome shotgun sequence. \nTCAAACCAAAATAAGGTCATAAGGTGTTCTTCCTAGGGACCTAATATGCTGTGGCTATAAACATCAGCAACCCTGGGGGTGTATTCAACCTCTTGCTTAAATGGGTTTCCCTAAGCAAACTTGAAGACAATT\n>ALWT01321998.1/3958-4053 Myotis davidii contig321998, whole genome shotgun sequence. \nTGAAGGTGATGCTGCTATAACATCTATCACCCCATTGATCACCAGGGTTGATTCTGCTGACCTGGCTGGCTAGGTGTGTGTCCCTCTCCTCCCTTA\n>AZNC01047644.1/7457-7628 Glycine soja cultivar W05 scaffold3943_7, whole genome shotgun sequence. \nTTGCACTATGTAGTATCGTAGGTCTCTCTGATTATGTGGAGCGGCCTTTGAGCAATGGTGCATAAAGTGAGAGCTGATTAGTCAGCAGGCAGCCAGACAACTGCCGAGGTGGATCCACAGATGAACGGCTCATTTGTTAATGCTGTTTGTCTACTAATTCCACCTTACATTT\n>AWGT02000388.1/78840-78931 Colinus virginianus strain Texas jcf7180006226242, whole genome shotgun sequence. \nAAGCACAGCGATCACGACTGAACGCATCAATCTTTCGCCTTTTACTAAAGACTGCAGTGTCGTTTCAGCAAATAATGCGCCTCATACATCAA\n>CP002637.1/13277-13481 Selenomonas sputigena ATCC 35185, complete genome. 
\nCTATGCTACAATCAAAGAACGCAATGGGCGTTTTCTATGTTGCTCTTTTGAGAAGCCTTTTCCAGTTCGGAGCGCGGCGCCTTGGTCTTGCGCAATGGAGTCTCGTGAACCCCGTCAGGTCCGGAAGGAAGCAGCGGTAAGCGAACCGCTTCATGTGCCGCGAGGGCGCCTGGGGGTCGCGCCCCGAAGTGGAAAAGGAGTATTT\n>CM000232.2/104162388-104162527 Rattus norvegicus chromosome 2, whole genome shotgun sequence. \nACATGGTTCAAACTTATAAATAAAGACTTATCTCATCCTGTGGGCCTCTCATAGTGTCCCGTGCTAGAGCAAACTGGCTCCTAACCATTGCCCAGCCTCGGTGCATGTAGGCTGCTGGCACTGAAGTGGGTCACACAGTG\n>HE612865.1/664054-663926 Tetrapisispora phaffii CBS 4417 chromosome 10, complete genome \nTATTGTGATGACAAGTTGTCGCCCCAGGCGGATCTATTCAGTGTATATTATTTCTATTTAAGTATAAAATAATGTGCAGTCGGAAATGACAGAAATATAACAACAAGCCAAACACTGAAAATTCTGATA\n>MEPB01000070.1/175699-175987 Bacteroidetes bacterium RIFCSPLOWO2_12_FULL_35_15 rifcsplowo2_12_scaffold_36, whole genome shotgun sequence. \nTACATTTGTCAACTTTTTGGTTCCTGAGTTTGATAAAATATCAAACCGGATTAAATGGGAATCAGGTGAAAATCCTGGACATTTCCCGATGCTGTAAGTTCTTATTAGTTTAAAGTTTATTTTTTAATTTTCTGGTTGTTAGACCTGAAAAACAAAAAACAAAACAAAATTCTAATATTTTTTTTAACATTCTTAGCCACTGTCTTGAATCGAATAAAGATTCTTTAAAGATGGGAAGGCGTTAAAAACAGAACAAGTCAGAAGACCTGCCAAAGAAATTAACATTTGT\n>AAGB01000009.1/14123-14306 Wolbachia endosymbiont of Drosophila ananassae gdan_434, whole genome shotgun sequence. \nACTGATTCCTTTATGATGGTGTCATCCCAGTGCCCAGACACTGGGATCCAGGAAACTTAATTGCAAGTAATGCATTGGATTTGGTGAGTATGGGTTTTGCGTTATAGAATGAAGCACTTTTGGTGAATTTATAAAGAAAGCTGGATCCCAGTGTCAAGCACTGGGATGACAAGGTATAAACCTT\n>NATD01000006.1/25331-26764 Candidatus Parcubacteria bacterium 4484_255 ex4484_255_scaffold_717, whole genome shotgun sequence. 
\nTAGAGAATTAATTAGAGCATATGGTGGATGCCTAGACACCAAAAGCCGATGAAGGACGTAGCAGCCTGCGATAAGCCTCGGGGAGGCGGCAAGCAACCTTTGATCCGAGGATTTCCGAATGGGGAAACCTAGCGTTACAAAACAGCGCTGCACACCGTTTCACAGTGAATTCAAAAATCAAAAATCAAAGTGCAAAAATAATAAGAAAATTTACAAGAAACAAGATGCAATAACCAAACAATAGTCAATAAATCAATGACCGAATAATCAAACGGTTTGATTATTGAATATTGGAATTTGGAATTTGTTTGTATTTTGTATCTTGGTTATTGGTTGTTTCAAATAATTTTGATTTTTACATTTTACATTTTGAATTTACCGCGAAGCGGTGTGGGGGTACCCGGGGAAGTGAAACATCTCAGTACCCGGAGGAAAAGAGAGAAACCACCGCGCCTCACTATCGTTCGGCACGAATGTCTAATATCTAATGTCTAATTTCTAATAAATGTTTAATGTCAAAATGTCCAATGTCTAATTATTTTAGTCACTTGGTTATTAAGTCATTGGGATTTTATTAGTCATTAGGAATTAGGATTTAGAAATTCCTGTGACGAGCGGTAGCGAGGCACGGTGATATTTCCTTAGTAGTGGCGAGCGAAAGGGAAACAGTCTAAACTCTATAGAATCTTAGTTTTATAAGAGTCTTATCTTCGGATATTTCTTTTATTTAATGAAAGGTAGTAAAGCCAAAATATTCTATAAAGTGTTGTGGGGTAACTAATGTTTTGTTTTTTACTGAACAGAGTTAGGATTTAAATTTTTAGTCCAATAGCATGGAATTGCTAACCATAGAGGGTGAAAGTCCTGTAGATTAAAAAAATTTAAATTTTAATAATTAGTTATGCCCGAGTAATGCCAAACTCGTGAAATTTGGTATGAATCAAGGCGGACTATCGCCTAAGACTAAATACTTTTGGTGATCGATAGTGAACTAGTACCGTGAGGGAAAGGTGAAAAGTAGCCCGGTTAGGGCAATGAAAAGTACCTGAAACCATATGCTAACAAAGAGTCAGAGCCTTGTGCTTCGCACAAGGAAATTCAAAGCACGAAGCACGAAATCCCAAACAATATCAAAATCCTAATGTTTTAAATTCAAAACAAATTCGAGAAATTTCTGTTTTGGTCATTTGGATTTAGAATTTAAGATTTGTTTAGGGTTTCGTATTTAGAATTTTGGATTTTCTCGCGCGGAGCGCGAGGTAGGGTGAGTCTGTCTTAATTGACAGAGGAGGCCCGAACCCGTTGACCGTACAACATCATGGGATGAGCCGTGGATAGGGGTAAAAAGCCAATCGAACTCAGTGATAGCTGGTTCTCCCCGAAATAGCTTTAGGGCTAGCCCGTTCTTTACTCTCTGGGGGTAGAGCTACTGGA\n>CM000129.1/18755739-18758932 Oryza sativa (indica cultivar-group) chromosome 4, whole genome shotgun sequence. 
\nAAAGAAATCGTTAAGGGCGTATGGCGGATGCCTAGGCTTTCAGAGGCGACGAAGGACGTGGTAAGCTGCGAAAAGCTGCGGGGATTGGCACACACGAATTGATCCGCAGATATCCGAATGGGGCAACCCGGCATATTGAAGATATGTCACCTCGCAAGAGGAGCAAACCCGGAGAACTGAAACATCTAAGTACCCGGAGGAAAAGAAATCGAAGAGATTCCGTAAGTAGTGGCGAGCGAAAGCGGATTAGCCCAAAAGTCTTTTTATGTTTAGAGGAATGTTCTGGAAAGAACAATCATAGAAGGTGATAATCCTGTACTCGAAAGGCATATAGAGATGATAAATGAGTAGGGCGGGACACGTGAAATCCTGTCTGAATATGGGGGGACCATCCTCCAAGGCTAAATACTCCTGAAAGACCGATAGTGAACAAGTACTGTGAAGGAAAGGTGAAAAGCACTTCGAATAGAAGGGTGAAATAGAACCTGAAACCGTACGCCTACAAGCGGTCGGAGCAGCGTAATGCTGTGACGGCGTGCCTTTTGCATAATGAGCCTACGAGTTAATTTTACTAGCGAGGTTAAGGTATTAAGTACCGGAGCCGGAGCGAAAGCGAGTCTGAATAGGGCGCATAGTTAGTAGGATTAGACGCGAAACCTTGTGATCTACCCATGGGCAGGTTGAAGCTCTGGTAACACAGAGTGGAGGACCGAACCGGTTGACGTTGAAAAGTCTTCGGATGACCTGTGGGTAGGGGTGAAAGGCCAATCAAACTGGGAGATAGCTCGTACTCTCCGAAATGCATTTAGGTGCAGCGTCGTATATAAGTTTATTAGAGGTAGAGCTACTGATTGGATGCGGGGGTTTCATCGCCTACCATTCCTGACAACTCCGAATGCTAATAAATGTTCTACGGCAGTGAGGGCATGGGTGCTAAGGTCCATGTCCGAGAGGGAAAGAACCCAGACCCACAGCTACAGGTCCCCAATATATGTTAAGTTGAAGCAACGCGGTTGGACTGCATTGACAGCTAGGATGTTGGCTTGGAAGCAGCCATTCATTTAAAGAGTGCGTAACAGCTCACTAGTCGAGCGGTCCGGCATGGATAATAATCGGGCATAAACATATTACCGAAGCTATGGATTTATATTTTAGATATATCTGGTAGGAGAGCATTCTATTTGCGCCGAAGCAGTACTGTGAGGTATTGTGGAGCGGATAGAAAAGAAAATGTAGGCATAAGTAACGATAAAGCAGGCGAGAAACCTGCTCACCGAAAGACCAAGGCTTCCTCAGCCATGCTAATCAGCTGAGGGTTAGTCGGGACCTAACGCGAACCCGAAAGGGGTAGTGGATGGACATGGGTTAATATTCCCATACTTGCTCACAATAAAAGGGGACGGTTGGATGTAGCTGCTGGAGACTGACGGAATAGTCAAGGCCTAGCCTTCGGGCGAAGCTGCTGTAGTGTAATCTGATCCGAGAAAAGCCGAAGTGAAGCNACCCGTACCAAAACCGACCCAGGTGGTCGAGGAGAGAATCCTAAGGTGCTCGAGTGAGTCGTGGCTAAGGAACTAGGCAAAATAGTCTCGTAACTTCGGAAGAAGAGACGCCACAGCANNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNAATGTAGGCATAAGTAACGATAAAGCAGGCGAGAAACCTGCTCACCGAAAGACCAAGGCTTCCTCAGCCATGCTAATCAGCTGAGGGTTAGTCGGGACCTAACGCGAACCCGAAAGGGGTAGTGGATGGACAATGGGTTAATATTCCCATACTTGCTCACAATAAAAGGGGACGGTTGGATGTAGCTGCTGGAGACTGACGGAATAGTCAAGGCCTAGCCTTCGGGCGAAGCTGCTGTAGTGTAATCTGATCCAAGAAAAGCCGAAGTGAAGCAACCCGTACCAAAACCGACACAGGTGGTCGAGGAGAGAATCCTAAGGTGCTCGAG
TGAGTCGTGGCTAAGGAACTAGGCAAAATAGTCTCGTAACTTCGGAAGAAGAGACGCCAACAGCAATGTTGGCCGCAGTGAAGAGGCCCAGGCGACTGTTTATCAAAAACACAGGACTCTGCTAAATCGAAAGATGCTGTATAGGGTCTGACACCTGCCCGGTGCTGGAAGGTTAAGGAAGGTGCTTAGCGTAAGCGAAGGCATTAACTGAAGCCCCAGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGTGTAACGATCTGGGCACTGTCTCAGCCACGAGCTCGGTGAAATTGTAGTATCGGTGAAGATGCCGATTACCCGCAATGGGACGAAAAGACCCTGTGAACCTTTACTATAACTTCGTATTGACTTTGAGTAAGTAATGTGTAGGATAGGTGGGAGGCTTTGAAGCAGGCACGCTAGTGTTTGTGGAGCCGACGTTGAAATACCACCCTTTACTTACTTGGAGCCTAACTTCTTTCAGAAGGACATTGCGTGGTGGGTAGTTTGACTGGGGTGGTCGCCTCCAAAAGAGTAACGGAGGCTTTCAAAGGTACCCTCAGCACGCTTGGTAACCGTGCGTAGAGTGTAATGGCATAAGGGTGCTTGACTGTGAGACCTACAAGTCGATCAGGTGCGAAAGCAGGACATAGTGATCCGGTGGTTCCGTATGGAAGGGCCATCGCTCATAGGATAAAAGGTACTCCGGGGATAACAGGCTAGTCTCCCCCAAGAGCTCACATCGACGGGGAGGTTCGGCACCTCGATGTCGGCTCGTCACATCCTGGGGCTGGAGAAGGTCCCAAGGGTTGGGCTGTTCGCCCATTAAAGTGGCACGCGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCTCTATCTATTGCGGGCGTTAGATGTTTGAGAGGGCTTGATTCTAGTACGAGAGGACCGAATTGAACAAACCTCTGGTGTATCAGTTGTACCGCCAGGTGCACCGCTGAGTAGCTACGTTTGGAAGAGATAAGCACTGAAAGCATATAAGTGCGAAACTCGCCTCAAGATGAGACATCTTTTAAGGGTCGTTGTAGATGACGACGTTGATAGGCTATAGGTGTAAAGACAGTAATGTCATAGCCAAGTAGTACTAATTACCCGTAGATTTATAGTC\n>CYGY02000008.1/113318-113432 Burkholderia sp. STM 7183 genome assembly, contig: CYGY01000008 \nTCACCCCTGCGTGACTGGCGATAGAACCCGAAGCTGTCAAGCCTGACGGGTTCAAGGTGGAGCATCCCACCGTGAAGCGCAGGGTGCCGTTTTGCCGTTCGCCTGGGCAGCCATG\n>ALWZ044793892.1/3195-2923 Picea glauca, whole genome shotgun sequence. \nGTCTGTGATGCCCTTAGATGTTCTGGGCCACACGCGCGCTACACTGATGCAGTCAACGAGTTTTTCTCCCTGGTTCGAGAGGATCGGGAAATCTTCTCAAATTGCATCATGATGGGGATAGACCATTGCAATTATTGGTCTTCAACGAGGAATTCCTAGTAAGCGCGTGTCATCAGCTCGTGTTGACTACGTCCCTGCCCTTTGTACACACTGCCCATGGGTGTGTGTTTTTTGGTCCGGTGGGAGTGCTTTGTTGAAACCTGGAGCTCAAGT\n>CM000335.3/6839130-6839055 Pan troglodytes isolate Yerkes chimp pedigree #C0471 (Clint) chromosome 22, whole genome shotgun sequence. 
\nTGTCCTCTGGGGACTCAGCTTGCTCTGGCTGCTGGATTGAATTAGCTGCAGGACCAAGATGAGCCCTTGGTGGAGA\n>AAQR03125679.1/12691-13758 Otolemur garnettii contig125679, whole genome shotgun sequence. \nGGGGAGTATGGTTGCAAACTGAAACTTAAAGAAATTGACAGAAGGGAACACCAGGGTGAAAACTATGGCTTAATGTGACCCGACTTGAGAAACCTCACCCAGCCTGAACACAGACCGCTTGGCAGACTGACAGCTCTTTCTTTCTTTCCTTTTTTGTTTTTCTTTTTTTCCTGAGACAGAGTCTCACTCTGTTGCTGCTCTGTAGAGTGCTGTGCTGTCACAGCTCATAGCAACCTCAAACTCTTGGGCTCAAGCATTTATTTCTCTTGCCTCAGCCTCCCAAGTAGCTGGGACTACAGGTGCCTGCAACAACCCCTGGCTTTTTTTTTTTTTTTTTTTTTTTCTAGTTGTCATTGTGGTTTTAGCAGGCCTCGGGCTGGAACCCACCAACTCCAGTGTATGTGGCTGGCGCTGTAACCACTGAGCTACGGGCACCATCTGATAGCTCTTTCTTGATTCCTTGGGTGGTGGTATGTGGCTGATCTTAGCTGAGGGAGCAATTTGGTTAATTCTGATAACAAACTCTGAGATTCTGGCATTCTAATTAGTTAGGCAACCCCAAGCGACCCACTGTCTCAACTTCTTTTTTTTTTTTGAGACAGAGCCTCAAGCTGTCCCCCTGGGTAGAGTGCTGTGGCATTACAGCTCACAGCAACCTCCAACTCCTGGGCTCAAGCGAGTCTCCTGCCTCCGCCTCCCAAGTAGCTGGAACCACAGGCGCCCGCCACAACGCCTGGCTATTTTTTGGTTGCAGCCGTCATTGTTGTTTGGCGGGTCTGGGCTGGGGATTCGAACCCGCCACCTTAGGTGTACGTGGCTGGCGCCTTAGCCGGTTGAGCTATAAGCGCCGAGCCACTGTCTCAACTTCTTAGAGGGCAAGTGGCATCCAGCCACCAGAGATTGATGCCCTTATATTGTCCAAGGCTGTAGACGCACTGTGCCTACCCTGTCATGGATAACTTGCTGAGCCCCATTTGTGAGGGAGATCAGGGATTGCAATTACCAGCATGAACAAGGAATTCCCAGTAAGTGCGAGCCATAAACTTGTGTTTATTAAGTCCCTTTAAA\n>MKQR01000007.1/110347-110112 Actinokineospora bangkokensis strain 44EHW Scaffold15, whole genome shotgun sequence. \nACACGAGAGAGGAGGTGGTCCACCAGTGAGTTCCGGTAGGACGCGTGAGGTGGCTGTCCGCTAAGGACCACCCATCAACGATGGACGCCGGCTCCGCCCACGGCAGACACCGGGTACCCGGTGCCGTAGGCGCGGCGCGTGGTCGGCGAATACCAGGCAGTCACCCGGCCCCTGGGCTTCCGTGGTAGTCCGCCACGGGCCTCCCTCGCGGAGGAGTCGCCCAGGGGCTGTGCCCT\n>CM000916.2/23724354-23724270 Nasonia vitripennis chromosome 2, whole genome shotgun sequence. \nAACGTGTCAAAGTCTGGTAACTCCACCACCGTTGGCGGAATGTTAAAAAGCCAATGGGGTACGAGTTTCCTACCATTGACGCGTT\n>JH209564.1/9089797-9089999 Pelodiscus sinensis unplaced genomic scaffold scaffold80, whole genome shotgun sequence. 
\nAGCTTTGCGCAGTGGCAGTATCGTAGCCAATGAGGTTAATCCGAGGCGCGATTATTGCTAATTGAAAACTTTTCCCATTCCTTTCCCTTCTCCCTCCGATCCCCCTTTCCTGTCCCTGTTCAGGGACCCTTTCTCATGAGAATCTCTTATGTCTGGAGGTACATCAGCTCATGGTGATAGGAATAATAGAAGTGGTTCCACCA\n>DS546278.1/1-991 Physcomitrella patens subsp. patens PHYPAscaffold_3506 genomic scaffold, whole genome shotgun sequence. \nCAAGCATTGCGATGGTCCCCACGGATGTTGACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTATCTACTATCTAGCGAAACCACAGCCAAGGGAACGGGCTTGGAAAAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTAAGAGGTGTAGAATAAGTGGGAGCCCTCAAAGCGCAAGTGAAATACCACTACTTTTAACGTTATTTTACTTATTCCATGAGGTGGAGGCGGGACTCTGTCCCTGCTTCTAGTCTTAAGGCGCGCCCCTCGGGTGCGCCGATCCAGGTGGAAGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGCTCATTTGATTTTGATTTTCAGTACGAATACAAACTGTGAAAGCATGGCCTATCGATCCTTTAGTCTTTCGGAATTTGAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTGNGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGCTCGGTGCCGCAATAGTAATTCAACTTAGTACGAGAGGAACCGTTGATTCACATAATTGGTCATTGCGTTTGGTTGAAAAGCCAGTGACGCGAAGCTACCATGTGTAGGATTATGACTGAANNNNNNNNNNNNNNNNNN\n>DS232073.1/119557-119157 Culex pipiens quinquefasciatus supercont3.261 genomic scaffold, whole genome shotgun sequence. \nTATCAACATGACAAGATTATTCAATTCACGGTGGGAATGATCTGCCAAATCAGCGCTAATCAATTAGCTAATTGACAAAAATCAACGCTAGTTGATTAGCGTTACTATAATTGATTAGGTGTGTCTCACCCCTCGATAGAGGACTACCATGGTTGCAACGGGTAACGGGGAATCAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAATGGCTTCCATTTCCAAGGAAGGCAGCAGGCGCGTAAATTACCCAATCCCGGCACGGGGAGGTAGTGGCGAGAAATAACAATATAAGACTCTTTTATGATGTTTTATAATTGGAATGAACCGAGCATAAATCCTTCGGTAAGGATCAAGTAGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCACT\n>LZPO01108083.1/67281-67406 Neotoma lepida isolate 417 scaffold_2510, whole genome shotgun sequence. 
\nAATGGAAATCAACTTGTTGGCTATGGCAGCCTCCCATTACAAGCCATGGAACAGCATATTCCTATTTGTTGGCAAGGCTGTCTCCATTTATTTGGTGTCTGTTTCTTATTTGCCCAAATAACTAAC\n>JTHE01000287.1/5907-6033 Lyngbya confervoides BDU141951 scaffold_83, whole genome shotgun sequence. \nGCCTGTCAGGAACGCGGCTACCTCCTCCCAGCCGCCTACTGAAGGTGTTTTGCAAGGGCACCTCCTCCCGCCCTTGCAACTCGTGTTGAGCCGGACCGCTACCTCCTCCCAGCGGTCCGGCTTTTCT\n>CM000685.2/62840825-62842378 Homo sapiens chromosome X, GRCh38 reference primary assembly. \nAGGGAACCATGAAAGAATAATTACAAATACAGAAAGGCAAAGATAATCCCTTCTAACATTTGCATAATGAATTAACTAGTATAATATTACTAAGAGAACTTTTTAGCTAAAATCCTTGAGACCAGAGGAGCTACCCATAGAAAGTCAAGAGAACACACTCATTTATACAGCAAAATAATGAGAAAATCAATGGGTAGAGGTAAAAGGCCTACCGAACCTGGTGACAGCTGGTTTTATCAAGATAGAATTTAAGTTTAACTTTAAGTTTACCTATAGAATTGTCTAATCCTATTGTAATTTTATATGTTAGTCTAAAGGGGGACAGCTCTTTAGATGTAGGAAATCACTTTTTCACTAACGGTAAGACACAAAACTCCTTTAGTTTGCCTAAAAGCAGACACCGATTAAGAAATCATTGAAGTTAAACATTTGAAACCCCTTAATTTCAATCACTACATCTAATTTCTAACACTATACTGGACCAATCTATTTTTAAATAGAAGAAATACTGTTAGTATAAGTAACAATAAATAATTGTCTTTGCATAAGCTTAGTCTTTGCGTAAGCTTAATCTTTGCATAAGCTTATGTCAAACTGGAAAATCCACTGAGAGTTAATAATCCAATACAGATAATCATATTATAAACTTTTTATTGTCCCAATTGGTAACCTAACACACAGATGCATTAAGGAAAGATTTTAAAAAGTAAAAGGAACTCAGCAAAATCAAACCCTGCCTGTTTACCAAAAACATCACCTCTGACATAACTAGTATTAGAGGCACTACCTGCCCAGTGACATAAGTTTAACAGCCACAGTATCCTGACCATGCTAAGGTAGCATAATCATTTGTTCCCAAAATGGGAACTTCCATGAATGGCCTCACAAGGGTTTAATTGTCTCTTACGTTTAATCAGTGAAATTGACCTATCTGTGGAGAGGCAGAAATATTTAAGTAAGATAAAAAAAACCTTATGGAGTTTCAATTTATTAGTAGAAATAAACTTATAAAAAAGCCTTAATAGGTCTTTTTGGGAGTAATTATTTTTATTTTTAAATATCTAGTGTACCACCATGGCATGTATTCTTTAAATTTTATACAAACAAGCACATTTTTTCAGTGTTTTGATGTATTTTCATATTTTTCTAACTTAGACGTGTAGGCAATACATTTTATCTAATGAACCAAAAATTTTGGTTGGGGTGACCTCAGAGCATAACACAACCTCTGAAATGATTTCAGCTAGGACCACACTAGTCAAGGTAATCTATTACACATTGACCCAAGTAGTTTGAGCAATGGAACACGTTACCTTAGGGATAGCAGTACAATCCTATTCTAGAATCCGTATCAGCAATAGGGTGTATGACTTCGATATTGGATCAGGATATTCCAATGATGTAACTACAATTAATGGCTCATATGTCCAATGATTAAAGTCCTATGTGATCTGAGTTCAGACCAGAGTAATCCAGGTAAGCTGCTATCTATTCAATATTTCTCTCAGTACAAAAGGACAAGAGAAACAGGGCCCACTTCAAAA
AGTGCCCTCG\n>DS022294.1/558139-558315 Mariprofundus ferrooxydans PV-1 scf_1099921033919 genomic scaffold, whole genome shotgun sequence. \nGCGCCCCTGCGTTGAGCGAATGGCAATCATGTTGCCTGAGCCGATACTTGTTGAACGGGAGCCAAGCTACGATGGCTGTGTGAATCCCTTTAGGGGATACCTGATGCCAGAGTGCTGCACCCACCTCTTGTTAGAGGGTTCGACAACAGATTGCCGCAACGTCAACGCGGGGGCGCC\n>AEUN01000020.1/91-28 Staphylococcus simiae CCM 7213 contig00020, whole genome shotgun sequence. \nCTCAACAAACTTATGATGGGGTGCGCGCTTTTTTATTGTACAAGATAACGGATTTGTAGACATT\n>URS0000D66E06_12908/1-81 unclassified sequences freshwater-2 RNA \nCATATAAATCTTTATATGTTCTTATGCGGAACCAAACCGCGTAGGCCTAGAACGCCACTTAATTTAAGGAGAAACAAAATG\n>KV442016.1/37818-37189 Mortierella elongata AG-77 unplaced genomic scaffold K457scaffold_6, whole genome shotgun sequence. \nTTGAAAATGGTGCAGGAAGAGTTCTATATAGGTTTAATAGCTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTGATCCTTCGATGTCGGCTCTTCCTATCATACTGAAGCAGAATTCAGTAAGCGTTGGATTGTTCACCCACTAATAGGGAATGTGAGCTGGGTTTAGACCGTCGTGAGGCAGGTTAGTTTTACCCTATTGATGAAATGTTGTTGCAATAGTAATTGAACTTAGTACGAGAGGAACCGTTCATTCGGATAATTGTTACTTGGACCTGCCTGAGCTGGCAATGGCCCGAAGCTATTATCCATTGGGTTATGGCTGAATGCCCCCAAGTCCGAACCCGTGCTAGAACGCGAAGATTACCGTCTTTCGATTTTTTTTTTAGTTGAATATGAATAGACCTTCGGCTCCAAGATCATACTACATGGGGTTATGTTTTAGGGCTGAAGGCATTATGATGTTCCTGCTAAAACTTTATTCACGAATATCCCTTCCTCCGTACTTTAATTCGAGACAATATTGTGTCGAAAAATTTTGTGTGCTGGGCTCATGCACTTCCATATGATAACTTGCAAAAAGGGAAGCTAACTTAGTTCAAGGTCCATTTTTCATCCACAAA\n>APMT01213728.1/1364-1077 Mesocricetus auratus contig213728, whole genome shotgun sequence. \nTTTGTTCAACGATTAAAGTCCTACGTGATCTGAGTTCAGACCGGAGTAATCCAGGTCGGTTTCTATCTATTTACAATTTCTCCCAGTACAAAAGGACAAGAGAAATGGGGCCTCCTTAATATAAGCGCCCCTAATTAATTAATGAAACCATCTCAATATAGTAAATCCATACTATATTTACCCTAGACAAGGGTTTATTAGGGTGGCAGAGCCCGGAAATTGCGTAAGACTTAAAACCTTGTCCTCAGAGGTTCAAATCCTCTCCCTAATAGTGCATTTAATTAATAT\n>DS028102.1/263782-263910 Coccidioides immitis RMSCC 2394 supercont1.10 genomic scaffold, whole genome shotgun sequence. 
\nGGGCTGGTGGCGCAGCGGTTAGCGCGTCGGATTGCGTAAGTGGCGAATTAAGACAGATGCATCTCAGCAGCAAGCTAACCCTTTCATATAGAGATCCCAAGGTCCCCGGTTCAAATCCGGGTCAGCCCT\n>CP003614.1/5692256-5692124 Oscillatoria nigro-viridis PCC 7112, complete genome. \nAGGAGCCGTGTGCGGAGAAATCCGCAAGCACGGTTCTGAAGACGAGTCGCTCCGGTGACGGGGCGGCTTCGTTTAACAAGCTTACGCTGTAATCTTTGATTCAGCATAGGAGGATGTCACCGTCCGAGTTTAT\n>AODI01000030.1/8750-8667 Brochothrix thermosphacta DSM 20171 = FSL F6-1036 c30, whole genome shotgun sequence. \nTAAAGGTATAGAAAAAGACACTAGCGCAAACTAGCGTCCGTGTAGAACCGTTTAAGACGGTGGCTACGCAATTATAATACTAAA\n>LBUD01000030.1/9979-10044 Parcubacteria bacterium GW2011_GWA2_38_13 US74_C0030, whole genome shotgun sequence. \nAGGCGTGTAGCTTAATTCAGTGGTTTCCAAAACCAGGGAGTGCGGGTTCAAATCCTGCCACGCCCG\n>HF998384.1/8394-8081 Coprococcus eutactus CAG:665 genomic scaffold, scf48 \nGAAAATGCAATGAAGAGGAGTAGTAGAATCCTGGAGATGTTCAGAGAACTGCCGGTTGGTGTGAGACAGTGATTGAGAGGATTTGAACTCGCCTTGGAGCAGCCCGCTAAAAGATACGACGTTACACAGTAGCGTTGAGCGTATCGAGTAGGATGGGACGGAGGCTGGCCGTTATAGCAGAAGGATATAAGATATGTAAAAGATATGTATTTGAGTTGTATAAGATCTGCATGTCTGTATCTGTAACGAGAGCATATTTTGTAATTATTATGAAGTATGAAATAGAGTGGTACCGCGTAACTTACGTCTCTATA\n>LKEX01010032.1/13186-15658 Cyphomyrmex costatus contig10032, whole genome shotgun sequence. 
\nCCCGCTGAATTTAAGCATATTATTAAGCGGAGGAAGAGAAACTAACTAGGATTTCCTTAGTAGCGGCGAGCGAACAGGAAAGAGCCCAGCACCGAATCCCGCGGTTCCGCCGCAGGGAAATGTGGTGTTCGGGAGGATCCGTTTATCCCATGGTGTCGCGCCGCGTCCAAGTCCATCTTGAATGGGGCCACTTACCCGCAGAGAGTGCCAGGCCCGTAGCGACCGGTGCGCGTCTCGGGAGGATTCCTCCTTAGAGTCGGGTTGCTTGAGAGTGCATCTCTAAGTGGGTGGTAAACTCCATCTAAGGCTAAATACGACCACGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGTTGAAAAGAACTTTGAAGAGAGAGTTCAAGAGTACGTGAAACCGTTCAAGGGTAAACCTAAGAAACCAAAAGATCGAACGGGGAGATTCATCGTCAGCGACGCTGGCTTCGCGTCGGTGAGCGATGATCCTCGCGGCCCGCAGCGCGGACACGCTGCCGTGCGTCGACGTCCGGCGTACGTCGTCGTGCACTTCTCCCCTAGTAGAACGTCGCGACCCGCTGGGTGTCGGACTACGGCCCGGGTGCGGTGACTGACGCGTCGCCGGTAAAACGGCACGCGTCAAACCCCCGGTCGCCCGGCCGGCTGCCCGGCGGTACACGCACGGTATCAGGCCGCAGACAACGGTCGGGGCGCGGGGCCCCCCACGTCCTCCGTGGCGTGCGGGGGTCTCCACTCCGTCCTGCTTTGCGTCGAGGCCGTCGCAAGCGCGCGCCACGGTACACGGAGGCTTACGGACCTAGCGCCGTCACCGGTCCTGGCCCGCTGTTGGTCGTACGGTTAACCTTCGACCGGTCTACGAACGTTCCTCGCGTTTCCCCCTCGCGGGGCGGGCGCGGGGGACCGATACCGGTCGGCAACGTTACTGCTTTCGGTACTCTTAGGAACCGTCTTGAAACACGGACCAAGGAGTCTAACATGTACGCGAGTCATTGGGACTCTAGCGATACCTAAAGGCGTAATGAAAGTGAAGGTCGGCCCTGGTTGTCGACCGAGGGAGGATGGGCCGCGTCGCGATGCGGCTCCGCACTCCCGGGGCGTCTCGTTCTCATCGCGAGAAGAGGCGCACCCAGAGCGTACACGTTGGGACCCGAAAGATGGTGAACTATGCCTGGTCAGGACGAAGTCAGGGGAAACCCTGATGGAGGTCCGTAGCGATTCTGACGTGCAAATCGATCGTCGGAACTGGGTATAGGGGCGAAAGAATAATCGAATCACCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATACCTGGCACTCGGCCGTTCCGCACGGAACGCGCGCGAGTCTCATCTGGTAAAGCGAATGATTAGAGGCATTGGGCCCGAAACGACCTCAACCTATTCTCAAACTTTAAATGGGTGAGATCTCTGACTTTCTTGAACCGTGAAGTCACGAGTATCACTCGGATCAGAGTGCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGCTGTGGGATGAACCAAACACAGAGTTAAGGCGCCCAACTCGACGCTCATAGGACACCATGAAAGGCGTTGGTTGCTTAAGACAGCAGGACGGTAGCCATGGAAGTCGGAATCCACTAAGGAGTGTGTAACAACTCACCTGCCGAAGCAACTAGCCCTGAAAATGGATGGCGCTGAAGCGTCGAGCCTATACTCTGCCGTCAGCGGCAAGTGGGGCGGCCGTGTGCGCGTCGTCAGACGCGTGCGCGCCGCCACGAAGCCCTGACGAGTAGGAGGGTCGCGGCGGTGTGCGCAGAAGGGTCTGGGCGCGAGCCTGCCTGGAGCCGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATACTCCAGCGAGGCCCTGGAGGACTGACGTGGAGAAGGGTTTCGTGTGAACAGCCGTTGCACACGAGTCAGTCGATCCTAAGCCCTAGGAGAAATCCTATGTCAATGACGG
CGTACGATACTCTAGTGTTGTCGTTGTCGCGCTCTCGATCTCCGACTCGCCGCCGCTCCCACGCGCGCGCGCGACGACGGGGAGGGGAGAGCGTGGTGTTTTCTTCTTCAACGAGAAGCGCTCTGACAGGACACACGCCCGTCGGGCGAAAGGGAATCCGGTTCCTATTCCGGAACCCGGCAGCGGAACCGCATACAATTCGGGCCCTCGTAAGAGTGTTCGTCGGGGTAACCCAAAATGACCTGGAGACGCCGTCGGGAGATCCGGGAAGAGTTTTCTTTTCTGTATAAGCGTTCGAGTTCCCTGGAAACCTCTAGCAGGGAGATAGGGTTTGGAACGCGAAGAGCACCGCAGTTGCGGCGGTGTCCGGATCTTCCCCTCGGACCTTGAAAATCCAGGAGAGGGCCACGTGGAGGTGTCGCGCCGGCTCGTACCCATATCCGCAGCAGGTCTCCAAGGTAAAGAGCCTCTAGTC\n>ALWZ040927269.1/1-1274 Picea glauca, whole genome shotgun sequence. \nTTCGAATTGGGAGGGCGATCCTCCCGGTGAACTAACCGTACCCCAAACCGACACGGGTGAACAAGTAGAGTATACTAGGGCGCTTGAGAGAACCATGTTGAAGGAACTTGGGAAAATGACCCTGTAACTTTGGGAGAAGGGGTGCTCTCCCTCCTATCTTTGGGTTGGGAAAGTGGCACATACCAGGGGGTAGCGACTGTTTATTAAAAACACAGGACTCTGCCAAATGGTAACACGATGTATAGAGTCTGACACCTACCCGGTGCTGGAAGGTTGGAAGGAGAAGTGTGATAAGCTTCGAATGGAAGCCCCGGTAAACGACGACAGTAACTCTAACTATCCTAAGGTAGCGAAATTCCTTGTCGCATAAGTAGCGACCTGCACGAATGGTGTAACGACTGCCCCACTGTCTCCGACATGGACCCAGTGAAATTGAATTCTCCGTGAAGATGTGAAGTACCAACGGCTAGACGGTAAGACCCCGTGCACCTTGACTATAGCTTCGCAGTGACAACCTCTTATGAATGTGTGGGATAGGTGGGAGGTGGGGAACTCTCAATCCTGGAATACCACTCTTTCATCTAAGGATGCCTAACCATTTCTTTCTCTAGATTTATTCTCAGGGTGGGACACTACAAGGTGGGTAGTTTATCTGGGGCAAATGTCTCCTAAAGAGTAACAAAGGTGTGCGACGGTAGGCACTTTCTATAAGCAAGCATAATGGTCTAAGCCTGCCTGACTGTGAGACTCACTGGTCGAACAGAGACGAAAGTTGGCCATAGTGATCCGGGAGTCCCGCGTGGAAGGGCTCTTACTCAATGGATCAAAGGTATGTCGGGGATAACAGGCTAATGACTCCCAAGAGCTCTTATCGACGGAGTCATTTGGCACGTCGATGTCGACTCATCACATCCTGGGGTTGAAGAAGGTCCCAAGGGTTCGATTGTTCACCGATGAAAGTGGTATGTGAGTTGGGTTTAGAACGTCGTGAGACAGTTCGGTTCCTATCTACCGCTGGTGTTGAAGGGAGAACTGTGAGGAGCCAACCCTAGTATGAGAGGACTGGGTTGGGCCAACCTATGGTGTACCGGTTGTCATGCCTAGCAGCGTTGGGCAACCAAGTTGGTATGGAAGAACTGTTGAAAGCATCTAAGCGGGAAATCCTTTTCTAGACAAGTTCTCGTACGAGGTGAAAGAACATCACTTTGATAGGCGATAGGTGTAAGCACCGCGAGGTGTGAAATGATATCGTACTAATATTTTTACTTAGTCCA\n>AE007869.2/110253-110382 Agrobacterium tumefaciens str. C58 circular chromosome, complete sequence. 
\nATGGTGAAAGGCAGCGTCCATAAAAATAGACGCGCCCTGGAACATCAGACCGTTGAACGCTTTGACCACGGATGTACTGGCACTGACGAAAAACGGATGGAAAGGTCGGGCTCGCCCGGCCTTTTTGTTT\n>LGKD01302340.1/501-591 Octopus bimaculoides Scaffold36772_contig_40, whole genome shotgun sequence. \nTATAGTTTTCAAAGTGACAACTAGTCACTGACCTATAGTAATTTTTTAAATTATAGATCAGTGACTAGTTGTCACTTTGAAAACTATATAT\n>AACT01052938.1/746-1 Ciona savignyi cont_52938, whole genome shotgun sequence. \nAATTCTTGGATCGGCGCAAGACGAACGACTGCGAAAGCATTTGCCAAGAATGTTTTCTTTAATCAAGAGCGAAAGTCAGAGGTTCGAAGACGATCAGATACCGTCCTAGTTCTGACTATAAACGATGCCAACTAGCGATCGGGGGGCGTTACATTGACGACCCCTCCGGCAGCTTACGGGAAACCAAAGTCTTTGGGTTCCGGGGGAAGTATGGTTGCAAAGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGAAATCTCACCCGGCCCGGACACAGTGAGGATTGACAGATTGAGAGCTCTTTCTTGATTCTGTGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGATAACGAACGAGACTCTGGCTTGCTAAATAGTTACGCGACCATCCCGGTCGGCGTTTAACTTCTTAGAGGGACAAGTGGCGTTTAGCCACACGAGATTGAGCAATAACCCCTATTTCCACAAAGGAATAAATTTTAAAATCCAATCTACGTTCAGTTTCTAACATAACACATTTTTATTTTTGTTTCTTTCGCTGCAGCGTTTATCACCAACAATTAAAAAATACATGTCATATATATATATACCAAAACAAATATGGTGTTAACTGAAAATCCAACAATTAACCAAAGAAATAAAAAATACTACAACAAAACAGGAAGGCACCAAAAAAACC\n>CCCW010012867.1/738-403 Brassica napus, WGS project CCCW01000000 data, contig: 31321 \nACTCTAGTCCGACTTTGTGAAATGACTTGAGAGATGTAGAATAAGTGGGAGCTCCGTGAATCGGAGGCGGGGTTGTTACCCCTTGTTTTCGACCCAAGACTCGCTTCGGCGGGTCAATCCGAGCGGATGACATTGTCAGGTGGGGAGTTTGGTTGGGGGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAAAACAGAAATCTCATGTGGAACAAAAGGGTAAAAGCTCGTTTGATTCTGATTTTCTGTACGAATATGAACCGTGAAAGCGTGGCCTATCGATCCTTTGGACCTTCGGAATTTGAAGCTAGAGGCTTCAG\n>AFEY01211982.1/140-48 Sarcophilus harrisii ctg7180001785086, whole genome shotgun sequence. \nATTGGTTTTCAGCCTTTTGGCTAAGATCAGTATCTATTCTTATCAGTTTAATATCTGATATGTCATCTATATGTATATACATAGGTATATGTA\n>GL832959.1/2234038-2236146 Salpingoeca sp. ATCC 50818 unplaced genomic scaffold supercont1.5, whole genome shotgun sequence. 
\nTAACTGGTCGATCCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTCTAAGTATGAATAGTATTCTTGATACTGTGAAACTGCGAATGGCTCATTAAATCAGTTATAGTTTATTTGATAGTTTGCAACTCGTTTTTCGGAGCGGTGTTGTGCTAGACGGATAGCCGTGGTAATTCTAGAGCTAATACGTGCGACAAGGCCCGAGAGAGGGGTGTGTGTATGCGCATTTTTTCTTCTCGAGGGCTGCATTTGTTAGGTATAAAGCCAGCAGGAACATGACTGGTGAATCAGAATAACTTTGCTGACCGTTACACTTTTGTGTGTGATGGTGTCTCATTCGAATTTCTGCCCTATCAACTTTCGATGGTAAGGTATTGGCTTACCATGGTGACAACGGGTGACGGGGAACATTTGGTTCGATTCCGGAGAGGGAGCCTGAGAGACGGCTACCACTTCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCTGACACAGGGAGGTAGTGACAATAAATACCAATGCACGGTGTTTTTTATGCACTGTGCAATTGGAATGAGAACAATGTAAAGACCTTATCAAGGAACAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAAAAGCGTATACTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCATGCGGGGTTCACGGTGTGTGGGTGGGGGTGAGACACTGTTTCACGCGCGCCTTCTTCTGCCCCGCACTGTTTGGACTCTGCAGTTTTAATATTCCCTGGTGGCGCCTTTGGCGCGTGCCCTTGATTGGGTGTGTGTCAAGTCACGTAGTGGTGGGGCGCTGTTGGGGGCTTTACTTTGAAAAAATTAGAGTGTCAAAGCAGGCAGTCATTTGATTTGCTTGAATAGATTAGCATGGAACAACGGAAGAGGACTTTTGGGCCTGTACTGTTGGCGTGTGGTGCGGGGTGTGTGGAAGAAGAAACCGCAAGGTTTTCTTATTCCTCCCTCACCACATCGGGTCTGAAGTAATGATTAATAGGGACGGTTGGGGGCACTGGTATTTCGTTGTCAGAGGTGAAATTCTTGGATTTACGAAAGACCGCCGACTGCGAAAGCATTTGCCAAGGACGCTTTCATTGATCAAGAACGAAAGTTAGGGGATCGAAGACGATTAGATACCGTCGTAGTCTTAACCATAAACGATGCCGGCCAGGGCTCGGTGGGCAGCACAAATGTTTCAACGCATGGTGGCGCCATCGGGACCTTTAGGGAAACCAAAGCGTTTGGGTTCCGGGGGGAGTATGATCGCAAGATTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTCACCAGGTCCAGACATGGGAAGGATTGACAGATTGACAGCTCTTTCTTGATTCCAAGGGAGGTGGTGCATGGCCGTCCAGCTTTTGTTGTGAAATCTCTGTTTGATTACGGTAAACGGCGAGACCTTGACTTGCTGATTGGTGTGCGCCTGCGTTAGCAGGCGTTGGAGATTACGCGCAAGCGTGTCTTTTGATACACCACTCAGAGGGACACTCGGCGTTGCTATTGAGCGTAAGCCGAAGGAAGTTTGAGGCGATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCTGCACGCGCGCTACACTGACGGGGGCAGCGAGTATGCTTTGGGTGTTTGTGGTGGGGAAAGTCTTGTGCTTTTCTGCATTCACAAACATCTATTCCTGCGCTGGAAGGCGTGGGGACTCTTGTGAAAACCCGTCGTGCTGGGGATAGATGCTTGCAATTATTCATCTTGAACGAGGAATTCCTAGTAAGCGCAATTCAACAGATTGCGTTGATTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTACTACCGATTGAATGGTTTAGTGAGGCCTCGGGATTGGCGCGTGGGCGCTG
GCAACAGCTGCCCATGTGTTTCTTTGCTGAGAACCTGGTCAAACTTGATCATTTAGAGGAAGTAAAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTC\n>AGTP01003540.1/18890-19069 Ictidomys tridecemlineatus contig003540, whole genome shotgun sequence. \nAAGTATTATCTCTATAAAGACTTACTAGAGAAGTTTCTCTGATTGCATAAAGAACCAGAAATCAAGGAGGTGCAGTGTGAACAGGTACTTGGTGTTGTTTTGTTGCAACTACCATTTCCCATTGATGATTGTTGTTCTCTTCCGTTTAGGGAGAGTAAGAGGGAAAGAATGCCAAGTGGT\n>CM004282.1/30198321-30198152 Daucus carota subsp. sativus cultivar DH1 chromosome 5, whole genome shotgun sequence. \nATACCTTTCTCGGCCTTTTGGCTAAGATCAAGTGTAGTATCTGTTCTTATAATATCTGATATGTGGGCTTATAAGTTCACACGATATTAAGGGGCTGTTTGGTTGAGAGAAGCAGCTTCTGGCTTCTGCTTCTCTTGACCCGTTTGTGTAAAGAAGTAGAAGCACTTTTA\n>AACT01036598.1/1017-1 Ciona savignyi cont_36598, whole genome shotgun sequence. \nTACTCTATTCAGCAGAACAAAAGCTGTTATAGGGGCCAGGCTTACGAAACTAATTGGAGAAGAACCTACCATCAAGACTCTGCAGCAACACCGCATCGAGAGCTTCTCCAAGCAGGTCCAGGGCTACGGATCCAGTCACTTTAGCAACACTCACTCCAACAGCTGGTTAACAGGATCAACCAGGCTAATGACTGGCCGTAACTACGTACAAGCCTGTGCACTCCGGACACAGACCCTGCCAACCCGCGAAGCCGTCTCAAGGGGAAGAGTCGGCGCGAACACCATCTGCCGAAACTGCGGGCTGGCAGAGGAAACACTGTCCCACATCCTGCAGAACTGCCACCGGACCAATAAGATCAGGATTCAACGGCATAACGCGGTTCTGCAGGTACTTGTCAAACATCTACGTAGGAGAAAATGGAAAATCCAAGAAGAACCATACATCCCCACTCCTACGGGCAGTGTCATTAAGCCTGATGTTCTGGCCACGGATCCTGACGGGAACGTGTTTGTCATCGATGCCGCCTGCCCCTACGAGGGTAACAAGAACTCCCTCGTCAATGCAGCAGCGGCAAAGGTGAGCAAATACACACCTTATAAACCCTCCATTCTTCATTATATAGGTGAGACCCCAACAACGGTCACTTTCCTCGGATTCGTGGTGGGAGCCCGTGGCGCAATGCCACCGCAGACACAACACTTCTGCAAGCAGGTAGGTCTTGGTAATGGCCAATTAGATCTAATGTCGGTACGGGCCATAGAAGGAAGCCTAAAAATCTTCCGATTATTTATGGCCCTGTAATATTAACTCGGGTACGCACCCACGAAGTATACGCAAGTGGTACTTCGGTAATGCGAAAAGACACGGTGCTATCGGACCTGACCTTTATGGTAAGGACCCGCGGCACCAAGTCAAACATAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCGCTGTCCCTATCTACTATCTAGCGAAACCACAGCCAAGGG\n>MHIF01000055.1/14859-14981 Candidatus Buchananbacteria bacterium RIFCSPHIGHO2_01_FULL_46_12 rifcsphigho2_01_scaffold_5410, whole genome shotgun sequence. 
\nGACCTAACCCTTGGGTAATTTATCTAAGGCATGGTCGAAAAACTCATCCTACATAAAGACGGTCTTCCGTCCAGTACTTGTAGGATGAGTCTATGCCCAAAAGGGTATAGTTGGTATATCTAA\n>CP002273.2/732628-732803 Eubacterium limosum KIST612, complete genome. \nTTAATAACTTAATGATGCTGTTTTGTTAGAGGAAAGCGGTTGAAATCCGCTACAGCCCCCGCTACTGTAATTGCAGACAAGATCCTCATAGACCACTGTCAGGCGTATCCTGACGGGAAGGGAGGATGGAGAAGGAAGCAAGAGTCAGGACACTTGAAGCAAAGCAATATAATCAC\n>AAGJ05103349.1/43054-43146 Strongylocentrotus purpuratus Contig103349_fixed, whole genome shotgun sequence. \nCCCGCCAGCCCGATCATTTTTGTGTTTATGCAACTTTTGTATTTTCACCGATCAGAGTAGTTGCATAGTCACAAAAGTGATTGGGAGGGTTGG\n>MLAU01031941.1/12573-12707 Lupinus angustifolius cultivar Tanjil contig_31941, whole genome shotgun sequence. \nCTTGTGGGGAATGCTGTCCGGTTCAAGGACATAACACTATCTTTACAACCTATGATATATATAATTTGCGGATTGTATAATCGATTTTGTGTTATGACTTAGTGTTTCCTCGGACCAGGCTTCATTCCTCTCAAT\n>KB096275.1/1122699-1122634 Helobdella robusta unplaced genomic scaffold HELROscaffold_19, whole genome shotgun sequence. \nTCCTATGATGAACCTGGCTTAGGAAGTGCCGTCAGATACATATATGATGATCGCTATTAGCTGATG\n>CM002813.1/58122422-58122133 Capsicum annuum cultivar Zunla-1 chromosome 2, whole genome shotgun sequence \nTTAATTTGACTCAACATAGGAAAACTTACTAAGTCCAGACATGGTAAGGATTGATAGACTGAGAGCTTTTCTTTATATAATGGGTGGTGGTTCATGGCCATTCTTACTATATGGAGTGATTTGTCTAGTTAATTACTGATACGCCTAAATTACACCTCTTTTTTGAGAGAGTAAGTGATCTCTATCAAATATAGAACTCAACTGGGTTGGGTGTCGAATCACACAAGGAATATTGTGTTCACTAAATATTGTGATTGTTATTAGACTGTTGATCTAAGGTTCCTGAGTAC\n>GL378484.1/35805-36021 Volvox carteri f. nagariensis unplaced genomic scaffold VOLCAscaffold_163, whole genome shotgun sequence. \nACTTGGACAAGGCGGCTGGCGGTAACGCAAGCGAGCCCGGAGACATCGGCATCGGCCCTGGGAAGAGTTCTCTTTTCTTTTTAACAACCCGAAGGCCCTGGAATCGAATCATTCGAAGATAGGGCTCAGAGGTTGGTAAAGCACCGCACTTCTCGCGGTGTCCGGCGCGCCGTTGACGGTCCTTGAAAATCCGGGGGAGCATTTCCGATCTTGCCAA\n>AFSB01153275.1/28776-28952 Heterocephalus glaber contig153275, whole genome shotgun sequence. 
\nATCGCTTCTCAGCCTTTTGGCTAAGATCAAGTGTATTATCTGACTGTCTTCAGGGCTTTGCTCTCAGGGTAGGTTAATGCACAGGAAGTATTCACAAATGTGGAGCTTACCCACTTGAGTAAGCCCCACACACGCTTGAACACTAATCATCTGAAAAGGTTTTAGGATGTAAAAGTT\n>EU151723.4/3777-3872 Opium poppy mosaic virus isolate PHEL5235, complete genome. \nGCAATATAGTGGGAGCCGGGTCCTGGTAAACAGGTTGAGTTGGTCTCGTAATCTCGGGTGGACTGCCAATCCACCGTCGCACCACTCTCATGGGCT\n>JMQN01000048.1/178591-178475 Marinobacterium sp. AK27 AUG5_contig_7, whole genome shotgun sequence. \nCTATCTTGGTCGGGGTGCCCCGTCATTGGCGTTGGAACGCGAATGGTACGGGCTGAGATTAAACCCGCTGAACCTGATCCGGCTTGGACCGGCGTAGGAAATCGAGATATTCCGTAT\n>URS0000D69473_1118056/1-77 Anaerococcus obesiensis ph10 skipping-rope RNA \nAATCATAGAGGTTAAGAAATCTGCCGATAACGCTATTTTATAGAAATGTGGGAGAGGAGGCAGTCCCACCTATGTTT\n>JRRC01354207.1/1-1013 Gossypium arboreum cultivar AKA8401 contig_36035_3, whole genome shotgun sequence. \nCGTAAACCGTGAAAACGGGGTTGTGGGAGAGCAATAAAAGCGTCGTGCTGCTAGGCGAAGCGGTGAAGTGCCGAACCCTAGATGGCGATAGTCCAGTAGCCGAAAGCATCACTAGCTTACGCTCTGACCCGAGTAGCATGGGGCACGTGGAATCCCGTGTGAATCAGCAAGGACCACCTTGCAAGGCTAAATACTCCTGGGTGACCGATAGCGAAGTAGTACCGTGAGGGAAGGGTGAAAAGAACCCCCGTCGGGGAGTGAAATAGAACATGAAACCGTAAGCTCCCAAGCAGTGGGAGGAGCCCAGGGCTCTGACCGCGTGCCTGTTGAAGAATGAGCCGGCGACTCATAGGCAGTGGCTTGGTTAAGGGAACCCACCGGAGCCGTAGCGAAAGCGAGTCTTCATAGGGCAATTGTCACTGTTTATGGACCCGAACCTGGGTTATCTATCCATGACCAGGATGAAGCTTGGGTGAAACTAAGTGGAGGTCCGAACCGACTGATGTTGAAGAATCAGCGGATGAGTTGTGGTTAGGGGTGAAATGCCACTCGAACCCAGAGCTAGCTGGTTCTCCCCGAAATGCGTTGAGGCGCAGCAGTTGACTGGACATCTAGGGGTAAAACACTATTTCAGTGCAGGCCGCGAGAGCGGTACCAAATCGAGGCAAACTCTGAATACTAGATATGGCCTCAAAATAACAGGGGTCGAGGTCGGCCAGTGAGACGATGGGGGATAAGCTTCATCGTCGAGAGGGAAACAGCCCGGATCACCAGCTAAATATCCGGACTATTCTACAGGTTTCCACTTTCCTTCAATCCGTTGAAATTTCAACAGATGAAACTTGTAGATAAAAAAGACTTAGGTACAATGGTGGGAATTTAATGCTTGAACGGGGACAACACTGAACCAATTCCATTGTTTGTCGAGTTAGTCGATCTTGAGCCCATTGAAAATGTCGTTCTATTAAGTAATCAATTAAAAAGCATGATACGGTTTTTATTGACATTTTTTT\n>KI545835.1/844-926 Toxoplasma gondii VEG unlocalized apicoplast scaffold scaffold00504, whole genome shotgun sequence. 
\nGGATTGATGTCTGAGTGGTCAATAGAAATAGACTGTAAATCTATAGAAGTTATTCTTCATCGGTTCAAATCCGATTCAATTCA\n>KQ435742.1/1845933-1846233 Melipona quadrifasciata isolate 0111107301 unplaced genomic scaffold scaffold54, whole genome shotgun sequence. \nGAGTTCCCTCGAGTAACGCGGCGGAGCCACAATCGGAGTTCTCAGTGACTCTCAATGCTCTGAGGAAAGTCCCTGGACCTTGGACAGAAAGTGTTCGTAGCATCGCCGTTACTAGCCTCTCGTCGTCTTTCTCGAACTTGAGACAGGAAGCTTCGGCCGATCTTTTCGGGTTAGGACGAGAGTGTATTGGTCAGAGGAAAGTAATGCGTTTCAAATCAAAAAATTCTCTCTTTCAATCTCCCTTTGTGGAGAGAGAAACTGAGAATTTGTCCAACTAAACAGGGCTTACTACGAGGGAAAA\n>KE148148.1/1651271-1651071 Ophiostoma piceae UAMH 11346 chromosome Unknown scf03, whole genome shotgun sequence. \nTCAGCTCTCTTTGCCATGACGGCTTAGATCAAGTGTAGTATCTGTTCTTTTCAGTTTAACAGCTGAAAAAGCCTTACTGAGGCTCTTCTGTTACGCTAATTTTTGGCAACTTGGGCAGGGCGGTCGACTGAGCTCGTCTCGCGCGACCATCCGTCCACGGTGTCCCTGGTATTTCACTGCTTCCAGGCGACGCGAACCCAC\n>FR887668.1/64445-64618 Firmicutes bacterium CAG:41 genomic scaffold, scf118 \nAAGCAAGGTAGAGGTGCGCTTGTGTATTAGTATGTATACGGAGATATGCAATTATCTTTGATGTATACGGAAAGGACACAGTGCCGAAGTTTGAATATTATTGCGAATATTCATTCTGGGCATATCGTTAACAGCGGTATGACTGTCATCGTAAGGTGGGGAGCTATCGCTGTT\n>ASAF01228276.1/12168-11615 Nicotiana sylvestris Nsyl_contig228276, whole genome shotgun sequence. \nCATAAAAAAGTTTTGAATTCTTAATTAATTGTTTCCGATTCACCGGATCTTACCTCTTTTGAAAGGAGTCAATAAAAAGTCAAAATATGGATTAACTTAAACTAATTTAAAAATTAAATCGAANTCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGATGCAAGCGTTATCCGGAATGATTGGGCGTAAAGCGTCTGTAGGTGGCTTTTTAAGTCCGCCGTCAAATCCCAGGGCTCAACCCTGGACAGGCGGTGGAAACTACCAAGTTGGAGTACGGTAGGGGCATAGGGAATTTCCGGTGGAGCGGTGAAATGCGTAGAGATTGGAAAGAACACCAACGGCGAAAGCACTCTGCTGGGCCGACACTGACACTGAGAGAAGAAAGCTAGGGGAGCGAATGGGATTAGATACCCCAGTAGTCCTAGCCTTAAACGATGGATACTAGGCACTGTGCGTATCGACCCATGTAGTGCTGTAGCTAATGCNAGTGATAAAGGAGGTAGGGGTGCAGAGACAGCCAGGAGGTTTGCCTAGAAGCAGCCACCCTT\n>CP001097.1/1124998-1125215 Chlorobium limicola DSM 245, complete genome. 
\nATAAGTAATAACAGTTACGGTTTCCGGCGCCTGGAAGGGCGCCGGAATGAAAAGGGAACCCGGTGAAAATCCGGGACAGTGCCCGCTGCTGTGATCCCCCCGTCGGCATCTGCCGGCGGCGCGGTGCTTCCGAAAAGGCCACTGGTCCGCGCCTGCGGACCGGGAAGGCCGGAAGCATGGGGAGAGTCAGAAGACCTGCCGTAACGAAGTAATGCTTC\n>KK502588.1/105838-105391 Glossina austeni unplaced genomic scaffold Scaffold188, whole genome shotgun sequence. \nAGAAGAAAAGATAGGGAAGTGCTGGCTGCAGCCTACTGGGAAGATGGCCAAGGTCCGAATATAAGCGTGTAACACAGATTGATAGCTTTTTCTCAAATCAGCGGATTGTGGTGGATGATCGTTCTTAGTTCTTATTACAAAAAGATGTTTTAAGGGTTAAGGTGTTGAAGCTTTTATGGAATCTGTTTATAAAAGTGGAACCGTATCTGTTAGTTTGTGTTTTTATAGGAGAAAATAATGCGATTAAGCAATGACAGCTCTGTAGCGCCTTTATATGCCCTGGGCTGCACAATGAACGTATTAATATATATTCCCTAGACCTAGTGATCCGGATAAATCGCTGGACCACTTTCAGACTTGGAATTGTGAAATGAAACTGTTCATTTGGAACTTGGAATTCCCAGTAAGTGTGAGTCGTTAATTCACATTGATTGAGTCCATGCTCTTT\n>AFSB01210878.1/11034-11234 Heterocephalus glaber contig210878, whole genome shotgun sequence. \nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGTAGTATCAGAAACCAAACAAACCCCAAACAAGATGAAATCCATAACGAAAAACACAGTACTAAAACTGTCATTTACCAAAGATAAAAGGATGCATAAGAAAAGCAGTCAGAAATTTTTGTAAAAATTTTTGAGCTCACTGGGGATTTAGCTCAGTGGTTTGACCGCCT\n>MLAU01024954.1/4432-4362 Lupinus angustifolius cultivar Tanjil contig_24954, whole genome shotgun sequence. \nCTTTTTATGGTGAATTAGTGTCCCAATCGATTTAAGATTGAATAAAAATGGTTCGAACCCATTTGAGGGGA\n>AACT01006374.1/1536-1721 Ciona savignyi cont_6374, whole genome shotgun sequence. \nTGGTTTGTAATGTTGAGATTGATATATGAGTTTGCAAGAAAGCTGGCTATTTTGTTGGTTTTCGGAGAGCGAGGTAATGATTAAAAGAGACAGACGGGGGCATTCGTACTGTGCCGTTAGAGGTGAAATTCTTTGGATCGGCTCAAGACAAACGACTCGAAAGCATTAGCCAAGAATGTTTTCTTT\n>CH990426.1/969-1 Drosophila simulans chrU_M_6102 genomic scaffold, whole genome shotgun sequence. 
\nTTAGGGTATTTCCGGGGGGGTTTTTTAATGGGATTAAAATTTGTTTTTTTTCTTATGTTCTTCTTATTAAAAACCTGCATTGGGGTTTTTAAACGAGTGTTTTTTTGGGGCGGGTATTTTTCTTTTGAACAAATTAGAGTGTTTAAAGCAGGTTTCAAATGCCTGAATATTTTGTGCATGGGGATAATGAAATAAGACTTCTGGTTTGTTTTCATTGGGTTTTCAGATCAAGAGGTAATGATTAATAGAAGCAGTTTGGGGGCATTAGTATTACGACGCGAGAGGTGAAATTCTTGGACCGTCGTAAGACTAATTTAAGCGAAAGCATTTGCCAAAGATGTTTTCATTAATCAAGAACGAAAGTTAGAGGTTCGAAGGCGATCAGATACCGCCCTAGTTCTAACCATAAACGATGCCAGCTAGCAATTGGGTGTAGCTACTTTTATGGCTCTCTCAGCCGCTTCCCGGGAAACCAAAGCTTTTGGGCTCCGGGGGAAGTATGGTTGCAAAGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGAAAACTTACCAGGTCCGAACATAAGTGTGTAAGACAGATTGATAGCTCTTTCTCGAATCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTCGTGGAGTGATTTGTCTGGTTAATTCCGATAACGAACGAGACTCAAATATATTAAATAGATATCTTCAGGATTATGGTGCTGAAGCTTATGTAGCCTTCATTCATGGTGGCAGTAAAATGTTTATTGTGTTTGAATGTGTTTATGTAAGTGGAGCCGTACCTGTTGGTTTGTCCCATTATAAGGACACTAGCTTCTTAAATGGACAAATTGCGTCTAGCAATAATGAGATTGAGCAATAACAGGTCTGTGATGCCCTTAGATGTCCTGGGCTGCACGCGCGCTACGAATCCACCA\n>CP000682.1/2154080-2154188 Metallosphaera sedula DSM 5348, complete genome. \nGCCGGGGTGCCCGAGCGGACCAAGGGGGTAGGCTCGAGACCTTTCCAGCGTTAAAGCGTGCGACCTACTGTCTCTCCGAGACACGCGGGTTCAAATCCCGCCCCCGGCG\n>CBUU010045831.1/1-300 Eimeria praecox, Houghton, WGS project CBUU01000000 data, contig: Eph_scaff15802_1 \nGAGCAATGCGGAAGACACAGTGAGGTGGGGAGTTTGGCTGAGGCGGCACATTTGTGAAACAATAGCGCAGGTGTTTTAAGGCAAGCTCAATGAGAAGAGAAATCTCATGTTTACCAGAAGGGGAAAAGCTTGCTTGATTTTGATTTTCAGTACGAATACAAACTGTGAAAGCATGACCTATCGATCCTTTAGGTCTGAGAAGCTTTCAGTTAGAGGTGGCAGAAAGGTTACCACAGGTATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGG\n>KB016908.1/814362-814466 Camelus ferus unplaced genomic scaffold scaffold638, whole genome shotgun sequence. \nATTTCAAAAAATTATCCCCAGGAGGGCTCTGGACCCCTCGGCATTGTATCTTCAGTACCGGCAGCTTGCAGTCCACCAGTTCAATCCTCAAGCGCCAGAACACGG\n>JQBS01000032.1/75904-76076 Carnobacterium divergens DSM 20623 NODE_75, whole genome shotgun sequence. 
\nATAAAAAATAGAGGTGCAACAATTATCAGTAATTAGTTGGAGGTTTGACAAAACCTGTGAAGACTAGTGAAAGGAATTTTTGCCGAAACAAAAAACTGTCATCTTTTTGTTGGGTCTTAGGTTGAATAAGCCGAGAACTGTCGCTTATCTTTAAGCGTTGCGCTATCTTACTG\n>CM000839.2/46388956-46388601 Glycine max cultivar Williams 82 chromosome 6, whole genome shotgun sequence. \nCATTAGAGCATTAAGAAGACATTTCCCTAGTACAAGAATATTGGGAAGGACTCACCTTCGGTGTGCCAGTTATCGTGCCCAGCCACGGTAAACGTTGGGTTGCCAAGTGTGGAGTAGATAATTGCTGAAAGCATCTAAGTAGTAACCCTAAGGTGAGTGCTTTCATATTTCAACTTCCCCAAAGCCTCCGGTAGCACAACTGAGATAGTGATGGGTTCTCTGGCCCAACAGGGATGAAGTGAAATTTTTTAAAGAATTCAAGAGAAGGTCACAGTGAGATGAGTTGTTGCTAATTAATGATAGGTGTCAAATAGAAATGCAATGATGTATGTATCTGAGGCATCCTAACAAACCGT\n>ALWZ040783527.1/524-606 Picea glauca, whole genome shotgun sequence. \nTATGGCATAGGATGTTATATCTTATTCTACACACTGAAATTACCGTGTAGATAACTATACACCTCTGACAAGCTGATGCCAAC\n>AAYZ01665444.1/416-340 Ochotona princeps cont2.665443, whole genome shotgun sequence. \nTGCTCTGATGACACAGGTAGCAAATAGGAAGTGCCGTCAGAGCGAGAACTGACGATCCTGGAGACGCGTGTCTGAGC\n>AFYH01197597.1/1946-2009 Latimeria chalumnae contig197597, whole genome shotgun sequence. \nTACACTTTAGTGAAGGCTATATAGAAAACCTTTCAAAGGCATATGTAGTCTGATGTTGTGTGTA\n>MHXH01000017.1/67050-63467 Parcubacteria group bacterium RIFCSPLOWO2_01_FULL_48_18 rifcsplowo2_01_scaffold_382, whole genome shotgun sequence. 
\nGGGCATATGGTGGATGCCTTGACTTGAGAAGGCGATGAAGGACGTGGCGTGGCTGCGATAAGCTTCGGGGAGGCGCTTAGCAACCTATGATCCGGAGATTTCCGAATGGGGAACCCCCGCCGTGCAAACCACGGCGAGCCGTGCTTTGCACAGAAATCCGAAGTACGAAATACGAAATCCGAAACAAAAAGCTTCGAATTTCGATATTCGAATTTCGAGTTTCCGCGCAGAGCGCGGCGGCGTACCCGCTGAATTGAAACATCTTAGTAAGCGGAGGAAAAGAAACCAACATTCAGCTCTACGCTGTGCTAACTAAGTTACCTGCTCAATTTTTTGGATTTGGAGAATAAAAAAAGAGGACCGTCGCGCGCGGCGGTCCCAGAACTCAAGCACCCCGAGGACAGAAGTCAAGCAAGGGATGCTGATAGTATTATAGCATGCTGGTAGGTTTTGTCAAGAGTCCAAAAATTTGAGCAGGTATAAGGTTGGAACAGTGTTCTACTGAATCATTCCCTTAGTAGCGGCGAGCGAAAAGGGAGGAGCCTAGAGCTCGGGTGTGCAGCATCGGGAAGCTTCAAATTTCAAAGTCCATATTTCTATTTTTTTCGCGAAGCATATTTCAAATTATTTCAGAAATATGTGGAAATATATAGAAACTCAGAAATATGCGGACATATTTTGTCATTTGGAATTTCCGCTGCTGTGCATCTGGGCAGTTGTAAGATAGTAACGTCTTCCTGATTTATCAGAGAGGGGGGGTGTAAGTAAGACTTCGTTAGTAGAACAACTTGGAAAAGTTGGCCAAAGAGGGTGATAGCCCCGTATGCGAAAACGGTCTTATAACCCCAGTTATTATCGACTCTTTAGAGTCGGAGCTATGATATTTTTACATGTCGTAGTTTCTTGAGTACTTCGACGACAGAAAGCGTCGGAGGAAACCGCGAGTACTATCTCGCAAGGCTAAATACTTCTCAAGATCGATAGTGAACAAGTACCGCGAGGGAAAGGTGAAAAGTAGCCCTATTAGGGCAGTGAAATAGTACCTGAAACCATATGCTTACAAGGAACCGAGGCTGAGCATCTCACTGTCGTGAGATGCGGAATATAGAATCTTGAATTTTGAATTTGGAATGATTATTCCAAATTCTCCCGCCAATCTCCGAAGGGCGAAGCCCTAGGCAAGATTGGCGAGGATCCCGTACTGTCCGCGATGAAGATAGGACAAAATCTTCATTCGGAGATTGGCGGGACCCTAGCCAACTGTAGCCGCTCTCCCGCTTTCAGCGGGATCGCGGACAGTTGCGGGACAACTTCTTCCGCCAAAGGCGGATCCGCCTCAGGCGGAAAATTCTGCACCGAACGAGAGTGAGGTGCTTGGTGACGGTGTGCCTATTGAAGAATGAGCCAACGACTTTATCTATGTTGCAAAGTCTAATCCCGAAAAGGGAGAAGGCGCAGGGAAACCGAGTGTTAAAAGCGCGTTACTTTAGCTCGATAGCTTTTTAGCTCAACAGCTCGTTAGTTTTCTATCGAGCTAACGAGCTAATCGGCTAACGAGCTTAAGTTAGCAGCATGGATAAGACCCGAAACCAGATGAGCTTGCCATGGCCAGGATGAACGCCGGGTAACACCGTCGGGAGGTCCGAACCGGTGGGTTGTGCAAAACCCTCGGATGAGCTGTGGTAAGGAGTGAAAAGCTAATCGAATCTGGTAATAGCTGGTTCTCCCCGAAATCGCTTTAGGGCTAGCGGCGTTTTATGTCATGCCGGAGGTAGAGCTACTGGATGATCCTCAAAGGGCGAAAGCTCGGATGATCAATCAAACTCCGAATGCCGGCAGGATTACAACGCTAGTTAGACCGTGGGGGCTAAGCTCCATGGTCGAGAGGGAAACAGCCCAGATCGCCGTCTAAGGTCCCTAAATTCTTGCTAAGTGTAAAAGGTAGTAATCAGCCGAAGACAGGTAGGAGGTTGGCTTAGAGGTAGCCATCCTTTAAAG
AGTGTGTAACAACTCACTATCATATCGGCCGCATCTCACTAAGGCGAGATACTTGAATGACCAATTTCTAATTGACCTAATTTCTAATAAATTTCCAATACCCAATTTCGGAATTCGGTTACTGGGATTTATTTAGAAATTAGAAGTTAGGATTTAGAAATTTGAGCACCGAACTTTAGTGAGGTGCGGTTGATTGGCTGGTTGCGCCGAAAATGTACCGGGGCTAAGCAAGATACCGAAGACGCGAATTACCTGCTCAAATTTTTGGACTAATAAAATAATAAAAAAGAGGCCACCCATTGACGAATGACCCCTGACCTGACTCGTGGAAGTTCTTGTTAGACGACTATGGTCGTAACGACCGCGACGATCACCCAAGAGCCGTAGATGAGTGTTCCTTTCATGGGTTCAACTCTCCACGCTTCGATCATGCGGCTTTCCGTAGCTCATGATCATTGAGATCGTTATCGCCCCAAAGACTAATGCCGAAACAAGTGAAGAAGTCGGTTCCACGACAAGCTCCTTGATTGAGGGTTCGTTGCAATTATAGCATAAAGTTAAGTTTTTTGTCGAGAGTCCAAAAATTTGAGCAGGTAGTGGTAGGGGAGCATTTTGTGCGCAGCGAAGGTTGACCCGCGAGGGCGACTGGAGCGCACAGAAGAGAGAATGTTGGCATGAGTAACCAACAATGCCGATGAGAAATCGGCACTCCGTAAGCCCAAGGTTTCCGTGGCAATGGCAATCAACCACGGGTGAGGCGGTCCTAAGCCGATGGCGAAAGCCGAAGGTGATGGACAGACGGTTAATATTCCGTCCCACCGATACTATTTCGATGGAGCGACGGTTGAAATAAGGCCGGGCGTCTTAATGGTTTGACGCTGTTTGCTTGAAGGAATGTTGGACAGGCAAATCCGTTCAACTGTCTTTTATGGCAAATTCCGAAAGCAGACGAAAGTTTTGGTTTTTACCAGGGCAATCCGGCTGAAGAGCGATCCAAGAAAAACTTCTAGAGTTAATAGTATTGGTTCCGTACCGCAATCCGACACTGGTGGGCGGGGCGAGTAGCCCAAGGAGAACGAGTGAGTCCTCGTTAAGGAACTCGGCAAAAAAGCGGCCGTAAGTTAGCGATAAGGCCTTCCCGAGCACCGCAAGGTGCGAGGGACGCAGCGAAAGTTTGCCTGGCGACTGTTTATCAAAAACACAGCTCCCTGCTAACTCGTAAGAGGATGTATAGGGGGTGACGCCTGACCGATGCGAGAAGGTTAAACGATGGGGGTCGTATGCATCTCACTAAGGCGAGATACTTGAATGACCAATTTCTAATTGACCTAATTTCTAATAAATTTCCAATACCCAATTTCGGAATTCGGTTACTGGGATTTATTTAGAAATTAGAAGTTAGGATTTAGAAATTTGAGCACCGAACTTTAGTGAGGTGTGTACGGCTCACTGTTGTAAGCCCTCGTCAATGTCAGCGATAACTATAATCGTTCTAAGGTAGCGCAATTCCTTTCCGGGTAAGTTCCGGAGCGCACGAAAGGCGTAACGACTGGGCAACTGTCTCAACGAGGAGCTCGGTGAAAATG\n>ABRO02033478.1/54894-54660 Dipodomys ordii contig_33478, whole genome shotgun sequence. 
\nGCTGGGCGCTGTGGTGCGCCTGTAATCCCAGCTATTCGGAAGGCTGAGTCCAAGAGTTCTGGGCTACAGTGCGCTATGCCGATCGGGTGTCCACACTAAGTTCAGCATCAATATGGTGACCTCCCGGGAGCGGGGAACACCAGGTTGCCTAAGGAGGGGTGAACCGGCCCAGGTCAGAATTGTGACTGTGGTTCTGACATAGGAATAGACAGGTAGAACAATGAAACAGACTAGT\n>ABGB01001252.1/615-1121 Enterocytozoon bieneusi H348 ctg01_717, whole genome shotgun sequence. \nCATTAGGTTGATTCTGCCTAACGTAGATGCTAGTCTCTGAGATTAAGCCATGCATGTCAGTGAAGCCTTACGGCGGAACGGCGAACGGCTCAGTAATGTTGCGGTAATTTGGTCTCTGTGTGTAAACTAACCACGGTAACCTGTGGCTAAAAGCGGAGAATAAGGCGCAACCCTATCAGCTTGTTGGTAGTGTAAAGGACTACCAAGGCCATGACGGGTAACGGGAAATCAGGGTTTGATTCCGGAGAGGGAGCCTGAGAGATGGCTCCCACGTCCAAGGACGGCAGCAGGCGCGAAACTTGTCCACTCCTTACGGGGGAGACAGTCATGAGACGTGAGTATAAGACCTGAGTGTAAAGACCTTAGGGTGAAGCAATTGGAGGGCAAGCTTTGGTGCCAGCAGCCGCGGTAACTCCAACTCCAAGAGTGTCTATGGTGGATGCTGCAGTTAAAGGGTCCGTAGTCGTGAATGCAATTAAATGTCGTTGTTCAATAGCGATGATTGCT\n>KV453914.1/432734-432532 Candida tanzawaensis NRRL Y-17324 unplaced genomic scaffold CANTAscaffold_6, whole genome shotgun sequence. \nATCATCAGTAGTGGTTATACTATATCTAATATATATAACTATTATTTCATAAAGATCTTGGATGGAGGCATGCATATCATAGATGTGTGCAGGCTGACCATTTAACTACCCATAGCTAAGCATTCGTTGACCTAACTAACAATTGGGCCACAACGAGTGTTTCGTTTCGGTCTTTTAGATTATTACGTTTGTTGACGGCATTC\n>CM000034.3/40324702-40324549 Canis lupus familiaris chromosome 34, whole genome shotgun sequence. \nAGCTTTACGCAGTGGCAGCATCATAGCCAATGAGGTTTATCTGAGGCACGATTATTGCTAATTAAAATATGGAGGCAACATCTCAAATTCCACCCTGGTTCATTCAACTTTCTGGAGACATCTAGCTTTTTAGCAATCAGATCATGCTATTCTG\n>JYDM01000907.1/879-1 Trichinella sp. T8 scaffold908s, whole genome shotgun sequence. 
\nGTATCATTCCTGGGGGAAGTGGCGCGGAAGGAAGGTTACCAGGTCATGATAGAGCCTAAGGTGTCAACCCCGGTCGGCGCGCTCAAGCCCGACCTCCTTCTCATCAAAGCCGACACTGCATTCATTGTGGATGTAGGCATTGCGTGGGAAGGTGGACGCCCACTAAAGCTGGTCAACAAAATGAAATGTGACAAGTACAAGATTGCCATCCCGGCAATTTTGGAAACATTTCACGTTGGCCATGCTGAGACGTACGGCGTTATTCTGGGCAGCCGCGGATGCTGGCTCAAGAGCAACGACAAGGCGTTGGCATCAATTGGGCTCAATATCACACGGAAGATGAAAGAACACCTGAGCTGGTTGACGTTTGAAAACACCATCCGAATTTATAACTCATTCATGAAGAACTGAGGTTTTTGTTTTCTTTTACCTTTTACCATTTTTTATTGTTACATTGTTGTTATTTGCTTTAATCCTGCATTTTACCGTCGGCAATTCCATCGTTATTATTACTGTTATTGTTATTATTATTACTATTGTTATTACTTTTACTTACTATTGTTATTACGATTTATTTCGTATACTTACGTTATTGTTACTACTACTTACTTTGCTCTCGCAAACGTTCGTTGTTGTTACTTTTGGACCAGGTTTAGAGAAATCGCACGCACAGCGGAACTGGACCGCTTAAGCCAGAAACAGTAAAGTAACAATAGCCAAATGCCTCGTCATCTAATTAGTGACGCGTATGAATGGATCAACAAGATTCCTTCTGTCCCTATCTACTATCTAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAAAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCTGACTCTGTGAA\n>MEUW01000021.1/52640-49699 Candidate division WWE3 bacterium RBG_19FT_COMBO_53_11 rbg_19ft_combo_scaffold_7, whole genome shotgun sequence. 
\nAAGAAGGTCTTTTTATAAGGTAGATGAAGGATGCCTTGGGGCAAAGGGCCGATGAAGGACGTACTAGGCTGCGATAAGCCTCGGTGAGCTGCCACGAAGCGTTATTAACCGGGGATTTCCGAATGGGGTAACCCAATCCGTAAGGATTACGCTTAAGCCAAGTTCCTGCCTTTTGGCGGGATAGTAACTTAAGTGAGGGAACTCAGCGAAGTGAAACATCTCAGTAACTGAAGGAAAAGAAAGAGAAGCGCTTTATGCGCGGGTTCCCTAAGGACTCTCGCGATTTATTTCGCGGGAAACCTTGGGGAATCTTCGATCCTCCGAGTAGCGGCGAGCGAAAGGGGGGAAGCCTAAACTCCGGCGCAAGCCGGAGGGTTGCAGGACCTGCATTAGGAAAATTATTGGTAGGAGAATGCCCTGGAAAGGGCGGCCATAGAGGGTGAAAGCCCCGTAACTTAAACTGGTAATTTTCTGGCGGGAATCCTAAGTATCACGAGAAAAGTGAAAGCTTGTGAGAATCGAGCCAAACCACTGGCTAAGGCTAAATACTCTTTGCCACCGATAGTGAACAAGTACCGTGAGGGAAAGGTGAAAAGAACCCCGGTAAGGGGAGTGAAATAGAATCTGAAATCATCTACTTACAAGCAGACGGAGCCCGCAAGGGTGACGTCGTGCCTATTGAAGAATGACCCGAGGAGTTATCGCCAGCAGCAAGGTTAATCGCGTCAAACGCGGCGAGCCGTAGCGAAAGCAAGTCCTAAATGGGCGAATAGTTGCTGGTGGTAGACCCGAAACCTGGTGAGCTAGCCATGGGCAGGATGAAAGCCGACGAGAGTCGGCTGGAGGTCCGAACCGATGTGCGTTGCAATGCGCTCGGATGACCTGTGGTTAGGGGCAATATACCAATCGAACCAGGTGATAGCTGGCTCTCCCCGAAATGTATTTAGGTACAGCCTTGCAAAGTAACGAAGGGGGTAGAGATACTGGAAGGAATGCCGAGCCCGCAAGGGTATCGCTTCCTACCAAACTCCGAATACCTTCGCGAAATTTGCAGGAGTGAGCAGGCGGGAGCAAGTTCCGTCGTGCTAAAGGGAAACAGCCCAGATCATCGGTTAAGGTCCCTAAGTTGGATTTAAGTGGGAAAGGCAGTGGAATTTCTTAGACATCCAGAAGGTAGGCTTAGAAGCAGCCATCCTTGAAAGAGTGCGTAACAGCTCACTGGTTGAGAAATTCTGCGCCGAAAATGTAACGGGGCTCAAAATCCACACCGAAACCGTGAACTCGCCGCAAGGCGAGTGGTAGGGGAGCGTCGCCACAGCAGTGAAGCTGGATCGTAAGGTCCGGTGGAGCGGTGGCGAGTGAGAATCTCGGGATGAGTAACGTTTGGCGGTGAGAATCCGCCTCGCCGGAAGTTCAAGGTTTCCTCCGCTCTGGTCGTCATCGGAGGGTTAGTCGGTCCTAAGCCGAGGTCGAAAGACGTAGGCGATGGGCAGGGCGTTAATATTCGCCCACTTCCGTCCGGTTCGATGGGGTAACGTTTTCCAAAGTTGCGAGCGTCCGCATGGTTGGGCGTTCGGCGCACCAAGGTGCTTTGTTGGCAAATCCGCAAGGCATAAGCCAAGGTGTGACGGGGAGTCCCGTAAGGGACAACTCGTGAGGCTGGAGAACCAAGAAAAACCTCTAAGTTATGCCGGACGGGATCCGTACCGCAAACCGACACAGGTGAACTAGGTGAGTAGCCTAAGGCGAGCGGGATAACGTTCTTTGAGGAATTCGGCAAGTTGGCCCCGTAAGTTCGCAAGAAGGGGTGCCCCGACTTAAACGTCGGGGTCGCAGCAACAAGGCTCAAGCGACTGTTTAACAAAAACACAGGTCTCCGCTCAACCCGTAAGGGGATGTATGGGGGCTGAAGCCTGCCCAGTGTCCGTCGGTTAAGGAGAGGTCTGAGATTATTTCAAGGATCGAACCTAAGCCCGGATGAACGGCAGCAGTAACTAT
AACTGTTTTAAAGTAGCGAAGTTCCTTGTCGGGTAAGTTCCGACCCGCATGAAAGGCTTCACGACTTGAGCACTCTCTTAAAGAATGACCCGGTGAAATTGAAATGGCCGTGAAGATGCGGCCTACCCACAGCAGGACAAAAAGACCCCGTGGAGCTTTACTGTAGCTTGACATTGGTTTGATGATCGGATTTGTGTAGCGTAGGAGGGAGCCGCAAGGCGCCAATGAAACACCTCTCGATTTGATCCTCAAATCTTACTTAGGCGGTTAACCCGTCTGGGAACAGTGTCTGGTGGGCAGTTTAACTGGGGCGGTTGCCTCGCAAAGAGTAACCGAGGCGCCCCAAGGTCGGCTTAGTCTCGATGGACACGAGACTGTAAGTGCAAAGACATATGCCGGCTTGACTGCGAGACCAACAAGTCGAGCAGGTGCGAAAGCAGGGCTTAGTGACCTGTTCACTTCGAGTGGCGGAGTGAACAACATCGGACAAAAGCTACCCCGGGGATAACAGGCTGATCTCCTCCAAGAGTCCATATCGACGAGGAGGTTTGGCACCTCGATGTCGGCTCGTCCTATCCTGGGGCTGAAGAAGGTCCCAAGGGTTTGGCTGTTCGCCAATTAAAAGGGCACGCGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGACTCTATCCGCTGTGGGCGTTTAGCTTTTGAGGGGATTTCTCTCTAGTACGAGAGGACCGAGAGGAGCCAACCTCTGGTGTACCGGTTGTCCTACCAAGGGCATAAGATATGCCGGGTAGCTATGTTGGTAAGGGATAAGCGCTGAAAGCATCTAAGCACGAAGCCCACCCCAAGATGAAAAGCAGACCCCTTGTAGACTATAAGGTTGATAGACGGCAGGTGGAAGCGCAGTAATGCGTTAAGCCGAGCCGCACTAATAGGTCGTTTGATCTTCTTTT\n>APMT01169783.1/38025-37737 Mesocricetus auratus contig169783, whole genome shotgun sequence. \nAGATGTGAGGGCAATCTGGCTGTGGCATCTGCCATCTCATGAATCACCAGGGTTGATTTGGCTGATCTAGCTGGCTAGGCTGGTGTCCTTTGTCTCCCTCACCATGCTTTGTGCATCCCTCCTAAGGCTGCACACTCAGTCAAAAAGGACAACCTTCCCCAACTAGAGAAAGACCTATCTTCAGTTAAGAATATACTAGTAGCTGTGTTCCCCTGATAGAACTTCAAACAAGCTCTCAAGGAACTACTTAAGTGGGGCCAGTAAGAACTTCGGTGCATGTAACTCAGTT\n>JJRN01037118.1/15094-15301 Fulmarus glacialis contig37118, whole genome shotgun sequence. \nAATCCAGTGAAGGATTCACTGAAGGAAACTGCTTCAAATCCTGGATTCAAGCAAATTAGGAAGTTTGAACAAGGAAAAGACCTATAGGTGAGTTCAGATCTTCAGATTACCCCAAAATACCTTTTGTTCTAAGTTAGCTTACCTAGAGTTAAAACCTTGCTCTGCTTTCTATTTTTGCTCAAACTGACGTATCAGCAGAAGGTGTGGG\n>JJRE01079984.1/1-608 Phoenicopterus ruber ruber contig79984, whole genome shotgun sequence. 
\nTTTTCATTAATCAAGAACGAAAGTCAGAGGTTCGAAGACGATCAGATACCATCGTAGTTCCGACCATAAACGATGCCGACTGGCGATCCGGCGGGGGTATTTCCATGACCCGCCGGGCAGCTCCCGGGAAACCCAAGTCTTTTGGTTCCGGGGGGAGTATGGTTGCAAAGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGAAACCTCACCCGGCCCGGACACGGACAGGATTGACAGATTGAGAGCTCTTTCTCGATTCCGTGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGGTTAATTCCGATAACGAATTAAGCGCGCCCTCCCTCCATTCCCTCCGCTGCGCGGTGGAGGTTTTGGACTTGCGACCTCAGATCAGACGTGGCGACCTGCTGAATTTAAGCATATTAGTCAGTGGAGGAAAAGAAACTAACGAGGATTCCCTCAGTAACGGCGAGTGAAGAGGGAAGAGCCCAGCGCCGAATCCCCGCCCCACGGTGGGGCACGGGACATGTGGCGTACAGAAGCCCCCCTCCCCAGCGGCGCTCTCGGGGGACAC\n>JXUM01141515.1/11783-11841 Aedes albopictus isolate Foshan contig141515, whole genome shotgun sequence. \nTAGCCTAGTGGTTAAGGCTATGGATTGCCAATCCGGAGACGGCGGGTTCGATTCCCGAT\n>JH836770.1/104900-105236 Erinaceus europaeus unplaced genomic scaffold scaffold01482, whole genome shotgun sequence \nGGATGTGAGGACAATCTGGCTGTGACATCTGTCATCCCATTGATTGCCAGGGTTGATTCAGCCTATCTGGCTGGCTGGGCAGGTGTCCCCTCCTCCCTCACCTCCCTCACCGCTCCACGTGCATCACTCCTTTGAAGAGGACAGCCTTCCCAAATAGAGATGGACCAGTCTTCGGTCTAGGGTATACAAATAGCTGCGCTCCCCTGCTAGAACCTCCAAACAAGCTCTCAAAATTGTCAAACCCTTAGTCAGACTTACTAGAAAAGGGCGGTGGGCTAGAAGATACAAATATATAGAACTGTAAACAATAGAGGAGATACTGCCCTCCTTACTAGTT\n>CP003597.1/1039739-1039660 Chroococcidiopsis thermalis PCC 7203, complete genome. \nATCGTTCATCTCTCTTAAAAACACTCTTCACCGGATGCTGAGAGAGACGGAAGTAAGGAAATATCCAGAAGGAACGCACG\n>APGL01003207.1/3249-3375 Dendroctonus ponderosae Seq01003220, whole genome shotgun sequence. \nTGAGGGGTTTTTAGTGGGTAGGCAGCCCCACGGGACTGAATCCCACATAACCTAGCCGACAATGAACATCGTCGGCACAAAATCCAGCACAACATCGGCTGGGTATCTTTGGAAGATTTTCCCCTCA\n>KK198759.1/5784749-5784536 Eucalyptus grandis cultivar BRASUZ1 unplaced genomic scaffold scaffold_7, whole genome shotgun sequence. 
\nTAGCGACTGTTTATTAAAAACACAGGACTCTGCTAGGTGGTAACAGGATGTATAGAGTCTGACACCTGCCAGGTGCTGGAAGGTCGGAAGGAGAAGTGTTATAAGCTTTGAATGGAAGCCCCAGTAAACGGCGGCAGTAACTCTAACTGTCCTCTTTTCTTATTTATTTGACTCTATTTGAAGTATATTTCTTGCATCTTTTTTGTAATTATTA\n>KB317698.1/876973-877093 Rhizoctonia solani AG-1 IA unplaced genomic scaffold scaffold3, whole genome shotgun sequence. \nGTCCTCTTCGGAGTGACATATACAAAAATTGGAACGATACAGAGAAGATTAGCATGGCCCCTGCACAAGGATGACACGCTAGTTCAGAGTGGACGGTCTACGGACCGCAATATTTATTTTT\n>MJEQ01005272.1/36510-37593 Nicotiana attenuata strain UT scaffold05272, whole genome shotgun sequence. \nTACCTGGTTGGTCGTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCTATGCATGTGTAAGTATGACCAAATTCAGAATGTGAAACTGCGAATGGCTCATTAAATACGTTATAGATTGTTTGCTGGTATCTACTACTCGGATAACCGTAGTAATTCTAGAGCTAATACGTGCAACAAACCTGACTTCTGGAAGGGTTGCATTTATTAGATAAAAGGTCGACGCGGGCTCTGCCTGTTGCTGCGATGATTCATGATAAATCGACGGATCGTACGGCCATTGTGGCGGCGACGCATCATTCAAATTTCTGCCCTTTCAACTTTCGATGGTAGGATAATGGCCTACTATTAGACCCTAACTCTCTTTCATCGGGCGTGGCACGCCTATGGCAAGAATTTGGGTGTGATTGCCTTGTCATTGGCCTATGTGCGTGCGAAACGATCATGCGGACGATGGACAAGATATTGTCATTGAGGGCTGTTGTGGGCAAGTATTGGCCAAGGCCTTGGGACAGGCAAGGCGCGCTTTTCAAAGGCTTGACAAAGCAGCGTGGGCAATGTTAGGGCGGCATGGCACGACATGCACGCCAAAGTCAGTGGAACGACACTTTGGGTTGTGGCAGCTAAGTGCGGGCTAAGCTAAGGCAAGGCGAAAATGCGGGATGATGGCAAAGGCTTTCAATAGCTAAGGCAAGGCTTGTGAAGGAAAATACAAGCAATGGCACGAGGGAAATGAAGGTTGACATGGACAAGGCAGAAACTAAGCCAAGGCAGTGCGCGGGCGGCAGCGACGTCGGGCGTGTGTGGCCAAATCATGGCAGCAGGTTGCGGGCAAGTCATTGGCGCAGAGCAATGTCAAATTGAGCTAAGGCTTGGCACAAAGCAAGCCTTAGGCGTGATTCAGCTGGCCAAGTGAAGATGGCACATGCAATGCACATGAAAAGCAGTTTTGGTGGTTACCTTGTCAGTAACCTCTTTGTCCCATGACTGNCGCGACGTCGCGAGAAGTCCATTGAACCTTATCATTTAGAGGAAGGAGAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTG\n>CP001848.1/3411853-3411422 Pirellula staleyi DSM 6068, complete genome. 
\nGGAGTTGGGCAGACGACCGCTGGCTGCCATTTGGCAGCGAGAGGAAAGTCCGGGCTCCACAGGACAGGGTGGTCGATAACGTCGACCGGTCGTGAGATCAGGGACAGTGCCACAGAAAACAGACCGCCGCTGCGGGCATGAGCCCCCGTCAAGGTTTGATTGTCTGCATGCGGTAAGGGTGAAACGGTGCGGTAAGAGCGCACCAGCAGTCGAGGCGACTCGGCTGGCTAGGTAAACCCCGCCCGGAGCAAGACCAAGCAGAGAGCATGTTGTCGGTGTCACAGCCGACAGCCGGAATCGGTTCGGTTTCGTATGACTCTCGGGTAGGTTGCCGGAGCTAGCGAGCAATTGCTAGCCTAGAGAAATGGTCGTCAGACGTTTTCGATCCGTCGAAGACGCCAACAGAACCCGGCTTATTGCCTGACTCCGAAA\n>APMT01097187.1/1014-904 Mesocricetus auratus contig097187, whole genome shotgun sequence. \nGTGCTTGATTCAGCAGCACATATGTTAAAAATTGGAACAAGACACAAAAGATTAGCATGACCTCTGTGCAAGAAAGTATCCAAGGGGGCTGGAGAGATGGCTCAGAGGTTA\n>GG697144.2/1-676 Mitsuokella multacida DSM 20544 genomic scaffold Scfld3, whole genome shotgun sequence. \nAGGCTACGAAAGCGGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAATGCTAGGTGTAGGAGGTATCGACCCCTCCTGTGCCGGAGTTAACGCAATAAGCATTCCGCCTGGGGAGTACGGCCGCAAGGCTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGTATGTGGTTTAATTCGACGCAACGCGAAGAACCTTACCAGGGCTTGACATTGAGTGAAAGGGCTAGAGATAGTCCCCTCTCTTCGGAGACACGAAAACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATCCTTTGTTGCCAGCACATAATGGTGGGAACTCAAAGGAGACTGCCGCGGACAACGCGGAGGAAGGCGGGGATGACGTCAAGTCATCATGCCCCTTATGTCCTGGGCNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNCCCATTGCGGAAGATTCCCCACTGCTGCCTCCCGTAGGAGTCTGGACCGTGTCTCAGTTCCAATGTGGCCGTTCATCCTCTCAGACCGGCTACTGATCGTCGCCTTG\n>CP000270.1/1720642-1720704 Burkholderia xenovorans LB400 chromosome 1, complete sequence. \nCCGTCTCTCAGGTTCTAGCACGGCCCTCGGAATGGCTAGAACTTTTGGGTATACGGATTTAAT\n>KX552040.1/184526-184806 Kaumoebavirus isolate Sc, complete genome. \nCCGAGTCTCAGATTAAAGCTGAGGCTAGTTACGCATTAATGAAAAATGCTAGCTACATTCGTAAATTGCGGGAAAATCTCACGATTAATAACACCATTAGCAGCTTGAGAAAGTTGCTGAGAACCTCAGGGAAACTTGAGAACAACGGTAAAAGATTATTAATAGAGACAATCCGCAGCCAAGCTTGTGAAGAAATATCTACACAAGAAGGTTCAGAGACTTTATACGAATGGGCGGTTCTACCGCTTAAGATAAAGTCCATGCCCCACTGTGAAGTGGAT\n>LVLJ01001741.1/199221-199340 Marchantia polymorpha subsp. 
polymorpha scaffold2490, whole genome shotgun sequence. \nATCTTTGCGCTTGGGGCAATGACGCAGTTCATGAGGTGAAACCGCGTCAATTGCTGGTTGAAAACTATTTCCATAAACCCAAAATGTTCTGTGGATTGAATTTAAGTAAAATGCGTGCTT\n>CYZX01000004.1/41603-41740 Clostridium disporicum strain 2789STDY5834856 genome assembly, contig: SCcontig000004 \nTAGTTTTGTGTTTTCTAGTGTGTAAAAGTCTAAGGAATTTTCTATGACTTTTACGCCTGAATGTTTATCATTCACAGGGCAGTAATTGAAAAGTTATTGTCTCCACGTATTTTGGGAAGGAAAATAAGTAGATTTAAT\n>JPGV01000050.1/11129-10707 Chlorobium sp. GBChlB GB_Chlorobi_Contig_4394, whole genome shotgun sequence. \nAAGCTGCGCGGCGGCGGTCGCTGCTCCGACAGGTCGGAGCAGAGGAAAGTCCGAACATCACAGGGCTGGGCGCCGGACAAGGTTTTGTCGGCAACGATGAAACACAAGTTCGGGCGGGCGAAAGCAATTTCGCTCGACAGATAGCGCAACAGAAAGCAAACCGTCTCGACGCAAGTTGGGATAAGGGTGAAACGGCGGTGTAAGAGACCACCAGTTAACGCAGTAATGCGTTAAGCTCGGCAAGCCTCCCCGATGCAAGACTATGTAGGAAAACTTTTTCCGCGAGGAAAAAAGAGTTGCCCGCTCAATTCATGCGCTTTCGGGCGCGGGAGAGTTTTCGGGTGAGTCGCATAGATAAATGACTGCCTCTCGTTCAAGCACTTGAGCGGGAAACAGAATTCGGCTTACAAGCGCGGCTTCATT\n>CM001455.1/27997587-27997665 Oreochromis niloticus linkage group LG12, whole genome shotgun sequence. \nGGCCTGCAAAATCCAATCACCACCTCCTCGCGGTGTCGGCTGGAAACAAGATCCTCTGGAACTTGGCTAACGGTGATGG\n>APLE01000910.1/95410-95331 Erythranthe guttata cultivar DUN x IM62 scaffold_7_contig_2, whole genome shotgun sequence. \nGCCTGTGATGATGCTTTATTCAAGAAATGCATTTATGCATTCATGTTGAAAACTCCATTTTGACTAGGACGGTCTGAGGC\n>JZQY01000031.1/173164-173396 Nitrospira sp. OLB3 UZ03_NOB00100CONTIG000031, whole genome shotgun sequence. \nGCGTCCCGGTAACGGGACCGTGGGTTCGAATCCCACCCTCTCCGCCATACTAGTGTGTTCGACCTCCGGCCGGTCTCGTAAGAATGTGGCGGCGGAGTCCGCCGTCGATGGTGATAGGGGCCGGGCCCTGTGCAACAGAACTCTGTGAACCCCGCCAGGTCCGGAAGGAAGCAACGGTAAGCGGTCCGTTCTGTGTGCCGCAGGATCACCTGGCCCCGCTAATTCTGGGACGT\n>CM000401.2/17156931-17157025 Equus caballus chromosome 25, whole genome shotgun sequence. \nTATGGAATCGCTGGATCATATAGTGGATGTATATTTTGAGAAATTGCCAAACTTTTTTCCAAAGTGCTTGTACTATTTCACATTTCACTAGCAAT\n>CM001002.2/3260960-3260256 Mus musculus chromosome 9, GRC primary reference assembly. 
\nGAGGGGTGTGGGTACAAAACTGAATCTTAAAGGAATTGATGGAAGTGCACCACTAGGAGTGGAGTCTGCAGCTTATTTTTGACTCAAAATGGGAAACCTCACCTGGCCTGGATATGGACAGCATTGACAAGATTGTTAGCTCTTTCTCAATACCATAGATGGTGGTTCATGGTAATTCTTGGTGGAGTAATTTCTCTGGTTAATTCTGATGAGAAATGAGATTCTGTCATGCTAACAAGTTATGAGACACCCACACACACACACAAGCAGTCAGCATCCTCCAATATTTTGAGGGACAAGTGGCATTCAGCTGCCTGATGTTGAACAATTACAGGTGCATGATGCTGTTAGATATCTTGAGCTGCACACCCATGACACTGACTGTCTCAGCATGTGCCTACCTTATGCTGACAGGCATGGGTAACCCGTTGAACTCCATTCATGCTGGGTGGATAGGGGATGGCAATTTTCCGTACGAATGAGGAATTCTCAGTAAATGTCAGTCAATAGATTGTGTTGACCAAGTCCCTGCCCTTTGTACACACTGCCCATCCCTACTACCGATTGGATGGTTTAGAGAGGCCCTCAGATCGACCCCACCAGGTTGGCACCTGGCCTGATCAGAAATTTGAGAAGATGGTTGAACTTGACTACCTACAGGAAGTAAAAGTCATAAGAAGGTTTCTGTAGGTGAACCTGCAGAAG\n>JH836513.1/219899-219725 Erinaceus europaeus unplaced genomic scaffold scaffold01225, whole genome shotgun sequence \nAAGACTGTACTTTCAGGGATCATTTCTATAGTTTGTTACTGCTTCCTTCTATGGTATCTAAATACAAACTTCTGTAAGAGCAGGAATTTTTCCTGTTTTAGCAAGCTTTAGTCCCAAGAATAGCAGACAGTAGTTTGCACATACCTTTTAAAAATGAATAAGGGATATTTTCTAA\n>DS562880.1/7595309-7595616 Cavia porcellus supercont2_25 genomic scaffold, whole genome shotgun sequence. 
\nAAATGCTGTATTAGCTGGCTATGGCTTCTGTCACCCCACTGATTGTCATGGCTGATTCTGCTGATCTGTCTAGGTGGGTGACCCCTTCCTCCTTCTCCCTCGCTGCTCCATGTGTATCTCTCCTGAAGCTATGTACTCAGTGGAAGAGAAAGATCATCACTGATAGAAGAGGACACTTTCCTCAGTCAAAGGTATACAAGTAGCTGTACTCCCCTACTAGAACTTCCAAAAAAGCTCTCAAAAAGTCATATACTTGCCAGGGTTACAGCTCAGCAGCAAGGCACCTGCCAGGCAAGCATGAGGTCCTG\n>CCCW010013542.1/2343-2238 Brassica napus, WGS project CCCW01000000 data, contig: 30646 \nAATCCGTGGTGTGGACATTCTCGCTGGAAAAACCTAAATCTAATCCACGTATCTTTGAAGGACTCTCCAGCCTTCTGCGAGAATGTGGAAATTTTGTTCCGAAGTT\n>Y11506.1/699-3910 Pamaria palmata 5.8S & 28S rRNA genes, ITS1, ITS2, IGS \nGGATCTCAAATCAGACAAGATGACCCGCTGAATTTAAGCATATAACTAAGCGGAGGAAAAGAAACTAACAAGGATTCCCCTAGTAGCGGCGAGCGAAGCGGGAACAGCCCAAGATGAAAATCCCTTCGGGGAGTTGTAGTCTGAGTGTCCTTGGGTGGGTCAGTGCGGGCAAGTCTTCTGGAATGAAGCGCCATGGAGGGTGAGAGCCCCGTCCATCCCGCACAGGATCCATTCGTACAAGGACGCTTCAACCGAGTCGGGTAGCTTGGGAATGCTGCTCTAATTGGTGGTAAATCTCATCAAAGGCTAAATAGTGGTGGGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGATGGAAAGAACTTTGAAAAGAGAGTGAAAAGCACTTGAAACCGTCACGGGGGAAGCGGATTGCGTGAGTGATGGTGTCGCTTGTTCAGCGCTTTATTGCGTGCATTCTGGCGGCGCCGTGCCGGCGTGGCTGGCTGGACTGTGATTTTGACAGTCTCGGCTGGTGAGGGCTCCCTCGTATGAGGTGAGGACGCGGGCAAAATGACGCAATACGACCCGTCTTGAAACACGGACCAAGGAGTCTAGCACGGCTGCGAGTCGAAGAGTGATTAAACTCAAGGGCGCAGTGAAAGCGAAATTATAAGCAAATTGGGGAGGCGTTGCGTTTTTAACAAAATGTCCTACCTCGAGCATTTGTGCTGGGACCCGAAAGATGGTGAACTATGCCGGAGTAGGGCAAAGCCAGAGGAAACTCTGGTGGAGGCTCGTAGCGATGCTGACGTGCAAATCGCTCGTCGAACTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCTCTCAGGATAGCGGGCCGACACGCGTTTGTTGTTTTGTGCGGTAAAGCGAATGATTAGTGCATTTGGGGTACGAAGTACTTCGGGCGATTCTCAAACTTTAAATGCGCAAGGGGGTGGCTGCTTAATTGAGCCTACTCTTTGAAAAACGTCGGCCCTGTGGGCCACTTTTGGTAAGCAGAACTGGCGATAAGGGATGAACCTTAAGCGCGGTTAAGGCGCCTCATTACCCGCTTATAGACCCCACAAAAGGTGTTGATTCATATAGACAGCAGGACGGTGGCCATGGAAGTCGGAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATGAATTAGCCCTGAAAATGGATGGCGCTAAAGCGGGTAGCCGACACCGCGCCGTTCCGGCGAGACGAGGCCGGGATGAGTAGGAGGGCGTGGCGGTCAGTGAAGCAGGCTAGGGTGCAGACCCAGCTGAAACGGCCGCTAGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAGCGAGATCCTTGAAGGGCGAAGCGGGGAAGGGTTCC
ACGCAAACATTGATTGGGCGTGGGTGAGTCGTTCCTAAGCCGAGTGGCAATTGCTAAGTAGCGGCGAAAGGGAAGCGGGTTAAAATTCCCGCACACGGATATGGAGGCGGCGACGCAAGCAGAGGCGAATACGCTGGCCGAGGCGCTGGGCAGAGTTGTCTTTTCTGTTTGACCGGCATCGCGCCGTGTGGAATCCGCTTATCGGGAGAAACACGCGCGGGTATGGGCAGAGCGTCAAGTTTTTTTTGGCGTCCAGCTCGCCTCGGACGGCCCCTGAAAATTCGCCCGCGAACTTTAAAAATTTCATGCTGTGACGTACCGATATCCGCATCAGGTCCCCAAGGTGAACAGCCTCTGCTCAATATGAACAATGCAGGTAAGGGAAGTCGGCAAAATAGATCCGTAACTTTGGGAAAAGGGTTGGCTCTAGTGGGATGAAGGTCTTCAAAGGGGGCTTCGCTGTGCTTGGCGTCTGACGGGAGTGGCTAGCTTTCGGGCTGGATGCTTCTGTTGGATTCCTTGCGTGGGGGATGTTTCTCGCCTTCAGCATATCCCAGACTAGAACTGCAACGGGCAAAGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGAAGGCCGTGGCCGGTGTTGACGCAATGTGATTTCTGCTCAGTGCTCTGAATGTCAAAGTGAAGAGATTCAATCAAGCGCGGGTAAACAGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCTACTGTCCCTATCTGCTTCTAGCGAAACCACAGCCGAGGGAACGGGCTCGGCGGAATCGGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTATTCTAATTTTGTGAAGCAAGTTAGGAGGTGTAGAATAGGTGGGAGCTTCGGCAACCGTGAAATACCACTACTCTTAATCTTGCTTTACTTAGGGCGTGAGGCTGTACGGCCGCAAGGCTTGCTTATTGCATCAAGCGTGATTCGTTCGCGTGAACAGCGCGCCCAACACATTTAGGAGGGGAGTTTGGCTGGGGCGGCACATCTTCTACAAGACAACGAAGGTGTCCAAAGATAAGCTCAGTGAGAACAGAAATCTCACGTAGCGCAAAAGGGTAAAAGCTTGTTTGATTTTGATTTTCAGTGTGAGTTGAAAACGCGAAAGCGTGGCCTATCGATCCTTTCACGATTCGAGATTTGAAGCGAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCGGCCAAGCGTTCATAGCGACGTCGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGCGAAGCAGAATTCGCCAAGTGTCGGATTGTTCACCCGCCAACAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTATCCTACCGATGAGTTGTTGCCGCGGCAGTAATATATGGCAGTACGAGAGGAACGCATATTTCACACCACTGGTTCATGCAGCTGCCTGAGCAGGCAGTGCTGCGAAGCTACCGTGTGAATGATCAGAATAGCTGAGAGAGTCTAAGCTAGGATCGGTTCTGCTCAGCGGCGACTTATTTGTATCCGCCTCGACACTGTGTACAGATAGCCTTCGGGCGAGCACCATTGGGCGTAAGCTTATCGTCGTGCGTTTTAGCGGATGTAAAATCACCTGCAGATGACTGGGTTGGGACTGGAGCGTGTACAGCGTTGAGAGATCTTGTTATCTCGATTCCTTGAGCGTATCTGAGTCCTTACGATTTGT\n>GL876983.1/220883-220724 Magnaporthe poae ATCC 64411 unplaced genomic scaffold supercont1.18, whole genome shotgun sequence. 
\nCACCGCCCGTCGCTACTACCGATTGAACGGCTCAGTGAGGCCTTCGGACTGGCCCAGGGAGGTGGGCAACTACCACCCAGGTGCCGGAAAGTTGTACGAACTCGGTCGTTTAGAGGAAGTAAAAGTCGTAACAAGGTCTCCGTTGGTGAACCAGCGGAGG\n>GL897030.1/4179803-4179625 Mustela putorius furo unplaced genomic scaffold scaffold00133, whole genome shotgun sequence. \nAGCTTTGTGTAGTGGCAGTATCGTAGCCAATGAGGTTTATCCAAGGTGCAATTATGGCTAATTGAAAATATTTTTACCAGGCCCCAAAGAAATCTTGTACCCATAAACAATCACTCCCCATCCCTCCCACAGACACTTATTGGCATGCAGAGTTTTTAGCTCCATATCCAAACAACATG\n>AFTD01079003.1/14897-14834 Cricetulus griseus cell line CHO-K1, whole genome shotgun sequence. \nTCTTGATGATGCACTTCCAATAGATCCTTCTGACCCTCCACTGTGGACTCTCCATTCCACAAGG\n>CM007654.1/638658-638533 Prunus persica cultivar Lovell chromosome G4, whole genome shotgun sequence. \nTACATAACGAGGGACAGTTTGTGTGTCTCTTGGATTGAGAAGAATAGCGAGGTAGAGTGAAAAGGCCGAGCCATCGTTTCGGTCGTCATTATTTGGATTGGCGATTCGATTGTTTCTCGTCCACAT\n>AASG02044696.1/921-990 Ricinus communis cultivar Hale ctg_1100012308131, whole genome shotgun sequence. \nCGACCCCAGGTCAGGCGGGATTACCCGCTGAGTTTAAGCATATCAATAAGCGGAGGAAAAGAAACTACCA\n>KB671965.1/368135-367938 Anopheles epiroticus strain epiroticus2 unplaced genomic scaffold supercont1.71, whole genome shotgun sequence. \nATCAATACAACTCTAGTAGCGTAAGGATGCGAGGTCTTTAGAAGTATAAAATAAGCTCGTCTTAGCTACTCCTATTTGTCACCATCGTACAGAGTGGTAACATATCTCCTAACACCTGAGCTTGGGTATAAGGAGAATTTCTTATAGAAGTGCCCGGTAAGGGCAAGCCAACTTAACTAAATGTTTCAAATGAGAGAA\n>URS0000D6A915_12908/1-80 unclassified sequences skipping-rope RNA \nATTAAATGAGGTGGACAATGGCATCCACGCACCTATATTGGTTAAAAGAGATGAAAGTACAGCCAGACTTTCCATTTAAT\n>FR902120.1/11240-11312 Clostridium sp. CAG:914 genomic scaffold, scf4 \nTTGATTGCTCAACCGCACGAAAAAGGTATATAAGTAGATTTTTCTCACCTTATAGGCGAGTCTTAAACAAAAT\n>CM000941.1/117493038-117492965 Anolis carolinensis chromosome 5, whole genome shotgun sequence. \nCGATGATGATGATGATGATGATGATGATGATGATGATGATATCATCATCATCATCATCATCATTATCTTTATTT\n>AAGD02001768.1/1-584 Caenorhabditis remanei strain PB4641 contig453.2, whole genome shotgun sequence. 
\nTCCGGACTCCAGGGATCCGAACGTCTAATTAAAACAGAAGTGACCAGATGGTCTTGCGGAAGTTGACTTACAGTGATTCTGCCCCAGTGCTCTGAATGTTAGCTCGTATTAATTAGAGTAAGCGCGGGTAAACTGCGGGAGAAACTATGACTCTCTTAAGGTAGCCAAAGGCATCGTCATTAAATTGTCACGCGCATGAATGGAATAACGAGATTCGTACTGTCCCTAACTACTATTTAGTGAAACCACAGCCAAGAGAACGGGCTTGGCTAAAGTAGCGGGTAAAGAAGACCCTGTTGAGCTTGACTCTGGTTTGACATTGTGAAGAGTCATGAGAGGCGTAGCATAGGTGGGAGACTTCGGTAGACAGTGAATTACCACCACTTTCATCGACTCTTTAATTATTGGGTTGAAAGAGAATACATCCGGCCCGTAGTAGGTCACGGACATAGATCTCGCTGAGATCTACATTTTGGTATATTTTTCAGGTCATAACACTGAGTTTGAAGCATTTACGAGCCGGCCCAGGTCGACCCGGTTTGCAAATATGTTTTGAACTAATTTTCAGAATCCAAATGAGCCGT\n>URS0000D6BD91_395494/1-79 Gallionella capsiferriformans ES-2 int-alpA RNA \nGCCGCACCTAGTCCGTGCTTAATTACCACGGGCGAAAGCACAGAAACCCTTGCTGTGTTGGTGCGGCTTCTATTCAGGG\n>AZRA01000138.1/15527-15395 Sphaerotilus natans subsp. natans DSM 6575 X805_138, whole genome shotgun sequence. \nCCGAAGGGTCGCTAGGGTTCCGAGGCCTACCATGCGGCAGGCCTGTCTGGTCCGAGAGCGACCGGCCTCAAGTGCCCGCGGCAGCTGCCGCGACGGCACTCAGGCTCCACGGCGGGACAAAAGCCCGGGAGGA\n>MJEQ01005736.1/39329-39916 Nicotiana attenuata strain UT scaffold05736, whole genome shotgun sequence. \nTTGTGTATTTTGTTAAGCAAAATCGTCTAAGTCATTTCCTAGGGTGGGAAAATCATTTTGGCCAGGGAATCGGGGAATTCTTTGTCTTGGCCATAGGGTTGGCTATTGTGTTCTTGTATTCACATATTAATACGAGTTGGGAAGAAATTCCTGTATATCGTGTGTGCCTTTTTACTGTTTATGCTGCCTATTTCGTTCTAAGTTTCAAACGTCCCTAAAATAAAACTAAGTGTTGGAAAGGCTGAAGTCAAGGCTGGGCTTGACTGCCGCACGGAGGTGAACCTCGAGTAGAAATTTGAGTGACATAAATCACCCCTGTGACACCTACCATGGTGGTGACGGGTGACGGAGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGTAGCAGGCGCGCAAATTACCCAATCCTGACACGGGGAGGTAGTGACAATAAATAACAATACCGGGCTCTATGAGTCTGGTAATTGGAATGAGTACAATCTAAATCCCTTAACGAGGATCCATTGGAGGTCAAGTCTGGTGCCAGCAGTCGCGGTAATTCCAGCTCCAATAGCGTATATT\n>MHFR01000003.1/41901-41805 Omnitrophica bacterium RIFCSPLOWO2_12_FULL_44_17 rifcsplowo2_12_scaffold_1117, whole genome shotgun sequence. 
\nCATGTAGTGTGGCGCAAATCGAAAGGTTAGGACGCAAAGCTTTAGAGCCTAAACCGACCGGGCAAAAACCCGGTAGGCATGGTTGTCAGTTGCCGAA\n>AF137379.1/97379-97053 Nephroselmis olivacea chloroplast DNA, complete genome. \nGGGGTTGTCATGGAATCGACGTCTCTTCTAAGAACGAAAGGTTAAAGCAGGTCGAGGTCGAAGATGGACTCGTACTCTCCACTTCATTGCTTGATTGCATGCTAATCAGATTCTTCCTTTCTCTCGCCGGGTAGCCGTTGCTGCTTAAGCGAGTTTCTAGTGCCACTTTGTCACTAGTTTGTATTATGAGTTTCACACTCACTTCAATGACGGTGATAGATACTACATATCACTCCTGCTTAGAGGGTCATCTAAGCTAAACCATGTGAATATAACCTTTCGGGCCTCGAGAGACGGAAGTGAGTTCAATTCTCACCAACTCCACCA\n>FO117623.1/2019842-2020021 Blastococcus saxobsidens DD2 complete genome \nGACCGAACACCGCCTAATCACCGCGCGGCGTGCAGTCCCGGCGCCCGGGGTGTACCGGGGACCCACCGCAGTTCTGGGGTGAGTTCTCCCGCGGCCGGCTCGCCGGTGCGTGGGGGATAGGGCCAGTCTTCCCAGCCCGAACCCGTCAGCTAACTCGGTCGGCGGTAGCTGAGGAAGAAA\n>JH971392.1/893535-893437 Agaricus bisporus var. burnettii JB137-S8 unplaced genomic scaffold AGABI1scaffold_8, whole genome shotgun sequence. \nCCTATCTGATGATACAAGCGCAATCGCATAGTTCACGCTGAATCAAAAGTGTTGACAATCATGCATCTTTACGTCTTTCGCTCCTATCTGACTCATCTC\n>AZIM01000372.1/334250-333937 Ophiophagus hannah scaffold373.1, whole genome shotgun sequence. \nGGATGTGAGGGTGATCTGTCTGTGACATCTGTCACCCCATTGATACCACAGTTAATTCAGTTGATCTGGCTAGCTAGGCAGGTGTCCCCTTCCTCCGTTACCACTCCATTTTTATTTTTCCATGAACTGTGTGCTCATGGAAGAGACAACTAATTTAGGGAGGAGTGTATCAATCTTTAGGCAAGGGTATGATATCCGTGCTCACCTTCTAGAACCGACAAACAAACCTTTTCCTCCATCCATTTGCCTGTTCGTTTCCCAGGCTTGAGATATAACAATGCATCTCAATGGCTTTGTTTGATCAGCAGTGCTTG\n>CAJI01046266.1/316-1 Cucumis melo, WGS project CAJI01000000 data, contig: 46266 \nAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTGAAGCGCGCGACCTATACCCGGCCGTCGGGGCAAGAGCCAGGCCCCGATGAGTAGGAGGGCGCGGCGGTCGCTGCAAAACCTTGGGCGTGAGCCCGGGCGGAGCGGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTTGAAGGCCGAAGAGGGGAAAGGTTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAGGAGACGGGGGAAACCCGTCTGATAGCGCGAC\n>CP013111.1/5040245-5040340 Bordetella sp. N genome. 
\nACGCTTGAGGAGCGTTGCGACGGATCATTCCGCCAGGCTCAAGCATTCCAGGGTATGCCGCGTTCGCGCGGCACCATGAAACGGCGCTCACCTTAG\n>LFJF01027493.1/1808-5852 Macrostomum lignano unitig_27548, whole genome shotgun sequence. \nTGACCTCGGATCAGACGTGATTACCCGCTGAAATTTAAGCATATTATTAAGCGGAGGAAAAGAAACTAACAAGGATTCCCTAGTAACGGGCGAGTGAACGGGAAGAGCCCAACACCGAATCCCTTGGCGCAAGTCAACGGGGAAATGTGGTGTTAAGGTAGCCCTTCGTGTCAGTCTAGGCGTCTCAAGTCCACCTGATTTGTGTGCTCAAGCCCAGAGAGGGTGTAAGGCCCCGTAGAGACGCTCCGACTGATTCCTGGGGTGTTTACCTACGAGTCGCTTGTTTGGGAATGCAGGCCAAAGCGGGTGGTAAACTCCATCCAAGGCTAAATCTGGCACTGAGTCCGATAGCGGACAAAGTCCGATAGGCGGACAAGTACCGTGAGGGAAAAGTTTGAAAGAACTTTGAAGAGAGAGTTCAATAGTACGTGAAACCGCTTAGAGGTTAAACAACGGACGGATGGAGCTCATAACTGGCCTGAGCTTCAATCAACTGTGACGGTGGCTGGACGAGGCTGGAGCGAGTTCGGATCTCTTCTTTTGGGACGGGCAGATCTGCTCTTTTGGTGACGCTCGGCGTTCGGTTGGCTATCAGCTCCTGACATCGGTGCCAATCTTGTCCCTTGGTGGCCTTCCGCCACGACCACGACACTGGCTACCCGCGGCTGGGGTAAGGTGACAAACTGCTTCGGCAATTTTGTGTATAGACCCGCGGCGTCGTCGGACATGGTTTTGGCCAGGACGTCGAGCTTGGCGGCGCCCGCTCCTTGTGTGGCTCGCATGTTTGGCTATAGCTTGGCTGCCGCCGATGCTTGCACTGGACAACCAGTACAGGTGGACGGTTGTGGTCTATGTCTCTAGTTGGCCTCTGCGAGTTTGGCGCCTTATAGTCTGTGGTGTACTTGTGGGTAGACTATCCGACCCGTCTTGAAACACGGACCAAGAGTCTAACATCTGCGCTGAGTCATGGGGATTTCCTACACGACCAAGTGTGCGCGCGAGTCATGGGGGGATTCTACGAAACCAAAGGCGCAGTTGAAAGTAAAGGCCTGCTTCTCGTAGGCTGAGGGTGGGATCTCGTGCATTCGCGAATTGGCGAGCGCACCAACCGGGCCCGTTCCTATCTGTCTCTGTCAGTGGGGCGGCGCAAGAGCGTACACGTTGGGACCCGAAAGATGGTGAACTATGCTTGCGCAGCTCGAAGTCAGTGGAAAACACTGATGGAGGAGCGCAGCGTTTCTGACGTGCAAATCGATCGTCAAACGTGAGTATAGGGCGAAAGACTAATCGAACCATCTAGTAGCTGTTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGCACTCGGGAAACAGTTTTATCCGGTAAAGCGATGATTAGAGGCATTGGGGTCGAAACGACCTCGACCTATTCTCAAAACTTTAAAAATGGTAAGATGCTCGTCTCGCTTTAATTGGAGGCGGGCTTCACCTCTCTATAAACGTGAATGTGAGTGCCCAGTGGGCCATTTTTGGTAAAGCAGAACTGGCGCTGTGGGATGAACCAAAACGCGCGGTTAAGGCGCCAATGCGGACGCTCATTGAGACACCACAAAAGGTGTTGGTCGATATACTGACAAGCAGGACGGTTCGGCCATGCGAAGTCGGAACCCGCTAAGGAGTGGTAAGCAACTGCACCTGCCGAATCAACAGCCCTGAAAATGGATGGCGCTGGAGCGTCGGGCCTATACCGTGCCGTTGGCAGGCGAAGCAGACAAATAATCTGTGTGGATGTCCCCAAACGAAGTAGGAGGGTCGCCGTGGTGAGCGCA
GAAGGTGCGGCCGTGAGGCCGGCTGGAGCCGCCACGGGCGCAGATCTTGGTGTAGTAGCAATTACTCAAGTGTGAGAACCTTTTGAGGACTGAAGTGGAGAAGGGTTCCATGTGAACAGCAGTTGAACATGGGTCAGGCGGTCCTAAGCGATCTCGGTAACTCCGTACACTAGACGAGGGTGACAACTATCACTTGAACTAATACTGTGAAGTGTTATAGCCCTCCGGAGCGAAAGGGAATCGTGTTAATATTTCACGACCCTTACCGTGGAGATCGCCCCTTTCGGGGGGCAAGTGCGGTAACGCAAACGAACACAGAGACGTCGGCTGGAGCCCCGGGAAGAGTTCTCTCTTTTCTTTGTAAGGAGCCGTACCCCCTGGAATCGGCTTGTCCGGAGATAGGGGCGTGGCTTCCGTAAAGGCAGCGCGCGGTCTTGCGCTGTCCGGTGCACTCTAGTCGGCCCTTGAAAATCTGTGGGAGACAGTGTGATTTTCACGGTAGGCCGTACCCATATCCGCAAGCATGCGTCTCCAAGTGAACAGCCTCTAGTCCTAGAACAATGTAGGTAAGGGAAGTCGGCAAAATGGATCCCGTAACTTCGGGCGAAAAGGATTGGCTCTGAGGGCTGGGGTCGGATGGGCTGGCGTAAGAAAGCTGTTCCGGTGGTGAGGACTGGGCGAGGCTTTCGGGCTTTACTCGGACCATGCCGAGACCAGGCAGTAGACGACGTCAGCTGTGCTTGTCGTGTTTCGGCGCGGCGCGGCAGCTTCGTCCGGCAACAAACAGCCAATCTCAGAACTGGCACGGACTAGGGGAATCCGACTGTCTAATTAAAACAAAGCATTATGCGATGGCTCGTGTGCTCGATGTTGACGCAAATGTGATTTCTGCCCAAGCTGCTCTGAATGTCAAAGTGAAGAAATTCAATCAAGCGCTGGGTAAACGGCGGGAGATAACTATGACTCTCTTAAGCGTAGCCAAATGCCTCGTCGTCATCTAATTAGTGACGCGCTTATGAAGGTGGGGTATTAACGAGATTCCACTGTCCTATCTAACTATCTAAGCGAAACCACAGCGCCAAGGGAACGGGCGCTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACCTTTGTGAAGAGACGCATGAAGAGGTGTAGTATAGGTGGGGAGCGTCAGCGACTTTGAAATACCATACTTTTAATCGTTCTTTACTTATTCAGTGAAGCGGGGGGGGGGAGCGGCCTTCACGGCACTCGTTTCTGCGGTGTTTAAACGGCTGGCCCTCGCGGCCGGCCGTGAACCTTGCTCTGAAGTACAGGTCAGGCGGGGGGAGTTTGACTGGGGCGTGTACATCTGTCAAAAGGTAACGCAGGCTGTCCAAGATGAGCTCAGTCAGGACCAGAAACCTGCGTAGAGCAAAAGGGCAAAAGCTCATTTGATTTTGATTTTCAGTACGAATACAGACGTGAAAGCGCGGCCTATACGCATCCCTTTGATTAATCAGAGTTGATGCAAGGCGGTGTTCAGAAAAGTATCCACAGGATAACTGGCTTTCTCACGCGTCTGCGAGTGCGATGGCGGGCAAGCGTCATAGCGACCGTCGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCAATTGTGAAGCAGAATTCACCAAGCGTTTGGATTTGTTCACCACCCAATAGGAACGGTGAGCTGGGTTTTAGACCGTCGTGAGACAGGTTAGTGTTTACCCTACTTGATGTCTTCGGTCGTTGCCTATGGTAATCCTGCTTAGCTACGAGGAGAACCGCAGGTTCAGACATTTTGGTTTATGTGCTTGGTCGAAAGACCAATGGTGCGAAGCTGACCAATCTTTGACGGCGATTTAAGACCTGAAAGCCTTCTTTAAGTCTTGAATCGCCGCCACGAAACGTGCAACGATACTATCGGTGCCCCTACGCCGGGAGGCAACGAATATACTCGGCCCGCAGAATCC
GATTTCGGCGGGCGAGCACTGGCTAAAGCACTCGATTACTGCGTGGCCACACCCGCTGTCTTTGTGAAATTTGCAGTCGGAGGCACAGACACGATTACCACTTGATATTGAGACGTTAGGGGTTTCTATAAATCGTTTGTTAGAGCGACTTAGATTCCGGTCGGGGTGCCGTACTTAGTTGAGCAGTTTCACTTGCGATGCTATTTGAGGGCCTAAGCCTTTTGACGGGGAGATATGT\n>LMNA01000001.1/561241-561047 Pseudorhodoferax sp. Leaf274 contig_1, whole genome shotgun sequence. \nCCGCCCGTCTTGGGGGAGTAGCCAGCCTTCGCTTTGTGCGAGAGGGGTTTGCGTCAACAGACTTGTTCGTGCCGTGCCTTGGTGTGCGGTCCGACATGGCGCAAACGGACCACCAGCAGCAGCCTGCAACGGGCGATGCCTTGCCGGGGTTCAAGCGAGACCTTTGACTGCGCAGCTTCTCGTGCCGGGAAGGCT\n>ALWZ043544869.1/1192-611 Picea glauca, whole genome shotgun sequence. \nGGTTTGGCATAATCAACAGAGAAAGAAGACCTTGTTGAGATTGACTCTAGTCCAACTTTGTGAAATGAATTGAGAGTTGTAGAATAAGTGGGAATCATTTTTGACACAAATGAAATACCACTACTTTTAACATTATTTTACTTATAATTTTGTGGGGCGAAGACGGGGCAGTTACCCTATTTTTGGCCTTAAGTCATGTTTCGATGGGTTGATATGGGCGGAAGACATTGTAGGTGGGGATTTTGGATGGGGAAACACATCTATTAAAAGATAACATAAAATATAATTTGTGTAGATAGAACATTTGTATTTGGGAGATCCTAGTGCACAACCACCCTTATTACCTTTCCCTCCTAATTTGTAGTTACATCCAATCATTTCTAAATTGAATCTAGTTTCCTCACTTGCACAATATGGATAGACGTGTGAACCCTATACATTATTAAATATTTCAAAACCCCTATCCATGAGCCTATGGTTACATACAAATGGGAAAAAAAAGGTGGATACAAAAATGACACCCATTCCTCCTCACAGTCCTCCCTAGGATCTTGTTGTATCTCATAATGTTGCACACTCCAT\n>ALWZ042080687.1/2737-2632 Picea glauca, whole genome shotgun sequence. \nGAAGAATCCTTTATAGACGACTTAAATATGTGACGGGGTATTGTAAGTGGTAGAGTGGCCTTTCTACCACAATCCACTAAGATTCATCCCTTTGTCGCCTCAATTT\n>ALWT01066045.1/576-1 Myotis davidii contig66045, whole genome shotgun sequence. 
\nTGGAGTCCAGGGGGCGTGGGAGGAACGGCCTCTCCAGCTCCCTTTGCTCCGCCGCCGCGTCCCACCGACCCGCCCCCCGAAGAAGCATCGGGACCGCTCAGATTTGCAGTCGGAGCCGCGTCCCGAGGGAGAGAAGGGGCGTGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAATGAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATGAACGAGATTCCCACTGTCCCTACCTACTATCCAGCGAAACCACAGCCAAGGGAACGGGCTTGGCGGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCTGGCACGGTGAAGAGACATGAGAGGTGTAGAATAAGTGGGAGGCCCCCGGCGCCCTTTCCCTCAGCCCCCTCTCGCGAGGGGGCGGGGAGGGGGGCACGCCGGCCTTGCGGGCCGCCGGTGAAATACCACTACTCTGATCGTTTTTTCACTGACCCGGTGAGGCGGGGGGGCGAGACCCGGGGGGGGGTGC\n>APMT01039647.1/25991-25874 Mesocricetus auratus contig039647, whole genome shotgun sequence. \nATGTTGTATCAGAGAGAATGTCAGCACTCTTCTTGCTAAGTATGAAAAGACCAATGAGCCTAACAGTGTACATTTAAGGCATTGATCCTTACAATGTGGCATCTAACCACTGTTTTTA\n>AKHW03004724.1/5683634-5683707 Alligator mississippiensis ScZkoYb_22, whole genome shotgun sequence. \nCAACAAGAAGATGAATGGTAGGCTGGTCACTTTCCTGGGAAGTAAGAGTCAGGAGTTCAAACCCCTCTAGTTGA\n>LGKD01319461.1/278-207 Octopus bimaculoides Scaffold40646_contig_8, whole genome shotgun sequence. \nTTACTGACCAAGTGGTTGTGAATGTGCTGCTAAATTGGACTTTCATATCACAGCCTGCTTGGATCAGTAACA\n>AACY023405062.1/1217-1321 Marine metagenome ctg_1101668212413, whole genome shotgun sequence. \nAAAGTCGGAATGGGTGTTGAAAGATTACCGACAAGATGAGGGAAACACGCAACCCTCGTTCGATGCGGGTAATTATTCCAACAGTTCCGCATCGATGCCGCTGCT\n>BDFN01000945.1/2677-5912 Ipomoea nil DNA, scaffold: scaffold0945, cultivar: Tokyo-kokei standard. 
\nCGACCCCAGGTCAGGCGGGATTACCCGCTGAGTTTAAGCATATCAATAAGCGGAGGAAAAGAAACTTACAAGGATTCCCCTAGTAACGGCGAGCGAACGGGAACAGCCCAGCCTTAGAATCGGACGGCCTTGCCGTTCGAATTGTAGTCTGGAGAAGCGTCCTCAGCGGCGGACCGGGCCCAAGTCCCCTGGAAAGGGGCGCCGGAGAGGGTGAGAGCCCCGTTGTGCCCGGACCCTGTCGCACCACGAGGCGCTGTCTACGAGTCGGGTTGTTTGGGAATGCAGCCCCAATCGGGCGGTGAATTCCGTCCAAGGCTAAATACGGGCGAGAGACCGATAGCGAACAAGTACCGCGAGGGAAAGATGAAAAGGACTTTGAAAAGAGAGTCAAAGAGTGCTTGAAATTGTCGGGAGGGAAGCGGATGGAGACCGGCGATGCGCCCGGTAGTATGTGGAACGGTGAGAGCCGGTCCGCCGATCTACTCGGGGCGCAGACCAGCGAGGATTCGGGGGCGGCCAAAGCCCGGGCCTTTGATACGCCCGCGGAACGTCGTCTCTCGGATCGTGGGAAGCAGCGCGCGCCCCTGGCGTGCCTCGGCACCTGCGCGCTCCGGTCGCTGGCCTGTGGGCTCTCCATTCGACCCGTCTTGAAACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAACGGGCGAGTAAACCCGTAAGGCGCAAGGAAGCTGATTGGCGGGATCCCCTCACGGGGGTGCACCGCCGACCGACCTTGATCTTTTGAGAAGGGTTCGAGTGCGAGCATACCTGTCGGGACCCGAAAGATGGTGAACTATGCCTGAGCGGGGCGAAGCCAGAGGAAACTCTGGTGGAGGCCCGCAGCGATACTGACGTGCAAATCGTTCGTCTGACTTGGGTATAGGGGCGAAAGACTAATCGAACCGTCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGAGCTGGCGCGAGAGTTCTATCGGGTAAAGCCAATGATTAGAGGCATCGGGGGCGTAACGCCCTCGACCTATTCTCAAACTTTAAATAGGTAGGACGGCGCGCGGCTGCTTCGTTGAGCCGCGCCACGGAATCAACAGCTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGGAAGCCGGGTTACGGTGCCCAACTGCGCGCTAACCTAGATCCCACAAAGGGTGTTGGTCGATTAAGACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTTAAGCGCGCGACCTATACCCGGCCGTCGGGGCAAGAGCTAGGCCCCGATGAGTAGGAGGGGCGCGGTCGCTGCAAAACCTTGGGCGTGAGCCCGGGCGGAGCGGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGGCCGAAGAGGGGAAAGGTTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGGGTCGGGGGAAGCCCGACAGACAGCGCGTTTTGCGCGTGCGCCGAAAGGGAATCGGGGTTAAAATTCCTGAACCGGGACGTGGCGGTTGACGGCAACGTTAGGGATTCCGGAGACGTCGGCGGGGGCCTCGGGAAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCCTGGAAACGGCTCAGCCGGAGGTAGGGTCCAGCGGCTGGAAGAGCACCGCACGTCGCGTGGTGTCCGGTGCGCCCCGGCGGCCCTTGAAAATCCGGAGGACCGAGTGCCGTCCACGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGGTGAACAGCCTCTGGCAATGGAACGCTGGCAAGGAACGGGCGGGCCTTCCCGGGCGTCGAACAGCCAACTCAGAACTGGTACGGACAAGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGTCCCTGCG
GATGCTAACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGGTAAACGGCGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTGTCTACTATCCAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAGAATCAGCGGGAAAAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGGATAAGTGGGAGCCGAAAGGCGAAAGTGAAATACCACTACTTTTAACGTTATTTTACTTATTCCGTGAATCGGAGGCGGGGCATTGCCCCTCTTTTTGGACCCAAGGCTCGCTTGCGGGCCGATCCGGGCGGAAGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACAGAAGGGTAAAAGCTCGTTTGATTCTGATTTCCAGTACGAATACGAACCGTGAAAGCGTGGCCTAACGATCCTTTAGACCTTCGGAATTCGAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGACAGTGTCGCAATAGTAATTCAACCTAGTACGAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTTTGCGGTTCGGATTATGACTGAACGCCTCTAAGTCAGAATCCGGGCTAGACCGACGCATGCGCTCGTCGCGTCCGTTTGGCCGACCCGCCAGTATGGGGGCCATTTGGCCCCCAAGGGGCACGTGGTCGTTGGGCTAAGCCGTCGTGGCGGAAAGGGGTCACGGTTGGGCCGCGCTTGAATATACAATTGCCGATCGAGCGGGGCGAGCTGAATCCTTTGCAGACGACTTAAATACGCGACGGGGTATTGTAAGGGGTAGAGTGGCCTTGCTGGCCACGATCCTCTGAGATTCAGCCCTTTGTCGCTCCGATTCGT\n>JARO02002307.1/4880-4968 Scleropages formosus scaffold2307, whole genome shotgun sequence. \nTTGAGTTTTCAGCTTTGAGAACTGAATTCCAAGGGTTTTTGGATCAAGCTTTGCCCGTGGGACTTAGTTCTTAAAACTGGATGCTCCTG\n>BABG01005904.1/1457-1294 Human gut metagenome DNA, contig sequence: In-R_005904. \nTATCGGACGGTGGTGATATTTTCTCGAAAAGTGCTGAAAATCAGGGTGGAGCGAACAGGACGTTCGCGACAGGCGGACGTTGCCATGGATGGCAACTGGAGCCGTGCCCGTGCGGATTAGAACCGATATCTCACTTTTCGTCAGAAAATTCCCACCGGGAGACC\n>MHKX01000006.1/12218-16044 Candidatus Liptonbacteria bacterium RIFCSPHIGHO2_01_FULL_57_28 rifcsphigho2_01_scaffold_11526, whole genome shotgun sequence. 
\nATGGTTGGCATTAAGGGCGCATGGTGGATGCCTAGACATCAAACGACGACGAAGGACGCAGCATAGCGGCGATACGCCACGGTGAGGTGCGGAGCAACCGTTGACCCGTGGATTTCCGAATGGGGCAACCCTGTTGAGTAAACCTCAACAACCTTCGCAAGAAGGAGTCACACCCGCTGAAGTAAAACATTTCAGTAAGCGGTGGAAACGAAAAAAAGTCCGCGCAAGCGGAAAAATTCCCCAAGTAGCGGCGAGCGAAACGGGAGAAGCCTAAACCACATGTTCGCAAGAATGCGTGGGGTTGTAAGGGAGGAACGCTATCACTTATAACCGAGAGCCGGGAGCGATCCCGGCATATCGGTTATGGGTGAAAAGGAGGAGTTACAAATTCATTTGCTAGCCGAAGCGTCCTGGAAAGGACCGCCAAAGTGGGTGATGGCCCCGTAGGCGAAAGCAGATGAACTTCTTAGTTTCTTTTCTTGAGTAGCTCGAGGTAAAACAGCTTCGAGTGAATCCGGGAGTACTATCTCCTAAGGCTAAATACGTTTGATGATCGATAGTGAACTAGTACCGTGAGGGAAAGGTTAAAAGCAGGCCGGTGAGGCCGTTGAAATAGATCCTGAAACCATGCGTTTACAAGGAACTGACGTCTTATGAGCCCGCCGCAAGGCAGGCCCCGGACTACAGTGTGCCTATTGAAGAATGAGCCAACGACTTTAGGTGTGCGGCAAGGATAAGTCCTCTCGGGGACGCATCCGTAGGGAAACCGAGTATTAACGTGCGATTTAGTCGTACACCTAAGACCCGAAGCCGGATGAGCTTGCCTTGGCCAGGTTGAACTCCGTAGAAATACGGAGGGAGGACCGAACCGGTAGGTTGTTCAACACCTTCGGATGAGCTGAGGTAAGGAGTGAAAAGCTAATCGAATTCGGTAATAGCTGGTTCTCTCCGAAACAGTTTTTGGACTGGCGGCGTAAAGTAGCGGGTGGGGGCTAAGCTCCATGTTCGCGAGGGAAAAAGCCCAGACCATCAATTAAGGTCCCCAAGTGCGTGCTAAGTGTAAAAGGCAGTGTTGTGCCATAGACAGATAGGAGGTTGGCTTAGAGGTAGCCACCCTTTAAAGAGTGTGTAACAACTCACTATTCGATCGGCACGGCGCGCCGAAAATGTATCGGGGCTAAGCACGCCACCGAAATTATGGGTTCGTATGTCCTTCGGGACGTATGAGCGGTAGGAGAGCATTCCCTTCTGCTGTGAAGCAGGACCCGCGAGGGCCTGTGGAGCGTAGGGAAGAGAGAATGTTGGCATGAGTAACCACAATCCCAATGAGAAATTGAGAGCCCGAAAATCCAAGGTTTCCGTGGCACTGGCAATCAACCACGGGTTAGGCGGTCCTAAGGCGATGGCGAAAGCCGCAGCTGATGGATAGCCGGTTAATATTCCGGCCCAGCCATGCGATCATAGCGAAGTGCGAAGGAAAAAGACGGGAGTGCCTTATTGGTTTGGCATTTATACTCCAAGGCGCAAGCCGGGAGCGTATGAATGTCCGGTTTTACCGGACAAACTTCCGAGAAGAGCCTTCCGAGAAAAGCTTCGTGAAAGCGAGCGCATGGTTTCCGTACCGTAAACCGACACTGGTGGGTGAGGCGAGAAGCCTCAGGGTAACGAGTGATTCATCTTTAAGGAACTCGGCAAAAAAGCGGCCGTACCTTCGGTATAAGGCCTGCCCATCGCAAGATGGGCCGCAGCGAAAGTCTCCCTGGCGACTGTTTACCAAAAACACAGCTCCCTGCAAACTCGCAAGAGGACGTATAGGGGGTGACACTTGACCGATGCGAGAAGGTTAAACTTGGCAGTGGTGTGCAGCAATGTGCATTGCCGACCGAGCGAAGCCCTCGTCAATGTCAGCGGTAACTATAACCGTTCTAAGGTAGCGCATTTCCTTTCCGGGTAAGTTCCGGAGCGCACGAAAAGTGTAACGACTGGGGAACTGTCTCA
AAGATGAGCTCGGTGAAATTGCGATTCCCGTGAAGACGCGGGATACCTGTAGCGGGACGAAAAGACCCCGGAAGCTTTACTGCAGCCTGGTATTGATTTCAGAGTTATGATGCGTAGCGTAGTGGCGAGCCTTTGAAGCGTCCCTTTCGGGGGACGTGGAGGCGACAATGAAACAGCCATCTTCATCACTTTGACGTCTCACCGGGGAGGGACCTTAAAATGGAAACCTCCCTGGGACAGTGCTTGGTGGGTAGTTTAAATGGGGCGTTTTCCTTAACTTGACAATGCTTCCGTGTTGTCAGAAGGGGGACCCGATCCAGTCTTAAGATTGGAGGGAAAAATCTAATGTATATGCTGGAACATCCGCGGTATCAGTTTGTACCTTTGTCGAAAAGGTGAAAATCAAACTGTGGCGTCCGATGAAAATCGGGCCGGCGGACAATCAGCAGGCAACCTCGACGTAAGAATTGAGGAAGTCCTCAGAGACTATCAGTTAGAGCGGCGCACTACCCGCGCGCCGTATGATATAGTCCGAACTGCATGGCGACATGCAGGCCGCGCAAGCGGCACCTAAATACCATGAGATCAAGAATCATTGAAGAGCTTAAGAAACATCTGAAGCTTACTGCAATGCAAAGATCTCTTCTCGTAGGCCTGCTTTTAGGCGATGGCCATCTGGAACTACAGAGTGGTGGCAGAGAATATCGTCTGAAAGTTGAACATGGAGTTAAGCAGAAGGATTATGTGGATTGGTTGTACGAACAATTCAAAGATTTTGTTCGTACGCCGCCGCGTATCAAGACCAGGATTGTAAAAGGAATAACGTGTAAGAGCTACGGCTTTACCACTTATTCCTACGGATCATTTCGTTTTTACGCCCAGCAATTCTACGTTGGGCGAAAGAAAGTGATCCCGAAACTGATCTCCAAAATGCTTGACCCTAGAGCGTTGGCAATATGGTTCATGGATGATGGATCTTTCAAGTCCGTCAGCCACAAGACCTATATAATCCATACGCATGGTTACGAGAAGAAAGATTTGGAGCGTGTAAAAGATGTGCTCCAAAAGAAATTCGGTATTATCGTAGGACTGCATAAGCAATATGATCGCTGGCGAATCTACATAATGAGTGATTCGGCAACGGCGTTCAGAAATCTTGTCAGTGCCCATGTAATACCGTCAATGCGGTATAAGTTAGGGAACATCAAGCCTAAAGAGTAACGGAGGAGTTTATTAAGGTTGGCTAGGCCCGGATGGAAACCGGGCGCGTCGTGTAAAGGCATATGCCAGCTTGACTGCAAGACCTACAAGTCGCGCAGGCGCGAAAGCGGAACTTAGTGACCCGACGATTCTTTATAGAAAGGTCGGAGACAACGGATAAAAGCTACTCCGGGGATAACAGGCTAGTCTGGTCCGAGCGTCCACAGCGACGACCAGGCTCGGCACCTCGATGTCGGCTCGCCCTAGCGCGGGGGTGAAGAAGCTCCCAAGCGTTTGGCTGTTCGCCAATTAAAAGGGCACGTGAGCTGGGTTCAGACCGTCGTGAGACAGGTTGGTCTCTATCTGTTACAGGCGTTTAATCACTTGAGGGGAGTTGACCCTAGTACGAGAGGACCGGGTTGAACATACCTCTGGTCTACCGGCTTTGGCACCTGCTGAAACGCCGGGTAGCTATGTACGGAAGGGATAAGTGCTGAAAGCATCTAAGCACGAAGCCCACCCCAAGATTAGGTGATATGGTCTCGTCGCAGACTACGACGTTGATAGGCTCTAGGTGTAAGGATCGCAAGGTCTTCAGCCAAGGAGTACTAATGACCCGCCAACCATCC\n>MDEO01000036.1/702348-702384 Mesorhizobium sp. UASWS1009 41, whole genome shotgun sequence. 
\nGGTCTCGCCGGAAGCGAGACCGCCGAACATGAAGGAG\n>MEQJ01000121.1/2993-1439 Bdellovibrionales bacterium RIFOXYD1_FULL_53_11 rifoxyd1_full_scaffold_587, whole genome shotgun sequence. \nAAACATGAGAGTTTGATCCTGGCTCAGAGCGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGTGAAAGGGGGCAACCCCGAGTAAAGTGGCGTACGGGTGAGTAACGCGTAGGTAATCTACCCTGGAGTTCGGAATAACCTGCCGAAAGGCGGGCTAATACCGGATAGAGCGAGGGAACCTGTAAGAGGGTTTTTCGGGAAAGGGAGCTCGCAAGAGCCCTTGCTCCGGGATGAGCCTGCGTCCCATTAGCTAGTTGGCGAGGTAACGGCTCACCAAGGCGATGATGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAAACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGACGGAAGTCTGACGCAGCGACGCCGCGTGAGTGAAGAAGGCCTTCGGGTTGTAAAGCTCTGTCACACGGGACGAACGGCGAGTGGGTTAACAGCCCATTTGATTGACGGTACCGTGGAAGGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTGCTCGGAATTATTGGGCGTAAAGGGCAAGTAGGTGGTCTCATTAGTCCGGGGTGAAAGCCTTGAGCTCAACTCAAGAAGTGCCTTGGAAACGGTGGGACTGGAGTCCTGGAGAGGGTCGTGGAATTCCCGGTGTAGCGGTGAAATGCGTAGAGATCGGGAGGAACACCAGAGGCGAAGGCGGCGGCCTGGACAGGAACTGACACTCAACTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGGGTACTAGACTTGGCGGGATTTGACCCCTGCCGAGTCGGAGCTAACGCGATAAGTACCCCGCCTGGGAAGTACGGTCGCAAGACTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGATCATGTGGTTCAATTCGAAGCAACGCGAAAAACCTTACCTGGGTTTGACATCCCCGGACAGCCGTAGAGATACGGTTTTTGTAGCAATACAACCGGGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTGGTGACATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTGTCCTTAGTTGCCAGCATTAAGTTGGGCTCTCTAAGGAGACTGCCGTGGTTAACACGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCTTTATGTCCAGGGCGACACACGTGATACAATGGCCGGTACAGAGGGAAGCGAAGTGGTGACACGGAGCCAATCTCAAAAAGCCGGTCTCAGTTCGGATTGGAGTCTGCAACTCGACTCCATGAAGGTGGAATCGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGAAGCTGACTCAACCAGAAGACGTCCAGGCTAACCGTAAGGGGGCCGGCGGCGAAGGTGGGGTTGGTGACTGGGGTGAAGTCGTAACAAGGTAGCCGTAGGGGAACCTGCGGCTGGATCACCTCCTTT\n>MNFI01000130.1/10369-10188 Gemmatimonadetes bacterium 13_1_40CM_4_65_7 13_1_40cm_4_scaffold_3525, whole genome shotgun sequence. 
\nCCGTCCTAGACTGATTCGGGATCCACGTTTGCGAACGGGGATTTACGGAAGCCGGTGCGAATCCGGCGCGGCCCCGCCACTGTAACGGGCTGTTCATCGCGGCTCAGAGCCACTGGGGAAACCTGGGAAGGCGAGCCGCGTAGCCCGAAGCCAGGAGACGTCTTCGTTCGCGCCACCAATCA\n>MLAY01000007.1/1262-1155 Marine bacterium AO1-C Bin2_contig__6B_len_915437_cov_89.8812_ID_11, whole genome shotgun sequence. \nGCCGGTGTGGCGAAAATGGTTTACGCAGCTCAAGTTAGTTTGATTTGCGGCCAAGGCCTTGGGAATCGTGGCCTGTAAGGCGTGGGGGTTCGAGTCCCTCCATCGGTA\n>ANKR01270450.1/11566-11419 Myotis brandtii contig270450, whole genome shotgun sequence. \nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGTAGTATCTGTTCTTATCAGTTTAAAATATTATCTATCTGCTGCAAAGCAAGCTGTCTAGAATGATATAACTAAGGTTATCTATAAAATAATGAGGAGTTTCAAAATAAAATATTT\n>DS022282.1/1685882-1685929 alpha proteobacterium HTCC2255 scf_1100007007381 genomic scaffold, whole genome shotgun sequence. \nTAAGGCTTACAACGGCTACCTGAAGTAAGTTGACATAAAAACGGAGCA\n>EU420138.1/1-299 Bat coronavirus 1A strain AFCD62, complete genome. \nGACTTAAAGATATAATCCATCTACAGATAGAGTGTACTCTTCTAGACTTTTGTCTACTCCCCTCAACTAAACGAAATTTTTGCCATATGTTTATGGCTAATTGAAATTTCAGTCGGTTGTTAACATACTTGCACAAGTGTCGTGCATGTCGCCAGTCCCTCCTTTCAGTTCCGTCTGTTAGGTATACTAGGTGGCTGCCTTTGGTTCAGTTCCGTCTGGCCATTGTGTGGATAGTACGTTCCGTCGTGCTTGAAACCGATAACTAGCAGGTATGTCGTCCAACCTTGTGACATTGGCCT\n>LSGP01000020.1/293217-293477 Anaerosporomusa subterraneum strain RU4 RU4_contig_5, whole genome shotgun sequence. \nGAAATGACGATGAACGGAACAGTAGTTACAGTCTGAGATAGTTTCAGAGAACTGGATTTGGTGTGAACCAGTACTATCTGCTGTCATGAATATCCTCCGTGAGTTGCACACCGAAGAATGTAGTAGGCTGTGCCGGGCCTCGATTGAGGAAACGCCACCCGTTATTGTGGCGAGGTATCGAGTGTAAACTCCGTACCGTTGAGAGACTATGGGCAACTATAGTAATTTGGGTGGTAGCGCGGATTAATCTCCGTCCCTTGT\n>MEWZ01000006.1/7057-6737 Candidatus Adlerbacteria bacterium RIFCSPLOWO2_01_FULL_54_21b rifcsplowo2_01_scaffold_18878, whole genome shotgun sequence. 
\nTGAGCGCGTTGAGTAGTAGCCCCGACGTAACGTCGGGGAGGAAAGTCCGAACACTCCCTCTGGAAAACTGGAGGAGAAAGGTAGCAGGTAACGCCTGTCGTGCGCTTTTTGCGGGCGCAAGAGGTGCGAACAGAGACGAGTCTTCGACAATTTAGGGTTTACCTTGAGTATGTCGAAGGGTGAAACGGCAAAATCCTTACCCGAGTGCAAGGCCGTGTCCCGAGAGTAATCGAAGGAAGTGCCGCTTGATCCCGACGGTGACGTCAGGACCAGATAAATTACTGCTCACGACAGAATTCGGCTTACAGACGCGCGCGCAGA\n>JANL01000037.1/68389-68165 Alkalibacterium sp. AK22 AUG3_contig_1, whole genome shotgun sequence. \nACTAAACTGGATCTTGAAACACGTTCATGATTGATGCTTTACAGAGAGTCAATGCAGGCTGAGAATTGACAAGCAAATATCATGGTCATCATTCAAGGAGTTAGAAGCTGAATGTAGTAGGTTTCTACGTCTATCCGCGTTAAGGATACAGAGGATAAGTAGAAAAGCTCTAGTGGGCTGATACTTTTCAAACTAAGGTGGTACCACGAAGATTTCGTCCTTTCG\n>LITN01000010.1/54782-54831 Bacillus sp. FJAT-21945 super19, whole genome shotgun sequence. \nGAGAGATTTGCTCCGCACAAATGTATACGATGAAGCATTGTGTCAGGAGC\n>JNFA01000019.1/339474-339242 Listeriaceae bacterium FSL A5-0281 contig000019, whole genome shotgun sequence. \nATAAAGACGTTGAAGGAGACAAGTAACGTTACCAAGTCATTGTTAGGGAGAGGTTACCTTAGACTGCAAGTAACCTTAGTGATACGTAATGCGAACATTTCAGCTCTGGAGTCGCTGTCGGGATTTTGTATAATGAAAGACAGATCGGTGTGAAGCCGTTATTGGAATGAAGTGGATAGCTTATTTAGCTGTCTATTAGGGTGGTACCGCGTGATTATAACCTCGTCCCTTTG\n>ABLF02007471.1/1-1768 Acyrthosiphon pisum strain LSR1 Contig7649, whole genome shotgun sequence. 
\nCATGGAAGTCGGATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAAGCAACTAGCTCTGAAAATGGATGGCGCTGGAGCGTCGTGCCTATACTCGGCCGTCGACGGCATAGTGGGGCCAGTCGTCGCTCGCGGCGGCCGGTCCCGGCAAGCCTCGACGAGTAGGATGGCGCGGCGGTGTGCGTCGAAGGGCAGGTCGCGAGACCGCCTGGAGCCGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATACTCGAGAGGGGCCCTCGGGGGCTGCCGTGGAGAAGGGTTTCTTGTGAACAGCCGTTGTCCAAGAGTCAGTCGATCCTAAGCCCGGGGAGAGATCCTCGTACCACGGGCGAAGGCGTTTTCGAATCGCCCTTGGGGCGAGAGGGAATCCGGTTCGTATTCCGGAACCCGACGCGGAACCGCTCCCTAGTGTTCGGGGCTCTTTTGTCTCGTCTGGGTAACCAGAATGAACTCGAAGAAGCCGCCGGGGGATCTGGGTAGAGTTCTCTTTTCTCTGTGAGCGTTGTACGTCCCTGGAATCCTCTAGCCGGGCGATAGGGACGCGAGCGCGAAGAGCACCGCTCGTTGCGGCGGTGTCCGTGATCCCCACGCGGACCTTGAAAATTCGAGAGAGGGCCACGCGGAGTCTTCGCGTCGGTTCGTACCGATATCCGCAGCAGGTCTCCGAGGTGAGCAGCCTCTAGCCGCATAGAATAATGTAGGTAAGGGAAGTCGGCAAAACCGATCCGTAACTTCGGGATAAGGATTGGCTCTGAGGAGCGTGGCTGCCGGGTTCGGGTCGTCGTAGAAGCGTAGGCGTTTTTGGCGACACCCCGGCCGTCGCCCGTGCGCCCGGTCTTCGGAACGGGAGCCTCGAGGCGGCCGCGGGCCCGTCGCCGTCCGCCGACCGTGGAACCACCGAGCTTCGGTCGCTGGCCGCGTCGCGGCCGGCCGACCGCCTTGGTGTCGGTTCGCCGTCACCGGGCGGTCCGGCCGCCGCGCCGTCGGTCGCGTAGCCGGATCGACAGCCATGTAACGGTCAACTCAGAACTGGCACGGACCAGGGGAATCCGACTGTCTAATTAAAACAAAGCATCGCGATGGCCCGGGACGGGTGTTGACGCGATGTGATTTCTGCCCAGTGCTCTGAATGTCAACGTGAAGAAATTCAAGCAAGCGCGGGTAAACGGCAGGAGTAACTATGACTCTTTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCTCACTGTCCCTATCTACTAGCGTTGCGACAACAGCGACATAGTTCAGACGTGTGTTTCCACGTTCGACGTTGCTCCGAAGGGCGATCCTAGTGGTGATAACTGGCGATTAACTTAACTTCGAAAGTTTACAGGAATTTTTTCAAAAAAGTGTTCAAAAAGTTTTGGTATAGTGCATAGTGCAATCTAAGTCGGGTTTCACGGAAGTTCGCTTAGCCGTTCGTGGTTAAAAGCCGAAAGGCCACTTTTACGTGTTACAGGATAGGACCTTACCGTAAGTGGAGGGGAGAGCTCCGGTCGGCAGTCACGTACACCGAGCAATTCCTGGAATCGGCCGCCCGTCTGGAAATTCGCGACACGTGTAAGTGCGTATCACTGTTCATAAAAGCGCATAAAATAATTAACACGGCCGCCGTGAATATTATTTGGGTAAAATCGTAAATAAAATCGTGTTTTAAGTAAAGCCTATAATTTCGTGATATACGTTAAT\n>LQOS01000013.1/108713-108903 Mycobacterium doricum strain DSM 44339 contig_20, whole genome shotgun sequence. 
\nGCCGCGCCATGCTTAGGATGTGCGATGTAATCGGCAGGCGTAGGAATCTGGTGAGAATCCAGAACGGTCGCGCCACTGTGAGAGTCAGACCCGACGCCTGCTTCATTCCACTCGGGACGCGAAATCCCGGAAAGGACCCCTGATGACGTCACCGCAAGCGCGCCAGACCCGCGTTCCGGCCATCGACCTGT\n>KL543784.1/20050-21792 Capsicum annuum cultivar Zunla-1 unplaced genomic scaffold scaffold9433, whole genome shotgun sequence \nTACCTAGTTGATCCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTGTAAGTATGAACAAATTCAGACTGTGAAACTACGAATGGCTCATTAAATCAGTTATAGTTTGTTTGATGGTATCTACTACTCGGATAACCGTAGTAATTCTAGAGCTAATACGTGCAACAAACCCCGACTTCTGGAAGGGATGCATTTATTAGATAAAAGGTCGACGCAGGCTCTGCCCGTTGCTGTGATGATTGATGATAACTCGACGGATCGCACGACCATCATGCCAGCGACGCATCATTTAAATTCTGCCCTATCAACTTTTGATGGTAGGATAGTGGCCTACCATGGTGGTGACGGGTGACGGAGAATTAGGGTTCGATTACGGAGAGGGAGACTAAGAAACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCTGACACGGGGAGGTAGTGACAATAAATAACAATACCGGGCTCAATGAGTCTGGTAATTGGAATGAGTACAATCTAAATCCCTTAACGAGGATCCATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTTAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGACTTTGGGATGGGCCGGCCGGTCCGCCTATGGTGTGCACCGGTCGTCTCGTCCCTTCTGTCGGCGATGCGCTCCTGGCCTTAACTGGCCGGGTCGTGCCTCCGGCGCTGTTACTTTGAAGAAATTAGAGTGCTCAAAGCAAGCCTACTGTCACGGGCCTAATTTTAACCACGTGCGGACAGCCTAACACTCACTATATTGAGGCTAAACTTCAGTCCTAAACCGCCCTGAACAACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACAAAAGTTGGGGGCTCGACGACGATCAGATACCGTCCTAGTCTTAACCTTAAACGATGCCGACCAGGGATCGGCGGATGTTGCTTTTAGGATTCTGCCAGCACCTTATGAGAAATCAAAGTTTTTGGGTTCCACGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGATGGAAGGGCACCACAAGGAGTGGAGCCTGCGTCTTAATTTGACTCAACACGGCGAAAATTACCAGGTCCAGACATAGTAAGGATTGACAGACTAAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCCTGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCATTAACGAACGAGACCTCAGCCTGCTAACTAGCTATGCGGAGGTATCCCTTCGCGGCCAGCTTCTTAGAGGCACTACGGCCTTTTAGGCCACGGAAGTTTGAGGCAATAACAGTTTCGTGACGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGATGTATTCAATGAGTTTATAGCCTTGGCCGACAGGCTCGGGTAATCTTTGAAATTTCATCATGATGGGGATAGATCATTGCAATTGTTGGACTTCAACGAGGAATTCCTAGTAAGCGTGAGTCATCAACTCGCGTTGACTACGTTCCTGCCCTTTGTATACACCGCCCGTCGCTCCTACCGATTGAATGATTCGGTGAAATGTTTCGATCGCGGCGACGTGGGCGGTTCGCTGCCCGCGACGTCGCGAGATGTCCATTGAAC
CTTATCATTTAGAGGAAGGAGAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTG\n>CM001659.1/36667298-36667637 Nomascus leucogenys chromosome 13, whole genome shotgun sequence. \nGCCGGGTGCTGGGGCACGCGCCTGGAGTCCCAGCTACTCCTGAGGCTGAGGCAGGAGGATGCTTGAGCCCAGGAGGTAGAGGCTGCAGTGAGCCATGATCACGCCACTGCACTCCTGCCTGGGCTGTCGTGGGCTATGTCTAGCTGGAGTCTGCACTAAGTTCAGCATCAGCGTGGTGACCTCCCAGGTGCAAGGGGACTACCAGGTTGCCTAAGGAGGGGTGAACCAAATCAGATCAGAAATGGAGCAGGTGGAAATCCTGTGCTAATCAGTAGTGGGATCCCGCCTGTGAATAGCCACTGCACTCCAGGCTGGGTGACATAGCCAGAACCCATCTTTG\n>ALWZ041907802.1/9044-8520 Picea glauca, whole genome shotgun sequence. \nGGGAAAGAAGACCTTGTTGAGATTGACTCTAGTTCGACTTTGTGAAATGACTTGAGAGATGTAGAATAAGTTGGAGTCATTTTCAATGGAAGTGAAATACCACTACTTTTAATGTTATTTTACTTATTCCGTGGGGCGAAGACGGGGCATTGCCCCTGTTTTTGGCCTTAAGACATGTTTCGGTGGGTCAATCCGGGCGGAAGACATTGTTAGGTGGGCAGTTTGTCTAGGGTAGCACATCTATTAAAAGATAACGTAGGTGTCCTAAGATGAGCTCAACGAGAACAAAAATCTCATGTGGAACAAAAGGGTAAAAGCTCATTTGATTTTGATTTTCGGTATGAATACAAACCATGAAAGTGTGGCCTATTATGAAAATGAAGTTATTTTGGCCTTAGATGATGGTGCATGTTTTATCAATGTGTAGCTTCACTTGTAATGCATCTTAAATTAATGCATAGCTTCACGTGTAATGAATAGTAAGAATCACAAGAACTTCCTGCTACATGCCTATAAGTTTAGCTT\n>FAOM01433674.1/17830-17492 Triticum aestivum genome assembly, contig: Triticum_aestivum_CS42_TGACv1_scaffold_433674_5DL \nTCGAATTGTTTGTTGACACGGACAAAGTAAGGGAAAACCTCTGAAAGAATTTCCATATTGACCTTGGACATATAAGAGTTCCGAATCAAATCTCTTTAGAAAGATGATCTTTTGTCTCATGGTAGCCTGCTCCAGTCCCCAAATTCAGAGAAACCTTGGAATTAAAAAGGGCAATCCTGAGGCAAATCCGTGCTTTGAGAAAACAAGGGGTTCTCGAACTAGAATACAAAGGAAAATGATAGGCGCAGAGACTCAATGGAAGTTGTTCTAACGAATCGAGTTAATTACGTTGTGTTTACCAAAAGTTCCTACATTAATGGGAAATGCCCTACCTTTGAG\n>CM000916.2/22526794-22526579 Nasonia vitripennis chromosome 2, whole genome shotgun sequence. \nAAGATCATACTTCACAGGATCATTTCTGTAGTATATCTTCACAGACTCTCTACCCAAAGTAGGAGTCGATGCAACCACGATGAGGAGACGTAGCTCTCCTTCCTGAGCGTGAGGACGACTCGGAATTGCGGCTTCGGTCGGAATACCAGTCATCGATGATCGTTCACCTTCTGCACTTTGTGCAGAAGGCATGGGAGGACGGGCTTTCTGAGTGGC\n>MLCN01000008.1/279819-279740 Alkanindiges sp. H1 contig8, whole genome shotgun sequence. 
\nGGTCTCGAGGGGTGCTGCAACAGTAAAGTAATATACTGCCAGGCTCGAGCATGTCATTTATTGAACGGCATCCGCGAATT\n>JPUK01000002.1/192788-192900 Candidatus Micrarchaeum sp. AZ1 Contig2, whole genome shotgun sequence. \nCCAAACGGTAATAGGAGCAGGGAAACGCCCGATCCCATTCCGAACTCGGAAGCTAAGCCTGCTCACGATATGTGTGTACTGTCTGCGGATGGGAAAGCATGTTGCTGTTTGGC\n>AAQR03163520.1/18142-17999 Otolemur garnettii contig163520, whole genome shotgun sequence. \nATCCTTTCACAGCTCATAAGCGGGGCGATTGGGTTTTCATGCGCATGCGTGCGCACACCCCTCCTCCCTCTCCTTCCCCCCTTCCCCCACCCTCCCCGACCCCGCCAAATCTTGTTATGACATTGGCACATTACCCATCTGACA\n>ABAV01003903.1/1546-1268 Nematostella vectensis strain CH2 x CH6 NEMVEscaffold_21_Cont3903, whole genome shotgun sequence. \nTAGAACAATGTAGGTAAGGGAAGTCGGCAAAATAGATCCGTAACTTCGGGAAAAGGATTGGCTCTAAGGGTTGGGTCTGTCGGGCTGAGACTTGAAGCCAGTGGACCCGGCCCGGACTGGCCGAGGCCCTTCCGGGGGTCGAAGCTGGACCGGGAAGGGGCTGTTGGTGGATTGGCCCAGCTATGGTCGCGAGGCCAATTCGGCAGGCAATGAACAACCAACTTGCAATCAGATTTCGAATCGATCAAGAATTGAGTTAGAAGGTCCATGTACCATGTA\n>AM910987.1/84270-80099 Plasmodium knowlesi strain H chromosome 5, complete genome 
\nTGTTTTCTAAATAGGAGAGCGAATCCGCCGAATTTAAGCATATAATTAAGCGGAAGAAAAGAAAATAACTATGATTCCTTTAGTAACGGCGAGTGAACAAGGAAAAGCTCAAGCGGATAATCTGTGTGTCTTTTCCTTTTTTTTTAAAAGGTTTAGCACAAAGAATTGTCGTGTATAAAAATACTATAGTAACTTTTCGGTATCTGTAAAAATAAAGCATATGTTACGAAGCGAGGTGGAATGCCTCCCCCAAAGAGGGTGAAAGGCCCGTAGGAAAACATTTATGGTTTAGCGTTACTGAGAGACCTCTATATGTAAAAGAGTCGTGTTCTTTGAGATTGGAGCACAAATGCGTGTGATACATTTCACATAAAGCTAAATATGTGTAGGAGACCGATAGCAAACAAGTACCGTGAGGGAAAGATGAAATAGTACTCAGGAATGAGCAATTAAAAAGTACCTGAAATCGTTAAGATGGAACGGATTAAGAGAGAAAAAAAGTAAATGCAGTCAAATAGTGATTTAGCAGCACTATCATAATTTAACTGCTTTATTAAAAGAAACATCAGTAAAAAGTTTTACGACCTATTCGGATAAAACTGTTGATGAAAAAAACATTTAATTTTTTTTTCTTATCCCAGGATAAAAAAAAAAATTAATAGTCTTTTTCACATTATCCTTATTTTAAAATATAGGATAAAAGGTTTTATAGAAAATCACGAAATAAAAGTGATAAGATAGTCCATTTTACTGAGGTTATATAAAAATGTGTATTTGCTTGTAAAAAAAAAAAAATATTCTTTGTGAATATCTTTTTTTTTACAGCTGCGCATTTTAAGTTGTTTCTATAAGATACTTTCTTAACCCACTCGTCTTGAAACACGGACCAAGGAGTCTAGCAAATGTGCAAGTGTATATGATATATTAAACATTAATGTACGTGAATAACGTACTGTTTTTATACGCATAATTAATGTAATATGTTATAATTTGTAGAATTAGTTGATAATTGCAAAATTATCACTAACGCATACAATACCGGTAGGCAAATTATGCCATATTGAGTAAGAGCATATTTGGTAGGACCCGAGAGGCTTTGAACTAAGCGTGGTGAGATTGAAGTCAGACGAAAGTCTGATGGAGGATCGAATTGATACTGACGTGCAAATCGTTCATTTCAATCACGTTTAGGGGCGAAAGACTAATCGAAAAGCCTATTAGCTGGTTATTTTCGAAAGATCTCTCAGGATCGCTGGAGTTGATTGTTATAATTTTACCAGGTAGAGACAATGATTAGAGGACTCAGGGAATTGAATTTCCTTGACCTATTCTCAAACTCCCAATGGGTAAAAAGGGATAAAAATAACTTTATTGTATTTTTCTCTATTCAAATAAAATAACTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGAGGGATGCTCCTAACGCTTGGATAAGGTGCCTAAATATTCGCTCATCAGATCCCATAAAAGGTGTTGGTTCATTATGACAGTAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTTACCTACCGAATGAACTAGCCCTGAAAATGGATGGCGCTAAAGCGAATTACCGATACCAGGCCATAGAAGGGCAAGAAAAAGAATTAGTACTTTCGGGTGTTTTTTCTTTTTTAGGAACCTTCTATGAGTAGAAAATCGTGGGGTTTTGTGTAGAAGCGAAATACGTGAGTTTTCGTGGAACATCTCCCTAGTGCAGATCTTGGTGGAAGTAGCAACTATTCAAATGAGAACTTTGAAGACTGAAGTGGAGAAGGGTTTCTTGCCAACTGTGTTTGTACAAGAGTTAGCCGCTCCTAAGAGATAGCTGAAAAGTGTTTATATGGGGAGGATTCTAATCTTTCTATCCCCGTCTCGAAAGGGAAACAGGTTTATATTCCTGTGCCAATACAAATCTATGGGTTAATTTTTAAAAGATGGCAACATATAG
ACAAATGAACCTCTTTACATAGGTTTTACCATCGGGGTGCGTTATCTTTGCACTTTACCTTTATAGCATACCTTGGAATCAATTTACTTGGAGAAGAGGTATGTTGAAGTCAATTCAGTTAAATTTTTGTATGGTTCTGTAATTCTCATTACAGAATTATATGTAAAAACTTTCCTGTTTTGTAGCAATAGTAATTCGTTTTTATGAATTATTCGATTCGGTATAAACTATCCTTGAAAAAAGGGGGGAACAACAAACCAAAGGGGGAGAAGTAGAATCGCCTACAAGTGATTTTAGTAATCGCAAGATTGCTAGTTCGGTTGTAAAAAGATTCTTTTCTCATTCTTGGTATGTACAACTCTAATTTGTAAAAATGAGCGTACCAACAACCGCATCAGGTCTCCAAGGTTAGTAACCTCTGGTTAAATAGAAAAAAGTAAGTAAGGGAAGTCGGCAAAATAGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGACATTAGAATGGAAAGAAATAGAAATATAGTCGAAAGAAAAGTCATTGAGGTGCTTTTACATGTTTTTTTTTTCCACAAAAAAAACGTGTAGGCATTTCTTTTGCACTCTTTTCTCTTCTGTTTTCCTTTTCTGCCCCCATTCGCCGTCATATATATATCTTTTCGCTTCGGCGATTGGCGTACATATGACACTTATAATGTTAACTCAGAACTGAAACGGACAAGGGGAATCCGACTGTTTAATTAAAACATAGCATTGTGACAAGCCATAACTGGTATTAACACAATGTGATTTCTGCCCAGTGCTTTGAATGTCAACTTGATGAAATTCAATCAAGCGCAGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTACTTGCTATCTAGCGAAACCACAGCCAAGGGAACGGGCTTGGCCAAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTTACTCTAGTCTGGCTTTGTGAAACGACTTAAGAGGTGTAGCATAAGTGGGAGTAGAGATCGAAAGGTCTTTACGACAGTGAAATACCACTACTTTTAACGTTGTTTTACTAATCCATTTATTGGAATATATATGTATAAAAGGGATGCTCCTTTTTTTTTTAAGAAAGGGGTTTTATCTTTTACATATTATCGCAGAATTTATAGTTAGGGCTATGCATGTAAAAAATGTGTAGTTTTATCTATAGTTCCGATTTCTTATGGAGACATAGCCAGGTGGGGAGTTTGACTGGGGCGGTACATCTGTTAAACAATAACGCAGATGTCCAAAGACAAGCTCAGAGAGAACAGAAATCTCTTGTAGACTAAAAGGGGAAAAGCTTGTTTGATTTTTACTTTCAGAAAAAGTAGAAAACGTGAAAGCGTGGCCTATCGATCCTTTACATTTGCAAAATGATGGAGTTTATTCTCTTACTGTGCATGTAGAGGTGTCTGAAAAGTTACCACAGGGATAACTGGCTTGTGGCTGCCAAGCGCTCCTAGCGACGTAGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGGGACGCAGAAGTCTCAAAGTGTCGGATTGTTCACCCGCTAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGAATACTATTATTTTTATATACATATAGTATTGTGACAGTAATCCAACTTAGTACGAGAGGATTAGTTGGTTCAGACAATTGGTACAGCAATTGGTTGACAAACCAGTGTTGCGAAGCTAAGTCTGTTGGATAATGGCTGAACGCCTCTTAAGCCAGAACCCATGCTGATTAAACAATATTATTTCGATCTTTTTTGTAACAAATTTTTTACCGTCGATGTAAAAGAGAAATTATATATGCAGTTCTGTGTTTTTAACCGGGTGCATTATTAATCCTATTAACATATAATACTGTGT
GTGTATCGTTTGCAAAAACTTACACCAAAACAGTAAAATGTTTAATATTATTTTAACAACAAGAAAGATTATCTGTGTTTGTAGACTACTTACTTGGTCCCGGGGTGCTGTAAACATGAAAGTAAACTTTGTTTTACGATCTGTTGAGGCTTATCCTCAGTGACATAAGAAAAT\n>LTWW01000048.1/24870-24711 Staphylococcus sp. HMSC078E07 Staphylococcus_spHMPREF2905-1.0_Cont825.1, whole genome shotgun sequence. \nAGTGTCTTTTAAAAAGAGTCCAGAGAGGCTCAAAAGACAGGGTGACTAATGATATAAATATGATTAACTTTAATTGTTCGATTGTTATCAGACGAATCATATAAAATATTTTTATATACATTAAACCTCATGTCTTTGTAAAAGGCATGAGGTTTTTTCT\n>MTEM01000151.1/7116-7366 Desulfobacteraceae bacterium IS3 Ga0073107_10151, whole genome shotgun sequence. \nATACCCGAAATTTGTTCAGGTGTTTTATCGCTTAATAGGGAACCCCGTGAAAATCGGGGGCGGGCCCGCCGCTGTAATCGGGGACGAACGCCGCTTGAAACCACTGACGGAGAAAATGCAAAATGCAAAGTGCAAAATGCAAAGTTAACTTTGCACTTTTAACTTTACATTTTGCATTGTATCTGTCGGGAAGGTGCGGTCAGTAGGATGAACCGAGAGTCAGAAGACCTGTCTGAATGATATACCGGCGT\n>JH591489.1/51165-51260 Lepisosteus oculatus unplaced genomic scaffold UNK80, whole genome shotgun sequence. \nAACCTTTTATTACTTTTTGATAATAAAAAAAAATCTGTTCTTATCAGTTTAATATCTGATACGTCCCCCATCGGGGGACCACATATTAAACNNNNN\n>MICY01000022.1/569-1 Tenericutes bacterium GWF2_38_8 gwf2_scaffold_13316, whole genome shotgun sequence. \nTTTATGGAGAGTTTGATCCTGGCTCAGGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAACGCACCATTTCGGTGGTGAGTGGCGAACGGGTGAGTAACACGTAGGTAACCTGCCCTTAAGACGAGGATAACCAAGGGAAACTTTGGCTAAAACTGGATAGGAACATCGAAGGCATCTTTGATGTTTTAAAAGACCTAGCAATAGGTATGCTTAAGGAGGGGCCTGCGGCGCATTAGTTAGTTGGTGAGGTGAAGGCTCACCAAGACGATGATGCGTAGCCGGACTGAGAGGTTGAACGGCCACATTGGGACTGAGAAACGGCCCAAACTCCTACGGGAGGCAGCAGTAGGGAATTTTCGGCAATGGGGGAAACCCTGACCGAGCAACGCCGCGTGAATGACGAAGTACTTCGGTATGTAAAGTTCTTTTATCAGGGAAGAATGGCTAGCGGAAAAGCTAGATTGACGGTACTTGATGAATAAGCCCCGGCTAACTATGTGCCAGCAGCCGCGGTAATACATAGGGGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGGGTG\n>ABBZ01000577.1/639-936 Beggiatoa sp. PS contig21537_2600-2601, whole genome shotgun sequence. 
\nCAAGGGACTTAAACAAATTTGAGCACCTATTGCGAAATCTTTAGGTGAATGGAGTCTAATTCGGCGAAACCTTTAAAATGACAACGCCGAGCTAAGCTCAACGGTGGGGGCAAGGAAAGGGGATAATCATATCCCTTTTCCTTTCCCCTTTATTATTTTTTCTAAACCATTTCTCCTCCGTTGAGAAAGTGTAGAGACCATACGGCTCCTGCCTGACTAAATCCCTTCAATTATTTGATTGCGAGGCATTTAAAGGCAAAGACAGGGTCCAGACCACAAACATTCAATTAATTGAAAA\n>MKTL01000001.1/659200-659282 Clostridiales bacterium 38-18 SCNpilot_bf_inoc_scaffold_0, whole genome shotgun sequence. \nCTATTATCTTGGCAAACTGCTTGAAAGAGTAGGACGCAAAGTTTGAAGTCTAAGGCACTAGCTATGACCGTTCAACTGCAGTA\n>CP000680.1/4301122-4301323 Pseudomonas mendocina ymp, complete genome. \nCGGGTTTACTCCTGGTTTTTACCGTTTCGCCAAACCGAGGTTCGGCGGCGTTTTGGTGTCTGATTCGGTAACGAATCGGGAGCACCATCTGCGTAGGCCATCAGGCGAACCTGACATTTAAAACGCGAGTCACCTACGGTCTTGGATAGCCCCCGCCAGGCAGGGACCCCAATCTTTCAAAGCCGGCAGCGCATGGCTGCCG\n>KK198757.1/45732841-45732932 Eucalyptus grandis cultivar BRASUZ1 unplaced genomic scaffold scaffold_5, whole genome shotgun sequence. \nTGATGATAATGATGATGATGATGATGATGATAATGATGATAATACTAGTAGTAGTAGTAGTAACATCATCATCATCATCATCATCAAAGGTA\n>CP000705.1/1964394-1964162 Lactobacillus reuteri DSM 20016, complete genome. \nTAAAAAACGTTGACCGAGAATCGTCAATTCTGCTGAATTAAGAGAGCCGGTGGTTGGTGGAAACCGGTAGGAGGTAGTTGCGACAAATCCCTCGCGAGTTGTATGCCGAAATAATAGTAGAACATACTGGTAGCAGCCATTATCTTGCCGATTAATTGCCATTGTGGGCAGTTGATTGAGGCAACCCTTGTGTTGTAAATAAAGGTGGTACCACGTTGATAGACGTCCTTTTA\n>AHHD01001364.1/1-303 Macrophomina phaseolina MS6 contig01813, whole genome shotgun sequence. \nGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCTGCCGAAGTTTCCCTCAGGATAGCAGTAACGTATTCAGTTTTATGAGGTAAAGCGAATGATTAGAGGCCTTGGGGTTGAAACAACCTTAACCTATTCTCAAACTTTAAATATGTAAGAAGTCCTTGTTACTTAGTTGAACGTGGACACTTGAATGTACCGTTACTAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGAACGCGATGTTAAGGTGCCGGAATGCACGCTCATCAGACACCACAAAA\n>AFYH01130564.1/25905-25790 Latimeria chalumnae contig130564, whole genome shotgun sequence. 
\nTTTGAAACCCAAACCAGCTAGATTTAATTCTATCCACGTCTGATCTCAGAAGCTAAGCAGGATCGGGCCTGGTCAGTACTTGGATGGGAGACCACTGAGGCAGCCCAGGTGCAGTC\n>KB944511.1/1034622-1034709 Plesiomonas shigelloides 302-73 genomic scaffold scaffold00012, whole genome shotgun sequence. \nGTAAGACGCGCTATTTTGTTGTCATCACATCCCTGAAATTACACACGCAGAGATGTATTTCGGCCACCCCACCTTGGAGTGGCCTTTT\n>CM002812.1/447709-447914 Capsicum annuum cultivar Zunla-1 chromosome 1, whole genome shotgun sequence \nTCAGTCATAGTTTGTTTAATGGTATTTATTACTCAAATAATCATAGTAACTCTAAAGATAATACATGCAACAAACCCTAACTTTTTAAAGGGATGCATATATTAGATAAAAGGTAGATGTGGGCTCTTCCCATTTTTTTGATGATTCATGATAACTCAATGGATTGCACGGTCATTATGTTGGCGACACATCATTCAAATTTTTGC\n>AZHD01000026.1/410476-410398 Sporothrix insectorum RCEF 264 scaffold_26, whole genome shotgun sequence. \nAAAGGGGTAGTATAATAATTAAACACTTAAAAGACGCCGTAACGCCGCGACGTCGTAGGTTCGAATCCTACCCCTTTTA\n>CM002818.1/23807342-23807451 Capsicum annuum cultivar Zunla-1 chromosome 7, whole genome shotgun sequence \nTTTTGTATTTTTCCACAGCTTTCTTGAACTGCATCTAATTACGATTTTCACTAATGAGGAAATTAATTCATATCGTTGCGGTTCAATAAAGCTGTGGGAAGATATAGATA\n>AYZL01000006.1/155934-155671 Lactobacillus floricola DSM 23037 = JCM 16512 strain DSM 23037 NODE_9, whole genome shotgun sequence. \nAATTTTACTGAGAAAAGATGAGTAAATATTTATCTTATTTTAACAGAGAGCCATGTTAGGTGAAAGATGGTATTTAAGAAAATATTGAAGATGGTCTTGGAGTAAGTTTAAATTGTGAGCCAGTTAGGTTAGCAATTTACGGGATAACACACGTTACTGTGTTGAAGGATAGCTACCATGAGTGTCCGGATCGAAGATGGTGATAATAGCATTGTATAATTATCACTAATATAGGGTGGTACCGCGTTTAACAACGCCCCTAGG\n>ALWT01124023.1/1602-1388 Myotis davidii contig124023, whole genome shotgun sequence. \nATCGCTTCTTGGCCTTTTGGCTAAGATCAATTGTAGTATCTGTTCTTATCAGTTTAATATATATTTCCAAATTTTTCAGGTGGATGCCCCAAAGAGGGATTTCTGGGTTATATGGTAGCTCTATTCTCAATTTTTTTTTTGAGGAACTTTCATACTGTTAACATAGCGGCTGTAACAATTTACATTCCCACCAGCAGTGCATGAGGGTTCCCTTT\n>JTDY01005470.1/30475-30582 Operophtera brumata OBRU01_Sc05470, whole genome shotgun sequence. 
\nTGATGATGATGGTGATGATGTTGGTGGTGGTGGTGATGATGGTGGTGGTGTAGGTGGTGATGTTGGTGACCATCATCATCACCACCATCATCATCATCATCACCTGCA\n>LN774769.1/2382714-2382521 Lactococcus piscium MKFS47 genome assembly, chromosome: I \nGAAGCACTGGAATGTGCGAACTTACTCACATTTTTGACCGACTAAATCGTATTACCTAGGGAGTCTTTGAGACATCTTACCGCGTGCAAGCCATTTTAGATGGAAGCTGCTAAGTAAGAGCGAGACGCCCACCTGTTTAACATTTACAGCGGGTTCAATACAAGAGTGAGTAACGGCATTCAATCAGTGCTTTT\n>AYUG01147828.1/3237-3115 Fukomys damarensis contig147828, whole genome shotgun sequence. \nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGTAAACAACATCTTATTAATTCTGGTTTGATTGTCTTTACCAAAAGAAATCATTCCTGAGGTTTTCTTATGGAAAATGTTTTGGAACTTTC\n>URS0000D69AE5_12908/1-140 unclassified sequences RAGATH-24 RNA \nTTGACAGTCCAAAAACCACCTGCCCTCGGGAGATACCCGAGGTGTGACCTTCGCCGTTTATCGGTCGCCTCCCAGATTCATCGGGGGGCGGGGAGAGAGGGTCAGCGATTCGTTCGCTTGATGACGTGGGAATAGGACAC\n>KB095811.1/12337799-12337623 Helobdella robusta unplaced genomic scaffold HELROscaffold_1, whole genome shotgun sequence. \nTGATGACGATGATGATGATGATGATGGCGACGATGATGATGATGATGATGACATTGTTGTTACATCAAAACAGCGATTTCGAATGCATAATTGGATGTGTTTTTGTTTGGCCCGGCAAATAACTGCTATTAAATGTCATCATCATCATCGTCGTCGTCCTCATCATTATCATCATCA\n>LL990082.1/1-981 Schistosoma rodhaini strain Burundi genome assembly, scaffold: SROB_contig0004979 
\nGCATTGCGATGTCCACTGATTGGTTTTGACACAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGAGTAACTATTACCGACGTTCAATCAGCTGCGTCAACCGCACTGAATTGCATCCTACGTGTGGGGTGAAGCAAGGAGACCCCCTGTCGCCACTCCTCTTCATCATGGTTCTCGACGAAGTACTGGAAGGTCTAGATACAATGACCCACCTAACAGTTGATGGAGAGAGCTTGAACTACATAGCTTATGCTGACGATCTCGTAGTTTTCGCTCCAAATGCAGAACTCCTTCAACGAAAACTCGATCGAATCTCCCTACTTCTACACGAGGCTGGATGGTCGGTTAACCCTGAAAAAAGCCGGACCCTGGACCTAATCTCTGGTGGCCATTCCAAAACCACAGCGCTCTCTCAGACAGAATTCACCAACGCGGGGATGCGTATACCACCGCTTTCTGCCGCCGACACCTTCGACTACCTGGGTATCAAATTCAACTTCAAGGGCCGATGCCCAGTGGCCCATATTGACTTATTGAACAACTACCTCACGGAAATATCGTGCGCTCCACTTAAGCCGCAGCAGCGCATGAAGATCTTGAAAGATAATCTACTCCCTCGACTCCTCTACCCCCTGACTCTAGGAATAGTACACCTGAACACCCTGAAGTCAATGGACCGAAATATCCACACGGCCATAAGGAAATGGTTGCGGCTACCCTCCGACACCCCGCTAGCATATTTTCACTCACCCGTCGCTGCCGGAGGCCTAGGGATCCTCCATCTGTCCTCATCGGTTCCATTCCACCGTCGAAAACGTCTAGAAACCCTCCTATCTTCACCGAACCGCCTACTGCACAAGTTGCCAACTTCTCCAACACTAGCTTCTTATTCACACCTTAGTCAACTGCCAGTTCGAATTGGGCACGAGACCGTAACGTCTAGA\n>BDDD01008159.1/30464-30638 Cephalotus follicularis DNA, scaffold: scaffold8159, isolate: St1. \nATACCCTTAACTTTTGGCTAAGATCAAGTGTAGTATCTGTTCTTCTGAGTTTATCATCTCATATGATTCACACGATATTTTTTTATATGGGAAAAGACTCATCACAATAGCTTACTATTGGGGTTTTTTAGCGTCCCTTATGTGTTCCATACCGTATGGACCTGACGCACCCCTA\n>ALYE01001358.1/3372-2729 Gossypium raimondii Chr01_contig_1358, whole genome shotgun sequence. 
\nAATACGAACCGTGAAAGCGTGGCCTATCGATCCTTTAGACCTTCGGATTTGAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAGCAGAATTCACCAAGTGTTGGATTGTTCACCACCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTACCCTACTGATGGCCGCGTCGCATAGTAATTCAACCTAGTACGAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTGAAAAGCCAGTGGCGCGAAGCTACCGTGCGCTGGATTATGACTGAACGCCTCTAAGTCAGAATCCGGGCTAGAAGCGACGCACGCGCCCGTCGCCCGATTGCCGACCCGCAGTAGGGCCTCTGGCCCCCAAGGGCACGTGTCGTAGTGCAGCGGCCGCGGCGGACAAGTCGCGGGCGCCTCCTGGAGCGTAATTCCCACCGAGCGGCGGGTAGAATCCTTGCAGACGACTTAAATACGCGACGGGGTATTGTAAGTGGCAGAGTGGCCTTGCTGCCACGATCCACTGAGATTCAGCCCTTTGTCGCTTCGATTCGT\n>CM001740.1/4627691-4627566 Gossypium raimondii chromosome 1, whole genome shotgun sequence. \nGGGCGTAGGCCTCTTAAAAGGAGTGCAAAGGCAGAAGGGAGCTTGATTCAAGACCCACCTGTCTAGTAAGGACGAAAATCAGCTTTAGTGATCCGATTGTGCCGAGTGAAAGGGTCGTCGCTCAAC\n>KB730334.1/190955-191028 Fusarium oxysporum f. sp. cubense race 1 unplaced genomic scaffold scaffold395, whole genome shotgun sequence. \nGCCAAGGTGGCCGAGCGGTCTAAGGCGCCAGACTCAAGATCTGATTGGTTGGATCTAGAATCCCAACCTTGGCA\n>MHLG01000025.1/17211-16820 Candidatus Liptonbacteria bacterium RIFOXYD1_FULL_36_11 rifoxyd1_full_scaffold_658, whole genome shotgun sequence. \nGGGGGTGAAAGGGCTCGACGGAGTTTCTTTGTTATAAAAGTGGCAGGTAGGTTTGACGAGACCTTAAAAACGTCAAAAAAATAAGTGCCAACTTATTCAACAGACAACCGGCTTTAGCTTACGCTTAAGTTGGTTGTAACCTTAGCTTTTATGCTGAGGCGTCGCTCTACTTTTTGCTTATAGGAGTGGAAGCGGTGTAAAAGTATAAGCTTTTCTTACTCTTTTAAACTTGGGGAGTGGGAGAAAAAAACAGGTTTGGCGGGTAAAAACTTTTTGGTAAATTATAAATTTTTACTCGTTTACCGAAAGGTAAAAAATAAAATTTACCTATATCTGTAGAAACTTTTATGGCTCAACTTCGGACATGGGTTCAATTCCCATCATCTCCACTA\n>HF992493.1/15144-15489 Mycoplasma sp. 
CAG:877 genomic scaffold, scf27 \nAATATATAGACAAACGCTGGGACTCTTGAGGTCCTTGAGGAAAGTCCATGCTCGCACAGTCTGAGATGACTGTAGTGTTCATTCTTAGGGAATAAATAACCTAAGGTAGTACTTGTACTAACGGCGGATACTATATCTAAGTCTTATGATATGATATAGTCCATAAAGTGCCACAGTGACGAATTCTTTGGAAACGAGGAAGTGAAACGCGGTAAACCCAATGAGCGAGAAACCCAAATTTTGGTAGGGGAGTTCCAACTTCGAGAAATGAATTGGAGTGGAGACCAGTAATGGTAGATAAATGTTTGTCGCTTAGGAAACTAAGAACAGAACATGGCTTATTTAT\n>CM001498.2/114148093-114148035 Papio anubis isolate 1X1155 chromosome 8, whole genome shotgun sequence. \nTGACTTATTTGGTTAAAGTACCTGTCTAGTAAACAGGAGATCCTGAGTTTGAATCACAG\n>KE356582.1/1391668-1391842 halophilic archaeon J07HB67 genomic scaffold scf_7180000098878, whole genome shotgun sequence. \nACTGCAGGCTGTCGCTGAGACATGGTCGCTGATGTGCAGAGTAGGTAGGAGTCGTTACCGAGGCCCGTGCGCCAGCACGGCGCCCAGACACACATGAAACACTACCCGTCAGTGACTGTGACTCTCACTCCGGGAGGAGAACACCGGTAGCCGGGCAGTTTGACTGGGGCGGTAC\n>CM000820.5/64985614-64985509 Sus scrofa isolate TJ Tabasco breed Duroc chromosome 9, whole genome shotgun sequence. \nGTTCTTGCCTCGGCAGTATATAAACTAAAACCGACAATACAGAGAAGATGAGCATGGTCCCTGTGCAAACATAGCATGCAAATGTCCATAAAAAAGAATGCTATTT\n>CM000791.1/61008405-61008287 Oryctolagus cuniculus chromosome 2, whole genome shotgun sequence. \nATCGCTTCTTGGCCTTTTGGCTAAGATCAAGTGTAACAATGCTAAAACATCAAAAAGATATTCAGTCTAAGTTATATATTATACAAAATATATTTGCTGTTATATATATTTAAACCTCC\n>GL637601.1/22009363-22009461 Caenorhabditis tropicalis strain JU1373 unplaced genomic scaffold Scaffold629, whole genome shotgun sequence. \nTTTCGAAACAGAGTGACCGTCTGTAGTTTTTTTGTGTAGTGCTCCGAGCCAAAATGTGTTCGAAGCACCACGAGAAGCTGCAGATGGAACAACTTGTAT\n>MNXL01000222.1/6266-6479 Anaerolineae bacterium CG2_30_64_16 cg2_3.0_scaffold_3852_c, whole genome shotgun sequence. 
\nCTCTTATCCAGAGAGGCAGAGGGACCGGCCCTGTGAAGCCTCGGCAACCAGGAGATGGTAAATTGGTAAACTGGTAAACTGGTAAATTGGTAAATTGGTGGTCTGCTCGATGGGCAGCGACTTGCCACCAATCTACCAACCTACCAATCTACCAATCTACCAGGTTACCACCCCATGGTGCCAATTCCGGCAGAGTTGATCTGGAAGATGAGAG\n>MEVM01000037.1/1634-1766 Candidate division WWE3 bacterium RIFCSPLOWO2_02_FULL_53_10 rifcsplowo2_02_scaffold_176987, whole genome shotgun sequence. \nAGTTTATTAAGAGCGGCGGTTAGAGGCCTGGCTCGTTGACCCGCCCAGCAACTTGTTTGCGAGGCGTTGGAGAAACCCTCCGACAATCTTGGGATAAAGTGCTAAATCCAGCCCCGCTTGGGGAAGATAAATT\n>ALWT01215141.1/49283-49606 Myotis davidii contig215141, whole genome shotgun sequence. \nGTTTGTAAGAACGGACATGTCATGTGACATCTGTCACCCCATTGATCGCCCGGGTTGATTCGGCTGATCTGGCTGGCTAGGCGGGTGTCCCCCTCCTCCCTCACCGACCCATGTGCGTCCCTCCCGAAGCTGCGCGATCAGTCGAAGAGGACGACCTCCGCTCCCCCCAGAGGACCGGTCTTCGGTCAAGGGTATACGAGTAGCTGCGCCGCCCTGCTAGAACCTCCAAACAAGCTCTCAAGAAATATCCAGGGGAGACAGAGTAAAATTTAAAACGAGTTTGGCCTATATTCAGTCTTAAAAGTTTCATGAAAATATAAAACT\n>AYZV02077796.1/1114-1237 Spinacia oleracea cultivar SynViroflay scaffold18850.con0006.1, whole genome shotgun sequence. \nTAACCCCGGCACAAGGTTGACACAAAATTGAAATGATACAGAGAAGACATTTTCAAGATTGAAATTAATATGGCCCCTTTGCAAGGATGACACAAATTTAAGAAAACATTTTCAAGAAATCTTT\n>FR899405.1/21238-21732 Mycoplasma sp. CAG:472 genomic scaffold, scf68 \nTTGATATAATATTTATGTGGTGCATTATGCTAGTCACAATCACTATTTGAAGATGGGGCTAAAAATCCATTAATTGATACAATTGCACTTTATATATTTGCTGCTTCTGCCCAAGTTGGGGTGAATATGTAATTTAAAATTATAGGGAAATCATAACGGCATATGACTAACCCCCTGTAATTAAGCAAAAAAGGAAGAGTTATTCATGTCGTGCGTGGTTATTAGGGATTTAACGAATAATAATGTTGATGAAATCTTAACTGCAAAAGCGAATAAGAATAGTTTAGATGTGTCAGGGAAAACCTCTAGCGTGTTATTTATTATAAAGATTGAAGTGCGGACTATGTGGCAATCGAGTCATTAGTTAGGCAACTACTAATTATTTTCTTTAAAGAGAAATCGCCTAAGGGTAACCAAGGGAGAGAAAATAGAGAAATTCAACTCGACCAAAGCCGTAAGATTAATTTATAATAAACCATAACATTTTTAATAACT\n>AFTD01054950.1/9395-9285 Cricetulus griseus cell line CHO-K1, whole genome shotgun sequence. \nATCGCTTTTCAGTCTTTTGGCTAAGATCAAGTTTAGTATTTGTTCTTATCAGTTTAGATTAGTACCCTGTTCTCTTTGAAGTATAAAAATAAGGTGAATTTAAAAAGTCAT\n>MNTO01000093.1/21391-21316 Ruminococcus sp. 
CAG:9-related_41_34 Ley3_66761_scaffold_4291, whole genome shotgun sequence. \nAGTCCGTGTGATGATGTAGCACCGCTGGCAAAGGGTACGGCTGGATGAGAACCATGCAGGGGTGAGATTCCCATGA\n>CP002528.1/2537163-2537236 Dokdonia sp. 4H-3-7-5 chromosome, complete genome. \nATAACCAGGAGTTGGTCTATTAGAGAAGTCAGCAGAAGTCATAGTAGCTAAAGCCTGATATTTTAGTGAAGGAC\n>AOTI010107864.1/9315-6890 Triticum urartu cultivar G1812 contig107864, whole genome shotgun sequence. \nTGGACCTAAGCCTGAGACTAAGTGCTTCTACTGCAAAGGGACTGGTCACTAAAAGCGGAACTGTCCCAAGTATTTATTGGATGAAACTAAGCAGAGGTCCGAACCGACTGATGTTGAAGAATCAGCGGATGAGTTGTGGTTAGGGGTGAAATGCCACTCGAACCCAGAGCTAGCTGGTTCTCCCCGAAATGCGTTGAGGCGCAGCAGTTGACTGGACATCTAGGGGTAAAGCACTGTTTCGGTGCGGGCTGCGCGAGCGGTACCAAATCGAGGCAAACTCTGAATACTAGATATGACCCAAAAATAACAGGGGTCAAGGTCGGCCAGTGAGACGATGGGGGATAAGCTTCATCGTCGAGAGGGAAACAGCCCGGATCACCAGCTAAGGCCCCTAAATGACCGCTCAGTGATAAAGGAGGTGGGGGTGCAAAGACAGCCAGGAGGTTTGCCTAGAAGCAGCCACCCTTTAAAGAGTGCGTAATAGCTCACTGATCGAGCGCCCTTGCGCTGAAGATGAACGGGGCTAAGCGATCTGCCGAAGCTGTGGGATGTCAAAATGCATCGGTAGGGGAGCGTTCCGCCTTAGAGGGAAGCAACCGCGAAAGCGGGGGTCGACGAAGCGGAAGCGAGAATGTCGGCTTGAGTAACGAAAACATTGGTGAGAATCCAATGCCCCGAAAACCCAAGGTTTCCTCCGCAAGGTTCGTCCACGGAGGGTGAGTCAGGGCCTAAGATCAGGCCGAAAGGCGTAGTCGATGGACAACAGGTCAATATTCCTGTACTACCCCTTGTTGGTACGGAGGGACGGAGGAGGCTAGGTTAGCCGAAAGATGGTTATAGGTTTAAGGACACAAGGTGACCCTGCTTTTTCAGGGTAAGAAGGGGTAGAGAAAATGCCTCGAGCCGAGGTCCGAGTACCAAGCGCTGCAGCGCTGAAGTATGAGCCCCGTGGACTAGCGATTGCTTCTCCACGAGGCTCATACCAGGCGCTACGGCGCTGAAGTATGTAACTGATGCCATACTCCCAGGAAAAGCTCGAACGACCTTCAACAAAAGGGTACCTGTACCCGAAACCGACACAGGTGGGTAGGTAGAGAATACCTAGGGGCGCGAGACAACTCTCTCTAAGGAACTCGGCAAAATAGCCCCGTAACTTCGGGAGAAGGGGTGCCCCCTCACAAAAGGGGGCCGCAGTGACCAGGCCCGGGCGACTGTTTACCAAAAACACAGGTCTCCGCAAAGTCGTAAGACCATGTATGGGGGCTGACGCCTGCCCAGTGCCGGAAGGTCAAGGAAGTTGGTGAACTGATGACAGGGAAGCCGGCGACCGAAGCCCCGGTGAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCCGCACGAAAGGCGTAACGATCTGGGCACTGTCTCGGAGAGAGGCTCGGTGAAATAGACATGTCTGTGAAGATGCGGACTACCTGCACCTGGACAGAAAGACCCTATGAAGCTTTACTGTTCCCTGGGATTGGCTTTGGGCCTTTCCTGCGCAGCTTAGGTGGAAGGCGAAGAAGGCC
CCCTTCCGGGGGGGCCCGAGCCATCAGTGAGATACCACTCTGGAAGAGCTCGGATTCTAACCTTGTGTCAGACCCGCGGGCCAAGGGACAGTCTCAGGTAGACAGTTTCTATGGGGCGTAGGCCTCCCAAAAGGTAACGGAGGCGTGCAAAGGTTTCCTCGGGCCAGACGGACATTGGTCCTCGAGTGCAAAGGCAGAAGGGAGCTTGACTGCAAGACTCACCCGTCGAGCAGAGACGAAAGTCGGCCTTAGTGATCCGACGGTGCCGAGTGGAAGGGCCGTCGCTCAACGGATAAAAGTTACTCTAGGGATAACAGGCTGATCTTCCCCAAGAGTCCACATCGACGGGAAGGTTTGGCACCTCGATGTCGGCTCTTCGCCACCTGGAGCTGTAGGTGGTTCCAAGGGTTGGGCTGTTCGCCCATTAATGCGGTACGTGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCCATATCCGGTGTGGGCGTTAGAGCATTGAGAGGACCTTTCCCTAGTACGAGAGGACCGGGAAGGACGCACCTCTGGTGTACCAGTTATCGTGCCTACGGTAAACGCTGGTAGCCAAGTGCGGAGAGGATAACTGCTGAAAGCATATAAGTAGTAAGCCCACCCCAAGATGAGTGCTCTCTCCTCCGACTTCCCTAGAGCCTCCGGTATCACAGCCGAGACAGCGACGGGTTCTCCACCCATACGGGGATGGAGCGACAGAAGTATGGAAATAGGATAAGGTAGCGGCGAGACGAGCCGTTTAAATAGGTGTCAAGTGGAAGTGCCGTGATGTATGCAGCTGAGGCATCCTAACGAACGAACGATTTGAACCT\n>DF157098.1/956789-956946 Plasmodium cynomolgi strain B DNA, chromosome 6. \nTAACTGGCTTTTGGCTGCCAAGCGCTCCTAACGACGTAGTTTTTTGATCCTTCGATGTTGGCTCTTTCCATCATTGGGACGCAGAAGTCTGAAAGTATCGGATTGTTCACCTGCTAAAAGGGAACATGAGCTGGGTTTAGACCGTCGTGAGACAAGTT\n>D90215.1/1270-1191 Nicotiana tabacum par gene, partial cds. 
\nCTAACAAGGGGATAAAAAAATTCAAATGTGAAACAACTAATATTCAAATGTACGACGACCTTAAACAGCTCGGTGAAACT\n>HG719501.1/1361-1 Eimeria maxima Weybridge genomic scaffold, Emw_scaff1073 \nAGACCTGAAGTCAGTCGAGGTTACTCGCTAAATTTAAGCATATTACTAAGCGGAGGAGGAGAAAATAACACTTCCCTCTAGGGAAGAGCTCAAAGGGAAAATCGTGAGTCCCTTTTGACCTCACGAATTGTAGCCTCTTGAGGCGTTGCCAGTGGGCGGGCAGGCTAAATATTGACGTGAGACCGATGGCGAACAAGTACTGTTAAGGAAATGTGAAAAGGACTTCGAAAAGAGAGTTAAAAGTGTCTGAAATTGCTGAATGGGAGGCGATTGAAACTTTAGTCTCTTCAGGGTGCGGGTGGATATTAGTTGTTCATTAGAAGGTAGCAAAATGCCTCGTCATCAAAATTAGTGAGGTGCATGAATGGATTAACGAGATTCCCACTGTCCCTATCTACTATCTAGCAAAACCACAGCAAAGGGAACGGGCTTGCCGGAATCAGCGGGGGAAGAAGACCCTGTTGAGCTTGACTCCAGTCCGACTTTGCTGAACGACTTGCGGGGTGTATCATAGGTGGGAGCTCCGACGACCGTGAAATACCACTACCCTCAATGTCACTTTACCTATTCCGTTAAGTTGAGATGCATGCTCGGCATCTGTTGAAGTCTTAAGGCACCCTTTTGGATCCGATAAATGCGGAAGACACAGTCAGGTGGGGAATTTGGCTGGGGCGGCACATCTGTGAAACAATAGTGTAGGTGTCCTAAGGCAAGCTCAATGAGAACAGAAGTCTCATGTTGACCAAAAGGGGAAAAGCTTGCTTGATTTTGATTTTCAGTGCGAATACAAACTGTGAAAGCATGGCCTATCTATCCTTTAGGTCTGAGAAACTTTCAGCTAGAGGTGTCAGAAAAGTTACCACAGGGCTTGTGACAGCTAAGCGTCCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGAGACGCAGAAGTCTCAAAGTGTCGGATTGTTCCCCCGCCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATAAAATTGATACTGCGACAGTAATCCAACTTAGTACGAGAGGAACAGTTGGTTCAGATACTTGGTTAATACGGCTAGCTGAGAAGCTGGTGCCGCGAAGCTACCATCTGTTGGATTATGACTGAACGCCTCTAAGTCAGAACCCATGCTGGCTAAGCAGTGTTTCGCATTGCCCCATTTGTTACTTGCATATGGTTTTAGTGCCTTTTGAGCACAACATCTCATCAAAGCCCTTTGCGTCATGCGCTGGGCTATAATCACAATTTCCCACAATTGAGGCGCTACATCCATTGCAGACGACTTTGGCGCAACCAGGTATTGTAAGTGT\n>CP003171.1/2269902-2269995 Oceanimonas sp. GK1, complete genome. \nGCCCGGCGTCGGGTGTTCTCTTACTAGCGCACGGCTCAGCTAATGAGCCATTCCCCTGAGCCAGGTACACGGAATTTGTACCTGGCTTTTTTTG\n>AACT01014037.1/2025-2536 Ciona savignyi cont_14037, whole genome shotgun sequence. 
\nTTTGGCCGCCAAACCATTGCAAATACCCGAAAGATGGTGAACTATGCCTGAGGAGGTTGAAGCCAGAGGAAACTCTGGTGGAGGACCGTAGCGATTCTGACGTGCAAATCGATCGTCAAATTTGGGTATAGGGGCGAAAGACTAATCGAACCGTCTAGTAGCTGGTTCCCTTCGAAGTTTCCCTCAGGATAGCTGGCGCTCTGTCGCAGTTTTATCTGGTAAAGCGAATGATTAGAGGTCCTTGGGGGCCGAAACGCCCTCAACCTATTCTCAAACTTTAAATTGGTAAGAAGCCCGACTCGCTCGTTTGGAGCCGGGCATGGAATGCGAGTGCCAAGTGGGCCACTCTTGGTAAGCAGGACTGGCGATGCGGGATGAACCGAACGCCGGGTTAAGGCGCCCGACGCGACGCTCATCAGAGCCCCAAAAGGGTGTTTGGTTGATATAGACAGCAGGACGGTGGCCATGGAAGTCGGAAACCGCTAATGGAGTGTGTAACAACTCACCTGCCG\n>CM000236.2/115408586-115408648 Rattus norvegicus chromosome 6, whole genome shotgun sequence. \nGAATGAACACAGCTCTTTTAGAATTTTCCTAACAAGATTTCTGACTTTGGTCAGAAAACCCAA\n>HG417174.1/11014915-11014980 Oryza rufipogon genomic scaffold, chr10 \nAGGCCGATGATGCTAATCATGCTCCTATGGTTTTTCTCTAAGAATGTTTCCCAAGAGCTGAGGACC\n>JH835324.1/5005558-5005616 Erinaceus europaeus unplaced genomic scaffold scaffold00036, whole genome shotgun sequence \nCTCTGTAAAACTTTTCCTATGCTGGGTAGTAAAAGACACCTTGTTACCTGAATGGACAG\n>LMQS01000004.1/71000-70919 Methylophilus sp. Leaf416 contig_4, whole genome shotgun sequence. \nCCTTCTGAGGAACGCTGCGAGAGTTTCATACTCCCAGGCTCAGAGTGATAGCTGCGAAGCTTCTCAACTGCGTTCACTTTTC\n>CM001441.1/4265140-4264954 Desulfosporosinus youngiae DSM 17734 chromosome, whole genome shotgun sequence. \nTGTATATTGGAAAATAAAGGTGCGCGTACTACATAGTACAGCTTAAAAGGGAAGCAGGTAAAATTCTGCACGGTCCCGCCACTGTAATGGGGAAATGTTTTATACTAATAGCCACTAGTCCTACCGGGAAGGCGTAAAGCATTGATGAACCAAAGTCAGAAGACCTGCCTTTGTTGAATGAACCAAT\n>JEMT01029493.1/3587-3436 Rhizophagus irregularis DAOM 197198w jcf7180003195098, whole genome shotgun sequence. \nATCCTCTCTTGCCTATTGGCTAAGATCAAGTGTAGTATCTGTTATTTTCAGTATAATATCTGAAACTTTACACACAGGAGTTCCTTGGCTTGCCAATACTCCCTCATGAGTGTCCCTATTATTGCACTACCTCTAGGCGACGCTCACATTTT\n>URS0000D68632_7029/1-72 Acyrthosiphon pisum (pea aphid) type-P1 twister ribozyme \nUUUUUAAUCAUACCAGUAGUCUAAUUUUUAGAUUACUGACAGUCCUAAGUCUGUAAAAAAUGAGAAGGGAAA\n>LXGJ01000084.1/21313-21202 Bacillus sp. WF146 contig084, whole genome shotgun sequence. 
\nCGCCTCTTTAACCGCAATCCCGTGAGGTTGCGAAGAGGTTTACGCGCTTTCCATGCCCATGGAAGGATGGAAGGAGTATGCCTCTTTGTGCCCGCACAAAGAGGTTTTTTGT\n>MAVT01008674.1/885-718 Diaporthe helianthi strain 7/96 Scaffold_5759.1, whole genome shotgun sequence. \nTATTATTCAATGGGCAATCCGCAGCCAAATACTAAGTTTAGGTGTAGTCTTATTTAGTATGCAGTTCATCGACTAAACGGGTGTTGGTTTAATTTAAAATATACTGTAGTTAATAGTAAACCTTAAATTAGGCTTAAGATATAGTCAGTCCTAATATGAAAATATTGG\n>MCOG01001818.1/1-185 Neocallimastix californiae strain G1 LY90scaffold_1818, whole genome shotgun sequence. \nCATACAAGAGGACCCCGGTTCAGGCGTGGAAGTATGTCCTGTTCTCGTCCTTGAATGATAACTTCAAATATTAATGAGGATAAATCCTTTGCAGACGACTTAAATTTATAAACTAGGTATTGTAAGCAGTAGAGTAGCCTTGTTGCTACGATCTGCTGAGATTAAGCCTGTGTTTACTGATTTGT\n>GG665194.1/8635-8474 Plasmodium falciparum IGH-CR14 genomic scaffold supercont1.236, whole genome shotgun sequence. \nNNNNNNNNNNNNNATGTTAACAATAATTCATGATGTAAAAATGTTATCCAGTGATGTTTTTATTAGAGGCTAAAAAAAAATGTTTATGCAATGATAAAACGAGTTAAGCATTTTTTTTTAAGTTGCCGACTCACCTGACATTGGAACAACCAAAATTATTGT\n>AYCK01025824.1/19605-19691 Poecilia formosa, whole genome shotgun sequence. \nATTTGCTGCACGCAATTTGCGTACAATATAGCATAAAGTTACAGTTAGTATTTATGCTATATTGTACGCAAATTGCGTGCAGTTACA\n>JOKI01000015.1/68827-69021 Rhizobium sp. R1-200B2 contig_15, whole genome shotgun sequence. \nAGTCAGCACAAGGAGGCAGACATGGGACGCGCTTACTCTCTGAATGTCCTGGCAGTTGGTGTAGCATTCGTATTCGTGGCTTCCATGCTCTTCATTTGAGCGCCACAGTTTCACAACTACCGGTCATATCTGGCATCCGTGACAATCATATAAAGATTTGAAAGCAGGAAACGCAGCTCCATCGGGCTGCGTTTC\n>URS0000D698DF_12908/1-132 unclassified sequences RT-16 RNA \nCTAGCAAACCGTTTTTACGAAGTCAGCTAGTTATACGCTTATTTACTATGGGAGTTTACTCTTATAAAATGCAATCACGACACCTAATGTGTGAAGTGGTGGTGAAAACAAGAAGTAAATAAGCTAACTTGG\n>AE009948.1/273558-273684 Streptococcus agalactiae 2603V/R, complete genome. \nGCTGTTTTTTTAGCGAGCTCAAGGTAGTGAAAGTTGGGTAGAATAGGATGAATATTGGCACTTTTTAGTGAGTAAAAGTACAATCAAAAATGAAGTAATAAATTAGGGTGGAACCGCGTCTTTGACG\n>GL830965.1/1574-57 Succinatimonas hippei YIT 12066 genomic scaffold Scfld66, whole genome shotgun sequence. 
\nATAATGAAGAGTTTGATCATGGCTCAGATTGAACGCTGGCGGCAGGCTTAATACATGCAAGTCGAACGGTAACATAGCGAAAGCTTGCTTTTGCTGATGACGAGTGGCGGACGGGTGAGTAGTATCTGGGAAACTGCCCTGAAGAGGGGGACAACAGCTGGAAACGGCTGCTAATACCGCATAAACCCTGCGGGGGAAAGGAAGGCAACTTCCGCTTCAGGATGTGCCCAGAAGGGATTAGCTAGTAGGTGAGGTAAAGGCTCACCTAGGCGACGATCTCTAGCCGGTCTGAGAGGATGACCGGCCACATCGGGACTGAGACACGGCCCGGACTCCTACGGGAGGCAGCAGTAGGGAATATTGCACAATGGGGGGAACCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGCGGGGAGGAAATTAAGTTAGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATAACTGGGCGTAAAGGGCACGCAGGCGGGCTGATAAGTAAGGTGTGAAATACCGGGGCTCAACCTCGGGGCTGCATTTTAAACTGTCAGTCTAGAGTATTGCAGAGGGAGACGGAATTCCGGGTGTAGCGGTGAAATGCGTAGATATCCGGAAGAACACCGGAGGCGAAGGCGGTCTTCTGGGCAAATACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCGATTAGGAGATTGAGCAGAAGCTTGGTTTTCGGAGCAAACGCGCTAAATCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGACCTTGACATCTGAGGAATGCCTGAGAGATTTAGGCAGTGCCTTCGGGAGCCTCAAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCCTTTGTTGCCAGCGCGTGATGGCGGGAACTCAAAGGAGACTGCCGGTGACAAACCGGAGGAAGGCAGGGATGACGTCAAGTCATCATGGCCCTTACGGTCAGGGCTACACACGTGCTACAATGGGGCGTACAGAGGGAAGCGAGGCCGTGAGGCGGAGCGGAGCCCACAAAGCGTCCCACAGTTCGGATTGGAGTCTGCAACTCGACTCCATGAAGGCGGAATCGCTAGTAATCGCAAATCAGAATGTTGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGATTGCACCAGAAGTGGCTTGCCTAACCCGTAAGGGAGGGCGGTTACCACGGTGTGGTTTATGACTGGGGTGAAGTCGTAACAAGGTAACCCTAGGGGAACCTGGGGTTGGATCACCTCCTTA\n>JH835900.1/331024-330895 Erinaceus europaeus unplaced genomic scaffold scaffold00612, whole genome shotgun sequence \nCTCCATGAATCTTTGAGTCCTGTTGACTGTGGCAAATATCCTTCCTAGACACAGAAGAGCATATTCTTGTATACTGACATAGCTGCCATCAGTTAATTGATTTCAGTTCTAACTTTCACAAGTAACATTT\n>AANH01013162.1/16565-16141 Gasterosteus aculeatus cont1.013161, whole genome shotgun sequence. 
\nCCTCTTCAGACTCTACCTCGACTAAAGACTAACAAATTGTAGCACTTAAATTGTACTTGTAACGTGACTCATCTATAGCAAATTGTAAATTGGCTTATTTGAGGAAATTGCACTTTCTTGTTTCTTGTTCTCCTTTGTACCCTATGGTTGAATGCACTTATTGTACGTCGCTTTGGATAAAAGCGTCCGCTAAATGACATGTAATGTAATGATGGTGTCAAGCGCCTGGCTCAGACGGTGCGGTACACCTGTCAAACGGTAACGCAGGTGTCCAAAGGCGAGCTCAGGGAGGACAGAAATCTCAGAAGGGCAAAAGCTTGCTTGATCTTGATTTTCAGTATGAATACAGACCGTGAAAGCGCAGCCTCACGATCCTTCTGGCGTTTTGGGTTTTAAGCAGGAGGTGTCAGAAAAGTTACCACAGG\n>ABLF02002078.1/866-1 Acyrthosiphon pisum strain LSR1 Contig2110, whole genome shotgun sequence. \nCCGGCAAGCCTCGACGAGTAGGATGGCGCGGCGGTGTGCGTCGAAGGGCAGGTCGCGAGACCGCCTGGAGCCGCCGTCGGTGCAGATCATAGGTGGTAGTAGCAAATACTCGAGAGGGGCCCTCGGGGGCTGCCGTGGAGAAGGGTTTCTTGTGAACAGCCGTTGTCCAAGAGTCAGTCGATCCTAAGCCCGGGGAGAGATCCTCGTACCACGGGCGAAGGCGTTTTCGAATCGCCCTTGGGGCGAGAGGGAATCCGGTTCGTATTCCGGAACCCGACGCGGAACCGCTCCCTAGTGTTCGGGGCTCTTTTGTCTCGTCTGGGTAACCAGAATGAACTCGAAGAAGCCGCCGGGGGATCTGGGTAGAGTTCTCTTTTCTCTGTGAGCGTTGTACGTCCCTGGAATCCTCTAGCCGGGCGATAGGGACGCGAGCGCGAAGAGCACCGCTCGTTGCGGCGGTGTCCGTGATCCCCACGCGGACCTTGAAAATTCGAGAGAGGGCCACGCGGAGTCTTCGCGTCGGTTCGTACCGATATCCGCAGCAGGTCTCCGAGGTGAGCAGCCTCTAGCCGCATAGAATAATGTAGGTAAGGGAAGTCGGCAAAACCGATCCGTAACTTCGGGATAAGGATTGGCTCTGAGGAGCGTGGCTGCCGGGTTCGGGTCGTCGTAGAAGCGTAGGCGTTTTTGGCGACACCCCGGCCGTCGCCCGTGCGCCCGGTCTTCGGAACGGGAGCCTCGAGGCGGCCGCGGGCCCGTCGCCGTCCGCCGACCGTGGAACCACCGAGCTTCGGTCGCTGGCCGCGTCGCGGCCGGCCGACCGCACATTGGTGTCGGTTCGCCGTCACCGGGCGGTCCGGCCGCCG\n>AYUG01116302.1/14860-14978 Fukomys damarensis contig116302, whole genome shotgun sequence. \nCTCTAGCAAAGTAAGTTTCTTTACTTGTGGATGCACAGTGGCTTCACACAGCAACTCCTTTAGTTGTGTACACAGACTATTGTTTGTATGGGTCGCCCTAAGGGACCTTAAAGAAGTTT\n>KK502427.1/433055-433166 Glossina austeni unplaced genomic scaffold Scaffold27, whole genome shotgun sequence. \nGGCAAGGGCACTCTGTGACACTTGTTATTAATTTTAAAGTGTAAACAATTTGTTACCTTGCCAGAATAAATCAATTACGTAAAACCTTAACCAATGTCGTATTATAGATTGA\n>CM000999.2/44792791-44793384 Mus musculus chromosome 6, GRC primary reference assembly. 
\nTTCTATAATTCTTTCTATACGAGTACACATTTTCATCTTGCAAGAAACAACCAAAACTAATTTAAGAAATATTATCAAACATGTTAATAAAAATTGAGTGTTAATAAAAATAACTAAAATACAAAATTATTGGATACTTAGATGGTGAACTATGCCTGGGCAGGGCGAAGCCAGAGGAAACTCTGGTGGAGGTCCGTAGCGGTCCTGACGTGCAAATCGGTCGTCCGACCTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCTGAAGTTTCCCTCAGGATAGCTGGCGCTCTCGCTCTTTTCCCGACGTACGCAGTTTTATCCGGTAAAGCGAATGATTAGAGGTCTTGGGGCCGAAACGATCTCAACCTATTCTCAAACTTTAAATGGGTAAGAAGCCCGGCTCGCTGGCGTGGAGCCGGGCGTGGAATGTGAGTGCCTAGTGGGCCACTTTTGGTAAGCAGAACTGGCGCTGCGGGATGAACCGAACGAATTATATTTTATATAATGTATATGAAATATCAAATATTAAGGAATGACATTTGATTTTGTTGTGTAATTGTATCATGCATCTTTT\n>MRAE01000082.1/2029-1 Clostridium sp. IEH 97212 scaffold_81, whole genome shotgun sequence. \nCGCAAATAGGCAGAGATCCAGGGATTTCCGAATGAGGGAACTCACATGGGTAACCCCATGTATCATGCACTGAATACATAGGTGTATGAGGGTAAACCCGGGGAACTGAAACATCTAAGTACCCGGAGGAAGAGAAAGAAAAATCGATTTCCTAAGTAGCGGCGAGCGAACGGGAAAGAGCCCAAACCAGAAACTTGTTTCTGGGGTTGAGGATAGATCATAAAAGAAGAGGTATCTTAATCGAAAAGGGCTGGAACGCCCTACCATAGAAGGTAATAGTCCTGTAGATGAAAAGAGAAAACTTCGAGATCTAATCCAGAGTACCACGAGACACGTGAAACCTTGTGGGAAGCAGGGAGGACCACCTCCCAAGGCTAAATACTACCTAGTGACCGATAGTGAAGCAGTACCGTGAGGGAAAGGTGAAAAGAACCCCGGGAGGGGAGTGAAATAGAACCTGAAACCGTGTGCCTACAACCGATCGGAGCACGTTAAAGTGTGACGATGTGCTTTTTGTAGAACGAGCCAGCGAGTTACGCTATGTAGCAAGGTTAAGTACTTAAGGTATGGAGCCGAAGGGAAACCGAGTCTGAAAAGGGCGAAAAGTTGCATGGTGTAGACCCGAAACCGGGTGACCTATCCATGGCCAGGTTGAAGCGAGAGTAAAATCTCGTGGAGGACCGAACCACGTTGGTGTTGAAAAACCATGGGATGAGCTGTGGATAGCGGAGAAATTCCAATCGAACTCGGAGATAGCTGGTTCTCCCCGAAATAGCTTTAGGGCTAGCGTCGTGTAATTGAGTAATGGAGGTAGAGCACTGAATGGGCTAGGGGCTATAGTAGTTACCGAACCCTATCAAACTCCGAATGCCATATACTTGTATCACGGCAGTCAGACTGCGAATGATAAGATCCGTAGTCAAAAGGGAAACAGCCCAGACCATCAGCTAAGGTCCCAAAGTGTAAGTTAAGTGGAAAAGGATGTGGGATTTCTAAGACAACTAGGATGTTGGCTTAGAAGCAGCCACTCATTTAAAGAGTGCGTAATAGCTCACTAGTCAAGAGATCCTGCGCCGAAGATGTCCGGGGCTCAAACTTACCACCGAAGCTATGGGGTGTACACTATGTGTACGCGGTAGGGGAGCTTTCTGTATGGGTTGAAGTCGTACCGTAAGGAGTGGTGGACTGTACAGAAGTGAGAATGCTGGCATAAGTAGCGAGAAATAAGTGAGAATCTTATTGGCCGAAAACCTAAGGTTTCCTGGGGAAGGCTCGTCCGCCCAGGGTTAGTCGGGACCTAAGCCGAG
GCCGAAAGGCGTAGGTGATGGACAATCGGTTGATATTCCGATACCACCTATTTACGTTTGAGAGATGGGGTGACGCAGTAGGATAAGATGTGCGCACTATTGGATGTGCGTCTAAGCATTTAGGCATGCTTGATAGGCAAATCCGTCAGGCTAAGCTGAGATGTTATGGGGAGCCAAATGTGGCGAAGTATCTGATTCCACACTGCCAAGAAAAGCCTCTATCGAGTAAATAGGTGCCCGTACCGCAAACCGACACAGGTAGGTGAGGAGAGAATCCTAAGGCCATCGGAAGAATTGCTGTTAAGGAACTCGGCAAATTGACCCCGTAACTTCGGGAGAAGGGGTGCCTACGAAAGTAGGCCGCAGAGAATAGGCCCAAGCAACTGTTTAGCAAAAACACAGGTCTCTGCTAAAGCGAAAGCTGATGTATAGGGGCTGACGCCTGCCCGGTGCTGGAAGGTTAAGGGGAACACTTAGCGAAGCGAAGGTGTGAACTTAAGCCCCAGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCCGCACGAATGGCGTAATGATTTGGGCACTGTCTCAACAGCAAATCCGGCGAAATTGTAGTGCAAGTGAAGATGCTTGCTACCCGCGATTGGACGGAAAGACCCTGTAGAGCTTTACTGTAGCTTAGCATTGAATCTCGGTATTGTCTGTAC\n>KV454051.1/1465-1655 Pachysolen tannophilus NRRL Y-2460 unplaced genomic scaffold PACTA_scaffold_41, whole genome shotgun sequence. \nACCTGTTTGCCAACACTCTGGTGCCGAATCAAAAAGATTTTATATATTTCTTTTTCGATATATTCGGTTCCTATTTTGGAGCAAACTAGATTGATTTAGCCAATTACTCACCATAATATTCGTGATTTATTTAAAAAAAATTTTTTTTTTAGATTAAGATGAATATGATGGTCCATTTCAGTGGCGTAAAT\n>ACSJ01000007.1/1211646-1211440 Clostridium botulinum D str. 1873 CLG.Contig181, whole genome shotgun sequence. \nCAATAAAATATAAAAATAGGTGTCAGTTATAATAAAAATTTTAATTATGAACTGGTGAAAAGGGAAGATGGGTGTAAATCCTACACGGTCCCGCCGCTGTAAATGAGGAGCTTTTTTATGTGTAACCACTGGTGTTATTTATACTGGGAAGGATAGAAAAGTGATGATACTTAAGTCAGAAGACCTGCCTATTTTTGTACACCGATG\n>ALAR01116409.1/116042-115647 Tupaia chinensis contig116409, whole genome shotgun sequence. 
\nAAAAGAGTAATGAAATTTCAAAACAAAATATAGAAGCTACATGGTCACTTTTACCAGCTTATGGTGAAATGAAAGGGAAAAAGGATGATTTCAAGAAAGAATTTATAATGAAAAGGGAATTAGGTTCAGTCCTCTGACTCCAGAGCGACCAAAATGGGCACTGCGGCGGGTCCAGTGCAGTGATGCAATCATCCTGGAGAAGCTGCTTGAGTCCCTGGGGAGAGTTCTCTTTTTTGTGGACATAGTGGGGTCACCCCGGGGAAGGGGTCCATGCCTTTAAAATGCTGTGGTTCCCGTAAGTTCTTACTGGCCCTTAAAAAATACAAGGGAGAAGGTATAAATCTACCACCAGGCCACACACATATCCGCAGCAGGTGTCCAAGATAAACAGCCTCT\n>KZ248601.1/687242-687373 Danaus plexippus plexippus isolate F-2 unplaced genomic scaffold DPSCF300057, whole genome shotgun sequence. \nGCTGGCTTTTATCGAAGCTCTCATATTTTTCCTATAAATATGGAAGTCAAACAAAGCCTATAGTGAAGATCTCTATCGGTCGCGGTCTAGGTAAATCATACCTCTAACGTATCACCAAGGAGGTCAACAGTT\n>LRGB01001036.1/60242-60133 Daphnia magna strain Xinb3 scaffold01036, whole genome shotgun sequence. \nTCCTATTGTACCGCAGCTGCTGAACACTGCCCAAGATTGGCGTGAACAATTCTAACGGAAGGCAACTCTTGTGCGTGTGACAGCGGCTATGGTATTCAGGAAATATCTTC\n>AACT01048137.1/180-1 Ciona savignyi cont_48137, whole genome shotgun sequence. \nTACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCAAGTCTAAGTACGAGCTCTCGTACAGTGAAACTGCGAATGGCTCATTAAATCAGTTATGGTTCATTTGATCGTACAGTTTACTTGGATAACTGTGGTAATTCTAGAGCTAATACATGCGAGAAGCG\n>ACJG01011252.1/789-1 Daphnia pulex DAPPUscaffold_852_Cont11252, whole genome shotgun sequence. 
\nCGACCTGAGAGCAGGCAAGGTGACCCGCCAAATTTAAGCATATTAATAAGCGGAGGAAAAGAAAACAACCGTGATGCCCTTAGTAATGGCGAATGAAACGGGCAGAGCCCAGCACCGAACCGCCGGCCATCCAGGTCGCGCGGAATGTGGTGTTTGGGGGAGCCTCCTCGCGACGCGTCGGCCGGTCCAAGTCCACCTTGACTGGGGCCACGGCCCACAGAGGGTGATAGGCCCGTAAGACGGCCGATGCGTTGTGCCGGCTTTCCCCTAGAGTCGAGTTGCTTGGGAGTGCAGCTCAAAGTGCGTGGTAAACTCCACGTAAGGCTAAATATGACCCCGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGTTGAAAAGAACTTTGAAGAGAGAGTTCAAGAGTACGTGAAACTGTGTAGTGGTAAACGGAGGGGCTCTCGAAGTGGGTCTCGGAGATTCAGGTTGGCGGCCGGGCGGCCGGGGCGAGCGCGATCCGCGAGGACGCCTCGTTTCGGTCGGCTCGGTCGGCGGCTGCACTTCTCCGGGACTTGACGCGACGAACCGCTGTCTGCGGAACGAGGACCGGGGTGAAGTTCGTCGTCCTCACGGGCGGCGAGCCCCCGGCTCCTGTCTTCGCGGGCGGCGGGTATCTGAGTCGACTTGTATAGCAAGCCCTCTCGCTAGGGCGGTCGGCATCTCTGTCGCGAGTAGGTCGGCGGCCCCTCCGACCCGTCTTGAAACACGGACCAAGGAGTCTAACATGTGTGCGAGCCATTGGGCGGACTAA\n>CM000780.4/228503464-228503665 Zea mays cultivar B73 chromosome 4, whole genome shotgun sequence. \nATACCTTTGTCGACCTGTTGACTAAGATAAAGTGTAATGTTTGTTCTTACTAGTTTGATATCTGATATGTGGATCGTATGTTCACTTTATTAAATTTTATTTTTTTATGGGTATCAAATATGATTGTGTGTCTATCGGGGTGATAATTAGGGGTACCCAGATTATCCCTCCGAAAAACGCACTCAGGAGAAGTAAACACATA\n>KN819335.1/889548-890013 Paxillus involutus ATCC 200175 unplaced genomic scaffold PAXINscaffold_13, whole genome shotgun sequence. \nACAGTCCGAAAGTTACGATGCTCACCACACACTGCAAGACATGTCAAAGATCGTGAGTAGACTAAGGTCTGAGTATTCTATTCTCAATCGACTCTTCCTGGGTTCATTCCTAACGGACTGCGCGATGTCCAGAAATGCAATAGCCAGTTTCCCCACGGTTACTGAGTTAGTAGGGACGGACAACTTTGAAAATGCGTCGCAGAGATCGGGTGAGCACCTTTCCTCACTTGATTCCCTGTTGCGGTAGACGTGCCCATCATTGCGCGCAACGTGATCGCGTTCTTCGTTCGCATTCATGTCCGCGTATTAGGACATCGGGTCCGACGAATCAACCGCGGCTCGTACTAGCAGTCATCAATACTACACCCCATCACGCGACTGCAACCAAGTCAACTCGATTATTTTTTCTCGTACGAGATTTTTCAATCATCTTTTGAAACTCGATTCAGACTACTCTTAGGACTGT\n>AASG02001279.1/18109-18241 Ricinus communis ctg_1100012357581, whole genome shotgun sequence. 
\nTGTCATGCTTTTCCACAGCTTTCTTGAACTTCTTCTTCTTCTTCTTCTTCTTCTTAGATTTCTTTCTCATTGCCTATATCTTTCTTGATGTGGCACAGAATAAGTTCAAGAAAGCTGTGGGAGAACATGGCAA\n>JH835358.1/2695321-2695604 Erinaceus europaeus unplaced genomic scaffold scaffold00070, whole genome shotgun sequence \nGGATCTTAGTGTGATCTGGCTGTGACATCTGTCACCCCATGGATAACATGGGTTGATTTGGCTGGTCTGGCTCGCTAGACGAGTGTCCTCTTCCTCCCTCACTGCTCCTTGTACGTTCAGTCAAAGAGGACAACCTTCCTGAGTCTTGGGTCAAAGGGTATACGAGTAGCTACACTCCCCTGCTAGAACCTCCAAACAAGCTCTCAGTAAGTTTTGCTCTTTATTTTTTTCCCTTTTGTTGCTTATCTTTGTTACTATTATTGTTGTTACTGCTGTCGTTGTTG\n>CM001941.2/563785-564154 Chlorocebus sabaeus isolate 1994-021 chromosome 1, whole genome shotgun sequence. \nGCCGGGCATGGAGATGTGCACCTGTAGTCCCAGCTACTTGGGAGGCTGAGGCGGGCGGATCACTTGAGCCCAGGAGGTCAAGGCTGTAGTGAGGCGTAATCACACTACTGCACTCTAGCCTGAGCGACTGAGACCCTGTCTTGGAAAAAAGAAAAAAAAGGATAAGATGGGACATTTTACATTATTTTTTTTTTTTTTTTGAGACGGAGTCTCGCTTTGTCANNNNNNNNNNAATGTAAAATGTCCCATCTTATCCTTTTTTTTCTTTTTTCCAAGACAGGGTCTCAGTCGCTCAGGCTAGAGTGCAGTAGTGTGATTACGCCTCACTACAGCCTTGCCCTCCGGGGCTAAAGTGACCCGCCCGCCTCAG\n>GL018725.1/468056-468262 Oryctolagus cuniculus unplaced genomic scaffold chrUn0027, whole genome shotgun sequence. \nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGCAGAATCTCTGTTTCAGAGTCCCCCAGCCATCACGGCGCCTGCGGTCCCTTTTTTTTTTTTTTTTTTGACAGGCAGAGTGGACAGTGAGAGAGACAGAGAGAAAGGTCTTCCTTTGCCGTTGGTTCACCCTCCAATGGCCGCCGCGCTGATCCGATGGCAGGAGCCAGGTACTT\n>MRDE01000088.1/1-303 Tersicoccus phoenicis strain 1p05MA scaffold90_cov825_read201, whole genome shotgun sequence. \nGTGACGGCACTTCGCGTGCTCGAGCGGGTGTGGGCCGCAGAGACCAGGGGGAAGCGACTGTTTACTAAAAACACAGGTCCGTGCGAAGTCGCAAGACGATGTATACGGACTGACTCCTGCCCGGTGCTGGAAGGTTAAGAGGACCGGTTAGCGCCCCTCGCGGGTGCGAAGCTGGGAATTTAAGCCCCAGTAAACGGCGGTGGTAACTATAACCATCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGAGTAACGACTTCCCCGCTGTCTCAACCATAAACTCGG\n>CM000380.2/94669007-94668751 Equus caballus chromosome 4, whole genome shotgun sequence. 
\nTCGAAGTTTCCCTCAGGATAGCTGGCACTCTCACATGTGAACCCAGGCAGTTTTATCCAGTACAACGAATGATTAGAGGTCTTGGCGCCAAAACGATCTCAATCTATTCCCAATGGGTAAGAAGCCCACTGGCATGGAGCTGGGCATGGAACACAAGGGCCTAGTGGGCCACTTTTGGTAAGTAGAAGTGGCACTGCACGATGAACTGAACACCAGGTTAGGCATTGATAACTTGATAACTATAGTTTTATAATAGA\n>CM000941.1/92177923-92177799 Anolis carolinensis chromosome 5, whole genome shotgun sequence. \nATTTTCCTGACTACTGAAATGCCCTCAATGTACCACATCCCATTTGATCTTGGAAACAATGCAGGATTAGTCCTGATTAGTACTTAGATGGGAGACCACCAACGAATACTAGGAACTGTAAAAAC\n>LBBL01000003.1/104201-103670 Ceratocystis platani strain CFO contig_00003 mitochondrial, whole genome shotgun sequence. \nGAGTTTGGTGATGGCTCTGATTGAACGCTGTCTAAGTGCTTGACACATGCTAATCGAACGATTAATACAGTTAAAAAAAAACTAAATTAATAGTGGTGTACAGGTGAGTATAAGATATTTTTGCCGACCTTAAAGTAAGAGGACAATAAGATCTCTTATAAACAAAAGGGTTGTACCGCTTTAAGAGGATGAGAAATATCATAGAGAGAGGTAGTTGTTAAAGTAATGATTTAGCTAGCCGCAGATTCTCTTAGTCGAAACTGAAAGGTTGATCGACCACATTGGGCCTGAAAAAATCCCAATGCAAAAACGTACAGCAGTGAGGAATATTGGTCAATGGTCTAACGATCGAACTGGCAACTTAGGGAAATGGATGATATAAAATAATTATATAATAAAGTTTATATAATAATTATTAATATGCAATAGTTGTGAAGTTTTGTCTACATATTGATAATGACAATATGTATAAACAGTCTCGACTAATTACGTGCCAGCAGTCGCGGTAATACGTAAGAGACAAGCGTTATTC\n>CM000762.3/2300100-2300430 Sorghum bicolor cultivar BTx623 chromosome 3, whole genome shotgun sequence. \nCTCCCAAGAAACCTCAGGGTCCCAATGGGCCTTCATCATGAATCGAAAAGGGCCCATGGGAGAGGGAAACAGCCCGGATCACCAGCTAAGGCCCCTAAATGACCGCTCAGTGATAAAGGAGGTGGGGGTGCAAAGACAGCCAGGAGGTTTGCCTAGAAGCAGCCACCCTTTAAAGAGTGCGTAATAGCTCACTGATCGAGCGCCCTTGCGCTGAAGATGAACGGGGCTAAGCGATCTGCCGAAGCTGTGGGATGTCAAAATGCATCGGTAGGGGAGCGTTCCGCCTTAGAGGGAAGCAAACGCGAAAGCGGGGGTCGACAAAGCGGAAGCG\n>JSZA01002193.1/1101-1450 Candidatus Thiomargarita nelsonii contig_2193, whole genome shotgun sequence. 
\nAGATCATTATGAGAATCCCCGTAATGTGGGCACATTGGATAAAGAGGATCCGTCAGTGGGGACGGGCATGGTTGGCGCACCAGCTTGTGGTAAATAACATTGCCACGTAATTCTGCTATATGCAAGAAACTCTCGTTAGGTTGTAGGTACTAATGTTTAACCAAACACGCAAAATAACAAAATAGTGTGCCCAAATACTTGAGTAAAATACTCAAGTATTAACCAGATGGGTTAGTAAAAACCCTACAAATAGAGACAATTTGCAAGGAAGTCGTGGTTGACCCTTCAGAGACTATACGCAGAACATCAATGAGATGAAGACATAGTCCGAACTACACGGAGACGTGTAG\n>MKUE01000019.1/22195-22263 Thiobacillus sp. 65-1059 scnpilot_expt_750_p_scaffold_1345, whole genome shotgun sequence. \nGAACTGAAGAGTTTGATCCTGGCTCAGATTGAACGCTGGCGGAATGCTTTACACATGCAAGTCGAACGG\n>URS0000D699AF_12908/1-539 unclassified sequences ROOL RNA \nAATCAACGCGAAGGATTGTTTCAACCATGTGTATTCACAATTCCATGTGGTCATGGACGTGTTCAAGGAGTTCCACTATGGAGGATACCCCATAGGTAGGCTTTACCAGATAGGTAGAAGAGATGGAAAATCTCAACCGAGCAGGCACGGTGCTGTGATGAAACGCAAGAAAATGGTATTGCTAACTGGTCGCTATCGCAATAGATATGAGGTACGCACCTCATTGAACCAAGTAGAGGATAGTGTGGCAGCTATGTCAATCGCTTGGAGTGCCATAAGATAGTTGTCCAATTGATGCTGGTAATCAGATATAAGACCAGACGCGAGTACGAGTAGCCCAAAGTTGGAATATATTAGAAGATTAATATGCTGAATGGTGGGTGAAAGTTGTTGGTAGCCAATCCAGCCATAGATTGACGTAAGTTGGGATGGAAAGATATGGGGTCGCTCCCTGTGTCTCAGCTCCATTTCCTATGTGACCGAATTACCACTACGTTTTATGAAGGTACGATGAAGATCGGAGACAATCTTTCGCGTTG\n>CM001752.1/52724704-52726253 Gossypium raimondii chromosome 13, whole genome shotgun sequence. 
\nCAAAAGAAGAGTTTGATCCTGGCTCAGAAGGAACGCTAGCTATATGCTTAACACATGCAAGTCGAACGTTGTTTTCGGGGAGCTAGGAAGAAGGAAAAGAGGCTCCTAGCTAAAGGTAGCTTGTCTCGCCCAGGGGGTGAGAACTGTTGAGAACAAAGTGGCGAACGGGTGCGTAACGCGTGGGAATCTGCCGAACAGTTCGGGCCAAATCCTGAAGAAAGCTAAAAAGCGCTGTTTGATGAGCCTGCGTAGTATTAGGTAGTTGGTCAGGTAAAGGCTGACCAAGCCAATGATGCTTAGCTGGTCTTTTCGGATGATCAGCCACACTGGGACTGAGACACGGCCCGGACTCCCACGGGGGGCAGCAGTGGGGAATCTTGGACAATGGGCGAAAGCCCGATCCAGCAATATCGCGTGAGTGAAGAAGGGCAAGGCCCGCTCGTAAAGCTCTTTCGTCGAGTGCGCGANNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTGAGACATGCCGCTTAGAGTGAAAAGTCTTTGCAACCGAAGTGAGCCGACGGAGCCGAAGTGACGGGCCAAGCTCTTCTAATTGAGCGCCTGCACGTAAGCTGTGCTGTCAGTAAGAAGGGGAGCCCGCCGCCTTTCGAATTTGAAAGCACTTTTCTAGTGTGCGCTGTTTTTGATTGCAGCTAGCGAGCGAAGAAAACGGATGGCGCGAACGCGGCTTTTCTTTCGCCTTGCTTGTTGTACTAATAACATAGAAAGGGCTTTCTTTTCTCGCTTGTTTAGTAAAGTCAAGTTTTTGGCCTTATCTTGCAGGTGACGACGACGTCGAGTTGGCGGCGGAGAAAGACTCGGCATTCAGGCGAGCCGCCCGGTGGTGTGGTACGTAGTGGGTTTAGTACGCCCCGCCAAAACAACTCCGAAACAAACGAAAAGGTGCATGCCCCCCTTCCGAGGGACTGCCAGTGATATACCTCACGAAGGTGGGGATGACGTCAAGTCCGCATGGCCCTTATGGGCTGGGCCACACACGTGCTACAATGGCAATTACAATGGGAAGCAAGGCTGTAAGGCGGAGCGAATCCGGAAAGATTGCCTCAGTTCGGATTGTTCTCTGCAACTCGGGAACATGAAGTTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATATGTACCCGGGCCCTGTACACACCGCCCGTCACACCCTGGGAATTGGTTTCGCCCGAAGCATCGGACCAATGATCACCCATGACTTCTGTGTACCACTAGTGCCACAAAGGCTTTTGGTGGTCTTATTGGCGCATACCACGGTGGGGTCTTCGACTGGGGTGAAGTCGTAACAAGGTAGCCGTAGGGGAACCTGTGGCTGGATTGAATCCTTC\n>MCGO01000050.1/321272-322593 Rhizoclosmatium globosum strain JEL800 BCR33scaffold_50, whole genome shotgun sequence. 
\nTACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTCTAAGTATAAACTCGTTTGTACTGTGTGAAACTGCGAATGGCTCATTAAATCAGTTATAGTTTATTTGATATAACCTTACTACTTGGATATCCGTGGTAATTCTAGAGCTAATACATGCAATTAAAATCCTGACTTCTGGAAGGGATGTATTTATTAGATAAAAAACCAACCCGGCAACGGTTCTTTGGTGATTCATAGTAACTTTTCGAATCGCATGACTTTACGTCGGCGATGGTTCATTCAAATTTCTGCCCTATCAAGTTTCGATGGTAGGATAGAGGCCTACCATGCTTTTTACGGGTAACGGCGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCTAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCTGATTCAGGGAGGTAGTGACAATAAATAACAATCCAGGGCTTTTGTCTTGGAATTGGAATGAGAACAATTTAAATCTCTTAACGAGGAACAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAATAGCTCGTAGTTGAATCTTGGGCCTGGTTTGGCGGTCGCGCTTTAGGGCGTGTACTGTCGGCCGGGTCTTTTACTTGCGGGGAACGTGCGTGCCTCTCGGGGTGTGTACGGGAACCGTGGCTATTACTTTGAAAAAATTAGAGTGTTTAAAGCAGGCGTAAGCTTGTATACATTAGCATGGAATAATAGAATAGGACTTTGGTTTTATTTTGTTGGTTTCTAGGGCCGAAGTAATGATTAATAGGGATAGTTGGGGGCATTAGTATTTAATAGTCAGAGGTGAAATTCTTGGATTTATGAAAGACTAACTTCTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTCAGGGGATCGAAGATGATCAGATACCGTCGTAGTCCTGACCGTAAACTATGCCGACTAGGGATCGGGCGTTGTATTTCATGACACGCTCGGCACCTTATGAGAAATCAAAGTCTTTGGGTACCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTCACCAGGTCCAGACATAGTAAGGATTGACAGATTGAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGGTTAATTCCGATAACGAA\n>AP009608.1/824477-824563 Mycoplasma fermentans PG18 DNA, nearly complete genome. \nCGGTAGTTGCTCGAGAGGCTGAAGAGGTTGGTCTCGAAAACCAATAATGGTGAAAGTCATTCAAGGGTTCAAATCCCTTACTACCGG\n>CP001719.1/360474-360390 Methanobrevibacter ruminantium M1, complete genome. \nGCCATGATGACTGAGTCAGGCTTAAGGTATCCGCCTTGAGAGCGGACGTATGAAAGTACCAGAGGTTCAAATCCTCTTCATGGCG\n>LFJF01047615.1/1-2366 Macrostomum lignano unitig_47682, whole genome shotgun sequence. 
\nACTTTTTGAGCCCCGTAATTGGAATGAGTACACTTTAAATCCGTTAACAAGTATCTATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAATGTTGCTGCAGTTAAAAAGCTCGTAGTTGGATCTGAGGACTCGAATTGGTGGTGCACCCATACGGTGTTACTGCCCGATTCGGCCTACCTAGTCGGTGCTCGCTCTTGGTGTTCTTAATTGAATGCCCTGAGTGCCCGGCAAGTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCCATTAGCCGGAATACTTCAGCATGGAATAATGGAATAGGACTTCGGTTCTATTTTGTTGGTTTTCGGAACCCGAGGTAATGATTAAGAGAGACAGACGGGGGCATTCGTACTGCGGTGTTAGAGGTGAAATTCTTGGATCGCCGCAAGACGAAACAACTGCGAAAGCATTTGCCAAGAATGTTTTCATTAATCAAGAAACGAAAGTCAGAGGTTCGAAGACGATCAGATACCGTCCTAGTTCTGACCATAAACGATGCCAACTGGCGATCCGAGATCGTTTGCTTATTTGACCTCTCGGGCAGCCTCCGGGAAACCAAAGTTTTTAGGTTCCGGGGGAAGTATGGTTGCAAAGCTGGAACTGGCAAAAATTGAACGGCAAGTGCACAACCAAGTGGTGGAAGGCCCTTGCGGCTTTAAATTTGACTCAAACCCGGAGTAAGATATTTACTTCACTTGTGTGTCGTTAACTGTTCTCCATAACGAATCAGGACACTCCAGGATCAGCTCCCCTATGAGTGTTAGCAAAGTTCAAATTCAAGAATTATTTGATTGTCCATGAGACAGTTAGAATTGAAGAGCAATTACAAAATTTGTATTATGCTATGATATTCCTAATGGTAGGTTTTAACCCTTCTAAATTGCGGCAGTGGCCTGACTTTGAGTGTAACAGGGTAATCTGGTTAGAAAATGTTTAAAGTCACTGAGACCCAGTTGGCCTTAAGTCTAAATTTCCCCCACGAACCTATTGGCTTACTCAGCGACTATATGTTCAGAGCCGCTGGGCGATTAGATAAATTCTTGCAGGCTATCAACGATCGAAATCCTTTGACCTAAGGCTTCCTACTGCACATGGCGGTACTGGTGCTTGAAGGCGGCTCCAGGTTACGATGATCCAAGACAAAAGAAAGTCTAATTAAAAAAAATACTCTCATCACCTGTTAAGCCTAAAAGACTTTGAACCAAAAAATCCGTGTGTGGAAAGGCAAGAAACTGCCTACGTAGGTACCAAAAGCTGCCCGTACGACCTTTATCTGGCTCCATTACCCGGTTTATTGAGGATTATCTGGGCAAGTGTCTTGGTCGACCACGGCTGGAATTTCGCGAAAGGCCACAAAAAGGATCAAGGGAATTTTAGGGTAATAGAAAGGAATCAAGAACTGTTACACAAAGGAAAATAAGAATTTATCGCGGTTAAAGGCGCAAAAATTGAGGGAAGTCGCTTTTCTTTGATCAGAAGCTGCTCGTTCCAAGTCTCATCGGCTGTCGTGGTGGGAAATCACTGCGATTTCAGCTGCCGTTAAGCCACGGAAGGGCCGGAGTAAACGTGAACGCTCGGCTGCTGGGACATCTAAGCGCTTTTCGTAGCAAGGATTAGGGTCATTATATGAGCCTACGGGGTGAACCTAAGGAATATTGACGGGCCAAGGGCACCACCAGGAGTGGAGCGCGCTGGCGCTTAATTGACTCCCACGGCGGAAAGACTCACGTACCGGAATTAGGACAAGCAGGGACAATTGAGAGCTCTTTCTTGATTTCGCGTGGGTGTGGTGCATGGCCCTTTGGCTCTTTAGTTGCCCGTGGAGCGATTTGTCTGGTTAATCCGTATACGAACGACTCTCTAGCCTGCTAAATAGTACGCCGAATTTGCGTGCACTGACTAGACGGACAATTTGCAAAATTTGACCAATAAAGGTACTGTGAC
AGTGCGCCTTAGAGTTCGCGCACGGCGAGCAGAAACAAGGTCTTTTTTCCTGGTTCGAAGAGCGCGGGTAATCTGTTGAATTCCCTTCGTGACAGGATTCCGGGTTGCAATTATTCCCGGTGAACGGGAATTCCCTTCCCAGTAAGACGCTCATTACCCTGACCTACTTGAGCCGAACCGGTAACTGCCCTTAGAGATTGTTGACGCCGCCAAGGTCCTCCGGATTGGTTTGCACCCGATGGGCGACTCTCTTGGCCGACTTGGTGCAACACTAGGTCGGATACTGAAAAGAAGATCAAACTTGATCATTTAGAGGAAGTAAAAGTCGTAACAAAGGTTTCCGTAGGTGAACCTGCGGAAGATCATTA\n>KZ248836.1/34641-34948 Danaus plexippus plexippus isolate F-2 unplaced genomic scaffold DPSCF300292, whole genome shotgun sequence. \nACTGGGAGCGTGGCGCCTCTTGTAATCCGTGCTACTCGGAGGTCGGGGTCGAGGGATGGTTTGAGGTTTGAGGTCCTGGGACTGAGATGGCCACAACAACCGGATGGCCACATTCAAGCCTAGTATGACTTTGATCTTCTGGAAGAGTCTAGACTCTAGAGGGTGCATTCTACGGAGGGATAACAGTTCAGGCCCAGGGAGACAACTCAGGGGCCTAGGAATCCCTTCGTACCGGGCTGGAGTGGAATTTAGCCGGGAGTGAACTAACTCAGTAACAACCTAACCGATATAACCAGACCCTTCCCTAT\n>CP001899.1/298032-298087 Ferroglobus placidus DSM 10642, complete genome. \nGCCGATGATGACCCCTCCCCTAGCTGAAGAGTGATGAATTTGCCGATTACTGAGGT\n>FAOM01693974.1/1165-1 Triticum aestivum genome assembly, contig: Triticum_aestivum_CS42_TGACv1_scaffold_693974_U_6BS-0.065204_1BS-0.034861 
\nCGGTGCGCCCCCGGCGGCCCATGAAAATCCGGAGGACCGAGTACCGTTCACGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGGTGAACAGCCTCTGGCCAATGGAACAATGTAGGCAAGGGAAGTCGGCAAAACGGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGACTGGGCTCGGGGGTCCCGGCCCCCGAACCCGTCGGCTATCGGCGGATTGCTCGAGCTGCTCACGCGGCGAGAGCGGGTCGCCGCGTGCCGGCCGGGGGACGGACCGGGAATTGCCCCTTCGGGGGCTTTCCCCGAGCATGAAACAGTCGACTCAGAACTGGTACGGNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNAACGGGCTTGGCGGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGGATAAGTGGGAGCCCTCACGGGCGCAAGTGAAATACCACTACTTTTAACGTTATTTTACTTATTCCGTGGGTCGGAAGCGGGGCATGTCCCCTCCTTTTGGCTCCAAGGCCCGATCTTACCGGGCCGATCCGGGCGGAAGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACANNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTAGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGACAGTGTCGCGATAGTAATTAAACCTAGTACGAGAGGAACCGTTGATTCACACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTGTGCCGGATTATGACTGAACGCCTCTAAGTCAGAATCCAAGCTAGCATGCGACGC\n>AEAQ01007696.1/1567-1612 Solenopsis invicta Si_gnG.contig11298, whole genome shotgun sequence. \nTTAATTGCTCCTTTTGGAGCAATAAATATTGCAATATAAAAAATTT\n>CM003288.1/100477756-100477466 Salmo salar isolate Sally breed double haploid chromosome ssa10, whole genome shotgun sequence. \nGGATGACGTGTCAGAGTTTGGGGTTCCTAATGGAAGTATCCACTCTGCATCATTTCCTCCTCATATCTTCCTTGTAGGGTACATAGTGGCCATCCTGTAACCAATTAGACAAGATATGCTCAATTTGTTCAGCATTTGGGCCGTGGTGCGGCCGGAAGCTTTGGCCTGAGGATATACGCAGCAGCTCTCGTTAAACTGAGGATCTGAGATAGTTTCTGACTTCACCATCTGGAATTCTAGTCTGGGGTTCTGCTAAAAGCTGCTGACCCACGATTCAACTCTTAAACTCAG\n>AAVT01000001.1/231300-231180 Marine gamma proteobacterium HTCC2143 1100111000176, whole genome shotgun sequence. 
\nCGCAAACCTAAGGGGTGGCTTTTGCCTGAGATGCCTTGATCTGCTTGTTACTGTCGATCAACAGCGAACCCTTGAACCTGATCCGGTTAATACCGGCGTAGGAATAGGTGTCCCCAACCGA\n>MHIN01000011.1/1-803 Candidatus Buchananbacteria bacterium RIFCSPLOWO2_01_FULL_40_23b rifcsplowo2_01_scaffold_14059, whole genome shotgun sequence. \nGAAGCTCCCAAGGGTTTGGCTGTTCGCCAATTAAAGCGGTACGCGAGCTGGGTTCAGAACGTCGTGAGACAGTAGATTCGTGCTGTCTATAAATTCGGCTATATGCTGGAAAATCCGAGAATCTTATGATACTCATCCATAAAAATTGGGTAGTGAAAATTCATAAGTGCGGACAATCAGCAGGAAACTTAATAATAGTTTGTTATTAATAATATTATTTATGTTATTGCTAACAAAATTGTCGAGAGCGGCTTCTAATAAAAAAATTATATTATTAGAAGCGTTAAAATAGTAGTGATTGTAAATACAGTAGTGGTTTATAATAACCAATCTACATAAATTATTGCCGTAGACTCGAATTATTATGAATCCTCAGAGACTATACGCCGAAATTCCGATAAAAATCGGAAATAAGATATAGTCCGAACTGCATGGCGACATGCAGATTCCGGCAGAAATTGTCGGAACGCCATAGAGCAATTGATGTTTTAAGATATGGTTTTGCAAAGTAACAGATTGTCGGTCTCCTATCCACTGTGGGCGTTGAAATTTGAGGGGGCTCATTTTTAGTACGAGAGGACCAAAATGAATAAACCTCTAGTGTACCAGCTGTCCTACCAAGGGCACAGCTGGGTAGCTACGTTTAGTTTAGATAAGCGCTGAAAGCATATAAGCGCGAAGCTGTCCCCAAGATTAGATTTCGTTATAGGCTCCCGGGAGACGACCGGGTTGATAGGCGGTAGGTGTAAGGCCAGCAATGGCTTGAGCCGAGCCGTACTAATAGCCAATTTCTATTTAACCAC\n>AP008230.1/3620544-3621014 Desulfitobacterium hafniense Y51 DNA, complete genome. \nTTAATGCTAATGACGAGAAAGAGTACACCTTAGCCGGAATGTCCAAGAGAGTCAGCGTTGGTGAGAGCTGATACAAACCGTTTGGTGGAATGGGTCTCTGAAGCGCAAGCTGAACGAATCTGCATCTTGACTATCAGGATGGAGATATCAAGTAGGCAAGCCGGGGGTTTCCCGTTACAGAAACACGGGTATCGAGAGCATGGATCATTCTCTCCGCATCCGGTTAGAGGTATGGGACAGCTTTTTTAATTCCAGCGGCTTGCGCTGACCCATATAAATTAAGGTGGCAACACAGAAGTACTTTCTGTCCTTTACATAGGACGGGAAGTTTTTTATTTTAAAATAAAGTGCCGCCCTCTCCGGATGAACAAGAGATGAAATTATGTTTTCTCCGTACCTGATAGAGGTACTTGTAGATACACTACACAAGTACAAATTAAGGTGGCACCACAGAAGCTTTCTGTCCTTTGG\n>CM003280.1/7976717-7976643 Salmo salar isolate Sally breed double haploid chromosome ssa02, whole genome shotgun sequence. \nTGCCCCCGTGCGAGGAATCTAAGATAGAATTGGACTTTGCTGTGAAATTCTATCTTAGATTCCTCGCACGGGGGC\n>MGZN01000446.1/306-243 Hydrogenophilales bacterium RIFOXYA1_FULL_63_33 rifoxya1_full_scaffold_3877, whole genome shotgun sequence. 
\nTCGGGGCGCCAGCCCCCGATGTCTGAGCACGATGCTCACAAGACGGTGTCCCGTCCAAGCCTGG\n>LZPO01097937.1/23658-23530 Neotoma lepida isolate 417 scaffold_12034, whole genome shotgun sequence. \nTTTGCAGGCTGATGGAGTCAGCAAGGAAGAGGTTTATGAACAGCAGCCACTCTGCATAGGATGGCTGCAGGGAATGTTCTCATGCTTGCCCAGAGAAGTCTGCCAGGGTCACTGAGATACCTCTGAGAT\n>CP011974.1/3783475-3783356 Bacillus endophyticus strain Hbe603, complete genome. \nAGACCCTTTAACATCAGTCCTGTGAGGCTGAGAAGGAAACGGACCGCAGATGCAGCAGGCGTCTGCAAGCTTACTATACCCGGCATCCTCTCAGTCACGGACAAAGAGGATGCTTTTTTT\n>JXSO01000068.1/6302-6422 Achromatium sp. WMS3 contig-199_67, whole genome shotgun sequence. \nTAATTTTTTTAAATATTTCACATATATACCGACACAAAACGTAGGGTGCCTTAATTACCTTTAAATATTAAAGTGAATACCTGTTAAAAAGGTTACGTTTTGGGGCATATAGAGGCAAAAC\n>CM002304.1/542199-542383 Ogataea parapolymorpha DL-1 chromosome V, whole genome shotgun sequence. \nCACTCCTGTTTCTGCCTCATATTCCCTTGCTCCATGGAATAATGGGTTCTGGTGATGGAGAAGATCAAGCCCGTCGTCGTCTCTGCGATTTGATACTTTGTTGAGTTCGAGGACGGGATCGTGAAAACGCATATACCCAGGGCTGCCAGACAGGTTGGCGGCTCTGAATTGTCGTTTCTACATCT\n>ABJB010136869.1/1-805 Ixodes scapularis strain Wikel colony gcontig_1108379663008, whole genome shotgun sequence. 
\nCATCCGCAGCAGGTCTCCAAGGTGAACAGCCTCTAGTCGATGGACCAATGTAGGTAAGGGAAGTCGGCAAAACGGATCCGTAACCTTGGGATAAGGATTGGCTCTGAGGACTGAGCCGGTCGGGCTGGGGACCTGAAGCAGGAACGGCACTGCACCGGGACTGGGCGGGGCTCGCCGTTCACGCGGCGCGGCCAAGCCCGGACCAGCGTCGGGACCTTCCTGTGGAAAGCCTCAGCTGCGCGGCGTCTGAGGGCTTCGTGCCCAAAGTGCTATGCTTCGGCCGGCAAAAAACAGTCAACTCAGAACTGGCACGGACCGGGGGAATCCGACTGTCTAATTAAAACAAAGCATTGCGATGGCCGCTGGTCGGTGTTGACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAACGTGAAGAGATTCATCAAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTGTGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTATCTACTGGGAAGGAAGAAGAAGACCAGACCTCCTAGACCATCAGATTGTAAGCTGTATCGTTCCAGTAATTTTTCTTTAACTTCTAGCCATTATTTCTTAAAAACAACCTAGCGGTAGGATTTCTAAGAACTAGCGATCACCCTGTTATCAAATTTAAGACTGTTAACCCATTAATTTTTCTTAAAATACACCTTTGGAATCACTGTTTACACTGCGGCCATATTGCCACGGTTGTAGATGTTGAACCCCAAATTTGAAAATAACT\n>CVUF01000026.1/144661-144885 Staphylococcus capitis strain CR03 genome assembly, contig: BN1517_Contig_4 \nTTTTTATTCATAAGGCATCTCGGTAATTCAGTTTAGTGAAGTTTATTCAATGATAGGAAAGTGCCTTATATTTTAAAGTATATCGATGTGAAATTACATGGTAATATGTAGTATCTTTGACGAGATTCCTGAAGGAGCAGTCCCAGTCCTAAACCTAGATTGAGACGGACACACTGCGACACGAAACCATACTATACGAAGTAATGAATATAAAAGTAGCAGTAA\n>KC954775.1/132832-132944 UNVERIFIED: Cronobacter phage S13, complete genome. \nGGGGTGATCGTCTAGTGGTAGGACGCTTAAAGACGCAAACTGATAAGTTTGTATTCAGCATTTAACTTTCCATTCCAAGGAAGAAACGCGTGGTTCGAATCCCGCTCACCCCG\n>URS0000D67EE2_12908/1-83 unclassified sequences c-di-GMP-I-GGC riboswitch \nAAUAAAAAAGGUACAUCUGUCGAAAGUUUGGGGCGCGAAGCCGCGGAUUUAAUACGACAGCUGCGAUGAGCGGGCUACCGUGG\n>KE355093.1/339-1 Streptomyces afghaniensis 772 genomic scaffold STAFG_scaffold694, whole genome shotgun sequence. 
\nGCGCAAGCGGCGGAGGCATGTGGCGTTAATTCGACGCAACGCGAAGAACCTTACCAAGGCTTGACATACACCGGAAAACCCTCGGAGACAGGGTCCCCCTTCGTGGTCGGTGTACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCCCGTGTTGCCAGCAGGCCCTTGTGGTGCTGGGGACTCACGGGAGACCGCCGGGGTCAACTCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGCCCCTTATGTCTTGGGCTGCACACGTGCTACAATGGCCGGTACAATGAGCTGCGAT\n>ALWS01100951.1/21533-21438 Pteropus alecto contig100951, whole genome shotgun sequence. \nATTTTCAGTTATAAGATAAGTAAGTTCTGCTAAGCAGGTTGGACCTGGTTAGTACTTGGATGGGAGACCACCCAGGAAGACCAGGTGCTGTAGGCA\n>CP019433.1/1335117-1334970 Jeotgalibaca sp. PTS2502, complete genome. \nAATATTGAAAGAGGATGCGAAAAAAATCAGTAGGTTTCGAAAGGGTTTTTCGCCGAAATGCAGCTTAGCTGTGTTGGGGTCCGTTTGAATAAGACGGGAACTGCCTGATAGTCTTGCCCAAAGACTATTAAGGAGTGCTGTCATTGTT\n>CM001241.2/28956953-28956880 Oryza brachyantha chromosome 1, whole genome shotgun sequence. \nGTGAGCCGTGTAATAGGCGACTATTTCGCGCGGTTCGGGGGGCACTTGAAATCTTGAATAAGCCGTCAGCCCTC\n>ALWZ044178298.1/15950-15905 Picea glauca, whole genome shotgun sequence. \nTCAAAGGATTCCTTCGAATCCACCATGATCATATTTCGAAAATAGT\n>CP012413.1/1770895-1770659 Piscirickettsia salmonis strain PM15972A1, complete genome. \nAAAGTTCAGCCCTGAAAATGCAGCTCAGCATATCAGGTACCGAGCCTTGAGTAAGTACTGGTAACAGTGCGTGCTAAGCGTAGGCAGGGAAATAATAGGCCGTAAGCCAAAGAGCTGAAGTGATTGAGCCTCGTAAACATAATACTGAGATAGCCGATGGTTTGGAATGTATCAGAAGGCAATATCGAATAGGACGTTAAGAGAAGAAATATTCGACATCTCCGGGGTCTTAGAGCA\n>AGTP01050901.1/2323-2414 Ictidomys tridecemlineatus contig050901, whole genome shotgun sequence. \nGGGGATGTAGCTCAGTGGTAGAGCACCCTTGGGTTCAAATCCCAATACCTAACAGGGGTGGGGGTAATGGTGGTAAGGTCCCTCCATTACCT\n>KE346365.1/91830-91967 Capsaspora owczarzaki ATCC 30864 unplaced genomic scaffold supercont2.6, whole genome shotgun sequence. \nATCTTTGTGCAAGGGTGGTGCCATCGTGCGTGAGGGAATTCCCGATGCGTGGCTTTTTGCTGATTGCAAACTAAACATCCAAGCCCGCGACATGTGAAGCTTGCTTCCTGTCGCAATTTTTGTAGCTGGCCCAGGTCG\n>ALWS01164951.1/7774-7926 Pteropus alecto contig164951, whole genome shotgun sequence. 
\nATCACTTCTCGGCCTTTTGGCTAAGATCAAGTGTAAAATTGCCTAGATGTAAATATGTGTATATGTGCATGTTTGTACCTGTAAATATGTGTATATGTGCACGTTTGTACCTCTATGCGCGTGCGCGCAGGCGCGCGCGCGCGCGCACACACA\n>GL883275.1/454-1 Melampsora larici-populina 98AG31 unplaced genomic scaffold MELLAscaffold_189, whole genome shotgun sequence. \nTTCTACCCACAAGGAATATCCGGGTGGCTCCGCCACCCGGGGCGCGTCTCCGAAAAAAAAAAAAAAATTAGAGGGCTTGGGAATGTAATGTTCTTAACCTATTCTCAAACTTTAAATATGTAAGACGTACTTGTTTCTTAATTGAACTTGTACATGAATAAAAGTCTTTAGTGGGCCACTTTTGGTAAGCAGAACTGGCGATGTGGGATGAACCAAACGCAGAGTTAAGGTGCCGGAATATACACTTATCAGACACCACAAAAGGTGTTAGTTCATCTAGACAGCCGCACGGTGGCCATGGAAGTCGGAATCCGCTAAGGAGTGTGTAACAACTCAACGGCCGAATGAACTAGCCCTGAAAATGGATGGCGCTCAAGTGTATTACCTATACTCTGCCGTTAGTATTCTTTTAAAGATATTAACGAGTAGGCAGGCGTAAAGGTTGCGTAGAAGC\n>AYZS02020768.1/14673-14528 Beta vulgaris subsp. vulgaris Bvchr7.sca021.con0307.1, whole genome shotgun sequence. \nTTGGGTTCACAATATAGTTAGGCAAAAAATGGTGCTGATTAATAAATGGGCATTGTTTTAAAAAGTGGATCCGAAAGTGAATTGTTCCCCTCGCTATCCAGTGTAGAAATTTCTTTGCTACATTTGGACGTTGGGAAACTATATTT\n>KE159628.1/947698-947606 Lachnospiraceae bacterium COE1 genomic scaffold acPFN-supercont1.2, whole genome shotgun sequence. \nAGCAGTTCCTTAAGTGCCTTGTGAACAGGGAGTTGTCACAGGGACGAAAAAGCCCTCTGGGGCTTTGCGGTACGAGGTTCGCATCCCGCTGCT\n>MGUZ01000016.1/78253-78409 Elusimicrobia bacterium RIFOXYA12_FULL_49_49 rifixya3_full_scaffold_62, whole genome shotgun sequence. \nTTGTCCCTGCGATGTTGGTGTGGTATTATCTGATTTGAACCGACAAGTTCCTTTCAGGGAGTTGCAGGTGAGCTATACGCCTTAGGGCTATAGACCCGGACACCCACTTAATGAAAAGGGCTCAATCAGATGAAACTCACGGCAGAGTGGGGATTTT\n>AE017283.1/720172-720358 Propionibacterium acnes KPA171202, complete genome. \nGCTAAAATCCTCGCGTCAGGTTGCTGGTGACCACACCAGCGCTGGAATCCGGTGAAAAGCCGGAGCTGACGCGCAGCGGTATGACTGATCCGCCCCGACTTGAACCACTGGCGCCATGCGCACTGGGAAGGCGCCGGGAACGGAGACGAAGTCGAGCCCGAAGACCACCTGACGACGCCCTGTTGTT\n>AOTI010241097.1/1-750 Triticum urartu cultivar G1812 contig241097, whole genome shotgun sequence. 
\nTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGGATAAGTGGGAGCCTCACGGCGACGGTGAAATACCACTACTTTTAACGTTATTTTACTTATTCCGTGAATCGGAAGCGGGGCGTAGCCCCTCCTTTTAGATCTAAGGCCCGTTCGCGGGCCGATCCGGGCGGAAGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGCTCGTTTGATTCTGATTTTCAGTACGAATACGAACCGTGAAAGCGTGGCCTATCGATCCTTTAGACCTTCGGAATTTGAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGACAGCATCGCAATAGTAATTCAACCTAGTACGAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTGTGCCGGATTATGACTGAACGCCTCTAAGTCAGAATCCAAGCTAGCATGCGACGCCTGCGCCCGC\n>LADO01000055.1/61648-61600 Peptococcaceae bacterium BRH_c4b BRHa_1001649, whole genome shotgun sequence. \nGGTTGGCCCCGTGAGGGGTTTCAAGATCCGATTACTTGGGTGGGTAGTC\n>AAQR03071181.1/131-221 Otolemur garnettii contig071181, whole genome shotgun sequence. \nCCCTCAGGAGGACTGTGCCGGTCAGCTCCATGGAGTTTCAGTCAAGGAGTTTCTGAGCCTATGGATCTACAATATTTGACTGCCTGGGGCA\n>KE951434.1/4972-1857 Actinobaculum sp. oral taxon 183 str. F0552 genomic scaffold Scaffold35, whole genome shotgun sequence. 
\nGTTGTAGGTGTTGTAGGGCGTTCGGTGGATGCCTGGGTACCGGGAGCCGAAGAAGGACGTTGCAGCCTGCGATATGCCTCGGGGAGCCGGCAAGCGGGCTTTGATCCGAGGGTGTCCGAATGGGGGAACCTGGCCGGGGTTGTGCCCGGTCGCTCGTGCCTGAATTCATAGGGTGCGGGTGGTGACGCGGGGAAGTGAAACATCTTAGTACCCGTAGGAAGAGATATTCCGTGAGTAGTGGTGAGCGAAAGCGGAGGAGCCTAAACCGTGGGCGTGTGAGAGCCGTCGGGTGTTGCGTGTGCGGTGTTGTGGGAGATGATCGTGATCATGCCGACGCGTGGTCGCGCAGTGATAAACCGTGGGGATAGGCGAAGGGTCTGGGAAGGCCTGCCGGAGAGGGTGAGAGCCCCGTAGCTGAAATTCTCGTGGCTGTGTGATTGTGTTCCCGAGTAGCATGGGGCCCGTGGAATCCCGTGTGAATCTGGCAAGACCACTTGTCAAGGCTAAATACTCCTGGTGACCGATAGTGGAGAGTACCGTGAGGGAAGGGTGAAAAGTACCCCGGGAGGGGAGTGAAAGAGTGCCTGAAACCGGGCGCCTACAATCCGTCAGAGCCTCCGTGGTGGGGGTGATGGCGTGCCTTTTGAAGAATGAGCCTGCGAGTTAGTGGCATGTGGCGAGGTTAACCCGTGTGGGGGAGTCGTAGCGAAAGCGAGTCCGAAGAGGGCGTGAGTCGCGTGTTCTAGACCCGAAGCGGGGTGATCTACCCATGGCCAGGGTGAAGCTCGTGTAAGAGCGTGTGGAGGCCCGAACCCACCAGGGTTGAAAACCTGGGGGATGAGTTGTGGGTAGGGGTGAAAGGCCAATCAAACTCCGTGATAGCTGGTTCTCCCCGAAATGCATATAGGTGCAGCGTTGCGTGGTTCCTTCCGGAGGTAGAGCGACTGGTTGGCTGATGGGCCTTACCGGGTTACTGACGTCAGCTAAACTCCGAATGCCGGGAGGGTGGAGCGTGGCAGTGAGACGGCGGGGGATAAGCTTCGTCGTCGAGAGGGAAACAGCCCAGATCGCCGGTTAAGGCCCCTAAGCGTGTGCTAAGTGGGAAAGGATGTGGAGTTGCTGGGACAACCAGGAGGTTGGCTTAGAAGCAGCCATCCTTGAAAGAGTGCGTAATAGCTCACTGGTCAAGTGGTTCCGCGCCGACAATGTAGCGGGGCTTAAGCACACCGCCGACGCCGCGGCAGTCCATCGTGGTCCTAGCCTGTCCGTTGGGCGGGTTCAGGGGGTGGGCTGGGTAGGGGAGCGTCCCGCGTTGGGTGAAGTCTCGGGGTGACCCGGGGTGGACGGCGTGGGAGTGAGAATGCAGGCATGAGTAGCGAGAGGCGGGTGAGAAACCCGTCCGCCGATTGACTAAGGGTTCCAGGGCCAGGTTGATCCGCCCTGGGTTAGTCGGGTCCTAAGGCGAGGCCGACGGGCGTAGTCGATGGACAACGGGTTGATATTCCCGTACCGGCGCTTGACCGTTCAATGTTCGCCGGGGTGATGCTAACCATCCCCGATCCTGTGTGTCTCTTTCGGGAGGCGTGTGGGGGAGGGCGTGGGGTCCGAGCCTGGGTGGGCAAGCGTGGTAACAGGTGTGACGCAGAGTGGTAGTCCAACCGTGTCGTATGGCTGAGCACGGCTAAGGGTGCAGCCCGTCTCCCAGGTAAATCCGGGGGGCGTTCGGGTCAGGCCTGATGGGGACCGTTTGACGGGAAGTGGATGATCCTGTGCTGCCGAGAAAAGCATCGACGTCAGGGCAAGCGCCGCCCGTACCCGAAACCGACACAGGTGGTCAGGTAGAGTATACCGAGGCGTGCGAGTCAATCGTGGTTAAGGAACTCGGCAAAATGCCCCCGTAACTTCGGGAGAAGGGGGGCCCGGGCCTTGATGTCCCCGTGCGGGGCGGAGGGGTCGGGGCCGCAGAGTCCAGGGAGAAGCGACTGTTTATCAAAAACA
CAGGTGCGTGCTAAGCCGCAAGGCGATGTATACGCACTGACGCCTGCCCGGTGCTGGAAGGTTAAGCGGACTGGTCAGCCCTTCGGGGTGAAGCTGGGAAGTTAAGCCCCAGTAAACGGCGGTGGTAACTATAACCATCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGCGTAACGACTTCTCCGCTGTCTCGACCACGAGCTCGGTGAAATTGCAGTACGAGTAAAGATGCTCGTTTCGCGCAGCAGGACGGAAAGACCCCGGGACCTTTACTATAGCTTGGTATTGGTGTTCGGTACGGCTTGTGTAGGATAGGTGGGAGACTGTGAACCGGTCACGCTAGTGGGCGGGGAGTCGTTGGTGAAATACCACTCTGGCCGTGCTGACCATCTAACCTCGGTCCGTGATCCGGGCCAGGGACAGTGCCTGGTGGGTAGTTTAACTGGGGCGGTTGCCTCCTAAAGGGTAACGGAGGCGCTCAAAGGTTCCCTCAGCCTGGTCGGCAACCAGGTGGCGAGTGTAAGTGCACAAGGGGGCTTGACTGTGAGACTGACGGGTCGAGCAGGTACGAAAGTAGGAACTAGTGATCCGGCGGTGGCTTGTGGAAGCGCCGTCGCTCAACGGATAAAAGGTACCCCGGGGATAACAGGCTGATCCTGCCCAAGAGTTCATATCGACGGCATGGTTTGGCACCTCGATGTCGGCTCGTCGCATCCTGGGGCTGGAGTAGGTCCCAAGGGTTGGGCTGTTCGCCCATTAAAGCGGTACGCGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCCCTATCCGCTGCGCGCGTAGGAGAATTGAGAAGGGCTGTCCCTAGTACGAGAGGACCGGGACGGACGAACCTCTGGTGTGCCAGTTGTTCCGCCAGGAGCATGGCTGGTTGGCTACGTTCGGGAGGGATAACCGCTGAAAGCATCTAAGCGGGAAGCCTGCTTCAAGATAAGTTCTCCATCCAGCCTGTGTGCTGGGTGAGGTCCCCCGCAGACGACGGGGTTGATAGGCCGGACGTGGACGCCTCGTAAGGGGTGGAGCTGACCGGTACTAATGGACCGACCGCCTACACCAT\n>AAAB01006367.1/1-1388 Anopheles gambiae str. PEST whole genome shotgun sequencing project, whole genome shotgun sequence. 
\nTATTCGAACGAGCTCTTGGATGACTGAAGTGGAGAAGGGTTTCGTGTCAACAGCAGTTGAACACGAGTTAGCCAATCCTAAGCCGCATGGGAATCCAGTCGTAACCCATCAGTCGGCGAAAGGGAATCCGGTTACCATTCCGGAGCCTGTTGAGTACCCGTTTGCGCCAGCCTAGTAGGGTTTAGCTCGTCCGCACCCGAACGGTTAGTGTGTAGCTTCATGGCAACATGAATCCTTTTCTTCGAGAAGCCAACGAGAGGCATCGGAAGAGTTTTCTTTTCTGTTTTACAGCCACACCGACCATGGAAGTCACTCACAGAGAGATATGGTTGGACCGGTCTGGTAGAGCACGGCCGCCGCAACTGCCGTGTCGATGCACTCTTCTTGGACCGTGAAAATCGAAGACTGGGGCACACTTTATATGGTAATAACGCACACTCTCAACAGATTGTACCGAATCCGCAGCAGGTCTCCAAGGTGCAGAGTCTCTAGTCGATAGATCAATGTAGGTAAGGGAAGTCGGCAAACTGGATCCGTAACTTCGGGACAAGGATTGGCTCTGAAGGCTGGGTGCGACCAGCCGGGACCGGTGCTCCACCTGCCGCAAGGTAGGCTGGCCCGTGCCCGCGGTCGCACAGCAAACAGCCAATTCAGAACTGGCACGGCTGAGGGAATCCGACTGTCTAATTAAAACAAAGCATTGTGATGGCCCCGGGTGGGTGTTGACACAATGTGATTTCTGCCCAGTGCTCTGAATGTCAACGTGAAGAAATTCAAGCAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCTCTGTCCCTATCTACTATCTAGCGAAACCACAGCCAAGGGAACGGGCTTGGATGCACTAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCTGGCATTGTAAGGCGATATAGGAGGTGCAGCATAGGTGGGAGGGCTTCCTCGTGGAGCTCGCCTCTGAGATACCACCACTCTTACTGTTGCCTTACTTACATGATTGGGTGGTACAAGCGCGGGCCCCAGGTCCGGATCGTGCGCGCACCTCCTCCGGGGGGCTGTGGCGGCGGTTCGCCTGCGCGCGCCCAATGCGCCGTGTTTCTCGCTCAGCGTCCAGTGTGTCGCTGGGTGGTGCCGCCGGGGAGACTGCATCGTAGCATCGTCGTGTGTAGCGTGTTACCCGCTTGTCCGACCGTGAGCCGTGGCCCGCAAGGGTACAAGCTTGCGTACGTCGGTGCATTCGTGGTGCACTGCTTCTGCGCGGTCGATCGTTTATGATGTCACGTTTGCCCCCGGTTCCGCGCGCCGC\n>JH835377.1/4969955-4970252 Erinaceus europaeus unplaced genomic scaffold scaffold00089, whole genome shotgun sequence \nGGATGTGAAGGCAATCTGGCTGTGACATCTGTCACCCCATTGATCACAAGGGTTGATTTGGCTGATCTGGCTGGCTAGGCAAGTTTCCCCTTCCTTCCTAACTGCTCCATGTGCATTGAAAATAGCCTTGCTTGAATCGAGACGGACCGGTCTTCATTGGAGGGTATACAAGTAGCTGCGCTCCCCTGCTAGAACCTCCAAACAAGTTCTTCAAGATATACTACAGAACAATTTGTTTAATAATCAGGAACCTAAAGGCAAAAAATATAGCAGATGAGATTCGGGAGGGTCTTCATTT\n>CP014222.1/4334669-4334580 Janthinobacterium sp. B9-8, complete genome. 
\nTTCAATGGTGGGGCGTGGTGGGGGCTACCTCGGTAGCGTCGGTTTACTATTTCGCCGATACGCCAACTCTGCCACGTTCCTACCTCCTTC\n>FQXP01000006.1/145863-146131 Clostridium collagenovorans DSM 3089 genome assembly, contig: EJ35DRAFT_scaffold00004.4 \nATAAATGCTATGAAAAAGGAAAGTAGTGTATTGGAGGGTTACAGAGAGAAAGCGATGCTGAGAAGCTTTCACCTATAAGATATATGAAGTGCCCTTTGGAGCATGGATCCGAAATGGAGTTACACAATAGTTGAGTAACTTAAAAGTAGGAGACCACGGGTTCGCCCGTTAAAGCGATAGGGCATTATTATGTGCTTGAAGATAAAGTGAGATTCTTTTTGAATCTAATTAGGGTGGAACCACGGAGTAAACATAGCTTCGTCTCTAGA\n>URS0000D6C44C_12908/1-87 unclassified sequences c-di-GMP-II-GAG riboswitch \nGCGAGGGGUAGGAGCUCGGAACCGCGGCCCGCAAGACGGGCACUGAAGGGGCGCAGGGGGCUAGUGGUGCGACCGGCUACCGCUCCG\n>URS0001A235AD_371731/1-41 Rhodobacter sp. SW2 L2-Alphaproteobacteria ribosomal protein leader \nGGAUCCCAACGAUGGAUCCUUCAACUGACGGAAGACAGAAA\n>FQUW01000011.1/34981-34776 Desulfotomaculum australicum DSM 11792 genome assembly, contig: EJ60DRAFT_scaffold00008.8 \nCAATTGAATAATTGAACGGGTGCTCCCTTTTTCAAGGGATAGAGGGAAGTCAGTGCAAATCTGACGCGGTGCCGCCACTGTGAATGGGGAGCTGGCCACACAATGCCACTGGTCGGGCACCTGCATTGGCCGGTGTCCGGTTGGGAAGGCGTGGTTAAAGCGATGATCCATGAGCCAGGAAACCTGCCCGTTCTATTTCACCGTTT\n>URS0000D6A184_12908/1-121 unclassified sequences Flavobacterium-1 RNA \nCGAGATAGGGGTACAAGTTCTGCAGTATTGCGTTCCTCTGGACCTAAGCAACGACCTGAAAGGGTAGCGACGAAGCTCGGCGTTAGTGGAGAGAGTCCCAGACGTGGTGTCTCCACTGACG\n>MUNX01000075.1/101357-101431 Flavobacterium sp. A45 NODE_7_length_112147_cov_12.4241_ID_13, whole genome shotgun sequence. \nTTTTAGCCCCGATAGCAGTGTAAATCCTCTCTCGTTTTTCAACGAGAGAGATTGAAACGGATAGCGGGACTTTGC\n>KQ948572.1/3318-23 Streptomyces longwoodensis strain DSM 41677 genomic scaffold PRJNA299227_s024, whole genome shotgun sequence. 
\nGGCCAAGTTTTTAAGGGCGCACGGTGGATGCCTTGGCACCAGGAACCGATGAAGGACGTGGGAGGCCGCGATAGTCCCCGGGGAGTCGTCAACCAGGCTTTGATCCGGGGGTTTCCGAATGGGGAAACCCGGCAGTCGTCATGGGCTGTCACCCACTGCTGAACACATAGGCAGTGTGGAGGGAACGAGGGGAAGTGAAACATCTCAGTACCCTCAGGAAGAGAAAACAACCGTGATTCCGGGAGTAGTGGCGAGCGAAACTGGATGAGGCCAAACCGTATGCGTGTGAGACCCGGCAGGGGTTGCGTATACGGGGTTGTGGGATCTCTCTTTCACAGTCTGCCGGCTGTGAGACGAGTCAGAAACCGTTGATGTAGACGAAGGACATGCGAAAGGTCCGGCGTAGAGGGTAAGACCCCCGTAGTCGAAACGTCAGCGGCTCGTTTGAGAGACACCCAAGTAGCACGGGGCCCGAGAAATCCCGTGTGAATCTGGCGGGACCACCCGCTAAGCCTAAATATTCCCTGGTGACCGATAGCGGATAGTACCGTGAGGGAATGGTGAAAAGTACCCCGGGAGGGGAGTGAAATAGTACCTGAAACCGTGTGCCTACAAGCCGTGGGAGCGTCGGANNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTTCTCGTGACTGCGTGCCTTTTGAAGAATGAGCCTGCGAGTTTGCGGTGTGTTGCGAGGTTAACCCGGGTGGGGTAGCCGTAGCGAAAGCGAGTCCGAACAGGGCGTTTCAGTAGCACGCTCAAGACCCGAAGCGGAGTGATCTAGCCATGGGCAGGTTGAAGCGGAGGTAAGACTTCGTGGAGGACCGAACCCACCAGGGTTGAAAACCTGGGGGATGACCTGTGGTTAGGGGTGAAAGGCCAATCAAACTCCGTGATAGCTGGTTCTCCCCGAAATGCATTTAGGTGCAGCGTCGTGTGTTTCTTGCCGGAGGTAGAGCACTGGATAGGCGATGGGCCCTACCGGGTTACTGACCTTAGCCAAACTCCGAATGCCGGTAAGTGAGAGCGCGGCAGTGAGACTGTGGGGGATAAGCTCCATGGTCGAGAGGGAAACAGCCCAGAGCATCGACTAAGGCCCCTAAGCGTACGCTAAGTGGGAAAGGATGTGGAGTCGCAGAGACAACCAGGAGGTTGGCTTAGAAGCAGCCACCCTTGAAAGAGTGCGTAATAGCTCACTGGTCTAGTGATTCCGCGCCGACAATGTAGCGGGGCTCAAGCGTACCGCCGAAGTCGTGTCATTGCAGCATATACGGCCAACGCCGGCTGTGATGGGTAGGGGAGCGTCGTCTGCCGGGTGAAGCGGCACTGGAAGGTAGTCGTGGACGGTTGACGAGTGAGAATGCAGGCATGAGTAGCGATACACACGTGAGAAACGTGTGCGCCGATTGACTAAGGGTTCCTGGGTCAAGCTGATCTGCCCAGGGTAAGTCGGGACCTAAGGCGAGGCCGACAGGCGTAGTCGATGGATAACCGGTTGATATTCCGGTACCCGCTGTGAAGCGTCAAACATCGAATCCAGTGATGCTAAGGCCGTGAAGCCGCCCTGATCTCTTCGGAGTTGAGGGGAGTGGTGGAGCCGCTGACCCGATCTGGTAGTAGGTGAGTGATGGGGTGACGCAGGAAGGTAGTCCAGCCCGGGCGGTGGTTGTCCCGGGGTAAGGGTGTAGGCCGTGCGATAGGCAAATCCGTCGCACATAAGGCTGAGACCTGATGCCGAGCCGATTGTGGTGAAGTGGATGATCCTATGCTGTCGAGAAAAGCCTCTAGCGAGTTTCATGGCGGCCCGTACCCTAA
ACCGACTCAGGTGGTCAGGTAGAGAATACCGAGGCGTTCGGGTGAACTATGGTTAAGGAACTCGGCAAAATGCCCCCGTAACTTCGGGAGAAGGGGGGCCACAACCGGTGATGAGTCTTGCACTCTGAGCTGGGGGTGGCCGCAGAGACCAGCGAGAAGCGACTGTTTACTAAAAACACAGGTCCGTGCGAAGCCGTAAGGCGATGTATACGGACTGACGCCTGCCCGGTGCTGGAACGTTAAGGGGACCGGTTAGCTCCATTTCGGTGGGGCGAAGCTGAGAACTTAAGCGCCAGTAAACGGCGGTGGTAACTATAACCATCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGCGTAACGACTTCTCGACTGTCTCAACCATAGGCCCGGTGAAATTGCACTACGAGTAAAGATGCTCGTTTCGCGCAGCAGGACGGAAAGACCCCGGGACCTTTACTACAGTTTGATATTGGTGTTCGGTTCGGCTTGTGTAGGATAGCTGGGAGACTGTGAAGCCTGGACGCCAGTTCGGGTGGAGTCGTCGTTGAAATACCAGTCTGGTCGTGCTGGATGTCTAACCTGGGTCCGTGATCCGGATCAGGGACAGTGTCTGATGGGTAGTTTAACTGGGGCGGTTGCCTCCTAAAGGGTAACGGAGGCGCCCAAAGGTTCCCTCAGCCTGGTTGGCAATCAGGTGTTGAGTGTAAGTGCACAAGGGAGCTTGACTGTGAGACCGACGGGTCGAGCAGGGACGAAAGTCGGGACTAGTGATCCGGCGGTGGCTTGTGGAAGCGCCGTCGCTCAACGGATAAAAGGTACCCCGGGGATAACAGGCTGATCTTCCCCAAGAGTCCATATCGACGGGATGGTTTGGCACCTCGATGTCGGCTCGTCGCATCCTGGGGCTGGAGTCGGTCCCAAGGGTTGGGCTGTTCGCCCATTAAAGCGGTACGCGAGCTGGGTTTAGAACGTCGTGAGACAGTTCGGTCCCTATCCGCTGTGCGCGTAGGAGTCTTGAGAAGGGCTGTCCCTAGTACGAGAGGACCGGGACGGACGAACCTCTGGTGTGCCAGTTGTCCTGCCAAGGGCATGGCTGGTTGGCTACGTTCGGGAGGGATAACCGCTGAAAGCATCTAAGCGGGAAGCCTGCTTCGAGATGAGGACTCCCACCCACTTGATGGGGTAAGGCTCCCAGTAGACGACTGGGTTGATAGGCCGGATCTGGAAGCACGGTAACGTGTGGAGGTGACCGGTACTAATAGGCCGAGGGCTTGTCCTC\n>MJAT01000005.1/39405-39606 Firmicutes bacterium MLFW-2 MLFW-2_Contig_13_85X, whole genome shotgun sequence. \nGACAAGGCTACGATAAGGAAAGTAAAAAACGGAGCATTACAGAGAGTGGGCAAACAGCTGAAATTGCTTACATGTTGAAGTTTTTGAAAATGCACCTTGGAGCCGTGCAGAATGATTCTGCAACGGGGAAACCCGTTATTCGTTTGAGTGATGCAAAGGACTTTGCATAATCAGAGTGGAACCACGAGAAATCGTCTCTGTT\n>LBSQ01000033.1/4164-6256 Parcubacteria bacterium GW2011_GWA2_37_10 US35_C0033, whole genome shotgun sequence. 
\nGAGATCTTTGGAAAACACCATTAGGTGGATAACTAGGTTTAGTTTACTGATGAAGGACGTGGCAAGCTGCGAAAAGTCTTGGCTAGGCGCATGCAGCCTTTGAACCAAGAATTTCTGAATCAGACTTCTGAATCTCTTCGGAGATATGTTGGAAACAACAGGGAACGCAGGGAATTGAAGCGTCTTAGTACCTGCAGGAAAAGATATCAATAGATATGCTGAAAGTAAGGGCGACCGAAATCAGCAAAAGGCAAACTGAATCTGTTATTGAAAAATAACAGAGATGTGGTGTTTTAGGCTAATATTTAATCTTAACCAAAAGACCTGAAGTTTTCTGGAAAGAAACACTTTAAAGGGTGATAGTCCCGTAGGGGAAATTTGGAAAGATTGAGTTAGTACTAGAGTAGTGCTTACTGGATACTAAGCATGAATTTGGGAGGCATTAACTCCTAACTTTAAATATAAACTAAGTCCGATAGCACATAAGTACTGTGAAGGAAAGTTGAAAAGAACTTTTAATCAGGAGTTAAAAGACTTGAAACCTAATGGTAATAGAATATTACGGCTCTTAGGAGTTGTAATGTACGTTTCGAATAACGGACTAGGAAGTGTATTTGAGTGGCGAAGATAATCTTAATATTAGAGTATCTAAAGGGAAACCAATTTTCCGCAATTTATGAGGGAAAAGGTATGAAAATGCCTTTGAGTCACTTGAGTACGACCCGAAACCAGGCGATCTATCCTAGAGCATGGTGAAGTGAGATTTAAAATCTTATGGAGGCCAGAAGAGATACTACGTGCATGTGTTCTTCTGACTTTAGGATAGGGGTGAAAAGCCAATCGAGCCTGGTGATAGCTGGTTCCTGCTGAAATAGGCCGTAGTCTAGTGTTAGAAGAGATAACTAAGATTGTAGAGCTACGGATAGAGAGTTTAGGAGGAGAAATCCTTCGGCTTTCTGTCCAACTCCAAATGTTTTAGTATCGTAGAATCTAATAAACGGGGATGCGGGGTAAGCTCGTATTCCAAGAGGGGAACATCCCAGACCATAGTTAAGGTCCCTAAATGTTAGTTAAGTGTGAACGGGTGAAAGGTGTTCATAACCATAGACAGAGGGGAGGTTTGCTTAGAAGCAGCAATCCTTTAAAGAAAGCGTAACAGCTCACCCTTCAAGGTTATGTGCCCTGAAAATGGACGGGACTAAACTAACTACCGATACTATGGACTTCTTATAAAGAAGGGGTAAGCAGGCATTCTATTAGGGCAGAAGTTTTTTTGTAAAAGAAAATGGACCTAATAGAGAAGAGAATCCTAGTGGTAGTAGGATCTATATATGGTGAGAATCCATATTACTGAAAGGGCCAGGGTTTCTTAGCAATAAAGTTTAGCTAAGAGTAAGTCGATCCTAACTCAGTTCCTAACAGAAACTGGGGAAAGGGCAAAAGGTTAAGATTCCTTTACTATTTAGGTACTTATGGTAACATAAGTTTGATCTCTGACATTTTGGGTTAGATTGACATTTACTATCGTAAATGCTAATTAGAATAAATCAATAGAGTACTGTAATGGTGAGAAATTGATTAAATCTAAGAATGGTTGGCCTTATGGCTGATTTGATTGATACCTGGGATTGATAAAAAGGAGATTAAACGGATCCTAAATAATCGTACCTAGAACCAACACTGGTGCCCCTAGGTGAGAAGCCTAAAGTATTAGGGTTTAATCTAGTTGAGGGAATTCGGCAAGTTGGCTCTGTGACTTCGGTTTAAAGAGTCCCTGGGATTGTAATCGTATGATTGCAATTTCAGGGTGCAATGACAAGGGACGTCCGACTGTTTAACAAAAACGTAACTTATTGCTAATCTGTAAAGATTTATATAATAAGTGACATCTGCCCAGTACTAGTATCTCAAACTTCTTTTCAAGGAAGCTAAGGACTAGCAAACGGCGGGAATAACTGTAATTCTCTTAAGGTTAATTCGTAGCTTTAAGACCCAAAG
TTAAACAGAATAACTAAAAAGATTGGGATAATAATTTGGCTATATGCTGGAAAGTCCGGGTATCTCACACTACCATAAATTTTATTAAGGTATAA\n>MTYJ01000241.1/79877-79597 Hypsibius dujardini strain Z151 scaffold0241, whole genome shotgun sequence. \nGCTTTGCATTGAGAGCAGACTGTGTGACCTAAAAGGCGAAAAAATGGGAGCACGCTGTAAGGATAAATAGGAACAGACAGGGGCATTCGTATTGCGGCGTTAGATGTGCAATTCTTGAATCATCATCGCAAGACGCGCTCCTGCGAAAGCATTTGCCAAGAATGATTTCATCAATCAAGAACGAAAGTTGGAGGCTCGAAGGCAATCAGATATCGCTCTGGTTCTAACCGTAAACGATGCCCACAGCACAAGTGCCCACAAGTTCAGCACAAATTTTGGCT\n>CM001380.3/48396693-48396738 Felis catus isolate Cinnamon breed Abyssinian chromosome A3, whole genome shotgun sequence. \nGCACAGGTTCCACTAGGAACTACACACATAATTTGGGAACATTTGG\n>GK000025.2/32398425-32398628 TPA: Bos taurus chromosome 25, whole genome shotgun sequence. \nGCGGCTTAATTTGACTCAACACGGGAAACCTCACCCGGCCCGGACACGGACAGGATTGACAGATTGATAGCTCTTTCTCGATTCCGTGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGATAACGAACGATTCATGTGGCATGCTAACTAGTTACGCGACCCCCGAGCGGTTTTACCTGC\n>CP003316.1/1347629-1347568 Pyrobaculum oguniense TE7, complete genome. \nAACACCCTGGGCAACACCCCTGTAGGGGGGGCGAATGAGCCTGGTGGGTTACCCCGGCCATA\n>KI628545.1/15615-15455 Sclerotinia borealis F-4128 unplaced genomic scaffold scaffold00005, whole genome shotgun sequence. \nGGCGCGATAGTTCAATGGTAGAACATCCTCATCCAACTCAGATCACCCCTTCCACAATTTCAGGAGTGCAGTTATGCGAATAACTGCACTATGTTGTATATTAGGAAGATGGTGGTCTTTGGATAGTGAGGGAGATGGAGGTTTGATTCCTTCTTGTGCCA\n>URS0000D6D378_443218/1-79 Hoyosella subflava DQS3-9A1 hya RNA \nTGCGTCACGCAAGTGGGCCGAGGGTCGACTCCTGTGACGAAGGGGCTTCGAGGCACTGTCCCGCCCCGGAAAGTGGCAA\n>BDFN01002532.1/3650-265 Ipomoea nil DNA, scaffold: scaffold2532, cultivar: Tokyo-kokei standard. 
\nCGACCCCAGGTCAGGCGGGATTACCCGCTGAGTTTAAGCATATCAATAAGCGGAGGAAAAGAAACTTACAAGGATTCCCCTAGTAACGGCGAGCGAACCGGGAACAGCCCAGCCTTAGAATCGGACGGCCTTGCGTTCGAATTGTAGTCTGGAGAAGCGTCCTCAGCGGCGGACCGGGCCCAAGTCCCCTGGAAAGGGGCGCCGGAGAGGGTGAGAGCCCCGTTGTGCCGGACCTGTCGCACCACGAGGCGCTGTCTACGAGTCGGGTTGTTTGGGAATGCAGCCCCAATCGGGCGGTGAATTCCGTCCAAGGCTAAATACGGGCGAGAGACCGATAGCGAACAAGTACCGCGAGGGAAAGATGAAAAGGACTTTGAAAAGAGAGTCAAAGAGTGCTTGAAATTGTCGGGAGGGAAGCGGATGGAGACCGGCGATGCGCCCCGGTAGTATGTGGAACGGTGAGAGCCGGTCCGCCGATCTACTCGGGGCGCAGACCAGCGAGGATTCGGGGGGCGGCCAAAGCCCGGGCCTTTGATACGCCCGCGGAACGTCGTCTCTCGGATCGTGGGAAGCAGCGCGCGCCCCTGGCGTGCCTCGGCACCTGCGCGCCTCCGGTCGCTGGCCTGTGGGCTCTCCATTCGACCCGTCTTGAAACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAACGGGCGAGTAAACCCGTAAGGCGCAAGGAAGCTGATTGGCGGGATCCCCTCACGGGGGTGCACCGCCGACCGACCCTTGATCTTTTGAGAAGGGTTCGAGTGCGAGCATACCTGTCGGGACCCGAAAGATGGTGAACTATGCCTGAGCGGGGCGAAGCCAGAGGAAACTCTGGTGGAGGCCCGCAGCGATACTGACGTGCAAATCGTTCGTCTGACTTGGGTATAGGGGCGAAAGACTAATCGACCGTCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGAGCTGGCGCGAGAGTTCTATCGGGTAAAGCCAATGATTAGAGGCATCGGGGGCGTAACGCCCTCGACCTATTCTCAAACTTTAAATAGGTAGGACGGCGCGGCTGCTTCGTTGAGCCGCGGCCACGGAATCAACAGCTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGGAAGCCGGGTTACGGTGCCCAACTGCGCGCTAACCTAGATCCCACAAAGGGTGTTGGTCGATTAAGACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTTAAGCGCGCGACCCTATACCCGGCCGTCGGGCAAGAGCTAGGCCCCGATGAGTAGGAGGGCGCGGCGGTCGCTGCAAAACCTTGGGCGTGAGCCCGGGCGGAGCGGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGGCCGAAGAGGGGAAAGGTTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGGGTCGGGGGAAGCCCGACAGACAGCGCGTTTTGCGCGTGCGCCGAAAGGGAATCGGGTTAAAATTCCTGAACCGGGACGTGGCGGTTGACGGCAACGTTAGGGATTCCGGAGACGTCGGCGGGGGCCTCGGAAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCCTGGAAACGGCTCAGCCGGAGGTAGGGTCCAGCGGCTGGAAGAGCACCGCACGTCGCGTGGTGTCCGGTGCGCCCCGGCGGCCCTTGAAAATCCGGAGGACCGAGTGCCGTCCACGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGGTGAACAGCCTCTGGCCAATGGAACAATGTAGGCAAGGGAAGTCGGCAAAATGGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGGCTGGGCACGGGGGTCCCAGTCCCGAACCCGTCGGCTGTTCGGCGGAC
TGCTCGAGCTGCTACCGCGGCGAGAGCGGGTCGCCGCGTGCCGGCCGGGGGACGGACTGGGAACGGCTCTTTCGGGGCCTTCCCCGGGCGTCGAACAGCCAACTCAGAACTGGTACGGACAAGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGTCCCTGCGGATGCTAACGCAATGTGATTTCTGGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTGTCTACTATCCAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGGATAAGTGGGAGCCGAAAGGCGAAAGTGAAATACCACTACTTTTAACGTTATTTTACTTATTCCGTGAATCGGAGGCGGGGCATTGCCCCTCTTTTTGGACCCAAGGCTCGCTTGCGGGCCGATCCGGGCGGAAGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACAGAAGGGTAAAAGCTCGTTTGATTCTGATTTCCAGTACGAATACGAACCGTGAAAGCGTGGCCTAACGATCCTTTAGACCTTCGGAATTCGAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCACCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGACAGTGTCGCAATAGTAATTCAACCTAGTACGAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTGCGTTGGATTATGACTGAACGCCTCTAAGTCAGAATCCGGGCTAGACCGACGCATGCGCTCGTCGCCCGTTTGCCGACCCGCAGTAGGGGCCATTTGGCCCCCAAAGGGCACGTGTCGTTGGCTAAGCCGTCGTGGCGGAAGGGTCACGGTGGCCGCCTTGAATTACAATTCCGATCGAGCGGCGAGCTGAATCCTTTGCAGACGACTTAAATACGCGACGGGGTATTGTAAGGGGTAGAGTGGCCTTGCTGCCACGATCCTCTGAGATTCAGCCCTTTGTCGCTCCGATTCGT\n>FR877557.1/2581256-2582181 Salmonella bongori NCTC 12419, culture collection SGSC SARC11, complete genome 
\nACCTGAGCTTCCATTTCACGGTCAGACAGGCCACCGCAGATCTGGATAATACGGTCAGACAGCGTCGATTTACCGTGGTCAATGTGAGCAATGATCGAAAAGTTACGTATGTTCTTCATAGAGATAAATTATTATGCCTTACGCCTGGTTGACCAGACTTTAGAGGTCGCTGTTCTGAGCTTAACGTCTGTTTTAACTGAAACGCCGCATTCTACACTACAACGCTAAGGCGAGGAAATGTTCATAATGTAAGGAGAGCGGGAACTGGCAAGCGTCTCACTTTTTACGTAAGTCACTGTAACGCCGAAAAAGCCCCTGATAGCGCAAGCTTATCGGCCCGACATCTCCTGCATGGCAGGAAAAAATGACCTTAGCAGACCAGCTAAACGCAGCGCTATCCGGCACAGCGTCTACTGGCGCGTTTCGATTGATGTGGTTTCGACGCGAACAAGCTCGGACGGGAGGGCAACGCTTAAAATCACCGGTTGCCAGGTATCGCGCTCCGCCAGTTTCCGGGAATAGCCTCGGGCAAGCAAAAAACCGCCAACGCCACCTAAAACAGCGCCGCTTAATGCCGCAAGGTCAGATCCAAACAATACCTGGAAAAGCACTGCAAAGAGAAATAACCCCGCTAAAGGCGACATATAGACCAACAATGCCGACCCTAAGAGGCTTTTTTCGGCGATGCCAAGCTCAACTTTCTGCCCCGGCGACAGCGGCTCCACGCTTGGCACCACAATTGTATGAGTCGTTTGCGGCCCTAATTTATTCAGCACGCGGCTGCCGCATCCCGCCCGGGAGGCGCAGTTGCTGCACGATGTTTTAACATCACAACTCACGACCGCCTGGCCATTCCGCCAGGAGACGACCGTCGCCCACTCTTTAATCATTGTACTGCCCTGAACTTGATACTGTCTGCAATACGC\n>MFEL01000009.1/24516-24224 Candidatus Doudnabacteria bacterium RIFCSPHIGHO2_01_FULL_46_24 rifcsphigho2_01_scaffold_3549, whole genome shotgun sequence. \nATAAATGCGTATTAGTTTGCGCAAATTGCCACAGAGAATTACATGCAGGAATATCGCAGCTTCCGAGCGAAAGCTCGGTTGAAAAACGAGGTGAATTCGGGGAAGTCCAGCCCCACTTTTGAAAAAAGTGGAGCGGGATAATCCCGAGCCAAGCCCAGCCCCGGTTTTGAAAACTGGAGCTGGGAAGGTGTAGAGACTATCTCGAAAGAGAGTAGCCCCCGCCGCAGGCGAGGTCGAAGCGCCTCGGACCTTAAATGGTCATGATATAGTCCATCCCTAGAAGCAATTTTAGG\n>AY765264.1/10602-10676 West Nile virus strain Rabensburg isolate 97-103, complete genome. \nCAGTTGTCAGACCACACGCAAGTGTGCTACTCTGCGAAGAGTACTGTCTGCGTTAGAGCCCCAGGAGGACTGGGA\n>CM007898.1/80153181-80153635 Helianthus annuus linkage group 9, whole genome shotgun sequence. 
\nAAAAGGCGTAGCAAAAAGCTGTATTTTAACCATTCAAAGTAAGATATTCGAGAGCAAAAAGGTTGATACATTTTGAAGCAGCCAGGGCTCTTGAAAAGGAGGGACGCCTTCGGGAACGCGGACACAGGTGGTGCATGGCTGTAGTCAGCTCGTGCCCTAAGGTGTTGGGTTAAGTCCAGCAACGAGCGCAACCATCGTGTTTTGTTGCCATCATTGAGTTTGAAACCCTGAAGAGACTGCCGGTGATAAGCCGGAGGAAGGTGAGGATGACGTCTAGTCAACATGCCCCTTATGCCCTGGGCGACACACGTGCTACAATGGCCGGGACAAAGGGTCGCGATCCCGCGAGGGTGAGCTAACTCCAAAAACCCGTCCTCAGTTCGGATTGCAGGCTGCAACTCGCCTGCATGATACCGGAATCGCTAGTAATCGCCAGTCAGCCATACGACGTACTT\n>CM000803.1/27767415-27767313 Oryctolagus cuniculus chromosome 14, whole genome shotgun sequence. \nATCAATTCTCCTTCTTTTGGCTAAGATCAAGTGTAGTATCTGTTCTTTTCAGTTTGAAATGTGTCATCAAATTACTGATTTCCCTCTTCAGTTCTTACCCCTG\n>CM000014.3/49188721-49188634 Canis lupus familiaris chromosome 14, whole genome shotgun sequence. \nTGGTCGATGATGATTCCCACATACGCATTCTTTGGAAGTCTGAACAAAATGAGTGAGGGGGAAAAAAAAAGAATCACAATTCTGCCCT\n>MGNC01000058.1/1340-1465 Chloroflexi bacterium RBG_13_60_13 RBG_13_scaffold_216383, whole genome shotgun sequence. \nTCTCCGAAAGGGCAAAGGCACGGGAAACCGTGTCGGCGCAAAGCCGCGGATCTAAGGTCTCCCGCTTCGACAGGGACGTTCACAGCGGCAGTAGGAGCGAGAGACTATGGTGGCCGGGCTACCGAA\n>CM001394.3/25602295-25602396 Felis catus isolate Cinnamon breed Abyssinian chromosome F1, whole genome shotgun sequence. \nGCCGAGTAATACTCCATTTTGTGTGTGTGTGTGTGTGTGTGTGTGTGTATATATATATATACACACACACACACACACACACACACACAAAATGTGTATATA\n>URS0000D67331_12908/1-219 unclassified sequences RT-2 RNA \nCGAGGTCATATGGAGTAGCGAAAGTGAAAGACGACCTTCGCAAAAGGAGATATACTTCCCTGGGTGAAAATCCTTAAAACTGCCTTACGACGATCACACACGGACGCTGCTTGCATGGCGAAGAATTGCGCTACCTTCGTTTCATGTGTGGGATCAAAGTAGTTTAGATGCGCACCTACAAAACAACTATGCGAAAGGCGAAAACTTATTATGACAAGC\n>LQHI01000015.1/6633-6747 Hadesarchaea archaeon DG-33 contigWOR1_52_54_12788, whole genome shotgun sequence. \nGCGGGGATAACTCAACCTGGGAGAGTGTCGGTCGTTCGAGTACAATCGAACGGGCAAAACTGAAGTTCCCAGAATAGATATCCGAATGTTGGGGGTTCAAATCCCCCTCCCCGCA\n>AFCW01000383.1/1-68 Salmonella enterica subsp. enterica serovar Urbana str. R8-2977 Contig383, whole genome shotgun sequence. 
\nCACACACTTAATTAATTAAGTGTGTGNNNGCCGCAATTCAGCATTAGTAACCAAGGGGTCTGCTCGTG\n>AAQR03179128.1/9880-9794 Otolemur garnettii contig179128, whole genome shotgun sequence. \nATCCTTTTGTATTTCATAAACTACTGACTGTGTTTTCACACTTATGAGCAAACCTTGTTAGGATGTGGATACATTACCTGTCTGATG\n>CCCW010025129.1/8929-12059 Brassica napus, WGS project CCCW01000000 data, contig: 19059 \nCGACCCCCAGTCAGGCGGGATTACCCGATGAGTTTAAGAATATCAATAAGCGGAGGAAAAGAAACGAACAAGGATTCCCTTAGTAACGGCGAGCGAACCGGGAAGAGCCCAGCTTGAAAATCGGACGTCTTCGGTGTTCGAATTGTAGTCTGGAGAATCGTCCTCAGCGACGGACTGGGCCCAAGTTCCTTGGAAAGGGGCGCCAGAGAGGGTGAGAGCCCCGTCGTGCCCAGACCCTATTGCACCACGAGGTGCTGTCTACGAGTTGGGTTGTTTGGAAATGCAGCCCCAATCGGGCGGTAAATTCCGTCCAAGGCTAAATATGGGCGAGAGACCGATAGTGAACAAGTACCACAAGATAAAGATGAAAGGACATTGAAAAGAGAGCCAAAGAGTGCTTTAAATTATCGGGAGGGAAGCGGATGGGGCCGGCGATTCGTCCCGGTCGGATGCGGAACAGAGCAATCTCGTCTACCAATCTATTTGTGGCGTGGACTTACGCGGATTAAGGTGGTGACCTAAGCCCAGGATTTTGTTACACTTGCGGAGACGTCGCTGCCTTGATCGTGGTCTGCAGCTCGCGCCTCACGGCGTGCCTCGGCATCTGCTTGCTCAGGGCGTCGGCCTGTGGGCTCCCCATTTGACCCGTCTTGAAACACTGAACAAGGAGTCTGACATATGTGCGAGTCAAAGGGTGAGTAAACCCATAAGGCGCAAGGAAGCTGATTGGATGGATCCCTCACAGGTGCACAGCCGACCGACCTTAATCTTCTGAGAAGGGTTCGAGTGTGAGCATGCCTGTCAGGACCCGAAAGATGGTGAACTATGCCTGAGCGGGGCAAAGCCAGAGGAAACTCTGGTGGAGGCCCGCAGCGATACTGACGTGCAAATCGTTCGTCTCACTTGGGTATAGTGGCGAAAGACTAATTGAACCATCTAGTAGCTGGTTCCCTCTGAAGTTTACCTCAGGATAGCTGGAGCTGGAAACGAGTTCTATCGAGTAAAGCCAATGATTAGAGGCCTCGGGGATGCAATGTCCTCGACGTATTCTCAAACTTTAAATAGGCAGGACGGGGTGGCTGCTTTGTTGAGCCATCCCACGGAATCGAGAGCTCTAAGTGGGCCATTTTTGGTAAGCAGAATTGGCGATGCGGGATGAACCAGAAGCCGGGTTATGGTGCCCAACTGCGCGCTAACCTAGAACCCACAACTCACCTGCCAAATCAACTAGCCCCAAAAATGGATGGCGCTGAAGCGCCCAACCTATACCTGGCCGTCGGGGCAAGAGAGAGGCCTCGATGAGTAGGAGGGCGCGAGCCCGGGCGGAGCGGCCATCGGTGCAGATCTTGGTGGTAGTAAGGGAAATGTTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCATAAGAGTCGGGGGAAACCCGTCTGATAGCGCTCTTCAAAAGGGGATCCGGTTAAAATTTCGGAACCGGGACATGGCGGTTGACGGCAACGTTAGGGAGTCCAGAGACGTCGGCGGGAATTCCGAAAAGAGTTATATTTTCTGTTTAACAGCCTGCCCACCCTGGAAACGGCTCAGACGGAGGTAGGGTCCAGCGGCTGGAAGAGCACGGCACGTGGCGTGGTGTCCGGTGCATTCTCGGTGGCCCTTGAA
AATATGGAGGACCGAGTGCCTCTCACGCCCGGTTGTACTCATAACCGCATCAGGTCTCCAAGGTGAACAGCCTCTGGTCGATGGAACAATGTAGGCAAGGGAAGTCGGCAAAATGGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGGCTGGGTTCGGGGGTCCTAGTTCCGAAATTCTCGACTGTTGGTGGGCTGCTTGAGCCGAACAGACCGCCTCGTGTCAGCCGGGGGATGGACTGGGAACGACTCTTTGGGGAGCTTTTCCCGGGCGTCAAACAGCCAACTTAGAACTGGTACGGACAAGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGTCCCTGCGGATGCTAACACAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCACCCAAGCGTGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATAAGTGATGCGCATGAATGGATTAACGAGATTCCCAGTGTCCATGTTTACTATCCAGCAAAATCACATCCAAGGGAATGGGTTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTCACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGAATAAGTGAGAGCTCCGGTGCAAGTGAAATACCACTACTTTTAACGTTATTTTACTTACTCCGTGAATGGGAGGCGGGGTACCAACCCCTTCTTTTAGACCCAAGACTCGCTTCGGCGGGTCGATCCGGGCAGAGGACATTGTCAGGTGGGCAGTTTGGCTGGGGCAGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGTTCAACGAGAACAGAAATCTCGTGTGAAACAAAATGGTAAAGCTCGTTTGATTCTGATTTTCAGTACGAATACGAACCGTGAAAGTGTGGCCTATCGATCCTTTAAACCTTCGGAACTGGCTTGTGGCAGCCATGCGTTCATAGCGATGTTGCTTTTTGATCCTTCCATGTCGACTCTTTCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGATCGTGAGACAGGTTAGTTTTACCCTACTGATACCCGCATCACAATAGTAATTCAACCTAGTACGAGAGGAACCATTGATTCGCACAATCGGTCATCGCGCTTGGTTGAAGAATAGTCAGTGGCGCGAAGCTACCGTGCGTTGGATTATGACTGAACGCCTCTAAGTCAGAATCCGGGCTAGAAGCGACGCATGCGCCCGCCGCCCGATTGCCGACCCTCAGTAGGAGCTTCGGCTCCCAAAGGCACGTGTCGTTGGCTAAGTCCGTTTGGTGGAAGCGCCGTTCGGACCGCCTTGAATTATAATTACCACCGAGCGGCGGGTACAATCCTTTGCAGACGACCTTTGTCGCTAAGATTCGA\n>LZPO01045535.1/8544-8610 Neotoma lepida isolate 417 scaffold_13965, whole genome shotgun sequence. \nGCTGGGGTAGTTCAAAGGCAGAACATTTGCCTGGTATGCATGAGAGCCTGGGGGTCATTCCCCAGTA\n>AHJH02011678.1/302-41 Hammondia hammondi strain H.H.34 contig09893, whole genome shotgun sequence. 
\nAGCGACAATCCTACCACTTAGAGTTGTCGGATCACTAAGACCGACTTTCGTCCTTGTTTAAGTAGTTACTCTCACAATCAAGCCTTTTACGCAACAGTGTTTTAAAAGATAATTATTGTCTAAAAAAAAACTCATATCTAATTAGCTAGTTGGTGAAGTAATAGTTTTACCAAGGCGAAGATTAGTAGCTGCCTTGAGAGGGGAAACAGCCACATAGAGATTGAAATACAGCTCGGCTTATCACACAGTAGGGTAGCTGCAG\n>MTEO01000012.1/38100-38064 Desulfobulbaceae bacterium A2 Ga0073110_1012, whole genome shotgun sequence. \nGTTTTCCGGGGCGCACGCGCCCCGGCCTCTTTGAAGC\n>CP003050.1/1069873-1069696 Halovivax ruber XH-70, complete genome. \nAAGTACCTCTGAGTCCGTCGGACGATACGTCCGCGGATAGGAGTAACGGCTGGTTGGCGCAGCCATCGACTCACCTGTTCGACAAGTCAACGGGTGGATTCCACCCACAAGAACAGGTTGTGTCGTAGACCTTAATATCCCAACTGCGGTCGGGAATCCTCGCCCTTCAGGACGGGAG\n>JMFI01080173.1/8540-8495 Phalacrocorax carbo contig80173, whole genome shotgun sequence. \nAAAGAGGTCTTCCTAAAGACCACACCAGCCTTTGAAGCACACTTTA\n>LDZF01000115.1/1-68 Pluralibacter gergoviae strain JS81F13 contig_136, whole genome shotgun sequence. \nAAACCCCTTTTGATTTGTTAAAACAGATTGCGGTCTGGCAACTGCAACGTTTAACAAGAAATCAAAAG\n>AWGX01000534.1/1451-1535 Smithella sp. ME-1 CONTIG_7599, whole genome shotgun sequence. \nTAGTAAATTTATTTACTTGACAAAAAAGTAAAGTTTTATTAAATAAAAATCGTTCGCTTGGATCCGTAAGGACTGAGACGAGAGG\n>JMFL01092903.1/16205-16066 Opisthocomus hoazin contig92903, whole genome shotgun sequence. \nCTGCATTCTTAACCCTCCTGGCAGCTCTGTTTATTAGCTTCCAGGATAAGAATGAATGCCAGAGAAAACTGTTGATTAATCCAAAATGAAGAGCTCTCCTCCCGTGGCTCTCCATTATTTCACGTCTTCAACATTGATTT\n>JJRE01013351.1/703-1 Phoenicopterus ruber ruber contig13351, whole genome shotgun sequence. 
\nAAAACAAGCGAGGTAGTGGTATTTCACCAGGGCCGGGAATGGCTAGCATGCAGGGAAAACAACTGGGCTCGGTAACACGACGCGTCATACGCCTGCCGAAAGACACCAATTGCTGGACTCGTCTAAGGTGGACAGGTCCCCTATGCTTAACCTGGAAAAGGAACATGTATAATTTTATATATGTTTGCTAAATAGCCAAATGCCTCGTCATCTAATTAGTGACATGCATGAATGGATGAACAAGATTCCCACTGTCCCCACCTACTATCCAGCGAAACCACAGCCAAAGGAACGGGCTTGGCGGAATCAGCAGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCTGGCGCTGGGAAGAGACATGAGAGGTGTAGAGTAAGTGGGAGGCCGGGTGCACGCTCAGCAGTGCGACCTGCCCACCAGCACCCCGGCCATCGGTGAAATACCACTACTCTGGTCCTTTTTTCACTTACCCGGTGAGGCGGGGGGGGGCAAGCCCCAAGGGGGGCTCTCACTTCTGGCACCAAGCGCCTGGTGTGCACCGGGAACAGTGGCAGGTGGGGAGTTTGACTGGGGCAGTACACCTGTCCAAGCGTAAGGCAGGTGTCCTAAGGCAAGCTCAGAGAGGACGGAAACCTCCTGCAGAGCAGAAGGGCAAAAGCTCACTCGATCTTGTTTTTTCAGTATGAATACAGCACACG\n>MERU01000008.1/32885-32784 Burkholderiales bacterium RIFCSPHIGHO2_01_FULL_63_240 rifcsphigho2_01_scaffold_62, whole genome shotgun sequence. \nACTTTCGAGGAGCGTTGCAAGGCCCGTCCCGTCGTTGAACACGGCGCGAACCGCTGGCCCCAGGCTCGAAAGCTTCTCCTTTTGCAACGGCGCTCACCCGCA\n>FQTV01000009.1/145137-144950 Bacteroides luti strain DSM 26991 genome assembly, contig: Ga0131163_109 \nTATCTTTGTTTCGGTTTTGGTAACAAAGCTTATGCTTTAGGAGAAAAGGGAATACCGTGAAATCCGGTAACAGTACCCGCTGCTGTGATTCTCGAAGAACTTGAGTAACAAGCCACTGCATTTATTTGTGGGAAGGCACTTTAAGAGAGAGATAAGTCAGAAGACCTGCCAGAACTACACATTATAGA\n>HG764815.1/187153-187284 Tetrasphaera australiensis Ben110 genomic scaffold, 2552_scaffold1 \nCGCGTTTTCGCTCAGGCGGAGCTCGACCGCCGACTCAAGTGATCGTGGCCTATATCGACGCCTATCGGGGTCAGTTCGGCGCCCATGCCGATCTGTGCCGTGCTGACCGAGCACGGCATCACGATCGCGCCG\n>MIJY01000003.1/25265-25023 Enterococcus termitis strain LMG 8895 11, whole genome shotgun sequence. \nCAAAACACATATTCAGAACAAGTAGTCATCGTTCATTTCCTGACAGAGACTTTTTCATTCGCTGAGAGAAAAAGCTGGAAACCGTTGACGAACACATCTGTCTAGTCAGCTTCTGAATTTAGTAAGAAGCTGCGGCATTCTCCGTTATCAGAAAAGAATCTCTATTACTATTAGAGACTCTATGAGGTCACCATTGCGAAATCGTGACAAATTGAGGTGGAACCGCGAATCTTCGTCCTCTTG\n>CM000999.2/135584192-135584306 Mus musculus chromosome 6, GRC primary reference assembly. 
\nTGCTGAGTGCAGTTCCGGGCTGCTTCCATGTTCTGTTAATTAAACATTGAAATTGGCTGAGAGAGATGATTAAATGGAAAGTGTTATTCTGTTCATATACTGATAGCTCACATAT\n>JXUM01069429.1/36725-36871 Aedes albopictus isolate Foshan contig69429, whole genome shotgun sequence. \nTTCAGGCCATATCGAAGCAGGACAAAGGCCATTTCTTATGCCTGTTGTCCTGTCAAAAATTGGCCCAGAGTAAACGCTCCGTCGACGGTCATTGGAAGCCTTGACATCCGTGTGGTTTACCAATAACATATTTGGCGGTGTACAATA\n>CM000999.2/123737012-123736886 Mus musculus chromosome 6, GRC primary reference assembly. \nCCAGCTCCTAGAAGGGTTGCAAGTGTGGCTGCTGTGTCATTTCTGCATCAGGATGTGGCAGAGAAGAGAGAGACAAAAAAAAAAAAAGACCTTCAGTGTTCTGACCTATGATTAATAGCCTAACAGT\n>AP012044.1/987471-987303 Oscillibacter valericigenes Sjm18-20 DNA, complete genome. \nCGCTCAGATAGAGGCGCGAGGTTCATCAGTACCGCGAGCAGCCGGCAGGCAGCCGGCGCGGGAAAGGGGACATCGCCGAAGGGTTTCGGAGCTGCCTGCTCCGAGATACCTGGGCTGTCGGGGAATACCCGTCGGACTGTCACATTTTTTGTGAAGCGCTATCGATGGC\n>ACPB03020461.1/16978-17135 Rhodnius prolixus Rhodnius_prolixus-3.0.3-473.8, whole genome shotgun sequence. \nAGAGTCCTGGCGTCGAGGTTACCATGATCAACAAGGTGGTTCCTCCAGGGTGAGGTCTATTCATTGCACTAAGAATTGGCTGACCCCTGCGAATGTTCCAAAAAATATTTCTAATAGTAGAATTCATTAGTGCTATACTATTTTTGAAATAATATAAA\n>AFYH01196721.1/7358-7251 Latimeria chalumnae contig196721, whole genome shotgun sequence. \nATGAGTCGGTGCATCCCCAAGAGGGGAGGTTGGGAGGGTATTGGTGTGGCTGTATGGAGTATCCCTAATACCCTCCCAACCTCCCCTCTTGGGGATGCACCGACTCAT\n>KQ959571.1/48198-48573 Clostridiales bacterium KA00274 genomic scaffold Scaffold7, whole genome shotgun sequence. \nGGGGATGTAAAGGCTTCGACAGGGTTGTTGAGATTGGAATAGCGGGTAGAGGATGCGCGTTGGCCTCTTTAAAAAACGGGCAAAAAATTTAGTTGCAAAAACTAATAGATTCGCTGTAGCTGCGTAAGCTTGGCGCACAAACTTGATGAATCTGCTAATTGAGTGATTGTGTTAGACTAGCAGACCTTGATCGTTAGAGGTCAAACTTTCAAATTTCAAGTTAAGCTTTGCCCTTGGAATTATCTATGAAGCTACTTTCATAAGCGATTGTTCAAAGTCTACCTTATGAGGGGAATTTAGAAAATTTGAACTGCACCCGGAGAAGTTCTGATTAAGGCGATTTTGGACACGAGTTCGATTCTCGTCATCTCCATTC\n>CM000998.2/25188643-25188361 Mus musculus chromosome 5, GRC primary reference assembly. 
\nGGATGTGAGGGAGATGTGGCTACATCTGTCACCCCACTGATTACCAGGGTTGATCACCTGCTTTGGCTAACCCGCCTCCCTCATCCTTCCACGTGTGCCCTTCTGGACTTTCCCTGAATAGAGGACGACCAGTCTTCAGTCAAGAGTACATGAGTAGATACATTCCCCTGCTAGAACCTCCCAACAAACTCTCAAGGGAGCTGAATTCTTATGCCACATGTCTACTACAAGATAGTATGCACATACACGGTAGGCAGGTGGGGCAGGGAGGGGCTTCTTTCGT\n>AODH01000041.1/17134-17262 Brochothrix campestris FSL F6-1037 c41, whole genome shotgun sequence. \nATAACCTTTAACCTAGTCCAGAGAGACTAAGAAGGCATTGAATCGTATACAGGGGTAAAACTACCTTTGTAGAACAGTAGTTTGGCTACTGTTAAAAACGCTTATGCCCTCGCATAGGCGTTTTTTTTT\n>GL010035.1/48904364-48904178 Loxodonta africana unplaced genomic scaffold scaffold_8, whole genome shotgun sequence. \nTTGAACCGGTTCTTTCTGGTTCGACCCCCTGCTGAGATGTGAATTTCCACCCCAGATATACTGAATCAGAACCTACATTTTAACTATAATTTTAAAATTTTAACTATAATGTAGGTTCTGACTCAGTATATCTGGGGTGGAAATTTAAATTCTCAGCAGGGGTTCGAACCAGAAAGAACCAGTTCAA\n>LQXD01000036.1/27026-26945 Anaerobacillus sp. NB2006 Ga0137927_1036, whole genome shotgun sequence. \nAAAGAGCTATAACCGCTCATTAAAGGGTTTTGAAGTATTTGCTCTTAGCAAAACACCCCTCATGGCGAGTCTGAGTATATTA\n>CGIH01000026.1/124551-124798 Syntrophomonas zehnderi OL-4 genome assembly, contig: OL-4DRAFT_scaffold-26 \nTAAAATGTGATGAACAGGACAAGTAACCTGCCGGTAACCTTGCAGGGAGGCCGTATCATGGACTGAAAGTATGGCCAGGGGAAAGCAGTTGAATTCACCTGGGAACAGTAAACTGAAACATAGATATCTTTTTACCGTCTATTCAGTAGGTTTAACCGCAGGTCGGCGTTAAAGACATCAAGTGAACCGGTTGCGTTTGACATCGGTTAATCGGGGTGGTACCGCGGAAGCAAGCTTTCGTCCCTTGG\n>CP011382.1/3084471-3084633 Calothrix sp. 336/3, complete genome. \nAAAATTAAATATACCAAGCCGGAGACAGCAGGTGTCCTTGACTTAAATATCCTGCCTAGGTTTGCACTCCATTTGTTCCATGAAGACTCATAGTGGTTTGACCATGGCAAAAAGAGATTTGTAAAACCCCGGCTTGGTATAGCTGGGGTTTATTAATTGGGGA\n>MFFM01000041.1/12342-12480 Candidatus Edwardsbacteria bacterium GWF2_54_11 gwf2_scaffold_564, whole genome shotgun sequence. \nAAATTGAATCTCCGATCCCGTTTTTCTAAAGCTTAAATGCCATGGATGACGGGACGGTTCCCCCGAAAAGGGCGGACAAGGGTAGGACTGGAAACGGTCTTGCCTCCCGTGTTTGGAAAGGAGAGGTTGCGATTAACTT\n>CM000237.2/27621459-27621601 Rattus norvegicus chromosome 7, whole genome shotgun sequence. 
\nCCTGCCCCTAGAGGCATTGCAGCTACGACTGCTGTGTCATATGTGTGTCAGTAGGTGGCAGAGATGAGACAGGCTATGTCTATGCTCAGTGTTCGGACCTGGGAAACCCGGGGGTGCAGGTGGCAGGGAGTGAGCCTAAGACA\n>CM000780.4/158285691-158285793 Zea mays cultivar B73 chromosome 4, whole genome shotgun sequence. \nGTGCGAATCACAGTGCAGCTCTCCTCTGGCATGAAGGCTGTGAGAGAGGCATGACAATTTCTGGCCTTGCCCTGCCAAAGGAGAGCTGTCCTGCCATTCATTA\n>CM000236.2/108598299-108597972 Rattus norvegicus chromosome 6, whole genome shotgun sequence. \nGGGTGCAAAGGCAATCTGCCTGTGGTGTCGAGCACCCCGTTGATAACCAGAGTTGAATCAGCTGATCTGGAAAGCTAGACAGGTGTCCTCTTCCTCCCTCACCACGTTCCATGTGCCTCCTTCCTGGGGCTGTGTATTTGATGGCAAAGGAAGATCTTCTCAGATAGAAGAGGGCCAGCCGCTGTTAAAGATATCTAAGCAGCTGCTAGATCCCCTGCTAGAGTCTCCAAACAAAGCCCTCAAAGTCCAAAGGCACAAATGGTAAATTAAATGGCAGTAATGTTGATCGAAACCCTCTGTGTTTGAGGAGGTAGCTCTCAACTCTGAG\n>FRBW01000003.1/337999-338120 Labrenzia suaedae strain DSM 22153 genome assembly, contig: Ga0131142_103 \nTCGCGTCTCACCGAGCTACCTCCTCCCAAGCTCGAGACGTGCGACCCGGCGGAGCATCCTCCTCCCAGTTCCGCCAAGTCAAATGCGCCTGCCAGCACCTCCTCCCGCTGGCGGGCGTTTTG\n>MNUO01000109.1/8594-8798 Candidatus Desantisbacteria bacterium CG1_02_38_46 cg1_0.2_scaffold_8344_c, whole genome shotgun sequence. \nCAAGTCCGACTTAGGTAAAGGTTAGCCACCAGCCTAACACTTAATCTCACACTTTATTTGGTAACAAATAAAGTGGTGCGGGAAGCGGGAAATATCGAGCTATAACGCAAGTGAAGGAATTGAGCCCCGAAATAACCAGCGTGTCAGTGGTCGATACTCTTCATTAAGGAGCAGACAATAGTCTCACAACCGATAAAAGGCGAGG\n>AAGD02011599.1/18221-19185 Caenorhabditis remanei strain PB4641 contig406.1, whole genome shotgun sequence. 
\nAATTATGAAGTAAGAAGTAAGAAAGAAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAAAAATAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTTTGACATTGTGAAGAGTCATGAGAGGTGTAGCATAGGTGGGAGACTTCGGTCGACAGTGAAATACCACCACTTTCATCGACTCTTTACTTATTCGGTTGAAAGAGAATTGGCTTCACGGCCTTTTTTCGAAGCATTAAGCGGAGCCATTTTATGGCACCGTGACTCTCCTCGAAGACAGTGTCAAGCGGGGAGTTTGACTGGGGCGGTACATCTATCAAATCGTAACGTAGGTGTCCTAAGGCGAGCTCAGAGAGGACGGAAACCTCTCGTAGAGCAAAAGGGCAAAAGCTTGCTTGATCTTGACTTTCAGTACGAGTACAGACCGCGAAAGCGTGGCCTATCGATCCTTTTAATCCTGATTGTTTCAGGTAAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTCCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGCGAAGCAGAATTCGCCAAGCGTTGGATTGTTCACCCACTAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGTTGACTTGTTATTGCTAAAAACGACGATTTTCCATGTAAAAACACGTAACTTCCACTACGAACCTTCCTCGTCTATCAATCACTCCTTGTCTCGGATCCATCAGCCCGCCGAGCTTCGGCTTTCCGTTTTCGTAGATCTCTGGGAACTCGACATGAGCGACGGACATTCTTTTCTGCAAAAAACCAAAATCTTAGCCGTGTTTCCCGATTTTTCCGCATTACAATACGGTGCCGGATTTCTACACCGTCAATCGCTCTTCCGAGAGGAGTACACGGCCGGCGGCCTAGGAA\n>ABLE03011848.1/1-1240 Caenorhabditis japonica strain DF5081 Contig9538.1, whole genome shotgun sequence. 
\nGACTTTTGAAGAGAGAGTTCAAGAGAACGTGAAATCGCTGGAGTGGAACCGGAGACAGTTGATGTTGCTTGGAGACAATCTTGGTGGCTGATCGCTTAGCTGTGATCGCCGCCGGGAGTCGTTTCCTATGCTACGCCGACGGCGTTGGCCGCTCGTTCTGGCCCGACAGTGTTGCCCATCTCGCAAGAGACGGTGTCTTGTTGTCGGTCGTTGGTTCGTGGTGGCTAGCGTTTAGTTACGCTAGTGTGTGTGACGTCGGTGTGAAAGTCGACGACGTTTCCGACCCGTCTTGAAACACGGATTACGGAGTGTTTGTCTGCTGCGAGTCAAAGGGTGTAAACCTTGCGGCGCAATGAAGTGAAGGTTAGTCTCGAACTGACCGACGTGGGATCCGTGCTCTTCGGAGTGCGGCGCACCACGGCCCTATGCGTGTCACTTGTGACTGTGTAGAGGTTGAGCAGTAGGCAAGCGACCCGAAACGATGGTGAACTATGCCTGAGCAGGATGAAGCCAGAGGAAACTCTGGTGGAAGTCCGTATCGGTTCTGACGTGCAAATCGATCGATAGACTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCTTCCGAAGTTTCCCTCAGGATAGCTGGAACTCTTGCAGTTATATTCGGTAAAGCTAATGATTAGAGGCCTTGGGGACGTAATGTCCTCAACCTATTCTCAAACTTTCAATGGATATGGCGTCGCAGTTTCTTTAGTGAACTGCGGCGTGAATGCGAGTTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGCTGTGGGATGAACCAAACGTGGAGTTAAGGTGCCTAACTTCTCGCTTATGAGACCCCATAAAAGGTGTTGGTTGATATTGACAGCAGGACGGTGGCCATGGAAGTCGGTACCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCTGAAAATGGATGGCGCTTAAGCGAGAGACCTATACTCCGCCGTCGCGGCATGTGCGTTGTCTAGCGCCCAGGTCGCGACGAGTAGGAAAGGACGTGGCGGTTGCGTTGAAGGCTATGAGCGTAGGCTCGGCTGGAGCTTCCGTCAGTGCAGATCGTAATGGGTAGTAGCAAATATTCAAGTTCGATCCTTGAAGACTGAAGTGGAGAAGGGTTCCACGTGAACAGTAGTTGGATGTGGGTCAGTTCGATTCCTAAGGTACTGGCGAAAGCTTTG\n>JH159154.1/6686760-6686937 Phytophthora sojae unplaced genomic scaffold PHYSOscaffold_4, whole genome shotgun sequence. \nATGCTTCCCAGGGTGACTACCGATTGGCCAAGAAATGCATGTATGAAAAATGAGAGCGTTGACATGAGCCGGAGCAGGCCCCTTGCACTCCGGTGCTGTAAGGGTTCAGGAATGCTCTTTTGAGTAATTCCACAGTAGAATTTTTGTCAGCGGGGGTGAGCGCGTGCGCCGCCCCCAC\n>AAOX01000007.1/31274-31356 Bacillus sp. NRRL B-14911 1099999053126, whole genome shotgun sequence. \nAAGAATATAGAACACTGTGATGAGCGGTTTTTATTTGCACTTTAAACCGCTTGGAGTGACTAGTGCAGCCGGCCAATGATCTA\n>AZAQ01049668.1/23412-23144 Stegodyphus mimosarum contig49668, whole genome shotgun sequence. 
\nGGCTTAATTTGACTCGACACGGGCGAACTTTACGCGGCCCAGACACAGGAAGGATTGAGAGATTCAAGAGCTCTTTCTTGATTCTGTGGGTGGTGATGCATGGCCGATTTTAGTTAGTGAAACGGTTTGTCTGTCCGATAGCGAAAGACTCTAGCTTACTAAATAGACGCTCCGATCCTTCGAGTCGGACGTTCTTAGAGCGACGTTTAGCTGCATGAGACAGAGCGATAAACAGGTCTGTGATGCCCTTAAGATGTCCGGGGCCGCAC\n>CP002691.1/7079696-7079516 Haliscomenobacter hydrossis DSM 1100, complete genome. \nATTTTATAGAGAAGAGGGGAGAGAACGGGCTCTAAGAACCTCTGGCAACCATGCTTTTTTAAGCGAAAAGTGAAAAGCGAAAAGTGAAAAGTAAGATTAGCTGCTTTTCGCTTTTCACTTTTCACTTTTCACTAAATAAAAGTAACGGTGCCAAATCCCGCCATTAATGGGCATATAAAAT\n>AB701766.1/10364-10418 Culex flavivirus RNA, complete genome, strain: Toyama71 \nACGCGCGCAAGGAAGGACATGGCTGTCCTTGGGTACTAACGACACCCCGCCCCCA\n>LFJF01047439.1/12546-13056 Macrostomum lignano unitig_47506, whole genome shotgun sequence. \nTATCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTCTAAGTACAAACCTTAATACGGTGAAACCGCGAATGGCTCATTAAATCAGCTATGGTTCCTTAGATCGTCTCATCCTACTCGGATAACTGTGGAAAATCTAGAGCTAATACGTGCTTACAAGCCCTGACCTCACGGGAGGGGCGCATTTATTAGATCAAAACCAATCGGGGCTTGCCCCGTCTGCTTGGTGACTCTGGATAACTTTTGTGGCTGATCGCATGGCCTCTGCGCTGGCGACGTATCTTTCAAGTGTCTGCCCTATCAACTTACGATGGTAGGTGATATGCCTACCATGGTTATAACGGGTAACGGGAATCAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCTAAGGAAGGCAGCAGGCGCGCAAATTACCACACTCCCGGCACGGGGAGGTAGTGACGAAAAATAACGATACGGGACTCTTTTGAGCCCCG\n>KE124372.1/17462-21459 Plasmodium falciparum UGT5.1 unplaced genomic scaffold supercont1.10, whole genome shotgun sequence. 
\nGAGGATAAAAATAGGAGGGCAAATCCGCTGAACTTAAGCATATAATTAAGCGGAAGAAAAGAAAATAACTATGATTCCTTTAGTAACGGCGAGTGAAGAAGGAATAGCTCAATAAGTAGAATCCTTCGAATCTTAATGATATATTTATACATAGAATAAAGAATTGAAGGAATTGTCAAGTTGAATTGTACTCTTGTAGGCCTCACAGGTGAAATGAATATATAGAAGTAAAGTAGGAATACTTCCTCATAGAGGGTGAAAGGCCCGTATCATATATCATTTCGTGGGCTTTGGAGTATTTATATTTTACTGAGTAGTGTTCTTTGAGATTGGAGCACAAATTGGTGTGATACATTTCACATAAAGCTAAATATGTACAGGAGACCGATAGCAAACAAGTACCGTGAGGGAAAGATGAAATAGTACTCAGGAATGAGCAATTAAATAGTACCTGAAATCGTTAAGATGGAACGGATTAAGAGAGAAAACAAGTAAAGAGGGGAATTTTTAATTTTTTTTGTTATAATTCTCTTCTTTATTAAAAGAAACATCAGTGATTAATTTAATTTCAATAAAGCAATCCCCTGAAATTCAAAATTTCTTTTAATTTTGTTTTCACTTTCTCCCCGCACTAATGTGGGGAAAACTGGCTTTATTTCTTCAATTATTTTTTTTGCTGAGGAATTTTAAAATTATTTGAATTTTTCTTCTTATAATTTAAGTTGTTTCTATATAGTACTTTCTTAACCCACTCGTCTTGAAACACGGACCAAGGAGTCTAGCAAATGTGCAAGTGTATATGATTCTTTAAACATTTCTCTTTTTAATATACGCATAATTAATGTAATATGTTTCTTTATTGTAGATTTGTGGTGTTTAATTTTTATTAAATCCCCACTTTGCATACAATACCGGTAAGCAATTATGCTTTATTGAGTACGAGCATATTTGGTAGGACCCGAGAGGCTTTGAACTAAGCGTGATGAGATTGAAGTCAGGCGAAAGTCTGATGGAGGATCGAGTTGATACTGACGTGCAAATCGTTCATTTCAATCACGTTTAGGGGCGAAAGACTAATCGAAAAGCCTATTAGCTGGTTATTTTCGAAAGATCTCTCAGGATCGCTGGAGTTGAGTTGATTATAATTTTATAAGGTAGAGACAATGATTAGAGGGTTTAGGGGATTAAATATTTCTTAACCTATTCTCAAACTTCCAATATGTAAAAAGGGTGATATATCTGAATTGTGTGTATTTCACTCTGTTTTAAATAAAATAACTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGAGGGATGCTCCTAACGCCTGGATAAGGTGCCTAAATATTCGCTCATGAGATCCCATAAAAGGTGTTGGTTCATAATGACAGTAGGACGATGGTCATGGAAGTCGAAATTCGCTTAGGAGTGTGTAACAACTCACCTACCGAATGAACTAGCCCTGAAAATGGATGGCGCTAAAGCGAATTACCGATACCGGGCCATAAGAAGGTAGAAATTATAAATGTTAATTTAGCTCAGATCTTTTTATGAGTAGAAAATCGTGGGGTTTGTGTTGAAGCGAAATACGTGAGTTTTCGTGGAACATCTCCCTAGTGCAGATCTTGGTGGAAGTAGCAACTATTCAAATGAGAACTTTGAAGACTGAAGTGGAGAAGGGTTTCTTGTCAACTATGTTTGTACAAGAGTTAGCCACTCCTAAGGGATAGCTGAAAAGTGTTTAAAAGAAGAAATTCATTATAAGAATTATATAATGAAACTTCATCTCGAAAGGGAAACAGGTTAATATTCCTGTGCCATAAGTAATAAGAGTGCAAACAGAGATGGTAACATACATATAAATGAACTCCTTNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN
NNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNGTAAGGGAAGTCGGCAAAATAGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGACATTAGAAAAGAGAAGAAAAAAAGAGGGTTGAGAATAAAATTGCAGATTTATTTGCTTTTCTCTCTGATTTGCTTGTAAATTTTCTTTTTCTTTTTCTTCTTTTCTTTTTTTTTCTGTCCCTCTTTTCGTCTTCATTTTATTGTAATTTTTGTTACTTTAATTTGATACATATATAATGTTAACTCAGAACTGAAACGGACAAGGGGAATCCGACTGTTTAATTAAAACATAGCATTGTGAAAAACCATAACTGGTATTAACACAATGTGATTTCTGCCCAGTGCTTTGAATGTTAAGTTGATGAAAAATTCAATTAAGCGCAGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTACTTGCTATCTAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAAAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTTACTCTAGTCTGGCTTTGTGAAACGACTTAAGAGGTGTAGCATAAGTGGGAGTAGAAACTGAAATATGTTTTTACGACAGTGAAATACCACTACTTTTAAAGTTGTTTTACTAATCCATTGATAGGGATATATAAAACTTATAAATAATTTTTATTTTAAGTTACTTTTGAATTTAAGATATGTGTGCATTTATATCTATTAAATCCCATTTTGTATATATATATATATTATATATATGTGTATAATACGATTTTTTTTATGGAGACATAGTTAGGTGGGGAGTTTGACTGGGGCGGTACATCTGTTAAAAAATAACGCAGATGTCCAAAGACAAGCTCAAAGAGAACAGAAATCTCTTGTAGACTAAAAGGGGAAAAGCTTGTTTGATTTCTATTTTCAGAACAAGTAGAAAACGTGAAAGCGTGGCCTATCGATCCTTTATATTTGCAAAATGACGTAATAAATTACTTACTACTGTGCATATAGAGGTGTCTGAAAAGTTACCACAGGGATAACTGGCTTGTGGCTGCCAAGCGCTCTTAGCGACGTAGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGGGACGCAGAAGTCTCAAAGTGTCGGATTGTTCACCCGCTAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGAATTTTATTATATTTTTTATATATACATATAGTATTGTGACAGTAATCCAACTTGGTACGAGAGGATTAGTTGGTTCAGACAATTGGTACAGCAATTGGTTGACAAACCAGTGTTGCGAAGCTAAGTCTGTTGGATAATGGCTGAACGCCTCTTAAGCCAGAACCCATGCTGATTAGACAATTCTAAATTTGATCTTTTTGTTAAACGATAAAAATTATATATATATTTTTTTTATCTTTACTGCATAATGTAAAAGAGAAATTATACATATATATATATATATATATTAGAAAAGAAAAAATGATGTAATTAATTATTATTATTATTTTTTTTTTTTTTTAGTATTAATATATAATTATGAATATATAAATAATCCTATATCTTTATATAAAAATTAAATTTTTAATTTTATTAGAATTTTTTTTTTTTATATATATAGATTGTAATTTAACAACAAAAAGTATTAAGCCCAAATCGTAGACGACTTTTCTGTCTCAGAGTACTGTAAACATGAGAGTAAACTTTGTTTTACGATCTGTTGAGGTTTATCTCTTGTGACATTGAGCTAA
\n>MDLB01000098.1/10133-10486 PVC group bacterium (ex Bugula neritina AB1) isolate AB1-3 AB834_contig000098, whole genome shotgun sequence. \nAAAGTTGATTGGATCATCGGTGCTGTTGATCTCAAGATATTGATTTAACAGTGCAGGAAAGTCTGGACTCCGCAGGGTAAGATGCTACTGTTATGGTTGTGAGGGTGACCTTAAGGAAAGTGCCACAGAAAAAAAACAGCCTATTGGAAACGACTCGTTTCGATTGATGGGTGATGGTGAAAAGGTGAGGTAAGAGCTCACCAGTTCTGGTTTGAAACCCAGAAGCTAGGTAAACCCCATCTGGAGCAAGACCAAGTAGGAAACGTGATAGTTACCCGCTATATGTTTTCGGGTTGGTTGCATTAGATGAATGATGGTCATAAACAGAATCCAGCTTATAGATCAACTTTGCCT\n>JRRC01046601.1/9504-9338 Gossypium arboreum cultivar AKA8401 contig_129_9, whole genome shotgun sequence. \nACTTTTTAAGTTTGCTGTCAAATCTCAAGGCTCAACCCTAGACAGGCGGTGGAAACTACCATGCTGGAGTACGGTAGGGGTAGAGGGAATTTTTGGTGGAACGGTGAAATGCGTAGAGATCGAAAAGAACACCAACGACGAAAGCACTCTACTGGGCTGACACTGAC\n>JH835603.1/135856-135729 Erinaceus europaeus unplaced genomic scaffold scaffold00315, whole genome shotgun sequence \nAGCCCCATTCTAGATGAAAATGGGCACTGTTGCTTTTGGTGTTCAGAAACAGATGTGGCTATATTGATACAGGTTAAGCTTTCACCATAGTACCTTACTGTAGTGGTGACAATGAGGCTGCAACATGT\n>KV428048.1/4065-3885 Sistotremastrum suecicum HHB10207 ss-3 unplaced genomic scaffold SISSUscaffold_45, whole genome shotgun sequence. \nTTCGTGCGGCGTCACGGCTATACTTTCCCCATGTTGCTCACTTCTGCTGATCGTGCGGTGGTTCGAGTGTCAAGCCGTGTCCAGAATAATTTTCGTGGACGTCTTAGTGCCTTTTTAACCCTCCTTTTATGGCTCTTGTAGCCTTTTTGGGAGGAGGGTTGGGTCGGTGGTTCTTACACTC\n>MGVC01000060.1/14949-14867 Elusimicrobia bacterium RIFOXYA2_FULL_39_19 rifoxya2_full_scaffold_498, whole genome shotgun sequence. \nACGTTATCCCGCTACTGGCGGATTTGTGGGCCTAAACCACAAGGGACCGGGATAATTTCAAGCCGACCGCCTGGGCAGAAGTT\n>LZPO01057484.1/678881-679115 Neotoma lepida isolate 417 scaffold_0, whole genome shotgun sequence. \nGGATATGAGGGTGATCTGACTTGACAGTGTCTCCTTTCTCCCTTATTCTTCCATGTGTGTCCCTCCCGAAGGTGCCCATTCACTGTTTTGAAGACTAAAGGAGGATTGGACAAGTACCTGTGCTCCACTGTTAGAGCCTCCAAACAAACTCTCAAGAAGAAAACCAGATGAGAACAGATGGCCAGATAGTTTATTGTTCATCACTCTAAATAGTAGACACAATTCAAATTATTCT\n>AAAB01007393.1/1-1983 Anopheles gambiae str. 
PEST whole genome shotgun sequencing project, whole genome shotgun sequence. \nATACCATGAAAGGTGTTGATTGCTAAAGACAGCAGGACGGTGGACATGGAAGTCGTCATCCGCTAAGGAGTGTGTACAACTCACCTGCCGAAGCAATTAGCCCTTAAAATGGATGGCGCTCAAGTCGTTTGCCTATACATTGCCGCTGGCGGTATGGCGCATCGGGGGCTTAACCACCCTGCGATGAGACCCCAGTGAGTAGGAGGGTACGGTGGTGCGCGTCGAAGTGTTTGGCGCAAGCGGCATGGAGCCGCCACTGGCACAGATCTTGGTGGTAGTAGCAAATATTCGAACGAGCTCTTGGATGACTGAAGTGGAGAAGGGTTTCGTGTCAACAGCAGTTGAACACGAGTTAGCCAATCCTAAGCCGCATGGGAATCCAGTCGTAACCCATCAGTCGGCGAAAGGGAATCCGGTTACCATTCCGGAGCCTGTTGAGTACCCGTTTGCGCCACCTAGTAGGGTTTAGCTCGTCCGCACCCGAACGGTTAGTGTGTAGCTTCATGGCAACATGAATCCTTTTCTTCGAGAAGCCAACGAGAGGCATCGGAAGAGTTTTCTTTTCTGTTTTACAGCCACACCGACCATGGAAGTCACTCACAGAGAGATATGGTTGGACCGGTCTGGTAGAGCACGGCCGCCGCAACTGCCGTGTCGATGCACTCTTCTTGGACCGTGAAAATCGAAGACTGGGGCACACTTTATATGGTAATAACGCACACTCTCAACAGATTGTACCGAATCCGCAGCAGGTCTCCAAGGTGCAGAGTCTCTAGTCGATAGATCAATGTAGGTAAGGGAAGTCGGCAAACTGGATCCGTAACTTCGGGACAAGGATTGGCTCTGAAGGCTGGGTGCGACCAGCCGGGACCGGTGCTCCACCTGCCGCAAGGTAGGCTGGCCCGTGCCCGCGGTCGCACAGCAAACAGCCAATTCAGAACTGGCACGGCTGAGGGAATCCGACTGTCTAATTAAAACAAAGCATTGTGATGGCCCCGGGTGGGTGTTGACACAATGTGATTTCTGCCCAGTGCTCTGAATGTCAACGTGAAGAAATTCAAGCAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCTCTGTCCCTATCTACTATCTAGCGAAACCACAGCCAAGGGAACGGGCTTGGATGCACTAGCGGGGAAAGAAGACCCTGTTGAGCTGACTCTAGTCTGGCATTGTAAGGCGATATAGGAGGTGCAGCATAGGTGGGAGGGCTTCCTCGTGGAGCTCGCCTCTGAGATACCACCACTCTTACTGTTGCCTTACTTACATGATTGGGTGGAACAAGCGCGGGCCCCAGGTCCGGATCGTGCGCGCACCTCCTCCGGGGGGCTGTGGCGGCGGTTCGCCTGCGCGCGCCCAATGCGCCGTGTTTCTCGCTCAGCGTCCAGTGTGTCGCTGGGTGGTGCCGCCGGGGAGACTGCATCGTAGCATCGTCGTGTGTAGCGTGTTACCCGCTTGTCCGACCGTGAGCCGTGGCCCGCAAGGGTACAAGCTTGCGTACGTCGGTGCATTCGTGGTGCACTGCTTCTGCGCGGTCGATCGTTTATGATGTCACGTTTGCCCCCGGTTCCGCGCGCCGCCCGGCTCGAAGACTCCTGGACAGGTCCTTTCGGTCCACGTCATGGACAGTGCCAGGTGCGGAGTTTGACTGGGGCGGTACATCTCCAAAACGATAACGGAGGTGTCCAAAGGTCAGCTCAGTGTGGACAGAAACCACACGCTGAGCATAAGGACAAAAGCTGGCTTGATCCCAACGTTCAGTACACTTCGGGACAGCGAAAGCTTGGCCTTACGATCCTTTTGGTTATAACGAGTTTTTAGCAAGAGGTG
TCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCCGCCAAGCGTTCATAGCGACGTGGCT\n>LCGI01000002.1/5713-5334 Parcubacteria bacterium GW2011_GWA1_43_27 UV92_C0002, whole genome shotgun sequence. \nACGTCAACCCAGGTGATTGCTCCGTATTTTACGGAGAGGAAAGTCCGAACACCACAGTGTTCCCGCTAATTTAAGGGAAGGGTAACTCCTAATTGGAGCCGTTGATCCGAGTAATCGGATCGCAGGACAAGTACAACAGAAAACAAACCCACTTTAATAAAATCATTGAAGATAGGGGTGAAACGGTGAGGTAAGAGCTCACCAGTATCTATGGCAACATTGATGGCTAGGTAAACTCTACCCGGTGCAATACCAAGTAGGTCCGCATCTTGGCGGACGGGTTGGTAGCTTGAATCCTGGTGCGAATCAGGATCTAGATAGATAATCACCGCCCTGCCTCGCGCAGGGTACAGAATTCGGCTTATAAGGTTGAGGTGAGC\n>JPVT01000244.1/2256-2451 Tetragenococcus muriaticus 3MR10-3 WGS_Sequence244_061, whole genome shotgun sequence. \nATATCAATACACAGAAAACCTAGTACATGATTTTGACCTTTCAGAGAGCTGATGTTTGCTGTGAATCAGTAGGAAAAATGATGGAATCCAGTTTTTAATGTTTCTTTTAATAAAGAACCTATACTCTTTGGTTACAAGAGACAAGTGCGGTTAATAACCGAACTTGGGTGGCACCGCGAACTATTTCGTCCCAAGC\n>MHLL01000003.1/8974-8834 Candidatus Lloydbacteria bacterium RIFCSPHIGHO2_02_FULL_50_13 rifcsphigho2_02_scaffold_10435, whole genome shotgun sequence. \nAGTTTATCGCGAGTGCGGGGGAGGGAATTGGCCCTAGAATCCCGCCGGCAACCATTCTGAATGACTCCTACGGTTTTGGAGAACCGTAAGAACTTCAAAAAAGAGGTGCCAAATCCAAACCCTTAAGGGGAAAGATGAAAT\n>ALAR01193235.1/10683-11037 Tupaia chinensis contig193235, whole genome shotgun sequence. \nGAATATGAGGGCAATCTGGCTATGATAACTGTCATCTCGTTGATGGCCAGGGTTGGTTCCTCTGATCGGGCAGGCTGGATGGATATCCTCTTCTTCCCTCACTTCTCCATACATTTCCTTTCCCAAACTGTGTATCCAAAGAAGATGGCCTTTTCAGGTATACAAGGCCCATTGTTGGGCTGAGCTGCTTGGGTAGCTCAGCCCAAGAATGTGTTCCTCAACCAGAACCTCTGAACAGACTCTTCTACTTAGTACTACCTTTACTCACTCTTGTTTTTTATTCTGTAAAGGAATATTCTATGCTATTTCTTGTATATAGAAAATTTCCACAGCATCATTTGGTGGCATGATAGTG\n>ANKR01173204.1/1886-2165 Myotis brandtii contig173204, whole genome shotgun sequence. 
\nACCGGGCGTGGTGGCGCGCGCCTGTACTCCCAGCTACTCGGGAGGCTGAGGCTGGAGGATCGCTTGAGCCCAGGAGTAGGGCTGTAGTGCGCTATGCCGATTGGGTGTCCACACAAAGTTCGGCATCAATATGGTGACCTCCCGGGAGCGGGGGGCCACCAGGTTGCCTAAGGAGGGGTGAACCGGCCCAGGTCGGAGACGGAGCAGGTCAAAGCTCCCGTGCTGATCAGTAGCGGGAAACCTGGAACCCTTCACTTGCAGGCCAATGCTCTATCCTCTG\n>BA000039.2/281279-281411 Thermosynechococcus elongatus BP-1 DNA, complete genome. \nGACAACTCAAGACTAAAACCGAAGACCGCAGGGGTCTGGCTGAGACATAATCTTCCTGCCGAGGTTTGCGAAGTCCATCCGTTGCGATTGGGCGATCGCCCCGGCACCCTTGCTGGGGTTTTTCTTTCACTGA\n>ALWT01112214.1/10402-10542 Myotis davidii contig112214, whole genome shotgun sequence. \nAGCTTTGCGCAGTGGCAGTATCGTAGCCAATGAGGTTTATCTGAGGCGCGATTATTGCTAATTGAAAGAAAAAAAGAAAAGAAAAGAGGGAGATGACTGGCGGTGGCCATCGCCCTGCCCACTGGTCACCCCACAGATGGG\n>MHQJ01000053.1/3212-2967 Candidatus Sungbacteria bacterium RIFCSPHIGHO2_02_FULL_49_12 rifcsphigho2_02_scaffold_96412, whole genome shotgun sequence. \nNNNNNNNNNNAGAAGCAATTCTCTTGTAACAAACTTGGCTATATGCTGGAAAACCCGCGCATGCAGAAGTACTTAAGTACTGTACAGTACTTAAGTGACAATCTTCTGCCGATGCGGACAATCAGCAGGCAACCTATAAGTTCAATAGACCAGTCTATCGAATTCATAGAGAGTCCCCAGAGACTATACGCCGAGCCCCCAAGTTTTGGGGTGATGATATAGTCCATGCCTTATGGCGACATAGGG\n>DS989904.1/4377794-4377629 Synechococcus sp. PCC 7335 scf_1103496006895 genomic scaffold, whole genome shotgun sequence. \nTTGTGTCGCTATGCGCCGTGCTAGGCTAGGTAGCCTGCATGGGGAAAGTTCGGTGAAAAACCGGCGCTGTCCCGCAACTGTGATGGCAATCTCTAACAAAGTTTCTTCAATATAGTTGCTTTCTTTTGCCTGAGCCAGAATGCCTGTGCGGGTTTTCGCTACACTC\n>AFTD01105653.1/47017-47121 Cricetulus griseus cell line CHO-K1, whole genome shotgun sequence. \nGGCTTGTTTGAAGGTAGTGAGTTATGTATTGCTCAAAGGCAGTTGCATATTAGACCCCTTTTCTATACTTTCTCCTGTCACACTATCACACCTGACAAGTTTAAA\n>MGYS01000080.1/2479-2377 Gammaproteobacteria bacterium RIFCSPLOWO2_02_FULL_57_10 rifcsplowo2_02_scaffold_5319, whole genome shotgun sequence. \nTAACTCAACAACCAACGTCGCACATACACCGTCACATGTGTTTTGGGTGCCTTGAAATCCTCGCGGATTCGGGGTTAAACCATGGGGTGTGTGGAGGCTTAAC\n>CP003219.1/1938094-1938153 Streptomyces cattleya DSM 46488, complete genome. 
\nCGCCCGGTACGGACCCGTGGGGGGATCCGCTTCCGGGGCACGGGGGCGCCCCGCTCCGGA\n>LJYW01000001.1/1800734-1800628 Prosthecomicrobium hirschii strain 16 C1, whole genome shotgun sequence. \nTGCCAGTCCGAGGGGTGCTCCTGTGGGAGCTGAGATGGCGCTGCGGCGTCGGACCCTTTGAACCTGATCCGGGTCATGCCGGCGAAGGGACGGGATCAACCGGCTTT\n>JH932293.1/704875-704772 Bergeyella zoohelcum ATCC 43767 genomic scaffold supercont1.1, whole genome shotgun sequence. \nCGAGATATAAGCATTTTTTATCAATTATAAAAGTACCATTTTTTACCACATTGCCTAAAAATAAAACACCCCAAACCATCGTTTGGGGTGTTTTTATTAATCTA\n>GL541731.1/40376-40515 Microbotryum lychnidis-dioicae p1A1 Lamole unplaced genomic scaffold supercont1.89, whole genome shotgun sequence. \nTCAGTCTCTCTTCTGGACTGAGCTTAATCGGCATGCGTCTCTGGTAACGGGGGGGTATGAAGCCCGAGGATAACGTAGCCTCTTTAGCTTTTTACTCCTTTATTTTCGAAAATAAAGGCCAAAAGAAAAAAAAAGGGAGG\n>LHUR01000022.1/308140-307852 Clostridium homopropionicum DSM 5847 CLHOM_contig000031, whole genome shotgun sequence. \nAAATATATTAAAGCGCCAGAGCTAAGCAGGGAGCCTGAATCAAAGATTGTCTTATAGGAAACTCAAACTAAGGTCTGAGTAAGCTCGAATAAGCCAAATTAGCACTCTGTGTAAGTGACTTGCACCAAATCATAGATTTGGGCAATCTACTTAAGATTTGGATTCTCGCTTAGCTGACGAGGGTGGGGAGTATCGAAAATTCGGCGGATGCCCCACGGTATAGTGCTACCGATAAAGACTGGCAAAACTGAAAAGTAATTTTCAGTACAAATTCAGTCAGGCACTCACA\n>CP008889.1/1694819-1694882 Dermacoccus nishinomiyaensis strain M25, complete genome. \nGGAATGCCGGTGCGAATCCGGCAGCGGTCCCGCCACTGTGATCCCCGACGGGGTAAGCCAGGAC\n>HF993839.1/17775-17516 Clostridium sp. CAG:127 genomic scaffold, scf188 \nTAGTAGTTCGATGGACTGAGAAGTGAAGAACGAGGAGTTGGTTATGAATCTGGTAAAAGGAACAAGGATGTTGCGGAAGGATAATAACCCATATGGGGCACAGCCCNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNGTGAACACGAAAGTGGCTTGCCTGCAATTCCCATGTGTACGGGCGATAGAGGGGTTCGGATGAACCAGAGTACACCTACA\n>CAJW010074381.1/2720-1779 Hordeum vulgare subsp. 
vulgare, WGS project CAJW01000000 data, contig: morex_contig_74381 \nATGGGGCACGTGGAATCCCGTGTGAATCAGNNNNNNNCACCTTGCAAGGCTAAATACTCCTAGGTGACCGATAGCGAAGTAGTACCGTGAGGGAAAGGTGAAAAAACCAAGTGGGTAATAAAAAACATCGTGAAACCTTGTCGAGCTCCCAAGCAGTGGGAGGGGAAAGTGATCGCTGACCGCGTGCGTGTTGAAGAATGAGCCGACGATTCATATGCAATGGCTTGGTTAAGGGAACGAAACCCACCAGAGTCATAGTGAAAGAAAGTCTTAATAGGGCGATTGTCACTTCTTATGGACCCAAACCCCTGTGGTCTATCCATGACCAGGATGAAGGTTGGACGAAACTAAGCAGAGGACTGAACCAACTGATGTTGAGTAATCAGCGGATGAGTTGTGGTGAGGGTTGAAATGCCACTCGAACCCAGAGCTAGATGGTTCTCCTCGAAATGTGTTGAGGCGCAACAGTTGACTGAACATCTAGGGGTAAAGCACTGTTTCGGTGCGGGCTAAACGATCGGTGCCAAATCGAGGCAAACTCTGAATACTAGATATGACCCAAAAATAACAGGGGTCGAGTCGGCCTGTGAGACGATGGGGAATAAGCTTCGTCGTCGAGAGGGAAACNNNNNNGATCACCAGCTAAGACCCCTAAATGAACGATTAGTGATAAGTAAGGTGGGGGGGGGGGGCAAAGACAGCCATTAGGTTTGCCTAGAAGCAGCCACCCTTTAAAGAGTGCGTAATAGCTCACGGATCGAGCACCATCGTGCTGAAGGTAAACAGGGATAAGCAAGGTGCCTAAGCTATGAGATGTCAAAATGCATTGGTAGGGGAGCGTTCCGTCTTAGAGGGAAGCAACCTCTTTCCTAAATATGTATCGGTTATATTTCATGGTCGAGGCTCATTTTTCTATTGTTTTACCATACATGGTTTGTTTCT\n>FKLB01000042.1/73555-73404 Pseudomonas sp. 1 R 17 genome assembly PSEFL294_LIB5394, contig: PSEFL294_LIB5394_000042 \nATCCTTCCCAAGTGCCTGCTGACGTTGTCAGCAACATGCTCAGGGCAGCTTTGATCTAGAAAGCTGCAACGTACATACCGTACGCCGATCACCACCCAACCGCTAAAGCATTCAATTTGTGGTCACACGTCAGCGTTATCGACGTGGAATGC\n>CM001665.1/38959911-38959726 Nomascus leucogenys chromosome 19, whole genome shotgun sequence. \nATTGCTTCTTGGCCTTTTGGCTAAGATCAAGTGTAGAAATCCATGAACACTAAAGGACTGCATTGACTTTTTCAGAGAGTAGAAAACAACTTAGTTTTTTTTTTTCCTGAATGCGTCATAGGCTTGTGAGTGATTTTTGTCCATTCAATTGTGCCTTCTTTGTATTACAATAAGATGGGGGTACTT\n>CP011568.2/2789266-2789207 Pandoraea thiooxydans strain DSM 25325, complete genome. \nTGTCTCCTCCACCTCCTCCTGGTGGATTTTATGGCCAGCAGATTGCTGGCCATTTTTTTT\n>ARZA01000139.1/3294-3076 Caldisalinibacter kiritimatiensis strain L21-TH-D2 NODE_28, whole genome shotgun sequence. 
\nATATAAGCTGTGAAAGGTAATAGTAGATATTTAAGGCTTACAGAGAGGAAATCCTAGGCTGAGAGATTTCTAGCCCTCTGAATATTGAACCCGGCCTGGAGCTTCTAGACTGAAAAAAAGTAAGTTTAGACGGTGTTAGCCGTTATAAAATTAAGTGAGCCAATGAAATGTATTAATTGGTTAAATAGGGTGGTACCGCGGATAAACTTCGTCCCTTTT\n>CAGP01000005.1/749-1 Helicobacter bizzozeronii CCUG 35545, WGS project CAGP01000000 data, contig: tsc_c98 \nCTACTACTACACCGATAGCGCACAAGTACCGTGAGGGAAAGGTGAAAAGAACCGTGGGTAACGGAGTGAAATAGAACCTGAAACCATCTACTTACAATCATTCAGAGCACCATAGTGAATCCCCCTGAGGAATTGCGGGGGGGGGCTGTATATAACACTTATACGCCCTCTCCTCCTCCATGATTTCTCGATATCTTTTTTGGTAAGGAGTTTTCATGAAACCCCAAGACAATGCGTCAAACATGCAAAACCCGAATCGTGGGACTAGCGGGACAAATAGGCAATACGACCAAAATCAGGGGAATAGGGGAAGCCAACTAAACCCTAACAACCCCAACAACAGGAAATAGGTAAGGAGAGGTCTCATGGGAAGAGGACAACCAGATAACGACCCTAACGAAGCAGGCTATCCTTCCACGACAGGTAACCCAAGCGGTGGCGGTCGTGGCAATGATGACCCTGATGACGATTAGGTCTAACTAGGTCTCAAACAAGGAGGGGAAAAACTTCAATTCTTCAGTGGGATTCACTGGTGTGATGGACTGCCTTTTGCATAATGATCCTGCGAGTTGTGGTGTCTGGCAAGGTTAAGTGAAAACGAGCCGTAGCGAAAGCGAGTCTGAATAGGGCTATTTAGTCAGACGCTGCAGACCCGAAGCCAAGTGATCTATCCATGGCCAAGTTGAAACGAGTGTAACAGCTTGTGGAGGACTGAACCCGTGCCCATTGAAACGGGCTGGGATGAGCTG\n>BDFN01001244.1/2524-2921 Ipomoea nil DNA, scaffold: scaffold1244, cultivar: Tokyo-kokei standard. \nATTCAAATGAGAACCCGAAGGCCGGTTCAGGGAAAGGTTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGGGTCGGGGGCGCGCCCGACAGACAGCGCGTTTTGCGCGTGGCCGAAAGGGAATGAGAATAATTCGAGGGCGTTCGACCCGATGTTCTAATCATTGGCTTTACCCGAGAGACGGCGCGGCGCTCAAGAGTTGAGGGAAACTTCGGAGGAACCCCCCTGGAAACGGCTCAGCCGGAGGTAGGGTCCAGCGGCTGGAAGAGCACCACACGTCGCGTGGTGTCCGGTGCGCCCCCGGCGGCCCTTGAAAATCCGGAGGACCGAGTGCCGTCCACGTTCGGTCGTACTCGGTCCCGCAGGTATCCTGGTGAACAGCCTTGGTG\n>JH815222.1/1813753-1813619 Clostridium sp. 7_2_43FAA genomic scaffold supercont2.3, whole genome shotgun sequence. \nATTGTTAAGAAGAAACAAAGCCGTTTCTCACCTTACGGCAGAGCTTAGTAAGGTAGTATATTCTTATTTTAATTTATTATTTAAATTAAACGTGAGTATTATGAGGACGGCATATTGCTGTCTTTTTTATTTTGT\n>AACY023865031.1/116-206 Marine metagenome ctg_1101668672382, whole genome shotgun sequence. 
\nCTGAGTTTCTTGCTTTTCTATAAGAGCAAGTGGTGCGCTACATCCGCGTAGTTTCCTAGTTCTACACAAAAACTAGGTGGCGAGCATATTA\n>ANKR01167074.1/25401-25567 Myotis brandtii contig167074, whole genome shotgun sequence. \nATCACTTTTTGGCCTTTTGGCTAACATCAAGTGAAGCATCTGTTCTTATCAGTTTAATAAAATATTTGCTTCAGAAACTGCCACCTCTGAAGAGTCAAGCTGCCATGAAGCAGGTAAGTGCATGGAGCCACCATCAACAGCAAACTCATTTCTGGAGTGAAAGCTCA\n>MHKU01000038.1/195-563 Candidatus Liptonbacteria bacterium GWB1_49_6 gwb1_scaffold_7743, whole genome shotgun sequence. \nTTGGCAATTCAGATGATCGCTCTTTATCGCAAGATAAAGGGAGGAAAGTCGGGACACCCTGAGCCGAAAGGTTTATAAAAAAGTAGCGGCTAACAGCCGTCGTCCGCAAGGACAGAGGTGCGAGCAGTGACGCTCCGACGCGAAAGTATCGGAGGGACCCTATCCCAAGCTAGAAGGTCCAACTCCGCGATAGGGATAAGAAAGCGGAGGTGAAACGGCTAAATCCTTACTGGGTGCAAGACCGTACTCCAATGCGGAGCATTGGTTTGTGTCGCTTGAGCCCGCGAGCAATCAAGGGCCCAGATAAATGATCGCCGCCGCCGATAACAATCGGTGTGCACAGAATCCCGCTTACGAATTGCCGCAAAC\n>MHXM01000167.1/11573-11672 Desulfuromonadaceae bacterium GWC2_58_13 gwc2_scaffold_6790, whole genome shotgun sequence. \nCTTTGCTCAGAGCAAACCACGGGAAACCGTGGGGCGCAGAGCCACGGGACTTCCGGTTTGCAGGCAGGAACCTGCGACCAAAGTCAGCCGGGCCGCCAGA\n>AAPU01011573.1/516306-516391 Drosophila mojavensis strain TSC#15081-1352.22 Ctg01_11574, whole genome shotgun sequence. \nATATTTTCTAATGATGATAACTACATAGCAAATCAGAGCAATAATGTTGAAATTTACAGACAATGCACTACCATCTGATTGCTATA\n>KB916025.1/11687-8703 Neofusicoccum parvum UCRNP2 chromosome Unknown NP2_03_scaffold_387, whole genome shotgun sequence. 
\nCCTGGAGATAGAGTGCACTTCTAGGGTATAATCTTCACAAAACCCCCCCTTGGTTCTAACCAAGGCAGTTGGTTCTACTAAACTCTTAGAGAAATTATATTAATAAACGAAGTGAATTGAAATATCTTAGTAACTTCAGGAAAATAAATCAAACGAGATTCTATGATTAGTGTGAACGAAAGTAGAAAAGCCTAAATATTAAGCAAGTAAAATGGATTAATCTGTTTGAATATAGGGGAACCTTCCTCTAAGGCTAAATATGATATATAAGCGATAGTGAATGAGTACCGTGAGGGAAATGTTTTGAAATAGTAGTTTTATAAGCAGCTCGAGTGAAGTTTAAATAAAAAACAAGAGCGTACCTTTTGTATAATGGGTCAGCAAGTTAATATTAGATGCGAGCATAGCACTATGCCTAGATAAACCGATTATGAAATAATGAATAAGTATCTAGTATTAGACCCGAAGCCTAGTGATCTTACCATAATCAGGATTATAAAAGTCCGAACGGGTTATCGTTGTAAAGATATCCGAAGAATTGTGGTAAGTTAGTGAAAGACAAAACTGACTAGGATAGCTGGTAAAAATTAGTGTGAGCTACTAATTAGGCCAGTAAGTAGAAGTGAACCTTCTGCTATAGACCATCAAATTGACGGGAAAGCCCTAAAGCAAATTCAACCAAACAAATGTGGTAACACATTTGTGGCGCAGGTAATGACTCGCGGTAAGGTAACATCGAAATTGATAGCGAAAGTGAATGGGTAATCCGCAGCCAAGCACCTTATGGGTGTGCAGTTCATCGACTAAATGTTGGTTGGCGCAAGCTTAAGATATAGTCAAGCCTCATCCAAAAGGATGCAGAATAATAAAATACTTTTTTTATTTAATTTTCCGCCTTTAAGGCACATATCTAATCCTTTATTACCTTCAAATAGACTTAGGTTGTACCTTTTGTATAATAGGTAAACAATCCTAAAGGAAAACATATCTTCTAATGTTTTACATTAGAGGTATGAATCCGAATCTTTTTTTTTAATAGCCGATAAACTATCACAAGTAAATACTAATACAGAATTAGAATATGCAAGTTTAACTGATGCAGCTAAGGCTATAGCTGTTAGTAGAACAGCTGTAAAAAAAGCTCTTGACACAGGTAGAACTGTAAAAGGATAATATATAGTAGCCACAAAAAATTAAATAAAAAAAGTATTTTATTATTTGTAAATGGATAGCTAATAGCTATTTAGGGAGAAGGACCTCAGCTCGGCCCTTTAAAGTTTTATTCATATTCACAATAAAAAAAATAAAGGCTAAAGATGGTCATATCTGTTTCCGCGAAACCTATATAAGTAGGTAATTCAAGTAACATCTTAGCAGGTACAGAACTGTGATCTCAGGTAAAATTATATTATTTTAGAAATCTAAAATAATAATTTTGCATACATCGGGGGATCGTGAAGATTTTATCGGTGAGTATTTGCTCTCGGAAGGGCAAAGATGATTATTGAATAATCAGACATAGTACGATAAGGTTGTATGTCTAAAGGGAAACAGCCCAGAACAAGTGTTTAAGGTTCCAAAATTATTGTTAAGTGAAATTAAGGAAGTATTTTTCAAATACAACCAGGAAATAGGCTTAGAAGCGGCCATTTTTTGAAGACCTCGTAACAGAGCACTGGTTCAATTATAAATTAATATAAATTTATACAAGTTAAAAGCGCCAAAAATATAACGGATCTAAAACAATATACCGAAACCTTGTCCATATTTATAAATATATAGGAAGTTAAAGATCTGGGTGAAATCTTTATTTTTTTTTTTGAAATAAAGATTTCACTTTTTATAGTAATAATAATAATTAACAAATCTTTAAGCTTCATGCTTCAATATGTAGCAAAGATATTGTATTTATGGGGTAGCGGAACGTTGGGGAAATCTTAGATTTTTACTTTTTAAGTAAAAAAATTAGATAACCCAAGTGAGAATGCTGACATGAGT
AACGAAAAAGGGGAATACCCTCGCCTTAAGCTTATGGAATTTCTTTAAAGTAACGGCCTCTAAGTTTACAGACCTGTCCTAAAGGATTAAACGATGAGAAAATCTTCCTTATGTATGACAACCTTAGAATAATAGTTAATCTGTTTAATAGATAAGAAGATTTTGTATTAACAGTTAATGCATTTGAAGATTTTGTATTAACACTGTTAATGCATTTGAAGGTCATGTTAAATGCGCCATGATATATCAAATCTGGTCTACTAACCAGATTTGATATACCGACCAGTAAAGCTGGATACTCTGTCACTGCTTGCCACAGGGCCTATGATCGTTGCAGGCCTACTGGTTCTTATTTTTTAGTATTGAATTATATGGCAAGTATTTTCAGTATATCCCTTTTCCCTGCAGAGGAAATATCCCCTCTAAAGGAAACTTAGGGAAATAAACTGTATAGTAACAAAGGATGCTAGACAGATATTAAATAGATTAATAGTTGAGAGTACTAAGCGTTCTGGAAAAAGACATAAGGGTAAAACCGTACCTAGAAACTACCACCAGTAAGCAAGTAGAGAATACGAAGGCGTTTGAGCTAACAATCATTAAGGAACTCGGCAAATTGACTCCGTAACTGCGGGATAAGGAGTGCCATTCTAACTGGATAATATCAGATTTAGAAGAGGAGGCACAGAATGGTGTTGTACGACTGTTTAATTAAAACACAGCACTTTGCGTAAGATGACAAATCGAAGTATAAAGTGTGCCGTCTGCCCGATGATGGATGGTTAACGAATTTATTTAGCTGACTAAAATAGGTTAGGTTTTGAAGGAACCCCCATTCAATGGCGGCCTTATCTATAAGGGTCCTAAGGTAGCGGAATACCTTGGCCGTTAAATGCGGTCTTTGCATGTTTTCTCTTTAGTTTAGGTAACTAAAGTAAAGGATTAACCAATAAAAAAAAATAAATAAGGGAGAAATCTCTCCAAGCC\n>LJSX01000001.1/215848-215664 Rhizobiales bacterium HL-109 ITZY_scaf_5, whole genome shotgun sequence. \nTGGCCCCTTGCCGTGGTCGGCGCCCTTTCGGGCCCAACAGGGAAACCGGTGCGAGACCGGTGCTGCTCCCGCAACTGTAATCGGTGAGCCCGTCCGAAAGCCACTGGTGCCCCGCGCACCGGGAAGGTGGACATCGCGGTGATGACCCGAGAGCCAGGAGACCTGCCGACGTGAAGCAACCCTGA\n>NATL01000046.1/9039-8946 Candidatus Omnitrophica bacterium 4484_70.1 ex4484_70.1_scaffold_5627, whole genome shotgun sequence. \nAGCGATAAAGCCAAACCCAGGGAAATCTGGGGGCGGAAAGCCACGGGTCCTCAAAATCAGGATTATTATTGAGGGGATAGCCGGGTTGCCGAAA\n>CP000248.1/722861-722994 Novosphingobium aromaticivorans DSM 12444, complete genome. \nCCCCAACATCGAGAGTTGGGGTGACGCTCCAACGCCAACCTGCCGTTCCGGGCAAGGTGGTACCCGATCCGCAAGGCGGCCCCGGCCGAATTGCGAAAGGGGATGTGGCCGATCCGGCAACCAAACGGACACGG\n>DS562862.1/42992321-42992756 Cavia porcellus supercont2_7 genomic scaffold, whole genome shotgun sequence. 
\nAATGGCGGTGACCTCTGGTCCCGTCTGTCTCGTTTGTTCAGTCGTCCGTTGGTCAGTCGGTCGGTTGTCCCCCTCCCTCTGAGACGCGAGCTCAGATCAGACGTGGTGACCGGCTGAATTTAAGCATATTAGCCACCAGAGGAAAAGAAACTAACAAGGATTCCCTCAGTAATGGCGAGTGACCAGGGAAGAGCCCGGCGCCGAATCCCCGCCCTGCGGTGGGACAGGGGAAATGTGGGGAATGGAAGACCCGCTCCCTGGCGACACTTGTGGGAGGCCCAAGTCTTTCTGATTGAGGCAAAGCCCATGAACGGTGTGAGGCTGGGAGCGGCCCCCTGCGTGCTGTGTTCGGGGGAATCACGAGATGGATACTTAAATACCATAAGGGAAAGTTGTAAAGAACTTTGGAGAGAGTTCAAGTGGGCTTGAAACTGTT\n>CAFZ01000031.1/6993-6912 Piriformospora indica DSM 11827, WGS project CAFZ01000000 data, contig: PIRI_contig_0034 \nCCACTCTTAGCTCAGTTGGTAGAGCGTGCGGCTGTAATTTCCCTAAACCGCAAGGTCGCTGGCTCGAATCCGGCAGAGTGGA\n>JPZU01000001.1/1721226-1721354 Lachnospiraceae bacterium TWA4 TWA4_scaffold00001, whole genome shotgun sequence. \nACGAAACGATCAGCACCGCCGAAGACAGCAGGTGCCGTATGGCGTAAGGTGTAACGCCTGCCGAGACGATTTTAAGGAATGCCTTATATACCTCTCTGTCTTTGGATAGAGAGGTTTTGTTTATATACA\n>LQBR01000004.1/128232-128109 Microbulbifer sp. ZGT114 ZB100003, whole genome shotgun sequence. \nTAGCTGGTCTGTAAATATGCACGGGCCAGCCGAATCTTCAAAGCATATTACGACGAGGTAATTCGTTATGGCACTGACTGCAAATGAAAAAGCAGCCATCCTCAAAGAGCACGGCCAGTCTGAA\n>CP009505.1/1989432-1989301 Methanosarcina sp. MTP4, complete genome. \nCGGTTGCTTGCAAGCGGACCTCGAAGCCTCATTTCACACACACACACGAGAATCACAACGATTACTCTAGATGGATAGGTTCATCCCTTCTTCCTGTCCGTTCCGTTCGCTTGTGAGTACCACCCCATCATA\n>CP021112.1/3034288-3034406 Pseudorhodoplanes sinuspersici strain RIPI110, complete genome. \nTTTTATTTCGTGGACGCTTCTCATCGTAGGAAGGCGCATCGCTGGGGGTGGTTGAAACCACCTATGCCGGGCGATGCGCTGTTCAGGGGGCCTCACGGGCCCTTTTTTCTTTTCCCGGA\n>AYZV02091783.1/3282-3039 Spinacia oleracea cultivar SynViroflay scaffold22748.con0008.1, whole genome shotgun sequence. \nAGTAGAGTAAGAGAGCTTCCTTCAGCCCACTCATGGATGGAAAAAAGGGGTATTGAATTATCTGCCGACTCATTCATTCAAACACTGAGTAGAACAAACAAGGAATGTACAACACGCATGCGTACAGGGGGTGCAAGTGCAAGTGCAAGTGCAAGTGCTACTGTGATTGCGTGAATGATGCGGGAGATGATTTCATCCTTGTCTCTCCGTGCTTGGACTGAAGGGAGCTCCCTTTCTCTATTCC\n>URS0000D6BD70_684738/1-44 Lactococcus lactis subsp. 
lactis KF147 DUF1646 RNA \nGGTTGGGCGCAAGCTTCAAGACATATCTCCAAGGGTGAGGAGAT\n>ASAF01269073.1/1229-1323 Nicotiana sylvestris Nsyl_contig269073, whole genome shotgun sequence. \nCGGAGCCGTATGAGGCGGAAGTCTCACGTATGGTTCTCTAAGAAGGGAGTGACTACCTACAGGAGCTTCGACCAAGCACCACCGGTCAATTCCGC\n>JNGA01002875.1/199-1 Arabis alpina cultivar Pajares Aa.chr2_contig_422, whole genome shotgun sequence. \nCGACGGATCGCATGGCCTTTGTGCTGGCGACGCATCATTCAAATTTCTGCCCTATCAACTTTCGATGGTAGGATAGTGGCCTACCATGGTGGTAACGGGTGACGGAGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCTGACACGG\n>FP929041.1/559079-558959 Eubacterium cylindroides T2-87 draft genome. \nATAATGAGACTCCTGTCCAGCCACAGTCCGAGCGTGATATGCCCTGCTTCAGGGTGATGCCGTCGCAGGCAATGGGGGCAGCCGATTTGTAGAGATCCTACCGGGGGTGCAATTCCCGTGG\n>CM001383.3/68159736-68159614 Felis catus isolate Cinnamon breed Abyssinian chromosome B3, whole genome shotgun sequence. \nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGTAGTATTGTTATAAGTCAAAATTTAGAAGAGTAAATCACATTCAAGCAAAAAGAAGCAAAAATAGATCTTGCTTCATAGATCTACACAAA\n>AACT01034500.1/16165-16123 Ciona savignyi cont_34500, whole genome shotgun sequence. \nGACTTCGAATCAGAAGATGAGGGTTCGAGTCCCTCTGTGGTCT\n>CP003005.1/936847-936934 Myceliophthora thermophila ATCC 42464 chromosome 4, complete sequence. \nGGCCGTGTGGTGTAGTGGTAGCATACTTGCTTTGGGTCGTGAGATTTCAATCTGCAAGTGGTCCCAGGTTCAAGCCCTGGCTCGGCCC\n>MCOG01000628.1/21312-21242 Neocallimastix californiae strain G1 LY90scaffold_628, whole genome shotgun sequence. \nGGAGGGTTGGCGCAATGGTAGCGCGTCCCCTCCAGAGCGGAAGGTTGGGTGTTCGAATCACTCACTCTCCA\n>KB319013.1/681-1 Rhizoctonia solani AG-1 IA unplaced genomic scaffold scaffold1318, whole genome shotgun sequence. 
\nGCAGCTCGAAAGCCGCATTTGCTCGCCACGCACGTGCCGATTTACTCGGCGTCTCGCGAGCGGGCTAAGGTCTGAGCATTCTAGTCCCCTTGTACGTGTGTCTAGCCGGCACCGGCTCCAACAGGGCCGAGCAGAGTATCAGACATGCGCTCGGTGCTGCTTGTTCCGCCCAGAGACCCGCAAGGGGAGGGCACAGCAGCACGTGAGCTTGGAACAACTCTGCGGGGACAGAGCCGTCTACTTGCCTCCCCGTCCCGAGTCTCTTTTTGTCCTCTTTCCCACCCGTGCGCTAGCCTCGAGAACTAGCGCCCAGTTTTTTCAGAGACTGAGCATCATGCATCTGACTCTTCCCTCGCTCCGCAAGGCACGGAGCAGTGTACGGCCTGGGTTGGCTTCTGGGCGCCGATCGAACCTGGGGATCTCACATCGCTACGACTGGCGCGGCAGCGCTGAGCACTGGGACTCCCCATGCCCGGCAAAATGCTCCGCGTACAGGTAACGAGCTCTTGTTTTCCTTTTATTTCCTGGATATTCCTGGAGAGGCCACGCTGGTGGTTCGATTGGTTGCGGTGATCGAGGAGGACGATCGGTCTTGGACGGGGAACGGGCGGCTCTTGAGTTCACTTTGCGGCTCGCAGTCATTCGCTTTGGCGATTGCGAAACTCGATTCAGACTACTCTT\n>AFSB01087678.1/359-79 Heterocephalus glaber contig87678, whole genome shotgun sequence. \nGAATGTGAGGGCAATCTGGATGTAACATGTTACCCCATTGATGGCCAGGGTTGATTCAGCTGTATGGCTGGTAGGCAGGTGTCCCCTTCCTCCCTCACTGCTCCAGGCGCGACCCTCCCTAAGCTTCGAGCACAGTTAAAGAGGATGACCACTGTTTCCTTGGTCAAGGGTTTACAAGTAGCTGTGCTCCCCTGCTAGAACCTCCAAACAAGCTCTCAAGATTTAAAAACTAAAAGGAGAATGGGAGTTGGGATATAGCTCAGTGCAAAGGCCCAAGATTT\n>MKUQ01000060.1/39144-39044 Burkholderiales bacterium 70-64 SCNpilot_expt_1000_bf_scaffold_93, whole genome shotgun sequence. \nCGATCTGCTCCGGGGTGCGCAGCACGCTGAGACGGGCCCAGGCCTGAACCCGAGAACTTGATCCGGTTAGGACCGGCGAAAGAAGAGCGATCCGTCGCCCC\n>CM007893.1/130149511-130149874 Helianthus annuus linkage group 4, whole genome shotgun sequence. \nTGTGTCGTAGACTAAGCGTGCATGACGGATGAGTCGTGCAGGCCGCCTTGAAGTACAATTCCCATCAAGCGATGGGTAGAATCCTTTGCAGACGGGTGACGGGATAGAATCCCCTATCAACTTTCGACGGTAGGATAGTGGCCTACTATGGTGGTGACGGGTGACGGAGATTTAGGGTTCGATTTCGAAGAGGGAGCCTGAGAAACGGCTACCACATCCTAGAAAGGCAGCAGGCGTGCAAATTACCCAATCCTGACACGAGGAGTTAGTGACAATAAATAACAATACCAGGATCAAACGAGTCTGGTAATTGGAATGAGTACAGTCTAAATCCCTTAACAAGGATCCATTGGAATAAACCATA\n>AFEY01266293.1/3612-2555 Sarcophilus harrisii ctg7180002245042, whole genome shotgun sequence. 
\nCCACATTCAGGGCCCCAGGTGGGGCAAGATGGCAGCCGAGGTTACACCCAGAGAGTCTTTAGAAATTCAATAGTAAGATATGATCAATTATCCAAAAGGCAATTGGATGGAAGAAGGAGATTATACAATCAATCAGCCAAAGGGCAATCAGAAGGTAAAAGGGGATTGAAATTAGGAAAAACAGAGTTGTATGCAGTAGAGACTACTGAGATATCATCCCCTGGAGAGGTGAAATCTGTTCCTGTCCAGCTTATAGATCCCTTGCCTCCAGGCACAGTAGGCTTGACCATTTCACCTCCTGAGGGTGCTTACAAAACAGTGGCCATGGACATCGGAATCCTCTAAGGAGTGTCTAACAACTCACCTGCCGAATCAACTAGCCCTGAAAATGGATGGCACTGGAGCATTGGGCCCATACCTGGCCGTCGCTGGCAATGGGCACAAAGCAGGAACAGAAACGTGTTGTTTCCTGAGAACAGATTCCGCACAAGGGAGGAAGGCACGAACTCACTCCTCAGGGGCTAGGCCACGATGAGTAGGAGGGCTGCTGCGGTGGGCCTGGAAGCCTAGGGCATGGGCCCAGGTGGAGCTGCCGCAGGTGTAGATCTTGGTGGTAGTAGCAAATATTCAAACGAGAACTTTGAAGGCTGAGGTGGAGAAGGGTTCCATGTGAACAGCAGTTGAACATGGGTCAGTCAGTCCTGAGAGATAGGCAAGCGCCATTCCAAAGGGACAGGCAATGGTCTCTGTTGCTCTCAGCTGATCGAAAGGGAGTAGCGTTCAGATCCCAGAATCTGGAGTGGCAGAGATGGGCCCTGTGAGGCATCCAGTGCAGTAACGTGCCTGATCCCAGAAAAGCCGGCTGGAGCCCCGGGGGAGAGTTCTCTTTTCTTTGTGAAGGGCAGGGCTGCCCTAGAATGGATTTGCCCTGAGAGTGGGCTTGTGGGCTTCTATATCTCCCAGAGTGCTCCTGGCTCTCAGTCTCCCAGAGTGCTCCTCTCTGACTCTTGTTGATGTTTCGAAGTAACTAACCCAAAGCTAAGAGCCTCTTTATACAT\n>LGSR01000020.1/1425329-1425226 Escovopsis weberi scaffold00001, whole genome shotgun sequence. \nGGCAGAGTGGCCGAGTGGTTAAGGCGATGGTCTTGAATCGTGGGTTCCCATGATAAAGCCAACCATTACGTTCGCGTGCGTAGGTTCGAATCCTGCCTCTGTCG\n>JENH01053621.1/966-1 Agrilus planipennis Contig53639, whole genome shotgun sequence. 
\nTTTAGTATAAATACTCTGTAAATATTGAAATAAAATTAGTCTAACACCAGGCTCACTCTTATTCTGATGCTGATAAAGTGTCAACCCTTGGGATCCTCAAAGATGCAGATAATGTATCCAACGGTATTACTAAATCGGTTCTTCTCAGAACCCCAACTTTGATAGTCACATCTCTCATCATATACGACTACAGAGAGTGGCTACAGTTGTATCATTTATTACTATTTATTATTTTAACGATTGACCATCTCAGGCTAGACCTTTTTCATCTAATAGCTTGACTCTGTGATATAAGAGTTGTGATATTTATGTGTGTGCGCCGTCCTAGTTTATTATTTTAGGTGACAGCTAGTAACCGATACCAGTGATGCGAGTCCTGGGTTTCAGTCCTGTGTGACGTGGGCCGACTCAGGGCGGCGAAGCGGTTGCTTAACGGCGTCCCAGACGTCTCCGGCGAATTCCGCTTTCTCAGCCAGAGAACTTCGCTTAACGATTTTTCCAAGGCCCGTATATGCCGATACTCCCTTTGAACAGGTCAAGTTTGACAGGTTTCCTCGGGCCAGGAGTCGTTAGTTCTATTGGGGGCGAGACTTAGATGACTCTACAAGGCATCGCTTTGGTACTCGAGGCGAAGCAGATGAGCCAAAGCTACTCGGCAAGGCTCATCGGAGCCGGGGTGCCGAATTAGGGCTTATGCTTGTCTAAGCCCTGTGGCAATCACGCCAGACCACCGTGGAAAGTGTGAGATCGCGGTCTCATAGAAATAGCCAAAAGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACCAGATTCTCTGTGACCCTACCCACTATCTAGCGAAACCACTGCCAAGGGAACGGGCTTGGAAAAATTAGCGGGGAAAGAAGATCCTGTTGAGCTTGACTCTAGTCTGGCACCGTAAGGAGACATGAGAGGTGTAGCATAAGTGGGAGACGGTA\n>AAPU01006125.1/5918-6168 Drosophila mojavensis strain TSC#15081-1352.22 Ctg01_6126, whole genome shotgun sequence. \nGGTCCATCAGGATAAGGATTGGCTCTGAAGATTGAGATAGTCGCGCTTGATTGGGAAACAATAACATGGTTTATGTGCTCTCTAAATAGAGATCTATCATTTTATGGTAGTTTCTAGTTCCCCGGATAGTTTAGTTACGTAGCCAATTGTGGAACTTTCTTGCTAAAATTTTTAAGAATACTAGCCGGGCAACCGATTAGTTCTTTTAAATTATAACGATTATCAATTAACAATCAATTCAGAACTGGCAC\n>LBPO01000002.1/47954-48343 Parcubacteria (Magasanikbacteria) bacterium GW2011_GWC2_34_16 UR53_C0002, whole genome shotgun sequence. 
\nGGTTGTTGGTGGATGATCGCTTTGCCTGTAAAGGCGGGGAGGAAAGTCCGAACACGCCTCTAGCGAAAGCTAGAAAGGATAGCGGGTAACGCCCGCCTGGAGCAATCCACGAGGTGCGAGCAGAGACGTCTAGGCTTGAAAAGGTCTAGAGAGCTAAACCCTGTATTCTTGATTAATCAGGAATAATAGCTTAATCCTGGCCATAGGGAAATAAGGTCAGGGGTGAAACGGCTAAATCCTTATCTGCGTGCAAGAGCAATGTTTCCTGTTGTTTAGACGGGATTCAGAAAGTTAGCTCGCTTTGATTCTAATGGAAACATTAGAACTAGATAAATGATCGTCGCCCAATTTATTGGGATACAAAATTCGGCTTATAGCCAACAATACCCT\n>CM000856.1/137442353-137442632 Callithrix jacchus chromosome 1, whole genome shotgun sequence \nGTCAGGTATGATGGCGCATGCCTGCAGTCCCAGCTACTTGGGAGGCTGAGGCAGGAGGAGTACTTGATCCCAGGAGTTCTGGGCTGTAGTGTAGTATAGCACTGCACTAAGTATCTGCACTAAGTTCTGCATCAATCAGGTTGCCTAAGGATGGTTGAACTAACCCAGGTGGAAACTGGAGCAGGTCAAAACTTCAGTGCAGTGCTGATCGGCAGCAGGATCTCACCTGTAAGTAGTCACGGCCCTCCAGCCTGGGCAACATAATGAGATCCCATCTCTA\n>CP009129.1/1068541-1068746 Planococcus sp. PAMC 21323, complete genome. \nTTAATGACAGCGAAGAGGACTAGTAGTTTGTGTATTTTCCACAGAGAGCCGGCGTTTGGTGCAAGCCGGTAAAATGCGCAACCGAACTCACCTTGGAGTCAGTGTATGTGAAACTAAGTAAGATACACCGTTTTCCGCGTTAAGGAGTCAAGTTGAGCGAGCAGTCGCTAATTTGGGTGGTACCGCGGGAAAATCCCGTCCCTTAT\n>JTDY01000669.1/96851-97292 Operophtera brumata OBRU01_Sc00669, whole genome shotgun sequence. 
\nGGTCATTATCACCACAATAGATGGCGCTGTTTGCAACTTTATACCAGGCTATACCTATATATATACATATCGACTTTGTTTTATAACTCAAGAAGTGGGCCGACAATTTTACTTTGAACAAATTAGAGTGCTCAAAGCGGGCTCAAAATGCTGCTTGAATATTTCGTGCATGGAATAATAGAATATGATCTCGGTTTTATTTTGTTGGTTTTCAGAACTCCGAGGTAATGATTAATAGGGATAACTGGGGGCATTCGTATTGCGATGTTAGAGGTGAAATTCTTGGATCGTCGCAAGACGAACATCAGCGAAAGGTGTTTTCATCAATCAAGAACGAAAGTTAGAAGTACGAAGGCGATTAGATACCACCCTAGTTCTAACCGTAAATATGTCATCTAGCGATAAAATTGACGCAATTTTGAAAAAAGAAATGAATCTTTAT\n>FRBH01000005.1/40291-40383 Chishuiella changwenlii strain DSM 27989 genome assembly, contig: Ga0131172_105 \nAAGTAGCGACAGGGATTGACGTGAAAATCCTTTTTACAACTGAGATTCTCTCGAAGTTTAGTAAAAAGATTGTAACAAAAAGCCCGCTCGGTC\n>FQWL01000004.1/126785-126917 Spongiibacterium flavum strain DSM 22638 genome assembly, contig: Ga0070522_104 \nTGGTTATCGAGAAAGGCGGAGGGACTAGACCCTGTGAAGCCTTAGCAACCCTTAGCACATCCCATCATCTGGGATTCTGAGAAGGTGCTACATTCTACCTAACATCGGTACATGATGATGGGATGGATAACGA\n>KQ758491.1/45269-45062 Bacillus enclensis strain SGD-1123 genomic scaffold Scaffold10, whole genome shotgun sequence. \nGGATATTCAATGATGAAGAGAGTAATTCCCGCGTGGATCTAAAAGCGAACCAGGGACGGTGCAAGCCTGGTGTGAAACCCGGAATGAAGCGCACTTCTGAGAAGTCTTTCCCCAAATTTCAGTAGGGAAAGACCGGGTAAAACCGTTAATTTATGAGCGCCCTTTCTGGGAATAAGAGTGGTACCGCGAGTCAAAACTCGTCTCTACA\n>AHIQ01000233.1/47283-47180 Brettanomyces bruxellensis AWRI1499 AWRI1499_contig2762_scaffold53, whole genome shotgun sequence. \nAAACCTAAARATGATGATTGAGAATTAACGCATAGTTCAACTGRTATCTATGAAGAAAATATTTCCATCAATATAGTCTTTCACCCCTATCTGATTTTAGGCTT\n>URS0000D685E2_12908/1-80 unclassified sequences type-P1 twister ribozyme \nAUGUUAAUGCGACCUAGUUACUGGUAACCGUAAUACCUAGUGCUAGAGGGUGGCAAGUCCCUUUAACGCAGAGUCGACAU\n>CM000801.1/33200308-33200628 Oryctolagus cuniculus chromosome 12, whole genome shotgun sequence. 
\nGTTAGCTCGGGCCGGGAGGAGCCGCCACCGCCGCCGCCGGAGGAGGAGGGGGAGGAGGAAGGAGAGAAGGAAGAGGAGAGGGGGCCGCGGTGACGACTCGGCGCCGGGGAGCCGGGCTCATGGACGGGTGAGGCGGCCGTGTGCGCAGACAGTGCTCCAGCCGCGCGCGCGCCCCAGGCCCTGGCCCGGGCCTCGGCTCCGGGAGCAAGAGGAGCTCGCGGAGGCGCCGAGGAGAGCGGGCCGTCCCGCAGCCCGAGCAGGAGAGGGAGCGCGAGCCGCGCCGGCCCCGGCCGGGCCTCCGAAACCATGAACTTTCTGCTT\n>KB456266.1/1688805-1688699 Sphaerulina musiva SO2202 unplaced genomic scaffold SEPMUscaffold_7, whole genome shotgun sequence. \nGCCCGCTTAGCTCAGGGGTAGAGCGCATCACTCGTATACCTGGATGGCTGTAAATCACCTGGTTTGGTGGGATGATGAGGTCATTAGTTCGATTCTGATAGTGGGCT\n>CM001381.3/152175418-152175578 Felis catus isolate Cinnamon breed Abyssinian chromosome B1, whole genome shotgun sequence. \nATCGCTTCTTGGCCTTTTGGCTAAGATCAAGTGTAATATTAAAAGTTAATATTTCTGTAGTGCTTCCATTGCACAAGGTACTATTCTAAGTATTTTACATATATTGACATATTTACATTTCTAAAAACCTTAAAAGGTAGTCACCTTTTAAGGAAAGTATT\n>AASG02000564.1/14627-14791 Ricinus communis cultivar Hale ctg_1100012361959, whole genome shotgun sequence. \nGCCTTGGTGGTGAAATGGTAGACACGCGAGACTCAAAATCTCGTGCTAAAGAGCGTGGAGTCCTCGGGTAGTCTCCTCTATAAAGGCATTCCAGCTTCAGAGGTAGGTGAGCCAGGTCAGGAAGGAGTTTGACTGCTGGGATAGGATCGGATCCTATTCGAAGCA\n>AZIM01000830.1/116066-116143 Ophiophagus hannah scaffold831.1, whole genome shotgun sequence. \nCGATCTGGCTGCGACATGTGTCACCCCATTGATCGCCAGGGTTGATTTGGCTGATCTGGCTCCATGTACATCCCTCCT\n>MUXU01000055.1/10129-9985 Moraxella caviae strain CCUG 355 355T_ctg_0000055, whole genome shotgun sequence. 
\nATTTGCTTGACGGAGTGCGGTTTGAGACCGCTGAGATTGCGTCTTTGGTGGGTGCGCCATTGGTGTTCCACATGAAACTTATAACGCAAAATCCGTTGAACCTGAACAGGTTAGTCCCTGCGTAGGAATCAAGCACGTCCGCCAT\n>FQTY01000030.1/12262-12128 Tissierella praeacuta DSM 18095 genome assembly, contig: EK13DRAFT_scaffold00030.30 \nTGTTAATTAAATAGATTGCCGTAGACAGTAGGTACCTTAAGGTTTAATTTCCTACCGAGGTTGAGATTAATCTAATTTATAAAATTGAAATTAGGATCTCTCTGTGTCTACGGAGGGATCTTTATTTATTCGTCC\n>JH835452.1/508250-508573 Erinaceus europaeus unplaced genomic scaffold scaffold00164, whole genome shotgun sequence \nGGATGTGAGGGAGATCTGGCTGCAACATCTGTCACCCCATTGATCAACAGGGTTGATTCCTCTCATCTGCCTGGCTAGGGGGGTGTCCCTTCCTCCTGCACTGGCAGTGTGTCACTAACAAAGCTGCGGGCTCTGTTGAAGAGGACGGCCTTCCCGGAACAGAGACGGCTAGGTCTTCGGTTGAGGGCATATGAGTAGCTGCTCTCCCTTGCTAGAACCTCCAATAAAGCTCTCAAAATGTGTTCAAAATATTTTCGGATTACAAACAGAATTACTCTTCACTAGCAGACACGCAAAGACAATACATTATAGGAATTTCGTTGT\n>HE999757.2/3449466-3449336 Carnobacterium maltaromaticum LMA28 complete genome \nTTAGGTTAATAAATATTACCGAAGACAGTAGGTGGCGTAAGCCTTAAAATACCTGCCGAGGATGAATATATGTGAAAGCATACAACTATCCCTCTATGTCTAAGGTGACATGGGGCTTTTTGCTTTGAATC\n>KZ114138.1/13605-9139 Helianthus annuus unplaced genomic scaffold HanXRQChr00c0817, whole genome shotgun sequence. 
\nGCCCAGTCTTTCAGATGGGCTTGGCCCATTTCTGTAAAACGTATTTATACGTAAATGCACGTAACCGGCTGTCATTCTTCAACCCTAGCTCCTTGTGTGTGTGACGGCAGACCCTCACATCCGAAGCCAAATCCCTTTTGTTGATCATCCTTAATCTCGGTTAGTATCTGATATCGTATTACTTTTAATTGATTGCTGGAATGATTGATGTTAATTAGTGTGCTAACCGGCCGGACGTGGCTGTTGATCGGCCGGATACGGTTGATAACTGGCCGGACTTGTAATCATTAACCGATCGGATGTTGTTAACCGGGTATTGCTTATATGATAATCGAATAGTTGTTCGGATTCGTTATATGATGTTTGATTGTTAGTATGTTCATTCAAGATTTCGGTATGTGTTCATATGTTATGTTAATAAGGTTCGATAATGTGACATACTATGTTAATCGGCTTGGTGTACGCATAAATTAGGGATCACGATGGGTATTAGTATTATGATGATTGCATGATGATTTGATGATGATCCTATGATTGCTGCATGATTGTTGTTTGATCGATAATGTTGTTGACGGCTGTTAGCATGTTTAGGGTTTCTGAAATTGTAACTGTTGTTGACGTAACTGATATGTGTCGAAAGATACTTGTAGTCGAAACATAGTTGTCGAAACATAGTTGTAACCGAAAGATATCTGTTGACCGAAGGATAGATTTGACCGAAACATAATTAGGTTGACCGAAAGATGCCATTTGGTCGAAAGATGACTGGTGGTTCGAAACATAACAACCAGTCCGAAAGATAACTGTGAAAACTTGTAAGTGTCGAAAGATTACTGATGTGTCGAAAGTTAACAGTGGATCGAAGGATAGTGGCAATTATAAACATCCTTCGAAGGATGGAATGTATACATGAACTATTTGACATGCCATGCTTGATGATGAATGTTTACATTTGTAATTGTGTGCACTAGCTGATGAGTAACTAGGAAATGGTACGTGTTGCGCCGATGTACAAACTGACTGTTACGTGAACATTATATTGCATGCGAATCATTGTGAACATGAACTGATTTGTTATACATGCATACAATAGGACGTGATTAATTACTTGTGAGTACATAACCTAGCATACCGAGCAAACCAAGGTGAGTTCACACTCTTACTAAGGCATGGGATTCCCGGGTTGTGGGAATGGGTTAAAGGCTTGATGATAAACTAATAACGTACATACACTACGCTTTTCCTAGACTATCACCTATCATAGTCCTCGGATGTCAGGACGGTTCCGTAGGTTGGAAAACACCTACGTGGTTCCGTAGGTTGGGATAACACCTACGTGGTCAGATGCCAATTACTATCCTCGATACAAAGGATACGCACGTAAGACATACGTGTACGCATTACTTACTTCTTCCGTAGGTTGGGATAACACCTACGTGGTCATATGCAAATTACTATCCTCGATACAAAGGATACGCACGTAAGACATACGTGTACGCATTACTTACTTCTTCCGTAGGTTGGGATAACACCTACGTGGTCATAATACGAATAGTCTAGTGGTCACTTAACATGGGAAGCCCCCACCTGTATAACTTACTATTGGCCCGGTAGAGCCACCCGTTACTTACTATTACGCATTTACGTACTGTGAACTCGCTCAACTATTTTGTTGATCCTTTCTTTTACATGCCTTGCAGATCGTTAGGTACTGGGAGCTTGCACTGGAGGCGCGGACGTTGTGGACTTGGATCGTGAACATCATATGGAACCCATATGATACTTGATACACTTTTACATTGGATATTTTTATATATACGCTTCCGCTAAACATTGATAACTGGCTTATGTTTTGGAAACACCTTTCATATGGATTTGTTCTGAATTATACTGCAATTACTTTTACTTTATACAATGTTCTATATGATTGGTGGCTTGGTCCTGGTCAGTCACGCTCCCAAGCGGTGATACTCCGCGTGTGGATTTTGGGGGTGTGAC
ACAACGGGTGAGTAAACCCGCAAGGCGCAAGGAAGCTGATTGGCGGGATCCCCCTCGTGGGGTGCACCGCCGACCGACCTTGATCTTCTGAGAAGGGTTCGAGTGTGAGCATGCCTGTCGGGACCCGAAAGATGGTGAACTATGCCTGAGCGGGGCGAAGCCAGAGGAAACTCTGGTGGAGGCCCGCAGCGATACTGACGTGCAAATCGTTCGTCTGACTTGGGTATAGGGGCGAAAGACTAATCGAACCGTCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGAGCCCGGGTGCGAGTTCTATCGGGTAAAGCGAATGATTAGAGGCATCGGGGGCGCAACGCCCTCGACCTATTCTCAAACTTTAAATAGGTAGGACGGCGCGGCTGCTTTGTTGAGCCGCGCCACGGAATCGAGAGCTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGGAAGCCGGGTTACGGTGCCAAACTGCGCGCTAACCTAGAACCCACAAAGGGTGTTGGTCGATTAAGACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTTAAGCGCGCGACCTACACCCGGCCGTCGAGGCAAGTGCCAGGCCCCGATGAGTAGGAGGGCGCGGCGGTCGCTGCAAAACCTTGGGCGTGAGCCCGGGCGGAGCGGCCGTCGGTGCGGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGGCCGAAGAGGGGAAAGGTTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGAGACGGGGGAAGCCCGTCAGATAGCGTGTTTCACGCGAGCTTCGAAAGGGAATCGGGTTAAAATTCCTGAACCGGGACGTGGCGGCTGACGGCAACGTTAGGGATTCCGGAGACGTCGGCGGGGGCCTCGGGAAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCCTGGAAACGACTCAGTCGGAGGTAGGGTCCAGCGGCTGGAAGAGCACCGCACGTCGCGCGGTGTCCGGTGCGCCCCCGGCGGCCCTTGAAAATCCGGAGGACCGAGTGCCTCCCACGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGGTGAACAGCCTCTGGTCGATGGAACAATGTAGGCAAGGGAAGTCGGCAAAATGGATCCGTAACCTCGGGAAAAGGATTGGCTCTGAGGGCTGGGCACGGGGGTCCCTGTCCCGAACCCGTCGGCTGTCGGTGGACTGCTCGAGCTGCTTCCGCGGCGAGAGCGGGTCACCGCGTGCCGGCCGGGGGACGGACTGGGAACGGCCTCTTCGGGGGCCTTCCCCGGGCGTCGAACAGCCAACTCAGAACTGGTACGGACAAGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGTCCCTGCGGATGCTAACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTGTCTACTATCCAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGTATAAGTGGGAGCCCTCGGGCGAAAGTGAAATACCACTACTTTTAACGTTATTTTACTTATTCCGTGAATCGGAAGCGGGGCAACGCCCCTCTTTTTGGACCCAAGGCCCGCCTCGGCGGGTCGATCCGGGCGGAAGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCT
CGTGTAGAACAGAAGGGTAAAAGCTCGTTTGATTCTGATTTCCAGTACGAATACGAACCGTGAAAGCGTGGCCTAACGATCCTTTAGACCTTCGGAATTTGAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGATAGTGTCGCAATAGTAATTCAACCTAGTACGAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTGCGCTGGATTATGACTGAACGCCTCTAAGTCAGAATCCGGGCTAGAAGCGACGCGTGT\n>FR881992.1/3645-4018 Firmicutes bacterium CAG:238 genomic scaffold, scf351 \nGGGGATGTAAAGGTTTCGACGGGGGTGTAGAAGCCGGATAAGCGAGCGGTAGTTGGCTCAGACTACCTTAAAAAGGGCCCGTTAAATATAAACGCTAAAAATAACAACAATTTCGCATTAGCAGCATAGTTCTGCAGCGCCTAAGGCGCGACGCGCGTCGGCCACAGCTCACCCGTAGGCTGTGATACCGGCGTCGACTATACGGGAAAACCTGCAGGGAGTTCTCGGTACCTCGCAGGGAACAACGAGATAGCCGACATGGCAGCATGTTAATGGGCGGCCACGGAGGCGAAATTTTAAAACATTGACTGCGCTCGGAGAAAGTCCTGTGGAAATGCTTTCGGACGCGAGTTCGACTCTCGCCATCTCCACCA\n>AWUE01008835.1/507-1 Corchorus olitorius cultivar O-4 contig08862, whole genome shotgun sequence. \nCAATAAGCAAAATAAGGGCGCACGGGGGATGCCTGTGGCTCTCAGAGGCGAAGAAGGACGTGATAAGCTGCGATAAGCTTCGGGGACTGGCACACACAGATTGATCCGAAGATTTCCGAATGGGGCAACCCGGTATGTTGAAGACATATCACACCGATAGGTGAGCAAACCCGCTGAACTGAAACATCTAAGTAGGCGGAGGAAGAGAAAACAAAAGTGATTCCGTAAGTAGTGGCGAGCGAAAGCGGATTAGCCCAAACCAGAGTTGTTACGGCAATTTTGGGGTTGTAGGACTGCGAGATTTCATGCAAAGGGAACTGGAATTAACTGGAAAGTTAAGCCATAGAGGGTGATAGCCCCGTATAGGTAACCGATGTAATGGATAGCAGTATCCTGAGTAGGGCGGGGCACGTGAAACCCTGTCTGAATCCGGCGGGACCATCCGCCAAGGCTAAATACTCCTGAGAGACCGATAGTGAACCAGTACCGTGAGGGAAAGGTGAAAAG\n>URS0000D6AF63_12908/1-91 unclassified sequences DUF3800-VII RNA \nGGCAGGCAAGCGCTAGGGGTATCCCCGAGTTACCTTCGGGCAGCAGCTGTCGGTGAGACAGTGGTACAGGGGCCTAGGGGTCTGCCGCTCT\n>LL014082.1/6803-6907 Trichobilharzia regenti genome assembly, scaffold: TRE_scaffold0014079 \nTCCAAGTGCTCTGAATGTCAAAGTGAAGAAATTCAATCAAGCGTGGGTAAACGGCGAGGGTAACTATGACACACCGTCGAAAAATTAGTTCATCCTTCTAATGAA\n>BAUT01000003.1/65796-65988 Bacillus wakoensis JCM 9140 DNA, contig:contig_3. 
\nTTGAATATCGAGCAAATAGGTTTTTAGGAACGTTTCGTTCTAAACTAAGAGGGAAGTTGGTGCAAGTCCAACACGGTCCCGCCACTGTAAACGATGAGGAAGATTAGTATCGTCCACTGTGCGAGTTAGCATGGGAAGGATAATCGACAATGATTCGTAAGTCAGGAGACCTGCCTATTTGTCTTTAAGCTTC\n>AF221911.1/108-513 Chelydra serpentina telomerase RNA gene, sequence. \nTGCGGCGGCAGGTGGGGGCTCAGTCTTTCTAACCCTAAGCGAAATGTGACCCCTCCCCGCTGCAGCCGTCCGCTGTTTTACTCGCTGACTTTCAGCGGACGGGGGGAGCGGGTGGAGACGCCAACCAAAAAACGTCAGCGAGGGGCCCTCCCCTCCCACGCCGACCTGGGCCTGTGGTGGGGCCCGCCAGCGAAGTCCCCGCCGCCCCGCCCCGGTGAGGCCGCGGTCAGCCGGCTCGCGCCACTGCTGCCGCGAAGAGTTCGTCTCTGTCAGCCTCGGGGGCGGCCGGGGTGGAAGGGCGGGTCCCGAGCCCGTCGGCCGGGAGAGCAAACGTGAGCGGCAGCCCCTGCGCCACCGCCCTCCCCTAAGCTGTGGGGCCCGCGGTCGGGGCTGCGCTCAGACACGC\n>AFSB01201159.1/18941-18806 Heterocephalus glaber contig201159, whole genome shotgun sequence. \nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGTAAAGATGTTGATATCTGATTTTAATTTTTAAAAATTCATTTATCTATTTTATTAGTACATGTTTCCAGTACGTAATGATTACATTTATCACAGGGAGTTACT\n>AFSB01036238.1/931-791 Heterocephalus glaber contig36238, whole genome shotgun sequence. \nTTAATGGCTTTGAGGCTATCTCATTTTCATTATACCAGAAGCACAACTGATTAGATACAATCAGCAACACCATAGCATTAAGTACATCTTAGAAAATGACAATTTGTAGTAGTTATTAATCTATCACCTTTAACTCTGTGA\n>MFMU01000019.1/4604-5929 Candidatus Kaiserbacteria bacterium RIFOXYD1_FULL_47_14 rifoxyd1_full_scaffold_6810, whole genome shotgun sequence. 
\nCATGAGAGACATAAGAGTACACGGTGGATGCCTTGGCCTAGGACGGCTAAGAAGGACGCGACTAACCTGCGAAAAGCTTCGGGGAGGCGGTTTGTAGCCTTTGATCCGGAGATATCCGAATGGGGAAACCCTCCAATTTTAAATTGGAATCCGCGGGGTAACGCCTGCGTGAAGCGAACCCGGGGAAGTGAAACATCTCAGTACCCGGAGGAAAAGAGAACAATATGAGTTGCGTTCCGTCGGCGCGTATGTTCGTGCTGATGGAACGCAACTCGCGTGATACCCTGAATAGCGGCGAGCGAAAAGGGAAAAGCCCAAACCTCATTTTTCGAAATGGGGGGTTGTAAGATATGAACGGCGTACTTGTACGCGAAGAGTTATCAATCGTCTTTATAGCAGAAGCTGCTGGGNNNNNNNNAGGTGAAAAGAACCCCGAGAGGGGAGTGAAATAGAACTGAAACCGTGTACTTACAAGGGGTCGGAGCGGTGAGTTTATTCGAACCGTGACGGCATGCCTATTGAAGAATGAGCCGGCGAGTGTGTGTATCTTGCGCAGCTAAGCCCTTACGGGGCGGAGCTTTAGGGAAACCGAGTGTGAATAGCGCGTCTGTAGGATACATACGACCCGAAGCCAGATGAGCTTGCCATGAGCAGGGTGAAGTTTGTCGAAAGACAAATGGAGGCCCGAACCCGTAGGTCGTACAACGCCTTGGGATGACTTGTGGTAAGGAGTGAAAAGCTAATCGAATCTGGGAATAGCTGGTTCTCTCCGAAACAGCTTTTGGGCTGGCGTTGCCATATCGCGTGCGTGGGGGTAGAGCACTGGAAGGGACCAACAGGGAGAAATCTCGTGGTTCCTATCAAACTCCGAATACCATGCACTCGGGCAGCAGTTAGAAGGTGGGGGCGAAGCTCCATCGATCGAGAGGGGAAGAGCCCAGATCGCCAATTAAGGCCCCAAAATCGACGCTCAGTACATCACAAGGAAGTGAGGACTCATAGACAGTGAGGATGTTGGCTTAGAAGCAGCCACCATTCAAAGAAAGCGTAACAGCTCACTCATCGAGAGTCCTTGCGCCGAAGATGATCGGGGTTAAGCGTCGTGCCGAAATTGCGGGTTTAATCCGTATTTATATAGATTAAGCGGTAGGAGAGCGTTCTGTTCGCGATGAAGCTTAAGGGGTAACCCATGGTGGAGCGTACAGAAGTGAGAATGCCGGTACAAGTAACCACAATGCGGGTGAGAACCCCGCACATCGAAAGACCAAGGTTTCCTCAGCTATGGTGATCAACTGAGGGTTAGTCGGGCCTAAGGGGATGGCGAGA\n>CM008309.1/24191905-24191844 Astyanax mexicanus chromosome 10, whole genome shotgun sequence. \nGATTATGATTGTGCAAGCAACTCTAGTGTATATACACTAGAGTTGCCTGCACAGTCAGAATC\n>LODT01000020.1/379504-379185 Dictyostelium lacteum strain TK GAOABQK02G6SYV, whole genome shotgun sequence. 
\nTTGTGTTACGTGAAGAATTGATCATAGAAGCCAACAAAACGCCTAGTTGCTCTGTCAACTATAAAACAACCAGATTTTCAAATCAAAATGCTTTTGGAAAAGTCCCCAGACCCTAGAACAGAAAGTGTTGCCCGTTAAGGTTATGATCAAGTTTTAGTTCACTCGACAGAGAAGGTATAAGATTCAAGTTTAAGTATTTGTGCTCTCTACCCGAGTCATTGGTGAAATTACTTGGTCACTGGTCACAGTAAAAGTAATATGAAATTAAGAATTTTAAATAAATATTCTCTACAAAATGGGGCTTACTCTCAACGTACACC\n>DS562862.1/33829905-33829809 Cavia porcellus supercont2_7 genomic scaffold, whole genome shotgun sequence. \nTGTGAGGGTGCCCTGGCTAGGACTGCTGTCCACCACTGAGCCCCAGGGTTGATTGGGTTGATCTAGTTGGGAGGGTGTCCCCTTCCTCCCTCATCAA\n>CM002922.1/12055086-12055241 Cucumis sativus cultivar 9930 chromosome 1, whole genome shotgun sequence. \nGTTTGTATTCTTCCACAGCTTTCTTGAACTGCATCCCTTTCCTGAACTCAATTCGCTCTTAATTTCCCCTTTCTCGATCTCTCTCGATCGATCTCAAAGCGTTTTTTGTTCATCAATTTTGTTGCGGTTCAATAAAGCTGTGGGAAGATACAGTCA\n>CAJI01053789.1/175-1 Cucumis melo, WGS project CAJI01000000 data, contig: 53789 \nAATTAGCAAGGACCACCTTGCAAGCCTCTGACGGGGCTCCTGACTGACCTATAGTGAAGTAGTACCGTGAGGGAAGGGTGAAAAGAACCCCCATCGGGGAGTGAAATAGAAGATGAAACCATCAGTTTCCAAGTAGTGGGAGGAGACCAGGACTCTGACCGCGTACCTATTGAAG\n>AEAQ01060326.1/1-120 Solenopsis invicta Si_gnG.contig39779, whole genome shotgun sequence. \nATGAAGAACGCAGCTAATTGCGCGTCAACTTGTGAACTGCAGGACACATGAACATCGACATTTTGATCGCACTTTGCGGTCCACGTATACAATTCCCGGACCACGCATGGTTGAGCGTCG\n>ADWL01010905.1/30966-31223 Oryza glaberrima chromosome 5 Oglab05_0141_29, whole genome shotgun sequence. 
\nGTGCCATGCATCTCTCTTATCAAGTTATTTCTGACAGCGGGGAATTCATTGACTGACTTGGCCTTGATTGATGATCCATCAACTCGTGGCTTTGCGCAGTGGGGAATTTTCCGCAATGGGCGAAAGCCTGACGGAGCAATGCCGCGTGGAGGTGGAAGGCCCACGGGTCGTCAACTTCTTTTCTCGGAGAAGAAACAATGACGGTATCTGAGGAATAAGCATCGGTAGTCTCGCCCTGCTTCAAAACTACAGGGCGCA\n>LN554852.1/2943365-2943181 Moritella viscosa genome assembly, chromosome: 1 \nCTCCTAAGTAGAGGTGCGCAATTCATAAGTAGTGTTATTTAGGTAGCTCCAATAATAACAACACAAAAGGGAATTGCGCCGAAGAATGAATTTTAAGCTAAAAAAATTCATTCTGGTGATGTGTTCGAATAGAGACATCACTGTCATAGTCAATTTTATATTAACTATGGGGCGCTACTAAATAG\n>KB706892.1/31142-31033 Eutypa lata UCREL1 unplaced genomic scaffold EL1_03_scaffold_1554, whole genome shotgun sequence. \nTGGGAGTGGGACTATGTAACGAACAGCCCTCTTGCCTTTTACCAGATGGCTCCTTGCATAGCCCAAAATACTCCATTCCCTTAATCTTTGGAACCACTTCTCTGGAGCAT\n>AEXM01000026.1/37053-36910 Anaerococcus prevotii ACS-065-V-Col13 contig00011, whole genome shotgun sequence. \nAAAAACAAAGAAGCGCCAGATCCCTAGTGGATGACGAGGAAGACAGTTATCGAAAGTTCGGCGGGAGCTGTCTGGGTTCACAGCCCTAGTATTAGACAAAACATTTGAGCAATCAGATGGACAGAGAAGATACAGTGGCCTCAT\n>BARX01000002.1/207412-207105 Agarivorans albus MKT 106 DNA, contig: contig00002. 
\nTAGATTCCGTATAGTTGTTTGTGCACGGAGGCACTGACGTTTATCAGGATGAGAAACGTAGCAGGAGCTAAAAAGGAACAGCTACAGGAAGTAGCAAGGGACACCTCCTAGGAAGGAGACGTGCAACTGGTATGGATGACCGGTTATGCCATAGAAGGCTAAAGGACAGCTCAAAGGATTTGAGAAAAGGATAACTACAGGACGTAGTAACACAGTCAAAAAGGATTGCAGGGAGCAACTACCCGTTCACGGATTTGAGCGATATGACTACTAGGGGCGACACGAAAGTGTCGCCCCGACCTTTTTCT\n>FR853096.2/50293108-50292759 Gorilla gorilla gorilla genomic chromosome, chr3, whole genome shotgun sequence \nGCTGGGTGTGGTGGCACGTGCCTGTAGTCCCAGCTACTCGGGAGGCAGAGGCAGGAGAATTGTTTGAACCCGGGAGGCGGAGGTTGCAGTGAGCCAAGATTGTGCCACTGCACTCCAGCCTGGCGAGAGAATGAGACTCCGTCTCAAAAAAAAAAAGAAAAAAAATGTAGGGAAGTTTATGATTTGTAAATCAAACCAGGATGCTTGAAGATGAACCTTGTGGGTTTTTTTGTTTTTGTTTTTTTTTAAGAGACGGAGTCTCGCTCTGTCACCTAGGCTGGAGTGCAGTGGCACGATCTCGGCTCACTGCAACCTCCGCCTCCCAGGTTCATGCAATTCTCCTGCCCCTC\n>MFUA01000016.1/12713-12896 Candidatus Nomurabacteria bacterium RIFCSPHIGHO2_02_FULL_37_13 rifcsphigho2_02_scaffold_5465, whole genome shotgun sequence. \nATAAGTATATACTAAAAGGGTTCATTAAAAAATCATGAAAAGTGATTGGGGAAACTGGTGACCTACCCGAAATGTTGCGCATAATGTTGCAGGCGGGGATTCCAGTACAGTGCCGCTACGGTAAGCCCACGACGTAAAAAATCGGGGACAAGTCCGAATACCAATCATTTTGTGTGTTTCCCGA\n>CP001700.1/9933843-9933644 Catenulispora acidiphila DSM 44928, complete genome. \nGTCGGGGCACCGCCGAATCCGTGTACGTCGCGGAGCCGGGGAACCAGGTTCGTCGGCGCGGCCCGCGCGGTAAGCGAGGGTGGCGCCAGTGGGGTGAATCGGTCGGCGTGCACTCGCCGTCGTGTGTGCGCGTGCGACCGTAGGGCTACTTCTTCAGTCCGAATCCGTCAGCTAACCCGGTAGGCGGACAAGGAGGAGAT\n>JH930370.1/159056-159130 Tolypothrix sp. PCC 7601 strain UTEX B 481 genomic scaffold FDUTEX481_Contig13, whole genome shotgun sequence. \nGTCCAGGTCGCCAAGTGTTTAAGGCATCGGCTTGCAACACCGACTGCTTCGTGGGTTGAAATCCCACCCTGGACT\n>FCNR01000023.1/21709-21816 Eubacteriaceae bacterium CHKCI004 isolate CHKC4 genome assembly, contig: {contig23} \nCAGCATTACTCTGGAGAGTCTTCACCGGCTTCGGCATACGGTGAAGCGCCGAAGGTGTACGGCAGATAGTTCTGCCAATCTCTCAGGCAAAAGGACAGAACACGTAAA\n>KB016992.1/120673-120603 Camelus ferus unplaced genomic scaffold scaffold726, whole genome shotgun sequence. 
\nTGGAGCAATGATGACTGCTGTGACATATGGGACCTACAGGATTAATCCCTGTCCGGAACGCTGAGGTCCAG\n>CM001006.2/22879507-22879377 Mus musculus chromosome 13, GRC primary reference assembly. \nTCTGCCCCTAGAGGCATTGTGGATGTGGCTCTTGTTCACCAGTAGGTGGCAGAGAGGAGAAAGGCTGTCTAAGCTCAGTGTTCTGACCTATGACATCTTTAACATTTCCTGAAAGAAACAAGCCTGACACC\n>CP002734.1/2242961-2242819 Pseudopropionibacterium propionicum F0230a chromosome, complete genome. \nGGCCCGCCCCACCGGGCTGGCGGCATTCAACGATGCACAGGGGAACCCGGTCGGATTCCGGGACTGACGCGCAACGGTGGGTGGACGCCTCCGAGGAGACATGCCACGAGTCCGAGCACCTTGCCAGCCCCCGTAAAGAGCCT\n>KE695978.1/687932-687680 Alligator sinensis unplaced genomic scaffold scaffold505_1, whole genome shotgun sequence \nTCAGCATCTCAGCCTTTTGGCAAAGAACAAGCAGTTTTGGCACCAAGGAGAGGGTTTCAGGGCTGGCTCTGGCCTTCCCAGTGCTGACCTGATATTGCAGTACCTCCAGGCCTGGTGCTAGTTCCCTGTGGAAGGAGGTGGGGGAAAGGTTCCCATCAGCATTTTTGGCATCAGCGGAGGGTGTTGAAGCTTGCTCCAGCTTCTCCACGTGCTGGCCTGGTATTGCAGTACCTCTAGGCCTGGTGCTTATTCC\n>LL012517.1/9492-9054 Trichobilharzia regenti genome assembly, scaffold: TRE_scaffold0012516 \nCTGGTTGATCCTACCAGTAGTCATATGCTAGTCTCAGAGATTAAGCCATGCATGTCTAAGTACATACCTTAAAACATGAAACCGCGAATGGCTCATTAAATCAGCTATGGTTCCTTAGATCATATATACTACATAGATAACTGTAGTAATTCTAGAGCTGTTACATGCAATTATGCCCTGACCCGCAAGGGAACAGGTGCATTTATTAGAACAGAACCAACCAGGGGCAGTTTCGGCTGTCTCAGTCGGCCTTGTGTCGGTTACGGATCTTTCAAATGTCTGTCCTATCAATTTGTTGGTAGGTGATCTGCCTACCATTACAATAACGGGTAACGGCGAATCAGGGTCAGACTCCGGAGAGAAGACGGCAGCAGGCGCGAAAAATACCCACTGCCAGCACGGGGAGGTAGTGAAGAAAAAATATTGTAAAGTGTAGTCG\n>NNAY01029724.1/129-174 Trichomalopsis sarcophagae strain Alberta scaffold29957, whole genome shotgun sequence. \nCCATCGGCCCTTTTCAGGGCCACAAAAACATCCATACGTATCGCAT\n>CM002290.1/17870538-17870716 Phaseolus vulgaris cultivar G19833 chromosome 3, whole genome shotgun sequence. 
\nTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGGATAAGTGGGAGCTGGAAACAACGAAAGTGAAATACCACTACTTTTAACTTTATTTTACTTGTACCGTCCCGTATCCGGGCGTTGACAAAGTCAAGGTCAAAGTCAACGTCGGGGTCAAAGTCAACATA\n>MKTJ01000058.1/456830-456745 Chloroflexi bacterium 54-19 SCNpilot_cont_500_bf_scaffold_42, whole genome shotgun sequence. \nGGGCCGGTGTCAGAGCGGTTAATGTGCCTGTGTGCTAAACAGGTGTGGCCGAAAGGCCACCGGGGGTTCGAATCCCTCCCGGTCCG\n>JH815307.1/89016-89141 Simonsiella muelleri ATCC 29453 genomic scaffold supercont1.8, whole genome shotgun sequence. \nAAACAGCATTCAGAGTTGGATTTTCCATGCCAACCTGCCAACATTCAATCATGCTGGTAAGGTGGATAACGGTTTTAAGATCGTTGATGTGGTCTATTTTTAAAATAGGCAATCATGACGAAACTC\n>HG917868.1/2308269-2308036 Clostridium bornimense replicon M2/40_rep1, complete genome, type strain M2/40T \nTAATAAGCTATGAAAAAGAAAGTAGATTTAAGGAATAAAGTAGGGAGAAAAAGCCAAAGACTGAAAGCTTTTTTATTAGGAATTAAATCGAAGTTCACTTTGGAGCTCTCTAGGGGAAGTTATAGTAGTCTAGAGCGGTATTATAAAAGCCGATATTTTTTAATGAAGTGGATAAGGGTATGGATTATGCTCTTATCAACTAGGGTGGTAACGCGGATATACTCCGTCCCTTTT\n>MNDT01000042.1/12913-12775 Archaeon 13_2_20CM_2_53_6 13_2_20cm_2_scaffold_3200, whole genome shotgun sequence. \nGGGGCCGTCGTCTAGCTTGGTCAAGGGATTAGCCCCGCCCAGAGGATACCAGAGTCCGATTATGGACGGTGACCCTGGGGCGCTGGCGACCTCGAGAAATCGAGGCCAGAGGTCGTGGGTTCAAATCCCACCGGCCCCA\n>JH210461.1/2478657-2478034 Pelodiscus sinensis unplaced genomic scaffold scaffold75, whole genome shotgun sequence. 
\nACCACTGAATTTAAGTATATTACTTGGTGGAGGAAAATAAACTAACCAGAATTCCCTCAGTAACGGTGAGTGAACAGGAAAGAGCCCAGCGCTGAATCCCCATCCCGCAGTGGGGTATGAGAAATGTGGTGTACAGAAGGCCCACTCTCCCCAGTGCCACTCTCAGGGGCCCAGGTCCTTCTGATAGAGGCACACCCTGTGGACAGTGTGAGTCCGGTAGCAGCCCCTGGCTTACTGGGACCAGGTCTTCTCGGAGTCAGGTTGCTTGGGAATGCAGCCCAAAGAGGGTGATAAACTCCATCTAAGGCTAAATACTGACATGAGACCAATAGTCAACAAGTACCATAAGGGAAAGTTGAAAAGAACTTTGAAGAGAGAGTTCAAGAGGGTGTGAAACCATTAAGGACATATAGGTGATCTAAATCTTTAATGCTTGAATTGGGTTGAATAAATGAATGGTACATTGACTAATACATAATAAAGGCATAGGAAAATGCATATTCATGCACTGAGAGTGAGACAGTCTTGTCACTTTTTATTTTCAAGATGGGAAATGCTATTCCCCTCCCTCAATTACTGGACTAATTCATACTTTTAATTAGTTTAACAATTTTTCAAAGAACT\n>JHTR01000147.1/10830-11400 Villosiclava virens strain UV-8b Sca_147, whole genome shotgun sequence. \nAAAAGCTCTTAAGGTAGCCAAGGGTAAGTCACGTGGGTATCTAGAGGTCACGTGACATTGGGCAAGTCACGTGGGATTACAGAAGGAAGACATAGGCCCACTGTCCCTATCTACTATCTAGCGAAACCACAGCCAAGGGAATGGGCTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTTTGACATTGTGAAAAGACATAGGAGGTGTAGAATAGGTGGGAGCTTCGGCGCCGGTGAAATACCACTACTCCTATTGTTTTTTTACTTATTCAATGAAGCGGGGCTGGATTTTCGTCCAACTTCTGGTATTGATTAATAGGGACAGTCGGGGGCATCAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAGGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGGGATCGGACGATGTTATTTTTTGACTCGTTCGGCACCTTACGAGAAATCAAAGTGCTTGGGCT\n>MEPC01000031.1/22924-22691 Bacteroidetes bacterium RIFCSPLOWO2_12_FULL_37_12 rifcsplowo2_12_scaffold_5312, whole genome shotgun sequence. \nCCTTTGCAGGCAATCAAAGGTGACATCCTATTTCTTTTCCAAGAAATTATTTGTCATAATAGGGAACCGGGTGAGAATCCCGGATAGTACCCGCTGCTGTAAACTCTAAAAAGTTTTATGCTTACGCTGGATGCTCAATCCGGTAGCCACTGTTAATCCTTTAATTTAAAGATAACGGGAAGGTGCAGAAAACGAGAGTAAGTCAGAAGACCTGCCTTTGAATTTATTTTTATT\n>JXRR01000017.1/5494-5709 Jeotgalibacillus campisalis strain SF-57 contig00017, whole genome shotgun sequence. 
\nCCTAATGCAATGATAAGGACCAGTAGATAATGCTGATACGAAAGAGATCGGAGTTCAGCGGCTGAAAGACTCCGACGTGCCTCACATTATTGAACCTGCCTTTGAGCGACAGGAAAACCTGTCCGTTCTCCCTCGTTACGGGTGAAGAAGAGTGCCGGATTATTCATGTTCGGCAAATTAAGGTGGTACCACGGAAGCAGCCCTTTCGTCCTTTTA\n>DS544962.1/17936-20730 Physcomitrella patens subsp. patens PHYPAscaffold_73 genomic scaffold, whole genome shotgun sequence. \nATTTAGGATTTAGGATTTGTTTAGGATTTAGGATTTAAGATCTACTTAAGGTTTAGAATTTAGGATTTTTTTAGGATTTAGAATTTAGGATTTGGCCTAAGATTAGATTAAAGTCTATTAAGGTTTTAACCAAGATTAAATTAAGACTTGGTTAAGATTTATTTAAGATATATTTTTTATTATTCTAATAATTTTTTAGGATTTCTTAGGGATTCTTTTAAGGTTTATTGTAGATTTCTTTTGATTGCTTTTAAGATTTCTTATTCTTTCTTTTATGTTTTCTTTAAGATTTCTTTTGAATTTGATTAAAGCTTATTTAACATTGTTAAGATTTAATTAGAATTTATTTAATATTCTATTAGAGTTAAGATTTTGTTATTGTAATTTCTATTCTACTTTCTACAACTATGAGCCTAGTACATTCTTTAGCAAGACTTTATGTAATATAACAATGTTTTCAAAAATCTTCATACAAATTGAATTTTCTTATCTAATATAATATCTTTAGATGGTGAACTATGCCTGAGCAGGACGAAGCTAGAGGAAACTCTAGTAGAGGCTCGTAGCGATACTGACGTGCAAATCGTTCGTCAGACTTGGGTATAGAGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGTTAGAGCTCGTATAAGAGTTTTATCAGATAAAGCGAATGATTAGAGGCATCGGGGGTGTAACACCCTCGACCTATTCTCAAACTTTAAATAGGTAAGCCGACGGGGTTGCTTGGTTGAACCCCGGCACAGAATGAGAGCTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGAAAGCCAGGTTACGGTGCCAAATTGCGCGCTAACCTAGATCCCACAAAGGGTGTTGATTGATTAAGACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGTCCCGAAAATGGATGGCGCTTAAGCACGCAACCTACACCCGGCCATTGGGGCGAGTGTGAGGCTTCAATGAGTAGGAGGGCATGGGGGTCATGGAGCAGCTTTGGATGTGAGCCCGAGTGAAATGGCCCCTAGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGACTGAAGTGGAGAAAGGTTCTATGTGAACAGCAATTGGACATGGGTTAGTCGATCCTAAGAGATGGGACAATCCTGTGTCAATGGCGCAATGTGCGTCGTGCATCGAAAGAGAATCGGGTCAATATTCCTGAATCGGGACATGGCAGTGGACGGTGACGTGGCTGAATCCTGAGACGCCGACGGGGGCCCCTGGAAGAGTTCTCTTTTCTTTTTAACAGCCCGCCCACCCTGGAATCGGATTACCCGGAGATAGGGTCCAGCGGCTGGTAAAGCACCGCACGTCTTGCGGTGTCAGGTACATCCTCGGCGGCCCTTAAAAATCAGGAGGAGCGATTATTGATCATGCTCGGTCGTACTCATAACCGCATCAAGTCTCCAAGGTGAACAGCCTCTAGTCGATAGAACAATGTAGGTAAGGGAAGTCGGCAAAACAGATCCATAACTTCGGGAAAAGGATTGGCTCTGAGGGTTGGGCC
TAGGGGTCTGTGCCTTGACCCCGTAGGCTGTCGGAGGTCTGCCCGAGCTGCTCTCGCCGCGATGGCGGACCCCTGCGTGCCGATCAGGCGACGGATACAGAATGAGGTCTAGAGGGTGGGTGACTGCCCCCCTGCCTCGCTTTTCCCTAGGCAGTGAACAACCGACTCAGAACTGGTACGGACAAGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGTTCCCACGGATGTTGACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACGAAGTGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTATCTACTATCTAACGAAACCACAGCCAAGGGAACGAGCTTGGAAAAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTAAGAGGTGTAGAATAAGTGGGAGCCCTCAAAGCGTAAGTGAAATACCACTACTTTTAACGTTATTTTACTTATTCCAAGAGGTGGAGGCGGGACTCTGTCCCTGCTTCTAGTCTTAAGGCGCGCCCCTCGGGTGCGCCGATCCAGGTGGAAGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAATGCAGGTATCCTAAGATGAATCAACGAGGACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGTTCATTTGATTTTGATTTTCAGTACGAATACAAACTGTGAAAGCATGGCCTATCGATCCTTTAGTCTTTCGAAATTTGAAGCTCATGAATATCTATAATAGTTATAAATCTATTTTTACTTCCATTAAAAGTAGCATTTACAATCTTTCCTTCTATAGACAACTCAAACAACTTCAAAAATTTAAATTAAAAGAAGATAATCTACAACCTTTAATATCAAATGAAAATTTCTACAAAGAGAGATAATCTATTTTTTTAAGAAAAAAAATAGTGTTAAAAAAACTACACTATTTATTTAAAGGTGAGTAGTCTACAACCTTCAAAATATAATAATAGAAGTAGAATAATCCACTCACTTCTAAAACAAG\n>LOEY01000035.1/5228-5158 Lutibacter sp. BRH_c52 BRHa_1002952, whole genome shotgun sequence. \nTATCTTTGCCAACTGCAAACCAAAAGGTTTAGCAATACATAAAAATTATTAATAAAATTAATGTTAGCATG\n>MEEQ01000424.1/3292-3474 Bacterium SCN 62-11 ABS71_C0424, whole genome shotgun sequence. \nGGTCGCCTGCAGAGTAGGTGTTGGAGCTTACAATCCTGGGCCAATGTAACAACCTCGGATGTGATGAGCTATCCCTGTGTCGAGTGCCGCGGTGCGGAGTCCTGACGGGGTAGCCCAAGGTCGCGTCCACCTGCTTTGAGCAGGTCCAGGGGTTCAAGCTCGCCACCGCTCAGGTGGGTCCCT\n>CM003505.1/6777488-6777685 Vigna radiata var. 
radiata cultivar VC1973A chromosome 2, whole genome shotgun sequence \nTCCAATATGCTGCCTTTGCCTGCATTTGCACCTGCACTTTACTTGCTTTTCTCTCTTCAACTATCTACCTGAATTAGTCCCTACAAAACACACATTTTCATGGAAAAAAACACAAGATTACGTTGTGTATGTGTGTGGGAATGGATGAGAAACCAAGCACGAGGTGCAGGTGCATCTGCAGGCGAATGACATCTTGGA\n>KQ435782.1/726561-726383 Melipona quadrifasciata isolate 0111107301 unplaced genomic scaffold scaffold99, whole genome shotgun sequence. \nATTGCTTGACGAGAATAAAAGTTATCTGTTCTTATCAGCTTAATATCTGATATATGTACTTCCCATAGAAAAGTCAGAATATTAACCTAATTTTTAAAAACCGGTGGAATTGGCCAGGCTCGCTCTTCTTCTGTCATAGATTGGCCCAGTATTGCAGTGCCATTGCCAAGCTGTGTTTT\n>ADNT01000040.1/13066-12970 Aerococcus viridans ATCC 11563 = CCUG 4311 strain ATCC 11563 contig00050, whole genome shotgun sequence. \nATAAAAAGAGGGAATGAGGTTCTCCCTGGTCAAGTAGATGGTGATTTTAGGCCATCCCATACCGAACCGCTGAAAAGCTGATGACTTCTGCAAGTAA\n>LK941638.1/22456-22528 Angiostrongylus costaricensis strain Costa Rica genome assembly, scaffold: ACOC_scaffold0001535 \nGCCTCATTGTCTCAGAGAGTAGAGGGTCAGCCTTTTGAACAGGAGGTCTCTGGTTCGATTCCAGCAAGAGGCA\n>NBLS01000022.1/6421-6598 Desulfobacteraceae bacterium 4572_19 ex4572_19_scaffold_9363, whole genome shotgun sequence. \nATCATTATATTATCATTCAGCAAACGGAACACGGTGTAAATCCGTGGCATATCCCGATGCTGTAACCCTTTTTGTTTTCTTTGGCATTTTTTAGTCACTGTTGTAATGTTTTTTTACAATGGGAAGGCTGTCTAAAGATGGGGAAGCCAGAAGACGTGCTGAATGATTAAAACAAGTT\n>CAGS01000178.1/3560-3832 Nitrolancea hollandica Lb, WGS project CAGS01000000 data, contig: 00259-1568 \nGCAACGGCTATGACGGAAACGAGTACGCGGAACACCACGTTTAGCGAGTCCGGGGCCGGTGGAAGCCGGATAATGTCGGGTTTCGCGGAAAATCCTTCCCGAGCCGCCACCTGAACCGTCTGATTTGGACGTAGTAAGCATGGCCGGGGTCGTCGCCCGTTATCGCGACGGAGATGCCGGAGCATCCTTCATCACATCGCGCGGCATCTCGGAAAGTGGGTTCCGTTTACCGGACCAACTGAGGTGGTACCGCGGGTTATCCCCGTCCTCAAC\n>AADN04003456.1/8626-12973 Gallus gallus breed Red Jungle fowl, inbred line UCD001 Contig3860.1, whole genome shotgun sequence. 
[11-NOV-2016] \nggacctcaggtcagacgtgcgacccgctgaatttaagcatatagtcagcgggaaaagaaactaacgaggattccctcagtaacggcgagtaagagggaagagccccagcgccgaatccccgcccccgccgtggggccgcgggaggtgtggcgtaccggaagccccccatccgccgcgcccgctctcggggggcccaagtccttctgatcgaggcccagcccgcgacggtgtgaggccggtagcgccccccggcgcgccgggcccggggcttctcggagtcgggtgcttgggaatgcagcccaaagcgggtggtaaactccatctaaggctaaatacccggcacgagaccgatagccaacaagtaccgtaagggaaagttgaaaagaactgtgaagagagagttcaaagagggcgtgaaaccgttaagaggtaaacgggtggggtccgcgcagtcgcccggaggattcaacccggcgggccaagtcggccggcgcgggcgccgtcgatccccgcctccgcctccccctccgtccctccccttcgccgggcggggcgggcccaggggggcgggcgggccggggaccgccgcccgccgcgtccggccccgtcggcgcattcctccgcggcggtgcgccgcgaccggctccgggacggctgggaaggctgccggcgggcaggtgcccggcgccggcgcgagcggccgccgggtgttaagccgccgggcccggatcgtcgccgaatcccgggccgaggagaggaccgccgccgcccctcccccgagggcggccccccggagggccccccgcgccgaccgcgtcgggccggccgcgccgcgcgcgcgtccgcgccgccgccgtacgccgccgccgctctctctccgttccccgccccgggtccgtccgggcgcggggcgggggggtcgggtgccggcgcggctcggcgcggcgccgcgcgtgtggcgcgcggcctccagcccggcgcgggcgaggccgcgggggcgccgggggggaaccttcccccttctgtcgggccgcctccgttcccgcggggcggcccgttcgggggacgggcccgccgccccgcgcgctgtccgaccaggggcggactgcgctcagtgcgcccgaccgcgcggcgccgccggccgggccggccacgccagcgcccgggtccgcggcgacgtcgctaccccccgacccgtctgaacacgaccaaggatccagcacgcgccgcgagtcgcggctcgcgcgaaagcccgcgcgcaatgagggagggccgcgcgcgccgctgagtgggatcccgggcggcaggccggaaggcccggcgcaccaccggcccgtctcgcccgcctcgccggggaggtggagcatgagcgcgcgtgctagacccgaaagatggtgaactatgcctggcagggcgaagccagaggaaactctggtggaggtccgtagcggtcctgacggcaaatcgtcgtccgacccgggtataggcgaaagactaatcgaaccatctatactggttccctccgaagtttccctcaggatagctggcgctcgggcggcggtgcagtttacccgtaaagcgaatgattagaggtcttggggccgaaacgatctcaacctattctcaaacttcatgggtaagacgcccgctcgctgcgtggagccggccgtgaatgcgagcgctcagtgggccacttttggtaagcagaactggcgctgcggatgaaccgaacgccgggttaaggcgcccgatgccgacgctcatcagagcccagaaaaggtgttggttgatctagacagcaggacggtggccatggaagtcggaacccgctaaggagtgtgtaacaactcacctgccgaatcaactagccctgaaaatggatggcgctggagcgtcgggcccatacccggccgtcgccggcggtgcggagccgcggggctaccgccgcgacgagtaggagggccgctgcggtgcgcctggaagc
ctggggcgcggccgggtggaggccgccgcaggtgcagatcttggtggtagtagcaactattcaaacgagagctttgaaggccgaagtggagcagggttccatgtgaacagcagttgaacatgggtcagtcgtcctaagcgataggcgagcgccgttccgaagggacgggcgatggcctccgttgccctcagccgatcgaaagggagtcgggttcagatccccgaatccggagcggcggagacgggcgccgcgaggcgcccagtgcggtaacgcaagcgatcccggagaagccggcggggagccccgggagagttctcttttctttgtgaagggccgggcgccctggaacgggttcgccccgagagagggggcccgcgccttggaaagcgtcgcggttccggcggcggtccggtgagctctcgctggcccgtgaaaatccgggggaggagggtgtaaatctcgcgccgggccgtacccatatccgcagcaggtctccaaggtgaacagcctcttggcatgttggaccaatgtaggtaagggaagtcggcaagccggatccgtaacttcgggataaggattggctctaagggctgggtcggtcgggctggggcgcgaagcggggctggcgcgcgccgcggctggacgaggcgccgcccgcccccgccccccctttccccgctcccgctcgccggggcgccgggggggggtcagcgggcggcgcggcggcggcgactctggacgcgccgccgggcccttcccgtggatcgccccagctgcggcgggcgccgctcgcccccctccttgcccctccgcccccccgctcccggcgcccctcccgtcggccgtcgtcccggccgccccccgtcccgagcgccctcctccgcgaggggcgcgaggggcggcggcggcggccgcgggcgcggcggcggcgggggggggggccgccggcggcgccgggcggggcggtcccgggcggggggggtctccgggccggcgccccgctcggccggcgcctagcagccggcttagaactggtgcggaccaggggaatccgactgtttaattaaaacaaagcatcgcgaaggcccgcggcggtgtgacgcgatgtgattctgcccagtgctctgaatgtcaaagtgaagaaattcaatgaagccgggtaaacggcggagtaactatgactctcttaaggtagccaaatgcctcgtcatctaattagtgacgcgcatgaaggatgaacgagattcccactgtccctacctactctccagcgaaaccacagccaaggaacgggcttggcggaatcagcgggaaaagaagaccctgttgagcttgacctagtctggcgctgtgaagagacatgagaggtgttagaataagtgggagccccgcggtcgcgcgacccgcgccgcggcccggccgccggtgaaataccactactctgatcgttttttcacttacccggtgaggcggggggcgaccccgagggctctcgcttctggcgccaagcgcccggcgcgccggcgcgacccgctcccgggacagcgtcagtggggagtttgactggcggtacacctgtcaaagcgtaacgcaggtgtcctaaggcgagctcagggaggccagaaacctcccgtggacagaagggcaaaagctcgcttgatcttgattttcagtacgaatacagaccgtgaaagcggggcctcacgatccttctgactttttgggttttaagcaggaggtgtcagaaaagttaccacaggataactggcttgtggcggccaagcgtcatagcgacgtcgctttttgatccttcgatgtcggctcttcctatcattgtgaagcagaattcaccaagcgttggattgttcaccccactaataggaacgtgagctgggtttagaccgtcgtgagacaggttattttaccctactgatgatgtgttgttgcgctagtaatcctgctcagtacgagaggaaccgcagttcagacatttggtgtat
gtgcttggctgaggagccactggagcgaggctaccatctgtgggattatactgaacgcctctaagtcagaatcccccctaaacgtagcgataccgcagcgccgaggcgcctcggtgggcctcgcgatagccggccgccgcccccctcggcgggcggtcggtgcggagcgccgctcgtggtcgggacccggagcgcggacagatgtggcgccgcctctcccccgccgcgtaccgccatgttcgtggggaaccccggtgctaaatcattccgtagacgacctgattctgggtcggggtttcgtacgtagcagagcagctccctcgctgcgatctattgagagtcagccctcgacacaaagctttgt\n>KE695965.1/2672926-2673057 Alligator sinensis unplaced genomic scaffold scaffold337_1, whole genome shotgun sequence \nGCATCTAAATCTTTCCTGTTCCTTGCAATACAGTGCAGGATTGGGGACACATGGTGCTACAGCAAAGCAGAGTGAATCCAGACAGGTTTCTTCACTTATACTGGGACTTGTCTCTACAACTCTGCAACATTT\n>LNAL01000007.1/177069-176668 Cytophagales bacterium MC1A Contig_23, whole genome shotgun sequence. \nGTGATGCGCCGCCCCACCGCTGCGCCCGCAAGGGCGGAGAGGAAAGTCCGGGCAACGCAGAGCACCCTGCTTCCTAACGGGAAGGACGACGGCGGGAGACGGCCGCCGGACAGCCAGTGCCACAGAAAACTACCGCCTAAGCTGCCCTCGGGCAGCCGGTAAGGGTGAAAAGGTGCGGTAAGAGCGCACCAGCGGGCGGGCAACCGTTCCGGCTGGGTAAACCTCAGGGGTTGAAAGGCCAAATAGGCCGGCAGGCGGGGCTTCGGCCCTGCAACGGGCGGCTCGTTCGTTGTCGGCGGGTAGGCTGATGGAGCCCACGCGCGAGTGTGGGCCTAGATAAATGGTGGGGCCGCTGCCCTTCGGGGTGGCGGACAGAACCCGGCTTACAGGCGCATCACCAAA\n>ACPB03012429.1/2213-2327 Rhodnius prolixus Rhodnius_prolixus-3.0.3-164.10, whole genome shotgun sequence. \nACTAACTTTAGAACTGTATTTACTATCTTTGTGGGAACGATACAGAGAAGATTAGCAAGGCCCCTGAGCAAGGATGACACCGGCAGACGGAACTCCCATGCCGCAGAATGTTTTT\n>GK000028.2/19825245-19825332 TPA: Bos taurus chromosome 28, whole genome shotgun sequence. \nGAGTTGGACACGGCTGAGCAACTTTCACTTAAATTACTCTAAAAGAAATGAATCCTAGATGGTTTTCCATCCAAGTCAAGTGTCTTGT\n>JJRV01059395.1/8054-8163 Calypte anna contig59395, whole genome shotgun sequence. \nAGTATTGATTTCTTAAAACAAAAAGCAGTGCTGCAGTAATTTCAGCAGCTGGCATTGTTGGTTTTCATGCAGATGTGCTGGTTAAACTTGGTATCGCTGCTGAAACAATT\n>MGZC01000016.1/20791-20922 Gemmatimonadetes bacterium GWC2_71_10 gwc2_scaffold_12486, whole genome shotgun sequence. 
\nGGAAGCCGGTGGAACTCCGGCACGGCCCCGCCACTGTAACGGGTTGGGAGCAGTTGCTCCCCACGGCGCCTCACATGCCACTGGCCTCAGGCCGGGAAGGCGAGGCGGCCGCGACACCCGAAGTCAGGAGAC\n>KB915673.1/27675-28419 Neofusicoccum parvum UCRNP2 chromosome Unknown NP2_03_scaffold_35, whole genome shotgun sequence. \nGGAGCCTGCGGCTTAATTTGGCTCAGCACGGGAAGATTCACCAGGCCAAGACACAGTAAGGACTGACAGATTGAGAGCTCTTTCCTGATTTTGAGGAAGGTGGAGCATGGCCGTTCTTAGTTGGCAGAGTGATCTGTCTGCTTAATTGCGACAACGAACGAGATCTTGACCTGCCAGGCCCGTTTTGGCGGATCGTCGGCTTCTTAGAGGGATGATCGGCTCAATCTCATGGAAGTTTGAGGCGATAACAACTTAACCATTACACGCATGTGATAACGGGGCCCCGACTTACTTTCGTGGGATTTTCCGCCAGTCGATCGTCCGTGACCGTTGGGCAAGCGCCCTAGTATCCAGCAGTCGGGCTGCTGAAGGGCAGCCTAGGATACAGCAAGACAGCCTGGTTTTGGGACTCCAGTTCAGGCTGATCAATCCCGAGGCAAGTTACTATAGCGAGCACCCGTTATAATGCTAAATCCTTATTAATAGAGCTCGTAAGAAAAGGCCTGATACATCGAAGCGTACGGGAGTCACCGAGCAAGGTGGCTGACATGAATTGTTGTTAAGCTCTTAGATTTTCAGGGCCGCCTGCACGCTACGCCAACAGAGTAAACGAGTTTGCTACCCTGGCCGGAAGGTCCGGGGGATTTTTTGAAACTTTCCCGTGCTGATGATACAGCACTACAAACTTCTCAGAGTGTCTGGTGTGCTATAGCCGGCCCTGAGATTAGCGGCACTTGTGTAGAAT\n>KB822693.1/397760-397927 Marinobacter nanhaiticus D15-8W genomic scaffold super1, whole genome shotgun sequence. \nATCTCCATAGACTCAATAGCAGAGGAGACTCTGACATGTATATGGATGCTGTCGTTTTCGCAGGTATCGCTACCGTCGTCCTGATATTCGGCTTCTTTGGCGGTGTGGGTTATTTCATTTACAAGGACTCCCACAAGAAGTCAGACGAGAAGCACTAACCGGTTCCAG\n>ALWS01089583.1/31226-31330 Pteropus alecto contig89583, whole genome shotgun sequence. 
\nACATATGATTTTATTTTCTTCAGAAAAACTTAATTTTATAAGCAGGGTCGGGCCTGGTTAGTACTTGGATGGGAGACTACCTAGGAAGACCAGGTGCTGTAGGCA\n>FRAG01000030.1/20374-20550 Clostridium caminithermale DSM 15212 genome assembly, contig: EJ27DRAFT_scaffold00030.30 \nTTAAGCCTAGGATGTTCGTTAAAGCCTTGAAATTCAACCACCAATAAGCATCCGGGAGTCCAGGTTTTTATGGCGATGACGGGCCTCAATATAGTGGAAGTCAGAACTATAGAATAGGACACCCACCTAGGTGATACCGGGTGTGAATTTACAAGGTAACGACATCTTGGGTATATA\n>LM154274.1/11133-10866 Schistosoma mattheei strain Denwood, Zambia genome assembly, scaffold: SMTD_scaffold0004766 \nTGTGGTCGCACATAAATCGGGTATGATAATCCAAACATTTCATCATCTAAATACCTGAGAGGGAGCCTGAGAAATGGCTACCACATCCAAGGACGGCAGCAGGCGCGAAAATTACTCACTCCCGGCACGGGGAGGTAGTGACGAAAAATACAAATACGGGACTCAGTTGAGGCTCCGTAATTCGAATGAGTGCAATCTAAATCCTTTAACGAGGACCAATTGGAGGGAAAGTCTGGTGCCAGCAGCCGCGGTAACTCCAGCTTCAAAA\n>GL378999.1/3793-3024 Volvox carteri f. nagariensis unplaced genomic scaffold VOLCAscaffold_724, whole genome shotgun sequence. \nNNNNAATGTATGCGAGTTGGCGGGTTGAAAACCCGTAAGCGCAAGTAACCTGACTGGTGGGATGGCCTGTGCCTGCACCATCGACCGACCATGTTGCTTTTGCGAAAGGTTTGAGTGCGAGCATACCTGTTGGGACCCGAAAGATGGTGAACTATGCCTGAGCAGGGTGAAGCCAGAGTAACCTCTGGTGGAGGCTCGTAGATGTGCTGACGTGCAAATCGCTTTTCAGACTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCCCAGGATAGCTGGAGCTTGATCAGTTTTATCGGGTAAAGCGAATGATTAGAGGTTCGGGGGATGAAACATCCTTCACCTATTCTCAAACTTTAAATAGGTAAGACGTGTCGGTTGCTTAACTGAACCGTCACATTCAATGTGAGCTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGATAGTCGAGTTAAGGTGCCAAACTGCGCGCTAACCTAGATCCCACAAAGGGTGTTGATTGATATAAACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAATTAGCCCCGAAAATGGATGGCGCTTAAGCGCGCGACCTATACTCGGCCATGGATGCAAGTGCGACGCGTCCATGAGTGGGTGGGCGTGTCTCAAAGATTAAGCCATGCATGTCTAAGTATAAACTGCTTATACTGTGAAACTGCGAA\n>LWSG01000002.1/200085-200211 Bacillus litoralis strain C44 Scaffold10, whole genome shotgun sequence. 
\nTTAAACAAGTAGAGGCACCCGCTTCTCACCTGATTGACACATCCGTTTGTAGTTGGCAGGTTACGATGATCTTTTATGTATACAATCGTAGTGTGGGTGTCTAAGGCATCCACACTTTTTTATTTTC\n>URS0000D696C4_12908/1-84 unclassified sequences c-di-GMP-II-GAG riboswitch \nGGGAGCGGGGGAUCCAGGGCACGACGCCCAAAACGGUCGCCUGACCGUCGUGCCUAGCGAGCGGCGAGACCGGCCCCACCGUGC\n>MNYX01000050.1/4741-9257 Candidatus Nomurabacteria bacterium CG2_30_43_9 cg2_3.0_scaffold_4245_c, whole genome shotgun sequence. \nTAACAGGAAATATAAGAGCATATGGTGGATGCCTTGGTTCTAAGAGGCGATGAAAGACGTAGCATGGCTGCGATAAGCTTCGGGGAGGTGCCTAGCAACCTTTGATCCGGAGATTTCTGAATGGGGAAACCCCATAACCGTAATAGGTTATGACCTACATTTAAATGTAGGAGTATACCCAGGGAAGTGAAACATCTCAGTACCTGGAGGAAAATAAAAAAAGCCGCCGAATGGCGGAACATTTCCTGAGTAGCGGCGAGCGAAACGGAAATAGCCCAAACCTACTATTTATAGTAGGGGTTGTAAGGCAGAGACGTCGTATTTATACGAGAGGAGTTACAAAATGTAATGTTAGTTGAATATGCTGGAAAGCATAGCCCTAGACGGTGATAGCCCAGTAAACGAAAACCTTACATCTTCTTTGTCTTTGTTCTTGAGTACTTCGAGACACGAATAGCTCGGGGGAATCTACCAGAACTAACTGGTAAGGCTAAATACTCTTAGAAACCGATAGTGAACTAGTACCGTGAGGGAAAGGTGAAAAGAACCCCGGTGAGGGGAGTGAAATAGAACTGAAACCATATGCTTACAAGGAGTCGGAGCCCCCCACCACTCGTGGTGGGGGGTGACGGCGTGCCTATTGAAGAATGAGCCAACGAGTTAATGTATACAGCGTGGCTAAGCCCTTGTCGGGTGGAGCCTTAGGGAAACCGAGTGTGAATAGCGCGTTTGTTGTATGCATTAGACCCGAAGCCAGATGAGCTTACCATGAGCAGGGTGAAGTTTGTAGAAATACAGATGGAGGCCCGAACCGGTTGGCCGTGCGACACCATCGGATGACTTGTGGTAAGGAGTGAAAAGCTAATCGAATCTGGTAATAGCTGGTTCTCTCCGAAATATGTTTAGGCATAGCGTCTAGCGTACCCTCTGGGGGTAGAGCACTGGAAGGACTGAACAGGGAGCAATCTCGTCAGTCCTATCAAACTCCGAATACCAGAGATAGGCCCACCACATAATAATTTTTCGTTGCGAAACGAAAATTTTTAGCGGAAATCATGAAGCGTGATGAGCCTATGCGAGCATAGGCGACGAGCGATGAATGATTTGTAGCAAAAATTTTAAGTTGTAGCAGAAAAGATTGTTGTGTGGTGGGCCCAAATACTAGGCAGTAAGACTACGGGGGCGAAGCTCCGTCGGTCAAAAGGGAAACAGCCCTGATCTCAAGTTAAGGTCCCAAAATTTACGCTAAGTGTACTTAAGGAGGTGGAGTTTCTCAGACAGTGAGGATGTTGGCTTAGAAGCAGCCATCATTTAAAGAAAGCGTAACAGCTCACTCACTAAGAGACTCTGCACCGAAGATAATCGGGGCTAAGCGTAGTACCGAAACTGAGGGTTCTCTCGTCTTTCGAGATGGGGGAGCGGTAGGAGAGCGTTCATGTCTGCGCTGAAGGAGAAGTGTGAGCAACTCTGGAGCGGCATGAAGTGAGAATGTTGGCACAAGTAACCACAATGCGGGTGAGATCCCCGCACGCCGTAAGAGCAAGGTTTCCTTTGCGATGTTGATCAGCGAAGG
GTTAGTCGGGCCTAAGGTTATAGCGAAAGCTGAAGCCGATGGACATAGGGTTAATATTCCCTAACTTTTTATTTGTGCGATGGAGTGACGAAGGTTAGTATGTCTTGCGCATTATTGGATTTGCGTTTGTGTCATCAGTGTGACTCTTAGGTAAATCCGGGAGTCTGGTTTTAATACCGACCGCAAGTGAAGCAGAAATGCATGGGTTCGCCCAGTGCAGATAAGGCAAAGCAATTTTCCGAGAAAAGCTTCTAAGCATAACAAATAAAAAACCGTACCTAAAACCGACACAGGTGCTCGAGTCGAGTAGACTAAGGCGAACGAGTGATTGCTTCTCAAGGAACTCGGCAAAAAAGCAGCCGTAACTTCGGGATAAGGCTTGCCTCCACCACTTTGTCTTTAAAGACGCATAGATAAAATTACTTCATTAGCGACGTAGAGCGAGAGAAATGAAAAGGTATTTTTTCATTTCCAAGCCGAGGAGCTAATATAAGAGGTAACCCTGCTTTTATTTGCATCGTTGAGAAGAATTTTTTCCTCCACGCAATGTACACTTGTACATCTTGGTCGTAAAAAATTCTCCCCGCCTCGCAACTAAAGCAATTTAATCAATGCTTATGCAATAGTGATGGAGTCCGAAGAATTGAGTGTATCGAGACCGTGTTTAGTATCAGAGCTGATACTAAACACAAAAAAGTATTTGAGAAAGTGAGTGATTGTGGGTTTCGTAGAGGGGGGATTCTGGATTTAAATAGAGAAGATAAGATTCGCAAGAATCAAACGACACTCAGGTGTCAACTTCGTTGGGTGCTACCATCCACTATTTCTTTGAATAATCTTGTCAGACGGGAAACCGCATAGACTAAAAGATCGTAATTAGATCGATTCGAAGGTTAACCATGAACTCTCTCCATTCTATGAAACTCATAATCATAGATCGTATCAAATACAAAAATGTTGACTAATTTTTCTAGGACTTAGACATCATCTCTCAAAAATCATTTCGCATATCATCAGTAAATTTCTGCTGTGACTTTGAGAAAAATTTTATTCGAACCTCGGTTCGAGTCAAATTTTTCTCTTCGTCTCGCTAGAAATTTCCCTGAAGCTAAGCGAAGCATTTTATGAGAAATGATGTAGCACCGCTTTGAAAATAAAGTGGTGGAGGCCGCAGCGAAAGATTTCCTGCCAACTGTTTACCAAAAACACAGCTCCATGCGAACTCGTAAGAGGATGTATATGGGGTGACGCCTGACCAATGCCAGAAGGTTAAATACGGGTGGTGCCGAGCACCATGAAGTTAAGTAGAATTTCGTTGAATATTTTTGTTCAGTGGTTCTATTTGAAAGCATGGTGCTCGGTGCTGGCTTGTATAAGCCCTGGTGAATGTCGGCCGTAACTATAACGGTCCTAAGGTTCCCTGCTTATCAATGATGAGCAGGGAAGGACTAGGACTGTTATAGAAAAAAGTAAACAATTAATTTAAATTCATTACATGTTTAAGCTACCTGGCACGCAGTAATGTGTGTTAGTCCAATCATGATAAACGAGAGACCAACGTCATGGACCCTACTTTTAAGGAAGAGGGTAAAGATAGAGTCCAACTGAGAGGAATAGTTGAGCGTAATTCCTTGTCTGGTAAGTTCAGACGTGCACGAATGGCGTAATGAGTGGGAAACTGTCTCGAGAAGCAGCTCGGTGAAAATACAATACCGGTGAAGATGCCGGTTACCTGCAGATAGACGAAAAGACCCCGTGAGCTTTACTATAGCTTAATATTGAACATGTTTTGTTTCTGCGTAGCATAGGTGGGAGGCTTTGAAGCGACCGTTTCGGTGGTCGTCGAGCCAACAGTGAAATACCACCCTTAATTGAGGCATGTTCTAATCTGTAAGGAAAAAACTTACGGAGACAGTATTTGGCGGGTAGTTTGAGTGGGGCGCTCTCCTCCTAAAAGGTAACGGAGGAGTCTATTAAGGTCCTCTAGGCGCGAATGGAAA
CCGTGCCGATAGCGTAATGGCAAAAGAGGGCTTAACTGCAAGACGGACATGTCGAGCAGGTGCGAAAGCAGAGCATAGTGAACCGACGACACGCTTTAGATGCGGTCGAAGATTAACGGATAAAAGCTACCACGGGGATAACAGGCTAGTTCTGCCCAAGAGTTCATATCGACGGCAGAGTTCGGCACCTTAACATAATCGGGGTGCGTCAGGAGTAATCCTGTAGCGACAAATTTATAATCGTCAATAAATAATATATAAACAAGAAATCTTGGCTTATAACGGTGAAACCCATTTGCATGAACAATAAATGGGCAATACCGTGGGAAGTTTGCGTGTAAGAAAGCGATCACTCTAAATTTTTAGAGAGCTGCTACATCCTTTGTGGATGTGATTATACGTATAACCCTGTAGAGACTTGTCACGTTAGCGCGTAGAGATGCAACTAACAAAGTGACGGAGTTATGAGAAAATCATAGCTAATACGCCAACGCCTCTTTTGATCGAGAGGGTGAAGATATAGTCCGATCCTCGCAGTAATGCGAGACAAATACGACAGCGATGTCGGCTCATCTTATCCTGGAGGTGGAGAAGCTTCCAAGGGTTTGGCTGTTCGCCAATTAAAAAGATACGTGAGCTGGGTTCAAACCGTCGTGAGACAGGTTGGTCTCCTATCTTCTGCAGGCGTTGAATTTTGAGGGGATTTGCTCCTAGTACGAGAGGACCGGAGTGAACTGACCTCTGGTGTGGCTGCTGTCCTGCCAAGGGCACCGCAGCGTAGCTATGTCGGGAATGGATAACCTCTGAAAGCATCTAAGAGGGAAACCAACCCCAAGATCAGAATTCGTTTGAGGCCCGTAAGAGATGATTACGTTGATAGGCTCTATGTGTAAGACGAGTAATCGTTTCAGCAGAGGAGTACTAATACGCCGATTCCTGGTGGG\n>AYYY01000070.1/37374-37142 Lactobacillus vaccinostercus DSM 20634 NODE_168, whole genome shotgun sequence. \nTAAAAAACGATGAAAAGATGAGTAGCAGTTAACACCTTTTTAGAGAGCCTCTGGTTGGTGAAAAGGGGTAAGGTTGGTGATTGTGAATATGGTCTTGAAGTGAGGAATGTTGAGCGTATGCGAGGCATTCATGGGGACGCCCATTACCGCGTGCGAGTATGATTGTACTCAGCGAGGGAGTGTATGTGAATACATTCTAAATTAAGGTGGTAACACGAGAGATCGTCCTTACT\n>AAQR03042857.1/1-1187 Otolemur garnettii contig042857, whole genome shotgun sequence. 
\nGCCCCAGTGCTGCCAGTCCCTGTGCTGTAAGCCCATCTGCTGCCGCCCCAGCTGCTGCCAAACCACCTGCTGCAGGACCACCTGCTGCCGTCCCAGCTGCTGTGTGTCCAGCTGCTGCAGGCCCCAGTGCTGCCAGTCCCTGTGCTGTAAGCCCAGCTGCTGCCAAACCACCTGCTGCAGGACCACCTGCTGCCGCCCCAGCTGCTGCTAGGGACCTGCTATAGAACAATCTGTTGTTGTTCCACCTGCCAGACCACCTCTTGCTGCTGAGTGTCCTGCTCCAGATCCATGAACTTTCATGACCCTTCCTTTAGTCTAGTTAGAGAGGATCTAGTCACTGAAGACATGAACTTCCTGGGGCTATGGACTTAACAAACAGACCCATGGATGAATTTGCAAAACCCTGGTTTCTATATTAGTATTTTCTCTATTCTGTAGGTATATTTCATTATTATAGCAAATCAGTATTTACAGCCAGATTCTGCATCAAATTGCTTTAGTATTCCTAGTTCTGATTCAAAATACAGGAGTCTTCAAATGTTCTCTTCATAGATATTTTTATAACATTTTCAGTAGAATCCATTGTCATGTGGAATTATTGCTCAATGTTGCCAAATAAAAGTTCTTAGCATCCAAATGCACCCAAATTGGTCATTTCTCATTATTAACAAAATGTTCCTGTCTCTTTTCTGCACAACACTAGAGCTCATGTTTTCAGGAGAACACACAATGGAAACATTAAATTGGTCTTCTCCAGTGACATTGTTATCAAAACCTGAATTCACCCCCCAACTTCTAAGAAGGACAAGTGGTGTTAAGCCACCCAAGATTGAGCAATAACAGGCCTGTGATGCCCTTAGATGTCTGGGGCTTCAATGACTGGCTCAGCATGCAGGCACTGGTAACCCGTTGAACCCCATTCATGATGGGGATCAGGGATTGCAATTATTCCCCATGAACGAGGAATTCCCAGTAAGTGCAGGTCATAAGCTTGCGTTGATTAAGTCCCTGCCCTTTGTAGACCCTGCCCGTCGCTACTACCAATTGGATGGTTTGGTGAGGCCCACGGATTGGCCCCAGTGAGGTTGGCCCTGGTGGAACGCTGAGAAGATGATCAAACTTGACTATCTAGAGGAAGTAAAAGTCATGACAAGGTTTCCATAGATGAATCTGAAGAAGGAAAAATT\n>KQ042022.1/603975-604625 Larimichthys crocea isolate SSNF unplaced genomic scaffold scaffold95, whole genome shotgun sequence. 
\nCCTCACGCTTAAGCCCGGCTTCGGGACCCCCCCACAGCACCCAATGCACACCGCGGCTACCGCGGTGTGCATAGTGACGAAAAATAACAATACAAGACTCTTTCGAGTCCCTGTAATTTAAATGAGTACACTTTAAATCCTTTAACAAGGATCAATTGGAGGGCAATTTTGGTGCCAGCAGCCGCGGTAATTCCAGGTCCAATAGCGTATCTTAAAGTTGCTGCAGTTAAAAAGCTCATAGTTGGATCTCGGGATTGAGCTGACAGTCTGCCGCGAGGTGAGCTACTGTCGGTCCCAGCCCCTGTCTCTCGGTGCCCCCTCGATGCTCTTAGCTGAGTGTCCTGCGGGGTCTGAAGCGTTTACTTTGAAAAAATTTGAGTGTTCAAAGCAGGCCCGGTTGCCTGAATACCGCAGCTAGTAATAATGGAATAGGACTGGCCAGGGGAGGTGCCGCTAGAGGTGAAATTCTTGGACCAGCGCAAGACGGACGAAAGCAAAAGCATTTGCCAAGAATGTTTTCATTAATAAAGAATGGAAGACGATCAGATACCGTTGTAGTTCCGACCATAAACGATGCCAACTAGCGATCCGGCAGCGTTATTCCCATGATCCGCCAGGCAGCATCCAGGAAACCAAAGTCTTTGGGTTCCG\n>GL897038.1/2640067-2640202 Mustela putorius furo unplaced genomic scaffold scaffold00141, whole genome shotgun sequence. \nAGCTTTGCGCAGTGGCAGTATCGTAGCCAATGAGGTTTATCCGAGGCGCGATTATTGCTAATTAAAGCAGCAAGAGAGAAATGAGACCTTATTTATAAGGCAAAAAAATTAGAATGACAGTGAATTTCCCATCAAA\n>AWHE01044218.1/1319-1427 Amborella trichopoda AMTR_V1.0_contig_44218, whole genome shotgun sequence. \nGTGCCTTAGGGTTGAACTAGTCCCGGATATTTAATCATTCCCACCAACTTCACATTCTCAGTGAAGTTTTTCCTTGTTGTCTTATCTGATAATTCAAGATGGAAATATA\n>AFSB01019533.1/7909-8012 Heterocephalus glaber contig19533, whole genome shotgun sequence. \nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGCAGTAGGAAGAAGGATCCAGTGTGGAGTCATAAATATATAAATTTTATTATTTATCAATACATTAATTTAT\n>AYUG01084532.1/52955-52729 Fukomys damarensis contig84532, whole genome shotgun sequence. \nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGTAGGAAAATAGAAAATTTCATACGTAAGCAAAACAATTTCTCCTAACCCTATCTCACCAAAACAAAAACTTCTCACATTTTTTCACAAGTATTTCAATTACGTGCCTCTATTTATCCTAGAGCTCTCTTGCAAAACAGGAACAGATCCAAACTGAGAAAGAATTGCTTTTCAGTTTTAGTGCAGTTGACGTTTA\n>LLXS01000009.1/35786-35931 Stenotrophomonas maltophilia strain JCM 9942 contig_17, whole genome shotgun sequence. 
\nCTTGGTGTGTGACCACCAATAGCCTGAAGTGGCGTGCGTCTCTGGCAACGGAGGGGTGCGAAGCCCACTGAACAAGTCCCCCGCAAGGGGCGCAACAACCGCGAGGTTTTCGCGCAGATTCCGGTAGCAGCAGACCGGATGAGGGG\n>CCCW010015579.1/1-2359 Brassica napus, WGS project CCCW01000000 data, contig: 28609 \nACGGACAGCCACAGACGTCCTGTATCTGCTGGCGGACACCCACGGATGTCCTGTGTGTACTGAACAGACAGCACACGTGGGCCAAAATCTCCGGAACAGTCCACGGGAAGGGTCAGCGTGCTAAGTCCAAGGACCAATGTGCTGATATGTGTACTGATGGACAGCCACGGACGTCTTGTGTGTGCTGACGGACACACACGGACATCCACGGACGTCCTGTGTGTGCTGATGGACACACACGGACGTCATGTGTGTGCTGACGGACACTTGGTCGATTAAGACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTCTAAAAACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTGAAGCACGCGACCTATACCCGGCTGTCGGGGCAAGAGCCAGGCCTCGATGAGTAAGAGGGTGTGGCGGTCGCTGCAAAACCTAGGGCACGAGCCCGAGCGGAGCGGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCCAATGAGAACTTTGAAGGCCGAATAGGGGAAAGGTTCCATGTGAATGGCACTTGCACATGGGTTAGTCGATCCTAAGAGTCGGGGGAAACCCGTCTGATAGCGATTATGCGCGAACTTTGAAAGGGGATCCAGTTAAAATTCCGGAACCGGGACATGGCGGTTGATGGCAACGTTAGGAACTCCGGAGACGTTGGCAGGAATTCTGGAAAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCCTTGAAACGGCTCAGCCGGAGGTAGGGTCCAGCGGCTGGAAGAGTACCGCACGTCGCGTGGTCTCTGGTGCATTCCCGGCAGCCCTTGAAAATACGGACCGAGTGACGCTCACGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGATGAACAACCTCTGGTCGATGGAACAATGTAGGCAAAGGAAGTCGGCAAAATGGATCCGTAACTTTGGGAAAAGAATTGGCTCTGAGGGCTGGGCTCGGGGGTCCCAGTTCCGAACCCGTCAACTGTTGGCGGGCTGCTTGAGCTGTTAACGTGGCGAGAGCGGACCGCCTCGTGTCGGCCAGGGGAAGGACTGGGAACGGCTCTTTCAGGATCTTTCCCTGAGCGTCGAACAGCCAACTCAAAACTGGTACGGATAAGGGGAATCCAACTGTTTAATTAAAAGAAAGCATTGCGATGATCCCAGTAGATGCTAACGCAATGTTTTTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGTGCGGGTAAACGGCAGGAGTAACTATGGCTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTGTCTACTATCCAGCGAAAACACACCAAGGGAACGGGCTTGGAAGAATCAGCGGGGAAAGAAGACCCGGTTGAGCTTGACTCTAGTCCGATTTTTTGAAATGACTTGAGAGGTGTAGAATAAGTGGGAGCTCCAGCGCAAGTGAATACCACTACTTTTAACGTTATTTTACTTACTCCGTGAATCGGAGGCGGCGTAATAACCCCTTCTTTTAGACCCAAGACTCGCTTTGACGGGTCAATCCGGGCGGAGGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACGAAGGGGTCCTAAGATGAGCTCAATGAGAACAGAAATCTCGTGTGGAACAAAAGGGTGAAAGCTCGTTTGACTCT
TATTTTCAGTACGAATACGAACCGTGAAAGCTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGCTCGTGTCGCAATAGTAATTCAACCTAGTACGAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTGCGCTGGATTATGACCGAACGCCTCTAAGTCAGAATCTGGGCTAGAAGCAACGCATGTGCCCGCCGCCCGATTGCCGACCCTCAGTAGGAGCTTCGGCTCCCAAAGGCACGTGTCGTTGGCTAAGTCCGTTCAGCGGAAGCGCCGTTCGGACCGCCTTGAATTATAATTACCACCAAGCGGCGGGTAGAATCGTTTGCAGACGACTTAAATACACGACGGGGTATTGTAAGTGGCAGAGTGGCCTTGCTGCCACGATCCACTGAGATTCAGCCCTTTGTCACTAAGATTCGA\n>MNRN01000197.1/5697-5757 Clostridium sp.CAG:217_53_7 isolate CAG:217_53_7 Ley3_66761_scaffold_9517, whole genome shotgun sequence. \nGGAGAGGTACCGAAGTGGTCATAACGGAGCGGCACCGTGGGTTCGAATCCCACTCTCTCCG\n>LIZX01000155.1/9306-9787 Candidate division WOR_1 bacterium DG_54_3 WOR1_52_54_19713, whole genome shotgun sequence. \nAGAGCAGGCCAGATGATCGTGCCTCGACTCACTTCGTTCGCTCGGCACAAGCCCCTTAGTCTGAGGGGTTTATACCGAGCGAGGCCGAAGGCCGAGTCGAGGTAAGGAAAGTCCGGACTCCGCAGAGCAGCGTGGTTGCTAACGGCAACTGAGGGCGACCTTAAGGAAAGTGTCACAGAAATTACACGGCCCACTCTGACCCTAAAGGTCAGAAGGCAAAGGTGAAATTGGGAGGTAAGAGCTCCCACAGGACTGACCGGTGACGGTCGCTGCGGTAAACCCCACGCGGAGCAAGACCAAATAGGGAAATGGGTGGCTCGCCCGCCCTGCCCGCAATGCTACGCATAGCGTTGCAGGCGGGTATAATCCCGAGTAGGTCGCATTGAGGCAGTCAGCAATGGCTGCCCCAGATAGATGATCATCGAACCCAGCACGGTATGGTGCTGGGTGAACAGAATCCGGCTTACCGGCCTGCTCTTTTT\n>MFJD01000004.1/58273-58056 Candidatus Gottesmanbacteria bacterium RBG_16_52_11 RBG_16_scaffold_141, whole genome shotgun sequence. \nACAGAAGGCTCAATTTGGGCTCACTGAAAACTATTTTAGTGATAGTCCGGCTGTATCGGTGAAATCCTGAGCTAGCCGAAGGACAACACCGAGGCAATCCCCCTTCCGCATAAAATATGGGGGCGAGTCCGTAGAGACTATACGCCGGACCCCGCCTACAGTTGATAACTCAATTGTTGGCGGGGAAGATATAGTCCGACACTCTCAGTAATGGGAGA\n>GK000003.2/42786018-42786224 TPA: Bos taurus chromosome 3, whole genome shotgun sequence. 
\nATCACTTCTTGGTATTTTGGCTAGAATCAAGTGTAGTTTCTGTTCTTATCAGTTTAATATCTTCTCCCACTGAAAAATGTGGCTCTGCTATGTTGGGGCCAGGAGTAATTAAACCAGTGTTAGGAGGAAAGAAAGTGAAGTCACTCAGTCGTGTCTGACTCTTTGTAGCCCCATGGACACCGGGCTCCTCCGTCCATGGGATTTTCT\n>LFZU01000001.1/2811527-2811462 Bacillus sp. FJAT-27231 Scaffold1, whole genome shotgun sequence. \nCAAAAAGGAACGACGGCTAAAGACGCGACACCGTGTCGCAACGCCCTCACTAGCACATCATGTGCG\n>GL637602.1/252614-252701 Caenorhabditis tropicalis strain JU1373 unplaced genomic scaffold Scaffold630, whole genome shotgun sequence. \nTGTCCACTGATGACAACCTTACATACACCATTACGATCTCTGAAGACTTCGTGCTGAACATGTTTCCATGCAACACCAACTGAGGACG\n>LL029687.1/1-1177 Trichobilharzia regenti genome assembly, scaffold: TRE_scaffold0029590 \nCTCCTTGTGTTTAAAGTTAGTGCTTACAAGAAACAAATGATTATCAGAACAGAACTGTAGGAGATCAGTATCAGTTCTTTATTAATCAGCTTCAACAACAATACATCTCATCCAGTTCTGCTTTAATATTCTCCGTAGGCAAATGAGACAAGTACGCTAAGTATCCCAAAAATGCCTAAGCCCAGTAAGAATGCTAAAGCACCGACGGCGGTGCTGTGCAGTCTACAAACAAACAAAAAGTTGTATTCAAATACCACCAGAAACTTTTCACTCAATCTATTCCACATTCTCAAAATACTTCCGAAGGTTGCAGAACCAGTGCCATTCAATCATTTCACAGAGATGGACACTCCACATTAAGTTGTACAATAATTCCTATCCCTAAATTAACTTAAACTCTGAGATATGCACTGAATGAAGCTAATTTGATCATCAAATGTGNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNCCCGACAAGAGCATTGATATGACAGACTTATCTCCTGTAATTTCTGTTTCTGCGAATGGTGAGCGGACAAAAAGACTGAAACTCCAAGAACTTCATTATTCGCGTTAAAAACACCACGTTAGCGATTTTAGATAGAACGTACGGACAACTATTGTAAAGTGTGCAAACAAGGTGAAAAGAAACGGGAAATCGGGGTTCGATTCCGGAGAGGGAGCCTGAGAAATGGCTACCACATTCAAAAACCGCAGCAGGCGCGAAAATTACCCACTCCCGGCACGGGGAGGTAGTGACGAAAAATACGAATACGGAACTCAATTGATGCTCCCTGGTTCGAATGAGTACAATTTGAATCCTTTAACGAAAACCGATTGGAGGGCAAGTCTGGTGCCATCAGCCGCTGTAACTCCAGCTCCAAAAGCGTAAAGTTGCTGCAGTTAAAAAGCTCGTAGTTGTGTGGTCGCATGCCATTGGTTCTTCGCGGCTTTGGTTACGATCAGAACTTGTGTTCGGCTCGGTGTAGTGGCTGTGCAGCCTTTCAGTCATATCTGTGTAAAGGGGTGCTGACGGAGATGGGTGAGCTTGTCTTGCCCGCTATCTGTTGGCATGCTTCCGGATGCCTTTAACCGGGTGTCGGGAGCGGACGGCATCTTTC\n>JYDL01002072.1/1-274 Trichinella nelsoni scaffold2457s, whole genome shotgun sequence. 
\nTTGAAACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAACGGGTGATTAAACCCGTAAGGCGCAAGGAAGCTAATGCGCGGGATCCCTTTACGGGTGCACCGCCGACCGACCTTGATCTTCTGAGAAGGGTTCGAGTGTGAGCATGCCTGTCGGGACCCGAAAGATGGTGAACTATGCCTGAGCGGGGCGAAGCCAGAGGAAACTCTGGTGGAGGCCCGCAGCGATACTGACGTGCAAATCGTTCGTCTGACTTGAGTGTAGGGGCGAAAGA\n>DS562881.1/23395652-23395568 Cavia porcellus supercont2_26 genomic scaffold, whole genome shotgun sequence. \nAAATCATAATCCAACTCTAGCATTAGCCATGGGTTTAGCATTCCTCTTGAGGAAAGCAGGGGTTCCTCTTTTGCCCCCCATTGGC\n>FAOM01514816.1/33945-33090 Triticum aestivum genome assembly, contig: Triticum_aestivum_CS42_TGACv1_scaffold_514816_6BS \nCTGTATGATCCTGCTAGTAGTCATATGCTTATCTCAAAGATTAAGCCATGCATGTGCAAGTATGAACCAATTTGAACTATGAAACTGTGAATGGCCCATTAAATCAGTTATAGTTTGTTTGATGGTACGTGCTACTAGGATAACTGTAGTAATTCTAGAGCTAATACATGTAACAAACCCCGACTTCTGGGAGGGGGCACATTTATTAGATAAAAGGCTGACGCGGGCTCTGCTCGCTGATCCGATGATTCATGATAACTCGACGGATCGCACTGCCTTCATGCCAGCGACACATCATTCAAATTTCTGCCCTGTCAACTTTGGATGGTAGGATAGGTGCCTACCATTGTGGTCACGGGTGACGGAGAATTAGGGTTCGATGCCAGAGAGGGAGCTTGAGAAACGGCTACCACATTCAAGGAAGGAAGCATGCGTGTAAATTACCCAACACTGACATGGGGAGGTAGTGACAATAAATAACAATACCGGGCGCATTAGTGTGTGGTAATTGGAATGAGTACAATCTAAATCCCTTAACAAGGATCCATTGGAGGGCAAGTCTGGTGCCAGCAGTCGTGGTAATTCTAGCTCCAATAGCGTATATTTAAGTTGTTGTAGTTCAAAATCTCATAGTTGGACCTTCGGGCCGGTCGGCCGGTCCGCCTCACAGCGAGCACCGAAATACTCGACCCTAGCCTTAATTGGTCGGGTTGTGTTTTCGGCATCGTTACTTTGAAGAAATTAGAGTGCTCAATGCAAGCCATCGCTCTAGATACATTAGCATGGGTGTCACGCCCAAGATGCGACCCTATCCTAAAGGAACTCGAAGGTCCCACTAAGGATAGAAGCACATCTT\n>GG700527.1/116493-116761 Anaerococcus vaginalis ATCC 51170 genomic scaffold SCAFFOLD1, whole genome shotgun sequence. \nAATAAAACTTTGATCAGAAGTAAGTAAGTTTTATAAATCTTTTATAGAGAGCTTGTGTGTGGTGGAAACAAGCAAAGAAGTAAAACCGAATGGATCTGAGAGTGCTAAGGTGAAAAAAGTACCCGAGGCCGTCTTCCCACGTTATAGGGATATGATATGAAATTATTTTAAATTAGTATCAGAATAAAGATATGTAGGATTTATTAATTTATTGAAATTTATTTTACATAAAAAGGATGGCACCGCGAATTCAACCATTTGCTCCTTTG\n>CM007396.1/65217892-65218035 Nicotiana attenuata strain UT chromosome 6, whole genome shotgun sequence. 
\nTGTAAAGGTTTCCTCGGGCCGGACGGAGATTTACCCTCGAGTGTAAAGGCAGAAAGGAGCTTGACTGCAAGACCCACCCGTCGAGCAGGGACGAAAGTCGGCCTTAGTGATCCGACGGTGCCGAGTGGAAGGGTCGTCGCTCAA\n>AFSB01270989.1/241-552 Heterocephalus glaber contig270989, whole genome shotgun sequence. \nAGATGTGTGGGACAATGTGGCTATGACATCTGTCACCCCATCGATCACCAGGGTTGATTCGCCCGATCTGGCTGGCTAGGCAGGTGTCCCTTTCCTTCTTCACCACTCCACGTGTGTCCCTCCCAAAGATGCACAATAGGTCGAAAAGAACGAACACCCAAGCTACAGGAGGACAATTTCCTCATCAAGGGTATATGAGTAGCTACACTCCCCTGCTAGAACCTTCATACAAGAGCTCAAGAATACTCCACTATAGGACCCGGATGTAGCTCAGGGGTACAGAACTTGCCTAAATGCACAGGTCTTGGCTTT\n>FN543502.1/2725931-2725592 Citrobacter rodentium ICC168, complete genome \nTTTGGCGACGTCCACCTGCTGGATTTGGGCATACAGTTTGCCGACCACTTCGGCGATCGACGGATGCCAAGAGACGGCGCGATTGACCGCCTGAGAAAGTGTAAGTTCGCCGGGGGCGGCGCTGTCGCCGGTTAGCGGCATTGGTCCATTCAGCGAGGGCAGCTCCTGCTGCTCAACCCACTGCTGCGGGGCGATGCGGGGTGACTCTTCGGCGGCAATGGCCGGAAACGCGCACAGGTTTCCAGCCAGCCACCAACAGGTCAGCTGTCGTTTTCCCATTTTTTACTTCCCTAAGCTGGCTTCTTTTCGCCCCGGGCGAACGTGCGCCCGGGGTCGTTGT\n>CM000685.2/82594813-82595002 Homo sapiens chromosome X, GRCh38 reference primary assembly. \nAGGCATGTGATCAATCAGGCTGAGACATCTGTTACTGCATTGATTGACTTGGATGATCAGGCTTGTGAAATAGGTGGCCCCATCCTACTTTGCTGCCCCCAAGTACATCTGTCTCAAAGCTTACACTGCTGGAAGGGGATGACCATCCCTATTAGAGGACAGTCATTCTCTGGTCAGGAGTAGAGAAATA\n>DS995940.1/1722-1546 Penicillium marneffei ATCC 18224 scf_1105668340736 genomic scaffold, whole genome shotgun sequence. \nGCTGGCGACGGCGACCCGGGAGAAGCCCTGGGCCGCTGGCTGGCGGATTGCAATGTCACCACGCGCGGGGATAAATCCTCTGCAGACGACTGAAGTGACCAAGCGGGTCATGTACGCGTACGAGTAGCCTAGTTGTTACGAGTCGCTGAGTGTCAGCCCGACCTTGGCTCGATTTGT\n>MLHJ01000044.1/15422-15261 Rodentibacter rarus strain CCUG17206 contig_44, whole genome shotgun sequence. \nTTTATCGCATAACTCCGAGCTTGTTTAGTCTAAGTTCCTCTTTGGTGAAAATACTTGGGTGAGGAATATGACGGCAATGCCAATAACGCTATTTGTTATTCAGGGATACGCTGGAAACGGCTTGTCCTCTCCATTTTAGAAAGGTGTCACATGCAATCTATT\n>MAVT01007669.1/869-1028 Diaporthe helianthi strain 7/96 Scaffold_4854.1, whole genome shotgun sequence. 
\nACACGCATGAGCCGGTGCCAATCCGCCCGTGCCAGGTCCGAGAGTCCTGCTTCAGCAGCACTCAAAGTGATTTCGGCGCGACGGCGGAGTTGCTGAGATTACACGGCTTCGGAACTTGATCTTGGATAATACCAGCGAAAGGATCATGCGTCTCCCCCCC\n>CDMY01000201.1/99855-100012 Vitrella brassicaformis CCMP3155 genome assembly, contig: scaffold135 \nAAACTTACCTGGCTGGGCCTCGGGGGCGCTCACGAAGGTCCCTGTGCTGTCGTGGAGCTCCCATTGCATTCGGGGGTACGTGAAGCGGCATGGGGGGGCTATGCTCCTGCCAACAGCGGAATTTCTGGCAGAGCTGGCTTGCGTTCGCGCAGCCGGCA\n>CM002822.1/201709819-201709930 Capsicum annuum cultivar Zunla-1 chromosome 11, whole genome shotgun sequence \nGTACACCCCAAAGGAGTGTACATGAGAACACAAGTGTATTTTAGTTTTTTACAATTTCAATTTCTATATCTAAAATGTACTTGTGTTCTCAGGTCACGTCTTTGAGAACACC\n>MGVN01000036.1/14680-14207 Elusimicrobia bacterium RIFOXYB2_FULL_49_7 rifoxyb2_full_scaffold_1450, whole genome shotgun sequence. \nCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTCTGTGTTACCAGCGGATAATGCCGGGGACTCACAGAAGACTGCCTCTTTTTTGAGGAGGAAGGTGAGGATGACGTCAAGTCCTCATGGCCCTTACGTCCAGGGCTACACACGTGCTACAATGGCCGGTACAGAGGGTCGCAATGCCGCAAGGTGGAGCTAATCTCAAAAAGCCGGTCTCAGTTCGGATTGGAGTCTGCAATTCGACTCCATGAAGTTGGAATCGCTAGTAATCGCGGATCAGATACGCCGCGGTGAATACGTTATCGGGCCTTGTACACACCGCCCGTCAAGCCATGAAAGCCGGGAGTACTCAAAATGGTTGCCTGAACCGTAAGGAGGGCGCCCCTAAAGTAAAACCGGTGATTGGGGCTAAGTCGTAACAAGGTAGCCGTACCGGAAGGTGCGGCTGGATCACCTCCTTT\n>LVVY01000041.1/1-81 Devosia sp. S37 DIN_R1_(paired)_trimmed_(paired)_contig_135, whole genome shotgun sequence. \nTATGCCACTGGCGCAAGCCGGGAAGGCGCCCGCCGGGGATGATCCCAAGTCAGAAGACCGGCCAGATGACCTCTTGAAGCT\n>ANKR01162454.1/9860-9985 Myotis brandtii contig162454, whole genome shotgun sequence. \nTAACCTCCGCAGGCTGGCTGGCCCTCAGGCTGAGCTGGGTGAGTATCTTTTCTGTTTTGGGAGGACGGGGAAGAGGGGGGACCCAATATCTTTTTGAGAGGCTCGCCCTCAAGCACAACTAAGAGC\n>LGPB01000006.1/253-1 Bacillus galactosidilyticus strain PL133 scaffold000006, whole genome shotgun sequence. 
\nGATTAAGTTGTTAAGGGCGCACGGTGGATGCCTTGGCACTAGGAGCCGATGAAAAGGGACGGGGACTAACACCGATATGCTTCGGGGAGCTGTAAGCAAGCTTAGATCCGAAGATTTCCGAATGGGGGAACCCCCTACCTTTAATGGGGTAGGATCCAATTCTGATTCTGAATACATAGGAATTGGAACCCGGGGAACTGAAACATCTCAGTACCCGGAGGAAGAGAAAGAGAAAGAAAAATCGATTCCCTAA\n>CAQQ02314174.1/33-1 Megaselia scalaris, Durham, NC isolate 2 -- Noor lab, WGS project CAQQ02000000 data, contig: ctg0000314174 \nAAACCGGTTCTTTTCAGAACCACCAATTTTTTT\n>LL082930.1/890-2011 Trichobilharzia regenti genome assembly, scaffold: TRE_contig0003919 \nGACTGATGAGCAGGTTTCTTTTAAAGTGAGTTCATTTAACCTCTTTTTGTATTCTATTCTATATCCGCCATTTTTCTGAAAAATTTTTGAGTAATATCACCATTCATCTATTCGTTTTATTATTATTATTATTGTTAATATTAACTCACCTCCATTTCAAATTTATTTAAGCGAAAGTGTTCATACTACTAACATAGTCTATTCAGTAGTATTCATTTTAAAATGTATATTTTTCGAATTGAGGTGCATTAAAACAACAGGTGTTATAGTAAAGAAAAAGAAGAAGTTTTGAAGGGAGGACGAATAACTCAGTGGTGATGTGATTTATATCAGATGTCTTTGTATTACCGTCGTTGGATAGACTTTATCGAAAGCATTTGCTAAGAATAATTTCATTGATCAGGAACGAAAGTCAGAGTTTCTAAGACTATCGTTTCAGTTCTACCATTAAACAATGCCAACTGACGATCTGTGTTGGTTCTTTAATTGTCAATGAACGCACTATCCAGGAAAACTTCAAGTCTTTCAGCTCCGGAAGAAATATGGTTAAATAGCTGAAATTTACAGGAATTGAAGGAAGGGTACCACCAGGAGTCGAGCCTGTGGTTTAATGGAACCCAACATGGGAAAAATCGTTCGGCACGGACATATTCAGGATTAACAGATTGAAAGCTGTTTCTTGATTTGGTTGATGGTAGTGCGCGGCCGTTCTTATCTGCTATCTGTTGCTTCTTAGTGGAGTAGTGTGATCGTTAACTGGAGAGTATGGTACCAGCTTTTGTCTCTTAAACAGACAGACTGCACACTGAAGTCGTACGACATTGAGCAACAACAATTCTGTGATGCCCTTAGACGCCCAAAGCTACACCTGCGCTACAATGACGGTGCCAGGGTTAAGCCACCTGTTTTATCACCGTCGTGACTGGGAACGCTACCTGCAATTGTTCTCTGTGGAAGTCATAAACATCTACTGATGACGTCACTGCCCCTTGTACACACTGCCCGTCTCTATTACCGATTGAATACTATTCATAAACATGAACAATTGAGAATGGTTGGCGTTAATGTTTAATATATCGCCAAATTTGTCTTGATTGATGAGTAGACAGAACGAAATCAAAG\n>FWFV01000002.1/64217-64338 Palleronia marisminoris strain CECT 7066 genome assembly, contig: 0002 \nGTGACATACGAGCACCCACCTCCTCCCGGGCGCCTCGTATTCGGCGACGACACCGACCTCCTCCCCGGTGTCGTCGCCACAGATTACGCAGCGCCGACCTCCTCCCCGGTGCTGTGTTTCAG\n>MNVI01000024.1/6358-6450 Candidatus Micrarchaeota archaeon CG1_02_55_41 cg1_0.2_scaffold_10394_c, whole genome shotgun sequence. 
\nCCCGCAGTAGCTCAATTTGGCAGAGCACCTGACTGTAGTTAGAAAATCCGAGTGGACATCAGGGGGTTGCCAGTTCAAATCTGGCCTGCGGGA\n>AAGJ05017846.1/1565-1174 Strongylocentrotus purpuratus Contig17846_fixed, whole genome shotgun sequence. \nGAGACACTGGCCGGGGCCCCGGGAAGAGTTGTCTTTTCTTGTTAAGGAGCGGGATCCCTGGAATCGGTTCGACCGGAGAGAGGGTCTGCGGCTCCGTAGAGCGCCGCGTCTACGGCGGCGTCCGGTGCGCTCCGGCTGGTCCTTGAAAATCCGGGGGAAGTGTTGGGACTCTCGCCTCGGGTCGTACCCATGACCGCAGCCGGTCTCCAAGGTGAATAGCCTCTGGCCGATAGAACAATGTAGGTAAGGGAAGTCGGCAAGCCGGATCCGTACCCCCCGCAGGGATGGATTCCACCCCTCTGTCACATCATCTCTCTTTACTATAATACCCTCCTCTCCCTTTTCTTTTAAAACCAATGGATGATGTATGGGTCCCCTCCCCTTCCCCTCGT\n>MOOB01000036.1/196011-195921 Penicillium nalgiovense strain IBT 13039 PENNAL_contig0036, whole genome shotgun sequence. \nACTACGTGATGATCAATTTTGAATTTGCAATCCTGACAACCACCTATCATATGTGAGGTTGTGTGTTGACTCTTCTACACTTGATCTGACC\n>CP002770.1/704081-707325 Desulfotomaculum kuznetsovii DSM 6115, complete genome. \nGGTCAAGCTGGTAAGGGCATACGGTGGATGCCTGGGCGCTTTGGGCCGATGAAGGACGTGGCAAGCTGCGAAAAGCCACGGGGAGCCGCAAGCAGGCGTAGATCCGTGGATCTCCGAATGGGGCAACCCGGCGGGGGTGAACCCCCGTCATCCCGTACTGAACACATAGGTACGGGAGGGGCACCCGGGGAACTGAAACATCTTAGTACCCGGAGGAAAAGAAAGCAAAAGCGATCCCCGTAGTAGCGGCGAGCGAAAAGGGGACAGCCTAAACCCGGCACTCAACTGAGTGTTTATGTTATGCATACAACAAGCTGATGCATCCGGGAAGTGAAAGTTGGGGTAAGAGCATAGCGTAAACACCGAGTTGAGTGCCGGGGGTTGCGGGACTCCCGTTGACGTACTGCGGAACTTAGCCGAAGCGGGCTGGAAAGCCCCGCCGCAGAAGGTAAAAGCCCTGTAGGCGAAAAGGGAAGCAGTGCGGGGAGGATCCCAAGTACCGCGGGGCACGTGGAATCCTGCGGGAATCAGGGAGGACCACCTTCCAAGGCTAAATACCCAAAGCGACCGATAGTGGACCAGTACCGTGAGGGAAAGGTGAAAAGCACCCCGGGAGGGGAGTGAAATAGGACCTGAAACCGTATGCCTACAAGCAGTCGGAGCCCAGCACTCAACTGGGTGCTTACCTTAGGCTTTAGAGGGGCTGATACATTCCGGGAGGGAAGGGCCTGTTTAAGGCAACCGTAAGCACCGAGTTGAGTGCTGGGTGACGGCGTACTTTTTGTAGAACGGACCGGCGAGTTACGTTCAGCGGGCGAGGTTAAGGCTGGGAAGGCCGGAGCCGTAGCGAAAGCGAGTCTGAAGAGGGCGATAAGTCCGCTGGAGTAGACCCGAAACCGGGTGAGCTACCCATGTCCAGAGTGAAGCGTAAGTAAAGTTACGTGGAGGCTCGAACCAACCGTCGTTGAAAAGGCGGTGGATGAGGTGTGGGTAGGGGTGAAATGCCAATCGAACCCGGAGATAGCTGGTTCTCCCCGAAATAGCTTTAGGGCTAGCCTCATACGAGAGTACCGGAGGTAGAGCACTGACTGGGCTAGGGGC
CTTCGCGGGTTACCGAACCCAATCAAACTACGAATGCCGGTTACTTGATGTATGGGAGTCAGACTACGAGTGCTAAGATCCGTAGTCGAGAGGGGAACAGCCCGGACCGCCGGCTAAGGTCCCGAAGCGGTGCTAAGTGGGGAAGGATGTGGGGCTGCGAAGACAACCAGGATGTTGGCTTAGAAGCAGCCATCATTCAAAGAGTGCGTAATAGCTCACTGGTCAAGTGGCCCTGCGCCGAAAATGAAACGGGGCTCAAGCACCGCACCGAAGCCGCGGATCTGAGAGGTGAGAGGTGAGAGGTTGGAAGTGGGAATAACGATTCTCACATCTCACTTCTCACATCTCACCTCTCAGGTGGTAGGGGAGCGTTCCCACCGGGTAGAAGTCACACTGGGAGGTGTGGTGGACTGGTGGGAAGTGAGAATGCCGGTATAAGTAAGCGAAAAGGCAGGTGAGAATCCTGCCCGCCGAAAGCCTAAGGGTTCCTGGGGAAGGCTCGTCCGCCCAGGGTAAGCCGGGGCCTAAGCCGAGGCCGAAAGGCGTAGGTGATGGGGAATCGGTTGACAATCCGATGCCACCGGTAGGCCGATTGAGGATGGGGTGACGCAGGAGGGTAGGCCAAGCGCGCGGCTGGAAAGGCGCGTCCAAGCCGGTAGGGTGTGGGGCAGGCAAATCCGTCCCACGGTAAGCCCGAGAGGTGATGGGGAGGGAAATAAGAGTACCGAAGTGGCTGAACCCAAACTGCCGAGAAAAACCTCTAACGAGGAATACCGGTGCCCGTACCGCAAACCGACACAGGTAGGCGAGGAGAGAATCCTCAGGCGCGCGAGAGAACCCTCGTTAAGGAACTCGGCAAACTGACCCCGTAACTTCGGGAGAAGGGGTGCCCCGGTAGCGTGAAGGTATGAACTGCTGGAGCGCGAGGGGGCCGCAGAGAAGAGGCCCAAGCGACTGTTTACCAAAAACACAGGTCCCTGCGAAATCGAAAGATGAAGTATAGGGGCTGACGCCTGCCCGGTGCTGGAAGGTTAAGGGGAAGGGTTATCCGAGAGGAGAAGCTCTGAACCGAAGCCCCAGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCCGCACGAAAGGCGTAACGACTTGGGCGCTGTCTCAACGAGGGGCTCGGCGAACTTGTAGTACCCGTGAAGATGCGGGTTACCTGCGACGGGACAGAAAGACCCCGTGGAGCTTTACTGCAGCCTGACATTGGACTTCGGTATTGCATGTACAGGATAGGTGGGAGGCAGGGAAGCCGGGGCGCCAGCCCTGGTGGAGCCGACCTTGGGATACCACCCTTGTGGTATTGGAGTTCTAACAGGGTACCGTGGAGCCGGTACATGGACAGTGTCAGGTGGGCAGTTTGACTGGGGCGGTCGCCTCCTAAAAGGTAACGGAGGCGCCCAAAGGTTCCCTCAGCGCGGTTGGAAATCGCGCGTAAGAGTGCAAAGGCAGAAGGGAGCTTGACAGCGAGACTGACTGGTCGAGCTGGGACGAAAGTCGGGCTTAGTGATCCGGCGGTAGCGAGTGGAAGCGCCGTCGCTCAACGGATAAAAGCTACCCCGGGGATAACAGGCTTATCTCCCCCAAGAGTTCACATCGACGGGGAGGTTTGGCACCTCGATGTCGGCTCATCGCATCCTGGGGCTGGAGTAGGTCCCAAGGGTTGGGCTGTTCGCCCATTAAAGCGGTACGTGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCCCTATCCGTCGCAGGCGCAGGAAACTTGAGAGGAGCTGTCCCTAGTACGAGAGGACCGGGATGGACAGACCGCTGGCGTACCAGTTGTCCCGCCAGGGGCAGCGCTGGGTACCCAAGTCTGGTGGGGATAAGCGCTGAAAGCATCTAAGCGCGAAGCCCTCCTCAAGATAAGGTTTCCCACCCGGCACTCAACTGAGCTTGTCAG
GCCAATCCACTTTAAGGAGAGATTGGCACGCTCAGTTGAGTGCCGGGGTAAGACCCCTGGAAGACTACCAGGTAGATAGGCCGGGCGTGTAAGCCGGGTAACCGGTTGAGCGGACCGGTACTAATAGGTCGAGGGCTTGACCAG\n>CM002293.1/9210050-9209896 Phaseolus vulgaris cultivar G19833 chromosome 6, whole genome shotgun sequence. \nATACTTACCTAGATAGGTCAATGGATTATCAAGAAGATTCATGGTTTATGAAAGTAACTTTCATTGCAATTTGGATGGATGCGTTTCTGATTTTGTCAATCTTCATATAATTTGTGACCGATGAAGTCTGAACTTTTGAAAGTTTCACTTTCATT\n>FP929055.1/3038167-3038356 Ruminococcus torques L2-14 draft genome. \nTGATTATGAATGATCAGAGGAACGACGTGGGAAATCTGGACTGGTGAAAAGGGAAACAGGTGAGAATCCTGTACGAACTCGTCACCGTATTTCGTGAGCTTGTGTTTTGAGACCACTGGGAGACCGGGAAGGTGAAGCAGAAGCATTTGAACGATCAGCCGGGAGACCTGCCTTTCGCAGTACAGGAATG\n>ALWZ042737980.1/1504-1133 Picea glauca, whole genome shotgun sequence. \nTGAAGCTTTACTATTTCCTGGGAATAAATATGGATTCTTCTTTACATTTTTGGTGGACAGCAAAGAAGTTCCTTTAATGTGGGGCTTGAGCCATAACTGAGATACAGCTCTAGCAGAGTTAGAATTCCAACCTGTATTAGGACCCATGTTCCAAGGGGATGATCTTGGGTAAATAATTTCTATGGGGCGTAAGACTCAAAAGGTAATGGAGGCATGCAAAGGTTTCTTTGGGCTGCGCAGAAATTGACCCTTGAATGTAAAGCAAGAGCTAGCTTGACTGAAGAACCCACCTGTCAAGCAGAAGCAAAAATTGGCCTTAGTGGTTCAGCAGGATTGAGCAGAAGTGTCATTGCTCAATGGTAGAAGGTACTC\n>CM001000.2/104264790-104264683 Mus musculus chromosome 7, GRC primary reference assembly. \nGTGTTCTTGCTCAGGCATCATATGTGCCCAAAGTAGAATGATCAGGGAATGTTAATATGGCCCCTGCTCATGGATGACATGCGAGTTTATGAAGCATTCCATATTTTT\n>ACTA01010209.1/17005-16720 Ailuropoda melanoleuca scaffold917_80, whole genome shotgun sequence. \nGAGTGTGTTGAGGATCTTTCCACATCAGTTACCCTCCTAATGGCTGGAGTTGACTCGGCTGATGGGGATGGCTAAGTGGTGTCCCCTTCCTTTTTCACTACTCCATGGACATCCCTCCTAAAACGAAGTGCTTTTGGATGCAGAGGACAGCCCCATCGAAGTTGTTTTGTCAAGAGAAATTGATAGCTACACTCTGCTATTTGAATCTTCAAATTTAACACTTGCTTTTCTGTGCTTTCTCTTTGTTTCTCTTAAAAATATTATATATGATAACACATTTGGAAAG\n>CM001415.1/8836720-8836132 Lepisosteus oculatus linkage group LG12, whole genome shotgun sequence. 
\nAAGGAGCAATGACACAAGAGTTCCTGTCACAAGTCAGACTCGGTCCAGGGATAATGCTGGGTGGGGAGGGCTAGTATTAAGGACAGTGGGCTGCACAGGGCGACATCACTTTTTGATCCTTTGATCCTTCCTAGAACTGTGAAGTAGGATTCACTTAGTATTGGATTGTTCACCCTCTAAATGGGAATGTGAGCTGGGTTAGACACTCATGAGACAGATTAACTTTACCTCATGGCTTTACCGATGATGCGATGTTGCGATTGCTGTTGTGATCTGCTGCTCTTTATGAGAGGAACCACAGGTTCAGACACTTGATGTCTGTCTGTGCTTGGCTGAGGAGCCAATGACACAGAACCCACAATTTGTGGGATTATGGTTGGATACCTTCATGACAACCCCAACGCCTTAAAAGGTGTAAATGTTCTGCGACACAGAGTTACAAAGCAGATTAAGATTTCACAGCAAATCACCAAAGAGACACCTTCTTCACCGTTCTAGAAAATCCTTTTCTACATTAAAGTCCCTGAAATAAGGAAGATCCTTGAAGGTGCTAATTCTTGCACAACAGACACTAGTGCAGTCAATAAGG\n>FR799005.1/397220-397284 Leishmania braziliensis MHOM/BR/75/M2904 complete genome, chromosome 30 \nCCGCTGCATCAGTACAGCGACATCATCTTTTCGAGTGGTGATGCCTGCTGGCGATGTCAGCAAGA\n>AUSU01007329.1/5457-5644 Genlisea aurea contig_12937, whole genome shotgun sequence. \nTAGGGGTATAGAGAGCTTTCTTCAGTTCAACCACAGGAGAATTAGGATTCAATCTGCTGCCGATTCATTTAAACAAACGATGTACGGATTTATCGAGTACTTCGATTGAACGAATGATGCGGGAGTCAAGTTGAATTCCATTTGCTTTTCTTGTGTTTGGACTGAAGGGAGCTCCCTTTTTTCTTCTT\n>GL871722.1/1-494 Dictyostelium purpureum unplaced genomic scaffold DICPUscaffold_800, whole genome shotgun sequence. \nCTCTGGGGTTAGAGTGCGGCAACGTATCTTTGCTTCAAGGAGTGTGTAGTCTGACTTGATAGGTACGTTAACAAAAAACTTCTTAGAGGGACTACCTGCCTCAAGCAGGCGGAAGTCCGAGGCAATAACAGGTCTGTGATGCCCTTAGATACCTTGGGCCGCACGCGCGCTACAATGCAGATAGCAAAAAGGTTCCTGGTCTGGAAAGATTGGGTAATCAATTGAATTTTCTGCGTAACTGGGATTGATCTTTGTAATTATTGATCATCAACGAGGAATTCCTTGTAAGCGTAAGTCATTACCTTATGCTGAATATGTCCCTGCCCTTTGTACACACCGCCCGTCGCTCCTACCGATCGAATGATACGGTAAAGTTAACGGATAGTTTTTTTGTGGCAACACAATTAAAATTAAAAGTTATTTAAATCTCATTGTTTAGAGGAAGGAGAAGTCGTAACAAGGTATCCGTAGGTGAACCTGCGGATGGATCATTT\n>CM002821.1/68112919-68113024 Capsicum annuum cultivar Zunla-1 chromosome 10, whole genome shotgun sequence \nGACCACGTGATTAGGGAATTGATTAATTTATCATTCAATCATTGCCATACTTCATACAAAGGTTCACCATTGAGTTGGCAGAACTTTATTATTCAATCTCTAGGTT\n>AYYE01001153.1/1824-2049 Tannerella sp. oral taxon BU063 isolate Cell 1/3 contig_2519917771, whole genome shotgun sequence. 
\nATTTTTGCCGCCGTTTTCGGTGACGCCAGGTCGGACGGTCCCGTCCGCGACGTGAAAAGGGAATCCAGTGAAAGACTGGAACAGTGCCCGCTACTGTAACACCCCACCTATCGAACGAAGGAGAGCACCCGCAAGACGTGCCACTGCCGCCACTGAGGCGGTGGGAAGGCCCACAGCCCTCCTTCAGGGTGAAGTCAGGAAACCTGCCGGAAACAACAACGTATAC\n>AZNC01074805.1/442-855 Glycine soja cultivar W05 scaffold3126_15, whole genome shotgun sequence. \nGACTCTGATGCTATATCAATAAATGTCCATATAGGAAATGGCTATCCTAATGGCTCGAGTGGCATAAACGAATGAGAGGTAACAAAGGCTTGCAAGGGTTTCCTCGGATCAGATGGAGATTAGGCCTTTAGTGTAAAGGCAAAACAAAGTTTGATTGTAAGACCCACCCATCGAGTAAAGATGGAAGTCAATCTTAGTGATCTGATGGTGCCAAGTAGAAGGATTGTCCCTCAATGGGCTATAGGGATAACAGACTCATCTTCCCCCAAGAGTTCAGATCGACAAGAAGGTTTGGCACCTCAATGTCGGGTCTTCGACATTTGAGGTTGTAGTATGTTCAAAGGATTAAGTTGTTCGCCCATTAAAGCGGTATATGGAAAATGCAAGTTCTGTAAGGCACATAAGATTGTGTTA\n>MCGE01000002.1/764806-764528 Absidia repens strain NRRL 1336 BCR42scaffold_2, whole genome shotgun sequence. \nAGCAACGAAGAAGATCTGCATGTTTGACGCACCACACACACGGGGGTTTTATACTCATTATAAATTGCGTTAGGGAAGTTCTCCAGACATGTGTACCTGTAATGGGTTATTGAAAGCAGCCTTTCTTAAGGTTGTGGTATTCAATTATGCCAAATTATCAGCTAAGATAGCTGTGGTATGGTTGGGTATCCAATAGTTCTTGTCATAGGAATAGGTATTGCGGATCTTGGTAAAATTTATTTTATCATGAACTCAATGGAGGCTACTCTCTTTTGTTGC\n>ASAF01079751.1/2035-2138 Nicotiana sylvestris Nsyl_contig79751, whole genome shotgun sequence. \nTACGCAGGAGAGATGATGCTGGATAATGGACCATCCCTGCTTAGCTATCTCAAGAGATTGGAGGGAGCTTTGATTATTTAGCCAGCATCATACTCCTGCATATT\n>JXLN01013749.1/1932-192 Sarcoptes scabiei Contig13748, whole genome shotgun sequence. 
\nTATCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTCTAAGTACATACCGCATTAAGGTGAAACCGCGAATGGCTCATTAAATCAGTTATGATCTATTGGATGTTGACCAATTACATGGATAACTGTGGTAATTCTAGAGCTAATACATGCCGAAAAGCTCCATCGCAAGGTGGGGTGCATTTATTAGACCAAGACCAAAAGGTGGAAACACCTTGTTGTGGTGACTCTGAATAACTGCAGCTGATCGCATGGCCTCGTGCCGGCGACATATCCTTCGAGTGTCTGCCTTATCAACTTTCGATGGTAGGTTATATGCCTACCATGGTTGTAACGGGTAACGGGGAATCAGGGTTCGATTCCGGAGAGGGAGCCTGAGAGATGGCTACCACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCTTGGAACAAGGAGGTAGTGACGAAAAATAACAATACGGGCTTCGCTTACGCGTTCTCGTAATTGGAATGAGCACAGTTTAAATCCTTTAGCGAGGATCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGGATCTCAGCCCAAGTGCATTGGTCCATCATGACGATGGTTACTGGTGTGCTGGGCACTTTACCGTTCACGTGCTATGGTGTTCTTAACCGGGCGTCATAGTCGTACGGTAGTTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCATCATCGCCTGAATACTGTTGCATGGAATAATAGAATAGGACCTTGGTTCTGTTCTGTTGGTCTTCGGATCCGAGGTAATGATTAAGAGGGACGGACGGGGACATTAGTACTGCGGCGATAGAGGTGAAATTCTTGGACCGCCGCATGACTAACCAAAGCGAAAGCATTTGTCAAGAACGTTTTCATTAATCAAGAACGAAAGTTAGAGGTTCGAAGGCGATCAGATACCGCCCTAGTTCTAACCATAAACGATGCCAACTAGCAATCAGCCAGAGTTCGTTTATGACTCGGCTGGCGGCTTCCGGGAAACCAAAGTTTTTCGGTTCCAGGGGAAGTATGGTTGCAAAGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTNNNNTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGATAACGAACGAGACTCTAGCCTACTAAATAGCAATCGGAATTCGTTTCGACTTCCGATCCAAGCTTCTTAGAGGGACAAACGGCGTTTCAGCCGTATGAAAAAGAGCAATAACAGGTCTGTGATGCCCTTAGATGTCCGGGGCCGCACGCGCGCTACACTGAAAAGATCAGCGTGCATATGTTACCTACTCCGAAAGGAGCGGGCAACCCAGTGAAACTTTTTCGTGATTGGGATTGGGGATTGTAATTATTGTCCATGAACGAGGAATTCCCAGTAAGCACAAGTCATCAGCTTGTGTTGATTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTACTACCGATTGGATGTTTTAGTGAGGTCTTCGGACTGGCCAACGTAGCCATCCTCGTGGTGGCCATGTTGTGCGGGAAAGATGACCAAACTTGAACATCTAGAGGAAGTAAAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTA\n>CM001648.1/54674393-54674536 Nomascus leucogenys chromosome 2, whole genome shotgun sequence. 
\nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGTAGTATCTGTTCTTATCAGTTTAATCAAGAAATGAAGATGGAATATTATTTTACAATGTCTTGATAAGTTGGGGAGCCTCATTATGAAAATATGGGAATCATAGAATCTCT\n>CP001720.1/2579904-2579665 Desulfotomaculum acetoxidans DSM 771, complete genome. \nTCACAAGTGATGATAGGGAAGAGTAAACCTGTACTGTTTACAGAGAGAAGCCGCCTTGGTTGAAAGCGTCTTTAAAAGAAGGCAGGTTAAAAACCACCCTTGAACTGCATAGCCGAAAATTTTAATCCTCAGGGGATTATAGATCAGTAAGCTTAGCCGGCGGCAAACGTTAATTGCTCTGAAGTGAGGAAATTTTATTTCCTAATTTGGGTGGAACCACGGAATAAGACCGTCCCTATT\n>JMCC02000032.1/46273-46035 Enhygromyxa salina strain DSM 15201 ES-Contig_32, whole genome shotgun sequence. \nACTCCGAGGTCGAGGCTAACAATGGCCCTCCGGCGCGCGAGCGCCGGCTGAAAATCGGGTGAATTGCCAGAAACTCCGGGGACGGACAACCGGCAGCCAAGGTCGAGACGGCGGTGCAGCGATGCCCAAGGGCTCGGCAAGGTTCAGAGACTAGGGCCCGAGCGAAAGCGGTGATGGCCCCACGAGCGCCCGACATCTCCCGCGGGAGATGATGAGATAGTCCGTACTGCCGCGATAAT\n>LPNI01000102.1/691-2685 Bacterium P201 scaffold_101, whole genome shotgun sequence. \nGCGAAAGAAAGTTAGGGCGTCTGGTGGATGCCTTGGCTCTCGGAGGCGATGAAGGACGTGATAAGCTGCGATAAGCCATGGGTAGGTGCAAATAACCTTTGATCCATGGATTTCCGAATGGGACAACCCAGCCGGCTGAAGGCCGGTTATCTCTGCCTATGCAGAGAGGCAAACCTAGGGAACTGAAACATCTTAGTACCTAGAGGAAGAGAAAATAAACAATGATTCCCCCAGTAGTGGCGAGCGACCGGGGAAGAGCCCAAACCGCATGTGTAGCAATGCATATACGGGGTAGTAGGACCACGTCGTGGCATGCTGATCGTGAGAAGAATGTTCTGGAAAGTTCAATCATAGAAGGTGACAATCCTGTAGTCGAAGCGTGATGCAGCCTAGTGGCATCCTGAGTAACGCGGGGCACGAGTAATCCTGCGCGAATCCGCCGGGACCATCCGGTAAGGCTAAATACTCCCGAGAGACCGATAGCGAACCAGTACCGTGAGGGAAAGGTGAAAAGCACCCCGACGAGGGGAGTGAAAGAGTACCTGAAACCAGTCGCCTACAAGCGGTCGGAGCATGTTTATCATGTGACGGCGTGCCTTTTGCATAATGAACCTACGAGTCACCATCACAGGCGAGGTTAAGTCACTAAGTGACGCAACCGCAGTGAAAGCGAGGCTGAAGAGGCCGTTTAGTCTGTGGGGGTGGACGCGAAACCGAGTGATCTACACATGGTCAGGGTGAAGTCCCGGTAACACGGTATGGAGGCCCGCACCAATAAGCGTTGAAAAGCTTCTGGATGAACTGTGTGTAGGAGTGAAAGGCCAATCAAACTCGGAGATAGCTCGTACTCCCCGAAAGGCATTTAGGTGCCGCGTGCTGTGTTCACCCTGTGAGGTAGAGCGACCGATAGGTCAAGAGGGCTTCACCGCCTATCGCGACCTGACGAACTCCGAATGCACAGGGTCCGTAGCAGTGCAGTAAGGGTGCGGGTGCTAAGGTCCGTGCCCGAGAGGAGAAGAATCCAGACCGCCGTCTAAGGTCCCGGAGTTCTGCCTGAGTTAGTCTAACGAAGTCTGGTCTCGATGA
CAGCTAGGATGTTGGCTTGGAAGCAGCCATTCATTCAAAGAGTGCGTAACAGCTCACTAGTCGAGAGACCGGGCGTGGATAATAATCGGGTATAAGGCAGACACCGAAGGCGCGGGATAGCAAATAATAAAAGTATCGGTAGGGGAGCATTCCATCTGCGCCGAAGCAGACCGGTGACGATCTGTGGAGCGGATGGAAAAGCAAATGTAGGTATAAGTAACGATAAGGGGCGTGAGATCCGCCCCCGCCGAAAGACTAAGGTTTCCCGGGCGATGTCAATCAGCCCGGGGTCAGTCGGGTCCTAAGGCTCAGCCGAACGGCGAGGCCGATGGCTGACACGGTTAATATTCCGTGACTTCCCATTGGGGCGATGTGGTGACGGAGCAGTGGAACTGCCGCGCGGCGACGGATGTCCGCGTTAAAGGGTGTAGGCGTTGATTGGGGCAGGCAAATCCACCCCAAGAGCTGAAACCTGAAAGTACGGGACTCTCTTCGGAGAGACCTGACAGAGCAGGTAATCATACTCCCGAGAAAAACCGCTAAGCTTAACCTTTTGGGAACCCGTACCGCAAACGGACACACGTAGTCGGGTAGAATATACTAAGGCGTTGAGAGATTCGTGGCTAAGGAACTAGGCAAACTGACCCTGTAACTTCGGGATAAAGGGTCCTCGCTTATAGCGAGGCGCAGAGAATAGGTCCAGGCAACTGTTTAACAAAAACACAGGGCTGTGCAAACTCGAAAGATGATGTATACAGCCTGACACCTGCCCGGTGCCGGAAGGTTAAGAGGAGACGTCAGCCTTAAGGTGAAGCGTTGAATTGAAGCCCCGGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGG\n>LXWF01000040.1/121949-121803 Rothia nasimurium strain PT-32 scaffold4_size309601, whole genome shotgun sequence. \nACAAAACAAAAATTATCAGGCAGAAGCGGGGGACCCACCTTTCGGGCTCACCACCTAGGAGCCCTTGGGGTTAAGTTGCAGGCAACTGTGACCGAGTGACTTCATACTCGAACCCGACAGCTCACCTCGTTCGGCAATGGAGGAAAA\n>AFTD01062031.1/43354-43570 Cricetulus griseus cell line CHO-K1, whole genome shotgun sequence. \nAATCAGTTGTATGTATGTACTCTTTTGCATGCATGCACACGCGTGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCCTTTACAAAACTTGGATTAACAAAATCTTTTATGTATGTTGCTTGTTTGGTTTGGTGTTTGTTGAGACAGGGT\n>CM000665.2/44861892-44861973 Homo sapiens chromosome 3, GRCh38 reference primary assembly. \nCAGCGGGTGCCAGGCACGGTGTCAGCAGGCAACATGGCCGAGAGGCCGGGGCCTCCGGGCGGCGCCGTGTCCGCGACCGCGT\n>GL010031.1/37115110-37115156 Loxodonta africana unplaced genomic scaffold scaffold_4, whole genome shotgun sequence. 
\nAAACAGGCTCTCTAACAGAGCCACAGAATGTTAAAAAAAAAAAAAAA\n>FQXS01000031.1/44397-44023 Desulfofustis glycolicus DSM 9705 genome assembly, contig: EJ46DRAFT_scaffold00031.31 \nCGCCGCCGGATAACAGGCGCATCGTATCTGGTTATTAAGAGGTCCGGTCGAAACATCACATGATGCCTCGGCTCTACCACAAAAGGGGTTCACGAAAGAACCCTGCAAAAAGGAGTAATTCAACATGGCTGAAGGCACAGTAAAGTGGTTTAACGATGCGAAAGGTTTTGGTTTTATCGAGCAGGATGGCGGCAAGGATGTGTTCGTGCACCATTCGGCCATCCAGGCTCAGGGCTTCAAGTCCCTGACCGAGGGTGCTCGCGTATCCTTTGACGTTGTCGACGGCCCGAAAGGACCGGCGGCAGCCAACGTCGTCCAGCTCTAAGAGCCGGATACGGTTGTTGTGGACCCCGCACCCTGGGTGCGGGGTTTTCT\n>LCFB01000050.1/5945-6029 Microgenomates (Gottesmanbacteria) bacterium GW2011_GWA1_43_11 UV59_C0050, whole genome shotgun sequence. \nGCCGAGGTGATGAAATGGTAGACATGCAGGGCTTAGGACCCTGTGAGCCTTAAAACTCGTAGAGGTTCAAGTCCTCTCCTCGGCA\n>AFOY02000015.1/191187-190961 Pseudomonas fluorescens HK44 Contig15, whole genome shotgun sequence. \nCCTACACGCCTTGTTACGGGTGCCCTTCACAGGGTGAAACGGGAAACCGGTGAATCATGTGCTTTACTCAAAAGCCATGTCAGTCCGGTGCTGCCCCCGCAACGGTAAGCGAGCGAAGAATCAGATCCACTGTGCCAGAAGTTCGGCATGGGAAGGCGATTCTTGCAGGTTCGGCGAATGCCAGCCCCTCGTGAGCCCGGAGACCGGCCCGCAACACATAGTGCCTT\n>AAAB01000498.1/1506-345 Anopheles gambiae str. PEST whole genome shotgun sequencing project, whole genome shotgun sequence. 
\nTGGCGGCGGTTCGCCTGCGCGCGCCCAATGCGCCGTGTTTCTCGCTCAGCGTCCAGTGTGTCGCTGGGTGGTGCCGCCGGGGAGACTGCATCGTAGCATCGTCGTGTGTAGCGTGTTACCCGCTTGTCCGACCGTGAGCCGTGGCCCGCAAGGGTACAAGCTTGCGTACGTCGGTGCATTCGTGGTGCACTGCTTCTGCGCGGTCGATCGTTTATGATGTCACGTTTGCCCCCGGTTCCGCGCGCCGCCCGGCTCGAAGACTCCTGGACAGGTCCTTTCGGTCCACGTCATGGACAGTGCCAGGTGCGGAGTTTGACTGGGGCGGTACATCTCCAAAACGATAACGGAGGTGTCCAAAGGTCAGCTCAGTGTGGACAGAAACCACACGCTGAGCATAAGGACAAAAGCTGGCTTGATCCCAACGTTCAGTACACTTCGGGACAGCGAAAGCTTGGCCTTACGATCCTTTTGGTTATAACGAGTTTTTAGCAAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCCGCCAAGCGTTCATAGCGACGTGGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAAAATTCACCAAGCGTAGGATTGTTCACCCTTTCAAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGGTGTGTGCTTATAGTCGCTATCTTAACGGAATTCCTGTGCAGTACGAGAGGAACCACAGGTACGGACCACTGGCTCATACTAGTCCGACCGGACTTTGGTATGACGCTACGTCCGCTGGATTATGCCTGAACGCCTCTAAGGTCGTAGCCAATCCGAGCTGATAGCGCTTCTCAAACCCATTAGGTGTTCGGAAGCTAGCGGGCCTAACAACCCTCTGAGATCCGTTGGAGTCTGCGTCTGCAGCCCGGCGTCTCATCCCGCTATACCTAGGCCGCAACGAGTGGAGTTCGCTGCACGTGTTAGTACCGTAACTGGGAACGCCGTTGGCTTGAGCTCTGCCCAACGTGGATATACCTAGTTTCGACACCTATCAACCGCCCGCAAACGACGGGACTTCAGGCTGGGAGCTGCGAGTTGTAGAGATGCGTTCGCATCGATCCTCTCAGGCGACCCATGCTTGGTGGTTTGTC\n>URS0000D6AEAC_12908/1-95 unclassified sequences Rhodo-rpoB RNA \nGGGTCGGAGGGCGGCCAGTGGGACGGCCGCCTCGGATGGACCCCTCGACGTCCGCTCTCATGGGGGAAGGCGCCGCGGCCCCGGCGGCGCCCGCC\n>CYSP01000003.1/255745-256067 Propionispora sp. 2/2-37 isolate 2/2-37 genome assembly, contig: 2/2_contig3 \nGTATACGAGGGAACGCTGTACATTGTGCAGAGGAAAGTCCGGACAGGCACGGGCTGCGATGCCCGTAGTGATTGCGCGTGACCTAAGAAGTCACGGAAGGAAGCTCATTCCTTACGGCGGCAAAACCGACTCTGTCTGAGTTGGCGGTAGCCTGAAAGTGCCACAGAAACGAAACGTTCCGGCGACGGAACGATGCAAGGGTAAACCCCGCAAGCCTGAAACTCAAATTACGGTAGAGGAACCCTAGGAAGGGAATAAAACCAGATTAGGGCGCATGAAACTGCGAGATAAATGTTTCCTAAAACAGAATCCGGCTTACGGTA\n>KI669466.1/623363-623809 Kwoniella mangroviensis CBS 10435 unplaced genomic scaffold supercont2.9, whole genome shotgun sequence. 
\nAGTCCAATCTCATCTCACACTCGCGAGCGGGCCAAGGTCCTGGAATTTCAACCCCCCTTTCATCTTATTTCCTTATGGAAGAAGATGTCTGACCGATCTTAGCGGATCCTTGAGTTAATTTCAAACCAAGTAATTCCCGACCAGAAATGCGTCCTCTCCATCTTATCCGTAAAGGAAACCCATAGAAGCGTTTGACGTGGAGGGTATGGATGGAGATATTTTGGACTTGGTATGGGAATGGTGAGGTAGCCTTATATCGATGTTCTCTATCCTCGATGCCTGGATAAAGAGTCTCTGAAATCAAAGAGAAGTGTTTTGGTCATAGACCAAACCCCGATATACATAAAAAGGCTTTAGTGCAATTTGGTGACGTCCTCATACTCAAAAACCTTCTTTGATCTCAAGTTGAAGAAGGGAGGATAACTCGATCAGGACTACTCTGGGACT\n>LT629734.1/2109114-2109055 Agrococcus carbonis strain DSM 22965 genome assembly, chromosome: I \nGCCGCCCGTCCTGACACAACGGATCGTCCGGCACGTGCCTGCCGGTGGAAGGAAAGAGAC\n>X51710.1/1-45 Dengue-2 virus RNA for capsid protein, partial, from a case of dengue fever (M3) \nATGAATAACCAACGAAAAAATGCGAGAAAAACGCCTTTCAATATG\n>JH835393.1/4707706-4707998 Erinaceus europaeus unplaced genomic scaffold scaffold00105, whole genome shotgun sequence \nGGATGTGAGGGTGATCTGACTACGAAATCTGTCACCCCATTGATCACCAGGGTAGATTCGGCTGATCTGGCTGGCTAGGCGGATATCCCCTTCCTCCCTCACCACTCCATGTGCATCCCTCCTGAAGCTGTGCACCGGTCTTCAGTCGAGGGTATAGGAGTAGCTGCGCCCCCCTGCTAGAACCTCCAAACAAGCTCTCAAGAAAGAGCAGAGCCCTACTCAGCTCTGGCTTATGGTGGTGCTGGGGATTGAACCTGGGACTTCAGAGCCTCAGGCATGAGAATTCTTTGCAT\n>AWUE01002803.1/746-1 Corchorus olitorius cultivar O-4 contig02805, whole genome shotgun sequence. 
\nAGCTTACCGACTCAAAGCTTTAAGGCCTTAAAGCCCGTTCGCCCTGGATGATTCTGAAAAAATTGAGGATTTTGGTCTTGAAAAAGAGTAGTCGATGATTAACGTTGGATGATTGGAGTCGCGCGAGTACCGTGTGGAAGGGTGAAAAGAACCCCCGTCGGGGAGTGAAATAGAACATGAAACCGTAAGCTACCAAGCAGTGGGAGGAGCCCAGGGCTCTGACCGCGTGCCTCTTGAAGAATGAGCCGGCGACTCATAGGCAGTGGCTTGGTTAAGGGAACCCACCGGAGCCGTAGCGAAAGCGAGTCTTCATAGGGCAATTGTCACTGCTTATGGACCCGAACCTGGGTGATCTATCCATGACCAGGATGAAGCTTGGGTGAAACTAAGTGGAGGTCCGAACCGACTGATGTTGAAGAATCAGCGGATGAGTTGTGGTTAGGGGTGAAATGCCACTCGAACCCAGAGCTAGCTGGTTCTCCCCGAAATGCGTTGAGGCGCAGCAGTTGACTGGACATCTAGGGGTAAAGCACTCTTTCGGTGCGGGCCGCGAGAGCGGTACCAAATCAAGGCAAACTCTGAATACTAGATATGACCTCAAAATAACAGGGGTCGAGGTCGGCCAGTGAGACGATGGGGGATAAGCTTCATCGTCGAGAGGGAAACGGCCCGGATCACCGGCTAAGGCCCCTAAATGACCGCTCAGTGATAAGATAAAGGAGGTAGGGGCAGAGACAGCCAGGAGG\n>AZST01000551.1/9313-8979 Rhizoctonia solani 123E scf_551, whole genome shotgun sequence. \nCTCTTGCCATTGTTGTGGGCAGATATAGTGAATGTGGGCGTCGACCCCCCCAGCTGTGATGATCAGTTTCTCGCCTGCGATCACTTCCGTGTTGGCTCCAGCTACCAAGTCAGGGTCGACTCCGTCCATAATGTCAGGATTCCCCGCTTTTCCAATTCCAACTATCTTCCCGTGTCGTATTCCAATATCAGCCTATGCACGTCGTGAGTATTGACGCAGGGAAAACTGAGCGATGCGAATACCTTGTAAATTCCGGACCAGTCGATGATGAGTGCATTGGTGATTAAGAGATCAAGGACCTCGTATCGCTCTCCGCAAGCCCGGCCCTCTCCGTG\n>LGUE01000001.1/1373798-1373578 Bacillus marisflavi strain JCM 11544 scaffold1, whole genome shotgun sequence. \nCAAAAGGCTGTGACAGGGAGAGTACGTTTCAGCAATAACCTTTATCAGCGAATCGGGGGCGGTGCAAGCCCGGTAGGGAAATGAAGCGGAAGATCACCCTTGAGCCCTGTCTGTGAACAAATGCTAGCAGACGGCGACTGATCCATGTTACGGATTTTCGAGTGAGGGCAATTATGCCCTTATGAGGGTGGTACCGCGGGAAAAGCTTTCTCGTCCCTTTC\n>AEDQ01000029.1/68978-69146 Atopobium vaginae PB189-T1-4 contig00020, whole genome shotgun sequence. \nACGTAGTTTCAGGGCGGGGCGAACATCCCCACTGGCGGTAAATAAACGCACTAGCTGCACTAGCTGTACTAACTGTAATAAACGCGTTTACAAGCCCGCGCGCCACACTGTGGCTGATTTGGTGAAAGTCCAAAGCCAACGGTTATAGTCCGGAAGAAAGAAACGAGGA\n>JMFP01072321.1/1087-1 Pygoscelis adeliae contig72321, whole genome shotgun sequence. 
\nAACGCACGCTGGAGTAGAGGAAACAAGAAAGATGCAAGGAGAATTGGAGGAAGAGACTAAGAAGCAAGGAGTAGCAGAAAGAAACCATTATGCACTGACCCCAGCCTCCTGCACATTGCCTCACCAAGGGGACTGAGTGTGATGTGCGGTGTTGGCCTGAAGTCAAGCCTGGGAAAGAGGAGGAAATGCATTTCCCTAAGTGTTTGTCTAGTTATCTTCGTGGGAGTTTGGGTTTTTTTTTCTCAATACCCAAATAGGTAATTAAAAGTTTATGTTAATTTGCAATACATTAAATTAGCTGAAATTCCCTGAGTCGAGACTGTTCTGCCCATGACACCTACCCATCCCAGAAAATAACAAGAAGGTTTGACCAGTGATTAGTGTTAAGAGCCTGCTTTGTGCAGCCTTTCACTTTGACCATGATGAAGTTACTTGGTCTCCCGGAGCTGCATTTTCCCATTTCTAAAATGAACACGTCTTTCAAAAGAGACATTGTAAATCTATTTCATTTTTGAGATGCTGAGGTGGAATGGGAAATCATCTGACAATAGAGTGGGGGAAGACCCCCAAGTTGGTCGGCGTCCAACTTCTTAGAGGGACAAGTGGCGTTCAGCCACCCAAGATTGAGCAATAACAGGTCTGTGATGCCCTTAGATGTCCGGGGCCGCACGCGCGCTACACTGACTGGCTCAGCTTGTGCCTACCCTCCGCCGGCAGGCGCAGGTAACCCGTTGAACCCCATTCGTGATGGGTATCGGGGATTGCAATTCTTCCCCGTGAACGACGAATTCCCAGTAAGTGCGGGTCATAAGCTCGCGTTGATTAAGTCCCTGCCCTTTGTACACACCGCCCGTCGCTACTACCGATTGGGTGGTTTAGTGAGGTCCTCGGATCGGCCCCAGCGGGGTCGGCCCCGGCCCTGCCGGAGCGTCAAGAAGACGGTCAAACTTCACTATCTAGAGGAAGTAAAAGTCATAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTACCGGGGGTCGGGGTCGCGCCGGGCGTCCGGCCGCGCCGCCGACTCGATTCGCCGCTCACCCGCGCCCCGCCG\n>LHQN01016515.1/4388-3427 Habropoda laboriosa contig16515, whole genome shotgun sequence. 
\nGAACATATGGAGAATGTCTACTCCGATGCACTTACGACCATCGTGTCTAGGGAATCCGGTTCCTATTCCGGAACCCGGTAGCGGAACCGAAATCCATTCGGGCCCTCATTGAGTGTTCGTCGGGGTAACCCAAAATGACCTGGAGACGCCGTCGGGAGATCCGGGGAGAGTTTTCTTTTCTGTATAAGCGTTCGAGTTCCCTGGAAACTTCTAGCAAGGAGATAGGGTTTGGAACGCGAAGAGCACCGCAGTTGCGGCGGTGTCCGGATATTCCCCTCGGACCTTGAAAATCCAGGAGAGGGCCACGTGGAGGTGTCGCACCGGTTCGTACCCATATCCGCAGCAGGTCTCCAAGGTTAAGAGCCTCTAGTCGATAGATTAATGTAGGTAAGGGAAGTCGGCAAATTGGATCCGTAACTTCGGGATAAGGATTGGCTCTGAGGAGCGGGGCGTGTCGGGCTTGGTCGGGAAGCGGGTCTGGCTGACGTGCCGGGCCTGGGCGAGGTGAACCTGTGGTGTCTCCGCATGGGATCCGAGCTCGGTCCCGTGCCTTGGCCTCCCGCGGATCTTCCTTGCTGCGAGGCTTCCGTTGGCGGCCTGCCGTCGGCGGTCGTCCTCTTCGGCCGCCATTCAACGCTCAGCTCAGAACTGGCACGGACTAGGGGAATCCGACTGTCTAATTAAAACAAAGCATTGCGATGGCCCCCACGGGTGTTGACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAACGTGAAGAAATTCAAAAAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTTGCAAAGACTTTCGCTCTCCGAGGTGGCGTCATCTGTTCGTCCTGGGGACTATCTTGCCCTCCAGATTGCTAGGGCACGTAGGTGCCTTAGCGATCACGGCGAACCCATCGACACCCCTGCGAAGGAGTCGCGCCGTTGGGCTGCGGC\n>AEWC01017985.1/26701-26812 Solanum tuberosum cultivar DM 1-3 516 R44 scf00126_13, whole genome shotgun sequence. 
\nATTCCATGAACAACCAGGAAATAACAAATAAAACTGGAATGACATAAAGAAGATTAGCATGCCTATGGGCAAGGATGACATGCCCAAATCAAGAAATAACAAATAAAATCTT\n>CCCW010003393.1/857-2271 Brassica napus, WGS project CCCW01000000 data, contig: 40795 \nAACCCGTCCTGGAGGAGTGTTGTTAAAGGGTGAAGACCTGGGTTCGAGTCTCACCAACAACCTAATTATGGAGTCAGAGAGGACTCATAATGGAGGGGTTGGGGTCGGTGCGCTGCAGCGCTGTGAACCTAGGTTCCTAGTGAGAGGATGGGTTGTCACACTCTGCCCGTTGCTCTGATGATTCATGATAACTCGACGGATCGCATGGCCTTAGTGCTGGCGACGCATCATTCAAATTTCTCCCCTATCAACTTTCGATGGTAGGATAGTGTCCTACCATGGTGGTAACGGGTGACAGAGAATTAGGGTTTGAGTCCAGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGTAAACTACACAATCCTGACACGGGGAGGTAGTGACAATAAATAACAATACCTTAACGAGGATCCATTGGAGGGCAAGTCTGGTGCCAGTAGCCGCGGTAATTCCAGCCCCAATAGCGTATATTTAAGTTGTTGCATTGAACCTTGGGATGGGTCGCCCGGTCCACCTTCAGTGACCACCGGTTGGCTTGTCTCTTCTGTCGGCGATATGCTCCTGGCCTTAACTGGCTGGGTCGTGCCTCCGGTGCTGTTACTTTGAAGAAATTAGAGTGCTCAAAGCAAGCCTACGCTCTGTATACATTAGCATGGGATAACTTCATAGGATTTTGATCCTATTGTGTTGGCCTTCGGGATCAGAGTAATGATTAACAGGGACAGTCGGTGTAGAAACCCGTTAAAAAAAGAGAGAATGGTTGAGTATCTTTGTGTTGGTCGAGTCGCGGGTGATACTTATCGATCGAGAAGTTTTGAAGTACGAGGTGGGCGAAGAAGTGATCGTGAGTGAACTGTGAGTCGAATAAGTTGCTCGACCATAGTTACAAAATGTCTTAGATTAACGAGACAGACGTTTTGGAAGCATAACATTTTTGGAAGTACGACGGTTTAGAAGCTCGACGTTTTGGAAAAATGACGTTTCTTCAGCACGAAGTTTTCCGCGAAAACTCGTATCAGCGGAATATTATTTCGAAGACATTGGAAGGAGGACGGGAATTAAGCACGATGGGCAGCAAGCACGACAGGATCGAAGCACGACGGGAAAACCCAAAATTGGACGAAAACCCTAATTTCGGTATTATGAAAGTTTTCGATGAAGCCAAAGGATCTAGAAATGTTTACTGCCAAGGTCATAGTTCAGATTGGAGTTTATTAAAAATATTCCGCTCATCAGAATGGGAGCAGAAAGTATTCGGGATTAATCGCGGGTCAGAAATTTACCGGAATGACCGTAATCAGACAAATAGACCGAGAAGCTCGAGGTGGCTCGTTGCATGGGTTCAGAACGTGGTGTCAACCATCTAAAATGCTGAGTGTCTCCAGAAGCTCGAGG\n>GL637601.1/12317752-12317884 Caenorhabditis tropicalis strain JU1373 unplaced genomic scaffold Scaffold629, whole genome shotgun sequence. 
\nATCCCACTGATTACAAATTTCGCTGATACCTGCCCACCCGAAAGCCTGGAGGCCACAGGGAGTGGGGTCCCGCCGGTCGATGAATGGCTGACAACGGTGGGAACCATGATACAGATTATGAGAGATGAGGGTT\n>AARH02006624.1/20544-20687 Populus trichocarpa scaffold_19_contig_351, whole genome shotgun sequence. \nAATAACCAAAAATAAAACTTGGGCTAAGGGTAACGTTGGTAATTGTTCTTACATCTCCCACCCCTGGAAACCAGGTATCATATACGGGCCCAAAATAAGGAGCTTTGAATATCTAAAATTGTCGTAATTTTATTTCTCTTTCCA\n>JRES01001669.1/266737-266612 Lucilia cuprina strain LS Scaffold353, whole genome shotgun sequence. \nTAACAAAAAAATAAAAATAAACAAACTAAGTACTGGTGCAGCAGGAACTATATGGAGCTAAATGCTGTTGCTCCATTTAGTTCCTGCTGTACCAGTACTTAGTTTGTTTATTTATAAGAACAAAAC\n>DS981450.1/8754-8822 Bacteroides coprocola DSM 17136 Scfld_02_23 genomic scaffold, whole genome shotgun sequence. \nATGCAGACGCTTAAAACACTTGGATGTATGTGAATATGTGTAAGTGTTACCTGTTCCAGAAGTGGAAAA\n>AJXZ01000015.1/19268-19422 Nitratireductor aquibiodomus RA22 Contig15, whole genome shotgun sequence. \nATAACAAGAGGGTGAAGCTGAAAATTCATCCTCACCACGCGGTCAAAGTCTTGGGAGGATGCGGTCCAGGCGCGGTTACACGCAGCCGCCGACGATGATACGGTAAAGGATCGGACGCGTTGAGTTAGCAAGGCCTCTTGGCCTTGCATTTTTTT\n>KQ034000.1/288106-288014 Lactobacillus apis strain Hma11 genomic scaffold Hma11_scaffold2, whole genome shotgun sequence. \nGGTCAAACATAAGACATGCGAGATTGTAAATAACTTTTGAATCGGAATACTATTATTTAGTTAATAGGATCCATATTCATTGCGATACGTCTC\n>GG729934.1/356366-356523 Oribacterium sp. oral taxon 078 str. F0262 genomic scaffold Scfld1, whole genome shotgun sequence. \nAAATTCCAGTGTCATAAGGAGCTGTCCCCCCATCGTGCTTGCACGAAGGGGGGACAGCTCCTTATGACACGCCCCCTTATGAGCATGCAGCGGAGGTTTTTCCCGCGGAATGCGAATAAGGGACAGCATGGCGAGCTCAGCGATGCCATGCGGAATTT\n>ALXA01000123.1/6897-6525 Pseudomonas putida S11 PPS11_c212, whole genome shotgun sequence. 
\nCCACCCAATGCGCCACCTATACCTGCTCCGGTATTGCCGCCTGCCGACGCAACGCCGCTCAGCAGGCCAAGTGACAACAACAGAATCGAGGAGTACTTCATTTGTAAAAAGCCTCAAAGGGATACGGAGGCGATCCTGAGGCTCTGGACAGGGCCTTACAATGGAAATCCGACGAGTGACACGACTTGGAAAAATTCTCCAAGTTATTGTTTTCCCGATGGAAACTTAAGGGATTTTCAACGGTCACAGGCTGATTGCAAAAAGCCTTTCCAGTGGTGGAGAAGCCTTTTATTTCTACCCGTCACCCCGTGCCTTCCCCTCCAAACTCACTACCCTTCTGCCCCAGACCTTGCTTGCCCCAAACCGCTGGATC\n>AFSB01219390.1/2517-2353 Heterocephalus glaber contig219390, whole genome shotgun sequence. \nATTCCTTCTTGGCCTTTTGGCTAAGATCAAGTGTAATATTCTAGTTCCTAAAGTAACTATATGCTTATAAAAAAATCTTGCCTTTTGGGGGTCTTAAGAGAGTCTAATGATCTTGTGCAGTGTAAAAAATGCATTATGACTTCCTTGTTATGTTTTGCATTCTCT\n>FR892523.1/19058-19295 Prevotella sp. CAG:592 genomic scaffold, scf208 \nGCAAAGTATATCGCAAGCGGTTTGCCCTCACGGGTGATTAAAAGGGAATCGGGTGGAAATCCCGGACAGTCCCGCTGCTGTGAGCCGCCCCTTATGAAAGGGTCGAACAATAGCCACTGGAAATTCTTATAGCTCCAATCTGTTATTATGAAATGTCTAACGATTGTTGGAGGTTAACGGGAAGGCGTTCGATACCGGGCGGCAAGTCAGAAGACCTGCCATTGCGACACATGGCGTA\n>KB202646.1/8509-7967 Lottia gigantea unplaced genomic scaffold LOTGIsca_5069, whole genome shotgun sequence. \nNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTCGCGGTCCTGCCTCGTTTTTCTCCTTCCGGGAGAGAACCCGCCGCATTTTCTGTCTACCTTGAAAAAATTAGAGTGCTAAAGGCAGGCTAAAACCCCGAGCCTGAATATTTCGTGCATGGAATAAGCGGGGATGCTCTTTTCCGGAGGGCGGTCCGACCGACTGGCGACGTCGCTTTCGCTGTCGGTTTCGCCGGAGAGCTAGGATTCGAGAGGAACGGTGGGGGGCGAGCGTACCGGGCGGGGAGAGGTGAAATTTTGTGATCCGCTCGGGACGACTCGAAGCGAAAGCGCTGGCCCCGGACGTCTTCCTTAATCCAGAACGAAGGTGGGTGGAGCAAAGACGATCAGATACCGTCGTAGTACCGACGGTAAACGCTGCCGACCGGGCCGCGGACGAGGCTCGAGAACAGCGGTTATGGACCCGTCCGTGGCGGCTTCGGGCAACCTGAGAGTTTACGGGT\n>AZGB01000027.1/63184-62919 Lactobacillus ghanensis DSM 18630 NODE_73, whole genome shotgun sequence. 
\nTAAAAAACAGCAAGAAGAGTAAATGGAAAAATTGTTTTAAGCGAGTCGTTGGTTGATGAAAAACGATAACAATTGACTGTTGAAGATGGTCTTGTTGAGAAGTTCTATTGCTGAGTTGTGCTGAATAATAAGGCAATAGCGGGAACTCCCGTTAGCGAGTCGAAGTATCTTCTGGAGATAAATAAGAATGTACTTTTGAAGGAATAGTTTGTGAGAACTATTTAAATTAAGGTGGTAACGCGAAAAGCAGTCTTTTCGTCCTTAGC\n>CM001425.1/10442330-10442236 Lepisosteus oculatus linkage group LG22, whole genome shotgun sequence. \nCCCAGCAGCCATGTCGCTCTGCCACTCAGCGGGTGTGAGCCTGGGCAGTACCTGGATGGGAGACCTCCTGGGAAAAACTGAGGTTGCTGCTGGAA\n>AP013066.1/2828303-2828212 Sulfuricella denitrificans skB26 DNA, complete genome. \nAGAACCCATGCGGGAGAGCGTGCGATTATTTTCGCACCACCGAAGGCGCAACCACCCGTAACCGCTCAGGTATCAGGAACCGCATGGAACAC\n>CM000251.2/46867717-46868010 Rattus norvegicus chromosome X, whole genome shotgun sequence. \nGAGTTTTCTGGCTTGGATATCTGACATCCCATTGATTGCCACAGTTGATTTAGCTGATCTTGCTGGTCGGCAGGTGTCCCCTTCCTCCTTCACTGCTTCATGTGCATTCCTCCTGATGCTGCGCACTCCGTTGAAGATGATGAACCTTCCCTGAAGGGAGAAGGTCCAGTCTTTGGGCAAAGATATTCGAGTAGTTGTGTTCCCCAGATAGAACCTCCAAACAAACTTTCAAGGAAGAAAATTTTAGTTTGGTTTCTGGTTCCAGATGGTGGGCATGCTGGCATGACAGCAAAC\n>FNHO01000002.1/3411-3594 Pseudomonas balearica DSM 6083 genome assembly, contig: Ga0056079_102 \nCAGCTAACGGAAAAGTATTCCAATTCGGTTTAACGGCCCGGCAGATCCGGTCGGCAGAATCCGAAAAACGGACTAATACTTGAAATCACTGGCGAGACATTCCCCCCACTGTCTGGCCAGTCGAGACCGTGAGGACCGCGTTCTCGAAACTCCTAATGGTCTTGACCCGGCTCCCTCAGGCCGG\n>JH836242.1/293875-293781 Erinaceus europaeus unplaced genomic scaffold scaffold00954, whole genome shotgun sequence \nCTCCGGCGCAGGGCGGCCACTGCCCCCCGCACACTGCGCTGCTCCGACCCACTGTGCGTGTGACAGCGGCTGTCCTGTCCTGGCAGCGCGACCGG\n>CH672395.1/1696787-1697001 Leeuwenhoekiella blandensis MED217 scf_1099517004314 genomic scaffold, whole genome shotgun sequence. \nACTTCGCAAACGTATTTTGGTGGTGTTTTTTGTTTTTAAAAACACCTTAAAAGGGAATCAGGTGCTTCTTTGTAAAAATCCTGAGCTGTTCCCGCAACTGTAAGCTTAGTTCGTAAAAGAACGGTAAAGATCGTCTTACACCACTGTCAATATTGATGGGAAGGTTTGATCTTTATACGCGAGCCAGGAGACCTGCCAGAAGAAACTAATAACTA\n>AZAQ01029315.1/12443-12290 Stegodyphus mimosarum contig29315, whole genome shotgun sequence. 
\nATACTTACCTGGCACTGGGAACGCCTTGATGAACAAAGAGGCTTCCCGAGCAGAGGGCTCCCGTTGCACAGCGAGAGGTTGACGTTCGCTACACTCGCCGTAAATTGGGCAATTATTTCCTAGCGTACATGGAGTAGCATCAGATGCCAATGGA\n>ALWZ045079265.1/261-1397 Picea glauca, whole genome shotgun sequence. \nAAGATTTTGTGCGTTTCTCTCTCTACGTTCCGGATTTCGTAGTGACGGATTTATGAGTAGATTCGATCGAAGAAGTTACAAATTGTATGATGGAAAAACCAAAGTGAACCCTAGGTACACCTCATTTCGGTGGTCCCGAAATCAATAGGGTAGTCCCGGGTTATCACTGATAATTTCGAGATGAATTCTCCGTAATTGTGTGTTCATCGGAAATAGCTGGTTTTCCGCGAAATCCATTTAAGTGGAGCGTCTAATGTTCAGGCCCGAGGTAGAGCACTCAATGGGCTAGGGTGGCCAAAAGCTTTACCAATCCCAACGAAACTCCGAATACAGGTCTCTGCAGTTAGTACAGACAGACTTTGGGTGCAAAGATCCAAGGTCGAGAGGGAAACAGCCCAGATCGTGCGCTAAGGTCCCAATGCAATTACTTAGTGTCAAAGGTAGTGATCGCGCGATGACAACCAGGAGGTAGGCTTGGAAGCAGCCAGCCTTTGAAGAAAGCGTAATAGCTCACTGGTCCAGCTCCGTAGCACCTAAAATGTATCGGGGCTAAAGTAATTCACCGAAGCGACGAGACTAGTCTCCGAGATTGATAGCTCGGGAAAGTGAGAACCTTGAAAGCACACAAGTAGCTCACGTAGTCTATATGGTCCAGATAGTGTCTAACTAAGCTTATTCAAGGGTCAGTAGCGGAACGTTCCGTATATCGGAGAAGGGGCTACACCTGGAGGKATCAGAAGTGAGAATGCTGACATGAGTAACGATTAATCGTGTGAAAAACACGATCAGTTCACGGGTTTTCACGTTCAGTCAATCTACGTGGAGTGAATCGGTCCCTATAGTGGGAGATGTAAGCACGAGTTACTCCGGCAGCTGTTTTATGGCCCCCGCTGATAGACTAGGGGCTAACCTGATCTTTCTACTGTTGCCACCTATACGCAATTGTTTATTAAAAACACAGGACTCTGCTAAGTGGAAACACAATGTATAGAGTCTTACATCTGCCCAGTACTGGACATCGTATTATGGGTTTCTGTCACTTTTCCCTAGGGAATAAAACTAGATAGGTCAGTTATTATAAGTAAATTCTTGGAGATTTCCTGATTCCGAAAGCTGCCGGTGCACTTGGCCACCTTC\n>GL945483.1/1284982-1284843 Serpula lacrymans var. lacrymans S7.3 unplaced genomic scaffold SERLA73scaffold_10, whole genome shotgun sequence. \nGGCCGACTAGCTCAGTTGGTTAGAGCGTCGTGCTAATAACCTAGGCACAATGGATCAGACCACCATGCATTTGCATGGTGGTCTGATCGCTGGCCTTGTGTCATACGCGAAGGTCTTGGGTTCGATCCCCACGTTGGCCA\n>URS0000D6AED6_12908/1-65 unclassified sequences c-di-GMP-II-GAG riboswitch \nCGGGAAGCUCUGACACGCGGUCCCGGCCGCCGGGACCGCGCCGAGCCACUGGCGAGACCGACCCG\n>ALWT01224760.1/3828-4038 Myotis davidii contig224760, whole genome shotgun sequence. 
\nATCGCTTCTCTGCCTTTTGGCTAAGATCAAGTGTAGTACAAGTTCTGGTACATAGTAGGGTTCTGCAAGATAGCAGTGGCCATTACTATTATTATGATTAATCATGACCATTGCTATTAAGTTTTCATTGCAAAGTAATGGTATTAGGTGATGAGGAAAGGTGTGTATCTGGTGTGGGAAATGGGTGGGACTTACATTTATTATATGCCTA\n>KV453843.1/252671-252748 Tortispora caseinolytica NRRL Y-17796 unplaced genomic scaffold CANCAscaffold_3, whole genome shotgun sequence. \nGACAGTGATGAAAAAAATTACTCACAGACCTGTACTGAACATTTCATGTGGATAAAGCAATATTGCCTTTTTCTGAGT\n>ABCM01000001.1/368790-368897 Pedobacter sp. BAL39 1103467000516, whole genome shotgun sequence. \nTACTTATAAAGAAAGACTGAGGGAAAGGCCCTGTAACGTCTTAGCAACCTGTACTAGCCGGAAGTAAAAGGTGCTAATTCCTACTCTGTAGAAAGAGAAAGATAAGTT\n>CP002512.1/771378-771640 Aerococcus urinae ACS-120-V-Col10a, complete genome. \nACACACCCATTGATAGGGAGAGTAAGTGTTAAACACTTTGAAGAGAGGTTCCGTTTGGTGAGAGGAACCAAGTGAAAGGCGCTGAAGATGGCCTTTGAGGGTATCTTGTCAATAAGTAGACAAGGTCGGCTGGGCTCGGTCGATAGAAAGAGCGCTAGTCTAGGCATTATCGCCTATGGCTAGGTCGAGGGAGTAGCTACTACTATACTTATTAACAGTAGTACTCTGAACAAAAGGTGGTAACACGATGCGTCGTCCTTTAC\n>CP017623.1/2830701-2830798 Candida albicans SC5314 chromosome 1 sequence. \nTTGGCTATGATTATTTGCATTATATTACCAATTGTTCCAACTGAATATCCCGGGTTGACAACCGCATTATCGTTAAGTTTCAGCCTTGTCTGAGCCTT\n>ALWZ041464526.1/1-432 Picea glauca, whole genome shotgun sequence. \nATAACCGTAGTAATTCTAGAGCTAATACCTGCACCAAGTCCTGAATATTTGGAAGGGATGCATTTATTAGATAAAAGGCCGGTGTGGGCTTGCCTGCTTCTCCAGTGAATCATGATAACTCGACGGATCGCACAGCCATTGTGCTGGCGATGCTTCATTCAAATTTCTTCCCTATCAACTTTAGATGGTAGGATAGAGGCCTACCATGGTGGTGACGGGTGATGGAGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAATGGATACCACATCCAAGGAAGGCAGCAGGCGTGCAAATTACCCAATCCTGACATGGGGAGGTAGTGACAATAAATAACAATACTAGGCTCATCGAGTCTGGTAATTGGAATGAGTACAATCTAAATCCCTTAACGAGGATCCATTGGAGGGTTCACTGTCCCCTCCTCT\n>ABDH01025731.1/1497-1292 Termite gut metagenome tgut2b_Contig26382, whole genome shotgun sequence. 
\nTCCATCGTGAGGTGGAATCTGAAGGAAGCCGGAGGCAAAGTCCCGGGCCGACGAACAGAAACCGCATATAAGGCAATGCAAGGCGGACGAGTTTGCATAACAAAACGAAGTCCAAAAAGGCCGGGGAGGAAGAAAACAGACTCCGGTTTTACTGCCCGAACCTTGCAGTGTAGATGCGGCGGCTATATGGGATGAAGGTTATCAGC\n>AFFK01018367.1/6133-5846 Strigamia maritima strain Brora ctg7180001228879, whole genome shotgun sequence. \nAGGCGTGTGTCTGAGACACATCTGAACATTGATCGCTGTTATTAGGCAGATCTGCTCAGAGGTAGTGTCCCTTAACCACACAAGACCATATTGAGTCGGTATTCCCGCTGCCACAGTACGCACGGTACGAGTACCTTCTCACACAGTTGCGCCCCAAGCGCATATCAGGGTATAAATCTGGCCGTTCTCCTAGCTTAGCTGTTTCAAAATTGGGGAAGTTTGCTAGCATCTTCCATGATTTAAGACGCCACCAATAAAGGCGCTGAGTGTGTCAGCCTGCCTTTTAAT\n>CCCW010037878.1/9850-6604 Brassica napus, WGS project CCCW01000000 data, contig: 6310 \nTCTTTTCAAGTTTCATGTGATCAAAACTCAACATTCCTCCAAATACGTATTCTCCCAAAAGCTTGGTTTCAGATTCTGACTTTTACACTCTTGACAATTTTATTCCGAAGGGCGGGGTAATACAGACTGGGCCCTAGTTCCCTGGAAAGGGCGCCATTGAGGGTTAGAGCCCCGTCGTGCCTGGACCCTGTCGCACCACGAGGAGCTGTCGACGAGTCCAAGTCTGCCGATCGGGCGGTAAATTCCGTCCAAGGCTAAATATGGGCGAGAGACCGATAGCGAACAAGTACCGCGAGGTAAAGATGAAAAGGACTTTGAAAAGAGAGTCAAAGAGTGCTTGAAATTGTCGGGAGGGAAGCGGATGGGGGCCGGCGATGCGTCCCGGTCAGATGCGGAATGGAGCAATCCGGTCTGCCGATCGATTCGGGGCATGGACCTACGCAGATTAAGGTGGTGACCTAAGCCCGAGCCTTTTTTACGCCCGCGGAGACGTCGTTGCCTTAATTGTGGTCTGCAGCACGTGCCTCACAGCGTGCCTCGGCATCTGCATGCTCAGGGCGTCGGCCTGTGGGCTCCCCATTCGACCCGTCTTGAAACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAACGGGTGAGTAAACCCATAAGGCGCAAGGAAGCTGATTGGCTGGATCCCTCACGGGTGCACAGCCAACCGACCTTGATCTTCTGAGAAGGGTTCGAGTGTGACCATGCCTGTCGGGACCCGAAACGTAGTGAACTATGCCTGAGCGGGGCGAAGCCAGAGGAAACTCTGGTGGAGGCCCGCAGCGATACTGACGTGCAAATCGTTCGTCTGACTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGAGCTCGGAAACGAGTTCTATCGGGTAAAGCCAATGATTAGAGCCATCGGGGATGCAACATCCTCGACCTATTCTCAAACTTTAAATAGGTAGAGCCATCGGGGACGCAACATCCTCGACCTATTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGGAAGCCGGTTACGGTGCCCAACTGCGCGCTAACCTAGAACCCACAAAGGGTGTTGGTCGATTAAGACAGCAGGACGGTGGTCATGGAAGTCGAAATCCCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTGAAGCGTGCAACCTTTACCCGGCCGCCAGGCCTCGATGAGTAGGAGGGCGCGGC
GGTCGCTGCAAAACCTAGGGCACAAGACAAGGCAGAGCGGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGGCCGAAGAGGGGAAAGGTTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGAGTCGGGGGAAACCCGTCTGATAGCGCTTATGCGCGAACTTCGAAAGGGGATCCGATTACAATTCCGGAACCGGGACGTGGTGGTTGACGGCAACGTTAGGGAGTCCGGAGACGTCGGCGGGAATTCCGGAAAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCCTGGAAACGGCTCAGCCGGAGGTAGGGTCCAGCGGCTGGAAGAGCACCGCACGTCGCGTGGTGTCCGGTGCATTCCCGGCGGCCCTTGAAAATCCGGAGGACCGAGTGCCGCTCACGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGGTGAACAGCCTCTGGTCGATGGAACAATGTAGGCAAGGGAAGTCGGCAAAATGGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGGCTGGGCTCGGGGGTCCCAGTTCCGAACCCGTCGACTGTTGGCGGGCTGCTTGAGCCGCTAACGTGGCGAGAGTGGACCTCCTCGTGTCAACCGGGGGACGGACTGGGAATGGCTCTTTCGGGAGCTTTCCCCGGGCGTCGAACAGCCAACTCAGAACTGGTACAGACAAGGGGAATCTGACTGTTTAATTAAAACAAAGCATTGCGATGGTCCCTGCGGATGCTAACACAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGCGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTACCACAGCCAAGGGAACGGGGTTGGTAGAATCAGCGGGGAAAGAAGACCCAACTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGAATAAGTGGGAGCTCCGGCGCAAGTGAAATACCACTACTTTTAACGTTATTTTACTTACTCCGTGAATCGGAGGCGGGGTAACAACCCCTTCTTTTAGACCCAAGACTCGCTTCGGCGGGTCGATCCGGGTGGAGGACATTGTCAGGTGGGGAGTTTTGCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGCTCGTTTGATTCTGATTTTCAGTATGAATACGAACCGTGAAAGCGTGGCCTATCGATCCTTTAGACCTTCGGAATTTGAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCACTGTGAGACAGAATTCAACAAGTGTTGGATTGTTCACCCACCAATTGGGAACATGAGCTGGGTTTAAACCGTCGTAAGACAGGTTAGTTTTACCATATTGATGCCCATCTCGCAATAGTAATTCAACCTTGTACGATAGGAACCGTTGATTTGCACAATTTGTCCTCGCGCTTGGTTGAAAAGCCAGTGGCGCAAAGCTGCCACTAAGTCAGAATCCGGGCTAGAAGCGACGCATGCGCCCGCCGCCCGATTGCCGACCCTCAGTAGGAGCTTCGGCTCCCAAAGGCACGTGTCGTTGGCTAAGTCCGTTCGGCTGAAGCGCCGTTCGGACCGCCTTAATTTATAATTACCACCGAGCGGCGGGTAGAATCCTTTGCAAACGACTTAAATACACGACGGTGTATTGTAAGTGGCAGAGTGGCTGATGTGCCCCAGTCCATGGACCAGACCGATCAGAACGTTCTAGACGTCCCA\n>ACJG01006097.1/11398-11489 Daphnia pulex 
DAPPUscaffold_154_Cont6097, whole genome shotgun sequence. \nGCCTGGCTAGCTCAGTCGGTAGAGCATGAGACTCTTAATCTCTCGCATGAGAATCTTAATCAGGGTCGGGGGTTCGAGCCCCCCGTTTGGCG\n>CM000231.2/255777208-255777080 Rattus norvegicus chromosome 1, whole genome shotgun sequence. \nCAGCCTATTTCCAAGGATAGAGCTGGGTGTGGCTATGGGATCTCCAACTGCAGGCCAGAGTAATTGGAGAGACTTTAACAGCAGAGGTCAACACAGTGCCTGCGGCTGCCACTTGCTTTTCCTGTATGT\n>CYZX01000011.1/96755-96903 Clostridium disporicum strain 2789STDY5834856 genome assembly, contig: SCcontig000011 \nAACTAAATCAAAGATTTAGGATCTCACTTAAGTTGACGAGGATGGGGAGTATCGAATTCTTCGGCGGGTGCCCCACGGTATCGCACTACCGTTAACAGTTAGTAAATCTATGAAGTGATTTGTAGGACAACACTAACTTGGTGTTAAAA\n>KN838613.1/75725-74394 Laccaria amethystina LaAM-08-1 unplaced genomic scaffold K443scaffold_78, whole genome shotgun sequence. \nTACCTAACAGAATTTACAGGTATTCAAGTAGCGTTGATTCAGTCAGATGGTTGGGGTTTGGTATGTCGGCTGGACCGATTCACCATGGTCGTGGCTTTGTATGTCAGCTGGGCTGATCATCACACATGCATACTAGGTCTTATTAGGAGTTATATGTGGTATACTACATTCCAAATGACCGGAAACTGGCCTGGGTGAATAACTTTTCTACCTGGCATAAGTCTGGCGCGGCCTCTGGAAGGGCCTGAATTCCCCTGGTAACAGACGGAAATGTCTGAATTCAGAGGGGACACCTCATGTAGCCAGGTACGAAATCTTGGTGTCTGTCGTACCTGATTCATCTTGTACCAGGTAAGCCAGACACGTGCACATTTCCTGATGCTCTTGGTGAGCCGGCGTGCCCTTTATTGGTGTGTGTTGGGGAACCAGGACTTTTACCTTGAGAAAATTAGAGTGTTCAAAGCAGGCATTTGCCCGAATACATTAGCATGGAATAATAAAATAGGACGTGTGGTTCTATTTTGTTGGTTTCTAGAGTCGCCGTAATGATTAATAGGGATAGTTGGGGGCATTGGTATTGAGTCGCTAGAGGTGAAATTCTTGGATTGACTCAAGACCGACTATTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACAAAGGTTAGGGGATCGAAAATGATCAGATACCGTTGTAGTCTTAACAGTAAACTATGCCGACTAGGGATCGGGCGACCTCAATTATGATGTGTCGCTCGGCACCTTACGAGAAATCAAAGTCTTTGGGTTCTGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGATGGAAGGGCACCACCAGGTGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTCACCAGGTCCAGACATAACTAGGATTGACAGATTGATAGCTCTTTCATGATTTTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGGTTAATTCCGATAACGAACGAGACCTTAACCTGCTAAATAGCCAGGCCGGCTTTCGCTGGTCGCCGGCTTCTTAGAGGGACTGTCAGCGTCTAGCTGACGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGACAGAGCCAGCGAGTTTTTTTTCCTTGGCCGGAAGGTCTGGGTAATCTTGTGAA
ACTCTGTCGTGCTGGGGATAGAGCATTGCAATTATTGCTCTTCAACGAGGAATACCTAGTAAGCGTGAGTCATCAGCTCGCGTTGATTACGTCCCTGCCCCAACCGACCACTC\n>AFEW01015811.1/2627-2450 Jatropha curcas cultivar GZQX0401 scaffold191_29, whole genome shotgun sequence. \nTGTCATGTTTTTCCACAGCTTTCTTGAACTTCTTTTTTCTTTTCTTTAATTTTTTCTTTCAAGAATCTCCCTCATTTTAATATGTATGAAAGAGATTCTTAAATGGAAGAATTAAAGAGGAGGAAATGTATACGTGTATTGTATAGGAGTTCAAGAAAGCTGTGGGAGAACATGGCAG\n>JH226135.1/756984-757073 Exophiala dermatitidis NIH/UT8656 unplaced genomic scaffold supercont1.6, whole genome shotgun sequence. \nGCTCTCTTAGCTCAGTGGTAGCAGCGCCACACTAGTAGTTCCTAACATTACGAGATGTGGAGGTCACAGGTTCAAGTCCTGTAGGGAGCA\n>AZGY01000051.1/130-3252 Aschersonia aleyrodis RCEF 2490 scaffold_51, whole genome shotgun sequence. \nTACCTGGTTGATTCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTCTGAGTATAAGCAATTATACAGCGAAACTGCGAATGGCTCATTATATAAGTTATCGTTTATTTGATAGTACCTTGCTACTTGGATAACCGTGGTAATTCTAGAGCTAATACATGCTAAAAATCCCGACTCCGGAAGGGATGTATTTATTAGATTAAAAGCCAATGCCCTCTGGGCTCTCTGGTGATTCATGATAACTTCTCGAATCGCACGGCCTTGCGCCGGCGATGGTTCATTCAAATTTCTTCCCTATCAACTTTCGATGTTTGGGTAGTGGCCAAACATGGTTGCAACGGGTAACGGAGGGTTAGGGCTCGACCCCGGAGAAGGAGCCTGAGAAACGGCTACTACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCCGACTCGGGGAGGTAGTGACAATAAATACTGATACAGGGCCCTTTCGGGTCTTGTAATTGGAATGAGTACAATTTAAATCCCTTAACGAGGAACAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGAACCTTGGGCCTGGCGGGCTGGTCCGCCTCACCGCGTGCACTAGTCCCGCCGGGCCTTTCCCTCTGCGGAGCCCCATGCCCTTCACTGGGCGTGGCGGGGAAGCAGGACGTTTACTTTGAAAAAATTAGAGTGCTCCAGGCAGGCGTATGCTCGAATACATTAGCATGGAATAATGAAATAGGACGCGCGGTTCTATTTTGTTGGTTTCTGGGACCGCCGTAATGATTAATAGGGACAGTCGGGGGCATCAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACAACTGCGAAAGCATCTGCCAAGGATGTTTTCATTAATCAGGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGGGATCGGACGATGTTATTCATTGACTCGTTCGGCACCTTACGAGAAATCAAAGTGCGTGGGCTCCAGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGAAATTGACGGAAGGGCACCACCAGGGGTAAACGTGCACTGTCTAAGCCGCAGTCAACTCTGCTCCAGAAAGCCGCCCGAAAGGGTCGGTGGTCGCCCCCCAACGCTGGCTAGTCCCGTCCGCCACCGCGCGG
CGGGGCAACACCCTCAAACTGCCGGGGAACTCCTAAAGCCCTCGCTCCGGACGGCGCTGGGAAACCAGCGTCCGCTCACCAGGTTAACGACCTCGGGCATCGGAAGCAACGCGGGGGATGCTACAATGGACGATCCGCAGCCAAGCCCCTACGTGCGACAGCATACGGGGAAGGTTCAGAGACTTGACGGGGGTGGGTCGGGGACGCATGTCGGGACGCCTGAAGGCGCTGGAACACCGGCACGAGGGCGCTGGAGTCTCGCCCGCGAGGGGCTGGCACCTCCGCCTGAAGAGCGCTGGGATCCCGGCGACCGAGACGCCCGCATCGCCCACCGGCTTGAGGTAAAGTCCGCTGTCGCGCCAAAAGCGCGCCCCATGCGATGGATCATCGCTCGGCAACCACAACGGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTCACCAGGTTAACACAGCGGGCAACGCTTGTTGCGTGTCTGGGCCTGGAATAGTGAGAGCCCGCCAGGGGGCGGCCTCGCTAGTATTCGTCCTTAACCCGCGCGGGGGGAGCCCCCCTACTCTGGGCGCAGGGAGCGGTCGCGCTACGGCGCGCCGCTTGGGCGGTGCAACACCAGCTGGTACAGGGAACGCCGACTACCCCTCGGGGGGCAAGGGCCGATCCTGTGGCGAGTCCGGGCTGCGCCGGACCGTCGCAACGCACGCCAAGCGGTGGGCTGGCTCAGGCTGGCTTAAGGTACGTGCTAATCCCACGGGGCAACCGTGGCCGCCCTGAATAGTTCCGAGTTTTACGAAGCAGGGCGGGGGCGCACCTCCGGGTGCGCTCGTCCGAGTCCACAGCGGGCTCGAGTGCCAGACACAATGAGGATTGACAGATTGAGAGCTCTTTCTTGATTTTGTGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGCTTAATTGCGATAACGAACGAGACCTTAACCTGCTAAATAGCCCGTATTGCTCAGGCAGTACGCCGGCTTCTTAGAGGGACTATCGGCTCAAGCCGATGGAAGTTTGAGGCAATAACAGGTTGACCTACACAGGCCTGTAGTAGTGGCGCCTCCGGTGGGACAGAGGGAAGAAGACCGCTAGTCCAACAGCATAACCCCCGTGAAGGGAGCCCTTCGGAATCGGGCGGGGGGGCGGCCACTGCCCGTGGCCGCTCGCTGTGGGCGACACCACCTGGTACAGAAGACGCCCACGGGGCCAATTCTGTGGCGAGTCCGGGTTGCGCCGGACCGTCGCAACGCGCGCTAAGGGGTGGGCCGGCGTCCTCTGCGGAGGCCCGGCTTAAGGTACGTGCTAATCCCACGGGAAGGAGAAACCGTGCCGACACACAGAGCCCCGATCGGCGAAGTGTGCCGGGGCGTCCCTGCGCAGCGTCGCAGGGCGCCGGTCTCGGGGGCACACAGGCTGCTTCAGCATGTCCTGGCCCCCCGAGGAAATGCTGTGATGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGACGGAGCCAGCGAGTACGCCCTTGGCCGGAAGGCCCGGGTAACCTTGTTAAACTCCGTCGTGCTGGGGATAGAGCATTGCAATTATTGCTCTTCAACGAGGAATCCCTAGTAAGCGCAAGTCATCAGCTTGCGTTGATTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTACTACCGATTGAATGGCTCAGTGAGGCGTCCGGACTGGCCCAGCGAGGTGGGCAACCACCACGCAGGGCCGGAAAGCTCTCCAAACTCGGTCATTTAGAGGAAGTAAAAGTCGTAACAAGGTCTCCGTTGGTGAACCAGCGGAGGGATCATTA\n>CP022437.1/2870568-2870713 Virgibacillus necropolis strain LMG 19488 chromosome, complete genome. 
\nGTTACCTTTAATTCAGTCCTGTGAGACTGGCAAGGTGGAACAGATGAAGATCTGTTTTATAAATAAAACTCGGAAAGGTTTCTTCCTTTTGCGAGCCTTTTATTTGTACACTACACCTTGCCAGAATAGGCAAGGTGTTTTTTTGG\n>GL385398.1/3795320-3795665 Gaeumannomyces graminis var. tritici R3-111a-1 unplaced genomic scaffold supercont2.4, whole genome shotgun sequence. \nACATACGACCATACCCACTGGAATATACGGGATCCCGTCCGCTCTCCCCTANNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNCAAACCAGTGAGGGCCGAACTAGTACTCAGGTGGGTGACCACTGGGGAATCCTCGGTGTTGTATGTT\n>AFEY01233609.1/1-1134 Sarcophilus harrisii ctg7180001910850, whole genome shotgun sequence. \nCCAGCCCCTGCCTCTCGGCGCCCCCTCGATGCTCTTAGCTGAGTGTCCCGCGGGGCCCGAAGCGTTTACTTTGAAAAAATTAGAGTGTTCAAAGCAGGCCCGAGTCGCCTGGATACCCCAGCTAGGAATAATGGAATAGGACCCCGGTTCTATTTTGTTGGTTTTCGGAACTGGGGCCATGATTAAGAGGGACGGCCGGGGGCATTCGTATTGTGCCGCTAGAGGTGAAATTCTTGGACCGGCGCAAGACGGACCAGAGCGAAAGCATTTGCCAAGAATGTTTTCATTAATCAAGAACGAAAGTCGGAGGTTCGAAGACGATCAGATACCGTCGTAGTTCCGACCATAAACGATGCCGACTAGCGATCCGGCGGCGTTATTCCCATGACCCGCCGGGCAGCTTCCGGGAAACCAAAGTCTTTGGGTTCCGGGGGGAGTATGGTTGCAAAGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGAAACCTCACCCGGCCCGGACACGGAAAGGATTGACAGATTGATAGCTCTTTCTCGATTCTGTGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGATAACGAACGAGACTCTGGCATGCTAACTAGTTACGCGACCCCCGACGTGGTCGGCGTCCCAACTTCTTAGAGGGACAAGTGGCGTTCAGCCACCCGAGATTGAGCAATAACAGGTCTGTGATGCCCTTAGATGTCCGGGGCTGCACGCGCGCTACACTGACTGGCTCAGCGTGTGCCTACCCTACGCCGGCAGGCGCGGGTAACCCGTTGAACCCCATTCGTGATGGGGATCGGGGATTGCAATTATTCCCCATGAACGAGGAATTCCCAGTAAGTGCGGGTCATAAGCTTGCGTTGATTAAGTCCCTGCCCTTTGTACACACCGCCCGTCGCTACTACCGATTGGATGGTTTAGTGAGGTCCTCGGATCGGCCCCGCCGGGGTCGGCCCACGGCCCTGGCGGAGCGCTGAGAAGACGGTCGAACTTGACTATCTAGAGGAAGTAAAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTA\n>MEQV01000070.1/1472-1355 Betaproteobacteria bacterium RIFCSPLOWO2_02_FULL_62_17 rifcsplowo2_02_scaffold_16404, whole 
genome shotgun sequence. \nTAGCGGGTTGAAGTCCCGTCCGGGGAGTTGTCCGTACGCCCCGGTAGCTGAGGAAGCGGCGCCGTGGCAACACGGGGTCGTGAGTTTGCAAACAGCAAGAGAGCAGGCCGTAACGCAA\n>GG738884.1/92380-92084 Naegleria gruberi genomic scaffold NAEGRscaffold_40, whole genome shotgun sequence. \nCTGGGCTACTGTAGGGAGGTAGCTGTTATGGTTCTCTGCCACAGCGTCAGGCAAAGGGATGGTTCTTCAGACTCATTCCTTTGTTAGCAATATGGTGACGATGTTCTGTCTGACCAATAGCGGTGTGACCATAGTATCTCCCCATGAATAAGGAGAAACTAGGGTCCTAATGAAAGGTGAACCGGTTGAGGCAGGATAACTGAGCAAATCATAGCCTTCACACTGTAGGATGGTCAGATTGCAGAACTGAGCATGAGCTATCAGAGAGTGAAATCTGGGAGTCAGACTAATGTTTTT\n>GL349550.1/1-552 Thecamonas trahens ATCC 50062 unplaced genomic scaffold supercont1.118, whole genome shotgun sequence. \nTTTTGATTCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGCGTCGGATTGTTCACCCGCAAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACCGATGGAGCGTTATTGGGCAAGTAGAGCAACTCAGTACGAGAGGAACCGTTGTTCGACAGAATTGGTCTTGCGGTTGGTCGAGGGGCCACGCCGCGCAGCTACCCTGTCTAGGATTACGGCTGAACGCCTCTAAGCCGGAAACCATGCTTAGGCAAGCAGTAACGGGAAACTGGATGCAAGTGGCGAGCGGCGCAGAAGCGCAGAGTAGGGCAGTGCAAGCTGTCGGCAACGCGGGGGGGAGACTCGGTCCTTGCCTTTTTCATGAAGCTGTGGGGCAAGGGCTGGTCTTTGAGATGTGGAGTACGCGGTAGTCACTTGCGTGGATCCTCTGTAGATGACTTTGTTCGCATGGGGAGTTGTAGGAAGCTGAGTGGCCGAGTTTGCCACGAACTTTTGAGACCTTGCCCTATCTTTTTAGAGT\n>MJEQ01002762.1/109736-109880 Nicotiana attenuata strain UT scaffold02762, whole genome shotgun sequence. 
\nAAAATAAGTGCCTCTTAGAAAGCCTCGGATGATGCCTACAATACCATTTTGTAGGATCATAAGCCTTTTAATTTGAAGTTTAAAACCCTACATAAATTAAGGTTTTAGGCAAGTCATCCTTGGCTATCAAAGCAAGCTCTTTATT\n>FAOM01049750.1/126257-125942 Triticum aestivum genome assembly, contig: Triticum_aestivum_CS42_TGACv1_scaffold_049750_1BS \nTTTTTTTTAAATGTGCCATGTCATGCACATGTATTTTGTAAAAAAGAATGTCAGCATTAAAAATGCAATGTGTGTGATGCCTTGAACGTGATTATAAAAACACTATTGTTACTGACATGTGGTGACGGGTGACGGAGAATTAGGGTTCGATTCCAGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAAAAAGGCAGCAGGCGCGCAAATTACCCAATCCTGACACGGGAAGGTAGTGACAATAAATAACAATACCGGGCGCATTAGTGTCTGGTAATTGGAATGAGTATAATCTAAATCCCTACATCATCATAA\n>AFYH01012672.1/16268-15971 Latimeria chalumnae contig012672, whole genome shotgun sequence. \nACTCAATCTGTTATCATTTTTTCACTTACTTGGTGAGCCAAGTCCCAAGGGGCTCTCAATTCTGGTAACAAGTGCCTGGCTCAGCAGGGTGCGGCCCACTCCAGGGACAGTAGCAGGCGGAGAGTTTCACCAGGGCAGTACATCTGTCAAACAATAACACAGGTGTCCTAAAGCAAGTTCAGGGAGGACAGAAACCTCCCGTGGAGTAGAGGGTTTTGCCTCTGAGTCGGAGGGTTGCAGGTTCAAATCCACCTGGGGACCTTGGGATCTGTCAACTCCCCAGTATGGTATCTGGGGG\n>KB846873.1/2237147-2237221 Nelumbo nucifera unplaced genomic scaffold scaffold00090, whole genome shotgun sequence \nGTCTTACACTTGATCTCTAAGGTAAGTTCATGTGTTGACAAGTACATAGAATAGAAAAAGCTCTGAAAGGTTGCT\n>LKHD01000187.1/27860-29827 Candidate division Hyd24-12 bacterium Vib_1 contig65, whole genome shotgun sequence. 
\nAATGAAGCTACCAAGGGCATACGGTGGATGCCTTGGCACAGGCAGGCGATGAAGGACGTGGTAAGCTGCGATAAGCTCCGGTGAGGTGCAAGCAACCTTTGACCCGGAGATCTCCGAATGGGAAAACCCACCTGGAATAAAAGACCAGGTATCTCCTTACTGAACACATAGGTTTGGAGAGGCTAACCCGGGGAACTGAAACATCTTAGTACCCGGAGGAAGAGAAAGCGAAAGCGATTCCCTGAGTAGAGGCGATCGAAACGGGAAGAGTCTAAACCGAGCGGTGCGTGATAGCTGCGCAAGCGTTGCACCGCCGGGGTAGAGGGAAGTGTCCGGAGGATGCGTCACCTCGGATCGAAAAGCATGCTAGCAGAAGCTTCTGGAAAGTTGCTCCAAAGAGGGTGAAAGGCCCGTACGCGAAAGCATGCTCTGGATCTGGGACACTCTCCCAAGTAGCACGGGGCACGTGAAATCCTGTGTGAATCCGGGCGGACCACCGCCTAAGACTAAACACTCGCCTGTGACCGATAGTGAACTAGTACCGTGAGGGAAAGGTGAAAAGCACCCCTGGCGGGGAGTGAAATAGTACCTGAAACCGTGTGCCTACAAGCAGTCGGAGCAGACTTGTTCTGTGACGGCGTGCCTTTTGCATAATGAGCCGGGGAGTTGCTCGTACGTAGCGAGGTTAAGGCCGGGAGGCCGGAGCCGCAGGGAAACCGAGTCTGAACAGGGCGATTCAGTTGCGTACGGCAGACCCGAAGCCAGGTGATCTATCCATGGCCAGGCTGAAACTTGGGTAAAACCAAGCGGAGGGCCGAACCCACTAACGTTGAAAAGTTAGGGGATGAGCTGTGGATAGGGGTGAAAGGCCAAACAAACCTGGAGATAGCTGGTTCTCCTCGAAATAGCTCTAGGGCTAGCGTCGATGCAGTGTTCCGGAGGTAGAGCACTGGATGGGTTAAGGGGCCTACAAGCTTACTGACCCCAACCAAACTCCGAATGCCGGAACATGGTCTACGGCAGTCAGGCCGCGGGGGCTAAGCTCCACGGCCGAGAGGGAAACAACCCAGACCGCCGGCTAAGGTCCCCAAGCATACGTTAAGTGTATCTAAGGAAGTGGAGTTGCTTAGACAACTGGGATGTTGGCTTAGAAGCAGCCATTCATTTAAAGAGTGCGTAACAGCTCACCAGTCAATGCGATTCTGCGCCGATAATAATCGGGGCTCAAACGTATCACCGAAGCCGCGGACTGTCGCCTTGAGCGACAGTGGTAGAGGAGCGTTCCGTATGCGCTGAAGGTGTCCTGTGAGGGATGCTGGAGTGTACGGAAGTGATCATCCCGGCATGAGTAGCGATAATGCAGGTGAGAAACCTGCACACCGAAAGCCTAAGGTTTCCTGGGCAAGGCTGATCCTCCCAGGGTAAGTCGGGTCCTAAGCACAGGCCGAAAGGCGTAAGCGATGGGAAGCAGGTGAATATTCCTGCACCATTGTGTGTGCGTTCGAGCGATGGGGTGACGCGGAAGGTAGGGCCATCCGGGTGATGGATGTCCCGGTTTGCACCTGTAGGAGGGAGCGGCAGGCAAATCCACCGCTCCAACTCCGAGGGGTGTGACGAGAGCTTCGGCTCGCAAAGTGGTCGTGTCCATGCCGCCNNATCCTCAGGTGTTCGAGCTAACCCGGGTTAAGGAACTAGGCAAAATGGTCCCGTAACTTAGGGATAAGGGACGCCCGGTCTGGTGACGGTGTACAACCTGAGCCGGGCTGGGCCGCAGAGAAATGGCCTGGGCGACTGTTTACTAAAAACACACGTCTCTGCCAAGTCGTAAGACGACGTATAGGGACTGACACCTGCCCGGTGCTGGAGCGTTAAGGGGAGAGGTCAGAATACGCCTAACCGTGTATTCGAAGCTTTGAACCGAAGCCCCAGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGA\n>AMYB01000001.1/3357429-3357
616 Mucor circinelloides f. lusitanicus CBS 277.49 MUCCIscaffold_01, whole genome shotgun sequence. \nCGTATCTGCCTTAGATCCTTTGTCAAGGTTTTGATGTTTATCATCCTAATCTACAGAGCTTATGTTTTGCTTTTCGTTGACAAAGCTTGAGTCATTCAGATACAAGATTACCTATACCTCCATCTCGGTCCAGTTTTATGGCTTCTTGGCTGTCTGTACTCTGTAGATTTTGCTTATATGGATACTTG\n>BBIW01000001.1/9239-9376 Paenibacillus sp. TCA20 DNA, contig: PspTCA2nb01. \nGACTGATAACTGCCGAATTCTCGCACCAAGAAGCGGGGGACCCGACCATTTATGGGTGAATTGATCAATATTAAAGTGATCATAGGGAACCTTCAACCGAATCCTTAGCTAACCTCGCAGGCATTGGAAGGAGTATTA\n>ALWS01013471.1/7379-7260 Pteropus alecto contig13471, whole genome shotgun sequence. \nTCATACGGATAACTTCCAATTAAAATTCAGGACTACAGCCTGATCTCAGAAGCTAAGCAGGGTTGGGCCTGGCTATTACTTGGATAGGCGACCACCTAGGAAGACCAGGTGCTATAGGTG\n>LOER01000038.1/6182-6000 Desulfitibacter sp. BRH_c19 BRHa_1005201, whole genome shotgun sequence. \nATAATCCTGCTAAGTTCGTGTTAGGGCCGGTTATTTTGAAACCAACACTAAAACATTGGGAATTCGGTGTCTGGTTGAGTATGAAAAGCCTTCTGGGAAAGGAATTCAAAACCAACTAGCAGAGTACCCACCTGCGTAGGCAGGTTTCTCAAAATTCCGGCAAACGGCTAGAGCGGGAGATGC\n>GL378346.1/56514-56307 Volvox carteri f. nagariensis unplaced genomic scaffold VOLCAscaffold_25, whole genome shotgun sequence. \nTGCATTCACCGTTTTCGAAAACTCGCAGGCCGACAGCCCCAAGCAGGCCATCAGCAATGCGAACATTGTTCACGACTAAAATATCTGCCCTATCCACTTTCAATGGGAGGATTGAGACCTACCATGGTGGTAGCGCGTGACGGAGGACTAGGGTTCAATACCGGAGAGGGAGCTAGAGAAATGGCGAACACAACCAAGGAAGGCCGCA\n>CM000392.2/29331781-29331980 Equus caballus chromosome 16, whole genome shotgun sequence. \nAAGGACGGAAACAGTGTCTTCTGCTTGATCCAGAAAGACGTTCCTCATAAAAGTCCGTAGAAAATTAAAATCTTCCACAAGAAGGAGGGGCGGCGTTCTCTCCTGAGTGTGAAGCCAGCTCTTGGTGTTGCTTCACTGCAACTGCCATTTGCCATTCATGGTCTTGGGGAATAAGAGAGAGAGGACAGAGTCTGAGTGAT\n>MNYG01000183.1/3075-2991 Deltaproteobacteria bacterium CG2_30_63_29 cg2_3.0_scaffold_12261_c, whole genome shotgun sequence. \nCTTGCCCTCCGCCACGACCAGCAAACAGAAGACGGCGCCGAATTCGGCGCCGTCTTCTGTTTGCTGGCTGACGCGGCACGTCAGC\n>LJSX01000027.1/46243-46357 Rhizobiales bacterium HL-109 ITZY_scaf_197, whole genome shotgun sequence. 
\nCACTCTGGAAAGAGGCAGGTCGAGACAGGCCTGCCCACCGAAGGGCGTAACTCGGCAGTTTCGAAACCTGGTTTCGAGGGTTCCGAGGAAATCTCTCAGGTTACGGGACAGAGGG\n>KL543181.1/848-2043 Capsicum annuum cultivar Zunla-1 unplaced genomic scaffold scaffold24819, whole genome shotgun sequence \nCGACCCCAGATCAGGATGGATTACCCGCTCAGTTTAAGACTATCAATAAATGGAGGAAAATAAACTTACAAGGATTCCCTCAGTAACGAAAAGCAAACCAAGAATAGCCAACCTTAGAATTGAGCGGCTTCATCATCCGAATTATAGTCTGGAGAAGCTTCCTCAGTGGCAGACCGGCCCAAGTCCCCTGGAAGGGGTGCTAGAGAGGGTGAGAGCCCCATTGTGCTCGGACCCTATCGCACCACAAGGCGCTATCTATGAGTCGAGTTGTTTGGGAATGCAGCCCAAATCGGGCGGTGAATTCCGCCCAAGGCTAAATACGAGCGAGAGGCCGATAATGAACAAGTACCGTGAGGTAAAGATGAAACTGAATTTGAAGAAAGAGTCAAAGAGTGCTTGAAATTATTGGGAGGGAAGCGGATGGGAGACGATGATATGCCCCAGTCAGATGTGGAACGGAGATGAGCCGGTTCGTCGTTCGACTCAGGGTGTGGACCAGCATGGATTGGGGGAGGCCAAAGCCCGAGCTCTTGGTACGCTCGTGGAATGCCGTCTCCTCAATTGTGGCAGGTAGTGCGTGCCTCCGATGTGCTTCAACATCTGCGCACTTTGGATGCTGGCCTGTGGGCTCCCCATTCAACCCGTCTTGAAACACAGACCAAGGATTCTGACATGTGTGCGATTCAATGTTCGAGTAAACCCATAAGACGCAAGGAAGATGATTGGTGGGATCCCCCTGAGGGGTGCATCGCCGACCGACCTTGATCTTCTGAGAATGGTTCTAGTGTGAGCATACTTATCGGGACCCAAAAGATGGTGAACTAGGCCTGAGCTGGGCGAAGCCATAGGAAACTTTGGTGGAGGCCCACAGTGATATTGACGTGTAAATCGTTCGTCTGACTTGCGTGCACCACATGCTAAGTGCACGGATTCACCAATGAACCATGGGCAAAATGGCCACTAAGGATTATGTGCTTGGCACCCGTATGCCCGTGCACCCACTGTGAGCACACTATGTATTCGGCACTCGCACACCACAACACCAATAAAACACCATGCCACATGCCCCAAAATGGATCGGCGACCCCTGCACCATGCAAAAATAAAAGGAACATAAACATGTGAGGGTTCATAACTAGTAACTTCGACAATTACAAAATAAATGCTTCCACCAAGGTTCGTTCATCCTAATACTT\n>LQOK01000039.1/11515-11571 Mycobacterium bohemicum strain DSM 44277 contig_44, whole genome shotgun sequence. \nCCGGGCCCGGTTCCCGCTGGCCGACCAGGTGCAGCTTGCTGCCCGCGACCCGGCCCC\n>CP010951.1/2115046-2114927 Ramlibacter tataouinensis strain 5-10, complete genome. 
\nGCCGCTGCTCCGGGGTGCGAGCGGCCCTTCGAAAGAAGGCCGGTATCGCTGAGATGGTGAGTCCAAACCCGTGAACTTGAACCGGTTCGTACCGGCGTAAGAAGAGCTGACAGTGTCCCT\n>JH835735.1/956530-956203 Erinaceus europaeus unplaced genomic scaffold scaffold00447, whole genome shotgun sequence \nGGATGTGAGGGCACTCTGGCTGCGACATCTGTCCTCCCATTGATCGCCAGTGTTGATTCGGCTGATCTGGCTGGCTAGGTGGGTGTCCCCTTCCTCCCTCACTGCTCCATGTGTGTCGGTCCCGAAGCTGCGCGCTCGGTCGAAGAGAAAGAGGACAGCCTTCCCCGAATAGAGACAGACCGCTCTTCAGTTATACGAGTTATACGAGTAGCTGCACTCCCCTGCTAGAACCTCCAAACAAGCTCTCGAGAAACCTTGGGGCCTGGCGGTGGTGCACCCAATAAAGGACACATGACACAGTGTGCAAAGAACCTGGTTTGAGCTCCTG\n>CP000517.1/489591-489403 Lactobacillus helveticus DPC 4571, complete genome. \nTTGGATTTAGTATAATTTTATCCGTAGAAAAGCTGAAGCGGTGGCTATCCCTCAAGGAGATGGTACTTATGAGTATTTTTTAACTCGTATTCCTATCTTAAAAGAAAGGAGAAGCCCTCGTGTCTGTATCAGATGCGTTACAGCTAATACTAGATTTCGGCTCATTTGTCGTTATACTAATCTCATTAA\n>CM000798.1/58059981-58060079 Oryctolagus cuniculus chromosome 9, whole genome shotgun sequence. \nATCACATCTTAGCCTTTTGGCTAAGATCAAGTGAGGAATTTTTCAGATTTAATTTTCATTACTACTATAAGTAGTAAAACTATTAAACTTGTAGCCTTC\n>LM151543.1/11334-11803 Schistosoma mattheei strain Denwood, Zambia genome assembly, scaffold: SMTD_scaffold0002192 \nATGTTAGTAGTACAAAATAAGATGACGAATTCCCAACTGTTATTCAGGCTTGACTACTCGTATGATCCCTCGTTCAATAACTTATCGTCATTAAGTGTTAAATTTTCATCGATCTGTAAGCATCTGCTACGAAACCAGTATTTTTTTAGTGAAGTATAGTTTCGAATTGTTGTATTGTGCGGTTTGGGATACGCTGTTTATTTCATTTATTTATTTGAACACATAAATATTAGTTTAAAAGGGTACCGAATACATATGCGCCACACAAGTCAATTGATTTGTGTGTGAGCTGTGATACTACCCAGGTGCTCAGACCGAATGTTTTCATTGATCAGGAGCAAAAGTCCGAGTTTCGAAGACGACCAGATACCGTCGTAGTTGTGACCATAAACGATGCAAACTGACGATCAGCGTTTGTTCTATGATTGACATCGCGGGCAGTCCCCGGGAAACCTTTAAGTCTCTGGGCT\n>EU622808.1/288-49 Bacillus phage Nf, complete genome. 
\nCAAGGTGCAACACTTCCTATAGTATGGCACATGATTGGGGTATATCCTGATTGAGTTCAGCCCACATGTCACGGGGATTGATAACCCTCTTACTAAAAGTGATTGTTTCTTTGTCCTTTGTAACAATGCCACTGACGAAACGTTAAAGCGTGGGTTTCAGTGGTATTTTAATTTGTTCACAGATGTAGTAAATTATAGGTACATAGATGTATAAATATGCAGTTACAACCCTGCCCTAAT\n>FR853100.2/134335079-134334871 Gorilla gorilla gorilla genomic chromosome, chr7, whole genome shotgun sequence \nGCTGGGTGTGGTGACACGCGCCTGTAGCCCCAGCTACTTGGAAGGCTGAGGTGGGAGAATTGCTTGAACCTGGGAGGGAGAGATTGCAGTGAGCCAAGATTGTGCCACTGCACTCCAGCCTGNNNNNNNNNNCAGGCTGGAGTGCAGTGGCACAATCTCGGCTCACTGCAACCTCTGCCTCCTGGGCTCAAGCAATTCTCCTGCCTCAG\n>CM000316.3/76140660-76140798 Pan troglodytes isolate Yerkes chimp pedigree #C0471 (Clint) chromosome 2B, whole genome shotgun sequence. \nTTATCAGCTTGGGATAATCTTTACCTGTTCCTTCTTTTGGAGGGCCAAATTAAGGACATGATTGGCGGTCTCACATCAGTATGCGATTAACGTCTCTGAGTAGATCAGGAACTTCCAGTACCCTATTGTGCTATCTGAT\n>KE713303.1/22354-22189 Biomphalaria glabrata isolate BB02 unplaced genomic scaffold LGUN_random_Scaffold3540, whole genome shotgun sequence. \nATACTTACCTGGCATAGGCGGACAATGATCACAAAGGTTGTCCTCCCAGGTCGAGGCTCGTCCATTGCACTTAGGGCGGGCTGAAGCCTGCGACCACCCTTATCTTTTTTTATTCAAATTAAAAGCGCTTTTTTTTAATAATGATATCTTTTGAATGTAAATTTGC\n>CM001013.2/117960327-117960221 Mus musculus chromosome X, GRC primary reference assembly. \nGATGCAGTCCCGGGCACCATCTTGGGACTGCTGCTGTAAGACCCCCTTTCGGGGACCCCCACTCTAGTATTGGGAGTGAGAGAGCACTCAAAGAAACATGAGAATCC\n>MHZW01000213.1/12164-11957 Rhodocyclales bacterium GWA2_65_20 gwa2_scaffold_6804, whole genome shotgun sequence. \nATGAATACAACAGACAGCGGCCCGGCTATAATCCGCCCCGATTCGGCCAAGAGAACACGGTGCAAATCCGTGGCGGGCCCGCCGCTGTAACCGGGGACGAACGCCGCCTGTCGCGAGACGGCCACTGCCGGGGACCACCCTGGCGGGAAGGCGCGGCGCTTCGGACGATCCGGGAGCCAGAAGACCTGTCGAGTCCTTTTCTCGAAAC\n>LMSD01000007.1/142068-141895 Paenibacillus sp. Soil750 contig_15, whole genome shotgun sequence. 
\nTGTGCCTTTAAAAACAGTCCAGAGAGGCTGGCAAGGTAAAACGATAAGAAAAGTCGGGTAATGCTGAATCGAGAATTCAGTAAGCTTACGGATGTGCGCATCCTACAGCCCCGCTCTATCTCTTTATGCACTCGTAAACTCCTTGCCAAGAATTGGGCAAGGAGTTTTTTGGTT\n>FWYF01000005.1/72068-71837 Reichenbachiella faecimaris strain DSM 26133 genome assembly, contig: Ga0069982_15 \nAGATTTGCGGCAATTATTGGTTTTCGAAGGAAACGTATCCTGAGAAATTAAAAGGGAATTCGGTGAAGTGCTTAGCGCTCATTCCGAAGCTGTTCCCGCAACTGTAATTCGAAGATATCCTTGTGATATCATTTTTGATCTACCATTGCCACTGTCCTAATGAATCGGGATGGGAAGGCCGATCAAAAGATTTCGAAGAGCCAGGAGACCTGCCAGTAGTTATTATTTATCT\n>CBUT010022175.1/1809-1930 Eimeria mitis, Houghton, WGS project CBUT01000000 data, contig: Emh_contig2519_2 \nGCTGCTGCTGCTGCTGTTGCTGCTGCTGCTGGTGCAGCAGCAGCAGCAGCAGCAGATGAAGAAGGAGATAGGCTTCGGCTGCTGCAGCTGTGTGACCATTTGCTGCTGAAGAGACACACAGA\n>CM001945.1/16929330-16929657 Chlorocebus sabaeus isolate 1994-021 chromosome 5, whole genome shotgun sequence. \nGCTGGGTGTGGTGGTGCACGCCTGTAATCCCAGCTCCTCAGGAGGCTGGGGCGTGAAAATAGTTTGAACCTGGGAGGCGGAGGTTGCAGGGAGCTGAGATTGCACCACTGCACTCCAGCCTGGGTGATAGAGCAAATGCTCTGGCTATTGTGTTGGCAGCAGATTGGAGGAAAACAAGAGTCGGAGGGTGAGACCTCTGAGCGAGTTACTTATGTTCAGACAGCAGTCCTGTCCTGAACTGCTGGAGTGCCCAGGCTGGAGTGCAGTGGCGTGATCTCTGCTCACTGCAACCTCTGCCTCCCAGGTTCAAGCTATTCTCCTGCCTCAG\n>MTYJ01000796.1/4174-1035 Hypsibius dujardini strain Z151 scaffold0796, whole genome shotgun sequence. 
\nAGATAAAGCTACTAAGGCATAGGTGGTACCTTGGGGAAGTAGAGGCGATGAAGAGACGTCGGTGTACATCTGCGGATATTTGCTTCGGGGAGCTAGGTAAATAAGCTTTGTATCCGGAGATTCCGAAGTGGGGCAATCCCCTTTACATGAGATGTTGTAAATGACACTGCATGAGTTCAAGTAGTGCTGATGAGTCGACGCAGGCGAATGAAACACTCTAAGTTACCTGCAGCTGAGTAGAATCAAACGAGATTTTCTTGCAGTAGCGGCGAGCGCAGAATCGCAGAAGAGCCCAAAACCATTTGTGCGTGCACATTGGGGTTGTAGGATCTCGTATCAAGGGGAGTTAGTTAGCAAGAACGGTTTGGGAAGGCCGGCATAGAGAGTGAAAGCTCGTATAATACGAAAACTAACAACACCTGGCACGAGTATTCCCTGAGTAGAATCGGGGCACGTTGAAAACCCTGTTTGAAACTGGGGGGACCACCCTCCAAGCTACAAATACTACCTTACTACCACCGTAGTGGAGCTAGTAAACGGCGAGGGAAGGTGAAGAAAGAACCCCGATAGAGGCGGAGTGAAATAGATTTTTTGAAACCGTATGCTTACAAACAGTCAGGAGGGCTATTGTTAAAGCCTGATGACGTAACCTTTTGCATTTGATTCAGCGAGTTTATGGCTATGTGGCAGGTTAAGCCGTTGCGAGGGTGTAGCCGTAGGGAAACCGAGTACTGAAGTAGGGCGTTAAGTCGGCAGTGCTTGTAGAGCCCGAAACGGGATGACTGCTATCATGTTGCGGCAGGCTTTTTGAAGCGGAGGGTAAAACTTCGTATTGGACCTGGGACCGAACTCTTTGAAGGTTAAACTTTGGGATGACTGTGGATTAGGGAGTGAAAGGCTAATACAAACTTCGGAATAGCGGTTCTCTCCGAAAATCTATTTAGGTCATGCGTTCTAACGTATTTTCGGGGGTACAGCACTGACTATGGATAGAGGGTCACGCGTAGCTTACCAAACCTATTCAAACTCCGAATACCAGACGAGTCGAGCAGTGAGACAGATGCGGATGCTAAGTCCGTGGTCAAGAGGGAAAGAAACCCAGCCGCCAGTAAGGTCCCAGAAGATACATACTAAATCTGGACATGAAGTGAGCGAAGGTTGAAACTGACAGTCAGGAGGTTGCTTAGAAGCAGCCCACCCTTTAAAGAAGCCTCGTGAATAGCCACTGGACTTGTGGTTCTGCGGCCGAAAATGTAACTGGGCTTAAGTGTTCGTACGAAGCTACTGGACTTTTTTAAGTGGTAGGAGCACTTTGTGTGTGCCTTGAATGAAGGCGTACCGTACAGGAGCGTTGGGTCTCCACAAGAGCTTGATGCTGAATGAGTAGCGATTAAGGACGAGCGAGAATCTTCTCCCCCGTAATAATCTGGAAGGGTTCCTGGGCTCAGGTGGAATCCTCCCAGGGTAAGTCGGTTTCTAAGGCGAGCGCCGAAAGGCGTAGTTTCGCATGAACCATCAGGTTAATATTCCTGAACTTGTATGGTAAACGTTTGACTGGAAGGAGTGACGGAGAAAGATAGCAGATCTGGAGCATTGTTGTTCCAGATGTGAGGGTAGTAGGTGTGTGAGATAGGCAAATGCCGTCACAGTATATCACAAGGCCTTTGATTGCCGAATGCGCAAGCAGAGTCTGTTACTCTACGCCTTCCAAGAAAAAGTTCGCTAGGGAGTTATGTATTAATCCGTCGCTTAAACCCGACACATGGGTTATAGATGAGGAGAAATCCTAAGGTGATTGGATGAACTCTACGTTAAGCCCGCCCCTCTGGCAACTTAGATACTGGTAACTTCGGGAGAAGGCGCTGAATGTGAAGTCACTTGCTGACGTAGCATTATGAGGGTTGCAGTAAATGGGGTGAGCGACGTGTTTTTACCAAAAACAAGGGCCTTACTGCAACACGCAAGTGGAAGTATATTGGGCTGAGCGCTGCCGCGGTG
CTGGAAGGTTAATGAGGTGGGTTATGCGCAAGCGCGCAAGCTTTTAAATTTTTGACAGTCCCAGTAAAACGGGCGGCGTAACATATACGGTTCCTAGTAGCGAATTTCGTTAGTCGGGTAAGTCGACCTGACGAATCGGCGTAACGGACTCCCCCTGTCGTCGAATCTGCGAGATCCAGCGAAATTTTGCGGTTGTGAGCGTCTGTGAAGAAACGCGCTTCGACCGCGCGGAGGATCCGAACAGAGGACCCCGTGAGCCTTTACTTGGTAAAAAAACCTTTTTGGTGGGGGCATTTGGGTTTATTCGGGAAAATAAAGGGGCCATGCGTCTAGGATAGGTGGGAGTTTTTGATCGTGCGTTCCGGCGAATTGAGCGTTCGGGGAGAACCAACCTTGGAAATACCACCCTTGCTTATTTTGGTAAGTCCATAACCTGCGGTCCTAATTCGCGGGCCGGGGGACAAATTGTCTGTGTGGGCACGTTTTGACTGGGGGGCGGTCGGCCTCACTAGAAAGAGTAACGGAGGCGCCGAAGGTCCTCTGAGCAGTTGGAAATCCGGCGAAAGGAGTGTAAACGCATTAAGGGAGCTTGACTGCGAGACAAACACGTCGAGCAGGAACGAAAGTCGCGGCTTAGTGATCCGGTGAGTTTGCCGAGTTGGAAGGGCCATCGCTCAACGGATAAAAGGTACTCCGGGGATAACAGGCTGATCTCCCCCAAGAGTTCACATCGACGGGGAGGTTTGGCACCTCGATGTCGGCTCATCACATCCTGGGGCTGAAGCAGGTCCCAAGGGTTTGGCTGTTCGCCAATTAAAGTGGTACGCGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCCCTATCTACTGTGGGCGCAGGAAATTTGAGGGGGTCTGTCCTTAGTACGAGAGGACGACCGGAGTGATGAACGAAACTCTGGTGTACTCGGTTGTCACGCCAGTGCATGCCGGTAGCTAAGTTCGGAAGATAAACCGCTGAAAGCATCTAAGCGGGAAGCTAGCCTAAGATGAGTTCCCTAGCACCCTTGAGTCCTAAGGCCGTTCGAGACCAGACGTTGATAGGTGGGGGTGGAAGCGCTAGTGTGAGCTACCATACTAATTCCGTGAGGCTTACCTAT\n>KQ483358.1/2572342-2572106 Curvibacter sp. PAE-UM genomic scaffold Scaffold1, whole genome shotgun sequence. \nCGTAAAATCTACAACGTTGGTGCTCGCGGTGTGGTTCACATGCCGCAGTTCAACGGGAAGCAGGAAGGTGAGCCGTCATGGCGAGCCCAACCTGCGCTGCCCCCGCAACGGTAAGTGGACGAGCCGCAAGGCTCCGCTTTCATCACCCAGCCACTGGATGCCCTGAACAAGCGTCCGGGAAGGCGATGAAGGTTGTTTCCATCAGCCCGGATACCGGCCAATGAAGTGGTGTCGCGC\n>AOLZ01000036.1/1-202 Halobiforma lacisalsi AJ5 contig_36, whole genome shotgun sequence. \nGTACCGGTTGTTCGAGAGAGCACGTGCCGGGCAGCCACGCACCACGGGGTAAGAGCTGAACGCATCTAAGCTCGAAACCCACCTGGAAACGAGATACCGCCGAGATCTCTCCTAGAAGAGGAGTTCGATAGACTCGGGGTGTACGCGCCAAGGCAACGAGGCGTTGAGCCCGCGAGCACTAATCGATCGAGCCACACACTCA\n>AYZS02054104.1/146-603 Beta vulgaris subsp. vulgaris contig144508.1, whole genome shotgun sequence. 
\nGCATAAACCAGTTACAGCAATTGATGGATGCCTTGGCTTCATCAGGCGACGAAGGACGCAGCAAGCTGCGATAAGCTTCGGGGAGCGGCACGCACGCTATATATCCGAAGATTTCCGAATGGGGAAACCCGGCACCTCTCATAGGGTGTCACTTCGATCTGAATACATAGGGTCGATAGAGCAATACGTGGAGAAGTGAAACATCTCAGTATCCACAGGAAAAGAACGAGAATCGATTCCGTAAGTAGTGGCGAGCGAAAGCGGAAGAGCCCAAACCGCCGGGATTTATCCTGGCGGGGTTATAGGACCATAATGTGAGACCACAGAAGTTAGACGAACACTCTGGAAAGTGTGACCATAGCGGGTGACAGTCCCGTAGTTTAAAACTCGAGTGGCTCTATTGGTATCCTGAGTAGCACCGTACACGTGAAATTCGGTGTGAATTCGTGGCGACCACG\n>JPJR01003066.1/1-928 Pseudogymnoascus pannorum VKM F-3808 contig_3066, whole genome shotgun sequence. \nGACTGTGAAGGAAACCCCGATCAATGGCGGCCTTATTTTGAGGGTCCTAAGGTAGCGGAATACCCTGGCCGTTAAATGCGGTCTTGCATGAATGATTTAACGATACAACAGCTGTCTCAATGATTGGCTCAGTGAAATTGGAATAACTGTGCAGATACAGTTTACCTCTAGTTAGACGAGAAGACCCTATGCAGCTTTACTGTTGCTAGTTATTGGATATGATTGAATTAATTTTAGTAGTATAAGGTAATTGGTTAGATATAATTGAAATACCTTTATTGTGTTTGTCATATTGATAGATTTAATCTATTTTCTTATCTAAAGATAGGAAATGACCCCTACTATGTTAGGGGAACAATGGCTAGGAGGCAGTTTATGCGGGGCACAGATCCCATAAAAAGTACCTGGGTGTATCCAAAGTTAATTTTGTAAAATTGACATGACTTACTTCTAAATTTATAATTTGGAAATAAGTTTTCATGACTAATAATACATTATATATTTAATGTATTTATTTTTAGTTTGTTATTTGGTATAGCTTATGCTATAACTAATCCAGCTATTTATCTATTAAGTTAGAAATATTTTTTTATCCAAGTAAGATTTTATCTATATGGAAAATAGATGTAATTAAAACATTGACGTAGATATCTTTCCAATGTTTTTTAATTTTTTTATTAGGTGTATTTGGTGAAACCAAACTACAAATTGCTAATAAGACAATTATGTTTATTACTTGTCAAGTTTAATGGCTTAATCTTGCTTTACTGTTTGACTTACACGTCTATCAGTCGCGTAAGCGGGGCATATGATCACAAGATGCAGAAAGGAAAGGTCTTGGATTTATGAAAAAGCTACGCTAGGGATGTTAGTCCTCCAATGTTTAAGTCTACTAATATTTATTATTGGGTTAATTAGACTTAAACTC\n>CP009129.1/1242075-1242156 Planococcus sp. PAMC 21323, complete genome. \nTCATTGCTGCAACCGCTCGAATCAGGTTACGTTAAGAAGATGCTTCGGCAGATCACCTGAATAGGCGAGTCTTAATCTAGAG\n>KM349742.1/1-304 Betacoronavirus HKU24 strain HKU24-R05005I, complete genome. 
\nGATAAAGTGTGAATCGCTTCCGTAGCATCGCACCCTCGATCTCTTGTTAGATCTAATCTAATCTAAACTTTATAAAAACACTAGGTCCCTGCTAGCCTATGCCTGAGGGTTTAGGCGTTGCATACTAGTGTCTTAGGAATTTGACTGATAACACTTCCCTGCTAACGGCGTGTTGCACTCTCAGTCTAAGCCTCCCACCCATAGGAGGTATCATGGCTAAGCGAGTCAACAAATACGGCCTCACGCTAAAATGGGCCCCAGAATTTCCGTGGATGTTTGAGGACACAGAGGAGAAGTTGGGTAA\n>MFFM01000046.1/175782-172748 Candidatus Edwardsbacteria bacterium GWF2_54_11 gwf2_scaffold_695, whole genome shotgun sequence. \nGGTCAAGCTACAAAGGGCACATGGTGGATGCCTTGGCAGATGAAGGCGATGAAGGGCGTGGTAAGCTGCGATAAGCTTCGGGGAGGTGCAAACAACCTTAGATCCGGAGATGCCCGAATGGGGGAACCCGTTCCGAGTCATATCGGAACACGCCGGGATGAAAACATTAGGAAGTAATCCTGGAGAGCTAACCTGGCGAACTGAAACATCTAAGTACCCAGTGGAAGAGAAATCAACCGAGATTCCCAAAGTAGCGGCGAGCGAAATGGGAAGAGTCTAAACTCGGTCCTGCGTGATAGCTGATACGCGTTGCAGGACGGGGGTATCAGGGTCGTTACGGATCCCGTGTATCAACCGGGGTCGGGGAGTCAAAAAGTCGTTCCTTAGCCGAAAGGTCTGGGAAGTCCTACCATAGACGGTGAAAGTCCGGTAGGCGAAAAGGAAGCGATCTCCCTGGTTGCGATTCCTAAGTACCATGGGGCACGAGAAACCCTGTGGGAATACGGGGGGACCACCCTCCAAGACTAAATACTCTCATCTGACCGATAGTGAACTAGTACCGTGAGGGAAAGGTGAAAAGCACCCCTGGCGGGGAGTGAAATAGTACCTGAAACCATGTGCCTACGATCAGTCGGAGCCTCGATTTATTCGGGGTGACGGCGTGCCTTTTGCATAATGAACCGGCGAGTTGCTTGTATGCAGCAAGGTTAAGTCCTTCTGGGACGTAGCCGAAGCGAAAGCGAGTCTGAATAGGGCGATTCAGTTGCATGCAGCAGACCCGAAACTGGGTGAGCTACCCATGGCCAGGCTGAAGTGACGGTAACACGTCATGGAGGGCCGAACCGGTGAATGTTGAAAAATTCTCGGATGAGCTGTGGGTAGGAGTGAAAGGCCAACCAAACCCAGGGATAGCTGGTTCTCCTCGAAATATATTTAGGTATAGCCTCGGAAAGTATGTGGCGGAGGTAGAGCACTGACAGGGCAAGGGACCTTACCAGGTTACCAACCCCTATCAAACTCCGAATGCCGTGCACAGGAATTCCGGGAGTCAGGCAGTGGGGGATAAGCTTCATTGCCGAGAGGGAAACAACCCAGATCGTCAGCTAAGGCCCCTAAATATCAGCTAAGTGAGAAAGGATGTGGAATCTCATAGACAACCAGGATGTTGGCTTAGAAGCAGCCACCATTTAAAGAGTGCGTAATAGCTCACTGGTCAAGTCATTCTGCGCCTACAATACACGGGACTATTAAGCTGATTGCCGAAGCTGCGGACTTGATTGATGTTCGCATCAGTCATTTGGTAGAGGAGCGTTCCACAGTAGGATGAAGCGGTGCCGTAAGACACCGTCGACGAGCTGGAAGTGAGAATGCCGGTATAAGTAGCGATAAACCAGGCGAGAAACCTGGTCACCGAAAACTCAAGGGTTCCTGGGGAAGGCTAATCCGCCCAGGGTAAGTCGGGCCCTAAGCCGAGGCCGAAAGGCGTAGGCGATGGAAATCCGGTTAATATTCCGGAACCACTGGTAAAGCGTTATCACCTAAGGGGGGACGCAGGAGTGAGA
TCCCATCCGCGATTGGAAGTGCGGGTCTAAGCTGGTAGGGGGATCCTGTAGGCAAATCCGCAGGGTCGTTAACCCCGAGAAGCGATGGGGAGTCCGTAAGGACATAAAAGGGATCGAATCACGCTGCCAAGAAAAGCCTCGTAGGGAGTTTTGCCGGTGTCCGTACCGTAAACCGACTCAGGTGAGTGAGAAGAGTATTCTAAGGTGCTCGAGATAACCTCCTTTAAGGAACTAGGCAATTTAGCCCCGTAACTTCGGAAGAAGGGGTCCCCGATTCTGTTAGGTAAATTCTTGCTGAAGCAGATTTGGGGCGCAGTAAATGGGCTCGAGTGACTGTTTATCACAAACACACGACTCTGCTAAGCCGATGAGGCGAAGTATAGGGTCTGACACCTGCCCGGTGCCGGAAGGTTAAGAGGAGAGGTCAGCCGCAAGGCGAAGCTTTGAATTGAAGCCCCGGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGTGTAACAACTTGAGCGCTGTCTCAAAGGAGGACTCGGCGAATTTGTAGTGGCGGTGAAGATGCCGCCTACCCGCAGATGGACTAAAAGACCCCGTGAACCTTTACTGTAGCCTGGCATTGAATTTTGGTAAGGCATGTGTAGGATAGGTGGGAGACACTGAAGCTGGGGCGCTAGCCTCGGTGGAGTCGACGTTGAAATACCACCCTTGTGTTATTGGAATTCTAACCTAAATCAGTGAATCCTGGTTGGGAACCGTGTCAGGTGGGCAGTTTGACTGGGGCGGTCGCCTCCTAAAGAGTAACGGAGGCGCGCAAAGGTTTCCTCAGCGCGGTCGGTAATCGCGCTTATAGAGTGTAAAGGCATAAGGAAGCCTGACTGTGAGGGAGACATTCCGAACAGACACGAAAGTGGGCCTTAGTGATCCGGTGGCTACACGTGGAAGCACCATCGCTCAACGGACAAAAGGTACTCCGGGGATAACAGGCTGATCTTGCCCGAGAGTTCACATCGACGGCGAGGTTTGGCACCTCGATGTCGGCTCATCGCATCCTGGGGCTGGAGAAGGTCCCAAGGGTTGGGCTGTTCGCCCATTAAAGCGGTACGCGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCTCTATCCTCTGTGGGTGTAGGAGATTTGCGAGGATCTGTCCTTAGTACGAGAGGACCAGGATGGACAAACCTCTAGTGTACCAGTTGTTCCGCCAGGAGCAATGGCTGGGTAGCTATGTTTGGTCGGGATAACCGCTGAAAGCATCTAAGTGGGAAACCCACCTCAAAACTAGATCTCCCTTCCTGTTTATTCAGGACTGAAGGCTCCCTGTAGACTACAGGGTTGATAGGCCACCGGTGTAAGATCCGTAAGGATTTCAGCCAAGTGGTACTAAATTGGCCGTGCGGCTTGATCAT\n>CM001436.1/1586328-1586399 Methanoplanus limicola DSM 2279 chromosome, whole genome shotgun sequence. 
\nGTCCCGATAGGGTAGTGGATATCCTAGAAGCTTGCGGAGCTTTTGACCCGGGTTCGAGTCCCGGTCGGGGCG\n>HG764817.1/91383-91181 Clostridium ultunense Esp genomic scaffold, CULT_3033 \nAACTTCATATCTCTTTTAGGTCACTTAGTTGACTCGCTAAGTGTTAATAGGGAAGTCCGGTGGAAATCCGGCGCGGTCCCGCCACTGTAAGCAGGGAGAGACGTTTAGGCCGAAAGGCAGCCACTGTGTACCGTCGTGCATGGGAAGGTGAACGAATCGAGGAACTGCAAGCCAGGAGACCTGCCTAAAAGAACGGCAAGTTC\n>FOGW01000010.1/58334-58502 Lachnobacterium bovis strain S1b genome assembly, contig: IE07DRAFT_scaffold00007.7 \nTAAAGAGATAGAGGTTGCGCAAGTCAAAAGTACTTTGCTAGATGAAGCAAATCAGATGACAGTAGAGGAAAGGGGCAAGCGCCGAAAGGGTTATTTTTGCAGAATAATTCTTGGGCATAAAGTTAATAGCTTTATGACTGTCATCGTAAGATGGAGTGCTATCATATAA\n>FR883370.1/19793-19582 Clostridium sp. CAG:221 genomic scaffold, scf18 \nTATTGAAGGAATTAGTATGGTGCTTTTAGTTTATAAATATAAATAGGCAAAAGTTAAAAGGGAATGTGATGAAATTTCACAACAGCCCCCACTACTGTGATAGAGGATGAAAGCTAAAATTATAAATTCCATTGAGAGATTTTCTTGAGAAGGAGTTTAGTGAGTAAAGAGATTCTTAAGTCAGGAAACCTGCCATAACTTTAATAGTGTTT\n>CP013068.1/4601278-4601164 Pannonibacter phragmitetus strain 31801, complete genome. \nATACCCTACGGAGCGCCTGGGTCCGCCGCATCTCCTGGGTCCGTGGGGCAAGGCCGGCGCGGTGTCTGCCCGATGAGTGGCCTCCTCGGATTGGCAGTCCCGCGCCGGCCGCCAC\n>AOCG01000006.1/51721-51599 Listeria aquatica FSL S10-1188 c5, whole genome shotgun sequence. \nAGATCCTTTAAATGTAGTCCAGAGAGGCTGAAAAGGTTAACGCTCATTTTGGAGAAGGTTCTCCATTTTAATTCGTGAGGTACGTCTATACCCTTTGCCGCTTTGGCAAAGGTTTTTTTTGTA\n>AQHR01000110.1/102878-102980 Lunatimonas lonarensis strain AK24 S14_contig_28, whole genome shotgun sequence. \nTGCCCATCGGGTGATGGGGTGCCACCCAAATATCAGGGACTTATCCGAAGTTTTCTGATTTTTTGAACCGCTTCGCAAGAATGCTGATGACTCCTACTTCAAC\n>FXAQ01000027.1/27875-27818 Paracoccus sp. 
J56 genome assembly, contig: M511DRAFT_scaffold00027.27 \nCATGGAGCAGGGTGAAATTTCCGGCTGGGTTTTCCGGCCGCCTGTCCGCCGGACAACC\n>HF986872.1/13619-13817 Firmicutes bacterium CAG:555 genomic scaffold, scf18 \nCAAAACCGATAGGTATTCGGCTCTGGGCCAGCTCGATTAAAAGGGAATCCGGTTCGAGTCCGGAACAGCCGCCATTACTGTATTTGACACAACGGGAGTCCATTTTGCCATTGGTGCGGCCTGTCCTTCGGCGGGCGCATCGAGAAGGCGGGCTTTCCGGTCATAAGTCAGGAGACCTGCCGTGCTTTTTAGGTTTACA\n>CM009307.1/3068679-3068534 Populus trichocarpa isolate Nisqually-1 chromosome 18, whole genome shotgun sequence. \nTTCAAAAGCTATTGGGTGTGACTGAGCAGCCGGATCCAACACTATTGGATCTTGTCATGTAGACCCTAAGCGATTGGGTTTTGTTGGGCAGCAGATTCCAATGTTGTTGAATCCTGCCAAGCTAGACTTAATAACACTTTTTGACT\n>JSDP01000122.1/5559-5705 Aphanizomenon flos-aquae 2012/KM/D3 spades_262_len_T:9526, whole genome shotgun sequence. \nCACTCTCTACAGTCAGAGTTGATAGGAGGGATTCTATCAAGCGTACACCAGAGAGTCCAAACTCAAACCCAGTGATGTGGGTGACTATATCCAAATATAAAACCGAGCCAGTTAGCTTGGTAGGGAAACCGAAGACTTAACTGGCTC\n>AYZS02017825.1/46586-46515 Beta vulgaris subsp. vulgaris Bvchr6.sca027.con0066.1, whole genome shotgun sequence. 
\nGTCTCTTCAAAGACATCTGATAAAATTGGAACGATATAGAGAAGATTAGAATGGCCCCTGCACAAGGATGAC\n>CCCW010005528.1/2486-80 Brassica napus, WGS project CCCW01000000 data, contig: 38660 \nCGGCCAAAATCACCCAAACAGTCCACGGGAAGGGCCAGCGTGCTGAGTCCAAGGACCAACGTGCTGATATGTGTACTGATGGACAGCCACTGACATCCTGTGTGTGCTGACGGACACACACGGACACACACAAACAGCCACGGACGTCCTGTGTGTGCTGACGGACACACATGGACGTCGTGTGTGTGCTGACGGACACCCACGGACGTTGTGGCTGCTTTGATAGCTGGAGCTCGGAAACGAGTTCTATCGGGTAAAGTCAATGATTAGAGGCATCGGGATGCAATTTCCTTGACCTATTCTCAAACTTTAAATAGGTAGGACGGGGTGGCTGCTTTGTTGAGCCATCCCACGGAATCGAGAGCTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCCATGCGGGATGAACCGAAAGCCGGGTTATGGTGCCCAACTGCTCGCTAACCTAGAACCCACAAAGGGTGTTGTTGATTAAGACAGCAGGACGGTGGTCATGGAAGTCGAAATCTGCTAAGGAGTGTGTAACAGCTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTAAAGCGCGCGACCTATACCCGGCCGTCGGAGCAAGAGCCAGGCCTCGATGAGAAGGAGGGCACGGCGGTCGCTGCAAAACCTAGGGCGTGAGCCCGGGTGGAGCAGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGGCCGAAGAGGGGAAAGGTTCTATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGAGTCGAGGGAAACCTGTCTGATTGCGCTTATGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCAGAACCGGGACGTGGCGGTTGACGGCTACGTTAGGAAGTCCAGAGACGTCGGCGGGAATTCCGGAAAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCATGGAAAGGGCTCAGCCGGAGGTAGGGTCCAGCGGCTGGAAGAGCACCGTACGTTGCGTGTTGTCCGGTGCATTCCCGGCGGCCCTTGAAAATCCGGAGGACTGAGTGCCGCTCACGCTCGGTCGTACTCATAACCGCATCAGGTCTCCAAGGTGAACAGCCTCTTGTCGATGGAACAATGTAGGCAAGAGAAGTCGGTAAAATGGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGGCTGGGCTCGGGGGTCCCAGTTCCGAACACGTTGACTGTTGGCGGGCTGCTTGAGCTGCTAACGTGGCGAGAGCGGACCGCCTCGTGTTGGCCGAGGGATGGACTGGGAACGGCTCTTTCGAGATCTTTCCCCGGGCGTCGAACAGCCAACTCAGAACTGGTACGGACAATGGTAATCCGATTGTTTAATTAAAACAAAGCATTGTGATGGTCCCTGCGGATGCTAACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGAGTAACTATGAATCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCACATGAATGGACTAACGAGATTCCCACTGTCCTTGTCTACTATCCAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAAGTGTAGAATAAGTGGGAGCTCCGACGCAAGTGAAATACCACTACTTTTAACGTTATTTTACTTACTCCGTGAATCAGAGGCGGGGTAACAACCCCTTCTTTTAGACCCAAGACTCGCTTTGGCGGGTCAATCCGGGC
GGAGGACATTGTCAGGTGGGGAGTTTGGCTGGGGTGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGCTCGTTTGATTCTGATTTTCAGTACGAATACGAACTGTGAAAGCATGGCCTATCGATCCTTTAGACCTTTGGAATTTGAAGCTAGAGGTGTCAAAAAATTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGTGTTCATAGCGACGTTGCTTTTTGATCCTTCAATATCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTTGATTGTTCACCCACCAATAGGAAACGTGAGCTGGGTTTAGACCGTCGTGAGACACGTTAGTTTCACCCTACTGATGCCCGCGTCGCAATAGTAATTCAACCTAGTACAAGAGGAACCGTTGATTCGCACAATTGGTCATCGCACTTGGTTGAAAAGCCAGTGGCGCGAAGCTACTGTGCGCTGGATTATGACTGAACGCCTCTAAGTCAGAATCTAGGCTAGAAGCAACGCATGCGCCCGC\n>ALAR01193061.1/17763-17860 Tupaia chinensis contig193061, whole genome shotgun sequence. \nATCCTTGGGTGGTTTATGAGTGTGATGGTTGGGCGTTCACACCATGTGTGAGATGAGTTCCTGAGCCTTGTTATGATGTGGCGCTGTCACGTCTGATG\n>AAIZ01015480.1/2116-801 Drosophila persimilis strain MSH-3 cont1.015479, whole genome shotgun sequence. \nAGTCGGGCTTGATTGGGAACAATAACATGGTTTATGTGCTCGTTCTGGGTAAATAGAGTTTCTATCATTTATGGTAGTTACTTGTTCCCCGGATAGTTTAGTTACGTAGCCAATTGTGGAACTTTCTTGCTAAAATTTTTAAGAATACTAATTATGTTAAACCAGTTAGTTCTTATTAATTATAACGATTATTAATTAACAATCAATTCAGAACTGGCACGGACTTGGGTAATCCGACTGTCTAATTAAAACAAAGCATTGTGACACAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAAGTAAGCGCGGGTCAACGGCGGGAGTAACTATGACTCTCTTACGTGAAGCGGAACTTTTTCGTCCCCAACACGGCTGGGTGTGTCAGCCCACGCGTTTGCTAACAGGTCAAGATTACCGAAACGGTATCAAGCTGCGAATAAATGTCCTACCATCGAGGTCTCGTACCACGAGGGGCAGAAATGAATTGGAACGGCAATGTCGTGCAGGTTGTGATGCTCCCGAAACAACAAACCACATCCTGCAAAATTGTTACCGTACGCATGGGAGGCGGGTAGCAGGACATAACTGTGTAGTCAATAACCTTCAGAGGATTCTTGAGGAGAAGGGCCACACAGTGCACGTCGAACCAAGTTTGCAGCTGGAAACCTCGGTAAGTAAACCAGACCTGGTGTGTATCCGTGACAATCACGCTTGCGTGATTGATGCGCAGATTATAACAGATGGACTGTTTCTCGACGATGTGCACCATCGCAAAGTTGAGAAATATAAAAGACCTGAAGATATTTCTGCACTGCGGAGAGAATTCGGAGTGTCGGGCAACGTTGAAGTCCTAAACGCGACGTTAAACTGGCGTGGGATCTGGAGCAATCAATCCGTTAGAAAATTGATAGCAAAGGGTCTCATCTCATCCGGTGACAGCAATGTCATCAGCGCCAGAGTGGTAACAGGCGGACTATATTGCTTCAGACAGTTCATGTATCTCGCAGGTTACACGCGAGATTGGACTTAGCCTATACACTATGTTGGAGAGAAGACGCTTGCTACCTAGGCATAATGTGAAATTAGGTATAAACATCGTGGTTGTAAAACTT
GAGGTGGGTTTTTAGTACGTATGCGTGATTACTTCGTAATCATGAATCGTGCATGCTAGTGGGGTTTGGCCTCCACTACTATCTTTGAAGATTTTCCTTCCTCAGCGATAAAAAAAAAAAAAAAAAATAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAATGAGATTCCTACT\n>CP014135.1/3524579-3524757 Pseudomonas agarici strain NCPPB 2472 genome. \nACCCCGGTATTATTGCTGTCATGGGTTTTAATCGAGCTTAGCCTTGTTCATTTTTTTACACAACACCCCATAAAAGATCCTACACGGCCCGCTCAAGCCTGCAGGACCCAAAGAGACGCAGAGGCAAAAAACGCCCAAAAACGCCTGAAAAAAGGCTCTGCGGTGCTTTCTCAGCACAA\n>AFFG02002037.1/1014-1 Drosophila ficusphila Contig2037, whole genome shotgun sequence \nAGATCAGAAGAGATTTTAGATAGATCTCGCTCCTCAGCAAGGGGGAGTGTTTGCCCGACAAGCACACACTCGAATTGCTACCGGGATAGTTGCTACGTACATAGCTGTAGCTTCTATTTTGGGGCGTTGGTCTGGCGCTTAATCTAGACACATGCACTATATACATGGGTATATAAGAGTGTCGTGGCTGTACTCCCTTCAATGTGGAACACGCCACGTTAAATAAAACTCGGAGGGATCCGATCCACACCTGTCCCTATCTACTATCTAGCGAAACCACAGCCAAGGGAACGGGCTTGGAATAATTAGCGGGGAAAGAAGACCCTTTTGAGCTTGACTCTAATCTGGCAGTGTAAGGAGACATAAGAGGTGTAGAATAAGTGGGAGATATTAGGCTTCGGTTTGATATCGCCAATGAAATACCACTACTCTTATTGTTTCCTTACTTACTTGATTAAATGGAACGTGTATCATTCCTAGCCATTATACGGATATATTTATTATATCTTATGGTATTGGGTTTTGATGCAAGCTTCTTGATCAAAGTATCACGAGTTTGTTATATAATCGCAAACTAAATCTTTAATAAAACGATGCATTTATGTATTTTTGATTTGAAAATTTGGTATAACTCCAATTACTCAGGTATGATCCAATTCAAGGACATTGCCAGGTAGGGAGTTTGACTGGGGCGGTACATCTCTCAAATAATAACGGAGGTGTCCCAAGGCCAGCTCAGTGCGGACAGAAACCACACATAGAGCAAAAGGGCAAATGCTGACTTGATCTCGGTGTTCAGTACACACAGGGACAGCAAAAGCTCGGCCTATCGATCCTTTTGGTTTAAAGAGTTTTTAACAAGAGGTGTCAGAAAAGTTACCATAGGGATAACTGGCTTGTGGCGGCCAAGCGTTCATAGCGACGTCGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAAAATTCACCAAGCGTTGGATTGTTCACCCATGCAAGGGAACGT\n>URS0001A23A8E_12908/1-67 unclassified sequences L31-Actinobacteria ribosomal protein leader \nGCGGUUCCGGUUCACGCCACCAAGGGUCGGCCCGCCCCAUGACGGGUGACCUGGCGACCCGGCGACC\n>URS0000D6C5EB_12908/1-87 unclassified sequences GA-cis RNA \nGACAGGCGAAATATAACAGCTCGAAGAGCTGTATTGTAATACATTTCGCCGCACAGCCGCCGAACGAAGTGAGGGGCAATACCGCTG\n>MEDQ01000009.1/7811-8223 Bordetella sp. SCN 67-23 ABS43_C0009, whole genome shotgun sequence. 
\nAGAGCAGATCAGGCAGTCGCGGTGCCTTCGGGCATCGAGGAAGGTCCGGACTCCACAGGACAGGATGGCGGCTAACGGCCGTCCGGCGATCGCTGGGGCGCAAGCCCGGGCGCGAAGCCGAGGAATAGGGCCACAGAGACGAGTCTGCGGCGAGGGCGGACGATGTTCGCACCGGTACGGCCACTCCGTACCGTTCGCACGGGCAACCGTGCGAGTCGCGGCAGGGTGAAACGCGGCAACCTCCATCCGGAGCAACACCAAATAGGCATGCGCGCGGCTTCGGCCGCAATAGGGCGGTCCGCCCGAGCATGCGGGTAGGTGGCTAGAGCCGTCCGGCAACGGCCGGCCCAGAGGAATGACTGCCCGCGGGCGACGCCCGTGTACAGAATCCGGCCTATCGATCTGCTTTGCCT\n>URS0000D69D6E_12908/1-58 unclassified sequences RAGATH-30 RNA \nGTAAAAATAAGATTTTGCCGAATATATTCATATAGATGAATCTGTTATGAAACAGAAA\n>JH835302.1/8483619-8483740 Erinaceus europaeus unplaced genomic scaffold scaffold00014, whole genome shotgun sequence \nAAGACAGAGAAATAGAGAACATTAAAAACTAATCTGTATTTTTTGTAACTGGCGATAGCAATGCCATATTACAAGCCTTAATGACATTGGGGTCTTTAAGGTCCCTGAAAGTGGCTATATGA\n>URS0001A239EB_186490/1-52 Candidatus Baumannia cicadellinicola L31-Gammaproteobacteria ribosomal protein leader \nCGUGUGGCUUAUAGUUAAAAUCGUCGAUAGCGACACAAUCUGACGAAUAGGU\n>JH417673.1/4548-4310 Flavonifractor plautii ATCC 29863 genomic scaffold Scfld77, whole genome shotgun sequence. \nTTAAACGCAATGAGGGAGAAGAGTACTGCGGGGACTCAGTCCCAGCGAGCGGGGGATGGTGAAAGCCCCGCACAGGAGGCCGCGGGAAGAACGCTCCGGAGCGGAAACCCGAACGCACCGCGCCAGTAGGGGGAACGGGCTGCGACCGTTACATCGCGCCGACTTGTCAGAGCCGGAAAAGGGGCCGCCGTCCGGCGGCAAATTAGGTGGCACCGCGGAGCGCAGCATTCGTCCTAATC\n>MHBP01000260.1/25988-25933 Lentisphaerae bacterium RIFOXYB12_FULL_65_16 rifoxyb3_full_scaffold_468, whole genome shotgun sequence. \nGGGTGTAACGGCACGGGGGTTCGTTACAGGCGCTCTGGGTGGTCGGGCCGCCATCC\n>URS0000D65EAA_12908/1-173 unclassified sequences malK-I RNA \nTCCAACCCCCGCGTCTTACTCCACCTATGTAATCCACGGGGGAAATAAAGAAGGAGGAAAGTTTTTCCGCCTGACCGGCGGTGCGGCAGTGTGGAGACCTGTCGTAAGGCAGCGTGGCGGCTGCGAGGCTCCGTTTCGCGGAGGCGGCGGGGCTACGGTCAAGCATTATGGCA\n>CAJW010157214.1/4791-4634 Hordeum vulgare subsp. 
vulgare, WGS project CAJW01000000 data, contig: morex_contig_157214 \nAAGGAGAAGTGTGATAAGCTTTGAATGGAAGCCCCGGTAAACGGCGGCAGTAACTCTAACTGTCCTAAGGTAGCGAAATTCCTTGTCGCATAAGTAGCGACCTGCACGAATGGTGTAACGACTGCCCCGCTGTCTCCGACATGGACCCGGTGTCGTTT\n>CH966573.1/1-1154 Drosophila willistoni strain TSC#14030-0811.24 scf2_1100000007260 genomic scaffold, whole genome shotgun sequence. \nGAAGTATTTAGGTATCCGGTTCGCTGTGGATGGGCGGGCTCGGTATAGTCCAGCAGACGACCTCGGTCCGAAGCTGTTAAGATTAATAAGAGCCCCTCTGAAACCACAACAGAAGTTATTTGCACTTAGGACTGTCCTTATCCCACAACTCTATCACCAACTAACACTTGGGAATTTGATGATAGGCGTCCTAAGAAAATGTGACAGATTGGTACGGCAATTCGTAAGGAGATGGTTAGATCTCCCACTGGATGTACCAGTTGCGTACTTTCACGCCTTCCACACTTGTGGGGGTCTCGGGATTCCGTCAATTAGATGGATGGCACCGATGCTGCGTCTGACGCGATTGAGCATGATTAAATGGCCCCACCTCGAACAACCCGAGGTAGCTAGCTCTTACATTGACGACGAATTGCAAAGGGCTTGAGATAGATTAAAGGCGGAAAATGTGCAGTTGTGTTCGCGTCCAGGCAAACATTGCCAGGTAGGGATCGGCCTATCGATCCTTTTGGTTTAAAGAGTTTTTAACAAGAGGTGTCAGAAAAGTTACCATAGGGATAACTGGCTTGTGGCGGCCAAGCGTTCATAGCGACGTCGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAAAATTCACCAAGCGTTGGATTCTTCACCCATGCAAGGGAACGTAAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTAATGACAAAACGTTGTTGCGACAGCATTCCTGCGTAGTACGATAGGAACCGCAGGTACGGACCAATGGCACAATACTTGTTCGAGCGAACAGTGGTATGACGCTACGTCCGTTGGATTATGCCTGAACGCCTCTAAGGTCGTATCCGTGCTGGACTGCAATGATAAATAAGGGGCAATTTGCATTGTATGGCTTCTAAACCATTAAAAGTTTATTTTATAAACGACAATGGATGTGATGCCAATGTTATTTGTAACATAGTAAATTGGGAGGATCTTCGATCACCTGATGCCGCGCTAGTTACTTATTAAGACATTATTTAATACAATGACAAAGCCTAGAATCAATTGTAAACGACTTTTGTAACAGGCAAGTGTTGTAAGTGGTTGAGTAGCTGCCATACTGCGATCCACTGAAGCTTATCTT\n>JXUM01182853.1/1550-1 Aedes albopictus isolate Foshan contig182853, whole genome shotgun sequence. 
\nACTGGAGAGTTCGTTATCTGCCGTAACCGGTCGCTGGTTCAAGTTCAACTAGAATGTGGCTTTTACTCCCAGAGAGGGTGATAGGCCCGTAGAGCGGAGCACCGATGGTAGAAGATCTTTCCATGGAGTCGTGTTGCTTGATAGTGCAGCACAAAGTGGGAGGTAAACTCCTTCTAAAGCTAAATATCACCACGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGTTGAAAAGCACTCTGAATAGAGAGTCAAAAAGTACGTGAAACTGCCTAGGGCTCAAGCCCGTTGAACTCGATTATCCGAGCGGAGACATTCACCTGCGGTTGGCCGGCGACGGCACGGCCGCAGGGCACTTGTCTCTCGCACTAGCCAAGAGGACACTGCGATCCATTACGAAACAGCTTTCGCGCCGCAAGGCGCAAGGTCGCCCGACAACTGCCCCTGGTGCTGGTTGCTTGCCCCACAGTAGCGACGCTCAGTTCTGAAGGCCTGTGCCGCGAGGTGGGGCTTACTGCACGTGGTGTTTTGCAGTCGGGCGCGTGATGGATTCCCCCGGACACCGGGTGGTCTTCCCGTAAGGGGCCACCGGACTGTCGATCGGCAGTGAAAGAATCGAGGTACCTTCGGGACCCGTCTTGAAACACGGACCAAGAAGTCTATCTTGCGCGCGAGCCAATGGTCGTCCTCCGGAGCACCAAAGGCGCAGAAAACATAACTTGAGTTGTGCGGGATTACGGGCGCGGCTCTCTGCTCGTCCCTCCATCCCCGGGTGTTGTAATCGGCATGCGGCTACCGGGACCCAGGCTTCACGGCCCCCGGCACCGTGCCACAACATACCGTGAGTGTGCAGGATGTGACCCGAAAGATGGTGAACTATGCCTGATCAGGTTGAAGTCAGGGGAAACCCTGATGGAGGACCGAAGCAGTTCTGACGTGCAAATCGATTGTCAGAATTGGGCATAGGGGCGAAAGACCAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGAGCACGCAACGTTTCGAATGCTATTCTTATCTGGTAAAGCGAATGATTAGAGGCCTTAGGTTCGAAATGATCTTAACCTATTCTCAAACTATAAATGGGTACGTACCATAGCATTCTTGCATGATGCTGTTGCAAACGTTGGTAAACGCCGGGCCGTCCCCTGTCAGGGCGTGCCACGGCGTAGAAGATATCTGTGTGCTTAGTGGGCCAAGTTTTGGTAAGCAGAACTGGTGCTGTGGGATGAACCAAACGTAATGTTACGGCGCCTAAATAAACGACGCATCATAGATACCATGAAAGGTGTTGATTGCTACAGACAGCAGGACGGTGGACATGGAAGTTGTCATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAAGCAATTAGCCCTTAAAATGGATGGCGCTTAAGTCGTTTGCCTATACATTACCGCTGGCGCACAAGTGGGGCAGCGCCCCTGTAGCGCGTCTGCCCTTTGAGGCGCCAGCGAGTAGGAGGGTCTGGTGGTGTGCGTTGA\n>CP009227.1/527376-527281 Treponema sp. OMZ 838, complete genome. 
\nGGCGGCATGGATGCCGCTCGTATTAAGCAGAAGCAAGTTTGACACCGGTCAAACTTGTGTTCAGCGAAGTACATGGATGTGCTTCGCTGAACGAGT\n>FQVI01000001.1/71074-70885 Lactonifactor longoviformis DSM 17459 genome assembly, contig: EJ64DRAFT_scaffold00001.1 \nAAAAAGAATAAACGGTATGGTCTGTGCTCAGCAATGAGTCAGTTTACAGGGAATCCGGTGAGAATCCGGAACAGCCTTTCTCTACTGTGTGAGGGACGAAAGCAGCGTAAAACCACTGGAACTATCCGGGAAGGTGCTGCTGGTAGGAAGAACTCAAGTCAGGATATCTGGCATACTGCGTGAAAAAAGC\n>MTEJ01000117.1/16469-16381 Thiothrix lacustris isolate A8 Ga0073116_1117, whole genome shotgun sequence. \nATCGGGTTAAATAAACGACTGACTAAACATGTAGTAGCCTTCAGATGGAGGGTTTGCGGACGCGGGTTCAATTCCCGCCGCCTCCACCA\n>LJIY01000004.1/279997-280249 Psychrobacillus sp. FJAT-21963 super7, whole genome shotgun sequence. \nACATCAAATTTTGAAGGGACGATGGGTGGCCGATGAAGTTTTAATCTTATTTCTCAGTAGAAGTTTTTCTGCGATATATTTGCGCAGTAACAAAATAAAACTTTACGAAACCGGAAATAGGATTAGTCTGCCCATTTTTCAAAATTACTGCAAATAATTCTCTACAATACGCTAACGCTTTGTAGTGGTTTTTTGCATATTCATTTAATGGTCAGTATGTAATCCTACCGTTTAATATCGGAGGGATTTTTTT\n>CP011058.1/4424379-4424646 Paenibacillus beijingensis strain DSM 24997, complete genome. 
\nGCTATCGCTATGACGGGCACAAGTAGTACTGCGAACGACGCTTTCAGAGAACCGGTGGACGGTGCGAACCGGTACGCGGCGCAGCATGAATTACCGCCTTGAGCTGAACGGGGGAAAGCGGGCCGGTCCCACTGGGGGCAGTGTCCGGCCGGTAGCCCGTTTCCGGAAGCATCCGCTTCCGTTATCAATAATGAAGTGAGAGCCTAATCTGCCCCGGCAGCGGCTCTAACGAGGGTGGTACCGCGAGCAAATCCTTCTCGTCCCTTGA\n>LL009840.1/12805-13384 Trichobilharzia regenti genome assembly, scaffold: TRE_scaffold0009840 \nCTCCTGGAAAAACCAATATCCAGCCAATGCTTGTGTCAGAGATTAAGTCGTGCATGTCTAAGTACATACCTTAAAACGGTGAAACAGCAAATCGCTGATTAAATCAGCTATGGTTGCTTAGACCACATATGCACTACATGGATAACTGTAGTAATTCTAGAGCTAATAAATGAAGTTATGCCCTGACCCGCAAATCAACAGAAAATTTATTAATACAGAACCAACCGCGGGTGGGGGGGGTAGTTTCGCCTGGATAGCTTTAATGTGATCGCGATCGGCCTTCCATTGGCGATGGATCTTATCGTAGAAGGAAACAACACAGAGATTCTGTTTCACCGATCAATTTAGAAGGTTAAACAACATTGGAATAAACACAGGAGTCAGACAATGGTGCTTATTATCACCAATTATACTTCATTCACTTACTTATCTAGGGAGCATTGTCTCAACTACAGGAAGTCGGAGAGGACGAGGATGTCAAATCGAGCTAGAATCGGGAAGGCAGGCGAGAAACATATTCATCAACCTGAAACAACCAATCTGGAAATATTCGTCACTCAGCCAGAATCAACAACAAAAT\n>JRRC01447532.1/91-1 Gossypium arboreum cultivar AKA8401 contig_57480_1, whole genome shotgun sequence. \nGCTGTCTACGAGTCGGTTTGTTTGGGAATGCAGCCCTAATCGGGCGGTAAATTCCGTCCAAGGCTAAATACGGGCGAGAGACCGATAGCGA\n>GG692400.1/806114-806247 Candida tropicalis MYA-3404 genomic scaffold supercont3.6, whole genome shotgun sequence. \nGCCCCCTTGGTGCAGCCGGTAGCATGAACGATTCCGGTTCGACTCCTGTTTCGAAGCTTTAAAATACTTTAAAGGTTTTTGAAAGGAGAATTGGAACTAGCGTTTGGTCGCGGGTTCAAGTCCCGCAGGGGGCT\n>FOVK01000004.1/141686-141486 Proteiniclasticum ruminis strain ML2 genome assembly, contig: Ga0073291_104 \nATATAAACGATGAAAAGAACCAGTATGGAAGTCCTGCCTTCATAGAGAGAGGGGATTGGTGAAAGCCCTCAAGGAAAGTTTCCAGAACCTGTCTTGGAGTTTCTCAACCATTTGAGCGGGGAAAGCCGTTATACTTTAGAGTGGATACGTTAGGAGAAGTATCAATAAGGGTGGTACCGCCGAAGAGATTTGGCCCCTTTT\n>LAKY01000004.1/16245-16356 Clostridiales bacterium PH28_bin88 ph28_547, whole genome shotgun sequence. 
\nTGATCCTTTAAGCCGGTCCCGCGAGGCCGGTAAGGAGCTACGGTCAGGGTATGCCCGTGTAGACGTGGGATATCAAGGCCTCCTTGCCGCTGGGACAAGGAGGCCTTTTGTT\n>CM000878.1/138264228-138264130 Callithrix jacchus chromosome X, whole genome shotgun sequence \nCTGCCTCGAAGTCTGNNNNNNNNNNGCAATGGCTGCAAACAGCAGCTTCCTTGGTAGTGTTCTTTGTATGGGTTGCTCTAAGGGACCTTGGAGACAGGC\n>FAOM01307123.1/40010-39638 Triticum aestivum genome assembly, contig: Triticum_aestivum_CS42_TGACv1_scaffold_307123_4AS \nTTTTGCAGTTTGCGAGAAAGTTGAAAGTAAAGGGAGAACAACATATAATGAGGTTAGTGCTTTATTAGTTTTTAGCTCAAAATTCCTGTTGTTATTTTTTCATCATTTGTGTGGGCTGCATGCGTTTTGCCATATATTAACCAGAAACCAGGCTGCAACTCGCCTGCATGAAGCAGGAATCGCTAGTAATCGCCGGTCAGCCATACGGCGGTGAATCCGTTCCCGGGCCTTGTACACACCGCCTGTCACACTATAGGAGCTGGCCATGTTTGAAGTCATTACCCTTAACCGTAAGGAGGGGGATGCCTAAGGCTAGGCTTGCGACTGGAGTGAAGTGGCCATAGTTTGATATGTGACCCTATTCCTTCGCATA\n>JMFQ01059681.1/962-834 Aptenodytes forsteri contig59681, whole genome shotgun sequence. \nTAGGCCCTGAATGAAGACCACCGGTTTGCTGTAGCCGTTGGTTTCAAGCAGGAGCCCAAAGGAAACGTCTCCCGGTCTGTGGGCGCTCCCATCCCTGTGGAACGGCCAATTCGTGTGGGAGCGACACTA\n>LFJN01000024.1/399316-399149 Phialophora attae strain CBS 131958 Contig24, whole genome shotgun sequence. \nGGTGAGATGGCCGAGTGGTTATGGCGCTAGTTTCAGGAATACCTGGAGCCTTCGCTTTCTGGTTGAAAGTACTAGTGGGTGTACGTAAAACCATCCTACAGTACCCTCAAGAGCACTACTGACAATTTCCTTTAGAAAACCGCGTGGGTTCGAGTCCCACTCTCATCA\n>AFSB01069799.1/15973-16145 Heterocephalus glaber contig69799, whole genome shotgun sequence. \nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGTAATAGTAGCTGCCGTGATTCTGTTAATACAAGTTAGATTGTTTCTTTTCTCTGCTTAAAACCCTCCAATGGCTTCCCATGTCTCTTAGCAAAGCCAAAATTTCTCAAGACTTATGACGTGTGAGTGATTCTGAACCTCT\n>GL378325.1/524376-524459 Volvox carteri f. nagariensis unplaced genomic scaffold VOLCAscaffold_4, whole genome shotgun sequence. \nGAGGTGTGATGATTTGAAACTTTTGGTCCGTGTTTCTGAGTGCCTAGCGCACCTCTGACGACTACAGTTTCTTCGTCTGACCTC\n>GG749280.1/539059-538827 Selenomonas noxia ATCC 43541 genomic scaffold SCAFFOLD3, whole genome shotgun sequence. 
\nTCATATTGAATTGGATCAAGTGCAGGGGTTTTGACATCATCAAAGCCTCAATGCTTCATAGGGAATCCGGTATAGGAATCATTGATTTCATAAGCCGGAGCGGTCACGCCACTGTAACAGGGAGTGATTCCGCACGCCAATTGAGTTGGCAGTCACTGGAGAGCGATCTCTGGGAAGATGCGGAAGAACGATGAACTGGAGCCAGGAGACCTGCTTGATTAACAATCACCGAT\n>GL988045.1/3052953-3052577 Chaetomium thermophilum var. thermophilum DSM 1495 unplaced genomic scaffold scf7180000011820, whole genome shotgun sequence. \nTCCTCTTCAACGCTGCGTTTCTATGCCACAAACGGAGAGCGCTTGCGCAAGCAGCGCTTTCAAATCCATCTTTCTCTGGCATATGAGAAATTCGGAGAATCGGCTTCACTCTTGGTTTGTCCATTCCTCACTCTCGGGTGTTGGATGGGTTACGAGCTCTGCCGGTGACGGCTTGGCGCGAATTCGCGTCTGTAATTGGCATCAGAAAAGCAGGGCTTAGAGGCCAACCTTGTGCTTTTGCGAGGGGAATTGGTCATCTAGGTTCCTCTGGGAGGGCCGTTACGAAGCTTGTGAGCAATCACTTGAGTGCAATACGCAGCGTGTGGCCTGCCTTCTGGGCAGATCACACAATTCGATTCCGATTATCCTGTTGAGGA\n>CM002820.1/173650899-173648878 Capsicum annuum cultivar Zunla-1 chromosome 9, whole genome shotgun sequence \nAGGCTTACGGTGGATACCTAGGCACCTAGAGATGAGGAAAGGCATAGTAATCGATGAAATGCTTCGGGGAGTTGAAAATAAGCATAGATCCGGAGATTCTCGAATAGGGCAAACTTTCAAACTGCTGCTGAATCCATGCGCAGGCCAGAGACAACCTGGCGAACTGAAACATCTTAGTAGCCAGAGGAAAAGAAAGCAAAAATGATTCCCGTAGTAGCGGCGAGCGAAATGGGAGCAGCCTAAATCGTGAAAACGGGGTTGTGGGAGAGCAATACAAGAGTCGTGTTGCTAGGCGAAACAACCTGAATGCTGGCGAAAAACCAGTAGCCAAAAGCATTACTAGCTTACGCTCTGACCCGAGTAGCATGGGGCACGTAGAATCCCGTGTGAATCAGCAAGGACCACCTTGCAAGGCTAAATACTCCTGGGTGACCGATAGCGAAGTAGTACCGTGAGGGACGGGTGAAAAGAACCCCCATCGGGGAGTGAAATAGAACATGAAATCGTAAGCTCCCAAGCAGTGGGAGGAGCCAGGGCTCTGACCGCGTGCCTATTGAAGAATGAGCTGGCGACTCATAGGCAGTGGCTTAGTTAAGGGAACCCACCGGAGCCGTAGTGAAAGCGAGTCTTCATAGGGCAATTGTCACTGCTTATGGACCCAAACCTGGGTGATCTATCCATGACCAGGATGAAGCTTGGGTGAAACTAAGTAGAGGTCCGAACCGACTGATGTTGAAGAATCAGCGAATGAGTTGTGGTTAGGGGTGAAATGCCACTCGAACCCAGAGCTAGGTGGTTCTCCCCGAAATGCGTTGAGGCACAGCAGTTGACTGGACATCTAGGGGTAAAGCACTGTTTCGGTGTGGGCCACGAGAGCGGTACCAAATCGAGGCAAACTCTGAATACTAGGTATGGCCTTAAAATTAAAAAAGAGGGGTCAAAGTCGGCTAGTGAGACAATGGGGGATAAGCTTCATCATCGAGAAGAAAACAGCCCGGATCACCAGCTAAGGCCCCTAAATGGCCGCTCAGTGATAAAGGAGGTAGGGGTGCGGAGACAGCCAGGAGGTTTGCCTAGAAGCATCCACCCTTGAAAGAGTGCGTAATAGCTCACTGAT
CGAGCGCTCGTGCGCCGAAGATGAACGGGGCTAAGCGATCTGTCGAAGCTGTAGGGTGTAAAAATACATCGGTAGGGGAGCATTTCGCCTTAGAGGGAAGCCTCCGCATGAGCGGTGGTGGACAAAGCAGAAGCGAGAATGTCGGCTTGAGTAACGCAAACATTGGTGAGAATCCAGTGCCATGAAAACCTAAGGGTTCCTCCATAAGGTTCGTCCACGGAGGGTGAGTCAGGGCCTAAGATCAGGCCGAAAGGCGTAGTCGATGGACAACAGGTGAATAGTCCTGTACTACCCCTTGTTGGTCCCGAGGGACGGAGGAGGCTAGGTTAGCCAAAAGATGGTTATCGGTTCAAGAACGTAAGGTGTCCCTGCCCTTTTTTCAGGGTAAGAAGGGGAAGAGAAAATGCCTCGAGCCAATGTTCGAATACCAGGTGCTATGGCGCTGAAGTAACCCATGCCATACTCCCAGGAAAAGCTCGAACGGCTTTGAGCAAGAGGGTACCTGTACCCAAAACTGATACAGGTGGGTAGGTAGAGAATACCTAGGGGCGCGAGACAACTCTCTCTAAGGAACTCGGCAAAATAGCCCCGTAACTTCGGGAGAAGGGGTGCCTCTTCACATTACAAAGGGGGTCGCAGTGACCAGGCCCGGGCGACTGTTTACGAAAAACACATGTCTCTGCAAAGTCGTAAGACCATGTATAGGGTCTGACGCCTGCCCAGTGCCGGAAGGTCAAGGAAGTTGGTGACCTGATAACAGGGAAGCCGGCGACCGAAGCCCCGGTGAATGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCAGGTAAGTTTCGACCCGCACGAAAGGCGTAACAATCTGGGCACTGTCTCGGAGAAAGGCTCGGTAAAATAG\n>URS0000D6A535_12908/1-73 unclassified sequences RAGATH-1 hammerhead ribozyme \nAAGACAGUCUAGGAGUCUAUAAAAUUGUUACUGAAGAGACUAGAACGAAACUUCUUUAAUUAGAAGUCUAACA\n>AYMY01S001259.1/103935-104737 Nicotiana tabacum cultivar TN90 Ntab-TN90_scaffold1259, whole genome shotgun sequence 
\nATTTCAAAATTTTGTAGCTTGTTTCGGGCAATAAAATGACTGGTACCATCCTAGTCAAATTAGAAAAACTTTTTGATGAAGGTGCCATTATAAGGCGGACCGGGCCCAAGTCCCCTGGAAGGGGGCGCCAGAGAGGGTGAGAGCCCCGTTGTGCCCGGACCCTGTCGCACCACGAGGCGCTGTCTACGAGTCGGGTTGTTTGGGAATGCAGCCCAAATCGGGCGGTGAATTCCGTCCAAGGCTAAATACGGGCGAGAGACCGATAGCGAACAAGTACCGCGAGGGAAAGATGAAAAGGACTTTGAAAAGAGAGTCAAAGAGTGCTTGAAATTGTCGGGAGGGAAGCGGATGGGGGCCGGCGATGCGCCCCGGTCGGATGTGGAACGGTGNTACCGCGAAGGAAAGATGAAAAGGACTTTGAAAAGAGAGTCAAAGAGTGCTTGAAATTGTCGGGAGGGAAGCGGATGGGGGCCGGCGATGCGCCCCGATCGGATGTGGAACGGTGTTGAACCGGTCCGCCGATCGACTCGGGGCATGGACCAGCGTGGATTGGGTAGACTTTTGATTTGGGTGAAGTTACTTGTTGATTGATAGAGCTTAGCTTCTTAATTAGCTTATTCCTAAGACATTTCCTTTTCGGACTTCTTAAATTCTAACTATGTTTAGTTGAATGTTCTAAAGCATACATAGAACAATTTGTTGCTAAGTAGAATAATCCCCTGCTTCACACTTTACCCACAATTCAGTTTGCATTCCATAGTAAAAGTACTATTTTGGGGTTCAAGAAAAAATTTGAAACCTTT\n>CM000024.3/41982868-41983007 Canis lupus familiaris chromosome 24, whole genome shotgun sequence. \nATCGCTTCTCGGCCTTTTGGCTAAGATCAAGTGTAAATAAAAAAATACATTATTTTAAAAATCTGATATGAAATGATATTTATTGGGGCTTCTGGGCAAATCAATCACCCTTGTGCTAGAGTGTTAGGATATGTAGAGTG\n>CM000400.2/42839630-42839710 Equus caballus chromosome 24, whole genome shotgun sequence. \nTGGACCTCTCATGAACCCACCATGACGCCTGGTGGCAGATGTCATAGGTGATGAACATGTGTCTGGAACCCTGAGGTCCAA\n>MNVL01000027.1/1734-2078 Candidatus Hydrogenedentes bacterium CG1_02_42_14 cg1_0.2_scaffold_12826_c, whole genome shotgun sequence. \nGGGGGCGCAAGGTTTTGACGGCGACGGAATTGTCGAGGTGGCGCGCTGGGGCATGCTTAGTTGCCTCGTAAAAAATACTGAGCAACTTTTAACTGCCAACACTGAATTGGCTCTAGCCGCGTAAGCGGCAGACTGCATAGGCGACGCCCGCTGACTCTTGCAGTCCTCATAGCGGGCTGGCTTTCGGTTATGTACCGGGGATCGGGAGCGAGGAGAACACTCGGACTAGCGGAAAGGGAAGCCTGTCCATGGGCCATCTTTTTGCGAAATTAATACACGGACTACGCGCGTAGAAACCCGATGAAACAGTTGTTCGGACGTGGGTTCGATTCCCACCGCCTCCAA\n>JRRC01272952.1/16470-12774 Gossypium arboreum cultivar AKA8401 contig_2968_9, whole genome shotgun sequence. 
\nTCACTTACTTAAATACTTACTTACTTAATCAAATTTATTAATAAATTTTACTTACCTTTTTTTTTATCAAGCATACATGAACATTATATACTTACCTTTGCTCTTCTAGCATGAACTTGTCTTACCTTTTTAGTATAACTCGTCTTACCTTACCTTACCTTGATATTCTCTTTAAATTATTTCCCGTTGAACCACTTGGAATACTAAGGATACATGGGTACCTTACCATTGCCATGACTTGTCATGGTCTTACGTGGTGTCCTTTTGAAACTTACCATTGCCATGCCTTGGTATGGTCTTACATGGGACTTTTGCCTTATAGTAACTTATTAATGCCTTGTCTTGACATGGTCTTACATGGTATCCTTACCTTAGAAACCTTACCAATTGAGATGCCTTGGCATGGTCTTACATGGTATCCTTAAACCCTAATGTCATGACATTTGTATCCTACACATTCCTAAGGTTCAACCAGGACTTTCTGAAATTACTTCTCCGTCAATTCATGCTTAAGTCTTCTTCGAATAATTTCATAAAATAAATATACACATGCTGGAAATTAGCAAAATTAACATAAAATAATAGAATATTGCATTTATTTACCGCAAACTTACCTCGAAACAAAATACGATCAATTATATCGATTTAGTCCACTATCTTTTTCTTTCCCCGATCTAACTCCGAATTTTTTTCTTCTTGATCTATAATAACAAATTTAGCTTATTTAATACTCACATTTATTAAAACAGTCATTGACTCAAACTTTGGCAAAATTACACTTTTACCCTAAACTTTTACATATTTATACTTTTTTCCTAAGGCTCGGAAATTAAACTTCATCCTATTTTCTTATGTTTTATGACATTCTAATCATTTTTCCCTTCTATGGAAACATAAAATTCTCACTCTAACATGTAGTTATGAACATTAGGTATTTTTACCGATTATGTCGTTTTACTCGTTTTCACATAAAATCGCTTAGCAAAAGTTGTTTAACATAATTTCGAGCTTCATATTCTACCATAAAATATCAAAATAAACACATTTCACCTATGGGTAGTTTTCCAAATATAAACCCTAGGTTAAATTATTGCTAGAATAAGCTTAATCAAGTTATCGGGACCCTAAAAACGTAAAGAACATTAAAAACGGGGCTTAGAATCACTTACTATAGAGCTTGGAATCTTGAAACAAATCCTAGCTACGGGGAACCCTTGAAGATGAGCACATTTTTGCCATTTTTTCCCTTTTTAATTCTTTTATTTGACACTTTACTAAAATGCCCTTTATTAAAATTTTTTAGTTATTTTTACCTATGTATATCCATTTTTGTCCATGAAAATATAATGGTCTAATTCCATTTAAGGACCTCTACTTCAATTATGCAATGACCAGGATGAAGCTTGGGTGAAACTAAGTGGAGGTCCGAACCGACTGATGTTGAAGAATCAGCGGATGAGTTGTGGTTAGGGGTGAAATGCCACTCGAACCCAGAGCTAGCTGGTTCTCCCCGAAATGCGTTGAGGCGCAGCAGTTGACTGGACATCTAGGGGTAAAGCACTGTTTCGGTGCGGGCCGCGAGAGCGGTACCAAATCGAGGCAAACTCTGAATACTAGATATGACCTCAAAATAACAGGGGTCGAGGTCGGCCAGTGAGACGATGGGGGATAAGCTTCATCGTCGAGAGGGAAACAGCCCGGATCACCAGCTAAGGCCCCTAAATGACCGCTCAGTGATAAAGGAGGTAGGGGTGCAGAGACAGCCAGGAGGTTTGCCTAGAAGCAGCCACCCTTGAAAGAGTGCGTAATAGCTCACTGATCGAGCGCTCTTGCGCCGAAGATGAACGGGGCTAAGCGATCTGCCGAGGCTGTGGGATGTAAAAATGCATCGGTAGGGGAGCGTTCCGCCTTAGGGGGAAGCACCCGCGTGAGCGGGAGTAGACGAAGCGGAAGCGAGAATGTCGGCTTGAGTAACGCAAACATTGGTGAGAATCCAAT
GCCCCGAAAACCCAAGGGTTCCTCCGCAAGGTTCGTCCACGGAGGGTGAGTCAGGGCCTAAGATCAGGCCGAAAGGCGTAGTCGATGGACAACAGGTGAATATTCCTGTACTACCCCTTGTTGGTCCCGAGGGACGGAGGAGGCTAGGTTAGCCGAAAGATGGTTATCGGTTCAAGGACGCAAGGTGCCCCTGCTTTTTCAGGGTAAGAAGGGGTAGAGAAAATGCCCCGAGCCAATGTTCGAGTACCAGGCGCTACGGCGCTGAAGTAACCCATGCTATACTCCCAGGAAAAGCTCGAACGACCTTCAACAAAAGGGTACCTGTACCCGAAACCGACACAGGTGGGTAGGTAGAGAATACCTAGGGGCGCGAGACAACTCTCTCTAAGGAACTCGGCAAAATAGCCCCGTAACTTCGGGAGAAGGGGTGCCTCCTCACAAAGGGGGTCGCAGTGACCAGGCCCGGGCGACTGTTTACCAAAAACACAGGTCTCCGCAAAGTCGTAAGACCATGTATGGGGGCTGACGCCTGCCCAGTGCCGGAAGGTCAAGGAAGTTGGTGACCTGATGACAGGGGAGCCGGCGACCGAAGCCCCGGTGAACGGCGGCCGTAACTATAAGGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCCGCACGAAAGGCGTAACGATCTGGGCACTGTCTCGGAGAGAGGCTCGGTGAAATAGACATGTCTGTGAAGATGCGGACTACCCGCACCTGGACAGAAAGACCCTATGAAGCTTCACTGTTCCCTGGGATTGGCTTTGGGCTTTTCCTGCGCAGCTTAGGTGGAAGGCGAAGAAGGCCTCCTTCCGGGGGGGCCCGAGCCATCAGTGAGATACCACTCTGGAAGAGCTAGAATTCTAACCTTGTGTCAGGACCTACGGGCCAAGGGACAGTCTCAGGTAGACAGTTTCTATGGGGCGTAGGCCTCCCAAAAGGTAACGGAGGCGTGCAAAGGTTTCCTCGGGCCGGACGGAGATTGGCCCTCGAGTGCAAAGGCAGAAGGGAGCTTGACTGCAAGACCCACCCGTCGAGCAGGGACGAAAGTCGGCCTTAGTGATCCGACGGTGCCGAGTGGAAGGGCCGTCGCTCAACGGATAAAAGTTACTCTAGGGATAACAGGCTGATCTTCCCCAAGAGCTCACATCGACGGGAAGGTTTGGCACCTCGATGTCGGCTCTTCGCCACCTGGGGCTGTAGTATGTTCCAAGGGTTGGGCTGTTCGCCCATTAAAGCGGTACGTGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCCATATCCGGTGTGGGCGTTAGAGCATTGAGAGGACCTTTCCCTAGTACGAGAGGACCGGGAAGGACGCACCTCTGGTGTACCAGTTATCGTGCCCACGGTAAACGCTGGGTAGCCAAGTGCGGAGCGGATAACTGCTGAAAGCATCTAAGTAGTAAGCCCACCCCAAGATGAGTGCTCTCCTATTCCGACTTCCCCAGAGCCTCCGGTAGCACAGCCGAGACGGCAAGGGGTTCTCTGTCCCTGCGGGGATCGAGTGACAGAAGTTTTGAGAATTCAAGAGAAGGTCACGGCGAGACGAGCCGTTTATCATTACGATAGGTGTCAAGTGGAAGTGCAGTGATGTATGCAGCTGAGGCATCCTAACAGACCGGTAGACTTGAACCT\n>JPUW01000003.1/58274-58063 Lysinibacillus sp. BF-4 contig00003, whole genome shotgun sequence. 
\nAACGATGCAATGATAAGGAAGAGTAAAAAGTACGCGTAGGCAAGAGAGGGAACGGTAGCTGAGAAGTTTCTACTAAAGCGCTTTTGAAGGTAGCCTTGGAGCAACATTTGTGAACAACAGTAGCAAATGTCGGCAGCTAAGCCGTTATGTATTGAGTGCTAAGCTTCGGCTTGGAATAAAGGTGGTACCGCGAAAGCTCCTTCGTCCTTTTT\n>ABWE02002692.1/6421-6661 Hyaloperonospora arabidopsidis Emoy2 Contig279.1, whole genome shotgun sequence. \nTTTAAAAAATGAAAGAATCTAACTCTAGTACGAGAGGACCGAGAAGGGTAAATCTCTGGTGTATCGGTTGTTGAAAAGCATCGCCGAGTAGCTAAATTTATTTTGGATAATTACTGAAAGCATCTAAGTAAGAAACCATTCTTAAATTTTTTTTATATAAAAACTGTAAAAGATCATTACATTGATAGGTTTAAAGTGTACGTATTGTAAAATATTTAGCTTAAAAATACTAAAAGTTTAA\n>CM000842.2/19036600-19036948 Glycine max cultivar Williams 82 chromosome 9, whole genome shotgun sequence. \nGCTTGTGGTTTAATTTTACTTAACATGAGAAAACTTACCAGATCTAAACATAGTATGATTGACAGAATAAGAACTCTTTCTTGATTTTATGGGTGTTGTTACATGACCATTTTTAGTTGGTGGAGTGACTTGTCTAATTAATTTTGTTAACAATGAGAACTCAGTTTGCTTAAAAATGTTTTTGTTGAATAATTGTTCTTAAAAATGTTATGATTCAAGACAAATTCAGATTTAATTTAGAAGTAAATAGTAACTAAATGTTAAACCAGAAAACAAAAGGAATGCATTCAGCAAAATAAAAATTAATGCAAACAGAATGGGCCTCAAATTTTTTAGGTTACATGAGGAC\n>MNRE01000021.1/40-1 Clostridiales bacterium 41_21_two_genomes Ley3_66761_scaffold_14658, whole genome shotgun sequence. \nGGATCACTCCATTTGGGGTTAAGGCCATACGGACAGCCGG\n>KI927239.1/392135-395996 Plasmodium falciparum Palo Alto/Uganda unplaced genomic scaffold supercont1.2, whole genome shotgun sequence. 
\nGAGGATAAAAATAGGAGGGCAAATCCGCTGAACTTAAGCATATAATTAAGCGGAAGAAAAGAAAATAACTATGATTCCTTTAGTAACGGCGAGTGAAGAAGGAATAGCTCAATAAGTAGAATCCTTCGAATCTTAATGATATATTTATACATAGAATAAAGAATTGAAGGAATTGTCAAGTTGAATTGTACTCTTGTAGGCCTCACAGGTGAAATGAATATATAGAAGTAAAGTAGGAATACTTCCTCATAGAGGGTGAAAGGCCCGTATCATATATCATTTCGTGGGCTTTGGAGTATTTATATTTTACTGAGTAGTGTTCTTTGAGATTGGAGCACAAATTGGTGTGATACATTTCACATAAAGCTAAATATGTGTAGGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGATGAAATAGTACTCAGGAATGAGCAATTAAATAGTACCTGAAATCGTTAAGATGGAACGGATTAAGAGAGAAAACAAGTAAAGAGGAGAATTTTTTACATTTTTATTTTTGTTTTATAATTCTCTTCTTTATTAAAAGAAACATCAGTGATTAATTTAATTTCAATAAAGCAATCCCCTGAAATTCAAAATTTCTTTTAATTTTGTTTTCACTTTCTCCCCGCACTAATGTGGGGAAAACTGGCTTTATTTCTTCAATTATTTTTTTTGCTGAGGAATTTTAAAATTATTTGAATTTTTCTTCTTATAATTTAAGTTGTTTCTATATAGTACTTTCTTAACCCACTCGTCTTGAAACACGGACCAAGGAGTCTAGCAAATGTGCAAGTGTATATGATTCTTTAAACATTTCTCTTTTTAATATACGCATAATTAATGTAATATGTTTCTTTATTGTAGATTTGTGGTGTTTAATTTTTATTAAATCCCCACTTTGCATACAATACCGGTAAGCAATTATGCTTTATTGAGTACGAGCATATTTGGTAGGACCCGAGAGGCTTTGAACTAAGCGTGATGAGATTGAAGTCAGNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTATTCGCTCATGAGATCCCATAAAAGGTGTTGGTTCATAATGACAGTAGGACGATGGTCATGGAAGTCGAAATTCGCTTAGGAGTGTGTAACAACTCACCTACCGAATGAACTAGCCCTGAAAATGGATGGCGCTAAAGCGAATTACCGATACCGGGCCATAAGAAGGTAGAAATTATAAATGTTAATTTAGCTCAGATCTTTTTATGAGTAGAAAATCGTGGGGTTTGTGTTGAAGCGAAATACGTGAGTTTTCGTGGAACATCTCCCTAGTGCAGATCTTGGTGGAAGTAGCAACTATTCAAATGAGAACTTTGAAGACTGAAGTGGAGAAGGGTTTCTTGTCAACTGTGATTGAACAAGAGTTAGCCGCTCCTAAGGGATAGCTGAAAAGTGTTTAAAAGAAGTAAGATATTATATGGAAATATATAATTAGATCTTCGTCTCAAAAGGGAAACAGGTTAATATTCCTGTGCCATAAGTAATAAGAGTGCAAACAGAGATGGTAACATACATATAAATGAACTCCTTAACATAGATTTTACTCATGGGGTGCGTTATCTTTGCACTTTAATTTTATAACAAACCTTGGAATCAATTTATTTGGAGAAGAGGTTCGTTGAACTCAATTCAAAAAAAAAAAAAAAAAAAAAAATTAATTATAGAAGGAAAGGATTTTCGGATCCTTTGTACTTTTTTTTTTTTTTTTTTTTTTTTTTTATGTTTTGTAGCAATAGTAATTCATTTCTTTTGAATTATCCATAGTGGTAAAAACTATCCATGAAACAAGGAGGGAACAGCAGCAATTATATAATTTTTGGGGTTCTTTGAATTCCTTATTATTTTTGCAATATTCTTAATACTTGTACGAGCGTACCAATAACCGCATCAGGT
CTCCAAGGTTAGTAGCCTCTGGTTAAATAGAAAAAAGTAAGTAAGGGAAGTCGGCAAAATAGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGACATTAGAAAAGAGAAGAAAAAAAGAGGGTTGAGAATAAAATTGCAGATTTATTTGCTTTTCTCTCTGATTTGCTTGTAAATTTTCTTTTTCTTTTTCTTCTTTTCTTTTTTTTTCTGTCCCTCTTTTCGTCTTCATTTTATTGTAATTTTTGTTACTTTAATTTGATACATATATAATGTTAACTCAGAACTGAAACGGACAAGGGGAATCCGACTGTTTAATTAAAACATAGCATTGTGAAAAACCATAACTGGTATTAACACAATGTGATTTCTGCCCAGTGCTTTGAATGTCAAATTGATGAAATTTAATTAAGCGCAGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTACTTGCTATCTAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAAAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTTACTCTAGTCTGACTTTGTAAAACGACTTAAAAGGTGTAGATATAAGTGGGAGTAGGAAAATGAAATACGTTTTTTACAATAGTGAAATACCACTACTTTTAAAGTTGTTTTACTAATCCATTGATAGGGATATATAAAACTTATAAATAATTTTTATTTTAAGTTACTTTTGAATTTAAGATATGTGTGCATTTATATCTATTAAATCCCATTTTGTATATATATATATATATTATATATATGTGTATAATACGATTTTTTTTATGGAGACATAGTTAGGTGGGGAGTTTGACTGGGGCGGTACATCTGTTAAAAAATAACGCAGATGTCCAAAGACAAGCTCAAAGAGAACAGAAATCTCTTGTAGACTAAAAGGGGAAAAGCTTGTTTGATTTTTACTTTCAGAATGAGTAGAAAACGTGAAAGCGTGGCCTATCGATCCTTTATATTTGCAAAATGACGTAATAAATTACTTACTACTGTGCATATAGAGGTGTCTGAAAAGTTACCACAGGGATAACTGGCTTGTGGCTGCCAAGCGCTCTTAGCGACGTAGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGGGACGCAGAAGTCTCAAAGTGTCGGATTGTTCACCCGCTAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGAATAATATTATTATATTTTTTATATACAATATATAGTATTGTGACAGTAATCCAACTTGGTACGAGAGGATTAGTTGGTTCAGACAATTGGTACAGCAATTGGTTGATAAACCAGTGTTGCGAAGCTAAGTCTGTTGGATAATGGCTGAACGCCTCTTAAGCCAGAACCCATGCTGATTAGACAATTCTAAATTTGATCTTTTTGTTAAACGATAAAAATTATATATATATTTTTTTTATCTTTACTGCATAATGTAAAAGAGAAATTATACATATATATATATATATATATTAGAAAAGAAAAAATGATGTAATTAATTATTATTATTATTTTTTTTTTTTTTAGTATTAATATATAATTATGAATATATAAATAATCCTATATCTTTATATAAAAATTAAATTTTTAATTTTATTAGAATTTTTTTTTTTTATATATATAGATTGTAATTTAACAACAAAAAGTATTAAGCCCAAATCGTAGACGACTTTTCTGTCTCAGAGTACTGTAAACATGAGAGTAAACTTTGTTTTACGATCTGTTGAGGTTTATCTCTTGTGACATTGAGCTAA\n>KI925462.1/351230-352057 Heterobasidion irregulare TC 32-1 unplaced genomic scaffold scaffold_09, whole genome shotgun sequence. 
\nACAGATCCAAGGCCACAATGCTCGTCCCGCACAGGACGTCTGAACGACAGTTCTGGCTTCCATCTTTGCGAGCGGGCTAAGGTCTGAGTGTATAGCTCCCTCGATCGACTCTCGCAGGGTCCGAGTCTAACGGCTCGAGCAACATACAAGAAATCCGTCTGCTTCACCTTGTCCGAAGACACGCTATCTGTTTCTCTAGATTCGGCGGCGTCGAGGGTGGTGAATGTAGGCTTGAGATATGTTGCGGAGTTTGGGCAGTACGTTTTGTCTCATCTATCCTCCGAGTCGTGGGTCGGAGTGCCCTCGATGCCCTATCGCACCTTTCGTCTGTGTCAGACGATCAGACATCAGGCAGTGTCTGAAGTGTTGTCAACTCGCTTCATTGCGACACAGACAGGAGTATATGACTCTGGGAGCACACCACTCCGATCAGAGCCTCCGGGAGAACACCACTCCAGTCTGATTAGGGAACACCCTTCTCCAAGTCGAACCTCTTTCCTGGACGAATGTTAGCCCTTCAGTCATGATCCGTGGCGAGAAGCGGGGGTCATAACTCACACCTGCCGCCTTTACCCAACGAGATCAGAAGACATAACCTGTCGCTGTTGTGGCTAATACAGGAAAGAGTGTCTGCCAAACCCTGGTGGGACGTGGACCTTGTCCAGTTGCGTTTCGATGGTCATGAGTTGATGACACTGGTGTATGAGGGGTTGGGAGTTTGTGAGGTGCACATCGGTACTGTCCTTCAGTGCAATTTGTGGCTCGCGCCTTTCGTTCTCCTTCTGGAAACGAAGGCGTGAAACTCGATTCAGACTACTCTGGGTCTGT\n>ALWZ046142499.1/4049-4180 Picea glauca, whole genome shotgun sequence. \nGGTTCCTTGGTCTAGTGTTCAGGACATTGGACTCTAAATCCATTTTTGAATGTTGTGTACAAATCCATGGTCTAGTGTACATGACATTGGAATCTGAATCCAATAGCTTGAGTTGTAATCTCGATGGGACCT\n>LATL02000069.1/39931-40100 Limnoraphis robusta CS-951 contig069, whole genome shotgun sequence. \nGTCAAGAACTCGCCGCTAAACCCTATGCGCTTTTCGCGCAGCAGGCTTCGCCAACGGGTTAAGCGCGGGAGCTTGTAAAAAGGCTCTAACTTGACCAGACTCAGCCCTTTTTGGGGCTACGTTATTTGGCTCACGAAACCCATGAATGCGTGCCAGTTTGCGGCTCTTTC\n>CM003279.1/134475214-134476476 Salmo salar isolate Sally breed double haploid chromosome ssa01, whole genome shotgun sequence. 
\nAACTCTTATGATTCAGAGTGGTTGGGTTAAATGTGGAAGACACATTTCAGTTGAAGGCATTGTTGTACAACTGACTTGGTATCCCCCTTTCCCTTGTAAGGAGAGACGATGATCCCTCTCATTTGCAAAGAGTTGGGATATGATAATATTCATAAATGGGGAATCAGGGTTCGATTCCAGAGAGGAAGCCTGAGATGCACCTACCACATCCAAGGAGGGCAGCTGGCACGCAAATTACCCACTGCTGACTCAAGGAGGTAGTGATGAGAAATAACAATACAGGACTCTTTAGACGCCCCGTAATTGAAATAGGTACTCTTGAAATCCTTTAATGAGGATCCATTGGTGGGCCAATCTGATGCCAGCAGCTGCGGTAATTCAACCTCCAATAGTGCATCTTAAAGTTGCTGCAGTTAAAAAGCCAGTAGTTGGATCTCGGGTATAAGCTGACGGTCTGCCGCAAGTTGAGCTACGGCCTTTCTCAGCCCCGGTACGCTTAACTGACTGTCCCTTGGGGTCTTAAAAAGTGTTCAAAGCAGTCTGTCGCCTGAATACCGCAGCTAGGAATAATGGAGAAAGACTCTGGTTCTATTTTGTTATTGTTTTCTTCTGAACTGGGCCAATGGTTAAGAGGGACTGCCGGGGGCATACATATTGTGCCGCCTGAGGTGAAATTCTTGGACTGGCGCAAGAATGTTTTCATTAATCAAGAATGAAAGTCGGAGGTTTAAAGACTTTCAGATACCGCTGTAGTTACGACCATAAGCGATGACAACTAGCGATCCGGCGGCTTTATTCCCATGACCCGCCGGGCAGCGTCCGGGAAACCAGATTCTGGGTTCCAGGGGGGAGTATTGTTGCAATGCTGAAACTTACAGGAATTGACGGAAGAGCACCAGCAGGAGTGGAGCCTCCGGCTTAATTTGACTCAGGAAACCTCGCCCGTACATGAAAAGATTTGACAGCTCTTTCTCGATTCTGTGGGTGGTGGTGCATGACCGTTCTTAGTTGGTGGAGTGATTTGTTTTGTTAATTCCAATTACGGACATGACAACTAATAAACTTTAAACTAGTTATGCGGCCAGAGCGGTCGGCGTCCAACTTCTTTGGGGGACAAGTAGTGTTCAGCCACACGAGATTGAGCAATAACAGGTCTGTGATGCCTGGGGCTGCACGCGCGCCACACTGAGCCGGTTGGCGTGTCTACCCTTCGCCGAGAGGCGTGGATTGGTTTCCGTAGGTGAACCTGTGGAAGGATCATTA\n>HE978326.1/163659-163887 Kazachstania naganishii CBS 8797 chromosome 13, complete genome \nATCCCCCGTGCCTCGCTCGGCCAGCTGCGTGTCTTCAGGGACACTTTGATCTGCTGGTCTTGAGCTGGACGTGTTTCCCCTCGCGGGAAGCTGGTGGGGGGATACTGAACTTCAGTGACGACTTTTTGAGTACAAGGGCGCCCGGGATACTTCGTATCCCGCACAATGGTGTCTTCAAGATTTAATACTTCATTTTAAATTGTATTGTAATTAGTACGTTCATACATGT\n>LCMH01000002.1/67321-67516 Microgenomates (Amesbacteria) bacterium GW2011_GWC1_46_24 UX46_C0002, whole genome shotgun sequence. \nACGGAAGGCTAGTAGTATGGGCCCCGCCGGTAGTAATACCGGTGCGCAAACTTGGCTATATCGGTGGACATCCTGAGCTTGTCGAAGGACAATACCGAGGCAACCTCGAAAGAGAGAGTCCGTAGAGACTACACGCCAAGCACCCCGACGTTATGTCGGGGTGATGATATAGTCCGACTCCCCGAGTAATCGGGGT\n>GL636099.1/5798-5944 Serratia symbiotica str. 
Tucson genomic scaffold scaffold00192, whole genome shotgun sequence. \nTAACAAAAAAATACCGAATACGATTCCTATATTCGGTCTAGGGAAATGGCTCCTAGGAGAGCCATGCGCTAAAAGTTAGCGTTTAGTGCATAATTTATCCAGTCATACTGCACTAAGCGTAGCCTATCACACTATTTTTGCCAGCTA\n>JH711579.1/1959477-1959901 Coniophora puteana RWD-64-598 SS2 unplaced genomic scaffold CONPUscaffold_7, whole genome shotgun sequence. \nACGTCGTCTGAAGAATCGCCATCGCAGCACACGCACAAGAAACGTCCTCATACGATGCTTTCTACCCTACGCTGTGGGAAAAGTCCCCGGAGACACAGAGTCCCCCTCGTGGGGCCGGCCCCCGTTCGCTAACGGAAAGCCCTGGCTGCAACCACGCCGAGGAAGGGCGGGGGATCGGTCGGGCGAGTTCACCCTGCTTGCTTCTCTATTCCTCTCGGATGGGAATGCAAGCTCGGCTCGCCCAGCTCTGTTGCGCTGCCCGACGTCCCGCGGTCTATCGCGAAGACACGAGCCTTGGCCGCGCTTTTGTGGGCGGAGGGCGCGCACGTCGTTGCTCATAGACATAGTTATGCGATTGTCGGCTTTCGCGGTTCATTCTTGTGGATCGCGGCCGTCATCTCAATGGGGCTTACTCTCATTCGACG\n>ABLE03011845.1/1131-1 Caenorhabditis japonica strain DF5081 Contig9535.1, whole genome shotgun sequence. \nTACCTGATTGATTCTGTCAGCGCGATATGCTCAAGTAAAAGATTAAGCCATGCATGCTTTGATTCATAAATGAAATTGCGTACGGCTCATTAGAGCAGATATCACCTTTCTCGGAATCCTGAAAAGGATAACTGCGGAAATTCTGGAGCTAATACATGCGACTATACTCCAACGCAAGGCGGGGTGCAATTATTAGAACAGACCAAACGTTTTCGGACGTTGTTTGTTGACTCTGAATACCGTCGTTTACTGTCAGTTTCGACTGACTCTATCCGAGAAGGGTGTCTGCCCTTTCAACTAGATGGTAATCTATTGGACTACCATGGTTGTTACGGGTAACGGAGAATTAGGGTTCGACTCCGGAGAGGGAGCCTTAGAAACGGCTACCACGTCCAAGGAAGGCAGCAGGCGCGAAACTTATCCACTGTTGAGTATGAGATAGTGACTAAAAATATAAAGACTCATCCTTTTGGATGAGTTATTTCAATGAGTTAAATATAAATTATTCTTCGAGTAGCAAGGAGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCTCCTAGTGTATCTCGTTATTGCTGCGGTTAAAAAGCTCGTAGTTGGATCTAGGTTACGTGCCGCAGTTCGCAATTTGCGTTAACTGTGGTCGTGACTTCTAATTTGCTGGTTTGAGGTTGGGTTCGCCCTTCAACTGCCAGCAGGTTTACCTTGAATAAATCAGAGTGCTCAATACAGGCGCTTGCTTGAATAGCTCATCATGGAATAATGAAACAGGACTTCGGTTCTTTTTGTTGGTTCTAGAATTGATCTAATGGTTAAGAGGGACAAACCGGGGGCATTCGTATCATTACGCGAGAGGTGAAATTCGTGGACCGTAGTGAGACGCCCAATAGCGAAAGCATTTGCCAAGAATGTCTTCATTAATCAAGAACGAAAGTCAGAGGTTCGAAGGCGATTAGATACCGCCCTAGTTCTGACCGTAAACGATGCCATCTCGCGATTCGGAGGGTTCATGCCCTACCGAGGAGCTACCCGGAAACGAAAGTCTTTCGGTTCCGGGGGTAGTATGGTTGCAAAGCTGAAACTTAAAGAAATTGAC
GGAAGGGCACCACAAGGCGTGGAGC\n>MELN01000046.1/18551-19023 Actinobacteria bacterium RBG_16_64_13 RBG_16_scaffold_3124, whole genome shotgun sequence. \nGCAGCTCGGGTAGCCGCAGGGGCTCACCAACCGTGAGTTCTTGAGGAAAGTCCGGACACCATAGAGCAGGGTGCTGGATAACGTCCAGCGGGGGAAACCCCAGGGAAAGCGCCACAGAAATTACACAGCACGCCGGCGCAGCCGGTTGCAAAGGTGAAATGGTGCGGCAAGAGCGCACCGGCGTCGTGGTGACACGGCGGCCAGGCAAGCCCCACCCGGTGCAAGGCCGAATAGAGAGGCGTCTGAGGGCTGCTCGCCCGAAGCCTCCGGGTTGGCCGCATGAGCCGTCCGGCAACGGCCGGCCATAGATAGATGGCTACCCAAGAGGCTGCTGGGGAATGAGGCTCGCCGCCAGGGTGCGATTGGCATGCGCGAGAGAAGGACGCACTATCGGGCCGCCTAGTGCGGTCCGGCGGCCGGGGCCTTATTTCCCAGCAGCCTCAGGACAGAATCCGGCTTACAGGGCTGCTACC\n>CP009284.1/1108194-1108485 Paenibacillus sp. FSL R7-0331, complete genome. \nTCACACGCAATGAACGGGAGCAGTAGATGATGAAGGTGTGCAGAGAGCTGCGGGCTGGTGCAACGCAGTCACCTGATAGGCATTGAATCTCGCCCGGGAGCGGAGCGGCGGAAACAGGAAGTACGCCGCAACGGAAGTCCCCGTTACCGGACATCTGTATTTGCCGGACTATACCCGTATGGGGATGAGCCGGATACGGGGTGAGCTGGGCGCAGCTTGCGGTTTATCAGGAAGGTAAGCCGGATGCGTCAACAAGAGTGGTACCGCGGTGGGGTGACCCGCCGTCTCTTAT\n>KE695927.1/3217556-3217637 Alligator sinensis unplaced genomic scaffold scaffold391_1, whole genome shotgun sequence \nGCATGGAGCTGGCTGCTCCAGGGAGCAGGTGGGAGCTGGATTCCCAGCCTCTGTCTGCTCCCTGGAGCAGCCAGCTCTGACT\n>KQ414443.1/2085-2243 Termitomyces sp. J132 unplaced genomic scaffold C252961, whole genome shotgun sequence. \nACACTGATGGTGAAGTGGTTATCATGCTTGCCTTCCATTGCATAGAAGCTATTGCATCTGTCTGAAGCAAGCGGCAGGGGTTCTGCTTGCCTTCCATTGCATAGAAGATATTGCATCTGTCTGAAGCAAGCGGCAGGGGTTCGATTCCCCTTCAGTGTA\n>FJ872372.1/9644-12466 Uncultured Verrucomicrobia bacterium clone 106 genomic sequence. 
\nATTCAAGCAAACAGATGGCACATGATGGATGCCTTGGCGTTGATAGGCGATAACGGACGCGACAAGCTGCGATAAGCCATGGATAGCGGCAAATACGCTTTAACACATGGATCTCCTATGGGGTAACCCGAGGGCTCAGCCCTCATCCTGCCTTTTACAGGCAGTGAAGCGACACTCGGTGAAGTGAAACATCTCAGTAACCGAAGGAAAAGAAAGCGAAAGCGATCCTGTGTGTAGCGGCGAGCGAAAGCAGGACAGCCCAAACCGGCGTTAAACCCGGGGTTGTAGGACCAGGCATAAGCGATGTGATCAGGTTGGTTCAAAAGGCTGGAAAGCCTTCCGATACCGGGTGAAAGGCCCTTAAACCGACTCGGCCCACATTGCGCCTGGCTCCTGAGTAACGCGACATAAGTGAAACTTCGCGTGAATCAGCGCGGACCACCGCGTAAGGCTAAATACTCATCAACGACCGATAGTGAACAAGTACCGCGAGGGAAAGGTGAAAAGAACCGCTACAAGCGGAGTGAAATAGATCCTGAAATCATGTGTCTACAAGGTGTCAAAGCCCTTCGGGGCGATGGCGTGCCTTTTGCTTAATGAGTCTGCGAGTTATCTTCAGTGGCCAGCCTAATGTCATTTGACAGGAGGCCCAGCGAAAGCGTGTCCGAAATGGGCGTCAATAAGTCGCTGGAGATAGACCCGAAGCGGAGGTGATCTACCCATGGTCAGGATGAAGCGCGGGTAAAACCGCGTGAAGGTCCGAACTGGTGGACGTTGAAAAGTCCTCAGATGAACTGTGGGTAGGAGCGAAAGACTAATCAAACCCCGTGATAGCTGGTTCTCCCCGAAATAGCTTGAGGGCTAGCCTCTTGTTCCTCCTTCCGGAGGTAGAGCACTGGATGAACTAGAGCCCATACCCGGGTATCGAACTCAATCAAACTCCGAATGCCGGAAGATTTAAACAAGGGAGTCAGTCGGCGAGGGATAAGCTTCGTCGGCGAGAGGCAAACATGCCAGACTAGCAGCTAAGGTGCCCAAATGCCGCGTAGTGCAAAGGCTGTGGCGATACACAGACAATGAGGATGTTGGCTTAGAGGCAGCCACCATTTAAACAGTGCGTAATAGCTGACTCATTTAGTGTCTCCGCGCCGATAATGATTGGCGATCAGCGGTATACCGAAGCTCTAGGATAGTACGTCCGAGAGGATGTGCGATCGGTAGGGGAGCATTGTTGTCTGTATTGCCGTGGCGTAAGCCGCGGTTTAAGAACAACAAGTGAGAATGCAGACATGAGTAACGATAGCCCTGTTGAATCCAGGGCCGCCGAATACCCCAAGGTCTCCTTGGCAAGGATTGTCCGCCAAGGTCTAGTCGGATCCTAAGTTGAACCCATACGGCTACAACGATGGAAACCAGGCTAATATTCCTGGACCGCCGATATTTAACCCATCCTTGGTGCGCAGGTGCAAGCAGGCCGTCGAATGCCTGTCCCGAGAGGGCGAGTTCCAGCTCTGCTGGAGCGAAGTTGTCATGACGCGCACCGCAAGAAAAAGATGGCGTATAATCAGGTGTCCGTACCAAACCGACACAGGTGGGGTCGCGCAAGAGCGCGAAGGCGTAAGAGTGAAACCTCGTTAAGGAACTCGGCAATCTAACCCCGTAACTTTGGAATAAGGGGTGCCCTCGCAAGAGGGTCTCAGTAACCGGGTCAACCGACTGTTTAACAAAAACACAGCACTCTGCCAAGTCGAATACGACGTATAGGGTGTGACACGTGACCAATGCGGAAAGATTACGGTAAGGGGTTAGCCGCAAGGCGAAGCTCTGAGCCCAAGTCCCCGTGAATGTCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATCGTGTAACGAGTTGACCGCTGTCTCGACGAGGAGCTCAGTGAAATTGTAGTGGCGGTGAAGATGCCGCCTACCCGCAGCAGGA
CGGAAAGACCCTATGCACCTTTACTGTACGCTGTAACTGTGGTCCTTAACCCTTTGCCTAGAGTAAGTGGGAGACTGTGAACCTGTCCCTCCGGGGGCAGGGGAGTCGCCAATGAAACACCACCCTTAGGGTTGAGGGCCTCTAATCTGGATTTTTCTCCAGAGAACATTGCAGTCGGTCAGTTTTACTGGGGCGGTATCCTCCTAAAGAGTAACGGAGGAGTGCGAAGGTTGGCTCAGCCCGGTCAGCAATCGGGTGACGAGTACATGGATATAAGCCAGCCTAACTGCAAGACCTACAAGTCGCGCAGATGCGAAAGCAGGCCCAAGTGATCCGGTGACGGAATGTGGAATCGTCATCGCTCAACGGACAAAAGGTACGCTAGGGATAACAGGCTGATCCTGCCCAAGAGCTCATATCGACGGCAGGGTTTGGCACCTCGATGTCGGCTCATCACATCCTGGGGCTGGAGAAGGTCCCAAGGGTCCGGCTGTTCGCCGGTTAAAGTGGTACGCGAGCTGGGTTCAGAACGTCGCGAGACAGTTCGGTCCTTATCCGCTGTGGGCCCAAAAGAAGTGAGAAGTTTAGATTCTAGTACGAGAGGACCGAATTTAACGGACCAAGGGTGTTAGAGTGGCCGTGTCAACGGCCCGGCTCTGTTGCTATGTCCGGAACGGATAAACGCTGAAAGCATCTAAGCGTGAAGCCACTTTCAAGATTGCTTCTTTATTGTAGGCGTGGGAGACCACCACGTTGATAGGCCAAAAGTGCAGATGCAGCAATGTATCGAGCTAACTGGTACTAATCCGACAAATGCTTGAATGA\n>CP001720.1/3486540-3486319 Desulfotomaculum acetoxidans DSM 771, complete genome. \nGAAATCCCGTCTGGTAAGACTCTAGCCAAGTCACCAGTAGCGAGTCTTGGACTCGATGGAGTAATTCATAGAGTTAAGCGTAGACAGGTAGGTAGTAGGCCTGAATGTGATTGAGCCCCGTAATGGGCAAACGGGAAGGTTGACGGTTTCGAAACTCCGGAAAACTATATCTTGGTACGCGATATGGCGAGTGTATTGAGACTTCCTCGGGGTCTAAGAGCC\n>AFTD01223909.1/154-1 Cricetulus griseus cell line CHO-K1, whole genome shotgun sequence. \nGAATGTGAAGACAATCCTGTGACGTCTTTCACCTCATTGGACTTCAGGGTTAACTTGATTGATGGGGCTAGAGGGCGTGTCCCCTCCTGCATCACTCCAAGTGCATACTTCATGGTGCTGTGCACTCAAACAGGACAACCTTCCCTAATGGAGT\n>MGPA01000055.1/20568-20297 Coxiella sp. RIFCSPHIGHO2_12_FULL_44_14 rifcsphigho2_12_scaffold_6640, whole genome shotgun sequence. \nCCCGATCACTCATTGAGAGGTTTCATTAAGTTGAATTAAAAGGGAATCCGCACGCTTTGATACAAAATCAGAATGAAAGCTAATGCCATACAAAACGGCTGTGTATTTATTCTGCATCATGCTAAAAGTATTAAAGCAATTGGAGCTGTCCCCGCAACTGTATGCAGCAAGTGCTGTTCTATAAACCACTGGCACCCTTGGACGGGGCTGGGAAGGTGGATGGCACGTTTGAGCTGTTAGCCAGTAGACCTGCCTTCGATGAATAATTAGCT\n>CP001472.1/654493-654256 Acidobacterium capsulatum ATCC 51196, complete genome. 
\nTATTCGTAAACGCTTTGGGATGTTCGGGAAGGCGGTGAAAATCCGCCACTGCCCCGCAACTGTAAGCGCGTTCGTGTGCTTTCTCGTCTGTTGAATACAGAGGGCACACAGAGGTCCGGGCGTAGGATGCCACTGGAGCAGATGCTCCGGGAAGGTGATTCCGCGATGCCGCCCGGCTTCGATTCCACAGGGAATGAGCGCCTAAGTCAGGAGACCGGTCCCATGCGCCTTTTTCACC\n>JRRC01082395.1/3124-5153 Gossypium arboreum cultivar AKA8401 contig_15521_1, whole genome shotgun sequence. \nGTTCAAACGAGGAAAGGCTTACGGTGGATACCTAGGCACCCAGAGACGAGGAAGGGCGTAGTAAGCGACGAAATGCTTCGGGGAGTTGAAAATAAGCGTAGATCCGGAGATTCCCGAATAGGTCAACCTTTCGAACTGCTGCTGAATCCATGGGCAGACAAGAGACAACCTGGCGAACTGAAACATCTTAGTAGCCGGAGGAAAAGAAAGCAAAAGCGATTCCCGTAGTAGCGGCGAGCGAAATGGGAGCAGCCTAAACCGTGAAAACGGGGTTGTGGGAGAGCAATAAAAGCGTCGTGCTGCTAGGCGAAGCGGTGAAGTGCCGAACCCTAGATGGCGATAGTCCAGTAGCCGAAAGCATCACTAGCTTACGCTCTGACCCGAGTAGCATGGGGCACGTGGAATCCCGTGTGAATCAGCAAGGACCACCTTGCAAGGCTAAATACTCCTGGGTGACCGATAGCGAAGTAGTACCGTGAGGGAAGGGTGAAAAGAACCCCCGTCGGGGAGTGAAATAGAACATGAAACCGTAAGCTCCCAAGCAGTGGGAGGAGCCCAGGGCTCTGACCGCGTGCCTGTTGAAGAATGAGCCGGCGACTCATAGGCAGTGGCTTGGTTAAGGGAACCCACCGGAGCCGTAGCGAAAGCGAGTCTTCATAGGGCAATTGTCACTGCTTATGGACCCGAACCTGGGTGATCTATCCATGACCAGGATGAAGCTTGGGTGAAACTAAGTGGAGGTCCGAACCGACTGATGTTGAAGAATCAGCGGATGAGTTGTGGTTAGGGGTGAAATGCCACTCGAACCCAGAGCTAGCTGGTTCTCCCCGAAATGCGTTGAGGCGCAGCAGTTGACTGGACATCTAGGGGTAAAGCACTGTTTCGGTGCGGGCCGCGAGAGCGGTACCAAATCGAGGCAAACTCTGAATACTAGATATGACCTCAAAATAACAGGGGTCGAGGTCGGCCAGTGAGACGATGGGGGATAAGCTTCATCGTCGAGAGGGAAACAGCCCGGATCACCAGCTAAGGCCCCTAAATGACCGCTCAGTGATAAAGGAGGTAGGGGTGCAGAGCTAAGGATACATGGGTACCTTTCCTTTTTAAACTTACCATTGTCATGTCTTGACATGGTCTTACGTGGTATCCTTGCATTATGAACTCACCATTGCCATGCCTTAGCATGGTCTAACATGGGATCTTTGTCTTATCGTAGTTTATCAATGCCATGTCTTGACATGGTCTTACATGATTTCCTTGCCTTGTAAAACTTACCAATGACATGCCTTGGCTTGGTCTTATTTGGTATCCTTAAACCCTAATGTCATGACATTTGTATCTTGCACATGATATTTCGTACGGCCCTATGAACCTCGGACTCAGTTTGCCCTTACGGCCAAATCTGAGTATCTTTTTCAAAGGTGAAACTTTAAGAAACACTTTGTCTCCCACCTGATACTCAATATCTCTTCGTTTTAAATCCGTGTACTACTTCTGATGATCTGATGCTGCCTTCAGACTTTCACAAATTATTTTTATTTTCTGCTCAGTATCTTTAATCAAATCAACTCTGAAATTTTACTTTCACTGAGCTCAGTCCAAAACAATGGTGTACGGCATTTACGACCGTACAAAGCCTCGTAAGGT
GCCATCTTAAGACTTGATTGAAAACTATTGTTGTAAGCGAATTCAATCAAAGGTAAATACCGCTCCCATGAACCACTAAACTCAAGGATTCAACATCTCAACATATCCTCGAGTATCTGAATTATTCGTTCGGATTGACCATCGGTCTGAGGATGAAAAGCGGTGCTAAAATGCAACTTGGTACCCAAAGCTTCTTGCAATTTCTTCCAAAATCGTGAGGTGAATCTCGGATCTCTATCCGACACAACAGAAATCGGTACCCCGTGGAATCGCACAATCTGAGAAACGTACAATTCAGCTAGTTTATCCAATCAAAAATCCGTACGCACGGGGATAAAGTGAGCCGACTTAGTCAGTCTATCAACAACAACCCAAATCGCATC\n>MEZX01000002.1/385086-385203 Candidatus Berkelbacteria bacterium RIFCSPLOWO2_01_FULL_50_28 rifcsplowo2_01_scaffold_16, whole genome shotgun sequence. \nGTTGGTGCTTTTTGCGGTTGGGGTACACCTCGTTACATTCCGAACCGAGCAGTTAAGCCAGCCAGCGCCGATGGTACTTACGGCATTCAGCCGCCGGGAGAGTAGGCCAGCGCCAACA\n>LNFO01001542.1/1-433 Phytophthora nicotianae strain race 0 contig1542, whole genome shotgun sequence. \nAACAGGCTGATGACTCCTAAGAGCTCCTATCGACGGAGTCGTTTGGCACCTCGATGTCGACTCATCACATCCTGGAGCTGAAGAAGGTTCCAAGGGTTCGGCTGTTCGCCGATTAAAGTGGTACGTGAGTTGGGTTTAGAACGTCGTGAGACAGTTTGGTTCCTATCTTCTATAGATATTTTGAAAAATGAAAGAATCTAACTCTAGTACGAGAGGACCGAGAAGGGTAAATCTCTGGTGTATCGGTTGTTAAAAGGCATCGCCGAGTAGCTAAATTTATTTTGGATAGTTACTGAAAGCATCTAAGTAAGAAACCATTCTTAAAAATTTTTCATATAAAAACTGTAAAAGACGATTACATTAATAGGTTTTAAGTGTAAGTGTTGTAAAATATTTAGCTTAAAAATACTAAAAGTTTTAAAAATTAAAATAT\n>CP012602.1/5017483-5017399 Bacillus sp. FJAT-18017 genome. \nATCTGACAAAGGCAAACCTGTCTAAAGGCAGGGACGCAAAGCGATGGGCCTACCCGGGAAACCGAACGGCTGCCACGCCGCCGGA\n>KI391971.1/1387979-1387852 Granulicatella elegans ATCC 700633 genomic scaffold supercont2.1, whole genome shotgun sequence. 
\nTGAGCGTCATGATGGTAATAATCATCTTGCGGTTGTGAGATGAGAAGTCTGAGGCTACTGTAAAGTAGCCTTATTCTTTCTCATGATTATTTAGTCTAGCTCGCTGTCTCCCCGCCAGCGTTGGCGGG\n>CAIX01000365.1/7381-7448 Albugo candida, Ac Nc2, WGS project CAIX01000000 data, contig: AcNc2_CONTIG_365_length_25035 \nAGGGATGTAGCTTGTCGGGAAGGCGTTCGCTAATCGAAAGGACCCGGGATCGAAACCCGGCTTCCCTT\n>HG322950.1/5060379-5060502 Pseudomonas knackmussii B13 complete genome \nTCTGAGATGGCGCAGGACGCGCCATCCGCGCAAACGCGCCGCCCGGGCAGCGGTTGCGGACGGGGCAACGTGGAGCCCCGCGGCAGACCGTGGCGACCAGGGACGGCCGCCTCGGAGTGCACTT\n>DS562870.1/37046228-37046111 Cavia porcellus supercont2_15 genomic scaffold, whole genome shotgun sequence. \nTTGTGTCTAGATGTAGCCCCAAAACCTTATGCTCAAACTAAAGAGATGTCTTTCTATGGTCTGTTGGCCATTTCAGAACTTGGGCGTGAAGTGGTCAATTCATCAGAAAGAAACAGAT\n>AGTP01080057.1/11891-11451 Ictidomys tridecemlineatus contig080057, whole genome shotgun sequence. \nTCTGTTGAAGTGGATGCTCATCAGGGACCCCCTCCTTAGCCAATGGCACAAGCCATCGTGGAAACAGTGCCAGGTGGGTGGTTTGACTGGGGTGGAACACCTGCCAAACAGTGATGCCGGTGTCCTAAGCCAGCTCAGGAGGGCAGAAACCTCCTGTGGTGCCGAAGGGCAAAAGCTCACTAAGTCCTGGTTTTTCAGGATGAATACAGGCGGTGAAAGCAGAGCCTCATGATCCTTCTGATCTTCTGGCTTTCAGCAGGAGGCATCCGAGAAGTTGCACAGGGATAAGTGGCTGACGGCAGCCAAGCCTTCATAGAGCTGTCACTGTTGGACCTGGCCGTCTGCTCTTCCTTTCGATGTGCAGCAGAATTTGTCAACCACTGGACTGTGTGTCTAGTGACCGTGAATGTGAGCTGGGTTTAGACCATCCTGAGACAGGAC\n>BDFN01001543.1/367-1030 Ipomoea nil DNA, scaffold: scaffold1543, cultivar: Tokyo-kokei standard. 
\nTATGGGGTGTGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGTTAACGAACGAGACCTCAGCCTGCTAACTAGCTATGCGGAGGTATCCCTCCGCGGCCAGCTTCTTAGAGGGACTACGGCCTTTCAAAGCCGCGGAAGTTTGAGGCAATAACAGGTCTGTGTCCTATTACGTTGGCCTTCGGGATCGGAGTAATGATTAACAGGGACAGTCGGGGGCATTCGTATTTCATAGTCAGAGGTGAAATTCTTGGATTTATGAAAGACGAACAACTGCGAAAGCATTTGCCAAGGATGTTTTTCATTAATCAAGAACGAAAGTTGGGGGCGAAGACGATCAGATACCGTCCTAGTCTCAACCATAAACGATGCGACCAGGGATCGGCGGATGTTGCTTTTAGGACTCCGCCGGCACTTATGAGAAATCAAAGTCTTTGGGTTCCGGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACGGAAGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTTACCAGGTCCAGACATAGTAAGGATTGACAGACCTGAGAGCTCTTTCGAGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTA\n>HE616749.1/573542-573633 Torulaspora delbrueckii CBS 1146 chromosome 8, complete genome \nAATAATGATGAAAAAATGGTCGCTTATCAATGCTTCAGATCTATCTGTGATGGAAACAAATAAATTAACCATTCAGAACCGCTACACTGATT\n>CP022657.1/1323203-1323416 Tumebacillus algifaecis strain THMBR28 chromosome, complete genome. \nAAATAGGCAATGATGGAGCGAGTAGCGTTTTGTAGGATTGTGCAGAGAGCCGGTGGTTGCTGTGAACCGGACAGTCCGATCACGTGAAGTACACTCCGGAGCCGCTTGGAGGCAATGCCAAGCCGGTCGCGCGAGTGATCGTTACGTCAATGAAGGAGTTTCTATTTTTGAAACTGCTTAGGGTGGTACCGCGAGTTCAAACCTCGTCCCTATT\n>CP011601.1/33522-33359 Kluyvera intermedia strain CAV1151 plasmid pCAV1151-296, complete sequence. \nTGGTGCTGGAGGCTTTTGCCCCAGCCAGCGGTAACACTGTTTGACTGTGGTAAAAGCAGAAAGCCCCGAGTAATTTTTCAATTAACCTGTACTGCACCCATTTTGTTGGACGATGAAATGGAATAGTCCCTGATATGTCAAAGCCAAAATACCCCTTCGAAAAG\n>AMPR02000442.1/14789-14883 Cupriavidus sp. HPC(L) contig68, whole genome shotgun sequence. \nCACTCCGAGGAGCGTTGCAACGGACGGCGCGCGGGCCCAACCCCGCATTCTGCCATCCGCCAGGCTCGGAATGTCTTCAACGGCGCTCGCTGAAC\n>CM000811.1/53837939-53838120 Oryctolagus cuniculus chromosome X, whole genome shotgun sequence. 
\nATCACTTCTCGGCCTTTTGGCTAAGATCAAGTATAGTAATCTTAGGAAATGTCCCTGTCAAATAGCAAGAACTCAGAAATTATAACAATGTTTAGTGATATTAAAGGTTCTAATGTACCTGTCTCATACCTAGGGAGCTTGTATGCTTTTTCTACTTTTGCAAAATTTCTCTAAAGACTTCT\n>KQ059250.1/49614-45799 Gossypium hirsutum cultivar TM-1 unplaced genomic scaffold scaffold2565.1, whole genome shotgun sequence \nCGACCCCAGGTCAGGCGGGATTACCCGCTGAGTTTAAGCATATCAATAAGCGGAGGAAAAGAAACTTACCAGGATTCCCCTAGTAACGGCGAGCGAACCGGGAAAAGCCCAGCTTGAGAATCGGGCGCCATCGGTGTTCAAATTGTAGTCTGGAGAAGCGTCCTCAGCGGCGGACTAGGCCCAAGTCCCCTAGAAAGGGGCGCCGGAGAGGGTGAGAGCCCCGTCGTGCCCGGACCCTGTCGCACCACGAGACGCTGTCTACGAGTCGGGTTGTTTGGGAATGCAGCCCTAATCGGACGGTAAATTCCATCCAAGGCTAAATACGGGCGAGAGACCGATAGCGAACAAGTACCGCGAGGGAAAGATGAAAAAGACTTTGAAAAGAGAGTCAAACAGTGCTTGAAATTGTCAGGAGGGAAGCGGATGGGGGCCGACGATGCGCCCCGGTCGGATGAACAAGTACCGACGCGGGTCGTGGCGGCGGCCCAAGCCCGGGCCTTTGATACGCCCGTGGAGACGTCGTCGCCTCGATCGTGGGATTCAGCACGCGCCGCCTCGGCGTGCTTCGGCACCTGCGTGCTCCGGGCGTCGGCCTGCGGGCTCCCCATTCGGCCCGTCTTGAGCCCCGGTCGGATGTGGAACGGCGAGAGCCGGTTTGCAAATTGGCTCGGGGCGTGGACTGACGCGGGGCGTGGCGGCGGCCCAAGCCCGGGCCTTTGATACGCCTGTGGAGACGTCATCGTCTCGATCATGGGATCCAGCACGCGCCGTCTCGGCGTGCTTCGGCACCTGCGTGCTCCGGGCGTCGGCCTGTGGGCTCCCCATTCGGCCCGTCTTGAAACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAACGGGCTGGAAAACCCGTAAGGCGCAAGGAAGCTGATTGGAGGGATCCCTCACGGGTACACCGCCGACCGACCTTGATCTTCTGAGAAGGGTTCGAGTGAGAGCATGCCTGTCGGGACCCGAAAGATGGTGAACTATGCTTGAGCGGGGCGAAGCCAGAGGAAACTCTGGTGGAGGCCCGCAGCAATACTGACGTGCAAATCGTTCGTCTGACTTGGGTGTAGGGCCGAAAGACTAATCGAACCGTCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGAGCCCTTAGTGAGTTCTATCGGGTAAAGCCAATATTAGAGGCATCGGGGGCGCAACGCCCTCGACCTATTCTCAAACTTTAAATAGGTAGGACGGTGTGGCTGCTTCGTTGAGCCGCCCCACGGAATCGAGAGCTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGGAAGCCGGGTTACGGTGCCCAACTACGCGCTAACCTAGAACCCACAAAGGGTGTTGGTCGATTAAGACAGCAGGACGGTGGTCATGAAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCCCCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTTAAGCGCGCGACCTATACCCGGTCGTCGGGGCAAGAGCCAGGCCCCGATGAGTAGGAGGGCGCGGCGGTCGCCGCAAAACCCAGGGCGCGAGCCCGGGCAGAGCGGCCATCGGTGCAGATCTTGGTGGTAGTAGCAAATATTGAAATGAGAACTTTGAAGGCCGAAGAGGGGAAAGG
TTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGAGACGGGGGAAGCCCGTCCGATAGCGCGTTCAGCGCGAGCTTTGAAAGGGAATCGGGTTAAAATTCCTGAACTGGGACGCGGCGGCTGACGGCAACGTTAGAGAGTCCGGAGACGTCGGCGGGGGCCTCGGGAAGAGTTATCTTTTCTGTTTAACGGCCTGCCCACCCTGGAAACGGCTCAGCCGAAGGTAAGGTCCAGCGACCGGAAGAGCACCGCACGTCGCGTGGTGTCCGGTGCGCCCCCGGCGGCCCTTGAAAATTTGGAAGACCGAGTGCCGTCCGCGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGGTGAACAGCCTCTGGTCAATGGAACAATGTAGGCAAGGGAAGTTGGCAAAATGGATCCGTAACCTCGGGAAAAGGATTGGCTCTGAGGGCTGGGCACATCGTGTGGTGTCCGGTGCGCCCCCGGTGGCCCTTGAAAATCAGGAGGACCGAGTGCCGTCTGCGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGGTGAACAGCCTCTGGTCAATGGAACAATGTAGGCAAGGGAAGTTGGCAAAATGGATCCGTAACCTCGGGAAAAGGATTGGCTCTGAGGGCTGGGTACGGGGTCCCAGTCCCGAACCCGTCGGCTGCCGGTGCACTGCTCGAGCTGCTTCCGCGGCGAGAGCGGGTCGCCGCGTGCCGGCTGGGGGACGGACTAGGAACGACTCCTTCAGGGGCCTTCCTCGGGCGACGAACAGTCGACTCAGAACTGGTACGGACAAGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGTCCCTGCGGATGCTCACGCAATGTGATTTCTGCCCAATGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTGTCTACTATCCAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTCACTCTAGTCTGACTTTGTGAAATGACTTGAGAGGTGTAGGATAAGTGGGAGCTCTCGGGCGAAATTGAAATACCACTACTTTTAACGTTATTTTACTTATTCTGTGAATCGGAGGCGGAGCACGACCCCTCTTTTTGGACCCAAGGTTGGCTTCGGCCGACCGATCCGGGCAGAAGATATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACACATGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGCTCGTTTGATTCTGATTTCCAGTACGAATACGAACCGTGAAAGCGTGGCGACGATCCATCCTGGCGATGATCTGGCGAGCCATCCCAGGATATACAAAACGGCGCAACGAGTCCCCCCCCGGAATTTGAAGCTAAAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCAATCATTGTGAAGCAGAATTCACCAAGTGTTCGATTGTTCACCCACCAATAGGGAACGTGAGCTGGAGTTAGACCGTCGTGAGACAGGTTAGTTTTACCTTACTGATGGCCGCGTCGCAATAGTAATTCAACCTAGTACGAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGTGCGAAGCTACCGTGCGATGGATTATGACTGAACGCCTCTAAGTCAGAATCCGGGCTAGAAGCGACGCACGCGCCCGTCGCCCGATTGCTGACCAGTAGTAGGGGCCTTTGGCCCGCAAGGGCAGTGTCGTAGGTGCAGCGACCACGACGGACAAGTCGCGGGCGCCTCCTTG
GAGCGTAATTCCCATCGAGCGGCGGGTAGAATCCTTTGCAGATGACTTAAATACGCGACGGGGTATTGTAAGTGGCAGAGTGGCCTTGCTGCCACGATCCACTGAGATTCAGCCCTTTGTCGCTTCGATTCGT\n>ATMG01007873.1/439-612 Angomonas deanei Cont7876, whole genome shotgun sequence. \nCCCGGGGGGTACCCCCCGGGGGGGGGGGTAAAAAAACCCGGGGGGTTAAAAAAAACGGGGGGGGGGTTAAAAAAAAACCCCCCGGGGGTTAAAAAAAAACCCGGGGGTTTTTTTAAAAACGGGGGGGTTTAAACCCCCGGGGTTTTACCCCCGGGGGGGGGGAAAAACCCCCCC\n>GL010040.1/62122050-62122364 Loxodonta africana unplaced genomic scaffold scaffold_13, whole genome shotgun sequence. \nGGATGTGAGGGCAATCTGGCTGAAACACCTGTCACCGCATTGATTGCCAGGGCTGACTGGATGATGCTGCTCACCCTCATCCCTTAATTTCTCCTTCTGTGTCTTTCTGGAAGCCTTGGGCTTGGTGAAAAGGGAAGACTTTCCCAAAGACAGGAGGCCATTCTGCAATTATTAAAGATATGTGGGTAGTAGGTTGACCAGCTTTCCCTTTTTACCTGGGACTGAGGGTTTCCTGGGATGCACGACTCTAGTGCTAAAACCAGGAAACCCAAAAAACCCAGTGCCATTGAGTTGATTCTGACTCATAGTGACCCT\n>LFJF01048753.1/46-1 Macrostomum lignano unitig_48821, whole genome shotgun sequence. \nATACTTACCTGGCGCGGGGGATACCGTGATCAAGAAGGCGGTGCCT\n>URS0000D694FA_12908/1-95 unclassified sequences DUF3800-IX RNA \nTTCCCCTCGGCGAAAGAGTGCCCTCATTGGGCGCGTGCCAGGTGGTTGAATGCTCTGCATAAGAGCCATAACCTGGATAGCCGAGGCGGTTTTAT\n>GL896944.1/3131193-3131114 Mustela putorius furo unplaced genomic scaffold scaffold00047, whole genome shotgun sequence. \nGGAACTTCAAAAAGGGTCGTCCTTCCTGTGCTTGCTTTACTGATGGTGCATTTTTGAAGTGCGTCCCATTTTTCAGAATC\n>AZAF01012014.1/4245-4334 Dictyocaulus viviparus strain HannoverDv2000 D_viviparus-1.0_Cont414.7, whole genome shotgun sequence. \nTATATTCACACAATCGGCGAGCGGTTTTCACTGTGATCTGAGAGTTCATACTTCTGAGATCATTGTGAAGGCCACTTGCCTTGTGCCGAT\n>AP006878.1/1476852-1476910 Thermococcus kodakarensis KOD1 DNA, complete genome. \nACCGATGAGGAGTGTCATCCCTCCTGATGTCGAGATGATGACATTATCCCCACCTGAGG\n>CP004044.1/1196775-1196896 [Clostridium] stercorarium subsp. stercorarium DSM 8532 chromosome, complete genome. 
\nACAACAAAGTAGAAGTGTCCACTTCTCACCCTGTGTCCTGTTGACTTCAGGGTTTAAATCGTAGCAGTATGTTGCTGTGATTTAACGCAGGTGAAGTGGCTTACCTGCTTTTTTATTTGTCA\n>JMSN01000007.1/154622-154723 Tilletiaria anomala UBC 951 K437scaffold_7, whole genome shotgun sequence. \nGGCCAATTGGCGCAATGGTAGCGCGTTGCTCTCCTACATGTGATGATTGCTTCATGCGCTTGGGGCAAGCAGAGGTTGCAGGTTCGACCCCTGCATTGGTCG\n>LOHF01000026.1/9999-9927 Pseudomonas caspiana strain FBF102 scaffold00026, whole genome shotgun sequence. \nTGGCCTGAAGCATTGGCGGTTGATGCACTGGCCTCATAAGCCAGCGAAGGGGGTTCAAGTCCCCACAGGCCAA\n>AFTD01049056.1/8014-8294 Cricetulus griseus cell line CHO-K1, whole genome shotgun sequence. \nGGACAGTGTGGCTGTGATATCACCCCATTGATTGCTAGGGGGTGGTCCTGATGTCCTTCTCATCACAGCTCCATGTATGTTCCCTGAAGCCACTTGCTGGTTTGAGGAGGACCTTTTTAGGGGAGGACCAGTGTTTTGTCAAAGATGTACAAATAACTACACTCTCCAGCTAGAACCTCCAAACCAGCTTTCAAGGTCCATTTGTAGGGAAATGTGGTGGTCGAGCTTCGAAGACTCAGGGCATACCAAGTGAGGCAATGCGTGGCAGTCTGCCTTCCTTT\n>CP000102.1/1672674-1672743 Methanosphaera stadtmanae DSM 3091, complete genome. \nAACAAATAAGGTGATGAGGTTCCACCTATTTAACTGCCAGTGATTACTGGATGATGACTTCTATTTTTAA\n>LM433890.1/66331-66460 Nippostrongylus brasiliensis genome assembly, scaffold: NBR_scaffold0000505 \nATGCGTGATCTCAACACGCGTACTGCCTCCTACGGCGTACGTGTCTGTAATGCACGCTAGAACGAATGCGCCGGATTTCGCTAGCACCGCGTCCAGTGACCGGAGTTTGATAGTAGACCGGGGCACATTA\n>KV440972.1/762318-763371 Phycomyces blakesleeanus NRRL 1555(-) unplaced genomic scaffold PHYBLscaffold_2, whole genome shotgun sequence. 
\nGGTCCGTACTTTGAGCGATTCTACCTGCATTTACTGCAGTGGAAAAGAAACCAAAAGGGATTCCGTCTTGGACTTTATTGTTTGAGATGGAGAAGCTCCAATGTTTGAACCGGAGTAGTCTTTTGACTGCTCCGGATTGTGAACTAGTGAACTGCTTTTCCAGACATACCAACAAGTCAGTAGCCTTCACTCCCTGGAAAAGGTTACTGGAGGGTGCAATCCCCTCACCTTGTCTTGAGTTCTTGTCTTTGTGTTAAGTAGCTTCCGATGAGTCGGGTTGTTTTACAAACTCCCTAATCCTGGTGAAAAGTTTCATCGAAGGCTAAATATACTTATAAAAAACCAACTGAACACAAGTACCGTAAGGGAAAGTAGCTCTTAGTGTAGAGCATACTGGACGTTAAAGACCTTCCTGAGCCACTCATATGAAGGCGAAAGCCGGATGAAATCCACGTCAGTTTTTTCTGTGTTGTGCGGCACATAACATGGAGAAGACTGAGGAACGCAGAGGTAGCTTTATGCTATTTTCTTAGGACGTTGGATATTGGCTCTCCAGATTTTGTCCTTTGGGGCATGTCAAGATTGTCACATAAAGGTGCAAGTATAAGGGTGTATCACCTGGATGCGTAGAGTTTTTTAAATTCGTTGAGCACCTGGACGTGAGGTAATACAGGTAGATTCCAGCAGAATCGACAGATTACCCAGTACAATCGCCTGTATTTTACTGCTTCCTGTTGAAATGATCCCTGTGCTTTTCAAGTCCCTCATTGCTTAGACTTTGATACTTGTAACCCACGCTCTGGTAAACAGAACTGGACATGAGGGACGAACCCGAAGCAAAGTTAAGGTGCCTAAGTAAATGCTATGCTGTTCACTTGGGTGTCTCAGACACCTGTCCCGAGCAGTTTGGCATTAAAGCATTTCACCGATACTTTGCCGTCATGGTAAATTTGATGCCATGCCGAGTAGGCAGGAATGAGGGTTGTTGAGAAGCTTGGGTGTAAACTTGAGTGGATCGGCCTTCAAGCGCAGGTCTTGACAAAAAAATCTTTGT\n>GL010085.1/8876859-8876953 Loxodonta africana unplaced genomic scaffold scaffold_58, whole genome shotgun sequence. \nTAGCCTGGGCGGCGGCGGGAGCCTGCGCGGCCAGGTGGGGAGGCGGCAGGGCCCGGGCGGGCGCCTGCTGTCTGCCCAGAGCCGGCCTTTGTACA\n>HF997045.1/49466-49290 Roseburia sp. CAG:50 genomic scaffold, scf107 \nATATCAAATAGAGGCGCGGTTTACCGGGTAGCAGCAAATGATAAGGAACATTATTTCCAAGGTTGTCTGTGAAGGGGTGGATCGCCGAAAGACCGGATCTGTAATGGGAGAAGGACTTGGGGCAAAGGCGGACAGCTTTTGCACTGTCATGTGAAAACGTGGGGCGCTATTCATCAG\n>CP002734.1/423330-423196 Pseudopropionibacterium propionicum F0230a chromosome, complete genome. \nAACTGGCTAGGCTGTCCCGCGACGACTGACCATTCAGCTTGCCGACAACGAAGGAATCCGGTGCGAATCCGGAGCGGTGCCGCCACTGTGACCACCCGGGTGGGAGCCAGATACTTCGGGCCAGCCAAGACCGAA\n>AFYH01035016.1/408-649 Latimeria chalumnae contig035016, whole genome shotgun sequence. 
\nGTGCCGCACCAGAGACTGAAGTCCTCTGTTTATCCACAGAACAGGTACAGCAAGGGCAGCGGCTGTGCAGGCTTCCCCTCGTATTGTAGAAAAGGCTTTCTCTCATTTTGTACTTATGGCCAGATCCTTTCTGCAGTAGGGCCCATTGCCCTGGCAGTGTGCCTCAACCCTGTCCTGGTGGGACTGCCTCTACAGGGTGAGAGGATAGTTCAGTCTCTATGCCCATTCACTCCTTGGCCTCT\n>AAQR03046981.1/275629-275572 Otolemur garnettii contig046981, whole genome shotgun sequence. \nCAAAAGGCTCTCTCTTTCCTCTTTGCAGAGAGCCACCCAAATTGTAGTAAAATTATAT\n>CM000866.1/73130079-73130313 Callithrix jacchus chromosome 11, whole genome shotgun sequence \nGAATGTGAGGGTGATCTGGCTGTGACATCTGTCACCCCATTGATCACCAGGGTTGATTTGGCTGATCTGGCTGGCTAGGTGGGTGTCCCTTCCTCCCCCACCTCTCTGTGTTCATCCCTCCCAATGTGACCATCCTTGATACAGGGCATATGAGTAGCTGTTATCCCCCTGCTAGAACTTCCAAACAAGCTCTCAAGGTCATGAGAGAATGGGGCAGATCTTGTCCAGTATAGTT\n>AKKU01000011.1/303476-303556 Alishewanella agri BL06 contig011, whole genome shotgun sequence. \nGGATTTTTAGCTCAGCTGGGAGAGCACCGCCCGCTTTTTACAAAAATACGGTTGCCACTGGTTCGAACCCAGTACAATCCA\n>JPDO01000048.1/47729-47855 Acidomyces richmondensis BFW scaffold_48, whole genome shotgun sequence. \nGCTTCGATGGTTTAGTGGTAGAATTTCACCTTCCCAAGGTGGAGGCACGGGTTGTAGGTTGCTCACCTGATTCTCGTAAATTTCCGCATCATACTTATCAATGTTGCAGCGATTCCCGTTCGAAGCA\n>URS0000D6D023_12908/1-115 unclassified sequences EGFOA RNA \nGACTGCCCAGATGTGCGAAAGCGACCGTCCTAGTCCACGAAAGTGGAGGATAATGCCCTGAAAGGTGAAAGTCCTTGCTCTGTAAAGCTAGACCTGGGGGAGTTAGAGGGGTAGC\n>CM002905.2/43709859-43709995 Danio rerio chromosome 21, GRCz11 reference primary assembly. 
\nAGCCAAAGCGTTGAGTTCAGCTCTGGGTTTCTCCCCAGTTCTGCTAATTAATCTTTGGTACAGAAAATGGCTGAGTGGTGATCAACATGAAGGGGTTATACTTTGACCTCCTTTATTAAACCCTTCAGCCGACATGA\n>FWFW01000005.1/209292-208875 Pacificibacter marinus strain CECT 7971 genome assembly, contig: 0005 \nACGGATGGCTGGATGACCGCGGGTTCTGGGCGCGCAAGCGTACTGGGACGCGAGGAAAGTCCGGACTCCATTGAACAACAGTGCCGGGTAACGCCCGGCGGGGGCAACCCTAGGGACAGCGCCACAGAGAACAGACCGCCCTACGCGCGCGCAAGCGCACGCTGGGGTAAGGGTGAAACGGTGGAGTAAGAGCCCACCGCGCGAGCGGCAACGCAAGCGGCACGGCAAGCCCCACTGGGAGCAATGCCAAATAGGGGTTTCGTGTGAGGCACTGCGTTCGCGCAGAGTGATCATAGGGAGGTTCAAGCCCGAGAGACCCGGGTTGGCAGCTTGAGCGTATTGGTAACAATGCGCCTAGAGGAATGGTCATCGAGGGGGCAACCCCAGACAAAATCCGGCTTATAGGCCATCCGTGCAT\n>AGTP01074074.1/1268-1332 Ictidomys tridecemlineatus contig074074, whole genome shotgun sequence. \nTCCTTGTTCAGATCTGTGTCCAAATGATTTCCTGTACTTGCAGGGGACAGGTGGGGTTTCAGAAG\n>FRCC01000012.1/1582-1684 Flavobacterium flevense strain DSM 1076 genome assembly, contig: Ga0131122_112 \nTTTGCGTTAGGGATGGAAGCGGCATCCTTTTGTGAGAGCAGTAATTTTCAGGTTTAAACTACTATTACCCGAACAAAAGATACAGCGTACAGCCCGACCTTGT\n>CM002818.1/210608794-210608329 Capsicum annuum cultivar Zunla-1 chromosome 7, whole genome shotgun sequence \nAAGGTAGACGTTTATGACATTTTAAGACAATGAACCTGTACAATTGACCACTCTAAAAGGGCTAGAATTCTAACATTATGTTAGGACCTGAGGACCAAGAGATAGTCTCAGATAGACAATTTTTATGGGGCGTAGGCCTACTAAAAGGTAATGGAGGCATGCAAAGATTTCCTCGGGCCGAACAAAGTTTGTCCCTCGAGTTCAAAGGCAGAAGGGAGCTTGAATGCAAGACCCACCCATTGAGCAAGGACAAAAGTCTGCCTTAGTGATTCAACGGCGCCGAGTATAAGGCCCGTCGCTCAACTGATAAAAGTTACTCCTACAGATAGCAGGTTGATCTACCCCAAAAGCTCACATCGATGGAAAGATTTAGCACCTCGATATCGGCTCTAAGCCACCTAGGGTTGTAATATGTTTCAAGGGTTGGGCTGAAAATCAAGACCGGGCCGCTTTGTGGGACACTAGG\n>AGTP01053200.1/11304-11443 Ictidomys tridecemlineatus contig053200, whole genome shotgun sequence. \nGGGGATGTGGCTCAGTGGTTGAGTGCCCCTGAGTTCAATCCCCAGTACCAAAATTAATTAATTAATTAAAATAAAAAATAAAGGACTATGGATGTAGCTCAGAAGTAATGCACCCCTGGGTTCAATCCCCAGTACCCCCA\n>AYUG01121489.1/14996-14569 Fukomys damarensis contig121489, whole genome shotgun sequence. 
\nTTATTGGTTGATGTCATGATAGCAGCCATTCTTTCTAGGGTGAGGCGGAATCTCAGAGTTGTTTTTATCTGCATCTCTGGAATGAATGACTAGTAACTCAAAAACAGCTCATTGAACCCTGCCCCCTCAGCCTGGTGGAAGGGAGGGGGAGCAGGAGCCTGCAGCTTGGGTGACTCTAGATAACTTCAGGCTAATTGCACAGTGTGCACAGACACACACACGCGCACGCACCCCGAGGTGGCATCAACCCATTTGAACATCAGCCCTATCAACTTTCCATGGTAGTCATCATGCCTACCATGGTGACCTCGGGTGATGGGGAATCAGGGTTCAATGCCGGGGAAGGAGCCTGAGAAATGGCTACCACATCCAAGGAAGGCAGCAGGCATGCAAATTACCCACCTCTGACCCGGGGAGGTAGTGATGAA\n>JJRU01010803.1/22820-23049 Picoides pubescens contig10803, whole genome shotgun sequence. \nGTGCATGCTGGGCTACACTTCATGAAATGGAGCTCAGGAGCAACCAATTGCTTAGCTCCTCCTAACATGTCCAACTGGCTATGAAAAGCTGGAGGTGCTGCACAGAACAATGAAGAGGAGCTATCCCACATATTAATCTGCTTATCAAGGATTGCCTTCTGTATAGGTTAATGGGAAGCATGTAAAAGGGGGGGGGGGGGGGAAGAGGGGGGGAAAAAAAGGGGGGGAAA\n>LM550152.1/1576-1768 Onchocerca flexuosa genome assembly, scaffold: OFLC_contig0009332 \nAATGTTGTTGCGATAGTAGTCCTGCTCAGTACAAGAGAACCGTCAGATCATTGGGTCATTGGGTTCATGTGCCTGACCGATTGGAAAATTGTACGAAGCTACCATCTGAGGGATTATGACTGAACGTCTCTAAGTCAGAATTCCTTTATCAAATTTTGTATTTTGCGTTACAAATAAAACCGAAAAAAAAAAA\n>AAIZ01025588.1/144-25 Drosophila persimilis strain MSH-3 cont1.025587, whole genome shotgun sequence. \nCGACGATCGGGTCTTTCGAGTGGAGGGGAGAGTGTTGGAGTTGGCGGACATGGAGTGTTCCACCATGAACCTCGTCTGCCACTCTCATCTCGTCCACCCGCTCGAGAGGTTGCGATCGTC\n>BX284602.5/14617143-14617209 Caenorhabditis elegans chromosome II \nGTGCGATGAAGGTTAATGATAAGTTTCGGCTGACTCAAATTGATGACACCTTTAATATGCTGAGCAC\n>NHBU01000111.1/1-68 Bacterium TMED15 isolate TMED15 146485, whole genome shotgun sequence. \nTGACAAACATGTAGTAGCTTTTTTTGAGATGTTTTCGGACGCGGGTTCGACTCCCGCCACCTCCAATT\n>AACT01044066.1/1177-1 Ciona savignyi cont_44066, whole genome shotgun sequence. 
\nAAACTTTGCATTAATCCTGAGAATTTGGTATTTTTGTATGATTATGACTTTAAGAGCTTTAAGAATCTTAGCAAAGAACAATTGACAATTACACTTGTGGATCATCATCACATACAAAAGTGAGTATTTGTCGTCAAAAAAATCCTGGGTTGAACTACAACAATAGTAATGTCTCAACCATGCAATAAGCTGCAATAGCTCTGGTAATCATGCAGTAAGCACTAGGTATTTTTGACTTGCTGTGTGATAATGCCTCTTGTGTTTTTTCATTTACATTCTTTTAATTATTCCTTTTAATAAAGAGAAAACTCATAAAGGTTTTTTCTAATTTTTTGTGTTATGTTAATAGTTCCCATGTGCTTCATGGGTGTGAGATCACACATGACAGAAATATTGGATCATCGCCCACAAGAATATGCTACTGCACCTGGCGTTGAAGTTTCTATTTGTAAAGTGGGTTCATGCAGTACTCTAATTGCTACGAGGGTTTTGCAGAATTTGAGAGAAGATCAACTTCTACCCGAAGTCGTCACTTTGCTGTTAGGTTGGCGCACTAGCGTCGGACGAGGGCCGCGACCGGCTGGGCGGCGGGCAAACGGCTCCGGGCAAGGTAACCCCGCTTCGGCGGGGTGCTACAGGCCCGGTGCGCGCAAGGGTCGCCGCCCGGTCGAGGAGAGATGCGCGCCGCACCTGCCCCGTTCGCGGGGCCGGGGAAGCCGTTCGAGCAGCGTCGTGTCGCGGTCCGGGACTGTCCTCAGTCCCGGGTCGTCTCGGCGCGGTTCCGAGCGGTCGCTCCCTCGCGAGGTGCCGCGGGTCAGCGGCTGACGCCAGCCACCTTCCCGACCCGTCTTGAAACACGGACCAAGGAGTCTAACATGTGCGCGAGCCGCGGGGCAGTACGAAACCCGTAAGGCGAAATGAAGGTGAACGCCGGCGCGGTCCGGCGGAGGTTGGATCCCGTCCCGTCGGGGCGGGCGCACTACCGGCCGATTTTTTCCGCCCTGTCGGCGAGGTCGAGCGAGAGCGTGCAAGTCGGGACCCGAAAGATGGTGAACTATGCCTGAGGAGGTTGAAGCCAGAGGAAACTCTGGTGGAGGACCGTAGCGATTCTGACGTGCAAATCGATCGTCAAATTTGGGTATAGGGGCGAAAGACTAATCGAACCGTCTAGTAGCTG\n>KV454486.1/94097-93978 Ascoidea rubescens DSM 1968 unplaced genomic scaffold ASCRUscaffold_12, whole genome shotgun sequence. \nGCAATATTCTACGGGTGCCTCATGATTTTAATTTCTAATTATGATCTATGGCTGAGATTATACCGTCTACTGGAACTCGATCAAGTTAATACTTGCGTGAGGAAGTAATATTGTTATATT\n>URS0000D69B4B_12908/1-89 unclassified sequences c-di-GMP-II-GAG riboswitch \nCGGCGATTGGACACTTTGACCCCCGGGTGCGGGCAGCAGCGGTCACCAGGTTCCGGGGCGAGTGAATGGTGAGACCGGCCAATCTGCCG\n>JH835753.1/1489368-1489540 Erinaceus europaeus unplaced genomic scaffold scaffold00465, whole genome shotgun sequence \nGGCTGGGCTGTTCGCAGTGCAGGAAGCCAGCTGTTCTGAGGGAATCGAGGTGTCACCAGGAGCCTTGCTATTGCAGTGGGTTGTGGTCACAGGCTGAGTCCCAGGGCAGCCTCCATCCAGGCCTCTTGTGCTGAACTGGAGAGCAGCCTGAGGACTGACTGGGGCTCCCAAGG\n>CP004349.1/2893589-2893441 Polaribacter sp. MED152, complete genome. 
\nAACTAGCTTGCATGAGCGATAGAAACGACATCCTTTTTATGTATAAATTGGTTCTAAACTTTTTTTAGATAGCTTTAACCTTATAAAAAACCAGATACTGATACAAGTTCTGCATAAATAAAAAGATACAGTGAATAGCGCAGTTTTTG\n>LAZP01002266.1/658-335 Ophiocordyceps unilateralis strain SC16a Contig_2342, whole genome shotgun sequence. \nAATTGGGCGAAGCTACCATCTGCTGGGTAATGGCTGAACGCCTCTAAGTCAGAACCCGTGCTAGAAGCGTGGACGATTTTTTCTTGCTTTGCAATTAGAAGTGCAGAAATAGGAAGTCTTCGGGCTTTCGTGTGCCATAAATTTGAGGGTCCTGGTATCTTGAGCGGAAAGGCTTGGGGTACCTGCCTTCGTAATTACAACGAAAATATGCGGGCAAGGGAGGATCTCTTGCAGACGACTTGAATGGGAACGGGGTGCTGTAAGCAGTAGAGTAGTCTTGTTACTACGATCTGCTGAGGCTCAGCCCTATGTTCTTAGATTTGT\n>MTEJ01000052.1/21539-21679 Thiothrix lacustris isolate A8 Ga0073116_1052, whole genome shotgun sequence. \nAGTTTGCAGCGCTGTTTAGGTGCGCTCATTGCGGTGAGCGTTAAACGGGAAGTTGGTGCAACACCAACACTGCCCTCGCAACGGTAAGCAGGTTATGCCAATCTGATAAGTCCGACACCGGCCTGACAAGGCGCGACTCTA\n>LGKD01099238.1/4615-4769 Octopus bimaculoides Scaffold8256_contig_7, whole genome shotgun sequence. \nATAGTTTTCTTGAATTCCTGGGGTTTGCTGAACCCAATCAGAGACCATCGATATTAAACTGATTTTTAGAACGAGGCGAAGAGTTAGGGGCTTGCTCCGCCTTTGTCACGGGTTGGCCTGGTATATCAGTACTTCTAGGATTCAGCCCATCTCCC\n>MKVI01000100.1/16871-16982 Legionella sp. 40-6 scnpilot_expt_750_p_scaffold_1464, whole genome shotgun sequence. \nTGCCTTGGTAGAATGATCGCCTTTAACGAATACTAAGTAGTTCCGGGAGTGAAGAATGTCGCTAAGTAGCGCAGATAAAGCAGCAATTGTAAATGAGTTCAAGCGTGATGAC\n>LBRP01000004.1/36699-35151 Parcubacteria (Nomurabacteria) bacterium GW2011_GWF2_36_19 US08_C0004, whole genome shotgun sequence. 
\nAAAGTATCTCTGGCAACTGTTTATCAAAAACACAGCTCCCTGCGAACTCGCAAGAGGATGTATAGGGGGTGACACCTGACCAATGCCAGAAGGTCAAATATCGGTGGTGCATGGTCGCAAGATTGTGTGCTGGCTGATATAAGCCCTGGTGAATGTCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAGTACCTTGTCGGGTAAGTTCCGACGCGCACGAATGGTGTAATGACTGGAGAACTGTCTCGAAGACCTGCTCGGTGAAAATACAATACCGGTGAAGATGCCGGTTACCTGCAGATAGACGAAAAGACCCTAGAAGCTTTACTGCAGCTTGATATTGAGTATATTGTTTTAATGCGTAGCATAGATGGGAGAGGTTTGATGGTTAGGGTCTCGGCTCTGATCTACTCGTCAGTGAAATACCATTCTTTACAATAATATGCTCTAATCTCTAAGGCAAAAACTTAGAGAGACAGTATCTGGTGGGTAGTTTTACTGGGGCGGTATCCTCCTAAAGAGTAACGGAGGAGTTTATTAAGGTTAGCTAGGCGCGAATGGAAACCGTGCCGATAGTGTAATGGCACAAGCTAGCTTAACTGTAAGACGTACATGTCGAGCAGATACGAAAGTAGAACATAGTGAACCGACATTTCGCATTAGATGCGGATGAAGATTAACGGATAAAAGCTACTCTAGGGATAACAGGCTAGTTCCGCCTAAGAGTTCATATCGACGGCGGAGTTCGGCACCTCGATGTCGGCTCACCTTATCCTGGTGGTGGAGAAGCTGCCAAGGGTTTAGCTGTTCGCTAATTAAAAAGGTACGCGAGCTGGGTTCAAACCGTTAAGATCATAAACGATTGTGATTTTAACAGTTTGAACCGTCGAGGAAAGTAAAGAAATCTCGTATATTTCTTTCAATGTTTTAATCTGAGATTAAGACCGCTATACACAGTTGTGTATATCACGGCGGCCCCGCCAATAAAACGACGGGGAGAATTTCACTTATATCGGTGAAGTCCTACTTTTATAAAAGAGGATAATACCGAGGGAAGCGTAAGCACCCGTAGAGACTAAATGTGAAATATTTTTTGAGAAATCAAAAGAGAAAGTTATAGTCCAATCCCACAAGTAATTGTGGTTCCCATTTTTGTATTTAAACGCGCAAAAATGAAGAGACTAAATCATTTTTAGTAAAAAATGATCGTCCGAACTTTTGTTTACAAAAGTTTTAGGAAGTAAAATATAGATGCGTGAGACAGGTTGGTCTCCTATCTACTGCAGGCGTTGATTCTTGAGAAGATCTGCTCTTAGTACGAGAGGACCGGAGTGGACTGACCTCTGGTGTGTGGGCTCTACTGCCAAGTGGACTGCCCAGTAGCTATGTCGGGAATGGATAAGTTCTGAAAGCATCTAAGAACGAAGCCAACTTCAAGATGAGGAATCGTTTGAGAAACCTAAGAGATGATTAGGTTGATAGGCACTAGGTGTACAGACAGTAATGTCTTTAGCCGAGGTGTACTAATCGTTCGATTCCTATTAGGAA\n>CM000244.2/78118522-78118698 Rattus norvegicus chromosome 14, whole genome shotgun sequence. \nAGCTTTGCACAGTGGCAGTATCGTAGCCAATGAGGTTTATCTGAGGCGCGATTATTGCTCATTGAAAACTTGCTCACAACCTCCGGTTCCCCCACACACACATACACACTATAAGCCCAGTATCGATGAGCTGTGCCCTGTCCCCTGCGTGCCTCATTTTCTGGCCCACAGCTCTGT\n>CH476646.1/112655-112774 Sclerotinia sclerotiorum 1980 scaffold_26 genomic scaffold, whole genome shotgun sequence. 
\nGGTCGTGTGGTCTAATGGTTATGATATCTCGTTCACAAACATGTGTTCATCAATTCTGATTTCGATTGTACCCGTTATCTGATTCCGAGATGGTTCCCAGTTCGATCCTGGGCACGATCA\n>MLBF01000159.1/890-1 Desulfosporosinus sp. OL contig00159, whole genome shotgun sequence. \nCGACTGGAAGAGCACGTCCAAGCAGTGAGGCTGAGTTTACAGGCAAATCCGTAGACTTAAGGCTAGGCTGTGATGGCGGGAAGGAATTATAGTACCGAAGTCACCGATCTCATGCTGCCAAGAAAAGCCTCTAGTGAGGAATGGGGTACCCGTACCGTAAACCGACACAGGTGGGTGAGGAGAGAATCCTAAGGCGCTCGGGAGAACTCTCGTTAAGGAACTCGGCAAAATGACCCCGTAACTTCGGGAGAAGGGGTGCCTCGATAGGGTGAAAGCCCGAGGAGGCCGCAGTGAAAAGGCCCAAGCGACTGTTTAGCAAAAACACAGGTCTCTGCAAAACCGTAAGGTGAAGTATAGGGGCTGACGCTGCCCGGTGCTGGAAGGTTAAGGGGAGAGGTTAGCGTAAGCGAAGCTTTTGAACCGAAGCCCCAGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCAGGTAAGTTCTGACCCGCACGAATGGCGTAACGACTTGGGCACTGTCTCGACGAGAGACCCGGCTGAAATTGTAATACCTGTGAACGATGCAGGTTACCCGCGACAAGACGGAAAGACCCCATGGAGCTTTACTGTAGCCTGATATTGAATTTTGGTACGATCTGTACAGGGATAGGTGGGAGCCAGAGAAGCCGGACCGCTAGGTTCGGTGGAGGCAATGGTGGGATACCACCCTGATCGTATTGAAATTCTAACCTACATCCCTAAACGGGATGAGGGACCGTGTCAGGTGGGCAGTTTGACTGGGGCGGTCGCCTCCTAAAGAGTAACGGAGGCGCCCAAAGGTTCCCTCAGAATGGTTGGAAATCATTCGCAGAGTGTAAAGGCAGAAGGGAGCTTGACTGCGA\n>DF087494.1/2012-1880 Oryzias latipes DNA, scaffold4344, strain: Hd-rR. \nGGCTTAATTTGACTCAACACAGGAAACCTCACACGAAGGATTGACAGACTGATAGCTCTTTCTCAATTCAGTGAGAGGTGGTGGAGTGATTTGTCAGGTTAATTACCCCTTGTGCTATCTTAGATGACCCCAC\n>BA000039.2/1466104-1465982 Thermosynechococcus elongatus BP-1 DNA, complete genome. \nTTGGCGACGTTCACTGTGAGAAGCAGCCTGTAGGGAAAATCCAGTGCAAGTCTGGTGCTGTGCCGCAGCTGTGATGGGAATCTTCCCTCAGCCAGAATGCCTACTTGCTGTGGTTCACTCTAT\n>LCPG01000034.1/4881-5287 Parcubacteria bacterium GW2011_GWA1_48_11b UY24_C0034, whole genome shotgun sequence. 
\nTGAGGGCGTAATAAGAGCGTATGGTGGATGCCTTGACACAAAATGGCGATGAAGGACGTAGCGTAGCTGCGAAAAGCCCCGGGGAGGTGTGTAGCAACCTTTGATCCGAGGATATCCGAATGGGGAAACCCTCCGCGGTAAACCCGCGGAACCAGTGCGTTGCACTGGAATGACTAATTCCTAATTGACCTAATTCCTAATCAATTTCTAATGCCGAAATGTCCAATGTCTAAAATTATTTTAGTCATTGGCTATTAAATCATTGGGGGTTTATTTAGAAATTAGAAATTAGAGCTTAGAAATTCCACTGCAGCGCAGTGGCGTGGTAGGAGAGCATTCTTAATGCTGCGAAGGAGGATCCGCGAGGACCTCTGGAGCGTTAAGAAGAGAGAATGTTGGTATGAGTA\n>JPKY01000002.1/344887-343367 Acremonium chrysogenum ATCC 11550 scaffold2, whole genome shotgun sequence. \nCAATGCGCGTCGCCTCCCCCACAGTCCTCCGATTCTCGTTTTCCGCAAGGAATGTCTATCGTAGACCCCCCTCACAGGCTGGTTTGCCCACGGTGTGCCGCTCTCGAGCCTGTATCAGGACCTCGCTGCCAGCCGCATTTGGATTCACCGTGGTCTCTTGCCGTCGATTCCTCGAGGTCCAGCCTAGCCCGGGGGAACGATGTTTCGGAACTTAACCCTAAGTATACACGTGGTTTTCAGTTTTGCGCTCTTGTCGTTCGAACCGCCTTCTAAGTTGGCCGGGTTGTACCAGGAGACCGACACCGCTGAATAAGCGGAAGGCTGAACGGAACACCTACGCCGACGGACTGCCGGGGAGGACAGCCCAGTCACCTCACGGTGCGCAAGAGGGGGGATGCCATGAGCCGTATCGGTAAGAGCCTCTGGTCTGAGGACGCTCGTCGGCCCTGCCCGCTGGAACTAGCACAATGGTCAAGAGTAGGCCGTCCAGGAGGTGCTGTCGGTTTGAGGGTGCGGAAGTTGCTGGTCTGCTATGAGCTTGACCTCCGGGTCGAGCCTTGGCGGCAAAGGCGTCGGAAGTACGAGAAGAGAGGGTTTGAGCACAGAACTGGCCACAAACAATCAGCCAAGCGTTTCGACATTCTCCGCCCTGAAATGCTGCTTTGCCGGAAAGCCCACTTGCCCGCGAGCCAGTTGGGTTGCAAGGACTTCAGGCTACACACGGAAACGAAAACGGCTGATCATATCCTTCGCCATTCTGCGAAAGCTCTCGGTACCCTCAAACTCGTACAAGTCCCGTCGTCGCTGTTCATGGCAACCACTGCAACCAACCTGCACTTCTTCCCGTGGCTCCCTGTACCGCACCACAGCAGTAGCTACCGGTGTGTGATGCTGGTTGCATCTGGCCTGGCCAAGCGCATTAACGTCCGGCCGTAGGCTCCGTCCTGCGGCTCAGGAAGGCGCCAGTCACTTGTCGCGGTCGTCCCGATTTGCGACAGCTCCCTCCGGTTCGCACTCTTGTGGTGTACCTGGAGACGATAGCTCGGCTTTTATGGATGTCTTTTGGCCGTGCGGAATGCCCTCCTTGCTCGCTCTGTGAAGAGCATCTGGAGAGGAAATCAAAAACCAATCCTTGTTGGCAGCGCAACACAAACAGAAGGAGCTCTCGGTACCGGTCCTGGACTCTTGGAAGGCTATGGCGCGACTGCGCGGAAAACATACGACGGCATCGGGATTTTGCGATACTTGTTTGGGAGAGGCGATACCGGTACATAGGCACTGGCGTCTCTGGGTGCTTATTCCTCGTCACGATTGCTTGCATCACTGGGACCCATCTCGTGTTGGAGTCAAAGTTTCGTACTTGTCCGGCGGTGTTGGTACTGTGGCGTAAAGGACCTGCTCCCAGGATCCTAAGCCTCGTCCCGTCCTTTCATATTGGATCAAGGGGCAAGCCAAGCAGGGAGGCAGCCCCGGCTGTCCTC
GTGCCTGAAATGGTGGGAGGACAGCCCCCCTATGGTGAGG\n>CP010557.1/4001542-4001177 Raoultella ornithinolytica strain S12, complete genome. \nTATGGCCGGAGCAGGGGTGCGAGCAGCAAACCTGTCGCAGTTCCTCGAAGCCGGCGTAAAAGAAGTGCACAGCTCCGCCGGCCAGTGGCTGCCTTCGCCGATGCGCTTTCGTAATTCCAGGCTGTCGATGTCTACGGATGCCGAAGCAGATGAATATTCACGCTATGCCGTTAACGGCGCAGCGGTGGCGGAAATGAAGAGCATTATTTCCGCCTGAGTGCCCGCATTGTTTGCGCGCAGCCTGCGGGCTGGTCAGCACAACGGCTGCGGGCAGAGAGAGAAAACCGTTTTTTGCTGCACATCATGTCGCCCAATATGATGATTGCCCGTACCAGGCCCCTGCAATTTCAACAGGGGCCTTTTTTT\n>ALWZ043173632.1/1-308 Picea glauca, whole genome shotgun sequence. \nGATGGGGAATCCTTGTATCAAGGGTGCACTCTGCATGAACATCGAAAGAGAATTGGGTTAATATTCTCGAACCGGGACATGGTGGTGGACGACAATGTTAGGAAATCTAGAGATGTCATCGGGGGCCTGGGAAGAGTTATCTTTTCTTTTTAACGACTTTCCCACCCTAAAATCAGTTCAAATGGAGATAGGGTCTGTAACCTACCCACTACTTAAATCAAATTTTTCCAGTCCTCTGTCAGACTCGATCTCCTAAATAACCACAGAGATCCAACGTAAACTAGCTCTTTCTATTTTCTTCCCCATTC\n>JJMO01001155.1/572062-572450 Vigna radiata var. radiata cultivar VC1973A scaffold_43, whole genome shotgun sequence \nACGAGGAAGGGCGTAGTAAGCGACGAAATGCTTCGGGGAGTTGAAAATAAGCGTAGATCCGGAGATTCCCGATATAGGTCAACCTTTCGAACTGCTGCTGAATCCACGGGCAGGCAAGAGACAACCTGGTGAACTGAAACATCTTAGTAGCCAGAGGAAAAGAAAGCAAAAGTGATTCCCGTAGTAGCGGCGAGCGAAATGGGAGCAGCCTAAACCGTGAAAACGGGGTTGTGGGAGGGCTATACAAGTGTCGTGCTGCTAGGCGAAGCAGCATAGAATGCTGCACCCTAGATGGCGAGAGTCCAGTAGCCGAAAGCATCACTAGCTTACGCTCTGACCCGAGTAGCATGGGGCACGTGNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN\n>HG722747.1/1-1525 Eimeria necatrix Houghton genomic scaffold, Enh_scaff2711 
\nAGTGACTGACTATACTCCCCGAGGAAGGTAGGCTTTTCGTGGGCTGTTATAGCCTCTGGGTTTGTGTTCAGTTGTTCACTGAGGTGTGTTTTGTTTGCGTTCGTCAGCTGCACTTTCGAGTACTGGCGTTCTGCGATGCTGTCCTTAACGGTTTCAACCGACCCGTCTTGAAACACGGACCAAGGAGTCTAACATATGTGCGAGTATGCGGGCAGAACCCCTGTATGCACAATGAAAGTGAGAGTAGGGAGAGGTTTTGTTTTTTTGGCAGGCCTCGCACCTACGACCGACCACGAGCTTTGCGAGAGGTTTGAGTTGTAGCACATCTGTTAGGACCCGAAAGATGGTGAACTATGCCTGAGTAGGGTGAAGTCAGGCGAAAGCCTGATGGAGGCTCGTAGCGATACTGACGTGCAAATCGTTCGTCAAACTTGGGTATAGGGGCGAAAGACTAATCGAACCGTCTAGTAGCTGGTTTCTTCCGAAGTTTCTCTCAGGATAGCTGGAGTTCAGTTAGTTTTATCAGGTAAAGCGAATGATTAGAGGCCTCGGGGGCGCGTTGCCCTCGACCTATTCTCAAACTTTAAATGGGTAAGATCCAGCGGTTACTTCACTGAACTGCTGGGGTTAATATGAACTCCANNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTAGGGTTGACTGGTTGGTAAAGCTTCCTGGCTTCCAGGGAGTCCGGTGCGCTCCTGACTGCCCTTGAAAAGAGGAGGGAAAGTTGTTATTTGCACCCCTGGCCGTACCATTAACCGCATCAGGTCTCCAAGGTTAGCAGCCTCTGGTCGATAGAAGAAAGTAGATAAGGGAAGTCGGCAAAATGGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGGCTGGGTGCATAGCGCCAGTGCGTTCTTCGTTGGTCGGAGCTGTGCGGGCCCGTTCGTGCTTCGCGGCGCGTCTGTGGACCGCCGGCACTGACTGCGTTGTGACCCTTGGTCTGCGTGCACAGTGAACAGCTAACTCAGAACTGGAGCGGACAAGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGCCGCAAACGGTGTTGACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAATGTGATGAAATTCAACCAAGCGCGGGTTAACGGCGGACGTAACTATGACGTGGAAAATTTTGCTTGCTGGGTTTTTGGAGTGAGTGGTCCTCCCCAAAGAAAAAGGAAAGAGATAGTTTGTAGGGAGCCTCAGCTCCTACGGCACGCCCAAAGTCTAGGGCCAACCGTTTTCACTCGCCATAACATACATCTACTACCGAGAGTGACTAAGTATAAGTGCATCATTTGTGTACTATTCACTGCATGTTGGCTGTGCGAGAGCGATTTCCTCCTCGCGCCCGCCTTGATCCATTGTCAGCCACGTGAAAACCCCAGAT\n>AVBC01000026.1/54293-54503 Halomonas huangheensis strain BJGMM-B45 contig41_scaffold4, whole genome shotgun sequence. 
\nTGAGCGCACACCGTCTCGGCTTTCCCGCAGATGTGTTGGGGTGAAACGGGAAGTCGGTGATATTCCGACGCTGCCCCCGCAACGGTGATCGAGTTAAATACGGCCCATGAACGCCACTGTGTACTGCATGACAGTCACGGGAAGGTGGTCGTATCCAACACCCTGTGTTGACTCGTCAGCCCGGAGACCGGCCTGAGATTCCATGCCAGGG\n>URS0000D67C52_12908/1-206 unclassified sequences RAGATH-7 RNA \nACUAUACCGCUUUAUUAUGCACAAAUAAAGUUAAAGAUUGUAUAGUAAUCCACGUGGUAGAGGCACAGUUAGGUUCGCUGUGGUGCAACUCUUAGUAGCAACUAAUCUAAAGCAAGUAUGGGAGAAUAGGUUUAAACUAUUUUUAGGUAGUUAAAAAUACGUAAAAUCCGAUCCUAAUAAGGUAGCAUGAUAGUAUUAGUGCAGAU\n>CM000812.5/30921558-30921482 Sus scrofa isolate TJ Tabasco breed Duroc chromosome 1, whole genome shotgun sequence. \nGCTGTACATGATGACAACTGGCTCCCTCTACTGAACTTCTATGAGGAAACTGCCATGTCACCCTATCTGACTACAGC\n>HE717023.1/2219309-2219667 Halobacillus halophilus DSM 2266 complete genome \nTTCCCATAGAAGTACTCTGGAGTTTATTTTTCCGAGTTTCTATGGATTTTTTATGTTCTTATCATCATTTGTGAATTATCACGTATTACGTGTAAGAAGTTTTTAGGAGGATTCATATCATGCAAAACGGTACAGTAAAATGGTTTAACGCGGAAAAAGGTTACGGCTTCATCCAAGTAGAAGGTGGAAATGATGTATTCGTACACTTCTCTGCAATTCAAGAAGAAGGTTTCAAATCTCTAGAAGAAGGTCAAACCGTTTCTTTCGAAATTGTTGAAGGCGACCGCGGACCACAAGCAGCTAATGTTGAAAAACAATAAATAAAATCCAAAGCAGCCTCTATAGAGGCTGCTTTTTTT\n>CM002888.2/48184797-48184945 Danio rerio chromosome 4, GRCz11 reference primary assembly. \nAGACAATCGCGGCTTCTCGTTGGACAAGAGTCTACAGTCTACAGTTACCATTGCACGTTCCCTGGGCAGATGTCTGCGAACTCCCCAAATGTGGGAATCTCGACTGCATAATTTCTGGTAGTGGGGGACTGCGTTCGCGCTCTCCCCTG\n>LXTC01000002.1/1795932-1795468 Metschnikowia bicuspidata var. bicuspidata NRRL YB-4993 METBIscaffold_2, whole genome shotgun sequence. 
\nATGCCAGTATCAATACCAACACCAGTGTCGAATCAATTAATACCAACACTGAATACCAACACTAATGAATAGCTAAACCAGGATAGACACCAACAAATACCAACACTAAAGACCAAAACTAATAAATACCAATACAAGTATCAATACCGATAAATACCAACACCAATAAAAACCAATACCAATAAATACCAATACCAGTACCAACACCAATATCAATACCATTACCAATTCAACACCATTATTGGTATTCAGTTGTAAAAGGTGAAATTCTTAGATTTTCCAAAGACTAGCTACTGCGAAAGCATTTGTCAAGGACGTTTTCATTAATCAAGAACGAAAGTCAGGGATCGAAGATGATCAGATAGCGCCGTAGTCTTAACCATAAACTATGCTGACTAGGGATGGGGCGACGCCTCATGTAAATGACAGGCCCAGCACCTTACGAGGTATCAAAGGTTTTGGGTT\n>AVOS01044062.1/5145-5403 Chaetura pelagica isolate M959 contig44062, whole genome shotgun sequence. \nCATTAGGGAGGGAGAAGATCATGCTTCATTTCAGACCTGCTTCTCGGTTCAGGATTTTGTGAGATTTGGTAGTTTAAATTTTTTTTTATGTCTTATTTGTCAGCTACACTGACTGGCTCAGCTTGTGTCTGCCCTCTGCCGGCAGGCATGGGTAACCCATTGAACCCCATTTGTGATGGGGATTAGGGATTGCAATTCTTCCCCTTGAACAAGGAATTCCCAGTAAATGCGGGTCATAAGCTCGCATTGATTAAGTACC\n>GL433863.1/231672-231585 Chlorella variabilis unplaced genomic scaffold CHLNCscaffold_29, whole genome shotgun sequence. \nGCACCTATGGTGTAGTAGGTTATCACACTCGCTTAGTAGTGCTCTGTTGAGTAGCGAGAGGTCTGCGGTTCGAATCCGTGTGGGTGCA\n>LCQF01000020.1/16551-16970 Parcubacteria bacterium GW2011_GWA2_49_9 UY50_C0020, whole genome shotgun sequence. \nCTGATGGGAAACAAGGGCGTATGGTGGATGCCTTGGCTTAAGAAGGCGATGAAGGACGCAGCGTGGCGGCGATACGCTCCGGGGAGGTGCCGAGCAACCTTTGATCCGGAGGTCTCCGAATGGGGAAACCCTTCCGTGTAAACCACGGAAGCCGTGTCTTACACAGAATGTCTAATTTCTAATTAACCTAATTCACCTAATAAAATTCCAAATACCAATACCAAATATCCAAACCGGACTTTGTGATTGAGCATTTCTTTACTTTGGGTTTTTATTAGAAATTAGAATAATTAGATGAATTAGGAATTCCGCGTAGGACGCGGCGCGTACCCTGGGAAGTAAAACATTTCAGTACCAGGAGGAGTAGAAACCAATAAGTATTCCGTCAGTAGCGGCGAGCGAACGCGGAGAAGCCCAAAC\n>LCPW01000021.1/2447-2376 Candidate division CPR1 bacterium GW2011_GWC1_49_13 UY40_C0021, whole genome shotgun sequence. \nAGCGCGGAAGCCGAGTGGTGAGGCGGACGGGCCGCAACCTGTCGGATGAAGGTTCGAATCCTTCCCGCGCTT\n>JXRR01000014.1/312777-312893 Jeotgalibacillus campisalis strain SF-57 contig00014, whole genome shotgun sequence. 
\nAACCTTTTTAATTAAAGTCCAGAGAGGCTTTCAAAAGGGAAGAGCAGCTGCCGCTAAATGTGATGCAGTGTATCTTTTGAACACCTTTTGAGGGCTTTTCTCAAAAGGTGTTTTTTT\n>JH207677.1/46913-46403 Pelodiscus sinensis unplaced genomic scaffold scaffold782, whole genome shotgun sequence. \nGTTTTCACTTTTTTTGATTGTATCCCTTTCGTATATACGGTCATGCCAATTTTCTTCCACAATTTCATCTGAGGAAGTGGGTCTGGCCCACGAAAACTCATCACCTAATAAACCATCTTGTTAGTCTTTAAAGTGCTGCATAGTCCTGTCTTTTGTTTGAGAAAAAAAAAACAGGTTCCAACTAAAGTAAAAAGTTTGGGAAACCCTGGTCTAGCCAGCTTTCTCTCCATCTTACAGTCCATTTATCCAATCCATACTCCCTTAACTTGCTGGCAAGGATATTGTGGATGACCGTATCAAAAGCTAGAGGTGAAATTCTTGGACCGGCACAAGACGGACCAAAGCGAAAGCATTTGCTAAGAACGTTTTCATTAATCAAGAACGAAAGTCGGAGGTTCGAAGACGATCAGATACCATCGTAGTTCCGACCATAAACGATGCCGACTCACGATCCGGCGGCGTTATTCCCATGACCCTCCAGGCAGCCTACAGGAAACCAAAGTCTTTGAGT\n>URS0000D6955D_12908/1-88 unclassified sequences c-di-GMP-I-GGC riboswitch \nGUUGAAAAAGGUACACUAUCCCAAAGGGUAGGCCGCGAAGUUUUGGGUCUAAAUCACUUUUAGUGACAUGAUUGCCAAGCUGCCGAUU\n>CAWC010010349.1/2261-2560 Onchocerca ochengi, WGS project CAWC01000000 data, contig: 07842_10349 \nTAGCATAGATCCGAAAGATGATGAACTATACTTGAGCAGGATGAAGCCAGAGGAAATTCTGGTGGAAATCCGAAATAATTTTGACGTATAAAACGATCGTCTAACTTTGGTATACAGGCGAAAGACTAATCGAACAATCTTAGTAGTTGATTCCTTTTGAATTTTCCCTCAGAATAGCTGGAATATGTAATGAAGCTGTTATATTCGATAAAGTGTTTGATTGGAGGAATAGTGGGACGAAAAATTTTCAGTCTGTCCCCAAACTTTCAAATGAATATGATATTTCGTTTGCTTGAATGA\n>URS0000D6BF5F_12908/1-247 unclassified sequences ARRPOF RNA \nCTAAACCCTACAAGAATATTTTCAAAAAATTTCATCATACAATTTGTGATGAGCTGATAGGCACTAATCAGTCCAAGTCTTTTAAAGGTTGGTAGGAATTGTTGCAACGTGAGGACAACGGAACAAAGGTCAGGTGGTTTATTGTTTTGGGGTGTCTTTTATACCTTTATAAAACTGAATGTAGGCAGTTAAGGTCGAACACGTGGGCAATAAAGCGTGGATTGTATCAAACAAGTAAAAGGCAAGT\n>CAWC010018757.1/493-342 Onchocerca ochengi, WGS project CAWC01000000 data, contig: 15636_18757 \nTCGTTGCGATGGTAGTCATGCTCAATATGATAAGAACCATTGGTTTAGACATTTAGTTCATATGCTTGGCCGATTATACAATGGTGTGAAGCTATCATTTTCGGTACTATTACTGAGTGACTCTAAGTTAGAAATCCTTCTGCACATGATGA\n>AASG02003498.1/19751-18974 Ricinus communis cultivar Hale ctg_1100012349913, whole genome shotgun sequence. 
\nTACTTGGTTGATCTTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTGTAAGTATGAACTAATTCAGACTGTGAAACTGCGAATGGCTTATTAAATCAGTTATAGTTTGTTTGATGGTATCTGCTACTCGGATAACCGTAGTAATTTTAGAGCTAATACATGCAACAAATCCCAACTTCTGGAAGGGATGCATTTATTAGATAAAAGGTAGACGCGAGTTTTAAGAAACGGCTACCACATCCAAGGAAGGCAGCAGGCGCCCAAATTAGCCAATCCTGACACGGGGAGGTAGCGACAATAAATAACAATACCGGGCTCTTTGAGTTTGGTAATTGGAATGAGTACAATCTAAATCCCTTAACGAGGATCCATTGAAGGGCAAGTCTGGTGCCACCAGCCGCGGTAATTCTAGCTCTAATAACATATATTTAAGTTGTTACAGTTAAAAAGCTCGTAGTTGGACCTTGGGTTGGGTCGACCGGTCCGCCTAGCAGTGTGCACCTGTCGTCTCATCCCTTCTGCCGGCGATGCGCTCCTGGCCTTAACTGGCCGGGTCGTGCCTCCGGCGCTATTATTTTTGAAGAAATTAGAGTGCTCAAAGCAAGCCTAAGCTCTGTATACATTAACATGGGATAACATCATAGGATTTTGGTCCTATTCTGTTGGCCTTCGGGTAAAAGAAATTATGGCACAGCTAAGAGTTGATTGTACTTCGTCAATTAAGAGCATCAGATCTTGCAGTCTAATGAAACCTTAGCAGAACAATG\n>ABGB01000728.1/1246-78 Enterocytozoon bieneusi H348 ctg01_1523, whole genome shotgun sequence. \nTGTGTGGAAGTTCCGGAGCAGATCTTGGAAGTAGTAGCATCATTTGTATGTGCCAATGGAGGCGGGTTTGTCCTTTTAATAGAAGGAAGTGATACGAGCCTAGTAAAAGGGAATATAGTAGATATTCTATATAGATGTACCTATGTGGCGACACGACAGCGACCCCAACGACGTGTGCCGGTGAGAATTTTCCGGGACACCCAGATCTTATGAGCGTCACGCTGAGACTAAGAACGAGTTGGGCGGTGAAAATGAAGGAACATCCTCGTACCGAACCGCAACAGGACTCCTAGGTGAGAAGCCTAAGGCATAATTGTAATGTGAGCAAGGGAAATCGGCAAAATGGATGAAAAACCTCGGGATAATCATTGGCTCTAGCATGCTAGAACTGGGCTTACAAGGGGAATCTGACTGTTTAATAAAAACATAGCTTTGTGTGTACGCAAAGTGAATTCTGCCCAGTGCTTGGGACGTTAAGGAAGTAATTTTAAGTACGCACCTGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCGCCTAATTAGCGACGCGCATGAATGGAGCAACGAGATTCCCACTGTCCCTGCTCACAGATTTGCGAACCTACAGCCAAGGGAACGGGCTTGGGACATGCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGCCAAGCACAGGCCTCTGTGACTATATCGTAGCGAGGTGGGAGAAATGTGTGAGACCACTGACATAGTCGGCGGGGGCACTCGCAAAGCTTGGTGGGGAGTTTGGCTGGGGCGGCACGACTACTAAAACATAACGTAGACGTCCAAAGGTAAGCTCCGAGGGGATGGAAACCACTCCGAGAGTATAAGGGCAAAAGCTTGCTTTAGTTATTAATGTAAATTAATAATACTGGAAACAGGGGCCTAGAGATCCTCTATGAAACTAAGCATAGAGGTGACGGAAAAGTTACCACAGGGATAACTGGCTTGTGGCGGCCGAGCGTCCATAGCGACGCCGCTTTTTGATTCTTCAAGGTCGGCTCTTCCGAGCATGGGGGAATATCAGCCACCAAGTGGTGTGATTGTTCACCAACTTACAAGGGAACGTGAACCTGG
GTTTAAACCGTCCCGAGAAAGGGTAATTTTTACCCTACGGCATTCCCTT\n>CP006019.1/170272-170332 Palaeococcus pacificus DY20341, complete genome. \nACCGGTGATGACTTTGCAGGGTAGCTACTGAAATTGATGAAGAAGTCGCTCCAGTCTGAGG\n>LDJP01000070.1/64830-64953 Stenotrophomonas daejeonensis strain JCM 16244 contig_70, whole genome shotgun sequence. \nCGATGAAGGCGAACAGCTTCCAGCACGAATCCAGCGCCGCCCGGCAGGCCACCGGCATGACCTCGCGCGCGCGTCGACCGGAACCCCACATCCTCGCTGGGTAACCGGAGCTTCGTGCTGTCTG\n>CP001043.1/1023491-1023327 Burkholderia phymatum STM815 chromosome 1, complete sequence. \nATGAGTGCCTGTTCACATACTTTTTTCCGCAGTTGCGCTGCAGATCGCGTAGTCGTCGTCGCTGACCACAAGGCAGTGACAACGGCAATGAAGCGAGCCACGAGGCGCCATGCGATGACCGAAGTCGAGCCGCTTGCCCCGGTTGCCGGGGCGGCGGCTTTTTTA\n>URS0000D6A032_12908/1-68 unclassified sequences type-P1 twister ribozyme \nAAUUUAACCUCGCCUUAUUAUUUAAGAUAAUAUGCUGGUGACAAGCCCAGAUAAAGAGGGAGUCAAAU\n>MHIB01000050.1/15016-14517 Candidatus Buchananbacteria bacterium RIFCSPHIGHO2_01_FULL_39_14 rifcsphigho2_01_scaffold_9139, whole genome shotgun sequence. \nCAAGTAAGCAAGGTGGTCGCCCCCTCACTTGGTCCGATGATTAGTATTTAGGAAACATAAATACCTTATATATTTAATCATTAAGCCAAGTGAGGGGGAGGAAAGTCCGAACACCATTCCCGATTTAATGTCGGGGTAAAATGGCAACTCCTAACGGGAGCCGAGAGTAACAAAAGAGTAGAAGCGCTTAAGACTTCTGCACTTTTGCCAAGCTTAGGGCAAGTGCAACAGAAAATATACCGCCTAAGTCCTCCGCAGTTGCGGTGGAACGGTAAGGTTGAAATCGTGGGCCCACCTTTGGGTGGGATACCCTCGCTTCGGCGAGATAAAGTAAGAGCCCACGGCCGACAGACTGGTAACAGTCGGGTTGGTAAACTCCTGCCTGGTGCAATGCCAAATTAGGTAGGCAGCTTGATCCCGACGGCAACGTCGGGACCAGATAGATGACCACCCCCCTTAAAAGTGGGTGACAGAATTCGGCTTATTAGCTTACTTGGATA\n>AFTD01027444.1/26113-25813 Cricetulus griseus cell line CHO-K1, whole genome shotgun sequence. \nGGATGGGAGGGCCATATAGCTGTAGCTCCTTTCATCTCATTGACTACCAGGACTGATTTGGTTGGTCTGACTGGATTGATAGGTGTCCCCTTCCTCCCTTGTTGTGCATCTCTCTGGAAGCTGTTTGCTCAGCTGGTCAAAGAGGATGACTTTTCCCTTAATAGAGGACCAGTCTTTGGTCAAGGGCATACAGGTAACTACCACCTCTGTTAAAAGCTCCAAACAAGCACTCAAGAGCCTGCCTATATATTTGAAAGAGATCAGACTTTGCCTCTAGGTGGTGCCTTGAATGGCTGTAAGA\n>NGMM01000004.1/415496-415725 Enterococcus sp. 
9E7_DIV0242 scaffold00004, whole genome shotgun sequence. \nAAATAGACAGAGAGCAAGAGGAGTACTGTCAGCGGGATTTTTAGAGAGAAAATCGGCTGGTGAAAGATTTTACGATCCTGACAGGAAGGTAGCTTGTGAGTCAATCATTTGAACAATTTTCAGTAGGGTGGTTCGAGTCGTGATCGTTATCTCACGTTGAATGAAGAGGTAATTGATTTATTTGATCAATTACAAATTAGGTGGTACCGCGTAGTATTTACGTCCTAAAA\n>HF991826.1/221174-221022 Clostridium sp. CAG:678 genomic scaffold, scf125 \nATCAACTACTCAGTACTAAATAATTGAGCCTATCTCAGTAACAATGGTGCGTTCGTTTGAACAAGTTGACTACCCTAAGTCTTGAAACAGAGGCTACGTTATACAAGAATATATAGTCACCGGTGGGCATTTGCCCTAACCTGCCGCTCTGAG\n>LK878649.1/3737-3610 Ascaris lumbricoides genome assembly, scaffold: ALUE_scaffold0006683 \nTTACTAACCTTCATGGCGAGGCTTGGTCATTGCACTTTCGACCAGGCTGACCCGTGTGGCAGTCCCGAGTTGGGATTGGCCAACAGCATAATTTTTGCGTTTGGGGACAGCGTTCGCGCTTCCCCGCT\n>ALWZ041214672.1/20-119 Picea glauca, whole genome shotgun sequence. \nATATTTTTAAAAATTAACGTGATAGTACAATTAAGCATGCTCGAGACAGAGTAGTATTAGGATGGGCGACCGCTAGAGAAGTCCTAGTGTTTTACATGTC\n>JH601103.1/54151-54248 Dolosigranulum pigrum ATCC 51524 genomic scaffold supercont1.1, whole genome shotgun sequence. \nGAAGCACAAATCTGAGCAAGCGGTGAATAGGTGACTATTCATGCAGCCCGGCTACTAAACGTAGCAGCAGAGTGTTAAGGCACATCTGTGAGACAGTT\n>LVLJ01000773.1/73947-73799 Marchantia polymorpha subsp. polymorpha scaffold3569, whole genome shotgun sequence. \nATCTTTGCGCGTGGGGCAATGACGCAGTTAGTGAGGTGAAACCGAGAGACGCGTCAATTGCTGGTTGAAAACTATTTCCAAACTATTTGCATACTACGAGTTCGTTTTAGTGCAATTTCTTCTTTTCTCCCTTACAAAAGCGTAAGAAA\n>AGUA01000030.1/104638-104479 Staphylococcus pettenkoferi VCU012 contig00012, whole genome shotgun sequence. \nGTAACAAGGGGATAACGAATAAGGTGATTTAGGGGTAGGCTATTACATAATATAATAGTTACAATCTCTTGTTCGTATGCGTTACTATTCAAACATCTTCAATATTTATTACTTACTTTCCTTTCTATTTGCCGACTAGCGATGACTAGTCGGTTTTTTA\n>JH205222.1/90660-90343 Pelodiscus sinensis unplaced genomic scaffold scaffold192, whole genome shotgun sequence. 
\nGTCTAAGTAAACAAGGGCGTTACAGTGAAACTGCAAATGGCTCATTAAATTAGTTAGGGTTCCTTGGATCGCTCCAAGCCTTACTTGGATAACTGTGGTAATTCTAGAGCTAATACATGCTGACGAGTGCTGACCTCCGGGGATATGTGCATTTATCAGACCAAAACCAACCCGGGCTTGCCCAGCTGCTTTGGTGACTCTAGATAATTTCGGGCCAATCGCACACCTCCATAGCAGCAACGATGCATTCGAATGTCTGCCCTATCAACTTCAAGAGATGTCCCCATGGGTACTTCACATCTAAGGCTTCATTTTGTT\n>GG700633.1/173169-173635 Leptotrichia hofstadii F0254 genomic scaffold Scfld1, whole genome shotgun sequence. \nGGCGGGCGAGAATCCCGCCGGCCGGAAGTCCAAGGTTTCCAGGGGAAGGTTTGTCCGCCCTGGGGAAGTCGGGACCTAAGCATAAGCAAAATTGTGATGGCGAATGGAAAACAGGTTAATATTCCTGTACCGCTGTTATCGCCTGAGAGACGGAGTGACGCAGGAAGGTATGCGGGAAGGCTGACGGAATAGCCTTTCTAAGGGCGTAGCATGGGCATGCAGGAAAATCCGCATGCCTAAATGTGAGACCTGACGGGTAAGTGCATCTTGCATAAGCCGCAGATCCTACACTGCCGAGAAAAACTTCTATCGATGAGAGCCAGCGCCCGTACTGTAANNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTATAGCGGAGCCGAAGGGAAACCCGAGTCT\n>DS990197.1/12350-12464 Ruminococcus lactaris ATCC 29176 Scfld_02_34 genomic scaffold, whole genome shotgun sequence. \nGGATGCCAGGGTCAAAAGGTCTAAACCCACATGAGCTTGCTCATAGGTGGGTGAAAGACCTTAGGACCCGCCCCGATATGAGCATCAAAGTCGGGGGCTTTTGACCCCGACATCT\n>CM003380.1/18255055-18254968 Vigna angularis cultivar Jingnong 6 chromosome 10, whole genome shotgun sequence. \nATGAATGCTGATGCATGCACTGGGCTCTGAGAAGTTTTAACCTCAACTTTTGATGAAAATGCACGGCCTTGAAAGCTATTTCTGATAC\n>CP000673.1/1358718-1358907 Clostridium kluyveri DSM 555, complete genome. \nTATGTGGCAGTGAATAGAAGAAGTAAATATATTCTTATATGTAAAGAGAGGAAGTAGAGGGTGTAAAGCTTCTCATATGAGGTTTATTGAAGGCTGTCTAGGAGCCTATTATGGTGTTTGAGAGATATGGATTTTATAATTTTAAATCTATATAATTAGGGTGGTACCGCGAAAAACTTTCGTCCCTTTT\n>MKSM01000113.1/13291-13495 Nitrobacter sp. 62-23 SCNpilot_cont_300_bf_scaffold_662, whole genome shotgun sequence. 
\nCTTGTTTGCGGCGTCATCGGTGCCTCCCGAGGGAGGTGAAACGGGAACGCGGTGCGGGGATATGACCCCAACGCCGCGGCTGCCCCCGCAACTGTAAGCGGCCATCCGCGTCCATTCCGCTGCCGAACATGCCGCGCATGTGAGGAAAATCGGATCCGGATAACGGCCGCGAGCCAGGAGACCGGCCGGCGACGCCTTCGGAGCA\n>CP011125.1/5773983-5773818 Sandaracinus amylolyticus strain DSM 53668, complete genome. \nAAGAGGGAAGCCGGTGAGAAGCCGGCGCGGCCCCCGCCACTGTGACCGGGGACGGCGCGGACGCGGTGCGAGCGCACCGAGTCACCACTGCGCGTGCTCGTCGTGTGAGCGGCGGGGCGCGGCGGGAAGGTGGTCCGCGACGGACGATCCGGGAGCCAGGAGACCT\n>CM009294.1/24125792-24125654 Populus trichocarpa isolate Nisqually-1 chromosome 5, whole genome shotgun sequence. \nTAATTTATTTGGGGAAGATTTTCATCTAGTTGTAATATATTTATATTTGATTGCTCAGAATCATCAGTTATTATAAAATTAACTATATCATTGACCCTTATAAAATATATTTAGAAAAAATTGTTTATAAAATCATGAT\n>ALWZ044874107.1/2364-1677 Picea glauca, whole genome shotgun sequence. \nGGGTTTTTCCTTTTGTGGAATTTGAATTTTTATGTTTTTTAATTTTTTATTATGTTATAATATATATAATTATAACACACACACACACACACACACAATATAACCTTATAATAGTCGACTCAGAGCTATTTCAGACAAGGGGAATCTCACTATTTAATTCAAACAAAGAATTGTGATGGTCCTTGTGGATGTTGACGCAATGTGATTTCTGCCCAATGCTCTAAATGTTAAAGTGAATAAATTCAACCAAGCACGGGTAAACGACGGGGGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGCCATCTAATTAGTGATGCACATGAATGGATTAACTAGATTCCCACTATCCCTATCTACTATCTAGTGAAAACACAACCAAGGGAATGGGCTTGGCATAATCAACACGGAAATAAGACCTTGTTGATATTGACTCTAGTCCAACTTTGTGAAATGAATTGAGAGTTGTATAATGATCCAGATTATTTTTGGCACGAAACGAGAGCGGAGATATAACACAAAAATATTCAGAGATATTGCAAGAGAGACAAAAATATAACAATGATATATCATAAATATAACAAGAGTCACATATATAAAGTAATACATGATTTCTATTAATGAAAGAAATGTACAGAGATTGTAAAAATATAGAGTGAAAGACTTGCTAGAATGGTGGCAGCTT\n>JH835382.1/3324878-3324510 Erinaceus europaeus unplaced genomic scaffold scaffold00094, whole genome shotgun sequence 
\nGGATGTGAGGGCGATCTGGCTGAGACATCTGTCATGTCATTGATCATCAGGGTTGATTTAGCTGGTCTAGATGGCTAGGCAAGTGTCCCCTTCCTCCCTTGCCACTCCATGTGTGTCCTTCCTAAAGACTTTGGGTCTTTGGGACCTATGTGTGCTGGGTCGAAGAGGAAGGCCTTACCAGAATAGTGACTGACCGGTATGCTCGGTAGAAGGTATACAAGTAGCTGTGCTCCCCTGCTAGAGCCTCCATACAAGCTCTCAAGAAAGTTGCAACTGTACTGAGTTTGTAATTGCTTTGATTGATGGCTACTATCTCTGGCAACATTCTGCCTCACCTCAGGCTGGGCTCTCACACAGATGCTCTCTCCT\n>KI930470.1/1116-1201 Candidatus Entotheonella sp. TSY2 genomic scaffold TSY2_scaffold00655, whole genome shotgun sequence. \nGAGAGCCGGATGCAGCGACAAGTTGCATGTCCGGTTCGGAGGGGGTTTGACGCCTAACCTCATGGGCTAGTCGCTTACTACCCTAC\n>AZIM01000385.1/98908-98846 Ophiophagus hannah scaffold386.1, whole genome shotgun sequence. \nAATGGTGTTTATGACATAGTTAGATTAAAGCCTTTGGGAAGTCTAATTGCTGATGTTGCCATT\n>AZFW01000017.1/10903-10974 Lactobacillus harbinensis DSM 16991 NODE_20, whole genome shotgun sequence. \nGCGAATGTAGTTCAGTGGTAGAGCAACAGGTTTTCCAACCTGTGGATGTAGGTTCGACTCCAACCATTCGCT\n>AACY023338535.1/830-742 Marine metagenome ctg_1101668145886, whole genome shotgun sequence. \nTTTCCTTTACACTTCTCAAACCGGGATCAAGAGAAGCAAAGCATCCCTCATATCCACGATGGAGGGTGTCGTGGAGTATACTGTACCAA\n>CAJW011240374.1/263-1 Hordeum vulgare subsp. vulgare, WGS project CAJW01000000 data, contig: morex_contig_1240374 \nCTCGAGCCGAGGTCCGAGTACCAAGCGCTGCAGCGCTGAAGTATGAGCCCCGTGGACTAGCAATTGCTTCTCCACGAGGCTCATACCAGGCGCTACGGCGCTTAAGTATGTAACCGATGCCATACTCCCAGGAAAAGCTCGAACGACCTTCAACAAAAGGGTACCTGTACCCGAAACCGACACAGGTGGGTAGGTAGAGAATACCTAGGGGCGCGAGACAACTCTCTCTAAGGAACTCGGCAAAATAGCCCCGTAACTTCGGG\n>ACTA01130975.1/19881-19796 Ailuropoda melanoleuca scaffold1408_79, whole genome shotgun sequence. \nGATCACGGTGATGGCTGACCAGGGCTCCTTGACCTATACAGACCTCTGCTATGGGGGTGATGGCCAGTCCTGGTGTCTGAGTGATT\n>ABAV01023618.1/749-1 Nematostella vectensis strain CH2 x CH6 NEMVEscaffold_317_Cont23618, whole genome shotgun sequence. 
\nATTGCTGACTCTATGGGAGACAAGGATGACCTAAATTTTAACAGATTAAGAGTACTGTAAGTAATATTTGAAAGGTTTACTTCTAAAACTTGTGATTTAGACTCATAATATATATTACAGAATGGCAAAGTTAAATTAAGAAACAGCAGGAACTTGGTTCCATTGCATCAATAAATTATGCTCAATTCATTTTCAGACAGTCTTGAGGGCCCGTTTCTTGTCAAGAGAATCAAAACTCTTCCAAAGACTGGCCTTCTCAAAACCTTGGTAACCGAAGCCGGACAGTGAATGCGAGTTCCTAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGAACGCGCGGTTAAGGTGCCAAAGTCGACGCTCATCAGACCCCACAAAAGGTGTTGGTTGCTCTAGACAGCAGGACGGTGGCCATGGAAGTTGGAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAAGCAACTAGCCCTGAAAATGGATGGCGCTCAAGCGTCGCACCTATACCGTGCCGTCGGAGCAGATGCGAAGCTCCGACGAGTAGGAGGGCGTGGGGGTCGTGACGCAGCCTCTGGCGCGAGCCTGGGTGAAACGGCCTCCAGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAGCTTTGAAGACCGAAGTGGAGAAAGGTTCCATGTGAACAGCAGTTGGACATGGGTTAGTCGATCCTAAGAGATAGGGAAATTCCGTTGCAAGCG\n>AWWV01004333.1/1226-446 Corchorus capsularis cultivar CVL-1 contig04341, whole genome shotgun sequence. \nGGGCCAAGGGACAGTCTCAGGTAGACAGTTTCTATGGGGCGTAGGCCTCCCAAAAGGTAACGGAGGCGTGCAAAGGTTTCCTCGGGCCGGACGGAGATTGGCCCTCGAGTGCAAAGGCAGAAGGGAGCTTGACTGCAAGACCCACCCGTCGAGCAGGGACGAAAGTCGGCCTTAGTGATCCGACGGTGCCGAGTGGAAGGGCCGTCGCTCAACGGATAAAAGTTACTCTAGGGATAACAGGCTGATCTTCCCCAAGAGCTCACATCGACGGGAAGGTTTGGCACCTCGATGTCGGCTCTTCGCCACCTGGGGCTGTAGTATGTTCCAAGGGTTGGGCTGTTCGCCCATTAAAGCGGTACGTGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCCATATCCGGTGTGGGCGTTAGAGCATTGAGAGGACCTTTCCCTAGTACGAGAGGACCGGGAAGGACGCACCTCTGGTGTACCAGTTATCGTGCCCACGGTAAACGCTGGGTAGCCAAGTGCGGAGCGGATAACTGCTGAAAGCATCTAAGTAGTAAGCCCACCCCAAGATGAGTGCTCTCCTATTCCGACTTCCCCAGAGCCTCCGGTAGCACAGCCGAGACGGCAAGGGGTTCTCTGTCCCTGCGGGGATCGAGCGACAGAAGTTTTGAGAATTCAAGAGAAGGTCACGGCGAGACGAGCCGTTTATCATTACGATAGGTGTCAAGTGGAAGTGCAGTGATGTATGCAGCTGAGGCATCCTAACAGACCGGTAGACTTGAACCT\n>LWDE01000750.1/11196-11290 Tilletia controversa strain DAOM 236426 scaffold_750, whole genome shotgun sequence. \nGACGACGTGCCGGAGTGGTTAACGGGTGCGCCTGCTATTCTTAGCATGTCAGTGTATAGGCTCTGCCTGCGTGAGTTCGAATCTCATCGTCGTCG\n>MGWF01000052.1/10424-10220 Firmicutes bacterium GWF2_51_9 gwf2_scaffold_5678, whole genome shotgun sequence. 
\nGCATAAGCTGTGAACGGGAGTAGTAAACGTCACGCTTCATTCAAGAGAGCCGCTCCTTGGTGCAACGCGGTATGAAGCAACGTCGAACGTGTCCGGGAGCTGGTCGTGCGAAAGTTGAGTGCGATCCGTCGTCGGCGTTAACGAACAGAGTTGCCGGGAGAAATTCCCGGAAGTTAGGTGGTACCGCGTCAATCACGTCCTTTCA\n>CM001219.2/34740290-34740361 Medicago truncatula strain A17 chromosome 3, whole genome shotgun sequence. \nGTGAGTTTAGCCCAGTTGGTAGGGATATTGCATATTATATGCATGGGCCAGGGTTCGAACCCTGAACTCTCC\n>CBUS010004920.1/7915-7704 Eimeria acervulina, Houghton, WGS project CBUS01000000 data, contig: Eah_scaff963_1 \nTGAACGATCCTAAGTATTGCTCCACGAGTGGCAGTTACTCTAGGGATAACGCGTTGATCTCCCCGGAAAGTTCGTACTGGCTGGGAAGGTTGGCACCTTAATATCGGCTCGTCGAATCGTGAGGCTAAAGTAGGTGGGAAGGCTTGGCCTGTTCGCCCAATAAAGCGCCACGTGAGCCGGGATCAGAACACCGCGGAATAGCTCGGTCCATA\n>DS563006.1/382953-382865 Cavia porcellus supercont2_151 genomic scaffold, whole genome shotgun sequence. \nGGGTCAACAATGACACCCCAGCTGCATTCCCTGGAGCTGAATAAAATGGTGCGAACACTAAGCCATCATTCCCAGCAGGCCTGAGGTCC\n>LMSO01000009.1/146994-146864 Arthrobacter sp. Soil782 contig_4, whole genome shotgun sequence. \nGGTAACGAGTGACAGTGCGGCAGGTTCCACCCGCCATCAGCCCCGGCTTGCTGTCCGGCAACCCTCCCTCGCGGCGGGGTGCCCCGGGTGAAGACCAGGCCCTGCATGCAGTGCAGGAGCAAGCGCGATTC\n>BBWW01000001.1/3012297-3012404 Leptolyngbya sp. NIES-2104 DNA, contig: contig1. \nGGAGAGGTTGCTATAGGTAGGGCAAATCGTTTGCTAAACGAACACCTTCGGTGCAGCGAAGCTAGCGAGGATTAATCCCCTCTGTGGGTTCGATTCCCACTCTCTCCG\n>LCQR01000039.1/11318-11692 Parcubacteria bacterium GW2011_GWF2_50_9 UY62_C0039, whole genome shotgun sequence. \nACGCTGAAATAAGCGTCTTGTTGTCCCTTCTATCAGTAATGATAGAATTAGTATGCGGCTTATAACGGTGGAGCGAGAATCGGTCTTTCCTCAAAAGAGGTTTTCGTATTCTCGTAATACCGTGGGAAGTCCCACTACTTAAGTAAAGTGGGACCCCGTAACGACTGGATTCGAGTCCCGCCAACAGGCGAGATAAGATGAAGATAGTGGATGCCCGAGTGCTCGATGTTCGAATAGCACCGCTATAATACGCCGCCTCCAGCCGTAATTTTTGATTGGGCTTTAAGGTTCAACCTTCTTCCCGATTCAAGATTGAACCTTGGAATCAAAAATTACGGCTGGATGAAGATATAGTCTAATTATCGAAAGATAAAT\n>CM001001.2/99651431-99651489 Mus musculus chromosome 8, GRC primary reference assembly. 
\nTGACTCAGTGGTCTGGAGTGATTGCTTTACAAGCAACAGAATCTGAGTTTAGATCTCAG\n>KN847319.1/4624885-4625042 Exophiala xenobiotica strain CBS 118157 unplaced genomic scaffold supercont1.3, whole genome shotgun sequence. \nGGGGATGTGGTCTAGTGGTATGACGTGTAAGCATCGCACCACACAATTGAACGAAGCACTCATCTAATATGACAACAGTTCCTTAGCAGAAGTTGAATCCTGAAAGGATTGCCCACAACATCTGGAAAAGGTTCTGGGTTCGATTCCCAGCTTCTCCA\n>JARO02016333.1/3903-2330 Scleropages formosus scaffold16338, whole genome shotgun sequence. \nTGGTTTTAAGGTGGCGGGTGGACTGGGCCCTTGTGTGCAGCCGTTGAAAAATACGCACAGGGTATAACATCTTTTCCTGTGTCTCTTGAATTTAAATGTCTATTGGCTGGGTCTCTCCAAAGTTCCCCCTCAGAAGAACATTCACTATCTTGTTGTTTTACCTGGTAAAGCAAACTTCTTGAGGTGCTGGGGCCAAAATGGCATGAAGGCTTATTCACATCACCTGAGACTAAGATCTCAATTTTATTCTGATGAGATCCCAGAAGATCCCATAAGATCTCATCTTTATCCAAAATGTTGACATACTCAAACACCTGAGAATCCTCAACAGTTTAGCATTAGTGTCTTATTGCTCTCACCCAGACTCCCCCCCCCCAATCATTTGCCAAGTTGGGCTCCAGAAATGGTTCCCTAAAGGGTTGTTGGAGATATCATTTTTATTTGCAGATCAATCATTGTTGAATTTGTCTTTTAAGAAATAATTTTAATCTACCCAATGCAAACTGTCATTTAAGGGGATGTGGTGGCGCACTGGGTTTGGCCAGGGTCTGCTCTGTGGTGGGTCTGCGGTTTGAGTCCTGCTGGGGGTGCCTTGTGGCAGACTGGCGTCCTGTCTGGGGTATGGTCCCCCCCGCATCATTTAACTTCTGCCCTAGAAAAAGAAGATTATGGTCAGAATTTTAAAAAGTTCAGTAGGTAAGCTAACTAGTCTTGCATATTTGGCAAAGAAATGTACTTTGTGGAATGCAAGTCACCTAGTGGGCAATCTTTGGTATGTAGAACTGGTGCTGTGGGATGAACCAGATGCTAGGTTAAGACACTCAATGCCAATGCTCATCAGACTACAAAAAAAGGTGTTGGTTGGCATAGACAGCAGGACGGTGGCCATGGAACTCAGAATCTGCTAAAGTGTTTTAACAACCCACCTGCAGAGTCAACCAGCCCTATAACTGGATGGCACTGGAGAGTGTCAGGTCCATCGTGGCAACAGGAGCCGCAAAAGCTAGGACATGACAAATAAGACAGCTGCTGCGGTGAGCTATCCTAGAGTGTAGGCTTCAGTGGAGCCACCACAGGTGCAGATGTCGGTGGTGGTAAGAAATATTCAAACAAAAACTTTGAAGGCTGAAGTCCATGTCAACAGCAAGTGAACACGAGTCAGTGGTTGTAAGATGCAAATGATGGTCAGAGGGGGCCGGCAATGGCCTCTATTTCCCCCTGCTAATTGAAAGAGAATCAGGTTGGGACTCCTGAATCTGGAGTGGTGGAGACAGATACCATGAGGCATCCAACAGAGTAACGTGAACAATCTCGGAGAAGCTGGAGAGAGCCCCAGGGAGAGTTTAGCCTCCTTTGTAAAGGGTAGGGTGCCTCAGAAGGAGTTTGGCTGGAGAAAAGGGCTCCAGCCCTGGAAAGCATTACAGTTTCAACAATGTCTAGTGATCTCTTATTGATGTTAAATCTGTGGACATAGTGTAAATCTTGCACCAAGTTGTACTCATATCTGCAGCAGATCTCCCAGGTGAGCAGTCTCACATGTG
TAATGTCAGATCTGTAGCTTTGGGATAAGGATT\n>URS0001A24131_12908/1-50 unclassified sequences eL15-Euryarchaeota ribosomal protein leader \nACGGGAUCCGUCCCGGAGAGGAAUGUGGUCCUUCUGGACUGAACCUAGGU\n>FAOM01224274.1/16511-16416 Triticum aestivum genome assembly, contig: Triticum_aestivum_CS42_TGACv1_scaffold_224274_3B \nAGGAGCCGTATGAGGTGAAAATCTCATGTACGGTTCTTCGTCGTCGTGGAGCTCGTTATGCCAGGGCTCCGGGTGAAAATCTTTGTCTACACGGAC\n>JH835471.1/1830309-1830596 Erinaceus europaeus unplaced genomic scaffold scaffold00183, whole genome shotgun sequence \nGAATATGAGGGTGATCTGGCTGTGACATTTGTCACCCCATTGATCACCAGGGTTGATTCAGCTGACCTGGCCGGCTAGGCAGGTCCCTTTCCTCCTTCACTATTCCATGTGTGTCCCTCCCAAAGCTTTGAGCTCAAAGATGACTGAATAGAGACAGGCCCAGTCTTCAGATGAGAGTCTACAGGTAGCTGTACTCCTCTGCTAGAACCTCCAAACAAGCTCTCAAAGCCCCTAATCTCAGGATGTTTCTTCATATGACGCTATATACTCTTGGGGTAAATCTTCTGA\n>HF997179.1/95514-95443 Ruminococcus gnavus CAG:126 genomic scaffold, scf59 \nGGATACATAACTCAATCGGTCAGAGCGGCAGCCTTATAAGCTGTGTGTCACGGGTTCGATTCCCGTTGTCCG\n>AKWO02000047.1/149928-149814 Leptospira borgpetersenii str. 200701203 ctg1130286793315, whole genome shotgun sequence. \nAAATAGATCAGTATGGACATATCTGGGAGCAAAATGTATTTACTCGAAGAAAAACAAACACAACTGAAAGGGGATCAAACCTTGACTTGCGCAGGATGCAGATCAAAAGTCACGC\n>LFJF01019852.1/9646-11555 Macrostomum lignano unitig_19906, whole genome shotgun sequence. 
\nCCCGCTGAATTTAAGCATATTATTAAGCGGAGGAAAAGAAACTAACAAGGATTCCCCTCTAGTAACGCGAGTGAACGGGGAAGAGCCCAACACCGAATCCCTTGGCGCAAGTCAAGCGGAAATGTGGTGTTAAAGGTAGCCCTTCGTGTCAGTCTAGGCGTCCTCAAGTCCACCTGATTGTGGCTCAAGCCAGAAGAGGGTGTAAGGCCCGTAGAGACGCCTCCGACTGATTCCTGGGGTTTACCCTACGAGTCGGCTTGTTTGGGAATGCAAGGCCAAAGCGGGGTGTAAACTCCATCCAAGGCTAAATACTGGCACGAGTCCGATAGCGGACAAGTACCGCCGTGAGGGAAAGTTGAAAAGAACTTTGAAGAGAGAGTTCAATAGTACGTGAAACCTGCTTAGAGGCAAACGGATGGTGGCTCATACTGGCCTGAGGAATTCAACTGTGACGGGGCTGGACGAGCTGGCGTTCCGATCTCTTCTTTTGGGACGGGCGTCGGTTTGGCTATCAGGACTCTGACATGGTGCACTTTCCTTGGTGCCTCCGCCGACGACCGACGACACTGGCTACCCCGCGGCTCGGGGTAAGGTGACAAACCTGCTTCGGCATTTGTGTTATAGACCCCGGGGCGTCGGACATGGTTTGGCCAGGACGTCGAAGCTTGCGGCGCCCGCTCGCTTGTGGCTCGCATGTTGGCTACTTGGCTGCGCCGATGCTTGCACTGGAGACAACCAGTACAGGTGACGGTTGTGGTCTTGTCTCTAGTTGGCCTCTGCGAGTTTGGCGCCTATAGTCTGTGGTGTACTTGTGGGTAGACTCTATCCGACCCGTCTTGAAACACGGACCATTGAAGGAGTCTAACATGTGGCGCGAGTCATGGGGATTCTACGAAAACCCAAAGGCGCAGTGAAAGTAAAGGCCTGCTTCTCGTAGGCTGAGGTGGGATCTCGTGGCATCGCATCGCGATTGGCGAGCGCACGCACCGGCACCGTCCTATCTGTCTCTGTCAGTGGGGCGGCGCAAGAGCGTACACGTTTGGGACCCGAAAGATGGTGAACTTATGCTTGCGCAGCTCGAAGTCAGTGGAAACACCTGATGGAGGAGCGCAGCGTTTCTGACGTGCAAAAATCGATCGTCCAAAACGTGAGTATAGGGCGAAAGACTAATAAGGGGGCGAGACGTCATAAGTAGCAACCATCCTTGAGCTGGATTCCCTTCCGAAGTTTCCCTCAGGATAGCTGGCACTGCGGGGAAAACAGTTTTATCCGTAAAGCGAATGATTAGTAGGCATTGGGGGTCGAAAACGACCTCGACCTATTCTCAAAACTTTAAATGGGTAAGGATGCTCGTCTCGCTTAATTGGAGGCGGGCTTCACGCTCTCTAACGTGAATGTGAGTGCCCAGTGGGGCCATTTTGTTGTAAGGCAAGAACTGGCGCTGTGGATGAACCAAACGCGGCGTTGAAGGCGCCCAATGCGGACGCTCATGAGACACCACAAAAGGTGTTGGTCGATACTGACAGCAGGGACGGTGGCCATGGAAGTCGAACGGCCGCTAAGGAGTGTGTAACAACTCACCTGCGCGAATCAACCAGCCCTGAAAATGATGGCGCTGGGAAGCGTCCGGCCTATAGGATCGGGTTGACCTGGTGTGACTCGATGTGGGGATAGGATAGCAGACAAACTAATCTTGTAGGTATGTCCACTAACGAGTAGCGAGGGTAGCCGTGGTGTAGCGCAGAGTGATGTCAGCCGCACGTAATTGTGAGGCCAGTGACTGGAGCCGTCCAACGGGTAAATATTCCGCGGCGGCAGATCTTGCGGTGGTCAGTACAATACTCAGCAAGATAGAAAGCGTTGAGGACTGTAAAGTGTTTGAGAGAGGGTTCATGTGAAACAGCATAGTT\n>JSYM01000001.1/27642-27547 Flavobacterium sp. 
AED Contig01, whole genome shotgun sequence. \nTTTTAGCCCCGATGGGAGCGATATCCTTTTCGAGTCTTTTCTCGTTCCTAAAACGAGAAAAGACTCGAAAAGATAAAGAGGACAGCGGGACCCATG\n>AP014808.1/1488830-1488748 Lactobacillus acetotolerans DNA, complete genome, strain: NBRC 13120. \nTAATATAAAAAGAAGCCCTGTGAATAACAGAACTTCTCATGTAGAGCCGTAAAAGACGGTGGCATGATAATAATTACTAAAAA\n>FR889406.1/108529-108414 Firmicutes bacterium CAG:449 genomic scaffold, scf101 \nTTTAATAGTTCCAATATACCAAAGACAGCAACGGCTATTAGCTTAATAATGTTGCCGAGGTAAAGTAAGTTATTTATAAATAATGACAAGCATTACTCTTGTATATTGTTGACTAT\n>AGTP01109286.1/18627-18514 Ictidomys tridecemlineatus contig109286, whole genome shotgun sequence. \nGTGTTGTATGAAAGAAGACAAGGTTATTCTGTTTTGTCAAGGATGGAAGAAACCCTTAGGCCTGACCACACGCATATTGTTAAGATATCACATAGCATCTAACCATTGACTTTT\n>CP001014.1/1643612-1643672 Thermoproteus neutrophilus V24Sta, complete genome. \nCGGCGGCGGAGAGCCCCGCGCGGGGCGCCGTGAAGCTACCGCAGTCGGTCCCCCTTGTACA\n>MNDA01000091.1/220-1 Ktedonobacter sp. 13_2_20CM_53_11 13_2_20cm_scaffold_5687, whole genome shotgun sequence. \nGGGGATGTCGGGTTTCGACAGACGAACAGATTGTTGAATTGCAGGCCGAGGTGTCGGTATGCACTCTCGTTAAACAACCGACAAAACAATAGATGCCAACAAACAGGCACCTGCTTACGCTTTCGCTGCTTAATAACCAGTAGGCGTCGTCCGCCCAGTTTTTTCTCGTGGGATTGGAACCGGGCGTCGAAAACACGAGGTGCTATGACGGTGACCGCCC\n>ACTA01034202.1/35881-35939 Ailuropoda melanoleuca scaffold919_18, whole genome shotgun sequence. \nTGCTCTGATGAAATCACTTATAGGAAGTGCCGTCAGAAGCGATACTAGCCATTCTGACA\n>DS028111.1/11289-9911 Coccidioides immitis RMSCC 2394 supercont1.19 genomic scaffold, whole genome shotgun sequence. 
\nGGGCACATGGTGGATGCCTTGGCATCAAGAGCCGATGAAGGACGTTGGAGCCTGCGATAAGCCCTGGGGAGTTGGCAACCGAGCGTTGATCCGGGGGTGTCCGAATGGGGAAACCCAGCACGAGTCATGTCGTGTTACCTGCGCCTGAATCTATAGGGCGTTTGGAGGGAACGCGGGGAAGTGAAACATCTCAGTACCCGTAGGAAGAGAAAACAATAGTGATTCCGAGAGTAGTGGCGAGCGAAATCGGATGAGGCTAAACCAACTGCGTGTGATAGACGGCAGTCGTTGCGTAGTTGGGGTTGTGGGATATGTCTGTCATCGTCTGCCGGCGGTGAGCTCAGTAAGAAACCAAGCATGAAGGTGAACCAGTTGGGAAGCTGGGCCGTAGCGGGTGATAGCCCCGTAATCGTATGTGTTTGGCTGGGTTGATGTACTCCCAAGTAGGACGGCACTCGTGGAATGTCGTGTGAATCTGGCGGGACCACCCGCTAAGCCTAAATACTTCTTGATGACCGATAGCGGACCAGTACCGTGAGGGAAAGGTGAAAAGTACCCCTGGCGGGGAGTGAAATAGTACCTGAAACCGTGTGCCTACAATCCGTCAGAGCCCGGCCGGCTGTTTACAGCAGTGGGGGTGATGGCGTGCCTTTTGAAGAATGAGCCTGCGAGTTAGCGGTGTGTGGCAAGGTTAACCCGTGTGGGGTAGCCGTAGCGAAAGCGAGTCCTAATAGGGCGATTGAGTCGCGCGCTCTAGACCCGAAGCGAAGTGATCTAGCCATGGGCAGGTTGAAGCGCCGGTAAGACGGCGTGGAGGACCGAACCCACTTCAGTTGAAAATGGAGGGGATGACCTGTGGTTAGGGGTGAAAGGCCAATCAAACTTCGTGATAGCTGGTTCTCCCCGAAATGCATTTAGGTGCAGCGTTGTGTGTTTCTTGCCGGAGGTAGAGCACTGGATAGCCGATGGGCCCGACCAGGTTACTGACGTTAGCCAAACTCCGAATGCCGGTAAGTGAGAGCGCAGCAGTGAGACAGTGGGGGATAAGCTCCATTGTCGAGAGGGAAACAGCCCAGACCATCAGCTAAGGCCCCTAAGCGGTAACTAAGTGGAAAAGGATGTGGAGTCGCAGTGACAACCAGGAGGTTGGCTTGGAAGCAGCCACCCTTGAAAGAGTGCGTAATAGCTCACTGGTCAAGTGATTCCGCGCCGACAATGTAGCGGGGCTCAAGTTATCCGCCGAAGCTATGGCACTCCGGTTTTCCGGGGTGGGTAGGGGAGCGTCGTGTATCGGGTGAAGCAGCGGAGTGATCCAGCGGTGGACGGTACGCGAGTGAGAATGCAGGCATGAGTAGCGAATGATGTGTGAGAAACACATC\n>LN902847.1/6110633-6109254 Echinococcus multilocularis genomic scaffold, pathogen_EmW_scaffold_07 
\nTAAAATACTGCAGATGGGGGAAGTCGGGATTCTTAATCCATAACATCGGAAAGAGGATTGGCTCTGAAAGCTGAGCGGAACAGGCTAAGGAAAGAAACAAGCTAACTCAGTTTGCTGATGGACGGGCTGGCTAACTGTTGATACACCGCCTCCACCGCCGTCGTTGCGGTGGTGGGTGGGTGTGGAGCATGCAGTTGAGCCCATCCCTTGGCTGGAGGCGAGTAGGGTGAACCGTGGGCGGACCCAGATAAATGTGCACCTCGGTCGATTGATTGGTTAGTTAGTTGTCGATGATGCTGCTTGTTGGCTGTTAGTTGGCGAGTGTTGTGGTGCTCGGCACTGCTACTGGTTAGCCTCGTTGGGGGGTGCTTGTTTAGTGCCAAACACCCAACCCAGAACTAACATGGACCTGAAAAATCCGACTCTCCAATTAAAACGTAGTTTTGTGATGTCCGCTGGTTTGTTCTAGTGCAATGTGATTTCTGCCCAGTGCTCTGAAGTCAAAGTGAAGATTTTCAACCATACGCGGGTAAATGGCGGGAGTAACTACGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAACTAGTGACGCGCATGAATAAAATTAATGAGATTTCTATTGGCCCTGGCTACCATCTAGCGAAATCACAGCCAAGGGAGCAGGCTTGGCAGAATCAGTGGGAAAAGAAGACCCTGTTCAGCTTGACTCTAGTCCGACTTTGTGAAGAGATATGGTGGGTGTAGCAATAAGTGGTTCAACTGTGGCTTTCTATGAGATAGCTGTGCTTTTCATCTTTGTGCTCAGCATGCACATCACCTTGTTAGCCCGCCAAATCTAACATTTACTCTTTTGCGCTTTTACATTCCTGTCATCAGGAGGTAGATAGAATGCTCGTAAATGCTTAAATAGAAAAATGATTTAAGACAAGGAAAATTGGTTTGGGCATTTCCAGTTCATGTTGTACCTAGTCATTGATTTACTTCCTTTAATGGAAGCTGCGAAGAGGTGGTTTGAGAGCACTAAAAACCTCTAATTTTGTCTCATCAACTGGGCATATAAGCATTCGTTCATTTCCAAAACTTCTGACAAGCCCGCTTGACGCCTCATGTTATTAATGGGTTAGTGTTTGCAATCAGTGGTAAATGAAGTTGATCCATGAAGGTTAAATATGCTTTGCAAATTGCAGTATAGTCACCACAATTGAACAAATTTCACATGCCAAAAAGAGGGGTCACCCATAAATCATGCGATTCATTACAGTCTACAAGGTTAGTAGAACTACTAATTTATCGAAGCGTATGTTTTAGAAAAGGTTGCAGACTAATGTCCATCCCATTCATTCTGCCAATTTTAAAGCATTTCTCTTTTCGTCTGC\n>LZPO01055098.1/393046-393292 Neotoma lepida isolate 417 scaffold_519, whole genome shotgun sequence. \nGGACGGCTAGGCAAGTATCCCCTTCCTCCTTCACTATTCAAGTGAGTTCCTCTCAGAGCTGCATGTTCTGTGCAAAACAATGATTTTCCCCAATAGAGGAGCACCATTCTTGGGTCAAGGGGATCTGAGTAGCTGTGCATCCTTGCTAGAACTTCCAAATAAGCCCTCAGGTGCTGGTGGCCATGTCAGAGGAGTAGCAAGTAGCAGTTGAAGTTCAAGGTGTCAGCCCACCAGGAGGAAACTCTCT\n>AURB01000101.1/106632-106430 Alicyclobacillus acidoterrestris ATCC 49025 contig_19, whole genome shotgun sequence. 
\nTGAACGGCGTTGAAAGGGAGGAGTAAGGCGGTTTCGATTGTCCAGAGACGGTGCAGCGCGCTGAAATGCACCGCTTTCGTCCGTCTGAAGGTCGCCCTTGAGCTGCTTACCCCGGGTCATTCCGTTATCGATGTCGAGTGTTTCGTTCGTCTCGCGATGAGCGGAAAATTCAGGTGGTAACGCGGAGCCTATCCGTCCTGAGG\n>CM004482.1/68495215-68495614 Xenopus laevis strain J chromosome 9_10L, whole genome shotgun sequence. \nTGATGACTAACATGTCCACGAGAAGGAATTTCATATATGAATGGAATGCCGATTGCCCTGTCCAAAACCCCAGTGTTAGGACCATATTAACCAGCAAGAAAGAAAAAATTGCCTATATACTTGTCAGATTTGCAGTAGTGAGGGGACAACAGCACAAGTACAGTATGATTAACTGCATCATCAACAGTGCCATGGGCAGCACCAAAACCTATAATTGTGACAATACATTCGGATGTCTGCCCCATGAACATTCGATGGTGCTTTCTGCAACTACCATGTTGACCACAGGTAATGGGGAATCAGGGTTCAATTTCGGAGAGGAAGCCTGAGAAACTGCCACATCCAAGGAAGGCAGCAGGTGCGCAAATTACCCACTCAGAACCTTCTGTGAATAAATATG\n>AJMR01000139.1/797-1134 Pseudomonas pseudoalcaligenes KF707 = NBRC 110670 strain KF707 ctg1510, whole genome shotgun sequence. \nCCGCCCAGCGCGCCACCAATACCGGCATCGGTATTGCCGCCGGCAAAGGCGCTGCCACTGGCGAGGCCAAGAGACAGGAGAAGGATCGAGGTGTACTTCATGGTGAGGATCGCCTCAGTGGTTTTGGTGAGGCGATATTTACTGTGGGATTTGTCTTACGCAAGTGTCTGACGACGAAAAACACGAACTTTTATTATTTTTTTTATTGGGCGATTCGACAGAAGAACTTTTTCCCTTCAGGGGAGTCAGAGGCTGGTTGAAACCCCCGCTCCATGCGCGTCTTGCGCTTTCTGGTACTGGCACTTCGCCTAATAAGTTCCCTTTGAAGTTGGAACTTT\n>MNIQ01000128.1/3562-3838 Ktedonobacter sp. 13_1_20CM_4_53_7 13_1_20cm_4_scaffold_29355, whole genome shotgun sequence. \nTTATAGGCAACGAAGGAACGAGTAGGTCCCCATATCTTGTCGAAGAGAGCCTGGGGGTGGTGTAACCAGGTCAGGATCGTGAGCCGAAAATCATTCCAGAGCCGCTAGCCGAAACAACAAAGTAGACCTGGCCGGGACCTTCCCGTTATCATGAAGGGCTGTATGGATCCTCTCAATTGGGGAGTTACAGCTAAACCAAGTGAGCCATATCTATCTCACACCTCGTGAGAATGTGGCTAATAAGGGTGGTACCGCGGGAGTTCCTCTCGTCCCTATG\n>BARX01000007.1/79604-79779 Agarivorans albus MKT 106 DNA, contig: contig00007. \nCAGCGCGCTTTTGGGGAGTAGCTGCCCATATCAATAAGGTATGGGGCATTTATCAACATACTTAGTGCTCATCACTATGGTAAATGCAGCCTTTATTGGCCTAGCAAGACCAAATGCACATTAACGCCATAAAGAGGTGAGCTGCGTTGTGTGCATTGGTTTATTCGCTCGCCTCA\n>CM001383.3/74376359-74376250 Felis catus isolate Cinnamon breed Abyssinian chromosome B3, whole genome shotgun sequence. 
\nCCTCGATGATGAATTGCCATGCTAATACTGAGTCACCAGGTGGGGCAGTGTTGCCCTGGTTTGGGTGCCAGTGAGTTTAACAAAACTTCTCACATGGAGACCTGAGGGGC\n>AOKF01002516.1/2805-2760 Pseudomonas syringae pv. actinidiae ICMP 19096 scaffold552, whole genome shotgun sequence. \nTTGGCTTTTAACCAATTGGTCGTAGGTTCGAATCCCACACGACCCA\n>AWUE01016600.1/22634-22748 Corchorus olitorius cultivar O-4 contig16633, whole genome shotgun sequence. \nGGGTGCAATCATACCAGCCCTAATGCACCGGATCCCATCAGAACTCCGTACTTAAGCATGCTCTTGGAGTTGGCTATCATCAAAAGTGTCATTATTCTAACTACTTTTGCAAATG\n>JH835377.1/3849674-3849364 Erinaceus europaeus unplaced genomic scaffold scaffold00089, whole genome shotgun sequence \nATGTGAGGGTGCTCTGGCTGTGACATCTGTCACCCCATTGATTAGAAGGGTTGATTCAGCTGATCTGGTTGGTTAGGAGGTGTCCCCTTCCTCCCTCACCACTGAATGTGCTTCCCTCCCAAAGCTGCAGTGCTTGGTGAAGAAGACAGCCTTCCCCAACAGAGATGGACAGGTCTCGGTGGAGGGTATCAGACTAGCTGTACTCCCCTGCTAGAAATTCCAAACAAGCTCTCAAAATGTCTCTTGGAAATTTGCCAGATTTCATATGAAAAGAGTCATTCTATATTTTTCCTATAGAAAGAAGATCATTT\n>URS0000D6B09B_12908/1-98 unclassified sequences skipping-rope RNA \nCATGCCGGAGGTGGGAAATTGTGTTGCACCCACGCACCTTGCGTACATGACGTAACGGTTAAAAGAGATGGAGCAGATTGCAACGGCTCCCCGGCATA\n>CP000108.1/2027693-2027787 Chlorobium chlorochromatii CaD3, complete genome. \nCGGCATCCCCATTACCTATGGTCACGGTGCTGGAAGCTCTGGGAAGGGTTACCCTTCCAATGGTGAATTGATCAGGAGAGCTTTTCCGTGTCCCA\n>LCZI01000091.1/60703-61080 Emmonsia crescens UAMH 3008 supercont1.108, whole genome shotgun sequence. \nGCGTAGGCGAAAATCATTTTACTACATACATATAAAATTCAATTACCCCAATTTGTATAATATTAAATTATGGCTATCTGCAGTTAATGCCGTGAGACATGGTTAATTCTTTTAATGAACCCAAACCCTAACTTTCTTTATTTCTCTATATAAAGTAACTTGCTAAAAATTGGTTAGAGAATAGGGACCAAGACAGGTCATCATGACCATAAATAATATTATGGGCTATAGACGTACCACACACGCCTTAACAAAAGGATGCTATATTGTAAAATGGAGCTAATCCTTAAAACATAATATAATATGAGGTGTTGTCTGTAACTCGACAACAGGGACAAAAAAGTACTAGTGATCGTGAATCATCACGCCACGGTGAGT\n>CP016199.1/1032825-1032926 Mogibacterium pumilum strain ATCC 700696 genome. 
\nTCCTTATTAAGAGCGAGTGAGGGAATGGGCCCGGCGAACTCGCGGCAGCATCGCATATTGCGGTTGTGCCAAGTCCCACAGGCAAAGCCTGAAAGATGAGGA\n>DS562928.1/6888831-6889130 Cavia porcellus supercont2_73 genomic scaffold, whole genome shotgun sequence. \nGATTCCAGCAATCTGCCTGTGACGTCTGTCACCCTTGTCATTGTGTGGGCTGGTTTGGTTAATCTGGCTGGGGAGGTGGGTGTCCTCTTTCTCTTTCACAGCACCATGTGCATCTCTGTTGAAGCTGTGTGCTTGGTGGAAGAGGAGGACCTTCCCCGAAAGGATCAGGACAAAGATACATGAGTAGCTTCACTTCCCTGCTGGAACCTCCAGACAAGCTCTCGAGGATAGGATTTACCATGTGACACAGTAGTGGAGAATTTGAACAAAAGTCTATGTTGCTCATCATGGTAATTCAGG\n>CM000236.2/126073376-126073451 Rattus norvegicus chromosome 6, whole genome shotgun sequence. \nGAGGGGCTCACAGCTCCGGTCCTTGGAGCTCCAGAGAAAATGTTGCTCCGGGACTGAGTTCTGTGCACCCCCCTTG\n>APWO02002148.1/5885-5949 Astyanax mexicanus Unplaced_Scaffold4491, whole genome shotgun sequence. \nGTGTTTTTCTGCAACTGAAAAACTCCTCTGTAGCTCAAAAATGAGCTTTTTAAGACTGAAACACA\n>CM001883.1/35529231-35529093 Theobroma cacao cultivar Matina 1-6 chromosome 5, whole genome shotgun sequence. \nAATGCCTCCAGAATAACCAGAAGGTTAGAATATGATCCGACGCCGTCTTGGTTCAGACAGAGGCTTAGAGCAATTCGAATCCGTTTGAGGGTAAGGAACGATTTTCCTCCGTTCCTTTCCTAGATGTCTTCGAATATTT\n>JH711575.1/1398613-1398696 Coniophora puteana RWD-64-598 SS2 unplaced genomic scaffold CONPUscaffold_3, whole genome shotgun sequence. \nGGGCGTTTGGCACAGTGGTAGCGCGTATGCTTTGCATTTAAGCAACTTGCATAAGGTCGTGGGCTCGAATCCCATTCATCTCCT\n>FQVZ01000030.1/1153-1 Fibrobacter sp. 
UWB8 genome assembly, contig: Ga0136280_130 \nTGGAGGTCGCAGGGAAACGGCAGAAGCGACTGTTTACCAAAAACACAGGGCCATGCTAACACGCAAGTGGACGTATATGGTCTGACACGTGCCCGGTGCCGGAAGGTTAACAGGAGGGGTCAGCGCAAGCGAAGCCCTGAATCGAAGCCCCGGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATCGTGTAACGACTTCTGCACTGTCTCCTCCCGGGACTCGGCGAAATTGCAGTGCCGGTGAAGATGCCGGCAACCCGCACCTGGACGGAAAGACCCCATGAACCTTCACTGTATTTTGACATTGGTTTTAGGGCCCGCATGTGTAGGATAGGTGGGAGGCTTTGAAACGGCGACGCCAGTCGTCGCGGAGCCGCCCTTGAAATACCACCCTTGCGCGCTTTGAGATCTAACCTCGTCCCGTCATCCGGGACAGGGACCGTGTCTGATGGTCAGTTTGACTGGGGCGGTCGCCTCCTAAAAGGTAACGGAGGCATCCAACGGTTCCCTCAGCGCGGTCGGCAATCGCGCGTAGAGCATAAAGGCATAAGGGAGCTTGACTGCGAGGCGGACACGCCGGGCAGGTACGAAAGTAGGGCTTAGTGATCCCGCGGTACAGCGTGGAAAGGCCGTTGCTCAATGGATAAAAGGTACTCTGGGGATAACAGGCTGATCTCCCCCAAGCGTTCATAGCGACGGGGAGGTTTGGCACCTCGATGTCGGCTCGTCGCATCCTGGGGCTGGAGAAGGTCCCAAGGGTTTGGCTGTTCGCCAATTAAAGCGGCACGCGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCCCTATCCGGTGTGGGCGTTCGAGACTTGAGGGAAGCTGTCCTTAGTACGAGAGGACCGGGACGGACGTACCTCCGGTGTACCGGCTGTCGCGCCAGCGGCATTGCCGGGTAGCCGTGTACGGATCGGAGAAACGCTGAAGGCATCTAAGCGTGAAGCCGTTCCCAAGATCAGGTCTCGCGGGGGCAACCCCATGTAGGGCCGTCGTAGACTACGACGTCGATAGGCCGCAGGTGTGAGCGTGGCGACACGTTGAGCCGAGCGGTACTAATAGCCCGGTAGAGCTTTT\n>AAPE02046865.1/69583-69781 Myotis lucifugus cont2.46864, whole genome shotgun sequence. 
\nGAATCTGATAATCAACAGGGTTAAAAGACAGTTGAACACCTGAAGTACATTATGATGATTTAAATAATGTGCAGTTTGCCCAAAAACGTTCGGTCCCTGGCGTATGTCTTAGAGATTTCTATGCGGTATGCAATGTGTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACTCGCATGAATGAATGAACGAGATTC\n>HF998428.1/32618-32277 Coprococcus eutactus CAG:665 genomic scaffold, scf147 \nGGGGTTGACTGGTTTCGACAGGGGTTTTGAAGCTATGGAAGCCATCCGTGGACCAGAGCCACGCTAAAAGCTGGACAAAAAATAAACGCTAACGATAATTTAGCATACGCTGCCTAGTTGCAGCCGTCATCCTTTAGGAACGCCGAGCCTTTAGGAATGGCGTCGACTTTCGGCAAACTCCTGCATCTAAGCTTTGCGATGTAGGAAAATCCATGAAGCTACTAAGGTCTATAGCATGTTAGTGGGCGATAGGCTGAGGGAATGTTAAAGCACTGACTGTGATGGAAGAAACTGTAGTGAATGAGCTTTTGGACGGGGGTTCGACTCCCCCCAGCTCCACTA\n>FJUW01000012.1/748132-747973 Rhynchosporium commune strain UK7 genome assembly, contig: RCO7_scaffold012 \nGGCCGAGTAGTGCAATGGTCAGCATCTCACATCCATAATGTTCTGGATTGCGAGCGCGCGTGCGTGTCATCGGATCTTGTATCGTTTACTGTATTCTTATTGCTTCGGCGTTTGGGTGTAGGATTATGTGAGGATGGAGGTTCGATTCCTTCCTTGGCCA\n>CM001586.2/2047421-2047222 Ovis aries breed Texel chromosome 5, whole genome shotgun sequence. \nATCACTTCTCGGCCTTTTGGCTAAGATCAAGTGTAGTATCTGTTCTTAACAGTTTAAAATAGTATGTTCCAGACCCTGGCTGCTGAAATGTATCTCTCAATCTCTAAAATCCCTGTGGGTTGCTGAATCATAAGGGCTTGGTTCCTGGTGCATTTTAAATTTTGTCTTTGTTTCTGACACCGGAGGATGACTCACTCTTT\n>AP008955.1/1357281-1357003 Brevibacillus brevis NBRC 100599 DNA, complete genome. \nTTGATGGCAATGAGGAAGAAGAGTAGTCATTTTACGAGACTTCAGAGAGCTGATGGTTGGTGCGAATCAGTGTTAAGGAAATGATGAATGGGCTTCCGAGCTCCAAACCAAACCCGCTACTCATGGCGGCAGTAGGCTTTGGCGTTACGTCCGTACGTTACAATGGACACCGTATCAAGCTGTCTTACACAGAAACGGTACGGATTAAAGAGATTTTGCGTATGGATGATTCCTTGCGCGAAATAACAAGGGTGGCACCACGGTTCATTCGTCCCTGTC\n>ADKL01000252.1/892-837 Hot springs metagenome ctg_1106426166129, whole genome shotgun sequence. \nCTTGATGAGTACACTCTTTGCTGATTCAATGAGGAGAGTGGCCAGGGCTGAAGAGG\n>MIDV01000105.1/1073-1170 Xanthomonadales bacterium RIFOXYA1_FULL_69_10 rifoxya1_full_scaffold_59073, whole genome shotgun sequence. 
\nATCCCCCAGACATGCCCGCCGGCGTTGCCGGTGACATGCCCAGGTAGCCATCGATCTTCAAGGCTGCGGCGCGGCTTGTCCGCGTTGATCGAAACCCG\n>FPAA01000006.1/128109-128175 Marininema halotolerans strain DSM 45789 genome assembly, contig: Ga0104500_106 \nGTGTTGGTAGTTTAATTAAAATTCCGACCTTTCAAGTCGGCGATGAAGGTAAAATCCTTCCCACACG\n>MJEQ01037189.1/69339123-69338966 Nicotiana attenuata strain UT chromosome 7, whole genome shotgun sequence. \nATACTTACCTAGACGAGGTCAATGGACGAACGATAAGACTCATGGCCTAGGTTGGGGACTTCCATTGCACTTTGGAGGTGCCCGCCTATGGTCGACCCAAGTGTCTGAACCTACGTCATAATTTGTGGTAGTTGGGGCTTACGTTCGCGGGCCCCTAC\n>KV423970.1/63913-63812 Calocera cornea HHB12733 unplaced genomic scaffold CALCOscaffold_57, whole genome shotgun sequence. \nGGCAACTTGGCGCAGTTGGCTAGCGCATCTGTCTAACAAGTTGCCTCTCCAGGCAGGTCCTTTGTACACAGAAGGTCGCAAGTTCGAGCCTTGCAGTTGTCA\n>ALWZ040150818.1/688-1 Picea glauca, whole genome shotgun sequence. \nCATCGAAAGGAAATCGGGTTAATATTCTCGAACCGGGACATGGCGGCGGACGACAACGTTAGGAAATCCGGAGACGTCGTCGGGGGCCCCGGGAAGAGTTATCTTTTCTTTTTAACAACTTGCCCACCTTGAAATTGGCTCAACCGGAGATAGGGTCCAGCAGCTGGAAGAGCATCACACGTCTTGCGGTGTCTGGTGCGCCCTCGACGGCCCTTGAAAATCTGGAGGACCGAGTACCGTCCATGCCTGGTCATACTCATAACTGCATCAGGTCTCCAAGGTGAACAACCTCTGGTCAATAAAACAATGTAGGTAAGGGAAGTCAGCAAAACGGATCCATAACTTCAGGAAAAGGATTGGCTCTGAGGGCTGGGCCTTGGGGTCTGCGTCCTCAACCCGTGGGATGTCGGCAGTCTACCCGAGCTGCTATCACGGCGAGGGCGGGCAGTCGCGTGCTGATTGGGCTACGGACGTAGAATGTCCTCTCGCGAGGGCTTTTCCCTAGGCGACGAACAGTCGACTCAGAACTGGTACGGAAAAGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATCGTCCCTGCGGATGCTGACGCAATGTGATTTCTGCCCAGTGCTCTGAATATCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTT\n>AYUG01104772.1/8786-9026 Fukomys damarensis contig104772, whole genome shotgun sequence. \nGGATGTGAGGGCGATCTGGCCGATCTGGCCAGCCAGGCAGGGGTTCCCTCCCTCCTGCGCTGCTACAGAAGCTGCATGCTTGGTCGAAGAGGATGACCACCCTGATGGGGGAGACCGTGTCCTCTGTCAGGGAATCTGAGTAGCTGCACTCCCCTGCTAGAACCAAACAAGCTCTCAAGGAAAGTGAGCCACAGCACTCACCAGAGGCAGAGCTGGGATTTGAACCCCGGCCTCCTGGCTC\n>GL344173.1/24246-24358 Anolis carolinensis unplaced genomic scaffold chrUn0991, whole genome shotgun sequence. 
\nATCTAGGAGTACAGGGTTGTTGTATGTCTTTTGGGCTGTGTGGCCATGTTCCAGAACATCAGAACTTCTGGAACATGGCCACACAGCCCGAAAGACATACAACAACCCTGTGA\n>URS0001A24820_12908/1-49 unclassified sequences eL15-Euryarchaeota ribosomal protein leader \nGCGGAUAAUAAUCCGUAGGGAUGUAACCCAAACGGGGUUGAACCGCAAA\n>MNWA01000007.1/20574-20446 Candidatus Pacebacteria bacterium CG1_02_43_31 cg1_0.2_scaffold_487_c, whole genome shotgun sequence. \nATATGTTAATTTAACAATGCTGTGGAATGTAGTGAAAATCTACAACTGTGCCGCAACGGTGTATTTTTGGTATTTTCCAAAATAAGTCCGATCTTCAGCAAAAAATTTTTAAACTTGCTTAGGCAAGTT\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/rnacentral_active_seq_id_90_cov_80_linclust__subsampled_1000.fasta",
    "content": ">URS000254B5FC rRNA from 1 species \nATGGAAGTCGACAGAGCCCCGGCCGCTGCCGCGGGAGGAGGATCCTCCTCTGGCGCGATGGCGGTGGACGCGGCCGGCGGCGTGGAGAAGCCGCGGTTCGACGCGCTGATGCCAAGCGAGATGAGCGGCGGGAGGCCACAGTACCGCAAGGTCCAGGTGCCGCCGCACCGCTTCGCGCCGCTGAAGAAGGCGTGGCTGGAGATCTACACCCCCGTCTACGAGCACATGAAGGTCGACATCCGCATGAACCTCAAGGCAAAAAGGGTCGAGCTGAAGACGAGGCATGATACACCAGATGTGAGCAACCTTCAGAAGTGCGCGGACTTCGTGCATGCTTTTATGCTTGGATTTGACATTGCCGATGCCGTTGCCTTGCTTCGTCTTGATGACCTGTATGTGGACTCCTTTGAGATCAAGGATGTGAAGACACTCAGAGGGGAGCATCTGTCACGTGCCATTGGGCGCCTGTCAGGGAAAGGAGGCAAGACCAAGTATGCCATCGAGAACTCTACGAGGACTCGCATAGTTATCGCTGATACGAAGATCCACATACTTGGATCCTTTGTTAACATCAAGGTTGCCAGGGATTCACTCTGTAGTCTTATCTTAGGTTCTCCTGCCGGCAAGGTCTATTCTAAGCTTAGGGCTGTATCTGCTAGGTTGGCAGAAAGGTATTAG\n>URS0000B78375 rRNA from 1 species \nGTGGGGAATATTGGACAATGGGGGGAACCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTTTGGTTGTAAAGCACTTTAAGCGAGGAGGAGGCTACCGAGATTAATACTCTTGGATAGTGGACGTTACTCGCAGAATAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGGTGCAAGCGTTAATCGGATTTACTGGGCGTAAAGCGCGCGTAGGTGGCCAATTAAGTCAAATGTGAAATCCCCGAGCTTAACTTGGGAATTGCATTCGATACTTGGTGGGTAGAGTATGGGAGAGGATGGTAGAATTCCAGGTGTAGCGGTGAAAAGCGTAGAAATCTGGAGGAATACCGATGGCGAAGGCAACCATCTGGCCTAATACTGACACTGAGGTGCGAAAGCAAGGGGAGCAAACAGGATTAGATACCCCTGTAGTCC\n>URS0001CC990C rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACGGACGAGAATCTTGCTTCTCTGATGTTAGCGGCGGACGGGTGAGTAGCACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATTTTGAACCGCATGGTTCAAAAGTGAAAGACGGTCTTGCTGTCACTTATAGATGTATCCGCGCTGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCATAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTACAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGAACTGGGCGGAAGACTGACGGAGCAACGCCGCGTGAGTGATGAGGGTCTTCGGATCGTAAGACTCTGTTCTTAGGGAAGAACATATGTGTAAGTAACTGTGCACATCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTG\n>URS00013D39E1 rRNA from 1 species 
\nTACGTAGGGGGCAAGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGGTCTTTAAGTCAGGGGTGAAATGCCAAGGCTCAACCTTGGAACTGCCTTTGATACTGGAGATCTTGAGTCCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGGAACTGACGCTGAGACGCGAAAGCGTGGGGAGC\n>URS00023ED20D lncRNA from 1 species \nTCAGAATAAGCATAGCTAGGAAGGAATGTTTGAATAATGCACTATTTTTTTCCTCATGAGATAAAAAAAGAAGAAGAAAATATTCTTTTAGAGTAGCAGCAGTGGATGAAAAAAACTCAAAAAAATTGGAAACGTGAAAAAGTGCAAAACCAGAGGGTGAGGAACGTGTCGGTAGAAGAAGGGCTGGCTCGCTCTCGTTCGATCAGATCAAATACTACCGGAG\n>URS00017AA725 rRNA from 1 species \nTACGGGGGGAGCAAGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCCACCGCAAGTCGACTGTGAAGTTTCCGGGCTTAACCCGGAAAGGTCAGCCGATACTGCGGGGCTAGAGTGCAGAAGGGGCAACTGGAATTCTCGGTGTAGCGGTGAAATGCGTAGATATCGAGAGGAACACCTGCGGCGAAGGCGGGTTGCTGGGCTGACACTGACGCTGAGGCGCGAAAGCTAGGGGAGCGAACGGG\n>URS00023C6B8F lncRNA from 1 species \nGTCATACTCAATATAAATTAATAGTAATGGATGCAAATGACAACGGTGCTCTCCAACAGGTGCTTTTTAATAAAAGGATGATGACTCAACATAAAAATAAATAGATAGGCCCTACGCAGAGGGAAGCAGGGATTTGTAGAGGTGCCAGAGCTCGATTTTTGAATAGAGATAAATAATATTTTGAGCGGCATACTTTCATTGTTAACATAACAACCGAGAGATCTCGATATCTTCCATGCTACACACATTATAGGCGGTTCCCAAACATAATGGTAAAGTTTATACTCCCCCTCCACCAACAATCATCAATTCATGGCTTTCCCGAAACAACGGGTGCCTCCAACTAACAACAATCCTAGGGGAGTTTTGTTTGCAATTATTTTGATTTGATTTGAGCATGGGACTTGGCATCCGATGACCAGCCATTTTCTCGTGAGTGAGGAGCGGAGTCCACTCCTCTTGAGAATAACCCATCTAGCATGGAAGATACAGACAACCCTAGTTGAGACATGAGCTGTTAAAGCATACAAAATAGAATTTCATTTGAAGGTTTAGAGTTTGGCACATACAAATTTACTTGGAACGACAGGTAGATACCGCATATGGGAAGGTATGGTGAACTCATATGAAATAACTTTGGGGTTTATGGAAGTGAATGCACAAGCAGTATTCCCGCTTAGTACAAGTGAAGGCTAGAAAAAGACTGGGAAGCAACCAACTAGAGAGCGACGACAGTCATGAACATTCATTAAAATTAATAGACATTGAGTGGAAGCATGAGTAGGATATAATCCACCATGAACATAACATCGTGGAGGCTATGTTGATTTTGTTTCAACTACATGCGTGAACATTTGCCAAGTCAAGTCACTCGAATCGTTCAAAGGAGGATACCATCCTATCATACCACATCACAACCATTTTAATAATATGTTGGCATGCAAGGTAAACCTTTATAAACTCCTAGCAAATTAAACATGTCATAAGAAACTATAATCTCTAATTGTCATTGCAAACATGTTTATTCATAATAGGCTGAATCGGGAATGATGAACTAATCATATTTACAAAAACAAGATAGGTCAAGTTCATACCAGCTTCTCTCATCTCAATCAGTCCATCACATATCGTCATTATTGCCTTTCACTTGAACG
ACCGAACGGTGTGGATAATAATAATAGTGCACGTGCATTGGACTAAGCTGGAATCTGCAAGCATTTGATACAAGGGAGAAGGCAACGTAATATGGGCTTTTGGTTAAATCAACAATAATGCATATGAGAGCCACTCAACATTTTCATCATGGTCTTCCCCTCTCGACCTCCAAAGAAAAGAAAAGAAATAAAACTATTTACACGGGAAAGCTCCCAACAAGCAAAAGAAGAACGGAAAATCTTTTTGAGTTTTCTTTTAATTACTACTACTACAGGAATGGAAAGTAAACTATCTAATAGCTATAACTAATTTAAATTTTTGGTTTTTTCTTAAAGTTTTTCAAACACACAAGAAGAAAGCGAGAAAAAGAAAATAAACTAGCATGGATAGCACAATGAAAAAGTATGAGCACCGACAACTGGAATGAATGTGTGAACATGAATGTAATGTCGATGAGAAATACGCACTCCGCCAAGCTTAGACTTTTGGCCTAAGTTGGTCTATGCCCATGGATTGAAGCTACTCTCTCCGGTGTACTGAGGAATGTCATCAGGGTGCCACTGGTTGGCAATCTCCTCCGAATACCACTTATAAATGGAGCGTCGATAAGGGTCCAGTGGTGGTTCCGGCTCAGGCTCTGGAGCTGGTGTTAGGCTCCGGTATGCGTAAACGGCCTCCGGCAAGATGAGGTACGTGCCTGAAAATATGTTAAGCAAAGATGGTGCAGGCAAGATAATAGTCTCACTGTGAGTTTTATTAAATCCCAAATTATACTCAAGCATCATCTTCTTATTTTTAACAATAAATTCATGTGCTACCATACTCTTATAATCTAGAAAATAGGGGGC\n>URS0001774F8E rRNA from 1 species \nCCTACGGGCGGCAGCAGTGGGGGATATTGCACAATGGGGGGAACCCTGATGCAGCGACGCCGCGTGGGTGAAGGAGTGCTTCGGCATGTAAAGCCCTATCGGCAGGGAAGAAGCAAGACGGTACCTGACTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATCCGTAGGGGGCGAGCGTTATCCGGATTCACTGGGTGTAAAGGGAGCGTAGACGGCCATGCAAGCTAGGGGTGAAACCCCGGGGCCCAACCCCGGGACTGCCCTTGGAACTGTGCGGCTAGAGTGCGGGAGGGGCAGGCGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCGGCGGCGAAGGCGGCCTGCTGGACCGCGACTGACGTTGAGGCTCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCCGGTAGTC\n>URS00018E4F15 tRNA from 1 species \nACACCAGTGGTGAAACGGTTATCATGCTTGCCTTCCATTACCGTGAGCAAGCGGCGGGGGTTCGACTCCCTCCTGGTGTA\n>URS0000B64D6B misc_RNA from 1 species \nTGAAGATCTCTCCCTACACACCTCAGCAGTTGCAGATCAAATCTCTGGTTCAGCTAACCAAAGAGTTGAAATTGAAATGGAGATTCTTTCTCTTGGTCAAATGTTTGGGCCTTTGACAAACGGTTCCATCGGTGAAAAAGAGAATTCTTATCATGCTAAGGCTGAATACACAGAAAAACAGCTTCTCTTAAATGTTTCTGCTCAACTTAG\n>URS00011ACD89 rRNA from 1 species 
\nTACAGAGGTGGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGGGCTTGTAGGTGGCCAACTAAGTCAGACGTGAAATCCCTCGGCTTAACCGGGGAACTGCGTCTGATACTGGATGGCTGGAGTGTGGGAGAGGGATGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCGGTGGCGAAGGCGGCATCCTGGACCATTACTGACACTGAAAAGCGAAAGCCAGGGGAGCAAACGGG\n>URS0001176963 rRNA from 1 species \nTACGTAGGTGGCAAGCGTTGTCCGGATTTATTGGGTTTAAAGGGTGCGTAGGTGGTCTATTAAGTCAGTGCTGAAATATCCCGGCTTAACCGGGAGGGTGGCATTGATACTGATGGACTTGAGTAAAGTTGAGGTAGGCGGAATTGACGGTGTAGCGGTGAAATGCTTAGATATCGTCAAGAACACCGATAGCGAAGGCAGCTTACTAAGCTTTAACTGACACTGAGGCACGAAAGTGTGGGGATCAAACAGG\n>URS000182FF44 rRNA from 1 species \nTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGAGGAGGAAGGCGTTGTGGTTAATAACCGCAACGATTGACGTTACTCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTCTGTCAAGTCGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATCCGAAACTGGCAGGCTAGAGTCTTGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACA\n>URS0000745C0A rRNA from 1 species \nCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGAAAAGCCTGATCCAGCCATGCCGCGTGCAGGATGAGGGCCTTCGGGTTGTAAACTGCTTTTGTACGGAACGAAAAGACTCTGGTTAATACCTGGGGTCCATGACGGTACCGTAAGAATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTATATAAGACAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTTGTGACTGTATAGCTAGAGTACGGCAGAGGGGGATGGAATTCCGCGTGTAGCAGTGAAATGCGTAGATATGCGGAGGAANCANCCGATGGCGAAGGCAATCCCCTGGGCCTGTACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCAACTGGTTGTTGGGTCTTCACTGACTCAGTAACGAAGCTAACGCGTGAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGTTGNAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGATGATGTGGTTTAATTCGATGCAACGCGAAAAACCTTACCCACCTTTGACATGTACGGAATCCTTTAGAGATAGAGGAGTGCTCGAAAGAGAGCCGTAACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGCCATTAGTTGCTACGAAAGGGCACTCTAATGGGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATG\n>URS0001C47DC8 misc_RNA from 1 species 
\nAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTAAAGTGTTTCGGAGCCTGGCTCGGGCATCTCACCTCGAGGTGTCGGTGTCAGCGCCCCCACACGTGTTTACTCAACTTGGTTGCCTTGGTGAGCCTGCCCTCGTGGCTGCCGGGGATGCCTCACGGCGTTCCGGGCTCGTGCTCACCAGTGGATCATTTGAACTCTTCTGTGAAAATAGCCAGTCTGAGCATTATGCAAATTAAATAAAACTTTCAACAACGGATCTCTTGGTTCCG\n>URS0001C9BECE rRNA from 1 species \nGATGAACGCTAGCGGCAGGCTTAATACATGCAAGTCGAGGGGCAGCATGAAGTAGCCATACTTTGATGGCGACCGGCAAACGGGTGCGGAACACGTACACAACCTTCCTTTAAGTGGGGAATAGCCCAGAGAAATTTGGATTAATACCCCGTAACACAACTAAGTGGCATCACTTTGTTGTTATAGTTTCGGCGCTTAATGATGGGTGTGCGTATGATTAGATAGTTGGCGAGGTAACGGCTCACCAAGTCTACGATCATTAGCTGATGTGAGAGCATGATCAGCCACACGGGCACTGAGACACGGGCCCGACTCCTACGGGAGGCAGCAGTAAGGAATATTGGTCAATGGACGCAAGTCTGAACCAGCCATGCCGCGTGAAGGATTAAGGTCCTCTGGATTGTAAACTTCTTTTATATGGGACGAAAAAAGGTCTTTCTAGACCCCTTGACGGTACCATATGAATAAGCACCGGCTAACTCCGTG\n>URS0000FFB7EB rRNA from 1 species \nTACGTAGGTGACCAGCGTTGTCCGGATTTACTGGGCGTAAAGAGCGCGCAGGCGGTCGTTCAAGTCGAGTGTGAAAGCCCCCGGCTCAACTGGGGAGGGTCACTCGATACTGATCGACTTGAAGGCAGGAGAGGGAAGCGGAATTCCCGGTGTAGTGGTGAAATGCGTAGAGATCGGGAGGAAGACCGGTGGCGAAGGCGGCGCTCTGGAACATTTCTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGG\n>URS00002FFC52 rRNA from 1 species \nTTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAATTTCGGGATCAATATAACGGTCATGCCGTTGGTATGCACTGTTATAATTGATTTCTCACCTTCTAAAGAACCGTAATGCCATTAATTTGGTGTCACGGGGAATTAGGACTGTTACCTTGAAAAAATTAGAGTGTTTAAAGCAGGCTCACGCTTGAATACATTAGCATGGAATAATGAAATAGGACATCCGATTCTATTTTGTTGGTTTCTAGGATCGATGTAATGATTAATAGGGATAGTTGGGGGCATTAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGGCGTAGTCTTAACCATAAACTATGCCGACTAGGGATCGGATGATGTTAATTTTTTAATGACTCATTCGGCGCCTTACGGGAAAC\n>URS00002B11A3 rRNA from 1 species 
\nTGGAACTTGTTCTGGTGGATTAGTGGCGAACGGGTGAGTAACACGTGAGCAACCTGCCCAAGACTTTCGGGATAAGCCTGGGAAACTGGGTCTAATACTGGATATGACCTTTCATCGCATGGTGTTTGGTGGAAAGATTTTTTGGTTTTGGATGGGCTCGCGGCCTATCAGCTTGTTGGTGAGGTAATGGCTTACCAAGGCTTCGACGGGTAACCGGCCTGAGAGGGTGACCGGTCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCGACGCCGCGTGAGGGATGACGGCCTTCGGGTTGTAAACCTCTTTCAGTCAGGAACAAGCCACTTGTGGTGAGGGTACTGGCAGAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTATCCGGAATTATTGGGCGTAAAGAGCTTGTAGGCGGTTTGTCGCGTCTGCTGTGAAAGCCCGGGGCTTAACTCCGGGTCTGCAGTGGGTACGGGCAGGCTAGAGTGATGTAGGGGTAACTGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCACGAAGAACACCGATGGC\n>URS0000D07B33 snRNA from 1 species \nATACTTACCTGGACGGGGTCAATGGGCGATCAAGAAGACTCATGGCCTGGGCTAGTGACCTCCATTGCACTTCGGAGGGGTGCTTGCTTAAGGTCTCCCCAAGAGGGAGAGCCTACGTCATAATTTGTTGCAAGGGGGTTTGCGTTCGCGCAGCCCCCAC\n>URS00007AB434 rRNA from 1 species \nCCTACGGGGGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCCATGCCGCGTGAATGATGAAGGTCTTAGGATTGTAAAATTCTTTCACCGGGGACGATAATGACGGTACCCGGAGAAGAAGCCCCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGGGCTAGCGTTGCTCGGAATTACTGGGCGTAAAGGGAGCGTAGGCGGATAGTTTAGTCAGAGGTGAAAGCCCAGGGCTCAACCTTGGAATTGCCTTTGATACTGGCTATCTTGAGTATGGGAGAGGTATGCGGAACTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGGCATACTGGCCCATTACTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGAGTGCTAGTTGTCGGCATGCATGCATGTCGGTGACGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGGTCGCAAGAATTAAAACTCAAAGGAAATTGACGG\n>URS0000128881 rRNA from 1 species \nTTGACGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGCCTTGACATGCAGAGAACTTTCCAGAGATGGATTGGTGCCTTCGGGAACTCTGACACAGGTGCTGCATGGCTGTCGTCAGCCCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTACCAGCACGTTATGGTGGGCACTCTAAGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGGCCTGGGCTACACACGTGCTACAATGGTCGGTACAAAGGGTTGCCAAGCCGCGAGGTGGAGCTAATCCCATAAAACCGATCGTAGTCCGGATCGCAGTCTGCAACTCGACTGCGTGAAGTCGGAATCGCTAGTAATCGTGAATCAGAATGTCACGGTGAATACGTTCCCGGGCCTT\n>URS0000FA1FD2 rRNA from 1 species 
\nATTGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGATCGGTAACGCGGGGGCAACCCTGGCGACGAGAGGCGGACGGGTGAGGAACGCTTGGGAATCTGCCTATCAGCGGGGGACAACACGGGGAAACTCGTGCTAATACCGCATACGCTCTACGGAGGAAAGCCGGGGACCGCAAGGCCTGGCACTGATAGATGAGCCCAAGTCGGATTAGCTAGTTGGCGGGGTAACGGCCCACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGACGATCAGCCACACTGGAACTGAGACACGGGCCAGACGCATACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGAAACCCTGATCCAGCGACGCCGCGTGGGTGAAGAAGGCCTGCGGGTTGTAAAGCCCTTTCGGTAGGGACGAAAGCTCTCGACCTAACACGTCGGGAGGTTGACTTAACCTACAAAAGAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAAGAC\n>URS000258AA4F rRNA from 1 species \nATGGCCGCTCGTGTTAGCGGGCTCGCGGTGGGCTTCCTCTGCCTGCTTGCAATGTTGTCGCCGTCCGCGCAGCAATCCCCGCCCCCAGACTCCCCAGATTTAAAGTCGTCAATAGACACAGACACCCCACCTCTCCCTGACATACGCCCGCCCCCGAGCTCCCCGCGCGGCTACGAGTTGGACGTGCCCCCCAGGAACGTCACGTGCAAGGATACCGACGGTAAGCGGCCGGGGTGCACGGGAACTTGCCCTCGCCGCTGCCCCCAGTGCATCGTCCTCTGCCCCGACTGCAAGACATTATGCCATGACGAGGTACAGATGCCAAGGCCCGTGCCGCCACCTGCCATGTTGGTGTTCGGAGATGGGCAGTTCGACAACGGTAACAACGGATACTTGGAGCCCCCTAACTACCCCTACTCTGGCACCGGCAGGCTTAGCAACGGGGCCAACCTTGCCGATGCCATTGCATACACTATCGGATTCCCGCAAAGTCCTCTACCCTTCATGTCGTTGCGCGGCCGGATCAGCATGTGGGGCGCCAACTACGCTTCCGTGGGCGCTGGGATTCGGAACTCCACGAACGGAGAGCGGAGCATCCCTCTTTCGCAGCAGCTGGAGGACTTCAGGACGACGAGGGCCCTTATGGGGATAATGCTAGGGGGTGAAGCCAAGCTGCGCGCGTACCTGTCCAAGTCCATCTTCCTCCTCGGCATCGGCAGTCAGGACCTCGACCCAAGATGGAACATACACCTCGCAAATTCGACCGAGATCCAGAGCCTCGTTGCCCTATACGGGGAGGCCGTCACGTCCCTCTACGACATGGGCGCTAGGAAGCTGGCCATCGTCAACGTTGGGCTCATCGGCTGTGCGCCCCAGATCTTTGACTACAGGTACGGTTGCGACGAGAGCCTGAACGACCGCGCCGCCGCGTTCAACGCCGCCCTCAAGCCCCTCATGGCTGGCCTTGCGTCAAAGAAGAAGGGCCTTTTCTACTCCATCGGCGACTTTCATAGCTTCACCACCACCGTCTTCGCCGACCCGTCAGCTTATTGGATGGTGAACATCCGGGACTCGTGTAGCTTCACGGACCACCCAGAGAGGACGTGCTCTCCCCAGGAAGAGCACTGGTTCTGGGATTCAGAGTTCATGACGGATCAGGCATGTAGGCTGACGGCCACTGCATTTTACTATGGACCGCCTCAGTTTACCGCCCCCATGACCTTCAAGGCACTGCTGGAGAAATAA\n>URS0001D7E6BA misc_RNA from 1 species 
\nGATGAAGAACGCAGCGAAATGCGATAAGTAGTGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCCTTGGTATCCCGAGGGGCATGCCTGTTCGAGCGTCATTTCAACCATCAAGCCCCAGCGCTTGTGTTGGGGGCCTGCGGCTGCCGCAGCCCCCTAAAAGCAGTGGCGGGCTCGCTATCACACCGAGTGCAGTAGTTCATCTTCTCTCCGGTCTTGTGAGGCGGGTTCCGGCCGTGAAACACCCCACTACATTCAAGGTTGACCTCGGATCAGGTAGGAATACCCGCTGAACTTAAGCATATCAATAAGCGGAGGA\n>URS0002341CEB lncRNA from 1 species \nGGCAACGTGTTCCGGTCCTCTTCCACATCACGGAAGATTTGCTCTTTCCTCTTTGCGATGAATCTTGCTGCTGGTCACCCTTTGGGTCCACACAGCATTTATGAGCTGTAACTTTCAGTGCGAAGGTCTGCAGCTTCATTCCTGAAGCCAGCGAGACCACAAACCCACCGGGAGGAAAGAACAGCTCCAGGCGCGCCGCCTTAAGCGCTGTAGCACTCACCGCGAAGGTCTGCAGCTTCACTCCTGAGCCAGCGAGACGACGAACCCACCGGGAGGAACGAACAACTCCAGGCGCGCCGCCTTAAGAGCTGTAACACTCACTGCGAAGGTCCGCAGCTTCACTCCTGAGCCAGCGAGACCACGAACCCACCAGACGGAAGAAACTCTGAACACATCCAAACATCAGAAGGAACAAACTCCGGACACGCCTCCTTTAAGAACTGGAAAGACTCACCGCGAGGGTCCGTGGCTTCATTCTTGAAGTCAGTGAGACCAGGAACCCACCAATTCCGGACGCACTTCCTCCGGACTGTTGGTGCACTGAGTGATCTGAAGTGCTCCCTGGCCACCATGAATGTAAGCAGAGATGGTGTCTCACTTTGTTGTGCAGGCTGGAATGCAGTGGCACAATCATAGCTCACTGCCGCCTCGAACCCTTGGACTCAAGCAATCCTCCTGCCTCAGCCTCCCAAAGTACTGGGATTACAGGTATGA\n>URS0000160626 rRNA from 1 species \nTCTAACACATGACACGTCGAACGGTAACAGGAATTAGCTTGCTAATTTGCTGACGAGTGGCGGACGGGTGAGTAATGCTTGGGAATTTGCCTTTGCGAGGGGGATAACAGTTGGAAACGACTGCTAATACCGCATGATGTCTACGGACCAAAGGGGGCTTTTAGCTCTCGCGCAAAGAGAAGCCCAAGTGAGATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCGACGATCTCTAGCTGTTCTGAGAGGAAGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGTTGTGAGGAAAGGTTGGTAGTTAATACCTGCCAGCTGTGACGTTAACAACAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTCAAGCGAGATGTGAAAGCCCCGGGCTTAACCTGGGAATTGCATTTCGAACTGGCAGGCTAGAGTCTTGGAGAGGGGAGTGGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAACATCAGTGGCGAAGGCGACTCCCTGGCCAAGACTGACGCTCATGTGCGAAAGTGTGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCCCACCGTAAACGCTGTCTACTAGCTGTGTGTGC\n>URS000188CCB0 rRNA from 1 species 
\nTACGAAGGGGGCTAGCGTTGCTCGGAATCACTGGGCGTAAAGGGTGCGTAGGCGGGTCTTTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGAAGATCTTGAGTTCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGATACTGACGCTGAGGCACGAAAGCGTGGGGAGCAAACAGGATTAGATGACCTTGTA\n>URS00019B19CC lncRNA from 1 species \nGTCAGTATGAGCATGGAACTTGCTTTAGCCAGTGAAATGTGAACCGTGTACCCTGTACCACTCTCAGGAGGAAGATTTGCAAGCCACTAAGTGGACCTGCCTGACCCCTCCCTTGATGAAGTTACCTTTGCCCCACGTTCTAATCAACCTATACCCCGTAGGCCATCCTTACACTTCTGCTGGGGGTCTGGGTGGACCCCAGGTCAGACAACAATTCATGCTAAGCTGCTTATGAACAGCAGACCACCTGCTGCAGAATCAGGCAGGACATGTGTAGCCTATTTCCATCAAACCTTCTGAAATGGAAACCCCAGGAGTAGAGTCCAGCATCCAGGCCCACAGGATTCCCAGACATACTCAGGTATAAAAATGCCACTGAGTCCTCTGTTAATTATTGACTCCAAAACATTTCTTTGCAGAAGATGATGTTTTCTAAGACAGTGATCTGATTTTAAATTACCAAGACACTGAGTCCTTATTTTATATTCTTTTTCATCTTTACACAAATTTTCTTAAATTAATGCTCTTTAAAATAAGCTCATTTAAAAAAAATGGTGATAAATCTCCAGGTTCTACAGATGGAAAGACTGAAAATAAGACACAGGTATCAAAAACAGAATAAGTGGATCTAATGCAGGGATGTCAGGTGTGCCTCTGGGCCCTCATCCATTCCAAATCCCACTCCACACCTACCTGTCCATTCTCAGATTAAAGAACAGAATGCCCAGACTGCAAAGAAATTAACATGCCCCTTCGTTTTTATTAGCTTTTATTTTAGGCTCATTATCCATACCTCTGTGCATCCCTATTCTGTGTCTGCACTCATTTAGAAGCCAAATACCAGTAGGCCAATCAGCACATT\n>URS00021FE078 rRNA from 1 species 
\nGCAGCCCCCTGGGCCAATACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCAACTAGTTGTTGGGGATTCATTTCCTTAGTAACGTAGCTAACGCGTGAAGTTGACCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGATGATGTGGATTAATTCGATGCAACGCGAAAAACCTTACCTACCCTTGACATGGTCGGAATCCTGCTGAGAGGCGGGAGTGCTCGAAAGAGAACCGGCGCACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCCTTAGTTGCTACGCAAGAGCACTCTAAGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGGGTAGGGCTTCACACGTCATACAATGGTCGGAACAGAGGGTTGCCAACCCGCGAGGGGGAGCTAATCCCAGAAAACCGATCGTAGTCCGGATTGCACTCTGCAACTCGAGTGCATGAAGCTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTTTACCAGAAGTGGCTAGTCTAACCCGCAATGAGGACGGTCACCACGGTAGGATTCATGACTGGGGTGAAGTCGTACAGGGTTAGCCCGTAATG\n>URS0000794101 rRNA from 1 species \nCTGATAATTGGAATGAGAACAATCTAAATCCCTTAACGAGGATCCATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGCAGGAGCGACCGGTCACACACTCTGTGTGTGAACTTGTGTTGTCTCTGGCCATCCTTGGGGAGATCCTGTTTGGCATTAAGTTGTCGGGCAGGGGACATCCATCGTTTACTGTGAAAAAATTAGAGTGTTTAAAGCAGGCTTATGCCGTTGAATATATTAGCATGGAATAATAAGATAGGACCTTTGTTCTATTTTGTTGGTTTTTAGAATTGAGGTAATGATTAATAGGGATAGTTGGGGGCATTCGTATTTAACTGTCAGAGGTGAAATTCTTGGATTTGTTAAAGACGGACTACTGCGAAAGCATTTGCCATGGATGTTTTCATTGATCAAGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCCTAGTCTTAACCATAAACCATGCCGACTAGAGATTGGAGGTCG\n>URS0000E403FD rRNA from 1 species \nTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGCGATGAAGGCCTTCGGGTCGTAAAGCTCTGTTGTTAGGGAAGAACAAGTGCTAGTTAAATAAGCTGGCACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCCCGGCTCAACCGGGGAGGGTCATTGGAAACTGGGAAACTTGAGTGCAGAAGAGGAAAGTGGAATTCCAAGTGTAGCGGTGAAATGCGTAGAGATTTGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCCCGTAGTCC\n>URS00003FB220 rRNA from 2 species 
\nTTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGCAGAACCTTACCAGCCCTTGACATACCGGTCGCGGACACAGAGATGTGTCTTTCAGTTCGGCTGGACCGGATACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGCCTTTAGTTGCCATCATTTAGTTGGGCACTCTAAAGGGACTGCCAGTGATAAGCTGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTACGGGCTGGGCTACACACGTGCTACAATGGTGGTGACAGTGGGCAGCAAGCACGCGAGTGTGAGCTAATCTCCAAAAGCCATCTCAGTTCGGATTGCACTCTGCAACTCGAGTGCATGAAGTTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTTGGTTCTGCCCGAAGGCACTGTGCTAACCGTAAGGAGG\n>URS0000583501 sRNA from 1 species \nTCAAAGTGATCTCCCGCAGGCGGACTGCCA\n>URS0001BC1447 sRNA from 18 species \nCCGCGCCCGCUGCUUGAGGGUCAAGGCCCUCUUGCCUGUGCGCAAAAUCUGGUCGAGCCGCUGACUUCUGGGUCACCGCCAUGCGCACAACAGAUACCGCCGGUCUAAAGCGUCCGCGUAGGUCUCGCGCAGUUUCCGAACUGAUCGGCAAUGCCUUCGGUUUGGCGAUGUAGAUAGCUCGACAGGUCG\n>URS00018C39BD rRNA from 1 species \nTACGGAGGGTGCAAGCGTTATCCGGATTCACTGGGTTTAAAGGGTGCGTAGGCGGATAGGTAAGTCCGTGGTGAAATCCTGCAGCTTAACTGCAGAACTGCCATGGATACTATCTATCTTGAATGTCGTGGAGGTTAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGAGATGATATAGAACACCCATTGCGAAGGCAGCTAACTACGCGATAATTGACGCTGATGCACGAAAGCGTGGGGATCAAACAGG\n>URS0001C413C7 rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACGGACGAGAAGCTTGCTTCTCTGATGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATTTTGAACCGCATGGTTCAATAGTGAAAGACGGTCTTGCTGTCACTTATAGATGGATCCGCGCTGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCATAGCCGACCTGAGAGGGTGATCCGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTGGGGAAGAACAAATGTGTAAGTAACTGTGCACATCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTG\n>URS00023022DC rRNA from 1 species 
\nTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTATGGTTGTAAAGCACTTTAAGCGAGGAGGAGGCTACTTTAGTTAATACCTAGAGATAGTGGACGTTACTCGCAGAATAAGCACCGGCTACTCTGTGCCAGCAGCCGCGGTAATACAGAGGGTGCAAGCGTTAATCGGATTTACTGGGCGTAAAGCGCGCGTAGGCGGCTAATTAAGTCAAATGTGAAATCCCCGAGCTTAACTTGGGAATTGCATTCGATACTGGTTAGCTAGAGTGTGGGAGAGGATGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGATGGCGAAGGCAGCCATCTGGCCTAACACTGACGCTGAGGTGCGAAAGCATGGGGAGCAAACAGG\n>URS00003F74AF piRNA from 1 species \nTCTGACCTTCACACCTACACCGT\n>URS000219B0C7 rRNA from 1 species \nTGGTGGGTAGTTTGACTGGGGCGGTCTCCTCCTAAAGAGTAACGGAGGAGCACGAAGGTTGGCTAATCCTGGTCGGACATCAGGAGGTTAGTGCAATGGCATAAGCCAGCTTGACTGCGAGCGTGACGGCGCGAGCAGGTGCGAAAGCAGGTCATAGTGATCCGGTGGTTCTGAATGGAAGGGCCATCGCTCAACGGATAAAAGGTACTCCGGGGATAACAGGCTGATACCGCCCAAGAGTTCATATCGACGGCGGTGTTTGGCACCTCGATGTCGGCTCATCACATCCTGGGGCTGAAGTAGGTCCCAAGGGTATGGCTGTTCGCCATTTAAAGTGGTACGCGAGCTGGGTTTAGAACGTCGTGAGACAGTTCGGTCCCTATCTGCCGTGGGCGCTGGAGAACTGAGGGGGGCTGCTCCTAGTACGAGAGGACCGGAGTAGACGCATCACTGGTGTTCGGGTTGTCATGCCAATGGCACTGCCCGGTAGCTAAATGCGGAAGAGATAAGTGCTGAAAGCATCTAAGCACGAAACTTGCCCCGAGATGAGTTCT\n>URS0000670AD8 snoRNA from 2 species \nCCTGCTCCTGGAAGTGTTGCTGGTGTGGCTGCTGTGCCACATGTTCGCCAGTAGGTGGCAGATAGGAGAGAGGCTGTGTTTATGCTCAGTGTTCTGAACTGTGAACTGTGAATGATTCGTAGCCTAACAAT\n>URS0000C73CE8 ncRNA from 1 species \nGTGTCCGAGGAGCGTTGCAAGGCCGGTCGATTCAGGCGACCGCCCCAGGCTCGGACCCCTTCCCACAGGCAACGGCGCTCACCCGTC\n>URS00002A852C rRNA from 1 species \nAGGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGGAAAGGCCCTTCGGGGTACTCGAGCGGCGAACGGGTGAGTAACACGTGAGCAACCTGCCCTTAGCTCCGGGATAGCTCCGGGAAACCGGAATTAATACCGGATATGACCTAGGCCGACATCGGCTGTGGGTGGAAAGTTTTTCGGCTGGGGATGGACTCGCGGCCTATCAGCTTGTTGGTGGGGTAATGGCCTACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGCGACCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCGACGCCGCGTGGGGGATGAAGGCCTTCGGGTTCGTAAACCCCTTTCAGCAGGGACGAAGCGAAAGTGACGGTACCTGCAGAAGAAGCGCCGGCTAACTACGTGCCAGCAGCCGC\n>URS0002550A56 misc_RNA from 1 species 
\nTCCGGTTTAGCACCGGCAGTCTCCCTAGAGTTCCCGGCTTTACCCGCTGGCAACTAAGGACAAGGGTTGCGCTCGTTGCGCCACTTAAGGCAACACCTCACGGCACGAGCTGACGACAGCCATGCACCACCTGTGCAGGCTCCGTAGAGCGCCGGCTTTCACCGGCTTTTCCCACCATGTCAAACCCAGGTAAGGTTCTTCGCGTTGCGTCGAATTAAACCACATGCTCCGCTGCTTGTGCGGGCCCCCGTCAATTCCTTTGAGTTTTAGCCTTGCGGCCGTACTCCCCACGCCGTAAACGATGGGCACTTATCGCGTTAGCTACGGCACGGAAGGGGTCAATACCTCCCACACCTAGTGCCCAACGTTTATAGCGTGGACTAC\n>URS00023AAB80 lncRNA from 1 species \nTTTTTTTTTTTTTTTTTGCAGCGCCCCGTGGTGCACCTATTCCTGCTCCAGGTATAGATATATTCATAAATCCTTTGAAAATATAAACCATCAATACAAACTGAATTCTATTTGCTTATTAGTTTATTTATTCGTTTGACAGGTCCAGTCTCTCTAGCACCCAAACTCTCCCCTGGAGCTTCACCATCTTTAAGCCCCCAAAGTCCCATTGTGCCGGAACCGACACCATCTGCCGAGGTGCCTGATTCCGGCACCACACCGGCTCTAACTCCACCATCGTCCACAGCAGGTTCGGGAGCCCCGACGGCCGCAACGGGGAGCCGCCCTGTTCTCACCCCATCAGCTGCCAACCCCGCTTACAGTTTCTCACCATTCCTTTTGGTGTTCACATTGGGATTTGTGATTTTCAAGTACTAATTATATAATATGTATTGATTGATTTGTTTGGCGAGCGGTATTCTTTTAGTGGCTTGAACTGAAAACCATTGTTTTGCCTTTTAAGAGCTAATATTGGGTGACTTTACATTTTATATAAAATATACATATTAGTGTAATTTTTATTTATTGAGTAATAATTTTTTTTTATTTCTGCAATGATTATTTTTTAGGGTAAACTACACATATAGTCACTTTTGTTTACTTTAGGTTACATTTTGGTTACTTATGTTTAAAATATTACGTTTTAGTCACTTACGTTATCGTGTTGTAACATTTTAATCACTGAGCCGTTAATTTCCGTTAACGGTGTGACGGTAAGCTGACGTGGCACGTTAAATCATCATTTCAAACAAAAATTTTAGGTTAAATTATACAACTGATCCCCATATTTTTTTTGGGCAATTTAATTTTTTTCTTTTATATTCTTTAAACCTTACTCTCTCTTTTTCTCTTTATTTTCCATTATCTTCTGTTTCTCCTTCTATTTTCCTACCTTTTCCATGTCTTTTAACATATTAAGAAGTCGAATTGGCAGTGAAGAAAGAAGTAGGAAGCCGAAAGCCATCATTGCCTATAATCAAAACCCATAAACCCGTACCATGATTCTTTCTTCACTGCCAATTTGACTTCCTGATATGTTAAAAGAAATGGAGAAGGTAGGAAAACAGAGGGGGAAGCAGAAGAAAATGGAAAATAAAGAAAAAAAGAAAGTTAAAAGAACATAAAAGAAAAACTTAAATTGCTCAAAATGACAAAAATATGGGGACCAATTGTATAATTTAACCTAAAATTTTTGTTTGAGATGATAATTTAACGTGTCACGTCAGCTTACCGTTACAATGTCAATGGCAATTAATGGCTCAATGACTAAAATGTTACAACATGAAAACGTAAGTGACAAAAATGTAACATTTCAAACATAAGTGACTAAAATGTAACCTGAGATAAACAAAAGTGACCATAGATATAGTTTACCCTATTTTTTATTGGTTAATTTGATGTGAAAAATGGGAAAAGATCATAAATTATTGGTACATTACTGATCTTCTATTATTAGCAAATTAAGTTGTTTATTAATTCCATTTGAGTAATTCTCAAGGAATTCAATATGAGATCCCAGAGGTTTTTTTTTTAT
CATGTTATTTTTAAGTTTTTTAGAATCAAGATTAAATAGATAGAATGCATAAATTTAAGGGTTAAATTTGTTGAATTTTTAGAATTAGGACCAATTTGATAGAATTTGTAAACATTGTAGGGTTAAATTTGTTGATTTTTTTAGAATTAAGACCAAATTGATAGAATCTGTAATTATTGTAGAGCTAAATTTGTTATTATGTAAATAAAATAGATCACGTCAGCATCCAAATAATAATTTAACAAAGGAGTGATCAAAATATTAAATGTCAATAATGTTAATGACTAAATCTGAAATTTTTGGAGATGGGTGACCAAAACATAAATATGCTAATAGTTGGGTGATTGCGAGTGTGGTTTACCCTAAGATTAACAGTAATAAGAGGATCAGATTGTGATAAATTAAAGTATAGAGACTAAATATCCAAATTGAGTATACAATAAGGATGTAACCGCAATTTAACCTAATTAACTAAAATGATTTATTAGGCCCCTCACTAACGGCCATTCCCGCCATATTCATTTCCAATTTACTTAAATACCCTCTCCCTAACAGATTTTTAACTACCATAATCAACCGTCTCTCACTTCCTCTCACCGCCATGGCAGCGAACATCTTCATATTGCTCCTCCTTGGTGTGGCGGCGCAGCCACTTCCACCAGCACCCCAGCAACCAGGCTGCGTGGAGGAGCTGGTGGCGTTTTCGCCTTGCCTGCCCTTTGTATCAGACCCACCAAACAACGCCACAGACTCAGTTGCTCCACAGTGCTGCGACGTCTTCAATTCTGCTTTCGAATCCGGCGACGGTTACTGTTTCTGTTACATCCTCCGGCAGCCGCGGATCTTTGGGTTTCCGTTGAACAGAGAAAGGGTTGCTTCACTGTCTTCCTTTTGCATGGCCAAGAACGGCGTTGCTTCTCTAGACTCGCTCTGCTCTTCAGGTTTTTCATCTTTTCTTAAACCCAATTGTTTAATTCACGGATTTCCGGATTAAGAATTTCATCAGGTTCAAGGCCATTTTAATCTTTTGATTAAAAGAAAAAATAGTTATTTAACGCTTTGATTGATGTAATTATGCAATTCTTAATTAGTATTATGCATTAGGTGCACCAGCGCTGCCGCCATTGCCAAGCACCACAGATTCAGGGATATTGAAACCATTCAATTCTCGTAAGTAAAGTCCGAATATCTTTTCTTTTTTATTTTTTCTCCTTTCGGAACCGAATCGGCGGTCAAACCTTACTACCTTAGTAGTTCTCGATCAGACTAATTCAATGATCAGACTGGTTTTAATTAAATAAATCATTTAAAAATTTATAAAATTTTTGAAAAGTAAAATATATTAAAAAAGTATAAAACTTGGTTCAACCGGTTTGCAGGTCAGTCAGTTCTTTCCCTTACTCTAGACTAGTGTACCAGCTGGTTCCCGTCCAACCGGCCAACCTTGCATTTTGTTCTTCCATGGCTGTAATAAAAGATTACCTAAAAGGAAATGTTCATTTGCAGCGTTCTTGCTTGTAGATTGACCAAATATAAGCCTAAATTATTTGTTTTAAAGATAGACCGGATTTTAAAACTCGTAAAAGGCCGATACCAAAAGCATATCAAGGCAATGGCATTATCAGTGATCTGTTATTGGTGGTAGAATCCTTATGAAAACTATTCTACAGGTTTAGATAATGATTCAACAAGCTCACCCCCAGAATCTGCGGTCAAGTCGCTAACTCCGCCAAGTTCCTCAGCAGAAGAAGCTGTTTTTTCTTCTGCAACAAACCAGATTTACAAGCATATCACTTGGTTCCTACTTGGAATGGTGATTTTTCTGCTTAATCTACATTCATTCTTGGTCTGACAGTAGCTAAGATTTTCCCGATTTCATTCGATTATACTTACTGATACGATAAACACTTTGTAATCAGCAAAATGATATGATGGAAAGAGTTTTATTAGCAGAAAAACATCATCAAAAACAGATGGTAACAGTGTACGAAGATCTCTCC
TCTTTTCGTTTGCTTTTACCACTATGCCGTCGTACTGTCTCTTGAAGTGAACAGGTAAGTTCATCACATTCGCTACTGTGAAAACAAAAGCATAAAAAAGCAAAAGAATCATTGTAGGATGCGTGTATTTCATTTCCACCCATCGGACCACTCAGCTTCATCCGTGAAAGGAATGAGATTTCCAATTTCCTTGGTATCTTCACCCCACATTTCAGCAATGCTGTTTTCATCATCGACCCGACAATCCTCCGGAGTTGAAACTTCTGCATCATCTTCATACTCTTGCCTTTCAGGCAGAGCACAACCCAGGTAAGAGTTATGATCGGCACAACGCCATATAAGCTGACTCCAGTAAGGGTCCTGCCATTCATTTATTATCAATGATTAAAAGCCTTTGGTTGTAGACATTAGATGATAATCACAAGTGAAGATTGGTACCTTGGAAATTATGTGAGGATTTCCAACAATAACAAGTAAAGCTATGGCGCGAGTAACCGCCACATTAAACCTTCTAGGATTGCTCAAAAACCCGAGACAGTGGGTTCTGTCGAACTCATTGTGTTTGATTGTTGATCGGACGGTAGATATAACGATAACTTTTCGTTCTTGGCCTTGAAATTGTTCGACGGTGCCAACCTTGACATCTGGTATGTCGAGATTCTCGAAGGCCTTCATTAGTTTAAGGACTTGCTGCCTATAGGGGGTTATCACCCCGATATCTTTCTCGTTCAGAATCCCACTTGCTGTCAAACTACTAACAATTTCTACAACCTTGCTGGCTTCAATCCGATTGAACCATGACGGATTACTTCCTTCCCTCTCATCACAACCTTGTATACCAAAGAAAAAAACAGGGTAGTCCTTATTAGGAAGAAACTTTACTGAGTTCAATAATGAACCTATGTCATCTTTGCAAGGGATCAATTCATCATTGTAGAAGAGAAGTGAAGGGAGATAGAGGATCTCCGGGTGACATCGATAGTTTCTAACCAGTTTTGTCACATAGTTTTCATTGCCATTAGAATAAAACTCGTGTTCAAACAACCTTTCTAAGTATGACTTCCCCAGTCCAAAATTCTCGGCTTCTTTGGAGTATATAACTGGACCTAACTGCTTTGGATCCCCAGCAAGAACAACAACAGTCTCTCTTCGGCAAAGGTTCGCTACAGGGATCATGCTTTCTGGCTCTGAAGCTTGACCTGACTCATCCAAGAAAATATGAGAGAAATGGCCTTTACCAACACTTTCTGCATACAGAAGGGAGGAACTCATGTAAGTTGAGATGATGATTCTGTAGCAGGCGAGAACACTAAGTGGAGGACATTTGAAAACAAGCTCATCAAAGAAGCAAAACCGGAGAAAATCCGGGTTGACGTCGTAATATGGTCGTGTAGCTGCATTTAGTCTGAATATTTCATTCTCTTTAATCTCAACAGACTCCTCATTAAGGAGTCTCTCTAGTATGAAATCAGCCGCGCTATTTGAAGGTGCACACACAAGAATTCGAGAAGATTTTTGGGTTGAGTAGAGCTGGAGGATTGCCTCCACTATTGTCATGGTCTTCCCTGTACCTGGTGGCCCAAAAATCACATAAGGAGGTCCTCCTTTGCAGCCAAGGATCATCTCAATTGAACACATCTGCTCCTCGTTAAGTGTACAACATATGGGCACTAGTGGAGTGGTTTCAATCACCCTACTTTTGGGTGACCCAGATGGAAAAAGGAGACTTACATTTAGGCTTTTTGCTGCATCAATGGCCTGGTATTGCCTCCGCATATTGATTCGGTTATAGGTGAACTGCACATTATAAAGATTCTCATCTATGTGATTCGAGTGAAATTCTGGTGCAAACTTCAAGTACACTTCATCAGCTTCTACCCGATGGATACAACCCTGAAAATCACCACATTCACTTGTCAGAAAGACAGAAATTCTCCAAAAGAAATAGAGGCCATGGGACTGGAAAGACTAAAATGAACACAAGGGAAAGAGTATACAAC
AGAAGATACCGAGATAAATTTAAGCCAAAGAGGAAGTACTTCAATGATAAAAGGATAAAGCATATAGTATTTTTCGTGTAAAGCAGACCTCATAAACTCTGTCTGATCCACTAGCATCTTCACATGCAAGTTTAGCAAAAATATGATCTCCATGGACAAGGGAAGGCCTTTTTTCAGCGAGCCCAGGGACCTGAAGTGATAAATAATTCCCTCTCTTCCTCATGTTGATATTCTCCATGTTATAGGCCCTCATGTCCTCCTGAAGCCAAAAAAAGGGAATTTCTCAGTTTTGTAACACGAATATCAACCATCTAAGCTACCGAAGGTTAGAATTACCTCGAGTTGTAACTCTTCCAAGATTAAGAGATGTTTGAAGTAAGATACATAATTATCCCTTGTAAGACCTGCTTTAATAGCATCAGTAGTCTGCTTATTCTCAACCAGTTCTCTAATATCCTTCGGAATGTCATATGGGAGAAGCCTGTTTCGAACACCTCGACCCATTGCCCTTACCGGGCGTGGCCCTGTAACAAATTCATCCACTGGAAATTGCTTCTTTCTTTGAGCTCTGGAATATGGCTTCTTAGAAGCCAAAGATTGTGAGATCTTATCTTCAACCAAGAGAAAGACCATTCTTTCCAATCTTTCACCCTCCACATCAAAATGCACTATGGTAGTATGCAACCCAATTTCCTTTGCTTTGCAAGACAACCAAATGGTTAAAGTCTCTCCAGGCTGTATCATTCGGTCCTCTAAATCGAAAAGCTCGACAAACCCTTGGCTCATATCGTCTTCAGAATTTGCCGATGGGGGTTTCATCAAAGAAAGAACGAAAGAATCCTTAGGCGTTGATGCGTAAATTTTAGTCCACAACTCAACCGGTTCACTAGTGGTGTTTTCGATACTGATCAAATCAAATGCAGTTGCTCCCACGAATACAGATTGAGGATTCCCTTTCGAAAATGGGAATGGTGCAGAAATTATGAGAGGACCCCCCTCATGATTGTAATCACAAACAGATTTGTTGTTTGCATAATCGATGAAATTGATTTCGCGTTTGTCCCCGATGACCGAATACTCATCATCGGATTTGTCACCAACTGTTCCCATCACTAACTAGAAAGGGAAGAACTGCTTTGCAACAAAATCCACAAATATGCAATCATTAAAAAACCCTTATACAAGCAGGAACACACTTGTAAGATACAGTACACCACCATATATATATACCGATAAAATAACACTTTTAAACACGATTATGACGCAACAAAATACACGAAATTAACACGAATGCATAAATAAAGCAGGATGATAATCAAGTTTAAGCATTTTCAAATGTCATAAAAAAAAAGAGAAAAAGAAACCCAGCATTTCAATTTTTGCAATGCAACATAATACAATCATAGATAGATAGATAGTACAATACGTGAATCATAGGCAATAACGATCATTTAAAATTCATGATCAAAAGCAAAAACAAGGTCACAAAGCAGAAATTAACAAAACCCAGAAACAAGATAGTGACAATGTAGAAAAAATTAGAAAAAAATATTATTCAAATTCACTGTGCCAAAATTATAAACATTTAGAGTACGTTAGCATGAACTACTCTATGGGTAAAAAAAAAAAAAAGGAAAAAGAACTCACCTCAGTGAATCATAAACCAAAGCTAGAAACTACCATATGAATGAGAGGTTTTCCTTTTTTTTAAATGCAGAGAAATCAAATGAACCTTGAATTCAGTTTTTTAAAGTTTTTTAATTAAAATCAAATGAAAGAGACAATTTTTAAAGAAAATAAAAATAATATGACCCATCACAATCAGCAGATTTTGCCCTACAAGCTGCAAATAAAAAAAAAAACACATAGGTTCATATATTTCATTTTTTTGGCAAAAACAGGGAATTCATAAACAGACGAGGAAGTTAGTTTCACTTATCTATCACTTAAAATAAAGTATAAAAAATGTAAATTTTAATTAAAAATGGTATAAACAATTT
AGATATTAAAGGTTTAATTTTTCTTTCAATCCCTCTAGTTTTTAGTTTTTTTTAATTTAATCCCTTTATTTATTGGATTTAAATTAACTTCAACAAAAATAAATTAAAGTTGTTATTAATTTAATTTTAATTTTTAAATCAAATAAGATACTAAAAAGAGAATGATTAAATTTTAAAAATATTGATAATGGGGAAATTGAGAGTACAATTAGAATTAGGGGTGAGAGTTCGATCGAATCAAGTGAAAAAATTTTGAGTTAATCAAGTTCACAAGTCCTATTTTATCATCTTAACTCAATTTAAATTTTTTCAAATATAGTCAAATTGAGTGAAATTATTCAAGTTAAATTAAAAAAATTAAACATGTTAAATAAAAATATTGTTACAGAATGACTAATTTTATGTTAGAGCATATAAATTTGAAACCATATATATTTGAAATAATTTTCAAAGCAAAATAATAATAATAATAAGATACTTGAGTATGATAAATTTGAATCATTAATTAGGTCTCTAAAATTATTATTTTATAAAATTTTTAGAATTTTTTAAAACTTTTATAATTTTTTAAAAAATATAAAATTTGAAATTTTTATAAATATTTTGAATTATTTTGTAATTTTTGTTGAGAGAAAAGCCAATTTATTTATTTCCAAAGTTGATAGGGACTAAAAGGTATTTACACCATTATTCGAATTGTGAAATTCAACTAACTTGAACTCAAAATTTGAATCGAGTTATTCGTGTTAATGCAAATCATTTAAAATTCAAAATTAACTCGATTCAATTAATTTGAAATTTAAAATTCTTTTCGATATTTTTAAATACCCTGATTCAAACTATTAAAAAGGAACTCATAAATATAGTTGAAAAAATTTACAGAGAAAATTTCTTCTTACATATTTTTATTTATTCTTACTAATAAATCCCATTGGCTTATATGACTCTTTTAGCCAATTGGCTTTCTCAGTGATAGAGACAGTTAATTTCCATTTTGATGAATGTATTAACTAATAATTAGAACTGACGTGGCTAAACCCTATTGGTTATTATGACACTCACCAATTGGCTTGTGAAGGGGTCCAAAAAATTTTCTATTTTTTAGTAATGAAATTAAAATAAAATGAGTTTTAAATTTTCTTTGATTTTTAATTGTATCTATTTTTTTGTAGGGGAAATTTATAGGAGTTTCTCTCCTAGTTTTTTTTAATAAATAAATTTTCTTTTTAATTTTGTTCTTTCATGAAATTGAAATCTTTTTAAAAACCGAATTCATCCAATCCGCTCCTATTCCTGTTGTGATCTTAACATAAATAGTGAGACAAATAACATGCCAAAGCTTCTCTACCTTTATGCAATAATCCTTTGTCTACCAAGTCCGGGGCGTAGTTAGGGGCTTCCCTCCTTTAAATTTTTTTAAATTTTAAATTAGTAAAGATAAAATTATATTTTAATCCTCTAAAATTGATAAAAATTTTTATTTAATTCTTTAAAAATTATAAAGATATAGGTTGTGAAATTATATTTTTACTATTATAAAAATTACAATTTAATTTTGACCCTCCCTAAAATAATTTTCTGGCTTCGTTCCTGACCAAGACCCTTATAAGATTCCAATTATCAAAAATTAAATTTCAGCCCCTCAAAAACTCGGTACTTTATTATTGGATTCAGATATGAAATATGCATATATTATTCTACTAGCTAAGATATATCAAAGCAAGTTAAAAAGGAATAAATCTTAAAAAATACATACCAGAATGAGGGAGCTATATAACCTTTCAGGGAGATCCTTGGAAGAGATGATCTTCAAATATACAAAAAAAAGGGTTGTTTTTTTCTTTTTCTTTTAACACCTGGGTAATTAGCATAGAAGTTTAATATATGTAAGTGATATTTTCGAGCGCGTGAAAATAATCAATTTATATAGAAAGCGAGAAACTTAATTTGGTATGTCCAGTAAGTAACCAAAAGTAATATAAATGAATAAATTTAGAATA
TTGGGATATTTTTATAATTAAAATATAAATTTAAATGATTTTAAATATGGGTTGTTGAAGCCTCCTCATTTTAAAATATTAATAAAATTATTTGTATATGTAATATATAACTGTAAAAATTATATTATATTGATAATAATGTTATTAATAATTTGTAAAAAAATTTGAATCTAATTATTTTAAACTTTAAATTTTTTTTATGTGAATCTATAATTTCAAAATAACAATTGAATAATCTATTTTATCTAATTTAATAAATAAAAATGTGTGACAATCCTTTTCTTTTACCAATAAATTAATAGAACTCAAATATAAAAAATATGCTACTAAGAGATTAGAAACATAATTCAAAGATCTTTTGCTCTCCATAAAAAATTTCCATCTCAAAATACATTGGTTAAGATGTGGCAGCCACAAATTGCTGTACTCTTTTGAAAGTTTAAATGTTAACTTCTTTATTTTTATTTTGAACAACTTTTATTTAAAAATAATAATTTTTCTATTTTTCAAATTTTAAAGTTCAAGTCTAACCATTAATATTAATATTTTTAAAATTCAAATTAATTATATCTTTTTTTTTAAATTATATGGCTATCAAGTAAGTTTTTTTTTATTTCATAATATCACACTAACAAATTTTAAAAAAAAAGTTAAACAATATTTAATAGTAGAATTTGAATTGTGAAATCTGAAAGGTAAAAAAACTAAATTCCTGAAAAAATACAAAGCTTAAATTTCAATTTTTTGAGAAGTATAGAGACTAATGGCATACTTTAATCAAATACAGTATCCCTACATCCCCAGATTTCGAACACCATCACAGCAACAACTTAGTTTTTAATATAAAAGGTTTGGCTGCTCAAGTCAAACATACTGTTTCCTGTCGTTAAAATGCAAATTAAAACATTCATTATGAAAGAGCAATCAAGGATAAAAATCTTTCAAGCTGAAGCAACTGCAGCATCCTTGACCGATTCACGCCAGGCATACTGCCTCGCTCCATCTTTGTCGACGATCTTGATAACAAAGTTTGGAGGTGCCACAACAAGTCGTGACCTTATCTCCATTATGCATTTATCTACCAAGTCGATGGCTTCTTCCACAGTCATGCCGCTGTGGTAGTGCCTGTCCATCATAGAGAGAGAAAAATAGGATCCGTACCCGAATGCTCCCTTATCAACTTTGTGAAGTGTAGCGATGTAGTCAATGTAGTAAAGTGAGGGGCCTGTCTCTTTGTCGTAGCCAGCAAGAAGAATGTTCACGAAGTATGGGTTCTATAAAAAACCAAATGCCATTGTTAATAATAATGATAGTAAGACGAACACGCGGGTGAGCAGAGACCTTAATTCAGCATTCTCATGTCAGACAGGACAAGAAATAAATAATAATAATAAACTCACTGCTAGAAGGAAAATATGCATAGGCAACCTAATAAGGAACTTCAAAACTAGATTTGCAAGATCCAAGAACCGCAAAGACCAATAAGTGCATTGAGCATCAAGCATGGCAGCAACAAAGATCAACAGAGATTTGAAAAGAAACTACATGTGCCAAGAGTCATCATCGGAACTCCAAAAAAAAAACACAGAGTATTGTAATTGTACTTTCAAAATTCCTTGGCCTTATTCTAATCTGATCTTCCTATCCAAAACAACAGCAATTAATCCATAAAGCTTGACAAGAAGTTCTATCAGAAACTACACCTTAAATTGAAATAAAATGTCATATGGTAATGGTCTCGTGCCATAAAAGCATCAACTCCTTTTTGAATCCTATAACAAGCTTACATATTTCATTATAAATTTCAAGCTCAAAAAATTTTAGTTCGAGCAAGCACAGCTGATTGTCTAGTGGAAATCTGAAGGAATATTTTCCTAGATTGTTTAATACAAGATGTAACCCATCTTTTCTCGGCTGAAAAGAATACCTTTACAGGAATCTCATTCAAAAACATATGGAATGGGAAACCACTAACTAGAAGACCCACAAACCAGACACAA
AATCTCAGTGAAGGTACCACTAGTATTGCCAAGGGATGGACCTAGGCATTCCATCTTAGCGTCAAAAGATAAAAGAGCCTCAGATCTCTTCAGGCCAGGTGCATTTGATCAGGCACATGCTTGATGTGCATAAGCATACTTTTAAAGTTCCCTTTAATTTAACTTTTTTTAAAAAACATTTTCACTGGATATACATTTATTAGTAAGAAAAGGGAATTAATCAAGGGCTAAGATCCACTCCATTACTTTTTCATCCATTAATATCCAATACAATGATTATCACCATTCAAATGGTAGGACCCATCTATTAAATGTGAAAATCAACTTGTGAATGATGATTAAACGTGCATTGGATATTAATAGATGAAAAAGTAATTGAGTGGAGCCAAACCCATAAATCAAAACCTCTACTTCCCAGTATTGGAGAACTCGACAACAAATATGGGACCGTAAGGGAATCAAGCATATTGGCCAATAAAAATAAAAGAAAGCTTTGCATGTTTTATAGATAAATTGCATCAATCTTTAGAGTTTATTATCATAATTACATGCCTCAAGCTTTATATATACACAAAGACATAAAATTGCGCCTTTACTCAGTCAAGTGCTTTTTTTGTGCTTTGTGTCTTGGGCAATATAAGGGTTCTAACACTAGAGTGCCCCATGTGCTCTTGACAACACTGGGTAGAGATAGAAGGCCAAATAAAACCTTGAAGCCAAGATGAATAAGACAGTCTCTTAGTGAGGTAGCATCCAAACTTTGCACCAAAAAACAAATCCACAGGTTAACACTAAATGTTTAAGTAAGCAAAGGAAATGATAGCCCAGCAACTTCAAAACTTCCTGTGGTTTAGCTAAGCACTCAATAACTCAGCTGGCCCCAAAAGTGGTTACCATCACCCAGGAATCCCAAAAAAAAAATCGGCTTTAACATAACATATGCTTATCTTAGGTACTAGTTCAATGTCCTATGCTGTAAATCAAGCAAAGAAGTGATTGCAATCGGTTCTGGTAAAAGAGGGACCAAAGCACATATCAAGCTACACCAATCGTCGCACATTTCAGGGCATGGTAAAGCTATATCAAACCACTTTGCTTCCAATTCTAACTCATCTAACCCTTCCAGCATTGCTCTATACAAATAGTTTCCAAACCGGAAGCTTCTTCAATTATCGAATATCACCATAATGAGAAATCAAGCAGAGGTAAAACACAGATTATAGCTAATATTTCAATCCCAACGCACAATACATCATTTGAAACTAGTGCAAACCCTAACAAATATTGTATTCCACATAGATTCATTACTCTTCGCCGGTAAAATTTCCACAAGCAAGTAAATTGCAATTAAAGAGCATAACCCTTAATTGAAACTATATAATTGAAACTATATATATGACTAGTATCGATACCTTCCTTAATGCAGTGGCAAGCTCACCGCGAGTGAAATTGGCAGCGGCGGCAGTTGTCAAAGGAATACCATTGCGAAACTGATACAAAGCCACGTTTTTCTGTATATACTCCGTGAATTGCACTCTAGGGAAAAGGAAAAAAGGTTATATAGGAGGAAAAGAAAACAGGGAAGTATATACGTAGATTTATAGGGAGAGAAAGAAAAAGGGGGAAACCTGTCACCGGATTCACCGCTGGCGGCGATGAGTTTGTGAGAATCGAGGACCATGATCTTGTCTTCGTTGGATTTGTGGACGAGGATGCTGTGAACCGCCGATGTGTCCGCCGCCACTACGGCAAAGCCATTGCCTACGAAGCCGAACACGCACTCCATTTTCACTTTTTTTTTGAGGTTTGATTTTGAGGCTTTTGATTTTTTTTTTTTTAAAGCTAATATAAGTTAGTAGAACTGCCTTGAAGAAAAAGTTGTTCTTAGAGTGGGAAAATGGGGAATTTTGGGGAAAGATCGAGGGCTATTTTGTCATAGAAAGAACACTTGGTTTATTGTAACACGCGGTGCTATTTGCAAGGTCGGATTAAGACTCGAT
TTTAAAAAGATCCCAAGCCTAGCTCGACTAAGCGAATTCAAAATTTTTATATTCTTTTTTTAAAAAAATAATAAAATAATAAAATATATTTATATTTATATATTTTATAATTAAATTTAAATGAAGATATTTAAAAATCATTCTATTAACAATAAATATATTACTATAGTTTTCAACAAGTAGCATCTTATATTTCATCAATAATACATAAACTTAGGAAACTTATATCCTGATGTTGTCAACTTCAAGTATCAGTCATTTGTTCCAGCCTAGTTTTTAAACCTTCATAGACACAACCCCATAACTCCAAGCTCCAATGCTACGCTGCGTGAGAAGCCCATGATCCAAGTTCCATTTCTGTCTCGAAGCAAGCCTCCAATTACAGCCATCCATATTCAATTTGGTCCAGCAAATCTTTCTTCTCGCCACCCTCCAAAGTGTACTTGCCTAGATCCAGCATTAAAATCACCTGAACTGACAATAATGGAGTTCCTTTGTTCCCAGATTTTCCATACAATAATGTGCATTGTTAAACAATAGCCCATGCAGTCTTTAAATAAAACCAACTTTAATCTGAATTTTATCACTCTAAATGTAATCTATCTGATTATTTATTTATGTACTTCACTCACTCATATTTTATTTTAATAAAAGGGAAAACACAAGATTATGTTAAAGGAAAAAGTAAAGATTTCCCTCTTATTTTATTCCTTAAAACCAAAGGACTCCAAAACACACAACAAAACAAGGCTCTTCCTCTTTACATAGGCCACCCTTATTTTATTCCACCATTACATGCCTTACAAAACTACTACTTAGAACAAGCGTGCAAAGTCCAGGAACGGCGATAAGGGGTTATTACTTCCCCTCCTCTCATCAAATCCACGCCGACTCTGTCCAGACACGAAGTAAGATTCTTGCGGGTTGTTGTTGAATACCTCATCCACCAACCTTGACTCCACCCCAAACGCCAGCTCCTTGGCCTGGCGATCCCATTGTCTCACATTGTTGGTTTTCCCAGCCACGAAGATCCTCTTGTTGTCTTGGCCGTTGTAGAGTCCGAACCCGAGCAATCCTAGGTCCTCGTTTTGGGAGGCAACGAATGTGACTGGATGGCCTGCTGGGACTACAAATAGGTCACCGGTTGATAACTGGGCTCTCACTCTCTTGTATTGTCCACTTCTCCTTTCAACTTCTTGTTCTTCTTGTTCTTCTTCCTCTCGGGAGGACCAGTGTGAGCTCTGCCTAGAAAGGTGAGGGCAGACCATTTCGACGTGGCCGTTTCCTTCG\n>URS0001836490 rRNA from 1 species \nTGCGTAGGCGGATTTTTAAGTCAGTGGTGAAAGCCCGGAGCTCAACTTCGGAACTGCCATTGATACTATTAATCTTGAATACAGTTGAGGTGGGCGGAATGTGTAGTGTAGCGGTGAAATGCTTAGATATTACACAGAACACCGATTGCGAAGGCAGCTCGCTAAACTGTTATTGACGCTAAGGCACGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCC\n>URS000010477A piRNA from 1 species \nGAATATCCCTTTTGAGCTTGCTTG\n>URS000188E1BA rRNA from 1 species 
\nATACGTAGGGTGCGAGCGTTGTCCGGAATTACTGGGCGTAAAGAGCTCGTAGGTGGTTTGTCGCGTCGTCTGTGAAATTCCGGGGCTTAACTCCGGGCGTGCAGGCGATACGGGCATAACTTGAGTACTGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCAGTAACTGACGCTGAGGAGCGAAAGCATGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGGTGGGCGCTAGGTGTAGGGGTCTTCCACGACTTCTGTGCCGTAGCTAACGCATTAAGCGCCCCGCCTGGGGAGTACGGCCGCAAGGCTGAAACTCAAATGAATTGGCGGGG\n>URS00023A7F2B lncRNA from 1 species \nCCGGCTATACTAGTTAGAAATTTTCCAACAGTATAGTCGCACGGATATACAAAATTGCTTTTCTCATCCAACGAAGTAGTTTTTCATTCTTATTTTTTTCGTAATGGGGCGGGTCAGGGAACTAATTCTGCAATGAAGGCTGGTATGGGCCAATGGCGGATTGAAGACCGGCATATTCTGAATATGGGCACCAATATACCGGTCGACTAGTTCTCCAAGCCAGTGGCAGTGGTTGCAGTTGATTTCCCCCATTATCACCTATTGGACAACCTTTGCCTTTTCTGTGTCTTGGTGTTTCACCATTTTGGCCAACCATAGTCTCCAGTACCTCGGCCATACTTAATTCCAGTCACCTTAAATGTAACCGAAAATACTTGCTCGAACTCATTCATTTTGGCCCGCCCTAGTTGACTCCCATTTATTTGTCTGCTATTCTAGATCTAGTCATTATCAATCACCATAATAAAGCTCCACTCTTGTAGTTTCAGTTTCACCTGTGCCTTTGATTATTTAGAACAATTTAGACTTTAATGATATGGTCACGGTTACAGCACAAAAGACAAATACCAAAAGCGGCCCTCGTGAAGAAGGGTATGGTCATTGGTCACCCTCAGTTTCACCTGTGCCTTCTCATCACTTTCATTCTCGCCTCCTCATCACTCTCTGTCGTCTGTGGTGCTCAGGAGCACCACCACCACAACGGCATTATCAGCCATGGAGCTCTCTCCGACACCGAAGCCCTCTACATCAAGCAGCGCCAGCTTCTCTACTACGGGGACGAGTTCGGCGACCGAGGCGACCTAGTCACGGTCGACCACCATCTCTGGTTTTTGAGAACCAGAGAATCAGAAATGCTTACATGGCTTTACAAGCTTGGAAGCAAGCCATTCTCTCCGACCCGCTTAATCTCACGGGTAATTGGGTCGGATCTAATGTCTGCAACTGTATTCAATTTAATCAACTGTAGGATTCATTTACAAGGCGAGTGGAAGGAGTCATCAATTTTGAATTAACAAGTTTCTACTTTAACGTATAACAACTATGTTCATATTTATTGGCTGGATAACTTGTTATATTCAGCCAATTACTTGGATAACGTATGCACTTAAGGTGCAAGTGCTTTGACATTTGTGCCACATAGAATTACATTCCTTTTTAAATATTTTATGATATAATTTTTTTTTTATTTTTAAAATTTTGAAATCATTTTTTGGTCCAATGTTACCCCTTATGACTTGAATTGGGTAATAGTCATTTATGTCATATTGCCTACTACCTATTGCATAGGTATATATATATATATATATTTTTTTTTTTTCATATTTTCGACAATGTGTCATAGTATTTTATGTACCTTTTTTTAATAGGTAACATATAATTTTATTTTGTCTATTTTTGTATCTGACTTATGGGTAGTCTTCTAATTTATGTTCCTAACTTATAGATAACACGATTTATCACTAAATATTTTTCGTTGCTAATAATAACACTATTTACTTGTATGTCATGTACATAATTTAATATGGGTGCTTGTCTGATCGATTGGTATAATATGTGGG
TCTTTACTTTTTATTAATTAAATCGTATTTTATCCATATATTAGGAATATTATCAAAGAAAGAATTTAAATTTTAAATTATGAAATTCAATTACAAGGAAATAATGCATTAAATTTAGATTTTCAATGTGGTTTCCTTATTTGCCTCAAAGGGTAAAATTGACACAACAAAAAAAAGTAATAAATGTCAAAGGACTTACGTCTAAAACCAAAAACGCGAGCACTAAACCCAATGATAGCTAATCGTTTTGGGCCTAGATCTAAGAAGCCCTTTTATTTATTATCTAACATCGTTGCATGCCATTGATAGTGTGCCTATGGATGAGGAAGAGAAAGTTGTGCTTGACTGATGATTGACGGAAACTTTCGCAAGTAAATCCTCGATGCTACTGGTTGAAGGCCCTTTGATGTTAAAGTTAGCTTAAGGGGATGAGCGCAAGCTATCGACAATGCAAGGGCATAAGTGTCAAGTAGCAAGTCTTACCCTGTATCTAGGGTAAGGAGTTATATATATAGGGAATTCTGGGTTTTTTTGGGTGCTTAGTTTCGATGTGGGACTCGTGGGAGTGCCTTCCAAGGCTAACACGCGTCCCAGCAAATATCCTAGCGATGAACTCAAGAACATCCTGCAAGATGCCTTCTAAGGCGTAGAATTTGGCAAGGCATGCCGAACACACTTACCGGTCGTGGGCCGATCAGTGAACAATTGGCGAATGGAGCTAGAAGCGTCTGCCGTTTGTAGGATTAGACCTACCAGGATGGGTTACAGGGCCATGTTGTGCGTAGAATCGGTCGTGGGTGCCGAAAAGACCTACCGATTAGTACTACTGGGCTTGCCAGGGCGGGCCATGGAGCCTTCCTTCACGTGTCATGGCATGAGATGCGGGTCAGGTATGATACAAACAAACTTAAATTAATTAAACCCATCATGCAATGCATTCCCTTTCAATTTTTTGTGATAAACTCATAGATAATTGACTAAATAAACATCATCCAAAGTTTCAATAAAAATTACCAAGTTTTTTTTACAATTTCCGTAGTTTTTATTCAATTTTTATCGATATCGATAATATCCCGATATTTCCATCAAAATTTCCGTGTTTTTGAACTATCGATATTTTTAATACCATCAATATTTTATACCTTGGCTGTAGGCATTGATTATCAAACTAATTATCAGGGGACCAGTTGTTGGATGACACTTGGGCCAGATTAGAAGTGCATTAAATGTTTCCTTTAGTAATTCTTGGAAACCTGTGCAAGCTAGATTGCTTATAGAGGCGATCTGTGGTGGATTTTCCAGTTGTTTTTTATTTTCTTATGCTTGATTTAATCAAGAAGTGTGAAGGAGTTATTATCTAACATCGTTGCATGCCATTGACTATGGATGAGGAAGATAAAGTTGTGCTTGACTGATGATTGACGGAAACTTTCGCAAGTAATCCTCTCTAGCATTGCTCGTGCCGGAAGTGTAATTGAGGAGCTGTATGGGTTTGGTGTTGTGTGATGAGTATATTAAGGCGTATCAAGGGTATTTTTGGTAGTTAAATAGGATGTACTTAGTTAATTTTATATTTTAATTTAAATATTTGGGTGTACTTAGATCATAAGGTGTACTCAGTTAATTTTAGAATTCGTTTAACCACACTATATTATTATTAATAGTTTTCTATCAAAACAAACCCTTAAGGTCCTTAACTATTGGCTTGCAGCCACATATAATTACTGTGGTGACCTTCTCGAATCATCAATTTTTATTCATTTAAGTTGTTGATCAACTGCTGCAGGCAAGTTATTCTCCTGAACTCGAGTCCCATCAAGAGCGGGTCAAGGGGGTGAGTAATTGTCTCAATTCCACACGTAAACAAACAAAGGCTCACAAAACTCTCCAAAATATACGCATTAATTCTTTGCTTCTTTTCCCTTTATAAGAAGAAGAAAGCCGTCTAATTCATCATCACCAACACAAGCAAACTCAACATCAACAATGTCGACAAAGTC
TAGCATTACCGTCCTTGCCTTTGCCTTTTGTTTCTTGTCCCTCCTCAGTTTCGCTTACTCCAACACCACCGACGACAAAATCTCTACCTCACCGGCCTGGTCTACTGTGACAACTGCCAATTGAAGTCTATGACCGAGATGAGTAAGATGATAAGATTTGAATATGAGATTTATGCATGCATGCATGCACATTGCCCATTGATCAGGTGCACATCTTTTTATCTTTTACTTTACTAATTCTTAATTAAGATTCAATTTAGGACCTATTTAAAGAGAAGAAAAATACGATTTAAAATATATCTTATAACCTAATAATCTCCTAATCAAAATATTAAACTTTTAAAATGTCACATATCAATTTAGCCCTTAATTATACTAAGCTTAAATTCCATGGTCCATACTAGTTTGATTTTTATTTTTTATTTTGGTGTGAAAATTTGGTATTTTCTTTAAAATAATGTGCTTGATAGCGTGAAAGTAGCAAATAAATAATGATGTGTTCAAATTGGATTTGAACACACATCACAACCCATATCATCATTAAGGCCCTAAAAATTAAATCATTATGTGCTTGGTTAATACGTTAAGTAGTTTATGAAGTGATTAAGATCAAAGAGGATCCATGACTTGTAATGGATCACTTGTTCATTTACTTAAAAATAAATAAATAAATAAATAAAAGCAAAGGACCCACTAGTGTAGTGGTTTGGAGTATTTACTCCCTTAGGTAAGGTCCTGGGTTCGAGTCCTAGCATCCGTGTTGTGTGTGTGAGTTTAATATGCTATCGCCCCTTTCAATAGGAAAGGACCTCAAAAAAAAAAAAAATAAATAAATAAATAAACTCGCAATACCGACTCCATTCGTAATTCCATCAATTACGCGACCAAAACTTCGTCGCTCAAAGTCTTGCGCGACGAAAAACAATTCGTAGCGCAAAGTCACTTCGCGCGACAAACTTTTGCGCGACGACAATACATCGTCGCTCAAAGTCTTGCGCGACCAAATTTTGCTCGACGAAAAAAATTCGTCGCGCAAAGTCACTTCGCGAGACAAACTTTTGCGCGACAACAATACATCGTCGCTCAAAGTGACTTTGCGCGACGAAACAATGAACTTCGTCGCGCAAAGTCCTTATAAAAATAAAATATATATATTTTAAAATCTTTGCATGACGTAATCCAAATATTTCGTCGCCTAAACTAATTTATTTTTGTTTTTTATTTTGTATGCATAACACTTAAGAAATTAAACAGTATATATATTTATTAAGTAGCTTTAAATTTATTATTTTAGATCAGATCGGATTTTTGTTAGAAAAATATATTATTGTTGTTCAGATTGGGTTTTTGTTAGAAAATATATATTTTAAATTGACGATCGAATTAGTTCATTGTATTCATATATGGTCAAGGAGTGTAGCTATAAAAAGCATCAAAATTGGAGTTAAAATAACCGTTAAATCGTGATTTTTCATTATAACCGTCGAAAAGTTTTGTCCCATTACTTGATCTCTGAATGTTTATTTTTTCTGATTTTTGGCGTATATGATCTCGAAGTATAAACAAACAAGTTTGACGGTTGGATCGTTGAAACTAGTTTTGGTGAATGCATATGCCATCAAAACAATATATTCACTAACAGTTAAGAGTTTATTTATACGTTCGTTAAATATAACATAAGATTTTGTGGTATCCACTAGTGTAAATATTTTAAATTGAAGATCAAATTCAGTCGTTGTATTCACATAGGGTCAAGGAGTGTAGCTGTAAAAAATCATCAAAATCGGAGTTAAAATAACCGTTAAATCGTGATTTTTCATTATAACCGTCGAAAAGTTTTGTCCCATTACTTGATCTCTGAATGTTTATTTTTTCCGATTTTTGGCGTATATGATCTCGAAGTATAAACAAACAAGTTTGACGATTGGATCATTGAAACTAGTTTTGGTGAATGCATATGCCATCAAAACAATATATTCACTAACAATTAAGAGGTTATT
TATACGTTCGTTAGATATAACATAAGATTTTGTGGTATCCACTAGTGTAAATATTTTAAATTGAAGATCAAATTCAATCATTGTATTCATATATGGTCAAGGAGTGTAGCTGTAAAAAAAATCATCAAAATCGGAGTTAAAATAACCGTTAAATCGTAATTTTTCATTTATAACCATCGAAAAGTTTTGTCTCGTTACTAGATCTCTGAATGTTTGTTTTTTGCGATTTTTGGGGTATACGATCTTGAAGTATATACAAATAAGTCTGACGGTTGGATCGTTGAATGGTGTGTGTATATATATTTATTTATTAAGTAGCTTTAAATTTATTTATTTTGTACGTATAACACTTAAGAAATTGAATAGTATATATATTTATTAAGCAGCTTTAACCTTATTTATATTTTAAATTGTAAAATAAAATAATTTTATTTTTATTATTCCTAACAATTATTTTTATAAATATTGTGTTACGAACCAATTTTTCGTCTCTCAAAAGTTTGCGCAACCAACAGTTTGTCGCGCAAAACTCTAAAAATTTGGACGGGTACCAAAAATGGGACGCGGGATTTTTAAAAAAAATAAAAAAAATTTAGACTTTGTGCGACCAATATTTTTTGTCGCTCAAAACTTTGCGCGACCAATATATATTTTTCGTCTCTCAAAAATTTGGGCAGGTACCAAAAATGGGAAGCGGGAATTTTTTTAGACTTTGCGCGACTAGTATGTATTTTTCGTCGTGCAAAAATTTAAAAATTTTGGCAGGTACCAAAAATGGGACGCGGGGATTTTTATTTTTTTAAATAATTTTTTTAGACTTTGCGCGACCAATATTCCTATATTCGTCGCGCAAAAATTTAAAAATTTTGGCGGGTACCGAAAATGGGACGCGGGGATTTTTATTTTTTTAAATAATTTTTTTAGACTTTGCGCGACCAATATTCCTATATTCGTCGCGCAAAAATTTAAAAATTTTGGCGGGTACCGAAAATGGGACGCGGGGATTTTTATTTTTTTAAATAATTTTTTTAGACTTTGCGCGACCAATATTCCTATATTCGTCGCGCAAAAAATTAAAAATTTTGGCTGGTACCAAAAATGGGACGCGGGGATTTTTATTTTTTTAAATAATTTTTTTAGACTTTGCGCGACCAATATTCCTATATTCGTCGCGCAAAAATTTAAAAATTTTGGCGGGTACCAAAAATGGGACGCGGGGATTTTTATTTTTTTAAAATATTTTTTTTAGACTTTGCGCGACCAATATTCCTATATTCGTCGCGCAAAAATTTAAAAATTTTGGGGGGTACCAAAAATGGGACGCGGGGATTTTTATTTTTTTAAAATAATTTTTTTAGACTTTGCGCGACCAATATTCCTATATTCGTCGCGCAAAAATTTAAAAATTTTGGCGGGTACCAAAAATGGGACGCGGGGATTTTTATTTTTTTTAAATAATTTTTTTAGACTTTGCGCGACCAATATTCTTATATTCGTCGCGCAAAACTTTGCGCGACCAATATGTTTCGTCGGGCAAAAGTTTGCGCGATCAATATTCCAATATTTTTCGTCGCACAAACCTTTGCGCGACCAACAATATTTTTCGTCGCGCAAAGTGATACGGTTTTTAAAACCGAAATAACTCATCCACCATTTTCTCAATGCCTTTCTCTACTCTTACCTCTCCTTTCTCTTTCCCTCTCCCCAAATCCCACCATTTCTCTCACTTACTCCTCTCACTTAATCTCTCATCTCTCTCTCACTCACTCTCTCATCTCTCTCACTCACTCTCTCATCTCTCTATCACTATCTTCTCTAATTCTCTCACACTCACTTCTCCCTCTCATTCTCATTCACTCTCAATCTTGCCAAAAGGTATATTCTCTCCAAATTTTAAATTTTTTTCATTAATATGTGTTTTTGGAGTTAATTTTGAGTTTGTGTGGGTTTTAGGGTTGAGTAAAGGGGAGGGATTGGAGTTTGGGTTGGATTTGTGGTAT
AACAATTTTAGGGGAGATTATGCCTTCTTTTTTTTTTTTTTTGTGGTTATTTGACCATATTTATTTTTTTTGTAGGGAATCATCGAGACTTTGACGGCTAAAGTTGAGGATTAGGAAGCTATCAAAACATCTCCTCTGCCACTACCACCACAATACGCTTGTATTAGGGTTTTATTATTGTACTTTGTTAATTTATGTGAACATTTTGAATATTATATATATATATATATTTATTGGATAATTTAATCACTATTTTTCATATGTAATTTTATTTTGAATATGTCAATTTAAATTAAAGTAATTAAAAAAATCATACAATTAAATTAAATTTAAAAAGTAAAAATTAATATCAATTTAAATTAAAGTAATTTTAAAAAGAAATCATACAATTAAATTAAATTTAAAACGTAAAAATTTGAAAAAATTCATATAAATAAATTCATATTAAAGAAATAATAAAACAAAAAGTCAAAAATCTTGCGCGACAAAATATTTCGTAGCGCAAACTATTAAATTAGTTTATTTTAAATTAAAAACATTTAAAACAAAAAATATTTCGTCGCGCAAAACTCAAAAAATTTGGGCAGGTACCAAAAATTGGACGTGGGAATTTTTTAGTTTTTTAAAATTTTTTTTAGACTTTGCGCGACCAATGTTTTTCGTCGCGCAAAACTTTGAGCGACCAATATATTTCGTCGCGCAAATCTTTGCGCGACTAATGTATTTCGTCGTGCACAACTTTGCGCTACCAATATTTTTCGTCGTGCAAAGTCACTTTGCGCGACCAATCTTTTTCGTCGCGCAAAGTCGCTTTGTGCGACCAATATTTTTTCGTCGCGCAAAGTCACTTTGCGTGACCAATGAAAAAATTCGTCGCGCAAAGTCTTTCTTCACGATCTTTGCGCGACGGATTCTGCGCGACGAAGTTTCTGTCTCGCTGAAATTTGTGCGACTACAATGTATTTTGCGCGACGAAATTCTCTTCGTCGCGCAAAGTGTAAAATGTAGTAGTGGTACCAGTTGTGCTTATTTACTTTTTACCATGGCTCTCACAAATCAAGAGACCTCTGCTTAGCTTTTCTTTTTATTTTGGCCATTTGCTCCTCTCAAGCATCATCTCACTAAATTTATGATGAGACTGGATGGCTCAATTTGGGCCAGTTTTTTTTATAAGGATGCTGAGGAGAAGGAGAGGCGATTCATGATAGTCAAGGCCAACTTGGAGTTCATTAAGGCTTTTAACAAACACATGAGCCAGAACTACTTCACACTAAGCTTAAATGAATTTGCAGACCTAACCAATGAGGAGTTTCGGGAAATTCGTAATGGTTACACGAAACGATCCTCCAAATCGATCATGTCCAATTCCACGAAAGCTACATGTTTTAGATATTGAAATGTCACTGATGTGCCACCTTCAGTGGATTGGAGAGAAAAGGGTGCAGTGACACCTATCAAGGACCCAGGCAAATGTGGTAAGTATTAAACAAGTTGTTAAATGATGACGCATTCACTGTTTCACAACCTAACATGTTATTGAATGATGAGGCATGTTATTTCAATTTTATAGGGTGTTGTTGGGCATTCTCAGCAGTGGCAGCTACAAAAGGGGTTAACATGCAAGCTCAAAGCCAGAAACTTAATCTCACTATCAGAGCAAGAGCTTGTGGATTATGACACTACAGGTCAAGATCATGGCTGTGAAGGTGGTCTAATGGATGACGCTTTTCAATTCATCCACGCAACAAAGGCTGACAACTGAAGCTAATCACTTCTACCAGGGTTACAACACTCAGAAGGCTGCATCCCAAACAGTGTCCATAAATGGGTACGAGGATGTGCCTAAAAACAACCAAAATGCTATGTTGCAAGCCGTCGCTAACCAACCAATTTCTTTTGGAATTCAGACTATGATCTGAATTATAACTTGCCTTCTACAAATACTACTGAATGAGTAAAGGTTTCAGAGAGATTTTCAGAATGAGAGAGAGCTCGAGGAA
AGAGCAAAAAGATGAATTCTATTCTTCTTCTCACGCACACACTGTGCACTAATAACAGTTGGAACAGGAAATTCCCAAATTACATCATTCAAATCTAGCCATCCATTCTTCTATTCTAAGATTACATCTTAGCTGTCCACTTGGATTGTAATCCAAGGGCTCACATTTAAATCTGTAAATTTGAACTAAATACAACATCATATCAGCAAAAACAGTTATATTTCAACACTCCCTTCTAAGTGTTTAGCTGAGATTACTCCAAGCTTTCTTCTCAGGTATTCAAACCAATCTCTTGCTAGAGCCTTAATAAAGATGTCTGCAGTCTGCTCTTCAATTTTGCAACATAGTAAATCAATCTCTCCATTTTGCAAAGCATCTCGGATGAAGTGAAACCTCCTGTTTATATGCCTTGTCTTATGATGATGCACATGATTCTTGGTTATGGCAATAGCAGAGGTATTATCACATAGAATTGTAGTAGCACCCACATGTTCTTCACCAATGTCTGAGAGAATGAAGCGCAACCAGATTGCTTGTGCAGTAGCTTCTGCTGCACTAACATACTCTACTTCTACTGTAGACAGAGCTACACTACTTTGCTTGACTGAAGCCTAGGAAAACATACCTGATCCAAGATTAAATGCAAATCCAGAGGTGCTTCTCATGTCATCCTCGCTCCCCGACCAATCACTGTCACAGTAGCCAATGAGCCTTGCTTCTTTGCCTTTCTCATATGCTATGCCACAATCAAATGTGCCTTGAATGTACCTCAATACCCTTTTGGCAGTTCCCATATGTTTTCTAGTAGGTCCATGCATAAATCTAGCCAAAAGACTTGCTGCAACCATGATGTCTGGCCTTGTTGCAGTCAAGTACAACAGATTTCCAACTATCTGCCTATAAACCCCTTCATCAGCTTGTTCACTTCCATCTTCCTTGGATAGCTTTTCATTCATTGCAAGAGGAGTAGCCACTGCTTTATAGTCCTTGAAGCCAAATTTGTCTAGCAATGTCTTAGCATATTTCTTCTGGTGCAAGAAAATGTAAGACTCAGTTTGTATCACTCCTAACCCCAAGAAATGGTGAAGCAAACCAAGATCAGTCATTTCATACTGCATCACCATTTCAGTTTTGAACTCCATGATCAAGGCTTTTGAGCTTCCAGTGTAGATAATATCATCTACATATAAAGAAACAATAATAATACTACTTTCTGCAGCCTTTACATATACTGTTGCCTCACTAGGACTTCTCTGGAAACTTGCCTTGATGAAGTAAGAATTGATTTCTTCATACCAAGCTCTTGGAGCTTGTTTAAGTCCATATAATGCCTTCTTGAGTCTATACACTCTATCCTCTTTGTTCTTAATCATAAAACCAGGAGGTTGATCCACATACACCTCTTCATGCAATACTCCATTCAAGAATGCAGACTTCACATCTAACTGAAATAGTTTCCACCCCTTTTGTGCAGGCAATGCCACCAATGTTCTAATGGTATCCAGCCTAGCAACAGGTGCAAATGTTTCATTGAAATCTATCCCTGGCTTTTGAGAATAGCCCTTTGCCACTAGCTGAGCCTTGTCTTTTTGAACTGTACCATCTAAATTCAGCTTGGTTTTATAAATCCATTTGACACCAATTACTGGTTTATCAGTTAGTCTATCAACCAACTCCCAAGTTTTGTTCTTCTCTATAATTTCTATCTCATTCTCCATTGCTTTCTGCCATGCTTCATCCTTAACAGCCTCTTCAAAGGTCTCAGGCTTGATAATACACAAGTTACATCTTGCATACACTTCTGCAATACTCTTGTATTTCAGAGGTGTGTGATCAACATCCAGTGATCCTGAGTCAGGATCAACATGCCCCTCTTCTGAAATCTCTTCTTGACTCAGGCTAGAATCATTAGATTCCTCTTCTCTCTCAGTGAGTGTCTCATTAAGAGGTATTGAGATATCACATTCCTTTTGTGCATTTCAATCCCAAATAGATGCCTC
ATTGAATATCACATCCCTGGAAATAATCATTTTTTTCAGATGCAATGTTATATAGTCTGAAGCCTTTTCACAGTTGCCATACCCTTCTGCCTTTGTTGATTTGGAACATGTGCATAGCACAAAGAACCAAACACTCTTAAATGCTTAACTCCTAGCTTTCTACCACTATAAGCTTCAAATGGAGTTTTCTTGTCTAAGGCCTTAGTTGGACATCTATTCTGGACATACACTGCAGTGTTTACTGCCTTAGCCCAAAATTCTAGAGGCATCTTCTTCTCAATCATCATGCATTTAGCCATCTCCATAATTGTTCTGTTCTTTTGTTCTGCTATTCCGTTTTGCTATGGTGAATATGTCACAGTTAGCTGCCTTTCCATTCCCATGTCTTCACAAAATTTGTTGAATTCATTGGAAGTATATTCGCCCCCCTGTCACATCTTATTTTCTTCAATTTATATCCACTTTGCAGCTCAACAGTGGCTTTAAATTTCTTAAAGACATTAAGGACTTTTGATTTGTATCTCAAGAAATAGATCCAACACATACGAGTACAATCGTCTATGAAGGTAAGAAAATATCTATTTCCAGCTTTGGTAATAGTCTGCATTGGTCCACATACATTTGTGTGTACCAACTCGAGTGGGATTCTGGCAATCCAAGTACCATTCCCTGATCTTGCAGCAGCTTCAAACTGGTGAAGTTTAAATGCCCCATTCTTCTATGCCAAACTAAAGTTGATGACTCTACATTTGCTCTTAATGCAACCTGTAAAGTTGTGTGAAGCTTCAAAGGAAAACTTATGTCGCCTTTCAGTTGCACCTTAGCAACTAGATTTGATAAAGAACAATCATCATAAATTTCAACCTTATTAGCTCCAAAAATCAGAACATATCCATGCTTCATCATTTGCCCTACACTGAGCAAATTCTTCTTGAGACCAGCAACTAACAGCACTCCTTTGACATACCTTCTTCCCATCTTAGTGTCAACAACAAGATTTAATTTCCTTTTCCAACAACATTAACCAATTGTCCTGTCCCCATTGCAACTTTTGCAATTATATTCCTATCAACATCAACTAATACATCTTCTCTCCCAGTCATATGGTTGCTAGATCCGCTATCCAAATACCATATTGTTCACCCGTTTTGTGTTTGTTCCTGTGATGGTAGGGCAAAATTCCCCATTGCCTTGAAAATCATTGACTGGTCAACAAGTCAACTTTCTTTAGTGTGCGAGCGTGCCACTACTAGCAATGAGAAATCCTAGAAGACTTTAAAAATAGATAACTTGCACCCCAAGTTACTGATTTCTAATCAAACAGTTGTGAATTTGGGTGAGGAATATCTCCCAAGTAAGTTCTTTTCTTGCCTCAGACTGGTGAGTACTTCATAATTTTTCACAGTATAAAACTGGTAGTTCTGGCCAGAATAAATGATGAGAAAATGAACTGTTTTGAGGTAGAATTGCCTTTTACAAAACTCAAAAGGGAAAAGCCAACTCTAGAAAGACAAAAAGAAGGCTGGACTTCCATTTCTGCATGGATAGATGCTTCTGATCCAGGCTGGACTAGACTATCAGCAACTTCAACTGTCAAGTTTCAGCTGTAAATCGATACCAACGTTCGAGTTTGGCAGAGCTTTAATCTATTTCAAGCCCTGGAAGGCTTTTTGAACGGACAGAATTACGGCCTATTCAGTCTGAAGGGTGCAGAAGTGGCTGGACTCAAGGATTATTGAGCTGGAACTGCATTGTGATACTTGTTCTACTTGATCAGGGTTCTCCATAAATTTGTTGAGGTTTTCATTTTTGTGAAAACCCAAGCTCTGCTTGTTTTGGCTTTTGCTGAACCAAATTTGTAACAAGAGAAATCTCATTTTAAATGACTTTTCTCTAAGTCTGAAATTGATTTGTAGTTGGCTTCTTTCTTCTTGAAATTGATTTGTAGTTGGCTTCTTTCTTCTGGCTCAATGAGCTTTTGGTTGCTTCAGTTTGTTTGA
AGGTTCTTTGAGATCAAGTGATCATTTTGAGTTTTTGTCTTTTGACTGATTTTTTGGTTGTTTGATTGATTGTCTGATCTTTTGCTCTGTTCACCCTCTCCTATATTTATAAGAGATGCTTTGTAGTGGTGCTTCTAATTCTTTTAATAATGGGCGGAAAAATTTCTCAAAAGATCTTTCATTTTTAAATGCAAAGAAAAAGGGTTTTTATCAATTCTGGCAGATAAGCTTTCTATAGTCAGTTCCTAAGGCAGTCACTTCCCTGTATTTCTTGAAAAAGAAACCTAACCCTTCTTCCAATTTAACTGCTCTTTGTAAGAGTTCAAACTGTGATGGTTTAGTTTTGATCTTCCAGATGAACAACTCCCTGCTTCCCACTTATCTTTTTAGAAAATATGGCCTGCTTATCCCTTGGAAATGATATCTAACGAATTTTTTTGGATATAGAAAAGGATTCTGATCTTTTAGCCCCAAAGTTTCAGGGAAGTCTCTCTGCTAATGACCTGCTTTCATTAATTACCAATCTACTCTCTTGTGACAGTTGAAATTGTTGACTTTTTAAAGTCAGGTATTCACGTGGGCTCTGAGAATAGACTTTCCAAAAATCAGCTGATCTTATACTCCGTGTTTTGAGATAAATGGTGAGTACTTAGATGCTGGGCCCAATCCAATTCTTTTTTATCTACTTTAGTGGTCAATTGCCACTTAATTTGGCCTTCTTTTTTTTTTTTTACAACTTTGCCATTTCGTAAAAGACGTGGGCCTTTCTTCTTTTTTAATTATGCCAAGCCCAGTTTGAGTTGAGCTATGGGCTGATTTCTTTCTTTTCTTCCTTTTCGAAGCCCAAGTTTATTGTCGTGGTTTCGATAGATCACGGGCTGGGCTTTTTTGAATTTTGGGCCCTCGATTCCTGTTTATTTTGCAAAGCCCAGACTGCTTGGGCCCTGTGGCTTTATTCTGGGCTCTATAGTGTTGGGCTAGGTGCACAGGATTTTGGCCCCAACACATACATCATCACATCCTTTTACACTAGCAGAACCTTTATTACTAGCATAAAACATGGTTGGTGTGGATTCGGTCTGAGTAGCATAGTTGAGCTGTTGTGCTGGTTTCTTGCTATAGCAATCTTTTGCAATATGACCAAATTTGTCACAGTTGTAACATTTTGGTTTTCCCTTAAACCGAAAATCACCAAAATGTAGTTCGCCACAATGTTTGCAGGGGTTTCTGGCTCCATCAGTTGATATATTATCCCACTTTTTGCCTTTTGTCCTCCAATTCCTTTGATCCCTAAAACCACTTTGACTTCCACTGTAATTTTTTGATTGGGATTCACACAAAGACTAGCAAATGCTTTCTCAGTCTTATCTCCAAAGTGCCTATCTAGCCATAATTCAAAACTCTTCAAAGAGGTTACCACTTCTTGTACCTCAATTTCATCCAAATCCTTAGAATGCTCAATAACAGAACAGATTGAATCATAAGCTGATGGCAAACTGATTAGTAATTTTTGAACAATCCTTGCTCTAGCTAAATCCTTTCCATAGCTCCTCATTTGGTTTATCAGATCAAACGGTTTGGTAAGATAAGCAGAAAGGGACTCATCATCTCTGATTCTTGTATATTCAAATTCTCTACATAGACCTTGCAATTTAACACTTCTAACCTGTTTATCACCATGGAATTCCTTCATCAAGATATCCCAAGCTCCCTCAAAGGTTTCTTCATGAGAGAATCGAGGGAAGATCTCATCAGACGCTGCTCCTTGAATAAGACCCAGAGCTTTAGCATTCTTCATGAGTAGCTCAGTGAGAGTCATCTTCCAAGCACCACTCGATTCTTCCTTTTCTTTCTTCTTTGCATCAGATTCTCCAGCTCCCTTCGAATTTGAGCACTCTATTCCCTTCTCAACCAATTCCCAAAGCCCATGAGATTTGAAAATGGTTTTCATTCTTATGCTCCAATTTTCGTAGTTATCACCGCCAAAGATCGGCACTCTC
AGCTCACCACCTCCATACCCTGCCATGTTAGACACAAATCGCGAAACCACTTTTCCAAATTTCAGCTAGTTTTCTTCACAGATTTAATCGCCCAAAGTTAAACAATAGAACCTGGCTCTGAGGCCATGTTAGAATTCAAACTATGATCTGAATTATAACTTGCATTCTACAAATGCTACTGAATGAGTAAAGGTTTCAGAGAGATTTTTAGAATGAGAGAGAGCTTGAGGAAGGAGCAAAAAGATGAATTCTATTCTTCTTCTCTCGCACACACTCTGCACTAATAACAGCTGGAACAGGAAATTCCCAAATTATATCATCCAAATCTAGCCATCCATTCTTCTATTCTAAGATTACATCTTAGCTGTCCACTTGGACTGTAATCCAAGCGCTCACATTTAAATCTGTAAATTTAAACTAAATACAACATCATATCAGCTAAAACACTTATATTTCAACATTTCGGTTGCCATTGACGCAAGTGGCTGTACATTCCAGTTTTATTCAAGTGGTGTGTTCACTGTGGTATAAACTTAGATCATGGTGTTACCGCAGTTGGATACGGGACTAGGACTAGTAGTGATGGGACTAAATACTGGCTGGTGAAGAATTTTTAGGGCACATGGTTGGGGGAGGATGGATATGTGACGATGCAAAGGGGCATTCCTGCCAAGGAAGGACTCTGTGGCATTGCTATGGAAGCTTCTTATCCAACCGCATGATTAATTAAAATGCATATATGTCATAATATAGTGTGGTGTATAAAATATGTATAATTGAATAATATAGAAAGACGCTAGCTATGAGCTGCTATCCTTCCACTTTGAAATCCATGCCTCAAAACATAGAAACAATTAACCCATGACGTGGATTTGCTCTTAAAATCTCACTCAATGAATTAGCAGCTATAGCTATGAGGTTGACATGTTTTCATTACCATTGCAAGGTTAAATCAAGTTAGATTAAGGGTGCATATTTTTGCTCACCATCATTCTTAATATTTGACATGTGTCTATGGGTATAACCATATAGTTCTATAAATATATAACTATGATTATGTCAATGAACACGTGTCAAGTGTTAAAATGGGTAGTGAGAGTACACATTTGGTTAAAGTGGTGAGTAAATATATTCCCTTAGAGTAATCACATGATCATGTCACTGATCCTACAAGGTAAAACTGTGAAACGACGTCATTACACTTGTTCGGAGGTGGCATGGATTGGAAACACGTAATTAACCATATATATAACATCAATTTACAACTTAATTATACTTATTCTTAAAGCCATTTCTGATCGGACATTTTTGGAGAAATTAATTTCTCAGGCAAGTAAATGGCAGCAGAAGAGGACCGGAAAATTTAGGTGCCAGTAGAAGAGAAAAACTCTCTCGCACGTACCTGGTTTATGGAAGTTTGCTGTAACAGGAGAGCTAGATAAAACTTAATTTGAAAAATTCTAGGATACGTAACTAGAGCTTACAAGGTGGTGTTGTTGACTGGCTACAACTTCAAATACAAACCGTTGAGCTAGCTTGCTGTGCGCAGTATATAAAGATTATTTAGGACTAGCTAGGCTCATAATTAATATATACATATATATATAATTACTTTATATTTTTAAAGAGGGGGAAGTACAATATTATGATGAAGAGATGAGTCTTTTTGCCAATTAAAATGCACCATTTATATATTCTGTATCCAGATTACCTTTTGCATGATCTTGCCATGAACATCCAAAAATGCACCAATCTAGTTAAAATTCAAAACAAATTTAAAGATTTTTACATCGTAGTTAAAGGAAATTCATTGTTCCTATAACTTGTGCTTCCTATACACACACAAATTCCATGAATCAATTGACAATGTGATATTAATATTACCATATAACATTTTCAACATTTTCATCTCGTCCTAGCATTCAAGTAAAGAAAAGAATACACGTATACTTGGATTGTTGATGTCTAACTTTGACTCAACGGATTAAGATCGTAAAAAC
GACACATTCACATCATGACACACACTCAAGTCAGGCTACGTCCATAATATACAATTAGTGAACTGAATTACATGAATCTACAAGTACGGGATATAAAAGCTACAAGCCCTACATGCTACAATATCTGTCCTATTTTTGGGTCAACTGTTCCTTATTCTCTTTGATAGTACAATCGAGTTTACATGTTAGGATCCTAACGGGGATATTAAATGCTGAAAAGGAAATAATCAATTCCCAATAAGCCCTTAAGATCGTCTAACCAAGATACAAGCCTCATATATATCTTAACAAATCTTTCTAGTTCTTAAAGGTTATAGCATCCATCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTATATATATATATATATATATATCCTCTCATATAAGTCCAAATTATCATGATATTTGTCTTTAAAGAATTAATTAACATACTTATCACCGCGCAGAAAATTAATTTATGTCTTCAAGATGTCTATAGAGCATTATTAAACTAATCCTAAAATAAATAAATATTTTTATTCTTAGTGCAATGTGGAAATATCTTTAAAGAATAGAATATTTCACCAATATAGAAGAGCGGCTATACTCAACAAATATAAATTTTCAATAGTCTAGCCGAGTGGCTGTACTCTATAAATATAAATTTTTTAACAGTACAACCGCATGGCTATACTCTTTAAATAGAAATTTCAAAATTATAGCCGTCCGGCTATACTAGTTAAATAGAATTTTTCCAACAGTATAGTCGCACGGATATACAAAATCGCTTTTCTCATTCAACGAAGTAGTTTTTCATTTTTATTTTTTCTGTAACGGGGCGGGTCAGGGAACCAGTTCCTTAATAAAGGCTGGTATGGGCCAATGGCGGATTGAAGACCGACATATTCTGAATATGGGCACCAATATACCGGTCGACTAGTTCTCCTAGCCAGTGGCAGTGGTTGCGGTTGATTTCCCCCATGATCACCTATTGGACAACCTTTGCCTTTTCTGTTCTTGGTGTTTCACCATTTTGGCCAACCATAGTCTCTAGTACCTCGGCCATACTTAATTCCAGTCACCTTAAATGTAACCCAAAATACTTGGTCGAACTCATTCATTTTTGCCCGCCTTAGGTGGCTTTTGGCAGCGCTTAATTTTTTTTAAAAGCAACTTTAATACAAATTTGGCATGAGTTGGGTGTTTGGTAAACCCAAAAAAACACGCTTATTTTAAAAACACCCATCATAAAAAGCAAAAACTCAACGTCAGGTATATGGAGCTTTCAAAAGCTGTTTAAAAAAAGAGCTGGTTTTCTTGTTAATGAAAGTTTCATTATCCCTATAGTACCCCTAAGTATTTCACAAAATGACAACGTTTGACCCTCTCACAAAATAGATCTCGCGACCTTCACACTTTCTGACCTCACTCTCAGACTGCTCTTCTCACTATTCTTCTTCTTCCTCCCCCTGCATCTCAAAACTCCATCTCAATCAAGGACTTTAATTGCCAACAACAATCAGCTACTTATCAGTGAGTTCATCTTCCCATTACATTTATGATTTTTGGGTTTATATATGTTATGAAATTAGGTTTTTCATTTGGTTCTATGCAATTGGGGGCTTTGTGTTCTTGAGGCTTTAAGGGGAAAATACGGGAGAGACAGAGAGAGAGTTTTGCTGCAAGTTTTGTACTGGGTTTGTCTCTCCTTGCTCTTTGACAAGGAGAGATTTCTCCCTAGCTTGGTTCAATTGGCCTTTGGGTCAGATACTTCTCTCTCTGTTTCTATTTCTCTGAAACATGTCTGTCCTGGATGCTTTTTTTCTATAGATTACACAACCATCATTGTTCATAGATTTACTCATTGTATAGTTTGGTACAGTTCCAAAATATCAAGAACAAAACCCGTTATGCTAATCTGGTTCTTTATATACATAAATATAAATATAAATAAATATATATATATATATATACAGTCCCCTTCT
ATTGAGAGATCTCTCAAATAATTTTATTTGAGGGACGCCCTTAGGGTACCCTACAATTTTCTTTCCAATGATCCAAACCATCTATTTTTTAGGTCTTCATTCATAAATCATCCTTACAAAAAATTAGATAAATCGGAAACCGTTTTGACATCCAATTGTATCTTACAAAATCAATGAACACGTTCCTTCAAGAAAGTACTAAAATTTCAATAACTCAAATGAGTGGTCAAATGATATCATATTCGAGTAATTTTTTTGTAGAGATGATCTTTGAATGAATATCTACAAAATAGACTGTTTGGATTAGTTAAATACAATTCGGAGTGGGGCCTATAAGGAGTGTCCCTCAAATACTTATTTGAGGGATCCCTCAATGGAAACTCTCTGTATATATATATATATATATATATATATATATATGATTGCAACCCAAGTCCCCAAGTCAGGTCCGTGTTGATTTTTCCATTGTCCTAACCTTGTTGTCTTCAAGCTCAAACATAATTCCTTTGGACTTTAGTTTTAGTTCTCTTTTAGTTAGAAGACAAGAAAAGAGTGAAGAAGCCATTAGCTCCAGATCTGGGGCTTCTGTTTTCTCAAGAATTTTTTTAAAAAAAAAAAAGATCCTATTATGTGAAACTGCTGTTCCATCTAAGTTGTCATCCATTATTGTGTTAGAAGATTTTTGGTAAACAAAGCTTTTATTTTTTAGTGGTCATAGTTTCAAGTTCTTCCTTATTATTATTTTTCAGTGTCGGTGGACTTTATTATTGTGTTAGAAGATTTTTGATTGGGTAATGGTTTGAAGTTCTTCCTTCTATTTATATTTTTTTGTGTTGGTGGGCTTTATCAAAAGTGATTGTAGCATGCTGGTCATTGTGGTGGGGAACTCATAAACTGACATATGGTTGAAATATAAAAATTTTGTAAATTGGTATGAAATTGCATTCTCAGTAAATTATGGGAATGCAATATCATCTTGCCTTAGAACATATGATAGAAACAAAACATTTTAACCACAACACAGACTTAAGAGATTCAATAAACTGTTCCCTAGTAAGCTGGAAATATTGGCTAAGACTTTATGTTATCTTTGTCTCCTCTTGGCAGAATAGGCTTGCTAGTTCCTCAAGTAATATATGTTAAAGATTAGGAAAATTATATAGTTCTTGTTCTTAGGTCAATTGTGAAGGTGATCAGTTTATTTTCATGTGTGGATTCTTTTCGTTCTTGGTTTTCTTTCATGAATCATTAGGAATACTCTATGCTTGGACTCTTTGTCCCTTGTTGAGAATGAGAAGTGGGTTTAAGGAAGTTTTGTTGGGAGCCATCATCATTTTTAAACATATAGCATATAGTGGATAATATAGATGAATATTCATACCTGTGGGAAAAGGAAAGTTTGTTATTTTTATGCTTTTAGTATAATGTATATCTTGGGACAATTATTTGCTATTATCTATTTCTCATACTCAACACATATTGCTTTAGTAAGGATGGGAAAGAATGTGAGAAGTTCATCAAAAGCTCCAGCGACATGGAATAACCATAATATATCCATATTCTGTGATTTGTGCATCAAGGAGATATGCCTAATTATCCATTCAACAAGCAAGTGAAGATAGTCATTGCTACAATGACACTTCATAATTATATAAGGAGGCATGCCCAACGTGATAGACATTTTGATGCTTCAAATGATATCTTAAGTGAAGAGATAGGTGAGGATGTTGATGTACAACAAGAAGTTCATAGTCTTAATGACAATGGAACACAAGAGATGGAAGCATTGAGAAATAGCATCGCTACAAGTTTCATGAATGCATCTAATTAGCTTCTTTTATATTGTAGTGATCCATTTTGGCATGTTAAAATTGAACAATTTTTGTATATTTGTTATGCTAACCCTCTCCGAAGCCCTCAAAACACATTGTTATTATTAATATAACAATATTTAGAACTACTTTTGTTACAATATTAATTTATAATTTATGGTAATATAT
GTGTGCTAATTGTAGATTACAAATTTTGATAAATTAAAAATGTGTAAATTAAAAAAGAAAACAAATTTATGTAGTGAAGTTTGTTTTCTTTTTTTTAAAGTAGAAAAAGAATGAAGAAAAAAAGAAACCGTTTCATCATCATGTCCTTTTCGTTCATTATACATACTAAAAGCACTTCTGATAAAAATTTACCGAACACTTCGACTACTCACAGCCTTTTTTCATATACAGTTTACCAAACGCCTAGCTGTTTTTTTTTCATAGCTGATTATTTTCGCAGCACAGCAGAAACAGTTTTTTTTTAAAGCACAACAATGCCAAACTAGCCCTTAGTTGACTCCCATTTATTTTTCTGCTATTCTAGATCTAGTCATTATCAATCACCATAATAAAGCTCCACTTCTTGTAGTTTCAGTTTCACCTGTGCCTTTGATTATTTAGAACAATTTAGACTTTAATGATATGGTCACGGTTACAGCACAAAAGACAAATACCAAAAGCGGCCCTCGTGAAGAAGGGTATGGTCATTGGTCACCCTCAGTTTCACTTGTGCCTTCTCATCACCTTCGCTCTCGCCTCCTCATCACTCTCTGTCGTCTGTGGTGCGCAGGAGCACCACCACCACAACAACATTATCAGCCATGGAGCTCTCTCCGACACCGAAGCCCTCTACATCAAGCAGCGCCAGCTCCTCTACTACGGGGACGAGTTCGGCGACCGAGACGAGCTAGTCACGGTCGACCCATCTCTGGTTTTCGAGAACCAGAGAATCAGAAATGCTTACATGGCTTTACAAGCTTGGAAGCAAGCCATTCTCTCCGACCCGCTTAATCTCACGGGTAATTGGGTCGGATCTAATGTCTGCAACTGTATTCAATTTAATCAACTGTAGGATTCATTTACAAGGCGAGTGGAAGGAGTCATCAATTTTGAATTAACAAGTTTCTACTGTAACGTATAACAACTATGTTCATATTTATTGGCTGGATAAGTTGTTATATTCAGC\n>URS0000B8F910 rRNA from 1 species \nGTGCCAGCCGCCGCGGTAATACGTAGGGGGCCAGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGCGTAGGCGGCCAGACAAGTCCGGTGTGAAAGTCACAGGCTCAACCTGTGAATGCCGCTGGAAACTGTCTGGCTAGAGTCCGGAAGGGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCTATGGCGAAGGCAGCTCGCTGGGACGGTACTGACGCTGAGGCGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCCTGTAGTCC\n>URS0000C2AFAE pre_miRNA from 1 species \nCAAGTACTCCCTCCGTCCAAAAATACTTGTCGCAGAAATGCATAAAAATGGATGTATCTAAAACTAAAATATGTCTAGATACATTCATTTTTTCCGACAAGTATTTCCGGACGGAGGGAGTACAAC\n>URS00023A1339 lncRNA from 1 species \nCAGCCTATAAACGGACGCAAGTTAATATCGGTACGGCCGACCATCGAATCACCGTCGAAACCAAATTCTACGGCGCAGGACCAGGTTTAAGAGAAGTAGTCATCATCGAACGAAACTCTTCAAAATTCACATTGCCATCACCATCGGCATCCACCGGCTTAATCATCGCCACACATCCATCAACCGAGCACTTAATTCCGAGCCTGTTCAACACCAAATTCAACTCCTCCGCCGAAATCAAGCCGTTCTTGTCCTGATCGTAGAGATCAAACGCCTCGCGGAGCTCGGCCTCGCCGGCGGCACCAGAGGAGGTCCGGC\n>URS000118CADB rRNA from 1 species 
\nCCTACGAGAGGCAGCAGTGAGGAATATTGGTCAATGGGCGCGAGCCTGAACCAGCCAAGTAGCGTGAAGGATGACTGCCCTACGGGTTGTAAACTTCTTTTATAAAGGAATAAAGTGAGGCACGTGTGCCTTTTTGTATGTACTTTATGAATAAGGATCGGCTAAATCCGTGCCAGCAGCCGCGGTAATACGGAGGATCCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGAGCGTAGATGGGGTGTTAAGTCAGTTGTGAAAGTTTGCGGCTCAACCGTAAAATTGCAATTGATACTGGCAGCCTTGAGTACAGTTGAGGTAGGCGGAATTCGTGGTGGAGCGGTGAAATGCTTAGATAACACGAAGAACGACGAGTGCGAAGGCAGCTTACTAAACTGCCACTGACATTGAGGCTCGAAAGTGTGGGTATCAAACAGGATTAGATACCCTTGTAGTA\n>URS000006351C rRNA from 1 species \nGCGGGGTAAAGGCCCACCAAGGCAACGATGGGTAGCCGGCCTGAGAGGGTGATCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATTTTGCGCAATGGACGAAAGTCTGACGCAGCAACACCGTGTGAGGGATGAAGCATTTCGGTGTGTAAACCTCTGTCGATGATGAATAATGTTTCGGGGAGTGGAAAGCCTCGGAATTGAAGGTAATCATGAAGGAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGGGGGTGCAAGCGTTGTTCGGAATCACTGGGCGTAAAGGGAGCGTAGGCGGAACTACAAGACAGAGGTTAAATCTCCGGGCTCAACCTGGAACTTGCCTTTGTGACTGTGGTTCTTGAGTATGGTAGAGGTTGGCGGAATTTCCGGTGTAGCGGTGGAATGCGTAGAGATCGGAAAGAACACCAGAGGCGAAGGCGGCCAACTGGACCAATACTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGAACACTAGATGTCGGGAGGGGTTCCTTCCGGTGTCGTCGCTAACGCAGTAAGTGTTCCGCCTGGGG\n>URS0000ECDE64 rRNA from 1 species \nGGGCCCGCACAAGCAGCGGAGCATGTTGTTTAATTCGACGCGACGCGAAGAACCTTACCAAGGCTTGACATGCACGGGAATGTCGTAGAAATATGGCAGCCCTTCGGGGCTCGTGCACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTGTCCCATGTTGCCAGCGTGAAAGACGGGGACTCATGGGATACTGCCGGTGACAAATCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGTCTTGGGCTACAAACGTGCTACATTGGCCGGTACAAAGGGCTGCAAACCTGCGAGGGTGAGCGAATCCCAAAAAGCCGGTCCCGGTTCGGATTGGAGGCTGAAACTCGCCTCCATGAAGGCGGAGTTGCTAGTAATCGCGGATCAGCAACGCCGCGGTGAATATGTTCCCGGGCCTT\n>URS0000175B41 rRNA from 1 species 
\nAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTCTCAGTATAAGCAGTCAAATGGTGAAACTGCGAATGGCTCATTAAAGCAGTTATAGTTTATTTGATGGTTGCTGCTACATGGATAACTGTGGTAATTCTAGAGCTAATACATGCATCCAAGCCCGACTTTGCAGAAGGGTTGTGTTTATTAGATCCAGAACCAACCCAGGCTCCGCCTGGTCATGTGGTGATTCATGATAACTTGACGAATCGTGCGGCCTTGCCGACGATGCGTCATTCAAGTTTCTGACCTATCAGCTTCCGACGGTAGGGTATTGGCCTACCGTGGCAATGACGGGTAACGGAGAATTAGGGTTTGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCTAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCTGACACAGGGAGGTAGTGACAAGAAATAACAATACAGGGCATCCATGTCTTGTAATTGGAATGAACAGAATTTAAATCTCTTTATGAGTATCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATTTCTGTTGAGGATGACCGGTCCGCCCTCTGGGTGAGTATCTGGCTCAGCCTTGACATCTTTCTGAAGAACGTATCTGCACTTGACTGTGTGGTGCGGAATTTGGGACATTTACCTTGAGGAAATTAGAGTGTTTCAAGCAAGCGCACGCTTTGAATACATTAGCATGGAATAATAAGATAGGACCTCAGTTCTATTTTGTTGGTTTCTAGAGCTGTGGTAATGGTTGATAGGGATAGTTGGGGGCATTCGTATTTAACTGTCAGAGGTGAAATTCTTGGATTTGTTAAAGACGGACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTGATCAAGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCCTAGTCTTAACCATAAACCATGCCAACTAGAGATTGGAGGTCGTTACTTGCATGACTCTTTCAGCACCTTATGAGAAATCAAAGTCTTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTTACCAGGTCCAGACATAGTAAGGATTGACAGATTGAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGGTTAATTCCGTTAACGAACGAGACCTTAACCTGCTAAATAGTTACATGTAACCTCGGTTACATGGGCAACTTCTTAGAGGGACTTTGTGTGTCTAACGCAAGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTAGATGTCCTGGGCTGCACGCGCGCTACACTGATGCGCTCATCAAGTTTTCGATCTTGCCCGAAATGGCTGGGTAATCTTTTTAAAATGCATCGTGATGGGGATAGATCATTGCAATTATTGATCTTCAACGAGGAATTCCTCGTAAGCGCGAGTCATCAGCTCGTGCTGATTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTCCTACCGATTGAGTGATCCGGTGAATAATTCGGACTGACGCAGTGCTCAGCTTCCGGACGTTGTGTTGGAAAGTTTCATGAACCTTATCACTTAGAGGAAGGAGAAGTCGTAACAAGGTTTCC\n>URS0001B743B1 rRNA from 1 species 
\nCCTGGTTGATTCTGCCAGTAGTCATACGCTCGTCTCAAAGATTAAGCCATGCACGTCTAAGTATAAATACTTTACTTTGAAACTGCGAATGGCTCATTATATCAGTTACAGTTTATTTAATAGTCCCTTACTATTTGGATAACCGTAGTAATTCTAGAGCTAATACATGCGTCAATACCCTTCTGGGGTAGTATTTATTAGATTGAAACCAACCCCTTCGGGGTGATGTGGTGATTCATAATAAGCTTGCGGATCGCATGGCTTTGCCGGCGATGGATCATTCAAGTTTCTGCCCTATCAGCTTTGGACGGTAATGTATTGGATTACCGTGGCTTTAACGGGTAACGGGGGATTAGGGTTTGATTCCGGAGAGGGCGCCTGAGAGACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGTAAATTACCCAATCCTGACACAGGGAGGTAGTGACAAAAAATAACAATGGCGGGCCTTTCTAGGTCTGCCAATTGGAATGAGAACAATTTAAAAACCTTATCGAGGACCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTGTGGTGGCGCCCGAGGTCCAATTGTTGGTACTATCGGGTGCTGCCATCCTTGGGTGGAATCTGTGTGGCATAGGTTGTCGTGCAGGGGATGCCCATCGTTTACTGTGAAAAAATCAGCGCGTTCAAAGCAGGCTTATGCCGTTGAATGTATTAGCATGGAATAATAAGATAGGACCTTGGTACTATTTTGTTGGTTTGCGCACCGAGGTAATGATTAATAGGGACAGTTGGGGGTATTCGTATTCCATTGTCAGAGGTGAAATTCTTGGATTTCTGGAAGACGAACTACTGCGAAAGCATTTACCAAGGATGTTTTCATTAATCAAGAACGAAAGTAAGGGGATCGAAGATGATTAGATACCATCGTAGTCTTTACCATAAACTATGCCGACAAGGGATTGGTGGGGTTTCGTTACGTCTCCATCAGCACCTTATGAGAAATCACAAGTTTTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGAAATTGACGGAAGGGCACCACCAGTAGTGGAGCCTGCGGCTTAATTTGACACAACACGGGAAAACTTACCAGGTCCAGACATAGTGAGGATTGACAGATTGAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGGTTAATTCCGTTAACGAACGAGACCGCTGCCTGCTAAATAGTCCAGTCAGTGAATTTCACTGGCGAGGACTTCTTAGAGGGACGTGCATTC\n>URS0001EA0CFC rRNA from 1 species \nATAATAATCGGGCATAAGTATACCACCGAAGCTATGGACTTATTTTATAAGTGGTAGGGGAGCATTCTAGTTACGTTGAAGGTGCATGGCAATGTGTGCTGGAGTGGCTAGAAAAGAAAATGTAGGAATGAGTAACGATAATGCGGGCGAGAAACCCGCACACCGTAAGACTAAGGTTTCCTGAACAACGCTAATCGGTTCAGGGTTAGTCGGGTCCTAAGGCGCACCCGAATGGGGAAGTCGA\n>URS0000169475 rRNA from 1 species 
\nAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGGGAAAGTGGAGCAATCCACGAGTATAGTGGCGACCGGGTGAGTAACACGTGACTACCTGCCCTTGAGTGGGGGATAACCTTGGGAAACCGGGGCTAATACCGCATAAAATCGAAAGATCAAAGGAGCAATCCGCTTTTGGAGGGGGTCGCGGCTGATTAGCTAGTTGGTGAGGTAATGGCTCACCAAGGCGAAGATCGGTATCCGGCCTGAGAGGGCGCACGGACACACTGGAACTGAAACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGCGCAATGGGGGAAACCCTGACGCAGCAACGCCGCGTGGAGGATGAAGCCCCTTGGGGTGTAAACTCCTTTCGACCGGGAAAATTATGATGGTACCGGTGGAAGAAGC\n>URS00003DDD0E piRNA from 1 species \nTNGGGCCTTAGTATCACTCTCAGTTACC\n>URS0002242497 RNase_P_RNA from 1 species \nGCAGTTGGACGGTCTGTCGCCGGCTCCTTTCGAGGGGCTGGAGGAAAGTCCGGGCAACGCAGAGCGTTCCACTTCTTAACGGAAGTTGTCGGCGACGGCAGGGTAACGCAGAAGAAAACAACCGCCGGTGCGACGTTGCGGGCCCCCGTTTCAAGTAATGTCCATCGGTAAGGGTGAGAAGGTGGGGTAAGAGCCCACCGGGCGACGCGGTGACGCGCCGTGCCGTGCGTCCTGGAAGTTGCAAGTTCATGTAAACCGGCGTCAGAGGGCTGCTCGTCCGAGCCGGAGGGTAGAACGCGTCAGATAAATGACAGACACCTCGCCTGCGCGGGGCACAGAACCTGGCTTACAGACCAACTGCCGTT\n>URS0000AF82F7 rRNA from 1 species \nTGAGGGAAAGGCGAAAAGAACCCCGGCGAGGGGAGTGAAAAAGAACCTGAAACCGTGTACGTACAAGCAGTGGGAGCACAGGTTTACCTGTGTGACTGCGTACCTTTTGTATAATGGGTCAGCGACTTATATTCTGTAGCAAGGTTAACCGAATAGGGGAGCCGGAGGGAAACCGAGTCTTAACCGGGCGTTAAGTTGCAGGGTATAGACCCGAAACCCGGTGATCTAGCCATGGGCAGGTTGAAGGTTGGGTAACACTAACTGGAGGACCGAACCGACTAATGTTGAAAAATTAGCGGATGACCTGTGGCTGGGGGTGAAAGGCCAATCAAACCGGGAGATAGCTGGTTCTCCCCGAAAGCTATTTAGGTAGCGCCTCGTGAATTCATCTCCGGGGGTAGAGCACTGTTTCGGCTAGGGGGCCATCCCGGCTTACCAACCCGATGCAAACTGCGAATACCGGAGAATGTTATCACGGGAGACACACGGCGGGTGCTAACGTCCGTCGTGAAGAGGGAAACAACCCAGACCGCCAGCTAAGGTCCCAAAGTCATGGTTAAGTGGGAAACGATGTGGGAAGGCCCAGACAGCCAGGATGTTGGCTTAGAAGCAGCCATCATTTAAAGAAAGCGTAATAGCTCACTGGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTAAACCATGCACCGAAGCTGCGGCAGCGA\n>URS00019A0A0A lncRNA from 1 species 
\nGGGGGATGTAGGGATTCATCTTTGTCACATTTTCTCTCTAATTTAGCTGTCTAGGGAGCCTCCCTTGTTTTGCAGAAGTGGAAACATCCAGTTTAATTTCATCTTTTCTCAGACTGCAGTAGCTTGCTTCCTCAGAAGCCAGGGTCTCTCTCCATTTATTCTTAGTGTTTATCCCTTTAATTCTCCTACAGTTTCACAAGTGCTTCTGGTATATTTTGTAATTTTAGCTTATAATCACATTTTTCGAAGAGGCACCATCTGGTTCCTGACATGGCTTAAAATAACAATCTAACTAACACGAACCCTGCAGCAATGCTTTGCGCCCTTCCCAACCCAGTGTGAGAGTGTCCCCACCTATATTTCTTCACAAATGCTCCACTGTTAGGTTCCATCCCTTCCGATAGATCTCACAGAAAGCGGGGCCTTTTACCTCTTTCATCTCGAACCCAGTCGTTTCAGGCAGTCAAAATGGATGCGTTAAAAAAAAAAAAAAAAAACCTTGCAGCTAGGACAGCAGAGGATCTGCTGTGAACTGCTCAGTCAGAGACTTGGAGCTGGAGCTCACGTCTGTATTTCAGCTGCCCTCTGGTGCTTAGCACTGCAGCAGTACACGCCATCATCATGGCCCCAGTGCTTGGAGGTCCCTGCGACGGAGCAGCGGAAACCAAGCACAGCAAAAATTCCTTTGAAGACAGAAAAGTGGCCCAGTGCTGTGCAGCAGGGCTACGGTGCTGGAATCCAGCCCGGCCCAGTGCCGGCGTTGGCAGCGGCCTTCCCATTATATCAGGAAGGGCTGTATCCCGTCGCCACCATGCCCCAACCCCCCCGGCTCGCCTCAGCTGTCTGCGGGACGTGGAGCCAGGCAGAGGGTGCCCTGCAAGAAGCAGAGCTGTTGGTTTGAGGTGCGGAAAGCCGGCCAGTCTGGATGCGACTGCTGCTGCGTGGCGGACAGGAACTGACATACAGCTTCAGTGCTTCCCACCGCAAGGGCACTCCAGGATCCAGACTCTGGAGGAGAAGCTGTGGCTGTAGGATTGCTAATTGCAGCCGGTGCCAACGCTGCTGCCCGTTTTCAGGTGAGTGTGGTGGAGGGCACTGTAGAGACGCACGGCTATTCACAGAGCGTGCACTTCCAGCACCTGAACTGCTGGATCCGCTCTGACCGATGTACGGCAATTACATTTGGTGCTGCACTGCTATAATTTCACTGCACGTTAATAGCCACCTAGTGCAGAGGTAAAGGCCCTTCCCTCGCCCGGTGCAGAAGGAATGCCTGGATTTATTCAGCTGAGTAAAACGAGCTGTGATTTTCGGAGCAGATGGCAGAGGTTTTGTGTGTTGGAAAAGCGTTTGCCGGTGCAGTGCTGTTTCCCTGCACCCTGACGGGTGTGCGGGAGGCTCCTGGAAAAGTCCCATCCTCGGGTCCTGGCAGGGGGAGGGGAAGAGATGGGGATCATGTGCCCCATTTTGAGTGGCTCATCTGCTACCACCCAAACTCTGCTGCAGTCCCCCCCCCTCCCTTCAGCAGCTCGGCTGAGCACTGCAGGCGCTGTCAGATTTCTCTGGCAAAATTAGTGATCAAAACACCCCCCCCCCCCCACACACACACGCACACCTTCACTAAGGCTGGTGTTTTTAAGGTTGGGGGGGTGATGGGGCGCGGGTGGGAGCGCACGGCGAGGGTACGAGGAG\n>URS0000B155C2 tRNA from 1 species \nGGCTTCGTAGTTCAACTGGATAGAATGACGGATTTCGGCTCCGTTGGTTGCAGGTTCGAACCCTGCCGAGGTCACGA\n>URS00025AB7F7 tRNA from 1 species \nGCTGGTGTAGCTCAGTTGGTAGAGCAGCTGATTTGTAATCAGCAGGTCGCGGGTTCGACTCCTGTCACCAGCTCCA\n>URS0000328ABF rRNA from 1 species 
\nACGCTGGCGGCAGGCTTAACACATGCAAGTCGAACGGTAACATAAAGAAGCTTGCTTCTTTGATGACGAGTGGCGGACGGGTGAGTAATGCTTGGGAATCTAGCTTATGGAGGGGGATAACTATGGGAAACTGTAGCTAATACCGCGTAGAATCGGGAGATGAAAGTGTGGGACCTTCGGGCCACATGCCATAGGATGAGCCCAAGTGGGATTAGGTAGTTGGTGAGGTAAAGGCTCACCAAGCCGACGATCTCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGGGCAACCCTGACGCAGCCATGCCGCGTGAATGATGAAGGCCTTCGGGTTGTAAAGTTCTTTCGGTAGCGAGGAAGGCATTTAGTTTAATAGACTAGGTGATTGACGTTAACTACAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATAACTGGGCGTAAAGGGCACGCAGGCGGTGACTTAAGTGAGGTGTGAAAGCCCCGGGCTTAACCTGGGAATTGCATTTCATACTGGGTCGCTAGAGTACTTTAGGGAGGGGTAGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAATACCGAAGGCGAAGGCAGCCCCTTGGGAATGTACTGACGCTCATGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGTCGATTTGGGGGGTTGAGCTTTGAGCTTGGCCGCCCGTAGCTAACGTGATAAATCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAA\n>URS00021F8B86 rRNA from 1 species \nAGAGTTTGATCCTGGCTCAGGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTTGAGCGCTGAAGGTTGGTACTTGTACCAACTGGATGAGCAGCGAACGGGTGAGTAACGCGTGGGGAATCTGCCTTTGAGCGGGGGACAACATTTGGAAACGAATGCTAATACCGCATAAAAACTTTAAACACAAGTTTTAAGTTTGAAAGATGCAATTGCATCACTCAAAGATGATCCCGCGTTGTATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCGATGATACATAGCCGACCTGAGAGGGTGATCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGAAAGTCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAACTCTGTTGGTAGAGAAGAACGTTGGTGAGAGTGGAAAGCTCATCAAGTGACGGTAACTACCCAGAAAGGGACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTCCCGAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGTGGTTTATTAAGTCTGGTGTAAAAGGCAGTGGCTCAACCATTGTATGCATTGGAAACTGGTAGACTTGGGTGCAGGAGAGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAGGAACACCGGTGGCGAAAGCGGCTCTCTGGCCTGTAACTGACACTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAGATGTAGGGAGCTATAAGTTCTCTGTATCGCAGCTAACGCAATAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATACTCGTGCTATTCCTAGAGATAGGAAGTTCCTTCGGGACACGGGATACAGGTGGTGC
ATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATTGTTAGTTGCCATCATTAAGTTGGGCACTCTAACGAGACTGCCGGTGATAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGATGGTACAACGAGTCGCGAGACAGTGATGTTTAGCTAATCTCTTAAAACCATTCTCAGTTCGGATTGTAGGCTGCAACTCGCCTACATGAAGTCGGAATCGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGGGAGTTGGGAGTACCCGAAGTAGGTTGCCTAACCGCAAGGAGGGCGCTTCCTAAGGTAAGACCGATGACTGGGGTGAAGTCGTAACAAGGTAACC\n>URS0002423514 lncRNA from 1 species \nAGTGCTTAGGTCCTTTGACACCGTTGGCGGGAGACTTTTCGTCGTTTGGGGTGGGGATGAAAAACATCAGCGTGTTTATTCCTCAGGCAGCCCAGAAACCTTAGGTTTGCACCACCAGTAGCTTGGCAACGCGGTCACGGGTACACAGCACTGGCACAACATGACTGTGTGTGTGTGTGTGTGTGTGTGTGTGCTATGCTGTCCTATGCTCATGATGCTCTCATGGCCTTTCGCTACAACAGGTCCAAGGCCTTATCATTGCCGTCATGTACGAGAAATCCCGGGGAAGGCAGTCACGATGGGCGCCGTACTTGAACCTGATCCCGGACGACATGACCCACATGCCGCTGTACTGGAAGGTACGGTAATGTACGGGAAAGGTGGATCGTACCGTGGACACCGTGCCACTCGCCTCCCAAACTCTATGCGCCGTGGCGAGAGCTCATCTTCACGCACTCAGCGAGTTCTGGTCCCCCGCCCTTAAACCCCGTCTACGGACAGCATAGGGAGTTCAAGGAGCTGCGTGGTACGGCAGCGTACGACAAGATGATGGGCAAGGTGCAGTGTCCCGCCGACGCACCCACGCAGGTCGGTTAACACTTTGTATTGTATGGGGTTGTCATGTGCGTCGCATCACTGCTCTTTTGCGGATCGTGGTACGACACATCACTGCTTTCCCCCCTCCCCGTTGACCGGGCGATCTGCAATCCTCCGCTGTACTGTGCAGGTCCCCGTTCTGTGGAGTGAGGTGGTGGAGCCCTTCATCCAGGAGCACCCGGAATTAGAGCTGCCGGAGGGGAAGGCGGGGTATGACTTATACCGCTGGGCCACGTGCGCTGTGGCGTCGTACAGCTTTATCTTGGGTGATGACAAGTACCAGGTGGGCATTCCAGTCCTGTACGGCCGGGGGCTCGTGACTGCGGCTGCTGCAAATGATGTCGTACCATGAGCACCTTATCCAATCTAACTACGAAAGCCCCCTTCATTCTCTCCCCCCTCTTTTCCTCCCCCTCTCCCCCTCTCCCCCTCTCCCCATCTCTCTCCTTTCCTCCTCTCATTTCTTTCCCACATGCGTATGAAGCCCACCTCTAGGCGCCCTCCTGCTCACCCAGCACCCTCCTCCCCCTCCCCCTCCGTCCCCGCGCTGGCGGCCGCCCCAGGCGATGGTCCCCGTCTGGGACCTGCTCAACCACATCACAGGTCGGGTGAACGTCCGACTGCACCACTGCGCCAAGAGGTAAAGAAGAAGGGAGGAAAGGCGATATTCGGGGTGGCTGCACCCCGTAGGGCCCTCCTGGAGTGGGTGGACGGGTGGCGTCGCGGGCCCCAGGGGAGTGAGTACGACCGCTCGCTGCACGGGGCGAGGCCATGCAAGCCAATCGCCAAGCGTCCTTGCTAGGTTGGGGATAACCCAACCAACCAACCAACTCCGGGCCCTATATCAGTTGGCAACTTGCTCATTGGGTAACCGGTATATATGTATGTATATATATTATATAACCCC
CGGACGACTGCTGAAGCCGGAAGGGCGGACATGGTGATCTCGTCGCATGGCAGCTGTCCCGTGAGCCCACGGAGTTGTGTGGGATGTGCCGATGAGGCGGCGGCATTTGGGGCGTGGCGTGAAGCGTGTATGAGGTTGGCTGATGTCGGCGCCTCACGCACCAAGAGCGCCGCCAGGAACGTACCCGCACCGCACGGGAGAGCGGGCGGGGAGCCGTGTCCGCGTTCTTATCCGGCGGGTCTGTCCTAACCCGCCTAACCTTACCCGTCCTAACGGGGCACCGTGCGCCACCCTGCTGGGGATGGAAGCACCCCCCAGGTCTCAGCAGCCACTGGATTGCGCTTCCCGCTTGCGGCGTTGTTTGTTGCGCCGGTACTGCAGGCACGTGCTTCACATGATTGCCACTCGGGACATCCTTCGCGGTGAGGAGCTGGTCAACAACTACGGTGAGCTTTCCAACGCGGAACTTCTGCGGGGGTACGGCTTCGTGGAGGCACGCAACCGGAACAATCACGTACAGGTCGGTTGGGGATTGAAGGAGGCTGCTGGTTTGGGAGGAGAGTTAATATGGCTGTGGAGCGGGTGCTGGAGCAAAGCGCGCTTCGCACATGACGAGGAGGTAGCGGGTGACAAGAAAATGAGGCGGGTCGGGGGCGGGTAAGGGGTGGGCCTCCCTCCCCCCAGCGTGCTGAGCCCGGGTAAACGCTAAGCCGCCAACCCCGTCACCAATGCCTACCACTATAGTTACCCAGTTACCGCCAGGCAAGGCTTGTCCGTTGAAGAGGGGCGGCTGCGGGGCCGACGGGGTGAGGGTGGGGATGCTGGCACCTGCGTTTTGGTTTTGGGAGGGGAGCCATACCCAGCCGCTGCCATTGGACTCCGGCTCGCCCACGTGGCCCTCCGCGCAACCTGCCTAGGTTCCACTGGGCTTTGTGGTCCGTGCGGCGACGGAGCTTCTCCGAGAGGACATCACGGCAGCGGCGGGTGCCGGCCCTGGACCCGGTCCTGGTAGTCAGTCCGACCAGGGGGAGATACGAGCCCGCGCATCTGCGCGGTTGCGCCTGGCTCGCCGGTGCGACCTGTTGCCACAGCACCATGTGTTCAAAATTTTCGAGGGGCGGCCACCTCCGCCCCCCATGACTGCGCTCATCCATCTGCTGCTGGCGTCGGATGCCGACATTCCGGCTGTGCGGGGTGCTGTCCGCCGTGCAGCCGCGGCCGTAGTGGAAGGTGAGGATGGCGCGGATTGCGGCAAGGATAAGGGCAAGGCCCGGCGGCGTAATGTCGCGGCAGCTGGGGCGGTTCTACAAGCACGCACAGCGGCTGCGGTGGCGGCAGCCTTGGCTGGGAACGAGACGGCGCTGGCGCGGGTCGCGAGGGTGTACGACATGATTGTGCAGCGCATGCTCGGCCGGTACAGCTGTGACCTCGCAGAGGACGACAGGTTGCTGGCGGAGGCGGAGGCAGGACGCCGAGTACTTCCGCCACGCTTACATGCGGCGGTGTTGGCTCGGAAGCCGGAGAAGGACGCGTTGCTGAGTTTGCGGAAATTCATCGGTCAGGAAGGAGCTTTGCGTCAATCCTTGGCTGTCAATTCCGGCAAGAGCTTGTCGAAGACAGTCTTCGGAATAGCAGGAGCAAAGGGGTCAGAGGAACAGCTCTCTGAACCGCTAAAATACAGTCGTGCCATGGCTAAGAGCTGTAGCGCTGCTCCTGTCAATAAGTTTGCCCCTGCTTCGTTTTCGTTCGGTTTCTCTCTGTAAGTTTTGAGTTCGACTTGCTTCAGTTCGCTTTAATATGTGAGGATTCAGCAAAACTGGGAGGATCTAGTAAAACCATTGCATCTCAGGGATAGCCGCTTCTGTTCAGTGCGTGCCATTACAGATTTTCGTATCCCCGTCGGCAAGCGCATGTTCCCATCTGCAATGGTACCCAACGCCCTCTTAGTGCTTAGCTGAGGATGACGGTCACAATCCATGGATCGCAGGTTACAGTGGCCA
ACGTGCCCGCAGGTATAAAGGTGTCACTCTTCTCCTTCAAACGGCCTACCGAACCGCCACGGCTCCAAAAAATGCTGGCTGTCCGAACCCGCAAAAAGACAACGAGGGCATAGCACCCGGCAACCTTAACCAGGACATAGCAGTCGGTCACAAACGCCAGAGCGACAGGCGCACATTCACGTATGACCGTGAAGACGTGCCGATATTGAACCGTCAGGTCGGGAACAGCCTCCCCATACCGCCTCAAATTGCTATTTGTACAGAGACTCAGGCCCAGACATCATCGCTAAGCACTTCCCTCGATGAAGCAGCAAAACGAGAGCCACAGGCGTGAGCGTCACGTGCAAGCACACGCTTCGGCGCATTTACGAGGAGGGAGCCTCCTTCTCAATGTACCTGAGCACGCAGAGATGGGGGCAATGAGGGGGGAAAAGAGATTACGGGGAAAGGAAATAGTTTTGTACACAGTAATAGTCGCATACATACAACTTCAAAAATCAAAATGTGTGGCGTCCCGACACCATGCTCCCAGCTACACCAGCACTCACACGAACAGCGTAGCCATTCCGATGGCTGGCAGAACCAGGCCAGTCAGGGGCACGAACAGCGAGGGAGCCCAGGCCGGGGGCACGAAGGGGTAGCCCTCAGCAGCGCTAGCAACGGTGGCGATGACCTGCGAGGCCTCAGCCTGCAAGCATACAAGTGGACGACGAAAGATCGGTAGCCTGGGAGAGCCTCCGCTGCACTTCAGCATATTCCCAGACAAAGATGCAAAATCTGATTGTGCAAACAGTACGCAGCCATATCTCTGAAGCTTGTAAACAGGACTGGACGGAAGCGCCTTCCCCATCAAACATAAACACATAAACCAAAATTAAGCGCTGAGTAGGAAATGTCAGTTGCCCTC\n>URS0000054DFE rRNA from 1 species \nGTAGTCCTGGCTGTAAACGATGTCGACTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAGTCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCACGGAAGTTTTCAGAGATGAGAATGTGCCTTCGGGAACCGTGAGACAGGTGCTGCATGGCTGTCGTCGGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGGTCCGGCCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGCGCATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGACCTCATAAAGTGCGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTGGATCAGAATGCCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTAGCTTAACCTTCGGGAGGGCGCTTACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACCGTAGGGGAACCTGCGGCTGGATCACCTCC\n>URS000187D73E rRNA from 1 species \nTACAGAGGGGGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGCCTGCTAAGTCGAACGTGAAATCCCCGGGCTCAACCCGGGAACTGCGTCCGATACTGTCGGGCTAGAGTGTGGAAGGGGCTACCGGAATTCCGTGTGTAGCGGTGAAATGCGTAGATATACGGAGGAACACCAGCGGCGAAGGCGGGTAGCTGGGCCAACACTGACGCTGAGGCGCGAAAGCTAGGGTAGCAAACGGG\n>URS0002587220 
misc_RNA from 1 species \nTCCGGTTTACCACCGGCAGTCTCCCTAGAGTGCTCGGCTTTACCCGTTAGCAACTAAGGACAAGGGTTGCGCTCGTTGCGGGACTTAACCCAACATCTCACGACACGAGCTGACGACAGCCATGCAGCACCTTGCACTCTGCCTAGGTTTCCCTAAGAGGCTCCATCTCTGGAGTTGTCAGAGGCATTCTAGCCCTGGTAAGGTTCTTCGCGTTGCGTCGAATTGAACCACGTGCTCCACCGCTTGTGCGGACCCCCGCCAACTCCTTTGAGTTTCAATCTTGCGATCGTACTTCCCAGGTGGGATACTTAATGCTTTCGCTCAGACACACACTGTGTATCGCGTATGTCGAGTATCCATAGTTTAGGGCGTGGACTAC\n>URS0000A3D8A0 misc_RNA from 1 species \nAATGTGATTGGAAAAGAAAATGAAGGAGAACTAATTAGTGGAGGGTTGAGGGTAAAGTGCTACAATTAGAGACTACAAAGTTAAATGTACAATGAACTAATGTTAAGATTAATGGGTCAAAGTTGTATGTAATGTAGATCCGGTAAACTATAATTCTTCTTTCAGATGCTCAACAGTATCATGTCTTGTCGTTACATTGAAGCTTCTCAATAACTTCCTCCAAGGGAGGATCTCCAGGTCTACGGAAGACTTGATCCCC\n>URS000015B95D rRNA from 1 species \nATGGAAAGTCCGGCCTGCCCGGTGAGAGATTCTCTTAAACGGCAGTAGTAAAGTTCTTTAATCGTAGCTCAATTTTCTTGCCCTTTAATTGTGGAGCGATGTGAATGGTAAGACGAGGGTTCAACTGTCTCGCTGTTACGAAGTGAAAACGGAGTGTAGGTGAAAATACCTACATGGATTATAGGGACGACAAGACCCCGTGGAGCTTTAGTGTGCTATTTTCTAGCTGAATTTAGGTTACTTAGGCTGGGGCAGCCAGATGGGAAGCAAATACCATTTGAGAGACGCTTGAGGCGTGCGGGCTTTTAACGATCCACCTCCCTTGAAATAATGGGGAAAATTGTGTGTATGTATGCAGAAAGAGGTGAAAGACGGAACAACGTTACCCCGGGGGTAACAGGCTAATTTCGCTCTGAGAGATCCTGTCGATGAGCGGGTTTGGCACCTCGATGTTGGCTTAGGGTATCCCGAAGATGCAGGGGTCTTCAAAGGTTGGTCTGTTCGCCCATTAAAACCCT\n>URS0000B01B68 rRNA from 1 species \nTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCCACGCCGCGTGGGTGATGAAGGCCTTCGGGTTGTAAAGCCCTGTCGGGAGGGACGAATACTGACGGTACCTCCAAAGAAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTGCTCGGAATTATTGGGCGTAAAGCGTACGCAGGCGGCCGTACAAGTCGGGTGTGAAAGCCCGGGGCTCAACCCCGGAATTGCGCCCGAGACTGTACAGCTTGAGTGCGGGAGAGGGAAGCGGAATCCGTGGTGTAGAGGTGAAATTCGTAGATATCACGGGGAACACCAGTGGCGAAAGCGGCTTCCTGGCCCGACACTGACGCTCATGTACGAAAGCGTGGGGAGCAA\n>URS000211E027 rRNA from 1 species 
\nAGTGAACGCTGGCGGTAGGCCTAACACATGCAAGTCGAACGGCAGCACAGTAAGATCTTGCTCTTACGGGTGGCGAGTGGCGGACGGGTGAGGAATACATCGGAATCTACTTTTTCGTGGGGGATAACGGAGGGAAACTTACGCTAATACCGCATACGACCTACGGGTGAAAGCAGGGGATCTTCGGACCTTGCGCGATTGAATGAGCCGATGTCGGATTAGCTAGTTGGCGGGGTAAAGGCCCACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATACCGCGTGGGTGAAGAAGGCCTTCGGGTTGTAAAGCCCTTTTGTTGGGAAAGAAAAGCAGCAGGTTAATCCCCCGCTGTTCTGACGGTACCCAAAGAATAAGCACCGGCTAACTTCGTG\n>URS00004A1422 rRNA from 1 species \nAACGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGAGACCTTCGGGTCTAGTGGCGCACGGGTGCGTAACGCGTGGGAATCTGCCCTTGGGTTCGGAATAACTCAGAGAAATTTGAGCTAATACCGGATGATGACGAAAGTCCAAAGATTTATCGCCCAGGGATGAGCCCGCGTAAGATTAGCTTGTTGGTGGGGTAATGGCCTACCAAGGCGACGATCTTTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGAGTGATGAAGGCCCTTAGGGTTGTAAAGCCTTCTTACGA\n>URS0000110120 piRNA from 1 species \nTGAGAAAACAGATTTTGAAACTGTCAGTCTT\n>URS0000B33149 rRNA from 1 species \nGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTATCCGGATTTACTGGGTTTAAAGGGTGCGTAGGTGGGCAGTTAAGTCAGTGGTGAAATCTCCGAGCTTAACTCGGAAACTGCCATTGATACTATCTGTCTTGAATATCCTGGAGGTGAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCAATTGCGAAGGCAGCTCACTACGGGGTTATTGACACTGAGGCACGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCC\n>URS00002664CE rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGTGACCCAGGGCTTGCCCTGGTGATCAGTGGCGAACGGGTGAGTAACACGTGGGGCAACCTGCCCCTGACTTCGGGATAACTCCTCGAAAGAGGAGCTAATACCGGATACGACCACTTCGGACATCCGATGGTGGTGGAAAGTTTTTCGGTCAGGGATGGGGCCCGCGGCCTATCAGCTAGTTGGTGGGGTAATGGCCTACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGCGACCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCGACGCCGCGTGAGGGATGAAGGCCTTCGGGTTGTAACCTCTTTCAGCAGGGACGAAGCGAAAGTGACGGTACCTGCAGAAGAAGCA\n>URS0000049829 rRNA from 1 species 
\nGCCAGACTGGAACCGGGAGAGGTAAGAGGTACTACAGGGGTAGGAGTGAAATCTTGTAATCCCTGTGGGACCACCGTGTGGCGAAGGCGTCTTACCAGAACGGGTTCGACGGTGAGGGACGAAAGCTGGGGCACGAACCGGATTAGATACCCGGGTAGTCCCAGCCGTAAACGATGCTCGCTAGGTGTCAGGCATGGCGCGACCGTGTCTGGTGCCGCAGGGAAGCCGTGAAGCGAGCCACCTGGGAAGTACGGCCGCAAGGCTGAAACTTAAAGGAATTGGCGGGGGAGCACAACAACGGGTGGAGCCTGCGGTTTAATTGGACTCAACGCCGGACAACTCACCGGGGGCGACAAGCAATATGTAGGCCAAGCTGAAGACTTTGCCTGAATCCGCTGAGGGGTGGTGCATGG\n>URS00022BB341 rRNA from 1 species \nCCCAAAGGTGGGTGGTAAACTCCATCTAAGGCTAAATACGTGCACGAGTCCGATAGCGGACAAGTACCGTGAGGGAAAGTTGAAAAGAACTTTGAAGGGAGAGTTCAAGAGTACGTGAAACCGCATAGAGGTAAACGGGTGGACCCGCAGCAGTTCGACCCGGGGAATTCAGCTCGGCGGCTAGCGGCGCCGCGGCCGGTACTCAAGGGGATACTCCCGTACCCCGCCGGTCGTCGACCGCGCCTGCCGCCGGGTGCACTTTCTCCGGGCCGAGAGCCACGACCGGCTCCGTCGGCGGTCAGAAGCCCGGCTGGGAAGGTGCCCCGAGCCCGGACGCTTGCGTCCGGCGCGCCGGGAGTTACAGCCCGCCGATGGTGGACACGTCGCGGGGCCGAGGAAGCCTTGCGCCGCCGGTCTCGGTCCTCCGGTGCCCCTCGCCCGTCCCGACCTCCGCGTCACTGCCTCGTCAGTGCGCGGAAACCGCGGAGCGGGGGCCACGCCGGGGTGTGCCAGGCCTGTGCGAAGGGTCGGTGGCGAATCGGTCGGTGCTCCACCCGACCCGTCTTGAAACACGGACCAAGGAGTCTAACGTGTGCGCGAGTCACGGGGACTCGACAAACG\n>URS0002354398 lncRNA from 1 species \nCCAAGTTCAAGCCTTTGCTTGGGTATATTTTTGTTTTTAATTGAATAAACCCCTATCTCTAGTCAGTAGGCTTAAAATAAATATTGGAAAAATATGTCAGAATGGTCCTACTGGTCTGGTGGTTAAGTGGTGTGTTGGGGTCTTGAGTTTGAATCTCTATACGTGTTAGGGGGTTTTTTTGTACATGTGTCGTGAAGGAGTTTGAAATGTGGTAAAATTCTGAGTATTTGAGGAGTGTGAGGATGTTGTGGCCGAT\n>URS00025EA52A lncRNA from 1 species \nGTCTAGCATTGTCTTGCATTAGGAGGAACCCAGGGCCAACCGCACCAGCATATGGTCTCACAAGGGGTCTGAGGATCTCATCTCGGTACCTAATGGCAGTCAGGCTACCTCTGGCGAGCACATGGAGGGCTGTGCGGCCCCCCCAAAGAAATGCCACCCCACACCATGACTGACCCACCGCCAAACCGGTCATGCTGGAGGATGTTGCAGGCAGCAGAACGTTCTCCACGGCGTCTCCAGACTCTGTCACGTCTGTCACAGCGTCGTGTAG\n>URS000112801C rRNA from 1 species \nTACAGAGGGTGCTAGCGTTGTTCGGAATTATTGGGCGTAAAGGGCGCGTAGGCGGCGCCACAAGTCACCTGTGAAAACTCTGGGCTCAACCCAGAGCCTGCAGGCGAAACTGTGGTGCTGGAGTATGGGAGAGGTGCGTGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGGGAGGAACACCTGTGGCGAAAGCGGCGCACTGGACCATAACTGACGCTGAGGCGCGAAAGCTAGGGGAGCAAACAGG\n>URS0000474C22 rRNA 
from 1 species \nGAGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAGCGGGGTTGAAGCGAGGGGTAACTCGAGTTTCTACCTAGCGGCGGACGGGTGAGTAACGCGTGGGCAACCTGCCTCAAGGACTGGGATAACAGCTCGAAAGGGCTGCTAATACCGGATAAGCCTATGGCCTCGCATGGGGCCATGAGCAAAGGGGAAACCCGCCTTGAGATGGGCCCGCGTCCCATCAGCTAGTTGGTGAGGTGAAGGCTCACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGGGGCAGCAGTGGGGAATCTTGCACAATGGGCGAAAGCCTGATGCAGCGACGCCGCGTGAGCGAAGAAGGCCTTCGGGTTGTAAAGCTCTGTCTGGAGGGACGAAGGAAGTGACGGTACCTCCGGAGGAAGCCACGGCTAACTACGTG\n>URS00019BDD9E misc_RNA from 3 species \nTAACCCTCAAGCCTAGCTTGGTATTGGAGTCGCTATACAGCGGCCCCTAAAATCAGTGGCGGTGCCTATAGGTTCTACGCGTAGTAATTTTTCTCGCTATAGATCCCTATAAGTGCTTGCCAACAACCCCAATTTTTTCA\n>URS0002519978 rRNA from 1 species \nATGTCTGGAAGCACGGGAGAACGTTCTTTTGCTGATATTATTACCAGTATTCGATACTGGGTTATTCATAGCATTACTATACCTTCCCTATTCATTGGTTTGTTATTTTTCAGTACATGTTTAGCTTATGACGTGTTTGGAAGTCCTAGGCCAAACGAGTATTTCACGGAAAGCCGACAAGGAATTCCATTAATAACCGACCGTTTTGATTCTTTAGAACAACTCGATGAATTTAGTAGATCCTTTTAG\n>URS000071DEB1 tRNA from 1 species \nGGGGGTGTAGCTCAGTGGTAGAGTGCTTGCCTGGTATGCATGAGGCCCCGGGTTCCAGCCCCT\n>URS0001088F60 rRNA from 1 species \nTACGAAGGGGGCTAGCGTTGCTCGGAATCACTGGGCGTAAAGCGCACGTAGGCGGATCGTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGGCGACCTTGAGTTCGGGGGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGATACTGACGCTGAGGCACGAAAGCGTGGGGAGCAAACAGG\n>URS00008DF95F rRNA from 1 species 
\nCGCAGGGCCTTGCGCTGGSGATGTTTCATTCAAATTTCTTGCCCTATCAACTGTCGATGGTAAGGTATTGGCTTACCATGGTTACAACGGGTGACGGAGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCTGACTCAGGGAGGTAGTGACAAGAAATAACAATACAGGGCTTTTCTAAGTCTTGTAATTGGAATGAGTACAACTTAAATCCTTTAACGAGGATCCATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCGGGACGGGCCGGCCGGTCCGCCGCAAGGCGTGTTACTGACCGGGCTGTTCTTCTTCGCAAAGACTGCATGTGCTCTTAGCTGAGTGTGTGTAGGACTTGTGACGTTTACTTTGAAAAAATTAGAGTGTTCAAAGCAGGCCAGCGCTTGAATACATAAGCATGGAATAATGGAATAGGACTTTGGTTCTATTTTGTTGGTTTCTGGAACCGAAGTAATGATTAAAAGGGACAGTTGGGGGCATTCGTATTTCGTTGTCAGAGGTGAAATTCTTGGATTTACGAAAGACGAACTACTGCGAAAGCATTTGCCAAGAATGTTTTCATTAATCAAGAACGAAAGTTAGAGGATCGAAGACGATCAGATACCGTCCTAGTTCTAACCATAAACGATGCCGACTAGGGATCAGAGAGTGTTATTGGATGACCTCTTTGGCACCTTATGGGAAACCAAAGTTTTTGGGTTCCGGGGGAAGTATGGTTGCAAAGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTCACCAGGTCCAGACATAGGAAGGATTGACAGATTGAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGGTTAATTCCGTTAACGAACGAGACCTTAACCTGCTAAATAGTTACGCGAATCCCGATTCGCGGCTAACTTCTTAGAGGGACTGTTGGTGTTCAACCAAAGTCAGGAAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGACGATGTCAACGAGTCTCTCCTTCGCCGAAAGGCGTGGGTAATCTTCTGAAACATCGTCGTGCTGGGGATAGATCATTGCAATTCTTGATCTTGAACGAGGAATTCCTAGTAAGCGCGAGTCATCAGCTCGCGTTGATTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTACTACCG\n>URS00023E717A lncRNA from 1 species \nAGTCCAAGCTACATTATTGGCGCTGGCAGGGCTAAAACGCCTAGATATGACAGAAAATGTCACTTCCATTCTTCCTATAGAGGATATGCTACCGGCAGTTGCTCAGGGAGCCATTGGTATTGCATGCAGAAGTGATGATGAGACAATGGTATTCACATCGTTTCTTCCATAAATATAGTTGCTTCTATTGCAGTTCTCTATTCGATGACGAGACAATGGTATTCACATCGTTTCTTCCATAAATATAGTTGCTTCTATTGCAGTTCTCTATTATTCTTTAATGAAAAACTTCAATCACAGGCCAATTACATTGCCTT\n>URS00007532CF rRNA from 1 species 
\nTGCTCAGGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAATGGATTAAGAGCTTGCTCTTATGAAGTTAGCGGCGGACGGGTGAGTAACACGTGGGTAACCTGCCCATAAGACTGGGATAACTCCGGGAAACCGGGGCTAATACCGGATAACATTTTGAACCGCATGGTTCGAAATTGAAAGGCGGCTTCGGCTGTCACTTATGGATGGACCCGCGTCGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGCTTTCGGGTCGTAAAACTCTGTTGTTAGGGAAGAACAAGTGCTAGTTGAATAAGCTGGCACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGCAGGTGGTTTCTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGAGACTTGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGAGATATGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACACTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGAGGGTTTCCGCCCTTTAGTGCTGAAGTTAACGCATTAAGCACTCCGCCTGGGGAGTACGGCCGCAAGGCTGAATCAG\n>URS000255B89B rRNA from 1 species \nATGGCGCCATCGACCAAGCTCTTCCTCCTGCTCCTCGGCTTGAACCTGATGGTCGCCGATGTGCACGGTGGCTGCGGAGCCCACTGCCCGACTCCGCCGCCACCGTCGACGACCAACGGCTCGTGTCCGATCGACACGCTGAAGCTGGGCGTGTGCGCCAAGGTGCTGAACCTGCTAAAGCTTGGGCTCGGTGTGCCGCACAGCGAGACGTGCTGCCCGCTGCTGGCCGGTCTGGCCGACCTGGACGCCGCGGTGTGCCTCTGCACCGCCACCAGGGCCAAGGTCCACGGCGTCATCAACCTCAACGTCCCCATCGACATAGTGCTCCTGCTCAACCAGTGCCACAAGACCTGCCCGCCCGGCTTCACCTGCCCGCTCTGA\n>URS00017EA271 rRNA from 1 species \nTACAGAGGTCTCAAGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGTGGCGTGGTAAGTCGGATGTGAAAGCCCCCGGCTCAACTGGGGAGGGTCATTCGATACTGTTCGACTCGAAGGCAGGAGAGGGAAGTGGAATTCCCGGTGTAGTGGTGAAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGACTTCCTGGCCTGTTCTTGACGCTGAGGCGCGAAAGCTAGGGGAGCAAACGGG\n>URS0001FED583 rRNA from 1 species 
\nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACAGACGAGGAGCTTGCTCCTCTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACATCGGGAAACCGGAGCTAATACCGGATAATATATTGAACCGCATGGTTCAATAGTGAAAGACGGTTTTGCTGTCACTTATAGATGGCTCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCGACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACAAATGTGTAAGTAACTATGCACGTCTTGACGGTACCTAAACAGAAAGCCACGGCTAACTACGTG\n>URS0002417CDE lncRNA from 1 species \nAGAGACAAAATCATTGGGACACCAAATCTGTTAAAGCAGGCATCACTCTTGTTTCAATGTGGTTTTCACAGCATCTCAATGCCGTTTCATGCTGTTTAGAAATCATAAACAGCTCTGGAGACGTGCCTCACTCAGTCGTGGGAATCTCCAGTCATCAATTCAGGAGACAATAACACCAAATTTGTTCAATGTGCGTTTAACAACATTCTGAAACGTCATAAGTAATGCAGGCTGTCTCGCATGCAGTCTTTCAGCACTGAAACGTTGTAGAGTCGAAGTGTATAGCGCTGCCTTAGTCCAGACAGCATGCTATTGTGAACTTGTCTCCAGTCAATTGGCTCGATAATTTTGAGCTCTCGTGCATGCAGCGGCATACATCTGAGGGACATGGACTTCCATGGGCCAACGATGAATATTACTCTATTTTCTCATAGGTCACAGCCACGGAAGAATGCGATGCCGCTCAATACGACCTTGGCCAACGATGAATATCACTCTATTTTTTCATAGGTCACAGCCTAGGAAGAACGCGATGCCGCTCAATACGACCTCTATGAGTGGTATTAGCACTTGGTGCTCATTCCCTTGAGGAAGGAAAGGTGACATTGCAAGGGCATATTGGCAAGCATATCGATGGCCATCAAATTTTCATTTTAAGGTTGCATTGCATTATATGATTTCAAGA\n>URS0002158408 rRNA from 1 species 
\nGGTTTCCTGGGCAAGGCTAATCCTCCCAGGGTCAGTCGGGGGCTAAGGCGAGGCCGGGAGGCGTAGCCGACGCGCAGCAGGCAGACATTCCTGCACCGCGCACGCGGCGCTACGACCGACGGGGCGACGGATGGGGGTGGCTCGGCGGGGTTCTGGACGTCCCCGTGATGGAGCGCGGCCCGCGGACCAGGGAAATCCGGTCCGCACGAGGGCGAGGCTCCGGACGAAGCGATTGAGCGAAGCGAGTGAGCCCGAGGTCCCTAGAAAAACCCCTAGGCAGGCGCGTGCGCGCCCGTACCGCAAACCGACACAGGTGGGTGGGTAGAACATACCGAGGCGATCGGGTCAACCATGGTCAAGGAACTCGGCACAATGGCCCCGTAACTTCGGGAGAAGGGGTGCCCGCGCGTACGTGAACCGGCTTGCCCGGGGAGCGGAGGCGGGCCGCAGTGGAGAGGCCCAAGCGACTGTTTACCAAAAACACAGGACTCTGCAGAAGCCGCAAGGCGACGTATAGGGTCTGACGCCTGCCCGGTGCCGGAAGGTCACGCGGAGGAGTTAGCCGTCAAGGCGAAGCCCCGAAGCCAAGCCCCGGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAAAGGCGCAACGACTTGGGCGCTGTCTCGACCATGGACCCGGTGAAATTGCACTGGTCGTGAAGATGCGACTTACCCGCGGAAGGACGGAAAGACCCCGTGAACCTTCACTGCAGCTTGGCATTGGCCGCTGGTCCCGCGTGTAGAGGATAGGCAGGAGGCACAGATCCGGAGGCGCCAGCCCCCGGGGAGCCGCCCTTGGAATACTGCCCTCGCGCGACCGGCGTCCTAACCCGAGGCCGTCAACCGGCTCGGGGACCGTGCCAGGCGGGCAGTTTGACTGGGGCGGTCGCCTCCTAAAGGGTAACGGAGGCGCGCGAAGGTCCGCTCGGGACGGTCGGCAACCGTCCTTTTGAATGCAAGAGTACAAGCGGGCTTGACTGCGAGGCCCACAAGCCGAGCAGGTGCGAAAGCAGGCTCTAGTGATCCGGCGGCCCCGAGTGGGTGGGCCGTCGCTCAACGGATAAAAGGTACTCCGGGGATAACAGGCTGATCTTGCCC\n>URS0000E09CF4 tRNA from 1 species \nGCCGGTGTAGCTCAATGGCTAGAGCACTTGACTGTGGATCAAGGGGTTATGGGTTCAAGTCCCGTCGCCGGTA\n>URS0000BDAE45 snRNA from 1 species \nGAATGTTGGGCTAATTTGGCTGAAGCACCTGTCAGCCTACTGATTGCCAGCATGGATTCAGCTGATCTAGCTGGCTAGGTGGGCGTCTCCTTCCTCCCTCACTGCTCTATGTGTAACCCTCCTGAAAGTGGTCAGAGGACACCTTTGTGGAATTGGTTCTTTCCTCTTTCCTTGGGTTCCAGGGGTCAAACTCAGGTCAGTAGGCTTACACAGAAAGCTCACCATCTCT\n>URS0000B28382 lncRNA from 8 species \nTGTAAACAAAACCAAAAAAAAAAAGGCATAAGATTAATAAAGATGTATTAAATACATAAGATTAACACATAAATTTCGTTATACAAAAGCATTTTGATAAACCGAACCAAATCATCTAGATAGGAAAATTGAAAACATGTGATTGAATATCTTGTTTTATACTTTATTTACATATAAAACTTTAAGAAACATGAAAGAGATATTTGGCAGATTTAATCATGCCAACAAAGATTGATTTATCTAATAAATATCTATTGTGTCCCTGGGTACTGGACATTGTTATTAGAGAAAAGAAATAATATGAAACCTCTACCGTAATATCATAGAGTCTAGGAAAGAAAATTCATCTATTCTTCTATCCAGATTAGACTAAGAG\n>URS0002201BE9 tRNA from 1 
species \nTCTCCTTTAGCTCAATAGTCAGAGCGTCCGGTTGTTAACCGGAGGGTTCTGGGTGCAAGTCCCAGGGGGAGAT\n>URS00014BEA7C rRNA from 1 species \nTACGGGGGGGGGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGGGCTCGTAGGTGGCCAACTAAGTCAGACGTGAAATCCCTCAGCTTAACTGGGGAACTGCGTCTGATACTGGATGGCTTGAGTTTGGGAGAGGGATGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAATACCGATGGCGAAGGCAGGTCTCTGGGCTGACACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGG\n>URS00023B1992 lncRNA from 1 species \nGACTACGAATCGACATTGTAGCTTAGGAAAGTTTCATTTCATCCGTGGATCCTGAAGAGCAAGGTATCCTCTCTCCGTCGTACCTTTTTTCACATCGATTCGTTATATATTTCTTGCATTTTTGAACTTAGGGTTTTCATGCAAATGTAGGATGCCGAGGCGTGGAAAAGCTAAGAAACTAAGGTAATCTCAACGCCCGTAGTTATGTTATATACTCATTGTTGTGTATCAAATGAAAAAACCTTAAATGTAGGTTTATTCCTAAGTGCGTTTGATTCATAGAACCAAATAAACAAAATTGTAGTTATGGCGCTAAGAAGACCGGAAATGCGTTCGATCCATTGCCTCTGCCTAGTGGTGTTCCAGTGCCGATGTGCTTTTGCGGCGATCCTTGCAAGGTAGCCAAGTCCGAAGAACATGCC\n>URS0001EBED66 rRNA from 1 species \nCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGGGGAGGAAGGGAGTAAAGTTAATACCTTTGCTCATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATCTGATACTGGCAAGCTTGAGTCTCGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACGAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCGACTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAGTCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCACGGAAGTTTTCAGAGATGAGAATGTGCCTTCGGGAACCGTGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGGTCCGGCCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGCGCATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGACCTCATAAAGTGCGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTGGATCAGAATGCCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTAGCTTAACCTTCGGGAGGGCGCTTACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGT
AACCGTAGGGGAACCTGCGGTTGGATCAC\n>URS00006566BF snoRNA from 5 species \nCTGCATGATGAACTCTTAATTTCGCTGTGTTCTTACCGAGGCACACTTTGAAGAAACAAAATATCACCTTGGAGAACTGACAC\n>URS00006E3F2F snoRNA from 1 species \nTATGCTGTGATGAGATTAAGCACCATAGGGTGTATTGGGCAGTGGAAGAAGGTTTAAAAGCCTTCTCCGTGAGCTTATTAATTAACGACTTCTCCTTCCACTGAGCATC\n>URS00000BBF13 rRNA from 1 species \nAGAGTTTGATCCTGGCTCAGGATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGAGATTTTATAAAATTACTTTTCGAAGGAAGTTTTATAGATAAAGCGGCGGACGGGTGAGTAACGCGTAGGCAACCTACCTTATACAAAGGGATAGCCTCGGGAAACTGGGATTAATACCTTATAATACTTTGGGATCGCATGATCCTAAAGTCAAAGATTTATCGGTATAAGATGGGCCTGCGTCTGATTAGCTAGTTGGTGGGGTAACGGCCTACCAAGGCAACGATCAGTAGCCGACCTGAGAGGGTAATCGGCCACATTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCAACGCCGCGTGAGCGATGAAGGCCTTCGGGTCGTAAAGCTCTGTCGTGAGATGGGAAAGAATGACGGTACAATAAGAGGAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAACGTTGTCCGGAATTACTGGGCGTAAAGGGCGAGTAGGTGGTTTGCTAAGTCAAAAGTGAAAGGCTACGGCTTAACCGTAGTAAGCCTTAGGAACTGTAAGTCTTGAGTGCAGGAGAGGAAAGCGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGACTTCCTGGCTTGTAACTGACACTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAGGTGTAGAGGGTATCGACCCCTTCTGTCGCAGCTAACGCAATAAGTATCCCACCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGACGCAACGCGAAGAACCTTACCAGGGCTTGACATCCTACGAATCCTTAGGAAACTAGGGAGTGCCCTTCGGGGGAACATCTAGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCATTAGTTGCTACGCAAGAGCACTCTAATGAAACTGCCGTTGACAAAACGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCAACACACGTACTACAATGGCCGATAACAACGGGAAGCAATACAGCGATGTGGAGCCAATCCCAAAAATCGGTCTCAGTTCGGATTGCAGGCTGCAACTCGCCTGCATGAAGCCGAAATCGCTAGTAATCGCAGGTCAGCATACTGCGGTGAATACGTTCCCGGGCCTTGTACACACC\n>URS0001DD25E8 rRNA from 1 species 
\nATTGAACGCTGGCGGCATGCTTTACACATGCAAGTCGAACGGCAGCACAGGGAGCTTGCTCCTGGGTGGCGAGTGGCGAACGGGTGAGTAATGTATCGGAACGTGCCTGGTAGTGGGGGATAACTACTCGAAAGAGTGGCTAATACCGCATGAGATCTTTGGATGAAAGCGGGGGACCTTCGGGCCTCGTGCTACTGGAGCGGCCGATATCAGATTAGGTTGTTGGTGGGGTAAAGGCCTACCAAGCCTGCGATCTGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATGTGGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGCAGGACGAAGGCCTTCGGGTTGTAAACTGCTTTTGTACAGAACGAAAAGTCTCTGGCTAATATCTAGAGATCATGACGGTACTGTAAGAATAAGCACCGGCTAACTACGTG\n>URS000170AD9B rRNA from 1 species \nTACGTAGGTGGCAAGCGTTTGTCCGGATTTACTGGGCGTAAAGAGCGCGCAGGCGGCTGGGCAAGTCCGATGTGAAAGCTTCCGGCTTAACTGGAAAATTGCATCGGAAACTGCTCGGCTTGAAGGTGGGAGAGGGTAGCGGAATTCCCGGTGTAGTGGTGAAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGGCTACCTGGCCCACTCTTGACGCTGAGGCGCGAAAGCTAGGGGAGCAAACGGG\n>URS000204CED6 rRNA from 1 species \nATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGGATGAAGGGAGCTTGCTCCTGGATTCAGCGGCGGACGGGTGAGTAATGCCTAGGAATCTGCCTGGTAGTGGGGGATAACGTCCGGAAACGGGCGCTAATACCGCATACGTCCTGAGGGAGAAAGTGGGGGATCTTCGGACCTCACGCTATCAGATGAGCCTAGGTCGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCGTAACTGGTCTGAGAGGATGATCAGTCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGTCTTCGGGTTGTAAGGCACTTTAAGTTGGGAGGAAGGGCAGTAAGTTAATACCTTGCTGTTTTGACGGTACCAACAGAATAAGCACCGGCTAACTTCGTG\n>URS0000E460B3 rRNA from 1 species 
\nCGGCGAGTGAAGCGGCAACAGCTCAAATTTGAAATCTGGCCTCGGCCCGAGTTGTAATTTGCAGAGGATGCTTTTGGTGCGGTGCCTTCCGAGTTCCCTGGAACGGGACGCCACAGAGGGTGAGAGCCCCGTATGGTTGGACACCAATCCTGTGTAAAGCTCCTTCGACGAGTCGAGTAGTTTGGGAATGCTGCTCTAAATGGGAGGTAAATCTCTTCTAAAGCTAAATACCGGCCAGAGACCGATAGCGCACAAGTAGAGTGATCGAAAGATGAAAAGCACCTTGAAAAGGGGGTTAAACAGTACGTGAAATTGTTGAAAGGGAAGCACTTGTGACCAGACTTGGGCCGGGCGGCTCATCAGGGGTTCTCCCCTGTGCATTCCGCCCGGTACAGGCCAGCATCGGTTCTTACCGGGGGATAAGAACGGCAGGAACGTGGCTCCCCCTCGGGGGAGTGTTATAGCCTGCCGTACGATACCCTGGCGGGGACCGAGGTTCGCGCTTCCGCAAGGATGCTGGCGTAATGGTTACTAGTGACCCGTCTTGAAACACGGACCAAGGAGTCGTCCATTAGAGCGAGCGTTTGGGTGTCAAACCCCCACGCGTAATGAAAGTGAAATTAGGTGAGAGCTTCGGCGCATCATCGACCGATCCTGATGTTCTCGGATGGATTTGAGTAAGAGTTTTAACGGACGGACCCGAAAGACAGTGAACTATGCTTGTATAGGGTGAAGCCAGAGGAAACTCTGGTGGAGGCTCGCAGCGGTTCTGACGTGCAAATCGAT\n>URS0000657173 tRNA from 1 species \nGGGGATATAGCTCAGCTGGTAAAGTGCTTGCCTTCCATGCATAAGACTCTGGATTCTATCCCCA\n>URS0001FC8B0A rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTAGAACGCTGAAGGAGGAGCTTGCTCTTCTGGATGAGTTGCGAACGGGTGAGTAACGCGTAGGTAACCTGCCTGGTAGCGGGGGATAACTATTGGAAACGATAGCTAATACCGCATAAAATTGATTATTGCATGATAGTCAATTAAAAGGTGCAATTGCATCACTACCAGATGGACCTGCGTTGTATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCAACGATACATAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGGAAGTCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGGTTTCGGATCGTGAAGCTCTGTTGTAAGAGAAGAACGAGTGTGAGAGTGGAAAGTTCACACTGTGACGGTATCTTACCAGAAAGGGACGGCTAACTACGTG\n>URS00009B8067 lncRNA from 7 species 
\nTTTGTAGCGGTGCCAGTGAAGAAGAGGACACATGAAGACTTAGCATTCCCTGCAGAAAACGCCCCTTCCCCGTGTGTGTGTGACAGCGTGTATGTAATGGCTTCTGATATCTGTGAAAGCTGCCAGGCAACAAACTTCTTCTACTGGAAATGTCCCCAGATCCACAGCAGGCACACATGTTCCCAAGGGACCAGGGGTTGTATGCATTCTGACTGTGTGCTTCTTGTTCTCTGTGGTAGGTCATGGGAAGAGCCCTTTTGATCAACTTGGAGGGCTCTTCAGCTAACCCCCCAATGGCTGCTTTGAACTTACTCAGGAAAGCCAGCCCCTGGAATATTGTGCAAGTCAACACTATCACTTCCTTAGGAAGGTTCTAGAACATCTCGAAAGGATATCAGTTTTCCTTACCTGCAAACAGAAAACAAACCCACTTTGTTTGTACTGAAGCTTAAAGCAAATGTGGCCAAGTGGGGCCAAACTGACTCAATAGGCAGTCTGTCATAGTCCAGTTCTGCCTCTGTGAAAAGTGTTAGGGCAACTGGGTTAAAATAGGGTTGGAGAAAGAGTCCAGAGCTAGAAAGAAGATATTTTTAGTATGTGAGGTTATCTAGGACTTAAGTTTCATAATTCAGTGCTGTGGAAATGGGAAAATGATTGAAAAGGTAGAAAGGAAATGACCTTAAGGACTGGGGTGAGGCACAGAAATCTGATTAAAGGTTGAAATCAGTGTTTCAGAATTCAGATTGCCTCAATTTTCCAAAATGGTCACTAAAGCATCTGATAAAACCCAGAATTCTTCGGCCAGCTGTGTGGATTAACAGGCCTGTCACAACATAAAAGGCTGGCATGTATATTGGCAGGTGGAGATTGTCACTGTAAAACTTAGCAGTTTCACTCCGAGGTTAGTCTATGGTGGTCAGTGCACTGTGAGGGGAATCCTTGTCCCTCCCTGGCAGCTAGCAAACATTCCTCTATTTACTATAATTGGAATCCTCCCTTCCCCTGCAGCAGGCCGTCAGCTCACCTCACACAGCCCAGTTTTCTCTTCATGTAGCATGTCCAGGCATGCTCCAGAGCTGGGTTTCCTGGCCTTCCCACACTCCCAGATCACAGTCTCTTACAACCATGCTTTTCAGGATCCAGGAAGTAGTAAGTGTGCTGGGAGATACCCAACTAACTGCAAGCTCACAAGCACCACATCTTCTTGAGACATCAGTTTTTCTTTCCAAATGATTTGAAGTCAAGAGATGACCATATTTTTTAATGGAACAAATGCTTATGTTATACAAGAGAATGTTCATACACCTAAAGTGCTAAACTAAAATAGGAAACTTGGAAGGAAACTCATATTTGTAAGTGGACAGTGATTCTATCTCCTCTGCTTGTGTGGTATTTCCATGTTCACTTTGAGATTTTGTCTGAACTGGATTCAGGCAGCCTTGGGGTTGCTGTTGATCAAGGTCTAGACTTCCAGATCCAAGGAGTCCACCTTGGAGTAGTACATCTCCCTTTTCCTGTCAGCCAGCTTGCCTGTGTACTTATCACAAAGCTTTAGGGGCAGCTAACATGTGTATGTACAGGATAGTTCTGAGGCAGAAACAGCATAGACTTATTGTAGGAGTCCTATTTATGTCATTGTTCAGCCCTGTGCATGCTAGAAAATGATTTATCCCTTTGAGGCCAGGAAACTGCCAAGCCACTCTGCTGTAGGCTAGGATTACTGAAACTCACCACACATACAAGGATATTGGGGCAGAGCGGAGTGTGAGATCTAAAAATATGTATACTTTCCCCAGCTGGTGGCTAGTAGATGGCTTAGACAATTTTGGTGTCTTACCATCTGTCTGCAAAGACTGGAGAATTTAATACATCTTGAGTTGACAACCTCCAGTGATATCCTGTTCTGCCAAAATTTTAAAAGAAGGGCCACTGTAGAAAGAGTGTAAACTATCACAAGATTGAAAAGACTTGACAGTTTGGAAGCTTGTCTTGTCTTTC
TCAGTAATCATTGATCTTTACATGTTGACCTTATATTAGCAATGAACAGATCATTGCCTCTCCACCCAATCATGCTATTTCTTTAAATCAGTATTTGGGGAATGCAAGCATTTATGCAGTGGTTATAAACAGAAATATAAGATTTGCCAACCTGTCTCTTTAAATTACCATCTCTCTGAAATCCTCAAGGAAAGCATTTTCCCTTTACTTAGTAAGGGTTTCAGATTCACTTTATGGGCTCCTGCTGTCTTCAACACTGATAAAACTTTAACCAGAAAAGCATTAAACACAGCACAGCAGCCCCTAGCCCAGATCCCTAAGTTCCTAGTGGCAGCATTTATCAATGTAAGAACAAGAATACTTTCTGTACTGGTATCAGCTTCGTCCTCAAAGCTATGACCTCTTACTTGGCCTTGTGCCCCATAGTGAACGAAGCTTCTTGCCTTTCCAGGTCAGTGTGAGTTAAGATTGTCAGAGTTGTATGTGTCCTGACAGACTGTGGACAGCAGGGTTTGCCCAAATCATCAAGTGATACAGGTAATGAATGTCTCTAAAATAAGTTGGGTCCTCCAAACAAGTCCTGGATACCTTCTGAATGTTAAGTTTCTGAGTGCTGAGAGTAATTTGTTCATTGGTTTGGTTTGATACCGTTATATCTATCTAGGGCAGTTCCAAGAAGTGCTTGACTTCTCAGCTCTAACAGCCAGTAAGAGTAAGTAACCTTAGTACAGGCAATGAGCCTCTGTAGATGTGCAGAGGACAAGTCACTTGTCTGTAGTTGCTAACAAACAATGGAACCAGTTTTGAGCACAGCACTCCCTGCTCTGCAGTCAGCCCTCTGCCCCACACCATGACTCACCTACAGATTGAGAGAGAGAAAGGCTTTCAGTTCCCCCAGTGTAGTATGCCCATTCACACTCGGAATTCTTTTTCAAAGACATCAAGATGGCCTTAGTACTCTGCTCTAGTAGATGTTGTAAGTATTCATTGTTCCTTCCAGGAGCTGGATTTTTGGTACAGTCCCCACAAAGGAAAATAAAGGCCTTCAAGAGTGTAAAGTTTTTAGACAGAGTTGGAGGTAATGGTAGTCTTCTAACATTATCTAAATATCTCCTGCTTCATTACTATAGAAAGCAACTCTTCATGTTTTAGGAAACCCAGCTACCATGTTTGTACTCTGAGAAGGTGCCAATACAAATCACTAATTTTGGACTCCCTTCCTGGAGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTAAATGAGAATGAGATTTGTACACACCCACATATTCTATACCACTTAATTAAGAGTTAAGTGAAGTTCAAAGCAGCCCCTGGTGATCTTACTTAACACCACAAAGTTTTCTACTAGGTCCATGAAAGTATAAACAGATAATTGGAGTGTGACTGCTGGCTTTCCAGAATAACCCACTTGTGGTAGATGTCAACTCTTACAGCTCCAAGCCAAGGTGACGACAACCCAGCCCTCTTCCACCATGTCTAATAACATGGGACATGGTAGATGCCTTGTCATTTGGTGACCTGGATCTGGGCCCGAGTTTAGAGCTGCAGAATTTATAACCTTGTAGTAGTCAGTGGTCTAAGAAGTCCTCTCTCCCCACAGAGAAAATGTCTTGCTGATTCCTGATATTCTACTCTCATAAGCTGTTCAGTACACACTTCTCAGTCAATTGGTTGCTTGTTTACTATGTGCTGAGCACATCTAGATTTTTTGTTTGTTTAAAGTTAAAAGTCCCATTATAAATCAAGTCTAACCCTGCCCTAAGAGAAAAGACCCACAGAGACTGCACATCTCACTGACGCTGCCTTCACCCATTAGTGTTTGAGGCCCACCATCCTATGGAGCCAGGTATTCCCACATCATTCAGATCACTGGTGTTTCCCATTACTGTTTGAGGCTGAGCAGAAACACTAACAAGGACCAGAGCAGGAACGGGAAAATAAATGAAGACACT
TGGAGTGCACTGTTGAGAAAATAGCCAGAGTCCATGCTGGGCTTGATGTGGCTTTAGGGGACCAATCATATATACTTTATGGAAGTTAAACCTGACCAGTCTTTACAGTGACAGGCCACAGCGCGTGAGTGGGTAGAACCAACAAATCCATTGTCTTCTGCCTGTTTTTGTGTGCACAGTCACATTCCCTCCTTAGTCATCTTCCCCTTCCACTCTTTACACTAAACAAGGGAACACTCAATCTTTCAAGGGAATTACATATCTGAGTTAATGTTTCAGTATATCATTTTCATACTGTAAATTATTTTGTAAGAGAGATTTACTGCTATCCCAGGATGTTCGGACTTGGCGCCCCTGTGCATTTGGAAATCAATAAACTATTACTGGAAATACC\n>URS0001E92C0D rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGACGCTCTTCCTTCGGTGAGGTGACGGAGCGGCGAACGGGTGAGTAACACGTGGGCAACCTGCCCCTAGCTCTTGGACAACACCGGGAAACCCGTGCTCATACCGGATACGGCATCGAGCGGCACCTCTCGGTGGGTAAAAAGTTTTCGGGTAGGGATGGGCCCGCGGCCTATCTGCTTGTGGGGGGGGGGTTGTCGCACCCAGGGGCGGACGGGGGGCCGGGCTGGGAGGGCGGCCAGACAGACAGGGACTGAGACACGGCCCAGCCTCCGACGGGAGGAGGGAGGGGGGAAGATTGAGGAACGGGCGAAAGCCGGACGAAGCGAGGCCGCGGGAGGGATGCCGGCCTTCGGGTTGTAACTCTCTTTAAGCAGGGACGAATTCAGACGGTACCTGCAGAAGAAGCACCGGCCAACTACGTG\n>URS00002FCF40 rRNA from 1 species \nTAAGTCACTTTGTCTTAATGGCAAATGTGAGATGCAGTGTATGGAATATCTTAATATCTAGTATGAGAAATTAACGATTTAAGTCCTTCTTAAAAGAGGCCATTTACCCATAGAGGGTGCCAGGCCCGTATAACGTTAATGATTACTAGAAAGATATTTCCAAAGAGTCGTGTTGCTTGATAGTGCAGCACTAAGTGGGTGGTAAACTCCATCTAAAACTAAATATAACCATGAGACCGATAGTAAACAAGTACCGTGAGGGAAAGTTGAAAAGAACTCTGAATAGAGAGTTAAATAGTACGTGAAACTGCTTAGAGGTTAAGCCCGATGAACCTGAATATCCATTATGAAAAATTCATCATTATATATGTAATATTAATTGATTAATATTATAATAATAGTGTGCATTTTTTTCATATAAGGACATTGTAATCTATTAACATAAAAAGTATTTATCAAAAGATCATTGGCTTTAAGTTTATTTTAATTAATTTGCTTTATTGCTTTTTAACATTAAATAAATGCCTAATGATTTGATAAAGTGTTGATAGATTTATTATATATAATGCTTAAATTCATTTTGAATTTTACAATAATGTTATAAACATTGATTTAAAAATTAATGTACGTNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNCTTGAAACACGGACCAAGGAGTCTAACATATGTGCAAGTCATTGGGTTATATATATAAACCTAATGGAGTAATTAACTTAACTAATTTAATGGGATTAATTTTTAGTCTATTTATAATAGTCTATTAATTCAATCCCGGGGCGTTCTATATAGTTATGTATAATAATAATTTATTATTATTTATACCTCTAACTGGAGCGTACCTTGAGCATATATGCTGTGACCCGAAAGATGGTGAACTATACTTGATCAGGTTGAAGTCAGGGGAAACCCTGATGGAAGACCGAAACAGTTCTGACGTGCAAATCGATTGTCAGAATTGAGTATAGGGGCGAAAGACCAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAG
GATAGCTGGTGCATTTATATATTATGTAAAATAATCTTATCTGGTAAAGCGAATGATTAGAGGCCTTAGGGTCGAAACGACCTTAACCTATTCTCAAACTTTAAATGGGTAAGAACCTCACCTTTCTTGATATGAAGGTTGAGGTTATGATATAATGTGCCCAGTGGGCCACTTTTGGTAAGCAGAACTGGCGCTGTGGGATGAACCAAACGTAATGTTACGGTGCCTAAATTAACAACTCATGCAGATACCATGAAAGGCGTTGGTTGCTTAAAACAGCAGGACGGTGGACATGGAAGTCGTAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAAGCAACTAGCCCTTAAAATGGATGGCGCTTAAGTTGTATACCTATACATTACCGCTAAAGTAGATGATTTATAATACAATTTCGATTGAATTATAAATTTTGAAACTTTAGTGAGTAGGAGGGTACAATGGTGTGCTTAGAAGTGTTGGGCGTAAGCCTGCATGGAGCCGCTATTGGAACACATCTTGGTGGTAGTAGCAAATAATCGAATGAGACCTTGGAGGACTGAAGTGGAGAAGGGTTTCGTGTGAACAGTGGTTGATCACGAGTTAGTCGGTCCTAAGTTCAAGGCGAAAGCCGAAAATTTTCAAGTTTTAATGCAAAGAAATAACCAAACAATTAAAAAAAAAAAAAGAAAAAAGTAAACTTAAAGAAAATGAAAAGAACAATTTTAAAACTTTATTAATAAAAAAATAATTAATTACTACTATGTTTTTTCATTTTTTGTTTAACTTTTTTTCTTTTTTTTTAAATTGAAATTTTTGAATTTTTAAACACTTGAATAATTTTGAACGAAAGGGAATACGGTTCCAATTCCGTAACCTGTTGAGTATCCGTTTGTTATTAAAAATGGGCCTTGTGCTCATCCTGGCAACAGGAACGACCATAAAGAAGCCGTCGAGAGATATCGGAAGAGTTTTCTTTTCTGTTTTATAGTCGTACTACCATGGAAGTCTTTCGAAGAGAGATATGGTAGATGGACTAGAAGAGCATGACATTTACTGTTGTGTCGATATTTTCTCCTCGGACCTTGAAAATTTATGGTGGGGTCACGCAAACTTCTCAACAGGCCGTACCGATATCCGCAGCTGGTCTCCAAGGTGAAGAGTCTCTAGTCGATAGAATAATGTAGGTAAGGGAAGTCGGCAAATTAGATCCGTAACTTCGGGATAAGGATTGGCTCTGAAGATTGAGATAGTCGGGCTTGATTGGGAAGCAATACCATGGTTTATGTACTCGTTCTGGGTAAATAGAAAATTTCGATTTTTGTTCCCCGGATAGTAGTTACGTAGCCAATTGTGGAACTTTCTTGCTAAAATTTTTAAAGTTATATACATTTAATAAAATGTATATTCTTTTTAAATTATAACGATTATCAATTAACAATCAATTCAGAACTGGCACGGACTTGGGGAATCCGACTGTCTAATTAAAACAAAGCATTGTGATGGCCCTAACGGGTGTTGACACAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAAGTAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTATCTACTATCCAGCGAACCACAGCCAAGGGAACGGGCTTGGAATAATTAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCTGGCAGTGTAAGGAGACATAAGAGGTGTAGCATAAGTGGGAGATATATAATTTCGATTATTTATCACCAATGAAATACCACTACTCTTATTGTTTCCTTACTTACTTGATTAAGTGGAACGTGTATCATTGCTTAGCCATATTAAGGATTTATTTATAAGTCTTATGGTATTGGGTTTTGATGCAAGCTTCTTGATCAAAGTATCACGAGTTTGTTATATAATTG
TAAACATATTTTAATGAAATGATAACATTTCGGTGTTATTATAATAATTAAAATTTGGTATAACTCCAACACTCAGGTATGATCCAATTCAAGGACATTGCCAGGTGGGGAGTTTGACTGGGGCGGTACATCTCTCAAATAATAACGGAGGTGTCCCAAGGCCAGCTCAGTGCGGACAGAAACCACACATAGAGCAAAAGGGCAAATGCTGACTTGATCTCGGTGTTCAGTACACACAGAGACAGCAAAAGCTCGGCCTATCGATCCTTTTGGTTTAAAGAGTTTTTAACAAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCGGCCAAGCGTTCATAGCGACGTCGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAAAATTCACCAAGCGTTGGATTGTTCACCCATTCAAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTAATGACAATTATTATTGCGACAGCATTCCTGCGTAGTACGAGAGGAACCGCAGGTACGGACCAATGGTACAATACTTGTTCGAGCGAACAGTGGTATGATGCTACGTCCGTTGGATTATGCCTGAACGCCTCTAAGGTCGTATCCGTGCTGGACTGCAATGATAAATATGGGGCAATTGCATTGTATGGCTTCTCTAAACCATTTAAAGTTTATAAATTTTATTTATAAACGACAATGGATATATGTGATGCCAATGTTATTTATAACATAGCAAATGCGGGAGGATCAAATATCACCTGTATGACGCGCTAGTTATATATAAAAACATTATTTAATACAATGACAATGCCTAGAATCAATTGTAAACGACTTTG\n>URS0000ADD968 rRNA from 1 species \nATTGAACGCTGGCGGCATGCCTTACACATGCAAGTCGAACGGCAGCACGGGAGCAATCCTGGTGGCGAGTGGCGAACGGGTGAGTAATACATCGGAACGTGCCCAATCGTGGGGGATAACGCAGCGAAAGCTGTGCTAATACCGCATACGATCTACGGATGAAAGCAGGGGATCGCAAGACCTTGCGCGAATGGAGCGGCCGATGGCAGATTAGGTAGTTGGTGAGGTAAAGGCTCACCAAGCCGTCGATCTGTAGCTGGTCTGAGAGGACGACCAGCTACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGCAGGATGAAGGCCTTCGGGTTGTAAACTGCTTTTGTACGGAACGAAACGGCCTTTTCTAATAAAGAGGGCTAATGACGGTACCGTAAGAATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTATGTAAGACAGTTGTGAAATCCCCGGGCTCAACCTGGGAACTGCATCTGTGACTGCATAGCTAGAGTACGGTAGAGGGGGATGGAATTCCGCGTGTAGCAGTGAAATGCGTAGATATGCGGAGGAACACCGATGGCGAAGGCAATCCCCTGGACCTGTACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGG\n>URS0001CBEDC2 rRNA from 1 species 
\nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACAGATGAGGAGCTTGCTTCTCTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATATTGAACCGCATGGTTCAATAGTGAAAGACGGTTTTGCTGTCACTTATAGATGGATCCGCGCTGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACATATGTGTAAGTAACTGTGCACGTCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTG\n>URS00020C5C01 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTTGAGCGATGAAGATTGGTGCTTGCACCAATTTGAAGAGCAGCGAACGGGTGAGTAACGCGTGGGGAATCTGCCTTTGAGCGGGGGACAACATTTGGAAACGAATGCTAATACCGCATAACAACTTTAAACATAAGTTTTAAGTTTGAAAGATGCAATTGCATCACTCAAAGATGATCCCGCGTTGTATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCGATGATACATAGCCGACCTGAGAGGGTGATCGGCCACAGTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGAAAGTCTGACCGAGCAACGCCGCGCGAGTGAAGAAGGTTTTCGGATCGTAAAACTCTGTTGGTAGAGAAGAACGTTGGTGAGAGTGGAAAGCTCATCAAGTGACGGTAACTACCCAGAAAGGGACGGCTAACTACGTG\n>URS00025F86BA lncRNA from 1 species 
\nTGCGAATCATAGACGGCGCGACATCATAGTCTTCCCTCATGGCAGCCTTTTGGCGCGAAGAAAAGGAAAGTTTGAAAAAATTACCATATCTTTGAACTGTTTTAATAAAGCAAGAAATTATATTGTGCAAATCTGGATGCAAGATAAAGAAACTCTTTGATTTTGTTCATTCTACATTATTTATCAGTTGAAGATCTGTAGTATGATGACACCGTCGATGGAATGTTCGATCAAATCTTTCTGGGTCTTGTCCGTTAACAGGAGCACGGAGATGTGAAGGCATGGAAGTGGGGATGATGTCCTTAAAGAGGCACGGTATTAATCCTGGAGGACTACTTTGGTGGACGGACGTTGGAAGACAACTGATTTCAGGTGTTTTTTCCGTTTTCTCTTGTTATTCCTCTTGGGTTTTTTCCATGAGGTCAGGTGGTTGTTGTTAATGGTCTGGCGTCCAATATGAGCACTCTATCGAAAGTTCCGGGTGACACATCGCTGACTAGCTGGATCCTCCTCAACAAGGAAACAACTCCGTGGGAAATAAATTTTATGGCTTTTAGCCTAACTTGATAAAACGCTCAAAGTTAAGAATTTTTTTAATAATGAAAGTTTAAAATAACACTTTATGGGGAGTCTGTCCCTCACATATATTTAATAATATATTAATTTGTTTAGAGACAGATTAACAACTTGCCTATGATAGAGATTAAAGTATAAATAACTGGAATTTTCATTTTACTTTCATCATTGAAAAAAAACACTATATACATCATGAAAACATTTATCATGGTTGATTAGATTTTTCTATTAATTAAATATTGAAAAATTACTCTTCAAAGCTTTTCCTTAACATATGATTAGTAGCAGTGGTTATTTTTGTGTTACTTGAGTCATTATCAGTTCAGTTTATGTTTAATTCATTTACCTTTCTTATTTTGCTGACAATTAAGTTATCTCTAGGAATGGATCATTTTCATTTTTCTGCTAATTCAGCTTTCTTTGGAAATGAAAATCCTTGTACTTTCGGTCCAGTCAGATAGTTGCCTTTACGCAGGGGCGCCACTAGCTGTTTGAACGCCCGCGTGCAATACCGATTATGTTGCCCCCTGTTTAACTACGATTACTTATGCTGAGCTTGCCAGAAAGGCTCTTTGCCGCCCCCTGGACGTGCCGCCCGCGTGCGGTGCACGTCTTGCACGCCCGCTTACGGCGGCCCTGCCTTTACAATCGGTTATACAGCACTTGTATGGGCATTTTGCATGACCTTATCACATTTACAAATCCCTAATATTTATAAAATGCTTTTGTAACACAGTCAACAAACAAAAAAACCCAAATATTCTAAGAAAATTATCCAATATTTCAATTTAATTACAATAATTGAAAGCATGAGAACTTAACAGCATATGGCTACTATTGTAATAGACAACAATTACCCCATGAGCACTCAGGCCTGATTATGTAGGTGGCATTAATTAGTTTTACCTTTAACATGGAGAAGACCTCATGCGTCCACTTTTGTTAAAGACATGGTATGCACCTTGATCCTGAAACTCACTGAAATGGGATTAAAATTCCAATAGTCAATGAGGCCATGGCTATCAAGGCCTGTTCTTAGCTTCTTGATCCCATTGGAGTGTGTCAAGGCAGTTTCATGATAATGTTGATTAGGGGCTGTTACAGACCATGGAATATCATTTATTACGTATGAGTTAGAGTGGAAAAAAATAAAAAATAATTTATTGTCACACTTATCTTTCAAAAGTCTATGTCATATCTATAAGACTGTGATTTTATTTAACTATTCTTGAGAAAATTTATTATTTTTTGCTATTAAAAATATAAAATAGTAAAAATATGCTTTACTCAAAAACTCATTTGCACATGTATGAAGCCAACTGCATTTAAAGGAAAAAAGCTTCATTGTTTTTTTAAAGGAATAATTACATAATAGATTAAGATATTTTTAATATCTTTCTTGTTACAGGTGTATGGTTTGTT
TACACTTTTATTTATCTTGTCACTATTTTTTTGGCAGTGGTTAAGAAGTAATATTTTACATAATCTTGAAATTAATAGATTGGTGATTTCTTTTGGGTGAGTCTCCCTGCCACATCCACATTGAAGCCAAGGGATGAGACACACACAATGCTTTAGTTGCATTCTCAATTTAAACAAAATTTTTTGTTGCATTGGTAATTTGTCTATGTGATTTTTCACAGCTAGGACCATTCCAGTAAGTCTGAGTTGAGGATAATGGAAGCTTCTTGTCCTGAAATCTAATCATGTCGTTTGTTGATGATGATGTCTGGCTCTCTATAAAATTTTCTGTAGCCTGTCTGCATTTGTGTGTCTAGCACAACATGACACAGATAGCCTGCTACTATACCAGTGGCCCAGAAAAGTGAGATATAGGGAAATAACATTGAAAATCAACCAATATAAAATTACAACTGCCTGACTATTTAAAAGGCTACTGATGTTCAGCTTGCATTAATTATGAAAATTGAAACTTATTGGTTCAAGAATTATTAAGTTTCAATAGGTAAATGTTAAAAACAAAAAAAAATCTACTAATCCATGGATATAAAAAAGAATTTATTTTAAA\n>URS0001859E2D rRNA from 1 species \nTACATGGGGTGCAAACGTTGCTCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGTTACTCAAGTCGGATGTGAAAGCCCTCGGCTTAACTGAGGAAGTGCACCCGAAACTGAGTAGCTAGAGTACCAAAGAGGGTCGCGGAATTCCCGGTGTAGAGGTGAAATTCGTAGATATCGGGAGGAACACCGATGGCGAAGGCAGCCCCCTGGGTCAACACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGG\n>URS0002165809 rRNA from 1 species \nGGGGAACCGCCTGAACTGAAACATCTAAGTAGGGCGAGGAAGAGACATCAAACGAGATTCCGTAAGTAGTGGCGAGCGAACGCGGAAGAGGGCAAACCGAAGGTAGAAATACCTTCGGGGTACGGAGCGCATTTAAGACTCAAGTTGTTAACCGAACGGCATGGGAAGGCCGGTCAGAGAGTGTGAGAACCACGTAGGTGAAAACGGAAAGAGCTGCGCAGATTCCAGAGTACGGCCAGACACGTGAAACCTGGTCGGAAGATGGGGGGACCACCCTCCAACCCTAAATACTACCCAGTGACCGATAGCGTATAGTACTGTGAAGGAAAGGTGAAAAGCACCCCGGGAGGGGAGTGAAAAAGAACCTGAAACCCTGTGCCTACAAGCACCTAGAGCACGTCAAAGTGTGATAGGGTACTTTTTGTAGAACGGTCCGGCGAGCGATTGTATGCAGCAAGGTTAAGGACTTAAGGTCTGGAGCCGAAGCGAAAGCGAGTTTGAAAAGGGCGTTAAGTTGCATATAATGGGCCCGAAACCGGGTGACCTACCCATGGTCAGGTTGAAGTGGAAGTAAAATTCCATGGAGGACCGAACCGACCTCCGTTGAAAAGGCGGCGGATGAACTGTGGGTAGCGGAGAAATTCCAATCGAACCCGGAGATAGCTGGTTCTCCCCGAAATAGTTTTAGGACTAGCCTCAAGTTAGATACCTGGAGGTAAAGCACTGAATAGCCTAGCGGCCGAGAGGTTAGCGAAGCTTATCAAACTCAGAATGCCAGAGTATTGATGCTTGGGAGTCAGACAGTGTCAGATAAATGTCATTGTCAAAAGGGAAACAGCCCAGATCTACAGCTAAGGTCCCAAAGTCAGGTTAAGTGGAAAACGATGTGAAGATACGCAGACAACCAGGATGTTGGCTCAGAAGCAGCCACTCATTCAAAGAGTGCGTAATAGCTCACTGGTCGAGCGTCTTTGCGCGGAGAATTTAACGGGGCTAAACCTGACACCGAAGCTTAGGCAATCCAGTAATGGATTGGGTAGGGGAGCGTTGTATACGCGGAGA
AACAGTAGCGTAAGCGGCTGTGGAGTGTATAGAAGTGAGAATGCCGGAATGAGTAGCGCGAATGCAGTGAGAATCTGCATGGCCGAAAGCCTCAGGTTTTTGGAGGAAGGTTCGTCCGCTCCAAGTTAGTCGGGAGCTAAGGTGAGGCCGGAAGGCGTAGCCGATGCACAGACGGTAGAGATTCCGTCACCACCAAAAGAGTTAAGCACAGGGACACATTTGAAGTCTCAGAGCCGGGTGTTGGTTCCGGTAGAGATCGAGGGAAGTTAGTACCGAAGTCTGGGATGGAAGATGGCGAGAAAAGCTGTGTGTATTTCTGAGGTGCCCGTACCGCAAACCGACACAGGTAGGTAGGAAGAAGATTCTAAGGCCAACGGGAGAAGGGTTGTTAAGGAACTCGGCAAATTGACCCCGTAACTTCGGGAGAAGGGGTGCTCCAGAGATGGAGCCGCAGAGAATCGGCCCAAGCAACTGTTTACCAAAAACACAGGTTTGTGCTAAATCGAAAGATGACGTATACGAGCTGACGCCTGCCCGGTGCTGGAAGGTTAAGAGGAGATGTGCAAGCATTGAATCGAAGCCCCAGTGAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCAGGTAAGTTCTGACCCGCA\n>URS000003CBAA rRNA from 1 species \nGTTTCTGCTCAATGGAACTCTAAATAGCCGCAGTACTCTGACTGTGCAAAGGTAGCATAATCAATTGGCCTCTAATTAAGGTCTGGAATGAACGAACTTATGGGTAGCAACTGTCTTAAAATAGTTAATTAAATTGATTAATAAGTGCAAATACTTATTCAGTTACATTAGACGAGAAGACCCTAGAAACTTATAATTATTTTGTTGGGGCGACAGAATTACATAAAAACTAATTTTATTTTACAAGACGTAAAGCAGAAAGAAAAAGTTACTCTAGGGATAACAGCATAATTTTTAATAGCTTGTGACCTCGATGTTGGACTAGGTAGATAGTTTTTTAGAAGAAAGCTTTCTTGGCTCTGTTCGAGCAATTTTAACCT\n>URS0001415BDF rRNA from 1 species \nTACGGGGGGGGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGGGTTCGTAGGTGGCTTGTTAAGTCAGACGTGAAATCCCTCGGCTCAACCGGGGAACTGCGTCTGAGACTGATGAGCTCGAGTGCAGGAGAGGAACGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCGGTGGCGAAGGCGGCGTTCTGGACTGACACTGACGCTGAGGCGCGAAAGCTAGGGTAGCAAACGGG\n>URS00008DF9B1 rRNA from 1 species \nATACGTAGGGAGCAAGCGTTATCCGGATTACTGGGTGTAAAGGGAGTGTAGGCGGGAGTTACAAGTCAGATGTGAAAACTGTGGGCTCAACTCACAGATTGCATTTGAAACTGTAGTTCTTGAGTGAAGTAGAGGTAAGTGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACATCAGTGGCGAAGGCGACTTACTGGGCTTTAACTGTACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGATTACTAGGTGTGGGGGGACTGACCCCTTCCGTGCCGGAGCAAACGCAATAAGTAATCCACCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTGACGGGGCCCCACAAGCAGTGGAGTATGTGGTTTAATTC\n>URS0001F9E606 misc_RNA from 1 species 
\nAAGTCGTAACAAGGTAACCGTAGGTGAACCTGCGGTTGGATCATTAAAAAAAATTGAAGCTTCAACCCTTTCAAGGGTAGAAGCGTCAGTGCTCCTCTAACAAGGAGCTTGACTACTCCAATTTTGTGAACTTGCAACCAAAAAATGTTTTGATAGTGGTGAAAGATTTGGGCATTACCCGCCCAAGTTTTTCCCTTCTTGAAAAAATTGTTAACCCTGAAGAAATAACTTGTCTTTACCGTTTTTTATAAATAAAAATTAATAAACAACTTTTGACAACGGATCTCTAGGCTCTC\n>URS00023BEA17 lncRNA from 1 species \nGTAAAGGCTGCACAGGAATCGATGGAAGATGCTTGAAAAGCCTCATTCCCAGAAACATCTCCAGCTGCTTTTGCCGTGAACTATCAACCATTGCATTTTTATATCTTCTCTGTAAGGTAATTTTCATGTTTTTCTGTGCTGCAGAAAACTGTTTAAACGCTCCTGACTCTTCACTGAAGATATTGAGAACTTGGCTGTGCATAGCTTTTGAGCCAGTATAGAGAGTTGCATGGATATCACCTTGTTGCAGAAAAAGATCTGCGAGCTCAGACACAGGAGACAAGATAGTTGATCTCTTAAACTCCTCAAACCTCATGTCAAGTCTCTTCCATGGTTTATCAGGACATGGATGACTCCATGTTGTTGTCTTAGTATTGTGATCAATAAAATAAGATTTTCCAGTGACTGCATCAGCTCTTTTCTCCCATCCCGGTGGAAGCGGAGCAGTATAGCTACTCCCAGAATTATAACCATATCCAATATCAGTATCAAGTGATATCCCCAGCCTTCTACATTGCTCAACGAACACTTGAAGACCTATAGAAGTAGCAGAGCCATCAGCAAGACTTCCACCTCCATTCGCGTTGTCCCTGGAGTAGGATTTTGAAAGCAGAACCGCTCCTCTTCCGGCACAACAAGACTTGCAAGCTTTCTTCCTACACTGTAAACATAAGAACACTGAGCCTGGCTCTCCCCCCAAACTCTTGGTAGTAGATCCAACTGAATTTTTGTTGACCTCGGCTCTGACTTGACACACTCCACCGTTACAACCCTCACCAATTCCGTTAATATTCCAGAAATCTATCACACTATTTTCCAGCTTCTCTAAATCAATAGAAGCTATAAGTTTATCTTCAAGAGAAGCCTGGCCAAGAACTGCAAGTGCATTTGCTATTCTGCATAATCTTCCAATATATAACTCGTCGTGTGAAGAGTTCGGATTAATTGTAGCAGGATCAATTCCAATTGATAACAGTGCCCTATCTCTTTCTGCTGCAGAAATATTCAGACGTAGCCGTTCAATTTCAAGTTTAATAGCTTCTATAAACTCAAGCTTCCTTCCCTGTATTATAATAGACATGCAGAAATTAAGTTTACAATTAAAATGGCAGTTTAAGAGGACATATAACATCTGAGATGAATAGCTGAACCAAGAAAGGAGTCATAAGATCAGAAATGGTATGTGACAAGATGAAGTAACATACCATGTTTGGACCCATAACGGACTTCAGACAATTTAAGTACAGATGAGAACCACTCTCTCTAGAACTTTTATCTTGTGAAGAAGACATGCTGGGAACAGTTTCAGGACCACTATATTGAACAACTGCTTGGTCTAAGAAATCAAGCATGTCATTTCCTCCACTTGCAACACATTCCACCGCTGGTTGTGGGAAGGGGTCAGAAGCAGAAACCTCTCCTGTCAAAAGGTCAAGCAGATTACTAGGAAACGGATCATTCTGTTGTACTGGTGTGGACACAGTTTCAGCCTGTAAAGATTTTGCGGCAAAAGGATTCGAGTCAGAACAAGATGAAAAAGGAACTTCATCTTCTTTTGTTTTCCCTGCAATCTCAGCCAATCTTCCTCCGGTACGTTCGCTAGTAAACATTCCTTTCCATGGAAGAGAAACTCCAAGGACTTCTATCTGTATCACAAACAC
AATGCAGAAGAAGTTTTGTTTTAAACTGTTTTGCTTTCATGTTGGCTAGTCATACTATTAGATAAATCATTAATTTTAGTCCAGAAAGTAGTTATTACCTGACCAAGAGTCATGGGGATTTTAAGAGAACCAGCTGGATAAAATGTAACAGAAACTACACGGGTCAAGAAATCCAGTTGTCCTTCTAGTTCTTCAAAATCATACAGCAGTGAAAGACTTGACGTATCTTTTTCATGGAGACGCGCACCAGCTCCAGTAATAGCAATATCCTCATCACGAATTGGCCCTGGTAAGGGTATCAGAAGATTTGTACCATTCGCACACCGCGGTATCGAAGCATCCTGTCCAAAAACCAGAAATACAGACAATCGTCATCCAGTTGAACTAGCTTGCATGCACGTCTACATGATACAATAAAAGAGAAGGGACAAGAGAGTCAGTCAACCTGAACAACTAATTTAAGGTCCTCTAAGTGGCGTCCAGTTTTCACGTTCACAGTGGATGGACATGTCAAATCATCCGCACCGTGTGATATTGTCAGTACAAGTTGACATACATGGCAAGGCTCACTGAGGTAGATAACTAACTCAACAGCATCTGCAGCTTGTGGACATAGCTGCAAAGTATATAAAAAGCAGGGGAAACTTTTAGCTCAAATTTTTGAGGGATGAGAACAAAGAGGTAATGTTTTATCCAAAAGGAGGTACCCAAGTTATGTCCTTCGTCTTGATACTCAGCAGACTGGACCCATCATTGGAAGTCTCAGACATGCTCGGTACAGGTTTCAGAAAGAAACCACCTGGCCGAGAAAGTACCTGACATGAAAAAAAGTTCCAGTGAGCAGTAACATTAACATAGCTGCAGTGAAAAATTGTATTAGTTTGCTTACATGTAAAGGCTGCACAGGAATCGATGGAAGATGCTTGAAAAGCCTCATTCCCAGAAACATCTCCAGCTGCTTTTGCCGTGAACTATCAACCATTGCATTTTTATATCTTCTCTGTAAGGTAATTTTCATGTTTTTCTGTGCTGCAGAAAACTGTTTAAACGCTCCTGACTCTTCACTGAAGATATTGAGAACTTGGCTGTGCATAGCTTTTGAGCCAGTATAGAGAGTTGCATGGATATCACCTTGTTGCAGAAAA\n>URS00000FB6E5 piRNA from 1 species \nTAATAACAGGTCTGATTGCTTCATTAAC\n>URS00021C6D14 lncRNA from 1 species 
\nCTAGATTTAGTTTTATCTGATATTAACAAAATTTCTGATAATATTATTTGTTGTTTGAATAAAGCACAAAAGTGCTGATTTTATGAGAAAAAAAATCCATGTAAATATCTTATTGAATTTAGATTCATTTGAAATCGAAGTGAAACATAACTGATGTTTACATTTGTGAAATTAGCTTTTGTGCATAACTGAAATTCACAAATTAATGTTTATTAAGTAGATGTACACAGTTATGTGGATATATTTGATTGGGCGAGTATTCATATTGACTTGACATGCAGATAATTGTTTGAACGAATTAATGTATTGACCGGAGATGTAGATAAATGTTAGGACGACTATTTAATGATTGGACGGATCTATAAATGAATTGACGAATGTATATACTGATTGACATATACAGTATAATTGGATGAATATATAAACGAATTGAAAGATATTTGAACGATTGACAGATGAATAAACGATAGACTGATATATGTATGATTAACGGATACGTTCATGATTGACGGATATATACATGGATAGACGGATATATAAATGATTGACAGATACATGTATATGCATGGCTAGACCGTTATATAAATGATTGACGGATATATGCATGGATAGACGAATATATAAATGATTGACGGATATATGCATGAATAGACGGATATGAAATTGATTTGAATGGTTTTTGAATGATTTGACGAGTATATTAAAAATGATTGAATGGTTTTTGAATGATTGGACGAGTATATTAAAAATAATTGAATGGATATATTTTTGATAAGATGGATATATGAATGGGAATTTGACGGATATATGACTTGACAAATAGATGCATGATATAACGGATATATGATTAATTTGACGGATACATGATTAATTGGACGATTTATAAATAATCGGATAGTATAAACCTCGATATGGGCGATATATTCATATACATATATTTGTTAAATGCTAGATATTATATATCATTCATCGGATGGATATTTTTTGTTTGCAAGGACTCATGATTGAGTAAATGATATTTGGTTATTTGTAAGAAATCCTTTTTTTATTTTTACGTTGTACGAGGTAGTTGCTTATAGTTTTAATATGTTTTTGTATGTTTTTTTGTTATGTTTTT\n>URS00000D240F rRNA from 1 species \nCGTGTAGGCGGCCAGGTAGGTCGGTTGTGAAAACTGGAGGCTTAACCTCCAGACGTCGACCGAAACCATCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCTAAGGCGGCTCTCTAGTACGGTACTGACGCTGAGACGCGAAAGCGTGGGGAGCGAACA\n>URS000210495B rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCGAGTCGAGCGAACAGACGAGGAGCTTGCTCCTCTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATATTGAACCGCATGGTTCAATAGTGAAAGACGGTTTTGCTGTCACTTATAGATGGATCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCTTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACAAATGTGTAAGTAACTATGCACGTCTTGACGGTACCTAAGCAGAAAGCCACGGCTAACTACGT\n>URS00023FD586 lncRNA from 1 species 
\nGGAAGATCCAGCCTCGACAACGGTGGAATTCGGTAGAAGGTCACGGAGGTCAGTGAAGCTTCGCCGGTAGTTAAAACCAGAGGAATGTTCTAGAAACTGCAGAGGAGACGAAGGAATCGAATCCGTCTTGTGAACTTCCTCTTCCTTAACACCCTCCGTAATAGCTTTGTTGTTGTTGTTATCTTCTTCACCGTTTACCTTAGCTTTGATTTTACTAATCTGCAACCAAAAACTTTAAAAATCAAACCTTTTTGCATTTTCGTCTCTGAAGTTTCAATTTTTATGGTTTAAAGTCTCTAATATTGTACCTCTTGGAGAAGGGAATCATTGTCACGGCGGAGAGAATCGAAATTGTGGCGGAGAGAATCGTATTGACCCTTAAGAACACCGTAATCTTTTTCAAGCTGTTTTGTTTTCCACCGTGCACGACGGTTCTGAAACCAAACAGCTACTTGACGAGGTTGAAGTCCAAGCTCTTGTGCTAATTTAGTTTTCCTCTCAGGTTCGAGTTTATTCTCAAGTTCGAAATTCTTCTCAAGAGCTTTGACTTGGTCAACTTTTAATCTTCTCTTCTTCTCCGATAGACCCATGTGGTGGTGGTTGCCGGAATATTCCTCGATTAGTGTAGCATCTTCATCGTAACCTTCAAGCATAGATTGGTAATTACTTCCGTACCCTCTTGGACTCTGTTCATCTGTTGTGTAACCAAATGAATCTTGTCAATAAAAGAAACAGTGGAAAGTGAAGAAAGGATCACATGGGTTTTGTCTGACATTAGCAAAAAGTAGAAAGAACAAAGATGGTAATAAGAACCTGTAGAAGTGGAGATTAGACCACACATTGAATCTGAGCTGCTTAGTCTCTTCATGATGACACTTTAAAATAGTTCTACTCCAGCTTTTTCTTTATTATCAGAGAAATTCTTATGAAGTTTTGAAATTACAACAATGTTGTAAACATAATTGAGCTTCTTCACTTGAACAACAACATGAACAAAACGAGGAGACTTTAGAGGCTCAAATTAGAAAAAACAGAGAGAGGGATATGGATTGAGAAAGTCCAAAAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAAGCTTTTAATCTAGAGAGCAATGGTTCTTTTCAATATGAACAAGTTGGTTTCACACTTTCTCTTTCTTTAAATAAACCAAACTTATCTTTCTTTAAATAAACCAAACTTAGAGAAAGGGTTAAAATGTAACTAAGGTTAAGTTTGAACCAATAGTTATACGGCTTGGCTCGGCTCGGCTTAGAACAAGTGGTGGAGTCTGTGATACGTCACCGTATGGGTTTATTTTTGGTAATGCTTAACCTTATTTTTTTTAAGGGTGTTTCTATTTTCTTAAACTTAAAAATTCAGAGAAATTAATAAACAGCGGATAGTAGAGAGATACGTAAGATGCATTTAAAAAGTAGATTTTTAAAATATAACATCCTCTGAAAAACGTCAGAAGGTACGTCACAGAAGATTTGATGACAAAATGATAAACTATAATTTGTTTGTTGATTAATGAAACCAAATGTAATTTTCCTGAGCAAACTTAAAATTCGATAGGATAAGTTATAAAATTATACGGATGGCATATTTAATCCCATATATTAGATGTGGGATATATTATTAAAAACATTAGTGTTATATGTTATTGTTGGCAACGCAGGGGAGTGGAAAGAAAGACTTGTGGGTGGGGGAACAAGACTGACGCAATTTGGGTTTGGTTCATTGAATTGTCCAAAAACTATGGGCTCGAACGGCACCGTCAAAAAATATCAATTCTTGTTTTGAA\n>URS0000538100 piRNA from 1 species \nTGCTGGCTGCTGGGTGGAGCATGTAGGG\n>URS0000D6DD09 lncRNA from 1 species 
\nAACTACGAGTCCCGACGTGCCGCGCGCGGCATGCAGAAGCTTCACTGAGCGGGCACTGGAGGTCGCGAGCACGTTGCTAGTGGGCGCGGCTGGCGGGGCCGGGGGCGGCAGGGGGCTAGCGTCCGGCTGAGCCCGGCGGGTTCCTGCACGCGGACCCACGCTTTGTCGGGCTGCTCTGCTGAGTGACACCGCCGTGGCATCCGAGGAGCTGTGGTCCAGCCTGCGCGGCGGGAAGCGGCGGCGGCGGCTCCAGCGTCCTAAGAGATTGCAACACCTGCTCGGTATACCGTGACTTTGGGAGGAACATCTGTCACTGTGAAGTATCTGCGCAGTCATGGCTACATGTCCACGCCGCCACCCGTCAAGGAGTATCTGCAGGACAGGATGGAAGAGACAAAGGAGCTTATCACAGAGAAAATGGAAGAAACAAAAGATAGACTCACTGAAAAGTTACAAGAAACCAAAGAAAAAGTTTCCTTTAAGAAAAAAGTGGAATAAGGTGCCTTATATAGCAGTATAGAAAATTCCTGCACTTTAACCCTTTGGAAACTATGGGCAAAGATACATGTGTCTGATTATTTTTTTGGTTAGTTGCCGAAATATACTAGTTCTCTGAGGGTTAAAGAAGTAAAATACCTTTTTAAAGTTAAATATCACTAGAAAAATCAGTGTTATTACAAGGGAAGAAATGAACCCAGTTTAAGAATTTGCCATCAGTAGCAGTATTAAGCAGTGGTTAATGTCTTAGAAGTCAGACTTCTTTTTCAAGGTCTTCAGAACCACACTTGATTTCTGTTTTGTTGCAGCTGTAATTGACACATACTAGGCAGCTGACTCCTTGAATATCCAGTGTGACCCATAAAATAGTCTGTTAATACCGGATCTTAATTTTTATGTTATTCATTAAGATTTTAACTATATTCAGTACGTAATTTGGAGACAAACTAGCATCATCAAAACTGCCTGTAAATAAGGTGTTTAGTCTTTCTATAAAAACAGAATAGAGCAGTTACCTACCAGTTAAAATATCTTATATGAAGAAAATAGAATAAAGATCCAGTCATATATGTAAATAAGATGTACTGATTGTACGTA\n>URS000037851E rRNA from 1 species \nTTCAGAGGGGGACAACAGTTGGAAACGACTGCTAATACCGCATACGATCTGACCTCGGCATCGAGGATGGATGAAAGGTGGCCTCTATTTATAAGCTATCACTGAAGGAGGGGATTGCGTCTGATTAGCTAGTTGGAGGGGTAACGGCCCACCAAGGCGATGATCAGTAGCCGGTCTGAGAGGATGAACGGCCACATTGGGACTGAGACACGGTCCAA\n>URS00003C52C3 rRNA from 1 species \nACCGGGGCGACGATCAGTAGGGGTTCTGAGGAGGAAGGTCCCCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGAAGGCAGCAG\n>URS0000E650A4 rRNA from 1 species \nGGTTGTCACAATACCATGTGCTGAGATCCTCTAAGCTAAGTAGCATTGGATCTGGTTATTACTTGGATGGGAGACCTCAAAGGAGCATGTAGGATTACAAGTA\n>URS00007CE4A8 rRNA from 1 species 
\nACATGCAAGTCGAGCGGGGTCCAACCGGTGGCAACACCGGGGACGGCCGAGCGGCGAACGGGTGAGGAACACGTGAGCAACCTGCCCCGAAGTCCGGGATAACACCGGGAAACCGGTGCTAACACCGGATGTCCTCCCTCTGGCGCATGCCAGGAGGAGGAAAGGTTACGCTTCGGGAGGGGCTCGCGGCCTATCAGCTTGTTGGTGGGGTCACGGCCCACCAAGGCGACGACGGGTAGCTGGTCTGAGAGGACGGCCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCAACGCCGCGTGCGGGACGAAGGCCTTCGGGTTGTAAACCGCTTTCAGCAGGGACGAAACTGACGGTACCTGTAGAAGAAGCCCCGGCCAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGCTGGGCAAGTCGGGTGTGAAAACTCCAGGCTCAACTTGGAGACGCCACTTGATACTGCCCTGGTTTGAGTCCGGTAGGGGAGCGCGGAATTCCTGGTG\n>URS0001630D6F rRNA from 1 species \nCCTACGGGAGGCAGCAGTGGGGAATATTGGGCAATGGGCGCAAGCCTGACCCAGCAACGCCGCGTGAAGGAAGAAGGCTTTCGGGTTGTAAACTTCTTTTGTCAGGGAAGAGTAGAAGACGGTACCTGACGAATAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTACTGGGTGTAAAGGGCGTGTAGCCGGGTTGACAAGTCAGATGTGAAATCCTGCGGCTTAACCGCAGAACTGCATTTGAAACTGTTGATCTTGAGTACTGGAGAGGCAGATGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGTCTGCTGGACTGTGACTGACGTTGAGGCCCGAAGGCGTGGGGAGCAAACAGGATTAGATACCCCAGTAGTC\n>URS0000B3F91B rRNA from 1 species \nGAGACCCTACGGGGGGCAGCAGTGAGGAATATTGGTCAATGGGCGCAAGCCTGAACCAGCCACGTCGCGTGAGGGATGACGGTCCTATGGATTGTAAACCTCTTTTGTCGGGGAGCAAGGCCCGCCACGTGTGGCGGGAAGGAGAGTACCCGAAGAAAAAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATGCGAGCGTTATCCGGATTTATTGGGGTTTAAGGGTGCGTATGCGGAAGGGTAAGTCAGC\n>URS0000D2A1B2 rRNA from 1 species \nACGATGAAACCGCGAATGGCTCATTATATCAGACATAGTTTATTAGATCCCCCTCCCCCTACTTGGATAACTGTAGTAATTCTAGAGCTAATACATGCACCAAAGCCTTTACTTTTCGGTAAAGGCGCAGTTATTAGATCAAGACCAACCGAAGCTTGCTTCGTTGTTTTGATGACTCTGGATAACATTAGCCGATCGCATGAGCTTGTCTCGGCGACGTATCTTTCAAATGTCTGACCTATCAACTTTCGATGGTAGGTGATATGCCTACCATGGTTGTAACGGGTAACGGGGAATCAGGGTTTGATTCCGGAGAGGGAGCCTGAGAAATAGCTACCACATCCAAGGAAGGCAGCAGGCGCGTAAATTACCCACTCCCGGCACGGGGAGGTAGTGACGAAAAATAACGATACGGGACTCTTTCGAGGCCCCGTAATTGGAATGAGATCACATTAAACACTATGTGGAAATCTATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAACTCCAGC\n>URS00023D0B22 lncRNA from 1 species 
\nTATTACAGATCGTGCCCATCCCACTTCTCTCTATCATAACCGAACATAACAACCTCAATCACAGCCTGGCATGCCCACCCCAGCTGGGGGTCCTCTGTCCATGCCTGCCCCGGCGGGGGTTTGCAGGCTAAAGGAGCCCGCCCCGATGGGGGTATAGGAGTTTAGTTTTTTAAATCCTATTACAGATCGTGCCCATCCCACTTCTCTCTATCATAACCGAACATAACAACCTCAATCCCATGAATCCTCTCCAAATCGCCCACTTCCCATAGAAATTGGCCCACTTACACTCCCATATAAATCCAACTCCAATCTCTTCCATTCTATACCAAATCCACATCACACTTCAGATTTCCATCAAAAACCTAGGGTTTCTCATC\n>URS00009F6D70 rRNA from 1 species \nGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGAGTGATGAAGGCCCTAGGGTTGTAAAGCTCTTTCAGCTGGGAAGATAATGACGGTACCAGCAGAAGAAGCCCCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGGGCAAGCGTTGTTCGGAATCACTGGGCGTAAAGCGTACGTAGGCGGATATTTAAGTCAGGGGTGAAAGCCCGAGGCTCAACCTCGGAACTGCCTTTGATACTGGGTATCTTGAGTCCGGGAGAGGTGAGTGGAATGCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGCGGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGGTACTGACGCTGAGGTACGAAAGCGTGGGGAGCAAAC\n>URS0001120C71 rRNA from 1 species \nTACAGAGGTCTCAAGCGTTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGCGGCGCGGTAAGTCGGGTGTGAAATCTCGGGGCTTAACTCCGAAACTGCATTCGATACTGCCGTGATTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCGGTGAAATGCGTAGATATCGTAAGGAAGACCAGTGGCGAAGGCGGGGTCT\n>URS0000F57DDE rRNA from 1 species \nGTGTCAGCCGCCGCGGTAATACGAAGGGTGCAAGCGTTACTCGGAATTACTGGGCGTAAAGCGTGCGTAGGTGGTTCGTTAAGTCTGATGTGAAAGCCCTGGGCTCAACCTGGGAATTGCATTGGATACTGGCGGGCTAGAGTGCGGTAGAGGATGGCGGAATTCCCGGTGTAGCAGTGAAATGCGTAGAGATCGGGAGGAACATCTGTGGCGAAGGCGGCCATCTGGACCAGCACTGACACTGAGGCACGAAAGCGTGGGGAGCAAACAGGATTAGAAACCCCTGTAGTCC\n>URS0000092071 rRNA from 1 species \nCAAGTCGAGCGGCAGCGACAACATTGAACCTTCGGGGGATTTGTTGGGCGGCGAGCGGCGGACGGGTGAGTAATGCCTGGGAAATTGCCCTGATGTGGGGGATAACCATTGGAAACGATGGCTAATACCGCATGATAGCTTCGGCTCAAAGAGGGGGACCTTCGGGCCTCTCGCGTCAGGATATGCCCAGGTGGGATTAGCTAGTTGGTGAGGTAAGGGCTCACCAAGGCGACGATCCCTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCAGTGAGGAAGGAGGTATCGTTAATAGCGGTATCCTTTGACGTTAGCTGCAGAAGAAGCACCGGCTAACTCCGTGCCAGC\n>URS0002572490 rRNA from 1 species 
\nATGGCGGCGGCGGTGGACCTGGAGGATGCGTTCGGCGCGGTCTTCGGCGAAGCCAAGCCGGAGGGCCACCCCACCGCGCGCCCCGTCCTCTTCCGCGCCCACGCCCGCTCCGCCGCCGCCCTCCGTGTCGTCGCCACCGACTGCCACTCCCTCGCCTGGGACTGCTCCCTCTCCGTCTCCGACCTCGACGACCTCAGAGACGATGTTGGAATCGGGGGCTCCTGGGCCGACTTTCTAGATTATCTCAAGTCCTCCTTGTCCTCCGGCGAGGTGAAGCTGCTCTTCGCCACCGACAAACTCCGCAAGTCAACCGGTTCTGATGGTGCAAAGCTTGTGGCTACCAAGGCAAAGGGCCTGCCTCGCATCACCATTTCTCTCCATAGTGTTACTGGCGCTACGACGAGTGATATCATAGCCGAGTTCTCGCTAGCGCTCTATGGAGCTTATAGGACTGCACGGGAGCTTGTATCCAAAGAACAAGAACAAATGTCACAGCTGATGGGAAATCTGTCAACTGAAAGAGAAAAGAACGAAATCATGCAAAAACAACTCGAATCTCTTTCTTTCCTAGACAAAAGAAAGGCAACAAAGCCAAAGCTGTTGGCTGATCAGGTTCCAAGTGTGTCTGCTGTGACTCTGGTCTCTGACCAAGTTACAGCTCCTGTGCAGCAGCAAATATCAGTACCTTCACCTAGTAAAGCCCCTCCTGCTAAAGTCACGAAGAGGGTAGCCCCCACGTCTCGGAGGGCAAGAGTGCGAGGAGCTCTGCTGCAAGATAATGAGGATGAGGATGACAACTGA\n>URS00013FFE9F rRNA from 1 species \nGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTCACCGGTGAAGATAATGACGGTAACCGGAGAAGAAGCCCCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCTGATATTTAAGTCAGGGGTGAAATCCCGGGGCTCAACCCCGGAACTGCCTTTGATACTGGGTATCTTGAGTATGGAAGAGGTCAGTGGAATTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAGGAACACCAGTGGCGAAGGCGGCTGACTGGTCCATTACTGACGCTGAGGTGCGAAAGCATGGGAAGCAAACAGGATTAGATACCCCTGTAGTCC\n>URS00004AF1E8 rRNA from 1 species \nACAAGCGGTGGAGCATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCTGGGCTCAAATGTATGTTGACGTATTCTGAAAGGGTAATACTTCTTCGGACAATATACAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCGGGTTAAGTCCCATAACGAGCGCAACCCTATCATTAGTTGCCATCAGGTCAAGCTGGGGACTCTAAGTGAAACTGCCTACGCAAGTAGTGAGGAAGGTGGGGATGACGTCAAATCAGCACGGCCCTTACGTCCAGGGCTACACACGTGCTACAATGGCCGGTACAAAGGGCAGCTACCTGGTGACAGGATGCTAATCTCAAAAGCCGGTCTCAGTTCGGATCGGAGTCTGCAACCCGACTCCGTGAAGCTGGAATCGCTAGTAATCGCGCATCCGCCATGGCGCGGTGAATACGTTCCCGGGCCTT\n>URS0000EEE034 lncRNA from 1 species 
\nGGCTTAGGGGAAAGTCCCCTTAGGGAAGTCCCTATTGACCCAGGAAGTCCAGCCAACTTAGCCACTTAGTCCCTCAGCCCTGGCTTGTGGAAGCAGAGATTCCTAATACGGCCCTCACTTCTCCACTTTCTCCACTGGGGTTGGAAGCAGTAGGAGTAGCTATAGAGGATGTATTAACACCAATTTACAGAGATCCTATTGAATTTACATCTCTCCAGCAGGTGTGATGCAAGGAAAACAAAGCTAATACCCAAAGTCTTTGAGCGTGGAAAGAGAGAAAGTCCACTTTAAGCGATGGAAAATCAGCCCCAATTCTGAAGGAACAACCATGAACAGATGATTTAAGGAGAATCAATTCTTTGCTCTTTGCAGAAGGAGCCAACAGAGTGAGATGAAGGGGACAACTTCAGATACTCAGGCAGAAGCATAAGTCCCCACCTGCTGACCTGCTGCCTGCTATCTTAACACGAATTCTTCATCTGAATGGATGAGCTTTTCACAGAGTTCCAAACTAAGGAATCCAGGAGTGGCCAATCCAGAGATTCATTCCTTATCTTTGACGAACATCTGAACTCCTGGCTCATCCTGTGGAATTCAGGCCATACAGGAGATCAAGGTCATTTGCTTTGGGTTAAATGAATGTTGCCAGGTGGAGGTTGCTAGAGGGAGAGTGCTATGTGAAAGTGCTGTATAAACTGCTTGCTTTTCACAAACAGTAGTGATTCTTTATCCTGTCCAGCCTGCCACAACTGGACCATCCTGTATGTAAGTCCCCTTAATAAATCCTGTGTCTCATTCACTGGCTTCAAGTCTCTTCCTGGGCCTCTTGAACGTGGTGCCACCTGTATTGAAGTCAACAGAAGTTCAGCACAACACAGGTCAAAATGAAGATTCTGACTCAGTAGGTCAGGATGTTCTAACGAGCTCTAGCTGACATGATACGTCAGGGCTGCAGACTAGCTTTGAGCAACAAGGTGCTAGAGAAATACCTATAGAACAACAGAGATGCAAGACAAATGAGTTGGAAGTTAAAAGATTTAAATTCTTGTCTTAGTTTTCTCATTAAAGAAAAGCTGTGTGACTATGAAAAAAAATGGCTCTCTGAGACTTTTGTTTGCTCATCCAAGATGAAAATATTGAAATGTATTATACAATAAACATTTGCAAACAG\n>URS00017D46D8 rRNA from 1 species \nTACGAAGGGGGCGAGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGCAGGCGGCTCATTTTGTCAGGCGTGAAAGCCCCGGGCTTAACCTGGGAGGTGCGTTTGATACGGATGGGCTAGAGTTCGGGAGAGGAGCGTGGAATTCCCAGTGTAGAGGTGAAATTCGTAGATATTGGGAAGAACACCGGTGGCGAAGGCGGCGCTCTGGACCGAGACTGACGCTGAGGCGCGAAAGCTAGGGGAGCAAACGGG\n>URS000151634F rRNA from 1 species 
\nGTTGTATGGTTAAGTGACTAAGCGTACACGGTGGATGCCTTGGCAGTCAGAGGCGATGAAAGACGTAGTAACTTGCGATAAGCCCAGATTAGGTAGTAACAACCATTTGAGTCTGGGATTTCTGAATGGGGAAACCCACGTGCATAAGCACGTATCCTTACCTGAATACATAGGGTAAGGAGGCGAACCGGGGGAACTGAAACATCTAAGTACCCCGAGGAAAAGAAATCAACCGAGATTCCGAAAGTAGCGGCGAGCGAAATTGGACTAGCCCTTAAGCTTTACACGCGTTAGACGAACGGTCTGGAAAGTCCGACGATACAGGGTGATAGTCCCGTAGTTGACGACGTGTGTTCAGTGAAATCGAGTAGGGCGGGACACGTGATATCCTGTCTGAATATGGGGGGACCATCCTCCAAGGCTAAATACTACTGACTGACCGATAGTGAACCAGTACCGTGAGGGAAAGGCGAAAAGAACCCCTGTGAGGGGAGTGAAATAGAACCTGAAACCGTGTACGTACAAGCAGTAGGAGCACCTTCGTGGTGTGACTGCGTACCTTTTGTATAATGGGTCAGCGACTTATATTCAGTGGCAAGGTTAACCATCTAGGGGAGCCGTAGGGAAACCGAGTCTTAACTGGGCGTTCAGTCTCTGGATATAGACCCGAAACCAGGTGATCTAGCCATGGGCAGGTTGAAGGTTGAGTAACATCAACTGGAGGACCGAACCGACTAATGTTGAAAAATTAGCGGATGACTTGTGGCTAGGGGTGAAAGGCCAATCAAACCTGGAGATAGCTGGTTCTCCCCGAAAGCTATTTAGGTAGCGCCTCGGACGAATACTACTGGGGGTAGAGCACTGTTAAGGCTAGGGGGTCATCCCGACTTACCAACCCTTTGCAAACTCCGAATACCAGTAAGTACTATCCGGGAGACACACGGCGGGTGCTAACGTCCGTCGTGGAGAGGGAAACAACCCAGACCGCCAGCTAAGGTCCCAAATTACTACTAAGTGGGAAACGATGTGGGAAGGCTCAGACAGCCAGGATGTTGGCTTAGAAGCAGCCATCATTTAAAGAAAGCGTAATAGCTCACTGGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTAAGTAGTAAACCGAAGCTGCGGCAATGTGCTTTTGCACATTGGGTAGGGGAGCGTTCTGTAAGCGGTTGAAGGTGTGTGGTAACGCATGCTGGACGTATCAGAAGTGCGAATGCTGACATGAGTAACGATAAAGGGGG\n>URS000043C123 rRNA from 1 species \nCTACGTGCCAGCAGCCGCGGTAATACGTAGGTCCCGAGCGTTATCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGTTAGATAAGTCTGAAGTTAAAGGCTGTGGCTTAACCATAGTACGCTTTGGAAACTGTTTAACTTGAGTGCAAGAGGGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAGGAACACCGGTGGCGAAAGCGGCTCTCTGGCTTGTAACTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAGGTGTTAGACCCTTTCCGGGGTTTAGTGCCGTAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACTCTTGACATCCAGA\n>URS0001C76D33 rRNA from 1 species 
\nAAATTGAAGAGTTTGATCATGGCTCAGATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACGGTAACAGGAAGAAGCTTGCTTCTTTGCTGACGAGTGGCGGACGGGTGAGTAATGTCTGGGAAACTGCCTGATGGAGGGGGATAACTACTGGAAACGGTAGATAATACCGCATAACGTCGCAAGACCAAAGAGGGGGACCTTCGGGCCTCTTGCCATCGGATGTGCCCAGATGGGATTAGCTTGTTGGTGGGGTAACGGCTCACC\n>URS00012CC989 rRNA from 1 species \nATTGAACGCTGGCGGCAGGCTTAATACATGCAAGTCGAGCGAGCGGCGGACTGGTGAGTAATGTCTGGGAAACTGCCTGATGGAGGGGGATAACTACTGGAAAAGGTAGCTAATACCGCATACCATCAGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAATGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGCGGGGAGGCGTTACTCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATTC\n>URS000186D9C0 rRNA from 1 species \nATTGAACGCTGGCGGAATGCTTTACACATGCAAGTCGAACGGTAGAGGGGGCAACCCCTCGAGAGTGGCGAACGGGTGAGTAATATATCGGAACGTGCCCAGTCGTGGGGGATAACGTAGCCAAAGTTACGCTAATACCGCATACGATCTAAGGATGAAAGCGGGGGATCGCAAGACCTCGCGCGATTGGAGCGGCCGATATCAGATTAGGTAGTTGGTGGGGTAAAGGCTCACCGAGCCAACGATCTGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTGCGGGAGGCAGCAGTGGGGAATTTTGGACAATGGACGCAAGTCTGATCCAGCCATTCCGCGTGCAGGATGAAGGCCCTCGGGTTGTAAACTGCTTTTGTACGGAACGAAAAGGTCTCTCTTAATACGGGGGACTCATGACGGTACCGTAAGAATAAGCACCGGCTAACTACGTGCCAGCCGCCGCGGTAACAC\n>URS00000166F6 tRNA from 1 species \nCCTGGTTAGCATAATTAGTAATGCGATTGTTTTGTAATCAATAGACTGTAAGTGCAAGTCTTACACTGGGCTA\n>URS000226E0A8 rRNA from 1 species 
\nTGGCAGGTCGAGCGAACAGGATAAGGAGCTTGCTCCTTTGAAGTTAGCGGCGGACGGGTGAGTAACACGTGGGTAACCTACCTATAAGACTGGAATAACTTCGGGAAACCGGAGCTAATGCCGGATAACATATAGAACCGCATGGTTCTATAGTGAAAGATGGTTTTGCTATCACTTATAGATGGACCCGCGCCGTATTAGCTAGTTGGTAAGGTAATGGCTTACCAAGGCGACGATACGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTTTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACAAATGCGTAAGTAACTGTGCGCATCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGAAACTTGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGCAGAGATATGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACGCTGATGTGCGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAATCTTGACATCCTTTGAAAACTCTAGAGATAGAGCCTTCC\n>URS000163AA4F rRNA from 1 species \nTACAGAGGGTGCTAGCGTTGTTCGGAATTATTGGGCGTAAAGAGCGTGTAGGCGGTCAGGTAGGTCCGTTGTGAAAACTCGAGGCTCAACCTCGAGACGCCGATGGAAACCATCTGACTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCTAAGGCGGCTCTCTAGTACGGTACTGACGCTGAGACGCGAAAGCGT\n>URS00008DBA8C rRNA from 1 species \nAACAGCCAGAAATGGGCTGCTAATACCCGCATAAGACCGAAGCGCCGCATGGCGCGGCGGCCCAAAGCCCCCGGCGGTGCAAGATGGGCCCGCGTCTGATTAGGTAGTTGGCGGGGTAACGGCCCACCAAGCCGACGATCAGTAGCCGACCTGAGAGGGTGACCGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAAGGATGAAGTATTTCGGTATGTAAACTTCTATCAGCAGGGAAGAAGATGACGGTACCTGACTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGACGGCGATGCAAGCCAGATGTGAAAGCCCGGGGCTCAACCCCGGGACTGCATTTGGAACTGCGTGGCTGGAGTGTCGGAGAGGCAGGCGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCCTGCTGGACGATGACTGACGTTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTA\n>URS0001561C6B rRNA from 1 species 
\nCCTACGAGAGGCAGCAGTGGGGAATCTTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGAAGAAAATGACGGTACCTGATTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTCCTGGGTGTAAAGGGAGCGTAGACGGCAGCACAAGTCTGGAGTGAAATGCCGGGGCTTAACCCCGGAACTGCTTTGGAAACTGTGCAGCTAGAGTGGAGGAGAGGTAAGTGGAATGCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTACTGGACTGTAACTGACGTTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCCTGGTAGTC\n>URS0000A47F93 rRNA from 1 species \nCAGAGGGCGCGAGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGCGTAGGTGGCCAGCATAAGGCCGCGGTGAAAGTCCGGAGCTCAACTCCGGATCTGCCGCGGCGACTGTGCGGCTTGGGCACTGTAGAGGCAGATGGAATTCCGGGTGTAGCGGTGGAATGCGTAGAAATCCGGAAGAACACCGGTGGCGAAGGCGATCTGCTGGGCAGTGGACCGCAAGGTCCAATAGCCGACACTGAGGCGCGACAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGGGCACTAGGTGCTCCGGGGAGCGACCCTTGGAGTACCGGCGCTAACGCATGAAGTGCCCCGCCTGGGGAGTACGGCCGCAAGGCTG\n>URS0001DD09C6 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGTTTTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGCGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATGCCGGCCTTCGGGTTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTG\n>URS0000594F9C rRNA from 1 species 
\nGCAAGTCGAGCGAACGGACTAGAATCTTGCTTCTCTGATGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATTTTGAACCGCATGGTTCATAAGTGGAAGACGGTCTTGCTGTCACTTATAGATGGATCCGCGCTGCATTAGATAGTTGGTAAGGTAACGGCTTACCCCGGCAACGATGCATATCCGACCTGAGAGGGTGATCGGCCACGCTGGATCTGAGACGCAGGATCCAGACTCCTACTGTAGGCAACAGTAGGGAATCTTCCTCAGTGGGCGGAAGCCATGAACCGAACAACGCCGCGTGAGTGATGAAGGTCTTCGCATCGTAAAACTCTGTTATTAGGGAAGAACATATGTGTAAGTATCTGTGCACATCTTGACGGTGCCTAATCAGAAAGCCACGGCTCAGTACGTACCAGCAGCCGCGGTAATAGGTAGGTGGCAAGCGTTATCCGGAATTATTGGTCGTAAAGCGCGAGTAGGCGGTTTTTTAAGTATGATGTGAAAACCCACGTCTCATCCGTGGAGGGTCATTGGAATCTGGAAATCTTGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGCAGAGATATGGAGGAACACCGGTGCCGAAGGCGACTTTGTGGTCTGTATCTTCCTCTGATGTGCGAAAGCGTGGGGATCAAACACGATCAGATTCCGTGGTAGTGCTCGCCCTAAACGATGAGTACTAAGTGTTAGGTGGTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTC\n>URS000230E4F6 sRNA from 1 species \nGACCAATATGATCATCACAATAAATTAGTATACGCAGTAAGGAAAGTGACCGATGATCAAGTATATCACTTCGACTCTAATCAAGGAAAACACAATAAAGTAGTTTAAGCTACCGGCTGTAGCACTGAGAATTCTTTATTAAGAAAGAGGCATTATTTAGCGTTCTCTTTCAATCCACTTCAACTTGCGAAATATCTCTTAACAATCTCAATTTTTTCTTCTTTTGTAATAAAAACATACCAGATGTACCAAATCCAATCCTTGGATGCATAATTTGCTTGAGGGTGGCATAATCTTCAGCCTTAATCAATTGTGAAACTTCATTCCTCGTAGTTTCATCCTAATGCGTTCAATCTGTTAGTTCCACAGTACTTCCATAGTAAATATAGTCCTAATACTTACTTGATCTAATTTGAACCACTCATCTACTAATTCTTGCAAAATCGGATCCATCTTGCCAAATGGGAATTGTTACCATTTGTTTGCTACACACACAATACACGTATCTCATCACCTCGTTTAACGCGTCCTTACGCCGTGGTATTTCGTATCCGTTTTCTTACAAAAATGATTTTAATAAAATAGACTCAAAAACAAAAAGTAGTAATAATATTATACTCATGACCTCCAATTATTCTAGAGAATTTCTTAAAACATTAGCTGCAAAAAGAAGCCTAGTAATTTGAAAGCAGCAGTTAATTACGATATATACCGCTTACAAAAAGGAGAAATTGGAAGAATTCAAGACCTGACGTCAATTCGCAAGCTGAATCGTTTTAATTAATAGGCGTCGGACAATGGGATTCACTTAGGCTTGGCGACGTTCTTGTCTAAAAATTGCTTGTCGGAATGTGTCATTGAACCGAAAAGGTTTGAAGCTCTTGACTAATAAACAACAGTAACTGATGTTAACTTTTTATAGAATATCCCAGGTTTCAATTCAACACGTTTATTCATAAATCTCAATCTATGTTATGCAGATGAGATTGAAAATCAATACCATCAAGTACAACTTCTCTAAACTGAACGGGTTAAGTATGGAATGGTTTAAAGTTTTAAGTACTGGATCACTCCAAGCTTTGAGATACGATAAGAAAATTAGTGTTAGTACATTTGTGGCTTTA
ATCACACCTTTTCCATAACCAGGAACTAAGTTTTCAAAGATCTACTATTCGATGATGAAAAAATAGCATTCATAAAGTTGATAACAGCATACATAAATGAAACTGAAATATTGAGGAGGTAAGGCAAACATGATGACCATAGTTTCAATTGACTATGTAATACGTACTATGGCTCATTAAAACCTATCAAAGAAAGAGAAATACGAATAAGAGGAAATTCAAGCCTGTTTAGAATGAGAAGAGAATAAAGATTGGGTTTTGGCGAAGGATACGCTGTTGCATTAAAACAGCCTTAAATAGGTTCTATAAATGGTTAGCATGTAAAAAAAATTAAAATTGAATCATGAAAAAATATTAAAAAATAATAAAAAAACCTACCACTTAAGAGCTTGTTCAAATTGTTGAGACGAGAACCAACACTGACATCAAGAATATTATCACCAATTTCAACAAT\n>URS000119B5B9 rRNA from 1 species \nATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACGCGTGGCGGACGGGTGAGTAATGTCTGGGTAACTGCCTGATGTAGGGGGATAACTACTGTACACGGTAGCTAATACCGCATACCATCGGATGTGCCCAGATGGGATTAGTTAGTAGGTGGGGTAAAGGCTCCCCTAGCCGACGATCCCTAGCTGGTCTGCCAGGATGACAAGGCAAACTGGAACGGAGACACGGTCCAGACTACGACGGGAGGCAGCAGTGGGGAATGTGGAACAAGGGACGCAAGCCGGATGCAGCCATGCCGCGTGGAGGAAGAAGGGCGTCGGGTTGTAAAGTACTTTCAGCGGGGAGGCGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATAC\n>URS00021073CB rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACGGACGAGAAGCTTGCTTTTCTGATGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATTTTGAACCGCATGGTTCAAAAGTGAAAGACGGTCTTGCTGTCACTTATAGATGGATCCGCGCTGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGGGTAGCCGGCCTGAGAGGGTGACCGGCCACAATGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATAACGGCCTTCGGGTTATAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAGTGGGTAAAGAAGCACCGGCTAACTACGTG\n>URS0000A0DC81 rRNA from 1 species \nTAGTCCACGCCGTAAACGATGGATACTAGCTGTATGTCTACTTCAGGTAGATGTGTGGCTAAGCGAAAGTGATAAGTATCCCACCTGGGGAGTACGATCGCAAGATTGAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCAGGGCTTAAATGTACGTTGCATGATTTAGAGATAGATCTTTCTTCGGACTACGTACAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCAGGTTAAGTCCTATAACGAGCGCAACCCCTATCGTTAGTTGCCAACAGGTTAAGCTGGGAACTCTAACGAGACTGCCTGTGACAAACCGCGAGGAAGGTGGGGATGACGTCAAATCATCACGGCCCTTACGTCCTGGGCCACACACGTGCTACAATGGCCGGTACAGAGAGCACGCCACTCCGCGAGGAGGAGCGAATCTAATAAAACCGGTCTC\n>URS0000C91A8A tmRNA from 1 species 
\nCAGGTTTATATCCATTACAAATAGACTTATATTCGTGCTGCCGGCTTGCCGGCTATAGCGCTAAACGGTTTGCGGAATAAGCGTTGCGGACCCGGGGGCGGTACCCGGCGCCTCCACCAGTTTTGTGGCTTTCAATACATCACTGGGGTATTTTTGGGGGCGAAACAGGATCGACGCGCGTGGTAAAGGCAGACTTTGTGCTCGGCATGGTACCACCGTTATCGGGCTATAGTCGTTAAATGCCAACGACAACTTTGCGGGCGAAGCCCGCCTCGCTGCTTAACTTAGGTTAGGTAAGCGCGGTTCGGGGGGCACCGGGCAACAGAAGCCCCCCACT\n>URS000232319A pre_miRNA from 1 species \nGGGGGGAGGTCGGATTCTTGGCTATGTCCCCGGCGCCCTGTGCTCCTGGGCCTGTGCTGTTGGATTCGTGCTCCTGGCCGGACAGCCCCCT\n>URS000259C9B7 misc_RNA from 1 species \nGTGAATCATCGAATTTTTGAACGCAAATTGCACTCTCTTCTGTGAGTATGCCTGTTTGTGGTTCAGCCTAAGAAAAATCGACATATTCGCTGTTTCGCGGTTTCTTTCGTTTGCAGTTTTGTCATCTTAAACCTTTTTGTTTTAAGCGGCTTAAAATTTTCTTTACGTTTCCACTAACTTTTCTAACATTTACTTACTCTTTTAATGTATCGATCTTTATTAGACGTGGCCGTTTCATCGGATCGCGTCCATATATATTTCGTTAACTTA\n>URS00009D7A85 rRNA from 1 species \nGATGAACGCTAGCGGGAGGCTTAATACATGCAAGTCGAACGGTAACAGGTCTTCGGATGCTGACGAGTGGCGCACGGGTGAGTAACGCGTACGTATCTACCTTGTACACGGGGACATACACTGGAAACGGAGTAAATACCCGATAGTCTGGAAACAGTAAAGCTACGGCGGTACAAGATGGGCGTGCGTCTGATTAGCTAGATGGTGAGGTAATGGCTTACCATGGCGATGATCAGTAGGGGGCGTGAGAGCGTGATCCCCCACACGGGTACTGAGACACGGACCCGACTCCTACGGGAGGCAGCAGTAAGGAATATTGGACAATGGGCGGAAGCCTGATCCAGCCATCCCGCGTGTAGGATGACTGCCCTATGGGTTGTAAACTACTTTTATATGAGAAGAAGCGCCTTTCTGCGGAAGGGTTTGACGGTATCATATGAATAAGCACCGGCTAACTCCG\n>URS0001E0D339 rRNA from 1 species \nTACGGAGGGTGAGAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGCTAGATGTGAAAGCCCCGGGCTCAACCTGGGATGGTCATTTAGAACTGGCAGACTAGAGTCTTGGAGAGGGGAGTGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACATCAGTGGCGAAGGCGTCTCCCTGGCCAAAGACTGACGCTCATGTGCGAAAGTGTGGGTAGCGAACAGG\n>URS000061A91B rRNA from 1 species 
\nTAGGGTTTGATCCTGGCTCAGAACGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGATCCCTTCGGGGATAGTGGCGCACGGGTGCGTAACGCGTGGGAACCTGCCCTTAGGTTCGGAATAACTCAGAGAAATTTGAGCTAATACCGGATAATGTCTTCGGACCAAAGATTTATCGCCTTTGGATGGGCCCGCGTTGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCATAGCTGGTCTTAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCAATGCCGCGTGAGTGATGAAGGCCCTAGGGTTGTAAAGCTCTTTTACCCGGGATGATAATGACAGTACCGGGAGAATAAGCTCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGAGCTAGCGTTGTTCGGATATACTGGGCGTAAAGCGCACGTAGGCGGCGCCGTAAGTCAGGGGTGAAATCCCGGAGCTCAACTCCGGAACTGCCCTTGAAACTGCAGTGCTAGAATCCTGGAGAGGCGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAANGCGACTCGCTGGACAGGTATTGACGCTGANGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGATAACTAGCTGTCCGGGCTCAT\n>URS00023F57E9 lncRNA from 1 species \nGGATCTGAATCCTAGACCCTTTTAGAACGCCAGGGTCGTAGCCTTTCCGCCAAGTCACCGGAGGAGAACCCATTCCCCCGCCCTTCTCTCCACCGGCCTCCTGCTCCAAACCTCTCTGCTCTGCGCTCTGGGCGTCACCCACTCGATCGATATGAAGAGGCCGAGATGTGTTCTTCTTCCCGGGATCTCGATTTTTCGTCTCGTCCTCATTTCTTGCGTCTTTCTGTGCTCTATTCCTAGTAAAGCAAACCAATTCTCTTCTTTTTCTTTAAAAAAATGTTATTTGTAAATATTTTGCATGGATTTCCCTCTTATTTAAAGACAGGAAAGAGAATAAATTGACTGCATGCATTTGGAGAAGTCTATCAAATTTTCTTGGGAACAGTTGGGAGATTTCACAGGTTTCTAATTCATATCGTGAGAGAGAGTAAGAAAGGATAGAGGTTGGAAACTGCTAAAATCTAGTTGAATTTTAGATATGATTTGCAGGAGTAACAGAAATAATTAAGAAAATAAGAGTTGGCTGCCAGTTTGGATAATAATGGTAAGAGGACAGGTTTTGTTTAGGATAGGTGTGAAATTATTATCGTTCATCAGATTCTTTATTGTTCATGAGTTTTTTTCTCCTCCGAAAAAAAACTTAAATATGAGCTGGAGGGTGTTTCCTAGGTTTGTTTTTTATGAATTGTTTTTCGTTTTCTTTGTGCTATTGCAATGGTTGATTTTGTCCCCCAATTGCAAATACATTATTTTCAGTTCCTTGAAAATTAATATAGGAATTTGAAGCAATGAGTCAGAAAATGAAGATCAGCTAAAATTTTTTGGAGCATGCTTTTCAGAGTCAAAGCATACGACTATGCATGTTGACCTACAGTGCTTGATTGTTGCATGGGTAGTTTCTTTACCTAGAGAAATTTGTGGCTTACTATATCAACTACAAACATTATGGAAGTTACATCCAATCCAAGAGAGAGAGAGGGGTCATGGAATACTAGGAAACATTTGGATATTGAGTTATAAAGGAATTTGTGGTAGTTGATAGAATAGACGAAATAATTCAGTGCAAATGGAAAAGGATATTTGCTTTTATTTTTTTTTGTTCTTGCCATATGTATCTGTTGATTTATTAAAAGGTTAAAATTTGCAAGCACAATAAAGATTCATGGTTCGTGTGGTT
TGATATCTTTCCATAAAATGCTCTCAAGTTGTCAACTTTAATAGTATTGGCTTCTATGATCATGGGTGAAGGTTTTAGAGTTTTCAGATTGGGG\n>URS0000642F76 tRNA from 1 species \nGGTGGCTCAGTGGTAGAGCGCTTGCCTTGCATGCATGAGGCAGGCCCTGGGTTCGATTCCTCAGCACCA\n>URS0000D63273 lncRNA from 1 species \nCTGTCACTTAAATCTTTGAGCTGTGTAGCCCACAAACTATTGCTAGAAACCAATGACGTTGTAAAGCAACTTTGAATTGGGCTTCCAGGTGGTGCCTGTTAGAAGGGCCTAAGAGCAAGGCATCATGGGAGACCGGGCGCCATGAATGTCTCGCTGTCGACTGGGAGGTTGCAAAGCGGCTGCTGCTGTTTTCCTTCCAATCCCGGAGCCAGCTGTCTGGCCCACAGCTCCAGATATATCAAGATTGAGACACATTTCCAAGCACCAAGAGACTGCTGGGATCTCTCTCTGAATTGGTACCTAAGTACTTTGGCCACCTCAAGCGAAGAGTTGACTGATTGGAAAAGACCCTGATGCTGGGAGGGACTGGGAGCAGGAGGAGAAGAGGACGACAGAGGATGAGATGGCTGGATGACATCACTGACTCGATGAACGTGAGTCTGAGGGAACTCTGGGAGTTGGTGATGGACAGGGAGGCCTGGCGTGCTGCGATTCATGGGGTTGCAAAGAGTCGGAC\n>URS00007413E9 rRNA from 1 species \nTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGGCCTTCGGGTTGTAAAGTACTTTCAGTCGTGAGGAAGGTGTTAAGGTTAATAACCTTAGCAATTGACGTTAGCGACAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGGGCACGCAGGCGGTTAATTAAGTTGGATGTGAAATCCCCGGGCTTAACCTGGGAATGGCATTCAAGACTGGTTAGCTAGAGTCTTGTAGAGGGGGTAGAATTCCATGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAATACCGGTGGCGAAGGCGGCCCCTGGGACAAAGGACTGACGCTCATGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACC\n>URS000236D244 lncRNA from 1 species \nAGGCGGTTAGTGAGGTAAGCGCTAGCATGTAACTCAAGGGATATGATAACATAATGACATGTCCAAAAACCAGTCAAAACCATAATGTACACATTTATATACATATATATAAGTTTTCATGATAGGGAACAAGGTTAAAGCATGAGGTTATCATTAACTTGGACTGTGTAGCTCTAACCATTCTAAAAACACCTATGAGCTATATGGGTCTGGATCACCCCACTGAAAGGGCCCTAGTGTATGTTATCCACATGAGCCAGAGAATTCTAAGGAAAGCCCAGGGAATCTATGACCCTACTCTAATCATACGTATATATATATATATATATCAAATAAGAACTATGCACACAGTCATGAAGGCCCCCACACGGAAAATATGGTTTCTAGTATAGGTCGCCCCTAAGGCCTCC\n>URS0002273E9A tRNA from 1 species \nGTTTATGTAGTTTATAAAAACATTACATTTTCAATGTAAAAATAAAAGGAATCTTTTCATAAATA\n>URS00015EFEAA rRNA from 1 species 
\nCCTACGGGTGGCAGCAGTGAGGAATCTTCCACAATGGGCGCGAGCCTGAACGAGCCACGTAGCGTGAAGGATGACTGCCCTACGGGTTGTAAACTCCTTTTATAAAGGAATAAAGTGAGGCAAGTGAGTCTCTTTTATTTGACTTTATGTATTTGGATCGGCTAACTCCGTGCCAGCAGCGGCGGTACTACGGAGGGTCCGAGCCTTGTCCGGATTTATTGGGTTTAAAGGGAGGGTAGATGGGTTGATAAGTCAGTTGTGAAAGTTTTCGGCTCAACCGTAGAATTGCATTAGATACTGGTGGACTTGAGTACAGTAGAGGTAGGCGGAATTCGAGGTGTAGCGGTGAAATGCTTAGATATAACGAAGAACTCCGATTGCGAAGGCAGCTTACTAAACTGCCACTGACGTTGAGGCTCGAAAGTGTGGGTAGCAAACAGGATTAGATACCCGAGTAGTC\n>URS00016A3A0B rRNA from 1 species \nTACAGAGGTCTCGAGCGTTAGGCGGAATTACTGGGCGTAAAGCGCGTGTAGGCTGCTCAGCAAGTCGGATGTGAAAGCCCTGGGCTTAACCTAGGAAGTGCATTCGAAACTTCTGAGCTAGAGTTCTGGAGAGGAAGGCGGAATTCTCGGTGTAGAGGTGAAATTCGTAGATATCGAGAGGAACACCGGTGGCGAAGGCGGCCTTCTGGACAGTGACTGACGCTGAGACGCGAAAGCGTGGGGAGCAAACAGG\n>URS0001B06EC2 rRNA from 1 species \nAGAGTTTGATCATGGCTCAGATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACGGTAACAGGAAGAAGCTTGCTTCTTTGCTGACGAGTGGCGGACGGGTGAGTAATGTCTGGGAAACTGCCTGATGGAGGGGGATAACTACCGGAAACGGTAGCTAATACCGCATAACGTCGCAAGACCAAAGAGGGGGACCTTCGGGCCTCTTGCCATCGGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAACGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCTGGGAGGAAGGGAGTAAAGTTAATACCTTTGCTCATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATCTGATACTGGCAAGCTTGAGTCTCGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACGAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCGACTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTGAGTCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCACGGAAGTTTTCAGAGATGAGAATGTGCCTTCGGGAACCGTGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGGTCCGGCCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTAC
GACCAGGGCTACACACGTGCTACAATGGCGCATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGACCTCATAAAGTGCGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTGGATCAGAATGCCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTAGCTTAACCTTCGGGAGGGCGCTTACCACTTTGTGATTCATGACTGGGGTGAAGTC\n>URS0000A96D3A lncRNA from 14 species \nCAATTCCCAATGTCCTCTGAAACCTTGAATACTCCTTTCTGCCTTACACACTTCTTCTCACACAGGTCTGCAGTATTCCCTCCAAAATGGCCCAGCAAGCTTTGATTACAGCTTCAAAGTGTTGCTCTGCTAGCTGCCCCCCCTCCCCATTCTTCCAGTCCCTCCATAAACCAGACCTCAAGGCCTGTGGACCAGATGTTCAGGTTTCTCACAGGGAGTGGCCCACTCCCAGGACTAATTATCCATATTAGTGCAAGTTTTCACTGCTTTGAGACAATATCGACACCAAGCGATTTACGGGAGGAAAAGACTTTTGTTTTGTTTCCACAGATTGAGGAGAATGAAGTTCATCATGTCAGGGAAGCCGTGGCAATGGGCGGCTCTGCTGGGCTTGCGTGTCTGTCAGAGAGGAGGGAGATTTGGGCTGAGACCAGCGATAGATTGGTCGAGCGCGGGAAGAAAAGGAAGAGGAGCGAATTAAATAGGAGCGCCG\n>URS0001F14516 rRNA from 1 species \nGATGAACGCTGTCTACAGGCTTAACACATGCCAGTCGAGGGGAAACGACGGGGAAGCTTGCTTCCCCGGGCGTCGACCGGCGCACGGGTGAGTAACGCGTATCCAACCTGCCTCTGACTGAGGGATAACCCGTCGAAAGTCGGCCTAATACCTCATGGCATCGTCTGCGGGCATCCAACGACGATTAAAGATTTCATCGGTCAGGGATGGGGATGCGTCTGATTAGCTTGTTGGCGGGGTAACGGCCCACCAAGGCTACGATCAGTAGGGGTTCTGAGAGGAAGGTCCCCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGGCGGGAGCCTGAACCAGCCAAGTAGCGTGCAGGATGACGGCCCTATGGGTTGTAAACTGCTTTTATGCGGGGATAAAGTGAGGGACGTGTCCTTCATTGCAGGTACCGCATGAATAAGGACCGGCTAATTCCGTG\n>URS000021B5FE rRNA from 1 species \nGAGTTTGATCCTGGCTCAGATTGAACGCTGGCGGCATGCCTTACACATGCAAGTCGAACGGCAGCATGATCTAGCTTGCTAGATTGATGGCGAGTGGCGAACGGGTGAGTAATACATCGGAACGTGCCCTGTAGTGGGGGATAACTAGTCGAAAGATTAGCTAATACCGCATACGACCTGAGGGTGAAAGTGGGGGACCGCAAGGCCTCATGCTATAGGAGCGGCCGATGTCTGATTAGCTAGTTGGTGGGGTAAAGGCCCACCAAGGCGACGATCAGTAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGAAAGCCTGATCCAGCAATGCCGCGTGTGTGAAGAAGGCCTCCGGGTGTAAAGCACTTTGTCCGGAAAGAAATGGCTCTGGTTAATACCTGGGTCGATGACGGTACCGGAAGAATAAGGACCGGCTAACTACGTG\n>URS0000E81CC4 lncRNA from 1 species 
\nTTCCAATTTCTGTCTTGCGTCTCTGTCCACTTCACACTACTCGTCTATAACTGCCAGTGTTGGAGGAAGCAAGTAAAGGAATAGGGAAGGCCTTACAATTTAGAGTATGAAAAGTATGACCCCCAAGCTGATTATGAGGATCATCTCTATCTCTCATCATCCCCACTCTGTTAAGTGACAAAGAATTTTAGGGGAGTTGTAATTCATGGCACCTGAAGGATCAGAGGAGGAAAAGGAGGAAGAAGGACATTTGAATTCACTTACTTCAGAGAGAAAATGGTTTGAAAACTTCCTAGGCACTAAGAAAGCTTTCAGTGACATCCTTTACCCTTGGAGGACATGCTGCCAAACTCTGAATTCATGGAACATTTATATGGTTCCATTAATTACAAATTAATATGACCTGTACATGGAGTCAGTCTGGAGCATCTCAAGGTAT\n>URS00004DE10A rRNA from 1 species \nGAGTTTGATCCTGGCTCAGGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTTTCGGGGGTACTCGAGTGGCGAACGGGTGAGTAACACGTGGGTGATCTGCCCTGCACTCTGGGATAAGCCTGGGAAACTGGGTCTAATACTGGATAGGACCATGGGATGCATGTTCTGTGGTGGAAAGCTTTTGCGGTGTGGGATGGGCCCGCGGCCTATCAGCTTGTTGGTGGGGTGATGGCCTACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGTGTCCGGCCACACTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGGGGGATGACGGCCTTCGGGTTGTAAACCTCTTTCAGTATCGGCGAAGCTTGCGGGTTTTCTCGCAGGTGACGGTAGGTACAGAAGAAGCACCGGCCAACTACGTGCCAGCAG\n>URS0001FF2370 rRNA from 1 species \nGACGAACGCTGGCGGCGCGCCTAACACATGCAAGTCGAACGAGCGAGAGAGAGCTTGCTTTCTTGAGCGAGTGGCGAACGGGTGAGTAACGCGTGAGGAACCTGCCTCAAAGAGGGGGACAACAGTTGGAAACGACTGCTAATACCGCATAAGCCCACGGTGCCGCATGGCACAGAGGGAAAAGGAGCAATCCGCTTTGAGATGGCCTCGCGTCCGATTAGCTAGTTGGTGAGGTAACGGCCCACCAAGGCGACGATCGGTAGCCGGACTGAGAGGTTGAACGGCTACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAATCCTGATGCAGCGACGCCGCGTGGAGGAAGAAGGTCTTCGGATTGTAAACTCCTGTTGTTGGGGAAGATAATGACGGTACCCAACAAGGAAGTGACGGCTAACTACGTG\n>URS0000F8DDB5 rRNA from 1 species \nTACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGTGGTTTCTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGGAACTTGAGTGCAGAAGAGGAAAGTGGAATTCCAAGTGTAGCGGTGAAAATGCGTAGAGATTTGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACACTGAGGCGCGAAAGCGTGGGGAGCGACAGGA\n>URS0001627BDD rRNA from 1 species 
\nCACGGGGGGAGCAAGCGTTGTTCGGAATCACTGGGCGTAAAGGGCGTCTAGGCGGTCAGATAAGTGGGATGTGAAATGCCCCGGCTCACCCGGGGACCGGCATCCCAAACTGTCTGGCTTGAGTATGGGAGAGGATGTGGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGATACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS0002226441 misc_RNA from 1 species \nAACAAGGCGTACCTGCGGACCTGCGGAAGGATCATTACGAGAGTGTCACCACTCCCAACCCATTGTTTACCTACCCGTCCACCGTGCTTCGGCAGGCAGCCCTGTGGGACAGAGCCTCGCCCCCTTTCGCGGGGGGTGCCTGCCGCTTGCCAACCAAAACTCTAGCTGTTTTAGTACCATCTGAGTCTTCCACAAATGAACAAAACTTTTAGCAACGGATCTCAGATCGGAAGAGCACAC\n>URS00002E10EA rRNA from 1 species \nAGGATGAACGCTGGCGGTCTGCTTAACACATGCAAGTCGAACGGAGTAGCAATACTTAGTGGCGGACGGGTGAGTAACGCGTGAGAATCTACCTTCAGGACGGAGACAACAGTTGGAAACGACTGCTAACCCCCGATGTACCGAAAGGGCAAATATTTATAGCCTGAAGAAGAGCTCGCGTCCGATTAGCTAGTTGGAGAGGTAAAAGCTCACCAAGGCGACGATCGGTAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTCCGCAATGGGCGAAAGCCTGACGGAGCAAGACCGCGTGGGGGAAGAAGGCTCTTGGGTTGTAAACCCCTTTTCTCTGGGAAGAACACAATGACGGTACCAGAGGAATCAGCATCGGCTAACTCCGTGCCAGCAGCCGC\n>URS000137F4FF rRNA from 1 species \nCCTACGGGTGGCAGCAGTGAGGAATATTGGTCAATGGCCGAGAGGCTGAACCAGCCAAGTCGCGTGAGGGAAGACGGCCCTACGGGTTGTAAACCTCTTTTGTCGGGAAACAAAGCGAGTCACGTGTGCCTCATTAAGAGTACCCGAAGAAAAAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGAGGGATGCGAGCGTTATCCGAATTTATTGGGTGTAAAGGGTGCGCAGGCGGAGGTGCAAGTCAGTGGTCAAATTGCGGGGCTCAAACCCGTACTGCGGTTGATACTGCATCCCTTGAGTGCGCGAGAGGTATGCGGAATGCGTGGTGTAGCGGTGAAATGCATAGATATCACGCAGAACTCCGATTGCGAAGGCAGCATACCGGCGCGCAACTGACGCTCATGCACGAAAGCGTGGGTATCGAACAGGAGTAGATACCCGAGTAGTC\n>URS0000A3AF07 rRNA from 1 species \nTACGTAGGTGGCAAGCGTTGTCCGGATTTATTGGGTTTAAAGGGTGCGTAGGCGGTCTTTTAAGTCAGTGCTGAAATACTCCAGCTTAACTGGAGGGGTGGCATTGATACTGGAAGACTTGAGTGTAGTCGAAGTAGGCGGAATTGACGGTGTAGCGGTGAAATGCTTAGATATCGTCAAGAACACCGATAGTGAAGACAGCTTACTAGGCTACAACTGACGCTGAGGCACGAAAGTGTGGGGATCAAACAGG\n>URS00010B2DDF rRNA from 1 species 
\nTACGGGGGGAGCAAGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCGTGACAAGTCACTTGTGAAATCTCCGGGCTTAACTCGGAACGGTCAAGTGATACTGTCGTGCTAGAGTACAGAAGGGGCAACTGGAATTCTCGGTGTAGCGGTGAAATGCGTAGATATCGAGAGGAACACCTGCGGCGAAGGCGGGTTGCTGGGCTGATACTGACGCTGAGGCGCGAAAGCCAGGGGAGCGAGCGGG\n>URS0002390407 lncRNA from 1 species \nGACAAGAAAACAAGGGGAAAGAAGTACCTAATGAGATTATGAAGGAAGAAACTGACCGTGGACTTGCACAAGACCGACTGGACTCTGATTGCTTCGAGGTGGGTAAAAAATTACATTAAGAAATCGTCCCTACTAGGAACGATTAGTTAATGTAAATTTTGGGCTCAACTCGTACCTTGAATCCAAAATTTTGGATTTGGAATTAACGGAATTGGGCAGGTTTTTTGGGGGAAAGGTTACTAAATTGGTATAAAGGGGAGGGTGGAGAGTGTATATGGTGAACTTGGGTTAGTTTAGAGGAGTTATGATTTTTGGTTTGAATCTTAGATCCGAAATATGAGCAATTTAGCGGGGATTTGGGAAAAAATAATTGGGGATCTAGGATGAGGAGGGGGTGAGGAACCGCCATAGGGCGATTTCCAAAAACTAATTTGGAGCATGGGAACCGTCGTGGGGCGATTTTCGGCGGGTGATTTGTGGCGAGGCAGCAGGGGAAATCCTAGGCGGCTAGAGTTTGATCTGTTTATAGAGATGAGAGTAAAAT\n>URS000226779B rRNA from 1 species \nAAACTGGAGAGTTTGATCCTGGCTCAGAACAAACGCTGGCGGCGTGCTTAACACATGCAAGTCGTACGAGAAAGTCCGCTTCGGCGGATGAGTAAAGTGGCGCACGGGTGCGTAACACGTG\n>URS0001472A94 rRNA from 1 species \nTACGTAGGGGGCTAGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGTGTAGGCGGTCCGGTAAGTCCGCTGTGAAAGTCGGGGGCTCAACCCTCGAATGCCGGTGGATACTGTCGGGCTAGAGTGCGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGAGTGGCGAAGGCAGGTCTCTGGGCCGACTACTGACGCTGGAGAAGCGGAAAAGCATGGGGGAGCGAAACGGG\n>URS00006461F6 tRNA from 1 species \nTCCCTGTTGGCTCAGATGGTAAAGCATCTGCCTACAATGCAGGAGAACCAGGTTTAATCCCTGGGTCAGGAA\n>URS000199F6C3 lncRNA from 1 species 
\nGGAACCGCGGGCACGGCGGGGCAGGGAGCGCGCCCGGGGCTGGGAGACTCAGGGGCGGGGCAGCCCCGGGACAGCGCCGGGACAGCGCTGGGATTGGACTGGGATAGCCCGGGACAGCGCCGGGACAGCGCCGGGACAGCGCTGGGATTGGACTGAGGAGGGCCAGAAGGAATGAAATCCATCGTGGCTCAGCCTGGGCTGGTGAAAGCGAGCTGGGAAAGGCAGGAGCAGGGATTCCAGCATTTCCCTGAACCACAGGAAAATCCTGGGAACGGAGAGGAGCAGAGAGGGGGAGATTCCGAATGGGGATTTGGAGCATCCAGCCAGTTTTACTGGGACTCCTTTCAAGGGCTGCCCGGAGCCCCCCGCGGTAAATAGTGCACAGCTCGGGCCAGGAGGATTTCCTCACCGCTGGGACTCTTAATGTCGAAAGCAGAGGTGTCAAACAAGGGGCTCAAAGCCCCGTGGTGGCCCCGGAGAGTTCCACATCTGGCCTGGATCTCGGTGCTTAACACGTTTTAACTCTTGCCCCGAGCAGCTCCGGATTTCCCTCGGCAGCCCGGGTTAGGTTTGATTTAAGAGGCTGCAAGGAAAAGCCAAAATAAAAA\n>URS00021F6806 misc_RNA from 1 species \nCGGAACTTCATTTCCCAGCCATGGATGTGGACGTCAATCCCTATCCTGGTGCACGCATTCCTGCTGCCTCACACGCTCGCCCACCAGTGTCGTCTTCACCTAGCGCTCGACCTCCAGCTCACCTCTGCCCTCTCATGCTTGCCGAGCTGCTCTCAGATGGTTGCTCGCGAGTTTCTTCCTCCCCAACACCGTCAGCTTGCCGCGTCTCTGGTCCAGCTCCAGCTCGTCGAGTCCCTCTCTGTGTGCGCCATGCAGCTCGCTCGGCCGCGACCTTGCCGAGCTCCGCCCCTGCTCCACGTCTCCTGGTCGGGCTCTCGTTCTGCGCGTGACGCCGCTGTTCCCTGGTGCTCCCTGCTCGACCCTGCTTCTTCTTCCTTGAGCCTCGCCGTGCGAGTTCTCCCTGGCTCATGTGCCTACCGCCGTCGGCCCCAGTCTCTCGCTCGCAAGGTCTTCCCAAGCCGTCGTCTCCTGCCTCTGGCTGTCAAGCGCGACGAACTCGTCCCGAGCTCGTCACAACGTCTCAGCCCTGCGTGTCGCGCTAGCTCGCGTCTATGGTCGCGTCCGCTGAACTCGCCAACGCCCTGTTGCCAGTCCGACTATCGTCGCTACTGCGTGCCTCGCTGCGCGCTCGTTGGTGGTGCCGTCTGTTGTGCCCCTGCATCCGCCCTTGTCGCTAGTGCCAACTCCGGCCGTCGCGGTATCTGCTCCGTCCTGGCGCCCTGCGCTAGTGCTCTGCTTCCTGGCCCCGCCTGGCCTCCAGCTTGCTCAACAGTACTATCCATTTCGTCGTCATACGTCTCCGCGTCATGTACAATAACGTCGTCGACCATGCCTTCGCCTGCTTTGACGCGTCGAGCTCCTTCCCGTTGTGACTCGCGCACCATCTATTCATCAAAATGGAATACTAATGAGCTCCTCGCGACGCAGTTTCTCTGTGTCGTCGTTCGCGCCGGTAAGATCCACGGTTCTGCTTTGTTCCATTAAATTCTCTTCTAGCACTATTTTGGCTAGGTGTGGATTTATGTGTATATGTGTGGATCTGTAAAGGAAGACGAAAGGGAAGCGCCAGTGCAACTTGTAACACCCCAGGTGTTTGCCTTAAATTAAACTGCAATTATGGATCCTTAAGAAAAATATCAGTTTGGATCACTCGAATTAGCGAATGTAAATTTAGGAAGCACTTGTATTTATAATTCGGACCTCACTAGTTTGGATCGACGTGTATTCAATTCAAATTAAATTTAAAATTAAG\n>URS00014751E2 rRNA from 1 species 
\nTACGTAGGGTGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTTTGTCGCGTCGAATGTGAAAACCCAGGGCTCAACCCCGGGCCTGCAGTCGATACGGGCAGACTAGAGTGCGGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS0001C1925D rRNA from 1 species \nAACGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGAGACCTTCGGGTCTAGTGGCGCACGGGTGCGTAACGCGTGGGAACCTGCCCTTAGGTTCGGAATAACTCCCCGAAATTGGTGCTAATACCGGATAATGTCTTCGGACCAAAGATTTATCGCCTTTGGATGGGCCCGCGTTGGATTAGCTAGTTGGTAGGGTAAAAGCCTACCAAGGCGACGATCCATAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCAATGCCGCGTGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTTACCCGGGATGATAATGACAGTACCGGGAGAATAAGCTCCGGCTAACTCCGTG\n>URS0001957C9E lncRNA from 1 species \nCCCACATTGTCCATAACAACTGACTGAGGTTCTTGTACCCAGGGCTCTAACCTGAATTTTTTGCCTGACTTTCTGTCTTCCCTAATCATTTTATATTTGCTAAAGTGGGTCTTAAAGACTTGCTTGTTCCTTTCTTACTTTAAATTCTCAACCTCCAAGATTCCTTGTGCATAGATGCTGGGTTATGCATTCCTTTTTCCAATTTTTATTTTGTTTTTCTAAGTGATGCTATTTTACTATCCTTCCATGACAGGATCCCATCAGGCCTCTACTGCACAAATAACAAGAAAAAAAAGAAAAGAAAAGAAAAGAAAGCAAACAAGTGTAATTTGTAAATCTAATATTCTTGCACAAGGAATCCACTGGATATTGTAGGCAATGGCCTTGTCATCTTAGCCACTAGAAGACTCCATCTATCAGAAGCTGGCAATTCTGAATTTTGTACAGCAAGCCGTGAGTATGGAAATGCAAGTAAGAGTTGACATTGCAGTTTTGATTCCAAATTCCATAGCTAAGCAAGTTAGAAACTCAGGTAGTATTTCTATGTTGCAGTTTTGAGGCAGATTCCTCTTCCTTCAGGAAACCTCAGTGTTTGCTCTTTAGACCTTCAGCTAATTGGATGTGACTCACCCACATTATGCAGGGTATCTAGCTTATTGCAGGTCTGCTGATTAAAAAAAGTGCCTTCATAGCATCAAGACATCTTGTTGTTAATGAAACAACTAGATATCATAACCTCGTCAAGTCGACACACACAATAAACCTTCAAAGGAATATTTTATTTAATAACCT\n>URS000133998B rRNA from 1 species \nTACGTAGGGGGGCAAGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGTCCGGTAAGTCGGCTGTGAAAGTCCAGGGCTCAACCCTGGGATGCCGGTCGATACTGCCGGACTAGAGTTCGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCAATGGCGAAGGCAGCTCGCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTGGGAGCAAACAGG\n>URS00011EADB4 rRNA from 1 species 
\nTACGTAGGGGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCATACAGGTCAGCTGTGAAAACTCGAGGCTCAACCTCGAGACGTCGGTTGAAACCGTATGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAAGAACACCCGTGGCGAAGGCGGCCTGCTGGGCAGTTTTGCTGACACTGAGGCGCGACAGCGTGGGGAGCAAACAGGG\n>URS0001797414 rRNA from 1 species \nTACGAAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGTAGGCGGTTGTTTAAGTCTGCTGTGAAATCCCCGGGCTCAACCTGGGAATGGCGATGGATACTGGCGAGCTAGAGTGTGTCAGAGGATGGTGGAATTCCCGGTGTAGCGGTGAAATGCGTAGAGATCGGGAGGAACATCAGTGGCGAAGGCGGCCATCTGGGACAACACTGACGCTGAAGCACGAAAGCGTGGGGAGCAAACAGG\n>URS00012E3FAA rRNA from 1 species \nATTGAACGCTGGCGGCATGCTTTACACATGCAAGTCGAACGGTAACAGGTTAAGCTGACGAGTGGCGAACGGGTGAGTAATGCATCGGAACGTGCCCGATCGTGGGGGATAACGCAGCGAAAGCTGCGCTAATACCGCATACGATCTGAGGATGAAAGCGGGGGACCGTAAGGCCTCGCGCGATCGGAGCGGCCGATGTCAGATTAGGTAGTTGGTGGGGTAAAGGCTCACCAAGCCAACGATCTGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGAGACGGCGCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGAAAGCCTGATTCAGCAATGCCGCGTGCAGGAAGAAGGCCTTCGGGTTGTAAACTGCTTTTGTACGGAGCGAAAAGGCTCTCTCTAATACAGGGGGCTCATGACGGTACCGTAAGAATAAGCACCGGCTAACTACGTGCCAGCCGCCGCAGTAAGAC\n>URS000218DCF5 lncRNA from 1 species 
\nTATACTAAACCTCATCTAATAACCCACTCAGGAAACTACATGAAAAAAGTCACTACTGACGTGTAAAGTCATATACATACATACATATATACTAACCTCATCTAACAACCCACTCAGGGAAACTACATGAAAAAGTCACTAATTGATGTAGTAAGATCATATACTACATACATATATACTAAACTCATCTAACTAACCCAACTTCAGGAAAACTAAATGAAAAAGTCCTACTGATTGTAGTAAGTCATATACATACATACATATATACCTAAACCTCATCTAATAACTCACTCAGAACTACACAAAACGAAAAAGTCACTACTGATGTAGTTAAGTTATATACATACAAGACATATATACTAAACCTATCTAAACAACCCATTCAGGAAACTACAAACGAAAAGTCAACTACTGACGTAGTAAGTCATATGCCTACATAAAATAATATACTAAACTCATATAAACAACCCACTCACGGAAACTACAATGAAAAGTCACTACTGACGTAGTAAGTCATATACATACATACATATATACTAAACTCACTACCAACCCACTCAGGAAACTACATGAAAAAGTCACCTACTGACGTAGTAAGTCAATATAACATACATACATATATACTAAACCTCATCTAACAACCCACTCAGGAAACTACATGAAAAAGTCACTACTGATGTAGTAAGTCATATTCATACATACATACTGTATTACATATATGTTAGAAATGAACTAATTTTTTCGACGTATTTGTTCATGTGAATTTTGCAATATAAAGAGTTGTTTCAAATGTGGCGGTATTGAATCTTCTTTTATATACTGTGGATTCATTATGATTATTGGGATACCAATTTTCATAGAATTTGTGGGTATTTGTAAACCACAAGGAAATGTGATATAATTGCCAATGAGACAACTATCCAATGCTGGCAGACAGTTAACATGGGTTGATTCAATGGTTACTGCCTAAGATTTAAGATGAACACTTTATTCATTTATCCAAAAAAGGAGAAAGAGGATGGTTAAGACTTATACAAAAGACTTTTTTAAGTAGTAAAGTACTCCTTAACTAGCACAATAAGAAAAGGCACAAATATCAATTAAAAAAAACTGTTAAATTTTAGTGAAAATTAATTAGCAATTTTAATAGAAATTTTATTTAACATCATGAATCAAAATTTTTAAAAAAAGTAACGCTCATGTATTCTTGTTTAAAAGTATGAACAATTTGTATCTTCCAGGCAGTAGATCTGTTACTCCAGCAGTTAACATCTTCACTGGATGAAGACTTGGCCGATGTTGATGAGTATGAAAGAGGCGTTGATGATGTGAAAAATACGATAAAAACTCCTATCATACCCAGGACTATACAGAAATATTGAG\n>URS000051BDF4 rRNA from 1 species \nATAGCGTATACTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTAATCTCTCTTGGGGTTCCTTTTCTAAAGAAATGTGCGACCATTCAAGAGAGATTATCCTCGTGCCTAGCCTTTCTCACTTTCATTAGTCAGGAAGGGGACGCACGTCATTTACTGTGAGCAAAATAGAGTGTTCAAAGCAGGCTTAGGCCATGAATATATTAGCATGGAATAATAAGATAGGACTTGGGTCTATTTTGTTGGTTTGCAGACCGAAGTAATGATTAATAGGGATAGCTGGGGGTATTTATATTCCGATGTCAGAGGTGAAATTCTTAGATTTTCGGAAGATAAACTTATGCGAAAGCATTTACCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCGAAGATGATTAGATACCATCGTAGTCTTAACCATAAACTATGCCGACTCAGGATTGGTGAACGTTGATTTAATGACTTCATCAGCACTGTATGAGAAATCAAAGTCTTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTA\n>URS00021995E3 rRNA 
from 1 species \nGGTTAAGCGACTAAGCGTACACGGTGGATGCCCTGGCAGTCAGAGGCGATGAAGGACGTGCTAATCTGCGATAAGCGTCGGTAAGGTGATATGAACCGTTATAACCGGCGATTTCCGAATGGGGAAACCCAGTGTGATTCGTCACACTATCATTAACTGAATCCATAGGTTAATGAGGCGAACCGGGGGAACTGAAACATCTAAGTACCCCGAGGAAAAGAAATCAACCGAGATTCCCCCAGTAGCGGCGAGCGAACGGGGAGCAGCCCAGAGCCTGAATCAGTGTGTGTGTTAGTGGAAGCGTCTGGAAAGGCGTGCGATACAGGGTGACAGCCCCGTACACAAAAATGCACATACTGTGAGCTCGATGAGTAGGGCGGGACACGTGGTATCCTGTCTGAATATGGGGGGACCATCCTCCAAGGCTAAATACTCCTGACTGACCGATAGTGAACCAGTACCGTGAGGGAAAGGCGAAAAGAACCCCGGCGAGGGGAGTGAAAAAGAACCTGAAACCGTGTACGTACAAGCAGTGGGAGCACGCTTAGGCGTGTGACTGCGTACCTTTTGTATAATGGGTCAGCGACTTATATTCTGTAGCAAGGTTAACCGAATAGGGGAGCCGAAGGGAAACCGAGTCTTAACTGGGCGTTAAGTTGCAGGGTATAGACCCGAAACCCGGTGATCTAGCCATGGGCAGGTTGAAGGTTGGGTAACACTAACTGGAGGACCGAACCGACTAATGTTGAAAAATTAGCGGATGACTTGTGGCTGGGGGTGAAAGGCCAATCAAACCGGGAGATAGCTGGTTCTCCCCGAAAGCTATTTAGGTAGCGCCTCGTGAATTCATCTCCGGGGGTAGAGCACTGTTTCGGCAAGGGGGTCATCCCGACTTACCAACCCGATGCAAACTGCGAATACCGGAGAATGTTATCACGGGAGACACACGGCGGGTGCTAACGTCCGTCGTGAAGAGGGAAACAACCCAGACCGCCAGCTAAGGTCCCAAAGTCATGGTTAAGTGGGAAACGATGTGGGAAGGCCCAGACAGCCAGGATGTTGGCTTAGAAGCAGCCATCATTTAAAGAAAGCGTAATAGCTCACTGGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTAAACCATGCACCGAAGCTGCGGCAGCGACGCTTATGCGTTGTTGGGTAGGGGAGCGTTCTGTAAGCCTGTGAAGGTGTGCTGTGAGGTATGCTGGAGGTATCAGAAGTGCGAATGCTGACATAAGTAACGATAAAGCGGGTGAAAAGCCCGCTCGCCGGAAGACCAAGGGTTCCTGTCCAACGTTAATCGGGGCAGGGTGAGTCGACCCCTAAGGCGAGGCCGAAAGGCGTAGTCGATGGGAAACAGGTTAATATTCCTGTACTTGGTGTTACTGCGAAGGGGGGACGGAGAAGGCTATGTTGGCCGGGCGACGGTTGTCCCGGTTTAAGCGTGTAGGCTGGTTTTCCAGGCAAATCCGGAAAATCAAGGCCGAGGCGTGATGACGAGGCACTACGGTGCTGAAGCAACAAATGCCCTGCTTCCAGGAAAAGCCTCTAAGCATCAGGTAACATCAAATCGTACCCCAAACCGACACAGGTGGTCAGGTAGAGAATACCAAGGCGCTTGAGAGAACTCGGGTGAAGGAACTAGGCAAAATGGTGCCGTAACTTCGGGAGAAGGCACGCTGATACGTAGGTGAAGCGACTTGCTCGTGGAGCTGAAATCAGTCGAAGATACCAGCTGGCTGCAACTGTTTATTAAAAACACAGCACTGTGCAAACACGAAAGTGGACGTATACGGTGTGACGCCTGCCCGGTGCCGGAAGGTTAATTGATGGGGTTAGCGCAAGCGAAGCTCTTGATCGAAGCCCCGGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGCGTAATGATG
GCCAGGCTGTCTCCACCCGAGACTCAGTGAAATTGAACTCGCTGTGAAGATGCAGTGTACCCGCGGCAAGACGGAAAGACCCCG\n>URS0000E9EAA2 lncRNA from 1 species \nCCCATCTCCGTGGCTGAGGGCCTAGGGAGGAGGGAAAATCCATCCTCAGACACACTAGATCCTCAGCGAGACCTGCTGTGGAGAGCATCAAACGGACCGCACGCGGACCCACCTGCCTTCCAAAGTTTGGGGCGTGAGGAAGCTGAGGCACGTGGCGTTTGGTTATGGCACAGCTGAGGGGTCTGCAGGAGACCCCAGAAAATGCCGCTGAGGACGGATTCACCGACGTCATCAAAAGCCGCGCTGGTACTGACAAGACATTGAAATTGCTGCCGAAGTAAATGACTAGAGGAATAGGTAACTCTTTTTATTTTGTAACCTATTATTTTTCTACCTTTCCTAATAAAGAGAGAGAATTGACAAATACTGATTTAGGAACTGTGGGCTAGTCTAATGTGTTGTTGACAGAAGTTGAAGAGGGTAGTGAAAAAATGATCACGAATTATCGCTAAAGTTAAATTCAAAGTAAATTATTTTCTAACTTCAAAACAAAACTTTATAAACATCTCTAGAAAATGTTCTCTTAGTTATGCCCATTTTGTTTACAGTTGATTAGAAGTAGAATAGAAAAATGACAGAGT\n>URS0000292678 rRNA from 1 species \nGCCTAACACATGCAAGTCGAACGAAGGCTTCGGCCTTAGTGGCGCACGGGTGCGTAACGCGTGGGAATCTGCCCCTTGGTTCGGAATAACAGTTGGAAACGACTGCTAATACCGGATGATGACGTAAGTCCAAAGATTTATCGCCGAGGGATGAGCCCGCGTAGGATTAGGTAGTTGGTGTGGTAAAGGCGCACCAAGCCGACGATCCTTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCAATGCCGCGTGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTTACCCGGGATGATAATGACAGTACCGGGAGAATAAGCTCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGAGCTAGCGTTATTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGCTTTGTAAGTAAGAGGTGAAAGCCCAGAGCTCAACTCTGGAATTGCCTTTTAGACTGCATCGCTTGAATCATGGAGAGGTCAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGGCTGACTGGACATGTATTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGATAACTAGCTGTCCGGACACTTGGTGTTTGGGTGGCGCAGCTAACGCATTAAGTTATCCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCTGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGCAGAACCTTACCAGCGTTTGACATGGCAGGACGACTTCCAGAGATGGATTTCTTCCCTTCGGGGACCTGCACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGCCTTTAGTTGCCATCATTTAGTTGGGCACTTTAAAGGAACCGCCGGTGATAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTACGCGCTGGGCTACACACGTGCTACAATGGCGGTGACAGTGGGCAGCAAGCACGCGAGTGTGAGCTAATCTCCAAAAGCCGTCTCAGTTCGGATTGTTCTCTGCAACTCGAGAGCATGAAGGCGGAATCGCTAGTAATCGCGGA
TCAGCATGCCGCGGTGAATACGTTCCCAGGCCTTGTACACACCGCCCGTCACACCATGGGAGTTGGATTCACCCGAAGGCGTTGCGCTAACTCGTAAGAGAGGCAGGCGACCACGGTGGGTTTAGCGACTGGGGTGAAGTCGTAACAAGGTAGCCGTAGGGGAACCTGCGGCTGGATCACCTCCT\n>URS00013010D6 rRNA from 1 species \nTACAGAGGTCTCAAGCGTTGTTCGGATTCATTGGGCGTAAGGGGTGCGTAGGCGGCGCGGTAAGTCGGGTGTGAAATCTTGGAGCTTAACTCCGAAACTGCATTCGATACTGCCGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGCGTAGCGGTGAAATGCGTAGATATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACGCTGAGGCACGAAGGTCAGGGGAGCAAACGGGG\n>URS00004F080A rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACGGACGAGAAGCTTGCTTCTCTGATGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGTAGCTAATACCGGATAATATTTTGAACCGCATGGTTCAAAAGTGAAAGACGGTCTTGCTGTCACTTATAGATGGATCCGCGCTGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCATAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACATATGTGTAAGTAACTGTGCACATCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGTTTTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGAAAACTTGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGCAGAGATATGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACGCTGATGTGCGAAAGCATGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAATCTTGACATCCTTTGACAACTCTAGAGATAGAGCCTTCCCCTTCGGGGGACAAAGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTAAGCTTAGTTGCCATCATTAAGTTGGGCACTCTAAGTTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGATTTGGGCTACACACGTGCTACAATGGACAATACAAAGGGCAGCGAAACCGCGAGGTCAAGCAAATCCCATAAAGTTGTTCTCAGTTCGGATTGTAGTCTGCAACTCGACTACATGAAGCTGGAATCGCTAGTAATCGTAGATCAGCATGCTACGGTGAATACGTTCCCGGGTCT\n>URS000069B5BC tRNA from 1 species 
\nGCCTGGGTGGCTCAGTCGGTTGGGCGTCCGACCTCAGCTTAGGTCATGGTCTCATGGTTCATGGGTTCGAGCCCCACCTCAGGCT\n>URS000209731F rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTGCAGGGTACTCGAGTGGCGAACGGGTGAGTAACACGTGGGTGATCTGCCCTGCACTTCGGGATAAGCCTGGGAAACTGGGCCTAATACCGGATAGGAGCCATTTTTAGTGTGATGGTTGGAAAGTTTTTTCGGTGTAGGATGAGCTCGCGGCCTATCAGCTTGTTGGTGGGGTAATGGCCTACCAAGGCGGCGACGGGTAGCCGGCCTGAGAGGGTGGACGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAAGATTGCACAAGGGGCGCAAGCCTGATGCAGCGACGCCGCGTGGGGGATGACGGCCTTCGGGTTGTAAACTCCTTTCGCTAGGGACGAAGCTTTTTGTGACGGTACCTAGATAAGAAGCACCGGCTAACTACGTG\n>URS0001E64AC9 rRNA from 1 species \nAGCGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACGAACCTTTCGGGGTTAGTGGCGGACGGGTGAGTAACACGTGGGAACGTGCCTTTAGGTTCGGAATAACTCAGGGAAACTTGTGCTAATACCGAATGTGCCCTTCGGGGGAAAGATTTATCGCCTTTAGAGCGGCCCGCGTCTGCTTAGCTAGTTGGTTGAGGTAATGGCTCACCAAGGCGACGATCAGTAGCTGGTCTGAGAGGATGATCAGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCCATGCCGCGTGAATGATGAAGGTCTTAGGATTGTAAAATTCTTTCACCGGGGATGATAATGACGGTACCCGGAGAAGAAGCCCCGGCTAACTTCGTG\n>URS0000A2C0F7 rRNA from 1 species \nCACCGCGGTTATACGAGAGGCCCAAGCTGACAGCTACCGGCGTAAAGAGTGGTTAATTCACCCCCACAAACTAAAGCCGAACATCTCCAAAGTTGTAAAACGCACTCGAAGGTATGAAGATCACCCACGAAAGTGGCTTTATAACCCTTGAACCCACGAAAACTAGGGAA\n>URS0000BA4FCD rRNA from 2 species 
\nCGTGGGAATACCTGCCCAGTATGCGGGGGATAACTATCTGAGACTCAGATGCTAATACCGCATAACAACTTCGCCCGCATGGTCCGAGTTTGAAAGATGGCTTCGGCTATCACTTCTGGATGGTCCCGCGGCGTATTAGCTAGATGGTGAGGTAACGGCTCACCATGGCAATGATACGTAGCCGACCTGAGAGGGTAATCGGCCACATTGGGACTGAGACACGGCTCAAACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGACGAAAGTCTGATGGAGCAACGCCGCGTGAGTGAAGAAGGGTTTCGGCTCGTAAAACTCTGTTGTTAAAGAAGAACATATCTGAGAGTAACTGTTCAGGTATTGACGGTATTTAACCAGAAAGCCACGGCTAAGTACGTGTCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGTTTTTTAAGTCTGATGTGAAAGCCTTCGGCTCAACCGAAGAAGTGCATCGGAAACTGGGAAACTTGAGTGCAGAAGAGGACAGTGGAACTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAAGAACACCAGTGGCGAAGGCGGCTGTCTGGTCTGTAACTGACGCTGAGGCTCGAAAGTATGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCATACCGTAAACGATGAATGCTAAGTGTTGGAGGGTTCCGCCCTTCAGTGCTGC\n>URS00004CE42D rRNA from 1 species \nGATCAGGCTCAGGATGAACGCTAGCTACAGGCTTAACACATGCAAGTCGAGGGGCAGCATGGTCTTAGCTTGCTAAGGCCGATGGCGACCGGCGCACGGGTGAGTAACACGTATCCAACCTGCCGTCTACTCTTGGACAGCCTTCTGAAAGGAAGATTAATACAAGATGGCATCATGAGTCCGCATGTTCACATGATTAAAGGTATTCCGGTAGACGATGGGG\n>URS0000251C9B rRNA from 1 species \nGACCAAGGAGTCTAGCATGTGCGCGAGTCATTGGGACATAACTAAACCTAAAGGCGTAATGAAAGTAAAGGTCTGCCTTGCGTAGACCGAGGGAAGATGAGCGGTTTGCCCATAAAGTGGCCGCTCCGCATTCCCGGGGCGTCTCGTTCTCATTGCGAGAAGAGGCGCACCAAGAGCGTACACGCTGGGACCCGAAAGATGGTGAACTATGCCTGGTCAGGACGAAGTCAGGGGAAACCCTGATGGAGGTCCGTAGCGATTCTGACGTGCAAATCGATCGTCGGAACTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGCGCTCGTTGCGTACGAGTTTCATCCGGTAAAGCGAATGATTAGAGGCATTGGGGTCGAAACGACCTCAACCTATTCTCAAACTTTAAATGGGTGAGATCTCCGGCTTGCTCGAACTCATGAAGCCGCGAGACTCGAATCAGAGTGCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGCTGTGGGATGAACCAAACGTCGAGTTAAAGCGCCTAAATCGACGCTTATGGGATACCATGAAAGGCGTTGGTAACTTAAGACAGCAGGACGGTG\n>URS0000A30B64 rRNA from 1 species 
\nCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGGAATGATGAAGAGGCTTGCTTCTTCTGATTTTAGCGGCGGACGGGTGAGTAACACGTGGGCAACCTACCTTGTAGATTGGGATAACTCCGGGAAACCGGGGCTAATACCGAATAATCCATTTTGCTTCATGGCGAGATGTTGAAAGACGGTTTCGGCTGTCACTATAAGATGGGCCCGCGGCGCATTAGCTAGTTGGTAGGGTAATGGCCTACCAAGGCGACGATGCGTAGCCGACCTGAGAGGGTGGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGGCAGCAGTAGGGAATCTTCCACAATGGACGAAAGTACTGATGGAGCAACGCCGCGTGAGTGAAGAAGGTTTCGGTATCGTAAACTACTGTTGTAAGGAAGAACACGTACGAGAGTAACTGCTCGTACCTTGACGGTACCTTATTAGAAAGCCACGGCTAACTACGTG\n>URS00015CBD71 rRNA from 1 species \nTAGGGAATCTTCCACAATGGACGCAAGTCTGATGGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGACCGTAAAGCTCTGTTGTTGGTGAAGAAGGATAGAGGTAGTAACTGGCCTTTATTTGACGGTAATCAACCAGAAAGTCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGAAGAATAAGTCTGATGTGAAAGCCCTCGGCTTAACCGAGGAATTGCATCGGAAACTGTTTTTCTTGAGTGCAGAAGAGGAGAGTAGAACTCCATGTGTAGCGGTGGAATGCGTAGATATATGGAAGAATACCAGTGGCGAAGGCGGCTCTCTGGTCTGCAACTGACGCTGAGGCTCGAAAGCATGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGATG\n>URS0001547F59 rRNA from 1 species \nTCGGGAATTTTGCTCAATGGGGGAAACCCTGAAGCAGCAACGCCGCGTGAGGGATGACGGCCTTCGGGTTGTAAACCTCTTTTCTCAGGGACGATGATGACGGTACCTGAGGAATAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTACTGGGCGTAAAGAGCGCGCAGGCGGTCGTGCAAGTCGAGTGTGAAAGCCCCCGGCTCAACTGGGGAGGGTCACTCGATACTGCTCGACTCGAAGGCGGGAGAGGGAAGTGGAATTCCCGGTGTAGTGGTGAAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGACTTCCTGGCCCGTTCTTGACGCTGAGGCGCGAAAGCTAGGGGAGCAAACG\n>URS000083C0E2 tRNA from 1 species \nCAGAACATAATTAAATTAGAATGCTGGCTTTGGGGGTCAGTTGTGGGGGTAAGAGTCCCCCTGTTCTGA\n>URS0000ABDE67 miRNA from 1 species \nTTTGGTTTGAAGGGAGCCCCT\n>URS000003005D rRNA from 1 species 
\nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGGACAGATGGGAGCTTGCTCCCTGATGTTAGCGGCGGACGGGTGAGTAACACGTGGGTAACCTGCCTGTAAGACTGGGATAACTCCGGGAAACCGGGGCTAATACCGGATGCTTGTTTGAACCGCATGGTTCAAACATAAAAGGTGGCTTCGGCTACCACTTACAGATGGACCCGCGGCGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTTTTCGGATCGTAAAGCTCTGTTGTTAGGGAAGAACAAGTACCGTTCGAATAGGGCGGTACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGCAGGCGGTTCCTTAAGTCTGATGTGAAAGCCCCCGGCTCAACCGGGGAGGGTCATTGGAAACTGGGGAACTTGAGTGCAGAAGAGGAGAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTCTGACAATCCTAGAGATAGGACGTCCCCTTCGGGGGCAGAGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGATCTTAGTTGCCAGCATTCAGTTGGGCACTCTAAGGTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGACAGAACAAAGGGCAGCGAAACCGCGAGGTTAAGCCAATCCCACAAATCTGTTCTCAGTTCGGATCGCAGTCTGCAACTCGACTGCGTGAAGCTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGTCGGTGAGGTAACCTTTATGGAGCCAGCCGCCGAAGGTGGGACAGATGATTGGGGTG\n>URS00020EF123 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCATTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTCGACTTTGGGATAACTTCAGGAAACTGGGGCTACTACCGGATAGTAGCTCCTGCTGCATGGAGGGGGGTGGAAAGTTTCGGCGGTCGGAGATGGACTCGCGGCTTATCAGCTTGTTGGGGGGGTAGTGGCGTACCACGGCTTGGACGGGTAGCCCGCCTTGGAGGGGGAGCGGGCACATGAGGACTGCGATACGGCGCAGTGTGGAACATGGGGCAGCAGGGGGGAATATTACGCAGCGGGCCGGCGCGTAATGCAACAACGCCGCGTTCGGAATGACCGTCTACGGGTTGTAAACCGCTTAAGCCTGAGACGAAGCGTGATTGACGGTAACGGGTAAAGAAGCACCGGCTAACTACGTG\n>URS00000CB0F4 
tRNA from 1 species \nATTAAAGTGGCAGAGTAGTGCATTAGATTTAAGCTTTAAACATAGAGAAGTTCTCTTTAATA\n>URS0000AF4368 rRNA from 1 species \nAACGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGAAGATTTATCTTAGTGGCGAACGGGTGAGTAACGCGTGGGAATCTGCCTTTCAGTGGGGGATAACTCAGAGAAATTTGAGCTAATACCGCATACGACCTTCGGGTGAAAGATTTATTGCTGAAAGATGGGCCCGCGTTAGATTAGGTAGTTGGTAGGGTAAAGGCCTACCAAGCCTACGATCTATAGCTGGTTTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGAAACCCTGATCCAGCAATGCCGCGTGAGTGAAGAAGGCCTTCGGGTTGTAAAACTCTTTCAATGGGGAGGATGATGACGTTACCATAGAAG\n>URS000012F352 misc_RNA from 1 species \nTGTACTCGATCCAGAATCATTCCCAAAAGGTCGGAACGAGGTATGTGGCTTTCAAACTAGGTTCTGGGTTCATAAAAGACCTGAATCAGGAACAAGGGATATTAGCTCAGGTGGTTAGAGCGCACCCCTGATAAGGGTGAGGTCCCTGGTTCGAGTCCAGGATGGCCCACCTGCACAGGTGGCAAAAACAAAAAAAACAAGCGAGGAATCCCCACCTTATCTTACTTATATAGTAAGAAAGAATGCTGGCTCTGAGTACAGAGTCCGAAGGAACCTTGAAAACTGCATAGAGCTAGGTGAAAAAGCCAAAAAAAAGGACCGCAAA\n>URS000182AB58 rRNA from 1 species \nTACGTAGGGGCCTAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGTTCGGTAAGTCAGGTGTGAAATCTCCACGCTCAACGTGGAGGCGCCACCTGAAACTGCCGTGACTCGAGTCCGGTAGGGGAGTGTGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGAGAGGAACACCTGCGGCGAAGGCGGGTTGCTGGGCTGACACTGACGCTGAAGTGCGAAAGCTAGGGGAGCGAACGGG\n>URS0001D66A4A rRNA from 1 species \nAACGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGCCCTTTCGGGGGAGCGGCGGACGGGTGAGTAACGCGTGGGAATATGCCCTTCTCTACGGAATAGCCTCGGGAAACTGAGGGTAATACCGTATACGCCCTGTGGGGGAAAGATTTATCGGGGAAGGATTAGCCCGCGTTGGATTAGGTAGTTGGTGGGGTAATGGCCTACCAAGCCGACGATCCATAGCTGGTTTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTAGACAATGGGGGCAACCCTGATCGAGCCATGCCGCGTGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTCAGCTGGGAAGATAATGACGGTACCAGCAGAAGAAGCCCCGGCTAACTCCGTG\n>URS000233F9F7 lncRNA from 1 species 
\nCAGCTCAAGGCTGTAGGAGGAAGAAAAATCTAGTCCCTGGGGGTACTGATGAATCAGTTGGATGGTGGGCGTTGGACTGTGAATTCCTGATGCCTCTGGGTAAACTCTGGAGGAAATTCTGTTTCATTACTTGCACTCAGCCCTCCTATTTTGTACTAAGGTATTCTTGAATACAAGTGCACCGGCCAAAAAAGTAAACTTACGCATAAAAAGAAAGGCTCTCTTCCTTCCAAGAATGCTGAACACCTTTGAAGTCTCTGTTGCTGCCTCATCTTTTAGATACAATCATTGATTATGTATTTTTGGCATCGTCCTGAACTTTGTTTCATTTCCTTCACAGTTGAATGTGCAGTTGGCTTTGTCCACTCAGTGATGGTCCTTGTGACTGTTCTTGGCTTTTCTGTTGTTTTTCCATCTTTCTATAGGAAGCTTGAGACCGATACTCATCGTTTGCTTTCAGCACCTTAATTTTGCTTTGTTCATTTTTGTAAAGTAAGGGCAAATGGCCACCGGAATGTACAGTGATTAAAGAAGCAAACTCTGTCAAAGATGGTGATTAGTGGCCAGCCAGTCCCTCTCAGGATCACTGTATTAAAAAGTGCTCATTTGCCAGTGACATTTTTTTTTGGTTTTGGTTTTTTTTTTTTTTTTTTTTTTTGAGACTGAGTGTCACTCTGTCGCCCAGGCTGGAATGCAGTGGCCTGATCTCAGCTCACTGCAACCTCCACCTCCCAGGTTCAAGTGATTCTCGTGCCTCAGCCTTCTGAGTAGCTGGGACTACAGGCGCCCAATACCATGACTGGCTAATTTTTTTTTTTTTAAATTTTAAGTAGAGATGAGATTTTGCCATGTTGGCCTGTTTGGCCTTATACTCCTCATCTCAGGTGATCCACCTGCCTCGGCCCCCCAAATGCCAGTGACATTTGTAGGTGGATTCAGATTAAGGTGGGTAGCTTAGTTGAGGCGTCTCAACCCTTTTCTGTGCACTCTCTCAAGATGATTTCTGAACACACAACTATAAGTGCATGAGAACTTAAATACGTGTGCTCTTATGCTAATTATACACAAAGTAAAAGTTTTTTCACAAGGAGAATTTTTTTCTCCAGCAAATAGCTCGCTCACCCTAGGGGTACATACACCCCACTTTAGAGACCCTCAAGTTACAGTGGTATCATTAAACGATCCATAAAGGAGTGGGTTTAAGAAAGCTGATACAGGAACATGTTTGAAATAATACATTTTCTCAAGGGTGTCCTCCAACCATTTTCTTTGATAAATTATATTTCTGCCCATTGTTGACTTGAAATTGTCCTCACCCCTCTACCAAGTTCACCCAGTGTATTCTGAAGGAAAATGAATGAATATGGAAACCTCTCTCATCCTAGGCAGTAGAGCGAGGGAAGCTGCACTGGCTGAGAGGCTGTGGAACCGGATGAAAAAGCAGCCCCTGAGTCCTGTGGCGTTGGCTGTGAGTCGGCCACGTGCTTGCTGTGTGCTTTAGGAAAGTTACTTAATTTCTCTGAGCTTTAGTTTTCTCCCTCATAAGTAGGCTTGCTGTGAAAATGAAGTGAAATCACATTAATCTGCATGAGCATTTAACACGGTGCCTGGTGTACATCAGGGGTGTGACAGTGAGTGCTGGCTGCTGTAGTAATTGAATGCTTAGCTACGTGCCGGGCCCTTTGCCAGCTACAGCTCATGTGAGACCTCATGTTCAGTCTTGGCAGTAACCCAGCAAGGTAGGCATTTTACATGTGAGGAGCCTGAGAAATTCAGTCTTGGCCTGGATCACAGAGCTGGTATCCAAATTCAGGTCCGAGGCCAAAGCCCAGATCTTTGCACTACACCTTGTTGCCTGGCACAGGTGAGAGTGCCCAGCCCATAGTGGGTGCGCAATATCTGTTTCTATTTGAATGACCCAGGCAGGCGGTTAATAATGCTTGTGATTTCTTTGAGAGAGAAGTAAGTTCTTGTCTTTGGTGGGGGAAGCATCAGGTG
ACCAGCATTTGTCCAGAGCCTGGTACCCATCCTCTCCCAAGCCCAATCAGTGGTGCTTTCTCAAAAAGAAACCATCTCCTGACCACTTTGGCCATATTGGGCCTTTGCTCCTCTTCTGTAGCTATTGATAAGAGGGCTGTGGGCAGTTAGTGATAATCAAGGTCGTATCCCAACTAAGTGACAGAGCTGAGACAGTTAAGTTCCAGGACAAGTGTGTTGATCTCTGTACCCACTTGTGCCAGGTGCCTGGGGAGGTAGGGGCATGGCTGTCTGAGGGTGGAGGGGTGAGTAGGGGGCCTGCAGTGTGCTGTGACGCCTGGGAAGGGGATTCTAAGCCATTTCCCATCAGCCGTTTACTAAGTAGCCTGGGGATCTTGTTAAAATGCAGATCCTGATAGATTAGGGCTGGGGTGCTGCCCAAGATTCTACATTTCTAAGAGTCCCTGGATGACGGTGGCATTCACAGACCACAGCTTCTATGTGAGGGAGAGCAGTTGGGTTTCTGTCTGCCTGCCGCACCTGATCAGTAGTTAGTGCCTGCATGTGTGGCGGCCAGAATTTTACTTGGGGAGACGCTCGGCTCCTAGCACCCTCTGTGGTAGGGGTTTTCCAGAGTGTGGGCATTACCCCAACTGTCTCTGCAGACGGCTTCCTGCATGTTTCCCACAAGCGCTCAGATGGCTGAATTGGCAAGTCTGTGGTGCTGCTCTTTGGGGCCACCTCGTTCTTTGCCTTTCCCTCCCCTTAGCGATGTGTCCCATCCGTTGCCTACAGTCAAGTCAGTCCACATGTTTAGGCTAAGGTGGGCATGACCGAGTGGCCTTCCCCCGGGAAGACCAGTGTCGTAACTGGAATTAAGTTGTGGAACATAAGAGTCAAGGCTCGTGTCTGCTGTGAACTGGAGTTGAGGGAATGTTTGGGGATCCCACCTGGTATCAGTAAGGGAACCATGGCGACGGCCAGCCTTGCCCATGTGAGGCATTTGCTTTGTCAGGCCTTCTCAGTAGTGGAGAAGGGAGGAAGGAGAATGCAGCTCTTTCAGTGCTGTCTAGCAGTGCCCAAGAGCCGTGATTGGGCACCTCACTTAACGTCTAACTTCAGATTCACTCTTGGGCATTCCTGTCTTCCTCTCCAATCTTGAATGGATGTTGGCTTCGATAATGTCATCCTGAAGTTTCTTTGTCCACACAGCCCTGGCTGGTTGTTAATAAGCTGTTAATGCAGCCTTGCACTCAGGAAGCCCTGATGTTTAAAGGAACTGTGTCTTTGTTCTTCCTCTCTTCCCTCTTTCTCTTAGTCCCACTTTATCTCTTCTTTCTCTTCCTCTCCCTCCTCCTTTTCCCCTCTCCCTCCTACTCTCCCCCTTTCTCTCCTCCTTCTCTAAGAAACCCAGTCTTAATTCCACACAATGCATGCACATGCAGTAGCTTCTCTGCTTGAGTGAGCTGGTGTGATTAGGTTTTCTAAACATGCACATTGGCCTTGCTACTTGTCCTTTTATTCCCTTCCCACAGACCATAAACCAAGAATTATTTTTATTTGTATTATTTTGATTTTTTTAAAGTAAAATATTAACTTTTCCTCTTTGAAATAAATTCCCATTTGGAACATCAGCATACAGTTTGAACATTTATTCGCCTCCTGAGCTTGTACAACAGTCGTGGGAGTTGCTGCAGAAGCAAGCGAAAAGCCAGATGAGCGCTTCTAAACTTAGAGAGAGGGAGAGCGCCTCATCTCTTCCATTTTCCAGGTATTCCTGAGATGATTTATTGGAGCTCAAAGCTTTGGGAGAGTTGGGGCCTTCCATTCCCTCCAGTAAATACTTGTTTTTCTTCCACCGCTGAGGCAAATGCGGGGTGGCTGATCACCTGGCAGACATCTTAGGAAACAGGAGCACCGGTCTGGGAAACTGCTGGCCTGGCCTAACACCTGGCGCTGTGGTGCAGGCAAGAGGGCAGCCACTGAGGATTCTTGAGGAGAGAGAGACCATAGAATGAATG
AAAGAGTTGGAAAGACTTTAAAGCTCTGGGAGGCTGAATCCTTTATTTCGCTGGAAGAAAAACTGAATGCCAAGAGGGCCTCACTTTCCCCAAAGCTATACAGCCATCAGGGGCAATGCTGGGATTCCCCCATGGATCTCTTGACTCCTAATACAGTGCTCTTTCTGATATGCCATCTGGCTCCATAATGAACATTGTGTTCCAGGAAAATCAGTCTGCGCTGAACAGGATGGAATTGGGGCAGGACGTCCAGTGAGGAGGACATTGAGGCAGTAGAGCAGTTGATTGCCGAATGACCACCTACCCTGACTTAAAAGATCAACCTCAGGGAGGATTGGAGCTTTCTAGAGTCTCTTGGGACAGCAGAAGCACAGGCCGGGTTGGACTGAATCTTTAAGTGGACATGAGGGACAAAGTACCTCCTGTTGGTAAACATCTCACCACCAACCCACTGTGGTGGCTAAAATCCCACCTTTAGTCCCAGCAACATATGAGCATGTCACCAGGAGGTCTTCACAGGCCTGTCTGCCACCTGAGTGTAGACATCTTTTGGCCCTGGAGCCCAGAGAGGCTGAATGTGGAGAGGGTGGAGAGAGGTCTGTAGTCCTCAGAGAAGACTTGCAGCTTTTTCAGAGCCACCAACCCATAAAAAAAAAAATCCCCAAACAGAAAAATCCTAACTGTGGTGACCAGGTACCTCCTGAGACATGAAGCCTCCACTTACCTGGACCCTGGAGGCCTCTCCGGGCACAGCTGCCAATGTTGATCTTAGATAAGACCACCAGCAAGTAAACATCCACTGTGCAAAGCTGTGTTATCTTTGGGGAACTGAAATGTCCCCTGGGAGTTGGAAACTCCCCTAGCCACATACCACAGAGTTGAGGAAGGAAGAGCTGATGGACGGAAGAACCATGGCGGGAGGAGTCATCCGGAAGCTACCTCGCTGCCCTGTCAGTTACGGAACAGAGGAGAGATGCCGGCTGGAGGACACAGCAAATTTGAACCAAGAGGAGCTTGGAGGAAGCCCGAGCGACCTGGAGGGGACTGGCTGACCTTCCTCATTCTTTTCAAGTGTGAATAATAACCAAGCCCAGTTTGGCAACTCCTTGAGGGTGAGGACGAAGCCCCATTCTCCTTTTTGGAACTTGGTGGGGCTCAGGAAGCAGGTTCTCTCCAGTCGGTGGCTTTCCTTTCTGTTGCGGGTCTCTTGAGGGCCTGCCTTCATGAAGGCACATGAGTGACTCATCATTTGTGAATTAATTGCTATATGTGAAGGGCATCTGAGAACAAATTATCTTCATAGACTTTTCATTATAATTTTATTTGTACTGATAATTAGTTGGTTTAGCAAGCTCTTTTTTCATAGATTTGGCTAAACTTCAGTCTGAAAGAGGCAAATTCTGGGGTTCTAGAAAGAGATTTTATTCTTTGATATAGGGCTATTTGGTGGGGTTGCTTTTTGTCCTAGTTGTAGCTTTTATAATTTCGAGATTCACATTTTGCAATAGAAATATACAGGCATACCTTGGAGGCATTACAGCTTTGGTCCCAGACCACAATGAAGCAAGTCACACGAATTTTGTTGGTTTCCCAGTAAATATAAAACGTATGCTGATACCATACTATAGTCTAAGTGTGCAACAGCATATGTCTAAATGAATATACATATATATTTTTTTGAGACAGGTTCTTGCTCTGTCACCCAGGCTGGAGTGCAGTGGCACTATCATGGCTCACTGCAGCCTCCACCTCCCTGGACTAAGATGATCCTCCCACCTCAGGCTCCCAAGTAGCTGGGACTACAGGTCACACCACCACACCCAGTTAATTTTTGTATTTTTTGTAGAGACAGAGTCTTGACATGTTGCCTAGGCTGGTCTTGAACTCCTGGCTTAAGTGATCTGCCTGACTTTGCCTCCCAAAGTGCTGGGATTACAGATGTGTAGTCTTTGAAATCCAGTGTGTGTTCTTACAGTGCATTTCAATTTGGACTAGCCATG
TTTCAAATGCTCAGCAGCCACATGCGGCTCATTCTAGATAGGCGGCCATCGCTCTTAAATCCTCCCTGACCTTAGCCATGCTCTCTCATCCCTCCTCTTCGCCAAGCTCTGCCTCTCTCACTGGGGCTTCCCTAGCCTCCGGCCATCTTGGGGCCAAAGCTCTAACACTTTGCCTCTCTCGTGTCTTCTGTTCCCCTCCAGTGGCTTCTGCTTTCTGCCTTAAAATACACCCAGGTTCCTAATCCTGAAAACGTCTGTTGTGCACCGATCCCACCCTCCCCTCGTGTTACCATCTCCATTTCCTTCCCCTTTCCTTGTGTCCTCTTCTTTGCTGTGTCCTGGCCCCTCAAAACTTGACCTTGCCTCTCATCCCCACTGCTGTACTGAAACTGTTGTCTCAGCGTTGCTGATCATCCAGCCTTTTAGTCTATGGACCGCTAAGAGCCATAGGACGACCTCAGGGTGGGACGTGGCTTGGAGGGCCATCTCGTCTCAATTTCCAGATACAGACCTGTGTTGGGTTGTGTTGGATTCATGAGGAAAGCTTCATAAGTTTTATGCACGTTTATAAGACTCCATCCTTGGATTCTGATCCAGTAGCTCTGGCGTGGGGGCTTTAGAATCTGTTTCAAGTATCTCAGGTAATTTTGATTATAAATTACCAAGTATCCCAGGTAAATTTTGATTATAAATGCTTGCTTCCAGCAGAAAATATAAACATATGGAAGATGAAATCTTTCTCTCTGAATAACCCAATTCAGTTTCCACTCGTGAATATCTTATATAACCGTAGTACATTTATCAAAATTAAAACACCAGTGTTAGCACATTACTGTTAATCTCCAGACTATTTGTAAGTCACCAATTTTTCCATTGTCCCATCTGTTCTTCCTTTTCTTTCTCTTGTCATAACCACTTTTAGAGGGTTTTGAATGGTATCATTTTGTCTTCACCGTCGGCTTATTAGCTATACTGTACTGTTCTATTCTTTGAGTGGTTGCTCTAGGATTTACAAATATGACTTCAACATATTGCAGAATACCTTCAACAACTACGATATCCTTTCACAGATAGTGTAAGAACTGCACCACAGAATGCTTTCATTTCCCCACTTCTATTCTTTGTGATATTATTGTCACACATTTTATTTTTACTTAAGGTATGAGCCCCACAATGCATGTTAAATAGCCAAAGTTTTTAGACAGATTAAAGAAATTAAGAAAAAGTCTTATGAACTCAGGTATTTACTATCGTGTTGCTCCTTATTCCTTAGTGCAGATCCATTTTTCTTTTCTTTTTTATTTGAGACAGGGTCTCACTGTGTCACCTGTGGTTGAATGCAATGGCGTGATCTCAACTCACTGCAGCCTCCACCTTCTGGGCTCAACTGATCCTCCCACCTCAGCCTGTAAAGGGATATTTGCAAAGGGATATCGGAGTTGTTGAAGGTATTTGCAATATGTTGAAGTCATATTTGTTTTTTTTTTTTTTTTTTTTTTTTTTTTGAGATGGAGTCTTGCTCTGTTGTCCAGGTTAGAGTGCAGTGGCGTGATCTTGGCTCACTGCAACCCATACCTCCTGGGTTCAAGCAATTCTCCTGCCTCAGCCTCCTGAATAGCTGGGACTACAGGCATGCGCCACCACACCCAGCTAATTTTTGTATTTTTGCTAGAGATGGGGTTTTGCCATGTTGGCCAGGCTGGTCTTGAACTCCTGACCTCAAGTGATCCATCTGCCTTGGCCTCCCAAAGTGCTGGGATCACAGGCATGAGCCACCGCGCTGGGCCTGAAGTCGTATTTGTAAATCCTAATTTTTGTATTTTTTTTTGTAGAGACAAGGTCTCACCATGTCGGTCAGGCTGGCCTCACACTCCTGGGCTTAAGCAATCCTGCTGCCTCAGCATCCCAAAGTGCTGGGATTACAGGTGTGAGCCGCTGTGCCCAGCCTGTTTTTCATCTAGTATTTTCCTTCTGCCTGAAGGAAACTTCTTTGACATTTC
TTGTAATGGCAGCTCTGCTGGTGATTAATTCTTTCAGCTTTTATTTGAAAGAGTCTGTATTAAAATATATATATATTTTCACTAGGTATAGAATTTGAGGCTGACAGGTTTTTTTTTTTTTAATTTTTTCAGTACTTTAAAGATGTTAATTTTCTTATGGTTTGCCTACTTTCTGATGAGAAGTTGGCTGCTGCTCCTTTTTTTTTTTTTTTTTTTTTGAGACAGAGTCTTGCTCTGTCGCCCAGGCTGGGGTGCAGTGGCGTGATTTCGGCTCACTGCAACCTCCACCTCCCGGGTTCAAGCAATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTACAGGCACCTACCACCATGTCTGGCTAATTTTAGTAGGGATGGGGTTTCACCATCTTGGTCAGGCTGATCTCGGACTTCTGACCTCGTGATCCACCCGCCTCAGCCTTCCAAAGTGTTGGGATTATAGGCGTGAGCCACGGCGCCTGGCCTGCTGCCACTCTTATATTTGTTCTTCTGGATGGAATGTCTCTTTTTTTTCTGGTTGCTGGGAACATGGGCTATTCCCACCCCTATGTGAGCTCCAGCTGCTTGGTCTATTGGTTTCACCCTTCATATATGAAGGTTAGTACTTGTCCAAAGACTCCAGGAGACTCTTCAGCTCTCAGGAGCTTGCTCTGTGCAGCTTCCTCCTCTCGTCCTCTTCTGCCTTCAGTTCTGCCTTGGTCTTTTTTGTTTGTTTGTTTGTTTTTTGAGACAGAGCCTTGCTCTTTCGCCCAGGGCAGAGTGCAGTGGTGTAATCTTTGCTCACTGCAACCTCCGCCTCCCTGGTTCAAGCAATTCTCCTGCCTCAGCCTCCCGAGTAGTTGGGATTACAGGGGTGCAACACCACGCCCGGCTAATTTTTGTATTTTTAGTAGAGACAGGGTTTCACCATGTTGGCCAGGCTGGTCTCGAACTCTTGATCTCAGGTGATCTGCCCGCCTTGGCCTCCCAAAGTGCTGGGATTACAAGCGTGAGCCACCGCGCCCGGCCTGCCTTGGTCTTCCTGAACTCTGACTTCTGTCTCTTCAACTCCTGGAGACTACTAGACTCTGGAGTCTCTCTTTACCTTTTGGCCCAGAAACTGCTTCTGGGTAGTAGTAACCTGGTGCATTTGTTG\n>URS000117373B rRNA from 1 species \nATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGAGCGGCGGACGGGTGAGTAATGTCAGGGAAACTGCCTGATGGAGGGGGAGAACTACTGGAAACGGTAACTAATACCGCATACCATCAGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAATGGCTAACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCAACCTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGAGGAGGCGTTACTCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATTC\n>URS000199CEE7 lncRNA from 1 species 
\nATGAGCCTTGACAAAACTGTGGACAGCATACTGCTAAGCCTCACATTGTTCAGCCTTCTGATTTTCCTTGGAAGTTTGCTGATATGTGCGTGTAGAAGGTATAGATTCCTGGAAGTTATAACCATGCCCTTTCCAGCTCCTACAGATAAAGTTACAACGTGGTTAGCTACAGATGAGACTCACCATCAGAAACAAAATTCAGTGCAAATGGAGATGCAGTCAGAGGTCATACTGAGAATATCAGAAGATAATGGAGATGAGGACATTCAACAACATACACATTTGAAAGAATCTGAAGACCTGAATTAATGCCTCCTTAGAGGAACTTGGTCAAAGCAGGGACTAGACAGGCAAAAGAGTAATGCATGTGTGTCAGACTGGAGTTTCCAAGACTTGCTGAAATTTTAATAGATCTTCCTGGCATGTGTAATGGATAAATGAGTGAAAGAAGCTAACCCAAGAAAAGTGAACAGACAGATCAAAACTGGTACCACATCATCTGGCTGGGGACTTTGCTAATGTGACAAAACTGATAAGAGTCTATAGCAGCATATAGATGTCCAGGTAATACAGGAGGAAATACATTCTAGTGCTACCTCTTGTGTAACAGCCTCCTCACCCACTTTTCTCTGCCACAGAAGGCCCGCTACTTCTGCCTCTGATGTGCGGACAGAGGTGGCTAATGTCATGTGAGGTGCACCAAGCATGCGGAGTGACAGGAGCAGGTCTTATTAGTAAGTGGGGAGGAGGCAGGC\n>URS000005DFD5 sRNA from 1 species \nCGGCGCTGTGGCGCCGGTTCGTTGCGGAGGATGCCGGCCGAGCGATCAGCCGGCATTCTCCGTTTCTG\n>URS00017CC290 rRNA from 1 species \nCACGTAGGGTCCGAGCGTTGTCCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTGGGTCAGTCGCTGGTGAAAGCCCCACGCTCAACGTGGGAATGGCCAACGAGACGGCCCGACTGGAGGCAGGGAGAGGCCGGTGGAATTCCGGGTGAGTGGTGAAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGGCGGTTAGCTGGCCTGTAACTGACACTGGAGGCGCGAAAGGCTAGGGGGAGCGAACAGG\n>URS0002351B0D lncRNA from 1 species \nCTTGTGTTCGATTGATTGATAGATGTCTCATTACAAGGCCCTAGGGTCTACATTTATACCCTGCTCAAAGAGCTATAATCAGACTCGACTAGGACTCGAATTCCAAATTAAACAGAATCCATATACAAAACAAATTTAAATAACTAAGAAAAACATAAAACCACCACTTCGTAACCGACCGGAACACCGCCACAGATCAATCGGCAACCTCCACGCTTCCCTTCAGATTCATCGGCAGTCTTCCTGTTATAGCCATCGGCAAACACCAATATTAATCATCGGC\n>URS0002307C0E misc_RNA from 1 species \nAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTAACGAGTTCTGAAAGGGGTTGTAGCTGGCCTTCCGGGGCATGTGCACACCCTGCTCATCCACTCTACACCTGTGCACTTACTGTAGGTTTGGCGTGGGCTTCGGGGCCTCCGGGTCTTTGAGGCATTCTGCCGGCCTATGTATCACTACAAACACATAAAGTAACAGAATGTATTAGCGTCTAACGCATCTAAATACAACTTTCAGCAACGGATCTCTTGGCTCTC\n>URS000259D3E0 sRNA from 1 species 
\nGTCCCAAGTTACCCCAAGGACGCCGGTGGGCATTCGCTCCCTCCTCACCCAGCTGTCAGGGCGCCGCGAAGCCGGTGCGAACCTGCGGAGGACGTTTTCAACGTGCCAGAGGGAGCGCAAACTCCATGGAGATTCCTAGCGCAGAAGGAATTCCTGCGGTCGGGAATTTCTTGAAAAAGATTCTTCGCAGGGGCCCTGAGCCGATAATGCTGAAATTAACATCTTTGGATATACAATTCTCTGCTTCTGAAGAATGAAAAGATAAATAACAGAGCTAAGAAAGGGACTGATGAAACAACAGCAGGTCTCAAATTTTTGGTCTCAGGACCCCTTTATGCTCTTAAAAATGATTGACAGCCTCCAAGAGCTTTTGTTCATGCTTTGGTAAGGCTGTGAGAGCACAGAGCTGAATTAGGGATCTTGGACTTCAAGTTACTGACTAGCCCCAGCACTCGCCAAGCTCACAAAGAAGACAGAAACGAGGTAAACATCCAACCATGTTTATGGAAGAGTTCATCTCTCTGTCAGCATTACGT\n>URS000094A37D SRP_RNA from 2 species \nGCCAGGCGTGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCAGAGGCAGGTGGATCACCTGAGGTCAGGAGTTCGAGACCAGCCTGACCAACATGGAGAAACCCTGTCTCTA\n>URS00004E1280 rRNA from 1 species \nTCATGCGTCGCATTAGCTAGTTGGCGGGGTAACGGCCCACCAAGGCGACGATGCGTAGGGGTTCTGAGAGGAAGGTCCCCCACACTGGTACTGAGACACGGACCAGACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGCCGCAGGGCTGAACCAGCCAAGTCGCGTGAGGGATGACGGTCCTATGGATTGTAAACCTCTTTTGTCAGGGAGCAAAGGGCGCCACGTGTGGCGCTTTGCGAGTACCTGAAGAAAAAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATGCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGCAGGCGGAATGTCAAGTCAGCGGTAAAATTTCGGGGCTCAACCCCGTCGTGCCGTTGAAACTGGCGTTCTTGAGTGAGCGAGAAGTATGCGGAATGCGTGGTGTAGCGGTGAAATGCATAGATATCACGCAGAACTCCGATTGCGAAGGCAGCATACCGGCGCTCAACTGACGCTCATGCACGAAAGCGTGGGTATCGAACAGGATTAGATACCCTGGTAGTCCACGCAGTAAACGATGAATACTAACTGTCCGGGCAGAATGATGCCTGG\n>URS0000355545 rRNA from 1 species 
\nTTCCGGTTGATCCAGCCGGAAGCTACTGCTATCGGGATTCGATTAAGCCATGCGAGTCGAGAGGGTTCGGCCCTCGGCTGACGGCTCAGTAACACGTGGATAACCTGCCCTCAGGTAGGGGATAATCTCGGGAAACTGAGGACAATACCCTATAGACATCCTTTGCTGGAATGCTTGGATGTTCAAAGGCAACGCCTGAGGATGGGTCTGCGGCCTATCAGGTTGTAGTGGGTGTAACGGACCCACTAGCCTACGACGGGTACGGGCCTTGAAAGAGGTAGCCCGGAGATGGACTCTGAGACACGAGTCCAGGCCCTACGGGGCGCAGCAGGCGCGAAAACTTCGCAATGCGGGAAACCGTGACGAGGGAATCCCGAGTGCTCATACAATGTATGGGCTTTTATGATGTGTAAAAAGCATTAGGAATAAGGGCTGGGTAAGACCGGTGCCAGCCGCCGCGGTAATACCGGCAGCTCTAGTGGTAGCCACTTTTATTGGGCCTAAAGCGTTCGTAGCCGGTCAGGTAAATCCTTGGGTAAATCGTACAGCTTAACTGTGCGGATTCCGAGGAGACTGCTTGACTAGGGACCGGGAGAGGTTGGAGGTACTCCTGGGGTAGGGGTGAAATCCTGTAATCCTAGGTGGACCACCGGTGGCGAAGGCGTCCAACCAGAACGGCTCCGACGGTGAGGGACGAAGGCTAGGGGCGCAAACCGGATTAGATACCCGGGTAGTCCTAGCTGTAAACGCTGCAGACTTGGTGTTGGAGATCCTACGAGGGTGTCCAGTGCCGAGAGAAGTTGTTAAGTTTGCCGCCTGGGAAGTATGGCCGCAAGGCTGAAACTTAAAGGAATTGGCGGGGGAGCACGCAACGGGAGGAGCGTGCGTTTAATTGGAATCACGCCGAAATCTC\n>URS0000A75A1F rRNA from 1 species \nTACGGAGGGAGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGTTATTCAAGTCAGAGGTGAAAGCCCGGGGCTCAACCCCGGAACTGCCTTTGAAACTAGATGACTAGAATCTTGGAGAGGTCAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGACTGACTGGACAAGTATTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGATAACTAGCTGTCCGGGTACTTGGTACTTGGGTGGCGCAGCTAACGCATTAAGTTATCCGCCTGGGGAGTACGGTCGCAAGATTAAA\n>URS00009F80D5 rRNA from 1 species \nGACGAACCGAGCGAACGTTGTTCGGAATCACTGGGCTTAAAGGGCGCGTAGGCGGGCTGTCAAGTCTGGGGTGAAATCCCACGGCTCAACCGTGGAACTGCCTCAGATACTGACGGCCTCGAGGGAGGTAGGGGCGAGCGGAACGGGTGGTGGAGCGGTGAAATGCGTTGATATCACTCGGAACTCCGGTGGCGAAGGCGGCTCGCTGGACCTTTTCTGACGCTGAGGCGCGAAAGCTAGGGGAGCAAACGGG\n>URS00007B79EE rRNA from 1 species \nAAAACGACTCTCGGCAACGGATATCTCGGYTCTCGCATCGATGAAGAACGTAGCGAAATGCGATACTTGGTGTGAATTGCAGAATCCCGTGAACCATCGAGTCTTTGAACGCAAGTTGCGCCCTAAGCCTTCTGGCCGAGGGCACGTCTGCCTGGGTGTCACAAA\n>URS000123EF67 rRNA from 1 species 
\nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGAAGTGGCGAACGGGTGAGTAACGCGTAATCAACCTGCCCTTCAGAGGGGGAAAACAGTTGAAAACGACTGCTAATACCGCATACTGAAGGAGGGGATTGCGTCGGATTAGCTAGTTGGAGGGGTAACGGCCCACCAAGGTGATGATCAGTAGCCGGTCTGGAGGGATGGACGGCCACAATGGGACTGGGACCCGGCCCAGACTCCTTCGGGAGGGAGCAGTGGGGAATCTTCCGCAAAGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGACGGCCTTCGGGTTGGAAAGCTCTGTTAATCGGGACGCGGTACCGGAATAGAAAGCCACGGCTAACTACGTGCCAGCCGCCGCGGTAATTC\n>URS0000638341 rRNA from 1 species \nGTCTACGGCCATACCACCCTGAACATGCCCCATCTCGTCTGATCTCGGAAGCTAAGCAGGGTCGGGCCTGGTTAGTACTTGGATGGGAGAAATGTTAACTAAAAATA\n>URS000020D105 rRNA from 1 species \nAATACGAAGGGTGCAAGCGTTACTCGGAATTACTGGGCGTAAAGCGTGCGTAGGCGGTTCGTTAAGTCTGTCGTGAAAGCCCTGGGCTCAACCTGGGAATTGCGATGGATACTGGCGAGCTAGAGTACGGTAGAGGATGGTGGAATTCCCGGTGTAGCGGTGAAATGCGTAGAGATCGGGAGGAACACCCGTGGCGAAGGCGGCCATCTGGACCAGTACTGACGCTGAGGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGCGAACTGGATGTTGGGCACACTTAGGTGCTCAGTGTCGAAGCTAACGCGTTAAGTTCGCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGTATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGCCTTGACATGTCCGGAATCCTGCAGAGATGCGGGAGTGCCTTCGGGAATCGGAACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCCTTAGTTGCCAGCACGTAATGGTGGGAACTCTAAGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGGCCAGGGCTACACACGTACTACAATGGTCGGTACAGAGGGTTGCAATGCCGCGAGGCGGAGCCAATCCCAGAAAGCCGATCTCAGTCCGGATCGGAGTCTGCGACTCGACTCCGTGAAGTCGGAATCGCTAGTAATCGCGAATCAGCATTGTCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTTGGGTTGC\n>URS0002194E4A rRNA from 1 species 
\nAGAGTTTGATCATGGCTCAGATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACGGTAACAGGAAGAAGCTTGCTTCTTTGCTGACGAGTGGCGGACGGGTGAGTAATGTCTGGGAAACTGCCTGATGGAGGGGGATAACTACTGGAAACGGTAGCTAATACCGCATAACGTCGCAAGACCAAAGAGGGGGACCTTCGGGCCTCTTGCCATCGGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAACGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGGGGAGGAAGGGAGTAAAGTTAATACCTTTGCTCATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATCTGATACTGGCAAGCTTGAGTCTCGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACGAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCGACTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAGTCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTATTGACATCCACGGAAGTTTTCAGAGATGAGAATGTGCCTTCGGGAACCGTGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGGTCCGGCCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGCGCATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGACCTCATAAAGTGCGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTGGATCAGAATGCCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTAGCTTAACCTTCGGGAGGGCGCTTACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACCGTAGGGGAACCTGCGGTTGGATCACCT\n>URS0001BA8378 rRNA from 1 species 
\nATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCACGGAAGGCAGCAGGCGCGCAAATTACCCAATCCCGACACGGGGAGGTAGTGACAATAAATAACAATATAGGGCCCTTTTGGGTCCTATAATTGGAATGAGTACAATTTAAATCCGTTAACGAGGAACAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAACTTCAGACCTGACCGGGCGGTCCGCCTAACGGTGTGTACTGTCTGGCCGGGCCTTACCTCTTGGTGAGCCGGCATGCCCTTCACTGGGTGTGTCGGGGAACCAGGACCTTTACCTTGAGAAAATTAGAGTGTTCAAAGCAGGCTTACGCCGGAATACATTAGCATGGAATAATAAAATAGGACGTGCGGTTCTATTTTGTTGGTTTCTAGAGTCGCTGTAATGATTAATAGGGATAGTTGGGGGCATTTGTATTGCGTTGCTAGAGGTGAAATTCTTGGATTTACGCAAGACAAACTATTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAGGTTAGGGGATCGAAAACGATCAGATACCGTTGTAGTCTTAACAGTAAACTATGCCGACTAGGGATCGGACGACCTCAATATTATGCGTCGTTCGGCACCTTACGAGAAATCAAAGTCTTTGGGTTCTGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACAGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACCCAACACGGGGAAACTCACCAGGTCCAGACATAACTAGGATTGACAGATTGATAGCTCTTTCTTGATTTTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGGTTAATTCCGATAACGAACGAGACCTTAACCTGCTAAATAGCCTGGCCGGCTTTTGCTGGTCACCGGCTTCTTAGAGGGACTGTCAGCGTCTAGCTGACGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGACAGAGCCAGCGAGTTTTTTTTCCTTGGCCGGAAGGTCATGGGTAATCTTGTGAAACTCTGTCGTGCTGGGGATAGAGCATTGCAATTATTACTCTTCAACGAGGAATTCCTAGTAAGCGTGAGTCATCAGCTCGCGTTGATTACGTCCCTGCCCTTTGTACACACCGCCCATCGCTACTACCGATTGAATGGCTTAGTGAGACCTCCGGATTGGCTTTGGGGAGTCGGCAACGACACCCCGTTGCTGAAAAGTTGGTCAAACTTGGTCATTTAGAGGAAGTAAAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAG\n>URS0000DCA084 rRNA from 2 species \nTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGCGGGATGACGGCCTTCGGGTTGTAAACCGCTTTTGACTGGGAGCAAGCCCTTCGGGGTGAGTGTACCTTTCGAATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTATCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTTCGTCGCGTCCGGTGTGAAAGTCCATCGCTTAACGGTGGATCCGCGCCGGGTACGGGCGGGCTTGAGTGCGGTAGGGGAGACTGGAATTCCCGGTGTAACGGTGGAATGTGTAGATATCGGGAAGAACACCAATGGCGAAGGCAGGTCTCTGGGCCGTCACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACA\n>URS0001D81814 misc_RNA from 1 species 
\nACAAACTTGGTCATTTAGAGGAAGTAAAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTACAAAGCATGGCGAACCTCGTGTTTCGCGAGGTTTTTGCGTCCATTTTTCGTATTTAAAACATCCACTCTTTTAAAAATTTATCTAATGATAAAATAAAAAAGATCACTTTCAACAACGGATCTCTTGGCTCTCAGAGACAGACAAACTTGGTCATTTAGAGGAAGTAAAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTACAAAGCATGGCGAACCTCGTGTTTCGCGAGGTTTTTGCGTCCATTTTTCGTATTTAAAACATCCACTCTTTTAAAAATTTATCTAATGATAAAATAAAAAAGATCACTTTCAACAACGGATCTCTTGGCTCTCGCATCGATGAAGAACGCAGC\n>URS00022FF30A rRNA from 1 species \nTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAGCGATGAAGGCCTTCGGGTTGTAAAAATCTTTTGTATGGGAAGAAAATGACAGTACCATACGAATAAGGACCGGCTAATTACGTGCCAGCAGCCGCGGTAATACGTAAGGTCCGAGCGTTATCCGGATTCATTGGGCGTAAAGCGCGCGCAGGCGGCTCTTCAAGCGGAACCTCTAACCCCGGGGCTCAACCTCGGGCCGGGTTCCGAACTGGAGGGCTCGAGTGCGGTAGAGGCAGGCGGAATTCCCGGTGTAGCGGTGGAATGCGCAGATATCGGGAAGAAAACCGATGGCGAAGGCAGCCTGCTGGGCCGGCACTGACGCTGAGGCGCGAAAGCTAGGGGAGCGAACAGG\n>URS00012276C6 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAACGCAGTGGGGATGGGTGAGTAACCCGTGGGTAACCTCCCCTCAGACGGGATAACACTTGGAAACAGGTGCTAAACCGATATTGATTGATGGACTCGCGGTGCATTAGCTAGTTGGTGAGGTAACGGCGCACCAAGGCCACGATGCATAGACGACCTGAGAGGGTGAGAGGCCACACGGGGACTGAGACACGGCCCAGAAGCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGAAAGTCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAACTCTGTTGGTAGAGAAGCGGTATCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATAC\n>URS00022361F8 tRNA from 1 species \nCGGGGCTGTGGTAGCCGGCCATCCCGGCACCGATGCCGACGGTGGGCAGTCCGGCGGCGGCGTAACGGCGGTTGTCCGAGGCGACCGGCCCCGCC\n>URS0000016AA7 rRNA from 1 species \nGGGTCTCGAGCTGATCGGGCTCCGGCCCGATCCTCCCACCCTTTGTGTACCTACCTCTGTTGCTTTGGCGGGCCGCGGTCCTCCGCGGCCGCCCCCCTCCCCGGGGGGTGGCCAGCGCCCGCCAGAGGACCATCAAACTCCAGTCAGTAAACGATGCAGTCTGAAAAACATTTAATAAACTA\n>URS00023DAE2E lncRNA from 1 species 
\nGTCTATGTCAAAAGTTTGCATATAGATAAACTTGTTTCTTGGTCCATAGTTGTTTAAAGGTTACTGATTCTATCATGCTGAAGAACATAAGATGCTCATCAACAGTAGGGCATTCCTTTTGGAAAGAAGTTTCTTAGAGAAGGAACTGATACCTATCAAGTTGAACTTGAAAGTTTGACTTGTAAAAAATGAACTGACATAATCTAGTAAACCTACAGAATCGGATTTGATTAGATCAAACTCGGAGCCCATTAAAGTAACACCTTTAAGG\n>URS0001703742 rRNA from 1 species \nTACGTAGGGGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCATACAGGTCAGCTGTGAAAACTCGAGGCTCAACCTCGAGACGTCGGTTGAAACCGTATGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAAGAACACCCGTGGCGAAGGCGGCTCTCTGGGCGGTACTGACGGCTGAGACGCGAAAGCGTGGGGAGCGAACAGG\n>URS0000241E50 rRNA from 2 species \nTTAGAGTTTGATCCTGGCTCAGGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATGACGGCCTTCGGGTTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTGATACGTAGGGTGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGGGCTCGTAGGTGGTTGATCGCGTCGGAAGTGTAATCTTGGGGCTTAACCCTGAGCGTGCTTTCGATACGGGTTGACTTGAGGAAGGTAGGGGAGAATGGAATTCCTGGTGGAGCGGTGGAATGCGCAGATATCAGGAGGAACACCAGTGGCGAAGGCGGTTCTCTGGGCCTTTCCTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGCTTAGATACCCTGGTAGTCCACGCTGTAAACGGTGGGTACTAGGTGTGGGGTCCATTCCACGGGTTCCGTGCCGTAGCTAACGCTTTAAGTACCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGCCCCGCACAAGCGGCGGAGCATGCGGATTAATTCGATGCAACGCGTAGAACCTTACCTGGGTTTGACATGGATCGGGAGTGCTCAGAGATGGGTGTGCCTCTTTTGGGGTCGGTTCACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTCACTGTTGCCAGCACGTTATGGTGGGGACTCAGTGGAGACCGCCGGGGTCAACTCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGTCCAGGGCTTCACGCATGCTACAATGGCTGGTACAGAGAGTGGCGAGCCTGTGAGGGTGAGCGAATCTCGGAAAGCCGGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCTCATGAAGTCGGAGTCGCTAGTAATCGCAGATCAGCAACGCTGCGGTGAATACGTTCCCGGGGCTTGTACACACCGCCCGTCAAGTCATGAAA
GTTGGTAACACCCGAAGCCGGTGGCCTAACCGTTGTGGGGGAGCCGTCGAAGGTGGGACTGGTGATTAGGACTAAGTCGTAACAAGGTAGCCGT\n>URS00009FA0E6 rRNA from 1 species \nGTCCACGCCATAAACGATGAGGACTAGACGTTGGAGGCTTTAGGCTTTCAGTGTCGTAGCTAACGCGCTAAGTCCTCCGCCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCATGGAATCCCGCAGAGATGTGGGAGTGCCGTAAGGAACCATGAGACAGGTGCTGCATGGCTGTCGT\n>URS00023F6A50 lncRNA from 1 species \nCTTATCCTAAATAAAGAAAAATTTGATGTCGACGTCATGCCCGACACAATATTTACAGACTCAATATTATTGGCAAAATTAGGACTGTTGACAACCAAAAAGAATCTTAACAAAGTGGTAAAGGGTTTGGTGGATGATTCTTGAGCTCCCAAGGTCGAATGCTAGTTGATTCATATTTTCAACTAAGTTTATTTTTTTAAAAAAATAAATGAAAGAGATAGAATGCTATCATTCTCTCTACAAAAAAAGAAAAGAAAAGAAAATTTA\n>URS0000783EF6 rRNA from 1 species \nTACGTAGGTGGCAAGCGTTATCCGGATTTATTGGGCGTAAAGGGAACGCAGGCGGTCCTTTAAGTCTGATGTGAAAGCCTTCGGCTTAACCGGAGTAGTGCATTGGAAACTGGGAGACTTGAGTGCAGAAGAGGAGAGTGGAACTCCATGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCGGTGGCGAAGGCGGCCTGCTGGACTGCAACTGACGTTGAGGCCCGAAAGCGTGGGGAGCAAACAGG\n>URS0000768CC5 rRNA from 1 species \nGCATATCAATAAGCGGAGGAAAAGAAACCAACCGGGATTGCCTTAGTAACGGCGAGTGAAGCGGCAAAAGCTCAAATTTGAAATCTGGCGTCTTCGACGTCCGAGTTGTAATTTGAAGAAGGCGACTTTGTAGCTGGTCCTTGTCTATGTTCCTTGGAACAGGACGTCATAGAGGGTGAGAATCCCGTGTGGCGAGGATCCCAGTTATTTGTAAAGTGCTTTCGACGAGTCGAGTTGTTTGGGAATGCAGCTCTAAGTGGGTGGTAAATTCCATCTAAAGCTAAATATTGGCGAGAGACCGACAGCGAACAAGTACAGTGATGGAAAGATGAAAAGAACTTTGAAAAGAGAGTGAAAAAGTACGTGAAATTGTTGAAAGGGAAGGGCATTTGATCAGACATGGCGTTTGCTTCGGCTTTCGCTGGGCCAGCATCAGTTTTAGCGGTTGGATAAATCCTCGGGAATGTGGCTCTGCTTCGGTAGAGTGTTATAGCCCGTGGGAATACAGCCAGCTGGGACTGAGGATTGCGACTTTTGTCAAGGATGCTGGCGTAATGGTTAAATGCCGCCCGTCTTGAAACACGGACC\n>URS0000555B9E rRNA from 1 species 
\nAGAACGAACGCTGGCGGCATGCCTAATACATGCAAGTCGAACGAACTCTTCGGAGTTAGTGGCGCACGGGTGCGTAACGCGTGGGAATCTGCCCCTTGGTTCGGAATAACAGTTGGAAACGACTGCTAATACCGGATGATGACGAAAGTCCAAAGATTTATCGCCAAGGGATGAGCCCGCGCAGGATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCAACGATCCTTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATATTGGACAATGGGCGAGAGCCTGATCCAGCAATGCCGCGTGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTACCCGAGATGATAATGACAGTATCGGAGAATAAGCCCGCTAACTCCGTGCTAGCAGCCGC\n>URS000075F11E ncRNA from 2 species \nGTGAGTGCTGGGTAGAATGGGAAATGAGGGATGGAAGCTGCAACCGAGGGGCTATAGGCTCAAGCTGGGCTTGTGATGCTCTCTGTAGAGCATCCTCCTCTCGGCCCCTGTCACTTTCTACTCTACCTTCTACTCAG\n>URS0002564330 rRNA from 1 species \nATGGCTGTCAGCACTGGTAGCTTCTTGGCCATTGCCATGGCCCTCGCTCTCCTTAGTGGCGACATGGCCCACGCCGGCCGCCTCCTGGCCGACACCACGGAGGCAGCAGCGCCCGCTGCAACGCCTGCCGCTGTCCCAGGCATCCCCGCGCCGAAGCCGCCCGTGCCCACCATGCCTACAATGCCACCCGTGCCCGCGCTCGCCGTTCCCCAGTTCACGGTACCCCCCATGACGGCCGTGCCCGCGATCACCGTGTCCCAGGTCACGTTGCCGCCCATGCCGGCCGTCCCTGCGGTCACCGTGCCCAAGGTCACGTTGCCGCCCATGCCCGCAGTTGTTGTGCCGAAGGTGACGATGCCGCCAATGCCTGCAATTCCATCCATCTCCATACCCAAGGTGGCATTGCCTCCGATGCCTTCCATTCCCACTGTGAACGTGCCGATGCCAACCCTTGCGCCACCTCCTTCAGCATAG\n>URS0000DAC67E ncRNA from 1 species \nACACGCGATGCGGGAGAGCTCGGTTCGCCGAGCACCGAAGGAGCAAGCCTCCCCGCCAATCTCTCAGGTTCTGTACCGCATCGAACTG\n>URS00004A01BA rRNA from 2 species 
\nACTGCTCAGTAACACGTGGACAACCTACCCTTGGGTCTGGCATAATCCTGGGAAACTGGGTATAATTCCGGATAGGTCACAGATGCTGGAATGCACTGTGGCCGAAAGCTCCGGCGCCCAAGGATGGGTCTGCGGCCTATCAGGGTTGTAGTGGGTGTAACGGACCTACTAGCCTACGACGGGTACGGGTTGTGAGAGCAAGAGCCCGGAGATGGATTCTGAGACACGAATCCAGGCCCTACGGGGTGCAGCAGGCGCGAAAACTTTACAATGCGGGAAACCGTGATAAGGGAATCTCGAGTGCCAGCATATAATGTTGGCTGTCCAGATGCCTAAAAAGCATCTGTTAGCAAGGGCCGGGCAAGACCGGTGCCAGCCGCCGCGGTAACACCGGCGGCCCGAGTGGTAACCGCTTTTATTGGGTCTAAAGGGTCTGTAGCCGGCCAAGTAAGTCCCTTGGGAAATCTGGCAGCTTAACTGTCAGGCTGCTAGGGGATACTGCTAGGCTTGGGACCGGGAGAGGTGAGAGGTACCTTGGGGGTAGGGGTGAAATCTTGTGATCCTCGGGGGACCACCAGTGGCGAAGGCGTCTCACCAGAACGGGTCCGACGGTAAGGGACGAAAGCTAGGGGCACGAACCGGATTAGATACCCGGGTAGTCCTAGCCGTAAACGATGCTCGCTAGGTGTCAGTCACGGTGCGACCGTGATTGGTGCCGTAGGGAAGCCGTGAAGCGAGCCACCTGGGAAGTATGGCCGCAAGGCTGAAACTTAAAGGAATTGGCGGGGGAGCAC\n>URS00021D2EAF rRNA from 1 species \nGCGATAGTACCAGCACTAATGCACCGGATCCCATTAGAACTCCGCAGTTAAGCGTGCTTGGGCGAGAGTAGTACTTGGATGTGTGACCCCCTGGGAAGTCCTCATGTTGCACCCC\n>URS0000A1EE98 rRNA from 1 species \nCGGAGGATCCAAGCGTTATCCGGAATCATTGGGTTTAAAGGGTCCGTAGGCGGTTTAGTAAGTCAGTGGTGAAAGCCCATCGCTCAACGGTGGAACGGCCATTGATACTGCTGAACTTGAATTATTAGGAAGTAACTAGAATATGTAGTGTAGCGGTGAAATGCTTAGAGATTACATGGAATACCAATTGCGAAGGCAGGTTACTACTAATGGATTGACGCTGATGGACGAAAGCGTGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGGATACTAGCTGTTGGGAGCAATCTCAGTGGCTAAGCGAAAGTGATAAGTATCCCACCTGGGGAGTACGTTCGCAAGAATG\n>URS00008B5885 lncRNA from 1 species \nGCAGTTGAGCAAGATCACGCAAAAACCTCTGCCAAGACAGAACGTGCATCAGCTCAGCAGGAAAACAGTTCAACGTGTATAGGGTCGGCCATCAAATCAGAGAGTGGGAACTCAGCTCGGAGCTCTGGCATCTCCAGTCAGAATAGCTCTACAAGTGATGGAGATCGATCTGTTTCCAGCCAAAGCAGCAGCAGCGTTTCCTCTCAGCTGAATAAACCACATCAAAGGAAAGGGACCACAGTATTTGAATGTTTGAAAGTCTGTAAAGCTTAAGGTTTTAAAAATGTTGCCCGTAATGTTGAACGTGTCTGTTAAAAAATAAAAGAAAAAATAGTTGCTTCAAACTA\n>URS0000F1E2A3 rRNA from 1 species 
\nTACGTAGGGTGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTCTGTCACGTCGACTGTGAAAACCTGGGGCTCAACCCCGGGCCTGCAGCCGATACGGGCAGACTAGAATTCGGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGATATTGACGCTGAGGAGCGAAAGCGTGGGGAGCAAACAGG\n>URS0000D90CA0 rRNA from 1 species \nAACTTTTAATAATAGATCTTTTAGTTTTAATATTAATAAAGAATATAGTAAAATATAATAAGTAATATAAATTATAGAATTTAATAAATTATTAAATCTTTAAACGTATATTACGCTTATTAGTATTTTAATAAGTATACCTATTTAAGCGTTA\n>URS00023A597C lncRNA from 1 species \nTTGTTTTTTTTATTTTCTTTTTAATTTCAGAATTTATATTTAATTGCTTTATTTTGTTTAATTCATAATAATTTCATTTTTAATCCAAAAAATATGGGACTTTCACCAAAAATATTTTTGGATTTTTCTCTTTTATATTCTGAATTAAAATTATTTTTCGGATTAATTTTGATATTTTTCATGAATTAAATATTTTTGTGTATGTTTTTAATTGATTAAAAATACTTCTGATTTTTCAAAAGTGATGATTTTTT\n>URS0000BE2407 tRNA from 1 species \nGCCTTCGTGGTGTAGTGGTCAGAACGTATTCGAGAGGTCCGTGGTTCGAGTCCCGGTGAGGGCA\n>URS0000E01B97 lncRNA from 1 species \nAAAAAGTTTCAGAGAAGTTCAAATTGTGAAAATTAAGGTACTGAGAAATGTTGCCAGAGGTTATGAACTGCATTTTTTTTTTTTTTTAGCGTGTTTGGAGTAAGGATTGGAATGACTGTCTTTTTCCTTGTAGCTGATGAAACTGAATGGTTTGAATGGTGTCCAGGTAACAACAGACAGATGCTGACTCCAGAATGAATGACTGCAGTGATGGAATACTCAAGCAAAGACTGCCAAGCCTCCACACGGGAGTCCGTGCCTGAACGCGAAATAAAGAGGGATCCATGGAATGATTGTCCCACGATGGTAACTTCGTGATCATCTTTACAAAATACGAACATAGGCCCATGGAGAGAGGAAATCAAAC\n>URS0000762E71 miRNA from 1 species \nCGTTTGTGCGTGAATCTAACA\n>URS0001E5F21C rRNA from 1 species \nAACGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGAGATCCTTCGGGGTCTAGTGGCGCACGGGTGCGTAACACGTGGGAATCTGCCCTTAGGTTCGGAATAACAGTTAGAAATGACTGCTAATACCGGATGATGACGTTAAGTCCAAAGATTTATCGCCTGAGGATGAGCCCGCGTAGGATTAGCTAGTTGGTGTGGTAAAGGCGCACCAAGGCGACGATCCTTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTTACCCGGGATGATAATGACAGTACCGGGAGAATAAGCCCCGGCTAACTCCGTG\n>URS0001C02308 rRNA from 1 species 
\nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGTGAAGCGAGTGCTTGCACTCGTGGATCAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCATCACTCTGGGATAAGCACTGGAAACGGTGTCTAATACTGGATACGACCAACCCTTGCATGGGGTGTTGGTGGAAAGATTTATCGGTGATGGATGGACTCGCGGCCTATCAGCTTGTTGGCGGGGTAATGGCCCACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGTGAAAGCCTGATGCAGCGACGCCGCGTGAGGGATGACGGCCTTCGGGTTGTAAACCTCTTTCAGCAGGGAAGAAGCGAAAGTGACGGTACCTGCAGAAGAAGCACCGGCTAACTACGTG\n>URS0001E5A028 rRNA from 1 species \nAGTGAACGCTGGCGGTAGGCCTAACACATGCAAGTCGAACGGCAGCACAGTAAGAGCTTGCTCTTACGGGTGGCGAGTGGCGGACGGGTGAGGAATACATCGGAATCTACTTTTTCGTGGGGGATAACATAGGGAAACTTACGCTAATACCGCATACGACCTATGGGTGAAAGCAGGGGATCTTCGGACCTTGCGCGATTGAATGAGCCGATGTCGGATTAGCTAGTTGGCGGGGTAAAGGCCCACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATACCGCGTGGGTGAAGAAGGCCTTCGGGTTGTAAAGCCCTTTTGTTGGGAAAGAAAAGCAGCAGGTTAATACCCCGCTGTTCTGACGGTACCCAAAGAATAAGCACCGGCTAACTTCGTG\n>URS00012AECC2 rRNA from 1 species \nAGCGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACGAAGTCTTCGGACTTAGTGGCGGACGGGTGAGTAACACGTGGGAACGTGCCTTTAGGTTCGGAATAACTCAGGGAAACTTGTGCTAATACCGAATGTGCCCTTCGGGGGAAAGATTTATCGCCTTTAGAGCGGCCCGCGTCTGATTAGCTAATTGGTGAGGTAAAGGCTCACCAAGGCGACGATCAGTAGCTGGTCTGAGAGGATGATCAGCCACATTGGGCACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCCATGCCGCGTGAATGATGAAGGTCTTAGGATTGTAAAATTCTTTCACCGGGGACGATAATGACGGTACCCGGAGAAGAAGCCCCGGCTAACTTCGTGCCAGCCGCCGCGGTAAGAC\n>URS00015A0908 rRNA from 1 species \nTACGTAGGGTGCAAGCGTTGTCCGGAATTATTGGGCGAAAGAGCTCGTAGGCGGTTTGTCGCGTCGAATGTGAAAACCCGGGGGCTCAACCCCGGGCCTGCATTCGATACGGGCAGACTAGAGTTCGGTAGGGGAGTCTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGACTCTGGGCCGATACTGACTGAGGAGCGAAAGCGTGGGGGAGCAAACAGGG\n>URS0002375287 lncRNA from 1 species 
\nGCGCAAAACCAAAATTGAGTGGGTCAGTAAAACAATTCTTTTCCAAATCCAAACATTTCTCAAAACGTTGTAACCCCTCTCCGTAAAACCTGTATACTTTCCCAGAAATATAAAATATAAATATACATATATATATTCTCAATACTTCAATTCATTAACTCAACATTTTCATCATAATTATGCCATGCCACATCATCTCAACATTTCTCATATTAATTATGCCATGCCACATCATCTCAACAGTAATAAGGTATGAATGCATCAACATAAATCATATCAGGTGCAATAAAGTAATCAACCGGAGGCCCTCTAATAGCCCTGTACGGTTGAACCTAGAGCTCAAAATCTATCACTCTCACACTCTGCCGGAGTCACTCCGCGTGACCTGTACGGCCTTCTGCACATAAGTTACGCTCTAGTGCTTCTCATAAATCATCTGTGCACATAATCTAAGGTTACCCACCAGTCGGAATCTCACTAACACTCTCGCGACTGGCCTGTCGTACCCACTCCGCGTGGACTGTACGACTAGCATCTACTTGGATCCAAGGCGAGCGTGCGATGCGGTGAATACTATAAGCACTAAACTATGGTGCAGGATTTGAGCTCAATATACATCAACATCATCATAACAGAAATAACTACTCACCTGTGCGTCCATCGCACCATTTCATACATATGCATCATATCAATTCTTACCTGTGCGTCCACCGCACCAATTCATACATATGCATCATAAATCAATTCTTACATGTGCGTCCACCGCACCAATTCATACATATGCATCATATATTAATTCATGCATGGCATTTCAACTCACATTTCTATATACTTTTCATATCAATTCTATGCATGGTATTTCACTTCCCGTTTTTCCACATAACTCATATGCATTTCATTTTAAACATATTTTCATTTCAATTCAATTTCTGGGAAACGTCAAGTATATATATATACGGAAAACAAAACTGCCCACTCACCTGGAGTTCATCCAACAACTCCCTAGCACCACACATCAAGGCGTCACGACGATCGCCGCCTAGAATAGTAATCAAATCCAACCTCAGAATTCATATCGATAGAATATATAACTTATATAAAATACGTCCCTACGTAGATC\n>URS0002362E6B lncRNA from 1 species \nAGTCAGGTCCAACCATTAAATGATAGGGTTAAGTCTAATCAACTAATAGATGACCAAGCCCGAGTGTAGCTCGACTCACCTGACCGCCTATTGAAGGTACACTTAACTCATCATATATTGAATGACAATTCCAATGCTTGATAAGTACCAGGCGTGTAGCACCTCCAATAATTATCAAAACATTGGACCCATTATCACCCAACTTAATGGAAGGCTATGATCTAGTTATCTCCATAACCATTCATTTTAAGAACCTAATAATTTTAGAGGATTTCATAATTAGGATAGATGAGAAGATCCGGTTAGTC\n>URS000199E9B9 lncRNA from 1 species 
\nGGTGTCATGGGAAAGGAAGTGGTGTAATGCAATATATTCACCATCTCCTGACAGTACCACAATGAGATACCTTTTTCTGTAGGTGGTTCAGATGTATGTCAGTAGATAGTGCCGATAAATGCTCTTCCAGCCTGATCCTGCTCGACCTGATGTGCAAATAGATGCAAAAGATATCCAAGCCCATGGAGTGAAACAGTGGTGCTTGCTGCTCGACATGAAAGATGTATCTTCTGTGGGAGCTCATTTCTTTTGTTACAGCAGAAAATAAAAAGATTTTCATAAAAGTGAAGATAAAACACTTGATAATATGTCTGTGAACATAGTTCCATTTTACCTCAGCTGTGGCATGAAAGACCATGAAATATCTTCAACTGGCTCTTCATTAAATCACACTATCTTTAAACATATTTCAAGGAAAGTAAGGAGTTTCAGATATTAAAAAACATATACAAATATTTCATAGGTACTGTATGTGAAGGTTCACTCAATCATCCAAGGCCAAATTACTTGAAGAACTGTTAAATTATTATGATTTTAAAAATAATTACTGTAATACTTTGGGGAATACATTTGTCATAACAAATACAGAACATATTTTCTAATTTCTATTATGGCTGTCAAGGTCATTCGGTGACAGAATGCAAAATCTTATTTTTCTCATTCAGATATTGTTAGATGCATAAATTCTTTAGCTAATGTAGAAAAGCATTTAAAAATTTAAATTAATTAATGAAGAAATTGTCTTTGCCTGATATCACACAACCATTTTTTTATCTTGTGAACAGAATTTAACAATACACAGGCTCAGGCTGGCTTTATTCCACTAATACATGCCATTTCCAAAAGTGTGTTGCCTATGTATTAAACACCATGCACACACAAGTATTTTAGCATTCCTTGAAAATGATTTTTAAATCCACATTTATTGTAAGTGCTTTGGAGGCAAGAACCATCTTTTGTTATTGAACAATGCAAATGGGATCTTGGTCCATAATTGGGGCTTCTAAGCACCGTGAATTCTTTCACTAATGTTTCTCATTCTCTTTTTCCCTCTCTTTGTCCCTCCGCAGATTTGCTAGTGTTTAAAAAAGTTAGGATCCCTTGCATCCTCACCAGTCTTTACATTTGCCCAAGAATCAGATTCAGTTTAGCCCAGCATTCTTCACAAAGATAAAAGGGTGACAGATCCTGACACACTTGTAATTTTCAAAACCAGAGAAGCTGATTCCTAAAACAGCATCCAAACTGAAACTGTACCAGTGTTGGTA\n>URS00023F5E43 lncRNA from 1 species 
\nTTTTTTTTTTTGGTAGGTCACGGGGAGAAAAGCTCTCCCCACAATTTATTAAGAAACTAAAAAACAAAAATCAAATTCGGATATGCTTTGGAAACGCAGTTTCTCAGTCATCATCCTCTACAAATGACGCCACAAAGGGTGGAGCAACATCTAACAAATGAAACCATAAAGGGAAAGAAAATGCATAGTTCGCTAACCCGTCCGCAAGACGGTTAGCTTCTCTATAAACATGAGTAACATGGACTAACCAGTCTCTTGATAAGAAGCCATGGCACAATCGCACCAGGAACGATAAAGGATGAGTATCACTAATCCCCCTCGTTAAAAAACCCACCACCAACTCTGAATCAACCTCCAACTCCACTCGCCTAAACCGCCTCTCCCAAGCAATATAAAGCCCGTAACAGACACCAATATTCAAGGCGAACCCACCGCACCAACGACCTTGACCATCACGCACAACTCCTCCTACTGTAGCCAATCCCGGATTTCCCCGTGAAGCGCCATCAGTGTTAAGCTTCATCCAATCTTCTTTCGGTCATTTCCAGGCCACCATTCTCTCCATTTGAGTATTCGATCTGCCCGTATAGCGATTCAGTTTGTGAGCTTGACTTACTTGAGAAGCGAAGTCCTTAACAAACTGAACTCTATCTCTACATTTACCAATCTCGCCAAAAACGTAGCCACACCGCCACTTCCAACTCCACCAAACCACAATGGAGAACAAGGTTGCCCATGAATACCCGACCTCATCATTCACCATTCCCAGATTCAAATATAACCAACCAAGAAGAGACCCATTGAAAAAATCATGTCTCCTGCGAACCGGCACTAACCTTCTCCAATGCAAGACTCGGGGTGAGTCTCACACGGGGATAGATATGGTGGCTTCACAAGCTGGCGATCGCTTCTCTCTTGTGAAGGAAAGATGGTCGAAGGTGGAAATCTGACACGCTAGCGGTCGCTTCTCTCGTGTGAGATCAAATCAGGGTTTTGATGGTGGATTGATGATCGCCACTCAAAAGTGTGAAAGCCTTTGTGATAAGATCACGAACCTTTGTCTCAAGGAATCCACACAAGAGACATTGATTCACACGTTTACTAAGTAAAGGAATCTACCTAACTTAAATAAACAAAAACAAAGCCTAAGCTTTAGAGAAAACTCTTTCTATTACTTTCAAATTTCGTGGTCCTTTACAATGAAACAAATGAGCTTTTTATAGCTCTTACATGACTAAGCTACATTAAAAGAAAATATTCTAAGTTAAATACAAATCAATCGATATAATAGAGAAAGCGTGATTGGTGGTGACGATGAGGAACAAATCGTGGGCATTGATGGAGCTTTATCTCTAGATGCATTCTCTGGATTAAATGGTGGATCAAGGATTTCGAGCAAGCAATACTCCTTAGCAATTAATGCTAATTTAATTACGTCGAATAACGAAAGTTTATTTCCTTTGAATTTCTCTTTGATTCCTTTTGATATTCCGGCCAAAGATGTTTTGCAAGCTTCTTCTTCATTTGGAGGGTTTGAAATCTCCAACATAAACGATCCAAGGTTGATGGATGATTCACTTTCCTTGCTTGGTTCGACGTGTAGTAGTTCAGGAAGTCCTTCAGCAAGTCTTTCAGGAAGTTCGTCAGAAAGTCCATCAATCAGTACATCAGCAAATGTGATGTCCGCATCATACTCTCCTTCTTGAGAAAGTTTTGTCCTCAAAACTAATTTCATTTTTTTTTTTTTTTTTAAATCACAGAACAAGAAAAAAAAAATTTAATCGAAGAAAACAAAACAGAAGCAAAAACGATTGATGATATAGGAGCTTTGAGCTCTGATACCAAATGATGCAAGACTCGGGGGTGAGTCTCACACGGGGATAGATATGGCGGCTTCACAAGCTGGCGATCGCTTCTCTTTTGTGAAGGAAAGATGGTCGAAGGTGGAAATCTGACACGCTGGCGGTCGCTTCTCTCGTGTGAGATCAAATGAGGGTT
TTGATGGTGGATTGATGATCGCCACTCAAAAGTGTGAAAGCCTTTGTGATAAGATCACGAACCTTTGTCTCAAGGAATCCACACAAGAGACATTGATTCACACGTTTACTAAGTAAAGGAATCTACCTAACTTAGATAAACAAAAACAAAGCCTAAGCTTTAGAGAAAACTCTTTCTATTACTTTCAAATTTTCGAGGTCCTTTACAATGAAACAAATGAGCTTTTTATAACTCTTACATGACTAAGCTACATTAAAAGAAAATATTCTACAAATTACATACAAATCAATCGATATAATAGAGAAAGCGTGATTGGTGGTGATGATGAGGTACAAATCGTGGGCATTGATGGAGCTTTATGTCTAGATGCATTCTCTGGATTAAATGGTGGATCAAGGATTTCGAGCAAGCAATCCTCCTTAGCAATCAATGCTAATTTAATTACGTCGAATAAGGAAAGTTTATTTCCTTTGAATTTCTCTTTGATTCCTTTTGATATTTCGGCCAAAGATGTTTTGCAAGCTTCTTCTTCATTTGGAGGGTTTGAAATCTCCAACATAAACGATCCAAGGTTGATGGATGATTCACTTTCCTTGCTTGGTTCGACACGTAGTAGTTCAGGAAGTCCTTCGTTCAGCAAGTTCTTCAGGAAGTTCGTCAGAAAGTCCATCAACCAGTACATCAGCAAATGTGATGTCTGCATCATTCTCCAAATGCCCGCTATTGACGGACAATCCCTTCGCACATGCAAGATTGGTTCGTCCCCACCTTTGCAGACCTGACAAACACTTGACTCTCCAATATGACCTCGAACTCGTTCCACATTCGTCATGATAACCTGTTGAGTAACCAACCAAAGAAACGTTCTAACCCTTTCCGGAGCCATCACCTGCCACAGTCTAGCAAAAAAGGAAGACATATCTGTTCGGCACTCAGAATTTTCCATCAACATCTCATAAGCCGACGTAACCGTAAAAGCACCATCGGCAGAGTACCCCAAGATAACCTATCCCGCACGCCAGTCACGTTATCTAAAGCAATAGAGGCTAACTCCAACTGAGTATTATGAGAAACGTAGGGCAAAATTCTGTCAAGTCTCCAACCCATGCCATCCACCCATAGATTGTGAGCTCGCAACTCCTTATCTGTATTTGGTATCTCTAGAACTGCTCTTTCAGAGACTGATACGATAACCATTTATCCGCCCAAAAACGAATTTCTTGCCCATTACCAATCACCCATCTACTACCCCGAGTAGCCACTTCTCTTAACCCTGCCACGATGCTTCTCCAAGTTGACGAGCATGGCCTTTTTTTCTCCATCCAAGTTCGATCATGAATCTCTCCCACTTTATACTTTTTGCGCAAGATTCTAGCCCACAAACTCTGCCGATCATGAATAAGCCTCCAGCCAATTTTAGATACTAGAGCTTTGTTCATAAACTTTGACTTTTGAATGCCAAGACCCCCCTCTCTCTTTGGCAAACAAACTCTATCCCAAGCTACCAAATGCATCTTCTTTTTCTCTAACGAACTACCCCACAAGAAAGCTCTCGCCAGCTTATCTAATCCCTCCAACGTTGACTGTGGTAAAGAGAGAGTACTCATTGTGTGTATCAGAATAGAGGAGAGAACCGACTTGGTTAGAGTTAATCTCCCCGCAAAGCTTAAAGAACGGCCTTTCCAACCCGCTAGCCTTGAAGCCACTCTTTCAAGAACCTCTCCAAACGTATCTTTATTTATCCATCTTTCGAGAATAGGCATTCCAAGATACTTCCCCAACTCTCTTGTTGATTTAATCCCACTCTCATTACTAATCAACTTTTCCAAGTCTCATGAAACATTCTTTGAGAAAAATATCTTATATTTCTCCAAGCTCACTTTTTGTCCAGAAGCTACACAAAACGTTTCCAAGATTCTTCGTATAACCCTTATTTGAGAGACCGTTGCTTCTGCAAATAGAATTAGATCATCGACAAAACAAATATGTGAAATCTTCGG
CCCTCCCTAAGACAGACCAATAGGCTTCCACTCTTTTGCAGCTACAGATCGATCGATCATGTGACAAAGTCGCTCAAGATAGAGAACAAATAAGTACGGAAACAATGGATCTCCCTGTCGAAGCCCACGTGACGGTTTAAAGCTAGCAGTCTTCTCTCCGTTCCAAAGGATACTCATAGACAGACCAGTGATGCATTGCAAAATCCATTGGACCCATCTCTCCTCCATACCCGCAGCCCGTATCGTATCCTCCAGGAAGTCCCACCGAATACGATCATATGCCTTCTTCAAATCCAGTTTCAAAAGCATCTACCCTTTTCTCCCTTGTTTCCTTCTCATCGAGTGAACAGCTTCTTGCACCACAATAATGTTGTCTAAACTGAGCCTCTCCGGGATGAAGCTAGATTGTGCTGGACCAATTAGCTTTCCAATAACTTGCTTTAAGAGTAACACTAACATCTTAGTAAGCATCTTAAAAAGAGCATTGCGCATCTTAGTATGTGCCAAACTTCAAGACTTGTAGAGTTTTGACGAGTGGAGTAGAAGACTTGGATTTTAGGATCCTCCAGACAGTAGAGACCTTCAAGTGTTCTTCCCATTATCAGCAGCTTCTTGGTTGCCTTATCATTTATACGAACACTATCAACATCAAACTCAATAGAGCACGGGTAGTCACTTGTGAGTTTTGAAACAGACAAAAGAGATTTAGCAATATCATGGCAAGCAAGAACTTCTTTTAAAGGTATTTTACCTGAAGAGGAAGCAATACTACCTGAACCAGTGTGAGTAATGGGCAAGAAGTTACCATCAACTACCATTATAAAATCAGAACCATGATAGGGTTGAGACTATTGCAAAACTTGGTGATTATTGGTAACATGAGCTGTAGCTGCTGAATCTGGAATCCACTTGTGGCCATGATGGTTTGTAACATTTGTAATGCGCATTGTACCAAGAGTCATTGGTAAGTCTTCGTATTGATAGTTGTTGTCAAACCTATGCCAACATTTCAGAGCATGGTGACCAGCTTTACCACAGATTTGACATACCACACTTGAGTTTTCCGACTGAGAAACAGATGAAGATAAAATTTGTTGATGAAAATCATGTCCTCTAGTCGAGAATGAACTCCTGCCACGGCTAGAGTTTGACCTTTCTTTTCCTATGTTGTTGCGAAATTAGCCATTGTCTGAGTGAGTGACATTGAAAGCAACATGAGGAGAGATAGATGCTTCAGTCACATAGCTTTGAAGACGGTCATCATAGCCTTTTAACTTAGAAGCAACTTCATCAAGAGAAAGACTTGGAGTAGAGTCAACAGAGTTTTCAATATTTGTTTTAATTGGCTCATACTCTCTTCCAAGACCATTCAAAGCAGAAAAGATTTTCATTTTCTCTGGAACATGGTTACCAATAGAGGCTAACTGATCAAATATATATTTCAGATCTTTGAGAAAAGTTTCCATGATGTTATGTTTCTTTTCCAGAGTTTGCAATCTTCTTTGCAGTTCAAACAAGCGAGAGGATGATACTCTATTAAAGTGATTAGCAAGAGTCATCCATACCTGATGAGAAGCGAAGCAGTTGACCACCACACTTAAGATATCTTCAGCAAACGAACCAAGTAACCAAGACTTAACAACTTGGTCTGGTTGGTGCCAAGTGTAAAACTCCTGAATTTGTTCTTCAAAGGTGACACTGTTGTGAGTAGCAGTCCGAGTTTGCGTCAGAGCAAAGATAGAACCAATGACAAAGCCGACCAGCCCTTGACCAGATAAAAAATTCTCGAACTAGCTCTTCCTTCTAGAGAATGTAGTTTTGTTGGTAAAGAGTAATGGTGAAACAGTTGGAAATATTGAGAACTGGGTGGAATTGTATAAGGTGCCATGGATCTTACTTCTATGAGATCTGATACCATGTTGACATTTCTAAACTAAGAATGGTTTATGCTCAAATGAGCTTATTAACATAGAAATCTAAAATTGGAAAATACAATAGTT
CAATGAGCTTTATTGAAATATAAAGAAGAAAAAGAAGCTTTAGGTTTTGTCACCAAGAACACTTAGAAGAAAAATCCACCATTTTCAATGGAAGACAAAAATCCAATCAGATTTCCCATAAAAACCTAACTCTTCCTCAAGTCATTGAAGAGCTAAAAGAGCTCTGGGCTATGGTTTTACCAATCATAGCAATAATTTTTATATGTATTAGCGTTCTTGGTGAAATAAGAATGAAGCATAATTGTTGTAAATCAGTGACAAATCTAATATACTTCATTCTTTTTTCTCCAAGAATGCTAATATATATATAAACTCGTCAAACAATCTAAACTATTGTTTGTTAATTGAACTTCAAGCAAGCATTATGTATAAGTTTGACATGTTCACAAAACATGTTAAATTCATTTGGTGGTTGGTTGAGGAAGTTTTGCTCACCTATGTTCTTTCAAACAATTTCAACAACACATTTGATGGCACGTTGAATTAAATCTAAGATCATAATCTCGGTGATCAATCTACACTACGCAATAAGAACCACCATAGATGTATAACCATATATGTATTTAATATTAATCTTATTAATTCTGAATTTTGTTGCTTTCAACTCATTACCCCGATAGTATTTAGAAAGCGATGTTGTTTAAACATGAATTAATTGATTCAACATCAAAATTCTGGTAAATATTGGTTGGTAAATTGTTCAAAATCGTGGGTAGAAAATTAACAACATTTCTTCGTTTATAAACTAAATTGCACGTTTTTATTAGTATGTGTTTTATTTTACATAATATAGTTTGTCATACTTTTATTATATACACTATACATTATAACCGTAATTCCATACGAAGAAAACACATATTATAACCGTAAACCCAAATACATAATCTATTATTCAACTATACGAATTTCATTCAATATATAAATTTTATTAAAAAATTGTCAAAATCTAGTTATTAATATTAGAACTTATAAGATGAGGACCCAAATAAGGGTATTAGAAAGTGAAGATCACTTAAACTCTCTCATACACAATGATCGAGGCAGCCTTATCGAACCCTTTCTCCGACGTCGATGAAGCCATGGCTCGCCGGCGTCGGGATTTGTCTTCCCTTTACTACGTTGTTTCTCTCCCAACACATCCAAATCCTTTCTCGGCCCATGTCCCACGATCTCCCATGCCCACTCCTTGCGACGATTCCTATATATCTGAATTTCTTCAAGTTACAATCGTCTTCCTCTGCTATCAAACAACACCGTTTGATGCGGCTCAGCCCACTCCTGAAACAAGATCTTCTCCCTCTAAACCTTTTGTGATTCCTGTAAATCGTCCCTCTCAATGGCTCCCCTTGAAGTCAAGACCTGCATCTCACAACTCCTTTCTTTGGGATTCAATTCCCCCCACCTAGTGTTTTTCTTGGTTTCGTTTGGACCGGAGCTCTGCTTTGACGCCGGAGCCGATGAGGATTTCGACGACGGAATCTTCAACCCACTCCTCAGCTTTGGCAACGCTGACTCGACTAGCTCTATTACCAAGAAAACTCACCGTCGGCGTGCGGCCACCGTTGACGAATAAGGGAGGTAGCTTCCTAACCCTAATGTTGCTTTTCCTTATTTGGTTTGGGCCTAGCCCAAGAACTGTTTACCCTCCCTCCAATCCATTTTTCAAGTCCTCGAAGCCCATGAACAGTTTTTTTAGGTTAAGCCCACATCTTGTTTGGCCCAGGTTAGGTCTTTATTTCACTCTAGCAAACCCAAACGTTTTGATTTCTTTCTCGTCTTTGGAGAGTAGCTACCTTCCGAGATTAGTTGTGATGGTCATTGTTTGGTTTTGGTTTTCTCTCCCACAAAGTTTGGCAAATAGGTTAGCTCGTTGGTTTTATGTTACAAATCTGATCTCAAAAAGCTTTGGGCTAACTCCACTTTTGAAGTGTTTTAGAGTCTTGATGCCCATGATCCGTATTGTTATGTTTCTGTCAATTACAACCCCTATAGCACCCTTT
AACTTTGTTTTGGCTGGTCGTGGACTCCACGCTAACAGAGTAACAGTTCTTTTAGGCTGTTTTGATAGATACTTTTGTCGAGGTCATTTGTTAATTTTGTTTCGAACCCTATTTGAGACTATCATCCCAAACCTTTGGCAATGTCCAAAAGAGTGAAGAAGAACGCCATTATGATCCCATCTCCACGGAGCGGTGGTTACCGAAGCTTCTTCAACTCTCTACCTCCTTACCCGCCAATTACCAAGCTCCTTCAAGGTATCTTCAAGTATACGGATAAGTTGCAAATCTGTGAAAGCTTGGCAAAGAGCGGCGTTATGATCTACCCTTTATTTTCTCCCGTGGAGCACCTTTTCAAAGGCTCATATGCATTGTTTGCAATAGCCGTTTATGACCACACGTTGGTCGAGGATTTCGCGAAGCCCGTCTTCATGGTCGAATCCGCCAAAGCCTCAACAGATTTTTCAAACCTTGTAAACTTTTTTAAAAGTGAACACCTCTTTGCAAAACTCATGAAGCCTCTATCTTCATTTTCTTGTACTATCTTAGTTCTAATTTGTATGAACTTCCCTTTTTTTAGGCTTAAGTGAATGAAAATTATTGTTTGAGAAAAAAAAAAAATAAGATGAGGACCCAAAAGCTCATAGTTCGTCATCTGTAACATGCTGCATTTTTCAGGCAAAGCAATCCGACTAAAATCAAGGAGATGTGGAGGGGAGAAGCTTCCGCCTGATACCAACGGTAAGAGCTCCACATGCGGTGTAGCGATGCAGAGTAGAAAAGGGAGATCTACGGCGAAGAACGAGAGAGACAAGTAGATAGATCTGAGACCGAAAATTGTGGCGGTTCCACGAGATCTTTGTCGATGGGGGAGGTATATTTGATCCGGCAAAGCGAAGCCAACGTCGAAGGTCTCTGTTTTCTATTCCCTACTATTTTCTCTCTTTCATGACTGAGCAAGGATCTCTTCAACAAAAACGAGATCGGCTCTCTTCCTCCTTCTCAAAACAACTCTACAGTGGCGGCATGGCAACAAATTTTGGATCACCATCTCGTTTGGCTGTCCTATTTCAGCGAGAATCTGCAGTTTTGGACGGCGGCTCGATCATGTTTTTTGATTGAGATTAGGGTTTTCAATCTTGGTTAGTTAAATTCGGTTTGTAAATTTGAGATGGCTTTAGTTTTGAGCTGCTTTGTTTATTGTATTGAAGTTTGTGGATTGGGTTTTTGCGATTTTGTATATGCTCTATCTAGAAATAGCCCATTAGACATTATATATAACAAAAAAAAAACATGAAAAACACTAGAAATCATACAATCAAATCCGCATACCTGAAACTTAAAAGACTGGCACATTCGCTAATAATGAAACATGCATCAATGGTCTCTCAAGAGTCATATTATTTGCATAAGTTGATTTGTCCCTGCAAATTCCAATACAAAGCCTTGTGGACTTAATTAAGATAATAGATGTGAAAATTCAAACACATGAATCTGTTTAAAAGACAAAATAAACGTGGCATTATATCAAACATCTTGTAATTTCATATACATAAATATCAAATTGATATTTCCCTCTCTTTGAGAACTGTCCTTACGAATTCGTTTCTAAATAACATGTTTTAGATCCTAACTGTTTGTGTTCTTATGTGATGGTTTTTTAGGGACCGGTAGGTACAACGTGACTCATTCTTGTGAGAATCCAAGTTTTGAACTATGATTTAAAGTCACAATATATGGTTACCATCTCAAATTTTATGTAGAGTGCAACTTTTTCTTGAATTGGCGTGTGTTTGGTCTTCTCGAACTTGCTTCTAACGCTATTTCAAACTTGGAAAATTTTGATTTTCACTCTTTATCATCTTGTTTGTTCAATGAGATTAGCCGTTTTGTTTGTATATTGGGTGTGTCCAATTATGCTCTTTTCTTATGTTATTGTTTATGAATAACTTGTTGAACATTTTACTTATCAATTCACTCCAATATATCCTAAAATTGGGATA
TGCTCAAATCACATCTAGATCTCATGATTCATATTTCTATACCATTCTTTCGATTTTGATCTTGTTTCTGTCTACACCTCCTGTAAAATATATTTTTTACACAAAATGTATTTAAAACCCATTATACAAAATAATAAACTCCAGTAAAGTGAAGAATTACAAGTAGAAGAAAAAAAAAAGACATCTCGTACAAAGTCAGAATTGAGAGAGCCCTAAACACAAGGAAAAAAACAAGAACAACAAGAAAAAGTCCACTTTGTTTGGTTTTAGACAAAAACAGTAACTTACTTTTTTGGTCAAACTCTGTAGAAAGAATCAATCTCCCTTGTAAATCTCACCCTCCTGTCACCATCTTCCCTCCGTCACTTTCCCAATTTAATTTATAATCAGAAACCCTACATATACACCTAGGTTTAGGGTTTCGCTTTTTCAGAGAAAAATAGTTTCTTTTTCTTCAAGTTAAAAAAAAAAAATTATTAATCTGGTACGCTACAGTGCACCGAAATCCCATAGATGTATAATACTCTGAGCCGTTGATGAAGCTGACGCAACCGCCACATGTCTATCATCGGCAACAATGGCGTCAACTTCTCCTACTCTCTCCCTAATACTGTACAGATACTCTCCTCTCTCTACCTCCCACACGCGCATTATACCACCTGCGCACATTAGCGCGTGCAGTCTATTAACACAACCCATTACTCTTCTCTGCGCCGCTCCACTAACACGGAACTCACACACCGTTTGTTGCGTGTTCACCCTTCGCACGCTAGCGTTTCCTCTACTGTCCAATCTAACGTACGCTTCGTCGTTGGCATCGAAGCCTGTCACTATTAGTCCTCTACGTTGCTCTTCGTCTTCTCCGATGATCACTCCTTGGTTTCTTAGATCGATCACCATGATTCTCCATCTCGTGCATGCTACCGCCGTCTCGTTACCGGAGATTCTGAGACGGCCAAGGGACGTTGTTAGCTCTGTTAACGTGTGCCATCCCATGACAGCTTCAGGGTCGGTGAGTGTACCACCGACGAATGTTGTCTCTTCGCTGTTACAGTCCCATATGTGAAAGGCACGACCTGGCACACCCGCGAAAAGACCGACCCACCAACGTCCACAGCCAGTGAAATCTACCAACGCACCGTCGTTAACTATATCTCCTGCGTAAGCCGTGCGTGTGTGACCAACACCGTCTATTTCCGCCACGTGGATGTCTCCGTCCATCGTAGCGAACGTGAGCCTTGAGTCGGAGATAACAATGCCTGAGACGGCTCGTGAGAATCTACCAAAGCGGTCACGTAGAGGTGGCCGTAAGGTCCTGACGTGGAGTCGGTTGTTTAAAAGAAAAAGCCGGACGGTTCCGTCGGCGAACCCTGCGGCTAAGTAGAGGTCTGAGAGGGTGAGACAACGGCAAGAGAGACTATCAGGCTCGTCCACATCAGACGGGTCAAATTGGAGAGTGAAGTAGGTGTGAGTACGCGTCCGGAAGTTTCTAGCCGTCCGATGACGGTAGATGAACTCGTCCCGCCACGTGTCGTGCATCAAATGTGTTCTTGCCCAAACTTGGCGAGATAGTAGTTGCCATAGATGGTCGGAGCGAGAGACAGCGTGCCACGTGGTGCAAACCTGCGATTAAGAAAAATTATTATAAGTTTTAACAAATATTATAATTAGTAGCTTAATTAATAAATGTATAAATAAGGGAGAGAGTAAAAAAAGACATAGAAAGAAGATAAGTAGGCCTGCAACGAAGCATGAAAGACTCTATATATAGGGACTAGGAAGATGGAAAGACAACGACAGACTCAGACACAAGCTCTGCGTAATATTTGTCTTACTCATCGAAACACACAACTCATTTTTATAAAAATCTATTTTATGACATATGTTCAATTGACGGGACTAATCAATCTCTGGAAGCTATAGATAGAGATATAACAACAGAAGCCCTAGTGTAAAAGGAATAATGAGAGGAAGCCCTAGTCCCATGTCAAAAGAACAAA
AAACAAATCAATGTGACAATAATACAAAACAGATGATATGTTAATTTATTAGGACAGATGAGAAGACTTTAAATGAGTTAAGCTGAACATGAGATTCCGACTTTGCCAACAAGCGTGCCCTTCTCTCTTTCATTTCCAAGAAAGGATAGCTTTTAAGCCTTTGGTCTTGTTAAAAGTAGAGCTTCCCATAAATACACAAATATTACACTTATATATAGTAGATGTTTCTCTGTCTCTCTCATCCCTCTCCAACAATCCGTGGACCTACATTCTCTACATTTACGTTTATATTGTTATTTATTGTACATCTTTATTCCTCATTAAACGCAAAGTAATGTATTTGACTTCGTACTCTAGCTCTATAGTACAACCTAAAATCAAATATTTCGAATTCTATACGAAAAGAAAAGATATCTTGTCAAACCAAAGGTTTAATGTCTATTAGTCAGATAATCATTATAAAAAAAGAATAATCTAGGCACTAGGGCACGAAATGTAACATAAAATAGATTAGTACAACAAATAACATATGATGGAATGGCAAATCCTATTTATTATTATGCAAATTACCAATCACATCAATATGATATACTTCAAATAAGAAGGGAAAGAAAGTAGTTCAAATATTCCTGAGTTCTAAGATGACCAGATTCAGAATATCACTTTTGTATTTTAATGTGTGATATATCAAATGTAAGAACATAGTATATAATCTATAGACACCACTGCACGTGCTCTAAGAGACCCTTAACATTGGGTTCCATGTGCTTTTCGGCATATGTATGCCCATAATGTCGTCTCTTTTGACTGAAAAAAATTAAGGAAAGAAAAAAAAAAGATAAAAACCCACTTCAATGGAAAAGATGAATCGAGTCAGGAAAAAAGATAATTCCATGATCAATTTCAAAGTAAAAAACAACAATGAAAACTCTAGACTTATAGCCTTAATTCTCTGACAAAAGTGTTATGCTGTAACTACACTGCAGTTTCTTAAAATTTTAGGGCAAATTTGAAAATTCAATTAATTAGAAAATATTATGGGATTTAATAATGATTTAGAATTATCATGTATACATAGAGAAGTGAGATAAAATAAGAGAATGAGAAGTTGTCAGAAGCTCTGCATGCATTACTCAGTGGATCATAATATTGGCAGAGAAAAAAATAACAAAAGCAGGACGCAAAAAATGTACATATGTACTTATATACTATTCCTCGTTACTATATATGAGAAAAATCTTCAGCATAATATATATATGTATTATTTGTTTTTTTATGAACAAAAGAAAAAACAGCTATTTTCATATATAACATAGGATTATTAAAAAGAATAATATGAATGCCTGATATAATACATGGATCATATATCTGTTGATGAATAGAGTTTTCATGTATGTAGAAAATAACCTAATGTGGTAATATAGGACTAACATTGGCAAGGCAAAAAGACAGGACCTTACTTAGGTTTCTTTTCATTCTCTTTTTAGATGTTGTTAAATGTGCAACGACATTTTCTAGTTTTATGAGTCTGTCGTGAGAGGTCACTTTCTATTATTATAATTTTAAAACAATTAGCAGATAAATACCGTTATAATTATAATTCTAAAAAATATTAAATCTATTGGGCATTGGACTAAAGACTGTGCCTAATGTCTATCAACCAATATTTGGAGACAAGAAAGTGTTTAATTTGATTATTATTGTAAGAACTTTTGAGTCAAAAAGTGGATTTCTTGATCTTAAAAAAGGGCTTTCTACATGCCAAGAAAGGAAGATTTAAAGCCAATAAAATAAAATAAAACCTTGATTTTGTGCCCTAAGGGATCCAATTCATAATATAATATTAATATTAGAGTTACTATGCCCAAATGTTGTACAAAGATTACACAAACGAGATGGGGTTGTATGGTCTCCTTAGAGGATCCAAAAATAGACATTAAAAGGTATCAAAAGTAGACGAGAGAACAATGAAAAAGAAATAAACTTATTGGGTAAAAATG
GAAGACAAAAAGTTTCTAAATACATAAAAGAAAAACAAAGTCCCCAAACTATATGATATGTGAAAGAGACATCAAATTAATGTCGTCTTGTTAGACATAAAAGTTGGACTTGGACCCATCATAGAAACACAGAAAGGGCGGTTACCTTTCCAAAGGTCAGTTTTTTTTTTTTTTTGTCTCTTCAGAATCCCAACCTTACAAACTAATATCACATTCAATCGAATTGAAGTAACATCATCACTTAATTATGATCTAAAGAGTAAGAATTCGTTATACCAAAAAGAATTAGAACGGCAGAATCAAATCTAAGCTTAGAAACAACTAAAGTACAAGACACTTGAAACAAGCAGTACATTTGACTAGACCAAGATTGTGTCCCTCCACTTAAGTTATTATAGACCCACGACTACTTTGACTTTGTTTTGTCTGCATAAGATCTATGTCTCACTATTTTCAAGTTCAAATATAAGCTAATAAACGAATTCAGATAGTGTAACGAAAATATTACTTTACTACCTGAAGTACATATATATATAGAGAGACACGAGATAATTGATGTGTCTCGACCGTTACAAAACTAAAAGAAGGTATTCAAAGAACGTTAGAACTGACCCGAAAAACGTTGGCAAGAGCCGGAGCTGCGGCGAGGAGGCCGGCGGATGTGGAAGCGTTAACGGCAACTTGAACGGCGAGAGATTCAAGAAAAGGCTCCGGCCAAACATCGTTGGCTCCGCGGCGAGGGCGGGATGGAGATGGGGCCTCGAAAACGCCGCCGCTTCCACCGGCTCCGTTGTCGGAAGAAGAGGAGGAGGTAGACATGAGACGAGAGGGGTTATAAGAGGAACAGGGGAAGAAGAAGAAGCGGAGAGAGGAGAAAGAATGGTGGGGGAGAGAGGAAACAAAGGACAAAAAGTGTAGATAAAGACATACTTCTCCGAGGTGGGGGACCCAGGTTGTGAAGGTATGTTTTTTTCCTATTTTTATTTTCTTTTGTCAAGATTTGTTATTATTTGTTTTTGTTTATTCTTAATAGATGCAGATTTGTTTGTGAAATAGCTTCAATTTTATATTTTTTAGGAAAAGTATTGGTTCAGTATGGTGACATATTTCAAAATTTCTTTCTTTTGATATGCAGATTTTGAATTATAATGGCAATATAACAGCTATATTATTATAAATCACTAGATTTATATTTTGACGATTTTTTATATTTAAAATAGTGTTATATATCATTAAGAATTCAACAATATATTTGCTAAGTTTATTTCCTTCCGCGAACATTAGTAAATTTTTTGTATATGGTAAACTATTGGCTAAACACAAATATTTGTAGATCGATCCATTTTAAAAATGAGAAATAAAATAATATGTATACGCAAAAAATTTGTCAGAGAGATCAAACTCGTAGCACCAAATCTCGACTTTCATACCAGTAGTAAAAACTTTTAAAGCATAGTTTAACATATTTTTTTTTCCCAACATACTATTGTCATTATAAGTAAATAATTTTTGGAAATCTGGTTAAGCATATTCTTATCATTACAATCCTCAAACCTAGAATTCGCCATATTCTGTCATCACAAAACTTAACCCTACTTTTTCTCATATTGCAGCTATCACGATCCTCAAAACCACGGTTCATCGTGAACTTTAGTCCAAACTCATCACAAACCAACACATGAGCATGCGATGCTTTTAAGTTTATTCCTCAATCTAAATATAGAAATATTTACATTTTCTGAAAATTATTCATATATATAGTGCTTTTATATAATTACAATTAACATTTTTGATTAGTATTTTTTAGTTAAAACATTTTTATTCTTTTTTAATTAAAAATAATTAACGAAATAATGATGAATCACGTTATTAAGAGAGAAAAAAAAATAAAGCCACATTATTAACGTCACTAAGAGGAACATTTTGGTTTTCCTCCCAGACATTGTTCATCTTGGGAAAAAAAAATGTCTTCTCTTTTACTAGGTGTTTATCCGAAAACG
AAGAAAACCTATTTCTCGTGGCTATTCTCTCTTTCTCTCGTCTCTTCCGCCCGAAACTTTTAACGTCGTTGTCATCGAGTCACATTTCGTCTCAACTCAACTTGTTTCGATATGTGTCAAATCTTTATTTCGATTTTTCCGACAATAATCAGACATCTAAGTTCAATAGCAAGTGATTCCCATGATTAAAACCATTTTCTAAAACCACTGTTATGATATTGATGGTTTTTATCGACGCTTATTACGGCTGATTTTTGCCGTCGATTTACATATGGTGGCTGATTTGTTATTTCTATTCGATTTGATGGCTGAGTTATTGTATGCTTTAGGACTGATTTATGATTTATTAATGCATATGTGGTTGAGTTTGTTTTGTGTTGTGGCTTGGTTACTGTATGTTTTATGACTGATTTATGATTTATCAATGCATATGTGGCTAGGTTTGTTTTATGTTGTGGATGAGTTATTGTATGTTTGACTGAGTTATGATTTATCAATGCATCTGTGGCTAAATTTGTTTTATGTTGTGGCTGAGTTAATGTATGGTTATGGCTGATTTATGGTTTATTAGATGGCTAAGGTTATTTCTGAAGAACAAGCAAAGGATTACCCTCTAAGAATTTACGCAGAAGGAGAGTCTAATCTAGAGAATAAACTCATTAATCACAATATCAAGATGACATATTTCTATGGGATTTAGAGAATTAGTATGATAAGATGTGTGGGATCAAATGAAGGAGGCACCTATTGGAATAATTACTAAGTTATCGAATAGTCAATTCGTGTGGTCTCGTAAGACTGTACATTTTCTATTAAGTAGACAGTTAATAATACTTTTGAAGGAGATTTGGTGTCTCGTTGGTTAATGCTATAAAGATGTTGAGGCCTATTGGAAAGTCGTACACCATCAGTGGTATGGTTTTCATGTTACAGGCTTGGGCATATGATTCAGTCAAATGCTTTGGAGAGCGATATAGGAACGTAGTCAATAAGGATGAAATATCGTTGCTTAGATGGGGTGGAAACCGTACACGTACAACAATGGAATTTGATGTAGGTCAAATTGCTCTAAGTTTACTCCCTCAAATAAGAGATCGTCGTTAGTACTTAAGGGTAAAATTCCACAAAACTCTTTTGTTCACACAATAGGCTAAAGTATCAAAATCAAGCTAGATAGATGATAAGAAAATAAAAAGAAAGCAAGTAAGTAGATAGTGGATTGTGAAGTTGTAAGACAAGATAATAAAAACGTTAGGTTTAGGGTATTCTCAGGAAATAGATGATAAGAGATATAGAAATAGCTAGGATGTTATCGAATCGTTCTTAAACTCAAACCCTAATTACAGAATAAGCGGTGGTTCGCCGTGCTACTCAATATGCCTAGGGCTAAAGATTCCCAGCGGTCGCTTGGCAAATCCCTATATTAAGACATGCATGATAAACGAGTTTGATAAGTTCACCTAAATAGATAGGCCGATTCTTATTTCACATCTATAAACTTGGCTCATCAAATAGTATTTCTGGTAACATATACCTTTTTGGGCATACCTATTATTTAAGATTAAGTTCTAATTAGTTACTCTAGAACTAGCATTAAGAATAACCAAAGATGAAAAATCCTACATATATCCTAGCAGGTGAACAATCTACTAAATCATCTAAATCCCTAATGAGAAACCCTAACCCTAACAAGTAGACTACTCATACATGATGGATGAAACAAACAACATTTATGAATGAGAAAGCATAAACAAAATCAATAAGAAGAAAGAGTTAGAAAATATCTCTTCGGTATTATTGAAATCTCTGATAAAACTCAGAAAAATGAATCCAATGTATAAATAGCTTATAAAATGCTTTAGAACAAGTTAGGTGGCTAAAAACTTGTTAGGTCACAACAATGACCTTAAAACTATATATATATATATATATATATATATATATAACCTAAAAACGTGTAGGTTACATTATTAGGGCGCAACTGGTGTCGATCGACACCA
AGAGTGTGTCGATCGACACTCTCGACTTGATCTGAAACTAAATTCGTCATTTGGCTTAGTTTCTTTAGCATTTGCTCCAAATTGTCTCCTTAACTCCATTCTTGTCCCAATCCAAAGAATACCTTAAAAGACTCTAAAAGGACTCTAAAACCTATATTTAAATCATAGTTAATGTTGGTGTCGGATCCCGCATCATGGGCTCGGATCCGGCCAAAGATTGCTACGTGGGTAAAAGAAGCCCATAAGAGAAAGGCCCATAAACGTCCTCGAGGTGAGAGTATGGATGAGGTGTTGAGTTGCGAAGTGAATACATCATCGAAGTCAAGACTACCCGGATTGAAGAGGCCGAATGGGCCGAAAGGTGAAGTCAAGAAAAGCTCGGAGTGGATTCAAGTTCCAACGTTCAAATAGTTAATTCGAAGGCTAGAAACGGACACATTTAAGATAGAATGATTGTGAGTAAATAGGTATTAAATGTATTCTTTGGGTATAAATTGTGGGTCAAAGACCATGTAAAGACAGACGCATTTCTTGGTGCAAATTAGCTATACACACTCTTTTACAATACTCATAGTTTTCTCTATAGTCACTTGTCTATTTTCTAGTATATTTGTCCTCAAGAATAATCCTTCCCACTAAATAAATAAATACTTGAGTGTGCGAATCCGACATCCACAGTTAAAAACAGTAAAAATAGGGTTATATCAGAATCGACCATTGCTAAAGATATCTAAGTGCATGGTGAGATAAGGTTTTGGCTGTGTTGTGATAGTTACTGATTGAGTTATGATTTGAAATGGCTGATTTATGGTTTGTGATGGCTGATTTATATTTTATGATGGATGATTTATGGTTTGTGATGGCTAAGTTATATTAGTGATGGTTTAGTTTTGATTTATTGATATTTGAGTTATATTTTAGTGATGGCTTAGTTATGGTTTAGTGATGGTTGAGTTATGGTTTAGTGATGTCTAAGTTATAATTATTGATGATAGAGTTTAAACTAACTAATGTGTTTTATTTTGTTATAGTTGCGTGTGAGTAAAATGGTTATGAAGGATGATGTAAGAGAGTTATTTCATACGTGGCCAAATCAAGTAGAAGACCCAACACTTGATCACTTGATCGAAAACATACATGAGAATAAGTTTGTTAAAGGTTATAGGGATGTGAAGAGAAATGAGAAGAAGAACAAACATGTAAATGGTAAAGTAGCGGTTGAGTCTGAATCTCACGCAAAGAAGCAGAAAGTCTCCCACAGTGAGGGTGGTGAATATTATGAAGGACATGCACAAAGGAAGAAGAAGAAAGAAAGAAGCAAAGGTAGTGATTTGTGAACAAAAGTGAGGCTGGTGAATCTGGTGAAGGAGATGCACAAAAGATGAAGAAGAAGAAGAAAGAAGCTAAGGTAAGTTATATGGTCTATGGTGAGTTTATATTTTATGTAATGTTTGGCTAGCTTGTTAGTGTTTGTTTTTTTGTATGTATTGCATGGTGTTAGTGAGGAGGATGATGTTCTCGAAGATGTGTTGGTTAGAGCAGTCGTGGATATGGTGTCCAAATTAACTTCAAGTTTTAACACTGTTGATACAAGCATTAGAGAAATGTCTTCAAATCTAGAGAAGGTGATTGGAGATAGAGTGGAAGCGAAGATGGATGCAAAGTTGGAAAGCGGATTTGGATATATTGATAGTGAGTTCAAACAGAAGAAAGAGCATTTGAATGTCATGGCCATGGGGGTAGAGCAAACTGACCAAAAAGCTAATGATTACGAGAACTCAGAATTCAAAATTACAGATCTACTCAGTATTTAGAAGCAGCGAGATCAGCTACTATGACAACAACAACAACAAAAAACACCAAAAGGTTCAAGAAAACCTCGACAAAACTACTATGTTACTAGTCCTCCTCATGTAAGCTAATAGTGCAACACATATGTTTGAATTATAAATACATTGCGGCTGATTAATAATTTTCTTATTTACTTACGGCTGAGTTAT
CATTATCTTATGACTGAGTTATCATAATGTTTATACAGGCGAAGGATATTGTCGATGTAGTAGAGAAGGATAATGGTATTGATGAGGTCAATAAGAATATGGATAAAAAATTTGTGAAGGCCATTGATGGGGTCAATAAGAATATGGATAAAGAATTTGTTAAGGCCATTGATGAAAAACGATGGTGATATTGGTTTCATTGAGAAGTCTCTTGGTTATAGGAAATTACGCCCTACGACGAGGAGAAATAACAAAGAGAATGAAGAGGTAAAGAAGAAATCCGTCAAAGAGCAAATCATCAAAGAGCCAACCGTGAAAGGTAAGAGAGGTAGAAAACCTGTAGAGGCGAAAAAGTTGACCATATAACTACATCCTGCTCTTGTTATTAATGAGAAGGGAGAAGCTGATGAAACAAAATTACCTGCTCTTAATGTGAAGAGAGAGTGTTGTTGTCTCCAAAAAAGCTGAGGAAGTCACTGACAATGATGGTTAGAAGGAAGGTGACAGTGACGTATGAGATGTCACATACCAGTTTATCGGTGAAAACGGAAGCACGTTCCCTGAGTCTGATGATGATGAGGATTGATATAATCGAAGCTTTAAAGACGCAGAGTATTAAGCTGTCTACGGATGGTAGTGCATTGAATCCACTCTTTAATCTCTCAACACGGGTTTTTCCTAATACTGGAGACAACAGACTGAAGTGCATGAGGAAGAATTGTGTGCCTTCAGCTGGAATATATGATCCTCTATCACCGGCTGATACAGCCAAATTGTAGAAACTTAAGGATTACTTATCCCCATTCTAGTATGACCCTTTATACCTTATTAAGTTGTTAATTACAACTTGTTAACATTATTTCTGTATATTAACTTGTGTTTATTTGTTAGGAATCTCCCATTGGGCAGGGCAACAAACGATGTTGATTTCTACAGGGTTATCATCTCCGAAAGAAAGCACTGACCAACCAGAGAATATGGATGGTTGTTCGATAGTGTAAGTATTACATTAGCAGAGTTATTAGTGTGTTTTGTCAGAGTTTTACTACATTATGGCTGAGTTATTGGTGTGTTATGCTACATTATGGCTGAGTTATTAGTGTGTTTTGTCTAAGTTATGTTATATTGTGTCTGGGTTATTATTTTGTTTTGTCTGAGTTTTTTTTTTGTACAACATGTGGCTGCGTTATATAGAGTCCTCAGGAATAGGTACAAGCGAAATCTCTGCCCATTCCACAACAAACGCATTGCATTTCTAGACACGTGATTCGTGTCTTTTTGGGTTAGAGAGTATGTACAGTGCAAAATATAAAAGAAGATGTTTAAATTCAAAGACACCCCGTATGAAAAGATAGTTAATGGTTTGCTTCCAGATAATCAACAGACAAATATGAAGTGAATAGAAGATGTGAATCACTTGTATTTGATTCCCCAAACCAGAGGCGATCACTAGGTGGCACTACACATGGACCAGATTAAGGGGCACATTGATTGCTATGATATCATTGTGGGATAAGTTACAAGAAACTGAATAGAATTGATTAGAATGTTGTAGGCCGTTTACGAGAATGATTCCAGCAATGATGAACGTGCTAATTCCTACTACAATCGGTGAACATAGGTTTGAGCAGTTTACATTCAAAAGGAGTAGTGTCTCCAGGGTCCCTCAAAACGTACAAGTTGGAGCTGCGGCGTGTACTCGTGTTAATTTTTTGAATGTCTAACGCTTGGTATAACTTTCAATGACATATGTGATTTCAACCTATACAGGTTAAGATGGCAGCATATATCTACAATAAGGCACCTAATCTGCTTGGACAGTTTAGGATTTTGACTTGGGATAATTATATTAACTTTTGAATCGTATTTTTTTCAACAATCCATAAGACCAATGAATTTTGTTTTCTTTATAATGGTTTGATTTCAAACTAATTTTCATATCTTGGCATTTTCAGATAATTAAATTGGAATTTTACATTACAATTATTCTTCTCATAGAA
TCAAAATGATAAATCTATATTAAATATGTTACTATATTCCAAACTTTTTTGGTTTAGTTTTATGGACTTACTATATTGTGCATAACTCAAATTAAATTAAGACATTTTCACTTGGGATCACTATATTAATTTTTGAACCGTATTTTTTTCAACAAACTATAAGGCCAATGAATTTTGTTTTCTTGTAATGGTTTGATTTTAAACTAATTTTCATATCTTGGCCTTTTTAGATAATTTTATATTAGAACTATTCTTCTCATAAAATCCAAATGATAAATCTAAATTAAATATATTGCAAATCTTCCGAACTTTTGTTTGGTTTAGTTTTATAGACTTGCTATATTATGCATAACTCAAATTACATTTAAAAACTCCATTTGTCAAACATTAGGTTTTAACAAATACCTCCATAATCCCCATGTGGCTTTCTAGTACAATTATTTGTCAAACCTACGATCTATCTTCATTTTAGAATTTCTGAGATTTCTCTCACAGCCTATAAATCAAGTACAACATTAGGTTTATAGCATGATCTCCAACATTAAGAATAATCAAGTTTTTACCATTTGTTGTTATTTCCAACTTAACATGATCAAAACTAAATGCGTGGAGTCTTTATGTCCTCGACATAACATTATGTAAATACTTTTTGACTAAAAATAGTACCATTCACCCTTCTAACTCTATGTCAATTTGACTACAAAAACATTTTGACAAAAAAATGAACGATTACAAATTACACTGATGGAAAATATACTTAGTCGAATAACCACCAACGGTTGAATGTAAATGTGGAGTTCCAATTATTAATCATTTTTTTCGGCACTCAATTCACGAATGTGAATCACCACTAACGCATCTAGGAATATATATAGTAAGGTATACAACTTATTTTTTAATCAAAACAAAAAAATATTTGTAGATTTTTGGGACCTTTGGTTTTCCTTAAAATAGATAAGGGAATATTGGAGGATAGATATGAATCTATATGAATTAGAATTTAAGGTCTTAAATCCCTTTGTGATAAGGTTTGGGATACCTATATTTTAGGATCTGTGTTTATCTCCTGTGGAAACTCTCTTGTATAAATACGAACGTGAGTTCATCAATAAAAGCAAGTCACTTTGATAACCAATTCTACATGGTATCAAAGAGCTGAGATCATCAAAATCATCTTCAAAAATTTTGTGTTCTTAAGTTAAGAATTCTTAAATTGTTTCCTTTCTCTGTTGAGTTGATAGTCTTGTGTGTCAAGTAACAATGACAAACCCAACGTCTGGTGATGGATCTTTGTCAACCATGTCGAGTTCTATCGGAAAACAACCAGAGGTGGTGACGTCGGCGGTGACAGTGTCACCGTTCACTCTTTCTAGCTCCGATAATCCGGGGGCTATGATTCCATCGGTCATGTTGACTGGTGACAACTACAATTCTTGGTCGACAGAGATGCTAAACGCTCTTCAAGCCAAACGAAAGACGGGTATCATTAACGGTGCAATACGTAAACCACCTGCTGATGATCAAAATTTCGAAAATTGGACAGCGGTGAATTCTATGATAGTTGGATGGATCCGAGCTTCCATCGAACCAAAGGTGAAATCCACCGTGACTTTCATCTCAGATGCTCATCAATTGTGGATTGATTTGAAGCAAAGATTTTCTGTGGGCAACAAAGTGCGTATTCATCAACTCATAGCACAGCTCGCGACATGCCGTCAAGATGGACAATCTGTTTTAGATTACTATGGACGGTTGAGTTCGTTGTGGGAAGAATACCAAATTTACAAACCCATCACTACGTGTACGTGTGGTTTGTGCACTTGTGGTGCCACATGACAACCATCCAAAGAACGAGAAGAAGAGAAGATTCATCAATTTGTGTTGGGACTTGATGAATCTAGGTTTGGAGGAGTTAGTACCAATATCATATCTATGGATCCTCTTCCAACTCTTGGTGAAGTATATTCGAGAATCATAAGAGAGGAGCATTCTTCTCGCAA
CAACGAGCAACATCGAGAGTCAGTTGGTCTGTTTACTCGACATGACCAGTCTGCTTCAGATGTCGCTGCCTACTTTGGGAAATCAGATGTGACTGCTTTAAACAGACCTGAATCCTCAATCATCAAACCCCGAGATTGTAACGTGCTCTGTTCGCATTGTGGACGAGCTGGGCATGAAAAACAGGAGTGTTGGCAGATCGTGGGGTTTCCTGATTGGTGGAAGGAACGAGAACGTCTTCAAAAGGCTAGTGGTCGTGGAGGAGGAGGACGAGGAGCAGGACGAGGAAGAGGACAAGCTTTTACAGCTCATGCCACAAGCTCACATTCCTCTGTTTTTCCTGACTTTACACCGGAACAAATAAAGGTTCTTCAACAAATGGTCACCGAAAAATCAAGCACCAATAACGTCGACAAGTTGTCGGGTAAGAGAGCTCTTGGTAATGTGATACTTGATACAGGGGCTTCTCACCACATGACGGGAAACCTTTCTCTATAACATAACATCAAAAATATTTCGCCATGTTCGGTGGGATTCGCAGATGGAAGTAACACATTTGCCTTGAGTATGGGAGTGTTCCCATTGTCTGACACGGTTTCGTTAACCGATGTCCTATACGTACCATCTTTAAATTGCACACTTATCTCAGTTGCTAAGTTCATAAAACAAACCAAGTGTGTAGCTTTGTTTACTGAGACCTTGTGCGTTTTGCGGGACCAATTTTCGAAGACTTTGATTGGAAGCGGTGAAGAGCGTGATGGGGTTTACTACTTTACGGATGTTGTTTCACCAAAGATACATAGCGTGGATGTTGTTTCTGACAAAGCGTTGTGGCATCGGCGATTGGGACATCCATCATTTTCTGTTCTTTCAACTTTGCCTATGTTTCTAGTTCTTCGAAATCTGCTACTCCAAGTCCTTGTGACATTTGTTTTAGAGCTAAGCAGACTAGAGAGGTTTTTCCAGAGAGTTTTAATAAAGCAAACGATTGTTTTTCTTTAATACATTGCGATGTTTGGGGGCCTTATCGGGTTCCATCTTCATGTGGAGCAGTTTACTTCTTGACTATTGTTGACGATTATTCAAGAGCGATGTGGACATATCTGCTTCTTCAAAAGTCAGAGGTACGAAATGTGTTGACAAACTTCATTGCATATGCAGAGAAACAATTTGGAAAAACAATAAAAATCGTTAGGAGTGACAACGGGACTGAATTTATGTGCCTCTCTTCTCACTTTAAGCAGCAGGGTATCATACATCAAACATCTTGTGTTGCGACGCCACAGCAGAATGGTAGAGTTGAGAGAAAACATCGCCACATTCTTAATGTTGCTAGGGCATTGTTGTTCCAAGCTAGCTTACCTATCAAGTTTTGGGGAGAAGCAATTCTTACTGCAGCATATCTCATCAATTGCACACCCTTTTCAGTTAACAATGGTCGTTCCCCATATGAAATTCTACACAACAGCAAGCCTCCCTACGATCAACTCCGAGTGTTTGGTTCAGCTTGTTATGTTCATCGTATGGCTCGAGACAAAGATAAATTTGGAGAAAGAAGTAGACTTTGCATTTTTGTTGGTTATGCTTATGGAAAGAAGGGATGGAAGGTTTATGATTTGGAGAAAAATGAATTTTTCATATCTCGTGTTGTTATTTTCCGGGAAGATGTTTTTCCATATGCAGCTGGTGATGTTAATTATGTGCATGTTTCTTCAATACAAGTCATTCCTGATGAAGACTGGCTGGTACCTCCGTCTATAGTTGTAAGGGGGAGCTCAGAGTCTCAAATCGACTCTGTTCCAGCAACTCAAGCGGCTCCTCAAATCGACTCTGTTCCAGCAACTCAAGCGGCTCCTCAAATCGACTCTGTTCCAGCAACTTTAGCGGCTCCTCAAAACGACTCTGTTCCAGCAAGTCCGGTTTTGCTTGAAAAATCCACGAGTTCGTCTCCTGTTACAATTACACCACCAGCTTCTCCGAAAATAAGAACATCGTCTTCTTC
ACCAACACTAGCGCCACTTGTTGATGTTTTAAAACCTGCAGATTCGCCTCATCCTATTGTGGAATTGCGTCGAAGCAAACGAGAACGACAGGAATCTGTTAGACTCAAAGATTATGTGGCTCATAAAGTAGTATGTTCTTCAGAAACCCATCACGCTCTGCCCATCACTGCCTCTCCATCATTGTCTTCGTCAACGGTCTAAGGTACGTTTTCATCTGAATATGAGTCTCTGTATTCGTTAACAGATTTTATCTCGGATGAACAATTCTCACTAGGACATCGTGCGTTTTTGGCTACCATTACAAAATCGGTTGAGCCTAAGCATTTCAAGGAAGCTGTTCAAATAAAAGTTTGGAATGATGCTATGATCAAGGAAGTTGATGCTCTTGAAATTAACAAGACGTGGGATTTGGTTGAGCTTCCTCGCGGAAAAATTGCACTTGGAAGTCAGTGGATTTACAAGACGAAATACAACTCGGATGGTACGATAGAACGGTATAAAGCTCGTCTAGTAGTCCTGGGTAATAATCAGATCGAGGGAGAGGATTACAAAGAAACTTCCGCCCCTGTCGTGAAAATGACTACGGTTTGTGCTCTTCTTCGACTCGTTGCTGCTAATCAATGGGAGGTATACCAAATGGATGTCCATAATGCATTTCTCCACGGAGACTTGGAAGAAGAGGTATACATGAAACTCCCTCCAGGCTTCCGTCATTCACACCCCGATAAAGTTTGTCGACTTAAAAAGTCTCTATACGGACTTTAACAGGCTCCACGTTGTTGGTTCAAGAAGTTGTCTGATTCGTTACTTCGATTCGGGTTTGTTCAATCATATGATGACTACTCTTTATTCTCTTACACTCGTGAAGGTATGGAGATCCGAGTTTTGATATATGTCGACGATCTCCTCATTTGCGGGAATGATAATTATATGCTTCAAAAGTTTAAAGAATATTTGAGTCGTTGCTTTGCAATGAAAGACTTGGGGAAACTCAAATATTTTTTGGGGATAGAGGTGAGAAGAGGACCAGAGGGTATTTTTCTGTCACAGCGCAAGTATGCTTTGGATATTGTGGCGGATTGTGGAACTCTCAGTGCTACAGCTGCTGCAACTCCTCTTGAACAAAACCATCACTTAGCTGATGACGATGGTCCCTTACTGGCTGAACCAAAGAAGTATCGAAGGCTGGTAGGACGCTTGATCTATCTCACTCACACACGACCCGAGTTAAGCTATTCGATACACGTTTTATTTCAATTCATGCAAGTTCCACGTGAGGCTCATTGGGATGCTGCTCTTCGTGTCGCTCGTTATCTAAAGGGAGCTCCTGGTAAAGGCATTTTGCTCAAAGCTAATCCGGATCTTACTCTTACTGTCTACTGCGATTCAGATTATAATTCTTGTCCTCTAACAAGGCGCTCTTTGAGTGCTTTTGTTGTTTTGCTTGGTGGCTCTCCTATTTCTTGGAGAACAAAGAAACAAGACACTGTCTCTCACTCTTCCGCTGAAGCTGAGTATCGCGCAATGTTTGTCGCTCTCCGTGAGATAAAATGACTTCGAAAACTCTTGACAGGATTGGGTATCAAACTCACTGCGCCAGCTCGTTTCTTTTGTGATAGTTAGGCTGTGATTCACATTGCGGCAAACCCAATGTTCCACGAACGCACCAAGCACATCGAATCAGACTGTCACTTTGTCCGAGATGCTGTCCGAGATGGACTTATCACTACTTGTCATATTGGCACTACGGAACAGCTAGCAGATGTCTTAACCAAGGCCCTTGGACGTGTTCAATTTCTTACCTTAATGTCCAAGTTGGGCATTCAAGACCACCATGCTCCAACTTGAGGGGGAGTATTGGAGGATAGATATGAATCTATATGAATTAGAATTTATGGTTTTAAATCCCTTTGTGATAAGGTTTGGGATACCTATATTTTAGGATCTGTGTTTATCTCCTGTGGAGCTCTCTTGTATGAATACGAACGTGAGTTCATCA
ATAAAAGCAAGCCATGATAACCAATTCTACAGGGAATTTTAATAAAATGTCAAATCTCTCAAATTCATTTTGTTTTGTGGGTACTTGAATTCAGCAAACGATTTGTCATTTAAAAAAAAAATCCTAAGCAATCAAAATTTATGGTTTTTAGCTAATTTGATTTGCGTGGCAACATTGTATTTACCGATTCTGTGCAAATTTGACTTAGGCCTTGTGAAACCCCAAACAAATAGGATGGCAAATAATGACAAGAAAACCTCATTTTGCTGTATGATTGATACATTTATTTTGCAAATGTCTTTGTAGTCAAACCCGACCATACAACTAAATATAAAATTTGATTGGATCAGAAACCATATATTCTCTCGCTGGACTCTTGTAAGAAAACTAAAGATAATCTAATACGATTCAGGTGAAAAAAACTAACATCACATTATTTTTGTATAAGTTAATATTGAACTATATATATATATATATATATATATATATATAATCCTTTTACAAAAAATATATTTTATATATATATATATATATATATATATATATATAAATCTAAAGAAGAAAAACACATGCCTCTTTTCTCGAAATATAGATGAGTGTTGCCATAAAACAAATATGCAAATAAGTATGTACAAACTTAAGTATTTTTTACCAAAAAAAACATAAGTTTTTTGGTCAATTATTTATAATAAAAGATTTTCTAGTTCATATCATTGTGGAGGATGGGCTTTAAAAAGTATTAAAAAGATATTTAAGAAATGAAAAATAAATGGCAGTAGAAAAAAAGAAAAAAGAAAAATAAATGATGGCAAATATATCTAATGAAGAGGAGGATTTAACAAGATTTATGAAAAACTATAAAACGTTATATAGTGTGTAAAAAGGTAATAAATAAGTAATTTTTAAAATTAGTGAAATTTATAATAATAATTTTTAAAATTAAGATTAAATTCTATTATAATTATAAGAGGATAATATAAATCAATTCTTAAGAAATTATCAGAATTGGCAATGGATTCTGTGTATTATAATTATAAGAGGATAATATGATTCATTTAGATTCAGTCAGCGACTCTAAAAAATTATACTTTACAACAACATAATAAATCATAAGAATTGGCAATGGATTCTGTCTACCGAAAGATGTGGGGTGAATTCATATGACGAAATAAGTGGTGCAATTTCGTAATAATCGAAAGATATGGGGACTAAATCTTAAATAGAAACGTTAACTTGATCACAACGGCTATAATTAGTTACTAATCACAGTAATTAAACCACTAAACTCAAAAGAAAAATGGAAACAACAAAAAGCCCTACCCTCTTTCCTTAAAGAGAAGGCAACTTTTTTCTGCATTATTCGATCAGCGGCTCTCCATCTTTCTAATTTCCTTGTTCCTCACGACTTCATTCTCAGAGCTTTCGAGTCTTTCGGTTCCATTACAATGACTATGTACGATCTCACGGATTCAGGGAAGGATATGTGTTCGAGTCTTTGTTTACTGGCCGAAGTTGCGGTTATGGTTGCGGAAGAAGAACAATTTCGTCGTCTTCTAAAGACTGTCTCTAAAGAAGAAGATAGCGACAAGAGTTTCTTCTATCGTTTCCCGAGAAAAATCAGATCGTCTTTGGTGAAGAGAAGATACACGCAGCAAAACCCTAACGGGGCTTCTACTTCTTCAGCGGTTCTCGATCTGAACCTAATCACCACTGATTACGACTTGAAAACCCAACAAAACCCTAGTTTTGATGAGCCGTTAGTTGGTGTATAATGGGGCTTCTGCGTCTTCATCGTTCTTGAACCTTCGTTGTTATGATCCTTCGTTACCCTTGGATTACAACACGGCTAAGTTGGGGAAGACAGAGAAGAAAAACCTAACAAACCCTAATTACCAATCTTCATCTTCGTCTTCATGCCTAACGGAGAACAAAAGCCGCAAGAGGCGTGCCGTGCAGCAGAGGAAGAGTGGTAAACTCAAGAAAGCGAGGGTTGTTTCTTT
GCCAAGGATGTCTATAGAGACGCCAGAGTGGGTTTTCCAGGTGATGAGATACATGAACGCTGATGCTGAAACCCCGAGGCTGATATTTGAGAGGACTCTGTTCAATAGTGATGTCAAATCAGGCCTGAGCCGTCTCTTAATCCCTTTCCAGCAGCTAATCAGAAACGACTTCTTGACGCCTGCGGAGTGTAGAGCCATACAGAAAGACGAAGACAACGAAGATGACAAGAATATTGGTGTGGGAACGATTCTTGTGAACCAAAGATCTAAAATGTGGGGTTTGCGTTTCAAGATATGGGCGATGGAGAAGGACTCTGGACACGGAACATTGAATTACATTTTGAATTGGGGTTGGAACGATGTAGTCAAAGGTAACGGCTTAAAGGCTGGCGACAATATCAGTCTTTGGACTTTCAGGTGCCGTGGAGTCCTCTGCTTTCCTCTTGAGACATAGTAGCTCTCTGATATTTTCATTTGTCTCTTGAGGTTTCATTTATATAGTTTCAAGTGATTCTTGAGGTTTTTGCCTTTTTAGCATAGTAGTAACTTGTTGGAAGTGTTAAGTAACTTGTCTGTCTCCTCTGTTGTCTCAGTTCTTTATCATTGTTTGAAAATAAACTATTTTGTCATAAGTATGGTTTGTTGTTTTGTCTACTTAAGTTACTGCATTGTTCAATATACCTTTGTGTTATCTCAGATCTCTCCTCTAAACCTGTTGCAATGATGGAAATGGTCTATTCCTGCAAGAGTTTTGGTACATTCCTCCGAAATGCTCGATTTAGAACCAAAAACAATCAAAAAATGTCAGAGAAAAAGCAAGTTTTGGTAACAAGGATTTATCTACGCATTGATAATATCGACAAGTTAGTTTACTCATATTAACACCAAATCATATTGTTTCTGTCGAAAGCTTAAGCTTCTCCAAGATCTCCCCATCTCACATTGTACTTAGATGCAAGGTAATGTGCACCAACAGGACCTCTGCTTCCATATGGATAGAGCTCAGGAATGATTTTCTTCTCCTCTAGTTCCTTCAAAGCCGGTGTGAATAGATCCCATGCTGCATCTAGCTCATCACTTCTGATAAACAACCTCCTCTCTCCTTCGATTGCATCGAGAAGCAGTCTTTCATATGCATCTGGTATCTCTCTTGGATACCTATCAACCCCAAAAGAATATAAATAAATAATCTCTATAGGAAAACTAGAATCAGTAGTATGCATTGTTGTACCTGGATCGATATAGAAGGTTAAGGTCGCTGCGATCTAGTCTCATTCCAAGACCAGGAACTTTGTTGTTGATCCTCAGGTATATCCCTTCATCAGGCTGAACTCTAATCACTAGTTCATTTGTTGCATTGTCTAAATTAGTAGCAAAACTTTTCTTGTACAAGTTTCCTGGGACATGTCTGAACTGAACTCTGATCTCTGCTCCTCTGGTATGGAGAGCTTTTCCAGCTTTCATAAGAAAAGGAACACCGTCCCATCTCGCATTGTTGATGAACATGGCTGCTGCAGCAAATGTAGGAGTGAGACTGTGATTTGGAACCGTTGGATCGTCTGTATAACCTGGATAAGTTTTTCCTCCCTTGTTATGGCCTTTGTATTGACCAACAACCACATCTTCAAGCCGCAACGGTTTCATTGATCTCAAAACTTTCACCTTACAGGAACACATAATCATCGGTATAGTATTTTATAACCAACCTAAAGCTTTTCTTCTTAGTGAAAAAAGTCTTACCTTTTCACTTCTTATGTCCTCAGCATCTAAGCTCACTGGCGTCTCCATTGCAAAAAGTGCAAGTATTTGCAAGAGATGGTTTTGCATGATGTCTCGTATGATTCCATATTGATCAAAGTAACTGCATCGATTTAACATTAGTAAGGTGTTCAGTGTCATACTGATCAAAGGTGTTCAGTGTTCATGCTTTGTAAGTTGTTTATGAAAGCTTACCCTCCACGCCCTTCTGTTCCGAAATCCTCAGAAAAAATCAGCTGAAC
GTTGCGTATGTAATTTCTTGACCACAGAGGCTCGAAAACAAGATTTGAGAATCGGAGCACTGAAAGGTTCTCAACAAGCTCCTTTCCCAAATAGTGATCAATCCTACGTATGTCACATAACATTGCAGTTAAGTTCCAGCTTAAAAATGAATGGCAGTGATGGCTGTTGGGCTAAGGAAATGGCTAACCTGAAGATTTGCTCCTCTGTAAGATACTGTTTCAGACATCTAGTTAACTCTCCGGATGATTCAGAGTCACGACCAAATGGCTTTTCCACAATGACCCTTGTCCAGCCATTCTCTGAGGAGGCTCTAAGACTTGCACACCTAACCACATCAACGAATATGTTTGGGGGTATCGACAAATAGTACAGCCTGTTTGATATCTTTCCTGCCTACAAAGCAGAAAGGAATTAGAAATGTGCTTCGTGCCATTGGTACAAGAAATAAGCATAGAGAGAGTGAAAGAAAATTACCTCTTTCTCTTTGAGCTTCTTGTTTAGTTCCGCAAAATCCTCTTCCGAGTTATACTGACCCGAATGGTAAAAGCATCTTTTCAAGAACTGCTCCATCTTATCCCCACATTTTTCCCTGTTGATTCCAACTTTTGTTCATATAACCAAAGCATAAACTTTAACTAAAACATACACTAAAAACGTATAGCAGAATATACCTCTGATCAATCCGGCAAGTTAAAGTACTACTAATCATGTCACGAAGCTCTTCATGAGTGAGTTTAGTCCGAGCATAACCAAAAACAGAAAAGTCCTGAGGAAGACAACCCTCATAAAAGAGAGCAAACAATGCAGGAAATATCTTCTTCTTGGCTAAGTCCCCTGACGCTCCAACAACTGTAATACTAAGAGTAGACTCTCCTTTTGTAACATGTTCCTCTGTAAGTTGATCTCCAGCTGAAACAATTTGGTAAAAACCATCCTCCAAAGAATCAAAAACACAAACAAAAGCTACAAAACTACTTCAATTCATAAAAAGAGAGACTTTATCAACCAAATTGCTAAACCAAACCCTCACTACCTCACAATCACTCTAATCTACTACATTCAATCCTAGAATACTCAAAGACATAATCCTTAGATGAGAAATGGTATCCTTGAGTACAAAAGATACAATCTTGAACTACTTTCTTCAATCGTCAAAAACACAGACAGAGGCTACAAAACTACTTCAGTTCATAAAGAAAGAGACTTTATTAACCAAATTCCAAAACCAAACCCTTACTCATTGCTATCTAACCAACTCACAATCACTCTAATCTTCTACATTCAATCCTAGAATACTCAAAGACATAAACTTTACAATCAAAGATGGTATCTTTGAGTATAAAAGGTCATAAAGATACAATCTTGAACAACTTTCTTCAATAGACATAAAACTGTTACAATCCTAACAACACAATCAACGACAGGTACAAGAAACTTCATCAAGAATTCTATCAAAAACTAATCTAGTCACATAGAAACTGGAGAAGAAACTCACAATCTTGTAAAGAAGCGAAATTAGTGGCACACCCATTTGAAGTATCAAGCTGAGAATGTTTCTCGGCGAAGAATCTCAAGCGAACCTGAGAAAACAAGGATTTTCTCGGGAATGTGAGAGATCTACTAAAGAGTGGTAGAGTCTCTTTAAACGGAGACGCAGCAGTAGCGAGAGACGAGGAAGAAGAAGAAGGAGAAGGAATGATCATAGAATGTGTCGCCATGCAAATTTTCTTGGAGCGTCAAAACAAATGTGATGATGATGATGATGCCATTGTTTTTTGCCTTATGAGGCTATTTGTATCGTCTCTTACATTATCCACAACAGTAGTTTTATTATATAGTTTTCGATATTTCTTATCTCTCACATTATCCACATATCTTATTTGTCAAAAAAGTTTTATTTTTCTTTGCATAAATTCTTTTTTTCTCAAGAAAGTAAACCGTATTAACATCCATCTCTGGTATAGCTTAACCGGATTATTCCATTCGAACGACCACAATT
CGCTGGAAAGGTGATTTTGGTTTAGCAGTAAATTTCATACTTTATTCATTTTAGTACTCTCTTATGCACACTTTATTAATTTACTAGGTGAATATCCGGGATTTTTCGTAAATGTTTTACTTATAACAACAACAAAGGAAAGTTGTTTTATGTTATCTCTTTCTAGCCTTTTTGGCTTTTTCTAAATATACTGCATAAGCTGACTTCTCTGATTAACAAAGACTCCAATTTAGCATGATGAATAATGAGCATCATTTATACAAATATTATTTCTAAGATTCTATTTTCACCTAATTTAACCACATTTTGTAGAATTACTTACAATAAAAATTTAAAAAACCTATTCATTTTGTTTAAAATATTTTACTTAATTAAAATTTTATCATTAATCTTTCTGTCATTTACTTTTTGAGTATTATTGATTTTTATAAATCATATCAAAAAAGTTCAAAATATTTTTAATCTAAAAAAAACAAAGTATAAGAAAAATTTTAATGCCTAAAACTTATGAATACTTAAACTTTTTCACATTTATTTAACTACTTTAACTATCTTAAAATTACATACAAACTTATTAAATAGTACACATGCTTGACGACATTAAAATATATTCTCCTACTAAATATACAACAATCACCCAAAATAATAAAACACAGGTTGAATCCTAGTCATTATTTAGAATGATCATCTCTTGTGTCCCTTTTGTGGGACAACTAATCTGCAAAACCACTTTAGAGTCTTCCTATCTCCTTTGAGTTAATGAATTGTGTTAAGACGAATTTACCCCTGTATTTTATTTTGAATGAATAATTAATATTTCTAGAAAACATTTTGAAAAAAAAAAAAACGGAAAAAAAAAAAAAGCTCGAGCTCGTTCTTCTTCGGGCTTCTTCCTCCGGCGAGCCGCATTGTCGTTTTTCTCCTCCTGCAAGCTGCATCAATCTACTAAGTCCAGGTATGGAGAGAGCTTCAAAAGCTTTGAATTACATATTTTGAGGATTTTGAAATTCAATCAAATTAGATTTGGATTATTGTGTTTTAGCACCTACATTAGAAGTTTAAGTATAGATTTAGGCTTCATTTGGTCTGTTAATGGGTAAGCAATTGATTTCACATGCTGATTCATACTAAATTGAACTCAAATCGAATATTTGTTCTTGTCGCGAAAATAATACTGGTCGCACTAACTATAGTAGTACCGTAATTTATATAGATAGTATGTTTTAATAGCACCAATATTACTTAGACACGTAGTATTTCATATATGTAATAGTATTACTCACACATGTAATATTTCAGAATTAGTAATAGTATTACTGAAAATGTACTAGAATCGATAATACTAGTAATATTGACTGAGTATGTGTATTGTTTTGGCAGGTTACAATGAAAGAGAACGTGATCATATATTTTAAATTCCAAGGTCGCATGTATAATGTGATGATGAAGACATTAGGGGAGAAGATTACTCTCTCAATGTTAGAAGATAGGATAATGACGAAGCTTGGATTAGATGCAAATAAGGTAAAATTGCATATGAGGTACAATCCACGGTTGTTCGGAGTAGAGGAAGAAATGAACGTTTGTGATGATGAGGATGTCTTTGTTTATGTAACATCCGCAAAAAATAACTGAAGAAGTGTTTTGGTTGTGGAGGAGATCTCTAAACCGCCCGAGCCGGAGCAATTGCCCGAGCAATTGTCTAGAGTTGGTAAAAGTTCTGTTGGTAAGAACTATACAGAGGAGGATGAAATGAGAGTGGATGATGGTGCACTCATCGTCTTATTAGAAGAGGAACAAGGAACTCAACATCAACTTGAGGCAATAGTGGAGGATCACGGGACTCAACATCAACTTGAGGCAATAGTGGAGGATCACGGAACTCAACATCAACTTGAGGCAATAGTGGAGGATCACGAGACTCAAGAAGATGAAACACGCTATGATGAGTCTATGGATGATTCTGATAGGGGGGAACAGTATGTTGAGTCGCCACCTGT
TGTAGAACCGGGTATGTTTAAGAAAGAATGGGAAGACGGAATTGGGTTGACCTTACGTCAAGAATTTCCAAACAAGGCGGCATTGCACGAGGTGGTGGATAGAGCTGTATTTGCTACCATTTTTGGTTATGTGATTAAGAAGTCGGATAAGGAGCGCTATGTCCTAAAGTGTGCCAAAGAGAGCTGTTCTTGGCGTTTACGAGCGTCCAATATCAGTAATATTGATATATTCTCGATTAGAAGGTATAATAAGATGCATAGTTGCACTCGGCTAAGTAAAGGTAGTAGTAGGCTCAGGAAAAAAAAAGGCAACCCACAATTAGTCGCAGCTCTCCTTCATGATCATTTTTCGGGACAGTTGGAAACTCCGGTTCCAAGAATTATCATGGAGCTAGTTCAGACGAAATTAGGTGTGAAAGTATCATACTCGACAGCGCTAAGGGGGAAATATCATGCGATTTATGATTTAAAAGGTAGCCCGGAAAAAAGCTACAAGGATATCAATTGTTATTTATACATGTTGAAGAAGGTAAATGATGGTACAGTTACTTATCTGAAATTGGATGAGAATGATAAATTTCAGTACATATTCGTAGCTTTGGGAGCTAGCATTGAAGGTTTTAGAGTGATGAGGAAAGTTTTAATTGTGGATGCAACACATTTGAAGAACGGATATGGCGGAGTGCTAGTGTTTGCCTCGGCTCAAGATCCTAACCGTCACCATTACATCATAGCGTTTGCCGTACTCGACGGTGAGAATGATGCTAGTTGGGAGTGGTTTTTCGAGAAGCTAAAAACGGTTGTACCCGATACTTCAGAATTGGTTTTCATGACGGACAGAAATGCAAGCCTCATAAAGGCCATACGGAACGTGTATACCGCGGCTCATCACGGGTATTGTATTTGGCATTTGTCCCAAAATGTGAAAGGTCATGCTACTCACACCAACCGAGATGTACTCGCATGGAAGTTTCAGGAGTTAAGTCGGGTCTACGTCGTGGCAGACTTCAACCGAGCGTATGACGGGTTTAAGTTGAGATATCCTAAGGCGACCAAGTATTTGGAGGATACAACCGTGAAAGAAAAATGGGCAAGGTGTTGTTTTCCCGGAGAAAGATACAACTTAGACACAAGCAATTGTGTGGAATCTTTGAACAATGTGTTTAAAAACGCAAGGAAATACTCGTTAATACCAATGCTTGATGCGATCATCAAAAAAATCTCCGTTTGGTTTAATGAACATCGGATGGAAGCCGCGTCTGGATCCTTAGAAAATAAGATGGTGCCTTTGGTCGAGAATTATTTGCATGATTTGTGGGTTTTTGCCGAGAAGCTAAAAGTGGTGGAACTAAACTCATTCGAGCGTGAATATGTAGTCACATGCGACAAAGGAATAGATTATACGGTGAGCTTGCTTTTGAAAACTTGCAGTTGCAAGGTTTTCGATATCCAAAAATATCCTTGTATTCATGCATTAGCCGCTTTCATTAACATTATGGATGATGAAGATCGGAGAAGAGGTTTGGAGTAACATGATTTGGTTACAAAATATTATTGGGCGGAGTTGTGGGCATTGGCCTATTATAGGACTATTTATCTTGTTCCGGATAGGTCGCAGTGGGAAGTACCAGATGAAGTAAAGGCGTTGAAGATAGTTCCGCTGTCTAAAAAACCGAAGAAAGGAAGCAAAAAAATGCTAAGGTTTCCATCAACCGGGGAAAAGCGGCCAAAACGACAAAGGACGCAAAACAAAAGGCGTCCAAGGCAATCGTGTCAATGGTTATTATTTGGGAATACGCCTATCTGAGTTTTTTACTTTGTTTTTGCAGTGATTTGTTGTTTTTATGGTATGGACTTACTATGTAATACTGTATTTCCCCTTCTATAGTACTATGTCTGTTTCTATTGTTTTTTTGTAATACTGGTTATAACAAGTAATATCATGTCTGTTTCTGTCGAATTTGTGGTCATATTAGTACTACTGGTAATACTAAGTTGGT
GTTATGGAGTTCGAATTTGTTTACCTCAAAAGTCAATGAAAATGAATACAGTGAGTTATTAACAGATAAAAATGTATTATTAATCATTTATACTTAATTAAATTAGAAATTTTAATATTAAATCGTTTTAACTTATCTTTAGTAGACTCAATACAACATTTCCCTTATACTTTTAAGCTCACTTTTAATATTATCACCAACTTAAAATGAAAAATTCATATTGCTACATATATTTAATTTATAATTACACAAAATATTTAAACCTCTATATTTATAAAGTTCAATCCAGTGTACTACTAAATAAATAAATTATAAATATAGGAAATACTGCTAAACATGAAAAACATGGAAAGTAATACTATTTGAGAAATTGGCACTACCAAAACCTTAGGAAATACTATGCTGTAAAAAGGCTGCGCACATGTCAAAAATCTCCAAAAAACGGCGCACACGTGGGAAATTAATTTTTTTGGTTTTCCTCCAAATTTTTTGGCGCCTAACAAATTTTGAGATTCCCTCCAAAACCAAAAATTTAACTTTTTTCTTTTTCCTCTTTCTTTTTCGATCTCTTCTTACAACTTTCTTTCATCTCTCATCTCTCTTCTCCCACATCTATCATCTCTCTCTTCGACTCGAATTCTCTCACATCTCTAATCTCTCTTTCATCTTTCTACCATGGATAGACTGTGTGAGAGAGACCCCTACTACGTTGATATAAAAGTGGCGAAGAGAGCCATTGAGCAAATGGAAATGGTTGCGATGATGGAAGGGATTCCTAAGTTTTGTCCATGTGGTGGTAGCATTGTCGACACTCGAAAGGATGAAAAGAGATACTATCAATGCGAGAAGTTTAAGGTATGTTGATGTAGAGCACAAGTATTTCAAGTTTGTGTAGATCTAGATCTAGATATATTTGGTATTCCAGAGTATTTCCCGTTTTGGTAATACTGCCTAGAACAAGTAATACTGCACAAGTTTTTCTAGTTTTTGTAGATCTAGATCTATATTTGATAAATATTTGGTACTTTGTAGGATAATAGAACTGATTGTATGCACATCCGTAAACTTTGGGATAAGGCTATAGAAGAAGAGGTGAGTAGCTTAAGGGAGAGTGTTGATTACAATCAGAATAAAGTTCTAAGTCATGAGTATCTCATAGAAGAAATGCAAAAAGAATTGAAAGCCCACCGTGCAGAGATTGTGAACGTGAGCAAAGTGGTATTCCGTAATCCTATGGCTCCCAAGAAGTAATGTGTTATCCTATTGTTCCTTAATCTTATTGTTAATTTGCTTGTAAGACTTTCCCTATGCTTTATAAGACTTTCCGTATGCTTTGTAAGACTTTCCCTTCGATTGTAAGACTTCTCTTTGATTGGTAATACTATGGTTGTTCAGTTTGATATTTCCAGTATATCTCTTAGTAGTAATAGCACGAGGTATTTCCCGTATTATTGTTAACAATATCATAAAATATCCTAATACATTAATTGAATCCAAACATAGTCTTACGAGTACTTGCGAAATCCTAAAACAAAGTCAAAGTACAAGAAATCAAAATACAAATCCGGAGAAGTTACACGAATAGTTTTCACACGTCACTAGACTTTGCACGGGTTGAACGGCTCACTCGTTTGGGCACAACAGGAGCAGCCGCATTTTCCTTGATTGTTGATTCCTCCTCATCTGGTGGGTTCTGAGACATCTGCATTGTTAATTTAGTTAAACCTTGGTATTACGCGATATTACCAATTATGGAACAGTATATCCGGTATTACCCAGATTTACCTTGGCTTTCATCTCATCCATAAATGCTTCGAACGTTGCTTGTTTTTCCTCCATTTCCATAAGCGCCAACAAAGCTTCATTCAGCTTGTCATTGATGGAATGAAGCTTCTCCATTACATCAACTAACGTCGGGTCTCCCGGTCCAACAGCTGTGGGAACTTCCTCTTCATTTGGGGCTTCCATTCGTGCCTGCACATCCTCGTTGTACACCTCTT
CAAATCTAATTTAACGCCCTTGACCAAGACGCTTCATCCAACTATCAATTACAACATCGTGCTTATCAACATCATCCTCTACTCCCGTGATTTCAGCCAAAAGAGGTACTTCTTCAGCCTTCTCTCTAATTATACTCTCAATGACCTATGGAAATAATAGACAATGAAATATTAGAAAGAAATAAAATCATATTTGCTCAAGGAATAATAGGAAATACTAACCTCAGTTGTTCCGAGTACATGGTTGATTTGCTCAAGGGTAAACCCTTTCATCTCGGTCCTCTTGAAATTCACCTTGCACATCCTTGGACAACCGGCATGTGCACCATCTTTTTCTTCTATGAATCTTTCCCTAAGTGATGGAATGGCCTCAAATGCTAAAAGCTACACAAAACACATGAAATTTAATTGTTAGCTTCAATTACGAAAATGTAACAAGGATAAACATGTGACTTACCTCAAGCGGCACACAGAATCCGGGAACAGGCCATGGTGACTGAGTGTTCGGGACGACACCGTTAAAATGATCCAATGTGTGTGAGATCGATTTTAACATGTACTCAAATGAATATCTCCCCCATGGAAATGTCTTACAAAACGTAAGATCACTTGCAGCCCTAACACAGAAATCATCAATTGGACTAGCCCTTTCTCCAGTCTTAGTAGGCACGGCAATGATGCTTGTTAGAAAATAGAGGACCGCCATCCGCAACCTATCCTTTGATCTAGCCGGTTCCATCTCCATTAGCTTGGTTTTCACGTCTTCACGTCTAATTACCCCGGTTTTGAAGTACCTGTTGGCGAAGTTCATATTACCAGCGCTCTGATAATTAGCTGGATGGGCCTTGCAGTTGAAACTAAAGATCAAAGCATGCTCCCTAATACCATAGCGGATGGGAACTCCATTAACAACGAACCAAACCTCCTTCTTCTTCTCAATAGATGCCGTTTGAAGAAAAAACATCCACATCCCCATTAACTTGTGGGTATATCCGAAAGGCAGGTGGTAGATGTGCTTGAAACTCGGATGCTCCATAAAATAATTCTTCTCAACATGCGTTAGAGGATGTTCCAAGTCAGCGAAGGTCTTCAACACCTCCGAGATATAACACCTCGTTGCTAACTTCATCTTCTTGGTATACTCCGACGCCGGGAAGTACATACCAAGTGGCTGCATTGCCATCGCTTCCTCCATATCCTGAAAAAAAAAAACATTCATTCATATATCACTCAATTGTAAATAGTACTGCACAGTATTACTCTGTATTTCTCAGAAGTATTCCCCGTAATTACCAGTATTACACAGATACTCCTATTTTACTATGTAGTATTTCTCAAAGTTACTAGTACTAACTATCGATAAATCACAATTATAGTATTACTCTAAGGTATTACCCACATCCGCCAATATTACCTAAATATCAACATAGCATTTCCCAATGTTACTAGTACTGTCCACAGTTCACAATTGCATTATTACCCAATTAGATCGGTATTACGAAATGGAATACTTACCACATTTGCGATGTCCTCGTCTATGGTCCTCTCCTCCACGGGTTTTGCCACTATCACGTCCTTGTCTCTCTCGTCCTCGTTTCCCTCCTCCTCCACGGACTTTTCCACATTGACGTCCTCGTCGCTCGCGGAGCTCCTCTCCTCCTCCTCCTCGATAACGGCTAGGCCGTCATCTTGTCTCTCCACCTCTTCCACGGGATTAGCACACGCGAGTTCTTTGTTTGTCTCCGTCTCCTCTGAATCGGAATCGGAGCCCAAGGTTCGGCTACTCTTCCCTGATTCTTCTTCTTCACTTGCTTCTTCTTTTTCATTTTCATCTTCCACCTCATCAGTTTGCATATTCTCTTGAATTTCTTCAGTAGGAATATGCTTCAAAGCATCATAAAACGTAGAATCATCAAGCATCGGGCTCTCTGTCGTTGGAGCCGTCGTTGGAGCCGTTGTCGTTGGAGCCGCTGTCGTTGGAGCCGCATTGGTTGCCATCG
CCGTCGCAGTCGTTTGTGCCGGCGCCTGCTCCTCAGCCGGCACTTTCTCTTTATCTTTCTTCGCCGACGCCTGAACCTTCGCTTTCTTCGCCGGCACCTTCTCCTTCACTTTCTCCGCCGACGCCTTAACTTTCTCTTTCTTCATCGGCGCCGACGCTTCTATCTCCTTTCTTTTCCCTACCTCCTCCACGCGTCTTAGGCGGCATGACTGATTTCGAATCGGAAATAGAACGGAAATACTGGTGAAAGGAAGAAGAACGGTCGATTGAATTTAAAGAAATATGGAATGTTGCGGTTAATTTCAGCGGTTACTAAGGAGAAGAAGAAGAAAAATCGAAAACGGTTGTAATGAGAAAAAGAATGAAATTCGAATAAAGAGTAAAGGTTCCCTAGGCCCTGGAAATATTAGGTTTTTTTTTGGATTTTCAAATAAAGAGTAAAGGTGGTTCGGGTGGTTTGGTTCGGAAACGAACCATGGTTTTTCTGGTAATTAATAGGTTCAGATGGGGATATACTAGTAATATCCATATATTTCAAATTAAAAAATAAATAAATTATTTTTGTTTTTTACAAGGATTTTTTGGCTTCCTCTTTGAAAAAAAGGGACTGGCCAGACGACCATCATAACTACAACATATTTATAAACACAACAACAAAAATGAAACTTGATAATGTTGTAATACGAACAAGAATCGAAGTTATTTTCAGCACATTCTTCGATTTTTTTTCCTGGAAAACCGAAACCAACTCAACATAACCCATTGAAACATTTTGTACCTGGCAGGCACTTGGTAGCAATGCCTTTGTGTGTTTTAAGTCTGGTTTGAGAGGACCACTGTGGAAGAAATGTCTTGGGCAGAGTTGAATTGGGTTTGACCTGAAGAAAGAGAAGAAGAGTCGTTAAAAAGAGATCTTTGGATTTTCTTTAGTTCTTTGACAACTTCCACCATCGTTGGAACTTCTTCACTAGGACCCATGCATCTCAGTGACAACATTCGGAAAGCTTTCATTTGACAAAGCTCTTCTTCGGAAATTTGACCCATCTTTTCTATCATCTTTGGATCTGCAATCTCTTCCATTGATCGGTCTTCCTTTAATGTTGACAGCAAATTTCGAGCATGTCTTTTCATCTTCCTGTCAAATCCACCTTCACTTTCTTCTTCTTCTTCTCCTCGATAATGCTCGAAAAAGCTTTCCTAATAGAAGCCTTATACCCATAAACATTCCAAAGCCAAAGACATCTGTTCTCTCTGAGACTACGCCACTGCTAATGTAATTATCGGCAAAGTAACTATAGAATCCCTCTGCTGCCTCAACCTGGACAAATGTGTCTCCTTCTGGAATTCAGACGCAGTGAGAAAAATCAGTCAGCTTCGCGACCCCATCTTCATCCAATAAAATATTCCAATGAGACAAAATCCTATATACAAAGAGCCTAGGGAACGCAGTGTGAAGGTAAGCTAAAGCAGTAGCAATATCTTCAACTATCTTCATTCTCCTTTTCCATGGATGTTCACTTATTTCTAATTTGTAATGTTTCTTAACACCATGATAAACTTTGACTGAATCTTCAAACTCAAGACAACATCCAACCAATTTCAAAAAGGTTTTGTGACCACTCACCATCGATGAAACTGCTATGTCGCGGCTCAAAAGATCTACTTTGAAGAGACTCGACAAGCCAAGATCTTTCTTAATGAGAATCATGGGATGGTTCTCGTTCTTACCTGAATACCAGTGGTAGTAAAATTCTTTTCGAGAAACAAGATTAGTCGCTGAAATTGTTGGTGGCATTGCGGATCTCATCACCAGAGAAGAATTTGATGGGATTGGATTTGCCATGGCCGAATTCGATGAGCTCTTCTAACAACTTGGCCCCTCTCTTGGCCACTCTACCGGAAAGAAAGCTTTATTTTTCACATAACTCAAAATCTAAGAATTAACGGAAAGAAAGCTTTATTTTTCAATCAAGTGAGCAAAAGTTTCGAGACGACCTCACA
CTTTCTTGATAACTAAATTCTTGTTGAGTGTTGACTATTCAACACAGATGTCCTTCTGCGAAAATCAGAAATAAACATTTTAATGGATTTTGTGGAAGTTAGAGTTGGAAGAATTGATATCATCCTATTATAATAAATCACCAGTCACTTCCCAAATAACTGCAGCTCTATATATTTGACACTTGTCCTAACTCCTAAGTCTCAAATTCTATTATTTTACTTTCTTTTATATCCTAATTTATGACAATTTTATTATAATAAATCACAAATAACTTCTCAAAGAATTGGCTCTATACCTTTAACACTTGTCCTAAGTCTCAATTTCTATTATTTTACCTTTTTTTTTTCTTTTTATCCCAATTTACGACAATAAAAAAAAAAAATGTTATTCTTCCCCATCTTCTCCACGATCACTATAATATCCAAGCAAACAAAATACAAAATTTTTAAATCTCAAAACTACAAATTATAATTGGTTATTTTACAATTGGAACAGCCATTCAAGCATCTTCAACGTCTCCTTTAAGTTTTTTTAACAAAAATTCTCAATCACAAAAATCATCATCATCGTCACCAAATAATTTTGCAAAATAAATTGTTACACTGATTTGACCGCGTAAAGCGCAGGTTATTAAACTAGTTTTATGATATTAAGGTGATTTTCTACGATTTTTTGGCCATGCTTTAGTTATCAATTCAAAATTATAAACGGTTGTCTTTTTTTTTTAACCGTTGTTATTAATTGTTTAGTGAATGGTCTTCAAAAGCTCACACACTCGGCTGGGATTAGATCATCAATTATTACTATAAATCAATCGTTAAGATTCTCGGTTGCTACCTTTTCCAAATTAAGAAAATATGTTCCGTAAATTTATTCCTCTTCTCTTTTTACCAAATATTTTTCAGCTTTACTGATACTGAGGTAAGCGATTTTTTTCTTATTTGATATAGCATCTGTGTAGTATATGCTAAAAGAATGACGATTTTAGGCTGTGTTGTGTGATTTTAGGATTTTATTGTTTGTGAGTTGAGTCTCATGTATTAATAAAGTTATGTGTATTTATTATTAATTCTGTTGTGTTTATTATTAATTGTATTATGTGTTTATATCATATTGTATTTAAAGGCTTTTTAAATGTACTTCCTCCGTCCCATTAAGATAGATTTTTAAAGAAAAAACTGTCCTACAAAGATAGACATTTTATGTTTTCAATACAAAATTTAGAGTTTTTTTCATATTTTTCTCATTCGTGAGACTGGTCTTCTCCATTAACTAAAAGTACATATTCCAACATTCTCCTTCCTCCATGCACCGAGATTATATAAGTACAACATTTTGTGTCATCATTTTTTTTATTTTCAAAACTAAAAGAAAAATGTCTTCTTCTTCAAATTCATTAAGTCTTTGGGAAACGTGAAAAAGGAAGAAAAAAACAAATGAAGAAGGAAGAAACACATCGTGAAGTTTATATCAATCATGAGCTGGACTTGAACCAACTTTCTATCGAAACCACTATATTAACCATGCTCAAGATAATGTTTCCAAAATATTTTTAAATTTGTGTAAGTTATTTTAAGAATATGGCGTAAGCCTTTTTTTTCTTTGTAAGTTGGCTTAAGATTTTTGTAGTCATGATTTTAATTTTCTAGTTCTAATACAATGATCATGATAATGCTATATTTATTCAGATCTTATTGTAAGATTAATATTTTTGGTTTGAAATCTAAACCTTTTATTTCGGAGCATAGAGGCAAAGCAAAGAATATTCTTATTGATATACATTAACAATCATTTCTTTTTTCATGAACTATTCATTTTTTTGTGGTGATATTGATCTTGTTTTATGTGTGTGTATTTTTAGATGTTTTGACTATTAAATATTGTAAGTCAAAAATAAATTCTCATAAAACAAAATAATAATAATAAATTCTAAAACAACAGATACAATCATTGAAATAAACTCGATTGACCAAATTCAATTAGGAAAAAAACAAACACA
CAAATCTAAACATAACATGTTCTAAAATAATAAACTTGCTAAAAATTCCATTACACCTCTCACCAAAAATAGATCACAAGAGATTTGTATAGGTAGACGACCTTCTCTTTCCAATGAACCCTTCTTCATATGTAGAATTTTGTACTTATTTGAGCCTTTGGCTTTCATGATCTCTAACATGCAAGATTGCAAAGTTAAAAAGATCTGATTCACCTGTTTGCGGGGTATTCGTCAAATGATGTCTCTGCCGCCGACACAAGTTCTTCTACCGTTGTTGGACATACATTGTGTTGTAGTGATTGGATAGCATTAAAAAATCCAAGATCCAATATATTCAAATCCGGTGAATTCAGTGGTTGACACATCAAGCGTATATCAAACCCAAACTGTGAAGCAATTGCTTGAAATTGTGCATCTCTCGTATCCACATGCGTTCTTGCATTATCTTGTTGAACGAAAATAGTTTTCCCAAAATCTTCTCTTGACCACTTTTCGCGAATTTTTGAGATCACTTTTTCAATCAAGCATCTCTTTATATCCTCTCTCTTGATGGAGACCATCGGTTTCAATTCCAACATTCCCGCTTCTCTATTTATGCTTCGTCGCTTAGACAATGAAGCACAAACCAAGCCCGCTAGCAACTTAAACCCAAGTAAAACTTCATTGGGTGTTGATTGTTAATTATTAGGAATTAATTGTTAAAATATTATAAGATGTGTTGTGTGATGTTATGCGTTAGGTTGTTAGCGTGATATACATGTTGATTTGCTTGACGTCTTTAAGACGTATTTTTAAATAAAAATATAAAGATAAATAAAAGAGAATAATGATATTAAAGAAAGGATAAGATTGAGGATGTTGGACTGTAATGGAACTGACGGGTTTATTACAGGTCATTAATCGCTGACGAGCAATGAGAGGAAGGATCGAGCTACGGGCCGTGGTCTTCCATAATTAGGCTTGAGGAGCCATAAGTTAACGTATGTTAAAAACTAAGAAAAGAAAGTAAAAGATCTTGCGGTGAGCAAGACGGAAGCTTGTCTGTTATAGCTTACTAGGAAAGTTTAAGCTATATGCTTGTTGTTTGAGTCTATGCTTATGAAATAGAAATTGTGTGAAAGTATAATCGTGTTATTGTGATTCGGTGGACAGTTTTGACTGCCTTCACTGAATAATTAATTACTCACCCCCTTTTCTTTTCCCTCAGGTGAGGAAGAGAATGTTGAGTAGCTGCTCGCTTGGTGTTATTTCGGGGACTTTGGGTTTTATTTGATTTATCGTTATTTCTTATATTTCTAAACATGGTTTCTTTATTCATTTTTATCCAACGATTTTAATTTATTTATGCTATTATTTTGAGACAATTTATTTCTGATTCTTAATAAAAGAAAGTTTCCCAAAATTTTGATATTTTATTTCAAGATTTGTTTTGAAGAAATTGAATAAATGAATGGAAAGGATGAAAGTACGCCGTCTCAAGGTTGAGAGAGACGGGTATTATAGAGGGACACCTCTGAAGACACTTTACACCAAATGAGTAGTCGTATTCATTATTTATAACTAATATATTTATATCAATATTATGAGATGTCATCAGTAGCGGAGGCAGAATAGTTAGTCATAGGAGTCATATTTTTTTCTAAGCCAAATACAAAAAAAAAAGTTGAGAAAAAATGACAATATCATAGTTTAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAGAAGATAAAATGAGAAAGAAAAAAATTGTTCTGGTAAAGTAAACACTAAAACTAAGGTAATTTATAATGTGTTAAACAATAATAATGAGATTAACCTAGTTTAATGGACTTATGTTTTTATTTATAAAATTAATTGGGTTAACATGCTGTAGGTTTTATTTTTTTATTAGACTATATTTGGATATATATATTTGATGGGGGTTAATAATACTTTAGGAAAAGGGTCAATCTATAAAAATTAACAAAAAATAAACATATTTTCTAAAATCCATGGAGT
CAATTGACCTCCATGGTTAAACACTCCCTCCGCCACTGGATGTCATTGATAATTTATTTTCTACCATAAAAGTTTTGTAACAATTTATAGCCACGAAGACTTTCACGTTTTCGCTCAATTCTCAATATTTCAGTTTTATATTATTCTGATTTTGGGTCCAAATGAAATTTAAGATCACAATTTATGGTGTTACAATTGACTTCTAGGTGTAGTTTTCAAATAAATTTGGAAAGTGTTTCACTTAAATACCAAAGAAACGTACATGCATGATGTTTTGAATTCCTTCTTTTATCAAACATGTTCAGCTTGTCATTAAATTCATTGAAAAGTTCACGTATCCTTTTATGTATTTAAAGTTTAATTTATTTAAAAGTAAATAAGTAATGTTAAAATTGTCATTATATATTATCTCTTAAATAACGTAAAATTTCTAAAAATTCATATTTGTGGGACGGAAGAAGTTTTTTTTTATAATAATAATTGTTTTTATTTTCTTATTTCAAAATTTTTACTAAGAACATAAATAACTAAAAATAGTTATTAAAAATTATGTCAATTTTTGTTAAGTTAGTTTAATTATAGTTGATATTTTAACAATTTATCTACAGTTATTATTAATATGCAATCACAAAAATATAAATATATAAAAAAATATAAAATTGTAAAATAATTAAGATAGAGTGTTGAATTTTATTAAACAAAACTAGTGTAATGTTTTAAAAAGTAAGTGGGTGTTGAATGATAATGTGGAAGAAATAGAAAATGATGTGGAGTCTTAAAAAATGAAGCTTGAAAATATTCTAACGGAATGTAAGAGTAAGACCATCTTCTGTTAAAGTTTGGTTGTTTGTTGTTAGCTTCCAGCATCTTCCGGCACATCTACAAGTAAAAAATAGAATGTTTACGATTAAGTTAGGTTTCATCTCTTATTAAAAGAAATGACCTTTAGAGATAAAGTAAAAAAACGGTAATGTTATTAAGTACCAACAAATATCACCTGTTCATCGGCCAACACCAACTCAAGCTTCTCGCTGGTACTCATGGTATATTAGCACCACAATTATAGGATTTATACTTGCACTCAGCCACGCAGTTTTGTATGGGTGTAAGTCCAGATAAACGAAAGAAGCAACCATAAAAATGATAAATGTTTGTTTGTTGGTTATATGCAATAGTTGCTTTCAGATTTGGTGATGTTAGAAGATGCAAATGATGGGATTATTTATAGTGGTTTAGAAGTCGATAGGGGATGGACATGAGTTAGTAGAGAAAATCTTGGTGAGCAAGCAAAAAAAAGAAAAAAAAATCACCATTATAAAATAAAATAAATGATTTAGAGACATAAAAATCTTTTTAATCTCATAAATTTCTGAATTTCGTCCAGATGTATTTTACTAGACCTGCTTGTAATTCATGATGTAAATTTGAATCACGTAACTCGGATCTAGCACGCACATGACTTGCAAATTCTGGTAACACCTCAATTGAGAATGGTTGTGGTGTACTAGAACCACTTGCCTCAGATTGATTATAATCGGACCAATGTTGAGCATATGTCTCTCGTTCATCATTAACAATCATATTATGCAATATGCAATGTTGAGCATTAGGTGAACGATCTAAAACATTTAATTATATCATTCAATGTGCCTGGACACCTAAAAAAGGCATGCCAGATCTTTTGATCATGAGATGCAACTCCTTCAAAAATAACAATGGTGGTTCCCTTATCTCCCTGAGTAAATTGGTCTTCCCACGCTGTATGAAATTTTTTCTACTCCTAGTGCATGCAATCAATACTCCCAATCATCCTTGAAAACCCCCACAACTCGCTAACACGCAGAATTCTTTGCAGGTTGTCTTGAGGCGGAGCTCTAAGATAATCTTCTTCAATTTTGTTGTGACACACTCTAATCCAGTTGATGATATACCTCACTTCAATATGAGATTATCTTTTATAAGCTTCGATATTGAAAGGAAATTCTGATTGATCCATTGGA
TTTTTTATTTTAGTAAGATGATCTTTGTGATATTAATTCATTAATAGAAGAATGAGTTTTCATTTATAAAAAATAGAGTGGTTGAAAGAGAAGGATAAGAGAAGGATTTGATTAAAAGATCATGTGGTTGAAATCCAATACTCAACAATTTTACCCCAGTATGATTCACTTTTTTGGTTTTTGCCAACAATGATGTATGTTCCATAATACATCCACTTAATAACACTCAAATTTTGCTCAATTCTCCATTTGAGGCTTTTCCGGCGAGTAGAAGTTGATACATCATTATTTGGAGTATTTTCATTAGCACTGGTCATACTTCCAAGAGTCATTTGTGTTGAAAATCCATGAAATTCAGGAGGCAGTTAAGATGAATATGTCATCATCGATCCATAATATGGATGATATTTTGGAACAGATGATGACATAGAAAAATTTGGTGGTAAACTATAATTTGGGACATTTTGAGATTGGTTGAAAGATGGACTTTGAAATTGATAATTATTGGGATTTAAATAGGGAAAAGGATAATTGGTAGAATTTTGGATAGAATTATTGTTGGAATTTGGATAGGAAAATGGAAAATTTATAATATTTGTGAAGGATTATTTTAGAATCTATTTCACAAAATAAAATAAAAAATAGAAGCAAGAGTTTATTAGAGGATAATAAAGATATTATGATAGAAATGGTGTTTTTTGTATGTATCTGAATGAAATGAATCAAGTTTCCTTTTATAGAGCTTAAAAAGTAATAAATATCCATATAAATGTTTTAAATTTTTTTTTATTATCTATATATTCATTTACATGGGATTTTTGCGTTAATTCCCTTAAACCCGGCTTTAATTCATTTGGGTTGGGTTTCGATCCGGTTTTATCGTATTCAGATCTTGAATAGGATATTTGGGTCGAGATTTCTTTTGTTCGGATCGTGTTTAGGAATAACATGTGCATCTTTAATCGAGTTAAATTCTTCTTTTAATCCACGTAATTATTTCCTTAGATTCTGTCCACCATATTCGGCTTACTACGACTTATCCTTATATATTTGCAATCTTAACAATTATATTGCTACCTACTGAATCTACATATACATTTTTACAGGAATTTTAGCAATTAAATTCTCAAGTTAGAACTTATTTACAAGGAATACCATTGACATTAATTATTATCATTTAATTAATATTCCTAATTATTAGCATTTTCTTATTTAATATATTTCCATCAATTCTAATTACTTTTAAAAAGGAGAAATCTTAGGACTTTATTAATATTATACTTTATTAAAGATAAATACTATAGTTATTTAAAGTTTATAAAATGTTTAAAATATTTAACGAAAAAACTTTTAGAATATATATATTATATAAAATCTATAAAATTAAATAACCATTTCAAAATAAAACTTTTAAATTGATTTGAATTATAAATTTTTTGATAAAAATATTATTAAAACAAACAAAAAAATGTTTAATTTTACGGAACTGGATTAGATGGTGGAACGGGTTTAGAATATTATAATGTATGTATTTTATAACAATTAAATAACCATTTGAAAGAAAAAATTTGTATTAATTTGAATTATATGTTTTTTAAATTAAAATATTATTAAAACAAAAATAACAAAAACAAAATGTTTAATTTCATTGCACGGGGTTAGATGGTAGGACATGTTTGGGTCGACAGTAATACGAGACGGTATACCACGAGTGAAATCCATTAGATATGTTTAGTTTCACTCAACGGGATTAAATGGTAGGACGTGTTTGGGTCGATAGTAAAAAGAGTCGGTATATCACAGGTGAAATCCTAGATATAACAATCAAAATACAATTATATTATCTTAAGAACTAAACAAAACAAATAATATTAATAAAATAAAGATAATTAAAATTTAAATTATTTAGTTATAATCTAGATTTTAAATTAATGAACTGTACATTATTGTTCATATATTTTTAAACAGTAAAAATCAAACATATTAATTGTATATTGAAT
AATATACATATATAAGAGTTGTACATACATAAAATACAAAATATGAAATCATATATATTCTTAATCGACTAAATAAATTAAATTTTTATTCTTAAAAGAACAAAATCGTCATGCAATACATCGCGGGTTAAAATCTAGTCTTTCTATATTCTCGTTATACTCTGCAACTAAATATACTCCCTCCGTCCCACTAAGATGAACTTTTAAAAAATTTCACATTCTTTAAGAAATATTGTATAAAGATAATTTTAACCTCTTAATATACTTTAAAAATAATAATAAATATTTATCTAATTATTAGTAAGGGTAAAACGGGAAAACAGTTTTAAAATTTGCATTGGAAATATAAAACTTCTATCTTTGTGGGACAAATATTTTTCCTAGAAAATTTATCTTTATGGGACAGAGGGAGTATTTTCTATCATTCTAAAAAGTTTAAACTATCAGAAATCTTTGTGCCACTTATCATATTAGAAAGAAGTAGCCTGTCCATTTCCCACTGCCACCTTACAAAGCTTGTCTATCTCCCTTATGCATGCACGAGGTAGTCTACAAGCTGCAAGCCAAAAATTGCATATGCTCCACAAAACCCAACTGATCAGATTTAAACGTCCAGCAAAAGAAAGAAATCGGGACGTCCAAGATTCAATTTTCCTTGTAATCTTTTATAACAGGGGAAGACAGCCAGATGCTGTGAATCGCTTAGTGACCAGAGGGAGTCCGAGATACCTCACTGGTAACTGACCAACTTCGAAAGGGAACCTTTGGGTTATCTCATGGTGGACTGAATCTTAAATTCCCGTCAGATACATTGTCGACTTTTCCTTGCTTATTTTTAGTCGTGATAATTTTTGCAAAATCGTTTAACACATGAACTATTCCTCCTATTGATATGACCTTTCCATCGGATAGGATCTTAAGGTTATCAGCAAAGCTCAAGTGAGTTAAGCCAAGACTTCCACATTTCAGATGGTAACCAAATTGTCTAGCACCTGAAGCTTTATCCAACATTTTAGAGAGAACATCCATACTAATGACGAATAAGTATGGAGAGAGAGAGCATCCCTGTCTTTAACCTCTTGCACTGTTGAAAAAAACAACTAATTCCCCATTAACTTGAACCGAGAAGGAAGACGTAGCTATGCAGAGGGTAACCCAATGAATAAAGACTGAGGGAAAGTCCATGGCTGTGAGAACTTTGGTGAGGAAGTCCCACTGTACCGAGTCAAACGCTTTTGATATATCAATTATTAGAGCGCAACGGCTAGAAATTGAGTCATTATGGTAGTCCTTGACTAATTCTGTCGCCAACAACACATTCTCTATCAATAGACGGTCCTTTACAAACGCTGACTGATTTCCCGCTATGAATTGAGGAAGAACCAATTTAAGCCGGTTTGCAATTATCTTGGAGATAACTTTATATGTCACATTGCAGCATGAGATAGGCCTATAGTCTTTAATCTCTTTCACATTTTTCTCTTAGGAATAAGTGCTAATATCGTGGAGTTGATGCCTTTAGGTAAGAAGCCTTCAACAAAGAAAGACTGAATCGCCAATACAAACTCATCTCTGGTGATTTCCCAAGCTCCTTTATAGAATTCTGAGGTAAATCCATCTGGTCCCGGAGATTTATCATTAGGCATAGAGAACAAAGCCTTTTTAATCTCAGCTGCAGTGACTTCATTGGTAAGCATCTCTTTTTCTATTTCCATACAACAAAAGGGTAGTAACTCTTGAAGCTCAGCCACTGAAATACCTTCGAAATCATTAGGAACTAGCTGCAAAAATTCTCTAAAGAACCGTTCAGCCTCTGTTGTGATTTCCTCCTCTTGTGCCGTCACAGTCCCATGTTGGCATTGAATCTCTCTAATTGTGTTCCGTGCCTCCCGCGTTGTAACAGCTCTATGAAATGCTTTATTGTTTCGATCACCAATCTTCATCCAATGTAATTTTCATTTCTGCTTCAAATATATTTCTTCCAGAGCTGCGACCTTGTC
CCAAGTGTCATACGCCTCATTTTCTTCTTGCATTGAGCTTGTGGTGGGGTTAGACAAATTGGCCTCCTGCTTCTGACACAATTTCTCATACGCATCTTTTGTTAAAAAACACATTTTGATTTTCTTATAAGAAGTTTAAACATTATAAATACTAAAACTTTATATTACGGGTGAAATCTTAGAATTAACGAGTATGAGTCAATATTAATATAGGATGATATACCACCTGTGAGATCCTAAAATTAATAATTAAAATACAATTATAAAATCTTAAAACACTAAATAAAGTAAACATTATTAACAAGACAAATACAACTAAAAATTTCAAATATTTAGTTATAAAATATAGTCTATCTTACATTAAAACCAAACAAAACAATAACATATATCTACAGAATTTGTTTTAACTAAAATATATGCATGCGGTGTATCACGGGTTCATATCTAGTATGCTACATAATAATTGATTGTAAATAAATAAGGTGAGATAAAAATCTCCAAAATCTCAATTGCCAATAACATTACAACAAGTGTGTCTCTCAATAATTTCTTTCTTTTTTGAACAAATAATAATAGAAAACGCTTTACTTGCGAGCTAGGTGTGTGAAACATCTTCCAATCATATGGTGATACGTGGCATGGGCGAACCCAAATAAATTTTTTTCTATATGTTGAATAGATTCAACACCTAAAAATCTAATGCAAATTTTTTTTCAACAGGTCCAATGCAAGCAGTTTTAGTCACATGCAGTTAAAGTATTAAATCCTTCTACTTATAAATATTTTATTCCTACTTAATAGCATGTATGTATTTTGGCAAAAAAATGCTAAATCGGAGATGAAGTTAAAATATATATTGTGCGCTCTAATATCAAATTAAGAATTATATTTCGTCCAAGCTACTTAGTACGTACATGTTGTATTCACTAGTTGTCCTTCCTTTCTTCTTTTCCATGGTCACAATTTGGTTCATTGTTTCTTCTAAGGGATTGAGCAATCACGGTTTTTCGGGAGAGTGTTTTTTGGGCAATATCTCTTTATATATTTAAGAATGCTAAAATGTAGTATTTTTGTTGGTTCTTGTTTCATTGCCAACATTGTACGAGGCGTGATGAAGGCAGTGAAGAGAATAAGGGTAGTTTCGTAGACATAGTAGTTGAAGAGCTAAAGCTAAGAGAAGACGAATAACACACATACATGTTGCTAAGAAAGGAGCGTCTTCGCAAGGGAGAAATCCGAGGTGATTCGAGCTAGGCAAAGAGGATGGAAAGATGTAATTGTGTTTTCAAATCATATATATGAAAGGAGGTGACCTATCTCCATATGAATGACATGTTACACCATAGAGATGATATTTTCTGTATTCTCTCATCTTATTCGGAAACCTAAAAAGGTATGGTGAAAAATATAAGAATAGAAGAATGAGAAAATGGAGGCTTCTTAAACTAATTTTAAATTGTATTTGCTTAATTTAGGACTTGAAAATATATTCTGTATATTTTGAAGATTAGTGAAATTAATGGGTAATTTTCTCAGACATGGAAATCTTGTTTTATTGTTTTTCCTTTATGACTTTGCAAATATAGTAGGTTTCAGGAATTTTTATGAACTATTTTATCTTCAACTAGAATTAATACTCCAAGTACTTATATATATATATATATATATATATATATATATATATATATATATATATATCATATTTAAATTCATATTAATTTGAAAGTGTTAAAAATGCCCTTGAAGATGACAAACAACTGAAACAAGACATTTGAGCAAACAACTTGAGATGCTAACAAATGGTTTTAGTAGACATCTAAACAAATCCAAATTCTAATAAGATTTATTTTGTTAGTCATGTACATATACCCTATAACCCTAATATGGAAACCAAATAAATAGGTCACTATGGATTATGTATTTTGACCAAAAAAAAAAAAAGAAGAAGATGAATAATGTATTTTTCTGTCTCTACATACAACGAAACATAGTTAAATGTT
TAAAGTTCAAAATCTACTAGAATTTGGCTACTCAGAATTATAAAAGAGATTCAAGACATTTATGTAGTACCTCTGTTGAAACATTTTTTGAGAATTTATAGTGAAAAGTGTAGTCATTTTGTGATCTTTTCCAGCTTCCTATATTTCATGCGTTTTAGCTATATACTATCCTACTATATTATTTGGGAAGTACATTTTAAAATTTAACCTTAATTTTTATAACTAATTACATGACAATGCCATTAAAAAAATCTAATCAAAGACAAAATTGTTTCAAATCATTAAGGTTAGTAAAATCATTTAACGATAATATCCATCTACTAATCACACAAGTTAATGGATATATAAACGGGTTAAATATTTTTCTGCCATTTATTAAAAATTTTCGTCAATTCATATTTGTAAGATTTTTTAAACAATAAGATCTTTTTGTTACCAGGTGGAGAATAAGTTGGAACACACTTATATAGTTTCCTTTGAAAATCAACAAAATCTTAGCCACTATATCGATTCCTATCACCATATCTCGCTGTTATAATATTTCTCATCACTATATTCCGGTTAACAAGTAATATTCCTTGAGCTACAATTTTTTTAAATAATCTTCTTTCTATCAAATAATCTATCTTAAACAATTAACTACTAACTGATTTAATTAGATCTTCAATCTATTGAATTCACCCATCAGTATTATAAATAAGCAGATAACCATCATGATGTCTGTACCTTCTCACATACACACCTATCAAAAACTTAAAACCTTTCAAAACCTCTTGGTATATTCATATTAGGATTCTTCATTCATGGAATCATTATTCCAAGGGTTTTGGGATGTCTTATGAAATAATTTTGGCAGAAGAGTATGTAAAATTTTTTGAATAAAAAGTAGTCAGCAAAACTTTTCTTTTTTTGGACTTTTTAGATAATTAATTTAGAGAATAGGGTTGGGCATATGATTAACCCATTCGAGTTCGGGTAGAACCCGTTCGAGTTTGGGATTAATGGGTATTGGATTTACTACTTAATACGGTAATTCTAAATATTCGGTTCGGTCGGGTCCAGTCGGTTTTCAGTCAGTTTGGATAAAAAGTTTCAGGCCATAAAAATACCCAAAAAAATAGAAACGGGTATTTTGTATGTAGATAGCGGATCCCCAAACAAAAAAAACTTTTAAATTTGTTAAGTTTTAAGAAATTTAGTTATATTTGAATATATTTTACTAAATTTTGACAAACATAACAAATGATTTTTGAATAGTTTAGTTGTTTTGGATATTTAGGTCCAACATTAATTGACATATTTAAATTTTTTTTTTTTTTTGTCAACCGATATAAATTAAAACTCAAAAGAGCCAATCCCGAGGGATATTGTTTACATACGTGACATGATGCGGTACGGTACGAATCTTTCGTGCCAACTTATCCGCTTTTACATTTGCACTACGAGAAATTAAAGATAAAGAGAAATTTGTGAATTCTTCCCTATCACTCTGCAACTCCTCCAAATACACTGAAAACGCCGGCCATTCGGTTGGAGAAGACACCATCTTCACCAAGTCTGAACAGTCTGTAAAGAAAGCTACGTTCTGGTTATCTGCTCCAATCATGCACTTCATCGCCCAAAGAAGAGCTTCCATTTCGGTATGTAGAGGAGATAGACTTCTACGAACGTTGGCGGCTCCCATGGTTGGCGACTCTCCAAGAGATGATAGACAGAACGTTGGAGACATATTTAGATTTATAATTATAATCTTAGATAATTAGATTATATTAAGATTAAATATATTAATATTTTGGATATTAAATAAATGTTTGGGTTTTCGAATACCTTTTTGGGTAACGGGTAATCTCCGGACCAATCGGATACCCACGGGTTTACTAAAACTCTATCCAATAAGGAAAATTTATTAAAATTCTAACCTGCCCTAACCCGATTTTTTGGTTCGGGTATTGGGTTGGTTATCTGGTCTGTTTTTTTGTCAGCCCTATTAAAGATAATCT
AATATAGGGCCCAATTAGGCCACAAATATAACCAAAATACTATACAAATACTAATTCTAAGTTAGGCCAAAAATTAGATCCTCTATTACAAACGAAACATGTTTCTTACCAAAACAACTTGTATACAAATTTTACACATTTACTTAAAACTACATATGTTGTATTTATTATAAAAATGACATTTTTAAACAAAGTTAATCCAATGCAGCATTATATCCAAATAGCAAAAAACATTGAAAAATATTATGGCATCACTTTTACACTATACTATTTTTTATGTAATTCAAACAAAGTATACAATTTAGTTTATACAAAATATTAATGCCTGTGCTATATAGCACGGGTTATGATCTAGTCTACTTAACATTTTTGAAGTACAAAATAAAGAATTTTTCGGGTCGGTTTTTTTTTTTTGTTTTACCCGGTTTTTTTGACCCACATCCTATTATTTTAAATGCTAATCAAATCTTACCAAAATTAATCGCTTTAAATACGATTTAGTTACAATTAATTATTTCCGTTCAGCAAAGTAAATCCGACTTATATGGAATGAATATATTAACATTGCAAAACAAATCCGACTTAGGTAACTTAGTATTTATCCGTTCAGCAAAGTAATTACTCGAGTAAATATTCTATTAACTACGAAATCTTCAAGTTAAACGAAATCAAAATCTGCATTCCACTACATAATTTTCGGAGATCTTAAGAACTAAATTAAAGCATATTCCTAAGCATAATTTAAAAAATCTCGCTACACAATTTCCTAATATCGCAATAGTCAAATCATGGGCGAAGATTGTGATTATCATATGTTCTCTATATAAATAAGGAATTTGAATTGAATTTCTATGCTAAGCCATTTGCCATAAAAATCTCAACAAAATATTGAATTCATTATCTCTACAATCTCGACAATAGAAACTATATGATTGTATTAAAAAACGGATTTGGTGCATATTCCTTGAATATTCGATTAAGAAGATTTGATTTAATTTAGTTAAGGTGCAAATAATTTGTTATGGCCCCAAACCTAATCAGAACTCGCCTATATATATTCTCTAGCTTTACCTCTCATCACATTATCAAACACACAAAGCTCATCACATATCTTTGGATTTTGAGACAGAAAATAAAAAATATGATTCAGGTTGAGAGAGTTACTGAATTCATCACGGAACCACAGAAGCGATGCAGTGGTTCATCGGAGAAGCCTGAAACGGCTTCAAAAGTTTCTAGAGAATATCAGAAGATCCCAATCTCTAATCTTCATAGTGAAGATTAAATAGAGAGAGAGAGAAAGAGAGATTAGATGTACATCACGTAAGATTGGCGACAAAGGAATCGCTAAGGGGTCGAGTGGTTTAATCGGAAATCGTATTCGATAATATCAATGAAGCAAAATGAAAGTAGCACACATAGGTTTGTATGGTGAGACTTGAGAGCATCTTCGACCATCAGAGAGGGACAACTTCATGAGAATCGATGGAAAAAAAAATTAGCTTCGAGGAAGAAGCAATGGTTTGACGAAAAACTAGATGGTCACAAATGATTGGTAGGCATCATGTTCAAAAGCTTAGCTTGCTCGAGAAGTCACCGACGAACGTGGAGTTGGCCGGAGTTTCTGTCATCAAAACCGCGTTCAGTTTTGCATTGCAGAAATCAAAGAAGATGCTTCGTTATTATCGATGGGGAAGAAGCATAAAAAAAAGTCTTCCTCTGATGTTAAAACTAGGCCAAGTATTTGTCATGCCCATAGAACTTGCAACAGAAAGCAACGTTAGTCTTTGGATAGAAAACAATTACGGTATTTTTTTATGTGGTTTATACATTACACTAATTATGTTAAATATTTTTCAATAGTATTAACGAGAAGCACAATCTATATATATATATTTTTGGAGAAACTTTGGGTCAAATCCTTTTATAATTTCTTATTTATACATTTAGTCCTTATAAAATAATCTGATAAAAATATTGTCTTAAGCAATTTTGACAAA
TAAAATTTAAGTAAATAACATTAATTAGTTATAGATGATTTACGGCAATATTTCCTAAGAAATAAAAAATTTGCGACATTAATGCTATTAGAAAAGAACTAAATAAAAATCTTCAATGGTATATTTCATTATTAATTCGCTTTATTCCTAAAAATATTTAAACAAAATTTAGTCATTGATTTGCAAATACAGAAATTGTATATGTAGTTATAACAAACAAATATTTTCAAATCAAATGATTTTCTATTTAAATGCTAGAAAAAACATAATAAGTTTTTAATGTCATATCTAAGAAAATCAATAAATTGATATATTATTTTAACAAATCAATATCTAATGCTAACAATAAATTAATTTGATACACGTTTTTAATTTAATGCTAATAAAAAAATAATTTGTTCTAACGCTTCCTATTTAAATGCTAGAAAAACGTAATAATTTTTTTAATGTCATATCTAAAATAAACAATAAATTGATATATTGTTATAACAAATAAATATTCAATGCTAACAATAAATTAATTTGATACACGTTTTTAATTTAATGCTAATGAAAATTAATTTGTTCTAACGTTTTTAATTATGGCATTAAAGATTTATTGTCAAAAATAAAATTAAAGTACTTGATAGTTTGTATATATATTAAATTACTTAAAAGTTAAAATTAATGTATATATAAATATAATAACAATTAAAGTACATAAACAAACAATCTTTAGTTGTTATATACTATTAGTAAAAAGAAAAATGACAAAATGATTTTTATTTTAACAGACGGGGTTATATGGTAATACGGATTTTAGTCGATATTAATAAGAGACGATATAGCACGGGTGAAATCCTAAAATTGATAGTCAAAATATAATAATAAAATCTTAAAAAAGAAAACAGACAATTATTTAATTATATAATTATACCGGACAAGGTTATATAGTATGACAGCTTTTGGTCGATATTAATACGAGATGGTATACAACGGGTGAAACCGAAGAATTAACAATCAAAGTACACTTATACAATCTTAAGAATCAATTGCCGGACAATAAACAATATTAGTAAAACAAATACAAATAAAATTTAGTTATAAATTAACCCGCGGACTGGAGCACACCGCGGGTCATATCCTAAACAATAATTTCTTTAGGATAACTACAATTCCATATAAAAAACTAAATTTAAAACAATTTTTTTATAATAATGTTATTTTAAACAAAACAAAAAACAATATAACAAAAATGTAATAATGCACCATAAAATACACACTCTATATAATGATGCGTATAATAAATATGTTTTCTTAAATAAATAAAATTAAATCAAACACATACTAATATAACATCAAAAATGAATAGATATAAAAGGTAAGGTGATAAATTAAAAATATAACTTGATTATTTAGATAAAAACGATATCGAATTAAAAAAATAATTTAATTTCTAACACAAATAATCAACTCGCGGTACACCGCGGGTCAATATATAGTTAAATTAAGGTTAGAAACTTAGAATTAAGAGATTTATAATTATAACCGGTGCCGTGGTCATGGACTCATGCGTATATATCGGTATTTTAAAGACAAAAATAACGAAAACGGCACGCAGTTTATCCCTCAACACCCGAGACAACACTTCTCGTAGTCCGTGCTTAAATTCGCCACGTAGTTCACTTTATTCAACTTAAAAAAGCATGACGTTTTGGTGCATCTATCTTCTTCTTCCCCCTTCCTCTCTTAGCTTCTCTCCCACCACTAAGGAGAAACGTTCCAAAGATCCCTCTCTCAGAAAAATCTCCAAGAAAACGAAACCCTAATGGAGAATCATTCTGATCCCTGAAACTTTTGGCTTGCGGCTGAATCGATTTCAAGATTGCAAGTATTGCCTAGTGTGAATATGCTGTTGCTGTGTGATGCTTTGGTTAAGGAAGTGACTGTTGAATGCTGAAAGGACGACTTGGAACCTTATCTCGGGTTGCATTACTCGGCAAACTTCGATATTTCTTTAT
ATGAGAAACAAGGTTACGATGATTTCAAGAACTGTGCTAATCTTTGCCCAAGATTTACATGTAAATGGTACTGATTGAGTGTTAAAAGGAAGAAGCTTCATACATACAATATACATTGATCGGATATAGTTTTAGAGTAGGTTCCGAGTTCCAAAACAAAGTGAACTATACTGAGTATTTCAACATAGAAAAGTTATAAAATTGACATCCTTTGCAAAGTAAAAGCCATATCATAACAAAAAAATCGGAACATTTAACCGAAAACAGAGACAACCCACAAAAGAAGAAGAAGAATGCTAAAATTGAGAAGCACTGATGGAGTTGGTCGAAGGGGACCAAACGGAAGGGAATATATCTTCTATAGACTGCTTACGAGTTATGAATTGAGTTGCGTCAACGTGTGATTCTGATCCGGCTGAAGGAAAGGCCGCTTCATGTGAATACGCACATGGTTCCTTGTACGCCTCTCTTTCCGAAACGTTGGCTGCAACTTCGTATGATTGTATTTGTAGCGGGCCTAGCGGCATTAGTTTCAGATGGCTGATGATTTTCTTGAAATTTTTTGGTGGAAGCGAATTAGAGATAACATACTTCGGAGGATATGCATTTTAATAACATATTTATAAGTTTTGAGTATCGCATATTACGAAAACGAAAGCATTTGAAAGATTCGAGATTTCACTATCGAAAGTGGGGGAAGACACGC\n>URS00006236D2 tRNA from 1 species \nCTCCCCATAGCTCAACAGGATAGAGCAGCCGCCTCCTAAGCGGCCGATAGAGGTTCGAGTCCTCTTGGGGAGG\n>URS0000187CC4 rRNA from 1 species \nATTGAACGCTGGCGGTAGGCCTAACACATGCAAGTCGAACGCGAAAGCCCTTCGGGATGAGTAGAGTGGCGGACGGGTGAGTAACGCGTAGGAATCTATCCTGTAGTGGGGGGATAACGTTTCGAAAGGAACGCTAATACTGCATACGCCCCAAGGGGGAAAGCGGGGGATCTTCGGACCTCGTGCTATAGGAGGAGCCTGCGTCGGATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGATGATCAGCCACACCGGAACTGAGACACGGTCCGGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCCATACCGCGTGTGTGAAGAAGGCC\n>URS00023B9165 lncRNA from 1 species \nGATAGAACACACTTCAAGCATTAGATTTAAGAAAATTTATATCTTCTCTCATCTTTTGATTTTCGGTCTTGAATTCGAGTTTGAGAAAGTTGGAAGTTAGAATCTTGACGTCGAAGTTCTAGTTTGCTGCTCTACACAAGGTCAGTAATCTCGTTCATTTGGTTCGTTTTCAAGGATTGGTTATTATAGTATGGAACATTTTTGTGTTGTTATTCTCTGATTTAAATATGCACTGAAATATGTCTTGCTGTATTTTAGTTAGAAATCAGCTTGCAACAGGTTAAATGAGTTTCTTAGATTAAGAGAATTGACT\n>URS0000F2E397 rRNA from 1 species 
\nCCTACGGGTGGCAGCAGTGAGGAATATTGGTCAATGGGTGGGAGCCTGAACCAGCCAAGTCGCGTGAGGGAAGACGGTCCTACGGATTGTAAACCTCTTTTGCCGGGGAGCAACGGGGTCCTTGCGAGGTCCCAATGAGAGTACCCGGAGAAAAAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATGCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGAGCGTAGGCCGGTCTTTAAGCGTGCCGTGAAATTTTGTGGCTCAACCATGAGAGTGCGGCGCGAACTGGAGACCTTGAGTGCGCGGAAGGCAGGCGGAATTCGTGGTGTAGCGGTGAAATGCTTAGATATCACGAAGAACCCCGATTGCGAAGGCAGCCTGCCGCAGCGTTACTGACGCTGAAGCTCGAAAGCGCGGGTATCGAACAGGATTAGATACCCTTGTAGTC\n>URS0000620B57 rRNA from 1 species \nAGAGATCATGGCTCAGAGTGAACGCTGGCGGCAGGCCTAACACGTGCAAGTCGAGCGGCAGCGGGTCCTTCGGGATGCCGGCGAGCGGCGGACGGGTGAGGAATGCGTCGGAATCTGCCTCTTTGTGGGGGATAACGTAGGGAAACTTACGCTAATACCGCATACGACCTACGGGTGAAAGCGGGGGACCTTCGGGCCTCGCGCAGGGAGATGAGCCGACGCCGGATTAGCTAGTTGGCGGGGTAAAGGCCCACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGAGTGAAGAAGGCCTTCGGGTTGTAAAGCTCTTTTGTTGGGGAAGAAAAGCACTGGTTTAATACGCTGGTGTTCTGACGGTACCCAAAGAATAAGCACCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGTGCAAGCGTTACTCGGAATTACTGGGCGTAAAGCGTGCGTAGGTGGTTCGTTAAGTCTGATGTGAAAGCCCCGGGCTCAACCTGGGAACTGCATTGGATACTGGCGATCTGGAGTGCGGTAGAGGGTGGCGGAATTCCCGGTGTAGCAGTGAAATGCGTAGATATCGGGAGGAACATCCGTGGCGAAGGCGGCCACCTGGACCAGCACTGACACTGAGGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGCGAACTGGATGTTGGGTGCAACTTGGCACTCAGTATCGACCTAACGCGTTAAGTTCGCCGCCTGGGAAGTACGGTCGCAAGACTGA\n>URS0000D14622 rRNA from 1 species \nAACAGCTCAAATTTGAAATCTGGCCTCTTCGGGGTCCGAGTTGTAATTTGTAGAGGGTGTTTCGGGCGCGATGCCGGTCTAAGTTCCTTGGAACAGGACGTCGCAGAGGGTGAGAATCCCGTACGCGACCGGTGATCAAGTCTGTGTGAAGCCCCTTCGACGAGTCGAGTTGTTTGGGAATGCAGCTCAAAATGGGTGGTAAATTTCATCTAAAGCTAAATATTGGCCAGAGACCGATAGCGGACAAGTAGAGTGATCGAAAGATGAAAAGCACTTTGGAAAGAGAGTCAAACAGTACGTGAAATTGTTGAAAGGGAAGCGCTTGCAATCAGACCGGTCCGGAGGCGATCAGCCGCTGCTCGTTCAGCGGTGCACTCGCCTCCGATCCGGCCAGCATCGGTTTGGGCGGCGGGATAAAAGTCCCGGGAATGTAGCTTCTCTCGGGGAGTCTTATAGCCCGGGTCGCAATGCCGCCCGCCTGGACCGAGGACCGCGC\n>URS0001D2993E rRNA from 1 species 
\nGCTAAGGCCCCCAATTCATGGCTAAGTGGGAAAGCAGGTGGGACGACCAAAACAACCAGGAGGTTGGCTTAGAAGCAGCCATCCTTTAAAGAAAGCGTAACAGCTCACTCATCAAGCGATCCTGCGCCGAAAATGTAACGGGGCTAAAGCCATTTACCGAAATTGTGGGCTCGAAAGAGCGGTAGCGGAGCGTTCCGTAAGCGGATGAAGCCGAAGGGTAACCGACGGTGGACGTATCGGAAGTGCGAATGCTGACATGAGTAGCGACAAA\n>URS000241757C lncRNA from 1 species \nCTACTAAAAGCATACTGCATAAACAGCTTGAGAGCATCATTGTTGTTTAAAAACTCGGGCTCATATATCTCATCACCAAGTCTGCTTAGTGACTGTTTATCTCTAGTTGTTATAATGATTCGACTTCCGCCACCAAATGAAGGTTGCTTTCCAATTAAGGCTTCAATTTGGGATGAACTCTCCACATTATCCACAACAACAACAACAACAACAAAGCCTTTTCCCACTAAGTGGGGTCGGCTATATGAATCCTAGAACGCCATTGCGCTCGGTTTTGTGTCATGTCATCCGTTAGATCCAAGTACTCTAAGTCTTTTCTTAGAGTCTCTTCCAAAGTTTTCCTAGGTCTTCCTCTACCCCTTCGGCCCTGAACCTCTGTCCCGTAGTCACATCTTCAAACCGGAGCGTCAGTCAGCCTTCTTTGCACATGTCCAAATCACCGGAGCCGATTTTCTCTCATCTTTCCTACAATTTCGGCTACTCCTACTTTACCTCGGATATCCTCATTCCCAATCTTATCCTTTCTCGTGTGCCCACACATCCCACGAAGCATCCTCATCTCCGCTACACCCATTTTGTGTGTACGTGTTGATGCTTCACCGCCCAACATTCTGTGCCATACAACATCGCTGGCCTTATTGCCATCCTATAAAATTTTCCCTTGAGCTTCAGTGGCCTACGACGGTCACACAACACGCCGGATGCGCTCTTACACTTCATCCATCCAGCTCGTATTCTATGGTTGAGATTTCCATCTAATTCTCCGTTCTCTTGCAAGATAGATCCTAGGTAGCGAAAACGGTCGCTTTTTGTGATCTTCGCTAGATTGCTCCGGTCATTAGTGTGGATAAGTATATATAAATGGATAGAGATAGGAAAGCAAACACAAGATGTACGTGGTTCACCCAGATTGGCTACGTCCACGGAATAGAAGAGTTCTCATTAATTGTGAAGGGTTTACACAAGTACATAGGTTCAAGCTCTCCTTTAGTGAGTACAAGTGAATGATTTAGTACAAATGACATTAGGAAATATTGTGGGGGAGAATGATCTCGTAATCACGAAACTTCTAAGTATCGGAGTGTGGTGTCGTCTTGACTTGCCTTATCTGTCTCATAGGTAGATGTGGCATCTTCTCTGGAAGTACTTTTTCCTCCATCCAGGGGTGGTATCTTTAACTGGTGGAGATGCACAAGGTAATGTATCAATTTCACTTGAAGCTTACTTGTAGTTTCAGGCTTGGTCAAGCGCGATACAAACCATGTAGTAGGAGTCCCCCAAGTCGCCGAGCTAGGGGGTCTGCTGAAAGAGGTGACAGACAAGGTAAGCAATCAGAGCTCCGACTGATTGTTCACCTTCTCCCCATCTTGCAGCAGCATGAAGGATAAAGAGAAGAAAAATGAGAAGAGATGATATGAGATACTTTTGCTTTTGAAGAAGTAACTTTTCCACAGGCTTATTCTTGAACTGAGCTGGAGGGTTTTCTGGTTTCCTCCAGAGTATAAGGCCGACTGAAGAATTTGAGGGTCAAAACAAGTCCATCAAATCTAGAGTACGTTCCACCCTGCTGATATGGGATACTTTTGCTTTTGACAGAGTAATGGATGTATCGGCACGTGTGCTGTTACGCTTGTCTCCACATGCTTCCTTGTATCCTTCGCACTTGCCCTATCTGTTCCTCAAGCA
GATGCGGAATCTTCCCTGGAAACATAAGATGTTGAAGATGAGTACTCGAGAGCAATGCCAGGTAAGTAATCAGGTAAGGGGTTCCAGGCAGTCAGTTCCTGGCTGGAAGCTTGATTCCAAGTGCTGACTGATTGCTCTCTTTCTCCTTGTCTTGCAGGTAAAAACAAGGCCAAAGGAAAAGACAGGGAAAAAGCATGATATGGGATACTCTTGCTTTTAACCCTGATGATATGAGATATTCTTGCTCTAGTATAGCTTGTTTGCAGAGGTATTATCGGGGGGAAAGAAAGCTGAATATTTCGAAAGGCTTCGTTGGGAGTGCCCTCTCAGATATGATGAAGGGTTGAGCATTTTTGCAGGTCTGCCTGTCCGTTGGGGATGGAGGTCGACATATATAGGAGTCTCCCTAACAACAAGTAGTAATGCTATTCCTTTACCCTGCTTGGTCATAGCACGGTAGTGGGAGCTGCCAGTTTCACATGTTTTAACTCTGTCAGAGCACTTTGAAAAAGTGGTCTGTGGTATCTGGCTCTCGAGATTCGGAGAACGATGCCTCTTCGATTTTTGAGAAAGCAATCATGCTGGGGGTCTGGCTCTCGAGATTCGGAGAGCAGTGTCTCTTCGATTTTTGAGGAAGTAATCATGTTGGGAGTCTGGCTCTCGAGATTCGGAGGGCGGTGCCTCTTCGATTTTGGAGCAAGCAATCTTGTTGGGAGTGTTGTCTCGAATGTGAGTAAAGGTTGGGCATGTTTGCTAGTCTACCTTGCCACGAAGCACAAAGGTTGACACACAGGGACTTTCCAATTATCCAGCAATGGTACTGTTCCTTTACCCTCTCTTCGATTTTGAGAAAGTAGTCATGTTGGGAGTCTGGCTCTCGAGATTCGGAGGACGGTGCCTCTTCGATTTTGGAGCAAGCAATCTTGTTGGGAGTGTTTTCTCGAATGTGAGTAAAGGTTGGGCATGTTTGCTAGTCTACCTTGCCACGAAGCACAGAGGTTGACACACAGGGACTTTCCAATTATCCAGCAGTGGTACTGTTCCTTTACCCTTGTGGGTAATAATATGGTAGCTAGACCTTCAAAATTTATGTGTCTAAACTTTGTTAGTGCTGTTTCTTTGCTATTCTTTTACCTTTCTTGGTCAGAGCGATGTAGTGGGAGCTGCAAGCTTCACGTGCTCAACTTTGGCAGAGAACTTTGGCAAAGTTATCTGTGGTACCCATGAGCTATTGTTGCGTGTGGGAAGTGGGTGATTGAACAGTAAGATTCATGTGCTTTCTACTTCACCAGAAGTCTTCGACAGAATGCCCATAATTTCTGCAAAGCTGAGTGTGCGTGTGACAGGTGCTGACAAGGCTAGAAAAGTAGGTGCCTCTTCGATTTCTGAGATCGGCCCTCGTGGTCTCTGAGCAGCCCAGCTTTTGAGAAAGCGAGCGCCTCTTCGATTGATTCGGAGAACGATGCCTCATCGATTTTTGAGAAAGCAATCATGCTGGGGGTCTGGCTCTCGAAGATTCGGGGAGCAGTGTCTCTTCGATTTTTGAGAAAGTAATCATGTTGGGAGTCTGGCTCTCGAGATTCGGAGGGCGGTGCCTCTTCGATTTTGGAGCAAGCAATCTTGTTGGGAGTGTTTTTCTCGAATGTGAGTAAAGGTTGGGCATGTTTGCTAGTCTACCTTGCCACGAAGCACAGAGGTTGACACACAGGGACTTTCCAATTATCCAGCAATGGTACTGTTCCTTTACCCTCTCTCTTCGATTTTTAAGAAAGTAGTCATGTTGGGAGTCTGGCTCTCGAGATTCGGAGGACGGTGCCTCTTCGATTTTGGAGCAAGCAATCTTATTGGGAGTGTTTTCTCGAATGTGAGTAAAGGTTGGGCATGTTTGCTAGTCTACCTTGCCACGAAGCACAGAGGTTGACACACAGGGACTTTCCAATTATCCAGCAGTGGTACTGTTCCTTTACCCTTGTGGGTAATAATATGGTAGCTAGACCTTC
AAAATTTATGGGTCTAAACTTTGTTAGTGCTGTTTCTTTGCTATTCTTTTACCCTTCTTGGTCAGAGCGATGTAGTGGGAGCTGCAAGCTTCACGTGCTCAACTTTGGCAGAGAACTTTGGCAAAGTTATCTGTGGTACCCATGAGCTATTGTTGCGTGTGGGAAGTGGGTGATTGAACAGTAAGATTCATGTGTTTTCTACTTCCCCAGAAGTCTTCGACAGAATGCCCATAATTTCCGCAAAGCTGAGTGTGCGTGTGACAGGTGCTGACAAGGCTGGAAAAGTAGGTGCCTCTTCGATTTCTGAGATCGGCCCTCGTGGTCTCTGGGGAGCCCAGCTTTTGAGAAAGCGAGCGCCTCTTCGATTTCTGAGATCGGCCTTCGTGGTCTTTGAGCAGCCCAACTTTTGAGAAAGCAAACGCCTCTTCGATTTCTGAGATCAACCCTCGTGATCTCTAAGCAGCCCAGCTTTTGAGAAAGCAAACGCCTCTTCGATTTCTGAGCAGGCGCCTCTTCGATTTCTGAAGCTCCGTCGAGTGCAGATTTTTATATAGGGGCTGGCATTAAGTTCCAAAGCACACTTGAATCTCCACCAGTAGAAGCTTCATTCTTGCACTTCTAAGATCTTGATTTGTCCGACCTCTTCTCTCTTCAACACCTTTGAAAATGTCTGGCCCCTCCGACCGTCGTTTTGACTTGAACCTTGTTGAAGAGGCAGCCCCGCCTTCTCCAGACAACATATGGCGCCCATCCTTCGTCTCCCCTACTGGTCCTCTTACCGTTGGGGATTCCGTGATGAAGAATGATATGACCGCTGCGGTGGTGGCCAGGAACCTTCTCACTCCCAAAGATAACAGACTACTTTCCAAACGGTCTGATGAGTTAGCTGTTAAGGATTCGCTGGCTCTCAGTGTTCAGTGTGCAGGTTCTGTGTCTAATATGGCCCAACGCCTATTTGCTCGAACCCGCCAAGTTGAATCATTGGCGGCTGAAGTGATGAGTCTCAAACAGGAGATTAGAGGGCTCAAGCATGAGAATAAACAGTTGCACCGGCTCGCACATGACTATGCTACAAACATGAAGAGGAAGCTTGACCAGATGAAGGAAACTGATGGTCAGGTTTTACTTGATCATCAGAGATTTGTGGGTTTGTTCCAAAGGCATTTATTGCCTTCGTCTTCTGGGGCTGTACCGCGTAATGAAGCTCCAAATGATCAACCTCTGATGCCTCCTCCTTCTAGGGTTCTGTCCAGTACTGAGGCTCCAAATGATCCCCCTCCGGTGCCTTCTCTTTCTGGGGCTCTACCGACTGCTGAGACTTCTCCTAAGCAACCTTTGTGAAGGCTCCCTCTTGTGTGTTTATTTTGACTCATGTATATGTACATATTTGTAGCTTATCGGGGATATCAATAAATAAGCTTTCCTTCATTTCAACGTATTGTGTTAAATACACCAAAGCCTTCTTCGCTAAGTTCTTTGAATTTTCTTTTGTTGAAGCTTGTATGTTGAAGCTTTCTGAGTGGAGCATGTAGGTTGGGGTAGTGTTCCCTTAATTTCCCGAGTGAGGAAAACTTCTCGGTTGGAGACTTGGAAAATCCAAGTCACTGAGTGGGATCGGCTATATGAATCTTAGAACGCCATTGTGCTCGATCCTGTGTCATGTCCTTCGTTAGATCCAAGTACTCTAAGTCTTTTCTTAGAGTCTCTTCCAAAGTTTTCCTAGGTCTTCCTCTACCCCTTCGGCCCTGAACCTCTGTCCCATAGTCGCATCTTCTAATCGGAGCGTCAGTAGGCCTTCTTTGCACATGTCCAAACCACCGTAACCGATTTTCTCTCATCTTTCCTTCAATTTCGGCTACTCCTACTTTACCCCGGATATCCTCATTCCTAATCTTATCCTTTCTCGTGTGCCCACACATCCAACGAAGCATCCTCATCTCCGCTACACCCATTTTGTGTACGTGTTGATGTTTCACCGCCCAACATTCTGTGCCATACAG
CATCGCCGGCCTTATTGCCGTCCTATAAAATTTTCCCTTGAGCTTCAGTGGCATACGGCGGTCACACAACACGCCGGATGCACTCTTCCACTTCATCCATCCAGCTTGTATTCTATGGTTGAGATCTCCATCTAATTCTCCGTTCTTTTGCAAGATAGATCCTAGGTAACGAAAACGGTCGCTCTTTGGCATTTCTTGATCTCCGATCCTCACCCCTAACTCGTTTTGGCCTCCATTTGCACTGAACTTGCACTCCATATATTCTGTCTTTGATCGGCTTAGGCGAAGACCTTTAGATTCCAACACTTCTCTCCAAAGGTTAAGCTTTGCATTTACCCCTTCCTGAGTTTCATCTATCAACACTATATCGTCTGCGAAAAACATACACCAAGGAATATCATCTTGAATATGGGGTATGGGCGGTATAAACTATTTTAAAATGTAAAATATAAAATATAAAATTAATAAATAATAATTAATAAAAATTGACTGTATTATGTACGATGAATAATTACGATCACGGAATCCCTAGGATCCCAAAAGAAAAATTCGGTGAGAATCCTTTTCCAGAATTTTTAATCCAACCGTTTCTTGTGTTAAATTTATCCCAAAAATTAGTTTTGACCAAAAATTGATTTTTAGTCCAAGGGTTGGAGCAAATTGAGAGAGTTAAAAAACTAAAATTTAAGCTAAAGTCCAAAGATTTGAGTTAGTCTAACAAATACAAATGAGAGAAAGTAACATTCATATTTTATTGCGGCTTTTAATTTTTATTTAAAATGGTATCTAAACTTGGTATAATTACTTACTTTTAAAATTGATAAAAATGGTCTTTGAGATTGTCTACCATCAATCATTTTGGTCATTCTGTGAAAAATCTTAATTAAATTAGAGGTATTTTTATCAATACCTTTGAATTGATGATTTCTTCAATTTAATGAAATATTTTCACAAATCATGGTGCATATTATTGGTGGTCCTAAGCTCCTTTATATGTGTAGCGTATGCTTATGTCATGATCTTTCTGCTTCTACTAAATATCAGATGATTTTGTTTTTACTATTTGTTTTACTTTGTACATGGGGTGGCTTTTAGGTTCCCCTGTTGTCTTACTTGCTATGTTATTTCCTCAACAAGGTTTGCTTTTATGTTTCCCTCATTTGTAAATTTCCTTTTTTTTTGTTTTTACTTTAATATGATAATGGGATGCTCGGTGAGCACTATTACCCCATGATTTTCACGCATGCACACAAAAAAAAAAAAATTTATCGTCACAACTAGCATATTTATCAAAATACTCGAAAAGTTAGAGTTTCTAGTCACAACTAACATTGCCATATAGTCAAAATGCTCAAAGTATAGAAAAGAAATATAAAGAAGATATCAAGTTAGATCAGTTACATAGAGAGAGTCATTCCCATGGGATTGCATGATTTCTCTATCATTGCAATGTATTTTTCATAAAACTTCCTTTTCATGATTAGGGACTACGATCCTTGGTGCTATAAATTCAGCAGTTGACTCAAGCACAGAAGTTATCTACAGTGAGAATCCTGATGGTAATTTTGTAAAGTCAAACAACTTTGCATATGCCATTGTTGTGGTTGGCGAGTACCCTATGCTGGGACTGCGGGAGACAGCCCAAACCTTACGATGGCGGAACCTGGCCCAAGTGTCATCAGCAATGTGTGTGAAAGTGTAATGTGCATTGTTACCATAATAACTGGAAAACCTATTGTAATAGAACCATACTAGAAATTACGCCCGTTGTTGCGGAAACCAACTGTTACAGGCGTAATCGAATTAATAAAACACATTTAAGTTGAATAAGAATGTCCCCATGATTAGTCTTCTCGTTTATTTTTCACAAACCAATCACATATTAAAAATCCAAGTACGAAAGCTTTGCAAAGATAAATAAAAAATTTATATAACTAATTAGACTTTGAACATGCAATCAAGGCACATACTCGTATACCTAAAAATAGCAAGGAACCGGC
TTCTTCCTCCCACAACCAGAGTTCCTGAAATTTCCAAAGAAAGTAAATCCGTTAGCAATTCAGAGAAATTGGAAGACCAAATCGTATTACATTTGAGTTAAATGAGCAAAGGTAAACCAATTAAATGAGATACTAAACACATTTCGAATCTATGAAATAGAAGAATAATCATGTTAGGACTCCCAAGATGGTGTCCTAAGCACAAAATTATAGGTTAAGAAAGGTAAATCCCAATCCAAAGCTCCAACCTTTTAACTGAAAATGAAACAAAAAAGCATGGATCATATATTTCAGTTTTATTATTAGATTTTCTAAATCCCCAATTTGAATGTGTTGTAAAGACCTGCTAAAGATAATACCACCAACTAAGGGTGGCAATCTGACCAGCGTTGTGCATGTCATGTCGACTCTATGCAACTTAATATATAACATTTAAGCAGCATTAGACGGTCTCCTAAGCATCTACAAACCATTTAACATTATTTCCCCAATTTTATTTCCCAATTTTATCAAATGCTGCATAAACGATCACAATTTACTCCCTTACAATTTCCACCTAACTCCGAACAAACAATATTGATAAATCTTTATCATCACCTTTAACGAAACAGATTACAGCGAAAAGAAAAAAAAAGTTACTATGAAATCAAATTCTTCTAGATGTCCAACCTAACCCATCTATGGGAAGGCAAGCAATCGGACGTGCATTTAGACCAAGCAAAATAAATTTTACAATTTATCAAAACAGCAACTGATTCTCCCAAAGAGAACACAACATACCAACATATTATTCACCATATTCTAAGCTTTCATTTTCGTTCTATCTCTTTCGTTATCTAAACTTATAGTTATCAAAACAGCAATAAAATCATAGACAAACCTTCAATCATTTATCAAAACTGAATTAATTAAACTTCTGCTCCGCAGTCCGTTAATTTTAATTGCAACTCTCATTCTAAAAATTTAAAATTTTGCATTGAATAATCAAACGCACTTGCACGTTACATTCCTTTTATTGGTTCTTGACATAATACATTTTAGGATTGATGTAATAATATCACTACAAACATGAATTGCGATAGATATAGAAACCAAACTTGCACACAAATGTTTGACTGAATTCAGAACCACTTAATTCAACATAAAAAATTACCTCACATGCTTGCTCCCCTTCTGCTCTCGCATCGTCGGCTCCGCTACTAAACGATTAATGAAGTCCCAAAGCAAAAACAGAACAAAAAACATTTACCAATCCAACATTTCAACACATGGTTTTGGCAGGTATAACATTTCAACATAAGCATGATATAGAAAGAAAGAAATCCACATGTCACTTTGTTTTTTCAGAATCAACAAAAAGGGCAACTAGAAGAGAATGTAACCAATTTTAAAGAGTAAATCAGTCTCCCAATAAAGGAGAACAATGCTGGCGGTAGACCAAGAGTAAGTACAACCCGACTGCAGCAACAAAAACACAATTGACTTTCACACTACAGAAATAAATAATAAAAAAACACATACCTGCACCCAATGCATTGTTTTTTTTTTCCTCTGCAGTATAAGAATAAAAAAGAATAACATTCCCCTGAAACCAAATTCATCCCCCAATTTCTTGCAACAAAGAGGGAGACCAACCTTGTGTTCTTGGAGAACAGTATAACAATTAGACACAATCAGACTAATCCAAGTTCCCACTATGATAATGAAAAATTAAAATTAATAAAATAGCTCAAATCATATCACAGTATGTCACAAAGTACACCATTTGATAACCAATAAATTTAACAAAAATAGATTCAATAGTCTATATCAATTAATCAATAGTCTAAAGTATGAAAAAAATTGATTTCAAAGCCTTCCTTAGGAACTTCACAACGTATCAACAGACATTATGATATCGATGATGGTATCCATGAAACCCCAAGCTGCAAGCAAATACTGCCTTTGGAAATTTTCAATATAAATGGTTTTGCAAACCAGCCACTAATGAAACATCTAAT
TTCAAACAAATAATAAAAGCTTTCTTTAACTGACACATTATCCTTCTTCTTTCCTCCCATTTACTTCCCACCCTCCCTATTAATCCCTCCATTTTGAAACTCCTATATTCTTCCTATTCTGTACAAAACCTGCCAAATCATTTCCTCACTTCTCAAAACCCAAATAATCACTTAAAATGCACAAAATTACAATTAAATCAATATTACATTACACAAAATGACATTCAAAACCACAATACACTAAAACCAAGCGTGAATTCTACACCCTCAATAAGTGGAAGCATTCGTACCTCAAATGAATTTGCAACTTAATTTTTTGCTGAAAAACCTTGACCTACAAAACCAAATTACATTTAGGGTAAATTACAAAAAATTATCTCAACTATTGGTGGCACGACACTTTCATACCTCATCTTTTAAAATTGACAATGTCATACCTCATTTTACGAATTTATGCCAACGTTATACCTTCCGTTAGCTTGGCATAAATTTCTCAGTTAAATGTTGATGTGGCTTGATCTGGGGCCCATTTTCTGTTAAAAAAATTATTAAAAACTAAAAAAAATCATTTAATTTTTTTTAAATATTAAAATAATAAAGAAAAGTTATATAAAATAAAAAAATAAAAAAACCAACCAACACCCAGTTCGTCCCCTTCCCCCCCCTTTCTCTCTCCTCCCCATCTTCATCTTCTTCCCCCTTCTTGCAACTGCAACCCAGAAAAAAGAAGAGAAAAAAAAAACCAATTTGTCTTCCCCACACCCACTCTCCGCACCCATCTTCATCTTCTTCCCCCTTCCAATTGCAACCCAGAAAAAAAAAAAAAAAAAAAAAAAACCAATTTGTCAATTTTTTTTTTCTTCCTCCTTTCTGGGTTGCAGGAAGATGGGGAAGAGAGAAGGGGGAGGGACAAACTGACCTAAGGTTTTATTTTATTTTATTTTTATTTACTTTTCTTTATTATTTTAATATTTAAAAAATACTAAATAATTTTTTAATAGAAAGTGGGCCCCGATTCAAGCCACGTTAGCATTTAACTGAAAAATTCATGGTCAAGTAACGGAAGGTATAACATTGGCACAAATTCGTAAGATGAGGTATGACATTATCAATTTTAAAAGATGAGATATGAAAGTGTCGTGACACCAATAGTTGAGTTAGTTTTTTGTAATTTACCCTTACATTTATCAACAAAAAGGAATCAATGTAAGAAAGCAAACACAATACAGAAAAAATGGCCATTCAAGTCAGCTCTATTTAGATTATAATAACTCTCAATTTAAGAAAGCAAATGCAATACAGAAAGCAAATATAATCCAAATTACCTTGAACACCACCATCATATTTTTACTCCGTTACGTATACATGTCCTTTTCTTTCTAGATAAACTTTATTTCTTTGAAGTTTCTGCAGGGTGCATTCCAATTTAACCCTTTAAATGTTTGTATAAAACTTAGGGTGCGATGGCAAGTGCCTTCGCCCATAAACGGTAGATCTCGGGTTCGAGACTTGGGAGCAGCCTCTCCATAAATGGGGATAAGGCTAGCCGACATTCACCTCTCTCAGACCCTGCGTAAAGCGGGAGCCTTGTGCACTGGGTACGACCTTTATATTCTCGCCTGCTTGCAAGTCAACTAAGTCAACTATTCAACCTTCACATATTGTTTATTAGTTTTCTTGATACTAATGTATGGAAAGGGCTTAAATCCTTCAATGTATGGAAAGGGCTTAAATCCTTCAATTATGGATATACTAATGTATAATCCTTTGTTCTAGACCAATTTTGTTCTTAGTTCTTAGTTTTCTTGATACAAACTTTTTTTTTTGTATTAATATAAATTTGTTTGCACCAAGGGATGGGGTGGGAACATATCTTGAAATATGGCCACGTCCACATTTGCAGCTGAAGAACACTTCAATATAAGTTTAATTTGGTGCAACTTTAGGTTTAATTTGGGTATGTTCCACCACTTAAAATTTGCAATACTAATTTTGAACAA
TGAATAAGAAAATTCTACCAAGAGAGAGTAAAATAGTAAATCAACTTAATTTCTGTAAAAAAAAAAAAAAAAACTTGCAAAAATTTCATGAAATTTTGGTAAAAACGGAAAAGAAAAGGGTTAAGACAATCAAGACTAATGGAAAATTTGATATTGTTTTAACATTAACTTAGGTTGATTTTGTTCACCAGCATTAATAAAACGAATGACTTTAACTTGGGCAAGCAAACAATTAAATTAGACGTAAGCCAAGTAACTTAGAAGTTAACCATATGAAAAAAGGAAAACTAATGAAAAAAGCTTGAAAACTTTGAGTTTTAATGATAAGGACAAAATAAAGGGTAAAGTGAATAGTACCATGATTGACTTTTTAGTGTAAAAATGTGGTTTTTCGTTAAAGTGAATAGTACCGAGTGCTTTTCGTTAAAGTTCCCTATGAAAAAAAGCAATGACAATCAAACTGACCTCTTCTTTCATATGAAGTATAATCTGTTCTCTATTTTGCCTTTGTGAAGAATGCACTTTTCACTTCCTACACACAAAATAGCATACATTGAAAATGCTCCGTAGCATTATAAAAACTATAGATATACAGTACTGTATATGTATCATATACTATATTGTGTACGTAGTTGGACATAAGGTATAAAGATTTACTAACATAATTAAGCTTAAATTTAACAAAAGAAGTAATTACAAATTGAAATCAAACGATATTCTAGTTATTCAAAAAAATTCTGGCTAAATTTTACAAATAGTATTATAAATTGTTAAAAAAAATAACACAATTGAAAAAACTCACCACTCAAATCTGCAATTCTATTAAAAACACATCACTAAAAATTAACTCCAACAAAAGGGGATTAACAAATTATACCTTTTTAAGAGTTGGAATTGTTTATCTATATCTTGAGCTGGACCCGCTGGATTTGAATCCTCAGTTGACTTAGAGGGAGGATAGGCATGAAAAGAAGTGTAAGGTTCACTGGATCATATTTTTAAGAGATAGAGAGAGTTCTACTTTTCAACAGCGGAGAGAACATATTCAATCTTGGGCATAAAAAGAAAAAATAGAAGCTTCATAGCACAATAATTAACCACAATCCTCTGTTTTTCTAAATGCAAATAGAAAAAAGGAATCAAAATATTCAACACAAAATCTTCACATTAGCTCAAGAACTATATTATTTCCAGTGCTTTCCAATTTTCCAGCACGGAACAACAAACATAAAAGCATTAAAAATATATAATTGCAAAAAAAAAAAATAGCAATTCCAAGAAACTAAATGCGAAGTTAGCCAGATCTGCACAGTAACACAAACCCATTACTTGAATTAAGAGCATTGTGGCTCACCCTGAAAACACCCATTTTGCAATGAGGAAGAGAGACACTGCTGCTCTGGCTGCTGAGTGCTGCTGGCTCCAAAGCAGTTTGTCTACCAGAACTTTATAAGAGCAAGTCCAACCCTTCAAAGCCACTGTAAATCGCCAAGGATTTACATCATTCTGCTTGCCTAAAAAAAGCAAACAAAAAAGAAAAAAATGGAAAGTATAAAATTCAAATGACCCTTGATGAACATAACCCATAAATTTTCCTTGTATTCCATAAATGCAATAAAACAAAAGTCAGTGTCTCCATTTTCCAAAAAACCAAGCAAGCAAGCAACAAATTTCGAAAACCCTAATTCTAACCAATTTAGAACTATAACCAAGTAAACCACTTAATCAACAAAACTCACTAATTTTCTCAAAAACCCAACAAATTTAAAGGATATCCAGATGATAAATCCCAGTAAAATCCCAAATTTGAAAACCAGAAGAAAAAAAAAGACAAAGAGGCTTATCTTTCTTCACTAATCGGGCACTAACAGAAAAACCTTAATTCATATTATTCAGATTACAAATACACAGGGACCAAATAGCTAATAATGCTGGACAATTTGTCCCCAATCCAACACAAAAATTGTTCTTGTTATACATACGATACCCGCCTAAAATAT
CAACCAATTCCAAATTAAAATGGAAAATGAAACGGAGCATCATAAATTGAATACAATTTGGAGAAAATTATCTCACTTGGGGCGCCGAATCTCCAAGAGGTCCCAATCCGAGCAGGCTCCAAATTGGGTTGTTGAAAATGGTGATCAAGGAAGGGTTTTGGAGGTGGGTCTGATCAGAACAAAGCCGAAGCCATTAGGTTTGGGGGGAGAGGAACAAAGAGCCACTGAGAGAGAGAGAGAGAGAGAGAGAGAGCATGCGTTGTCCTTTTCTTCTATCCGGCCACTGGATCGCAGTTCCTTCACAAAAATTATACACGTGTGTTACTTTTTCAAGTTCTAGTTTTGTAATCACCTAATCGATCATAACACCATTCGCAAATATGACAAACATAAACAATTAAGTCAGCAACATGATATGCCATTCCTTTCATATTGCACATATAAAGAAAAAAGAAATGAACCAAAATAAAATTATACTATAATCCAATTATATGAAGGCCAAACTTGAGTTGGGGCTGGTGGCCGTTGACCACATCATCGCCTCCATTTGAGAGAAAAGGGTTTGTTTGGCTTTTTTGTCCAATTATTTACACTAACCATATATAAATGAAGAAGGACAACATCTATGTTGCTCCCTTCTTGTGATCCAAATTTGAAGAGGGCCGATGGGGAGGGGCAGTTATAAGTGTCATCCTCTTTGTTTCTCCTATCCCTGCATTATCAACCAAAAAAACATCAAACCAAGTGCAATACAATCCAATTTAATGCTCACAAAATTTGAGCTCCAAACAAGGTCACAGGTCAGCAATCGCCTAATCGATCATAACACCATTCGCAAACATAAACAATTAAGTCAGCAACTTGATATGCCATCCCTTTCATACAAACACAGATTGCAATTCATATATGCCGCATTATTTACAAACAATTACAAATCAAGAAACAATTAAATCATCATCATGAATTATAGTGTAATAACAGCATCATCAATTAGAAGAGACAGAGCTACATGGCAATAAACATATAGAGAGTAAACATACAGAGAGGAACTGCTTCATATCCTTCCCAAAAGCAATCTTCCGCAGGATAACAAAAGAGCGGTTGATCTCTGATCTAATTGCAGACGCAATCTGCAGAACCGACTTCTATGGAATTTTAACTTGTGAAATGTGGGGTGGAGATTTGAATGTAACAAATTGGTGTTAAGTGAATAATTCCAAACATATGAAATTTAGATAATCACATCCGAACGCAAACAGAAGAATTAAATAAAGAATCAAAGGCATATGCAATCTAATTAGACAAATAAGTGAACTTTCCCATGCCAAAATCCGAAAGGCCAACAGATATCTCTCATTACAGGACTTAATACATATCTTAAAAGACAAAACTTAAAATAACAAAAATTAGGTGAAACAATTGAAGAGAACATAATCCTTGTAACCAATCCGGAAAAGATGCTTTTAAATCCCAGAAAACAAATTATGAGAAGTTTTTAAAAAAACCATCATTTCAATTATTTTCCAGTCTTACATTTGGGAATAAACAGAAAATATAACTAAAATGCCAACTTTCTCAAAAAACTACAACTACTTTAACAAATTTCCATCACTCAACACTGAAAAATGAGAATCACGAAGCAACGAAGAACGGAACACGCTAGAAATAACAACAAAGCCTTTTCCCACTAAGTGAGGTCGGCTATATGAATCCTAGAACGCCATTGCGCTCGGTTTTGTGTCATGTCCTCCGTTAGATCCAAGTACTCTAAGTCTTTTCTTAGGGTCTCTTCCAAAGTTTTCCTAGGTCTTCCTCTACCCCTTCGGCCCCGAACCTGTCTCGTAGTCACATCTTCGAACCGGAGCGTCAGTAGGCATTCTTTGCGCATGTCCAAACAACCGTAACCGATTTTCTCTCATATTTCCTTCAACTTCGGCTATTCCTACTTTACCTCGGATATCCTCATTCCCAATCTTATCATTTCTCGTGTGCCCACACAT
CCCACGAAGCATCATTATCTCCGCTACACCCATTTTGTGTACGTGTTGATGCTTCACCGCCCAACATTCTGTGCCATACAACATCGCTGGCCTTATTACCGTCCTATAAAATTTTCCCTTGAGCTTCAGTGACCTATGACGGTCACACAACACGCCGGATGCACTCTTACACTTCATCCATCCATCTTGTATTCTATGGTTGAGATCTCCATCTAATTCTCCGTTCTCTTGCAAGATAGATCCTAGGTAGCGAAAACGGTCGCTTTTTGTGATCTTCGCTAGATTGCTCCGGTCATTAGTGTGGATAAGTATATAAATGGATAGAGATAGGAAAGCAAACACCAGATGTACGTGGTTCACCCATATTGGCTACGTCCACGGAATAGAGGATTTCTCATTAATTGTGAAGGGTTTACACAAGTACATAGGTTCAAGCTCTCCTTTAGTGAGTACAAGTGAATGATTTAGTACAAATGACATTAAGAAATATTGTGGGAGAATGATCTCGTAATCACGAAACTTCTAAGTACCGGCGTGTGGTATCGTCTTGACTTGCCTTATCTGTCTCGTAGGTAGATGTTGCATCTTCTCTGGAAGTACTCTTCCATCCAGGGGTGGTATCTTTAACTAGTGGAGATGCACAAGGTAATGTATTAATTTCACTTGAAGCTTACTTGTAGTTTCAGGCTTGGTCAAGCGCAATACAAACCATGTAGTAGGAGTCCCCCAAGTCGCCGAGCTAGGGGATCTGCTGAAAGAGGTGACAGATAAGGTAAGCAATCAGAGCTCCAAGCAATCAGTCCTAGATCAGAACTTTGATTTCGAGTTCCGGCTGATTGTTCACATTCTCCCTATCTTGCAGGCAGCATGAAGGATAAAGAGAAGAAAAATGAGAAGAGATGATATGGGATACTTTTGCTTTTGAAGAAGTAACTTTCCACAGGCTTATTCTTGAACTGGGCTGGAGGGTTTTCTAGTTTCCTCCAGAGTATAAGGCCGACTGAAGAATTTGAGGGTCAAAACAAGTCCATCAAATCTATAGTACGTTCGACCCTGCTGATATAGGATACTTTTGCTTTTGACAGAGTAGTGGATGTATCGGCACGTGTGCTGTTACGCTTGTCTCCACATGCTTCCTTGTATCCTTCTCACTTGCCTTATCTGTTCCTCAGGCAGATGCGGTATCTTCCCTGGAAGCATAAAATGTTGAAGATGAGTACTCGAGAGCAATGCCAGGTAAGTAATCAAGTAAGGGGTTCCAGGCAGTCAGTTCATGACTGGAAGCTTGATTCCAAGTGCTGATTGATTGCTCTCTTTCTCCTTGTCTTGCAGGTAAGAACAAGGCCAAAGGAAAAGACAGGGAAAAAGCATGATATGTGATACTCTTGCTTTTAACCCTGATGATATGAGATATTCTTGCTCTAGTATAGCTTGTTTGCAGAGGTATTATCAGGGGGAAAGAAAGCTGAATATTTCGAAAGGCTTCTTTGGGAGTGGCTCTCAGATATGACGAAGGGTTGAACATTTTTGCAGGTCTGCCTGTCCGTTGAGGATGGAGGTCGACATATATAGGAGTCTCCCTAACAACAAGTAGTAATGCTATTCCTTTACCCTGCTTGGTCATAGCACGGTAATGGGAGCTGCCAGCTTCACATGTTTTAACTCTGTCAGAGCACTTTGAAAAAGTGATCTGTGGTATCTGGAAAGCTGATGTTGCGTGTGAAGATTACAGACAAGCTTTATCCAAGGAGATCCAGCTCTTGAAGTTGGGAAAGTGGTGCCTCTTCGGTTTTCGAACAAGTAATCCTGTCGGAGATCTGGCTCTCGAGATTCGGAGAACGATGCCTTTTCGATTTTTGAGAAAGCAATTCTGTTAGGGGTTTGGCTCTCGAGATTCGGAGAGCGGTGTCTCTTCGATTTTTGAGAAAGTAATCATGTTGGGAGTCTGGCTCTCGAGATTCGGAGGGCGGTGCCTCTTCGATTTTGGAGCAAGCAATCTT
GTTGGGAGGGTTTTCTCGAATGTGAGAAAAGGTTGGGCATGTTTGCTAGTCTACCTTGCCACGAAGCACAGAGGTTGACACATAGGGACTTTCCAATTATCCAGCAGTGGTACTGTTCCTTTACCCATGTGGGTAATAATATGGTAACTAGACCTTCAAAATTTATGTGTCTAAACTTTGTTAGTGCTGTTTCTTTGCTATTCTTTTACCCTTCTTGGTCAGAGCGATGTAGTAGGAGCTGCAAGCTTCACGTGTCTCAACTTTGTCAGAGAACTTTGGCAAAGTTATCTGTGGTACCCATGAGCTAATGTTGCGTGTGGAAAGTGGGTGATTGAACAGTAAGATTCATGTGCTTTCTACTTCACCAGAAATCTTCGACATAATGCCCATAATTTCCGCAAAGCTGAGTGTGCGTGTGACAGGTGCTGACAAGGTTGGAAAAGTAGGTGCCTCTTCGATTTCTGAGATCGGCCCTCGTGGTCTCTGAGCAGCCCAGCTTTTGAGAAAGCAAGCCTCTTCGATTTCTGAGATCGGCCTTCGTGGTATTTGAGCAGCCCAACTTTTGAGAAAGTAAACGTCTCGTGGTCTCTGAGCAGCCCAGCTTTTGAGAAAGCAAACGCCTCTTCGATTTCTGAAGCTCCGTCGAGTGCAGATTTTTATAGAGGCTGGCATTAAGTTCCAAAGCACACTTGAATCTCCACCAGTAGAAGCTCCATTCTTGCACTTCTAAGATCTTGATTTGTCCGACCTCTTCTCTCTTCAACACCTTTGAAAATGTCTGGCCCCCTCCGACCGTCGTTTTGACTTGAACCTTGTTGAAGAGGCAGCCACGCCTTCTCCAAACAACATATGGCGCCCATCCTTCGTCTCCCCTACTGGTCCTCTTACCGTTGGGGATTCCGTGATGAAGAATGATATGACCGCTGCGGTAGTGGCCAGGAACCTTCTCACTCCCAAAGATAACAGACTACTTTCCAAACGGTCTGATGAGTTGGCTGTTAAGGATTCTCTGGCTCTCAGTGTTCAGTGTGCAGGTTCTGTGTCTAACATGGCCCAACGCCTATTTGCTCGAACCCGCCAAGTTGAATCATTGGCGGCTGAAGTGATGAGTCTCAAACAGGAGATTAGAGGGCTCAAGCATGAGAATAAACAGTTGCACCGGCTCGCACATGACTATGCTACAAACATGAAGAGGAAGCTTGACCAGATGAAGGAATCTGATGGTCAGGTTTTACTTGATCATCAGAGATTTGTGGGTTTGTTCCAAAGGCATTTATTGCCTTCGTCTTCTGGGGCTGTACCGCGTAATGAAGCTCCAAATGATCAACCTCTGCTGCCTCCTCCTTCTAGGGTTCTGTCCAGTACTGAGGCTCCAAATGATCCCCCTCCAGTGCCTGCTCTTTCTGGGGCTCTACCGACTGCTGAGACTTCTCCTAAGCAACCTTTGTGAAGGCTCCCTCTTGTTTGTTTATTTTGACTCATGTATATGTACATATTTGTAACTTATCGGGGATATCAATAAATAAGCTTTCCTTCATTTCAACGTATTGTGTTAAATACACCAAAGCCTTCTTCGCTAAGTTCTTTGAATTTTCTTTTTGTTGAAGCTTGTATGTTGAAGCTTTGTGAGTGGAGCATGTAGGTTGAGGTAGTATTCCCTTAATTTCCCGAGTGAGGAAAACTTCTCGGTTGGAGACTTGGAAAATCCAAGTCACTGAGTGGGATCGGCTATATGAATCTTTGAACGCCATTGTGCTCGGTCCTGTCATGTCCTCCGTTAGATCCAAGTACTCTAAGTCTTTTCTTAGAGTCTCTTCCAAAGTTTTCCTAGGTCTTCCTCTACCCCTTCGGCCCTGAACCTCTGTCCCATAGTCGCATCTTCTAATCGGAGCGTCAGTAGGCCTTCTTTGCACATGTCCAAACCACCGTAACCGATTTTCTCTCATCTTTCCTTCAATTTCGGCTACTCCTACTTTACCCCGGATATCCTCATTCCTAAT
CTTATCCTTTCTTGTGTGCCCACACATCCAACGAAGCATCCTCATCTCCGCTACACCCATTTTGTGTACGTGTTGATGCTTCACCGCCCAACATTCTGTGCCATACAGCATCGCCGGCCTTATTGCCGTCCTATAAAATTTTCCCTTGAGCTTCAGTGGCATACGGCGGTCACACACAACACGCCGGATGCACTCTTCCACTTCATCCATCCAGCTTGTATTCTATGGTTGAGATCTCCATCTAATTCTCCGTTCTTTTGCAAGATAGATCCTAGGTAACGAAAACGGTCGCTCTTTGGTATTTCTTGATCTCCGATCCTCACCCCTAACTCGTTTTGGCCTCCATTTGCACTGAACTTGCACTCCATATATTCTGTCTTTGATCGGCTTAGGCGAAAGACCTTTAGATTCCAACACTTCTCTCCAAAGGTTAAGCTTTGCATTTACCCCTTCCTGAGTTTCATCTATCAACACTATATCGTCTGCGAAAAGCATACACCAAGGAATATCATCTTGAATATGTCCTGTTAACTCATCCATTACCAACGCAAAAAGGTAAGGACTTAAGGATGAGCCTTGATGTAATCCTACAGTTATGGGAAAGCTTTCGGTTTGTCCTTCATGAGTTCTTACGGCAGTCTTTGCTCCTTCATACATATCCTTTATAGCTTGGATATATGCTACTCGTACTCCTTTTCTTCTCTAAAATCCTCCAAAGAATGTCTCTTGGGACCCTATCATACGCTTTTTTCCAAATCTATAAAGACCATGTGTAAATCCTTTTTCCCATCTCTATATCTTTCCATCAATCTTCGTAAGAGATAGATTGCCTCCATGGTTGAGCGCCCTGGCATGAACCCGAATTGGTTGTCCGAAACCCGTGTCTCTTGCCTCATCTATGCTCAATGACTCTCTCCCAGAGCTTCATTGTATGACTCATTAGCTTAATACCCCTATAGTTCATGCAATTTTGTACGTCGCCCTTATTCTTGTAGATAGGCACCAAAGTGCTCGTTTCGCCACTCATTTGGCATCTTCTTCGTTTTCAAAATCCTATTGAAAAGGTCAGTGAGCCATGTTATACCTGTCTCTCCCAAAACTTTCCACACTTCGATTGGTATATCGTCTGGGCCCACTGCTTTTCTATGCTTCATCTTCTTCAAAGCTACAACCACTTCTTCCTTCCGGATTCGACGATAAAAAGAGTAGTTTCTACACTCTTCTGAGTTACTCAACTCCCCTAAAGAAGCACTCATTTCATGTCCTTCATTGAAAAGATTATGAAAATAACCTCTCCATCTGTCTTTAACCGCGTTTCTCTGTAGCAAGAACCTTTCCATCCTCATCCTTGATGCACCTCACTTGGTTTAGGTCCCTTGTCTTCTTTTCCCTTGCTCTAGCTAGTTTATAGATATCCAACTCTCCTTCTTTGGTATCTAGTCGCTTATACATATCGTCATAAGCCGCTAACTTAGCTTCTCTCACAGCTTTCTTCGCCTCTTGCTTCGCTTTTCTATACCTTTCACCATTTTCATCGGTCCTATCCTTGTATAAGGCTTTACAACATTCCTTCTTAGCCTTCACCTTTGTTTGTACCTCCTCATTCCACCACCAAGATTCCTTTTGGTGTGGGGCAAAGCCCTTGGACTCTCCTAATACCTCTTTTGCTACTTTTCGGATACAACTAGCCATGGAATCCCACATTTGGCTAGCTTCCCCCTCTCTATCCCACACACACTGGGTGATTACTTTCTCTTTGAAAATGACTTGTTTTTTCTTCTTTTAGATTCCACCATCTAGTCCTTGGGCACTTCCAAGTCTTGTTCTTTTTTCTCACTCTTTTGATATGTACATCCATCACCAACAAGCGATGTTGATTAGCCAAGCTCTCTCCTGGTATAACTTTGCAATCCTTACAAGTTATACGATCCCCTTTCCTCATTAGAAGAAAATCTATTTGTGTTTTTGACGACCCACTCTTGTAGGTGATCACATGTTCT
TCTCTCTCTTCTTAAAGAAGGTGTTGGCTAAGAAGAGAGATCATATGCCATTGCAAAATCCAAGATAGCTTCCCCATCCTCGTTTCTCTCCCCAAAACCATGGCCACCATGAAAACCTCCATAGTTGCCTGTCTCCCTGCCCACGTGTCCATTTAAATCTCCTCCTATAAATAACTTCTCCGTCTGAGCAATTCCTTGCACCAAGTCTCCAAGGTCTTCCCAAAATTTCTCCTTCGAACTCGTATCCAACCCTACTTGAGGTGCGTACGCACTAATCACATTGATAAGTTCTTGTCCTATTACAATCTTGATTGCCATGATTCTATCTCCTACCCTCTTGACATCTACAACATCTTGTGTCAAGGTCTTGTCCACGATGATGCCAACACCGTTTCTCGTTCTATTTGTGCCCGAATACCAAAGTTTAAACCCTGAGTTTTCTAGATCCTTTGCCTTAAGACCAACCCACTTAGTTTCTTGTAGGCACATAATATTTATCCTTCTCCTCACCATAACTTCCACTACTTCCATAGATTTTCCCGTTAAGGTTCCTATATTCCACGTTCCTAAACGCATTTTGCTCTCTTGAACTCTACCCTTCTGTCCTAGCTTCTTCACCCTCCCCCATCTAATAGGATCAAAGTACTTCTTTTGTGTGTTCCGTGTAAAGTTGATAGGAGCATATGCTTCTAAACAACTTTGAGTGGAGTCGTTCGAAAAGAAGTTTCTATGGCCCCCTTGCTCATTTAACACTGCATCCGGGTGCCGATGGAGATACAACGACCCTTGCTCACTTATCACTGTGCTCGGGCCACACAGCGCGCCACTTACTGGTGACACCCTAGCTTTAGCGCAATTTCGTTCTGGATTCATTTTCATAAGGATTCGACGTAATCATGGAGTGCCGGCTGTCGACTACCTGACGCCCTCCCCCTCCTCCTTTATCCAGGCTTAGGACCGGCAATGTAAGATAAACTTACACAGGCGGAGTTAACGGAACACGCTAGAACTGAAACATTAAAAACAACATGTACCCATTTCAAAGACCAAAAATCCTGCAAGGACAAAAAAAAAATCCGAGAAAATCAGTACATCAGTACTCCCTGCAAAACCCCAAAATCAGAAAATTAGAAAAAGAACCCAAATCAGTGGCATGGTCCTTGTTTCTCCATTAATCAGTAGGTAATGACCTAATGAAAAAGAACCCAAAACAGACGGCTTAAATTATGGAAAGTGCTTATAAAGCTCATGAATAACTTTCAAAGCCTGCATTCCACAGTGTGCACACGCACAAACATAAAATATACATGCATAGTTAATTTTAGACAATAATACCTCAGAACATAAGTTGCAATTTGGGACTATTTGGTTGACTCAAAAGAAATTGATGGGTTAGAAAACCACAAAAAAAATACAAAGACGGATGTTTTTATGTCGTTCATTTCTTACGTCGACAAAACACACACACCTGTGTTTTAATGCTCCTCCAATACTCAATGAGAAGGCACCAGGCAAAAAGAAGGTCAAGGCTGGAAAGAAGCTTCCAAAGAGAACAATATATAAAGCAGACCACAAAAATTAGACAAAACCCAAAAACTAAACAGTAGAAAAACCTCTAAAATATATAAATATATATATAATTAAATAATTTAAAAAAAAACTAAACTGCAAATACTCTAGAAATCGTAAAATGAACTGCAAACCCGTCAATCATTTCCCAAAACCACATAACCAAAGAGTAAAAAAGGGAGTACGGGAGAGAGAAGCAGCCAAAATACAGAGAAGATGGCAAGAGAGAGAGAGAGAGAGAGAAAAATGAATTATTTTGGTGCCTCTGGTTCCTGCCTTTGTTCTTTGTTTTTCATTTATTTATAGGTAACTTGCTCAAGTCCAAAGGCAATTAAACATGATTAGTAAAGCACCATAATAAAGCATGAGAGATATCTATTTTAATTAAATCTGTTGTGGGCTCACTGTGATTGTACATCATCATCATAAAT
AATGCATGCTTGAACCCCATTTTAGTTTCATGCCTATCATAATTAAATCATGGATGGTCAAGAAGCATAGGACTGAGAAATCAGAGCCTAATTTCCAATATCAAAAGAGTACAAATTATTCAACTTAAACGCTAATTTCGTTAACGAAGATTAAAATAGGCGTGAAATCCATACAATTTATACGTTACCATTGATTCAAGTTCTGGTAGGTATCCATGGAAACTATCCGTTGCCACTCTCTCAGTTCCCATATTTTCTGTATGTTTCATTAAACAATATAAACTTTTGATGCTCTTCCATCTGGAGCTAAAACAGATTACCAATAATAACAAAGAGGTCTAAATAATAGAAATCAAAATTTTGATTTTTGCGGACTTTAGAGAATCTGCAAACTTTAGCCTAACATTATGTGATTGCCTCACTTCTTCAGTAACTCAGAGGAGGTGAATTACTCAAAGTATGGAGGACTTCTGCTAACATATTTCAAGCACTTGTAACATTAAATGTAATGACAGGTTGACATTATTATTATTTTTTTTTTGTAAAGAATTGTTGCAAGAAGTTTGACCCTTTGTCTTTTTATTTCTGTAAGGATTTATAGGTACATATAAAATCCATATTATATATGGTTCACAGATGAGAGTACTTCAAACACCAAATATTCATTCATGATTGGAGATAAGAAAGCTTACTAAGAGGCAATCGCCTTTGTGATGTTTACTTTTGTGCTTATCCTTTGTCTTCTTTTCTGAGGCAAAATATGTCAATGTGATAAGTAATTTCCCATAAAGAATATCATCCTCAATAGGCTAAACAACTACAATGGTTAGTCAAATAATGTACTTTCATGTAGTTAATCTCCTCGGTTTGTGTTTACTTTTTCAATATCAAAACATCTCGAAGAAACAACGTTTTCCCTTACTCTACAAACACCGAATGTGCCCGATAAACCACTAACAACGCCATTACTCTAATTCGACTGCAGAGTGAGAGTTAAGATAAGAAGATACTCACAGGCCAAAACGGATGACATCACCAACACATAAATCCAAAAGCCACAACCAAATTTAATTTTGTTTTTACGTTGAATTTTTTTTTCTTGAATCCGTTTGGATGCTGAGAACGTGTGGTATGGGATTATTAATTACCGGCAGGGAAAATGACGATTTCTCCTATTTGCATTTGCAGGTGGAGGAATCATAGCCGAGGGATTGCAGTTCGTCGGTGACCATCTTCCTCAAATCGTCTTTTTGTTTGAGATTCTTGTTTGCTTCGACGATCCTCGCCGTATCAGCCAGGAGGTTTCTCTCCGAGACGCTCACGCATGGAATCAGACTCTGATTAAACAATAATTAAGCAAACAATCAATCACCCATATTCATATTCTGTGTTTGGTTGCCAAGAAACCGCGAGAAATGCAAAAACAATTTACTAATAAAAAAGTGTAATCAAAGCAACCATTATTTATACTTTTGTACCTTAAGAATATCTGAGGCGTCGCCACCGAACGAACCGGAGGAGATTGAATCACCGAAACCTCCACCGAATATATCGAACTCGTCGTCGGAGCTGTCATTGCTGTTGCCGTGAAAGCAATTGCAGCGGTTCCGTCCACATTTCGGCGGAGGTTGCTTCTCGTTGCTTTCTTCGATGAAATTCTGAACCATCTTCGCCAAGCAGACCGAACTTGGCTTGAACTCAGGCCGCGGCGCTGACGGTCCCTTCATCCTTGCTGATATTGAGGCCGCAGGAGTGGCGAGTTGTGATGTGGACTCAGGCCTCTCGGCCTCTGGGTTTTACGGAGAAGGGGAAGATGGTGAGGGTTGAGAGAGATGCAGAGTCTGAAAGAGAGTGAAAGAGAAAGGGTTATAAGAGAGGTTGAGTGTGACAGAGACGATTGAAGCAAAACGCACGATGATAAACGCGTGTGCTCGGTTCAGAATGGCAAGCCCGTAAATACCCAATGACAGATTTGTAAATAAAATGAAATTCACTTCAAA
ATACTGTTCATTTTAATAGTGCCTATTGAAAACCTTACTTTAGACTAAAGTAACTAAAAATTATGTTTGCGCGTTGCTACTAGAACCAACTGTTTCAAACGTAATTGGATGGACAAAACACATTTAAGTTGAATAAATTCAAAACAATTACGAACAAACAGAAGGATACATGAGTGCATGAGGCCGGTAAGATCAGCAGTTTTGCTTTTGTACACTTGTAAGTGAGTTGACATATAAACACATTGCACAATGAGTGAGAATAAACTCTACGTGTTTGAAACTTCATTTTAAACTAACATTCACACAATCCTAATCATTTGTGAATTACCATATTCTTATCATTATTCCAATATCTCTTCATGTAGATGGGGTGAGCTCATACCAGTCACTAAGAGCATTTTTGATACTCTACTTGAATCCAACTTTTTAAATTCAAAAACAATTTTCAAGTTTTAAGCCTTAAAAACTTGTTTGGTAAGATTATTTTCAAAAATTGAACTTAAGATTAACTCAAAACTATAGTTTACTCTCTAAAAACACAAAATGTAAATTTTTAGAGTTTTTAAACTTAAACTCACTCATTTCTTTTCTCTCCCTCCTCCTCTCTCACTCCAAATCTATCTCTCTTTTCTTCTTTCTATGTCCCCCTTTTTTTTTTTTTTTTTACCTTTTTCGTCTCTCATCCAATCCGCTCTCTTCATTATCTCGATTCTTTTTCTCACTTATCTTCCTCTATATCTCCTCCGATCCTCTCTTCTTTCTCTTTCCTTCAATCATATCTTACTTTCTTTCCTCCTCTTTCCTCTTTCTCCCTCGACCCCCTCTTTTTGGATCTCTTTGTCCAGTTTAAGTTGTAAGATTTAAAAATTTTAAATTACATACCAAACAAGTTTTTTAGTCTTAAATAAAATTATTTTTCAAGAAAAATTCTTAAAAAATGTTTTGAGAAATGATAAAAAATTTCAAATAGGATACCAAACAAGCATTAAAATTGCTAATGTATTTAGTGATTATACAGAGCAACTTAACTATAGAAACGCTCCTCAAATCACTCTATACGTTTCCATTTTGCTTTTCAAATTAGCATGTTTATATATTGACATTAGAGAAAACGAGAATGCTGATGAAAATTGGATTATTAGAGGTTAAACGGCAGCGACCCCCCCCCCCTCCCCCCCCCAAATCCATTTTTGTTGGTTGACATTCTGAATATTGACGGTTTACCTTGTCCTCCTTAATTTCCTATAATCGGTAGTATAGGGGCGACATCTTGGCATTTGTTGCAGTGTCGTATCCATCTGTACCCCCCTCCACTACCTTGCTTGTCTCCTTTAGTTTATCTGTTGCTTGCCTCCCTTAACGAGCAGAAACCAAACAAGAACACCCAATTTTGACACGTGTACAACACACTCAAACATCATCAGCGTCCAAGAAGGCTAGGCGCCATATCACAGAGATCCATCTTGGCCTAGGTCCCTCTCTAGTTTCTTGCTAATCAAAATTCAAACCCAATTTTTTATTCGGAAATAAATTTCAAAATTTAGGAAATTTTATTATCTGAAAAAGAAATAATTTTCAAGGGTTACACTGTGACTGTGCTGATAAACACATGGATACCAAGCTCTGTTGTGATTGCTTCCCTTTACGTTTTTTCGCCAATCTTTGTGCACCATTTAGACATTGATAGTGATGCCAGTTTTAGCTGTATCCTCACATAAAAATTGCCAAATATACACAGATGTCAAAGATCTTGAAGTTTGGTTCACATGCTTTGTCAGGGAAGATCAATGTATGCGATTGGGTCGTCTGGAATTAGCAGTGTAAAAGGTGTTGGTATACGGTCCAGCCCATGATCAATGTTCTAGATTATTCTAGTAAGCAAGAGATGAGGCTGGAGCTTGCTAGACAATTCTAGCATGTTATTAAGTTGATGGAAGAAGCTAGAGAGTACTAGCTTCCTTGGTTGCAAATGGAAAGATCTAGAAGCTACAAGTATGTGG
CTAGTCTAGATTTTTCTATACTAGAGGTTTGAAGAAGGAACTAGAAACTAGTAGAATGCCAAGCCCTCACCTATAAATATGGGTGTGATGTAACCAATTGAAAATCAAGAAAGAGTGAGTAGCAAAGGATCAAGTCCAAAGCTAGAGTTCCACTCCAAGAGTGAGAGTGAGAGTGTTCCACTACACATTGTGTGAGTGAAGTTTAGAGTGATAGAAAGTGTGTGTTATACTTTCTTGTATCCATCAAGCCTTGTCTTTGGCTTGGTAAGACTACTCTTGTTGTATTCATTTTTTTCATATAGTGAAGATTGATCCTTGTTTGGTGGACGTAGGCATAAATTGCCGAACCACATAAATTCTTGGTGTCCATTTTCTACTTTACCTTGTGCATTCTCTATCTTGTAGTACTGACATTCCTAACAAGTGGTATCAGAGCCCGGTTGGCTCGTACTACGAGATGGAAGGAAGTGGCACTATGATCAAACTCACCAACTCCAATTGGGTAACATGGAAGCCAAGGATGGAGGACATTCTCTATTGCAAGGATTTGCATGAGCCAATTGAAGGAGATGCCGCTAAGCCCGAGAGCATGTCCGATGCCGAGTGGAAGAAGATGAATCGCAAGGCTATTGGCACAATTAGACAATGGGTGGATGATAGTGTTTTTCACCATGTGTCTAATGAAACCAATGCTCGCGAGTTTTGGACGAAGCTTGAGTCCTTGTTCGAGAAGAAGACCCCAGCCAAGAAAGCCTTCTTGATCAAAGAGCTCATCAATGTGAAGTACAAGGATGGTTTAAGTGTAGCAGAACACTTGAACAATTTCCAGAATATCATCAACCAGTTGGCTACTATGAAAATGACGATCGAGGACGAGCTACAAGCGCTCTTGTTACTTGGATCCTTGCCAGACAGTTGGGAGACCTTTGTGGTGAGTATAAGTAACTCTGCTTCTAATGGTGTTCTTACTCTTGATAATGTTAAAAATAGCATGCTCAATGAAGAAACAAGGAGAAAGACTTCTGGCACAGATAGCAGCCAAGTATTTGTCACAGAGAACCGCGGAAGAAGCAAGAGTAGAGGGCCTAGAGGTCATGGCAGGAGTCCTAGCCGATCCAAGTCAAGGTTCAGGGGTGCATGCCACCATTGTGGCAAAGAAGGCCATATGAAGAAAAATTGTCGAGTTTGGAAGAGAGAGCAAAAGGAAGGAAACAATCAGAAGAAAGATGATACTGGCAATACCACTGCTGTCATATGTGGTGATGTACCAGAAATATTGTCTGTTGGTGAATGTCTGCATATGGGCAACTCTGACAGAGACATTGAATGGATCTTTGATAATGGAGCTTTCTTCCATGCTACGTCCAAACGGGAGTTCTTCAGTACATACAAAGAAGGTGACTTTGGCATAGTGAAGATGGGGAATGAAAGCTATTCCAAAATTCTTGGAATTTGGTGATATCTGCTTAAGAACTAATCTCGGCTGCCAATTGATGTTGAAAAGATGTGAGACATATTCCTGATATACGTCTCAATCTGATATCCATCGGTACCCTTGATCGACAAGGATATTATCACCATATTGGCGAAGGAAAATTGAAGCTTACTAAAGGCTTAATGGTGGTAGCAAGAGCACGACTTTGTTGTACGTTGTACCGGTCAAATGCCAAGGTTTTGAAAGGTGAGTTGAATGCTGTGGAAGACTCATCTCTAGACTTGTGGCATAAGAGGCTAGGCCACATGAGCGAGAAAGGCCTACAAGTTTTGGCAAAGAAGTCTCATATTCCCTTTGCCAAAGGTACGTCGTTAAACTCTTGTGAGCATTGTTTATTCGGAAAACAAAGAAGAGTTAGTTTTTCTGTTCCATCTACAAAGAAAGGAAACTTGTTAGATCTTGTTTATTCAGATGTGTGTGGTCCCATGGAAGTCGAGTCACTTGGAAGAAATAAAATATTTTGTTACTTATATTGATGATGCTTCACGAAGGGTGTGGGTGTATT
TGTTGAAATCCAAAGACCAGGTGTTTCAGACATTCCAGGAGTTCCATGCCATGGTGGAGAGGGAAACTGGGAAACCTCTCAAGTGCCTTCGTAGCGACAACGGCGGCGAATACACATCTCACCAGTTTAGAGAGTATTGTGTAAAACATGGCATACGTCATGAGAAGACAGTTCCTGGAACTCCACAACATAACGGTGTTGCTGAAAGAATGAACCGAACCATCATGGAGAAAGTCAGGTGTATGTTGAGGACTGCAAAGTTATCTAAGCAGTTCTGGGGTGAAGCTGTAAGGACAGCCTGCTATTTGATCAACCGATCTCCATCAGTACCATTAGGTCTTGATGTTCCAGAGAGAGTATGGACTGGTAATGATGTGTCTTACTCTCATCTGAAGGTGTTTGGTTGCAAAGCTTTTGTGCATGTGCCCAAAGAGCAGAGATCGAAGTTAGACTACAAAGCTACACCGTGCATCTTTCTTGGTTATGGCGGTGAAGATTTTGGTTACAGATTATGGGACCCATACCAGAAGAAGTTTATCCGAAGTAGAGACGTGGTCTTTTATGAAGATCAAACAATTGGGGATTCGGATAAAGAGGCACAACCAGATGGCGCAGTCAGAGGAGTTGATCCATTAGTTTCAGATGAAGAAAGTCACGATGACATCCCTGAAGCAACTGCCAATGAAGTGCCTGCAGAATCAGATAATGCTGATCAAGAGGAGCCTGATCAAGATGTGCCAGACCATGAGATTGCTGATCAGGGGGAGCCTAGTCAAGAAGAGCAGATTCAAGGAGAATCCAATCAGGGGGAGCCTCTAGCCCCGCAAGAGAATGAAGATCAGGTCAGAAGATCCAGCAGAAGTCGAAGACCGTCTACCAAGTATTCTTCATCAGAGTATATCATGTTGACTAATTATGGAGAGCCCGAAACTTATGAGGAGGCCAGAGCTCATAACGACAGTGATAAATGGATGAAGGTAACTTGGAGTCATGATCGGAATTCCTCCCTCATGGACTGGAGGGGGAGATTGTTGGTATACGGTCCAGCCCATGATCAATGTTCTAGATTATTCTAGTAAGCAAGAGATGAGGCTGGAGCTTGCTAGACAATTCTAGCATGTTATTAAGTTGATGGAAGAAGCTAGAGAGTACTAGCTTCCTTGGTTGCAAATGGAAAGATCTAGAAGCTACAAGTATGTGGCTAGTCTAGATTTTTCTATACTAGAGGTTTGAAGAAGGAACTAGAAACTAGTAGAATGCCAAGCCCTCACCTATAAATATGGGTGTGATGTAACCAATTGAAAATCAAGAAAGAGTGAGTAGCAAAGGATCAAGTCCAAAGCTAGAGTTCCACTCCAAGAGTGAGAGTGAGAGTGTTCCACTACACATTGTGTGAGTGAAGTTTAGAGTGATAGAAAGTGTGTGTATACTTTCTTGTATCCATCAAGCCTTGTCTTTGGCTTGGTAAGACTACTCTTGTTGTATTCATTTTTTTCATATAGTGAAGATTGATCCTTGTTTGGTGGACGTAGGCATAAATTGCCGAACCACATAAATTCTTGGTGTCCATTTTCTACTTTACCTTGTGCATTCTCTATCTTGTAGTACTGACATTCCTAACAAAAGGAGGATTGATGAATCTGAGAAAGAGGATTGAAAGCAAAAGAGATGAGAAGCTGAATGGAAAACGTCGCTCCAGCTTCCTCTTTGATTCAATCTCGCCCACTGAATAAAAATGAGAGAGACAACGCAAGAAGGAACCGTTACAAACTTCACATGCATTACACACCTCTCATACTCGCAAACCTCTATCCAGTCTAGTAAGGGCTTTGAAGCAGCTTCTAAAACGGACTAAGGGCTCGTTTAAGCATAATAAAAAATTGGGTTTACACCCCCCTTGTGTACCTGGTAAGCCCCTCTTCACATTGGATCTAAGCATATATTCTTAGCTTTTGAAGCATCCGACAAATAAGGAGGATAGGTTTTTTTAGAAGTTTCTG
ACTCTTCTTCAAATAAATCCATTTTATCGGGATTAAAAATAGGAATTGGTAAAAATCTCAAAGACAACACAAGAAGGAACTGTTGCAAACTTCACATGCATCACACACCTCTCATACTCACATGTCTTGCATGTGTATATCTAAGACAAAGTCCGCTACTATGACAGCTGGCACAATCCGAACCTATGAGCTAGTCTAATCTCAACCATTTAATTTCAATTCAAACAAATAAGGACAAGACTATGGAACTTGAATTCTAAGAAATCAGCTTCAAGGCTTAATCACTAACAATACATACCTGATCAAAAAAGAAAGAAAAAACACAACTTTACAATACATACGGATAAGTAAATACTGTCCACGTACTAACCGCAGGTGAAGAAAGAAATACGCGAAAAAGCAAAAAACTAAATAGAAGAGCTCTCAGAATAAAGAAACCAACTCAAAACACAAAAGAGTGATAAACTCTACCACACAAAATCACCATTTATTCCACCTCCCATGTCCCCAGTCTTACTACATATCAGTGATGATGCGCCAAATACCTCAATCCCCATTACCCCGTGACCCACAGATACAACCCCATATTCTCCCACCTCTCCTTGATGCTGCCACCGCCTTCTCCTTCTCTTCCTCATGGCTCGACTGCTTGAGATAACTCAAAATTGCCTCAACAGCCACCGCCTCCTTTTCCTCGCAGCTTGAGTCCACCGTCACAGTCAACGGTGCGGTGCTCTGATTCTGATCCAAATTCCCAGAAGTGCTGAAACTTTGTCGTTTTGGGTGGGAACCCTTTGATCCATGATTGCTGTCCTGATGTATACTAGTTCCCTCTAGTGTACTCTCTGCCTCAAGGAACTCCAAATCTCGCAGCCTCATCTCTTCCCCATAACTTGACTCCTCATGATCTGTCAAAATTTCTGAACCATCGCTCCAGGGGAGGAGGGATTCCCCATCAGCCACCGCTTCATTTTGCTCATTGTTTGGGACCATGGCAATGATGGCATTAATCATAGGTGCAGTGCTTCGAAACTGAGCCAAATCCGCCAAAGTGATGAATTGTTGTTTAGGGCGGTAACCACGTATACCAGTTCCCCCTATGTGAAGGTTCTTCAAATACCGTAAGTCTTCAGGCAACTTCGAAAGTTCTGAGCACCCATGGAGATTGAGCCATTCGAGACTCAACAAATTGCAGATACTGTCCGGAATATAGACCAGGCTTTTGCACTTTTTCAGATTTAACGACACTAGCCCCTGAAGCCGTTCAATTGATGCAGGAAGCTCTCTGATAGATGTTCGATCCAAATCAAGGCTGGCTAACCTTTCCATATTTTCTAATATGTCTGGAAACACCTCAAACTTTGTACAACCAGAAAGAGAGAGATAATTTAGGGACTTGAGTTGACAAATGTTGCTTGTAAGACTCTTAAAGTCTTTGCTATACCGTAGCGTCAAAGTAGCAAGTCCCGTAAGACTATAAATTATGGATGGCAATTCTTCAATTGCAATCCCTGAAAACTCAACAATTTTTCGGCGGCGAGAGGCTTGCTCACGTTCAAGCTCTGTAAGATTTTTGAATGTTGATGAATCTTCTGTAAATATAGTCCAATCGAAATTAAGCTCTGTTAGGTTCTCCATACCTTCTAGAAACTCTGGAAAATTCTTCAGATTTGAGCAGCCAGAAACATTCAGGACTTGAAGAGATCTCATATGAATGCTGCCTGGAAAAATCTTTAATCTTCTGCAATCCTTCAGGCTCAGGGTAACGAGTCCTGTAAAATTTTTTATGGACGAGGGCAGTTCTGAAATTGCAGTCTCATCTAAATTAAGCTCTAATAGGTTCATAACTTCAGGAATTTCTGAAAAATTATCCAGATTTGAGCAGCCGGAAAGATTAAGGGTTTGAAGAGATCTCATGTGAATGCTGCTTGGAAGGCTATGAAGTTTCTTGCACTGCTTTAGACTCAAACTCTCAAGGTTTTCAAGAGAATAAATTGATG
GGCAAAGGTCTTCAACAGATGTCTCATCCAAGCGAAGCTCTCTTAATCCTTCCATATTTCCGCCATTTTCTGGAAAGGCTTTGAGCTTTGAACAACCAGAAAGATTAAGAAATTGCAGGGACTTGAGTTGAACAATGCTGTTTGGAAGAATCTCAAGTTCTCTGCAATATTCAAGATTCAAAGTAACAAGCCCCGTAAGATTGTTAATTGATCGAGGCAGTTCTTTTATTGCAGTCCCTTGCAAATAAAGCTTTGAAAGCTTCTCCATAATTTCTGAAATCTCTGGAAACTTCTCAAGTATTGAGCAAAAAGAGAGATCAAGGGTTTCAAGAGATTTCATACAAATGGTGCTTGAAAAGGTCTTGAGTTTGCCGCACCAACTTAGATCCAAGAGGACAAGTTTTTCAAGGGCAGAAATGGATGGGTGAACCTCATATAAACTTTGTGCATCCACCAAGAATTAGGTTCTCAAGATTCTTTGCCTCAGTGAAGTCAGGTGTTTCCTTAAGACGATAAGAGCCTTTTAAGTTGATAATTTTCAACTTTTCCAGAGGCTGTCAATATACAACAAGGAAAATATGTGTTACCTACATAATAAGGCATTTAAAAACTAAACAATTTAAAAGCAGTATATAGGCAAATGATGAACGTACCTGAGTTCCTTTCCAGAGGTGTTCAACCCAACTATATTGCATGTCAATGTCAACAAGATTCTCTGGGTTAAAATTGGACGATAAAGACTTTAGAGGACATTTGTGCCAGAACAAATAACTTAATTTTTCAGAGAGAAACTTTAGATCCTTGTATTTCCATTCATCATCGGATTCCCTGCCCGGTGGTTGTAAATAGTGGGTATGGACTCTGAGTAGTCTTAGTTTTATCATTTTAAAAAAAGCGGTGTCTAATTCCACCACATTGTTTGAGTATGGCCAACGCACAATTATGCTTTCAACTGCTTCTGTAGCCTGGATAACCAAAATTGCAAATTGAATGAGTACAAAACTTAAGATTATAACTTCTAAATGCACATGTTTCTCATTAATTGGATTTTGGTCAAAGTTGAAGCTTTATACTTTTTATTAATATTAATAATAATAATATTATTATTAACATTATTATTATTATTATTATTATTATTATAATTATTACTATTATTAAATTTACTAATATTAATGTGAGAGAGAAGATTCAAAGCAATTACATTAATGGAAGGGAGGGAGTGCGTTTCTCACCGTTTCTCGACTTAACACATGATGAACATCTTCATAGCTCCACAACCTACTGCGCCTCCCAGGCTCTTTTATAGATTCCTGGCGTACGATTTCGCGACCCATTTCCTCTAGTAAATCATGCATCTCGAGTACACCATCAGATGAGACAGTGACAAGAGCTCTACCAACTAGAACGTCTAATCCGGTATGGGGATGGAAGTCACAACCCTCCATAATCCTTGTTGCAAAGTCTTTCTTCATTTGTTTAAAGAAACATGCAATATCAAGAAATATTTCCTTCTGCAAACCATCTAGTCCATCAAAGCTTGTTCTAAGGACTGTCTGGATTCCCAGGTGCGGATTTCTCGCTATTTTCTTTAACTCATCTTTCCACACAAGTACACTTTTGTTATCGAGGAATGCTCCCAAGACTTTGAGTGCTAAAGGCAAACCTTGAGCATATTTTATGAAATGGCCTGACAAATCAACGTATTCTTCTGTGGGTTGCTTTGTACTGAAAGCATACTGCATAAACAGCTCGAGAGCATCATCGTCATTTAACAACTCGGGCTCATATATCTGATCACCAAGTCTACTTAGTGACTGTTTCTCTCTAGTTGTTATAATGATTCGACTTCCGCCACCAAATGAAGGTTGCTTTCCAATTAAGGCTTCAATTTGGGATGAACTCTCCACATTATCAAGAACAAGTAAAACCTTTTTCCTACCAACTCTTTCCATCATCTTCTGAAAACCATTTCTCAAAATCTCTGAACTCCCCACCTTCAT
AT\n>URS0000222F4A rRNA from 1 species \nACGGGGTGCAGCAGGCGCGAAAACTTCACACTGCGCGAAAGCGCGATGAGGGAATCCCAAGTGCTTGCACGTAAGTGTAAGCTGTTTCTATGTCTAAAACGCATAGAGAGTAAGAGCTGGGTAAGACGGGTGCCAGCCGCCGCGGTAATACCTGCAGCTCAAGTGGTGGCCGTTATTATTGGGCCTAAAACGTCCGTAGCCGGTTTATTAAATGCCTGGGTAAATCGGGCCGCTTAACGGTTCGAATTCCGGGTAGACTGATAGACTTGGGACCGGGAGAGGCTAGAGGTACTCCTGGGGTAGAGGTGAAATTCTGTAATCCTAGGGGGACCACCAGTGGCGAAGGCGTCTAGCTAGAACGGGTCTGACGGTGAGGGACGAGGCCCTGGGGCGCAAACCGGATTAGATACCCGGGTAGTCCAGGGTGTAAACGCTGCTTGCTTGATGTTAGTCGGGCTCCGAGCCCGATTAGTGTCGGAGAGAAGTTGTTAAGCAAGCTGCCTGGGAAGTACGGCCGCAAGACTGAAACTTAAAGGAATTGGCGGGGGAGCAC\n>URS0000E1B154 rRNA from 1 species \nTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGAGTGATGAAGGCCCTAGGGTTGTAAAGCTCTTTCAACGGTGAAGATAATGACAGTAACCGTAGAAGAAGCCCCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGGGCTAGCGTTGTCCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGATATTTAAGTCAGAGGTGAAATCCCGGAGCTCAACTTCGGAACTGCCTTTGATACTGGGTATCTTGAGTATGGAAGAGGTAAGTGGAATTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAGGAACACCAGTGGCGAAGGCGGCTTACTGGTCCATTACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACA\n>URS00022EEFAF misc_RNA from 1 species \nTGGCTCTCCCATCGATGAAGAACGCAGCGAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACCTTGCGCCCTCTGGTATTCCGGAGGGCATGCCTGTTTGAGTGTCATTAAATTCTCAACTTCAAAAGTTTTTATTGAATTTTTGAAGCTTGGATGTTGGGGGCTTGCTGGCGTCTTTAGATGTTCGGCTCCCCTTAAAGTTATTAGTGGGAATGTCTTTTATTAGGCAATCCTTGGTGTGATAATTATCTACACTTTGGATGGTTTAATGGTTCCAATGAGGCTATTGGTATTGCAATTAAGTTTGCTGTACCTTGGGTCTTAGGGGAAAAGATAAGTCTTGCTTTCTAACCGTCTGTGTTACATGGACAATTTATTGACTATTTGACCTCAAATCAGGTAGGACTACCCGCTGA\n>URS00001F1239 rRNA from 1 species 
\nTAAAGGTATTCCGGTAGACGATGGGGATGCGTTCCATTAGATAGTAGGCGGGGTAACGGCCCACCTAGTCTTCGATGGATAGGGGTTCTGAGAGGAAGGTCCCCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGAGGAACATTGGTCAATGGGCGAGAGCCTGAACCAGCCAAGTAGCGTGAAGGATGACTGCCCTATGGGTTGTAAACTTCTTTTATAAAGGAATAAAGTCGGGTATGGATACCCGTTTGCATGTACTTTATGAATAAGGATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATCCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGAGCGTAGATGGATGTTTAAGTCAGTTGTGAAAGTTTGCGGCTCAACCGTAAAATTGCAGTTGATACTGGATATCTTGAGTGCAGTTGAGGCAGGCGGAATTCGTGGTGTAGCGGTGAAATGCTTAGATATCACGAGGAACTCCGATTGCGAAGGCAGCCTGCTAAGCTGCAACTGACATTGAGGCTCGAAAGTGTGGGTATCAAACAGGATTAGATACCCTGGTAGTCCACACGGTAAACGATGAATACTCGCTGTTTGCGATATACGGCAA\n>URS000107D7B1 rRNA from 1 species \nTACGTAGGGGGCTAGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGCCCGGTAAGTCCGCTGTAAAAGTCAAAGGCTCAACCTTTGAATGTCAGTGGATACTGCCGGGCTAGAGTCCGGAAGAGGCGAGTGGAACTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAAGAACACCGATGGCGAAGGCAGGTCTCTGGGCCATAACTGACGCTGAGAAGCGAAAGCATGGGGAGCGAACAGG\n>URS0001943432 rRNA from 1 species \nGTGAGGAATATTGGTCAATGGGCGAGAGCCTGAACCAGCCAAGTAGCGTGCAGGATGACGGCCCTATGGGTTGTAAACTGCTTTTACACGGGGATAAAGTGTGCGACGTGTCGTTCATTGCAGGTACCGTGCGAATAAGGACCGGCTAATTCCGTGCCAGCAGCCGCGGTAATACGGAAGGTCCGGGCGTTCTCCGGATTTATTGGGTTTAAAGGGAGCGTAGGCCGTCTGTTAAGCGTGTTGTGAAATGTAGATGCTCAACATCTGAATTGCAGCGCGAACTGATAGACTTGAGTGCGCAGGAAGTAGGCGGAATTCGTGGTGTAGCGGTGAAATGCTTAGATATCACGAAGAACACCGATTGCGTAGGCAGCTCACCAGACCACAACTGACGCTGAGGCACGAAGGTGCGGGGATCAAACAGGATTAGAAACCCTTGTAGTCC\n>URS00007057CD snRNA from 1 species \nAAAATGAGGGCAATCTGGTTGCGACATCTGTCACCCCACTGATCACCAGAGTTGATTCGGCTGATTTGGCTGGCTAGGCGGGTGTCCCCTTCCTCCCTCACTGTTCCATATGCGTCTCTCCTGAAGCTGCATGATTGGTTGAAGAGGACAACATCCCAGGTATAGAAGGAGTGTACTGAGGTCTCCAGTCTTCGATCCCAGATATACTATAGCTGCACTCCCCTGCTAGAACCTCCAAACAAGCTCAAGGCCCATATCAAAGTCCATAATGGTGGCCCCTAAGTTTGTCCTCAACTTATACATGTGGTGGACTTATA\n>URS0000B96F2F misc_RNA from 1 species 
\nTTGTTATAAATAATAAGCAGAAGAAAAATATATTGTTTACCTAGTTTACTTTTAAACGATGAGAATTGCAAAATTTGGATAAAATTGTGAGATTTGAATTGCAAATCATCAATTTGCTTATGATTTTGATCAATTTCAATTTGCTTATGATTTTGATCAATTTCAATTTGCTTGGTTTGAATTGATTGAGACTTGATTTGGTTCAATTTTAATTGTGAACTTTACAATTCTTGTAACTGTGCCATGTCAATATGTGGATCTCTCTTTGCTGAGCCCTTCTATGCGGCTATGCTAGAGTATGCTAGAGTTTCATCATCATAAAGGTGTGATACTTGGGATAAAAACTACACTTGATACCTGCACGTTAGTCGAGTAACATATATCACCTTTTGACAAAGCTTGTTGTTTCTTTATGTGAAACAAGAAAATGGAGTGGCTGAAGCTCTTTTAGTGGGTGCCACTGCTTCACCCTAAATTAAGTGATTAGCTTTTTCCATTATATCCTATATATCAGTAGCTTTATGTCTTCAGAATCTATTCCCAACATTTGATGTTGTTTTGAGTTTAGAATAGGGGATGGAAAACTATGTGCCGCTTGTTGCTTGTCGCTTGATGTAACAAACTATAAGGTTAAGTGTTCTCAAATCTCAATTTATTGGATTCCATGGCTTATGTTGCTAGGCATTGGCATGAATGGAAAGCGGTCTTTGTACCATAATACATATGGGTACTCCCAATATACATATAGCCCCTTTGGGACTGGTGACTGGTCATATTATATGGTCTTCATGTTCCCCTTGTCATCATTACTGGAAGTCTGGAATGAATGCACAAGCAATGCAATTCTAAGATCAAAATTCTGTCCTTTTTTTCTTTAGTAATAAGTTGACTTAAGTGAAGCCAATTTATTTTTCTCAGTATAATTTTTTGAACTTGGTTAATTTTGCAAATGAGCCCATTGCCACCAATCATTATTCACTATTGGTGTAGAGATTATTGCACATGCTTGATTATCTTGATTTTTTTCTCAAGTGCAAGTGCTTTGGATTCTTTCCTATTAACAGCTTTTCATCATGGATGAAAGAGAATTTCTCTGTTTTTTATTTGATGCATTGTGCCTGTCTTTCTTCTTCTTTTTTAAACTGAGCCAATCTGTATGCATTCGAAAATTGTATTGTAGGCTATAAAATGGAGAATTTTCACATGCTAACTTGCAACATGTGTTTTTATTAAGCGCTGCCAGCTAAATTATGATCTTGCATAAATTTTGTCCTTGTTTATGACATCATATGGCCATTAATTTTTTTTTCTTTTATAATTAACCCTGTTTTTGTCAATAATCTTTTTAGACGGTCTCTCCTATGTGGTCGTTGGTGGTTTTTCTTTCTTTTTAAAGCAGCTTTGAAGTTTTCAGGGATTCTTTGATTTATATCTTAAAGTATCCATATTCTATCTATCCTAATCTATGCTTTGAACAAGTTATGCCATCCAATACTGTCATTACAGGCAAAGTGGAGGCAAGAAGTGA\n>URS0000D729CC rRNA from 1 species \nGGATGCGATCATACCAGCACTAAAGCACCGGATCCCATCAGAACTCCGAAGTTAAGCGTGCTTGGGCGAGAGTAGTACTAGGATNNNNNNNN\n>URS00003FE27D rRNA from 1 species 
\nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGAGGTCCACCGCGTAGCAATACAAGGGAAGACCTAGTGGCGAACGGGTGCGTAACACGTGAGGAACTTGTCCCGGTCTCTGGGATAACAGTTGGAAACGACTGCTAATACCAGATGACGTCGGAATCTCGCATGGGATACTGACGAAAGGGTTACTGGATCGGGAGAGCCTCGCGGCCTATCAGCTTGTTGGTGAGGTAACGGCTCACCAAGGCGTCGACGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCAACGCCGCGTGCGGGAAGAAGGCCCTCGGGTTGTAAACCGCATTCAGTAGGACGAAAATGACGGTACCTGCAGAAGAAGGTGCGGCCAACTACGTGCCAGCAGACGCGGTAAAGTAGTCGTGT\n>URS00023E9193 lncRNA from 1 species \nCAATGTTGGAAACGAAGTTGGATTTGCTCCTAACATCCAGGTTAACCATAGTTCTTGCGGCTTCTCCGGCATTGCACCACCGCCTCCAAACAGACCCCAGTTATGGATCTTGTGATTACCCATCTTCCACAAGGAACAGAAACATTTGGTCAAGTTTCTTGCTCTGCATCTGCGATTACGTCAGCAATGTTTAAGTTATCCTTTCTCAGTGCAGGGAATAAAAAAAAAAACAAAAAGTCCAAACAATTCAGTCGAAGAATACTCGCAGAGAGAGAGACCTAATGGAGGAAGGGCTCAACGGAAAGGAGTACTTGCTCAAGGTGGTGCTGATAGGCGACTGAGATCTGGGACACCGCCAGCCAAGAACGCTTCAGGGCCGTCACCTCTGCTCACTCTCTCTCAAAGCCCTAATCTTTAACCATCGGCCGTCACCTCTGCTCACTCTCTCTCAAAGCCCTAATCTTTAACCCTAAAAAATCCCCAAATCTCTTCATCTCCTTTCCCCCGCACGTACAACGATGGCTCTAATGAGACCCTAATCCGGAAACCAACCCCC\n>URS0000805F26 rRNA from 1 species \nAATAGATACCCCGGTAGTCCATGCCGTAAACGATGAGTACTAGCTGTCTGGGGTATCGACTCCCTGGGTAGCGCAGCAAACGCGATAAGTACTCCGCCTGGGGACTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCAGCGGAGCGTGCGGTTTAATTCGAAGCTACGCGAAGAACCTTACCAGGGCTCGACATGTCCCTGACCGCCGATGAAAGTCGGTTTCCCTTCGGGGCAGGGTCACAGATGCTGCATGGCTGTCGTCAGCTCGTGCCGTGAGGTGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGTCGTGTGTTGAATTTTTCACACGAGACTGCCCGGAGCAACCGGGAGGAAGGCGGGGATGACGTCAAGTCAGCATGGCTCTTACGTCCTGGGCTACTCGCACGCTACAATGGGCAGTACAGACCGTTGCGATATCGCGAGATGGAGCTAATCGGACAAAGCTGTCCTCAGTACGGATTGCAGGCTGC\n>URS0000ACA7F0 rRNA from 1 species 
\nAATGAACACTGGCGGTAGGCTTAACACATGCAAGTCAGACAGAAACGATGAAGTGCTTGCACTTCAGGCGTCAAGTGGCGGACGGGTGAGTAACACATGGGAATCTACCTATAGTTGGGGACAACATATGGAAACATATGCTAATACCGAATGTGCTCTAAGGAGTAAAGGAGCCCTCTCTTGAAAGGTTTCGCTATAGGATGAGCCCGCGTGAGATTAGCTAGTTAAGGTAATGGCTTACAAGGCAACGATCTCTAGCTGGTTTGAGAGGATGATCAGCCACACTGGGACTGAGACACAGCCCAGACTCCTACAGGAGGCAGCAGTGGGGAATATTGCACAATGAGCGAAAGCTTGATGCAGCCATACCGCATGTGTGAAGAAGGCCCGAGGGTTGT\n>URS00012146AA rRNA from 1 species \nCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGACGAGAGTCTGAACCAGCCAAGTAGCGTGAAGGATGACTGCCCTATGGGTTGTAAACTTCTTTTATATGGGAATAAAATGTTCCACGTGTGGGATTTTGTATGTACCATATGAATAAGGATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATCCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGAGCGTAGGGGGATTGTTAAGTCAGTTGTGAAAGTTTGCGGCTCAACCGTAAAATTGCAGTTGAAACTGGCAGTCTTGAGTACAGTAGAGGTGGGCGGAATTCGTGGTGTAGCGGTGAAATGCTGAGATATCACGAAGAACTCCGATTGCGAAGGCAGTTCACTGGACTGCAACTGACACTGAGGCTCGAAAGTGTGGGTATCAAACAGGATTAGATACCCGAGTAGTC\n>URS0000767CA2 rRNA from 1 species \nGATGAACGCTGGCGGCATGCTTAACACATGCAAGTCGGACGGGAAGTGGTGTTTCCAGTGGCGGACGGGTGAGTAACGCGTAAGAACCTGCCCTTGGGAGGGGAACAACAACTGGAAACGGTTGCTAATACCCCGTAGGCTGAGGAGCAAAAGGAGGAATCCGCCCGAGGAGGGGCTTGCGTCTGATTAGCTAGTTGGTGAGGTAATAGCTTACCAAGGCGATGATCAGTAGCTGGTCCGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTCCGCAATGGGCGAAAGCCTGACGGAGCAATGCCGCGTGGAGGTAGAAGGCCCACGGGTCGTGAACTTCTTTTCTCGGAGAAGAAACAATGACGGTATCTGAGGAATAAGCATCGGCTAACTCTGTGCCAGCAGCCGCGGTAAGACAGAGGATGCAAGCGTTATCCGGAATGATTGGGCGTAAAGCGTCTGTAGGTGGCTTTTCAAGTCCGCCGTCAAATCCCAGGGCTCAACCCTGGACAGGCGGTGGAAACTACCAAGCTGGAGTACGGTAGGGGCAGAGGGAATTTCCGGTGGAGCGATGAAATGCGTAGAGATCGGAAAGAACACCAACGGCGAAAGCACTCTGCTGGGCCGACACTGACACTGAGAGACGAAAGCTAGGGGAGCAAATGGGATTAGATACCCCAGTAGTCCTAGCCGTAAACGATGGATACTAGGCGCTGTGCGTATCGACCCGTGCAGTGCTGTAGCTAACGCGTTAAGTATCCCGCCTGGGGAGTACGTTCGCAAGAATGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAAAGCGAAGAACCTTACCAGGGCTTGACATGCCGTGAATCCTCTTGAAAGAGAGGGGTGCCTTCGGGAACGCGGACACAGGTGGTGCATGGCTGTCGTCAGCTCGTGCCGTAAGGTGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGTGTTTAGTTGCCACCATTGAGTTT
GGAACCCTGAACAGACTGCCGGTGATAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGCCCTGGGCGACACACGTGCTACAATGGCCGAGACAAAGGGTCGCGATCCCGCGAGGGTGAGCTAACCCCAAAAACCCGTCCTCAGTTCGGATTGCAGGCTGCAACTCGCCTGCATGAAGCCGGAATCGCTAGTAATCGCCGGTCAGCCATACGGCGGTGAATTCGTTCCCGGGCCT\n>URS0000BE21C0 hammerhead_ribozyme from 1 species \nGTACTGCTGACGAGTCCAAAACAGGACGAAACAGCTGTGCAGTGC\n>URS00023CDC16 lncRNA from 1 species \nGAGATGATTCTACTTTTCAGCTGGAGAACTTAGCAATAAGTTGTGGTAAGGAGATAAAAATTCCTAAGCAATGGCTACTTCAATTAGATAATCTGGAAAGCTTGTCACTGCATCGCTGTTGGTCAGATGAGCTGAAATCTCTACGTTTCCAGAGATTGAAGAAACTCACACTTGGTCAACTTAGTTGCTTCACTGTTTTCTCATTCCCAGACTTTGAAAGACTTCAACAGCTCAGAGAATTACGAATAGCACATTGTGATTCATTGGAACATATCGTGGAGGTTGTTAATGGTGAAGAAGCTTCTGGCATGGATACGGAGACTGCTGCACTAGTTCAGCTGGTAAAAGTCTATCTTGAGGGTTTGCCAAAACTCAGAAGTTTTACACACACAAAGTCTAAGAATCTTATGGCCAGTTTAGAGCAGGTGGAAGTGGAGCCCTCGATTCTTTTCAGGTGCCCTGTCGTTGGAAATCTCCAACAGCTCAGATGGTTAGACGTGACTGATTGCAGATTGTTGGAAGGCATTGTGGAGGTTGCAAGAGGCTATCAGACTTCTCACAGGAATGACCACATTATCACATTCCCTCAGCTCTATTCCATTAAACTTAGAAATTTGCCCAACCTCCAAAATTTCAGTCCCACTAAAAGCTATAGTTTCAAGATGCCCAAATTAACAGGTTTCGGTCTGTTCTATTGTCCCCGGATGGAGAATAAACCCTTCATGCAAATAATCGCAGAAAGGGTACATTTTTCTTCCGAGGAGCGTCGACGACTGATAATAGTTGAAAACCTCAAGGACTACACACTTAGAAAAATAAACAAGCTCGAAAGCGTGGGGGAATCAAGTAACAGCAATCAGGATGTGGAAACAGAAACAATGAGAGTTGAACAAGCGGAAGCCATAGTTGTTCAACAACGGGAAGAGGGAGTTGGTGCAGAAGAAGACGACTTTTTCTTCTTAAGAAAGTCTCAGACTTCATTGTTTTTCATTTTGTTTTTGTTTTTGGTTTTGGTTTTGTGTTTGAAGGAGGTCTGAGCGTCTGACACTGAATTGTAAGTTGTGAAAAGCGACAACTGAGGATGCGGGCTGATTGGAGGCCCAGTTCCAGTAATACAATTTCAGGTCCAATATCTATGGCCTGCATAATTTTTAAGAGTTAAGTTCCATGTAGTATATTTATGTAGTACTGTAGGCCACGTATATTCTGCAACTATAAAATGACATAAAAACATTGCAAAATATATGAAACTTGTTATTTTGTGAAATACATTCTATAAATATCACTATTTCATGAAAAATATTGAAAATCATTTATGTTCGACAAGTATAACACATATGTTCAGTAATATGTAAATATGTTCTGCAAACCTAACATGTGTTGCAGAATAATGTGTTTTTCACTATTTAACTTGTGGAATGTTTAAGATTGTCAAAAATTTTAACAAAATAATGATATTTATAGAACATGATTTGCAAAATAACACAGTTTGCAATGTTTTTATGTCATTTTATAGTTGCAGAACATACGTGGTCTACGGTACTACAGTAAATATGTGGATTACATGGAACTTTGTTCTAATTTTTAATGTATATATTAATTTCAAAGCAC
TTCATCCAAATTATGTATACACACAATATATATTACATTTTATTATTTATTTTATTGATCTGTTAATTAGAACCTATAACCTAGACTGCAATCGTCAACCTTCAATTTTGATTATTTTTCTGCCAAAAAAATAAATTTTATCAAGTTCAAAATTTGTCAACTTTTATCATGGCGATACTAAATACTCCCTCCGTCCCAAATTAATTGTCCAGTTTGACTTTTTGATGGTCAATTTGACCCAACTTTGATTGGAAATTAAAAATTATCCTTTTACAATTTTACAAAACTGAAAAATATATTCAAAAATAGATTTGATAATCTTTTCAATGATATATATTTCATAATTTTATTCAATTATTTAATATACATATTTTTCAGTCAAAGTTGAGTCAAATTGACCATCGAAAAGTCAAACTGGACAGTTAATTTGGGACGGAGGGAGTAGATATTAAGCAGTTTCTTGATTTGATTATGCCTATAAATTATTTGTTTTTTCATTTAATGATTCCTTCCGTTAATTAGAGGCTTTAATTTAGAATGTATTATTAAATTTTTATTTCTCAAATATTTCTTAAATAAACAATTGAATAATGTTTTTTTTGAGAGAATTGAATAATGTTATGTATCCCAAATTTTATTCTCAAAATTTTTATCAAGTGGAGAAGAACCAATCAAACAGAATTTGGAAACACTTTTTCAAATACCTAATATTTTCCAGTTTCAAAAAAAATACCTAATATTTCCTAAATAATTTATGGGCCAATATACCTCTTTTTAACATTTTTATTGCAATAATACAATTTTCTCCCAAAAATTGCATATTTACTTTTTTTTTTTAAAAAAGCTACAAAGTATTTGCATATATACGACTATGACTATGAACTGCTTCCTGGAGTAAGTGAGAGAGAGAAACAAGCGAACCCGTTCTTTGTTCTTGCCTCACCCTTCCTCCTCTGTGGCTCATTTTGATCTGTCTCTCTCTTTAATTCCCTCTCTCTTCTGCCTCCATCTCTCCTCGCTCTCTCTATCTTTTTCTTCGATCCATTGATTATGTCAGCCGTACATTCTCCGATCACGAAGCCCTAGGTACTCATAGGGAGTACAATCTTAGTGGTGTTCTTGATGATTGTTGGATCGGTGATTATAGCGGATACACACAAGATGACTTTAAAAGAAGGGAGAAACGTCGAAGTAGAAACTCCTAAACATGGCTGCTGATGTTGATTTTATGTGAATATATTTTTGTTTTTTGTTATGCTTCATCTCTGTAGAAGTTTTGGTTAGCGCTGGTTACTTGTGGTTGCAAAACTTGTTGATTCTTTTGGCCCCGCAGGGGCATTTATTTTTCTGTCTTTGCAACTAGTTGCAACTTATTATGCAACCTAATATAATTTTAGCATTTTTTAAAAAAAAAGTTACATATGTAGTTGAAAGTATGGTTGCTCGCAGTTGCAGATTTGGTTACATATGCAAAATCGTATTTTTGCAAAAAAAAATTGAATGATAGAGTTTTTTTTATTTTAAAAAATGATAGTATTTTTGCAAAATTTCTTTTTGACTTGGGTATTTATTAAAAAAACCCATAATTTATTCCTATAAATAAAGAATGTCAAACACATAAATATTTAATTCTCAGGTAGCAAAGAAAGGTTACTCGCAATTATTTAGGAGCCCAAACTAAACCAAGGCACAATTGACAATACCAAACAGCAAAGAACACGCTCCCAAACATAAAAGCGCAAAGGAGCAAATAGCAATTCAAGATCATATTGTACTCCAACCATTGACTAGCTAGTCAGACAAAAACTATCTAAACTTCAACCAATATACAGTATACTTGGGACATAAACATCCACTTAACAAGATCAAAAAGGTCCTGGTTGATATTACTCCTCTTTCTCGACTCTCGAGGAAGTTGGGGTTCGAGTTAGGGTGATTCCATGTTTCCATTGTTGTTACTCCATTAACCATTGATGCAAAGCTGAAGCTGTGGTATTGCT
GAATTTATTACATTAAATACTAGTCAGTATTTACTGTATGCCTTAACATGGCTTGATGCAATCAAATAAACGAAATCCTTGCAACACAAACGAATTCAGTGATACAAAACCATAGCTACTAATATATGGGCAAGGCAGACAAAAATAGATGCTACAAACAGTTGGAATACGTCGGTTCTTTATGAACTACCTAAACCAATGACTAATTGTGCAGTCGCATAAAAACTGAAACCGCGTCATTCAAACACAACTGGTGCCAACTCCTACCAGAGATAAAACATGATATATCTATATTAATGAGCTCATGATGCAACTATTTAGTAGTTCCCGAGCTATATTGTTTTGAGATGCACAATATTATTGTAAGAGCTTAGCTGGATTTCATAAAGATCTGCACGTTGAGCCACAGTACAACTTACCAAGCTCTCAATTTCTTCGTGCAATGCTGATTAGCCCAAGGATGTTCTTTCAAATTTTTTAAACCATCTAGTTTCACTGATGAATGATGATAGAATATGGAAACAACTTCTTGTATTGGTTTGGGCCGAAGCCCAGGATCGCTGTACCTGATCCAGATCTTATTAGAGAGGTTTTGATGAATTCCTTAGGCCGAGTTGTTGCTTGGAGATGGACTTGTTGGATATATTGACCGGTGAGAAATGGCCTGTTCTGTATTCTTTTTTAAGATTGCATAGTGGCTTGTTTTTATGGTGTGTGTGTGTGTGAGAAGTGTGTGTTCTGTTTTAATGTCAACACTCCTAAAGTACCAGAGCCCAGGTTAGAATTCAGTACTTAGTTCAGGGAGATGGATTTCCAGACTCTGGAGCTAAATGACAATCAGCTAGGCAGTTTCTGAAACAGTTTCCTGTAGTTCTAATCTAGTTATGTGGCATAGAGGGCAACTATTGCCTGTGATCTCACTTGATCACAAGTCTATTTTAAGAAGGGGAGCTATGTTATATTTTCATTTATATTTTATGTATGTCATGTCAACTCTTACAATTTTGCTGGATAATTAATTAAGTACTCCCTCCGTCCTTTTTTACATGTCCATTTTGATTTTTGACCAGTCAAATTAACTATATTTTGACTGAACTTTACACGTATTAGATAATTGGAAAAATTAATAAAAATTATATTACTAGAAAGTATATTTAATCTATTTTAATATGCAACTTTCAGATTATAAAAATAACGAGTAGATAATTTGTAATGTTTAGTCAAAAATTGGTGAATTTGGCTTCTCGAAAAGCAAAATAGACATGTAAAAGGGGACGGAGGGAGTATTTATTTGCATCTCGGTTTAGTTGGATCGCCATCAATAGAATTTATTTTATACTTCTTCCGTTTCAAAGTAAGTGCCGTTTTAATTTTTGTCACGTGACTTGAGGTGGAATATTTATTTCGTTTACCAAAGACTTTGACCTTTCACCCATGCATACCGGGTAGTTGTTGTTGACCGTTCTTATAAAAAATAAAATATCAACATTGTCACCTCTATTTTTGATTTTTTTATTTATTTCTGACCTATGATCGGTATCTTAGTATTTTAAATTTCACGTGTATCATTGTATCTTATTTGCAATTTAAATAAATAAATTAGTTAATTATTGAAACCTCATTTTTTTTTGCACTTTGGACATCTATAATGATTTACTACTTAAAAGTTGCAATCATAAACTATTTGAATAAATTGAATTTTAAAAATCCAGAAAGTATTTTAAAGAATATTCTTCATTATACTTTGTACTATCAATTTTTTTAGTAAACTTTTTATGTGATATCCTTACCATTGAAGTATGACTAATATTAATTAGTATATTAAATTTGAAATACAATAATATCACCGAAAAATTTAATGAATAAAAAATGATAAGAAAGTCAGAGGCAGAAGGAGTTTTCTTTAAGAAAATTTAATCCTCTTGTGCATGACTTTAAATCTTCATATATCACGTAAATTCGACATGTTTGAGCGACACAAATAACATGCATCGAGCACG
ATTGGATAGCTCAAGTGGTGGGTTTATCCTCTGTTGTCCCGGAGACCCGAGTTCGACTCTGCCTCATCCGAACAGTATTAGAACGGATACTCATTTGTAAGGCATATAAGATTCTATTATCAAAAAAAGTAAAAAATAAAAAAAATTAACATGCATCATTGCCAGTCGCCCTGAGTGAGGGATGCGGTTGTTATTCTTTGTGAATCATATACGTAAGCTTTTAGTTTCTTCTTTGTCAAATTGATTTCAGTTTTTCTTAATGTTATTGATTTTCTTTTTATTGTTTTGATTTTTTCAATATGTTAAATGAGTTCTCTACTTCTCTTGCCTTTTTATCATGTTAAAATGATTTTTTCAATATATTAAAATGAGTTCTCTTGTGCACTTTAGCGTCGGTTAGAAAAACCGACGCAATAGAGACTACTCTATAGCGTCGGGTTCATATACTGCGCTGGACTGCCGACGCTAAAGGTCTTATTTGACTTAGGCATTTTTGTACTAGTGTAAAATAATAAAAAGTAAAATGATTATTCTACTTTCCTCAGCTTTCCACAAATGGGGACATTTTTTTAGTAATACGAAAAACTCATTTCCAAATATATATATTTCAAATGGACATAATATCGGTTGTCATTTTAAATTTTCTAACTTATTCAAACAATATAATATTCGTGAAAATAGTATACTAGCATTTGGATTGTCATTTGAGATTTTAAATTAAGATTAAATTCCTCATTTCTTACCTAACATATCATGCATCTGGCTAAATATATAATTTGGAACAAACTGTAATTTCCAAATAAGTACTAGAATTTCTTTCTTTATTTTCTTTCCAAACTTTTATCGATGATTTTGTCTGCCCTCTCCGTCAAATTGATTTCTTTCTTTCCTTTTATCTCAGGTTAAAGATTGACCTTCTCATGTGAAATACTTACAGTATGTTACTATGTTAGTATTGAACTGATTTCGTAACAAGTGAAATTTCTTTTTGTGTTTACAATAATATTTGATAATTTAGCACTGAGAAAATGTTTTATCACATGTGGTGATAGGACTCGTATTAAAATATTAAATTAAATATCTGAAAGTAACTTGTCCAAAAGTCAATCTTTCTATAGGCCAATCAAATACAAACAAGTGACACCGACTATATGTGCTTGTTGGTGACAGTCTTTCTGTGATAATTACACCTTTCCTACTACCATTAGTCACATTGACGACTATATATGAAGGTATCAGAGATGACTGTTGAATGGAGGTTGTTTTTTTTTCATAGCAAAAGACGTTAGAGCAAATCCAATGCAAGATGTAAAATAGTTATAGATATTGTTATAAATTAGTATTAAAAAGTGTTTTTCATTGTTGAAATAGAACTTCAACTCCAATGCTAGATGCATTTTGCATCCAAATAATTCCAAATTTAAGTAACTTTAGTCCCTCTCTCTTAAATTTTATTTAAAGTTCACCATTATATATACCAATTATAGTTAATTGATGATGTGTCATGGATGCATAAATGCATATTTGGTTTCAAATTTAGAATTAAAAAGTGTTTTTCATTGTTGAAATAGAACTTCAACTCCAATGCTAGATGCATTTTGCATCCAAATAATTCCAAATTTAAGTAACTTTAGTCCCTCTCTCTTAAATTTTATTTAAAGTTCACCATTATATATACCAATTATAGTTAATTGATGATGTGTCATGGATGCATAAATGCATATTTGGTTTCAAATTTAGAACCAAAGATGCATAAATACATATTTGGTACGAGTAAAGGCCGTTTGACGTGATTTAAAAATAATGTTTATTACTTATAAATGAGAAGTTAATTATAAGTAAAAAGTAACTTTTATCTTATGAGTTGGGATATATTTTTTGGTGTTTATAATTAAGTGGGTATAAAAATTATTAATATAATAATAAATTATCTTTTAAAATGATCTTGTACATATTTGTAAAATCAAGTAAAAAAAATAAAATAAAATTATCAAAAAAAG
TTGAGATTTCCAACTTCTCAGATTATGACTTATAAGTTGGAAATGAACTTATAAATTCGTCATACAAATAATAGGAACAAATAAATTCAAAAACTGGGTTTATAAGTGGAGTCAAACACAACCTAAGTCGCTTGTGATTTATAAGTCAAAAAACTGACTTTTAAAATACAGTTAAACTGCCTCTACTATTCAAATTAGGTTTAAAATAATCCATTGACCTAATATAAATACTAAGTTTCCCTAATATAATTGAAATTAGCTGTACTAAGCTGAAATATGTCAAATTCATTCTATTTTACTAAAGAGCATGACGTTTCTCCAATGCATAATTGTTTGAATAACTTATCTTTTAATATTATAAAGAAATAATCCTTTGTACGCGTGAGTTACTTCTTCAAATAGTTTTTGATATTTTTGCACCCCGGGCCTGGGATCGTCTCAGACTCCTCAAGGGGCGGCTAGCATCTGAGGGTTTTCAGTAGATGTTCCCTTTTGCTGTTTTTATATCCTTGATGTCTAAATACTAAGTACTAAGTAGCAAGCTTTTGTTTTCCTAGGTTTGTCTACATGCTTGCATAGTTGCATGACTTTCTTGGAGTCTCTTTCATTTCTATGTAGTTTGGTGCTCTATGACTGGTTCTATGCTTTTTTGTATTGGCTTTGCTAAGTCAATATGTAAGATGTTCCGAGATTGATTTATAAACAGATGTATGGCTGGCTTTATGCTTTTTTGGGTTTTTTTACAATCGGAAAATATTTTTGTAAAATTTTTGTAATTTTTGAAGAAAATTTGCAAAAATATAATTTTACAAATAAAAATTGAAACGATACTAATTTCTGAATTCAATTTTGCAGAAATACGGAAGTTTCATTTGATAAAAAAAAAGAGTTTGTTGACATGATTTCAAATGAAACTTTCGTATTTCTACAGAATTGTTATATACACAATCGTAAATACATAGAAATTTATATTTGCAATTGATTGGAAAAAAGGAAAAATGAGTGTACAAGGTCAATGCTCATATCACATAAAAAATCACAAAATCAAACAGCAGTTGTTGAACTCACAGTTTGTTAAGCTAACATGGAGAGAGAGAACAGAAAAGTAAAACTTGTATTCAACTAACTGAGTCTTACAGAGTGGCTTCACTACAATATATACAAGCAAGCTAACTAATTCTCTAACAAACTATATGCTGTTGACAGGCTGTATGTACACGTGTAGTATAGAGAATAAATATTAATCATGTAATGCCAACACCCCCCCGCAAGTTGGAGGGGAGCACACCCAACTTGGACATAATGTTCTGATGTTTAACACCATTCAGGGCTTTGGTGAACACATCCGCAAGCTGTAATGTAGTAGGAGTGTAGGAAAGTGAAATAAGACCAGAACTTAGTTTTTCACGAACGAAATGGCAGTCCAAATCAATGTGTTTCGTTCGCTCGTGGAAAACTGGGTTCTTAGCTATGTATATTGCAGATTGACTATCACACTTCACTGGAATAGGTGTCACATCTGGAACAGAAAGTTCATTTAGAAGACGAGATAGCCAAGCAAGTTCAACAGTAATGCGGCGGATAGAACGGTATTCAGCTTCTGCTGAAGATAAGGAAACAGTGTGCTGCTTCTTTGATTTCCAGGAAATAATGCTGTCACCTAGCATAACAACAAAACCACTCACAGATTTTCGAGTATGTGGGCAAGCAGCCCAGTCTGCATCGCAATAGGCAGTAAGATTGTATACTGGATTTGAGTTGTAAAATAAACCTTGACTGGGAGTAAGCTTAAGGTATCTGAGAACATGTAAAGCTGCTTCCCAATGTGGAACTCGAGGAGAACTCATGAATTGACTAAGGTGTTGGACAGCAAAAGATATATCAGGACGTGTGTTAGTGAGAAAATTCAGTTTGCCAACCAACTTTCTGTATGAAGAGAAGTCAGAAACAGGATCGCCTTGATCATGGATAAGTTTAATAGTAGGATCGAGGGGACTGAC
TGCAGGTGGAGCATCGAGACAATCAAATTCTTTGAGTAAATCTTGAGTAAATTTGGTTTGAGACACAACCATACCAGATGAAACATTCTGAAATTCAAGGCCTAAGAAATAACTCAGATTTCCCAAGTCTTTGATTTTGAAGGTGTCGTTGAGAAAGGCTTTTACAGCAGTAATCTCAGTTAAGTCATCCCCAACCAGTAAGATATCGTCAACATAGACAGCTAGAAAAACAGTAGAAGATCCTGTTTTCTTGTAGAAAAGTGAGTAGTCATTCTTGGAATAAGAATATCCCCGTGACAAGAGAGCACAACAAAGTTTGTAATTCCAATTTCTGGATGCTTGACGAAGTCCGTAAAGGGATTTAATGAGTTTGCAAACTAATGTGGAATCACTAACTTCAAGACCTGGAGGTAATTGCATATAAACATCTTCAAATAAATCGCCATGTAAGAAGGCGTTGTTCACGTCTAGCTGGTACATGTGCCATTGTTTCTTAACTGCAGTAGCAACAAGAGTTCGAATAGTTGTCATCTTAACAACTGGAGAAAAAGTTTCAGTAAAATCAATACCAGCCTTTTGAGTGAACCCTTTAACAACTAGTCGAGCTTTGTAACGCTCGATGGAACCATCAGCATTATGTTTTACTTTGAAAACCCAACGACAGGAGATTGCCTTTTTACCAGGAGGCAAGGGGACTAACTTCCAGGTATTATTGGCTTCTAATGCAGAAAACTCAGCAGCCACAGCCTGCTGCCATTCTGGGTAGATCATTGCTTCTGCAAAAGATTTAGGCTCTGCAACTGGTATTTGGAGAGGAAGTGGTGTGGGAATAGCACAGCAAACAGATTGAGGAGAAAGCAATGAATTAAGAGGAATACAATTTGAGGTAATGGTGCATGAACACAAAGAATCTGAACAAGCATTATGTACAGAATGAACATAATCTGTTAGATAGTTTGGCAGTTTTGAAGTTCTGGTTGATTTTCTGAGAGGTGGTGGCTGTGGTGAATCTGAGACAGAACTTTCAGATTGTTGAAATGAAGAGGAGGACTGTATAGGTGTATGAGAGACTGTAGGAGTAGAAGAGTGTATGGGAGACTGTGTAGAAAGTTGTGAAGGGATAGACTGTGATGATGACTGTGATGGTGACTCAACAGTAGGAGTAGATTGATCAGGAATAGGAAAGTCAGGGACAGGTAAGGGAAAGAATGTAGAGGAGTTAACATCTACATATGGAAAATGGTTTTCATAGAAAACAGCATCTCTGGAAATTAAAATTTGCTTTGTTTCCAGACTGTAAAATTTATAGGCTTTCTTGCCCTGTGGATAACCAAGAAAGACACAAGTGATTGCTCTGGGGGTGAATTTATCCCTGACAGCATCTCTGGAGATTAAAATTTGCTTTGTTTCCAGACTGTAAAATTTATAGGCTTTCTTGCCCTGTGGATAACCAAGAAAGACACAAGTGATTGCTCTGGGGGTGAATTTATCCCTATGAGGTTTTGGAGTAGTCACCAGGCTTAAACAACCAAAAGGTTTTAAGTGATCAAAACTGGGTTTTTCCTTGAGTAATACTTCATAAGGGGAAAGATTATTTAAAACTCTGGAAGGAAAGAGATTAATAAGGTGAGTGGCTGTAAGGATGCAATCACCCCAGAACTTAACAGGAAGCTGTGATTGGAAGAGAAGAGCTCTGGCTGTCTCTAGTAAATGCTTGTGTTTTCTCTCCACAACTCCATTTTGTTGTGGAGTAAAAGCACAAGAAGTCTGATGTTGAATGCCTTTAGATTTAAAGAAATCTTTAGCAGCATGACTGAGACCAATTTCTAAAGCATTATCAGACCTTACTGATTGTACAGGTAATTTGAATTGTTTCTCAGCTAAGATAATGAATGATTTAAGGAAGTCAAACGCAGAGCTTTTGTTAGCAAGCAAATAGGTCCAAGTAGCTCTAGAAAAATCATCTACTATGGTAAGAAAATATCTGAATTTGTTGTAAG
TGGGAACCTTGTATGGGCCCCAAACATCAACATGAATTAATTGAAAAGGACTTTTACTGTGAATATGACTGACAGGAAATGGCAACCTTTGTTGTCTTGCCTTAGCACAAACAATACAAGGTACATCAAGCATAGAGTCAACATTACAAATATGTAATGATTTAAGTTTGTCAAAAGGTAAATGACCTAATCTGGTATGCCACATCATGCATTCTTTATTATTACTAGCAAAAGTCTTACTAGTATTAGCAATAGAAGCAGAAATGACATTTGGAAAGGTGACAGAAGTGTCTGATGAAGATGATGAAGGTGCAGAGCTGGAATATGAAAGAAGATACAAGCCTTTAAATGCTTTACCAATTTCCAGTTGTCTCTTCTGTGAAGAGTCCTGCAAATAACAAAAGTCATTAGTGAATTGTAAGGTACAATTCAGCTGACTTGTTAATTTGCTCACAGAAAGAAGATTGAACTGGAACAGTGGAACATATAAGACATTGGCAAGAGTGATATCATGTGATATTGGAACAGTGCCAATGGAAGTGATGTGTAAAATGTGACCATTAGGCAGAGATATGGTTAGAGGTGTGTTTAAGATGGTAAGTGAACTGAATAAATGTTTCTGTGAACACATATGATCATTAGCCCCACTATCTATGATCCAAGTAGTAGAGTCAGATTGTGACATACAAGCAACTATAGAGTCTGAACAGAGAGAGTTACCAGCAAAGTTTGCATAAGAAGTATCTTGATCTGGTGGCTTAGTAGTTTTGAGAAGCTGGAGCAATTGAGAGTACAATTCTGGAGTCATAGCTGGAGCAGAATTATTTGATGAAGTTGTAGAATCTGCAACTGTGTCAGGAGTAGAATCATGTTGGAGGACATCAGCATTTGCAGCAAACCTTTTAGTAGACTTTGTGAACTTGAAATCAGATGGGAAGCCATGAACTCTGTAACATTTGTCAATAGTGTGCCCTGTCTTCTTGCAGTATTTGCAAGTAAGATTAGATTTCTTGAATTGACCCTGAGAAGCCTGAGAAGTCTGAGAAGAAAATGGCTTGGAATTGACATGAAGTGATGTAGAATCTGTTATCAGATTGTGAGAAGAATGAATTTCTCGTTGAGCTTCTTCCTGTAGAAGAAGATTGTACACTTGACTGATGGATGGCAGAGGATTGGACATCAGAATAGAACCTCTCATCACATTGTAAGATTCATTTAGACCCATAAGGAATTTGACAACTCGTTGATTCTGACGCAAAACAGCATTCTTAGGTGCTGCTTCACAGGTGCAAACAGGAGTGAGGCAAAGAGAATCAACATCATCCCACAAGACTTTCAATCTAGTGAAGTAATCAGCAACAGTGCTATTTCCTTGACGTATTTCACAAAGATCCTTTTGCAAAGCAAACAGTTGTGTTCCATTAGAGACATTATAGCGCTCATCAAGTTCTTTCCACATTTGATAAGCCGAATCAGCACGACTAACACTACGAGCAATGGTCTTGTCCAAGGCACCAAGAATCCATGAAATTACCATGTCATTACAACGAGACCAGCTGGTAAACGAAGGAGAAGAAGGATCTGGTTCTGGAATCCTTCCATCAACAAACCCTAACTTGTTGCGAGCAGATAAGGCAATTCTCATTGATCTTTTCCAACTACTAAATCCAGTTCCATCAAAACAATCACTCACAAGTTTCATTCCTGGACTGTCTGATGATTGCAAATGCAGTGGATTATCTTGAAGAGTGGTAGAATTGTGATCGAAAACATGATTGTTTGAAGAACTCATGATGTTACAACTCAAAACAATCAATCAATTAAGAAGGGAAGACTAAATCTCTGAATTAATCGCTATGGTAACGAACAATCACCAGAGTAAAACGAGCAAGATTGAACAATCACGAATCAACAAAACAATCTAAAGATGTTTACAAACAAATATGTACAGTAACAGAGAGGAATAACGAAGTAAAGTGAGAAACGAAATCACCGGAGAA
ATCACCGGAGATGAACAAGCAGCGGAGATGAAGGAACAAGCAGCGGAGTTACAGCGGAGATGAACGGAGATGAGTAGATCGGTGTCGCTCTGATACCATGTTGAACTCACAGTTTGTTAAGCTAACATGGAGAGAGAGAACAGAAAAGTAAAACTTGTATTCAACTAACTGAGTCTTACAGAGTGGCTTCACTACAATATATACAAGCAAGCTAACTAATTCTCTAACAAACTATATGCTGTTGACAGGCTGTATGTACACGTGTAGTATAGAGAATAAATATTAATCATGTAATGCCAACAGCAGTAAATCAGATCTTCAAATCTGAGATTATATTTTTGTTATTTATACAAATATTTGAGATATAATCAAAAAGAAAATTTGATATATTTTAATAATAAAACTTGTTAAACTTGAAAACTAGCGCTTGATTTCTCTGAATTTTAATAAATTTATAATAATCAAAAAGAAGTTTTAATAAATTCTAAATTTGTCAAACAGAGTTTTATCGTCTACCTAAACTATTAAAAGAATTTAACCATTTCATTCTCGTACTATAAATAGTATTCTGCAGGAGCAAATAATTCACCATCTCGACTTTGCAATTCCACTCATTGTATTCTCAAACTCTTCCCTTTTCTTTTTACTATTCATAACATATATACAAAAACAGAAGTTGAAAAAATCATTATGGATCCAACTAGCATTCCCGTTGTGGGAAAAATTGTGGAGAAAATATCCGATATAATCGTGGCAGCTTTGTTTAGCCATCTAAACTATATGTTTTGCTCCAAGTCTCTTGTTGAAGATCTCAAATCTGAGAATGAAAAACTTGAGATCGTGGAGAATGTGATGTCCAGAAAAGCTGATGAAGAAAGTAACAACAGCAGAATAATGGAGAAGCATGTGGTGGACTGGAAAAAAGCTGCCAGACAAAACCAGGAGAGTGTTAAAAGCTGTTTGGAAAAATACGATAACCGTCCTTCAGGGAGGTGCTTCCGGGGCTCCTTCAAATTACTAACCACCCGGAACAAAATCTTTACAAAACTAACCACCTTTTTTTTCACTTCACAAAACTAACCACCCTAATTCATAATCATCCAGAGGCGAACACCACACAAAATATTTTTGCAGGAGGCCCTTCCCAGGGGCGAACAACAAAGAATTTTCCTTATATGTTCGCCCCCCCCCCACGGGCGAACATAGTAGGGAAATTTTTTGTTCGTTTGCTCAAAAATTCTTCACTTTTCAGTTCGTTTATTTAATTTATAAAAAATTCAAAAAAAGGGAAAATTGTGATAATTTATATTATTATATTTTATAATATTATATTATATAATGATATAATATTACAAAATTATTTTATATTAAAATATAATATTTTAATATTTAAGTTCATATTTAAGCTCATAAAAGATAAATAATATTGTTATTGTTTTATTTTTGTTAATCCGAAAACGTCATGTAATATCTTGTCCCGAATGCATTTGATCAAACACAGCACTTTTATTCATAGAAGATATTAAAACAACGATAACACGACTTAAATTGAAAAGCAGAAAACAATCACGACGAAACTACAGACCACTTAATCGTCCTCGGACGACATTACACTATCAGAATAATAATCCGGAGTGGTGACCAATGCAAGGTATTGTTGTTCCTTAAACCGGTCCCCTTCTTCCCGAAACATCCTAGCATCATCGTATAGACTATGACGATGCAGTCGCAGATTCATGCGATTCTCCTCTTCTCTCGCTCTGAGAGGGCGGCCGTCCACGCTGCTGCGGCNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTCCCGAAAGGACGGGTCCTGGGTGAAGTGGGGGAGGT
GTGTGATCCTCTAAGAATGACATGTCAGGACGATATACATATGACTCTGACAAGTGATCCTGTGACGGACCCTCATCGTCCTGTGCCTCATCATCCCCTAATCTGCTCCTTTGGGGCCATGGAACCCCCTCAGATGTAGAAGGCTGAATGAATGGAGACCAACCACCAGCCTCAAAAGTACCTGCTCCATCATGACCTGCAGAATGTGAGGTGCCTGCAAGGTGTGAGCTACCCACATGGGTGTAGTAAGTGCCCTCTTCGGGCACTACCGGTGTGACTGGTGGTCGTCCCCTACGCCCTGCAGGAGCCCGTGCCCTAGGTCTGGCAGGGGCCTGTTCCGTAGGTCGACGCTGTACACGAGTAACCATATCCTGTAAAATATGGTTTGCCAGACCCAAATCAGGAGCATAAGGGTCAATGGCACGCTGCATAGCGGATAACTGCTCCTCCTGTTTACAAACATGTATATTTAAGTCAGAACAGTGTACAAAACAAGCTGAGAACATGTATATTTAAGCATGTATATTTAAGCATGTATATTTAAACATGTATATTTAAGCTGTATATTTACCAGTTCCGGTGTCGAGAGCTGTGTTCCCTGGAAGGCACCCTCCTGCTGTGGCCAGTGTAAGGGGTTAATGATGATTCGACGTGTGACCCTGTGGAACCATGGCAGGTATGAGGCAGTGCAACCCTCGCCATGCATAAGTGGAGGAGATGCGAGGGCACGCTCCATGCGCGAATCCCAAAGATCAACAAATGGCTCCCTCGCGTACATCCAATCAACCTGCTCGTTGTAGTGGTCGTGCGATTTGCAAAAATAAAAACTGCAAATAAAAGTACATTTGATAAGTTCGAGGTCTTTAATATTCTCAATCCTGAGTTATGTCGACATAATAGTCGGAATCATAATCTTCATCATCATCTTCAGCATCAGCGGCCACCGAGGTATGCTTTTCATAGGTAAATCAGCATATGGCCTCCATCGAAACTGTCGGGGTGTCAACGCATCCAACTCATATTGTGTCATGCGGCTCTGCGCATGCGGCACCTGACAACGCCTAAGTGGCGCCTTCCACCTACAGTGGAAGTTGGCATAAGTGCTCAGAGGTTATACATGCAACAAATATGAATTGAAGTTAATCAACAAAAGGAGTGACAACATACCTCAGCGCCAGCGGGTACTCGAACAAGGGTTGACCCCTGTGCCTAGGCGCTAGTGACGGAAAGCGCTCGTAAATCCACACCTAGCGGCAAGGTTAGTACAAGTGCACATGATGAATAAATAATACAACAATAAAGACGAGAAATAAATATTACTTAATTTTAAATTCGAAATAATTATCTCTAACTATTTTTACAAATCTGATTTTTTTAATTTAAACTAGTAATCTAAACTAAAATTAGCACTACCACTACTAATCAACAACAATCATCACCAACTACTAATCTATTTAATTTAATGGTGTCAAGTTTACTTTTAAATTCGATTTAATTTAATTTCATTAAATTCAATAAAAGCTAAAATTAAATTGATTACTGATGATTAGGGTAGGGAGAGGAATATGGTACACCCTGCATAAAACCAAACTGCCTCGTCACCCTGTCCGTGTAGCACCACTCGACGTAGGACATGTACATCATGGGGGCGGGAGCCGTCCAACGCAAGTACACAGTGGCCTCCGGGTGATGCTCTGCAGGTAAATCAGCATATGGCCTCCATCGAAACTGTCGGGGTGTCAACGCATCCAACTCATATTGTGTCATGCGGCTCTGCGCATGCGGCACCTGACAACGCCTAAGTGGCGCCTTCCACCTACAGTGGAAGTTGGCATAAGTGCTCAGAGGTTATACATGCAACAAATATGAATTGAAGTTAATCAACAAAAGGAGTGACAACATACCTCAGCGCCAGCGGGTACTCGAACAAGGGTTGACCCCTGTGCCTAGGCGCTAGTGACGGAAAGCGCTCATAAATCCACACCTAGCGGCAAGGTTAG
TACAAGTGCACATGATGAATAAATAATACAACAATAAAGACGAGAAATAAATATTACTTAATTTTAAATTCGAAATAATTATCTCTAACTATTTTTACAAATCTGATTTTTTTAATTTAAACTAGTAATCTAAACTAAAATTAGCACTACCACTACTAATCAACAACAATCATCACCAACTACTAATCTATTTAATTTAATGGTGTCAAGTTTACTTTTAAATTCGATTTAATTTAATTTCATTAAATTCAATAAAAGCTAAAATTAAATTGATTATATTTAATCTACTCTTAACGTAAATAATACAACAATCATCACCAACTACTAATCTATTTAATTTAATGGTGTCAAGTTTACTTTTAAATTCGATTTAATTTAATTTCATTAAATTCAATAAAAGCTAAAATTAAATTGATTATATTTAATCTACTCTTAACGTAAATAATACAATAATCATCACCAACTACTAATCTAAACTAAAATTATCACTACCACTACTAATCAACAACAATCATCACCAACTACTAATCTAAACTAAAATTATCACTAACATAAGCTACTACCAAATACCAACTAACAAAACCCATTATAAATTATCAAACAAATTACTAATCAAGTCTAATTTTTAATTCATTCAAAATATGAGATCTACACTAATTTTCCCAATTTTATAATTCGAAAAAATTGTACTATATTTAGGATTTTTTTATGCAATATTTGTTATTAAATTCGAAAATTATTTTAATTAAATCAAATAATTAAAACGCTAGTGACGGAAAGCGCTCGTAAATCCACACCTAGCGGCAAGGTTAGTACAAGTGCAAATGATGAATAAATAATGCAACAATAAAGACGAGAAAGAAAGTTGTGGTTGGTTTAGTATTACCTGTACCAATGTGGCGTAGCCACAGAAATCAGTACAGTTAGCCCTGCTAGAAGAACATAGCTTCTGGTATAGGAAGCCAAGAACAGCACTACCCCAGCTATACCGACGCAGCTGGTCCATGTCCCTCATTAACCATAGAAGGTCAAGCTGCACGCGGTTCCCGCTGCTGTGGGGGAACAATGATCCAATAACGCATAGTAGGTGCGCCCGAATATGGTAGGTAACCTGTACACCATAACCTATATCCTCTGGATCCAACTGCTCCAACCGCTCACAAGACCCGAAGTTATCCACAAGCCATTTGATCTTTAAACCACCTCGGTTAACATCGTCCTTGGCTTCTGGTAATAGCCCAAGAAATTCGCCTACTAGCACGCGCCTTTCCTCCACGCTGGTACTCGCTCCACGGAGGATCAGTGGATCCACCCTCAGGTACGGGTNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN
NNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNAATTCCAAAATCGAAATAATTCAAATTAAATTCGAAAATGTGAGATTGCTTATTTTTATTCTATTTTTTAACGTAAAACACCCAAATTTAATCTACTAACCTAATTTCTAAATTTAATCTACTAACCTAATTTCTAAAATTAACATAATCTACTAACAAATACCAACTAACAACATTCATTATAAATCATCATACAAAATTACTAATCAAGCTTGTCATATAATTTGTAGCTACTAGCAACTAAGAACAATCATTATAAAATTTATAAAAATACATGCATGCAATTTGATGAGATTGAGAATGGTGGAAAAACCTTGAAAATGGGTGAAATTGATTAATTTGATCCGGTGAAAGTAGCAAAGCAAGCTCCTTTTTCCCCCCTTTTCTCTGTCCGGATCACCCTTTCTTCTAGAAATTGAAGCTTGCAATGTGTGAAAATCTGAGAAGAAGCTGTTTGCTGCGGCGAAGATGAAGAAGAAACAAAGGGGTTGGGGTTTTGAGGGGTAAAAGGGACACGTGGCCGCCCCTGACTGGGCCGGACACGTCAATGCTTCACAGGTATGTTCGCCCGTGGCAGGGGCGAACACACTTGCCTGGAGTTCTTCTGTTCGCCCGTAGCAAGATCTGGGCTTAAAAAAAAATTTCAGCTGTGTTCGCCCGAGGGGTGTATGAATTAGGGTGGTTAGAAATGTGAAGTGAAAAAAAAGGTGGTTATATTTGTAAAGCTTTTGTTCAAGGTGCCTAGTAATGTGAAGGAGCCGTGCTTCCGGTGTCTCCCAATTCCTCATCCCTTCTCCCGTTACAGATTAGGCATGGAGGCGGAATCGATAGCCAAGACAACAACTGAATTAGCTACTTCCGGAAATGGCTACCTGGCTCACCCAATTGCATATCTCCCACTGGATATGAAAGCACCAGTAACTGAATTTCATGAATTCAAATCTAGAGAAGAGGCTTATCAAAAGCTGGAAGGGCTAGTCACCGATTCTAGTTCTTCAATCCTTGGGATATACGGAATTCCAGGAACAGGAAAGACTCGATTAATGGAGCGAATCACGACAGAAGTTGGTAAGAAGGGAACCTTTGACAAGGTCGTACGAGCCAATGTGAGGAACGCGAAGTTGGATGTGATAGGCATACAACAACAGCTTGCAGGGAAGCTAGGTTGCGACTTTGAATCTGAAACTGATGTGGAACGTAGAGCTGGTCAGCTGAGATCTAGTTTAAGGCAGGGAGGTAAGGTACTCGTCATACTAGACGACCTATGGAGTGAAAT
TCCTTTAGATAGAATCGGAATTTTGTCTGAAGATGGTATGAGTTCCAAGGGCGGTAAGATTCTGTTGACATCACGAAGTGAGGAGGTATGCAAGAGCAACAAATGCAAGCATCCAGTCAAAATACAACCTCTTACATTTCCCGAAACTTGGGATATGTTCAGCAAAACAGTTGGTGCTGATACAATCAACTCTTTGCAGAATAGATCCCTTGCCTAGGACATCTGTAAGAGATGCGGGGGTTTACCACTAGTCGTTCTTGCTATAGGTAAAGCGCTCAAATTTAAGCGTCTTGCTTCATGGATGGATGCACTCAATCAACTTAAAAATTCCAATATTGAAGAAGTTCCTGGAATAGGTAAAGAAGAGTATGCGTGTTTAGAGTTGAGTTTTGATAACTTGGAGCACGACGATGCAAAGAAATGTCTCTTGTTGGCTTCTATGTGCCCTGAAGATGCTGACATTCCTACGAGGATGGTGGTTCAGTTAGCAAGAGGCTCCCAGCTTGTGAAGGGTGATGAAATAAAATTAAGAGTACATTCAATGATATCTATACTGCAGTCAGCCTCGTTGTCGCTTCAAGGGAAGGATGGTGATCATATCAAACTACATGACATCATAAGGGACATGGCAAGATCCATTGCCAAGAAACACCACGGATTCTTATTCGCAAGAAGTAGGTCGTTGCCCAATGATTCAGCTGAGTACTCTGGTCTGAAAGTTCTGCATTTAGATGTAGAGGAGACTCATTCACGTTTTCCAAGTGATGTGGAGTGCCCAGACCTGCATCTACACTGTCACTACATTCATCATCATCTACATATATTGACCCAACACCGATGCAGGTATTCATAGACTGTTTTACATATTCACTCAATTGATGATAACTATGATGATTAGTGTTATAGAACGTAAATTGGGACCTTGTAGCACTTTTAAGCGGTTGAGTGAACGTTTAAGTAGAATTTTGAGGCGCTCAATAGCGGATCAATAATATATAATTAAATATTTAATTGCAATATTAATTTAGTTAAAACTAAAGTTATCTATTGGTTAGAATTTAAATTTATAATATTTTTTATAATATATATATATATATATTTTTAATTTTTAATATGACTATAGTTATATTGTAAAAATTATTTTAAAATTAAAAAATTAACAAGTCAACATCATTTTGACCGCTTAATGATCGTTTAATCAATTTATTGTCCGCTTAATTTTCAAAACCACGTAATCACTTTCATACAAAAAATTAGGCGGCCTCTTAATGTGACACAACTGACGATAAAATAAAAATAAATGATTTTTACGGTTCATCAATCAATGCTATCGTCTAGTAATATTAGCTGTATCAATATTTTATAATTGTTATAATATAATTATATATAATTTTACTAAAATATAATATAAACAATAAGTTATAAATCAAGTCATGTTTTAGTGGAATTGTATAATATCAAAAATTAAATATATTTTTGAGTGTATAATTTTAAATATGAACTAAAAATAAAATAATATGTGATACATAATATTTGAATCGGTTTAGTTGTTTATATTAAAAAATTTATTTATTTTAATCATGATCAATTATCAGGTTAAATAATATATATCTGCTACTTAATATATCAATAAAATTAATTTTATACAAAAAAATAATTATTGAAAAAGTATTTCAGTTAAAGAAAAGATTTTATCTTGTACAAATCCCTCTAAATTAAGTTACATACGAACTAAACACAAAATATTAAATCTTGTAATATTTATTTATAAAATATTAAAGTTATAAATAAAGAGTGCCAGTTAATATTTATTTATAAAATATTAAAGTTATAAACCGTATAGAATTGATTGGGACGGAGGGAGTATGAATTAGACTTGTTCATTGAATGACCGTTCAAGGATTAATCAAATAATTGAATCATTAATCAGAACTAATTAAATATTATTTATAAAATTATATATAATTTGGAAGTTAAAATTTAATAAAATAACTTAAATT
TATATAGGATAAGTTTTTTTTATTATATATACAATTATCATCAAGAAAATTGACCAAAAATAAAAAAAATTTAACAAAATCATATATGTATATTTAAGCTTATTTAAATTAAATTAATTTTAAAATTTCAATTTTTTATTTATAATTGATCAACTTTTGATCAATCAGATTTTTTAAAAATTATTTTTCGACACGATTACTCAATTCAATCAAGACAGAATCGGTCAATTAAACATCAACTCTAGAAGTTTAAAGGAACGCCTCCAACACACAACTATATTTTCCACATTCACTTTTATGATTTTTTTTATATGTCACTTTTGACTTGTGTATCTAGGTGTATTGACTTGATAGTAAAAAATTATTATTTTTAATTGATTCTTTTTTGAATTAAAATTTTGATTACGTATTTTTTTTCAAAAAAGAAAATTTCAAAAATAATATTTTTAATTCTCCGGTCAAAATACTTAAAAGTGTGTGCTAAAAAATTAAACGTCATATATTAAAAAACATAGGGAGTATATTCATAATGTGTTGTTCAAACGATATTCATCCTCGTCCTTTTTATAAGTCACTTGGACTTTTTACACATAATTTTATATTTTTACCACTTATTTAAAATTATCTTTTCTAATTTTTTTCTTAATTAAAATATGAAACTTATACTTTTATTAAAAAAATTAAAAAATATTAATTCGAAGTATGTGGTCAAAATCAAAAAAGAAAAGAAGTCAAAGTGACTTATATATAAAATTAGGAGGAGTACATGTAAATAAAAAAAAAATAAAAATCACAATTCTTTACAAAAATTTCAGGAATGGATTGGTCAAGGTCAGCAGCTATTTGCAAATCTCAGGTTCTTGGTGCTTGTGGAGTTTAGTTGGCCGGAGAAGTTCTCTCTTGAATCCTTAGACAATCTTAAAACTCTTTGGTTCATCACATGTGACCTTGTCCATTTTGGGAAGAGCGAAGTTGGATTGCTTCCGAAAAAAACTAGAAAATCTTTGTTTTTGGGATTGTGATTTTTCAAAAGAGCTGAATTTAGCAAAACTAAATCATCTTCGCAAGTTAGAGATCTATATCAACACGAGACCTTGGTTGTGGGAAGATAAAATCATTGTGAAGCAGAATACAATATCAAGACTATCCGATCTAGAAGAATTAAGTTTCCCACTGAATTCTACATCCGTGAAGAATGTGCAGAAGATGGATCATTGCCGATATTAGACGAGGTCTGTAAATTGTCACGCTTGACAAGTTTAAATATTTGTTCCCGAGAATCCAAGTCAGGTAAACTTGCAACTATATTTTGCAACTTACGTGAATTCCATTTGTTTGTTGGTAAAAGACCAGATTTTTGGTCTCCGGGAGTGTCTTCGAGGACCAATTCAATTACATTGTCCAACCACGATCTCATAGAACACTACAAGCCTCTGTTTGAAAAGGCTGAAGAGGTGATATTGTGTGGTACTAACTTCACAGGGAGTAGCATTGATATTAGAGACACTAAAGAATTTATCAACTTGAAGTACATGAAGATTCAGGATTGCCGGTTCATTGAGTATTTGGCTAGGATGTCACCGGGTAATAAGATTGGTGGAAGTCTTCCCCAGTCAATACCTTTTTCTAACCTTACCAAATTGAAAATCAATAATTGTCACAGCTTAAAATACCTCTTCTGCAACTCTGTTGCAAGATGTCTTAACAAAGTGCAAAAGCTCAAGATAGAGAATTGTCATATGATGGAAGAAGTCGTGCTCGGAGAAGGCACAAGTGATGGAAATATGAGTATGCCCGAATTACGAAAAATGACCTTAATTGATCTGCCAAGACTCATACATTTTTACAAGGATAACACTTTCTCCGGGCAAATTCAACCTCTCTTTAATCAAACGGTATGCTTGCTTAACCCTTAAATATGTTATAATTGTATTCAAGCGAAATTAGTAAATTATATTTTCAAATATTTAAGCTACATTTATTTCATTAAAAATAAATCA
TTTTGTTTACTTCATTGAGGCAATATATTTGTTTTCTAGGGATTAAAGTTCAAATTGTCCACCTCAAATATTAGTAATTGCCCATTCTTGATATTTATATAATTTTCATAAACATATGAAATCATTGGCTTAATTAACTTTCTACTAAGCTACATATGAAATATTAGTAATTGTAAATATTGTACAAAATTGGGATAGGGCCACTGTGTACAAAACATGTGAGAAAATATGATTCCCTCCCCTTCGAAAATATCTACTTTCTTATATAGACTAGTACTCTCTGCACAGAGATGAGTACTGGAGTATATACTCTCAGGAGTTATACTTATACATGGCACTTGGAGTGAGTTAGAAATAAGAACCGAACCAAATACCCCTTTCTCTGATGGTATGTTTTGGTTGACTATTTGAGCAGGTTGAATTCCCTTTATTGGAAGAGTTGGATATTAGTGGTCTGGAAGATATAACTGATATTTGGGGAGATAATAATGGCAATGCCTTCTCCTTTTTCGAGCTTAAGAAGTTGAATGTATGGAACTGTAATAAGCTTAAAAATGTGATCCCACCTGCCAAGTTGCCTAGTTCACTCACCTCTGAAGTTGACACTCTTGGAAGCAACACAGATTCGGTCGCTGGCAGAGCTTCTGAAGGACAAGTGAAGGCCATGAATTCTCATAATCCAAACAAAAAATTACAAATTTTTTTGAAGAAAACTGTGCTTGTGTCGAAATCTGTATGCAGGAGGACCCCGACGATAACAGAAGAAAATTTGAATGATCCCTCTGATATTTTAGTTCAAGTTCCGTCACAGAACACAAGGGTATGTCCATTGGTTGAAATGAGTTTACAGAAATTGCCTTGTTTGGAAAAGACAGGGTTGAACTTTGAGGATCCATCTGGAGTAGTGAGTACTTACCCATATCTTGAAAAATTAAATATATGTGAATGCAACAGATTGGAAAACGTGTTCATATCTTCTCGTGATGCAAATTTTAAGAATCTTGAGGACATGTCCGTCACTAATTGCATTATAATGAGAGAGATAATCGGGGCAGGTGACCAAAAAATTGCCAATGGCATTGTGTTCCCTAAGTTATGTTCTGTTAAACTAACGGAGTTGTTAAGTTTGACCAGTTTTTGGGGGTACCCGAGTGAAGAAGCTAACAGCCACAAGGTATATTTACATTTACTGCCAAATGAGTAACATTGATAACATGCATTTGTTTGTGTGCTTGAGTATATATATAAATGCTTAATTCTCTTATGTATGGCTGATAAAACGCGATATTCAGGACCTGATTTTCATGTATATATACTTAAAATCTTCATCTAGTTAGAGCTCCTGTTTGCTGTAAAAGTTTTTAGGTAAAGATTTTCTAAAGTTAGGCATATGCATTATCATAAAGAATGACATTGTTTTGTGTAGGTTGAATTCCCAAATTTGAAGAGTTTTGAACTCAGCTGTGGCAAAATTACTAGCTTGGAAATGATAGAGTTTGGCAGCAGAGATGGCTCTATTTTTCGGCTGGAGAAGTTAGATATAAGTTGTGATGAGGAGATACAAATTCCCAACCAATGGCTACCTCATTTGAATAATCTGGAAAGATTGTCACTGAGACGCTGTTGGTCAGATGAGCTGAAATCTCTACATTTCGCAAAATTGAAGGTGCTCTTACTTCAAGAACTTAGTTGCTCAACTATTTTCTCATTCCCAGACTTTGAAAGACTTCAACAGCTCCGAGGATTAGTGATAACAAAATGTAATTCATTGGAAGCTATTGTGGAGGTTGTTGAGGGTGAAGAAGCTTCTGACATGGATACGGAGACTGTTGCACTAGTTCAGCTGGAATCAGTCCATCTTGAGGGTTTGCCAAAACTCAAAAGTTTTATGCACACAAAGCCTAAGAATCTTATCCCCAGTTTAGAGCATGTGGAAGTGGAGCCCTCCATTCTTTTCATGTGCCCTGTCTTTGGAAATTTCCAACAGCTCAAAAGGTTAC
AAGTGATTGATTGCAGATTGTTGGAAGGCATTGTGGAGGTTGCAAGAGGCTATGAGACGGATGACAGGATTATCACATTCCCTAAACTCTCTGACATTCATCTTAGAGATTTGCCAAACCTCCAAAATTTCAGTCCCACTACAAGCTATAGTTTCAACATGCCCAAATTATTTCATTTTCATATGTTTCGTTGTCCCCGGGTTGAGAATAAACCCTTATTACAAATAATCGCACAACGGGTACTTGTTTATTCCGATGAGCATCCACAAGGGATTGTCATTCTAAACCTCAACGAGTACACAAGAAGAATAAAAAACCTCGAAAGCGTCGGGGAATCAAGTAACAGCCATCAGGATGTGGAGATGGAAACCATAACAGTTGCAGAAGAGGAAGACAGAGTTGTTGAACAAGAGGCAGAGGTAGTTGTTGTAGGAGAAGAAAGAGGAATAGAGGAAGATTCGTAATTCAATTGTTTTTCATCAACTCAGCTTTCTTTTCCTTTCTTTCTCAAATGTCTCAGACTGTGCATTGTTTTGTATTTGTTTTTCAAGGAAATCTGACGCTGAATTGTGAGATGTGAAAAGTGTCAAGCTCTTAGCTATTTGAATTACAAGATCAACAGACAGGCCTTGTCTTGGAGGTTCTTCGACTCAAGTAACACATTCTTCGTTACTACTTTATTCACATAAGTCATTACTTTTTTTATCTTTTGATAGCAACATATAAATCACTGGATAGGTTTGTCATTAGGTTAGGTTCTGCGTTTTTAACAGGTATGACAGATTTAACAGGTTAGGCTTATTTCCAGATTTCCTCCCTTGCAACTTTTTTAGGCCTCCCTGAAAAGTTACGGTCCGAAATGTGTACTTACTTACTTTGTTGATGTCTCGATATAAGAATCAAGAAAGTAAGGAACAGAAACTGAGCTCCGAAAAAATATTCAATGATGAATGCAAGACATTCTACTTTGCGGGTAAGGAAACGAATGCTAAACAATCTTGTGTCTGTGGAGAGAGTTCATCTCCAAGTGCTGATAATTTAACCGACTTAAAGATTGTAAGTCATATTTTCATTTCATACTGCTTTTTTTAAATTTGTTGTTTTCATAGAATTAACGACCTTTTTGAACTTCTAAAATTAACTAGAAGTGATAAATCTAAATGGATATCCTTGCATTCAACATTGGGAGAGTGATAATTAGTAATACCCGAGTGGATAAAATGCCTGAATTGTGTGTGTTTGTTGGCAGATAAACATGATTCTGAATGAAACACTTCGACTCTACCCACCAGATGTGATGCTAACGAGGGAGACGAATAGAACTGTAAAGCTAGGCAACCTCCAAATTCCAGCTGAAACGCAGCTCTATTTGCCTATGACTGCAATTCATCATGACACTGACATATGGGGAGCAGATGCAAAAGAGTTCAATCCTATATGTCCATGCTCCAAGGCAGTTGATGACCATGCAACCTCAATTTGGGGCACAAATACTTTTTACTAGAATTCCCTGAGTGAAGCCTATAAAACAGACCAGATTATTGTTTTCGACTAATACTTTTGTCTTGTAGAATATTATGACAGGTCAGCTCAATATGTATGTATAACACAATATGAGTGGCAACAAGCCTTCTAATTATATATTTCAAGATTTTTTAAAATGCGAGTTTGAACGGTCTTCTACCAAAGGCACAGGAAAAACGAACCTAAAAAGTCGATCTTCATTTATATTTTGACCATGTAATGTTGATCTTACAAACTTTGTCAGATCATGTGTTGTTGGATTGAGGTCTAGTACGGTGGTCATCACTAAAATTTACTTTAAAGAGAGATTTTAAAGAATTCATCTGTTCCCCAATGAACTCTGGAAAACCCCTGCCGGGATTCTGTTATATTTATTGTTGATGAACAAATCTTTGTTCTTTTGTACTTGAGGGTTAAATTTTATGCGGTGTTTTAGTATGATATCGGTCCTGGTTCTATGGAGTTGGCGGAAATTT
CTTATCTTTTTGGATCTATAGGGACTCAGCGCTTGTTGGTGACACTCTTTATTCTATGGTCTGTGGAAGTTACTCACATTGAAGATGGAGGTATGAGATCAGTGTTAAATGGAGGTTGTTTGATACGGTTCGAATGCATAGAGAATAGGCCCATAAATGTCAACAAAAACAGTGACTCCACGTCCACGAGACGGAAGTTCCTGACTATGAAAAATTGATTTTTTTCCCTTTTTCTATAAATCTTTGTGAAGGTGGGGAATCTCTTTTTACTTAAAAAAATACGGTTGTTTTATGGTGGGCACACACTAAACACTAATTTTTATGATTTTGGTGCATTCTTATTGGTCATGTAATCATAAATATGAATGCCTCCTACATTTACACCAAATCCACCAATTAAAATCCACTAAACTCATCAAATTTAGTGCTTAATGTGTGCTCTTGGACACACACTAGAAAGATCCCAAAAAAATATACTCCCTCCGTCTCGTTAAACTTTTCCTGTTTCAAATGTTGGGACTGTTCATAACATGAGACAAATTATTAATTTACGTCTAATCTATAAGACTAAATATAGTCATGAGTGATCTTGTTGGATTCGTATTTACGAGTACTTTAATACAGTGAAATTTTTATATTTAATGCTAATACGAAATTAAAGATATTAACGATTAAAAATGTGCGTTGGCAAACGTGTCCGGTCAAAACAGGAAAAGTATTTAGAGACGGAGGGAGTACAAAGTTGGTTTGGATGTTTGGCGATACCGCCGCGAAGCACGACCTTGACAATTAGTTTATTATAACATAAAGATTCTAATATTATTATAGAAATGATACTCCAATGCTAAATATGCTTTTCATCTTATAAACACTATAAATTATTAATCCTTTTTAATTTATAGTAAAGTAGCTGTATAATGTATAAAATAATTACTAATGATTCGAAAGGCACTAATAATTCTAAAGGCGCCCGCCATAGTTGAACTGCCCACTTTAGTCCAGAGAGCATTCAACAAACAATACACCAATGCATTGAATAAACTCAGCCGGCTGATTCCTTTTTCTTAACCTTTAGAATTATTAGTGGTTTTTGAATCATTAGTAATTATTTTATAAAAGACACCCACCCACTAATGACCAATCAAATACAAAAGACGCCAACTAATCTTCCACTAATGTCAGTTTACCAACCCGGGAGCATCTTCTGCTTATTTCCTGTCATCTAAAAAAAAAAAATATTTTCATAATTCTAAAATATAAAAACTAGGAATTAATGATCAGAACAATTATATTGAATAATTATTTAGTTTTACGAAGTTTCCTATCAGTCTAATCGCAATCTCCTTCCCTTGATAACTGTTATCGTCTCCCATTATCATTAACTTCAGCCTAGAAACTGGAAAATAAAATATTAATGATTATTCAATTCTATTCCAGCCTCTATCCTAATTTTACATACAGATTTTATAGTGTGTGCTGAGCACATATTAAAATCCACTTTTTAATTAGGTGTTGTATATTGACTCGCATCCCTTTAACAATGATGGTCATCTTCCTCTTAATTAAAAAGTGTACCGACCCTTTTCCATACTCCTTCCGTCCTATTTGATTGTATACAGTTTCTTTTTTGGATGTCCCATCAATTGTATACATTCCAAAAATGGTAAATTTTTATAATATAAAAAACTTAACTACACTCACTGCCTTCTTCCACTACACCCGCTTTATACATTAAAAATTAGTAGGTTCCACCATTTTACTAACCCTACACTTATTTTACACATTAAATATTAATGGGTCCCACTATTTCATCCACTTTTCTTACTTTCGTGCCACTTCCCATACGTATACTAATTACTGGGACGGAGGGAGTATAACTCTTGTTAATAAGCCAGGCATACGCAAGGGTCATACGTACCTAACCTTGCTATCTACTCCAATATTCTCAGTCTAAAGACTCCAAACGGAACCTTTCAAACATAAACTGTTACATACAGATA
TAATATATATTTGATCATAGTTAAAAATTCTAAACGCTACTGGTGAGTGGTGATTGGAGAACTTGTACGATAAATACTGCACACTAAGGGAGAATTCTGAAATTCTTTTTCCCACTCATCTTATTGTCTGATCATCAACTCGCTTCTAGCTTTCCTCGCTATATTATTGCCGCCCAGCTCTTTTCTACTTCTCTCTTGTTAGTCATTGTTGAAGTTTAAGCAATTTCATCAGCATCTTTCCTCTCTTTTCACCATAAAAAAAATTTGAAAAAATCATGATAGATCTGAATTCCATTCCATTTGTAGGACCGTTGGTAGCTAAAATTTCCGACAAGACAATAGAAGCACTGTTCCGACATGTAGAATATATGTTCCGTTACAAGGGTCTTGTTAAGGATCTGAAATCTGAAAATGATAAACTTCTGGCTGAGGAGACGAAGATGTCCAGAAAAGCTGAGCAAGAAAGTAACAATGGTAGAATACTGGAGAAGTATGTGGTGGAGTGGCAGAAAGAAGTCCAAGAAGAGCAGGAGAAAGTCACGAGGTGTTTGCAAGAAAATGAGAAGCTAAAGAGCCAACAGCAAAACTGTCCTCGCTACATCCGCTATATCCCACTTCCTCATCCCATCTCTCGTTATAGATTAGGCAAGGAGGCGGCCAAGGTGGCCAAGAGCACAACTGAGCTTACTGCAACCGGAAGTCACCACCTGGCAAGTCAAATTGCATATCTTCCTCTGGATATGAATGTACCTGTAACTGCATTTCAAGAGTTCAAATCTAGAGAAAAGGCTTATGAAAAGCTGGAGGAGCTAGTGACAGATGGAAGCTCTTCAATCCTTGGGATATATGGAATTGGAGGAGCCGGGAAGACTCGATTAATGGAGCGAATCACCACAGAAGCTGGTAAGAAGGGAACCTTTAACAAGGTCGTCCGAGCCAATGTGGGGAATGAGAAATTGGAGAACAAGACCATCATAAGCATACAAAACCAGATTGCAGGTAATTTAGGTTGCGTTTTTGAACGTCAAGATGATGTGGGACATAGAGCTGGTCAGCTGAGATCTAGTTTAAAGCAGGGGGGTAAGATACTCATCATCTTAGATGATGTATGGAGTAGGATACCTTTAGGTACTATCGGAATCATGTCTGCAGATGGTATGAGTTCCAAAGGAGGTAAGATTCTTTTGACGACACGAGATCACGAGGTATGCCAGCGTAACGACTGCGGGGATCTAGTCAAAGTAGAACCTCTTACACCTGCCGAAGCTTGGGATATGTTCAGTGAAACAGTTGGTGCTAAGATAATCGACTCTCTGCAGAATATATCCGTTGCCGAAGACATCTGTAAGAGATGCGGGGGTTTACCACTAGTCATTCTTGCTGTAGGTAACGCCCTCAAATTTAAGCCTCTTGATTCATGGAAGGATGCACGCAATCAACTTAAATTTTTCAAAATTCAAGAACTTCCTGGAATAAGCAAAGACGTGTATGCGTGTTTAAAGTGGAGTTTTGATAACTTGGTGGACGATGCGAAGGCATGTCTCTTGTTGGCTTCTATATTCCCTGAAGATGCTCACATTTATGTTAGCGAGTTGGTTGAGTTAGCAAGAGGCTCCCAGCTTATAAAGGCTGATGATATAAGAACAAGAGTATATTCAATGATTTATATTCTCAAGTCAGCCTCGTTGGTGCTTCAAGTCCGTTGGGGTATTATTGAACGTATCAAACTACATGACATAATAAGGGACATGGCAAGATCCATTGCTACCAAAGACTACGCATTCTTATTCGCAACAAGTAGCTCGTTGCCCAAGCATCCTGCTGATTACTCCGGTCTGAAAGTTCTGCATATAGATGTCGAGGAGGAGACTAGTCTACGTTTTCCAAGTAATGTAAAGTGCCCAGAACTGCATACACTGTCGCTATATTCATCATCATGGACATCATCATGGAAAACACCACGTACACTGATACAGCAGGTATTCAAAAACTGTTTTACA
TATTCGCTCAATTTTTGATTTATGATAACTATATATCTGATGATAGAATAAAAATAAGTGATTTGACGACAGATAAGTTTAAACGATATGAATTGTTATGAAACAGGATTTATGAGTCACATTTCATTAATTAATGCTATCGTCTAATATAAGCGTTATTTAACTTTTATAATTATTATATTATAATTGCTATAAAATTTTACTAAATTCTGATGTAAATAATAAATTAAATATTGAGTCATACATTAATCAAGATTGTGGAATTGTATAATATCAAAAATTAATTATATTTTAGGTGTCTAATTTTTAATATAAATTAAATTAAGTAATATGTGATTTATAATACATGAACCCGATCCACTTGTTTATTCTAATGAAAAAATATTTATTTTGATCTTGATTAATTAACGAGATAAATAAAAATATATACTAATTTAAATATATTAATTAAATTAATTTTTTTATTTATGCTAAAAGATTAATTATTTAAAAAGTATTCCAGTTAAAGGGAAAATTTTATTCTTGTACAAATACCTTTAAAATAAAGTTACATATGAACTAAATACAAAATATTAAAGTCTATAATATATATTTAAAATATGAAAATTATAAGTAAATATTAAAAATTTGTACAGGGAAATACTCAGTTTAAAAGGAAGGCCTCCAACAATTGACAAAGGCCAGGTATTTTGGACATTCTCAAACATACTCGTATGATGTTTTTTGAACAAAAAGAACAATCTTATAATAACATATTATTAGACAGTGTTATTTGATTTGAAAATTATATATGATTGAATTTTTGGAATGATATATATTTAATATCCCGTGAAAACTTCTCACTGTTAATATTGTTGTACTGATTTTTACAAAGATGACTTATAATACATATCATAAAAAAGTTTAGTTTGATAACTAAAAAATTTATGAATTTTTTATAGTCTTCTACTATAAATTTGAAATCTTTTATATTTATTTTCGATTATCGGATAACTCTCTCTCGTAGGCTTTTGTTTATCAATGTTTCTAGATTTCTTAATCATTCTCTCACAGTAGTATGGATCGATGATTATGTATTTTATATGTATTATAGTTTTAAAAATTTTGTTTAGCCAAATCTTTAATTTATCCTCAGTTTTCATGGTACCTCTGTGCATGAGGTATTTACCTCAAAACAAATTTGATTAAAAATAGATCTAATTTTATTGTTTGGTTCAAATAGGTATTTTAAATTGTTTATTTTGCATATAGCTAAGTTTAGAGTGTTGTTTATAATTGGGTGCCGGCCCACTCTAAATTTATTTATATTATACATATTCTACATCCTCTTTTATATCAAATTGTGCATGTCTTTTATTATTTCAATTCACCAACTATCGGATAATTTAATACAAAGTAGATGTAAGGGAATGCATAAATCACCACCCTTGTTATTTTTATAAGAAAATAATACAAAAAATAAATATGATTACTCTAATGTTAAATTTGAAGAACATGTACGAGTTCTTTAAAATTTAGTTGTTGTATTTAAGAGCATTCACATCCGGACCCAACCCTCAATCCCAAAAATTTACTAAAAATATTAATTCCTCAAAAAAATTACAAATTTTTAAAAGTTTCTTACATCCCATTCCCTATATTCAATCCCTATTCTCATAGAAGTATAAGATAAGAATTGATATTTAATAAAATTATAATGAAATGATAATGAAATGGAGGATGAATAATGTATGAGGTACAAATAGTGAAACTCCAAATATGGGGATTTATTTCTAGTCCCAAAACCAAACCTTATTTTGGGATCTGAATGTAGACTACGTTTTTACAAAAAATAGTAGATTTCTTTAAAATAAATTATGGAGATGCGGTTGGCTTTGGGGGTTAGGGATGTGAATGCTTGATATGATTGATCCAAAATTTTGTTGTGGAATAATTGATATGGTTGATCCAAAATTTAGTTTTGGAATGATTGATATGATGATTGCTCCAAAATTTAGTTT
TGAAAAAATTAGTACTATTGATTTAAAATTTAGATATTAGCTTTAATTGATTAAAAATGAATTAAATTTAACCGGAAGTTAGTTAAACTCAATAAAAGACAAGATCCAACCAATAAATTTGATTGGTCTAAAATTTAATTATGATAGTTTAAAATTATTTCAAAAATGGGTCTAAAATTTAGGTGTGAAGATTAAAAATAAATCAAAATTCACGGTTATATATCTCAAAAGATGAAGACTTAACATTATTGATCTAAATTTAACCGTCATATCAAATTATCTCAAAAATCACTAATCGGTTAAGTCAATGATTCAGGAGACTCGTGTCTTTGTAATTATCTTCCTATAATTTTGATATGAATAAAATGATTATTTATTCTTTTTTTAAGCAACATATACAACACATAACACATTTCATCCTTATTATTGGTTAGCTTCCTGAAAAAGCGAATCAGCGTGATCTTTGCAAATATGATAACTACACAGTTATAATATTTGTTCGTAAAATTTATACCTTTAAACATTTGATTAGACGTATATGTGAGGTAGAGTTACCTATCAATCCTTATATTTGTTCCCATATTATTATTTTAATAATAAATTTGAGAGACAAAATAGAAAATAGACAAAGACCAAGAAAGAAGAGGAGAGATGAATTTTTTATTCATAAATATTAAATATGTAATGACCAATAATTATTTAAAAATAGATAATGGATACCGTATCTAAATATGAGTTTAAGAACTTATTTAACTAATCTATTGGACTCTTTAAGATCTCATCCTCTTCTGTAAGGCCATAAGTAGTCATATTTGTCAAAGAAAATAAAAAAGCTGTTATTTTGAAAATTCTAATTATGTCTGCACTTGATGCATGTTATATGCTGGTGAAATAAAACACAAAAAATAACGATTCTTGCTTAAATTTCAGGACTGGATCAACGGTAAAATATTTACAAATCTCATATTTCTGGTGCTTGTGGGGTTTTCCTGGCCAAAGAAATTGTCTCTCAAATCATTGGGTGAACTTAAAACGCTTTGGTTCGACAATTGTGACCTAGAGTTCTTTGGTGAGACGGATGTTAAAATTCTTCCAGAGGGACTGGAAAATCTTTGTATTTGGGGGTCTCGTATGCCAAAACAGTTGAATGTACCAGAACTGAGCCATCTTCGAAAGCTAGACATCTATTCCAGTTCCGGAGGTAGATTATGTATGGTGCCAAATACCATATCAAGACTATCCACTTTAGAAGAATTACGTTTGCCATCTAATTTCTACATCAATGAAGAATGTGCAGAAGGTGGATCATTGTCGGTATTGGACGAGATTAGTGAATTGCCACTGACAAGTTTACATATTCGTTCCCGAGTATCCAAGTCAAGTAAACTTGCAACTATGTTTTCCAACTTACGTGAATTCCATTTGTTTGTTGGTGAGCCGCCGGCTAATAATCGGTCTATGAATCTGTCACCTGTTTCAGTGACGAAGTCAATTAAGTTGGTCAACCACGATCTTGTAGAGGGCTACCAGACTCTATTTCAGAAGGCTGAAGAGGTGATATTGTATGAGACTGATTTCCCAGGGAGTAGCATTGGGATCAGAGACACTAAAGAATTTATCAACTTAAGGTACATGCAAATTGAAAATTGCAAGGCCATGGAGTATCTAGCAAGGATTTCATCACCACAGGGTGAGATTCAGGAAAGTCTTCAGCGATCAACACCTTTTTCTAACCTGATCAAATTGGAAATTAAGTGTTGTCTCAGCCTAAAATACCTCTTCTGCGACTCTATTGCAAGATGTCTCCTCCTACTGGAAGAGCTCCACATAAGGGACTGTCCTTTAATGGAAGAAGTTGTACGTGAGGAGGGCAAAAGTGATGGAAATATCATTAACATGTCCAAATTACGAAAAATGAGCTTAATTAAATTGCCAAGACTCGTACATTTTTACAAGGACAAGATTCCCTATGCGCAAATTCAACCTCTGTTTGACAGAAT
GGTATGCTTTGCTTACCCCTCATCAATCATCATCATCATATTAATAATATTACTTACACTGTGTAATGATTTCAGGCAAAGTCAATAAACTATTTTGCACATAATTGATTCTTTTTGGTTACTTCTTTATGTCAATATATTTGTTTTAAGGGATTAAAGTTCGGAACTTGTAATCTTTACATTGTATCATGTACTCTCACAAGTAATAATGGCACTTGGAGTAAACTTTGGAAATAAGAACCTAAACAAACACCCTCGGAACTTGTAATCTTTACATTGTATCATGTACTCTCACAAGTAATAATGGCACTTGGAGTAAACTTTGGAAATAAGAACCTAAACAAACACCCGTCACGTATAAAAAAATATGTTTACGCTGTTCATGTAATATAATTTTAAGATTTTTAATACAGTAGTAACTTTTTATTACAAGTAGCACTTGGTTACAGTGTCCTTTCTGTTCTCTGATGGTATGCCTTTCACTGACTATTTGAGCAGGTTGCATTCCCTTCCTTGGAAATGTTGGATATCAGTGGTTTGGAAGACATAACTGACATTTGGGGAGATAATCATGACAATGCTTCCTCCTTTTCCCAACTGAAGACCCTGAAAGTAAAATTCTGTAATAAGCTTAAAAATGTGATCCCACCTGCCACGTTGCGTAGTTCACTCACCTCTGAAGTTGACACTCATGGAAGCCACACAGATTTGGTTACTGGCAGAGCTCCCGAAGGACTTGTGAAGGCCGTGGTTTCTCATAATCCATACAAAAAATTACAAATTTTTTTGAAGAAAACTGTACGTGCGTCGAGATCTGTATGCAGGAGGACCCCCACAATAACAGAAGAAAATTTGAATGATCCCTCTGATATTTCAGTTCAAGTTCCGTCCCAAAACACAAAGGTATGTCCATTGGTTCAAATGAGTCTAGAATGGTTGCCTTGTTTGGAAAAGACAGGGTTGAACTTTGAGGACCAATCCGGAGCAGTGAGTTTGTACCCGGATCTTAAAAAGTTAAATATAAATATATGCGAAAGATTGGAAAACGTGTCCATCATACCTTGTACCAACGGACATTTGATGAACCTTGAGGAAATGTCCGTGAGGCAATGCATTACGATGAGAGAGATAATTGGGGCAGGACCGGCAGGTAAACACAAAATGGCCAATGGCATTGTGTTCCATAAGTTGTGTTCTCTTCAACTAAGTGACTTGCCAAGTTTGACCAGTTTTTGGGGGGAGGCCAGTGGGGAAGCCAACAGCCACAAGGTATATTTATATTTAATTGCCAAATGAAAAAAATTTAAGATTCATAACATGCATCTGTTTTTTTTTTCGCGCGAGAGTGAGAGTATAGATCTATTATTGCTTTTATATCAAACTGACCACTCGTTTCGTCAAAATTTCTCACTTGACCCATCCATTTAATTTCAAACTCAAGCCACTATAAACCAAATACTATATATATTATTTTACCCACATTATTATTCATATTTCTTCACTTAATCATTTATCAAAAATCAAATGTTTGTTTTTTTTACCACAAAATCACTTCGAGTACTTTCATAATTGTCTCTAGTATATATCAAAATAATTTGGAAATTTTTAAAACAACATTACTATGTAGTTTAAAAAATATAAAGTTATAAATATATAATTATATGATCACCTTAGCTATGTTATTTTAAAAATTCCCAAATTATTTTGATAAATACTAGAGACAGTCATGAAAATACTCGAAGTTGTTTTGTAGTAAAAAAACAAACGATTGATTTTTGATAAATGATTAAGTGAAGAAATATGAATAATGATATGGGTAAAATGATATATATTTGGTTTATAATGACTTAAATGAGTCCGAAATTAAATGTGGGTCAAATGAGAAATTTTGACGAAATGAGTGGTCAGTTTGATATAAAACCCGATCTATTACTGTATCAATTTAACATTTCTGAGGTAAAGACGTTAAAGTGAGGAAGGCGCATTCACCGAGTCAGATT
GACATAATGTATGGGATTGTTTTTTGTAGGTTGAATTCCCAAACTTGAAGAAGCTTCAACTCCGTTGTGGGGAAAATACTAGCTTACTGGAAATGATAGAGTCAGGCAGAGATGGTTCTACTTTTCAGCTGGAGAACTTAGCAATAAGCTGTGGTAAGGAGATACAAATTCCTAACCGATGGCTACTTCAATTAGATAATCTGGAAAGCTTGTCACTGGAACGCTGTTGGTCAGATGAGCTGAAATCTCTACGTTTCCAGAGATTGAATAAACTCACACTTGGTCAACTTAGTTGCTCTAGTATTTTCTCATTCCCAGACTTTGAAAGACTTCA\n>URS0000AE3A4B tRNA from 1 species \nGCTCCGATCGTCTAGCCCGGTCCAGGACAATGGCCTTTCGAGCCATGAACACGGGTCCGAATCCCGTTCGGAGCA\n>URS0001D9EE47 rRNA from 1 species \nAGCGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACGAACCTTTCGGGCTTAGTGGCGGACGGGTGCGTAACACGTGGGAACGCGCCTGTAGGTTCGCAATACTTCAGGGAAACTTGTGCTAATACCGAATGTGCCCTTCGGGGGTAGGAGTTATCGCCTGTAGAGCGGCCCGCGACCGATTAGCTAGTTGGGTGGGGTAATGGCTCACCACGGCGTGGATCAGTAGCTGGTCTGAGAGAATGAGTAGCCACATTGGGACTGAGACACGGCCCACAATCCTACGGAAGGCAGGAGAGGGGGATCCAGCGCGATGGGGGACAGCCTGACGCAGCCATGCCGGGTGAATGATGAAGGTCTTAGGAAAATGAATTTCTTTAACCGGGGGCGATAATGACGGTACCCGGAGAAGAAGCACCGGCTAACTACGTG\n>URS000212D443 rRNA from 1 species \nTCAAGTGAAGAAGCGCATACGGTGGATGCCTTGGCAGTCAGAGGCGATGAAAGACGTGGTAGCCTGCGAAAAGCTTCGGGGAGTCGGCAAACAGACTGTGATCCGGAGATGTCTGAATGGGGGAACCCAGCCATCATAAGATGGTTATCTTGTACTGAATACATAGGTGCAAGAGGCGAACCAGGGGAACTGAAACATCTAAGTACCCTGAGGAAAAGAAATCAACCGAGATTCCCTTAGTAGTGGCGAGCGAACGGGGACCAGCCCTTAAGTTGTATTGAGATTAGCGGAACGTTCTGGAAAGGACGGCCATAGTGGGTGATAGCCCTGTACGCGAAAATCCCTTTGCAATGAAATCGAGTAGGACGGGGCACGAGAAACCTTGTCTGAATATGGGGGGACCATCCTCCAAGGCTAAATACTACTGACTGACCGATAGTGAACCAGTACCGTGAGGGAAAGGCGAAAAGAACCGCGGAGAGCGGAGTGAAATAGATCCTGAAACCGTATGCGTACAAGCAGTGGGAGCCCACTTTGTTGGGTGACTGCGTACCTTTTGTATAATGGGTCAGCGACTTATTTTCAGTGGCGAGCTTAACCGAATAGGGGAGGCGTAGCGAAAGCGAGTCTTAATAGGGCGTCTAGTCGCTGGGAATAGACCCGAAACCGGGCGATCTATCCATGGGCAGGTTGAAGGTTGGGTAACACTAACTGGAGGACCGAACCGACTACCGTTGAAAAGTTAGCGGATGACCTGTGGATCGGAGTGAAAGGCTAATCAAGCTCGGAGATAGCTGGTTCTCCTCGAAAGCTATTTAGGTAGCGCCTCATGTATCACTGTAGGGGGTAGAGCACTGTTTCGGCTAGGGGGTCATCCCGACTTACCAAACCGATGCAAACTCCGAATACCTACAAGTGCCGAGCATGGGAGACACACGGCGGGTGCTAACGTCCGTCGTGAAAAGGGAAACAACCCAGACCGTCAGCTAAGGTCCCAAAGTCATGGTTAAGTGGGAAACGATGTGGGAAGGCTTAGACAG
CTAGGAGGTTGGCTTAGAAGCAGCCACCCTTTAAAGAAAGCGTAATAGCTCACTAGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTCAAACCATGCACCGAAGCTACGGGTATCATCTTTTGATGATGCGGTAGAGGAGCGTTCTGTAAGCCTGTGAAGGTGAGTTGAGAAGCTTGCTGGAGGTATCAGAAGTGCGAATGCTGACATGAGTAACGACAATGGGTGTGAAAAACACCCACGCCGAAAGACCAAGGTTTCCTGCGCAACGTTAATCGACGCAGGGTTAGTCGGTCCCTAAGGCGAGGCTGAAAAGCGTAGTCGATGGAAAACAGGTTAATATTCCTGTACTTCTGGTTATTGCGATGGAGGGACGGAGAAGGCTAGGCCAGCCTGGCGTTGGTTGTCCAGGTTTAAGGTGGTAGGCTGAGATCTTAGGTAAATCCGGGATCTTAAGGCCGAGAGCTGATGACGAGTGTTCTTTTAGAACATGAAGTGGTTGATGCCATGCTTCCAAGAAAAGCTTCTAAGCTTCAGGTAACCAGGAACCGTACCCCAAACCGACACAGGTGGTTGGGTAGAGAATACCAAGGCGCTTGAGAGAACTCGGGTGAAGGAACTAGGCAAAATGGCACCGTAACTTCGGGAGAAGGTGCGCCGGTGGAGGTGAAGCATTTACTGCGTAAGCCCCTGCCGGTCGAAGATACCAGGCCGCTGCGACTGTTTATTAAAAACACAGCACTCTGCAAACACGAAAGTGGACGTATAGGGTGTGACGCCTGCCCGGTGCCGGAAGGTTAATTGATGGGGTTAGCGCAAGCGAAGCTCTTGATCGAAGCCCCGGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGCGTAACGATGGCGGCGCTGTCTCCACCCGAGACTCAGTGAAATTGAAATCGCTGTGAAGATGCAGTGTATCCGCGGCTAGACGGAAAGACCCCGTGAACCTTTACTATAGCTTTGCACTGGACTTTGAATTTGCTTGTGTAGGATAGGTGGGAGGCTTTGAAGCGTGGACGCCAGTCTGCGTGGAGCCAACCTTGAAATACCACCCTGGCAACTTTGAGGTTCTAACTCAGGTCCGTTATCCGGATCGAGGACAGTGTATGGTGGGTAGTTTGACTGGGGCGGTCTCCTCCTAAAGAGTAACGGAGGAGTACGAAGGTGCGCTCAGACCGGTCGGAAATCGGTCGTAGAGTATAAAGGCAAAAGCGCGCTTGACTGCGAGACAGACACGTCGAGCAGGTACGAAAGTAGGTCTTAGTGATCCGGTGGTTCTGTATGGAAGGGCCATCGCTCAACGGATAAAAGGTACTCCGGGGATAACAGGCTGATACCGCCCAAGAGTTCATATCGACGGCGGTGTTTGGCACCTCGATGTCGGCTCATCACATCCTGGGGCTGAAGCCGGTCCCAAGGGTATGGCTGTTCGCCATTTAAAGTGGTACGCGAGCTGGGTTTAGAACGTCGTGAGACAGTTCGGTCCCTATCTGCCGTGGACGTTTGAGATTTGAGAGGGGCTGCTCCTAGTACGAGAGGACCGGAGTGGACGAACCTCTGGTGTTCCGGTTGTCACGCCAGTGGCATTGCCGGGTAGCTATGTTCGGAAAAGATAACCGCTGAAAGCATCTAAGCGGGAAACTTGCCTCAAGATGAGATCTCACTGGAACCTTGAGTTCCCTAAAGGGCCGTCGAAGACTACGACGTTGATAGGTTGGGTGTGTAAGCGCTGTGAGGCGTTGAGCTAACCAATACTAATTGCCCGTGAGGCTTGACCAT\n>URS0001E7BB53 rRNA from 1 species 
\nGATGAACGCTGGCGGCGTGCCTAATACATGCATGTCGAGCGAACGGACGAGAAGCTTGCTTTTCTGATGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATTTTGAACCGCATGGTTCATAAGTGAAAGACGGTCTTGCTGTCACTTATAGATGGATCCGCGCTGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCATAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACATATGTGTAAGTAACTGTGCACATCTTGGCGGTACCTAATCAGAAAGCCACGGCTAACTACGTG\n>URS0001963736 lncRNA from 1 species \nGTCCAGCCTTCAGCCCGGTTCGGTTTCTAGGTTGGACCCAGGGCAACTCCAGCCGTTTCCAGACCCGGTTTCGGAAAAGAAATGATCAAATAAAGCCTCGAAAGCTCCTGAGGTAAAAGCCGCAGAGGATCTGAGCGGGACGGCCCAGCCCCTCCGGAGGCAGCGAGCGCGTGGAGGCGGTGGCTCCGGCTCAGGAAAGAGAGAAGCTAACAAGAAAAGCCACTCTTCTTGTTTCCATCTCCACAGTGGAAGAAATGCCCTCTTTTTTAGTTAAGAAAACAGAGAGTCAAAAGAAGATGGGAGACCTCTGCACACTCAATCAGGAAATTCCTGGAATACCAGACTGTTTCCATCAATGGTAGGTCATTGCTTTTATCAGCTTGTATTGCTGAAATGCAGTAAGCACTGATTACACAAGCACTAAATGCCAAGCAATGCTCATAAATCTTGGTAGGAACATGAGCTTTAGAGTTGAGGTCTCGGATTTTCTTTTTACCTTGGTACTGAGTCAAAAAGAAAGATTTTAGAATCAGGGTCTTCTTCCACCCCTAATAAAATGCTCTCTTCACTCTCTTTGTGGAGTATT\n>URS00015412A1 rRNA from 1 species \nTACGTAGGGTGCAAGCGTTATCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTTTGTCGAGTCTGTTGTGAAATCTCGAGGCTCAACCTCGGGTCTGCAGTGGGTACGGGCAGGCTGGAGTGCGGTAGGGGAGAGTGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCAGTTCGCTGGGCCGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS000242BE45 lncRNA from 1 species 
\nCTAGAGAAAAATCAGAAACAACGCCCTACTGTTCCTTCATCTTCCTCAGATTTCAACTCACCTCAACTCGCCCGAGTTCACTCAAATGGTCCCCTTCCCTCCACGTTATTTGATTCCCAACAGTTTTTGTTAGAAAGAATTCGAATATTCTCTCAAAATCGCACAATTTTGGGTACGAAAGAACGATTTGTTGGATGAATGGGAGCTGTGGATAGATGTAAGTCGATCCACGCCCTCCATTTGTCCCAAAATTGTTCAAAAAACTCGAAGATATTTGGATTTTTGGGCAGATTTTTGAGATTTTTTGAAGGCTATATATATGAGGTAAGTTCTATGTGCTAGGTTAGAGGGAGATCAGAGAAAAATCTTCAGAACTTAGCCGAGTAATTTTCTAGGGTTTTAGTTGTTATCGTCTTCAAGTCTACTTTTTCTTCAAAAATAAAACATACCAAAAAGAGCACAATGGTCTGAGTTCAATTTTTCTAGTCGAGTTTACTTTATTTTTTAGAGAAAAATAAAAAAAAAAATCACTGAGCACAGATATGTCTTAGTGCTTGTTCTTTCTTTTGAAGTTCTGTTTTTCTCAAGAGAACTTGATTTTGAAAATTCAAGTTATAGTCGAGTTTGTTTTGGAGTTCAAAATTTCGGTTAGTGGCTCAATTCAAGTTGGTTGATTCTTGTCTTCTTGTTGCTGTTCGTTTCAAGCTCTAAGCCGCGGTTTTGCTCGAGTCGATCTAGTTGCTGTAATCCCTGAAGTTTTTTGTTAATTAAAAGGTTCATCTCTTCACTCCTTCTTAATTTGTTCTGGTATTGATCAAAATGTGATGATGGCTGAGACTTTGCTAGATTGGAAGTGTTTATGAGCTGGTTCATGAGAAACCAGTCTGTGATGCAGTTTTTTTTTGTTTTCTTTCTTGGCTCCGGATACATCTCCCTTATTCTATTCGTTCTGTGTGCTCCAATTCATTCGGGTTATACCCTGTGTTGCCTTGTTATTTACTGGTGAATGGTGTATAAATTCATTTTTCTTTACCATACAGAATTCATGTCTGTTCTTGAATTGATTAAAATTTCCAAACATTGAATGCTAAGGTTGGGTATGGTCTGGATAAGCCAACAGCTTTATAAAATATGAGTGTCACACAGTTTTTAATGAAATACACTAACTTCCACAAGCAGCTTGTATTTAGTTGAGATCCACATTGTCCTTTTAAGAGATACTGTTGATGTTAGTAAGTAGTTAAGAAAAAAAACTTTTAAGTCATGAATCATGATTCTTTTAATTGCATTTGAAGCAAAAACATCAATGGTGAATAATGAAACAAAACTGGAAAGCAGAGAACAACTAGAGCAGTTAGCTTCACTGATTCTCTTTGAGCTCGAAATGTACATGTGAGAGAATGCAAAGCAATGACTACATCAGAAGAAAATTGTTCTAGAGTTAACTTTCTTTCCTTTTTGATGTATTGGCTATCTGTGTATGGTGAACGTGATATCAGGAAATGTGTGTCTTCTATCACTATTACTCCTTGTTAAGTCATATGTAATTGACTTGTTATGATATCAGTAGACTTACTTATGTTTAGACATAGTTTAAATGTTTTCTTTTGTGCTGTTTTGTTGCCTATACGGCCCTGCCATTCAAGAGAACATGGTGATTTCTTAGGCTTGCATATCACTGTTGAAATGCATCTATCTTAGTGTTTGACAAAAGAATATGTCACACATAGGATTAACAAGATGACTGAAGTTGGTTAAAATTAAGTCAAATTGAATGTTAGTTTAAAGTCATTTACCTGCTACATGCTAATATTTTTATATAACAGTGTGACGACCCGACTAGTCATCGCATGAATTACCGCCCTGTTTTTCCTATTTTTGCTTCTTTATGCTTCGTTATTCGTGTTTTATGTGGTCGAGTTGATTGGTTTGCATTTGGTGTGATTTTAGTAAGAAATGAGACACTTAGTCTCTTTTAAGAAGGCTTAAGTTGGAAAA
GTCAACTAGATGTTGACTTATGAGTTAGAGGGCTCGGATGTGAGTTCTTATGGTTCGGTTAGCTTCGGGAGGTGACTTGTGACATAGGAGTGTGATCGGAAGTGGTTTTGGAGGCCCAGTGTAGAATTAGGCTTGAATTGGCGAAGTTAGTATTTTGGCAATTTCTGGTTGATAGGTGAGATTTTGATCCGGGGATCGGAATGAAATTTCGAGAGTTACTGTAGCTTTGTTATGTCATTTGTGATGTGAGTGCAAAATGTTAGATCATTCGGACACGGTTTGGTTGGGTTTTGATCAAAAGTGTGTTTCAGAAGTTTCTAGAAAAGCTAGGCTTGAATTCGATGTGAACTGATGTATTTGGTGTTGTTTGAGGTGTTTTGATGATTAGAACAAGTTTGAATGAGGTTTTAGGATGTGTTGGTACTTTTGGTTAAGGTCCCGGGGGCCTCGGGTGGTTTCGGATGGCTAACGGGAAGTTTTGAGTCATTGGAGATTGCAGAAAATGCAGCAGCAGTTGCAGAGGATTTTTGGCCTTCGCGATCGCGTGAGGTCCCTCGCGATCACGTAGAAGGAAGTTGGGTGGCCCTGCATTTGTGCTTCGCATTAACGTCTGCTGCCTCGCATTCGCGAAGGGGCCTTGAGGTTATGCTTTGCGTCCGCGTGATGGGTATCGCGTTCTCATAGTGGAGATGGGCACGTGAAGGTCGAGGAGCTATTGCTCTTCGCGCTCGCGTAAGTGGTATCGCGTTCGCGTAGGTTCAAAGTTCCAAAGCATCGCATTCACGGGTGTGGTGCCGCATTCGTGAAGGGTTATTTGTGGTTCAAGGAAAATTGTGCATCACGAACGCGTGGGTTTGACCGCGTTCGCGAAGGAGGGATTTCCAAAACTGAACAGTGAAGTTTTTAAACATTTCCTCCGTGAGTTTTAGTCTTTTTTCCACCATAGTTGAGTATTTTGAGAGCTCTTTGAGGGGAATTGAAGAGGGATTCAAGGAGAATTGGTTGGAGGTAAGTTCTATGAACCACAAACGTGATTATATTGTGAAGTTAACCTAGAAATTCATGGAAATTTAGCTAAAAATAGAAGAACTAGGGCCTGGGATTTTGAGATTTTAAATTGGGATTTGAAGGGACATTTGAGGTCGGATTTGAGAAATTTTGATATGTATGAACTCGTGGCGAGATAAGGAACCCGTTGATGTGAAAATTTCTGAGTTTCCAGAAGTAAACCCGGGGCTCGGGTTTTGCTAATTTCGGGATTTTTGATATTTTTCGATTGTTTTCGCTTGGCCTTTTTCCCCTTAGCATATTGTGACGTATTCGCTCTGGTTTTGGTTAGATTCGATGTCCGAGAGGCTGATTTGAGAGGCAAAGGCATAGCGAGCTAGAGCTTTAGCCGGTTCGAGGTGAGTCATGAATGTAAATGATATCCTGAGTGTTTGAAACCCCAGATTTGCACATCGTAGTGCTATATTGAGGTGAGACACGCGCTTGATGATGAGAGTGGGGTCATGTACTATTGAGGATTGGGACTTGGTCCGTCCTGAGTGTTGTTTTTACCGTGCATTTTGATTGAAGCTTATTTGTTATCATCATTGTTTGGACTAATTGCCATACTTGGACTTCGTGCCAACTATTTGAACCCTTCGGGGAGTTTTATCACTATTTCCTCACTGTTTTGACTTACTACTTGAACTTACTCGTACCGTTTTCCACTGTTTTACAACTCAACCACTTTTTACTCGGTTTTGAAACTAAAATGATACATATTAAATGATATTTTGGGCTGAGAACTACTGTTTTACTAATGCCCGAGGGGCTTATATGATTTCTGGACGGAGTACGGCCAAAGGCCAGATGGGAGGATACTATGGGATCGGGCTGCGCGCTGCAACAGTGTTATACTGATATTGATACGAGGCTGAGGGCCTAGATTTGATGCCACGAGATGACTTGATATTGTGCTTGGGCCGTAAGGGGCCCCTCCCGGAGTCTGCACA
TCCCCAGTGAGCGCCGTCAACGATAAATGTATGGATCGGGTTACACGCCGTAGCAGGTACTATAGGGTACCGTTCTATGTGTTGATTTTCTTTATATGTCTGTCACCTAACTGCTTATTTGTGGTAGCATTTCCACATTTCGTTTCCATTGGTTTATTACTTTCATATTACTTATTTAAAATGCTGCATTATAGATTACTCTGTGTTTCTTCGTGATTTCTTATTCTCAGTCATTATTTATGCTTATTACTCACTGGTTCGGAGTACTCACATTACTCCCTGCACCTTGCGTGCAGATCCAGGTGCATCTGAGGCTAAGTGAGGATTTTTAGTTGAGAAGCGCATATCCGGGAGCATCGAGGTAGCTGCATGGCATCCGCAACCCTGATCTCTCCTTTCTATCCTTTTGTTTTATN\n>URS0000BE1683 snRNA from 1 species \nTAACTTACCTGGAGGGTAAGTCCAGTAGTCAACTTCGCTGGACTTATTGGGCATGATGGGGCATTGCACATCCCGTCCGGTCGTGTTCAACGAATGTCATTACGGCATCTCGGCCTTATAATTTCTGGTTTGGATTCCTCTGGCTTGCCGGGGAATCCC\n>URS000002E6E7 rRNA from 1 species \nAACGAACGCTGGCGGCGTGGATAAGACATGCAAGTCGAACGGGATTATTTTTGTAGCAATACAGAAATAATTCAGTGGCGAACGGGTGCGTAACACGTGGGCAATCTGCCGAAAAGTGGGGGATAGCTCGCCGAAAGGCGAATTAATACCGCATGTGGTGAGGGACGACATCTTCCTGAATCCAAAGCCGGGGCAACCTGGCGCTTTTTGTAGGAGCCCGCGGCCTATCAGCTTGTTGGCGGGGTAACGGCCCACCAAGGCTATGACGGGTAGCTGGTCTGAGAGGACGACCAGTCACACTGGAACTGAGACACGGTCCAGACACCTACGGGTGGCAGCAGTCGAGAATTTTTCTCAATGGGGC\n>URS0001E82C61 rRNA from 1 species \nAACGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGAGACCTTCGGGTCTAGTGGCGCACGGGTGCGTAACGCGTGGGAACCTGCCCTTAGGTTCGGAATAACTCCCCGAAAGGGGTGCTAATACCGGATAATGTCTTCGGACCAAAGATTTATCGCCTTTGGATGGGCCCGCGTTGGATTAGCCAGTTGGTAGGGTAAAAGCCTACCAAGGCGACGATCCATAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCGACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATACAGCAATGCCGCGTGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTTACCCGGGATGATAATGACAGTACCGGGAGAATAAGCTCCGGCTAACTCCGTG\n>URS0001712CA9 rRNA from 1 species 
\nAGAGTTTGATCCTGGCTCAGAACGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGCGAACGTTTCTTCGGAAACAAGTAGAGTGGCGGACGGGTGAGTAACGCGTAGGAATCTGCCTAAGGGTACGGAATAACGCCGGGAAACCGGTGCTAATACCGTATACGCCTTAAGAGGGAAAGCGCTATGTAGCGCCCTGGGATGAGCCCGCGTTAGATTAGGTAGTTGGTGAGGTAATGGCTCACCAAGCCTATGATCTATAGCTGGTTTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGAAACCCTGATCCAGCGATGCCGCGTGAGTGAAGAAGGCCCTAGGGTTGTAAAGCTCTTTCAGTAGGGAAGATGATGACGGTACCTACAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGAGTACGTAGGCGGTTTGATAAGTTGGGAGTGAAATCCCGGGGCTTAACCTCGGAATTGCTCTCAAAACTATTAGACTAGAGTATGGTAGGGGACAGTGGAATTCCCAGTGTAGAGGTGAAATTCGTAGATATTGGGAAGAACACCAGTTGCGAAGGCGGCTTACTGGTCCGGATCTGACGCTGAGATGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGGGTGCTAGGTGTTGGGTAGCTTGCTATTCAGTGCCGAAGCTAACGCGTTAAGCACCCCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGCAGAACCTTACCAGCCCTTGACATACCAATCGCGATTTCCAGAGATGGATTTCTTCAGTTCGGCTGGATTGGATACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGCCTTTAGTTGCCAGCATTTAGTTGGGCACTCTAGAGGGACTGCCGGTGATAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTACGGGTAGGGCTACACACGTGCTACAATGGCAGTGACAATGGGTTGCGATCCCGCAAGGGCTAGCTAATCCCCAAAAACTGTCTCAGTTCGGATTGTTCTCTGCAACTCGAGAGCATGAAGTTGGAATCGCTAGTAATCGTGGAACAGCATGCCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTTGGTTTTACCCGAAGGTGGTGCGCTAACCGCAAGGAGGCAGCCAACCACGGTAAGGTCAGCGACTGGGGTGAAGTCGTAACAAGGTAGCCGTAGGGGAACCTGCGGCTGGATCACCTCCTT\n>URS0000F24664 rRNA from 1 species \nTACGTAGGGGGCAAGCGTTGTCCGGAATCATTGGGCGTAAAGCGCACGTAGGCGGCTTCGCAAGTCCCATGTGAAAGCCCACGGCTTAACCGTGGAAGTGCATGGGAAACTGCAGAGCTTGAGTACTTAAGAGGATCGCGGAATTCCCGGTGTAGAGGTGAAATTCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGGCGATCTGGGAAGATACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGG\n>URS00003B973F rRNA from 1 species 
\nCGACGAGTTTGATCCTGGCTCAGATTGAACGCTGGCGGCATGCTTTACACATGCAAGTCGAACGGTAACGGGGACTTCGGTCTGCCGACGAGTGGCGAACGGGTGAGTAATATATCGGAACGTGCCCAGTAATGGGGGATAGCTCGGCGAAAGCCGGATTAATACCGCATACGCCCTGAGGGGGAAAGTGGGGGATCTTCGGACCTCACGTTATTGGAGCGGCCGATATCAGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCTGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGAGTGAAGAAGGCCTTCGGGTTGTAAAGCTCTTTCAGCCGGGAAGAAAACGCATGGGTTAATACCCTGTGTGGATGACGGTACCGGAATAAGAAGCACCGGCTAACTACGTG\n>URS00019E32A1 tRNA from 1 species \nGGATATAGTTCAGCTGGTAGAATGTGTGCCTCACATGCACAGGCCTGGGGTTCAATACCCAGCACCA\n>URS0000ED2EE6 rRNA from 3 species \nCAAAATGGTGCCGTAACTTCGGGAGAAGGCACGCTGACACGTAGGTGAAGTGATTTACTCATGGAGCTGAAGTCAGTCGAAGATACCAGCTGGCTGCAACTGTTTATTAAAAACACAGCACTGTGCAAACACGAAAGTGGACGTATACGGTGTGACGCCTGCCCGGTGCCGGAAGGTTAATTGATGGGGTCAGCGCAAGCGAAGCTCCTGATCGAAGCCCCGGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGCGTAATGATGGCCAGGCTGTCTCCACCCGAGACTCAGTGAAATTGAACTCGCTGTGAAGATGCAGTGTACCCGCGGCAAGACGGAAAGACCCCGTGAACCTTTACTATAGCTTGACACTGAACATTGAGCCTTGATGTGTAGGATAGGTGGGAGGCTTTGAAGTGTGGACGCCAGTCTGCATGGAGCCGACCTTGAAATACCACCCTTTAATGTTTGATGTTCTAACGTGGACCCGTAATCCGGGTTGCGGACAGTGTCTGGTGGGTAGTTTGACTGGGGCGGTCTCCTCCTAAAGAGTAACGGAGGAGCACGAAGGTTGGCTAATCCTGGTCGGACATCAGGAGGTTAGTGCAATGGCATAAGCCAGCTTGACTGCGAGCGTGACGGCGCGAGCAGGTGCGAAAGCAGGTCATAGTGATCCGGTGGTTCTGAATGGAAGGGCCATCGCTCAACGGATAAAAGGTACTCCGGGGATAACAGGCTGATACCGCCCAAGAGTTCATATCGACGGCGGTGTTTGGCACCTCGATGTCGGCTCATCACATCCTGGGGCTGAAGTAGGTCCCAAGGGTATGGCTGTTCGCCATTTAAAGTGGTACGCGAGCTGGGTTTAGAACGTCGTGAGACAGTTCGGTCCCTATCTGCCGTGGGCGCTGGAGAACTGAGGGGGGCTGCTCCTAGTACGAGAGGACCGGAGTGGACGCATCACTGGTGTTCGGGTTGTCATGCCAATGGCACTGCCCGGTAGCTAAATGCGGAAGAGATAAGTGCTGAAAGCATCTAAGCACGAAACTTGCCCCGA\n>URS00025C3F13 lncRNA from 1 species 
\nCTTGGGGATTTGCAGCTAATGTAAGAACCAAATGCTATTTAAAAAAAAAAATGTTTTTTAATACTTTTAAGTGTTTTTTGCACACTTTTGAAATATATTTTTACTTTATCTGCACATGCAAAGATAGGTCACGTGTAATAATGATTTCCTAATATAAATAAAGAGGGAACTAGTTAAAAAAAAAATTGAATAAGAATTCCTTGAGAAGGGGAGATGATTAGTCTGAAATGGGTCCACGTATAATGAGCAAAAACCTCCCAGGCGAGCAGCCCCAGGGCCAGAGAATGGGAGACAAGCCTTAAAGTATAGCTGTAGTTGAGACGGTCCTATTTGGGCAGGGGTGAAAAATGCTCCATCGGGAGATCTATATTCAGAAAAATCATGAGATGTATTAAGATAAACAAGACTAAAACTGAAAATATGTTAACCTATCTTTGATCATTAGTCCTTAAACAACAGAGAAGTACTTCTGTTGTCAAAAGTTCAATCAGGTCACAAGCACACCAGCTGCATTTGCTGTCAATCGTCACTGGAATGAATGATTTGAGTTTTCTGGGCCAATGAATGTTTCAGTAGAGTCGGCGAAAACTTAGATAGTCCAGAGATATGCCTAGCTTAAACACAGTGGCATCGCTAAGGGAGCCATGGTCCACCGATCATCATGCCGTGCCTCCAAGTGACGACGCTGTTTCATGGGCCGGCCTTAGGGTTGAGCTCACACAGCTACCCGGTGGAAGATTTCATTATTCTCCACCCGGGATTATTAAAAAACCCAAAACATTGTGACAGGGGCGGTGCATACCAGGAAGCAGAGGTGTGGCTAAAAG\n>URS0000978C1D SRP_RNA from 2 species \nGCTGGGCATGGTGGCGCATGCCTGTAATCCCAGTTACTCTGGAGGCTGAGGCAAGAGAATCGCTTGAACCCGGGAGGCAGAGGTTGCAGTGAGTTGAGATAGCACCACTGCACTCCAGCCTGGGTGACAGAGCCAGACTCTGTCTCAA\n>URS000131FCF1 rRNA from 1 species \nATTGAACGCTGGCGGCATGCCTTACACATGCAAGTCGAACGGTATCAGGTCTTCGGATGCTGACGAGTGGCGAACGGGTGAGTAATACATCGGAACGTGCCTAGTAGTGGGGGATAACTACTCGAAAGAGTGGCTAATACCGCATGAGATCTACGGATGAAAGCAGGGGATCGCAAGACCTTGTGCTACTAGAGCGGCCGATGGCAGATTAGGTAGTTGGTGGGATAAAAGCTTACCAAGCCGACGATCTGTAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGGGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGCAAGCCTGATCCAGTAATGCCGCGTGCAGGATGAAGGCCTTCGGGTTGTAAACTGCTTTTGTACGGAACGAAAAGCCCTGGGTTAATACCCTGGGGTCATGACGGTACCGTAAGAATAAGCACCGGCTAACTACGTGCCAGCCGCCGCAGTAATAC\n>URS00013B03C6 rRNA from 1 species \nTACGAAGGGTGCAAGCGTTACTCGGAATTACTGGGCGTAAAGCGTGCGTAGGTGGTTGTTAAGTCTGATGTGAAGCCCTGGCTCAACCTGGGAACTGCAGTGGATACTGAGAAGCTAGAGTGTGTCAGAGGATGGTGGAATTCCGGTGTAGCGGTGAAATGCGTAGAGATCGGGAGGAACACCAGTGGCGAAGGCGATCACCTGGGATGTTCTGACGCTGAGGAGCGAAAGCTAGGGAGCAACGGGG\n>URS000157F4D5 rRNA from 1 species 
\nAGTGAACGCTGGCGGTAGGCCTAACACATGCAAGTCGAACGAGTGGCGGACGGGTGCGGAATACATCGGAATCTACTCTGTCGAGGGGGATAACGTAGGGAAACTTACGCTAATCCCGCATAAGATTGTATGAGCCGATGTCGGATTAGCTAGTTGGTGGGGTAAAGGCGCACCAAGGCGACGCTCCGTAGCTGGTCTGAGAGGATGATCAGCCACACTGTAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAAGGGGCGCAAGCCTGATCCAGCCATGCCGCGTGGGTGAAGAAGGCCTTCGGGTTGTAAAGCCCTTTTGTTGGGAAGGCGGTACCCAAAGAAGAAGCACCGGCGAACTTCGTGCCAGCAGCCGCGGTAATAC\n>URS00000C806B tRNA from 1 species \nTTTTAAGTAGTTTATGGATAAAATATTAAGTTGTGGTCTTAGAGAAAAAGATTGCTTTCTTAAATG\n>URS00008F77FE rRNA from 1 species \nTACGGAGGGTGCGAGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGCGTAGGTGGCTTGGTAAGCGTGTGGTGAAAGCTCGGGGCTCAACCCCGAGTCGGCCATGCGAACTGCCGAGCTTGAGCACTGTAGAGGCAGACGGAATTCCGGGTGTAGCGGTGGAATGCGTAGAGATCCGGAAGAACACCAGTGGCGAAGGCGGTCTGCTGGGCAGTTGCTGACACTGAGGCGCGACAGCGTGGGGAGCAAACAGG\n>URS000080C6B8 rRNA from 1 species \nTACGGAGGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGTTTTCCAAGTCAGAGGTGAAAGCCCGGGGCTCAACTCCGGAATTGCCTTTGAAACTGGGAAACTTGAACACGGGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAGGAACACCAGTGGCGAAGGCGGCTCACTGGACCGTTGTTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGG\n>URS000134990F rRNA from 1 species \nATTGAACGCTGGCGGCATGCCTACCACATGCAAGTCGAACGCGTGGCGGACGGGTGAGTCATGTCTGGGAAACTGCCCGATGGAGGGGGATAACTACTGGAACCGGTAGCTACTACCGCATACCATCGGATGTGCCCCGATGGGATTAGCTAGTAGGTGGGGTAACGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAAGGGGCGAAAGGCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGAGGAGGCGTTACTCGAAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATTC\n>URS0000B4737C rRNA from 1 species \nTTGCCTACGGGGGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAGCGATGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGAAGAAAATGACGGTACCTGACTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGACGGTCCTGCAAGCAAGATGTGAAAGCCCGGGGCTCAACCCGGGGACTGCATTTGGATCT\n>URS00000D2088 rRNA from 1 species 
\nAACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGGCGAGAGCCTGAACCAGCCAAGTAGCGTGCAGGATGACGGCCCTATGGGTTGTAAACTGCTTTTATGCGGGAATAACGTTCACTACGTGTAGTGTTTTGCATGTACCGCATGAATAAGGATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATCCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGAGCGTAGGCGGAGGATCAAGTCAGCTGTGAAATGTAGACGCTCAACGTGTGCACTGCAGTTGAAACTGGTTCCCTTGAGTGCGTAAGAGGCAGGCGGAATTCGTCGTGTAGCGGTGAAATGCTTAGATATGACGAAGAACTCCGATCGCGAAGGCAGCTTGCCGGGCCGCAACTGACGCTGAAGCTCGAAGGTGCGGGTATCGAACAGGATTAGATACCCTGGTAGTCCGCACAGTAAACGATGGATACTCGCTGTCGGCGATATACGGTCGGTGGCCAAGCGAAAGCGTTAAGTATCCCACCTGGGGAGTACGCCGGCAACGGTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGAGGAACATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCCGGGCTTGAATTGCTAACGACGGTTACTGGAGACAGTTTCCTTCCTTCGGGACGTTAGTGAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTAAGGTGTCGGCTCAAGTGCCATAACGAGCGCAACCCTTGCCGTTAGTTGCCATCAGGTCATGCTGGGCACTCTATCGGGACTGCCATCGTAAGATGTGAGGAAGGTGGGGATGACGTCAAATCAGCACGGCCCTTATGTCCGGGGCTACACACGTGTTACAATGGGGGGTACAGAGGGAAGCCACCTGGCGACAGGGCGCGGATCCCGAAATCCCTTCTCAGTTCGGATCGGAGTCTGGAACCCGACTCCGTGAAGCTGGATTCGCTAGTAATCGCGCATCAGCCATGGCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCAAGCCATGAAAGCCGGGGGCGCCTGAAGTCCGTAACCGCGAGGATCGGCCTAGGGCGAACCTGGTAATTGGGGCTAAGTCGTAACAAGGTAGCCGTACCGGAAGGTGCGGCTGGAACAACTCCTTT\n>URS00016E4775 rRNA from 1 species \nTACGTAGGGTGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTTCGTCGCGTCGGCTGTGAAATCCCGAGGCTCAACTCCGGGCCTGCAGTCGATACGGGCAGACTGGAGTTCGGCAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGGTCTCTGGGGCCGATACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS0002360704 lncRNA from 1 species \nTTTTTTTTACTTTTTTCTGTATTTCTTTTTTCTTTTTGTTTCTTCACTCGTTTTCTTCTGTTTTTTATATTCTTTGTTTTTTCACTGGGTTTCTTCATCTTTTTGTTGGGTTTTATTGTTTTTCTTTTATTTGCTTTTGCACGATTTTCTGTGTTTCTTTCTCGATTTCATTTTTTTTCCTGTTTTCTTTAGTTTGTTTTTATTTTATTTGTGTGGTTTCATTTGTTT\n>URS00018D31DC rRNA from 1 species 
\nTGCCAGCAGCCGCGGTAATACGAAGGGACCTAGCGTAGTTCGGAATCATTGGGCGTAAAGAGAATGTAGGCGGAATTATAAGTCTGGTGTGAAATCCCACAGCTCAACTGTGGAACTGCATCGGATACTGTTTTTCTTGAATTGTAGAGGGGGTCGCGGAATTTCTGGTGTAGAGGTGAAATTTGTAGATATCAGAAAGAACACCGGTGGCGAAGGCGGCGACCTGGCTATTAATTGACGCTGAGATTCGAAAGCGTGGGTAGCGAACAGGATTAGATA\n>URS0000E7B100 lncRNA from 1 species \nACATAAGCAGTAGGTGTCTGAAGGCTGGATTTTCAATACAGGCATAAAAGATAGTATTTAAATAAAACAGAAAGCAGAATTTGAATTGTCTTGGCTCAGGTTGGGACATCCACTGAATCTGATGTTCCTGGTACTGAAGACCCTTGGACCCACCTAGCACGGCTGTAGACTTTGCGGTCTGGCATACACTGGGATATCTGTGGACAGAACTCCCCTGCATGGTGAAGCTTTTTTGTTGGCTGCACAGGAGAGTGACTGTACAGTTGGCTCTAGTGTGGCTGCACACTAGACTGTCTCTCGAAAGGAGCTGAGCTTCATTCCTATCCCTAGGAAAACTTCAGCTAAAGTTAACTTGGTTGGATGCCATGTCTGCTTCCTTTCATTTCAAAGTAGGAAAAGTCAGAATGAGAACACTAGTTCTTCACTTCAGTTCTGCTGTCATGAGGATCGAGTACCTGTAGAGCTCTATCATAGGGCTACAGGTAACACTCTTGTATAAACTGGAGCAAAAATGTTTGCCACAGTCCAGACCCTGAAATAAAATGGACATTTAGCAAAAGATGACCATTTTCAAGGTTACATCCGGAGTGGGAAGAAAACACCACAGATTTTGCATCTTTGTGGCGTATCTTGAAGATGTTCCAGCAAAGTCATCAGTTTGGACTGTGCCCAACAGATTTGTACAAGGGGAAAGAATAAGAGGAAAGAAAATGAACTCCTTATTCTATCCCACTCCACCAAAATGCAATCACATCCATGGATTTTGTCAGAGG\n>URS0001BF4730 lncRNA from 10 species \nctggtccctaagcccttccagcccaggagccagacctgtgagcaaacaagcctttagtgattccaggctctggctggaaccttgagtcttctcagctTGGGGCATGCACCTCAGGGGGAGCCAGCATCAGTGTCCAGCCCCAAGAGCTTCCCTGTACGTCTCAGTGAGTCTTCACATGCCTCCAACTGCCTGGACAACCACACGTGATACCTGTCCTGCCAAACGTGtcctgaacccataaaatccagagaaaagaaaatcgttttaaactgctgaggtttggggtctttcctgtgctgttttcgtgatagtgaatgagtgtcacgagatccgatggttttaaaaacgggagtttcctgcataagctctctctctgcctgctgccatccatgtaagatgtgactcgctcctccctaccttccgccgtgattgtgaggcgtccccagccatgtggaactgtaagtccattaaaccttcttcctgtgtaaatta\n>URS0000115D96 rRNA from 1 species 
\nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAATGGATTAAGAGCTTGCTCTTATGAAGTTAGCGGCGGACGGGTGAGTAACACGTGGGTAACCTGCCCATAAGACTGGGATAACTCCGGGAAACCGGGGCTAATACCGGATAATATTTTGAACCGCATGGTTCGAAATTGAAAGGCGGCTTCGGCTGTCACTTATGGATGGACCCGCGTCGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGCTTTCGGGTCGTAAAACTCTGTTGTTAGGGAAGAACAAGTGCTAGTTGAATAAGCTGGCACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGC\n>URS00009CA41E rRNA from 1 species \nGGCGGACGGGTGAGTAATGCTTAGGAATCTGCCTATTAGTGGGGGACAACATTCCGAAAGGAATGCTAATACCGCATACGTCCTACGGGAGAAAGCAGGGGATCTTCGGACCTTGCGCTAATAGATGAGCCTAAGTCGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCTGTAGCGGGTCTGAGAGGATGATCCGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGGAACCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTATGGTTGTAAAGCACTTTAAGCGAGGAGGAGGCTACTGAGACTAATACTCTTGGATAGTGGACGTTACTCGCAGAATAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGGTGCGAGCGTTAATCGGATTTACTGGGCGTAAAGCGTGCGTAGGCGGCTTTTTAAGTCGGATGTGAAATCCCCGAGCTTAACTTGGGAATTGCATTCGATACTGGGAAGCTAGAGTATGGGAGAGGATGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGATGGCGAAGGCAGCCATCTGGCCTAATACTGACGCTGAGGTACGAAAGCATGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGATGTCTACTAGCCGTTGGGGCCTTTGAGGCTTTAGTGGCGCAGCTAACGCGATAAGTAGACCGCCTGGGGAGTACGGTCGCAAGACTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGT\n>URS0000EF3AE3 lncRNA from 1 species \nCCCTGATGGTGCAGAGACTGTCACGTAAACTGCCTCAGCTTTCTGGGGACTGTTCTGGAGTGCTCACCTACACTAGGCTTGGGGACCATGTTGGTGCCATTTCCCCAGACTGGGTACTGACCTCTTCACAGTTCCCGTGGCGCCTGAAGGACTGGAGAGTTTATGTTCCCATGTCTCCTCTGGGTGTTGGCCAGAGCTGTGATCACCATGACGGGAATCCTCCTTATTTGCTCCTTAAGCAAATAATCCTTGTGTTTTTGATTATGCCCTTAATCTTTGTCCTGAACTGCTGATCTTCAGAGGGACCCAGGAGAAGATGAGTCCAC\n>URS000081BA44 rRNA from 1 species 
\nATTGAACGCTGGAGGCATGCTTAACACATGCAAGTCGAACGGCAGCATGATGTGTAGCAATACACATTGATGGCGAGTGGCGGACGGGTGAGTAACGCGTAGGAATCTGCCTTGAAGAGGGGGACAACCCGAGGAAACTCGGGCTAATACCGCATAATATCGAGAGATTAAAGTCTGGGTGGTAACACCTGGAGCTTCAAGAGGAGCCTGCGTCCGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGATGATCGGTAACTGGTCTGAGAGGATGACCAGTCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGGACAATGGGGCCAACCCTGATCCAGCGATGCCGCGTGTGTGAAGAAGGCCTC\n>URS0000CE0126 antisense_RNA from 1 species \nTCCTTCCCTTCCGGAGCCCGGGGTAGGCGAGAAGCAGGCAAGGGCGCGGAGGATGGAATCTCGCTCTGTCTCCCAGGCTGAAGTGCAATGACGCAATCTCGGCTCAATGCAGCCTCCGCCTCCCAGGTTTAAGCGATTATCCCGCCTCAGTCTCACAAGTAGCTGGGATTACAGGTGCCCACCACCACGCCCAGAAGTGCATTTCGCCTCCCGCCATGATTCTGAGGCCTCCCCAGCCCTGTGAAACCGTAAGTCCAATTAAACCTCTTTTTCTTCCCAGTCTCAGGTATGTCTTTATCAGCATCATGAAAACGGACTAATACACTATTCTTAATTGATATGCCAACACAAATATAGAGACACATAGCAACATATATACACAAAATGCAAACAAAATTACTTGCAGCTTTAAGTAGATCTAAGTATACTTTTCCTTCTTCAGTGGGAACAAAGGTGTTGTAATTG\n>URS00006C0526 Y_RNA from 2 species \nAGCTGGTTCGAAGATAGTGTTATCTCAATTAACTGTTCACAGTCAGTTACAGATCAAACTCCTTGTTCTACTCTTTCCCCCTTTCTCACTACTGCGCTTGACTAGTCTAGA\n>URS00015EBCF0 rRNA from 1 species \nTACGTAGGGTGCGAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCACGTAGGCGGATTGCTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGGCGATCTTGAGTCCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGGTACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS00016A2BA6 rRNA from 1 species \nCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGGAACCCTGATCCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGAAGAAAATGATGGTACCTGACTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGTTGGCAAGCGTTGTCCGGATTTACTGGGTGTAAAGGGCGTGCAGCCGGGAAGACAAGTCAGATGTGAAATACCGCGGCTCAACCGCGGAACTGCATTTGAAACTGTTTTTCTTGAGTATCGGAGAGGTAATCGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAAGAACACCAGTGGCGAAGGCGGAGTACTGGACGACAACTGACGGTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTC\n>URS000112369F rRNA from 1 species 
\nTACGGGGGGAGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGCAAGGCAAGTCAGGTGTGAAAGCCCCGAGCTTAACTCGGGAATTGCATCTGAAACTGCTGTGCTTGAGTTCTGGAGGGGGTAGTGGAATTCCCAGTGTAGCGGTGAAATGCGTAGATATTGGGAGGAACACCTGCGGCGAAGGCGGCTACCTGGACAGAAACTGACGCTGAGGCGCGAAAAGCTAGGGGGAGCGAACGGGG\n>URS00022A0584 misc_RNA from 1 species \nGAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCGCCAGTATTCTGGCGGGCATGTCTGTCCGAGCGTCATTTCAACCATCAAGCCCCCGGGCTTGTGTTGGGGACCTGCGGCTGCCCGCAGGCCCTGAAAACCAGTGGCGGGCTCGCTGTCACACCGAGCGTAGTAGCAATCACCTCGCTCAGGGCGTGCTGCGGGTTCCGGCCGTTAAACAGCCTTACAAAACCCCAGGTTGACCTCGGATCAGGTAGGAAGACCCGCTGAACTTAAGC\n>URS0000E790F2 lncRNA from 1 species \nATGCAAACTTTGCCCGAATTTTGCTACTTAAAATGCCTTAGCGATAAAGTAAATGTTACTAAAATTATTAACCGAAATATAACAAAACTAAAGCTAGATGGATTTATCGAATTGGATCGTGAGATAGAGGATTTTACGAAATTAAGAAATTCAATTGTTAATGAACAATATAAAGGGTTGACAGAAAAATTATTTCAAGCACACAAAGAATATTTATTTTATTTTGATACTTTTTTAAAAAAAAAACTATTAAAAGATGAAAATAAAGTATTATATACTAATGATTGTTTTGATAGAACAAAAAAGGTTGAATACAATTTTGAAAACGAAATAGTTATTGTTATATATAATATAGGTTTTATTACTACAGCTATATTAAAATCTAAAAAAAAAGACAAGGATGTAAAATTATTAAATAAATTGTCACAAGAAGCAATAAATATTTTTAATTACTTATTCCAAAGTATTATTAATGAAACTTACAATGACTTAAGTGACATAAATTGTTTAAGTTGTTATGTATTTTTAAATTTATCATTAGCTTATCATGAACATTTATTTTATAATACAGCTTTGGCAAAAAAATATAAAAGAAATTTATTAGCAAAAATATCATATAATATATATAGTTATTTTAATAATATGTTAAATTGTTTAGATGGTAAAAAATTAGATGTATTTACAAAAATGGATGCATTTGTTAATGCAAAAAATAATCTTATATTAACTCTTCGAAATAGTAATAGTCTTCTTTATAACTTTATATATGTAAATAAATTAATTTTTTTAAGTATTACCAATTATCAAACAACTTTAAAATACTGTCAATTAAACCCAAATAGTGAAGAAGTAGTAATACAAAAATATGAAGAAGAAAAAATAGGAGAAATTATATCTAGATTACAATTTAGTACAGAAAATATAAAGAAAGCAGAAGATTTAAGTAAAAAATATAATTTACATATTAATGCTGAAATGTTGAAACAAAAAATAAACAATGCTTTAGTTTTTTTTGAAAAAGATAATAAAAATATATATTTTGAGTCAATACCAGAATATAGTACCTTAGACAGTTTAAAAGGAACAGAAATTGTAAAAATACCAGATCCTAATATATCAACTATTTATTTGAAAAAAGAAATCAGTAATAATTTAAAATTATTATTTAATGAAAAAGCAAAAAATATATTTGACGAATATAATACAGAGGCTTGTAAAGTACATGATTTATATGAAAAACATCTTAGCAGTTTAAAAGATCAATATAAATTAATTAATTTATCTTATCGAAAAAATATATTTACAATTCTTAATAATGTACTTTTAAATATATATAATACATTAAAACAATC
ATATAATCCTACTATATATGATAAAAATTTACATTTTTTAATGGATGTTGAAAAAAATTTAAATTTAACACTAAACCAAATCGAAACAAGTTTAAACACAGAAAATTCTAATCACTTGAATTTCCAAAAAATGTATACCAATATAGGCGTTAACCAAGACTCGTTAAATTCTTATAAAAAATATGTTTACCATTTAAATAACTTTAAAAAAATATTAACCGAAATAACAACTAATATAGTTGAATTTAAAAGTTTTCTTGAAAATAATTATTATTATTTACAACTATGTGAAATGAATGTTTCTAATTTTTTTAAACATATGATAGACGAACTTAACTCCAATTCAAATACATGTGTTGAATCCTTTGATAGCGATTATACATTTTATAAGAACTTATTATCAGAAGAAAAAGAAAAAGAAAACGAAGAAGAAACAAAAGAAGAAACAAAAAAAATGAAAAATAATACATCATCAACAACAACAGCAGCAGAAGCAACAACAACAGCAGCAGCAACAACATATATGAACGAACAAAAAGTAATACTACCAGCTTCACCACCACCATCACTTACCAATAATATTCCTAAATTAACATATTCTAACTTTCACAAATTTTTAAAAAAAAACAATATATCAGTTACTGCGTCAAGTAGTATTAATAATAGTAGTAATATAAAATATTTTGAAATTTTAAAAAATTATATAAATATACATTCAGAAGAAAAATTATATTTTACAATAAATGCTATTTACTTTTCTATGAATATCCAATTAGAACAATTTTCAAACGACCTTGCAGAGATTAAAGGATATATGCAAAATTCATTTTTAAATTTAATAACGGTAATGATATAA\n>URS0001C1D8E2 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGATAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGACGCAGCAACGCCGCGTGCGGGATGACGGCCTTCGGGTTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTG\n>URS000183E284 rRNA from 1 species \nTACGAAGGGAGCTAGCGTTGTTCGGAATCACTGGGCGTAAAGCGCACGTAGGCGGATTTGTTAGTCAGGGGTGAAATCCCGGGGCTCAACCTCGGAACTGCCTTTGATACTGCAAATCTCGAGTCCGGAAGAGGTGGGTGGAATTCCTAGTGTAGAGGTGAAATTCGTAGATATCAGGAGGAACACCGGTGGCGAAAGCGGCTTCCTGGCCCGACACTGACGCTCATGTACGAAAGCGTGGGGAGCGAACAGG\n>URS0000164332 rRNA from 1 species 
\nCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCAATACCGCGTGTGTGAAGAAGGCCTGAGGGTTGTAAAGCACTTTCAATGGGAAGGAATACCTACCGGCCAATACCCGGTAGACTGACATTACCCATACAAGAAGCGCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAGGCGTGCGTAGGCGGCTTGTTCAGTCAGATGTGACAGCCCCGGGCTTAACCTGGGAACTGCATTTGATACTGGCAGGCTAGAGTTTAGTAGAGGGGAGTGGAATTTCAGGTGTAGCGGTGAAATGCGTAGAGATCTGAAGGAACACCAGTGGCGAAGGCGGCTCCCTGGACTAAAACTGACGCTGAGGTACGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCAACTAACTGTTGGGTTCTTAAAGAACTTAGTAGTGGAGCTAACGTATTAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACCCTTGACATGTAGTGAACTTTCCAGAGATGGATGGGTGCCTTCGGGAACACTAACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTATCCTTAGTTGCCAGCGGGTAATGCCGGGAACTCTAGGGAGACTGCCGGTGATAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTATGGGTAGGGCTACACACGTGCTACAATGGTCGGTACAGAGGGCAGCAAACTCGCGAGAGCCAGCAAATCCCAAAAAGCCGATCCTAGTCCGGATTGCAGTCTGCAACTCGACTGCATGAAGTCGGAATCGCTAGTAATCGCGGATCAGAATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGT\n>URS00013EF64C rRNA from 1 species \nGACAGAGGATGCAAGCGTTATCCGGAATGATTGGGCGTAAAGCGTCTGTAGGTGGCTTTTTAAGACCGCCGTCAAATCCCAGGGCTCAACCCTGGACAGGCGGTGGAAACTACCAAGCTGGAGTACGGTAGGGGCAGAGGGAATTTCCGGTGGAGCGGTGAAATGCGTAGAGATCGGAAAGAACACCAACGGCGAAAGCACTCTGCTGGGCCGACACTGACACTGAGAGACGAAAGCTAGGGGAGCGAATGGG\n>URS00016C3B12 rRNA from 1 species \nTACGAAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGGGTGCGTAGGCGGTTCGGTAAGTCGGATGTGAAAACTCAGGGCTCAACCCGGAGACGCCATCCGATACTGCTGTGACTTGAGTCTGGTAGGGGAACACGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATGGCAAAGGCAGTGTTCTGGGCCAGTACTGACGCTGAGGAGCGAAAGCGTGGGGAGCAAACAGG\n>URS0000F147F0 rRNA from 1 species \nTACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTTTGTAAGCCAGATGTGAAATCCCCGGGCTCAACCTGGGAATGGCATTTGGGACTGCAAGGCTGGAGTACGGCAGAGGAGACTGGAATTCCTGGTGTAGCAGTGAAATGCGTAGAGATGTGGAGGAACACCGATGGCGAAGGCAGCCTCCTGGGCCAGCACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGG\n>URS0000104AE7 rRNA from 1 species 
\nGAGCTCGTAGGCGGTTTGTCGCGTCTGCCGTGAAAGTCCGAGGCTCAACCTCGGATCTGCGGTGGGTACGGGCAGACTAGAGTGATGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCAGGTCTCTGGGCATTTACTGACGCTGAGGAGCGAAAGCATGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGTTGGGCACTAGGTGTGGGGGACATTCCACGTTTTCCGCGCCGTAGCTAACGCATTAAGTGCCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGCGGAGCATGCGGATTAATTCGATGCAACGCGAAGAACCTTACCAAGGCTTGACATGTTCCAGACCGCCTCAGAGATGGGGTTTCCCTTCGGGGCTGGTTCACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGTTCCATGTTGCCAGCGGGTTATGCCGGGGACTCATGGGAGACTGCCGGGGTCAACTCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGTCTTGGGCTTCACGCATGCTACAATGGCCGGTACAATGGGTTGCGATACTGTGAGGTGGAGCTAATCCCTAAAAGCCGGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCCCATGAA\n>URS0000D394E6 rRNA from 1 species \nCACGCAGGCGGTTTGTTAAGTCAGATGTGAAATCCCCGAGCTTAACTTGGGAACTGCATTTGAAACTGGCAAGCTAGAGTCTTGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGTCGACTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAGTCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAAGAAAATTTGACGGA\n>URS0002160948 rRNA from 1 species 
\nTGCTGGAGGTATCAGAAGTGCGAATGCTGACATAAGTAACGATAAAGCGGGTGAAAAGCCCGCTCGCCGGAAGACCAAGGGTTCCTGTCCAACGTTAATCGGGGCAGGGTGAGTCGACCCCTAAGGCGAGGCCGAAAGGCGTAGTCGATGGGAAACAGGTTAATATTCCTGTACTTGGTGTTACTGCGAAGGGGGGACGGAGAAGGCTATGTTAGCCGGGCGACGGTTGTCCCGGTTTAAGCATGTAGGCTGATTGTCCAGGCAAATCCGGATAATCAAGGCTGAGGTGTGATGACGAGGCACTACGGTGCTGAAGTAACAAATGCCCTGCTTCCAGGAAAAGCCTCTAAGCATCAGGTAACATCAAATCGTACCCCAAACCGACACAGGTGGTCAGGTAGAGAATACCAAGGCGCTTGAGAGAACTCGGGTGAAGGAACTAGGCAAAATGGTGCCGTAACTTCGGGAGAAGGCACGCTGGTGTGTAGGTGAAGTCCCTGCGGATGGAGCTGAGACCAGTCGAAGATACCAGCTGGCTGCAACTGTTTATTAAAAACACAGCACTGTGCAAACACGAAAGTGGACGTATACGGTGTGACGCCTGCCCGGTGCCGGAAGGTTAATTGATGGGGTTATCCGTAAGGAGAAGCTCTTGATCGAAGCCCCGGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGCGTAATGATGGCCAGGCTGTCTCCACCCGAGACTCAGTGAAATTGAACTCGCTGTGAAGATGCAGTGTACCCGCGGCAAGACGGAAAGACCCCGTGAACCTTTACTATAGCTTGACACTGAACATTGAGCCTTGATGTGTAGGATAGGTGGGAGGCTTTGAAGCGTGGACGCCAGTCTGCGTGGAGCCAACCTTGAAATACCACCCTTTAATGTTTGATGTTCTAACGTTGGCCCCTGACCGGGGTTGCGGACAGTGTCTGGTGGGTAGTTTGACTGGGGCGGTCTCCTCCCAAAGCGTAACGGAGGAGCACGAAGGTTAGCTAATCCTGGTCGGACATCAGGAGGTTAGTGCAATGGCATAAGCTAGCTTGACTGCGAGCGTGACGGCGCGAGCAGGTGCGAAAGCAGGTCATAGTGATCCGGTGGTTCTGAATGGAAGGGCCATCGCTCAACGGATAAAAGGTACTCCGGGGATAACAGGCTGATACCGCCCAAGAGTTCATATCGACGGCGGTGTTTGGCACCTCGATGTCGGCTCATCACATCCTGGGGCTGAAGTAGGTCCCAAGGGT\n>URS00025841D4 rRNA from 1 species \nGCGCAGATGACTCGCTACTGAATCAACTAAAACATAAAACAAAATATTTAGTTGATAATGTAAGAAGAAAATAATGATATTATCTTATGTTTAGTGTCGTCTAAAACTGGTGCCAGAAGACTCGGTAAGGCCGGAGACGCAAACGTTAGTCATCCTTATCAGGCGTAAAGGGTTTGTAGGCTGCTTTGAAAGTTTCTATCTTTTAAATTAATTAAAAAATGGGGCGAAGCTCGGTTATAACTAATTATCTTTAAAATATAATAAAATAGAAATAAATTAAAGCTAGAATCTAATAGAGGTTATATTGAATAATACTTAGTTTAGGTCTAATATCCTAATAGATTAAGGGGAATATTAAAAGCGAAGGCTTCTCTCCACTATAGATTGACGCTGAGAAACGAAGGTGAGGAAAGGAAATAGGATTAGATACCCAAACTACCCCTCACTGTCAACGATGAATGGTAGTCATTAGTGCATATTAGTGACGTAGTTAACACAATTACCATTCCGCCTTGTTAGTAAGACTGCAAAGTTAAAAACAAAAAAATTAGTCGGTTTCGGAGTAAACGAAGTGAAGCATGTTATTTAATTCATTAAATCCGCAAA\n>URS0001424B59 rRNA from 1 
species \nCTACGGGCCGCAGCAGTGGGGAATATTGGACAATGGGGGAAACCCTGATCCAGCAATGCCGCGTGTGTGAAGAAGGCCTGCGGGTTGTAAAGCACTTTCGGTTGGGAGGACTGCTTCTAGCACTAATATTGTTGGAAGTTGACGTTACCTTCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGCTAGATCAGTCGGGTGTGAAGGCCCCGGGCTTAACCTGGGAACTGCATCCGATACTGTCTAGCTAGAGTACAGGAGAGGAGAGTGGAATTCCACATGTAGCGGTGAAATGCGTAGATATGTGGAGGAACACCAATGGCGAAGGCAGCTCTCTGGCCTGATACTGACGCTGAGGTGCGAAAGCGTGGGGAACAAACAGGATTAGATACCCCTGTAGTC\n>URS0000AE892D rRNA from 1 species \nTCGAGAATCATTCACAATGGGGGCAACCCTGATGGTGCAACGCCGCGTGGAGGATGAAGGTCTTCGGATTGTAAACTCCTGTCATCTAGGAGCAAGACCTGGCGCTGAATCGTCGACAGGGTTGATAGTACTAGAAGAGGAAGGGACGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGTACCGAGCGTTATTCGGAATCACTGGGCGTAACGGGAGCGTCGGCGGCGTGGGCAGCAAGATGTG\n>URS0000ECDF55 rRNA from 1 species \nTAGATACCCTGGTAGTCCACGCCGTAAATGGTGAGTGCTAGGTGTCGGGAGTCAAATCTCGGTGCCGACGTTAACACATTAAGCACTCCGCCTGGGGAGTACGCACGCAAGTGTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCAGCGGAGCATGTGGTTTAATTCGATGCAACGCGAAAAACCTTACCAGGACTTGACATATGGATGCCCGGTATAGAGATATACCCTTCTTCGGAACATTCAT\n>URS000188AE03 rRNA from 1 species \nACTACGGGTGGCTGCAGTGGGGAATATTGGGCAATGGGCGCAAGCCTGACCCAGCAACGCCGCGTGAAGGAAGAAGGCTTTCGGGTTGTAAACTTCTTTTCTCAGGGACGAAGAAAGTGACGGTACCTGAGGAATAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGATTTATTGGGTGTAAAGGGCGTGTAGGCGGGAGCGCAAGTCAGATGTGAAAACTCAGGGCTCAACCCTGAGCCTGCATTTGAAACTGTGTTTCTTGAGTGCTGGAGAGGCAATCGGAATTCCGTGTGTAGCGGTGAAATGCGTAGATATACGGAGGAACACCAGTGGCGAAGGCGGATTGCTGGACAGTAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCGTGTAGTC\n>URS000107BACB rRNA from 1 species 
\nTGGGGAATTTTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGCGGGAAGAAGGCCTTCGGGTTGTAAACCGCTTTTGTCAGGGAAGAAATCTTCTGAGTTAATACCTCGGGAGGATGACGGTACCTGAAGAATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTTTGTAAGACAGAGGTGAAATCCCCGGGCTCAACCTGGGAACTGCCTTTGTGACTGCAAGGCTTGAGTGCGGCAGAGGGGGATGGAATTCCGCGTGTAGCAGTGAAATGCGTAGATATGCGGAGGAACACCGATGGCGAAGGCAATCCCCTGGGCCTGCACTGACGCTCATGCACGAAAGCGTGGGGAGCAAAACCAGGATTAGATAGCCCCTGGGTAGTCCACGCCCTAAAACGATGTCAACTGGTTGTTGGGAAGGTTCCTTCTCAGTAACGTAGCTAACGCGTGAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGTTGAAAC\n>URS00003DBB63 rRNA from 1 species \nAGGGAATCTTCCACAATGGACGCAAGTCTGATGGAGCAACGCCGCGTGAGTGAAGAAGGGTTTCGGCTCGTAAAGCTCTGTTGGTAGTGAAGAAAGATAGAGGTAGTGACTGGCCTTTATTTGACGGTAATTACTTAGAAAGTCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTTGGCGTAAAGCGCGCGCAGGCGGATTGGTCAGTCTGTCTTAAAAGTTCGGGGCTTAACCCCGTGATGGGATGGAAACTGCCAATCTAGAGTATCGGAGAGGAAAGTGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAAGAACACCAGTGGCGAAGGCGACTTTCTGGACGAAAACTGACGCTGAGGCGCGAAAGCCAGGGGAGCGAACGGGATTAGATACCCCGGTAGTCCTGGCCGTAAACGATGGGTACTAGGTGTAGGAGGTATCGACCCCTTCTGTGCCGGAGTTAACGCAATAAGTACCCCGCCTGGGGAGTACGACCGCAAGGTTG\n>URS0002247035 tRNA from 1 species \nGCACCGGTCGTATAGTGGCTAGGTATTTAGTACCACACAAATTATCTCGGCCTTCCAAGCCGATAACCCGGGTTCGAATCCCGGCCGGTGCA\n>URS0000B6A44E rRNA from 1 species \nGTGTCAGCAGCCGCGGTAATACGTAGGCAGCGAGCGTTGTTCGGAGTTACTGGGCGTAAAGCGTGCGTAGGCGGCAGTCCAAGTCTGGTGTGAAATCTCCCGGCTCAACCGGGAGGGTGCGCCGGAAACTGGGCTGCTGGAGTGCGGGAGAGGTAAGCGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGGGAGGAACACCTGCGGTGTAGACGGCTTACTGGACCGCCACTGACGCTGAGGCACGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCC\n>URS00008315DC rRNA from 1 species 
\nGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCAACGCCGCGTGAGGGAAGACGGTTTTCGGATTGTAAACCTCTGTCTTTGGTGAAGAAAAAAATGACGGTAGCCAAGGAGGAAGCTCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGAGCGAGCGTTGTCCGGAATTACTGGGTGTAAAGGGAGCGCAGGCGGGAAGACAAGTCAGCTGTGAAATACATGGGCTCAACCCATGGACTGCAGTTGAAACTGTTTTTCTTGAGTGGAGTAGAGGTAGGCGGAATTCCGAGTGTAGCGGTGAAATGCGTAGATATTCGGAGGAACACCAGTGGCGAAGGCGGCCTACTGGGCTCTAACTGACGCTGAGGCTCGAAAGTGTGGGGAGCAAACAGGATTAGAAACCCTAGTAGTCC\n>URS00014517AB rRNA from 1 species \nTACGTAGGGGGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGTTGGGTAAGTCGGGTGTGAAAACTCAGGGCTCAACTCTGAGACGCCACTCGATACTGCTCTGACTCGAGTCCGGTAGGGGAGCGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAGTGGCGAAGGCGGCGCTCTGGGCCGGAACGGACGCTGAGGAGCGAAAGCGTGGGTAGCAAACAGG\n>URS00009B6ECF lncRNA from 8 species \nGATCATCTGAGGTCGGGAGTTTAGACCAGCCTGGCCAACATTGTGAAACCCCATCTCTACTAAAAATACAAAAATTAGCTGGGTGTGGTGGCGCACACTTGTAATCCCAGCTACTTGGGAGGCTGAGGCAGTAGAATCACTTGAACCTGGGAGGCGNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTGCACTCCAGCCTGGGCAACAGAGGGAGACTCCATCTCAAAAAGAGAAAATAATTATAAAAGTTGCTTTAAAATCCTTGCTGCTAATTCCCAAGATTAGAAATTCCAACATCTGAGTCATAACTTTTTCTCTTTGGGAGTGAGTTTTGAGTATGATTCCATTTTCTGTTTCTTCATATGCCTAGTACTTGTTTATTGTAGCTGGACATTGTCAAGACTATGGATTTTGTTATGTTCCTCTGAAGAGTGTTAATTTTGTTCTAACAGGCAATTAACCTGGTTGGACTGAAACTCCAATCTTTGTGAAAGGCAGTAGCTGGAATTCCTACTCTGTTCTTGCTCCCAGCTGCTGATTTTACTGGGACTCCTGGAGACTCCTGCGCATATGTGCAGTTGGACAACCAAGGATTTGGACAGAGTTTATATACAGATTTTGGGACTTGTTTGCTCTATAGAATTTCTTTCTGTGAGTTCCCTCTTAATTTTCCAGCCACACTTCTCGCCTAGAACTCTGTACTCGGCACCTCAAACCAGTAAGACCGTAGCTTTCTATGCATTTCCACCTCCCACACAAATTACAGAGTGCCCTCACACAAATAACCACAAAAATATAAGTCTAGTACAGGGCAGCTCCCACCTTTCAAGAGTTGATTTTCCTCACATTTCTAATTGCTGTTAGGTGTTCTTTAGTGCCTTCAAATATTTGGGTTTGGTTGTTGTTTATTTTATTCAGGTTTTTGGTTTTTTGTTTTGGTTTTGTTTTGAGATGGAGTTTTGCTCTTGTCGCCCAGGCTAGAGTGCAATGGCACGATCTGAGCTCACTGCAACCTCTGCCTCCCAGGTTCGAGTGATCCTCCTGCCTCAGCCTCCTGAGTAGCTGGGAATACAGGCATGCACCACCACGCCTGGGTAATTTTTGTATTTTTAATAGAGACAGGGGTTTCACCATGTTGACCAGGCTGGTCATGAATTCCTGACCTCAGGTGATCCACCTGCCTCGGTCTCTTAAAGTGCTGGGATTACAGGTGTGAGCCACTGTGC
CCAGCCAGGTTTTTTGTTGTTGTTGTTATTGTTTTGTTTTTAAGAGACAGGATCTTGCTTTGTTGCCCAGGCTGGAGCACAGTGGTATGATCATAGCAAACTGCAGCCTTGAACTCCTGAGCTCCAGCAATCCTCCTGCCTCAGCCTCCCAAGTAGCTGGGACTACCAGCGCATATCACCATGCCTAGTTAATTTTTTGAAAACTATTTTGATAGAGATGGAGTCTTGCTGTGTTGCCCAGGCTGGTCTTGAACTCATGGCCTCAAGCGATCCTCTCACCTAAGTCTCCAAAGGTGCTAAGATTACAGGCATGAGCCACTGTACCTGGCCTTGTTTCAGGTTTTTTTTTGTTTTTGTTTTTGTTTTTGNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNACTTCCTGGGTTCAAGTGATTCTCCTGCCTCAGCCACCCGAGCAGCTGGGATTACAGGTGTGCACCACAAGCCTGGCTAATTTTTTGTGTATTTTTAGTAGAGATGAGGTTTCGTCATGTTGGCCAGGCTGGTCTCAAACTCCTGACCTCAAATGATCTGTCTTCCTCAGCCTCCAAAAGTGCTGGAATTACAGGCGTGAACCACGGCACCTGGCCCTTGTTTCAGTTTTATAATTGCTATCTGAGGCATGATTATTCTGACCAAATTATTGTGCTATTAGGGAAACCATTTGTTTAAGTTCACATAGCTAGTTTGTGGAAGAGCCAAAATCTAAAACCAGTCAGATTACATAATCCTATGCTTGCTCCAGTTCACCACTATTCCTAAACACCTCAAGGTGGTTTGGATTCCAGCCTAGAGCCCTCTGGAAAGTATTTGGGGCTGGAAGGAGGAAAGAGCCCTCAAAACTCCTATTCAGGCTAGGGCAGTAGTTGCCCAGGCTGGAGTGCAGTGGAACAATCTTGGCTCACTGCAACCTCTGCCTGCCGGGATCAAGCAATTCTCCTGCCTCAGACTTCTGAGTAGCTGGGATTACAGGCGTACACCACCAAGCCCAGCTAATTTTTGCATTTTAATAAAATCACAAAGCCAGACTTAGATAGTTGAAAGTGCCCACCTCTGTTCCTGAGAGTTGGGCCTGAGACAGAGGATTCTAAGTGGAAACCACGCTCAACTAAGAGGACCCAAGAAAGGCAAGTTCTTTTTAAAAATTTTTTTTTCATTTTTTGTCTCTCTCTGTCACCCAGGCTGGAGTGCAATGGTGCAATCATGGCTCACTGCAGCTTTATCCTCCTGGGCTCAAGCCATCTTCCCACCTCAGCCTCCCAAGTAGCTGGGACTACAGGCACATGCCACCATGCCTGGCTAATTTTTATATTTGTTGTAGACAAGTTTTCACCATGTTGCCCAGGCTAAGTCAAACTTTTCTTTTTTTTCTATTTTTTATTTTTTTTAATTATTATTTTTTGAGATGCAGTCTCGCTCTGTCGCCCAGGCTGAAGTGCCATCTCTGCTCACTGCAAACTCCACTTCCTGGGTTCCTCAGCCTCCCGAGTAGCTGGGACTACAGGTGCCTGCCACCACGCCCAGCTAATTTTTTGTATTTTAATAGAGACGGGGTTTCACCGTGTTAGCCAGGATGGTTTCGATCTCCTGACCTCGTGATCCACCCGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCATGAGCCACTGCGCCTGGCTCAAATTAGATTTCTATATCCAGTAACAGTATCCTTCAAAAATGAAGACAAAACAGAGACATTGTCAAATAAACAAAAACTGAGTTT\n>URS00011F5567 rRNA from 1 species 
\nGATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGTGAACGAGGGAGCTTGCTCCCTCCGGATCAGTGGCGAACGGGTGAGTAACACGTGAGCAATCTGCCCTGGACTCTGGGATAAGCGTTGGAAACGACGTCTAATACCGGATACGAGACGCGAAGGCATCTGCAGCGTCTGGAAAGAACTTCGGTCCAGGATGAGCTCGCGGCATATCCGTGAGTTGGTGAGGTAACGGGTCACCAAGCCTACGACGGGTAGCCGGCCTGAGGGGGTGACCGGCCACGCTGCAGCAGAGATACGGCCCAGACTGCTACGGGAGGCATGAGTGGGGAAGGTTGCACAATGGGCGCAAGCCTGATGCAGCAACGCCGCGTAGGGGACGACGGCCTTCGGGTTGTACACCTCTTTTAGCAGGGGAGACGCGAAAGTGACGGTACCTGCAGAAAGAGCACCGGTTAACTACGTGCCAGCCGCCGCCGTAACAC\n>URS0000FFF241 rRNA from 1 species \nTACGAAGGGGGCTAGCGTTGCTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGCTTCTTAAGTCGGTGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTCGATACTGGGAAGCTCGAGTCCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGATACTGACGCTGAGGCACGAAAGCGTGGGGAGCAAACAGGG\n>URS0002017531 rRNA from 1 species \nAACGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGAGACCTTCGGGTCTAGTGGCGCACGGGCGCGTAACGCGTGGGAACCTGCCTTTAGGTTCGGAATAACTCAGAGAAATTTGAGCTGATACCGGATGATGTCTTCGGACCAAAGATTTATCGCCTTTAGATGGGCCCGCGTTGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCATAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCAATGCCGCGTGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTTACCCGAGATGATAATGACAGTATCGGGAGAATAAGCTCCGGCTAACTCCGTG\n>URS0000DCAE13 sRNA from 1 species \nGCAACCCGATGTCGGGGGCTTGGGCGGAAGCCCACGTTGCCCGACAAAAAACGTACCCCCGGCGCGGTCTGCGCCAAGGAATCGAAATGAAGCAACGTGAGCAGTCCGCCCCGTTCGCGGGAAGTGGACGGCAACACGGTCTTCCAATGTATACTAAACGACTCTCGGCAACGGATATCTCGGCTCTCGCATCGATGAAGAACGTAGCGAAATGCGATACTTGGTGTGAATTGCAGAATCCCGTGAACCATCGAGTTTTTGAACGCAAGTTGCGCCCGAAGCCATTAGGCCGAGGGCACGCCTGCCTGGGCGTCACGCGCTCCGTCGCCCCGCAACCCCGAACCCCGAAACGGGCCAGGGTACTTGTGGTGCGGAGATTGGTCTCCCGTGTGCCTTGCTCGCGGCTGGCCTAAAATTGAGTCCCGGGCGCTCTGTTCTGCGGCCGACGGTGGTTGAGAAGCCCTCGAAATTGTGCTGCTGCAGTGCTGCCCGATGCGGACCCTGTGACCCTTGCGCGACCTCTCCCCTTGGGGTGAGGGAGCTCCATCTGA\n>URS000109E99B rRNA from 1 species 
\nTACGAAGGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGTGCGTAGGTGGTGAGTTAAGTCTGTCGTGAAAGCCCCGGGCTCAACCTGGGAATGGCGATGGATACTGGCTCGCTAGAGTGCGGTAGAGGAGAGTGGAATTCCCGGTGTAGCAGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAGGCGGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTGGGGAGCGAACAGG\n>URS0001484F89 rRNA from 1 species \nCCTACGGGTGGCTGCAGTGGGGAATATTGGGCAATGGAGGCAACCCTGACCCAGCAACGCCGCGTGAATGATGAAGGCCTTCGGATTGTAAAGTTCTTTTCTTCGGGACGAAGAAAGTGACGGTACCTTAGGAATAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGAGGCAAGCGTTATCCGGAATGACTGGGCGTAAAGGGTGAGTAGGTGGTTGGACAAGTTAGACGCGAAATTCCGGGGCTCAACCCTGGAACTGCGTCTAAAACTGTTGGTCTTGAGTGAAGGAGAGGCAGTCGGAATTCCGGGTGTAGCGGTGGAATGCGTAGATATAAGGAGGAACACCAGTGGCGAAGGCGGATTGCTAGACTGTAACTGACACTGAGGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCCAGTAGTC\n>URS0002155384 rRNA from 1 species \nTCAAGTTACTAAGGGCATGTGGTGGATGCCTTGGCGCCTGGAGCCGATGAAGGACGTGGCGTGACTGCGAAAATCCCTGGCTAGCTGTCAAGCGAGCTTAACCGGGGGTATCCGAATGAGGCAACTCAGCTCAATTTTATTGAGTTACCGCTGATTGAACACATAAATCAGATGGAGGGAACCGGGGGAACTGAAACATCTAAGTACCCTGAGGAATAGAGATTATTCCCTTAGTAGCGGCGAGCGAACGGGGAACAGCCCAAACCGTCTTCTGCGGAAGGCGGGGTTGTAGGACAGTTCATATGGAGTTACAAATTGTTTCGATAGCTGAAGCGCCTGGGACGGCGTGCCACAGATGGTGACAGCCCAGTAAGTGACATTGAAACAACTCCGAGCTGTATCCTGAGTAGTGCGGGACACGAGAAATCCCGTATGAATCTGGGAAGACCACTTTCCAAGGCTAAATACTCCAGGCGACCGATAGCGTATAGTACCGTGAGGGAAAGGTGAAATAGTACCCCGAGAGGGGAGTGAAATAGTTCCTGAAACCGCATGCTTACAAGCAGTTGGAGCCAGTTCGTTCGCGAATTGGTGACAGCGTGCCTATTGAAGAATGAGCCAACGAGTTACGTTCAGTGGCAAGGTTAAGCGATGAGAGTCGTGGAGCCGTAGCGAAAGCGAGTCTTAAAAGGGCGAAAGTGGCTGGACGTAGACCCGAAACCGAGTGATCTACCCATGGGCAGAGTGAAGCGGGAGTAATGCCCCGTGGAGGCTCGAACCTTCCTGAGCTGCAAATCAGTTGGATGACCTGTGGGTAGCGGAGAAATTCCAATCGAACTCGGAGATAGCTGGTTCTCCTCGAAATGTATCTAGGTACAGCCTCGTGTGTTTTCTTCTGGGGGTATGGCTCTGAATGGACTAGGGGGCATAGCGCTTACCAAACCCAATCAAACCGGGAATACCAGAAGATTAGAACGCGGGAGTGAGACTGTGGGAGCTAACTTCCATGGTCAAGAGGGAAACAACCCAGACCCCCGGCTAAGGTCCCTAAATCCATGCTCAGTGTGCAAGGATGTCCAGTTGCATAGACAACCAGGATGTTGGCTTAGAAGCAGCCACCATTTAAAGAGTGCGTAACTGCTCACTGGTCGAGTGGCCGGGCGCCGACAATGTAACGGGGCTCAAGCATGGTACCGAAGCTAGGGGACCGCTTTTTAGCGGTCG
GTAGAGGAGCGTTCTGTATGCGATGAAGCTGTGCGGGTGACCGTCGGTGGAGCGTACAGAAGTGAGAATGTTGGCATGAGTAGCGAAATTCAGGTGAGAACCCTGAACGCCGTAAGCCCAAGGGATCCTACGCAAAGCTAATCCGCGTAGAGTTAGGCGGGCCTAAGCCGAGGGCGAGAGCCGTAGGCGATGGACAGCAGGTAAGTATTCCTGCCCCACCATATGGGCGTTTGAGATGTGAGGTGTGACCCAGAAGGATAGACAGAGCGGGCCCTGTGGACATGGTCCGTCCCTACACCGTAGGCGTCTGACGATAGGAAAATCCGTTGTCAGGTTAAGCGGAGGGTGAGGGGGGCAGTGGAGACTTCGGTCAAAACGACTCTGTTGAGTCCATGCTGGCTAGAAAAGCATCGGCATCGAGTGCATATGGTGTCCGTACCGCAAACCGACACAGGTGGGCGACGGTAAGTACCGTAAGGCGAACGAGAGAACCTTCGTTAAGGAACTCGGCAAAATAGCTCCGTAACTTCGGGAGAAGGAGCGCCCTTGTGAGTGAAACACTTTACGTGTGGAGCATCACGAGGGCCGCAGTGAGCAGGCCCAGGCGACTGTTTAACAAAAACACAGGTCTCTGCGAACCAGTAATGGGATGTATAGGGGCTGACGCCTGCCCAGTGCCGGAAGGTTAAGGAGATGGCTGAGAGGCCAGAACTGAAGCCCCGGTGAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCCGCACGAATGGCGTAACGATCTGGGCACTGTCTCAACGAAGGACTCGGCGAAATTGAGATGGCCGTGAAGACGCGGCCTACCCGCAGCAGGACAAATAGACCCCGTGGAGCTTTACTGCAGTTTTGCGCTGGCGTATGTGATTAGTTATATAGTATATGGGGGAGGCTTTGAACCATGACCGTCAGGTTGTGGGGAGCCGTCAGTGGAATACCCCATTTCTAATTTTGTACTCCTCACCAGTGAGCAAGCACTGGGACAGCGCATGATGGGCAGTTTGACTGGGGCGGTCGCCTCCGAAAGAGTAACGGAGGCGCGCAATGGTTCCCTCAAGGTGGATGGTAATCACCTGTCGAGTGCATTGGCATAAGGGAGCTTGACTGCAAGACAGACAAGTCGAGCAGGGGCGAAAGCCGGCCAAAGTGATCCTATGGTCCCGAGTGGAAGGGCCATGGCTTAACGGATAGAAGCTACCCCGGGGATAACAGGCTGATCCTTCCCAAGAGTTCACATCGACGGAAGGGTTTGGCACCTCGATGTCGGCTCGTCGCATCCTGGGGCTGAAGAAG\n>URS000254E3BB rRNA from 1 species \nAACGGCTATACCATGCTGAATATACCGGTTCTCGTTAGATCACCAAAGTCAAGCATCAGTGGGCGCAGTCAGTACTTGGGTGAGTGACCATCTGGGAACACCGCGTGCCGTT\n>URS00000821D9 rRNA from 1 species \nTGCGAACGTTTGCGGCGGGCCTAACACATGCAAGTCGAACGCACTAGCAATAGTGAGTGGCGCACGGGTGCGTAACACGTGGGTAATCAACCCTTCAGCCTGGGATAACGACTCGAAAGGGTCGCTAATACCGGATACGGCGCGAGAGGCTTCGGCTTCTCACGAGAAAGCCACGCAAGGGGCACTGAAGGACGAGCCTGCGGCCCATCAGCTAGTTGGTGAGGTAAGAGCTCACCAAGGCTAAGACGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCCACGCCGCGTGAGCGATGAAGGCCTT\n>URS00005A9635 rRNA from 1 species 
\nGGGGCCTGCGGTTAATTTGCTCAACACGGGGAAACTCACCAGGTCCAGACACAATGGGTTGACAGTTGATAGCTCTTTCTTGATCTTGTGGTTGGGGGCATGGCCGTTCTTAGTTGGTGGGTGATTTGTCTGGTTAATTCCGATAACGAACGGCCATCCCCTGCTAAATAGCCGGCCGGCTTTGGCTGGTCGCTGGCTTCTTAGAGGGACTTTTAGCGTTTAGCTAAAGGAAGTTGGTGGCAATAACAGGTTAACGTCTATAATCACAGGCCTGTAAAAGCGGTGGTGCCAACTTATAAGTGCTAGTGATCTAGTGCTACAAAATCCGCTAGTCCAAGAGGTTAATCGATGCGGAAAAGCTTTCCATAGTCGGGCATCGAGAGTGTTTTAACTAACACTTGCTTCTGGGCGACACAACCTGGTACAGGGAACGCCAAACAGGTAATGCTGAGGTCGATCCTGTGGTGAGTTAGAGTAGCGTCTAACCATCGCAACGCGCGCAAAGGTGTGGGTCTTATCTGTGGATAAGGCTTAAGGTACGTGCTAATCCCACTAGTAATAGTGGTTTGCTTGAGAGCCCACAGCTAAATCAGTAAAGGGTTTGGACTTTAAGTTCAGACCGAATCCATTA\n>URS0000F720C2 rRNA from 1 species \nACGGGAGGCAGCAGTGGGGAATATTGGGCAATGGGCGAAAGCCTGACCCAGCAACGCCGCGTGAAGGAAGAAGGTCTTCGGATTGTAAACTTCTTTTATGAGGGACGAAGGACGTGACGGTACCTCATGAATAAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATGCAAGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGTAGGCTGTGCGACAAGTCAGGGGTGAAAGCCCGCCGCCCAACGGTGGAACTGCCTTTGATACTGTCGCGCTGGAATACGGATGCCGTGGGAGGAATGAGTAGTGTAGCGGTGAAATGCATAGATATTACTCAGAACACCGATTGCGAAGGCATCTCACGAATCCGTCATTGACGCTGAGGCACGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTA\n>URS0002411ED0 lncRNA from 1 species \nAGCATTATATCCCCACGTTTGGCACATTAATCAACCCAATGTCAATCAAACCAATTGCAAAAGTCCTTTTCTTGGGTAAGTAAGTCTCCTACAACTCGCTAACCCTTTCTAATTGCTACAGGTTTTGTCTTAGAAGCACATAAGGGTATGGACATAGTCATGGATACGCATGTCAAGGAGGACACGTGTGTCCATAACGCGTCCCCAATGAGTCCAATAAAAAAAATAATTAAAAAATAGACAAGCCAAGTGGCATGTCAGTGTTCGACACGTGTCACACAC\n>URS000239296D lncRNA from 1 species 
\nTTTTTCCAAAACAGCAAAGCACGTCTCCTTAATAAAAGCACCAAGAACTTTACATGAATGTATTTATCGAAGATTCAGTAGCAAGGGCATTATTTACAAAAGGGACCATTTTGCCCCTTACAGGAGACAAAAAACAAACCCATTGAATTGGCATGATCTCAGAACAGCTCCATAATTTAATGAAACTCATGGATTCTCTTGAACTCCCCACCGCCCAAACCAAAATTGAACCTGACAAACAAGTACTGCAAATCACAAAAAAATAACCCACTCTTACTGGCTATTTTCACGCTTGTTTTTGCTGCTTCCACTCTCTTCCCCCTCCCCTGTGGCGTGACCTGTAACCACGTCTATTCAAAAACAAATTTGGAAATAGCAAGCTAACGCCGGTAAAAGAAACAGCAAAAAAGGAAACAAATAACCCTCTTTGATATTTAATACTTGATGACAACGTCAAGATTTCTTTAAAAACTACTGTTACTGTTATTTCCACGCTTGTTTTTGCTGTTTCCACTACCTTCCCCTGCCGCACCCTGACCTGTAACGACATCTCTTCAAAAACAAATTTGGAAATAGCAAGCTAACGCCGATAAAAGAAACAGCAAAAAATGAAACAAATACCCTCTTTGATGTCTAATACTTGACGACAAGGTCAAGATATCTGAAATTGAAAAAAATATGCAGAGAAAAACAGAGTTCTTGCCAAATCCAGATGAAAAAGCATGAAATTGTGGGAATTAGACATGGGTTTTGCTTAATTGTGAAGAGGGTTGGGGCCGGAGGGGACTAGTCTCTTCTCAACGCCGTATCTTGGATCGATTTCGTCGATTGGCGGCAGCGGTGGTGACAGAGGAGGGCCGTGGGGGATTCTTGGAAGGTTGTAGTAGCACATGGTGTTGCAAGAACGGGGTATATGGTGGCAGTGGTGGTGGCGGCTTTGGCTTGAAGAGGTTTCCCGCGACTTTGGGTTTGGTAATACTTGGGCCGATGATGATGATGGGACTATGAGTAGAAAAATTGTGAGAATCTGTAGGTGGCTAATGAGTGGCATGGTTGAAGAGAGAGAGAGCTCTTCACGGCTTGCACTCTGTGCTTAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGGAGTGGTGGTGGTGTTTATAGGAGGAGACGGGAAACTTGATTAATTTCAATCTTGATAGTAAAGATGACAACAAC\n>URS00025DB68B rRNA from 1 species \nATGAGCATGCAGTTGATGGTAGCCACTTTCAATAACTACCAGGAGTTAGTAGATCGTGCGCTTATGATTGAAGGAAAGCAGCAGCAGATTGACAATCGTAAGAGGAAGTATGCACAGGGGAAGTACAATTCTGGAGCTCAGCAGAAGCCACGTTTTACCCCAAAGTCAGGGGACACTTTCAGCATACTCATGGAGGAGGCAGCTCGCACAATCATAATGGCACAAAGAATGGAAACGGAAATGGAGGAAGCAATGGACAAAACCGCACCAACCCGTCAACACCATCCAAGGCAGACCTGA\n>URS0000382751 rRNA from 1 species 
\nGATCGACCGCAGTCTACGAACCATGACTGCATGTACCGAACGATCGGGTAAGAAGCTCATAAGTACTGTAGAGAACGAGTCTATCATTGTGACGTACTAGATAGCCCGCTACTACGTCAGCAGCGCGTATCGGTAGTCGAGCGTATCGATTACTGCGTAAGCAGGCAGACGTATAGCAGATGTGAAATCCTGCTCAACTGGAACTGCGTCTGAACTGATAGCTAGAGTGGTCAGAGGGGGGTAGATCACGTGTAGCAGTGAATGCGTAGAGATGTGGAGGATACCGATGCGAAGCAGCCCCTGGATAACACTGACGTTCATGCTCGAAGCGTGGGTAGCAACAGGATTAGATACCCTGGTAGTCACGCCTAAACGATGTCGATTAGCTGTTGGGCAACTTGATTGCTTAGTAGCGTAGCTAACGCGTGAAATCGACCGCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGATGATGTGGATTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATGTACGGAACCTTCCAGAGACGGAAGGGTGCCTTCGGGAGCCGTAACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCATTAGTTGCCATCATTTAGTTGGGCACTCTAGCGAGACTGCCGGTAATAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGCTGGTACAACGAGTCGCAAGCCGGTGACGGCAAGCTAATCTCTTAAAGCCAGTCTCAGTTCGGATTGTAGGCTGCAACTCGCCTACATGAAGTCGGAATCGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGTCGGTGAGGTAACCGTAAGGAGCCAGCCGCCTAAGGTGGGATAGATGATTGGGGTGAAGTCGTAACAAGGTAGCCGTATCGGAAGGTGCGGTTGGATCACCTCCTTC\n>URS000256CAD8 rRNA from 1 species \nATGTCATGTGCATTCCCTGTGCCCATTATTTGCTCACATGACATGATTGCCATGATTTCTTCTAGTGTGTTGCATTTTCGCTCCACTAGTTTGCACGACTTGATTACTATGCTTCCTTATGTTGCATCACCAATGACTCATACTTGCTCATTTCATGCGGTTGACGACAACCATCTATATGCTTTGCACACGATTCATATTGCTCCTTGTCATATCTCTCCATATGTTGACTCCCTCATGCTAGATGATTTGCCATGTATTGAGTGCAATTATGCCTTTATTCCTTATAATGAGTTTGCCCCCATAGCGCATTCTCACATATATTTGGAGATTTTGACATATTCCTTGTGA\n>URS0001407240 rRNA from 1 species \nGACGGAGGATGCAAGTGTTATCCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGCACTGTTAGTCAGGCGTGAAAGTCCTGGGCTCAACCTGGGAACTGCGCTTGATACGGCAGAGCTAGAGGATGGAAGAGGCTCGCGGAATTCCCAGTGTAGAGGTGAAATTCGTAGATATTGGGAAGAACACCGGTGGCGAAGGCGGCGAGCTGGTCCATTACTGACGCTGAGGCGCGACAGCGTGGGGAGCAAACAGG\n>URS00021EF7D7 rRNA from 1 species \nACTTACGGCCACACCGCCTGGTTCACGCCCGATCTCGTTTGATCTCGGAAGCTAAGATAGGTTGGGCCTGGTTAGTACTTGGATGGGAGACCGCCTAGGAATACCAGGTGCTGTAAGGC\n>URS0000188C7A rRNA from 1 species 
\nGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGTGATTTTTGTGGAAATTCTTTCGGGAATGGAAATGAAATGAAAGTGGCGAACGGGTGAGTAACACGTGAGCAACCTACCTTACACAGGGGGATAGCCGTTGGAAACGACGATTAATACCGCATGAGACCACAGAATCGCATGATATAGGGGTCAAAGATTTATCGGTGTAAGAAGGGCTCGCGTCTGATTAGCTAGTTGGAAGGGTAAAGGCCTACCAAGGCGACGATCAGTAGCCGGTCTGAGAGGATGAACGGCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGGAACCCTGATGCAGCGACGCCGCGTGAGCGAAGAAGGTTTTCGAATCGTAAAGCTCTGTCCTATGAGAAGATA\n>URS0000626BAC rRNA from 1 species \nTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAAGGAAGAAGTATCTCGGTATGTAAACTTCTATCAGCAGGGAAGATAATGACGGTACCTGACTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGGCGGCGGAGCAAGTCAGAAGTGAAAGCCCGGGGCTCAACCCCGGGACGGCCTTTGAAACTGCCCTGCTTGATTTCAGGAGAGGTAAGCGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTACTGGACTGACAATGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAATACTAGGTGTCGGGGCTCATAAGAGCTTCGGTGCCGCAGCAAACGCAATAAGTATTCCACCTGGGGAGTACGTTCGCAAGAATGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGCCTTGACATCCTGCTGACCGGTGAGTAATGTCACCTTTCCTTCGGGACAGCAGAGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATGTTCAGTAGCCAGCATTAAGGATGGGCACTCTGGACAGACTGCCGGGGATAACCCGGAGGAAGGCGGGGATGACGTCAAATCATCATGCCCCTTACGGCCTGGGCTACACACGTGCTACAATGGCGTAAACAAAGGGAAGCAAGAGGGTGACCTGGAGCGAATCCCAGAAATAACGTCCCAGTTCGGACTGTAGTCTGCAACCCGACTACACGAAGCTGGAATCGCTAGTAATCGCGAATCAGCATGTCGCGGTGAATACGTTCCC\n>URS00017894DA rRNA from 1 species \nTACGTAGGGGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCGTGTAGGCGGTCCGGTAAGTCAGCTGTGAAAGTCAAGGGCTCAACCCTGGAATGCCGGTTGATACTGTCGGGCTAGAGTCCGGAAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAATGGCGAAGGCAGCTCGCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTGGGGAGCAAACAGG\n>URS00003589C1 rRNA from 1 species 
\nCCGCGAATTCGCCCTTCGGGGTGCACCAGGCGCGAAACCTTTACAATGCTGGCAACGGCGATAGGGGGACCTCGAGTGCCAGGTTACAAATCTGGCTGTCGTTGTGTCTAAAAAACACGATATAGCAAGGGCCGGGCAAGACCGGTGCCAGCCGCCGCGGTAACACCGGCGGCTCGAGTGGTAACCGTTATTATTGGGTTTAAAGGGTCTGTAGCCGGCCTGGTTAGTCCTTTGGGAAATCCGGCAGCTCAACTGTCGGGCTTTCAGAGGATACTGCCAGGCTCGAGACCGGGAGAGGTAAGAGGTACTTCAGGGGTAGGGGTGAAATCTTGTAATCCTTGAAGGACCACCAGTGGCGAAGGCGTCTTACCAGAACGGATCTGACGGCAAGGGACGAAAGCTAGGGGCACGAACCGGATTAGATACCCGGGTAGTCCTAGCCGTAAACGATACTCGCTAGGTGTCGGCCACGGTGCGACCGTGGTCGGTGCCGTAGGGAAACCGTGAAGCGAGCCACCTGGGAAGTACGGCCGCAAGGCTGAAACTTAAAGGAATTGGCGGGGGAGCAC\n>URS00024242CB lncRNA from 1 species \nCTAGGTCTTAGTTAATAATTGTTTTTATATTTTCAACTTATACCCCATTGAAAAACCCAACAGCCAAGCGGCTGGGTTTAATTATGGTAGTCCAACAGATTTTTTTTTATTAGTTTTTATTTTAATCCTAATTTTTAATCTATCTTGATTTATATATCCAAGTTGTTGTTGTAAATAATAACTAGTCATGAATGGCCTAGAGGAGAGAGGGTAGTTTCTAGGTCTTTAGTGGAGTGGGTTCAATACCCACATTTGTAGCATTTTTTTTTCTTTTAGCATTTTATTTCTTTTAGCATTTTTTATGTTTATGTTTT\n>URS00010F895C rRNA from 1 species \nACGAACGCTGGCGGCGCGCCTAACACATGCAAGTCGAACGAGCGAGAGAGAGCTTGCTTTCTTGAGCGAGTGGCGAACGGGTGAGTAACGCGTGAGGAACCTGCCTCAAAGAGGGGAACAACAGTTGGAAACGACTGCTAATACCGCATAAGCCCACGACCCGGCATCGGGTAGAGGGAAAAGGAGTGATCCGCTTTGAGATGGCCTCGCGTCCGATTAGCTAGTTGGTGAGGTAACGGCCCACCAAGGCGACGATCGGTAGCCGGACTGAGAGGTTGGACGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGGAGGAAGAAGGTCTTCGGATTGTAAACTCCTGTTGTTGAGGAAGATAATGACGGTACTCAACAAGGAAGTGACGGCTAACTACGTGCCAGCCGCCGCAGTAAGAC\n>URS000253A30D misc_RNA from 1 species \nTCCGGGTTTCGCCCGGCAGTCTCCCTAGATTATTCAACATAGGACAAGGGTTGCGCTCGTTGCGGGACTTAACCCAACATCTCACGACACGAGCTGACGACAACCATGCACCACCTGTGTACGGCCCAAAAGGACACCGTATCTCTACGGCTTTTCCGTACATGCCAAACCCAGGTAAGGTTCTTCGCGTTGCCTCGAATTAAGCAACATGCTCCGCCGCTTGTGCGGGCCCCCGTCAATTCCTTTGAGTTTTAGCCTTGCGGCCGTACTCCCCAGGCGGGGCACTTAATGCGTTAGCTACGGCACAGATCCCGTTGGTTGAGACCCACACCTAGTGCCCAACGTTTACGGCGTGGACTAC\n>URS000078C8E8 rRNA from 1 species 
\nCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCGACGCCGCGTGAGGGATGACGGCCTTCGGGTTGTAAACCTCTTTCAGCAGGGACGAAGCGCAAGTGACGGTACCTGCAGAAGAAGCGCCGGCCAACTACGTGCCAGCAGCCGCGGTAAGACGTAGGGCGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGCTTGTCGCGTCGACTGTGAAATCCCGCGGCTCAACCGCGGGTCTGCAGTCGATACGGGCAGGCTAGAGTTCGGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCAGGTCTCTGGGCCGATACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGTTGGGCGCTAGGTGTGGGGGACCTCTCCGGTTCTCTGTGCCGCNGCACGCATAGCGCCCGCCGTCGGGAGGTACGGCCGCGACGACGTAAACGTTAAATAGAGTTAGACGGCGTGAGACGTGACCGACGGACGACGACGAGGGAGGTTAGG\n>URS0000E2B2B0 rRNA from 1 species \nCCCCTAGTAACTGCGAGTGAAGCGGGAAGAGCTCAAATTTAAAATCTGGCAGTCTTCGATTGTCCGAGTTGTAATTTAGAGAAGTGTTATCCGCGCTGGACCGTGTATAAGTCTCCTGGAAGGGAGCATCATAGAGGGTGAGAATCCCGTCTTTGACACGGACTACCAGGGCTTTGTGATGCGCTCTCGAAGAGTCGAGTTGTTTGGGAATGCAGCTCTAAATGGGTGGTAAATTCCATCTAAAGCTAAATATTGGCGAGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGATGAAAAGAACTTTGGAAAGAGAGTTAAACAGTACGTGAAATTGCTGAAAGGGAAACGCTTGAAGTCAGTCGCGTTGGCTGGGGATCAACCTTTCTTCTGATTGGTGTACTTCCTAGTCGACGGGTCAACATCAGTTTTGACCGTTGGATAAAGGTTAGGGGAATGTGGCATCCTCGGATGTGTTATAGCCTCTGATTGTATACAATGGTTGGGACTGAGGAACTCAGCACGCCGCAAGGCCGGGTTTTTAACCACGTACGTGCTTAGGATGTTGGCATAATGGCTTTAATCGACCCGTCTTGAAACACGGACCAAGGAGTCTAACATGCCTGCGAGTATTTGGGTGGAAAACCCATATGCGTAATGAAAGTGAAAGTTGAGAACTCTGTCGTGGAGTGCATCGACGCCCAGACCAGACCTTCTGTGACGGATCTGCGGTAGAGCATGTATGTTGGGACCCGAAAGATGGTGAACTATGCCTGAATAGGGTGAAGCCAGAGGAAACTCTGGTGGAGGCTCGTAGCGATTCTGACGTGCAAATCGATCGTCGAATTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCTGCCGAAGTTTCCCTCAGGATAGCAGAAACTCATTATCAGATTTATGTGGTAAAGCGAATGATTAGAGGCCTTGGGGTTGTAACAACCTTAACCTATTCTCAAACTTTAAATATGTAAGAACAAGCCGTCTCTTGACTGGACCGCTTGGCGATTGAGAGTTTCTAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGAACGCGAGGTTAAGGTGCCGGAATTCACGTTCATCAGACACCACAAAAGGTGTTAGTTCATCTAGACAGCAGGACGGTGGCCATGGAAGTCGGAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATGAACTAGCCCTGAAAATGGATGGCGCTTAAACGTGATACCCATACCTCGCC\n>URS00007CECD4 rRNA from 1 species 
\nACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCCATGCCGCGTGAATGATGAAGGTCTTAGGATTGTAAAGTTCTTTCGCTCGTGACGATGATGACGGTAACGAGAGAAGAAGCCCCGGCTAACTTCGTGCCAGCAGCCGCGGTAA\n>URS00004EF8E6 rRNA from 1 species \nGAATCTGCCTGTGGGTCGGGGACAACCACTGGAAACGGTGGCTAATACCGGATGAGCCGAAAGGTAAAAAATTTATTGCCCACAGATGAGCTCGCGTCTGATTAGCTAGTTGGTAAGGTAAAAGCGTACCAAGGCGACGATCAGTAGCTGGTCTGAGAGGATGAGCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTCCGCAATGGGCGAAAGCCTGACGGAGCAAGACCGCGTGGGGGAGGAAGGTTTTTGGATCGTAAACCCCTTTTGTCAAGGAAGAAGTTCTGACGGTACTTGACGAATAAGCCTCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGAGGCAAGCGTTATCCGGAATGATTGGGCGTAAAGCGTCTGTAGGTGGCCAGCTAAGTCTGCTGTTAAAGATCACAGCTCAACTGTGGGAAGGCAGTGGAAACTGGCAAGCTAGAGGCTGGTAGGGGTAAAGGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGGGAAGAACACCGGTGGCGAAAGCGCTTTACTGGGCCAGACCTGACACTGAAGGACGAAAGCTAGGGGAGCGAAAGGGATTAGATACCCCAGTAGTC\n>URS0001F5106B rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCAAATGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATGACGGCCTTCGGGTTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTG\n>URS0001EC9022 rRNA from 1 species \nACGAACGCCGGCGGCGTGCTTAACCCATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATGACGGCCTTCGGGTTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTG\n>URS000222C3C5 misc_RNA from 1 species 
\nAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAGCTCGTAGTTGAATTTCGGGATCAATATGTTGGTCGTGCCTCGGTACGTACTAGCATATTGGTTTCTCCTTTCTGAAGAACCATGATGTCATTTATTTGGTGTCGTGGGGAATCAGGACTGTTACTTTGAGAAAATTAGAGTGTTTAAAGCAGGCTCACGCTTGAATACATTAGCATGGAATAATGAAATAGGACGTTTGATTCTATTTTGTTGGTTTCTAGGATCGACGTAATGATTAATAGGGATAGTTGGGGGCATTAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGGGATCGGATGATGTTAATTTTTAATGTACTCTATTCC\n>URS0002325A80 pre_miRNA from 1 species \nAAAAAGACAAACCCTGGTTTCCGTGCCCAACGTTTGACCGTCTGTCTTATTTAAAAAAATTATGAAAAAAATTAAAAAGACAAGTCATGCATAAAATATTAATCATGTTTTATCATCTAACAACAATGAAAATACGAATTATAAAAAAATTTCATATAAGACGAACAGTCAAAGTTGGACACGGAAAACCAGGGTTTGCCTTTTT\n>URS000130A086 rRNA from 1 species \nGTAGGTGGCAAGCGTTGTCCGGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTTCTTTAAGTCTGATGTGAAAGCCCACGGGCTCAACCGTGGAGGGTCATTGGAAACTGGAGAACTTGAGTACAGAAGAGGAAAGCGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGGCTTTCTGGTCTGTAACTGACGCTGAGGCGCGAAAGTGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGGCCGCAAAGGCTG\n>URS00002466F2 rRNA from 1 species \nCCCCTACGGGAGGCAGCAGCGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGGGGGTGAAGGCCTTCGGGTTGTAAACTCCTTTCGCCCGGGACGAAGCCCACCTGGTGGGTGACGGTACCGAGCGAGGAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATGGGG\n>URS00012DC715 rRNA from 1 species \nTACAGAGGTCTCAAGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGCGGCGCGGTAAGTCGGGTGTGAAATCTCGGAGCTTAACTTCGAAACTGCATTCGATACTGCCGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCGGTGAAATGCGTAGATATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACGCTGAGGCACGAAGGTCAGGGGAGCGAAACGGGGATTAGA\n>URS000259BFCE rRNA from 1 species 
\nTACGAAGGGGGCTAGCGTTGCTCGGAATCACTGGGCGTAAAGGGTGCGTAGGCGGATCTTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGAAGGTCTTGAGTTCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAGGAACACCAGTGGCGAAGGCGGCTCACTGGCTCGATACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGG\n>URS000164E0EC rRNA from 1 species \nCAGTCGCCACGGTAATACGGAGGGAGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGTTACTCAAGTCAGAGGTGAAAGCCCGGGGCTCAACCCCGGAACTGCCTTTGAAACTAGGTGACTAGAATCTTGGAGAGGTCAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAGGAGCACCAGTGGCGAAGGCGGCTCACTGGTCCGGTACTGACGCTGAGGTGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCCCGTAGTCCCTGTCTCTTATAT\n>URS0000370A15 rRNA from 1 species \nATTGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGGCAGCACAGCAGTAGCAATACTGTGGGTGGCGAGTGGCGGACGGGTGAGGAATACGTCGGAATCTGCCCAGTCGTGGGGGATAACTAGCCGAAAGGTTAGCTAATACCGCATACGACCGAGAGGTGAAAGCGGGGACCGCAAGGCCTCGCGCGATTGGATGAGCCGACGTCGGATTAGCTAGTTGGCGGGGTAAAGGCCCACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGTGTGAAGAAGGCCTTCGGTTGTAAGACGACTTTATTCAGGACGAAAAGACGTT\n>URS00019773DC lncRNA from 1 species 
\nACACTTATTGAAGATTTATCTTGTATAGATTCTTTCTAAACTGCTTTATATATTCACTCATGTCATCATCACATAAACCTATGATGCAGGTAATAGTATTATCTCTCTTTTACAGATAAGAATACTAAAGCATGGAGAGATTGCTAGCACTAAATCACTTAGCTAATAAATGTCAGGATAAGAATTTGAGTACAGGGAGTCCAGGTCCAGAGTCTGTCCACTTAGTGCTGCCAAGTTGTGTGCGTGTTGGGGGCAATGGGTAGGTTAGAGGCAAAGATAGAGATATATAGATAGTTTTCAAGAGTTCCTGCCATGCCTCAGTGGAAAAGAATCTGACTAGTATTCATGAGGACACAGGTTCGATCCCTGGCCTCGCTCAGTGGGTTAAGGATCTGGCATTGCTGTGATCTGTGGGGTAGGCCATAGATGTGGCTTGGATCCCATGTTGCTGTGGCTGTGGTGTAAGCCGGCAGCTATAGCTCCGTTTTAACCCCTAACCTGGGAAAATCCATATACTGAGGGTGTGGCACTAAAAAGACAAAAAAAAAAAAAAAAAAAAAAAAAGAGAGAGAGAGATAGTTTTCAGATTCTTAATCTTGGTTACATTGGTGAATGGAGTTGGGCATAAAAGGTTGTTGCTTAATGTGGGATGTGATGAGTTTTTTTTTAAAAAACAGCAAGCAAGAAAGAAAAGTTTCACTTATAATTTGATAATGATTAAATTTTTATAATCTGCATCATCACTTTTACCATAAAAATTTCAAACCTGAAAAAATATTCTTTTTTCCTTCAACACATTTAGAAATACTGCTTTTGATTCTAAAAACAAAAAGAATGTAGATGTGGGCGTTCCCGTCATGGCGCAATCCAACTAAGAACCACGAGGATGTGGGTTTGATCCCTTGCCTTACTCAGTGGATTAGGATCCGGTGTTGCCGTGAACTGTGGTTCAGGTCATAGATGCGGCTTGAATCCTCCATTGCTGTGGTTGTGGTGTAGGCTGACAGCTGCAGCTCCAATTCAACTGCTAGCCTGGGAACCTCTATATGCCACAGGTGCAGCCCTAAAAAGCCTTAAAAAAAAAAGAATTTGTCTGTACTACAGGCCCAGTTTGCCACATATACATCTATGTCCTTGGGTCTTGACTTGACCACACCATGCTTTAGTTTCCTCTCCTGCATAAAAGGAATCATGATCCGTCCTCCCCCACTGGCTTGTGGTGAGTATCCAGTAACATCAGAGTTAAGTGCTCTGTGCAATGCCTGGTGCTTTATTCATCTCTCTCAACATTAGCTACCATAGTCATCATTGCCAGGCTGAACTCTTATTGCCCCTTCTCCTGGCCATTTGGAATTAAGATTGCAAACTGATTAAGTCATCTGAAGCAGTCAAGATACCAGGACAATGACGTTGGTGTGCTGAATAGAGAGTGTAAGTATACATGAGAGACTATCCTCAAGTAACTACTGATTAAAAACTGTTAAGTAGTTGTCAACTGGAAAACAAATGCACCATATGAGTTGTGAGTTAAGCTGGGGCAAAATGATGACTATAGCCTGGGAGAAAGCATTTCATATGGCTCTGAAAAACTGCTTTGAAGAGGTAGGAGAATAATATCAGTATATATGTGGTTTTGGTGAAGGGGAGGTACATGCAATCAAGCACAGATTTTGCAGAAGGTCACTGCTAGTCTTGTGAAGGTTACTGCTAATCATGAGGAGCAGATGTATCCACTAATGATTTCATTGCTTCTTTAGATATGAGAAGATGCAAGAATTCAGCGCATAAAATCTTTTAAAAATATCTAACTATCTGAAGGCCTGTTCTGCCAGGGATTCCCAGGCTGCCTCAATCCAGATCTCTACCTTAAACTCTTTCCAAGGGGTATTGAAGGTCAGGGGCTGCAGTGGCTTGTGCCTTAATCCTTGTAGAGACAGATGGCAAGTACCAATTTTTAGTAGTCAAAGGCTTGACCTGCAATGGTGACCTTGACAATGG
TCCACCCCCTGAAGTGCTCCAAGCATTGGAGTTTTAGAAATCCAACCTCTGCCCATCAGCTCTCAGAATAAGGGGTCCCTTTTGTTCAAAATGGTGGTGTCTGCCATTGCTCCTTGTTTGCTCAGTAAGGATGAAAAAAGCCCAATAACATTATAAACCCTTCTTAACTCCTGCCTTTTACTTTTGAGGGAAGACTATGTATTCAGGAAGTGCTCATGGCAAAGCCTATTTAAGAAATAAAAAGAACAATAACAAAACATCTCAGAAATTCCTTTTGAAAACAAGAGCCCAGAACTTGCCTGAGACTTAATTGCCGCACACACACACACACACACACACACACGTGCACACACATACAGAGCTTGTCTCCTACATTTTCAGACTGTTTTAAAGTACAAGGCACAACCAGGTTAATAAAACATGCTTGAGGCTATGTTCTGTTTGTTCATTACACTATAAAGCATTTTAAACCTACAATTAATTTTAGATAAATTAAAGATTTGACACAGCCATGGTACTCGTGCAAGAGCATTTGTGTTAATATCTTATATTTTTCATACTCAATCACCCTGCTGAAAAGTTTAACAGCCTTCCATATTTATAACTGCTTTCTAGATTCTTCTTTCTTTTTTTTTTTCCTACCTTAGTTGTCAAAAGCATTAACGAAGCTGGCTTTGGGGAAGAATTCCAATTCAGAGTTATTTTTCCATGAGGTACTTAAGACTCCACACGGCAGCTTGTGATTATGTTGGCAGTGGCTTTGCATAACTGTTGGTTTCCTGTAGTATAAATAAGTGAACAGCTAAGAATGCTAATGTTTTGCTTTGACTAAGAAAAAGCTCTCAATAAATGACAAGGAATTACCCTCATTGGACTACTTAAGTTTTTCTTTCTCCTTCCTTTAAAGGGGTAAGTTAAACCAAAGCAATAGAGATAAGTGATCACATAATACTTGCTACCGCTTTAAGATCATTCTTCAAGTTGCAAAAAAAAATCAAATTGTTTCATTCCCAAAGTCCTTTCTAGTTGAGAAATTGAAGTGGGAGAAAGGCCATGAGGATCACTGGAAAACGCCAATGCAAGCAGTGTCCAATTGCAGCTAAATACAGGGCAAAGAAAGTCAGAGCCTTTGCCCTCTTGAGATTTGGACCAAAAACAGGAAAAAGATGCTTTGGCTAGGAGAAAGGACAGACAGAGTTTAGGGAGGAAAGGTTGCAGAGGAGAAAGCTTGGCAAAAAAGGTGTATGCAGATGGAATTCTCAGGAGCAGCTCCTGAGAGAGGCTTTGCATCATGTCAGCTGTCATGGTCAGGAGCAGGACAGGGACTCTGTGGGATGAGATATTATGGACCTTGCACAGAGCCCTGGGCCTTTGGCTAATTCCACATCCTCCAAAATCTCGAGTACTAAATGTTCCCATCCAGTCTCATCTGTTTTCACTCTTTCCCTCACAGAAGACAATCCCAATAAATGGAGTAAAAGCCAGAGAAATGTCCTCCCAGGACACCTGGCAGCTACCATTGCCCACAAGCTTCTCTGATCCCCACCTACCTTCTACCCAGTGAAGACTCAGCCTTCCAGCTGCCATCCTTCTTTCCAGGACAGGTTGACTGCACTGCCTTGGTGGATGAGCCATTGTTCACTTGGCTGCTATTCTGCAGTTCTGTGTTTCTCCAAAGGGAACCCTCCTGCACTGCTGGAGGGAATGTAAACTGGTACAGCCACTATGGAGAACAGTTTGGAGATACCTTAGAAATTTATACATAGAACTTCCATATGACCCCGCAATCCCACTCTTGGGCATCTATCCGGACAAAACTCTACTTAAAAGAGACACATGCACCCGCATGTTCATTGCAGCACTATTCACAATAGCCAGGACATGGAAACAACCCAAATGTCCATCGACAGATGATTGGATTCAGAAGAGGTGGTATATATACACAATGGAGTACTACTCAGTCATAAAAAAGAATGACATAATGCCATTTGCAGCAACAT
GGATGGAACTAGAGAATCTCATCCTGAGTGAAATGAGCCAGAAAGACAAAGACAAATACCATATGATATCACTTATAACTGGAATCTAATATCCAGCACAAATGAACATCTCCTCAGAAAAGAAAATCATGGACTTGGAGAAGAGACTTGTGGCTGCCTGATGGGAGGGGGAGGGAGTGGGAGGGATCGGGAGCTTGGGCTTATCAGACACAATTTAGAATAGATTTACAAGGAGATCCTGCTGAGTAGCATTGAGAACTATGTCTAGATACTCATGTAGCAACAGAACAAAGGGTGGGGGAAAAAATGTAATTGTAATGTATACATGTAAGGATAACCTGACCCCCTTGCTGTACAGTGG\n>URS0000B9BAF2 tRNA from 1 species \nGTCTTCGTGGCTCAGTTGGTTAGAGCGTTGGTCTCATAGTATGATCCAATCTCAGGTTGGGATATCCAAAGGTCGTGAGTTCGAGTCTCACCGAGGACA\n>URS0000679C41 pre_miRNA from 1 species \nCTTTTAATATAAGTATGTCCCATGAAATATTTGGGATATGCTTATACTAAAC\n>URS00004B7CE6 rRNA from 1 species \nGGCCGCGGGAATTCGATTCAGGCCTAACACATGCAAGTCGAGCGATTCTCTTCGGAGAAGAGCGGCGGACGGGTGAGTAACGCGTGGGTAACCTGCCCTGTACACACGGATAACATACCGAAAGGTATGCTAATACGAGATAATATGCTTTTATCGCATGGTAGAAGTATCAAAGCTCCGGCGGTACAGGATGGACCCGCGTCTGATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCGACGATCAGTAGCCGACCTGAGAGGGTGATCGGCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAAGGGGCGAAAGCCTGATGCAGCAACGCCGCGTGAGCGATAGAGGCCTTCGGGTCGTAAAGCTCTGTCCTCAAGGAAGATAATGAC\n>URS0000D1B51B rRNA from 2 species \nAAGTCGAGCGGACCGACGGGAGCTTGCTCCCTTAGGTCAGCGGCGGACGGGTGAGTAACACGTGGGTAACCTGCCTGTAAGACTGGGATAACTCCGGGAAACCGGGGCTAATACCGGATGCTTGATTGAACCGCATGGTTCAATCATAAAAGGTGGCTTTTAGCTACCACTTGCAGATGGACCCGCGGCGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCGACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTTTTCGGATCGTAAAACTCTGTTGTTAGGGAAGAACAAGTACCGTTCGAATAGGGCGGTACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCCCGGCTCAACCGGGGAGGGTCATTGGAAACTGGGGAACTTGAGTGCAGAAGAGGAGAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAA\n>URS0000C4FCDB tRNA from 1 species \nGCCTTCGTGGTGTAACTGAAAGCATACTAGACGTGTATTCGATAGGTCCAGGGTTCGAGTCCCGGCGAAGGCA\n>URS00022EE1E1 rRNA from 1 species 
\nCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAATTTCGAGATCGGTTTATTGGTCGTGCTATTGTACGTACTGGTATTACCGGTTTCTCCTTTCTGACGAACCTTAATGCCATTAATTTGGTGTTTTGGGAAATCAGGACTGTTACTTTGAAAAAATTAGGGTGTTTAAAGCAGGCTCACGCTTGAATACATTAGCATGGAATAACGGAATAGGACGTTTGATTCTATTTTGTTGGTTTCTAGGATCGACGTAATGATTAATAGGGATAGTTGGGGGCATTAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGGGATCGGATGATGTTAATTTTTTAATGACTCATTCGGCGCCTTAC\n>URS00003E1810 rRNA from 1 species \nACGGGAGGCAGCAGTGGGGAATACTGCGCAATGGGAGAAAGCCCGACCCAGCAACGCCGCGTGAAGGAAGAAGGCCTTCGGGTTGTAAAACTTCTTTTAAGAGGGACGAAGAAGTGACGGTACCTCTTGAATAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCGAGCGTTATCCGGATTTACTGGGTGTAAAGGGCGTGTAGGCGGAGCAGCAAGTCAGAAGTGAAATCTCTGGGCTCAACCCAGAAACTGCTTTTGAAACTGTTGCCCTTGAGTATCGGAGAGGCAGGCGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCCTGCTGGACGACAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGAATACTAGGTGTGGGGGGACTGACCCCTTCCGTGCCGCAGTTAACACAATAAGTATTCCACCTGGGGAGTACGATCGCAAGATTGAAACTCAAAGGAATTGACGGGGGGCCCGCACAAGCAGTGGATTATGTGGTTTAATTCGACGCAACGCGAAGAACCTTACCGGGATTTGACATCCTGCTAACGAAGTAGAGATACATTAGGTGCCCTTCGGGGAAAGCAGAGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATTGCCAGTTACTACGCAAGAGGACTCTGGCGAGACTGCCGTTGACAAAACGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCTTTATGACCTGGGCTACACACGTACTACAATGGCGTTTAACAAAGAGAAGCAAGACCGCGAGGTGGAGCAAAACTCAAAAACAACGTCTCAGTTCAGATTGCAGGCTGCAACTCGCCTGCATGAAGTCGGAATTGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGCACTCACCGCCCGTCA\n>URS0000E780C0 lncRNA from 1 species 
\nGGCGAGGGGGACACCGTGGAGGGGGGTTGGGGGGGACGAGGCCGGGCAGCTCTCCCGCAGGGGGCCGGGCAGGGCAGCGGGGGTGGGCTCTGCTGGGCGTCATCCCCCCCTCCCCTTCTCCCCGGGGAACCGGGGCGGTGTGGGGGGGGGGCCGCTCCCGGAGCATCCCCCCTTTGCCCGGCTCCCCCCCTCCTCCTCCTCCTCCCCGCTTCCTCCGTTTAAAGGCCGGGTCCCGGCGGGGCCGAGCGGAGGAGCAGCGGCCGCTCCGCAGCCCCAGTGCCGCGGCGGGGGCGCGCAGCGCACGGGGCGGGCGCTGGATGCGGCGCCGGGGGCGGGCGGGCGGCAGCCGAGCGGCTCCGGTCCGGTGCCCGGTCCCCGGTCCCCTCCTCCCGTCCCCCCCAGCGGGTCCTCCCCGCGCGGCGGCGCGGAGCTGGGAGCGATGAGCGCGGCCGGAGGAGCCGGCACCGCGGCGGGCACCGCCACCTCCGCCCTCTGCCTGCTCCTCTCGCTCACCGCCGTGGCCGTCTGCCTGCTGCTGGGAGCCAAAACGGCGGAGCTGCAGGGCCGCCTGGCAGCCCTGGAGGAGCGCGGAGCCGCCGGTCCCGGCCCGCTGCTGGAAGCGCTGCAGCCCCGCCTGGAGCAGCTCCTCCGAGAGAAACTGGGTGAAGGACTAGCTAAGCTGCGGACAGCGAGAGAGGCTCCGTCAGACTGCATGTGCCCCCCAGGCCCTCCGGGGAGGCGAGGGAAGCCCGGACGGCGCGGAGAGCCCGGTAAGCATCGCGGTCACCCCACCGCTGTCACGGGGCTGGGCACAAACATCCCGGTACCGCTACCATCACCTCTCTCTGACGGGCTGGCTCCTGGTTAA\n>URS000240ACFD lncRNA from 1 species \nAACCTGTTAATATGATTAATTATTGCAGTCAGAAGCAATCAATTTCCTGAGAGAAAATAAAAGTATTTAGTATTTCCTGAGAAAAGAACAATAAGTACATAAATTGAAATTACAACAGCAATGAAAGGTGGAAACCAAATCAGAGAAGAAGATAAAACTGGCAGAGGAGTGGAGATGTTTTGCCGCACGAAAAAAAAAAGTCAACAAAAAATACCGCATTAAACGTAAGATGATCCTTCGGATATGGTAAATAAATATATCCGATGAGATGAATTCAAACTATTATTGCGACTGTAGAGGAATTAACATGCTGGAACGAAGTCGCCCTAATTTTTCGTCTAGGGAGGGCAACTCGGGAGTCGAAGCGACGCTAGAGATGAAGGTGGAATGAAAAGTCTCTGAAGGAATTAAATGGAAAGAGAATGAGAAAAATAAACTGATGGGTGGGATCCATGAGCAAATAAGTTAAGATGACAATTGACTTCCCATAAAAGCCAATATTTTAAGATGGTAGGTAGGTCCCACAAAATTTTTTTGAAAAGTCTCTTAACCAATTAAAAAAAAACTGATAGATAGGCCCCAACATAAATCCACAATTAAGCAAAATATATTAGGCTGACAGGTAGGTTCAACAAAGATTCAAATTAAGCTAATATCGTCACGTGGACAAAAGGATATGGGATTTTATAGTAGTTAGTAGATGAGATGAATCCAAACCATTATTACGACCGGAGAGGAATTAACACGCTAGAACGAAGTCGCCCCAATTTTCCGTCTAGGGAGGGCAACTTGGGAGACGAAGCGACGCTAGAGACGAAAGTGGAATGAAGAGTTTCTGAAGGAATTAAATGGGAAGAAAATGAGAAAAATAAACTGAAGGATCGGTCCCATGGGCAAATAAGTTAAGATGACAGTTGACTTCCCACAAAAGCCAATGTTTTAAGATGATAGGTAGGTCCCACAAAATAAAATTTTGAAAAGTCTCTTTACCGATTAAAACAAAACTGACAGATGGTCCCCAACATAAATCCACAATTAAACAAAATATGTTGGGCTGACAAGCAGGTCCCATAAAGATTCAAATTAAAC
TAATATCGCTACATAGACAAAAGAACATAAGATTTCATAATAGTTAATAAATAACTCGCTAGCATTAATTTTTTGGTTTTTTTTTTGTTTTATTTTAGAATTATGTAAATGCATTTTAATTTACTCTCAATCAAACAAAGTTACATTTTGAATATTTTAAAAAACTTTATTTATTTTATAGCATGCGACAGGTGAATGTTCGCTTCCTCGATCTAAAAAGTATGAAACAAAAAATGTCAAATTTTTTTTTCACATGAATAATCGTTTATCTAGTCATCGGTGGGTTTAGTTTTAAGAAAAGAGGAATGCTTCAATACACCGGCTAAATTAAATCTAGCCGTTCATATTTGAGGGGCAAGATTGACTTTTGCATAATAGTTACCTGCTCAACAAGTTACCATTCGTAAGGGTACACTACAACAAAAATAGTCTATAGCTACACTTTTAAATATAGGTACATGTCAAAAAAGTGCTGTTAGCTAAAATTACCGACACTTTTAAAAAGTGTTGCTATACGTGGGGTCGCTAGATATATAGTGACAGTTAAAGAGTGTCGCTATAACCTAAAAGAGTGCTGCTAATTTACCAACACTTATTTGTTGGATTGGGCTTTATATTTAGGCATTAATAGATGTTTTTTTAAGTTTTAGCAAAAATGGGACACTTACTCAAAAGTGTCCCAAATATGTGTCCCTATAACCTAATTCTGTTGTAGTGGTAATATGGGAAAACAAATACAAGCTAATTACCAAATTTGATTAACCCTATACA\n>URS0002381478 lncRNA from 1 species \nACTTACATAGCACTCGTACAATCGACTTGACAAGCAACAGAAAAGTACCCAATTAGTGTAGAATCAAGTATCAAAGCAAACAAAAAGGTAAAAATATAAAAAGAAAAACAAAGGAAATAAAGAACAAGGAAAGAACAAAAAGAAAAGAAAAGAAATGATAGAATTAGTTAGAAGGATTTAAATTAACTACCAACCAGCCTCCCGACGTTTAACAAAAATATTTCTCTATCGCATATAATGGGTTTTGAACTTGGAACCAAATAGAATACAAATATATGCTTAACCAGTGAACCAACAGGTTCATTCTTAACATAAATTTACACAGAATTGCACTTAACTATATAACACGGATAGGGGTTTTTTTTAAAAACAAAAAACAAAACTTCTAACAATGCGACTCGAACTCCCAATTTTTAACACAATAGAAGAACACAGAATCACAGATACAAAATTTTAATTACTGCAGATTCTCACAATTAAATTCTCAAATTTTTAGGGCGTTACACCACCACCCTAAGCTCTCAACAATGGACCTGTTGACTCTCATCCAGCACTCAACTGTATGATTATTCAATCACAAAGCAATATTTATAAACCAAGAAAAATTAGTCATTTTAATACTACTCTTTTCCAATTACTTTAAGGCACAATGTGTGTTTTTCCGTAATAAAACACATTTCCATAGAAAATTATGTCTCTTTATCTTGATACTTTTCCATAAAATTTATTATTTATATTATTTATATTATGTATCTCTTTGTAATGTGGGAACACTAACATTGGAAACTATTAATAGATTTTATTAACAAATTGAAGCACCAACTGAAGTTGTAAATGATTCAATCATTAAGTCAAAAGAGATGGTCAATAGAAAGAAAATGGTAATGATTAAAATAAAATAAAAGAGTTTATATATCATTAAAATAATTATTAAGTATATTTAAAATTATCATTATAAATATTTATATATGTGGAGTGTTTCTTGCATTTTTTGTTCAAATTAGAGTCAAAGTAGAGGCGACGTTGCAATGAGGAATCACGCGACGTCGCAACGAATCGACGACATTCGAAACAGAGGCAATGTCGTGACGATACGACGAGTTCCAAACTTAAAGTAGTTACGTATTAGACTATCAACAAGGTTACTTTTCCTAGTTAAACTCTGATTACATTAGAGATATTATAGTC
ATATTAGAACTCTAATCTTAGCCTATTTAAAGGGCAATAACAATCCTAAAATCGGAAGAACATAACACAGCATTAGAGAGAAAATCAAGAGAGAGTTTTAGAGAGCTTTAAGGGAATTTTGTGTTTTTAGCCACTGAGAGCTTTGTATTATGGGTTAAGGTTTGTTTTGAATTTCTCCATCTTGAATTCTTTGTTTGTTTGCTCATTAGTGAAGTCTCCTTTGCCTATGGTTTTTTATTCTCTTGATTGGAGGGATTTTTCCACGTAAATTTGTGTGCCTAGTTTTCTCTATTCCTTCTTTCTCGTTGTTTATACGGGTTGATCCCCAACAATATTTAGTATTTTATTATTTTATGTATTTTTATAATTTTTCATTGAAAAAAATATAAATGTTTTAAGTTTTTTTTTTCAATTTTTGAATTTTTTAGAATTAAGATTAAATTGTTAGAATGTGTAAATATTAATACCTAAACTTGTTAAGTTTTTAGAATTAGGATCAAATTGATAGAATGTGTAAACATTGGAGAGATAAATTCATTATTATGCCAATAAAAAATCACATCAAACTTCCCTTAACTATTTAAAGACAGAGTGACAAAAAAATCAAACTTAAAAAATGTTAGTGACTAAATTAAAAAATTTTATAGTTGACATTTTCTTTATTTCTATTCATATTCATTTTACAATACATATAGGATTGTGGGTACCTCCCAACAATGTTGTTTTCAATGTTTAAACTTGTGTTCTTCTCTTATGAATACAATATGTCTTACCACTCCACCAAAAACATGTATATAATAGTAATAAACTTTTTTTTCTCTCCATGCGATGCACGAGTTGCTTGTGTGTATTAATTAAAATATATGTAAAAAATAGAATGTCAGTAATGACAATATATCACAAAGAAAAGAGAAATAAAAATAAAGAACACACCAATTTTTACGTGGAAACCCTTTTGGGAAAAAACTACAGGTAGAGGAGAAAAAAATTCACTATGTCGAATTCGAATGATTACAAGAGGAGTAAACTATGTCTATTTATAGGCTTTGTAAAACCATATTCTAATAGGAGTGTAGTAAGATTGAAACACCTTATTCTAATCAATATCAAATAGATAGAGTTTAATAAGGTTTAAAAAACCTTATTCTAAAATAAAATAAAAGAAGTATAATTCTATAGGGATTTTACTTTTATTTTATTTTACCACTGTATTCTATTTAAATAAGGATTCGGGTCACTTAATTCTAACAATATATTATATTAAATTTTAAAATTTATACATAACATATTATAAATATTATTATTAAAAATTAAAAATAATATAAATATTTAATTTTGTAATGATGATAATTTAAAATATAATCAATATAATTAAAAAAAAATTTAATAAAATAAAATAGTTAATATTACTCTCAATTATGATTTCCGCATTACTTAAAAAAAATGCACAACTAATGGAAATATTTGAGTACAAAAATCTGAATATTAGGATAATGAAATTGTTTAGCAAAAGTCAACAATGATTAAGCATTGACACCCATAAACTTAAAGCATAATGAATGGGGTGTTTAAATTTAATTTTTTTAACATTTACTTGTGGAAAAAAGTATTAACCAATTAGGTAAATATTCAATTTTCAGCGTATTTATTTATTTAATGTAATGCTTTGTAATTTTTTTACTACAAACCATAGTCATAGGGAATACTAACATATTCTTATTCAAATGAAAATTTAATGCTTCATTAAGATAATTTTAAGCATTTAAATGTTAAATTAAATTATTATTCAGTTTACAACTTTTAACAATACGTACACATTAATGTGATAAATGTCATGTTTTAAATATGCTACATTGAATTAGCTGCTTAAATTGTAATTGTATATATATGATGTCATCTCCTACCGACTTAAGAAAAACTCTCAAATCCAAAATAAATTGAAATCTAAATCTAAATACAAATATGCTGAAACCTGCTTGTTTGCACTTTAATGGATCTTA
TAAACTAGTTGTGGGCCTGTATGTATCAAACCTCCTTATCCAAATGCAAAATAAACCCTAATTCATTTAGAAATAAGTACAGAGAGATCTGGTTATAAGCTTCTTAAGATGGAGGACGCCACATATGCCCCAGAAAAAAGTCCAAAGGCATCGCTTGGTACTTGGTACTCCCATTTCATTCTTTTGGTGGTTTGTTTCACTGAGTTTAATCTTAAATGGTTCCTTATTCACTGTTAATTTCGAATCGTCTATTTGGTTTCAACAATCAGTGATTGGCCGTGATGACACAAAGGCCGGACTTACGGCTGCTACTGCTCTTCCCTTGTGTGGTAGTAGTATGATGTTTGTTGTGATAAGGTGTTTGTGCTGAGCCACTTTTCTCTCTACGCTTTCTCTATTTTACTTGAGATATTTATACTGTGGATTTCTAGTTTGAATACAATTTTTTTGGTTATAGTAAACATGGGTTTGTTTTTGGTGAGCCTGCCCTGAATTTGTGTGGGATTCCCTTTGTAGTTCTAGGAATTAGTTTACCGATTCTACAACTGACCCTTGAAGAATTAAGTATTCCTTCATTTTCCTCATCTTATGCAGCTGATCAGCAATGATTCCTTTTAGGCTTGTTCTCTTCTGAACTTCAAATTACATCCTTTATAAGAGATTTGGTCAAGCTATTGTGTAGGGTTTGTAAGATTTTGCATTTTATTGGCTTTTGCATTGCATCATTGACACATGGTTCCATGTAAATTCTGATATTTCAACTTCTAACAAAGCATTTTTGGCTGTGCCTCAATGCTATGTATGGAACACTACTGGTGTTGTTTTGCCTGCTTTTTTGTTTTTACGAATTATGTTTAAAAGCCTTGTTTTGCTCTCAGTCCAGGATCAGCAGTTAGACATTTAGATCACATCGATGAATGTAGGTCTTGATAGTTGTTGATTCTTTACATGCATAGAAGCTAAAGAAAAAAGTTCCAATTGAATTGCCATGTATCTTTGTCACAAAGACATGATTTTTCCTACATTTGTAGAGTGTATGAGTTGCAATTAACTACTATCATAAGGGCAAACCATGCAACTATTACCTGCAAAAGAAAATGTAAGAGCATTTGAAGTGATGACTGCATTCTATAGCTGAGAATGCAACAAGGCCATAAGAAACAGTTTGTTCAACTTGATAAACATCATAACTTCTCTTGTTCCTATGTGATGATTGTCTGTGGAAGATTAGACCTTTAGAGTTGGCAATACTTAGAAGGTTATTGTTCCATTTAATATTACTCTCAAAGTTAGGCACCTCTGTTGATTTCAATCCTTCATGAAGTTTAACGGACGATCCGAATATCCCTCAAGTCCTGGATCTTCAGAAAAGGACCGACCAAAGTCTCCATGCATTAGAATTGATATGGATATCAAAGAGGGTCAAACAATAACTAGATGTTAACTTTGCAAGCAACCTGGTCTTGTTGGAAAAGAATACACCGAAATGTTCTGCAATTTAATGCACAAAGGTAAATTTTATTTTAATGCTTAAGCCATGATCATTTTAGTTATTTTATATTCTCTGGTCTTATATGTCAATATGCATAATTTTTGTTAAACGAAAAATATGTACAATGCCAAAAAAAAAAAAAGATTATTAGATGTATTTTTTCGCTATTCATAATTCTTCTTTTCGTTCATTTATCAATTGGCTTACAAGTTATCCTACAAAATTAGCTGGGGTGGTTATTTTTTCTGGTTCCAGAAAAATTCAAGATTATCCTTTGAATAGATTTATTTTTATTTTTTATTATCTTATATCAACCTGTTTATATAAAATGTAAACTGACAAGAATTGTTATTGTTTTATTTTGGGATAATGTCACTTTTGATACTTGTACTTTCACAAAATATTTAATGTGATATTTGTACTTTTAAAGATGTATATGTGGTACTTAAACTCAATATATGTTTTATTATAATACTTGTCCTTTCGTAAAATGTCCAATGTGTTACAT
GTACTTTGAAGATGTCTAATGTGGTACATTAATTATCAATATATGTTTCATTATGGTACTTATTAACAACGATAGTAAATTGCTAAATTAACCAATAAAAATGTGACACAATCTTTTTTCCAAATCATAAAGACTACATGAATAATTTAACATTATGCAAAAAATTAAATAAAAAAATTAAAATTAAAAAACAAGTAACCATATGGTTGATAAAGAAATAAGTAAATAGTAAACTTACAGAAAAGTACATGTATTTTCATGGTAAAAAAAATCATTTCAAAAAGGAAAATTTTATATAGAAGATGATGTTTTTGTTTATGTAAGTTTAATGTTTATTTCCTTTTTATTAATTGTATGATTAGTTATTTGTTTTTTTAATTTAATTTGATGTGTTTTCTTTATTTACTTTCTCACATAATGTTATATTATCTGTTTGGACTTGATGATTTGATAAAAAAATTACGTGTTGAATTTTCATTGGTTGGTTTAGAAATTTTCTAACAGTGCTATTAGTAGGTACCATAATAAAACACATTTATAATTTGAGTACCACATTGAACATTTTATGAAGGTACAAGTATCATAAAAAAATACTTATTAATAGTTTAGGTATCATATTGAATTTTTCAAAGTATAGATACTATATTTTTGAAAGTATAAGTACCAAATGTAGCATTATTCTTTTTATTTTTTATTTATAAAAAGCTTACACCACACGGATTTGTTTGTCTTGGTACATTTTCAACTATCTAAAATATTATTTTCGATAGTCTTTTTTTTTTCTCCGACATCAAACTATTTTTTTTTGTGACTTCGAAGATAAAAAACAAACACAAATTACAAATACTAGCCCAATTCCCCAAGTGGAGATACTTCAAAAATTCACAACTCATGGCTTTCCCTATGTACCAGCTTGACCAGTCTGTCAGTCTCCTGATTGTCTTCTCTAGAAATATGTGAAACACTCCAATGATTAAACTGTGTCAGCAATTGAAAAATCCTCTTTATCAAGGTCGAGTTAAATCCTTCTGTCAGACTCTTTTGAATAATCTTAATTGCTTCAAGACTATCAGTATGAATAATCATGTGATCATAACCCCGATCAATTAAAGTACCTAAATCATCCAAGATTCTCCATAGCTCAGCCTCAAACACTGAGCAGCTCTCCAAGAATCTATTGAAGCTAAAAATTCACTCCCCATTTCGGTTTCTCACAATTCCCCCTGCAGCAGCAGAACCACTTTCATATATGATAAAGCCGTCATTATACAAACACGCCTAGTTCCCAACCAAATGTATAGAAGAAGTCAGAATTTGAGTCGAATAATTTAAAGTCATACCAGATGAGGCAAAATGTTTGGCCCAACAATGAGAAACTTTGATGGACTCAACATTACTCCAAGAAACATCTTGGAATATGAAGATATTACGATTCTTCTATATACACCAAATAATAATCCCAAAAAAGCATTGCCAAATTATGATGATTTTGTAAGTTTGAGGTGAGCCAGTCCTACAGATTGTTAGAATAAAATGTCTTGTCAATCAATGGGAATTAATAGATTCTAAATGTTACACACTGCATTACAGTCCCTGATAGCATGCAGTACATCTTCTGAGATATGTCCACAAACCCTACACAATGAACTGTGCTCGAGACCTCGACGAACCCTTTCCACATTTCTCATCAGCCTCTACTTGAACGCAAGCCAAATGAAGAATCTAACCTTCTGGGGTCCTTGAAACTTAAAAGGAAAAGTGCTACACATCCTACTTTGGTTTCCAAGATGATTCCCAAAGTTTACCATATGCTTTTAACAGAAAAGGAGCCTGTCGAGGTACTTTCCCATATAATTCTATCAGTACCTACTGCCAAATGCGATGGGGGAATCCCTATAATCTTACAAATTATCATCTTAGGCAACCAAAGTTGAAACAAATCTAGATTCCAAGTGCCATTACCAAGAACCATATCACTCAAAACATAGTCCAAATCAAGG
TTCATGTGACTAGGAATCATTCAAACAAGAGGCCCCACACCTAGTACCCACGAATCCTGCCAGCATCTGACACTTTTCCCATCTCTCACTAACCAAAGCAGATTCTCCAAGTAAGTGGCCAAACCTTTATAAGGGCTCTCCACAAAAACAATCATCTGTTGCGCGATAATGAGTCGGGCAAACTTTTGCAACCTCATATTTAGCTCGGAGAATCTAGACCCAAAGAGTTTTAGAATCTGTCACAAGTTTGTACCTTAAATTCATTATAAAAGACGTGTTAGAATCTTGAAGCTTCCGAAAACCAAGACCTCCATGATCTTTAGGCTGATAGATATCTTCCTAGCTAATCAAAGCCATTTTCTTGCCACTACTCGAAGATCCCCAATCAAATTGATACACCATATGTTCAACTTCCTCACACAAACCTTTGGGTATCATCATTGACCGCATAAAGTAACTAGGGATCACCAGTAAGACTGATTGAGCCAGAGTAGCCTTACTAGCTAGAGATAACGAGCTTGCATCCCAACATCACAATTTGCTCTGAACCTTGTCAACAACAAACCACAAAGTGTTATTTGTTACTTTTTCATGGAACAAGGGCACATCCAAATATTTCCCAAGATTTTGGACTTTTCGAAAGCCAAGAAGATTGCAAAATCTATCCCCCATATCCTCACACCATCTGAAAAAAAAATATTAGTTTTATTAGCATTAATCTTATGTCCAGAAAAAACATAAAAACTATCTAGGATTCTCTTCAGGACTGTGGCTTGATCCTCTTCTGCTTGGCCAAACAAAATCAGACCATCTGCAAAAAAATAGGTGAGACAGGGGAGGACCTGATTGAGCCAAGTGAATAGGCATTCAACACCTAGAATTGACACTCGAATGTATATTGTGGTCGAGCCATTCCATACATAGAATGAACAGGTACGGTGAAAGTGGACACCCTTGACGTACCCCTTAGTTGGACGGGACTTCTGTGTTGTTGTGTCATTCCACAAAATTTGCATGGTGGAAGTTTTGATAGCTAACATAATAACATTAATTAAAAAATTTGGAATACCTGCAGCTTGGAGAGATGCTTCAATAAACTCTCATCGCACACGATCATAGGCATTCTCAAGATTAATCTTAACTGCAAACCAGTTAATAGACTTTTTCTTAATCCTTATAGAGTGAAACACTTCCTGAGTAATAATAATATTATTTGTAGTGCTCCTTCCTGTAATAAAACCAATCTACTCTTGGCTGATAATTTTTGAAAAAACCAACTTAAACGGATTGACAATGATCTTCATCACCAACTTATAGAGAACCGAGCACAAACTGATAGGTCAAAACTGAGAAAAACATTTTGGAGTTTGAAACCTTTGGAATGAGAACAATTAAAGTATTGTTGAGCTGCGGGTCCATTTTTCCCCTAGCAAAGATATTTTTGATCCATGCACAATGTAACACCCCGAAAGTTGCTACAGTAAGAAAGTGAGATATTATCTTTGATATAGTAAAATAAGAAAATAAAATGAAAAAAAAGGGAAAAGTTTGAGTTAGGTAAACAAAATCTGTTTAGGAAGTATATTATGATGTATTAATTCAAGAAAAGACTAAATAGCAAAAGTGAGAAAAGTTTTGTGACCTAAGAGTAAATACTCAAAATTTGATGGGTTAAAGTGTAAATTTGAAAAAGTTGAAGGACCAATAGTGCAAATATTTTAAGGGTAGAAGGATCTAGAAAATAGGGAAAATGGATGAATTAGGACCAAATTGAATAAGTGGAAAAAATATAAGGGGTTAAATTGCAATTTTACTAGAATGAGTAATGACTCAATGGAGGAATTTTGAAAGATCATAAAGGGCAAAATAGTTATCTAGCAAGAAAGATATTTGAAGAGTAATGATGATGTTGGTGATATTTTAGATTAAATAAATAAATATTAGTTTATTAATATTTTGATTTGACATTTAATTATATTTAATTATTATATTTAGTATAT
AAGGAAAGAAAGATGAAGAATTCTCTTCATCTTTCCATGGTTCCAACGTGAGAAGAAGAAAAGAAAGAAAGAAAATTTTTCTTTCCTTTACAATTTGGTCATTTCACCAAAAATCCTCCATTTTCATTTTGAAATCAAAAGAATTTCTATAGCCACCAAGAGAGAAAAATAATAAGGAGACTATGGGGAGCTAGAATATCAATTTAGATTCGAGAAAATAGAAGTTGGAGGAGAGAGAAAGTTAAGTTAAAGTTTGGTTTCATTAAGTTGATGTGAAAAAAGAGATAGTGGAATTAATTATGTGAATTAAGTGAGATGTCAAAGAAAAATTATGTAATAATGAATAGAGAACTTTTATGAAAAAAGGTGATTAAATTGGAAAGTTATAAAAGTTTACAAGAAAATATTGATAATAATGCACATAGTGAAAAATAAAAGAATATATGAATATTGTAATCCAAACTAAAATTATTTCCTAAGTTGTGGAAATTAATGGTTAAATCGTAAATTTGAGAAAATTTATATTAGAAATAGAAAAGTGAAGTGCATAACAATTAGAATGAGAAAAATTGATGTTGTAGTGAATTTTGGAATATTAATAAGTATTGAATTATGTTATATGTGTTATTAAAAGTAAATATATTGTTATACGAAATATTGTGCTAATAACTAAATTACAAAATATTAAAAGTGATATGTGAAATACATGATAAGGATTATGAGAGAATTATGGATGAATATTGAATTTAGTAATATATTACATGTATTAAAGATAGTGAAGATATAAGTATATGGATTATTGTTATAAGGATTAAATTGTAAAGTATGTAAAAGCATTATGCGAAAAGTGTAAAAGTGATATGTGTGTATGATATAAATTGCCCAAGTAGACGAGATTAGAACTACTAGGATATTAGTGGCATGCCATTAAGGGACCCTAGCGCGCTCTTCGATTATTAGTACGTCAGTGTTATCTGATTAGCACATTTGTGCTCTTTGTATAGCACTTTAGTGCTCTCTGTTCAATAGTGCATAATAATGCACCTCTGTATCAGTTTCATATATATTAAGTGTTCTGTTTAGTCTACTGGGCCTTTGCTAAAAAGGTAAACAATTTTCGTTACAAGGTAAAGGTTTATCTTTGATTCATGTTTGAAATAATGAATTAAAATAAATTGTGAAAGAAATAGTGAGAAAATCATGAAAAATTACACTAAATGGTGAAATATGATACATGTATAAAAAGAGTAGTAATTTTTATAAGTTTATTTGAGGACTTAAGGACTAAATTGTGAAATATGTAAAAAGTTACAAATGAATATGATAAATAAACAAAGAAACGAGATATTGGAAATTAAGAAATTTAATAGAGTTTAAATATCATGGGTACTTACTAAGTCTTCACTGACTTAATGCGTTTATTTTCAACGCGTAGGTACAGTGCTTTTGAAGAGTTGTAATTGAGGTCATGGACATCCATCTCATCACATCTCCAAGTATCAAGAGGGTATGTTTCAAAATTTTGAATAGAATGACATGTACTTAGGAAGATCAAGCGTGTTCCAAGTAGTAGGGACTAAAATATAAGTTATGAAAACTTTATTTTTTTTAATGTTCAAACATATTAGTGATTAGCCAAAATCACTTTGGCACCAAATGTAATATTCCTATATCAAGTTCCTTTGGGTCAAACCGGGTATAGGGGTGTTACACATAAATCGAGCCCCCAATATGATCTCACTGACTCTGGAAGAAGAGAGCTTGATATCCATCACTTTCTAGAGCCTTTAGAGGGTCCCATATCAAACAAAGTGGTCTTTATTTCCTCATCAGTGATGGGCTTCAAAAATTGGGTCTCGCCATCCTGAAGTTGCGAGAAAGAACTAGTAGGAAGTCCCTTCATCGGTCCTGGGTCTTTACCATATAAATTGTTAAAAAATCAAATCGCCTCATGCCGCAAGTTTTTATCATAAAAAATCCACTCTCTTTTATTATTTTTC
AGAGCCACAATTTGACTTTTCTTTCTTCTTCTAATAGTATGGCTACAAAAAAATTTTGTATTTCGGTCCCCCAAAGAGAGCCAATCACATCTCGTCTTCTGTTTCTAGAGAAGTTCTTCGTGATACAAGACCTGTTCCAGTTCCTCCCTAACTTCCAAATCCAACTGAAATAGAGAATCCGACTAAGAATAATCCAAATTATGCTGAATAGAATGAAATTTATGAAGCAACCTTTTTTACGAGACCCAATGTGACCATAAACCTGTTTGTTCCACTCTTTTATTTGACTTGTAAAGTTAGCCACTATATTTGACATTGAGCCATGAAAATTCCAACTCTTCTATACAAAGTCAGTAAACTCTGAATGTTCAACTCATCCTGCTAGAAACTGAAAAGGACATCCCATAATAGAATTAAGCCTAGGATGAAGTGATAAAAACAAAGGCCTGTGGTCAGACTTGAGTCTAGGGAGGTGAGTCACATAACAATTTGGAAAAGACACAAGCCACACACCATTCTTGATAAATCTGTCTAACTACTCATAGACTCTACCTTTATACCACGTGAAAGGAGCCCCTCTGAATCCAAAATCATGAACCCCAGTCGTATCCATAAAATCCCCAAAGTAAGAACATCTTTTCCCACTAACTCGCCCACCTTTCTTTTCGCTAGAGGCTTAAAGCGTGTTAAAATCTCTAACTACCACCCAAGGAGAACCATTACTTGGAAAAGTCGCATTTAGAGCGTCCCAAAGCCGTTTTCGTTTACAACTATTAGAATTATAGTAAACAAAAATAACAAAATGGGATGCTGGGAAGAACTATCGAAAACACGAGTTAAAATAAATTTAGGATGGCTTCGAAGAATTTCGACTTGAAGTGACTTCTTCTATCCAATCCAAATACCTTTAGAGAAACTGATTGCTTCTACCTGGTGAGAACATTGAAAACCAAGATTAAGGATAACCGAGTCAACTTTTCCACCACTAACTCTTATTTCTAACAGACGCACAATATCTGGTTTATATTCTCGATTATATTCATGAAAAATTTGCAAAAACTTGCTACTAGCACACATTTGAAAATTCCAAGAAAAATAGAAATAGTCAAATAATAATAAAAAATAAAGAAGGTAAAAAGTAACTATAAATACTAATTAACAACCTCTTTCACAATTTTTTCCATCATGGTTCAAACTTCCCTTCTCAACCTCTTTCTTGATCTACGAGCTTATGAGTTTGGCCATAGAATTCATGGAGTTTAATAGCGGAACCCTCGCATTACCTGAGTTTTTAAATCATTCCCCACGGTCCCAAACGATTTTGCTAATAGCGTCGCCACTTCAGATAGAACCACTTTTAGCCCCTGAACCCTTCCTTTTGAAATCATTATTCCTTTACCTCTTCCAAAAGAATCAACACCTTCATTTGAACTGATATTTTTAGGTAGCTCATTATCCTTGAAAATAATAACTAAATGTCTCATAGGGTCAAGGACCTCGCTATTGAGTTTCACCATTGACTCAATAGGATCGTTGAAGGTAGGGTTAAAATGGGAATTCACACCCATCATGATTAGATCATCCATAATATGCGAAGCCCCCAAAACTTGATTTTACTTCATACCGTCTTCTTTCAAAGGCAAAACAATATCCAATTTATTCCCATTTCCAAGCTCACATTGACCAGTCTCTGTTAAAATTGGGTCTCCGCTTATTGCATTTTCTATAACCCCCGAATCTGTGTCAATACAAGGTGGACCATTTTGTATACTCGTATTTGCTCCAAGCCCAACCTCTATTAGAGTATCAGTCTCAGGGTGAGTTTGGATGGGTGGTACGTTTACCTGCGGTTAGTGTAAAAACAACGGTGGCGGTGAGATTAGATACTATAGCGATACTGTAGTGTGAGACAAAAAGTAAGCTAAACGCACCACACCGCACCCAATCACCCATCCAAACCCACCAGCATCTATGGCCCAAAAGCCTCTATCGTCTCCACC
ACCTTATATTTTTCCAATGAGACTTCCACTGCCGAGACTCTATCCACCTCTGTAATGTTCGTTGAGCCGGAGCTAGGACAAAGATTCTGCATGTGTCCAAACCTGCCATAATAGAAGCACACTAACGGGAGCGATTCGAATTCAACCCTCTGAACCACTTTCTTAACCAGGATCTGTGAGATCAGAAGTTTTCCCAGATCGATGAACACTGCCATTTGGGTAAATTTGCCTCTCGAGCCCTTGTCCATCTGAAAGTCGAGTTTCGTGACTTTACCTATCAGACTCCCTATCTATTGCAAAACACACTATTTGTAAAGGTCACTTGGCAGACCAAGCAACCAGACCCAGACCATAGTGCTACTGGGAAAGTCTTGAAGGGGATTAAACTTTGGGGGTCCACGATTGAACAGTGAGGTACTGTCTGATCACGATCCACGACCCTTGGGGGAGAACTTTCTTGTAGTCCTCTCGGCTTTGAAATCTAGCTAGGAAATATCCATTTTCAACATCCATGAGATGGAACTATTGTGAGGGTTTTCAGAGGTTGTGAATCCTATTTTGTAGGAGGGTGTAGGATAAGTTCCGACCTAATAGTTTAACCACCACTGTGGTCGTCATATCTCTAACGACAATTTGTTGGATCCTTTCGGAGAAATTGATTGCTGGAATTCCATTGACATTAGTCCTCATGATATCTCATTCTATAAAGTCAAAGTCCTCATCGCAACCAGATCCAGAAATCCCTCGTCCCAGAACTTTGTCTATCCAAGACATTCCCGATGTTGGTGTTGAATCTACGGCCATATCGCTATTCGAATTTGAATCCAAGTCCTTAAAACGAACTTTTTTGGTGTTCCGATCAATCGAGTTGTCACCTCCGCCATCCTCAGTCATCTATATCAGTTGATTTTATTTTCTCTTATCAGTGCTTTGATTAAATGATAACGATGTTCACATCAACATATATTTTAATGTTTTAGTAGGTACCTAAAAAAGCATAAAGTTAGTTTATGTTTTCCAAGTTTTTTTTCTTTTCTTTTTTAAGTATATATAATTCAACACAATTCAAATTTATTTTCATTCATATTTATATATTTGATAAAAGCATCTTTATTATAACTAAATGACCATAAAATCAATGGGAAAGACCTTGCTTATGCTTGTTATTAGTGCACCCCTCGATCATGACCTTGATTACCTTAGCACAATTGGGTTCGACCACCACCTATCATAATTTATCTCCCTTAACCACGCCATAACTTCTGCAAGATCAGGTGCCAAGCTTCCTAAATTGTGCCCAGTACAACATTTCACCAGAATGTTGATTGCGTCCCTGTTACGCGCCATCCACCCCGCTGCATTTTCATTCTCCAAAGTGATTGCATCAACATTACATTTGGTCCAACAACTAATTTACCTTTTAAATCACCCAACTTATCATTTAGTTTCACATAGATCATAAATCTTTAATTTAATAATATCACATCATTTGACTTTTAATACTGGCAAACTGTTGAGAAGCATCAAACGGTTGAATTCATTTCACAATAAGCTTATGTTAGAATTAAGTGACCCAAATCCTTATTTAAATAAAATACTGTGGTAAAATAAAATAAAAGTAAAATCCCAATAGAATTATACTTCTTTTATTTTATTTTAGAATAAGGTTTCTAAACCTTATTAAACTCCATCTATTTGATATTATTTGAATAAGGAGTTTCACTCCTATTAGAATAAGGTTTACAAGCCTATAAATAGGCATAGTCTACTCCTCTTGTAATTAAGTTTTTTCGACATAGTGAATTTTCTTCTCCTCTGCCCGTGGTTTTTTCCCGAAAGGGTTTCCACGTAAAATTTGTGTGTTCTTTATTTTTCTATTTCTATTTTTCTTTGCGATATATTGTCATTACCGACATTATATTTTTCTCAAATTGGTATCAGAGCTTCCGGGTTGTTCATCTCAATCACGGTAATGACATTTTTAACCTCCTAACTATATT
TAACAACTAACCAACTATATATAACTAACATCACTACATTCCCCCTCAAGTTGTGCCCCCAATTTGGATAAAAGATATTTATGTTGTTGAATTCCCAGACCTTTTGATAATATGTCAACTAGTTGTTCCTTTGTTGTGACATGTTTGGGCTAAATGGAGATTTTCTCATATAAAGTGAAAATAAATTTCTATATGTTTAGTTCGCTCGTGAAAGATATGTTGGATAATTTGAGTTGAGATGATAGATCTGGAGACAATATAAAATTAAAACAGTAGACTTCGAGGCACGAGTGACGCTTTCCAAATAGAACAATTTGCCCCCACACAATTTCTAGAGGGTTAAGAAAAGGTCTTTTCGGGACATAATGAAGACTTTTTATTTCTTTTGGTTAGCAAAATCGAGGAATTCCCTAACTCTTACTCTAATTTCTAAATTTGGATTGATTGTAATAATAATGTTTTGAGCTCCATAGTCCCTCTATTTATACGCACTAAATGGAAACTATTAAAGAGCCACAACCATTCATATTGGACATACTTTTTAGAAGAAACATATCCCATGGAAATAAAATGTATCCATTGGACGAATGAATCATCACTTTTTAATCCAAATAAGTGCTCATGAATCACACCAAGTGATCCATTAATAATATTTAATGAATTTGAAATCTACAATTTCCAACAATCCCCCACTAGATTGCTAATTCCAGAAAATAAGTACACAACGATCATGCATAAAGAAGGGTGTCCACAGATTGAACCTTCCTTTAGTGCAAACTCTTAAAGTATCAACAAAGATAATGATGGCTAGTCACTTGAAGCATCACTCGTCAATACCGAAAAAATTACACACATAACCATAAAGTATTAGAGTAAGAATTTATTTGCTTTAGCACTGTTATGCTCATGTGGTCATCCCGTTTCATGAACATGTACGAGAGAAAACCATAAAGAAAACTCTCGTTGAAGTAACACCACTTCATGTCCATGTAGGTGGATTTCATGACAATAAATGTCCATCCATTAAGAGTAAAACTCATCCTCTTAAAACATAAACACTAAATCCTGATTCTTAGTGCACGTTGTCATTCGATAACTTGTTATTACCCTTTGAACCTCGAAACTAACTTTTGGCTAGAAGAAAGTAGGGTTTCCATTATCAATGACGCGATTAGAATGATTTTAATCCTATCTTAGTGGTGGTACTCTTAACCAAATCCCTCGACAAACCTTTTGTTAATGGATCCACTAAATTGCCCATTGACTTAACATAGGTAATAGTTATCACACCGTCCCTAACCAGTTGTTTCACATACTCATGTCTCAAACTTATATGTCTAGACTTTCCATTATACACCTTATTGTACGCTCGAGACATGGTGGATTCACTATTACAATGTACGAAAATAGCAAACCTACGTTGTGGCCATAACTTTAGATCTAGCAAGAGATCTCTTAGCCATTTCGCTTTATTGCCAATATCCGCCAACACTATAAATTCAGCCTCCATAATTGAATGTGAGATGCAAGTTTGTTTTTTGGAGGCCCAACTAATGACTCCACCTGTGATTGTAAAAATCCATCTCGATGTGGACTTATTGTCACTTAAACTTGTAATCCAACTTGCATCCGAGTAACCTTCTAGTATCACGAGATAATCACTATAGAATAATCCCAAATTTTTTGTTTTCTTAAGATAGTAAAAAATCCTACTAATTCCTTTCCAATGATTGATACTAGGAAAACTTGTAAATCTCGCCAATTTGCACACAATAAATGTTATATCGGGTTTAGTGCAATGTATTGCATACATTAGACTTCCCATTGCGCTGGCATACTCAAGTTGCACTATAGCCTTGCCATTATTCTCATTTAACTTGAAGTTCAAATTGAATGGAGTTTTCGAATCCTTAATATTCAAGTGTTTGAACTTCTCCAATAATTTCTCGATGTATTGAGATTGCTTTTGTACAAAGCCTCTTTCATGCTTTTGCACCTTT
ATACCTAGAATTGTATCTACCTCGTTGAGATCCTTCATCTTAAAATTCGAGGCTAGATACTCTTTGGTCTCACGAATGCCTTCCAAGTTCATCCCAAAAATCAACAAATCGTCTACATAGAGAAAAATAATTACACTGTACATATCGCTGAATTTAGTGTAAATACATTTATTCGCACCATTATGTAAAAAACCATATGACAAGATAATCGAGTCAAATTTCTCATGCCACTTTTAGGTGCTTGTTTTAAACCATATAATGACTTGATCAACTTACACACCTTATGTTTATTCCCAGGAAGCGCAAAGCCTTCTGGTTGCTCTATGTAGACTTCATCTTCGAGATTACCATTCAAAAAAGCTGTCTTAACATCCATTTGATATACATGTAACTTATGGATAGATGCAAGTGCCATGAGAATTCGAATGAAGGTCATTGTAGCCACCAGTGCATAGGTGTCAAAATAATCTAGGCATTCCTTTTACCTGAATCCTTTTGCCACCAATCTAACCTTAAAGGTTGGAGAACCCCTGATTGGATTATTCTTGTAAACACTCATTTACACCTGATAGACTTTGATCATTGAGGAAGATAAACTAGGATCCAAGTATTGTTGGACAATATTGAATCCATTTCATCATTGATCACCTCTTTCCAAAATTCTGCATCCTTAGAAGTCATGGCTTCACCATAGGATTATGGATCACCATCCACATTAAACATTATGAGGATCTTTCTAGTTATGGATTCTCCATTTCCCTCAATGAGGAATGCTAGATATTGCGAGAAAATGAAATCGATACCAAAGTCCTTTACTTTTCTCACTCCTTGACGTTTCCTCAACTTCGTATCATTATTGTCACAAAGACATCTCTTGGTTTGATCACTTGAGATCATTGGTTGATATTCTTTTCCGAATCTGGTGAATCATCGAAAACTTTATTTTTAATGAATACAACATCTCTTATTTCAGTTATCGTATTTGACACTAAGTCAAGAACATTATAAGCCTTAGAGTGTTGGGCATATCCAAATAATGCACCTTTGATGGCTTTTGGTCCTAACTTTTTTCTTCGTTGGTTGAGAACTCTATAGTAAGCCAAACACCCCTACACTTTGAAATAATCTAATTTTGGCATCTGACCCTTCTATAACTCATATGAAGATACTTAGAATTTTCTTGATGATATTCTGTTAAGATATAACATGCAGTCAATAATGCTTTACCCTATAGATTATATGGAAGTTTAACATTTAACAATATCAAGTTAACCATATCCATTAAAGTACGATTGTTTCTTTCTGCTAAACCATTTTGTTGCAGAGTATAAGGTGGGGAACACTCATGTACTACACCTTGTTCCTCACAAAATACATTAAAATCATTTGAAAAATATTCATCCCCTTTATCACTACGAAGCACTTTTATTTTCTTACTAAACAAATTCTTAACCTCATTTTAAAAATGTTTTAACATATCAAAAGCATCCCCTTTACTTCTCATGAGATACACATAAGTAAATATAGAGAAGTCATCTATAAAAGTGATAAAATATCATTTTCTATCTCTTGTTAGAGTTACATTTAATTCACAAACATCTGAATGAATTAAATCTAACACTTGTGAATTCCTTTCACATTTATTAGGAAACAGTTTCTTGGTAATTTTTGATTGAATATAAACATCACATTTATTTACAAACTCATCGTTACTTAGACTGATACAACCATTCTTTTGTATATATGGCAAAGTTTTAAAATTAAAATCTGCTAGACGTGCATGCCGCAAATGAAAAGATTCAACAATATGAGTAAAAGAATTGACTTTATTCATATCAATGCTCAACTTGAACATGCCTTCGTTACAATATTCTTTTCCCACATATATATCACCCTTAAGCAGGACTAACTTATCGGATTCCAAGATAACCTTGAACCCTTTATTACACAGAAGACTTGTGGACACTAAATTCTTTCTCGCATTGGAAACATGCAACAGA
TTGATCAAATTCAATTTCTTTCCAGATGTGAAGTTAAGTTCCATCGTCCCTTCATCGAGCACCTTAAAATTGATTAGTTGCCCATAAGCACTTCACGGTTTGCCATTAGTTCATAACTCTAGAATTTTTTCGGTCATTACACACATTGACAGTAGCTCCGGGGTTGAGCCACCAATTATAAGACATATCAGTCATGGCTATGTTGAGTTCGGTAATCATACCAATTTTCAAACTCTCGATCCCTTCTGTAACCATGGCCACTAAGTCCATGTCCTCCACCATACTAGCTTTGAAAGTTGTGACATCTTGCTTCTTTTTGAGAAGTTTACAATCCTTAATGTAGTGTCCTTTCTTATTGCAATTATAACAATTACAAGATTTTTTCTTCTTGTCTTGTATGTTCTTGGTTTTGAATGTGGCCTTTCACTTACTGTTTCGAGAGTTCTTGGACTTACTCACATAGTTCACTTTATAACTTTAGGGAAGATACACCCCATCACGCTTTTGATTTTCCTCTTCAATACATAAATGCCTAAGTATTTTCTCCACAGTGAAGTCCTCTTCCATAAGCAGAAGTTTATTTCGATAATTTTTCCAAGACAAGAGAACTTCAAGATGATAGCCCCGACTTGTAACAATTCTGAAATAAAAAATTTTAGGTCACGAAGCCTACTTACAAGGACTTGATCCATGTTTGGGATACTATCGAGCATTTTGAATTCGAAATACTTCATTATTAAAAATTTATCGGTAACTTGTTGCTCGGTGTTGTATTTCTCTTCAAGAGCTTTCCATATTTCCACCAACGATTGCATTCACATGTAGAGATCATACAATCAATTGAACAAGGTGTTAAGGATGGGTCCACAACATGTGAAATTGTCTTCCTCGTGCTTCTTCTTGAGTTTGTCCACTTTCGTAATTTCTTGAGGTTTGTATTAGGGGTAGGATCCTCTATGGATTGTAGGTTTGGGTCCAGAACTTACGCTACATTCAAGATGGTAAGAAGGAAAAACATCTTGTCCTTTTAGTGATTGAAGTTTGAGCATCAAATCGGTCAAGTTTCACAAACTCTTGGTTCATCACTTTGAATATGGTGGTAACCTGCATTGCCATCTCCTAAATTGTTCTATTTGATTGTTGGATAATTTGAGTGGAGACGATAGATCTAGAGATAATATGGAACTAAAATAGTAAACTTTGAGGCACGGGTGACACTTTCCAAAAAGAACAATTTTCCCTCACACAAAATTGTTAGAGGGTTAAGACAAAGGTCTTCCCGGGATATGGACCTTTTTTTATTTCCTTTAATTAGAAAAATTGAGGCATTCCCTAAATCTTACTCTAATTTTTGAAAGTGGATTGATTGTAATAATAATTTTTTGAGCACCATAGTCCCTCTACTTATATGCACTAAATGGACACTATTGAACAGCCACAACCCTTCGTATTAAACATACTTCTTACAAGAAACATGTCTTATGAAAATAAAATGTATTCATTGGATGAACAAATCGTCACTTTCTAATCCAAATAAGTGCTTATGAATCACACTAAGCGATCCATTAATAATATCTAATGAATTTGCAATCTACAATTTCCAACAAGATAGGATTTACAGTTATTTGAATTGTTACTTTACTATCACAACACAACATAGGTGATCCTTTGTGCCTGTCACATCCCGAGATCAGGTTCGGAAGTTTTGGCCATACGAAGTTAAGGTTCACCATCAAAACTTGGGCGAACTGGGGGTTCACCAAGGTTCAAGCGAGCTAGGTGTTCGCTAGGGAAGTTTTAGCAAAGGGGTTTGCTAGCAGCATTGCACTTCAAATGAAGTGGTAAGGGGTTCGCCAGTTCCACTGCGAGGCAAGTTCATTAATGTGTTTGGCAACTTGAGATCCACCAGTCTGTGTGATGAACTGTGTTCGCCAGGTAAGTTGCGAACTGGGTTCGCTAGTCAATGTGCAAACTGGGTTGGCCGATCAAAGTTACAATCA
AACTCAAATTAGGAAAAAAGTGATTTACCGTATCTAGGAATACTTTATGTACAAGAAATAAATTTCTTAAGTTAGGTTTTCCAAAGATATCTAGGATTCTTAGGTCTATAAATATGACCCTTAATTCTGTGAATTCTTTACTGAATATTCTGCCATTAAAGTCCCTGTTCTAAGTTCTGTCCGTAGCAATTCGAGTAAGTCTGTGTCTTGCTTAAGTTGATCATCTCTAAAGTTGGGTTCGCTTGTGTGTGTGATGTCTGTATGTTCTATTAGTAATTTGTTTGTTTGTTAATAACCAGCTGGACCATCTTCTAGCAAGGACAAAGCCAAAGCCAAACTCTTTTAAGTTTCTCTATTTTTTGATGAGTGATCAAGTTCAGATATGAATATGCTAACTGTCATGTTTTTCAGTTTATTCTGATATGTTTTTAAGAAATATGTTCCGAAACAAGTTCAAAGGCAGGTTTTCTGAAAAGCTCTGTTCTAAGCTACGAAACTCTGTTAAAAAAGATTTTTAAAAGATGATTTTAAAGCACTATTTAATGCGAGCTTCTATGCAAGCTATTGATAATATGAATGTTTTGAAAGAATGGTTTTAAACTGTGTATTTGAAAGGCACTTAACATGAGAGTTTTTTTAAGCAAACAATTTGGCTTTGCTTTGTACAAGCTCTCTAATTAGCTTTGCCTTAGTATGAGCTTTCTATTCTGTGTGCTCCTTAATGAGCCTTGTGATTGGTATAACAATGGTGTGAATACTCACCCTGTTAAGTCTCACTTTGGTGGTCCTTTGAGAGCATGAGCCTTTGTAAGCCTCACTCTACGTGTTTATTGAGAGCATGGGCTTTTGTGAGATTTGTGATATGTCTCATTCTGTTTGCTCCTTACGAGCTAGGTTGAATATAACTTATTCAATGAGATATGTCTTTTGTTTGATGAACCAGTTGTGTAAACTAAATGCCGACTCTATTCTTAATTTTTGATATGTACGAGCCGATCTCACGGCTTTATTCTAAACTCAAATTCATTTGTTAAAAAGAAATATAGCCTTGCACGATTTTAATGCGAGTCCCTTTTAAAAGAAATTTTTCGAAGGAAAAGATTTGTAAACATTGCTTTTAAACTGTCTTCAAAAAAATTGTTTTCAGATGCAAACTGCTCTTGCATTCTCAACTGCGAACTTAGCACGCAAAACATTTTCAAATTAAAGTTTTCTACTGTTTTCAAATATTTTTTAAGGCATGATTTAATGGTTTCTGATTATTCACTAAGTTCTCCCTGAACTCACCCACTTTTCTCTTACCTCTCAGGTAAGTAGATTGCGAGTGGCATTGGAGAGGTTGATGATTTGGCGAGACACCTAATTGGTATCGACGAACCATATAGATGGGCTATGGGTTGTTATATGATTTTTTTTCTAAGAATAGTTATAACATTGATTTGGTTACCCGAAAAATTTGTTTAAGGATTAGTTTAGTATGTTTGATTTTAAATTAATTTTATTATTGCGAACCATGTCTTGAAATACACATGTTCTTTTTCACTATCAATAGAATGATGTTATTCATGTACGTTTATTTTGTTTACTATTTATGGTTATAAATTACTTGTGTACTCTTGTATGATACATTATTTGCATAAGATTCAAAATTATTGTACATGATCCGCTGAATCCTGTGAACTCATGTTGTTGTGTGAGCCTATATTAAACTGCGAACCTATGGTTGTGTGTTTATCTGTAGCCTTTTATGTTGGTAAAAGTTTGGGAGCTATGTTTGAATGTTTTGCTTGATGTTTTAGAGTAGTGCGAACCTATTGATATTTTTAAGTATTTAGAAGTATTGCTTCACACAATTATATACTCTGATGTTTTGTGCATGCGAACCCTTTTGGTTTGTGTAAGAGTGTTTTTTGCGGCCTTGTTAAAGATTAACACTATGTTCACGTGCTTTATATATATGTATAAGTTGTGTGTTGGAGGTTAGGTTGGGAGTTAATAGA
GAGTCACTTCGGTGGCTAATGTGGCACGCCAAATTTGGGTCGGATCTTTCTGACCGAGTTTGGGGTGTGACAGTGCCCAACACCAAGTTCCTTAAGCAAGCCACTTAACTGCACTAGTACAACCATTATTGAAGCAATACTTCAATATTTTGTTTCTATCGAAGAGCATGACATAATGCTTCTTTTTTTACTTCCATGAAAGTAAGGGATCCCCAAGCTTAACATAAAACCCCGAGACAGATTGTCTTGACATGGGACATGATGCCCAATCAGAATCATAATACACCACCAGTTGTATATCATCTATTGCTGGAATAAACAACCCTTGACCAAGATTCTTTTTTATGTACCTAATCACCCAAAGAGCTACATCGTAATGTGACTTCTTTGGCCACTGCATAAATTGACTAAGATGTTGCACCATAAAGTTATTTATAGCCTTGTGTCTATTAAGTATAACAACCTCCCAATAAGTCTTTGATAAAGAGTAATGTCAACAAACTCATTATCATCAGAATTTGCTTTTATAAATTCATCATACTTGCATGATGTCAAATTCTAACTTTGTTCCAAAAGAGTGATTGTCGTCTTAGATCCCCCTAACCTTGCATCATGAATCAACTCTAGAGCATATTTTCATTGGTTCCATAGTATACCAGCCTCGAACTGTGCAACCTCAATACCAAGAAAATACTGAAGATATCCCAAATATATCATTTTAAAATTTTATGCAAAATATTTTTAAGTTCAACTACAAGGTCACTATCATTATTGATTATTAAAAGGTCATCTACATATATAAGCATGAGACTAATTTATCTCAATTTCTCTTAGTGAATAAAGAATAATCATGTTTCCTCTAAACATAATCATTGCAAAGAAAAGCTTCAGTAAGCTTGATATTCTAATTTTGAGAGGTTGCTTCAAACTATACAAGGATTTGAGCAATCGACACACTCATGTCTCCCGCTAATTGTGAAAACCCTAGGGAAGAGTCATATACACTTCCTTATGCAAGTCGCCCTGTAGAAAGGCATTGTAAACATCCATTTGAAATAAAGGACAACCTAACCAAACATCAAAAGCAAGAACGAGATGGGCAATAACCTATTTAGCAACAGGAGAAAATGTATCATAGAAATCAATACTCGGCTATTGAGTATACCCTTGACCAACGAGATGAATTTTAAATTGTTCGATAGTTCCATCCAACTTGTACTTGAACTTATAAACCCATTTACAAACATAGGGGTCTTACCTCGAGGTAAAGGCCTCCAAATCTTGAATCTCGTATTTCACAACATTAACCCAACTAGGGTCCCTAGCTGCTTCTTGATAAGTATTTGGTTCAACAATATCGGATAGAGAAGCAATAAAATATTAAGCATGTAAAGGTAAATGATAATTAGTGATACATTGATAAATGGGATATTAAACTTTAGCAAGTGAAAAAGATGAAGAAGATTGAGAAGAGAAAAAAAAGTCTGTCAACCATGATGGCGGTCGGTTGGACCAGGTAGAATGACATAAGGGTGAAATTGGATTAGACAAAATAAGAGTAGGAGAAGAGGGAGGAATGTTGCAAAAAAATAGGATGAAGAAGATGGGGTGAGAGAAGGTAATGAAGTAAAAGGATGAAACAAGTTAGCAGGTGGGTCAAAAGGTAAGCTAGAACCTAAGGAAAGAAGTTAACGTAAAAATTATAGGAAGAGGAAATGGGAAATAAATGTGGTGTAGTAGACTAACATTAAAAAGGAAAAATCGTCTTATGAAATTTAACATCACAATTAACAAAAAAATGATTGGTAGCAAGATTGAACAAAAGATAATCCTTTTGAACAATGGAGTAACCCATAAAAGTAAAAGGTATAGATTGAGGTTGAAATTTATCTAAAGAATGAAGGACTTTAGCATAGCAAAGGAAACCAAAGACCTGTAAGAGGGACAACTCAAGTGGTTTATTATATAAAATTTCAACGAGTCTTCCAACCTAAAACTGA
GGTCCGTAAATGATAGATAATAAAAAAACTAGTGAGAATAAATTCATCCAAAAATTTAGTAGGAACAGTACATTGAAATTTAAGGACTCTAGCTATTTCCAACAAGTGACAATGTTTACCATTAGGTATACCATTTTGTTGGGGCATACAGACACGAATCTTGATGAAAAATACCCAAATAAGAAAACAAAGAATTATACTCGACAATAAAAAATTCAGTAACATTATCATTACGAAAAATTTTATAATAATGAAAAATTGAGTTTTACCAAGGTAATAAATTGCTTTAAAGCAAAAAATAGCATCACTTTTGAGTGTAAGAAGATACGTACAAGTTGCTCGAATATAATCATAAACCATCGTAAGAAAGTAAAGATCCCACTATGTGTGGAAAATTTATATGGCTTTCGCAAGTCAAGATTGACTAAGGAGAATGATGTTTCAACTCGAGAATGACTAAAGGGAAAAGGTAAACGTGTTTGTTTAACTAGTAGAAAAACATGAAAAATATGAATATAACCATTGTTCAAAGGATTATAATGAAAATGGTCCATTTTGTTCATTTTGGAAAAAGGAGGCATGACCAAAGAAATGATGCATCGATTGTGGACAAAAAATAAGAAACTAAAGAAGGTGTAGCCTTAGTTGAAGAAAAATGTGGTAAGAGTAGATAAAGACCATGCCGCACTCTACCAAACCTCTTCACCTATCAATTGCAAAGGTCTTGTAAAAGAGAAATATGAATATAAAAAGAAACAAAAAATGTAAGTCACGAGTCAATTTTTAGATGGAAATCAAATTAAATTAAAATAAGGGATATAAAAAACATTGGTAAGCTTGTGCGAATGTGAAAAGGCTCGAGTACCCATATGAGAAATAGAGATAGACTTATCAATAGGAAATAAAAAAGATGATGGACAAGATGCATGTAGAACTAAAGAATCCAAACAGTGGATATCCGATGTCATATAGTTGGTAGCACCAATATCCAAAATCCAACGAGAAGCAAAAGGCTGTGAAACTATATCTGTTGTAACAACCCGATTTTTAGTGGTGCCAAAAAGGGTAGTTTTGGAACCCCATATTCGTAAAATGGGTCCATAAATATTAAATATAGAAATTTATGAAGTTGGTATAAAAGTTTATTAAAGTTTGGACCATCAATTTTGTTTATTAATTGTTTAATTAATGTACAAGGACTAAATTATAAAACTGTTATCGTTATAGATTTTTAATTGGCAAAAGGCTTAAGGACTTAAATTGTAATTAACCAAATATCCAAAATAGTAATTAAACTATTTTGTAACATGGAATAGTGGCATATGATGACATTCCCTCTAACTTTGATTAATGGTTAATTAATTAAGTTTAAGATAATTAATAAAATTTAGTTAATCCCTAATTATACTATATAAACTAAATTAAACAAAGAAGGAAAGAAAACCCTTATTGAAGGTCAAACTTTCGATCCTCAATTGGTGAGTTCAATTAAGTCATTTTCTTGTAAGTTATATGTTTTGAGGTCATGGGAGCTTGTTTTAGCTAGCCTATGTACGAATTTGTGAAACTGTTAAATTTTTTTAAGTTTCCATTGCTGATTTCTTGAATAAATTGGTCTTAAATTGATAGTTTTTAAGCTTAGATGTGAAAAGGATTAGATTGTAAAGTTTAACTATTAGTTTTGCACAAAAGGAATAAAGGGAATAAATTTTAAAAAGCATGTGAAATATCTAGAATAATAGATAGTAGGGAGTCCCTAAGGGGTGTAATTGAGATCGATTTTAAAATCGAGGCTTAAAATTGAAAGATATTTTTATTTTGGTTTTATGGACTAAATTGAATAAAATACAAAAAATTAAGGGGCATTTAAAAAATGGAATTAAATAGGTTCATGAATATCATGGAGTGATATAAATATGTTTGATATTGATGCATTGTCTAAAATAATTGTTTAGATCAAGAATTGAATCTAATCGGTGATAACCGGAGAACAACAAAAT
TGTGGAAGTCTTTGAAGTTTCAACTTGTTGTTTTTGCCAGGTAAATTCATATGAAACTTACTAATTTATTTGATGTTATGCTGAATTGTGTTTATTTCATAAATATGTTTAGTTTAAGGTGAATTTGGCATATTTTCATCAATTGGATTGAATTTCAAAATATAGAAATATTGTTTATTACGAATAGGTACAAAGTACAAAAATGAAGATGTTTAACATTGAATTACATGTGCTTGAATATTTTATTGTAAATTGACGATCGGGTCGAGCGAGGGGAGTTACATTTAGTGGTATCAAACCTACGGTTTAGTCAATTCTAGGACTGAAATGTAAAGCATGTTGAGTCTAGAAATACATGCCACAATAACCTGTGATAGTGTGATGTCTTCTGATTCGAATTGACTTTTTTTCCATATAGCTAAACCATGTCAGCCGAATCAAATCGAGTTGTGTCTAATGAAGTTGAAAGTAATATTTGTGCTTTCAAACAGGGAGCTTCCCGAAGTTTTCCCATTCCACAACGGCTAGGGAGTGAGGCAAGAGATGCCTTCTTCCAAATGATGAACTAGTGGTTCACCCAATATATGGGAGCTACCCCTTCCGCTCCACAACCTCAAATGCACCTTCCTTCCCCGATTGTGCCTCCTGTGGTACCCTTTCATCCTCAAGTTTCTAATTCGGTACCCATTAACCATCCTCTGATATATAAAATTTGTAAATGTGGGGCAAAATAATTCAAAGGCAAGAAAAAGGATGAACCAAAAAAAGTTGAGTATTGGATAGAAAACACTAAGAGGGTTGTTGACAAGTTATTTTGTATTCCTGATGATTTTTTAGGATGTGTCGTATCATTGCTCAAAGAAGAAGCATACCAATGGTGGATGACTCTAACGTTTGTTGTTCTGAAAGATCGAGTAAACTGGGAGTTCTTCCAAATTGAATTAAAAAGAAGTATGTTAGCCGACTATATCTTGAAAATAAAAAGAGAGAGTTTATGAAACTGAAACTGAGAGATAGGTTAGTAGTTGAATATGAATGAGAATTCATTTGCCTCAGTAAATATGTCAGAGAGCTTGTATTTAGTGAAGCTGAAATGTGTACTCGTTTTGAGTGGAGATTGAACGAGGACATACAAATGTTAGTAGGAGGTGTGGAATTGGAAAAGTTTGTTATTCTATCGGAGAGGGCTCAGAAAATGGAGGAAATGCATAAGGAGAAAAAGTAGACCAAACCTAAGATATGAGATTCTAGTAAATGGTGTATGGCCATATCTTTCCCAACTCATCCATCTAAAAAGTCAAAATATTTGTAAAGTCGTTTCTCTACTCCATTAGGGATTTTTGAGAGAGATGGGCCGAGACCGAGTATTCTGCAACCTCAGACTACGTCGGTAGCTAGTGTCAAAAGTGTTCGTAATGCAAATAGACCAATTTGATGACATTGTGGAAGAAACATAATGGTGAATGTAGATTGAAAAATGGAGCTTGTTTTCTATGTTGTTCCAAACAACATTTAAGAAGAGATTGTTCGAATAGGCCAGATCAAAGCAAGGAACAAAGTGTAAAGCCAGTGTCGACTCTGTAGAGGATTAGAAGACCAGGAACTGGTAGCAGCGCTGGTGCTAATCGAGGTGGAACTAGAGATAAGTTATGAGATTCGAGGCTTGTGCACCTACTAGAGCTTATGCTATTCGAGCCAGAAAGGAAGGTACTGCTACTAACATTATTGCTGATACATTTTTCTCTATTTGATGCTTTTGTGCCTGCATTGATTGACTCTGGGTCAACATATTCATACATCTACACCTCATTAGTAGCTTAAAAAATATACTAGTAGAATTGATAGAATTTGATGTTTGGGTAACCAACCTGTTAGGTTAAAGTGTTCTTGTCAATAAAAGTTGTAATGACTGTCAACTGGAAATTTGAGGCCGTAAGTTTTTAGCTAATTTGATGTTATTACTTTTTGATGAATATGAAATATTTTTCAGAATGGATTGG
TTGACTTTTCACGATGTAGTGGTCAACTGTAAACAAAAGTGAATATCATTGCGGTGTCAGGATGGTGAATTGATAAATGTGAAGGCTGACAGATCTGATTGCTCGACTAACATAATATCAATGATGTTAGCTCGACTAACATAATATCTATGATGTCAACTCAATAATTAATCAAAAAAGGGTTTGAGGCATATTTAGCCTATATTCTAGATACTAGAGTGACAGGATCTAAAATAGAGCAAGTTTCGATGGTTTGAGAATTCACATACATGTTTCCCAAAGAGTTGTTAGGTTTCTCGCCTGAGAGAGAAATTAATTTTGTTGTTGAAATAACACCAAAACTATTTCGATTTCTATTGCATCATACAGGCTGACTCTGATTAAATTAAAAAAATTGAAAGCTCAGTTGCAAGAACTGTTAGATCAGGGATTTATCCGACCAAGTGTGTCACCTTGCTCCAATATTATTTGTGAAAAAGAAAGATGGAACCCTAAGATTGTGTATCGACTACTGGTAGTTGAATAAAGTGACCATAAAGAACAAGTATCTAATGCCCTAAATCGATATTTTTTTATCAATTGATAGGAGAAACAATGTTTTCTAAAATTGACCTTTGGTAATCCATTTGGGGTTACTAATGCTGTAGCCGATTTTATGGATTTGATAAACAAAATATTTCAGCAGTATCTGGAAAAGTTTGTTTTTGTGTCAACATTTCAGAATTGTATTACAGACTTTTCGAGAAAAGCAATTATATGCAAAGTTCAACAAATGTGAATTTAGGTCACGAGAAGTGGGATTCCTAGGTTACATTATATTAGCTAAAGGCATTCAAGTGGATCCGAGTAATATCTCAACAATTGTTAACTAGAAACCTTCGAAGAATATCACTGAGATACAAAGTTTTATAGAATCGGTCTGATACTATCGACAGTTTGTTAAAGGTTTCTCGATAATAGCCCTCCTATTAACAAAATTGTTACAAAATAATATCAACTTTGTTTTGTCAGGAAAGTGCCAGCAAAGTTTCAAACAGTTGGAAGCAATGTTAACAGAAGCTCTAGTTTTAAGTTAGGCTGAATCTGGAAAAGAATTTTTTGTGTTCAGTGACATGTCACTCAACTGTTTGGGTTGTGTACTAATACAAGAGGGAAAATTAGTTGCTTATGCTTCTTAGAAACTTAAGCCACATGAGAAGAATTATCCTACACATGATCTCGAACTTTCAACAGTGGTTTTTACTCTAAAGATTTGGAGACACTATTTGTACGTGGAAAAATGCCACATTTTCATAGATCACAAAAGTCTAAAATACTTGCTGACACAGAAAGAATTGAAATTGAGACAACGCAGGTGGCTTGAATTGCTTAAAGACTATGATCTGATTATAGATTATCATCCTAAAAAAGCTACCATTGTAGCTGATGCCTTGAGTCAAAAGTCCCTATTTACTTTAAAGGTGATGAATACCCGTTTGGCTTTGGAACGAGATAGTTCTATTTTAGCTGAGTTGATAGTTAAACTTATTTTTCTTCAAAAGATTCAGGAGTTGCAAAAAGATGATTCCAAGTTGTAAGCAAAATAGAAACTTGTTGAAGATAATCAGAGCAAAGAGTTCAGTGTTGATGATAACGTAAATCTATATTTTTGAAAGTGTTTGTGTGTACCGAATAATTTAGAATTGAAATGAGACATTTTGCACGAAGCTCATAATAGTACTTACATGATACATTTGGGCATCAATAAGATGTATAATGAGTTGAAACTGTTTTATTGGTGGCCGAGAATGGAAAGATAGAGTACTGAATACAAGTGGAAACACAGAAATATACACACTTTTTCATGCCTTTTTTAACTCAAATTCATGTAGTTTCAGTAAAATTCTTATCGAAAAAATATATAATAATTATAAAATACTTAAGTTGCACTCAAATTATGGACATGTTTAATTTTAATTAATTTTATATAAAATTTTGATTATTTTTTATTATTTTTGACA
GATTTGCACAAAGGGCAAAAAATGGCTCGACAGACACTGCTAAAAGCACAAAACCGAGAAGCAATTTTGAAGCATGAAGGCGAAATAATTTTTCAGCATAAGATGGTCAAAATTATGTGTATTAATTCATAATATAATTAATTTTAATTTTAATCCAATTTAATTTGGGTTAAATAAATTACTATTAATTAATTATGAAAAGGGGCCCAATTGAGCTGAACCGAGAAAATTGAACCAATCGAGCACTGGGCAAGCCAAAATCGTCCAACATGCTGACCCAATCAGCTTGCTTGGCTGGTTATTTGGCTTGAAAAATGGCTCTTGAAGACTCCTTCAAATTTCATTCAAACCCTAGTATTTCTGCCTTTCTAGATTTGCCCCAACCTTAAAATAGCAAGTTTGAAACCTTAAAACTTGCCACTAGTGTGGTCGGCCATGGGGGGACTCTATGGCTGCTGATTTTTGCTAATTTTGGAAGCCATCTCAACCTATAACAAACCCCTTGGCTAATCACTTCAAGCACATCTTAAACTCATTCATTTCTTTACTTCTTTTTCATTTTTTTCTCTTCATTCCCTTCCATTGTTATTCATTTTCATCCCCTATTCCTATGCCGATTTCACCTCTTGAAAAAGAGTCCTTCAACCACCATTTGGAGTAGCATTCAAGTGTTCGTGGAAGCCTCGATTTAACAAGAACAAGCAGAGAAGGAGGAGCGGAGCAAACTAGTCAAGCCTCGGAGAAACACCAAATTTGATTCTTGTTCCTTATCTTTTTAATTTAATTGTTGTTGTTATGAACATGTTTATGAATATTTGTGATGTTGATATGTTTAATTTAGTTCATATAGCTTAAATTTAATTCGGGTTAGGTTGATTGCATTTCGTCTACTTGAGTTATTAAAATCGTGTTTGTGTTGTTACAGGCCTCGTTAAGATGTTTGATTAAGTAAAACCATGACTAAGTTATTCTTGCATTACAATTGTAAGGTAACTAATGAATTAATTATTTAATTGGATTTAAATTGTAATTATTGACACGATACTTAATTAGTGCATGTTTAATCATCTAAGGTAGCTGAGGGTTAAGTTAGCAACGGTATCTAACGATACATTAGCCTTGCATAACTTGCAAGATTATTGTGATTAAACTGTTTGAAGGTAGAAATACATTGTTACCTCACGTAATCCTTTATGTGCTTATGAGATTGAATTAATTGTTTGAATTGACATACAGATATGTACAAGAGATTATTTTAATTTCATAGGTATGTATGTGTATTAAAATATTTTCTTATTAAAATTTGTTTATTCAGTTGAATTGACATAGAGATATAGTCAAGAGATAAATGGATTTTGGTATGTAAGTATGTTCATAAGTTAGAAATTACCGAGTTACCGTGAATTTATTCGTAACAACATAAACATGAGTTTAATAATTCTAAGTTAAGAAATGTAATTAATCTAGCACAATTATGTCATTTTGAGTAAAATCATCTTTTGAAATCATGCATTGGAACTTTTATTTTAATTTTATTTATTTTACTTAGTTAAAATATTTTTCTTCACCAAAGTGTTTTTAAAATTGCATTCATAAATATTTTTTTTCACAGTCCTTGTGGGTACGATAACTCTACATTTACTTGTCACTTTATTACTTGTTGCGATTGTGTACACTTGCACATTCCTGTCGTTTCAAGTTTTTGGTGCCGTTGTCGGGGGACAACTTTAAAAATTCATTATTTGTGAATTTGTTAATTTTTCATTTTGGTTTATTTCTCTATTCAATTTTAACTTAATTAATTTTTCTGTGTTTTTTTCAAGTGTTTATGAGTATTGATCGAATTATCGATTTACTCCATGTAGACCCTGAGATTGAAAGAGCTTTTCGACAGCGGAGAAGACAAGCAAGTCAAAGAAGGACCGAAGAGATGAACTTCAAAAATCTGAATCAAGGAAATAGAGCAAACACTGCCCAAAATCCTATCCTTATTGCTGATG
ATAGGGATAGAGCTTTAAAACAGTATGTTGTGCCAGTGTTTCATGATCATAATTCGGGTATTAGGGGACCCAAAATTGAGGCACAACAGTTCGAGCTGAAGCCATTCATGTTCCAGATGCTTCAGATAGTGGGCTAATTCAGTGGAATGCCTACCGAAGATCCTTAACTTCACTTAAGACTATTCATGGAGGTGAGCGATTATTTTAAGTTAGCTTGAGTACCCGAAGATATGCTACGATTAAAATTGTTCCCATATTCGTTGAGGGACAGATCTCGAGGCCGGTTGTACTCATTGCCCCCGAATTCAATTTCCATATGGCAAGAGTTAATAGAAAGATTCCTCATGAAGTATTTTCTACCTAGCAAGAATGCTAAGTTGAGGAATGAGATCACTGCTTTCTAACAAATGGATGATGAGTCCTTGTATGAGGCATGAGAAAGGTACAAAGAATTATTACTAAAATGCCCTCATCACAGAATCCCATATTGCATCCAACTTGAGACGTTTTATAACGGTCTCAATGCCCACACGAGGATTGTAGTGGATGCTTTTGCTAATGGTGCTCTCCTTTCTGAGTCTTATAATGAGGTTTATGGAATCATTGAGAGGATTGCCAGCAAAAATTATCAATATCCAACCAATCGAGTAACGTCAGGAAGACGAGTTGCTGGAATACATGAAGTAGATGCTCTTACTTCACTCACATCTCAAGTATCCTTAATATCCTTAATGCTTAAAAATTTTACCACTAATGGGTTTAATAGTTTTGCAGCACAACCACCGCACCAATTTGAAAATGTAGCCTGTGTCTATTGTGGGGAAAGACATATGTTTGAAGAATATCCATCGAACTCAGAATCCATTTATTACATGGGTAACTAGAACCAAAACCGAGGAAGGCAGGGAATACAATCCAATTCCTACAACCCATCGTGGCGAAACCACCCTAATTTCTCCTAGAGTAACTAAGGGGTTGGACCCAGTAACACATATGCCCAACCTAGACCGACCCAGCCACCTATTTTTACCCAATAAGTTCAGAAACAACCTCAAGCTGAACCATCCAATGGCTTAGAAAACTTGTTGAAGGTATACATAGCCAAGAATGATGCCTTAATCAAAATCCAGGCAGCTACATTGAAAAACTTGGAAAACCAAATCAGCCAGCTTGCAACTGAACTCAGAAACTGACTACAAGGTGCTTTACCTAGTGATACGGAGAATCTGAGGAATTCTGGGAAGGAACATTGTAAAGCGTTGAAATTGAGAAGCGAAAAGACATTAGAGCCCAACACACTCGAAGTTTAAAAGGAGCCAACTGATGCTCAAGACTCAGGGGAAGTTCCATCGAGTGTTGAAATTCCAGTTACACTAGAACCAGAATATGCCAAATCTGATAAGGTAACTTCTTAACCACTTAATTTTGATAAACTAACAAATTCATTAGATGCAGAATTGCCACAGAAGACGAATAAACCAGTTCCAGTAAAGAAGCCTCCACTACCCTACCCTCAGAGACTTCAGAAGTAGAAGAACGAAGTTCAATTCTAGAAGTTTCTAGACATACTCAAGAAACTTCATATCAACATTCCATTGGTTGAAGCACTTGAATAAATGTCGAACTAGGTCAAATTCATGAAGGATATCCTGTCAAAATAATGAAGACTTGGAGAATTTAACACGGTAGCCTTGACAAAGGAATGCAATGCATATCTTTAAGACAAAGTACCTCCAAAGTTGAAGGATCCTAGATGTTTTACCATACCTTGCAACATTGGAGCAACATATTGTGGTAAGACACTATGTGTTTTGGGCGCGAGTATCAACTTGATGCCCATGTCAATATTTAGGAAGTTGGGGATAGGTGAAGTTAGACCTACTACGGTTACACTTCAATTAGCAGATCGGTCCTTAGCACGCCTAGAAGGAAAAATTGAGGACGTGTAGAAAAAATTATTTTTCTTACTGAATTTGTTATTCTAGACTTTGAAGCAGACA
AAGAAGTGCCAATCATACTAGGAAGGCCTTTCCTAGCAACTAGAAGGACCCTTATTGATTTGCAGAAGGGCAAGCTTACCATGCGTGTCCAAGACAATCAGGTAACATTTAATGTTTCTAGGTCCATGAAAATTTCCTAACACAATTGATGATTGTTCTACAGTGTTCGATTTAGAAGAATTAATCATGGAAATTTAACTCAACTATGTTGAGGACCCATTGGAACAAATTTTGACATCAGAACCTCCAAGTGATGAAGAGGAATATGAATACTTAGCTTTGCTAGAAGCTAATCAAAGGGGATTTAATCTGTAATCCCTCTTTGAATCTTTGGAGTCAGAGAATTGAAATTATGCCCAACCAAAAGCGTCAATTGAGGAGCAACCTAAATTAGAACTGAAGGTACTTTCCTCACATTTAAAATATGTTTATTTAGGTAATGCTTCTACTTTGCCTGTGATTGTTTTAGTGGAATTAACCGTTGAGCAAGAAGGCTATCGGATGGACCATAGTCAATATTCACAGTATTAGTCCATCTGTATGCATGCACAAGATCATCGTGGAAGATGGCGAAAAAGGGATGATTGATGGACAACGAAGACTGAACCCCATCACGGAGGACGTGGTAAAGAAAGAAATCATCAAGTTATTAGATGAGGGTATAATTTACCCCATCTCAGATAATTCGTGGGTAAGTCTGGTCCAGTGCATGCTAAAGAAAGAAGGTCTTATAGTCATTGAAAATGATAATAACCATTTGATACTGACTAGAACGGTTATGGGATAGAGAATTTGCATCGATTACCAAAAGCTAAACAAGGCGACTAGGAAATATCACTTTCCTTTGCCATTTTTGGACCAGATGCTGGATAGACTCACAGGGTGAGACTATTACTGTTTTCTCGATGGATACTCGGGGTATAATCAGATTACAGTAGCACCGAAAGATCAAGACAAGACAACATTCACCTACCCATATGTATTCAGAGATACATATGATGATTGCCTAGCCAATCTAGCCAAGGTACTAAAGCGATGCAAAGAAACAAACCTCATACTCAAATGGGAAAAGTGCCATTTCATGGTACAAAAAGGTATTGTTTTAGGGCATTGGATAATGAGACATGAAATTGAGGTAGGTAAAGCAAAAGTAGACTTTATTGAAAAACTCCCACCTCCAACATCTGTAAAGAGTGTTGGGGCTTTTTGGGCCATGCCGGTTTCTATCGAAGATTTATCAAGGACTTCTCCAACATTATTTAACCCTTATACAAATTATTGGAGAATGACACGCCATTCAAATTTGATGAAGAGTGCTTAAGAGCTTCCAAGGATTTGAAGAGTCGATTAGTTTAGGCACCCATAATTGTCACACTAGACTGGGGTTTTCCATTTGAATTGATGTGTGACGCAAGTGACTTCGCGATAGGAGCTGTCATGGGCCAGCGAAGGAATAAGGCTTTTCATCCCATCTACTATACAAGCCGGACTCTTACAGGTGCTCAACTGAATTATACGGTAACAGAGAAAGTGTTACTTGCTATTGTGTTTGCTTTTGACAAGTTTCGATCTTATCTTGTAGGTACCAAAGTGATTATCTATACGAACCATTCAGCAATTAAGTATTTACTTTCCAGGAAAGATGCTAAGCCAAGACTGATTTGATGGGTTTTTCTATTTCAAGAATTTGATCTAGAAATTCAAGATTGAAAGGGAGTAGAAAACCAAGTAGCAGACCACTTGTCCAGATTAGAGCCGCAAGAAGGGAATTCTCCACTTATACCCATTCAAGAGACATTTCTAGATGAACACATACTAAATGTAAATCATGTCCATAATACCCCTTGGTTTGCTGATATTGCTAACTTTTTAGCTTGTGGTTTGATGCCGATTGATAAGACGTATCATCAAAAGAAAAGGTTTCTTCACGATGTGAAGTACTATTTCTTGGAAGAACCATACTTCTTTAAAAAGTTTACAAATCAAATGATTAGGAGATA
CGTGGCAGAAGATGAAGTGCATAAGATTCTATATCATTGTCACTCAATTCCGAGTGGGGACACTTTAGAGGTACACGTACTGCGGCCAAAGTATTGAAAGTTATATTCTTTCGGCCAACACTATTCAAAGACACATATGCTTCCATAAAGAGTTGTGATCGAAGTCAAAGGGTTGGAAACGTCACCAAAAGAAATGAGATGCCCCAAACAAACATCATTGAGGTAGAATTATTCGAGGTTTGGGGTATTGAATTTCTCAGTCCTTTCCCTCCATCTTTTGGTCACAAGTACATATTGATAGCAGTAGACTACGTGTCTAAGTTGGTTGAGGCCGAGGTATATCCAACAAATGATGATAAGGTTGTGATGAAGTTTTTGCAGAAGCATGTGTTCACAAGGTTTGGAACCCTTAGAGCTATCATTAGTGATGAAGGGTCTCATTTTGTGAACAGATGGTTGAAATGGTTACTCGACAAACATGGAGTGAAGCATAAGGTTTCCACAGCTTACCATCCGCAGACGAATGGGCAAGCTGAACTAGCAAACAAAGAGATCAAAGGCATACTCGAGAAGGTAGTTTGGCCGAACCGATGAGATTGGTCCAAAAGACTGGATGATGCTTTATGGGCCTATAGGACAACATACAAGGCACCTTTAGGGATGTCACCCTATAGGTTGGTCTTTGGGAAAGCCTGTCATCTGCCCTTGGAGTTAGAGCACAAAGCTTACTGGGATCTCCAACAACTCAACTCGGATTTTAAGCTTGCTAAAGAGAAACGAATGCTCCAACTCAACAAGTTAGAAGAATTCCGAATGTTCTCATACGAGAATGCCAAATTACTCAAGGAAAGACTTAAGAGATGGCATGACAAGCACATTCGAGTTCGAGAATTTGAAGTAGGTCAGCAAGTCTTGTTATTCAATTCTAGATTAAGGTTCTTTCTAGGTAAGTCAAAATCACGTTGGTCCAGTCCATTTACGATTCACCGATTTTATCCATACGGAGTTGTCAAACTTCAAAGTAAGGTAGGTAATTTTCGAGTCAATGCTCAGTGCTTAAAACATTACTGGGGGATAAAATTGAACGGGATCAAATTTCGTTCGTTTTATCAAATATTTAATTCTTCTTGTTTTTGTTTTTTAATAAATGATTTAGGGTATATTTTTGGGATTAGTATGTTCAAATAAATTCTGTCTAGGAGATTAGAACTTAAGCGGGACCGATTGTGACCCCTCCAATCTTTCCTAGGAATTGATTTTAACATAATCTTTTGAGAAATTTCCCTAAATGGCAAAATAAATTTTTAGTTTTAAAATAAAAGGGTCAATTTTGATCTACGTTTTAAATTGCAACTCAATTTTGAATTTTCCTTAAGTCCAGGTACTTAATTAAATTATTTTCAAAATTTGGTTTCTCTTTTTGTAAGTATTAAAAATTAGATGTCTCTTTTTGTAAATATTTTCAAAAGGCATCTAGAATAAATGTTTTTAATTTAATAAATAAGATGATAATTATTAATATATAATTATGTCCATTATAATATATATTAATTATTATCAACTTTGCATAGAATTAGGATTAGTTTAAATTTGATCATATTTTATTTAATAAGTTTTATTTTAATAAACTAATAACAAATAATAATTTAATATACATTATATTAATTATTAATTTTTGTTAACTTTATGTAGAATTAGAACTTAGAATATTTTAATTATTAATTTGTTCTAAGAATTCTAATTAAACTCCTACTCCTTTCATTATAAATTTCACCCACCTTTTCCATTTTTTCACTCATCCCTCAATTAAATCCTAGCATCCACAACTCACCAAGCTCCAAATCACCTAGTGCCAAAATCTCTAGCCGCAACACCGCCTAGCTTCACTCGGCACCCTCACCCATTCGGCCAGCAGCCCCACGCATGTACCCAGCAACCCCACGCACAACGTGTGCGCCACCAGCCGCTCTGTGCCGTTGCACCTGCCACTCGTCCGGCTC
TAGTAGCTCGCCAGGCCTGCTCGACTCACTTGCTTACTGACCACTACCCTACATCCGAGCGGCACACACATGCCCTGCTACTCCTTAGCATGCTGTTGCCGCCTTGCTACTCACACCACACTATCAAGACACCCTACAACCATCCCTAAACCAACCTCTTTTGCTTTTGCTTTAGATTTATTTTCTTTGAGTTCTTAACTTTTATAAAAAGGTGGTAAGACAAATTTTTCTCCTAAAATTTCAATTTTATTTAATTATTTAAAATTTCAAATTATTGAATTATTAATATTTTATACTAATTAAATTTTTGAGAAAATATTTTTTCTATCTTATGATTAGGTTAATCATGCCTCGTAAAAGAACTCGTGCCTCTACCCAAATTGACGAATCACAAAACAAATTCCACTATGAAGAAGCTAAAGCGAGATACGAAAACATTTTCAAGAATCAATAGATGCACCCAGAAAAAGGCTTTACGCTGAAAAAAACAACTATATTGATTTCATGGCATGCATTCGACAAGTTGCTGAAGCTCTCAATTGGGAGTTGTTTTGTGAGAAAAGACCTAGTGTGGATGAGGAGTTAGTCCGTGAATTTTATGCGAATTTAATTTTAAGCGATTTGATGGAAGTTTCTGTTCGCGAAATCAAGATACCAATAACCTGAAATGCTATTAATGAATTCTTTGAATTACCTAATTTCAAAAACAACGAATATTATTCCTTGATGAGCAATATGGAGTCTAAAAATCTGCAACAAATTCTCGAGGAACTTACAGTTCCAGGTTCTAAGTGGACAGTGTCAAAGTAAGGAATTCACACTTGTCGCAAAGAATATTTGACACCACTAGCGAAGGTATGGTTATATTTCATTCGATTCAGCCTTATGCCTATTTCACATGGGACTACAATTTCATTAGAGCGAATGGTCTTATTATACTCGATTTTAACTGGAAAGACCACTGATGTGGGAAAAATCATCCTGAGAGAAATACAAAATTGTGCCTCTAGACGTTCTGGCCCAGCTTACTTCCCCTTACGATAACAATTTTGTGCTTGAAAGCTAAAATTCTTGCAAACGTAAAGAAAACAAGTTATAGCCAGGGCACAATCACAGATTGGGACCTCTACGGGATAGCCAGAGACTCAGTTCTACAGCAACGAGTTGAAGAAAGCGAGGATCCCGAATAAGAAGAAGAAGATCCCACAGAGATCAAACCGATGCAATCAGCTGAAATCCCTGATAAGGCAGAACCAATGGAACCAGTAGCCGAACCTGATGTCACAACTTCAATGTTTAGAACTCAATCGTCTTGCCTAGATCTTCGAGATGAGCTGTCAAAGTTGATGGACATAATGCAGCATATGCAGTGGCAGCAACAAACTTACTAGAGATATTCAAAAATACGGGATGACTCAATGAGAAGCGCTCTTACGAAAATATACAATAACCCGTTTATTTTTGTTCCTGATTTTCCATATTTCATATTTGAACCATGGAGTCCACTATCGAAGAAGAAGCAAAGACGACGGAGCAAAAGATGAGTCAAATTCGGAAGGATCTGCAAATAAATAAAAGGGGGAGATCTTGACTTTATTTTATTTCTATTCTTAGGTTATTTAATGTTTTAGGATTAGGTTCAATTGGGATTTTTATTTTTCGCATAATAAAACAAGAGGTGGAAATCATAAATAAAAATGAGCAAGTTGCAAAATACAAAGTGTGTCAATAGATATATACATGTCTAAGATTGGATCTAGAGAGAGCTTGGTACTTTGAAATTTTTCTTCTCAGAATAAATTTTTCTTTTAATTATGATTAGTATATATTTTGTTCAAAAATTTGAAATTTTGTTAAGTATGCTAAACTTCAGTATAAATAAAGTTCGATTATTTCAATAATTACTATGTTAGCTTAATAATGACATGAATGTATTTTTAATAAAAATATTTTAGCTCCTTAGGAAAGTTAGGCATGCATGAAAGTTTAAGTCTCTACAA
TTGGCTTAGTAGTTTCTTGAGGCGAAATCCTAGGAAGCATGGAATGTTCAAAATGATTTAGGCAACTTGTTTTTGGACCGTTTGAGCTTTTCAAGCCAACCATGATGAATTTTTATCCCTTGAAACCCAACTTTGAGACTATATGGCCTAATTTTATTTGAACCCTTGCAATGTTTAGCCATCACTTCTCTCTTAATTATCTTTAAATTATCCGAAACACTAGACTCAGTACTATTTAGAATATTCTTTGAAAATAAGTTTGGAGGAGTTGAAAAGAAGTATCAAATGCTAAAAAAAATTGTAGTGCATATAGTAAAATGATCATGTTAAAAAAAAGAGAGCATATGTACTTGAAAGAAAATAGATGAACAAAAGAGCATGTGAAAGCAAAGTAAGTTGGTGTGTTGAAGGTAATTATTTCGAAGGTCCGATTGAAGCTGAGTCTAGGGTTTTTAGCCTAAATTTATCTATCTTTTACCTACCCCTAGCCTAGCCATGTTACAACCTTTTTAAAGACCTATTGATTCAAGTTTCTATGCTACCTACATTAGTGGAGAGAAGTTGCTATGATCAACATATGAAGGCATAAGTTAAACTTAATGGTTGCAACTTAATCTTGAATAAGAGAATAAAATCAAATTCGCAGGGATTTAACATGTCCAACTATAAATAGATGCCTCTTCCTTCATTGTAAAGAGGGGAAGTGGGGAGTAATAATAATTCTTAAGAGTATTTACTCAAATTTCTCTCTCTCTTGCGTTCTTATTTTGTTAATTTGTGTATAATTTATTTATTGATTTGTATATTATTGATTTCAAATCTCTTTTTCCCTTATTATTCATTTTCAAATTCATTATTTTCAAATTTGTTTACATTTTATTTTGCCTTATATTTTTTTTTGATACTCTTTGTTTTAAATTCATTGGTCTTTGATTATTGATGCTATTTAATCCTCTATTTGTTATTTTAGTTTTTCTTATTATTAAATTAATTATTTTAATATTATTAATACTATTATGTGCCATCATTAATCTTGTATTATTATTATTATTATTATTATTATTATTATTATTATAATATTCATGCGCATGCATCGTTTTTATGTAATATATATATTGTTTTATATATAGTATACGTATGCTTATATATATTTTATACATATGTTTTTGTTTTTATTTTACTTCCTAACTTTTATATACATATATATACTTTTATATTTAGTTTCAATTTTTTTTTACTTTTGTATATATGTACATGTATGTATTTATATATTTTTTCTAATGAATATTTATATATATATATATACGCACATGTCTATGTTTTTTAATTGCTTAAATACAAACTTAAATTTTCAACACATATGTTATAATGTATATATGTATATTTATATATTTTTCTTTATTTTCATAAATGCATTATATATATTTTGTTATAAATTCTATAGTCCAAAATTTTATATGTAAACCCATGTGTATGTATTTTATTCTTTATAATTTCATGTATATATTTTGTACCTTTTTTTTCTCTTTATATTTTTTTGTTTATTTCTTTCATTTGCTTATTGATTTGTGTTTTCATTTATATTGTTCATTTGATACTTTACATGTCGTTGTTTTTTATGTACATTAATTTGGTTTATTTCTATGCCATTGTTGTATTTATTATTGTATTTTACACTTAATGTAGCATTACATCATTTTTTTACTCGATTTTAAAATTTTCAAAATTGAGATAATACTCGTATTTAGGATTTTCAAGGAAATTGAGCCCTAACGTATTGGGTTCCAATTTTCTTCGTTAAATCTAACAATCGAGAATTGCTCATTAATCAAAAACTAAAATGAAAAGCTTGTTGTCGGGAATTTAATATGTTGTATCCTAACGTATTGGATGTGACGTATTGATTTCTCGAGACAAAGATTTTTTTTTTAAAAAATAATAACAAAGGAAATATTTCAAGTTTAGGATTTTGAGAAATTGTGCCCTAACGTATTGGGCCG
CGATTTCTTTATAAATCTTAAACAAATGAATATTCTTTTAAATTTTATTACACGAGTATTTTGGACTAATTCATTTTTGAGGAATTAGAATGTCGTGCCCTAACGCATTGGGTGTGACATTTTCTTTCTTCGAAATGATAAGAGTCTTAATAAGTAACGTTTTTTAAGTTTTTATTAAGGATCATATTTTTAAATTTTCGACATTAAAGTACTAATTAATTAACTAGGTACCAATTTTGGGCATTACGAGGGTGCTAATCCTTCCTCGTACGTAACCGACTCCTGGATCCATTTTTCTAAAACTCGTAGGCCAAAGCTATTTTTTAGGTGATCCAATCACACCTCAATAAAATATTGGTGGCGACTCCCAATTTTTGTTTTTTTAAAGTAGACAACTAATTTTTGTTTTTTTCCAAAATAAAAGTTAGTTTCGACAGCTTGGCGACTCCGCTGGGGACAAACACGAGAGTCGAGCCAAAAATTGATTAATTTCTGTCTTATGTCGAAAATTTTTTTGAGATCCTTTTGTATTCATTATTTTCTTGCTTAATTGATCTTTGCATTATACATTGCATGAGTTGAATGATTTTACCCCTCTAAGTGGGAGTGAGAAACTAGTCCTTCGTGATGTTTTCACCTCTGTGCAGGATAGTGGATCTCTTTCGGGATACATTCGTACCTATGTCTTCGTGAGATTTTCATCTCCGTGTAGCCATAGGGAAATGTATCCCCTTGAACTGAACTCGGTCTGTATGAGCCTATAATGGGTGAGGATTGAGAAATCTGCTGGTTCAGGTACCCTTACTTCAGAACCGAACCGCATATAGAAGACCTTAGGAGCTCACCCTAGGTAGAGCCACTTCAAACCCCTAGTGGTCACCCGAATAGACGTTTTATTTATTCTTGCTTGTTTTTGCTTTGTACTAACCTGTTTCTTTTTTGTTATGATTGCATTACATTTTCATCATAAAAAAGAGGTGTTGATTCACGTTCAGTTGTGAAATAGAGAGCTTGTCATAAGAAAATGAGTTTCTTGATAAAATGGAAGACAATATGGTTGTCCGAATATGGTCCAAGAAAACATGGTAAGAGAAGGATGACAGTTTAATGGAGGATTACACGACTATGGCTCCGTTGCCCAAGGATTCAAGATAACAAAGATTATTCGAGAGCCGCTAAACTTTCTTAAAGAGAAGCCAACGAGCATCACGAGGATGAGTGAGCAATGATTTACAGCCCGGATCAAGCAAAGAGGAGATGGAAGAGACGTACCTTTTGAAGAGTTCGTGAGATTTATCTTAACGCTCGAATGAAGAAAAGGATCGAATGTCTTCGCCTATGAGGGCAAGGCCATATAAATATCCATTTTATGCAAAGAGATTTATTTTCTAGAAAAGTTTTCTAAATGAAATTGAATCAAAATTGACGCCTTTTTGCATTCATTTCATGCATTGCATTTGCTTCATATATATTAAAAAAATACTAAAAAATTCTATTTAATTTAAGTCATTCCTCAGATAATCTAGAAACCAACCAACCTACCAAACACCGCTACGGTACTCGATCGAAAACTAAAGACATGGAACAAAGGCTAGAACAGTTCCAAAAGGAAATGCAAGATCAGCTTCAACAACAAATGAATGAGCAGCTTGAGAAGATTCAACAAAAAAGATGGACAAAATGATGGAATCTCAAGGGAATATGATGGTTAAGTTGACTCAGTTGCTGACTGGAGGAATTGATAAAGGAAAAAGCTCTGTGCTTAATGTTGAAGAAGGAGACAGTGAGGGACCTGTTTATCCCCTAGGCTTTACCCCTCAGCATGTTGAGGTATATCCACGCAAATCTTCTGTCACCATCAAGCCCCAGCAGTTTCAGGCCGGTGCTGTAACACCAATGAATTTTCAAGCAGGATCAGGCTCTAACCCCGGAGACAACATTGTTAATCCTGCTATCCCTAACTTCGACGAAACAGCTAAAAAAGAGAAAATGAAGGATGA
ATTGCCAAAACAGCTAGAAAAAAAGTACAAATGGCTGGAAGAGAAATTTAAAGCGATGGAATGTGTTGAGAGCTACTATGGGATTGATGCTAAAGAATTAAGCTTGGTTCCAGATTTAGTACTCCCTTACAAGTTCAAAGTGCCAGAGTTTGAGAAGTATAATGGAACTAGTAGTCCTGAAGCCCATATTACTACGTTTTGTAGGCGGATGACTGGGTATGTTAGTAATGACCAGTTGCTGATACATTGTTTCCAGGATAGCCTCACAGGGGCAGCGTCCAAGTAATACAGTCGACTAAGTCATGCCAAGATTAATTCATAGAAAGATTTAACATAGGCATTCATAAAGCAGTACAATCATGTAACTGACATGGTACCAGATAGAATCACTCTACAAAACATGGAAAAGAATCCCGGTGAAAGTTTTAGGCAATACGCATAGAGGTGTAGGGAGGTCGCCGTCCAAGTTCAGCCACCGCTCTTGGAAAGGGAAATGACAATGCTATTCATAAATACATTGAAAGCTTCGTTCATCACACATATGTTAGGGAGTGCCACAAAAAGATTTTCTGACATAATCATGAATGATGAAATGATTGAAAGCGCCATAAGGAGAAGAAAGATTGATGCTGGAAGGCAAGCCTCAAAAGAAAAAGAAAATGAGGTGAACAACGTGAATACATACAGCAAATCGATTGCTAATCAGTAGGGTTCATCAAGACAAGAATCATGTGTGAAGCAAGATACTGAAAAACTCCAGTTCACGCCAATTCCAATGTCGTACAAGGAGTTGTATCAAAGTTTATTCGATGCGCATGTTATTTCTCCTTTATATGTGAAGCCTCCATAGCCTCCGTATCCCAAATGGTACGACGCAAGTGCACAATGCGATTATCATGCTGGAATTACGGGACACTCAATAGAGTTTTTTTAAAAAACTCTAACGATTATCATGCGGTTTTGCCTATTGAAGATAAAATTCTTTCTAAGTTTTTGAATCCAATTCTGATTGAAAAGAAATGTTCAAAGTTGTCCATCATGGTCAAATGTGTCAAAAGCAAATGATGCAAGTTCACAAAAAAGGTCCGTCCTAAAGAATTCCTTGAGAGAGACCTGGTATTGAAGAAGATCCTTCCCATACAAAAAGAACTTCATCCCAAGCTGGGAAGGACCTTATGTGAAAGACCTTATTTGGAAAAGCGTCAATTTTGATCAAAAAGAATAACAATGACATGCATAATCCTATGATTTCAGATTCAATCAAAAATATTTCAAAATATAAAAAAAAGCAAAAAAAAAGGAAGAAAAGAAGAAAGAAAATGGAGAGCCAAGGTGAAAACCCGCAAAGGGCGCCTTGAGACCAAAGGGGATTTAAGTTGAAAACTCAAAAAGGGCGGCTCAAATATTGATCAGAATGGGGCATGAGGTGATCAGAGTAGTTCAAATTTTGATCAGATTGGGGCATATGATGATCTTGAATCAACAGGAAAGGGTAGACAACATCTTGGGACATCGACAGAGTACTGTAGATCTCCTAAACACATGTCAAACTCAGAAAGTTTGTATAGAGAAGTTCAAGCTGCGATATCTGGGGCATCCAATTTTTAAATTGAATTTGCTATTTTTGGAATACTTCATTCTTTTCCAAGATACACATTCCCAGTCAATTTCTTTGTTATCCTTATTTTTTGATAATCTATTCCTTTCGAGCTATGCTCAGAACCAATTGTATTCTCATCCATTGTTATACCCTTTTTGCAAGCATGTTGCATTGGAATAATGATTAATGGACTAATAAAACTTTCACAAGGGAAGTTTGGCATATTACTCTAGAAGTTTCTAAATAATACAGGAACCTGAAACAAGACTATTGTTTAGAACGCACCATGTTTAAATGTTGGAAATCTGAAAAGGAAGAGTCTAAATTAGGACTTTCTCTTTGGATTTTGTTGTTAAAAACATTGATTGAACAAAATGACAAAGCTAAAATAAACAAGTAA
GCAATGATCACCGAACAGTAGGAAGAGGTTTTCTTGGAGAAGAAAGCCTTCATTTATGATTGAGCCTTTTGTACGATACCTTGGGAATGGTGTAAGGGACCAAAGAGATTTAGATCCTGTATCATTGAATTGTGATAAGAGAGGATCGAGAAAAAGCCATATATTCCTACCTTTGGGTTACAGTGGGAGAATGATGGTACAAATTTTGCGCCCCAATGGATTGAACTTTGAGGTTTATAGTGGGGGGCAACCTGACTAAATGTTTCTTCAAAAAAGCTAGCCAAGCAAGAAGGTGTCGTAGCACATCAGTGTTAAAGCCTTAATAAACTTCGAGCAATGACAACCTAAGTGGGATCATTCTCGGAAAAAAAATTATTAAAAAAATTATGCATTCGTGCAAACACCATTAAAAAATGTCTAGTTAGGAGCATTTGATTCATTTTATGCCATCCTAATCATTAGGCAAAATTAGGTTCATTAGACATGTCATGTTCCCCAGAGAGCAGATCAGTGAAGATAACAGATCTTGCCTTCCTACACTGACAGCAAAGCAGATTGAAGACACCAGCCTTGTCTCCCTGGGTTGTAGCGGAGCAGGTTAAAAATAGCAGATCTTGCCTTCCTGCACCGACAGCGAAGCAGATCGAAGACACCAGCCTTGCCTCCCTGGGTTGCAGCGAAGCAGGTTAAAAATAGCAGATCTTGCCTTCCTGCACGGACAGTGAAGCAGATCGAAGACACCAGTCTTGCCTCCCTGGGTTGTAGCGGAGCAGGTTAAAAATAGCAGATCTTGCCTTCTTGCACCGACAGCAAAGCAGATCGAAGACACCAACCTTGCCTCCCCGGGTTGTAGCGGAGCAGGTTAAAAATAGCAGATCTTGCCTTCCTGCACCGACAGCGAAGCAGATCGAAGACACCAGCCTTGCCTCCCTGGGTTGTAGCGGAGCAGGTTAAAAATAGTAAATCTTGCCTTCCTGCACCGACAGCGAAGCAGATCAATAACCCCAGCCCTATCTCCCTGGACAGCAGTGGAATAGGTTGAAGATTGTAAGTCCTATCTCCCTGGTTAGTAGTGGAATAGGTTGAAGATTGTGAATCCTATCTCCCTGAGCAACAGTGGAGTAGGATGAAAATAGCAGATCTTGCCTTCTTGTACTGGTAGTGAAGCAGATCGAAGACATTAGTCTTATCGCCTTGACGTTGCAATGGAAAAGATTGAAGCCACAAGGCAAATCTTATTTCCCTGGCGTTGTAGCGGAGCAGATTGAAGCTACGACGGTGAATCTTATCTCCTGAGCATTAAGGCTTGGATTATCTGAAGTGGAGCGGATTGAAGCTGTGTGCAGTGAATCCTATATCTTTGGCATTACAGTGGAGCAGATTGAAACCACGACGGTGAATCTTACTCCCCTGACGGTGTAGTGGAACAGATTGAAGCTACGACGGTGAATCTTGTTTCCCCAACATTGCAATTTAAAAGACTGAAGATGGCGAATCTTATCTCCCTGAAGTTGTAGTGGAGCAGATTAAAGCCAATAATCCTATCTCCCTGAAGTCACAGTGGAGCGGATTAAAATCACAAATCTTATCTCCTTGAAGTTGCAGTGGAGCAGACCCAAGAAAGCGAGTCTTATCTCCCTGAAGTTGCAGTGGAGCAGACTCAAGAAATCAAGTCTTATCCCTCTGAAATTGCAGTGGGGCAGACTAAATAAACAAATCCCATCTCTCTAAAGTTGTAGTAGAGTGGATTAGAATCTCTCTGAAATTACAGTAGAGCAGATCGCATCAAGTTCATCTTTAAAGTTGCAGCAGATCAAGTTGAAGCTATAAGTCTTATCTCCCTGGAGTTGCAGTGGAGCAGATTAAAGATAGCAAATTTTGAAAAACTACAACGTGCAAATCCTATCTCCCTGGCATTGCAGTGGAGTAGGTTGAAGCACCAGTTCCTATACCTCTAAAGATGCAGTAGGAAGGAATGAGGCTATTTGAAGAAGAAGAAG
AAGAGTGCTAAAGTCTAGTACGACCAGCAAAATTGGTCATTTCTAAAGTCTTTGCTCCGTTCTTGTTACATGATAATGAGAAAAGAGGGGCAGCTGTAATAGACCAATTTAGCCCGGGCTCATAAAAAAATAATAAACCCAAAATAATAAAACAAAGTCCAAAATTATATCATTTGGCCCGATCGGGATGGCCCATTACTTGAAAAGGTTGAAGGTCTATCTACAAGCTTGATGCATATGGAAACATAATCTTCAATGATATGCAATCTTCGATATGATATGTAATCTTAGATATGATATGCAATCTTAGATATGATATGTAATCTTAGATATGATATGCAATCTTAGAAGATATGATTTTGTAATCTTAGAGATTTAATTTGTAGATACCTTTTAATCTTAGCCGTTGATGTAATTAATCTATACCGTTGGATTTGGGGAGGCTCAGCTATAAATAGATGTCTCTCCCTTCATTGTAAAGGGGGGAAGTGGGGAGTAATAATAATTCTTAAGAGTATTTACTCAAATTTCTCTTTCTCTTGCGTTCTTATTTTGTTGATTTGTGTATAATTTATTTATTGATTTGTATATTGTTGATTTCAAATCTCTTTTTCCCTTATTATTCATTTTCAAATTCATTATTTTCAAATTTGTTTACATTTTATTTGGCCTTATATATTTTTTATTTTATACTCTTTGTTTTAAATTCATTGGTCTTTGATTATTGATGCTATTTAATCCTCTATTTGTTATTTTAGTTTTTTTATTATTAAATTAATTATTTTAATATTATTAATACAATTATGTGCCATCATTAATCTTGTATCATTATTATTATTATTATTATTATTATTTTATATTCATGCGCATGCATCGTTTTTATGTAATATATATATTGTTTTATATATATTATACGTATGCTTATATATATTTTATACATATGTTTTTGTTTTTGTTTTTATTTTACTTCCTAACTTTTATATACATATATATACTTTTATATTTAGTATCAATTTTTTTTTTACTTTTGTATATATGTACATGTGTGTATTTATATATTTTTTGGACTAATTCATTTTTGAGGAATTAGAATGTCGTGCCCTAACGCATTGGGTGTGACATTTTCTTTCTCCGAAATGATAAGAGTCTCAATAAGTAACGTTTTTTTAAGTTTTTATTAAGGATCATATTTTTAAATTTTCGACATTAAGGTACTAATTAATTAACTAGGTACCAATTTTGGGCATTATGAGGGTGCTAATCCTTCCTCGTACGTAACTTACTCCCAGATCCATTTTTCTAAAACTCGTAGACCAAAGCTATTTTTTAGGTGATCCAATCACACCTCAATAAAAGATTGGTGGCGACTCCCAATTTTTGTTTTTTAAAGTCGACAACTAATTTTTGTTTTTTTCCAAAATAAAAGTTGGTTTCGACAATTGGTATGGCCTATCTGCGAACACCTTAACTTCGAATCGGTCTAGACTGTGAGGTCGAGAGATAAGTAGCTCTTTCCAACTCATTATTCTAGTGGAAGATCAGAAGATCCTACAAGGGTATCGACTAGTTGATTGAACAAGAAGCCCAAAGAGACAATTGATTATGATTAGTGAAGCGAGCTAATCACCCATGCTTAGATTTGATAAATTCTACTATTTGATTTCCTGCTATTTATTTATTTATGTTCTTTTATTATTATAAAAAAATCCCAAAAACCTTTCTTTATATTTTGATGTAATATAATCTATCTAAAGTATTAATTAGACATATTTGTGCTTAGGTTAGAGTTAACTTGCCTCCCTTGGGTATGATCCTCAGAGTACTTACCTACTCCGTTGTAACTATATTACAACCTGACCCGTATACTTGCGGTTACATCCTTTTTAAAATATTTTGTGCAGAATTTTTACTCTGGACGTTGGTACGTCTGGAGGCGGTCAATATCTTCTTCATTCGACAAAAATAAGGAACATAAAAGAAATAAGCTTGTATGTTACTCA
ACACCATTTTCGTGAGATAATCCAAAGGTTAATGAGCTTCTTCATTGAAATTTTTATTAGATTTCTACCCTATTATGATAGATGAAAATGACCCACTTGATAAATTAGAAATTGTCAAATTTTAGCTTAGTAACCATTAATGAAAGTTTGAATGCTAGTGACATAATGGTTGAACTTTGAGTAGTATTATGTTTATTGTTAATTAGATGTTCCTCAATTATAGTTTCAAAGTTGTATTTAGATTCGATAGGGTAAAATATAAAATATGAGGATTTCAAATATTAGAGCTATAAGGGACCTAATTAAAAAGAATGCATAAAAAGTTTAATTTAAATTTTTATAAGTAGGAGAATTTAATAATGTCTTTATACTTGAAATATTGAAAGATGCTAAAAACGAGGTTGGAACATTGAGGGACAATGAACAAGTAAGATCAGATAACAAGCAATGATGTCAATTTGTGCTACTATAATTAGATTTCAGTAATTTATTTTATTGAATAGCTAGTCGATATAATCTAGTACGAAATAAATGTCAAGGTAACTACATCTCTACTTAAAAGCTTTGAAATGATGAATTAGATGTGTTTGTGTAAATCATGTTATAAATGATTGATTTTAGGATATGATTCTATATACTCAATTTATAAGCATTGCTATATTGATATTTGACTATGATGATATATGTTATGATAATAATTATAATAATACTTCCCCATTAAACAATGTTAGATGTAGTTTGAGTGTAGTTGGCATGCCATAGGATTATTATCAGTGATTTTATTTAGCCCCAATTCCCAGAAGATCATGAGAAGTCCCAATTCCAAAGGGTCATGCACATATATTGATATACAAATTAGTAGCTTTAATTCCTAAAGAGTCGTGAGCAGTCCCAATTCCCTGAGGGTTGTGGGCAATTCCAATTTCTAGAAGGTCATGGACTTACTTTGACATGCATATTTGAGTATTCATTCTAGTGTCTACATTCAGTTAATAGGGGCTACACTGAATAAGAAATGAAAAGTGATATTTATTGAAATGTTATATGTTTGAATAGGCATTAATGCTTAATAATGAACTATGAAATGAAATAACCTAATATTGGGAAATGAGACAGTAACTATCTTGACTTATATGTAAACATGTTCTATGTTTGATTCATTTATATATAATTGTATTAATTTCAAATTATTGGCACAACTGAATATTCAATATGTAGCGTATAGATTTGTTTGTTTTCATGCGTAGGTACAAATTAGACTTGTTGGTAGACCGTAGGACCATCAAGCGTCCAACTTTTGACAACTCAGCTCAACTTGGTTAAATCTTGTGTTAGTTTTCTATAAAGTTAGTTAATGGCATCTATTTAACAACTCAATTTTTAGTGGTACTGGAAAAGGCAATTTCGGAACCCCACTTTTATAAAACGAGTCTCTAAATATTAAATATTTATATTTATGAGGTAAACATAGAAATATATCAAAGATTGGTCAATTTATTGAATTGATAGTTAATTAAGGTACAAGGACTAAACTGTAAAAGTTTATCTCTATAGGTTTTTAATTGGCCAAAGACTTAGGGAATTAGTTTGAAATTAACCAAAGGTATCAAATGAGAATTAAACCATTTTAATTTATATGTTAGTGGAGTATGATGAGAGAATCCACTTATATAAGTTAATGGTGGATTAAGTTAATAAAATGTAATTAAACTAATTAATTAAAGTGTAATTAAACTAATTAAACATCCTAAAAGTGTAAGGAGAAACCATGTTTTAGCTTAAACAATTCTGTCCCTAATTGGTAAGCTTTTCTAAGTCCTTTTTTCTTGTAATTTTTATGTTTTTAAGGTCATGAGAGCTTGATTTAGCTAGCCCATGTACCAATTCGTAAAAATGTCAAAGTTTTTAAAAGTTTCCATTGTTTATTTCTTGAAAAAATTGGTGCCAAATTGATAGATTTTAAGCTTAGATGTGAAAAAGGACTAGAATGTAAAGTTTAA
TTGACAGTTTTGTACATAAGGACTAAAGTGTATAAATTGTATAATTGATATGAAATTTTTGTTATAATAGATAGTATAGGGGTCCTAAAAGGGTGTGATTGAGATTGATTTTGAAACTGATGCTCAAAATCGAAAGTTATTGTTATTTCAATTTTAGGGGCGAAATTGAATAAGATGTAAAAATTTAGGGGTTCAAAAAATTGAAATTTTATAGGTTCATGCATATCACGGAATGATATAAAATATTTTATATTGATGAATTGTCTAAAATAATTGTTTAGATCAAGAATTGAATCAAATTAGGGATAATCGAGGAAAAGCCACAATTATTGAATAGCCCCTGAAGATTCAACTTATTTGTTATTTTTTTCCCGGTAAGTTCATATGGTATAAATGTTTTTAAGTTGTGGTTTATTTTATTTGTGATTATATGTGTTTGGTTGCGAATTGGTATTAAGGTGAGATTTGGACTAAATTGTAAAGAAATGTATATATGTGTTAAAAATGCTCAGGTGAATGATCTATCTTAATTTGATATGTCAAAGTAGTCTTCCCAGTTATAATTAAGGAGCTTGTTTTCAAGCAAATTAGTTTTGCGTAGTTTTCAGATTTTTTTTTTATTCAATAAGTGTTTAATGTGTTTTTGTGCTCATTTTGAGACCCAAATTGGACAAATGCGCCATTTGGACCCTAATGATCGATTAAGTGTTGTAAGAACTCAATGATGGCTCATTTTTTAGCGAAAACATCACCAAGGAGGGGTTATTACGATATCAAAGCATGAAAATCATGATACCCTTAACATTCCTAAAATGAAAAGAAAAATGAAGACCACCTACAGTGGTGTTGCGATACCTAATACCCAGCCTTCAAAGGGAACTCCTCATTTAGAAATTGCCAACGATATCATGATATCTAGACCATGGGTATTGCGATATCATTGTCATGAGGGGAAAAAAGTTAACATCAGAGGTAGTCTTTGTCCAACCGAAGCACCAATCAAAAAGACATGTTGAAGGGCATTTTGGTAAAAAAAGGGTCAAAATAGTTGCTAAAAAGAACCAAAAATTGGCTAAAGAGAGTGAGAGGAGGCATTAGGCATAATTTTTAGTCATCTTCTTAGTTGCTCTCCTTTATAGTTGTAGATATAATTTTCTACTAGTTTCCTCGTGTTTCTTTGCATTCTTAACTGTAGCTTAGGTTTATTTACACGTTTAGGACCTTTAACTTTCTTGTACTGACATTTTCATCTCTAGTTTAATGTTCTTTCAATATGTTTTCTTTTTCTTTATTAAAAATCTAATATTTATTATTCTTGTTCATTTATCTTGTTCTTAGTTTCTTTTCCTTTAATTCTTTCAAATTAAAAACCCAAGCTTTCATCTTTTTATTGAGTTTTATGTTCATGCCTTTCATGGTAGCTTCTTTGATGTTAGCTTAGAAAAGATAATGGTTAACTAAACCCTATGGGGGTTGGTTAATGGAGATGTAGGTAACTTATTTTTGGGTCGAGGAATAAATTGCAATAAATTGGACTAAATTGAATGAACTTAAAAACTTAGGATTGATGCCCCTAAGGGAAAATCAAGATAAGTGAGACTGAGAGGTAACCTTATTGGGAACCGATTCATTAATTCTTGGTTAATCAGGTGAGATTGAGAGGTAAACCGAACTAATTTATCTAACTTGGTAAAATTGAGACTGAGAGGTAAAATAGATCCATTTTAGGAGTTTAAGCAATTTAGATCCCTAATTCAATGATTAATAAACCGCATTGAAGTTAACCAACCACCGCTCATTATTGATTGGATAGTTTTATCACCTTGCATGCTTTACAATTTGGTCATTTTGTTAATTATTTAGCTAATTGGTTTAATAAAACTCAAATTCATGGTCTGTCGTACTATGTTATCTAGCGAATAGTTGTTTAAACTCTTTATTTGCATGTTTGTAGCTAGAATTCACTTAATCGTCGAGTTCTGTGGGTTCAATTCTTAGAA
CACTCATGTACCCCGTTGTACAAATTATATTACAACTGACCTGTCACACTTCTAGACACCACATGTACTTATTCTTGTAATGGCCCAAATTTGCCCAGCCCAAATCAGAAGTAAATAAATAATAAATATAAAACCAAAATTAAAAGTCCAAAATAGTCCCTTTACACCAGGCTCAATGTGGCCCAAACCAAACAGACCCTAAATCCCCAATCCAAGTTACAGAAACCCAACTAGCCTAACCCCAAAACCAAGCCCAAATACCCGCAGCCCAAAATAGAGAAAATCAGCAGCAAACCCTAGAGACCAAAACCCTAAACTAAGACGCCACAGCAGCCTCGCAACGCGCTGCCTTCGGCTTTCCTCTCTACGCGCGCCACGCCACCACCTCCGTACCCCCGTACCTTCAAACAAACAAACAAAAACAGCACAACAAAAAGAAAAAGAACGATTGTATTTTATTTTCGTTTTCGGCTATAAAAGAGCCAACAAAATCTGTAAAAGGTTCCCTTTTTTTACGATCAACAGACAGAGAGAATACGCAGAGATTGTATCAAAAAAAACAAAAATAAATACAAAGGAAAAGGTTTTTTTTCATTCTCTTTTTCGATTGCTTTTCTTTTTGGCTGGTTCGTTATTAATCGCATATAAGCATATATAAGGAAAATAAGAAAGAGAAACTTACCTGGTTGGTGTCGTTAACCCCCCGTTTTGCTCTGTTGAAATCGGAGTTAGAAAAGGTGGTCGTCTCTTGGCTGCAAACGGCGGAGCGGCGCAACATTTGGGGGCTGATGTTTAGTTTTTTTTTTTAAGTTTGTTTAAGGCTAATAGTTATTGATTTAGGGTTTATTTAGTTTTGTTTTATAACCAAAGAAACGACACCATTTTAAGACTGCTTAAGTGGCTTCAAAACGACGCCGTTTAGAGGCTTGCGACCCCGCGGTGACCCGACCCGGGGAAGGATCCGCGCGTTTTGGCCTCTGTTGGGAAATTTGCGCAGATAGTCCTCCACTTTTATAGAGCTTTCAAATTGATCCTTTTATTTCTTTTAAATTTGATCGCTCATTCTGTACTACATTTCAATTAGGTGTGTGCAAGGATACTGTGTATTGAGGGAAGGGATATTTACCCTTTTAGTCCCCAAGTTGTTCGCGCGTTCCTTTGTGGTCCTTAATGTTATTTTATTTTTATTTTCTCTTTTAATTTTGGAATTAAACGCAAGTTAGCCTGTTTTTGCTTAATTTAAATGTATTCAAAATTTTATTTTATTTTAATATTCATCATTTTTAAAATATATTTAACTTTACATCTAGCATTATTTTATGTTTAAATTTAGTATATTTTAAATTTATTACAATATTATTTTAATATTATAACATATTATTGTTCTAAACATATCATTAACATTATTTTAAATTTATCATGTACAATCTTATGCATTCTTGTTGCAAATTCAATATAATTTATACATATTTTACATCTTTATTTTATAATACATTTTTAACTACACTTATATAGTTCTTTGCTTTAAGATTTATACAATAATATTCTTACTTAATATTTTTCTATACATGTATATATAATTTGTGTTAAATTATTTTTATATATATACATAATATATTATCGATTTCATATTATTACATATCCTTTCATATATTTTTATGTATAAATAACTTATTTATTTCAAACCCTATTTTATTATATGTTTTACTTATTTCAACTCTTTTATCTATTATTATGTGTAATTTATTTATATTAAGTTTTCCACTCCATCTATTACTTATTTTAAAGTGTATATCATTCTTTTCTATTTTTGAATGTTTCAAGTTTGCAAATGTATTATTCATTTTAATTCTTTATTCATATACGTATAACCTATTATTGACGATTTCAAATATTTTATTTTTTCTCATCATTTTTGTTTTTGTTAGATGATTCCCTAATTACCTTTTAATTCATTTACCTTTCTAACATAATATTAATATTGGTTTAATGTGCGGTAT
GATTGCTTTTATGCTTATTGTATAACTTATTCGCATGAATTGATTCTTTGTAACTCGTTAGTATTGATTTTAGTTTGTAAATTAGCTTTTCCCGATGTACAATGTTATTTCGTTATTCATTCAAAAGATTACAAGTGTCAAAGTTATTTCATTCAAAAACTTTCAAAAATACTCGAAGTTTGGAATCCTCGAGAGAATTGAGCCCTAACGTATTGGGTTTCAATTTTCCTCGTCAAATCTAAATAATCGAAATTTTTTCAAACATACAAATTTCAAATAAAAACCCATTTTCGGGAATTCGACATGTTGTGTCCTAACGCATTGGATATGACGTGTTATTTCCTCGAGATGAGAATTTTTAAAATAATAATAAAGGTAATATTCAATATTTAGGAATTTAGTGAAATCGAGCCCTAACTTACTGGGTTTCAATTTTCTCATTTGACCTAAATGATCAAATATCCTTCTCAAAAATGCATAGGTTTTAAAAGTTAAAAGATAAACTTAATTTTGAAGATTAAAAATGTTGCACCCTAACTCACTGGGTGTGACATTTTATTTCTTTGAAATAAGAGTGTTTTATCATTCAATTTATTCAGGTTAAAAGAATCGTACTTTAAAATCTTTTCAAAATTTCGACACTAAGACATAAAATGATCAATTCGGTACCAATTTTGGGCGTTACGAGGGTACTAACCCTTCCTCGTGCGTAACCGACTCCTGAACCTATTTTCTCAAATCTCGCAGACCTAAAATTTATTTTAATGGTGAACCGGTCACACCTTAATAAAAGATCGGTGGCGACTCTCATTTTCATTTTTAACTCGATAACTAAAATATTTTGTTTTTCAAAAATGGTTTCGACAATTCTGATTTGATTGTTGTATTAGTTGTTAGCACCGTTGTCGGGGAGCTAGTGCTAGATTGAGTGACTATAGCTTTATTGCAAGATTTATAGGGAGATAGTTGACTAAAGCTTTATTTATAGATATGAATTTTTATTTTGTTTCTTTGCTTGTTATTTTGTTCAAAAAATTTATTGATTGTGTGAATCTCTTTTGCTTGTAGGAGGTAGTTTATGACTCAGACTAGTAATAAGATTGTACTATTTGAACCGAAATTGAAAAGAATCTTGACACATAGTCAACAAGAACAACTTTTGAGAAGAGCCCAACCTCCACCATTTGACAACCCAAGAGTTGAGGAACATCCACCACCAATTCATCAAAGACCGATGGCGGAAAGGACAATGAGAGACTACACCATGCGTAATCTTTACGCTGTGGAAGGAAGCATTAACCGCCAAGCGATTAATTGGGGAGGTCACAATGAACACAATCAATGTGAAGTTCAACTACTTATGAAATAAGGGGTACCTACAATCAATGGGGTCCTTACAATCAAGAAGTACCCAACTTCAACCCACCTAGGCCTAATGCACCATAACAAGCTCCGTAGCCATTTAGGGTAGCCCAAGAAACTATGAGAAAATTCGCCTAGAATAGCAACCCTCTAATACCCATTCATGTGAGTAAACTAGAGGAAGGCTTGCATTCGATGCAAGCAGAAGTGTGCCTAATGCAAGGTCAATTGCGCCAAATTTTTCATATGCTACAAAGTAGTGCTTCCTTTAGCATATCAAGAAATATTGAACCAAACCCGAAGAGGGAAGGGAAAGAACATGCTACGACCATTACCCTTAGATTTTGAGTGGTGGTTAAAACCCTATTAGACTGGTGAATGGAGAAGAGGTAGTAGAGAAGGAAGAGAACACCTACACTCCTAGTGGTGGACATAGGGTAGGAGAGAGAGTAGAAGCAGAAGTTGATCCCAAACAACCCAAACCTCAGGATAGGCCCATTGCACCCTCAAGTCAAGTACCCGTACCTTTTTTGACCCGTCTTGAGGAAAAAAAAAGAAAAAGAAGAGTAAGGAATTTCCAATTTTCATTTACATGTTTAAGGCGTTGAGTGTTAATCTCCTGTTATTAAAGCTCTTAG
AAAAATTTTGAAATATGTTAAGTTTCTAAGGGAAGTTATGTTCCAGAGGAAGAAGATTGGGAGAGGAAAACATATTGCTCTTAACGCTAAGTGTTGTGTGATTGTGCCCATAAAATTTCCCCTAAAACTCAATGACCCGGGCAGCTTCAGAATCCCTATAGAAATAGGAGTGAATTACGAGAAAGCCCTTTGTGATTTAGGGGCTAGTATCAACCTCGTGTCATTATCAATTTATTAGAGGTTAGTATTAGGGAACTTTAGGGAGACCTCAATGACTTTGCAACTTTTCAATTGCCCTTTTTTTCCTTCCTAAGGGAGTCTTTGAGGACGTATTAGTTAGATTTAGGCAATTCATCCCATCAGTGGACTTTATTGTGTTAGACTTTGAGGAAGACCTAAAAATCCCTATCCTACTAGGAATGCCATCTTTGGTAGCCTCTATGGCAACTATAGATGTCAAAAAAGGGGAGTTGACGATAGACAGAGATGGGGAGGTCAAAATCTTTAAGTGTGTTGACCCCAACCTTAGTTCTAATGAGTCATCACTCTCTCAAGGGTATGAGTGTTAAGCAGTTGAGATAATATCCTATCATGCCACTGATCTTGCAACTATTATGAAATGATGTGAACTTAAAGTTTTTAGCTCAATGTGAAAAAAAAAGATCCAAAAACGAAAGAAATTTAGTAAGCCATGGCGATCCTAAAGTAGCCTCAGTCAGGTGATGAACAAGATGTGAATTAAAGTATCGAGCACACCACATTAGTACCACTTCGGGGGCATAACTGATCACCTTGAAGCTAATTTGTAATTTTTCTAGAAGGTAATTCAAATTAAGTTTGTAAATATTTGAATGATCCGAGCACGGAGTCCGTTTGTTTTCCTTGTTTAGTTTAGGTTTAAATTTGAGCATGTTTAATTTTTGCACTTGGTAGGGTAGATTTTGGATAATTGGGAGATTAGATGATAATTTTGTATGTTTTTTGGGCACCCTTCTAGTCGTATTGCGATATCCAAGAGGGAATATCACGATAACCTTAACAGTCTAGGGGGATGCTCAAAATTTTCTAGATATTGCAATACTGGTCCCTTGGTATCGCAATATCCCTAGCTATTTCAAAAATAAAAAAATTGTCAAAGTTATAATGGTATTGTGATACCAGTATCTCGGTATCTCGGTATCGTAGTAGTTTCAAAATAAAGGGTACAAAGTGAAAGGGGTATCACGATACCCACCTTCAGTATCGCAATATCTATGTTAGGTCGTGATCCCCAAGGTTTGGAGGCTTTTTAAGCCTCCAAACACCCTAACACCCAGATCTCTTTCATTCTTATGCCCTATTCGTTTTCAAAACACTCCCATCTTCATCTTCTCCTCTATTTTCCTTTTTAACCTTCATTTACTTTTCTCACAAATTTGCCTATTTAGTATTATTTCTTCTTCTTTTCATTCTTATTTGTAGGTTTTCCTTCTCCTTGCCTTGGAACAATAGTACTACATCCCCTCCAACCGCTTTGCCATTGCCATCAATACATTTTTATCGTGTCAAATTCCTTTTCCCTTTGTTTTCTTTGAAATTTTTATTTTTTTAGTGTTGCACTATTGATTTGTCTATTGGTTAGTTTATTATTTGTTAAAAAGCTTGATTAAATTGTGAGGTTAGTAAAATGTCGCCTAGACAAACTAAACGAACTAGGTCTCAATCGAACCCTCTTCTACCATCGGCGGTGGTTCTAGAGTGATTTACAAATAAAGAGGTTGAAAATTATTTTATGTCAATCCAAGGCGAAACATTTATTCTTGAGCATGGTTCCGACCCAATTGCTTCTCTTTGTAATGAGATTTGGGACTTTGTCTATTACCATGGATGGTTCAATATTTTTCTAGTCCCAAAATCGACTGTGGTTATCCCCACTGTTCTTGAGTTTTATGAAAATTTAAAAGTTTATGTTGAAGCTGCGTACTGGTTCAGGGAATAGAGATTGACATTTCCCTAAGTGC
TATTAGCGAGCACTATGGTGTTCCATGGTATCAACAAGATGACATTGAACAAATGGATTTAAAATTTTATAAAATGTCGACATAGACCTCATTCTCGCCTACCTAATGTAAGGTCAAAGGGAATAGAAATGGGAATAGTACAAAAACCTTCCTCTATCTTTTAATCAAGTAATAATATTTTCCTTAGGAAAAATATAGATTCAATTTATCTCGACCCGTGTTAGTCTCATGCTCAACACTAACACAGTTAACAATTTTGTAGCAGTTTTTTTTTCAATTTTGTAATGGAAGCGAGTTTGTCTTGGGATGTGGATAAATCATTAGATGAAGAAGTGTCTTAGGGAGCAAAGTTGGCATGTACTTCCCTCATCTGATTATGGACTTATGTCATAAGAAGAGGGTAAAAATGAACCTGACTGAGTAGTTTCACCGCCCCACTTAGGGTATTATAGGCAATACCATGATACTTTAGCTTCACAAGTTGGAGTGGTAGAAAATTTAGGAGTGGAATCAAAGGCGCAAGCACAAGATGGAAATGCCTACGACCCTAAAGAAGAAAACCACAACAAAGAAGGTGTACGAAGGTACATAGTGGCAACGTAAGTTGTTTGATAAGGTTCGCTACAACACTCGACTACTCGAGGCGATAAAACCATTTATAAAAATATTTTTGATGAGCCAAGGGATAGAGGGCCCACAGTGGCCCGAACGATTGACCAACGCATCCTTTAGTGGCGAGGAGGAACAAGAAGAAAGAGAGAAATTGGAAGAGGAAGCAGATGAGGATGATAAAGAGATAGAAGATGATGACCCCGCACTGTATATTGATGATTTTGACGCGATTTTCGCTCCCGAGTGACCTACCACGACCAAGTTAATCTTCAAAGGCCTGAGACCACCGAGGCATCAGGGCTACTAAAGGTTGGCCAACAAGGGAAAATGGAAGGAGATAGTTAGACCGGAGTCGGGCTCTCATGATGATTAGTTACATGTTTTCACATTCTTTTCTTTT\n>URS0000BE9894 tRNA from 1 species \nGGCTCCATAGTATAGTGGTAGCACATCTGCTTTACATGCAGAAGGTCCTGGATTCGTGCCCCAGATGAAGCCA\n>URS0000C75118 pre_miRNA from 1 species \nGAGATACTCCCTCCGTCCCAAAATTCTTGTCTTAGATTTGTCTAAATACGGATGTATCTAACGTAACTAGATACATCCATATCTAGACAAATCTAAGACAAGAATTTTGGGACGGAGGGAGTATATG\n>URS000029BCEB rRNA from 1 species \nGACGAACGCTGGCGGCGCGCCTAACACATGCAAGTCGAACGGGGAAGTTAGCAATAACTTCTTAGTGGCGAACGGGTGAGTAACGCGTGGACAACCAACCTTCTGGTGGGGGACAACACTTCGAAAGGAGTGCTAATACCGCATGAGCTCTATAGGCCGCATGGTCTGCAGAGGAAAGGAGCTTCGGCTCCGCGAGAAGACGGGTCCGCGTCTGATTAGCTAGTTGGAGGGGTAACGGCCCACCAAGGCAACGATCAGTAGCCGGTCTGAGAGGATGAACGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTCGAGAATAGTCTACAATGGCCGGAAGGCTGATAGTGCGACGCCGCGTGTGGGAAGAAGGCCTTCGGGTCGTAAACCTCTGTCATGGGGGACGAAGGAAGTGACGGTACCCCAAGAGGAAGCCCCTGCTAACTACGTG\n>URS0000023D8D tRNA from 1 species \nACATTTTTAGTATAATAGTACATTTGACTTCCAATCAAAAGGTCCTTTCCAAGGAAAATGTA\n>URS00018C1C85 rRNA from 1 species 
\nTACGTGAGGGTGCGAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTCTGTCGCGTCGGGAGTGAAAACTCAGGGCTTAACCCTGAGCTGCTTCCGATACGGGCAGACTAGAGGTATGCAGGGGAGAACGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGTTCTCTGGGCATTACCTGACGCTGAGGAGCGAAAGTGTGGGGAGCGAACAGG\n>URS00017FF56C rRNA from 1 species \nTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGCGAGGAGGAAGGTGGTGAACTTAATACGTTCATCAATTGACGTTACTCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTTGAAACTGGCAAGCTAGAGTCTCGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACGAAGACCGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAAACGATGTCGATTTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAATCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGTC\n>URS0000142B05 siRNA from 1 species \nGTCAAATAACCTATCGAAAGTGT\n>URS0001228231 rRNA from 1 species \nTACGTAGGGGGCTAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCAGGTAGGTCTGCTGTGAAAACTCGAGGCTTAACCTCGAGATGTCGGCGGAAACCATCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAGGCGGCTCTCTGGGACGATACTGACGCTGAGACGCGAAAGCGTGGGGAGCGAACAGG\n>URS0002355A6F lncRNA from 1 species 
\nAAGAACTGTACGCCACTCAACTCTCACAGCTACAAGAAATGGGTTTCTTTGATACCCGAGAGAATATACAGGCGCTGATAGCCACTGCAGGGAATGTTCATGCTGCGGTGGAGCGGCTATTGGGGAACCTTGGTCAGTAGATAATAATCATTTGTTATTGTCCTATTCGTCGCAACATTTATTGTCAGTCGGGCCCGATGAAATTGGTTTGGACCGGACTAAAGAGGATTTTTCAAAACCTATCTTGGCTATGAATTAAAAATACAGATTCGATGTTTTGAAGTTCTTGGCATAAGGTATGATCATGGGAATACCCTCTTCTATTCCCCACCCCAATAGTAAAGCGAGTGATATGTACATACACTATTATGATTGTCTCTCGTAATTTTTTTTATTTGTAATACAAATTTTTCTATTTTTTTTTGGGTGGGTGGGTAATTTACTTTTTCTTTACCCTACGCTGGGTGGGTGAATTCTTATAATTATACTTGATCTGATGTACTGTTTCGTTTTTCTGCACTTTGTTATCTAGATGCAAGTTTCCGATTGCGGAAATGGAGGTGGAATAACTGGGGATCGATATAGTTTTTCTGCCGAATGCGATGTGGTTATTTTCATAGGCAATTGTTATATTATGATGTGTTTTAAAATTAGTGATTATGGTTGGTTGGTTTTTTATTTCTCCTTTTGAATCCCATGGCAACCAGATGGCATTGGAACCCGAAGGGTAGATTAAAATCCATTTTCATAGATAACCAAGCAAATAATAATAAAAAGGGAGCTGCTAATGCCTCGTTGAGAAGTTATGGAGCCATGCACAAGTAGTCAATTTGACATATTTACCCTCGAATCATTTTCAGTCAACTCTCTCTGCAAATTACGTTCCTTTATCCTCCATCAGTTTCCTCTCTCTCCCCAAAACCAGATCACTCTTCCTCAGTTGTTATAAAATTCTCCTTTAAAATATTGTAAACTCGCTAAAGAAATTGAACAATCTTACAAATATCATTTACACTAGGCAAGGCAAATGAGAATCTGACTTTTGACACCCTCCCTGTGATGATGGAATCAACCAGATCCAACACCACCCATCAAAAACCTAACATGATCCCGTCCACAGAGTTAAATTACGCTGCGGATTGTACATCTTTATAGACTTGATGATCATCGGCCTTCACCTGATCAGCCCTTGGTTTCCGGGCTGCCTCTTAGGGTAAGCCAACGGTTTCTTTCATGGTTTTCTAATCCAACCAACAAGATGAAGAGAGTCGCTCCATTTAGAACCATCCTCCATTTCAGAGGATTGAATTTTCATCCTACAGACGTGACGGATGAAAGAAAAAAATAGAAAATCCTTCATTTCACGATTCACTTTTTTAAATTTTCTAAATTGCTCTCTTCAACTCTTTGATTTTAAATTTGAACACCAATTTTATTCTTCTTATTTTTTATTGCTTTCTGATAAACTACATATAACTTTTAACATAGACATTTAAGTTTTATAAAATTAACATGGTTGAATATACATGGACTATACCTTTAAAATGATACCCATATTCAATATATTCTCTAACAATTTGAAAATTGGTTGGACATATAAAATTTCTTAGAAAAACAATGGAGGAAAATTTTTAGAAATGGAAGTAGAGATTTGTGGTTGGAGTTGAATAAAAAAGAATATTTTGATCTTCTAAATTGGGTTGGAGATGCTCTTAGATGGTGTTTGGTGATGCTTATTAGCAATAACTTATTCTTTTTTCTGTTTTAAAAGTTGTATCAGAGTACTTATCACAATTTTTATTTATATTTACGAGCTAAAAATAACTTAAAAATTGATTTTTGCAAAGCTACATTATTATTGTGATACTTTTTTACTTCTATTTTTGAATAATTACTTTTAATATAATTTCAGGTACAACAAACACTCTTAATTTAAATTAGACCAATAAGCCCCATCTAATGAGAAGAAAAAAATTAAAGTACAAAGAATAATGCGCA
TGATAATAAAAACTTGCAGGAAATAACTTGTTATTATAGAGGACTCATTTGTCTTTTTACATATCGTCACAATATTTTACAAAAAGGCGCTTGAGTATAGCCGTTAGTTCTCGCCTCCACCATCCGGTCCCAGTTGCGATTCCCTACCCACTCACCACCCAAAACTCGATGCACCGGATCACCAACAGCCTCAATCATCACGAACCGTACATTTTCATTATAAAAACAAAAAAACGGACGATCCAAAATCAAGGGACGCAACCTTTTGAAATGAGTTAGATACATTGGGAGTAGGTGAATATAACGGCCAATTCAAAAGTTTCCCACCAAAACTATATATATAACCACCTTCCTATTCCTTCCGCATCCAAATCTCTCTCTCCACAATGACTAACCCCAATGATTCCCCAAACCAATCCCCCACCAACAAAGCCCCGAAGCCTCTCTTCGCCTGATAGGGACCCTTTGGCAACACTCCTCCTCCCCTGAGTCCTATCGAAGTCAGTCTCTCCCGGTAACCTCTTCAAGGCTTCAAAACTCATACTACCACCGTGATTGGCGGCGGAGGCGGTAGGGGCGGAACCAAAATTTATGTTCAGTGGGGTCAAAAGAGTCAGAATTTATATTAGTGGTGTCAAAATTATAAAATTTATAAAATTTAGGACAAATTACTAATTTTTATGAAATCAATATGTATTTATGATAAATTATATTATAAAAAATAGCGTGCTTTTTTTCTGACCTCAATGCCCCTATGTAGCTCCGCCACTAGGGGAGGTGATGCCACCATTGGAGAGTCTTCTTCTGGTGGTGGCGGCGGTGGTGAGACTATACTGGTGTTTGCAAGTTTAGCCCTACTAGCAATTGGTGGTAGTGGGGATAGTGTGGCGGCCGCTGCTGGTGGAGGCAGCAGCATTGTTCGTAGGAAGAGACCCCAAGACTGAGTGCTGCCGCTGGAAGGCCAGCCATTGCAATGCCCAGTGTGCGGAAGGTGTTTTCCTTCTAATCGTAGCTTAAGTGGGCATATGAAGATACACCCCGACCGTGGCTGGCGGGGGATCCATCCACATCCAGTTTTTAGCCGCAACGAGTTTGGTGACATTCTCGGACAGGCGGAGGAGGAAATGGCGGCAGCGATGGTTGTGAATGAGGCCGAGACTGGTGGTGACAAGGAGGAAGAGGAGGTGGTGGTTGCAGCGGTGGCGGAGGGGAGAGAGGAAGTAGCGGCGGAGAAGGGCAGGGATGGAGTTGATCTGAAGGAAGAGCCACCGCGAAAACTGCTGGACTTGAACAGGCCTCCTTCACCGGATGAGTAATATTGGTTTTCTTAATTATTATTGGGTTGTTTCTCTATTTATTAATTACAAAGTTTTTCTTGTTTTTGAATGATGGTTTGGTGAATGGATGTTGTTATGAGGTTGTTTTTTCTAAGTATTAATTACACAGAGTTTATGTCTGTTAAACATGGATTATTCTATGGAGGATTTTAAATTTGGGAGATTAATATTGAGTTCTCTGTATTTTTTGATGAATAATTACATTATTCAATTCTATTTAAGTCCCATGCTTAATTGAACACAGGGAGAGAGAGAGAGAGAGTCTGATTATTAATGATCAACTGTTATGATTATTAATAATTACACTTTCCTCTTTTTATTTGTATTTATCATGATGAATTTACTCAAAATATTACTATTTAAATAAAAGTAAATATTTTAATAAAATTATTCTACTAAAACAAAAAAAATGGGTGCAATTACAGAAAAAGTGAGTGTAAAAATAGCATTTTTAAAAATAACTTAACCGAGTGATTTTCAAACTTTTTTTCAACACTCGTAAGTTTTCTAATTAAAAATAATAAAAAAAGTTATAAGGGAGATAAACGATCCAATCTTTTAACAAACTAAACTTTAATATTTTTTTAAAGTTTGTTAATATTTCAAACAAGCTTGAATACTCTACCATTCATTTCCATAAGTTGTTTAAAAAATTTAAATTAC
TAAAGGTCAGCAGCACGCTTGAGACCAATATAAGCTCGATTATAATTTTAAAACCTCGTTAATATTTTAAACCAAAATTAAACATTTCGTTAATCAATTCTACTGATTTCCCATGCTTGTTTACTGTGCAAACAAATCCTTAGGTCATGAATCATTGTTTAAATTACAATGAGAATCCTTGTTTCAAAAATCAGGGCGAGCAGTTGCTTTAGTCGGCTATCAACCGTTAGATCCTCAAATGAAAACCCTAGATTTTTGTTGCCTATATAATCACTTCGGGAGAGAAGAAAAAAAGAAAATAGGGTTTTTGTTGTAGAGAGATAAAGAAAGAGAGCGAGCGATAGAGAGCGTCCCGAGACAGAGTTTGTGTGCTACAAAGAGAGTTGCGGTTGAGAGAATTGATTTGATCACTGATTCCGTTAATGCAGTGAGTATTGAGTAATTGCTTCTTGTTTTGAATTTAGATCATCAGGTTTGTTGTTTGATTCTTGTGGTTTTACTTTTTTTTTCTTATTTCATATCATCATCTGTTCTTGGATCTTCGATTCTGTCTTCGTAATTAGGTATTTTGAGACTGATATAGATTTTTATTGCAGTTTTAGTGAAGATATTTGCGTTTGTGTAAGTTCTCCTTGTTTTGATTTCAATTATCAGGTTTGTCTGTCGATTGATTCTTGTGGTTTAGCGTTTTTTTCCTTTTAATATGATCTCCAATTATTTCATATCATCATCTGTTATTGGATCTTTGATTCTGTTTTAATAATTAGATGTTTTGTCTTTTTTTTTTGAGACTGATTTAGATTTCTATTGCATTTGCAGTGAAGATTTTTTTGCGTTTGTGTAAGTTCTCCTTCTTTCATACTTCGATCATCAGTTTGTCCATTTGTCCTTAGATTCTTGGGGTTTTACTTTTTTTTTCTTTGAATTTGATCTCCAATTATTTCATATCATCATCTGTAGATGGTTGTTACCTATAAATAATGCGATTAATTCCTCCATATCACGTCTAGTAGCGATTTGTCTCCCTTCTCTCTCCTTCTCTCTTTGTGTTCTGCGATTATCAATCCAAAACCCTCGCAAGCAATGCAATTCGTGGAATCATTCAATCTACGAGGAGAGACACACGTGAGGGATTGTTAATCTTCTCGATCTTTCTCTGATCTGCTAGCGATTGCCTAATTTGTTATGTAATTTATTTAATTTTTTATGTACATCCATTTATGTAATTGCTTCAAGGATCTTCCTTCTTGTATCAGTACATGCCGATTTGATTCTTCCTGTTCTAATGAATTTCTATGAAGATGTTGTTTTCACTTGCATCAATTAAACTCCAAATATTGCAGGCGTTGAAAAATATCAAAGTGGCTGCACTTTTTGATTGGATAGTCACAATACGAATCTTGGATCTCCTTGAAGTTCTGTCACAATCAGTAGCTCTCTCTCCCCTCTCCTCCTCCTCTTCTTCTTCTTATGATGATGATGAGTTTTCTATGAATATATCATTTTTTTCTTATGCCCATTAAACTCAAATATTGCAGGTGTTGAAAGAAGTTGAAAGTGTTTACTATTCTTGGTTGGATAATCGCAATATGAATCTGGGATTGAATTCTGTCTTTGAAGTGAAGCACTGTCACAATCAATAGCAATCTATCTCTCCCCCCCCCACTCTCTTCTTTTTTTTGTACTGCTGAATCTTCTATTTGTTTTCTCAACCACCAAGTATTTTGTTTCCACATCTAAAATTAACCTAGTGTTAATCTGCAACAGAAGGGCTGTTCTTGGAGACTTGAACAAAAGGGGAGTGTGAAATCACTCATCTATTGAACAATATGATTTCGTTTTTCCTTGAAAAGAAAATAAACAAAAAAGAAGGCTTTTCCTGATTTTAAAACCTCACGGAAGTTATTGCACAAGTCTGAGAAATAATATATTTTTATTGTAGAGGAAATATCAACAAAAAATTATATAGTTTGCTCCCTTTAAGACCTTCACATAATCAT
GCAAGGGCTCTCTTTTTCCGTCTTTATCCTTTTTTTTCTTCTATTCAGTGTACGGTTTGAATATTGAAGTAGCTTATTATTACTCAGAAATAGGAGAGCAGTTACTTTCTTTTTTGAACAAGAGGAAGGCGTGTTTACCATCTTAGCTAAAATTTACGAGGATGGTGTCATTAACACATGATAATATTCTTGGACCTTCACTTCTTATTATTACCAATGTGGTGAGTATAAATAAAATGACATACTATTGGAAACTAAGGATCTGTTCATAATATTTAACTGATGACATTAAAGGTTGGCTTATTCTTTTTCCTTTTTTAGGTTGGGAGATGGGGCTTGAGGGGGTGGCGCTGCCTGCCATTGCATATAGAGACTGCAGTACATTTTCTACCTCCACATGATAGGCTGGGCTTCTGATTGTTTGGGGACATAAAATGTTTTGGGGGCTATCAAGTGATATAAATGAAGAAACATCTGATCAGTGAGAGAGAAATAAATCTGTGTGGTCGCCCCTGGAGCTGTATTAATCGACACTTGTTGAGAAGCGAATTGATTGTGGGAGGCAGATGCGTCGAGATTCTGTGGTGATAATTAATTGGTTTTATCAGCCCTAGTGGTTTTCCGTTGTTTTTTGGCTGGGGTTCGGGCCTTGAGTTTTCAATATAGAATGGAAGATAGAAAAAATATTAGCTTGGTTTTACAGAGAATCATAGGGTTTGACTGCTTTTGAGAGTGTTTCAGATAGTCAATCGTTGCCTTGAAATTTCTGGCTTTCTTTCAGGCACATTATTAGTTTTATTTTCCAGAATATGCTTTTTTTTTCCTTTTCTTTTCATGTTGCATATTCCTTGATTGTAGACTTCTAGCTTTTCAGTTTGTTATACTTTAAAATTCAAATGGTTAGGCTTTGCATGCCACAATCAAGTAATTAGCCTTTTTATCTATGCTACATCATCTTTCCGTGTTTTCTTTTCATTAAAGTATGTACATGCTTCTGCTTTAGTATTGATTTTACAATTTGGATGCATTCTGCTTTGTATGGATTGAATCTAACATCTTTAAACCTTTTAAGTAACTTTCAGTTCCAGAACTGTATGGCAAGGAGGTGGAAATTGTCATAAATATTAAAGATGATCTTGAGGATTGTTTGATGCTTAAAATTTTTATGTGCCATTTAACAAGACTCCGAAATGTTTATTTGCATGGTTACTAATAGGTTTTTACATATTTTCCGCTGATGGCGGGTTTCTGTTGCTTCAATATTTAAGTAACTCATGGAGCCCTTTGGTAATGCATTCTTGTGACTAAAATTTAAATTCATATTTGAGGATGTTTTTGTTTTCCTCTCTATCCTTTGCGCTTTCTACTGCTCAAATGAATCTTAATTAGTTTTATACCTACGTTGAGATTCTCCACTTCTTAATCTGACTGATATATTTATATTGAATCTTAATGAAGTTTACCAGCCACCTTATGATTCTGCAATTATCGCTCTGATTGAAAAATTTATCATAAATGGTACCTTTAGTCTAAGGCCACCAGTGGGCTTGATTATTATGGCAGTGTCTTGATTCAGCACAATTTCTTTAGCAGGGAAGATGCTATCTTGGAGAGCAGGGAGTCCTTTGAATGACAATGTTGTGGTAATGGAATAGTTACTGTTTCTGACTATCATTCTTTGATTTATCACTAAAGTGTTTCCGTCAGTATATCCTATTTAGTTATCAGTTGGACAGAGTGCTCAGCTGCTCTGTCTTATTACCAGACAAGGAGGAATCCATCTAGTTTATTACAGTGTGCTGGACACTTGTGACATTAAACGGAGATGCTTTTGCAAAAAGCCATTGACCAAATAGATATCTTGTTAACCTCGTAGTAAGAGTTGGTGAACTTTTTGAACTTGTAATTTTACAAAAATAAGCTGGTTTCTCACATCAGCTTCCAGTCCTTTTTAAGTCCATTTCCTTGTCTCTCAATGGCTGTTAGGGAAATCTTTTTTC
TATGAGTTTACAGAATATCATAATCCCACTCCCCCCAACCCATCCCCCCACCCAAATGCAATGTGCACCCAAAAAGGAAATCACCTTCAATCTTTGTTCCAGTTTCTTGGTTTCAACTATGTAGATTCGTTTCCTCTGGTAGCGTTCGTTAAATACCAAATTCTTATTTAAGTTTAAAGTATTATGCCATTCTTTACCGTCTCAAAGATGTTCACTTTGTTAGGATGGTTATGTTCAATATTATTCAGTAAGAATCAAATTGTGCTTGGTAACTGCAGAAGACTACTCAAAGAAGTGCAAGTCTTTCTGGAGATGTTGAACAATTCCCGGGCCCAATGTGGGCAGCATGGGTTGTACATCTGATGTGATGTGTTTTTCGGTAACACATCCAAATGCAAGAAATTTAATATTATCATTGTAGAGGTTGGTCAAATGGAGTTTCTTGAGGTAGGCGTGTTTTCAAGGTTTATTTTGTGACTTGAAATTGTGGAGAAAGAATTAGCTAATCGATTGTTGACCCATGTATTATTGTTCAATACTATTTTGTTGACAATTACAATAAAAATGTGTCTTGATTTTTTTTTGTTTATGTTTACTACTATTGATATTTTATTAGTATACTTGACACATTTGTTTGATATTTTTTAAATATTTTTTATCTTGATTCAATCGGTGGTAATATATCTTTGGTCCGTTATCTAAAAATCTATGAGAAAAATACTTTTTTAAATTTAACATGTTTGACAACTCGCCTATTCACAATGTATAGTCGAATGATTTATATTTTACTCTATTTTATAATTATTTTGGTATTTGATTATAATTATATTTATATATTTGTCAAAAAGTTTTTTTCTACTTGCTAATACTTTCTCCTAATGTTTTTGAGCGTATTGTATTTCATCGTCTAAGTTGATTCTCTGTTTTACATATAATTTGCTCAAGTAGTCCATTGTAAGTTTTATCCATACCAATTCCTCGGATTTTTGAAAATCGAATGAGTTTTCCTTAATCGGTACGTAAAGTTTTTTAAAAATTACGTTGTCGTGTTAAATTATTATATTTAGGATATTTAACTTGTAAATTATTACATTTTGAATTGACATCGTTTGTGTTTCATTTGACTTATCATTTCTATTGTTGATTGGGTCTTGGGTAAGTAGCACAATTGTGATGTGATTTACACCCCTTTATAGACGATCTCTTTAATTTATTTCATTTGTGTTTTGTTACCAGGTAGTCTCCTCACATTTGCGTATGCTTTAGGAACTTGTTACGTGCTTGGATGAGTGTTCCTTCATCGTTCCGTGAAGTGTTTAAAACATTGCATAATTGTGAAATAGTTTGATTGTTTAATATACTTGTAATTTGATTTACCCCTACCTTTTTCGATAATATCTCTAATTGACTCGGTTTTAAATTTTTATTTCCAGGTCGTGACTTCTTGGTTATGTAGCTAAGTGGTATTGATCTAGTAGTGCATGGAAAGTGTTATACTTACGATTCTTTTGGTTTTTAAAAATCATAAACAATTTTAAAATTGAGATCCTTGGGGTATTTTTATAGTTGCGATGTGATTTACTGCTAATTTCTTCAATTTTGTATTGTCTTTGCAGGTGATGTCTTCCACATCTACAACTACTTTGGGACCTTGGTCTTGTGCTTGGAATCAATTTTCCTTGTTCCGTGAAGTGTTTTAAAATATTACATAACACATGGATTATTAAATTTGTTTTTTTTAATGTTCTTGTAATGTGGCTTACCCCATGCTTCTTGATAATATCTCTAATTAGCTTAGTTTGAATTTCATTTGTAGGTCGTGACTTCTCATTTCTATAGTTGTGTCGAGCTTACTCAATTAATGCATTGTAAGTGTTATACTTGGTGATTCCTCTGTTTTTTTGAAATTCATAAGCAATTGTAAAGTTTATATTAGGATTATTATATTTTGAGTTTTCTTTGTAGGTGTGTCTTCTCATTTCTATTGCCTCTGCTTTGAG
GCACAGTCTTGTGCTTGGAGTGGATTTTCCTCAGCGGGTTCAATGAAGTTTTTAAAATATTGCATTTCATTAAATTATTACTTGTAGGATTTTTACCCATGTGCTTCTCGATATATCTCCAATTGAGGCTTAGTTTGAATTTCTTCTGCAGGTCTCGACTACTAGTTTCTGAAGTTGGTTGAGAGTAGCTTTTGTAGTACATTATAAGTGTTACCCTTAGTGATTCCTTGGATTTTAGTTTATTTCGTTTTGTTGTGATGTGATCTATGCCATTTCGTGGACGATTTCTCTGATTTATTCAATATTGAGTTCCCTTTTTAGATGTTCTCTTCTCACTTCTGGAGATGCTTTGTGACCTTTTCAAGTGCTTCGAACGAGTTTTGATTAACCGTTTCATGAAGTTTTTTCAAAATTTTCAAATTTATTATATTTATTTTTTTAATATACTTGTCTCTAATTTGTAAAATTTTGTATTTCTGTTGTAGGTATTGTTTTGTCACTTCTGCAGCTGCTTTAGGACCTTGTCATGTTTTTGGAATGTTTTTCCTTAACGGTTTTGTTGTGTTTTTTAAAGAATATTCATAATTGTGAAATATTTAGCTTGTTAAATGTACTTGTAATTCGATTTACCTCTACTCTTCTCGATCATATCTCTAACTAATTTAGTTTCAGTTTCTTGTGCAGGTTTTGACTTGATCATTCCACTAGTTTGTTTGGACTTGCTCTAGCAGTGTATTACAAGTGTTACCCTTAGTGATTACTTTATTTTTGAAATTCTTAAGCAATTGTATTATAAGTTTTTTCAAAATTTTTAAAATTTCAAATTTATTATATTTGTTTTTTTAATATACTTATCTCTAATTTGTAAAATTTTGTATTTCTGTTGTAGGTGTTGTTTTATCACTTCTGCAGCTGCTTTAGGACCTTGTCATGTTCTTGGAATGGTTTTCCTTAACGGTTTTATTGTGTTTTTAAAAAATATTCATAATTGTGAAATATTTAGGTTGTTAAATGTACTTGTAATTCGATTTACCTCTACTCTTCTCGATCATATCTCTAACTAACTTAGTTTCAGTTTCTTGTGTAGGTTTTGACTTGATCATTCCACTAGTTTGTTTGGACTTGCTCTAGCAGTGTATTATGAGTGTTACCGTTGGTGATTACTTTATTTTTGAAAGTCTTTAGCAATTGTAAAATTGAGATATTTGGGTTATTCAATTTTTAGTTTCCTTTGCAGGTGGTCTTCTCATTTTTGCAGTTTCTTTGGGACACATGGTCTTGTGCAAGAATGGCTCTTCCTTAATCAGTTGGTGAAATTTTTTAAATATTGCATTGTCTTTAAACTATTATTTTTAGGATTTTTAATATACTTGTAATGTGATTCACCCATTCCTTTCTCGATATCTCTCTTATTGAACTAATTTGAATTCTTTTATAGCTTGTGACTTCTCGTTTCTATTATTGCTTGGGACTTGCTCACTTTGTGCATTGTAAGCATTATCTGTGGTGATTATTTGGAGTTTTTTAAAATGTTAATCAACTTTAGTATTGAGATCTTTAGCTTATCTCTTACAATTGTGATGTAATTTATGCCACTTCGGGGACGGTATCACTGGATTATTCAGTTTTTTATTTCCTTTTGCAAGTGTTGTCTCCTCACTTCTGCAATTGGTTTAGGACCTTGGCATGTGCTTGGTATGAGTTTTTCTGAATCTTTCTATGAAGTTTTTAAAATATTACCTAGTTGTGAAGTTTATATATTTGGAGTTATTTAATATCATTGTAATATGAGTTAATTAAATGGATTGTTACTAATATATATTTAACTTATTTGAACCTGGCAGTTGGAATTGCTGAATCCAGCTAGGGATGCTAGGTTGCCGATAATTGGTGGCCTAAGTGGGTTTTGTCTCCCAGAGGTTGAGAGCATTTTGTTCCAAACAGAACATTGCTTCATTCATTCAGTTTACGCAGAACTCAGCTCTGTGCTCTTTGCACGT
CACTTTCATGGATTTGCAAAAAGGATTGAGTACATTCTTTAGGCGGCCCTTTACGAATCTGTTGGGTTGATATTGTGCTTCTTGGACGGTTGGACCTACAACATTGACGCAAGATCACTAAAGCTTAGTACGAGGAGATCAAGAAGCTTATGGAGGAGCTTCATTTGGTTATGTTCTTGCAATTGGTTACTAAGGAGGTTCTAGACTGCAGTTATACTCTCCCATTTGACAAGGCAAGTGAAAATTATCCACTTCCTGATTGATTGAAAACTTGAAATACATGGGGCCCAGTGAGAAGTGGGATATATCTAGCCGTATCCATATTCTATTCTCGTAGGTCTTACCATATTGATGTACCCTCATTGTACCTGTACCCATAAACGTGCTTCATAGCTTTTGACGCATGCACGCGCACAAACACCAATTAATATAGCTTTGTAAACCAATTAACTAGGTACTAAAAGTGTCCTCATGTTTTAGGGATAACACTGATGGAGACTTGGGGAAAATGGCAACTTAGAATTAGGTTTTGGAGGGTGGGGTAGCGTTGAATGGAATTTTTATAGAATTTGAGCATGAATATTGCATTTGGCATTAAAATACTTTAGGAGGACAAGAAGTGTAAGCATGCAGCCGAGCCCCCATCTGGAAGTATTGTCCACTTAGGCCTGGCTAAACAACTTCCCTCAATGGATTGTCCCTCTGGCATCCTAGCCCAAAAGGCACCTCCAAGTTGGAAGTGTCTTTCGCTGTCTTGTTTGGTCATCGCGGGCATTGTCCGCAATCCATGTGAGATTCCCACAAGAAGCATAGAAGTGGATACTCGGACCATAGCCTCTTGTAGGTAAGTTTTTACCTTTTCTTCTTTTTTAGTTTTCCATGCTGATGTAATACTCAATGTGCTTTTATTGATTTTATACATTATAGGATCAACTTTTTGAGTTGCATATAAGAAGTTTCTAAAATTTAGTCTCTTTTTCACAAGGCAGGAGTTGTGTCTTAATAATGAATTCTGTAGTTGAGGCTGTAACTATATTTATTGATTCTTGTAGTTTCATTATGCAAGTTAACTACATCATATGAAGTCTGAACTTTTATTCACTTAATATAGAAATTGCCAAAATGCTTTTGTAAAGTGTTCTTCCAAACCTGGAGTATACTTGAGCCTCTTTCATTGCATTTCCTGGACTTGTTAGATTGGTATGAAACTTTTATTTAGGAGAATAAACAACCTTATGCTTGGAGTTGGCGAGAACTGTGTCTCCACCCCTTCTATGCGTGCGTTCACATAAACCCTATATGGTTGTATCTTCGTGGATTATATTAGTTTACATTACTACGATTTGGATGGTATGCTAGGATGGGGAATAAAAAAGTACGCGTAGTTAGTACCCATAAAAGGTGTCTAGGAGGGATAAATTGGTAAAAACTTGACATTTGACAATATATGCACAAAGTGATTGTCGTCAGGAACCTACAACCTCAGGTTTAGTATGCCATGTTTTAACCACTGAACTAATGGATGGATGGTATGCTAAGAAGGGAAATACGAATGAATATTCATAAAAATCGGGATTGCTTAAATTAATGGATTGAGAGAAGGGGAAAAAACTATTACGAGGCTTGCATCTATATCTATACTTCGACAAGTGCTCTGAAGAATCGGAGTAGAATTAGGCATCGTTGCCAAATCCTAAACAAAGGAAACCTTGCTATCCAAATGTAGTTTTGTGGCTCAGCCGCCACCTCACAAATTATAGATCTAATTGAAGTAACATTACTGTTCATCACCCTTCCCTGTGCCATTTTTTTTTATTCAATGGAAGTCCCTGTGCTATTTTTTTTTTCATCCAAAAACAAATTTGTCCTTTCATTAGGGGATGATGTTTGCAAAAACTGTGTATAGCATCTTCACTTTATTGGTATCATTGAAGTAAACTGTTTGAATAACGGTAAAATATTGATTTACATTTTAGTTATCATGCACTTGTTACGATAAG
CAAGATTGCCTGGCCTACATCTTAAAATATGATCGGTAGTGAAGTTTAATAATGAAGTATGTTTTAACGAATTCCTTATGCATTTTTTTTTACAAACTGGTTGTGCCTTTTCACCGTTTTGTTCGACGGAGCCCTGTTATATAAGTTTGTATGTATATCCATGTATAGATGTTGGTTTTATTTCAAAGTCATTTTAGTTATGTTGCATTAACGACTTCAACCATAATATAAGCTGGTTTTTTAGATGAAACTCTTTGCCTTTGCACAGGTTAGTAGTTCCTGAAGACCCTTTTGCCCTGTTCTTTAACACCCTTAAATTCCATATCTCTTCTGCATTTAGTTTACGGACTGGTTGTGCTTTTCACCCTTCTGACTTAATAGTTTCTTGATTGTTTTTTCCCCATATATAAATCTAGCTTTTCTTCTTGGCTAGCACCATTGGGAACTGTCCACATATTATACCTAAACCTGAACTATATTTATTTATTTTCCTTGTATCATGGACAGGATTGGTGGCAGATCACACTGTTCACTTGGTTCGTGGTTTCGCTCCAACTGTACCAGTCACCACTGCATGTGCAACCAACACTGGAGTTCCAAATTCTACTCCAAGTGGCGTGGCGTCTGTTGGTTCTGACGAAGGGGCATTGGGAGGAACTGGTTTGGGCTCTTCGCTCTTTCCTGGACTTGGTTTTAATGGATTAGGCAGCAGCAATGGATTATATGGAGCTGGACTTCCAGAAATTGAACAAGTGCAGCAACAGTTGACTAAGAACCCCAATCTGATGAGAGAATTAATGAACATGCCTCTTGTTCAGAACCTAATGAATAACCCAGACATTATGCGGAATATGATAATGAACAACCCACAGATGCGTGAAATCATTGATCGAAATCCAGAGCTTGGTCACATACTCAATGATCTTAGCACTCTCTGTCAGTCATTGGAGACTGCAAGAAACCCTGAACTCATGCGTGAGATGATGCGCAATACTGACAGAGCAATGAGCAATATCGAATCTTCTCCTGAGGGATTTAACATGCTGAGGCACATGTATGAAAATGTCCAAGAGCCTTTTCTAAATGCAACAACCACGGCTGGGGATACTGGAAATAATCCAGGATCAAACCCTTTTGTGGCTCTTTGGGGGACTCAAGGTGGCTGGCAGGGCAGAGATCTGGATACTAATCCTTCTAGCACTGGTTCCAAAACTAATACCAATTCTCCTGCTTCAAACACTAATCCACTTCCCAATCCGTGGGCCTCTGGTGGAGATAAGTTAAGCTCTCTCTTTAGTCCTCTTTTTCTTCTTTAGGATTTTGAATGTTTTGGTGTTGAGATACATGAATTTGAGGCTGTACTTATCCTTATTATCCTTTGCTCTGCTGCTTCATTTTGTTTGGGTTAAATTGTGGCGTTATACGTTGCTGATGTCAGCATTTTTAAAAATAAAAAGTTGGTTTTTATCTATACTTTTCTCATTTTTATTCAGTGTAGGTTGGAAGGATATCTTGTTTATAAGCTAGTCATATTAATAAGAGAGCCAACATATGACAAAAGTATTAGCATTCATTATAGGCATAGACTATTCAAGTTGAAAAACTTTGCTGCATCATATGTGATATGTGTAGTCCTACTAATTAGAATATCATCCCCAATTTTATTGTTCCTGTTCAATTTTTTAAAAGGTGTCACCGTTTTTCCCTGAACTTCATTATCTGAAGTTGACTTTAAATAAATTATATGGATTGTTACTAATGTTTAACTTACTTTGAATTTGGCAGCTGGTGGTGCCCAAACAAACTCCACTATGAGATCGAGTCCAGGTGGGGATGCTAGGTTGCCGACACTTGGTGGCCTAAGTGGTGTTGGTCTCCCAAGACATGTTTGGTTTCACACAAGACAACGCTTCATTCAGTCAGTTTATGCAAAGCCCAGCTGTATCACAGATGATGCAAAGTCTCCTCTCCAACCCTCAGTACATGAATCAGGTAGTACT
TTTAATTTTTTACAATGTAGTACGTGTTTATTACCGCTTTCAGGGCTTGCTTATAGTTCGTTTGGTGTTTCTGTTTGTTGCAGCTTTCTAAAACAGCTCATGACCCTGACTTGAATATGACTATCCAGAAGCACACTTATGGATGCTTTTGGCTTCCGCTTACAGATTATCAACTTTCAGATTTAAATAAGATGAGACCAAACTGCCTCTAATATGGTTCATTTGACTATGGCTTTTCTAATTCTAATATGTATTTCAATTGGTAGATTCTTGGGCTGAATCCCCAGCTGCGCAATATGATGGATTCCAATTCCCAACTTAGAGAGATGATGCAAAACCCAGAATTCCTTCGCCAATTGACTTCCCCTGAAACAATGCAGGTACGATGCTTGAAATCCCACGTCCCTCTCATGCACTCTGTCTCCCTATATTTGGAAATGAAAATGAGACTTGCATATTATTGATATTGGTGTGATTAAAATAATGAAGGGCTGTATTGAGTCATTGACATCTCTCCAAGTGAAATCTGTTCCATTTTAGCATTTTAAAGTATTGTTTTGCAGCTTCCGACAATTATTTAGGAATTTAACATTTCTCTAATATCTTTCAAGAACTGCTTCGCTATAACCATCCCCTTGTGGTTGGTGAAGGGAGGGCCTCAGAGCCCCTATTGGTAGAAAAAAACCCACAATCCCTTGAGGTCCTCCTGAAGAAGAAAACGGATTAAATTCAGTGATAATTTGATTCTTTGTTGTTGCTTAACACATGCCAGTCTTACGAGCCGAAGTAGCTCTGCATGGTATTGTCATTTTACCTATAATAAATTGGTTTACTGAATAAGATTCAATTGGCCGTCTCTTAGGAACTGACCAAAGAGTTAAGGAGTTACGATCATCTCATATTGAGAAAACGTCATTGATAGCTTCCGCTACCCGACCCAGCCTTTGCTTTTTATTTAGGGTAAATTTCATTTATGACAAATGCAACTACCTCCTTTGTAGTTTTAGAAATAGTGTTGACCTCCCTTTCTTTTGAATCTAATGTCAACATTCCACCTGAAACTAATTTTTGTGCAAAAATGACAAATTTGCAATTTGATTTAGGGATTCCAATTTTTTTTTTCTCTATACACATTAAAATAAATAAATATTTTCTTCTTTTTCTCAAAATATCATTTACTTGTAAATAATTTTATTTTTATTTTTTATCACTAAGTAATTTTTGTAAAAAGGATTTTGATCTAAACAGTTTACTTTTTAAGTGCTCCAAATCTAAACATTCTTAAAAAATATTTTTTTTATCATTTTTTTAAAAATAATAGAATGTTTATTTATTTTAATGTGTGTTGAGAAAATAAATTTGGAAGTCCTAAATATAAGGGCGAGATTGTATTTTTGCTCAAAATTAGCTTTCGGGGAGAATCTTGGCCATAATTTCAAAAGTAAGGGAGATTAGAGCTATTTCAGAAACTATAAGGGAAGTGGTTGTATTTGTCAGAAACATCAGGGGAGGTCAATGAAATTTATTCTTTTATTTATTATTGGAAATGGGAGGCTGAAGAGAGGTTTATGTTGTTTTTCCTTTTATTTTTTGAGATTTGTTTGTCAACGACTAGTTTGTTTTCAATCTGGCTGTACAAACTCTTTAAATTTTTATTTTTTACTTAGAAAGGGCTTTCTCCCTAATACTAGGCATTGGATTGGGTACTTATTATCAATTTTCTCATTTTACAGTTTACAGATAGATCAATTGCCATCATAAGTGTCTCGAGTTCTCACCCCTTACTCATTTAGGTTTCTTGTTTTTTGGAACATCATGAGCTAAAATTAAAGTTCCTCCCCACCAACTGCATGGGTTGTTATGGGAAAAGTAAATGATTCATGTAAGAAATATCTCAATAAGTAGCATAGTTTATTCTCTACAGCACACTATAGGCATATGGACCCACTATTCCCGTGGCTTATTGTCATTGGGCGGGGCTTGTAGGCAAGACAATGAAC
AAGTAAAACACCCGGTGTGGTGCTGTATGATACACGTTAGACAGTCCCGCCAATTTGCAAGCAATAAGTTGACAAAATGCCAAGGAAAAGGCTACTCAAGCATATGAAAGTGAGACATTCAAGAGCGAAATGACAGCTTTCCATTGATCAAAAAGGTGTATTACAATGTTTTAGCCATGCACCCAAGTACATAACTCAAAACAAACCATTGTCAAAAAACTAGTTAAAGACAATGGTTGGGCAAGTCATGAACCTGACCCTAATGGTTCGTCAAAGTAGCTTGTCCCATTTTCCCTCAAGGGACCTTCATCAAATGTTATGCGAGAGAGAATTCACCACACGATGACTTGGTGACAAGCCAAATCTCTGCATCAATCAGCCGTCATAGCTGGAAGGAAATCGAATCCGTTGTTTAACTGCTAGGACTGATCCATGCATTCAACCGTCGGCCAGAAAAGTGAATGGGCTCCAACTGGTTTGCCTCCTGGACCAACCCATTCTATAATTTGAAGGATCTGTTCTCCAACAGAAAGTGAAATCCTCTCCTATTGGGATCATAGATGCCTCACCAGAGATTGCCCTGGCTCCCATCCAGTCATTTTTCTCCTATAATTTTACACTATGTTAGAGCACCATTACTCGTAGGCTCCACCGCGTCATTTCCACAATAAAAAAATAATAAACTTCAGATTTAAGATTCTTATATCTATCAAATAACTTTTTTAATTTGGCAGGCACTTAATTTTTTACGAAACACATTTTCAGCTGACAAAATTCAGCATTCAGTAATTAGTTTTATCTAACGCCACCTATGTTACTTGATTCTTGTAGTTTCATGGTGTAAGTTAACTGCATCTAGTAAATCTTGAATGTCTGTCACTGAATATATAAATTGCCGAATTGCCTCAGTCGATGTGCTCTTCCAAATTGGGAACTACTTGAGCCCCATTTTGCATTCCATTTCCTGCACTTGTTTTGCATAGGAGAAGTCATGATTAATATGAATGAAGTGGGGGAAATAGAACAAATTGGAATGCAAACATGTGGTAGTTACATCTTATTTGAACTTAAGTGGGAACTTTCTTATTTGTGGAGAACTATTCAATATCAGCATGCATATATGCATGTGCATGTGCATGTTTGAGCCTTTTGTCCCTCCTTTTGTTTTAAAACGTATTAACTTTGTTCTTTATTACTTTATTTCCTCTGGGTTGGGCCACTTCTTCCAAGAATTATATATAGCTCGTTCATAAATCCACTTGACCACTCAGACTTAACGACGAAGTCCTTCTTCATTACTTTATTTCCTCTCGTTCTTAATTTTTATTTTCCCTGTTTCAGCAAATTTTGACCTTACAGCGAACTCTTCGTCTCAGCTTGGTCAGCAATCTTCAACCAGGTAAGTGATTTTGCTTCTAGATTTTGTACAGTAAAGGAAACCAATTTCAAGCCTGCTAGTCTTATCATTAACCATACGTTTATCAGTGTAACTCACTTTTTACTCATATAGCTGTATGTAAATGTTGACACAATCAATATGTTCACGTTACTGTCCAGATTATTTGAAACATTGATTTTTCTAGCCTTTTATACCTGGCGACCATATAGAATTTTGTTGATTAGATTTAACCCCTTTCCTTTTTTAATTTGTCTATTTGTAATTGCACTCTTGCAGGGAAGCAGGTCAAGGTGTTGGTGGGACAGGTACGTTATCTTGGAACTTGACATTCTAATTGCATATATTTAACCATAATGCTCAGTGATTCTGAAATCAGAGTGTCTATTCGTGGTAATGCAAGATTGCAGCTTGTCTTGCCTCATCTATCTCAAGTTGAAAATTCTTTAAGCTTAAACTTCAATTCTAAAATAGGGATCTCCCAAGGCTGTGTTTGGATCAAAAGGGAAAAGGTGGAGGATCCAATGGTCCCGAACGGTTGGATCCTCTAACTTTTCTATTTTCTTTTCCTTCACCAAATCCTTGATCCAAACACGGCCTATGA
GCTTGAAGACTGTTCCTTTGTAATCTTTTGTTGAATGTGGAGGATTCTGGGATTGTGTCCTTCCATCAATTAAGCACAACATGCCTAATCTGAAATCTCTGTTGATGCTAACCCTGAACCCCATATTTATTTTGTAAAAGAGAAAGGAAAACCGAATAAACAAGACATGAAGATGGCATTATATGAAAATTTCCGGTTGTTTTCTTTAATAGTAGTTATTTAACTCACAGTGACGTGCCCTTGTTCTCTCAATAGCAGAGAAATTGATGGCATGGGGCTGGAGATGTTGATGAACATGTTTGACAGACTCGGGATCGCAATGCCTCCGTCTCTAGGGGTAAGCCAACAGTTTCTTTAATGGTTTTCTAATCCAATAAATAAGATGAAGAGAGCAACTCCATTTGGAGCATCTCCAACCCACCATCTATATCTTCAAAATGAGAAAATAGAGAATCTTTCATTTCACGATTCACTTTTTTAAATTTCAAATTTGCTCCCTTCAACTCTTGATTTTAAATTTGATTACCAATCTTATCCTTTCTACTTTTTATTGCTTTTTGATAAACTACATATAACTTTTAACATACATTTATTTTTTATAAAATTAACATGGTCGAGTATATGTGGAGTATACCTTTAAAATAAGACCAATATTCAATATATTCGCTAACAATTTGAAAATTGATTGGAGGAACTTTTTTAGAAATAAGAGTAGAGATTTGTGAATTGAGTTTGCTTGAATAATAAAAGCCTCTAAACTTAATTTTTGAATAAAAAAGAATATTTTTATGTTATTCTGATTATGGCAATTTTTGAAGCTAGTTATTGTTTACACTATATTTTTTTTTATTTGTATTTGTCAGGGTGAATTTATTTTAAATATTAATATTTGAATAAAAGTGGGTATTTTAATAAATTTATTCTAATAAAGACAAAAAAATAGTGCAATTGAAAAAAAAATGAGTATAAAAATAGCCTTTTAAAAATAACCTAGGCTATTTAAAAAAAATTCTATTTTAACTCGATAATTAGTAACTTTTTTTCTTTCATTAATTTTCTCCTACCGTTCTGAAATCTTATGCTTTCCGATACTATATTCTAAAATTGTAATGCAAGCATATATGAGAATCTTTCACATAATGGGGATTGGGGACCAACAAAGGCCAAACCTATCCGCCATAACAAATTCACGATCCTTCCTAATCTGGCAAATCTTCTTATTTACCAAAAGCAAAAAAATCAAAATTTATGAAAAAATACAAAAAAAAAGAGAAGTGAAAAAATTCTACGGATTCAATTGATCAGAAGATATCAAGATTTTTCAAAATGAAGCCATTGCATATAGGGTAATTACCTCTCCGAACCCAAAGCTCCCTCGAACACAGCCTGCAAAATATATGCCCAGAAGGTGTGAATGCAGCCCCCTTGTGCTTCTCCATACACACGCAAAAGTTTTGCATTTTCAAACCTCTCTTTTCTACCGTTGCACTTATTTTTTTTTCTTTATTATTTGTTATGGTAAATTTACCCAAATATGCTTTTATAAAATAATTTTTTTATTTTTTACTTTATTTTCCCCTTTAAAACGAAGGTATTTTTGTTATTTCACTTAGTCATTATTATATGTGTGATTTGGTTCAAGATAATTATAATTGAATAAGTTTCTTAATGGATTAGGCAACCCCCCAAAAATTATTCTAAACATATCTCAAATAGGAACTTAAACTTTGTTTGATAATAAATTTTGAGGGTGAAATTAGATTATTAGTTATGTGGGGCCTATTTTAATTATGTTTTAGTGCAAAAATTGATTTCTAGACTAATAGTTCATTGAGACTATTAATCTCCAATGAATAGATGATTAAGAATTCCATGGGGGTTGGTTTACTAATTCAATCCCATAAAACTATTAATTCAAAGGAATTAGAATTAGATTTGAATTGATAAACTCACTAAATTGAATTTTGTTATTAAACATGGCCTTAGACCCAATTTTCATA
TTGTTTGAAAGCCCCTAATATGTTGTTCACCTAAATAGAGAAAAATAAAATTTCAAAAATCAAAATTTCAATGCCCAAACTAGAAGAAAAAAAATCCCAACGCCCAATTTCCAAGACTCATAAATTTCCTAATTAAAGACAATGAAAAAAAGGTGTCATGATTTTCAAAATTCTATTTTGGCTAATTTACAAGGCTAATAAACGAATCAGGTTGCTTTGAGATTGCTTTTGTTCATCTCATTAGAAGCTCATAATTGGTTTGTTACTTTAACAAACTAAGTTTGAACACTATCACTTGTTTCAATAAGCTTGTGCTATTTAACAAAATTCAAGTTACTCGAGTTCAACCGATTACAACGCGCTTAAGATCAACCAAGCTCGAGCATAATTTAAAAAACTCATTAAGTTTACAAACTAAGCTTGAAAACTCTAATGTTCAGCTCTTAAATGAACCCTCTACGCTACACTGTAGGTGTATGGACCCACCATCCACATGGCTAGTAGTCATTGGATGGGGGCTTGTAGGCAAGGTGTGGTGCTTACCAATTCACTTTAGGCAAGTACCCCAAGCTCAAATCACTTGCATCTAGGTTGCAAGCAATAAGTAAAAACAATGCCACGGAGAGGGCTACTTTAGTAATATAAAAGAGATCCTCAAAAGAAAAATGGTAACATTTTATGAATTAAATGGTGCATCACAAATTCTTTAGACATGACCACAAGGTTACAACTCAAAACAATAGTTGAGCAACTCGTCAAGGTAACACTTGATGTAAATAGAATTCTTAACTTTTTATCGTCAAGGTAACACTTGATGTTTTGGGAGTCATAATTCCTCTTAAAAATCACTGAAAATAGAATAATAACAATTGGATATGGGCTAAGCATCACAAAATAATACATCAAATATACATTTGACCTTAGTTTGTGCGGCAAAAGGAGTTTGAATATATTTGTAAAAAGTTAAGAACCTCTCCAATAATAGCTCTTATTCTGTCCCTAAATTTTAACAAAAAAATACATTCTCTATTTTTAAGGGATCATTTTTCAACTACAAACTCCAACAATACTATCTACTTTTATCATATTTCTTTTAAATACTATTTTTTAATTTATAATATTCTCCTCCAACTTCTCTCTCCTCCCTTCATCTCTCTGCACCAACCCAAACATCCAATCTCCCTTTTGCATTAACCCAGACGCCCAATCCCATTGCAATTTTACATAAATGGCATGATCTTCACCTCTTTATTGTGATTTTTCACCTTTGATAGCTATAAATTGGTTCTTGATTTTCTCAATTTTTGCGGTCTCGGTGAGTGATTTCTGAATGGTATTCTCGATCTTGATTTGTGAACTTGGCAATATCTTCACCGATCTCGATGGGGGGATATCCAAGGATATCTTTGATTAGTTTGTAGAGATTCTAGAAGGACTTCTTTTTGTTATTTTTTCTTCATATTGAAGTCTCCAATGACAAAGCAACAAGGAGTTTTCACAACTCAGCGCACATAATCATAATCTCCACCACTTTGGTTGTCTGTGTTGTTATGTGGTTTGCTCGGGCGAGAGACGAAGAATGCTGTTCAATTTCAGTTCTGTGTTGTTTGGGACTTGCTCAATTAATGTATTGTAAGTTTTATCCTTGGTGATTCTTTAGAGTTTTTAAAATCTTAAACAATTGTAAAATTTTGATCTTTAGGTTATTCTTACAGTTGTAATGTGACAATATCTCTAATTTGTAAAATTTTGTGTTTATATTGTAGGTGTTGTTTTGTCACTTCTGTAGTTACGTTGGGACCTTGTCATAATTGAGTTACGTTGGGACCTTGTCATAATTGTGAAATATTTAGGTTGTTAAATGTGCTTGTTGGGACCTTGTCATAATTGTGAAATATTTGGGTTGTTAAATGTGCTTGTAATGCGATTTTCTCCTACCATTCTCTCTAATATCTCTAACTAACTTAGTTTCAATTTCTTGTGTAGGTTTTGACTTGATC
ATTCCATTAGTTTGTTTGGACTTGCTCTAATAGTGCATTGCAAGTGTTACCTTGGTGATTACTTTATTTTTGAAATTCTTAAGCAATTATAAAATTTAGATATTTGGGTTATTCAATTTTTAGTTTCCTTCGCAGGTGGTCTTCTCATTTATCCAAGAATGGGTATTTCTTAATCATTCGGTGAATTTTTGCGGTCAGTTGGGTTTCGAGATTGCAAAAGATTGTTGCTCTTTCTACCACAGAAGCGGAGTATGTGGCTGCTACCGAAGCTTGCAAGGAGATGGTTTGGTTGCAGAGTTTTATGAGAGAGTTGGGCAAGGAGCAATCGAATTGCACTATCTACAGCGATAGTCAAAGTGCAGTTCATTTGGCAAAGAATTCAGCATTCCATGCCAGAACGAAACACATCGACATTAGATATCACTTCATCCGATCACTCCTAGATGAAGGGTTGATAAGTTTGGAGAAGATCCACACAAATCAGAATCCTGCAGACATGTTCACAAAAGTTGTGATCATTGAGAAACTGAAGCTATGTGCAGCTTCAGTGGGTCTTCTAGTATGAGGGCCGTAATGCCACACCGTTTGAGTAAATATTGAAACAAGTGGGAGTTACCCGGAGGAGCAGTTTGGTGGTCAGCCTTCAAGTGGGAGATTGTTAGGTATGTGAAATGTGGAGCCTGACATTTCAATGTCTACAATTACGGTTGAGTCCAAGTCTCCGATTGCGGCAAGTCCAAGTCTACAATTGTGGCAAGTCCAAGTCTCCGATTACGGCAAGTCCAAGTCTCCGATTGCGGCTGAATGACATCATTGCTTAAGTCATCCTCTTCCTAGGTTTCTCTATAAATAGATGTTGAAGTCTAGGAGAATGATAAGAAGGTAGCTAAGGCTAAGAGAGAGAGAAAGAGTGAGGGAGAGATTGTAATCCTAAATTTTGTTTTGGGGAATTGCTACTCGGTGTGGCCGTGGATGTAGGCTTAATTGGCCGAACCACGTAAAATCTCTGTGTCCCTTTTATTGTTTGTTTCTTACTTGCTTGTTTGTGTTAGAGGTGCACAAAATACCCACCCGACCCGAGACCCGACCCGACCCGACTTCATTGGGTCGGTTTGGGTCGGTTTTTTCAAGTCCATGGGTCGGTTTCGGGTCTAAAAATTATAGACCCGAGCGGTTCGGGTCGGTTCTCGGGTCCCTAAGTTTTTTTACCCAGAACCGACCCGACCGGAACCGACCCGAGAACCGAAGGGTAGAACCAACCCGATCGGACCCGACTTGAGAACCGAAGCCTAGAACCGATTATATGGGCTTATAATGTACTCTACCACACTTGATTATTGCCTATTTTATATAGAATAAGTGAAAATATTTTTAAAAAATTGAAGAACTGACCCGACCCGACGACCCAACCCGAGAATCGAAGAACCGAAGAACCGAACCGAACCGAACCTGAGCGGGTCGGGTCGATTCGGGTCGCCGGGACATTCGGGTCGGTTCTGGGTCTAAATTTCTGGAACCGTTGATGGTCGGGTCGGGTCTGGGTTCGACACATACCCGACCCAACCCGACCCGTGTGCACCCCTAGTTTGTGTGCGTGTTATTATTCCCGATCCATTAGGGTGAAAATACGCATTGGTGTTTTTATCACAACACATTTCTCCAACAGAAAGTGAAATCCTCTCCTATTAGGATCATAGATGCCTCACCAGAGCGCTCTCTCTCTCCATAGATTGCCATGGCTCCCATCCAGTCATTTTTCTCCTATAATTTTACACTACGTTAGAGCACCATTACTCTTAAGCTCACATCCCATCGTACTCAACAATGAACCTTCCCATTTCCCACACATACCATGTAGCATTGCAAAGCAATTCAAGTGTGTATGTGAGTGTATAGATAGTTGCAAACTAGGTACAACTAAGTGTGATCCATGTTCAGGGCCGACATTAATAGAGTGAGCATGAATTTTGCATTTTGGCATTAAAGTACTCTACATGTCA
GAGAAGCATAAAAGTGGAAAGCGGGGACCATACCCTCCTGGACATAAGTTTTCACCACATTTTGTTATCAACTTTTAGCTAACCTACAGGTAGCTATCATAGGAAGTATGCATCGATGTGCACCACTATCACACAATTACCATCGCCACCCTTCGACACAATCCCTATGACCACCACCACCACTCCACTCCCACCACCCTCCATCATCATCACCATAGCCACCACAATCATTAATTCCACTACCATTTCACCACAACACCAACACCAACACCACTACCTCCACCTCCACCCCACCTCCACCCACTCTCTACCTTTACCACCATTGTTACCACCATCCCTCCACCTCCACCACCATTGTCATTGTTGCCATAACTATCAACATCATTCTACTACTATTACCGTCACCACACCACCACCATTGCCACTCTACTTCAATCATCACAACTATCACTACCCTACTGCCGCCTTCAGCACCTCCACTATACCACAAACACAACCAGCACTGCCGCCACCACCGCGTCATCACCACAATAGAAAAATAATAAACTTCAGATTTAAGATTCTTATACCTATCAAAAAACTTTGTTAATTTGGCAGGCACTTAATATTTTGTGAAACTTATTTTCAGCTGAAACAATTCAGTATTTAGTTTTCAGTAATTAATTTTATCCAACACCACCTATGTTACTTGATTCTTGTAGTTTCATGGTGTAAGTTAACTGCATCTAGTAAATTTTGAATTCTCTCACTGAATATATAAATTGTCGAAATGCCTCAGTTGATGTGTTCTTCCAAATTGGGAACTACTTGAGCCCCTTTTGCATTCCATTTCCTGCACTTGTTTTGCATAGGAGAAGTCATGATTAATATGAATGAAATGGGGGAAATAGAACAAACTGGAATGCAAACATGTGGTAGTTGCATCTTATTTGAACCTAAGAGGGAGCTTTCTTATTTGTGGAGAACTATTCAATATCAGCATGCATATGCATGTGTGAGCCTTTTGTCGCTCCTTTTTGTTTAAAACGTATTAACTTTGTTCTTTATTACTTTATTTCCTCTCGTTCTTAATTTCTATTTTCCCTGTTTCAGCAAATATTGACCTTACAGCGAACTCTTCTGTCTCAGATTGGTCAGCACCCTTCCACTAGGTAAGTGATTTTGCTTCTAGATTTGTATGGTAAAGCCGTAAAGGAAACCAATTTCAAGCATGATAGTCTTATCATTAACCATACGTTTATCAGTGTAACTCAAGTATTACTCATATGGCAGTATGTAATTGTTGACACAATCAATATGTTTTTGTTACTGTCCAGATTGTTTGAACCATTGACTTTTCTAGCTTTTTATACCTGACGGCCATTTAGAATTTTGTTGATTTGTCTATTTGTAATTGCACTCTTGCAGGGAAGCAGGTCAAGGTGTGGGTGGGGCAGGTACGTTATCTTGGAACTTGAAATTCTAATTTCATATCTTTAACCATAATGCGCAGTGATTCTGAAATCAGAGTGTTTATTCATGGTAATGTGGTAATGCAAGGATTGCAGCTTGTCTTGCCTCATCTATCTCAAGTTGAAAATTCTTTAAGCTTATAAACTTTAGTTCTATGGATCTCCCAAGGTTGTGTTTGGATCAAAAGGGAAAAGGTGGAGAATCCAATAGTCCCGAACGATTTGATCCTCTAACTTTTCTATTTCCTTTTCCTTCACCAAATCCTTCATCCAAACACAGCCTATGAGCTTGAAGACTATTCCTTTGTAATCTTTTGTAAATCCTTCATCCAAACACGGCCTATGAGCTTGAAGACTATTCCTTTGTAATCTTTTGTTGAATGTGGAGGATTCTGGGATTGTGTCCTTCCATCAATTAATCACAACATGCCTAATCTGAAATCTCTGTTGATGCAACCCCTGGACCCCATATTTATTTTTGTCCAGATAAAAGAAAAAGGAAAACCGAATAAACAAGACAGAAAGATGGCATTATATGAAAATTTCCTG
TCGTTTTCTTTAATTGTAGTTATTTAACTCAGAGTGACGTGACATTGTTCTCTCAATAGTAGGAACTGATGGCATGGGGTTGGAGATGTTGATGAACATGTTTGGCGGACTCGGGACCGGAAGCCCCGTTGCACCAAGCATATCCAATGGTGATTATTATTTCCTTTTCCCTCGAGCCTTCCGATCTATGTTTTTGTTGATTTGTTGGCTAAATTCTTTTGGGCTCAAGCCCAATGCTAATTCTAGGCCCAAGCTTAGGCCCAAGCCCACAGAGAGCCATTGTCAAAGTTGCAGCTTCTTCTCTTGTTGCTGCCGACAGAGGAAGTAGTCGGCCGAAAGAGGAAGAAGCCATTTGTCAACAATGGTGGCACCTCCCCTCCCAAGTCAAGCTTGGTGAGGTCATTGCTTAGGTAATTCTGTCCCTAGCCTTCTCTATATAAAGCTGCGCTGATAGAGTAAAATGGCAGGGCAGAAATTAGAGAAAAATCAGAGAGAGTAGAAGGGCAGAGAGCTTGAGAGAATTCTCTCAAATTGTATTTGTATTTGTTTCTCTCCATATAATAGAATTGCTGCCACCCGAGGACGTAGGCAACATTGCCGAACCTCGTAAATTGTGTGTTTGTGTTGGATTTGTTAGTGTGTGTTATCAGAATTTGTTATTCCGCACAACAATTGGTATCAGAGCCAAAATCGGCATTTCGGACCTCTGTAAAAGTGGTCGAAATTGATTTCTGATTGCACCACCTTGTTCGTCTCCTCGAGACGAAACTCTAGCATCAAACCGCGTCGAAATCGGACTCCGAACGAGCTCACACGAGTTGCGTGAAGTCGGTGACGCGTCTCTGTTTCGCGTCTCTGTAAATTTGAGGAAGACGAACTGTTCATTGGTAAATTACAGTTTCAACCCCTGAAGTTTCTGTTATTTACATTTTGGTCCTTAAAGTTTTGATAATTACAGTTTGGTCCTTATATTTTCTAAAATTATAGTTTGGTCCCTGTATTTTCTAGAAATTACAGTTTGGTCCCTGAAGTTTTAAAAATTACAGTTTAGTCCCTGTAATTTTTGAAAATTGTATTTTAGTCCCTGAAATTACTAAAAATTTCAGATTGGTCCCCAGGAGTTCTAATTTTGACAAATTGGCCCCACAAGTTTCTGATTGTGACAGATTGGCCCCAAAAGCTTTTGATTTTTTCAGTTAAGCCCTTCTTAAGTTTTTTCAGCATTCCGGACTCACCTGTGTGGTCAAAATTTGCATATTTTGATCCTATATATCAGTTTGGGTGGAGTTAAGTTGTTTAGATGGAAGAAGATAAAATCACTAGCACTTCCACTAGCACTTCCGGTAGCTCTGGGCATAGGACTACAATGTCCAATGCCAAATTTGAAGTTGAAAATTTGATGGGACAAATAACTTTGGCATGTGGCAATGCGAAGTTTTGGATGTCCTAATTCAACAGGACTTGGATATTACTCTGGAGGCCAAGCCAGAGGACATGTCAGAGAAAGATTGGGCAAAATTGAATCGCCAAGCTTGCGGTACGATCAGACTTTGTCTTGCAAAAGACCAGAAGTACTTTGTTATGAAGGAGACCTCAGCAAAAGAATTGTGGGGCAAACTCGAGAACAAGTACATGACCAAAAGCGTTGAGAACCGGCTCTATCTGAAGAAGAAACTCTTCCGGTTCCAATTCAAGCAAGGTACGTCAATGCATGAGCATTTAAATGCATTTAATAAAATTTTGGCTGATTTGCAAAATTTAGACGTAGAAATTGACGATGAAGATAAAGCTCTTTTATTGTTAAATTCCTTGCCTGATACGTATGAGCATTTGACTACTACTTTGCTGTATGGTAAAGATGAAATTAAGTTTAACGATGTTTCAAATGCTTTGATGAACAACGAGGTGAGAAAGAAGGATCAAGACGCTCACCGGGAATTAAGTTTAAATGCATTGACAGCAAGGGGTAGGACGAGTACCCGAAAATCTGGAGGGGATGG
AAGTCTCGCTCAAAATCAAGGAAAAAATCATCCGAGAGACGGCAGCTTGCAAAGGATGAGTGTGCCTATTGTCATCAGAAAGGCCACTGGAGAAAAGATTGCCCAAAGATAGAAGGCAAAGAACCAAAAGCGAACATAGCTCATGATGCAGTCGAGAAAGATGACACTGCATTTACTGTTTCTTTGTCTGCTAGCCATTTTGACGAATGGATTCTAGATTCTGGTTATTCCTATCATATGTGTCCTCACAGGGACTGGTTCTCGAGCTTTGAAGAGCTCGATGGAGGAGTTGTTCTAATGGGAAATGACAACGCCTGCAAAACGATGGGAATTGGCACAATCAGATTGAAGATGTTCAGTGGAACCGTCAAGGTTCTTACTGATGTTCGCTATGTACCAGATTTGAAGAAAAATCTCATTTCATTGGGAGATTTTGATTCAAAGGGGTACAAGATTATCTTGGAAGGTGGAGTTCTGAAGGTTGTTCGTGGTGCTCTTGTTATTTTGAAGGGCACTCGTAGAGGAAATCTCTACTTCCTCGATGGGAGTACTGTCACAGGGAGAGCTGCTGTCTCCAACAGTTCAGACGAATCAGACACTTCCAGATTATGGCATATGCGATTGGGGCATACTGGAGAAAAAGCTTTGCAAACTTTGGTACGTCAAGGAGTTCTGAAAGGAGCTAAGACTGGAAAAATTGAATTCTGTGAGCATTGTGTGCTTGGCAAGCAGACAAGGGTGAAGTTTGGCACAACAATTCATCAGACTGAAGGCATTTTGGATTATGTTCATTCCGATGTCTGGGGGCCTTCTAAAAATGCATCTTTGGGAGGCTCACGCTATTTTGTAACCTTCGTTGATGACTTTTCTAGAAGAGTTTGGGTATACACGATGCGGCACAAGGATGAAGTCCTTGAAATCTTCTTGAAATGGAAGAAGATGATCGAAATCCAGACTGGTAGAAAGATCAAGAAGCTCAGATCTGATAATGGTGGAGAATACAGGTCAGATCCTTTCTTCGATGTTTGTTCCAAAGAAGGGATTGTCAGACACTTTACTATTAGGGGCACGCCGCAACAGAATGGAGTTGCAGAAAGGATGAACCGCACCTTAGTAGATAAAGTTCGATGTATGATATGCAATGCTGGTTTGAGCAAAGCATTTTGGGCTGAAGCAATAAACTATGCCGCACACCTTATCAACAGACTTCCTTCCACGGCTATTGAAGGAAAAACTCCTATGGAGGTATGGTCAGGAAAATGTGCTACTGATTATGATAGTCTTCACATATTTGGATGTCCTGCATACTTTCATGTAAAGGAAGATAAGTTGGATCCCAGAGCCAAGAAAGCTATCTTTGTAGGCTTTAGCACTGGGATAAAAGGATACAGACTATGGTGTCCCGAAATAAAGAAAATTATTAACAGTCGGGATGTTACATTTGATGAGTCTGTGATGCTGAAGAATTCTGAGAAAGAAAATCTGAGTCCTACATCCACCCAGCAGGTGGAGCTCGTGAGTCCTGTAGTGCCAACTAAAACTGTTCAGACAGTTGATATTCCTGACGAGGAATCTGATGATATCGACACTACACCAGATCTGAAAGAGGCTCAATCTTCACAACCAGCAGAATTCATCGCGACGAGTAGGCCACAACGAGTGATTCGTAGACCTGCTCGATATACTGATACTGTGGCATATGCACTTCCAGTGATTGAGGGAGTCCCATGTACTTACAAAGATGCTGTGCAGGGGACTGAAAATCCAAAATGGAAGAGGGCCATGGATGAAGAAATGAAGTCGCTTCACAAGAATCAAACTTGGGAGTTGGTGCCGCTGCCCAAAGGAAAGAAAGCGATCGGTTGCAAGTGGATATATGGCAAGAAGGAAGATACTCAGGGAGTCAGATTCAAAGCTAGATTGGTGGCTAAAGGCTACGCACAGAAGGAAGGAATAGACTACAACGAGGTATTTTCTCCTGTTGTGAAGCATTCGTCTAT
TCGCATTTTGCTAGCTTTGGTTGCTCAGTTTAATCTTGAGTTAGCTCAACTCGATGTCAAAACCGCTTTTCTACATGGAGATTTGGAAGAAGAGATTTACATGTCACAGCCAGATGGGTTCCAGGTGCCTGGAAAAGAACATTTGGCATGTCGGTTAAAAAAGTCTCGAAGACAGTGGTATAAAAGGTTTGATTTGTTCATGGACGAGCATGGGTATACACGGAGTCAGTTTGATCATTGTGTATATTTTCGCAAACTCCAAGATGGTTCCATGATTTATTTGCTCTTATATGTGGATGATATGTTAATTGCATCTAATAGCAAGGTGGAGATTGACCGATTGAAAGCTCAACTCAGTCGGGAATTTGAAATGAAGGATCTTGGCGAAGCCAAGAAAATTTTGGGCATGGAGATTAAGAGAGACAGAGTGAAAGGTACAGTTTGGTTGACTCAATCTCAATATCTGAAAAAGGTTTTACAGAGATTTGGAATTGATAGTTCAACTAAACCTGTTAGTACACCGTTGGCCTCTCACTTCAGATTAAGTGCTTCTATATCTCCTCACACAGAAGATGAGCGAAAGCATATGGAGAATATTCCTTATGCTAATGCTGTTGGTGCCTTGATGTATGCAATGGTTTGCACAAGCCCAGATATTTCACATGCTGTTAGCATGGTCAGCAGGTATATGCACAACCCAGGAAAAGTTCATTGGCAGGCCGTGAAATGGATTTTACGCATGGTTATCAAAATCGCGATCCGGATCGTAGGATCATACGATCCCACGATCCCAAATGGTTGAATCGATCCGGATCGATAAAATAATCGCAGTGGGATAGGATCGTGATAGGATCGTTACAGGATCGTATAGGATCGTATGGGATCGTATAGGATCGTGACAGGATCGTAGTAGGATCGTTAAAGAATATAAGAATAAGAATTCTTGAATTTTTGTACTTTTGAATTCTTATAAGTTCAAACTATTAATATTTTATATGTTACTTTAGGTGCATTCAAAGCAAATAAATCGTTGACACCAAAAAAAATTGAATGATTTGGTTTTTGTTTTGCACAATTTGAAATTGAGACAAAGGCATTTTTTTCTTTTTGATATTTTAACTATTTTTTATATAATTTATGTTCATTTTCTATTAATTTTGAAGTAATTATCATAAATTAAAAAAATTATTAACCTTTTGCTCCTATTTGGTAGGATCTTACGATTCTCGATCCGATCCTACGATCCGATCCGAAAGGCCCCAAAACGATCCAAGGTAGGATCCCGATTTTGACAACCTTGATTTTACGATATATTCACGGTACAGTCAATGTTGGTTTGAAATTTCAGAGGGACAATAAGTCAAGTCAATATTCAGTTGGGTATGTTGATTCAGACTATGCCGGAGATCTTGACAAGCGAAGATCCACCACTGGTTATGTGTTCACTATGGCTGGTGGACCAGTATGTTGGCGATCTACTCTTCAGTCTACAGTTGCTTTGTCTACTACTGAGGCAGAGTACATGGCAGTGACAGAAGCCTTCAAGGAAGCAATCTGGCTTCATGGTTTGATAAATGATTTGGGAATTGATCAGGAGCATGTTGATGTCTATTGCGACAGTCAAAGTGCGATTTGTTTGGCTAAAAACCAAGTTCATCATTCCCGCACCAAACACATTGATGTTCGGTTTCATTTTATTCGAGAAATTCTGAATGAAGGAGATGTACTGCTTGAGAAGATCAGCACCAAAGACAATCCTGCTGATATGTTGACGAAGGTCGTATCTGGAATCAAGTTTAAACATTATTTGAACTTGATCAATATTTCTGAGCAGCATGGCGCCTAACGGCGCATTGGTGGCAGCATCACTCAAGTTGGGAGAAGTTTCGCCAAGGTGGAGATTGTTGATTTGTTGGCTAAATTCTTTTGGGCTCAAGCCCAATGCTAATTCTAGGCCCAAGCTTAGGCCCAAGCCCACAGAGAGCCATTGTCAAAGTTGC
AGCTTCTTCTCTTGTTGCTGCCGACAGAGGAAGTAGTCGGCCGAAAGAGGAAGAAGCCATTTGTCAACAATGGTGGCACCTCCCCTCCCAAGTCAAGCTTGGTGAGGTCATTGCTTAGGTAATTCTGTCCCTAGCCTTCTCTATATAAAGCTGCGATGATAGAGTAAAATGGCAGGGCAGAAATTAGAGAAAAATCAGAGAGAGTAGAAGGGCAGAGAGCTTGAAAGAATTCTCTCAAATTGTATTTGTATTTGTTTCTCTCCATATAATAGAATTGCTGCCACCCGAGAACGTAGGCAACATTGCCGAACCTCGTAAATTGTGTGTTTGTGTTGGATTTGTTAGTGTGTTATCAGAATTTGTTATTCCGCACAACAATTTTGTCACATACTCACCCTTTTATTTTATTTTTTTTCATTTTTAGTGCCCCCGGAAGAACTGTACGCCACTCAACTCTCACAGCTACAAGAAATGGGTTTCTTTGATACCCGAGAGAATATACGGGCGCTGATAGCCACTTCAGGGAATGTTCATGCTGCGGTGGAGCAGCTGTTGGGGGAACCTTGGTCAGTAGATAATAATCATTTGTTATTGTCCTATTCGTCTCAACATTTATTGTCTGTCGGGCCGATGAAATTGGTTTGGACCGGACTAAAGAGGATTTTTCAAAACCTATCTTGGCTATGAATTAAAAATATAGATTCGATGTTCTGAAGTTCTTGACATAAGGTATGATTGTGGGAATACCCTCTTCTATTCCCCACCCTAATAGTAAGGTGAGTGATATGTACATACACTATTAT\n>URS000039472C misc_RNA from 1 species \nTTGGAAGTAAAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTACCGAGTGCGGGCTGCCTCCGGGCGCCCAACCTCCCACCCGTGACTACCTAACACTGTTGCTTCGGCGGGGAGCCCCCTAGGGGCGAGCCGCCGGGGACCACTGAACTTCATGCCTGAGAGTGATGCAGTCTGAGCCTGAATACAAATCAGTCAAAACTTTCAACAATGGATCTCTTGGTTCCGGCATCGATGAAGAACGCAGCGAACTGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAGTCTTTGAACGCACATTGCGCCCCCTGGCATTCCGGGGGGCATGCCTGTCCGAGCGTCATTGCTGCCCTCAAGCCCGGCTTGTGTGTTGGGTCGTCGTCCCCCCCGGGGGACGGGCCCGAAAGGCAGCGGCGGCACCGTGTCCGGTCCTCGAGCGTATGGGGCTTTGTCACCCGCTCGATTAGGGCCGGCCGGGCGCCAGCCGGCGTCTCCAACCTTATTTTTCTCAGGTTGACCTCGGATCAGGTAGGGATACCCGCTGAACTTAAGCATATCAATAAGCGGAGGAA\n>URS00020CB488 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAGACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGTGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATGGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCAGAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGTGATGACGGCCTTCGGGTTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTG\n>URS0000A7B684 snRNA from 1 species 
\nGTGCATGCTACAACTTCTTGAATCCACATGCACATATACTAATATTAGAACGGTCTAGAGAAGATTAGCAGGCTTCTGTAAAAGGAAGACATAAAATTTCTGAAGCATTTCAATAGCAT\n>URS0000077F17 rRNA from 1 species \nCGTGTAGGCGGCCAGATAAGTCCGCTGTGAAAACTCGAGGCTCAACTTCGAGCTGTCGGCGGAAACTATCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAGGCGGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAGCGTGGGAGCGAACA\n>URS0000CF0C65 rRNA from 1 species \nGTGTCAGCCGCCGCGGTAACACGTAGGAGGCGAGCGTTATCCGGATTCACTGGGCGTAAAGCGCGTGCAGGCGGTTTGGTAAGTTGATCGTGAAAGCTCCCGGCTCAACTGGGAGAGGTCGGTCAATACTACCGAACTAGAGAGTAGAAGAGGAAGATGGAATTCCCGGTGTAGTGGTGAAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGATCTTCTGGTCTATTTCTGACGCTCAGACGCGACAGCTAGGGTAGTAAACGGGATTAGAGACCCCGGTAATCCTAGCCGTAAACGATGTGAACTTGGCGTCGGTGGCTTAAACACCATCGGTGCCGAAGCAAACGCGATAAGTTCACCGCCTGGGGACTACGGCCGCAAGGTTAAA\n>URS00022DC966 tRNA from 1 species \nGCTGCAATAGCTCAGATGGTAGAGCGGCTGCCTTGTAAGCAGCGGGTCGCGGGTTCGATGCCTGCTTGCAGCACCA\n>URS0001ACB2BC rRNA from 1 species \nAGAGTTTGATCATGGCTCAGATTGAACGCTGGCGGCATGCTTAACACATGCAAGTCGAACGAGAAAGTGGGCTTCGGCCCGCGATTAAAGTGGCGGACGGGTGAGTAACACGTAGGAATTTTTCCTGAAGTGGGGGACAACTCCGCGAAAGCGGAGCTAATACCGCATAATCTCTACGGAGCAAAGCAGGGGATCGCATTTCGGTGTGACCTTGCGCTTTAGGGTGAGCCTGCGGCGGATTAGCTTGTTGGTAGGGTAACGGCCTACCAAGGCGACGATCCGTAGCCGGTCTGAGAGGACGATCAGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGTGTGAAGAAGGCCTGCGGGTTGTAAAGCACTTTCAGTAGAGAAGAAATGCTCAAGGTTAATACCCTTGAGAGTTGACGTTACCTACAGAAGAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGGTGCAAGCGTTAATCGGAGTTACTGGGCGTAAAGCGTGCGTAGGCGGATATTCAAGTCGAGTGTGAAAGCCCCGGGCTTAACCTGGGAAATGCGCTCGATACTGGGTATCTAGAGTATGGTAGAGGAAAGTGGAATTTCCGGTGTAGCGGTGAAATGCGTAGATATCGGAAAGAACATCAGTGGCGAAGGCGGCTTTCTGGACCAATACTGACGCTGAGGTACGAAAGCGTGGGGAGCAAACAGGATTAGAGACCCTGGTAGTCCACGCCGTAAACGATGAGAACTAGACATTACCTTGCACTTATTTTTATCGAATGGTGAAAATAAGTGCGGGGTAGTGTCGAAGCTAACGCGTTAAGTTCTCCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCTACGCGAAGAACCTTACCTACCCTTGACATCCTCGGAATCCTGTAGAGATACGGGAG
TGCCTTCGGGAATCGAGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTGCCAGCCTCACTTCGGTGAGAGGAACTCTAAGGAGACTGCCGGTGATAAACCGGAGGAAGGCGGGGACGACGTCAAGTCATCATGGCCCTTACGGGTAGGGCTACACACATGCTACAATGGGTAGTACAGAGGGTTGCCAAACCGCGAGGTGGAGCTAATCTCACAAAACTACTCGTAGTCCGGATTGAAGTCTGCAACTCGACTTCATGAAGTCGGAATCGCTAGTAATCGCGAATCAGAACGTCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGAATTGTACCAGAAGCGGGTAGGATAACCTTCGGGAGTCCGCTCACCACGGTATGATCCATGACTGGGGTGAAGTCGTAACAAGGTA\n>URS000199E147 lncRNA from 1 species \nGGAAGTGGTTCTTAGAGGCAGTGTGTCTCCCTCTGGTGGCAGAAAAACTGGACCACAGGCTCGAGAGCAAACCACAGTCCCCTCTCGCTGCGTCCAGCTCTGTTATATAAAGCAAAAGAAACGATTTAGGAAAATAAAGACAAAGCGTCTCCTTTATAGACATATGAGCACCAATGAGCTGCGGCCTCACACCGCTGAAGGTAAATTTGTCCTACAAAGTTCAAGACTTCCTTTAGGTGACCTCAAATAAATGGAAAAGCTGTGTCTCACTTACAGAGAAGGCTTTTCCATGTTGTTTGTAAAGTAAATAACAGTCAGTGACCTAAACACGCTCACCTTCACCACGGATGCACAGTCCTCTGGATTTTTTACTTGCTAGCAACAAAATACTGAAAACATAGTGAGCTCATCTCCATGACAATGTATCAAACCTAAACCAACACATAAACACTTTAACACAGTACATTTGATAAAGCTCTAGATTTAATGCACATTCATGGGATTTTCTTTTATTAAACCTCTTATGCAGTCATATATAATAAAGCACTAACCTGAGGCTGATGCCATAAAGACTCCTGCCTGCTAGATACAACATGCCCGACTCCTTCAGCTCAGCCACTGCTTCAGGGGAGAACTTCACAACACAATTTGCATATAGCATAAGATCAGCCTTTTACTTTGTGCATGATGCAAACTTTAGTTTTCACTCTTTATTCAAGTAACAGGCCAGATGGCAAGAAAATCCACAGAGAGACACGGCAGCGGCACACCTCGCTTCCATGTTGTGACAACAGCAGCTTGTTTTAATGCTGAAACCTGCCCCTTGTAGGTGTGCACCAGGTAGGAGTCCTCTTTAAGACCTTCAGGTCTTTCAGGGAGCAGATGAGACACAGATGATCATGAGGCGGTTTTTCCGAGCACACCGGGACGAGGACTTCAGTCAGATCCAGTATCTGACGGCCAAGTGCACCCGCTTAGCTCATGACAAAGCGGTGTTGGACAGAGAGTTTCTGGTGTCCCGAGAGAGGGAGAGAAGGCTGCAGAATGATCTGGAAGCTGTGACCGCCCGACTCCTCGAGCAAGACCAGCTCAATATGGAACTCAGGATGAACCAGACCCAACTCATCAGCAGGATCCAGCAGCAGCAGGACCTGGTGAACCTGCTTCGGCAGCGCGTGGTCCTGCTAGTGGAGGCGAGCTCCCGGGATGCAGAGCTACTGCGGCAGGTCGGCGCAGAGCTGCTTTGCCTGCAGAGCTCTGAGGTGAAGCTGGAGGGCCTGGTGGAGGAGCTGCAGGCTGAGGCCCAACATAGAACTGAGGTGGCAGAAAATCTCCAGACAGAGCTGTATGCTGAGGCCCGGCACAGAGCTGCACTCACTGAGAGCCTCCACGCAGAGCTGCGCAGTAAGACAGTGGAGCTGGAAAAGCTAGAAGAAACTAACAGGACGCTGACAGAAGAGCTGACGGATCT
GCGCAGAACTTATCAGAAGGAGGTGAGAGAACTGCAGCAGGAAAATGAGGGAAGCCTGAGGAAACTTCAGGAGACGGCAGAGCAGTTCGAGTGGCTCTGTCAGCAACAGCGTTACTGGATGTCTTGTGTGAAGAGGTTCAAAGACTGCCTCATGGAGGAGAGAGAAGCTCTGCTGCGACAGGTCAGCAGGTTGGAAAAGAAAGCTGAGAAACTAAAGCGTTCACACGACGGCAGTCCAACACGGAGGCTTGTCTGCCCCCTTCAGGACGCCGAGAGCTGTGACAGCAGTATAACATCATGGGAGGCAGATGCAGTGACCAACCTGGAGTCTCAGGTGGAGAAGTCAAACGTGCTGTATGAAGAGCTCCTCGACCAGGCAGGGAGCCCTATCAACGGATACCAAAAACCTCCATGAGGACAGAAGCCTGGATGTCTTTGCTTTCTTTTCTCACCTTCTGCAAGCCAGGAGATGCAATGTTTTATGTGTTTGTGGTTAGCTTACCTTCCAGTCATTGTTTTGAAAAACCAAACACCCTTGGAAAAACACACCCGTGAAGCCACACACGCATTGTTTTGTTTCCACTATTGTTCATTGTGATATATGACCGAATTAAAATACAATGTGCTCCTGTCCCGCTTTTGGTGTCACACATGCACATCACATGTGCCTCGAGTCTGTCTGGTCACATTTTTCAGTAATTGTCCATTGTTCAAACCTTGTAATCAACACCACTAACAAGAGCACAAGCACCTGCAAATGTTCTCTTTTGTTGTTTTGCCAATGAAACGTTGCAGGACAACCAGCAGCTGGCGTGCAGAGGAAGCAACAAATGTTCTTTTCAACAAAATGAAGCTATACTGATTATCCCCCCACTGGTACAGCTTGACTCTGATGATCAGATCTCTTCATTCATCAGTTTGCATGTGGCTCACATTAAACACAGTGACTCAGACGCTTTATCATATGTGAACCATATGATACACACATATTGCAAACGCAGTTTACACACGGTGAGCCAAGACTTTTAAAGTATGCATTGTGTCACACTACAAACATTACACTGCAATCAACATGAGGAGCTACACGTTTATTCAGGACTACAGCAAACTTTCAACATGCATAAGAAATCTTAACATCACTAAACCATTAATGACACTGGAACCATCATTATATTTCATCGGTGGTGCTGGGACAACATTTTTTTCTTTGCCCACCTTAAAGTTAGCATGACAGGGGTTCGTTTGACCAACAGTGGACAAGAAGGCCTGTGTGACTTAAGCTTTGACTCCATGATCAATAGGCTTTACACAAACTACACCACAGTCTCATAGCTTTAATGGCACGACCACCAAGCTCCTGCACTCAGTCCGATGATGCTGAATAGCAAACATTTGTTTGCAAATATCAAACATATCTAAAACTTTGGGTATGTTGCTACATTTTATGTCTAAATCTCACAACCAAAAACCTGCTGACTTCATGATGAGTGAACCATTACAGTTCTTACTGGTTTCAGGGCTTGATCCAGTATTTGAGGTAATCAGTTTTTAGCCTGGAAATATTGCTAATTCTCTATGTGAAATAAAAATAATGCATATATATATATGTTCATAACTTACATGATTAAGTTATGTTGGCCCATAGCCTATCAGATCATAAATTTACATGGTGTATTGCAGAGGAGAGATAGTTGGGCATTAACCTATGAACTTTGTTATAAAAATGAAATTCCACATTTCAGAACTGGAGGACATATTGCGACTAAATCACACCAGGACCACATTCATCTTAGAGCTCTGCCTTTGCTTCATTGTAAAACCCCCATATCGAAAGGTTTCTTGACTCTTTTGCTTAGTTGTTATGGTAACAAAGTGACAGAAAAGGCAGTGACTGAATTGGTAGTTTATGCTACCGTAGCATTCTTCCTTTTGCCAAATGAATGTTTGCTCTTTAAAAATGAATTAATAACAGGTTACAAGCCTGTCTGACAGCAAATAAA
GCTCTTAACATCCACCTCAGTTCTATGAAGCAGAACTTTGTTTTGTCCAGGTAACTTTAGGGTAACCCTGG\n>URS000201C513 misc_RNA from 1 species \nGATGAAGAACGTAGCAAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCGCCAGTATTCTGGCGGGCATGCCTGTTCGAGCGTCATTTCAACCCTCAAGCACAGCTTGGTGTTGGGACTCGCGTTAATTCGCGTTCCTCAAATTGATTGGCGGTCACGTCGAGCTTCCATAGCGTAGTAGTAAAACCCTCGTTACTGGTAATCGTCGCGGCCACGCCGTTAAACCCCAACTTCTGATTGTTGACCTCGGATCAGGTAGGAATACCCGCTGAACTTAAGCATATCAATAAGCGGAGGA\n>URS00025EF403 lncRNA from 1 species \nGTGTTCTTCACTTCATGATGGAAGGGCTACTGACCCAGAGTGGAAAGTTTAGCTGGTGTTTTGATCAGGATTTCTTACCTTTTTCTTCATTAGAGAGATTCTTCTTGCTGCTGTCCTGCTTCAGAGCTGCAAGGAACACTTGGGAATGACTAAAGCGGTGTCTGTGCTGGAGTCAGAGGAGTGGCAGAGCAGGAGGCACATCTGTCTGTCGCCTTGCCTGCTGAACAACAAAGGCAGTGCTTCATAGCAGCGTGGCTTTTGGATAGGTAGCCCAAAAAAAGCAACCGTGATCAGAAATCTGGGTCGTTGTGCTTCCCCTGAGCAAGCAAAGTTAAAGATAGCTTGGGAGACGTTTGCTGCTTCTCCTGCCTATTCCTGCTGACATCCGTGGGGATTTGCTGGCATAGTGAGCTACAGGCTGGTGCACTTCAGAAGAAAAGACTCTTCATCATCCGTTCCCCAGCTAGTATCCTGGGTGGCTCTCTTCTGCTGTGTTTCTCCACCAGTTGTGGTGCCCTACAGTGTGTAACAATTCTTGTGGCTTCCAAGTAATTATTTTCAAACGCATATGAAGTAACTGAAACTGTCTTGTAAGAAGAAAAAGAAGTTCCATGAAATCTGATGCTGTGTTTAGAGGATGTTGGTGTGTTCTCAGCAGGTGCGCTTTGCCTACATGTGGATCCTCAGGGTGGAGTTTTTAATTGTTAAATGATATATGACGAATCAAATAGCACGTACAAAAGACAAAGGAAAAGAAGACGAGAAGGTAGAAAATGGGAATTCAGGGACTGGTAAATGTTCTGCACACCAACTCACAGAGTGCATTTCTAGTTTGAATGCCAGTGCCTTGCATCAGCTGGAAGAATAAGTTGATAGCTTCCTGATGCTGCTGTTCATTTGCTTTTTATTTGAGTCTGTTTTCACATGGATTATAAAGTACTGCAATCCTTTTCCTGTAAGCCTGAATGCAGAATTACATCACTTGTTTGTATGCAGTACATAGAGCTAAAGTCTCCTGGGAAATGACAAGTCGTTAGCCTGACTACTTAATCATACTGTGATATGAAGAAAAATATTTGTAACTTCACAGTCTGCCATAGAACATCTTCATGCTTTATAATGGTGTGCTCCAAATGAGAAACTGCTTAACCTTGCTTTGCAGTTCTCTCATTGTTCTGGAATTGTTGTTTGAGCAATGAAACTTAATTTGCAGTGCAGAACTATTTTAATAATAAAGAACACTTGATTTCAT\n>URS0000CAA0FA rRNA from 1 species 
\nCCTACGGGAGGCAGCAGTGGGGAATCTTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGGAGGAAGAAGGTCTTTGGATTGTAAACTCCTTTTCTCGGGGAAGAGTAGGGACGGTACCCGAGGAATAAGTCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTTTCAAGTTCGACGTGAAAGCTCCCGGCTCAACTGGGAGAGGTCGTTGAAAACTGAGGAACTTGAGGCAAGGAGAGGGGTGTAGAATTCCCGGTGTAGTGGTGGAATGCGTAGATATCGGGGGGAATACCAGTGGCGAAAGCGGCACCCTAGCCTTAGCCTGACGCTCAGGTGCGAAAGCGTGGGGAGCGAACGGGATTAGATACCCTAGTAGT\n>URS00005B6C50 rRNA from 1 species \nTACGTAGGGGGCGAGCGTTGTCCGAATTTACTGGGCGTAAAGCGCGCGTAGGCGGGTCAATAAGTTGTGGGTGAAATGCCGAGGCTCAACCTCGGCGCTGCCTGCAAGACTGTTGGTCTTGAGGTATGGAGGGGAAAGCGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCGATGGCGAAGGCAGCTTTCTGGCCATATCCTGACGCTGAGGTGCGAAAGCCAGGGTAGCGAACGGGATTAGATACCCCGGTAGTCCTGGCCGTAAACGATGGATACTAGGTGTTAGAGGTATCGACCCCTCTAGTGCCGGAGCTAACGCATTAAGTATCCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATACGTCACTAACCGTAGGACCTTACCCAGGCTTGACATCTGGAGTAAGTCCATGAAAGTGGCACCCCTGTATGGTAACATACAGCTCCAAGACAGGTGTTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCATTCCATGTTGCCAGCGTAAAGTCGGGAACTCTTGGAAAACTGCCCGTGTAAGCGGGAGGAAGGTGGGGATGACGTCAAGTCAGCATGGCCCTTACGCCTGGGGCTACACACGTGCTACAATGGACGTGAACAAAGGGCAGCGATACCGCGAGGTGGAGCTAATCTCACAAACACGTTCTCAGTTCGGATTGCAGTCTGCAACTCGACTGCATGAAGTCGGAATCGCTAGTAACCGCAGGTCAGCTAAACTGCGGTGAATACGTTCCCGGGCCT\n>URS0001C9C972 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCCGGCCCGAGAGGGTGGCCGGGCCCCATGGGCCCTGGGGACGGGCCAGGGCGCTACAGGGGGCAAGGGGGGGGAAATTTTGCCAAAGGGGCGGAGCCCGTAGAGAGCAACCCCGGGGGGGGAAGGCCGCCTTTGGGGTGGAAAACCCCTTTCGCCTGTACCGAGGCGGGGGGGCGGTTATTGGTGAAAAAGCCCCGGCTAACTTCGTT\n>URS0001CC6C7B rRNA from 1 species 
\nGTGAACGCTGGCGGTAGGCCTAACACCTGCACGTCGAACGGCAGCACAGTAAGAGCTTGCTCTTACGGGTGGCGAGTGGCGGACGGGTGAGGAATACATCGGAATCTACTTTTTCGTGGGGGATAACGTAGGGAAACTTACGCTAATACCGCATACGACCTACGGGTGAAAGCAGGGGATCTTCGGACCTTGCGCGATTGAATGAGCCGATGTCGGATTAGCTAGTTGGCGGGGTAAAGGCCCACCAAGGCGACAATCCGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATACCGCGTGGGTGAAGAAGGCCTTCGGGTTGTAAAGCCCTTTTGTTGGGAAAGAAAAGCAGCAGGTTAATACCCCGCTGTTCTGACGGTACCCAAAGAATAAGCACCGGCTAACTTCGTG\n>URS0002105CC3 rRNA from 1 species \nAGTGAACGCTGGCGGTAGGCCTAACACATGCAAGTCGAACGGCAGCACAGTAAGAGCTTGCTCTTACGGGTGGCGAGTGGCGGACGAGTGAGGAATACATCGGAATCTACTTTTTCGTGGGGGATAACGTAGGGTAACTTACGCTAATACCGCATACGACCTACGGGTGAAAGCAGGGGATCTTCGGACCTTGCGCGATTGAATGAGCCGATGTCGGATTAGCTAGTTGGCGGGGTAAAGGCCCACCAAGGCGACGATCCGTAGCTAGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATACCGCGTGGGTGAAGAAGGCCTTCGGGTTGTAAAGCCCTTTTGTTGGGAAAGAAAAGCAGCAGGTTAATACCCCGCTGTTCTGACGGTACCCAAAGAATAAGCACCGGCTAACTTCGTG\n>URS00025E055D rRNA from 1 species \nATGAGTTCCTTGCCCTGTGGATGCAAGTCACGGACATTCATCTTGACTGAGATGCCACAGACTCAATCTCCCGGTCTTGGGAAACTAGTGGTGACTTCTCTACCAAGACAACATACATGGCGAAGTTTTGGAGAAGACAAGTGTTGCCCAGGCCTGCCTTCACTTCGAAAGCAAGGGCCCCGTTGCAGTGCCATTTTTTTTGCATGGCTTGCACTTCTAACAGATGTTGGACTTCCGACCGCCTGGCATGCCGTGGCTTGGATCATCAGGAGAGTTGCCCTTTCTATGCATGGGAGAGGAGAAAACAATCGAACACATACTGCTTTAATGTGTCATCGCAAGGGAGGCGTGGACCATCATATGTCGAGCTCTAGGCAAAATGGATTGGGTACCAGAGATAGGATCAAAGTTGGTGGATTGATGCACAAACAAGCTTAG\n>URS0000DB583F tRNA from 1 species \nGGGTCCATAGCTCAGTGGTAGAGCATTTGACTGCAGATCAAGAGGTCACCGATTCGAACCCGGTTGGGCCCT\n>URS0002538569 rRNA from 1 species 
\nATGAGCAGCCGGGCTCCCAAGTTTATGCAGAACGTGCGCAGCTTCCCCGATGGTAAGCGCAACTGCTACAAGATTCGGTCCCTGGTGCGCGGGCTCAAGTACATCATCCGAGCGTGGTTCTTGTACGGCAACTACGACGGCCTTAACACATCGCCCATGTTTGACCTCTACATCGGCGCAAACTTTTGGACGACGGTGAACATGTCAGGGGGGCCATCGGACACTTATTTAACTGTAGAGGCCATGGTGGTCGTGCCGGACGACTACGTGCATGTCTGCCTGGTGAACACCGGCGATGGGACGCCGTTCATCTCGGCCCTGGAGCTGAGGCCGCTTAAGAGCATGCTCTATCCACAGGTGAGCCCGAAGCAGGGCCTGAACCTGCACCGCAGGTTAGACCTCGGCACGGGGAGTAAAACGCGCGTAATAAGGTACCCTGATGACCCACATGACCGAATATGGAGACCAGTGGATACCACCGCAGAATACCCCAGCATCACAACGTTTAGAAGGGTGCAGAACCCAAACGATGACCTTTTCCAGGTGCCGACGGAGGTGATGGAGACAGCGATGACTGCCCGGAACGCCTCCGCGCTCATAGAGATCACCATGCACCCTCAGCCTCAGCGCAACAACCCGTCGCCCGGGTACATTGCTGTCCTGCACATCGCGGAGCTAGGCATTCTCAGAGGCAACGCCGTGCGCCAGTTCTACGTCAACGTCAACGGCAAGCGATGGTACCCAGATGCTCTCACACCGAAATACCTCTCCAGTGGTGCCATCTACGGTGCCATTGTTCCCGATCAACAAGGCACCATCACCATTTCCATCGAAGCCACTGCCGGCTCGACACTGCCGCCGATTGTCAATGCTTTCGAGAGTTTCTCCGTCATGCCCACCACTAAAGTCGACACCGAGTCCGAGGAGGGTACGCCCTCGCCCACTCCCACCACTAACGCCGGGTCCAAGGATGGTAACTTCGGCTCCAACAAGTCCGAGGATGACGTTTGCATCGGTGGCAGTTCATGCAAGAAGAGTAATAAGCTTGTCCTCTACATAGCCGTCCCTATAGCCGGGCTTGTGGTGATAGGATCGGCGGCACTACTAATCTTTTGCTTGCTAAGACGGAAGAAGCAAGGATCAAGATGA\n>URS00008935E5 rRNA from 10 species 
\nAGTCGAGCGAATGGATTAAGAGCTTGCTCTTATGAAGTTAGCGGCGGACGGGTGAGTAACACGTGGGTAACCTGCCCATAAGACTGGGATAACTCCGGGAAACCGGGGCTAATACCGGATAATATTTTGAACTGCATGGTTCGAAATTGAAAGGCGGCTTCGGCTGTCACTTATGGATGGACCCGCGTCGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGCTTTCGGGTCGTAAAACTCTGTTGTTAGGGAAGAACAAGTGCTAGTTGAATAAGCTGGCACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGCAGGTGGTTTCTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGAGACTTGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGAGATATGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACACTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGAGGGTTTCCGCCCTTTAGTGCTGAAGTTAACGCATTAAGCACTCCGCCTGGGGAGTACGGCCGCAAGGCTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTCTGAAAACCCTAGAGATAGGGCTTCTCCTTCGGGAGCAGAGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGATCTTAGTTGCCATCATTAAGTTGGGCACTCTAAGGTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGACGGTACAAAGAGCTGCAAGACCGCGAGGTGGAGCTAATCTCATAAAACCGTTCTCAGTTCGGATTGTAGGCTGCAACTCGCCTACATGAAGCTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGTCGGTGGGGTAACCTTTTGGAGCCAGCCGC\n>URS0000FCD8C1 rRNA from 1 species \nTACGTAGGGTGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTTGTAGGCGGTTTGTCGCGTCTGCCGTGAAAGTCCGGGGCTCAACTCCGGATCTGCGGTGGGTACGGGCAGACTAGAGTGATGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAAGAACACCAATGGCGAAGGCAGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGCGGGGAGCGAACAGG\n>URS000055AC24 piRNA from 1 species \nTGACAAGTCCCAAGCGATAATACAGGCTA\n>URS000027137F rRNA from 1 species 
\nCCTGGCTCAGGACGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGGAGTTCTTGTGATTGAAGCTTCGGCAGATTTCACTTGAACTTAGTGGCGGACGGGTGAGTAACGCGTGAGGAACCTGCCTTCCAGAGGGGGACAACAGTTGGAAACGACTGCTAATACCGCATAATGCAGCGTGGTCGCATGACCGTGCTGCCAAAGATTTATCGCTGGAAGATGGCCTCGCGTCTGATTAGATAGTTGGTGAGGTAACGGCCCACCAAGTCTGCGATCAGTAGCCGGACTGAGAGGTTGAACGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGGGCAACCCTGACGCAGCAACGCCGCGTGAAGGAAGAAGGTCTTCGGATTGTAAACTTTTGTCTTATGGGAAGATAATGACGGTACCATAGGAGGAAGCTCCGGCTAACTACGTG\n>URS0001F1045E rRNA from 1 species \nATTGAACGCTGGCGGCATGCCTTACACATGCAAGTCGAACGGCAGCACGGGTGCTTGCACCTGGTGGCGAGTGGCGAACGGGTGAGTAATACATCGGAACATGTCCTGTAGTGGGGGATAGCCCGGCGAAAGCCGGATTAATACCGCATACGATCCACGGATGAAAGCGGGGGACCTTCGGGTCTCGCGCTATAGGGTTGGCCGATGGCTGATTAGCTAGTTGGCGGGGTAAAGGCCCACCAAGGCGACGATCAGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGAAAGCCTGATCCAGCAATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCCCTTTTGTTCGGAAAGAAATCCTTGACTCTAATACAGTCGGGGGATGACGGTACCGGAAGAATAAGCACCGGCTAACTACGTG\n>URS00007CE013 rRNA from 1 species 
\nTTGAACGCTGGCGGCATGCTTTACACATGCAAGTCGAACGGTAACAGCACTTCGGTGGCTGACGAGTGGCGAACGGGTGAGTAAGACATCGGAACGTGCCTGGTAGTGGGGGATAACTACTCGAAAGAGTAGCTAATACCGCATGAGATCTAAGGATGAAAGCAGGGGACCTTCGGGCCTTGTGCTACCAGAGCGGCTGATGGCAGATTAGGTAGTTGGTGGGATAAAAGCTTACCAAGCCGACGATCTGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGCAGGATGAAGGCCTTCGGGTTGTAAACTGCTTTTGTACGGAACGAAAAGCTCTCTTCTAATACAGGAGGGTCATGACGGTACCGTAAGAATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTTTGTAAGACAGAGGTGAAATCCCCGGGCTCAACCTGGGAGCTGCCTTTGTGACTGCAAGGCTGGAGTGCGGCAGAGGGGGATGGAATTCCGCGTGTAGCAGTGAAATGCGTAGATATGCGGAGGAACACCGATGGCGAAGGCAATCCCCTGGGCCTGCACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCAACTGGTTGTTGGGAATTAACTTTCTCAGTAACGAAGCTAACGCGTGAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGATGATGTGGTTTAATTCGATGCAACGCGAAAAACCTTACCCACCTTTGACATGGCAGGAACTTACCAGAGATGGTTTGGTGCTCGAAAGAGAACCTGCACACAGGTGCTGCATGGCCGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGCCATTAGTTGCTACGAAAGGGCACTCTAATGGGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATAGGTGGGGCTACACACGTCATACAATGGCTGGTACAAAGGGTCGCCAACCCGCGAGGGGGAGCCAATCCCATAAAGCCAGTCGTAGTCCGGATCGCAGTCTGCAACTCGACTGCGTGAAGTCGGAATCGCTAGTAATCGTGGATCAGAATGTCACGGTGAATACGTTCCCGGGTCTTGCACTCACC\n>URS00018E2463 rRNA from 1 species \nGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCAACGCCGCGTGAAGGAAGAAGTATTTCGGTATGTAAACTTCTATCAGCAGGGAAGAAAATGACGGTACCTGACTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGGTGGTATGGCAAGTCAGATGTGAAAGCCCGGGGCTCAACCCCGGGACTGCATTTGAAACTGTCAGACTAGAGTGCAGGAGAGGTAAGTGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTACTGGACTGTAACTGACACTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGAAACCCCAGTAGTCC\n>URS000076782D rRNA from 1 species 
\nCGGATTTCTGGGTACCGGTTAATGCGTAATATCAGAAGAACACCCATGGCGAAGCAGCCAACTGGGCCAATACTGACGCTGAGGTACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCTACTTGTCGTCGGGAGGGCTAAACCTTTCGGTGACGGAGCTAACGCATTAAGTAGACCGCCTGGGGAGTACGGCCGCAAGGTTGAATCTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAAAACCTTACCTGGCCTTGACATCCTGCGAACTTTCTAGAGATAGATTGGTGCCTTCGGGAGCGCAGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCTTTAGTTGCCAGCACGTTATGGTGGGAACTCTAAAGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTATGGCCAGGGCTACACACGTGCTACAATGGTCGGTACAGAGGGTAGCCAAACCGCGAGGTGGAGCCAATCCCATAGAGCTGATCTTAGTCCGGATTGCAGTATGCAAATGGACATGTCATGAAGTCGTCCTCTATAGTGATTCGTG\n>URS0002117D6C rRNA from 1 species \nATTGAACGCTGGCGGCGGGCCTAACACATGCAAGTCGAACGGTAACAGGAAGCAGCTTGCTGCTTTGCTGACGAGTGGCGGACGGGTGAGTAATGTCTGGGAAACTGCCTGATGGAGGGGGATAACTACTGGAAACGGTAGCTAATACCGCATAACGTCGCAAGACCAAAGAGGGGGACCTTCGGGCCTCTTGCCATCGGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAACGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGGGGAGGAAGGGAGTAAAGTTAATACCTTTGCTCATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTG\n>URS0001747A8B rRNA from 1 species \nAGTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGGATGAGTGGAGCTTGCTCCACCCTTCAGCGGCGGACGGGTCAGTCATGCCTAGGAATCTGCATGGTCGTGGGGGACAACGTTTCGGAAGTAACGCTAATACCCATACGTCCTACGGGAGAGAGCAGGGGACCTTCGGGCCTTGCGCTATCAGATGAGCCATGGTCGGATTAGCTAGTAGGTGAGGTAATGGCCCACCTAGGCGTCGATCCGTAACTGGTCTGAGAGGATGATCAGTCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGTCTTCGGATTGTAAAGCACTTTAAGTTGGGAGGAAGGGCAGTAAGTTAATACCTTGCTGTTTTGACGTTACCAACAGAATAAGCACCGGCTAACTTCGTGCCAGCCGCCGCCGTAACAC\n>URS00004DFF5E rRNA from 1 species 
\nGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATGCTAATGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTTTAAGGGTGTCTGCTTCTAGTGTCCTACGTGACTCTAAAGTTGCAGACTCCCCTTATTTTGCCTCAGTGCTCGGTTGGGATTCATTTCTCGATCGGGCTTCCGGGGCGTGTTTACTTTGAGAAAATTAGAGTGTTCAAAACAGTCTTGTGATTGTATATCATAGCATGGAATAATAACTGATGACGTCGGTCATTTTTTGTTGGTTCGGATGGCTGAAGTAATGATTGATAGAGTTAGTCGGAGGTATTAGTATTTTATCGTTAGAGGTGAAATTCATGGATCGGTAAAAGACTAACAACTGCGAAAGCATTTATCTAGGATTTGCTCTTTGATCAAGAACGAAAGTTGGGGGATCGAAGACGATCAGATACCGTCGTAGTCTCAACTATAAACTATACCAGCTAGGGATTGGTGGGCGTTGCTTGACCTCATCAGAACCTTATGAGAAATCAAAGCATTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACAAGTTGTGGATCCTGTGGCTTAATTTGACTCAACACGGGAAAACTTACCAGGTCCAGACATAGCAAGGATTGACAGATTGATAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGGTTAATTCCGTTAACGAACGAGACTATTACCTGCTAAATAGTATGCCCGGGCCTTTGGCGCGGGCTTACTTCTTAGAGGGACTAGCCATCTGTTAAGTGGCTGGAAGTTAGTAGCAATAACAGGTCTGTGATGCCCAAGGGCGATTCGTTAAAACTGCAGGA\n>URS00008EA5F3 rRNA from 1 species \nGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCGACGCCGCGTGAGGGATGACGGCCTTCGGATTGTAAACCACTGTCGCGAGGGACGAAAATCTGACGGTACCTCGAAAGGAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGGTGCGAGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGCCGGGTGAGTAGGGGGTGAAATCCCACAGCTCAACTGTGGGGCTGCCTTCTAGACTGCTTGGCTCGAGCACGGTAGAGGCTGGTGGAATTCCCGGTGTAGCGGTGGAATGCGTAGAGATCGGGAAGAACATCGGTGGCGAAGGCGGCCAGCTGGGCCGTTGCTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAA\n>URS0000EF886C tRNA from 1 species \nCGGCAATTAGCCGGTCTGAACAGCAGTTCTCAACGCCCTGTTTGAACTTTCTCCAGTACCAATGGTCAGAGTCGTCGTACTTTTCAGGAAACAGCAGACTTTCTGGGTTGTTTCTGAAGAACATTCCACGACCTTGCCTATCAATGCCAT\n>URS0000B48067 misc_RNA from 1 species 
\nATCGCCTCCAGTTCAACCCACTGCTTGCTTCCTTATTGCCTATGCCCATCTCCCTACCTGCTCCCATTGGATCTGGGGCGCTGCCAAGTCTCAAATCCTCTTCTTTTAGCTAAGAGTTGTGTAGTTAGGGCCATAGAGAACAATGTTGTCGGTCACTAATCACTGCCCAATTTAGTTGCATTATAATTTTGAACCCGTGTTCAGACCCAGGTTGGTCCTGCCCTGCCGTCCTCGTCCTCACCATATTAGTCCATTTGGATTTTATTTGCCAGTACAAGTCATGGTCAAACTCGAGTCAAACTCTTCCTAAGCCTGTCCAAACAAGCTGTGCCAAAACAAGGACCAATAATCTCAATTTTCCCATAATACCCTCCCTTCAGACGACGTCGTTTCCTTCATTGCCTTTTGATATGCTGTGACCACATCACGTCACCTCTACTGCTCTCTTTATAAAAAGCCTAAACACGTGCTTCAACACCGCGATCCCGGAACACGGCCCTTCAGTGGCATCCTCGTTATTTGCAATCTTTTCGAGGTCAAATTCCTTACCTCTCTGTGTTTAGCTCACCTTCCCCGACCCACCCTTTCATATAACTACTCTTGCTGCCTCTTGACCAGAAACTCAGAACAAAACTTGAAGTCCGGTTCACCCTGTTTGCCTCTCGAGAAAATTTCTAATCGAGAAGAGTTTCTATCGATTAGCTTTTCTGGCTCTGTTGCAGTAGTAGTGTTGAGGGAGCTTCGTCGGAAAATGACGTCGGGGACGAGAATGCCGACGTGGAAGGAGAGAGAGAATAATAAGAGAAGAGAGAGGAGAAGAAGGGCGATCGCGGCGAAGATCTATGCTGGACTGAGAATGTATGGAAATTACAAGCTCCCTAAGCACTGCGACAATAATGAAGTCCTTAAAGCTCTCTGCAACGAGGCCGGTTGGACAGTTGAAGAAGACGGCACCACTTACAGAAAGGGCTGCAAACCTGTCGAACGTATGGACATTATTGGAGGGTCTGCGTCAGCAAGTCCGTGCTCATCCTATCACCCAAGTCCATGTGCGTCTTATAATCCAAGTCCTGGATCATCTTCTTTCCCTAGTCCTGTTTCATCCTGTTACACTGCCAATACTAATGGTAAGGCTGATGCCAATTCCCTCATCCCATGGCTTAAAAACCTCTCATCTGGCTCATCATCAGCCTCATCCAAGCACCCTTACCATCTCTTCACTCACAGTGGTTCCATAAGTGCTCCAGTCACCCCTCCATTGAGCTCCCCAACTGCTCGAACTCCGCGTGCCAAAAATGACTGGGATGACCCGGCGGCTGGTCCATCATGGGCAGGTCAGAATTATTCGTTCCTGCCCTCATCTATGCCGTCATCTACCCCACCAAGTCCTGGCCGTCAGGTCCTGCCTGATTCAGGATGGCTAGCTGGTATTGAAATTCCCCTAAGTGGACCATCATCACCCACATTTAGCCTTGTTTCACGGAACCCATTTGGCTTCAGAGATGAGCCTCTATCTGGTGCTGGATCGCGAATGTGGACTCCTGGGCAAAGCGGGACATGCTCTCCTGCTGTTCCTGCAGGTGTTGACCAGACAGCAGATGTTCCAATGCTAGACAGTATGGCAGCTGAGTTTGCATTTGGAAGTAACACAACAGGGTTAGTGAAACCTTGGGAAGGAGAGAGGATCCATGAGGAATGTGTATCTGATGATCTTGAGCTTACACTTGGAAATTCTAGGACCAGATGAGGGGGAACTGACAGAAAGGGTGAGAATGAATTATCCTCGGATTTCTTGATTTGGCTTCTTGCTTCCCTTTATGTTTCATGTCAATGACTTCATATTGTGCATGCTTCGGTTGGCAGAGAGCTGAGATAGAGGTACAGTGAGTAGGAGCACCTGTTCCTTTTTTCTTGTTCTATTATTTTTTACTTTTTGGTTTGCTTTTCC\n>URS0000F753B8 rRNA from 1 species 
\nTACGTAGGCAGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGAGCTCGTAGGCGGTTTGTCGCGTCTGCCGTGAAAGTCCGGGGCTCAACTCCGGATCTGCGGTGGGTACGGGCAGACTAGAGTGATGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCAGGTCTCTGGGCATTAACTGACGCTGAGGAGCGAAAGCATGGGGAGCGAACAGG\n>URS00004B85F5 rRNA from 1 species \nGATGAAGGTTTTCGGATCAAAAAGTTCTGTTGTTAGGGAAGAACAAGTACCGTTCGAATAGGGCGGTACCTTGTTGGTATTTTAACAGAAAGCCACGGCTAACTACGGGCCAGCAGCCGCGGTAATACGTAGGCGGCCCGCGTTGTCCCGGAATTATTGGCCGTAAAGGGCTCGCAGGGCGGTTTCTTAAGTCTGATGTGAAAAGCCCCCCGGCTCAACCGGGGAGGGTCATTGGGAAACTGGGGGAACCTTGAGTGCAGAAGAGGAGAGTGGAATTCCCACGTGTAGCGGTGAAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCCGCCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCCGCCCTGGGGGAGGTACGGGTCGCAAGACTGAAACTCAAAGGAATTTGAACGGGGGCCCCGCAACAAGCCGGTGGGAGCATGTGGTTTAATTCGGAGGCAACCGCGGAAAGAGCCTTACCAGGGTCTTGGACGATCCTCTGGACAGTCCTTAGAGATAGGGACGTC\n>URS00022660AC lncRNA from 1 species \nCTAGAATTACTTTTCTTAGTGAATTAAGTCCATAGGAAGCAGTTTGACGGAAGTATGAGTGCCAAGAATGGTTCCAAAAATTCTGATTGGAGAATAGGACTTTCACAAATATGCCATGTGAAAAGCAACCTGTTGAGCTGGATAATGATGTGCTGAGAGTTGCTGTTGAGAGAAATCCAGAAGCAGCAATCAAGGAATTGGTCACAATTGTCCATTCATTCATTTCAACTTTCAGAGGCTTCTACAGGACTTTGATTGTGTGTCAAAAATGGATAATGAGTTTCAGCCACAAAATCTGTGACCTAGCATGTAAATATTTGCATTTCCTTGCTCTCCCATGAAAAGAGAGAGTTGTTTTTGAAAAGAGTGGTTATGGGAAATAAAAAATGTTTTCACAAATGTCCG\n>URS00003A7160 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTAGAACGCACAGGATGCACCGTAGTTTACTACACCGTATTCTGTGAGTTGCGAACGGGTGAGTAACGCGTAGGTAACCTGCCTGGTAGCGGGGGATAACTATTGGAAACGATAGCTAATACCGCATAAGAACATTTACTGCATGGTAGATGTTTAAAAGGCGCAAATGCATCACTACCAGATGGACCTGCGTTGTATTAGCTAGTAGGTGAGGTAACGGCTCACCTAGGCGACGATACATAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATTTTCGGCAATGGGGGGAACCCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAGCTCTGTTGTTAAGGAAGAACGAGTGTGAGAATGG\n>URS0000C46E39 snRNA from 1 species 
\nATCTTTGCGCTTGGGGCAATGACGCAGTTGGTGAGATGAAACCGAGACGCGTCAATTGCTGGTTGAAACTTTCCAAACATCTATATTTAGAATGTCTAATCTACAAAGATCCGGTGATGATGGATATTTCACATGAAA\n>URS0001CDBEA4 tRNA from 1 species \nGCCGGGGTGGTGGAACAGGTAGACACAGGGGACTTAAAATCCCCTTCGCCGAAAGGCGAGTGCGGGTTCGATCCCCGCCCCCGGCACCA\n>URS000118F557 rRNA from 1 species \nGACGTAGGGGGCAAGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGCTCGATAAGTCTGCTGTGAAAGTCCAGGGCTCAACCCTGGAAGGCCGGTGGAAACTGTCGGGCTAGAGTCCGGAAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCTGGAGGAACACCGGTGGCGAAGGCAGATCTCTGGGCCGTAACTGACGCTGAGGAGCGAAAGCATGGGGAGCGAACAGG\n>URS00016F7E24 rRNA from 1 species \nTACGTAGGGCGCAAGCGTTATCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGCCTGTCGCGTCGGGAGTGAAAGCCCACTGCTTAACGGTGGGTCTGCTTCCGGTACGGGCGGGCTGGAGTATGGCAGGGGAGACTGGAATTCCTGGTGTAGCGGTGGAATGCGCAAATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCATTACTGACGCTGAGGAGCGGAAGCGTGGGGAGCGAACAGG\n>URS00023D8557 lncRNA from 1 species \nGATTCTTCTTCAGCTTGTTTTCTTTTCCTTTTCTTCTTCTCTCCAGCATCAGCATTTTCAACCGCATCAACATCCTCAGCTGAATGCTTCTTCTTCTTCTTCTTTTCCTTCTTCACGGGTTCCTCTTCTGCTTCCACATTTCCATTTATGTCATTTGACGCAGGCATGTCTTCATCATCAGCCTTCTTCTTCTTTTTCTTCTCTTTCTTATCTTCTCCAGCAGGTGTCGTTTGGCCAAGAACAGAATCTGCTGCGGGATTATATGCCT\n>URS00020BFB22 rRNA from 1 species \nAGCGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACGGACCCTTCGGGGTTAGTGGCGGACGGGTGAGTAACACGTGGGAACGTGCCTTTAGGTTCGGAATAGCTCCTGGAAACGGGTGGTAATGCCGAATGTGCCCTTCGGGGGAAAGATTTATCGCCTTTAGAGCGGCCCGCGTCTGATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCGACGATCAGTAGCTGGTCTGAGAGGATGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCCATGCCGCGTGAATGATGAAGGTCGTAGGATTGTAAAATTCTTTCACCGGGGACGATAATGACGGTACCCGGAGAAGAAGCCCCGGCTAACTTCGTG\n>URS000081A35D rRNA from 1 species \nCTACGACTCTCGACAATGGATATCTCGGCTCTCGCTTCGATGAAGAACGTAGCGAAATGCGATACCTTGTGTGAATTGCAGAATCCCGTGAATCATCGAATCTTTGAACGCAAGTTGCGCCCGAGGCCTAGGCCGAGGGCACGTCTGCCTGGGTGTCGTGAAA\n>URS00004E6ABB rRNA from 1 species \nAGGAAGGAGAAGTCGTAACAAGGTTTCCGTAGGTAAACTTGCGGAAGGATCATTG\n>URS0001751255 rRNA from 1 species 
\nGACAGAGGGATCAAGCGTTATCCGGAATGATTGGGCGTAAACGCGTCTGTAGGTGGCTTTTCAAGTCCGCCGTCAAATCCCAGGGCTCCAACCCTGGACAGGCGGTGGAAACTACCAAGCCTGGAGTACGGTAGGGGCAGAGGGAATTTCCGGTGGAGCGGTGAAATGCATTGAGATCGGAAAGAACACCAACGGCGAAAGCACTCTGGCTGGGCCGACCACTGACACTGAGAGACGAAAGCTAGGGGAGCAAATGGG\n>URS000100F795 rRNA from 1 species \nTACGGGGGGGGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGGGCTCGTAGGCGGCCAACTAAGTCAGACGTGAAATCCCTCGGCTTAACCGGGGAACTGCATCTGATACTGGATGGCTTGAGTTCGGGAGAGGGATGCGGAATTCCAGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGTTCTCTGGGCCTTACCTGACGCTGAGGAGCGAAAGCATGGGGAGCAAACAGG\n>URS0001BD843F lncRNA from 10 species \nTGGGTGCCGGAGAAGCTCCATATAGTGCTAGgcccaactattccatgagctccaaactagagcgtctcacaccccctgtgtcccgtcctcctggatagctaatggatgtcttggatgtgggaaacttatccaggccagcatgggactctggatctttgccctaaacctgctcctccccaggcttcaccttctcagcagtggcatcacatccagccagctgctccagcccaaatgtgatgagatcattttgattccccttctctccacatcctctccccatattcaattcaacagcaggtgctgtcagtgctgccccagcctctgtctccctcgtgtctctccagggctgcactgtgacaaggccacggtgtctacctggacggccacagggactcccagttggtcttcctgcctctactgccgcccccgttgctctattccaacagggaaagtgtgacctcgtaagtcctgctcatcccctcccaggatttttcactgcacatggaaaggatccacctttctgcaaggtcctgcgtgacctggcacttgcctcgttttctgacgtgacctccttccctgctgccccttgttccagctgcactggccatttctccaacacaacaaatcctttctcatcatgccgcattccctgccccagaccttcacctggtggctgcctcaggttcttcaggactcaggggagatgttgtctcctcagatgccttctgggaccacctgaccaatgtggcacctcaagcc\n>URS00008EF1EE rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGGACGGGATTTATTCGACGAACCTAAGTAGTTTACTATGAGGGGGAGTTGGGTAAATTTAGTGGCGGACGGGTGAGTAACGCGTGAGGATCTATCCATTACTGGGGGACAACAGCTGGAAACGGCTGCTAATACCGCATAAGCCTTTGGGTGAAAGAAGCGATTCGGTATAGGAGGAACTCGCGTCCTATCAGCTAGTAGGTGGGGTAACGGCCCACCTAGGCGAAGACGGGTAGCCGGCCTGAGAGGGCGCACGGCCACACTGGAACTGAGATACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGGCAATGGGCGAAAGCCTGACCCAGCGACGCCGCGTGAATGAAGAAATCCTTCGGGATGTAAAGTTCTGTTGTACGGGAAGAGCGAGAGACGGTACCGTACGAGGAAGCCCCGGCAAACTACGTGCCAGCAGCCGCCGTAACAC\n>URS0001035ED5 rRNA from 1 species 
\nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGAAGTGGCGAACGGGTGAGTAACGCGTAATCAACCTGCCCTTCAGAGGGGGACAACAGTTGGAAACGACTGCTAATACCGCATACTGAAGGAGGGGATTGCGTCTGATTAGCTAGGTGGAGGGGTAACGGCCAACCAAGGCGATGATCAGTAGGCGGTCTGGGATGAAGGACCGCCAAATTGGGAATGAGACAAGGGCCAGGATCCCTAGGGAGGGAACAGTGGGGAATCTTCCGAAATGGGGGGAAGTCTGGAGGAGCAACGCCGGGTGAGTGGTGACGGTCTTCGGGTTGTAAAGCTCTGTTAATCGGGACGCGGTACCGGAATAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATAC\n>URS0001134E72 rRNA from 1 species \nAGTGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGAGAACGGAATATAGCTTGCTATATTTGTCAGCTAAGTGGCGCACGGGTGAGTAATGTCTAGATAACCTGCCCTTAAGAAAGGAATAACAGTTGGAAACGACTGCTAATGCCCTATATGCCTTTAATACATAAGTATGCAAGGGAAACGCTTTAGTGCTTAAGGATGGGTCTGTATGGTATCAGCTTGTTGGTGAGGTAATGGCTCGCCAAGGCTATGACGCCTAACTGGCTTGAGAGGATGATCAGTCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGACGAAAGTCTGATGCAGCAACGCCGCGTGGAGGATGACACATTTCGGTGCGTAAACTCCTTTTATATAGGAAGATAATGACGGTACTATATGAATAAGCACCGGCTAACTCCGTGCCAGCAGCCGCAGTAACAC\n>URS000222E680 rRNA from 1 species \nTACGGAGGGGGCTAGCGTTGCTCGGAATTACTGGGCGTAAAGAGCACGTAGGCGGGTATTCTAGTCAGGCGTGAAAGCCCCAGGCTCAACCTGGGAACTGCGTTTGATACTGGATACCTAGAGTCCGAGAGAGGGTGGTGGAATTCCCAGTGTAGAGGTGAAATTCGTAGATATTGGGAAGAACACCAGTGGCGAAGGCGGCCACCTGGCTCGGTACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAAC\n>URS00023D9DA4 lncRNA from 1 species \nCCCTCACAGCATGTGTATTTTACACATACGCACCTCCATGTCCGATCTCACGCAATTCGGCACATAAAATATTAGATCTTTTCGCGATTTAACCGTTTTGCCAATTTGACCTCTCAGCGATAACTTTGCAAATACCGGAGATCCATCCGTCGAATTTTCGATCCGACAGTACCATTGCGTTCGGCACGTCGGGTGCATCGAATCTAGCATTTCGTTTCGTCCAATTTGACCCCCGATTCACGACGAAATCCGTCCGCTCTCCAATTTCAAAAACCACACACATATATCGATGTGTAATCCCGCTAAATCCTTAATTCAAATTCAAATTTGAATCTCCTACCACTAGTAGGTACAT\n>URS0001FED5D7 ribozyme from 1 species \nACCTCGTGGAGAGCAATAAGGAAAAGCTGGTCCGTGCCCAGAGAGAGGAGCAGGAGCGGCAGATGGAGAAGGCGGCAGAGCAAGCCGGTCAACAGGCTGCAGTCCCTGACCTTGGATGGAACTCGCACCAGGGAATCGACCAGCAGATTG\n>URS0001E7E931 rRNA from 1 species 
\nATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGGATGAAGGGAGCTTGCTCCTGGATTCAGCGGCGGACGGGTGAGTAATGCCTAGGAATCTGCCTGGTAGTGGGGGATAACGTCCGGAAACGGGCGCTAATACCGCATACGTCCTGAGGGAGAAAGTGGGGGATCTTCGGACCTCACGCTATCAGATGAGCCTAGGTCGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCGTAACTGGTCTGAGAGGATGATCAGTCACACTGGAACTGAGACACGGTCCAGACGCCTACGGGAGGCAGCAGCGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGTCTTCGGATTGTAAAGCACTTTAAGTTGGGAGGAAGGGCAGTAAGTTAATACCTTGCTGTTTTGACGTTACCAACAGAATAAGCACCGGCTAACTTCGTG\n>URS00019E4D72 tRNA from 1 species \nGGCTGTGGCTCAGTGGTTGAGCGTTTGCCTCGCACGTGTGAAGCACTGGGTTCAATCCTCAGCACCA\n>URS00000CF716 rRNA from 1 species \nCCGTGTGGCGGCCCCTGTAAAAAGGTTGGAANCAACTTGGGTGGAGGGATTTTAACCGTAGAGTCGGGTTGCTTAGTACTGCAGCCCTAAGTAGGTGGTAAACTCCATCTAAGGCTAAATACTACCACGAGTCCGATATTTGACAAGTACCGTGAGGGAAAGCTGAAAAGGACTCTGAAGAGAGAGTTCAAGAGGACGTGAAACCATTAGAAGCTGAAACGGGTGGAACTGTGAAGGTGGAAAGAGGGGATTCAGGCTGTGGGCATAGACATTGGCTTGAGTTTTTGTATTGTGAATGGACCCGGCATACGAGTGAGTTGCCGGTGCTTTTCTTGCCTTTGTTTTGTGTCGGCGGGCTTAATTCTCCCTCGAGTACTAAACGTGGCGACCCGCTGGACGGACCCCGAGGGCCCTTAAGGACTGGTAGCCTATATCTTTGGTGTGGGTGATGACCTTAT\n>URS000006D2C9 rRNA from 1 species \nAGAGTGGCGAACGGGTGAGTAACACGTGAATAATCTGCCTCCGGTGTTGGGGATAACAGTTCGAAAGGACTGCTAATACCGAATAAGATGGTAGGTACAAAAGTACTAGTCATTAAAGGTGGGGACCGCAAGGCCTACCGCCTGGAGATGAGTTCGCGGCTGATTAGCTAGTTGGCGGGGTAACGGCCCACCAAGGCGACGATCAGTAGCCGGCCTGAGAGGGTGAACTTTCACATTGGGACTGAGATACGGCCCAGACTCCTACTGGAGGCAGCAGTTAAGAATCTTGCGCAATGGGAGCAATCCTGACGCAGCGACGCCGCGTGAATGATGAAGGCCTTCGGGTTGTAAAGTTCGACAAGCAGGGAAGAATAAGTGTGGGGTAATATTCCACATGATGACGGTACCTGCCTAAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTATGGGGCGAGCG\n>URS000108241F rRNA from 1 species \nTACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGTGTGCGCAGGCGGCCGCGCAAGTCGGGTGTGAAATCCCCGGGCTTAACTTGGGAATTGCGCTCGAAACTACGTGGCTGGAGTGTGGCAGAGGAAGGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCGATGGCGAAGGCAGCCTTCTGGGCCAACACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGG\n>URS0000A837F7 lncRNA from 1 species 
\nNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNCATCTAAGCTAAGGATGTCTTCACTGTAACCTCTGCCTCAGCAAGCTTTTCCCTTGCTGATCCCATCAGAACCATCCCCATTTGAGCTTCAGACTCCCCTCTGCCAACACTTAATCTTCTCTTTCAGCAAGAGTAAACAGATAACAGAATGTTCTTCCCTGAAGCTTACTAAAACTTTAAGTCCCGGTGTTATTCTCCAAAGGAAGCTGCTTTCTTCTGGCCACCAGGTCACCAGCTCCTATAGTGAGCTCTGAGCAGATTCTAGTCAGTCTCTTTAAGGGGCTGGGACTAATCGCTGTGACCTCAATCAAGCCTGCTGGTTTTATGATACCAGGAAGGCTCACCAGGTGAACTTCTGCTCCTTTTAGGAGGCTAAGCATCCCCCAGCCACCTTGGACTTGAGCAGTGTTACCTGCCAGCAAGCGCAACAGTGCCAACCACTGGTCTCTTCTTTTGGAAAACGTTTGACTTTTAACTTGCTTTCTTCTCTATTTCATCATTATCCTCCTTTCTGACTTTCATGTACTCCTAAAATTTTTGGTTGTAGAACTAAGCAAGAGAATGAGAACTGGGAAGAACCTTGGAACAATGCTGAGAGGCTGCCCAGATGCTCTTCTGTGTTCCACAGTACTGCCGAATCTTCCTTGTGGCTCTGGTACTGTACTGCCACTCAAATTTTGGTACAAACCATTGAAGTATTTTTTGCTTGTTTTTATTGGTCTACATAGTAATCTTAGTGTTCTGTTCCTGGAATAGTCTCTCAGTTAGCACATTCCCCCTTGTCCTGAGATCACCAAGACCTTCAAGATTAAGGCTCTTGCTTTCTACCCTGCCAGCTCTGACGCAAAGCAAACACCCTTTTCTACTCTGCAGTATGAAGTGCTCAGGACTGTGTTTTTAGCTGTTCAGAATGTTAGAGTTATTAATGTTGGTTAGTGGAGTTATCCTTCAGTGTAGAAAGAGAAAACTGCATGAAAAACTGGCACTAACTTAAGTGGCCTCTGACACCTTCCCTAACCCTGTCCCAGTTTGTGTCACATTCTACAATAGATGAGTGATCATGATCAGCAAAACTGTTTCTTTCTTTCCTTCATTTCTTCCTTCCTTCCTTCCTTCCTTCCTTCCTTCCTTTCTTCCTGTCTGTCTTTCTTTCTGTCTTTCTTTCTTTCTTCCTATCTATCTATCTATCTATCTATCTATCTATCTATCTATCTATCTATCTATTTATTTTGGTGTTTGTTATAGCAGAATTTGATTCATGAGAAAATCATCAGGCAGCTGGCAAGTCCCAGCTTCTCCCAAACTCTATGTAACCTGTTCCCAGCCACCTATCTTGACCCAGTGTTCCTCATGTTTTAAACTAGCTGGCAAACACATTTGCACAGCCTTATTGTGGGAACATTCAACTTGGCAATAAGTACTTTGCTCTTGATAGGATCTCAAAGATTCCTTCAGACCAAGAGAGACTCCAGCAAGCATACAGTTACAGATACTGTTGCCCAACCTGCACATCTCTGTGCCTGCCTCCCAACACAAGTCAAATGTGGGAACCAATCCCCCACCAACTACACATACACACACAAACACACACCTCTGTCCTTTTTGGTATTAGTATTCCTTTTTTTTTTTTTTTTTAAATTTCACGCATCTCTTCAAAATCTGGACCTCTGGATCTACAGCCCTGGGTCGTCATAAATAGCTCAAAAATGAGAAATCATGACTTCGGCTTTCTTTTTTAAAATTACTTTAATAAATACCCCAACATGTTCACTATACCACTGTACAGACTTTATTTGTTTGTTTGTTTGTTTATTTAAGTGCTTCCAGACCTGTAGTTTGAATATATGTAGTTCAGGGACTGTTGTTTCTAGGCATTCTACCTAGGAGTTTGTGCCTGTGGAGCATGTGGATGCCCCACCCCTCAGCTACACCCAACCCATACAGAAGTGCTGACGGG
ACTGTTTCCAGAGTTCTAGCCTGTGGTATTAAGACTTTAAAAAAAAAAAAAAATGTAATGATTTTTTAAGCCTTTTCTTTTCTGGTTGCCCTTGCAATTAAATTAAATAAAAAGAGGCATATGTTCAAAGTTTTACTGTGGCAACAGTTAAACATACAACTAAGCCCTGTCAAGAAACAATCAAGTGGGGAGATAGATGCTTAAGTCTAGAAACTGCTGTCTTCGAGAAATGTGAAAGCAGAGACCACATACTCATGATCTCCCTCACTCCCACACGGCAGCAAAGGATTCCTTTCAGCTTTACTGATTCACACTGTGGATACAGAACATTCTAGAAGGCCAGCTCTTGCTTCTCACCTGTGTTTATTGTCCAGAAAGGACAAGTCTTTAGAGACAGAGGAGGCAGTATCATCCAGGATAAGTTATTAGGCCTGGCTTGCCATTCCTTTTAATCTAGTCCTTCAGGGAGGCTGCCATCAAGGAACAAAGCCAGAGAGAATGTAGAGATAGGGCCTCTCATGGCTGGAAAGCCAAGGCCTATTGCTTCAACTTGTGTCCTTGAGGTACTGTGTCTGTACAGAAATTAAGACCCCGAGAGGCCAACAAAAAATGCAATTTAAACTGCACCTAAGATAATAAAATTGGATGAAAAGTAAAAAGAAAAAAACAGATTTCCTGGTACTAGGGTTTCCTGTAAACACCTTGTGGGTACCTCATAAGCAGCTGAGATTATTAGTGTTTGGTCCTAGTGACTATTTCAGCTGCCTTATCCACATTAGCTGCTAAGAAGTGATAACTCCCCAAGTTCCCATATAAAGTCTCTCCTGCTACCGTATTACATGGCAAGGAGAACAGGGGCTTTTGTTTGTTTGCTTGCTTGCTTGCTTGTTTTACTTCCTTGAGGTTAAAACTAGAGTCCCACCCCCACCCCAGATTAGTCTAGAGTTGGGGCAGCAGTAATAAATTAGGACGCATTCAGGTGTGACAACACAGCTACCTTTGATGGTGAAGACCTAGAGTGATTTAGTGTATCTGTGCATTAAATTAGAAAATATTTAGCAGAAACATGTAGCATAGCCGCATTTGAAAACGAGATTGTGCACTTGGGAGGCAGAAGCAGGTAGATATCGGAGTTCAAGGCCACACGTGTTCTACAGAGTGAGTTCCAGGATAGCCAGGGCTACACAGTGAAACTCTGTCTCAAAAACTCCAAGAAAATAAAAAATAAAAAAATGAGATTGCGTTTTGAAAATACTTGAAGTATTTCCTGACCTCCAGGTACCACTTTAAGCATGCTAGATATCTAGGTTGGGAGTCACTGAAGCACACCCCACAGCTATATTGGCCAGTAATGGAAAGTCCACTTTGTAGGAAGTTGATAGTGCCTGCTCCACAGACGCTGTCATTTCTTAAGCCAATCTTTAGAATCCCCAAATGTTTGGGGCAGTGAAAAACAGTAAATATACTTTGTTAATTAAAAACAGACTTTCTTTTTTAATGATATACTTTTACATGACAAATGAAAAAAAAAAAAAACTTGTAATCTGTGTCTGTCACACTAAGACACCAGATACCACAGAGAATCTCTTAAATCGCCACCAAAGAAATGGAGAGAATAAATCAAATGTTTGAAAAAATAGAGAATGGCCTTGGGAGATGGCTCAGTATGTAAAGAACTGACCACACAACTATGGGAGCCTGAGTCAGGACCCTCAGAACAGATATACATCTGGGCAGGCATAACAGCTTCCTGCCATTCCCTTGTCTAAGAACGCAAAGACAAGTGACACCCCGCCCCCACCCCCTGCAACAGGGCAAGCTGGCTAGCTGGATTAGCTCTGGCTTCAAATGGAAGGCCCTGCTCCCATTTATAAAGTGGAGAGATATTAAGGAAGATATTTGACAATAACTTTAGGTCTCCAGAGATATGTGCACACATGTACATCCACACCCAAAGTCACACATGCAAAAGAAAGTGGACTAGAATCATAGTTAGTTCT
TAGCACCTTACTGGAGTTCTTATAGTGTGGAACTCTTGTCTTATGGAACGAATGTGGTAACATTCCTACATACAGGAGATGGGTGGCCTCTCAGAGGGGCTCAAGTTTACCCAGAAGGCCAGTTAGTCTTTGAAGCTAGTCACTATTCAGTTTAATCCTTGGAGGCTAGTCTTCTTGACATGAACTGTCTGATTTTCGACACTATATATATAGAAATAGAAGTAGCAATCTATTCATTATGCCAACTTTATAGCTACTTCTGAAGACCTCATGTTGTGCTTGCCTCTCAGAAAGAGATGCCTACTCCTTACCTACTGCCTTCAGTAACAGCAGAGCTCCATGGGGCTGTCCTTCATGACATTATTCAATCCTGACATTCATTGTGGTATTAATATAAAGAAATTTAGTCTGCATACACGAGGTTTTGTGTTCCAACTTGTTTACTATCCTGAGTGTCCAGGTCCCTCATAGAGTCCAGAAGTCTCTGAAGGACTCTGAACATTGCCAAAGGCTTCAGTGAGGGAGTCTAACAGGTCACTACTAAATCAAGGCTTCTAGAGAAATGGTTTGCAGGGTGCTGCTTCAGTCAGATTATTTGCTGTTAGACACTGAGGCTCACAGTTTAGTGTGACTTAGTTCCAACTGTCCAGACTCCTTGGCTGGTAGATGTAATGCTCCGTTTTGTCATGTGAATTTGAAAGGTCACCAGGTGAGGGCAAATGAAAGCCATCACTGTGATTTGGAAATCAGCTCTCAGAAGCAGTTGAGTGACCATCCTTGGACCTTCTGCATGTCACAGTGCATTTTAGGATCTGTCATAGACAAGGCTTATGAAAGTAGCTTTTTGGGAAATTGGAAGGATAAGAGGGGTGGCTCACAGGAGCACAAATGCAGACCCACAACTCATATCAGAATTGAAACTGCTAAGTCCTCACTGCCAACTTCCCAGCTGGCTGGCTTGAAGATGACAACAGCTCAGGGAGCCTTTGAGCAAGTGAAGAAAATTAAATCCTCATTTCCCTGAAAAACTAAATTCTCAGGTGATTGCCTGACAGGGGGAAGGGGGGAATTTTTAAATCATGGCCTTTGTTGATGTTCTCTGGCTTTTTCTTGGGAGGCTGCTTCAAGCAATAACGTGAGGTATGAGGTAACCCTGTCAGGTGGTATGCTGGGCTTTTAAGTCTTGTGCAGGTTGCCTGCTTACCCACACAATTCACATAGGGGCTGAAAAGCTTAACTTATCAGGGATGGAACTAGGTTTTACAGAGTTCCTTTAACCAAATAGGCTTGCTACTTTTTCCTTTCTTCCTGCATCTGCCAAGTCTTTCCGACCATTTTCATTGATCTCACCAGATGAGTAACACTTTAAATTCCAAAGGCTTAAAAATCAACTCCTTGTCATTTTTTTCCAATTTAATTTTTCACTCTTTGTCATATTTTCATCTTCTTGCATTAGTTCCCATGGCAATGTGTCTGTTGGCAGAGAAAATTTAACTCTTTTAGTGTTGATCACAATGTAAAATCCTTTTTAGGCAAGTGCCACAAAAACAAGCAGAGACTGGAATTCTCTTGCTAATACGTTTTCTTATCTCTTATATTGATTTCCCATCCTATCCCCAAGCAAAGCTCTCACAGAAAAACATGCAGAGGCCTTTGAGGCAGCTACAGCTTCAAGGATTTAACCTTTGGCTTCCCATGGCTTCCCGTTCCAAGTGTTAAAAATATGAATGCATCTATCAGGAATGTACAGAAGACAACTTTCAATTTCTATCAGAAACACCCAGTGTATCTGAGGAAATACACACGTCCTAAAATGAGCCTCAAGTCAGGGTCTAATGGCAAGATGAGAGGCACTTAAGCAGATTTCCTCCCAGTAAGTAAATGGCAAAGAGGCCAAGCAAGCTCTAAGTTCTTGAAAGAAGCAGCAAAGACTCAGGTGGAAAGCAAATGACATGGTTACTTGTATGGGGGAAGCGGCACTTCAGTTCAGACAGTTTGTG
ATCAAGTATGAAAAAGCAAGCAACTGCATCAGGCTTGATGATGTATGCCTATGATTCCAGCAATGGAAGGTCAAAGGCAGGAGGATTACAAGTTTGAGGCCAGTCTGGGCTACATGGGAAGATCTTGCAAGGACTAGGTTTCAAGGTGCTAGGTTCAATTCCTAGGACCTAAAAGGCCTACTAAAGCCTTTAGAAATGCTTTAGAAATAGAATGTAGGGATAAAGGGAAGAGGACTATGCAGAAAGCCCAACCCAAGATTAAATGTTTGTTTCAAACTTTAGGTTCCATCATGGCTTGGCATTGGCAGCTCCTTCTACTGCTTCAGTATCCAGAAGCAACAGGTCTACTGTCAGAAATTGAACAGACTGACCCAAATATGTGTAGGATTTTTTTTTTTTAAGAAAAACTGATGAATTCAGGGGAATGAAATAGATATTAAATAAAATGTGGTTATCTTAAGTATAGTTAGGAAAAACGATCAAATGTAATTGATCTTCTTGCTTAGTCTAATGAGACACTTAAGCACTAAGCTGCTTGTATTGTATAAATGTATTTTTGGCTGTTCAAAGGTTATTTTCCTATATTAAGAAGTTTATTAAAACCTTTTATTGCAACTCAGGTTTTGTGTCTTTTAGACACACATTTTTCTTTGCTAGTTTGTTTTGCACAGCTGGAGTTTTGAGGTGGAATAATGCCTGGGCATGGCAGTCAGCTAAACTGCCTGATAGCGAGACTAAGGAAGGTACTTGACATGTGGACAAGCCACATTGTTGTTTCATAGCTCTCCATGCCTCCACTAAATACAGTTAGCCGGGAAATCTCACATGATTTTGTTTGTTTGTAAAAAGTCTCTGGAGAAACCAAGACGAATCTCTCAGGCAGATAAAGAGCTTTCCGTATTTGCCTAAACGTACTATTGAAATAAATATTATTTTCAATACTTGTTTTTCCACTCAGAGGGCACGCACTGGTCTCAGACCAGGGAGAGGACATCTGGCTTAGATCAGGACTGCTGAGTGCTGTGTAACTCTTAGGAAACTTTGTTTTGATGTCAGTGTCAACAGATTGCAAGGAATGGTTCGTATTTCTGCTCCCAACATTTCGATATTTCCTTTGCTTCCCTCCTCTGAAGAGCGAGCCTTACTGTGATATGTTTGGAGTAAAGACAAAGGCAATTGACAGGCAAACCGCACTTTTGTTGGAAGAGCCAGTTAAGTTCTCTTTGTACTCAGTGAATGTGAGGGACTGAAGGCAGATGGAGAATGTAAAACTGTTTATACATGAAGGAAGGGGCACTGTCCAGGGCTGGCAGGAAGCCAGAGGTAGATCTATTGAACTTCAAAGGGTAAGGTCATTGCAAGGTCACTACAGGTTATAGCAAAACCAGAATTTTCTTTCCTACTTACAGCCATGAAAGGGCACCTCACCATCAGCTGTGTATGAGAAACTCATACTGCAGTCTCATTCTTTTCAGGAAAGAAACATTAAGTAATTCAGATGGAAGAATAGAAAAGTAATTCTGACGGAAGACAATGGTGGGTTTACAAGAGGTTTGTAAAGAATTATACACACTACAGACTGATTTTTTTAAACACTCATGAAATTTATTTTTCACTTTCAAAACTATCAGATTGATGATTTCTTGCCCTCAGTAATTTGTGAGAGATGAACGTATTTCATTATTCTGTAAATGTTTTATGTGTCAAGCACATAAAAATTTTGAGGTCGTATTTGCCAGTTAACATTTCATTCTCATAAAAAGTCGTAAGAGAAATTCCTAAGTGGTGACGCAGCTTTGGGTCTCTTGACCATACTCTCTGATGGGATCTGGCTTCATTACCATAAGTGCGGTACCCGGGTAACAGATCTGCAGTAACCGCAGGAATCTTCCCTCAGAACCAGAACTGGGACCTCATTCCTAAATCTCCCATCTAGCTGATGACAGGTGGCAGGTGAGTGTTCCTTCTGTCCATCCTTTGCTGTCTATGTGGACATTCTG
ATATGTGTCAGTGAGCTGAATTCTACACGCTGTATATATTGCATGCATTTCACTGCAGTCTATGGACATGCCCTTTGTAGAGCTTTTATGGAAGAACCAAGAAGCCAAGGCAGTTTAGCAAACGAGGCTCAATATTTATAAACTGGGGCCTTTTCTGTCTCTTTGCTAGCCTAGGTGGCTGTATACAAACTGGGTGGGAGGGGCAGCAAACACCTCACACATCACATTTAGATTTTCTACTTGGGTGTACTCTAGCCAATTCAAAACAAATTGCTTACTTTAATAATAAAGTTTACCATTTTATATTAAAGAAAATCAAACCATGACATGTTTAATTGAACTGGCTGTATTGTAATTAATATTTTGAGATAATTGTGATTTTCAGCTTAAAATTATATATAAAAATTGTCATTTTTGTATGTGTTAAAAAAATGTACCATGATTAACAGTACTTTTTAGTTAAACTACATATTGGTGTAAATAAAACTGAATGAAGAAACACTTACTACTTTACTAACTTAGATTGTGAATGTACTTCATGGTTTTTTTGCCATATGAGACCATAACAACCTTGAAAGAAAGCTGTTTAATTTTATGTGCAAAGTCCCACTAACCTGTATTTCAACTCTGCCAAGCCAATGACTTTGCAAGTGTGATCTGTACTCTCCAGCTGTGTCTTACGTTCTGACACTATGGGTTAGGGGTAGGGTGTAGCCTGGAAGCATCTGCAGATGCGCTTTGTACAGATAATAGCGCTGTGTGGTGTATAGCAGAGCCATTTTTAGGTTCTGTTGTACTCAATTTTTTCAGAATTTAAAAAAGTGTTTTGAATAACATAAAAGTCTATTGTATAAATAATAAAATGTCACCTTATTA\n>URS0000CDA9EC sRNA from 1 species \nGTCTTAATTAAGGGAGCCCCGAGACCTTACTCTTTCACTTTACCTAGGAGTTTGGTTCCTAAACTCACCATTCAAATCCAGCAACAGAACTGATTGAAAGGAACCTTTGTCTTTTGTGTGAATGCTCATGAGGGGCCATCCTTACAGTGGAAACGCTCCTGAGGCTCCAGCGAATCAAGACTCTCAGACCCCCGGGCTGTCCCCACCCCATGACCACATGTTCCACAGGCACCCTCAGCACTGTGCCCTGCGTGTCACCCAGGCAGGTGTTTGTTTTCGAGCGCAGATTCTGCCTGTGGCCATAGCCATGTGGAGATGTTCACGCATGTACTTCCCTTTGTGATTTCAGCCGATACGGAAGATGTGTGCATCGTAGAGAGATTGTTCTCCAGCAGCCTAGTGGCCATTGTGAGCCTTAAAGCACCAAGGAAGCTAAAGGTTTGCCACTTTAAGAAGGGAACTGAGATCTGCAACTACAGCTACTCCAACACGATTCTGGCTGTGAAGCTCAACAGGCAGAGGCTGATAGTATGCCTGGAGGAGTCCCTGTACATTCACAACATTCGGGACATGAAGGTGCTGCATACGATCAGGGAGACGCCTCCAAACCCTGCAGGCCTGTGTGCGCTGTCAATCAACAACGACAACTGCTACTTGGCGTACCCAGGGAGCGCGACCATCGGAGAGGTGCAGGTCTTCGATACCATTAATTTGGTGAGATGCCTTTCCTGCTCGAATAGCTCTCTAAAGTGTGGCTTTTTCTTGAAGAGGAGCACTGTGGTGTCCCTGGCATCCTGACTTGGCTCAGCAATACAACCGCTGCACTTTTTTTTTGAGACAGGGTCTTGCTCTGTCGCCCATGCTGGAGTGCAGTGGTGCAGTCCTAGCTCACTGCAGCCTCAACCTCCCGGGCTCAAGTGATCCTCCTGCCTCAGCCTCCCAAGGAGTTACAGTCATGCAACACCACACCCAACTAATTTTTTATTTTTGTAGAGATGGAGTCTTGCTGGGTTGCCGAGGCTGGCCTCAAACTCCTGGCCTCAAGCCATCCTCCCGCCTTGGCCCCCTAAAGTGCTGGGATTACA
GGCGGGTGCCCCGCGCCCAGCCCCGCTACTCTCTTCTCAGTAGCAGAGCAGGTCTGGCTCATTCTGCTTCTGGATCTGCTGCAGCGTTCAGACCAGTGCTGAGCTCCTCGCCATGGGAATGTTTGAAGGAACATAGAAAACCTTAGGGATAAACTGCTTTGCTTTTTCTAAATTTGGAGCAGCATTTCCTTGGATGCCCAGCCCCAGTAAATCAAGTGGGTTTGGCATTTGTTTGGACCGTAATGGTGTTTTAGGAATAGCTAATTGGCACTTGCGGACCAAGTGCCAGCCCTGGGGCGTGGGCGGTCACTGTGCGGCGGCCACGCTTTATTGGTGTCCCTTTTTCAGAGAGCTGCAAACATGATTCCGGCTCACGACAGTCCTTTAGCGGCATTGGCCTTTGACGCAAGTGGAACTAAACTTGCCACGGCTTCGGAGAAGGTGAGTCTGCTTTTCCCTGGGGGAGCGCTGGTGCCAAGGCGTCCAGAGACTTTTTCAGTTCTGTTCACACAGCCAGCTTAGAGGCAAGGTCTTATACTTACCAGCTCCGGGAGAAGCGAAGACAGCCACCCGCTTGTCAGGCCATGGGCTCGTGCTGCCCGAGAGTGAGCGGAGCTTGCGGTGTGTCACTGGGACGGGAGAGCTGGTCCACGTTTGTAGTAGAAAATACAGAAATGTCCAGAGGAGACGAAGTGCCGTGTGTAACCACGCCGCTCACCCAGTGTGTTTCTAAATGATGAAACTAACACGTAACAGTAAAGAACCCAGACAGTGATAAAACGTGAAAAAGCAAGGCCAGAATTCTATCCAGCCCGTCTGAACACATTTCAGTGTATTTCCTTTCATTTTCTCTTTAGTCAACAAAATTGGGATCTTACTATGGGTATAATTTATCCTTTTTCACTCTGCATGACATTTGTCTAAGTTCAAAAACACTTGTAATGGCCGTGCAGTATTTAGTTGTGATTTATGTCAACATCACCCTTTTGGGACTTTGTTTCTAATATGTTGCTGCCGTAGGTAGTAGTGTATTTAAGTCATGTATCAATCTTTTATATGTATTTCTAACTATGAATTCAAGAGATTCCAGTAAGAAGAATGTCTGGCTTTAAAGGAGATGGCCTCTAAATGTCCCCGTATACCTGTGACCGCGTGGCGAGGCTCCCTGGCCCCCAGGAGACTGAAGGCTCCTCGTTCTCTTCCTCACTTGGACTGTGCCTCTCTTTTCGTTTCAGTTCCTCTTTTCTTGAAAGTTCCGTCTTCTCTTCTTCTGTCTTGAGGTCGCGTCTGCTCTCCCGCCTCCGTTGTCTCCTCTGGATGCCAGTCTGCTCTTCATTGCCCACCGATGACCTTTACTTTGATTTGGATATGATTTTGCTTCTCATTGAAATCCTAAAATAGCCTCCCCTTTCAAGCCATCTCTCCCCTCAAACTATCGACCAGAGAAGATACAATAAAACGTCGGCTCACTTCCTTA\n>URS0002144F5F rRNA from 1 species 
\nGCGGAGGGATCATTACACAAAAAATATGAAGGCTGCAACCGCCAGTTTTGGCGGGGAAGCTGAATTATTTTTCACCCATGTCTTTTGCGCACTTGTTGTTTCCTGGGCGGGTTCGCCCGCCACCAGGACCACACCATAAACCTTTTTTATGCAGTTGCAATCAGCGTCAGTATAACAAATGTAAATCATTTACAACTTTCAACAACGGATCTCTTGGTTCTGGCATCGATGAAGAACGCAGCGAAATGCGATACGTAGTGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCTTTGGTATTCCAAAGGGCATGCCTGTTCGAGCGTCATTTGTACCCTCAAGCTTTGCTTGGTGTTGGGCGTTTTGTCTTTGGCTTTTGCCCAAAGACTCGCCTTAAAACGATTGGCAGCCGGCCTACTGGTTTCGGAGCGCAGCACATTTTTGCGCTTGCAACTAGCTAAAGAGGCCAGCAATCCATCAAGACCTTCTTCTCACTTTTGACCTCGGATCAGGTAGGGATACCCGCTGAACTTAAGCATAT\n>URS00023B0815 lncRNA from 1 species \nATACATTCCTAATGGAACTGTCGCTGATCATCTTCATGGAAGACAGTCGAACTCTGGTTTGCTCACTTGGCCTTTTCGGTTGAGCATTGCTATAGAGACAGCCAGTGCACTTGCATACCTCCACGCTTCAGATGTCATACACCGTGATGTCAAAACCAATAACATTCTCCTAGACAACGACTTCCATGTGAAAGTGGCTGATTTTGGTTTGTCGAGATTGTTCCCAACTGATGTTACTCATGTATCGACTGCTCCACAAGGAACGCCTGGATATGTTGATCCGGAGTATTATCAATGCTACCAACTGACGGACAAGAGCGACGTTTACAGCTTTGGTGTGGTCTTGATTGAGCTGATATCAGCTTTAGAAGCAGTGGACACCAATAGGCATCGGCATGATATTAATTTGTCCATCATGGCAGTGAAAAAAATCCAAAACCATGCTTTAAATGAGTTGGTTGATCCATTTCTTGGATTTGACAAGGATTTCGTGGTGAGGAAGATGGTAACATCAGTTGCAGAATTAGCTTTCCGGTGTTTGCAACAACAGAGG\n>URS00021A59B7 tRNA from 1 species \nGGGGGCGTAGCTTAATGGTAAAGCCTCAGTCTTCCAAACTGATTACGCGGGTTCGATTCCCGTCGCCCCCTC\n>URS000061A097 rRNA from 10 species 
\nGGGCCTCTTGCCATCGGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAACGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGGGGAGGAAGGGAGTAAAGTTAATACCTTTGCTCATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATCTGATACTGGCAAGCTTGAGTCTCGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACGAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCGACTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAGTCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCACGGAAGTTTTCAGAGATGAGAATGTGCCTTCGGGAACCGTGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGGTCCGGCCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGCGCATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGACCTCATAAAGTGCGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTGGATCAGAATGCCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTAGCTTAACCTTCGGGAGGGCGCTTACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACCGTAGGGGAACCTGCGGTTGGATCACCT\n>URS0001E193C8 rRNA from 1 species \nAACGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGCGCCCTTCGGGGTGAGCGGCGGACGGGTGAGTAACGCGTGGGAACGTGCCCTTCTCTGCGGAATAGCCTCGGGAAACTGAGAGTAATACCGCATACGCCCTTTGGGGGAAAGATTTATCGGAGAAGGATCGGCCCGCGTTGGATTAGGTAGTTGGTGGGGTAATGGCCCACCAAGCCGACGATCCATAGCTGGTTTGAGAGGATGATCAGCCACACTGGGACTGAGACCCGGCCCAGACTCCTAGGGGAGGCAGGAGGGGGGAACTTGAAAAAATGGGGGCAACCCGAAGCTGGCCTGGCCGGGGGGGGGATGAAGGCCTTGGGGTTGAAAAGCTCTTTCAGCGGGGAAGATAAGAAGGGACCCAGCAAAAAAAGCCCGGGCAACCTCCGG\n>URS0000C56DA5 snoRNA from 1 species \nGAGTGGAGTGATGATTGTATTTGATTCCCTATTGGTTTGATTGCCAGTGTGATGGCACGCATTATAATAGCTTTATCTGACCACTC\n>URS0001BF6C2A lncRNA from 10 species 
\nccagcagtggcaacccgctagggtccccttccacactgtggaagctttgttctttcgctcttcacaataaatcttgctgcttctcactctttgtgtccacaccgcctttaagagctgtgacactcactgtgaaggtctgtggcttcactcctgaaatcagcgagaccatgaacccaccaagaggaatgaacaactctggacgcgccacctttaagaactgtaacattcactacgaaggtctgcggattcactcctgaagtcagcgagaccatgaacgcaccggaaggaatgaacagctctggacgtgccacttttaagagctgtaacactcactgtgaaggtctgcggcttcactcctgaactcagcaagaccacaaacccaccagaaggaagaaactctggacacatctgaacatctgaaggaacaaactctggacacaccatctttaagaattgtaacactcaccgcgagggtctgcggcttcattcttgaagtcagcaagaccaagaacccactggaagggaccaactctagacacattttggtgacccagatgggactattgcctatcgccaagcagattgaggccatcaagctacagatggtcttacgaatggaatcccaaatgagctcgactaacaacttctatagaggacccctggactgacctgctggccctttcacggcctaaagagttcccctctggaggacactatcactgcagggccccttctttgcccctgtccagcaggaagtagctagagtggtcatcgggtaattcccaacagcagttggggtgtcctgtttagaggggagatGgagaggtgaagccgactgggcttctgggtcaggtggggacttggggaaattttctgtctagctaaaggattgtaaacacaccagtcagtgctctgtgtctagctaaaagtttgtaaatgtaccaatcagcactctgtaaaaatggaccaatcagcactctgtaaaatggacgaatcagtgctctgtaaaatggataaatcagcaggatgtgggtggggccaaataagggaataaaagctggccacctgagccagcagcggcaacctgcttgggtccccttccacgctgtggaagctttgttctttcgctcttcgccgtaaatcttgctgctgctcactctttgggtctgcacaaactttaagaactgtaacactcactgcgaaggtctgcagcttcactcctgaagtcagcaagaccacgaacccaccagaaggaagaaactccggacacatctgaacatctgaaggaacaaactccg\n>URS00022B9349 lncRNA from 1 species 
\nTTCATTAGCTCAAATATATACATATGTCGAGGCACATTCCTAGGTAATATCTTCTCATTCAGATAAATAACTTCAAGTTAATATTAAAGTCATTATTCATTGATGCAGAAAAGTCTCTCCACTGTACTTTCCCAATTCTTGGGCATTCTACAAAAAATGCTCTTTCTGCAATGTATATCCCCTGAAACACAATGTTAAATTTGAAAAGGTTTAAATATTTTCCCAGCTCAAGAGAAATAAGGCAGATTTTCTATCATTGCTAGAATGAAAGGAGGTTTGTTTATCCTGTTCACTAAATCAACAACATACTTCCTGCTAATAGGATCAGAGAATGAGATGGGTAAAATGTGAAATCATTTGATTTCTTTGTTTTGTTTACACGTGTATGTTAACGAAGCATCAGATAAGAATGAGGTCTAATTTCCTCTTCTGCAGGTAGAATTTGAGTTAGGTTTCCAGAAGGACTTACCAAATTCTAGTAGCCATACACCGGTAAACAGGTCAACCTCTAGGTATTTAGAAAAACAAATGTCCTTTCCCAAACTTCTTAGTTACAGAGCCTTTCAAAAGCAGCTCATAATTTGTTCACATGTTGTTATTTGCCTAATGCACTTGATACATACTATCAGAACTGCACATAATGCCTGAGCTCTACAGATAAAAGCTAAAATGAAGGATACAATATATCTGATTTTCAGAGGCCTAGTATCATTTAAAAAGTCAGCTAACAATTCCAGACTATCTCTAGTTAGATTCTAAACACAAGAATCCATCCATCCATTCAATAAATACTTATTCAGCTAGACAATATGCAAAACCATCCCAAGGGGGTTGAGATTAAAAAAAAAAAAAAAAATCAAGATAAATCTGCCATCTTGCCACTAACAAAACATATCCAGGACAAAAAGTACTATAAGGGAAATGAGAGTGAAGAGCTTCAGCTTATGCAAAGACCCTGTACTGAATGAAAATGAGTAAATTTATGGGCCATAAAATGTAAATACATAGCATTGAAGAGAGGAAAATTCATGTAGTCCATAAAATTGGAATTCAGTAGATTGTGAGCCTTGCAAGAAAATCACTCACCATACAAGTCCTAGAAGCAAGAGGTACAGCTCTCCCATTAACCAGCTCTAGGACTTTAGATCAAGTCATTTCATTGCTCTGAGATTCTGTTTCTTCATCTGTAAAATGAGAGTTAAAATTTCTAAGCTACCTACCACTCATGATTGTCAAGGGATTATGCATGAAAAAATGCTTTACTAAACTAAATATCTCATATATACTAGTACTGGTTCAGCTTTTTTGGGGTCTTATTTTTAAATAAATAAGTTGAAATGATATTTTTTAAGATTGCATTTATTTGGGAGATTGTGCACAGACTAGCAAACTGGGTGGTGGGGGAGGAATAGAGGGAAGAGAGAGACTCGAGCAGATTCCACGCTAAGCATGCAGCTTGACACAGGGCTTGATCTCACAACCCTGAGAGTACAACCCCAGCCAAAATTAAGAGTCGGACGCTTAACCACCTAAGCCACTCAGGCACCCCAAGTTGAAAAGACTTTTAAGTTCTCTTTTTAGCACTGTAAGATTTTACGACCTAAAAACTAATCTTAACTCAATGAGTAACTAAGAGATTTCTAACTTCCTAAGCATTATTATTAGTAGCATCAATCAATAAATTACCACAGAAAAGGAGGTATGAGCTAAAACAAACTGTTCTAAAATATTGGTTAAAAAAGGAAGGGGGATGAGAATCAAAGGACATATGGAAGAAAGTTAAAATGACTATTAATAGTGAAGGAATCAAAAGTAACCCTGAGTCTGAGGGGAGAACCGAGATGACATTCTTCTGGCAATCCTTCACGACGGCAAACTATCAACTTTATAGGAAAAAGTTATTTCAATTGAAAAAGATTTCCCAAGCAAGTCTGGTGAATGAGCTTAGAATTCAAATTCATGATACAGCACTGATTCAAAAGCAAAATGTGCCAGAAA
TTGAGGGACAGGGCTCAGTATTTCCGAAAAGCGAGTTGTAAAAGGAAATTTCAGAAATCTGACTTCCGCAATTAATGCAGATGGTCTGTTAATGGTAACTCTATTTAGCACTCACTTTAATACATATTCTAAAATACTTCTTTAAAAATTACTACTACTACTACTACTGGCGATGGGTGGCTCAAGTGGTTGAGTCTGCCTTTGGCTTGACGTCAGGGTCCTGGAGTCCTGGGATCGAGTCCCACATCAGACCCCCAATGGGGAGCCTGCTTCTCTCTGTGTGTCTCTCATGGATAAATAAATAAATCTTTAAAAAGAAATTACTACTACTGTTACTTCACAATCAGACTATTCTATCATCCCTATTTTCCAATAATTAAGCATCTGGCTGGGAAAGCAAAACACAGTTAGTTACACAAAAGATAAGACAAAGGACCTACATTTCCAACAAAGCTAGACCGCATATTACACACCAACCCTCTTGCAATTAAAAAGTTAGACAAATGTATATTTTTTTTAATTCTTAAAAATATCAGAGGATATAAACTGGTGCAACCGCTTTGAAAAACTGATAGTTAACTACTGAAGCTAAATTATATCTACCAACAGCACCATACCCAGGAATACTTCCAAAAGAAGGAAGTGCATATCCGACAAAATACACATGTAAGAATGTTTGTAGCAGATTTATTATAGTAGTCCAAAATTGGAAATGATGCAAATGCCATTAAAAGTAGAATGGATAACCAAACTGTGATAGATCTGTATATGAGGCTACTACTATAGCACACTGTATTTTCCAATAATGGTGCCTACAATACTTCTGGTCTCACAAGCTCTTCCAGAACCTCAACTCCCCCCATCAAGAGGTAGAGTCCATTTCCCCTCTCTTTAAACCTCGGCAGGCTCATAACTGCTTCAAAGAGCAGAATACAATGGAAGGAAAATTGCATTAAGTTTCAAAGCCAAGTCATAAGAGGCAATCTAGTGTCTGTCTGGCCCATGGGCTCTCCACCCCACTCCACTCCCCACTGCCTGTGGGTGCAGGACACTAGCCCTTGGAACACTGCCACCGTACTATTAAGCACAGTCAGGCCACATTTAGGTGTTCCGTCATCAACCAGCAGACATGTGAGTAAACCTTCAAACACTTTTAGGCCCAGCCTTCAAACAGCCCTACTTGAAACCAAATGAAGCTAAGACAAGCATTGCACAAATTACAGTGTTGTGCAGAAAATATATGTTGTCACTGTTTAAGTCACTGAGTTGCTAGGCAATTTTTTAGGTGCTACAGTAACTACAAGTACAGTAACTACAAGAAACACTACTGCTATGTGCAACAACACAGCTGAATTTCACTGATACTATACAATGTTGAACAAAACAAGCCAGATCAGACACACGGGAGTAAAACATACCGTATGATACTATTTTGAAAAGAAAACTAAAAACTGCAAAACTGTTGACAGAAAACCAAGTAATTGCAACCTGCATCAGGAAAGGAAGATATAGATGGGGAAGGGGTGTGACAAGGTCTTCTGGGGTGGCAAAAATGTTCTACATCTTGAACTGGATATGATTACATATTTAGTTACATTCATAAAAATTCTTCAGGTTATACATTTAAGATTGGTGCACATTATTATATGTATATTATACCTTAATGAAAACGCAGGAGAGGATAGTAATCAAAGAGCTAACAAGGTAATAAGGAACTACTAGGCACAGTAGTCCAAGAGGACAGAGAGGAGCACAGCACCCTGGGGTCTCTTGTCCCCTGGAAATGCCTGCCTAATCAAAAAACTGCATGTAGGCAGGCTAGGAAAGTAGGAAGACAAAATGTCAGAGTACAAGATCCACCAAAGGAGCCATCCCTTGCTTTAGAATAAGACCCCAAAAAGCTGAATCCTGGAAGAGAGAACACAGAAGGAAACTAAACCAGTCATTGCATAGATAGACTCAAAAAAACAAACACAAAAAAAAAAAAAAAAAAAAAAAAA
AAAA\n>URS00023D8047 lncRNA from 1 species \nTAGGGTTTGATTTAGGGTTTAGGGTTTGGTTTAGGATTTGTTTGGAATTTGGTTTAAAGTTTGTTTAGAGTTTGGTTTAGGATTTAGGGTTTGATTTAGGATTTAGGATTTTATTAGGATGTAAGATTTAATTAGTTTTGGCCTAAAGTTTGAATGAAGTTCAATAGGATTTTGACTAGAATTAAATTAAGATTGAATTGAGATGTATTTGAGTGATATTTGTGATCATTCTAATATTTCTTTAAGAATTTTTATTGTTGATTTGAAATTTCTTTGAGGTTTTTTTGTATTTGATTAAGCTTGCATAGCATTATTATGGTCTAATTAGAGCATTTTTAGTATTCTATTAGAATTAGAATTTTGTTATTGTAATTTCCATTCTTTCTTGTAGAGCTAAATGCCCAGAGCA\n>URS0001D8C773 rRNA from 1 species \nTCCTGGAAATAGCCTCCCTATTAGACCGTACCCGAAACCGACACAGGTGGTCAGGTAGAGAATACCAAGGCGCTTGAGAGAACTGCGTTGAAGGAACTCGGCAAATTGCACGCGTAACTTCGGAAGAAGCGTGACCCTCACTCACGCAAGTGGATGAGGGTGGCACAGACCAGGGGGTAGCGACTGTTTATCAAAAACACAGG\n>URS00006048F4 rRNA from 1 species \nGAAATCCCTCGGGATGTAAACTTCGCAAGAACGGGAAGAATAAGTAGGGGACAATACCCCCTATGATGACGGTACCGTTTGTAAGCTCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGGGGGAGCAAGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCCAGCACAAGTCAGTTGTGAAATCTCCGAGCTTAACTCGGAAAGGTCAACTGATACTGTGCGGCTAGAGTGCGGAAGGGGCAACTGGAATTCTTGGTGTAGCGGTGAAATGCGTAGATATCAAGAGGAACACCTGCGGCGAAGGCGGGTTGCTGGGCCGACACTGACGCTGAGGCGCGAAAGCTAGGGGAGCGAACGGGATTAGATACCCCGGTAGTCCTAGCCTTAAACGATGAATGCTTGGTGTCTGGGGTTATAAAGTCCCCGGGTGCCGTCGCTAACGCTTTAAGCATTCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTCAAAG\n>URS0000A15EFB rRNA from 1 species \nAGCAGAGCACGTCCTACGGGAGGCGAGCAGTGGGGAATCTTAGAGCAATGGGGAAACCCCTGATCTAGCCATGCCGCGTGAGCGATGAAGGCCTTAGGGTTGTAAAGCTCTTTCAGCTGGGAAGATAATGACGGTACCAGCAGAAGAAGCCCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGCATGCAGGTGGTTTGTTAAGTCAGATGTGAAAGCCCGGGGCTCAACCTCGGAATTGCATTTGAAACTGGCAGGCTAGAGTACTGTAGAGGGGGGTAGAATTTCAGGTGTAGCGGTGAAATGCGTAGAGATCTGAAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACAGATACTGACACTCAGATGCGAAAGCGTGGGAGCAAACAGGATTAGATACCCTGGTAG\n>URS0001056185 rRNA from 1 species 
\nTACCAGCACCCCGAGTGGTCGGGACGATTATTGGGCCTAAAGCATCCGTAGCCGGTTCTGCAAGTCCCCCGTTAAATCCAGCTGCTCAACAGATGGGCCGCGGAGGATACTACAGAGCTAGGAGGCAGGAGAGGCAAGCGGTACTCAGTGGGTAGGGGTAAAATCCGTTGATCCATTGAAGACCACCAGTGGCGAAGGCGGCTTGCCAGAACGCGCTCGACGGTGAGGGATGAAAGCTGGGGGAGCAAACCGGGATTAGAA\n>URS000182C5B8 rRNA from 1 species \nACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGGCGGAAGCCTGAACCAGCCAAGTCGCGTGAAGGATGAAGGTATTATGTATTGTAAACTTCTTTAGATGCAGAGAAATAAGCCCCTCGCGAGGGGTGATGCTAGTATGCATAGAATAAGGATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATCCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGCAGGCGGCGCGTTAAGTCAGCGGTGAAATGCAGGGGCCCAACCCCGGCAGTGCCGTTGATACTGGCGTGCTGGAATGCGGTCGAGGCGGGCGGAATGTGGCGTGTAGCGGTGAAATGCATAGATATGCCACAGAACTCCGATAGCGAAGGCAGCTCGCCAGGCCTGCATTGACGCTCAGGCACGAAAGCGTGGGGATCGAACAGGATTAGATACCCTGGTA\n>URS0002400B5F lncRNA from 1 species \nTTTATTGATGAAGAAGGGTGTAGAAGTATTTTTGTGGTTTTTTTTTTGTAGAGAAAGGACAGGAATGTTTTTGTGTTTTTTGTTTATTATGACTGGGCCATATAGAATATGGTTGCCTACGTACTCCCGTGTATCAGGGAGATCAGGTCGACGTAGTTCACCCCTCAGGATGAATTGCAGTTGAAGAGAAGTGTGAATCCCATGTGCATGCTATACTGCGGGGAGAAGAAAGTTTGATACCATGATGGGGACAAACTGTAGGTTTGGAAAAAGTTTGATCCCGTCTTTAAGACAAACTGCAAGCGTAGAAAAGTTTAATCCCGTCTTCAGGATAAACTGCAGGTGTGAAAGGTTCAATTCCGTCTTCTGGATAACCGAAATTGTATGGAAGGTTTGAAATGAGGTGAAACTAGGCTGCTGGTTTGAAGTGTATATTTCCCTGAGGAGCAGAAGAGTATGTATAAAAGGTTAGAAACCGG\n>URS00004FA46A piRNA from 1 species \nTCTGAAACCAGAGGTACAGGTGTA\n>URS000239D036 lncRNA from 1 species 
\nAAGTGAGGGTTAATATAATTTTTCTACTCCTAATATTGGTTTTTATTTAGAAGAATCATAAACTACCGAAGTTTAAAGAGACTATGCTTTTAGATTCTAAGCCCAATGATTTGGGCATATAGTAATGGGTAAATCTTTTATGATTGGCACTGCATACATTAACGAATTGGTATGCATGCTACATATACAAAATTAATTTGCAGATCTAAATTCAGATGATGTGAGATTTATCTAACTTCATTTATACACTGACAGTATAGAAAAGTTAATCCATATTAATAGGATAAATCTTTTCTGTATCGACACTGTATACATTAGTGGATTTAGATGCATGCCACACACATAAAATCTCAGGGGTACCAAGTTATATTTCTAAAACCACAGGGGGCCAAGTGATGTTAAGAGAAACTTCAAAGGAGGTTTCTAATATTATTCCAACACATATTCAGTAGGCAAAAGATACTATTTCAATTATTTAGGTGGCAACGAGTTTTTTTTTGGCCTTATCACTGCATGTGATACTCGTGTACAAGGACAAAACTAGGGGATTAGGGCTGAAGTTTTATAGAATTCAATTTTCCTCCCTTACAAAATTACATATTGTCAAATCAAATAATCTTGCTCCCGAAAAAACCTAAAGATATTTATATTATA\n>URS00001FA05A rRNA from 1 species \nAGAGTTTGATCCTGGCTCAGATTGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGGCAGCATGAGATGGGGTAACCCATTTTGATGGCGAGTGGCGGACGGGTGAGTAATATGTAGGAATCTACCTAGAGGAGCGGGATAACTTAGGGAAACTTAAGCTAATACCACATAATCCCTACGGGGGAAAGCAGGGGACCGCAAGGCCTTGCGCCTTATGATGAGCCTACATCGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGATGATCCGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGCAACCCTGATCCAGCAATGCCGCGTGTGTGAAGAAGGCCTTAGGGTTGTAAAGCACTTTCAGTGGGGAGGAAGTTTATTGTGTTAATACCATAATGAATTGACGTTACCCACAGAAGAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGGGTGTGTAGGTGGTTGCGTAAGTTAGATGTGAAATCCCCGGGCTTAACCTGGGAACTGCGTTTAAAACTGCGTAGCTAGAGTATTGCAGAGGATAGTGGAATTTCCAGTGTAGCGGTGAAATGCGTAGATATTGGAAGGAACACCAGTGGCGAAGGCGACTATCTGGGCAGATACTGACACTGAGACACGAAAGCGTGGGGAGCAAACAGGA\n>URS0001FB0CF8 rRNA from 1 species 
\nGGGCACCGGGGGGGTGCCTAATACATGCAGTCGAACGCGTTGGCCCAATTGATTGATGGTGCTTGCACCTGATTGATTTTGGTCGCCAACGAGTGGCGGACGGGTGAGTAACACGTAGGTAACCTGCCCAGAAGCGGGGGACAACATTTGGAAACAGATGCTAATACCGCATAACAGCGTTGTTCGCATGAACAACGCTTAAAAGATGGCTTCTCGCTATCACTTCTGGATGGACCTGCGGTGCATTAGCTTGTTGGTGGGGTAATGGCCTACCAAGGCGATGATGCATAGCCGAGTTGAGAGACTGATCGGCCACAATGGGACTGAGACACGGCCCATACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGGCGCAAGCCTGATGGAGCAACACCGCGTGAGTGAAGAAGGGTTTCGGCTCGTAAAGCTCTGTTGTTAAAGAAGAACACGTATGAGAGTAACTGTTCATACGTTGACGGTATTTAACCAGAAAGTCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGATTTATTGGGCGTAAAGAGAGTGCAGGCGGTTTTCTAAGTCTGATGTGAAAGCCTTCGGCTTAACCGGAGAAGTGCATCGGAAACTGGATAACTTGAGTGCAGAAGAGGGTAGTGGAACTCCATGTGTAGCGGTGGAATGCGTAGATATATGGAAGAACACCAGTGGCGAAGGCGGCTACCTGGTCTGCAACTGACGCTGAGACTCGAAAGCATGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGATGAGTGCTAGGTGTTGGAGGGTTTCCGCCCTTCAGTGCCGGAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCTACGCGAAGAACCTTACCAGGTCTTGACATCTTGCGCCAACCCTAGAGATAGGGCGTTTCCTTCGGGAACGCAATGACAGGTGGTGCATGGTCGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTACTAGTTGCCAGCATTAAGTTGGGCACTCTAGTGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAGATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGACGGTACAACGAGTCGCGAACTCGCGAGGGCAAGCAAATCTCTTAAAACCGTTCTCAGTTCGGACTGCAGGCTGCAACTCGCCTGCACGAAGTCGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGAGAGTTTGTAACACCCAAAGTCGGTGGGGTAACCTTTTAGGAGCCAGCCGCGAAGGTGGAACAGGAT\n>URS0001125F2F rRNA from 1 species \nTACGGGGGGGGCAAGCGTTGTTCGGATTACTGGGCGTAAAGGGCGCGTAGGCGGTCAGCACAAGTCAGTTGTGAAATCTCCGGGCTTAACCCGGAAAGGTCAACTGATACTGTGCGACTAGAGTGCGGAAGGGGCAACTGGAATTCTCGGTGTAGCGGTGAAATGCGTAGATATCGAGAGGAACACCTGCGGCGAAGGCGGCATCCTGGACCGGTATTGACGCTGAGGCGCGAAAGCCAGGGGAGCAAACGGG\n>URS00020FB289 rRNA from 1 species 
\nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACAGATGAGGAGCTTGCTCCTCTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTCCCTATAAGAGTGGGATAACTTCGGGAAACCGGATCAAATACCGGATAATATATTGAACCGTGTGGTTCAATGGTGAAAGACGGTTTTGCTGTAACTTATAGATGGTTCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGGTACGATGCGTAGCCGACCGGCGAGGGGGATCGGCCACACGGGAACTGGGACACGGTCCAGGCGCCTACGGGAGGCAGCAGTAGGGAATGGTCCGCAATGGTCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACAAATGTGTAAGTAACTATGCACGTCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTG\n>URS000014A96C rRNA from 1 species \nAGCCATGCATGTCTAAGTATAAACTGCTTATACTGTGAAACTGCGAATGGCTCATTAAATCAGTTATAGTTTATTTGATGGTACCCACTACTCGGATAACCGTAGTAATTCTAGAGCTAATACGTGCGTACATCCCGACTTCTGGAAGGGACGTATTTATTAGATAAAAGGCCAGCCGAACTTTGTTCGACCTGCGTTGACTCATGATAACTTCACGAATCGCACGGCCTTGTGCCGGCGATGTTTCATTCAAATTTCTGCCCTATCAACTTTCGATGGTAGGATAGAGGCCTACCATGGTGGTAACGGGTGACGGAGGATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCCGACACGGGGAGGTAGTGACAATAAATAACAATACCGGGCATTTAATGTCTGGTAATTGGAATGAGTACAATCTAAATCCCCTAACGAGGATCCATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTTAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCGGGTGGGTGCTAGCGGTCCGGCTCTGCTGTGTACTGCTAGTGCCTATCTTTCTGTCGGGGACGGGCTCTTGGGCTTCATTGTCCGGGACTCGGAGTCGACGTGGTTACTTTGAGTAAATTAGAGTGTTCAAAGCAAGCGTTCGCTGTGAATACATTAGCATGGAATAACACGATAGGACTCTGGCTTATCTTGTTGGTCTGTAAGACCGGAGTAATGATTAAGAGGGACAGTCGGGGGCATTCGTATTTCATTGTCAGAGGTGAAATTCTTGGATTTATGAAAGACGAACTTCTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTGGGGGCTCGAAGACGATTAGATACCGTCGTAGTCTCAACCATAAACGATGCCGACTAGGGATTGGCAGGTGTTTCGTTGATGACCCTGCCAGCACCTTATGAGAAATCAAAGTTTTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGGCGGAAGGGCACCACCAGGCGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTTACCAGGTCCAGACACGGGGAGGATTGACAGATTGAGAGCTCTTTCTTGATTCTGTG\n>URS00019D9398 rRNA from 1 species 
\nTGGCGGCGTGCCTAATACATGCAAGTCGAGCGGACAGAAGGGAGCTTGCTCCCGGATGTTAGCGGCGGACGGGTGAGTAACACGTGGGTAACCTGCCTGTAAGACTGGGATAACTCCGGGAAACCGGAGCTAATACCGGATAGTTCCTTGAACCGCATGGTTCAAGGATGAAAGACGGTTTCGGCTGTCACTTACAGATGGACCCGCGGCGCATTAGCTAGTTGGTGGGGTAATGGCTCACCAAGGCGACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTTTTCGGATCGTAAAGCTCTGTTGTTAGGGAAGAACAAGTGCGAGAGTAACTGCTCGCACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGCAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCCCGGCTCAACCGGGGAGGGTCATTGGAAACTGGGAAACTTGAGTGCAGAAGAGGAGAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTCTGACAACCCTAGAGATAGGGCTTTCCCTTCGGGGACAGAGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGATCTTAGTTGCCAGCATTCAGTTGGGCACTCTAAGGTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGACAGAACAAAGGGCTGCAAGACCGCAAGGTTTAGCCAATCCCATAAATCTGTTCTCAGTTCGGATCGCAGTCTGCAACTCGACTGCGTGAAGCTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAGAGTTTGCAACACCCGAAGTCGGTGAGGTAACCTTTATGGAGCCAGCCGCCGAAG\n>URS0000FD7098 rRNA from 1 species \nTACGAAGGGGGCTAGCGTTGCTCGGAATCACTGGGCGTAAAGGGTGCGTAGGCGGGTCTTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGAAGATCTTGAGTTCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGATACTGACGCTGAGGTGCGAAAGCTAGGGGAGCAAACGGG\n>URS000131717B rRNA from 1 species 
\nTACGAAGGTGGCAAGCGTTACTCGGAATTACTAGGCGTAAAGGGCAGGTAGGCGGTTTGGTTAGTCTGTTGTGAAAGCTCCTTGCTTAACGGGGAGAGGCCAACGGATACTGCCAGACTTGAGTATAGGAGAGGGTACTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGAGATCGGGAGGAACACCAATGGCGAAAGCAGGTACCTGGACTATTACTGACGCTCAGCTGCGAAAGCTAGGGGAGCAAACAGG\n>URS000115C7E9 rRNA from 1 species \nTACGGAGGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGCTTTGTAAGTTAGAGGTGAAAGCCCGGAGCTCAACTCCGGAACTGCCTTTAAGACTGCATCGCTTGAACGTCGGAGAGGTAAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGACCGGTACTGGCGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGG\n>URS0000E4B3A6 misc_RNA from 1 species \nGCGTCCGTTTCTGTCCTGTCGTCGAGGGAAGCGCTGGGATTTATCCCAGCCGTCCCTCGACGGTCGTGTTGAGGCGTCGTCCGGGAACGGGCGTCCCTTCAAGTGCGAA\n>URS00023A6056 lncRNA from 1 species \nTACTTTGGCTAAAGACTTCCAGAATCATCGATCTATGATATCACATAGGATGTTTGCTCTCCTTATTAGGAGTGACTGATCCCTCATTGATTACTCACAACCTTCATGCATACTTTACCACATCCAAAATATCCCATATAAGGATCAAAGAATCAAGTTAGGTAGTGAACCAAAATATGGATTCATGTACACAAGGTATTATGACGATCTCAGGTCAAAGGATCACTTACACAACTCCCATT\n>URS0000CE10A7 sRNA from 1 species \nTTATTACAAAAAAATGCTGTTTAATTTCACATGATAGAGTTATATGGTAGAACGGTTTGGATTGATATTATGGAATATATACCACGCGTAAAATCTTAAAATTAAATAT\n>URS000013D6AF rRNA from 1 species \nCAAATGACTCTCGGCAATGGATATCTTGGCTCTTGCATCGATGAAGAACGTAGTGAAATGCGATACTTGGTGTGAATTGCAGAATCTCGTGAACCATTGAGTCTTTGAACGCAAGTTGTGCCCGAGGCCTTGCGGTCGAAGGCACGCCTGCTTGGGCGTCATT\n>URS0002063A20 rRNA from 1 species \nTTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGGATGAAGGGAGCTTGCTCCTGGATTCAGCGGCGGACGGGTGAGTAATGCCTAGGAATCTGCCTGGTAGTGGGGGATAACGTCCGGAAACGGGCGCTAATACCGCATACGTCCTGAGGGAGAAAGTGGGGGATCTTCGGACCTCACGCTATCAGATGAGCCTAGGTCGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCGAAACTGGTCTGAGAGGATGATCAGTCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGTCTTCGGATTGTAAAGCACTTTAAGTTGGGAGGAAGGGCAGTAAGTTAATACCTTGCTGTTTTGACGTTACCAACAGAATAAGCACCGGCTAACTTCGTG\n>URS0001992F3F lncRNA from 1 species 
\nCAGAACCGAAGATCGCTTACGTTTCCACACGGACCCGTTTTAGTGACGTACCCATCTGCCGTCAGCTTCTGTAAGTTTGGTGACTTGATTTTAATCGTGTTCTGTTCATTTACCTGCTTCCTAAACATAGGTGAACTCTTCTAATGTCTACCATAGAGACTTGCTGTAAGCTACAGACGTCTTTTCTGAATGGAGAAGATGGAGGATTATCCACTCTACTGCATCAAATGATTCCAGCATTACTGATCTGCACCCTAGAATATCCTGGAATAATCACTTGTGCAGTTTTGATGACATCTCTTGAAGTGTTATGA\n>URS0001E8D186 rRNA from 1 species \nTGAGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGCAGGAAGAAGCATCTATGGTGTGTATCCTGCTTTTGTACGGGAAGAAACACTCCTTCGTGAAGGAGCTTGACGGTACCGTAAGAATAAGGATCGGCTAATTCCGTGCCAGCATCCGCGGTTATACGGAGGATCCCAGCGTTATCCGGAATCATTGGGTTTAAAGGGTCCGTAGGCGGTTTAGTAAGTCAGTGGTGAAAGCCCGTCGCTCAACGATGGAACGGCCATTGATACTGCTAGGCTTGAATTATTAGGAAGTAGATAGAATATGTAGTGTAGCAGTGAAATGCTTAGATATTACAAGGAATACCAATTGCGAAGGCAGGTTACTACGAATGGATTGACGCTGATGGACGAAAGCGTGGGGAGCAAACA\n>URS000118D854 rRNA from 1 species \nTACAGAGGGGGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGCCTTCTAAGTCGAACGTGAAATCCCCGGGCTCAACCCGGGAACTGCGTCCGATACTGGAAGGCTTGAATCCGGGAGAGGGATGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCGGTGGCGAAGGCGGTTCTCTGGGCATTGCCTGACGCTGAGGAGCGAAAGTGTGGGGAGCGAACAGG\n>URS00010E7D1D rRNA from 1 species \nTACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCGCGTAGGCGGTGCGGTAAGTCACCTGTGAAATCTCCTGGCTCAACTGGGAGCTTGCAGGCGAAACTGCCGTGCTGGAGTGTGGGAGAGGTGCGTGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCTGTGGCGAAAGCGGCGCACTGGACCACAACTGACGCTGAGGCGCGAAAGCTAGGGGAGCAAACAGG\n>URS00009F8AF6 misc_RNA from 1 species \nCCTGTTGAAGATGGAAGAGTTGGCTGAGATGCCACGGATGTGTTTGACCCTTTTGAAAAAAAGTTGCCTGGGACATCAGTTACAGGTTGAGCAGCAGATCCAGTTGAAGCTTGATAGCCAACTTGTGAAGCAACAGGGGCAGTAGAGCCTTGTGGGAAAATGTTTTCATTGTTAAACTGTGGAGTTGGTCCTATTGCATTTTGATGAGCAACTTGTAAGCCTACTGGGGCAGCAGAACCCTGTTGTTGGAAAAGGTTTCCATTGTTAAACTGTGGAGTTGGTCCCGTTGCATGGTAAGCAGCT\n>URS0002410C40 lncRNA from 1 species 
\nCAGTCTCTCTCTAACTTTATCCTGGTATAGCATCCGTCTCTTATCCTTTATCTCTGTGAATCTCTCTCGCTAACTCTTTCTCTCTCTTGGAGCATAAAAATCCATCCATCTCAAACTTAGTGGTTTACTTCTTTACTATGTTTTTAGATAGAAAAAGAACTTGGGTATTTTGTTGTTATAGAGAAGAAAGGAAGAATAAATTCCTAAGTTCTTTATCTTTCAAAGCTTCCGCTCAACTTTAGCTTTTAACCCAAAAGAATCTCTTCATTTTGACGCGCCCACAGCCACAAAAAACAGCAACAGTAAGTCAGTCACAGAGTTGGTGGCAAAAAATCTCTTCACATCAGGATTAGGTTTGGGGATTGGGTGTGAGAGAGAAGCAGCAGGCAAATATACAAAATCTCAAAGAAGATCGAAGGATTAGGTTTGGGGATGAGCCTTAATCTGTTTTTTTTTTTTTCCTAAAAATGTTAGGC\n>URS0002280BA0 misc_RNA from 1 species \nGAAATGCGATAATTAATGTGAATTGCAGAATTCAGTGAATCATCGAGTCTTTGAACGCACATTGCGCCCCCTGGTATTCCGGGGGGCATGCCTGTCCGAGCGTCATTGCTACCCTCAAGCACGGCTTGTGTGTTGGGCTTCCGTCCCTGGCAACGGGGACCGGCCCAAAAGGCAGTGGCGGCACCATGTCTGGTCCTCGAGCGTATGGGGCTTTGTCACCCGCTCCCGTAGGTCCAGCTGGCAGCTAGCCTCGCAACCAATCTTTTTAACCAGGTTGACCTCGGATCAGGTAGGGATACCCGCTGAACTTAAGC\n>URS00016372AB rRNA from 1 species \nCAGTCGCCGCGGTAATACCGAGGGTGCGAGCGTTAATCGGATTTACTGGGCGTAAAGCGTGCGTAGGCGGCTTTTTAAGTCGGATGTGAAATCCCTGAGCTTAACTTAGGAATTGCATTCGATACTGGGAAGCTAGAGTATGGGAGAGGATGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGATGGCGAAGGCAGCCATCTGGCCTAATACTGACGCTGAGGTACGAAAGCATGGGGAGCAAACAGGATTAGATACCCGTGTAGTCCCTGTCTCTTATAA\n>URS00017BF492 rRNA from 1 species \nTACGTAGGGTCCGAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTTTGTCACGTCGGGCGTGAAAACTCAGGGCTCAACCCTGAGCGTGCGTTCGATACGGGCAGACTAGAGGTATGCAGGGGAGAACGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGATACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS00019F2EB9 rRNA from 1 species \nGGCGGGTTTCTTAAGTCTGATGTGAAAGCCCCCGGCTCAACCGGGGAGGGTCATTGGAAACTGGGAAACTTGAGTGCAGAAGAGGAGAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTCTGACAACCCTAGAGATAG\n>URS000031863D rRNA from 1 species 
\nTTGGCGGACGGGTGAGTAACGCGTGAGTAACCTGCCTTCAAGAGGGGGATAACATTCTGAAAAGAATGCTAATACCGCATAATGTCGCAAGACCAAAGAGGGGGACCTTCGGGCCTCTTGCCATCGGATGTGCCCAGATGGGATTAGCTTGTTGGTGGGGTAACGGCTCACCAAGGCGACGATCCCTAGCTGGTCTGAGAGGACGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCATG\n>URS00002862DB rRNA from 1 species \nCGGGTGAGTAACACGTGAGCAACCTGCCTTTCAGTGGGGGACAACAGTTGGAAACGACTGCTAATACCGCATAACGTGCCGGAAGGGCATCCTTTTGGTACCAAAGATTTATCGCTGAAAGATGGGCTCGCGTCTGATTAGATAGTTGGTGAGGTAACGGCCCACCAAGTCGACGATCAGTAGCCGGACTGAGAGGTTGATCGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAG\n>URS0002137456 rRNA from 1 species \nGAAAGTAAGAAAGGGCGTATGGCGGATGCCTAGGCTCACGGAGGCGATGAAGGACGTGATAAGCTGCGATAAGCTTCGGGTAGGTGCAAATAACCCTTGATCCGGAGATTTCCGAATGGGACAACCTAGCCGTCTGAAGGACGGTTACTCAATCTTCAAGGTTGAGAGCTAACGCAGGGAACTGAAACATCTTAGTACCTGCAGGAAGAGAAAATAAATGAATGATTCCCCTAGTAGTGGCGAGCGAACGGGGAACAGCCCAAACCGTTGACGTCGCAAGGCGCCAGCGGGGTTGTAGGACCGCGACATTGTATGCAAATCGTGAACAGAACACTTTGGAAAATGTGACCATAGACGGTGATAGTCCAGTATGTGAAGCGAAATGCAGCATAGCGGTATCCTGAGTAACGCGGGACACGAGGAATCCTGCGCGAATCTGCCGGGACCATCCGGTAAGGCTAAATACTCCCGTGAGACCGATAGCGAACGAGTACTGTGAAGGAAAGGTGAAAAGAACCCCGAGCAGGGGAGTGAAATAGTTCCTGAAACCATACGCCTACAAGCGGTCGGAGCATCTTACGATGTGACGGCGTGCCTTTTGCATAATGATCCTACGAGTTACCGTCACTGGCGAGGTTGAGTGTCACGAGACACGTAGCCGCAGTGAAAGCGAGCCTGAACAGGGCGCATAGTCAGTGGGGGTAGACGCGAAACCAAGTGATCTACACTTGGCCAGGATGAAGTCCCGGTAACACGGGATGGAGGTCCGCACCAATAAGCGTTGAAAAGCTTCTGGATGAGCCGAGTGTAGGAGTGAAAGGCCAATCAAACTTGGAGATAGCTCGTACTCCCCGAAAGGCATTTAGGTGCCGCGTCGGATGGTCACCGTGAGAGGTAGAGCGACCGATAGGACAAGAGGGCTTCACCGCCTATCGAGTCCTGACGAACTCCGAATGCTCACGGTCTGCAGTCCGGCAGTAAGGGGGCGGGTGCTAAGGTCCGTCCCCGAGAGGAGAAGAATCCAGACCGCCGTCTAAGGTCCCGGAGTTCTGCCTGAGTTAGTCTAACGAAGTCTGGTCCCCGCGACAGCTAGGATGTTGGCTTGGAAGCAGCCATTCATTTAAAGAGTGCGTAACAGCTCACTAGTCGAGGAGTCGGGCGTGGATAATAATCGGGTATTAAGTTGTCTACCGAAGCAGTGGGATCATTAATATGATCGGTAGGGGAGCATTCCAGTCGGCGTCGAAGGCGTACCGTGAGGTATTCTGGAGCGTCTGGAAAAGCAAATGTAGGTATAAGTAACGATAAAGGGGGCGGGAAACCCCCTCGCCGAAAGACTAAGGTTTCCTGATCAACGCTAATCGGATCAGGGTCAGTCGGGTCCTAAGGCTCAGCCGAACGGCGATGCCGA
TGGCAGAAACGGTTAATATTCCGTTACTACCTTCAGGAGTGACGTGGAGACGCAGTAGTGACAGTGCCGCCATCTGACGGAATAGATGGTTGAAGGGTGTAGGAGTCGATCATGGCAGGCAAATCCACCATGAGATCCGAACCTGATAGTATGCCGCGTCCTTCGGGACAAGGCAATAGTGCGCGTAAGCATGCTGCCGAGAAAATCCGCTAAACTTAATCCTGCAGGTACCCGTACCGCAAACGGACACACGTAGTCGGGATGAATATTCTAAGGCGCTTGAGTGATTCACGGTTAAGGAACTAGGCAAACTGACCCTGTAACTTCGGGAAAAAGGGTCCCGTCTCGCAAGAGCGGGCGCAGAGAATAGGTCCAGGCAACTGTTTAACAAAAACACAGGGCTGTGCGAAGTTTAAAGACGAAGTATACAGCCTGACACCTGCCCGGTGCCGGAAGGTTAAGAGGAGACGTCATCGCAAGAGAAGCGTTGAATTGAAGCCCCGGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGG\n>URS000140E52B rRNA from 1 species \nTACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGCCTTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAAGGTCATTGGAAACTGAAAGGCTTGAGTACAGAAGAGGAAAGCGGAATTCCACGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAATACCGATGGCGAAGGCAGGTCTCTGGGCTGACACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGG\n>URS0001C1D63F rRNA from 1 species \nAGTGAACGCTGGCGGTAGGCCTAACACATGCAAGTCGAACGGCAGCACAGTAAGAGCTTGCTCTTACGGGTGGCGAGTGGCGGACGGGTGAGGAATACATCGGAATCTACTTTTTCGTGGGGGATAACGTAGGGAAACTTACGCTAATACCGCATACGACCTACGGGTGAAAGCAGGGGATCTTCGGACCTTGCGCGATTGAATGAGCCGATGTCGGATTAGCTAGTTGGCGGGGTAAAGGCCCACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGCACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATAGGCGCAAGCCTGATCCAGCCATACCGCGTGGGTGAAGAAGGCCTTCGGGTTGTAAAGCCCTTTTGTTGGGAAAGAAAAGCAGCAGGTTAATACCCCGCTGTTCTGACGGTACCCAAAGAATAAGCACCGGCTAACTTCGT\n>URS0000AD8EAF misc_RNA from 1 species \nTGTGGGAGCGGGCTTGCCCGCGATAGCGGTGTGTCAGTCGATAGCAATGTTGGCTGGCAGTCAGTCATCGCGGGCAAGCCCGCTCCCACA\n>URS000009FFA8 rRNA from 1 species 
\nAGTCTCAGATAGCCATGCATGTCTAAGTATAAACGCTTTATACTGTGAAACTGCGAATGGCTCATTATATCAGTTATAGTTTATTTGATAATCTCTTACTACTTGGATAACCGTAGTAATTCTAGAGCTAATACATGCATAAATACCTAACTTTCGGGAAGGGTAGTATTTATTAGATTGAAACCAATTGATCTCGGTCATATTGTGGTGATTCATAATAACTTTGCGGACCGCATGGCTTTACGCCGGCGGTAGATCATTCAAGTTTCTGCCCTATCAGCTTTGGATGGTAGGGTATTGGCCTACCATGGCTTTAACGGGTAACGGAGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAGACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGTAAATTACCCAATCCTGACACAGGGAGGTAGTGACAATAAATAACAATGCCGGGCCTTTTTAGGTCTGGCAATTGGAATGAGAACAATTTAAATCCCTTATC\n>URS0001F65059 rRNA from 1 species \nGATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCTCCTGCTTGCAGGGGTACTCGAGTGGCGAACGGGTGAGTAACACGTGGGTGATCTGCCCTGCACTTCGGGATAAGCCTGGGAAACTGGGTCTAATACCGGATAGGACCACATTTTGGATGGTGTGGTGGAAAGTTTTTCGGTGTGGGATGAGCTCGCGGCCTATCAGCTTGTTGGTGGGGTAATGGCCTACCAAGGCGTCGACGGGTAGCCGGCCTGAGAGGGTGTACGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAGGCCTGATGCAGCGACGCCGCGTGGGGGATGACGGCCTTCGGGTTGTAAACTCCTTTCGCTAGGGACGAAGCGCAAGTGACGGTACCTGGAGAAGAAGCACCGGCTAACTACGTG\n>URS000066A79F rRNA from 1 species \nAGCTATGGCTCTGTTGTATTAGGGATGTAGGCAGTTTCTTTCTCGTCTGATCTCGGAAGCTAAGCAGGGTCGGGCCTGGTTAGTACTTGGATGGGAGACCGCCTGGGAATACCGGGTGCTGTAGGCT\n>URS0000B505A9 rRNA from 1 species \nTACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTCGTTAAGTTCGTTGTGAAAGCCCCGGGCTCAACCTGGGAACGGCAATGGAAACTGGCGGGCTTGAGTGCGGCAGAGGGGGGTGGAATTCCGCGTGTAGCAGTGAAATGCGTAGAGATGCGGAGGAACACCGATGGCGAAGGCAGCCCCCTGGGCCGACACTGACGCTCAGGCACGAAAGCGTGGGGAGCAAACAGG\n>URS000084F4BB rRNA from 1 species 
\nACCTGGCTCAGGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGGACAGAAGGGAGCTTGCTCCCGGATGTTAGCGGCGGACGGGTGAGTAACACGTGGGTAACCTGCCTGTAAGACTGGGATAACTCCGGGAAACCGGAGCTAATACCGGATAGTTCCTTGAACCGCATGGTTCAAGGATGAAAGACGGTTTCGGCTGTCACTTACAGATGGACCCGCGGCGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCGACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTTTTCGGATCGTAAAGCTCTGTTGTTAGGGAAGAACAAGTGCAAGAGTAACTGCTTGCACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGCAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCCCGGCTCAACCGGGGAGGGTCATTGGAAACTGGGAAACTTGAGTGCAGAAGAGGAGAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTCTGACAACCCTAGAGATAGGGCTTTCCCTTCGGGGACAGAGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGATCTTAGTTGCCAGCATTCAGTTGGGCACTCTAAGGTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGACAGAACAAAGGGCTGCGAGACCGCAAGGTTTAGCCAATCCCACAAATCTGTTCTCAGTTCGGATCGCAGTCTGCAACTCGACTGCGTGAAGCTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAGAGTTTGCAACACCCGAAGTCGGTGAGGTAACCTTTATGGAGCCAGCCGCCGAAGGTGGGGCAGATGATTGGGGTGAAGTCGTAACAAGGTTA\n>URS0002524E6B rRNA from 1 species \nATGGTCGTAGCAGTTGCGATATGGATCATAGGATTCTTTTCTGTTCGCCGCAGGAGTATTTTACCTGTAAAGTTGCGATGCCGATCAAAATGCTGCTTGTTTTCTCTTCTTCCCCACATGGCCACGCCCACCGGATCTTGGACTTCACACCTCTTTCCATTATTTTTAGTTCCCGTTGGAGCGTATCTGTACGTCTGCACCTCAACAAGAATGTTCTCTCACTGGTATTTGATTAATACTACCACTAGTTTTTTGGAGAATGTTTGGTAA\n>URS00020B9359 rRNA from 1 species 
\nGACGAATGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTGCAGGGTACTCGAGTGGCGAACGGGTGAGTAACACGTGGGTGATCTGCCCTGCACTTCGGGGTAAGCCTGGGAAACTGGGTCTAATACCGGATAGGAACCATTTTTAGTGTGATGGTTGGAAAGTTTTTTCGGTGTAGGATGAGCTCGCGGCCTATCAGCTTGTTGGTGGGGTAATGGCCTACCAAGGCGGCGACGGGTAGCCGGCCTGAGAGGGTGGACGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGGGGGATGACGGCCTTCGGGTTGTAAACTCCTTTCGCTAGGGACGAAGCTTTTGTGACGGTACCTAGAGAAGAAGCACCGGCTAACTACGTG\n>URS000047804E rRNA from 1 species \nGATCCTGGCTCAGGATGAACGCTGGCGGCATGCTTAACACATGCAAGTCGAACGAAGCCATAGGAAGCTTGCTTTCTTTGAAGCTTAGTGGCGGACGGGTGAGTAACGCGTGAGTAACCTGCCCTCGAGTGGGGAATAACATCGAGAAATCGGTGCTAATACCGCATAACGTCGGAGAACCGCATGATTTTCCGACCAAAGGATTTATTCGCTTGAGGATGGACTCGCGTCCGATTAGCTAGTTGGTGAGGTAACGGCCCACCCAAGGCGACGATCGGTAGCCGAACTGAGAGGTTGATCGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGGCAATGGGCGAAAGCCTGACCCAGCAATGCCGCGTGAAGGATGAAGGTCTTCGGATTGTAAACTTCTTTGATTGGGGAAGAATAAATGACCTACCCAAAGAACAAGTCACGGCTAACTACGTGCC\n>URS000041CA9B rRNA from 1 species 
\nTCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATGACGGCCTTCGGGTTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTGATACGTAGGGTGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGGGCTCGTAGGTGGTTGATCGCGTCGGAAGTGTAATCTTGGGGCTTAACCCTGAGCGTGCTTTCGATACGGGTTGACTTGAGGAAGGTAGGGGAGAATGGAATTCCTGGTGGAGCGGTGGAATGCGCAGATATCAGGAGGAACACCAGTGGCGAAGGCGGTTCTCTGGGCCTTTCCTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGCTTAGATACCCTGGTAGTCCACGCTGTAAACGGTGGGTACTAGGTGTGGGGTCCATTCCACGGGTTCCGTGCCGTAGCTAACGCTTTAAGTACCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGCCCCGCACAAGCGGCGGAGCATGCGGATTAATTCGATGCAACGCGTAGAACCTTACCTGGGTTTGACATGGATCGGGAGTGCTCAGAGATGGGTGTGCCTCTTTTGGGGTCGGTTCACAGGTGGTGCATGCCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTCACTGTTGCCAGCACGTTATGGTGGGGACTCAGTGGAGACCGCCGGGGTCAACTCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGCCCCTTATGTCCAGGGCTTCACGCATGCTACAATGGCTGGTACAGAGAGTGGCGAGCCTGTGAGGGTGAGCGAATCTCGGAAAGCCGGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCTCATGAAGTCGGAGTCGCTAGTAATCGCAGATCAGCAACGCTGCGGTGAATACGTTCCCGGGGCTTGTACACACCGCCCGTCAAGTCATGAAAGTTGGTAACACCCGAAGCCGGTGGCCTAACCGTTGTGGGGGAGCCGTCGAAGGTGGGACTGGTGATTAGGAC\n>URS00016BE8EB rRNA from 1 species \nTACGAAGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCGCGCAGGCGGTCCTTTAAGTCAGGGGTGAAAGCCCAGAGCTCAACTCTGGAACGGCCTTTGAAACTAGAGGACTTGGGTACGGGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGTTACCGACGCTCAGGCGCGACAGCGTGGGGAGCAAACAGG\n>URS000104102D rRNA from 1 species 
\nTACGTAGGGTGCGAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTTGTAGGCGGTCTGTCGCGTCTGCTGTGAAAATCCGGGGCTCAACCCCGGACTTGCAGTGGGGTACGGGCAGACTAGAGTGTGGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCAGGTCTCTGGGCCACTACTG\n>URS0001017A28 rRNA from 1 species \nTACGGAGGGTGCGAGCGTTGTTCGGAATCACTGGGCGTAAAGCGCGTGTAGGCGGCCTTGTAAGTCTGGTGTGAAAGCCCGGGGCTTACCCCCGGAAGTGCACTGGAAACTGCAAGGCTAGAGTACCGGAGAGGAAGGTGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCGGTGGCGAAGGCGGCCTTCTGGACGGATACTGACGCTGAGACGCGAAAGCGTGGGGAGCAAACAGG\n>URS0000908CE3 ncRNA from 1 species \nCTGGTTAATTCCGATAACGAACGAGACTCTGTCCTGCTAACTAGGCGGGTAAACCCGGGTCGGCGTGTGCGCGGCGCTGGCGGTTTCGGCCGTCAGTGTTCGCGTACCCGTCGGCTCGGCCCGGTATCCCCGAACGCGTTCGCCCGTCGTCCACGGCGGTCGTCGGGCGCGGCCGCGCCATCCGCGTCCCGGCGTTCGGCGGGCGTATGTCGGCCGGGGGGCAACCTCCGGTCGGCCTGCGTCCGTCGTGCGTCGGGCTCCGTGGTGAAGCGCGCCGTGTTCGCGGCCGTCGCCGGCGGATCACGATACGTTACTAGGGCTACCGCCGGCTCCCAGGAGCTTAAACTCTTCTTAGAGGGACAGGCGGCGGACGAACATAGCCGCACGAGACTGAGCGATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGAAGGAATCAGCGTGTTTAACAATCCTGGGCCGACAGGCTTCCGGGTAACCCGCTGAACCTCCTTCGTGCTTAGGGATCGTGGCTTGCAATTTTTCCACGTGAACGAGGAATTCCCAGTAAGCGCGAGTCATCAGCTCGCGTTGATTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTACTACCGATTGAACGGTCGCATTGAGGTCTTCGGAGTGGACGCGCGTTATTCGGCCCCCTCGGGGGCTGGGTCGTCGCGCGATCGCGAAGATGACCGAAATCGGCCGTTTAGAGGAAGTAAAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTA\n>URS0001269AD4 rRNA from 1 species \nTACGTAGGTGGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGCGCGCGCAGGCGGTGCGGTAAGTCTGTCGTGAAATCTCCCGGCTCAACTGGGAGGGTGCGGTGGAGACTGCCGGACTGGAGGCACTCAGAGGCCGGTGGAATTCCCGGTGTAGTGGTGAAATGCGTAGAGATCGGGAGGAACACCAGTGGCGAAGGCGGCCCACTGGGCCGGTACTGACGCTGAGGCACGAAGGCGTGGGGAGCGAACGGG\n>URS00004A8CD5 rRNA from 1 species 
\nCCTTGCCAGCCCGCTCAGAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGTATGTGGTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCCGGAGACCCTTAGGAAACTAGGGGGTGCTTCCATCTGGAAGAATCTGGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGCCTTTAGTTGCCAGCAGTTCGGCTGGGCACTCTAAAGGGACTGCCGGTGTTAAACCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCTTTATGACCAGGGCTACACACGTACTACAATGGCCGATACAAAGGGCAGCGACACTGCGAGGTGAAGCCAATCCCGTAAAATCGGTCTCAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTTGGAATCGCTAGTAATCGTGGATCAGCATGCCACGGTGAATACGTTCCCGGGCCTT\n>URS000236C264 lncRNA from 1 species \nCTGCATCCTTCCAAACAGAGAAATAGGATGAGAATCAGTATGTCTGAACTATAGGCTAAAGCGGCATGAGGTTCAGGTGCATCAACATGATTCAGTTTCCATGACCAGATTGCTCATTACAAAAATCAAAGCAGAAATATATTCCCTACACTAAAACAGAGTAAAGAGTTAGAAATATCATGGTCTCCAAGGCCACAATCCAGTTATGCACTCAAAAAGTCCAATAACGTCCAGGCTAGCAATTAAACATGCTAGCTTTCAAGTTCAACGATTCAAAGTTTATTGATTTATAACGAATCTTGAGAAGTTCCAAAGGAAGCATGCAGTGCATCATCCTAATCATTAATATCCTAAAATAAGGCTTAAATCAACAACAGCTCCAAGTATGCAGGTATCAAGAATCACCTTTGACAGCTAAATACAAGACATTTCATCTCTAATTGGCAGGTATGCTGGTAAGCTATTACAGAATAACCGATGAACAGGGTAACTATTATTTTGCTTCTTAACTGCCAGGGGGAACCAACTGAAGCATGGCATCTACATAATGTCATGTCTTGTGCCTGCTTCAGTTGCGGATCACTGAAGTAAAAATTCTTTAACCTAAATTAATAAATATACTACCAGAAGCAAGAGAGTCAAAAATGAAATGGATTACTAAGTATTACCAATCACATACATTTCCAACAGTCATATCAGAAGCTTCAAATTAACTAATAGATTTAAGATTTCGAATATCTCCCTCATTCCTTTATAATATTTTGTAGGTCACTTGGAAAGAAACGAATAGGAGGGTTTTGATGGGCTTTATTTGGCCTTTTGTAGATATGGATCATTGGCTCCAAAATTCTCTGTTTTTTTTGCTTAAAGATCATCCTCTCTCCCCTAAGTAGGATCGTGAAGAGCTTGATATTTTGACCAGCTTGCAACCTATGGTTTCGTATATGAATGCCACTTCCTTGCTGTCTTGTTAATATACTTAAAAAAATAATAATAAATTTTTAACCTGCCTTGAGCAGGCTTAAATTTAAGGATTATAACAGCAAGAACTTATTTATTATTTTTAAATATTGATATTAACAATGGTACCAATGGGGCACCACCCATATATAATATATTTACATGTCAATTAAAACTTCAATGACATTTCCAAAATTTTCCGGCCTATTAATGTCATGACCCAAAACCAAGAAACCAAAAATATGAATTCATCTATCTCTAATATTAACAAACTCCCTTTTTATTTCTTCAAATGCTCTAACATTCCTTTCTTTCCACACGACCCAAAAAATAGATAAAGGAATCAGAAGAAGATAAGTTTTCTTTGTACATAAGCCCGCCCAAGCCCACAACTCATCTCTCGCCAACCCTGCAATCACCCAATTGATCCCTAGGAGACCGTACACCATAGACCAAATACCATACACCATTGGGCACCATAGCAAAATA
TGGTTACATGATTCTGCATCCATCTTAAATAAAAGCAGTGATTAACTAGAATTTTGCCCCTCCACCTCAGCCTATCAATAGTTAGGATGCATTCTCTACTCATTTCACAAGCAACCAAAAAACAATTGTTGGTGGTGCCTTCGTCTTCCATATCTATTTAACTGGATAATGGACAGTTTCACTCCTTTTTCCCCTAGTCAAATGCTTGTAGAAGGTCTTTACAGAGTAATCTTCTTGTTTCCTCAATTTCCACATCAACTGGTCCCTTCGATCATCTAATTGAATTTGAGATAACAGGAGTAATAAGGCTTCATACTCTTCGATAATTATTGAGATTTCTTGTGACGTTCATATTCCACCCCCTACTCCCGCTCGCTGTCAAGTGAGCCTCCTCCGCCACCATGTTCTTTGATGACACAATGGCGAAGATCGCTGGAAACTGATCTTTCAGCCTATCCTCACCAACCCATTCATTCTTTCAAAAATGAATTCTATCGCCCTTATCCACCTTCCTCTTTGTGCATTCAAGAAATTTGTGTTTCTCCACACTAATTTTCTTCTATTCACATCCCTGACGTCCTCACCCACTTCCCTCACACCCCACAGAGCCTCCACAACAAGAACTTATTTATAAGTTGCGAGTGAAATATCAACACCACCTTCCATACACTAAATTATTATTATTGGACATTTGCACAAAGAAGTACTCAAATTAATTTACCATGAAAAGGAAATAATGCTCATACAGTATAATGGCCATTAATAAATGCTATTTTAGAACTCATAAAAGCCACTTAGTGTCTAAAAATTGAACAAATTCAGCTTTCAGATATAAAAGAATTAGATATCCCAGCAAAAAGAGAGAATTTCATGTCATATTATTGTTAGAAACTTGGGACTTCTTGCAAGCATTTTAGCAAATATGAAAAAAATCACAAAAGAACTTTGCCTACTACCATCCTCAGTCTCATCAAACTCCATCCTAATGCGATATACATGACTATGTTGCTTCGGTTTGACCTTGTGCAAAGCCCTAGGCTCTCTATGGTTTTTGCTAAAAAAATGTGACCTGTAATTCTGTGTACAATCATCAAACAATAACTGCACTAAATATCATGCAAATACAAAAAGTTGTTTCCTATCAAGTATTTCACAGTTTCTCTCTCAAAAAGTTTTCCATAGTTTTTTATCTCATGTCATATCTCATTTGTGTAGCATGCATACATACATAATAGTCATAACTGCATGTAAAGAATTGACATGCTAGATACATGACTGAAATAACTTACTGAGAAAGCCAACATGAGAGAAAAACTAAGATGAAGCAAAGCAAAATATCCAGTAAATTTTACTACATCCCATACCTTATACTGGTCATGCTATTAATATGTAGGCAAGTAAAACGACAAGACCTAAGCATGCTTCTTAAAACCAGCTGAGAAAAATTAGACAAAATCTAGCAGAAATTATAATAGATCTATCTCCAAATTGTAGTTTCCTGTTTATGGATGCGAATCAAGAAAAATAAATGCCCAAACTATCATAATGACAAGCAAATGCAAGAAAACAAGTTCACAATACAAAATACAGAAGTACAGATCTATGATATTTCTTTTAAAGATAGGGAGGAAGAAAATATCACAAACAATGTAGAAG\n>URS000135D842 rRNA from 1 species 
\nGACGAACGCTGGCGGCGCGCTTAACACATGCAAGTCGAGCGAAGCGGCGGACGGGAGAGTAACACATGAGTAACCTGCCTCAGACATTGGGATAGCCGCGGGAAACCGGGATTAATAGCAAATGGTCTAAGATGGCCTCGCGTCTCATTAGCTCGTTGGTGAGGTAACGGCCCACCAAGGCGACGATGGGTAGTCGGTCTCAGAGGGTGGACGGCCACATTGGAACTGGGAAGCGGTCCAGACTCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGAGGGAGCTATGAAGATTCGATGCCGCGTGAACGAAGAAGGCTTTCGAGTCGTAAAGTTCTTTTATATGGGCAGTGGTACCATAAGACAAAGGCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATAC\n>URS0002034EF4 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTGTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATGATGGCCTTCGGGTTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTG\n>URS00025BECD2 rRNA from 1 species \nATGCGGGTGGTTGGACTTGTGGTCATGGAAAGCGCTAGGAAAATACCAAGCTCTAGGGTCACTAACATTAAAGAGGGAGATGCCAACACCCGCTATTTTCACTCGAAGATCAATGGAATTCGGTGGAAAATCCTAATTCACCGCCTTAAGCATGGGAGTGGCGGGGTAACGGATCACGACTACAAGAAGGCCATTATCCATGCTCACTTCTCAGCTATGATGAAAAAGAGCAACCCACGCGCTAAGAGCGTCAATTGGGCTTCCATTCCTGCTGCCGACCATGACCTATCCCATCTTGGGGACCCCATCATGGAGGAGATCAAGGCTGCGATTTTTGCCCTCCCTAGTGACAAGGCTCACGGGCCTGACGAATTCACCGGGAAATTCTGCAAAGAATATTGGGATATTATCAAAGATGGCATCATGCTTGTGATCAATAACTTCTCGGGCCTCCACACGAAAAAAATTCACTGGCTAAACTCGACTAATCTTGCTCTCATCCACAAGAAAGATGGCGTCGAGGACATCACTAACTTAGGCATATTAGGCCCAAGGAGCTTGGAGGATCCATGCGCACTGGCGTGCACTTCCCCTGTTCAGGGCGCCATGACGCAGCCTTTAAAGGAGCAACCGGTAGTCAAGGACGACCTGGTTGGCCACGGCGTCACCGGTGGAGGACACTCGGAAGTTGATGGTGCGGATGGCGGGTGGGGAGGGGGGGTCACCGACGCCGGAGAAGAGTCTGAACCTAGAGGAATGGCGGGGGCAGCGGCAAGGCAATGA\n>URS0002234228 rRNA from 1 species 
\nGGTTAAGTTGTTAAGGGCGCACGGTGGATGCCTTGGCACTAGGAGCCGATGAAGGACGGTACTAACACCGATATGCTTCGGGGAGCTGTAAGTAAGCTTTGATCCGGAGATTTCCGAATGGGGAAACCCACTGCTCGTAATGGAGTAGTATCTTCACCTGAATTCATAGGGTGATGATGGCAGACCCGGGGAACTGAAACATCTAAGTACCCGGAGGAAGAGAAAGCAAACGCGATTTCCCAAGTAGCGGCGAGCGAAACGGAAGAAGCCCAAACCAAGAGGCTTGCCTCTTGGGGTTGTAGGACACTC\n>URS0000D4A060 sRNA from 1 species \nCTCCTGTCTGCAGGATTTACGCGCACGTTGGAACCGAAGAGAGCTCTGTTGTTGCAATGTTCAGCCCACAAGACCTTACTGGTGAAGGAATGGGACAAGACCCATCTTTATGCAAAGCCAGCGTTACAGTAATGTCCCAGCATCTCATAATCTATCCTGGGGAATTCAGCTGCCTCCCAGGGTGAATACAGGTATTCCTGATGACAGTCTGCCTTCTATCTTACAGAGCAGCTTGTTGCTATATACCATTGAAAAGCCTTCAGAGCTGAGAGGTTAGTTGATATTTTTTGTTCCTTACAGCTTATGCCACCAAGTAGGCAGTTTCTATGATGAATCAAACTAGCTCACTATGACCGACAGTGAAAATACATGAACACCTGAGAAACTGGAGAACGCAGGGAGTGGGGGGTAACCATGTCTGAGGAATCTTTCACCCACAGCTTTGTTTTTCTCTAGGTACTACTAACCAATAACCTGCTTGGCTCAAAGGGCCAGCACCTTCTCTCTAAAGCCCAAGAGGAGTTTGAGGTAAA\n>URS0001621A90 rRNA from 1 species \nATACAGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGCTTGGTCAGTCGGATGTGAAAGCCCTGGGCTCAACCTGGGAATTGCATTCGATACTGCCAAGCTAGAGTATGGGAGAGGGAAGTGGAATTTCCGGTGTAGCGGTGAAATGCGTAGATATCGGAAAGAACACCAGTGGCGAAGGCGACTTCCTGGCCCAATACTGACGCTGAGGTGGGAAAGCGTGGGGAGCGAACAGGATTAGAAACCCTAGTAGTCC\n>URS000183796A rRNA from 1 species \nCACGTAGGGTGCAAGCGTTGTCCGGAATCATTGGGCGTAAAGAGCTCGTAGGCGGCTTAGTAAGTCGGGTGTGAAAACCCCAGCTCAACCTGGGGACGCCACCCGATACTGCTATAGCTAGAGTCCAGTAGGGGAGTGTGGAATTCCCAGTGTAGCGGTGAAATGCGCAGATATTGGGAGGAACACCAGCGGCGAAGGCGGCACTCTGGGCTGGAACGTGACGCTGAGGAGCGAAAGCGTGGGTAGCAAACAGG\n>URS0001FEE94D rRNA from 1 species \nGATGAACGCTGACAGAATGCTTAACACATGCAAGTCTACTTGAACTTCGGTTTGGGTGGCGGACGGGTGAGTAACGCGTACAGAACTTGCCTCACAGTTAGGGACAACATTTGGAAACGAATGCTAATACCTGATATTATGATTTTAGGGCATCCTAGGATTATGAAAGCTATATGTGCTGTGAGAGAGCTTTGCGTCCCATTAGCTAGTTGGAGAGGTAACGGCTCACCAAGGCGATGATGGGTAGCCGGCCTGAGAGGGTGAACGGCCACAAGGGGACTGAGACACGGCCCTTACGCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGACCAAAAGTCTGATCAAGCAATTCTGTGTGCACGATGACGTTTTTCGGAATGTAAAGTGCTTTCAGTTGGGAAGAAAAAAATGACGGTACCAACAGAAGAGGTGACGGCTAAATACGTG\n>URS0001E248AA 
rRNA from 1 species \nAACGAACGCTGGCGGCATGCCTAACACATGCCAGTCGAACGAGACCTTCGGGTCTAGTGGCGCACGGGTGCGTAACGCGTGGGAACCTGCCCTTAGGTTCGGAATAACTCCCCGAAAGGGGTGCTAATACCGGATAATGTCTTCGGACCAAAGATTTATCGTCTTTGGATGGGCCCGCGTTGGATTAGCTAGTTGGTAGGGTAAAAGCCTACCAAGGCGACGATCCATAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCAATGCCGCGTGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTTACCCGGGATGATAATGACAGTACCGGGAGAATAAGCTCCGGCTAACTCCGTG\n>URS00001C5077 rRNA from 1 species \nAGAGTGGGGGATAACGCAGCGAAAGCTGTGCTAATACCGCATACGATCTAAGGATGAAAGCAGGGGACCGCAAGGCCTCGCGCTCATGGAGCGGCCGATGTCAGATTAGGTAGTTGGTGGGATAAAAGCTTACCAAGCCGACGATCTGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGAAA\n>URS000002F2FF rRNA from 1 species \nATTGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGGTAACAGGGGGCTTCGGCCCGCTGACGAGTGGCGGACGGGTGAGTAATACGTAGGAATCTACCTTTTAGTGGGGGATAAACTTAGGGAAACTTAAGCTAATACCGCATAATCACTACGGTGGAAAGCAGGGGCTCGCAAGACCTTGCGCTGATAGATGAGCCTACGTCGGATTAGCTTGTTGGTAGGGTAAAGGCCTACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGCAACCCTGATCCAGCAATGCCGCGTGTGTGAAGAAGGCC\n>URS0000AD69CA ncRNA from 1 species \nGACCGGAAGGCCGTGTGGACTGTATAGAAGAGAGAATGTTGGCATGAGTAGCGAGAGGTGAGTGAGAATCTCACCCATCGAAAGCCTAAGGTTTCCTGAGGAAGGCTCGTCCACTCAGGGTAAGTCGGGACCTAAGCCGAGGCCGAAAGGCGTAGGCGATGGACAACTGGTTGATATTCCAGTACCACCTTTAAACGTTTGAGAGATGGGGTGACACAGAAGGATAGACTATCGCACTGATGGAATAGT\n>URS00025CD331 rRNA from 1 species 
\nATGGCCAATGGATTTTACACTTCGTCATCGGCCTACAAGGTGCAATTCGAGGGGACTGTGGCCTCCAACATGACACGGGTCGTTTGGGGCAATTGGGGGCCTCCCAAGTGCAAATTATTTGCGTGGCTTGTCATCATGAATCGGGTTTGGACGGCGGATTGGCTTCGGAGGAGAGGATGGCCAAATTATAACTTATGTCAACTCTGTAAGAGGGAGCCTGAGACGGCGGCGCACTTCCTCTTGCATTGCAGGTTCTCCACACGCATTTGGAATGCGGTTAAGTGTTGGCTCGTCGTTCAGGAGTTGGATATCGCCACCTGGGCTGGGATCCCCACGGTCAAGCAATGGTGGGAGAAGACCGTCCTTGGACGAGGTCACAGGAGGAAGGCCGTGTCCTCTCTTCTAATGCTTGTATCATGGGAGCTGTGGAACGAGAGGAATGCGAGGGTGTTCCAAAAGAAAGCCACGATGCCGACCGTTGTGGTCAATCGTATCAAGGCGGAGTCTAGAAATTGGGTTCTGGCCGGGGCAAAACATATGGGATATTTGATGCCGCGAGAGTAG\n>URS0001ED03C2 misc_RNA from 1 species \nCAAGAAGCCGAAAGGCTACTTAAAACCATCGCGAACTTATCCAAGTTGCTTCGGCGGCGCGGCTCCCCTCACGGGGGACCGCAGCCCCCGCCTCTCAGGAGGTAAGGGGCAGCCGCCGGAGGTACGAAACTCTGTATTATAGTGGTATCTCTGAGTATAAAATAAATAAGTTA\n>URS0001607725 rRNA from 1 species \nGCAAGTCGAGCGAGAAGCCATCCTCGGGTGGTAAAGAGCGGCGAACGGGTGAGTAACGCGTAGGTATCTACCTAGTAGTGGGGAATAACCATTGGAAACGATGGCTAAAACCGAACGCCCTGAGGGGGAAAACTGAGGTGCTATTAGAGGAGCCTGCGTTAGATTAGCTAGTTGGTGAGGTAATGGCTCACCAAGGCGACGATCTATAGCTGGTTTGAGAGGATGATC\n>URS0001D85733 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCTGCTTTCCCTTGTGGATTGCGGGTACTCGAGTGGCGAACGGGTGAGTAACACGTGAGTGATCTGCCCCCAACTTGGGTATAAGCCTGGGAAACTGGGTCTAATTCCCGATAGGACTGCAGGGTGGTGCCTGTGGTGGAAAACGATTTTCTAGTGGTTGGGGATGAGCTCGCGGCCTATCAGCTTGTTGGTGGGGTAATGGCCTACCAAGGCGGCGACGGGTAGCCGGCCTGAGAGGGTGGACGGCCACATTGGGACTGGGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAGTATTGCACAATGGGCGGAAGCCTGATGCAGCGACGCCGCGGGGGGGATGACGGCCTTCGGGTTGTAAACTCCTTTCGACCGCGAGGAAGCCACCTGGTTGGAAGGGTGGTGACGGTAGTGGTAGAAGAAGCACCGGCTAACTACGTG\n>URS00025A5E17 rRNA from 1 species 
\nATGGGTTTCCGTGACATCCACTGTTTCAACCTGGCTCTGCTTGCAAAACAAGCATGGCGTCTCCTTGATAATCCTGACTCCTTGTGTGCTACTATTCTAAGGGCCAAGTACTATCCTAATGGTGATTTGCTGAACTCCAAGCCAAAGCATGGTGCTTCCTTCACCTGGCAAAGCATTATGGCAGGCATCACTACTCTTAAGCGAGGTTATATTTGGCGAGTGGGGGATGGACATAACATCAATATTTGGGAAGATGCCTGGATCCCAAATTGTGCCTCTAGGAAGATTATGACACCTAGGGGGGGGCATTTGTTATCAAAAGTCGTAGATTTAATTGACCCAGTCTCCAATAATTGGGATGAGGACCTGATTAGACAAACTATGTGGACCGTTGACGTACAACGAATTCTTTCAATCGCAATTTCGCAACATAATATGACGGATTTTATTGCCTGGAGTTATACGAAAAATGGTATGTTTTCGGTACGGTCTGCTTATTTAGTGGAGTGGAACTATCAATATGGGAGCAAGCTAAAATATTCCAATGGGATGGGACGGAGCACACCTAATCCTATATGGTGTCAGATATGGAAGTTGTCTTGTCTGGCTAAAGTCAATTTTTTTATGGCGGACACTACATGGCACTCTCCCATGCCGGGCAACACTCACTAA\n>URS00017A11C2 rRNA from 1 species \nTACGGAGGGTGCGAGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGCTTTTTAAGGGTGCGGTGAAAGCCCGGGGCTTAACCCCGGGTCGGCCGTGCCGACTGAAAAGCTGGAGCACTGTAGAGGCAGGTGGAATTCCGGGTGTAGCGGTGGAATGCGTAGAGATCCGGAAGAACACCAGTGGCGAAGGCGGCCTGCTGGG\n>URS00012833E7 rRNA from 1 species \nAGCGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACGGACCCTTCGGGGTTAGTGGCGGACGGGTGAGTAACACGTGGGAACGTGCCTTTTGGTTCGGAATAGCTCCTGGAAAGGGGTGGGAATGCCGAATGTGCCCTTCGGGGGAACGATTTAACGCCTTTAGAGCGGCCCGCGCCTGATTAGCTGGTGGGTTGGGGTAATGGCCCACCAAGGCTACGATCAGTAGCTGGTCTGAGAGGATGACCAGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCCGCAGTGGGGAATCTTGCGAAATGGGCGAAAGCCTGACGCAGCCATGCCGCGTGGATGATGAAGGTCTTAGGATTGTAATATCCTTTCACCGGTGAAGATAATGACTGTAGCCGGAGAAGAAGCCCCGGCTAACTTCGTGCCAGCCGCCGCGGTAAGAC\n>URS0001D3FFBA rRNA from 1 species \nAGTGAACGCTGGCGGCATGCTTAACACATGCAAGTCGCACGGGCAGCAATGTCAGTGGCGGACGGGTGAGTAACACGTAGGAATGTGTCTTGAGGTGGGGGACAACCCTGGGAAACTAGGGCTAATACCGCATATGTCCTGAGGGACAAAGCAGCGATGCGCCTTGAGAGTAGCCTGCGTCCGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCGGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGGGTGAAGAAGGTCTTCGGATCGTAAAGCCCTTTCGGCGGGGACGATGATGACGGTACCCGCAGAAGAAGCCCTGGCTAACTTCGTG\n>URS0000E6A59F rRNA from 1 species 
\nATCTACAGCCATACCACCCAGAAGGCTCCCAATCTCGTCTGATCTTGAAAGCTGAGCAGGGTTGGGCCTGGTTAATACTTGGATGGTAGAAAACAGTGTGAAGTCGAGG\n>URS00000EB6A6 rRNA from 1 species \nCTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCAGTGAGGAAGGTGGGTATGTTAATAGCATACTCATTTGACGTTAGCTGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGCATGCAGGTGGTTTGTTAAGTCAGATGTGAAAGCCCGGGGCTCAACCTCGGAATTGCATTTGAAACTGGCAAACTAGAGTACTGTAGAGGGGGTAGAATTTCAGGTGTAGCGGTGAAATGCGTAGAGATCTGAAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACAGATACTGACACTCAGATGCGAAAGCGTGGGGAGCAAACAGGATTAGATAACCTGGTAG\n>URS000167F6B8 rRNA from 1 species \nTACAGAGGTGGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGCCTTCTAAGTCAGACGTGAAATCCCCCGGCTTAACCTGGGAACTGCGTCTGATACTGGGAGGCTAGAGTGCGGGAGAGGGATGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAATACCGGTGGCGAAGGCGGCATCCTGGACCGGCATTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS0000D6C981 ncRNA from 1 species \nAAAGGGCCAAAGGCGCCCGGACGAGGTGCGCCGTACCCGGCCAGCGACAAGACGGCGTAAG\n>URS0000E05209 SRP_RNA from 1 species \nGCCATGAGCGATGTCACCCACCTATAATCCAGCTACCAGGGAAGCTGAGCCTGGTAGATCTTTAGTTTAAGAGTTCTGAGCTTTAGTGAGCCATGTTGATGGGATGTTCACACTAAGTTTGGCATCAGTGTGGTGAGCCCCTGGAATTAGAGGACCACTAGGTTGTCTAAGAAGGGTTACAAATGGGAGCAGGTTAGAGCTCCCAGACCACTTAGTAGTGGGATCAGGCCTGTGAGCAGCCCCTGTACCAGTTCCAGCTCAGAGTGAGATGGAGAGACCCAGTCTTT\n>URS0000BAE8CB rRNA from 1 species \nCCTACGGGACGCAGCAGTGAGGAATATTGGTCAATGGCCGGGAGGCTGAACCAGCCAAGTCGCGTGAGGGAAGACGGCCCTACGGGTTGTAAACCTCTTTTGTCAGGGAGCAAGGTGCAGGTCGGGACCTGCTGTGAGAGTACCTGAAGAAAAAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAAAACGTAGGGTGCAAGCGTTGTCCGGAATTACTGGGTGTAAAGGGAGCGCAGGCGGATTGACAAGTTGGGAGTGAAAACTACGGGCTCAACCCGTAACCTGCTTTCAAAACTGTCAGT\n>URS00000F1EB4 rRNA from 1 species 
\nGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGAACCTTCGGGTTAGTGGCGGACGGGTGAGTAACGCGTGAGAATCTGCCCTCAGGAGGGGGATAACGGTTGGAAACGACCGCTAATACCCCATATGCCGCGAGGTGAAATGAATTTCGCCTGAGGATGAGCTCGCGTCTGATTAGTTAGTTGGTGGGGTAAAGGCCTACCAAGACATCGATCAGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGGGATGAAGGCCTCTGGGCTGTAAACCTCTTTTATCAAGGAAGAAGATCTGACGGTACTTGATGAATAAGCCACGGCTAATTCCGTGCCAGCAGCCGCGGTAATACGGGAGTGGCAAGCGTTATCCGGAATTATTGGGCTTAAAGCGTCCGCAGGCGGTCTGTCAAGTCTGCTGTTAAAGCGTGGAGCCTAACTCCATTTCGGCAGTGGAAACTGACAGACTA\n>URS0000D30CB5 rRNA from 1 species \nGGATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGGGTGAAGAAGGCCCTAGGGTTGTAAACCCCTTTCAGCGGGGAAGATAATGACGGTACCCGCAGAAGAAGCCCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGACCTGCAAGTCGGGGGTGAAAGCCCGAGGCTCAACCTCGGAACTGCCTTCGATACTGCGGGTCTCGAGTCCGGGAGAGGTGAGTGGAATTCCTAGTGTAGAGGTGAAATTCGTAGATATTAGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGGTACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAA\n>URS00003ED92D rRNA from 1 species \nAACTTCTGAATGTTGACCTCGGATCAGGTAGGAATACCCGCTGAACTTAAGCATATCAATAAGCGGAGGAAAAGAAACCAACAGGGATTGCCCTAGTAACGGCGAGTGAAGCGGCAACAGCTCAAATTTGAAATCTGGCTCTCGGGCCCGAGTTGTAATTTGTAGAGGATACTTTTGATGCGGTGCCTTCCGAGTTCCCTGGAACGGGACGCCATAGAGGGTGAGAGCCCCGTCTGGTTGGATGCCAAATCTCTGTAAAGTTCCTTCAACGAGTCGAGTAGTTTGGGAATGCTGCTCTAAATGGGAGGTATATGTCTTCTAAAGCTAAATACCGGCCAGAGACCGATAGCGCACAAGTAGAGTGATCGAAAGATGAAAAGCACTTTGAAAAGAGAGTTAAAAAGTACGTGAAATTGTTGAAAGGGAAGCGTTTATGACCAGACTTGGGCTTGGTTAATCATCTGGGGTTCTCCCCAGTGCACTTTTCCAGTCCAGGCCAGCATCAGTTTTCCCCGGGGGATAAAGGCGGCGGGAATGTGGCTCTCTTCGGGGAGTGTTATAGCCCACCGTGTAATACCCTGGGGGGGACTGAGGTTCGCGCATCTGCAAGGATGCTGGCGTAATGGTCATCAACGACCCGTCTTGAAACACGGACCAAGG\n>URS00001448B3 rRNA from 1 species 
\nAACGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGCCCAGCAATGGGAGCGGCAGACGGGTGAGTAACACGTGGGAACCTTCCCTATAGTACGGAATAGCCCAGGGAAACTTGGAGTAATACCGCATACGCCCGAGAGGGGAAAGATTTATCGCTATAGGATGGGCCCGCGTAGGATTAGCTAGTTGGTGAGGTAATGGCTCACCAAGGCGACGATCCTTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGAGTGATGAAGGCCTTAGGTGTAAGCTCTTTGCCGGGGACGATAATGACGGTACCCGGAGAATAAGCCCGGCTAACTTCGTGCCAGCAGCCGCGGTAAT\n>URS000098BB64 pre_miRNA from 1 species \nTTTTTAGTATCAGTATGTCCCATACAGTATTGGGGACATACTGATGCTAAAA\n>URS0001061001 rRNA from 1 species \nTACGTAGGGGGCAAGCGTTGTCCGGATTCATTGGGCGTAAAGAGCGTGTAGGCGGCCAGGTAGGTCGGTTGTGAAAACTGGAGGCTCAACCTTCAGAGGTCGACCGAAATCATCTGGCTAGAGTCCGGGAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAAGCGGCTCTCTGGAACGGTACTGACGCTGAGACGCGAAAGCGTGGGGAGCGAACAGG\n>URS0000C64DF9 hammerhead_ribozyme from 1 species \nATCCAGCTGACGAGTCCCAAATAGGACGTGACGCGCGTCGTGTAT\n>URS000215D057 rRNA from 1 species \nTTAAGCGACTAAGCGTACACGGTGGATGCCCTGGCAGTCAGAGGCGATGAAGGACGTGCTAATCTGCGATAAGCGTCGGTAAGGTGATATGAACCGTTATAACCGGCGATTTCCGAATGGGGAAACCCAGTGTGTTTCGACACACTATCATTAACTGAATCCATAGGTTAATGAGGCGAACCGGGGGAACTGAAACATCTAAGTACCCCGAGGAAAAGAAATCAACCGAGATTCCCCCAGTAGCGGCGAGCGAACGGGGAGCAGCCCAGAGCCTGAATCAGTGTGTGTGTTAGTGGAAGCGTCTGGAAAGGCGCGCGATACAGGGTGACAGCCCCGTACACAAAAATGCACATGCTGTGAGCTCGATGAGTAGGGCGGGACACGTGGTATCCTGTCTGAATATGGGGGGACCATCCTCCAAGGCTAAATACTCCTGACTGACCGATAGTGAACCAGTACCGTGAGGGAAAGGCGAAAAGAACCCCGGCGAGGGGAGTGAAAAAGAACCTGAAACCGTGTACGTACAAGCAGTGGGAGCACGCTTAGGCGTGTGACTGCGTACCTTTTGTATAATGGGTCAGCGACTTATATTCTGTAGCAAGGTTAACCGAATAGGGGAGCCGAAGGGAAACCGAGTCTTAACTGGGCGTTAAGTTGCAGGGTATAGACCCGAAACCCGGTGATCTAGCCATGGGCAGGTTGAAGGTTGGGTAACACTAACTGGAGGACCGAACCGACTAATGTTGAAAAATTAGCGGATGACTTGTGGCTGGGGGTGAAAGGCCAATCAAACCGGGAGATAGCTGGTTCTCCCCGAAAGCTATTTAGGTAGCGCCTCGTGAATTCATCTCCGGGGGTAGAGCACTGTTTCGGCAAGGGGGTCATCCCGACTTACCAACCCGATGCAAACTGCGAATACCGGAGAATGTTATCACGGGAGACACACGGCGGGTGCTAACGTCCGTCGTGAAGAGGGAAACAACCCAGACCGCCAGCTAAGGTCCCAAAGTCATGGTTAAGTGGGAAACG
ATGTGGGAAGGCCCAGACAGCCAGGATGTTGGCTTAGAAGCAGCCATCATTTAAAGAAAGCGTAATAGCTCACTGGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTAAACCATGCACCGAAGCTGCGGCAGCGACACTATGTGTTGTTGGGTAGGGGAGCGTTCTGTAAGCCTGTGAAGGTGTGCTGTGAGGCATGCTGGAGGTATCAGAAGTGCGAATGCTGACATAAGTAACGATAAAGCGGGTGAAAAGCCCGCTCGCCGGAAGACCAAGGGTTCCTGTCCAACGTTAATCGGGGCAGGGTGAGTCGACCCCTAAGGCGAGGCCGAAAGGCGTAGTCGATGGGAAACAGGTTAATATTCCTGTACTTGGTGTTACTGCGAAGGGGGGACGGAGAAGGCTATGTTGGCCGGGCGACGGTTGTCCCGGTTTAAGCGTGTAGGCTGGTTTTCCAGGCAAATCCGGAAAATCAAGGCTGAGGCGTGATGACGAGGCACTACGGTGCTGAAGCAACAAATGCCCTGCTTCCAGGAAAAGCCTCTAAGCATCAGGTAACATCAAATCGTACCCCAAACCGACACAGGTGGTCAGGTAGAGAATACCAAGGCGCTTGAGAGAACTCGGGTGAAGGAACTAGGCAAAATGGTGCCGTAACTTCGGGAGAAGGCACGCTGATATGTAGGTGAAGTCCCTCGCGGATGGAGCTGAAATCAGTCGAAGATACCAGCTGGCTGCAACTGTTTATTAAAAACACAGCACTGTGCAAACACGAAAGTGGACGTATACGGTGTGACGCCTGCCCGGTGCCGGAAGGTTAATTGATGGGGTTAGCCGCAAGGCGAAGCTCTTGATCGAAGCCCCGGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGCGTAATGATGGCCAGGCTGTCTCCACCCGAGACTCAGTGAAATTGAACTCGCTGTGAAGATGCAGTGTACCCGCGGCAAGACGGAAAGACCCCGTGAACCTTTACTATAGCTTGACACTGAACATTGAGCCTTGATGTGTAGGATAGGTGGGAGGCTTAGAAGTGTGGACGCCAGTCTGCATGGAGCCGACCTTGAAATACCACCCTTTAATGTTTGATGTTCTAACGTTGACCCGTAATCCGGGTTGCGGACAGTGTCTGGTGGGTAGTTTGACTGGGGCGGTCTCCTCCTAAAGAGTAACGGAGGAGCACGAAGGTTGGCTAATCCTGGTCGGACATCAGGAGGTTAGTGCAATGGCATAAGCCAGCTTGACTGCGAGCGTGACGGCGCGAGCAGGTGCGAAAGCAGGTCATAGTGATCCGGTGGTTCTGAATGGAAGGGCCATCGCTCAACGGATAAAAGGTACTCCGGGGATAACAGGCTGATACCGCCCAAGAGTTCATATCGACGGCGGTGTTTGGCACCTCGATGTCGGCTCATCACATCCTGGGGCTGAAGTAGGTCCCAAGGGTATGGCTGTTCGCCATTTAAAGTGGTACGCGAGCTGGGTTTAGAACGTCGTGAGACAGTTCGGTCCCTATCTGCCGTGGGCGCTGGAGAACTGAGGGGGGCTGCTCCTAGTACGAGAGGACCGGAGTGGACGCATCACTGGTGTTCGGGTTGTCATGCCAATGGCACTGCCCGGTAGCTAAATGCGGAAGAGATAAGTGCTGAAAGCATCTAAGCACGAAACTTGCCCCGAGATGAGTTCTCCCTGACCCTTTAAGGGTCCTGAAGGAACGTTGAAGACGACGACGTTGATAGGCCGGGTGTGTAAGCGCAGCGATGCGTTGAGCTAACCGGTACTAATGAACCGTGAGGCTTAACCTT\n>URS00016AAB81 rRNA from 1 species 
\nATTGAACGCTGGCGGCAGGCTTAACACATGCCAGTCGAGCGAGCGTCGGACGGGTGAGTAATGTCTGGGAAACTGCCTGATGGAGGGGGATAACTACTGGAAACGGTCGCTAATACCGCATTCCATCCTATGTGCCCATATGGGATTAGCTAGTAGGTGGGGTAATGGCTAACCTAGGCGACGCTCCCTAGGTGGTCTGAGAGGATGACCAGCGAGACTGGAACTGAGAGACGGACGAGACTAGTACGGGAGGCAGCAGTGGGGAATAGTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCGTTCGGGTTGTAAAGAACGTTCAGCGAGGAGGCGTTACTCGCAGAAGAAGCAACGGCTAACTCCGTGCCAGCAGCAGCGGTAATTC\n>URS00018C3972 rRNA from 1 species \nTACGTAGGGGGCTAGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGCGCAGGCGGTTAATTAAGTTGGGTGTTTAAGCCCGGGGCTCAACCCCGGTTCGCATCCAAAACTGGTTGACTTGAGTGTAGGAGAGGAAAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGCCTATAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGG\n>URS00007617FE rRNA from 1 species \nTACGTAGGGGGCGAGCGTTGTCCGGAATTACTGGGCGTAAAGAGAGCGTAGGCGGCACTACAAGTCTCATGTGAAATACCCGGGCTTAACTTGGGGGTTGCATGGGAAACTGTAGAGCTTGAGTACAGGAGAGGCAAGCGGAATTCCTAGTGTAGCGGTGAAATGCATAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTACTGGACGGCAACTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGG\n>URS0000A668E1 tRNA from 1 species \nTCTAAAATGACAGATGAATGTATAAGATTTAAGCTCTTACCATGGAGATTTATTCTTCTTTTAGAATC\n>URS0001CAF6B7 misc_RNA from 1 species \nGATGAAGAACGCAGCGAAATGCGATAAGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGACCGCCAGTATTCTGGCGGGCATGCCTGTTCGAGCGTCATTTCAACCATCAAGCCCCCGGCTTGTGTTGGGGACCTGCGGCTGCCGCAGGCCCTGAAAAGCAGTGGCGGGCTCGCTGTCACACCGAGCGTAGTAGCATACATCTCGCTCTGGGCGTGCTGCGGGTTCCGGCCGTTAAACCACCTTCATAACCCAAGGTTGACCTCGGATCAGGTAGGAAGACCCGCTGAACTTAAGCATATCAATAAGCGGAGGA\n>URS0001A89386 rRNA from 1 species 
\nTAGAATTAGGGTTCGATTTCGGAGAGGGAGCATGAGAAACGGCTACCACATCTAAGGAAGGCAGCAGGCGCGTAAATTACCCAATCCTGACTCAGGGAGGTAGTGACAAGAAATAGCAAACCGGGAACCTCATGGTTTCACGGTATTGCAATGAGAACAATTTAAAACCCTTAGCGAGAATCAAGTGGAGGACAAGTCTGGTGCCAGCACCCGCGGTTATTCCAGCTCCACTAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAACCTCTGTCTGGGGCTAGTTTTGGCTTTGGTCAGGCTAGTTCTAGGCATCCGCCTACAAGACTTAGAGGGCATTCAGTTGTTCACTAGGAGTAGTAGGCATTTTACTTTGAAAAAATTAGAGTGTTTAAGGCAGGCAATCGCCCGCATATATTAGCATGGAATAATAGAATAGGACACTTTTCCATTTCGTTGGTTATTGGAATCGTGTAATGATTAATAGGGACAGTTGTGGGCATTTGTATTTAGTTGTCAGAGGTGAAATTCTTGGATTTATTAAAGACAAACTAACGCGAAAGCATTTGCCAAGGGTGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCAAAGACGATCAGATACCGTCCTAGTCTTAACTACAAACTATTCCGACTCAATGTTTGACTGGCTTATATAACCAGTTGAGCGTTGTATGAGAAATCAAAGTCTTTAGGTTCTGGGGGGAGTATGGTTGCAAAGCTGAAACTTAAAGGAATTGACGGAAGAGCACAACCAGGAGTGGATTCTGCGGCTTAATTTGACTCAACACGGGGAAACTTACCAGGTTAAAACAATAGTGGGATTGACAGTTTGAGAGCGCTTTCTTGATTGGTTGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGCTTAATTGCGTTAACGAACGAGACCTTAACCTGCTTACTAGACTGGCGATCATCAATCGTTAGCTCTTCTTAGAGGGACTTTGGTTGTTTTAACTCCAAGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATATCCTGGGCCGCACGCGTCATACAATGACTAGTTCAGAAAGTTTTCTCCTGACCCGAAAGGGGATGGGTAATCTTGATAATACTAGTCGTGTTAGGGATCGATCTTTGCAATTATAGATCTTGAACGAGGAATTCCTAGTAAGTGCGGTTCATCAGACCGTACTGATTACGTCCCTGCTCTTTGTACACACCGCCCGTCGCTTCTACCGAGTGGGTGGTCCGGTGAGATAATTGAACTTCGCAGGTAACTGAGAGGAAAGATTATCAAACCTATCCACCTCGAGGAAGAAGAAGTCGTAACAAGGTT\n>URS00018335DB rRNA from 1 species \nTCTACGGGTGGCAGCAGTGAGGAATATTTGTCAATGGGCGTAAGCCTGAACCAGCCAAGTCGCGTGAGGGATGAAGGTTCTATGGATCGTAAACCTCTTTTATAAGGGAATAAAGTGTGGGACGTGTCCTATTTTGTATGTACCTTATGAATAAGGATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATCCGAGCGTTATCAGGATTTATTGGGTTTAAAGGGTGCGTAGGCGGCCTTGTAAGTCAGCGGTGAAAGTCTGTGGCTCAACCAAGGAATTGACGTTGAAACTGGGGGGCTTGAGTATGTTTGAGGCAGGCGGAATGCGTGGTGTAGCGGTGAAATGCTTAGATATCAGGCAGAACACCGATTGCGAAGGCAGCCTGCCAAGCCATGACTGACGCTGATGCACGAAGGCGTGGGGATCAAACAGGATTAGATACCCGAGTAGTC\n>URS00021B9194 rRNA from 1 species 
\nGCTTGTCTCAAAGATTAAGCCATGCATGTCTAAGTATAAATAGTATACAGTGAAACTGCGAATGGCTCATTAAAACAGTTATAGTTTATTTGATAATTGAAAATTACATGGATAACCGTGGTAATTCTAGAGCTAATACATGCTATCAAGCCCGACTTCTTGAAGGGTTGTATTTATTAGACTTAAGCCAATATTCCTTGTGTCTATTGCGATGATTCATAATAACTGATCGAATCTCAAATTTGAGATAAATCATTCAAGTTTCTGCCCTATCAACTGTCGACTGTGATATAGACGCTCACAGTGGTTTTGACGGGTAACGGGGAATCAGGGTTCGATTCCGGAGAGGGAGCCTTAAAAACGGCTACCACATCCAAGGAAGGCAGCAGG\n>URS0000AFABFB rRNA from 1 species \nTAAGGAATATTGGACAATGGGCGGGAGCCTGATCCAGCCATGCCGCGTGAAGGATGAAGGCGCTCAGCGTTGTAAACTTCTTTTGGACGGGAACAATATCCCCGACTTGTCGGGGCTTGAGGGTACCGTCAGAATAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTATCCGGAATCACTGGGTTTAAAGGGTGCGTAGGCGGTCTTGTAAGTCAGTCGTGAAATCGCTGGGCTCAACCCATGCAATTGCGATTGATACTGCTAGACTTGAATGGGGTTAAGGCAGGCGGAATGTGGCATGTAGCGGTGAAATGCTTAGATATGCCATAGAACACCGATTGCGAAGGCAGCCTGCTGGGCCTTTATTGACGCTGAGG\n>URS0001536541 rRNA from 1 species \nTACGAAGGGGGCTAGCGTTGCTCGGATTGACTGGGCGTAAAGGCGCGTAGGCGGTTTGTACAGTCAGACGTGAAATTCCCGGGCTCAACCTGGGGGCTGCGTTTGATACGTGCAGACTTGAGTTCGGAAGAGGGTCGTGGAATTCCCAGTGTAGAGGTGAAATTCGTAGATATTGGGAAGAACACCGGTGGCGAAGGCGGCGACCTGGTCCGATACTGACGCTGAGGCGCCGAAAGCGTGGGGAGCAAACAGG\n>URS0000DB123A rRNA from 1 species \nGGATGCGATCATACTAGTACTGAGGCACCGAATCCCATCAGAACTCCGAAGCTAAGCGTGCTTGGGCGAGAGTAGTACAAGGATGGGAGACCCCCGAGAAGTCCTCGTGTTGCATCCC\n>URS00009B63B2 lncRNA from 7 species \nCACACTCTGACGTTGAAACAGTTTCCATGCAGAGCGCCCCCTCTCCGCCTCCCAGTGCCCCAGGTGCCTCAGGTGTAGAGGGACTGAAGATTTTCGGGGGGCTAGCGGAATGTCAGCACTACTACTAGTGCCCATACGGCAGAATGAACTGTTTCCATGAAAACGGGGCCTAAGGAGTTGGCATCCTTATGACAGAACAGTATTTTAAAAGTCAAGGATGCCCTAAGAGCATTTCAGAAAGAGAAGATCACTTTGGGGTCCTCAAGATGGCTCACTGGGTGAGGGCACATCACCTCTAAGCATGGCAACAGGGGTTCAGTGCCTGCACCCCACACTGAGGAAGGAGGAAACGGACTCCCTCAAATCATCATCCGACCCCCACATCTGAGCAAGATCCGCCTCCCCCTCCAACACACGCA\n>URS0000351846 rRNA from 1 species 
\nAGAGTTTGATCCTGGCTCAGATTGAACGCTGGCGGCATGCCTTACACATGCAAGTCGAACGGTAGAGGGGCAACCCTTGAGAGTGGCGAACGGGTGAGTAATGCATCGGAACGTGCCCAGTCGTGGGGGATAACGCAGCGAAAGCTGTGCTAATACCGCATGTGATCTGTGGATGAAAGCAGGGGACTTGGTAGCAATACTGGGCCTTGTGCGATTGGAGCGGCCGATGTCAGATTAGCTAGTTGGTAGGGTAAAAGCCTACCAAGGCGACGATCTGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCCACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGCAGGACGAAGGCCTTCGGGTTGTAAACTGCTTTTGTACGGAGCGAAACGGTCTGGGTTAATACCCTAGGCTAATGACGGTACCGTAAGAATAAGCACCGGCTAACTACGTGCCAGCCGCCGCGGTAATAC\n>URS000003707E rRNA from 1 species \nAATGGCCTAACGGCTGAACCAGCAACTTGGAAGAATGTAGGTGTATTAATATTAATTAATGCAATAACGATTCTATCGTATAAAATTCTAAATAGATTAATGATAATGACTATTATCTGTTTATAAGTCTTGACCAAATTGCGTGCCAGCAGTCGCGGTAATACGTAGAAGACTAGTGTTAGTCATCTTTATTAGGTTTAAAGGGTACCTAGACGGTAAATTAAACCTTAACGGGTACTTTTTTACTAGAGTTTTATATGAGAAGGGGAGTATCCTTGAAGTAATGTTATAATATTTTAATAACAAGGAGACTGGTAAAGGCGAAGGCTGCCTTCTATTAAAAACTGACGTTGAGGGACGAAGGCTTGGGTAGCGAGAAGGATTAGATACCCTAGTAGTCCAAGCAGAAAATTATGAATGTCATAAGCTAGATTAGACTTTACAATTAAAACACTAATATATTCGGGATATTAGAAATAAAGAGTAGTTTAACTAAATAGGGTGTTAACTATAAGGAGGACAACCGCCTATAGGTAGTCTCTTCTAATGTAAGTAAATTTTAGCTTATAAATGAAAGTGTAAGCATTCCACCTCAAGAGTAAAATGGCAACATTTAAACTGAAATCATTAGACCGTTTCTGAAACCAGTAGTGAAGTATGTTAGTTAATTCGATAGTCCGCGAAAAACCTTACCACAATTTGTATATTATTAAATTATTACACGAGCTGCATGGCTGTCTTTAGTTAATGTCGTGAGATCTGGTTAACTCCTTTAATTAACGAAAACCCTCACCTTATTTATTTACATAAAGTGGTTCACCGCTATATTGGATTTGATAAGAGGGATTAAGACAAGTCATCATGGCCATAATATTGT\n>URS00004A8811 rRNA from 1 species 
\nCGGACGGGTTAGTAACGCGTGGGAACGTGCCCAGATCTAAGGAATAGCCACTGGAAACGGTGAGTAATACCTTATACGCCCTTCGGGGGAAAGATTTATCGGATTTGGATCGGCCCGCGTTAGATTAGGTAGTTGGTGGGGTAACGGCCTACCAAGCCTACGATCTATAGCTGGTTTTAGAGGATGATCAGCAACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTAGACAATGGGGGAAACCCTGATCTAGCCATGCCGCGTGAGTGATGAAGGCCCTAGGGTCGTAAAGCTCTTTCGCCAGGGATGATAATGACAGTACCTGGTAAAGAAACCCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGGGTTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGATTGGTAAAGTTGGGGGTGAAATCCCGGGGCTCAACCCCGGAACTGCCTCCAAAACTTCCAGTCTTGAGTTCGAGAGAGGTGAGTGGAACTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGCTCGATACTGACGCTGAGGCGCGAAAGTGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACACCGTAAACGATGAATGCCAGTCGTCGGGCAGTATACTGTTCGGTGACACACCTAACGGATTAAGCATTCCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGCAGAACCTTACCAACCCTTGACATCCTGATCGCGGTTAGTGGAGACACTTTCCTTCAGTTCGGCTGGATCAGTGACAGGTGCT\n>URS0001995650 lncRNA from 1 species \nATGCCTCGGGGTCACAATGCAGAGAAGGAACACTTCGCTCTGGACGCCCGGAGAGGGACAGCTGGCCTGGGTGTGCCAGCTTCCAAAGGGCGGGAGGGACTTCATCAGGGAGACCATCCGTCCAGGCGGCCCCCAGGGTCTGAAATGGCCAAGGCGTCCAGGCGGCCCCCAGGGTCTGAAATGGCCAAGGCGGGGTCCCGTCCGCCCCCTCCCCCGCAGGGCAGCCCGGGTCCCCAACGTGGGCCGGGGCGCGGGGGCGGCAGGTTTCCGGCCGGTCCCACCCAGGTCCCACCCAGCCGACTGGCCGGGGCGGGGACCCCCCAACCCCCCCAACCTTCCCGGCCCCCCCCCCCCCCGCCGGCCTCCCCAGCCCAGCCTGGTCCCGGGTCCGGAGGCGGGCGAGAGGCAGGGGGGAGGCAGAGGGGAGGGGCGGGGGGGGAGCGGGGGGAGGCGGGCTGGAGGCAGGGGGGAGGCGGGCGGGCGGGGAGGGAGCAGGGGGCAGGCGGGCGGGAGGCAGGGGGGAGACAGAGGGGAGGGGCGGGCGGGGGGGAGCAGGGGGGAGGCGGGCGAGAGGCAGCGGGGAGGCGGGAGCGAGCGGGCCGCTGCCCGGAGGCCGCGCCGCCCCGGCGCAAACATTTCCTTATGTGGTGGCTCCGCGGGGCCGGGGCGGCGCCGGGGGCTGCGGGGACGGCGGCCACGCCCGGGGCCTCGCGGCCACCCTGGCCCTCGGCTGGGCCGCCGCGCCGCGCCTGCTGGACGAGACCAAGAGGGGAGGCCCCCGCCCCGCGTGTCCCCCGCAGCGCGTCCCTCGTTCCCCTGAAGGAGGAGCAGACCCTGTGGCGCCCCGACTTGGCCCGCGCTTGTGGGGGCTCCCGGGTCCGGACGAAGAGGGGGCGCGGGGTCCCCCGGCCCGCCACCTCCCTGCCCCTCCCCGGCGCAGCCGCCCAGCGCCGCAGCCTCCTTGGCCTTGGGAGCTGCATTTGGGGGTGGAGGGATAGCGGGGCGACGGCGGGGGGATGGCCCAGGGCCGGAGCGGCGAGTGCCT
CACTGGAAATGTCGCGGCTCTCGGCGGGCTCCAGGCTCCAGGCTCCAGGCTGCAGCCCTCCCGAGAGAGCTCGGCCTCAAAACCTGGAGCCCGCGGCTGCCTTCCTGCGGCCAGGGCGTCCCGAGCCTGAGGAGTGCGACCCGGCTCCGACACCCCCACCCCCACCCCCACCCGAGCTTCGCAGGTGTCTGCTCCGACCCCCCAAACTGTCCTGGGGCCTCAGGCCGGCCTCCTCGCCAATTGCAGCCTTTGAGCCAACTTTCATAGCTGATAGGGCAGGTTCCCTATGGGATATTTATTAA\n>URS0000856D3B rRNA from 1 species \nTACGTAGGGAGCAAGCGTTGTCCGGAGTTATTTGGCGTAAAGCGCTCGTAGGCGGTTCCGTAAGTCGGGTGTGAAAAATCTGGGCTCAACCCAGTGGAGCACCCGATACTGCGGTGACTCGAGTCCGGTAGGGGAGTGTGGAATTTCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGACGGCGAAGGCAGCACTCTGGGGCGGTACTGACGCTGAGGAGCGAAAGCGTGGGGAGCAAACAGG\n>URS0001FB44EA rRNA from 1 species \nACGAACGCTTGCGGCGTGCCTAAGAAATGCAAGTCGAGCGGGGACAGCAATATCCTAGCGGCGAACGGTCGCGTAACACGTAAGCAACCTGCCTCAAAGACCGGGACAACATTCCGAAAGGAGTGCTAATACCGGATGTGGCCACCTTTTCGCATGTTTAGGTGATTAAATCAGGAAACTGGCTTTGAGAGGAGCTTGCGGCCTATCAGCTAGTTGGTGGGGTAACGGCCTACCAAGGCGACGACGGGTAGCTGGTCTGAGAGGACGATCAGCCGGACTGGGACTGAGATACGGCCCAGACTCCTACGGGGGGCAGCAATTAGGAATCTTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGGAGGAGGAAGTCCTTCGGGATGTAAACTCCTTTTAGGTGGGAAGAAACAAATGACGGTACCACCTGAATAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCGAGCGTTGTCCGAAGTTACTGGGCGTAAAGCGCGCGTAGGCGGGTCGTTAAGTGGGAAGTGAAAGGCTGGGGCTCAACCCCATGCAGTGCTTCTCATACTGGCGGTCTTGAGTGAGGTAGGGAGAAGTGGAATGGCTGGTGTAGCGGTGAAATGCGTAGATATCAGTCGGAACACCGGTGGCGAAGGCGGCTTCTTGGGCCTTTGCTGACGCTGATGCGCGAAAGCCAGGGGAGCGAACGGGATTAGATACCCCGGTAGTCCTGGCCGTAAACGATGGATACTAGGTGTAGGGGGTATCGACCCCCCCTGTGCCGCAGCTAACGCATTAAGTATCCCGCCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACTCTTGACATCCTGCGAACTTGGCTGAGAGGCTGAGGTGCCGAAAGGAGCGCAGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTACCATCATTAAGTTGGGGACTCTAAGGAGACTGCCGGTGATGAACCGGAGGAAGGCGGGGACGACGTCAAGTCATCATGGCCTTTATGGGTAGGGCTTCACACGTCATACAATGGTCGGTACAGAGGGTCGCCAACCCGCGAGGGGGAGCTAATCTCACAAAGCCGATCGTAGTCCGGATCGCAGTCTGCAACTCGACTGCGTGAAGTCGGAATCGCTAGTAATCGCGGATCAGCATGTCGCGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTT
CACCAGAAGAGGGTAGCCTAACCGCAAGGAGGGCGCTCGCCACGGTGAGATTCATGACTGGGGTG\n>URS00021EF114 pre_miRNA from 1 species \nGCTGGTTTCCGATGGTGGCTTAGAGTGCGGTCCTCCATCTAGCACCATTTGAAATCAGTG\n>URS000103BC31 rRNA from 1 species \nTACGTAGGGTGCGAGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGCGGCGCGGTAAGTCGGGTGTGAAATCTTGGAGCTTAACTCCGAAACTGCATTCGATACTGCCGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCGGTGAAATGCGTAGATATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACGCTGAGGCACGAAGGCCAGGGGAGCAAACGGG\n>URS00005A39E1 rRNA from 2 species \nGGGATGGGGGGCATGCTATACATGCAAGTCGAGCGAACTGATTAGAAGCTTGCTTCTATGACGTTAGCGGCGGACGGGTGAGTAACACGTGGGCAACCTGCCTGTAAGACTGGGATAACTCCGGGAAACCGGAGCTAATACCGGATAACATTTTCTCTTGCATAAGAGAAAATTGAAAGATGGTTTCGGCTATCACTTACAGATGGGCCCGCGGTGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCAACGATGCATAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGCTTTCGGGTCGTAAAACTCTGTTGTTAGGGAAGAACAAGTACAAGAGTAACTGCTTGTACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGGAACTTGAGTGCAGAAGAGAAAAGCGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGGCTTTTTGGTCTGTAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCTGGTAGTGCACGCCGTAAACGATGAGTGCTAAGTGTTAGAGGGTTTCCGCCCTTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGGTCGCAAGACTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTCTGACAACTCTAGAGATAGAGCGTTCCCCTTCGGGGGACAGAGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGATCTTAGTTGCCAGCATTTAGTTGGGCACTCTAAGGTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGATGGTACAAAGGGCTGCAAGACCGCGAGGTCAAGCCAATCCCATAAAACCATTCTCAGTTCGGATTGTAGGCTGCAACTCGCCTACATGAAGCTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGTCGGTGGGGTAACCTTTATGGAGCCAGCCGCCTAAGGTGGGACAGATGATTGGGGTGAAGTCGTAACAACAGC\n>URS000041F567
 rRNA from 1 species \nTGGATCCAGACTTTGATCATGGCTCAGGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGAAGCTTGACGAATGATTTCTTCGGAATGAATTCCGATATGACTGAGTGGCGGACGGGTGAGTAACGCGTGAGGAACCTGCCCTTCAGAGGGGGATAGTGTTTGGAAACGAACAGTAATACCGCATAATGTATTTTTACCGCATGATAGAAATACCAAAGATTTATCGCTGAAGGATGGCCTCGCGTCTGATTAGATAGTTGGTGGGGTAACGGCCTACCAAGTCGACGATCAGTAGCCGGACTGAGAGGTTGAACGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGGGAAACCCTGATGCAGCAACGCCGCGTGAAGGAGGACGGTTTTCGGATTGTAAACTTCTGTTCTTAGTGAAGAAAAATGACGGTAGCTAAGGAGCAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTACTGGGTGTAAAGGGGGCGCAGGCGGGAGAGCAAGTCAGTTGTGAAATCCATGGGCTTAACCCATGAACTGCAGTTGAAACTGTTCTTCTTGAGTGAAGTAGAGGTTGGCGGAATTCCGAGTGTAGCGGTGAAATGCGTAGATATTCGGAGGAACACCGGTGGCGAAGGCGGCCAACTGGGCTTTTACTGACGCTGAGGCCCGAAAGTGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACACTGTAAACGATGATAACTAGGTGTGGGGGGACTGACCCCTTCTGTGCCGCAGCTAACGCAATAAGTTATCCACCTGGGGAGTACGACCGCAAGGTTGCAACTCAAAGGAATTGACGGA\n>URS000022D4E2 rRNA from 1 species \nCGGACGGGTGAGTAACGCGTGGGGAACCTGCCCTGTACAGGGGGATAACACTTAGAAATAGGTGCTAATACCGCATAAGCGCACAGTATCGCATGGATACAGTGTGAAAAACTCCGGTGGTACCAGGATGGACCCGCGTCTGATTAGCTGGTTGGCGGGGTAACGGCCCACCAAGGCGACGATCAGTAGCCGGCCTGAGAGGGTGAACGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGAAGGCAGCAG\n>URS00023619E2 lncRNA from 1 species \nAGCACAGATCCATTAAGGCTGACCACAAATTGATCATAATGTTTGTGAATAGATTTGAATGAATTTGAACTCTTAGCCTAAGCTTTTTTCTTTCTATCAATAAAAGAACAATATCTATAATTATGTTTACTGCTCCGTTCCTTCGATCTACACCAACAATGTTTGTATTTTTGGGGAGATCCGGTGCTTAAAGTAAAATTTTTAACGCAATGAATAGGGTGCATTTTTTTCTGATATTTTGGTTTCTCTGTTCCCTATTTATCCAAAATATGCTCACCCCAAATTCTTTAGTGCAAGAGCATGATGGAGCTTTCTCTTGCTGCTTTTCCTTGAAAGAAAGAATGGCAACCAGGAGGTGCTTGTAGCTAGCCACTTAAGTAGGCATGTGCCTCCCCAAAGCACACACTTAAAATAGAACAAGCTTGATCTTGAAGACTATTTAATCGACAAGATGATACATTTTGCGAGAGGAAGTATTAAGATAATAACAAGCTCGAAGACATCCGTACGTTGTCGGCTAGGATTCCTTTAGATTAATGGATTGGAGATCATCATCCCTCTTCACACCCTACATTCTCTAGATGCTCTTATCCTTGGCATCTGCACGAACAAGGATTTGTA\n>URS00025F6FB7 lncRNA from 1 species 
\nGTCACAGGAGGGAGAGAGCATTGTTAGATCCATGGACATGCAAGGAGAGGGATGCTCCTGCAGAAGCATGGTCCCCAACTATAAAGGCAGCATTGAATCACAGAATCATTGAAAAGGTTGGAAAGCCAATAAGAACATCTAGTCCAACAATCAACCCATGCCTGTGACTGCTCAAGACCATGTCATCCATGGATACAAAAGGGTTTTCCTTTCGGACAATATGAAACAAAGTGCTTGGTGGGATCAGACCAAGCAGCAGAGCCTTGCTTTGGAGCAGCTGCTCGTGCCACGTTGTTTTGTTTGCTGATGTCCTTGGGCTCTGCAACCTGACAGAATGCTGCATTCCTGGTGCTCCTGCTTTGCATTGGGATCAAACTGAAAGCTGGTATCTGGTGCCAAGAGGAAGGAGAGCTTTGGATTTTTGACCCTGAGCATGGAGCTCTCACTGTTGGGCTGTGAGCTCTTCACAGCATGAAGAAAGCACGATTCACTGCTGTAACGGAGTTCTTCAGAAAAAAAAACGTGTTGTATCCTGGGTATGAAATGCCTAATCAAATCATGTTTACTGCTCAGCACTACACTGC\n>URS0000B25448 lncRNA from 8 species \nTGGAGCCAGCTTATTCTAGACCAAAAGGGCCTGGACTGTTCTAGGTACAAGATGGTGCCATGAATGTGCCAATCTCGCCTCTTAAGAAAATGTTAAAACTAAAGTAAGTGCATAAACTATTAAACTAAATGCATGAGTCTTATTTACATATAGGAAATGGTAATTCAGAAAGCTAGCCTGTGAGATTATCAATCATCACCAAACCAGATCTTGATGACTGTCACATCTCTGCTATATTTTCCAAATAGGAAATCCCATTTACCAGGGCCCTCCTGAAATGCCTGGGATTATGCCAAGGATCGCTTCCCTAGTTATTTTTATGTGTAGACCTGAGGAGTGGCAGAGTATGTAACCTTTAAAGATCATTAAGCACCAGTCTTGGGCTCAGCCTGAATTCTCACTCAGCAAGAGTAATGTAATTGCAATTATAGAACTGATCCATTTTATCACTTTCTGAGAGATCAATTGTCAGAGATTGAGACTCTTAATTCATCCTGGGTTTTAAGGAATATTTAAATGAGAATAAGGAATAAATTGAAAACATCAAGAAACTGACACAAA\n>URS000236373A lncRNA from 1 species 
\nATTTTATTTGTCTTGGACCAGCGTATCCTTTTGGGGGGAGGTGGGGAGACCTACGAATATTTGAGGAAGAAGCAGCTACCATATTTTTCATTCTCGCGCCAAGAATAAGGGCTCTGGAATTTGGACAGTCGATTGGCATTTGCAGATTCAAACTGAGGAGAAGAACACTAGCGCAAGAACATGAGTTCCGCGACACAAGGTGAACATTCTCGATCTTCTGAAATTTTCTGTTCTTGTTTGTAGCAGTCGCCGATTTATTTTTGATTGAATTTCTGAGACTTGTATTGTTTGACACGATTATGTTGGTATATATTATTTGCATTCCCATAGATGTTGATGGTTGCATCTAATGCGCCACAAATAGAGCGCATCTCGGCGAATTTTTTTCAATTTTCATAAAATATGTTGGATTTATGGAATATATGTCTCAAGCTTGTGTATTACTTGTCGCTGCATACTCAAATATTTTTCTATGGATAGTTGTAATTAATCAATAATTCATTGGGATTAGGTTTTGTGCAAATATCTTATGAATATTTTCTGTAAAATATAATGAGCCTCCTTGACAGCCTCTTGCTCTCTTGATAACTCATATAATTTGTGTACTTCTTGTTGGGGTTGATGGTTTGCAGATGGGAGCAACGGGTTTGTTCGTGGGGGTCGGGTAAACAAGACCGACAAGACTCGACGCAGTTGGTCTACTCAAGAGGAGGCAGTGCTGCTAGCTGCGTTGAAAGAATTGGTGGTGCAAGGATGGAAATCCGACAACGGATTTCGGCCAGGTTATTTGACTAAGTTGGAGGAGGCTATGAAAAAGGTATTCCCAACCACTGACTTGAAAGGGATGCCACATATAAACTCAAAAACCACGACATGGAAGAAGCAATACTATTCGCTAACGCAAATATTGGGGAATACTGGGGTGGGCTTCAATGTGAATGGCATGCATATGGTGGATTGTAATGACGAGCAATGGGAGCAAATCATCAAGGTTAGTAGGTGTTCATATTGTAATATTAAATTCAGGCTGTACAAGTTTTCTAATATGTCTAAATGAACTACAGAAAGATACAAACGCACGCACAATGCGTTACAAAAGTTGGCCCTACCTGGAACAGTGGGCTGAAATATTTGGGAAGGATAGGGCGACGGGAGATGTGGCTGAAGATCTTATGGAGGCCGCACATGACATGTATCGCAAGATTGATCTTAGCGAACCACAAAATGATGGTGACTATCATGTATCCCTCGATGACATGTTCGAGAAGACCGCAACCAATGACAGTGTCAGCCAAACACAAGAAACCGAGTCTGAAGTTCGTGTCAAGCGGAAGAAGAGAAAGCAAGGCGACGAGTTCGAACAAATGTTTCAGGTGTTGGCAGATATCCAACGCACAACCGGACAGCGACTTGTCACAATATCAAGTAGAATGGGCTACGACTTCGACGTATCCAAAGCGAGAAAGGAGGTCTTCGCACAACTAAGCTCAATTCTGGGTTTATCCCTCAAAGCGAAGTTCGAAGTCGCCAATTTACTTGCAAAAGAGGTGGAGATGCTCGATGTATTTACTAGCCTGCCCGAAGAAGCCAAGAATGAGTATGTCAACTTCCTACTCGAGGAGAAATATAAATAGGATTGCTTCGCTGCACCATAGGATCTTGGGTGTTTTTTGGTTTCAAATTTTATTTGCTAACAACTCCTTCATTTCTGGAATTATGTTAGACCAGTAGAACTGCTGTTTCTTTTTATTTTTGGTGTCTTGGAGCTTAGTTCAGACATATCTTATCAAGTGGCTGTATTTTGGAGTCTTGCAGAAGCCACTTGTCTTAAATTATGCAGTTGAAGCTCGACAGAACTTATTTGACATTTTATGTTGCTTTCAAATTTGAATATGTTGGTATGTCTGTTTCAGATTTGCTTATGTTTTATCTTGCGGTGGATTACAAAGGCTTTTGTATAATTTAAATTGTAGTTTCAATAGGGATTTATTTAAATTG
CATATGAATCGAAAATTGCTAATTCAGATAAGTTCAAACACAGCTCCCACAGTAAGCACAAATTCATCATAACTAGAAATCATGAGAAAACCAACAAACACAATAGACAATAACAAAGCTGCCTTCATCTACGAGGCACCAAAATAAGAGAAACAACGGTAGACACTGGACCTAACAGCGTGCATCGACGCTAACAAAATGGGAGGGAATAAAATGCGGTCCACAAAAGAGAGTAAGCTCCGCTTACAAATTTATTTAAATGGAGAAGACGAAGCACATGAGCTCCCGCCATAACCGACGTCATCTTTCTTACCATCATTCGGTTTCACGGGAAAGGCGTTCTTTGGAGGAAAGGAGGACGTCGTTTGTTTTGAAAATTTGTTCTTGATGGTAGACCATGGGACGTAGACATGACCCTTATGCGATTTGGGAAACGAGGGAGACACACTCGAACATGCATCATCTGGCTGAACTACCAAGGCACACAGTGGTTGGGTTTTAGTAGACGGGGAGTTCACTTCGTCCTCCGATGAAGTGTCGGTGAAGCTTTCAAATGGAGGACTCTTTTCACCTTTTGACGAGTCCTCTATCACTATCACAGTGTGTGAGATCTCGGGCTTCACATCGTACATTCCGAAGAGGGAGCACAATTTTAGGTACTCGGGCTCACCCTTATGGTAGTAAGCTTTGTAGAACTCATTTTCCTACAACCGATAGTGACTTGTATTAGAAAGACTAGCACACAACAGATTTAAATGATTTAGAACAGCAAAAACAATAGTTATAAAGCATCTCACCTTGAAGAGTTGCTCCCACACTTCATCGCTTGCATGAAGAACATTTGTCGACGCGTCCCGATCGGTCTCCGGGATATTGCAAAGATACTTGAAACNAGCTCTGGAAAAGTCAGCTCTGCCTTTGGTCAGCTCTGGCGATTTTAGCTCTGGAAGTCGGCTCTGGCTCCGAAGTCAGCTCTGGTGACTTAGCTCTGGAACGTCAGCTCTGGCTTCTAAAGTCAGCTCTGGCATGTTGGCTCTGGAAAGTCAGCTCTGGCCTCCGAAAGTCAGCTCTGGCGATTTGCTCGGGAAAGTCAGCTCTGGCCTTCGAAAGTCAGCTCTGCTCTGGCGGTTTCCAGCTCTGCTCTGGAACTTCCAGCTCTGCTCTGGTGTTTCCAGCTCTGCTCTGGAATTTCCAGCTCTGCTCTGGAACTTCCAGCTCTGCTCTGGCATTTTCTAGCTCTGCTCTGGCATTTCCAGTTCTGCTCTGGCATTTCCAACTCTGCTCTGGCATTTTCTACTCTGCTCTGGCATTTTCTAGCTCTGCTCTGGCATTTTCTGTTCTGCTCTGGTATTTTCTGGGCAGAACGACGAGGGTTTCCAGTTTCCAAAACTAGGGTTCTTTGTCCTTTCTTGCCTCGATTCTCACTCGTACGTCGGCCCTAATCTATTCCTATGTGAGCATGCTGTGCTTGTTCAAGTTCATCTACGTTTAAAGCCTAAAGTTCTCGTCGTTTAATCAAGGTTTCAAGCCGTGGGTTCTACCGAAAAAGTGACTTAACATGCTTCTTGTGTTCGTGCGTATCTAGAGCCTAAAACATGCTTTCTACGAGCGTGTGATTCATGCTGAAAGGAGAGGTCGAGAGTTACCTTGATGTCGCGCGCTTTGGTCGGACAAGCACGATGGTTCCTCGCTTCTCCGATCGTCGAGGTTCAAGGTGTCGAGAGAGTGATGGAACTCTTGCTGTTGCTGCTGGATTTCAGAGTGCCGAAGGAAGAGGAAGGGTCACACAAAGGGGTTGAAGGGGAGTTTAAATAGGGTGTTCGGCTGATGCACTTGAGTGCCTAAGGGGAGAGCTTCGGCTGTAGCTCTGCACAGCGTGGAAGAGGGGTGCAGCAGGCGTGCTAAGCTCTGCTGTGGTGTTGCGTGGGGAGGGCTGCTGCTGCTCTGCCGGCGTGGAGATGGAGTGTGGCCTTTCGGCTGCTCGTCCAATGGAGGCTGCT
GCCGTGGCTGCTCTGGTCTGGCGTGGAGTGTGGCGTGGCGTGGAAGAGGGGTGCAGCAGGCGGCCCTTCGGCTGCCCAGCCAATGGGGGCTGCTGCCGCACCTTTTCCTACTTTTCCTTTTCTCCATTTTTCCTTCTTTTCTTAACTTGTAGCGTTGGCAAGTGTTGGGATTGGGTGGCGTGAGTGGTGAAGTGATCTAAGAGAAGATCTAAATAAAATCCTTCAGTGTCGGTCATTCTCAGTATTAAAAATACTGGTTTCGTGCTTGCTAACATCGATAAATGCTAAATTAAATCCATAGACTCAATCCGTTCGTCATTCTAATACTTAAATTAAATCCGTAGATTTAATTAGCTTCAAAGTCGGAAATAATTCACGACTTAAGTAACAATGTGAAATAAACTCTATCTTGATAAATAACCCAACTTAGCTAAGTTGGTTATAACTTTGAAGAATAATAATTCATCGACTCAAGGATTCTCATCGCGGTCTTAAACACGCGAAGCTAAATAAATGCATACTTGCTAGTGTAGTGACTCTGTCTCCAAAATACGAAATTCATAAACATAGATGAAAACATGAAACGCTTCAATTACTGGCAGATAGAAAAATAAACATGCAAAAACTGAAATTAAATGATGATAAAAGAGCGGGTTGCTACAACTGAACATCGGGCGGAAGCTTACATCAGAACATACGAGGCAAATCATTATAATTCGGCTCAAAGGTATATACGTCAACATCGTTATAACTTCTTGAATATTAGAAATTTCAAGAAGAAAAGCAAAGTAGGTACAGCTTATTTTCCATAAGGAAACATAATATCAAGAGTACCACAGCAAAAGGCGTAACAATTATATGTATGAAGACATATAACCGCGAGTATATTGCTTGATTAGAAAGGAATAAGACATCATCTCACTAAGGTTTTATCAACATCAGAAGGAAAGCAAAGTACATCATCCTTAAGACTCTAACATCAAAGGAAAAACAATATAGAAACTTCATCAATGAAACCATCCCCACCAGCACCAGTCCAATCTTGCTCCATTGCTTAGCCTGCACATTTAGGCTATGTTTGGTGTCTGGTAATGGATTAGGCAATATAGTTTATTTTCGGCTACCTAATCTTGATTACAATGATATTAGTATGCTTTGTTGTTGTTTGATTATTTAAATAGTTACATAACAATCTATTTTGGTTGGTTTGGTGAGCAGTAATAATAGCACGATTAAAGCTGAATAGATGATAAAATGACTAATATACCCACCCATTTTATTTGTCTTGGACCAGCGTATCCTTTTGGGGGGAGGTGGGGAGACCTACGAATATTTGAGGAAGAAGCAGCTACCATATTTTTCATTCTCGCGCCAAGAATAAGGGCTCTGGAATTTGGTACAGTCGATTGGCATTTGCAGATTCAACTGAGGAGAAGAACACTAGCGCAAGAACATGAGTTCCGCGACACAAGGTGAACATTCTCGATCTTCTGAAATTTTCTGTTCTTGTTTGTAGCAGTCGCCGATTTATTTTTGATTGAATTTCTGAGACTTGTATTGTTTGACACGATTATGTTGGTATATATTATTTGCATTCCCATAGATGTTGATGGTTGCATCTAATGCGCCACAAATAGAGCGCATCTCGGCGAATTTTTTTCGATTTTCATAAAATATGTTGGATTTATGGAATATATGTCTCAAGCTTGTGTATTACTTGTCGCTGCATACTCAAATATTTTTCTATGGATAGTTGTAATTAATCTAATAATTCATTGGGATTAGGTATTGTGCAAATATCTTATGAATATTTTCTAGTAAAATATAATGAGCCTCCTTGACAGCCTCTTGCTCTCTTGATAACTCATATAATTTGTGTACTTCTTGTTGGGGGTTGATGGTTTGCTAGATTGGGGAGCTAACGGGTTTGTTCGTGGGGGGCCGGGTAAACAAGACCGACAAGACTCGACGCAGTTGGTCTACTCAAGAGGAGGCAGTGC
TGCTAGCGGCGTTGAAAGAATTGGTGGTGCAAGGATGGAAATCCGACAACGGATTTCGGCCAGGTTATTTGACTAAGTTGGAGGAGGCTATGAAAAAGGTATTCCCAACCACTGACTTGAAAGGGATGCCACATATAAACTCAAAAACCACGACATGGAAGAAGCAATACTATTCGCTAACGCAAATATTGGGGAATACTGGGGTGGGCTTCAATGTGAATGGCATGCATATGGTGGATTGTAATGACGAGCAATGGGAGCAAATCATCAAGGTTAGTAGGTGTTCATATTGTAATATTAAATTCAGGCTGTACAAGTTTTCTAATATGTCTAAACGAACTACAGAAAGATACAAACGCACGCACAATGCGTTACAAAAGTTGGCCCTACCTGGAACAGTGGGCTGAAATATTTGGGAAGGATAGGGCGACGGGAGATGTGGCTGAAGATCTTATGGAGGCCGCACATGACATGTATCGCAAGATTGATCTTAGCGAACCACAAAATGATGGTGACTATCATGTATCCCTCGATGACATGTTCGAGAAGACCGCAACCAATGACAGTGTCAGCCAAACACAAGAAACCGAGTCTGAAGTTCGTGTCAAGCGGAAGAAGAGAAAGCAAGGCGACGAGTTCGAACAAATGTTTCAGGTGTTGGCAGATATCCAACGCACAACCGGACAGCGACTTGACACAATATCAAGTAGAATGGGCTACGACTTCGACGTATCCAAAGCGAGAAAGGAGGTCTTCGCACAACTAAGCTCAATTCCGGGTTTATCCCTCAAAGCGAAGTTCGAAGTCGCCAATTTACTTGCAAAAGAGGTGGAGATGCTCGATGTATTTACTAGCCTGCCCGAAGAAGCCAAGAATGAGTATGTCAACTTCCTACTCGAGGAGAAATATAAATAGGATTGCTTCGCTGCACCATAGGATGTTGGGTGTTTTTTGGTTTCAAATTTCATTTGCTAACAACTCCTTCATTTCTGGAATTATGTTAGACCAGTAGAACTGCTGTTTCTTTTTATTTTTTGGTGTCTTGGAGCTTAGTTCAGACATATCTTATCAAGTGGCTGTATTCTCGGAGGCACACAACAGATTCATATGACCATTTCCACAGCTGCATAGAGGGGTAGGTGTTGATGTCTCAGACGCGGCGTCCATCCTACAACACCAATGTATAGTATTTTAGTATTTTGACATGAGTAGCATAGAAATTGATAGAAAACTTATATGGCCATGACAAGCAGCATCGCAGCAAGATCAGATAAATATTAACAAGGGAATTAGCAAGAGACCACTAGAGACTACTATATTCATTGTAAAAATCAACAAGATTTTAAATTTTATTCACATCAATATCATCAACAGCTGAGATAAGGATTTCTTATGAATTAAAAAATTATTACAATTGTCGAAATCGAACACAATTAAATGGAATTTTATCATGTAAACCCAACATCATCAAAATCACAGCTGAACACAAGCAAATTAGAGATAGATGTCACCAAGAACTTGCTGCAACAGTTTAAAGACGAATTAACATGCAACATTCTAAAGAGAACACCTTAAATGAATGTAAAAATTATTGCAATCGTCACCTAATGATTATTCAAGTATTGAAGCCACATCCCCTCCGCCAATTCATCCCTTGCGGCATTCCATTGGGGAGAAGACTCGACCGTGGCAATGAACTCGTCATGATCGGCTTCAAGGCCATGAGCATTACTATTTGCCATCGCATCAAATTCCTCTTCTATTGGATCGACCGGCATTTGCATTCGAATAAAATTATGAAGTAAAAATGTTGCCATTATTAACCTATTTTGGACCTTAATTGGGTAGAACGTGGTGGACCGTAGAATACCCCACGCATTTTCATAATTCCAAATGCTCTCTCAATCACATTCCTCGCCTTACTATGCCTCAGGTTAAATAACTCCTCCTTGTTTTGGGCCTGGCAGCAGTGGGACCCCACTCCTTCAGGTGGTATCTAA
CGCCCTTGTAAGGCGTTAGAAAACCATCACTATTTGCGTAACCGTTGTCACACAAATAGTAATTTCCTGTTGAAGCCCCAACAAACCAAAACAAAAGAGTAATTTAGGTAAACTTTGATAAATAATCCACGTAAACACAAACGCTATTCGAATTAAAGAGCAAATAATTGGCATTACCCTTTGGCACTTTAAGACCGTGGGGTCTACTTATGGCATCCCTTAATATCCTAGAATCTGCAGCAGAGCCTTCCCAACCGGAAAGAACGTAGACAAACTTCAAGTTTCGGTCACATACACCTAACACATTCTTGGATATCTGTCCTTTCCTTGTCCTATAGCGTGCTTGGTCGTTAGTGCTCACCATCACATTAACATAGGTGCCGTCTATAGCTCCTAGACAACCCTAAGTTGAAGAGAGACATTTAAAAACGAGTTAGTGCTAATAAAATTTATGATCATACTTACTAGAATAACTACAAGGCTGCCCTACATACCTTAAACCACTGCCACCGGCCATCTGTACAGTCATTGGACACAGCTTCCGGTTTTGATAAAAAAATTTCGTGTATCTTCAATATTGCTCCTAACACGGCATGTACGTAGCGCGATATGGTTTGCCCAGAAACGACAAAAATCAAATCTTACAACTCTATTTTTCTTTGTGATGTGCTAAGACAGACAAGAAAATGGCTACTTGTTCCTCCACACTCACGTAATCACCATCAACTAAGCCTCCCAAACCCCGTAAAATGGTGCACAACCGCCCGAAGGTATTACGATCCATTCGCAAGTTCGCGATGCAATCGACATCATTGACACTTATCAGCCTACTTAAATATTTTATTTGGTCCGGCATTCTACTTATCATCCCATATTTTCGTGATCCAAACCCACGTTTTCTTTTTCTTGAGCTAGACTTGATAAAATATGTAATTACTATAACCAACTGCATTATATGCTGAAGCATTATTTCTTGCAATAGCAAGAACAAGATATCGGACATACGGGGACGTACACGGCCAGACATCTAAAATAGAAACAATAAGAGATAATTATAACTTATATTCACTGCATTTCACCACCATGGCAGATTTATTTAAATTAATTTCAGTTTGAGCAAGTGATGGCAGAAACAAAACGAACCATGAACATATCATCAATCAAAATGTAACTGCAACAAGTGTCGTACACCAAGAGACAATTATAACTTATATTAATTGCATTACCAGGCACTATGTCAGATTTATGCCAACAAGCCATTCAACAACCAATCAATAATTCATCACCACATTAAAACTGTACTACCGAGAAAAAATCCCAATAAGCAAATATTTTCTCATAAAAAAAAAGAATATGTCATGCATATCAGGAAGAGATACTATTCAGCCACAATAGGCACTCCGTTAATTCTTTCAGAAATCATATTATGTTATTGTTTATACATGCATCGATCGTCAATTTGATAGTTTAAAAGACATATACAACGAGTGTGATTTATATATATCCCTAGAGATAACAAGCAATCGGACAAGCACTAACCTTGGTCTGTTCACAAAGCCTTCGACGTGGAGACTGAGGCTGCTTTCCGATGAGCGTAGCGACCAGAAATACGGACAAGAAATCCCAAAGTGTTTTGGC\n>URS0000A5EA3D rRNA from 1 species \nTACGTATGGGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGAGTGCGTAGGTGGTTACCTAAGCGCAAGGTTTAATCTTGAGGCTCAACCTCATTCTGCCTTGCGAACTGGGCTACTTGAGTGCAGGAGGGGAAAGCGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTACACAGAACACCAATTGCGTAGGCAGCTTACTGAGCCGACACTGACGCTGAGGCACGAAAGCGTGGGGATCAAACAGGATTAGATACCCCGGTA\n>URS00009D2B09 rRNA from 1 species 
\nTACGAGGGGTCCTAGCGTTGTTCGGAATCATTGGGCGTAAAGAGTCTGTAGGCGGCTAGATAAGTCAGGTGTGAAATCCCCGGGCTCAACCCGGGACGTGCATTTGATACTGTCTAGCTTGAGTATGGAAGAGGCTAGTGGAATTCTTGGTGTAGTGGTGAAATACGTAGATATCAGGAGGAACACCGGTGGCGAAGGCGGCTAGCTGGTCCTATACTGACGCTGAGAGACGAAAGCATGGGGATCAAACAGG\n>URS0000CEB689 lncRNA from 1 species \nCACCCGCCCTGACACCGTCCTGATGGGGGTCCTGCAGAGAAGACTCCTTACTTAGCCCACAGTGCTCCCACCCACCCTCAATGTATAACTTCACGTTCAGAAATGTGTTACCCCCCTCCTCAGACCTCACACAATTCACGAATTTCCAAACAGCAGGAAACAGAAACTTCTAAGAAAGCAGAACCCTTGAGTCCAGGTGGGAGAAGGTGCCTGAGAAAACAGCCCTGCCAGAGACAGTACCCCAGCATCCGGACGTTACTCCACAGACGGCCACGTGAGAGACCGGGAACCACCCTTCCCACCGTACCCCAGCGTCCGGACGCTACTCCACAGACGGCCACGTGAGAGACCGGGAACCACACTTCCCAAGCCTTCTGCACTCCCAAAAACATCAGCTTCCCGGAAACCTGAGACATGCTCAAGGAAGAGCACGGTGTGAAGTCAGCTGTGGGTGGAGGATGACCCAGGTGCCCAGGCAAGAGACTGAAGGCACAAACTGTTTCAGTATAATAAAGCAAATAGAATAAGAA\n>URS000155D742 rRNA from 1 species \nTACGAAGGGGGCTAGCGTTGCTCGGAATCACTGGGCGTAAAGGGTGCGTAGGCGGGTCTTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGAAGATCTTGAGTTCGGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAAGAACACCAGTGGCGAAAGGCGGCTCACTGGCCCGATACTGACGCTGAGGCACGAAAGCGTGGGGAGCAAACAGGATAG\n>URS000074D688 rRNA from 1 species \nTTTATTCAGGGTTCAAAATNAACTTNGGCGGCGNGNATTAGNCATNCAANTTNGTCCTTCCCCAAGGCAGGGCGAGGCNCAAGGGTGANTAAGGCGACGTAANCAACCCCGAGGATGGGCATANCCGCGGNAAANTGCNGGTNATTCCCAGCGACGTCGAGACGTGNCATCACGCTTCGACCCAAAGGTGTGAATCCCCTCGGGACGGNCCNTCGTGGTATCAGGTAGTTGGTGGGGTGATGNCCCACCAAGCCAAAGACGCCTACCGGGCGTGCGAGCGTGGCCCGGCACACTGGGACTGAGACACTGCCCAGACACCTACGGGTGGCTGCAGTCGAGAATCTTCGGCAATGGGCGCAAGCCCGACCGAGCGACGCCGCGTGGAGGACGAAGGCCTTCGGGTTGTAAACTCCTGTCGAGGGGGAACAAGGGGGCGTGAAGAGCGTCTCTTGAGTGATCCCTGGAGGAAGCACGGGCTAAGTTCGTGCCAGCAGCCGCGGTAAGACGAACCGTGCGAACGTTATTCGGAATCACTGGGCTTAAAGCGCGTGTAGGCGGAGTGACACGTCGGATGTTGAAAGCCCCCGGCTCAACCGGGGAACGGGCACCGATACGGTCGCTCTGGAGGGGCGTAGGGGGAGCTGGAACTTCCGGTGGAGCGGTGAAATGCGTTGAGATCGGAAGGAACGCCCGTGGCGAAAGCGAGCTCCTGGACGCCATCTGACGCTGAGACGCGAAAGCCAGGGGAGCGAACGGGATTAGATACCCCGGTAGTCCTGGCCGTAAACGATG\n>URS0000AF452E rRNA from 1 species 
\nCCTACGGGATGCACCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGAGGAGGAAGGCGTTAAGGTTAATAACCTTAGCGATTGACGTTACTCGCAGTTGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTCTGTCAAGTCGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTCGAAACTGGCAGGCTAGGGTCTTGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGTCCACTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTCGTAGTC\n>URS000178FACD rRNA from 1 species \nTACGTAGGTGGCAAGCGTTGTCCGGATTTACTGGGCGTAAAGGGCGTGCAGGCGGTTTGTTAAGTGCAGGGTGAAAGCTCCCGGCTCAACTGGGAGAGGTCCTTGCATACTGGCAAGCTCGAGGGAGGCAGAGGAAAGTGGAATTCCCGGTGTAGTGGTGATATGCGTAGATATCGGGAGGAACACCTGTGGCGAAGGCGGCTTTCTGGGCCTTACCTGACGCTGAGGCGCGAAAGCTAGGGGAGCAAACGGG\n>URS0000F98CBA rRNA from 1 species \nTGCGTAGGCGGGCCCGTAAGTCAGTGGTGAAAGTTTGCGGCTCAACCGTAAAATTGCCATTGAAACTATGGGTCTTGAGTGTAAATAAGGTAGGCGGAATGTGTTGTGTAGCGGTGAAATGCCTAGATATAACACAGAACACCAATTGCGAAGGCAGCTTACTGGGATACAACTGACGCTGAGGCACGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCC\n>URS00020667BA rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTAGAACGCACAGTTTATACCGTAGCTTGCTACACCATAAACTGTGAGTTGCGAACGGGTGAGTAACGCGTAGGTAACCTGCCTGGGAGCGGGGTATAACTATTGGAAACGGTAGCTAATACCTCATAATATTGATTATTGCATGATAATTGATTGAAAGATGCTATTGCATCACTACCAGATGGACCTACGTTGTATTAGCTAGTAGGTGAGGTAACGGCTCACCTCGGCGAGGATACATAGCCGACCTGCGAGGGTGAGAGGCAAAACTGGGATTGGAACATGGCCCAGCCCACTACGGGAGGGAGACGTCGGGAACTCCTGGGAATGGAAGCAAGGCTGAACGAGCAACGACGGGCGAGTGAAGAAGGCTGTCGGATCGTAAAGGTCAGTTGTACGAGAAGAATGGGAGTGAGAGTGGAACGTTCACACTGTGACGGTACCTGAACAGAAAGCGACGGCTAACTCCGTG\n>URS00019D34DB guide_RNA from 1 species \nAAAACACGAGACAAAGTAAAGAGGGAGAATAGATAGAATG\n>URS0000089A8C tRNA from 1 species \nTCTAGAAGAATGGGACTTGAACCCACACCTAAGACTCCAAAATCCTTCGTACTACCACTATACTATCCCCTA\n>URS00017CC75E rRNA from 1 species 
\nATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTAGAACGCGTGGCGGACGGGTGAGTAATGTCTGGGAAACTGCCCGATGGAGGGGGATAACTAATGGAAACGGTAGCTAATCCCGCATACCATCGGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAACGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGGGAGGTGGACCAGCGCCCATGGAACTTAGACACGTTCCACACTCCTACGGGAGGCAGCTGTGGGGAATATTGCACAATGGGCGCAAGCGTGGTGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGAGGAGGCGTTACTCGCAGAATAAGCACCGGCTAACTCCGTGCCAGCGGCCGAGGTAATTC\n>URS0001993F25 snRNA from 1 species \nATGCTTGTTTCAGTAGCACATAGACTAAAATTGGAACAATACAGAGAAGATTTGCATGGCTGTGTGCAAGAATGATAAGCAAATTTGTGAAGCATGCCATATTTGG\n>URS0001E9A07D rRNA from 1 species \nGATGAACGCTGGCGGTATGCTTAACACATGCAAGTCGAACGGACTCTTCGGAGTTAGTGGCGGACGGGTGAGTAACGCGTGAGAATCTGGCTTTGGGTTCGGGACAACCACTGGAAACGGTGGCTAATACCGGATGTGCCGAGAGGTAAAAGAGAAATTGCCTGAAGATGAGCTCGCGTCTGATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCAGCGATCAGTAGCTGGTCTGAGAGGATGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCGGCAGTGGGGAATTTTCCGCAATGGGCGAAAGCCTGACGGAGCAATACCGCGTGAGAGAAGAAGGCTCTTGGGTTGTAAACCTCTTTTCTTAGGGAAGAACAAAATGACGGTACCTAAGGAATCAGCATCGGCTAACTCCGTG\n>URS00019E5825 rRNA from 1 species 
\nTGATGCAGCGACGCCGCGTGAGGGATGACGGCCTTCGGGTTGTAAACCTCTTTCAGCAGGGAAGAAGCGAAAGTGACGGTACCTGCAGAAGAAGCGCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGCGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGCTTGTCACGTCGGGTGTGAAAGCCCGGGGCTTAACCCCGGGTCTGCATTCGATACGGGCTAGCTAGAGTGTGGTAGGGGAGATCGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGATCTCTGGGCCATTACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGGTGGGAACTAGGTGTTGGCGACATTCCACGTCGTCGGTGCCGCAGCTAACGCATTAAGTTCCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCAGCGGAGCATGTGGCTTAATTCGACGCAACGCGAAGAACCTTACCAAGGCTTGACATACACCGGAAAGCATCAGAGATGGTGCCCCCCTTGTGGTCGGTGTACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTCTGTGTTGCCAGCATGCCCTTCGGGGTGATGGGGACTCACAGGAGACCGCCGGGGTCAACTCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGCCCCTTATGTCTTGGGCTGCACACGTGCTACAATGGCCGGTACAAAGAGCTGCGATACCGTGAGGTGGAGCGAATCTCAAAAAGCCGGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCCCA\n>URS0000291A32 rRNA from 1 species \nGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATGACGGCCTTCGGGTTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTGATACGTAGGGTGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGGGCTCGTAGGTGGTTGATCGCGTCGGAAGTGTAATCTTGGGGCTTAACCCTGAGCGTGCTTTCGATACGGGTTGACTTGAGGAAGGTAGGGGGAGAATGGAATTCCTGGTGGAGCGGTGGAATGCGCAGATATCAGGAGGAACACCAGTGGCGAAGGCGGTTCTCTGGGCCTTTCCTGACCCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGCTTAGATACCCTGGTAGTCCACGCTGTAAACGGTGGGTACTAGGTGTGGGGTCCATTCCACGGGTTCCGTGCCGTAGCTAACGCTTTAAGTACCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGCCCCGCACAAGCGGCGGAGCATGCGGATTAATTCGATGCAACGCGTAGAACCTTACCTGGGTTTGACATGGATCGGGAGTGCTCAGAGATGGGTGTGCCTCTTTTGGGGTCGGTTCACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATG
TTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTCACTGTTGCCAGCACGTTATGGTGGGGACTCAGTGGAGACCGCCGGGGTCAACTCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGTCCAGGGCTTCACGCATGCTACAATGGCTGGTACAGAGAGTGGCGAGCCTGTGAGGGTGAGCGAATCTCGGAAAGCCGGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCTCATGAAGTCGGAGTCGCTAGTAATCGCAGATCAGCAACGCTGCGGTGAATACGTTCCCGGGGCTTGTACACACCGCCCGTCAAGTCATGAAAGTTGGTAACACCCGAAGCCGGTGGCCTAACCGTTGTGGGGGAGCCGTCGAAGGTGGGACTGGTGATTAGGACTAAGA\n>URS0000A4E5B4 misc_RNA from 1 species \nGTACCCTCCAGCCCTGCTGGGTGTTGGGCGTTTTGTTCCGCCGCGCGCGTGAACTCGCCTCAAATACATTGGCAGCCAGCCGTCCCGCGTGGGAGCGCAGCACATTTTGCGCTCTCCGCTGGGTGCGGCGGCGTCCACAAGCCTAATTTTTTACGC\n>URS00007CA1EC rRNA from 1 species \nTGGAATACAGCGTCATAGTGGTGAGAACCCAGTATATGATGTGGATGCCTAGTGCTTTGTGATACATTTTCAAAGAGTCGAGTTGTTTGGGAATGCAGCTCAAAATGGGTGGTAAATTCCATCTAAAGCTAAATATTGGCGAGAGACCGATAGCGAACAAGTRCCGTGAGGGAAAGATGAAAAGCACTTTRGAAAGAGAGTTAACAGTACGTGAAATTGTTGAAAGGGAAACGCTTGAAGTCAGACTTGCTTTTGAGTTTACTTGATGGCAGGCTAGCATCAGTTTCTGASAGTAGAAAAGGGTATTGAGAAGGTMGCAGCTTAGGTTGTGTTATAGCTCTTTACTGGATGTGCTCTTGGGGACTGAGGAACGCAACACGCTTTGTGCAATGTCTTCGGGCATTTCGTGTTAAGGATGCTAGTTAATGGCTTTAAACGACCCGTCTTGAAACACG\n>URS0000B0FA7A rRNA from 1 species \nTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGAGTGAAGAAGGCCTTAGGGTTGTAAAACTCTTTCACCGGGGAAGATAATGACGGTACCGGAGAAGAAGCCCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGGGCTAGCGATGTTCTGAATTACTGGGCGTAAAGCGCGCGTAGGCGGCTTGGTAAGTTGGAGGTGAAATCCCGAAGCTCAACTTCGGAACTGCCTTAAAAACTGCTTGGCTAGAGGCAAGGAGAGGAGAGCGGAATACCCAGTGTATAGGTGAAATTCGTAGATATTGGGTGTAACACCGGTGGCGAAGGCGGCTCTCTGGCCTTGATCTGACGCTAAGGCGCGAAAGCGTGGGGCGCAAACAGGATTAGATACCCCCGTAGTCC\n>URS00001D86A5 rRNA from 1 species 
\nGGGTCGATACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTNCACGCCCTAAACGATNTCAACTAGGTGTTGGTAGGGTAAAACCTATTAGTACCGTAGCTAACGCGTGAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGATGATGTGGATTAATTCGATGCAACGCGAAAAACCTTACCTACCCTTGACATGTCCAGAATCCCTGAGAGATTGGGGAGTGCCTTCGGGAACTGGAACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCATTAATTGCCATCATTCAGTTGGGCACTTTAATGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGGGTAGGGCTTCACACGTCATACAATGGTCGGTACAAAGGGTTGCCAAACCGCGAGGTGGAGCTAATCTCAGAAAGCCGATCGTAGTCCGGATCGTAGTCTGCAACTCGACTACGTGAAGTCGGAATCGCTAGTAATCGTGGATCAGCATGTCACGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTTCACCAGAAGTAGGTAGCCTAACCGCAAGGAGGGCGCTTACCACGGTGGGGTTCATGACTGGGGTG\n>URS000235E350 lncRNA from 1 species \nGCTTAGTTTGCTAAATAAATAAATAAATGAAGTTTGCTATGAACCCTCATGATAAGCTCTCACATAAAAATGATGAATAGTTGCTCTGCCATTACTAGTTCTCAAAATTGAAATCTCTCTCAAGTTTAGGCATGACTGTTATGAATTAAGATTTGCTCTAAAACTGAACTTGTGGGAAGAGTACTTGATCAAAAGTCTATGTCGTTAACGGATACGATATGGGAAGGTTGAGCTGCTATTTATCTGTTCCTAGAGATGCTAGAATTCTAGAGAATTTTATCTTTGAAAATCTTTAAAATATTGCATGATGAGTTCCTGTATGATGAGTGTTTAAAATCCTACCACAGCCATATATACATGCTTATTAGACTATGAACCATACATTTACTTTTTACTACTTATGAGCATTGAGTGTGGTGAAGTTGTGTAGACCCTTAGGAGCTTGTCATGTGGTTAAAATCAAGATTCACTTGCACATTCACTCATACATGCTGCTTCTACTTCAGAAGTACGCATCTACATACATCCATTCATTTCCATCTCCAGATTCACCCAAAATTATTCAACTCCTATTCAGGAGAGAATAGCCAAAAACATTATCCTATCCCTGTAATTCCCCGTGAAATAAATGCTCTTGATATTTTGGTTACTACCAATTGCTACATTATTCTAGGAGGGTGAGTGCTCTGAAAAAAAGTGAATACGAGGAAATAAAAAGGGACAAGTGCCCGAAACCTCGAAGAAAAGAAAAAGTGAGACGAGAGGTAAAAATGGACAAGTGTCCGACAGTAGAATTAGGGGTACAAGATACCCACCTGAGAGAAAAGAAAAAAAGAGAAAATATAGAGCATCTCATTCCCCTAAAAAAAGCTTCAAAGTGCAAGAAAGGTATGTATCCCCTCAAAAGAGCAACAGTAGAATTAGACTTTCACCATTATCACCATCATCACCATACACCATTCATGCGCCACACATGCACATCTTGATTTGACTTATTGACTTGTTTCTTTGGATCCATGGTTTGACTATGCAATAAATGACTTGTAAGTATGTATTAGCTGTCTCCCACCTATGAGCTCCAGATATCAAAACCTTGTTAGAGTAGGGTGAGAGAGAGGGCAATATCATTATGCCTCATACCACAAATAACACATACTTTGAGAGAAGGCATATATCATCACTGCGTTGGTAAGGATCTAGAAATAC
CACAAAAGAGAGACTAGAGAGAGTCATACAAGGAATCTCTGAGTTTTATTTGAAAATTTGCAAAAACTCCAGAGCTATAGTTGATGAAAGAACAAGAGACATGGTGCTTGACTTGACCGTTCTATCTTTTAACTGCTCAAGACACAAGTGACGGTTGCAAGCCCCATGGTGGAAGGTAATATGAGTAATTTTAAATCTTAACAGTTTACCTTAACCCAGAGATGAGATTTTGTTTGAACGCATGTGTACCTTTAAGGCATAAAACCACTGAAGAAACTATTGAGTCCATCCTTGCTCAGGGACGAGCAAGAGGTATGCTTGAGGGAGTTGTTGACGGTCCTTAAGTACTAAATATAACGATCAAATAAATAAAGAAAAGGATCCAAATGCAACGAACACCCAGACTTAGGGTTTTATCTGACAGAATTCCATGAGTTTTGGTGTTTGTCTATTTCTGCAGGGGGTTATCAGGAAATATGGAGGAAAGGCCCACATGTCGGGTTTACATAGAGATATGAACGTACCGTGCAAATTTTTATCATCTAGAAGACTCTAGAAGCCACGGGAACGAACGGGAGGCCAAGCGGGCTCGGGGGTAGGGCGCCCGCCCTCCCCCCTTCGGCGCCCGCCCTATCCCACAGTCCAATCAGGACTCGCTTCGGGGATTATGCTCCACCGAGCTAAAGGATCAAGAATAACCGTTCAATCAACGTCGGTTTGATCCGACGGCCCAGATTCACTTGAGGGGACTATATAAGCAGACCCCTAGCCTCTGGAGGAGGCACCCCTTGATCCCTATTCATTATTCATAGATAGAGCAAAAGCTAGGGTTTGGAGATGAGAGCTCTCCTCTCATCTCTAAACTAGAGTAGATCTAGATAGTAGCGAGACGGAGAGCGAGGGAGGATTGGAGGAGAGGCCGGCCTGTCGATTCTTCCTCCGGTTGTACTTCGCCATGATCAAGCTCTAATCAAGCTTCCTCATGGGATGACTCTGGTAATCTACTTCTAATTCACTATGCAATTACTATTCATGTATGTTCTGGTTCACAACTCTTTTGTGTACTTCTAATCTCTAGGACCCTATAGGTTAGAGTTGTAGTATAGGTGTAAGCATGGTGCTTAGACCTAGATTACTTGTGAATATCCCCTGTCTAGCTGGATCGTGTGGTAGGCCGCGTAGGTGACAGTTACGTTGGTCCCCTGTAGTAAACCTCCTGTTAGCAGGACAGGTAGGGTTTATCGGCCTATGGATAAGCATCCTTTGTGGTGTATTCTTATCACGTAGTTCATCCCAGACATAGACATACCCCTTTGAAGTAGAAAAACCATAGTTATCATCTCTATTCTGCAACCATCGCCCATATACTAGAATGCTCTACTCTCTATTCCCATATTATCACCCATTGTTATCTTACCTTTAATATTGTTCTTATTCAATTCTACCATCTTTCCTATTTACACTTATCTATCTATCTTGGTTAAGTTAGAGCGTAGTTGGTTCTCCCGTTTCCCTGTGGATACGATAAAACCTTTAACCGGGTAAAAGCTACAACGGTATCCATGCGCTTGCAGATTTATCTGTGTCCGTATAAATACCATAGTACACTCTAGTGTCATGCTGGGGATGACAACCTAGTATTCAAGTGGTGTTAGCAAGTGTCAACAGTCGTCGGATGATGATCAAAGGGCTTAGGATTGGGTGGAGAGGTATTTCTAGTATTTGACTTCTGGCTAAGCTATCCTAAGTATATTTGAGAGTTAACTCCCTTCCTACTGTGGCCGATAGGTGAAAAGGGTGTGGCGAAACACTTCCCTAGGCAGCTACCATGCAAGCCAACTATTATTTGCAACTTGCCTAACAACACACTAAAGAGAACTCCTAATGTCCAGTAGAGGAATGTTATGCTTCGCTGCTGGTGTTCTTCAGGTGCGACAAGAAGTCCACAAGGGCAGACAAAGTCTAGACACCATGTCTACACTAATTCTACTACTCTAGAC
CCAGCTAAGGTTTCGAGCACTTCACACAAGGCAAAGCAATGTGCCAGATAGGCCGGTTGTATACTTAAAATAAACTAAGATAGAAAGTAAATACTGGAAATACTCAGATGAAAGGAAACTAGAAGGAAGACTTACTAGAAGACAAGCATCCGCTGAGGCACTCCTAGAAGAAGACTCCCGACAAGTCGGTGTTGACACTTGCTAACACCACTTGAATACTAGGTTGTCATCCCCAGCATGGCACTAGAGTGTACTATGGTATTTATACGCACACAGATAATCCGCAAGCGCACGGATACCGTTGAAGCTTTTACCCGGTTAAAGGTTTTATCGTATCCACAAGGAAACGGGAGAACCAACTACGCTCTAACTTAACCTAGATAGATAGATAGGTGTAAATAGGAAAGATGGTAGAATCGAATAAGAACAATATTAAAGGTAAGATAACAGTGAGTGATAATATGGGAATAGAGAATAGAGCAATTCTAGTATATGGGCGATGGTAGCAGAATAGAGAGAATAACTAAGGTTTCTCTACTTCAAAGGGGTATGTCTATGTCTGGGACGAACCACGTGATAAGAGTACACCACAAAGGATGCTTATCCTTAGGCTGATAAACCCTACCCATGCTGCTAACAAGAGGTGGACTACAGAGGACCAACGTAACCGTCACCTACGCGGCCTACCACACGATCCAGCTAGATAGGGGATATCCACAAGTAATCTAGGTCTAAGTGCCACGCTTACACCTATACTACAACTCTCACCTATAGCGTCCTATAGATTAAAGTACTCAAAAGAGTTGTGAACCAGAACATACATAATTAATAATTGCATAATGAATTAGAAGTAGATTACCAGAGTCATCCCATGAGCAAGCTTGATTAGAGCTTGATAATGACGAAGTACAACCGGAGGAAGAACCGACAGGCCGGCCTCTCCTCTAATCCTCCTTCGTTCTCCATCTTGCTATTATCTAGATCTACTCTAGTTTAGAGAAGAGAGGAGAGCTCTCCTCACTAAACCCTAGCTTTTGCTCTGTCTATGAATAATGAATAATGATCAAGGGGTGCGTCCTCTAGGGGCCAGGGTGTCTGGTTATATAGTCTTTTCAGATGAATCTGGGTCGTCGGATCAAACCGACATTGATCGTGTGGTTTTCCTTGAAGTATTAGGTCGGTGGAGCATGATCCACGAAGTTGAAGCTGATTGGTTACTGTAGCTGGGCGGGCACCCATGGGACTTGGGCGGGCGCCCTGCCCCCGGGCCCGATCGGCCTCCCGTTCGTTCCCGTGGCTTCTGGAGTCTTCTAGATGGTAGAAAATTGCGCGGCACGTTAATATCTCTATGTAAACCCGATGTGTGGGTCTTTCTTTCATATTTCCTGATAACCCCCTACAGAAATAGACAAACACCAAAACTCGTGGAATTCTGTCAGATAAAACCCTAAGTCTAGATGTTGATTTCATTTGGATCCTTTTCTTTGTTTATTTGATAATTAAATTTGATACTTAAGGACCGTCAACAAACTCCCCCAAGCTTACCTCTTGCTCGTCCATGAGCAAGGATAGACTCAGCAATGGATCAGAAGTTGTTGCAATATCTTAAAATTTTGATGGTACACATGCTTTTAAATAAGATCTCATCTCTGAGTTAGAGTAAACTGTCAAGAACTAAAACTTACTTACTTTACCTTTCACCATGGGACTTGTAACCATCACTTCTGTCTTGAGTAGTTAAAAGATAGAACAGTCTAGCCAAGTGCCATATCTCTTATTCTTGATCAGCTATAGCTCTGGAGTTTTTGCAGATTTTCAAATAAAACTCAGAGATTCCTTGTATGACTCTCTAAATCTCTCTTTTGTGGTATTTCTGGATCCTTACCAAGGCAGCGATGGTATATGCCTTCTCTCAAGATATGTGGTAGTTGTGGTATAAGGCATAGTGACATTTCCTTCTCTCTCACCCTACTCTAATAAGGCTTTAATATCTGGAGCTC
ATAGGTGGGAGATAAAGTATACATACTTACAAGACATTTATTGTATAGTTAAACCATGGATCCAAAGAAACAAATCAATAAGCCAAATCAAGATGTGCATGTGTGGCGAATGAATGGTGTATGGTGATGATGGTGATAACAATGGTGAAAGTCTAATTCTACTTTTGCTCTTTTGAGGGGATATATACCTTCTTTGCTTTTTGAAACTTTATGAGGAGAATGAGATGTTCTATCTTCCATTTTTCTTTCCTCTCAGGTGCGTATCCTGTACCCCTAATTCTACTGTCGGACACTTGTCCATTTTTACCTCTCGTCTCACTCTTTTTCTTTTCTTTCGAGGTTCCGGGCACTTGCCCCTTTTTATTTCCTCGTTTATTTATTTTTTTTTCTTTTCTTCTCTTTTCTTTTTTTTCAGAGCACTCATCTCTTGAGATAATATAGCAAGTGGTAGTAGCAAGATAACTTGAGCATTTATTTCACAAGGGAAAACAGAAATATTTTTGGCTATTCTCTCCCGGATTAGGAGTAGAATATTTTTGGGTGGTTCTGGAGATGGACATGGATGGATATATGTGGATGGTACTTTCAGAGTAGAAGTAGCATATATGAGTGAATGTGCAAGTGAAATCTTGATTTAACCACATGACATGCTCCTAAGGGTCTACACAGCTTGACCACACTCAATGCTCATAAGCAGTAAATAGTAAATGTGTGGCTCAAAGTCTAGCAAGCATGTATATATGGCTGTGGTAGGAATTTAAACTTTCATCATACCGGAACTCATCATGCAATATTTTAATGATTTTTCAAAGATAAAATTCTCCAGAATTTTAGCATATCTAGGAACAGATAAACAGCAGCTCAACCTTCCCATATCATATCCGTTAACAACTTAGATTTCAGATCAAGTTTTTATCCCACAAGTTTAGATCTAGAGCAAGCTTTAAATTATAACAGTTATGTCTAAACTTGAGAGAGAACTTCAAATTTACAAATTAGGCAGAGCAACTATTCATCATATCCATGCTAGAGTTTTATTATTAAGATTCAGATTAGCATAGCCACTTTATTTATTTATTAAACACACTAAGCAAAAGATATATATAAGCACAAAATCTTTATTTGGTTTTTCATAGTTTATGTATTTTAATATTCTAATATAATATAAGTATAAAGATAGTTAGAAATACTTAGCGAGATAAATGGGGGTGCTCTTCCCCAAGCTGAATTTTGACGTAATTTCTCTTGATGTAGCTAGCAGGTGGCAGAGGTGTATTTGAAAGTCAGTAGCATTCTGACAGCGATTAGAATGTCCTCCGTCTGCTAGTCTTCTTGATTCTTAAATTCTGTGGAGCTCAAATAGACAACAAAGCTTGTGGAACTAATTAAGTGTTAGCATAAATATCTAGCCTTCATCATGTTGAGCTTCGTCAATAAATATTACTCCCTGTTTTTATATTTTTATTTTATAAAGCAGAAAAGAAATATTTATTTTATTTTTATGCCACCACAGTGAAGGTACTTATGGGTTTTATGCCACTCGTATACTCACATGGGGCTTAGTATTTTTTAATATTTTTATTTTCTTTTCAAGATAGCATGATTAACTAATAATCTATTTAAGGAAAGTAAATAATTAAAGGGAAAAGGGAATGCAGAAAGGATAAATATGGATAACTACCGATCTTACCTTTCGGCGAGGGTTCAATGTTTTAAGTCTTCTTAACAAGACTTCTCACCGTGTTCATTCTTCAGGTGCGTCATTTGATTCAGGTGCGGACCTTGACGTCTGCACCTCTTCGTTTGCCCAGCAGTGGCGTTGGCAGTATCCTGCTCAGTGTGTTTGTGCTCGTAGATCCAGGTCCTTCACTTGGTAGAGTTTGAGAGTTACAAAACTTCTCTGTGTTTTGTTCAAAGTATACCTGCTCATAGAGACAAGGCAGAGATCATGTGCATGGGTCCTGTTGGTGGAAAACACCAACAGAACCTAAAGTGTATTT
GTTCTTCTCTAACCCTAAGCATAGTGAGCAAGACAAAGTTGATGGATGAAAAGTTCATGAGTGTAGCACTTATAACATTTGTCAGATCAGATCGCTCAACCTTATGGAAAGATAATCTATCTATGTATAATGCTTTTTCTTTATATCTTCTCAAAGATTGAATGTATAACATTTTAGCTCATATGATTAGGAGTGTGGGATCATGGAGGTAGTACTAAGAACAAGGATTAAAGGACTAAACATGTTGAATCAGTTGGGTTGGTTAATATAGAGTTGTAAATCATACATGTTTGTCTCTTTTATTTATATGAACGCTAGAACCAAGGAGAAGCTTATAAAAGTGATAGTCAAGTACCTTAAGATGTTACCTTGCTTGAAGAGTGATGGTACAATATCACCTTGTGGAAGCTTTCCTTTCTTAGCGGTTGTGCATCGTGTTTGTGGCACCCTCCGTGGATCATCTCTCTATGATGAATGAGCTATGTCCTTCTTGTGCAAATTGTTAAACTTCATGTGTCACTCTCTTCGTCTCTGATGTGAGTTTATCTCAGGACTTCCCAAATCGATATTGAAAGTTTTTCTGCAGGGGTTAGTCCGACAAAAATATACCAATGTCTACACAAGCAGTTTTTAGTTCAATAACCGAACTAGACTCCATGTCTAATCAGATTAAGGAAGGCTGTTTAACTTAAGCACCATGCTTAATTTAAAAGCCAATAGAAGTATGTGTAGTACTTCCAAACTAACACTTACTAGGATAAACAAAGGTAGCGTGATGGCATTTATAGAGATCTACTCGAGTGGAGACGAAGTAGTGTGATTAGTATTTAACAAATTGAGCATGTCTTAAAGGTAGGGACAACCAACATAGCAACATGGCAAAGAATGTTTTTATGTAAAGTACTCCCCTAAGCTTGATTTTTGCAGAATTCAAGTTTGGATGAATTTAATTCAGTGTTGCATGATGATTGGTTGGACATACCTTGTACTTGCTTGTCATTCATCTGATCTTCTTGTTCCAATCCTGAAAAGGTTAGTGACAAGAATACCTGAAGGAATATTTTTACAATTATCCTTATATGCTCAATACACAAGGTAATGTTGCAAATAATTAAAAACTCATGTTACGATCTGATCAGTGCTTATTTTAGGACACTGAGCTTGTCCTTGGGAAACCATCAATTTATGTCGGCGAAGTGGTTTCCCTTCCAACGCTGACCTAAATCAAGATCAACTCAACGCGATCTGCAATATTTATTATAGACATATGCATCGACAACCACCCTTTTAAAGTTTTTATAAATAGAAAGGAAGAGGGGGTTGGAGATCTCAAATGTGGTGATGTTAGAGAGACCAATAGATTGGGAAGATGTTACATATGAGCATGGAGTAAACAAAGTGGCTATGAAATAAATTCCATGCTCATTAATGTTATCTTCGTCTCCAATCTGAATGTTCAGAGTTCCTCTTGGATTGGTCTAACTTATGTCCTCTTCTATAGTTGGATGAATCCCATCTTCAAAGGGAGTCAAGAACTCACCATTTGAAATTGAACCAAAGTCAGAATTCATTAAGGCTTCTTCCTTATCCATCCATTCTACACATTCTAGCCATTTAGAACTTGTGATCAGGAAAGGGGAGGTGTTAGAATTTTCTATATGGCTTAGCTCTCCTTCACTTGATATGTCATCCTTGACTTCTTCATAACAGGAACCAGGACATTCTCTAAGGATATGTCATCCTCGACTTCTTCATAACAGGAACCAGGATATTCTCTAAGAGAACCATTATTGCAAGGATTTGAATTATCCCTACTTGAAGGTCTCTTATGGAACCAGAAGTCTAAACCATCAGCATCTGAAAGATTTAAGGTCGGAATTCCTTCCTCCCTTCGACAATTTTGGGGTATTGATGGTTTAGGATTGATAGCTAAAGTTTGGAATTGAAGTGGTTGTGATCTGGCTATCGAAACTTCTTCTTCTTGTCTAGGAACTGGTTCT
GTCTCTTTCTCAGGGATATAAAAGCTAGGAGACTTTCCACTTAATAAATCAATCAAATTCCAAGCTTCACTAGCAGGTAGGTGATAGAAGGATCCTCTAGAGGCTGTATTCAAGGTTTGCTTATCTTCCCTACTAAGGCCCTCAAAAAAGTGAATTAGAAGAACTTCTTCTGGAATAGAAAGCTTTGGGCCAGTGAGAGTAAGGTTAATAAAGCGGTCCCATGATTTGCCAAGAGATTCTTCTTCCAGTTGTCTAAAAGAAATAATCTCACGCCGAAGTTCCGCCACTTTGGAGATTGGAAAATACTTAGAAATAAAACTACTATATAACTCCTTCCAATCTCCATGAACACTCCCTATTTTGAGTTTGTACCAATGTCTAGCTTTTCCCGTTAAAGAGAACGGAAAGAGCTTCCATTTGAGGGTCTCATCGGACATTCCTTCTATGCGAAGGAGGTCACAGACTCGATAAAACTCTCTTAGGTGTGTCTATGGGTTTAGACAGAGCAAAAGCTAGGGTTTAGAGATGAGAGCTCTCCTCTCTTCTCTAAACTAGAGTAGATCTAGATAGTAGCGAGATGGAGAGCGAGGGAGGATGGGAGGAGAGGCCGGCCTGTCGGTTCTTCCTCCAGTTGTACTTCGCCATGATCAAGCTCTAATCAAGCTTGCTCATGGGATGACTCTGGTAATCTAATTCTAATTCATTATACAATTACTAATCCTGTATGTTCTGGTTCACAATTCTTTTGAGTACTTTAATCTATAGGACGCTATAGGTGAGAGTTGTAGTATAGGTGTAAGCGTGGTGCTTAGACCTAGATTACTTGTGGATATCCCCTCTCTAGCTAGATCTTGTGGTAGGCCGCGTAGGTGACAGTTACGTTGGTCCCCTGTAGTCCACCTCTTGTTAGTAGGACGGGTAGGGTTTATCGGCCTATGGATAAGCATCCTTTGTGGTGTATTCTTATCACGTGGTTCATCCCAGACATAGACATACCTTTTTGAAGTAGACAAACCATAGTTATCCTCTCTATTCTCCTACCATCGCTCGTATACTAGATTGCTCAATTCTCTATTCCCCTATTATTACACATTGTTATCTTATCTTTAATATTGCTCTTATTCAATTCTACCATCTTTCCTATTTACACTTATCTATCTATCTTGGTTAAGTTAGAGCATAGTTGGTTCACCAGTTTCCTTGTGGATACGATAAAACCTTTAACCGGGAAAAAGCTACAATGGTATCCGTGCGCTTGCGAATTTATCTGTGTGCATATAAATACCATAGTACACTCTAGTGCCATGTTGGGGATGACAACCTAGTATTCAAGTGGTGTTAGCAAGTGTCAACAAGCATTTTTGGCACCGTTGCCGGGGAGACGGTTGCTGAGTTGACTACGAACTAGCTTAATCATTTTATAAAAAAATAATAAAAAAATATATATTTTCCTTTTATCCTTTGCCTCATCTCTGCTATTCTTTCTTCTTATCTAATCCTTGATTTCTGGTCTATCATGAATGCAAACATGTCTATCTATGAATTTCATAGACCTACGGGCACACATCTCGAACCACCAAAATCTTCAAAGCCTATCATAGCATCTAGTTTTGAGATAGACCCCGAATACATAGAATTTGTTCAAAAACAACCTTTCTCAGGAGAAGGTGAGGAAAACCCATACACACACCTAAGAGAGTTTTATAGAGTCTGTGACCTGCTTCGCATAGAAGGCATGTCCGATGAGACCCTTAAATGGAAGCTCTTTCCGTTCTCTTTAATAGGAAAAGCTAGACATTGGTATAAACTCAAAGTAGGGAGTGTTCATGGAGATTGGAAGGAGTTACATAATAGTTTTCTTTTAAAATATTTTCCAATCTCTAAAGTGGTGGAACTTCGGCGTGAGATTATTTCTTTTAGACAACTGGAAGAAGAATCTCTTGGCAAATCATGGGACCGCTTTGTTAACCTTACTCTCACAGGCCCAAAGCTTTCTATTC
CACAAGAAGTTCTTCTAATTAACTTTTTTGAGGGCCTTAGTATGGAAAATAAGCAAACATTGAATACAGCCTTCGGAGGATCTTTCCACCACCCATCCGCTAGTGAAGCTTGGAATTTGATTGATTTAATGAGCGGAAAGTCTCCTAGCTTTTTTATCCTTGAGAAAGAGAAAGAACCAGTTCCTAGAAAAGAAACAGAAGTTTCAATAGCCAGATCACAACCACTTCAATTCCAAACTTTAGCTATCGATCCTAAACCATCAATACCCCAAAATTCTCCAAGGGAGGAAGGAATTCCGACCTTAAATCTTTCAGATACTGAGGGTTTAGACTTCTGGTTCCATAAGAGACCTTCAAGCAGGGATAATTCAAATCCTTGCAATAATGTTCCTCTTAGAGAATGTCATGGTTCCTTTTATGAAGAAGTCGAGGATGACATATCAAGTGAAGGAGAGCTAAGCCATATAGAAAATTCTATCAGCTCCCCTTTCCTGATCACAAGTACCAAATGGCTAGAATGTGTAGAATGGATGGATAAGGAAGAAGCCTTAATGGATTCTGAGTTTGGCTCAATTTCAAATGGTGAGTTCTTGACTCCCTTTGAAGATGAGATTCATCCAACTACAGAAGAGGACATAGGTGAGACCAATCCAGGAGAAACTCCGAACATTCAGATTGGAGACGAAGATAACATTAATGAGCATGAAATTTATTTCATAGCCACTTTTTTTACTCCATGCTCATATGTAACATCTTCCCAATCTATTGGTCTCTCCAACATCACCACATTTGAGATCTCCGACCCCCTCTTCCTTTCTATTTATTAAAACTTTAAAGGGCGGTTGTCGATGCATATGTCTTTAATAAGTATTGCAGATCTCGTTGAGTTGATCTTGATATAGGTCAGCGATGGAAGGGAAACATTTGCCGACATAAATTGATGGTTTCCCAAGGACAAGGTGTTGGGTATTCTTAACATCACTACCAAAAGTAGACAGCTTTCTAATTCTAGTAACGGTGCCAAAAATGCCAAACCTATCCCTCATACCACTTAAGCCAAGTTATGATCCCCAGCATGACATGAGAGACGCGGTATTGAAATATGCAATTGCTCTTCTAAATATATAATGAATGGAGTCTGCAAGCGCACAGATTAATACCGATGTAGCATTTTAACCGGGAAGTATTCCAGGTATCGTTATTTATATTTTTACCACTGGGAAGGGATTAACAATCATCAATATTGATTACAGAATAGAATATGAGATTGAGTATCTATCATTGCATGTATAATTGAGAACATTGTATCTAATTCTTTCATATAGGGGTAAGTGTCACATAAAAGATATATGAAATAATGAATAGTGACAAAGGTAATTAGTCTGATCATAACTTCGCCACATATATATATGATAAGCACCTCAATTAGATACTCTAGAAAGTCATTAGCATGGTATTAGAACGAACTACAAGAATATTTCCTAAGTTATTCTCAACTATATAGTCTAGCATTATCATAGTTAGTGCAAGCATACTTAGCAATCATTGTGAGACAAGACTACGCCCATGCATAGTGATATTAGCAAGGTAAATGAGAAACATAGCAATCACTCCCCTGTAATAATGTTGCTCTGCTAGCCCGATACACGAGAGGGGGACTATATAAGAATCAATGAAGCTGTCACTATCACGAACTACCCCACGATCTGGCATATTGGGTACAATCACAGATAAATACGGTATAAGCACCACGCCTACACAATATCTATCATTTACCCATGGATCTGATGGATAAACGCTATACAATCCTAAACATGTATATAGATCCAATCTGTCGAGGGTATCAGTAAGGGGTACCCTCACCGATGCACATAACGAGACTACCCGTACGCAGGTCGAGGCCCTCAACTCGATGCCCTGGTCATACATATGCGCGGTCGTCGACGACCGCAGCCTCGAAGACGGAAATAGCGTCGAGCGAATCGATCAGGGTCGAGCGC
CAGCTACCGTCGAATACGGAAACGGGCTCGCACGAACCAGGAGGCGTCGAGCGCAAGGACGCCGCCCGCCGCCTGACGCGTGCACGAGAGCCAGGGCATTTAATGCGCCTGTCGCTTTCCCACCTAATACGCTGGTCACGGGAAGCGTGATAGGGAACAGGCACCCGTCCCGTCGTTCTTTTTGCAGCCTTCTCCACCAAACGACCCACAGCATGTCAGGACGCGGGAAGCAGGGATGGAACGTCTAATGAGGACCCCCTCGAGGTAGCCAAGGTCAGCGCTCTGGATATCAGGGCATTGCACGGCATCCGACCCTCGATCAGACATGGTTCCTTCTTGGAGACGAGGTGGGCGTCGACTGACAACATCGCAACCACTCCGCCGGATCTGCCGCCATACCGTACAAGCGTGCGACCGGTGAACCAGCCCAAGACGGCGCGCAGAGCAGGATACAGGGGCACGCGTAATCGTCATCGAGCTACCAAGATGGGATGGCTCGAGACCACGCCAGTACGGAGGCCTCGAGTAGGTCAGCGCGCCATGCTTCTATCGACCCCTACTCTGACACCTATACATGTACCCTAGGTCTCTCCTTGGAGCTATAAAAGGAAGGACCCGCGAGTAGATAGACACACGCAACACTACACCCATACGCAGTAGAACTCCCATACTCCATACCACGCTTGTATTCGCCCCTGTACAAGCACTTAGGTGCAAGATAATACAAACTTCCCTCCCCCGCTGAACGTAGGGCCTTCTCTTGCCCGAACCAGGATAAATCTTTGTGTCTTCTTGCATCACCATCTGGGAAAGGGAGCACGCATACAAATTTACTCGTTGGTGTGACCCCCGTGGCGAAAACACCGACAGTTGGCGTGCCAGGTAGGGGTCCTGCGTGTTTTTTCATCGATTTCCCATTCCTTTCCAGATGGCCACTCTCGCCTCGCCGATTCCGCGCTCCACGGTGATTTGGTTTGGGAGTCTCGAGTTCATGTCTACTGGCTCCGGCTATGACATGATCTTGCTCTCGATCAAAGGACCGGGAGGAGCTCGCGTTGCGCCAGCACGGTTGAGGGCCCCGAGATGCCCTCGCCACCACGCCTCCCCGCCCAAGAAGAGGCGTGGACAGCACCATCGTCGCCCCTCTGCCTCGTCACGACCTGCAGTTTGTGCTAGGCAGGAGGTGACACAGGAGCCGGCAGCCCCGCGTGCCGGAGCCATGGACGTGCCGGCTCAGTGTCACATGACGACAAGAGGAGACGCACCTACCGCCAGGCTACTTCCACACGGGTTGTTCACTCCAAGAAGGGCACTGCCATTCGGATTGGACAACGTCGCGGCATCGCTAGCCAGAGCGATATGCCCAAACGCCCAGACGTACGTGGAGAGACCAATGGTCCTCCCATGTAACTCTAAAGCACAACAACCGACGTCCGAATTGCCAGATTTCTCCTAGGTACGAGGCCTCCGTCGCCTAGGCCCTGGACGGTACACGATCACCTCACTCAGGCAGCGGCTGCTGGAGGAGAGACGTGGATGTTTCTATGCCGCCAAGCCGGACTCCGATTCCAAGACCGATAGCTACGACCCTACTAGGGACTGCTATCACATCGACGGAGCGGTAGAAACTACCGACGAGACGCAGGATGCAGCTGCGGGCGGTCGAGCCCCTGCGGCAAGGGAAGACCCCAGGACGCCTGGGAACGACGGACAGGTCGACCCGCTTCCACAGGAAGACAGGGCTGCGCAGCTCGCGCAGCTACGAGAGCTCAAGACCAAGCTTGACGAGGATCGTGAGCGCCTCGTCTTGCTCGAGCAAATCCTCGAGCAAGACTTGCCTTACCCGCCTAGCGGGAGTGTCCGTAGGCGTGCTCGAGAGGTACACCGGCAAATCATCGGAGACGCGGAGCCAGAGCAACCCGTCAACCGCTTCCCTCGAGCAGGCCAGAATGTAGTGGCAGCAACAATGCTGCTACGCAACATGCCAGAGTCATCGAACT
CCCAAGCTCGACGCATTCGAGACGAGGTGCAGACTTTGCTCCAGGTAGTGGCGGTTCAACAAGCCGAAAGCTCGGCTTCTCTATGACGAGGAGCCGCCACTGAAAAGCGCGATGAGCCACCCCAAAATGAAAAGGAGGTTTCAGTCCATCAACAGCCACCCCCTCGAGGAAGAAAGACCACTCTTGTCCTCCCTGTCGACAATCAGCGTCGACACAACGCGTGGCATGACATCGAAGAGAGTCGACGCCGTCGGTATGGGGACGCGGAAGAGCGTGGTTACAGCGCACATCGCGGTGGGAGGTATGACAGCGACGAGGACCGGATGGCCCCCGAACCACCAGGCCCACGGGTGTTCAGCAGGGCAATCCGCAGCACGCCTACCAGCATCGCAAAATACAATGGTGAGACCAAACCAGAGTTGTGGCTGGCCAATTTTAGGCTGGCCTGTCAGCTAGGAGGCGCTCGAGGAGATGATCGAGCTATCATCAGACAGCTACCGCTCTTCCTCTCCGACACCGCCCGTCGATGGCTCGAGGAACTTCTAGCTAATCAGATCCATGACTGGGTCGATTTGGTTAGAGTCTTCGAGGGTAATTTCAAAGGGACCTACATACGGCCCGGGAACTCGTGGGACCTCAGCAAATGCAAGTAGAAGTCAGGAGAAACTCTTCGAGAGTACGCTTGACGCTTCTCAAAACAGCGCACCGAGCTGCCACATATCCCCGACCACGACGTCATCCTGGCATTTGTCTCTGATACCACTAGTCGAGACTTGGTGCGGGAATTAGGTCAAAATGGACCTCAGACCATCGATGAGCTCATGGACGTAGTGGCAAACTACGCAGCAGGAGAGGAAGCAGTCGGTGCCTTCTTTAGTTGTGAAGGAAGGAAAGGCAAGCAGCCTGCCGATGAAGATGGGACCCCCAGTCGAGGGCTCAAGAAGAACAAGAAGAAGCAGAAAGTGCGGCAGTTCAAGTAGGAGAACTTCGACGACGACCTCGTCGCCGCCATGGAGCGGAAGAAACCTCGAGGCCCCCCAGATGGGGGTATCTTCGATAAGATGCTAGAGGAACCATGCCCTTACCATAAAGGAGGAGCCAACCACAAGCTCAAGGACTGTCGTATGCTGAAAAAGCATTTCGACGGCCTAGGGTTCAGAAAGGACGCGCGCGACGACCCAAAGAAGGAGAAGGCGGCGACAAGGAGGGCAACAAGGATGACGATGGTTTCCCTGCCGTCCACAACTGCTACATGATCTATGGTGGGCCCTCAACGCAGTTGACTGATAGGCAGCGCAAGAGGGAACGCCGTGAGGTCTTCGCCGCAAGAATGGCGGTGCCCCAGTACCTCAGCTGGTCGAGCACACCCATCACCTTCGACCGAGAGGATCACCCCGACAAGGTGGTTGCCCCAGGCGTCTACCCGCTCGTCGTCGACCCCATCATTGTCAATACCCGGCTCTCGAAGGTGCTAATGGACGGATGCAGCAGCCTCAACATCATCTATCTCGAGACCCTCGACCTCCTCGGCATCGACAGGGGACGGCTCAAACCAAGCGCTGGCGGTTTCCATGGCGTCGTGCCAGGGAAAAAGGCGCTGCCAGTGGGTCGAATCGACCTACCCGTCTGCTTTGGCACGGCAGCCAACTTCAGGAAGGAGACGCTCACCTTTGAAGTGGTCGGGTTCCGAGGCACGTATCACGCCATCATCGGGCGCCCGGGCTACGCCAAGTTCATGGCCATACCCAACTACACTTACTTGAAGCTGAAAATGCCCGGTCCCAAAGGAGTCATCACCGTCAGCTCCTCCTTCGAGCACGCTTACGAGTGCGACGTCGAGTGCGTCGAGTATGGGGAGGCGGTTGAAAACTCCACCCAGCTCGTCGCAAAGCTCAAGGCCCTGGCCGCTGAGGCTCCAGAGCCCAAACGCCACGCGGGCAGCTTCGAGCCAGCAGAGGGGACCAAGAAGATCCCGCTCGATCCTAACAACTCCGACGGCA
AGGTGCTGACGATCAGCGCCGACCTCGACCCCAAATAGGAAGCTGTGCTTGTCGACTTTCTCCGTGCGAACGCCGACATGTTCGCATGGAGTCCCTCGGACATGCCAGGCATACCGAGGGAAGTCGCCGAGCACTCCTTGGAGATTCGAGCCGGTTCCAAGCCAGTGAAGCAACGGTTGCGCCGATTCGACGAGGAGAAGCGCATGATCATTGGCGAGGAGGTCCACAAGCTTTTGACGGCCGGATTCATCAAGGAGGTTCACCATCCCGACTGGTTAGCAAACCCTGTACTAGTTAAGCAAAAGAATGGGAAAATGAGGATGTGTGTCGATTATACGAGTTTAAATAAAGCATGTCCGAAAGTTCCCTTTCCATTACCATGTATTGATCAAATTGTTGATTATACTGCGGGATGTGAAACCCTTTCTTTTCTTGATGCATTTTCTGGTTACCATCAAATAAAAATGAAAGAGTCCGACCAGCTCGCGACCTCTTTCAAGACACCTTTTGGGATGTATTGCTATGTAACCATGCCGTTTGGGCTTCGAAATGCGGGAGCCACGTACCAACGCTGCATGCTTCACGTATTTGGCAAGCACATAGGGTCGACGTTCGAGGCCTATGTCGACGACATTGTCGTCAAATCAAAGCGGCGAGGAGACTTGATCCAGGACCTTGAGATCGCTTTTAGCTGCTTACGCGTCAACCAGATCAAGCTCAATCCCGAGAAATGCGTTTTCGGCGTGCCTCGAGGCATGCTCTTGGGTTACATTGTTTCCCAGCGGCATCGAGGCCAACCCCGAGAAAGTCTCGGCCATCACAAGAATGGGGCCAATCCGAGACATCAAGGGTGTGCAGAGAGTCACGGGATGCCTAGCGGCGCTGAGCCGTTTCATCTCGAGATTAGGAGAAAAGGCGTTACCACTGTATCGACTTCTAAAGAAGGTCGAGCGTTTTTCTTGGACCCCCGAGGCTGAGGAAGCCCTCGAAAATCTGAAGAGAACGCTGACCTCAGCACCAGTCCTGGTCTCACCTCAACCTGCGGAACCACTGCTCCTTTACGTCGCCTCGACGACCCAGGTTGTCAGTGCGGCGGTGGTGGTCGAAAGGCAGGAGGAGGGGCACGCATTGCCAGTCCAGGGGCCAGTATATTTCGTCAGCGAGGTGCTCTCGGAGACCAAGGCACGTTACCCCCAAATTCAGAAGCTGATCTACACCGTAATCCTCGCCCGCCGTAAGCTGCAGCACTACTTCCTCGGTCACCCCATCACGGTGGTCCCGTCTTTCCCCCTGGGCGAGATAATCCAGAGTAAGGAGGCCACGGGAAGAATAGCTAAATGGTCGGTCGAGCTCATGAGTGAGACTCTCACTTATGCGCCTCGCAAGGCCATCAAATCGCCAGCTCTGGTGGACTTCGTCGCGGAATGGACAGACTCCCAGCTTCCCCCGACCCAGGTCCAGGCGGAGCTGTGGATGATGTATTTCGACGGGTCACTCTTGAAAACAGGGGCCGGGGCCGGCCTGCTGTTCATCTCGCCCTTGGGCATCCATATGAGATACGTCATCAGGATTCACTTTGCCGCATCTAACAATGTCGCAGAGTACGAGGCCCACGTCAACGGTCTCAAGATCGCCATCGAGCTAGGAGTCCGACGCCTCGACGTCCGAGGCGACTCCCAACTCGTCATTGACCAAGTGATGAAGACTTCAAGCTGCCATGACCTGAAAATGGAGGCGTACTGCAAAGAAGTCCGTCGACTCGAGGACAAATTCCATGGCTTTGAGCTCGTCCATGTCGCCCGACGCTACAACGAGGCAGCCGACGAACTCGCCAAGATCGCGTCGACCCAAGGCACGGTGCCACCTGACGCGTTCTCGAGAGATCTTCACGAGCCATCCGTCGACTTGGGCTTGGGGGCTGGCGTCGATGCCGATCCTGCCCAGCCAACCGACATCGTCGACGCACTGTTAATGTCAGCTGAGGCGATGGAGGTAGAACA
GCGGCCCGGTCGACCGTTCGACTGGCGCACACCATTACTCGACTGCCTAATCCGCTGCGAGCTGCCAGAAGATCGATCTGAGGCCCGCCATATCGCTCGAAGAGCCAAGTCATACGTGATTTATGGCGAAGACAATGAGCTATATCGATGAAGCCCGACGGGGATTTTGCAGCGTTGCATCACCGTGGAAGAAGGCCGGAAACTCCTCGAGGATCTGCACTCGGGGGCTTGTGGCCACCATGCTACTCCACGGACCCTTATAGGGAACGCCTTCCGACAAGGCTTCTACTGGCCAACGGCCGAAGCAGATGCCGTCAAGCTCGTACGCTCATGTGATGGTTGCCAGTTCTACGCCAAACAGACGCATCTGCCCGCCCACGCTCTTCAGATGATCCCCATCACATGGCCATTTGCGGTGTGGGGGCTCGACTTAGTAGGGCCCCTACAAAAGGCGAAAGGCTGGTACACCCACTTGCTGGTGGCCACCGACAAATTCTCCAAATGGATCGAGGCTCGACCCATCACCAACATCCGCTCCGAGTAGGCCGTCCTTTTCTTCACCGACATCATCCACCGGTTTGGGATTCCCAACGTCATCATCACCGATAACGGCACTTAGTTCACCGGCAAAAAGTTCTTGAACTTCTACGATCAGCATCACATCCGTGTGAACTGGTCTGCAGTAGCCCACCCTCGAACTAACGGCCAGGTCGAGCGTGCCAACGGCATGATTTTGCAAGGACTCCAGCCAAGGATCTACAATCGCTTGAAGAAATTCGGCAAGAAGTGGGTCGAGGAGCTTTCATCGGTCCTATGGAGCCTGAGGACAACGCCAAGCAGGGCCATAAAATACACCCCATTCTTCATGGTCTACGGCTCAGAGGCTTTCCTCCCCACAGACCTCGAGTATGGGTCTCCTCGACTCAAAGCATACAACGAGTAATCAAATATGGAAACTCAAGAAAACGCGGTCGACCAACTTGAGGAGGCTCGAGACATGGCCCTCCTCAACTCTGCCAGATATCAGTAGAAACTTTGACGCTACCACGACAAGCACGTGCGCAAGAGGGACTTAAACGTGGGCGACCTTGTCCTACGACGGCGGCAAAGCAATCAAGGACGCCACAAGCTGACTCCACCTTGGGAGGGCCCGTACGTGGTAGCCGAGGTCTTGAAGCCAGGGACGTACAAGCTCGCGGACGAAAAGGGGGCGATCTTCACCAACGCGTGGAACATCGAACAGCTACGTCGATTCTACCCCTAGAAGTTCAAAACTTTATGTCCCTATGTACATTCTGTACCAAGGCCTTGTAAATGAATAAATAAAGCCTTTCCCTCAAGCGATTTACTTTCTCACAAATCTCGATGCCAGAAGGGAGTACCAACTATGACCCATCATAGTCAATACCCCCTCGGGGGCTACCAGGGGGGCAACCCCCCCCCCAAGTGTCGAAAAAACCAAGAAATTCTCTCTTCCTTACTTAGTAAACCTTGCACGTTCGAGTAGTTGAGGCGCCTCGAGCCCCTTAAGGGCCGAGGGACAACGAGTCTGAGAACTCCTACGCCCCCGGGCTATGGAAACTCTACACACTTCCTCACCCTCGAGGTGACCGAGGCTGTTTTTAACAAAAGATCGAACAAGGAATACAAACGTAGGCGCAAAGGGAAATAAAAGAACCTCGAGCGGAAAGATAGATAAACATTTAACAGTCACAAAAAGACATTGTACCACTTATAGAGAAGTTAATAGAGTATTATACAAGGGGCCCTAGGCACCCTAAGCAGGCTCGCAGGCCTCAGTCTTCAGCACGATCCTCACCACCCTCGCCTACGCCCGAGCTAGTCTCAGGAGGAAGCACCTCAGGCTCAAATAGCTTGGCCAGCCTCTCTCCAGGAGCCTCCGCGTCGTCGATCAAGGCGTGGAGCCTCTCTTCGTTCTCCGCGTCGGTCTTAGAGATGTCGGTGACGAAGCCGTGGGACACCACCTCCATGTCGTAGGA
GAAGACCGAGCAGACAACCGCCATCGCCCGCTTCACCCCGATGTGGAGGGCATCCCGCACCCGATCTCTCAGCGTCGCGCCTAGGTAGCACAGCTGGTCGACCAGTGCGTCGCCTCGAGCGTCCTCCTTCGACTCGTCCATAGGCTCGACCTCCCAAGAGGTCGAGAGGTCGTTTATCGCCGTCCGCACTCGACGGTTCAAAGCAATCTCCGCCTCAAGCTGGGCCTTAGCACTACGGGCCTCGACTTGGGCGGCCAAGAGTTCGTCCTTAAGCCCTATAAATGCCAATACAAGAAGCTTTAGAAAAAACCAAGCACACCTCGAAAAAGAAATCCGACAAAGGAAACGTACCGCGGACATTCTCCTCCAGGGCCGTGTTCTCGCCGATTAGTCTGGTGTTGGCCCTCTCGATCTCTTTGTTGGAGCGGGCCAGCTCAGTGTTGGCAACGCGGAGATCCTCGATCGCCTGGCCAGCCTGAGCAATGGCCCCACTCTTCTCCAACAGCTCTCCCTTCAGACGTTCGACGTTGTCAGAGAGACTGCGGGATCGAGCCCGCTCCGCCTCGAGGTCTTCGAGGGCCTTCTTCTTTGCGTCCTCGACGACACCTCTAGCGACCTCACTGTCCACATACGCCACCTTCATCTTCTGGAAGGAGTCTCGGAGGGAGTCCAGGTCGGTCTTGAGAAGGCCCTTCTCCTTGTCCAGGTCTGCAATGACGCTCTTGTAGGACAGGGCCTCCTCCCGGGCTTTGGATGCGGCCTCCTCGACCGTCAGAGCTCGCTCCCGCAGCAGCGTCATCTCCTCCTCTGCCTTCTTTGAGGCCTCTTGAGCCTCGACCAGGGCAGCCTCCCTTGCCTTCTTCTCCTCCTCGAGCGCTATGAGGTCTTTGTAGGCCTTAAGGAGCTTTTCTTGCGACTCGAGGAGTTGGTCCTAGAGGACGGGGAGCTGCTCCCAGCCTCCTCTTGTGGCGTGAATGAAGCTAGACTTGATACGGGAGGTCTCTTTCATGTCCTACGAGCCGGGGGTCGAACGGTTAGAACACGAAACCAAAGGATCTATGAGAATTAAGGACCAAAAAATACTTACAAAGTAGGCCGGCCCGAGCCCGTTGTTGATGACGTCCGATAGGAGCCCCACCACGTGCTTCATCCAAAGGCGGAGCTCCTCAACGTGTTCCCATTTCGCCGCCTCCTTCCTGTCGTCCAGGAAGATGTTGGGCTCGGACGGATCGGTGGAAGCCCGGATGCGGATCCGATCGGGGCACCAGTTCTCCATCTCCTGGTCAGCCCGCGCCTTGACGCCGCGGATAAGGTCCTCGACGGTCTCGAGGGAGCCCCCATGGCGCAAGAACAGGTCGACGAGGCATGGGAACCGTCCGTCGTCATCCACCGTCTTCCAGGTACCGTCCTTACTCCCCGACGTCCCGATCTCGTCCTCCTCAGAGGGAAAACGGTCCTCCCACGCCCGACGCTCTCGGAGGAACCCTGGGGCGATCCCATCCATGCCGTAGATCGTCTTCCTGATCTCGGACTCGGGGTCGGCGGGGGTGCGCATCATGCAGGCAAGTGCCACCACACTGTCCGCTCGCCCCGGCTCTGCCCGGATCGCGGTGGGCGCCCCCGGAAGGAGCCACGCTGGGGTTGGAGGGCCGTACACCGGCAAATCCTCTTCCTGTTCTCCGGGCTCTTGCGGCGCCGGTGGTACTGGTTGGGGCAGACCTTGAGGCAGGGGCTCGAGCGGTCCTTCTTCTTGGCCCCCCTAATGCTGTTGCTGCCCCTCGAGCATTTGCTGCTGTTGCTCCACCTGCTGCTGCTGCTGCTGCTCCTGCTGCTGCTGCTGTTGCTGCTCCTGCTGCTGCTGCTGTTGTTGCCCCGCGTGTTCCTACGACTCTTGTCAGCGGCCCTGCTCCTGCGGCTGCCGCCTCGCCTCGCGCTCCCGCTCCTCCTCCTCCTCCTTCTTCCTCTGCTCCTCGAGGGTGCGGAGACCAGCAGGCCAGGGC
GTCCGTTCCACGACAAAGGAGGTCGACGCCTCCTCATCCATAGGGCGGGCATCCCTCGACGTCTCGTTGCCGCCAGACGTGTCGCAGATGGTGATGGGATCCCCCTCGACCCCCGATCGGGGAGGCTCGGGGGCTCCCTCTTGCCCCTGGGTCTGGGCCACCTCGACCCGTGTCGGCGGCGACGGGGCAAGCTCGAGACGAGGCGGGGCGCTCTCAGCGACGGCCGAAGGCTGAGAGTCGGAGGAGCCTATAAAGCCAAGAATAAAGGTCGGTCATTGTAATGACCAACGTAAGAACATCACAAGTCCCAGAGGTAAGTCACAAACCTGGCTCCTTGGAGGCTGCTCCCATTTTGAGCCTCTTCGCCATTGAAGGCTGAGCCTACTCGAGCGTCCACTTTAATCTGAAACAAAAGGAACAAGCGTAAAAAGACCGGCATACAAGAAAACACAGAGGAACAGGAGAACAAAAGTCACAACGTCGAAGAGCTTACCCCACGGGGAGAACAGCTCGCCTGCCGGTGCCCCGACCGGTGGGCCTCGAGCCACCCCGTGTCAAGGTCCCAGACCCCTCGAGGACAGGCGTTGGCCTTGGCCCAGCAACTTCCCCTTGGTGGGCACCGGGACTGGTGCTCCTGCGGCCAGTGTCTCCTTTCTCGGAGGCCGCGGCACGACCGCGAGTCAGTGGCCCCGTCGCCTGAGGCCTAGCATGGCCACCCATCTTGGGCGCTGGGGGAGGGCGCGGGGCAACCTGACCAGTCGCGGGCACCGGGGGGGTGTCGGCACGAGGGCGGTGAGTTCCGCCTGGTCCCTCTTTTGGTGTCCCCATCCGCGGGGCGTCGACGTCACCTCGAGGCGGACCCTCGAGGATGCGGTCGAGGCGAGACGCCATCCCCTCGGAGTCATCGCTGTCCTCATCATCATCTCCACCATCATCGTCGTTGGGGGACTCTTCCTCAGGCTCCCCCCTCTGCCTGAATTTAGACTGACGTGCCTCTAATGCTTGGCGATCGAGGTTTTTCTTTTTCTCCCCTTTCTTCTTAGAGTCCTTGGCGGACTTTAACTTCTCGGCGAACCGGCACCGCGCGTCGCGATCAACCTCGTCCTCCTTCACTGGAGGCCTCGAGGACCGGACATCAATCCGTCCCTGCCAGAACAAAGGTGGATTTAGGAAAAAGGGAAGAAAAGAAACCCAGAATCAAGGCTGCGCACGAGAAGAAAGCATACCAGATCGATCGAGCCTACATCTGGCCTCATGGGGAAGCCGTTAACATGCTCTGGCTTGATGTCACCAGCAATGGCGGCCCTGACCCTGGCCGCGACTTCGTCGTTCGCCGGAGCCTCGCTTGACATCCGGCATGCCTCGAGGTCCCAAGATGAGGCGCCAGGAGCCATCTCGTCCATCCTCAGCGGTCGAGACATCAACGGGAGAACTCTCCGGTGATGGACGGCCAAGAGAACGAGGGCGGCGGTAAAGCCCTCCGAGCGCAGTTTCTTCATGACGTCGAGGAGGGGGTCGAGCCGAGATTGATGAACCTGGACGACGCCGTACGTCCAATTTTCCGGACGCTCCGTGATCAGACGCCCGGTGTAGGCGGGCAGGAGGTCGTCGTCATTTCTCAAGTAGAACCACTAGGAATCCCAGCGGGCGTGGTTGGTCGACAGTCCCACCGGGATGTACTCGCGCGGCCTCTCCGTCTTCTCGGTCCTCAACACGAGGTTGAGGCAACCTGCCAGAACAGGCTTCCTCACGCTGGTGGTCCCAGTGGGGGCGTTGAAGAGCTCGCCCCTGTAGAGGTGGAGCCACAGCTCCCAGTGGGGCATCATCCCCAAATAGCCCTCACACACCGCGGCGAAGACCGCGGCGACGGTGATGGCGTTTGGGGAGAAGTGCTGGAGCTCCACCCCGTAGTGCTGGCAGAGCGCCCGCATGAAGCGGCTCGGGGGAGCGCCCAATCCATGGCGGTGGAACTTGGCAAACGAAACCACATAGCCCTTGGG
CGGCCTGGGCTCCCTGTGGTCCGCCGGCGGCGCGATCCACTCCGGCGACGACAGCGAGGTGCGGCGGCGCAGGAGTCCCTCCCTCTCAAGCTCTTGCAGCCGGCGCTCCGTCATCGACGATAGGCGCCAGTCATCGGCGGCGACAAGCCTCATAGGCATTCTAGCCGGAAGGATGGCGGATCCGCTATTACTCGAGGGGGGCACGCGCGCATAGGATGGCAAGGGAACTAAGGCAATGAGAGGGCTAAGGCGAGAATGAAGACGGGAGGCAGAAGGGAGAACAGCGGCGACGCCAGGACACATTTATAGGCAGCTGTCCACCAATGGGCAGATCCGATAAAAGAGGTAGCTCCCCTCCGTAAATGCGCCGTCTAATGGTCCTTTCCCTCCTCTCAGGTGGAGCGCCCCGAATTCCACGCCAACGCAGTGTCATAACGTCTCCCACCTAAAAAGGCGCGCCCAACGGGCAAGAAGGCGAACTACCCACGGTCTTTTCCTTCCCTTGTAAGCCAAGGAGTGCACCCGTGGAAGCCTCGAGAGGTCGCAGGCTGGCCCACTGAAAGGGTTCGATAGCCGATCTCGAGCACCAGAGTCAGGGATCCCTAGCGAGAGGTCGAAGATCGAGGTCCGCCTCGAAGACTTACTGGGGATGTCCAAGGTAGGGTCGAGACAGTTGAGAGGAATGCCCCCGACGGGAGGCATCGAGCCGCCGGACACTATCGAATGAGACCGGTATCCCCGACCACGTCGACCCTGCTTTATGAGAACGCCTCCGGGCTACAGCTGACCCCCTCGAAAGGGGCACAGGTTCTCACTTGGACTACCCGCTAGGAACTCAATCTGGGGTGGAAGACGCTCGCTCTATCGAGAGTACGTCAAAACCTCCGCGCAAAACGAGCCAATCAGAACCTTCCACCACTGGTGTCGATAGCGTTTCTGCGAATTAGGCAATATAACCCTTGAAGGAGTCAAAAACTCCTCCAAGGGCTCGGGGGCTACCCCCGCGGGGTCGCTCGCGCGCCCCCATGGAAATTCGATCGCAAAACAAAGCCTCCACTCGAGCGCCAGCGCTCAAATGGAGACTCGGGGGCTACTGTCGAGGGTATCAGTAAGGGGTACCCTCACCGATGCACATAACGAGACTACCCGTACGCAGGTCGAGGCCCTCAACTCGACGCTTTGGTCATACATATGCGCGGTCGTCGACGACCGCAGCCTCGAAGACGGAAATAGCGTCGAGCGAATCGATCAGGGGTCGAGCGCCAGCTACCGTCGAATACGGAAATGGGCTCGCGCGAACCAGGAGGCGTCGAGTGCAAGGACGCCGCCCGCCGCCTGACGCGCGCACGAGAGCCAAGGCATTAAATGCGCCTGTCGCTTTCCCGCCTAACACGCTGGTCACGGGAAGCGTGATAGGGAACAGGCACCCGTCCCGTCGTTCTTTTTGCAGCCTTCTCCACCAAACGACCCAGAGCATGTCAGGATGCGGGAAGCATGGATGGAACGTCTAATCAGGACCCCCTCGAGGCAGCCAAGGTCAGCGCTCTGGATATCAGGGCATTGCACGGCATCCGACCCTCGATCAGACATGGTTCCTTCTTGGAGACGAGTTGGGCGTCGACTGACAACATCGCAACCACTCCGCCGGATCTGCCGCCATACCGTACAAGCGTGCGACCGGTGAACCAGCCCAAGACGGCGCGCAGAGCCGGATACAGGGGCACGCGTAATCATCATCGAGCTACCAAGATGGGACGGCTCGAGACCACGCCGGTACGGAGGCCTCGAGTAGGTCAGCGCGCCATGCTTCTATCGACCCCTACTCTAACACCTATACATGTACCCTAGGTCTCTCCTTGGAGCTATAAAAGGAAGGACCCGGGATTAGATAGACACACGCAACACTACACCCATACGCAGTAGAACTCCCATACTCCATACCACGCTTGTATTCGCCCCTGTACAAGCACTTAGGTGCAAGATAATACAAACTTCCCTCC
CCCACTGGACGTAGGGCCTTCTCTTGCCCGAACCAGGAGAAGTCTCTGTGTCTTCTTGCATCACCATCTGGGAAAGGGAGCACGCATACAAATTTACTCGTTGGTGTGACCCCCCATGGGGAAAACACCGACACAATCTAACTAAGCCAAGTATATAACTATGATAAACTAAGAACAATATAATCTTGAATATAAGCAAGTAGAGCAAAGTCATAAGCAATATATTGAAATAGAACAAAATCATATTCATAATATTGAAGAACAAAGAAAATTAGAAGAACAATTAGAAGCACAATTAGAGAATTACCAAGAATCCTCTTGACAGATCCGGAAACCAATCGAAGATTAAGTCCTTCTAGTTCTAATCCTATGTAGCTATGCTAATCTAGATGTCTAATTGATGTGGTGGCTCTAATCTTGATGAGAGGCTTCTTCTCCCTTGAAGAATAATGAATTAGGGTTGAGAGGCTCTCTCCTCCAGGGGCCAGGGGGTCTGGTTTTATAGTCCCTTCAAGTGAATATGGGCCGTTGGATCAAACCGACATTGATTGAACGGTTATCCTTGATCCTTTAGGTCGGTGGAGATCTCCCCCGAAACAGAGTCCTGATTGGACTCCAATAGAGGGCGGGTGCCCTGGTTACCTGGGCCGGCGCCCAGGTCCTGGCCCCATTCGGCCTCCGCTTCCTTCCCGTGGCTTCTGGAGTCTTCTAGATGTAAGAAAATTGCACGGCACGTTGATATCTCTATGTAACCCCGACGTGTGGGCCTTCCTTTCGTATTTCCTAATAACCCGCTGCAGAAATAGACAAACACAAAAACTCGTAGAATTCTGTCAGATAAAACCCTAAGTCTAGATGTCGATTTCATTTGGATCCTTTTCTTTGTTTATTTGATAATTAAATTTGATACTTAAGGACTGTCAACAAACTCCTCCAAGCTTACCTCTTGCTCGTCCCTGAGCAAGGATAGACTCAGCTATGAAAGTTGTTGTAATGCCTTTAAAAATTGACGGTACACATGCTTTTAAATGATGTCTTATCTCTGAGTTAGAGTAAACTGTCAAGACTTAAAACTTACTTACTTTACCTTTCACCATGGCACTTGTAACCGTCACTTCCATCTTGAGTTGTTAAAAGATATAACAGTCTAGTCAAGTGCCATGTCTCTTATTCTTGATTAGCTATAGCTCTGGAGTTTTTGCAGATTTTCAAATAAAACTCAGAGATTCCTTGTATGATTCTCTTAAATCTCTCTTTTGTCGTATTTCTGGATCCTTACCAAGGCAGTGATGGTATATGCATTCTCTCAATATATATGGTATTTATGGTATAAAGCATATTGCCTTCTCTCTCACCCTACTCTAATATGGCTTTAATATCTGGAGCTCATAGGTGGGAGATAAAGTATACATACTTACAAGACATTTATTGCATAGTCAAACCATGGATCCAAAGAAACAAATCAATAAGTCAAATCAAGATGTGCATGTGTGGCGAATGAATGGTGTATGGTGATGATGGTGTTAACAATGGTGGAAGTCTAATTCTTTTGCTCTTTGAGGGGATACATACCTTCCTTGCTTTTTGAAACTTTATGAGGAGAATGAGATGCTCTTCTTTTTCTTTTCTCTCAGGTGGGTATCTTGTACCCCTAATTCTACTATCGGACACTTGTCCATTTTTACCTCTCGTCTCACTTTTTCTTTTCTTTCGAGGTTCCGGGCACTTGCCCCTTTTTATTTCCTTGTATCTTTTTTTTCTCTTTTTTTAGAGCACTCATCTCTTGAGATAATATAGCAAGTGGTAGTAACAAGATAACTTGAGCATTTATTTCACAGGGAAAAACAGAAATGTTTTTGGCTATTCTCTCCCGGATTAGGAGTAGAATATTTTTAGGTGGTTCTAGAGATGGAAATGGGTGGATATATGTGGACGGTACTTCCGGAGTAGAAGCAGCATATGTGAGTGAACGTGCAAGTGAAATCTTGATTTAACCACAT
GACAAGCTCCTAAGGGTCTACACAGCTTGACCACACTCAATGCTCATAAGCAGTAAAAAGTAAATGTTGTGGCTCAAAGTCTAGCAAGCATGTATATATAGCTGTGGTAGGAATTTAAACTCTCATCATACAGGAACTCATCATGCAACATTTTAAAGATTTTCAAAGATAAAATTCTCCAGAATTCTAGCATCTCTAGGAACAGATAAACAGCAGCTCAACCTTCCCATATCATATCCGTTAACAACTTAGACTTCAGATCAAGTTTTCATCCCATAAGTTTAGGTCTAGAGCAAGCTTTAAATTATAACAGTTATGTCTAAACTAGTGAGAGAACTTCAAATGTGCAAATTAGGAAGAGCAACTATTCATCATATCCATGCTAGAGTTTTATTCAGATACAGATTAGCATAGCCACTTTATTTATTTATTAAACACACTAAGCAAAAGATATATATATATAAGTATAAAATCTTTATTTGGTTTTTCATAGTTATATTTTAATATAGTATAAGTATAAAGATAGATAGATAGAAATACTTATCGGGATAAATGGGGGTGCTCTCCCCCAAGCTGAATTTTGACGTAATTTCTCTTGATGTAGCTAGCAGGTGGCAGAGGTGTATTTGAAAGTCAGCAGCATTCTGACAGCGATTAGAATATCCTCCGTCTGCTAGTCTTCTTGATTCTTAAAATTCTGTGGAGCTCAAATAGACAACAAAGCTTGTGGAACTGATTAAGTGTTAGCAAAAATATCTATCCTTTATCATGTTGAGACTCCTCAATAACTATTACTCCCTATTTTTATATTTTCATTTTTATAGAGCTGAAAAATATTTATTTTATTTTTATGCCACCATAGTGAATGTACTTATGGGTTTTATGCCACTCGTCTACTCACATGGGGCTTACTGTTTTTCAACATTTTTATTTTCTTTTTAGGATAGTATAAATATAACTAATTAAGTAAACTATTTTAAATAATTGAAAGGGAAAGGATAACTACCAAGTTTACCTCTTGGCAAGGCGTTCGGTATTTTTAAGTCCTCCGAACGGGACTCTTCTCTTTCTCCATTGTCCTAAGATTCGTTGGGTGGCGTAGTCGGTACTTCCGGCGGCGCCTCCTCTTCATGTATAGTTGTCTTCTCTTTCCATACCTGACTCGGTGCTACGGTCTCCTTTGGATAATTCTGTTTAAACTATACGTCTTCTAACCTTACAACTTCTCCATCATAGTCTGCCCATCCGTCCTTGATGATTTGCCTCCTCTGGTTGCGGTTGCGTCGTTTTCTTACCTGCTTAGATTCTTCAAAGATATATTTAGGGTCAGTAAAATAACGGCGTACCTTCTCTAAGGGGAAGTGCATATGGACTTCTCCAGTTTTAATGTAGATGATTGCTTTAACGTTGCTGAGGAATGGTCTTCCAAGGATGATGGGTGGATCGTACTCATCTTCTCCCATGTCAATAACCTAAAAGTCTGTGTAGACAAAATGATCGTCTATTTTGACTGGGACATCAGTTACTGTTCCTTTAACTTCTCGAAATGTCTGATCTGCCATCTGGAGCTGAGTGTATGTTGGTCTTAGGGGCATGGTTCCGAACAAGAGACGATAGGTGACTGCGGCCATTATGTTGACGCCTGATCCGGTGTCGCAAAACGTCTTGTAGAAGTTGTATCCATTTATGGAGCAATAGATGCTTGGCATTCCTGGGTCATCCTTCTTGGTCAAAAACGGTGACTTAAGTTGGTGATCTTGGCCTCCATGAACTACAGTGATCATCTTAGCTGACTCGGTCCACACTTGCTTGTTCCTGTTCCTCCTGTTGGTCCTCTTCCTTGATTCACGACTGGATTGATCTAGGATTTGTGTAGTCTTGTTCCTGAAGAAAAACGTCTCCTTCCTCCCTTTGAAGTAGAAACTGATCTTGGCAGCACTAGCGTAGATGATAGCTCCCGAGGTGTTCAAGAATGACCTCCCTAAATGATGGGTGCCCTC
TCATCATTACCGGTCTCTATCACCACGAAGTCTGCTGGGGCATATAAGGTACCAACTCGGACACAAAGGTTCTTCAATATTCCTTTTGGAAAACTTAATGCCTGATCTGCAAACTGCAAACACATGGTTGTCTCTAATAAAGGATATGTAAAGAATTTTTCATAGAGTACCCTGGGTATAATGTTGACGCTAGAGCCAAAGTCGCAGAGTGCTTCTGGGACGTTCACCATGCCGATGGAGATCGGGAAGACGGGCGTCCTGGATCACCTCTCTTGACTGGCAGAAGGTCAGTAGTGAATTCAGTGATGGGGTTACTCCAGTTATTACCTGCATCAAACATGTCTACAAGATTTGCAGATTCTAATCCTTCCGGTTGTGATGGTATACCGGGGTTAGTAGCAGGAACAGCAGCAGATATTTGATTTAACTGAGATTCAATCATTTTATTAAAGCTAATTTGATTCTTGATGGAAGTAGAGAAATTATCCATTCTATTATTTATATTTTCTAGCATTTTATCATTATATGCCAATTTCTTAGATAGGTTATCCATTAGTTTTCCTTGATTAGACACTAACTCTCTCAGAGGTGGAAAATTATTATTATTACTGTAAGAATTGTTACCTTGATAATTACCTGAGTAGTTAGGCCTCTGTTGATTCCAACCTTGATTTTGTTGAGGACGGTTGTAATAGTTGTTGTTGTTATTATTGATGTAGTTCACACCCTCAAGCATCTCAGGACAGTGATTGCCTGAGTGTCCAGTATCTCCACACTCCTCACAAGTCATGTGAGAGTCGTAGATGTGCATAACTTCTTTCTTATCTCCAGCTCTATCGTCGAGCTTCTTCATGAGCAGGTCTAGCTTTGCAGACAGCATGTCTACCTCCTTGAGCTGATGCATACCTCCACCTCTCTTGCGTGTCTAGGTCCTTTCTTCATTCTAGCCTTGGTTGGACGCCATCTTTTCCACAAGAGCTGTGGCTTGTGGTATAGTAAGTGATAAGAATGCTCCTCCGGCTGCAGCATCCATGGTCTCTCGGGCACTGTTGCCGAGCCCATGATAAAACATCTGCATCAATAGCCAACTCTCCATTCCATGATGGGGACATTCTAGGATGTAGTCTTGAAAGCGCTCCCATGCTTCTGGAACGGATTCATCATTTTATTGCTGAAAACTTGTAATCTTCCCACGGAGAGCATTGGTCTTGCCCATGGGAAAGAACTTAGCCAGGAAGTTTGTTGAGCAGAGTGCCCACGTAGTATTCTTCTCCTTTGTAGCGTAGAACCACAGCTTCGCTCTTCCTAACAGTGAGAATGGGAAGAGGCGAAGTAGTATAGCATCTCTGGGGACTCCTGATATGGTAAATGTATTGCAAATCTCCAGGAAGTGTTGTAGATGAGCACTAGCATCTTCGTGTGCCTTTCCACAGAACTGGTTGGATTGCACCATGTTGATAAGTCCAGGCTTGAGCTCAAAGTTGCCATCGATCTCTGCAGCAGGTCCAGTGCGGATGTTGTCCGTAGTGGGAGCTGAGAACTCGCAGATTGATTTGTTCGCCATGGCTTCGAACTCTGAAGACAAGTTTCGGTGATCTTCTTGATTGGATGAAGCTTCTTGCTGAAGTGTTGATGATCTCTTCTTGAGCTTGGCTCTAGTTCTTTTGAATAACGCTTCGGGATTGTCAACAAAATTTCCTAGAAGATGTCTTCTATTCATACATTCCCCTGCATAAGATAAAATAGAAAATATCAGGGTAAAACTGTATGAGAGAATAGATAAGCTCAATCATATTAGTGATGCGAATGATAACTCAAAATCTATATCCATTCCTGATTAGTAATCAACCTTCCCCGGCAACGGCGCTAAAAATGTTTGGTGGGTATTCTTAACATCACTACCAAAAGTAGACAACTTTCTAATTCTAGTAATGGTGCAAAAAATGCCAAACCTATCCCTCATACCACTTAAGACAAGTTGTCATCCCCAGCATGACATG
AGAGACGCGGAATTGAAATATGCAATTGCTCTTCTAAATAAATAATGAATGGGATCTGCAAGCGCACAGATTAATGCCGATGTAGCATTTTAACCGGGAAGTATTCAAGGTATCATTATTTATATTTTTACCACTGGGAAGGGATTAACAATCATCAATATTGATTACAGAATAGAATATGAGATTGAGTATCTATCATTGCATGTATAATTGAGAACATTGTATCTAATTCTTTCATACAAGGGTAAGTGTCACATAAAAGATATATGAAATAATGAATAGTGACAAAGGTAATTAGTCTGATCATAACTTAGCCACATATAAATATGATAAGCACCTCAATTAGATACTCTAGAAAGTCATTAGCATGGTATTAGAACGAACTACAAGAATATTTCCTAAGTTATTCTCAACTATATAGTCTAGCATTATCATAGTTAGTGCAAGCATACTTAGCAATCATTGTGAGACAAGACTACGCCCATGCATAGTGATATTAGCAAGGTAAATGAGAAACATAGCAATCTCTACCCTGTAATAATGTTGCTCTGCCAGCCCACGATCTGGCATATTGGGTACAATACATGAGAGGGAGACTATATAAGAATCAATGAAGCTGTCACTATCACGAACTACCCCACGATCTGGCATATTGGGTACAATCGCAGATAAATACGGTATAAGCACCACGCCTACACAATATCTATCATTTACCCATGGATCCGATGGATAAACACTATACGATCCTAAACATGTATATAGATCCAATCTAACTAAGCCAAGTATATAACTATGATAAACTAAGAACAATATAATCTTGAATATAAGCAAGTAGAGCAAAGTCATAAGCAATATATTGAAATAGGACAAAGTCATATTCATAATATTGAAGAACAAAGATAATTAGAAGAACAATTAGAAGCACAATTAGAGAATTACCAAGAATCCTCTTGACAGATCCGGAAACCAATCGAAGATTGACTCCTAGTTCTAATCCTATGTAGCTATGCTAATCTAGATGTCTAATTGATGTGGTGGCTCTAATCTTGATCAGAGGCTTCTTCTCCCTTGAAGAACAATGAATTAGGGTTGAGAGGCTCTCTCCTCCCGGGGCCAGGGGGTCTGGTTTTATAGTCCCTTCAAGTGAATATGGGCCGTTGGATCAAACCGACATTGATTGAACGGTTATCCTTGATCCTTTAGGTCGGTGGAGATCTCCCCCAAAACAGAGTCTTGATTGGACTCCAACAGAGGGCGGGCGCCCTGGTTACCTGGGCGGGCACCCAGGTCCTGGCCCCGTTCGGCCTTCGCTTCCTTCCCGTGGCTTCTAGAGTCTTCTAGATGTAAGATAATTGCTCGGCACGTTGATATCTCTATGTAATCCCGACGTGTGGGACTTTCTTTCGTATTTCCTGATAACCCCCTGCAGAAATAGACAAACACCAAAACTCGTGGAATTCTGTCCGATAAAACCCTAAGTCTAGATGTCGATTTCATTTGGATCCTTTTCTTTGTTTATTTGATAATTAAATTTGATACTTAAGGACCGTCAACACAAGCTTAGAGTCTTAAAATAAGCACTGATCAGATTGTAACATGAGCTTTTAATTATTTGCAATATTACCTGGTGTATTGTGCATATAAGGATAATTGTAAAAATATTCCTTCGGGTATTCTTGTCACTAACCTTTCCAGGATTGGAGCAAGAAGATCAGATGAATGACAAGCACAAGGTATGTCCAACCAATCATCATGCAACACTGAATTAAATTCATCCAAACTTGAAATTTTGCAAAATTCAAGTTTGGGGCAGTACCTTACATAAAAAAAACATCCTTTGTCATGTTGCTATGTTGGTTGTCCCTACCTTTGAGACATGCTCAATTTGTTAAACGCTAATCATTCTATTTTCATCTCCACTTGAGTAAGATCTCTATAATGCTGTTATGCTACCTTTATCTATTCGCAAGTAAGTGTTGGTTTGAAAGTACTCGACATAC
TTCCATTCGCATTTAAATTAAGCGTGGTGCTTAGGTTAAATAGCCTTCCTTAATCTGATTAGACATGGAGTCTAGTTTGGTTACTGAACTAAAAACTGCCTGAGTAGACATTGGTATATTTTGTTGGACTAACCCCTGCAGGAAAACTGTCAATATCAACCTAGGAAGTCCTTAGATAAACTCACACTGGAGACAAAGAGAGAGACACATCAAGTTTAACAATTTACACAAGGAGGACGTAGCTCATAAGAGATGATCCCTGGAGGGTGCCACAAACACGATGCACAACCGCTAATAAAGGAAAGCTTCCACAAGGTGATACTATACCATCACTCTTCAAGTAAGGTAACATCTTAAAGTACTTGATTATCACTTTTATAAGCTTTTCCTTGGTTCTAGCTTTCACATAAATAAAGAGACAAACAGGTATGATTTATAACTCCAAATTAACCAACCCAACTGATTCAACTTGTTTAGTCCTTTAATCTTTGTTCCTAGTACTACCTCCAAGATCCCACACTCCTAATCATATGAGCTAAAATATTACACATTCAATCTTTGAGAGATATAAAGAAAAAGACATATACATAGATAGATTATCTTTCTATAAGGTTGAAGGGATCTGATCTGACAAATGTTATAAGTGCTACACTCATGAACTTATCATCCATCAACTTTGTCTTGCTCACTATGCTTAAGGTTAGAGAAGAACAAATACACTTTTGGTTTTGTTAGTGTTTTCCACCAACAGGGCCCATGCACTTGATCTCTGCCTTGTCTCTATGAGCAGGTACACTTCAAGCAAAACATGGAGGTGTTTTATAACTCTCAGACTCTACCAAGTGAAGGACCAGGATCTATGAGCATAAACACACTGAATAGGATACTGCCAACGCCGCACTTCGAACTACTGGGCAAATGAAGAACATGGGTGACACCGTATCAAGAGGTGCAGACGCCAAGGTCCTCACCTGAATCAAATGACGCACCTAAAGAATGAACACGGTGAGAAGTCTTGTCTAGAAGACTTAAAACATTGGATCCTTACCGGAAGATAAAATCGGTATTTATCCATATTTATCTTTTCTGCATTCCTTTTCCTTTTTATTCCATCACTTGCATTAGCATATTTACCTTTCCACATTAGCATTAGAAAAGAAAACAAAAAAAATTTTGTTCATTGCACTGCATCATAAAATCTAAAGCATAGATTTGTGGTTTAAAACCCATAGGTATATTGACTGCGGTGGCATAAAATAAATATATTTTCATCTTACAATACAAATATAAAAATAATAAGTGCACGATCCTGCTAAATAAATAAAATTTATTAGGAGGAATCTCAATATGATAAAGGCTAAGAGATATTATGCTAACACTTAACCAGTTCCACAAAGCTTTGTTGTCTATTTGAGCTCCACAGAATTTAAGGATCAAAGAAGACTAGCAGATGGAGGACATCCTAATTGCTGTCAGGGTACTGCCGACATTCAAATACACCTCCGCCACCTGCTAGCTACATCAAAAGAAATTACGTCAAAATCCAGCTTAGGGGAGAGCACCCCCATTTATCCAGCTAAGTGTTTCTACTCGTGTTTATACTTTACTCAAATAATAAAAAGATGCAAAATCATAAAAATCCAAATAAAGATTTTTGTGCTTATATATATATCTTTGCTTAGTTTGCTAAATAAATAAATAAAGTTTGCTATGAACCCTCATGATAAGCTATCACATGGAAATGATGAATAGTTGCTCTGCCATGACTAGTTCTCAAAATTGAAATCTCTCTCAAGTTTAGGCATGACTGTTATGAATTAAGATTTGCTCTAAACCTGAACTTGTGGGAAGAGTACTTGATCTAAAGACTAAGTCGTTAACGGATATAATATGGGAAGGTTGAGCTGTTGTTTATCTGTTCTTAGAAATGCTAGAATTCTCGAGAATTTTATCTTTGAAAATCTTTAAAATGTTGCATGATGAGTTCCTGTATGATGAGA
GTTTAAAATCCTACCACAGCCACATGTACATGATTATTAGACTATGAACCATACATTTACTTTTTACTGCTTATGAGCATTGAGTGTGGTCAAGCTGTGTAGACCCTTAGTAGCTTGTCATGCGGTTAAAATCAAGATTCACTTGCACGTTCACTCATACATGTTGCTTCTACTCCGGAAGTACGCATCCACATACATCCACTCATTTCCATCTCCAGATGCACCCAAAGTTATTCTACTCCTATCTAGGATAGAATAGCCAAAAACATTATCCTATCCCTATTATTCCCCGTGAAATAAATGCTCGAGATATTTTGGTTACTACCACTTGCTACATTATTCTAAGAGGGTGAGTGCTCTGAAAAAAAAGAAGAAAAATACGAGAAAATAAAAAGGGGCAAGTGCCCGGAACCTCGAAGAAAAGAAAAAGTGAGACAAGAGGTAAAAATGGACAAGTGTCCGACAGTAGAATTAGGGGTACAAGATACCCACCTGAGAGGAAACAAAAAAATAATATAGAGCATCTCATTCTTCTCAAAAATCTTCAAAGTGCAAGAAAGGTATGTATCCCCTCAAAAGAGCAAAAGTAGAATTAGACTTCCACCATTGTTACCACCATACACCATTCATTCGCCACACATGCACATCTTGATTTGACTTATTGACTTGTTTCTCTGGATCCATGGTTTGACTATGCAATAAATGTCTTGTAAGTATGTATTAGCTGTCTCCCACCTATGAGCTCCAGATATCAAAACCTTGTTAGAGTAGGGTGAGAGAGAAGGCAATATCATTATGCCTCATACCACAAATACCACATACTTTGAGAGAAGGCATATATCATCACTGCCTTGGTAAGGATCC\n>URS000176A646 rRNA from 1 species \nTACAGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGGGCTCGTAGGCGGCCAACTAAGTCAGACGTGAAATCCCTCGGCTTAACCGGGGAACTGCATCTGATACTGGATGGCTTGAGTTCGGGAGAGGGATGTGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCGGTGGCGAAGGCGGCATCCTGGACCGACACTGACGCTGAGGAGCGAAAGCCAGGGGAGCAAACAGG\n>URS0001DA5C55 misc_RNA from 1 species \nGATGAAGAACGCAGCGAAGTGCGATAAGTAATGTGAATTGCAGAATTCCGTGAATCATCGAATCTTTGAACGCAAATTGCACTTTCTGGTATTCCGGAGAGTATGCCTGTTTGAGGGTCAGTGTAATAAAAATAAATCGTGGTTGTTTGCCACCTTTTCGTGGTGACGCTTCGGAATTGAGTCGTCTTTACCCCTTCGGGTTAAGTGACTTAAAATTTTTTCATACGATTTCGAAACGTATTTAATGTATTATTTACGTTCACGAATATCGAATTTTTATTAGGTGCGGTCATTTTTCATGAATTCGCGTCTATAATTTTTTTTTTTTTTTGACCTCAAATCAGGTAAGAATACCCGCTGAACTTAAGCATATCAATAAGCGGAGGA\n>URS00001B9A8C rRNA from 1 species 
\nCACTGTCACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGAGTGATGAAGGCCCTAGGGTTGTAAAGCTCTTTCAGCGAGGAGGATAATGACGTTACTCGCAGAAGAAGCCCCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGGGCTAGCGTTGTTCGGAATCACTGGGCGTAAAGCGCACGTAGGCGGACTTTTAAGTCAGGGGTGAAATCCCGGGGCTCAACCCCGGAACTGCCTTTGATACTGGAAGTCTTGAGTCCGAGAGAGGTGAGTGGAACTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGCTCGGTACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAG\n>URS0001494730 rRNA from 1 species \nGTGGGGAATATTGGACAATGGGGGGAACCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTTTGGTTGTAAAGCACTTTAAGCGAGGAGGAGGCTACCGAGATTAATACTCTTGGATAGTGGACGTTACTCGCAGAATAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGGTGCAAGCGTTAATCGGATTTACTGGGCGTAAAGCGCGCGTAGGTGGCCAATTAAGTCAAATGTGAAATCCCCGAGCTTAACTTGGGAAGTGCATTCGATACTGGTTGGCTAGAGTATGGGAGAGGATGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGATGGCGAAGGCAGCCATCTGGCCTAATACTGACACTGAGGTGCGAAAGCATGGGGAGCAAACAGGATTAGAAACCCTGGTAGTCC\n>URS0000295BDA rRNA from 1 species \nCCCTAGTAACTGCGAGTGAAGCGGGAAAAGCTCAAATTTAAAATCTGGCGGTCTTTGGCTGTCCGAGTTGTAATCTAGAGAAGTGTTATCCGCGCTGGACCGTGTACAAGTCTCCTGGAATGGAGCGTCATAGAGGGTGAGAATCCCGTCTTTGACACGGACTGCCAGGGCTTTGTGATGCGCTCTCAAAGAGTCGAGTTGTTTGGGAATGCAGCTCAAAATGGGTGGTAAATTCCATCTAAAGCTAAATATTGGCGAGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGATGAAAAGAACTTTGGAAAGAGAGTTAAACAGTACGTGAAATTGCTGAAAGGGAAACGCTTGAAGTCAGTCGCGTTGGCCGGGGATCAACCTTGCTTTTGCTGGGCGTACTTCCCGGTTAATGGGTCAGCATCAATTTTGACCGTTGGATAAAGGTCAGGGGAATGTGGCATCTTCGGATGTGTTATAGCCCTTGGTCGCATACAACGGTTGGGATTGAGGAACTCAGCACGCCGCAAGGCCGGGTATTTATACTACGTTCGTGCTTAGGATGCTGGCATAATGGCTTTAATCGACCCGTCTTGAAACACGGACCAAGGAGTCTAACATGCCTGCGAGTGTTTGGGTGGAAAACCCGAGCGCGTAATGAAAGTGAAAGTTGAGATCCCTGTCGTGGGGAGCATCGACGCCCGGACCAGACCTTCTGTGACGGATCCGCGGTAGAGCATKTATGTTGGGACCC\n>URS0000468D61 rRNA from 1 species 
\nGACTAACAATGGTTAGTTGAGTGGCTAAGCGAAAGTGATAAGTGACCCACCTGGGGAGTACGCTCGCAAGAGTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCAGGGCTTAAATGTAAGTTGCATGGACCAGAGATGGACCTTTCTTCGGACTACTTACAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCAGGTTAAGTCCTATAACGAGCGCAACCCCTGTTGTTAGTTGCCAGCAAGTAAAGTTGGGTACTCTAGCGAGACTGCCGGTGCAAACCGTGAGGAAGGTGGGGACGACGTCAAATCATCACGGCCCTTACGTCCTGGGCTACACACGTGCTACAATGGTCGGTACAGAGAGCAGCCACTACGCGAGTAGGAGCGAATCTTCAAAGCCGATCTCAGTTCGGATCGCAGTCTGCAACTCGACTGCGTGAAGCTGGAATCGCTAGTAATCGCATATCAGCCATGATGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCAAGCCATGGAAGCTGGGGGTACCTGAAGTCGGTGACCGTAAGGAGCTGCCTAGGGTAAAACTAGTAACTGGGGCTAAGTCGTAACAAGGTAACCGTAA\n>URS0001AC9055 rRNA from 1 species \nTGAGAGAAAGGGGGCCTCTGCTTGCAAGCTCTCGCTATGAGATGAGCCCGCGTCCGATTAGCTAGTTGGTAGGGTAAAGGCCTACCAAGGCGACGATCGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGTGTGAAGAAGGCCTGCGGGTTGTAAAGCACTTTCAATTGGGAAGAAAAGCCTGAGGTTAATAGCCTCGGGTCTTGACGTTACCTTTAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATCACTGGGCGTAAAGCGCGCGTAGGCGGCTTGATAAGTCAGATGTGAAAGCCCCGGCTTAACCTGGGAATTGCATTTGATACTGTCTGGCTCGAGTATGGTAGAGGGGGGTGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCAGTGGCGAAGGCGACCCCCTGGACCAATACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCGACTAGCCGTTGGGCTCATTTAAGGGTTTAGTGGCGCAGCTAACGCGATAAGTCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCAGCCCTTGACATCCAGTGAACTTTCCAGAGATGGATTGGTGCCTTCGGGAGCACTGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTGCCAGCACATAATGGTGGGAACTCTAAGGAGACTGCCGGTGATAAACCGGAGGGAGGTGGGGATGACGTCAAGTCATCATGGCCCTTATGGGCTGGGCTACACACGTGCTACAATGGCCGGTACAAAGGGTTGCGAAGCAGCGATGTGGAGCTAATCCCGGAAAACCGGTCGTAGTCCGGATTGCAGTCTGCAACTCGACTGCATGAAGTCGGAATCGCTAGTAATCGCGAATCAGAATGTCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTTGGTTGCACCAGAAGTAGGTAGCTTAACCTTCGGGAGGGCGCTTACCACGGTG
TGGTCAATGACTGGGGTGAAGTCGAAACAAGGTA\n>URS000014146A rRNA from 1 species \nGATGAACGCTAGCGGCAGGCTTAATACATGCAAGTCGAGGGGCAGCGGGGTAGCAATACCGCCGGCGACCGGCAAACGGGTGCGGAACACGTACAGAACCTTCCTTTAAGCGGGGGAGTAGCCCACTAGAAATGTGGATTAATACCCACTAGTAATGTTTAATGGCATCATTAGATATTTAAAGTATTTATCACTTAAAGATGGCTGTGCGGCTGATTAGGTAGTTGGTGCGGGTAACGGCCCACCAA\n>URS0002127D47 rRNA from 1 species \nTAATTTATTGGGGGTAGAGCACTGAATGTGCTAGGGGGCCTACAAGCTTACCAACCCCAATTAAACTCCGAATACCGATTACATGATGTACAGCAGTGAGGCTATGGGTGATAAGGTTCATAGCCAAGAGGGAAACAACCCAGATCATCAGCTAAGGTCCCAAAATTGATACTAAGTGATAAAGGATGTGGAATCGCCCAGACAGCTAGGAGGTTGGCTTAGAAGCAGCCATCCTTTAAAGAAAGCGTAACAGCTCACTAGTCAAGGGGTTCTGCGCCGATAATTTCCGGGACTAAGTATCATACCGAAGCTATGGGATTCATTCGATTCGAATGAATCGGTAGACGAGCGTTCTATTAACTTGTGAAGGTTGACCCGTGAGGGCAGCTGGAGGAGATAGAAATGAGTATGCTGGAATGAGTAGCGATAAAGCCTGTGAAATGCAGGCTCGCCGTAAGCGTAAGGTTTCCTGAGTAAAGTTAATCTGCTCAGGGTTAGTCGGACCCTAAGCCGAGGCCGAAAGGCGTAGGCGATGGAAAACAGGTTTAATATTCCTGTACCAGTTTAATATTGTTTGAACTATGGGGGGACGCAGAAGTGAAAGGAGATCCCGGTTTTGATTGTCCGGGTTTAAGAGTGTAGGGAGTTCTGATAGGTAAATCCGTTGGAATAATCCTGAGACTCGAATAGGAGGGCTTAGCCCACAAACTCTCCCTAATCCTGCTGCCAAGAAAATCCTCTATGTTAGATATTTGACTGACCGTACCGTAAACGGACACACGTACGCGAGGAGAGTATCCTAAGGCGCTTGAGAGAATCCAAGTAAAGGAACTAGGCAAATTAGCCCCGTAACTTCGGGAGAAGGGGTGCCAATTAAGGAAAAGAACTTCGCGTTCTGCTTTTTATTTGGCCGCAGTGACCAGGCCCAAGCGACTGTTTACTAAAAACACAGGTCTCTGCTAAGTCGTAAGACGAAATATAGGGACTGACACCTGCCCGGTGCTGGAAGGTTAAATGGAGAGGTTAGCTTCGGCGAAGCTTTGAAACGAAGCCCCAGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCTGCACGAATGGTGTAACGATTTGGGCACTGTCTCTACTTGGAGCTCAGCGAAATTGAAGTGTCGGTGAAGATGCCGGCTACCCGCGGCCGGACGAAAAGACCCCGTGCACCTTTACTACAACTTATCATTGAATACTGATTCTGCTTGTGCAGGATAGGTGGGAGACTTTGAAGCAGTAGCGCTAGTTATTGTGGAGTCATCCTTGAAATACCACCCTTGTATTGTTAGTATTCTAATCCCATCCCGTGAATCCGGGTGAGAAACAGTGGTAGGTGGGTAGTTTGACTGGGGCGGTCTCCTCCCAAAAAGTAACGGAGGAACCCAAAGGTTCCCTCAGCATGGTCGGTAATCATGCGAAGAGCGCAAAGGCATAAGGGAGCTTAACTGTGAGGTCGACGGACCGAGCAGGTACGAAAGTAGGGCTTAGTGATCTGGTGGTTCCGTATGGAAGGGCCATCACTCAATGGATAAAAGGTACGCCGGGGATAACAGGCTTATCTCCCCCAAGAGTTCATAT
CGACGGGGAGGTTTGGCACCTCGATGTCGGCTCATCACATCCTGGGGCTGGAGAAGGTCCCAAGGGTTGGGCTGTTCGCCCATTAAAGTGGTACGTGAGCTGG\n>URS0000ADD2ED rRNA from 1 species \nAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGCAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGTTTTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGAAAACTGGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGCAGAGATATGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACGCTGATGTGCGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCGCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAATCTTGACATCCTTTGACAACTCTAGAGATAGAGCTTTCCCCTTCGGGGGACAAAGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTAAGCTTAGTTGCCATCATTAAGTTGGGCACTCTAAGTTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGATTTGGGCTACACACGTGCTACAATGGACAATACAAAGGGCAGCGAAACCGTGAGGTCAAGCAAATCCCATAAAGTTGTTCTCAGTTCGGATTGTAGTCTGCAACTCGACTACATGAAGCTGGAATCGCTAGTAATCGTAGATCAGCATGCTACGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGCCGGTGGAGTAACCTTTTAGGAGCTAGCCGTCGAAGGTGGGACAAATGATTGGGGTGAAGTCGTAACAAGGTAGCCGTATCGGAAGGTGCGGCTGGATCACCTCCTTTCTAAGGA\n>URS0000EBB953 lncRNA from 1 species 
\nGGAAGAGAAGGAGGAGGAGGAGGAGGAGGAGAAAGTGGCTCTCAGCGGCCGGTCGGATTAAAAGTAACCAGACTCGTCCAGAAAACTGCGTCCAGGAAGGAAGTGACAGAAGACGAATGGGAAAAGGAGAACAGCTCACAGCGTTTGAAACATCGCGGCACCACTTTCAGATAAAAACATAGACCTGAATGGCATCATCCAGTATCCAAGGAAACCATGTTCTCTAAACATGAATATGCCTTTGGGGGAAGACAGAAGAACATGGAAGCCATGTGAAAAAAACGGATCCTAAGGCAGTTTTGAACATCTGGAGGCCTGATTTATTGGAGATTGCAAATGTACAGTGTAACATAGCTGTGGAGAGCGAGAAGATCAGGATTGTCAATGCTGTCATTGCTTTTACTGGAATCCCCAGCACGAATTGAAGGTCTCACTTTGCCACCTAGGCTGGATGCAATGCAACGGTATGTTGATCTTGGTTCACTGCAGCCTCAACCTCCTGAGCTCATGTGATCCTCCCACCTCAGTCCCCCACGTCGCTTGGATTACAGGCCTGTGCCACCACACCTGGCTAACTTTTTTTGTAATTTTTGTAGAGACAGGGTCTCACTATGTTTCCCATGCTGGTCTTTAATGCCTGAGCTCAAGCCATCCGCCTGCCTCGGCCTCCCAAATTGCTGGGATTACAGGCATGAGCCACCATGCCCAGCCTAATTCTTCTAAATCTTATCCTAGTAATTAAGCCAGAATTTTTCTCTGCCAAGACCAATAGATGGACCAAGAAGTACTCATCCTTGTAAACTTTCTTTGGATAAATTGCTTACATATAATAAATTCAGAGTTAAGTAATAAAAATAATGAACTACTGTCTTG\n>URS000194FCEC lncRNA from 13 species \nATCTCCAGACCCAGTCAGACTTTCAGACACTGAAGTTTTGGCTGACATTTTGACTACATCTTCGTGAGAGTGCCCAAGGCAGAACCACCCAGCCAAGCCACTCTGACTCCTGATCCATAGAGACAGTGTGCGACAGCACAGGATTATTGTTGTGCGAAGTCATGAGTATTTGAGGCAATTGTTATGTAGCTTTAGCTAATAGAGACCTATTCTGCGGCTTAGGAGGAAGTGAGAATAGAGCCAGTTTGGGGGCTCCAGGAACCTACAGTCTCCAGGTGACCAAGCAGACACTGACGAAATATGAAGGCGCTGGGGCTGGAGAGAGACGACGTCTACTGGGCCTGATAATGGACTCAAAACTACAGAAGTAAACACAGGAAGGAAAAAAGTACCGAGAGAGAGGGGTGAGCTGCTGACAGAGGCTTAGGGACCATTTGGAATCGCGCAGACCTGGATTCAAATCCTCACTCCATCACTTTAGTCTTGGGAACTCAAGCAAATTACTTAAACTCCTTATAGAGTCCCAGATTCCTGTAACAGCAGCATGGATCCTTGCTGCAATGAGGATTAAGCAGAATATGTCACTGAAAATGAAATGAAATGAGAAGCCCCTAACCCAGCCCCCTAGCTCATGG\n>URS00011AB3B6 rRNA from 1 species 
\nTGGCTCAGATTGAACGCTGGCGGTATGCTTAACACATGCAAGTCGAACGGTAGATACTTCGGTATCGAGAGCGGCGGACGGGTGAGTAACGCGTAGGAATCTGCCCAGTAGTGGGGGACAACCAGAGGAAACTCGGGCTAATACCGCATACGCCCTAAGGGGGAAAGCGAGGGATCTTCGGACCTCGTGCTATCAGATGAGCCTGCGTCGGATTAGCTAGTTGGTAGGGTAAAGGCCTACCAAGGCAACGATCCGTAGCTGGTTTGAGAGCGCGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCAATACCGCGTGTGTGAAGAAGGCCTTAGGGTTGTAAAGCACTTTCAGCAGTGAGGAAAAACTTAAGATTAATAACCTTAGGCTTGACGTTAACTGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGGGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCGCGTAGGTGGTTTGGTCAGTCGGATGTGAAAGCCCTGGGCTCAACCTGGGAACTGCATTCGATACTGCCTGACTAGAGTGTGGTAGAGGAGAGTGGAATTTCAGGTGTAGCGGTGAAATGCGTAGATATCTGAAGGAACACCAGTGGCGAAGGCGGCTCTCTGGACCAACACTGACGCTGAGGTGCGAAAGCGTGGGTAGCAAACGGGATTAGATACCCCGGTAGTCCACGCCGTAAACGATGTCTACTAGCCGTTGGGTTCCTTGAGGACTTAGTGGCGCAGCTAACGCATTAAGTAGACCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATATGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACCCTTGACATACAGAGAACTTTCTAGAGATAGATTGGTGCCTTCGGGAACTCTGATACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTATCCTTAGTTGCTACCATTAAGAGTTGGCCACTTTAAGGAGACTGCCGGTGATAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTACGGGTTGGGCTACACACGTGCTACAATGGCTGGTACAGAGGGCTGCTAACTTGCGAGAGTACGCTAATCCCTTAAAGCCAGTCCTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGCTGGAATCGCTAGTAATCGCGGATCAGAATGCCGCGGTGAATTCGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTGGGTAGGCTAACCTTCGGGAGGCCGCTCACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAGCCCTA\n>URS00016A699B rRNA from 1 species 
\nTGGGGAATTTTGGACAATGGGGGGAACCCTGATCCAGCCATCCCGCGTGTGCGATGAAGGCCTTCGGGTTGTAAAGCACTTTTGGCAGGAAAGAAACGTCGCGGGTTAATACCCCGCGAAACTGACGGTACCTGCAGAATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTCGGAAAGAAAGATGTGAAATCCCAGAGCTTAACTTTGGAACTGCATTTTTAACTACCGGGCTAGAGTGTGTCAGAGGGAGGTGGAATTCCGCGTGTAGCAGTGAAATGCGTAGATATGCGGAGGAACACCGATGGCGAAGGCAGCCTCCTGGGATAACACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCAACTAGCTGTTGGGGCCTTCGGGCCTTGGTAGCGCAGCTAACGCGTGAAGTTGACCGCCTGGGGAGTACGGTCGCAAGATTAAAACTC\n>URS0000BC3C0C rRNA from 1 species \nTTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGGCAATGGGCGCAAGCCTGACCCAGCAACGCCGCGTGAAGGAAGAAGGCTTTCGGGTTGTAAACTTCTTTTGACAGGGAAGAGCAGAAGACGGTACCTGTCGAATAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTACTGGGTGTAAAGGGCGCGTAGGCGGGATGGCAAGTCAGATGTGAAATCCAAGGGCTCAACCCTTGAACTGCATTTGAAACTGTCGTTCTTGAGTACTGGAGAGGTTGACGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGTCAACTGGACAGCAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGCC\n>URS0002274C91 rRNA from 1 species \nAATGCCGGATGCTCCGACTCCTCGCATGGGGTGTCGGGAAAGATTTCATCGGTATGGGATGGGGTCGCGTCCTATCAGGTAGTCGGCGGGGTAACGGCCCACCGAGCCTACGACGGGTAGCCGGCCTGAGAGGGCGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGCGGGATGACGGCCTTCGGGTTGTAAACCGCTTTTGATCGGGAGCAAGCCTTCGGGTGAGTGTACCTTTCGAATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTATCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTTCGTCGCGTCCGGTGTGAAAGTCCATCGCTTAACGGTGGATCTGCGCCGGGTACGGGCGGGCTGGAGTGCGGTAGGGGAGACTGGAATTCCCGGTGTAACGGTGGAATGTGTAGATATCG\n>URS0001B5E2EE rRNA from 1 species 
\nGGGATAACTACTGGAAACGGTAGCTAATACCGCATAACGTCGCAAGACCAAAGAGGGGGACCCTCGGGCCTCTTGCCATCGGATGTGCCCAGATGGGATTAGCTTGTTGGTGGGGTAACGGCTCACCAAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGGGGAGGAAGGGAGTAAAGTTAATACCTTTGCTCATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATCTGATACTGGCAAGCTTGAGTCTCGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACGAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCGACTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAGTCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCACGGAAGTTTTCAGAGATGAGAATGTGCCTTCGGGAACCGTGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGGTCCGGCCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGCGCATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGACCTCATAAAGTGCGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTGGATCAGAATGCCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTAGCTTAACCTTCGGGAGGGCGCTTACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACCGTAGGGGAACCTGCGGTTG\n>URS00005D6907 rRNA from 1 species \nTGCCCGAACGTAACACGACACCACCGTCCGCCAAATAACTACGAGTACAAACTTAAAATTTAAAGGACTTGACGGTATTTCACACTCAACCTAGAGGAGCCTGTCTACTAACCGATAACCCACGATTAACCCAACCGCTTCTAGCCCCCAGCCTATATACCACCGTCGCCAGCCTACCTTATAAAAGAAACAAAGTGAGCTAAACAGTAATACACTAAAACGACAGGTCAAGGTGTAGCTAATGAATCGGATTAGGATGGGCTACATTTTCTAACCCAGACTATACGAACCAGGCCATGAAACAAGCCTTCGAAGGCGGATTTAGTAGTAAGCCGAGAACATAATACTCAACTGAAACCAATGCAATGAAATGCGT\n>URS0000822125 rRNA from 1 species 
\nACATGCAAGTCGAGGGGCATCGGGATGTAGCAATACATTGCCGGCGACCGGCGCACGGGTGAGTAACACGTATCCAACCTGCCTTTTACTCGGGGATAGGCTTTCGAAAGAAAGATTAATACCCGATGGCATAATCTTCCGCATGGTAGAATTATTAAAGAATTTCGGTCATCAATGGGGATGCGTTCCATTAGGTTGTTGGCGGGGTAACGGCCCACCAAGCCTTCGATGGATAGGGGTTCTGAGAGGAAGGTCCCCACATTGGAACTGAGACACGGTCCAAACTCC\n>URS0001663DCE rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAACGCAGTGGGGACGGGTGCGTAACACGTGGGTAACCTCCCATCAGAGGGGATAACCCTTGGAAACAGGTGCTAAACCGATACTGATGGATGGACCCGCGGGGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCCACGATGCCTAGCGGGCCTGAGAGGGTGATCTGCCACACTGGGACTGAGACACGGGCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGAAAGTCTGACCGAGCAACGCCGCGTGTGTGAAGAAGGTTTTCGGATCGTAAAACTCTGTTATTAGAGAAGCGTTATCTAACCAGGAAGCCACGGCTAACTCCGTGCCAGCAGCCGCGGTAATTC\n>URS00009B24CA lncRNA from 1 species \nGGCCAGAAGAGCAGTTCTCCAGGCCCAGAAGTAAGCTACACCCACAATTCTGTATGCAGCTGTGAGAAAGGAGAGTGGAAATCCAAGTCAATGCAGTATCACCGTGTTCCCAATCACGAGTATTCCACTGGGCCCACTGGCTGCCAAGACATGGATGGGATCCAGTGGTGAGCCTGCCCCAGCACATGAAACACATGCTTGGGAAACAGTGCCTGACTGGATGGAGCCCTCTGGTACCCTCAAAGAGAAGCAACTCGCCTCATGACGGCAAGAACTGTAAAACAAAGCTAGGATTTTACCCCTACTGGGCCATCCACGCTTTTAGAACCACAGATTCTCAGGGAATGCAGCATTAACCTACATACAGCTAGAAAATTGACAGTAGCATATCTCAACCCAATTACCTTGAATCACAACTCTGGTAAAAGTTTTAGCAATGGAAGAGTTAAAATGATTCACTAGATGGAAGTTTTTGATAATTTGTTGACTTTAGCCATGGATAATTAAGAGTGATGGAATCCTCGTTTCACTATCAAGGAAGCTGCAGTCAAGGTCAAACAGATGAGCGCCCTGGAATTCCATGGAAGACAGCACAAAACCAATAAAACCACTGGTGTTCAGTT\n>URS000183F9F2 rRNA from 1 species \nGACGAGGGCGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGCTTGTTGCGTCAGCTGTGAAAACCCGCAGCTCAACTGTGGGCTTGCAGCTGATACGGGCAGGCTAGAGGTAGGTAGGGGAGAATGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGATACTGACGTGGAGGAGCGAAAAGCGTGGGGGAGC\n>URS00021C87A3 rRNA from 1 species 
\nTCGCGTCGGGAGTGAAAACACCGGGCTTAACTCGGTGCTTGCTTTCGATACGGGCAGACTAGAGGTATGCAGGGGAGAATGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGTTCTCTGGGCATTACCTGACGCTGAGGAGCGAAAGTGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACACCGTAAACGTTGGGCGCTAGGTGTGGGGCCTATTCCATGGGTTCCGTGCCGTAGCTAACGCATTAAGCGCCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGCGGAGCATGCGGATTAATTCGATGCAACGCGAAGAACCTTACCTGGGTTTGACATACACCGGAAGCCTCTAGAGATAGAGGTCTCTTTGATACTGGTGTACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGTTCCATGTTGCCAGCACGTAATGGTGGGGACTCATGGGAGACTGCCGGGGTCAACTCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGTCCAGGGCTTCACGCATGCTACAATGGCCGGTACAAAGGGCTGCGATCCCGTGAGGGGGAGCGAATCCCAAAAAGCCGGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCCCATGAAGTCGGAGTCGCTAGTAATCGCAGATCAGCAACGCTGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACGTCACGAAAGTCGGCAACACCCGAAGCCGGTGGCCTAACCC\n>URS00006073C1 rRNA from 1 species \nAACGAACGCTGGCGGCAGGCCTCAAACATGCAAGTCTAGCGGGCGTAGCAATACGTCAGCGGCGGACGGGTGCGTAACACGTGGGAACGTACCCTTTGGTTCGGAACAACTCAGGGAAACTTGAGCTAATACCGGATGTGCCCGAAAGGGGAAAGATTTATCGCCAAAGGATCGGCCCGCGTTCGATTAGCTAGTTGGTGAGGTAATGGCTCACCAAGGCGACGATCGATAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTTGGGAATCTTGGACAATGGGGGAAACCCTGATCCAGCCATGCCGCGTGAGTGATGAAGGCCTTCGGGTTGTAAAACTCTTTCGACGGGGACGATAATRRCGG\n>URS0000627A27 tRNA from 1 species \nGCAGTCGTGGCCGAGTGGTTAAGGCGATCGACTAGATATCCATTGGGGTCTCCCCGCAAAGGTTCGAATCCTGTTGACTGCG\n>URS000100738B rRNA from 1 species \nTACAGAGACTGCAAGCGTTATTCGGATTCACTGGGCGTAAAGGGCGCGTAGGCGGCCACTGCAAGTCAGTTGTGAAATCTCCGGGCTTAACCCGGAAAGGTCAACTGATACTGCAGGGCTAGAGTGCAGAAGGGGCAACTGGAATTCTCGGTGTAGCGGTGAAATGCGTAGATATCGAGAGGAACACCTGCGGCGAAGGCGGGTTGCTGGGCTGACACTGACGCTGAGGCGCGAAAGCCAGGGGAGCGAACGGG\n>URS00004CBF81 rRNA from 1 species 
\nAGAGTGAACGCTGGCGGTAGGCCTAACACATGCAAGTCGAACGGCAGCACGGTAAGAGCTTGCTCTTATGGGTGGCGAGTGGCGGACGGGTGAGGAATACATCGGAATCTACCTTTTGGTGGGGGATAACGTAGGGAAACTTACGCTAATACCGCATACGCCCTTCGGGGAAAGCCGGGGACCAGCAATGGCCTGGTGCTGATAGATGAGCCGATGTCGGATTAGCTAGTCGGTGAGGTAATGGCTCAACAACGGCGACGATCCGTAGCTGGTCTGAGAGGATGATCACGACCACACGTCGAACTGACGACACGGTCCA\n>URS00017EC46A rRNA from 1 species \nCCCTTAGATGTTCTGGGCCGCACGCGCGCTACAATGATGAATTCAACGAGTTTATAACCTTGGTTGAAAGGCCTGGGTAATCTTTTGAACTTTCGTCGTGATGGGGCTAGACCCTTGCAATTATTGGTCTCCAACGAGGAATTCCTAGTAAACGCAAGTCATCAGCTTGCATTGATTACGTCCCTGCCCTTTGTACACATTGCCCGTCGCACCTACCGATTGAATGGTCCGGTGAAATCTTCGGATTGAGACTTTGTTTTCTTCACGGAAAACGCTGTTTTAAAAAGTTGATTAAACCTTACCATTTAGAGGAAGGTGAAGTCGTAACA\n>URS000026EF3C rRNA from 1 species \nTAGGGAATCTTGCACAATGGGCGGAAGCCTGATGCAGCGACGCCGCGTGAGGGATGAAGGCCTTCGGGTCGTAAACCTCTGTCCTTGGGGACGATGATGACGGTACCCAAGGAGGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCGAGCGTTGTCCGGAATCACTGGGCGTAGAGGGTGCGTAGGCGGCCTAGCAAGTCCTGTGTGAAAGGTCTCGGCTTAACCGGGGAGGGTCATGGGAAACTGTTAGGCTTGAGTGCCGGAGAGGGCAGTGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCAGTGGCGAAGGCGACTGCCTGGACGGTAACTGACGCTGAGGCACGACAGCTGGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCCAGCCGTAAACGATGAGTGCTAGGTGTTGGGGGTATCGACCCCTCCAGTGCCGTAGTTAACGCAATAAGCACTCCGCCTGGGGAGTACGGTCGCAAGACTG\n>URS0001CAC1D5 rRNA from 1 species \nAGCGAACGCTGGCGGCAGGCTTAACACATGCAAGTCGAGCGGGCCCTTCGGGGTCAGCGGCGGACGGGTGAGTAACGCGTGGGAACGTGCCTTCTGGTCTGGAATAACCCTGGGAAACTCGGGCTAATACCGGATACGCCCTTTTGGGGAAAGGTTTACTGCCGGATGATCGGCCCGCGTCTGATTAGCTAGTTGGTGGGGTAACGGCCTACCAAGGCGACGCTCAGTAGCTGGTCTGAGAGGAGGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGTAGAAGTGGGGAATATTGGACAAGGGGCGCAAGCCTGAGCAAGCCAGGCCGCGGGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCGTTTATCCGGGACGATAATGACGGTACCGGAGGAATAAGCCCCGGCTAACTTCGTG\n>URS0000D28D64 lncRNA from 1 species 
\nAAGAAGTCCTACCACTGAAAGGATGTGCGGGTAGAAATGAGCAATTGCAACTAGAAGAGCCTGTGTGCCCACAATCAGGGGTGAGGAGGAGTGTCATGGAGCAGCTCTCTACTGCCCTGAGAATGACATCCCCACTGTTCACCATGGCCTTAAATCCCCTGCGAATTCCACCTCATCCTCTGCCACTTCCCGTCACTGCTCTGAAGATGCCCTGATCTTGTTTCAGTCCCTTGGATGTACCCAGCTCTTCTCCATCTTTGCATGTGTCATAGCCTCTTCCTGGAAAACCCTTCCTGCTGCTCATCCCAGAACTGACTCTCCATGTATTTACTCTTATTTTGAGAGAAGGGGGCATTTCCACCACCAGAAGGGAACTTGCTATCTTGGTAGCGTTGTCCCCTGACACCTGGCACATCTACTCTATACAGTCACCATTCAAGTGGATGTTGAATGAGTACACTTGTTTCACAGTTTGGTTGGGTAAGCCCCAAAGCTTGGTTCCCGGTAGGATCAGGCTTTATGAGTGGGCTGAGTTTCTATAAAAGTCTCCCTACCAGTTTCCAATCTTGGTGAAACTA\n>URS0000DCF6EE rRNA from 1 species \nTAGGGAATATTAGAAATGGACGAAAGTCTGATCTAGCAACACCGCGTGTGCGAAGAAGGCCTTCGGGTCGTAAAGCACTTTTTGGAAGGAATAGGAAGGAATGTACTTCCAGAATAAGTCTCGGCTAACTACGTGCCAGCAGCCGCGGTAACAAGTAGGAGGCGACCGTTATACGAATTTACTGGGCGTAAAGCGCGTGTAGGTGGTTCTGTAAGTAGGGCGTGAAAGCTCCTGGCTCAACTGGGAGAGGCCGTTCTAAACTACAGAACTAGAGGATGGTAGAGGGAGGTGGAATTCCAGGTGTAGCGGTGGAATGCGCAGATATCTGGAGGAACACCAGTGGCGAAGGCGGCCTCCTGGACCATTCCTGACACTCAGACGCGAAAGCTAGGGTAGCAAACG\n>URS000241AE0D lncRNA from 1 species 
\nTGGTTCAGATTTAATATAAATCCTAGTCTAGTCCCCTTGGGTTGCAAAGGAATCTCTCTTTCAGTTCCTTGAAATTTTTTGGTACAGGTGTATTGATGTTGTTGAACATACATCAATATCTTGTCAAAGTATAAGTATCTTTCTGAGTTTTGATGCAATGTCTCACCAGTGTTTTTCTCTCTTTCATCTCTCTACTTATTACACAGTAATAGACTATACTTCTTGTTTGGTGTAGAACAAAAAGCTTGATAATAGTTCGATCAAAGTATGTTTATGTCATTAGACCTTTGATTGTATATATATATGACTTGAGAGAAGATCTTCTTGATTGGAGCAGATCTTTGAGAGATAGGCAATCCAAAAGAATTGATCCTTGAAATGAACCTTAATTGATTCCTTTCAGAAATAAGTTGGAACTTTCCTATACTTGGACCCTGAAGTACGGCGTGATAGATGTTGCTTCCTCGATCAGCGTAACTTGATATCTTTTGCAAATCTTCCATATAATGCGTCTGATATGATTGCCCTTAACTTTCGTGATTAAGAATTGAGACTGGATATTGATCTTCCTTGATCCCTGTGATTTGGAACTAAGAGCAGAATTGATTCTTCAATCTTAGCCTTCCTTCTTTGGATAGCTTCTGAATCATTAGTTGGCTCTTACTTCCTTCTTTGGATAGCTTCCAGATCCTTGATTGCCTGCAATAGAAATAAGTTATTGTTTACCATTAAAACTCAGATCTAACATTAACAAGTATGAGTTGGAAATGGTTTAAAGGTCTTTTAATTATATATTAGGCTATCAACTAGGTAATTGGCTGTAGCAAGTATGATTTGATAGCTTTAAGAAATAGAAAATATCCCATTATAGTTGGTTACAACATAGTAGTTAAATAAAATTTTAATGGGAAAAGCATAAAAAGAACCCCAAACTTATTTCGGATTACCAGATACACATTTAAACTTTGCGAGTGTCTTGTGACTCCCTTATACTATTTTGAACTAGAATTATTAACTCCCTAAGGAGTCGTTTGGTATGAGGTATAAGTACAAATAGTGTTGGAATAAAAATTTAATACCACCTTAATATTTTATTTGGTTAGCAAACCTGAGATAAGTTATCTCGGGATTAAAATAAATACCGGGATAACTTATACCTTGTAGGGTGTGGAGTAATTAGTGTCGGGATAGCTTATACCTTCTTCTTAGAAATTATGTAAATATCATTTTTAATACAACATACCAAACAGTGGATAAAAAATAATCTCAGCATAACTAATCCCAGCATAACTTATCCTAGCATAACCTATATTCAAACCAAACGACCCTTAAGTGTTGAGGCGGTAAAGAAAGTGTAATCCGGGACATTTTTGATAGCGTTTTTATGCTTTTTCCAGATTTTACGTTCGCAATGTCTATATATCAAATACAATTTTGAAAACCATGCCACTTGATGGTGTACATAACTTGTTTGTTTTCGAAATGAATCTGATTTTTGCACCAAATCTGCGCGAGTTCCCTGAATTTATAGCTACGGGACCTATGAATTTTCTATTTTTCAGTTTTCTTAATTCTGAGCTAGCACTAGGCAAAGAAACTTTCATGAAAGACCCATAGAAACCAAGAGAATAGCAAAAGATACACAAGAATTGAAGAAGTATACAAAATTCAATTTGATAATGAAAAATCTGTGACATAAGTCTAGAGGTCAATATGTGACAGTTCATTCATAGTATTATGAACTCATGAGTAACTTCATGGATACTGTTAAGTGGTCCTAGCATAATTGAAATTTTGCTATTTTTTTTATCAACAGTATTAAAAGTTATATGATTTAAAAAAAAGATGTGGATTTAATTTTGTGGGCATGGGAGGTTTCCAAAATTGCAAATTAAAATTAAAGTTATTCATCATGAAAGAAAATCAGATACTCCACTAAAATGACAATTTAATTTTTATCTTATAATGATCTATCGTTTTGAGTCAATGACTAAACTA
TTCTATTTGCTTCCTTCGGAAATCCCATTTATTTGGAGAAGAAATCAAAAAAACAGTCAACAGATTCTTAAAGTATGAAAAAGACAATATTTAAGAATTAAATTGCCATGAGATGGCTTAAGAGTTAAGACTCGTGGGAATTCACCTCTTGCTTGGTTTTTGTCCAAAAATAAATTAAATGAATAAATCTTGTTGCGTGCAATATAATTGTGTAAGAATGACATTAGAAAATAGAGGAAAACTAAATTATAACACAAATATTTGTTGTTATAGCGAATCTACGGTATCTTACGTGTTGATTGTGTTATCATCTTCTCTGTCGTTGGTGTCTTTCACCGTTAGTTCTGGATCATCCGATAAGTCGTCGTCTTCTTCTTGGAATGAAATGGTGTTTTTTGTCGTTGTGATAGAAATATCTGTGGTTAAGGTGTTTTTGTGATGGTGGTGTGGAGTGGTGAGGTTGTGTGATAACACGGGTATGCCCCATCTATGTCCGTGTATTTCTTGT\n>URS000033F791 rRNA from 1 species \nACCGCCCGTCCAAGCCATGGGAGCCGGGAGTGCCTGAAGTGCGTGAGCGCAAGCAGCGCCCTAAGGTAAACCGGTGACTGGGGCTAAGTCGTAACAAGGTAGC\n>URS0002366112 lncRNA from 1 species \nTTTTAAAAGGCATCCAATAATTCTTGTGGCCATATATCAATTCATGTAAGTTTGATTGTAATTATTGGTGAAGGGGTTTCACTTCCCGTCTCTAAATAAAAATACTGATTCTTTAAGGTACATGCCACTAGGGATTGCGAGATTAACGAGTCTTTGGACATTGGAAGAGCTCCTTGTGAGTGGAGGAGGAGGTGTTGATGGTAGCAAAGCATGTGGGCAGTGGGCTTGAATCTCTTAAAAACTCGGAACTCCTCCAAGCGTAAGTATACGTATACTGGGAAATGTGTTAGATGTGGATGAGGCTAAGAGATTAGAGCTTGACAAAATGAAATACCTCTTTCATTGAGACTTAAATTTGATGGGGAAGAAGAAAAAGAAGAGGGAAGGAGGAAGAATGAGGATAATCAACTTGTTCTTGAAGCCTTGCAACCACCTCTGAATTTGAAGGAATTAGAGATTTGGTCATACAGAGGCAACAT\n>URS00001A8944 rRNA from 1 species \nAGAGTTTGATCATGGCTCAGGATGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAGCGATTTACTTCGGTAAAGAGCGGCGGACGGGTGAGTAACGCGTGGGTAACCTGCCTCATACACATGGATAACATACCGAAAGGTATGCTAATACAGGATAATATAAGAGATTCACATGGATTTTTTATCAAAGCTCCGGCGGTATGAGATGGACCCGCGTCTGATTAGCTAGTTGGTAAGGTAATGGCCTACCAAGGCGACGATCAGTAGCCGACCTGAGAGGGTGATCGGCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCAACGCCGCGTGAGTGATGAAGGCCTTCGGGTCGTAAAACTCTGTCCCCAAGGAAGATAATGACGGTACTTGAGGAGGAAGCCCGGCTAACTACGTGCCAGCAGCAGC\n>URS0000D1F0EB sRNA from 1 species 
\nGGGTCGCTGCGAACCCCGGCGTTCCGCGGTGGAGGGGTGCTATACTGGGATGCAGGCGCGGCAATCATGCCCTGGGAGCTAATGTAGAGCTTTGGATAATGCTTTTGCAAGTTGTACGAGAAGGGAAGTTCTTGGGGTTTCTGACCTCCTGCAGCCTCCTCTTGCCTCGGGCTGCCCAGATCTTGGCGGCTGAGGCTGGCTTACCTTCAAGCCGTTCCTTCATGGGATTTGCTGCTCCCTTCACCAACAAGCGAAAGGCTTACTCGGAGCGTAGAATCATGGGGTACTCAATGCAGGAGATGTATGAGGTGGTGTCCAACGTCCAGGAGTATCGTGAGTTTGTGCCCTGGTGTAAGAAGTCTCTGGTGGTATCCAGCCGTAAGGGTCACTTGAAAGCCCAGCTGGAGGTTGGCTTTCCACCTGTCATGGAACGTTACACCTCTGCAGTTTCCATGGTCAAACCTCACATGGTCAAGGTGAGGCCTGTATGGGAGGGATTGACAAGATTTTTTGTTTTTAGCAGTTTCATATGAAAGTGCTATTTTGGCCTTCCTTGTTAAGGACTTTATGTCCATGTGTCAAGTATTTCCCTAATATCAGAAAAGAAGGAAAATGGCTTTCAATTCCTTTATATTGTATCCTATACTTAGTAA\n>URS0000B6CEE1 rRNA from 1 species \nTTCCTACGGGGGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGGGGGATGAAGGCCTTCGGGTTGTAAACTCCTTTCGCTACCGACGAAGCCCTTTGGGGTGACGGTAGGTGGAGAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTGTCCGGATTTACTGGGCGTAAAGAGCTCGTAGGTGGTTTGTCGCGTCGTCTGTGAAATTCCGGGGCTTAACTCCGGGCGTGCAGGCGATACGGGCATAACTTGAGTG\n>URS000200AAC7 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTGTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATGGGGACTGAGGTACGGACCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATGACGGCCTTCGGGGTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTG\n>URS00019A43BA pre_miRNA from 1 species \nAGCAGAATTATTGAGTCATATGGTAATTCTATATTTAATTTATTAAAGAACTACCAAATTGTTTTCCACAGTAGCTACACCACTTACTTTCTTACCAGCAAT\n>URS00012BF748 rRNA from 1 species \nTACGTAGGGGGCAAGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGTCCGGTAAGTCGGTTGTGAAAGTCCAGGGCTCAACCCTGGGATGCCGATCGATACTGTCGGACTAGAGTTCGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAGGCGGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTGGGGAGCGAACAGG\n>URS0000AF9FF6 rRNA from 1 species 
\nAGGATTCCCCTAGTAACTGCGAGTGAAGCGGGAAAAGCTCAAATTTAAAATCTGGTAGTCTTTTGGCTGCCCGAGTTGTAATCTAGAGAAGCATTATCCGCGCTGGCACGTGTACAAGTGTCCTGGAATGGACCATCATAGAGGGTGAGAATCCCGTCTTTGACACGGACTCCCAGGGCTTTGTGATGTGCTCTCAAAGAGTCGGGTTGTTTGGGAATGCAACTCTAAATGGGTGGTAAATTCCATCTAAAGCTAAATATTGGCGAGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGATGAAAAGAACTTTGGAAAGAGAGTTAAACAGTACGTGAAATTGCTGAAAGGGAAACGCTTGAAGTCAGTCGCGTCGGCTGGGGATCAACCTTGCTTGCTTGGCTTACTTCTCCAGCTTGACGGGTCAGCATCAGTTTTGACCAGTGGATAAAGGTTGAGGGAATGTGGCACCTAGGTGTGTTATAGCCCTTGGTCATATACATTGATTGGGACTGAGGAACTCAGCAAACTCTTGTGCTTAGGATGCTGGCATAATGGCTTTAAGCGACCCGTCTTGAAACACGGACCAAGGAGTCTAACATGCCCGCGAGTGTTTGGGTGGAAAACCCGAGCGCGTAATGAAAGTGAAAGTTGAGATCCCTGTCGCGGGGAGCATCGACGCCCGGACCAGACCTTTTGTGACGGATCCGCGGTAGAGCGTGTATGTTGGGACCCGAAAGATGGTGAACTATGCCTGA\n>URS0000C86EDA RNase_P_RNA from 2 species \nGAGAGAGGAAGGGCGGCTCACGCACCGAAAGGTGTGAGGAAAGTCCCCCCACCGTTTGGACGCGCGGGCGTCCGCAAGGGCGCAGGGCGAGAGTCCTGGCAATTGCACAGAAACGCCACCGCCCCTCATGAGGGCGATGATTCCGAAAGGATGAGGTCGTGAGGCGGCGGATGAAACGGCAAACCCCGCGGGTGCAAGTGGGGAGTATGGTGGACGTCCAACCACCACCCCGTTGTACGCTAAGCCAAATGCCGCCAGAACAGAAGGGGGCTTACTCTCCTCACTC\n>URS0000DA6093 tRNA from 1 species \nGGTGGCTCAGTGGTAGAGCGCTTGCCTCGCATGCATGAGGCCCTAGGTTCAATTCCTCAGCACCA\n>URS00017E371D rRNA from 1 species \nGACGGAGGATGCAAGCGTTATCCGGAATGATTGGGCGTAAAGCGTCCGCAGGTGGCAGTTCAAGTCTGCTGTCAAAGACCGGGGCTTAACTTCGGAAAGGCAGTGGAAACTGAACAGCTAGAGTATGGTAGGGGCAGAGGGAATTCCTGGTGTAGCGGTGAAATGCGTAGAGATCAGGAAGAACATCGGTGGCGAAGGCGGCTCACTGGTCCGGTACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGG\n>URS0000BEF9DA tRNA from 1 species \nGACCTCGTAGCTTAGTTGGGAGAGCGTGCGCGTACAAAGCGTAGGCGGCGTCCATGCGTGGGTTCGAATCCCAAGGAGGCCA\n>URS000130260F rRNA from 1 species 
\nCCTACGGGGGGCAGCAGTGGGGGATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGGGTGAAGAAGTATTTCGGTATGTAAAGCCCTATCAGCAGGGAAGAAAGAAGACGGTACCTGACTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCGAGCGTTATCCGGATTCACTGGGTGTAAAGGGAGCGTAGACGGCCGTGCAAGCCAGGAGTGAAAGCCCGGGGCCCAACCCCGGGACTGCTCTTGGAACTGTGCGGCTGGAGTGCGGGAGGGGCAGGCGGAATGCCTGGTGTAGCGGGGAAATGCGTAGAGATCAGGAGGAACACCGGCGGCGAAGGCGGCCTGCTGGACCGCGACTGACGTTGAGGCTCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCCAGTAGTC\n>URS00023DD7C2 lncRNA from 1 species \nGTACCACTTGGCGAGCTCATCGTCAGCAGGGGAGACAGCGGCAGCCTTAGCTTTGGCAGGAGCTGCAGCCGCCTTCTTTTTGAAAAGGGCAACAGTTTTGAAGGTAGCAGAGGAGGATGGAGATGGAGCAGCAGGCCTTGCAACACCGCTAAACTTGACCGGACTTCCGAGCATCTCGGAGACGTATAGAGAGGTAGCTGCAGCCATTTGTAGCTAAACGGTGTCGCTGGCAAGAGGTAAAAAAAATTGAGGTCGAGTTGATGATGAGAA\n>URS00023CEA75 lncRNA from 1 species \nGCCTCCGCTTCCTTCCCGTGGCTTCTGGAGTCTTCTAGATGTAAAATAATTGCGCGTCATGTTGATATCTCTATGTAATCCCGACGTGTGGGCCTTTCTTCCGTATTTCCTGATAACCTCCTGTAGAAATAGACAAACACCAAAACTCATAGAATTCTGTCAGATAAAATCCTAAGTCTAGATGTTGATTTCATTTAGATCCTTTTCTTTGTTTATTTGATAATTAAATTTGATACTTAAGGACCGTCAACAAACTCCCCCAAGCTTACCTCTTGCTCGTCCCTGAGCAAGGATAGACTCAGCAATGGATCAGAAGTTGTTGCAATATCTTAAAAATT\n>URS0001CC7192 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTAGAACGCACAGTTTATACCGTAGCTTGCTACACCATACACTGTGAGTTGCGAACGGGTGAGTAACGCGTAGGTAACCTGCCTGGTAGCGGGGGATAACTATTGGAAACGATAGCTAATACCGCATAATATTGATTATTGCATGATAATTGATTGAAAGATGCTATTGCATCACTACCAGATGGACCTGCGTTGTATTAGCTAGTAGGTGAGGTAACGGCTCACCTAGGCGACGATACATAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGAAAGTCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAGCTCTGTTGTAAGAGAAGAACGGGTGTGAGAGTGGAAAGTTCACACTGTGACGGTATCTTACCAGAAAGGGACGGCTAACTACGTG\n>URS0000E5BE8F tRNA from 1 species \nGCGGCGGGCTCCAGACTATATTAAGACGGGTATGATGACCTCTGGGATGATTGGAGTCTGGAGCTTTGGGATACCCGTCGGTCGTGGGTTCAAATCCCACCGGCCCCA\n>URS0000E04A9A lncRNA from 1 species 
\nCGTAGAGCTGCTGGTCAGAGATGTGACTTGGTGTTGCCACACTACTGACTTCACTCTGAAAAGGCCAGTTTGGAAAAGAAGCAGCCTCGTGTCGCGGGAAGCATTTGTTCCAAATTCTGTGCTGGTCTGGGACTGCTCTCCAGGTCAGCCGGGTAGACCGCATCCGTTTTGTTGAGTCAGGGCTCTGTAAGACTTGGTCCTTAGACGTTTTTCTTTCAGTCTCTGCTGCAACAAAGGGTAAATTAATAATGAGGTGCAGACAAATCGAGCCAAAGAGCTTTCAAGGGGAGCAACGTTATGGTTTCAGTGCTTACGTTCTACTTTCGGTCTCTGATTCTTCTGGGGTGCAAAACCACAAAAACCTTCTGTAGAGGCTGGAATCGGTTTCAGATTGTTCAGACAAGATCATCATTCTTATTCCTGACTCTTACCAGAGGCAGAGCTGAAGGTTGAGATATTTAAAGCTTTTCTTGTGGCCACATAGATGCTAAACTGTCAGAGATGGGGAGAGAGAATAATCAATTCATCTCTAATGTAAACCCACAGAAAAGGGCTTTTCAGTGAAAAGTAGTAAAAGTTTTACATTGACCGATGCCTCTGTGAGCTATTTGAGGTGGAGATAAACAACTAAAAGGGGAAGATAAAGACTTAAATAGGTCAATAGAAGTATTTTCAGAATTGTATTCCATATGTGAATATAGAACACTCAGAGGGAGCAGTCAACAGAAACAGCAGTGGTGCATCATTTTAAGCAAAAGACCTAGATGCATTAGTTTAGGGCATATTTTAATATGGTTTTACTGGTGAATAAATCAGTGTGGTTTTCCCTTATAGCA\n>URS0000DD8E81 rRNA from 1 species \nCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCGACGCCGCGTGAGTGATGAAGGCCTTCGGGTTGTAAAGCTCTGTTGAGGGAGAAGAAAAAAGCTGGGAGTAACTGCCTGGTTCTTGACGGTATCCCTTTAGAAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAAT\n>URS0000815E56 rRNA from 1 species \nTACAGAGGGTGCGAGCGTTAATCGGATTTACTGGGCGTAAAGCGTGTGTAGGCGGTTCGTTAAGTCGGATGTGAAAGCCCTGGGCTCAACCTAGGAATTGCACTCGATACTGGCGAGCTAGAGTACGGTAGAGGGCGGCGGAATTCCGGGTGTAGCGGTGAAATGCGTAGATATCCGGAGGAACACCGATGGCGAAGGCAACCGCCTGGGCCTGTACTGACGCTGAGACACGAAAGCGTGGGGAGCAAACAGG\n>URS0001E053E9 rRNA from 1 species \nAGTGAACGCTGGCGGTAGGCCTAACACATGCAAGTCGAACGGCAGCACAGTAAGAGCTTGCTCTTACGGGTGGCGAGTGGCGGACGGGTGAGGAATACATCGGAATCTACTTTTTCGTGGGGGATAACGTAGGGAAACTTACGCTAATACCGCATACGACCTACGGGTGAAAGCAGGGGATCTTCGGACCTTGCGCGATTGAATGAGCCGATGTCGGATTAGCTAGTTGGCGGGGTAAAGGCCCACCAAGGCGACGATCCGTAGCTGGTCTGGGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTGCGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATACCGCGTGGGTGAAGAAGGCCTTCGGGTTGTAAAGCCCTTTTGTTGGGAAAGAAAAGCAGCAGGTTAATACCCCGCTGTTCTGACGGTACCCAAAGAATAAGCACCGGCTAACTTCGTG\n>URS000084AE89 rRNA from 1 species 
\nAGGAAATAGATACCCTGGTAGTCCCAGCCGTAAACGATGCTCGCTAGGTGTCAGGCATGGCGCGACCGTGTCTGGTGCCGCAGGGAAGCCGTGAAGCGAGCCACCTGGGAAGTACGGCCGCAAGGCTGAAACTTAAAGGAATTGGCGGGGGAGCACAACAACGGGTGGAGCCTGCGGTTTAATTGGACTCAACGCCGGACAACTCACCGGGGGCGACAGCAATATGTAGGCCAGGCTGAAGACCTTGCCTGAATCGCTGAGAGGAGGTGCATGGCCGTCGCCAGTTCATACTGTGAAGCATCCTGTTAAGTCAGGCAACGAGCGAGACCCGTGCCCACTGTTACCAGCATATTCTCCGGAATGATGGGTACTCTGTGGGGACCGCCGATGTTAAATCGGAGGAAGGTGCGGGCCACGGTAGGTCAGTATGCCCCGAATCTCCCGGGCTACACGCGGGCTACAATGGATGGGACAATGGTCCCTACCCTGAAAAGGGCTGGTAATCTCACAAACCCATTCGTAGTTCGGATCGAGGG\n>URS0001BF7771 lncRNA from 10 species \nagctatgaggcaaataagaactagaacttgaacatttgaaaaattctcagtatacccatattgcaagaaatgatgaagcacgctctggaaagaacactaagggtgtcatgggactaacttttgctggagagattagacttgtgactcatgagttcactcaaccatctcagtagaacctctgccctcttggactgaaagggacagagatttgacaaaatgtaagaaggcagtcagacttctggaattcctgggtaggaaatgggctgaaagggctacttgacaatgaatacatatcatttttcaagaaaagcaaagcatgattttgagagtagctcagaggccagcagggCTGTGGAAGATctgcctacacactgattttggatttctagccttcagaactctgagataatacatttctgattttatacaacctagtctgtgataacttgttatggcagcactaggaaacAATGAAACCTCTCAGCGTCTTTTGATAGTGCTTAATATCATCTCAAAAATCCCTTTTACCATGACTTCTATTACACCAAGGCTTTGAGCTTGTTACTATTACTACCTGTTTTTAATGCATTTTCCATGTTGCAACCAGAGTGTTCCTTTAATTGCTTATGTAACAGTTTATTTCCAGTGATTCTGGTTACATGGAACTCCTGCATGGCTATCTGGTTTGTTtttgtttgtttgtttgtttgtttgtttgttttgagacagagtctcactctgtcacccaggcgggagtgtggtggcacaatctcagctcactgcaacctctgcctcctgggttcaagcaattctcctgcatctgccacttgagtatccgggattaaagccctgtaccaccacacctggttaattttttggtagagacagtttcaccattatggcaaggctagtcttgaactcctgacctcagatgatccacccgcctcggcctcccaaaatgctgggattacaggtgtgagccacctcgcccggccACATggctatctttacagcaatgattcagagaccaggttcctggcatcctgttgctccaccattatatagaaccacttattgatggagagggaataataagtgagaatgggggatcacgtattggagattttaatggatgggactgacctagaagcaatgcacatctatctcttcacatttcattgattagaattcagtggcattaccacacctagataaaaaagaaaaaaaaaa\n>URS0000E4C665 rRNA from 2 species 
\nCTGAATAGGGCGCATAAGTAACAGGTCGTAGACCCGAAACCAGGTGATCTACCCATGTCCAGGATGAAGGTAAGGTAATACTTACTGGAGGTCCGAACCCACGCACGTTGAAAAGTGCGGGGATGAGGTGTGGGTAGCGGAGAAATTCCAATCGAACTTGGAGATAGCTGGTTCTCTCCGAAATAGCTTTAGGGCTAGCCTCGAGGTAAAGAGTCATGGAGGTAGAGCACTGTTTGGACTAGGGGCCCTTCTCGGGTTACCGAATTCAGATAAACTCCGAATGCCATGTACTTATACTCGGGAGTCAGACTGCGAGTGATAAGATCCGTAGTCGAAAGGGAAACAGCCCAGACCACCAGTTAAGGTCCCCAAATATATGTTAAGTGGAAAAGGATGTGGGGTTGCTTAGACAACCAGGATGTTGGCTTAGAAGCAGCCACCATTGAAAGAGTGCGTAATAGCTCACTGGTCGAGTGACCCCGCGCCGAAAATGTACCGGGGCTAAACATATTACCGAAACTGTGGATGAACCTCTTTAGAGGTTCGTGGTAGGAGAGCGTTCTAAGGGCGGTGAAGTCAGACCGGAAGGACTGGTGGAGCGCTTAGAAGTGAGAATGCCGGTATGAGTAGCGAAAGAAGGGTGAGAATCCCTTCCACCGAATATCTAAGGTTTCCTGAGGAAGGCTCGTCCGCTCAGGGTTAGTCGGGACCTAAGCCGAGGCCGATAGGCGTAGGCGATGGACAACAGGTAGAGATTCCTGTACCAGTGCTAATTGTTTAACCGATGGGGTGACACAGAAGGATAGGGAATCGCACGAATGGAAATGTGCGTCCAAGCAGTGAGTGTGAGAAGTAGGCAAATCCGCTTCTCGCGAAGCATGAGCTGTGATGGGGAAGGAAATTAAGTACGGAAGTTCCTGATTTCACGCTGTCAAGAAAAGCCTCTAGGAAGAGTAGTACTGCCCGTACCGCAAACCGACACAGGTAGATGAGGAGAGAATCCTAAGGTGAGCGAGAGAACTCTCGTTAAGGAACTCGGCAAAATGACCCCGTAACTTCGGGAGAAGGGGTGCTCTATTAGGGTGCAAGCCCGAGAGAGCCGCAGTGAATAGGCCCAGGCGACTGTTTAGCAAAAACACAGGTCTCTGCAAAACCGTAAGGTGACGTATAGGGGCTGACGCCTGCCCGGTGCTGGAAGGTTAAGAGGAGTGCTTAGCTTCGGCGAAGGTACGAATTGAAGCCCCAGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTAAGTTCCGACCCGCACGAAAGGCGCAACGATCTGGGCACTGTCTCAACGAGAGACTCGGTGAAATTATAGTACCTGTGAAGATGCAGGTTACCCGCGACAGGACGGAAAGACCCCGTGGAGCTTTACTGCAACCTGATATGGAATGTTTGTACCGCTTGTACAGGATAGGTAGGAGCCGAAGAGACGTGTGCGCTAGCATACGAGGAGGCAATGGTGGGATACTACCCTGGCTGTATGACCATTCTAACCCGCCACGCTTAGCGCGTGGGGAGACAGTGTCAGGTGGGCAGTTTGACTGGGGCGGTCGCCTCCTAAAGAGTAACGGAGGCGCCCAAAGGTTCCCTCAGAATGGATGGAAATCATTCGCAGAGTGTAAAGGCACAAGGGAGCTTGACTGCGAGACTGACAAGTCGAGCAGGGACGAAAGTCGGGCTTAGTGATCCGGTGGTTCCGCATGGAAGGGCCATCGCTCAACGGATAAAAGCTACCCCGGGGATAACAGGCTTATCTCCCCCAAGAGTCCACATCGACGGGGAGGTTTGGCACCTCGATGTCGGCTCGTCGCATCCTGGGGCTGTAGTCGGTCCCAAGGGTTGGGCTGTTCGCCCATTAAAGCGGCACGCGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCCCTATCCGTCGCGGGCGCAGGAAATTTGAGAGGAGCTGT
CCTTAGTACGAGAGGACCGGGATGGACACACCGCTGGTGTACCAGTTGTTCCGCCAGGAGCATCGCTGGGTAGCTATGTGTGGCAGGGATAAACGCTGAAAGCATCTAAGCGTGAAGCCCCCCTCAAGATGAGATTTCCCATTTCTTCGGAAAGTAAGATCCCTGAAAGATGATCAGGTAGATAGGTTTGGAGTGGAAGTGTAGCGATACATGGAGCGGACAAATACTAATCGATCGAGGACTTAACCAAAA\n>URS0000CB5B26 rRNA from 1 species \nAATGGGGGAAACCCTGACGCAGCAACGCCGCGTGAGTGAAGAAGGCCTTAGGGTTGTAAAGCTCTGTCATATGGGAAGATAATGACGGTACCATAAGAGGAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCGAGCGTTGTCCGGATTTACTGGGCGTAAAGGATGCGTAGGCGGATATTTAAGTGGGATGTGAAATCCCCGAGCTTAACTCGGGGGCTGCATTCCAAACTGGATATCTAGAGTGTCGGAGGGGAAAGTGGAATTCCTAGTGTAGCGGTGAAATGCGTAGAGATTAGGAAGAACACCAGTGGCGAAGGCGACTTTCTGGACGATAACTGACGCTGAGGCATGAAAGCGTGGGGAGCAAA\n>URS0001773291 rRNA from 1 species \nTACAGAGGTCTCAAGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGCGGCGCGGTAAGTCGGGTGTGAAATCTCGGAGCTTAACTCCGAAACTGCATTTGATACTGCCGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCGGTGAAATGCGTAGATATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACGCTGAGGCACGAAGGCCCAGGGGAGCAAACGGG\n>URS0001DB2352 tRNA from 1 species \nGCCCCAGTAGCTCAGCTGGTCAGAGCGGTAGCCTTGTAAGCTACAGGTCCCGAGTTCAAACCTCGGTTGGGGCT\n>URS0002395A25 lncRNA from 1 species 
\nAATTTGTTTGGTTATTACCCTCTTTATTCCTTAATTTCTCTTCCAAGTCACGTACAAGAGTTGATACCTCCCTGGTAAGTACTCCGACATGAGCCAAGAGATCAAAAAGTTTGTCATGATGAATAAAGTCCTTGGGCATATCAGAAAGAATAAGTAATAGGAACTCCATCATGACATGAATGTTTCGAGCCCCTGAAGTGCTAGGGTGAATAACAGTTATCATATGCTCTTGTAGTTGAATGATATATTCTCTGAGAATATCCGGTGAGGTTTCCAGGAGCTTCTTAATGAAGCGTCCAACTTCTGCTGAAGTTGAAGCTTTCAAGTTTGTATAACATATGTGCATAACCTCCATTTCAGTCGGAACAATCTTCAAGAGTAGCTGGAAGAGTCGAGAGTCTCTATCATTCTGATCATCCTCATCTGAGTCTTCATCAATCTGATCCTCCCAAAGGAAGTGTCCTACTCTTTCAGCCATCAGTTGAAACAGAGGTAAGACATTCTCAACCGTCTCATGCTTAATGCAACCATTCACTATCAACCCATGGAAGTCTCTTATGTTGCCACATACATTCTGAAGAACTTCATATTGAGTCACTTCAGGAAATATCTTTTCAGCGTGATGCTTGGATAGATGATACAGATTCAAGAGGAGGAAGTCCAATTGCTCATCCATCATGGTGGCATCTGATTTATAAGAACGATGATACAAGCTGATACAATCATCCATATTACTAGTGAGGCTAGTAAGGACATCATCATCCAAAAGTGGTTGAAGCAGATTCTCAACCTCTTGTCTTTTTCTCGTCATTATATCTTCAAACTGCTCAAAATTGGAATAAGAAAGTTGAACATATGTACAAATAAATGCCATTTTCAATTTTAGATTTTCAACTTCATCTTTGTCAAGAGATTTTTGATTTTCCTCATTCTCTAGGAAAACCAGAACATCGGCAATGTCCTTGTTAAGAGCAGAGAATAACACCTGCCAAAATAATACATTTTAAAGCCACATATCTATAATTCAATACTTTACGGTTTACTCTATAAAATAACATACCAATGAGTTGTTTGCTTCTTCATTATCTTTTCGTTTTTCCATGATTCTACTTTTTCTCTAGACCTGATGAATAAAAAGTAGATAAAACTTTAACAGGAGAAAGAAGATGAAAAGATAAGAATAATCAATAATATCACTATTTTCACACATAGTAATTTTAGACTCGCACAATTGGAAATGTCAATCTTAATCACACATCAAAATGTTTATGACATAAAATCACAAACATAAAATCTCACAACTGTTAAGTAAAATGTCATTAAATTAATAATCTCTCTAATAATATTTTTCTCCTATCTCCTTGGGCTAATGGAAAAAGATTACTCTTTTATTTTGATAAAAACTAGTCTTCGGAACTTGCATCGCACGTCTGTCCCCTAATTGATATTAGTAAATTTTAATTTATATAGCTATGTTCAAATGTATGTCCTTTCATATGTAAGTTTAACATAAGAATTTAACTTTGCACAAAGTGTAACATGAAAATCTTGTGTTAGATGTTGGAGGTCTGATATATTAAATACTTCATGAAAAATGAACATTTATTTTATCAGAGGAATTAATATATTTTAATTATTAAACATAAATTTTAATAATCAAAAAAGAAATTGTCTATAAAAAAGATACGTATAAAGAAAAATATTACAAAATGTTTGGGCGGTATACCATCAAATTTATAGAAAAAATTAAAATTTCAAACGAAAAAAAAAGAATAAATAAAGACGTCGCATCCATAAAAAAAGACATCACATTTAAATATATAGACAAAATATTTTCATACTAATTGAATTACATTTTGTTAAAAGTAGACTTATTCTAGACAAAACATGCCTTACTCTAGACGAAACATATCATATGCATAAAAAACTATAATCATATATAATAATAAATAAGACAAACAGAAAAGAAGACATGAATATGTTAAGAATAAAGATAAA
TTGTATTTCTTGAACTATATATATATATATATATATATATATATATATATATATATATAAATGAATTCTAAAATAATATTATTCAATATATCATTTAGTCATTTTTTACTATACATTATTTTATTTTATTTTTTTACTTTTGCACTTATTTTGTACCTCTCTATAACAATTAAGTGCATGAATTTTTTGAATATTTGAGATTACATATAAAAAGGAAAAAGTACAAATATGTTGGTTTAAAAAGATAAATGATTATCAAACAATGAAAAATACATAATTATTATTCTATGGGATTTAGCATGTTTACCCTCAAAATAATTAATGATAAATACAAAATGTGATTAGCTTTATTATATATATCCTAAAAATAGAAGAAAGGATGAATACAAAAATACAGTAATTAACTACAAAGTTATATTTAAAAACTCAAAATGATAGAGATGTGAAAAATAAATATTTACTTACAACTTCATGTTGGAGTATATTCATCTTGTAACTATCATAGTTTACATATTCCTCAACAAAAAGAAGATGAATATGTATGAAATTTTAAAGGATTAAATAAAATAGTAAGAATTCTTATATTTACAAACTGGTAATGAAAATTTTACAAGGGAGGTAGACTAACCTACTGTAGTATGCGAGATGATTATAAACTTGAATAAAATAAGGAATATATATAATGTGGTGTGAGCGTGTTTGATAGACTCTTCATTACCCCCCACTTATCTTACAAATTAAAGTTGAAAGGTTATTAGACTCTTCATTATCTACATTTAATTAGTACATGAATATATGATGCATTAAGATCTTATTTGACTTAATATTTAATTAATTAAATAGATATTAATATTAATTTATTTTAGAGGTAAAATAAGGTTAAAATGATAATTCAACTTTGAGGTTAGAAGCTTCTCACTTATAATAATAATATATGATAATAGTAAGATTTTTTGTGAGAGTAGCTGAAATAGAATCAATAGAGATCTCCGATTAAGCATGTTCATACCTTTTTGACATATTTTTGTTAGACAGGTTGAAGTAAGAGATTGAAGTCTAGATCTAGAATTGCAAGATTAATAAAATACAATTCATTGACTTCACAAGTCCTTTAAATACCAAAAGTGCTCACTTAATCATTAAGTTTAGCAAAGAAGAAGATGGTACCTTTACACAAGCTGAAGTTTAGCTACAGAACCCTTTGTTTGAGAAATAATGCTGAACCTATTGGAGAAAAAAACAAGTGTAGTAGTTGAAATATACAATACAAGTCTTTTAGTAATGAAATATTAAAACACAAACCCATAAGTCTTTTTTTAATCAATGTCTTTTGTCTTTCAATTTTTATACTGGCGAAGATAAAAACAAGTGGTTGTCATTTCATCAAACACATTGAAGACATTGGCAATTTCCACATTATAGAATTTAATACAAAATATCAAAACATGAATTCTTGAAATGGAGTATAATAATTATTTTCTTCACAATGAATATACGTACTATATGTGTATATGTTCAATATAACCGGAGAAAACATTGCCAGAAAAAATAAATAACAGAGTTTAAAATATGTACTCAAAAACAATAATTAATATCATAAGTATAAATTAATGAGGAAAAAAAATTATACCGCGATACGAAAAAATAGAACGAAAAAAATTGAGTCCACTGAATGCACAATGTCCTCTTAAGGAAACTACTATTTCCCTCCAATTCCGAAAATTTAAAGAATTACATCCTCTTAGGATGAACGATGTTATTCACCCATATGGGTTCGGCTCTGGTGGGCGCCCACCCAGTGACTCTAATTCCTAAATTCGTCTATACTGTCAGTAACTCATTCAACAGCATCAAAGTAAGTACATGAATATTTAATTTTGCAGAAATAAAAGAAAATGATTATAATTGTTTTTTGTTTTAAAATAAGGGTGTGTAGTATGAAGGAAAACATTTCTCGGAAAATATTTTTTCAATTTTCTCATATTTGGTTGGATGAAATC
ATTTTTCTCAAATTTAAAAAAAAAAAAGACTTCCTTTCCAAACTTAAGGAAAACATTTTCCAAAATTCTTTTCTAACCTTCCCCTACCCACCACCTGCTAGCCCCCCACCCATACCCCTAAAAAGTTTAAGTTTAGTTTTTTAAAATATTTTAACTTCACAATTTCTTTTTTTCACCCCTACCCTCGACCCCCAACCCACCCCCTACCACCCCCATCCCCAAAAAAAATAATTTAAGTTTGTTTTTTAAAAAATATTTTAAACTTAAAAAATTTATTTTTTCACCCCCTACCCTCGACTTACCCACTCCCTACCAGCCCCCCTCCCCCCACCCCCCCACCCCCTCTTCAAAAAAAAAGTTAAGTTTGTTTTTAAAAAATATTTTAAACTTCAAAATTTCATTTTTTCACTCCTACCCTCGACTCCCCACCCCACTCCACTAGCCCCCTACCAGCGCACCCCCACCACGAAAAAAAATTTTAAGTTTGTTTTTTTAAAAAAATAAATTCAACTTCAAAAATTATTTTCTACTCTAGTAAAAAATAAAGATATTTCTCAAAAGTATTTTTCATTGAAAAAACAAACACTAAAATATTTTTCTAGAAAATATTATCTACTGACCAACCAAACATCAGAATATAAGTAAAATATCTACCTGTTTTTCAGAAAAACATTTTCCAAGGAATTTCCATCATACCAAACACACCCAAGAGTATATTCCTCTATTTATAGACAACAAAAGGTAATGTGAACAAATATTTATTGTGCCTTATTAGAAAGGATAGAACTATTTGTAAAAATTGCAACCCTTCGGAAAGTTTATAACGTTTCATAAAAGTCGCAACTCTTCATAAAAGTCACAACTCTTCATTAAAGTCGCAACTATATACATATATACAAATCTTATAGGGATGAACAAGTTTGAACAAGTTTCAGTTTTGTAAACTATCTTGATCTTCGATTAATTTCACGGGATATATAGATCTAGATCTACATGTACAAATAGTTTATCTTCTTTTTTTTGAAAGAATTTTCTTGTGTATTATGTACGAGTATAAATATACAGGAAGAAATGCAAAATTTTAGCACAATATGAAGTGTCTAATCAATCTTGATATTTAAGCACCCAAATTCAGTATTTCGCTTTGATAGGTTCATAATTAAGAATCAAAATAATAATAGAGACTAAAATAAAATTCATTGACTTTTCAAGTCTTTTTCATCAATTTTGTAAATATGTATATTCATATTACAAGTTGATAGACTTGTGGAGATTGTTAATTAGCTTGTGAATGAAGATGATGTGTGTGTAGATCATGGATTTGAGCCACTAATGTTTCTATACTAATGTTGGGTGTAGGCTGCGTTCTTGTTAGCGGAAACGTGAAATTAAAGAATAAGGAAGAACAATAATGAAAATAAGAAAAGAAGAAGAGAGTTTTGAAGCATGAACTAATTACCTCTGCAATATTAGAAGCCCTGCTCCTTGTTTCAGAAACAGAGTAATTGTTTGCCAAATGATCCAATTAATGTAGTTGAAACAAGATCTGGACTTTATTATTATTATTATTATTATAAGTCTTGTTATTCACATAGGAAGATTCCTAAATGAGATTATTAATTCAACTGGCTAACAATGAATTAATTACTTGAAAGGCCAACTTAACAAGAATAAAATATATATATATATACATCTTGACAGTTTGTTCATTCATAATACTAAAATACAATTCATTGACTTTTGAATTATACATCTATCATCTTTTTGGTGCTTCTAATTTTGAGTGACAACGACATTATCATATGTTACTTTTCTATATTACTGAAGTGGAAAACTCCAAAAGTTAATTTTTTTAAAAAAAATAAATAAATTCCATTTCCAATTTTTATTTTTTTTTAAAAAAAGAACATCCTTCGTTTCAGAAAGAATGATCTAGTTTGACTTGGAACGGAGTTTAGGGAAAGAAAGAAGATTTTTTAGTCTTGTAGTTCTAAATTAAA
ATTATGTCATATGTACCAAAATGTCATTTAATCTTATGGTCTTAAACATGTTACATGAAAAATTAAAATTAAAATATTGTCAAAAAAGGAAAGGTGTCATTCTTTTTTAAACAAACTAAAATTGAAATAGGAACATTCTTTTTTAACAAGAATAATATATATATATATATATATATATACTAGTTTGTGAGGACGTGCTTCGCACGTGTGTTTCATGTGACTTTTTATAGATACGTTAGAATAACTAAAATCTCATGAAAATATATATATATATATATATATGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTATGTATGTATGTATGTATGTATGTATGTATGTGTGTGTGTGTGTAAATTGTAATGAATAATAAAATGTAACAACTACAAAATTAAGAAGTCTAACAGAGTAAAAAAGATAAAAAGAAACACAATATTTAAGAAAAAAATACAATATAGACATTATTCTTATAAAATTGATGTATATATAGATGAAAAAATAAGTACAAAATTAGTACATAACTCTTTTAGAAAACTAAATTAAGAAGTCTAACAGAGTAAAAAAAGATAAAAAGAAACAGAATATTTAAGAAAAAATAAAATATCGACATTATTCTTATAAGATTGATGTATATATAGATGAAAAAATAAGTACAAAATTAGTACATAACTCTCTGAGTTTTTATTGATTCCTTTCATATCCTATCAAAATTCAAGAATCTTCATCATCTGTTTTTACTATAGAATAAAAATAATATCCTAATAATCTTGGTAGGGTTTCATGAGATAAAGAAGTTGAATTTATATAAACAGAATAGAAGGAATATCAAAAGATATCTTAAAGTTTTAGTTTAAATATTTGGAAGTTATGAATATGAAAAGATGAGAGTTATGAATATTAAGAGTATAAAAGTTAAATAAATAATTAGAAAATAATAATAAATAAATGAAAGAATATGAAAAAAAATTAAAGTTAGCAAACCATGTAAAAAGAACAACTAAAGTTCTTATCATGTAATTAAGCATTAATGAATTTAAATTTGTGAAGCTAGAGTCATTCTTTAATAATAATTAAGAGGACATTATTAAAGTGCATCTCCATTTTATAGATTTGCACCCTTTAAATTATTAAATTTAGTTATTTATCATAAAGGATAATACTTTATCCACAATTATATTATTCATGAGAGGGGTTAAGAAAAAAGTTATAAGAAAAGGAAAAGAAAAGAAATTTAGGTAAAGATTTTTTCTAAAAAAAATTATAATTATTATATACACATAGATTATAGATGATAAATATTAATAGATTAGATATTTAATTAGTAATTAATCTTAGGAAGTCCAAAAGTCATTAACATTTAATTAAATTTATACAATCAAATATTAAATATTTTATAACAATTTAATTTATAGTAAAGGTAAAAGCGTAATTCAACTTTCAACTTTTTTGTTCATGCTTTTAGTAATATATGATATATATATTGACGGTTTGTTCATTCATAATACTAAAATTCATTGACTTTTGAATTATACCTATCATCTTTTTTTGAGTTACCAACGTCAGGGGCAAATGTATATTGTCGAGACATGAATGATTTGGCTTTTAGATGAGATGGTCACATATATAATAACTTTAGGATCCACCCGAACCCAATGAGTCAATGACGATAGATTTTTCCTGTAATTAACTTTAAGGTTGATGAGGTGAAAGGAAATTTTACTCATTTCTACTTAATAAATTCAGTTGAGACTTTTATCAAACACATCTTTTAACATTAGCGGTTTTCACTACAAGACTTGATTTTTAAGCAGCAAAAATGGTTACTTATAACAATAGAGAACATGTTATAATGCTGCTGTCACTTAAATTATGCTCCATAATTTTCCTTTTTGATTTTTGTTAATCATGCTGACTGGATTAACTTGCACACATTTCAATCAATTTCACAAGATACCGTTCACTTTCAATTTGCATGCACTTTGACTAAT
TTCATGCTTAACTCTATTCGTCAAAGACATGGATAGATTATAGAAAAAAGGCAAAATACATAAATATGTCCTATTAACTTGACTTCAAATAACATTTATGACCTTCAACTTTGGGCATGCACAAATACACACTTAAACTTGTATAAAGTTTATCAAATAAACACACATGTCCTATATGATATCCTACATGTAATTTTTTGTCCTACGTGGTGTCCTGTAGGACTCGTGTGTTTATTTGTTCTATTTTATATAAGTTTAAGTTCTACTTGTTCATATTCAAATTAAAGTTGGAGGACATAAACGTAAAATGAGGTCAAGTTAAAAAGTACATTTATGTTATATGCCAATAAATCACCCTTTTCTTGCTGAACTGCATTGCTCGCTGCTCATGAAAGAGTATTAATTTCTTATTTTCCATGCTATGTATGATCAAATTTTGGACTATTTTGATAAAATAAAAGGTAAAAAAAGGCTCAATATGTTGAATATTTTTGGGTGTGGAGACGACGGGGCACTATCGATTTCTCACAACTTGAATTTTATTATATCAAAGTAAGAACCCGATACAGTCTTACAATCTTTACAACACTTGTTGTTTTCTTCAGCAACACTCTTTACTTGAGCATTCATTCTTGGTTGCTCTCTTGCTTTTATTACTTTGTTCTTGCTAGCTTGCCTACAACTCAAATGGACCACCTCTATTCACAGGAGGTGATAGAACAATCTAGCTAAACATATTTTTCTGCTATATCATAGAATATTCCTTTAATTACTTAATTCTAGAATTACCCTATCTAGAATACTAGTCTCTCTAGAATACACATTTAGAGATCTTCCTCAATTCTCCATAACTCCGGAATATTCTAGATTTTCTTGACTTGTCTTGAGTACATAATTAAGTTGGCGATGAATTCTTTAAAAAATATATTATCGAATTTTGAGAAAAAGTTTATTTATGTAGCTTGACTCATTTATGTCATTGTCGTTTGAGAAAAGACATATTCATGCTATTATTTTTTAGGCATATTACATGAATATGCCCTTTAACTTGATCTCCTTTCACATTTATGTCCTCCAACTTTGAATGTGCACAAGTACACACTTAAACTTGTATAAAATTAAACAAACAGACACAAACGTCCTACTGGCATCCTACATGAAAATTTGTGTCCTATGTGGTGTCTGTTAGGATTGAATTCACGCACTCACACTTGATGAATGAAGAACACAAGAACTTTCGAAAGAAAGAGATGAGAGATCTAGAGAGAGAAATATAAAATCCAATATTTCGTGGTAACACCCCGTGAGTAAACTTCCACGGTGGTGAGGTATATTTATATTAATAAATCAGAATATTTTTTATTGCAGAGAATAAATAGTAAAGCCTAAAATTTCCATAACCCCTGGCAATCTCACCGCGGAGGTTAAACCACATAAACAATTATATATATTAATCAAGCTCCACAACCTAACAGTGTCTTGCATGTATTATGACAAGTAGGACTCGTGTGTCTATTTGTTCGGCTTTACACTAATTTAACTGTCTTTTTGTGCACACTCAAAATTGAAGGACATAAATACAAAATAAGACTAAGTTAAATGGTATATTTATGTATTATACCTATTTTTTAATTCCAATTATGCAAAATCATTTTTTAAACCTGACCATTTATTATTCGACCACATCATTAATTTTAAAACGTGAATAATCTGACATATTGTCTTTGCCAATTTATCCTCCCAAATTGGGATGACACACCCAATTTTTATATTCTATTAATTGAGTATTGAGTACTGAGGTGATTTCTAATTAACATAAAATCATATATAAAACTATAAATATAGAAACATGTGAAATAAGATGATTATATGGTTACTAACATAATAAGATATGATTTGTAAAAAAAATTTATACACATCAATACAGTAAGGTTATTTGCTTTCAATTTCTATTACCACTTAACAATGAAATCAATTAATTAGCTATAAAGAGGCATATT
TATGTAATTTCTAAAGAAAAATGGAATTGAGCATATTATTGTACTTATTTTATTATTTAAACCAAAAGTGACAAAACTTAAGGGACTAACTATTATATTTGAAGGGTACAAAATGGATACTATCCCTATACATAAGTGATAATTTTGTCTTAAAAAAGAACTCTGATTATTTCAGTTGCGATTTTGGTAAGCAGAATCTTGATCCTAAAAAGAAAAATACTTCATTATGATTTCTTCATTTTGAAGACAAGTTTGAGTTTGAAATTCTCATCGTGTTTGTCACCTACTATGTTTGAACTTCACCTCATAAGTTAAGTTCTATTTGTGTTTGTCGAACAATAATTGAATCAATGACATCTTTTGCCTCATATGCCACATCTAAAACACGTGGCCAGAGATCCTTGTACCATTCTTGCTCAATATTTCTTATCCATTCGAGGTCTTGTTTCACCAGCCCAACTTCTTCCTTTATCAAAGCAATTGAATAAGCATTGGAATCCAACAAATCATCTAAGTGTCTCTGTAGAAGATGCATGAAGAGAGGTCCATGAATGATAAACATGTTTGAGATAAACATCGTTCTACAACTTGATTTAGAACGATGTTGTGAGCTTATAATCAATATTATCCCTGAGGCTAGCAAAGGACACGATGCATGTCGTATTTACATGCAACGTTGTTGTCAACATAATATAAAATTGATTGAATCAGATTCTCAACCTCTCGTCCTTTGGCAGTCATTACATCTTCAAACTACTCCAAATCAGAACATTTCAGCTTTTCAACTTGATCCACATCAACAACTTTTTGATTTTTATCATTCTTCAATCTCTCTAGGAAATCCAGAACATCGATAATGTCCTTGCAAAGAGCAGAAAATAATACCTGCGAGAATAACACATATCAAATTTTTAAGGCCACACGATATCTACAATTCAATACTTTACTCTCTATCAAATACTAACATACCAATGAGTTGCTTGCTATTGTCGTTTTTCCATGATTGTAATTTTCCTTTCAAGTTCTGCATAAAAAGTACACACAAACTTTATCATGTAAGAAGTCACCCTGCTTCTCACCTAGTAAGAATTCACACTTACCGGATGTTTAATACCAAACTAATACAACTTATCATGGGTAGGTAATGATTTAATAAGGTGAATATAAACATTAACTAATCATAATTAAGTGATAATGTTGTCAGTGACGGAGTCAGAATTTTTGCCAAGAGTGTTCATACTTTAGGAAAAAACAGAATAATGAATAAAAAAATTGTCACACTTGGGCTCGAACTTGAAGCTAGAGGTATTCTTGCACAGCCTTAACTGCTGGGCTGACAACCTTTATTATGTCAAGGTTGTTCAACAATTAGTATATATCTAAAAAAAATCGATATTTAGTATATATTCGGAAATTTTTTTTGATGAAGGTTGTTCATCTAACCAACCTTGTCAAGCTATAGCTCTGCCCTGAATGTTGTGCATCTATTGATTTGTTGTAAATCGATGGTGTTAGTACGTATTTAATTCTCTCTCTTTCTCCTGCATTTTGTTTCTGTTTATAGATTTCATTTTCCTTGCATCATTTTTTACTTTTCGATAATTTTACTTCAATAGAGATGAGAGTAGCAACCTTTTTACTTGATGATGAAACTATATATCCTTTGCTTGCTTTGATATTAGATTTATAGTGCTCAAAATTCTTGAAGTAAACAGAATACGGTGAAAGAGAGTGAGCGCACTCTGCCTACATTCTTGTTCTTCAGGATATAACAATTCAATAACGTCGGTATAACTCAAGAAACTTCGAATTAATTTAATAGTCCAAAACTTCACAAAAAAAAATATTTTTCTTCAACATATAATTATTCTCTTTTATATAGTGAATATAGTCGAAGATTTTAGAGTATTTTTCTTTGTCTCGACTCTATTTTCACTATATTAATCTCAATATAAACACAATGTAGTATTCCTCGTCTTTTTCACTCCACATTTTCTTGT
ATATCTTTTGTTATCAAAACAAAGTAAGACCATCACTATTCAATGGTGATACTTCCTTGCAATAAATAAAAAGATTATAGAATAGTAAATAAAGTAAATAAATAGTCCAAAAGTTACACAAATTACAAACATAATGTATTCGAATAATAACATTCAAAATTCTTCTCTACTATATTAAACTTTGTTGTTTGAAATAAAGTCAAACCTTAAAATTTTGTGGATGCAAAATTCTAAAATTTAAAAATTACAGAGTACTAAATTAATAATTTTTATATATTCAATAAATTTCTTACTACAAATTACTCTTATATTAGAAAAGGCATGTTCAACATGCCTGCTTCATAGGTCTGAGGGTATTTTAGTCTTTTTAGTACTCCATTCTGGCTACGTGTCCTGTTGTTGTGCTTTCAATGTACACGTTACTGCAGACTACCGATACATCAAAAGTTCTCCTTTCTCCAGCATTCTGTTGAGGTAAGCTTCTTCATATGATTTCTTTGGTTTTTTTGTGATCTTCTTTGTTTTCCTCAAAATTGATGATTTTTTCTTCTTTTTCAGTTGGTTTTAGTGTTGATGTTCAATTTTTGTTATGTGGTTGTGTTTTTCCTGTTTAATTACTGATTTTTGCTTTGTTTATTACATGCAACAATTAATTTAGTCTGTCTTCATCATAATTCTTTTGAATCTTATCTGTTCATAGATGGTTCTTTGTCGAAATTAACTTTTTGGGTTCCTTAATTCCAGTTGTTTTTTCCATCATACTTCTTTTGGACTTCCTCTGTTTGTATATGTTGGTTTTCCATTGGAATTAACTTTTTGGGTTTCTTCATTTTAATCATATACTGTTGTGGGTTTCGCTTCGAGTTCTTTTTACATCATTGCATTAACTTTTTGAAATTATTTTAATTTACAGTGTGAAAATTTAAAGATCTGCAACTACTTATGCCAGAATTTGAACTATCGATGTGTCTTCTTAGCAAATTCAAGGATCTGGAACTACTTATACCAGATTTGAACTACGGGTATGTTCGTTGATGGTTTCTTACGCCCTTTATTCCGATTTTGCTCTTTGTCCTACATTAGATACGTCTATGAGCTTTCTTGCTAAAGTGCATCTTCATTATCTGAGTTGTGTGTACTGAAGGACCTGAGAGAATTAGAGAACCGATTATTATGGGTGCTTCGTTTGGTCATGGGGAGAAAGTCAATCTGCATCTAGCCAGGGAAGCTGGCCACTCCTATTGCCAAATTGTCCGTGCTGCTAATATGAGAGTCAGAGAGATAGAAAAGGCTCTTATTAGAGGCAATCATTGAGTATCCTACAACACACGTGTTTCAACACCATTTGCTATAGATTTGTTGACCAATCAAGTAAGTTTATTCATTTATAGCAACTGTTTGTGTTGGTTATTATGGAGAAAATTTTCTGTTCTAGCATCAATTTGGTCTGAAATGAAGGGTTGTTGCTTTAATCTAATCAAACTTGGAATTATTCTTTTGCTTATGTGTCATAGTTGATTCGAATGACATGCATTCAAACAATTGCTATGTTGTCGATGTCTTAAAGATATTCATGTATTATGATGTATGAATTTGTGTAGGTGCACTAACTATGATTCTAATGATGTATAAATGACATTTAACGAAGTTTCGACCCGACTATATGTGATCTGTATGTTGTGAATATTGTACAATGATTTGCATATGCTATTGGTTATGATACTTGACTTCATATGCATACCTGAAAAATATTAGATCTCACCTATATAAGTGCTCCCAAAAGCTCTATTAATTGGCAATATTACTTACTATTATTGTGTCTTAAAAATAAATTCTCAACAAAATGGGTTTTCAATGAGTTGTTGAACTTCTGCTTGTCTTACATTTGTATTTTCCTATTGGCTCATTTGTTTTTTTTAAAAAAGATTCATTGGCCTGTTCTGGTGAAAAATATTGTCAATAACTTAGAGCTATTGGAGTTAGCAATTTCTTTATTGAAA
AACTGAAGATCTTCTCGAAATAGCTCTTATTACTCTTTTTATTAATCAAGTGGAGTGTCAATGGTATGATCAAAGAGAAGGTAATTGTATATGACGAGAGCTGATACATGAAAAATGCATTTTTTGAACTTGTCAAGTCTATCAGTGAGCCAAAATTGTGTTGTTGTTGTAGTTATAACTTATTATTCATTACAGCTGCATATAACTATGGCTATAGTATTATTGATGTAGTTACTTTGTGAAGAAGGTTGACTCATCATCCAACTTTATAGTGATAATTAAACAAGTTTATTTACTAGCTCTTCCTTTTGATTAAATTAACATAATTTTTTGTGTAGTTGTCCATATTAATTTTCAGGTTTTGTAAAAAATTGCATCCTTTATTTTCCTCTTTACTTTTTTTTCTATTTTTTTATTTGCTATTTGGATATTAATTGTTAAGTGTTAATTGCTATCATTTTTTATGCTATGCTTAGTTTGTGGACTAATAGTTCAAAGAAGCTTAGCAGTCGTCCCTATTCTAGAAATTGAATGGTAATTCTATATTTTATACTGTTAAATTTATATATTATCAGCTTAGCTTAGTAGGAGAAAGTTACAACATGTGGGAAATGAAAAGGCTAGAAATACTCAAAAATGAACCAAGCAAGTCATGGCTTTTGTTGGCTTCTGCAATAGGAATGAGATTACTATGCTAAAATAGAAAAATGAAGACCCCTTTGTAGAATGCAACATCATTATTTGTTCCTTGCATAAATAATCTAGCCCAAATTTTTTTGTTCCTTGCATAAATAATCTAGCCCAAATTTTTTTGTTCCTTGCATCAGTGTTATTATCCATGCTCTTGAATAATTAAAAGCATAATAGTTGCTCCTCTTTTTGGCACAAAAATACTGAATTCATATTATTGTGAGTTGTTTTTAGGAATATTATTAGTTGGCGAACAAACAATTAATTTTTGTTCCATATTTTCAAGACATCCATAAAGTTTCATCCCTTTAGAATATTGAAGGAAAAATATATCGCTGAGACATTTATTTGTTAAAGTAATTCATGGTTTGTAAACATCTTTTATTGAACTTGAAATCCTAATGTTTCTCTATTTAATTAAGGTAGAACAAAAAATGAGAAGGTATGTGCAGGTTTGGACAATGCGATGAGATGTGTTGTAAGAGTCATGTTCTGAAGGATTAACAATGGAGTGTTTATATTGTTCGTGCCCCTGACTCTACTTGCTATGTGAGGTTTGTCATCTCTCCGTTTTATCACTTTGAATTTATTATATGGATGGTTCCTCACTCTTTGAAAGTGTAAAATGTTTTTGTATTGATATTGTGCTGCTGTGACTATGTTTATTGATGCTCTTCTTATGGCCTTTTAGTTTCTATATTTGTAAGGAGTTTGAGATTTTTATTTCAGGGTTTGCCAATTGAGGATTTAGGAGTGCAAATGTATTCTTTCATTTCACAGCTGAGTTGAGCAGTCATATGTTATTGTTGTGCGAAATTCGAGATAATACGTGAAAATATAAACGCAAAAAACAAGACAACAGATTTACGTGGTTCACCAATAAATTGGCTACATCCACGGGGAAGAGAGGGAGCAGTTTTATTATGGAGAGGCAAAAACAGAATTACAGAATAGGGTTTGCCATAGCGTCTATATATAGTGCTAAGCTACGCCCTAACAGACTTGGGCCCAACATACAGAATTGACAGATAATTAAGGGCCCAACAGCGAGACCCCCGTCCTTTCTGTTGTAACGGGTCCGATTCAAGGCATTCAACAGTTATGATTAAATATTTCTATTTCAGATCCTCATACTACTTTTTAAATTACTACTGAAGTTTAGTAATTTGATTTCAGTCGTAGTTACGGCATGAGTGTGTTATCTAATATTTATATTCTATTTTTGAGTTAGTTTTTTATGTTAGTTATGTTGAAATTCATTTTATTAACATGATATTAAAATTATACCAGCACGTCCATGTTGTGTGATT
TTCAATATTTATCGCCCTGCTGTGTTGGTGTGATAGGGTGTCTCCATAGATTTCCAGAGTGAAATGTTGTCTACAAATGATGGATAATAATATGCTGCGGCAGAAATGTTGAAGTAGTATATCAATTTCTTGCTCTTCATTATTAAAGAAAAATTAGTTAAGTAGTTTCCTCATTTAAATTTTAGTTGTTTAGTAATAATTTAGAATGCTAATACAAACTTTATACTTGCTTCACATGATGAGGCCTCAACAACATTGGTCTATAGAGAGTTCGTTTCAATGGTTTTCAACAAGGTGTTTAATTTGTTCCTACTCTAAAATGAATGTGTTAAAGGAAACTTAGACTGAATAAGAGGTTAGACGTATCTTCTCTTAGAAACACCCCTAAAAATTCAAGTTAGTGAGACTGACAATACTATCTTTGATTTGTAAATCAGTTTACTTTATTAGTGAATCGTGAATTTGTGATTAATAAGATTTGTAAATCAATTGTTCCAAGTAAAGTATAAAGAAACAATTTATATGCTACCAAACTTTGAACCATGAACTCCTCAAGCCATGTGTTGTGAAATATTGCTTTTGAAACTTTTGTATGTTGAAGTGTTTGTAACAGATGTAGGATGTGGACATGCTTTCTTCTCTTTATTTTTCTAGGGAAGTTGAGGCAGAATCTGAGAGTGAGAAAAAGCCTAAACAGATTTAAAAACTATTTATTTATTCATCATGTAGACTATTTAATTAAAAAGGAATACATCTTTAATTAAATGTAACTAAATCTGTTAGAACAATATCTAGGAGAAGAAGCTAAAATAGAATACAATAGACTACCAACTAAAAGGTTATACCATATAGAATTAACATCCTCTAAATAAATCAAAGTTACATAAGTTAGGAATTCCCTCTCCCAGCGCCAAAATGTGAGTCTAAACCTCTGTCTCCTACAATTTTATCTAATATTTAGTGTTAGTCCGCCTAAAAGATAATGAAATCCGCAGATTTGAACAGACCATAAAAGTTAATCCTGATGATGATGATGATGATGATGGTGATTCCAACACGGAAGACGATAGGGATAACAAAGAGAAGGCTGAGGAAGCTGATGATGGGAACAAAGACCGTAGTAATTGTAAGAGTGATCCGCTTATCACAGATCATGTTAGAGTCCTTTGGATGGATGAGTCTGAGTCTACAGAGAGTAGTAATAATGTCATAGTTGTCGATAGAGGATTTCTGCATGGTGATTATGTTGCTGCAGCTTCTGATCCAACAGGTCAAGTAGGACTCGTGGTTGATATCAATATATCTGTAGATTTATTAGCGCACGATGGCTCTATTTTTAAAAATGTCTCATCTAGAGAGTTGAAACGTGTTCGGGGTTTTACAGTTGGTGATTATGTTGTCCTTGGCCCTTGGTGGGGTAGAATTGATGATGTTTTTGATAATGTCACAGTGATGTTTGATGATGGTTCTGTATGTAAAGTTATGAAGGCTGACCCTTTACATCTTAAACCAGTTGGTAGGAATGGCCTTGAAGATGGACATTTTCCTTTCTATCCTGGTCAGCGTGTAAAAGCTAGCTTCATCGTCAGTTTTCAAGAATTCCAGATGGTTATCTGGCTCATGGAAAGCAAATAGGTTAGATTATGAATTCGACTCTGATACGTATATTATTTGGTAGGTCATTTTCTATTGACAGAATTATTTATATATATATATATATATATATATATATATATATATATATATATATATATATATATATAATTCAAAGAGTTATGTACTAATTTTGTATCTATTTTTTCATCTATATATACATCGGTATTATAAGAATAATGTCTACGTTGTATTTTTTCTTAAATCTGTTTCTTTTTGTCTTTTTTTTCTCTATTAGACTTCTTAATTTAGTTTTCTATGAATGTTTAATTACTGTAAGTCTTTACACTTATTTTGTAACCAGTTTCTGATAACGTGCATTGCACATTTGTCCCTTACGTTCATTA
CAATTTTTTTTATTTATTTAGAAGTGAGTTATAAGATATTGATATTGAAATTAACAATATTAATTTTACTATTTATTTTTTATTGATTAAAATAAATCATAAAATAGAATGGTGCATTTGCTATCAAACCAGAAAATGTGAATCATGACTTAAAATGTCTATGAATTCGTGATAGAAAAATAATAATAAATGTATCTAATGCCTTTAATGAAAGAACAAAGGCGCGAGACAAATTTATCAGAAATATAAATTTCAATTACACATTTTGCATTTTCTATAAAGAACATAAACATCGAAGCTTAACGACAATATGATAAGATTGTCTTGCGAACACAATTACTTGTGATAAGTCCATGGGTCTATATATGAGTATATTCTGATGATATGATGTTTCAGTATTCATGAAAAAATCATCACTCTATTCAAATAGTAAAAATAATTAATATGTTTTAGTTTTCAAATTTAATTTTTAATAAACAGAAAATAAATTAACAAAATAAAAAAAACAGACGAACCAATAATAACATTATAAACATGCTTATGATGAGTCATATATAATTTGAAGGAAACAATACTACAAATTCAAACTGAAGAGAAAATAATATCTAAGACATACTAAGATTAAAATATGTTCTCTAACTAAGATCTTAATCTTAATCACCCATAAATTAAATAGGGAAAGAAAAGACTCTTGTAAAAGAAATGATGATGTATACAATTTAAAAGCTTGTATGTGAAAATAAGAGAATAAATATATTGCATAAAAAAATTATAGATGCGAAAAATACCATGTGTGATTCTTAAAGGTAAAATTATTTTACTATTACCTGTAAATTATATACTTTCATCATATTTATTGTTGAAATTTCACCTTTTAAAAAATGAAAAACAAGCTAAGAAAAAAAAAGTAAAAAGGGTAAAAAGGAACAAATAAAGACTAATAAAATAGAGAAAGGAAAAAATCCAGTGAATATCCTGATTGAAACAGCGTTATAGAAATACTCGGATAAATCAATATACCTTGAATTTCAAGAACACTTCAAATTGCATCACATATAAATCTAAGAAGAGACATATTCTACAATAAGAGGAGGGGGGATGGGGGGTTGGAAGAAAACAACAACAAAGAAATAGTGTTAAAAATTTGACACCTTCCAATTTCAAAAAAGAAAAATGATGAAGGGTAGGGGATGCTGGAGGACTATGAGATTTCTAGGAACATAAAATCAGTTTCTCACCGTGTGGTTGTCGAGAAATCGCTGCAGACACCACACTTCATATGTTCTTCATGATTGTCTTAAAGTCTTCGATTTCTTAACTAAAATAACGTTCCTATATCTTCTATACCTTTTGAAATGTATATGAAAATGAAATAATTTACTTAAAGATAAACATAGTTTCTTTATTTACCTGAAGAAAGTCATTATTTCACTTGGAAAAAAGATTTATTACTTTCAATTGCCTTTTTGTTTATCCTATTCATGGTTATTTAAATGTAAGTTTAACTGTTGTCTTTTCATTTATCCTAATTATTGTAATTGAAGTGTGAATTTATTTTTTTCAGGTCATTAAAAATGAAAATATTATGCTTTTATTTTCATATAATGTTATATATATTCAAATAATGTTCAAGTGAAGGGTAAATTCGTAATTCAACTTTGAGCTAAAGGACTTCCCACTTATAATATAACTAGTCTCCGAGCACGTGCGTTGCACGTGTATCCCAAATAAAAATCAATAAAAAAATAAATGAAAACGTATATAATAAACTATTAGGAGAATTATGATGTTTTTTTCGAGTGTTCTTTCGATATTTTCGATCTACTGCACATTAGATAAGTCTCCAAAGCTTCCAAGAAAGACACATCAAGTTAAAGAATTAAAAAGGGAAAATGCGACGTTACTTAAAGTCATCTGGTATCCTTAATGTGTATCGTTACAAATGTAACTACTTCCTTAAAAACTTTCAGATATACCCAGACTTACATTTACAGGCTTAC
AACTACTATCCATCACTGTTAGAGAAGACTTGGAGTTGCTACATTTGTTGAAGAAAATGTGATATATTTTGCTAGCAAACAACTGCAATTTCAATTTATTATTAATAGTTTGAAAGTTTAAACATGGTTTCTTTTCTGTGGGAAGCTATGCGTAGAGAGTTTCAAAGAGAGTTGATCATCATTCAGCATCAAACCATATGTGTACAACAGCATTCAATTTTTGATATGTGTGATTATACCTTTCAAGCTATTTATTTTACCTATTAAAAAAATTAGAAAGTTATCATTCAAATGAAGTTAGCAAATCAAACGAAAAAATCTAGACTTAATAAGATTGTACCTGAAAATTAGAAGACATTTTTGTACCCACTTAACAATGGAAGCTTGTGTTGAATGACTAATATTGAGTATGTTTATGTAGTGTAGTCTTGGAGATTTGTTGATAAAAACTCTTTGATATTCCTCAATTACTTAATTTGATCCTTTTCAACTTCTCATAATTAGCAAAATACGTTTCAACTTCTATATTAATTGAAACTTTATTAGTGTTCATCCTATTTGGTTGTTTCACACATAGTAATTGAATAGACTGTTGAACTTCTTATTTTGTTCCTTTATTATGTAATTCAATATTACTATTTAATTAGATATTTAATTTATATTTGGGAAAAGTATTTTATTACTTTTTAATTTAGTATAGGGGCAAAGTAGTAATTCAACTTTACACTTTAGAGCTTCATGCTTATAATAATACTAGTTTCTGAGGACGTGTTTCGCACGTGTATTCTATGTGAATTTTTATAGATATGTTATAATGATAAAAAATTTATGGAAATATATATGTAAATTAATGAATAATATAATTTAACAATTACAAAATAAGAATAAAGACTTACGCAATAAAACATTCATAAAAAAACTAAATTAAGAAGTCTTATGGTGATAAAAAAAAAAGACAAAAAGAAACAGATTTAAGAAAGATCCAATGTAAAAATTGTTCTTATAAGACTGATGTATGTATAGATGAAAAATAAGTACAAAATTAGTACATAATTCTCTGTGTTTTTATCAACTCCTTTCATATCCTATCAAAATTCAAGACGTTTCTTCATCTACTTTAACTATAGAATGAAAATGATAGCCTAATAATCTTGGTAGGGATTTCATGAGATTAAAAAAGTTGAATTTATATAGATAGAATAGAAGGAATATCAAAAGATATATTAAAGTTTTAGTTTAAATATTTGGAGGTTATGAATATGAAAAGATGAGAGTTATGAATATTTAGAGTATAAAGTTGAATAAGTAATTATCAAATAATAATAAATAAATGAAAACTATGAAAAAAGAAGTTAAAATTAGCAAACCATGTAGAAAGAACAACTAAAGTTCTTATCACGTAATTAAGCGTTAATGAATTTAAATTTGTGAAGATAGAGTCATTCTTTAATAATAATCGAGAGGACATTATCAACGTGTGTCTCCATTTTGCAGATTTGCACCCTTTATATTATTAAATTCGTTATTTATCATAAAGGATAATACTTTATCCACATAAATTATATTATTCATGAGAGGAGTTAAGGAAAAAGTTATGAGAAAGAGGAAAATATAGCAATTTAGTAAAGACTTTTTTTTTAAAAAAAAATTATAATTATTATATACATATAGATTATAGATGATAAATATTAATTAATTGGATATTTAATTAGAAATCAATCTTTAGAAGTCTAAAAGTCATTAACCTTTTAATTAAATTTATACAATTAAATATTTAAATATTTTATAACAATTTAATTTATAGAAGGGGTAAAACTGTAATTCAACTTTCAACTTTTTTTGTTCATGCTTTTAGTAATATATGATATGATATGATTGTTACATTTTATTATTCATTACATTTTGCATATATATTTCCATGAAATTTAGTCATTCTAACGTATATATAAAAATTCACATGAAACACACGTGTGAAGCACAAAGATTTATATAATCAAAAA
TTCAAAATTGCTGATTTTCAAGATTATCAGCATAATTTCTTCCTCCCAAAGGAAGTGTCCTACTCTCTCAGCCATCAGTTGAAACAGAGGTAAGACACATTCAACAATCTCGTGATCAATGCAACCATTCACTATCAATCCATGGAAATCTCTTACGTTTCTACATACATTCTGAAGAACCTCATACTCCAGGAAACATCTTTTCAGCACGATGCCTCGCTAGATGATAGAGATTCAAGAGGAGGAAGTACAATTGCTCATCCATCATGATGGCATCTGATTTAGAATGACGATGATCATCCATATTACCGGCGAGGCTAGTAAGGACATCATCATCCAAAATTGCTTGAAGCAGATTCTCAACCTCTCGTCATTATATCTTCAAACTGATCCAAATCGGAATAAGAAAGCTGAACATATGTACAAATAAATGCCAGCTCCAATTTTCGCTTTTCAATTAGATCCACATCAACATCCTTTTGATCTTGTTCATTCTTTAATCTCTCCAGAACATTGGCAACGTCCTTGCGAAGAGCAGAAAATGACATCTGCCAAAAGACCAATCAAATTTACAAAGCCACATTTCTACCCTGCAATAACTGCTGACATGTTATATTTCAGTGCCCAAATATTTGACTTATACTTCCTCGATAGCTAACACATAGTCCAGTCACTTCAATGATATAAATAACGTTTGAACATTGGGACTGTACAACCATTCATTCTCAACTATAAATATTAATAGCCTACTATATGGCTTGTTTACCCAGAGTAATCGAAATTTAATTTGTAGACAAAATATAATGATACTAACTCGCTATATATTTAGTAGATAATGTGCTTGATTAAAATCTTACTAGAAAATGACATTTAGCTTGACTTCGGTGGATAATTGTGACCTTTAACTTTGCCGGTGCACAAGTATGCTTATCTGCCACAAAGGAAAGAGATAAGAAAGTTAATCAAACTTTCAATAGTCTCAGTTTGAAGTCAATGAAGTGATTGAGAGAACTCAGGTTCAAATTTCAGTGGAGTTATCTGATACCTGTTGCTGGTGCGTGTTTTCAATAGTCATGGCTCGATACATTAACTGTTTTTTTTCTGAGAAGGGATACATGAACTGTGTTTGTGATAAAAGAGATAAATTGATTGTTAGTTGTAAAACCAGAAGTTTCCAAGAGAAAGAACAATAATCCTAATTTATTAATTGTGTTGCTGCTTTTGATAAATGCCAGGGATAAATAAACAGTGTAATGAACTTCAGTGTTTAGTGAGATAACATAGTTAAACAATTGATGTCGAGTGAACTCTTTGAATAATTTAGTGGTCTGCCATATGAAGAATAACTTGATGTTGCACAAATCCTACATTTTGACAATTCATGTTTATCTTTCCTAGTTAGACGCTTCATTAGCTTTTGAGCTCTTCTTGTTCAGTGGCTCTTTTGCATAATTGGTTATCCAGCTTACGCTTTAAGGCACTTGGAATGGATGTGATAGAGGAGATTACCAACACTAGTAAGGAACTTCAAGATCTTAGGGTGTTTCCTTCTGATCCATGACCTAATGTATCCTTGACAGAGCAAGGCCTTGTAAGTGTCTCCATGGGCTGCCCTAAGCTTCAGTCAGTTTTATACTTCTGCCTCCAAATGATAAATGACGCCTTAGTTACTATTGCTAGGAACCGTCCTAACATGATCCAATTTCATTTATTATTGAGCCTCGAACTCCTGACTTGAACCACTTGATGCTGGTTTTGGGACATTGTGCAACACTGCAAGGAATTGCAGCAACTTTCTCTTTCTGGCATCCTTACAGATCGTGTGTTTGAGTACATCTGGGTCCATGCTAAGAAGTTAGAGATGCTTTCCTTAGCTTTTGCGGGGGATAGCGATCTATGTTAATCTTTCACCCGCGTATACTTGCTTGAGCCTTGTGTAGTTGTAGTGCTGGTTATGACCCTTTGTTGAGCGACTTTGCAGCAATATCATTTTAAAGTTC
ACTACACGGCCTAGCTTTTGTGATGAAAGTTCGCTGGGTTTGTTATAGAGTAGTATCAATATCGTTTTAAATCAGTACCTTGACTAAGCTTTGAGCATATAAATGGGACTTCAGACGAAGTTAGACATAAAGGAGGTTTGGACAGCCAAAGGCAAATCCACGGAGTAATCTATGAATTCATGTGAATCCCTCAATTTCTGTCAAAATCCTATACATATGTGAATCTAATTGTTATTGATATTAACATGAGGTCGCCACAAATACTTGTAAACATCAAATCCTGGATTCCTCTTGCATACGGATAATACAGATGTAGTAATATGCAGTCTACTAGAAAATTAATGTGTATGTGAATGGAAAGAAAAAAAATAAAGAGAGAACGACAATGGCAAACAACATAGCATAGGAATAGTAGTTTGGTATACAAGATTAATGTTTATAATATGAACTTCAGATAGTTACTTCAATCTGGACAAATTAACAAATGATACGTGTACTTATAAAAATTATATTTTTTGTTAAAAGAAACTAAGAGGAATCTCATAACAGGATATTTTAATCATATACAATATCACCCAGCAAAGTTCAACCATAATGCTACTTAAATAAGGGGATATTCTTCTGGCCAAGGATCTGAAGCTCGCTCCCTCCTCTCATATCTTCAGCGTATTCCTTAATCTTGAGAGCAGAATCTTCAAGTTGAGGACTCTTTACAATTTTGATAACTTTCAATGAATAAATATCTCCAAAACTAGGTGGAATCTCCTCAAGCTTACGACATCCCTGCAGTTTTAACTTCTCAAGATTGGGGAAGGATTCCTCTCCAACCTCCCACTTGGAAAGAGTCGCTAGACGCAAGTTCAAAAATTTGAGATTCTCAAAGGTGTCTTCCTCCCCCATGTTCCATTCTTCTCCCTGGATGATTGCATCATAAAGGGACAACTCTTCAAGGTTGGGCAGTCTCGCTATTGTTGATAGTGAATCGGATGTCAGAGGAAAGTCATGCAATGACAGTTGTTTCAAATTTGAAGGAAAGTGAAAATCCCACGGCCGATTTGTCTTTACAGAGGACCCACTGTGGTTTGTGTTTGAACTTTTAAAACCTACATTGAGTATTTCTAGTTCAGTTAGGCAATCCAATTTCGGGAACCAATGTTGCTCTGTTGAATAATCCCATGACTCCTTGAGTTCAAACTGAAGCATCTGAAGATTGGGAAACCTTTTGAAAATATTCTTTGTATCTTTCGAATAGGAAATCAACAGTTCCCCTAATATTCTCAACTTCTCTAACTTTGTGTCCTCTGCTATCAATATTGATTCATCTGCATCCATATCAAAGAAAGAACAAGCATCCGCGAACAGCACTCGCAGCTTTACAAGATCCCAAATTCTTGGTAATAGTATCAAGGTTGATTCTTTGTTTTCAACCCACAATAATTCTAGATTCCAGAGGTTTGAGAAAGACAAAGGCAGATATTTAACTTGTGTCCCAATTCTTAAGTACCTCAAATGATTCAACATGCATATTTCATTCAGCAAAGAATCGTTCACCATGATAAAAGAGGTATCCAGGACCAACACTCTAAGAAGCCTCAAGTGTCTTAGGTGAAATGTATCAAAAAGACTGTCATCCAGCTCGTCTCCAAAAATCCTCAAAGAATAGATGTGTTTACCAGAATGCCTTTTCTTATTTGAATCAAAAATGACAAAATTAAGCCCAAAGTGCTCCTCATCATCATCATAATCAATGGTAATTTGACGAGGCAACAAATCTGTTGGAGCACTTGATCTTATCTGATCAAACAAATTTTCCTTTCTTGCTTTTATCAAACAAAAGTCATGCACAAGATCATGAATTTGGAAATTCAGTGCATCACCTATCTCATTGAAACAAATTACCAAGCTACTGGAAATTAAATCATCCATATAAATCTTCACCACTTCTTCCATACTGTTCATCTCCGCCTTTCCCACAAATCCTTCAGCACCCAAATAAACAT
TAAACTCATAGATTGTCAATGAAGTGTCCTTCGGAAAACTTGCAAAATACAGCAAGCATGGCTTGAGGTGATGTGGTAAATGGTCATAACTTAATTCTATAACTTTCATCACTTCCACTTCACTGTTCAAAATAAAAGAACTCAAACTACTTTGAACTTCAAGCCACACACTCCTTTTCTTTTCCCTCCCAGCAATGACTCCAGCAATCAGATCAGCCACCAAAGGAAGCCCTTTACAATTTTCGGCAATTTCTTTACCGACATCTAATAGTTCATCAGGGCAACTCTCGTCCCCAAATGCCCTTTTCTCTAATAATTCCCAACTTTCATCAGGTCTTAGCAATCGAAGGTCAAGAGGATCAGTGTAGAGCTTTCCATGCAAAGCTACTTCCTTTTCTCGAGTTGTCAAAATAATTCTACTTCCTTTCTTAGCTTCAGGAAAAGGTCTTGTCACCTCATCCCATGTAGTAGTCTCCCACACGTCATCTAAGACAATAAGATACCTCTTTCCATACAGTTGTTTCCGTAGCTTATCAGGAACATCAATATTCTCACTCAATTTTGAATCTGAGTCACTAACTTGATTGAAAATTTTATTCAACAACTTCTTCTCATCACATCCTTGGTCGACCGTGCACCATGCACGAAGGTCGAAATGGCTAGAAACTGACTTATCATTGTATACTTTGTATGCCAAAGTAGTTTTACCTGAACCCGGCATACCAGTGATCGAAATGACATCTAGATCTGCCGGTCCACTGGTGAGCTTTCTAAGTATCAAGTTCGTCTCCTCCTCAAAACCTACAATTATTTTATTAGTTGTCAATGACTTTCTCTCAACTGGTTTCTTGGGAGAGTTCACAGCGATTAGACCTCTGTCCTTGGGAATGCTCTCATCTAAAGCAGAGATCTCTTCTTTGATAAGTTTGATCTTCTTTATGGTAATGGGAAGTGAGAAAATAAGATGTAAGAGACCATTATCTCGAACAATAATTGAATCTATGACATCTTTTGCCTCATAAGCCACATCTAGGACACGTGCCCAGATATCTTTATACAATCCTTGCTCAGCATCCACAAAGAATGATCTTATGAATTCCAGGTCTTGTTTCACCAACTCGATTTCTTCCTTTATCAAAGAAATTGAATAAGCATTAGAATCTAGCAAATCATTTAAGTGCATGTGTAAAAGATGCATGAAGAGTGGTCCATCACTCATGGGGAAGCAACATTGAGATGAATCCGGGGCTTTCAGATAAACATGTTTGAGATCTTTCTTGAGGAGTTCAATATTTTCCAGCAAGTCTAGGGTTGCACAATTTGTTTGGTTATTACCCTCTTTATTCCTTAATTTCTCTTCCAAGTCACGTACAAGAGTTGATACCTCCCTGGTAAGTACTCCGACATGAGCCAAGAGATCAAAAAGTTTGTCATGATGAATAAAGTCCTTGGGCATATCAGAAAGAATAAGTAATAGGAATTCCATCATGACATGAATGTTTCGAGCCCCTGAAGTGCTAGGGCGAATAACAGTTATCATATGCTCTTGTAGTTGAATGATATATTCTCTGAGAATATCCGGTGAGGTTTCCAGGAGCTTCTTAATGAAGCGTCCAACTTCTGCTGAAGTTGAAGCTTTCAAATTTGTATAACATATGTGCATAACCTCCAGTTCAGTTGGAACAATCTTCAAGAGTAGATGTGTTAGCTGGAAGAGTCGAGAGTCTCTATCATTCTGATCATCCTCATCCGAGTCTTCATCAGTCTTATCCTCCCAAAGGAAGTGTCCTACTCTTTCAGCCATCAGTTGAAACAGAGGTAAGACATTCTCAACCATCTCATGCTTAATGCAACCATTCACTATCAACCCATGGAAATCTCTTAGGTTGCCACATACATTCTGAAGAACTTCATATTGAGTCACTCCAGGAAATATCTTTTCAGCGTGATGCTTGGATAGATGATACAGATTCAAGAGGAGGAAGTCCAATTGCTCATCC
ATCATGATGGCATCTGATTTATAAGAACGATGATACAAGCTGATACAGTCATCCATATTACTGGTGAGGCTAGTAAGGACATCATCATCCAAAAGTGATTGAAGCAGATTCTCAACCTGTTGTCTTTTTCTCGTCATTATATCTTCAAACTGCTCAAAATCGGAATAAGAAAGCTGAACATATGTACAAATAAATGCCATTTTCAATTTTAGATTTTCAACTTCATCTTTGTCAAGAGATTTTTGATTTTCCTCATTCTCTAGGAAAACCAGAACATCGGCAATGTCCTTGCTAAGAGCAGAAAATAACACCTGCCAAAATAATACATTTTAAAGCCACATATCTATAATTCAATACTTTACAGTTTACTCTATAAAATAACATACCAATGAGTTGTTTGCTTCTTCATTATCTTTTCGTTTTTCCATGATTCTACTTTTTCTCAAGACCTGATGAATAAAAAGTAGCTAAAACTTTAACAGGAGAAAGAAGATGAAAAGATACGAATAATCAATAATATCACTATTTTCACATATAGTAATTTTAGACTCGCACAATTGGAAATGTCAATCTTAATCACACATAAAAATGTTTATGACATGAAGTCACAAACATAAAATCTCACAACTGTTAATTATTTACAAAAAAAGAAAAAGGAGTCCTGCTCGTTTACCATTACTTTTCCAACCTATACAAAGAAGAAAGTTATCGACTTAATAATTATAAATATGTGATTGTCAATCTAATTATTATTGATATTAATATGACGTCGACATAGAAACTAGTAAATATCAAATCCTAGATTCGTCTATGTGTATATGGCATATAAGGAGCCTACAAGAAAATTATTGTGCGTGTGAATGTAAAGAAAATAAAATAAAGAGAGAATGAGAATGGTAAACATCATCAAATGTATCTGTCTAACTTTTTTCTGCCAAAAAGTCTATAAGGTAAAGGTAAAGAAAACAGTAATAGGAATGATGTTTTCGTGTATAAGATTAATGTTTAAAATATCAGCTTTAGATTTGGCATCAACCTCAGATAAAGTTGTGTATGATCAAGTAGAAATCTATACTTGACATCGGTGTGTCTCATGGACATACTCATATGTGATGACGTGCCAAACGGACAAATCAACAAATGATACATGTTTTAAAAAACTTGTAAGTTTTCTAATCGAAACACCGAAAAGTCAAACAAATATGTAATCATATACAGATCTACTCATTAAAGCATAACTTACTGTCTATTCTGCTATGTTTCTTCTTTCTACTTTCCACCCATAATGCTTAAAAGCTAGTTAAATAACGGGATATTATTCCCTTATTTTGATTAAAATTAAGTAAAATGTCATTAGATTAATAATCTCTCTAATAATATTATTTTTCTCCTATCTCGACTTGGGCTAATGGAAAAAGATTTTTTCTGAGAGTAGCTGAAGTAGAATCAATAGATTAAGCATGTTCACACCTTTTTGACATATTTTTGTTGAAGTAAGAGATCGAAGAAGTAGTTTGGTTGAAAGGAGACTAATCAAATAGCTAGATCTAGAATTCAAACAAAGATTACTAAAATACAATTCATTGACTTCACAAGTCCTTTAAATACCAAAAGTGCAAGATTACTAAAATACAAATGAGTAGTTTTTGTTGAAAGGAGAACAACAAAAAGCTAGATCTTAACCATTTTCATGTTATTCTGCTGCGAATAAAGTTTAGCAAAGAAGAAGATGGTACCTTTACACAGGCTGAAGTTTAGCTACAGAACCCTTTGTTTGAGAAATAATGCTGAACCTATTGGAGAAAAAAACAAGTGTAGTAGTTGAAATATACAATACAAATCTTTTTGTAATGAAATATTAAAATACAAACCCACTGACTTCTCAAGTCTTTTTTTAATCAATGTCTTTTGTCTTTCAATTTTTATACTGACGAAGATAAAAACAAGTGGTTGTCATTTCATCAAACACATTGTAGACATTGGCAATTTCCACATTATAG
AATTTAGGGAAAAGGGTCAAATATGCCTTAAAATATTTAAAAAGGTCTAGATATACCTAAAGTTTGTTCATTGATGGGCTCGCCATTCAATTTTTGGTCCAAATATGCCCTTATGACCACGTTAGTTGTCATGTTGGACATATCCAACTCATTTTTCATTTCTTTAAATGTCACTTGGAATTGTCATGTCATTTTGGTCTTACCACATAACATTTATATGAAAATGGAAAGATATTTGGACTCATAAACACCTAATCCGACCCTTAAATAAACCTCCTTTTAAATAAATTATCCGGCTAATTTTCAACAATTTTGTTTAATTTTTATTTTTTCAATACATTCAAAAAATGAGTAATTGTTAATTAAAAAAATAGGAAAATATGAAAAAAGTATAAGATTAACGCCAAAAATTCATAAATAATTATAGTAACCTAAATTCAATTTAGACACTTTTTTTAAAAAAATCATTTTTTTCGATAAATCCCGAAATGAGTAATTGATTAATAAAAAGTATGAAAAGATATAAAATTAACGCCAAAAATTAAAAAATAAATACCGTAACCCAAAATTCAACAATTTCAACATTTTTTTAATTTTTAATTTTTTCGACAAATCCCAAAAATGAGTTTATTAACAAAAAAATATAAAAATTACACGAAAAAATCAGAAATAAAAAATAGGAAAATATGAAAAAAAATATAAAATAAAAAAAATGGTTGAAATTATTGAATTTAAGTTTACTATATTTAATTGTGAATTTTGACGTATATTTTTTATTTTGTTTTCATATTTTTCCCTTTTTATTAAAAAATTACTCATTTTCGGGATTTGCCGAAAAATATAAAAAATTTAAAAAAATTGTAGATTGAAATGTTACTATATTTATTTGTGAACTTTTGGCGTTAATTTATATTTTTTTCCATACTTTTGATAATTTTTATTAATTAATTACTCATTTTCGAGATTTATCAAAAAATAAAAAATTTAAAAAAAATTGAAATGTTAGATTTAATGTTACTATATTTATTTGTGAATTTTTGGCATTAATTTTATATTTTTCATATTTTTTCTATTTTTTATTAATCAATTACTCATTTTCGGGATTTACCGCAATAATAAAAATTAAACAAAATAGTTAAAATTGGTTCAGATAGTGAATTTAAAAGGAGTTGATTTATGGGTCGGATTAGGTGTTTATGAGTCCGAATATCTTTCCATTTTCATATAAATGTTATGTGGTAAGGTCAAAATGACATGACAATTCCATGTGGCACTTAAAGAAATGAAAAATGAGTTGGATGTGTTCAACATGACAACTAACGCCCATAAGGACATATTTGGACCAAAAGTTGGACGGCGAGGGCATGAGTGAACCAAACTTTAAAAGGAGGATATATCTAGACCTTTTCAAATTGTTTAGGAGCATATTTGACCCTTTTCCCTAGAATTTAATATAGAATATCAAAATATGAATTCTTGAAATTGAGTATAATAATTATTTTCTTTACAATGAATATATGTACTATATGTGTATATGTTCAATATAATCGAAGAAAATTTTGCAGAAAAATAAACAACAGAGTTTAAAATATGTACTCAAAAACAATAATTAATATCATAAGTATAAATTAATGAGGAAAAAAAAACATACCGCGATATGAAAAAATAGAATGAAAAAAATTGAGAAAAAACAGTGTTGTCAGTCAGCGGCAGATCTATCAAGGCCCGTGAGGGTGCCACACAACCCACGAACTTCGAAGGAAACTCTATTTATATTTATATACAACATATGTATAAATAATAATAGTGCCACTTAGAGAACAAAAGTATTCTTTGGTGTAGTGGTAGACTATCAAGTTTACAAGCCATAGTCCAAGGGATCAACCCTATTGACAGCGCTTTTTTGTTTTATATTTTTCTTTTTAACCACATGCAGTGTTTCTTTTTTAAACTACAAGGCACATTCTCTTTTGATTTTGATTTTTTTTATTAACTTCTTA
TTAAGTATTAATCAATAATTATTTTTAACTAATTTAATTTAACTTTTTGATTTTTCTTTTATATGATTAAATATAATAAGAAAATTCTATTCACCGTTGAATTCTCCTTTTAACTTTGGAACAACAAAAGTTGTCGTTAATTAAAGCTTCAGGCTTTCATCCGTCGCTCAATCCTGCTCTCCTGTCCAGCCACAAGACGAATAATTCTATCTGAATCTAATATTGATTTTATCGATGAGTCTACTAAGCATTAGAGACAATTTAAAATTTGAAGATTTTGATGCACCAATACTATTTTAATTGAGATAGTTAACAAAATTTTTACTACAATTAACGAATAATGTAGTACTTGATTGGTTACTAATGGCTCGAATATGATTTATAAGCTAAACTTAAAATAAAAAATAATGAAATACGATTGAACTGTATTCTCGCGAGTGGTTCCTCTGGCTTGTAAACCAACTAAACAAGGGCACCTCTACGCTTCTTATGGGTGCACTGTTGATTATATCCTACTTTATGTCAGTATCTCACGATAGATATACATATATACATGTAATTTTTTTGAAGTTAACGGATGCACGTGCACCCCTATCAAATCATGTGGGTTCGGCTCTGGTTGGCACCCAGTGGCTATAATTCCTAAATTCGCCTCTGCTGTCAGTAAGTCATTCAACAGTAGCAAAGTACATAAATATTTAATTTTGCAGAAATAAAAGAAAAAGATCATAATTGTTTTTTGTTTTAAAATGAGGGTGTGTTTAGTATGAAGGAAAACATTTTTCGAAAAATATTTTCCAATTTTCTCATATTTGGTTGGGTCAAATATTTTCCAAATCAAATCATTTTCCTCAAATTTATGGAAAATGACCTCCATTCCAAACTTAAGGAAAACATTTTCCAAAACTCTTTTCTAACCTCCCCCTACCCACGCCATTCTACCAGTCCCCAACCCACCCCCTTCCAGCCCTCTACCCACCCACCCATACCCCTAAAAAGTTTAAGTTTAGTTTTTTAAAAATATTTTTAACATCACAATTTCATTTTTTTTTTCACCCCTACCCTCGACCCCCTACCACCCCCATCCCCAAAAAATAATTTAAGTTTGTTTTTAAAAAAATATTTGTAACTTCAAAAATTCATTTTTTTACCCCTACCCTCGACTTACCCTCTCCCTACCAGCCCCCCCCCCCCCAAAAAAAAATAAGTTTGTTTTTAAAAAATATTTTAAACTTCAAAAAAAAAAATTCACTCCTACCCTCGACCCCGCACCCCACTCCACTAGCCCCCTACAAGCCCACCCCCACCACGAAAAAAATTTTAAGTTTGTTTTTTTTAAAAAATAAATTCAACTTCGAAAATTATTTCCTACTCTAGTAAAAAATAAAAGACATTTCTCAAAAGTATTTTTCATTAAAAAACAAGCACTAAAATATTTTTCCAGAAAATATTATCTACTCACCTACCAAATATGAGAAAATCAGTAAATTATCTACTTGTTTTCCAGGAAAATATTTTCCAAGGAATTTCCGTCATACCAAACACACCCAAGAGTATATTCCTCTATTTATAGACAACAAAGGGTAGTGTCAACAAATTTTTATTGTGCCTTATTAGAAAGGATACAACTATTTGAAAAAATTGCAACCCTTCGGAAAGTTTACAACGTTTCATAAAAGTCGCAACTCTTCATAAAAGTCGCAACTCTTCATTAAAGTCACAACTTATTATAAAAGTCACAACTTTTCATAAAAGTCACAACTTTTGATAAAAGTCGCAACTTTTCATAAAAGACAGATTTTTTCTTCAAAGAGGAAGGCTCGTTTTAGAAATAAATAAATTTAAAAGAAAATTATTGCTTGTGGCGGCGCTACATAGGTGGTCCTAGGATTCTCTTTTATATAAATATATGAATTTTTTTATTAACGTGGTGTTCGGACCAACTTTCACACTTTGATCTGCTGAAATTTGAACCTAAAACCAAATGGTTCTCATTTCTC
AGTCACTTCATGGACCATTAGGTCACACTGTTAGGTGCCCAGATATATTCATGTCCAAACATCCCTTGGCCAATTTCCATATACCATTATTCAACCTTGTATTATTAGTTTATTCTAATTTCACATTTTTAATGTTCAAACGCCCACTTATATTCTGCCTGTTTATATCAAAAAATTCCAACAGATTTGAATTCATGGCATACACTTGATATTTTCTCAAAAGTAAATACTTAATAGGGATAACGCACAAGTACCTCCTCAAACTATGACCGAAATCGCAGAGTCACACTTATACTATACTAAGGTCCTATTACCTCCTAAACTTATTTTATAAATAATTTTCTACCCATTTTCGACCTACGTAGCACTATCTTTTTGGCCCAGCGTGACATTTTTTTCTCAAACTGAAATTAAAATTTAAACTATTTTCTTTTAAAAAAAAATAATTTGAAGTTTTGATTTTTTTGGTTGGGGTGAGGTTTATCAGTTCTTGCAAAAGGCTTAGAATTATCAAAGGATCTGAAGCTAAAGGTTTAGCAAGTCTATAAAAACATGGACATATATATATATACACACATATATACAAATCTGATAGGAATGAACAAGTTTGAACAAGTTTCAGTTTTGTAAACTATCTTGATTTTCGATTAATTACACGGGATATATAGATCTAGATCTCATGTACAAATAGTTTATCTTTCTTTTTTTTGAAGAATTTTCTTGTGTATTATGTATGAGTATAAATATACGGGAAGAAATACAAAATTTTAGCACAATATGAAGTGTCTAATCAATCTTGATATTTAAGCACCCAAATTCAATATTTCGCTTTGATAGGTTCATAATCAAGAATCAAAATAATAATAGAGATTAAAATAAACTTCATTGACTTTTCAAGTCTTTTTCATCAATTTTGTAAATATGTATATTCATATTACAAGTCGACTTAGACTTGTGGAGATTGTTAATTAGCTTGTGAATGAAGATGATGTGTGTTGTGTCCATGTAGATCATGGATTTGAGAAGATCTAATATTTTTTTGGTAGTAAAACTTAACTAGTGAACTTAGCCGCGCTTCGCACGATCATAAATAACTCGCTTAATTTGTCAAAAAAAAGAATTAAAATAGTATTGATAAAAGTTTTGTGAAGGTTCTTTGTTGTGTTTAATTGAAATATATCATATTTGAAATCTTAATCAAGTTTAAATACTATTTAAGTTTTTGTATCCGTTTTAATTTTAAATCGCTTAAGCTAAAAGTTCACATTCAATGATCTCAGCCTATAATTTTATTGGATATGTGTAGCCCATGCTTTTATAATTTTATACAACTTTTTTAAAATCTATCTTTTATTTTTAGTATGTTTTTTGTTTTGTTTGTATCTTTCTCGCAAAATTGAAGAATTTAAACCCAAATAAACTTGTAAATTTTGAAAGCTCAAAACATCAAAATGTCATTATCCTCCTTGTTCATCAAATCAAAATAATTTTTAAATATTTATTGTGGTTCAAGAAAATCAATTATATTTTTATAAAATTACTCTTTTTCCTCCAAACATCGTAGTCTCTTACTATTTTCTTTTTAATGTTTATATTCTTCAAAAGTTGTTATCCTTTCGTCGATAATGATGAATCAACTCTCTTTTCATCTTTCACAAGTCATAAACTAATTTTTACTACAATGTAATATACTTATAAATTTATATATAAAAAAATATATTGAGAGACATAGAACCTCAATTACACAAAAAATGTAAAGTATTTGGAGAAATTAATTATTTGAAACAATCTCTTAAATGCATATAACAAATTTGAGAAATTCTTTTTAAACAAACTTTATCAAAATCCCATTGCAAGAAAGTTGAGTCTTTTTTATACCTTTTTTTTTTTTTTTGAAAAAAAAAGCTTATCTTGTAGCATATGCATACAAATTATATTATTTATTTTGAGATAAAAAAAATCAAATTTTATTGACTTGTCACGTGCATTTAAAGCATGAA
GCTAATCATACTTTATCAATTTCCTTTTATTTTTCAAGGGAAAAGGGTCTGATTTACCCCTCAATTTTGTCATTTGGAGCTGATATACCCCTCGTTATAAAAGTGGTTTATATATGCCCTTACCGTTATTCAAACGGCTCACATATACCCCTGCCGTTACAAAATGGCTCACATATACCCTTCATTTAACGAAAGTTAAAAAATTAGTTTTAAATTTATATTTATTACTTGTAATTTTTTTTAAAAAATTATTTAGGGGTATATATGATTCTTCTATCAAAGTTCAAGGTATATTTTAATTTTTTTTCATACATAAATTATTTTTTGACTTCGCTTATTATAATTATTTGAGTTTCTTATTCTTATTTTGTTTTTTTCTTTCATTACTTAGTTTAAAGAAAAAAATTTAAACAATTTTTTTGTGTATTGTAATTTAATTTCGTATTCGAAGAAAAAATTTGGTCTACAATAAGTTTTACAAGAATATTAGTGAAACATAAACAAATTTGATTATCAAAATTATAATTATAAATTAGTCATTGAAACAAAAAAAATAAAAAAAAATATGTTTTACGAGGATTAAATTTACTCATATTAGATTATATATTTTATAAAATAAAAATAAAAATTTAGATTAAAATTATTTTTTTCATTTCCGTTAGAGGAAAAGGGTATATGTGAGCTATTTGTTTACAAGTAGGGGTATATATGAGTCACTTTCATAACAAGGGGTATATCAGCTCTAAATAACAAAGTTGAGAGGTATATCAAACATTTTTCCCTTTTTTCAATTTGTAAATTAAATATGAATTTAGTATGTCATGATTATTTCTATTAAATTAAGATATTATCTTGACAAACAAAATGTGAGATTACTATTTTTGAATTAATATTATAACCATAAATTTTATAACATTTTGAAAGAGTAGAGAATAGTAACAAAATTTGCATATGTTAATAATGACAGTGTGTTCATCAAACTTGAACTTAAATCTCAAATATTGTCATTTGTTCATTTTATCTTTCACCGTAAACAATAAAAATAATTCACATAAAAAATGAAGAATAAAAAGAATGAAAAAATCACCAACAATAATGAAGAAAATAACACAGACAAGAAAATAGAAGGAAAAACACTATAAATAAGAGACATCAACAAAACTAAAATAAAACAAATAATCTTATCTATTTTGTTTAAATTTTGAATTTGAATTCTCACAAACAACATAGGTATATGCTCATCCTATCTTTCATACAATAAACCAAAAAAAACTAATCACATATAATATAACATTATAAAATTAGGCATAACAAAGTGATGTACTTAAGTGTAAATATAATCAAGAAAAAAATAATTTCTTACCATTGATGAGGATGATATACTTTAGTATTTATAGTAATCAGTAAATTTGTAACTTAATTAAATAATATGAATTAAAAAAATAATATAGTAATAAATAAAATTGTAACTTATATTGATATTAATTGTTTTAATTATAATATAATAATATTTTTAAGAAGGAATAAAGAAAGGTTTAGGAAAAGGTGATAAATGGTAATGGTAGTGGGCTTAGTTTTTAAGTAACTGTTGGGCTGCAAGATTAATTACTCTTATTTACTGTGATATTTTAACTCATTTAGACATTTATACATTTTTAAGGGGGAAAAAGTCAGAATTTTTTTTTTTAAAAAAAGAAAAAACATATAACTGCAAATGCTGATCATTGGAGGGTGCCACATCAATAATTTTAGATTTAGCTTTATATTATTATATAGATTTCGCTCCCTTTATTGAAAACGTAAAATGTTAAATATTTTTTTATTCTTAATAAAGATTTTTAAATTTGAACCTTAATATATTAAATCATCTTTATTAGAAAAAACTTACTTCCAATTATAAAATCTCAAACACACAAAAAATGATAATTGAATGTTAATATATTTATCAAACATCGAGCGAGAAATGAAAAAAGAAGAAGGGAAGTATAGGTGCATTACTT
AGAAAACGACCATTCACTAATGCTACAACCCCACAATGTGTAAATTGATTTGAACTATTGCTTTCAACTTCACTTTTTTAGTTTTTTTTTTCTTTACAAGAATAACAATTAAATCAAATGATTTGGTTTGAAAACAACACCAATTTTTTGAAAAGTATTCAGAAAATTATTTTTTCAACATTTAAACAAAATTTTAACTACTTTTTACTATATTCCAAAACGTCTCGTTAAAAAAGGAATATAAAATCTCAATCAGGTTAATTAATACAATAAGATTTTTGTATTTTTAGCTATAGTCATAGATGAATTTAAAATCATTTTAAAAAATTAAGTTATGAAAAATTATTCTATATATATATTAAAAAAGTTCTTACTAGAATTATTGAAAACTTTTAAGACCGTAAATCGTAATCAATCATCTAACTAGCTTTTATCCGTAATATTCGAATAATTTTCTTCGCTTTTCCAAGAGGAATATATGTTGTTTTATGTTAAAAAAACTTCTACATAAGATTATTATTATTTAGGGTTAATTATATATAGTGTGTGCATTAACAATGTCACAAACTCTCAATATTACAAAAAAAAATTAGAAATATAAATCCACGCAATTGTATAAAAAGGGGTTAATCAATATCCTAAAATAATAATAATGTAATAGCATTAACGTATGTTAATATGTTATATTACGAAATTCAAAAATATGTGAACTTTAAATAATATTGTCATCATTGTATGAAAGATTCACAATTTATATCACTTTTGTATAATTTATTTTTTTTAAAAAAAATTGATTGAATTAACCCTCTAATAGTAATAATAATAACAATAATTATACAAATTAGTATTTTAATTATGTCTATCTTAAATCATTTCAAATTATAATGTGTAATTGATTACTTTTTAAATCATTAGATTCCCTAAATTTCTAAAGCCAAAATCCATTACTTTTCGTCTCGTTATATTTATCGGACACGTGTCTATTCATATACAATGACATAATTGTCCCCACATAAAAAAAGTAACCCAAACACTTGACTCATCTTAACCATGGTTTCATTTTAACCCAACACATTTCCACCTCTTTTTGTTTTTTATAATATAAAAAATCGTTTGATAGCAGAAATATAAGTATTAAATTTTACATAAGTAATACCGTATTTAATAGTTGATTGAAAAAAAAGAGCTATTCATAAGAAAGTTTTAATCTTTTCATCTGGGGTTTAATACCTGTATTTGCTTGTAATTGAGGAAATGGTAGGTTTTGTAGAGCATTATTGCTTGAGTTCTTTAGTATTTACTGGTGAAAAAGAGTTCAAATCTTTGCACTGTTGTCTAAGTACTTTAGCCGTTGCCGGTGACTTCATTAAACTGATTTGATAGAACAGAAGGTTTTGTGGAACATTGGTGTCTGAGTACTTCAGCCCTTACTGGTTGGGATGAGTTTTAATCTATGCATCTGAGGAACTTTTCTTGCTTGTAATTGAAGCAGTGGGTTTTGTGGAGCATTATTGTGTGAGTACTTTAGTCTTTCTGGTGAGAAAAGTTCTAATCTTTGCATCTGGGGTTTGAATGTTTCTTGTTAGTAATTGAGGGTTTGAGGAAGTAGTAGGTTCTGTGAAGCATTCTCGTCTGAGTACTTTAGCCCTCCCACATTGTGTGAACAATCTCTTCTCATCGAGCATGCGTTTCCCCATCAGCTGAAGCAACACTGTTAATCTTTATCTCTGGTTGGTCGCTGATATTAAAGTTGGGGTTGTTATAACCAAAAAATCAGGGTACATTTGAAAATAAAATATAATTCAACATTCGAAAGCGGGTTATAAGTTGTTTTCCAAATTTGATTTACAACTTCGAACTTTTCGTACACAAACACTGGTTTTCGAATAAAGTGGACATTATATCAGAAAAAAAGTAAATAATATTTATGGGTCCTTAATTAAGTCTTTCAGTTCATTCCTCTGTTTTGCTTGATTGATGGTATTTCACAGTAGTTGGTG
GCCATAGAGAAGAAATGCCTTAGTACTTTGAATCGCTTACTGGGTAAAGAAGCAAAAGCATATAGTGTATGACTTGGCTACAACAAACGAAAGGGATGTAAGAGGGCACAATTTCGTCCACCTTTAGAAACTAAGCATAAACTGAATCTAATTAAATTTTTGTTTTGATATGTGCACTTTACTAGCAATGTTGCACAGAAAGTGTGAACTACTGGTTCGGTGTTATAAGTAGTTCAATGATTTGAATTATTGAAAGGGTTGAATATCTTGTAACATGGTTATCAAATTAATGTTGCATTTTTATCTCTTTCCATTTGATTTATCACAACTCCTCTTATATTTGGACCTTCTTTTGCTGCTATTCTTGTTTAGCGCTGGGAATAAAAACTATAGAAGCAATGTAACTCGTTTTTTGCTGCAGGAACCTGAGAGAACTGGAACTGGGAGAAAGTGAAGCAGAAGACCTGAGTGGCCATTGGCTTAGTCATTTTTCTGATAGTTGTACATCGCTTGTGTCACTTAACATTGCTTGTTTGGCTTCTGAGGTCAGCTTCTCAGCTTTGGAGCGTCTAGTTGCTCGCTCTTCTCATTTTAGGACTCTTCGGCTCAATCGTGCTGTTCCCATTGAGAAACTTCCAAAGCTACTTCGTCATGCTTCGAAGTTGGTTGAATTTGGTACATGATCCTACTCTGCTGACATGCAGGCTGATGTTTCTGAAGTTTTCGTAAATGTATCTCAAGCATTTTCAGGCTGTAATCAACTTAAAGGCTTGAGTGGGTTTTGGGATGCTGTGCCAGCCTACTTTCCAACTATTTATCCAGTCTACTCCAAACTCACCTCTTTGAATTTAAGCTATGCTACCATTCAAATAGCTGATCTTTGCAAGCTCATTGGCAATTGTTTCAATTTGCAGCGGTTGTGGGTAGGTTCTAGCTTGTGTTTTACTTTTGTATACTTATCGAGTGTTTTCAATAGTCATGGCTCAATACATTAACTGTGTTTGTGATAAAATAGATAAATTGATTGATAGTTGTAAACACACAAATTTCCAAGAGAAGAACAATAATCCTAACTTAGTAATTGTCTTGCTAATTTTGATAATGCCAGGGATAAATAAACAACGTAATGAACTTCAGTGTTTACTTAGATAACATAGCTAAACAATTAATTTCGAGTGAACTCTTTGAATAATTTGCTGGTCTGTCATACAAAGAATAAGTTAATGTTGAATCCTAGTGTTGCACGAATCCTACACTTTGACAATTCATGTATATCTTTCCGGGTTAGACGCTTCCATTAGTTTTTAGGCTTTTCTTGTCCAGTGGATCTGCTGCATAATTAGTTATCCAGCTTACGCTTTAAGGCACTTGGAATGGATGTGATTGCAGGTTCTAGACTACATTGAAGATAGCGGTCTTGAGGAGATTGCCAACACTTGTAAGGAACTTCAAGAGCTTAGGGTGTTTCCTTTTGATCCATTTGCTCCAGGACCTAATGTATCCTTGACAGAGCAAGGCCTTGTAGCTGTCTCAATGGGCTGCCCTAAGCTTTAGTCAGTTTTATACTTCTGCCGCCAAATGACAAATGACGCCTTAGTTACTATTGCAAGGAACCGTCCTAACATGATCCGATTTCGTTTGTGTATTATCGAGCCTCAAACTCCTGACTACTTAATCCTTGAACCACTTGATGCTGGTTTTGGGGTCATTGTGTAACACTGCAAAAAATTGCAGCGACTTTCTCTTTCTGGCCTCCTTACAGATCGTGTGTTTGAGTAAATCGGGGTCCATGCTAAGAAGTTAGATATGCTTTCCTTAGCTTTTGCAGGAGATAGTGATCTAGGCCTCCTATATGTTCTCTCTGGTTGTGAGAGCCTCCGTAAGTTGGAGATTAGAGACTGCCCTTTTGGCGATGAGGCTCTGTTGGCTAATGCTGCAAAGCTGGAGAGTGGAGACCATGCGATCCCTTTGGATGTCTAATTGTTCAGTAAGTTTTAAAG
CATGTAAGCTGCTAGCCCAGAAGTTGCCAGGCTTAATGTTGAAGTTATAAACGAGAGGGGTCATCCGGATACGAGACCAGAAAGTTGCTCTATTGAGAAACTTTATATACACAAGACAGTGTCAGGAAGGAGGTTCGACACTCCTGGTTTTGTTTGGACTAGGCTCCGGGCACGTGTATTCCAAATAAAAATCAATAAAAAAAATAAATGAAAACGTATATAATAAACTATTAGGAGAATTATGATGTTTTTTTCGAGTGTTCTCTCGATATTTTCGATCTACTGCACATTAGATAAGTCTCCAAAGCTTACCCATTTATAAGCAATTAAATGTACAGACAGTCATCAACAAGTAAAAATTCTAAGAAAGACACATCAAGTTAAAGAATTAAAAAGGGAAAATGCGACGTTATTTAAAGTCATCTTGTATCCTTAATGTGTGTCGTTACAAATGTAACTACTTCCTTAAAAACTTTCAGATTTACTCAGACTTACATTTACAGGCTTACAACTACTATCCATCACTGTTAGAGAAGACTTGGAGTCGCTACATTTATTGAAGAAAATGTGATATATTTTGCTAGCAAACAGCTGCAATTTCAATTTATTATTAATAGTTTAAAAGTTTAAACATGGTTTCTTTTCTGTGGGAAGCTTGCATAGAGAGTTTTAAAGAGAGTTGATCATCATTCAGTATCAAACCATATTGTACAACAACATTCAATTTTTGATATGTGTGGTTATACCTTTCAAGCTATTTATTTTACCTATTAAAAAAATTAGAAAGTTAGCAAATCAAACGGAAAAATCTAGACTTAATAAGATTGTACCTGAAAATTAGAAGACATTTTTGTACCCACTTAACAATGGAAGCTTGTGTTGAATGACTAATATTGAGTATGTTTATGTAGTGTAGTCTTGGAGATTTGTTGATAAAAACTCTTTGATATTCCTCAATTACTTAATTTGATCCTTTTCAACTTCTCATAATTAGCAAAATACGTTTCAACTTCTATATTAATTGAAACTTTATTCGTGTTCATCCTATTTGGTTGTTTCACACATAGTAATTGAATAGACTGTTGAACTTCTTATTTTGTTCCTTTATTATGTAATTCAATATTACTATTTAATTAGATATTTAATTTATATTTGGGAAAAGTATTTTATTACTTTTTAATTTAGTATAGGGGCAAAGTAATAATTCAACTTTACACTTTAGAGCTTCATGCTTATAATAATATATGATTATTGATGAAGATGCAACATCGACTCCATATAGCAATGGGGATTGCTCTTTGGCTTCTTCTTAGGAAGACTTCAGGTATTAGTTCTATGCTGATCTTTCACCTGCATTTACTTGCTTGAGCCTTGTGTAGTTGCAGTGCTGGTTATGGTGGCAGTGAAGCGCATGTGCCATTGATTTGACCCTTTGTTGAGTGACTTTGCAACAATTAATTACAAATAATGAGTTTAAACTCTTGTTGTTGTGCTATATCACTAAGGATAACTATTGTATTTTCAACTCTTATTGTTTTTTCTGTTGAAATGATGCTGTCAATGTACTTGTTGTCCTGTATTGTTGTAATTCTCCTTGAAGATAAATGGGAACCTTTCATTCATTTGAGTGCTGAAATCCGATTTAATTTGTTGAACGTTTAGAAGAAGGTATTTTATTGTTCTAGTACGAGTCAGCCTGATAAACAAACACTTACATAGGTATGATGACTGTTCATTTTCTCAATTTTATACCTACTCGTGCAAATCCAAAGTTAAAAGGTCATGTTTATGTATTATGCCAAATCTATACTCACATGTGTGCTTGCGATAAAAGAAATAGACAAATCAACAAATGATACGTGCATTTATAAAAATTATAATTTTTGTTGAAGAAACTTTGAGAAATCCACAAAAATATTTCATAACTGCAACAAAGTTTTCTTAATCATATACAATGTACCCTGCAAAGTACAATCTACTTTTCAACCATAATGCTACTT
AAATAAGGGGATATTCTTCTGGCCAAGGATCTGAAGCTCGCTCCCTCCTCTCATTTCTTCAGCGTATTCCTTAATCTTGAGAGCAGAATCTTCAAGTTGAGGACTCTTTACAATTTTGATAAATTTCAATGAATAAATATCTCCAAAACTAGGTGGAATCTCCTCAAACTTACCACATTCCTGCAGTTTTAATTTCTCAAGATTGGGGAAGGATTCCTCTCCAACCTCCCACTTGGAAAGAGTCGGTAGACGCAAGTTCAAAAATTTGAGATTCTCAAAGGTGTCTTCCTCCCCCATGTTCCATTCTTCTCCATGGATGATTGCATCACAAAGGGACAACCCTTCAAGGTTGGGCAGTCTAGCTATTGTTGACAGTGAATCGGATGTCAGAGGAAAGTCACGCCATGACAGTTCTTTCAAATTTGAAGGGAAGTGGAAATCCCACGGCCGATTTGTCGCTACAGAGGACCCAATGTGGTTTGTGTTTGAACTTTTAAAACCTACACTGAGTATTTCTAGTTCAGTTAGGCAATCCAATTTCGGGAACCAATATTGCTCTGTTGAATAATCCCATGACTCCTTGAGAACAAATTCAAGCACTTTAAGATTGGGAAACCTTTTGAAAATATTCTTTGTATCTTTCGAATAGGAAATCAACAGTTCCCTTAGTATTCTCAAGTTCTCTAACTTTGTGTCCTCTGCTATCAATATTGATTCATCTGCATCCATATCAAAGAAAGAACAAGCATCCGCGGACAGCACTCGTAGCTTTACAAGATCCAAAATTCTTGGTAACAGTATCAAGGTTGATCCTTTGTTAGACACAAACAGACTTTCTAGATTCCAGAGGTTTGAGAAAGACAAAGGCAGATATTTAACTTGTGTCCGAATTCTTAAGTACCTCAAATGATTCAACATGCATATTTCATTCAGCAAAGAATCATTCACCATGATTAAAGAGGATTCCAGGTCCAACACTCTAAGAAGCCTCAAGTGTCTTAGGTGAAATGTATCAAAAAGACTGTCATCATAATCAATGGTAATTTTACGTGGCAATAAATCTGATGGAGCACTTGATCTTATCCGATCAAACAACTTTTCCTTTCTTGCTTTTATCAAACAAAAGTCATGCACAAGATCATGAACTTGGCAACTCGGTTCATCACCTATCTCATTCAAAAGAATTACCAAGCTACTGGAAATTAAATCATCCATACAAATCTTCAGCACTTCTTCCATACTCTTCATCTCCGTCTTCCCCACAAATCCTTCAGCACCCAAAAAAAACATTCAACAAATAGATTGTCAATGGAGTGTCCTTCGGCAAACTTACAAAGTGAAGCAAGCATGGCTTGAGGTGATGTGGTAAATGGTCATAACTTAATTCTATAACTTTCATCACTTCCACTTCACTGTTCAAAATAAAAGAACTCAAACTATTTTGAACTTCAAGCCACACACTCTTTTTCTTTTCCCTCCCAGCAATGACTCCAGCAATCAGATCAGCCACCAAAGGAAGCCCTTTACAATTTTTGGCTATTTCTTTACCGACATCTAATAGTTCATCAGGGCAACTCTCGTTCCCAAATGCCCTTTTCTCTAATAGTTCCCAACTTTCATCTGGTCTTAGCAATCGAAGGTCAAGAGGATCAGTGTTCAGCTTTCCATGCAAAGGCACTTCCTTTTCTCGAGTTGTCAAAATAATCCTACTTCCTTTCTTAGCTTCAAGAAAAGGTCTTGTTAACTCATCCCATGTAGTAGTATCCCACACGTCATCTAAGACAATAAGATACCTCTTTCCATACAGTTTTTTCCGTAGCTTATCAGGAACATCAATATTCTCACTCAATTTTGAATCTGAGTCACTAACTTGATTGACAATTTTATTCAACAACTTCTTCTCATCATATCCTTGGTCGACCGTGCACCATGCACGAAGGTTGAAATGGCTAGAAACTGACTTATCACTGTATACTTTGTATGCCAAAGTAGTTTTACCT
GAACCCGGCATACCAGTGATCGAAATGACATCTAGATCTGCCGGTCCACTGGTGAGCTTTCTAAGTATCAAGTTTGTCTCCTCCTCAAAACCTACAATTATTTTATCAGTTGTCAATGACTTTCTCTCAACTGGTTTCTTGGGAGAGTTCACAACGATTAGACCTCTGTCCTTGGGAATGTTCTCATCTAAAGCAGAGATCTCTTCTTTGATAAGTTTGATCTTCTTTATGGTAATGGGAAGTGAGAAAATAAGATGTAAGAGACCATTATCTCGAACAATAATTGAATCTATGACATCTTTTGCCTCATAAGCCACATCTAGAACACGTGCCCAGATATCTTTATACAATCCTTGCTCAGCATCCACAAAGAATGATCTTATGAATTCCAGGTCTTGTCTCACCAACTCGATTTCTTCCTTTATCAAAGAAATTGAATAAGCATTAGATTCTAGCAAATCATTTAAGTGCATGTGTAGAAGATGCATGAAGAGTGGTCCATCACTCATGGGGGAGCAACATTGAGATGAATCCGGGGCTTTCAGATAAACATGTTTGAGATCTTTCTTGAGGAGTTCAATATTTTCCAGCAAGTCTAGGGTTACACAATTTGTTTGGTTATTACCCTCTTTATTCCTTAATTTCTCTTCCAAGTCACATACAAGAGTTGATACCTCCCTGGTAAGTACTTCAACATGAGCCAAGAGATCAAAAAGTTTGTCATGATGAATAAAGTCCTTGGGCATATTCAGAAAGAATAAGTAATAGGAATTCCATCATGACATGAATGTTTAGAGCCCCTGAAGTGCTAGGGGGAATAACAGTTATCATATGCTCTTGTAGTTGAATGATATATTCTCTGAGAATATCCGGTGAGGGTTCTAGGAGCTTCTTAATGAAGCGTCCAACTTCTGCTGAAGTTGAAGCTTTCAAATTTGTATAACATATGTGCATAACCTCCAGTTCAGTTGGAACAATCTTCAAGAGTAGCTTGAAGAGTCGAGAGTCTCTATCATTCTGATCATCCTCATCTAGCTCGGAGAGCCGAGAGTCTTCATCAGTCTGATCCTCCCAAAGGAAGTGTCCTACTCTTTCAGCCATCAGTTGAAACAGAGGTAAGACATTCTCAACCGTCTCATGCTTAATGCAACCATTCACTATCAACCCATGGAAGTCTCTTATGTTGCCACATACATTCTGAAGAACTTCATATTGAGTCACTTCAGGAAATATCTTTTCAGCGTGATGCTTGGATAGATGAAACAGATTCAAGAGGAGGAAGTCCAATTGCTCATCCATCATGGTGGCATCTGATTTATAAGAACGATGATACAAGCTGATACAATCATCCATATTACTGGTGAGGCTAGTAAGGACATCATCATCCAAAAGTGGTT\n>URS00015E57C9 rRNA from 1 species \nCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGACGAGAGTCTGAACCAGCCAAGCCGCGTGAAGGAAGACTGCCCTATGGGTTGTAAACTTCTTTTATATGGGAATAAAACGGTCTACGTGTGTGAATTTGAAAGTACTGTACGAATAAGGATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATCCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGTAGGCGGAATGTTAAGTGAGGTGTGAAAGGTGCGGGCTTAACCGGGGAATTGCATTTGAAACTGGCGATCTTGAGTGCAGGAGAGGTAGGCGGAATGTGTGGTGTAGCGGTGAAATGCTTAGATATCACGCAGAACACCGATTGCGAAGGCAGCTCACT\n>URS0000C6D546 snRNA from 2 species 
\nAGCCATGTGGTGAGCACAAAGCGAACTATTCTTTCGCCTTTTACTAAAGAATACCGTGTGCTCTCCACGCTAAGTGGCATACGCCTATTTTTGTAGGGTCTTGCTTTTAAGCGAGC\n>URS0000C3F3E8 tRNA from 1 species \nGACGTCGTGCCGGAGTGGTTAACGGGTGCGCCTGCTACTTTTAGCATGTCAGTGTATAGGCTCTGCCTGCGTGAGTTCGAATCTCATCGACGTCG\n>URS0000B1CE7F rRNA from 1 species \nTGGGGAATCTTGGACAATGGGGGCAACCCTGATCCAGCGATGCCGCGTGAGTGATGAAGGCCTTCGGGTTGTAAAACTCTTTCACCTGCGAAGATAATGACGGTAGCAGGATAAGAAGCACCGGCAAACTCTGTGCCAGCAGCCGCGGTAAGACAGAGGGTGCTAGCGTTGTTCGGAATGACTGGGCGTAAAGGGCGCGTAGGCGGCCAATCAAGTCAGATGTGAAAGCCCCGGGCTTAACCTGGGATGTGCATTTGATACTGGTTGGCTGGAGTACGAGAGAGGAAAGTGGAATTCCTAGTGTAGAGGTGAAATTCGTAGATATTAGGAGGAACACCAGAGGCGAAGGCGGCTTTCTGGCTCGTAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAA\n>URS000118AF15 rRNA from 1 species \nTACGGGGGGGGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGGGCTCGTAGGTGGCCAACTAAGTCAGACGTGAAATCCCCAGGCTCAACTTGGGAACTGCGTCTGATACTGGCAGGCTTGAATCCGGGAGAGGGATGTGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCGGTGGCGAAGGCGGCATCCTGGACCGGTATTGACGCTGATGCGCGAAAGCCAGGGGAGCAAACGGG\n>URS00008D4438 rRNA from 1 species \nTACGGAGGGTGCAAGCGTTATCCGGATTTACTGGGTTTAAAGGGTGCGTAGGTGGATTGGTAAGTCAGTGGTGAAATCCCCAAGCTTAACTTGGGAACTGCCATTGATACTATTTGTCTTGAATACCGTGGAGGTGAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCAATTGCGAAGGCAGCTTGCTACGCGGATATTGACACTGATGCACGAAAGCGTGGGGATCAAACAGG\n>URS0000E895E3 lncRNA from 1 species 
\nCTTATCTGGTGAGGGAGGTTTTCCTTTGTTTCTGGAGCTTGGTTAAAGTAAGCCAAGCTTTATTTTTCTAACTTGAACTCTGACTAAGTAAATAATATTCTGATTGTCCTTAAAGATGCAGAGCATCTTACTCCGTGTGTGTGTGTGTGTGTTACAGCAGGGGTTCCTAACCTTTTTATGCTGCAGACTGGCAAACTGCAGACCAGAGATGACAGTGGACTGGAAGTGACCACAGACTGACAAACTGCGGACCAGAGGTGACTGTGGACCAGCAAACTGCAGACCAGCAGTGACCAGCATACTGGTACCAGACCGCAGTCTGAGGGTTGGGAACCCCTGTGTTACAGTAAAGCAAAAGCACAAAGTAGGAGGCATACTCTTAATTGGAACCCAGGTCAAGGAGATGGGTACCACAATGGCAGATGTGTGGATGGGACCAACCATGATGAATATCTTGCACAAAATTCAGCCTTGGATGAAGATAAAATTTGCCTGCCCTGGATCAACCTGGTAATCAAGTCAGTCCTGGGATTTATACCAAATTCTGGTGTTAATGCACCATGGACTCTTCAGTGCATGTTGCTTGGAGCCTTTGGTTCCTGCTGTTCACAGAATGCTGCAGATGGCTGCCTCAGCAGGAAGCCCTTCCCCCTTCCTTAATGGAGCTCGTGGGAATGCAGGGATCCTGGAACTGAAGCCCTCCTTCCCTTCCAAACCTCCTCTCCAAACCCCTACTGAGTAAAAGGAAAAAAATCCCCACATCCCTGGAAACATTTTTGCCAGCCTGTTTTTCAGTAAAATCTTAAATTAACCACTT\n>URS0000DD7A4F rRNA from 1 species \nAGGGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTTTTCGGATCGTAAAACTCTGTTGTCGGGGAAGAACAAGTATGATAGTAACTGATCGTACCTTGACGGTACCCGACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCTCGCAGGCGGTTCTTTAAGTCTGATGTGAAATCTTGCGGCTCAACCGTAAACGTGCATTGGAAACTGGAGGACTTGAGTGCAGAAGAGGAGAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAAC\n>URS0001657D77 rRNA from 1 species \nCAGCCGCCGCGGGAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGCAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCCCGGCTCAACCGGGGAAGGTCATTGGAAACTGGGAAACCTGAGTGCAGAAGAGGAGAGCGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGAGACCCCTGTAGTCCCTGTCTCTTATAC\n>URS0000010E3A rRNA from 1 species 
\nTCAGTCGACTCCTACGGGGAGGCAGCATGGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTGTAAAGCACTTTCAGTAGGGAGGAAGGTAGTGTAGTTAACACCTGCATATTTGACGTTACCTACAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGCATGCAGGCGGCCTGTTAAGTCAGATGTGAAAGCCCGGGGCTTAACCTCGGAATTGCATTTGAAACTGGCAGGCTAGAGTCTTGTAGAGGGGGGTAGGAATTTCAGGTGTAGCGGTGAAATGCGTAGAGATCTGAAGGAATACCAGTGGCGAAGGCGGCCCCCTGGACAAAGACTGACGCTCAGATGCGAAAGCGTGGGGAAGCAAACAGGATTAGATACCCTGGTAG\n>URS00007A8810 rRNA from 1 species \nCCTACGGGAGGCAGCAGTAAGGAATATTGGACAATGCTCGCAAGAGTGATCCAGCCATGCCGCGTGCAGGAAGACGGCCCTATGGGTTGTAAACTGCTTTTGAACTAGAGAAAACCCTTCTACGTGTAGAAGGCTGATAGTATAGTTAGAATAAGCATCGGCTAACTTCGTGCCAGCAGCCGCGGTAAGACGAAGGATGCAAGCGTTATCCGGATTCATTGGGTTTAAAGGGAGCGTAGGTGGACTGATAAGTCAGTGGTGAAATCTCCGTCGTACCGTAACGAAGTAAGTCGACT\n>URS0001848EE8 rRNA from 1 species \nTACGTAGGGGGCTAGCGTTGTCCGGAATCATTGGGCGTAAAGTGCGTGTAGGCGGTCCGGTAAGTCCGCTGTGAAAGTCGGGGGCTCAACCCTCGAAAAGCCGGTGGATACTGTCGGGCTAGAGTGCGGAAGAGGCGAGTGGAATTCCCGGTGTAGTGGTGAAATGCGTAGAGTATCGGGAGGAACACCAGTCGGCGAAGGCGACTACCTGGCC\n>URS0001910395 rRNA from 1 species \nCCCTTAGATGTCCTGGGCTGCACGCGCGCTACACTGATGCGCTCAACGAGTTTACGATCTTGCCTGAAATGGCTGGGTAATCTTTTTAAAATGCATCGCGATGGGGATAGATCATTGCAATTATTGATCTTCAACGAGGAATTCCTAGTAAGCGCGAGTCATCAGCTCGTGCTGATTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTCCTACCGATTGAGTGATCCGGTGAATAATTCGGACTGACGCAGTGCTCAGCTTCTGGACGTTGCGTCGGAAAGTTTCATGAACCTTATCACTTAGAGGAAGGAGAAGTCGTAACA\n>URS00006E6EF3 rRNA from 1 species 
\nTGGGGAATATTGGGCAATGGGGGAAACCTTGACCCAGCAACGCCGCGTGAAGGAAGAAGGTCTTCGGATCGTAAACTTCTATCCTCGGTGAAGAGGAGAAGACGGTAGCCGAGAAGGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTGTCCGGAATGATTGGGCGTAAAGGGCGTGTAGGCGGCTAAGTAAGTCTGGAGTGAAAGTCCTGCTTTTAAGGTGGGAATTGCTTTGGATACTGCATAGCTAGAGTGCAGGAGAGGTAAGTGGAATTCCCAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTGCTGGACGATGACTGACGTTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGACTACTAGGTGTCGGGTAGCAGAGCTATTCGGTGCCGCAGCCAACGCAATAAGTAGTCCACCTGGGGAGTACGTTCGCAAGAATGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCTGCTCTTGACATCTCCCTGACCGGACTGTAATGAGTCCTTTCCCTTCGGGGACAGGGATGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATCTTTAGTAGCCAGCGGTTTGGCCGGGCACTCTAGAGAGACTGCCAGGGATAACCTGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGAGCAGGGCTACACACGTGCTACAATGGCGTAAACAAAGGGAAGCGAGCCTGCGAGGGTAAGCAAATCTCAAAAATAACGTCTCAGTTCGGATTGTAGTCTGCAACTCGACTACATGAAGCTGGAATCGCTAGTAATCGCGAATCAGAATGTCGCGGTGAATACGTTCCC\n>URS00022CA99A rRNA from 1 species \nTGGGGGATTTTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGAGGGATGAAGGCCTTCGGGTTGTAAACCTCTTTCGCTGGGTTGAAAGGCCATGCTTTGGGTGTGGTTGATTTGAACTGGTAAAGAAGTACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTACTAGCGTTGTCCGGATTTATTGGGCGTAAAGGGCTTGTAGGTGGTTTGTCGCGTCTGTCGTGAAATCCTGTGGCTTAACCATGGGCTTGCGGTGGGTACGGGCAGGCTTGAGTGCGGTAGGGGAGACTGGAATTTCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGTTACTGACACTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS0000A0C1A7 rRNA from 1 species \nGTGAATGCTGGCGGCGTGGATGAGGCATGCAAGTCGAATGGGTTTAGACCCATGGCAGACGAGGTAGGAACACGTAGGTACGTACCGGAGAGTCAGGGATAACCTGGAGAAATCCGGAATAATACTTGATGGTCCCGAGAGGGTAAAGATTTATCGCTCTCTGAACGGCCTGCGTTCTATCAGCTTGTTGGTAAGGTAACGGCTTACCAAGGCTACGACGGATAGGGGAGGTGAGAGCCTGACCCCCACCGATGGAACTGCGACACGGTCCATACTCCTACGGGAGGCTGCAGTCGAGAATCTTCCGCAATGGACGAAAGTCTGACGGAGCGACGCCGCGTGGTAGATGAAGTCCTTAGGGACGTAAATACCTTTTATGAGGGAAGAAGTTTATTGACGGTACCTCATGAATAAGGGGCTCCCAATTCTGT\n>URS000254C320 misc_RNA from 1 species 
\nGAAGTGCGATAAGCAGTGCGAATTGCAGAACCGTGAGTCATCAGATTTTTGAACGCAACTGGCGCCGATTGGTCCTCCAGTCGGCATGCTTGTTTCAATATCTTGTTCTCTCATCACCCAAATCTTAATGCTAGAGATACCCTTCTCTGGTTAAGTATGAAAGCACTCTGTACTCTGCAGGCAATCCTTCGGGAGTTGCACTCAATGCAGCAGTCACATTGATTACAGTGTGAACTCATTGAGAGTTGAGAACAGTTCAGCTATGCTGTTAGTGCTTAGATAACTAAACTTACTTGCATTTGAAATCAAGCAGGATCACCCGCTGAACTTAA\n>URS000255DEA3 misc_RNA from 1 species \nTCGCGGCTTATCACCGGCAGTCCCCTTAGAGTGCCCAACCTAATGATGGCAACTAAGGGCGAGGGTTGCGCTCGTTGCGGGACTTAACCCAACATCTCACGACACGAGCTGACGACAGCCATGCAGCACCTGTGTTCCAGCCAGCCGAACTGAAGGGGTCCATCTCTGGTCCCCATACTGGACATGTCAAAGGTTGGTAAGGTTCTGCGCGTTGCTTCGAATTAAACCACATGCTCCACCGCTTGTGCGGGCCCCCGTCAATTCCTTTGAGTTTCAGCCTTGCGACCGTACTCCCCAGGCGGGGTGCTTAACGCGTTAGCTAAGGCACCGCAGGGGTCGATACCCGCTACACCAAGCACTCATCGTTTACGGCGTGGACTAC\n>URS000043B807 rRNA from 1 species \nTCGAGACCGAAACACAACGAGCGATTTTGTGAACCTGTAAAAATAAGCGGTGGCTCTTGCTGCTGCGATAAAATCCACCCGAGTCATCGCCTCATCCCCTCTTTGGGGTGGGGACGTGATGAAGGATGGATGAACCCTCAAATCGGCGCAGCGTTGCGCCAAGGGAATCTTGAAGCACAAGCCCATAAATGGGTTTCGTGGGATGGGGTGCTGTCGCACGCCATATTGATTGACACGACTCTCGGCAATGGATATCTCGGCTCTCGCATCGATGAAGAGCGCAGCGAAATGCGATATGTGGTGCGAATTGCAGAATCCCGCGAACCATCGAGTCTTTGAACGCAAGTTGCGCCTGAGGCCAACCGGCTGAGGGCACGTCCGCCTGGGCGTCAAGCATTTTATCACTCCGTGCCTACTCTCCCATTCATGGATGTGTTGCTAAGGCTCGGATGTGCACGGTGGCTCGTCGTGCCCCTTGGTGCGGCGGGCTGAAGGGCGGGTCATCTTCTCGTTGGCTGCCAACAATAAGGGTGGATTAAATAAGGCCTATGCTATTGTGTCAAGCGCGCCCGAGAGATGGTCATACTTTTTAGGTGATCCCAATTCATGCGTTGATCCATGGATGGCGTATCGAAT\n>URS0001EC40D3 rRNA from 1 species \nATTGAACGCTGGCGGCATGCTTTACACATGCAAGTCGAACGGCAACAGGCCGCAAGGTTCCGCCGAGTGGCGAACGGTTGCGTAATGCATCGGAACGCGCCCAGTCGTGGTGGTTAACTACGCGAAAGATTAGCTAATACCGCATACGACCTCTGGATGAATACGGGTGACAGTAAGGCCTCGCTCGACTTGACCCGCCGATGTCAGATTAGGTAGTTGGTGGGGTAAAGGCTCACCAAGACAACGATCCGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGAACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGCAAGCCTGATCCAGCAATGCCGCGTGCAGGAAGAAGGCCTTCGGGTTGTAAAGTGCTTTTGTAGGGAAAGAAACGGATCTGATTAATACCCGGGGCTAATGACGGTACCGAAAGAATAAGCACCGGCTAACTACGTG\n>URS000126A115 rRNA from 1 species 
\nTACAGGGGGTGCAAACGTTGCTCGGAATCATTGGGCGTAAAGCGCACGTAGGCGGTCTGTTATGTCGGATGTGAAAGCCCTCGGCTCAACTGAGGAAGTGCATCCGAAACTGGCAGGCTAGAGTACTAAAGAGGGTCGCGGAATTCCCGGTGTAGAGGTGAAATTCGTAGATATTGGGAGGAACACCAGTGGCGAAGGCGGCTACCTGGACCGGTGCTGACGCTGATGCGCGAAAGCGTGGGGAGCAAACAGG\n>URS00016D22DE rRNA from 1 species \nTACGGAGGGTGCAAGCGTTATCCGGATTCACTGAGTTTAAAGGGTGCGTAGGTGGCTTTGTAAGTCAGTGGTGAAATCTTAGAGCTTAACTCTAAAACTGCCATTGATACTGCTTAGCTTGAATCAAGTAGAGGTGGATGGAATAATACATGTAGCGGTGAAATGCTTAGATATGTATTAGAACACCGATTGCGAAGGCAGTTCACTATGCTTGTATTGACACTGAGGCACGAAAGCGTGGGGATCAAACAGG\n>URS0000FAD9B3 rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGAAGCGACTCAAAGTTTTCGGACAGAGAGTTGACTGAGTGGCGGACGGGTGAGTAACGCGTGGATAACCTGCCTCATACAGGGGGATAACAGTTAGAAATGACTGCTAATACCGCATAAGCGCACAGTACCGCATGGTACAGTGTGAAAAACTCCGGTGGTATGAGATGGATCCGCGTCTGATTAGCTAGTTGGCGGGGTAACGGCCCACCAAGGCGACGATCAGTAGCCGACCTGAGAGGGTGACCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGAAGAAAATAACGGTACCTGACTAAGAAGCACCGGCTAAATACGTGCCAGCCGCCGCTCGTAAAAC\n>URS000049D5CE rRNA from 1 species 
\nACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGGGATGCGTATCGGAAAGCTTCGGCCGGAAGATACGTTATCTAGTGGCGGACGGGTGAGTAACACGTGGGTAACCTGCCTTATGGAGGGGGATAACAGAGAGAAATCACTGCTAATACCGCATAAGCACGCAGTACCGCATGGTAGAGTGTGAAAAGATTTATCGCCATAAGATGGACCCGCGTCTGATTAGCCAGTTGGCAGGGTAAAAGCCTACCAAAGCGACGATCAGTAGCCGATCTGAGAGGATGACCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAAGCTCCATCAGCAGGGAAGATAATGACAGTACCTGACTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGACGGAGTGGCAAGTCTGAGGTGAAAACCCTGGGCTCAACCCTGGGACTGCTTTGGAAACTGTTAATCTAGAGTGTTGGAGAGGTAAGTGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAAGAACACCGGAGGCGAAGGCGGCTTACTGGACAATAACTGACGTTGAGGCTCGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGAATACTAGGTGTCGGGGAGCAAAGCTTCTCGGTGCCGTCGCAAACGCAATAAGTATTCCACCTGGGGAGTACGTTCGCAAGAATGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAG\n>URS000101C2DC rRNA from 1 species \nTACGAAGGGGGCTAGCGTTGTTCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGTGTGTCAAGTCAGGCGTGAAAGCCCCGGGCTCAACCTGGGAACCGCGCTTGAGACTGGCACGCTCGAGTTCGGGAGAGGATGGTGGAATTCTCAGTGTAGAGGTGAAATTCGTAGATATTGGGAAGAACACCGATGGCGAAGGCAGCCATCTGGACCGACACTGACGCTGAGGCGCGAAAAGCGTGGGGAGCAAACAGG\n>URS000172D02F rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGAGTGGCGAACGGGTGAGTAATACGTGGGTAACCTGCCCTCTTTCTGGGATACGCCTTTGCAACGGGGACTAATACCGAATATAGGGGGATGGGCTCGCGGCCTATCAGCTGGTTGATGGGGTGATGGCCTACCAAGGCGGTGACGGGTAGCCGGCCTGAGAGGATGAGCGACATAAGTGGGAATGAGAAAAGGCCGAGAGTCGTACGGGTGGGAGCAGTGGGGGATATGGCACAATGGGGGAAAGACAGATGCAGCGACGCCGCGTGGGGGATGAAGGCAAGCGGGTTGTAAACCTGTTTAGCTATCGAACGGGTAGGTGGAGAAGAAGCGCCGGCGAACTACGTTCCAGCAGCCGCGGTAATAC\n>URS0000A77429 sRNA from 1 species \nTTTTTGGGTGATTAAAATCCATATATTTTGTTACACTAGTTTTCATTCTATTTGAGACAACACGTTTTGTATGTTTACACGATTGTACGGCCACCTCCAAACCACGGGTTCGATGACAGATCAGTGATCACCTCTTTATTGGTTTAGCAAACGACGGCCCTAACCTCGATCCTTTCTCTCGGTTCCTTCTCTAATGGGT\n>URS00004E56CD rRNA from 1 species 
\nGACGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGGAGTTCCTTCGGGGACTTAGTGGCGAACGGGTGAGTAACGCGTGAAGAACCTGCCTTTCAGTGGGGGACAACAGTTGGAAACGACTGCTAATACCGCATAACATATATTGTGGGCATCCACGATATATCAAAGGAGCAATCCGCTGAAAGATGGGCTCGCGGCCGATTAGCTAGATGGCGGGGTAACGGCCCACCATGGCGACGATCAGTAGCCGGTCTGAGAGGATGAACGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGAGGCAGCAGTGGGGAATATTAGGCAATGGGGGGCAACCCTGGACCTAGCAACGCCGCGTGAAGGAA\n>URS000163D073 rRNA from 1 species \nATACGTAGGTGACAAGCGTTATCCGGATTTACTGGGCGTAAAGGGCGTGTAGGCGGTCTTGCAAGTCAGAAGTGAAATTCCTGAGCTCAACTCGGGCGCTGCTTCTGGAACTGCAGGACTTGAGTGCTGGAGGGGATAGCGGAATTCCTAGTGGAGCGGTAAAGTGCGCAGATATTAGGAAGAACACCGGTGGCGAAGGCGGCTATCTGGACAGTAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGGGTTAGATACCCTGGTAGTCCACGCCGTAAACGATGAATACTAGGTGTAGGGGGTATCGACTCCCTCTGTGCCGCAGTTAACACAATAAGTATTCCGCCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAATGAATTGACGGGG\n>URS00025C2B18 rRNA from 1 species \nATGGCGATGGAGACGCCCGGGCAGGAAGGGCTCGATCCGGATGAACCAGCTCGCACCGAGCCCGGCCGCCTCAACAGGAGCTCGTATCTCTGCCTGCCAGCGGCTCACCGGAGCCGCCACTGCCGGCGACTGCCTCCCTCACCTTGTGCCCCTCCTCCTTCGCCTTTCTTCCTCTCTTCCCCGAGGAGCGGGGAGCCGGCGAATCCATCGGTCAGGAGCTGGGCGGCGCCCTCCATCATCGCCGTTGTTTGGGGAGGGACGCGGTCCTGGTCGATGCGGTATGGGGCGGGCGACGCGGGGCAGGAGGTGGCGGCGGGATGGAGGTACATGTGA\n>URS0001D99DCB rRNA from 1 species \nATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGCGAAAGTTCTTCGCTATGTGTAAAGCGGCGGACGGGTAAGTAATGCATGGGAATTTGCCTGGTAGTGGGGGACAACGTCTCGAACGGGACGCTAATACCGCATTAGCCCTACGGAGGCAAGGGGGGGTTCTTCGGACCTCTCGCTATCAGCTGAGCCCATGTCAGTTTGGCTCGTTGGTGGGGTAAGGGCCTACCAAGGCGACGATCGGTAACTGGTCTGAGCGGAGGATCAGTCGCACTAGAACGGGAACACGGTCCATACTCCTACGAGAGGCAGCAGTGGGGAATAGTGGACAATGGTCGAGAGCCTTGTCCAGCGAGGGCGAGTGTGTTGAGAAGGCCTTGGGGTTGTAAAGCACGTTCAGTGGTGATAAAGGTTTTTTACTTGATACGTAGGCAGAGTGATGGTACCTGCAGAAGAAGCACCGGCTAACTCCGTG\n>URS00025F9C51 lncRNA from 1 species 
\nTAGCTTTGAGAAACCTAGCCACACTTTCAGCACTCAGGCCTTTAGTGCTCATTGGAATAAGGTCCCCGCAATCCAATGTCGACCTACAAATGAAGTTTTTTACGGACAGGAGCATTTTTCTTCAACATGGAACTAACAGTCATGATTTTCTTCTCATAACGTAAATCTGAAAGGTCACTTGTTACATCCGACATCGGGCTGAAAATGTATACACATTGCATTGTGTTAAAAAGAATTATGATGGAAAAATAGTGAGATCTCTCTTTCTAGACTGTAGGGTGATGAACCTGTACCAATCATACTGTCTGTCTTATTTATCTGACAACTGTCCCGATACTGAAGAAAATGTTGACAGACAACACAATTAGGCTAGGAAGACTAGATGGTCAGTGATTCAAAATTACTAAATTTGAATTGTTACATAAAAAAAGTAACTGGTTTACAAATTATCCTAACAGTCAAAATTTGTTAAAGATATATTTTTAACCATTCAAAATTCAACTTTAAAGGTGGGGGGGGCAGAATTCATCACTAATGTCCTAGCTTCGAATCTAAGTAGCTCTGAATTTGATTGTAAACTACTTCATACTTAATCTCAAAATACTATTTTTATATTTGCTTATGTGTTTCATCCTGACATCTTCAGGGTTGCTAAGAACGGCATTCATACTCCAAAATTACAATTAAGTTCAGAACTTATTAGAAACATGTTTTTCTCAAGGGAAGTATGTGGCCTATTTGCCAAGAGAGAATTTTTTGTGTCAGAGCCTGTGCTCCCCCCCCTTTGGTTTTTGAATGCATTGTGCACAAGAGAAAACTTGGTCCAGAGCTTTCTCTATAAAACTGAGTGTTAATGTAAGAGAGTTGGCCAAAAAATAAGATAACTTATGTACAGGAATTATTGTAAATAAACTTGTAGGGTAGTACACTTTTTTTCTGCGTGTTACCTCTTGTACCCACATGATGATGATGTCAACTCTCTCCCTCTTGGCTTTACAACATTTTCATAATCCTATAATGATAAATATACATTACTCATTCAATTTTAACACAATACACTGGTAGATATGGTATTAATAGATTTAATTTTATATTAAAACACGATCCGAAAACACACACTGAACATGGTCACCAATACATTAAACAAAGAGAAGCAGAGAAATATTTGTTGCATATATAAGCACATGGATTAAATAGTTTGGTTCATTAAATAATAAAGAATCTACATCAAAGTGA\n>URS00009B757A lncRNA from 7 species 
\nAATTAGCCTCAGAGGTTTAAGACTTGCTTGCAAGTGTGCCTTCTGTTTATAGGTTAAGCTAGCTATTTTAATTCTATTATTTGTGAGTTCTCCATAGATGTAAAGTATGACGTAATTCATGTGCCAGGCCACATTGGAGATAGTCAGCTGCCATCGAGCCAGAGTTCCGCAGGCCCTCAGCCAGAGCTCCTCACCAGGGACCCTGCTAAACAGGCAAATCCGCATTCTAACACTGAGCAAAGATTCCTTTCTGAAGGTTGGGGAGTCTGGCATGCACCAATCAAAGGCCTTTCTTTATTGACCACAACACCCAAGACTGCCACCTGGGTAGCTTCCTTCCATACTCCTCACTTTAAATTTATAGCAGCAATTGCTTCTCAATGTAGTCACATGTGCTGGTATAATCTGCCTTTCTTTCTTTCTTTTTTTTTTTTTAAGATTTATTTATTTATTATATGTAAGTACACTGTAGCTGTCTTCAGATACTCCAGAAGAGGGAGTCAGATCTCATTATGGATGGTTGTGAGATGGTTGTGAGCCACCATGTGGTTGCTGGGATTTGAACTCCAGACCTTCGGAAGAGCAGTCGGGTGATCTTACCCACTGAGCCACCTCACCAGCCCGTAATCTGCCTTTCATAAGAATGAATTACAAGTAAAAATCTTGGGGTTTAGATTTTGTTTTGGTTTTTTTTGGTTATTTGAGGTAAGGTCTTATGTAGCTCAGACTGTTCTAGAACTTGCTGTATAACTGAAGCTGAACTTGAATTCCTGATTTGCCTGCTTCCACCTCCTAGGTACCACACAGAGGCCCTGTTTCTGTGGTGCTAGGATTTATTTTTATTTTATATACATTGGTGTTTTGCCTGCGTGTATGTATATCTGTTTGAAGATGTCAGATCACGTGGAGGTGGATTACAGATTGAACTTGCATCCTCTGGCCGAGCAGCGCCAATCTTAACCACTGAGCCATCTCTCTAGCCCTGGAAGCCAGGGCTTTATGCATGCTAGGCAAGTGCTTTCCAATTGAGCCACCTCTCCAGCTCTAGGGAATCTTAATATTATTTTATTCAAGGTACATTTATGCTTCTTTTGACTTAGATTAGATTTTATGAAGGTGTTCCATTTTCTAGTTTTTGGTTCACTCGTCTTAAAAACTTAGGAAGACTTTTAGTAATAATTTTCTACCTCTATATGAGACTTACTATTTTCAGAGAACTTTCAAGTTTCTATCTCATTTATTAATACTCCCAGAAAGACTCTGTGAAGCTAAGATGAACAGATATTTATTGCTATTATTGTTGTTTTCAGAATTTATTTACATTATTTTGCATGTATGACTACCTACATATGTGTCCATGGAGGCCAGAAGAGGTGTCAACACTTAAGACTTAAGAACTATTTTAAGGGGCTGGTGAGATGGCTTAGGGGTTAAGAGCGCCGACTGCTCTTCCAAAGGTCCTGAGTTCAAATCCCAGCAACCACATGGTGGCTCACAACCATCTGTAAGGAAATCAGATGCCTCTTCTGGAGTGTCTGAAGACAGCAACAGTGTACTTACATATAGTAGATAAATATTAAAAAACAAACAAACAAACAAACAAACAAAAAAAGAACTATTTTAAAAGCTATTTCAAAGGTTTGAATAGCTAAAACAAATCTAAAAGAGTTTAATAACTTAGTATAATAATATTAAGGTAATTATACTTTAACTAATCCACATAAACTGAACTTGGTTCTCTTTTTTTAAGATTCAAATAGATCTTAGTAACCTTTTTTAGTCTACCCTTCTTTCAAAGAAAGAAAATCAATATTCAGATAGGACCACAATATGTGATTCTGCTTGTTTATTCATTCATTTGTTTGATCACACCCATGCAGTTATTTATCCTGTATGTGCACATGCATGTGCACAGCATCTGTGTGGAGATCAGGGGACAGTTAACTTGTAGGGGCCTGTTCTATACTTCTGTTCTGTCATGTGAGTCCCAGGTATCAC
ACTCAGATTATCAGACCTGGTAGTAAGCATTTAGCCCCCTGAGCCACCTCACCAGCCCAGATGTGGTCCAGTCTAATGCCACCATCTTATACCAGTTTCTGTGCAGAGAAAAACTTGATGTAGTTTGGGTTCCAATGGACTGGGCAGAATGTTCTCAGAGGCTTCGCAGTCGGCTGAAATGGGTCTCAGTGGAAGACATCACTCCTGAGCCCACTGGGGAGTGGCGTTCTCACCCATCAGTAGGACCTCCCAGCAGTATCTTCCAGAAGTAGAAATAAGTCACAAGGAAAGGAATTAAAGATGAAGTACAGTGAGGTGGCACAGCCCCTAGCCCTACCACTCAAGAGGCTGTGCGGTAGGAACACGGGAACTCCAGCGCCAGTCTGGGCTGTGAGCTCTTGTCTCAAAAAGCCAAACCATCGGTGTAAATGAAGTATAAAAGAGAATTTTATTTATTTCATTATTTTTTCATTTTCATGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGCTACACATGTACATTGCCTGCCATCCAAGGCTAGAATTAGAGTGGACCATGGTGCCTGCCTGGTGTTTGCTTATTCTTAGAATCCAGGCTTCTGTCCTCACTGTTGCATGGCAAATGCTTTAACTACTGAGCTGCTTCTACAGCTCCAAAGAGTATTTTAAAATCTATTGGCATTACAAAGCAACTGTAGCACAATGACTGGCATTATTTTAAAATGTGTATGTCGTTTTATTTATGACT\n>URS000181443A rRNA from 1 species \nCACGTAGGGGGCGAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGATTTGTAAGTCAGGGGTGAAATCCCGGGGCTCAACCTCGGAACTGCCTTTGATACTGCAAATCTCGAGTCCGGAAGAGGTGAGTGGAATTCCTAGTGTAGAGGTGAAATTCGTAGATATTAGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGTCCGGTACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGG\n>URS00010F31BB rRNA from 1 species \nCCTACGGGTGGCAGCAGTGAGGAATATTTGTCAATGGACGCAAGTCTGAACCAGCCATGCCGCGTGCAGGAAGACGGCTCTATGAGTTGTAAACTGCTTTTGTACGAGGGTAAACGCAGATACGCGTATCTGTCTGAAAGTATCGTACGAATAAGGATCGGCTAACTCCGTTCCAGCAGCCGCCGTAATACGGAGGATTCAAGCGTGATCCGGATTGATTGGGTTTAAAGGGTGCGTAGGCGGTCGGATAAGTTAGAGGTGAAATCCCGAGGCTCAACTTCGGAATTGCATCTGATACTGTTCGGCTAGAGTGTAGTTGCGGGAGGCGGAATGTATGGTGTAGCAGTGAAATGCGTAGAGATC\n>URS00003180C5 rRNA from 1 species \nGGGTGGTAAATTTCATCTAAAGCTAAATATTGGCCGGAGACCGATAGCGCACAAGTAGAGTGATCGAAAGGTTAAAAGCACCTTGAAAAGGGAGTTAAACAGCACGTGAAATTGTTGAAAGGGAAGCGCTTGCGGTCAGACTCGGGCGCAGGGTTCAGCGGGTGCGTGTCACCCGTGCACTCCCTGCCGCCCGGGCCAGCATCAGTTCTGACGGCCGGTCAAAGGCCCCCGGAATGTGTCGTCTCTCGGGACGTCTTATAGCCGGGGGTGCAATGCGGCCCGTCGGGACTGAGGAACGCGCTTCGGCTCGGATGCTGGCGTAATGGCCGTAAGCGGCCCGTCTTGAAAAACACGGAC\n>URS00019A9808 lncRNA from 1 species 
\nTGAGTTCTTGATTAGAATAATTATATTATATGTATGTATAATATGTCAAAATATACTCTAATATCATGTATACATTAAAAGAACAAAGGAAAAGAACATCACTGGAATTGAAAAGGGCATGGTGATACAAGCTAATGGTACTAAGAACTTTTCAGTCGAATAATAGAAAAAAATTTTTTAAACTTCAAGTATTAGGTGAACATTTAGGAGTCATATAGAACTAAACATATAAAATAGCAAAAAAATCTCTCTGACACATCATAATCAAAATGCCTAACATAGTGAATAAGAATGGAATTTTAAAACTGCAAGGAAAAATGTCAGAGCCAGGCACAGTGGTACACCTGTAATCCCAGGGGCTCAAGAGGCTGCTACTTCAAATCTAGCCTTAGCAACTTATCAAGGAACTAAGCAACTTAGAAAGACCCTGTCTCTAAATAAGTTACAAATAATGGCTGAGAATGTGGCTCAGTGGTTAAGTGCCTCTTAGTCCAATCCCCAGTAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGAAACATGTCAGCACACATTAGAGGTAAACCAGTGCAGACAACTCCTCAGTTCTTCACACCATTTTAAATCCAGGAAGGCATAGAATGAGGTTATCTGATCTCTGAAAGAAAATTCCCAACCAAGATCACTATATACAGCAAAACCATCCTTTAGAATCAAATAAAAAATAAAAACTTCCAAAAATGAGAATATACTAAAAGAATTCATGACTACAAGGTAGCACTACATAAAATACTTAAAAAAATACTATCCATAGAAGAATTTAAAAATAATCTCAACTTGCCTCTAATGTGGGCTGCCATTTTTCTCTTTCAGCTTTTAAAATTCTATCTTTGTTCTGTGTAGTAGATGGTTAATTATGATGTGTCTTGGGAAGGATGTTTTTTCATCTTATCTATTTGGGGTTCAAAATTCCTCTTGTATTTGGATTTCACTTCATTCCTACAGTTTGGAAAACTTTTTGATATAGTTTCACTGAAAATTTTATACATTTCTTTAGTTTGTGTCTTGGTGCCTTGTTCACAAAGAGTCTTAGAATTGAGCTCTTAATGCTATCTCTGATTTCTTGTATATTCTGGTCATGATTTGTTACCTTTCATTTATTGTTGACTTTGCTTTTAAAATTGTATACTTCATCTTTGATATTAGAAAATCTGCCTTATGTGTGGTCTAATATATTGGTGATGCTTTCAGCTGAATTTTTTATTTGATTTATTATTTCTGTTCCAGAATTTGTTCTTTTCAAAAATTTCTGTTTATTTTAATATTATATCATTTCTGGTATATTATCTCTTAGTTCACTTCATAGCTATGCCTTTAGTACACTGAAAAATTTAATTAGCAGCTGTTTTAATCAGCTTATTTTGCTACTGTGAACTCAAGACCCATCAAGAAAAATATTAGAGGAAGAAAACTTGATTTGGGGGCCAACGGTTTCAGAGGTCTCAATCAATAGACAGCAGGCTCCCATCCTCAGGGCTCAAGGTGAGACTACTCATCATTGCAAAGGGAAGCAGTTCACATGATGAACAAAAGGCAGAGAGAGCGGTCTCCACTTGCCAGATACAAATATATACCTCCAAACCATGTCCTCAATTCCCACCTCAACCAGCTACAACCCACCACTGCAGTTACTACTCAGTCAATACCTATTAAGGGATTAATTCACTGGTTAGTTAAGACTCTCACAACTCTATTATTTCTCCTCAGAACCTTCTTGCGTTTTCTCACACATAAGATTTTGGGGAACACTTCATATCCAAATCATACATAAATTTTCTAAATTCTTTTTCTGGCATTTCCTCCATTATGATATCAATGGGATTAGTTGTATTGTGGGGTATTCGGAATGACTTGATTCATTGCTTTCCATATTGTTAGTATTCCTTAAGGGATATTTATCTCTTTTGCTTTTATATAAAGGACATTTTCTTGTTATGCTGTGGGTTGGGT
GAATGCCTTGAGGTCCACATTTTCACTCAATTTAAATTTCCTATTATGTCTAGTCTCTAAGAGGACACTGAGAGGAGAGAGATTAATTTCAAGTAGTTACAACCACTTCAGAACAATTTCATACTCATAAATCTTTTAAAAACGTATTACAAATGTTCTCCAGAAATCCACTAGTCTGAGTGGTAAATGGGGGTGATTTTATTTAATTGGTTGATAAATTAGTTA\n>URS00020D7727 misc_RNA from 1 species \nGACGAAGAAACGCAGCGAAATGCGATAAGTAATGCGAATTGCAGAATTCAGTGAGTCATCGAATCTTTGAACGCACATTGCGCCCCGTGGTATTCCGCGGGGCATGCCTGTTCGAGCGTCATTTCAACCCTCAAGCCTGGCTTGGTGTTGGGCTCTGCCGTCCGCGGCCGGCCCTAAAGACAGTGGCGGCGCCGCATGGCCCTGAGCGTAGTACATCTCTCGCTCCAGGGCCCCGCGGTGGCCTGCCAGAACCCCCAACTCTATGGTTGACCTCGGATCAGGTAGGGATACCCGCTGAACTTAAGCATATCAATAAGCGGAGGA\n>URS0002581D6F miRNA from 1 species \nTGTGTATTTAGCAGTCTGTGTGTGTGTGTGTATTTAGCAGACTGTGTACTCAGCAGTCTGTGTGTATTCAGCAGTCTGCTAAATACCCATACAGACAGACTGCCGAGCAC\n>URS00017F4189 rRNA from 1 species \nTACGGAGGGTGCAAGCGTTATCCGGATTCACTGGGTTTAAAGGGTGCGTAGGCGGGCAGGTAAGTCAGTGGTGAAATCTCCGAGCTTAACTCGGAAACTGCCATTGATACTATTTGTCTTGAATATTGTGGAGGTAAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCAATTGCGAAGGCAGCTTACGACACAATGATTGACGCTGAGGCACGAAAGCGTGGGGAGCAAACAGG\n>URS00025256B9 misc_RNA from 1 species \nTCCGGTTTGTCACCGGCAGTCTCGCATGAGTCCCCAACTGAATGCTGGCAACATGCGACGGGGGTTGCGCTCGTTGCGGGACTTAACCCAACATCTCACGACACGAGCTGACGACAGCCATGCACCACCTGTGAAGGTGCCCCGAAGGGAGGCCGTGTTTCCACGACTGTCACCTACATGTCAAGCCCAGGTAAGGTTCTTCGCGTTGCCTCGAATTAAGGCACATGCTCCGCCGCTTGTGCGGGCCCCCGTCAATTCCTTTGAGTTTTAGCCTTGCGGCCGTACTCCCCAGGCGGGGCGCTTAATGCGTTAGCTGCGGCACGGAACTCGTGGAATGAGCCCCACACCTAGCGCCCAACGTTTACGGCGTGGACTAC\n>URS00002B3B99 rRNA from 1 species \nGGAAAACCGTAGAGATACGGTCCCCCCTTGTGGTCGGTGTACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCTTATGTTGCCAGCACGTGATGGTGGGGACTCGTAAGAGACTGCCGGGGTCAACTCGGAGGAAGTGGGGACGACGTCAAGTCATCATGCCCCTTATGTCCAGGGCTTCGACACATGCTACAATGGCCAGTACAGAGGGCTGCGAGACCGTGAGGTGGAGCGAATCCCTTAAAGCTGGTCTCAGTTCGGATCGGGGTCTGCAACTCGACCCCGTGAAGTCGGAGTCGCTAGTAATCGCAGATCAGCAACGCTGCGGTGAATACGTTCCCGGGCCTT\n>URS00000C876E sRNA from 1 species \nTGGAGAGGTGGTCCAGGGTTACGTAAA\n>URS00005C10BC rRNA from 1 species 
\nGATGAACGCTAGCGGCAGGCTTAATACATGCAAGTCGAACGGGATTTAGGGGCTTGCCCTTAATGAGAGTGGCGCACGGGTGAGTAACACGTACACAATCTACCTTGTACAGGGGGATAGCCTTGGGAAACTGAGAATAATACCCCATAGTTTTTAGTTATCGCATGATGATTAAAATAAAGCTGAGGCGGTACAAGATGAGTGTGCGGATGATTAGGTAGTTGGAAGGGTAACGGCCTCCCAAGCCGACGATCAATAGCTGGCGTGAGAGCGCGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATATTGGACAATGGGCGGAAGCCTGATCCAGCCATGCCGCGTGGAGGATTAAGGCCCTCTGGGTTGTAAACTTC\n>URS0000CDD785 rRNA from 1 species \nTTTAATTGAAGAGTTTGATCATGGCTCAGATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGGTAACAGGAATTAGCTTGCTAATTTGCTGACGAGCGGCGGACGGGTGAGTAA\n>URS000241D8E8 lncRNA from 1 species \nGAAACTTGATCTGAGTGAAACCGCAATTGAAAGTCTACCTGCAAGCATTGGTAATTTGGAATCTCTTGAGAACCTTGATTTGAGTGGAACCGCAATTAAAAGCCTACATGCAAGCATTGGTAAATTGCAATATCTTCAGAAATTTTATCTGAGTGGAACCGCAATGGAAAGCCTACCTGCAAGCATTGGTAATTTGAAATGTCTGGATAAACTTGATCTGAGTGGAACCGCAATTAAAAGCCTACCTGCAAGCATTGGTAGTTTGAGATCTCTTGAGAAACTTGATCTGAGTGGAACTGCAATTGAAAGCCTACCTTCAAGTATTGGTAGTTTGAAATCTCTTGAGAACCTTGATTTGAGTGGAACCGCAATTGAAAGCCTACCTGCAAGCTTTGACAATTTGAATTCTCTTGTGAAACTTGATCTGAGTGGAACCGCGTTTAAAAGCTTACCTGCAAGCATTGGTAATCTGAAATCTCTTGAGAAACTTGATCTGAGTGGAACCGCAATTGAAAGCCTACCTGCAAGCATTGGTAATTTGAAATCTCTTGAGAAACTTGATCTGAGTGGAACCGCTGTTGAAAGCCTACCTGCAAGCATTGGTAATTTGGAATCTCTTGAGAAACTTGACCTAAGTGGAACAGCAATTAAAAGCCTACCTGCAAGCATTGGTAATTTGGAATGTCTTGAGAAACTTGATCTGAGTGGAACCGCAATTGAAAGCCTAC\n>URS00006EC10E SRP_RNA from 2 species \nGCTGGGCGTGGTGGCACGTGCCTGTAGTCCCAACTTCTCGGGAGGCTGAGGTGGGAGGATCGCTTGAGCCCAGGAGTTCTGGGCTGTAGTGCGCTATGTCAATTGGGCGTCCGCACTAAGTTCGGCATCAATATGGTGATCTCCCGGGAGTGGGGGACCACCAGGTTGCCTAAGGAGGGGTGAACTGGCCCAGGTCAGAAATGGAGCAGGTCAAAACTCCCGTGCTGATCAGTAGTGGAATCGCGGCTGTGAACAGCCACTGCACTCCAGCCTGGGCAACATAGCGAGACCCCATCTCTA\n>URS00007D8A7A rRNA from 1 species 
\nTGAGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGTCTTCGGATTGTAAAGCACTTTAAGTTGGGAGGAAGGGCAGTTACCTAATACGTATCTGTTTTGACGTTACCGACAGAATAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCGCGTAGGTGGTTTGTTAAGTTGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTCAAAACTGACAAGCTAGAGTATGGTAGAGGGTGGTGGAATTTCCTGTGTAGCGGTGAAATGCGTAGATATAGGAAGGAACACCAGTGGCGAAGGCGACCACCTGGACTGATACTGACACTGAGGTGC\n>URS0001F1218A rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCCTTTGGGGGTACTCGAGTGGCGAACGGGTGAGTAACACGTGCGTAACCTGCCCTTGACTTCGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAATCCTTGCTGCATGGTGGGGGTTGGAAAGCTTCGGCGGTTTTGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCTGGCCTGGGAGGGCGACCGGCCACATTGGGACTGAGATACGGCCCAGACGCCTACGGGGGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATGACGGCCTTCGGGTTGTAAACCGCTTTCAGCAGGGGCGAAGCTTGTGGTGACGGTACCTGCAGAAGAAGCACCGGCTAACTACGTG\n>URS000062BC82 tRNA from 2 species \nGGGATTGTAGCTCAGTGGCAGAGCACTTGCCTAGCACATATGAGCCACTGAGTTCGATCCTCAGCCCCA\n>URS000041D298 rRNA from 1 species \nAGTCGAGCGAACGGATGAGAAGCTTGCTTCTCTGATGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATTTTGAACCGCATGGTTCAAAAGTGAAAGACGGTCCTGCTGTCACTTATAGATGGATCCGCGCTGCATTAGCTGGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCATAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAAACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACATATGTGTAAGTAACTGTGCACATCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGTTTTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGAAAACTTGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGCAGAGATATGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACGCTGATGTGCGAAAG\n>URS00020E5DB6 misc_RNA from 1 species 
\nGATGAAGAACGTAGCGAAATGCGATAAGTAGTGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCCTTGGTATTCCATGGGGCATGCCTGTTCGAGCGTCATTTGTACCTTCAAGCTTTGCTTGGTGTTGGGTGTTTGTCCTGAGGGACTCGCCTTAAAGTAATTGGCAGCCAGTGTTTGGTTTTGAAGCGCAGCACAAGTCGCGATTCAAGGCTATACACCAGCTTCCACAAGCCTTTTTCACTTTTGACCTCGTATCAGGTAGGGATACCCGCTGAACTTAAGCATATCAATAAGCGGAGGA\n>URS0002614DC9 lncRNA from 1 species \nGAAACAAGAGAGTGTGAGAATTGTCACGTGATCTCGATGACGCAACAGTATTAACCACTGTATTTAAGGCTTTTCTTTTGGCAATTGTGACAAATATTTGTGCCAGATGGTTTTCATACATCATGTGATGTACAAAACACGTCATTCTTTTATTAAGAAAGAGAACCTGACTTCAGTATCCTAGCGTACTTAGTAATCAATAGTTTCGTAAAGTTGTTCTTGTTTGTATACTTTGAGTGCGTGTTGTAATTATATTATAGTTGATAGTGGAGTATAATTATGAAGCTGAAGATCAAAGTAACATATTGTGGTGCCTGAGGGTACGAGCCCAAGTTCCAGAAACTTCAAAAGGAACTTGAGCAGAAATTTCCTGGAAAGTTAGACATTGTAAGTTACTACTTCATGCATTTGTGATTTGCAAAAAGGTTGT\n>URS0000D36178 rRNA from 1 species \nAGTCGTACGAACAGCGGAAAGTGCTTGCACTTTCCAAGTAAGTGGCGAACGGGTGAGTAACACGTGAATAACCTACCTCAAAGACTGGGATAACCATTGGAAACAGTGACTAATACCGGATAAAACCCAGTAGCACATGCTACAAGGTTAAAAGCTGCGTTTGCAGCGCTTTAAGATGGATTCGCGGTGCATTAGTTAGTTGGTGAGGTAAAGGCTCACCAAGACAATGATGCATAGCCGAGTTGAGAGACTGACCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCTGCAGTAGGGAATCTTCCACAATGGGCGCAAGCCTGATGGAGCAACGCCGCGTGTGTGATGAAGGCTTTCGGGTCGTAAAGCACTGTTGTATGGGAAGAACGGGTTTAAGAGGAAATGCTTAAGNAGTGACGGTACCATACCAGAAAGGGACGGCTAAATACGTGCCAGCAGCCGCGGTAATACGTATGTCCCGAGCGTTATCCGGATTTATTGGGCGTAAAGCGAGCGCAGACGGTTCGATAAGTCTGAAGTGAAAGCCCACAGCTCAACTGTGGAATGGCTTTGGAAACTGTCGAACTTGAGTGCAGTANAGGTAAGTGGAACTCCATGTGTAGCGGTGGAATGCGTAGATATATGGAAGAACACCAGTGGCGAANGCGGCTTACTGGACTGCAACTGACGTTGANGCTCGAAAGTGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACACCGTAAACGATGGATACTAGTTGTTANAGGGTTTCCGCCCTTTANTGACGAAGCAACGCATTAAGTATCCCGCCTGGGGAGTACGACCGCAAGGTNANACTCNAGNAAT\n>URS0001AD154A rRNA from 1 species 
\nCCTGGTTGATTCTGCCAGTAGTCATACGCTCGTCTCAAAGATTAAGCCATGCATGTCTAAGTATAAATACTTGTACTTTGAAACTGCGAACGGCTCATTATATCAGTTTTAATCTACTTGATAGTCCCTTACTACTTGGATAACCGTAGTAATTCTAGAGCTAATACATGCGTCAATACCCTTCTGGGGTAGTATTTATTAGAAAGAAACCAACCCCTCCGGGGTGATGTGGTGATTCATAATAAGCTTGCGGATCGCACGGCTTTTGCTGGCGATGGATCAATCGAGATTCTGCCCTATCAGCTTTGGATGGTAGGGTATTGGCCTACCATGGCTTTAACGGGTAACGGGAAATTAGGGTTTGATTCCGGAGAGGGGGCCTGAGAGATGGCCACCACATCCAAGGAAGGCAGCAGGCGCGTAAATTGCCCAATCCTGACACAGGGAGGTAGTGACAATAAATAACAATGCCGGGCCTTTTTAGGCCTGGCAATTGGAATGAGAACAATTTAAACCCCTTATCGAGGAACAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTGTGGGTGGAGCGACCGTCCCGACGCTTTGCGTGGGTGATGGTCGTCTCCGTCCATCTTTGGGTGGAATCCGTGTGGCATTAAGTTGTCGTGCGGGGGATGCCCATCTTTTACTGTGAAAAAATTAGAGTGTTCAAAGCAGGCTTACGCCGTTGAATATATTAGCATGGAATAATGAGATAGGACCTGGGTACTATTTTGTTGGTTTGCGCACCGAGGTAATGATTAATAGGGACAGTTGGGGGTATTCGTATTCCATTGTCAGAGGTGAAATTCTTGGATTTTTGGAAGACGAACGACTGCGAAAGCATTTACCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCGAAGATGATTAGATACCATCGTAGTCTTAACCATAAACTATGCCGACAAGGGATTGGTGGGCGTTGTTTTGACCCCATCAGCACCTTATGAGAAATCACAAGTTTTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGAAATTGACGGAAGGGCACCACCAGGAGTGGAACCTGCGGCTTAATTTGACTCAACACGGGAAAACTTACCAGGTCCAGACATAGTGAGGATTGACAGATTGAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGGTTAATTCCGTTAACGAACGAGACCCCTGCCTGC\n>URS0000B34B7F misc_RNA from 1 species 
\nATAAAAGTACCTCAGGCTGAGAAGAATTTGCAGATGAATGATATATCTTTCTATTTGTTAGTGTCAGTGCAAAAGTTTGTTTGAGACTTGGCCACTTTAAGTGAACAAGATATAAGATTGATTTATGGCTTACATACAAGATCAATTGTTCAAAAATGTTAATAAAAAATATAAAAAATTTCATATAAGATAAATTCATTACTTGGCCAAAAACATAAACTCCATGAGAGAGTGTCAAGTACATAAGAACATTGAAAGAAGTAAAATGGGAAAAAAGAACCTGGCTTACTCTAGGTTTTATTGTTGTGAACATCCTCATTTAAGAATTTTAATTAGCGATAAGGTAGCCAACTATGCTTTATTTTTTTTCTTTTTTGAATGAATGCTTTAAATTAATTTAAAAAAAATAATAACTTCAATTAGCAACAAATAAAAGCAATAATAATACTAATCTAAGAGAAGATGTTTAGAATAGCCTGGGATATGTCGATCGAGGCACGCAAATTCTGCGCTGTCCTTAGAGGTTAGCTAAGCTACTCCTATGATTGTTTTTTCATATTTGTTTACTTGAACCACCCTTCAACTTAATTGTCCAAGTGTTCATAGAGATAAATCAAAACTGTAATCAAATTTATATGTAATTTACTTGTTTAAGAATCACATTTTTGAACATTAAAAACTTGTTAGGCTTCTGCACAGTGACAAAGCCCAAGCCCAG\n>URS000228E453 misc_RNA from 1 species \nAACTTTTGGCAACGGATTACTCGGCTCGTGTGTCGATGAAGAGCGCAGCCAGCTGCGTGAATTAATGTGAATTGCAGGACACATTGAACATCGATATCTTGAACGCATATTGCGGCCTCGGGCAATCCCGAGGCCACGCCTGTCTCAGGGTCGGTTGAACGTCAATCGCGAAGCTGCTCTCCTCGCTCGCGCATTGGGCGTCGCAGTCGCTACCAGCGGCTGCGTCGCCTCAAGTTCAGACGGGTTGCTCGGTCTTCGACGCGTTCGCCTGACCGGGACGGTGACTCGACTCTCGTAGAGCGCACCATCTCCCGGGTCGTGGCGATTGTCGCTGACGTGCGGCGACCGCAAACATACTCACACTGACTTCGACCTGAGATCAGACGAGATTACCCGCTGAATTTACGCATATCAATAAGCGGAGGCT\n>URS0001A2104B lncRNA from 1 species 
\nGTGGAGGCGAAGTCAAGATCGAGAGCCGGAAGGTCAACTTTAAGGAGAAAGCTCAGCCCAAGGTGAGCTCGATGGATAATGTTAATCACGAGCCCGGAGGCGGGAATGTCAAGGCTGAGGGGGCGCAGGAGACTGCTGAGGGCAGCGGGGCTCCCTCTAGTGGTGTCTCAGCAGGCCCTGCCCAGGAGAATGGGCTGAAGGAGGGCGCCCCCTGCAGGAGTGAGGAGCTCCGGGACCCGCAGGGCCTGGACTCGCTCATCCCTGAAACAAGCATCTAACTCGACTTTTTGCTATCACTCTGCCCTCTTCATTTCCCCCCCCCGACCGCTTCCTCTCCTCCCCTTCTTTATGTCCTGTCCCTCCTCTGTCCTGTCTTTCTCCACACTCTCTGATGCAGATTGAGTCTTTCAAGCTAAATTTCCGCGAGAAGGCCCGCTCTCGCACGGACCACGGCGCCGACATCATCACCTGGCCCGTCTCGGGTGACAGCCCTGCCCCCCCCCACCTCGCTCCGCAGCAGCGTCTCGCTCAACGACTCCCTCGCGACCGCCGGCATCCCTCGCTCTCACACCACCCCGGCCCTCTCCTCCTCACAGGAACAAGGCTCGCTCACCGGACTCTGGATATGATTTCTGTCTTTTCATTGGCCCGCTGCTCTCTAAACCCCGCCCCCTACCATTGCTAAGACTCATGTGATTGGTGTGCTCTCTGTTGACGTTCTTGATTCCTGATTGGTGAGGCTGTACAGATTACAGTCATCAGGATGCGCTAAAAAATGAAGGCTGCTGACCCGAGGGTCTGTAAACTCTGAGGTTACACTCTGAGTACATCCTGCTACATCACTTGTTGTAGATCTGATCACATGCAAACACATCTGGACATCATCTCTAGCTGCCTTCAAGTCCTCATGGGAAGTTCGTACTTACGAGTTGTTTACGATGCGATCGTGTCATGTGATTTTAGATGGAAAAAATCACTTTCTGACCAAACCAAGAAGCTTCTTTTAGTGCCAAAGCAACAAAATGAAGAGCAAAGCATGTGCATTAGATGTGTGCATTTGATCATTCTAATGAATAGGGAATGTAGTTTGGTTTTGTGAAGATTTAATTCACGTTCACACTACATTTCGAGCATGCAAAGTGTCTACAGATTTAAAATACACTGAAAAAAAATAAAATAAATTGGTGCACGAACAGTTTTCGCTCAGAAACGGCTTAATTTCACAAACAATTACAAAGAAACCGCATGCAACGCGTTTGAATTAGACGCGCAATTGTAAAGTAGAAGAATTGAAATATTTTCCTTTATTTACTACTATAAAAAGAAAAAAAAATTGTAAAATGGTGTTTTTTTTTAATAAAAATATGCAATCTGCAATCTACTGAAATATACTGCAAGTCTGCAGATTTAAAGTTTGCTGTTTTTGTTTAATTCAGCTAAGACGTCACTCCACGTGCATGAGCTTGCTTTTCCTCTCTCCACGTTTGCATGCGTGTGAATCGAAGTCAGTAGAACGTAAAGTGTAGTGTGATCGTCCCTTTATGCCTCAAAAATTGTCTAAATGAATATTATCTGAAACTTTTACATCTAAAATGGCTAACAACAGCTCCAACTCGGAAAGTCCCCCAACATCAGATGTCAGATTTGGGTGGCGCTCGTCTCGTAAGCACGATCATTTCTGCTTGATTTGAAGGCAGCATCATTCAGCATACAGGGCTGTCATGTGACCCTCTCTCACCTTCACCCTTGACCTCCAGCAGAGCTGTCATCGGAGCACATAGGCTTTCTGAATCTCTCTCTAAAGCTGTTTTGTGATGGTGTGTTTGAGTGAATACTGTAGCAATGAACCGCTTTCCTTCGACTCTTCGTTTTATTTTTCGTGACCAGCAGATGTTTCCTTTTCCTTGTTATTGTAAAGCAATATAACAGTCTCCTATAATGCCTATAAGACATGAAACTCCACTTAAACGCACAGTAAACAGCACTCAGTGTCAAACG
CAGCTCCAGACGGCTTCAGGAACGTGTAGAGGGTCTGAGGTGGACGTGTAACGAAAAATACCCTTGTGAAAAAGAAGAAACAATAATATTAATGAAATAAAAGCCCACTTAAGTGTACTTACAGTAGGCCGTTTCCTAACACACTTAAGTACGCTTTGCAATATTGTCAAATTAATTGTTTTAAAGTACATTTTAAATCATTATGTTTTGATAATCTTTGAAGACGTACACTTATTTTGACGTGTTGACTGTCATACTAAAGCGCATGTGAAATACTTGATTATAATCGAACTGTAGTGTTATGCGATATTACATTCAAAGTTATTTTACTCGGCTGCATTCATCATTACAAATGTATAATTAAAAATTTATTTAAATACATGACTTACAAGTTTAGTTTACCATGCATGCTTGTCATTGCAATCAGCAATACACTTTAACCGTGTTTCAAAGACACTAGAAGTATTTGTGAATCTGCGTATAAAGATGTACTTAAATCCTACTTACAGTAAATGGCTAAAAAACACTATAAAGTTCAGATCATTGCATTTAAAATAAATTTGAACCATTATAGACTTCATTTCAATTAACATACATTCAGTTCACACTTACAGTAAGTATATTCGTCTAAAGTGCATTGCTGTAATAAGTATACTTAAGTGTACTTCTTTTTCACAAAGGCAAGGGAAGTGTGGAGACACTAGATGTTGACTTGATGCTTGAGGGGTTTCTGTTGGGATTGAATAGTTGATGTTTTGGCATCATGTACAGTAGGTACAGTATGTTTTAAATGGAAGTGAGGATCAAGTTCGTGCCTGATAGAAATCGCATCCCTTCGGAGGGACGCAGAGACAGAATGTCAAAGCTTGAAAGCTTTTACGTACTTTTAATAGTTGCTTTACGAGAAACCAGTGAAATTGCGAGTGAGTCTGGTGGTGGTTTTACTTCTCTTATTCGTTTCTGCAGGTCTTTTTTAGGAGTTAAAGTGTGATCATGTGGGTTGAAACGTTCCTGCGGGGTTTTAATGGTGGAGCTTAATTCTCTTGTAGCATTTTACAATAGTTTATCTTCAGATGGTCGCACTGAATCACATGCTTAACACGAATCTGCTTGGTTTAGTGTCCTTTTGGTGTAATAATGGGGTAAGAGGACGTGGCCGTTCTTTTAGTGTTCATTTTGTCATCAGCTGAGGGCGATATGGAGGTCCGACGTACATTTATTTTTTATGAGTATGACAAATTATTGTTGCATCTATCTTGTCAGACCGTTTCAATCCCAGAACATACAAAGCAATAAGACTGTCACACTGACAGACCCCAGATTTCGACTTTTAGAAACCTACATCGTGCATGACGGCGTAAAGCATTCAGATCATGAAATATTACGCGATTGATCGAAAAATTTACGAATGCATGGCCATGCTACAAAATCAAGTTTCTGAGAGATAGCTACCTTATCTAAGATACAGATGGTAGACAACCAAAATGGGTAATACCGCCGCGCGTACCGCCGCCGCAGGGCCGCGGCGTTAACTTCAAGTCAGTCAAGTGTTAAAATCCTTCGCGAAACTACCACCAGGTGGCGCAAAGGGACGGATTGCGAACTGAATGTAATTGTAAAATGAGATAAAAGGAGGAGGTAAAACAACAATAACATTATGATATAACATTGTACCATCTTTAAAAAACCATTAAAAAATGTACAGTGAGTTAATTTCAAAATGTAGGATAGTCTTAGGCTACAGTTTACTCA\n>URS000030206D rRNA from 1 species 
\nGTGGGGTAATGGCCTACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGCGACCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCGACGCCGCGTGAGGGATGACGGCCTTCGGGTTGTAAACCTCTTTCAGCAGGGACGAAGCGCAAGTGACGGTACCTGCAGAAGAAGCGCCGGCCAACTACGTGCCAGCAGCCGCGGTAAGACGTAGGGCGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGCTTGTCGCGTCGACTGTGAAAACCCGTGGCTCAACTGCGGGCCTGCAGTCGATACGGGCAGGCTAGAGTTCGGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGATACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGTTGGGCGCTAGGTGTGGGGGGCCTCTCCGGTTCTCTGTGCCGCAGCTAACGCATTAAGCGCCCCGCCTGGGGAGTACGG\n>URS0000C8846A pre_miRNA from 1 species \nGAATTACTCCCTTCGTTCCAAAATTTTTTGTCTTACATTTATGTAGATATGAATGTATGTAGTCATATTTTAGTATTTAGATACATCCATTTATAGACAAATCTAAGAAAAGAATTTTGGGACGGAGGAAGTACAAA\n>URS0001332FF6 rRNA from 1 species \nTACGTAGGGTCCGAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTTTGTCGCGTCGGGAGTGAAATCTTACAGCTTAACTGTGAACTTGCTTTCGATACGGGCAGACTTGAGGCATTCAGGGGAGAACGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCAGTGGCGAAGGCGATCTTCTGGACGGATACTGACGCTGAGGCGCGAAAGCTAGGGGAGCAAACGGG\n>URS00019FE4B3 tRNA from 1 species \nGGATTGTGGCTCAGTGGCAGAGCACTTGCCTAGCACGCGCTAGGCCCTGGGTTCAATCCTCAGCACCA\n>URS00021AA98B tRNA from 1 species \nGCGGGGTTGCCCTAGCCTGGTAGGGGGCAGGCCTGCTAAGCCTGTGGCCGATTTCGGCCGCGCGGGTTCAAATCCCGCACCCCGCGCCA\n>URS000050F67C piRNA from 1 species \nGCAGAAGCTCCACCACCACAGCAAAG\n>URS000242CB14 lncRNA from 1 species \nCGGCGAAGCTTTTCCGGTGAGTAATTGGACGGCACAGGGACGGTCTTCCGCGGTGGATTTTTCGGCGATCTCTACCGTTTTCCCCCAGAATTTCTCGATGAGAGGAGAGAGGAGGGTTCTCCTCCTTAAATAGGACTGGAGGGAGATCGTTTCCGACTCCGATTGGGAGCCGGCGAGAGGAGGAAGAAGACTCCCTTCGGGAGTCTTCTCCCCTGTTTTCTTCTCTTTTTTTTTTATTTTGGGCTT\n>URS000242DE7D lncRNA from 1 species \nTAAATCATCGAGCTCTTTTTGACTTAGTGTCAATACAATTTTATGAGATAATAATGTCTATTTCCTAAATCGGAAAAACGAAAAATACAAAAATAAAAATTTTTAAATACGATTTCGGATCTTAAGACTCTTTCCTGAATTGTCTTTCGACCTAAAGATAAATCAAGCTAAATTATAAATCAAACAACAATAAAAAAAATAATAAG\n>URS00022EBB93 tRNA from 1 species 
\nGGTGCCGTAGCCAAGTGGTAAGGCAAGGGTCTGCAAAACCCTTATACGTGGGTTCGATTCTCACCGGCACCTCCA\n>URS00019F1EF9 lncRNA from 1 species \nATGGAAATATCTTGGATCAAGTTGGATCCCATTACCTTGAATCATCGACAAATTCTTTCACTTATCGCATTCTCAATCTTTTCTTTATTTTTTATTACAATACATATCGACATGCTTTTGAAAAATATATCATTTACATAAACAGTTAATTTTTTAATATATAACGTGATGTTATCCATTCATCATAATATTTTAACATGA\n>URS0002545815 rRNA from 1 species \nGGCCAGGGAAAAGGACACGGAGGCTGGGACAGCGATGTCCCCGCTCGGGGGCGGCCTGGTGGAGCGGCCGCAGCCGCCCACCTATTCCGAGGTGGGTGCGGCGACTCCCCTATTCAGAGGGGGAGTCGGAGCAGGAGTAGTCGGGGGCTATAAAGCGGTGAGAGAGCGGAGGAGTTACCAGGAGAGACAGCTCCCCCTCTTCGTCGGCTCGGGGGACAGCGGCGGGCGGCAGCGAGTGGCGCCACTGGCGGAGGGGGCACGAGGAGGCTAACCAAGTTGTGGAGGCGGCAGAAGGCGACGATGGAGATGCAGCTGCGCGCGCTCGGCCCTCCGTGGTGTCGTGGCCTAGCTCGGCAGAAGAAGGAGCCTAGGGGCGGCAGCCAGCGGCAGCTAAGTAAGCGGAGGTCGTTGGGGCCGGAGGGGCTCTACGAGAGGGAGAGGCGATGGGGCTCTGGCGACAACTACGGGGACACTAGCTGATGCAGCTGCTGCTGGGAAGAAGGCAAAGTCGCTTCGAAGGTCTACCACCTAGGGACCTTGGTCTACGGTGGCGGCTACCTACGACGATGTACTTCTGGCGGCTGCTGGTACTCATCAATCCTCCAGGGTCCGTCCTCCAGAACGGAGAAGCTAGCAACAACGAAAACACGATCGGAAGAATTCCGTAGGAACAAATTGAATACATATATGAGTCTATAACAACGAAGGCGACTGAGAACACATAGCTCGATACATAAACTCGGGAGCTCCGGGGACCGAACATTATATTTCGAACATAATAAAACTAAACACAGATCTCAACACAACACTATAGAAGGGCACTCAGG\n>URS0002061C56 rRNA from 1 species \nAGTGAACGCTGGCGGTAGGCCTAACACATGCAAGTCGAACGGCAGCACAGTAAGAGCTTGCTCTTACGGGTGGCGAGTGGCGGACGGGTGAGGAATACATCGGAATCTACTTTTTCGTGGGGGATAACGTAGGGAAACTTACGCTAATACCGCATACGACCTACGGGCGAAAGCAGGGGATCTTCGGACCTTGCGCGATTGAATGAGCCGATGTCGGATTAGCTAGTTGGCGAGGTAAAGGCCCACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATACCGCGTGGGTGAAGAAGGCCTTCGGGTTGTAAAGCCCTTTTGTTGGGAAAGAAAAGCAGCAGGTTAATACCCCGCTGTTCTGACGGTACCCAAAGAATAAGCACCGGCTAACTTCGTG\n>URS0000EFE3C8 pre_miRNA from 7 species \nTTAAGGGAGTTATTGACTGGGCTTCCCACCACTTAAACGTGGTTGTACTTGCTTTAGACCTAAGAAAGTAAGTGCTTCCATGTTTTGGTGATGGTATGTTTTCCTTTATATTCATGCCTTT\n>URS00025F4A4B lncRNA from 1 species 
\nTATTTTTTACAATATATTTTTAATAAGAAAACTGTCAGTTTTCTTGTGGGGATTTTTGATGTTTTTATTGTATTAAAAACTATTGCAAATCAGCTTACAGTTTCAATGTAGGAAAAGGGGTCTGGCTCCTTAGGCAGGCCTGATGTGGGCCATAAATATGATACAAATTTTGAGAGCAGAAAAAATCACAGGGATATTTCAAACTTGCTGACTTTGTGTTACCCCGTAGGAAATGAATCTACCAATAATGGGCCTTATTATTCCACCTCCTGTAGACTAACAAGAGCAATTCTGGTTGTTTATTTAGATACACTGATTTTGCAGACTATACCTCGAGATGGTTGAGCTTAATGTGGTCATACTTATTTGACTAAGGGTAAATTTTTAGCTCTGGCAGAGAGCAGATGTAGCTGTCAACAACTTCCAAGCATAGCTGTCTTTAAGGGAGCTCTTTCTATTAACAGCAAACACTCAGTGAATGAGAGGGCAGTACTTGTACAGTGCATGTCCACAGTTACATGCATATGGCAAAGCATACTTCAGCTTTTGGTTTTGAAACTCATCTCCCACTAAGGCCAAAGCCCTGACATCCTTACTGCCGTGTGTCTGGGATTTTGTTTCAGCGTATGTCCAGTCTTATCTTATGAGCTGAACACCTTCAGTATGTATATGTGCAATTAGCAGTTTGTTCTTGCATGGGTCTGTCAGGGCTTGGGAGACATTCGGCATGTGCATGGGTAGGTTCCCCTGGCTTGATTTTTCTCTGTGAGGAACCTGGTTCATATGCATCGGCACTGCTCTGCAGCCAAGCCCTCATCTGAAAGTAATTGAGTGGCTCTCTTCAAACCTGCCTTGTTGCCCCAACCAAAACATTAGTGTGAGCCCAGTCCCTGACAGCTCACTGCGGTTGGCTCTCTGTGGGCTGATTTGCGTGCTGTGTTGACTGAGTTTCCTCTCAGCTCTAAAGACTGTGTATCATTTATCTATTTTTTTTACAGGTGTCATTATGCAAATTATGTATGCATACAAATATAAACACATATACACAAATCTTACGTGGATAAATATGTAAAAACAAACTTCAATTATACCTACAAACATCCATGTATATGTATATATTTGCCATAATATATTATTGCAAAGGTATTATCTCCACAGTTGATGATGGTCTGAATGCCATTGCAGCTACTGTTATTGTCCTTTGGTTGGAGTGATACCCGTCCAGCACTGCCCTTTATTAGAAGATTATCCGAACTTCTCAGTTATGCAAACAAACAAAAATGTATTCTGTAGGTTTGTTACATTGGTCACAATGTGAAGTGCATTTGTATGAATTGAAAGCACATGGGACTGCAAGCTATAGCTACATTACAAGTTTCCAAGGATATACTGCTGTCAATGTCATTTTTTTTAGCAAAAGTATCTTCACCAAACCTCAAACTACACCTCAAGAAGCCAAGAAATAATAATGGTGGTTTGAGGCATGAAACAAAGGATGGTATTGTTGTGTGGAGGAAGCAAGCACAACCTAGGTAGGTAAAGCATGGTAAGTCCAGGTGCAGTCTCACATCAGTGCCTGACTGCCTGCATTCCATTGGCTTCCTTGCTGCATTTATTTCTTTTCCTATGAGATGCCAAAGCCCCAGCCATGCTAGAGTGTGTGTCTAAGCAATGAGCTGCTCTGTTGATTAATCTGCTGTCGCTGTGGAGCAAATTGCTTGGCATGTTTTAGCTGTGACAGGTGGGTTTCTATTAGCCAGTGTTCACGTAGCTTGCACTATCCATCACATAAAGAATCATGTCATGTCAGAGCTGCATTGTGATCATGACAAGAAGACAGATCAGGTATCGTATAGGGGAAATAAAAATACATGCATGGTGCAAATAAAAAAAATCTTTAGGGTTTCTTTGTTTGTTTGCTTTGTAATTAAGAAGACACAGAGATGCAGGATGAAATTGGGAAATAGAAACTGATAACTGAGTTAGAGGGACATGGTT
TTCATCCCAGAGGTTTTTACAGAGTACACAGGGATTAACTGAGTTGTTGAAGCTTGTACTCTCTCTTGCTAATTAAGCCTAAGTTCAATACAGAATAATTGCTTGTGCATTGCAGGTAAGGTGAAGGAGGGAACTCGTTGCTGTTGTGCAGTTCTGCAGCAGGCAAGACCTGAGCTGCATAAAAAAAAGCATTTATCTATGGTAATGTTTTTGTCACCTTTTTGATACTTTAGAAATATTCCTAATTCACTGTCTTCCAGGTAGAGAAGTTATTTCTATTATATAAATGATATTAAATATGTATATTAAAATGTAATGTCCTTTGGACAGTTCTAACTTGTGGGATGAAATGGCAAGGCAGATGGGGAAAATGTCTGTGGGAACAGGGGAGTAACTGGAAGATAAGTGAAAAAAACAGGATCTGACTATTAAAGACATCTGGGAGGTTTGTATGTCTAAAAAATTTGGGGATTTACAATCACAACATGCTATAAAACTGGAGTTGCAAATCAAACTTCTCTTACTTTATATGCCTTGCAGGGGGAGTGAGCCATGTTTTGTGAGTCAAACACAGAACAAAATAGAAACCCCCAAAACACCCCAAGCACACTGGGAAGTCACCCAGAGAGAAGAGATTACGTTTAGAAGAGCTTTTGTTCCCAGTGAGCTAAAGATATTAATACGCATCTGGTATACAATGATATCAGCATACTGAATTGCAGGAAGAGCAGGTTATTGGGGAGTCAGGATCTGTTGTTGAGATTTGTTTGTACTCAGTATTTAGCAAAAAGAAAAGGAATATAATTAGAAGACTGTGAACTGGGGTAAGAGTTGTTTCTTCTAAAGAAGAAACAATGAGGAGAGGATGTCTGCTGAAATAGTCTCTTCATGCAGGCAGCTCAGAGATGTCCACGGAAGGAAATCTGTTCAGTAGCCCATAATCGCTCTGAGTTCCATGTAGATGTTGATCTTTTGTTCAGCTGATTTCCTTTTGGTAGCTGTTTTCTGCTTTGCAATCAAGAGATAGAATAAACGGGACTCCTGCTTTTCCTTATTCTTATCGAACGACAGAGGAATCTTAAGGCCAGGTGTTGGTGTATGCTAGTTGCTCTCCAGGGAACAAAAGCAGCAAGCAGGTGGAGACAGAATGGTTCGCTTCCAAATGTTTCAGAGTTCTTGGGCTTGGGATGTGTTACCTCCTAGCTCAGTTCGACGCAAGGTGGTGGCTTGCAAAAGGAAGCCTCCCATGGCAGCCTTCAGCCAGCATAGCTTTACCAGGCTCCCGTTGAAATGAAGTGAGCGTTTAACTCAGATGATAACTGTGTGTCTTGTGGGTTCCTTCACATCTCCAGTCCGGTTACTGGGAAGTTTTCTCCTCCAACCACCCTTTGACTGTCTATAAATAAGTGTAACAAAAAGGGTACTGAGTACTAATTCACAGTGAATCACAGCTGAACAGTATGATCAGGTGAATCCCATAAAGAGAACTGACAGTGTATTCAGATCGGGTGTTTGCCATTCAAGGATCTGCACCTCTTATGATCTATTTGGGCCCATCTTTCTCTAGCCTTTAGAAAAGACTTCTAGAGTCTTGCTGGTTGTCTTATTAACATGTAGAGATGGCTAACTGGTGAATCACAGCTTCCTTTAAGTAGCCCCTGACATCTGTAGCATTTTGTCAAAGTGTAGAGGGAAATGAGATGAAAGGCTTAAAATGCTGTGTGGCTTTTCCAATTTTAAGTAATGTCAGACATTCTTTGAAGTAATTTGGCCTCTTGTGAAAAATGTTCCCTGTGTTCAAGGGCATCAAAACCAGGCAGCCCTCCTAAAAATAGTACATACTTATTTGTTGAGTTAAAAGTTTCACAGGTATCCTTTTTATGCATCCTACTTTGTTTATCTGTGAAGGTGCTCATTTGTTTGTTTTCCTTGCAAGATTCCTGAGAACGTTCTTATACTTCCAAACCACATTTCTCGAATCTGAGTATGGGAAGGGGGTA
GTACATAGATTACTTGCTGAATATACTAAAACTCAATCATATTTAACTACTTTATGAAGTCTGTTTAAGTTTTGTAACATTTAACTACTTTAATTCTAGGCTAGATCCTCTTTTCTGCTAACTTGTTTTCCTAGTGAAAAAAGAGAAAATAATAGGTGCATTAATTGTTAGTTAAGGTAGCAGGCCATGGTGAACCTCTTAACATTCTCCTATTTTATGAGCATAAAACTTCTATTTTAATAATGCCTTGCAATAAAGGATCTTTTCATGGCAGCTAAATGATGTACAATGGTAATATTTCTACAAGAAAATTAGATTTTGATATTGCCTTGGTTTTCAGTGAAACAAAAGAATTTGTGAAGAACTTGAAAGAGAATACCACTCATCATCATGGACAGCTGATGAAGAAGACGGAACCAGGGAAGAGTGGTTGAGATTCTTTTTTTCTAGTTAAAGGAAGCAGGAGATGTTCTTGCTCTAGCAAACAGCACTGACATGATCAAGAATCTCTGAAAATCCCTGGAGAGATCTCTCCAAGTGAGCATTGAATTAACTTCCTTTCCTACTGTTCCACTCTGTACAAAAGAAGTCCTTCCTTCAAAAGTCCTTGGAATACAATGCTGTGTTTTGTAAGCAGAGTCCAGAAAAGCACAAACACCTCTAACAAAAGAATAGTAAATAATGGCTATTTCTACTCTCATTACCCTGGGCTGCACTTCCTCTGCTATCAGGCACTGTGACAGCAGGGAGGCAGGCATTCTCTTGCTACTTTATGATTCAGTAAGAAAAGGATGAGGTTCCAGAAGTGAAGGATGTAGAAGAGATGACTTCAGTTGGTGCACAAGACATTTATTTCAAGTAGCCGTTTCAGGGCTAAGACTTTGCCCACCATCTTCACCCCCTGCAGTACTCTGGTTTCTGAAACTTCAAGCCTGCTGAGCAAGCCTGTTAGGTTTCACAGAAGGAAAATTCAGATGTGTAGACTCAGGGGAGCTGGGGAGTCCTCTGCAAAGTGGACTTGAAAATACTTCTGCAATTTGCTGAAACAAGTAAACTGAAGTGCAGAAGAGAGGCTGAGACGTGGCAAGGAATCGGTTAATCCTGAAATGTAAAATATGTGAAAAATCTGCACTATTTTGATTTTTAGCATATATGGTATTGCTGGGTTAGGTTTCCTAGGGTTTCATATGTACAAAAAAATCACTCATCACAATACTGTGAAATAAATGCATTTACATGCCATACCAGAATCTGATATTATTTGCCTGTACAGGGTTTCATAAGGTGGACCTCTGTGGAAAATGACTTAAGACTTCCAGCAGTAACTTCTCCTTCTCTCTTGGAAGAGAAAGATATCCTTGTGCTCTTGGTTCTGTGTATTCTGGAGCTTTCCTGTCAGCTTGAGTGGATCAGAACAAGTCTGTCTCCATTGATCAGACTTCTGAAGATTAATGCTCAAACACTGAAACTTTCCCCACGCTGCACTGCTAAATTGATGCAGCAAAACACTTGAACACACACAATCAAACTGAAGTTTAAAACAAGTCACACAGAATTGAGTTTACCTTTGTATTAGTTTAAAATCTGCTTGAAGACCATTATCTTTGTGCATCCTTTCAGGAAAGCTTTATTAGGCACCAGAGGAAATTATTTCTAGACCAGATGTAACCTAAATACACTCCAGGATTGCTGCCCATTAGTTTTTGTTTTTAAAGACTGGAATAGAAAATTAAGTGCAAATGAAATGTTTAGGAAAGTATGACCATAACTACATCAATCTGATTATGCAATTAAATGGCCTTTATAATAATAAAAAAAAGACTGTGCTCTCTAAATGTTAGACATATGCCAGTAAACCAGTTTTACTTTCAGTTGCTGAATAAGAAGCGTGGGAGCGCATTGTTCCATTTCATTTTCTTCTCTGCTGCTTTCTGTTTAAAGTCAGACATAGCGAAAAAAGAGGAGCTCCTCAGTAAGAGCTGTAGTATGGTTTGTCCTTG
ATTTACACAAAGTCAATGTTGCTGTTTGAAACAGTCCCTCAAGTTGTTACTTTTAAATGTTAGCTTTAGCAACTCTAAAATTAGTTTTAGCTTAGCATGGTAACCAGGGGTTATTATTTTTCCCCTTCAATGAGAGGGAGTCTGAATATCAAATTCATACACTTTGGTCCTTCTTTGATTAATGAACAGGCTCTTTCAGTGTGTGGTTTAAAATGCACTTATAAAAATGAATTTTACAGCATTAATTTAAAAAAGTAATATATGAGTATGGAACTCCTGTTTCATCTTCCC\n>URS0001447AD9 rRNA from 1 species \nCACGTAGGGTGCGAGCGTTGTCCGGAATTATTGGGGCGTAAAGAGCTCGTAGGCGGTGTGTCGCGTCGGCCGTGAAAACCTGTGGCTTAACCATGTGGTCTGCAGTCGATACGGGCAGGCTAGAATTCGGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGATATTGACGCTGGAGGAGCGAAAGCCGTGGGGAGCGAACAGG\n>URS00001955B1 rRNA from 1 species \nCGGGGTGCAGCAGGCGCGAAAACTTTACAATGCTGGCAACAGCGATAAGGGGACCTCGAGTGCCAGGATACAATCTTGGCTGTCGCGATGCCTAAAAAGCATTGCATAGCAAGGGCCGGGCAAGACCGGTGCCAGCCGCCGCGGTAACACCGGCGGCTCGAGTGGTAACCGCTATTATTGGGTCTAAAGGGTCTGTAGCCGGCCGGATAAGTCTTTTGGGAAATCCAGCTGCTCAACAGTTGGGCTTTCAGAAGATACTGTTCGGCTCGAGACCGGGAGAGGTGAGAGGTACTTCAGGGGTAGGGGTGAAATCTTGTAATCCTTGAAGGACCACCAGTGGCGAAGGCGTCTCACCAGAACGGATCTGACGGCAAGGGACGAAAGCTAGGGGCACGAACCGGATTAGATACCCGGGTAGTCCTAGCCGTAAACGATACTCGCTAGGTGTCAGCCACGGTGCGACCGTGGTTGGTGCCGTAGGGAAGCCGTGAAGCGAGCCACCTGGGAAGTACGGCCGCAAGGCTGAAACTTAAAGGAATTG\n>URS000146AAE0 rRNA from 1 species \nATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGAGTGGCGGACGGGTGAGTAATGTATGTGAAACTGCCTGGTGGAGGGGGATAACTACTGGACACGGTAGCTAATACCGCATACCATCGGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAAAGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGCACTTTAAGCGGGGAGGCGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCCGCCGCGGTAATAC\n>URS0001DA31B7 rRNA from 1 species 
\nAGTGAACGCTGGCGGTAGGCCTAACACATGCAAGTCGAACGGCAGCACAGTAAGAGCTTGCTCTTACGGGTGGCGAGTGGCGGACGGGTGAGGAATACATCGGAATCTACTTTTTCGTGGGGGATAACGTAGGGAAACTTACGCTAATACCGCATACGACCTACGGGTGAAAGCAGGGGATCTTCGGACCTTGCGCGATTGAATGAGCCGATGTCGGATTAGCTAGTTGGCGGGGTAAAGGCCCACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAGTGGGCGCAAGCCTGACCCAGCCATACCGCGTGGGTGAAGAAGGCCTTCGGGTTGTAAAGCCCTTTTGTTGGGAAAGAAAAGCAGCAGGTTAATACCCCGCTGTTCTGACGGTACCCAAAGAATAAGCACCGGCTAACTTCGTG\n>URS00016B5AE1 rRNA from 1 species \nTACGAAGGGGGCTAGCGTTGTTCGGATTTACTGGGCGTAAAGCGCACGTAGGCGGACTATTAAGTCAGGGGTGAAATCCCGGGGCTCAACCCCGGAACTGCCTTTGATACTGGTAGTCTTGAGTTCGAGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGACTGGTATTGACGCTGAGGTGCGAAAGCGTGGGGAGCAACAGG\n>URS00023938D4 lncRNA from 1 species \nTGGTCTATGTTAGTAGCTTGGACAATCTACATAGTACTTTAAAGAAGTTTTTTAAGTGATGGTTTGGACCGTATGTGGTAACAATTACTCATGATAATGTAACTTATTTGTTGCGGGAGTTAGATGGAACAAGGTTAAAAATACCAATTATAAGGAAGCGAGTAAAAATATTTAAATAAAAATATACGGAAATAAATATAGAAGACCTTATTGAGGACATAGATATTCATCAACAGGAAGATGAATTTGACTTGAATAACAAAAGTGATGAAGAGGATTTGAATGGAAACTTGAAGAACATATTATGAATCAAACAACAACTAGGTGATTTGGTGCATACCATTAGATGCACAGGTTCAGAGGGGATGTATGTCGTATTGTAACATGACTATATGATGAAAATATAAATTAAAAAGATTTTATTAATATTTAGTCATCTTGGATGTTAGAAATAGTGGCCAATTCCAGTACCAATATTCAAGGGCCAGTTAATGTCACTCTATTGTAAGTTATACCACCGTATGTGACATCAGCAATATGCTCTACCAACGTCATCAAATTTAGTATCCTCCATATCAACGGGACAACTAGAATTATTTTCTAACCCTATATGGAACAAGCCTAGTAGGTATGTACCGATGGAGACAACCAATATGCTTGATGGGGGTACAAGAAGACTATTTCGTTGTTTCTATTACAAACAGATTGGTCATTATGCTAATGAATGGTCCAATCCCAGACCCAGTGACAATTGTGCACTAGTGTGTGGGAATTGCAAGCAGTCAGAGCATACTTATTAGCAAAATAATGCTCCGTTCAATTTTAATAATCAAGATCCGCAAATCCAAAGTCAAGAAAGAAATTGAAGAGATAAATGGAAGACTCTAAGATTCTCTGATAAATTGAGTGGAATGTGTCTAAGCCGTTCTTACCGAGAGTCCGCAAAAGGAGATAGGACCAATTCAACAATTAG\n>URS00018A4A88 rRNA from 1 species 
\nTACGTAGGGGGCTAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCAGGTAGGTCTGCTGTGAAAACTCGAGGCTCAACCTCGAGACGTCGGCGGAAACCATCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAGCACCCGTGGCGAAGGCGGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTGGGGAGCGAACAGG\n>URS0000CC585E snRNA from 1 species \nTTGCTTTGGCAGCAAATAACTAAAATTGGAATGATACAGAGAAGATCAGCAGGGCCCCTGAGAAAGGATGACATGCAAATTCACACAGCATTCCATCACAGC\n>URS0001480F9E rRNA from 1 species \nATTGAACGCTGGCGGCAGGCTTAACACATGCAAGTCGAACGAGTGGCGGACGGGTGAGTAATGCTTGGGAATCTAGCTTATGGAGGGGGATAACTACGGGAAACTGTAGCTAATACCGCGTACCATAGGATGAGCCCAAGTGGGATTAGGTAGTTTGTGAGGTAAAGGCTCACCAAGCCGATGATCTCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGGCAATGGGGGAAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTCGTAAAGTACTTTCAGTCGGGAGGCGGTACCGACAGAAGAAGCACCGGCTAACTACGTGCCAGCCGCCGCGGTAATTC\n>URS0001FB3C4B rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACAGACGAGGAGCTTGCTCCTCTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAGACCGGAGCTAATACCGGATAATATATTGAACCGCATGGTTCAATAGTGAAAGACGGTTTTGCTGTCACTTATAGATGGATCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGGCCAGACTCCTACGGGAGGCAGCAGTAGGGAATATTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACAAATGTGTAAGTAACTATGCACGTCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTG\n>URS0000CF422D rRNA from 2 species \nACGGGAGGCAGCAGTGGGGAATATTGCACAATGGAGGAAACTCTGATGCAGCGACGCCGCGTGAGGGAAGAAGGTTTTCGGATTGTAAACCTCTGTCCTTGGTGACGATAATGACGGTAGCCAAGGAGGAAGCTACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTACTGGGTGTAAAGGGAGCGTAGGCGGGAAGGTAAGTTGACTGTTTAAACTATCGGCTCAACCGATAGTCGCGATCAAAACTGCCATTCTTGAGTGAAGTAGAGGCAAGCGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTGCTGGGCTTTAACTGACGCTGAGGCTCGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTA\n>URS0000E65B77 lncRNA from 1 species 
\nCTGATCTCTATTCCCGGATCTGCCTCTGGCTTCCTGCGTGACCTTGGGCTGGTCACCTACCTTTTCTTTTCTTTGGTTCCCAAATTGTAACATGGAAATAATTCTCTTCCTGCGGTGCCTCAGCCCCTGCTGCCTTTAGGGTGGTCGAGATCCTCTGACGGGAGGAAGGTAGCACGTTTCCACTGGAGAAATACTTACCCAGAGCACGGTAATTTGGGGGCGTGTTGGTGTTCACTCGGGTACAGCAGGGTGCGTGCTGCTGCTTGTGCTTTTTTTTTTTTTTAGTAGGCAAACCTGTGGTGGAAGTCAAATTCCGTTTGTGGTGGATGCAGAGCAACGTCAGCTGCAGCGTGCCCTTTCCTCACTAGGAGATGGTTACCTAGCCAAGGTCACTGCTGCTGCATGCCTGTATCACGCAGCGAGCCAGCCTCCTCTTCCTTCCACGGGCGCTGATCTCAGCGAGGCTTCCCCAGAGCCAGCTGCTCCCGGAATAGTTTGGGAATGAAATGTCACCGTTTGAAACTGCTGGATCCTAGCGCCTTCTCCGACAGGACTAGGTCGTATCTGTCTGACAACGCACCTACAGTGACTCTCTTAATTAAGTCTCCCTGCACTGCTGTGAGGGCAGCATTCTGTGTTCCTGCTCCAGCCTACGAGAGCCAGCCATTTCCACGCGGCAGCTCTGCCTCGTAGGCACTAAGAAATGGGCACCTTGAGCTGAAGTGCCATGGTTGTTGTAGTACTACTGGTGTACTACCGAGCGGTCCCGGGCGTGCTGACTGTAGCTGTCGCTGCCCCAGCCTGCTGCCAGAGGTTTGTG\n>URS000031FA0E piRNA from 5 species \nTGTAAACATCGTACACTCTCAGCT\n>URS0001CC563E rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACAGACGAGGAGCTTGCTCCTCTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATATTGAACCGCATGGTTCAATAGTGAAAGACGGTTTTGCTGTCACTTATAGATGGATCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATGAGCAGAAATGGAAAGGAGAAAGCGGAAAGCACAGTCAGGGAGGAACAAGTGGGGAAAATGGGCGAAGGGGGGCAAGACTGAGACAGAAATAAAGAGGGGGTGAAGAAGGTGTTAGGGTCGTAAAACCTGTTTGTTGGGAAAGAAAAGAAGCCGGCGAATACACAGGTGCCGTGAAGGTACCTAAAGAATAAGAAAAGGATAACTTCGTG\n>URS0002428F28 lncRNA from 1 species \nGTGAATAGTGGCCTCCTGGGTAAATGAAGGTGGTGGCGAAATGCGGTCACCTCGCTGCTCCCAAATATGGACCTGCTGCTGGAGCCATCCATAAATATATTGTCCACCCTGATACGGTCATCCCGCTGATAGTGTGTAAGGGACCTATGAAGGCTCCCCTGGTATAGGATGGGGACAGTGAAACTAGCGAAGCACACGCTCTGTGGCATGATACTCAACCATATCAAAGAAGATCATCGGGACCGAGGTGGCCAAAGCAGTCGGTCGACTGAGCAATAATAGGGCAACTGAGCTAGCAACTCGTCGCTGTATGGCGTCCAGATGAA\n>URS000018DC94 rRNA from 1 species 
\nAACGAACGCTGGCGGCGCGCCTAACACATGCAAGTCGAACGAGAATCCGGGGCAACCCGGTAGTAAAGTGGCAAACGGGTGAGGAATACATGGGTAACCTACCCTTGAGAAGGGAATAACCCGCCGAAAGGTGAGCTAATACCCTATACGCTATCTTTTTTTCGAAAAGGATAGGAAAGCCGGGTCGAGGACCTGGTACTCAAGGAGGGGCTCATGTCCTATCAGCTTGTTGGTGGGGCAACGGCCTACCAAGGCTACGACGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGCACTGAGATACGGGCCAGACTCCTACGGGGAGCA\n>URS000019B6AB rRNA from 1 species \nCCGTTGCCGGCGACCGGCGCACGGGTGAGTAACACGTATGCAACCTGCCCGTGGCAGGGGGATAAGCCGGGGGAAACCCGTCTAATACCGCGTAACGCGGCCTTGGGGCATCCCAAGGCCGCCAAAGGGAGCAATCCCGGCCACGGATGGGCATGCGGCGCATTAGCTAGTCGGCGGGGTAACGGCCCACCGAGGCGACGATGCGTAGGGGTTCTGAGAGGAAGGACCCCCCACACTGGTACTGAGACACGGACCAGACTCCTACGGGAGGCAGCAG\n>URS000060EFE9 rRNA from 1 species \nAGTGATTTTAAGTCATGCAAGTCGAACGAACCTTGTGTTCGTGGCGAACGGCTCAGTAACACGTGGATAACCTGCCCTTGGGACCGGGATAACCCCGGGAAACTGGGGATAAACCTGGATAGGTGATGCGGCCTGGAATGGTGCTTCACCGAAACACCCCTCGGGGTGCCCAAGGATGGGTCTGCGGCCGATTAGGTAGTTGGTAGGGTAACGGCCTACCAAGCCCATCATCGGTACGGGTTGTGAGAGCAAGAGCCCGGAGATGGAACCTGAGACAAGGTTCCAGGCCCTACGGGGCGCAGCAGGCGCGAAACCTCCGCAATGCACGCAAGTGCGACGGGGGAACCCCAAGTGCCACTCTTAACGGGGTGGCTTTTCAGAAGTGTAAAAAGCTTCTGGAATAAGGGCTGGGCAAGACCGGTGCCAGCCGCCGCGGTAACACCGGCAGCTCAAGTGGTAGCCGCTTTTATTGGGCCTAAAGCGTCCGTAGCCGGTCTGATAAGTCTCTGGTGAAATCCCGCAGCTTAACTGTGGGAATTGCTGGAGATACTATCATGACTCGAGGTCGGGAGAGGCTGGAGGTACTCCCAGGGTAGGGGTGAAATCCTGTAATCCTGGGAGGACCACCTGTGGCGAAGGCGTCCAGCTGGAACGAACCTGACGGTGAGGGACGAAAGCCAGGGGCGCGAACCGGATTAGATACCCGGGTAGTCCTGGCCGTAAACGATGTGGACTTGGTGTTGGGATGGCTTCGAGCTGCCCCAGTGCCGAAGGGAAGCTGTTAAGTCCACCGCCTGGGAAGTACGGCCGCAAGGCTGAAACTTAAAGGAATTGGCGGGGGAGCACCACAACGCGTGGAGCCTGCGGTTTAATTGGATTCAACGCCGGACATCTCACCAGGGGCGACAGCAGTATGACGGCCA\n>URS000043FDF3 rRNA from 1 species 
\nAGCAGCCGCAGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAATTTCAGGCCTGGCTGGACGGTCCGCCCTTCGGGTGAGTACTGTCTGTGGTCGGGTCCTACCTTCTGGCGAAGCGTCATGGCCTTAACCGGCCGTGGCGGGGAACCAGGACTTTTACTGTGAAAAAATTAGAGTGTTCAAAGCAGGCAAATCGCTTGGATACATTAGCATGGAATAATGGAATAGGACAATGGTTCTATTTGTTGGTTTCTAGGACCGTTGTAATGATTAATAGGGATAGTTGGGGGCATTAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGGAATCGGGCGATGTTGAAAAAATGACGC\n>URS000076D469 rRNA from 1 species \nACGGAGGATGCAAGCGTTATCCGGATTCATTGGGTTTAAAGGGTGCGCAGGCGGAATGATAAGTCAGTGGTGAAATCCTACGGCTCAACTGTAGAACTGCCATTGATACTGTTATTCTTGAGTACACTTGAAGTGGGCGGAATGTGTCATGTAGCGGTGAAAAGATTAGAGATGACACAGAACACCGGTGGCGAAGGCATCACACTAAATTGTAACTGACGCTGGTGCGCTAAAGTGTGGGGATCAAATAG\n>URS00025935AF lncRNA from 1 species \nTTAAAATTAGCTAAAATTTGGTATGGAGCAGGTTAGTAAGTAAAGCAGGAATGCAGAGTTGCTTAGGCCGGTATGGAGCAGGTTAGTAAGTAAAGCAGGAATGCAGAGTTGTTATGGTTGGTATGGAGCGGGTTAGTAAGTAAAGCAGGAATGCAGAGTTGTTCAGGTTGTGTGATGCTTTTGTGTAATACCTCTTTAATTGGAACTCAACTGCAGAATTTTCTGAGGGCAGGAACAGTAAGTTTCACCTCCTATTATATTGGAGTGAAATCAGTGGACTGTATCTTTAAATAATAATCAGGAAAATGCCAAGTTAGTTCCAACTTGAATTTTAATAATGAAGTTTTAGCCTTAGCAGCAATCCTTATTTGTCAACAGAGAGTTTAAAGAAATTAAATACTATAATTAATTGATATGACTTGCTTTCCTTGACAAAAGATTTACTTAACTTAGAAGCACTCTGGCACTGGAAGGGTTAATTCACCCAATGGAGGAAGAGGAAGGAGTCTCTTTTAACAAACTGCAGTTTAGTAGTGAGAGAAAGGAAGTCCGTTTGTCCAAGCCGAGGTCTGAGAGAGGAGAAGGTAGAAATCCGTTTACAAGCCGAGGTCTGGGAGAGGAGAAGGTAGAATTCCGTTTATAAGCCGAGGTCTGAGAGATGAGAAGGTAGAATTCCGTTTACAAGCCAAGGTCTGAGAGAGGAGAAGGTAGAAATCCGTTTACAAGCCGAGGTCTGAGAGATGAGAAGGTAGAATTCCGTTTATAAGCCGAGGTCTGAGAGATGATAAGGTAGAAATCCGTTTACAAGCCGTGGTCTGAGAAGTGGAGCCGGTAGCATCGAGTAGAGCAGCTGATCTCACTGCCGCACCTGAGTGAATAATCCAGCACTTTGAATCTGGCGCGGTCTTCCTAAGTATCGTGGAAAGACCGCGTCAGAAAAAAGGGGCGGAGCTAAGTGCCGTGAACCCGGAAGTGGGTTCCGGCGGCAGCATGATTGTTAGGTATACCTGACAGTACCCCCTTCTCATGGGGCATCCTCTGGGTGCACTTATTTCGGTTTAAAGGGGTAGCGTTTGTGAAAAGCATCAACTAATCTCTTAGCATGAACATTAGATGAATCTTCCCAGGTATCTTCATCTGATAAGGTATTGTAAAGAGCCAC
GGTGGATACAAGAATCCAAAATCTTATGAATTTCATATTCTTCTTCACCTTGGACGATGATAGGTTCAGGAGTTGTTACTATTTCTCTATGGAAAGGATCAGGGATGTGTGGTTTAAGCAAAGAGACATGGAATACTGGATGAAGTTTAAAACTTGGAGGAAGTTTTAATTTAACAACGTTATCATTGATGATTGTAGTTATTTGAAAAGGACCAAGAAAAAGAGAGCTCAATTTCTTTGAAGGACGGTTTGTGGTAATATTTTTTGAAGAGAGCCAGACAAGATCCCCCACTTTATAAGGAGGGGGAATTCTTCTATTATGGTCAAAAAACTTTTTCTGGTAGTTTTGGGCGAGTTGAAGATTCTCCCGTAATTTAAGGAATAGAGAAGACATAAATTCATTTTTTGAAGTAACCGTGGGATTGGATGAAGAATTAGATGGGATGGGAAATGAGGACGGATGAAAACCATAGTTGGAGAAAAAAGGAGTCATTTTCGTACTAGAATGAATGGTATTATTGTAAGAAAATTCAGCCATAGGTAACAAAGTGGTCCAGTCATCTTGCAGGTATGAACAATAACATCGGAGATATTGTTCCAAACATTGATTAACTCTCTCTGTTTGCCCATTAGTTTGGGGATGATAGGCAGAAGAGAGTTTGCGTTGAATTTGAAGAGAGAGACACATCTCTTTCCAGAATTTGGAGGTAAATTGTGTCCCCCTATCAGAAATAATTTCTTCTGGAAGACCATGAAGCTTTACAATATTATCAATAAAGACTTTGGACAATTCTACGGAGGAGGGTAATTTTTTTTTAAAGAGATGAAATGGGACATTTTAGTGAAGCGGTCCACAACAACAAGAATAGTGGTGAACTGTCGGGATGGAGGAAGGTCAACAAGAAAATCCATAGAAATGGATTGCCAAGGTTTTTCTGGAATAGGTAAGTTAAGTAGTAATCCAAAAGGTTGGTTATGTTCAGATTTGGACCTTTGACAGATAGGACAAGTTTTGACATATAATTCAATTGTTCTATCTTGGCGAGGCCACCAATAATATCGTGAAGTTAGTTCAAGAGTTTTCTTTATTCCAGGATGTCCAGCTAGGGGTGAATCATGAACCATTTTGAGTAATTTGTTCCTAAGAATGGGAGGAATATAAATTCAATTTTTAAAGTAAAATATACCATCCTTTTTTGTTAAATTAGGTGTTTTGGGAAGTTCAAAATCCTTTTGATTCAAGTTCCTTAAGTCATCCTGAAGAGAAGAGAGGATCCCTATTATTTTGTTAGGAGGATAAACATCAATAGAAGTTTTAGAAGGAATTCGAGAAAGAGCGTCAGCCTTTTTATTTCTAGTTCCAGGTCTGTATATTAATTGGAAGTTAAACCGGTTAAAAAATAGGTTCCATCTAACTTGTCTAGCCGTAAGGGTTTTATTAGTATAGAGATATTCAAGATTTTTATGGTCTGTATAGACTATGATAGGTTGATTTGTATCTTCTAATAGATGGCGCCAATTTTCAAAGGCAGCTTTAACACTTAATAATTCCTTTTCACCAATAGGATAATTTTTTTCAGCAGAGCTCAAGGATCTTGAAAAGAATGCGACTGGATGAAGTGGATCTTGAGGAGTCTTTTGCTGAGAAAGAACTGCTCCGATAGCTGAATCTGATGCATCGACTTCTAGGACATACAAGAATGTTGGATTAGGTAGCTGTAGAATAGGTGCAGTTGTAAATCATTTTTTTAAACTGTCGAAGGCAGCTTGTGCATCTTTATTCCATTTGAAAGGACGTTTAGTACTGTTAAGGAGGTTAAGTGGATGTGATACCTCTGAATAGTTTCTAATGAATTTTCTATAGAAGTTTGCAAATCCAAGAAATCGTTGCAATTCTTTTGTAGTAGTAGGAACGGGCCAGTTAATAATACATTCGATTTTAGAGTTATCCATTTTCAGAGAATGAGGTGAAATAATGTATCCAAGAAAGGAGAGTTCAG
TAACTTCAAAAAGACATTTCTCTGGTTTAGCGTATAATTTGTGAGTTCTCAATCTAGATAGAACACATCTTACATGCTTCCTATGTTCATCCAAATTGTTAGAATATATTAGAATATCATCTAAGTAGATAATAACACAAACATCTAAAAGATCTCTAAAGATATCATTTATAAAATGTTGGAATGTTGCAGGGGCATTACAAAGCCCAAAAGGCATCACTAGATATTCGTAGAGACCATATCTAGTCCGGAAGGCGGTCTTCTATTCATCATCCTGTTTTATTCTAATGAGGTTATATGCGCCTCGGAGGTCGAGTTTAGTGAATATAGTTGCAGTTCTTAACCTTTCAATTAATTCATTTATTAGTGGAAGAGGATAACGATTTTTTATGGTTATTTTATTTAAGGCTCTGTAATCTATAATGGGTCGGATGGTTTGGTCCTTATTCCTCACAAAAAATATACTAGAGGCAGCCGGTGAAGTCGAGGGTCTGATGAATCCTTTACGTAAATTTTCATTAAGATATTCTTTTAAGGTCTGTAATTCCTTTTCAGAAAGTGGATAAATGTGTCCATAAGGAATGGGAGCACCAGGTATTAGATCTATTGGGCAATCATATGCTCGATGAGGTGGAAGTGTTTCCGCTTCTTTTTTACAAAAGACATCTGAAAAGTCAGAGTAGAATGGAGGTATAATTGATTCCTGAGTAGTTTGGAGAATAGGAATATGTTGGTTCCATTGAAATTGGCTGGATTATTCTGTGATGCTTTTGTGTAATACCTCTTTAATTGGAACTCAACTGCAGAATTTTCTGAGGGCAGGAACAGTAAGTTTCACCTCCTATTATATTGGAGTGAATTCAGTGGACTGTATCTTTAAATAATAATCAGGAAAATGCCAAGTTATTTCCAACTTGAATTTTAATAATGAAGTTTTAGCCTTAGCAGCAATCCTTATTTGTCAACAGAGAGTTTAAAGAAATTAAATACTATAATTAATTGATATGACTTGCTTTCCTTGGCAAAAGATTTACTTAACTTAGAAGCACTCTGGCACTGGAAGGGTTAATTCACCCAATGGAGGAAGAGGAAGGAGTCTCTTTTAACAAACTGCAGATTTAGTAGTGAGAGAAAGGAAGTCCGTTTGTCCAAGCCGAGGTCTGAGAGAGGAGAAGGTAGAAATCCATTTACAAGCCGAGGTCTGGGAGAGGAGAAGGTAGAATTCCGTTTATAAGCCGAGGTCTGAGAGATGATAAGGTAGAAATCCGTTTACAAGCCGAGGTCTGGGAGAGGAGAAGGTAGAATTCCGTTTATAAGCCGAGGTCTGAGAGATGATAAGGTAGAAATCCGTTTATAAGCCGAGGTCTGAGAGATGATAAGGTAGAAATCCGTTTACAAGCCGTGGTCTGAGAAGTGGAGCCGGTAGCATCGAGTAGAGCAGCTGATCTCACTGCCGCACCTGAGTGAATAATCCAGCACTTTGAATCTGGCGCGGTCTTCCTAAGTATCGTGGAAAGACCGCGTCAGAAAAAAGGGGCGTAGCTAAGCGCCGTGAACCCGGAAGTGGGTTCCGGCGGCAGCATGAATGTTAGGTATACCTGACAGGTTGGTATGGAGCGGGTTAGTAAGTAAAGCAGGAATGCAGAGTTGTTCAGGCCGGTATGGAGCAGGTTAGTAAGTAAAGCAGGAATGCAGAGTTGTTATGGTTGGTATGGAGCAGGTTAGTAAGTAAAGCAGGAATGCAGAGTTGTTCAGGCTGGTATGGAGCAGGTTAGTAAGTAAAGCAGGAATGCAGAGTTGTTATGGTCGGTATGGAGCGGGTTAGTAAGTAAAGCAGGAATGCAGAG\n>URS0001BC7D2F tmRNA from 13 species 
\nGACGGGAUUUGCGAAGCCCUAGGAGCAUGCCGAGGGGCGGUUGGCCUCGUAAAAAGCCGCAAAAAAAUAGUCGCAAACGACGAAAACUACGCUUUAGCAGCUUAAUACCCUGCUUAGAGCCCUCUCUCCCUAGCCUCCGCUCUUAGGACGGGGAUCAAGAGAGGUCAAACCCAAAAGAGAUCGCGUGGAUGUCCUGCCUGGGGCUGAAGCGUUAAACUCAAUCAGGCUAGUCUGUCAGUAGCGUGUCCAUCCGCAGCUGGCCGGCGAAUGUAAAGAUUGACUAAGCAUGUAGUGCCGACGGUGUAGUAAUUUCGGACGGGG\n>URS00004B6BEF rRNA from 1 species \nCACGTAGTTAGCCGGTGCTTTTTCTGCAGGTACCGTCACTTTCGCTTCTTCCCTACTAAAAGAGGTTTACAACCCGAAGGCCGTCGTCCCTCACGCGGCGTTGCTGCATCAGGCTTTCGCCCATTGTGCAATATTCCCCACTGCTGCCTCCCGTAGGAGTCTGGGCCGTGTCCCAGTCCCAGTGTGGCCGGTCACCCTCTCAGGCCGGCTACCCGTCGTAGGCTTGGTGAGCCATTACCTCACCAACTACCTGATAGGCCGCGAGTCCATCCTTGACCAAAATTCTTTCCACAACCAGACCATGCGGCCAGCTGAAATATCCGGTATTAGACACCGTTTCCAGTGCTTATCCCAGAGTCAAGGGCAGGTTACTCACGTGTTACTCACCCGTTCGCCACTAATCCACCCAGCAAGCTGGGCTTCATCGTTCGACTTGCATGTGTTAACGCACGCCGCCAGCGTGTCCTGTAGCCAGGACGTCAAACGTCT\n>URS00023C0FDA lncRNA from 1 species \nGGAAATTAGAAATTAAAACTGTCACTAAAGGGCCCTATAGCGACAGAACCGTCGCTACAGGTGTTCTTGGTGTTCTTGATGCCTGCCCAGATCTTCAAGTCAGTGAACAAGGTAGGTGGTTTGACCGGATATAGATCTTTGGTCCTTACGTTTTCTGGGCTGCTAAAGTGTTAAGATTGTAGTACTTATGTAGTACTACAACTACAAACGACTGTCATGGCCATCATGCATCTAAACAGAAAGTTATAGGCCATCAAAATCCTTGTCAGACATGTTCTTCATTTTCTGGGTTACCCAGAAAATGAAGAACAGTCAAGGTACCTACTTTGGATCCTTATAGTTTGCAGTATAGGTCTTGTTTGTATAATATAGTGGTTCCATCATGTAGAAATAATGTCAGAGTACAACTACATACCCTCATATAAGTCTAATCAACATTACAGATGAGAGATTAAGGCCGGTCAAAGT\n>URS000109A09B rRNA from 1 species \nTACGTAGGCAGCGAGCGTTGTTCGGAGTTACTGGGCGTAAAGAGTGCGTAGGCGGTTTTCTAAGTTTGGTGTGAAATCTCCCGGCTTAACTGGGAGGGTGCGCCGGAAACTGCGAGGCTAGAGTGTGGGATGGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCTGCGGTGTAGACGGCTCTCTGGACCACTACTGACGCTGAAACACGAAAGCGTGGGTAGCAAACAGG\n>URS0000E5769B tRNA from 1 species \nAGCTCCGTGGTGAATAGATCATGTTGAATTGCAAATTCAAAGAAGCAGCTTTAACGCTGCCGGGGCTTC\n>URS00026126AE lncRNA from 1 species 
\nCCACAATGATGTTTTAGGGGCTCTGTTTTTTGTTGAGGCTTAAAATACTGTACTATTTGTTGATATATTTCAGACCACTGCGCCCCCAACCCGTGCCAGAACGGCGGTACGTGCCAACCATCAATCTGGCCCCACGAGCCCCACCTGATCACCTGCCAGTGTCCACCTGGGTTCGAAGGTCCTCTGTGTCAGTACACAGCTCTAGATCCTTGTAGTCTGCCTCTCAGCACAGGTTCTTGCTCAAGCAGAGAGTCGAGATGGTACTTTAACCAGCTCAGCGGACGATGTCAGAAGTTCACATATCTTGGTTGCCATGGCAATGCAAATAACTTTGCCTCCATTTTTGAGTGCCAAGAGAGATGCATCAAAGGATCATGCTGTACCCGCACCCCAAAAATTCGTAGTCAGAACATTGGATTTGACAGTCAAGGATATGATAAGTATGTCTGACTTTTTTTATGAGTTCTTCTGTGTCATTTTGTTGTTGGCTTATCATTGTGTTCACCTGTTTCAGTTGAAATATCTGCTGCATGAAAAAATAGAGGATGCAAAACAATTTTTGTGGTCTGTAATTTTTCAAAGTCCTCTGGGTTTTAAAAAAATAATAATTTAGGCGCAGTTTTCTTTGCTGTTTCTTCTTGAACACGTACAGTTTATTATAGTAGAACAGCCAAACCTGCCGTGATGGTCACCTGTTCTTGTTAAAAATAGATGGGTATTTTTTCACTAATCAACACGCTGTATGATGATACCAATAGCTCTAGCTATATGTCCAAATATTGATGAACGCCTGATTTCACCGCATCGTGACACATATTAAAATGATTCTGTCATAGAGGATGGCCTGTCTGAGATGACCACTTTTCTTCTGAGCATTGGGTGGTTATCTTGTAGGCCTACATTTGATAATACTTATATTTAAGAACTTGGTACCAGTATGCTGAAGTATGAATAAAGTAGTTCAATGTAATATACTGGTATACTACAGTACGAAAGTAGTCCAATATAATATTTTGGTAAGCTAAAATACGGAAATAGTCCTACATGATATTTTGGTAATCAAAAGAAATGGAAGTTGTGCTACACAATATTTTGGTAATCAAAAGTATCTCAAAATTCATCATTACTTTCCATTAGCTTTGAGTTTGTCTCATTCTGACTTGTTTGCTTGTCCCTTCTCAGTTGTGTTCAATTGTCTCGTGATACAGGTATGGATTCAATCAAGAGGGACTGAACAGATTTGGGGACAGGAGAAATGTTGACAACAGCTTCCCACTCAGTACCCGTCGCTTTGACGAGTCCGGTCTGGACTGGCAAGGTTATAACAGAGAGGGCTATGGTGAAGATGGCTTGAGCAGAGCTGGCTTTGACAAGTACGGCTTTGATGTGGACGGCTTCAACATCAGTGGGTACAGCCGTAGTGGAGAGTTTGACGGGATCATTGACTATGATGAAGAAGGATATGATCCTGAGGGATTTAACAGGTAATTCTTCCTTCTTTGTATT\n>URS0001321690 rRNA from 1 species \nCCCTTAGATGTTCTGGGCTGCACGCGTGCTACACTGATATTGCCAATATGTCATTCTTATCCGAAATGGATTGGGTAATCAAGTAATGAAATTTCATGCTTGGAATCGGTAATTGCAATTTTATCGTGAACGAGGAATTCCTAGTAAGCACTAGTCATCAGCTAATGTTGATTATGTCCCTGCCCCTTGTACACACCGCCCGTCGCTACTACTGATTGGGTGTTCAAGTGAGATGCTTAGACCCTTGTTGCATGGTTCATTATTGTGCTCCGAAAGGAAAAAGTTTCAAGCTTGAGTGTCTAGAGGAAGTAAAAGTCGTAACA\n>URS00004F4253 rRNA from 1 species 
\nGATGAACGCTGACAGAATGCTTAACACATGCAAGTCGATTCGATTTACCTTCGGGTATTGAGGATGGCGGACGGGTGAGTAACGCGTAAGGAACTTGCCTCTTGGTCTGGGACAACTGTTGGAAACGACAGCTAATACCGGATATTATGAGATTCTCGCATGGGAAACTTATGAAAGCTATATGCGCCAAGAGAGAGCCTTGCGTTCCATTAGCTAGTTGGTGGGGTAACGGCCCACCAAGGCGACGATGGATAGCCGGCCTGAGAGGGTGAACGGCCACAAGGGGACTGAGACACGGCCCTTACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGACCAAAAGTCTGATCCAGCAATTCTGTGTGCACGATGAAGGTCTTCGGATTGTAAAGTGCTTTCAGTTGGGAAGAAGAAAGTGACGGTACCAACAGAAGAAGCGACGGCTAAATACGTGCCAGCAGCCGCGGTAATACGTATGTCGCAAGCGTTATCCGGATTTATTGGGCGTAAAGCGCGTCTAGGCGGAAAAATAAGTCTGATGTTAAAATGCGGGGCTCAACTCCGTATTGCGTTGGAAACTGTTTTTCTAGAGTACTGGAGAGGTGGGCGGAACTACAAGTGTAGAGGTGAAATTCGTAGATATTTGTAGGAATGCCGATGGAGAAGTCAGCTCACTGGACAGANACTGACGCTAAAGCGCGAAAGCGTGGGGAGCAAACAGGANTAGATACCCTGGTAGTCCACGCC\n>URS00003E0BF5 rRNA from 1 species \nGCTCAGAAACTTAAATGACTTGAGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCTGGGCTCAAATGTATGTTGACGTATTCTGAAAGGGATACTTCTTCGGACAATATACAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCGGGTTAAGTCCCATAACGAGCGCAACCCCTATCATTAGTTGCCATCAGGTCAAGCTGGGGACTCTAATGAAACTGCCTACGCAAGTAGTGAGGAAGGTGGGGATGACGTCAAATCAGCACGGCCCTTACGTCCAGGGCTACACACGTGCTACAATGGCCGGTACAAAGGGCAGCTACCTGGTGACAGGATGCTAATCTCAAAAGCCGGTCTCAGTTCGGATCGGAGTCTGCAACCCGACTCCGTGAAGCTGGAATCGCTAGTAATCGCGCATCAGCCATGGCGCGGTGAATACGTTCCCGGGCCTT\n>URS0001224666 rRNA from 1 species \nTACGGGGGGGGGCAAGCGTTGTTCGGAATTACTGGGCGTAAAGGGCTCGTAGGCGGCCAACTAAGTCAGACGTGAAATCCCTAGGCTCAACCTAGGAACTGCGTCTGATACTGGATGGCTTGAATCCGGGAGAGGGATGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAATACCGGTGGCGAAGGCGGCATCCTGGACCGGCATTGACGCTGATGAGCGAAAGCTAGGGGAGCAAACGGG\n>URS000137232C rRNA from 1 species \nTACGAGGGGGGCAAATGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGCGGCGCGGTAAGTCGGGTGTGAAATCTCGGAGCTTAACTCCGAAACTGCATTCGATACTGCCGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCGGTGAAATGCGTAGATATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACGCTGAGGCACGAAGGTCAGGGGAGCAAACGGG\n>URS00009BFC8A lncRNA from 7 species 
\nCACAAAGAGAAGCTTTAAAAATCTTGCCTTCTGCCCCCTCAATTTCTTCTCCCTTCCTTCTCTATTTCCCACTGGTTTAGCGTGCCTGTCTCTCCCATTTTACCCTGCTTCAATCTCCTCCCAGTTGCTTCTGCTAGAGTTGCCTTTTGTCCTCTCACATCCCTAGGTCATCCTTGTTAGGGCTCTCCTGGCCTGGTTCCTTGTCCGCTTGAATTCCAGGGAGTGTTACAAGGTTTGGAGGTTTTTGCTTTACACATGGACCCAGAAGGAGCTGCAGCCTACAGGCCTCTCCCAAGAAGGCCTTTTCTCTGCCTGACTTTGGACTTCTCCCCAAGGTCAGGACAGTGTCCAGATGGCCCTGCTGCAGAATCTTTGCCTCCACTTCCTTCATCAAGAGGCTGTAGGTACATCTTGAGTTCATCTTGTGTCCTTCTGAAGCATTGCAGAGGGCAGCGGCTGCCTGGCATGGCACCGGTCCTGGGCATCACCCATGGGCCACCAGTGTTTTAGGGAGTGGAGAGCCTGGCTTGGGCAAGGACCTCAG\n>URS000260A6B2 lncRNA from 1 species \nTAAGATCTGGTGTACCAGCCATTACCCAAGTGTTAAGGTCTGGTATATCAACTATTCCCCAAGTGTTAAGGTCTGGTGTACCAGCTACTACCTATTGTTAAGGTCAGGTATATCAACTATTACCCAAGTGTTAAGGTCTGGTATATCAAGTATTACCCAAGTGTTAAGGTCTGGTATATCAACTATTACCCAAGTGTTAAGGTCTGGTGTACCAGCTACTACCTATTGTTAAGGTCAGGTATATCAACTATTACCCAAGTGTTAAGGTCTGGTATATCAACTATTACCCAAGTGTTAAGGTCTGGTATA\n>URS00002A34A8 rRNA from 1 species \nGATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGACCTATGTTGAAACCTAGTGATATATAAGTTAGTGGCGGACGGGTGAGTAACGCGTGGATAACCTGCCATATACAGGGGGATAACACTTAGAAATAGGTGCTAATACCGCATAAGCGCACAGTTTCGCATGAAGCAGTGTGAAAAACTCCGGTGGTATATGATGGATCCGCGTCTGATTAGCTTGTTGGCGGGGTAACGGCCCACCAAGGCGACGATCAGTAGCCGGCCTGAGAGGGTGAACGGCCACATTGGGACTGAGACACGGCCCAA\n>URS0000F20FBF rRNA from 1 species \nCACGTAGGGCGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTCTGTTGCGTCCGCTGTGAAAACTCGGGGCTTAACCCCGAGCCTGCAGTGGATACGGGCAGACTAGAGGTAGGTAGGGGAGAATGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAAGAACACCCGTGGCGAAGGCGGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTGGGGAGCGAACGGG\n>URS000118C396 rRNA from 1 species \nTACGTAGGAGGCGAGCGTTGTCCGGAGTTACTGGGCGTAAAGGGTGCGCAGGCGGTGGCCCGCGTGGGCGGTGAAAGCTCCTGGCTCAACTGGGAGAGGGCCGTCCAGACGGGGTCACTTGAGGGGCGGAGAGGGGCGTGGAATTCCGGGTGGAGCGGTGAAATGCGTAGAGATCCGGAGGAACACCAACGGCGAAGGCAGCGCCCTGGACGAGACCTGACGCTCAGGCACGAAAGCTGGGGGAGCAAACAGG\n>URS00013DEF05 rRNA from 1 species 
\nTACGTAGGGTGCGAGCGTTGTCCGGAATTACTGGGCGTAAAGAGCTCGTAGGTGGTTTGTCGCGTTGTCCGTGAAAACTCACAGCTTAACTGTGGGCGTGCGGGCGATACGGGCAGACTGGAGTACTGCAGGGGAGACTGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCTGGAGGAATACCGGTGGCGAAGGCGGCATCCTGGACCGACATTGACGCTGAACGGCGAAAGCTAGGGGAGCAAACGGG\n>URS000057D191 piRNA from 1 species \nTCTATTAGGAGCTGTCAGGTGTGTT\n>URS0002185586 lncRNA from 1 species \nTAACATGGTAGGAGCACAGGTTTTTGGGAATATGTGGAAACAGACTCTGTTTAGCAACCATAACCATTTTGACTTCAACTGTGAAGATAATGACAGACCGTAAAGGCCACACATTACCCATGTGAACTATCGTATGCTGCGTGTCATAAGTATGACGTTGACCTCCTGAACTCTCGGTTCTGTGTTGTTTGCGTTGCAGAGAATAAGGCAGTTGGAAGACATGATTGAGATGCAAAAGAGACAAGTAAAGGAAATAGAAGAAAAGTTTTTGTTCCTCTTCTTGTTTTTCTCTCTAGCTTTTATTCTTTGGCCTTAATGACACTGACATGGACCGACAACAGGTGCTAAGGTGCTCAGGTGGAGAGTGAGGAAGAGAAACACAACATTTTTTTTTTTTTTTTCATGCATTTATAGATGGTTCACAAACCTTATATGGCCTTTTTGATACACGTGCACTTTTGTGGAAAACATTTACCTGGAATGCAAAACAAAACCAGGACTTTGAAAAGTGAACAAATATCAGAGACATGTAAAAGAGGTATATCAGAGATTTTTTTTATTTTTTATAACGGAAATGTCCCCTACCATTTTTGGAAGTGGAACATTTAGCCAAACTCTAATGTGAGTTCTAAAAAGCAAGAACATTGTAACTGGAACTCTGAAGCAGGTCAATAAAGGAACAGAGCAACTGAGATGGAGACAGTGCCTCAGATGGATTTAGAGCCAGACAACGAAAGAGTGCAATCGTAGAGGAGGAGGAAGGAGGAGGAAGGAGAAAGAGTTGATTCAAAAAAGCAGGACGATTTCCAAACAGACGAGCCAAGTCCTGGGCATTCCCAGAAAGCTCAGTGCAGGAGGGTCTCCATGGAAACAGCTGGCGAAACGGCTGTCATGGCCAAAGTTCAATGAGCAAGAAGTGAAAGCTTTGTACTCCGGAGTAGAGCGACACCAGAGGACTACGGGGACAGAATGTGTCACCGGTCTGTGAAACACAAAGAATCCTCAATAGCTGTGACCTCCAGGTTTTGACCCATAGAGTGAACCGTCTAGAGCACAGCCTGAGAGACAACGTCAGCTCCTTTACTGAGTCTGAGAGCTTGCTGCACAACAGAGAGTTGGAGGTGCCAGAGCAGAGCCTGCTACAGAAGGTGGAGGACCTCACAGCACACTCAGTCCTCCACTGTCCCAGCATGCAGCGACGCCAGAGGCTGGACGAGCGGCTCCACGCGCTCAGGGAGGAGGTGCGCTTCATGGTGAGTAGAGACTGTACTGAGCTTTACATTAGCTTCAATGAGGCTTATAGAGTGAGAAGTACTCAAATGTACATGTCATGTAAGCTGTACTGTAAATTGTAGTATAAGCCTGTAATTATTGTGTAAGTGTAATTATTGTGTAAGTGTATTGTGAGTGTGGTTTAAATCTATCGTTTCTCAGGTGTAGTGCTATTGTGACTGTAGTCTCCCTCTCTGTTGCATTATATGAGATGTGTATGACATTACTCAGATGTGAGGAGTAACTGTGTCATAGTTCTATCATGACCGGTCCTTCCCAGTACCAGGAGAAGGAGCATAGGAATCGTGTGTGTGGAGGGAGAGGCTACAGTGCTGCCAGGCCCAGC\n>URS0000A07E96 
rRNA from 1 species \nCACGCAGTAAACGATGATTACTAGTTGTTTGCGATACACAGTAAGCGACCGAGCGAAAGCATTAAGTAATCCACCTGGGGAGTACGTTCGCAAGAATGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGAGGAACATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCCGGGCTTGAAATGCAGATGACAGGGGCAGAGACGCCCCCTCCCCTCGGGGCATCTGTGTAGGTGC\n>URS000257F2CE snoRNA from 1 species \nGTTGCTTCATAATGGTGAAATCTCTCAAAATCGAATGAGAGAATCTCAAGTTTCCGGAGCATAGATTAAGCATTCTATCACCAGTATTAAACAGCTCGGTGCGTATACAATCGCAT\n>URS000210DF6D rRNA from 1 species \nAATTAATGAATTAATTATAATTAGTTAAATTTTATATGAAGTTCAATATTAAGTTTAGAAATATTGGCGGTGTTTTATTAAATTCTGAGAATCTTGCATAATTAAAATGATAGTACACAATTTATCTTATCTTAGTTTTGTTGGTTTATATATTGCTGTTTTATTTATGGTTTGGTTTTGATAAAATAGGTAAAAGGATTTTGTAGTAAGAAGTTCAAGTCAAAATATAGTTTTATTAAGGTTTATGTGAGTTGCTTTTGTTTAGAAAATAGGAATAATAAAGTAAAATGAAATTTTATATAAGAAGGGATTAGGTTGTAAGGGAAAAATTAATAAGTTTTCTTGATAAATTATATGAACATGT\n>URS00014E047D rRNA from 1 species \nGACGAACCGTGCGAACGTTGTTCGGATTCACTGGGCTTAAAGGGCGCGTAGGCGGACGGTCAAGTCAGGGGTGAAATCTTTCAGCTCAACTGGAAAAGTGCCTCTGATACTGATCGTCTCGAGGGAGGTAGGGGCATGTGGAACTTCCGGTGGAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGTGGGCTGGGCCGGAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS000238B563 lncRNA from 1 species \nATTCTCTCTCCATTTTAGAGAGAGAGTTGAGATGGAAATTATAATTTTCTCTCGATTTTAGAGAAACAGGTTTTTATTTTTTTGTGAGGCAAAGGATTTTGATTCGTGTCAATTTACGGCCTCTACCTCAATTGGACAGATGTGGCTCTCTTTACCTCTCTCAAAAATGTGTTTCTTCCTCCCTGTCCTTCCGGGTGAGAGTGTAAATAGATTTTGATCTGTGGTTTTTCGGCAGGAGATAGTTATTTGTGAGGGAGTCTCCATTTTCCTACCAAATAATTTGGTTGCATGTTTGTTTTCTTTTTCTCTTCCTTTGTGTTTTGCAGATGGAGGATTCCTGGCGGTGCTTTTTCTAGTTTGTTCTTCTGCCATTAGGAAACGATGGAGAGATCTATACTTTTCAATCTCGTAATCGACGCTTTTGTCCTAAGTTCTCATTCCTTGGCTCGAGAGGATGGTGGGTGGACTCGATTGCAAAAGTCTCTTTTCTCTTTCTATTGTATTCATCGTTCATCTCTCAACCTTGCTAGGGCTGCATGCGTTTTTCTGCTCGGTGCCATCCTTTGTTTCTATTGCTTTAGTTGCCGGAAAAGAACTACTGTTCGGAAAAAAAAAACTTATTTCCTCTTATCGGCCATGGCAACTGAGTTTTTGGGTCTTAGGGTTTCTATGTGTTTGAGTTGCCTCCAAATAAAAGTTTG\n>URS00021B94DD lncRNA from 1 species 
\nAGTTGGTGAACACAATAGCAAATCTTTTTAATAAAAATAACAGCAATAAAAAAATAACAAATATTTGAAATTTGATATTAAAATATGAACAATGACAAAAATACTGAAAGAAGTTACAATATTAACAAATATTGATATAAAACAATGGTTAAAAAATTGTCTTCATAAACAATAGCACGTGCATTTTTCTCGTGCAGTTACGTCAGGTGACCATGTATTCAGTGAATCACAAGTAATAAATAAACAAAAAATATGAGTGTGTCTTACCTGAGTTATACATGTTATAACCAACAAAAGTATTAAAAGTCTTAAAACATTTTTAAATATTATAATAATATGCCCTAGCAAGATACATAAACAATCAACCTTAAGAAAAACAATAACAAAAGTAAACCTAATTTAGGTAAACATGATAACATGGTACGCATTTAACAAAAAAAATTAAAAATTAAAAAAAAAATTCTGAAAAACTTGGATCATTTTTAGAACACAAAATATTAACATTGATGAAATAGTGTCATAGCCTATGAGGAAATCGTTTTAAAATCAAGTTACTTCCCAAATAACTGACATCTACTTTACATGTGTATATGTCTCATCCCCACTTTGAAGATGTAGATTTG\n>URS0000350E7B rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGGTAAGGCCCTTCGGGTACACGAGCGGCGAACGGGTGAGTAACACGTGGGTGACCTGCCTCTAGCTCTGGGATAAGCCTGGGAAACTGGGTCTAATACCGGATATGACTCCACGGCGCATGTTGTGGGGTGGAAAGCCTTGTGTGGCTAGAGATGGGCCCGCGGCCTATCAGCTTGTTGGTGGGGTGATGGCCACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGCGACCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCGACGCCGCGTGAGGGATGACGGCCTCGG\n>URS00015AB4C8 rRNA from 1 species \nTACGGAGGATCCAAGCGTTATCCGGAATCATTGGGTTTAAAGGGTGCGTAGGCGGGTATGTAAGTCAGTGGTGAAATCCTGGAGCTTAACTCCAGAACTGCCATTGATACTATATATCTTGAATATTGTGGAGGTTTGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCTATTGCGAAGGCAGCAGGCTACACATATATTGACGCTGAGGCACGAAAGCGTGGGGATCAAACAGG\n>URS0000254467 rRNA from 1 species \nATTGAACGCTGGCGGCAGGCTTAACACATGCAAGTCGAACGGTAACATGAAGAAGCTTGCTTCTTTGATGACGAGTGGCGGACGGGTGAGTAATGCTTGGGAATCTAGCTTATGGAGGGGGATAACTACGGGAAACTGTAGCTAATACCGCGTAGAATCGAGAGATGAAAGTGTGGGACCTTCGGGCCACATGCCATAGGATGAGCCCAAGTGGGATTAGGTAGTTGGTGAGGTAAAGGCTCACCAAGCCGACGATCTCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGGACTGAGACCTGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGCAATATTGCGCAATGGGGGCAACCCTGACGCAGCCATGCCGCGTGAATGAAGAAGGCCTTCGGGTTGTAAAGTTCTTTCGGTAGCGAGGGAAGGCATTTATGTTTAATATGATCTAAG\n>URS0001ED777B rRNA from 1 species 
\nTCATATGCTTGTCTTAAAGATTAAGCCATGCATGTCTAAGTATAAGCTTTTATACGGCTAAACTGCGAATGGCTCATTAAAACAGTTATAGTTTATTTGATGGTCTTTACTACATGGATAACCGTGGTAATTCTATGGCTAATACATGCGCACATGCCTCTTCCCCTGGAAGGGCAGTGTTTATTAGATACAGAACCAACCCACCTTCCGGTGGTCCTCAGGTGATTCATAGTAACCGAACGGATCGCGTTGACTTCGGTCTGCGACGGATCATTCAAGTTTCTGACCTATCAGCTTTCGACGGTACTGTATTGGACTACCGTGGCAGTGACGGGTAACGGGGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACATCTAAGGAAGGCAGCAGGCAAATTACCCAATCCTGATTCAGGGAGGTAGTGACAAGAAATAACAACACTGGAAATTTCATTTCTAGTGATTGGAATGATAGGAATCCAAACCCCTTTCAGAGTAACAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGCTGGAAGCAGCCAGTCCGCCCTCAGGGGTGTGCACTTGGTGAATTCTAGCATCCTTCTGGATTTCTCCACACTTCATTGTGTGGAGTTTTTTCCAGGACTTTTACTTTGAGAAAATTAGAGTGTTTCAAGCAGGCTTGTCGCCTTGAATACTGCAGCATGGAATAATAAGATAGGATTTCGGCCCTATTTTGTTGGTTTCTAGGACTGAAGTAATGATTAATAGGGACGGTTGGGGCATTCGTATTTAACTGTCAGAGGTGAAATTCTTAGATTTGTTAAAGACGAACTACTGCGAAAGCATTTGCCAAAGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGCTCGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGAGATAGGAAAACGTCATGCTTGACTTCTCCTGCACCTTATGAGAAATCAAAGTCTTTGGGTTCTGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGCGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTCACCAGGTCCAGACATAGGAAGGATTGACAGATTGATAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGTGATTTGTCTGGTTAATTCCGTTAACGAACGAGACCTTAACCTGCTAAATAGGATCAGGAACTTCGTGTTCTTGTATCACTTCTTAGAGGGACTTTGCGTGTCTAACGCAAGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCTGCACGCGCGCTACACTGATGCATCCAACGAGTTTATAACCTTGGCCGATAGGTCTAGGTAATCTTGTGAGTATGCATCGTGATGGGGATAGATTATTGCAATTATTAATCTTCAACGAGGAATGCCTAGTAGGCGCAAGTCAGCAGCTTGCGCCGATTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTCCTACCGATTGAGTGTTCCGGTGAATTATTCGGACCGTTTTGTGGCGCGTTCGTGCCCGAAATGGGAAGTTTTGTGAACCTTAACACTTAGAGGAAGGAGAAGTCGTAACAAGGT\n>URS00019AFD52 lncRNA from 1 species 
\nGCTTAGGCCACCATGCAGCCTTATTTCTTGACCCTGCTTTAACTCCTACTCCTGATGTGAGCCGGAAAAGGACTCCCCATGTCCACCTTCTTTGGGTGTAGGTTCCATTTCTACCCCCAGTGGGGTCCAAAAAGGTTTCTCTTCGCCATTGCAGTTTCTTCTGCTGTTTCCTTGCATTCTGGGGCCCTGTTTGTGCACATAACCTTTGCCTCACCTATGTGGCCGCCTCTTGCCCCTGAGCGCTGGCCGTCCCTGTTGGACCGGCTAGTGACCTGACTCCATGGCCGCCCAGCAGTGCCATCGCAGGCCGGGCTGCCTTCAGGCAGACCCAGGCACACTTGCGGTATGTGAAAGCAAGCATTCCTGCCTTTCAGTCATGAAAAGAATGTCCTTGGCCTCTACGTTACGGTGACGCTAGTGGATAGCTTAGCCCGCACAACCCTGCCTCCTCCTCCCGGGGCCTGGGGCTGGCCCTCCTCTCCTGCCTCCCACACCTGGCCACCAGAACCCCTACCACCCTGCACCTGGTGGATCGCTCAGAGCGCACACCCCCTGGTGCTGACCAGTCGGGGAGCGCCTGGACGCAGCGACCTCTGGCCGGCTTTCGGTGTTCTCATGCGTGCGAAGAGAGCGCGTGAGGAAAGCCGCGCGGGGTCGGCAGGGTCGGCGGCCGGTGCGGACGCGCCTCGGCGGCGCGCGGCGGC\n>URS00001839AB rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGGAGTTGATCCTTCGGGATTAACTTAGTGGCGGACGGGTGAGTAACGCGTGGGTAACCTGCCGTATGCTGGGGGACAACAGTTGGAAACGACTGCTAATACCGCATAAGCGCACAGTACCGCATGGTATAGTGTGAAAAACTCCGGTGGCATACGATGGACCCGCGTCTGATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGTCGACGATCGGTAGCCGACCTGAGAGGGTGATCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGGGCAATGGGCGAAAGCCTGACCCAGCAACGCCGCGTGAAGGAAGAAGGTCTTCGGATCGTAAACTTCTGTCCTAAGTGAAGAGCAGAAGACGGTAACTTAGGAGGAAGCCCCGGCTAACTACGTG\n>URS00002AB1FD piRNA from 1 species \nTGGAAATGAAACAGTCTTTAATGTCTA\n>URS0001E049BC rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGGGCCTTGTCCCCTTTTTTTTTGGGGGTGGGGTTAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCCTCACTTCTGGATAACCGCTTGAAAGGGTGGCTAATACGGGGTGTTCTGGCCTGCTCGCATGGGTGGGTTTGGAAAGATTCGACCGGTTTTGGTTGTTTTGGTGGGGGATGGGCTCGCGGCCTATCAGCTTGTTGGTGGGGTGATGGCCTGCCAAGGCTTTGACGGGTAGCCGGCCTGAGGGGGTGGGCGGTCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGCGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGAGGGATGGAGGCCTTCGGGTTGTGAACCTCTTTCGCCAGTGAAGAAGGTCCTGCTCTTTGTGGTGGGGTTGACGGTAGCTGGGTTAATGAAGCGCCGGCTAACTACGTG\n>URS0000DC40A1 rRNA from 1 species 
\nAACTCAAATGAATTGACGGGGCCCGCACAAGCAGCGGAGCGTGTGGTTTAATTCGATGATACGCGAAGAACCTCACCCAGGTTTTGACATGCATGTGGTACCAAGGTGAAAGCTGAGGGACCCTTCGGGGAGCATGCACAGGTGTTGCACGGCCGTCGTCAGCTCGTGCCGTGAGGTGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTGTCGCCAGTTGTATTTTTCTGGCGAGACTGCCGAGAAAACCTCGGAGGAAGGAGGGGACGATGTCAGGTCAGCGTGGCCCTTACGCCTGGGGCTACACACACGCTACAATGGGCAGTACAACGGGTCGCGAAGCCGCGAGGTGGAGCTAATCCCATCAAAGCTGTCCTCAGTTCGGATTGCAGGCTGAAACCCGCCTGCATGAAGCCGGAGTTGCTAGTAACCGCAGGTCAGCATTACTGCGGTGAATACGTTCCCGGGCCTT\n>URS00009444FC ncRNA from 1 species \nCATCGAGTTGGTGCGCTAGGCCGCGACGAGTAGGAGGGCCTCGGCGGCGGGCGTAGAAGCCTAGGGCGCGAGCCCGGGTGGAGCAGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGGCCGAAGTGGAGAAGGGTTCCATGTGAACAGCAGTTGAACATGGGTCAGTCGACCCTAAGGGATAGGCGAAGGCCGTTCTGAAGCGGGGTGATGTTCGCGTCGCCCCGGCGGACCGAAAGGGAATCGGGTTAATATTCCCGAACCTCGACGCGGAGATTGGCGCTCCGGCGCCTAGTGCGGCAACGCAAACGAACTCGGAAACGCCGACGTGGGTCCCGGGAAGAGTTCTCTTTTCTTGGTAAGGGGCGGCGACCCTGGAATCGGTTCGCCCGGAGATAGGGACATGGGCCCCGTAAAGCAGCACGTCTCTTGTGCTGTCCGGTGAGCTCGCGTCGGCCCTTGAAAATCCGAGGGAGACGGTGTAATTTTCGTGCGAGGTCGTACCCATATCCGCAGCAGGTCTCCAAGGTGAACAGCCTCTGGCCGATAGAACAATGTAGGTAAGGGAAGTCGGCAAACTAGATCCGTAACTTCGGGAAAAGGATTGGCTCTAGGGGCTGGGTCGGTCGGGCTGAGGTACGAAGCGGGGCGCGGCGCTGTACCGGACTGGGCG\n>URS0000B3F0C3 misc_RNA from 1 species \nAATAAGATTAAATTTTGTAACAGATCAATGAGATCCAGAGCAGACATTCTTAAAGACAACTAAGAAAACAAAAATCATATGTAGAATCTTTCAATATTACAAATGAAAAATCAAGATTTCCTTATTGCTCATCTACCGGTTTGAATCCTTAACAAATCGCAAACCAAAGCTATTATGGAAACCACAAAGTAGTACTCCAGCTTTCGCCTTCTCGGGCTTTTCCTTCAAGCTGTGTCCAATTCCATTCATTCTCCTCCTCCTCCACAATCTTGCCTTTAAAAATTCACTCCAAGGGTTAACCATAGAAGAGCGACAATGAGTACGATCGGAGCCCAAGAAAAGAGCGGTGCCGGGGACTGGACAAATTTTCCTCTGTCTCGGCGGCGGCGACGTTCTTGATCCTCCAAGAGATGGCAGTATCATGAGATGGCGTTCAATATGATGGCAAAGTGACACCAAACTCATATGAGTCGT\n>URS000206F7FE rRNA from 1 species 
\nATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACAGACGAGGAGCTTGCTCCTCTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATATTGAACCGCATGGTTCAATAGTGAAAGACGGTTTTGCTGTCACTTATAGATGGATCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCGACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACCCGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACAAATGTGTAAGTAACTATGCACGTCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTG\n>URS00022DD3B1 rRNA from 1 species \nCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAATTTCGGGGTTAGTAGGTTGGTCATGCCTCTGGTATGTACTGGTCTCACTGATTCCTCCTTCCTGATGAACCTTAATGCCATTAATTTGGTGTTTTGGGGAATTTGGACTGTTACTTTGAAAAAATTAGAGTGTTTAAAGCAAGCTAACGCTTGAATACATTAGCATGGAATAATGAAATAGGACGTTCGATCCTATTTTGTTGGTTTCTAGGATTGACGTAATGATTAATAGGGAGAGTCGGGGGCATTAGTATTCAATTGTAAGAGGTGAAATTCTTGGATTTATTGATGACTAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTAGGGGATCGAAGACGATCAGATACCGTCGTAGTCTTAACCATAAACTATGCCGACTAGGGATCGGATGATGTTAATTTTTTAATGACTCATTCGGCGCCTTACG\n>URS00017ABA52 rRNA from 1 species \nCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGCCGGAAGGCTGAACCAGCCATGCCGCGTGAAGGTCAGTGCCCTATGGGCGTTAAACTTCTTTTGTGCGGGAGCAATAATGGTCGCGTGTGGCCAGACGAGAGTACCGTACGAATAAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGGGGATGCAAGCGTTATCCGGGTTTATTGGGTTTAAAGGGTGCCTAGGCTGGGAGGTAAGTCAGCGGGGAAATGCCCCCGCGCAACGGGGTGAAGTGCCATTGATACTGCCTTGCTGGAATGCGGATGCCGTAGGAGGAATGTGTGGTGTAGCGGTGAAATGCATAGATATCACACAGAACACCGATTGCGAAGGCATCTCACGAATCCGCGATTGACGCTGATGCACGAAAGCGTGGGTATCAAACAGGATTAGATACCCCGGTAGTC\n>URS0001280152 rRNA from 1 species 
\nGACTAACGCTGGCGGCAGGCTTAACACATGCAAGTCGAACGCATCCTTCGGGGTGAGTGGCAGACGGGTGAGTAACGCGTGGGAACGTGCCCTTCAGTTCGGGATAACCCAGGGAAACTTGGGCTAATACCGGATACGTGCGAGAGCAGAAAGATTTATCGCTGAAGGATCGGCCCGCGTCTGATTAGCTAGTTGGTGGGGTAATGGCCCACCAAGGCGACGATCAGTAGCTGGTCTGAGAGGATGATCAGCCACATTGGGACTGAGACACGGCCCAAACTCCGACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCATGAGTGATGAAGGCCTTAGGGTTGTAAAGCTCTTTCGTCCGGGACGATAATGACGGTACCGGAAGAAGAAGCCCCGGCTAACTTCGTGCCAGCCGCCGCCGTAA\n>URS00025670D8 misc_RNA from 1 species \nAACGCACATTGCGCCCCTTGGTATTCCATTGGGCATGCCTGTTCGAGCGTCATTTACCCCTTCAAGCTCCGCTTGGTGTTGGGCGTCTGTCCGCGTTTCCGGCGCGGACTCGCCCCAAATCCATTGGCAGCGGCTCCGCCGGCTTCTCGCGCAGCACATTGCGCTCTGGGAGGCTCTCGGCGGGGCCCGCGTCCACCAAAGCAACCCCCCATTTTGACCTCGAATCAGGTAGGGATACCCGCTGAACTTAA\n>URS000223CBAB misc_RNA from 1 species \nAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAATTTCGGGGTCAGCAGGTTGGTCGTGCCAATGGTATGCACTGGCCTTGCTGATTCCTCCCTCTTGATGAGCCGTAATGCCATTAATTTGGTGTTGCGGGGAATCAGGACTGTTACTTTGAAAAATTAGGGTGTTTAAAGCAGGCAAGCGCTTGAATACATTAGCATGGAATAATGAAATAGGACGTTCGATCCTATTTTGTTGGTTTCTAGGATTGACGTAATGATTAATAGGGATAGTTGGGGGCATTAGTATTCAATTGTCAGAGGTGAAATTCTTGGATTTATTGAAGACTAACTACTGCGAA\n>URS0000D99911 rRNA from 1 species 
\nGGGTAAGTCGGGACCTAAGGCGAGGCCGAAAGGCGTAGTCGAAGGACAACAGTTTGAAATTACTGTACCACCGTAATCCGCTATGAGCGATGGGGTGACGCAGGAGGGTAGTGACGCGGACTGATGGATATGTCCGTCTAAGCAGTGAAGAGGCAGACCAGGGGAACTGAAACATCTAAGTACCCTGAGGAAGAGAAAACAATAGTGATTCCGTCAGTAGCGGCGAGCGAACGCGGAACAGCCTAAACCAAGGGGCTTGCCCCTTGGGGTTGTGGGACGTCTCACATGGAGTTACAAAGGAATATGGTAGGCGAAGAGGTCTGGAAAGGCCCGCGATAGAGGTAAAAGCCCTGTAGCCTAAACTGTGTTCTCTCCGAGACGGATCCCGAGTAGTGCGGGGCACGTGAAACCCCGTATGAATCCAGCAGGACCATCTGCTAAGGCTAAATACTACCTGGCGACCGATAGTGAAACAGTACCGTGAGGGAAAGGTGAAAAGCACCCCGGAAGGGGAGTGAAATAGAACCTGAAACCGTGTGCTTACAAAAAGTCAGAGCCCGATCTATGGGTGATGGCGTGCCTTTTGTAGAATGAACCGGCGAGTTACGTTTAACATGCAAGGTTAAGGTGAGAAGCCGGAGCCGCAGCGAAAGCGAGTCTGAATAGGGCGACTAAGTATGTGGACGTAGACCCGAAACCGTGTGATCTACCCCTGTCCAGGGTGAAGGTGCGGTAACACGCACTGGAGGCCCGAACCCACGCATGTTGAAAAATGCGGGGATGAGGTGGGGGTAGCGGAGAAATTCCAATCGAACTCGGAGATAGCTGGTTCTCCCCGAAATAGCTTTAGGGCTAGCCTCGGTGAATGGAGTGGTGGAGGTAGAGCACTGATTGGGTGCGGGGCCCGCAAGGGTTACCAAGCTCAGTCAAACTCCGAATGCCATTAACTTCTTGCCGGGAGTCAGACAGTGAGTGCTAAGATCCATTGTCAAAAGGGAAACAGCCCAGACCATCAGCTAAGGTCCCCAAGTGTGTGTTAAGTGGGAAAGGATGTGGAGTTGCACAGACAACCAGGATGTTGGCTTAGAAGCAGCCACCATTGAAAGAGTGCGTAATAGCTCACTGGTCGAGTGACTCTGCGCCGAAAATGTAACGGGGCTAAACACACCACCGAAGCTATGGCTAGATGCTTTGCATCTGGGGTAGGGGAGCGTTGTATGTGGGTTGAAGGTGTACCGTAAGGAGCGCTGGACAGCATACAAGTGAGAATGCCGGTATGAGTAACGAAAAGATCAGTGAGAATCTGATCCGCCGAAAGCCCAAGGTTTCCTGAGGAAGGCTCGTCCGCTCAGGGTAAGTCGGGACCTAAGGCGAGGCCGAAAGGCGTAGTCGAAGGACAACAGTTTGAAATTACTGTACCACCGTAATCCGCTATGAGCGATGGGGTGACGCAGGAGGGTAGTGACGCGGACTGATGGATATGTCCGTCTAAGCAGTGAAGCTGATGTGTAGGCAAATCCGCACATCAATAAGGCTGGGCTGTGATGGGGAGCGAAAATTGTAGTAGCGAAGCTGGGGTAGGGGAGCGTTGTATGTAGGTTGAAGGTGTACCGTAAGGAGCGCTGGACAGCATACAAGTGAGAATGCCGGTATGAGTAACGAAAAGATCAGTGAGAATCTGATCCGCCGAAAGCCCAAGGTTTCCTGAGGAAGGCTCGTCCGCTCAGGGTAAGTCGGGACCTAAGGCGAGGCCGAAAGGCGTAGTCGAAGGACAACAGTTTGAAATTACTGTACCACCGTAATCCGCTATGAGCGATGGGGTGACGCAGGAGGGTAGTGACGCGGACTGATGGATATGTCCGTCTAAGCAGTGAAGCTGATGTGTAGGCAAATCCGCACATCAATAAGGCTGGGCTGTGATGGGGAGCGAAAATTGTAGTAGCGAAGGTCATGATCTCACACTGCCAAGAAAAGCCTCTAGCCAGGAGAAGGTGCCCG
TACCGCAAACCGACACAGGTAGGCGAGAAGAGAATTCTAAGGCGCGCGGAAGAACTCTCGTTAAGGAACTCGGCAAAATGACCTCGTAACTTCGGGAGAAGAGGTGCCTCGGTAGGGTGAATAGCCCGAGGGGGCCGCAGTGAAAAGGCCCAAGCGACTGTTTAGCAAAAACACAGGTCTGTGCGAAGCCGCAAGGCGAAGTATACGGGCTGACGCCTGCCCGGTGCTGGAAGGTTAAGGGGAGTGGTTAGGCCGAAGCTGTGAACCGAAGCCCCAGTAAACGGCGGCCGTAACTATAACGGTCCTAAGGTAGCGAAATTCCTTGTCAGGTAAATTCTGACCCGCACGAATGGCGTAACGACTTGGGCGCTGTCTCAACGAGAGATCCGGTGAAATTTTAATACCTGTGAAGATGCAGGTTACCCGCGACAAGACGGAAAGACCCCATGGAGCTTTACTGCAGCTTGATATTGAATTTGGGTACGATCTGTACAGGATAGGTGGGAGCCGTTGAGGCAGGAGCGCAAGCTTCTGCGGAGGCGCCGTTGGGATACCACCCTGATCGTATCTAGGTTCTAACCTAGTGCCCTTACCGGGTACGGGGACCGTGTCAGGCGGGCAGTTTGACTGGGGCGGTCGCCTCCTAAAGAGTAACGGAGGCGTTCAAAGGTTCCCTCAGAATGGTTGGAAATCATTCGCAGAGTGCAAAGGCATAAGGGAGCTTGACTGCGAGACCTACAAGTCGAGCAGGGACGAAAGTCGGACTTAGTGATCCGGTGGTACCGCATGGAAGGGCCATCGCTCAACGGATAAAAGCTACCCTGGGGATAACAGGCTTATCTCCCCCAAGAGTCCACATCGACGGGGAGGTTTGGCACCTCGATGTCGGCTCATCGCATCCTGGGGCTGAAGTAGGTCCCAAGGGTTGGGCTGTTCGCCCATTAAAGCGGTACGCGAGCTGGGTTCAGAACGTCGTGAGACAGTTCGGTCCCTATCTGTCGTGGGCGCAGGAAATTTGAGAGGAGCTGTCCTTAGTACGAGAGGACCGGGATGGACGTACCGCTGGTGCATCAGTTGTTCCGCCAGGAGCATGGCTGAGTAGCTACGTACGGACGGGATAAGCGCTGAAAGCATCTAAGCGTGAAGCCCCCCTCAAGATGAGATTTCCCAATTAGTAAGACCCCTTGAAGACGACGAGGTAGATAGGTTGGAGGTGGAAGTGCAGCAATGCATGGAGCTGACCAATACTAATCGGTCGAGGGCTTATCCAA\n>URS000235B2B5 lncRNA from 1 species 
\nAACTGTTGCGGCAGCCATGCTTGTGAGCTTATGATGTGCCGCTAGTTTAGTTTGTCGGTTTCTGTGAACCGTTCTCTGTGATGTATGATGTATTGCTGCTGTTAGCTGTAAATGTGTTGTATGATGAGTTGACTTGATGGTTCGTTTGAGGCTGTCTTGTGAAGGTTACTGTTAGTTAACATGAGTTAAACAAATACATACACTTGCTGCTGTTAGCTGTAAACATGAGTTGACTTGATGGTTCGTTTGAGGCTGTCTTGTGAAGGTTACTGCTAGTTAACATGAGTTAAACTATTACATGCACTGGGACCCATTTGACTAGTGGACCCATTTAATAAAAATAAAAATGAAATTGTTTAGACAAAAAGGCCACGGCCCAACAATAAAAAAGGCTGCAACGTTGGGCTTGGCCCATGAAGTCGACCAAAAATTAACAGAAAAAGGCTGAATTGTTGGGCTCGGCCCATCTAAAGCAGCGAAATGGACCGGGCTGATTCTTATCAACGACCTTTTCATTTGGTCGCAATTTTGCCACGTCAGATTGCCACGTCGGATCCGACGGGGCCTGGGCAGAGAGCTAGCGACCAAAATAGAAGGTCACAGAATCAACGACCTTTTGTTTTGGTCGTGGAATTCCACGACATTCTCAAAGAGAAGGTCGTTAATTTCAATTTACGACCGCCAGCTTTTGACCATCTATTTTTGGTCAAAAAAAGGTCGCAAATGAAAATCAATGACCTTTCAGTGACCAATAGTGAGGATTGCAAGTTGACATATTTCTTGTAGTGAATTCCGGATAACTTCATAATATATTATGAAGCCTCTGCTTGGCTCAATGGATAGGCGTACAAGTCGCCGCCACTGTGTTTTGATTAACTTCAACAACCAGTTGGGATGAATCATCAGCTGGGTTATTGACACAGCCCATACGGGATCATTTATAACCCGCCGAGGGTTCCGCTGTTTAACAATATGTCGGTTTATATCACGGTCAAGTATGGAGAATCTCAAGACAACTCCTCGAGTCGTCTTAAGACTCGGGGGCTACAATGACATGACTCAGCAAATCCTGCCAGCTTCAGCTAATTCAAGAACCCCGGGTCATTGGAGGGAAGATAACCCGGTCCCAGAGGCTACTGCTATATTGATGAAAATTTAAAGGCCGTCAGAAAATTCCTGGCTTAAAATGAAGAATTCGGGATTAAAATCCAGCTCAAGGGAAATCTATCTCTCATAAAGCTTTGAAGCTCTCAACATCCGGTTTAAAATTCCGGTTCAAAAAGAATCCTTCTCTCGCAAGTTCGAGTTCAAGAAAAATTAAAGGTTGCCAAAGAGAACTCGCTACCATGATGCGCGGTTCAAACATGGGTATCCTGCCTTATTGGCTTATCACATTATTGATCACTTGGGGGCTTGCTGCTCATTGAGCATAGCTATGACTACCTTCTTAATCCGGCTTGTACGCCATGATTACAAAATACTTGGGGGCTTCCTGCTCATTGAGCATAGCTGTGATTACCCTATTGATAACCCACTTGGAGACTTGATGCCCGGGTTAAAGGTACCAAAGAGAGTCTATTGCAGAGCACAGCTCAAACATAGGTACCCTGCTTTGATGGCTCAATATATATCACTTGGGGGCTCCCTGTTCATTGTAACATAGCTTTGGTAACCATTTTGATTGGCTTGAAACGCCAGGTGTATACACCAAAAAATTTCAGTTGATCCTGCCTTTTACGTCTGCCACTTCGCTCAGGTAATCCTGGAATGACCCACCGAACTCTTAACAGTCAATCTTATTAAGACCCTGAACTTGTCAAGGTTAAAACGGCGGTTGGTCATGTGAGGCCCGACTTATAAGGTTTGAATGAAGGATTAACTTAGCGGTTGTGCAAGCCTATGAAAAGCACTTGATGATTGAGGCCTGGCCGCCTATGAAAGCCTTGATTTTTTGTTATTTGTTTTTGAACGATGTTTGAGTTCATACCTTTTTTGATA
TATGGTTTAAACTGATTCAGGCCATGTAGCCTTAATCCTTATGACTCGTATTTGAGCATATTTGGGGTTTGATAACCCAGCCTGGCTTTGGATGATAAGTCGCCAGTATGCTTTGATTGTGCGCTGATGTCTACTACGCAACCTTCTTCTTGTAGACGTTGTTGGGCCTCCAAGTGCAGAGGTTTGTAGGACAATAGCAAATTTCCCTCAAGTGGATGACCTAAGGTTTACCAATCCATGGGAGGCGTACGATGAAGATGGTCTCTATCAAACAACCCTGCAACCAAATAACAAAGAGTCTCTTGTGTCCCCAACACACCCAATACAATGGTAAATTGTATAGGTGCACTAGTTCGGCGAAGAGATGGTGATACAGGTGCAATATGGATGGTAGATATAGGTTTTTGTAATCTGAAAATATAAAAACAGCAAGGTAACTAATGATAAAAGTGAGCACAAACGGTATTGCAATGATAGGAAACAAGGCCTATGGTTCATACTTTCACTAGTGCAATTTCTCTCAACAATAATAACATAATTGGATCATATAACTATCCCTCAACATGCAACAAAGAGTCACTCCAAAGTCACTAATAGCGGAGAACAAATGAAGAGATTATGGTACGGTACAAAACCACCGCAAAGTTATTCTTTCCGATCAATCCATTGTGCTATTCATATAAGTGTCACAAACAGCCCTAGAGTTCGTAGTAAAATAACACCTTAAGACACACATCAACCAAAACCATAATGTCACCTAGATACTCCAATGTCACCTCAAGTATCCGTGGGTATGATTATACGATATGCATCACACAATCTCAGATTCATCTATTCAACCAACACATAGAACCTCAAAGAGTGCCCCAAAGTTTCTATCGGAGAGTCAAGACGAAAACGTGTGCCAACCCCTATGCATAGGTTCATGGGCAGAACCCGCAAGTTGATCACCAAAGCATACATCAAGTGAATCAATAGAATAACCCATTGTCACCACGGTTATCCCACGCAAGACATACATCAAGTGTTCTCAAATCATTAAAGACTCAACCCGATAAGATAACTTCAAAGGGAAAACTCAATCCATTACAAGAGAGTAGAGGGGGAGAAACATCATAAGATCCAACTATAATAGCAAAGCTCGCCATACATCAAGATCGTGCCAAATCAAGAACACGAGAGACAGATCAAACACATAGCTACTGGTACATACCCTCAGCCCTGAGGGTGAACTACTCCCTCCTCGCCATGGAGAGCGCCGGGATGATGAAGATGGCCAGCGGTGAGGGATCCCCCACCCCTCCGGAAGGGTGCCGGAACTGGGTCCCGATTGGTTTTTGGTGGCTACAGAGGCTTGCGGCGGCGGAACTCCCGATCTATTCTGTTTTTCGAAGGTTTTTGGGTATATTGGTATATATAGGAGGAAGAAATACGTCAGGGGAGCCACGAGGGTGGAGGGCGCGCCCAGGGGGGTGGGCGCGCCCCCTGCCTCGTGCCCTCCTCGTTGATTTCCTGACGTGCACTCCAAGTCCCCTGGATTGCTTCCATTCCAAAAATAACTTTCCCAAAGGTTTCATTCCGTTTGGACTCCATTTGATATTCCTTTTCTGCGAAACACTGAAACAAGGGAAAAACAGAAACTGGCACTGGGCTCTTGGTTAATAGGTTAGTCCCAAAAATAATATAAAAGTGTTTAATAAAGCCCATAAACATCCAAAACAGATAATATAATAGCATGGAACAATCAAAAATTATAGATACGTTGGAGACGTATCAGCATCCCCAAGCTTAATTCATGCTCGTCCTCGAGTAGGTAAATGATAAAAACAGAATTTTTTATGTGGAATGCTACCTAACATAATTATCAATGTAATCTTTTTTATTGTGGCAAGAATATTCAGGTCCATGAGATTCAAGACAAAAGTTTAATATTGACATAAAAATAATAATACTTCAAGCATACTAACTAAGCAATCATGTCTTCTCAAAGTAACATGGCC
AAAGAAAGTTCATCCCTACAAAATCATATAGTTTGGTCATGCTCCATTTTCATCACACAAGAATGCTCTCGTCATGCACAACCCCGATGACAAGCCAAGCAATTGTTTCATACTTTAGTAATATCAAAATTTTCAACCTTCACGCAATACATGAGCGTGAGCCATGGATATAGCACTATGGGTGGAATAGAATATGATGATGGGGGTTATGTGGAGAAGACAAAAAAGGAGAAACTCTCACATTGACGCCGCTAATCAACGGGCTAGGGAGATGCCCGTCAATTGATGTCAATGCAAGGAGTAGGGATTGCCATGCAACGAATGCACTAGAGCTATAAATGTATGAAAGCTCAACAAAAGAAACTAAGTGGGTGTGCATCCAACTTGCTTGCTCATGAAGACCTAGGGCACTTGAGGAGGCCCATTGTTCGAATATACAAGCCAAGTTCTATAATCAAAAATTCCCACTAGTATATGAAAATGACAAAACAAGAGACTCTCTATCATGAAGATTCTGGTGCTACTTTGAAACACAAGTGTGGTAAAATGATAGTAACATTGTCCCTTCTCTCTTTTTCTCTCATTTTTTTGGGCCTTCTCTTTTTTTATGGCCTTTCTCTCTCTTTTTTTTATAGTCCTCACTTGGGACAATGCTCTAGAAAATGATGATCATCACACTTCTATTTATTTACAACTCAATGATTACAACTCGATACTAGAACAAAGTATGACTCTATATGAATGCCTCCGGCGGTGTACCGGGATATGCAATGAACCAAGAGTGACATGTATGAAAGAATTATGAATGGTGTCTTTGCCACAAATACTATGTCAACTACAAGATCATGCAAAGCAATATGACAATGATGAACGTGTCATGATAAACGGAACGGTGGAAAGTTGCATGGCAATATATCTCGGAATGGCTATGGAAATGCCATAATAGGTAGGTATGCTGGCTGTTTTGAGGAAGATATAAGGAGGTTTATGTGTGAAAGAGCATATCATATCACGGGGTTTGGATGAACCGGCGAAGTTTGCACCAACTCTAAATGTGAGAAAGGGCAATGCACGGTACCGAAGAGGCTAGCAATGATGGAAAGGTGAGAGTGCGTATAATCCATGCACTCAACATTAGTCATCAAGAACTCACATACTTATTGCAAAAATCTACAAGTCATCAAAAACCAAGAACTACGTGCATGCTCCTAGGGGGATAGATTGGTAGGAAAAGACCATCGCTCGTCCCCGACCGCCACTCATAAGGAAGACAATCAAGGAACACCTCATGTTTCAAATTTGTTACATAACGTTTACCATACGTGCATGCTACGGGACTTGCAAACTTCAACACAAGTATTTCTCAAATTCACAACTACTCAACTAGCACAACTTTAATATCACTACCTCCATATCTCAAAACAAGCATCAAGTATCAAACTTCTCTTAGTATTCAGTGCACTTATATGAAAGTTTTTATTATACCCATCTTGGATGCCCATCATATTAGGACTAGTTACATAACCAAAGCAAACTACCATGCTGTTCTAAAGACTCTCAAAATAATATAAGTGAAGAATGAGAGTTCATCTATTTCTTCAAAATAAAACCACCGCCGTGCTCTAAAAGGATATAAGTGAAGCACTAGAGCAAATGACAAACTACTCCGAAAGATATAAGTGAAGATCAATGAGTAGTCGAATAATTATACAACTATGTGAAGACTCTCTAACATTTAAGAATTTCAGATCTTGATACTTTATTCAAACAAAAAGCAAAACAAAAGAAAATAAAATGACGCTCCAAGCAAAACACATATCATGTGGTGAATAAAAATATAGCTCCAAGTAAAGTTACCGATGAACGAAGAGGAAAGAGGGGATGCCATCCGGGGCATCCCCAAGCTTAGGCTCTTGGTTGTACTTGAATATTACCTTGGGGTGCCTTGGGCATCCCCAAGATTAGGCTCTTGCCACTCCTTATTCCATAGTCCATCGAAT
CTTTACCCAAGACTTGAAAACTTCACAACACAAAACTTAACAGAAAACTCGTAAGCTCCGTTAGCGAAAGAAAACAAAAAACCACTTCATGGTACTGTAATGAAATCATTCTTCATTTATATTGGTGTTAAACCTACTGTATTCCAACTTCTCTATGGTTTATAAACTATTTTACTAGCCATAGAGTCATCAAAATAAGCAAACAACACACGAAAAACAGAATCTGTCAGAAATAGAACAGTCTGTAGTAATCTGTAACTAACGCAAACTTCTGGAACTCCAAAAATTCTAAAATAAATTTTTGGACCTGAGGAATTTGTCTAGTAATCATCTGCAAAAAGAATCAACTAAATAGCACTCTCCAGTAAAAAGTTTAGCTAATCTCGTGAGCGCTAAAGTTTCTGTTTTTTTACAGCATGCTCATAAAGACTTCACCCAAGTCTTCTCAAATGTTCTACTTGGCACAAACACTAATTAAAACACAAAACCACATCTAAACAGAATCTAGATGGATTATTTATTCCTAAACAGAACCAAAAAGTAAGAAACTAAAATTAAGTTGGGTTGCCTCCCAACAAGCGCTAATGTTTAACGCCCCTAGCTAGGCATGATGATTTCAATGATGCTCACATAAAAGATAAGAATTGAAACATAAAGAGAGCATCACGAAGGATATGACTAGCACATTTAAGTCTAACCCACTTCCTATGCATAGGGATTTTGTGAGCAAACAACTTATGGGAACAATAATCATCTAGCATAGGAAGGCAAAACAAGCATAACTTCAAAACTTTAAGCACATAAAGAGGAAACTTGATATTATTGCAATTCCTACAAGCATATGTTCTTCCCTCATAATAGTTTTCAGTAGCATCATGAATGAATTCAACAATATAACCAGCACCTAAAGCATTCTTTTCATGATCTACTTGCATAGAAATTTTACTACTCTCATAAGCAAAATTCTTCTCATTCCGAATAGTGGGAGTATCATAAGAGACTTGAATACTATAAATTGTTTCCACATTAAAAGAGTAATGTTCAGAAAAAGGGTAATCAGAATCATGACAAGTTTTATAAATATAATCATCACTACTTTTTATAGCATAAGTTTCATCACAATAATCAGCATAAGTAGCAACTGTGTTCTCATCATAATCAATTGAAACCTCTTCCGAAATAGTGGATACATCACTAAATAAAGTCATGACCTCTCCAAATCCACTTTCATAAATATTAAAAGATTCAACACCCTCCAAAATAGTGGGATCATTACTTCCTAAAGTTGACACTCTTCCAAACCCACTTTCATCAATATAGTCATCATAAGTAGGAGGCATGCTAACATCATAACAAATTTGCATATCAAAACTTGGGAGGCTAAAAATATCATCTTCATCAAACATAGCTTCCCCAAGCTTGTGGCTTTGCATATCATTAGCATCATGGATATTCATAGAATTCATACTAACAACATTGCAATCATGCTCATCATTCAAATATTTAGTGCCAAAAATTCTAATGCATTCTTCCTCTAGCAATTGAGCACAATTATCGGAATCCTTATTTTCATGAAAGATATTAAAAAGATGAAGCATATGAGGTACCCTCAATTCCATTTTTTTGTTGTTTTCTTTTATAGACTAAACTAGTGATAAGGCAAGAAACTAAAAGATTCGATTGCAAGATCTAAAGATATAACTTCAAGCACTCACCATCCCGGCAACGGCACCAGAAAAGAGCTTGATGTCTACTAAGCAACCTTCTTAGTGTAGACGTTGTTGGGCCTCCAAGTGTAGAGGTTTGTAGGACAGTAGCAAATTTCCCTCAAGTGGATGACCTAAGGTTTATCAATCCGTCGGAGGCGTAGGATGAAGATGGTCTCTCTCAAACAACCCTGCAACCAAATAACAAAGAGTCTCTTGTGTCCCCAACACACCCAATACAATGGTAAATTGTATAGGTGCACTAGTTCGGCGAAGAGATGGTGATACAAGTGC
AATATGGATGGTAGATATAGGTTTTTGTAATCTGAAAATATAAAAACAGCAAGGTAAGTAATGATAAAAGTGAGCACAAACGGTATTGCAATGATAGGAAACAAGGCCTAGGGTTCATACTTTCACTAGTGCAAGTTCTCTCAACAATAATAACATAATTGGATCATATAACTATCCCTAAACATGCAACAAAGAGTCACTCCAAAGTCACTAATAGCGGAGAACAAATGAAGAGATTATGGTAGGGTACGAAACCACCTCAAAGTTATTCTTTCCGATCAATCCATTGGGCTATTCCTATAAATGTCACAAACAGCCCTAGAGTTCGTAGTAAAATAACACCTTAAGACACACATCAACAAAAACCCTAATGTCACCTAGATACTCCAATGTCACCTCAAGTATCCGTGGGTATGATTATACGATATGCATCACACAATCTCAGATTCATCTATTCAACCAACACATAGAACCTCAAAGAGTGCCCCAAAGTTTCTACCGGAGAGTCAAGACGAAAACGTGTGCCAACCCCTATGCATAGGTTCATGGGCGGAACCCGCAAGTTGATCACCAAAGCATACATCAAGTGAACCAATAGAATAACCCATTGTCACCACGGTTATCCCACGCAAGACATACATCAAGTGTTCTCAAATCATTAAAGACACAATCCGATAAGATAACTTCAAAGGGAAAACTCAATCCATTACAAGAGAGTAGAGGGGGAGAAACATCATAAGATCCAACTATAATAGCAAAGCTCGCGATACATCAAGATCATGCCAAATCAAGAACACAAGAGAGAGAGATCAAACACATAGCTATTGGTACATACCCTCAGCCCCGAGGGTGAACTACTCCCTCCTCGTCATGGATAGCGCCGGGATGATGAAGATGGCCACCGGTGAGGGATCCCCCCCCCCTCCGGCAGGGTGCCGGAACAGGGTCCCGATTGGTTTTTGGTGGCTACAGAGGCTTGCGGCGGCGGAACTCCCGATCTATTCTGTTTTTTGAAGGTTTTTGGGTATATTGGTATATATAGGAGGAAAAAATACGTCAGGGGAGCCACGAGGGGCCCAGGAGGTGGGCGCGCCCCCTGCCTCATGCCCTCCTCGTTGATTCCCTGACGTGCACTCCAAGTCCCCTGAATTGCTTCCGTTCCAAAAATAACTTTCCCGAAGGTTTCAGTCCGTTTGGACTCCGTTTGATATTTCTTTTCTGCGAAACACTGAAACAAGGGAAAAACAGAAACTGGCACTGGGCTCTTGGTTAATAGGTTAGTCCCAAAAATAATATAAAAGTGTTTAATAAAGCCCATAAACATTCCAAACAGATAATATAATAGCATGGAACAATCAAAAATTATAGATACGTTGGAGACGTATCATGCGCTTGGAGTTCTGTGCTCTAAGTTTTTGGGTTGTTACCCTTGCTGCGTATGGCGCTGTAAGCCGGCTGTATGAACCGATTTCACAGGCCATGTAGCCTTGATTGTATGACTCATCATGGAGCATCTTTGGGTTTGATAACCCGCCCTGATAGCGGATGTTGAGTCGCCAAGATATCTTTGCATTGAGCAATCAAAATTATGATATTACATGCCTACGGGTCAATACCCGTGACGGATTATAATTATTGAGGTATCACCAGGATGTCAATCTCCAGGTATGTTTTTCAATAATGGTATGAATATTTTGGGTTTGGTAACCCGCCCTGGCTATGGACTTTAAGTTTCTAGAATACTTTGGATTGCGCAATTGGGATTATGCGCTTATGAATACTTGGGATGTGGCTATGTAAGCCGGCAATTTGAGCCAAATTTCTAGGTATGTTTTTAAATTGTTGGATGAATATGTGAGGTTTGATAACCCGCCCTGGCTTTGGACATTAAGTCGCCAGTATATTTTGGATTGCACCATTGGAATCATGCGCTTATAAATTATTGGATTGTTACCCTCACTGGATATGGCGATGTACGCCAGCGGTATAAATCAATCCTA
CAGGTATGTTTTCCTGGTTATATGAATATACGAGGTTTGATAACCCGCCCTAGCTTTTGACTTTAAGTCGCCAGTATGTTTAGGCTTGAATGTCCTTGCTTAGTCTTTTCGGTAATTACATAAGACTATATTATGTTTGGGTTGTTGCCCGCCCTGGCTTTTGACGTTAAGTCGCCAGGGCATATGTTGTTTAAACTGTGTAGAACATGCAGAGCTTTACACATAAGTAAGAATACTGCTATTGCTCATATGAATCATTGCGTTTAAACCCATCATCTGGCCATCTGAAGATATTGCCGGGTTATCCGGCTCCGGGCTATATTGTTCAATATTGAGTTTATTGAGGCTATGAGCTGCCAAAGTGATCTTGTCAAAAACTGGACATGATTATGAGCCGCCATGGATGGGGTTATCAATTCTTGATTTTTACAAAGGCTATAAGCCGCTGGATTGCAAAGTCCCGGATTACAATGGATGCGCATTAAGTCGCCATCGACCAAGAGCCGCCGGGTATTTAAATTCCGGATTTACTTGTCAAACAGATAAGGTATTCAAATCTTTAATAGCCAAACTTGGCTGGAGTTTCATTATAATATTGAATGATTGAGGTTTTCATACCGGATTATATGACCCGGCCGGACATGGCGCCTCACCAGAAACCCGGTTGATACTTGGCGACTCACTAGAGACCCGCCCGAACCTCAGCGACTCATTAGTAACCCGGCGGGCGGGTCAGACGATCGACAAGACCCAACGGCCCAGAAGGCGACTCGTGGGAAGGCCGGCTCGTGTTATGGTGGGCCGGCTTAAGATGAAAGGCTAAAGAATATTCTCCTAGAAAGAAAGCAAGACTAGGACTGCACTTGTAATAGAGTAGTCCTAGTCCTACTAGGACTCCACATGTAACCCGCCCCTCCAACTTAGATAAGGAGGGACAGGGCACCCCAAGAGGGACAAGTTTTCACGAGTTGGACAAGTTAGGGTTAGACAGACAAGTCTATAGCTATCGAGATAGAGCACCCTTGTAATCGTGATCATCATCATCAATATCAATGAAGCAGGATGTAGACTTTTACCTCCACCGTGAGGGCCGAACTTCGGTAAAAAACCTCGCGTCTCTCGCCCCACTCAACCCCTCTCAAGCTACCACATAGATGCGTTGGCTTCATGACTAAGTCCTCATACTAGGACATCTGCCGTGACAAATCCACGACAAGATTCAAGTGGAGGCAACATGTGGTGCACATCGAAAGTTTGGATTAGTAGTATAGCTTCGAGATGCACCACATGCTGCCTCCACTTGAACCTAATCCACCTCCATTTCACACACTGTTATGGACATAATGATATATCAACCTCATAATTGGTCCTGTATACAAATTTGTACAACGGCGTATAAATACACTAAAAGTAAAAAAATAAAAAACAGTATACTGGTAGCGCTGGACCGGAAACACGCTACTACTAGCTAGTTAGATTAGCAGTAGCGTGTGTTGCACGGGCTACTGCTAAGGAATAGCTGTAGCGCCTTACTAGTAGTGCGGTGACACGCGCTACTAGTAGATCAACGTCTTCAGTGGCATGTTCAGCAGCTGGATCTTCTCCGCGGTGGTCGGCACTACCATCGGGTTCCAGGTGATCCTCGTGGAGTTGTTGGGCACGGTTCACCTGAACGGGAGGCTGTGACTCATGAGTGTGTTGATCGGGTCGGTCAGCCTGGTTATCGGCGCCGTCCTCAAGTGCATCCCTGTTGGTTCCGGCAACGCCTCGTCCGATCGTCACGACGGATACCAGCCCATCCCCACCGGCCCTAGTGCCATGTGATTTTGAAGAAGTTTTGGTTGGTTTGTTTAGGAAAGGGGAAGATGTATGAATCTTTTAGAATCAAACTTTGCAGCTTCAGTTTTTTGTAGGAGGTACCGGAACAATTTTTTTGGATTGAGAAAACCGGACATACTTGTGGTAATGACGGTTCTGAGAAATTTAAGTTTCTATTTTTT
TTCGTTGTTTTTGTTTTGTGCTTTCTAGCCAAATAGGACTATGGATTTCCATTGTAGGATTACTATGCAATGATAAATGCAGTTGCTTACTATCTAGTATCTATACACAAATCTTCACATTTAGGGTTATACTCATGCGGGTGACATGTGATTTCTGGAAGATGTTCTTTTTATTTATTTTTCCTTTTGGAGGAAAAGAATGTAGTGTTAAATGAACTTTTAAGTACAGTTTGAGCTTTTTCCCCACTCAGGCAAATGAAGTTTCTGAAATTTTATTGTAGAATCCTTATAAACAACAAAAAAAAACTGAACCATGCAGGAGACTTACATGTACTCCCTCCATTTCAAAATATACGGTGTATTAGTTTTTTCAAAAATAAAACATGTGCAAGCTTGACCAAGGTTTAAGAAAAAATTATCAATATTTACAATACCAAATTTGTAGCATTAGATCCTTCACTAAACAAATTCATATTTTCTTTATTTGGTTTTGTAGAAGTTCATATTTTATTCTATAATCTTGGTCGAACATATATAAGTTTGACTTGCACGAACCTGATTCACCTTATATTCCGGAACGGAGGAAGTAATTCGGTAATAAAGAGATCAGTACAACGCCAAAGATGGCACAACCGTTACATCGCCAACACCATGACCAAACTACGACACTTACATCACCAACAATGGCGCAACCTAAACAACACAATGAGAATGACCCAATACAACTCGGACTAGGGCAAGCGTCCAACACCAGGCATAAAGAACAGAGAAAGATCCTCTGCAAGAGCCTGCACAATAGCCCGACACAACACTACCCCAACGACGACTACCACGTCAACGATTACTGACGTACAAGCAATACTATTTGCAGCAACATAGGCATGACGTCACGAATACAAGAGTCCACCTCAGGCTGTAAGTGGGACGCTCCGCGGGAGGCCCGCGTCCGCCCCACATCTGCCGCGTAGATTAAGTGGAATTCCCGTTAAAGCCTGCATATTATTATGTGGGATATGTGGGTTTAGTAGGATACCCACAAAATTCATACAGATGCTTCTGTTGAAAGTCAACTTGAGGTGGTGAGCTACAATGACTGGTTCGTCGGGAGCTCGAACAGCTCGTGTGCATGATGCGCACGTACAGCCGGCATGCCTTGGCCTTGCCCTAGTGCTCTTGTGCCGTCGATGGAGCCTCTTGGAGCAAGAAAGACTGCTCGCTGAAACAAACCCAACAGTTCAGATCGCTGAATCAACTACTCCCTCCGTTCGGAGTCATTTTTGTGACAAGTAATTCCGAACTGAAGGAGTAGTAACTAATAGCCATACATTTACAAGTTTTCAGTAGAGTAGCATTTATATACCAGGTTAACACCTCACACATACACAAACACAGACACAAATACAAGCGTCCATGGCTGGACGCGGCGCGGCAGCCGGTGCTGGCGATGCACGGAGACAGGCTGTCGACGTGGCCGTCCAACAGGCCGCGGCCCTCACGGACACCGACGAGCAGGCCTCGGTTCCACGGACGTCGCACACAGGAGTACGTCCTCGAGCCTGCAGGACCGTCGGCGAGCGCGCCCGGCGGCCGGAAGCTGCGACGGAGGTAGACGGCGGCACTGCGGCGCCCACGGCGGAGATGGGCGATGACGCTAGTGCGGCCATAGAGGAGGTCGACGGAGTCGCTAGGTCGTCCATGGAGGAGGTGGACGACGAGGTAGGCCGGCCATGGCTGGCGGCGACCCCTAATCCCCGCAGCGTGTCCAGATAAGTGGGTTCGATGTGGGCATCGTGGGATAACCCACATATTCCACATATTGTGGTGTATTGACCGTGGGTGTCCACGAACGCAAAATAAACGGGCCTTTAAGTGGGCACCGCGGGTGGCCCGTGTCCACCTACAGCCTGAAGTCCACCATTCCAACGCCGCCAGGCTAGCCTCCATCCAGACCATACAAGGAGAGTCATGGGGGTGGGCATGCAAAACCGGAGGGGGGCAGC
GACGACCAACCAGGGGCGCTAGCGAGGAAAAGGCGACGCTCGCGCAAAACAAACACTGACTATCACTAGCCTTCCATCAACACCAGTCACCACGGGTCTCTCTCGAACTCTCCATAGAAGACAGAACGCGAGAGGAATCCCAGAGGCGTCCGTTTTCCCGGTCCTTCCGCCGGCGACCTCGCCGCTCCTCCTCGCCTCTGATGGCCGTTTTGGCCTCAGCAGGAGGGGGGAGCTCCGGGGAAGCCCGGCCGTCTAGGTAGGTTCCAGGAGGCGCCGTTTAGATGTCGGCGGCGGCACCGTGTCAGAATAAATGTCGCCTGGCTTCAGCCGTGTTTCGTCGGAGATCTTGTCCCCGGCGAGAAGCCCATGGGTGCGTGGTTCATGTTGAGGATATGTGTTATGTGCATATTGTGTATTGGGCTGGCTTCCTAGTTCCTTGTATAATTGAGGTATGTGGCTCATCTTTGTATATCATATATACGTGCCTATGCACAAAGAGCAATACATCATGCAATTCACATATTCTATATAGTATCAGTTTTTTAGGTTCTCTCGCTTCCGCTGCCGCCGCCGTCGTGCGTCTCCTCCGCGCCGCCGCCGCCGCCGCCCGATCTCCTTGCCGCCAACAGTCAATCCACGGCCGCCGCAGCCCTCTGCCACCCGTTCGCCGACGCCAACCCTCCCGACGTCAATGACATCCGCAACCTCAACATCTTCGAGCGGGTGTCGGTTCGTCTTTCGCAGGCGAACTCCTCCTACTACACGTGGAAGACCTACTTTTCCCTCGTGTTTCGGGAGTATCATCTTGTTGATCACGTGGACGGCACCGTCGACTCCAGCCTTGTCCCCGATTTCCATGAATGGTCCACCATCGACACCACGATCATCCGATGGTTCTTCCTCACCATCTCGCCAGACCCCTTCCAGGCGGTTGTCCAAGACGGTGATGACGCATGCGCCGTGTGGACCAACCTGAACGGGCTCTTCACCGACAACAAGCTCCAGCATCGCGTTTTTTTTGCAGCAAGAGTTCTTTGGGTGTCACCAGGACAACACCTCCGTCGACGACTATTGTCGCCGCCTGAAGACTCTCACTGACGAGCTCCGCGATATTGGCGCGAAAATTGATGATGACCTCCTCCTCACCACGCTGACCGCCGGGCTCAACGAGGATTTCGGCAACGCCGCGGCGAACCTCAGTCTCATCCCCAACCCGTCCTTCGCCAAGTTCATTGTGTACCTCCGCTTGGAGGAGCAGCGGATGAAGCAGGTGAAGGCGCGGGCCATCCACACCGCCCTCGCCGCCGGCACCACCCATGGCGGGTCCTCGGCGCCTCCCGCTGCCCCGGCCGCGCCCCTGCCGCAGCGCCACCTGGCGCCGCTGCCGTACCCGGCGCCCCAGCAATCGGGGCTGCTCCCGCTGCCTTATGGGTCGCCCGCCCCTCCCGCAGAACGGCGCCGCGGGGGCCGGCGTGGTGGGGGCCACCGCGGCGGTCAGCAGCAGCAGCCGCAGGGCGCCGGCCAGCCCCGTCAGCAGCAGCAGCAGCAGTTCCAGGTGCCCCCTCCGTGGGCCTCCGGCTACAACCCGTGGACCAGTGTTGTTCATACCCACACCATGCCGGTTCCACGGGCTCCTGGACCGACCCTTCCCGTGCCGCGCCCGTCGGCGCATCAGGCGTATTACGCGGCTCCGCAGCCGTACGGAGGATACCCACTGCTGCAGCTGAGCGGCGCCTACGGTCTTCCTGCGGCCCCGCCGCCGCCCTTGCCGGCCCTGCCGCCGGCGCCTTGGGATCCGGTGCTCCTCGCTGCGCTGCACACCGCGCCTACGCCGAACAACTACACTGGAGGCGGTGATTGGTACATGGACACCGGGGCTACGGCTCACATGTTTGCTTATCCTGATAATCTTGCCTCCTTCACTCCCGTCACCACCGATCGGCGCATCATTGTCGGCGACGGTTCCACACTCCCTATCACACATGTCGGGCACACTTCTT
TTCCTTCTAATTCCATGCCTATTACTTTGTCTAACATACTACTGTCACCTCATCTTATTAAGAACCTTGTTTTCGTTCGTTGTTTAACTCGTGAAAATCCTGTTACTGTTGAATTTGATGAGCCTGGTTTTTGTGTCAAGGACGCTCGAACCAGGATGGTACTTCACCGATGTGACAGCCTCGACGAGCTCTATCCGGTGCATCCGCCGTCCACACCGGTTGCTCTCTCCGCCGGTGTCAATCTCTGGCACGCTCGTTTGGGTCATCCCAACCCAGTCACACTTCGTCATATTCTTAGGAGTTTCAGTTTCAGTTGTAATAAGATAGAGGATCACACCTGTCATGTCTGTCGTGTCGGCAAACATGTTCGCCTCCCATTTAATAACTCCACCACCATAGCTTCTTTTCCTTTTCAGTTGATTCATAGCGATGTGTGGACCTCTCCGGTTCCTAGTAATTCGGGCTATTTATATTATCTGGTTATCCTTGATGATTATTCTCACTATGTGTGGACGTTTTCTTTACGACGAAAGTCGGATGCACTCTCCACTTTGTCGGCTTTTTACTCCTATGTCAGCACGCAGTTGGGCATCCCATCCTTGCTCTTCAGACTGACCATGGAAAAGAGTTCGACAACCTTGCTTTCCGCACCTTTCTGTCGCACCACGGCACAGTTTTTCGTCTCACATGCTCGTATACTTCATAGCAGAACGGTCGAGCTGAACGCGTCCTTCGCACTCTGAACGACTGCGTTCGCACGCTCCTGTTCCATGCTAATGTGCCGCCTCGTTTCTGGCCAGACGCACTCTCTACTGCTTCAGTTCTCCTTAACCTTCGCCCTTGCCGCCCACGATGGAACTATGCACCTCACCATCTTCTCTTCGGTACGCCCCCATCTTATGACGGCTTGCGTATTTTCGGGTGCCTTTGCTATCCTAGCACTGCCGACTCCGCTCCTCACAAACTCGCACCTCGTTCTATCGCTTGCATCTTCATCGGCTACCCCTCCAACTCCAAGGGATATCGGTGCTACGATCCCGTCTCCCACCGTGTGTTCACCTCCCGGCACGTTTACTTTGATGAGCATGTGTTTCCGTTTCAACAGGTACCCCCGGCTGTTCCTCCCGCCACCAGTGACGTGGGCTCCTCGACTCCTCTCCCAGGGCGCTCACACGCCTCTCTTGGCCCGCCCCTTGGCTTTGAGGCGCGCCCCCCGCATGCAGCGGCTCCTACCGCCGCGGCACTAGCGCCCCCGACATTGGCGCCCGCGGCCCCCCTGGCGCCCCTGGCGTCCCCGGCCCCCCGGCTCCCTCGGCGCCCCCGACGCCCCCGGTGCCCGCGGCCGGTCCGGTCACCCGCGCCCGAACGGGTTTTTTTCGCCCGAGCTCGCACTACGCCTCGGATGATTACGTCCATGCGGCTGATGACCCACAAGTATCGGGGATCTATCGTAGTCCTTTCCATAAGTAAGAGTGTCGAACCCAACGAGGAGCAGAAGGAAATGATAATCAGTTTTCAGTAAAGTATTCTCTGCAAGCACTGAAATTATCGGTAACAGATAGTTTTGTGATAAGATAATTGGTAACGAGCTAGTTTTCATCACGCTCATATGATTCGCGTTCGGTACTTTGATAATTTGATATGTGGGTGTACCGGTGCTTGGGTGCTGCCCTTACTTGGACAAGCGTCCCACTTATGATTAACTCCTATTGCAAGCATCTGCAACTACAAAAGAAGTATTAAGGTAAACCTAACCATAGCATGAAACATATGGATCCAAATCAGCCCCTTACGAAGCAACGCATAAACTTGGATTTAAGCTTCTGTCACTCTAGCAACCCATCATCTACTTATTACTTCCCAATGCCTTCCTCTAGGCCCAAACAATGGTGAAGTGTCATTTAGTCCACGTTCACATGACACCACTAGAGGAGAGACAACATACATCTCATCAAAATATCAAACGAAAACCAAATTCACATGACTACTAATAGCAAGAC
TTCTCCCATGTCCTCAGGAACAAACGTAACTACTCACAAATCATATTCATGTTCATAATCAGAGGGGTATTAATATGCATTAAGGATCTGAACATATAATCTTCCACCAAGTAAACCAACAAGCATCAACTACAAGGAGTAATCAACACTACTAGCAACCTACGGGTACCAATCTCAGGCTATGAGACGAAGATTGGATACAAGAGATGAACTAGGGTTTGAGAGGAGATGGTGCTGGTGAAGATGTTGATGAAGATTGACCCCCTCCCGATGAGAGGATCGTTGGTGATGACGATGGTGATGATTTCCCCCTCCCGGAGGGAAGTTTCCCCGGCAGAACAGCTCCGCCGGAGCCCTAGATTGGTTCCGCCAAGGTTCCGCCTCGTGGCGGCGGAGTCTCGTCCCGCAAGCTTGCTTATGATTTTTTCCAGGGTAAAAGACTTCATATAGCAGAAGATGGACACCGGAGGCCTGCCAGGGGGCCCACGAGGCAGGGGGCGCGCCCAGGGGGTAGGGCGCGCCCCCCGCCCTCGTGGCCAGGGTGTTGGCCCCCTCTGGTATTTTCTTCGCTCAGTATTGTTTATAATTCCCAAAAATAACTTCCGTGGAGTTTCAGGACTTTCGGAGTTGCGCAGAATAGGTCTCTAATATTTGCTCCTTTTCCAGCCCAGAATTCCAACTGCCGGCATTCTCCCTCTTCATGTAAACCTTGTAAAATAAGAGAGAAAAGGCATAAGTATTGTGACATAATGTGTAATAACAGCCCATAATGCGATAAATATCAATATCAAAGCATGATGCAAAATGGACGTATCAGCGGCGTCCACCTCTGAGCCGTCATTGTTGCCGTCCTCTGTTCGAGCCGCTCTTCGTGACCCGCTCAGGATGGCTGCGATGCAAGAGGAGTTTGACGCCCTATTGCGCAACCGGGCGTGGCAGCTTGTTCCCTGTCCCCGGCGCGCCAACGTGATTACCGAGAAGTGGGTCTTTAAACACAAGCTCCGTCCTGATGGTACCCTTGATCGCTCTAAAGTGCGTTGGGTCGTTCGTAGCTTCCGACAACGTGCTGGCATCGACTTCACCGACACCTTCGCTCTGGTCGTCAAGCCCGGCACAATACGCACGGTTCTCCACCTTGCGGTCTCCCGTGCTTGGCCGGTGCACCAGATGGACGTCTCCAACGCCTTCCTCCATGGTCACCTCGAGGAGAAGGTCTTCTGCCAGCAGCCCACCGGGTTTGTTGACCCGGCGCTTCCCGACCACGTGTGCCCGCTTTCGCGGTCCTTGTACGGACTCAAGAAGGCTCCGCGCGCTTGGTACCAGCGCATCGCAGCGTTTCTCCACCAGCTTGGGTTCCGTTCTACCCGCTCGGACGCCTCGCTCTTCGTCTATCATCAGGGCTCTGACACGGCCTACTTGCTGCTCTATGTCGACGACATCATCCTGACGGCTTGTACGGCTGGTCTCCTCAGTCAGCTCAAGGCTCGTCTTCGCGCTGAGTTCGCCATCAAGGACTTGGGTCCTTTGCACTACTTCCTCGGTGTCGAGGTGGTGCGCCGTCCGGATGGCTTCTTCCTTCATCAGCGGAAGTACGCTCACGAACTCCTGGAGCGCGCCGGCATGCTTAACTGCAAGCCCGCCGCTACGCCTATTGATACGAAGGCCAAGCTTTCTGCCACGGATGGTTCTCCTGCTTTGGATGCCGCTTTCTATCGGTCTATCGTTGGTGCTCTCTAGTACCTCACTCTGACTCGACCGGAGATCTAGTATGTCGTGCAGTAGGTGTGTCTTCATATGCATGCTCCTCGAGACGTCCACTGGGCTGCCGTCAAGCGGATTCTCCGCTATATCTGTGGCACTATGGATCTTGGCGTCACGCTTCACGCCTCCGCCGACACCGCCCTCACCGCCTACTCCGATGCAGACTGGGCGGGCTGCCCTGACACTCGTCGCCCCACTTCGGGCTATTGTGTCTACCTTGGATCCTCACTTATCTCGTG
GTCGTCCAAGCGGCAGCCTACGGTCTCTCGTTCCAGCGCTGAGGCTGAGTATCGTGCGGTGGCCAACGTCGTCGCCGAGTGTTCGTGGCTTCGCCAGCTGCTTAAGGAGCTCCCTTCCCCTATTGACCGTGCCAGGATGGTCTACTGCGACAATGTCTCGGCGGTCTACCTCTCCGCTAACCCGGTGCATCATCGACGGACCAAGCATATTGAGTTGGATATTCATTTTGTTCAGGAACAGGTGGCCCTTGGCCTAGCCTTCTAGAGCTTGTTGCATGCCACTGTTATCTCTCAAACGAAAGAACATATAAATGTATCGCGATCCGTGCAGGTTATCAGTGACAACAGGCAAGGATCTCAAAGCAATGTTGGAGGGATGAGGATAAGAGGTTTCATATAGCTCGGCCTGCACAGGAACTTTCTGTATCTCCATTCACCGTTGTGCCGCCCTTAAATTGTTTCCGTAGGGTTCAGCCCGCGTAGAGCTTGCCGATCTGTACGGCAGTGTATCCAGCAGGGACAATATGATAAGTGGATACAGTAGCTGCATTTCCGTGTACCTCCTATACCCAACATATTGCACCAGCCACCCCAACTCATACAAGTTGTCAATTCTTCACTTTTTCATTCTTGCTAGTTTGGGTGCTACTATCTTGATAAGATGCAGACGGTCAGGAGGCTATGAGAACATGACTCCATAGAAAGGATATCCTTTATAAGAGTTGTTCAAGTTTATAATAGGAGGAGTTGGTGAGCGCATTAGATATCCATAAATTGAATCTAAAATAGAAATAAAGTCTCAAGGTTTACTACTTTCTATTCAATGGTATTTGCGTTATGTCAGTAATTTTGATGATGGGGCATTGGCAAATGCATCCATGTTGAATTTAGTGACGATTAGTCCTACCACCATAATATAGGCTACCAAGGTGAACTCGAGAGTGATTATCATAGTGGTCAACATCGCCAAATGGCGCCACTCCGTGTAAATCAACTCCCAAAACTTCGTCAGTTCCAACTCACTGCCAGCATGGTGGCCCACATGGTCGACTTTAATTGTCTCCGCATATTTCACAGGTGCACTGAAACTAACTCCATTGATTATTCACGCTCACACATTTTTGCGATGTCCTAGCACTCTCTGAGTCCATTCACATATGTTTCGATGCGTGCTGTTGATGATCGTGTAGCTACTTTAGGTGAACCTAATCATAGACACCCTCAGCGCGTTCATAATACAGCTACCAACCAATACTTCCTCTGATCACCACGATGGATACCAGTTGATCCCCACCGGACATGGACAAAGTGTCATGTGATGATATTTTAAACATGTTTTGTTCTTGCTTCTTTGTAGGAAGAAGAAGAAGAAGAAGAATCTGTGCTTTACAAATTGACTTTCCATCTTTAGTTTTTCTTCTGATATGTGACACCGGAATGGATTAAGATGGTGATTACACTTCCGACTTATTTGAGACTTTTCGATCAAAGTTTTCATCCGATGCTTTCTAGGTAACAACATATCTGAAACTTCTTAACCATGTCGGTTTCCATCAACAAAGGATTAAATGTTTCTTACATATAGACAAAAATTTCTTAGTAGAAAATTCCACCCAGAAACTCCTTCGGTTTCCATCTAGTAGTATCCTTTCTTTGGGCTTGGTTATAAGTTTTTGATGCCTCTAGAAGCAAAAGTTTAAATGAACACCTAATTTTTAGTTTGCTCATGGGAAGCATTTATAAATAATGCACTACAATCAAGAAGCACGGAAATAGTGGCTTCTGCAAGGCCGTAACTCCTACCAGCTTCTATTTTTTTGATAAAGGACATTTTATTGAATTGATATATCGAGGTGATACAATCGCATCGAAAGAATGCCCGACCTCTGCATAACTCCATGCACACAGCCAAAAAGTCCAACCGATCCAAAAAAATAAAATCGTCTTACAACTTAAAAAGATAAATTAGTCCAGCCTATGATGTGGCAGATCCTATCCGG
AGATCACACCGCCATCCATGGGGGAGAAAACCTCCCTGGCTATACGCTCCAGCCGCGTAGACGCCATCATAAAACGGTCCCTGTCCTCCGGCCTCTGCAGGATATACCAAGTACGGAGCCATCGCGTACATACATGAATAATCTGCATAGGAGATGAAACACATTTTTTATTAAAAACCACATCATTCCTGGTAAGCCACAATGCCCAACATAAGGCAGCCGCCCCCACAAGAATATGTGCACAAAATTGTTTATCAATACCCCTCAACCAGTTGCCGAACATGTTACATGCACTAGGTGGTGGGTATAAATTTGAAGCTACTCGAACTATGGCCCAAACCGCCCAAGCGAACTTACACTCAAAAAATAAGTGCTTAATAGACTCGTCGTGTTGGCAAAAGACACACGCCTTGGTGCCTTGCCAGTTGCGTCGTGCCAGATTATCTCTAGTTAAGATGACCCCTCTGTTTAGGAACCAGAGGAATATCTTCACTCTTAGAGGGATTTTAAGCTTCCACAATTTCCTGTTATTAACTGGAACATCACAATGAACCATTGCATCATACATGGATTTGACTGTAAACTTGCCATTCCGATGCAAATTCCATCAAAAGATGTCCGGTTCATCTGACGGCTGAATAGCCTCTAGACGTATGAGTAGCTCATTCCAAGCTGCCAGGCGAGGTCCTAAAAGGTCCCTACGGAAGGAAATATCAGGGTTTTCTTGTCCCAAAACTTGTTTGATGGTGACAAATTTATGTCTAACAATCCTATACAAACTCGGGTATTGCACCATGAGTGGTGTGGTCCCTAGCCAGGTGTCTTTCCAGAATCGAATCTGGGAACCGTCCCTAACCGAGAAAGTCCCAAATTGGAAAAAGAATTCCTTGGGCTTCATGACTCTAGACCAAAAATGTGAGTCACCAGTTTTCCAATGGACTTGAGAAATGGCCTTGGATTCCACGTACTTGTTACGAATGATTTCCTGCCACACTCCATTCTCAGTGAGTAGTTTATAAACCCATTTGCTGAGAAGAGCAATATTTTTAATCTCAAGGTCCTGAATTCCAAGTCCCCCTTGACTTTTAGGTCGACATAATACAGTCCACCTAGTCAGTCGATATTTCTTTGATTCATTATCACACTGCCAAAAAAATCTAGATCTAAAGTAATCGAGACGCTGAAGAACCCCTTTCGGTAGATGGAAGAACAACAACATATATAAAACCATGTTGCTGAGGACGGAATTGATCAAGATCAATCGCCCCCCATATGACAAGAGTTTGGCTTTCCAACTGGCTAGCCGTTTCTCAAGTCTCTCTTCCACGTGCTTCCACTCAGCGATAGTTAAACGCCGATAGTGTATGGGAATACCCAGATACCGAATCGGGAACTGCCCGAGCTGGCATCCAAAAATGTCAACATACTTAGGTGCATATTCTGCAGCATCCCCGAAGCAAAAAAGTTTGCTCTTATGAAAATTAATTTTGAGGCCAGAAAGTTCCTCAAATGCACATAAAAGCAGCTTGAGATTTCTTGCTTTATCTAGATCATGATCCAAGAAAAGTATCGTGTCATCTGCATATTGTAGGATAGATAAACCCTCTTCTACCAAATGAGGAATGACACCGCTAACCTGACCGGCCACCTTAGCCCGCTCAACAAGGGTAGCTAACATGTCAGCCACAATGTTAAACAAAATGGGTGATGCGGGGTCCCCTTGGCGAAGCCCCTTCCTTGTCTGGAAATAGTTGCCAACCTCATCATTAACTTTGATGGCCACACTACCTCCAGAAACAAAACTCTCAACCCATCGACACCATTTTGGTGAAAACCCCTTCATGCGTAAAGTTTTCAACAGAAAGGGCCATTTAACTTTATCATAGGCTTTTTCGAAATCTATTTTAAAGATCACTCCATTCAACTTTTTGCGGTGAAGCTCATGTACCGTTTCATGCAGCACAACCACACCATCTAGTATGTTGCGTCCTTGCATGAAT
GCTGTTTGAGTGGGCTTGACGACATGATCAGCCACCCCGTTCAACCGGTTAGTTGCGACATTCGTAAAGATTTTGAAGCTTACATTGAGAAGGCAAATCGGTCGATATTGTTGAATACGACTGGCCTCCTTAATCTTAGGCAGTAGGATAATCTCCCCAAAGTTTAAGCGGGAAATATCAAGGTCTTCGGTATGCAGTTGGTTAAGCAACTGAACCAAGTCCGCCTTGATCACATCCCAAAAGCATTGATAAAACTCTGCCGGAAAACCATCCGGTCCCGGAGCCTTGTTGTGTTCCATTTGAAACACCGCGGTTCGAATTTCCTCTTCAGAAAACGGAGATGTTAAGAATTCATTTTCCGCTTTCGAAACTTGAGGGATGTCATTTTCCTACCAGCTTTTATACCCTTGTTACATGAATGCTCTAAAAGTTGCTCTGACTTGTTGTATGTATACCTAAAATTCCATTACTACATATATAGACATGTTTATGATTAATTTGCCACCTTCCTTGTTGGCCCGTCATCCGTCAACCAGGTTGCAACCCCAACCTCCCTCCTTTCCCTCCAACTCAATTCACTGTTGCACACCACCCTTGAATTGTTTCCATGTAGTACAACCCACACATAATGGATTAGCAACAATATGCTAAGTCACTACAAAACACACGATTGTTAGTAACAAAAATCCTCATGACGGGAAAGGAACTGTCACCTAAAATCATTTTCCGTGATGGTGGTTGTCACAAACTAATGCCGGCCCGGGCATCTTAGGTGATGGTCCGGTCTGATTTTAGGTGACGCTTTCCAGTGTCACAAGACATATGCATGTTCGGTGAAGATTTTTAGTGTCACCAATATCTTGGATGGGTTAGTGAAGGAAATATATAAATAGAAAAAAATTGGTCTATGAAATTCGAACTCGTGACCTCCCACATTTGTGCATGTAGGACTCAAAGTTTGGTCGCTAGGCTAGTGTTTAATTAGTGATAATACTTTGTAGCTCTATTTTTAGTATGTAGAATGGGACTACATGTACATTTCAATGAAATAAATAAAACAAAAAACACCTTACCTTGAGACTAGTCTAATTAAAAAGAAGACCCCACATGTCATGTCTTATTTTGAAACCTCCAAAGGAAAAATAGGTGTTATTAATGAGGCCTCAACCATGGCCATGGGCCTCATGTGAAGAGAGAGAGGTTTATTACTGGGCTAGTGTTTTATGAGTGGTAACTTTGCAGCTCAATTCTTTTGTAGTATTTCCAATGGCACTACATGTGCATTTCCGTGAAAAATAAAAAAAATCGTGTTCACTTGAAACTATTCTAATTAAAAAGTGGACCCCATCTGTCTTGTTTTATTTGAAAAGTAGGTGCTACATATGGGATTTGAACCCTTGTCATGGGACTCATGTGGAGAGACAAAACACTAGCCATTTTATATATGTTGCCTTGGTGTTGAAATAAATGAAGTTGCCCTACTTGGGTGCATATGTTACTAAGACGTGCAGGGTTTCGGCCTCAAGGCGGCTTCAAAATGAAAAAGTTCTCAGCATGAAAGTTTTTCGCCTCGTCGAAGCGAACAACATAGCTTTTTCATCACCTTAATCTGGTATCACATGCAATCTCCACAGCCGATACAATGTGAAAACTTTTGACCTATGTGAAATTCTGGACACACTTGTCCGAATTTGAAAAACATTTGCTTACACGATATCGATACTTTTGCATGTGCTCATCTCATGGCTTAGGAGATAGGTGAAAAGTCACATGAGAGTTACTAAAACTCTCAATGTACTTTTCTTTGACTGGGTGGATCTACTAGGATGTTTCTTAGACATTCAAGACAAATTATGATGTTTCCAATAACCAATTGTTCTGTTTGTACATGTAACTTTAAAAATGGACTGGACCATGTACTTCATCATTACTACTGATAAATTTAGCTTCATATTGCCATTTGTCAAGTCATACAATGATTTTCCTACTTTTTAAATGTC
TAAAAATGAGTACGTTAAGCACAATGTAAAAATGTTTATAAACCATGAACTAAACCATGTATTACAGATACTTTCTAGTTTTGATATTTTTCTAGATCTCAATTTCAATTTTAAGGCTTTAAATGCATTTTCTATGCATTTTTCATCAAAAATAGCAACCACCCAAGTTCTGATAAAAAATGTGAACATTTGCATCGACTGATATTATTCGTTTAGGATATAGGTGAAAAGTTTGGTGATATTTAAAAGTAATCTTGTACTTTGCTTTGTAATGGGTCGATCTACTAGGATAATTCTTAGACATTCAAGTCAAATTATGAGGTTACTAATGAAAAATGATTTTATATGTACATGTAACTTTATTTTATAGTGGACCATGCCATGAAGTTCATCGATAGTATTGAGAAACTTAACTTCATATTGCCACTTGTCATAGTCACAATTTCTTTGTCCTACTTCACAAATACTTAGAAATCGGTACCTTGTGAAGCACCTTGCACGGATATTTATCCAACATGTTCTAGACTTTTTGTACATGAACTAAACAACAAATTAGAGATAATTTGAAATTTATGGTTTTTAGATCCCATTTGCTACATTTTAGAAATGAAATGCACTCTTTGGTTTTTTAGTCAGAAAACAGAAACCAACCAAAAACTGCTCGAAAAGTGGTAAACTTTGCATGGGATCATGTACGGGTTTAGGAGTTAGGCGATAAAGTCTCACAAGATTTGACAAAAGTTTCCTTCTTCTTTGCTTTGTAATGGGTGGATCTGCTAGGATATTCCTTAGACATTGAGGTCAAACTATGATATTTTAATGTCATATCATTTTATATGTACATGCAACTTTAAAAATTGACTAGACCATATAGTTCATCGAGAGTATGAGAAATTTAACTTCATATTGCCACTTGTCATGTCATAATATATCTTTCCTACTTTGCAAATACTTACAAATAGATACATTGTGGAGCACCTTGTATTAATATTTATCCATCATGCTCTACACTTAAAAAAATGGACTGGACCATGAACTTTACCATTAGTCTTTTTCAAGATGCTCCACATCATTAGACTTTACCATTAGTCTTGAAAGACATAACTTCATATTATCACTATCATGTCATAATATGTTTTTTTGTACTTCGTAGATGCCTAAAACCTAGTACCTTGTGGAGCACCTTTCAAAAGTATCCATATGAAACACTCATCTGCCTTCAAGCATCTTCCTATGCCTTCACGCGTCCGCCTCTCTCATCTTCCTCTGCCTTCGTGTATGAGAGCCTGAGCCTCCAGCCTAGCCTTTCCTCCTTCACCTCTTCATGTGTTCGTCCACCGGGAGAAGGATCTCACCCACGGATCTGGCGCTCTTGTTCAAATCCAGCTAGGAGAGGCCTCGGGCCACATGCCGGCGAGGTCCCCTACTTTGTGCGGCAGGGTTGGCATCATCCTCGCCATATCCATCTCCACCATCCCTCCTCTCTCACCGTCACTTCATCACCGGCGTCCTGATCCTCAACAACAGCTTGTAGGATCTGGCACCAGGGCATGGAAGTTTCCATCTCATGAGGCCATGGGCTCCGTGTTCAGCGGTGCGGCAACAGTCGGCGTGACAAAAATGGCCTCTCGGGTGCGTGTGGATCTACATGCGGAGCTTGACAAGTTGACATCCAGTGGTCACACCATGCCTGAGATGCGCCATTCAATGGTCGTCCGGTGCAGGAAACACAATGGGCCGGCGAGGAGTTTTGATTTTGTTGGCTTTGGTATTTGGTATTTTCTCCATGTATAAACCAATGGTCAACTTATTTATTCAATGATTCTTCATATTATACATATATATATATATATATATATATATATGAATGGAATGGTATGTATTAGGCGAATTGCATCATGTCACTAGCCAGGTAAAAGAGCATACTTTTTTGTTTTGTGAATTGTTTACTGATGGCGTGCTGTCAATAAGTGCACATCATAGGCATGTGTGCTCATTTG
TGATGGTAAGATTAAAGGCACACCACCAATATTCCTATTAGTAGTGGCGTGGAGGTTGGAGGCACACCACCAATATGTAAAATACTGATGGCAAGTGGGCCACATGCCACCAACAACCACTTATCAGTGGCGTCATATCGGTGGCTAAGGCCGTGGGGCCCCTATGCCACTAAAGTAGTTTTTGGCATGCCATTAGTAGGGTTTTCTATAGTAGTGACAATTTTTCATGCAATAGTCATACAACTCATGGGTTGGTGTGGGGCGTGCTGATGGGTTGTTGTAGCGTTGTGAACCATGGGCTAGGAACAACCCAACAAAAAATAGCGCGCGAAAGAAGAGAGAAAGTTCTGGTTGCATGCTTCATGGGCCGGCCCATTATGCGGTTTTCCTGTGTCTTTTTCTAGCCGGTTATGGGAACGTTTTATATCCTCCCCTAAACCGTTTTTTTTTTCACCTTTTCACTTGTTTCTTCCATTTTATTTTTTATTATTAGCATTTTTATTTTTAAATTCATGAATATTAATGTGTTTTTTCTTTCGGTTTTTTTGATTTCTTTCTTTCCACCAATTTTTCCTATTCAGTTTTTCCATTTTCAAATTCCGAAGAATTTTTGAAATTAGCAAACCTTTTTGAATTCATGAATATTTTCTAAAATTCACAAACATTTTTTAAAATTCTCTTGCTTTTATAAATTTGTGAACATTTTTTCACTCAACGAACATTTTTCATTATTTGGGAACAATTTCAAAATTCATGAAGATTTTTCAAATTTGCAAGCTTTTTCGAAATCCATGTAAATTTTCAAATTCATGAACACTTTTTTGAATTTATGAACAAATTTTGAATTGGAGAACATTTTGTTTGAAATTAATGACCTTTTTGTATTCCTGGATAGTTTTTGAAATTCATGAACAATTTTCAAATCATCATTATTTTTGAAATTAGGAAAAAAAATAGATTCATGATATTCTTTGAATTTTGACCGTTTTAAGACTTCATGGACATTTTATGAAAACCCTAGAGATTTTTTAAATCATGGACTTTTCTCGAAAGTCAGAACATTTTTTAAATCCTCAAAAAATTTGAAATTGAGAACTGTTTGTGAAATTTCAAATATTTTTAAAAATTATTCATGAAAAAATTGAATAAAAAGAAAAAACAAAAAAAGAAAGAACAAAAATGAAATAAGACAAGAGCGGCCAGGCCGCACATGAGCTGGCCTAATGCGCGATGGGTGAGCTGTGGGGTGCGCGATTTGTGGCTATCTGCCGACGCACACGACAAATACAAGCTCCTGTTTGGGCCATCCTTTTTCGAGCTATTTTGGTCCTGGTTTTCCCAAAAGGAAGAGAGGAAAGAAAAGGAAATGAGCGAACGGCCCAAGAGAAAATTCAAAAGAGGGAAGAAAGCGTTCTGGCCATGGTATATGTGGCATGGTTCGTTGAGGTTTAAAAGATGAAACAATAATAAAATAAAAATGGCCTCGAAAAATATGATTAAATTAAACTAAACATGAAGATTCCAATAAAATAGCAGTTAGGGTCAGCAACCAACTTAGGGTGCTTAGGAAATACTTTTAGCTACCATCAAGGATCTGGTTCAAAAACCTTAAATCATGCCACGAGGTGACCTGGTTGTCCAGGACTCTTTTTTCAGTCTACAGCCTGACCATGTCTATGGTGCCCTCTAAGATTAGCAGATGCGGAAATTTTCCTTCCTAATGTGTCTCATCCCCATCATGTATGGAGGCCACCGTCTATCATTATCTCCCCTTATTTCCTTTGAGTCTCCTATCTTGATTCATTCCTATTAGGAGGGGTTCCTATTACCCATGTGTTACCTGTTAAGATGTGGTATGTGGATTGTGTATGTAAAACGGTGGTCACTACATAGCACACATATTCACACAAAATGTCTATCTACACAAATAATGTAATTACCCACACAATTGCCTAGACATCACTATTTATACCAAGAGCACTAGCTACCAGTTTCAATAC
TATAGATGAAGTTCTATAATTGGTAGCAGGGCTAGGCCCACCTACCCAACAACCTAAGAGATTCTTTTCGAGCCTCGTAATAATTGTAGTTCAATTACGTTCTTGTACAATGTTGCATCTAATTCTCCCTTCTCGTATTTTATTAACAAACCATTTGCTAATTTCAATTCAATGGCTGAAAAACAGGATCAACTCATCATGGAAAGAAAATAACTCTATCGGGCCATGATGTGCACGCTGGTTAATTAAGCCTTCAAACACTTTTGTGCACTCATCAATAGATTCGAAAATAACTAAAGGCATGCCCATGCTTGAAATACTGCTCGCATCGCCGGAGGGGTGGGGGTTGAGGCGGCTCAGGTGAAACCCTAGCTGCCCCCACCATGTCACCTCCTTTCCTCACCTCCATCGTCACCTTCAAATGACGCAAGTGGGCAATGTCCTCTCGGCCGGCGATAATGGCGGTGATGCCTTCATGTGCGGTAATCTCTCGCACAAGGAGCTCTCCAGTCATGCGGTGCGGTGATCTCAGAGGTTGTGACATATTCAATGGAGCTTGGGTGTCGCAGCAACATCCCGGGGTGCCCTAAGTTGTTGTGATGCCACTATGTTGTGTCGGAGGCGGCCGTTGGCGCGGGAGGCCGCGTGTGATGATGGGCCTTTGTGCTTTGATCTGGCAACGGCACCTCGTGGACTAGTCGGTAGTGGCAACAACAAAGCGACAACGGTGGCGGTGACACAAACACATGCATAGGAAGGTCGGGGTGATGCGGCTAAGGCTTGTCGCAACCACAAAGTTGTCGCCATGTCTCTGCACTATTGTCCCCGTCTCCTCAGCACCTGATTTTTGAAGCAAGTGCGCGTAAGAAGGATTCTGGTGATGTTTGGCTCTCTCTGTTTTGTGAGAGTTTTATGCTCGCATGCACAGATTCGATCATGTGGTGATATCTACGCTAAGGATGTGCACACGAGCGGCTACCTTTGAGCGTGAGTTCCATCAAATGGTTGGGATATTGATTTTCGTTACCATGGTGTGTCGATATCTTTCCATGCAGTTTCTTCTTCGGCAAAGGGTTGTCTGCAACACATGGTGTCTTTGGATTGGTGCACTACAAAAAAAAGACACATCCGTGATGATACGCCTTTGTCAGGGTAGATCACATTTTCTGTCACTCATGTATATCCGTGACGGTTTTATGAAAAATCATGATAGCCATACTTGTGCTGTCGAGGATGTGTTACATGACAAAATCACTTTATTATCATGGAACTGTCCACTTCCATGAGATTAAGGGCCTGTACTGAAGTCCTCCCACTCCACGCTTCTCCAACTTCAGATGTGGAGTCGGACAGAACGTTTGAGCTCCGTGGAGTCAGCTTTAGGGCTTGTTTGGGACTGCTCCGCTTCACTAAAATCAGTTTCACTCCATCAAATTCACTTTAGAGCAGTTTCATACAGAAGTTATGCATACCAAAGAGAATGTTTGGCTTCCATGTAGCTCCAGCTTCAAGAATGGAAAATTTGGTGAAAAGGAAATATTTGATTGGATGAGAGGGGAGAAACGAAGGGGTATCCACTTACTGGTGGCAGTGGTGGGTAATTTCCCCCCAACTCCAGCTTCTAGAGTTTTTTGAAGCACCCCCTCAAGAGCTTCATAAAAAACTGGGAGTTGTACCCCAGATTCTAGTTTTTTTGTGAGCGGCATATCGTGGAGCTACCCTGTTTGGCTAATGTTTTCTGAAGCGTAGCTGAATTTTAAGAAGCAGAGCAGTCCCAAACAGGCTCTTAAGAAGCGGTACAAGTCTGTAGTGCAAATTTCTGAAGCTGCTAAAGCCCAGCTTCACAAAACAAAGAAGCGAGGAGCTCCTACTAATTACAAGAGGATGCCACCGCGAAGTATAGAAAACGATTCGCGAAACGGCTCCCAGCCGCTCGTGGTATGCTCGCCTCGCTAGTTTCCTGTGCGAGCGCACGTGGCCAGCCCTCCTCCACACAACGA
TACAAGGTGGACTGCCTCCATCCGGCCCAAACTGGCACCCAACAGGCTCCCAGCTAGGACAAATCGTGAAGAGAAGCTACAAACACTGTTGAACGAATGGAATCGCCAGGTGAAGTTCGAAGCAAGCTCCAGAAGCTGGTTTTGTGGAGTTTGAGAAGCCCAAAGAGGTTCAGAATAGGCTCTAAATAGCACATCATAATTATATTCGTGAAGGGTTACCAAAATCTGGCAGTGATATGTCTCCAACGTATCTATAATTTTTTACTGTTCCATGATGTTATATTATCATTATTGGATGCTTTACAATTATTTTATAGCAACTTTATGTCATTTTTTGGGACTAACCTATTGACATAGTGCCCAGTGCCAGTTGCTGTTTTTTGCTTGTTTTGTACTTCGCATGAAATCAATATCAAACAGAGTCCAAACACAGCGAAACTTTTTCGAGAATTTTTATGGACCAGAACACCCAGGATGGGCCAGAGAAGTACTAGAGGGGTGCCCTGAGGGGGGCACAACCCACCTGGACGCGCCTGGGGGCCCAGGCGCACCCTGGTGGGTTGTGCCCACCTCGGTGGCCCCCCACACTTCCTCTTCGCCCTATAAATTGTCAAATATTAAAAAACCAAGGGTACCCCCTAGATCGGAAGTTCCGCCGCCGCAAGGCTCTGTAGCCACGAAAAACCAATCTAGACCCCGTTCCAGCACTCCGCCGGAGGGGAAATCATCACCGGTGGCCATCTTCATCATCCCGGCGGCCACCATGATGAGGAGGAAGTAGTCCACCCTCGGGGCTGAGGGTTTGTACCAGTAGCTATGTGTTTAATCTATCTCTCTCTCGTTCGCTCGCTCTCTCTCTCTCTCCCCCTCTCGTGTTCTTGAGATGGCATGATCTTGATGTATCGCGGGCTTTGTTAATATAGTTGGATCATATGGTATTTCTCCCTCTCTATCCTGTTGTGATGAATTGAATTTTCCCTTTGAGATTTTGTTTTATCGGATTGAATACTTTTATGGATTTGAGAGCACTTGATATATGTCTTGCATATGAATACTCGTGGTGACAATGGGGTATTATATTGATTCAATTGAGATATGTTTTGGCACTCAACTCGTGGATTCTCGAGGTGACATTGGGGTAATCTATGCATAGGGGTTGATGCACGTTCTCGTCTTTTGTTTCTCCGGTAGAAATCTTGGGGCACTCTTTGAGGTTCTTTGTGTTGGATTGAGTATTATGAATCTGAATTTGCTTTGGTGTTATTTTAGTACGAACTCTTGATAGATCGATCGGAAAGAATAACTTAATGTCATTTTAGTACGAACTCTTGATAGATCGGTCGGAAAGAATAACTTGGTGTTATTTTAATACGAAGTCTTGGATAGATTGATCGGAAAGAATAGCTACAAACAATTTTTTTCTTATGTTCCCCGCTAGATAAGAACTTTGGAGTGATTCTTCATCACACGTTGAGGGATGGTTATATGATCCAACTAGATTAGCATTGTTGAAAGATTGCACTAGCTAAAGTACGGACCCTAGGCCTCATTTTCAAGCATTGCAATACCGTTTGTGCTCCGTTTTATCAATTGCTACTTTGCTGTTTTTTATTGTTCCTATTATAAAAAACCAATATCTACTATCATTACTACGCTTTTATTACCATCTCTTCGCCTAACTAGTGCACCTATAAAAATTACCATTATATTTGGTGTGTTGGGGACACAAGAGACTCTTTGTTATTTGGTTGCAGAGTTGTTTGAGAGAGACCATCTTCATCCTACGCCTCCCACGGATTGATAAACCTTAGGTCATCCACTTGAGGGGAAATTGCTACTGTCCTACAAAACTTTGCGCTTGGAGGCCCAACACGACTCTACAAGAACAAGTTGTGTAGTAGACATCAGGCAGCAACTGTAATGGGTCATCACTAAGCTATCAGGTGCGGGTTCCAGATCCAATACCAGTTAACAACCCCGACCAATGACAAATTTCCACA
TGTTGGCTTCTCATTTGTCAACGGAGCCACGCGTCAACTCTTCCTTGTGATAGGTGTCACTCATCCAACGGATGATATGCGCCTATGAAACGAAGACACATGGCATGGCCCAACATTGGCCAGTTATAATGGCCAGCCCAGTAGGAGGCCCACAAGATTTGGGCACAACTTAGCGGGTCAGCCCACTAACAACCCTCTTGCAGATAGCTCAATTACAACTCTAGTCCATACATCCTAGTGACAATTCGGTGCGTCACCGCCCCGTTGGGTCTTCAGCATCATTACGACCCTTTGGTAGTTCTGGCCCATTAACAACCAGCTTTGTCTTTGGCCCAATTATGACCCATTGTGTCTTCCAGCCTATTAAAGGCATGTGGTAGACTCAGACTCATTTGCTGCCCAATGTTTCTTTCGGCCTGTTAGCGGCTCGTGGTGGAATTGAACCGTTTTCTATGTGATGTGTCTTTCGGCCTATTAATGGCCTAGGGTACACTTGGGCCCATTTACAACCCGATGTGTCTTTCGGTCTGTTAATGGACCAAGGTACACTTGGGCCCATTTGTTTTCCGAAGTGACTTTCGGCCTGTTAAATACACATGGTATATTTTGGCTCATTAATAACATGAGTTGGCTTTTGGACTATTAATTGTTTGTGATGTAGTTTGGCCAATTAAGGCCTGATTTCATTATCGGCTTGTTAATTGTCCGTTGTCTTGTTGGTACGATATGCCTTTTGGACTGTTAAAGGCCCGTGGTATCTTCTGGCGCATTTTAACAACCCATGGTGTGTTTGGGCTAAATGTGGCCCGAGGTTTATTCGGCCTGTTCACAGGTACTGGTGCGTTTGGTCCGGCCATACATTTCGGCTTGCTAATAGTTCAAACTGATTATGGGCTCATTTAAATCCCATAGACCGTGTCGGCCCATGAATGGCTCGTGATGATTTTGGCCAAGTTAGATTGACCGATACTATTTTGTAGTTGCGTTAGGACAATTCGAACTGATTATGGGCCCATTTAAAGCTCCCGCTTCAAGTTCATGCGATAGCACATCGACCTTCTGATTGTTAGGTTACCAAAATTGTGGTGCTCGTGCCCTGGTTTGTGTGTTTAGCTCTTTCTGATTTGTCTTCTGATTTGTTTCTATTGGTGGGAGGGATGCAAACTCGATAATGGCAATGGCGGTCATTCACCGGGGTGATAATGTTCTCAGTTTTATGTTTGTTGTCATATTTCTTAGATTTTGAATTTCGTGATGGTGATTACTCAATAGTTTTTTAGTTCGTTAATCATTTACTGATAATTTTTCAGTCCCATTTAGCATATTAGTTTGTAAGATGATTAATAGTTTTTCACATTTTCTTATTTCAGTCTGTGTTCAGTTCATCAATTATCAGTTAAACTAGATTTCAGTTTGTAGTGTTTTACTTTTGATTTTTAGTCTTTGTTTATTTTTGAGTCTTAATTTTTCAGGCTTGTATGTCTATGTCTTAGTCATAGTTCTTTTTTCAGTTAGCAAGCTGATGAATAGTCAGTTAGTTTTCAATTTAGGTCATTAGTCATTACTTATTAGCCATGTTTAGTCATCTATTAGTTAGTTCATCAGTATCTTCAGTTAGTCAAGTGTGTTCAAATTATCAGCTCATTTCATTTAATCTAACCTTCACTCGTTGTATAGGTTATCATTGTATTTATTTTCAGTCTTTCATCTTCTTCGAGTTGATCAGTCCATATTGTCTCCCTTAATAGTTAAGTTATTTAGTCATCTATCAATTACACTGGTAGAAAATGGGCCTTTAGTCCCGGTTCGCAAAGGCCTTTAGTCCCGGCTGTGCAACCGGGACTAAATATGCGCGACTAAAGACCCCCCCCCTTTAGTCGCGCCTCTTACGAACCGCGACTAAAGGCCCGTCCACGTGGGCGCCAGGGGTCCGTCGGGGCGGAGGACCTTTAGTCCCGGTTCTCGTGGCTAACCGGGACTAAAGGCCCGTCCACGTGGGC
GCCAGGGGTCCGTCGGGGAGGAGGACCTTTAGTCCCGGTTCTCGTGGCTAACCAGGACTAAAGGCCTCCTCCGCAGGTTTAGGGTTTTAGCCCCCCTAAACCTGGTTTCTTTTTAATTTGTAGTGTTTTATTTCTTTTATATTTTATTTTGTGTTTTATTTTAATTTTGATGAAGTTTCAGTACACATATTCTACGCTACTATATACATGCATATGAAATTTCAAACAAGAAGAATTCAAGAGGAATATATAATATATATTCAATCTCGGGTGACCATATACAACTTCGAACAAGTTTCCATACACAATTAGGATGGATGACCATATACAACTTCGAACAAGTTTAAATCTCGGGTATGCATATAAATTTCTTCGTCCTCGGTATAGTGTTCTCCTTTAGGATTGATGACTTCCCTCATGAAAAATCCTGCTAATTCATCTTGAATTGGTCGGAAGCGAGCTTCTGGACTAAGCCTCCTCCGCAAGTTATCCGTCGCCTTCCGCACGCTATCCGATGCCTTCCGCTCAGAGGTGTGTCTCCGGATGTTCTCACAAACATAGTATCCACATAGATTGGTCCCCGGTGGCTGCTTATCCACACTAACTAACCTTCTAAAATCTAGCTCATGTTTGAATTCACCGACAATTTCTTCTGAGAACTGTCTCCAAACCCTACAGGGCAAAGAAAATTAAATGAACAAGGGAGTTATTAGTTACTTGATATTAGGAAATGAACGAAAGAGACCGATCGATATAGAGCTCAAATGATTGAAAATAATTACTTTTGCAGCAGTTTTCTCATGTCGGCCCAACGCTTTGGATCCGAATCCATAGAGTCCATGATTAGAACTCTGGAGGTGTGAAGTTCAATATTTAGCAGAATCCAGTGGAACCTGCGGACACGTTACATGCACAGTCATGCATAACTCATCGATTAGACATACCATGCATGGAGTAAACACAAGAGAATGGGCACAAGAGAGAAACACTCACCCAAAATGGTAAGGAAATAGAATATGACTTTTGAGTTGATGCTTTCTAAGAAACTTGTACAAGTCTTTCTCCACGTCTTCGGGGTGATTTTGTAACACATGTCCATTAACGATATGTGGGTCAATGAACCCAACATCATGGATGTTTCTTATTTTGCATTCCCAAATCTTCAATCTGCATAATAGCGTACGCAACAATATAGTTAGGACAATATATATATATATATATATATATATATANNNNNNNNNNCAACGCTTTGGATCCGAATCCATAGAGTCCATGATTAGAACTCTGGAGGTGTGAAGTTCAATATTTAGCAGAATCCAGTGGAACCTGCGGACACGTTACATGCACAGTCATGCATAACTCATCGATTAGACATACCATGCATGGAGTAAACAAAAGAGAATGGGCACAAGAGAGAAACACTCACCCAAAATGGTAAGGAAATAGAATATGACTTTTGAGTTGATGCTTTCTAAGAAACTTGTACAAGTCTTTCTCCACGTCTTCGGGGTGATTTTGTAAGACATGTCCATTAACGATATGTGGGTCAATGAACCCAACATCATGGATGTTTCTTATTTTGCATTCCCAAATCTTCAATCTGCATAATAGCGTACGCAACAATATAGTTAGGACAATATATATATATATATATATATATATATATATATATATATATATATATATATTTATTTATTTATTTATTTATAGTGCAGGCAATGAAGAACGAGATGAGGTAGAAATAAATCACTTACAGAACGTAGCAACTCAGCATAGATTTGTCGAGGTCGCGCAGATTGAACAGCTGGAACAATTCACTCATATGAACTTGTACAGAGTACCGTTTGGTGTGATGCTCCTCTGTAACATCCGCATAAACATATTCTTTGTCGGCCCATGTTATGAATTGCTTGTACCAACGTAGCAGATTTCGCATTTGTGGTGGTAGACTCTTTTCCCGCGCAGGCTCGACGAGAGGCCCATTCCGCACATATTGTAAT
GCTATCTCACATACTGGCGCATCCTCAAGGCCTAAGAAGGCACGAAGAGTCAAACCCATCTCGGACGCTTGTTTCATGGCACTCGCTACAGTCAATCCAAGTGCTGCCGCAGCTGCTATGATCTCGGGGTCCTCTTNNNNNNNNNNCACTCACCCAAAATGGTAAGGAAATAGAATATGACTTTTGAGTTGATGCTTTCTAAGAAACTTGTACAAGTCTTTCTCCACGTCTTCGGGGTGATTTTGTAACACATGTCCATTAACGATATGTGGGTCAATGAACCCAACATCATGGATGTTTCTTATTTTGCATTCCCAAATCTTCAATCTGCATAATAGCGTACGCAACAATATAGTTAGGACAATATATATATATATATATATATATATATATATATATATATATATATATATAGTGCAGGCAATGAAGAACGAGATGAGGTAGAAATAAATCACTTACAGAACGTAGCAACTCAGCATAGATTTGTCGAGCTCGCGCAGATTGAACAGCTGGAACAATTCACTCATATGAACTTGTACAGAGTACCGTTTGGTGTGATGCTCCTCTGTAACATCCGCATAAACATATTCTTTGCCGGCCCATGTTATGAATTGCTTGTACCAACGTAGCAGATTTCGCATTTGTGGTGGTAGACTCTTTTCCCGCGCAGGCTCGACGAGAGGCCCATTCCGCACATATTGTAATGCTATCTCACATACTAGCGCATCCTCAACGCCTAAGAAGGCACGAAGAGTCAAACCCATCTCGGACGCTTGTTTCATGGCACTCGCTACAGTCAATCCAAGTGCTGCCGCAGCTGCTATGATCTCGGGGTCCTCTTCCGGACCGGCTTTCACTATGAGCGGGGGGATCGATTGTTTATTCTGCATCCCGAGCTGGTCAACTTGTTTCCCGCTTTTTTTACTTTCTTCTTTCTCCTCCTTCAATATTTTTGCTTGCCTACGAAGTTCATGTCCATAGTCGTCAGGCATATTCAGCTCGGCTTGGGACGGTGTCGTCAAAAAATCCTTAGCCCACTTCTTTTGCTTCTCAGTGAATACTTGCTTGGGCTCAGGCTCTTTTATCGCCTTCATATCCGCCTTCCATTTCTCATAATGAGCAGACGCGGCCAATTTGGTTTCAGCTTCACTAAGTTCCCAAGGCCTTGGGAGGAGAGGCTTCAGTGATGGCTCCGGTACCCTTGTGGTCTTAGGTACATAAGGGTCCGGGTTAATAGTCCAGGAGCGGGTTTCCTTGCTATCCGCCTGCTTCTGCTTCTTCGCCGGAGGTGGATTGGGGGGCGTCGTACCCGCCGGAGGAGGATTGGCGGGCGTCGTACCCGCCGGAGGTTGTGGATCGGGGGACGGCGTCGAATGGCGTGAAGGAGGTGTAGGTGAACCACCACGACCACCACCACCGCCACCACCACCACCACCACCATCGGAGGGGGGTGGACTTGTTAGCCTTGGCGCCTCGCCTGGAAACACTATGTACTTCTTTTTCCATAGAATGATCTGGCGCTTGACATCTCCAAGTCTTCTCTCTCCTTCGGGTGTAGCTTTGTCAATCTCCAGGTCCTCAAACCCTTGGACTATGTATTCCACCGTGACACGAGCATAGCCATATGCAATGGGGTTGTTGTGGTGGAGTGCTCCAGGTGTACAGGGTAAAGCACTGCCGCTAGCTACCTTCGTGGAAACGTTCCCCACGGGATAATGCAGATCACATTCTTTCATCTCCTTTACATCATCCACGGGGTAGTGAGGCTCCGGTGCACGAATCTCGATCATCAGTGCACTAGCACCAGGCGGGGCATCCGTGGAAGCCACGCTGCTTCTCCGCTACTGGCTTCCGCGATCCGCTTCATGATCTTCATGCGGCCCTGCAGCCGATTTTTCTTTTACTAGTTCATGCACGGTCGGCTTCAACTCATGGAGTTCCGATGCAAACTTCGCCATAAGATCTGCATCCCGGTCCGTCTTTCTCTTACGGCTTCTGTA
ACAGTACGGGTCATTGTCCTGGGAAAACCCTACTTTCCACGGAACTTTGCCTTTGCCTCGTACACGTCCTCCGTGTTCATCATTCCCGAGGGCTGTTGTCAGTGCGTCTTTCTCTCTGTTGAACTTGATCAAGCCCTCTTGAGCTTGGATCATTGCGTCAATAAGGGCTTGGGTGGGAGCAAACTTTTTCTTCCGGTGAACACACAACCCTGTCTCCGGGTCTAGTGATCCCCCATGCCCGTACCACCAGCTTTTGGCCCTTGGGTCCCATCCCTCTGTACCTAGAGGGATTCCTCGCACCCTCAGGTCCTCCTCCATCTTCTGCCACTTAGACTCCGAAAGGCGGTATCCTCCTGGCCCCATAATATGATGGAACTTTTTCTTACTCGCATTATCCTTATTTTTTTCGATATTTCCTTGAAATGCTCCGATTGCTTTTGCCTCACAAATTCTGGCCAATCATCTTTCAGTTTCTCATGTAGTCCATTGAAATCCGGAGTCTTGCCCTTGTTGACATAGTCACGGGTTAAATTTTTCTTGAAGTTCCGGAATGCTTCGCCCATCTTCTGAAAAGCGAACTCTTTAACTAGCCTCCTCCTCTCACGTCCACCCGGAACCTCGTTACCAAATTCATCGACTTTGTTGTATTCCGGAGGTAGAATGAAATGTTCCATAGCTTTCTCCAGCAATCCTTTTTCGTTCTCTTGTCGACAAAACTGAAACCAAGACGTGCCTTCTTTGGCTCCTTCCATTCCTGGACGGTGATCGGGACGTTGTCTCTAACAACGACTCCGCATTGGTTGATAAACTTTGAGGTGTGCTGTAGGGGCTTGCCGGTTTCACTGACAAACTCAATGGCATATGTTTCTCCTGTTTTCATCGCCTTGGATTTGCCACGCTTTGTCGTACTCGATCCGGCCGAGGGCTAAAAAAAGAAAGAGAGTCGCGCGCATTAATACATATGTATTCACATTTCAGTAAGTTTGTATCACGAGAGGCTCAATGTATATATATACCTCGCCGGAGGTGGTTGCTACTTGCAATTCGAGATCGTCGTTTGTTGACGGTTGACCTCCGTCGACAATGTCCGTTCCTCCACCTTCTTGATCATCGACAATGTCTGTTCCACCGTCAAGGTTCAGAAAAGAAGAGACTACATCCTCTTCTTGCTCATATTCTGAGCCCGGCACATAAGGAATCTCGTTGTTTATGATGCCCATTAAATAACGTTCAGCCTCCGGATCCCTAAGCGGCTCGGCTCTATCGTCCGCCATATGTCACTCCTGCATGTAGTAAAAATTAATTAAGTATAAAGGAATTAAAAAATAAGATTAAGGAGACATAGAGGAGGAGGAATTAAAAAATAAGATTACTGAGCACTGCCAAGTATTTTGTTTTTCCTTTTCTTTTTCCTTTTCTTATTTTCTTTTTCCTTTTCTTATNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTTCTTCTTCCTTTTCTTCTACCTTTTCTTCTTCCTTTTCTTTTTCCTTTTCTTCTTCCTTTTCTTCTTCCTTTTCTTCTTCCTTTTCTTTTTCCTTTTCTTATTTTGTTTTTCTTGGTTTTCATTGGTTTTCTTTGTTTCTTTCTCGATTTTCTTGATTTCATTCCTTTGCATTGGTTTCTTTTGTTTTGTTTTCTTTGTTTTTCTTTTTGGTTTTCATTGGGTTTCTTTGTTATTCCTTATCTTTTGTCGATTTTATCGGTTTCTTTTTGCTTCAACACGTGTTAACTTTTTCAACCTTTTTCTTATACATCAGAAAGATTTTCATATATACATTTAACATTTTTAAACACATGATTAAGTTTTTTTTGAAAACTTATTTTTTTGGATGTATGGGTTTTTTTCATACACACTGTACATTTTTGGCATATATCTAATACATTT
TCCTAATACATGTTTAACATTTTCCTAATACATGTTTAACATCTTCCAAACACATTTTAATATTTTTTGAACACATGGTCAACATTTTTCCTTCGTTTGTGGAGGCGGCGGCGGGAGGCGGAGGACGGCAGGCGGCGACGGGAGGCNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNATCAAAAAATTCAGAAAAATAAAACTAATTCATTTTAAAACCTTAAAAATACAAATAATATATCAAAAAATTCAGTTCATCGATCCCTTGAAGGTTTGACAAAAGGTTTGATACATCATTCAGTTCATCGACCAAATACAAATCATCCGGATTCGCCATCGTACGTTTTAATTCACATGATCCATTCAACAAAGTTTGGTACAATACATTATTACACATCAATTCCTCCCTTGTGTCCCTGCTTGCTTACGATTGTGCCGTATCCATGGAGCATCCTCATCATTTAACTTAATGCTTGGGTCAGTGTTCACTTTGAAGGACAGAATTTCACCAAACATATTATAATCTTCTGACATGTCTGTCTTGTCCTCCACTCCCACGATGTTTCTTTTCCCTGAAAGAACAATGTGGCGCTTTGGATCATCGCATGATGTACTGATCGTTTTCTTATCTTTCTGTTTCCTCGGTTTGCTACTCATGTCCTTCAAATAAAAAACCTGAGCGACATCTTTGGCAAGGACGAAGGGTTCGTCAAGGTAACCAAGATTGTTGAAATCCACCATTGTCATTCCGTATTGCTCGTCCATCTTTACCCCACCTCCTGTTAGCTTGAACCATTTGCACCGGAACAAAGGGACCTTAAAGGAGGGTCCATAGTCAAGTTCCCATATCTCCTCTATGTAACCATAATATGTGACCTTTTGCCCATTCTCGGTTGCTGCATCAAAGCGGACACCACTGTTTTGGTTGGTGCTCTTTTTATCTTGGGCGATGGTGTAAAATGTATTCCCATTTATCTCGTACCCTTGGAAAATCGTTATAGTCGAAGATGGTTTCTTGGCCAACATGTACAGCTGATCTCTAACATCATTGTCATTCATTAAATGTTTTCGCAATCAACTGCCGAAAGTCTCCATGTGGGCCTTTCTAATCCAGGATTCAGGCTTCCCCGGGTTGTTCGAGTGTAAAATATTCTTGTGTTGC
TCGAAGAACGGAGCCACCAAGCTGGAATTTTGCAGAACTGTGTGGTGTGCTTCAGTCATAGAATGACCGTCCATACATATCGTTGATTTCCTTCCGATCGTGCCTTTTCCACTTAGTCTCCCCTCGTGCCGCGATTGAGGAATACCAATCGGCTTAAGGTCAGGAACATAGTCAATACAGAACTCAATTACCTCCTCATTTCCATAGCCCTTGACGATGCTTCCTTCTGGCCTAGCACGGTTACGAACATATTTCTTTAATATTCCCATGAACCTCTCAAAGGGGAACATATTGTGTAGAAATACAGGACCGAGAATGGAAATCTCTTCGACTAGGTGGAGCAGGAGGTGCGTCATAATATCGAAGAAGGATGGTGGGAACACCAACTCGAAACTGACAAGGCATTGGACCACATCGTTCTGTAACCGTGGTAGATCTTCTGGATTGATTACCTTCTGAGAGATTGCATTGAGGAATGCACATAGCTTCACAATGGCTACTCGAACATTTTCCGGTAGGAGCCCCCTCAAAGCAATCGGAAGCAATTGCGTCATAATCACGTGGTAGTCGTGAGACTTCAGGTTTTGGAACTTTTTCTCCGCCATGTTTATTATTCCCTTTATATTCGACGAGAAGCCATACGGGACCTTCATACTGCTCAGGCATTCAAAAAAAATGACCTTCTCTTCTTTGGTAAGAGCGTAGCTGGCACGACCTTGAAACCATTCCGGATGCCGGCCATCTGGGTCTTTCAAAAGTTGCTGGTCCTGCCGTGCTTCCTTTGTATCATTTGTCTTCCCATACACGCCCAAGAAGCTTAGCAGGTTCACGGAAATATTCTTCGTAACATGCATCACGTCGATTGCAGAGCGGACATCTAGGACTTTCCAATATTCTAGCTCCCAAAATATAGATTTCTTCTTCCACATGGGTGCGTGCCCGTCAACTCCCCGCGGAACTGATTGTCCGCCAGGACCCTTTCCAAAGATGACTTTCAAATCCTTGACCATATCAAATATCTCAGCACCAGTACGTTCCGCAGGCTTTGGCCGGTGATCTGCCTTGCCGTTGAAATGCTTGCCTTTCTTTCTTACGTTATGATTTCGGGGAAGAAATCGACGATGACCCAGGTACACGTTCTTCTTACAATTAACCAAACGTACACTTTCAGTCTCATGTAAGCAGTGTGTGCATGCATTGTATCCCTTATTTGTCTGTCCCGAAAGGTTACTGAGAGCAGGCCAATCGTTGATGGTTACAAAAAGCAACGCTCGTAGGTCAAATTCCTCTCCTTTGTGCTCATCCCAGACACGTACACCAGGTCTGGCCCACAACTGTAAAATTTCATCAACTAATGGCCTTAGGTACACATCGATGTCGTTCCCGGGTTGCTTTGGACCTTGGATGAGCACTGGCATCATAATGAACTTCCGCTTCATGCACAACCAAGGAGGAAGGTTGTAGATGCATAGAGTCACGGGCCAGGTGCTATGGCTGGAGCTCTGCTCGCCAAAAGGATTCATGCCATCAGTACTTAGACCAAATCTTATGTTCCTTGCGTCAGCTGCAAAATCTTTGAACACTCTGTCGATCTTTCTCCATTGCATTCCATCAGCGGTGTGTCTCAACTCCCCGTCGGACTTACGGTCCTCTTTATGCCATCGCAACGACTTGGCATGCTTTTTGTTCCTGAACAGACGTTTCAACCGTGGTATTATAGGAGCATACCACATCACCTTGGCGGGAACCCTCTTCCTGGGTTTCTCGCCCTCAACATCGTCACCAGGGTCATCGCCTCTGATCTTATAACGCAATGCAGTGCATACAGGGCATTCATTCAAATTCTCGTATTCACCGCGGTAGAGGATGCAGTCGTTAATGCATGCATGTATCTTCAGAACCTCTAAACCTAGAGGGCAGACAACCTTCTTTGCTTCGTACGTACTGGAGGGCAACTCGTTATTCTTCGGAAACATGTTCTTCAACATTTTCAGCAAATT
TTCAAATGATGAGTCACCTACACCTTCCTGTGCCTTCCATTTTAGCAAATCCAGTGTGCAGCCCAGCTTTTTCAGACTATTATCGCATCCTGGATACAACGACTTTTTGTGATCCTCTAACATGCGATCCAAATTCTCCCTATCCTTGTCAGTTTCGCAGCGTCTCCGTGCATCAGCAATGGTCCGACCAAGATCATCAGCGGGCTCATCATGTGCCTCTTCTTCACCTTCACCTAACCCTTCCCCACCTTCAGCATCATCCTCCATGAAAGTATCACCGAAATGATCATGATAGTTGTCATCGATATCATCCCCTTCTTCATCTTCTTCCATTCTAACCCCTCTTTCTCCATGCTTGGTCCAACAATTATAGCTTCGCATGAAACCGTGCCGAAGCAGGTGCATGTGAACGTCTCTTGAGGAGGAGTAACCCTTCTGATTCTTACAAACAGCACATGGACAGATAATAAAACCTTGCTGCTTGTTCGCATTTGCCACTACGAGGAAATCTTTCAAACCCGTAGTGAACTCGCCGGAGAGTCGGGGACCGTACATCCATTGCCGATTCATCTGCATTATTATTATATAAAGTATATAATTGACCATCATGCATTTGTTAAACTAACTAGCTAGAAATAATACAAATTAAACAATGAACTACACACATGCATATTTTATCAATGACACATGAAAGGTTCAAGTTGCTAACCGCGATCGCGAAGGAAAAATAAATGAGAAAGCTCAAGTGTGGCTCGGACACTTCGTATCATGTTTGTTTCAGGCTCTCAGGCATTTCATCGAACACCTTGTGTGCATAGGAGGAACCAAAAGCAAACCCGCCACCCCCTTCTGAATATTGTGAAGTGAGCTGAGTGAAGTGAAGTGAGCTGAGTCCTATATATAGGGATGGGCCTTTAGTCCCGGTGGCCTGGCCAACCGCGACTAAAGGCCTTCGGGGACCTTTAGTCCCGGTTGGCCAGGCCAACCGGGACTAAAGCCCCTCCCGTCCGCCAGCTGTCGACCGAGCGCGCTGGGCCCAGATAGTTGGTCGCGGGTCTCCTCCCGAACCGCAACTAAAGACCCCTTTGTCGCGGTTCGATTATTTTGGGGACTAATGGGGGCGTATGGAAGCCTCTTTTTCTACTAGTGTTAGTTCATCAATATCACTAGTAAGTTCAATGTGTTCTGTTCATTAATTAGTTCAATTTCTTTAGTATTCATTTGTTTATTCACTTCTTTAGTTTATATTACATCATTAATTCTTATAATTATCAGTGTTTTTTTTTGTTCTTTTCACATTCTCGTTTGGTGCACTATCTCACTACGACGAACAATGAACTACCATAGGTGGTATGTAGGGGTTTTCACGATTTCTTAGATATGTACTCTTCACAAATCATTATTTCATTATGCAGGCATGTCTATATATGTATCTTCACTCTTCACTCATTCTATATTTTGTCATTCATTCATCACTATTCACTTATCAGGACATTTGTTTCATCCTTTAAGTATTTTGTTAAGTCCATTCTCTATTCCTTAGTCATTTGTTCCATTTAACTTGATAACACAACATTTTATCATCGATTGGAACACTTTTTGTTCATGTGTAGTTCTGACCAGCTAATCAGTGATGGTCACTGCCTAGAACTAAGAATTAGAGTTATATGTACCTATGTTCTGATTCCAAATGTTTGAGTTATCATTAATACATTTTCATAGGTTTTTTTTATTTCCTATCATTCAAAGATCAGGACACTTTCAATCCATATTTTTTGGTGGAGTGTTGATGAATGGTGTGTGTCATACCTGGCCAAATGGCTCGGCACGGCCCGGCCTGCGGTAAACGTGCACGACACGACCCGCGACGGCACGACTAATAGCCGGGCCGTGCCGGGCCGGCCCACGGGCGGGAGCTCGCACCCTAGGCACGGCCCAGCTACTAATTGGGCCGGCCCACCTGAAGGAAATATGCCCTAGAGGCAATAATAAAGTTACTA
TTTATTTCCTTATTTCATGATAAATGTTTATTATTCATGCTAGAATTGTATTAACTGGAAACATGATACATGTGTGAATACATAGACAAACAGAGTGTCACTAGTATGCCTCTACTTGACTAGCTCGTTGATCAAAGATGGTTATGTTTCCTAGCCATAGACATGAGTTGTCATTTGATCAACGGGATCACATCATTAGGAGAATGATGTGATTGACTTGACCCATTCCGTTAGCTTAGCACACGATCATTTAGTATTCTGCTATTGCTTTCTTCATCACTTATACATGTTCCTATGACTATGAGATTATGCAACTCCCGTTTACCGGAGGAACACTTTGTGTGCTACCAAACGTCACAACGTAACTGGGTGATTATAATGGTGCTCTACAGGTGTCTCCGAAGGTACTTGTTGGGTTGGCGTGTTTCGAGATTAGGATTTGTCACTCCGATTGTCGGAGAGGTATCTCTGGGCCCACTCAGTAATGCACATCATTATAAGCCTTGCAAGCATTGTAACTAATGAGTTAGTTGCGGGATAATGTATTACGGAACGAGTAAAGAGACTTGCCGGTAACGAGATTGAACTAGGTATTGAGATACCGACGATCGTATCTCGGGCAAGTAACATACCGATGACAAAGGGAACAACGTATGTTGTTATGCAGTTTGACAGATAAAGATCTTCGTAGAATATGTGGGAGCCAATATGAGCATCCAGGTTCAGCTATTGGTTATTGACCGGAGACGTGTCTCGGTCATGTCTACATTGTTCTCGAACCCGTAGGGTCCGCACGCTTAAAGTTCGATGACGGTTATATTATGAGTTTATGTGTTTTGATGTAACGAAGGTAGTTCGGAGTCCCGGATGAGATCGGGGCATGACGAGGAGTCTTGAAATGGTCGAGACGTAAAGATCGATATATTGGACGACTGTATTCGGACATCGGAAAGGTTCCGAGTGATTCGGGTATTTTTCGGAGTACTGGAGAGTTACGGGAATTCGCCGGGGAGTATATGGGCCTTATTGGGCTTTAGGGGAAATAGAGAGGAGAGGCTGGGCGCCCCCCCAAGGCCTAGTCCGAATTGGACTAGGGGAGGGGCTGCGCCCCCTCCTTCCTTCTCTTCTCTCTCCCCTTTCCTTGACTCCTACTCCTACTACTTGGAAGGGGGGGAATCCTACTCCCGGTGGGAGTAGGACTCCTCCTAGGGCGCGCCATAGAGAGGGCCGGCCCTCCCCCTCCTCCACTCCTTTATATACGGGGAGGAGGGCACCCCTTGGAGATACAATAATTGATCGTTTGATCTTTTAGCCGTGTGCGGTGCCCCCCTCCACCATAGTCCACCTCGATAATACTGTAGCGGTGCTTAGGCGAAGCCCTGCGTCGGTAGAACATCATCATCGTCACCACGCCGTCGTGCTGACGAAACTCTCCCTCAACACTCGGCTGGATCGGAGTTCGAGGGACGTCATCGGGCTGAACGTGTGCTGAACTCGGAGGTGCCATGCGTTCGGTACTTGATCGGTCGGATCGTGAAGACGTACGACTACATCAACCGCATTGTGCTAACGCTTCCGCTTCCGGTCTACGAGGGTACGTGGACAACACTCTCCCCTCTCGTTGCTATGCATCACCATGATCTTGCGTGTGCGTAGGAATTTTTTTGAAATTACTATGTTCCCCAACAGTGGTATCAGAGCCAGGTTTTATGCATAGATGTCATATGCACGAGTAGAACACAAGTGAGTTGTGGGCGATATAAGTCATACTGCTTACCAGCATGTCATACTTTGGTTCGGCGGTATTGTTGGATGAAGTGGCCTGGACCGACATTACGCGTACGCTTACGCGAGACTGGTTCTACCGACGTGCTTTGCACACAGGTGGCTGGCGGGTGTCAATTTCTCCAACTTTAGTTGAACCAAGTGTGGCTACGCCCGGTCCTTGCGAAGGTTAAAACAACACCAACTTGACAAACTATCGTTGTGGTTTTGATGCG
TAGGTAAGAACGGTTCTTGCTAAGCCCAGTAGCAGCCACGTAAAACTTGCAACAACAAAGTAGAGAACGTCTAACTTGTTTTTGCAGGGCATGTTGTGACGTGATATGGTCAAGACATGATGCTAAATTTTATTGTATGAGATGATCATGTTTTGTAACCGAGTTATCGGCAACTGGCAGGATCCATATGGTTGTCGCTTTATTGTATGCAATGCAATTGCCCTGTAATGCTTTACTTTATCACTAAGCGGTAGCGATAGTCATAGAAGCATAAGAGTGGTGAGACGACAACGATGCTACGATGGAGATCAAGGTGTCGCGCCGGTGACAATGGTGATCATGACGGTGCTTCGGAGATGGAGATCACAAGCACAAGATGATGATGGCCATATCATATCACTTATATTGATTGCATATGATGTTTATCTTTTATGCATCTTATCTTGCTTTGATTGACGGTAGCATTATAAGATGATCTCTCACTAAATTTCAAGATAAAAGTGTTCTCCCTGAGTATGCACTGTTGCCAAAGTTCGTCGTGCCCAGACACCACGTGATGATCGGGTGTGATAAGCTCTACGTCCATCTACTACGGGTGCAAGCCAGTTTTGCACACGCAGAATACTCAGGTTAAACTTGATGAGCCTAGCATATGCAGATATGGCCTCGGAACACTGAGACCGAAAGGTCGAGCGTGAATCATATAGTAGATATGATCAACATAGTGATGTTCACCATTGAAAGCTACTCCATTTCACGTGATGATCGGTTAAGGTTTAGTTGATTTGGATCACGTGATCACTTAGAGGATTAGAGGGATGTCTATCTAAGTGGGAGTTCTTAAGTAATATAATTAATTGAACTTAAATTTATCATGAACTTAGTCCTGGTAGTATTAGCATATCTATGTTGTAGATCAATAGCTCGCGTTGTTGCTTCCCTATGTTTATTTTGATATGTTCCTAGAGAAAAACTATGTTGAAAGATGTTAGTAGCAATGATGCGGATTGTATCCGTGATCTGAGGATTATCCTCATTGCTGCACAGAAGAATTATGTCCTTGATGCACCGCTAGGTGACAGACCTATTGCACGAGAAAATGCAGACGTTATGAACGTTCGGCTAGCTCAATATGATGACTACTTGATAGTTTAGTGCACCATGCTTAATGGCTTAGAATAGGGACTTCAAAGACGTTTTGAACGTCATGGACCATATGAGATGTTCCAGGAGTTGAAGTTAATATTTCAAGAAAATACCCGAGTTGAGAGATATGAATTCTCCAACAAGTTCTATAGCTAAAAGATGGAGGAGAATAGCTCAAGCAGTGAGCATATGCTCAGATTGTCTGGGTACTACAATCGCTTGAATCAAGTGGAAGTTAATCTTCCAGATAAAATAGTGATTGACAGAATTCTCTAGTCACGATCACCAAGTTAGTAGAACTTCGTGATGAACTATAATATGCAAGGGATGACGAAAGTAATTCCCGAGCTCTTCGCGATGTTGAGATCGACGAAGGTAGAAATCAATAAAAGAGCATCAAGTGTTGATGATTAACAAGATCACTAGTTTCAAGAAAAGGGCAAAGGGAAAGAAGGGCAACTTCAAGAAGAACGGCAAGCAAGTTGCTGCTCAAGTGAAGAAGCCCAAGTTTTGACCTAAGCCTGATACTGAGTGCTTCTACTACAAAAAGAACTGGTCACTGGAACAAAAGTATATTTGATATACATGTTATTGATGTGTACTTTACTAGTGTTTATAGCAACCCCTCGGTACTTGATACTGGTTCAGTTGCTAAAGAGTAGTAACTCGAAACGGGAGTTGCATAATGAACAGAAACTAGTTAAGGATGAAGTGACGATGTGTATTGGAAGTGGTTCCAAGATTGATATGATCATCATCGCACACTCCCTATACTTTCGGGATTAGTGCTGAACCTAAATAAGTGTTATTTGGTGTTTTGCGTTGAGCATGAATATGATTTGATCATGTTTATT
GCAATACGGTTATTCATTTAAGTTAGAGAATAATTGTTGTTCTGTTTACATGAATAAAACCTTATATGGTTACACACCCAATGAAAATGGTTCGTTGGATCTCGGTCGTAAGTGATACACATATTCATAATATTGAAGCCAAAAGATGCAAAGTTAATAATGATAGTGCAACTTATTTGTGGCACTGCCGTTTAGGTCATATTGGTGTAAAGCGCATGAAGAAACTCCATGCTGATGGGCTTTTGGAATCACTTGATGCTTGCGAACCATGCCTCTTGGGCAAGATGACTAAAACACTGTTCTCCGGAACAATAAAGCGAGCAACAGATTTGTTGGAAATCATACATACTAATGTATGTGGTTCGATGAATATTGAGGCTCGTGACAGGTATCGTTATTTTCTGACCTTCACAGATGATTTGAGCAGATATGGGTATATCTTCTTGATGGAACATAAAGTCTGAAACATTTGAAAAGTTCATATAATTTCAGAGTGAAGTGGAAAATCATCGTAACAAGAAAATAAAGTTTCTATGATCTGATCGTGGAGGAGAATATTAGAGTTACGAGTTTGGTCTTCATTTCAAACAATGCAGAATAGTTTTGCAACTCACGCCACCTGGAACACCACAGCGTAATGGTGTGTCCGGACGTCATAACCATACTTTATTAGATATGGTGCGATCTATGATGTTTCTTACCGATTTACCACTATAGTTTTGGGGTTATGCATTAGAGACAGCTGCATTCACGTTAAATGGGGCACCATCGAAATCCGTTGAGACGACACCTTATGAACTGTGGTTTGGCAAGAAACCCAAGTTGTCGTTTCTTAAAGTTTGGGGTTGCGATGCTTATGTGAAAAAGTTTCATCCTGATAAGCTCAAACCCAAATCGGAGAAATGTGTCTTCATAGGATACCCAAAGGAGACAGTTGGGTACACCTTCTATCACAGATCCGAAGGCAAGATATTTGTTGCTAAGAATGGATCCTTTCTAGAGAAGGAGTTTCTCTCGAAAGAAGTGAGTGGGAGGAAAGTAGAACTTGATGAGGGAACTGTACCTGCTCCCTTATTGGAAAGTAGTTCATCACAGAAATCTGTTCTTGTGACTCATACACCAATTAGTGAGGAAGCTAATGATGATGATCATGTAACTACAGATCAAGTTACTACCCAACCTCGTAGGTCAACCAGAGTGAGATCAACACCAGAGTGGTATGGTAATCTTATTCTGGAGGTCATGTTACTTGACCATGACGAACCTACGAACTATGAGGAAGCGATGATGAGCCCAGATTCCGTGAAATGGTTTGAGGCCATGAAATCTGAGATGGGATCCATGTATGAGAACAAATTATGGACTTTGATTGACTTGCCCAATGATCGGCGAGCCATTGAGATTAAATGGATCTTCAAGAGGAAGACGAACGCTGATAGTAGTGTTACTATCTACAAAGCTAGAATTGTCGCAAAAGGTTTTCGACAAGTTCAAGGTGTTGACTACGATGAGAGTTTCTCACTCGTATCTATGCTTAAGTCTGTCCGAATCATGTTAGCAATTGCCGCATTTTATGAAATCTGGCAAATGGATAAACAAAACTGCATTCCTTAATGGATTTATTAAAGAAGAGTTGTATATGATGCAACCAGAAGGTTTTGTCGATCCAAAAGGAGCTAACAAAGTGTGCAAGCTCCAGCGATCCATTTATGGACTGGTGCAAGCATCTCGGAGTTGGAATATACGCTTTGATGAGTTGATCAAAGCATATAGTTTTATACAGACTTGCGGTGAAGCCTGTATTTACAGGAAAGTGAGTGGGAGTACTACAACATTTCTGATAAGTATATGTGAATGACATATTGTTGATCGGAAATAATGTAGAATTATTCTGCAAAGCATAAAGGAGTGTTTGAAAGGAGTTTTTCAAAGAAAGACCTCGGTGAAGCTGCTTACATATTGAGCATCAAGATCTATAGAGATAGATCAAAATGCTTGAT
AAGTTTTTTCAATGAGTACATACCTTGACAAGATTTTGAAGTAGTTCAAAATGGAACAGTCAAAGAAAGAGTTCTTGCCTGTGTTACAAGGTGTGAAATTGAGTAAGACTCAAAGCCCGACCACGGCAGAAGATAGAAAGAGAATGAAAGTCATTCCCTATGCCTCAGCCATAGGTTCTATAAAGTATGCCATGCTATGTACCAGATCCATTGTATACCCTACACTGATTTTGGCAAGGGAGTACAATAGTGATCTAGGAGTAGATCACTGGACAGCGGTCAAAATTATCCTTAGTGGAATAAAGATATGTTTCTCGATTATGGAGGTGACAAAAGGTTCGTCGTAAAGGGTTACGTCGATACAAGTTTTGGCACTGATCCAAATGACTCTATGTCTTGATCTGGATACATATTGAAAGTGGGAGCAATTAGCTAAAATAGCTTCGTGCAGAGCATTGTAGACATAGAAATTTGCAAAATACATACGGATCTGAATATGGCAGACCCGTTGACTAAACTTCTCTCACAAGCAAAACATGATCACACCTTAGTACTCTTTGGGTGTTAATCACATAGCGATGTGAACTAGATTATTGACTCTAGTAAACCCTTTGGGTGTTGGTCACATGACGATGTGAACTATGGGTGTTAATCACATGGTGATGTGAACTATTGATGTTAAATCACATGGCGATGTGATCTAGATTATTGACTCTAGTGCAAGTGGGAGACTGAAGGAAATATGCCCTAGAGGCAATAATAAAGTTACTATTTATTTCCTTATTTCATGATAAATGTTTATTATTCATGCTAGAATTGTATTAACCGGAAACATGATACATGTGTGAATACATAGACAAACAGAGTGTCACTAGTATGCCTCTACTTGACTAGCTCGTTGATCAAAGATGGTTATGTTTCCTAGCCATAGACATGAGTTGTCATTTGATCAACGGGATCACATCATTAGGAGAATGATGTGATTGACTTGACCCATTCCGTTAGCTTAGCACACGATCATTTAGTATTCTGCTATTGCTTTCTTCATCACTTATACATGTTCCTATGACTATGAGATTATGCAACTCCCGTTTACCGGAGGAACACTTTGTGTGCTACCAAACGTCACAACGTAACTGGGTGATTATAATGGTGCTCTACAGGTGTCTCCGAAGGTACTTGTTGGGTTGGCGTGTTTCGAGATTAGGATTTGTCACTCCGATTGTCGGAGAGGTATCTCTGGGCCCACTCAGTAATGCACATCATTATAAGCCTTGCAAGCATTGTAACTAATGAGTTAGTTGTGGGATGATGTATTATGGAACGAGTAAAGAGACTTGCCGGTAACGAGATTGAACTAGGTATTGAGATACCGACGATCGAATCTCGGGCAAGTAACATACCGATGACAAAGGGAACAACGTATGTTGTTATGCGGTTTGACCGATAAAGATCTTCGTAGAATATGTGGGAGCCAATATGAGCATCCAGGTTCCGCTATTGGTTATTGACCGGAGACGTGTCTCGGTCATGTCTACATTGTTCTCGAACCCGTAGGGTCCGCACGCTTAAAGTTCGATGACGGTTATATTATGAGTTTATGTGTTTTGATGTACCTAATGTAGTTCGGAGTCCCGGATGAGATCGAGGACATGACGAGGAGTCTCGAAATGGTCGAGACGTAAAGATCGATATATTGGACGACTATATTCGGACATCGGAAAGGTTCCGAGTGATTCGGGTATTTTTCGAAGTACCAGGGAGTTACGGGAATTCGTCGGGGAGTATATGGGCCTTATTGGGCTTTAGGGGAAAGAGAGAGGAGAGGCTGGGCGCCCCCCAAGGCCTAGTCCGAATTGGACTAGGGGGAGGGGCTGCGCCCCCTCCTTCCTTCTCTTCTATCTCCCCTTTCCTTGACTCCTACTCCTACTACTTGGAAGGGGGGAATCCTACTCCCGGTGGGAGTAGGACTCCTCCTAGGGCGCGCCATAGAGAGGGCC
GGCCCTCCCCCTCCTCCACTCCTTTATATATGGGGAGGGGGGGCACCCCTTGGAGATACAGCAATTGATCGTTTGATCTTTTAGCCATGTGCGGTGCCCCCCTCCACCATAGTCCACCTCGATAATACTGTAGCGGTGCTTAGGCGAAGCCCTGCGTCGGTAGAACATCATCATCGTCACCACGCCGTCGTGCTGACGAAACTCTCCCTCGACACTCGGCTGGATCGGAGTTCGAGGGACGTCATCGGGCTGAACGTGTGCTGAACTCTGAGGTGCCGTGCGTTCAGTACTTGATCGGTCGAATCGTGAAGACGTACGACTACATCAACCGCGTTGTGCTAACGCTTCCGCTTCCGGTCTACGAGGGTACGTGGACAACACTCTCCCCTCTCGTTGCTATGCATCACCATGATCTTGCGTGTGCGTAGGAATTTTTTTGAAATTACTACGTTCCCCAACACCACCGACACGCCGGGCCCGCTATTTCGTCTGCTATTTGACGCATTGGGCGTTTTTAGCCTGTTTTACCTATTGGGCCATATAGAGATGTATAGAAAAAAAAACCGTAATCGATCCGTGCCGTGCCAGCCCGTGTGCTCAGGCTACCAGCCCAAGCACGGTCCAGGGCGTGCCGCATGCCGGGCCCGTTCCGTGCCTGGCACATGGCGGGTCGTGCCGGCATGCTCAGGGACCGGCCTGGTTAATTAGCCCGGCCCATTTGGGCAACTATAGTGTGTGTGTGATCACTGCATTTATATGTTTGGCCAAATAGTTGTCTATTTTTCGTAGAAGAGTTTCTGAATACACTTTATGTGTGTGTAATTTGTTTTTTTTAAAACGTGTGTGTAATTTGTTGGCATCTAGAAAGTACTAGAGGAAGTTGCTACGACCGTGTTGGCAGAAGCTGCAGCCAGCCATGGTGGAGCTAACCGGCTTCGACTCGTGTCACGACTGGCGGTGGCAAAAGCTACAACTGGCGTCGTCTCGTGCTATGACTTTTGGCGGCGGAAGCTACAACCGGCCACATTGACCGACATAGGTTTTTTGCTGGAACTAACGGTGGCAAAGCTGCAACCAGCGACGTCACTTGCTGGAACTGGCAACATTGAGTGTTGGCACTGGGTACGGCCATTTGCTAGAACCAGCCACATAGATTGTTGGGACCGAAAGGACGAAGCAAGCGGAGCAGATCCGACGGTTCACATTAGTCGCATCCTACGGCGCGGATTGCGACCGATCGAGGCTGGCGCCGATCGACCGGCGCCTGGCAATGGCCTAAACCAAAACGCACGTGCTTCTCGCAGTGGGGAGGTGGGGAAATGGCGTCGGTGAACAGTTGACCACTCGATCTATCCTCCTCACTTTTCCTATTTCCACTCCACCACGCGGTTCGGGCGCGCTCCAACTCCCAGCTCCATAAACTCCAGATCCATAGGAGTCGGCGCGCTGCAGCTCGTCCGCCGGCGGCAGCCCTCCCCACCGCCGCGGCCTGCCTTGCCCCGCCTTGAGTCGCCTTTCACCGCCGGGCTCCCCCCTTGTCTGCCTCCGGGCCCCTCCTTTTCTGCCGCCGTCGTCGACCATCTCCGCCGCCGTCCCCGACCACCGGACTCCCTCCTTGTCTGCCGCCGTCTTCCCCGACCACCGGACCACGCAGGCTGTGCGCCTCCTCTGCCTCCCCGACCACCTCGCATATCAACTGAATCACAGTAGGTGAGTGAAAAAAATTGCATTTTTCTTTGATTGGTACTAGTATTTTGCTGCGATGTGCTACGGTGGTGTGCTGCTGCTAGACTTGTGGATGGTCTGTAGGACTGATGATGTGCTAGGATGCTCATTTGGGGTTTGGGCGCTGGGGATTTGGGGTTTCGAGTATCAGATCTCTGGGCGATCTGGTCCGGCACTGGTGGTTGGTGGCGAATGCCGCCGGTTTTCGGTTAAGATCTCGCGAGCTTGGTGAACCCTTCGGATTTTTAGATTCACATCTGTGTGAAAGGTGCAAA
ATTTGCGGACCGAGATCTGATCCTGCTTACTCAAATCTCCTGGATCAGTGCAAATGTGTGGGCATTGTGTGTTCCGTTGGGAACCACATGATTACTTGATTTATTGGGACCAGGGGTTTAGTTTGTTCTTACTTGCAGTTGAGTTGTGCGTCAAAGCTTGGTCTCGTCATGCCTGAGGAAAACACTTAGCATTACGATTTGGTACATGGATATGTGTAAGATCAATCTCAATCCGTATACAATACAGGTCTCTATGGGCATGTTCATCTAGATTAGCATCTTTACTTCATAAACGGCGCAAAAATTCTGAGTATCTTGGAATGCTTTCTTTCCTTTTCTGGGAATGTGAAGGTTGTGACTGTGTAAACTGTGGGTCCTACAAATTGCAGTTTGCATTTAAAGAATAGTTGATGATAGTGTAGGATTCTAAATCTTTTTCTCACATTGCATAATGGTAAATGTAATATGCATGCCTTGATTCATCTAAGATCTAACTGAGCGGTGTTGGTTTTTCCATCTCCATTGAGCAGGTCGCTTGAGTTAATGTGCACCATATAGTGCTTTGTCTCTGTTAAATTGCTTATGAGATCAGTAAACTGCTATGGATATATGAAGCACAGCTGAAGAAGCCCATAGTGTTTCATACCAGTGAATGATCAATATTTTGTCTGTTTCAGATCTTAGTACCACTAGAGATGCAAGGAAGAATGACAGATTTATGGTAAACCCTGGTAAATATTCGTGGGAGGTCAACAAGTGGCGCCCTGATTAAGACTGCTACAACACTTTGTGGTTCATCTCTAATTAGTGATGGCGAGAATGAAGATCCCAAAGCGTTATGTCATAGTATTGCTGACATTCATCTGCACAAATGTTTGTTACGTTGAGCGTGTGGGTTTCTCGATTGCGTACACCGTAGCAGCTGATGCAATCAACGTGAATCAAGCAAACAAGGGCCTGATACTCTCCATGTTCTATTATGGTTATGTTTTGTCGCAAATTCCTGGTGGATGGGCAGCTCAGAGATTGGGAGGCAGACGTGTTCTGCTACTGTCATTCCTGTTGTGGTCTTTGATATGCGGTCTAATTCCACTGGACCCCAACAGAGCAGTCATTCTGGTCCTTTCTCGCCTTTTTGTCGGTGTAGCACAAGGTTTCATATTTCCTGCCATTCACACAGTCCTGGCACAATGGGTGCCACCGCAGGAGCGCTCTCGCTCAGTGTCATTAACAACCTCAGGGATGTACCTCGGGGCAGCTTGTGGCATGTTGTTTTTTCCAAGTCTGGTGAAGCACATGGGACCCCAATCTGTATGTTTAGTCGAAGCAGTACTTGGAGTAGCATGGTCTGTAATATGGTTGAAGTTCTCCAGTGAGCCACCTCGCACTGACCTTCCAAAAGTGGCAATGCCAAAAGTAGCATCTCGGGAGAAGATTAAGGCGCAATCAGTAGGGGTTGTTGCACCTCGCACTGTAAAGATACCATGGCGAAAGATTATCTTCAGTCTACCTGTTTGGGCAATTGTCGTGAACAACTTCACCTTCCACTATGCCTTGTATGTTATCATGAACTGGCTGCCTACCTATTTCGAACTAGCCCTTAAGCTTAGCCTCCAGGATATGGGATCGTCAAAGATGCTTCCCTATTTCAACATGTTTATATTCTCCAACATTGGTGGAGTGGTTGCTGATCACTTGATTACAAAAAGGATCTTATCAGTTACCAAGACAAGGAAGCTCCTTAACACCATTGGGTTTGTTGTCTCGGCTGTTGCACTCATGGCCCTCCCTTCATTCGGGACGCCCTCAGGGACTGTGATCTGTTCATCGGTGTCTCTTGGCTTTCTGGCTCTAGGAAGAGCAGGGTTTGCCGTGAATCACATGGATGTTGCTCCAAAGTTCGCCGGCATAGTGATGGGGGTTTCCAATACAGCTGGGACATTGGCTGGGATAGTTGGCGTTGGCCTCACGGGAAATATTCTGGAGGCTGCAAAGGCTTC
TAACATGGATCTAACGAACTCCGAAACCTGGAAAACAGTCTTCTTTGTTCCAGCATACCTCTGTATTTTTAGTTCAGTCATTTTCTTGGTCTTCTCAACTGGTGAGAAGATTTTTGAATAGAGGATGATTATTTTTGCCTGTTCTTTTCTTGTCATTTACGGGCGGCGAGGCAGGATAGAAACACGGGAATCTCACATGTATTTTATTCATTATACCTGTCAGATTTCAGAGCTCAGACTGCATCCCACACATATTAAGACTTATGTTATGTTAGGAGGAATAACACTTGTCCGTAGTAAATTGTGTTATTTGGAATGATCCTATGACTCTGTTATTCCAGCTGGCTGGTTGGCCTATTTACAATACGTTGTGTAAGCTGGGCATACATCATCTTTGTTTTGTAAGTCATTTTCCTGGGGATAGGAAACAATGTGAATTGTGCAGCAAGAAGTCAGGATGACATGACAACATTTTGTTTGCTGGCAGGATCTGAAAAGAAAATGTGATTGGTCTACATTTGATCTAAATGAAATTTCTATTTAAAGGTAAATCTGACTGGAACATGGACGCTCCCTTTGGCTGTGTAGAGGCGCATTTTTATGTTTGATAAACCTGCTGGAAGATGTTTATTTCACTGTAAGTGAGCAGTAGAACCTGAAAAACCTGTGCCCACACATCCCTAGCAAGCTCCATTCCTTTACATTCACATGTTAGTTCAACTATATTGGGTAAAGTTGAGGGCCTCTTTGATTCATAAGGTTTCAAAAACACATTGATGTGCATAATTGGGTGTTTAATTCACAAGAATAGGACAAGTACAGGAAGCCTAAAATATTATGGTCAAATTAAGATTTAACCATATGCAAAGGTAAGATGAAGATATTATTATATGCTACTTAAGGCCTTTGCCTTGTTCTTCATGCATATGAATGTGAAAGAGAAATTTCAATGCTTTGAATCAAATGGATAAAATAGTAGGAAAAATCTTATTGATATGGTTTTCTTATGAATCACAGACACCATCAATGTAAAGTCTTGAGAAAACTACGCTTTGCAACCAGTAGTCATTACATATACCGCTGTCCATTGTGTCCTCTCGTGGAAAGTAGTAATCTAAACGCTTTTATATTAGTTTACGGAGGGAGTATTATTTTTGAACAAGAGCAGCAGGGCGGGATGGTGATCCTACCAGCTTACAATACAAGATACATTAACAAACAAACAAAAGGAATATAAAAAACAGAAATCTTGTCCACGCGTCGGCAAAGCAGAGACAATAGATTCATGGCCCTGTTTTCCCCAGTCATCTCGCACAGTTCAAGGTTAGAGTATATGCTTGTGGACTTTTATATAGAATATGAGAATGGGGAACTATCATTGAAAATCTTTTGTCAAGCCATCAAACGGGTGACAAGTGAAGTGTTTGGCTATTTTTGTGATTGTAAATGTTTATAGGGAAAAATATTTTTTGCCAGGTTTTTCATCTAAATATTCGATTATGAGCACTACTTTTTTTTCCGTTGCAGCTCAAATTTTTTTCCTATGAAAATTTTCATATCTATTTTTCTGTATCTTTCGATAACAGAAATTAATTTTCTATGGGAGTATGTCGCTCGGAGACATTTGGCAGTCTTCCTATTCTGAATTTCTTCCAGTAGCGTAGAGTTCAGACACGACTTGCTCTCTTATACTTTTCAAACTTCTGGCACTAACCTAGTTGCTGATGGCATTACCACTTGAGATATTTCCACCCCCAAAAGTACTGCTGCGAGCGCTGCCTTCAAGTTTCGGTTAGTCCAAAGCGTTTCAAGATGCCTCCCATTCCTAATGAACTACAGACGCACTTCCACTAACTTCTTCTATTTGCCATTCCTCTCACCCTCTCTCGAGGCTCTCAACTCAATTCTTGTTAACTAGGAGCTACTTGCTTCATAAGAAGAGCTAATATATGAGGTGGGAGGAAGACTACGGTCAAAAAATGGGTATGCAAGTATTGAGC
AGGAGAAGGCAATGCATCCTTATATAAAGGCACGTGCCATAGGCCGAGAGTGTTCACCTCTTTTCTGAAAAAAGTATAGGAAGACACATGTACAAGAAAATAAAGTTGATACCTATGTGTGTTGCTTCAACTTTATAATGCGACCACAAGCACCTTACATAGTAGTATTGCTAGAATCCTAAAAAAAAATAGTATAGCTAGAAAAATACTCACTTCATTTCTTTATGTAAGGTGTATTATTTTTGGCACGGTGATCATGGCATAAAATTAGACAATTTCAGACAAAACTACCCTTGACAAATCATTGGTTAGTGGCAAGTAAATCAATTAGTCCAGGAAATAAAGAGGTATACACAATCAAGAGACAGATATTTTCCTTCTTTTCCTAGAAGGAGATATACATGCAATCATAAGAGAGATACTTTCCTATTTTCTGGAGGGCTAAGAACGGAATAAGGAGGAATTAGAACAAATGCACCTTAATTGTGAAATTTTATCAAAAAACAAATACAACTTTTTTTGATCGGTAACAAATACACCTTATATTAAGAAACAGAAGGAGTATATAACAATAGTAAAAGAAACAGGCCCAGCCCATTAAGAGAGGCAAGTCACGAACGAACGTGATCTCCTTTCTTTCGTTCTCTCCGATAACGCCGCTGCAATCTCATTCGTCTCCCAGTCTCTCCATATTTCTCTCCCCCAATTGATTGCCCCGAATTCCTAAGAGACTCCAACTCCCCAAGCTAATCAATTAATTTGTGTCACTGTCCCCATGGATTTCTTGGGTGTCTTTCATCATATAACTAACCCCAAAGCCATTAGTGGGCCGGAGAAGAGAAGCCGACGAGGACGCCAACCCGCGGCGTGGCCGTCCATCGTCAAGGCTCTGCCAGGGTCCGAGCCTCCGAGGGTAGTAGGCGGTGGAGTATTATGCTATATGACGAATTGATGCAATGATATTTGACCGGCTTGATCTTTTCTTTTACGTCAGTACAATGAGGTAGGTTCTGCTGTTTATGACATTGCTTGCATTTGGATTATTGGATAGCTGGAGCATGGGATTTCTTCCAATGTACTCCAAAATGAGTAAATTAACTGTTGGCCTAACTTATTACAAGTACCAGAGGAGTCTCGGGCAGAATAAAAGCTTTCATTACATTGGCCCAACTTGTTACAAGTACAAATGTTTACATTTGTTTTGTTGATTCTCATCTACCTCATGTGTTTTGCTCAAAGAAGTTTTTTTAACCCATGTGTCATATAATTTTACACGGAAACTCACGGATATTTTTATTGTTGTATCTCTTTTTTCCTTTCGATAAACTTTCAAATTCCAAAAAAAATCAAAATTTAAAAAACGTTTCATTTGAAAATATTTTCTCAAATTAAAAAATGCTTGTGGTTTTCAAAAATATAAAATTTGAAAATATATTCACAAACTAAAAAAATCGCTTTTAAAAATATGTTCAAAATTTAGAAACAATTTGAATTTAAAAAATGCTCATGTTCTCCTAATATTTTGCATTTTCAAAAAATATTATTTTTTTTCTAATTTTTTATCGCTTTTGTAAAATGTTCGCAAATTGTAAAAAAACTTTCACGTTTTCAAAGTAATGTCGTCCAATTTGAAAAGATTGTTCGTGTTTGCCAAAAAAGTGTAAAATTTGAAACACAATTCACGTTTACAAAAATGTTCATTTGAAAAATTCTCTCGTTTTCAAAATTTTACATTTTTGCAAAATGTGCAGAAATTTTAAATAATTGTTTCCGTTTTTGCAAAAAAAATATTCTAAAAAATTTCAATTTATATGCTGCAGTAGTCTCGTTGGTTACAGAATCCAGTTTCCTACAGGTCGGGTTGCTATAGTATCGGGTTGCTATAAGAAACTGGTGCGCTATATAAAACCCGACCCGCTACAATGTGTCTAAAGAAAATACCAAGAAGCCCCTTGAAGAAATTGGGGTCGCTACATGTTTTTTTTTTTTTGAGAATTGGG
GTCACTACACGTGAGCGCGCCTCCGTGCGAGTGGGCTGGCCCAGGCGGGGCAGAGGGCACCTGTTTTGCACTGGCATTCATGTTTTTTTTTTTTGCTTGTGATTGTGCTCAAAAGGAACTGTGCTAATTTCATGGTATTTCACAACAAATCGAGTTACAATTTGCGTTTTCCCATCCTGTTTGATTTGATCTCACAAGGTCTTATGGCCTTAACCTTCACATATGTCCAGCATGTGCTGGTGAACTGGTGATAGGAAGCAACCGAGGCCTCCATTGCAACGGCAAGTGGAGGGACGTATTTCCGGATGCTTCCCATTTCCAACGCATCTGACCCCTCCTGTTATCATGTCATTCCCGTTTATCACTTTCTTCTTTCCATGTCTTAATCTCATTTGTGTCGATTTGGCGGCTTCAAATTGAGAAGCAGAGCTTGCTAAGATGGGTAGTAGGCTAAAGGAAAAGGAGTGCCCATCAATTGGATATATACTCAGCTGGGTTTGGAAGTATGAAGAGGAGCCATATACTTTATATATATGTGTAAATGGTGTGGGCCCGTGTAAAGATCGTCATAGTTTCTAGTTAAATATCTCCTGTGTACTACAACTCATCAATGATCTCTTGCTCTAGTAAAGTAGAGGATAGGTATCTCAGTGGCATTAGTGATATCTCAACTCATCAATTGTTTCTTGTTTCCATCTCCATGAACGTAGCAAGAAACCAGTTTCAAAAAAAGAAGTACCAATAAACCTACAGACACTTGCAGAGTTCTTTTTCTCACTACTCTGCTATTGAGGAGTAAATAGCAAAAAGCTACCACATTATAGGCTAGGGTTACAAAAAACTACCTCTTTTCTTAATTTCCCAAAATGCTAGCACAAATTTGGTTCGCTGTTCCAAAAAACACTAGTGAGTAAAGCGTTAACTTTTAACTGCGGTTATGACAACTTTGGCCCACCCGTCAGGTCTGATGTGGCATAAAACTCAACACCGTTAGCTTTGGCCGTTATGACAGGTGGAACCCACATGTCATTCACTTCCAAAAAAATAAAAAGCAATCGGGACCCTATACCTTTCTAGAAAAGCAATCGGATCACTGTAAATGTCTAAAAAAGCAATCAAGTCCCTGTAACTTTCTAGAAAAAAGCAATCGGGTCCTGTGAAAAAAATTAATCGGGTCCTGTGAAAAAATTAATCGGGTCCTGCTTGGCTGCCGGCGAGCTCATCCCTGCTTCGGCTGCCGCGGCCTAGGGTCGCCGCGCGCGCTGATCCTGGCTGCGCACCTTCCACTCGCCAGTGAGGAGAGCCAGAGAAGTGATGGGATGGCGAGGGAGCTCCAGCTCTCCCTTCATTGGCCTCCGCCGCCACTCCCGTGTATGTCCCTTCCCGCGCGCTTGACCGGGAGAGTCCCTCTTCTCCGGCACTGGTGACGCCAGCCCGGCCCGCTCACCCTCGCTTCCACGCTCCCCCCTTCCGATACCGACGCAGCAGTGAGTAGCAGCATGCAACGGCAGCGGCATGCAGCATCGGAGAATTGCGGCGGCGGCGGTGGAGAGCAGCAGCAACAACAACACACAGCAGCAGCGGTAGCTTCTGCCCATGGCGTTGGGGCTACGGGAGAGAGACAGAGCAAGGCGCATAGGGTGGGTGTCGTGATATAGAGAAGAGAAGAGAAGGGAGAGAAGAAGCTGACATGTGGGCCCCACCCGATCATAACCGTCAACTTAACTGTTTGTTTATATAACGGTGCTGACTTTTTTGCCACGTGGAACTGACGAGCGGGCCCTCCATGTCATAAACCAGATTAAACCATTCAGTCACTAGTGTTTTTGGAACAACAAACCAAATTTGTGGTAGCATTTTGGGAAGTTAAGAAAAATGTTAGTTTTTCGTAACCCTATCCCATAATGTGGTAGTTTTCTGCTATCTACTCTTTGTTTAAAAGGGGAAGTTAAGAAGTTGGCATCCATGTAATATATTTTTTGAAAAGGGAAATATATTAA
TATCACGAAGATGCCAATTTCTCTGTTTAAAATTTGCTCTAAAAGCCAAATCAAAATACACACATATTGTTTGAATGGATTATAATTTCCTCGTGGGCGCTGGAGCTCCACTCAGATCTACCCACACTCAGTCATACGAAGCCAAGGTCGGAATGCTGCGCCGTTGTAGGATCACAGCAATCACACATGCTAAGGTTGATCCTGTGTGTTGGTCCGGCTCTAGTTGATCCTCTGTGTCGCCATCCAAACTCGGGAAGGTCAAGTGCCCACTGCCACCATCACAACTCACATCATTGAGCGCCTACACTCGTCCAAGTACAAACATCATTGAGCGCCCAGTCAGACGAAGCCAAGGTCGGAATACTGCTCCATTTATAGGATCTGTCAGACCAGAGCCCTCCATCTCCTTCGCCATGGTCGCTCACTCGATCACAGTTGTAGCGCACGCTAAGGTTGACCCTACATGTTGCTCCAGCTCCAGTTGACCCCCTGTGTTGCCATCCAAACCCGGGACAGTGATGCACCCTCTGCTACCAGCATAAGCGACCGATCACCATTCACCCATCCCCACAATGCCGACGTCCCCTCCCACTAAACCCTCTCATGGCAACCCCAACACAAGCACCAAGAAGAATTAGTTCTCAGAGTTCGGTGAAGATGGCGAGCAGTATAGGGGAATAGGGCATAGCGCTAAATCACTCTTTGCATTGTTTGTCGTAGGTGTGAATTATAGCATGACTGATTGTCTTTCTTCCTGTTCATGTAGCTGGTCATTGGTACTTATCTTTACCATGAGTGGTAGTCTGTTATCTTGTTCTACAATTTGGCGTTTGCCAACTTGGTATACTGATCGTTGTAGCATTGCACTCTGCTTATCTTTAGTGAAATACGTGCACTGTGTGTTCTCGAAATCAGCATTGTACTCTGCTTCTCCTGGATTAAATATGTGTTCTTGGAAGAAACACCGGACTACTTTAAGTATTGCAATATATTTTATCAACAAGGTAAATAGGTTGCATGAAAAAAATTCAGTCAGTAGCCAAATTTAGTAAATCAAATATCGAGGAGGTAATTTTCTTTCAATTGGTTTTGGATGAAGATCTATTTCAGATTAAGTACTACTCATCTTATTAACTTGTAGTTCATGATTTTTTAATTGTATTCATAGATGTTGAATATTTTTTTTCAATAATACAGGAGATAACGTGAGTCTTCATTAAAAGCTGCATGATTAGTAACTCCCAGTATAGGAACATCTTCCCAATTTGGGCACTCGCAGAGTACCGGCACCGAGTCTTGGCTGGTGGCAGCTAGTACTTATGTGTTTAGGGGCAATGAATTTGTGCAGTCTGTAGGAATCTGCAGATCATTTATTTATTTATGTATGTTCATTGTTGATGAATATATAACCCAATATGTAAAACATATAATTTTGTGAGGGGTTCCGATCTCTTTAAAACATAAATCAATGCAATTCTAGATGGACAGATAGTAGAGTTCATCAGTTTATGTCATTGATAAGAGCGACTTTTTCAGAGAGCTGTAGTAATTTTCTGTAGATATATTTCCACCAAAGGGCAAATTAGGTTAATGCCGAAAATCAAATCAATTCTTTGGATGGAAATTTCAGTATATCGAAATGTGGGCTTGCAGCAATGGTACCGTCCTATGCACAATCCAGATCAAAGCAGCGCATTGTCCCCTTTGCTGAGCTCGCGGCCACCCCTAGTTGTGCCCAACCTGCACCCGCGAGATGAAAGCCGAGTTCCCTCTAGTCTTTAACCTTCACATCCTAGTCATTGCATATTCTGCATGTGGTGGAGAAAGGCAGCAATCGACGCCTCCGTTGCAACAGCAAGTGGAGGGACGTTTTTCCGGATGCCTCACATTTCCAGCACATTGCACACCCATCTAACCCCTCCTATTGTCATGTCATTCCCATTTATCACTTTCTTCTTTCCATGTCTAAGTCTCATTTGTGTCGGTTTGGCGGCCTCAAA
TTGAGAAGCAGAGCTAGCTAAGATGGGTAGTAGGCTAAAGGAAAAGGAGTTCCCATATACTTTATATATATGTGTAAATGGTGTGGGCCCGAGTAAAGATCGTCATAGTTTCTAGTAAAAAAGAAAATATCTCCTGTGAACTACAACTGATCAATGATCTCAGTGGCAGCAGTGATATCTCAACTCATCAATTGTTTCTTGTTTCCATCTCCATGAACGTAGCAATAGACCTCAAACGAAAAAAAAA\n>URS0000F1BCF3 rRNA from 1 species \nTACGTAGGGGGCTAGCGTTGTCCGGATTCATTGGGCGTAAAGGGTGCGTAGGCGGCGCGGTAAGTCGGGTGTGAAATCTTGGAGCTTAACTCCGAAACTGCATTCGATACTGCGGTGCTTTGAGGACTGGAGAAGGAGACTGGAATTCATGGTGTAGCAGTGAAATGCGTAGAGATCATGAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTC\n>URS0000D17570 sRNA from 1 species \nTCCCAGCCGGGTTCGTGTCGCCATGGGGCAGATCGAGTGGGCCATGTGGGCCAACGAGCAGGCGCTGGCGTCCGGCCTGATCCTCATCACCGGGGGCATCGTGGCCACAGCTGGGCGCTTCACCCAGTGGTACTTTGGTGCCTACTCCATTGTGGCGGGCGTGTTTGTGTGCCTGCTGGAGTACCCCCGGGGGAAGAGGAAGAAGGGCTCCACCATGGAGCGCTGGGGACAGAAGTACATGACCGCCGTGGTGAAGCTGTTCGGGCCCTTTACCAGGAATTACTACGTTCGGGCCGTCCTGCATCTCCTGTGAGTCCCCGCCCTGCACCCCCTCTAGGGCTCAGGAGGGCTTGGAGCCGACCCTCCCCACTGTCCCACCGGCCGGGCTGCCTGGACAGGAGCCACCCCCACTTACCTCAGTGTTTTTCCAAACAAAAATTCGGGTCCCTGGCTCTGGCAGGGCCTGTGTCTGCTGTCTAGTGTGCAGGATTTGTAAGGATCCACTCCAAATCCGAGTAGCTCCGATCCGTCGCCACGGTCTGGGGTCAGCAGGCACTGCTGGGGGGTCTTGCCTGGGCTTCCTGGTAGGGTGGAGGGTTCCGTGCTGTGTGTCTGGTGGTTACTGCCGGCTGAGGCCAGGAGACCCACACGTGGCTGGTTCCTCCGAGCAAGTGCCCCAGAGCCACTAGTGTCCACATCAAGGCCGAGAACACCCAGGACCGAAACAAGCCCTGGTCCGCGCACGTCCCCTGGGTGTTCCTTGTGCTGAGACTTTGCAGCCCTGGGCCATGCACGTCCCCTTGGTCTGCAGTCTGCCTTGTCCTGAGACTTTGTGGCCTTGGCCCCCAGACCTGGGGCTCCGTTCCCCTTTCTGAGTGCCCTTCTGTGTCCCTGCCTCTCACCCGCTGTCCCCCAGGCTCTCGGTGCCCGCCGGCTTCCTGCTGGCCACCATCCTTGGGACCGCCTGCCTGGCCATTGCGAGCGGCATCTACCTGCTGGCAGCTGTGCGTGGCGAGCAGTGGACGCCCATCGAGCCCAAGCCCCGGGAGCGGCCGC\n>URS00003EB83F lncRNA from 1 species 
\nCAGATTTAGGGCAAAGTTAACACTTCAAAAATATCTCCAGTAATTGAGTAAATTGCTCATCTGTCAAATTGGCTCTTTGGCAAATTACTCTGCTTGCACATATTAATAGCCAAGCTTAGCCAACTTGAAATATGGAGATTTACTGGAAATCACAGTGAAGTGAAGAGAGAGGCAAGAGCAGAATTGAAATTCCCACCTGGCAGCAAAAGAGAGTTATGCAGAGCCTATCAGGACCCGTGTTCACACCAGCACTTAGTTTGGAGGAAGCACCTGGAGGAGATGCAGAGTCCAGATGTGCGCCCTCTGCCGGAAGCCTACTGCACCAGGACGTAGGCCTGGAGTGGCCCTTAACGCATTTGGAAATCAGTCTTCACTAAAAAAACTTCCTCCAAAATGTTCTTTAACAGCCCTTTAAAAGCCATTGTTTCAAAACAGTCCAAGGTGGTGAACAATTAATATTTTCGATTTACATGAAGACTCTGGAGTAGGAATTACCTGAGTTGGAAACTCAGTTCTACTCTATTGGTATCAGGTTGCATTCTGTATCATCATTAAAATTTTCAGAAAAACTCTC\n>URS000039DFEA rRNA from 1 species \nGAATCTAGCTTCAGGTCTGGGACAACCACTGGAAACGGTGGCTAATACCGGATGTGCCGAAAGGTGAAAGATTAATCGCCTGAAGATGAGCTCGCGTCTGATTAGCTAGTAGGTGGGGTAAGAGCCTACCTAGGCGACGATCAGTAACTGGTCTGAGAGGATGACCAGTCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTCCGCAATGGGCGAAAGCCTGACGGAGCAATACCGCGTGAGGGAGGAAGGCTCTTGGGTCGTAAACCTCTTTTCTCAGGGAAGAACACAATGACGGTACCTGAGGAATCAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATGCAAGCGTTATCCGGAATGATTGGGCGTAAAGCGTCCGCAGGTGGCTGTGTGTGTCTGCTGTTAAAGAGCAAAGCTCAACTTTGTAAAAGCAGTGGAAACTACACAGCTAGAGTGCGTTCGGGGCAGAGGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAAGAACACCGGTGGCGAAAGCGCTCTGCTAGGCCGCAACT\n>URS00007386F9 rRNA from 1 species \nGCGGCAAACGGGTGAGTAATATCTGGGAATCTACCCAAAAGAGGGGGATAACTACTAGAAATGGTAGCTAATACCGCATAATGTTGAAAAACTAAAATGGGGGACCTTTTTAGGCCTCATGCTTTTGGATGAGCCCAGACGAGATTAGCTTGTTGGTAAGGTAAAAGCTTACCAAGGCTACGATCTCTAGCTGGTCTGAGAGGATAGCCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCTATGCCGCGTGTATGAAGAAGGCCTTAGGGTTGTAAAGTACTTTCAGCGGGGAAGAAAAAAATAAAAATAATACTTTTAT\n>URS00008F63D8 tRNA from 5 species \nGTGCCCATAGCTCAGTTTGGTTAGAGCATCCGACTCATAATCGGCAGGTCCTCGGTTCAAGTCCGAGTGGGCGCACCA\n>URS00007B46A8 snRNA from 1 species \nCCCACCCTGGAAACGGCTCAGC\n>URS0000B49266 rRNA from 1 species 
\nAGAGTTTGATCATGGCTCAGATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGGTAGCACAGAGAGCTTGCTCTCGGGTGACGAGCGGCGGACGGGTGAGTAATGTCTGGGAAACTGCCTGATGGAGGGGGATAACTACTGGAAACGGTAGCTAATACCGCATAATGTCGCAAGACCAAAGTGGGGGACCTTCGGGCCTCATGCCATCAGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAACGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGCGGGGAGGAAGGCGNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNCGATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTCTGTCAAGTCGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTCGAAACTGGCAGGCTAGAGTCTTGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCGATTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAATCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCACAGAACTTNTTGGTGCCTTCGGGAACTGTGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGGTTCGGCCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGCATATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGACCTCATAAAGTATGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTAGATCAGAATGCTACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTAGCTTAACCTTCGGGAGGGCGCTTACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACCGTAGGGGAACCTGCGGTTGGATCACCT\n>URS00003BE16A rRNA from 1 species 
\nTGAACGCTAGCGGCACGCTTCATACATGCAAGTCGAGGGGCAGCATAAAGTACTTGTACTTTGATGGCGACCGGCGAACGGGTGCGTAACGCGTATGCAACTTACCTTTTACTAGAGAATAGCCAAGAGAAATTTTGATTAATGCTCTATACTCTTTTTAACTCACATGAGTTTTTAAGAAAAGCTCCGGCGGTAAAAGATGGGCATGCGTCCTATTAGCTTGTAGGTGAGGTAACGGCTCACCTAAGCTCCGATAGGTAGGGGTCCTGAGAGGGAGATCCCCCACACTGGTACTGAGACACGGACCAGACTTCTACGGAAGGCAGCAGTAAGGAATATTGGACAATGGAGGAAACTCTGATCCAGCGATGCCGCGTGAAGGAAGACGGCCCTATGGGTTGTAAACTTCTTTTATACAGGAAGAAACCTTTCCACGTGTGGAAAGCTGACGGTACTGTAAGAATAAGGATCGG\n>URS00025B9EB0 lncRNA from 1 species \nGGAGAATTGCAGTGATAAAAATGAATGTTTTACCGAGGCTACTCTACATATTTCACACAGCCCCACAGGTGATTCCGCAGGCATTTTTCAGGACACTCAAAACAGCAATCACACAATATATTTGGAGAGGGGAGAAGGCCCGCATTGGCTTTGACAAGCTCTGCTTACCAAGAAGCTGGGGAGGGTTAGCCTTGCCCGACATCAGAAAATACCACCAGGCTACAGTACTGCAGAGGCTCAAG\n>URS0001DE2DB5 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTTGAGCGCTGAAGGTTGGTACTTGTACCAACTGGCTGAGCAGCGAACGGGTGAGTAACGCGTGGGGAATCTGCCTTTGAGCGGGGGACAACATTTGGAAACGAATGCTAATACCGCATAAAAACTTTAAACACAAGTTTTAAGTTTGAAAGATGCAATTGCATCACTCAAAGATGATCCCGCGTTGTATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCGATGATACATAGCCGACCTGAGAGGGTGATCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGAAAGTCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGGTGTCGGATCGTAAAACTCGGTTGGTAGAGAAGAACGTTGGTGAGAGTGGAAAGCTCATCAAGTGACGGTAACTACCCAGAAAGGGACGGCTAACTACGTG\n>URS0001C397AE rRNA from 1 species \nGATGAACGCTAGCGGCAGGCCTAATACATGCAAGTCGGACGGGATTCAGGAGCTTGCTTCTGATGAGAGTGGCGCACGGGTGCGTAACACGTATGTAACCTACCTTTATCAGGGGGATAGCCTCTCGAAAGAGAGATTAAGCCCGCATAAAATCACAGCACAGCATTGTGTAATGATCAAATATTTATAGGATAAAGATGGGCATGCGGAACATTAGCTAGATGGCGGGGTAACGGCCCACCATGGCGACGATGTTTAGGGGATCTGAGAGGATGGCCCCCCACACTGGTACTGAGACACGGACCAGACTCCTACGGGAGGCAGCAGTAAGGAATATTGGCCAATGGGCGGAAGCCTGAACCAGCCATGCCGCGTGCAGGAAGACGGCCCTACGGGTTGTAAACTGCTTTTATACGGGAATAAACCCAGATACGTGTATCTGGCTGAATGTACTGTAAGAATAAGGATCGGCTAACTCCGTG\n>URS0000EF62B1 lncRNA from 1 species 
\nGCTGCCACCTCTCTTGACTCCCTTGTGAGGAGATCGGCTCTTGCTCCTCCTCATGCCATGACTCTTTAATTTGCGGCTGGTCGACATGCCATTGTGACAAGGCACCATCAATCATCATGTCCCTTTACCAGGAGGGCCCGTGTCATAAGCCACTATATAAAGGGAATGATGGGTGGACTGCTTTGGACAAATGGACCTGCGGTAGGAGAGAGGGACAACAGTAGGAGCAGGCAGATCTTGCTGTTTCAACCAAAACCTCATGCTGACCAGAGTTGAGGAACAGAAGAAGATGGTGAAGGCCTGCAGGTATAGGTGTTCAGCATGTCATCTGAAATATTCCCCACAGAGGCAAAAAGAAAGGAAATTATCTCTGAAAAGGAATGGGAGGACAAGTCAGCAGAATATGTCAATGTTTTGGTTGAAGAAGCTGCTTGAATCTGGGCTTTTCTGTGCCATGTGTTCTCCCAGGGCCAGCACAAAGAAGGGCTTTTGGTGCAGGCCCAAGACCACCATAATCATCATTGATTATTCCTCTCCACGCCAGTGTCTCTAAATAAACTTTCTCTTCTTTCTCTGACAAA\n>URS0002429CE1 lncRNA from 1 species \nTTTTCTTGAATGGACAATAATGCGTTTTGTGTCCAAGTTTGCAACAAAAGTTGTATTTGCTTTGGTGTTGAACATGTAAGATGGGGCCTTTTATGAAGGTGGTTGGATTTTGGTGAGGACTTCTCACAAATCCGATTCCACTTCTTTTGGGAACGTGACCCTTGTTTGCAAGGATCATGTTCAGTGACTTGCTACCAACCTCGAATTTCTTCAAGGTGTCCTTAAGTAGCAAGTTTTCCTTTTGGAGAGTTTCTAGATCATGGCATTT\n>URS0001CE0F72 rRNA from 1 species \nGGGTTGTGAGGTTAAGCGACTAAGCGTACACGGTGGATGCCCTGGCAGTCAGAGGCGATGAAGGACGTGCTAATCTGCGATAAGCGTCGGTAAGGTGATATGAACCGTTATAACCGGCGATTTCCGAATGGGGAAACCCAGTGTGATTCGTCACACTATCATTAACTGAATCCATAGGTTAATGAGGCGAACCGGGGGAACTGAAACATCTAAGTACCCCGAGGAAAAGAAATCAACCGAGATTCCCCCAGTAGCGGCGAGCGAACGGGGAGGAGCCCAGAGCCTGAATCAGTGTGTGTGTTAGTGGAAGTGTCTGGAAAGGCGCGCGATACAGGGTGACAGCCCCGTACACAAAAATGCACATGCTGTGAGCTCGATGAGTAGGGCGGGACACGTGGTATCCTGTCTGAATATGGGGGGACCATCCTCCAAGGCTAAATACTCCTGACTGACCGATAGTGAACCAGTACCGTGAGGGAAAGGCGAAAAGAACCCCGGCGAGGGGAGTGAAAAAGAACCTGAAACCGTGTACGTACAAGCAGTGGGAGCACGCTTAGGCGTGTGACTGCGTACCTTTTGTATAATGGGTCAGCGACTTATATTCTGTAGCAAGGTTAACCGAATAGGGGAGCCGAAGGGAAACCGAGTCTTAACTGGGCGTTAAGTTGCAGGGTATAGACCCGAAACCCGGTGATCTAGCCATGGGCAGGTTGAAGGTTGGGTAACACTAACTGGAGGACCGAACCGACTAATGTTGAAAAATTAGCGGATGACTTGTGGCTGGGGGTGAAAGGCCAATCAAACCGGGAGATAGCTGGTTCTCCCCGAAAGCTATTTAGGTAGCGCCTCGTGAATTCATCTCCGGGGGTAGAGCACTGTTTCGGCAAGGGGGTCATCCCGACTTACCAACCCGATGCAAACTGCGAATACCGGAGAATGTTATCACGGGAGACACACGGCGGGTGCTAACGTCCGTCGTGAAGAGGGAAACAACCCAGACCGCCAGCTAAGGTCCCAAAGTCATGGTTAAGTGGGAAACGATGTGGGAAGGCCCAGACAGCCAGGATGT
TGGCTTAGAAGCAGCCATCATTTAAAGAAAGCGTAATAGCTCACTGGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTAAACCATGCACCGAAGCTGCGGCAGCGACGCTGATGCGTTGTTGGGTAGGGGAGCGTTCTGTAAGCCTGCGAAGGTGTGCTGTGAGGCATGCTGGAGGTATCAGAAGTGCGAATGCTGACATAAGTAACGATAAAGCGGGTGAAAAGCCCGCTCGCCGGAAGACCAAGGGTTCCTGTCCAACGTTAATCGGGGCAGGGTGAGTCGACCCCTAAGGCGAGGCCGAAAGGCGTAGTCGATGGGAAACAGGTTAATATTCCTGTACTTGGTGTTACTGCGAAGGGGGGACGGAGAAGGCTATGTTGGCCGGGCGACGGTTGTCCCGGTTTAAGCGTGTAGGCTGGT\n>URS00003281C0 rRNA from 1 species \nCTACGTGCCAGCAGCCGCGGTAATACGTAGGTCCCGAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGTTAGATAAGTCTGAAGTTAAAGGCTGTGGCTTAACCATAGTACGCTTTGGAAACTGTTTAACTTGAGTGCAAGAGGGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAGGAACACCGGTGGCGAAAGCGGCTCTCTGGCTTGTAACTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAGGTGTTAGACCCTTTCCGGGGTTTAGTGCCGTAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCCTCTGACCGCTCTAGAGATAGAGCTTTCG\n>URS00016D14C4 rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAATGGATTGAGAGCTTGCTCTTATGAAGTTAGCGGCGGACGGGTGAGTAACACGTGGGTAACCTGCCCATAAGACTGGGATAACTCCGGGAAACCGGGGCTAATACCGGATAACATTTTGAACCGCATGGTTCGAAATTGAAAGGCGGCTTCGGCTGTCACTTATGGATGGACCCGCGTCGCATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCAACGATGCGTAGCCGACCTGAGAAGGTGGTCGGCCACACTGGGACTGAGAGACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCGTCCGCAATGGACGAAAGTCTGACGGAGCAACGCCGCGTGAGTGATGAAGGCTTTCGGGTCGTAAAACTCTGTTGTTAGGGAAGAACAAGTGCTAGTTGAATAAGCTGGCACCTTGACGGTACCTAACCAGAAAGCCACGGCTAACTACGTGCCAGCCGCCGCAGTAA\n>URS000090AB96 SRP_RNA from 1 species \nGCCGGGCGTGGTGGCGCATGCCTGTAATCCCAGCTACTCGGAAGGCTGAGGCAGGAGAATTGCTTGAGCCCAGGGAGCGAAGGTTGCAGTGAGCAGAGATCATGCCACTGCACTCAAACCTGGGCAACAGGGTGAGACTCTGTCTCAA\n>URS00023BAE1B lncRNA from 1 species 
\nCTGAACCCTTATCAGTAAAAGTTTATCCGGAGTCAGAGAACAGGGAATGGCACTCGACGCAAAAATCGGGCGAGGCCCAGCCCTAGATGTGGGTTCATCTACAGTGTGGGGGTTTTGGGGGACCAAACAAAGGCCCTAAAAATCCTGGAACCACTAGAGGCGGAGGTACCGAAAGATATTTCAAACAAAGGCCCTAAAAATCCTAGAAAAATCAGGCGGGATAAGAGGTGAAAGGTTTGCGGGGGACCAAACCAGAGGAATGTGGCAGAAGAAAAATGGAGGAGAAAGGGCACCT\n>URS00022ED730 rRNA from 1 species \nTGGGGAATTTTGGACAATGGGGGCAACCCTGATCCAGCAATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTTGTCCGGGAAGAAATCGCACCTGATAATACCGGGTGTGGATGACGGTACCGGAAGAATAAGGACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTCGGGTCCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTGTGCAAGACCGATGTGAAATCCCCGGGCTTAACCTGGGAATTGCATTGGTGACTGCACGGCTAGAGTGTGTCAGAGGGGGGTAGAATTCCACGTGTAGCAGTGAAATGCGTAGAGATGTGGAGGAATACCGATGGCGAAGGCAGCCCCCTGGGATAACACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGG\n>URS00010F344E rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTAGGACGCAGTTGCGAACGGGTGAGTAACGCGTAGGTAACTACCTATTAGAGGGGGATACCTATTGGAAACGATAGCTAATACCGCATACCTGTAGATGGATCTGCGTTGTATTAGCCAGGAGGTAGGGTAATGGCCTACCTAGGCAACGATACATAGCCGACATGAGAGGATGATCGGCCAGACGGGGAGTGCGGCACGGCCCAGACTCCTACGGGTGGCAGCAGTAGGGAATCTTGGGCAATGGGGGGAGCCCTGACCGAGCAACGCGGCGTGAGTGAAGAAGGTCGTCGGATGGTAAAGCTCTGTTGTTAAGGGAGCGGTACTTAAAGAGAAAGGGACGGCTAACTACGTGCCAGCAGCCGCGGTAATAC\n>URS0001F774E1 misc_RNA from 1 species \nGATGAAGAACGCAGCGAAATGCGATACTTGGTGTGAATTGCAGAATCCCGTGAACCATCGAGTCTTTGAACGCAAGTTGCGCCCGAAGCCATTAGGCCGAGGGCACGCCTGCCTGGGCGTCACACGTCGTTGCCCCCCCATCTACTCCTTCGGGATTGCGGGGGGCGGATGATGGCCTCCCGTGCGCCTCGCCGCGCGGTTGGCATAAATGCCAAGTCCTCGGCGACGCACGCCACGCCAATCGGTGGTTGCGAAACCTCGGTTGCCCGTCGTGTGCGGTCGTCGCGCATCGAGGGCTCGAAAAAATTGCCGGGTTCCGGCTCGGCTTTCAACGCGACCCCAGGTCAGGCGGGGTTACCCGCTGAATTTAAGCATATCAATAAGCGGAGGA\n>URS000076AF46 rRNA from 1 species 
\nGGTTAAGCGACTAAGCGTACACGGTGGATGCCCTGGCAGTCAGAGGCGATGAAGGGCGTGCTAATCTGCGATAAGCGCCGGTAAGGTGATATGAACCGTTATAACCGGCGATACCCGAATGGGGAAACCCAGTGTGACTCGTCACACTATCATTAACTGAATCCATAGGTTAATGAGGCGAACCGGGGGAACTGAAACATCTAAGTACCCCGAGGAAAAGAAATCAACCGAGATTCCCCCAGTAGCGGCGAGCGAACGGGGAGGAGCCCAGAGCCTGAATCAGCATGTGTGTTAGTGGAAGCGTCTGGAAAGGCGCGCGATACAGGGTGACAGCCCCGTACACAAAAGCGCATGTGCTGTGAGCTCGATGAGTAGGGCGGGACACGTGGTATCCTGTCTGAATATGGGGGGACCATCCTCCAAGGCTAAATACTCCTGACTGACCGATAGTGAACCAGTACCGTGAGGGAAAGGCGAAAAGAACCCCGGCGAGGGGAGTGAAAAAGAACCTGAAACCGTGTACGTACAAGCAGTGGGAGCCCCACCACCAAAGCATTCTCTGGTGTTGAAGGCCCTGCAAAGCAGCATCGCGGTGGCGGAGCGTCGTTTGCGACGCCCAACACACAAAACAAGCGGTGAATGCTTTGGGGTGGGGTGACTGCGTACCTTTTGTATAATGGGTCAGCGACTTATATTCTGTAGCAAGGTTAACCGAATAGGGGAGCCGGAGGGAAACCGAGTCTTAATTGGGCGTTAAGTTGCAGGGTATAGACCCGAAACCCGGTGATCTAGCCATGGGCAGGTTGAAGGTTGGGTAACACTAACTGGAGGACCGAACCGACTAATGTTGAAAAATTAGCGGATGACCTGTGGCTGGGGGTGAAAGGCCAATCAAACCGGGAGATAGCTGGTTCTCCCCGAAAGCTATTTAGGTAGCGCCTCGTGAATTCATCTCCGGGGGTAGAGCACTGTTTCGGCTAGGGGGCCATCCCGGCTTACCAACCCGATGCAAACTGCGAATACCGGAGAATGTTATCACGGGAGACAC\n>URS0001199C7A rRNA from 1 species \nTACGTAGGGTGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTCTGTCGCGTCTGCTGTGAAAACTCAGGGCTTAACCCTGAGCTTGCAGTGGGTACGGGCAGACTAGAGTGCGGTAGGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCATTTCCTGACGCTGGAGGCGCGAAAGCGTGGGGAGCAAACAGG\n>URS0000FE9A33 rRNA from 1 species \nTACGGAGGGTGCAAGCGTTATCCGGATTCACTGGGTTTAAAGGGTGCGTAGGCGGGTTGGTAAGTCCGTGGTGAAATCTCCGAGCTTAACTCGGAAACTGCCGTGGATACTATCAATCTTGGATATCGTGGAGGTAAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCAATTGCGTAGGCAGCTTACTACACGATCATTGACGCTGAGGCACGAAAGCGTGGGGAGCAAACAGG\n>URS0001565352 rRNA from 1 species \nAACGTAGGAGGCGAGCGTTATCCGGATTCACTGGGCGTAAAGCGCACGTAGGCGGTCGGGTAAGTCGGATGTTAAAGCCCTTGGCTCAACTAGGGGAGGTCATTCGATACTGCTCGGCTTGAGGATGAGAGAGGAAAGTGGAATTCCCGGTGTAGCGGTGGAATGCGTAGAGATCGGGAGGAACACCAGTGGCGAAAGCGGCTTTCTGGCTCATTCCTGACGCTGAGTGTGCGAAAGCGTGGGTA\n>URS000144CD04 rRNA from 1 species 
\nCAGTCGCCGCGGTAATACGAAGGGTGCAAGCGTTACTCGGAATTACTGGGCGTAAAGCGTGTGTAGGTGGTTGTTTAAGCCTGTCGTGAAAGCCCTGGGCTCAACCTGGGAATTGCGATGGATACTGGGCGACTAGAGTGCGGTAGAGGATAGTGGAATTTCCGGTGTAGCAGTGAAATGCGTAGAGATCGGAAGGAACATCTGTGGCGAAGGCGACTATCTGGGCCAACACTGACACTGAGACACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCGTGTAGTCCCTGTCTCTTATAA\n>URS00000D01ED rRNA from 1 species \nAGGATGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGTCCTGTCTCGCAAGAGGCAGGGAGTGGCGGACGGGTGAGTACCACGTGGGTTATCTACCGTGAGGTGAGGAATACCGGCGAGAAATCGCCGACAAGACCGCATAGCCTCGGTGCAAGCCGAGGAAAGCTTTCTCGAGAGAGGGAGCGCCACACGAGGAGCCTGCGCCCGATTAGCTAGCTGGTGGAGTAACGGTTCACCAGGGCGACGATCGGTAGCTGGTCTGAGAGGACGATCAGCCACACTGGGATTGAGAACGGCCCAGACTCCTACGGGGGGCAGCAGTGAGGAATTTTCGTCAATGGGGGCAACCCTGAACGAGCAACGCCGCGTGCAGGAAGAAGGTTTTCGGATCGTAAACTGCTTTTCTCGGGAAGAGAACGGACGGTACCCGAGGAATCAGCCCCGGCTAACTACGCGCCAGCAGCCGCGGTAA\n>URS0002347B5A lncRNA from 1 species \nTTCTATGTAAGTATACTTCCGGGGTCTTGCCTCCCTTCTGCCCTGATTCTTCCCTTGTGGGTGTGCTGTCCGCATGCGCAGTGGCCTGCTAGCCCTTGGAAAGGAAGCATACGCAGTGTTTACTGGAGTTGTACGCATGCTCACTCCAGGCGTTCTTCCCTTACCTGCCGAATGTCCCTAGGAGGTCATATACCAGTTAAACTGCCCCATTTTGCCTCTTAGTGTACATTGTGAGCCCACTCAACCAGTTCCTGAGATACTACTGGGAAGCTGCTGATCACCAGTTTCAGGTTTTTTCCATCTGTTGGGAAACTGCCTATCCCTTGTGCTCGCTGCAACCAATTATTATTTTAGGGAGACAGTTAACCGCCTGACCATCACCCGATGATCGCCTGATGTTCATGCATCCATGACTACATAAACTTTTTGGCCGTTTGACCAAATGGGGACATCTGGCATACTGCTATCAACCAATATCACTTACTATGTCATAGGCACTGAACCACAAGCCTTCTGCAGGAATGATCTCATTTAATTCTTACAGCAATCCTATGAGATAAGTAGTACTGATATTACCATTTTACTAATTAGAAACTTGAAGCTTGGCGAGGTTAAATAATATGTCCAAAGTTGCAGAATGATTCAGTAGCAGAGGCTCATTGAGGGGCAAACAAGATCAATCCAATCCCATTCCTGTGTGAAGAAGACAGACATTAAACAATTAACCAAATAAATAATTGATGATAGCTGTAATGAGTGCTATGACAGGTGCTGAGCCAAGGCATAACTTCTGTTCTGAGGGTTCAAGGAAAGCATTGTTCCCTGACAAAATGACATTCAGTCATGGACTCCCACAGTGCTTAGGAGCTGGCAAGGCAAAGGCTTGGGTAGGATGGTTGGGATGAAAGTAAGAATGAGGAGTGAACAGTATTCTAGCTGGGAGGGTCCAAAGTGGGAAGGGGCATGGCAGACCATGGAACTGAGAGAAGGCCAGCAGGCAGGCTGCAAAGAGGGTGAGGGAGGAGGCAGCACCAGATGAGATTGGAAAGCCAGGTTGGGGTGTCATGATAGAGGCTTTGTAGCCATGAGAAAATGTTGGGCCAGGCCAGGTGTGGTGGCTCACACCTG\n>URS000084
D716 rRNA from 1 species \nTACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTTTTTAAGACAGATGTGAAATCCCCGGGCTTAACCTGGGGACTGCATTTGTGACTGTAAGACTAGAGTGCGGCAGAGGGGGGTAGAATTCCACGTGTAGCGGTGAAATGCGTAGATATGTGGAGGAATACCGATGGCGAAGGCAGACCCCTGGGTCGACACTGACGCTGATGCGCGAAAGCGTGGGGAGCAAACAGG\n>URS0000CD773A rRNA from 1 species \nTACGTAGGGTGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTTTGTCGCGTCTGCTGTGAAATCCCGAGGCTCAACCTCGGGTCTGCAGTGGGTACGGGCAGACTAGAGTGTGGTAGGGGAGATTGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCAGATCTCTGGGCCATTACTGACGCTGAGGAGCGAAAGCATGGGGAGCGAACAGG\n>URS00011E7DCB rRNA from 1 species \nTACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTTGTTAAGACAGATGTGAAATCCCCGGGCTTAACCTGGGAACTGCATTTGTGACTGGCAAGCTAGAGTATGGCAGAGGGGGGGTAGAATTCCACGTGTAGCAGTGAAATGCGTAGAGATGTGGAGGAACACCGATGGCGAAGGCAGCCCCCCTGGGTCAAGATTGACGCTCATGCACGAAAGCATGGGGAGCGAACAGG\n>URS00002D8EF0 rRNA from 1 species \nAGCGGCGAACGGGTGAGTAACGCGTGAGCAACCTACCTTAGTTACTGGGATAGCCCGAGGAAACTCGGATTAATACCGGATATTCTTATTTAATCACATGATTTTCTAAGGAAAGGTCAGCCGAACTAAGATGGGCTCGCGTTCTATCAGCTAGTTGGTAGGGTAACGGCCTACCAAGGCTACGACGGATAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCTGCAGCAGGGAATATTGTGCAATGAACGAAAGTTTGACACAGCGACACCGCGTGTGGGATGACGGATCTAGGTTTGTAAACCACTTTCAGGAGGGAAGAAAACGACGGTACCTCCACAAGAAGCCCCGGCCAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGTTCAACAAGTCGGTCGTGAAAGTTCAGGGCTCAACCCTGAAATGTCGATCGATACTGTTGTGACTAGGATACGGCAGAGGTGAGTGGAATTCCGAGTGTAGCGGTGAAATGCGTAGGTATTCGGAGGAACACCAATTGCGAAGGCAGCTCACTGGGCCGCTATCGACGCTGAGGAGCGAAAGCTAGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCTAGCTGTAAACGATGGATACTAGATGTAGGAATTGGTTTAACGATTTCTGTATCGTAGCTAACGCGTTAAGTATCCCGCCTGGGGAGTAC\n>URS0000C7CC16 tRNA from 1 species \nTCTCTGGTAGTCCAGTGGCTAAGGCATTGCACTGCCAATGCAGGGGACCCAGGTTCGATCCCTGGTCTGGGAA\n>URS00000379BF rRNA from 1 species 
\nGGCTTTTTGATAATAATTTAAAGTCTTACCTGCTCTATGATATTTTAAATGGCTGCAGTATTTTGACTGTACAAAGGTAGCATAATCATTAGTTTTTTAATTGAAAGCTGGAATGAATGGTTTGATGAAAAAATATCTGTCTTTATTTAATGATTAAAATTTTATTTTTAAGTTAAAAAGCTTAAATTTTTTTAAAAGACGAGAAGACCCTATAGAGTTTGATATTAATTTTTTTTTATTTTAAATTTAGAATAAATTTTTTAATTAATGRTGAATATTTGATTGGGGTGATTAAAAAATTAATTTAACTTTTTTTATTTTATTTCATAAATTAGTGTATATTTGATCCAAAATTTTTGATTATAAGTTTAAATTACCTTAGGGATAACAGCGTAATTTTTTTAGAGAGTTCTTATCGAAAAAAGAGATTGCGACCTCGATGTTGGATTAAAATTTATATTTGGTAGTAGAAGCTGAAATATTGGGTCTGTTCGACCTTTAAAATTTTACA\n>URS0002047E1F rRNA from 1 species \nCCTACGGGTGGCAGCAGTAAGGAATATTGGTCAATGGACGCAAGTCTGAACCAGCCATGCCTCGTGGAGGATGAAGGTCCTCTGGATTGTAAACTTCTTTTATTTGGGAAGAAACTCCCGATTTCCATCGGGCTTGACGGTACCAGATGAATAAGCACCGGCTAACTCCGTGCCAGCCGCCGCGGTAATACGGAGGGTGCAAGCTTTATCCGGTTTAAATGGGTTTAAGGTGGGCAGGGAAGGCAGTGTAGAAATCTCCGGGCTTAACCCGGAAACTGCCATTGATACTATTTGTCTTGAATACTCTGGAGGTGAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGAGATGACATAGAACACCCATTGCGAAGGCAGCTCACTACGGAAATATTGACGCTGAGGCACGAAAGCGTGGGGATCAAACAGGATTAGATACCCTTGTAGTC\n>URS000059B2B0 rRNA from 1 species \nCTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGTGGTTTAATAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGTTTAACTTGAGTGCAAGAGGGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAGGAACACCGGTGGCGAAAGCGGCTCTCTGGCTTGTAACTGACGCTGAGGCTYGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAGGTGTTAGACCCTTTCCGGGGTTTAGTGCCGTAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACTCT\n>URS00014BE65D rRNA from 1 species 
\nATTGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGATCGGTAACGCGGGGGCAACCCTGGCGACGAGAGGCGGACGGGTGAGGAACGCTTGGGAATCTGCCTATCAGCGGGGGACAACACGGGGAAACTCGTGCTAATACCGCATACGCTCTACGGAGGAAAGCCGGGGACCGCAAGGCCTGGCACTGATAGATGAGCCCAAGCCGGATTAGCTAGTTGGCGGGGTAACGGCCCACCAAGGCGACGATCCGTAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAGTATTGGACAATGGGGGAAACCCTGATCCAGCGACGCCGCGTGGGTGAAGAAGGCCTGCGGGTTGTAAAGCCCTTTCGGTAGGGACGAAAGCTCTCGACCTAACACGTCGGGAGGATGACTTAACCTACAAAAGAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATAC\n>URS00004D4C08 rRNA from 1 species \nATGCAAGTCGAACGATGAAGCCCTTCGGGGTGGATTAGTGGCGAACGGGTGAGTAACACGTGGGCAATCTGCCCTGCACTCTGGGACAAGCCCTGGAAACGGGGTCTAATACCGGATACGACCACTGAGGGCATCCTCGGTGGTGGAAAGCTCCGGCGGTGCAGGATGAGCCCGCGGCCTATCAGCTTGTTGGTGGGGTGATGGCCTACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGCGACCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCGACGCCGCGTGAGGGATGACGGCCTTCGGGTTGTAAACCTCTTTCAGCAGGGAAGAAGCGAAAGTGACGGTACCTGCAGAAGAAGCGCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGCGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGCCTGTCACGTCGGATGTGAAAGCCCGGGGCTTAACCCCGGGTCTGCATTCGATACGGGCAGGCTAGAGTTCGGTAGGGGAGATCGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGATCTCTGGGCCGATACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGTTGGGCACTAGGTGTGGGCAACATTCCACGTTGTCCGTGCCGCAGCTAACGCATTAAGTGCCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGCGGAGCATGTGGCTTAATTCGACGCAACGCGAAGAACCTTACCAAGGCTTGACATACACCGGAAAGCATTAGAGATAGTGCCCCCCTTGTGGTCGGTGTACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCCTGTGTTGCCAGCATGCCCTTCGGGGTGATGGGGACTCACAGGAGACCGCCGGGGTCAACTCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGCCCCTTATGTCTTGGGCTGCACACGTGCTACAATGGCCGGTACAATGAGCTGCGATACCGCGAGGTGGAGCGAATCTCAAAAAGCCGGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCCCATGAAGTCGGAGTCGCTAGTAATCGCAGATCAGCATTGCTGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACGTCACGAAAGTCGGTAACACCCGAAGCCGGTGGCCCAACCC\n>URS000030D236 rRNA from 1 species 
\nCATGCAGTCGGAGGTAACATTTCTAGCTTGCTAGAAGATGACGAGTGGCGGACGGGTGAGTAATGCTTGGGAACTTGCCTTTGCGAGGGGGATAACAGTTGGAAACGACTGCTAATACCGCATAATGTCTTCGGACCAAACGGGGCTTAGGCTCCGGCGCAAAGAGAGGCCCAAGTGAGATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCGACGATCTCTAGCTGTTCTGAGAGGAAGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGTTGTGAGGAAAAGTTAGTAGTTAATACCTGCTAGCCGTGACGTTAACAACAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATCACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGCTAGATGTGAAAGCCCCGGGCTCAACCTGGGATGGTCATTTAGAACTGGCAGACTAGAGTCTTGGAGAGGGGAGTGGAACTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACATCAGTGGCGAAGGCGACTCCCTGGCCAAAGACTGACGCTCATGTGCGAAAGTGTGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCACACCGTAAACGCTGTCTACTAGCTGTGTGTGTCTTTAAGACGTGCGTAGCGAAGCTAACGCGCTAAGTAGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACACTTGACATGCTGAGAAGTTACTAGAGATAGTTTCGTGCCTTCAGGAACTCAGACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTAAGTCCCGCAACGAGCGCAACCCTTGT\n>URS0000D53B79 miRNA from 14 species \nTTTATTCTCAGTTTGTTGCTC\n>URS00018E852B rRNA from 1 species \nCAGCCGCCGCGGTAATACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTATATAAGACAGATGTGAAATCCCCGGGCTCAACCTGGGACCTGCATTTGTGACTGTATAGCTAGAGTACGGTAGAGGGGGATGGAATTCCGCGTGTAGCAGTGAAATGCGTAGATATGCGGAGGAACACCGATGGCGAAGGCAATCCCCTGGACCTGTACTGACGCTCATGCACGAAGGCGTGGGGAGCAAACAGGATTAGATACCCCGGTAGTCCCTGTCTCTTATAC\n>URS0001DF4263 tRNA from 1 species \nGGGTGATTAGCTCAGTTGGTAGAGCAGGTGACTCTTAATCACCGGGTCCACAGTTCGAGCCTGTGATCACCCACCA\n>URS00007C3FF8 rRNA from 1 species 
\nTGGGGAATCTTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGAGTGAAGAAGGCCTTCGGGTTGTAAAGCTCTTTTACCAGGGACGATAATGACGGTACCTGGAGAATAAGCCCCGGCAAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGATTGTTAAGTCAGAGGTGAAATCCCGGAGCTCAACTTCGGAACTGCCTTTGATACTGGCAATCTCGAGTCCGGAAGAGGTTAGTGGAATTCCCAGTGTAGAGGTGAAATTCGTAGATATTGGGAAGAACACCAGTGGCGAAGGCGGCTAACTGGTCCGGTACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCCAGTAGTCCCTGAGCGGGC\n>URS0000D54BB5 miRNA from 15 species \nATGGGTAGCACAAGGATTAATG\n>URS000041BA98 siRNA from 1 species \nTCAACCTAGGCTCTGATA\n>URS00000BB073 rRNA from 1 species \nGGCGGTTAGATAAGTNTGAAGTTAAAGGCTGTGGCTTAACCATAGTACGCTTTGGAAACTGTTTAACTTGAGTGCAAGAGGGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAGGAACACCGGTGGCGAAAGCGGCTCTCTGGCTTGTAACTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTNCACGCCGTAAACGATGAGTGCTAGGTGTTAGACCCTTTCCGGGGTTTAGTGCCGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCCTCTGACCGCTCTAGAGATAGAGTTTTCCTTCGGGACAGAGGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATTGTTAGTTGCCATCATTCAGTTGGGCACTCTAGCGAGACTGCCGGTAATAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGCTGGTACAACGAGTCGCAAGCCGGTGACGGCAAGCTAATCTCTTAAAGCCAGTCTCAGTTCGGATTGTAGGCTGCAACTCGCCTACATGGAGTCGGAATCGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGTCGGTGAGGTAACCATTNGGAGCCA\n>URS00002C2482 rRNA from 1 species 
\nTGCGCCTTGCCAGCCCGCTCGAAACTTAAAGGAATTGACGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGCCTTGACATGCAGAGAACTTTCCAGAGATGGATTGGTGCCTTCGGGAACTCTGACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTACCAGCACGTTATGGTGGGCACTCTAAGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGGCCTGGGCTACACACGTGCTACAATGGTCGGTACAAAGGGTTGCCAAGCCGCGAGGTGGAGCTAATCCCATAAAACCGATCGTAGTCCGGATCGCAGTCTGCAACTCGACTGCGTGAAGTCGGAATCGCTAGTAATCGTGAATCAGAATGTCACGGTGAATACGTTCCCGGGCCTT\n>URS00007D10E7 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATGCATGCAAGTCGCACGCAGCACTCTTCGGAGTGCTGAGTGGCGCACGGCTGAGGAACACGTGGGCACCTGCCCGCGCGTGGGGGATAACCCGGCGAAAGCCGGGCTAATCCCGCATACGCTTGGCTCCCAATAGCCAAGCAAAGCGGCAACGCGCGCGCGGAGGGGCCTGCGGCCCATCAGGTGGTTGGCGGGGTAACGGCCCACCAAGCCGGTGACGGGTAGCTGGTCTGTGAGGACAACCAGCCAGACTGGGACTGAGAGACGGCCCAGACTCCTACGGGAGGCAGCAGCAAGGAATTTTCCCCAATGGGCGCAAGCCTGAGGGAGCAACGCCGCGTGCAGGACGACGGCCTTCGGGTTGTAAACTGCTTTTCGGAGGGACGAGAGTGACGGTACCTTCGGAATAAGCCCCGGCTAACTCTGTGCCAGCAGCCGCGGTAAGACAGAGGGGGCCAGCGTTGTCCGGACTAACTGGGCGTAAAGCGCGCGCAGGCGGTCGGAGGCGTCGGTGCTGAAAAGCTCCCGCTTAACGGGAGACGGCGTGCCGATACGCTTCGACTGGAGGGCGGGCGAGGGTGGTGGAAGTGCCGGTGTAGTGGTGAAATGCGTAGAGATCGGCTCGAACACCAGTGGCGAAGGCGGCCACCTAGCCCGCCCCTGACGCTGAGGCGCGACAGCGTGGGGAGCGAACTGGATTAGATACCCAGGTAGTCCACGCCGTAAACGATGCCGACTCGGTCTTCGTGGAGCGACAAGCTCCGGGGGGGCCCGAGCTCACGCGCTAAGTCGGCCGCCTGGGGACTACGAGCGCAAGCTTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCAGCGGAGCGTGTGGTTTAATTCGACGCAACGCGCAGCACCTTACCCAGGCTGGACATGGAGCTGCACAGCGGGGAAACCCGCTGGCCTTCGAGGGTGCTCCACAGATGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCCGCGGCCAGTTACACGTGTCTGGTCGGACCGCCCTTCGGGGAGGAAGGCGGGGATGACGTCAAGTCCGCATGGCTCTTACGTCTGGGGCGACACACACGCTACAATGACGCCGACAGTGCGAGGCGAAGGAGTAATCCGAAGCGAATCGCCAAACGGCGTCCCAGTGCAGATCGGGGGCTGCAACTCGCCCCCGTGAAGGCGGAGTTGCTAGTAACCGCGTATCAGCCACGGCGCGGTGAATACGTACCCGGGCCTTGTACACACT\n>URS00004C538B rRNA from 1 species 
\nAACGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGANCGAACCCTTCGGGGTTANCGGCGGACGGGTGAGTAACCCGTGGGAACGTGCCCTTCTCTGCGGAATAGGCTCGGGAAACTGGGTTTAATACCGCATACGCCCTTCGGGGGAAAGATTTATCGGAGAAGGATCGGCCCGCGTTAGATTAGGTAGTTGGTGGGGTAATGGCCTACCAAGCCTACGATCTATAGCTGGTTTAAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGAGGAATCTTGGACAATGGGGGAAACCCTGATCCAGCCATGCCGCGTGAGCGATGAAGGCCTTAGGGTTGTAAAGCTCTTTCAGTCGTGAAGATAATGACGGTAGCGACAGAAGAAGCCCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGACTATTAAGTCAGGGGTGAAATCCCGGGGCTCAACCCCGGAACTGCCTTTGATACTGGTAGTCTAGAGTTCGAGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAGGAACACCAGTGGCGAAGGCGGCTCACTGGCTCGATACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAATGCCAGTCGTCGGCAAGCATGCTTGTCGGTGACACACCTAACGGATTAAGCATTCCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGCAGAACCTTACCAACCCTTGACATCCTGATCGCGGTTACCCGAGAGGGTTCCCTTCAGTTCGGCTGGATCAGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTCGGTTAAGTCCGGCAACGAGCGCAACCCACACCCTTAGTTGCCAGCATTCAGTTGGGCACTCTAGGAGAACTGCCGATGATAAGTCGGAGGAAGGTGTGGATGACGTCAAGTCCTCATGGCCCTTACGGGTTGGGCTACACACGTGCTACAATGGCAGTGACAATGGGTTAATCCCCAAAAACTGTCTCAGTTCGGATTGTTCTCTGCAACTCGAGAGCATGAAGTCGGAATCGCTAGTAATCGCGTAACAGCATGACGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTTGGGTTTACCCGAAGACGGTGCGCCAACCCTTACGGGGGGCAGCTGGCCACGGTAAGCTCAGCGACTGGGGTG\n>URS0000D271BB rRNA from 1 species 
\nGAGGAGAGCTTGCTCTCTGATTTAGCGGCGGACGGGTGAGTAATGTATAGGGAGCTGCCCGATAGAGGGGGATACCAGTTGGAAACGACTGTTAATACCGCATAATGTCTACGGACCAAAGTGTGGGACCTTCGGGCCACATGCTATCGGATGCACCTATATGGGATTAGCTGGTTGGTGGGGTAATGGCTCACCAAGGCGACGATCCCTAGCTGGTTTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGCGGGGAGGAAGGGGATGTGGTTAATAGCTGCGTCTTTTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGTATGTTAAGTTGGATGTGAAAGCCCCGGGCTCAACCTGGGAATTGCATTCAAAACTGGCATGCTAGAGTATGTGAGAGGGGGGTAGAATTCCAAGTGTAGCGGTGAAATGCGTAGAGATTTGGAGGAATACCAGTGGCGAAGGCGGCCCCCTGGCACAATACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCTACTA\n>URS0000CC6E85 SRP_RNA from 1 species \nGCCAGGAGAGGTGGCTCGTGCCTATAGTCCCAGTTATTTGGGAGGCTGAGGTGGGAGGATTGCTTGAGCCCAGAAGTTCTGGGCTGTAGTGCGCTGTGCCGATTGGGTGTCTGCACTAAGTTCAGCATCAATATGGTGACCTCCCGGGAGCGGGGAGCCACCCAGAGGGGTGAAACTAAGGAGGCATGAACCAGCCCAGGTTGGAAACGGAGCAGGTCAAAACTCCCGTGCTGATGAGTGGTGGGATCATGCCTGTGAATAGCCACTGCACTCCAGCCTGGGCAACATAGTGAGACCCCGTCCCC\n>URS0001C732DD rRNA from 1 species \nAACGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGAGACCTTCGGGCCTAGTGGCGCACGGGTGCGTAACGACTGGGAACTTGCCCTTGGGTTCGGAATAACTCCCCGAAAGGGATGTTAATACAGGTTAATGTCTTAGGGCCAAAGATTTATCGCCTTTGGATGGGGCCGCGTTGGTTTGGCCAGTTGGTAGGGTAAAAGCCTACCAAGGGGACGATCCTTAGCTGGTGGGAGAGGAGGCTCAGCTACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGGAGGAGTAGGGAGTATTGGGCGATGGGCGAAGGCCTGATCCAGCAATGCCGGGTAAGTGATGAAGGCGTTAGTGTTGTAAAGCTCTTTTAGCCGGGATGATAATGACAGTACCGGGAGAATAAGCTCCGGCTAACTCCGTG\n>URS0000BDC546 lncRNA from 1 species 
\nGAACTTCCTACAGTCTGAACTGGCTGTCCTCGCTTTGTTTGTAGACAGCCACGGACATGAGTTAGGAGAGGAAGACTCGGAGGGATCACTGGCCCCAAGTGGAAATCGAGGAACCTTCCCGACCCAGGAGGGCCCCGAAGAACTCGAGGAGCAGGACTGCGGAGAACAACGGGCTGGGAGGTGCGAGCCCGCCGAGGGCCTCTTCCTGACCTCCCGTCAGGTGAGGGGTCACGGTCCTGGCTGGCATGAGTTTCTCTCAGGTCCTGGCTCACGGCTGCTCTACAGGTGCACTTTCCCGGGCTTATCCTGTCACTAGACATCTGGGCTATGACAAGAGCAGGACCTCCCGGTAGGAAGACAGAGCAGGACACAGGAGCCGGGAGCCAGCGTGAAGGGAGGAGGCAGTGAGCTGAAAGGGGTAAGGCCCTTGGCAGCGCATCAGCGTTTCTCAG\n>URS0000DCD19B rRNA from 1 species \nAACTTAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGTATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCCGGAGACCCTTAGGAAACTAGGGGGTGCTTCCATCTGGAAGAATCTGGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTGCTTCCAGTTACCATCATTAAGTTGGGGACTCTGGAAGGACCGCTGCGGTAACAACGCAGAGGAAGGTGGGGACGACGTCAAGTCAGCACGGCCCTTACGTCCAGGGCTACACACGTGCTACAATGGTCGGTACAAAGGGTTGCCAAGCCGCGAGGTGGAGCTAATCCCATAAAACCGATCGTAGTCCGGATCGCAGTCTGCAACTCGACTGCGTGAAGTCGGAATCGCTAGTAATCGTGAATCAGAATGTCACGGTGAATACGTTCCCGGGCCTT\n>URS000122ED6C rRNA from 1 species \nTACGAAGGGGGCTAGCGTTGCTCGGAATCACTGGGCGTAAAGGGTGCGTAGGCGGGTCTTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGAAGATCTTGAGTCCGGAAGAGGAGAATGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAGGCGGCTCTCTGGGACGGTACTGATGCTGAGACGCGAAAGCGTGGGGAGCGAACAGG\n>URS000217E4C6 lncRNA from 1 species 
\nAACAGCTCTCCCCATCCCCGACTTGCTGAGCAGCCCTGGGCAGTCTACTCTACAGCTCTCGACCTCCCTGAGGTCCATCTAGGGAGGACACAGGGACAATAATTCAAACAAATGCTTTCACGTCGGTCTGAGCTAACAGAGGGGGTGACTGGGGTGGGGGCCCCCTGGGGAGAGAAGGAGGGAATGGAGAAGCCTTCCCAGTGTCCAGAGTCACCACTTATTTCAGAGACGCTGGCTTCTGTGGGCCACCCAGATCTTCCTTCTCCTCTTCAGTGAATGACAGGCGGGGACCAAAGTCCCATCGAGCCAGAAGGGTCATTTGATAGTCCCATTCTCTATTACTGGTGCCTTTACAGGTGAAAAACTAGCCCAGCTCCCACTTACCCAAGAACACATCACAGGCCTTCCAATGTCTCTAAGCACTGCCGGGGCCCCAGGGCCTGATCGAGAGGGCAGGCCCTGCGGATGGCCGTCCACCACAGGGGAACCTTAGGGACTGTCTATGGAAACTGAAAAGAGCCACTGGCACCTGTCTTTGTCCAGCGAAGAAGGGAGATGAGCGGCCCCACCCAGCCCTTAGAGCTGCTTTCCTTCCCTTCCCCCACAGCCCGTGCCCTGACCCGGGGTGAGGGCTGCCCTGGGGCCTGGGCGCCGGCCTGCTCTTTGCCTGTGTGTGCCTGCGAGTGGGAGACGGAGAGAACACTTGGGAGCGAGTCTTTCCTTCCTGAACTTCTATTTCCTCAACTATTAACAAGGAAATTGCATTAGGTGATCTGTGGGTCAGGGCTTCCTCCTCTCCAGGAGGAGGATGTTCTAGTCTTTTCTCGCTGCACGCAGTCCTGAGCTCCACTGCAGAGAGAAACCGAGAGCAGAACGTTCATTCCTAAGAGTGAGGTGTCCAGTGCCCAGCTCTCCCTGGCTTTCCTGCTTGGAAAAGGCAGAGGAGAATGGCTTACAAACGCCAAAACCTGGCCGGCGATCATGCTGTGGTTTGCAGAGAATTAGAAGGCATTGTGGATCTCGCAAGGTGTTTGTAGCCAGAGCAGAAATGCCTTGGCAGGAGAAGCCAGGCGCACCAGCCCAGCCTCGTGGGTGGGCCTCTCTGTTGGCCACCGGACAGGGGCTGCCAGGACGTTTCTTGCCCCCAGCTGCCCTAAAGTCATGAGAGAAAATGGGTCAGACTGCAGAGGCTTATCCTTCTGGGACTCAGCTTTACTGCCCTGTGGCTCCAAGAGAAATGAAGAATATTAATCAGAAATTAAAAAAAAAAAATCAGCTCCATCAAAGGCCCCAAACTAGGCAAAAGGTTGAAGAATCTGCTCTCTGCTTGTATCTCTCTGTCTAGAGGGTATCCTCCCAGCAACAGCTTGTAGGGATGCTGTTATGGGCCCTTCTCCCAAATCCATATATCCTAACCCCTAATACTTCAGATGTGACTATGTTTGGAGATATGGTCTTTACAGAGGCAATTACATTAAAATGGAGTAACTAGGGTGAGCTCGAATCCAGCAGAACTGTAGTCTTTATCAGAAGGGAACATTTGCCTGCGGACGCACATGGAGGAGAGACACCAGGAGAAGATGGGCGTCCCCAGCCAGGGAGAGCGGGCCGGGGTGGATTCTTCCTTTGCACCCTCAAAAGGAGCCCACCCTGCCAACGCTGTGATTGTGGACCTCTAAGCTCTGCTGTTTAAGCCACCCAGTTTGTGGCACTTTGTTAGAGCAACTCTAGCAAATTTCTCCAGATGCTGCTCTGTTGGGAGGTCTGCACAACCTTGAGACTGCCTGGACTCAGAAGAATGAGTCCGCATGAGGGGAAGGGTTCTGCCCTTGCAGTGCAGCCTTATTTTAACATGAAACAAAACTGATCTATTACTCTCTTCCCTCAGAGCCTAGTCTTTTAAATTTTTTATTTCTTTTGGTATTGGTTTAACACGTTTTATTGTTTTAATCCCTTTAGTCTTTTTATTTTGTGAGTTTAATGAGTTTACTTATCTCA
GTCATTTTTTAATCCCGTTTTTTCTTTCTTCTAGCTATTTTATACTATGTCTTTTATCTCATCTTCTAGATCTTTTGGTATTATATTTTTATTTTCCGTCTGTTATTTCTAACCCTTTGCCTTATCGTGCCTTTGTTCCATCTTTTAATTTCTTTTTAGCTTATTTTTTTTATTTTTAGTTCATATTGTCGCTTGCCTGCTGCCTTTTTTTTTAACTACTTTTTATTTCTTC\n>URS000185AE94 rRNA from 1 species \nGACGGAGGGTGCTAGCGTTGTTCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGCCTTGCAAGTCGGTTGGTGAAAGCCCGGGGCTCAACCCCGGAGGTGCGGCCGAGACTGCAGGGCTGGAGGCCGGAAGAGGAGGGTGGAATACCCAGTGTAGAGGTGAAATGCGCAGATATCGGGAGGAACACCAGTGGCGAAGGCGGCTATCTGGACGGTTTCTGACGCTAAGACGCGAAAGCGTGGGGAGCAAACAGG\n>URS00013B9BDC rRNA from 1 species \nTACGTAGGGGGCTAGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGCTCGGTAAGTCCGCTGTGAAAGTCGGGGGCTCAACCCTCGAATGCCGGTGGATACTGTCGAGCTAGAGTGCGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCAATTGCGAAGGCAGCTCGCTGGGACGTCACTGACGCTGAGACGCGAAAGCGTGGGGAGCAAACAGG\n>URS00021EA825 tRNA from 1 species \nGCCGAGATAGCTCAATGGTAGAGCAACCGCCTTGTAAGCGGTAGGTTACGAGTTCAAGTCTCGTTCTCGGCT\n>URS0001B16A08 rRNA from 1 species \nACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCTACTAGCCGTTGGAAGACTTGATCTTTTAGTGGCGCAGCTAACGCGATAAGTAGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGACGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTGAGAATCCTTTAGAGATAGAGGAGTGCCTTCGGGAACTCAGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTGCCAGCACGTAATGGTGGGAACTCTAAGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTACGACCTGGGCTACACACGTGCTACAATGGCCAGTACAGAGGGCTGCAAACCCGCGAGGGAGAGCCAATCTCACAAAGCTGGTCGTAGTCCGGATCGCAGTCTGCAACTCGACTGCGTGAAGTTGGAATCGCTAGTAATCGTGAATCAGAATGTCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTGGCTAGTCTAACCTTCGGGGGGACGGTCACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAGCCCTAGGGGAACCTGGGGCTG\n>URS000113661D rRNA from 1 species 
\nGCAGCAGCCGCGGGAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTCTGTCAAGTCGGATGTGAAATCCCTGAGCTTAACTTAGGAATTGCATTCGATACTGGGAAGCTAGAGTATGGGAGAGGATGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGATGGCGAAGGCAGCCATCTGGCCTAATACTGACGCTGAGGTACGAAAGCATGGGGAGCAAACAGGATTAGATACCCCTGTGTCCCTGTCTCTTATACA\n>URS000018AC20 rRNA from 1 species \nATTGAACGCTGGCGGCATGCCTTACACATGCAAGTCGAACGGTAACGGGCCTTCGGGTGCCGACGAGTGGCGAACGGGTGAGTAATGCATCGGAACGTACCTTTCAGTGGGGGATAACGTAGCGAAAGTTACGCTAATACCGCATATTCTGTGAGCAGGAAAGCAGGGGATCGCAAGACCTTGCGCTGATTGAGCGGCCGATGTCAGATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCGACGATCTGTAGCGGGTCTGAGAGGATGATCCGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAAATGGGGGCAACCCTGATCAGCCATGCCGCGTGAGTGAAGAAGGCCTCGGTT\n>URS0001022610 rRNA from 1 species \nCAGTAGCCACGGGAATACGAAGGGGGCTAGCGTTGTTCGGATTTACTGGGCGTAAAGCGCACGTAGGCGGATCGATCAGTCAGGGGTGAAATCCCAGAGCTCAACTCTGGAACTGCCTTTGATACTGTCGATCTGGAGTATGGAAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAGGAACACCAGTGGCGAAGGCGGCTCACTGGTCCATTACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCCCGTAGTCCCTGTCTCTTATAC\n>URS0000FD5F85 rRNA from 1 species \nCCTACGGGCGGCAGCAGTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCGACGCCGCGTGAGGGATGAAGGTCTTCGGATCGTAAACCTCTGTCAGCAGGGAAGAACGGTCACTGTGCTAATCAGCAGTGAATTGACGGTACCTGCAAAGGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATTATTGGGCGTAAAGCGCTCGTAGGCGGTATGTCAAGTCAAGGGTGAAATCCCCGCGCTCAACGTGGGAACTGCCTTTGAAGCTGGCAAACTGGAGTGTGTGAGAGGATAGTGGAATTCCAGGTGTAGGAGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGACTGTACCTGACGCTGAGGCGCGAAAGCGTGGGTAGCGAACGGGATTAGATACCCCAGTAGTC\n>URS000184CF18 rRNA from 1 species 
\nAACGAACGCTGGCGGCATGCCTAACACATGCAAGTCGAACGTGAAGGGGACTTCGGTCCCTGGAAAGTGGCGCACGGGTGAGTAACACGTGGATAATCTACCCGATGATCTGGAATAACACTTCGAAAGGGGTGCTAATACCGGATGAGCTTACGACGTCTTCGGACGACGCGGGAAAAGGGGGCTTCGGCTCCTGTCATCGGATGAGTCCGCGGCCCATTAGCTAGTTGGTAGGGTAATGGCCTACCAAGGCTACGATGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGCGCAATGGGCGAAAGCCTGACGCAGCAATGCCGCGTGAGTGATGAAGGCCTTCGGGTCGTAAAGCTCTGTCAGAGGGGAAGAAACTCCCGTCGGTTAATACCCGGCGGGCCTGACGGTACCCTCAAAGGAAGCACCGGCTAACTCCGTGCCAGCCGCCGCAGTAAAAC\n>URS00020C60CA rRNA from 1 species \nGACGAACGCTGGCGGCGCGCTTAACACATGCAAGTCGAACGGAAAGGCCTGCTTTCCCTTGTGGATTGCGGGTACTCGAGTGGCGAACGGGTGAGTAACACGTGAGTGATCTGCCCCCAACTTGGGTATAAGCCTGGGAAACTGGGTCTAATTCCCGATAGGACTGCAGGGTGGTGCCGGTGGTGGAAAACGATTTTCTAGTGGTGGGGGATGAGCTCGCGGCCTGTCAGCTTGTTGGTGGGGTAGGGGCCTACCAGGGCGGCGACGGGTAGCCGGCCTGGGAGGTGGGCAGGCGAAATCGGGCCTGATATAGGGCGGAGACTCCGGGGGGAGGCATCAGTGGGGGGGATGGCACAATGGGCGGAAGCCTGATGGGGGGACGCCGGGTGCGGGGTGACGGACTTCGGGTTGTAGGCGGGGATCCCCTGTGGTGGAGAGGGTGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTG\n>URS00023F918D lncRNA from 1 species \nCCATACATGTACCACTGCTACATGGTGCAGTAAATTCAACACACAACCTACCCCTTAAACCCTATGAGTTACAACATAGGCACCTGCACTATCAACTTCTCATGACTACTAACGAACATGTCACACAAGCATACAAGTTCAATGGAATACTTATAATAGGATTCTAAGCTCACATTGTCATAATAGTTACCATACATGTCATTCATATTATCAAGAAGATAAATACACATCTATATCACAATAAGGCATCCCATACATGTAGACTAAGATATATATATTACTTGGGATAATTCACTAACTGATATTGCCTGACTAAGCCCTACTTGGTCTTTAGTAATACTAATTTTAGTATTCAAGAACGATTAAGAACATTTTGATCAAAATCAAACCTAGTAGATCAATTAGGAAGATCCGCCCACTAGATTTTCAATCCGTAAATTCCTAAGGTCCTCAAATATTACATATAATAACATATTAAAGTTTGGTAACGATCTAACGGTCGGATCATCGATTGTTATAATATTCAAGTGGTGGTCTCTAACGAAAATATGTTCAAACGACGGGATTTCATCAATCGGATGACACATATTAACTCGAGGTATTGAATTTAGCATAGAAAGATAGAGTTGGCCCACTGGTTACTCACCGCCACATGCGGCGGTTTCTGGCAAACGAAAACCCAATTTTTTGACAAACTCCAAAAAATTACCAAATTTTATAGAAATGTAGAGCAAGTCAAGGGGAATAATTTTCATACCTGGGTCAAAGTTCAATTTGGCTA\n>URS000228E004 rRNA from 1 species 
\nGCATCTCTTGAATATCAAAGGTGAGCCAGTACAGGATGGACCCGCGTCTGATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCGACGATCAGTAGCCGACCTGAGAGGGTGATCGGCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGAAAGCCTGATGCAGCAACGCCGCGTGAGTGATGAAGGCCTTCGGGTCGTAAAACTCTGTCCTCAAGGAAGATAATGACGGTACTTGAGGAGGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCTAGCGTTATCCGGATTTACTGGGCGTAAAGGGTGCGTAGGCGGTCTTTCAAGTCAGGAGTGAAAGGCTACGGCTCAACCGTAGTAAGCTCTTGAAACTGGGAGACTTGAGTGCAGGAGAGGAGAGTGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTTGCGAAGGCGGCTCTCTGGACTGTAACTGACGCTGAGGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGAGTACTAGGTGTCGGGGGTTACCCCCTTCGGTGCCGCAGCTAACGCATTAAGTACTCCGCCTGGGAAGTACGCTCGCAAGAGTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGTAGCGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCTAAGCTTGACATCCCAATGACATCTCCTTAATCGGAGAGTTCCCTTCGGGGACATTGGTGACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCTTTAGTTGCCATCATTAAGTTGGGCACTCTAGAGAGACTGCCAGGGATAACCTGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGCTTAGGGCTACACACGTGCTACAATGGGTAGTACA\n>URS0000E6547F lncRNA from 1 species \nCCATCACCAACACCATGTCCTCCCTGGTGAAGGAGCTGCACTCGGCAGAGGAAGAAGACGAAGAAGAAACAGAGAAGCTGCAGAATGGGAAGGACCGAGGTGAGGAGACAAAGCTGTCTGAGAGCTCTGCAGCATTTTCTGACTCACTCAGGGTTCTCTGGCTCCCTTTGGAGCCCCACCAGGGCCTCTGGGTGCACGTGGGTGGCTCTGGGTGCCTCTGGATCAGATGGCTCTGGACCACATGGATGGCTCTGGATCAGATGTGCTGATGGGGTTCCATGGTGACCTCAGCTGGACACGTGTCCCTGTGCTGGGTCCCATGGTGTCCCTGTGCTGGGTCCCTCAGTGTCCC\n>URS000193CF2E rRNA from 1 species \nGTAGGTGGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTCCTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGGGACTTGAGTACAGAAGAGGAAAGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATTTGGAGGAACACCAGTGGCGAAGGCGGCTTTCTGGTCTGTAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGGGATTAGATACCCTGGTAGTCCATGCCGTAAACGATGAGTGCTAAGTGTTAGGGGGTTTCCGCCCCCTTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGATACGGCCGCAAGGCTG\n>URS00011F5F41 rRNA from 1 species 
\nTACGTAGGGACCGAGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGCTTGCTAAGTCTTGCGTGAAATCTCGGGGCTCAACCCCGAGCGGTCGTGGGAAACTGGCAGGCTAGAGTGCGGGAGAGGAGAATGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTCGGCGAAGGCGGTTCTCTAGTACGGTACTGACGCTGAGACGCGAAAGCGTGGGGAGCGAACAGG\n>URS00005015FB rRNA from 1 species \nTCTTCGGGATAGGTAGTAGTTAAGGTGATGGCTTAACTAGCCAAAAATTCTCGTAGTCGAAACTGAAAGGTTGATCGACCACATTGGGTCTGAAAAAACCCCAATGCAAGTTAGTACAGCAGTGAGGAATATTGGTCAATGGCCTAACGGCTGAACTGGCAACTTGGAGAAGTGGTAAGTCTTATTTTGATTAGATTATAATATATAATCTATAAGATTGTATTAATATTGAATAAAGCTTTGTTTATATATTGATAATGACAGTATATATATCGTGTCTTGACTAATTACGTGCCAGCAGTCGCGGTAATACGTAAGAGACTAGTGTTATTCATCTTAATTAGGTTTAAAGGGTACCTAGACGGTCAATATATCTTGTAAAATGTTAGTACTTGACTAGAGTTTTATATAAGAGGGCAGTACTTGAGGAGGAGAGATGAAATTCTATTATACCAAAGGGACTCGGTAAAGGCGAAGGCAGCCCTTTATGTATAAACTGACGTTGAAGGACGAAGGCACAGAGCACAAACAGGATTAGATACCCAAGTAGTCTTTGCAGTAAATGATGAATGCCATAGGTTNAGATTAA\n>URS000156E271 rRNA from 1 species \nATTGAACGCTGGCGGCAGGCTTAACACATGCAAGTCGAGCGGAGATGAGGTGCTTGCACCTTATCTTAGCGGCGGACGGGTGAGTAATGCTTAGGAATCTGCCTATTAGTGGGGGACAACATTCCGAAAGGAATGCTAATACCGCATACGTCCTACGGGAGAAAGCAGGGGATCTTCGGACCTTGCGCTAATAGATGAGCCTAAGTCGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCTGTAGCGGGTCTGAGAGGATGATCCGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGGAAGCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTTTGGTTGTAAAGCACTTTAAGCGAGGAGGAGGCTACTGAGACTAATACTCTTGGATAGTGGACGTTACTCGCAGAATAAGCACCGGCTAACTCTGTGCCAGCCGCCGCCGTAATAC\n>URS0001EFA8A7 rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACAGACGAGGAGCTTGCTCCTCTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATATTGAACCGCATGGTTCAATAGTGAAAGACGGTTTTGCTGTCACTTATAGATAGATCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGAAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACAAATGTGTAAGTAACTATGCACGTCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTG\n>URS000127A0CB rRNA from 1 species 
\nTACGTAGGGGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGTCAGGTAGGTCCGTTGTGAAAACTCGAGGCTCAACCTCGAGACGCCGATGGAAACCATCTGACTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGACGCAGATATCAGGAGGAACACCGATTGCGAAGGCAGCTCGCTGGGACGTTACTGACGCTGAGACGCGAAAGCGTGGGGAGCAAACAGG\n>URS0000123E88 piRNA from 1 species \nTGATAAGTGTCCTCCAAATGGCCAGTGAGC\n>URS00015DB2A6 rRNA from 1 species \nTACAGGGGGTGCAAACGTTGCTCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGCTACTTAAGTCGGATGTGAAAGCCCCTGGCTCAACTGGGGAAGTGCACCCGAAACTGAGTGGCTTGAGTGCGAAAGAGGGTCGCGGAATTCCCGGTGTAGAGGTGAAATTCGTAGATATCAGGAGGAACACCGGTGGTGTAGACGGCTCACTGGACCGTAACTGACGCTGAGACACGAAAGCGTGGGTAGC\n>URS00006B5731 tRNA from 1 species \nTCCCTGGAGGTCCAGTGGTTAGGACTTGGTGCTTTCACTGCAGTGGCTGAGGTTCAATTCCTTGTCAGGGAA\n>URS0001521DBC rRNA from 1 species \nCCTACGGGTGGCAGCAGTGGGGAATATTGCACAATGGGGGGAACCCTGATGCAGCGACGCCGCGTGGGTGAAGAAGCGCCTCGGCGCGTAAAGCCCTGTCAGCAGGGAAGAAAATGACGGTACCTGAAGAAGAAGCACCGGCTACCTACGTGCAAGCAGCCGCGGTAATAAGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGGGCGCAGACGGCGATGCAAGCAAGGAGAGAAAGCCCGGGGCCCAACCCCGGGACTGCTCTTGGAACTGCGTGGCGGGAGTGCAGGAGGGGCTGGCGGAATTCCTGGTGTAGCGGTGGAATGCGTAGATATCAGGAGGAACACCGGTGGCGAAGGCGGCCTGCTGGACTGCAACTGACGTTGAGGCCCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCCTGTAGTC\n>URS0001374C98 rRNA from 1 species \nTACGTAGGGTGCAAGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTTTGTTGCGTCGGCTGTGAAATCCCGAGGCTCAACCTCGGGTCTGCAGTCGATACGAGCAAACTAGAGTGTTGCAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCGGCTATCTGGCTCACAAACTGACGATCAGGCACGGAAAGCGTGGGGAGCAAACACGG\n>URS00005F7B23 piRNA from 1 species \nTCCGAAGTCACAAGTAGGCAAAGCTGGCCTT\n>URS0000A2FBFB rRNA from 1 species \nGACGGAGGAGGCGAGCGTTATCCGGAATTATTGGGCGTAAAGCGTCCGTAGGTGGCTGAGCAAGTCTTTTGTCAAATAGTGGAGCTTAACTCCATAGAGGCGGGAGAAACTGTTTAGCTTGAGTATGGTAGGGGTAGAGGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAAGAACACCAGTGGCGAAGGCGCTCTACTGGGCCATAACTGACACTGAGGGACGAAAGCTAGGGGAGCGAAAGGG\n>URS00023F966A lncRNA from 1 species 
\nCCATTCCAATCACATCTAATGCCTCCCTCGCTCGCCAGAGGTATGCCGACTCTTGCGAGGCTGCCATTAACGAGCAAATCAAGTAAGCATCCATCCATTAAAATCAAAAGCTCCCTTAAAATTTAGATATTAACAGAGGTTGAGGTTGATTTTTGGACAGTGTGGAATACAACGTGTCGTATGTGTACCATTCAATGTACGCCTACTTTGACAGAGACAACGTTGCTCTCAAGGGTCTTGCCAAGTAACTTTTTCTTACTACTACTACTGCCTTTCAATCTTAATCTAACTAAAGCAAAAATTTAATAATATGATAAAACTTGGTTCAGATTTTTCAAGGAATCAAGTGATGAAGAAAGAGAGCACGCTGAGAAGTTTATGGAGTACCAGGTTTCCCTCTCTTTTTTCCCCATTCTAGAAGTTGAAAAGAATATTGATTTGATTTGAGGGTTAATATATGTATGGTTTATGTATATGTGTGTAGAACAAAAGAGGAGGAAGAGTGACACTCCACCCTATCGTCTCCCCTATCTCTGATTTTGAACATGCTGAAAAAGGAGATGCCTTATATGGTATATATTTTTTTTTATACTTATACAAAAAAAAAAAACACTTTCTTTCTTGATTAATAAGTGTATACACAGATCTTGAAATGGTCTTATACTAATCTATATTATTTTCAGCAATGGAATTGGCCCTGTCTCTGGAGAAACTTACCAACGAGAAGCTTCTAAACCTTCACAGAGTATGTTCCCAAAACTTATCCATCTAAAGTCAATCAAATAAGGCATTCACTAATTTTAAAATAATAATTAAAAAAAACAGGTGGCATCAGAGAACAATGACCCACAGTTAGCTGATTTTGTTGAGAGTGAGTTTCTCGGAGAGCAGGTGTGTTTTTCTTTTGTTCGTTTTCTTAACTAGTGACTTGAAACTAGTACCCACTTTTAAATAAACATATTTTTCTCTCCCCCTTAGATTGAAGCAATCAAGAAGATCTCAGACTTCATCACCCAGCTAAGGATGGTTGGCAAAGGACACGGTACGCTGTTTGATCTAAACCTCCCCTATATTCAGTACTAGGACTAGAATTTCAGTAGTAATTTTTTTAGAAAAGCTTATTAAATTTTTATGTGTCTTTTGCAGGAGTTTGGCACTTCGACCAGATGCTTCTGAACTAGAGTGGGACCTCTATAAGTTCACTTTATGCTCTGGGGAGATTAAAAGAGAAGTAAACAGAAGAAGATTCTGTAAAAGTTGCTAGAGTGGAAGTTATTATTGGAGCAAAAATAAGATTTGTAGTACTAATAGTAGTAAGCTTTGTGTGTTAAGATGATGGGTTTTTTTTTGTAATAATTTCATAAGTTTAATCTATGAAGGTGGTTTTTGTTTCATATTTTCATGTTCTGACTATATATATGAACAAACGGAGACTTGAGTCCGATTAATAGGTAGAGAAACACTCTAACTAAACGCAATGCTGCAATTCAAAAGGTGAAAGAAGAGTTAAAAAAAAATAAGGAACCTGTGGATGAAGAACATGAAGCCTCGGTCACTCAGTGAGATAACTGAAAAGCAAACAAAGAAGAGTTAAAAAGAAAAGATATATGAATTGAGACTTTAACATAAGTGCAATGCAAGTTGTTTATATTTCCAAACAGTATGTTTGATCCAGAGCTAGTATCTGATGCCCTAACTTAGATTCTATCTTGAACACTAGACTAGACAGTCTTCT\n>URS000010D699 rRNA from 1 species 
\nAGGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTGGAGCGACGAACCAGGGCTTGCCCTGGGGCAGAGCCGCGAACGGGTGAGTAACACGTGGGTTACCTGCCTCGATGACCGGGACAACCCGAGGAAACTCGGGCTAATACCGGATGTGCCCGCAAGGGGAAAGGAAGCTTCGGCCTCCGCATCGAGATGGGCCCGCGGCCCATTAGCTTGTTGGTGAGGTAACGGCTCACCAAGGCTTCGATGGGTAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGGGCAGCAGTGAGGAATTTTCCGCAATGGGCGCAAGCCTGACGGAGCAACGCCGCGTGCAGGAAGACGGTTTTCGGATCGTAAACTGCTTTTCTCGGGGACGAGAACGGACGGTACCCGAGGAATCAGCCCCGGCTAACTACGTGCCAGCAGCCGC\n>URS00002998B4 rRNA from 1 species \nGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGATGAACCGGAGCTTGCTCTGGGGATTAGTGGCGAACGGGTGAGTAACACGTGGGCAACCTGCCCCAGACACCGGGATAACCATTCGAAAGGATGGCTAATACCGGATACGACCACTTCGGGCATCCGATGGTGGTGGAAAGGATTCTGGTCTGGGATGGGCCCGCGGCCTATCAGCTTGTTGGTGGGGTAATGGCCTACCAAGGCGACGACGGGTAGCCGGCCTGAGAGGGCGACCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCGACGCCGCGTGAGGGACGAAGGTCTTCGGATTGTAAACCTCTTTCAGCAGGGATGAAGCGAAAGTGACAGTACCTGCAGAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCG\n>URS0000E6E834 lncRNA from 1 species 
\nGCAGCAGCAGCCAGCACAGTGTCTTTGGCACAGCCCAGGCAGACAGGTGGAGGAGAACTGAATCCTGCTTCTTGACAGCCCATTCTATCAGCCTTCATCTCCAACTTGTTAAATTTCCAACAAGTTGCTTCGTGCTCTCCTTTATCCACTGCCCCCAAGCATGGGAGGAGTTACTGCAAGTAGCCACAGAGCCACCTTCTGTTCTCCTGCAGCTTCCTCCTGCAAAACCCAACCACCAGTCCAGGAACACAAATATCAGCCAGAAGTGGTATGTGATTGCTTCCATCTGATTTGGAGAGGAATTGCTTTTCCAATAGTGGATGATTTGATCCAGAACTGGAGAACCAACCTGGCAGTCAGCAGCTTCATGAGACCAAATCTGACCCAGGGCCTCAGAGCTCTGCCAGCTGCAGGCAGGTGATCACAGAAGCTAGAACAGAGCAAAACAAAATTAAAAAAAATCCATGAACTAAGTGTAGAATCCATCTGAATTCAGCAAGATGGGCTGTAACAGGAGAAGTTTTATTTATTCCTTGACCTGAACTCAGCTCACACCCATCAAAGTGACAAAAGGTGATAAATATCCTTTGGGGTTCCAGGTAATTTCTTCCCTTCTGCTTTACCTGGCAGGGAATGTTTTTGGAAGATTAATGAAATACCCAGAATTTTGTGCATGTATATGTGTGTGCGTATGTGTGTATAGCTATTTATTTACTTACTTATATCTATAAACCAGCATTTTTCATGCAAACTGAGAATTCATCGACATGGTATTGTTCTTGTTGCAACCCAGGGAATTAAAGGATGCCGACAATTAATGGAATCACAGAAGTACAAGATGGTTTGGGTTGGAAGGCACCTTAAAGCTCATCTTGTTCCACCCCGTGCCCTGGGCAAGAACACCTTCCACCAGACCAGGTGGCTCCAAGCCATGGAACATACGCAGAGCTGGGGCAGACACACATGGGGGCACAAACACAGCTTCTGGTTTTTATTTCACAGTTCTGAGTTGTGGGTCTGTTTAGGAGGAAATAACCCCCCACACACACAGTAAGTGCAGGGTTTTCCAGGCCCCCTCCAAACATCCCCTGCAGGCTCCCCCTGATCATCCCTGCCAGGCCAGCAGCCCACCCCCACTGCTGTATTCAGTGGTACCAGGACACCTCCAGCTCTGTATCTGTGTCCTCCTGTTCTCAGGGAAACCCATGAGGATCAGTTTGCTTTTGTATCAAATTTACTTCTTTGCTGGTACCATTTTCTCTGCTTACTCATAAACACACCGAGCACCACAAACACTTTGGAAACTCAAATGACTCCTTACTGTGAAAACTGGGAGCAGAGCCTAACCCCCATCTGGGTGCACCCTCCTGTCAATGAGAGCAATGGGAGAGTTCTTCCAAATCAGCCCAGCTGAGCACAGGTGTTTCCTGATGTCCCTCCAAACCTGCAAGATTAATTTTCTGCCCATTTAGTCCTTGTGCTGGCAGTGGAGATGTCCTGGTCACAGTTTTTAGATGTCTTCTCTAGACTGAGGAATCAGAGTTCAGGCATAAACCACCTTCTTTTGGGACATGAGGAATAAAACTTCCATATCCGCAGCCCA\n>URS00019739F1 lncRNA from 13 species 
\nATGCAAGGTATCTGTGGAAGCCTGAAGACGCCAGAATTTTGTCTGCTTGTAATGAAGGTTTCAGGTCTTACAGATCCCTCGGCAAAGTCCATGCCCCCTAGCTACCCACAGTGTGACACTAGCGCTCTACCGTCTAGTTATGTCAGCATCACAGTAAGAATGCCCTCGCATCCGAACCATGATGGGAAATCAGCTGGCCACAGCAAGGCTGGAGAACCCTGTGTGTGCAGTCCTGCAGCACGGCCTTCTGAAGGCGCACCTCCTGCAGAGGTGTTGACGGGAAAGGCGAGGAAGAGGGGATAATGTGACCTGCTTTCACAGGAAGCTTCAGATCATTTCCCTTTGTCTCTGTGCCCCTTTGGGAGATTTTGATCCAATTTGCTGTGGTGAGAAGAAGCTCTCGACATTACAAGAGAAAAAAAAAAAACCCAAAACTTTCATTTTCCTCCTAAGAAATGAAATTTTATTTCTGGATGACAAGGGCTTTGGAAGGCCATGGTGTGGTAATGAGTGACCCTTTCATAGCTGTTGAACATCAGTAGGCGACACATCCAAAGTATAGAGGCAGCTCTTAAAATACCAGCTAAAGGAAGAATTTAGAGAACAGAATGTCTTTAAGGAACTGTGCGAATGTTATTGATTCTTTCAAATAATGGTGTAACCTCTGTGATACAGCAACAATCTTCATGAGCTGTATTTATAAGGAACTGAGCTCATGAAGACAGCATGGGGGGTCTGGCGATGCAGGGCCCTTTGTTAACCATTGTTCTATTATTAGTATTGTTAGCATTGCCCTGCACAAGTTATCCACTTTTTCTCCAGCCCCCTGGGTATTCAGCAGAAATGATTTAAGAATGCCTGTAACAGCTGGGTGCAGTGGCTCACACCTGTAACCCCAACACTTTGGGAGACCGAGGTGGGTGAATCACAAGGTCAAGAGGTGGAGACCATCCTGGCCAACATGGTAAAACCCCGTCTCTACAAAAAATTGAAAAAAAAAAAGTTAGCTGGGCCTGGTGGCGTGCACCTGTAGTCCCAGCTCCTTGGGAGGCTGAGGCAAGAGAATCACTTGAACCCAGGAGGTGGAGGTTGCAGTGAGCTGAGATTGTGCCACTGCACTCCAGCCTGAGTGAGAGAGCGAGACTCCATCTCAAAAAAAACAAAGAATGCCTGTAACTTAGTCTCCTACTTGGCATCACCTAAGAGTTCAGGAGTGCAGTGACAGGTTAACTGAGCTCTTGCAGAAAGGTGCTGTGGACAGCGAGGTATAAGTCAGAGGAGTGACATGTTCTATGATGGGAAAGAAGAAAGCTGAAATCCCAAGGTGCTCCCTGACATTTGCCACTCACATAAACTGATGAGAGAGTTTGTTATTAAAGGCCTTTTTGTTTAATTAGAAATCAAACCAGAAGACCCTGGTGTCATAATTTATTCTCTTGCAAAATTATGTGATCAGAAGTTCCAGCCATAACCACAGAGGCATTGGAAGTTGGTAAATGATGCTCTGACTCAAAAGCTTCAAAGACATAGGAGGGGCAGAGGGAAGGAAATGTATCATTAATAAACAGCCTGAGCAAGTGGGCA\n>URS00014F887F rRNA from 1 species \nTACGTAGGGTGCGAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTCTGTTGCGTCAGGAGTGAAAACCCGGGGCTTAACCCCGGGCCTGCATTCGATACGGGCAGACTCGAGTGTGGTAGGGGAGACTGGAACTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCACTACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS00019CB411 rRNA from 1 species 
\nGGCTCAGGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAACGCGTTTCCGTTATTGATTTTAGATGCTTGCATTTAAATGATTTAACACGAAACGAGTGGCGAACTGGTGAGTAACACGTGGGTAACCTGCCCTTGAAGTAGGGGATAACACTTGGAAACAGGTGCTAATACCGTATAACAACCAAAACCACATGGTTTTGGTTTAAAAGATGGCTTCGGCTATCACTTTAGGATGGACCCGCGGCGTATTAGCTTGTTGGTAAGGTAATGGCCTACCAAGGCAATGATACGTAGCCGACCTGAGAGGGTAATCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGACGAAAGTCTGATGGAGCAACGCCGCGTGAGTGATGAAGGGTTTCGGCTCGTAAAACTCTGTTGTTGGAGAAGAACAGGTGTCAGAGTAACTGTTGACATCTTGACGGTATCCAACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGTTTCTTAGGTCTGATGTGAAAGCCTTCGGCTTAACCGGAGAAGTGCATCGGAAACCAGGAGACTTGAGTGCAGAAGAGGACAGTGGAACTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAAGAACACCAGTGGCGAAGGCGGCTGTCTGGTCTGTAACTGACGCTGAGGCTCGAAAG\n>URS000065A135 ncRNA from 1 species \nTGTCTCCTCCAACTGATCAAATATTGGATTCAGCCCGCTGCCGCAAGGAAGCGGGCTTTTTTTT\n>URS00000A33BD rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTAGAACGCTGAAGGAGGAGCTTGCTCTTCTGGAAGAGTTGCGAACGGGTGAGTAACGCGTAGGTAACCTGCCTCTTAGCGGGGGATAACTATTGGAAACGATAGCTAATACCGCATAAAAGTCGACATTGCATGATGTTGACTTGAAAGGTGCAACTGCATCACTAAGAGATGGACCTGCGTTGTATTAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCGACGATACATAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGGGGCAACCCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAGCTCTGTTGTAAGAGAAGAACGAGTGTGAGAGTGGAAAGTTCACGCTGTGACG\n>URS000054A298 rRNA from 1 species 
\nGCTCAGTAACACGTGGATAACCTGCCCTAAGGTCCGGCATAACCCCGGGAAACTGGGGATAATACCGGATAAACCATAGATACTGGAATGTTCTGTGGTTAAAAGTTCCGGCGCCTTAGGATGGATCTGCGGCCTATCAGGTAGTAGTGGGTGTAAAGTACCTACTAGCCGACGACGGGTACGGGTTGTGAGAGCAAGAGCCCGGAGATGGATTCTGAGACATGAATCCAGGCCCTACGGGGCGCAGCAGGCGCGAAATCTTTACAATGCGGGAAACCGCGATAAGGGGACACTGAGTGCCAGCATATTATGTTGGCTGTCCACCTGTATAAATCACAGGTGTTAGCAAGGGCCGGGCAAGACCGGTGCCAGCCGCCGCGGTAACACCGGCGGCCCGAGTGGTAGCCACTATTATTGGGTCTAAAGGGTCCGTAGCCGGTTTGATCAGTCTTCCGGGAAATCTGACAGCTCAACTGTTAGGCTTCCGGGGGATACTGTCAGGCTTGGGACCGGGAGAGGTAAGAGGTACTACAGGGGTAGGAGTGAAATCTTGTAATCCCTGTGGGTCCACCAGTGGCGAAGGCGTCTTACCAGAACGGGTCCGACGGTGAGGGACGAAAGCTGGGGGCACGAACCGGATTAGATACCCGGGTAGTCCCAGCCGTAAACGATGCTCGCTAGGTGTCTGGGATGGTGCGACCGTTTCAGGTGCCGCAGGGAAGCCGTGAAGCGAGCCACCTGGGAAGTACGGCCGCAAGGCTGAAACTTAAAGGAATTGGCGGGGGAGCAC\n>URS00002125CA piRNA from 1 species \nTGCGATAGATATTGCTTCCTATCCTGGGCT\n>URS0000BE8870 snoRNA from 1 species \nAGGATCAGTGATGAGGACTGGTGGCGAACGAGTCACAGAGATGACTACACGTCTGCGACTCTGAGGTCTAT\n>URS0001BC925D snoRNA from 16 species \nGUCGACGUACUUCAUAGGAUCAUUUCUAUAGGAAUCGUCACUCUUUGACUCUUCAAAAGAGCCACUGAAUCCAACUUGGUUGAUGAGCCGAAGAACCUUUGUACCCAAGAGUGAGAAAAAAGAAUGUAUUAUUAGCUUGGUCCACAACCCUUAGCGGUUUGGCCAUCUACUCCCACAUUUUUGCUUUGCCUUUUGCAUAUGGUUUGUGUAUGGAUAGAGAACUUAGCUUGGUGGUUUAGAAGUAGGAAUUUCGAUUCUAUGCUUUUUGAACUUACCGGCUUUUUUCUUGUUUUAACUCCUGCAUGAACCGCCUUUUAAUUGGCGCGAUGAUCUUUGCCCAGUUUGUGGACUUCUUCGUGAGGGGACAAACGUAUUGGGUGGGUACAAAUGGCAGUCUGACAAGU\n>URS000199981D lncRNA from 1 species 
\nTTTGCAAACATAATTAAAACACAGACATGTTCACTAATACTATCTAAAAACATACAAGTGTCGTGAGTCTTTATTCACTTACTGTATGCTTGTTCTGTACTATTGCCACTTCCTATGGAGTAACGTCCAGTAGTAACACTGGCACATGGCACCTTCTCTGAGTCAGACTTTTATAATCAAAGTTGCCAATACAATGCCTGAGGTTGATAAGTAAGATACAGGGTTCTTCTTCTGAGTTATGTCAGTGGCTGTATAACTCTAAATACGAAAGAGATGTTTTACAAAAAAACAAAGGCAAGTGTTTTACATTAAATCTTATAAAACTGTACATAATAAAAGTCTACAACATGAAAACGGCCATTAAACTGTTGTGATAGTTACGAAATGTAGTAAATATAACAATGCTAATGTTTCATGTATTTATCATTAATCACTGTATTCATACAGTGCTGTTTGTATATATAAATATTCAATGGCACTGTAAACAGGTGTTGGAAAACACACATTTACTCTTAACCCATTAGAAGTTATTGTAGTACTTTTTAATCCAAAAGGTCAAAATGCATTAATGCATCATTGATTTAGAAAAATAGCCTTGTACTATGATGCACATTTTGACATTTTCTAGGGTAGCAATCAGGATGAAGCATAACAAAGAATGCCAGATTTCAGACTGGTTTACATTTACACCTACCATGACACAAAATTTTAAACATTAAATGTCATTAAATAATACACAGTTTATAAAACAGTTGATTTCAGAGATGCACAATACACAAAAATCTAGTTAGTGTCTAATGGGAGTTCCCAATAATTTATATCTCTGGGACCTTTATGAGAAATTTAAGTCTGTTTCTCTTTACCATCACGTAGGCAAAGTGAGTTTGAATTGAATTACCTTTTTCTTAGTCTGTACAGAGCTGCATTCAACTGGATAAAATATGCTTATTCATGTTTTCCACTGCTGGACATTCATCCAATAAGTCTTGAGCATATGCTTAAGCATCTGGTAATGGCATTTTGTGGGGCAAGGAAACTCACTATCTCTATCCCTCAGTAAACAAAGTGGTTCTAATTTTATCCATAGTTAAGGCAACTATACTGATATATTAGACACACCATATGCTTTTATGTTGCTGCCTACAATCTAAACGGTAAGAGCGAAAGGAAGTTTCAAACATGCTTTGATCTTCTTGACCACTCAGGAGTTTCATC\n>URS0000E66266 lncRNA from 1 species \nTCAACTTGTAACAGGTGCAGCATGTACCTTCCACTTCTTTTATTGACCGTGAATTGTCAAAACACAACTGCAGCATGATTCCGAATCAGGGCACGAGCTGGGGATGAAACCTTCACCTTCTTAGGAAGAAGATGAAGCCAGTAATCCAGAGGTCACCTGGTATGTGGGCCTTCTGATTTAAAGGCTTCTTTTGGGTCAGGAATTACTGGGGAAGCCATACGGAGTTAGTTACTCCACACAGAACTGAGAAGAGGTTTTGGACTTCCTCTTACAGCTGAAGTTTCTTCAACCCAGTTGTGCTGTTATTTAATTAGCATCGCCTAGGAAAGTCTGGTATGAAGTCTAAAATGTGTCTGAAAAGTGTAACCTTTGCATGTGCCATTGTAAATG\n>URS000194BC91 lncRNA from 1 species 
\nCCAGGGCCTGAACCCATGCCACAGCAGTGGCAATGCCAGATCCTTAACCACTAGGCCACCAGAGAACTCCCTTTTACTTGTTTTTTGGCCAATGTTCCAAGACATTAAAGGGTTAATCCTCCTAATTGAAGCTGAGATCTTTTTTTGTGGCATCATTTTTGACAAGAGAAAGTCCTCTAAAAAGGACTTGTTGAGCGTTAGGAGGTCTCCTCCTCAACAGCGGTAACAAATGTTCCCTTTGTTATAACTCGACCTCCAATTTTCTCTATTTTCAACCCTGCTATATAGACAGGAAAATTCCCCCAAGTAATCATCATGATGCTCTTTCAGATCCAAACTCCTTGGGCCTCTTCTCCGCAAAAAGTAACCTGGTATGAATTGTCCTCTAGAACAAGGTTAGAAGGGTAACTTGAAACCCAGTTGTACAAGAGCATAGAAGCTCCATGCCCTTTCTGAATAAAATTATAAAGACTTTAGATTTGGTACAGCCATACTGGAAGCCCTACTCCCGTGGGTCCTACTCCAGCGAAAGTGCCAGGAACTACAGACGTCAGCCCCATGTCCCTTGGTTGCATTGCAGCTAATTATTCACAACAGCAAAGAGGAAACAAAGATTTACTCTTTTCCTGAAAGTCTCCACCCAGGTTCCTCAAGAATCTTGAAGCGCCTTGTAGGTGCCTTGAATCCCGAGGCCAGCAGTGGCTATGCTGAGCTAAGTGATATCTTGGTCATCCTTCTGATCTTCCCTGGCTCTGTTTTAGTCCAGGACCCAAAGGCCATAGAGCTAGTGGTATTGAAAGAGCCAGGAATGACCACGAAGGATGCCCCGCTCCTAGGCTGCCTTCCTCCTTCTCTCCCTCTTTCTTGTTAAAATCTAGTGAACTACATAGATATTCTTCTATGGATATCTTGAAGGCTATTCCAGATATTCCTGAAAGGCTTTCCAATCAGCCCTGCCTACCCCTCTAATCTCAGTCTCCTGTCCTCCAAGTATTTCACCACTCAGAAATGTCAGACTTCCCCTTTCTTGGTGCATTTTAGGGATTTTTCGGTATCCCAAGGGAGGGATTCTGCACAAATCTCTTCTTCTTTTCTTGATTCCTAGGATGCCTATTCCTGGTTCAGCATAGTACAGGCTCAGACAATGGTACTCACTGTTGGACCGTTTATTTATAGCAGGTTGAGTATGAGTTGAGACATTGGACAGACGTGGCATTGGATCCTACCTCTTGTGACTTGCTAAGTTTGGGAACTAGGGAAAGTTATTTAATTTCTATGGACCTCATTTTCATCATTAGTAAAATGAGAATCCTTATGGCAAGTACTACTTTAGGATTATCGTAGTACCCGACAGACAGAAGGTTTCAATCCAGCTGTTATTAAGGGTCTGAAACTTGGAGTTCCCATCGTGTCGGATTCGTTAACCACTGCGCCACGGCGGGAACTCCAAAAATGAGTGATATTACTCCAAAGTTGCACACTTCCCCTGCGGCCCCTCATGCCAGGCTCCACTGCCTTGGTGGGGGCCACCTGCTCTTCTCAGGCCTGAGCATGGAGACCACCAAAAATGCCCCCTCACACCCTGCTCTCCCATCCTTCCTCTGAGCCCACTTTTCCCTTCTCTTCAGCTGAGGGAACTTCAGCCACTCACAGTATCTTAGAAGTATCTTTCACAACAAATAACAGTGCCTTTGAGAAGAGAGAACCCAAAACACTTTCCCTCATGGGTCTTTAAAACAGTCATTGGCTGTACCCACAGCAGGTGGAAGTTCCTGGGCTGGAGATCAAACCTGGGCCACAGCAGTGACCCAAGCCACTGAACTACAACCCTGGATCCTTAACCTGTTGAGCCACAGGAGAACTCCTAAAACACGATCATCTTCATGATCACGGAAGCAACATCCTCCACTATCATTTGCTATTGAGTGAACTAACATACATGAAATAGTTCTTAGGGCCTGACACATATTCAATGGGCATATATAGTACATATTAGCT
CTTACCACTATCATGGGATTAAGTACATACTAAGTTTCAGGGTGCTATGCTGAATCCTTTCTATACCAAATCTCCTTTAATTGCTGTAAGAACTCCATGGGTGGAAGATATTTTATACCCATTTGAATTATTTACTTACTTAAAAAAATTTTTGGAGCATTTTATTTTACTTATTTTTATGGAAGTATAACTAATGTATAATATTATGTAAATTATAGGTGTACAATAGAGTCACAATTTTCAAAGGTCATACTCCATTTTTAGTTATTATAAAATAACTATAATCCCCATGTTGTACAATTAGTCCTTTTAGCTTATTTTATTTTATTATTTTTTGACTGTGTCCATAGCATGCGAAAGTTCCCAGGAGGGAACCCCATCCACAGCAGTGACAATGCCAAAGCCTTAACCACTAGGCCACCAGGAAACTCCAATTATAGCTTATTTTACACCTAACAGTTTGTACTTCTTAATCCTCAACCCCTTTCCCTCTCCCCACTGGTAACCACTACTTTGTTCTTTATATCTGTGAGTCTGCTGCTTTTTTGCTATATTCACTAGTTTGTTGTATTTTTTAGATTCCACATATAGGTGATATACAGTATTTGTCTTTCTCCAACTTATTTCACTTAGCATAATTCCCTCCCAGTCTATCCATGTTGCTGCAAATGGGAAAGTTTCATTTTTTTTCTTATGGCTAAAATATTACCTTGGAATACCCTTCATCTGTTGAGAGACACTTAGATTGCTTCCATGTCTTAGCAATTTTACACCCATTTTACAGATGAGGAAACAAGATGGTAAGAAGTCAAGTGCCCAAATTCATAGTGTTGATTCATTCTAGAACTGAATTCAAACCCAATCTCCACAGACTGTATTGTCTATCCCCGACGTCAACTGTGTTTGTGTTTAGGTGGGAATGACTTATGGGCAGTCTTTGAAAAAGACTGGGGAATCATCAAGCTGAAATGTTCTCTTGGATTTAAAAATTCTGTAATGAAGACTTAGATGGTTTACTAAAGGAGAAATACATCTGGGTTGGGGGGAGAGGAATAGAAGCAAGGAAGGAGAGAAGAAACATTTATTAGGTCTCCCAGTTGGCTTAGTGGTCAATTCAAACTTTATTTATTTGCTTTTTTTTAGGGCCACACCTGCAGCACATGGACGTTCCCAGGCTAGGAGTCGAATCAGAGCTACAGCTGCTGGCCTATGCCACAGCAACACCGTATCCTTAACCCACTGAATGAGGCCAGGGATCAAACCCACATCCCCATGGATACTAGTCAGGTTCATTTCCACTGTGCCACAATGGGAACTCCCCAATTCAAACTTTAAATCCAGGTTGGTCTCACCTCAGAGCCCAGCTTTCTGCCAAGGACTCCAGAGTTGTACACTTGTGCTCCAATTCTATAACTCCACTGCAAGTAATTTAACAATAATTTCATATTTTCCACTGAGACACTGAAACGTCTTATTGAAAGAGGTCAGGGAAGTCGCTTCCCCAGAGCAGAGTTGGAGAGACAGCTAGACAGTGGCACTGGGGGTGGGGGTGGCTTTCAGTGCAGAACTACGCAGAGGTGTGAAGACGAATGAGCTGGCCTTTTAGGTCTTTTCCAGTCCCCGAGCTCCAGGATTTATTTGGCCATGAAAATGTCAGGCTTTTTCTTCCATAAAATGATGTATGATGGTCTGAGTACATTCCCCAATCCCACCCCCACCTCCTCATATCTGATTAAAAAGCAAAGATTAAATCACTGAAAACAATGGAAAGGAAGGTTTTTCTCCAAGAGGGATGAGGTTTTCCTGAGACAAAGCAACAGGAGGAGCAGAGGGAGTACAAAGGAAAACGCAGGGGTCTGGGAGGGACAAGCTGAGCATAGAGCAGGTGGATGGATCCAGCAGAGAGTGGGGGCTGGGACAAAGGCCAGTTGCAGTTGGGTTATGAGGGCTATCAGCTTACATTAACCAACAGGCATGGAGTGGAAACCAGGGCTCTAGTT
ATGCAAACCAAATGAATGCATTTGAACAATTTGTGAACCATGTTTTTTATTTTTATTTTGAAAATTTTTTCTTGATATAGGATCTCAGTTTCCAGAGAAAGGACTGAACCTGGGCTGCAGGGGTGAAAGCACTGCATCATTATGACTAAACCACCAGGGAACTCTCTAGAACCATCCTTTTTTTGTTGGGTGTTTAGGGTTTTTTTTTTTTTTTTTTTTTTTTGGCTGGCTAGCAGCATGTGGAAGTTCCCAGGCCAGGGATCAAACCTGCAATCAATTGAAGTTCTCTTGTGGTGCAGATCTTTCACTTACTGCACTGCACGAGAACTCCTAGAACCATCCTCCCCCCACCTTTTTTTCCCCCCAGCACATGAAAGTTCCCTGGCCAGGGATCAAACCGGAGCTGGAGCTGCGACCTCCACCACAGGGGCAGCAACTCCAGATCCTTAACCCACTGTGCCAGGCCGGGGATTGAACTGGTGCCTCCACAGAGATAAACTGGATCATAATGCACTGTGCCTCAGCAGGAACTCCCTAGACCTATCCCTTTTTACCCAGGAGATATGAGGTCAGCCTTGAATCAGAACTCATTCATTCAACCAATACTCATCGCCGCCACTGTACCAGACAGAGTTCTGGGTTTGGAGGATACAGAAATGACCCAAGCAGTTCTAGTTCACTGCCTTTGGGAAGAGAGAAAATAAACACCACGATCAGTAGTAAAGCATGTGGTATTCTAGTTAGCATCAGGGACTAAGTAAAAAATAAAGCAGAGAGCCCAAGAGGAAACATCGGCGCAAGAGTCGGAGGTGGTAATGTTTGGGGGATTTGGCCAGGCATGATGCCTGACTGAGGGGGTCAGAGCAGAGGAAGGAAAGGACAGGGTGCTGATGACAGTGGGGCAGGAGGGTCCTAGGCAAGGGAGGGACAGTCCAGGTCCTGGGGTGGGAGAGGACCTGGTGCCTGAGAGACAGTGAGGACAACCAAGTAGCTGGGTAGGAGGTGGAGTCACAGAGCTCACAGGGGCCAGATCCTGCAGGGCACTGAATATACCTGAAAAGATTTTAGCTTTCAGATCCAGGGAGATGGGACTGCACCCTGGGAAAGGTAAAGCAGGGAGACCACCTAGGATGCTGTTGCAATAATCCAAGCAAGAGATGATGTTGGCGTAGACCAGCTGTAGTGGTAGCAGAGGTGGAGGAAAGTAGTTAATGTCTGGATATGTTAAAATGCTAGGCCTTCAGGGGTAAAAAGGAAGACAAGCCTCAGGAAAGGAGGGAAGCTCTTGCTAATGATCTGCCCTTAATACATCTGCCACCGTTTGTCATCTCAGCAAAAAAAAAACCCTGGAGGCTCCATTCAGACTGACTGTGCAATGGGACTCACTCATGCGCTTAGCTGGTTTCCACTGAGAGTTGGGACAAGGGGTTGTATTTTCCATATTTGCAGGTGACTGACTTCT\n>URS000240C156 lncRNA from 1 species 
\nGGGATAACTATCACTCCTCCATAATTGAATTCGGTTTTCATTTGTTTATTTATTTATTTTTTTTCCCACCTGTGGCATTGAGTTATTGATAATTGTCAAGTACTTTTCGGATTTGTATAATAATATAATTATTAATTATTATATGTTGGGGAAGAAGTTGTCGGTAAGGTCATTGTCTTAGTAACTTAAATGAGTTTTTAAGCAAAATAAGGACAAATATTTGTTGCCAGTGGTACTGATAATTTATTACAACTTTCATATACATGTATCTTTCATTGTTATAATAATCGCAAGATATTTCACACTGCTTGTTAATACTATCCAAAGAGTTGTTGACTCAAATGACTCTAAAACAGAGGTCTAAAGATGGATACACTACTTGATATATTTATTAAATTTTTTTATTTATTAAATTTTTAGTTTCTATTCTAAGATCCTAATTGATAAGAGTAATAAATCTTCATATTATTGTAAAACAGTGAACTAGCAGAGTATAAATGATAAAAGCAAGATCAATTCTTCACTACTGATTAATAAACAGATATGTAGATTAATTTTTTAAGTTGAATATTCGAAATTTCAACTAAATTTTTTCTTATTTAGTTAATTTTTTCCTGTTAAGCCAAGTGGGGGATTATGGTCAGTTAGTTCTTAATTTAAACTTAGAATCCCCCCCCCCCCCCCCTCCCCTTTCTTTAGCTTTCCTTTTTCAAGCTAACTAAAGATGCGAAGTTTATTTTGCCTTCTTCTGTTTTGTGGTGGTCCAGATTTGGTTTAGGTATATTGATTGAGAGTTATATAATTGTATAATTTTTGTTTGAAGGTATATAAATTAAGGACGCGTGCGATGTATTAACAATAATTTTTTGAAGTTACATTCGTTGTTGGTCGTTGATTGTTAAATGATAAATCTTTCCCATCAAACACTTTGCTCAGCGTCCATGCAATTATACACGAACGATGACACTTTTATTTTATTTTTTCTTTTTTATTATTATTATTTTTGGACCAATTAAGTTCATTACCCTAGTATTTTTAGCAAGACTTCGGTTCATACTTTGACTGGCAAAGAATTTTCAACTCAAATTTTAAGCCTAAAACAGAAGACCATTAACCCAAAAGAAAGAAACAAAATATGTTTCAGGAATTTGGTTAGATATCACAATCAAGTTATTATAAATATAATTTACTGGAGGGGCAACATTATCAGAGTCTTGAGTCATGGAGAAAAGCTGTGTCTGATATTTGATAATTTGAAAAGCAGGTATTAATTCTTTCCGTCCGAGGGTAACTAATACGGCACAGAAATTTTATTTTATTTTCTTTAAATATTATTATTTAACATTCAAACTCTTCATCCCTGATGACTTAATTTTGGGCTGGTCGGTTTCTAGATACAAACTATATATGGCATGTGTTAATCACGGAATAGTCTTCATGCAAATGGGAGACGTTCACACGGGAGCGGAGCCCACATTAAAATTTTAGGGACACAATTCTATATCACAAAATTTTAAAGAGTTAAAAAAATGGACTTAATTATTGGGTTAAACTGTTGAAATATTAAACTTGCATGATTGCATCGGTTAAATTATAAAAAAATCTCTCTTTTAAAAGTTAAATTTCTAAATTTATCATATATGTAAACTAAGTTTTTTTTTTTTTCTAAGACCAGCAGCAGGTGCCATGGCACCTAGTAGTTTTGCGGCAGCTCCGCTCCTGCTCACACACTTAGGTTACTTCTAAGTTACAGCTACTTTTTGTTGCAGACCATTTGTATTTTTATTTTTTAACATATTAAATTACAATCTAATAATATTCTAGTTTATACTTTGATAGTCTGATCATATGTTTCTTTTGATGAGTAAGAGACTTACTATGACCTCTTGACAAGTTTTACAATTTTCCCTCCTCCTATTGAGATTTCGGAGCAAAAAAAAAAAAAAAATCCACCAATATTTTTGGAAAAATAAATGTATTATGGATTAGATGGCTAAT
GTCAGTCTTATTTGCGCTTCTTTAACTTAAGTAACACCCTTTTGCAGCCTTCCCAACAAGGGTGCTGATACTTACCCTAAGTCAAACCCCGGACATTAGCGAATGACACATTTTTTTATAAAAATTACAACACAATTTTAGTTTGGATCTTTATAGAAATTAAAAAAACAAAAACTCATTTTCCTTAACACAATTCAAAAGCAACAAAACTCAATATACTGCTGCGAGTAACCAACCGTGGCCAAGCCACGAATCCCACTGTACCACTGCGAGCAGTCATATTCAAGCCACGACGTTTAAAATGTCTGTGCCTAGCTGTTCTAGCCACTGCTACTCGTGTAAGTTGAACTTGGGATTTTAAATATTTTCTGGAATTTTATGATTGAATTTATTATAGACTAATTCAGAGTGTTATTAGCATAAGAAATCTCATGGGAGTTCAAGAGAAGTTTCTTGTGCTCATAAAATAATTGGGATAATTAATTAATAAAACCAAGAAATTGCATACTTTTATGTTGTTATTTTGCAGTAGTTATTTTAAATATGATTTGAAAAAAAATTGATGTAGTAATGGAGAATTTGGAACAAGTGGATCAAGTCAAAGAATTGGAGGAATTGGAGGCATTAGACGAGTCTGATTTATAAGAAAATATTGAGTAATTCGAGGAGACCGAATTTGATAACAATGAAGATGTGAAAGAAAAAGTTGCTAAGCCTCAGGTTGGGGTGTGAAAGAAAAAGTAGCAGTGGCAATGGTTGATTTTGGGGTGCCGCTTTGTAAGTGGCCGTGGTTGTCGCGTGGTGGCTGTAGGCAGTGGCAGTGACAATGGCTGTGGTGTGGTGGTTTGGGTGATTTTGGGAGAGTGCTTGTGCTATGTGACTCTGGGGAGTATACTTTCTGCTTTGTGGTTGTCATTCACAACCATAAAGAATAAGAAAGTTTTTTATTTTATTTTATTTTGATATTGCTAAAGTTAGACGGTGCATTTTCATCCCAACAATAACTTTTGTAAAATTCTTCGTTTTGCGTTGTTTTACCTCTTAGTTTTTTCTGTTTGTATTGTTTGCATTTTTATATGCTACTTTTATCTCTCTCTCTCTCTCTCTCTACAAGGTAATTAGGATCATTACATACTCCTCTTATTTAAATGTTTTTTTTCCACTTTACTTTAATAAACTTCCCTTGTAGAGTTAAGATTTCACTAAAAAATTACTAATATTTATAGTCTGAAATTTGTTGTGGTTTTGTCTTGATAATTGTTTTTTTAACGCAATAAGATTTTGTCTCTAATACTTCGAAGGAAGTTTTAATAACATATACACAAAAGAGAATGTATTACCTTACTAATGGCGGGTGATTGCCAAGTCAATAAAACCATTATTTGTAAGTGCTATTTCACACTTATTATATAAACATTAACTTATTAACTAAAAAAGTTATGAGTAGATTTCTTTGTTTCTCCCTCCACTCGATACAACGGTAGCAATGTTTAAGCACTGGGAACTTGCCAAACTTTATTAAAGAGAAATCTCGCATTGAATTATTTGCATAATCAACGTAGATTCAAATAATTGGGCTCCCTAATGGGCCAATTGGGTTCCTCAATGAGCCTCAAATGGTCGAAGATATTTGTTAGGTCCAACTCTGTAGAAGTTCGGGCAAATCATATGCCATCCAATATTCCAAATCCTTTGAAAAAAGCAAAGGGTTAGACTACTGACACCCTTCCAATTTGGGGTATACAAGATATATACAATTGAATTCAACTCAATCAAATCAATTAATCCAACTTAAATTAATCTAATTTTATCGGACTGACTTTTTAATTAGATTAGATTATATTAGATTAGATTAGATTACAAAATAGAATATCTAATGTTATTATATTGGTAAATGGATCTATGTGTTAAAATCTAATATAAACTATTCTAACCAACTGATTCTCATTTTCTTTCTCTATTTTTTAAAAAGGTTACGTGGC\n>URS00021E5558 
rRNA from 1 species \nGCTAAAAACCTAGCTCAAATTTACGCAAATGCCACAACCAAACAACTGTAACTAAACAAAACATTTTTAAATTTTAGTAAAGGCGATTGAAAAATACCTAGAAGCTATAACAATAGTACCGCAAGGGAAAGGTGAAATAAAAATGAAACAACTTTAAAGCAAAGCTAAGCAGAGACTTAACCTCGTACCTTTTGCATCATGGTCTAGCTAGTTCAACCAAGCAAAACGCAATTGTAGTTTGACACCCCGAAACTAGGTGAGCTACTTCAAAACAGCCTTTAAGGGCCAACCCGTCTCTGTTGCAAAAGAGTGGGAAGATTTTCAAGTAGAGGTGACAGACCTACCGAACCTAGAGATAGCTGGTTATTCAGGAAAAGGATTTAAGTCCTACCTTAAGTTTTTTTATACCACAAAATATAACAGTAGACTTAAGAGCTATTCAAATAAGGTACAGCCTATTTGAAACAGGAAACAACCTTAAACACAGGGTAATGATATTCTAAACGTGACCAAGTGGGCCTAAAAGCAGCCAACTTTTAAACAGCGTTAAAGCTCCATCACTTTATTTAACTAATAACATTAATATTACAAAACCCTTCACCACTACTGAATGACTCCATAACCATATGGAGAACACTATGCTAGAACTAGTAACAAGAAGAAGACCTCCTCCAAAATGTAAGTGTAAGCCAAAATGAACAACTCACTGGCACTTATCGTCTCTGAACTTAAAGTAGTAACTTCACAAGAAAATTCTACCCCCACAAACGTTAACCTTACACCAGAACATTACCGGAAAGATTAAAAAAAGAGGAAGGAACTCGGCAAATTTTAACCCCGCCTGTTTACCAAAAACATCGCCTCCTGAAATAACCATAGGAGGTCCAGCCTGCCCAGTGACAAAGTTAAACGGCCGCGGTACCCTAACCGTGCGAAGGTAGCGCAATCACTTGTTCTTTAAATGAGGACTAGTATGAATGGCATCACGAGGGTTATACTGTCTCCCTCTTTTAATCAGTGAAACTGATCTTCCCGTGAAGAAGCGGGAATACATCTATAAGACGAGAAGACCCCATGGAGCTTTAAACTCAGTATCAACTGCCCTCCCAATATATCCACCTAATTAAGCAGACATGACTACTAGTTTTCGGTTGGGGTGACCGCGGAGCAAAACAAAACCTCCACGATGAAAGGAATTAACCTCCTAATCAAAGAGCTACATCTCTAAGAATCAACAAATTGACATTTATTGATCCAATTTTTTGATCAACGAACCAAGTTACCCTGGGGATAACAGCGCAATCCATTTCAAGAGCCCCTATCGACAAATGGGTTTACGACCTCGATGTTGGATCAGGGTATCCCAGTGGTGCAGCCGCTACTAAAGGTTCGTTTGTTCAACGATTAAAACCCT\n>URS00018C7DE1 rRNA from 1 species \nTACGTAGGGTCCAAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGTTCGGTAAGTCGGATGTGAAAACTCAGGCTCAACCCGGAGACGCCATCCGATACTGCTGTGACTTAGTCTGGTAGGGGAACACGGAATACCTGGTGTAGCGGTGAAATGCGTAGATATCGGAAGGAACACCAGTGGCGAAGGCGACTTCCTGGCTCATTACTGACACTGAGGCGCGAAAGCGTGGGGAGCGAACAGG\n>URS0001E9E6F4 misc_RNA from 1 species 
\nGATGAAGAACGTAGCGAAATGCGATACGTAATGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCATATTGCGCTCTCTGGTATTCCGGAGAGCATGCTTGTTTGAGTATCAGTAAACACCTCAACTTCCATATCTTTTTTGAAATGGGAGTTGGACTTGAGTGATCCCAACGCTTTTCCTCACCGAAAAGTGGCGGGTTACTTGAAATGCAGGTGCAGCTGGACTTTTCTCTGAGCTATAAGCATATCTATTTAGTCTGCCTAAAAAACAGAATATTACCTTTGCTGCAGCTAACATAAAGGAGATTAGTTCTTGTGCTGACTGATGCAGGATTCACAAAGACGGCTTCGGCCGACTTTGTAAACTCGATCTCAAATCAAGTAAGACTACCCGCTGAACTTAAGCATATCAATAAGCGGAGGA\n>URS000057C40D tRNA from 1 species \nATTATTTTGGCAGATTAGTGCATTAAATTTAGAATTTAATTATGTAAAATAAATTACAAATAATAC\n>URS0001919D12 rRNA from 1 species \nTACGGAGGGAGCTAGCGTTATTCGGAATTACTGGGCGTAAAGCGTACGTAGGCGGCTTTGTAAGTAAGAGGTGAAAGCCCGGAGCTCAACTCCGGAACTGCCTTTTAGACTGCATCGCTTGAATCCAGGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAAACACCAGTGGCGAAGGCGGCTCACTGGACTGGTATTGACGCTGAGGTACGGAAAGCATGGGGAGCAAACAGGG\n>URS000239B5F5 lncRNA from 1 species \nGGAAAAGGAGACAGGGAGTTCTGAGGTTATCCACTGCCATGGAGCCATCACTTTTGGCCAATTGTTGAGATGGAATCCAAGACCAGGAGAACGGTACACAATGATGTTGCAAGCATTGCACTTCGTTTTTACCTCAGAGATGCTCGGCATACAACGGAGACATGGCCTGTCCATCATGGAGAAAGTTCTTTCTCCGTGAGACCCAGGCG\n>URS000017EE1C rRNA from 1 species 
\nCAGCAGGTCACGCAATTACCCACTACCCGGCACGGGGAAGGTAGTGACAAAAATAACGATACGGGACTCATATGAGGCCCCGTAATCGGAATGAGTACACTTTAAATCCTTTAACAAGGATCCATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGTTCTGCGTGCTACGCTGTCGGTTCGCCGCCTGCCGGTGTAACTGGCATGCCGTGGCATGTCCTGTCGGTGGTGTTCGGGAGCCTCGTCTAGGTGGTGCCCTCGGACCGCAAGGTACGAGGTGTTCACAGGCCGGAGGTCCCCCCGTTCGCCTACTCTATCCTACCTAGGTGCTCTTCACCGAGTGTCGAGGTAGGCCGACACGTTTACTTTGAACAAATTAGAGTGCTCAAAGCAGGCTGAAATTTCTGCCTGAATAGTGGTGCATGGAATAATAAAACAGGACCTCGGTTCTATTTTGTTGGTTCTTAGGAACACGAGGTAATGATCAATACGGACAGGCGGGGGCATTCGTATTGCGACGTTAGACTTGGCAAATGCTTTCGCGGTGAAATTCTTGGATCGTCGCAAGACGCACAAGAGCGAAAGCATTTGCCAAGTATGTCTTGATTGATCAAGAACGAAAGTTAGAGGTTCGAAGGCGATCAGATACCGCCCTAGTTCTAACCATAAACGATGCCAGCCAGCGATCCGCCGATGTTCCTCCGATGACTCGGCGGGGAGCTTTTTCCCGGGAAACCAAAGCTTTTGGGTTCCCGGGGGAAGTATGGTTGCAAAGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGAAACCTCACCAGGCCAGGACATTGGAAGGATTGACAGATTGATAGCTCTTTCTTGATTCAGTGGGTAGTGGTGCATGGCCGTTCTTAGTTGGTGGATCGATTTGTCTGGTTAATTCCGATAACGAACGAGACTCTAGCTTATTAACTAGGCGTTTTCCGGTGCCCTCGTCACCGGCGACACTCATTCTTCTTAAGGGGACAAGCGGCTTATAGCCGCACGAGATTGAGCAATAACAGGTCTGTGATGCCCTTAGATGTCCTGGGCCGCACGCGCGCTACACTGAAAGAATCAGCGTGTGCCTCCCTGGCCGAAAGGCCCGGGTAATCCGCTGAACCTCTTGCGTGCTAGGAATTGGGGCTTGCAATTGTTCCCCATGAACGAGGAATTCCCAGTAAGCGCGAGTCATAAGCTCGCGTTGATTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTACTACCGATTGAATGATTTAGTGAGGTCTTCGGACTGGCGGTAATCCCTATCGACTTGTCGGTATCGATGAACGCTGGAAAGATGACCAAACTTGATCATTTAGAGGAAGT\n>URS000219C8A1 lncRNA from 1 species 
\nACTGCCTCAACTGTTCGCTCAATGATTTCTGGACCCAAAATTCTGTTTTCCCCGACTTCATCCCAATGGATAGGGGATCTGCACTTTCTACCATAAAGAGCTTCATACGGGGCCATTCCTATAGTGGCCTGAAAACTATTGTTGTAAGCAAACTCCACTAACGGCAGGTGTGTCTCCCAACTACCTCCAAGATCCAAAACACATGCCCTTAGCATATCTTCCAAAGTTTGGATGGTTCTTTCTGATTGTCCATCCGTCTGAGGATGATAAGCTGTGCTAAACTTCAGTTTTGTCCCCATGGCTGTCTGCAAACTTTTCCAAAATTTAGATGTGAACCTCGGGTCTCTATCTGAAACAATGGTGACTGGGACTCCATGCAACCTGACTATCTCCTTGATGTATAAGTGTGCCAGCTGTTCCAAGTTAAAGTTTACTTTAATTGGAAGAAAATGGGCTGACTTCGTCAGACGATCCACCACTACCCAGATAGCATTGTGACCTTTTGCTGATCTCGGGAGGCCTACCACAAAGTCCATCGTTATGTGTTCCCATTTCCATTCTGGAATATCCAACGGTTTCAGTAATCCTGATGGCCTTTGATGTTCTGCCTTAACCTGTTGACAGATAATACATCTCTCCACGAACAGACCAATTCCTCTCTTCATGTTTCTCCACCAAAATACATCCCGGAGATCTCGGTACATTTTCGTACCACCTGGATGAGCAGAATAAGGGGTTGAATGAGCCTCTTCTAATATCTCATTTCTTATACTTTCATCCTTAGGTACACACAGTCTTCCTTTGAAAGTTAGCGCATTATCTGCAGATACTTCAAACCCTATATGTTTATCTGTACCAATCTCGGCCTTTATCTTCTGTAAAAATGGATCTTTATCCTGTGCCTCCTTGATTCGATCTCGAAGTGTAGGTTGAATCATGAATGCTCTTATTCTCGCTGAAATCTGAGTTGGCGGCGTGATAACTTCCAATCTCAATTTATCAAACTCCCTTATCAAGTGTTCCTGTACTGTGGGTAAAACTGCTAACTGTGTTCCTGTCTTTCTGCTTAGGGCATCTGCAACTACATTAGCCTTACCCGGATGGTAATGAATTGTGCAGTCATAATCCTTCACTAACTCCAACCATCTCCTCTGTCTCATATTTAGTTCCTTCTGTGTGAAAAAGTATTTGAGACTCTTGTGGTCCGTATAAATTTCACACTTCCCACCGTAAAGATAATGACGCCATATCTTTAAGGCGTGAACAACTGCTGCAAGCTCCAAGT\n>URS0000884EE1 rRNA from 15 species 
\nGGCGTGCTTAACACATGCAAGTCGAACGGAAAGGCCCTGCTTTTGTGGGGTGCTCGAGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTGACTTTGGGATAACTTCAGGAAACTGGGGCTAATACCGGATAGGAGCTCCTGCTGCATGGTGGGGGTTGGAAAGTTTCGGCGGTTGGGGATGGACTCGCGGCTTATCAGCTTGTTGGTGGGGTAGTGGCTTACCAAGGCTTTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGGAAGCCTGATGCAGCAACGCCGCGTGCGGGATGACGGCCTTCGGGTTGTAAACCGCTTTCGCCTGTGACGAAGCGTGAGTGACGGTAATGGGTAAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTGATACGTAGGGTGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGGGCTCGTAGGTGGTTGATCGCGTCGGAAGTGTAATCTTGGGGCTTAACCCTGAGCGTGCTTTCGATACGGGTTGACTTGAGGAAGGTAGGGGAGAATGGAATTCCTGGTGGAGCGGTGGAATGCGCAGATATCAGGAGGAACACCAGTGGCGAAGGCGGTTCTCTGGGCCTTTCCTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGCTTAGATACCCTGGTAGTCCACGCTGTAAACGGTGGGTACTAGGTGTGGGGTCCATTCCACGGGTTCCGTGCCGTAGCTAACGCTTTAAGTACCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGCCCCGCACAAGCGGCGGAGCATGCGGATTAATTCGATGCAACGCGTAGAACCTTACCTGGGTTTGACATGGATCGGGAGTGCTCAGAGATGGGTGTGCCTCTTTTGGGGTCGGTTCACAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTCACTGTTGCCAGCACGTTATGGTGGGGACTCAGTGGAGACCGCCGGGGTCAACTCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGTCCAGGGCTTCACGCATGCTACAATGGCTGGTACAGAGAGTGGCGAGCCTGTGAGGGTGAGCGAATCTCGGAAAGCCGGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCTCATGAAGTCGGAGTCGCTAGTAATCGCAGATCAGCAACGCTGCGGTGAATACGTTCCCGGGGCTTGTACACACCGCCCGTCAAGTCATGAAAGTTGGTAACACCCGAAGCCGGTGGCCTAACCGTTGTGGGGGAGCCGTCGAAGGTGGGACTGGTGATT\n>URS0000B9E3AC rRNA from 1 species \nGCGCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGAGGAAGAAGGACGGTACCTGAGTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGACGGCGAAGAAAGTCTGAAGTGAAAGCCCGCG\n>URS000252BD60 tRNA from 1 species \nGATAAGATGGCAGAGAGTTAAGTGCATTAGATTGTAAATTTAATAATGAGGGTTAGATTCCTTTTCTTATTA\n>URS000022CE74 rRNA from 1 species 
\nTTCGGGGTGAGTGGCAGACGGGTGAGTAACGCGTGGGAACGTGCCCTTCAGTTCGGGATAACCCAGGGAAACTTGGGCTAATACCGGATAAGCCCTTACGGGGAAAGATTTATCGCCAAAGGATCGGCCCGCGTCTGATTAGCTAGTTGGTGGGGTAATGGCCCACCAAGGCTACGATCAGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTTAGGAATCTTGGACAATGGGCGCAAGCCTGACGACGCAACGCCGCGTGGAGGACGAAGATTTTCGGA\n>URS00001AC001 rRNA from 1 species \nCGTACTCCTACGGGGAGGCAGCAGTGGGGAATATTGCACAATCGGGGGAAACCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTGTAAAGCACTTTCAGTAGGGAGGAAGGTAGTGTAGTTAACACCTGCATTATTTGACGTTACCTACAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGCATGCAGGCGGCCTGTTAAGTCAGATGTGAAAGCCCGGGGCTTAACCTCGGAATTGCATTTGAAACTGGCAGGCTAGAGTCTTGTAGAGGGGGGTAGGAATTTCAGGTGTAGCGGTGAAATGCGTAGAGATCTGAAGGAATACCAGTGGCGAAGGCGGCCCCCTGGACAAAGACTGACGCTCAGATGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAG\n>URS000182260B rRNA from 1 species \nATACGTAGGTGACAAGCGTTATCCGGATTTACTGGGCGTAAAGGGCGTGTAGGCGGTCTTGCAAGTCAGAAGTGAAATTCCTGAGCTCAACTCGGGCGCTGCTTCTGAAACTGCAGGACTTGAGTGCTGGAGGGGATAGCGGAATTCCTAGTGGAGCGGTAAAATGCGCAGATATTAGGAAGAACACCGGTGGCGAAGGCGGCTATCTGGACAGTAACTGACGCTGAGGCGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCAGGTAGTCCACGCCGTAAACGATGAATACTAGGTGTAGGGGGTATCGACTCCCTCTGTGCCGCAGTTAACACAATAAGTATTCCGCCTGGGGAGTACGGCCGCAAGATTAAAACTCAAAGGAATTGACGGGG\n>URS000010CDEA rRNA from 1 species \nTAGGCCTAACACATGCAAGTCGAACGGCAGCGCGGGTGCTTGCACCTGGCGGCGAAAGGCGAACGGGTGAGTAATACATCGGAACGTGCCCTAGAGTGGGGGATAACTAGTCGAAAGATTAGCTAATACCGCATACGATCTACGGATGAAAGTGGGGGACCGCAAGGCCTCATGCTCCTGGAGCGGCCGATGTCTGATTAGCTAGTTGGTGGGGTAAAAGCCTACCAAGGCGACGATCAGTAGCTGGTCTGAGAGGACGACCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGGGCAACCCTGATCCAGCAAAGCCGCGTGTGTGAAGAAGGCCTTCGGGTT\n>URS000217ECBF lncRNA from 1 species 
\nGGATGTTAAGAGAAGGGGTTGTTTAAGATAAAAGATAAATTCTATATTGATGTAAGTTAAATTTAAAATACTGATGGACTATCCAAGGTGAAGATGTCAAGTAGGTATTTGGGGAAATAGCAATCAAGTGCAAGAGACAGGGAATTTTCTTTTGGAACAATGAGAATTCTCCAAGCTTCCTCAACAGACAACTGGAAGTGGCAGCAAAGAGGCAGTGGAAAAGCAGCAGAATGGCAGTAGAATGGCAACAGCTGCACTGGGATCAGAGGCTGCACTGGGATCAGGGGCTGTGCTTAGATCGTGCTGAGTCATTGCTGGTGTTGGACGGAGTGACAGCGCGGAGGAGGATTACGTGTGCCAACTGCTGGATTTCCCAAGTTTGCCTGCCCTTGCCTAGGTGCGAGCTGAGGTGTGTGAGTGTCGGGGACTGATGGGTTTGGGGAGGCCTCAGCCCGGACGGCCCTCCGCGATCTGGGTCTGAAAACACGAGCCCCCGTCTCTTAGGAGGCGCGGGAAGGAAGGTACATGATAACTTCTGTAAAGAAAGATGGGATCAGACTTATGTTGAAAAAGGAAGCTGGTAAAATTCTCTGCTAGTGATTCATGTACCACTATGAAGCATTTGAGTCAATGGTTATGGATCTCAATCGACTCCACCATTTTCCAGGTCTCAGAACGGCTAGCGATTGGATGAACATTCTTTGATGTAACTGTTCTATTAATTCATTATATTAGTGGTGTAAAACTTTCTGGTTCTTGTTTGATCCAACTTTTATTTTCATTGTCCATTATTTTATTGTCCATGAAGATGACAAAACCTTTTCTACATTTTTCTGGCTTCAGAACTTCTCTTACCTCTGATTGCTTTGACTCTAAAGATGCTATAATAAAATTACTGATTGATATTCAACTG\n>URS00016BEEAD rRNA from 1 species \nTACGAAGGGTGCAAGCGTTACTCGGAATTACTGGGCGTAAAGCGTGCGTAGGTGGTTTGTTAAGTCTGTTGTGAAAGCCCCGGGCTCAACCTGGGAATGGCAATGGATACTGGCAAGCTAGAGTGCGGTAGAGGGTAGTGGAATTCCCGGTGTAGCGGTGAAATGCGTAGAGATCGGGAGGAACACCAGTGGCGAAGGCGGCTACCTGGGATGACACTGACGCTCATACACGAAAGCGTGGGGAGCAAACAGG\n>URS00011B15C7 rRNA from 1 species \nCCCTTAGATGTCCTGGGCCGCACGCGTGCTACACCGATGCATACAGCGAGTACTTTCCAGCTCCGCGAGGCAGCTGGTAATCAGCAATATGCATCGTGCTGGGGATAGATCTTTGGAATTATAGATCTTGAACGAGGAATTCCTAGTAAGCGCAAGTCATTAGCTTGCGCTGATTAAGTCCCTGCCCTTTGTACACACCGCCCGTCGCTCCTACCGATTTCGAGTGATTCGGTGAACCTTTTGGACAGCGTCTGTCCTCGTGTCAGATGCTGAAAGTCAAGTAAACCATATCACTTAGAGGAAGGAGAAGTCGTAACA\n>URS000170A9F1 rRNA from 1 species 
\nAACGAACGCTGGCGGTAGGCTTAACACATGCAAGTCGAGCGCCCCGCAAGGGGAGCGGCAGACGGGTGAGTAACGCGTGGGAACATACCCTTTTCTACGGAATAGCTCGGGGAAACTGGAATTAATACCGTATACGCCCTACGGGGGACAGATTTATCGGGGAAGGATTGGCCCGCGTTGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCAATAGCTGGTCTGAGAGGATGATCAGCCACATTGGGACTGAGACACGGCCCAAACTTCTACGGGAGGCAGCAGTGGGGAGTATTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCTTGAATGATGAAGGCCTTAGGGTTGTAAAGCTCTGTCACCGGAGAAGATAATGACGGTATCCGGAGAAGAAGCCCCGGCTAACTTCGTGCCAGCAGCCGCAGTAATAC\n>URS00021A8CBE lncRNA from 1 species \nAATCATTTTGTTGTACAAGTCAGCATGAGTTATCAAAAGGACATGAAGGCACCCTAACATTATGGAAACAAAAATTTAAAAAATTTGCTGATTTAGTATGCTGGTATATAGATGTATGAATAAAAGTGCTCACATGGTCAGTTTTGGTCTACACTGTCAAATAATTTTGTTGCACAAGTCAGCAAGAGGTATCAAAACTACTGAAATTTTGTTACGTATCAATATTTTGAATAAAAGGAGGACATATGCTGGCACCCTAAATTTA\n>URS00020CA31D rRNA from 1 species \nGATGAACGCTAGCGATAGGCTTAACACATGCAAGTCGAGGGGTAACGTGTTGGAAGCTTGCTTCCGATGACGACGACCGGCGGATGGGTGCGTAACGCGTATGCAACTTGCCTCACAGTGGAGAATAACCCGGAGAAATCCGGACTAATACTCCATACACTCTTAAGTACGCCTGTACATGAGAGGAAAGATTTATCGCTGTGAGATAGGCATGCGTCCTATTAGGTAGTTGGTGAGGTAACGGCTCACCAAGCCGACGATAGGTAGGGGTGCTGAGAGGCAGATCCCCCACATTGGGACTGAGACACGGCACAAACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGAGGAAACTCTGAACCAGCCAAGTCGCGTGAAGGAAGAATGTCCTAAGGATTGTAAACTTCTTTAGCGAGCGAGTAAGGACTTCCACGTGATGGGAGTTTGAAAGTAGCTCGAGAATAAGTATCGGCTAACTCCGTG\n>URS0002179DC9 lncRNA from 1 species 
\nATTACTTTGTTTAGAAAAATTAACATTTTTCTGGTTATGATGTAAGACACACAAATAGCTACTTTGATTTTTATTTAACAAATACATGAACCATTCCCCATGCTCCGAATAAGTCATCATGAGTCTATAAAATCTTGTAACTTTTTTTAATGGTACTTGAGACAGTTTACATTGTTTTATAGAACAAAATACAATACTTCTAATTCTCCTCATACTGCCTTTCAACTCTACGGTGAGAGCTGTGCATAAAAACATAGCAGCTTGGGTAGCTCATGGGTTGCAACATAATCTCCGCATTGGGTTGGGCTGGGGGATGGCAAGGAAGGCATTCTAAGATATAAGTTCTGAGAATAAAGAAACAGAGATTTCCCTCAAGAAAATTTATACTTGTCTCCTTTATAAGCACAGGTCCCATACAAAAAGTATTATCACTGAATTGCTCTGTCTGACTTATAAGCTATAATTAAGATTCCAGTCTGATGTGGAGCAGCTTAAAATAGCATCACACACCCTGTTGATTCTTGCCTAGTTGAAACAGAAACATAAATTTGAGGGAAGAAGGTGGAAATGATTATTATCAATTCCCCTTTAATAATACTGATATAGGTATCCATGGGCACAGAAAATTAAGTAAAGTAAGTATTCCAAATTATCTCCCTCTTCAAATCGCTTATACCTGATTTTGGCTGGGCAGAGATTTACTAATAAGGAGGTGAGGGTTTACTTCCAGGAAAAGCTATAATAGTGAGACAGAAGTTCAGGGCAGAGCAAGCACCAAATATAGGGCAGTACAGATAGTGACCTGCTTGGGACCTAGGAACTAGGTAGCATGTGGAGTAGCAGGAGGAGAGCCTAGAAGACAAGCGCTTGACCAGTAAAGTGAGAAGACCTGCTCAATTTAGAGAAGGATTTGCAAGTAAGAAACAGAACATTTCTTGAGTATTTACCTAATTCTAGGTTGATACTAGGTACACTTCATTTAAACCTAACTTTAAAAAGTCAGAAATATCCATCATTTCACCAATTCACTCATATGGAAACTGAAGCTATGAGGTTCCCTACCATAAATCCCACATAATGAAGCTGGGACTCAAACGCCCGCATAATTTAAAACTTTGTGCCCTTTTATGCTAAC\n>URS00012349DE rRNA from 1 species \nCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGTTTTGTAAGACAGAGGTGAAATCCCCGGGCTCAACCTGGGAACTGCCTTTGTGACTGCAAGGCTAGAGTACGGCAGAGGGGGATGGAATTCCGCGTGTAGCAGTGAAATGCGTAGATATGCGGAGGAACACCGATGGCGAAGGCAATCCCCTGGGCCTGTACTGACGCTCATGCACGAAAGCGTGGGGAGCAAACAGGATTAGAGACCCCAGTAGTCCCTGTCTCTTATAC\n>URS0000B93F3B rRNA from 1 species \nTGAGCCTACGGGGGGCAGCAGTGGGGAATATTGCACAATGGGGGGAACCCTGATGCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAATCTCTATCAGCAGGGAAGAAGATGACGGTACCTGACTAAGAAGCCCCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGTAGGCGGACAGTCAAGTCAGCGGTAAAAATGCGGTGCTCAACCCCGTACTGCCGTTGAAACTGCATCCCTTGAGTGCGCGAGAAG\n>URS0000854D01 rRNA from 1 species 
\nAGAGTTTGATCATGGCTCAGATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACGGTAACAGGAAGCAGCTTGCTGCTTTGCTGACGAGTGGCGGACGGGTGAGTAATGTCTGGGAAACTGCCTGATGGAGGGGGATAACTACTGGAAACGGTAGCTAATACCGCATAATGTCGCAAGACCAAAGAGGGGGACCTTCGGGCCTCTTGCCATCGGATGTGCCCAGATGGGATTAGCTAGTAGGTGGGGTAAAGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGTCTTCGGGTTGTAAAGTACTTTCAGCGGGGAGGAAGGGAGTAAAGTTAATACCTTTGCTCATTGACGTTACCCGCAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATCTGATACTGGCAAGCTTGAGTCTCGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACGAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCGACTTGGAGGTTGTGCCCTTGAGGCGTGGCTTCCGGAGCTAACGCGTTAAGTCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCACGGAAGTTTTCAGAGATGAGAATGTGCCTTCGGGAACCGTGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGGTCCGGCCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGCGCATACAAAGAGAAGCGATCTCGCGAGAGCAAGCGGACCTCATAAAGTGCGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTGGATCAGAATGCCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTAGCTTAACCTTCGGGAGGGCGCTTACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACCGTAGGGGAACCTGCGGTTGGATCACCT\n>URS0001C3A371 rRNA from 1 species 
\nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACGGACGAGAAGCTTGCTTCTCTGATGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTGCCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATGATATTTTGAACCGCATGGTTCAAAAGTGAAAGACGGTCTTGCTGTCACTTATAGATGGATCCGCGCTGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCATAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACCCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGAACATATGTGTAAGTAACTGTGCACATCTTGACGGTACCTAATCAGAAAGCCACGGCTAACTACGTG\n>URS0001B15B4F rRNA from 1 species \nCCTGGTTGTTCCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTGTAAGTATGAATAAATTCAGACTGTGAAACTACAAATGGCTCATTAAATCAGTTATAGTTTGTTTGATGGTATCTACTACTCAGATAACTATAGTAATTCTAGAGCTAATACATGCAACAAACCCCGACTTCTGGAAGAGATGCATTTATTAGATAAAAGGTCGATGCGGGCTCTGCCCGTTGCTACGAGGATTCATGATAACTCGACGGATCGTACGACCATCGTACCGGCGATGCATCATTCAAATTTCTGCCCTATCAACTTTCGATGGTAGGATAGTGGCCTACCATGGTGGTGACGGGTGATGGAGAATTAGGGTTCGATTCCAGAGAGGGAGCCTGAGAAACGGCTACCATATCCAAGGAAGGCAGCAGACGCGTAAACTACCCAATCGTAGTTGCACTTTGGGATGGGCCGGCTGGTCCGCCTATGGTGCGCACCGATCGTCTCATCCTTTCTGTCGGCGATGCGCTCCTGGCCTTAACTGGTCGGGTCCGGTGCTGTTACTATGAAGAAATTAGAGTTCTCAAAGCAAGCCTACGCTCTGTATACATTAGCATGGGATAACATTATAGGATTTCGGTCCTATTACGTTGGCCTTCGGGATCGGAGTAATGATTAACAGGGACAGTCGGGGGCATTCGTATTTCATAGTCAGAGGTGAAATTCTTGGATTTATGAAAGACGAACAACTGCGAANCTGCGAAAGCATTTACCAAGGATTTTTTCATTAATCAAGATCGAAATTTTGGGGCTCGAAGGCGATTAGATACCGTCCTAGTCTCAACCATAAACGATGTCGACCAGGGATCAGCGGATGTTGCTTTTAGGAATCCACCGGCACCTTATGAGAAATCAAAGTTTTTGGGTTACGGCGGGAGTTTGGTCGCAAGGCTAAAACTTAAAGGAATTGACGGAAGGGCTCCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTTACCAGGTCCAGACATAGTAAGGATTGACAGACTGAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTNGATGGCTGTTCTTAGTTGGTAGAGCGATTTTTCTGGTTAATTTCGTTAACGAACGAGACCTCAGCCTGCTAACTAGCTATGCGGAGGTATCCCTTCGCGGCCAGCTTCTTAGAGGGACTACGGCCTTTTAGGCCGTGGATGTTTGAGGAAATAATAGGTCTGTGATGCCCTTAGATGTTCTGGGCTGCACGTGCACTACACTGATGTATTCAACGAGTTTATAGCCTTGGCCGACAAGCTCGGGTAATCTTTGAAATTTCATCGTGATGGGGATAGATCATTGCAATTGTTGGTCTTCAACGAGGAATTCCTAGTAAGCGCGAGTAA
TCAGCTCGCGTCGACTACGTCCCTGGGCTTTGTACACACCACCCATCGCTCCTACCGATTGATTGATCCAGTGAAATGTTTGGATCACGTCGACGTGGGTGGTTTGCTGCCCGCGACGTCCCGAGAAGTCTATTGAACCTTATCATTTAGAGGAAGGAGAAGTCGTAACAAGGTTTCCGTCGGTGAACCTGCGAAAG\n>URS0002562826 rRNA from 1 species \nATGCCACCTGTTCAGGGAAATGGGCAAGCCCTAAACGGCAACAGTCAGCAATCTTCTCAGCAATTTCCAACGCCAATCTTGTGGCAGCCAACCAGCAACCACTCAATGCAACATGGCGAAGGATGTAGTCTGCCACCACCTAGCATGCCGAATCCATTGCCAGTAGCAGTTCCAGGATATTATCCACCTTTACCTGCTTTTGGACAGGACCACTGCACTAGTTTACCTAATGCAAGTTCTCAACTTGAATTTCGGAACTTCCCAGCGTACATGCCGTTTAATGATATTCCCCAGGGGAATTCCATTCTTGGATGGGAAGAATTTGTTGAAGATGTAAGTCATTCAAATGTCCGGCCACCAGTTGAAGAGCATTATGTAGATGCGTCATTTAGATGTAATCAAGTGCTACTTCAATGGGATGAGCCTCATATGGAGGTCAAGAAACGTTGGAACTTTCTTGATCAGCTCATGCCGCTGTATAGCACACAATCAGGGTTTTATAAAGAAGATTTCCCCAGTACGAGCCTCATGGATAAAACCCATAAGTTACTGGCCAGTATTTCATCAGACGATTCTGTTTGGAAGATAATTACCAGTGTTACGAGTCGAGCCACACAAACTCCTCAGAGGAGAGGTGTTCTCATTCGGCCCATTGAGCCATATGATTCAGATGATGGGCCACCAATTAAGAAGCAAAGGACCAAATATCAATTGCGATTTGTCAATACGGTGTGCAATGACTACTTCACACGGGAGAATATCAAATCAGAGGATGGAAATCTCTTAAAGGTGGCTTTGTATGATGAGAACAATCTGGTTGTCACATCTGGTCCGCTGTCTGCAGCTTTTGTGGAGATCGTACTACTTCATGGTGATTTCAATGCTGAAGGTCAAGATTATTGGACATCAGAGGAGTTTAGTGACTGCCTAGTGCATCCACAATCTGTAAAAGAACCACCAGCCTTGGGAGGTGATCGTGTCTTGACACTGACTGATGGAGAAGCAGACCTTGGTAATGTCTATTTCCGAACTTCCTCCTTCCATGCTAGAACTGAAAAGTTCAAGATGGGTGTTGAGATTAAAAATGTAAGAGAAGAGTGTGTTCAAGAAGGAATCACTAGCCCTTTTTTTGTGAGAGTTCGCCAAGGGGAAGAATCAATTGGCCAATGGATCACATCCCTCAAAGCATCGCTCAGAGTGAGCAAACAAGTCCCCCCGCTGGAGTGCGATGCTAGGAAATACGTCGACGCATTAGCAGTTAAAATGAGCACGGAGGAAAAATTCAAAACTGGAAAGCTTAAGGTAAAAAGGGAAAAAGATAAGAACAAATATGAGGAAGATCTCAGAATACTCATGGAAGACCACCAAGAGTTCACATTAAAAACCGAAGATATGCGAAAGGAAGGGCGTGCTGAGTTAAATCATTACATTCTATCTCCACCTCAGAGATCAATGGTTATCCAATCAACAAGATTTCGTCTAGTAATTGAAAATAGTGTGAGCAGAACAATTTACAAAAATAGTACTGTAAAGACCGAGGATGGCGGAGATCACATAAAAGTTGTCATGTACGATGGTGGCAAGCCAATTGCATTTGACCACCCTCTTGCTTCAATAACAGTTGACCTAGTTATCATTGAAGGAGGGTTCGATGAAAAGCGAGATTCGTGGTCTAAAGAGGAGTTTGAGGAAAGCATAATAGAACCAAGAAAAGGAATCAAAAGGCTAGTGAAAAATGGTACATTTGATTTGATTGATGGGAGG
TGTGATCATCATGGTGCCATTATTATGGACAATTCACTACGAATGGAAGTTAAACTTGGAGTAAGGATCGCAGTGCATACAGACATAAGAGTTATTGAAGGGGTATCAAATCCTTTCAAAATGAAGGAAGTCCGGACAAGAGTACATGGAAAGAGTACTATTCCATACAAGGACGACGCGGTACATCGACTGAAGAAAATTGCCCTGAAGGGAAAACATTGGAACAATCTTGAGGATCAATATATTACCAAAGTGAAGCACTTGTTGCGCCATTATCACAAAGATAAATTTGGTCTCCAAAAGCTTGTTGACATGAAGAAAGAGGATTGGAATACCATGATTAATCATGCCACCATGTGTGTTCCTGGGGATGAGATCTATTCCTACTGTGTTCAAGAGGATAACTGTGAAATCCTATTCAATGATTTCTATGATCTTGTCGGTAAGATCACTGATGACTATGTTCCGTACAGTGTCAATGACGTCGATCAGTTTCCGCAGCTTAAAGTGAACAACTGGAAAAAGTCTGCGTATAAGAAGTTTGACGAGAGGGAGAACTCAGGGCTCTTTGGTCTTACTCCTGATTACTTCATGAACAATGGCCGCCCAGTCCGTGCAGCGCCCCTGAACAATGACGCAGGTCCTACTGTACAAGCATCTACATGGCAATATCCTAATGACAGGGCTGCACAACACGGCCTTAATAGAAGTGCAGTCTGCCAATACACAGATGCCTGGAGTCCGGCTTCTAAAAATACCAATCAAAATAATGTGATTCCTCCAACGACGACAGCAGATGGGAATGGGATGCTTGGGTCACTGACAATGGGGACAAGCAGCACCAGCGACATGAAGAAGAGCATGATGGAGGACGTTGCCAATGGTCTCTTCAATTGA\n>URS0000051310 piRNA from 1 species \nCAGGTCTTGTTTTAGTTGGACGAGGA\n>URS0000A621CB tRNA from 1 species \nAAAATGCCAGCTTTGGGAGTTGGTGATGAAGGTTCGACTCCTTTCTTTCTGA\n>URS000113D973 rRNA from 1 species \nTACAGAGGGTGCAAGCGTTGTTCGGAATCATTGGGCGTAAAGGGCGTGTAGGCGGTTTGGTAAGTCATGTGTGAAATCCCTCGGCTCAACCGGGGAACGACGCATGAAACTGGCAAGCTAGAGTACCAAAGAGGGCGGTGGAATTCCCGGTGTAGCGGTGAAATTCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGGCGATCTGGACGGATATTGACGCTGATGTACGAAAGCGTGGGGAGCAAACAGG\n>URS00001901B3 rRNA from 1 species \nTTAAAAGCTCGTAGTTGGATTTCTGGCAGGAGCGACCGGTCCGCCGCAAGGTGTGCACTAGGTCGTCTCCAGTCATCTTTGTGGGAACTGCTCTGGCATTAGGTTGTCGGGGTTAGGGAACACATCGTTTACTGTGAAAAAATTAGAGTGTTTAAAGCAGGCTTATGCCGTTGAATACATTAGCATGGAATAATAAGATAGGACTTTGGTGGTCTATTTTGTTGGTTTGCACACCAAGGTAATGATTAATAGGGATAGTTGGGGGTATTCGTATTTAATTGTCAGAGGTGAAACTCCCTTGGATTTATGAAAGACGAACTACTGCGAAAGCATTTACCAAAGATGTTTTCAGGGTAATCAAGAACGAAAGTTAGGGGATCGAAGATGATTAGATACCATCGTAGTCTTAACCATAAACTATGCCGACTAGGGATTGGTGGTCCGTTCATTATGA\n>URS00005FFC84 siRNA from 1 species \nTGACTTTGGAGCCATTCTTCCC\n>URS00005C67CE rRNA from 1 species 
\nTTAATTATAGTTAAATAGTATTGTGAAAGAAAATTGAAATAATTTGAAAAATTAATATTTTAAAAGAAAATTTAATTTATTGTACCTTGTGTATCAGGGTTTATTAATTAAAAATTATTTACTATAATTTTCTCGATTTTAAAAGAGTTAATATATTATAAAAGTTAATGTGACAAAATTATTTTATATAGTATATTAGAAATGAAATGTTATTCGTTTTTAAAGGTATCTAGTTCTTTAAGAAATAAATTTAATTTAGAAATATTATATTATTTAGTTAAATGTATTAATTAAATAATTATTTTATTTTAATATTTTATGGGATAAGCTGTGAAATAAATTATTAAAAATTTTTAAATAGTTTAATAAATATAAGCTTAGAAATAGTTATTATTAATGAAATTGTTATAATTTATTTTATAATATTTATTATTTATTAAATTTTAATTATGTATTAGAGTATTTATTTTAATTTAAAAAATAAAAAAATAATGATAAAATTAGTATATTATGATGTATAAATATGTGAAATTGATAAGTTTTTATAAAGAACTCGGCAAAAATAATGTT\n>URS0001988726 lncRNA from 1 species \nCACATGTTATGGACATTTTTATTTATTGACATGGTCAAATTAACAGGCAGCAGCATTTATTTTTAATGATAGCCTTGAAATCAGCCCAGGAAGAAAGTTAACATTGATGTTCAGAATACTGCATGCCATCCACATTTTTCCAGATGAAAGTATATTTTAAACTAATAATTAAATATTGTCACCCTAATTAAGTTACCTTGAGCAGGTGAGAGAAACACAGTTCTTAGTCATTGCAAATCTTGTTTGTCCTATTCTCAAGCTGTACAGAAAAACTACCCAGCAGGAGAAATTCGGCAAGCTCCATGGTTTAAAGTGTGCACTTAATTTAGGTGAATGATAAGCTGTGTCTATAAAGATTTGTGTTGGTCACCACGGAATGGAAGATTCCTGTGAAGTAGACAAGATGTAATTGCCAGTAAATATCAGTGCTAGCTTGGCCACACAACATTCACAGAGCAGGAGGGAATATCTTGGTATATTTATTATTACAGTGGGGAATTTTGACAGTCACCTTAATCACTCTTTGAGACAGGTAAAGAGAAAGGAACTGGGCAGCAGCACAGTTATCAGCTGGGTTAGAGAAAGCACACAGAGCAAAGGAGAATGAAGAGCATTTCACAAGGTATTTTAAACAGGTTTACATTGGGATGAAGATATTAGGAGTTTTTAGATATTAAGCACTTGTGGAAATTAAATCATTGCTTCATGCATTTAAAATTTACGCCCTAGAAGTACCTTCACAAACCAGACTGCCCACTTTAAAACTTCTGATCTACCCACCTTAAACAAGAATATTCTATAAATTACAAAGAAAGACTGGGAAATGATCTGTGTGTAATAGCTGAACCAAGCAATTTGCATATTTTCATGAATTACTGTAATGTGTTCTGCTTGTAATTTCACTTGTATACAAAGGATCACAGTTGCAAAAAGTACCAACTTTTCATGTTCAAAAGTGATTCAGGAGTCGAATTTCCTAGTCCAAAATGCTGAGACACTTAAAAATTAGAAGCTGAAATCATTGTTCTCTTCATTGCACTAGAAAGTTTTGCACTAAATCCTGCTCAGTGGCTTAGATATGAGCTGGAAATAATTTTTAGGAAAGCCCTGAACCAGGACACACTATTAGAGACTCCTTGGTTCTTTTGACTTGGCATTCACACATGTGCATGCAGATATGCAGATAGCCCTGTCATGATCTATTAAAAAAACAAACAAACAAAAAAATCTAGAAAAATCAATTTTCACTGAAAGATTCCAGTTTTTTTTCAGGGAAGAAAAGGTCTGTAAGCTTACCTGAGAAAAAGTTTCCACAGCAATTTTATTTTTTAAAAATGGTGATGAACGACCCACAGTGAACGTGGGAGAAGGATCCAATTTCTGCCCA
CGAGGGAGAAGAGTGTGTGCATGGTGGGCACCTCAGGCTGCAAGAGCAGGCACAGGATAGGGCATGGGCACGCAGGGCAGCTGCCTGCAGCTCCTGGCCAGTCTCAGCCTCTGTGGGGTCCCTTAGAGGGGTGAATTATTGTGCCCAGGGAGCTCCCCCCCCCATCCTGGCCAAGTCAGGATACATTTTTATAGCCCTTCTTCAAGTGATAGAAATATCAAGGGGAGGGCAAAATATATGGGAGGAGGGAAAGGGAGGCAGTTTCCAGTATTTGTCATTATTATAGGTTATATATACAGGAAGAAAGTTAATTAAGCTTTAAAAAATCCATCACACATCAATGGGTGCATTTTAATGAGTAGAAAAAGTTGAGATGTTTACTGCCAATTAAAGTGGTTTTTAAATAAGCATTAATTAACACAGAAATTCAGAAGAAAGTTATACCTTGTCAAAGAAAGGCCAGTGCAGTCTATGCCCACTTCTGCTCCCATTCATACTCAGATAGTAATTACCACCAACCCTATATTTTCCATAATAATGAGGAGAGGCTGTCATGGCTGTCAAACAAAAACAAAACAAAAAAAAAAAGAAAAAAAGGTGCTGCACAAAAATACCCTCAATCTGAAGTAAACTTTTGTTTTTAAATGTATAATAAAAAGCCACAGGAGACAGCAATATGGGGCAAGGCAGTGAGTGGGGCAGTCAGGCAGCCATGCCAGAGGCAGCTGCACACACATGGCTCCTTCCTAGGGAGCAGAGACTTTGGAACTCAGGATGAAGCCTCTCCAGACAGTCCAGCTGAAGAAAGACTGAAGAAAAGCCAAAGAAAAAGCAGTTCGTTCCTAGTTTCATCCCTAGCGCTGGAACTCGTGGAGGAGCTGATTCCCCTGTTAAAGCCAGAGGAGCTCGTTTTTTCCACAAACAAGTGCTGACAGACTAGCTCCATGCTTCCCAAAGTCAGATCAAAGCAACCACTGCAAATAAGTTCAGCTTGCATGTGCACTTCCAGCTGGAGCAACTGGTGACAGGAAAAACAGTACGACCCTCAATTCTGTCACTTCTCCATTCTTGCAGGATTTCTTAATAATTGTCAGGAGTTTCAGCTCTACTTCAGCTAGTGTCAAATCCTGATGGGACAGCAAAGGAAGTGATTTCTCCCATTGTTAGTCTGGTGAATGTTTAAATATCTTAGGAAAACCTTCCTTCCCCCAAATGCATCTTAGGCACCAAGTAAGATTTTCAAACTGCCTCATTGAGAATGGCTTCTCTCCTCACTTCCCCAGCTCCAGCTGTGGAGAGATAAAAACCCCACTGCCTTTTCAGACAGCAGAAGAGGCAGGTCACATAAAAATTTGTTAGTAGCCTAAGAAATTTTACAAAAATCTCTGGTGTAGTGTTTTTAAAGTTAATTTAAAAAACAAAACAAAACAAAACAAAAGAAGCAACAAAACACAGAAAAGAAGGCTGTAGATATGCACAGACTCCTGTTCCTAACCCTTGGCATTTCACTCAGATAATGTGCAGCCTCTCTGTAGCTTGTGTCTATCAGGGAGTATCTGGGAGCCTTTTTCCTACTCCATGTCCACAGGCAATATCTGCAGTAGAATAAAAAAAGGAGAGCATTAAATGCCATGGAAGTTTTGTTGAATGTAACTGGACAGGGCCTTCAGATCTTG\n>URS0000ADFB99 rRNA from 1 species 
\nTTCTAACAGAAATAATTGTTAGTAAATCCTGCTCAATGATTCGTTAAATAGCCGCAATAACTTGTGCTAAGGTAGCATAATAATTTGCCTATTAATTGTAGGCCAGAATGAAAGGATTAACATAAGAAATTCTTTATTCATTAAATAAATTTAACTTCATTTATAAGTAAAAAAGCTTATATTTTTTAGAAGGACGACAAGACCCTGTCGAACTTCACTAAAGTTTTACTGGGGCGGTAAAAAAACTAACACTTATTTTCCATTTACAAAATATAAACATAATGTTAATTCTAAACAAGTTACCGCAGGGATAACAGCATAATTTTTTCCTAAAGATCTTATTAAAGAAAAAGATTGTGACCTCGATGTTGAATAATTTATCTTATTGGGGCAGCACCTAAACAAGTAAGTCTGTTCGACTTTTAAAAAATTACA\n>URS00009AD4FC lncRNA from 7 species \nACGCCGGCGTGAGAGGGCACGGGGAAAAAGGTGGCTCTGGCCGGGGCGGCTCTGTTTCCTGGGGTTATGTAGCAGGGCTTGTCGGCTCGCGAGACCTCCCGCTGCCCTCGCCCGTGTCCTAGCGCGGGGTTTCTGCTCCGGGCGGAGGCCGTGTTCAAGCCCGCCGCGCTCCCTCGACGTAGAGCTCGCTCGTCCGCCCGTGGGAGCGTCCCGGCCGAGCTGCGCTGAGGGGGGAGGGGAGGCCATTTTGTCCCGACCGACTCCCCGGAACCGGGCGGAGCGGCTGGGAGAGGCTGCGGAGCCGCGGGCGCCGCCCCTCGGAGGCACGGGCGCCGCCACCGTCGGGGCTTCCTCGACGAGGCCGTTCGGAAGGTCTCCTGCTCCGTCTCGAGAGCTGCTTTCTCCTTCCGCACACGCTACCCGGCTGCTGCGGCCCCAGAACGCCCGGGTGAGGAGTTGGTTGTAGTGAGCAGTTCCGATCCCTTGGGGCTACCGGCGGCGAGCGCCCGAGCCGCTCCTCCCAATGGCGAAGAAGACGTACGACCTGCTTTTCAAGCTGCTCCTGATCGGGGACTCGGGAGTGGGCAAGACCTGCGTCCTTTTTCGTTTTTCGGACGATGCCTTCAATACCACCTTTATTTCCACCATAGGTAAGACCTGTGGGAGGATGGTGTGGGGGCTCTGTAGCCGCGAGCCGTTTTCTTTTATTCCAGACATCTTGCTTCCCGGAATTTACGCCTTTGTTCCAGTGATTCCGATTCCAGACGACAGACCTAAGTTACTGTTGGAATCGGAATAGCCTTACTGGGGCGGGGTCTTCCCATGCTTACCATCCGGTCTCAAGTCTCCTTCTCTGTTCGGTGCCTTCTGGCACAAAATATGCAGCATTTAGCAGCGTTCCAGAATCCGGTTTCTTTAAGTGACTTGCCTGGCCTTACCATAATTGCATGAAGTTACTTGATGTGCTATTTGTAATAGACGTAATTTAGTGGTTGGGATTGAAGCAGTACTGGCTATGTGGCAAAGGCCCGAATTGGGGGTCAAAGAGAAAATATTCTATCTGACTGTAACTTGGAGTAAACTTGAGAGTTGCAGAATCATTAAGGAAAATGAGAGGGGCGGGGGAAAGTGAGTTGGCTGTCTTGACTGAACCATTGATGTGTCAAACAATCGGAGGCCCTTCGTGCTTGGGGTGGGAATCTGGCATGGTTGGCTCACAGTGCTTTTTCAAGACCTCAACGAAGCAGATGGACGGTTTCTGTTTTCAACCCAATGGAATCAAGTCAAGTTCTAATGTTTTACTTGATGTTAGAATTTACAGGAAAATCTTTCGTCAGTCATGGCTCTAAGGACTTCTAATGTACTACCACATATTTCGGAATTACTTGGTATGGAAATAAAAACTGACCTTTTAAATGGGTTTCCTGTTTCGGAAATGAAAAGGGAAGGTTTCAAGAAAGTCGTTTTGACGCTGGCACCAACATCAATTTTGTCAAAGTAACTGTACATGACCACCCCCCTC
CCTGGTTTTTTAAAGTATCCGGTGTCTTTCATTTTTGAACCTCAGCTCCGGCATTAGAGCAGTGCAGGAAAACTTGTGATAAATGTAACTAGCTTCACGATGAGAAGCGACTCTAGTGGTTTTCCTTAAGAATTGTGAAAATCTTGTTTTAACCAATTTATAGTATAGGATTTCCTTAAGACATATTTGTAAGTAGCTTAAGCATATTTTCGCAAAATATGCTTAAGTTATACTGCAATTAAGATGAGCAAATTTTTATTTAAAATAGGTTGTTTTACCTTACTGGTGGGCAGGATTGTCAAAATATCACGAAGCTTGAACTTGTCCTCTGCTTAGTGGGTTAGCACTTACACAGCACTAAGTTTGCTTTGAAGTGTAGCTGGGTCAGTCAGGTGGCTAGATCAGCAAATATTTATTGAGCACCAAGTTCTAGGCACTGTTAAAAGCGTTGAAAATAAGTGGTCGATACAATAGACCCCTTGAGCATTCTGATAAAGAAGGCAACAACAGTGTGCAAAGCACTAGAGTGAGGAGAGGGAGGAAGGGGAGTAGTCTGAATTATGGGGAATCTGCTTTGCATGGATGTTTAAAACGTAGTCTGAAAGACAAGTATGAATTGGATCAGAGGAGAGGTAGCCTCTTTGAAAGAGAATTTAGTGTGCGATCCTTTTTTTTTTAACCTGCTCTTGAGAACGGGTAGGTGAAAGTAGGAAGTAAAGTTTCCTGGTGAAGAAAGCTACTTAGCCCCCCAGCTGCCTGTCCTCAGGTACTGGGCATTGACTAACCTCATGCGTGGTAGGCAAGCTGCTGAGTTACACCTCCAGTCCTCCTTGTATCCATAGTCTTCATTGTCCTTTGACTTAGGGAGATGGGTTGTTTCCCATGCAGCCTGCTGTTTTGAATTCCTGGCTCCACAGGAATTGCAACTTTGGCTACAGTGTCTTATTCGACAGTGCAAATGCCATGTATGGTGCTTGTGAGGATTAATACAGGTCAGCGAGAGCAAAGCACCTAACAATGGTGCCAGGTACTTTGTAGGAACACAGTGCAGATTTGTGCAGAATATATGGCCTTCCTGATACTGGTGTGTGACAGAATAAGTTGCTTTATGGATTGAATATGTCTTGTGTGTAATGGCTGCTTGAATATCTGTTGGTGCTCTGCTAAACAATTATACAATAACCTCTGACATTTATACATTTTGATATAAAAACATTTGATGTTTTGACACAAGATTTGAATAAAGTAAGCTAAGAAAATGAACAAAATTCTGACAATTCTTAGTCCAGCTCATACTTGACTCTTTGCAGATTTTGAATTCTGTTAGCCTCATAAACTTTGGTAGTC\n>URS0000A9B0F3 lncRNA from 12 species \nTTTCCTTCCTCTTTTCAAGCTTATTGAAGGAGCCAAATCATTCCAATTCAGCCTGGACTGACCTTTATGTGCTTCATTTTAGTTTAAAAGAAACCCAAACTTCAGTTCTCTGGGATTCTGGGCTAAACATTAAGGAATCCATTCAAAGGTTGTACCTTCCTCCTCATGGTTAACCATTTCAAAG\n>URS00013E7246 rRNA from 1 species \nTACGTAGGGCGCGAGCGTTGTCCGGAATCATTGGGCGTAAAGAGCTCGTAGGCGGCCTGTCGCGTCTGCTGTGAAATCCCGGGGCTTAACCCCGGGCGTGCAGTGGATACGGGCTGGCTGGAGGCAGGCAGGGGAGAACGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGTAACTGACGCTGAGGAGCGAAAGCATGGGGAGCGAACAGG\n>URS0001D4A06F rRNA from 1 species 
\nAACGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGCCCTTTCGGGGGAGCGGCGGACGGGTGAGTAACGCGTGGGAATATGCCCTTCTCTACGGAATAGCCTCGGGAAACTGAGAGTAATACCGTATACGCCCTATGGGGGAAAGATTTATCGGGGAAGGATTAGCCCGCGTTGGATTAGGTAGTTGGTGGGGTAATGGCCTACCAAGCCGACGATCCATAGCTGGTTTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCGTGGGGGAGGCGGCAGGGGAGAATCTAAGAAGTGGGGGGCAACCATGAGTGAGCACTGGCGGGTGAGGGATGAAGGCCTTGGTGTTGTAAAGCTGTTGACGGTGGGAATAAAATGGCTGTACCAGCAGAAGAAGCCCAGGACAACTCCGTGCCAGAAGACGAGTTAATAGTCAAAGACACACGTCTGAAC\n>URS00022CCAAD rRNA from 1 species \nTGGAAGCGTCTGGAAAGGCGCGCGATACAGGGTGACAGCCCCGTACACAAAAGCGCATGTGCTGTGAGCTCGATGAGTAGGGCGGGACACGTGGTATCCTGTCTGAATATGGGGGGACCATCCTCCAAGGCTAAATACTCCTGACTGACCGATAGTGAACCAGTACCGTGAGGGAAAGGCGAAAAGAACCCCGGCGAGGGGAGTGAAAAAGAACCTGAAACCGTGTACGTACAAGCAGTGGGAGCACCCTTTGGGGTGTGACTGCGTACCTTTTGTATAATGGGTCAGCGACTTATATTCTGTAGCAAGGTTAACCGAATAGGGGAGCCGCAGGGAAACCGAGTCTTAATTGGGCGTTAAGTTGCAGGGTATAGACCCGAAACCCGGTGATCTAGCCATGGGCAGGTTGAAGGTTGGGTAACACTAACTGGAGGACCGAACCGACTAATGTTGAAAAATTAGCGGATGACCTGTGGCTGGGGGTGAAAGGCCAATCAAACCGGGAGATAGCTGGTTCTCCCCGAAAGCTATTTAGGTAGCGCCTCGTGAACTCATCTCCGGGGGTAGAGCACTGTTTCGGCTAGGGGGCCATCCCGGCTTACCAACCCGATGCAAACTGCGAATACCGGAGAATGTTATCACGGGAGACACACGGCGGGTGCTAACGTCCGTCGTGAAGAGGGAAACAACCCAGACCGCCAGCTAAGGTCCCAAAGTCATGGTTAAGTGGGAAACGATGTGGGAAGGCCCAGACAGCCAGGATGTTGGCTTAGAAGCAGCCATCATTTAAAGAAAGCGTAATAGCTCACTGGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTAAACCATGCACCGAAGCTGCGGCAGCGACGCTGATGCGTTGTTGGGTAGGGGAGCGTTCTGTAAGCCTGTGAAGGTGGCCTGTGAGGGTTGCTGGAGGTATCAGAAGTGCGAATGCTGACATAAGTAACGATAAAGCGGGTGAAAAGCCCGCTCGCCGGAAGACCAAGGGTTCCTGTCCAACGTTAATCGGGGCAGGGTGAGTCGACCCCTAAGGCGAGGCCGAAAGGCGTAGTCGATGGGAAACGGGTTAATATTCCCGTACTTGGTGTTACTGCGAAGGGGGGACGGAGAAGGCTATGTTGGCCGGGCGACGGTTGTCCCGGTTTAAGCGTGTAGGTGTGTGTTCCAGGTAAATCCGGTTCACTTTAACACTG\n>URS0000B7FAC1 rRNA from 1 species 
\nACCTACGGGGGGCAGCAGTGGGGAATATTGGGCAATGGAGGCAACTCTGACCCAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATTGTAAAACTCTTTAAGTGGGGACGAAGAAAGTGACTGTACCCACAGAATAAGCCTCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGAGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGACGGCTTGGCAAGCCAGATGTGAAAGGCTGGGGCTCAACCCCAGGACTGCATTTGGAACTGTCATGCTAGAGTGTCGGAGGG\n>URS00001F4C6B rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGGGGGTAGCAATACCTCAGTGGCGAACGGGTGCGTAACACGTGAAGAATTTGTCCAACGGCGGGGGAGTAGCCGGCCCAACGGCCGGGTAATACCGCGTACGCCCTTCGGGAGGCATCTCCTGATTGGGAAAGCCGCAAGGCGCCGATGGAGAACTTCGCGGCCTATCAGCTAGTTGGTGAGGTCATGGCTCACCAAGGCGACGACGGGTAGCTGGTCCGAGAGGATGACCAGCCACATTGGGACGTGAGACACGGCCC\n>URS000030270D rRNA from 1 species \nCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGGGCGCAGACGGTTACTTAAGCAGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCGTTCTGAGCTGGGTGACTAGAGTGTGTCAGAGGGAGGTAGAATTCCACGTGTAGCAGTGAAATGCGTAGAGATGTGGAGGAATACCGATGGCGAAGGCAGCCTCCTGGGATAACACTGACGTTCATGCCCGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCGATTAGCTGTTGGGCAGCTTGACTGCTTAGTAGCGAAGCTAACGCGTGAAATCGACCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGATGATGTGGATTAATTCGATACAACGCGAAGAACCTTACCTGGTCTTGACATGTACGGAACCCTCCAGAGACGGAGGGGTGCCTTCGGGAGCCGTAACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCATTAGTTGCCATCATTAAGTTGGGCACTCTAATGAGACTGCCGGTGACAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGACCAGGGCTTCACACGTCATACAATGGTCGGTACAGAGGGTAGCCAAGCCGCGAGGTGGAGCCAATCTCACAAAACCGATCGTAGTCCGGATTGCACTCTGCAACTCGAGTGCATGAAGTCGGAATCGCTAGTAATCGCAGGTCAGCATACTGCGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTGGGGGATACCAGAAGTAGGTAGGGTAACCGCAAGGAGCCCGCTTACCACGGTATGCTTCATGACTGGGGTGAAGTCGTAACAAGGTAGCCGT\n>URS0001E386D7 rRNA from 1 species 
\nATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGGCTGCAGGGTACTTGCTCCTTCTTTCGGCTGCCGACTGGTGGACGATGCCTAGGTATCTCCCTATTTGTTTTTGCTTACGTCCTAACGTGGGCGCTCTTACCCCATACGTCCTTACGACCTACGTGTGGAATCTTCGGACCTTCCGCTCTCGCATGATCCTATGTCGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCGTAACTGGTCTGAGAGGATGATCAGTCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGGGTGAAGAAGGTCTTCGGATTGTAAAGCACTTTAGGTTGGGAGGAAGAGCAGTAAGTTAATACCTTGCTGTTCTGACGGTACCAAAAGAATAAGCACCGGCTAACTTCGTG\n>URS0001DD23C1 misc_RNA from 1 species \nGATGAAGAAGTAGCGAAATGCGATAAGTAGTGTGAATTGCAGAATTCAGTGAATCATCGAATCTTTGAACGCACATTGCGCCCCTTGGTATTCCATGGGGCATGCCTGTTCGAGCGTCATTTGTACCTTCAAGCTCTGCTTGGTGTTGGGTGTTTGTCTCGCCTCTGCGTGTAGACTCGCCTCAAAATAATTGGCAGCCGGCGTATTGATTTCGGAGCGCAGTACATCTCGCGCTTTGCACTCATAACGACGACGTCCAAAAGTACATTTTTACACTCTTGACCTCGGATCAGGTAGGGATACCCGCTGAACTTAAGCATATCAATAAGCGGAGGA\n>URS000221B86E rRNA from 1 species \nTGATCCCGGCCCAGAATGAATGCTTGCGACAAGCCTAATACATGCAAGTCGAGCGCACTTTTAGAGTGAGCGGCGAACGGGTGAGTAATGCGTAAGAATCTACCTTCTACATAGCCATAAATAGGTAAAGGCCAAGTCCGGTAGAAGATGAGCTTGCGTAAGATTAGGTAGTTGGTGAGGTAAGAGCTCACCAAGCCAGAGATCTTTAGCTGGTCTGAGAGGTTGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATATTGGTCAATGGGCGAGAGCCTGAACCAGCCATGCCGCGTGCAGGATGACGGCCTTCTGGGTTGTAAACTGCTTTTATATGGGAAGAAAAAGGTCTTGCGAGACAAATTGCCGGTACCATATGAATAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTGTCCGGATTTATTGGGTTTAAAGGGTACGTAGGCGGATTTTTAAGTCCGTGGTGAAAGCCTACAGCTTAACTGTAGAACTGCCATGGATACTGGAAATCTTGAATTCAGTTGAGGTAAGCGGAATTTATGATGTAGCGGTGAAATGCATAGATATCATAAAGAACACCTATTGCGAAGGCAGCTTGCTGGACTTGAATTGACGCTGAGGTACGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGATTACTCGCTGCTAGCGATACACAGTTAGTGGCCAAGCGAAAGCGTTAAGTAATCCACCTGGGGAGTACGCTCGCAAGAGTGAAACTCAAAGGAATTGACGGGGGTCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCTGGGCTAGAATGTGAGCGCTAGATTTAGAGATAGATCGTTCTTCGGACGTGAAACAAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCCTATCCCTAGTTGCTAGCAGTTCGGCTGAGAACTCTAGGGAGACTGCCGGTGACAAACCGGAGGAAGGTGAGGAT
GACGTCAAATCAGCATGCCCCTTACATCTTGGGCGACTCACGTGCTACAATGGTCGGGACAAAGAGATGCTACCCTGCGAAGGCAAGCTAACCTCAAAAACCCGATCTCAGTTCGGATTGCAGGCTGCAACTCGCCTGCATGAAGTTGGAATCGCTAGTAATCGCAGGTCAGCCATACTGCGGTGAATACGTTCTCGGGTCTTGTACACACCGCCCGTCACACCATGGAAGTTGGTAATACCCGAAATCGCGCGTCTAACCTTCGGGAGGACAGTGCCTAAGGTAGGATCAGTGACTATGGTGAAGTCGTAACAAGGTAGCCGTACTGGAAGGTGTGGCTGGATTACCTCCT\n>URS00005DE4A8 rRNA from 1 species \nGGCCCGCGCAAGCGGTTGAGCAAGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACCCTTGACATCGTGCGAACTTTCCAGAGATGGATTGGTGCCTTCGGGAGCGCACAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCCTATTTGCCAGCGATTCGGTCGGGAACTTTAGGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTACGGGTAGGGCTACACACGTGCTACAATGGCCGGTACAATGGGTTGCAAAGCGGCGACGTGGAGCTAATCTCATAAAGCCGGTCTCAGTCCGGATCGGAGTCTGCAACTCGACTCCGTGAAGTCGGAATCGCTAGTAATCGTGCATCAGAATGGCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGACTGCACCAGAAGTGGTTAGCCTAACTTCGGAGGGCGATCACCATCGGTTGTACATATCT\n>URS00010C272E rRNA from 1 species \nTACGGAGGGTGCGAGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGCCTGCTAAGTCGAACGTGAAATCCCCGGGCTCAACCCGGGAACTGCGTCCGATACTGGCAGGCTTGAATCCGGGAGAGGGATGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCGGTGGCGAAGGCGGCATCCTGGACCGGCATTGACGCTGAGGCGCGAAAGCCAGGGGAGCAAACGGG\n>URS0001E10DE4 rRNA from 1 species \nGATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAACAGACGAGGAGCTTGCTCCTCTGACGTTAGCGGCGGACGGGTGAGTAACACGTGGATAACCTACCTATAAGACTGGGATAACTTCGGGAAACCGGAGCTAATACCGGATAATATATTGAACCGCATGGTTCAATAGTGAAAGACGGTTTTGCTGTCACTTATAGATGGATCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATATTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAGCTCTGTTATTAGGGAAGAACAAATGTGTAAGTAACTATGCCCGTCTTGACGGTACCTACTCAGAAAGCCACGGCTAACTACGTG\n>URS000163CC5A rRNA from 1 species 
\nCCTACGGGGGGCAGCAGTGAGGAATATTGGTCAATGGGCGGGAGCCTGAACCAGCCAAGTCGCGTGAGGGAAGACGGTCCTATGGATTGTAAACCTCTTTGGGCGGGGAGCAATGCCGGGCACGTGTGCCCGGAGGGAGAGTACCCGCAGAATAAGCATCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGATGCGAGCGTTATCCGGATTTATTGGGCGTAAAGCGCTCGTAGGCGGTATGTCAAGTCAAGGGTGAAAGCCCCGCGCTCAACGTGGGAACTGCCTTTGAAACTGGCAAACTTGAGTGTGTGAGAGGATAGTGGAATTCCAGGTGTAGGAGTGAAATGCGTAGATATCTGGAGGAACAGCAGTGGCGAAGGCGACTATCTGGCACATAACTGACGCTGAGGAGCGAAAGCGTGGGTAGCAAACAGGATTAGATACCCCAGTAGTC\n>URS0000FA15DB rRNA from 1 species \nGACGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAACGCAGTGGGGACGGGTGAGTAACACGTGGGTAACCTCCCATCAGAGGGGATAACACTTGGAAACAGGTGCTAAACCGATACTGATGGATGGACCCGCGGTGCATTAGCTAGTTGGTGAGGTAAAGGCCTACCAAGGCAAGGATGCATAGCCGACCTGAGAGGGTGATCTGCCACATTGGGACTGTGACACGGCCCAACCTCCTACGGTAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGCAAGCCTGACGGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAGCTCTGTTGTCAGAGAAGCGGTATCTTACCAGAAAGCCACGGCTAACTACGTGCCAGCAGCCGCGGTAATAC\n>URS0000AF79E1 sRNA from 1 species \nACCCGCTGAATTTAAGCATATTAATAAGCGGAGGAAAAGAAACTAACAAGGATTCCCTCAGTAATGGCGAATGAAGCGGGAATAGCTCAATTTTGGAATCTCCGCTTCGGCGGCGAATTGTAGTTAATAGAGGTGTTTTCTCAGGATGCGGTGTGGTTTCTAAGTCCCTTGGAACAGGGCATCATAGAGGGTGAGAATCCCGTATGTGGAACCGCACTTGTCCCTTCGATACACTTTCTACGAGTCGGGTTGTTTGGGAATGCAGCCCAAAATGGGTGGTAAATTTCATCTAAAGCTAAATATTGGCACGAGACCGATAGCGAACAAGTACCGTGAGGGAAAGATGAAAAGCACTTTGAAAAGAGAGTCAAACAGTACGTGAAACCGTTAAAAGGGAAACGATTGGAACTAGCAGTGACAGCATGTAATCAGTGGTTTGCTTGTGTTGTGATGGTTGTGTCTTTAAAAAAGCTCTTCTTGATCAGCCTTGTGGACTATGCACTTGCGTGTTTGTCGTGTCAATGTCAGTTTCTTCGGCGGGAGAAAACCGGGGAAAAGGTAGCTTGGTTCTTCCAAGTGTTACAGGTTCTCGGGTATATCGCCCTAGGGACTGAGGAGTGCGGGTCGTGCCTTTTGGCAAGGAAGCCTTTTGATGCCGGTGTATGTTTCTGCCCGACTGCTTGCAGTGGTGTGGTTGCATGCATGGTAATGCTTGGGGTTTTCCATTCACGTCCCTCAGATATTGACGAAATAGTTTCAACCGACCCGTCTTGTAACACGGACCAAGGAGTCTAACATGTATGCGAGTCTCTGGGTGTAAAACTCGTGGGCGCAATGAAAGTAAACGTAGGTGAGACGCTTCGGCTGCATCATCGACCGATTTGGATTTTTTATGAAAGATTTGAGTATGAGCATATATGTTGGGACCCGAAAGATGGTGAACTATGCCTGAATAGGGTGAAGTCAGAGGAAACTCTGATGGAAGCTCGTAGAGGTTCTGACGTGCAAATCGATCTTCAAATTTGGGTATAGGGGCGAAAGACTAATCGAACCATC
TAGTAGCTGGTTCCCACCGAAGTTTCCCTCAGGATAGCTGGAACTTGTTCAGTTTTATCAGGTAAAGCGAATGATTAGAGGCCTTGGGGTTGAAACAACCTCAACCTATTCTCAAACTTTAAATAGGTAAGAAGTCTGACTTGCTTAACTGAAGCCAGACGATCGAATGTTGAGTTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGAACGCGGAGTTAAGGTGCCAAAATCAACGCTCATCAGACCCCACAAAAGGTGTTGGTACATCCAGACAGCAGGAAGGTGACCATGGAAGTCGGGACCCTCTAAGGATCGTGTAACAACTCACCTGCCGAATGTATTAGCCCTGAAAATGGATGGCGCTAAAGCGTTGTACCTATACTCCGCCGTTGTGTTAATAACGATGACACAACGAGTAGGTGGGCGTAAAGGTTTTTGTTCTTTTTGAACTTTTGTGACGAAGCTTTTGATGTGAATCTGAGTTGAACGGCCTTTAGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGACTGAAGTGGAGAAAGGTTCCTTGTGAACAGCAGTTGGACAAGGGTTAGTCGATCCTAAAAGATAGGGTAATTCTGTTTGAAATGGCTTTCTTGTAAAGCACCTTATTGAAAGGGAATCAGGTTAATATTCCTGAACCGGAATGTGGATATTTCTCTCTTCGGAGGGAATGTGTGGTAACGCAACTAAACTCGGTGACGCTGGCAAGTATCCCGGGAAGAGTTCTCTTTTCTTTTTAACGATTGCATTGACCATGAAATCAGGTTAACTGGAGATATGGTTAAATCGCAACCAGGGCCACCTTCGGGTAGCCGACGGTAAAGCACTGCAATTTTTTCGCAGTGTCCGGTGCATTCTTGACAGCCCGTGAAAAACCGAGGGAAATAATAATTCTCACATCCGGTCGTACTCATAACCGCAGCAGGTCTCCAAGGTGAACAGCCTCTAGTTGATAGAAGAATGTAGGTAAGGGAAGTCGACAAAAAAGATCCGTAACTTCGGGATAAGGATTGGCTCTAAGGGTTGGGCATGTTGGGGCCATCTCCTTTTTGGATTTGCCTGAAGCTCGTTGATTAGCGGGCGTGGATGCGCTTTCGGGTGCGTTCTGCCTGCTCGATTGACCTGTTGAGGGTGGTGGCTGAGGGGGGGGGTTTTTTCTCCTCTTCTCAACTGGCATGTAATTAGCAACCGACTTAGAACTGGTACGGACAGGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGCCGGAAATGGTGTTGACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCATTGTCCCTATCTACTATCTAGCGAAACCGCAGCCAAGGGAACGGACTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAAAGACATTGGAGGTGTAGCATAGGTGGGAGCTTCGGCAAACTTGAAATACCACTACTCTGATCGTTTTTTTACTTATTTAATGAAGCGGGAAGCGAGTTTTCACCGACTCAATTTTTGGGATTTAAGCTCCCCCTTTTTGGGGGGGTGATCCGAGTTAAAGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTCAAAAGATAACGCAGGTGTCCTAAGGTGAGCTCAATGAGAACGGAAATCTCATGTAGAACAAAAGGGTAAAAGCTCACTTGATTTTGATTTTCAGTGTGAATACAAACTGTGAAAGCATGGCCTATCGATCCTTTAGTCCTTTTTTGAAATTTAAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCA
AGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACTAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGAGTATCTATGATATAGACCACAGTTGTTGCAATAGTAATCAAACTCAGTACGAGAGGAACCGTTTGTTCGGACAATTGGTATTTGCCCTTGGTTGAACAACCAATGGGGCGAAGCTACCATCCGTAGAATTATGACTGAACGCCTCTAAGTCAGAA\n>URS0001793305 rRNA from 1 species \nTACGTAGGGGGCGAGCGTTGTCCGGATTTATTGGGCGTAAAGCGCGCGTAGGCGGTTTGGCAAGTCTGATGTGAAAACCCGGGGCTCAACCCCGGGCGTGCATTCGATACGAGCAAACTAGAGTGTTGCAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCAACAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGG\n>URS0000082604 rRNA from 1 species \nGAGTTTGATCGTGGCTCAGGATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGAAGCACTTTACCACGATTCCTTCGGGATGACGGTTTAGTGACTGAGTGGCGGACGGGTGAGTAACGCGTGGGGAACCTGCCCCATACCGGGGGTAACAGCCGGAAACGGCTGCTAATACCGCATAAGCGCACAGTACCGCATGGTACGGTGTGAAAAACTCCGGTGGTATGGGATGGACCCGCGTCTGATTAGCCAGTTGGCGGGGTAACGGCCACCAAAGCGACGATCAGTAGCCGGCCTGAGAGGGCGACCGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCAACGCCGCGTGAGTGAGGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGGAAGAAGAAATGACGGTACCTGACTAAGAAGCCCCGGCTAACTACGTG\n>URS00023E414C lncRNA from 1 species \nCATGTTCACAATTTGGTAGCTGCTAGTTATTAGTCATTACATATAATATTTGAGATCAAAATATATTATTTTTTTAGGAAAAAAAAATCAAAGTATATGTAATGCAAGCTAGGAGGCCTAGCATGAGGTTCACTGTAATCTAGAGGAAGATTAAATTAACTAAGAAGGAATTAAACTAATTATAAAATAAAGAAAATATCAAACTCCAAAAATCTACGGGCA\n>URS000233A4B4 lncRNA from 1 species 
\nTGTTAACAAAAATAGAGTGGGGAATAGGGTTAGGCCATGACAGGCAATGATCCTAAGAGCTAGAGATCTCTCCCACCCCAACAGAGAGAGACAGAGAGACAGACAGAGAGAGAGAGAGGGAGACAGAGACAGAGAGAGAGACACACACAGAGAGAGAGAGACACACACGCACACACACAGAGAGAGAGAGACACACACACACACACACACAGAGAGACACAGAGAGAGAGAGAGACAGAGACAGAGACAGAGAGAGAGAACCCTAAGGTATTAATATTCCTGACTTGAATACCTCAGGCTTTTCCCAGCCAACTTCCACGTTGCTCTCCTATCCGTCTCCACACCTAATTCTTCTACCAAACCCTTCTGTCCACCCCAGGAGATTGTGAACTCAGGCACCAAATCCAACAAGCTCCCCGAGGAACTTACAACAGTCTGTTTTACAGAGAAGTAAATGTTGCTGAGAGAGAAAATTGTCAGGCCTCGGTGTTCCAGAGCAAGAGGCATTCCTTCATTCCCAGAGAGGCCCTGGGCCTCAGCAAGCAAGCCCGACAAGCCCTCCGCAGCCAGAATCCAAGCTTCAGGCTGCACCTCCCTCACCGCTGGGCCCTGGACAGTGAGGCTGCTGCTCAGAACCCCTCTCCTCAGAGGGAAATTCCTCAGGGCTGCCCCACCCGACCCGTTCTATCAGTCACTCAAGCCCTCTATCCTCTGTCACAGCCTGGCTCTGTCCCTTCCCATGCCCCAACCCCCAACCTCCCAGGACCCAGTATCTCAGGATTTCTGCCCTCCTCCAGCCCCGAGCAGCCTGGAAGCCAAGTGGCAAGGATGTAGTCAGCCGGGTGGGCCCTGAGAGCCGGTGGAATGGTGTCCATGTTGCAGGAAACAAGGGAAGGTGAGGGGTACAGGGGTGCCTGTGCCAGGCCACCACTCCACAGCTCATTCTTCTCTGAGGTTATTCCCCGACCCATACCCCTCTGGAGCCCACCCCAGCTGCTTCCTCTTCCTAGGGGTCTCCACCTGATGTTCTGTGAC\n>URS0001C069FB rRNA from 1 species \nATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGGATGAAGGGAGCTTGCTCCTGGATTCAGCGGCGGACGGGTGAGTAATGCCTAGGAATCTGCCTGGTAGTTGGGGATAACGTCCGTAAACGGGCGCTAATACCGCATACGTCCTGAGGGAGAAAGTGGGGGATCTTCGGACCTCACGCTATCAGATGAGCCTAGGTCGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCGTAACTGGTCTGAGAGGATGATCAGTCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGTGCGAAGAAGGTCTTCGGATTGTAAAGCACTTTAAGTTGGGAGGAAGGGCAGTAAGTTAATACCTTGCTGTTTTGACGTTACCAACAGAATAAGCACCGGCTAACTTCGTG\n>URS0000ECE6B7 rRNA from 1 species 
\nGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACTCTTGACATCCAGAGAACTTTCCAGAGATGGATTGGTGCCTTCGGGAACTCTGAGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCCAGCGGTTAGGCCGGGAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGAGTAGGGCTACACACGTGCTACAATGGCGCATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGACCTCATAAAGTGCGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTAGATCAGAATGCTACGGTGAATACGTTCCCGGGCCTT\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/uniprot_all__subsampled_1000.fasta",
    "content": ">tr|A0A3A3JCS5|A0A3A3JCS5_SALMO Octaprenyl diphosphate synthase OS=Salmonella montevideo OX=115981 GN=ispB PE=3 SV=1\nMNLEKINELTAQDMAGVNATILEQLNSDVQLINQLGYYIISGGGKRIRPMIAVLAARAVGYQGNAHVTIAALIEFIHTATLLHDDVVDESDMRRGKATANAAFGNAASVLVGDFIYTRAFQMMTSLGSLKVLEVMSEAVNVIAEGEVLQLMNVNDPDITEENYMRVIYSKTARLFEAAAQCSGILAGCTPEQEKGLQDYGRYLGTAFQLIDDLLDYSADGEHLGKNVGDDLNEGKPTLPLLHAMRHGTPEQSAMIRTAIEQGNGRHLLEPVLEAMTTCGSLEWTRQRAEEEADKAISALQILPDTPWREALIGLAHIAVQRDR\n>tr|K8XEW0|K8XEW0_RHOOP LexA repressor OS=Rhodococcus opacus M213 OX=1129896 GN=lexA PE=3 SV=1\nMKDDSSTDGSTPRVSGGSAAGLTDRQRRVLEVIRTSVNERGYPPSIREIGDAVGLTSTSSVAHQLRTLERKGFLRRDPNRPRAVDVRGLDEVAAGVAANASASAAVGLAAVKSGADGAPLPEPTFVPVLGRIAAGGPILAEEAVEDVFPLPRELVGQGSLFLLKVVGESMIDAAICDGDWVVVRQQNVAENGDIVAAMIDGDATVKTFKRTENEVWLMPHNPLFDPIPGNDAVILGKVVTVMRKI\n>tr|A0A0P0EB71|A0A0P0EB71_9MICO 2Fe-2S ferredoxin-type domain-containing protein OS=Microbacterium sp. No. 7 OX=1714373 GN=AOA12_02545 PE=3 SV=1\nMPRVTYIQPDGASSEVEASRGDSVMSAAIAAGVPGIVADCRGGLTCATCHVFVDEEWLERVGEKEPEEEEMLELTAVPATECSRLSCQIVLVDELDGLVVTVPEEQE\n>tr|A0A212KYF3|A0A212KYF3_9DELT Uncharacterized protein OS=uncultured Desulfovibrio sp. 
OX=167968 GN=KL86DES1_10311 PE=4 SV=1\nMNFPFIPKIVAFARQHTLALAAAVLVLIVFVVSFSGWRYYQYRQSSQYAYEILRDALKTGDTETIAELVDFNSLSRGLAKDLAQNYPFLKAGADQERQIGDMIQTALLKQSRTKQEPVKDEPDLKIRLKTALYALPPDFLAQLASSLSLQPPNDGTALLTAKVRHPLLDKNFLLILRMDQTPTGWRVRQLVNSPELVRQFREAQVERMTAQRQMILDKNAATEKRMKELFPLQPCSASAGLISDGSTLLVVVHVLARDIGTVSVNNMNLFTELSSATGELLLTRYLNAVQPTHPGEDFERNWTIELDGNSELGRRVLNGQPLQCKGAWKTLGLDNGEVLHISEAPAPIEEFQ\n>tr|A0A5H1ZRJ3|A0A5H1ZRJ3_DANRE Transmembrane channel-like protein (Fragment) OS=Danio rerio OX=7955 GN=tmc2b PE=3 SV=1\nXSSSSDNNSDDESMSEGEMARLKEEVEEKKKLIATLRNKPWRMKRRLKCLKEAQEFVEKFEGALGKGKGRRLYAFKVMMTKKLIKFNRDFENFKTACIPWESRIKEVESHFGSSVASYFIFLRWMYGLNLVLFGFMFGLVVIPELLMGIPYGSIPRKTVPREEQDSAMDFSVLFEFGGYCKYSILFYGFYNNQRTIGFLQFRLPLSYLLVGVGIFGYSLMVVIRTMARNANEGGDGGDEGNFTFCWKLFTSWDYLIGNPETADNKFASTTTSFKESIVDEQENLKDENIHLRRFLRLLANVLILCCLAGSGYLIYAVVKRSQDFAKRDRNELTWLQKNEVEIVMSLLGLVCPPLFEAIAELEDYHPRIALKWQLGRIFALFLGNLYTFLFALFDEVNGKLENEKQIKNQTVWALKEYYANYTLQYNITENIPPPNIAPADVIRGPCWETEVGIEFVKLTVSDIQVTYLTILIGDFLRALIVRFLNYCWCWDLEAGFPSYAEFDISGNVLGLIFNQGMIWMGAFYAPGLVGINVLRLLSSMYYQCWAVMACNVPHERVFKASRSNNFYMGLLLLVLFLSLMPVIYSIMTLPPSFDCGPFSGKDKMYDVITETIDKDLPPFMADIFSYASNPGLIISVVLLMVLAIYYLNAVSKAYQNSNLELKRKMQMQRDEEKNRRNNKDSTNQVMKDLEDLLPNKSLIPPPSVEETEKPAEQPSKSSKVTGKPGAAASGKGVHVQKDVSLAAANPRAPVTRAPGPRQPGPLPGNPRGPPPGQGMGRGRGGPPPRR\n>tr|A0A1H1BTM6|A0A1H1BTM6_9GAMM Short chain dehydrogenase OS=Pseudoxanthomonas sp. 
CF125 OX=1855303 GN=SAMN05216569_1554 PE=4 SV=1\nMTADPNLDQTLQLLEAIAADRTVLDMWPEEERVRLHKAIASIYHPEPKLRRKKTKELERERHAEKLRRADALLDQTGIRALRRAPVFTTPNYFPPAGFVAQDNVEERPEPLESPELRHCYVCKKKYTQVHHFYDQMCPECAEFNFAKRTELADLSGRVALLTGGRVKIGYQAGLKLLRAGAHLIVTTRFARDSAARYAQEPDFEQWGHRLEVFGLDLRHTPSVEAFCRELSAKYPRLDFIINNACQTVRRPPEFYAHMMEAETAALRDTPEHVRKLLGSYEGLRSHDLLPEASALQVAIKQGFPEVAGLTHAAELSQVPLLAEELLGQKHLFPEGRLDQDLQQVDLRGRNSWRLQMAEVPSVELLEVQLVNAIAPFLINARLKPLMLRTPERDKHIVNVSAVEGQFYRNFKTTRHPHTNMAKAALNMMTRTAAADYHGDGIHMNSVDTGWVTDEDPVELAARKTVQERFHPPLDIVDGAARIVDPIIHGINTGEHVWGQFLKDYRPTDW\n>tr|A0A217EZB4|A0A217EZB4_9SPHN Uncharacterized protein OS=Croceicoccus marinus OX=450378 GN=A9D14_19100 PE=4 SV=1\nMAAPLALAACGSGDDTEMMDDTAMAEGQMADGQMPMDGGDMSMMGSDSAMQTASAEGTVTAIDADAGTITVDHGAVPAIEWPAMTMAFEADEELRQDVAVGDTISFDFTTDESGNAITSITKK\n>tr|A0A1C5RVT8|A0A1C5RVT8_9CLOT Uncharacterized protein OS=uncultured Clostridium sp. OX=59620 GN=SAMEA3545292_01435 PE=4 SV=1\nMSGLYTITLNGVSEEVYNKAADYIQAHALRLNYRPEVSTIDCEFPDDLDPAKAPELSEAVIRKVHQQL\n>tr|A0A2M7MVT7|A0A2M7MVT7_9PROT Uncharacterized protein OS=Hydrogenophilales bacterium CG_4_10_14_3_um_filter_63_21 OX=1974028 GN=COZ24_06435 PE=4 SV=1\nMRTWLDLNGLCARKREQGEHPRPFWTLMKRYLPQNYRWNIVHEDDSLIIAGIEHGLHGHLGPNGARGNPKNLRSVGKANTGHTHSAGITEGVYTAGVFGQLDMGYNKGLSSWSHSFILTYENGKRTICTIRDGRAWR\n>tr|A0A1H5Q8D7|A0A1H5Q8D7_9PSEU Transcriptional regulator, LacI family OS=Amycolatopsis pretoriensis OX=218821 GN=SAMN05421837_101914 PE=4 SV=1\nMTTKSDDPEPCASRVTIARIAAETGVSVPTVSKVLNGRPDVAESTRARVEAVIGKYGYRRRADERSRRSRLLELMFHELESTWALEIIRGVEYVARENGMAVVLAESSGRHTPGQSWLESVLARRPVGIVSVCSDFTGGQLAKLRARDIPLVVVDPAGAPGPETPSIGATNWQGGLTATRHLVELGHRRIAMIGGPDGVLCSRARIDGYRTALETAGLAFDPALVRRGDFHVRSGYRELASLLTLPDRPTAVFAGSDLQALGVYEAARDAGLRIPDDLSVVGFDDLPVARWLTPELTTIRQPLQEMAAAGARLAISLARGTHPESHRLELATSLVVRQSTAAPARRAVPAGRG\n>tr|A0A1I0W1D7|A0A1I0W1D7_9ACTN NAD-dependent protein deacetylase, SIR2 family OS=Nocardioides alpinus OX=748909 GN=SAMN05192575_101623 PE=4 
SV=1\nMTLAPTDRVESALDLLTTRPLVVLTGAGLSTDSGIPDYRGPGSTARAPMTYQEFVGSAEAQQRYWARSHLGWQRMGRALPNDGHRALAALDPVLLITQNVDGLHEAAGSRHLVALHGRVADVICLSCRTTSSRDDLEQRLDDLNPGWLEQHGWVESRPDGDVDLDDTSDFVVPTCACGGPIKPDVVFFGENVPADRVARCYAAVESLGPDGALLVAGSSLTVMSGLRFVKRAAQGGTPIVIVNRGATRGDPLASYTLDVGCSEFLTRLAELAG\n>tr|A0A4W2HU19|A0A4W2HU19_BOBOX Ubiquitin conjugating enzyme E2 L3 OS=Bos indicus x Bos taurus OX=30522 GN=UBE2L3 PE=3 SV=1\nEGAEARGDARPQQVALLPQLFDLLVLGQQRARLLRQVPRALVGQGLAKLQARAALSGHRRAHGPQELEEIRKCGMKNFRNIQVDEANLLTWQGLIVPDNPPYDKGAFRIEINFPAEYPFKPPKITFKTKIYHPNIDEKGQVCLPVISAENWKPATKTDQVIQSLIALVNDPQPEHPLRADLAEEYSKDRKKFCKNAEEFTKKYGEKRPVD\n>tr|H2DDU6|H2DDU6_9BACT Exported protein KikA OS=uncultured bacterium OX=77133 GN=kikA PE=4 SV=1\nMNRKMTVVSASLVGALSLFSQTAKADDWGCQVLLCLSDPRGPTTESECKPPIHKLWDHLRKGKPFPSCAMATNSRTGKRSYAQLVYDPYDPCPDGTKPAGGYIAQSQSADRKDWRRLQYAFSTHGRRYDSGGAWNMYEGNGPRACVGNHLGSYSVYRGNDDSNISVQVYDQVVWQQPQNPRAIDVFIDEAFHHRVRY\n>tr|A0A7D7KQY5|A0A7D7KQY5_9MAGN Maturase K OS=Neolitsea pallens OX=344110 GN=matK PE=3 SV=1\nMEELQGYLEMDGFRQQYFLYPFLFQEYIYALAHGHALNGSILYEPVENLDHDNKSSSLIVKRLITRMHQQNRLIISVNDSNQNRFVGHNNHFDSQMISEGFAVVVEIPFSLRLVSSLEEKEIAKSHNLRSIHSIFPFFEDKLSHLNRVSDILIPHPIHLEILVQTLHSWIQDTPSLHLLRFSLYEYWNSNSLITPKNAISLFSKENQRFFLFLSNSHVYECEFIFIFLRKQPFHLRSKSFGSFLERTHFYAKIEYLVVVLCNDFQKTLWLFKDSFMHYVRYQGKSILASRGARLLIKKWKSHFVNFWQCHFDLWSQPARIHIKQLYNHPFHFLGYLSSVRLNSSVIRSQMLENSFRIDTAIKKFETVVPIIPLIGSLAKAKFCNVSGHPISKPFRADLSDSEILNRFGRICRNLSHYHSGSSKKQSLYRIKYILRLSCARTLSRKHKSTIRAFLKRLGSEFLEEFFTEEEQALSLIFPTTSSPSHRSHRERVWYLDIIRINDLVSHL\n>tr|A0A839YFJ7|A0A839YFJ7_9SPHN Glutamyl-tRNA synthetase OS=Sphingomonas sp. 
BK580 OX=2586972 GN=FHY05_001379 PE=4 SV=1\nMSATEINERAVVTRFAPSPTGFLHLGGARTALFNLLFARHHGGTFRLRIEDTDRARSTQPAIEAILNGMRWLGLDWDGEEVYQFARADRHAAVAHRMIEAGHAYRCYLTSEELDAMRAAAQAAKQPLRIRSPWRDRTDWPADQSYVVRLRAPTEGATTIHDRVQGEVTVQNAELDDLVLLRSDGTPTYMLAVVVDDHDMGVTHVIRGDDHLNNAFRQLPIYRAMDAIEGGWPDPVYAHIPLIHGSDGAKLSKRHGAVGIEAYRDEMGILPEALDNYLLRLGWGHGDEEIIAREDAVRWFDLDAVGKSPSRFDLKKLEHLNGHYIRASDDSRLADLVAEKLGLDRDDTRRAVLAAAMPALKPRAANLNELADGTAFLFATRPLVIDTEAAPLLAGEAPALLARLHAALDAVHNWDTETIEAAVRQVADAAGVKLGQVAQPLRAALTGRRTSPGIFDVLVLLGRDESLARIADHQA\n>tr|A0A1B3Z9R2|A0A1B3Z9R2_9SPHN Uncharacterized protein OS=Sphingomonas panacis OX=1560345 GN=AWL63_09520 PE=4 SV=1\nMFDRCNDKALTVVSMCDDVPPAPERRSDARNLSILKAAILRTALGEELCLVRNISRGGLMAHIFSELEVGDPVKIEFRSSKIVRGRVVWRRPELMGVRFSQFIDIGEILTDPKPQPSHAARAPRVTVNVPARLRSGGRYQAAALGNISQGGARIYLSEPDRLGDDVVLSVAGLPVLTGSVRWRDDTAAGIAFSELLAFEDVGRWVSSHNIGVPPQLVE\n>tr|A0A7V8Z0K8|A0A7V8Z0K8_9BACT 2,3-bisphosphoglycerate-dependent phosphoglycerate mutase OS=Blastocatellia bacterium OX=2052146 GN=gpmA PE=3 SV=1\nMHKLVLIRHGESEWNKENRFTGWKDVDLSEKGREEAQAAGKLLKAEGFTFDESYTSVLKRAIRTLWIILDELDLMWIPETKSWLLNERHYGALQGLNKAETAAQYGEEQVQIWRRSFDIPPSIMEETDERHLGKDPRYCEIEAGKFPGSECLKDTVARVIPYFETAILPKVKDGKRIIVAAHGNSLRALVKYLDGISDTEIVNLNIPTGIPLIYELDDDIKPIKSYYLGDNEAIRKAQEAIANQGKAK\n>tr|A0A3C0TX47|A0A3C0TX47_9PROT Ribosomal-protein-alanine N-acetyltransferase (Fragment) OS=Alphaproteobacteria bacterium OX=1913988 GN=DCO82_10580 PE=4 SV=1\nVATHNEAAISLYKRQGFIAAGLRKAYYAPEPGQSTSTDALIMRCNL\n>tr|A0A1M3DHD8|A0A1M3DHD8_9SPHN DUF4142 domain-containing protein OS=Sphingomonas sp. 
67-36 OX=1895849 GN=BGO24_13795 PE=4 SV=1\nMKLAAMTMTAAALALTACGHKETTTTMTTDNTVVATNDIAAVPTPSGGQSFANTAAASDAFEIATSKLALDKSGSAAVKKFAQKMIDAHTGSTARLKAIAAGAVPAITPDPTLTAGQQATVDSLKNLTGPDFDKAYAAAQVDGHQKTLDALKAYAATGDVPAFKDFATNLVPTVTAHLNMAKSLKP\n>tr|A0A661FLP6|A0A661FLP6_9GAMM ThiF domain-containing protein OS=Gammaproteobacteria bacterium OX=1913989 GN=DRR11_20880 PE=4 SV=1\nMTTDYTARFARQITLPQIGTVGQQRLADSHALIIGLGGLGSAASLYVANSGVGRLTINDFDRVDITNLPRQILFTEQDIDEFKTTATAKRLQQINPGIQIDEINQRLTEAALHEAVAASDIVLDCTDNFVTRGAINRACYAAQRPLITGAAIRFEGQLAVFRHDVPRGRHLPDNPCYNCLYTEEDENLEGCAGQGILAPVVGTIGCMMATEAIKLLAGIESLLNGKLWIYDALSVTTKTVRINARVDCPVCGVKA\n>tr|A0A225NGS3|A0A225NGS3_9RHOB PMT_2 domain-containing protein OS=Marinibacterium profundimaris OX=1679460 GN=ATO3_21925 PE=4 SV=1\nMRLGVLAVLALTLYRVVLLAFASADLFVDEAQYWAWGQNLEFGYYSKPPLIGWVIRAFTEVAGSDAPFWIRLPGPLFHGAAALVVLATARRLWGDVAGAATGIAYASMPGVALGALLISTDTILLPFFALALFFWLKLTERSSAGVALAMGAAVGLGMMAKYAAIYFVLGALFSVIFVRGARISWRDAALAALAFLVVFAPNILWNLQNGLTTVSHTADNVDWINDPSTRLRLNFSGLAEFFGGQFGVMGPVFFAAYLVVVARKIVTGDWPARWLIWMSLPIILLVCVQAILSRAYANWAAPAYVAAVILTAPWLFDRARRIYCAALGINLALSLALPLAAVFATSWTLNDRLVLGRYVGRAEASARILSTAREAGLTDVVATSRDLLADLFHAAKGTGIAPWSVPFEGHVPHYYAQRFPYPTGQSAPALYADFADVPPLCAPGTEVTELTRWDIPGGAYRGRTLVAWRVGPGCWTD\n>tr|A0A0E3SH12|A0A0E3SH12_9EURY Uncharacterized protein OS=Methanosarcina horonobensis HB-1 = JCM 15518 OX=1434110 GN=MSHOH_2470 PE=4 SV=1\nMIMNEHKTLWEKYFLNFRNVASPLRKPALFDWLYNSYRCLYLSCVDPSLVSRLTDLKTCLSMIGVAVDDSCDYALLREKNGGDKFSYEILSMLYNTDKIESGDYILLDAHLTNNMYIKTTIGIYSDLVRNQIASLPRYCDFRGEFLLAMRNVAESMEFSYLLNKNKIVYPFSHVVRSRAASTMIETHSLLDLMSSKNFDTSELGKAIVLFKLADIVAMLSNTINTWTREITERDYSCPVISLALEKKLIKFSDFERASTENLKEKLSPVSEVIEDELDKAILSMKEFAENSEIKSFDTSKFVNNYVNLYWQTDAMN\n>tr|A0A6P1BJ03|A0A6P1BJ03_9BRAD Isoprenylcysteine carboxylmethyltransferase family protein OS=Bradyrhizobium uaiense OX=2594946 GN=FNJ47_21045 PE=4 
SV=1\nMNETSNPPRINLRRAAFTFVGLGTLLFLAAGTMRWAGAWVFLLEITIGGLITEAWLARHDPGLLAERRTARGQAGWDRIITSIMPLLWLTWLPLMALDAVRYQTSFIPVWLQCTGALMIAASFYIAYRTYRENSYAAPVVKIQRERGHTAVTTGPYAYVRHPIYAGGLLTYLGTPLLLGSWYGLAIVPVMAALLGLRSMMEERMLTAELDGYADYIARVRYRLVPMVW\n>tr|A0A7X6LY41|A0A7X6LY41_9NOCA Respiratory nitrate reductase subunit gamma OS=Nocardia veterana OX=132249 GN=narI PE=4 SV=1\nMTSTVWATLPYIAFTSFVLGHLWRYRNDQFGWTTRSSQIYESRLLRLGSPLFHFGMLGVIGGHVLGVLIPQSWTDAVGISEHLYHVIAVAAGSVAGVAVIAGIAILAYRRLRVPAVRKATTRNDVFMYVLLAAALITGLLNTVGSNLLWGTYNYRETVSPWFRSLFTAHPQPDLMVGTPWTFQAHGLIVLTLIAVWPYTRLVHMFSAPVGYLVRPYVVYRSKPVDTANKRKYARAWQTPVLPR\n>tr|A0A508XB42|A0A508XB42_9HYPH Diguanylate cyclase OS=Sinorhizobium medicae OX=110321 GN=EMEDMD4_790360 PE=4 SV=1\nMELQESAIYAGPPIASPEVRSQLLRPAVMAEVERLLGGRTRDIRLKGELGRLFEERSWSRTAKIIRAWMIWVTLLDVLTLGLNAILLPNAVALSMLPPACILPPAALATAFIWRKPRGVGLQRVSLVAGLFLILLSVALVGVSAGGEFYERHLNIMLFVAITAIIIFSIPLAWTVAVASFALALYLIFQLRNPMLDTGSAVAGTLFFTSGIVATVVARRTMTILAQKTFLLELRDKRRVAELADANARLERLAKTDPLTGIANRRWMMETLNRLWGAGAERPAGTAMLMCDIDDFKSLNDRLGHAEGDRCLVKVAGIIQSSVRRNRDHVARYGGEEFLVVLPGADVQAALATAERIRASVEAASLPNPASRVAPYVTLSIGVAAQGAAGEIIEPEKLQNQADTALYLAKQAGRNRVVLFRPE\n>tr|A0A820L477|A0A820L477_9BILA Hypothetical protein (Fragment) OS=Adineta steineri OX=433720 GN=OKA104_LOCUS48766 PE=4 SV=1\nVAYGGTTMHGIRHYCQFPFIYQGKQYTNCISDKPPHATPDQTVFDPWCSLTHNHDIDDQWGFCDIGVTDSTIYSICQNQLQTIQCSPGYVIDILTADYATKQDGTNSCNYNKNDCFQSDASTIENLCSGKTSCTVYHYAKTLVSCQNRLSTYLQIDYTCVPNDIETIMTYDICNNDSKPSGDIRRGFLISPNFPNVKNNINCIYDLHILKPHQD\n>tr|A0A841MMF6|A0A841MMF6_9CAUL Two-component system response regulator FixJ OS=Caulobacter sp. 
YL-Caulobacter OX=2723104 GN=HDO15_004474 PE=4 SV=1\nMSDAAPIGAQVVHVVDDDESARESLAFLLESADFEVAAYASAPAFLDALADARPGVIITDVRMPEMSGQELVARLGALKVKMPIVMITGHGDIPMAVEAMRSGVVDFIEKPFSESRMLDALGRAFKSVEAAPASNDQTAILKRIETLSERERQVLDGVVAGHANKVIARELGISPRTVEIYRAKLMTKMQADNLAALVRMTLSARGE\n>tr|A0A1E2YF14|A0A1E2YF14_PARBR GTP-binding protein rho2 OS=Paracoccidioides brasiliensis OX=121759 GN=GX48_00269 PE=4 SV=1\nMAQQQLQQLQTENVMRRYVDGKHLWSWKLVIIGDGACGKTSLLSVFTLGYFPTHYVPTVFENYVTDCRVDGRSVQLALWDTAGQEDYERLRPLAYSKAHVLLIAFAVDTPDSLENVRNKWIEEANERCPDVPIILVGLKKDLREDPLAIEEMRKKSLRFVSSKEGHDTAAQVGARKYLECSSLTGEGVDDVFEAATRAALLTFEKDRGSCCVIL\n>tr|A0A6N9C681|A0A6N9C681_9BACT FRG domain-containing protein OS=Candidatus Poribacteria bacterium OX=2026781 GN=F4X33_06180 PE=4 SV=1\nMNTQNSTDLQDYYLNGLNKIINEIMEKSADGNYIYRGEPKCYPTIASQLYLNRYAESNQRLTPIDVAQAFEIVMASNYLDSEAEKEFFPIASELRHYGSPVNYLDFTTDYNIALYFACAKHFACAKLGEDGHGKDGRIVLLQRNKETKEKYQIKPVQDPPNRAKAQKSVFVEPPDGFILSNDKDVKTVCIPKELKQWILIHLHRFQCISYQTLYHDIYGYIAQKDLRASAEEKHKSHEGTERWHIAQIEHSPYSVRYYYDLACYYGKDMYKYDCAIETFSKAILLKPDSVFAHINRGISYARNNILDRAIQDFVKVIPMLFKFPFSDALFLVYKSLGQVYDIRGDCHSAIEYYQKAQQLRFDDPVVAAYLDKSKRPQLSKLEYYVR\n>tr|A0A1H0ZCM6|A0A1H0ZCM6_9MICO DNA-binding transcriptional regulator, LysR family OS=Leucobacter chromiiresistens OX=1079994 GN=SAMN04488565_1638 PE=3 SV=1\nMNLEQLRGFVEIAQLGNFTRAAERLHLAQPSLSRQIAALETDLGVELLHRVRGHVAATPAGERLLPIARRMLADAETARHEMSDLAELRGGRIRLGATPTLCTSLVADVLAEFRARYPGIEIEILERGSRSLISALMEGALDLALIVTSVSSGAARAVLEREQILSERLVVVSDPNRPDPFAPEGAEARDPGRPVDLEELARVPQVLFPENYDLRATVDAAFRARGLTPLVAVAGAEMDAALSFARRGIGVAVVPAMVAADRPALRTAPLADDALARTVSVARRADMAPTRAGAALQAVIREIADRVTAPGAELSSLVTRVGEPAPLRSAAPPPA\n>tr|A0A1G6ZFJ8|A0A1G6ZFJ8_9BACL Uncharacterized beta-barrel protein YwiB, DUF1934 family OS=Paenibacillus sp. 
CF095 OX=1881033 GN=SAMN05428987_0174 PE=4 SV=1\nMSNMRPVHIRLHSRYEGEDVLQEMQGEAVLKGSVLYVRYEEPQVGPEGGTTRTTLKLGGQSIKIIRHGEVESEQTFELNRKLPGFYRSPYMSFALSTHTQKLELSIQGLSARAAWSYDFYRFDEESGHFAISLHIQEEPIS\n>tr|A0A654FXQ0|A0A654FXQ0_ARATH (thale cress) hypothetical protein OS=Arabidopsis thaliana OX=3702 GN=AN1_LOCUS20985 PE=4 SV=1\nMETPGASHDSFRGSPRRNSILSASNIIQAPISTLLEYSGLFRARPSPSHEAETLVSDDSSGLSNGEVAIRIIGNTEQDAETDTNALREPGHSELLGSSATQVDPMGGASEGASQAAPGDPAAGDAASRDSPYQRYDIQQAARWIEQILPFSLLLLVVFIRQHLQGFFVAIWIAAVMFKSNDILKKQTALKGERHISALIGISVAFTAHVVGVYWWFRKDDLLYPLIMLPPKSIPPFWHAIFIIVVNDTLVRQASMIFKCFLLMYYKNSRGRNYRKQGQLLTLVEYFMLLYRSLLPTPVWYRFFLNKDYGSLFSSLMTGLYLTFKLTSVVEKVQSFFTALKALSRKEVHYGSYATTEQVNAAGDLCAICQEKMHTPILLRCKHMFCEDCVSEWFERERTCPLCRALVKPADLKSFGDGSTSLFFQIF\n>tr|A0A7K9WNV0|A0A7K9WNV0_9PASS DMXL2 protein (Fragment) OS=Rhipidura dahli OX=667186 GN=Dmxl2 PE=4 SV=1\nLTGAQDGSVRMFEWTRPQQLVCFRQAGNARVTRMYFNAQGNKCGVADGEGFLSIWQVNQTTSNPKPYLSWQCHSKTTSDFAFITSSSLVATSGQSNDNRNVCLWDTLVSSGNSLIHAFTCHDHGATVLQYAPKHQLLISGGRKGYICIFDIRQRQILFTFQAHESAVKALALDPSEDYFVTGSAE\n>tr|A0A7Y9UAN0|A0A7Y9UAN0_9CELL YCII domain-containing protein OS=Cellulomonas hominis OX=156981 GN=GGD73_001711 PE=3 SV=1\nMPSLWHERPEEPPVGHDAGMPIFAVRYTYDARTDLQDAIRPEHRAYLQGVAERGELLGSGPFPEGPAGALLVFRTADRDALDAVLTADPFALAGVIAETEVRTWNLVLGPWAEHPAG\n>tr|A0A660XH96|A0A660XH96_9BACT TonB_dep_Rec domain-containing protein (Fragment) OS=Candidatus Marinimicrobia bacterium OX=2026760 GN=DRP89_06950 PE=4 
SV=1\nAETFKSPELGDIEHRQLLAVIPGLSIRSYGGPAGITTLSLDGGPSSQTKVIVSGFDLTNAQNGEMDLSQLPGPFVENVSYIPQDENFYGSGSNESTIHLNPWSGKSGLSLSTGSYGHSSIHGTLNLHKNQWIGNFLIGKRHDDGNYPFKWRNESFKRENNYFDQKFISAQFNTVIQKRAFLRFLYLLSNQSRGIAGQSWNPSKNANRDDKLQIIGVKFGWTNKKGHGYIQTMYRYSWENYKNPMIAVNSFHRLSTWQFILNQEKKINEKIGVNLLFETKKDGLKSKDTNNHYRISYSTAITVPYFLSKTFKFQPAYCYDISPNLYYEHSYVLKLLTSLNFLFIKSLTIHQGRYFRYPTFNDLYWIPGGNPNLKPEHTDNVSLDINCHLIQDSDLEILLFYKSSDDLIQWTPISSYWQPKNIQHAVRKGYKIIYRWNSQNIPLEAFVHYSSNRTKDLSQGNCYGKPLRYAPEQTAAVGINWQPEPLSFHLQIHHTSERISMYSWPEDVILSEATLIFTSCAYTWKRPSGDIIIVFAMDNLTDKRYETIKGYPEPGRTFRMTISYQH\n>tr|A0A2U0ZQI9|A0A2U0ZQI9_9BACT ATP synthase subunit beta OS=Filimonas sp. YR581 OX=2135469 GN=atpD PE=3 SV=1\nMSNKGKIKQVIGAVVDVHFENDHSLPEIYNALEITRPSGEKLVLEVQQHLGEDSVRTIAMDGTEGLVRGMEVIDTGKAIAMPTGPGINGRLFNVTGDPIDGLPALSKTTSRPIHALPPKFEDLSTATEVLFTGIKVIDLIEPYAKGGKIGLFGGAGVGKTVLIQELINNIAKGHGGLSVFAGVGERTREGNDLLREMIEAGIMKYGDKFIHSMEEGGWDLSSVDMEGLKESKATFVFGQMNEPPGARARVALSGLTIAEYFRDGDGTGKGKDILFFVDNIFRFTQAGSEVSALLGRMPSAVGYQPTLATEMGLMQERITSTKSGSITSVQAVYVPADDLTDPAPATTFAHLDATTVLSRKIADLGIYPAVDPLDSTSRILTPAVVGEKHYNTADRVKLILQRYKELQDIIAILGMDELSEEDKQIVSRARKVQRFLSQPFHVAEQFTGLKGVFVSIDDTIRGFNAIMDGEVDEYPEAAFNLVGTLEEAIEKGKKLLAQAQG\n>tr|A0A231W898|A0A231W898_9BACI 2-dehydro-3-deoxygluconokinase OS=Bacillus sp. 
OG2 OX=1979526 GN=B9K06_14550 PE=4 SV=1\nMDVITIGETMVLFTPQTTGLMRYANQFSMTFGGAESNVAIGLTRLGHKAGWISKVGNDEFGKAMLSFISGEGVDTTQVLIDSEAPTGVYFKEPRRANDVRVYYYRKDSAASRLEPGDINEEYLSNANYLHLTGITPALSDNCRELVYEAVAMAKKHGVQVVFDPNLRKKLWPEDQARKVLLDLASKAAIVLPGIAEGEFMFGEKDPVKLGRLFLALGPAVVVLKLGEEGCMVFTKDLQAKVPGFPVDRVIDPVGAGDGFAAGFLSGMLDGLSLEDAATRANAVGAFVTMVDGDVEGLPEKDEILGMLENKFDDVSR\n>tr|A0A0B7HH50|A0A0B7HH50_9FLAO Tetratricopeptide repeat protein OS=Capnocytophaga cynodegmi OX=28189 GN=CCYN74_100115 PE=4 SV=1\nMTKKYLLIFIIVALILTILAFVFLPKKDSYSKIEKVDIVTNQGYAGSHSCKECHEQEYAEWELSDHFKAMQHADDKTVLGDFNDVTYTADGITSRFFKKNGKFYINTEDENGKYRDFEIVFTFGHYPLQQYLTKFGGGKMQVFRQSWDSRENKWFHQYAGEKIPPGDYLHWTNAGQNWNLMCSTCHSTNLQKNYNPLKDTYKTTYDELTVGCESCHGPGKKHNDFMRSSDYQKGISKNFFITLGVNTPQKTELNTCMPCHARRGEVTQHHTASDEIMDNYIPEIPITNIYFADGQALDEVYKYGSFLQSKMYHVSIKCTNCHLPHSGKLRMQGNQLCLQCHTPNYATSAHTFHKENTEASDCKSCHMPTRTYMGNDIRHDHNFAVPRPDLSEKYGVPNACNACHNDKSAKWASQAVEKWYGKERRPHFAENLIIGSLQNEKSLERLNELLTNSATPDIIRATAVHYLGGIYTEQSLQLVKKELNNSDAQTRYRAVIALGNFPIHLYENELISLLSDKVKAVRIATAYVFLSQKGWEQSKLLTSFESARKEYETFVLSQADFPVGSATAADYFTHLGDTDKAILFYERAIKKDKTLNHVRLNLATLYNGKGQNDKAWQILHQAQNYAPENAQVYYFMALLSSEEKDYNQAKKYFEKAMQLGMNNENIQRNYQSVIQIINKKN\n>tr|W2ZLA7|W2ZLA7_PHYPR Uncharacterized protein OS=Phytophthora parasitica P10297 OX=1317064 GN=F442_06838 PE=4 SV=1\nMQTRASIFAQHIPALHHVSSTLYRSQSAAVAASSPLSRVTSDRPAIRQQSRPDGDNG\n>tr|A0A1F9MIM0|A0A1F9MIM0_9DELT Metallophos domain-containing protein OS=Deltaproteobacteria bacterium RIFOXYA12_FULL_61_11 OX=1797896 GN=A2284_00320 PE=4 
SV=1\nMVPTAADLVPFSIVLVPDTQYYTSKQGNGEENTYWKQMRWIRDHRETENILMAVHLGDITGSNEPEQWEIASAAHRILDQADLPYSVVPGNHDYLGKSSASFRSRTFFDSHFPASRFSGRAWFGGSLGSSNVNNYTLFENGAQKFLVLSLEYAPRKDTLCLAEDLLARHPDRRVIVATHCYLTKGGAYAEGCPNPDYGTVGAAGETVWDEFVSRYSSIFLVVSGHVNESAHAPRTGNAGNTVQQLVVDYQAEAACNAKSPDQCNDHCKAGTYTGNGWLRQLVFDPAVGQVQARTFSVEDGNTSVFPGGHPVLFCSELNKQGNDDYPSDPLAPDHAFSFTYEPLWTKPFVREDLGRRSFLDRTVNSVGEGQQERPAVAMAENGDFVAVWEDDSSKADGAGNRDIFLRGFLAGGCQKFPAQVINGNQNGQQRHPAVAVDRDGRAVVVWEDDTDGNGVFQVKARGFHADGSERLPVFTVNSEASGQQRNPAIGMSSDGRFVVAWEDVAGGNGAQILVRGFNADGSPLFPDRSGHTDTAGQHLEPTVALDASGAFVVAWQDDTDGNGYYQIHARGFDSAGKERFPKIVVNSVDTGQQYRPSLSLDQAGHFVVVWEDDQDKDGNSNLLARGFNADGTARFSDFAVVAGAGTHAAPSLAAGTDGSFVVAWQDDGDGNGTSQIHAKAFRADGSEWQARWTVNLQSAGQQLSPSVALAGKTLVVAWQDDLDGNEVYQILARGVDLP\n>tr|A0A1S7RCV2|A0A1S7RCV2_9HYPH Uncharacterized protein OS=Agrobacterium sp. NCPPB 925 OX=1631629 GN=AGR6A_Cc80407 PE=4 SV=1\nMSAEPVDTNDAYRPIMETVSTMVSSIDLSTRLTATRLALKAIKQQDDSSADQSSSTRTALLSSYGIDSSSSTNTRLAQLLAQYGEASGDDTQTEGTDTQPSSGDITKADFMKGLKGMLEELSKDPDKASQANAMLEALKAGTLTVSDPAEGARIKAWDVASDTETASKPSTEITTTGWSDFLKEHLKRDGSIYAKGASGAYVDTISGDNAFFGSVGSRYYYLTWPQAKNGTLTV\n>tr|A0A5X5WLM0|A0A5X5WLM0_SALET Diol dehydratase reactivase subunit alpha OS=Salmonella enterica subsp. 
enterica serovar Corvallis OX=593905 GN=pduG PE=4 SV=1\nMRYIAGIDIGNSSTEVALARQDETGALTITHSALAETTGIKGTLRNVFGIQEALALVAKRAGINVSDISLIRINEATPVIGDVAMETITETIITESTMIGHNPKTPGGVGLGVGITITPEELLTRPADSSYILVVSSAFDFADIANVINASMRAGYQITGVILQRDDGVLVSNRLEKSLPIVDEVLYIDRIPLGMLAAIEVAVPGKVIETLSNPYGIATVFNLNADETKNIVPMARALIGNRSAVVVKTPSGDVKARAIPAGNLELQAQGRTVRVDVAAGAEAIMKAVDGCGKLDNVTGEAGTNIGGMLEHVRQTMAELTNKPSSEIFIQDLLAVDTSVPVSVTGGLAGEFSLEQAVGIASMVKSDRLQMAMIAREIEQKLNIDVQIGGAEAEAAILGALTTPGTTRPLAILDLGAGSTDASIINPKGEIIATHLAGAGDMVTMIIARELGLEDRYLAEEIKKYPLAKVESLFHLRHEDGSVQFFPTPLPPTVFARVCVVKPDELVPLPGDLALEKVRAIRRSAKERVFVTNALRALRQVSPTGNIRDIPFVVLVGGSSLDFEVPQLVTDALAHYRLVAGRGNIRGSEGPRNAVATGLILSWHKEFAYGQ\n>tr|A0A4S1A4Z3|A0A4S1A4Z3_9BACT LPS biosynthesis choline kinase OS=bacterium M00.F.Ca.ET.156.01.1.1 OX=2563902 GN=EN799_28860 PE=4 SV=1\nMTDDLRAALATVPVLAGYDGPLERLGGLTNMVYRAGDVCLRIPGKGTEEYINRANEAVAAREAAKAGVSPEVLYADPETGRMATRFIAGAETMSPEKFKTRKGSAARAGEAFRKLHRSGAVFPFRFELFAMIDDYLKVLSTKDVALPAGYHDVVREAGSVRAALDAHPIELAACHCDPLCENFLDTGERMWIVDWEYSGMNDPLWDLGDLSVEGKFNEAQDEELMRAYFGGEARPAERGRVVIYKAMCDLLWTLWGLIQLANDNPVDDFRAYADGRFARCKMLMETAEFSGHLAAVRLG\n>tr|A0A5B8NLP5|A0A5B8NLP5_9CHRO 50S ribosomal protein L35 OS=Euhalothece natronophila Z-M001 OX=522448 GN=rpmI PE=3 SV=1\nMPKLKTNRAAAKRFRATGRGKIRRRKAFKNHLLEPKKTSRKRRLSKLTFVNERDAEKVEQMLPYMK\n>tr|A0A098VY33|A0A098VY33_9MICR ATP-dependent Clp protease proteolytic subunit OS=Mitosporidium daphniae OX=1485682 GN=DI09_143p40 PE=3 SV=1\nMQLIKAPVYTIAMGMAASMGSFLLAAGAPGHRKALPNSRIMVHQPSGGATGPAADIEIAAKEILRLRTLLNEIYARHTGQSLSTIERALDRDRYMTPEEAAGFGLIDGVLNATPSRQIL\n>tr|T2IPC9|T2IPC9_CROWT Transposase OS=Crocosphaera watsonii WH 0005 OX=423472 GN=CWATWH0005_4898 PE=3 
SV=1\nMGLCVVQIAKVLNLNYCYRIYPDSSQEKELLDWLEICRGVYNYALRERKEWINSRKCKVNACSLHSEYIIPADQPFPDYYKQKKALTQAKKEYPSLKRVQSQVLQQVMGRLDKAFNFFWKRSFGFPRFKKYGQYRSINFPQFKENPITGYQIKLPKIGSVRINLHRPIPDGFVVKQVQIVKKASGWYAVICIQSDVKVPSPQPQGKSLGIDLGLEKFIATSQQELIARPRFFVELQSKLQWLQRRLSKKQKGSKNWHKAREKVARLHEHIYNTRKNFHYQVAHHLCDQANIIFAEDLNLKAMSRGMLCKHTLDAGFGGFLEILKHVAWKRDVYFEKVDANLTSQTCPNCGMVTGKKDLSQRVHECSNCGFITDRDVAAAMIVEQRGLAALGLGVKLPVEDEVIGDVRKKSSRASRRSRKAS\n>tr|A0A1G1DFT8|A0A1G1DFT8_9BACT Uncharacterized protein OS=Nitrospinae bacterium RIFCSPLOWO2_01_FULL_39_10 OX=1801683 GN=A2889_02485 PE=4 SV=1\nMVAVRRKLLTAQKMRKIYRRVKSVCLSVCLSVCLCKVDTILFIPHPPPSPQPSPRGRGREGQGEREYQ\n>tr|A0A524FY20|A0A524FY20_THOAR Response regulator OS=Thorarchaeota archaeon (strain OWC) OX=2053491 GN=EU527_15255 PE=4 SV=1\nMALEDAGFDVVAEAEDTENLLIQCQGNRPAVVIIDFNMDQIEIVRLIEHLLDIDPIVAIVVISDIADGQTEMVLAAGARAFLQKPFSMYDMTDIVRKVKPVY\n>tr|A0A853UB48|A0A853UB48_9MICO Uncharacterized protein OS=Dermabacter sp. HMSC06F07 OX=1581125 GN=HMPREF3157_09225 PE=4 SV=1\nMRGVSAKSLQSVLRRAAESTSANTPSTEIASELFEAVRVIDSSNQLVRLLSDPGRDEDLKADVVRRLFGGRVSEAALEVLLEASRCTWSEQNHLLEGIEFAGVSLVLDKARGRGTAHAVEEELFQVARLVEDTPELSEAFDSKRDDVPARVGIIERLLGGKVDEATVALAAQAVSFEPEAKVPARLLEFANFASAERDRRSGVVTSAIALSPEQQERLTRILSARYGGELSLNYEIDPSVIGGLRITIGDDLYDATIFGRVRDARERISA\n>tr|M0J625|M0J625_HALVA Uncharacterized protein OS=Haloarcula vallismortis ATCC 29715 OX=662477 GN=C437_14607 PE=4 SV=1\nMSATEETVRVWLVERTYSDDEQNLIILTYATPDGDQYFRKERALTSFSDVRETTAAVDADPDNLGSVDDPDLQAQYAAEATRMAEKHDPDDAI\n>tr|A0A2W5SS74|A0A2W5SS74_STANO Uracil-DNA glycosylase OS=Starkeya novella OX=921 GN=DI549_11565 PE=4 SV=1\nMASPSETLDDVLAAIRACRVCVEHPLGRPLPHEPRPVLHMGTRARILIAGQAPGTKVHGSGLSFNDRSGDRLRDWLGVDRETFYDGDSIAVAAMGFCFPGQDAKGGDLPPRRECARLWHDRLFAARPPFDLVVAVGATSQAYHLKRLGLERFATGGLTERVMRWREIWAASNQTRVLPLPHPSWRNTGWLKRHPWFEAELLPVLRQEVARIVGSAREGREPREPA\n>tr|A0A3G8GEA2|A0A3G8GEA2_9BURK Acylphosphatase OS=Pigmentiphaga sp. 
H8 OX=2488560 GN=EGT29_00430 PE=3 SV=1\nMQELDSTAPLETVLVRVTGRVQGVGFRLATVRRAHLVGVGGWVRNNEDGSVEALVQGTPDQVDQMLEWMRQGPPQARVDDLASERQFIDRRFARFEQQ\n>tr|W9AG96|W9AG96_9BACI Glutamate racemase OS=Oceanobacillus picturae OX=171693 GN=racE PE=3 SV=1\nMEQAIGVIDSGVGGLTVAYELMRQLPKEKLIYLGDTARCPYGPRSEEEVKKFTWELVDFLLEKNIKMLVVACNTATAFTLQELQEKLDIPVIGVIQPGARAAIKFTRNNNIGVIGTEGTIRSEAYTKALESIHSSIKVNALACPLFVPMVEQGILTGKKAQEVVESSLSPLMEGEMDTLILGCTHYPLLKQTIQNVMGEQVTVISSSEETARETSTILDVHNIIKTGDVIPVHEFYTTGELEIFIEIAKSIFKDPYLQMVTIKKAQLGQTQKT\n>tr|A0A5D2YB87|A0A5D2YB87_GOSMU HIT domain-containing protein OS=Gossypium mustelinum OX=34275 GN=E1A91_A08G187300v1 PE=4 SV=1\nMARAISPCIFCQIAGSSNSTPLLHSVRSLDDKVVAFKDINPSAFRHYLVVPVEHIPTVNDLQRRNEDYTLVSHMINVGETLLRRDAPQSNQYRFGFHQPPFNSVDHLHLHCFALPFIPRWKQLKYMSLGPLGGFIEAEKLLEKIKPLSPIPP\n>tr|A0A1L8DSH3|A0A1L8DSH3_9DIPT Putative ubiquitin carboxyl-terminal hydrolase 46 OS=Nyssomyia neivai OX=330878 PE=4 SV=1\nMGANISQLERDIGSDQFPPNEHYFGLVNFGNTCYSNSVLQALYFCRPFREKVLEYKAKNKRTKETLLSCLADLFYSIATQKKKVGSIAPKKFIARLRKEKEEFDNYMQQDAHEFLNFLINHINEIILAERNIKGKITTGNTETPPEPTWVHEIFQGILTSETRCLNCETVSSKDENFFDLQVDVDQNTSITHCLKCFSNTETLCSDNKFKCDNCCSYQEAQKRMRVKKLPMILALHLKRFKYMEQYNRHIKVSHRVVFPLELRLFNTSDDALNPDRLYDLMAVVIHCGSGPNRGHYISIVKSHGFWLLFDDDMVDVYIFLNCARKKN\n>tr|A0A428EVY3|A0A428EVY3_STRIT Uncharacterized protein OS=Streptococcus intermedius OX=1338 GN=D8829_03240 PE=4 SV=1\nMTKRYNINKIFESIITSRTRETFEVTESLIELGKIVGTRPVAFKQLYKAYRSLETSFSYTPVIGAPISCRFDYDKEEATLAYLDLSADLSLADFTDFMGVIDSVYSSIYPIGTVVELDLDLLPPHLHRLFTDGPGALVTITGRKLPVRGKFGEYIVDYLARLWPFGELPGVAPIYVNNMMIRQVHQEGLRNDWEDEFTEDILRSNQLSAQLVSTAFMRKEDNAVYVQELLKEATHELSH\n>tr|A0A436AXU5|A0A436AXU5_9HYPH Antibiotic biosynthesis monooxygenase (Fragment) OS=Mesorhizobium sp. 
M7A.F.Ca.CA.001.08.1.1 OX=2496691 GN=EN913_26470 PE=4 SV=1\nMSGFVVWVDFRLKPGARGRFRELVDANATASVRREAGCRRFDVTQARGEP\n>tr|A0A4Q2S8K2|A0A4Q2S8K2_9ACTN Maleylpyruvate isomerase family mycothiol-dependent enzyme OS=Nocardioides glacieisoli OX=1168730 GN=EUA06_04035 PE=4 SV=1\nMTRLPSETYLDHLRTESARFREVLTACDPAARVPSCPDWSAADLLWHLATVQRWWAEVVAARPTRPEEVDPPRPESYDELLATFDEWSAELARVLEAADPAEEAWNWSDDHTVGFILRRQAHEALIHRVDAELAAGDRTDLEPLLASDGVHECLAVMYGGCPPWGRWEPGEDLVRVDVTDTGEEFWVRFGIFSGTDPESGTTYADEEDFHVVDAPEDDAVEPDVVVDGTAAALDLWLWSRSDDEELSVVGDEAVLDRFRAIVGSPIN\n>tr|A0A2W5D315|A0A2W5D315_9PSED Recombination protein RecR OS=Pseudomonas kuykendallii OX=1007099 GN=recR PE=3 SV=1\nMSFSPLIRQLIDALRILPGVGQKTAQRMALQMLERDRSGALRLAHALNEAMERVGHCKRCRTLCEEELCPQCADPNRDDSLLCVVQAPMDVFAVDQTGFRGRYFVLKGHLSPLDGLGPEAIGVPELLARIAEGAFSEVILATNPTVEGEATAHYIAQLLIPKGLSVSRIAHGVPLGGELDLVDGGTLAHAFNGRKAITL\n>tr|A0A4P6U3H2|A0A4P6U3H2_STRSO Catalase OS=Streptomyces seoulensis OX=73044 GN=D0Z67_28970 PE=3 SV=1\nMTDIPRTTTDSGAPVESDEHSLTVGPAGPILLQDAYLIEQMAQFNRERIPERQPHAKGSGAFGHFEVTGDVTPYTKAAVFQPGTRTDLVARFSTVAGERGSPDTWRDPRGFAVKFYTSEGNYDMVGNNTPVFFVKDPMKFQHFIRSQKRRADNNLRDHDMQWDFWTLSPESAHQVTWLMGDRGVPRTWRHMNGYTSHTYMWINEAGEEFWVKYHFKTDQGIEFFTQDEADQMASADTDYHTRDLFEHIRDGEHPSWTLYVQIMPYADAAEYRFNPFDLTKVWPHGDYPLIEVGKMTLDRNPTDNHAEIEQLAFQPNNFVPGIGPSPDRMLLARLFSYADAHRYRIGANYAQLPVNAPITDVHTYSKDGAMAYRKTSDPVYAPNSKGGPAADTAEFGKPPTWHTDGDITRTAYATHAEDDDWGQAGALVREVLDDDARDRLVDNVVGHLLNGVTEPVLERAFEYWTNIDPKIGARIAEGVRAKADAKDPKAADQGNPARSSMQHKA\n>tr|A0A2U3P8A5|A0A2U3P8A5_9MYCO Endonuclease III OS=Mycobacterium numidiamassiliense OX=1841861 GN=nth PE=3 SV=1\nMNRTLAQAFPDAHCELDFRTPLELTVATILSAQSTDKRVNLTTPALFVRYTSALDYAQADRAELEELIRPTGFFRNKASSLIGLGQALVERFGGEVPSTMDELVTLPGVGRKTANVVLGNAFGIPGITVDTHFGRLVRRWRWTEDEDPVKVEHAVGELIERKEWTLLSHRVIFHGRRVCHSRKPACGVCLLAKDCPSYGLGPTDPLLAAPLVQGPETEHLLALAGL\n>tr|A0A3S5CJ78|A0A3S5CJ78_9PLAT Uncharacterized protein OS=Protopolystoma xenopodis OX=117903 GN=PXEA_LOCUS6098 PE=4 
SV=1\nMLNQYYKIKKKSESVHEDSRRKNRELLERHNADLRLFDSESTRLGINTDALLGANTVSELIPPGASHLNNLARHFSAMQSVVIDTSSTSSSCGSTGRAAPTASGETNSSGRLVFANRNSMIVLNAGNTAHMSGHHVSMSESDSPGQNQR\n>tr|A0A1V2VH64|A0A1V2VH64_9BURK Aliphatic amidase OS=Herbaspirillum sp. VT-16-41 OX=1953765 GN=amiE PE=3 SV=1\nMRHGDISSSKDAVGVAVVNYKMPRLHTRGEVLENARKIAAMLVGMKQGLPGLDLVVFPEYSTHGIMYDRDEMFETAATIPGEETAIFSEACRIAGVWGVFSLTGERHEEHPRKVPYNTLILINDQGEIVQKYRKIMPWTPIEGWYPGDTTYVCDGPKGLKVSLIICDDGNYPEIWRDCAMKGAELVVRCQGYMYPAKEQQIMVSKAMAWMNNLYVAVANAAGFDGVYSYFGHSAIVGFDGRTLGECGTEEMGIQYAELSIGAIRDARRNWQSQNHLYKLLHRGYTGKINSGESPAGVAECPFDFYRTWVNDPQAARAQVEALTRNSAGTPECPMPGIPTEPAA\n>tr|A0A370VY99|A0A370VY99_9ACTN ABC transporter ATP-binding protein OS=Streptomyces sp. M7 OX=255705 GN=DWC19_11045 PE=4 SV=1\nMIGVAPPAYDPAAPTTAHTLPVGAPATVRAYVAELFRRHRRAFLLLVLVNTVAVVASMVGPWLLGGLVERVSDGAAGRDLRLELTVGLFVAALLVQAAFVRQVRLRGAMLGERMLADLREDFLVRSVGLPPGVLERAGTGDLLSRITTDIDRLANAMREAVPQLAIGVVWAALLLGGLVATAPPLAAAVLVAVPLLVAGCRWYFRRAPSAYRSEAAGYAAVAAALTETVDAGRTVEAHRLGERRIEQSDLRIKQWTAWERYTLWLRSVLFPVINVTHVTVLSSVLLIGGVFVLQGWIGVGQLTTGALIAQMLVDPVGLILRWYDELQVAQVSLARLVGVRDIEPDAGDARLTPDGRDVHADRVHFGYREGVDVLCKVSLEVAPGTRLALVGPSGAGKSTLGRLLAGIYAPRDGRVTLGGAELSRMPAERVRAHVALVNQEHHVFVGSLRDNLLLARTGAGDAELWEALRAVDADTWARALDEGLDTEVGSGGFALTPAQAQQIALARLVLADPHTLVLDEATSLLDPRAARHLERSLARVLDGRTVVAIAHRLHTAHDADLIAVVENGRVSELGSHTELVAADGAYAALWRSWHG\n>tr|A0A150FR67|A0A150FR67_CLOPD Uncharacterized protein OS=[Clostridium] paradoxum JW-YL-7 = DSM 7308 OX=1121328 GN=JWYL7_1169 PE=4 SV=1\nMGRLERTLEKKKNKKAKRVGYCIFILIIFMLILGVNIVDYRINTFMGNYNRALILRVYDFTKGLSLLQR\n>tr|A0A7G6UKH5|A0A7G6UKH5_PSEMX Uncharacterized protein OS=Pseudoxanthomonas mexicana OX=128785 GN=H4W19_14390 PE=4 SV=1\nMAVRYYISLPDPARARGGDPAFSFDAHGADEFAAQLQHALRTSSLFERWRARQDDPDDVDPGLGAVDPDAAVAGQQDDLSILLVARSSIPGHVLKHRLRLLAGRAWELRDVAAA\n>tr|A0A4Y8KC96|A0A4Y8KC96_9MICO Triosephosphate isomerase OS=Cryobacterium sp. 
Hb1 OX=1259147 GN=tpiA PE=3 SV=1\nMNINPRRTPLIAGNWKMNLDHLQAIAFVQKLAWNLKDAGHDTAAVEVAVFPPFTDLRSVQTLISADKLPLAFGAQDVSAHDSGAYTGEISGAFLAQLECQYVIIGHSERRTLHNESDEQVAAKVTAALKHNLVPLICVGESAEDLAVHGPSAVPVAQLRAALAGVTNAVDIVVAYEPVWAIGSGQAATPEQAEQVAAALRGVLSDTLGQDVADKTRILYGGSVKSTNIAAFMREPNVDGALVGGASLDIAEFSSIIRYQKHVGL\n>tr|A0A328IIY1|A0A328IIY1_9MOLU Thymidylate kinase OS=Candidatus Phytoplasma oryzae OX=203274 GN=tmk PE=3 SV=1\nMKFIAFEGLDGSGKTTQINLLKVVLTKEYRKKVTVIQGLGSSIIGPMLREMFLYQTKITPFTRMWLSFANMEQTQTEIIQPALENNHIILADRWIASTYAYQVFGHYLDIPLKKFHKLHCSFFFQPAITFYFDIKPAIGLIRKQQKLDYEPDLFEKKGIAYFEQVKRGYDYFFKKDFLVKNYNADIPKSILFKKVITFLKEKKIIEFRI\n>tr|A0A502MPE9|A0A502MPE9_9HYPH 4-hydroxybenzoate octaprenyltransferase OS=Mesorhizobium sp. B4-1-3 OX=2589889 GN=ubiA PE=3 SV=1\nMETVQSKVIQGRVADAPSGHWVYRVLPRWVWPYAQLARWDRPIGWQLLLWPCWWSAALAAGAYPRPTDPLLTLLPAPWYLLLFFIGAVAMRGAGCTYNDLADEDIDNQVERTRSRPLPAGKVTRRQAWAFVIIQALVGLAVLLQFNSFAIPLGIASLAIVAVYPFMKRITNWPQFVLGLAFSWGALMGWAVEFGDIDDPAIMLYIGSILWVIGYDTIYAHQDKEDDAIVGVRSTARLFGDNTKMWLTGLYGGALICFAIAFASAQAPIVALAGLIAAGAHMARQIIRLDINNPDQCLKLFKSNNQVGWLIFLGLIGGSVWIWLKPLV\n>tr|A0A3S1L2A4|A0A3S1L2A4_9HYPH Flagellar biosynthetic protein FlhB OS=Mesorhizobium sp. 
M1E.F.Ca.ET.063.01.1.1 OX=2496750 GN=flhB PE=3 SV=1\nMAEAVDKDSKTEEATEKKIRDTIEQGKLPHSRETAIFASFLAILVFAVFYAKDAVVDLGMFLSTFLEKPEAWPMDTETDVITLYEQVLIEIGRAVVSLLVLLVVAGIGASVFQNMPQLVGERIRPQLSRISIAKGWSRLFGVQGFVEFGKSLAKLAFAIAVLAFTLSEDHRRLLAGMITNPVSFGMVIRGIFVDILVSIVFVMGLIAVADIVWSRFHWRRDLRMTKQEVKDELKQSEGDPIVKSRLRSLARDRARQRMMTAVPRATLVIANPTHYSIALKYVREEDSAPVVLAKGQDLVALKIREIAREHNIPIFEDVALARSMYKQVSVDSVIPSQFYQAVAELVRIVYSKKAVRRVPS\n>tr|A0A6P7RXF0|A0A6P7RXF0_MUSCR Pendrin OS=Mus caroli OX=10089 GN=Slc26a4 PE=3 SV=1\nMAGRGGRSEPPQLAEYSCSYAVSRPVYSELAFQQQRERRLPERRTLRDSLARSCSCSRKRAFGVVKALLPILDWLPKYRVKEWLLSDIISGVSTGLVGTLQGMAYALLAAVPVQFGLYSAFFPILTYFVFGTSRHISVGPFPVVSLMVGSVVLSMAPDDHFLVPSGNGSALNSTTLDTGTRDAARVLLASTLTLLVGIIQLVFGGLQIGFIVRYLADPLVGGFTTAAAFQVLVSQLKIVLNVSTKNYNGILSIIYTLIEIFQNIGDTNIADFIAGLLTIIVCMAVKELNDRFKHRIPVPIPIEVIVTIIATAISYGANLEKNYNAGIVKSIPSGFLPPVLPSVGLFSDMLAASFSIAVVAYAIAVSVGKVYATKHDYVIDGNQESTGGKTQVAGLISAVIVMVAIVALGKLLEPLQKSVLAAVVIANLKGMFMQVCDVPRLWKQNKTDAVIWVFTCIMSIILGLDLGLLAGLLFALLTVVLRVQFPSWNGLGSVPSTDIYKSITHYKNLEEPEGVKILRFSSPIFYGNVDGFKKCVNSTVGFDAIRVYNKRLKALRRIQKLIKKGQLRATKNGIISDVGSSNNAFEPDEDVEEPEELNIPTKEIEIQVDWNSELPVKVNVPKVPIHSLVLDCGAVSFLDVVGVRSLRMIVKEFQRIDVNVYFALLQDDVLEKMEQCGFFDDNIRKDRFFLTVHDAILHLQNQVKSREGQDSLLETITLIQDCKDPLELMEAEMKEEELDVQDEAMRRLAS\n>tr|A0A1I3Q7I7|A0A1I3Q7I7_9DELT tRNA uridine 5-carboxymethylaminomethyl modification enzyme MnmG OS=Desulfomicrobium apsheronum OX=52560 GN=mnmG PE=3 
SV=1\nMTIPTVPDIFDVIVVGAGHAGCEAAMAAAHMGMQTLLLTINADRIGHLSCNPAIGGLAKGHMVKEIDALGGMMGKWADQAGIQFRILNTRKGPAVRSSRAQIDRTEYVRVVQQDIFTCPNLFVRQETVASLTVEDGRVTGVVTTLGETIACRAALLTTGTFLQGLIHVGLDSFSGGRQGDPASHGLSPRLTELGFELGRLKTGTVPRLLKSSIDYSVMEEQAGDNPPRPFSFDSPGIKLRQLPCFVTYTTERTHEIIRTGFDRSPMFTGVIKGTGARYCPSIEDKIARFPEKDRHQIFVEPEGLTSHEVYPNGIPTSLPLDIQKALVTSIPGLEKAQIIRPGYAIEYDYVPPTQLKPTLETKLVRGLYMAGQINGTSGYEEAAGQGLWAAINAVLALRGEPELILTRSQAYIAVLVDDLVTKGTLEPYRMFTSRAEHRLLLREDNADERLTAIGRELGLVDDSRWQRFTRKQAAVNEIMTGLESIRVRPDAATKDLVEAMGGTIPQKSVSLKELLRQPELTIEVLAPLWPELENFDEEALEEAEIKAKYEGYLRRQQELVDRFEKMEQTALPEDMNYVGIPGLSREVTEKLTRIQPRTLGQAGRISGITPAALSCLEIQLKKIGRL\n>tr|R6KI73|R6KI73_9CLOT Type I restriction-modification system S subunit EcoA family protein OS=Clostridium sp. CAG:265 OX=1262787 GN=BN573_01150 PE=4 SV=1\nMKKVRDKYKMTELGEIPSEWHIEVLGECSNVTKLAGFEFTEYIEYIDDGEIIALRALNLKNGKLNLEDIKKIDKKVSESLTRSKLYINDVLFSYVGTVGEVALIEENDKFHLAPNVAKLTFNDSVVPKFALQYLMSSNMRNEINRYVTTTSQPALSMENIRKLKIIVPKKEEQEKISFILSTVDEQIDNVDALIEKNKELKKGLMQTLFTKGIGHTKFKNTEIGEIPEEWDVKKIGDICEVKGGKRLPKGYQLEDEDNAFPYIRVADMYMGGIRQDDIKYVPKDIVDKIKNYKISKDDLFISVAGTLGIVGQVPYELDGANLTENADKLCNIQINKLYLMKVLQSNIVQSIIEAEQTKSAQPKLALTRIKEFLIPVPSDIEQVKIASILMEVDEKIGQYKNKKQKLEELKKGLMQQLLTGMIRVTV\n>tr|A0A669D541|A0A669D541_ORENI Uncharacterized protein OS=Oreochromis niloticus OX=8128 GN=miga1 PE=3 SV=1\nVSVCCTQVMRAPNSENIHTVLRIRELPSHGQSVTMTHETLTSSQLSMRTAALRMVDLPLSVYSSLTQVRIVSTDTKKLVVATAFGAVSLLFLARRFQRRKGRKKVHPQHWEQAGLEFHPPAAGENDNTSQNITLSLNSKNGYSSDLVLSAGGYRKLSGSVMSLASVKSLNSSSSSTCANDSTCWDGVEDADSCSVLNLPVTTPENLYLMGMDLFEEALRRWEEALTFRSRQAEDDASCASVKTGAGDTIAEQSMEDVISAEFIHRLKALLHRAYRLQEEFEGVLGMSEPSSHMADILSREELDDACLRDSISIASTDSFVSAAEMSEHRELRSVFTLGHHPLYEEAHGNLYSVVIVPLTEMLECLGDLDFLAKLHCVRQAWQLILCDRTTWTFLADTGKKILSSIIVKAHKSPKRFEEVFEEMISFLEHTEHWENTELELATRGVKHLNFYDIVLDFILMDSFEDLENPPISIQNVINNRWLNSSFKETAVASSCWSVLKQKRQHMKVSDGFIAHFYSVCEQISPVLAWGFLGPKGSLHDLCCFFKDQVLHFLKDIFDLDKVRYCSVESLADDVLQLLHRRSELLLAYLGADSLRYLNGCNSPPVQLVPSALLEARVQ\n>sp|A3CWV2|FEN_METMJ Flap endonuclease 1 
OS=Methanoculleus marisnigri (strain ATCC 35101 / DSM 1498 / JR1) OX=368407 GN=fen PE=3 SV=1\nMGVAIRDILADCKETLTWDDLSGIAALDAHNALYQFLSIIRQPDGTPLMNGAGRITSHLSGILFRTVNFLEKGIRPVFVFDGKPPEFKQETINERREHRARADEAWKTALREGDMEEAYKQASASARIDSHTIASSRELLDLLGIPWVQAPSEGEAQAAYMARQGKVTYAVSQDYDSLLFGSPVLVRNLTVSGRRKTRGRTITVNPERIVLSSFLDRLGVTREQLVKIGILVGTDFNPGIRGVGGKTALKIVRNGEFESVIAEKQPDFNPAPIRDFFLNPPVTDDYTLEWRTPDVEGVVEMLCGRYDFSEERVRSALAKVSVKATQKTLDAWF\n>tr|A0A3S4B8B4|A0A3S4B8B4_9ACTN MBL fold metallo-hydrolase OS=Streptomyces albidoflavus OX=1886 GN=EQK42_07550 PE=4 SV=1\nMRFIKKRHSCVRLEKESGTLVIDPGGFTEPDAALGADVLLVTHEHPDHFDEGRLRAALEASPAAQLWTLASVAEPMAAAFPGRVHTVGHGDTFTAAGFGIEVHGELHAVIHPDIPRVTNVGYLVDGEVFHPGDALTVPDRPVETLLLPVMAPWNKLSEVVDYVREVRPTRAYDIHDALLTDLALPVYERQIGALAGTDHHHLGPGTFTEV\n>tr|A0A5J4FE44|A0A5J4FE44_MICAE Uncharacterized protein OS=Microcystis aeruginosa NIES-4325 OX=2569534 GN=MiAbW_03334 PE=4 SV=1\nMYQMNKTAIDQWLKGVGAFLFQNFGVHLFIENQNNLKKA\n>tr|A0A5E7AN68|A0A5E7AN68_PSEFL Glyco_trans_2-like domain-containing protein OS=Pseudomonas fluorescens OX=294 GN=PS720_01060 PE=4 SV=1\nMASRKFGLNLVIVLAIAALFSGFWALINRPVTAPNWPEQISGFSYSPFQQGQYPQKDQYPTDDQMRRDLEIMSKLTDNIRTYSVDGTLGDIPKLAEEFGLRVTLGIWISPDLERNEREIQRAIEIANSSRSVVRVVVGNEALFREEITPEALIVLLDRVRAAVKVPVTTSEQWHIWEKNPQLAKHVDLIAAHILPFWEYIPMDKAGQYVLDRARDLKKLFPKKPLLLSEVGWPSNGRMRGGNETSPADQAIYLRTLVNKLNRQGFNYFVIEAFDQPWKVSDEGSAGAYWGVYNAARQQKFNFDGPVVAIPQWRVLAIGSVVLALLSLTLLMIDGSSLRQRGRTFLTFIAFLCGSVLVWIGYDYSQQYSTWFSVTVGILLALGALGVFIVLLTEAHELAEAVWTHKRRREFLPVEGDSDYRPKVSIHVPCYNEPPEMVKQTLDALAALDYPDYEVLIIDNNTKDPAVWEPVRDYCETLGPRFKFFHVAPLAGFKGGALNYLIPHTAKDAEVIAVIDSDYCVSPNWLKHMVPHFADPKIAVVQSPQDYRDQNESTFKKLCYAEYKGFFHIGMVTRNDRDAIIQHGTMTMTRRSVLEELGWADWCICEDAELGLRVFEKGLSAAYYHDSYGKGLMPDTFIDFKKQRFRWAYGAIQIIKRHTASLLRGKGTELTRGQRYHFLAGWLPWVADGMNIFFTVGALLWSAAMIIVPTRVDPPLLIFAIPPLALFVFKVGKIIFLYRRAVGVNLKDAFCAALAGLALSHTIAKAVLYGFFTTSIPFFRTPKNADNHGFWVAISEAREEMFIMLLLWGAALGIYLVQGLPSNDIRFWVVMLLVQSLPYVAALVMAFLSSLPKPAPKVELATAE\n>tr|A0A7S1LF74|A0A7S1LF74_ALECA Hypothetical protein (Fragment) 
OS=Alexandrium catenella OX=2925 GN=ACAT0790_LOCUS8164 PE=4 SV=1\nMCEAQIQKDDGDQKKQGHTAFATATMARDLAREAGDLRAEAEALHAMALAQERLDCFEEALRYADEAMDLYLELKDKRREAGELLSMADLSLCLGDFKQALIHAEDAMSIYQELGSKSEVEAIQTVYRVLVCRGDFQAARKIANRGLKRFHDLGNIKAQSQMMFMLINLNCKEGEIEYLTDKTRNKYKDALEVTQKALRLMHQLGEKQIEARLLVVLSALCLRLDRLDGALLAGQQALKMIKETGDTPWTSSARYFIENNSGLSSSNMGDVLFTLSHAYMKKDQHEEALALAQDLQQYFRENSNRRGEAAALMTINTCYLKLDLKPEAMKVAMQAQMLFNEAGDAAGEAYVLRALMDAEWEREDYAAAVRLGERAAALFREVEDRRSEAGVLYGIAVNNIHMAVRMGARVGDGGAGQRYYGERTRAITEALAKAQRAAENGVRLCKELMQETSKAGQLLAASLATLAQVHMFNSKPATALECADEAVILFREQGDYHSEGSALLQSADALRVTGQYEEAKEAAEEALSLCQKYEDEAGVMVAK\n>tr|A0A7R8YYH3|A0A7R8YYH3_HERIL Hypothetical protein OS=Hermetia illucens OX=343691 GN=HERILL_LOCUS11551 PE=4 SV=1\nMVAVPYLFNEVYDIFRKAPFYTVVLEVLLLISVVWVIFYNNKNKRKRYTPEQEEEIIAKWQPEPLVGDTPADHPALFPRIVEGRVGKRINVDGHDCLNLATHDYLGLLEDEGIRKAAITSLRKYGVGSCGPRGFYGTLDVHLELEERLAKFMEMEEAVVYSYGFSTIASAIPAYSKRVDIIFADEKVNFAIQKGLDASRSTIYYYKHNDMKDLERLLIEQQKRDEKNPKKAAKTRRFLVAEGIYMNTGEICPLPELVELRKKYKLRLFLDETISFGTLGENGRGLTEHFNVDRIEVDLIIGGLENSVASIGGFCVGSSFIVEHQRLSGLGYCFSASSPPLLTQAAICALDRFENEPKMFAQLQESTTKLHNKLGSLTHMSLGGNKISPVKHLYIKESRDVDTERALLKEIVGKCIEKGLAVIDAQYLEHIEKHCPRPSLRITANRLLEDKDIDFAFQTLEKVSSDILS\n>tr|A0A3D9YZA5|A0A3D9YZA5_9HYPH TYR_PHOSPHATASE_2 domain-containing protein OS=Methylovirgula ligni OX=569860 GN=DES32_1626 PE=4 SV=1\nMPRIHVCSLFQIADVTAATGARSLITVINQGIYVDRPPAIAPERHLQVAISDVCEETEGHILADSGHIQSLIDFVRAWDQAEPLVIHCFAGVSRSTAGAFIAACTLNPQVNEAEIARRMRRASPTATPNIHLVSLADQALGRDGRMITAIREIGRGAECFEAEPFALELY\n>tr|W1WC24|W1WC24_ECOLX Transposase_31 domain-containing protein (Fragment) OS=Escherichia coli DORA_A_5_14_21 OX=1403943 GN=Q609_ECAC02469G0001 PE=3 SV=1\nMSKKQSSTPHDALFKLFLRQPETACDFLAFHLPAPIHALCDMKTLKLESSSFIDDDLRESYSDVLWSVKTEQGPGYIYCLIEHQSTSNKLIAFRMMRYAIAAMQNHLDAGYKTLPMVVPLLFYHGIESPYPYSLCWLDCFADPKLARQLYASAFPLIDVTVMPDDEI\n>tr|A0A811T4R2|A0A811T4R2_9EURY Uncharacterized protein OS=Candidatus Argoarchaeum ethanivorans OX=2608793 GN=EMLJLAPB_00228 PE=4 
SV=1\nMIENEKEIIFHPYALYKMNKRNISKQEVIKTLKEPHSGMDGQYGRRISQRVYGHHVLRVIFEEYEDHILVITAYPAKAERYLGRM\n>tr|A0A022PN75|A0A022PN75_ERYGU Uncharacterized protein OS=Erythranthe guttata OX=4155 GN=MIMGU_mgv1a007123mg PE=4 SV=1\nMLELRGMSELTEWLQAELRSAAPENDQRLVVFPRLEYLQIIYCRQLKSAPSHFPCLKELLIDGVESELPLVSICGINLISLTKLHIHSIDGLTCLPNCLFRKNQNLSMLVISGCRNLTHLVPCLEGGGTALRNLEIWDCPELRELPDDLHTLSALENLAIYGCSKLKTIPYPYETHNDDDDEQLLLGLSCLRRLFIEYCDELTNLPIELCAESLESLTLRGLMNLRMTMGTLIGYCMQKMPRLSELRIVDVPTTNNPWEIVGSVTLGNLRDLTISCDEYSVSAVDAILKASAKSLHRLTLLGTEHSRELPGQLQHLTALSELGLYDFGEMEELSDWLIGNNNNNNLSSSLQILHLSRCKKLRYLPSKEAMLHLTKLYISNCPMLHIKGGDSDYGSEWPKISHIPYVVLDWVQIPTHAQ\n>tr|A0A0N0T8W0|A0A0N0T8W0_9NOCA Chaperone protein HtpG OS=Nocardia sp. NRRL S-836 OX=1519492 GN=htpG PE=3 SV=1\nMETLEFQSEARQLLQLMIHSIYSNKDTFLRELVSNASDALDKLRLESFRDKDMVVDTDDLHIVIESDPAQRTLTVRDNGIGMTREDVVRLIGTIAKSGTAEFLRKAKEQQAGAGSDLIGQFGIGFYSSFMVADKVTLLTKYPHAEKGVRWESTGESTYTIEDVDDAPQGTSVTLHLKPSDDEDQLPDYTEPAKIREIVKRYSDFITWPVRLGGEEINSRKALWARPASEVTEEEYAEFYRHISHDWNAPLETIRMQAEGTFEYQALLFLPAQAPLDLFMRDGKRGVQLYVKRVFIMDDCAELMPEYLRFVKGVVDAADLSLNVSREILQQDRQIQLMRRRLVKKVLSSIKALMGSRPDDYAKLWREVGAALKEGLLSDADNRDAILEICSFASTHSAEAPTTLADYVSRMKDGQEHIYYMTGDSRTSVEHSPHMEALRAKGYEVLILTDPIDEMWVDAVPAFDGRQFQSVAKGQVDLETEEEKSAAKAKAEEFGDLLTWLQGLLEENVKEVRLSSRLTTSPACVVGDAHDITPTLEKMYKAMGQELPKIKRILELNPSHPLVEGLHKAFAAGERDALADTAELVYGLALLAEGGELADPSKFVKLVADRVQRTF\n>tr|A0A4V3UMH6|A0A4V3UMH6_9EURO PKS_ER domain-containing protein OS=Aspergillus tanneri OX=1220188 GN=EYZ11_013270 PE=4 SV=1\nMQRARVRAGKPEKLEHSSPQRFNIGAENPRKISRTKRNTRKYATFPTNSSTLTLLQPDLSSTRLELVDRPIPIANPDANEHLIRVHCTAPCAGELGWYAYVSLPDREPVPCDDMAGTVVTAPPNSPFQPGDEVYARSTFNRPGCARDYTVVVTDELARRPQNLSWAESAATPLSAETAWQALFEQSGIGGFSSSAWKGKRILVTAASSSTGMWLVQLGRIIGAQIIGTCGPNNVDLVRGLGAVDVVNYRSQSLREWGQNEENKVDLVIDCIGGQSLEDAWRCVRDQGIVISICRSPNEVKPAEVTAKEVRGLFFIMTPRRSDLEEITKLVEAGECRPLVDSVWPLEQFQSVFDRVEGRHARGKVVMDLRLNRKLES\n>tr|A0A1H5GDJ1|A0A1H5GDJ1_9ACTN Succinate--CoA ligase [ADP-forming] subunit alpha OS=Streptomyces sp. 
Ag109_O5-10 OX=1855349 GN=sucD PE=3 SV=1\nMAIYLTKESKVLVQGMTGGEGMKHTRRMLAAGTDVVGGVNPRKAGRTVDFDVPQCPNGLGGAPTAVPVFGTVAEGMAATGADVTVVFVPPAFAKAAVLEAADAGIGLAVVITEGIPVHDSVAFTSYARRNGTRIIGPNCPGLITPGQSNAGIIPADIAEPGRIGLVSKSGTLTYQLMYELRDVGFSTCVGIGGDPVVGTSHIDCLAAFEDDPDTELVVLIGEIGGDAEERAAAYIREHVTKPVVGYIAGFTAPEGRTMGHAGAIVSGAAGTARAKQEALEAVGVRVGSTPTETARLVLELLKAGS\n>tr|A0A2P7YVD5|A0A2P7YVD5_9ASCO Uncharacterized protein OS=[Candida] pseudohaemulonii OX=418784 GN=C7M61_001726 PE=4 SV=1\nMSTWQAHTDHSATSPRSTLPATKQLDSDATPRMSHLPTPLGELKLLVNNDLLRKNPNFVTSEAALSSTIEQLDLETLKISAYARLDFENYTFFVQTLQVVLGRKAVEDAAPTHHAVDVHLSSKKAISRRHAKIFYNFGTQRFEISILGRNGAFVDDQFVETGITVPLVDNTKIQIGDIPFTFVLPSLEPPEKKNATPAKPFNPSDAINLRSNLYLNPASPNRKKSLTDEQKKARRNLRADIVRRLSNARRKSLASSTNDEITALLKELEDIGDDDESDPFDKEVNELLRLGNLEAEEDELDELVKQHNLLQGIGVEDKDRKDVDVDMSVLDQEIASLAPLIDGQHPEKDAIDNKQGVYGRHGTTLATDTADNKNAPLMGRPAGPRMGKPAQIQPPANRAYGRQPVGPMYGYPNSGAYPQGYNSPYGSPAGYPTGARNSMYHPMMMPTRPPPPKLEVEVETISTVPVKSATIPFKAISTGVGNVQRPPVCVFKTLDIPLNKPKIPLRRKDAPSIKRPKSQGNKDITDQYKSKPTVSITAMITSVLRGPNSRKSGFTFSEICDGIKEFYPYYQYCPDGWQSMITHNLKTHNMFKREFKGGLDSEHLWVIDDDYLAEKERVRKKQQEVAMAKAKEAALKAVELRLKQLTPQYGAVGRPFMTPYASSFGQPRYPTSRDLSPPMPNGAPGQKPKSIAELASEIKRDSPGALNQSSYLPRLSLSPTVNSAEQSNSIKDQLAANRSASASLTNITSDVKTERSSPTPQPVAAAAAAVSANTNSGLVSKLLPMNADTKKSLGYLQKELFTLYKARKLSYNTATTTNIITKALATTIAQVNTIGAKAGCGDNALSFLVEKAPQQVSKILDIALTKSIKEVEGKLSNPTSKESTPVPTASPAASNIGLVQKPPASIESTSSASRPATPNSPAGGTPKPSYSGGLSRPHFSGMARPQNPSKPGALLKGPLFLSNKPRQEKRPAEETGEDPLKSIKLE\n>tr|A0A6P1IPK0|A0A6P1IPK0_9BURK AMP-binding protein OS=Hydrogenophaga sp. 
BPS33 OX=2651974 GN=F9K07_06005 PE=4 SV=1\nMTAQVATGWNLANIFDGVAARVPKDRPAIVHGDTVVRWGELDARSNRAARALLATGHTAGERVGFLSRNHPGYIEGFVACLKSRLIHVNLNYRYTVDELAGVLEDAGATALLYQQEFAPLVPALLERLPALRSRICLDGDGLGQATAQFQTMAAQGDASPLDASTREERDPLLLYTGGTTGRPKGVVWPGHHYRACQLESPLVQRRPANLGEHLDLVAANANPGRVLPACPLMHGAGISSTLAELLNGGTALLLAGARFDAHELWQLAERERASRVLIVGDVFARPMLAALDEQPGRYDLSSLKVISSAGLMWSEEVKAGLLRHMPWLVLADIYGASEAAGLGYAITTQDRATPTGRFEPGPRTVMVGDDGHIVPAGQEGEGWLARGEPLPEGYFGDPKKTAEVFRTIDGQRYAVPGDRVRRHADGSMQLLGRGSLVINSGGEKIYVEEVEEALKRLPGVDDVLVVGVPDVRWGSAIVALLRTDTPPDVQALRAGLAPHLAGYKMPKHFLAVDQLPRADSGKGDYKAARALAEQLLETT\n>tr|A0A7D8UVQ1|A0A7D8UVQ1_9HELO Aspartate--tRNA(Asp/Asn) ligase OS=Lachnellula cervina OX=1316786 GN=aspS PE=3 SV=1\nMTIILRAARHMIVRNTRTAVYVSPWRGAAASLVSSWLPSRGFHVSYRLAKEERWGREVEKPEDKERRGRSLEEQGVVEEQEEVEAEALKPQSFWEEFKGTSFVNLYLDNVPPPTFPFEKRIPSHFMALRVTTVGFLTKIVRLSDALTFAHINRGTGPEVLQLLSKNKETTKKLQSMRLNSAISVTGVIHKKYKPKVASKRKELEFEEGWFYLEELELEIEEITCLNTFDKDIGYGPEHVYRPENRHLQIRFDTNLQKALLYRSDVAACAREELKDFYEIETPILFKSTPEGAREFLVPTRRPGFAYALPQSPQQYKQMLMASGIHKYMQFAKCFRDEDLRADRQPEFTQIDLEMAWADGEVVMARVEKLIRALYKKFAAPDTQLQPLFQTPFHRITYDEAMSHHGSDKPDFRIPGLIQQVDHIVPDQLGKMLTHIEYPIFEACKIRLNGHPERIKKFVSMFFSTPVGEVFGKNIDGGPGVAVFDSSRPLEGLQTFGFEGAEKLKALYSNLPQQAFHGKEAHENATTFDDGDLIIVQARKNLPHSGGSTALGRLRIALYRAALAEGLLEPDLYHHYLWVTNFPMFTLENGVDPGQEGTAGFSATHHPFTAPKTAEDVDLLRTDPLMAKADHYDLVVNGVELGGGSRRIHSAKMQRFVMQEVLKMNPRRIEDFSHLLKALSAGCPPHAGLAIGFDRLIAVMRGVDSVKDVIAFPKSSKGEDMLVKSPRRISRKEWKRYHLQKIDLRTENSHKPMEKDATEKPKESKWTRFWNIVTIRK\n>tr|A0A1X1VYA0|A0A1X1VYA0_MYCGO Aminotransferase class V OS=Mycobacterium gordonae OX=1778 GN=AWC08_00950 PE=4 SV=1\nMREAFGEKFDVPAGYLDTAAIGLPFARVADTLVDTIAHWRAGALQVTDFDADVVAARNAWAQLVGVAPLDVVTGASVSQLVGLLAASVPDGTKVLTVHNEFTSVTFPFAAQQRRGITVTEARPAELLSQLRRHDLVAISAVQSADGFTVDLDELRAAAEAARVRVLLDVSQAAGWQQLRLHWAEFVVGAAYKWLLAPRGAAWMAVRRDVLADVVPQAANWSGAEDIWSGLYGLPLRLADNARRLDLSPVWFSQRGAAIALPWLAGLDLSAVRQHCVGLANATLAGLGLDPCNSAIISLGIAAEAAHRLVQAGAAISMRAGRVRLSFHLYNTMEDVELVLSALR\n>tr|A0A0C5V338|A0A0C5V338_9GAMM tRNA 2-selenouridine 
synthase OS=Gynuella sunshinyii YC6258 OX=1445510 GN=selU PE=3 SV=1\nMSRPDTDDYAAIFLHDTPMMDTRAPGEFLKGAFPHTVSLPLMTDNERAKVGTCYKQQGQQKAIELGHQLVSGTLKEERIQRWLEFARAHPDGYLYCWRGGLRSQIVQQWLQQAGCDYPRIKGGYKALRRFLIDTQERIVSNTRFRILAGHTGCAKTDLLTAVPGSIDLEGLAHHRGSTFGKRPAGQPSQIDFENRLAIALLRQDHQYPGATILLEDESRLIGRCALPETLRRRMAEAPLIIVESTLEQRVEHSFRNYILNKLAEWQQARGAEEGFTAFAEDLTTSLFKIRRRLGGLRYQELSAILEQALKQQQQGDDSLHREWIRILLRDYYDPMYDYQLSQKQGPVEFRGTATDIKNYLLTH\n>tr|A0A7K7XU01|A0A7K7XU01_9PASS SGSM2 protein (Fragment) OS=Mohoua ochrocephala OX=874463 GN=Sgsm2 PE=4 SV=1\nGVVEACLLHMLKRRAAGFLRTDKVAALFTKVGKTYAVAGDVCKKVQELQQQVESRKNQPNGQEPLKRQGSTTSKTPVLTPQAIKHIWVRTALIEKVLDKIVQYIVDNCSKYYEKEALLADPVCGPILASLLVGPCALEYTKLKTADHYWTDPSADELVQRHRIHGAHGRQDSPSKRPALGIRKRHSSGSTSEDRFAASAREYVESLHQNSRTHLLYGKNNVLVQPKDDLEAIPGYLSLHQSADSLTLKWTPNQLMNGTLGDSE\n>tr|A0A4R6GLC2|A0A4R6GLC2_9BACT Coenzyme A biosynthesis bifunctional protein CoaBC OS=Sunxiuqinia elliptica OX=655355 GN=coaBC PE=3 SV=1\nMRLKGKHIILGLTGSIAAYKAAYLLRGLVKEGAEVQVVMTPAAKEFITPVTMSALSGRPVASEFFAANDGTWHSHVDMGQWADLMLIAPVTAATLGKMAHGIADNLLVTTYMSAKCPVYLAPAMDLDMFKHQSTLNNLETLRSYGDVILEPGEGELASGLHGKGRMQEPEQLVEEVVAFFHSKKKLLNKKVLVTAGPTYEKIDPVRFIGNYSSGKMGFALAEELAKEGAEVILVTGPVHLKTTHPNIHRVDVESAMEMHNACLEHFPATDAAIMCAAVADYRPKEQADRKIKRNAGEMNIELQATEDIAAALGQLKTPSQRLVGFALETNDEKQNALAKMQKKNLDFIVLNSLQDNGAGFGVDTNKITILSKDNNAQEFELKQKTEVAVDIVKKLIGELTND\n>tr|A0A4S0Y8E6|A0A4S0Y8E6_9BACT UPF0102 protein EN806_46285 OS=bacterium M00.F.Ca.ET.163.01.1.1 OX=2563906 GN=EN806_46285 PE=3 SV=1\nMAERTLGHRRKAYRRGHRGEWLAALALMLKGYRILARRHRTRLGEIDLIARRGDLVLFVEVKARRTLIEAMEAIGHESERRIEGAADIWLSRQPDYGRLSLRFDMVAVLPWRWPVHVENAFYGRN\n>tr|A0A3G5P5X5|A0A3G5P5X5_9HIV1 Envelope glycoprotein gp160 OS=Human immunodeficiency virus 1 OX=11676 GN=env PE=3 
SV=1\nMRVTGILRNCPRWWIWGILGFWMVMSYNVVGKEDLWVTVYYGVPVWKEAKTTLFCASDAKAYEKEVHNVWATHACVPTDPNPQEMELENVTENFNMWKNDMVDQMNEDIISLWEQSLKPCVKMTPLCVTLECQDANFTKANLTNTVTNNSDSIITNGTMKDVMKNCSFNATTELRDKKNKEYALFYRLDIIPLSGENNSASGNYRLINCNTSTITQACPKVTFDPIPIYYCTPAGYAILKCNNKTFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEGEIIIRSENITNNAKTIIVQLNKSIEITCTRPGNNIRKSVRLGPGQAFYATNDIIGDIRQAYCIINRTDWSETLQGVGKKLKEHFINKTIVFSPHSGGDLEVTMHSFNCRGEFFYCNTSKLFNSNSTANESNIELPCRIKQIINMWQGVGRAMYAPPIAGTIQCTSNITGLLLERDGGNHNGTETFRPTGGNMRDNWRSELYKYKVVEIKPLGIAPTGAKRRVVERQKRALGIGAMFLGFLGAAGSTMGAASIALTAQTRQLMAGIVQQQSNLLRAIEAQQHMLQLTVWGIKQLQARVLALESYLKDQQLLGIWGCSGKLICTTTVPWNSSWSNKSQNAIWGNMTWMQWDREISNYTDTIYGLLEESHYQQEKNEKDLLALDSWQNLWNWFDISKWLWYIKIFIMIVGGLIGLRIVFTVLSIINRVRQGYSPLSFQTLTPNPRGPDRLGEIEEEGGEQGRDRSIRLVNGFLAIAWDDLRSLCLFSYHRLRDLILVTTRVVELLGRSSLRGLQRGWEVLKYLGTLVQYWGLELKKSAISLLDTIAITVAEGTDRILELLQRICRAICNIPARIRQGLERALL\n>tr|F6HXQ9|F6HXQ9_VITVI Uncharacterized protein OS=Vitis vinifera OX=29760 GN=VIT_09s0002g00830 PE=4 SV=1\nMGVSFKISKTGSRFCPKVVLSDAPLNEEEEEIAKENSRIPDRNESLSNSTTRKLEADIIEGDEDVAGISGSSISSGGLLIPSDNEVSFTLNLFPDGYFIGKPSENETTHQAMLQDVPKLLHPYDRTSETLFSAIESGRLPGDILDDIPCKYVNGALLCEVRDYRKCASEPGFSVPCADGLPIVNKVCLRMSLENVVKDIPLISDNSWTYGDLMEVESRILKALQPQLCLDPSPKLDRLCEKPVPAKLNLSLSSVRKKRLRQMPEANITSSNKIHVKKISMDRAGESLNGRLRDSGPMSGAVMAQHVHENLAAQNVGPINILTPGPKSFVQDASNPALPLASPRSKYQVSVGNPKIMQDHGSGSVVNASGASSSIQDMMISYTDNVHGKRENQDDQLSPLSNMTKRQRLTAVGPEGIQQQHLVPHIDSFHGSDLQWKNAALLPHQLNARGNPYANTGIQKYPQQVFDGVLNQEAASASFAETEKLDRPELNRVKNDMHMGEIESNHLDPQQSRLQSRLPQQIPFMRSNSFQAPWNNITQHIEKDPRKERKLVQSPRVSAQGLVQSPLSSKSGEFSSGSLGPQFGPTATTAVLGASQKDKPAVTSVPPVVGTPSLTSSANDSVQRQNQMQIVPKRRSNSLPKAPAVGSPASVGNMSGPSNANSPSVATPPSADQTMLDKFSKIEIVVMRHQLNCKKNKVEDCPVKKPTFSPQELLGRLSMASHNEDIKDDTCKMPLSKSLAGGSMNVCKLRVLNFVQAERVVQGSVVSVVPRARSTMIMSEKANDGSVAVHHGDVVDGDFLSAEDYVSTLPNTHFADLLAAQFCSLMNREGYHLMEDRVQPKPARMNLASSNQSNAPGISPNNSAAEMQQYSETASGQPHNEVAKPTNSGNTPLNASQNLLANSRMLPPGNAQALQISQGLLTGVSLPTRPQQLNPQPLQQPQQQNPQSLIQQQHSQFQRSSLMLPTNPLSHLSAMGQNSNMQLGNHMVNKPSATLQLQMLQQQQQQQQQQQQQQQQQQQQQQQQQ
QQQQQQQQQQPMQRKMMMGLGTAVNMGNMGNNIASLQGLGNVMGIGGARGMGSTGISAPMGSISSMGNVGQNAMNLNQASSVTNMLGQQFRNPQLGTMAAKIRMLNPAILGGRQAGIAGMTGTRQMHSHPGSTGLSMLGQNLHRPMNPMQRTGMGPMGPPKLMTGMNLYMNQQQQPQQQFHLQQMQQQQQHHQQQQLQQQQLQQQQQQLQQQHQQETTSPLQAVVSPPQVGSPSTMGIPQQLNQQPQQQQPQQQQASPQQMNQRTPMSPQQMNQRTPMSPQQMSSGAVHPMGTGNPEACPASPQLSSQTLGSVGSITNSPMDLQGVNKSNSVSNT\n>tr|A0A7Y3TR66|A0A7Y3TR66_9FLAO IS701 family transposase OS=Flavobacterium sp. CLA17 OX=2724135 GN=HAV12_33835 PE=4 SV=1\nMPASRAARPTIHFVDEYCQLYEDLFPEVRSYEAFKLLHLGMISEIKRKSLPAIAKAVGLNNQQNLHHFLTESPWQVQQLRQKRLELTLKVLNGRSLILLIDETGDCKKGKSTDYVKRQYIGNVGKKENGIVAVTAYGLVDGMIVPLSFEVYKPRERLKEGEEYQSKPQIAATMIRQLQALGFEFELVLADSLYGESKVNFVDVLDELNLPYILAIRSNHALWLPQDQEVYQEPWQTFKRTFSNGTTETRHMAEVIYGKSHRKQYWLLTTDPDTLPDNSTSYVMVCAPAIKLKDIGDSYGFRTWIEYGLKQAKDALGWADFRMTRYEQIEKWWELVMSTFLMVSLFADPFNDSCPLAHQRFSQHPWWNNQSGWKNLLNNLRLVIQPLVCFNWLKHWLTVFPIASLQLGFEQLTQKMNQFICPRVHQLNLQLIFSSA\n>tr|A0A7G3FQZ2|A0A7G3FQZ2_9BACT CsbD family protein OS=Roseivirga sp. XM-24bin3 OX=2133949 GN=DCO95_02490 PE=3 SV=1\nMSATTDKLKGNWNIIKGKLKQNYADLTDDDLTYTEGQEDELLGRIQRKTGKTKDEIKDFIDSI\n>tr|A0A2T0UIC1|A0A2T0UIC1_9ACTN Acetolactate synthase OS=Glycomyces artemisiae OX=1076443 GN=B0I28_10654 PE=3 SV=1\nMSTPVKAPKPGPQAGSAGTQAAKAQPARPKAPRPAPPLGAPAAAPVLTGAQAVVRALEELEVEAVFGIPGGAILPAYDPLLDSEKVRHVLVRHEQGAGHAAQGYALATGRVGVCMATSGPGATNLVTPLADAHMDSVPIVAITGQVASTAIGTDAFQEADIVGITMPITKHSYLVTTGEEIPRVLAEAFHVASTGRPGPVLVDIPKDILSGSAPFVWPPKMDLPGYRPTTQPHGKQIREAAALIAEAKRPVLYVGGGVVKSGAHAELRELAELTGAPVITTLMARGAFPDSHPQHLGMPGMHGSVPAVHALQKSDLIVALGARFDDRVTGKLDSFAPEAKIVHVDIDPAEIGKNREVDVPIVGDCRAAIAAMTEAYADPGKERLKTWWETLDDLRGRYPLGYTDIDDGLLSPQYVIERLGALAPEDTIWTAGVGQHQMWASQFIKYETPGTFLNSGGLGTMGFAVPAAMGAKLGEMGRTVWAVDGDGCFQMTNQELATCAVEGIPIKVAVINNGNLGMVRQWQTLFYDKRYSNTNLSTHHSEASPRIPDFVKLAEALGCVGLRAETPEEVDAVIAQANAINDRPVVVDFTVGPDAMVWPMVPAGVSNDEILYARDVRPNFDDEGEI\n>tr|A0A1Z2XRM7|A0A1Z2XRM7_9FIRM DUF3502 domain-containing protein OS=Acutalibacter muris OX=1796620 GN=ADH66_10645 PE=4 
SV=1\nMSKKILCLILTLALLATCFVGCADKGESKKESSSTPESSAAESSETQSSDTGDKTTDEEPYTVHFAYYIAKESPNMGALSDAVNELAMKELNMKVDLQALTQGTYHQQIPMMLAAGEPMDVFISRASEVGTFIESQYILDCTPYLDKMENAKAALGDDIQACYIGDFLAGFGSMAERATPGAMVVRKDIFDELGFKKEDFDYTLPNMGVLDQITEMYAKVKEKYPDMICFDGTAVPASCAFCFVDNLSSSFGVLETPESTTVVNWFETDMYRRLCEAAMEWYNKGYSSKDIAVNTDGGDVKMKGGNCFSYFQSWKPGVETEKKSQTGYDVEMIQLIDAPKTSYNVNTRLWSIANSSEDPEKAAQFLDWTYKSGEFTDLINWGVPGTDWVLNDDGQADYPEGVTAATVGYHNDKGFSYPNQFNGTLWAGAPKDLWEQYETWHATLKESAAFGFAFNSMPVATEMATLQTVYDKYQKTVGFGTLPDLDAAIQEFNDALYEAGLQKVLDEKQKQLDEWLANK\n>tr|A0A0Z8MB24|A0A0Z8MB24_STRSU Membrane protein OS=Streptococcus suis OX=1307 GN=ERS132461_01172 PE=4 SV=1\nMKKLLTNHFFYLTIAFLLILVIYFSGIDKRWIILASFLYFIPSQILYRRRLKERLQEDQPK\n>tr|K8FB40|K8FB40_9CHLO ATP-binding cassette transporter OS=Bathycoccus prasinos OX=41875 GN=Bathy12g02760 PE=4 SV=1\nMSAVDHRKENVEDPTNRLEQYASLCRDELEAHGGKLPSVEIKCDFDYTLHLPANKIDRSIKTVPGVLTDVAMKIPNKVREKISGKENDATKMEPFRVLKDVDCCFKAGSLTLVLAPPGHGKTSLLKAVGQILPSAVLSGGKGVTYSKMTAEELKEKDIDANRMAMYVTQQDEHLPFLTVRETTKFSHENATPTPTNEREEDVHSRKIDSVHRLLSLENCLDTIIGNDLVRGVSGGEKKRVTIGEAMVTNARVFCMDEISTGLDAAVTHNIIAALREWTRITNGTVIVSLLQPTPEVYELFDDVLCLRDGTPVYHGDVDKVVDHFCGLGFDSENAKKGDVADWLLSVLVDPLAHSKTGASNQFASGDGLRKGWVENSNGLYKKSIGETDCVDKSDGKNMIDLRTPFAKAQYSTAYPKAWPSMYKSVIKRQFQITLRNKVFLSARMFGALITSVVLGSVWFDLPLDRGFERLGMLLFCVLHISFSNFSELTFSVEQKYVAYKQLDYKLFPTFAYIVSSIATQLPIAVLETAIFSCILYPMVGLSMEFENWLVFFINLTCANVAMASFFRVVALLAPNMEAAQTFPGPVIAIMVIFAGFLISPEKMGVLHFLYWISLFAYSLRSLCQNEFLSDQFKYKVPLDPTAAAVYVQGYTGDPKTMAEFCEENAFPCEDAGKITLSTIDISSDKKYFWAGPIFSIGFFCLMTAIGYRALSKIRIQRNIGSSRTSSSEKKKDGENAEEVSISISKVDAEASQRALSFTPMSITWEDLEYTVKVPGEDGKPLSGSKKILNSVTSAAQPSRMLALMGASGAGKTTLLDVIAGRKSGGEMRGTIKLNGHVVKKETFARLTAYCEQQDLHNAFTTVKEALEFSATLRLPSDVSKDARKAVVDEALDILELRGIENRLIGVAGSPSGLSPGQRKVLTVGVELVSNAPVFFLDEPTSGLDSRAALIVMREVKKVANLGRTVITTVHQPSKEIFNLFDDMLLLQRGGYQVYFGPCGVNGKTFVDYLQKIPNAHALPDGMNPASWMLDVLGGTDSSNAGEKSALKKSKSTAAGSLQPAMTMKRSGSGGALNGLLLVERFKASQEGAAGTRLVKELCAKGEKSEMFAFASPYARSFLAQLRCLIQRASLAHNRDVAYNLGRIGILFVLYLLFGFVYFDLDASNETGVQAMVGVIFMTSIFAG
IIFMNSVMPVRVRERAVAYRERTSFMYDAVPYSLSHAICEVPWVLLVTFVTVTPLYFMVGLVPTFEHYIFHVLMVFTVSMAFMSLGQLIACLCATIQTAQAGASAFIPICFLFGGLYLPYPQIPVYWKWAYFIDPVAYAIQGVTAPQFEHRGCTGAYPDGDCPTIQAFRGTYFETVDTLAYVEEKYDVQLSQKWYMLIYVAIFVLCMQTLHIIAFKFKKVVAR\n>tr|A0A0B7H5Q7|A0A0B7H5Q7_9FLAO Uncharacterized protein OS=Capnocytophaga cynodegmi OX=28189 GN=CCYN74_10172 PE=4 SV=1\nMNYILPFLSIITGFGTVLIFKPKNQRNIKLLLAFSGAFLLAMTVFTLIPEVFHSLEHSHEHDIHDHNTGKKIGLWIVIGILLQIILEFFSKGAEHGHMHHPHSELKNAFPWSLFISLSIHSILEGFPLHHHHHMVYGIFVHHLPIAMVLTIFFLDSGIGLKKTFIFLILFALMTPFGTLLAEFIPQLGRYHIQISAIVIGIFLHISSVILFETSENHKFNHIKLGTIILGFVAAYFT\n>tr|A0A7I6VAI1|A0A7I6VAI1_AERCA Membrane protein OS=Aeromonas caviae OX=648 GN=WP8S18E04_21180 PE=4 SV=1\nMNLMLYVSTVLIWGSTWIAIAWQLGPIPIEVSVLYRFALAALALFALLTVSGKFPRLPWAGQRYAALLGALLFSTNFLCFYHATLYIPSGLSAVIFASASIFNGLNLWLFEGKRPGLRWLQGSLLGLLGTLLLFWPVLADAQLGANGWKGLLFACAGTLCFSLGNLVSARGQRQGYHVLQMVPWGMVYGVALLQGWVTVLGQSLTLPTDPRYLAAMVYLAIFGSVIAFTAYLTLVGRIGASKAAYATVLFPLVALTLSTFYEGFVWQTVSIVGVVVSLIGNLVIFAPPVKAWRWPLSRAANGTCP\n>tr|H8X476|H8X476_CANO9 Histone-lysine N-methyltransferase, H3 lysine-36 specific OS=Candida orthopsilosis (strain 90-125) OX=1136231 GN=CORT_0C06550 PE=4 SV=1\nMNGNTKNSDYASPLFLDVEDKTEEALTKFQNLQISTYQSKSIAAPSNNKRPEYMTCDCEEEWDGEQEKNLACGEDSNCINRLTSVECTNRHCLCGDDCQNQRFQKRQYADVSVFQTELKGYGLKANKPISEGQFIYEYIGEVIDEGAFRQRMIEYDVKNYKHFYFMMLKPDAFIDATEKGSLARFVNHSCNPNAFVDKWVVGDKLRMGIFAKRKIAKGEEITFDYNVDRYGAQSQPCYCGEPNCIKFMGGKKQTDAALLLPEGIAEALGVTSRMEKAWLKENKHVRADQQKDDSTINEMFVQSLEVEPMQDADVSKVMAALLKSQQVSITRKLIMRMHMTDDPTVNSLMVKLHGYKTLSGVLQGVEDEDLIKMILEILSKWPAMTKNKISSSQIEDVVKEIEANSTNEEIRQLASDLLAQWSVLEMAYRIPKTQASDKSLMESYGRVSRSPEHSNGNTSGVINHDQSNFAQYSTNVSQVYSATLPKGPASVPNFGLPENWQAQFDPNTQKYYYYNVLTRETTWDKPGVSIPTRPKLPTGPSSMINQQPQTSHSSQYQNGPPSRNNNIEEEIARREEEKERRERESRAQELLNKERKLRELIEQAQSVKSTPEPEKKSKHKHKHEHKHRHGRTKSHEGKGTAALDDDARVSKESKHKSSSHQHKKKEVKETSLEAQWKHIMAKHVPNLLKSYVEEIGKDNVKGCAKEIVNNLASREAHKGVPPSSSKELDKHKLKKLKEYSDTYMDKFLSKYRSKHHGKRKLGEDEANATSREESRGIDSNVSLSNIDTNGEVESEENKKVKLDSGV\n>tr|A0A5N5DU29|A0A5N5DU29_9PEZI 
Inner centromere protein mis6 OS=Lasiodiplodia theobromae OX=45133 GN=mis6 PE=3 SV=1\nMHATIDALRTASTLPAKQRGEKVNAVVDAVCSHAYQHGLSRDHLQSIVAIVTRRNHLDQTSLTNLIKNLYPADRVSSDIVLAIVGSLGHGQAKPSAATQAALLKWIIAVIDALQDATVLSKLYGVLFNMLDTMTLRTPLCHLLSLITRRKHVRPFRIQQLLEMVRGSGQDPALVGLLRVYKDYYPEIIVGNAASGRTSFASAAQDEWRQRLQVIQDANADSNEQLYAQQDGFKVIRRGAKRAKASILPDVHTSYANEKSVTLEEVNSADGLVKNLERIELPNQLLASFKDPLLQKYLILKPSDTAARRLELWLESYLRETLETISSGTKNPDHFDELLDGMLNYTKATKDFKEFKASYLNPAEAAIVTSGTVDAYDRLVTFYTALVQNWNHAANTSRPDSGDAANDLITSTDFTGLTTHISNTILSLLTSQSHTPISTTTTILTYYTTLSTLSSGLTPLTIPTAPTLYTLLFQPSLATLSQLCTLLATYKRAFEADLQDHTTTAANLPRAVTNAFNGYLMDVANLLWRSRALTSTDPNAMACLCAPGVAAALHAYISTTLPPVLIPSANDNTTAPAPGTGPDYTLAALFGLPHNALTAPLARAAFRDLEDAHHGTSGSSNAPRHPPGPVTQRTLHRLARAGNNGNGNGNGNGGGAAGGGGGGLELSWKAYRVCVLEWLAERGVRGLRDFMFVTMKDLMKESAAAAAAAAAKTGATTTTATA\n>tr|A0A559MAT3|A0A559MAT3_9HELO VPS37 C-terminal domain-containing protein OS=Lachnellula willkommii OX=215461 GN=LAWI1_G004602 PE=3 SV=1\nMSSPSTAYPPYQPHRNSQSFDPNAPPAPPPKPSSQEVSRRSTPAGSQPLPPPPPPQPEGFGTYGASDDPRSFQQARFSSSEVLYAEQIQDPGERWLPKILEDKTFVTLRHKIKQDLADVLAKPDLLAALAHSTSTAHASIASAQEPLQAALTENIALASHLNELEARLAHLRSSTQAQLLSTHALERQWKQKQSDMDRALAPFSPSSLYQRLSQAVQEQEMVCRALEESFLEGDGGTATEREVVEWVRRYREATKVYYSRRERKERWDEGRVGGWR\n>tr|A0A3D4HVI7|A0A3D4HVI7_9BACT Uncharacterized protein OS=Patescibacteria group bacterium OX=2052139 GN=DIV45_01950 PE=4 SV=1\nMAKQLKLFEKSVKKKQLTKKLVVLGKKKGNFSCQARVPFSEPVGSPNRRSGPEATKLRKYPLKSLPLKKGRRGGDVNLLAPSSPSPSSGRRGEKRHWHWTDYFVSSPLKITPKKKRKTPVVFVMMSGGVDSSATAYLLKEQGFEVVGVYMKNWSFPIKRIDECPLYQDYKDMVKVCKFLKIPYQVWSFEKDYRKRVIDPFFKGYEAGLTPNPDVMCNTEIKFDDFFKKAMKLGADYIATGHHIRSRCADPRFSRHSGESLGRLQNLIIRSWTSQDDDAKXXSG\n>tr|A0A1X0VXM2|A0A1X0VXM2_9GAMM NGN domain-containing protein OS=Rouxiella silvae OX=1646373 GN=BS639_21155 PE=4 SV=1\nMKNWYLVYCNYNQEDRAIINLERQGVQVFCPMLSQDNHSPHKKGGYMFPRYLFCLFNPEVTSKTTINSTRGVSQLIKFGGRQEIIPNIVIESLMFYIERSPEAEFKGGESPNLKKLSEDLSAIIKGILSECESDKRVLLFFSLYSLIVRDIAKEIVKIPVKK\n>tr|A0A1F1KDD4|A0A1F1KDD4_9MICC GntR family transcriptional regulator 
OS=Micrococcus sp. HMSC31B01 OX=1581073 GN=HMPREF3105_05090 PE=4 SV=1\nMSRTGIGTVSLGSAPVSKADRAYQAILEGIRDQRHEPGDRLVLSQIAAELGMSVVPVREAIRRLQSEKLVAYERNVGATVVGIDPVEYRHTMETLALVEGFSTAQCAPHVTAEDLAAAREVNATMRAMTESETAWDPVTFTELNRRFHSILFEHHQNEHVHDLVHRGWNRLAALRSSTFAYVPGRAVASVDEHEHLLRLIEDGARFEEIEAAARAHRLNTLRAYLEHSAEPSA\n>tr|A0A7C4I6T5|A0A7C4I6T5_CALS0 TatD family deoxyribonuclease OS=Caldiarchaeum subterraneum OX=311458 GN=ENM30_04935 PE=4 SV=1\nMIDVHCHLTEEPLLSNLGEVIMEAKKSSVEAIITSGIGPADCEKVLSIVDGVYIYGSLGIEPYALEGYEKVIELIMRNRERVVAVGEVGLDYYWGKKETREMQAKVFREFIELAKSLDLPLVIHSRSAGKYALNILIEEKAERVVMHAFDGSAGEAERGAAKGYFFSVPPSVVRSEQKQKMVRRLGLENLLLESDAPVLGPERGVVNKPSNIAISAKAIASLKNIPLDKVVEKTTENAKNIFRI\n>tr|A0A2E7SH61|A0A2E7SH61_9EURY Thioesterase OS=Euryarchaeota archaeon OX=2026739 GN=CMA77_02820 PE=4 SV=1\nMTSDEIGVQRKFAPTSICFGCGPANEKGLQINSTRIEDGLELWFTPSSEHQAFPGMINGGIIGTLLDCHGNWAAAMSIMDARGDSEPPCTVTASYSIQLRRPTPADIPLHVTARVIELQDDRADVEMELYAEGKLCAKGKGLFVAVNEGHPAYHRWG\n>tr|A0A1J0GT11|A0A1J0GT11_9CAUD Uncharacterized protein OS=Arthrobacter phage HumptyDumpty OX=1913080 GN=SEA_HUMPTYDUMPTY_66 PE=4 SV=1\nMSLTRKERENNLVCRHCGRPIVRNTGPRHRWARALPKMEWLHNAKDFDPSKPIDCFTPEPKA\n>tr|A0A7G9IUQ7|A0A7G9IUQ7_MACNE NADH-ubiquinone oxidoreductase chain 5 OS=Macaca nemestrina OX=9545 GN=ND5 PE=3 SV=1\nMIMYTPIMMTTLISLTLPIFASLINPSKKHPYPNYVKTTVMYAFITSLTSTTLFICLNQETTIWSWHWMMTQTLNLTLSFKLDYFSMMFIPIALFITWSIMEFSLWYMSSDPNIDQFFKYLLIFLITMLILVTANNLFQFFIGWEGVGIMSFLLISWWHARTDANTAAIQAILYNRIGDIGLILAMAWFLLHYNSWDFQQMLALNSNPSSLPLMGLLLAAAGKSAQFGLHPWLPSAMEGPTPVSALLHSSTMVVAGVFLLIRLHPLMETNVLIQNLTLCLGAITTLFMAICALAQNDIKKIVAFSTSSQLGLMMVTIGINQPYLAFLHICTHAFFKAMLFMCSGSIIHNLNNEQDIRKMGGLFKTMPLTSTSLTVGSLALAGMPFLTGFYSKDLIIEATNTSYTNAWALFITIIATSLTSAYTTRTILLTLTGQPRFPALTNINENNPALLNPIKRLTMGSMITGFLITNSIPPTSPLQPTMPLYLKLSALYATALGFLAALDLTLMTNKLKMKNPSQTFKFSNMLGYFPTTIHRMIPYQNLLMSQNLALLLLDLTWLEKSMPKMISQTHITTSMTVSPQKGMIKLYSLSFLIPLTLTLFLMM\n>tr|A0A2D6YFP4|A0A2D6YFP4_9DELT Ribosomal RNA small subunit methyltransferase H OS=SAR324 cluster bacterium OX=2024889 GN=rsmH 
PE=3 SV=1\nMSEPRFRHLPVLLAEVLGSTPANSKNLLDCTLGGAGHSRALLGKFPKANLYGIDRDPAALAASRHRLAEYPGVTAIEQASFLELPYWAEKWRKPFDFILADLGMSSEQLAAPERGFSFLQEGPLDMRMDPFRQVETATQILQQRSEFEIRRLLQTYGEERFAPQIARAIVQHRANAPLVTTSELAELVERVIPRKFQKPNFHPATQTFQALRMEVNQEPQEINALLDFAIENLQPGGRLAIISFHSLEDRPVKQRFREWERPCRCPSDLPRCVCGLQALGVSLQRKPIVAGAEEIEKNPRSRSARLRVFERNAVCFPGXXKXSRN\n>tr|G3NV60|G3NV60_GASAC G_PROTEIN_RECEP_F1_2 domain-containing protein OS=Gasterosteus aculeatus OX=69293 PE=4 SV=1\nMNNVSVVRFFILSGINETNDYRVTLFTFTLLYYCIILILNTSIIMIIILDQNLHEPMYILLCSFCMNGLYGTTCFYPKFLLDLFSSSQQISYEWCLLQAFVIYSFPCYELSILAVMAYDRYLAICRPLHYQSVMTKRKVSQLICFSWFTPFCILSINIVLTSRLKLCGVNIDRLFCVNWKIVQLACYESDTFSNNITAYFTMLIFISHGLFVVWTYMHLIRTCVKSKDDRVKFMQTCVPHLVSLVTFIVAVVFDLLHIRFGSKDLPQSLQNFIAIEFLLIPPVMNPLVYGFKLKKIRNRILVYCPDAEATASLPGVQKRTPSKTVMHLCNTSSQRTTKNQSCILILSH\n>tr|S9V0M4|S9V0M4_9TRYP Npa1 domain-containing protein OS=Strigomonas culicis OX=28005 GN=STCU_11365 PE=4 SV=1\nMCTHGFFTHIIEDAADLLQEGSEAGMRLAREAIHTFETQFITSKSVSTHQKRAVLLGQRSILRLLVKALEYAPAAETAAQVLYRIIVELAESPSDYASSHLESVSGQGMPNYLLFTLLRQLRPKCSPLASHLVLFLLHTAPDLIRPFFARVSVHMTEEGGSTAMGRVAASTARVATLNVMTRILQLPLPYHLAARQATLEPVATKVRTFYTMSPREVADEICPAWVAEYVHRLVNGSTNLLMLTFAMQLTQAALIRAQAVMRVVAEIQEVARRPRGDGAGRALGGRRRRHAGRRDRLGGLQRPRACAAGGGGAQTRGVLAPHDAAAAAAADPARGGGRRRRREGAGEDGLCVPPHAPPHGPVRQGARAAAAVAERGARIAPAVHAVAAADRAGAAGRQRRFPVLAGDLHLGPLRAAHR\n>tr|A0A096XL47|A0A096XL47_9HYPO DNA-directed RNA polymerase (Fragment) OS=Thyronectria aquifolii OX=1491451 GN=RPB1 PE=4 SV=1\nVKKILEIVCHNCSKVLADKSDPEFVAAINTRDPKLRFNRVWAVCKKKRRCENEDRSEKKEKEEEYAPGLKPFVVENHGGCGNVQPQVRQAALQLKAAFEVAQEDGPKKKESMPITPEMAHGILRRISEADLRNMGLNSDYARPEWMVITVLPVPPPPVRPSISMDGTGTGMRNEDDLTYKLGDIIRANGNVKQAIREGSPQHIARDFEELLQYHVAT\n>tr|A0A1D5P1X9|A0A1D5P1X9_CHICK FHA domain-containing protein OS=Gallus gallus OX=9031 PE=4 SV=1\nMSVTSWFLVSSTGIRHRLPREMIFVGRDDCELMLQSRSVDKQHAVINYDKEKDEHWVKDLGSLNGTFVNDVRIPDQKYITLKLNDVIRFGYDILPL\n>tr|A0A2J8WE22|A0A2J8WE22_PONAB ARL8B isoform 4 OS=Pongo abelii OX=9601 GN=CR201_G0011344 PE=4 
SV=1\nMIRLASWVWLLPPAGVRPCRAGAPRSRWRVRAEARSCGSRRRRRSSVLLSVLAPGRHHAGAHLPPAGLVPFALLEGGDGADARGAAVLGQDHLRQCHRVRSIQ\n>tr|A0A1V8U653|A0A1V8U653_9PEZI Uncharacterized protein OS=Rachicladosporium sp. CCFEE 5018 OX=1974281 GN=B0A51_10502 PE=3 SV=1\nMGEASVVASQWRMVEVGRVVLFSNGPFAGRLAAIVEIIDHKRVLVEGPSESKDLLVPRHSSPLAALSLTRIVIEKLPRGAGSAALQKLWQAQEVEGTWNKSTYALNKAKTMRRRELNDFERFKAMRLKKQVRFQHRKSFAAAKASA\n>tr|A0A7L3JVW9|A0A7L3JVW9_9PASS LTK kinase (Fragment) OS=Drymodes brunneopygia OX=626378 GN=Ltk PE=4 SV=1\nWAGGGGGGGGATYIFRQKDGIFEPLLIAAGGGGKAYLKAQDNSLDDVPLEQFENSTAVPGVSGRTGAAGGGGGWQDESLLPQAGKSLLEGGEGGQACPQALAKLQWTTSGGFGGGGGACTSGGGGGGYRGKSAGA\n>tr|A0A7J7IY04|A0A7J7IY04_BUGNE SLC39A1 OS=Bugula neritina OX=10212 GN=EB796_022902 PE=4 SV=1\nMKAATNTENTRRKSMLDRCISFLSCFAAGVFLGTCLLDLYPEVQTKLYSAVTLYISKDSKFACYPFGEAVMVAGFFLVLIVEQMVLALKEMSVESSTPANQNSQPGSSSQSKRVTYDSINSTTNEYAEHERLLRSNSRDNTQSRSRLGSLSSIRSIESRNNVHSQSDDQHEHSMHHDPSSHSPIRSLIMLAALSLHSVFEGLAVGLQDTEEGVLSIFGALILHKCIIAFSIGLNLVQSKLAVKAIIVSNAVFCFASPLGIAIGILITDFNSDADSSLLVNGILQGLACGTFLYVTFFEVLPHEFNKPKDRLLKLLFVIVGFAFVNGVLFLEMFLSKEPGCD\n>tr|A0A7I6S0I5|A0A7I6S0I5_9ENTR DUF446 domain-containing protein OS=Klebsiella sp. WP4-W18-ESBL-05 OX=2675713 GN=WP4W18E05_35930 PE=4 SV=1\nMTRHDSLRDQLLLIETLLRQHQHWQDDAPHESAFASDQPFCMDTLEPLEWLQWVLIPRMHQLRDSGMPLPKDFAIAPYYEMALDAAHPLRAIILPPLEQLDAFFTSDPH\n>tr|A0A2L2NMZ0|A0A2L2NMZ0_9NOSO Histidine kinase OS=Nostoc sp. 
'Lobaria pulmonaria (5183) cyanobiont' OX=1618022 GN=NLP_1471 PE=4 SV=1\nMEPRHIDTEVTRLEALRQYQILDTEPEEAYDNLAQLAAFICGTPISLVNFIDENRQWFKAKIGLDVSEMPRNVGLSYLCQEQRNVVVISDTLADEKLASNPVVTGYPYIRFYAGVALITPKGDMLGTLCAIDQVPRQLSQKQVEALVGLSRLVIAQLELRRHVIEVSKVTEKLVAHEQAACAQSEATKTRITNLLESITDGFFALDQKWQFTYINGQAEQLLQKTRNELLGKNIWEMFPEIIGTTFDCEYHRAILEQVSVEFEEFYLPQQQWLKVHAYPAKDGLSVYFQNVTERRKTAEALRESEERWQLALNGNNDGIWDWNLKTNEVFFSTRWKEMLGYKDHEVSNRWDEWTKRIHPDEQDWVLQAFQDHFATKTPFYVCEYRVQCQDGSYKWILDRGQALWDTLGDIVRMVGSYTDITDRKRADEELKRQNLRSQLFAEITLKIRESLQIDEILKTSVTEVQKLLQADRVLIFRLEIDGSGTVVQEAVLPGWPVILGENIFDSCFKEEYIERYRQGRVSVMEDIEAAHIQPCHRKFLQQFAVRANLVVPILVRDGIWGLLLAHQCAAPRQWNQFETDLLQQLANQIGIALSQAQLLEKETQQSQELTRSNAELEQFAYVASHDLQEPLRMVTSYLQLLERRYKNKLDANADQFITYAVNGASRMQTLINDLLNYSRVSTRGQPFVPVDCSAVLEQVLANLQLAIADSKAVVTHDTLPQIMADATQLTQVFQNLIANAIKFCQNQQPRIHIGVARGDTNINGESLNVIPSADEWLFWVRDNAIGLESQYAERIFIIFQRLHGRGKYPGTGIGLAICKKIIERHGGQIWVESKPGQGSTFYFTIPDRALKQSSTL\n>tr|A0A4S4NBC8|A0A4S4NBC8_9RHOB Alpha/beta hydrolase OS=Aliishimia ponticola OX=2499833 GN=E4Z66_11820 PE=4 SV=1\nMPNYFETAEGRRIAYHKTEGAGPTIVFLGGLKSDMEGTKAVHLEAWAKAQGRAFLRFDYSGHGESSGTFEEGCIGDWHQDTLAAIDNLTTGPVVPVGSSMGGWQSLLLARARPNRIAGLVTIAAAPDFTEDGYWAGFSEAQKALLDSQGYVELPSDYMEPYHVSKRMIEDGRTHLVLRTPLALPFPVRCLQGTADTAVSTETALRLLDHADCEDMRLTLVKDADHRFSDPRCLAMIEAAVSDVLGI\n>tr|A0A6I4G232|A0A6I4G232_AGRVI Chemotaxis protein OS=Agrobacterium vitis OX=373 GN=GOZ89_08175 PE=4 SV=1\nMTARRSLGARSGFSSFAFYGVLLTLAVGGPVACAGQAYAAGPNTPASNGPSTAPVAGTTGPAKSLPAGGDSDNLPPYLMLRSLQFVQDSVVRGDHSAADMQRFLLTRIDKRLRTAVSSDFEDPRNVDAALIYTMSGGNPATLDYLVARDVDGHFDNRVSDMLRKYLSGKGVLVASSLGEMVPLYQNGRVGPYIALVAGNVTLVKDPAAALKFFDIARLVAPGTIVEEAALRRSFQIAMDTGQNRRAMAYANRYARRFLYSPYASQFADLLVQLVVDHFSELDKNDILATLATMDPDRQREVYLRIARRATINGNQALASLASSQAQSLAGLPDKNDPQALLYGGAALISTTDVKNALSTISQLPKDQLSASDNALLEAARAVAQEIITLPTAPQSPSASPSTPPPSGDYTAPDAPANVSDQQDPGAPANAKANVVPDAGVGTAPVSPASADAKQKPDPEFQTFMSGGRSKLEEIDKMLKGEGVTK\n>tr|A0A4Q3Y2I0|A0A4Q3Y2I0_9PROT ATP-binding protein OS=Alphaproteobacteria bacterium OX=1913988 GN=EON59_07995 
PE=4 SV=1\nMIVGLDEPAFREKLKALLTPAQPISKPEHLHGRDKKLMLIDRALNSPGKHIFIFGDRGVGKTSLARTAAAIHAADEEGFAFIACDQGTTFFDMVEDIYRQLHRLYSLGKFKMDGIELSVPFLKIKANEAFGLPALRTINDAIETLKTIAPKDGVTPVVVIDEFDQLRSDTEKKYIADLIKQLSDQRINLRLIICGIGSSLDELIGVHLSTDRYLATIPLEPLPHDARWQILRTASDALGVTLDRNSEVRIGQLSDGFPYYVHLMGEQIFWQVLDDPKPIKSVSMEHYATGIRASIEEAQTSLKQAYEIATQKHKNSEDYEQVLWAVADGGILKRQVSEIYEKSYLPIMDQFEGRNPLPKNLFYQRLNRLKKATHGSIVIGSSTGWYGFKENVVRGYVRLRAERAGVEIGVDHILG\n>tr|A0A7C3NPT6|A0A7C3NPT6_9CHLR Dienelactone hydrolase family protein OS=Chloroflexi bacterium OX=2026724 GN=ENS08_10630 PE=4 SV=1\nMYQTHMYEGMLAETITHHGYQAEVINAYFARPLGAGPFPGMVVIHHMPGWDEWYREVTRKFAHHGYAAISPNLYYRAGHGTPEDVAAKVRAAGGVADDQAVGDIGGALQYLLSLPYINGKVGVFGTCSGGRHAFLAACRLKGFAAAVDCWGGRVVMSKEELTPMQPVAPVDYTQDLSCPLLGLFGDEDRSPSPEQVNQLEAALQAHGKVYEFYRYPGAGHGFFYYDRPNYRQEQAVDGWKKIWTFLEKYLKV\n>tr|A0A699THK2|A0A699THK2_TANCI Retrotransposon protein, putative, Ty3-gypsy subclass (Fragment) OS=Tanacetum cinerariifolium OX=118510 GN=Tci_880515 PE=4 SV=1\nMRQRRWLELLKDYDTNIQYHLGKANVVADALSRKSGMIVGIKVEEEIIRDLERLDIELYVRGQHGYWASLRVEFRLDDDNVLWQNTRLVVPNDASLREAILTEAYSSLFSIHLGSTKMYHDLKLHFWWSGMKRDVATFVSRCLVCQLVKIEHQRASGLLQPLDIPVWKWDEISMDFVTG\n>tr|A0A328S3F9|A0A328S3F9_9EURY GTP cyclohydrolase MptA OS=Methanosphaera sp. 
SHI1033 OX=1945632 GN=mptA PE=3 SV=1\nMSVPEFPDTQDKQPSAPISLTRVGVTGVKKLLKIERSGNKRPIILLPTFDAFVDLPSTQKGVHMSRNPEAISEIVDEATNEPEIHIETICANLVKKLLEKHEYAVNAETEAKSEYIINKLSPVTKKKTQETTQIISRAVAHKNEDGTINVKKMIGAEVVGMTVCPCAQESVEKDSKEKLLEFLDEETTEKVLKTVTFASHNQRGIGTILLEVSENQEVNVDDLISIIQESMSSPVCEILKRPDENRIVTNAHQNPVFVEDCVRNMVIGLLNKYPNLPDNSMVTIRQVNQESIHQHNAFAEKVASFGELRQENIQE\n>tr|A0A433MDU9|A0A433MDU9_9BURK Phosphoadenosine phosphosulfate reductase OS=Variovorax guangxiensis OX=1775474 GN=EJP67_02995 PE=4 SV=1\nMSIDIERINAELGRNAQGLVDWALGLGQPAIVTTNFRPFEAVILHLVTQVKRDVPVVWMDNGYNTEATYRFADEVTKQLGLDLHIYLPRRSRAHREAVEGPTPALDDPRHAAFTEEVKLEPFARALRETAPKVWFTALRATDTAVRAQMDPVSINPDGLIKVAPLLHWSSKDLHEYCVKHGLPNNFDYVDPTKGEDNRECGLHLAH\n>tr|A0A147H9Y5|A0A147H9Y5_9PSED Ribosomal RNA small subunit methyltransferase H OS=Pseudomonas psychrotolerans OX=237610 GN=rsmH PE=3 SV=1\nMNPVFHHVSVLLDEAVQALEIQPAGRYLDGTFGRGGHSRAVLRLLGGEGRLLGFDKDPQAIAAGQALAAEDARFEIVQRSFAELGDELVSRGWSGQVDGVLLDLGVSSPQLDDPERGFSFMQDGPLDMRMDPSRGQSAAAWIATAAEADIAQVFKEFGEERFAKRMARAVVQRREVQPFERTADLAKVLTEANPAWEKGKHPATRAFQGLRIYINRELSDLEQGLQAAYEQLAVGGRLVVISFHSLEDRIVKQFMRRLAKGEADQLPRDLPIRATVFEPSLRLLGKPIYASEGELAANPRARSAVMRVAEKLK\n>tr|A0A2F0BA01|A0A2F0BA01_ESCRO Ubiquilin-2 (Fragment) OS=Eschrichtius robustus OX=9764 GN=ESR_40773 PE=4 SV=1\nMQQLIQRNPEISHLLNNPDIMRQTLEIARNPAMMQEMMRNQDLALSNLESIPGGYNALRRMYTDIQEPMLNAAQEQFGGNPFASVGSSSSSGEGTQPSRTENRDPLPNPWAPPPATQSSATTSTTTSSGSGSGTSSSSATGNTVAAANYVASIFSTPGMQSLLQQITENPQLIQNMLSAPYMRSMMQSLTQNPDLAAQMMLNSPVFTANPQLQEQMRPQLPAFLQQMQNPDTLSAMSNPRAMQALMQIQQGLQTLATEAPGLIPSFTPGVGVGVLGTAIGPVGPVTPIGPIGPIVPFTPIGPIGPIGPTGPAGPPGSTGSGAPPGPTVSSSAPSETTSPTSESGPNQQFIQQMVQALAGANPPQLPNPEVRFQQQLEQLNAMGFLNREANLQALIATGGDINAAIERLLGSQPS\n>tr|A0A7U8PMI8|A0A7U8PMI8_BRUAO tRNA (guanine-N(7)-)-methyltransferase OS=Brucella abortus bv. 3 str. 
Tulya OX=520451 GN=trmB PE=3 SV=1\nMIDENHPMRAAGNFFGRRHGKPLRPHQSNLFEDLLPRLKLDLATPAPQDLRSLFEAPVEAVRMEIGFGGGEHLHHESGRYPQSGFIGVEPFINGMAKMLAALDQAPRPNLRLYDEDATAVLDWLPDASLAGIDLFYPDPWHKRRHWKRRFVSDANLDRFARVLKPGAKFRFASDIEHYVNWTLQHCRRHAAFDWQAESPADWNDAYEGWPGTRYEAKAFHEGRRAAYLTFIRR\n>tr|A0A2S5CXJ6|A0A2S5CXJ6_LYSSH Single-stranded-DNA-specific exonuclease RecJ OS=Lysinibacillus sphaericus OX=1421 GN=recJ PE=3 SV=1\nMILSKKRWQVKRPDAQLVQTLQNDLQLSAIAAKILAARGCTTSADAESLLNMTEANIHDPFLMHGMAEAVARIQQALENNEKILVYGDYDADGVTSTTVMLHVLLDLGADVSFKIPNRFLHGYGPSEALFREAHEEGIQLIITVDNGISGIEPIRVAKELGLDVIVTDHHEPGEELPQADIILHPRVPEGHYPFGELAGVGVAFKLAHALYGELPTHLFEFVAIGTVADLVPLVDENRYLVKRGMEEMRRSLSPWIQAMCEVASAEQATINEETIGFYFGPRLNAVGRLGEASPAVELLMAEDTAKATALAKQLNGCNAERKDIVKSITDEAIAFIEADKKIGDSLVLVVAGEGWNAGVVGIVASRLVELYYRPTIVLSLDFEKGTAKGSARSIEGFHLYNELAKNRDILPHFGGHPMAAGMTLPLEHVDELRTRLDAQARACLTEEQLTPVLAIDIPLKIDEISADAIEEIATLGPFGTDFPKPVYVLEDVEIATMRKIGAAENHIKMELTDGLEKLDSVGFNKGHLYHELTYGIKVSFTGDLQINEWQGRKKPQFMIEDVQTTEWQLFDIRGIRQTSRWLHTVPKEEAVFFAFRLETISYYQSLLGVPIELVDVELSNVEQTDYIVLLDLPHNVQLLENVLSKTAPTRIYAHFYMPDSQYFNGIPTREQFAWYYKFLKQRPAFPLDMHLPDLAKHTGWPLEALKFMTQVFFELNFVKMESGLTTVNMNAPKTALTEAPSYKQRSEQIEIEQKLVYAPYIELKQWFDERLNLYANTVS\n>tr|A0A0C2NMI1|A0A0C2NMI1_9VIBR Serine--tRNA ligase OS=Vibrio renipiscarius OX=1461322 GN=serS PE=3 SV=1\nMLDSKLLRTELDDTAAKLARRGFKLDVETIRTLEEQRKSIQVEVENLQSTRNSISKQIGQKMAAGDKEGAEEIKKQIGTLGSDLEAKKAELDALMAQLDDITLSLPNIPSDEVPDGKDENDNVEISRWGEPKAYDFELKDHVDLGEMADGLDFASAVKITGARFIVMKGQFARLHRAIAQFMLDLHTEEHGYTEMYVPYLVNSESLFGTGQLPKFGKDLFHTEPLAEKVNDEEPRKLSLIPTAEVPVTNLMRDTISDEADLPLKMTAHTPCFRSEAGSYGRDTRGLIRMHQFDKVELVQITKPEDSMAALEELTGHAEKVLQLLELPYRKVVLCTGDMGFGSHKTYDLEVWVPAQETYREISSCSNMWDFQARRMQARFRRKGEKKPELVHTLNGSGLAVGRTMVAILENNQEADGRIRVPAVLQKYMNGAEYIG\n>tr|A0A0B4FII0|A0A0B4FII0_METAF Src-like protein (Fragment) OS=Metarhizium anisopliae (strain ARSEF 549) OX=1276135 GN=MAN_04425 PE=4 
SV=1\nMPAPTVEAPAVALSFANNFWGKEDAGVGPLLERMQSAKTTSDELKSFYSARASIEDEYARKLLHLSRKSLGSHEMGSLKTSLDTVRVEVESMAKQHQSIAAQMKSELEEPLAAFAGGMKERRKIVQSTVEKLLKTKIQQTQQVNKTRDKYEQECLKIKGYLAQGHMVMGQEERRNKAKLEKTQISLATANTEYESAVKILEETTTRWNREWKAAADKFQDLEEERLDFTKSSLWTFANVSSTVCVSDDASCEKIRLSLENMEVEKDIIHFITERGTGQEIPDPPKYINFCRGDVNDGQSEVSEDDNYSVAQFPRSINPAFRSSSPQPSTFESHHDPNSMLANNLAHREPREPPQPTSREAIVTPQKAPPPMRNSVDEQRRGQGQQKPPQYDVNQHGPLAAVPHDPYPMDGMTMLCRTGPPGPQSDRSSQPHSARPSSRESHSDYSIPTSLSSVEPPSGQASPVKQEPVETRSPEKRVLKKKSGFFQNHSPFRRKSTKEVQAPSQNRSTWHVAPGRAELERTASPEPIDANASLALGVGQNVLPVTTPDTRRRPGQGREQDVDQSDPIAMALAELKDVNLGKQSSLRMSADHYHGIATPGPGADPRSGRSSGREAPPSYNTQASVSRLGVPPPAVTSRAMKEATKKATDQSRAVFGNAGNRGASPASRPATRGSDMPRAASPAPTRSASPQPRMSGDSRYRSASPNPYSGHHRNASQASVSQQRGSGQGYYGSGSPHGSTRGSVRGASPASFRGDYDRPRSSYGGGSDMAVQLAPAGDDRYGSQRGRGAVDLYDGGSRPRSKSVADPSRQYTRDGRPILHFARALYMYQAAIPEELGFAKGDYLAVLRHQDDGWWEAEVHGGNGRVGLVPSNYLQPC\n>tr|A0A1H6SIL1|A0A1H6SIL1_9SPHN Uncharacterized protein OS=Sphingobium sp. AP50 OX=1884369 GN=SAMN05518849_101367 PE=4 SV=1\nMLRRRAQGWCPDTQRAFIDALSRCGVVAQAARSVGRSPRSAYHLRRRAGADSFAAAWDWALDMGLDESRARAIALIRGKRVRPIVRRGEVVGQRTDNDPRLMFAALNALGADQDGRRAAMPHRQRMALRHVITTLIDNGPFSPEEWARLVPALAAVAGASPRPDALS\n>tr|M6A221|M6A221_9LEPT ATP-sulfurylase small subunit OS=Leptospira sp. 
P2653 OX=1218600 GN=cysD PE=3 SV=1\nMNRSRLTHLEQLEAESIYILRETASQFERPALLFSGGKDSITLVHLALKAFRPGKFPFPLVHIDTGHNFQEALDFRDELASKIGEKLIVRYVQDSIDQGKAVEEKGKFPSRNGIQTVTLLDTIAEFKFDACIGGARRDEEKARAKERVFSVRDEFGQWDPKLQRPELWNIYNGKIGPGENVRVFPISNWTELDVWEYIRKENIALPSLYFSHKRQVIYRENLLFPVSKFITIDSNDRVEDKVVRFRTVGDMTCTAAVDSQADNIDDIILEIQTTRTTERGSRLDDKRSEAAMEDRKRGGYF\n>tr|A0A438U9M4|A0A438U9M4_HELPX 2-amino-4-hydroxy-6-hydroxymethyldihydropteridine pyrophosphokinase OS=Helicobacter pylori OX=210 GN=folK PE=3 SV=1\nMMREILISRFFPSLFKKRLDFSNRVVLGLGSNLKNPLKILKNCFLYFKNHSKIGKIFSSPIYINPPFGYTNQPNFYNATIILKTSLSLRHFFALVFYIERRFGRARKRDFKDAPRTLDIDIIAFNQVILRQNDLTLPHPKWNERDSVLVPLALQQILFKKGEW\n>tr|A0A4Y7J8A4|A0A4Y7J8A4_PAPSO Uncharacterized protein OS=Papaver somniferum OX=3469 GN=C5167_014818 PE=4 SV=1\nMSRGILVWFISSNLRFLDLDGGDCDNQLGAVEYVEEYFISSSKSQSLVRDYLGIHSLKSMRSGSLKLLGMSSMPIASEYEEIWAPEVEYLGIHSLRSMRSGAVALREVRLEKNSLFWKKCSSLTTLTKQATTQFRELRGAPPGSVNWEMQRQATARFCELSGGQMQLHTGLAFVFLLQIQLAELLKWNAGASWRCPAFGQRA\n>tr|A0A2T0RHF1|A0A2T0RHF1_9ACTN Transcriptional regulator OS=Pseudosporangium ferrugineum OX=439699 GN=CLV70_12320 PE=3 
SV=1\nMRVRLLGTVDVHAGDEFRQVPGLRRKAILSVLALNAGRTVSAGRLLELVWGDRAPATGLNTVQSHVSYLRRILGARSAIVSRSPGFLLDLPGDATDAATAERLIHAGLRAADPARAAEHLRAALGLWRGSPLQGVTELPWLAEQARRLSKLELEARRALAEARLALGEHAELVPELQALAAQHPFDEQIQAQLVLALYRTGRQSDALAVVREVRRLLATELGIDVGSALSELETAVLQHDVAPARERIEPAPVPPAGPELVGRGRELGALLRHLDHRRPSGAVVPVVSGDPGMGKTRLLTELAVRAGQSGRTVLWGRAAEFEQQVPFALVMDALADHLAGTDPRRLDAVAGTDRALLREILPMLPAPENRTAARQAVEAERYLLYRAFRCLLEALAAPPGLLLVLEDLHWADQGSAELLAYLLRHPPRGPVVVAVSYRPRQMRGPLRQALGRAIQDGSADLVDLDPLSPAEADTLLPAELAADRRQHLYALSGGNPLYLLALAREGAAGPGEDDRSLGEQDPVPAAVREALRGELDALSAAETVVARAAAVVGNLAEVPLIAATAGLPEAEVSRALDALVGHDLLRPVPRTGRFQFRHPLIRRIAYDMAGPGWRVAAHGRAAAALARQGASAPEQAHHIESSARRGDPAAIDILRRAAAEVLHSSPGTAAHWLGAALRLVTDDHPPEVAQQLLGLRAQSLATSGQLAESREVLHRLRQAIPAEVTPERARLASWCAGVERMLGRHREANALLRAELARVADADGPVAATLLLALGARYIQPVPPGEPDWPRRALAAARRAGTPWMVAEALLQCVYADQAAGTWDASTRERLDEAAALVDARPDGELLELLHMVVWLATAETVYERLDDATRHVDRALGLARAAGQMYVVPGIHLLFVGLHMARGDLPAASRSLDEAREAVALAGTDTMMSMVLSRECTLAALTGDGKLAHRAGTEAVALAGRRGDYAAGVAVQALATAHLQAGEPAMCSSLLDGTEELPSTPTTRGTLYETLALAWSAQDRPEVAATWADRAEREVAVCPTPRRAGLAELARAHALRPVSASASAARAAAAARLFAGVDDRLLGGQAHLHTATALAADGQPGRARRELDRARTLFLSCGATALVDRTDQEERRIRR\n>tr|A0A4R4X727|A0A4R4X727_9ACTN Cupin domain-containing protein OS=Nonomuraea diastatica OX=1848329 GN=E1294_00855 PE=4 SV=1\nMRRLAAISGATAGSTRLWMGQTHVAPATRSSDHHHGASETAIYVVSGTPAFVFLEDAEEVRIEAGPGDYIYVPPYVPHREENPDPSQEAVVVIARNTQEAIVVNLPGLAG\n>tr|A0A7W1Q9P6|A0A7W1Q9P6_9ACTN Response regulator transcription factor OS=Actinobacteria bacterium OX=1883427 GN=H0W90_11130 PE=4 SV=1\nMRVLIVEDELKMASLLRRGLVEEGHAADVAPTGEDAVWMAQSHPYEAIVLDVMLPGLSGFETCRQLRNVGVWSPVLMLTARDGVDDRVAGLDAGADDYLSKPFSFAELLARLRALVRRGGGERPTELQVGSLRLDPASRRAWRGQVEISLSPKEFALLEAFMRRPGQVLSRLQLLEHAWDFAYENRSNVIDVYVRYLREKVDRPFDTDSIETVRGVGYRLSEDSDA\n>tr|G3MBJ6|G3MBJ6_9CAUD Gp134 OS=Bacillus virus G OX=1084719 GN=134 PE=4 SV=1\nMKSSKRVDERIVKDYRIIDSAWDEFSDYVGEHNIGTPLTVKQFEEIFSKLNRNNKFSPMKDYILESFRNDCYAWPFVEKNQ\n>tr|A0A5B1MAL1|A0A5B1MAL1_9MYCO SDR family oxidoreductase OS=Mycolicibacter arupensis 
OX=342002 GN=E6Q54_00665 PE=4 SV=1\nMSVLDKFRMDGRVVVVTGASSGLGVYFAKAFAEAGADVVLAARRVEKLAQAADLVAAAGRVGLPVATDIADPDAATAMVEAAMERFGRVDVLINNAGIGTAHPATRETPEQFREVIDVNLNGAYWAAQACGRVMQAGSSIVNISSILGLTTAGLPQAAYAASKAGLIGLTRDLAQQWGGRKGIRVNAIAPGFFASEMTEQYRPGYLESVSGRIVLGKMGDPEDLAASVLWLASDAGGYVTGQTIAVDGGFTIN\n>tr|U4PPA8|U4PPA8_9HYPH Putative pyruvate, phosphate dikinase regulatory protein OS=Rhizobium pusense OX=648995 GN=BN877_I0001 PE=3 SV=1\nMENKKSFFHLHLISDSTGETLMSAGRAVSAQFHASMPVEHVYPMIRNQKQLAQVIDLIDKEPGIVLYTIVDQQLAEFLDLRCHAIGVPCVNVLEPIIGIFQTYLGAPSRRRVGAQHALNADYFARIEALNFAMDHDDGQMPETYDEADVVIIGISRTSKTPTSIYLANRGIKTANIPVVPNVPLPESLYAATRPLIVGLVATSDRISQVRENRELGATGGFDSRRYTDRATIMEELKYARALCARNNWPLIDVTRRSIEETAAAILALRPRTR\n>tr|A0A1G9FD20|A0A1G9FD20_9SPHI Peroxiredoxin (Alkyl hydroperoxide reductase subunit C) OS=Pedobacter sp. ok626 OX=1761882 GN=SAMN04487898_112159 PE=3 SV=1\nMAIVGKKFPSVSIDAMSEMGDDLKINIFEEAVSKEKKVILFWYPKDFTFVCPTELHAFQAALPDFEKRNTIVIGASCDTNEVHFAWLNTAKENGGIEGVTYPILADTHRHLANILGILDQDVEYDEEGNESFSGSNVTYRATYLIDETGKVFHESVNDMPVGRNVKEYLRLIDAYAHVQKHGEVCPANWEEGKEAMNANRTGVAEYLSAN\n>tr|A0A2T6ZBV9|A0A2T6ZBV9_TUBBO Interferon-related developmental regulator-domain-containing protein OS=Tuber borchii OX=42251 GN=B9Z19DRAFT_1104137 PE=3 SV=1\nMSELRRKALGSGKTVSRKAASRQSSAASSRANSRNTSRAGSRAASRANTDDEGSLSDETTFSLGSVDELATIDAELDETTTLWQEELGDRVNQIIERKKSSSAGREESLTAYIRILCAKYAKDEILPKKSELLDAFVRSFKQGKTEKEALLAAKALAITIVTDPEDTLFDKLAPDFKRTITDHASLPLKNALIHALGAVTFYGGASAAETELIMDFLKDIVESDGHDIGAGDDAGVVAAALEEWGNLATQLDDAEEITRRSMSFLVDQLDSSEVLVQVAAGENIALLYEKSYTEAEEDEVVEDHSESGLGKNFIQKYKPYPRHDVLIHTLRGLSSGSKKYLSKRNKKTQHSAFVDILHSVENPMKGPRYSEALDKDNRVRGSRMTVRIHKKGLLRVERWWKLHRLQHLRRILAGGFLNHWIENPVIFESLSLFVEEI\n>tr|A0A811ATS3|A0A811ATS3_9GAMM Alpha/beta hydrolase OS=Acinetobacter variabilis OX=70346 GN=RYU24_01130 PE=4 
SV=1\nMSHPLSSLEYQPDILGEGYEQATLEFPPDTEGTVVATLIRKKTDQPTSKAVLYIHGFIDYFFQTEMAERFNQQGFDFYALDLRKYGRSYMSHQKLYNVYHLSEYDAEISQALEIIGQEGHDTVLLSGHSTGGLITTLYAAHHPDRPLIKGLWLNSPFYDFNMTPFEKKFLVPKLSRLGKRFPEMLFPSRLNRHYVPSLHISYQGEWHFDLEWKKPSYHWVRLSFVHAIHEAQKEIHQGVRLNIPTLLMHAHKTTYPLRFNRNAQTSDVILQVHDMIEHAQKIQGDVQLCSIQNGVHDLVLSEKPVREQVYQQLFQWLENKAL\n>tr|A0A3N5TH00|A0A3N5TH00_9DELT TPM_phosphatase domain-containing protein (Fragment) OS=Desulfobacteraceae bacterium OX=2049433 GN=EHM30_15800 PE=4 SV=1\nSINKAESETSGEIAIMVLDSSDSYSEAETFGAFVLSGLFSLMLELIISYLIGSEPGWGHGGSGFPYGFLADAAKSASIWTYIPMVFVFYFAFKFLLSKAPEIKILFMSGRRIEETVRERAVMAFYEKGLYKTRDETGILIFISLLEHKVWILGDRGINAKIAPDFWEKIAAELSAGIGKKEYGKAACQAITKCGEELSRYFPIKKDDTNELTNEVIL\n>tr|A0A6H3NV40|A0A6H3NV40_9LEPT ParA family protein OS=Leptospira bandrabouensis OX=2484903 GN=EHR08_11550 PE=4 SV=1\nMKIITVASLKGGIGKTTTALYLSQALRSLGKKILLIDLDQNNNLSNFMIKQFPKGNDLDEKNILNMLKGYAEISEFIWESSDGIDLIPAKKDIKNIDIEFATDPILGLRFRNDLKSLNYDFILIDAHPATNTGLRCAILASDEIICPVEPSVWSSQGIDDIEIERQNASKAMKNEIKLRALISKCTLKKAEELKPILKKKGYQVFQTAIVNSEAIKVSNDISEFLNEKTGKAFPMFLSLAKEILK\n>tr|A0A2T6K4E5|A0A2T6K4E5_9RHOB NADPH:quinone reductase-like Zn-dependent oxidoreductase OS=Yoonia sediminilitoris OX=1286148 GN=C8N45_1303 PE=4 SV=1\nMKALVYQKFGPPENLVISDLARPEACSHEVLVRVAYAGVNSVDWKIGAGRIDHYRNAPFPLVTGRDFSGTVVEVGSHVRNFSVGDAVIGCLPGPGGSFAEYVATDALSLARAPSNLTLAEAASIPLVGLTCWQALVGSAKLSKGEVLYVLSGAGGTGSIAVQLGAALGAKVITTCSERNRDYVTGLGANYIFDYSKPNFTDDLIAEFPQGVDVVFSNVLGPLHRDAYRTLRPGGILVTIGESPLPAVAEKHGVDEIDLIVQPNGKQLTEIVTYLENGTIKPPSVSIHALVHGAHAMQNISEGHVRGKIVLQVS\n>tr|A0A6G0Z856|A0A6G0Z856_APHCR Dopamine beta-hydroxylase (Fragment) OS=Aphis craccivora OX=307492 GN=FWK35_00015581 PE=3 
SV=1\nMKKRSASQRSFGHRWTTVVAAVVVFLSATCLVGHAGAEGRRVYTAPLDDTGRTAVYWTVDYGSRTVKFEAHFSGSGSPFDWFAVGFSDRGNHSGADFCVMWVDWKGVTGMLDTWTNDAGRISVDERQDCEEFNVARFHGGGTALTFTRKFDTCDDERDYLIQDGTTHIVWMVGGGPLFAVEGLLVSQARAKGMQRVQLLKPETPQVKLPNKVSKIDVLASKVNIPAEETTYWCHVMKIPLDLSFKHQIVRFESVIEESSRGVVHHMEVFHCEANANSRIPLYSGPCFSEKRPYKTQVCKKVMAAWAMGAAPFVYPEEAGLPIGGPDFNNYIMLEVHYNNPGLRKGMVDSSGIRLYVTPNVRKYDAGVIELGLEYTDKMAIPPKLEDFTLSGYCIAECTAV\n>tr|A0A7R9IK79|A0A7R9IK79_9NEOP Hypothetical protein OS=Timema tahoe OX=61484 GN=TTEB3V08_LOCUS7834 PE=4 SV=1\nMCQGLYRLLYVSWEGVTPRSRRTTRVTESLRVTEVSRRMEEPDSYYTSNYHLLEAGRILQPEGDDYKLVFISSDSSSKEEEGSYSDDADSSSTTSSVTGVPGFTLDDCDWDYFESSSMVRPVLKDWSWSNNKVSPLGADASVDQQQHSFGFDSPQLSSRRLIYSRPSRGDVDPMLETEEKKTPPARGVRSELSSSPLFLDSPLSSETGSSFLHRRRSPMNMSGGSYIEAPVSPSRYRRPLFQLSRGDSARSSGERSVEEITSSDHYYYGCPPPQQWKVRVGGEMEGKVEKCPPGGIVTEQRTSHSATTAERVRSPSCETCGGPSALFPPGVYGVPVPVPIPVPVPIPVLIPASLWSVGGQHATTTGDTVSVADIVYVGSSGAGDEPTNAGSVRIRIHSFQRPSHGLAGPWCAWPVDNSGVLISPMITDNSAALRGEAEKVPVGRVPDSDRELSDGVHSRGPQSEHLAGDGVHVHTLKTTSSNSHEGETITNSVNFDIMINSPFVELKESEVSCKVLLSVDKDRSDDSATAHECDKDVGDNKIKTNSSVLEQTEPEIEEMSAGKTLPTEPELNTSQSEICASYLTKVTYCEDILDSNMKTEPSDAVSEKSDDEHNSGIVLVNFKPIPSESYSDSLTERHRFIITPEPMSTSATGSDTDNDHPNRRKGYTADKNLLKTKKRRLRKCLHSNDDSKFLPRERMSSNCSSDSGSSADETCVKTPVKRKYYLAGGDMSESGDDAASDVSSDDSTAGHTTDNEEGHFSRVFVINSTQSTSEEENDDSDTGENKTIEECTVLMSESVDRSCDESNEVGVVVQLKHIMALSDEEDMSSHHSEVPKAISTSDTGIVVLKHVRDIPEEHSFASQVPWRSDETVQVLKTNNGVSRSEGKEETPERSTNCLNNICLPTAAGELNNSVNIDGEPEDKCFVHHNEVISKLVSDLKNEVDKMKCEFVARASSVSTGPDKRSITPEESGMVARLQEHLSSEHAGARLVLPPSGNSENLTPPPVDGWPSPPPDTATSLGEVESNQDPSSNVTERETSGIAASASEVDNILARSAVVINTSIKSDLSTFHEGSGDREVIKSEIGENCLSLQDICGGPCSRTNPNSSRDSGDSSPTSPAPTDNTDQTKSPVLHLENTPVENEEVTSETPGALVELYLIDEESPIAITKDTLGDQSAAITSGSSPADLIDEESPVAITKDTSGDQSAVITSESSPADVDTPNISVNTDDLNIPQIEKNIFSDITPVSQKSKEHNLEISSDQTVETLSNSSIRYICKESETGKSSKTIQNELPGSDHAAPSIELVGSESKSGPTDCETSITCDELSGTESFNDYKLKGSFKESSDIEDDRDIEHNLTTEEISCPQVVDSEETGVKFEGNISCNNDDVALDCSSVYSKSGSRDHSQSLEEVQTNTLEDKKGPSPVESFRSGGDTVTAAAESASVGRETTGEREVGCQGVLSVASEPLTVKQRRGDVCPEAGAAA
VGSHLSRYTSLVMITQDNNSFLKSQETSPSVVSVVTSETTTVVPEERNGDIIVSHTNWEEDDDAIHEKVSGLAGYFTLTLETAGSTPSMKRPLVTKNKHFMNEYSPPLPAQESGEGESEDLVKVVTGGDTLSAVVCLEEGLADDDSWVEEMDDRNHEDEDFATTTPTEDSSSGDEACSSASYGDREAELRGYHRAALDFTLHTIVEESCEESDDGPAKRKKPRPTSASELEKYFFYELGGGSSGSPGSRNLNSFSDSCSSIYSESLESLRGDDVTGNGEDKRDPAEMASSRLEKYFLKEFMGFAGDNYRDSDGSGSVGSDSEGRPSPEQRRKRLVRARGTGRQHSSSLDNLVASEHSGSEQQTTDTLVESEGSSTETDTHDELGGSMTFEKPDGQFDTVKRKKKKRSVAGSSSPAISDLERRPTPTEFLEKTLTSSNVEDVPQAGGEEDMSSDEDGSKTPQPEFLLPADLSATRNKQQSRDSGFIGSCDDLLREQRSQSDSSSCSNSAEVAQKTKTGSDGSGSGSDHDPPSGERPVTDHAKSESKATQSNKNNRKPSISDDDKSQSCTLSMTSTSVPPTTALTRKDSFNNWSSDEETNLMMSKMRAFFKTMVIAANNTNGPQKTPQTSPSLRPRGMKPPQLVYFENELTRLMKTVPGIRDDQVKEIVEYLSSEDTWSDSYDSSDYTSSDLEGAAAYYQHAMNRSELQEEISASCQQIINKFDTSVEEDNEEDKNGKVSDKSVDNEPSGIRRDTAFVYQKLVASFNKMGSGEQSASSDTNSSPHSSPPLIDKVMHHIGSRLVALMHEVSGGEGAGEMTTSSPKVRYHHHRRLQHKMSVTSTTTEEEDDSHTDTESDSNARSGNELGHDLVGSSTYNPLLARSKSHDLLLEKESRNYSHYHPQHKESSSSGVSDIAEEREASDYERFSWRGSFESALMTSDSRTKLSLLSCGDGSTSSSALALAAKRRSAGDLLFASSSKSSSREQLDRVRSCGSIGGNNAGSVEDKIWGTCNRRNSIPDASAGSGASADGDDDDDDDDDDDDHDDDLRSGRSTTLPRSLQTSCSAGTNSLPRLPTTGPMSSSVPNTPNIHKAHSMHLFLQSQANVKSARYRPPGFNRPAAPKRAVSAPGMQPPHPRRDAARRRPQATSQVLETVKFYSSSKWLPIHDCEALLVYSLGYIPLSTDT\n>tr|A0A6J2QCM0|A0A6J2QCM0_COTGO AP2-associated protein kinase 1 isoform X2 OS=Cottoperca gobio OX=56716 GN=aak1 PE=4 
SV=1\nMKKFFDSRRELVSSGPGSGVGGGGAGSGGGGTFIGRVFTIGRYQVTVEEIVAEGGFAIVFLVRTHQAVRCALKRMYVNNEHDLQVCQLEIQIMRDLVGNKNIVGFLDSSITAVGAGDVWEVLILMDFCRGGQVVNLMNQRLQTGFTEAEVLQIFCDTCEAVARLHQCNTPIVHRDLKVENILLHDRGHYVLCDFGSATNRFQNPQTEGVPVVDEEIKKYTTLSYRAPEMVNLYGGMIITTKADIWAMGCLLYKLCYFTLPFGESQVAICDGNFTIPDNSRYSQDMHCLIRYMLEPDPDTRPDVYQISYIAFKLARRECPVPNVHNSPIPAKLPEPVRASDAVAKKSQSKARLTDPTPTMETSIAPRQRPKAGQAQPQPISGILPIQPALTPRKRPNVAAGGPQAIGVGINVPTPAAAAVQAAAPQPAQTANMLSQPTPQHQQLLMKQQQATPFLSPQSNQQRQLIQTLQQQQQTSSQAFTLLQSKDKPVPPVIALQLHHRQHLAPVHETAASHLTPIPESAVAGPAADPEMAGRVIHKVGSLTPPSSPKMAPKSGHRRILSDVTHSAVFGVPVSKSTLLLQAAAAEASLNKSKSASTTPSGSPCSSQQSVYHPGDGDAQLALTAPNIQPSWNPFGDDNFSKLTAEELLNKDFAKLAETAAPGEKVTGSSENLIPGINAFPEKLIEGLKSPETSLLLPDLLTLVNPFNSSAENSANVKSEVCVDSLIPGLEAPQAQRHSGQPELNPASMPDSLTGEDSLLGCDLLSLTSPHGNQSGSALPSSSSCSSAPPGCGSGSCLEELPPGQTASDSAFLMSCGEKGNGDEFDPIPVLISKNSNQDVQGESNGYSVLDEGRETELQEGDSQANESCVHSSDEEDDDDDDYEEEEEEEAHKEEQQDEGAIESHAAAHDCSGSRPLLLDSEDEEEPGPQLALHSSPHSSTVPTQPSTTFHQPTPSTFAQNHSQHVHEPAQGADAAAADVFLKAPFPIVQEESADVFANAPFPRAHTAAPQPFDVFSQAPFGKRKEATVAHPSYAVTPDQGVLGQVVQQPFRPQALAKYSRHFEGPVPQQPVAAHRVVSNVSRQAAVASVPVGPLHLWTSEVSAVDPFVSAPFHLKATQEKP\n>tr|N2A2M6|N2A2M6_9LACO ATP-binding cassette, subfamily B, bacterial OS=Lactobacillus sp. ASF360 OX=97137 GN=C821_00970 PE=4 SV=1\nMDIFKKLGWFFKEEKKRYIIGVLFLALTSLANLVPPRVLGLMADELDKGHITWGQYGALILAIVAAAIVLYVLRYFWRKQIWGGAAELERKMRTRLFNHFMIMDKTFYQRHRTGDLMAHATNDVTAIQNVAGDGVLTLVDSLIMGLSTMIAMIVFVDFRLTIVALLPLPFLAWGAWKLGDHLHVAFDKSQAAFSRLNNKTQESVSGIKVLKTFGQGKEDTAAFEKMVDETIKINKHVFVWDSLFDPLGTLIIGLTYAITIIYGGFLVKQNILSVGQLVSFIAYIGNMVWPMFAIGYLFNILERGSASYDRVEKLLNEKSLITDENADETLTAKDIEGDLDYNIKSFAYPDEKDISVLKNIDFTLKPGQTLGLVGRVGSGKTTIIQLLLREFDNYEGKITLNGHDIREIPLNVLLRQISYVPQNNYLFSTSIQNNISFSQIDADNNQVVEAAKKSDLHNDVLQMPCAYQTLVGENGISLSGGQKQRMSIARALLKHSQILILDDALSAVDAKTENEILKSLKKERKGKTTLIATHRLTAVKNADLILVLKNGRIIERGSHDDLLQENGWYADMWRRQELEEKVGDENE\n>tr|A0A1J5KGW7|A0A1J5KGW7_9PROT Peptidase_M14 domain-containing protein OS=Bacteriovorax sp. 
MedPE-SWde OX=1860085 GN=BM556_01360 PE=4 SV=1\nMNLLKNEFEFIEELVKRSPDIVDHEVLDSVKFKNKSYDIHSFSIGPKDPEVPVLALFGGVHGLEQIGSHVVIAYLNYVIERLHWDKNFAALFEKVRLVSIPIVNPVGFKNFRRSNGNGVDLMRNSPISSKEKVFPILGGQLISSKIPWYRGDTNQMEKESQLMCDFVKDNVINSKNAISIDFHSGFGFKDRLWYPYACSKKKFDGIDNLKRIESLLDRTLPHHIYKVEPQSDHYTTHGDLWDYLYFHKKEHHPTMNYLPLTLEMGSWIWLKKNPLQLFSKLGLFNPIKDHRFNRAMRRHFLMIDFFLKAAANPDEWTA\n>tr|A0A6H1WSD3|A0A6H1WSD3_9BACT Ribonuclease 3 OS=Thermosulfurimonas marina OX=2047767 GN=rnc PE=3 SV=1\nMKELYPRLPELERRLGVRFRDPGLLVQALIHRSYAAEKKLPPGADNERLEFLGDAVLSAVITHLLFERFPEASEGELSRMRAWLVREERLARIAERLGLFEFVLVSRGEARSGGPKKASILAGALEAVIGAIYLDGGYGKVFECLRRLFARLLPQARRGMEADYRSRLQELTQALFRETPTYEVVSEKGPSHAPIFEVEVRVGERVLGRGKGRSKKEAAQEAARKALDILEKEK\n>tr|A0A371WXQ8|A0A371WXQ8_9HYPH Transposase (Fragment) OS=Fulvimarina endophytica OX=2293836 GN=DYI37_19485 PE=4 SV=1\nMARGDLTDEEWAVIGELLPSERGRKSRPAYDNRRFLNGMLFVLRAGCPWRDMDERYEKWNSVYVRFRRWAEQGVWDALLETLVETGLTDDWQ\n>tr|A0A7X8YS75|A0A7X8YS75_9BACT Uncharacterized protein OS=Acidobacteria bacterium OX=1978231 GN=GXY47_00410 PE=4 SV=1\nMARTMILLALIAAFCTTAAANTDATCDRACLEQWVDRYLAAMRDRDTSPEMFAPGLKFTEDGVRLPFGNEGLWHSMSGVGKYRFYVPDVEAQQVAFLGTVREKAPRSREESLSALALRLKIRNDRITEIEQIVIRPDSVNSSAGDFPPTGPAVEAMGAPHPVFAESIPEAERMSRKDLIETANHYFTGLENNDGKGYYPFTDDCVRFENGVDVLLNTNKETGEQTRTTCKQQFEEGVKGIVTRIRDRRFVAVDREKGIVFSFAFFDHDFIHWTWQLAELFKIENGQIRRIEAIFHRAPYGMNSGWSSFEKGISNEIQAP\n>tr|A0A1L3I1X5|A0A1L3I1X5_9RHOB Glutathione hydrolase proenzyme OS=Phaeobacter porticola OX=1844006 GN=ggt PE=3 
SV=1\nMKHLFWAGILLAATPAWAQEAADAVAPEGAAETADAGFAAISEEVAAAIEAKEEGTPVEADNWMVAAANPHAVSAGAEVLRAGGTAADAMVAVQTVLGLVEPQSSGLGGGAFLVWYDAATGEVTTLDGRETAPLAATPTLFQDDSGEPLKFYDAVVGGRSIGTPGTPALLEAAHRRWGRAAWPGLFTAAIDLAEDGFAVSPRLAGLIEKDADRLSRWSDTADYFLPGGTPLAVGSTLKNPAYADTLRRLAAEGARGFYSGPVAEAITSAVRGAEGNPGVLSAMDLALYQVKERPAVCVAYRAFEACGMGPPSSGALTVGQILGMLGNYDLAELGADNPDAWRLIGDASRLAFADRGRYMADSDFVPMPTQGLVAQDYLATRATLLSGDDALPAVNAGAPEFDHALLLADDESIELPSTSHISVVDQYGNVLSMTTTIENGFGSRLMAAGFLLNNELTDFSFRSHREGVPIANRLEPGKRPRSSMAPTIVLKDGEPVLAVGSPGGSRIIGYVAKTIIAWADWGMDVQQAVALPHAVNRFGTYDVEAGTSAEDMTQPLTDMGFEVNARDLTSGLHLIEIGDGLKGGADPRREGIALGE\n>tr|A0A5B7FTI9|A0A5B7FTI9_PORTR Uncharacterized protein OS=Portunus trituberculatus OX=210409 GN=E2C01_042056 PE=4 SV=1\nMGWYEARSVGSLQELGMGMRMENFQQVAADIAELEEGGLERGWEVGEELVWDMVGTQ\n>tr|A0Y2I9|A0Y2I9_9GAMM Uncharacterized protein OS=Alteromonadales bacterium TW-7 OX=156578 GN=ATW7_12101 PE=4 SV=1\nMHVYTFAFKNIVDLYLSIGFNQVLTYTADLHVLFDMYKHRNIVALEYP\n>tr|W7X7N4|W7X7N4_TETTS Uncharacterized protein OS=Tetrahymena thermophila (strain SB210) OX=312017 GN=TTHERM_000096738 PE=4 SV=1\nMVMSNKINNVQDALLKIATFVINSNVVSNAKVDISYLTIHRFVLKIVELDIIYQIIMNVWRVIKLVSLAKVQQTQIAQLAKVIYISHLPAQNVHNAKTNNIQTIKIIVKVVSPFVRLVTAHQANNVQAVKISQLQAIYHLNVLLQINNIQNHYNIIFKMALSVLKYQVKI\n>tr|A0A5S3TR38|A0A5S3TR38_9GAMM tRNA-uridine aminocarboxypropyltransferase OS=Pseudoalteromonas sp. 
S4498 OX=579562 GN=CWC29_08935 PE=4 SV=1\nMKRNTCPVCRFPTNTCVCSYIGNTISNTTQVIIIQHPSEVKVAKNTAKLLALQLDRFTLYVGENTADFEELINFCRLNHVAVLYPNSHAKTLTTEYNFDQTLDAIILLDGTWKKATKLYNLNPWLSQLPSFQFDSVNASEYTIRKSKHEYSLSTLEAAAQFLEIVDQCETADLYKLQAGMVKEQMKLMPDDVKARY\n>tr|A0A859QKW3|A0A859QKW3_9HYPH DHA2 family efflux MFS transporter permease subunit OS=Ensifer mexicanus OX=375549 GN=FKV68_04155 PE=4 SV=1\nMNRIVPLILAIALFMEQMDSTVISTSLPAIAHDIGVGPITLKLALTSYMVALAIFIPLSGWMADRFGAKRIFRTAILVFIVGSVLCAISNSLIAFVLSRFLQGMGGAMMTPVARLVLVRGAPRSELVSAMALLTIPALVGPLAGPPLGGFITTYFSWHWIFLINVPVGIAGYVLSGIYLPAMERRNPPPVDILGFLLGGIAASGIVFGLSVISLPALPTSVGFASVSAGIAATLLYIVHARRHPAPVLDLKLFRNSAFRAATIGGTIFRISVGAIPFLMPLMLQIGFGLNPFESGLITFVGAIGAITTKFLARRVLAFAGFRTTLIVAAVVGGLLTFANGFFTPATPYLVMISILLLAGFARSFFFTSINALSFADIDDADASKATSMSAVLQQISLALGVAVAGAILEVQTSISGGPLGLEDFHIAFMIIAGANLLGAIPFLTMAKNAGASVSGHRLQMREAETTAGK\n>tr|A0A1H3LQ38|A0A1H3LQ38_9ACTN RNA polymerase sigma-70 factor, ECF subfamily OS=Asanoa ishikariensis OX=137265 GN=SAMN05421684_0874 PE=3 SV=1\nMVSLRDGGDLDVVPGLGPPGQTSFEEFYAAHFQSLTIQLYAYTRDLPGAQDVVQEAFCRALSRWKHVVDYDDPAAWVRRVAWNLATSRWRRTRTAAQFLRQQRPEHVAEPSPDRVALARALAALKPDHRKALILHYLADLPIAEIARQEGISENTVKSWLHRGRAALATQLSEEEADSA\n>tr|A0A0M1JIZ9|A0A0M1JIZ9_9GAMM Uncharacterized protein OS=Achromatium sp. 
WMS3 OX=1604836 GN=TI05_02375 PE=4 SV=1\nMTETTTPQIISIGPENTINEVVVFTSHAQIKRQITTPVQLGTNRFLIELHAFEVDADSLQAAVYGTGEIISVQYKEISVTEAETKQLDLNELKAQQHQLEDQRRTLKYTLEDCKKQRAFVDSALKQVETRDVLGKINIKELFENLQYMLEIVDTTYAKLSQQELDIFKKTQAIEEQLNLVQQQLATRPDVPSTHKIVEVLFNSKTSEKIKMEISYIVNYAIWKPFYKVDVTQDLTNLTIMMFAHIEQNTGEDWQQVKLSVSNAMPIQSTRLPELKSWHIQQPDIFECSTDPWDSNTQQAPLNGVQLDGSSNMEELTTSNLSDFPGSEVHTDDFASEADPLEEADLYIAYGRYEHAETVLLEYIKNHPNSNDAKNKLRALYLVTRNTQKLRELARNHPGKTYLQEILQHIENDDTAFPSSAPAATFIQAQDLQSSLAFEFQLPTLIDIPANGNETLLPLFTKIPKYGFFYYTIPKQDPLVYLVCQADLSNEWLPGRMNIHIGGRFVGNTILDEKQAGQELLINLGSVQDVKIKREKYLDEVSKRMFKGMLDRSNALRKVEIRIVIENLKEQEIQIKILDAIPVSSTDTIQIKDVTMTPEPTLKDWQSQQGVMQWDLNIAAKSVIEIRMQFIVKYPRNCQIAHLNID\n>tr|A0A7K5B0S4|A0A7K5B0S4_9FURN IL8 protein (Fragment) OS=Furnarius figulus OX=463165 GN=Cxcl8_1 PE=3 SV=1\nAILEGNGNLSCRCAKTTSAYISPKKYESIEIRPVGSTCRRMEIIIKLKAAGKVCVNPEAPWVTKLLKRIAST\n>tr|A0A842V0K5|A0A842V0K5_9ARCH Uncharacterized protein OS=archaeon OX=1906665 GN=GF352_04095 PE=4 SV=1\nMVKKTELMKEFEEETDQHAVWGGKVTKAFKEWKKERRLKKLVICPWCGKRVKNYTTHQCSRRRRWKG\n>tr|A0A1I8IUJ6|A0A1I8IUJ6_9PLAT TGF_BETA_2 domain-containing protein OS=Macrostomum lignano OX=282301 PE=3 SV=1\nTACLPAHSEPPSLQSTPTPPGSRSSIKTRPVGGRGEDPLLSRLFHWCGGSFCLSDQTCLEFERSRCLCLAAAICLCGCLLCADSAPAPTTFATPEPLVSSSTEEDAVSFLHKEFYSNAGTTKDGRVISDIIREELRRINLKYEGLSNMTVSTWRKFLRDAYMGVYLKQQSMSDRVTNLLYENLGISKGDVLLDVSEKEDLLTRIPDAILTRVYKWNARPMTRKFEESIFIGTPKTIQDLAGREHHGWSFIIDRSISEQRITKLSMSVHLTPKSRPLVKAMRISVYQLSNASDTLLSPGATRTKNVILSAAAMDEISVDFSADVKPIITKFFSPQSGDQIELFFLIECPQCKTKSDLNVAYLVMDCKVRIRETTGPEDQQNDRQKREASREPWPFEVAAASLFNNVTSSKDITKTQKCILEKMRMRHGQVSCCMMDFTYDLIHQSAVLAPRQLQINYCTGECHGQSEVNNAHSSLLQIFSHSQTSQLSHATREEISLCCVANTYRDFQVLTVVRKPGGGSNVQLKTIKDLSAETCTCA\n>tr|A0A0C4EGC0|A0A0C4EGC0_MAGP6 Uncharacterized protein OS=Magnaporthiopsis poae (strain ATCC 64411 / 73-15) OX=644358 GN=MAPG_11851 PE=4 
SV=1\nMEDLGSGHESLGAASLVARLKALGGSVMAEKKARVRDNWAMRHDCLCFQVLTACAHMPCLPSASRCSPRRARQIREAVYDRVSPRHGHIRHGPVCAIQPRVEALDVHLQTPTGQRAVIARHVVQTTSVGFQQLYKPSLAGEHDYKGGGIHSPEYGGGGGELGQDGAGFEVVMTARSPRYMETLQNVTHPTTLGLYDIGVKEANGLAGLAAAGFPVVDGAPVASVATVAFA\n>tr|A0A178C6C2|A0A178C6C2_9EURO Clr5 domain-containing protein OS=Fonsecaea multimorphosa OX=979981 GN=AYO22_04817 PE=4 SV=1\nMASADGSPVDRKSKISKRSSNSYTSEEWRRHRPLITQLYFEEGRTLKDVAEYLKREYDFAPTERMYKSRLHTWGLDKKKKEHEMLDLVRQGLQQKGDDKDKVFLVRGRQVTLADALHYFNRKGIKDPSSLLEPQRSVSGDISSPEDADVKTPLSSNDDMLNATQDASDLEMTRSPMEMSEPEKPTLALRLRTSDVAAERLAMLQQALNIPELPPMPPFRTLSVESSVAQVTASAEDQRYQDVIFQNMQNHYMNLFTTRNLSIRNTTGTWTATSDDALADRFYYSMYHGYSFLWNGQRDRAFDNFYKAFALIEGLLKDDHVGFMIYIFDLIIRHDGTGYEEPLLMLLQHLADMAKTVFESEDHPIYVIAMHMHDATASRAWLAESTLRRLLDFFQDSIGYFHPETIALLQTFASGLLNREHFAEAAVRFQQLVDAFETTVNKRCYEVCYALRSTSEAFFHMEDYMRALQAIKASLERSQTLPRTEEREIYVRCLRGLAEISNKLGRKDEANETMQYVVDICRDAFGPEHPFTNRARMHLKTILKGDASSVSAIPPVVYRLGRGGSAAKYIWISRSSPTRLQA\n>tr|I2NKN2|I2NKN2_NEISI Proton-translocating NADH-quinone oxidoreductase, chain L OS=Neisseria sicca VK64 OX=1095748 GN=HMPREF1051_1935 PE=3 SV=1\nMNDMTLYLIIALVPLAGSLIAGLFGNKIGRAGAHTVTILGVAVSAVLSAYVLWGFIDGSRAKFDENVYTWLTMGGLDFSVGFLVDTMTAMMMVVVTGVSLMVHIYTIGYMHDEKVGYQRFFSYISLFTFSMLMLIMSNNFVQLFFGWEAVGLVSYLLIGFYFKRPSAIFANLKAFLINRVGDFGFLLGIGLVLAYFGGSLRYQDVFAYLPNVQNATIQLFPGVEWSLITVTCLLLFVGAMGKSAQFPLHVWLPDSMEGPTPISALIHAATMVTAGLFMVSRMSPIYEMSSTALSVIMVIGAITALFMGFLGVIQNDIKRVVAYSTLSQLGYMTVALGASAYSVAMFHVMTHAFFKALLFLAAGSAIIGMHHDQDMRHMGNLKKYMPITWLTMLIGNLSLIGTPFFSGFYSKDSIIEAAKYSTLPGSGFAYFAVLASVFVTAFYAFRQYFMVFHGEEKWRSLPEHHSDDHGEEHHGLGKNDNPHESPLVVTLPLILLAIPSVIIGYIAIEPMLYGDFFKDVIFVNADAHPTMHIMKEEFHGALAMVSHSLHSPVLYLAIAGVLSAWLLYVKLPHLPAKIAQTFRPVYVLFENKYYLDALYFNVFAKGTRALGNFFWKVGDTAIIDNGIVNGSAKLVGAIAAQIRKVQTGFIYTYAAAMVFGVLVLLGMTFWGLFR\n>tr|A0A233RNA1|A0A233RNA1_9ACTN Uncharacterized protein OS=Streptomyces sp. 
2R OX=1883452 GN=BEH93_02570 PE=4 SV=1\nMKPRARALAVLSVVAMSIGGVTATATPAAAVGGCPSGKLCLYEGTNYNRLAVTSTSTQACVYLRNFGSGFGTGIASYVNNLPVNAVVYNYRGSTDTFAVAGTIRPGGFSSNSLGANFGVSGAVCMGGVSPS\n>tr|A0A1I9YL31|A0A1I9YL31_9BURK Polysaccharide deacetylase OS=Paraburkholderia sprentiae WSM5005 OX=754502 GN=BJG93_10115 PE=4 SV=1\nMKRCKALVKEMLAGFVVVSGLAWFTRKLLWRDRVAVLLYHDPDPDTLDRHLTYLRKLCEFVPLTDVSAPGRDRPRVAITLDDGHAGNAKLLPVFIKHNVRPTIFLCSRIVGRPRSHWWLHPGSLRIGHERLKRMTNDERLAALAAQGYQQDGDDRPTGLSIEQIQAMREHIDFQAHTRFHPILTHCSDAESAAEISDSRREIAALLQQPCEHFAYPNGNYGDREVEFVRAAGFKTARTCDIGWNDQHTDPYRLRTIIIDDAASTLRFAAQLSGIAVFLRYLREGGGWRGKFPQF\n>tr|A0A8A5HS67|A0A8A5HS67_ECOLX Uncharacterized protein OS=Escherichia coli O89m:H9 OX=2810406 GN=JSU13_20360 PE=4 SV=1\nMSGTIRALCHRAHQSSTTRDVALDRHVPGCEDILKEVIWAFSDFVRDHRGVYDPEARYPAGNPWYPVTGQF\n>tr|A0A0M1MZY3|A0A0M1MZY3_9MOLU 50S ribosomal protein L17 OS=Candidatus Phytoplasma pruni OX=479893 GN=rplQ PE=3 SV=1\nMGYSKLRRTTPQRKSLLRSLVSSLIVNEQIVTTFSKAKELRRVVEKSITLSKKNTLHARRQASLLMFDKKIDEDKTVLQKLFNELSSKYQDRPGGYTRIIKTESRKGDAAPMAIIQLV\n>tr|A0A1G7QPU8|A0A1G7QPU8_9EURY C2H2-type domain-containing protein OS=Halorientalis regularis OX=660518 GN=SAMN05216218_11345 PE=4 SV=1\nMWGYDTGNLMPECNYCDASFEQEGAYLEHLHTEHDESELSRIDRRRVADHVGDDEEGEFPTGPAIIGGTLLLTVGILVYVVFFLNIGGGSGPAAASGSVGDVEQTPYGLQTVHQHGTIDVIIDGNTLDFSQQQYQLQADAFHFESGNGVRWHKHAQGVTLEYAMSTLSIGVTDSSVTFQGTTYNESDPDTNVTVAVDGNDVDPSSYVLQDDDRIRIVANSS\n>tr|A0A4R2BCF3|A0A4R2BCF3_9BACI Histidinol-phosphatase OS=Mesobacillus foraminis OX=279826 GN=EV146_107111 PE=3 SV=1\nMVKDGHVHTHFCPHGTNDPFESYIEKALSLGYTEISFTEHAPLPLSFTDPTPLRDSAMDHSDLEEYFAEVNALKKKYGDKIKINAGLEVDYIEGYEKETAKLLDKIGPKLDDSILSVHFLKDPFGYSCIDYSPDHFRYMISAYGSIEQIHVNYYRTLIHSILADLGPYKPKRIGHITLVNKFQLKFPAPRTFSEEITQVLKAMKEYGYELDYNGAGTSKPLCREPYPPAEVIDQAVSLGIPLVYGSDAHRAKELGQGLDLMSKKLENRQ\n>tr|A0A5E4KIF3|A0A5E4KIF3_9ARCH Uncharacterized protein OS=uncultured archaeon OX=115547 GN=LFW28011_00478 PE=4 
SV=1\nMADFEGLELNFTMANLPEYPPDFLPGISFGPLSRYFSGSDQKPPGGAEIEGNYLCNPFCSSCFLVNLHPANRVYAILFLHLKL\n>tr|A0A210RZX5|A0A210RZX5_9BURK Peptide methionine sulfoxide reductase MsrA OS=Polynucleobacter hirudinilacicola OX=1743166 GN=msrA PE=3 SV=1\nMNETLDKNQTTLERATLGGGCFWCLEAVYQQVSGVKSVVSGYAGGARPNPTYEAICTGVTGHAEIVDILFDPQVISFRDLLEIFFVIHDPTTLNYQGNDHGTQYRSVIFTHSDEQSNIAHEVVKELDDSKIYSRAVVTQIDVAPTIFPAEDYHQNYFVQHPNQGYCMAVVAPKLAKFRAKFKALIAPHYS\n>tr|A0A0M8WET4|A0A0M8WET4_9NOCA HTH hxlR-type domain-containing protein OS=Nocardia sp. NRRL S-836 OX=1519492 GN=ADL03_23475 PE=4 SV=1\nMHTAGFRNDIGVDQVECDTVSLPYRIGDKWTAHVLRALSPRRRRFTELRAGLPPVTAKVLSETLRTMERDGTVARESFDENPPRVEYELTGQGRKVLALLDLCCEWARENLVET\n>tr|A0A519KUV8|A0A519KUV8_9CAUL Uncharacterized protein OS=Brevundimonas sp. OX=1871086 GN=EON87_17510 PE=4 SV=1\nMRALILCAAAATALSACASTGENTYANSTAELAAQCRERGGILVPTGRPSTGRPETDNACQINGGASRIP\n>tr|A0A416ETJ7|A0A416ETJ7_9FIRM Threonylcarbamoyl-AMP synthase OS=Lachnotalea sp. AF33-28 OX=2292046 GN=DWZ56_01980 PE=3 SV=1\nMDTKVYNVEETGRCQEIFMEAGRVIRSGGLVAFPTETVYGLGGNALDARASEKIYAAKGRPSDNPLIVHIADLEELPDLVAEIPPMAETLMNQYWPGPLTLIFKKSLKVPPETTGGLDTVAVRMPDHEAAAMLIRASGVPIAAPSANTSGRPSPTRAKHVQEDLSGKVDMILDGGEVGIGLESTIIDVTGSDPVILRPGYVSLDMVKKLFEGVRMDKACTEPLKEGERPKAPGMKYRHYAPKAGLTIVEGGRAEVSSFINNHIQEESLAGNKVGVLCTEETAGCYPGGICKCMGRRADEETVAHNLFAALREFDEEEVSQIYSESFYGGQLGQAIMNRLMKAAGYHLIQV\n>tr|Q7P5J6|Q7P5J6_FUSNV Uncharacterized protein OS=Fusobacterium nucleatum subsp. 
vincentii ATCC 49256 OX=209882 GN=FNV0999 PE=4 SV=1\nMVGNLTDVMEKFDNNNVYSSLGLNRFKFDKNIGFYNLDANLFNLGETKDLSFTGKMSLVSDKKAYGLLVYDKIDDISYGSTIDHDLYTNLSLTKDNNKFRLNARYDYLYDMDPGSTSSDLMSRNERIGANFLLKENGLSISYDKRRGDDYRNFNFLEEDINTSARKRNVLGIDFSYTPTTVAKYEFNNFENIKASLGNYKVGNYTFTPSVSYNFLDRKLDTAKDTYRATVLGSNRLAEFNRFENIVYNNSLERRADLNLSNDNETYRIGFGKTTSEIWSREGLFDGTYRKYENKSKFYEIQLGRQNLPLGNIGTFGIDGTFRQDEFDGSSDKTNLINLKLNNDLYLYKAENLKVTNKFKAEIQKYNFSGNKNNEEGRLITKSDYIKFDNSLIFDGKSTVTTYNIGYKSSKNPYGKKNKSAEQFTTGLGIKFDENTNLSLKYTDDKRFTSKINSGKNVNDLSMKQYSINFETKKYDLGFANTDIDFVGDDFSTITDFREDINEHRIRAGYKFDNSKISLSYAEGKDKLKVDDGRYLDRKNRMYSVAYNIYGDVEQDFIGAFKTYRYGNTRIADDIRNTDVYSFSYAYRDKRFEQEELMKYATLEYEKPKDQITNDEIEQIRAILDRKSSFYNQFELARIQDETFRIGNYKKTLSAYVNLEKNNKRYSQTGNLKDSLSKFSGGLTVSYNRLGIGYTFTQKASWKNSGGSYKWSKDTKEHELSVYAKIGKPSQGWKIKTYAMFYDNKNDSTSSRNRKRSLDSIGVEIGKEMGYYEWAVSYENRYKTSSKDYEWRVGVHFTLLTFPNNSLFGIGAKNRGGTASTKPDGYLLDRPSQLKNSY\n>tr|A0A4Q3CBA2|A0A4Q3CBA2_9SPHI Alpha-amlyase (Fragment) OS=Sphingobacteriales bacterium OX=2044944 GN=EOP54_25765 PE=4 SV=1\nPAMMENSVIYEVNIRQNSPEGTFAAFSKDLPRLKELGVKVIWVMPIHPIGVKSRKEGLGSYYSIQDYKGVNKEFGTLEDFKAMVKAAHQNGIYVIMDWVANHTAWDHAWVTAHPEYYTKDKDGKMISPFDWTDVVELDFDNKDMRKAMIADMEYWLKEADVDGFRCDVAGEVPVDFWDAAAKDLNNVKPVFMLAEAEKPELMKNAFDMAYGWESHHIMNDIAQGKKTVKDWDTYMATKDSLWEKDDFTMYFTSNHDENSWNGTEYERMGDAAETFTALTFMVPGMPLIYNGQEYDFKKRLKFFVKDQLTKEKGKMYPVYEKLGALKNNNPALNGGKDAASYKRIATSADAAMLAFEREKGSDKVTFIANLTKVPQVFTVPVEGTFTNYMTGEKVTLTKGQKHNLAPWQYWILTK\n>tr|A0A2G2HQJ2|A0A2G2HQJ2_9PROT Pyruvate, phosphate dikinase OS=Robiginitomaculum sp. 
OX=2030823 GN=COA60_09450 PE=3 SV=1\nMTKWIYGFGGGTADGSASMKNLLGGKGANLAEMCSLGLSVPSGFTLSTEVCTNYLENQKTWPDGLQNQLAKALQVLEQQSGKSFGDAANPLLVSVRSGGRASMPGMMDTVLNLGLNQKTVEGLAELSGDRRFAFDSYRRFIQMYSDVVLGIDHDLFEEILDEHKDVQGFATEADTELAADDWEQITKLYLALVADELGHEFPDDPVDQLWGAIGAVFDSWTNDRAKVYRDLHDIPQSWGTAVNVQAMVFGNMGQTSATGVAFTRNPSTGESLYYGEFLINAQGEDVVAGIRTPQALTERAKAEIGDTEPSMEAAMPKVFAELTEVFKQLELHYKDMQDIEFTVERDQLWVLQTRSGKRTAKAALKIAVDMVAEGLITEREAILRVEPASLDQLLHPMLADGHNCPIICTGLPASPGAATGKVVFSSEEAVIMASRGEDVILVRIETSPDDIHGMHAAKGIVTARGGMTSHAAVVARGMGRPCVAGAGELKIDYSKGSFMVSGQTVHKNDVITIDGAKGHIFSGTATMVQPELTGDFGVLMFWADKVRRMKVRTNAETPVDVKTACDFGAEGIGLCRTEHMFFEESRIAAVREMILAKDKAGRIAALDRILPMQRDDFVEIFQIMGERPCTIRLLDPPLHEFLPHSEADVAQVSQATGIAVGELMSRAESLAEANPMLGHRGCRLGISYPEIYQMQARAIFEAQGKVKQQTGIMADVEIMIPLAATARELEILQGKIRQIAEQVTGDQGFAPEYKYGAMIELPRAALCAAELSEFASFFSFGTNDLTQTTLGLSRDDATSFLGDYICQGVFEKDPFVSLEQSGVGQLLEIATERSRQAKPDIKLGVCGEHGGDPASIHFFEGLGLDYISCSPFRVPIAKLAAAQAVLLREK\n>tr|A0A395H0X9|A0A395H0X9_9EURO Uncharacterized protein OS=Aspergillus ibericus CBS 121593 OX=1448316 GN=BO80DRAFT_465679 PE=4 SV=1\nMAGHRRFASTLTSAAMDIGFYGSVRRRVDGALWLPFRDSSFYPERPQIRSPSLIFPWTAIVALPVRNVQMSSWTRTHSCASRLRSRLSFLHVVTVGAVISLCYLFYTFAVPQLHRLQLRTDLSWYDLGLYGFGPSRSYVSFEYESPAVQISEWESGCDSRYTFFAPRGDSVAQPGPMILDSKGELVWMKYNWDVTQDFKVQRYQDTDYLTYWEGGETEGRGYGAWYMLDSTYTQRYVISPVGNHGGDLHEFNITPEGTALVTIYDPLPADLTSIGGPELGWIYDGVFQEIDIATGELIFEWRASEHYPISITYEKLGKSGRLRSFAFDFYHINSVDKDDNGNYIVSARHTHTVSCIDKNNGQVLWTLGGKLNEFRDLSDGKATNFAWQHDARWHANNTLTLFDNARHSSNDPENESRGMAIELNVAAREASLRAAYHHPQQMLSVSQGNVQMLDDSGRVLVEWGHSAAFSEFSADGQLLCNTHFGASAFFGFGRVVSYRAFKGTWVGRPQTVPDAEVLGDRVYVSWNGATEVVAWRLEVWETDDVHDNSFRVVAQFPKDSFETEIEIPNLELPLFRLAALDSDGNVLGITELLQREQGGSFEQVINPQYWIIVMAFVMSGVGLFVGLYTCCGWGQYFRRCRSRSSEYQLVAFSDSEAPV\n>tr|A0A828ZLR4|A0A828ZLR4_9BACI Uncharacterized protein OS=Lysinibacillus fusiformis ZB2 OX=1231627 GN=C518_0034 PE=4 
SV=1\nMVFRPPYPYPMYPGGMRMPMPMQTPPQMSPQSFFPPGGFPVQPRIPGGFPMANGIGSFGGQMPMPPVQEASKVGSFLQQANSLFNTAKTYTPYIQQAMPMVKNIPSLLKLYKGFQGLPSAGGGATEAAGSDSKAAGSRRSSRQSASFTPPEPLPSKPRIFQPPM\n>tr|A0A2K5HSM9|A0A2K5HSM9_COLAP Histamine N-methyltransferase OS=Colobus angolensis palliatus OX=336983 PE=4 SV=1\nMASSMRSLFSDHGRYVESFRRFLSHSTEHQCMQEFMDKKLPGIIARIGDTKSEIKILSIGGGADFLIWGSSRVLKQNSCFIFCRTCQNDKSVMRIHDEHSSELPFGAARLKGTSSFPSFLVSFSLF\n>tr|A0A834YI29|A0A834YI29_9MAGN Uncharacterized protein OS=Tetracentron sinense OX=13715 GN=HHK36_028814 PE=4 SV=1\nMGRGRVELKRIENKINRQVTFSKRRNGVLKKAYELSVLCDAEVALIIFSSRGKLFEFGSAGNAVVAVMTKEELWLNSPEQIPSRPGDMGFVLILDLLSFPPISLSSLILFLQTHRSTYNLH\n>tr|A0A3S3PID2|A0A3S3PID2_9ACAR Cell cycle control protein 50A-like protein (Fragment) OS=Dinothrombium tinctorium OX=1965070 GN=B4U79_11510 PE=3 SV=1\nMPVNFVYEVNSERELQELKNKQTARDALRRQRLPAWEPILTPTAVLSSILLIGFALIVIGIMLLITIEQVNEKVIDYTNCVSSVNIRENCSTVIARNIYEPCWCIQRFSLDEDFGADAFFYYRLSHYHQNLRRYINSKDSKQLLGYDHRKKVSKKCEPFEKNFDPLQGQVLPIAPCGAIANSLFNDTFKLYFIENMSLIPVEIIETDISWPTDKKHLYINPPNMNFEGFTKPPYWRKYVFELDLNNSDNNGYQNEHFIVWMRTSAFPTFRKLWGRIDHKNRFSRSLPKGNYVLQINYNYPVISFGGAKSVIISNTSWLGGKNYFLGYAYIVCGTLFVILDIALFAIYYLYGY\n>tr|A0A3G9HIV9|A0A3G9HIV9_9PROT Porphobilinogen deaminase OS=Hydrogenimonas sp. 
OX=2231112 GN=hemC PE=3 SV=1\nMEKLIIATRGSQLAMWQAEYVKSELRKRFPEMEIEFEVVTSTGDKILDKPLALIGGKGLFTKEIEDVMLAGKAHMAVHSLKDVPTVMPEGLKLAAITKRDDIRDCFLSHKYRNIDDLPEGAVVGTTSLRRQMQLRAIRPDLKIKNLRGNVNTRLRKLAEGEYDAIILAYVGMKRLGLLESVPYHDPIDDNVMIPPSGQASLGIEIVDDERVAEIAAVLNDEDSALAARIERDFVSELEGSCQVPIAVNAKISAERVVVRAMVGLPDGTEILKEIIDAPKSEARDLGVRLADIMIEAGAKELLERAEAMAFKDERCERL\n>tr|A0A5E4QBA8|A0A5E4QBA8_9NEOP Uncharacterized protein (Fragment) OS=Leptidea sinapis OX=189913 GN=LSINAPIS_LOCUS7231 PE=3 SV=1\nMKYVSFSLIATLIFAGYVINTIWNLAEIFIPPECSRGERCFTSYLASNPVQHLVLYTSIKENPYRGGISDAAVNKVHTSLKFDYRKPAKIDLTLKIPRRTRNNGTLFMHAVLLDERRLYDDFIDIFRNEAIYTLPLVTYMDQKDETFNLLQGNNGQEIKPKKIVKPYSHIFKVAPLSILTDDLQLPVKKIPGELYPYVRVRNEKFLPIIQHNVLKSRISDLELLRSNTSEVNVTVEISPTSYGVLRLALHVRLALLQLQSLGFSEKDVDDAKGIFADTNLYLLSATVLIASCHLLFDFLAFKNDVSFWRS\n>tr|A0A093L9J8|A0A093L9J8_EURHL Melanotransferrin (Fragment) OS=Eurypyga helias OX=54383 GN=N326_02722 PE=4 SV=1\nAALGLERVRWCTISQQELSKCNDMSKAFGRAGILPPLECTAWGSAANCTQMIKEDLADAVTLDGRLIYQAGKEHGLKPVVGEVYDQEIGTSYYAVAVVRKNSSITIDSLKGVRSCHTGINRTAGWDVPVGYLTDSGRLAAMGCDLPQGKTVSDYFNASCVPGAIGVNYPSSLCQLCRGNSAGKSKCERNSQEQYYDYSGAFRCLAEGAGDVAFVKHSTVPENTDGRSLSSWAQRLRSRDFQLLCRNGNTADVTEWRTCHLARVPARAVVVRPDTDGAAVFQLLNQGQQRFNGVGTKFQMFDSAAYGAQNLLFRDSTMELVAITAQDYQAWLGEEYLRAVQALSCNPNTLPESLNWCVVSTEEIWKCGEMAIAFRKKNLKPAIQCISAKTKEQCMEMIQKKESDAVVLGGDDIYTAGKTYGLVPAAGESYSADDNSNAYYAVALVKRNLSNAFTISDLKGKKSCHTGLGRNAGWNIPIGILIKRGIIKTRDCDIPQAVSEFFSASCVPSAKLDSYPSKLCQLCVGDDSGNHKCSASSQERYYSYSGAFRCLAEDSGDVAFVKHSTVFENTDGKNTDSWAQNLNSSDFQLLCPNGARAEVTQFAECHLAQVPAQAVMVHPDTNVFALYGLLDKAQVYFGNSSNGNGFKMFDSSTFQGKNLIFKDSTVEIVPVEEKRTYAEWLGREYLESLEGMQTPQCSGAGNKIRPYLLVTVVSLLWCQAQGLD\n>tr|A0A4D6WVR2|A0A4D6WVR2_9FLOR Photosystem I reaction center subunit PsaK OS=Gayliella sp. 
OX=2575623 GN=psaK PE=3 SV=1\nMYINILLNISSNTVNWSPKIALIMIICNLLCITIGRYSIQVRGLGPSIPLIGSEGPGLPELLATTSLGHVIGAGTILGLRSQGII\n>tr|A0A255GDV3|A0A255GDV3_9ACTN Uncharacterized protein OS=Propionibacteriaceae bacterium NML 030167 OX=2016500 GN=CGZ94_12075 PE=4 SV=1\nMARERTEKRDRPEKRDRDKGDRDRLNTPGRESSRFPRIRMDGDTFGEFAEAFARFMGTAGFLMWMTIIIILWIAWNTLAPESVRFDPFPFIFLTLVLSLQASYAAPLILLAQNRQEARDRISVEDDRRQAAQSRADMDFLAREIASVRMNVGELATRDYIRSELRKELRELLAEHDEPAAGPERGSVGG\n>tr|A0A1X6Z5H1|A0A1X6Z5H1_9RHOB Uncharacterized protein OS=Roseivivax jejudonensis OX=1529041 GN=ROJ8625_01941 PE=4 SV=1\nMDAAFIVPVLALITLLAGTVYALWSKHVTEQAKADPAHPKSRLAADTPSR\n>tr|A0A4T0PB80|A0A4T0PB80_9BASI P-loop containing nucleoside triphosphate hydrolase protein OS=Wallemia mellicola OX=1708541 GN=E3Q18_02634 PE=4 SV=1\nMDTVTNSIFEEIKSEISALPEDQRYLVGIGGFPGSGKSSFTKHLTDKFTDSSIKAVAISMDGWHYTRDDPTAAFARRGAPHTFDAEAYTEFVQSLKLEPRVALEAPTFSHSLKDPTPSGTQVDTSVKVVIIEGNYVLLNEERWMKAANNLDKKIWVDIDEETTRQRLIKRHVESGICKDSQEAYDRAENNDLDNGRYARQNLVPDTQIIKSIEDEKFAI\n>tr|A0A4Q9TDA8|A0A4Q9TDA8_9GAMM Penicillin-binding protein 2 OS=Pseudoxanthomonas sp. 
NML171590 OX=2527958 GN=mrdA PE=4 SV=1\nMTMSRRRPLKNAHAEADQFRRRAALGFLGVFVCLAGLGAWYFKLQVLDHAEYATRSEANRIKLRPVVPARGSIYDRNGVLLAENIPAFRLDVVPDQAGDPDEWLDALGKVVALDPEEVKHFLAARKVSRGFRGITIKPKLSEEEIAALAVDRWRFPGVEVVPYLTRHYPYGPLLAHVIGYVGRVDEADLAQLGEGNSALTHVGKTGLERYYEQQLRGKVGYEKVETNVEGRALGVVGRVPAQAGTDLKLSIDIKLQQAMTEAFGQYEGAAVAMDPRTGQILGMVSLPSYDTNLFVNGISTRDFKALNENPSRPQFNRLVLGGVAPGSTIKPLMGLAGLDSGTRRPQDKILSTGMFYLPGVSRGWGDSHRGGHGWTDLRKSIAQSVNTYYYKLAVDMGITQVDAYMTKYGFGAPTGIDLAGEIGGIVPSPAYKMKSRKEAWYPGDTVNIAIGQGDWKVTPLQLVRAISGVADGQLRTPRLVMDTRNGFDQPWQPIAPGPTKPISDRPDNLQWVREGMMDTMRPGGSGYAIAVGAPYQMAGKTGTAQVVSRKGLAAVDPRSLPMHLRHRSLFEGFAPAQAPTIALAIAVEGGGYGASTAAPIARKIFDAWLLGKMPGDTPDAPDIVVPEDGTDTGAAPPAPSEIPGAPGPTPPPAPTAAPVPAEAPREPQAAP\n>tr|A0A1H3A3S6|A0A1H3A3S6_THIRO Uncharacterized protein OS=Thiocapsa roseopersicina OX=1058 GN=SAMN05421783_11845 PE=4 SV=1\nMTNAQCLYGHRPTPGWPGFARACRPSWRDDLCPTWIDLVVPPCSFRVFRDHEVAARRVVGHDGNDIPCFQAYDYRRLDLRSDDDEEYYLAVSYSESVSAWRLRDGRWLVHRRVELLGDEDAATSALSIDERMPR\n>tr|A0A1L7CG91|A0A1L7CG91_9CORY Threonine--tRNA ligase OS=Corynebacterium aquilae DSM 44791 OX=1431546 GN=thrS PE=3 SV=1\nMSDQPEREFAPFNVPAGTPVGAAMRELELPNKGPEAIVCVKDADGQLKDLSFVPDTTAEFTPVPANTEEGRSVIRHSCTHVLAQAVQAEFPGTKLGIGPAIENGFYYDFDAAEPFTPEDLKRIEKRMKKIIKQGQKFERRVYADQAEAREALANEPYKLELIEDKGNVDPNSDEATEVGSGELTGYYNLNPRTGDVEWYDLCRGPHVPTTKYIPAFALTRSSAAYWRGDQSNAGLQRIYGTAWESTEALEEYQHMLEEAEKRDHRRLGTELDLFSFPDEIGSGFPVFHPNGGIIRLEMEEHSRRRHIASGYSFVNTPHLTKGDLFSKSGHLDFYADGMFPPMQLDGEYDENGNCTKQPQDYYAKPMNCPMHNLIFASRGRSYRELPLRLFEFGTVYRYEKSGVIHGLTRARGFTQDDAHIYCTEDQLEAELTSVLDFIISLLRDYGLDDFYLELSTKDEGKFVGSDEIWEKSTAILQRVADTSGLDLVPDPGGAAFYGPKISVQARDAIGRTWQMSTVQLDFNLPERFNLEYTDSDGSKKRPIMIHRALFGSIERFFGVLLEHYAGAFPAWLAPQQVVGIPVAEAFSPHLEEITARLRDKGIRATVDTSDDRMQKKIRNHTTAKVPFMLLAGARDVEAEAVSFRFLDGTQVNGVPVDEAVELISAWITARRNEQPTEANLRG\n>tr|A0A7X7K3W6|A0A7X7K3W6_9CHLR Uncharacterized protein OS=Anaerolineales bacterium OX=2073117 GN=GX601_14875 PE=4 
SV=1\nMVALRDDFAGELNRHWNTSLVGQGTLTMGESRMRLGVTGASSRRYSNAQIDDYQDLMRRRFPWAPPLRLSVRARFSGSAQTLRGTAGFGLWNDPFMMTGARPPNLPRALWYFFGSPPSNMKLDLHAPGHGWKAATIDALRPISLALGMIALPAVALMNVRPFYRALWPPIQRALHVQEAPLETDMAEWHTYEIEWSASHSYFRVDGTAVLTGAPSPRGPLGFVLWMDNQSLEITPWGRVRWGLLDIPDGQWMDVDWVELA\n>tr|A0A4R2CCK3|A0A4R2CCK3_9ACTN Polygalacturonase OS=Kribbella sp. VKM Ac-2500 OX=2512214 GN=EV642_10991 PE=3 SV=1\nMVQDKFSRKNFLRMTAGAALLPTAAALTAGQAAAAAAGTPDATAPLGPDGHGGPGWGHVGEILRETRPPRFHDRDFPITAYGAVGDGSTDATAAIRAAIEACHLAGGGRVVVPAGTFLTGAIHLRSNVNLHVSEGATLLFSTDPAQYLPVVLTRFEGMELMNYSPLIYARDCDNIAVTGTGTLDGQATWETWWSWVGPSGPDAQALTDLADRGVPVPERIFGAGHFLRAAFIETYHCRNVLIDGVTLLRSPFWEIHPVLSRNVTVQNVHIDSRGPNNDGVDPECSQYVVIRNCTFDVGDDCIAIKSGRGTDGLRVNVPSENILIEDCTMNIRYGAITIGSEMTGGVRNVFVRNCRIGSGYQYFGLYIKTNSVRGGYAENVYLKDIEISNLTKEVVSCNFYRGEGDTGPLTPRVRNVELRNITVGHARNAFSMTGYPRLPIQDFRLIDCTFTSIDAASTIQDVDLSFENFFVNGQPITDPAQLL\n>tr|A0A0A7RLM7|A0A0A7RLM7_9LACO Flagellar motor switch protein FliY OS=Liquorilactobacillus oeni OX=303241 GN=fliY PE=3 SV=1\nMSDSLSQAEVDALMAGNAVSKDEGQDNDNGMDEKTRQDIIGEVGNISMSQAATTLSSILNRRVSITTPHVSRMKFEEVLSAVHTPKVATVVEFKEGLAGSNLLLLEVKDAVVIADLMMGGDGNPKSSEFSELQLSAVAEAMNQMIGSASTSMATMINRKVDILPPAVKLWENASNIEYNGIVNAEEIYRISFSLSVEGLIESEIMQIFTKDMVDDITDAMLSDKATVIEREKAVSQPEQKEETKSAPKTASVDTKMMSKEQTKHVEVSKPEFQQLEENKVAEGDNLDLLLDVPLNLSVVLGRSEKTIRDILSFNSGSVVELDRLTDEPLEILLNGKPIATGEVVVINENFGIRITNILSPSQRIHRLK\n>tr|A0A3N0E5U7|A0A3N0E5U7_9ACTN Non-specific serine/threonine protein kinase OS=Nocardiopsaceae bacterium YIM 96095 OX=2487137 GN=EFW17_17180 PE=4 
SV=1\nMTDQEHPQVPVHGDPADGDMPDAVLGARRDVVTFVESANQPDQLVRLWWVTVVLQIAEQHIPNLRMTNGHKHSVKYPRRSYAINSTSSARRYSTTSGRVGRPRLRPRPVTLRHTPRFRPPQPCGKIPVSLAVPNERVVATVRGTPSSGRHSAGPYELVRELGRGGFGSVHLGRDSAGRHAAVKLLHLNQAESARVRADFAREVDAARKVNPFCIAQVLDADLDADEPWIATEYIEGPTLLEAVRADGPRTGADLQRLAVSMATALTAIHRAGIVHRDLKPGNIMLASDGPRVIDFGIARGFEGTEFSVSQMVGTPNYMAPEQLEGNRLTPAVDVYAWGAVIVFAATGRNAFTAPSQAALIRRVLLGEPDLDGTPETLLPLVRRCLAKAPEQRPNAHALLEALLDGATPGTEPGADTGGTATPAPLPNVGPESDGAPPRGPAEPAEPAPPFVFADDSYHSPGDLASAMRRNWSAAVRVFANDQERALLRTWLLEDIDDRTVDRALLRRPPEDPEAVLTEFIAQVRPDLPPTYRGRDMRLSALRQTLRNHSGQPPAELHGLGSRVLRALARHHCVEEDHTCASGAPCKEYQRIHSEFVTRVERVRAATEQVDRTLRAESPQLADTVDVPALAASVTTTLLPGLLHPADETWPPREQRPRTHTEWYTALATAVGSDIPPELHEDRGVTLLYDATATRIAGIQDTEQLRVHTLERDLDRLMAGWRQATKTVFVRTFGGWCAVTLVSLPFFPWTGVFPSGVALVVGLVVVIGTLMAAGRPYAAQRHSLHTPPPDPSWREGRIATWLDGEITQAKQRAGRLPRILAHMTGGSTTG\n>tr|F1A946|F1A946_9CREN Acetyl-CoA carboxylase alpha subunit (Fragment) OS=uncultured crenarchaeote OX=29281 GN=accA PE=4 SV=1\nAMTDFVVMVEKAATMFVTGPDVVKTVLGEEVSFDELGGAMTHGTKSGVAHFVAKNEYDCMDIIKNLLSYIPQNNTESPPRVKTSDDPNRLDHNLLNMVPEDSLKPCDMKPIILSVLDDNKFFEIHELFAQNVIVGFGRMNGRTVGIVASHP\n>tr|A0A497UYM2|A0A497UYM2_9FLAO Uncharacterized protein DUF4230 OS=Flavobacterium lindanitolerans OX=428988 GN=CLV50_0313 PE=4 SV=1\nMRRILIIAGIVVAVILAFRFCEFKKDDRSTIEYDTNLIQERIVNVGKLIVTEGHFAEVLTYKDQEKYLMDLISFEKKALVIVNADVTVSYDLRQMKYDIDEKNKTITIKYIPKEEIKINPDIKFYDINQSRMNPFTGDDYNKINKSVKANLAKKIEKSSLKTNAQNRLISELSKILITTNSMGWTLRYDGQTVNEESIDKVLL\n>tr|A0A1V2ZGA3|A0A1V2ZGA3_9MICO SGL domain-containing protein OS=Rathayibacter sp. 
VKM Ac-2630 OX=1938617 GN=B0T42_04245 PE=4 SV=1\nMRRRAIAVPVLLAGALAGCTQAGDPAEEEAPPSVATAERVLQVTEVHEATGMTLLEGPAFGPDGSLYVVDVTAPPGEGKVLRIDLDDESVEPVWTDDSSALTSAQFGADGRLYVTDFLGGAVRSMTADGEDVREIAAGAVEGVPMQPDDLDFGADGALYVTDAAGAQDPYWEASGRVVRVDPATGSASVLADELPSPNGIAFSPDHRELWVSMNTGNRIDRLTLTGDGTEVATAFPAIHASPGIGQLDSIAVDADGNLYVGLHSRPEILVYDTAGALLQTVTVAESGLSSATNIAIRPGTTEAFATVSGSDGGFVHSFEALAEGMPQSNGG\n>tr|A0A1D8NL70|A0A1D8NL70_YARLL Catalase T OS=Yarrowia lipolytica OX=4952 GN=B0I71DRAFT_163235 PE=3 SV=1\nMSKELYANSKDDAVYSYSFGVPYPHHPYSSQRAGPTGPLLLQDTYLIDALAHFDRERIPERVVHANGGGAHGYFEVTDDISDITYAEPFQKIGYKCPTTVRFSTVGGERGSPDTARDPRGFAVKHKTDWGNWDMVGLNSPVFFIRDPVKFIHVNHSQKRDPQTNLTAGDDASNYWNYLVQNPESLHQVVYMFGDRGTPNGWRHMNCFSTHTYKMINKEGKLTYVQFHYKSDQGVKNFTGPEAAEMAGKSPDHDQKDLFFAIDNGDYPSWTVSLQTMTPEQAEEWEYSILDMTKTWPYDKFPLRKVGKLVLNKNAENFFEEIEQAAFSPSNLIHGIEASDDPVLQARLFSYPDTARHRLGPNFNQLPVNQARTFQKGSGCPFMAGNFQRDGNMAIHNQGNRPNYLSTIRPIQSVSVPNEDFKNTHDYCGVVTKEMEDESFKVQAEAAKKHNEKIWESSSYLYLSGFQESDAAQPRDLYERVYDDAAKQRMIDNVVDHASTIKQHGLKEQVAKYFGRISDDLGKKIAEGLGVPY\n>tr|A0A4R2XLQ7|A0A4R2XLQ7_9HYPH 50S ribosomal protein L2 OS=Rhizobium sp. GV031 OX=2135727 GN=rplB PE=3 SV=1\nMALKTFNPTTPSQRQLVIVDRSSLYKGKPVKALTQGLTKSGGRNNLGRITARFIGGGHKRTYRLIDFKRRKFEVEGTVERIEYDPNRTAFIALISYADGEQAYIIAPQRLAAGDKVIASEKAVDVKPGNTMPLQYIPVGSIIHNVEMKPGKGGQIARSAGSYAQLVGRDAGLAILRLNSGEQRLVPGSCLASIGAVSNPDHANINDGKAGRTVWRGKRPHNRGVVMNPVDHPHGGGEGRTSGGRHPVTPWGKPTKGKRTRSNKSTDKMIMRSRHQRKK\n>tr|A0A6F8T1T8|A0A6F8T1T8_9GAMM Superoxide dismutase [Cu-Zn] OS=Legionella sp. 
TUM19329 OX=2708020 GN=sodC PE=3 SV=1\nMNKLTTALISSLLSFNALHAAPMTTTLYTTDTNPTAIGTVEFEETPYGLLISPNLIKLPAGLHGFHIHQLPDCGDHGMSAGGHYDPTNTKSHKGPYGDGHLGDLPVLYVSSDGKANTPTLAPRLKLKDLTGLTLMVHAGGDNYSDTPSLGGGGAREACGVIK\n>tr|A0A3D0ZXQ6|A0A3D0ZXQ6_9GAMM LLM class flavin-dependent oxidoreductase OS=Gammaproteobacteria bacterium OX=1913989 GN=DEQ32_11910 PE=4 SV=1\nMKFGIFYEHQLPKPWSEGLEEKLFQDALDQVELADKLGIDYAWEVEHHFLEEYSHSSAPEIFLAAASQRTKNIRLGHGIRQVIANYNHPARTAECIATLDLVSGGRVDFGTGESSAILELGGFDIPVESKRQQYLESVEQICNMLAMDPYPGFDGQYFSMPCRNIVPKPVQKPHPPLWVACSNRDTIKMAARLGIGALTFAFVDPLEAQHWVDEYYSIIKSDECVPIGHTVNANICMVTSFSLHHNRAVAIERGLEGFEFFGYALGFLYGFGIHKPGRTDIFREFQAARNAKLVESPVEVGESLTGERGGIGTPDDMREHLRKFERVGVDQVTFIQQAGMNKHEHICESLEIFAAEVMPEFKSRETEREARKAEELAPFIEAAMARKQYMKMPKDDDIPVFPALGRSVVEGDADLTKKAVG\n>tr|A0A7Y7XFB0|A0A7Y7XFB0_9PSED Acyl-CoA dehydrogenase family protein OS=Pseudomonas gingeri OX=117681 GN=HX882_17635 PE=3 SV=1\nMNLHQYAETHEVTNQPPSLDGTNLYRIDLPLQEWARRFGAGWAESRIEAYGALAGGPLMEAGFLANQNKPVFVSHDRYGHRQDLVEFHPAYHELMRTAVEHGLPSLPWTDPQEGAHVARAAMTYLHSQAEAGTGCPLTMTFACVPALRLQPEIAGQWLPSILSTQYDPRNLGIAHKTGATIGMAMTEKQGGTDVRANTTRAYPVGAGGPGQPYELVGHKWFCSAPMCDAFLTLAQTDKGLTCFLLPRHRPDDSRNQFYIQRLKNKLGNCSNASSEVEFRGALAWMIGEEGRGVPTIIEMVAMTRFDCMVGSSALMRQALTQASHHCAHRLVGGRVLAEQPLMQNVLADLALESEAALALSLRMGRALDRLGDDHEAKFARLVTAVGKYWICKRAPAMINEAAECMGGAGYVEDSILPRLYREAPVNSTWEGSGNVQCLDVLRSLSKEPGVLEVLFSELGDGHGDKRLARHIEHLKLAFTDTHDIQYRARQLTEDIALALQAKLLLEAGNAEVSDGFIASRLEAGGRVYGTLPRGVNVEAIVARSTPQGG\n>tr|A0A218LFE2|A0A218LFE2_AGRCR 50S ribosomal protein L33, chloroplastic OS=Agropyron cristatum OX=4593 GN=rpl33 PE=3 SV=1\nMAKGKDVRIRVILECISCVRKGANEESTGISRYSTQKNRHNTPGQLEFKKFCRYCRKHTTHHEIKK\n>tr|A0A7W2KV63|A0A7W2KV63_9PSED Cytochrome c-type biogenesis protein CcmE OS=Pseudomonas asiatica OX=2219225 GN=ccmE PE=3 SV=1\nMNPQRKKRLLLIVGLLVGVGVAVGFALSALQQNINLFYTPTQIANGEAPLDTRIRAGGMVEKGSVQRSSDSLDVRFVVTDFNKSVPITYRGILPDLFREGQGIVALGKLNADGVVVADEVLAKHDEKYMPPEVTKALKESGQAASGGEARP\n>tr|A0A495JIB9|A0A495JIB9_9ACTN UDP-N-acetylglucosamine 
1-carboxyvinyltransferase OS=Micromonospora pisi OX=589240 GN=murA PE=3 SV=1\nMPADLSAGVTAGVAADSTMADVDVIRVSGGARLAGEVHVVGAKNSALKLMAVALLAPGRSVITNVPRITDIAIMGEVLRRLGCEVSFGEDNGTSTGTIDGIPVVGVGDGVPAEVPPVDGAGPVRDVATTPSGEAQAAVDLGAAPGRARTVTIDVPAEPGTDADYDLVRRLRASICVLGPLLARRGYVRVAHPGGDAIGSRGLDMHVSGLARMGAEISGSHGFVIASAPNGLHGATIWLDFPSVGATENLVMAAVLAKGTTEIDNAAREPEIVDICAMLSAMGARIEGAGTSTIRIEGVSELRPVRHRTVGDRIVAGTWAFAAAMTQGDVTVTGASPGFLEIALDKVISAGGLVETRTDAFRVRMDRRPRAVDVVTLPFPGFATDLLPMAIGMASVSEGASLITENIFDGRFMFVNEMARLGADIKTDGHHAVVRGRERLSSAPVRATDIRAGAGLVIAGLCADGVTEISHVHHVDRGYPDFVADLRALGVEVERTTAPAEQAFTL\n>tr|A0A1G3BE39|A0A1G3BE39_9BACT Uncharacterized protein (Fragment) OS=Planctomycetes bacterium RIFCSPHIGHO2_12_FULL_52_36 OX=1801980 GN=A3E19_05430 PE=4 SV=1\nMGICLSRTIPVRDLFTGLFSGRGAVAIAGFVNKVGSKWYGTARLRRITAYCLLALFLCGLYSAEGVLGAQSVENPYPLFKHDAQHTGRSTFLGAQKANVKWSYPTEDHIISSPTVGGDGTVYVGGMDGNLYAIRPDGHTKWFYPAQSAIFSSPAIAQDGTVYFGCRDKVLFAVGPDMKEKWKFRMGGEILSSPTVGPDGTVYVGNWDGKLYAINQEGALRWTYQTGDSIVASSPAIAHDGTVYVGSRDRQLHAIDPASGKKRWGFQAGDKVDTTPCVGPDGTVYFGANDGILYALSPQGDPKWKFETGSWIYSSPSLGADGTVYFGAKDGKVYAVSPQGQKKWAFQTGDSVSSSPTLGSDGTVYVGSWDGKFYALGPDGQLKWSYDAGASIASSPAIDAEGTVYVGCDSG\n>tr|A0A552XCD5|A0A552XCD5_9LACT Carbohydrate ABC transporter permease OS=Lactococcus lactis OX=1358 GN=FNJ55_12300 PE=3 SV=1\nMKDSIGYKIFKVINAIILILIVIATVYPFWNVVVQSFSSENAITAGNVVLTPVGFNLETYKYVMSDPIFWINYKNTIIYTVVGTAISLFLTTTLAYVTSKKYLPGRKFFIGLSVFTMFFAGGLIPNYLLIKSLGWMNTMWAVTVPGALSIFNMLIMKSFFESMPDALEEAAIIDGATPFQILMRIILPLSKPILATMVLFYAVGAWNAWFGAFLYMDNKNLFPVSVYLRNLVKGATGAEAQSADEQSQVSSNIKAVTMVLTVLPVLIVYPFCQKYFVNGIMIGSVKG\n>tr|X6GFZ8|X6GFZ8_9HYPH Oxidoreductase OS=Mesorhizobium sp. 
L48C026A00 OX=1287182 GN=X737_09625 PE=4 SV=1\nMILQGRIAIVTGAGSGIGQAGSEAMAREGATVIVTDRDLDAARGTVDSIAAAGGRGEAIRVDVTDDAAVVGVIQDVADRHGRIDILHNHAGVQVAGSVEEIDGAGFDHSWAVNVHAQFVACQAVLPVMKRQRGGVILNTSSNSGVFLDRAMTAYITSKAASITMTRQIALDVARYGIRINSLCPGWVDTPFNDPYTDQLGGRKALEHAIANIVPMGRFATTDEIAEVILFMVSDKSSYMTGHALVADGGESLAGGTNSGQSITR\n>tr|A0A368JR03|A0A368JR03_9BACT Serine hydroxymethyltransferase OS=Larkinella punicea OX=2315727 GN=glyA PE=3 SV=1\nMSTLVTPITRDTQVFELIAKEQHRQESGIELIASENFVSKQVMEAAGTVLTNKYAEGLPGKRYYGGCEVVDEIEQLAIDRVKELFGASWANVQPHSGAQANTAVFVACLKPGDTILGFDLSHGGHLTHGSAVNISGKYFRPTFYGVEQETGVINYDKVEETAQRERPKLLICGASAYSRDWDYVRLRAIADSVGALLLADISHPAGLIAKGLLNDPMDHCHIVTTTTHKTLRGPRGGMIMLRNDFENPFGIKTPKGDLRMMSSLLDSGVFPGTQGGPLEHIIAAKAIAFGEALSDEFGDYANQIQRNAQAMAAAFVSRGYKIISGGTDNHLMLIDLRSKGLSGKLAENTLIKADITINKNMVPFDDKSPMVTSGMRVGTAAVTTRGMKESDMEQIVVYIDDVLMNHDNDAKIQVVKEEINSWMKAFPLYN\n>tr|A0A1M3KRH6|A0A1M3KRH6_9HYPH Uncharacterized protein OS=Devosia sp. 66-22 OX=1895753 GN=BGO81_01360 PE=4 SV=1\nMVEVKQLLSFPLPRNPAIVSPGLREILMSGSSLSGLPSLYDGKDMFRSAGNRMLWPKPLPAPLYGGATKGRIFSYVAGVIFVPNTVKGVVKNIKKDFWDDSIGKVIKAQMLGIDFQAMTAPPWAGEPPEDISDAVEAVFDAIESGTGKVDENLLYATYWSYRWFSMQKRGAVFLPLTDLVEVSVQQTKGGFLEHFKYEVGEHIGLTFETASGQRSTYYATMSYPDEDERLLRFVPPADRKKEYQSRKLSTEEATALIFADQRIRADIRAVMRTLLDEHLGPGVLPAAYAELSKTRTQDWSRGLDVYYEALRSTDYNVWHAHGDVLARMGSTCVAFRALPFARHGFTNPIDSIERGEPMTWVSIT\n>tr|A0A271J2M4|A0A271J2M4_9BACT Uncharacterized protein OS=Rubrivirga marina OX=1196024 GN=BSZ37_13095 PE=4 SV=1\nMGALADRVIVAAERQTGCEMPYLRTLADASGGAFARWMLAMPAAQFRQRAPRDAWHLARLGATVAQDCGTCVQIVVTVAQRDGMSVTTLRQALDDPGALYDDARAAYAFGFSISSQADDVADRVAEVEALFGHEAHVELAMAVATCQLFPVLKRGLGQSLACSLVTIEME\n>tr|A0A368CC63|A0A368CC63_9GAMM Phosphoribosylformylglycinamidine cyclo-ligase OS=Candidatus Thioglobus sp. 
OX=2026721 GN=purM PE=3 SV=1\nMGLTYKDSGVDIDAGNALVTRIKQAVKSTHRDEVLSDLGGFGGLFELASHKYKQPVLVSGTDGVGTKLKLAQQMNEHSSIGIDLVAMCVNDVIVQGAEPLFFLDYFATGKLDVDVSEDVITGIAHGCRLAGAALIGGETAEMPGMYNDGEYDLAGFCVAVAEKSDIITGQGIQQDDLIIGLHSSGIHANGFSLVNKLLAENNSTLTQDFNGTSLGATLLTPTTIYAKPVLQMLSAFPIKGLCHVTGGGITENLPRILPANIRADINTHAWQRLPIFDWIQTQGNVAEQEMLRVFNCGIGMIIVVTAEHQTAVEQIAKTHNIASNVIGKMSTTDATSHVNYL\n>tr|A0A1T1IFK7|A0A1T1IFK7_9PSED Gamma-glutamyltransferase OS=Pseudomonas sp. MF4836 OX=1960827 GN=MF4836_00365 PE=4 SV=1\nMLKFSAHEYPYPSQRQSVFARRGMVAASQPLAAEAGIEIMRQGGNAIDAAIATAAALTVVEPTGCGLGGDAFALVWTQGQLHGLNANGHAPAALSIEAVQAAGHQQMPLYGWEPVTVPGCPSAWAELSRRFGKLPFADLLQPAISLARDGFPLSPVVAHQWQIALDEFSPHRSALLEPWFDTFLIDGRAPRAGELFRNPAQARTLEELATSACESLYRGPLAQRMDAHSRATGGYLRATDLADYRAQWVEPIHINYRGVDVWEIPPSGQGLVALMALKILEGFDFDHRDSQQTWHRQLEAMKLAYSDGLHYITDPQHMRVAVADLLSDAYSARRREQIGEQAQPPKPGDPHASGTVYLATADAEGNMVSFIQSNYHGFGSGVVLPDSGIALQNRGQEFSLDPSHANCLAPGKKTFHTIIPGFLSQGGEALGPFGVMGGYMQPQGHVQMVMNLVDFGLNPQAALDAPRWQWLGEMKVGIEQGASRDLANALARRGHQVEIASDLTDYGRGQIILRDPDSGVLCGGTEPRADSHIAVW\n>tr|A0A3M3ZGU4|A0A3M3ZGU4_9PSED Uncharacterized protein OS=Pseudomonas syringae pv. 
tagetis OX=129140 GN=ALQ32_04322 PE=4 SV=1\nMFSLKKIALVTAAAAMLGSGPVLAQPDLPAQLDEARQEGSIWTAFALNKHLSPFKIDVDVEQGTAILKGKVENEVDRELAERIALDTKGIEKVDNQLEIDPAVASDPGTRTNMAQRFEDATLVATVKSKLLWSSVTEALSIDVDSKDGVITLKGRAQSPEAKELAGSLASNTDGVVSVNNLISLSAADSIAAKTQPQSVIPTEEMSDAWITSKVKASLIYSRTLDGLNIKVDTNAGVVSLNGVVANFAEKELAVEIARNIRGVKGVNGDALKVMARSAG\n>tr|A0A4R8QWY5|A0A4R8QWY5_COLTR Short-chain dehydrogenase chyC OS=Colletotrichum trifolii OX=5466 GN=chyC-1 PE=4 SV=1\nMARIFITGSSDGLGAIAAQKLVENGHQVTLHARNAQRAEDASKAVPGAEGVLVGDLSKLADVKKLAQEANSLGTFDAVIHNAGLFRGPFRKTDFGLPIMPSLTAVNVGAPYVLTALLNRPKRIVYISSGLHRGGDATFNDPTWVERGEARWNEDQAYSDSKLHVSTLASAVARLWPDVKSNSVDPGWVPTKMGGASASGSAEDGVATYVMLAEGADGGHVSGKYFKPGKQEDTPQPFTQDEKRQDQLLSLWGELTGVKFPAA\n>tr|L0HHT0|L0HHT0_METFS 2-oxoacid:ferredoxin oxidoreductase, alpha subunit OS=Methanoregula formicica (strain DSM 22288 / NBRC 105244 / SMSP) OX=593750 GN=Metfor_2322 PE=4 SV=1\nMTRTEFWQGNTACAEGALAAGCNFFGGYPITPSTEVAELMAAKLPKKGGVFIQMEDEIASMASIIGASWTGARAMTATSGPGFSLMMENIGFAAMTETPCVVVNVQRGGPSTGQPTMSAQGDMMQVRFGSHGDYAVIALSPATVQEMFELTAKAFNLADKYRTPVFLMADETVGHMREKILVPDSVEKIGRKPFVPGTPPFKVTDPDLIPGFPTFGTGQHVHVTGLTHDERGYPAATNPPLHAALVKRLVDKIENARDEMADYDIVNPDAEQVFVAYGGPVRTVMQVMHDKKDTNIGFLRIRTVWPFPEKALAKFKNAQRFLVPEMNLGQIAREIQRHVKVPVVPIPKLGGELHTPAELVKVLEGKA\n>tr|A0A0G0BS17|A0A0G0BS17_9BACT Sortase OS=Candidatus Roizmanbacteria bacterium GW2011_GWA2_35_19 OX=1618478 GN=UR68_C0020G0028 PE=4 SV=1\nMIVRTFYNPLVEETKYFVNKAANKQYIVADNFEANKIQPTIQENQSASKGILAKAFNIKPIEILSPEDPDFSIIIPKIGANSKVVPNVDTSDEKIYLDVLNRGVAQAAGTAYPGEGGHIFLFAHSTDYFWNVTTYNAIFYLLYKLEKNDEVDLFYKGQRYVYKVIGSEVVDPSQVQYLTRKTNREFLTLQTCWPLGTTLKRLLIFAVRVSE\n>tr|A0A2S7ULD4|A0A2S7ULD4_9VIBR Probable membrane transporter protein OS=Vibrio jasicida OX=766224 GN=BTO01_24490 PE=3 
SV=1\nMEMIEPTMLLVLALVAFVAGFIDAVAGGGGMLTVPALLSLGLPPHIALGTNKLAASFASSTAAYTYYKKRLFKPQCWGRAFVATLVGATLGTLFVDAISTEWLEKALPLIILAAAMYTVFHKPPQSTHQSPTPEPCPMLNKKQYMQGLSIGFYDGLAGPGTGAFWTVSSMALYRLNILLASGLAKAMNFTSNFTSLVTFAVLGHINWVLGLTMGVCLMAGAFVGAHSAIHFGAKFIRPVFVTVVSVLAIKLAYDAWFVGLT\n>tr|A0A5E7K8T9|A0A5E7K8T9_PSEFL Uncharacterized protein OS=Pseudomonas fluorescens OX=294 GN=PS874_02483 PE=4 SV=1\nMRQPDIEIYLKDADVDYKAIAAWLGAALGPCTDWVQKGQTYKCKAGNVPVTWLPKAVGKWNSLFLESDQTPWEDDIACARAAFVALNVEVRCAPGTWVEEEGEETADRWMRISADGEEEITWKTA\n>tr|A0A0H4KSG7|A0A0H4KSG7_9RHOB Transcriptional regulator OS=Marinovum algicola DG 898 OX=988812 GN=MALG_01290 PE=3 SV=1\nMSGAARELGIAQPALSKQMSQLEHELDAQLFQRHSRGVTLTRAGEKLRQEAAELIRRMEAIRQAIHTEAEDVTGKVVVAVISSLAPTLATELYPRLEQEYPGISLHIVDFPSERAGQALLNEEADLAVMPNAATEFPQLRSRPLFEESFHFLTKATPRAPARTIRLSEAAEHPLVLPFRSHDLRRRIEEAAGSIGVTLNVKYQTGSINVIDAMVERGMVASIVPMTHWLDRIASGQVSARLVTEPGVSRVHSLCHRPVRDLAPAAKVVHDVIMTEVQSLVAAGKLSGKPVRA\n>tr|A0A7W0EWG2|A0A7W0EWG2_9DELT Uracil-DNA glycosylase OS=Desulfobacteraceae bacterium OX=2049433 GN=FP816_06960 PE=4 SV=1\nMETCIHCKYYFITWDSKRPHGCKAMGFKSREVPCVVVRKSSQGLDCLQFKRKDDKSK\n>tr|A0A174QDC4|A0A174QDC4_BACT4 RteC protein OS=Bacteroides thetaiotaomicron OX=818 GN=ERS852557_01330 PE=4 SV=1\nMKELLENILSEIDVEIDEIDLYGYDIVENSLSMVHRLQAVLNDLKTKLQTYSFPAKEDEITFFKTQKPEILGRLLFFYKIYRIETQCPNGSDDVIRSYINRELDNLTYFFNRNLDFYQYYRSHSTLYDEYYFVRGKSDLRLCTDSAQFDKDPNFSTGYDYKVAKIIANEMLRIYLNKRLVKLETNTQVEDNLQKCLKYPFRFTGKKVFLIELGYSLVSSGDINNGNVEIKEMMNFLGTVFQVELGDYYAAYIAMKERKKDRTAYLSRLQDSLVKRMDEDDSK\n>tr|A0A6B0Z2B0|A0A6B0Z2B0_9CHLR LLM class flavin-dependent oxidoreductase OS=Caldilineaceae bacterium SB0664_bin_27 OX=2605260 GN=F4Y42_21435 PE=4 
SV=1\nMKFGAQVNCYLTTWDNIRAVIEAMEAGRWDSLWFADHYMPSSPKREEELLPAYEGYTLIAAAASITERMRLGNLVLGNTYRNPALVAKMAGTVDQISHGRFTLSIGAAWFQREHEAYGFDFPPMKERSDRLEEACALLRALFTADGPVDFEGRYYRLDQAPLSPGGYNNRQIPIMVGGTGERRTLRTLARYGDIMNLDGWAGGPMTQEYYFHKVGVLERHCENVGRDPSEIKRTILMPVKVTDDPAEAEAFIASRSLGEGTAAGPKDYVIERIGQFMDVGVDEIMFAGLLTRDVEQYHYFEEEILSAFD\n>tr|A0A5K1GDA5|A0A5K1GDA5_9MAGN Uncharacterized protein (Fragment) OS=Nymphaea colorata OX=210225 GN=NYM_LOCUS28356 PE=4 SV=1\nIVWAGRGADRKGETERGGVQTKKGKTAVGVREEREQVG\n>tr|A0A3A8NX55|A0A3A8NX55_9DELT Uncharacterized protein OS=Corallococcus llansteffanensis OX=2316731 GN=D7V93_32740 PE=4 SV=1\nMRRSSLQRRLQRGQAMAEYGVITAAFFGFTVLSWPFLIQLLRALNTYFQSIYYIIQSPIP\n>tr|Q8X4F5|Q8X4F5_ECO57 Uncharacterized protein OS=Escherichia coli O157:H7 OX=83334 GN=Z5883 PE=4 SV=1\nMQPDKLGAKKWMS\n>tr|A0A4W6DJV8|A0A4W6DJV8_LATCA Uncharacterized protein OS=Lates calcarifer OX=8187 PE=4 SV=1\nIAAHEGSANVVELLLKHGSDPLISDHQGQTPLSLASRQGHVKVLSVLLEWAKSQKPEIAAQMMEHVDSEGWTALRSAAWGGHSEAVRLLLDAGADVDGCDGEGRTALRAAAWGGHEEIVLTLLNYGAEVNKADSKGRTPLIAAAYMGHHEAVEILLDRNAEVDLADGDGRSALSVAALCVPTAAGVKGYGEVASLLLERGADPGHRDHDGMTPLLLAAYEGHDEVVELLLEAGADVDETAGPDGNVPAAAAVTPLLAAAAMGHMKTVSRLLFWGAAVDAIDCEGRTALCLAAARGSTEVVRALLDRGLDENHKDDLGWTPLHAAACEGHRAVCAALTERGSMARVGEMDIEGRTPLILAAQEGHWSTVRLLLDRRSPIDHRAYDGHSALSATLLERPC\n>tr|A0A2V8IIA6|A0A2V8IIA6_9BACT OmpA-like domain-containing protein OS=Acidobacteria bacterium OX=1978231 GN=DMF84_27170 PE=4 SV=1\nMNAVSEFIVALAVAATACIGATHSVSDADVRPQDAIDLILTAFQNYPLVALSDGAGHGQLETRDFFIGLIRDRRFPQTVRNIVIEFGNARYQSVMDRYVSGEAVTREELRHAWEDTTQVTGVWSLPMYEHMLAEVRAVNRPLPPALRIRVLLGDPPIDWSTVTSPADEDMNDWRDAHFAHVIEREIMNRTANALLFFGGAHLGRKVIFPNSLIHLLDARFPGRTFVLAALDAGRTDSRITKRLQGWTVPAGVSVRGTWLGKMDVQDIGFGFSRGVVEDDVDVVLLLSSAPPRQDEPPALTSSYGRELARRRALHQATLPFRGAKIRFEESRAAFATDADEPLQAVVSELFRDRGVRLLVKAFADPTESNAVALSTLRAELLVDWLAARGVERHRLVPKGCGALRPLTFGKTAADRAMNRRAELVRLTPTAGCEPTTATSPPHSGPPRRSSD\n>tr|A0A140H1J1|A0A140H1J1_9VIRU Nonstructural protein (Fragment) OS=Mamastrovirus 1 OX=1239565 PE=4 
SV=1\nTAKQLRDSGLPARLTEEQLHRIWRGGPKKCDG\n>tr|A0A0C3DQN5|A0A0C3DQN5_9AGAM Uncharacterized protein (Fragment) OS=Scleroderma citrinum Foug A OX=1036808 GN=SCLCIDRAFT_63544 PE=4 SV=1\nAARKTTHKNVLYEVDSEDTVAWLRSPEGQRLFASKFGTEISLAYRPFSVLIEYVPIALELENPNVHRDIERRNNLPTRSIRSARWIKP\n>tr|A0A534C027|A0A534C027_9GAMM Homoserine kinase OS=Gammaproteobacteria bacterium OX=1913989 GN=thrB PE=3 SV=1\nMSAAPPRTRASAFAPASVGNVAIGFDILGFAVEALGDRVTVTSTAAPGVTISAVRGIADELPQRAEDNTAGRALLAMQEALQPKFGFTLEIDKGIPLGSGLGGSAASAVAAVVAANALLAEPCGQLELLRFAMAGEAVASGGRHVDNIAASLYGGLVLTVGIDHPRVKRIPVPASVRAVIVHPHMYLATANARAILRRSVELSDFVWQTAHLAGFISGCYTDDLDMIRASLEDVVIEPQRQALIPGFADVRRGAMAAGALGCSISGAGPSMFAWALEATAPKVLAAMREAFARHSLATDEWVVELRSNGARVIG\n>tr|A0A1N6JS24|A0A1N6JS24_9RHOB Ribosomal RNA small subunit methyltransferase E OS=Rhodovulum sp. ES.010 OX=1882821 GN=SAMN05444722_2370 PE=3 SV=1\nMTPMSDSRSAKIRLYVEQPLGEGQTVPLSRDQAHYLFSVMRLAAGDRVLVFDGRSGEWLARVAEAGKKGGTLVCEAQTRPLQPPPDLWLFFAPIKKARTDFIVEKAAEMGAARICPVQTDFTNAERIRRDRLQAHAVEAAEQCGGTFVPEVCEMRKLSEVLEGWPHGRRLMFCDEMLAGAGRALGDAAPGPWAILIGPEGGFSEAERDRLRALPFAHPVSLGPRVLRADTAAVAALTVWQQALGDWA\n>tr|A0A6G5A2B5|A0A6G5A2B5_RHIMP Putative secreted protein OS=Rhipicephalus microplus OX=6941 PE=4 SV=1\nMNFEKFAILLMFRHLSVCVALHIKIYTLDHFKGCRNDIYFCKFNTNLCFTREYIIYIELPPRLSTADRKRTSLHRGFLGSLLNAPKPAC\n>tr|Q3ZH33|Q3ZH33_9NEOB Rhodopsin (Fragment) OS=Exerodonta chimalapa OX=318317 PE=4 SV=1\nNFYVPMSNKTGVVRSPFEYPQYYLAEPWKYSVLAAYMFLLILLGFPINFMTLYVTLQHKKLRTPLNYILLNLAFSNHFMVLCGFTVTMYSSMHGYFVFGQTGCYI\n>tr|A0A5F2E027|A0A5F2E027_9LEPT DUF962 domain-containing protein OS=Leptospira licerasiae OX=447106 GN=EHR05_01230 PE=4 SV=1\nMTENKKYETLQEFWPFYLREHSNKMNRVFHFIGTTCALVFIVSAIFYLNAWYLLGALFSGYLFAWIGHFFLEKNRPATFIYPFKSFVSDWRMYFYTITGQLGKELEKAGVK\n>tr|A0A1H1IN95|A0A1H1IN95_9EURY DNA-binding protein SAMN04489842_3657 OS=Natronobacterium texcoconense OX=1095778 GN=SAMN04489842_3657 PE=3 
SV=1\nMSERPDEEKLEELRQKKMEQLQERADGQDAEAQEAAQQQAEAQKKAVLRQHLTDDARKRLNTVKMSKPQFGEQVERQVISLARSGRIQGKIDDDKMKQLLKELKPDSKSFDIQRR\n>tr|A0A7M3A1Y5|A0A7M3A1Y5_PSEAI Cold shock-like protein CspD OS=Pseudomonas aeruginosa OX=287 GN=cspD PE=4 SV=1\nMLSGKVKWFNNAKGYGFILAEGRDEDLFAHYSAIQMDGYKTLKAGQPVNFEIIQGPKGLHAINISPATATTAAPSAPAPQEEPQATPVEA\n>tr|A0A2Z6N5H4|A0A2Z6N5H4_TRISU Uncharacterized protein OS=Trifolium subterraneum OX=3900 GN=TSUD_214070 PE=4 SV=1\nMKKLVIQVKRMNLTGFYITLFSNTYSHINRVLFYRERILSRESPSTVVHKIPESFQSATDYKNSFIPLLFEETRADLFSSLYGVSQAPFCEIANVSESRRLTTPFPEVQNQFIQFHHVLWLKSETTGNYKPVSGDLIALTHIRPKGLSELNTLESPYRIAYVKEARKEWKELPDRISVLTSKCMKMDIENDLGNNKELSSKCMKMEIRYDLWNNKELKLYAVHLMNMTTNVRIWDALNTISRVKIMKTMLGPSQIVAIRLHRLVMDSLEHDMYGLGDIVLFGHNKRMKLGSHTGLDNVFLDNRVEKLMQCFNPNTGWKTNLQYMIELLESMKESANNTESMKAFKEEFGKQREKLTFLMQILYTHISTSLISPEMVKEMLQALDLLRRLGISLSQAKFKIPANFQLLQISVILDEVCLKGL\n>tr|A0A832LQC9|A0A832LQC9_9BACT S1 RNA-binding domain-containing protein OS=Phycisphaerae bacterium OX=2026778 GN=ENS20_04560 PE=4 SV=1\nMIPTSYSQEAWPMSESSNDPLKEKFRPEEDPQVKKEVDAALAGVDVEQLLGGDQAAAARAVADGSSRERRGKVVGIGADDVIIDLGEKAQGIAPLSQFDQVRIGEEMDFILDRFDEAEGLWILTRKGAVSQNVTWETLEPGQIVECEATAMNKGGLEVKVKTLRGFLPSGQVDVVYLKDISIFLGQRFKVQVMQVDREKKNLIVSRKKIVEREREELRAKLLAELAEGQVRRGVIRSVTDYGAFVDLGGADGLIHVSEMSHRRIRHPSEVVKIDDIVEVKVLKIDPETRKISLSLKAVGADPWADAAARYAPGTEVTARVAKIESFGAFLSVEDGIDGLLPVSEISWQRIRHPADVLKEGETIKVVSIAVEPQQRKLTFSLRQAVPDPWGVVADKYPRGTVTTGKVTKVLDFGAFVELENGVEGLVHISELAARHVKNPAEAVQAGQQVKVRVLEVDREKRRISLSIRRSEEPKPPEPPSPEELKRREEEAKRLARKKEQRSKLRGGLDF\n>tr|A0A1J0GQZ4|A0A1J0GQZ4_9CAUD Uncharacterized protein OS=Mycobacterium phage Albee OX=1913041 GN=SEA_ALBEE_18 PE=4 SV=1\nMSASDRQPPGPYPEGFTEAVRPEDVDVSKCDHEFGVCFCVHDWRIHWGNLDRSGL\n>tr|A0A3B9GZ83|A0A3B9GZ83_9PROT Aminodeoxychorismate/anthranilate synthase component II OS=Hyphomonas adhaerens OX=81029 GN=DCG58_11365 PE=4 
SV=1\nMILVLNNRDSFVFNLARCLTLAGADVEVEDSGRITINDIIRRRPEAIVISPGPSRPEQAGVSIAAVQTFGADLPILGVCLGHQVIAAAYGGSVRRSLTPSHGRTANIMHQGRHLFRGLPSPLPVGLYHSLTVDLEPNETGLQVDATAPDGEIMALSHVEHPVFGVQFHPESILTEQGQGLLGNFLRQYRSVPCL\n>tr|A0A349TMC4|A0A349TMC4_9GAMM UvrABC system protein B OS=Gammaproteobacteria bacterium OX=1913989 GN=uvrB PE=3 SV=1\nMSKPFQLESSFKPAGDQPAAIASLVEGLEDGLHAQTLLGVTGSGKTFTIANVIEQVQRPTLVMAPNKTLAAQLYGEFKEFFPHNAVEYFVSYYDYYQPEAYVPASDVYIEKDASINDHIEQMRLSATKALLERQDVIVVATVSAIYGLGDPNSYLQMVVHLDRGDRMDQRKLLRRLTDLQYTRNDMELRRATYRVRGDVIDIYPAESERHAIRIELFDDEVEKLSYFDPLTGALIKEVPRLTVFPKSHYVTPREKLLATLDDIKIELHERLKQLTSNNRLVEAQRLEQRTKFDLEMIQELGYCNGIENYSRYLSGRESGEPPPTLYDYLPDDALVVSDESHVSIPQLGAMYKGDRSRKETLVEYGFRLPSALDNRPLRFEEWESLTPQIIFVSATPGPYEEEHEGQQVRQVVRPTGLIDPELEVRPASTQVDDLLSEVNRVVALKERVLVTVLTKRMAEDLTDYLAEHDVRVRYLHSDIDTVERSEILRDLRLGNFDVLVGINLLREGLDIPEVSLVAILDADKEGFLRSERSLIQTMGRAARNLNGKAILYADTVTGSMQRAMDESNRRRETQLAYNEAHNITPIGVQKRVLDIMEGAYSAPGSRTRQRTRSVAEPQGDYGTLNFNDPYEIRKEITKLEAAMYEQAKNLAFEEAAATRDSIADLKQQLLRQ\n>tr|A0A0Q7TC29|A0A0Q7TC29_9HYPH Protein-export protein SecB OS=Pseudolabrys sp. Root1462 OX=1736466 GN=secB PE=3 SV=1\nMTTTNGGQSQDFNPEQVPQLNVVAQYIKDFSFENPNAPKSLIGGEQPQISIQINVNAAPMSDSDIEVVLQLSGKAETGGSLMFSFDLAFGGVFRIRNVPQESMNAVVLIECPRLLFPFAREIIATTVRNGGFPPLLLDPVDFVALYRQKMAQLGGQAPAQ\n>tr|A0A1H8PJE2|A0A1H8PJE2_9PSED Ca-activated chloride channel family protein OS=Pseudomonas sp. 
NFACC39-1 OX=1566195 GN=SAMN03159293_02848 PE=4 SV=1\nMFEFAWPWIFALLPLPWLMRLVLPAADSGEPALRVSFLGDLEGLVGRRARSNLPTWRQQAPFILLWLLLLIAAARPQWLGEPLPIAASGRDLLVAVDVSGSMDFPDMRWQDEDISRLALVQHLLGDFLESREGDRVGLILFGSQAYLQAPLTFDRRTVRLWLDEARIGIAGKNTAIGDAIGLALKRLRQRPANSRVLILVTDGANNGGEIDPLTAARLAAEEGVKIYPIGIGADPEESGTAGFVGVNPSLDLDEATLREIAQATGGQYFRAQDGQQLLAIKTTLDQLEPVTQQPTQARPAQALYQWPLAVALLLSVLLVARERWPDNPLQRLFTQPLFQPAEHSEWRRRLKRMRLGKRR\n>tr|A0A1C3Z1D9|A0A1C3Z1D9_9LACO Citrate lyase alpha chain OS=Lactobacillus apis OX=303541 GN=GA0061073_0264 PE=4 SV=1\nMENKVKRNLPDELMSDMKLKPFESVEVGNPEIKRIAPKVHVTTGENKVVDSLEEVIKKTLKDGMTISFHHHFRNGDFAFNKVMDLIIKLGYQNLTLAPSSLTSVMNDKVIEAIQKGVITNITSSGMRGTLGDFVSHGGLKNPVVFRSHGNRARSIEEGEIKVDVAFLGVPNSDPAGNANGQEGDAVFGSLGYALIDAQYADNVVLLTDNIIDYPNTPASIKQTQVDYVVKVDQIGDADKIGSGATRFTKDPKELKIAEMVNQVIVNSPYYKEGFSFQTGSGGAALAVTRYLRQSMINDGITASFALGGITKPTTDLLDEGLVKKIMDVQDFDKGAAASMAKNRNQQEIDASWYADPHNKGAVVNNLDVAILSALQIDTDFNVNVMTGSDGVIRGAIGGHQDAANAKMTIITAPLVRGRNATVVPSVETVVTPGDSIDVLVTERGIAINPKRKDLIEAFSKVPDLNIVDITELQQMAEKQVGVPKPLEYTDRTVALIQYRDGTIIDTIKQVKD\n>tr|A0A3S0XSH9|A0A3S0XSH9_9GAMM 10 kDa chaperonin OS=Legionella sp. 
km772 OX=2498111 GN=groS PE=3 SV=1\nMKIRPLHDRVVVRRMEEERTTAGGIVIPDSATEKPMRGEVIAVGAGKVLDNGDLRALAVKVGDVVMFGKYSGTEVKVEGKELVVMREDDIMGVIEK\n>tr|A0A5S9Q0P4|A0A5S9Q0P4_9GAMM ATP synthase subunit delta OS=Zhongshania aliphaticivorans OX=1470434 GN=atpH PE=3 SV=1\nMAELSTTARPYAKAAFEHALAASTLGEWSAMLVTAAAVSQQPEVMKFLSSPAMTTAQQAQMFIDVCADTFNAGGENFIKILAENKRLGLLPTISELFDAQKAIQERTVDVELTTAFALDSESEKRLAEVLGKKLAREVHVHTTIDPLLLGGVIVKAGDLVIDGSVRGRLAKLAEAINS\n>tr|A0A1H7GQD5|A0A1H7GQD5_RUMAL Uncharacterized protein OS=Ruminococcus albus OX=1264 GN=SAMN05216469_102219 PE=4 SV=1\nMKKFTMTNLYSYNELYLSLYLESEETLFVVHTERSECAGTPVTSISG\n>tr|A0A699MW03|A0A699MW03_TANCI Reverse transcriptase Ty1/copia-type domain-containing protein (Fragment) OS=Tanacetum cinerariifolium OX=118510 GN=Tci_766510 PE=4 SV=1\nMQEELHEFERLEVWELVPRPDKEEGIDFEELFALVSRLEAIRIFLAYAAHKNMVVYQMDVKTAFLNGNLWEDVYVSQPNGFVDPDNANHVYKLKKALYGLKQAPHAWYDMLSLFLLSXELVPRPDQVMVITLKWIYKVKLDEERQRLTSGLQISQNPRSIFINQSKYALESLKKYGFESCDPVDTPMVEKSKLDEDKEGKVVDPSHYRGMIGTLLYLTASRPDLQFAIC\n>tr|A0A1C4LAA2|A0A1C4LAA2_9ACTN Uncharacterized protein OS=Streptomyces sp. BvitLS-983 OX=1838282 GN=GA0115250_119211 PE=4 SV=1\nMTLFLGLGIAGIVLLVLSLIFDGVLEGFFGDFLDGLLSLPAIAGFVSMLGFGGAIVLGTTGLGVAGATVVGVLAGVVTGWVVLKLSKALMRDQTDATPRSADLVGTAGSVVTAIPASGYGEVLVYLGGQPLKLSAKSTAPLTRGTEIWVEASLSSTSVSVRPVER\n>tr|T2KLF8|T2KLF8_FORAG Uncharacterized protein OS=Formosa agariphila (strain DSM 15362 / KCTC 12365 / LMG 23005 / KMM 3901) OX=1347342 GN=BN863_18780 PE=4 SV=1\nMFKVKLAFMIKVLINNTATKNIHDKKNYIYLTKHQLYGVLPRFC\n>tr|E3RGL9|E3RGL9_PYRTT Uncharacterized protein (Fragment) OS=Pyrenophora teres f. 
teres (strain 0-1) OX=861557 GN=PTT_06956 PE=4 SV=1\nMLKDVIANNPDKTLTQCLDIVIDKLQLLHQAMTQQNGPSERALANQLISACQGVEACSAVLIRPASTFEA\n>tr|A0A7J6B8G4|A0A7J6B8G4_AMEME Sodium/hydrogen exchanger OS=Ameiurus melas OX=219545 GN=AMELA_G00035750 PE=3 SV=1\nMGSERKHHAAKGAWGTLRLCVLASLSVCLCLCRAEDSSMENIVTEKKAEESHRQDSVDLLVFILLLTLTILTIWLFKHRRFRFLHETGLAMIYGLLVGVVLRYGIHVPRDINNVTLSCHINASPATLLVNVSGRFYEYTLKGKISSNDVKDVQDNEMLRKVTFDPEVFFNILLPPIIFHAGYSLKRRHFFRNMGSILAYAFVGTVVSCFIIGLLMYGCVMLMKYTGQLGGDFFFTDCLFFGAIVSATDPVTVLAIFNELQVDVNLYALLFGESVLNDAVAVVLSSSIIAYQPEGNNSHTFEAMAMLNSLGIFLGVFSGSFALGVATGVMTALVTKFTKLRDFQLLETALFFLMSWSTFLLAEACGFTGVVAVLFCGITQAHYTYNNLSPESQVRTKQLFELLNFLAENFIFSYMGLALFTFQNHVFNPVFIVGAFLAIFLGRAANIYPLSFLLNLGRRNKISYNFQHMMMFAGLRGAMTFALSIRDTATYARQMMFSTTLLVVFFTVWICGGGTTQMLSFQHIRVGVDPDQDNSIGPEGLERRSTKQESAWLFRIWYNFDHNYLKPILTHSGPPLTATLPACCSPLARCLTSPQACENEGQLKDDDSDLILNDGDISLTYGDITVNTDATGTRTISIPAGAAGVHSDDALDRELTFGDHELVIRGTRLVLPMDDSEPPLRHREI\n>tr|A0A1I5AAM2|A0A1I5AAM2_9MICO VOC domain-containing protein OS=Mycetocola miduiensis OX=995034 GN=SAMN05216219_1297 PE=4 SV=1\nMFTPVHAFSGFSVDDIDAARSFYSEKLGLTVADDDMGILRITLPGGAEVIAYPKPDHTPATFTILNFVVSDVDAAVDELNGRGVTTKIYEDENLPTDEKGVMRDNGPTIAWFRDPAGNVLSVISQ\n>tr|V4K2D3|V4K2D3_9CREN Uncharacterized protein OS=uncultured Acidilobus sp. 
MG OX=1410573 GN=MGAcid_05220 PE=4 SV=1\nMLSHTVELMKSSQGERPDGLPGRGYLLTCTPAPR\n>tr|A0A1D6F6L1|A0A1D6F6L1_MAIZE Uncharacterized protein OS=Zea mays OX=4577 GN=ZEAMMB73_Zm00001d007456 PE=4 SV=1\nMLEPVDIGRDGKTVSCRIHDMVLDLISFLSNEEHFLTKVGEQQPISLDLPKKIHRLSLQISQEEEVKQLATMSFSHVRSLTVSTKVFQLMPKLSAFLVLRVLNLKKCKGVRNHHFKDICNMFHLRYLSLNAEFITEMPREIQNLQFLQVLDISNLGHKVKMPTIIHLRQLLRLCFRPMWGIRLPDGFGKLTSLQEVKGIITIKLPSMLHNLGCLTNLRTLAIDFCDWDESYEEPFIQCLSNLVSLKSMEIKGTMVSSLCSECDKLYPGPQHLCSIDIESTAVPRWMSSLCFLSSINIELLALGAQDFHVLGSIPSLRCLSIHVKETRDERLVIGKCYPFRCLTEMQIDYESMAVVFAPGSMQNLKELHLVFGVKEVMHKYGDCNFGLEHLMSLEHVSVKTMYSIMPEEVEAVKDEFQKSLDMNPGKPTLIVDYKYPIKRKIRSHAQAIRAAILFANAGRIPATEGL\n>tr|A0A6A9K9T2|A0A6A9K9T2_PSEAI Exodeoxyribonuclease III OS=Pseudomonas aeruginosa OX=287 GN=xth PE=3 SV=1\nMDTLKIATFNVNGIQTRLAALLAWLEREAPDIVCLQELKTPDARFPAAALERAGYGAIWQGQSAWNGVAILARDSQPLEVRRGLPGNASDPHSRYLEAAVDGLLVASLYLPNGNPQPGPKFDYKLAWFEHLIRHAAELMESGHPVVLAGDFNVVPSDFDIYDTRSWKKDALLQPESRECFERLLRQGWVDALRQRFPDRRLYTFWDYFRQHWQRDAGLRIDHLLLSASLADHLEDAGVDRWVRGEEHASDHAPAWVSLRLS\n>tr|A0A024VDL3|A0A024VDL3_PLAFA Uncharacterized protein OS=Plasmodium falciparum Vietnam Oak-Knoll (FVO) OX=1036723 GN=PFFVO_00427 PE=4 SV=1\nMAFMFKREGCYSKNRLNEVFRKNKSFVNQLMYDLTSFHYENYMKNKIHKNIMNNYNNIEKIQSMLNLINGEKENAYKIKTGYFYFRSGVPVITPHIEQTNEFAESNNYTYNFKNIKKKYLKEVYDSYKHKIGGTDPSVPHFYKHK\n>tr|A0A1Z9W0I5|A0A1Z9W0I5_9GAMM Cysteine--tRNA ligase OS=Oceanospirillales bacterium TMED91 OX=1986769 GN=cysS PE=3 SV=1\nMSLQIFDTLAREKRVFQPLEAEKIGMYVCGMTVYDHCHLGHGRVMVAFDAIVRYLRFRGFEVNYVRNITDVDDKIFXRAAERQIPFSALTAEMIDAMHADEAKLGCQLPNHEPRATANIDSMLRLXERLLERGAAYQGDSGDVYFRVGAFPEYGKLNNRNLDDMVAGARVAVAKDKEHPADFVLWKSAKAGEESWSSRFGPGRPGWHIECSAMSMDALGETFDIHGGGPDLKFPHHENEIAQSESATGCQFAQYWMHAGAVRVKDEKMSKSLGNFVTLAELFREFHPQVIRFFLLQSHYRSAISFSDDALVQAGAAYTRLVQALPDQLTSPSSDAIFQFQQFMDDDFNTPRAIALLFDLAAEGSEESGSSLLAIGKVLGLFATDKVTFLAEQQQLKAANSGLSDAAINALIAARKQARKDRDFFTADKIRDDLVAQGVVLEDAAGGTSWHRK\n>tr|A0A4U5PX20|A0A4U5PX20_POPAL Eugenol O-methyltransferase family protein OS=Populus alba OX=43335 
GN=D5086_0000167450 PE=3 SV=1\nMASSIENHVSQVDEAKDENFGYAMQLALSSVLPMTLHTAIQLGIFEIITKAGPDVKLSAADIAAKLPTDNPDTPKMLDRILRLLASHQVLCCFVDGSERFYSLAPVSKYFVRNQNGVSLAPFMAMIQENVILQGWSQLKDAVLEGGVAFVRVHGVQAFEYPGLDPRFNQVFNTAMYNQTTIVNGHMLEKYDGFKNLKQLVDIGGGLGHTLKAVTSKYPQIKGINFDLPHVIEHAPAYPGVEHVGGDMFESVPKGDAIFLKWILHNWSDDHCLKLLKNCYKAIPEDGKVIVMESVLPITAKTSPAAKAISQLDVMMMMSQNPGGKERTEDEFMALATAAGFRGIKFETFVCHFWVMEFFK\n>tr|A0A2T6GMZ3|A0A2T6GMZ3_9PSED Isocitrate lyase/phosphoenolpyruvate mutase family protein OS=Pseudomonas protegens OX=380021 GN=C5U62_08510 PE=4 SV=1\nMDAQSLRANVFKALHERAGAFVIPNPWDAGSARMLVGLGFEALATTSAGNAFSLGRPDAEGAVSLEDTLNNVREIVGASSLPVAADLENGFSDSPEGCAQALLLAAASGVVGGSIEDASGRADEPIYDFNLAVERIEACVVAARSLPFPFTLTARAENLLHGRDDLPDTIRRLQAFAEAGADVLYAPGLRSAEEILQVVRAVAPRPVNVLMSGGLNLSVAQLAELGVKRISVGSALARAAYGAFYRAAEDIRDHGRFDFAERAMPFRQINQLFKQP\n>tr|A0A7R9P3G8|A0A7R9P3G8_TIMCA (California timema) hypothetical protein OS=Timema californicum OX=61474 GN=TCMB3V08_LOCUS1220 PE=4 SV=1\nMAGSEPASAWKESGKLFRENYLSSPDRDLNLDLFIAGSLAQHETSPLDNYATEATPEEIETSLDAALKAGYRHIDTAFAYKNEDAIGRVLKRWFDSGKIQRKDLFIVTKLPGTGNHAESVEKYIKLSLSALQMDYVDLYLIHSAVGKKDSDRGPAGSDHQAELDMNTDHVSVWKAMEAQVDAGRAKAIGLSNFNARQIKRIWSSARIKPANLQVELNVYFQQRELTAFCKALDITVCAYAPLGNPDFAKRISGKSDLKFSSPMEDPVVVKIAKKHNKTPAQVLLRWIIQRGIVVIPKSKTPSRIKANFEVFPSRVCIQRALLGVPREMEQL\n>tr|A0A7K2SMN5|A0A7K2SMN5_9ACTN Gfo/Idh/MocA family oxidoreductase OS=Streptomyces sp. 
SID8350 OX=2690337 GN=GTY74_01910 PE=4 SV=1\nMARSQEQGTEAQTGTPAPPSGQALGTLGVGMVGYAFMGAAHSQGWRTAGHVFDLPVRPALAAICGRDRAKVDAAAARHGWAAAETDWRALIARDDVQLVDICTPGDSHAEIAIAALEAGKHVLCEKPLANTVAEAEAMVRAAEAARARGQVAIVGFNYRKVPAITYARQLIADGRLGTLRHVRASYLQDWLVDPASPLTWRLKREHAGSGALGDLGAHIVDLAQYLAGELLTGVSAVAETFVRERPLLAGAPAGLSGRADTAELGEVTVDDAALFNGRLASGALASFEATRMAAGRKNALRLEINGELGSLAFDLERLNELSFHDHTEPAATSGFRRILVTEPEHPYLEAWWPPGHGLGYEHTFVHQARDVIRTIVEGTEPRPSFADGLQVQRVLAAVEESAAKNSVHTAVPS\n>tr|A0A6M1RBC6|A0A6M1RBC6_9GAMM Uncharacterized protein OS=Grimontia sedimenti OX=2711294 GN=G5S52_07050 PE=4 SV=1\nMQADQMRKGMIISKTCAVIAKGKSPQTTQPGYSLQSMRHGEPVNEDAIRAKAKQLGLDQQEQDLFVVIKRNLVHSKKVKDGQIAAFAKHVVQYCDSEADIYNALKGIEQQMAVMDHFIRYIHV\n>tr|A0A533RQR5|A0A533RQR5_9ACTN Uncharacterized protein (Fragment) OS=Actinobacteria bacterium OX=1883427 GN=FDZ75_06060 PE=4 SV=1\nMLEMRIGTIKTPWFLALAVVVALVAIASFALVAVAEPPMAEQSSNDVAHHWTARSAGVAPYTELAPAEAAAIDTAKKALTQPPLGVIRNADHGYGAAQGALDTMKAVSTAAPIVAGHELVLSNGTKAVRVYVNQDGSVKPLGSGTLWVSATPNKALSDHNDFDAAEIARGALALHAALDPGTA\n>tr|A0A2A8FPC4|A0A2A8FPC4_9BACI PucR family transcriptional regulator OS=Bacillus sp. 
AFS026049 OX=2033493 GN=CN563_06555 PE=3 SV=1\nMNTSITIEEILTRKHFNLTDIIAGSSGIKRQVKWVHCMEVTQISHLLNGNELILTTGLGWKDCDDTFLSYLRQLIECDAAGLCIEMGANTMAVPQCAIDLANERQFPIILFHEEVPFVEITQDIHSLIINKQYQMISNLENYSQQLNKNLLEIDHYEPILKFLHSYLHVQVILIFNENDIASIPKIKKKSTYQMVADIYEEKRKLDKTVLGQPIQVLGENYAELLICSNGRELTDFDSLILDRTATALAQHLLRELYIEEKKMSEESIWLTNWIEGEYSDEAIRERLSYIDPKMQLDGGIVCICKQHPKYNKNSAKLDGTYFKIMFRTVFEQYGFQIFSMEIQQHLVFILGDNRSSEDWKSRVTSALDRIMKMDVSGRNRMGLLSIGFGKHVQRLSEIYKSYETARETLLLQDTLPEDDRSFFYQDLHMHRMISLINKHGNLEETVYEYLGPVIEYDKQNNGELMPTLKTYLACNGSKQETSKQLFIVRQTLYHRLEKLEKLLGSDFMRSDKRLGLEFMIFALDFLQYSSRKISGKYVDKYIGR\n>tr|A0A6N6RG02|A0A6N6RG02_9HYPH sn-glycerol-3-phosphate ABC transporter ATP-binding protein UgpC OS=Brucella intermedia OX=94625 GN=ugpC PE=3 SV=1\nMASIDIQSVRKSYGEHAVLHGVDLEIKDGEFIVLVGPSGCGKSTLLRMIAGLEDITSGQVQISGKRVNELAPKDRDIAMVFQSYALYPHMSVADNMSYSMRLRKTPKEKIASAIQSTAAKLGLEPLLERRPKALSGGQRQRVAMGRAIVRQPKAFLFDEPLSNLDARLREQMRAEIKKLHGELKATSIYVTHDQIEAMTLADRIVAMHGGVVQQVGSPLELYDRPANLFVAGFIGSPAMNFLDVTYLEQDGGPRLKLKDGTLIALPQPLNLKDGAKATLGIRPEHVHIEKSAGLPADVDLVEPTGFGIILHLSLHGLPFKIFTLDRDALHMQGSIQVSFPAQHLHLFDGDGNRVEPRAVQ\n>tr|A0A522BP99|A0A522BP99_9BACT Transketolase family protein OS=Patescibacteria group bacterium OX=2052139 GN=EPN90_03525 PE=4 SV=1\nMELKPTRDGYGLGLVDAGKKDAKVVVLCADLSESTRSHWFKKEFPARFVQIGVSEQSMAAIASGLALAGKVPFISSYAGFSPGRNWEQIRTTITLNDANVKVAGAHAGVSVGPDGATHQMTEDLALMRTLPNMVVLAPCDMQETKKATVAVAGVYGPHYLRFGREKSPVFTTPATPFKIGRAEIFRFGRDVTIVACGILVHEALKAAEELRKKGIEAEVIDSHTIKPLDAKTILASIAKTGCVVTVEEHQVDGGLGAAVAEALGAARPVPLERIGVQNRYGESGEPIMLLEAFGLTSPYIAMAARRATARKAGKKVSEVPDYMAAAERRAVELKKQVISEALSRAPREWGGKKGNIKDLIKKSK\n>tr|A0A852SI39|A0A852SI39_9MICO Putative membrane protein YkoI OS=Herbiconiux flava OX=881268 GN=BJ984_000542 PE=4 SV=1\nMQKKTKIIGGATLAAVLVLGGTGIAYAATDGFEGSDALTGGDLDRAATVASEEIGGGSVTSAERDDDGYELELKGDDGRYYEVELDGSFGVVSSSADDRVGDTGSSGSGSGSGSGESGESGESGTGEAGGPADGGDDEGDGAGAGSASVDPDDLQGEELEKASAAAIAEAGGGSVTDAETSDDADHAYDVEVRLDDGTEVDIDLDASFGVVRTEK\n>tr|A0A0E0XWR4|A0A0E0XWR4_ECO1C Lipid A 1-diphosphate 
synthase OS=Escherichia coli O104:H4 (strain 2011C-3493) OX=1133852 GN=lpxT PE=3 SV=1\nMIKNLPQIVLLNIVGLALFLSWYIPVNHGFWLPIDADIFYFFNQKLVESKAFLWLVALTNNRAFDGCSLLAMGMLMLSFWLKENAPGRRRIVIIGLVMLLTAVVLNQLGQALIPVKRASPTLTFTDINRVSELLSVPTKDASRDSFPGDHGMMLLIFSAFMWRYFGKVAGLIALIIFVVFAFPRVMIGAHWFTDIIVGSMTVILIGLPWVLLTPLSDRLITFFDKSLPGKNKHFQNK\n>tr|A0A2V7LM58|A0A2V7LM58_9BACT Non-specific serine/threonine protein kinase OS=Gemmatimonadetes bacterium OX=2026742 GN=DMD60_00570 PE=4 SV=1\nMTEGDPRPCARNHRRSVRMLLRPRDRTAQLARNLVYTPRGTEGPVTVDLLLPDLQRALAGRYVLERRLGRGGMGVVYLARELRLDRRVAIKLLPPERATQPTARERFLREARTAAQLSHPGIVPIFAVHEVSDFVYFAMAYVDGDTLGRRVRRRGPVPYATAARLLEEVARALAYAHDRGIVHRDVKPDNILLDQTTGRALVSDFGIARVGSATTTGPQRVVGTAEFMSPEQVLGERVDPRSDLYSLGVVGFFALSGELPFLGPDDMTVLARQVSDPAPPLASVAPHVPHRLAEAIDRCLAKDPAERFPNGEALAAELAAALDRRAAVAVRAFVTEARQLSTTTLFYGAFAAVALPLLVLRLLEPDDPPTRAALVGSVATVVAVPLVVMVLRVRRLSKAGYGQADLVDALSAELGHRREELAFLYGEGPSPLERALRRLCYVCVAAAGAIVAALERVPALAGALGVPTLFGVVTAAALVAAVAARARTEHRTNPKGERRLRFWSGPLGRWLFTLAGLRVKRRATPAPGVLSPVVTPVPEARDA\n>tr|A0A1I3RF39|A0A1I3RF39_9DELT Glyceraldehyde-3-phosphate dehydrogenase OS=Desulfomicrobium apsheronum OX=52560 GN=SAMN04488082_103115 PE=3 SV=1\nMEKTRIGINGFGRIGRQVLKTIWQRHRDTLEVVAINDLFDTQTNAHLLRHDTSYGHFAAPVEADADTIRVGGEWEIKSFAQRDPKLIPWKSCGVDIVIESTGIFRTGPTAGQHLESGAKKVIITAPSKDEDLTVVIGVNEDKYDPAIHHIVSNASCTTNCLAPAVKVMHAKFGVAKGVLTTVHAYTNDQRILDLPHKDLRRARAAACNMIPTSTGAAKAVAKVIPEMAGRFDGYSVRVPVPAVSLVDFVAVLERDTTAEELKAAFKEASENELKGILGYAEEALVSSDFIADPHSGVVDADFTTVQAGNLAKVLIWYDNEWGYSCRVADLAHLMAQKGL\n>tr|A0A401RBY4|A0A401RBY4_STRA9 TetR family transcriptional regulator OS=Streptomyces albulus OX=68570 GN=SALB_07941 PE=4 SV=1\nMERAERGERILEAAGELLVAWGYRRVTIDEIARRAAVGKGTVYLHWKTKDALLLAVVLRAKSRSLHAQLARMRADPREILPSRMMRGYYLDFLAEPVLRALYTDDVDVLGRLNDVAKKELAELMAFNDGILLRYLAVLREHGLVRTDIDVRHQQYVLMSTATGFFMAEAMLADHAPDTPEVRADLFAATIRSAVDMPVEGFGAQTVGPPGRSGAPRARTVEEALVAARRDVLPLYEQAEEYGAREMRRQLRG\n>tr|A0A1X2LS66|A0A1X2LS66_9MYCO Dehydrogenase OS=Mycobacterium decipiens OX=1430326 GN=B8W66_16385 PE=4 
SV=1\nMCVLRLLDMALERLCAEGLIKGPLRAGFGQEAVSIGAAAALGEGDITITTHRPHAQHVAIGGRLGPMVAAMTGSTAADIWGGDNQVLDAFPRGGLSAGPCVVKQSPSYAIGHAYRQWLADTGGITLCVTEDCDVNSAAFNEAANMAAVWQLPVVILVENIRCALSVRSDRHLREPQAYRRAAAYGMPGVSVDGNDVKAVRDCVTSAVLRARAGGGPTLVQAITYRTIDFSGSDRGGYRDLAGSEQFLDPLMFARRRLIAAGATRDRVAEEERAACQLVADAVAFAKAGSRRDSGARSQPPACV\n>tr|A0A380JP96|A0A380JP96_9STRE Myo-inositol-1(Or 4)-monophosphatase OS=Streptococcus equi subsp. equi OX=148942 GN=suhB PE=4 SV=1\nMEDKYAFAKTIIKEAGLFIKDRMKDSLAIEIKTQHDDLVTNVDQETQDFLISKIKKAYPSDHMIAEEGDICHAITDGKVWVLDPIDGTVNFIVQKANFAIMMAYYENGIGKFGLIYDVMADQLFSGGGDFAVTLNDQVLASYQDKPLDLSLIGCNAGMLSRNEYNLHQLIDQTLGVRVYGGAGICMTKVLKQQLMAYFSYIQPWDYAAAAIMGESLGYVLLTLEGEQPDFQSRQKVMFVPKSKLATIQSLLHINENNQ\n>tr|A0A2E6Z7C9|A0A2E6Z7C9_9GAMM DUF2061 domain-containing protein OS=Rheinheimera sp. OX=1869214 GN=CML21_09570 PE=4 SV=1\nMLKTTTFAIMHFTIAFAVTYAITGDLVLGGLVAVIEPAANTVAYFFHEKIWQRLQQKNTVQKSLTIFKKPALKW\n>tr|A0A1D2SEW3|A0A1D2SEW3_9BURK Ribosomal RNA small subunit methyltransferase E OS=Lautropia sp. SCN 69-89 OX=1660104 GN=ABS56_13610 PE=3 SV=1\nMIRTLDARQSHHLVRVLRLAAGAPVEGFDGKGARFDARIERADPKACAIRLLAPIAACTESPLAITLAQGISAAERMDWTVEKAVELGAHAIQPIVCARTQVRLDAQRLQRRHEHWARIVEAACMQCGRDHLPELGVPLAFERWLAATDRRAARTRIVLDPRGAVRLAALRVDAAQPVDLLVGPEGGFDATELEAARAAGFQAVRLGPRVLRTETAGLAAIAALQAIAGDF\n>tr|A0A1A8F559|A0A1A8F559_9TELE IK cytokine OS=Nothobranchius korthausae OX=1143690 GN=IK PE=3 SV=1\nMPETESYSNPLAPDDHELDDHRGGSQAKLTNDDFRKLLMTPRATPSSAPPTKSRHHEMPRDYNEDEDPAARRRKKKSYYAKLRQQEMERERELAEKYRDRARERRDGVNKDYEETELISTTANYRAVGPTAEADKSAAEKRRQLIQESKFLGGDMEHTHLVKGLDFALLQKVRAEITSKEKEEEDLMDKVQKETKKDLEPEEKIEFKTRLGRNIFRMVFRSGVSERNELFLPGRMAYVVDLDDEFTDTDIPTTLIRSKADCPSMEAQTTLTTNDIVISKLTQILSYLRQGTRHKKLKKKDKGKLDDKRAPEADLSIFDDIGDYIPSATSGTKPVKDKDRHRERERERERERNREDDSKSRRQSYFEKPRADEHQLMDVDAGPGSVRDQINMINEKFGGAAGSQWQGQEPGSQRRDSSKEHLGDFFGGSNSYAECYPATMDDLAVDSDEEVDYSKMDQGNKKGPLGRWDFDTQEEYSDYMNNKEALPKAAFQYGIKMSEGRKTRRFKETNEKAELDRQWKKISAIIEKRKKLEADGVDVKRPKY\n>tr|A0A5C8LAV1|A0A5C8LAV1_9FLAO Uncharacterized protein OS=Mesonia sp. 
HuA40 OX=2602761 GN=FT993_07960 PE=4 SV=1\nMKKIDKKEIITSTAKSIFGAIPFGGAALDELFFEYNGRLKQNRLNRFVKILAENFTEESDINLDNIKTEDFNDLFESVLRKVVQTKSEAKLIRFKDVLLNELKKPTKQAEINELYLNLISELTEQEIEILYNHRFFTEEFEEEVNEMNRHRDNMKSLKNQMDKESIIVDESKFLKPYENVKAQFENKKSKIDKVLKYRNADFYNLNENKFMFFKQRLFSKGLLIDDRMKRIGTLPFQSMGITEFGVEFIDFIKTSEKKITVGNTVYNK\n>tr|A0A1S6WTD4|A0A1S6WTD4_9HYPH 23S rRNA (Guanosine2251-2'-O)-methyltransferase OS=Bartonella sp. WD16.2 OX=1933904 GN=BWD162_004080 PE=4 SV=1\nMKEKVSKNSYFPHPRRQYRNTKSFNRMPSIHLKHRSTSSIQNIVYLYGIHSVKEALKNPKRVFNHLYATPNALQRLNITKSDLPCSLKLYPPKKLDELVGKDAVHQGVVLETETLKPRHLSELTNTNLIIVMDQITDPHNVGAIMRSAVAFKAGAIITTYRHSPQESGVLAKAASGALELIDYITVRNLAEALTEIHQAGFNSLGLDSESELPLETALTGKKIALILGSEGKGLRKKTRETVHSLARLNIPGDIKSLNVSNAAAIALYAAHNYLKH\n>tr|A0A538MZI6|A0A538MZI6_9ACTN Peptidase_S8 domain-containing protein OS=Actinobacteria bacterium OX=1883427 GN=E6F93_02950 PE=4 SV=1\nMAMLRNGGRPGGQSRSSALWGTGNNDDSRSNALWGKGGRGLVTLMAAVLVLGIPLAASAGGDDNTGPETQTYVSPGMLANASKHPDKTIHVIVTANAGDLPKSRILDKTLGSVDRRLGLIDGIALDLRANRLDQLAKIPGLTITPDAPAHPTGSTFSSKQLWVPNTGIDKLWNAPVANSTKTQSDLAVPAIAVVDSGVDTSKAADFGARVVQQVNLTTLPNNSPGDGRGHGTFVAGIAAGQATGYAGASPRSNIVSLDVMDDTGTARTSDVIAAAQWILDNKDKYNIKVANFSLHASNSSSFTHDPLDKAVEKLWFSGVTVVAAAGNYGYANAPSGVKYAPGNDPFVITVGAADMDGNPSPNNDTAPSWSAYGYTNDGFAKPELAADGRYMVGPIPAGSTLASQKASNIVSPGYIMLSGTSFAAPIVAGIAAQIIARNPTWGPDQIKGGLMETARPTPNATPGSLGLGEVNALKAVLLSGAPNPNKALEKFLGPDPSGGNLPAFNAVSWSDTAKANVSWDAVSWGDVSWGDSALAAVSWADISWSDVSWADSLSSADVSWADISWSDSSYEDAAEGDGAGNTTDSFADPADLAAAAADPDLQLPSDLVALQPSATTSLP\n>tr|A0A5E6PHC7|A0A5E6PHC7_PSEFL Alginate_lyase2 domain-containing protein OS=Pseudomonas fluorescens OX=294 GN=PS645_00335 PE=4 SV=1\nMIDLSTWNLTIPVGAPARVIETPRLVDGYSDAYFRAGNTLFFWAPVTGGTTSKSEFARSELRETYKDGELRNWKYPKADHRMTASLSVNQVPSEGRVVIGQIHIYQGKGPLLKVEYVYDKARQTGSVIANYRLKPGSADTKVVIAEDVDLNKRFTYEIRLSSAGYLHVISQGNRWGKQLSKSWQNKQLYFKAGAYALDNTGYKSEGAQVTFNKLEVKHSKG\n>tr|A0A4S2D6C4|A0A4S2D6C4_9MICO Redoxin domain-containing protein OS=Microbacterium laevaniformans OX=36807 GN=E5344_10370 PE=4 
SV=1\nMNHRALIATASVLLVVGLLAGCGSSESLAQQYRNGNEKGYIAGDFQIVEIPDPDRGEPVAFEGVTETGETVTSDDYRGGVLVVNFWYAACGPCIVEAPLLEEVWQDYQDQGVAFLGVNTYDQPATALSFARDNNVTYPSVIDVNDGRVKLAFAQVTPIQATPTTLVIDQDGRVAARIIGQLASASILSTLVADTLAEDSS\n>tr|F2YA48|F2YA48_GLOPA Pectate lyase (Fragment) OS=Globodera pallida OX=36090 GN=pel1 PE=3 SV=1\nMLFVIISIVFAQLCQVHALCTFPASPKTTTVQSTINVASNTDYKYTTFVGGSGILNGGCDVKNGKMKYLMVLKNGVTIKNAIINTPGLGIYCEGNCVLENIYYKKLCYHATGFGYKSTSTSYTYQVIGGAGQGSPDKYFTQSGRGTTIIKNFCAEGKYGKVWCSCGNCIDQMPRSVQISNTKIQGPGLAIISANSNLGDKISISGLTLYGQGSPNTLTKYVCQTYNGLTKMATMQPTAKFRPTQAGTGTCAYSTSAIKIVN\n>tr|A0A2K4FSF4|A0A2K4FSF4_9PSED Uncharacterized protein OS=Pseudomonas sp. MPBD7-1 OX=2075549 GN=C1892_11745 PE=4 SV=1\nMTSKKTATAVSDLTLSPAANGPEVSKPSSPPRPLSTQQYLYFTETNTDRILDNLDGLRDTVFPRPPHLVDDEYDRAQQEFPSVCLIGLGRCGSNIALDVAELVYNARKFYLNEFNAEDKGYSDKGYSPAQWIRNNLRLGTSKASKPVFLVEPLVMLGDLDKDIAGRIRFSRKGEKSGFLRDYSKMKIMDLSEVHAGGAGNAPILGQYLAKIILNKDTQRFSSPDWKMIHSYLIDSCGIKANQSRLYFSIFSAGGGTGSGMASEFGLAQQYSYMNKTFDTKPMDEHDSKSGHSFVFEPIFTSGICVLPNISDHRSEMSEALHINAGRLLCKYLSEEWDFSYNFANEDSSEASVMGRIRPWNAMMLISNDIMRYAEESDDGNIQNIDVNAMEKHANQYISQQIFNILTAQAVTTDYDQNYFRRAGIDIGETIRLDANDLFMSLAGPVAIAYAESVVPETPVPSGDKFKVFEKEPPRLNIDDLFFRSIDLPHFNKVTQAIEGISLLPIESKRYRASLEQYKNSGYDAAALHDLHFFKNCSSVVSIVSLPKDYKLSYMDLNRLKTHLNSLFPNTTLKRYALVIGASANLSLTTLIAKSPCLSDDFLTLIVAFIKRCFARTPYRFDETLDNSILDFIINEDFDEARIDDLLNEFENPAKILDTNWYAIKPMYEKKYRELINDKDKFVSINDIRLSRDCVKKSIKYLREIYRHRIGKTKVISLNNHTGRTY\n>tr|A0A401T372|A0A401T372_CHIPU ENTH domain-containing protein OS=Chiloscyllium punctatum OX=137246 GN=chiPu_0015593 PE=3 
SV=1\nMTSSSLRRQMKNIVNNYSEAEIKVREATSNDPWGPSSSLMAEISDLTYNVVAFSEIMSMIWKRLNDHGKNWRHVYKALMLMDYLIKTGSERVAQQCKENVFAIQTLKDFQYIDRDGRDQGINVREKSKQLIALLKDDERLRVERSHALKTKERMSSVTTAVGSNNQIMFGRGSSHPNLSTSQSDECGKIGGSPASYHGSTSPKISSELEQTRPQTSGEEELQLQLALAMSREEAEQIFKSATTAGSQPRNTVLTLSAQDEQHRRGDDLRLQLALEESRQKLQMPGMAPHKTETALLDLTDSTPSPLTQKSDPWGAPLPSTSTTKPDPWAAVSRPVSNDPWKQMAGSRLAAATSDPWGSSGRRLSGEQQSRSADPWGSAAAAPDRDPWAPTSPQVAPPFHSFSAADAAVTDEFSVFSHLRGSPRKVEGQGTGGRFEVLGDGLTTPATSVVTGCSDVFDMPSMSSTVPSKLPTPKHQPTTQKNPESFLGPNASLVNLDTLITHTTHPNVSTNPFLAQAVPVASANPFHSTPTQMSSSMMAVTQTPFGPVDVTATSFSAMPRVGAAPMVTMPAMQMPQSTGMQGMMGSNYVAMAAPPPTGQSASSTNPFLL\n>tr|A0A318DIN8|A0A318DIN8_9GAMM Extensin-like_C domain-containing protein OS=Dyella sp. AtDHG13 OX=1938897 GN=BDW41_11025 PE=4 SV=1\nMSVVRYLGLLILMVGVFIALLVASGWRPPYRYNPWARLDLRAEPDWLTRFRLYRLQHHNDQCLAALAQAGAEYRAVSDRPLVDGCGWQGTVMLRGTGQATLATPTVVTCPLAASLVMLDAHVLQPRAASTFGSPVAVIEHVGSYSCRNIRGDDGSALSSHARAEAIDITGFRLKNGHDISVMRDWKRSVSGAFLHQIQAQSCGYFGVALGPDYNAAHAGHFHLQAGAMGWCR\n>tr|A0A1R1WU44|A0A1R1WU44_9ACTN Uncharacterized protein OS=Streptomyces sp. 
M1013 OX=549798 GN=BSZ07_05050 PE=4 SV=1\nMETLAQFGDGGPGPWILLFPVIWALVIGGGITLLRRTVWRGRRGPARPGAVEDNSPITVLGHRFASGEIDEDEYWRRLSVLDEQFGRTGKGGAA\n>tr|A0A2S8IRD2|A0A2S8IRD2_BURCE Uncharacterized protein OS=Burkholderia cepacia OX=292 GN=C5615_17140 PE=4 SV=1\nMKKTTLKSVFLTGLLVLVPLAITLWVLGLIIGTMDQTLLLLPESWQPERLLGFHLPGIGAVLTLAFIFIVGLATRNFIGQKLVTWWNAVVRHIPVVGPIYTSVKQVSDTLLSSSGNAFRKALLIEYPRRGSYTIAFLTGTPGGDVLNHLTEEYVSVYIPTTPNPTSGFFLMLPKSEVIELDMSVDAALKYIVSMGVVAPPAPAPAPARRPVEPPL\n>tr|A0A2T4IVX8|A0A2T4IVX8_9HYPH Integrase OS=Mesorhizobium helmanticense OX=1776423 GN=C9427_13580 PE=3 SV=1\nMLVGYARTSTAEQDAGLLAQQRDLREARVEKLFSEQVSSIGHRKELETSLDFLREGDTLVVTKIDRLARSTSHLLAIVDRLEEKKVGLRILDFGGASVDTKSPSGKLMLTMFAAMAQFEREMMLERQREGIAKAKLDGKYKGRKPTARARSGEVIKLHIDGVGPTEIAKRLGMGRASVYRILEAPGE\n>tr|A0A8A6NMP5|A0A8A6NMP5_9ERIC InfA OS=Impatiens loulanensis OX=2822277 GN=infA PE=4 SV=1\nMKEQKWIHEGLITESLPNGMFRVRLDNEDLILGYVSGKIRRSFIRILPGDRVKIEVSHYDSTRGRIIYRLRNKDSRD\n>tr|A0A7C6PFE8|A0A7C6PFE8_9RHOO Uncharacterized protein OS=Rhodocyclaceae bacterium OX=1898103 GN=GXX56_08515 PE=4 SV=1\nMQLPITIELHRSRLQPRILALLLSVALIVVLFYPLPVPLRLIGVTLLALGGGWMVRQLRPQVAALQLLADGSLGIRGTDWNHPEFVPARMLQGATVHPWLTVLRLEAQEGQPYRLLLTPDCLLPEDFRRLRVFLRWRSTVSASDAPV\n>tr|A0A6P3QY80|A0A6P3QY80_PTEVA zinc finger protein 512B isoform X2 OS=Pteropus vampyrus OX=132908 GN=ZNF512B PE=4 
SV=1\nMADPFCVGASRRLPGSSKSGPGKDGNRNEVRLPVRHDPPKLGLPVARGGQSVPSQAPLCFDPGSLASDRTEGKKKGRPKAENQALRDIPLSLMNQWKDEFKAHSRVKCPNSGCWLEFPSIYGLKYHFQRCQGGAISERLTFPCPFCEAAFTSKTQLEKHRIWNHMDRPLPAPKPGPVSRPVTISRPVGVSKPIGVSKPVTIGKPVGVSKPIGISKPVTVSRPVPVTKPVTVSRPVPVTKPVTVSRPVPVSKPVTVSRPMSVTKAVPVTKSVPVTKPVTTNKPVPMTKLVTVTKPVPVTKPVTVSRPIVVSKLVTVSRPIAISRHTPSCKMVLLTKSENKTRAAGRSSGKKRAADGLVACPIPPKQTRPENGEHGPSTLGQSSAFQLGTDPSGGPLSVGNRPSGGKEAPRAPGPVSPTEEGAERTKHRRKQKTPKKFTGEQPSISGTFGLKGLVKAEDKSRSYRARKQDGPSPEDVRKKAPAPASTVSKEVPAPTAHLAPGGPEEQWQRAIHERGEAVCPTCSVVTRKTLVGLKKHMELQDALKCQHCRKQFKSKAGLNYHTMAEHSAKPSDTEASEGSEQEERERLRKVLKQMGRLRCPQEGCGAAFSSLMGYQYHQRRCGKPPCEVDSPSFPCAHCGKTYRSKAGHDYHVRSEHAAPPPEEPEDKPPESEDLLGVERTPSGRIRRTSAQVAVFHLQEIAEDELARDWTKRRMKDDLVPETARLNYTRPGLPTLNPQLLEAWKSEVKEKGHVNCPNDCCGAIYSSVSGLKAHLAGCSKGDHLVGKYGCLLCAKEFSSESGVKYHILKAHAENWFRTSADPPPKHRSQDSLVPQKEEKSLAGGRKRGRKPKERPPEEPAPRTPPRQDDWPPGGRDKGVRGSAGRKVGAGKAPEK\n>tr|A0A081RSK0|A0A081RSK0_PHOTE Chemotaxis protein CheW OS=Photorhabdus temperata subsp. temperata Meg1 OX=1393735 GN=MEG1DRAFT_03734 PE=4 SV=1\nMSAIEAFNKLSGETAGEGYLVFTLGDEEYGIEILKVQEIRGYDQVTRIANTPAFIKGITNLRGVIVPIIDLRIKFAQETVTYNDNTVVIVLNLLNRVVGIVVDGVSDVLSLKAEQICPAPEFAVTLSTEYLTGLGSLDDRMLILVDIEKLLNSEEMALVDSVAKN\n>tr|A0A1V5AGS2|A0A1V5AGS2_9EURY tRNA (Guanine(10)-N2)-dimethyltransferase OS=Methanosaeta sp. 
PtaU1.Bin028 OX=1811687 GN=A4E47_00993 PE=4 SV=1\nMDGRDLKCGLEEAVASELWAFELSGEHATLPRSEALALLKVHSSSFKEVCLLDQCLIVRAPSIDAAALEARLAMSHRVLRVLAISSCSHSDLSFAASSIDIPRQTYRVRARSVGRSALSGYDVEVAVGRELFRRGYRADLSAPCQEIRCIVSQGLVVLGVEVARPDRSGFEGRRPHLKPFFYPGVLMPRMARALVNLTCVRPGERLLDPFSGTAGILVEAGLIGTRCVGLDVQMKIVRGSLANIDGIECSLLAGDARRLPFRDASVQAVVTDPPYGRSAAIRAASRDELLARSFEEMARVLQPGRRAVVVADHPIDDLLASAGFLQREIHSERVHRSLTRRIYISEI\n>tr|A0A4V3XAK0|A0A4V3XAK0_9APHY Uncharacterized protein OS=Phlebia centrifuga OX=98765 GN=EW026_g3689 PE=4 SV=1\nMSDASDILPPSLDLPPHLSAQKYFFVCTLTVAAWDTLVLSPRSWRLFRTKGWPFLKIAYHFLRIFMPVEFTIVGVAFFDTKWSQETCSHFFLFEPICTAILLAVCSAVHVIRINAIYDKDRRVFTPMVALYAIQILITAICCGFYRSTPLLIGQGCIAEPKHSWVGIYWISATMLYTASFGLALSRAIRSLKIKKISYWKLMLRDGLNLYAAVFLVNLVNMLFWFIITPTGPEDPIRTIVTSMSAVLTASMTLRIILSVRGTLEKGGSTGPVLSLQQPGTGTFNVPLGATESKTHDWVDDKASDQMGMSEVKGEGDFPVESGLGTPTSEDAPKGVKITIDTETAF\n>tr|A0A1M8A1H4|A0A1M8A1H4_MALS4 Similar to S.cerevisiae protein RKM2 (Ribosomal protein lysine methyltransferase) OS=Malassezia sympodialis (strain ATCC 42132) OX=1230383 GN=MSYG_0658 PE=4 SV=1\nMEQALAAYVARASGSPTLRVAVSDQVPAGRGLVTTGAVQAGETVLRLPPSVLLNPSQMARGRPVPWAPLRHAEEPCPNARPLSTHQLLACVLAQWRAARVAGPSTELSDRDAFFASMPSAFPTVPLSWALDGDTQLLSALPPRAARLHDKVQARFEADWRRLDALDEATRASIWASVSRPGIPAVRPRKADVLWGWLCVNSRCVYVDLRYVRHEDNFTLAPLLDMANHTFVQGKQCKVRYSAEGMELCAPAQCGLQAGDEVCITYGPHTNATLLTEYGFLLAPRDALRGASAWDGNPHAELAVDDAIAERFRAEGDEGAWKVQRLKEEGYSGDYTMHPEPAPAHVSHRLLMALWLLSMAMENKHTTQRLSLRARAALQAKQGLRCVYSPKEAARQWKQVTYGMPDSRHERPMRDVLCRLCTEMAEQRSALLEQLQGRHDEPASLVRLLLEEERDIAHRVQTSAERGEAW\n>tr|A0A4V6I9D8|A0A4V6I9D8_9BURK Glycoside hydrolase OS=Burkholderiaceae bacterium PBA OX=795666 GN=MW7_007585 PE=4 SV=1\nMAGAPPCVHAETARSRAIDVPGPWTTYYGAASKLDLQQVARTYRLLVIDADPGQHNFTPEQIAQLRDGGRNRVLSYLNIGSCERFRTYWRTTGTAIPGCGANRRAQRGVYHGYPDEVWMDPSDPDHQRLVLDYLAPRLVAQGVDGFYLDNMEIVEHGVRTDNGPCGDACRRGGLELVYKLRARYPQLTIILQNTAGPVTRMGQAGGVPFPTLLDGIAHESVFAPQHDADADAQLALWRAWSSERPEQRFWIGTLDYVGKCENVDRARKAAARSRARGYVPAVSDASAGQQRICDWPQPLAE\n>tr|A0A851NIW1|A0A851NIW1_9GALL PPARD protein 
(Fragment) OS=Penelope pileata OX=1118817 GN=Ppard PE=4 SV=1\nMEQLQEEVPEVREEEEEEEEAVTVTGGASDPSAGPDSSLPSSSYTDLSQSSSPSLSDQLQVGCEEAASGALSVECRVCGDRASGFHYGVHACEGCKGFFRRTIRMKLEYEKCERSCKIQKKNRNKCQYCRFQKCLSLGMSHNAIRFGRMPEAEKRKLVAGLTASEISCQNPQVADLKAFSKHIYNAYLKNFNMTKKKARGILTGKASSNPQPFVIHDMDTLWQAEKGLVWKQLVNGIPPYKEIGVHVFYRCQCTTVETVRELTEFAKSIPSFIGLYLNDQVTLLKYGVHEAIFAMLASIMNKDGLLVANGNGFVTREFLRSLRKPFNEIMEPKFEFAVKFNALELDDSDLSLFVAAIILCGDRPGLMNVKQVEEIQDNILRALEFHLQSNHPDAQYLFPKLLQKMADLRQLVTEHAQLVQKIKKTETETSLHPLLQEIYKDMY\n>tr|A0A1H7HQ73|A0A1H7HQ73_9LACT Transposase InsO and inactivated derivatives OS=Alkalibacterium pelagium OX=426702 GN=SAMN04488099_103146 PE=4 SV=1\nMKIIGLAESTYHYHAKRMNQPDPDREWKTLITKIFLDKDKRAGYRSIHDILIFMGYTINHKKVQRIMQELGLKCHKFSRKSRSYSSYKGTVGKIAKNLINRRFHSTIPLQKLVTDVTEMKCAQGKKLYFNPILDLYNSEIISYSISDTPNVDFVMQALEEALPIINKHATYRTTIHSDQGFHYQNKRWVKKLKENKVFQSMSRKGNCLDNASMESFFGIMKQEMYHSEPLKTFKELKKEIEEYIIDYNESRLKRKLNRQSPVQFRKNQGYTYAV\n>tr|A0A2D1KXX5|A0A2D1KXX5_9LACO 50S ribosomal protein L7/L12 OS=Lactobacillus farciminis KCTC 3681 = DSM 20184 OX=936140 GN=LF20184_09720 PE=4 SV=1\nMALDTQKIIDDLKDASILELNDLVKAIEEEFDVKAAAPVAAAGAAGGDAAAEKDSFDVELTEAGQEKVKVIKEVRGITGLGLKDSKDLVDGAPKVIKEGVAKADADDMKSKLEAVGATVTLK\n>tr|A0A2E5T8Y9|A0A2E5T8Y9_9GAMM Glyoxalase OS=Alcanivorax sp. 
OX=1872427 GN=CL551_10510 PE=4 SV=1\nMFNHIMIGSSDIERSERFYTAVLGVLGAGEPMRXXSXSGHIRLFYRHDGNTLAITQPINNEPATGANGGTIGFKCESPEQVKEFHDVAVANGGTSVEDPPGLREGPMGALHLSYVLDPDGNKLCGIHRLK\n>tr|A0A4R4X4E5|A0A4R4X4E5_9ACTN Uncharacterized protein OS=Nonomuraea diastatica OX=1848329 GN=E1294_04030 PE=4 SV=1\nMTTPDDYTYVRFGSMEQAYEELKKVVTELDRATDDLYADIKRELGPSWEGEAERFFEEKRQKWNAHEKAMGQQLFQAASAVNVANGNYQQAERRNIGIWTD\n>tr|A0A401SWZ4|A0A401SWZ4_CHIPU Uncharacterized protein OS=Chiloscyllium punctatum OX=137246 GN=chiPu_0013380 PE=4 SV=1\nMAQDTRVMTFYMELRTDPPGHCAITPPGSLYHDEPSPAQSVANTRSPCFLSPIVPPCTQRRSLPPDTKMDFLGFPGCKKGTASLVRTQSETNPFREFAPASSGRSTAPSSPVCIRTHPFCPVTLENTMGGDTRGRSSVVTFSYIEKARVKTVVNPFNVSVLPQGVKLAGMGQGSSIGWKSPQTSHKVSHGIISMPTPMESFDTRVSTVSVGSCREPSNSLIPNRSLLSSVGSASQRYSDAAAQSPCPGGKRAQSGNELRQGYPSKQVCTKALDLGTDLMTVATPNKTSSNHSIAAIPCVNPIGREIPNSPGLTQVEACMLVGEHSERAQRIAKARREFFYGTLEPQIPEDKADSKTWQAPVNPDNNTTREIAESKDQGASANGSLDAKLGTLSQGSAKVVNDLKSAPLSNGTSTDYKARDQLRAMKYSETDLDAVPIRHYQETNLDEVMTDYNITSSDGQELTHLMNSTLDSVQMDHPVPSRGFGRDQTTGNHEVCREEQSKAAEDDVFSELSSAADERSLEVEVKNLLPPVATIPIARSLSEEGTDTFSKQFESILESHRDKGTSYTSLDSMETLPSPSRNQGNYFTFDFPSLTSEIQVQIKENARLIEEEWSSADGEGCTNSAKASDWPDSPGCQATRTERKLGVSPMVGYSKSENTLTRCQLYAEGNLLKRALEIGDDEPKSEYSSSDSNLNHLVMDSESEMDSTEQLALGSTDTLANGNKTDQEAAKRLAKRLYYLDGFKRSDVARHLGKNNDFSKMVAEEYLRFFDFTGMNLDQALRAFLKEFALMGETQERERVLIHFSHRYHQCNPGAISAEDGIHTLTCALMLLNTDLHGHNIGKRMSCSDFIGNLEGLNDGKDFPKELLKVLYSSIKNEKLQWTINEEELRKSLSELVDERTDPSLKAMNRISGGSNPFLDIVQDPNAATYKHGFLVRKVHADSDGKKTPRGRRGWKTFYAVLKGMILYLQKDEYKSDKQLSEDDLKNAISIHHSLAVRAADYSKKPNVFYLKTADWRIFLLQAPNAELMQSWITRINLVSAMFSAPPFPAAIGSQKRFSRPLLPTTLTRLSLEEQIKAHDTRLKSMTVDLTEHRSYPPDKKVKGKELDEYKQKEEYLEFEKMRFSTYVSLLRAKLKSGTDDLDKFESALFDNIESEGNGLTKSHSSPSLHQEPPVMAIRVKRNTSERRSYRHSANTKHKL\n>tr|E3NQ34|E3NQ34_CAERE SUN domain-containing protein OS=Caenorhabditis remanei OX=31234 GN=CRE_07925 PE=4 
SV=1\nMKYKTGAENKPFLRDVESPSDNPSNPFHFRKNEYFGNEKPIAKKESWHQVLNNRLRHYTVLEAFLFVFLVILLFKIYSLQSQIDTLERKLDSKKNAESHLMKTKEILEEKKVIHEIVQNVINPSSPFPKEKEGKVKLNSEFNAASLVLGASIETRQSSHSVSPGNSYFDIVSFALGSDQSAFSLLDRVELPVDKAWCTDDRKPVLTVNLADYIKPISVSYQHSKWNRTVPNGAPKLYDVVACIDGDCNQPLVSNCEYSKSGNQEQKCLISTGLPLVNKIQFRFHENHGNLNKTCVYLVRVYGEPSGSKEVKIQVKNQKEEEETAKICSRLAWFHDNIPVFYNGLASKNCSTLYSNNCCHECPNCCSECQINDSTLLNNLQFFIIFFVLFFILFPMYIAGISACCFGLKRFFGI\n>tr|A0A1Q7VVJ2|A0A1Q7VVJ2_9ACTN Uncharacterized protein OS=Catenulispora sp. 13_1_20CM_3_70_7 OX=1805055 GN=AUG49_18720 PE=4 SV=1\nMSSPSKFLRDLAKKTNTASAARAVLRAAHVKTGPSRLGDPRAGLPASVLPAGGNRITVENAKPGSANWRMGSGRSRAATDYERQIKGYASTDSVALGSAIDFHVAVXYGVAGAGGRTAAGPHSGPGNGTDRRGMASRMDAGHPHGLGLRNICRCPG\n>tr|A0A4R4JD96|A0A4R4JD96_PHOLU Flavin prenyltransferase UbiX OS=Photorhabdus luminescens subsp. mexicana OX=2100167 GN=ubiX PE=3 SV=1\nMKRLIVGLTGASGAIYGIRLLQVLQPVEGVETHLVISHSARQTLALETDYSLRDVQALADVVYDNRDIAAAISSGSFKTLGMVILPCSMKTLSGIVHSYTDGLVTRAADVVLKESRKLVLGVRETPLHLGHLRLMTQAAEIGAVIMPPVPAFYHQPQQIQDIIDQTVNRVLDQFDIELPHDLFTRWQGAKSVEI\n>tr|A0A1E3ZHP6|A0A1E3ZHP6_9BORD Nitrate/sulfonate/bicarbonate ABC transporter ATP-binding protein OS=Bordetella sp. 
SCN 67-23 OX=1660091 GN=ABS43_07680 PE=4 SV=1\nMNTAPVLEARGVARRFPNGVDALSPIDLTVRAGEFVTLLGPSGCGKTTLLRIFAGLDAPTAGSLRRHGEVDELSYVFQDATLMPWASVATNVRLPLDLERGPRRQPMEARRGRVREALERVGLTDFAAARPSELSGGMRMRVSIARALATEPSLLLMDEPFGALDDITRQHLDDELLGLAARQNLTVVFVTHSIFEAVYLSSRVIVLSRRPGRIVADIPIEAPTRDAAFRVSPAFAMQAARLQAALLEGQQ\n>tr|A0A2D4C9B4|A0A2D4C9B4_PYTIN Uncharacterized protein OS=Pythium insidiosum OX=114742 GN=PINS_010966 PE=4 SV=1\nMNPQQFASYVPQQQQMQGRVGSMGFAGQFATTGRVASSSSMASPVPIHAWTPPSPMEQQYFDMLFTMADEERRGAIGGRIAVAFFSRSNVDKTLLREQRSELSRNEFYVAMRLISMAQRGEAINVQRFYEMAAAPFPLPTLDGVPPPPSPQSSFVPGAPQPAVPTPSPMGGPQKGPFAITDEEKARYDGIFQQYDTDRDGFLQGGEAVGLFSKSGLDRMILRDIWAMADRTQDSRLDAKEFYIAMHLIVCISKRGLSMPTEAPQELLESPPVAPPAPEPKKDPMDAFAGLSPIQDSSDDPVDDGGAVGVNAGGPSAISK\n>tr|A0A0C1QX44|A0A0C1QX44_9CYAN Uncharacterized protein OS=Tolypothrix bouteillei VB521301 OX=1479485 GN=DA73_0227160 PE=4 SV=1\nMYTIDLTVRNTAFPISVERKSAEDAEQLYQLILTAMRSGNPDIVELQSEGKTEKKIAVRASEIAGVQVIQKDGSAAGTGRPPGFFALASE\n>tr|A0A7T0C4B3|A0A7T0C4B3_9BACT tRNA 2-thiouridine(34) synthase MnmA OS=Candidatus Nitrohelix vancouverensis OX=2705534 GN=mnmA PE=4 SV=1\nMTEKPKIVIAMSGGVDSSVAAALLKERGHEVVGISLQLWNYSGESDNRFGTCCSLDDLSDARRVAHKIDIPFYVLNLESEFRAEVVDYFVDEYLQGRTPIPCTLCNQKLKFDRLFQKAEAFGIERVATGHYASIVQVDGRYTIRRGEDRTRDQSYFLFNLSQSQLSRLEFPLADMAKTEVRRIATELDLVVAQKSESREICFVPDNNYAKFVASEAPHAFAEGEIVDKSGAVLGRHGGYPAFTIGQRKGLNIGGLKEPHFVTGIDPESNRITVGPKDDLIASEFYVSRANWCLDVTGPVEAEVQIRYRHSAAPAEVTPLENGRAKVSFYDPQLSITPGQAAVFYKDDCIVGGGWIE\n>tr|A0A2S9KN53|A0A2S9KN53_9BURK Hydroxymethylglutaryl-CoA lyase OS=Burkholderia ambifaria OX=152480 GN=C6P77_27700 PE=3 SV=1\nMTFPTAVKIVEVGPRDGLQNEKTFVPTDVKIALVDRLSRAGFRNIEAASFVSPKWVPQMADGADVMAGIERRAGTVYSVLTPNLKGFENALAARADEVVIFGAASEAFSQRNINCSIAESIARFEPVAKAAKDAGVRLRGSVSCTLGCPYQGEVPVASVVDVVERFAALGCDEIDIADTIGVGTPKRTREVLSAVTRVFPRERLSGHFHDTYGQALANIYAALFEGIEIFHASVAGLGGCPYAKGATGNVATEDVLYLMQGLGIDTGVDLAQVVAAGDFISNAIGRANVSRAGRALLAKAQSATDAPSCV\n>tr|A0A4U3MG24|A0A4U3MG24_9ACTN Winged helix-turn-helix transcriptional regulator OS=Herbidospora galbida 
OX=2575442 GN=FDA94_14520 PE=4 SV=1\nMSAVPPYDPDAPGPATYVYARVADHIAARILAGELVPGMRLPGERDLAAEYGVALGTARRAIEELRGRRLVVTLAAKGTYVARPEDIDPPTG\n>tr|A0A7Y4Z391|A0A7Y4Z391_9BACT Uncharacterized protein OS=Bacteroidales bacterium OX=2030927 GN=HOO91_10445 PE=4 SV=1\nMNNKNQILPEEIKSILLKYYDGCTTIEEELLLKKYFAQNQIPYSNISDKALLSFVNDNELSIFPENEIWNKILVTEKKVNKQRKTIRILSSIAASVLILISLSIWLFYPTKRVEILTDSYSNPHDAYNAVQKYLGLVSTKLSYAYNEIKPIEKLTIPCDAMQAFSTIDKNVKRLQQFDKLGASAHELERFSIISDIVIVDKN\n>tr|A0A257X4W0|A0A257X4W0_9PROT Uncharacterized protein OS=Methyloversatilis sp. 12-65-5 OX=1970398 GN=B7Z51_07255 PE=4 SV=1\nMSLSDIPDEMTLRLAADGRIECRRGTDAAAPAIRFDPAFFGQPESADAQRALGRFVFSLLQGMAPAAGTAAGPAIDGPASLLELAEKSLQQSAAAGFGQAIEALKDWPSVRTVADMLIARGPEQPR\n>tr|A0A800G627|A0A800G627_9CHLR Uncharacterized protein OS=Dehalococcoidia bacterium OX=2026734 GN=EYQ67_00675 PE=4 SV=1\nMPRLHLNPNRMIKDRGQGGRLRRALENLRKQHQWGDISDDEYRRERGIIMRQLKVHTSTIVMPTHLPNLERAANFLEDLPALWLHPGVTHEEREALVRQVFLRITIAGKEFVDIEPKPEYASLFATMVTAQKIGYQELESSRSPVSLLLLPSGISVFGI\n>tr|C8BFH5|C8BFH5_9HIV1 Reverse transcriptase (Fragment) OS=Human immunodeficiency virus 1 OX=11676 GN=pol PE=4 SV=1\nPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKVGPENPYNTPVFAIKKKDXTKWRKLVDFRELNKKTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDLVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIRXKQLCKLLRGAKALTEVIPLTAEAEL\n>tr|A0A2M9CET1|A0A2M9CET1_9CELL Uncharacterized protein OS=Sediminihabitans luteus OX=1138585 GN=CLV28_2224 PE=4 SV=1\nMREYDATPASTSRGQAALRWVLWIGGAALLAFGVLTALTTVPSTSQRINVLLWLAGGVVVHDAVLVPLALLVGVVVLPRVPPSWRPALRGGLLALAVLGIVAVALVAGAATRANPSVVPQDVGAALALAGIVLVVGVLVGMFLGGARRPR\n>tr|A0A1Q5JW10|A0A1Q5JW10_9ACTN Lysophospholipase OS=Streptomyces sp. 
TSRI0107 OX=1703942 GN=AMK31_31985 PE=4 SV=1\nMDDAREHVLTGTRGAITVREWAHPRPRYTALLVHGYGEHGGRYTETAGVLAEHGAAVFAPDHAGHGGSAGERVLIEDFEDVVADVRQVAERARAAYPGVPTVMVGHSMGGLISARYAQRYGGDLAALVLSGPVIGTWETPARLLAHDAAHGEIPDIPISPAALSRDPRVQAAYAADPLVWHGPMKRPTLRAFVRALQDVAEGGDVGPLPLLWLHGDDDRLVPLAGSRTGVERLSGGALTERIFPGARHEVFHETNKAEAFAEVTAFLDRVLGA\n>tr|Q87XS4|Q87XS4_PSESM Uncharacterized protein OS=Pseudomonas syringae pv. tomato (strain ATCC BAA-871 / DC3000) OX=223283 GN=PSPTO_4102 PE=4 SV=1\nMSAFFRLFLRFFAAQRHGLLEGVAHFVEAFVVQIVNAPGALCAQVDQFFIVAHGLPLSDTGKQCQ\n>tr|A0A2I2FRI4|A0A2I2FRI4_9EURO Uncharacterized protein OS=Aspergillus steynii IBT 23096 OX=1392250 GN=P170DRAFT_441696 PE=4 SV=1\nMSVPTVRRAFGSISKQRSLYSVRDRLHFGILVHLFNIALALVLLPLNNTILLAAYTAGYLSFVLSRSDPIQRRQAALRDVQFYPKTILVTGVDTPHGLAVARSCYHQGHRVVGVSVTETAIPSGESMSKALGAFYRIPKTKYVSRLLDVINREKADVWVPCSEKASVLDDAMAKQVIEGRTECKCITMDTELASMFGRPATFRQYLVEKELPVVENHQVQSRDSIHKILHRSPTKTYRISRPDPVTRENKIITLPKRTLSLTYSEVSEIQISKESPWTLQQQSRLGEFLAEMLVVHGHVKAIKVRPADDQSTWGRSRLDEGLTMSIHKLMERFALKGGYRMTGHICVRVMVDEEVDANQVRYALHINGCTQGAGAVNDLLQDASEQLVRGYLSVEAPHLNGFMASDSVDALRIQAAQSIVSTTPRPKFSLYQKLKEHDDENLFTVLYPVAQHIDTLISGTERALMFWRDWRFSIHDPLPWWWDAHVYQPLKELESIVSGAEVKEA\n>tr|A0A1Q5DAT6|A0A1Q5DAT6_9ACTN Nuclease SbcCD subunit D OS=Streptomyces sp. 
CB02058 OX=1703921 GN=sbcD PE=3 SV=1\nMRILHTSDWHLGRSFHRVPMLDAQAAYLDHLVETVRARSVDVVVVAGDVYDRAVPPLSAVQLFDDALHRLAAAGVPTVMISGNHDSARRLGVGAGLIARAGIHLRTDPADCATPVLLPDPEGGDVAFYGLPYLEPALVKDSLGASKAGHEAVLTAAMDRVRADLAARPDGTRSVVLAHAFVAGGEPSDSERDITVGGVAAVPAGVFDGVDYVALGHLHGCQTVTERVRYSGSPLAYSFSEHTHRKTMWLIDLGTGGDLVAERVECPVPRPLARLRGRLEALLEDPALDRHRGAWVEATLTDPARPDEPMARLLERFPYTLSLVFEPERTPDDPSASYAQRLRGRDDQQIAEDFVAHVRGGSGPSARERTVLRAAFDDVRVDDVTGEVSR\n>tr|A0A7Z7ZTA3|A0A7Z7ZTA3_9MICO Type III secretion system (T3SS) chaperone YscW OS=Cryobacterium psychrophilum OX=41988 GN=EDD25_0264 PE=4 SV=1\nMDESDDDAQTVRGTIVFPPAQRPEEPFTVIVQLEDVSRMDAPSRILAEVRLANRDFGAGRGRELPFRLPFPTELLDPAKAGPLRLNLRVHVRHTAVSHEPASRGIMTHVDVTEGDFVSTQSHPVPRGGALVRIPVQRV\n>tr|F9WTX3|F9WTX3_TRYVY Uncharacterized protein OS=Trypanosoma vivax (strain Y486) OX=1055687 GN=TvY486_0039130 PE=4 SV=1\nMLGKSCHQLQKNKKLIEMIDTRDECKSYTEKYSVSIRLSSYAEKLDEMNNLIEWKNEMVKLVGQTHKEVKSSAYRGNLWTVNDEKVKEVVQAIRNLTDKPVVTLELLETVRVSVVEANKTVNSTVNSMENVNKTMLSALEGNGTLLPQLVGQYSEVSAQLHERKGRLATTQGNINSTMKAIENALVDVAATESLVKYVNGLILLLSLFGYSSVSRQLRGAKIASETTHDTSDAKAAALMASELPGSAHSYASTAQVEIERETGSLESIKPQLMKHLNETGISISSLTTEACDKGLSKVFNGSLAVAFSRAAGLNSSGMAKAQEALKKLKAEAALVNAKLAYINGSLQQAEKAVQDVDQHDEAVMSTVKNSIVEVVSGAMKDLCETMKGLYTFRLASTSLNEEAEGILGNVSVLVGLSNVTRNKMNKAVKTVPNAAEYFGVANRELAVFARATNKIEKLHSTVQSDVASFLEEQMKRESHINTTHMPSL\n>tr|A0A1V0RMR8|A0A1V0RMR8_9RHOB Uncharacterized protein OS=Roseovarius mucosus OX=215743 GN=ROSMUCSMR3_01389 PE=4 SV=1\nMTIFTPLTAATNADRLEPSHDTVYSIAFAALLPSLADFIEAERDLDDICHSYDPAYGVWHRDAQVARMRLDSTLRHVHGLRVERPEDQPLRRMALLADAMLKDGAPERPQYLHRQMKLVFFRQFQVQGFGPTAHSRNAMLIQARHLIDAMMRLPLFDYSPDCAIAPDASAPADDLSPAFF\n>tr|A0A0J8BW32|A0A0J8BW32_BETVV Uncharacterized protein OS=Beta vulgaris subsp. 
vulgaris OX=3555 GN=BVRB_8g185090 PE=4 SV=1\nMRSKREREELTDGEVKRQRVEKDEEEEVSSPKTHAFENPLLPLASYNDDDEEEEEGNVKKAEVNGRKNEIVDDDEDDDDEEDFKFGQGKHNRLVVVRRDCPYLDTVNRQALDFDFEKFCSISLTNLNVYACLVCGKYYQGRGSKSHAYTHSLEAGHHVYINLKTEKVYCLPDGYEINDPSLDDIRHVLNPRFSKEQVEQLDKSKLWSRALDGSDYLPGLVGLNNIKETDFVNVTIQSLMRVTPLRNFFLIPENYQHCKSPLVHRFGELTRKIWHTRNFKGQVSPHEFLQAVMKASKKRFRIGSQSDPVEFVSWLLNTLHADLRSSKKNTSIIYQCFQGELEVKKEIQSKGTVERRLKGNDQNGGSENPNVITETSKMPFLMLGLDLPPPPLFQDVMEKNIIPQVPLFNILKKFDGETITEVVRPQIARMKYRVTKLPPYIILHMRRFTKNNFFVEKNPTLVNFPVKNLELKDYIPLPTPNDKEKSESKGNKKMQSKDHEKLRSKYDLIANIVHDGKPSEGSYRVFVQRKSEEQWYEVQDLHVSETLPQMVALSEAYMQVYELQQPH\n>tr|A0A430LAB7|A0A430LAB7_9HYPO Uncharacterized protein OS=Fusarium euwallaceae OX=1147111 GN=BHE90_012892 PE=3 SV=1\nMDSKNSLLYKNFHKHPAALVESASGIYLHTSDGRKILDATSGAAVACLGYDNKEVQKAVVDQLVSVPYCHPGFYKTKSAEDLADFLVDSTNGQMSKAVLCGSGSEAVEVALKLAKTHFSHLAIPQTERCHFIARVGAWHGATLGALTLGDFKVRKDPFVQLISQNSSRVSACSTYRGLRKGETEEAYVQRLAQELDDEFQRVGPNKVCAFVAETVGGSASGCAMPVKGYFPAMKAVCEKYGALLILDEVMCGMGRTGSLHAFEQEDVVPDILVVGKGLGAGYAPISAVMLNTKLVESFQKSGKGFAHGQTYMAHPQAAAAGLKVQQVIRDTNMVAHVQRMGDYLGSRLKERLLPLPWVGDIRGRGLFWAVEFVIDKKSKDPFPYSLGLHGMLHSKGMSKGYEISLFNANGGYDGYSGDHFLICPPFIVNEADVDEIVDRTARVIEDTFSELVNSAVWEKIAIQMDISTEAPVTDISVGETLVSVN\n>tr|A0A5I4QS92|A0A5I4QS92_SALET Mn2+/Zn2+ABC transporter ATP-binding protein OS=Salmonella enterica subsp. enterica serovar Agbeni OX=1967642 GN=znuC PE=4 SV=1\nMTSLVSLENVSVSFGQRRVLSDVSLELSPGKILTLLGPNGAGKSTLVRVVLGLVAPDEGVIKRNGQLRIGYVPQKLYLDTTLPLTVNRFLRLRPGTQKTDILPALKRVQAGHLIDAPMQKLSGGETQRVLLARALLNRPQLLVLDEPTQGVDVNGQVALYDLIDQLRRELDCAVLMVSHDLHLVMAKTDEVLCLNHHICCSGAPEVVSMHPEFISMFGPRGAEQLGIYRHHHNHRHDLQGRIVLRRGNGHS\n>tr|A0A6H0AMT6|A0A6H0AMT6_9MICO Transport permease protein OS=Clavibacter michiganensis subsp. 
capsici OX=1874630 GN=GW571_05855 PE=3 SV=1\nMTAVRPARPAADRAPSLPGVVPLGIHRVRYEVRRYFRQTDTIIFTFLFPVIMLSIFSVAFGSSGNLGTAPDGSGGVSAAAYYLPGMIAAGILLSGVQNLAVDIAMERSDGTLKRLAGSPLPVLSYFIGKGGQVIVTSLLQMVVLLLVARFAFGVELPTDAGRWATFAWVYALGITSSAVLGIALSRIPRSGASATAVITPIVLVLQFISGVYLTFTMLPTWLQDVAAFLPLKWMAQGMRAVFLPDALASVERGGTWDLAGVAVVLAVWLVGGTIAAVATFRWIRRDS\n>tr|A0A668RY45|A0A668RY45_OREAU VEFS-Box domain-containing protein OS=Oreochromis aureus OX=47969 PE=3 SV=1\nMAPHKQSHPVGLGSGGKPNGLYHHQPSSASMAAAKKPNMQLIQADHELFLQAFEKPTQIYRFLRTRNLIAPIFLHRTLTYMSHRNSRNNVKRKNYKVDNLLFKVEKMRGEQETHSLASNLQLTFTGFFHKAGKLSQDSENEQNSVSLEVLLVKVCHKKRKDVSCPVKQVPTGKKQVPLNPDTSAGVQAKLSSYPSLLVPSSEFEPSNSHMVKSYSLLFRVSRPGHPRTQINGLANGEIHHKEAVNRKRRSSALREEGETTFVAQMTVFDKNRRLQLLDGEYEVSMQEMEECPVGKKRATWETILDGKRLPPFESFSQGPTLQFTLRWTSDSADHSTAPVAKPLATRNSETNQDTRPSTLRATHTPTVKESVNTDVQTRREQVLSEPRQKLRIFYQFQYNNNTRQQTEARDDLHCPWCTLNCRKLYSLLKHLKLSHSRFIFNYVPHPKGAKIEVSINECYDGSYAGNPQDIHSQPGFAFSRNGPVKRTAVTHFLVCRPKRTKPSLSEFLESEDGDREAQRTYISGHNRLYFHSDSCLPLRPQEMEVDSEDERDPDWLKEKTVKQIEDFMDVNEGEKEIMKLWNLHGLFCLFMNEACLLFAEHHAAVIVKRNLCRNFLLHLISMHDFNLISTLTINQAMARLRLVESQSEASISDLPGTLSSTKGFLLAGSVCTCSVESRLRRLLGVKSAAVLQKEV\n>tr|I6XM23|I6XM23_9CAUD Uncharacterized protein OS=Pseudomonas phage MP1412 OX=1204517 GN=MP1412_18 PE=4 SV=1\nMDLEKLRRDWAEDPQLKFYAFDTVEELAAHLRKVHTDMMNGEHGCFGYLYRQQTLRLRELMKELQDERERKASGR\n>tr|A0A498P3D5|A0A498P3D5_LABRO VPS10 domain-containing receptor 3-like protein OS=Labeo rohita OX=84645 GN=ROHU_001246 PE=4 
SV=1\nMRGRMIKMKDVLGFESSWTYWTLFCLCALLPLPASADITCASCFAPIRRNEAHAKPTAVVSRDFGSAKDGSTDKNWKWRLDGAQLSPEAHKKSPFVSRRQKLQNAHIPRAERTSPAGEKDGKVYPTWSPVETKVDRREKRSLSDSASGSRFEFRRTGGVDGTGKSPRQNEPHLITSTFALSGDAAHNQAMVLWSGHNSSEDGSQGSRVAEPVAVNTLTRGHIKPVKTHSGKTDARLFTVVYERVLRMFCQVILILTKLFDFNLGTVTESSLWRSVDFGTTYEKLTDKVMIRTMLSYLYVCPTNKRKILILSDPEVESSLLISSDEGATFQKFNINFYIMSLLFHPTQENWILAYSHDQRLYSSVDFGKKWILVHERVTPGRFYWALSGLDKEADLVHIEARTDSGQMQYITCRAQKCSEEGRQYPFSGRIDTNSLVVQDQYIFLQLTTAGRTTYFVSYQRGPFRTIQLPKYCLPKDMHIVSTDEGQVLAAVQEWNENDTYSLYISDTPGVYFTRSLPNLRTSRGLAGNLIVDVYKVAGVSGLIIANKKEDAQMRTYITYNKGQTWSLLQPPAKDTTGHDINCNLPSCSLHLHLQMSENPYTPDTISTKHSAPGIIVATGNVGPELSFANTGMFISSDAGNTWRQGEVCVMGERQVYMKRKPGTHCTLGREYSRVVSAEPCICTLYDFECDYGFERQASGKCAPAFWYDVSLPAHTCSHGQRYRNSTGYRKVLLNNCREGLKDTLSPRMQQCKPIAPSGLQLSTVNSQLTAVLGTNITFRVALQNPLITLEGSVSHTFTREGPNSVTVQVSAGGTVLQDVKIITVKDFFRSLLLSFSPNLEEHNPSVAEWRQDVGRVVRATLSQMSEVFMNALNQNLIQFDLKPDTRVTVSVSQLTLAPLVDSSVLPSGSAMLLLVSLGLVGLAILFIYKFKRKIPWIHVETEDTHEKEPEMISAVGQEKNGTRTTATSFTTCSTHTTHTPFPSNTGTHNSFSHLPPPRDLMEKELEAHNTGGLGVGERQRTRQIPNCTNV\n>tr|A0A424MM85|A0A424MM85_9GAMM Tryptophan synthase alpha chain OS=Gammaproteobacteria bacterium TMED112 OX=1986734 GN=trpA PE=3 SV=1\nMQNSNLLTVNKNKTAFIPYLVAGHTSNEVFSAALKLLNDVGADLIEIGIPFTDPIAEGKIIESAHHHALKNNFVLSEVCKIVKEFRTYSDTPVIAMGYTNSFINPSSEYIATKLSESGFSGVLIVDLPASEKSIINSFTEKKLNLVQLIAPTTQLNLIESFLENDPALIYYITQRGITGSTNLDLAEISEKLSSIKKLSNKPVVTGFGIKTVEDVKNLKNLTDGIVIGSPIVEKINLDSSLNALKEYLKPIVKAIKE\n>tr|A0A4P7QD82|A0A4P7QD82_9CORY Putative NUDIX hydrolase OS=Corynebacterium endometrii OX=2488819 GN=CENDO_01140 PE=3 SV=1\nMTFIPQPDAPGSNVTLRPEDSPAWMRPALGIDAAHAQRTMGDRAVTNGPWKKEAAVLVLLAGDSVEEGSVLLTHRSPRMRSHSGQIAFPGGRIDPEDLNAVDAALREAWEETGLDRSTVTPVEQWARLSIRATGNPVSPVLAHWHEPSPVGVASPNEADDVFTVPLADLIDPANRLTVGWGQWSGPAFHAQDYVVWGFTGGVLATLLERAGWAEDWDRDTVHPLHETLARSRNNERMR\n>tr|A0A257QSR6|A0A257QSR6_9PROT DNA topoisomerase 1 OS=Rhodospirillales bacterium 20-60-12 OX=1970565 GN=topA PE=3 
SV=1\nMTDIVVVESPAKAKTINKYLGDGYHVLASFGHVRDLPPKDGSVKPDQDFAMLWESDSRGEKQVGAIAKALKGAKILYLATDPDREGEAISWHVRAMLEDKKALKGVTVKRVTFNEITKSAVTTAMAHPRELDQPLIEAYMARRALDYLVGFTLSPVLWRKLPGSKSAGRVQSVALRLICEREAEIEIFKAREYWTIEAGMITPAGAPFTARLTHLQGKKLDQFDLPNEAAAMAAKAAVQAGDFSVVQVEKKRTRRHPPAPFTTSTLQQDASRKLGFSAQQIMRTAQQLYEGVAIGGETVGLITYMRTDGVQMAREAIMAVRDRVKANFGTDYLPATPREYNSKAKNAQEAHEAIRPTDFGLSPDQAGRYLNAEQSKLYELIYKRALASQMQSAELDQTSVDISDAAGTTLRANGSILAFDGFLRLYREDMDDVADDDDAKILPPLAKNDPLKRGEVKAEQHFTQPPPRYSEASLVKKMEELGIGRPSTYASILTVLRDRNYVRLEARRFIPEDRGRLVTAFLTSFFARYVDPDFTAGLEEKLDLVSDGKADWRQVLRDFWRDFSAAIGQTTELKISDVIDALDEDLGPHFFPSRADGSDPRACQACGTGRLGLQLGRHGSFIGCSNYPDCQYTRRLIVDGEEGADTLKEGMKILGQHPETAEDVTLRRGPYGLYVQQGEPVDKEKPRRSSLSRGMNADDLTLDQALGLLSLPRLVGPDPQTGQKIEAGVGRFGPYVKMGSIYASLDKDDDVLAIGLNRAVMLIAKKAEGIRNVGPHPKDGADVMVRKGRFGPYAQHGKTVANLPRGTEIADITLDEAVALLAERGKTLAPKGKAKAGAKKPAKAAKIMATGDAAPKLKPKARPPVKAAKPKAAPAGTAKPAAKAKPKPKAAPKAAAKPSAKKAAARAK\n>tr|A0A087GHN3|A0A087GHN3_ARAAL RNase H type-1 domain-containing protein OS=Arabis alpina OX=50452 GN=AALP_AA7G126600 PE=4 SV=1\nMYIAESGTSVSAVLVREERGEQKPIFYVSKTLTDAETRYPQLEMLALSVVIAARKLRPYFKSHSIVVLSTFPLRSVLHSPSQSGRQAKWAVELSEYDIEYRGRSCAKSQVLADFLIQLLEGDVAKEDSSQEATLSGEWQLHVDGSSSKSSYGIGIRLTSPTGEILEQSFRLGFKASNNEAEYEAILAGIRLARAFNIEEISVFSDSQLVVNQFSGKYATKDERMEACLGLAKELAALFKKFMFTQIPRGENVNVDALANLASTSDPALKRMIPVEFIEFPSILPAVSLTIITRSQAARKIKVTQKRGENDGKDIVITDATKDNVEMSDATEDTPLTQTDPNPSRLPIANGSSYACY\n>tr|A0A549YU05|A0A549YU05_9CORY MMPL family transporter OS=Corynebacterium silvaticum OX=2320431 GN=EU799_09205 PE=4 
SV=1\nMFSRWGDFAYRHRRVVPVAIVVFIVAIYGIFGIRLADRMSQEGWDDPGSSSTQAANIEQEVFGRDNSGDVVLLFSSEDGIAKNKNFDEIKRYLSDLKALHPNQIADVTSYFDNRNAQLLSKDGKTAFAAVSLRGDHEQTLKDFRAIKGNLKPKFDGVTVQVAGATAVADALDSGMAGDIKRAEVVALPLVAILLLFVFGSVVAAFMPLIVGILSILGSLGVLSILAGFAQVNVFAQSVVTLLGLGLAIDYGLFMVSRFREEMDQGRDIRDAVRITTSTAGKTVVFSAAMVAVALSGLLVFPQAFLKSVAYGAISAVGLAALLSITVLPSIFAMLGTRIDKWTLRRTKRSARTLADTWWYKLPAWAMKRSKTVVVSVVFLLIALTVPLAGITFGGINETYLPPNSDVRKAQSTFDQEFPAFRTEPIKLVVSNATNDQLIKVYQQANTVTGLTDRFKPSTATKDGTTVLSAGIAERKDNESVVKQLRAIEVPEGVSVHIGGTPAMEVESIEALFEKLPWMAIYIVLATFILMSLVFGSMILPAKAIIMTILGMGATLGILTAMFVDGIGSSLFNFSAGPLMSPVLVLIMAIVYGLSTDYEVFLVSRMVEARDNGESTDEAIKYGTAHTGGIITAAALIMIVVCGAFGFSEIVMMKYIAFGMVVALLFDATIIRMLLVPAVMHLLREDNWWAPRWVKRASEAMGHNSAPEPLPVASRPVESGDKPARRVEPAQPRVPVSAYMDDTSTMAPVKEPPAPQRPAAPRPTPPRPMPPRTPPRTDAPAFNPKRTWGSTPATSHNAGGADTVEGQGSHTPKRKLHHSRRETLVSDTTVVDPRTAGRSGRIASEDNELVPFSELVKRLREEH\n>tr|A0A662N443|A0A662N443_9EURY Thioredoxin-disulfide reductase OS=Thermococci archaeon OX=2250254 GN=trxB PE=4 SV=1\nMFSLTGLSTSGKDENKVRDVLVIGAGPAGYTAALYAARYGLDVDIISKDLGGQIALTDIIENYPGFPEGISGQELATRMYEQVKKLGVDVIFDEVVRIDPTECAYYEGPCKFEVKTKNGKSYKTKTVILAVGAEPRKLHVPGEDKFYGRGVSYCATCDGPLFKGKSVIVVGGGNTALQEALYLKSIGVNVSLVHRREGFRADKIVQDRFRESGIPMILNTVVTEIKGEAKVESVILKNLKTGETFEKKVDGVFIFIGYEPKTDFVKHLGITDEYGYIPVDMYMRTKVKGIFAAGDITNTFKQIAVAVGQGAIAAASAKELLEDWREKNLSE\n>tr|A0A7U9R2R0|A0A7U9R2R0_9FIRM HTH-type transcriptional regulator YesS OS=Lachnospiraceae bacterium OX=1898203 GN=yesS_1 PE=4 
SV=1\nMKAFHFFRHSRTYRRMFLHTYVLYAASSLLLLLAAGLFLFYQDSHTIRNNTLQAAANLAYYADDRLSACQKLSASVGQSERLLSLSSNAATDLDFSLLDSTTLFAAQHDLVSAKALNRFAATLGVYLYNKGFVVSDYGTLTLESFYQSIFNMSPNVFSEYLRPLGSGSYLFLPRGAVEETGTPQHPLIVLSVIDSNSRRYGNLFIFMDERQMREDIEQLLNNRDMEYYLFAGEGQLVVSNRCADPKELSRIYSGLMENDSYQSNTGKYSGWTAFAGYSDAYLRERLHRRLWILAAGLAFLLLSGLPLTHAICRKNYAPIRELAYIVSSPEQRSDNRDMEYEALKSIISSIFKDKSLLEEQLLIYRPLLVNSMLLELLEGAQPRKEVLPGLQKLGIRFPYPYHVCCCLLTARATQDFLMSLAQATRDGETGCLYITFRKHLGIFLISASSPEKCGDAVTRLLALLAEVNPDAFLGVSDAVDDLEQLGAACQQSRSALEYLPSDPFSRGIYWSRVKSSGILKLALPTCLASLPNAFGTGQFAEARNNLNLYFQTISRCGLTKKEHLTHARDRLLEAISRAEKEHGLLFDSASLLNWTPEQPHALKCLQESAFLACDRLERDMLESREQQSLNAAQNLMDYLQLHLRDEDLSLSKLAETFQLSESSISRRIKQITDYNFLEYVNRKRIEYACSLLSETDLSVNDISKASGYVNDITFRRLFKKYMGVTPGEYRRQA\n>tr|A0A540WLW0|A0A540WLW0_9DELT LPS assembly protein LptD (Fragment) OS=Myxococcus llanfairpwllgwyngyllgogerychwyrndrobwllllantysiliogogogochensis OX=2590453 GN=lptD PE=4 SV=1\nMSLLVPLAAALLVSSAQIPLATQVQLPSGETVELAADFLTYEADKQLLTARGHCELRTGEMLLRSDEVTYDEANQVATATGNVMFVGPDGMAAVADDVHVDIRTFVATLKGGLFMQKKGVTQEALLTAKTPQELRAMGETPIILSGSRIRRTGPNAFVVDDLAFTPCECGPGTPTWRMEASSANVILGERATLTWPVVYIQSVPIFALPWVYLPLAERRTGFLFPSPQFSSLNGLGLEQPLFVTLGRSYDLTFTPGYYHGALVEKTHDPDGNSETKNTITYEEPRPNGVKGPRLLTEFRYVPSERTRGRATLGFLYDSRPKLDPTTLDFFRYPVDPNGIRKIIDAPRGLRGEASWQHFQDLGSGWYDRVDASVVSDGNYTRDLTADILVQGLDYLRSTATVFRRQEDSYAGLDVSLRQDIRWPYRFFQDNRVPAEVDPLRPDLPSPRTFQRLPGLVLSLPERPLLGGITGGLRAEFTRLAPIHEGFGDEGVDGIFRPNGNYLLLGVGDAPDPGQSNALFDSRDREARDRIDFTSRLSTSVALGDVARVTPSLSLRQDVWAGEYSGKSWQRGYPIGGLMLDTQLSRTWTGAKTSYRHSFAPSLELRYVPGGWG\n>sp|B8CSY5|RL21_SHEPW 50S ribosomal protein L21 OS=Shewanella piezotolerans (strain WP3 / JCM 13877) OX=225849 GN=rplU PE=3 SV=1\nMYAVFQSGGKQHRVEAGHTVRLEKLEVATGETIEFDQVLLVADGETVHVGAPLVEGGKVVAEVVSHGRAEKVTIVKFRRRKHHDKKMGHRQWFTEVKITAISA\n>tr|A0A815PV26|A0A815PV26_9BILA Hypothetical protein OS=Rotaria sordida OX=392033 GN=JXQ802_LOCUS53044 PE=4 
SV=1\nMEELIRSVIQFDGALNQDVIQWLEYIEEVFDRVQLQTSNKYIAIQYFLTNSAATWFKYKKSNIPDWFTFKRELIEAFQSSSSFSSSHLLDRHQLIIKEEPQKLEQEQDILPVPASTSIISNKKNDSEDYQLDLVHDGSIKSLENLEVDDLEDKCLHEHEQGYYSSILVNTNDFDLDIQHQDADAADSCDTQQQGANVADVCDQLEQQGESVINSDSVQTDIEDTFEDFTRPMDSLTGNDSLINIVLPHDVQYLWSDKYKPRPPRILNKAHAVYNWNRYNKLHCNQDDSPPPTIQENQFNTVSTEWNYTYNHGLRFYFYNEMIQLRFSFQKTRKEVIVLRTLQHENIVGYKTVWCEHPPDDWQKKQEKSFQVPSSSEDSTTGFNTIHSISKESKSNQESNDDTSNPFHHSEKWVPLNANSDENKKAPEITNIRSEEEEDNNYEEQ\n>tr|A0A444Z367|A0A444Z367_ARAHY Rep_fac-A_C domain-containing protein OS=Arachis hypogaea OX=3818 GN=Ahy_B05g076446 PE=4 SV=1\nMISLFKSLISNGVVYAFAYFRVYNNRGSYHTTSHHFRMFVQAIPTVRPSFCNAILLYSIKLVPFTKIMGYFSQHPFLVDVARVITGVEGERKYVKDGKLIDMLLNVAVLGEMVERIKDFVAAGEQQVPVVIFQFATVKTFRGLHRCHEKPPHVEEKDVTHRIEEGDDILSSLRLVAVAERGAPSSPSRLRVWGFEEREKLAEERETVCCREASQYLSILSSKLAYVAEDEVLYSIERKTIKELRAVGFYIVLATVLDVEPALIWWYKSCVCSVKAKANADTYFYDGCNKDVNHVVDMYKLDLLVFYGTATTTFVVFDKEATALFGWTCTEMVKELNEKGKAGKDPIGFKEFLFKVELKTTGWCDSYDVSLISFELTILARWRDTQGLVKSGIAPAGPTTHFDGDDFLIFEKKRSIEQLKLSKEFE\n>tr|A0A379C7X7|A0A379C7X7_9FIRM Uncharacterized protein OS=Peptoniphilus lacrimalis OX=33031 GN=NCTC13149_01564 PE=4 SV=1\nMDKKTDAPTFTKEQFLNAKDPIGNVDALYAILEDGKEYTKEEALKIYEDFMNREVK\n>tr|A0A2I0I053|A0A2I0I053_PUNGR Uncharacterized protein OS=Punica granatum OX=22663 GN=CRG98_042231 PE=4 SV=1\nMVKQGFEGRSRRNRSPRWCQRHPKSLVAMVWAAQQRREGVVKETHKTHRIGRFNGILLKTDRFNGSDGSKLQFRFSGESDRTWCRFSEPAGPDHGPSPPATAPARSRSGCSLRSTPARYTFEGVVCLFVGEHCHHRGDEVPGGP\n>tr|A0A1L9V3M1|A0A1L9V3M1_ASPGL Chorismate synthase OS=Aspergillus glaucus CBS 516.65 OX=1160497 GN=ASPGLDRAFT_40709 PE=3 SV=1\nMSTWGQYFRVTTYGESHCRSVGCIVDGCPPGLQLTEDDIQPQLTRRRPGQSVLTTPRNEKDRAEIHSGTEFGHTLGTPIAIMVRNEDHRPRDYGGQTMEVFPRPGHADLTYLQKYGVKASSGGGRSSARETIGRVAAGAIADKYLRLVHNVEIVAFVSSVGREYLNPPTPEHPSGINPEFQQRLKGITRSIVDQFEPVRCPDQEASQRMIRVIERFRDEHDSIGGTVTCIIRNVPTGLGEPCFDKLEAKMAHAMLSIPATKGFEIGSGFAGCVMSGSAHNDPFVRQNRVLVTKTNHSGGVQGGISNGSAIYFTVAFKPPATIGRPQSTANYQLQDSVLEAKGRHDPCVVPRAVPIVEAMTALVLMDALMAQYARDAARGITGASGWGNKCV\n>tr|A0A7N5JEP9|A0A7N5JEP9_AILME 
Lipocln_cytosolic_FA-bd_dom domain-containing protein OS=Ailuropoda melanoleuca OX=9646 PE=3 SV=1\nMPPNLSGYYRFVSQDNMENYLRALDINVALRKLVCLLKPDKEIIHTGDHMTIRTLTSLRNYIMDFDLGVEFEEDLGPVDGRKCQTTTQTR\n>tr|A0A353MIV1|A0A353MIV1_9DELT DUF490 domain-containing protein OS=Geobacter sp. OX=46610 GN=DDY22_22195 PE=4 SV=1\nMRRAALYIGCALAGLLLLCLLGLFWLLDTTAGARFAVTALTGAAGFNISMQGVEGRLLDRLHLTGVRVSKPQLRAQIDRLDLAWEPRQLWNGHLQVHELAVSGVRVQDDRPATTEPPQLRWPRVSAPLRGLSAQLSRLKVKDLSYRHLEAAPLLVTELTGSLHFKDGLLSASQLSLLSPDGRVSGEIAAGLWHPSLRLDLAVVPAQPVQELDFFSLQARLLPGRLPEQLAGGIVVAGRSGGARRLELTGELGIAVNALNLRRLKLSRPGSRGTLTGDVSMLLSKPEPLFSLALRATDLDLAKELKLQLPTRLSGTVTFSGSLSNFLGSFDLANSGPGWQTASLAAQYRGGPTGVKLAPLTGKLLDGRLRGALEVAWSEGLRISGNLAGRGLNPGRLAAQWPGLVNLDLAGKLEMPEQGVARGELRGKLLESRLHGRDLQGELVAAFAGERLRIDRLLLRGRGFNLQGAGELDRRLNLAARVSDLSGLVPGAAGQLQADGWVRWRDGLFSGAASGQGANLAAAGVSAAALRLDARLGEGKSPPVYLDASLNRLRVGRFQADSALLTLQGTPASHTLTAKLSSSSFAEAPADSSAFAEASASAKTLAELRVALSGGYRDGVWRGELTRFSGRDGVGPWSLAAPTPLMLSAQRMRIAPLVINGLPGERVEVAGELERQPLSGAVRGAWGGLNLARANAWLDGVQLAGASSGDLSLRLLPGERLILTGRAEAKGTLVADGQRVDLERLAATLQGDAGGLRAAVDLTLAGGDGEAHLLFTSTDPASLALPKRGDLTLNWSEFDLALLRPVTPAGLIVDGRSAGLVRGKLLPGSKLELRGNAALDQGHLNWRAEGDELDASIDSAELSFSWRGGTQGAGKGGAGLLTLNARAAATGLYTSKGQRIALIRGTLRADADEQGSRAGLDLTLEEGGALRVDLSSDSPASLGIPETGDLAMEWGGIDPALLKPWLPGTLDLQGEFAGEASGRLLPGKRLEMAGQAEFSQGRAKWQGENGEVSANLRSANLSWNWRGETLSGALSLALAEYGQARGSFVLPIPARLPLLPDRNGALQGALAGRVQERGFLTAFLPGLVQESHGDLDLDLKLAGTWSDPRIAGSLQLSKAGAYLPTAGIRVSDVQLMARLEGDQVRIDNFRAVSGAGHIEGNLEARLEGWQVAEYSGTLSGERFQTVYLPELQMVTSPQLSFKGGGDSVTLRGELRVPEMLVSGPPVRQIVTPSGDVIMEGAPPASEGKPFPLALDGRIRVVLGEKVEVKASGIDAQLGGSMDLVLQGVDSITSSGEIRVVKGRYRAYGMDLEIVRGRVYYVDDPVDQPTLDILALRKVGDVRAGVTVAGFLKAPIVKLYSEPPMPEVDILAYMVLGHPLGASSEQGNMVAMAATSLFSLGESSSVQEQIKDRLGLSVLGVETVDTAGVGLMGYKEIPVTPTGEAQARPAAAESLLTVGKYLTPQLYLSYGRSLITGGNLFMLRYDISRRWQLETQSGSESGLDLYYKLEFN\n>tr|A0A1R3FS38|A0A1R3FS38_9VIBR Diguanylate cyclase OS=Vibrio sp. 
10N.261.45.E1 OX=1903177 GN=BH584_20360 PE=4 SV=1\nMKVTRKYILRFSIALAVVSMILSAVQFNRTEKSLLESNQLFFRTIVNASYDIVDTTVNEAIKTYLKGITDTVASHVWHATPEQEIEQVKQIASELHIGQSGYIYLMSPQGVHLYHPFLQGKKRGHLTHIQKQLSIDSGMSEYFHANPHEISRRAKVAYSMRLPSGNTLVATTYKEELMYLVDIEGLKDKLRKYAFGDSGYVYIIDLKGDLVLHPDYEHKSLQSLIGYSSQLLIDRIATKPEGHFSYSVSSDSGTSSKNVFYKFYPYLNWVISAGILEQELNRNHSLLFISLMALVVSLLCIIVVLVLYLRHRHLKILDVASLDYLTGLPSRRSFIEQLKLKIAQRSPNSLTNVGVILLDIDHFKRVNDQYGHAQGDRVICEVAKSLKRFVNRRRLIARYGGEEFILVTFDCDERELFELSEALRLCIQQLQGLVSPVTISAGCCHAQALTDIETAIDQADKALYQAKESGRNNTQMYRENEYRVAYM\n>tr|A0A509DWZ7|A0A509DWZ7_9HYPH Uncharacterized protein OS=Thalassocella blandensis OX=2584524 GN=TDB9533_01798 PE=4 SV=1\nMQNKSSQATFENLTQFRTIRRKQMSGGTELPAMTPNEVTAKVVEDINFLRGRIDHIKKAKHANTNPSILKTYESMLESRETILAWLDENYHIQINQSAQVATASAKTSSN\n>tr|A0A7C3D3X0|A0A7C3D3X0_9BACT Ubiquinone biosynthesis protein UbiB OS=Bacteroidetes bacterium OX=1898104 GN=ENK07_06575 PE=4 SV=1\nMAITSAPRKLKRTRQVMSTLARHGLGAFAAGARRWYTTVLPYRKARPGVEAIPVEVRVRIALEELGTTFIKLGQVLSMRPDLIPHSLAQELEKLQDKAAPLPFDVVEKELARALGPDFREQLGEIEPEPLASASIAQVHRATLPSGEIVVLKIRRPGIKRQVETDLAILHDLARMAERTVTELELIEPTRIVEEFARTIRREMDFIREARNVERFRRHFRNDSTIYVPQLYWKFCRENLLVMEWIDGIKVSDVEHLRKAGLDPKIIAIRGAQAILKQVFEHGFFHADPHGANVFVIKGNVIVPLDYGMMGSLDDRLVRQIEDLLIGIVRMDVDRIMTVLENLGSIRPGTDTRSLYSELYDFLDRYYHVPLYQLNTPELVGELLDIVRRYRLRLPPDLVLMIRSLMLAEAGGRRLYPEFDMMTLAKPYVKRIIMRRLSLKRRIKEAPDTLEEVETLVRLAPKQVQSILSKASQGELSVRVDPAGIPEILHELDRSSNRLAFAMICAALVIGSSITISAGFGPFLFGFPLLGVVGFGLAALLGFWLLFSIMRGGKL\n>tr|A0A1Y0RNH2|A0A1Y0RNH2_9CYAN TonB_C domain-containing protein OS=Nostocales cyanobacterium HT-58-2 OX=1940762 GN=BZZ01_25955 PE=4 
SV=1\nMSYVSLLKNIPEFLSQPTGIAAIASLGIHGAIALLLPIVPMASKPKQEQPSSKSSVGLVELSQAEQSRLPKPATPQLSLQPQAPVLPQVPPTNFANQSIPPLPPLPPPAASTELILPPLPKTDNLAVASLPKGQSLPILSKRDLQPDTSLRTKSRPFSPFVDRVKLGEPKPLESARIPDNIPPVQAANIPQEQDLVNTAAPMSSDQVATALPQGSTATQTTQPGDEVSQVARKQQLVTPVVQPPQARDSSIALGGQNLPQLPQGSNFTAPELPPLAAERSLSTPKTFAERFTEVKNQYPNLETKQPIAAIVDAKAGTEGNVEGDLVVNPQGQVESINFLDNSVASELKTSVREYFRQYFQSNPVQANGKPKFYPFNISFKLNSSNISKTPAQGLSTSSQVNQAQRSLVQRLRSVEVSSQPSKEPQKLNQVERLRSSSVNQQVSQTNQKTSAPQASQERQTSKQQVILRQTTSAPQTNKEEQTSRQQVVVRQSASSLQTNKEEQTSQQQVVVRQSTSAPQTNQEQTSQEEATNNQPSASIESSKKLLQQLRQIRDKRQTSNQEK\n>tr|A0A3G1T1W8|A0A3G1T1W8_APPPP Immunodominant membrane protein OS=Apple proliferation phytoplasma OX=37692 GN=imp PE=4 SV=1\nMEANQQKKILIGVGSVVGALVLYLILAWSISFWPFSSQSKQEIFDDLSNKITFSTDLEETNTIFNKAATERKKQFKEGFIDNKVNKLVELANKLTTPKITDGDKKTSFDSASASLKEITDNQTLLLNHNDDFWKAETNKTTVQGEIKKIIDAYVQFKTQIKTALDLK\n>tr|D4KZC5|D4KZC5_9FIRM Uncharacterized protein OS=Roseburia intestinalis XB6B4 OX=718255 GN=RO1_22070 PE=4 SV=1\nMGQSHNKSSFVLEKDRSAAKINHMEGMV\n>tr|A0A261RL90|A0A261RL90_9BORD Uncharacterized protein OS=Bordetella genomosp. 
9 OX=1416803 GN=CAL26_00210 PE=4 SV=1\nMFSWFKQGLGAYAPAPVGASRRDKILGALGALLGLSCTEWIARHALGEASPWFIAPMGASAVLAFAAPASPLAQPWSLMVGNVSAALVGVFFSHLIPAPGLAAACSVAAAIAVMFALRCLHPPSGAVALTAVLGGPSIAQLGYGYALYPVAVNSAVLLCIAVVFNGVLKRNYPHRHVQAAPAALNRAATPLGFTGADLDEALRSHDQLLDISREDLADIVLEAERRASLRRFGGLACGQVMLRDAVVVRDDEPLDAALRLLDRHRLAALPVVDGQGHLLGLLAHGDASARTVRLASAPGAPSRASLARDCMRSEVAYATPAMPAIELARPMASGIACVPVVDDARRLVGVIHASQLIDALYQLALASGDSAAGNPAARRALDVAA\n>tr|U3PX63|U3PX63_POPTO Cytokinin dehydrogenase OS=Populus tomentosa OX=118781 PE=3 SV=1\nMAENPTITICLMAILFITRLASTLGKSKSWTGLLPPQIQTLDFARHLHVEPDAIKSVSSDYGIIVHENPAAVLYPSSIEDITSLIKFWYNNYTPFTVAARRHGHSVGGQAMASNGVVVDMTSLRNHKNGTGITVSKCPSLGFYADVGGELLWIDVLHSTMEHGFAPVSWTDCLYLSVGGTLSNAGISGTTFRYGPQISNVYEMDVVTGKGELVTYSSHTNSELFYAVLGGLGQFGIITRARIALEPAPNRVKWVRILYSDFSAFRRDQERLISINGRKQKNALAYLEGSLLMAQGPPNNWRSSFFPSSDIPKIMSLVTQHAIIYCLEVAKYYDDGTRHIVDQDLQQLLKGLSFVAGFMFEKDVSFVDFLNRVRSGEQKLHSQGLWDVPHPWLNLFLPKSRILEFNKGVFHDLVLKRNITTGVVLFYPMNRKKWDDKMSAVIPEEHIFYTVGFLHSSGFNDWQAYGHQNKDILKFCDTAGIEIKQYLPLYNSNKEWINHFGSKWRNFRERKAQFDPKMMLSPGQRIFNDI\n>tr|A0A5B7BHJ3|A0A5B7BHJ3_DAVIN Uncharacterized protein (Fragment) OS=Davidia involucrata OX=16924 GN=Din_037375 PE=4 SV=1\nQRRTVFNSDGSSKSKLQIDGDAASEDVGFDKIYPVESFSSESEGEEMEENSSRSYLKEVEQSKKKAGLERRLSASSLDSAGNDSSTIKMSSNLHDKNEPLSKEIVFDESDDETGNDQDNIPWLKHHDSSSDKKSNLPINEFPKTRQYNAAADEKHLYSQHSDRDRKPASMRTRRVHRD\n>tr|A0A327WVV0|A0A327WVV0_9BACT Outer membrane receptor for ferrienterochelin and colicin OS=Larkinella arboricola OX=643671 GN=LX87_02312 PE=4 
SV=1\nMLVSIAAHAQAPVLFSGSVREITTQEPLQGVHVYVRDHRLGTVTNNAGYYTLALPARDSLTITFSSVGYQTVTRTISSHRPQPLDVYLIPGQTLNEVAIKAQAPLQKGSDLAQMSQIQLPIEQLNKIPALMGEKDVLRVLQLMPGVQKGSEGNAGVYVRGGGPDQNLITVDEAVVYNPSHLLGFFSVFNGDALKQVELTKGGFPARFGGRLSSVIEMSMKEGDRHDLHGTGSIGLIASRFTLEGPLQKGKSSFLLSARQCYLGALTQLLSPRPVSDLPSRSGFGDYNAKLSFDLGARDHVYVSGYTGSDQFRSQQTYDKQVLDAGLNWGNTTGTLRWTHRFSNRTSAHTALIFSQYRMRVVSEETVTAEAPGQPGAILRLEYLSSIRDLSLKQDWDLYAGSGHQLRFGFQITPHRFTPSAVVTAESQAASLSRTSDQAIQVVESGAYVEDFWQPTDRWRINAGLRLSYFWHKQTQYARPEPRLSVGYKLPGDWTLKGAYAQMNQYVHMLSNTGVGLPTDLWVPTTDRVKPQQSEQIALGVVKDINSDITLTVEGYHKTMKNNISYREGANFLVTDITATGDKARWEDNVTAGRGWSYGGEVMLQKKTGRLSGWIGYTLSWTQWQFAELNGGRRFFPRYDRRHDLSLVAVYELSKRINVSGTWVYGTGQALTVPLARYYASANNPEHTTTPAANPFIDTRNVKDYGEKNSFRAEPYHRMDVSLQFHTRRKSWENIWELSVYNAYNRRNPFYYSLEGKGGSEGIASKSVLYRYSLFPVIPTVSYRFTF\n>tr|A0A364VAY8|A0A364VAY8_9CORY Coproporphyrinogen III oxidase OS=Corynebacterium heidelbergense OX=2055947 GN=hemG PE=3 SV=1\nMTPRVAVIGAGIAGVSAAWELRRQLGPEANIMLVEAYDRIGGKLKTVNFAGGPVDMGAEAFLAFRRDFVELVEQVGLGHQLRAPSTEYTSSLYCRGQLVDVPAATVMGIPARGEDVQAILPAEERRRIDEERGGEPMTWEPGQDAAVGQLVEARFGRAVVDRLVTPLLGGVYSCGADGLGVRSTIPQLAAALDRAGAGGAQFYLSDVVADLLAVRTAGGARRSGPVFQTLAGGFRSLLEQMVLQADPEILFNTAVESIGRSREGWYLEPIGTVDGVVLAAPAPTAALLLRDVADTAAGILSDIELSSSVVVGMRFASDHGIPERSGVLLGPDAPTEAKAFTFSSRKWPHIAEHGGAFVRASYGTYDQPWYVELPDRALINFAAEDLEAITGERKRPEEYFVQRWHGGLPRYGVGYAEALKVAMDSVAAVPTFALAGAMVDGVGVPATAASGIAAARRLAADLSPSPRP\n>tr|A0A0N4SWJ4|A0A0N4SWJ4_BRUPA Uncharacterized protein OS=Brugia pahangi OX=6280 GN=BPAG_LOCUS6 PE=4 SV=1\nMTVRIKVENGFERITVDNNMYARQFRNTQHPVSGSIAVDGAAGEKNWSTGALRCIEARLTNQYCTSAAQRERRECRDASDARVEMRESC\n>tr|A0A2D1UI31|A0A2D1UI31_9INFA Protein PB1-F2 OS=Influenza A virus (A/swine/Iowa/A02215363/2017(H1N2)) OX=2007353 GN=PB1-F2 PE=3 SV=1\nMEQEQDTPWTQSTEHTNIQKEGNGRQIQRLGHPSSIRLMDHYLKIMNQVDMHKQTVSWRPWLSLKNPTQGYLRIHALKQWKLSNKQGWIN\n>tr|A0A7S3I079|A0A7S3I079_9SPIT Hypothetical protein (Fragment) OS=Favella ehrenbergii OX=182087 GN=FEHR0123_LOCUS5015 PE=4 
SV=1\nMSIKCLAARQNKSAAINSYGELFMWGSSKNRSLMHASGNGHKDNLKLPTVFESETLLFTKVAVGNEHVAAITEDGRLFTMGTTEHGKLGHPPQELNEEEKQKERDRYKRAGYKPGGLDRSKPAFGFVEGELAGKKIVSVACGDKHTVCVTEDGAVYSWGNGRSGALGHSNTENSAEPKRVEGLSNIVRVDCGTDHTIALDSKGKLHSFGSNTYGQ\n>tr|A0A1S1HUD1|A0A1S1HUD1_PROST Uncharacterized protein OS=Providencia stuartii OX=588 GN=A3Q29_01410 PE=3 SV=1\nMQFPPCPKCQSEYTYTDNDMYICPECAHEWNDAEPVVESDELIVKDANGNLLVDGDTVTVIKDLKVKGSSSMLKIGTRVKGIRLVEGDHNIDCKIDGFGQMKLKSEFVKKN\n>tr|A0A369D4D8|A0A369D4D8_9BACI AsnC family transcriptional regulator OS=Bacillus sp. AG102 OX=2184001 GN=DEU45_10192 PE=4 SV=1\nMQLDRVDRKILNELYNDSRLSMRELAKRVNLSAPSTAERVRKLESEGVIQKYTIDIDYKKAGLVLDCILEITLKNGDTTRMQQFIQSYPSASFCYRVTGSLCYIVKISVPSLVELEEFINDVSSYATTVSHIVLSEVSLTPDIEHIFPED\n>tr|A0A370DS84|A0A370DS84_9GAMM RNA polymerase sigma factor RpoS OS=endosymbiont of Escarpia spicata OX=2200908 GN=rpoS PE=3 SV=1\nMDEPNDANAAGEDSVSSDKPEVSPKPETAQKLKKPNARAAREPNDAQMDATRLYLNEIGISKLLTAEEEVYFSRLAQKGDQSARQRMIESNLRLVVKIARRYMNRGLALLDLIEEGNLGLIRAVEKFDPERGFRFSTYATWWIRQTIERAIMNQTRTIRLPIHVVKEINVYLRAARQLAQTLDHEPSSEEIADLLDRPIGEVKRMLGLNERVTSVDTPYGKDADKPLLDTIPDERASDPTVDIQNDGLNANLDRWLEKLNDKQREVVERRFGLHGYENSTLEQVANELGVTRERVRQIQMDALRRLRDILERDGFSVDTIFK\n>tr|A0A2C5Z117|A0A2C5Z117_9HYPO Uncharacterized protein OS=Cordyceps sp. 
RAO-2017 OX=2004951 GN=CDD83_9509 PE=4 SV=1\nMKTDSLSPLFLLSVDASDGPRTTTCDRFVGCHRYDDCRQPTRRPTYANTIIIRTPPLPPAVMAGGRPTTPPTSIVPSPCVPRIMASLLPLISDTPSHGHARLGSGGDGRLAAARCCSSYRGRIRSHPACHRQSTRQNGRSWSVSPTETEMASF\n>tr|A0A6J3K058|A0A6J3K058_9HYME zinc finger protein 271-like isoform X3 OS=Bombus vosnesenskii OX=207650 GN=LOC117231473 PE=4 SV=1\nMNSEQHALPATTQAQQEDVNAGQSGRPSYPGGLATTTSLGNVGSTPHSSADLRVSVYHHSHHNSSHRSSGGGEASSKEPASSLNQEMALTSSSHHQSTPTHHHHQPSVSSSSHHSSLQPNSQQIPVSLPGLNLDGAHIPASVSHLQAAHAQMQQMQAAQQQQLHQQQQQQPQQQQQQQQQQSHHQMQSHQNAQNSGPTAHNQNAQRDDNKVKDESGSCTTERCSDNQVHCQVQCDLQLQTSQDLQQSLMQQQQQQQQQIGVNISGNSSSEGGSQNNTEKPEKEKELRQLNMTQFQVPDLKPGGHMMDVRTADGSVVKISAGNEQDLAKTLGVEMVQNMYKVNVEDINQLLAYHEVFGKLQSEIAAGTTLVGSTVPTQTVTTIQNGTPIVQQVQLNKFDIKSSDGEATPGPSASPVSVGSHACEICGKIFQFRYQLIVHRRYHTERKPFTCQVCGKAFLNANDLTRHGKCHLGGSMFTCTVCFHVFANAPSLERHMKRHATDKPYNCTVCGKSFARKEHLDNHTRCHTGETPYRCQYCSKTFTRKEHMVNHVRKHTGETPHRCDICKKSFTRKEHFMNHVMWHTGETPHHCQACGKKYTRKEHLANHMRSHTNDTPFRCEICGKSFTRKEHFTNHIMWHTGETPHRCDFCSKTFTRKEHLLNHVRQHTGESPHRCGFCSKSFTRKEHLVNHIRQHTGETPFRCQYCPKAFTRKDHLVNHVRQHTGESPHKCQYCTKSFTRKEHLTNHVRQHTGESPHRCHFCSKSFTRKEHLTNHVRIHTGESPHRCEFCQRTFTRKEHLNNHLRQHTGDSSHCCNVCSKPFTRKEHLVNHMRCHTGERPFVCTECGKSFPLKGNLLFHMRSHNKGSNAERPYRCDLCPKDFMCKGHLVSHRRSHSDERPHSCPDCGKTFVEKGNMLRHLRKHAAEGPPTQVSTPSAIPQSGVLPIPAAAVLVGHPLAPPAPPVVPQHTVVVPTPPGVLTSY\n>tr|A0A7V1JCS3|A0A7V1JCS3_9BACT Histidyl-tRNA synthetase (Fragment) OS=bacterium OX=1869227 GN=hisS PE=3 SV=1\nMNRPVQPPKGTRDFLPEEMLLRGKVIETLRECFALYGFIEIDSPVFEYFELLSRKCGSEIEKEIYTFDDKAKRKLGLRFEFTSPLGRYYAANRSRLVKPFKRYVIGKVYRYENTQAGRYREFYQADADIIGSYSMNVELELLNLAIFTLSKLGFGDYEIFINDRKILDGIVNAAGIGEDKKDTALRAVDKMAKIGEQGVIKEFAENGIAEDNYKSFMEFIELDKDLSDIGKLSALGGRINAAVKDEFIKNKALEGIEELLSILKNAEAIGLDFITYDPLLVRGLGYYTGPIFEIKSKDVSIGSFAAGGRYDNLVELYGARPEGACGISFGVERIIDIIKERDGKTLELQAFPVKLYVIYLSEDERSYAYKNAEALRLNGINTELCISNR\n>tr|A0A0F0I472|A0A0F0I472_ASPPU Classical c SDR OS=Aspergillus parasiticus (strain ATCC 56775 / NRRL 5862 / SRRC 143 / SU-1) OX=1403190 GN=P875_00053022 PE=3 
SV=1\nMTKITIPTTPPSRSLQGKTAIVTGAGCLGNGIGNGRAIAILLASDGCNVLCVDRNLEWAERTVDMIKAQAEDALVEGKSNYGHATAIQADVTIAADCESIVSTALTTFNRLDILVNNVGISGAAGTAVDVDMEAWAKSLEVNVSSMVLVSKYAIPAMMKNERDEYSGMCGSIVNLGSVAGLRGGTPHLLYPTSKGAVVQLTRAMAAHHASDGIRVNCVCPGMLFTPMMYGGGMSEEAREARRKRSLLQTEGNGWDCATAVVFLAGPHARWMTGVILPVDAGTTAAVGIGMPKSASVNG\n>tr|M1EY39|M1EY39_9HYME Protein Wnt (Fragment) OS=Hypoponera sp. Mal1 OX=1157064 GN=Wg PE=3 SV=1\nLPAFRVVGDNLKDRFDGASRVMVSNSDRTRGNSNTITSNSASNSVHGHRDGPRRRHRYNFQLKPYNPEHKPPGPKDLVYLEPSPPFCEKNPKLGILGTHGRICNDTSIGVDGCDLMCCGRGYVREDVMVVERCNCI\n>tr|A0A452QU07|A0A452QU07_URSAM Uncharacterized protein OS=Ursus americanus OX=9643 PE=4 SV=1\nAKQNKDKKDEIIKRKEAPPHEGLEIEEPSSLGLMVGGPDPDLLTCGQCQMNFPLGDILVFIEHKKKQCGGSLGACYDKGLDKGSPPPSSRSELRKVSEPVEIGIQVTPDEDDHLLSPTKGICPKQENIAEPPPRGLCSVQATVFASGPSSEPGRPRKGRGPWQPVFLRQDGTGTRVDEGSHPAGPAASWGQASVS\n>tr|A0A4R6LBV2|A0A4R6LBV2_9FLAO Surfactin family lipopeptide synthetase A OS=Flavobacterium sp. P3160 OX=2512113 GN=EV143_10517 PE=4 SV=1\nMGYDLFTKLKKLNVTVKVTDGQLDIKAPKGVLDEELLIEIKTKKEDLINLIGKYTKDKANEKNQIPVAPKSEHYPLSSSQKRLWVLSQIDTANFSYNIPGLQVIEEVLNVNAFMLATQDLFNRHEILRTVFKSLDNEDVRQFVIAAEDFEFPFQQIDVDNDEVKLNEILAEVKNTIFDLEKGPLFKGVLVRVTDNKWVFSYNMHHIISDGWSMDIMINELLNNYILRRKDEFVSGLPLKIHYKDYAVWQQQRLADKEFDKEKNYWLTNLEGDLPTLAHFGDNPRPAIMTYNGSVVKRTIETLLIQRFKSFCQEQEGTLFMGCLSILNVLLHKYTEQEDFIIGSPVSGRTHKDLADQIGFYVNTVALRTQLEADNSFKEIFQQNKISTLNAIENQNYPFDELLDNLNVKRDLSRSPLFDVMISVQNENQLNQKADDLSYNEFLDRRVSKYDLTFTFVEKAASLTVELEYNMDIFSKETASTLLYHLENLLVEVLKNPSEEIKSINCLDSEEQFELLENFNNTEKQYPDTGSIVSFFREQVQKTPQNTALVYKDVSFTYLELDALSNQLSNYLEKQYLLDNEDFIAILLQKNEWQIIAILAILKAKCAYVPIASDYPESRIQFILEDTKCKLVITEEEIANFLNVQAEYSDVKTSSPLSPSHLAYVMYTSGSTGVPKGALIEHGGVIRLVKENNYVQLTGKEALLSTGSFSFDATTFEYWSMLLNGGKLVLCDENTLLSPHELSKIIKEEGITIMWFTVGLLNQIIDDNIELFEGLDTILAGGDKLSFTHIDRLQRSYPHLEIINGYGPTENTTFSLTHKIGILNNTNIPIGKPITNSTVYILDKNDNLVPKGVMGEICLGGAGLSRGYLNQPKLTREKFVSHIFKGNERLYKTGDLGRWLKDGTVEFLGRKDNQIKLRGYRIELGEIESVLSQHEAVNSSLVMVHQDNENEKVLVAYITVNTPVNISNLKQWLSERLPYYMVPNYLEVLDIFPLNVNGKVDRSKLPLPESINFDKREEYTEPATAFEK
SLAKLWEEVLGISKVGLEDNFFDIGGHSLKATKLISKIHKEFQVKLKLKDLFVHASLQSQCKLIAEAQHSGYSKIPVLTKQNGYPLSLMQRRLWILSQHQAANIAYNMSGAYVFEGDLNVRILEEAFIQLIKRHEILRTSFKEDANREILQYVTEPENVSFTIKNIDLRGTEKLVLDKYLSEDLIAPFDLSSGKLFKANIYRISDNRWVFSNVIHHIISDGWSLGIIVNELLYLYNTLLTGGSVTLTPLNVQYKDYSSWQLKELSDSRLEFHKGYWINQFKGDLPVLDLSGGKQRPITKTYNGGVYNKIISAELSNKLAEFLKTEETTLFMGLLSAVNVLFYHYTKQEDITIGSPIAGRDHADLENQIGFYVNTLALRTIFLKNDTFKTVLAKVKEVVLGAHEHQLYPFDELVSSLNITRDMSRNPLFDVQVIVQNNQDTANTELKNLAVTAYQGELPQSSVFDLVFNFVESENGLATSIIYNSDVFDSERIEQFASHLEHLLAALLQDTELPIEEVKWLSEEEKQHLLSFNSKQMDYDQSKTVIEMVNDQVNKNPEAIAIAFEGTQITYLELHERSNQLAHFLLENYTIEPNDFVGIMMDRSELMFIGILGILKAGAAYVPIDPDYPVSRKEFILKDTNVKVLLTQSDYIFDLAYYQGEIFAMDLQMDTLTNSVTNSEINVLPEHLAYIIYTSGSTGNPKGVIVTHANLQHSLAPRNDVYVPIKCFLLLSSFAFDSSVAGIFSTLTNGGKLAITTNANIANVNFIADYIVAEKVSHLLTVPSYYKLLLMALQGKETALEEVTVAGETCPISLIEDHFKSKIGQSGCQLFNEYGPTECSVWSSVHKYEEGKPVTATIGKPIANTHIYILNDKEDLVPVGVIGELHIGGNGVTKGYLNNSELTNQKFVKDPFQKSGLMYKTGDLGRWNSEGEIEFLGRKDNQVKVRGYRIELNEVQYAIEQSGFIQSAVVLTKENKSGDNELYAYLVADEALNTSDLKNYLKDLLPGYAVPAHFITLSGFPATPNGKIDTKALLEIGDSDNRTGEDYVAPQTEEEIALVNIWQTVLDKEKIGVNDRFFDLGGDSIKVLKIVNGIYNEMRLEISISDVYTYANISKLADFIIHNKKSLDSRKAESTEARKDVVNYIDAIKNSVLESLDQNKSEAIEDLYPMSDIQKGMVYESLLYEGTSIYHDQIINQRQFVNFDISVFRLAMQLMVNKHEILRTGFNMHDYEQEVQIVYKNIEIPVVYQNLSHLDSLKEKEQVIGAFLQSELAKPFDLTSIPLFRMAAFNIGDDMIVFVSQCHHAIIDGWSDSMLLTELNNLYLNLLEDITFKPEKIKASYKNYVIEHEIDKKDTEIQSFWKEELQDSSKLNIFTNTPVSSIYGNILSENEVSELKLLASNSGTTVKEVSLSAYLYMLSILNADPDVVTGLVTNNRPSCEDGDKILGCFLNTIPLRFAINYEVTVKDFILEVQHKLIALKKYERLSLLQIASLSDNQQSNENPFFDVYFNYVDFYTYNKIKSEIKENSNPDKEEESVSLIGANKTNTFLDFNVNTTGDLYHASLSLTKILKSGLTVEQVNDLYFSILRSFIASPHQLLKSVDYLGAKEKHTLLHEFNDTKHEFPSETTLGELFIKQVKNTPDKIALVFQQKEFTFAELNEKSNQLAHYLKANYTLGANDLIAVALPRSEWMITAILAIHKIGGAYVPIDPKHPQDRIDYIVQDSASALIIDAKVLGEFQAVAENYSNENLTLINKPTDVAYVLYTSGSTGNPKGCILEHSGVVNRIQWMWEAFDYTNQDVILQKTTFTFDVSVWEIFMPLCWGTKMVLCSDEDVSIPQNIETLIKNHKVTCLHFVPSMLDVFIDSLFYEAYDFSNLSSLKQVITSGEALQLNTVKKWYEKLETPIQNLYGPTEASIDVTYYTTSKQDTVIPIGKPVWNTSIYILDANNNLVPIGCSGEIYLAGTGLARGYLNRPELTAEKFVANPFAPGEKMYKTGDIGKW
TSDGNIIYAGRNDNQLKIRGFRIELGEIEQCLLEIETLDSATVLARKSASNEIDLVAYIVSNQELDVKGIKGTLKKKLPEYMVPNHFVKLETLPLTLNGKLDRKKLLAISTDSEGQTVEIVKPENDVEKKILQIWKEILSKEEISVTANFFEIGGHSLRAIKLQSMLKRKIGLDFSIKDIYNRPTIKRLASDKEKSNSLLIDLQINNRKNIIYFIPPLTGSSILYHPLAKVLSNEFDSVGFQYQGLEHGEEFSLSIKEMAKSFLDEIKNRQTHEPFIVLGYSMGAAIAFEIVRELEKYYSNIDLILVDRPTTVEADQLELQNMDHQANWLLAEYKKVIKLDEEQEKRTLAFLKNNLVLNNQYQLEGKISSNIYVFEATDNKYKGNMQNWQDYTNGDFKHHYLLGTHWDAVSEQNFESYRELFRSIYKKTSIETI\n>tr|I4C7D0|I4C7D0_DESTA Uncharacterized protein OS=Desulfomonile tiedjei (strain ATCC 49306 / DSM 6799 / DCB-1) OX=706587 GN=Desti_2801 PE=4 SV=1\nMSGKCKMLGLVMLLGLGVTVHAWAVGYERLEVDATKTRTNVVSSNGPAASIAEKCPALLDEVAGVITDLLSQFGIINKKAP\n>tr|M6VC02|M6VC02_9LEPT Acetylglutamate kinase OS=Leptospira noguchii OX=28182 GN=argB PE=3 SV=1\nMEKLLERVNHILEALPYITQYSGKTVVIKYGGAAMAKADLKESFAKDIVLLKYVGIHPVIVHGGGPEINRLLDNLKIPTEFVHGHRVTDTQTMEIVEMVLTGKVNKQIVSLINSQGGKAVGISGKDGNLAKATKAPVEIELEGKEKQLFDVGLVGKIESINPEILHNLQKEGFIPVISPVAENSEGESLNINADTFAGEIAGALKAEKLILLTDTQGILINQQLVTGLNRSKVKDYIRKGEISGGMIPKVECCLTAIDQGVRRTHIIDGRVAHSILIEIFTDQGIGSLIES\n>tr|A0A7G5XKD1|A0A7G5XKD1_9BACT Copper chaperone OS=Lacibacter sp. S13-6-6 OX=2760713 GN=H4075_07020 PE=4 SV=1\nMELITFKTNISNERALQRVAPLLNNAVGSSNWQLDVSGAENKLMVYSPGSINEMQVIDAVHKAGFYAVNIEDFYAIF\n>tr|A0A7X1L7W5|A0A7X1L7W5_9DELT Bifunctional protein PyrR OS=Desulfobacteraceae bacterium OX=2049433 GN=pyrR PE=3 SV=1\nMRKSEMVMDAKDIERTIIRMTHRILEVHKGAADLTLIGIQTRGVFLAKRIQDNIRAIEGTTVATGDMDITLYRDDWTRISHHPVVQATDILFSVDGKEIILVDDVLFTGRTTRAAMDAIMDFGRPDRIELAVLVDRGHRELPIQADYVGRFIETRRSEMINVGLRENDGEDKVLIEERQD\n>tr|A0A3R6LV74|A0A3R6LV74_9CLOT TetR family transcriptional regulator OS=Clostridium sp. 
AF35-15 OX=2293013 GN=DWZ76_13300 PE=4 SV=1\nMEISGNTCSLLNYKLYLNNNGLPEEKSMQQGNTKERIVEAYIELESERPVEKITVTALVERSRITRKTFYYYFKDIYDLMEYRMEREMKRVMEETMSQTDPEKALTQLYMYIMENQKHIRALSESVQFMALRRQMGEKVYQYFYNHLERMGMFKNLTMSEAAMAVQIIIFSVMGVAFDAPFKNEADVKERVATFMSVIRKCTGCDPTRNR\n>tr|A0A7C3N467|A0A7C3N467_9DELT Universal stress protein OS=Deltaproteobacteria bacterium OX=2026735 GN=ENV48_17320 PE=3 SV=1\nMYKKILVPLDGSQLAERALDPAEKLAQFFGSEIVLLQVIPFMPIYGAPELVTPLVVDEKHRESAERYLAALAEKLKAKGLQVSATVRTGQHVAGEILDFAKASAADLIVMNTHGRSGISRWFLGSVTLKVLSRSETPVLLIRSKP\n>tr|A0A1I6UAS3|A0A1I6UAS3_9EURY GTPase, G3E family OS=Halostagnicola kamekurae OX=619731 GN=SAMN04488556_3691 PE=3 SV=1\nMVTSLSEIPITVISGPLGAGKTTLVNRLLNDPGERRIAVIVNDMGEVNVDAELIADETEEGVVDLSNGCICCRLQGDLVDQATRLAEERSFDYLAVEASGISEPIPIARALTDGTEADSLPDRFRLDTTVSVVDAYGFWKAFDSEESLPDAAPDPERPLTEVLVDQIEFCDVLLLNKCDMVPDDARESIEAAIRELQPRATLHRTTYSDVDPSAVLDTGSFDFEAARRQQGWKRALAGDTANEHPDHDHSDDAVSAAEAHGVESFVYRRDRPFHPERFDAWLDDWDGEIIRAKGFAWVASRPETVLGVSQAGPSVQAGPIGEWGDDDPVTRLVFIGSDLDEAAVTTELDDCLASFDERTDEYSTDPFPRKSN\n>tr|A0A126S3A9|A0A126S3A9_PSEPU Heavy metal RND efflux outer membrane protein OS=Pseudomonas putida OX=303 GN=AWT69_001931 PE=3 SV=1\nMPIPRKIALLCLLLAGPAGAQGLSLDQALDAAFSQNPDFAAIGREIGIAEGERRQAGLIPNPELSWEVEDTRRDTSTTTVTLSQALELGGKRGARIEVAEAGQAIARLELERQRNSLRADVIQAFHAALRAQTALELAQQSQALTERGLRVVEGRVRAGQSSPVEATRAQVQLAQAEAAVRRARTERGVANQVLARLTGSAEARFDRLDASNLSPGPAPQAEPLLAKVEQTAEWRLAAAQIERGDASLGSEKAQRIPNLTVSLGSQYSREDRERVNVVGLSMPLPLFDRNQGNVLAAARRADQARDLRNAVELRLRSETRSALEQWGTAMGEVQAYDRTILPAAQQAVDTATRGFEMGKFAFLDVLDAQRTLIEARGLYLEALAQATDARAQVERIYGEL\n>tr|A0A7L9UZJ5|A0A7L9UZJ5_BIFLN Response regulator transcription factor OS=Bifidobacterium longum subsp. longum OX=1679 GN=BL7055_06065 PE=4 SV=1\nMDNDPFALDAMCAMISAVSKDFRVMWSTGSPAVAIEHCHNPHTRPEVLVLDMALGGITGADVCRRIRRRTGGTGIVCVTSYSVDVYQREAIASGAQGLFAKERLRTDIAVAIR\n>tr|A0A7W5LBF7|A0A7W5LBF7_9HYPH Diaminopimelate decarboxylase OS=Rhizobium sp. 
BK312 OX=2587080 GN=lysA PE=3 SV=1\nMNHFEYRDGILYAEDVPVPEIAKAVGTPFYVYSTATLERHYRVFAEAFDDVDAMVCYAMKANSNQAVLKTLGRLGAGVDVVSVGELRRALAAGIPASRIMFSGVGKTAQEMDAALEAGIYCFNVESEPELEVLNQRAVRAGKVAPVSFRINPDVDARTHAKISTGKKENKFGISWQRARAVYERAASLPGIKVTGIDMHIGSQITELQPFDDAFKLLRDLVETLRGDGHDIHHVDIGGGLGIPYRDDNNPPPLPDAYAEIVKNQLRGLNCKIVTEPGRLIVGNAGILVTEVIYVKDGGDKSFVIVDGAMNDLIRPTLYEAYHEIRPIAVGDVSTPRIKADVVGPVCETGDYLALDREMALPKPGDLLAVGSAGAYGAVQAGTYNSRLLVPEVLVKGNEFHVIRPRTTYEELIGLDSIPAWLEG\n>tr|A0A2S0UY05|A0A2S0UY05_9GAMM dTDP-glucose 4,6-dehydratase OS=Colwellia sp. Arc7-D OX=2161872 GN=rfbB PE=3 SV=1\nMKKLLVTGGAGFIGANFVHYWMEKYSADKVVVLDALTYAGNIANLDSVKDEDNFTFVHGNICDQALIETLLVEHSIDTLVHFAAESHVDRSITGPDAFIETNIMGTYSLLKAAKKVWLDGESIVEGHRFHHVSTDEVYGTLSPTDPAFTEDTAYAPNSPYSASKAASDHLVRAYHHTYGLNVTTSNCSNNYGPFHFPEKLIPLVITNILHDKALPIYGDGQQIRDWLYVEDHAYGIDLVLQNGRVGENYNIGGDNEWANIDIVKTISKLVEQEFVKNKDLATRFPAAKAAMTQNTESLITYVKDRLGHDRRYAIDATKTNNELNYQPKESFETGIAKTVAWYLNNEAWWQSVMDGSYQNWIAEQYS\n>tr|A0A7K9XDW7|A0A7K9XDW7_9GRUI KRBBB protein (Fragment) OS=Psophia crepitans OX=54359 GN=Klrb1b_1 PE=4 SV=1\nEDCVDRGAELVMPEDQDELGFLNEILQKPNRQFWTGLSVSPTGKGWTWLNGSRLDQSRFPLSPGDEGRRCGVLKGGRITSQNCSSEFQWICQKEATQL\n>tr|A0A0R2NXL2|A0A0R2NXL2_9ARCH RNA-binding protein OS=Nitrosopumilus sp. 
BACL13 MAG-121220-bin23 OX=1655561 GN=ABR53_02015 PE=4 SV=1\nMKSNLISKSETASLLKKISDAWGIEFPKMKNVKVHQILSDAQIITGDGLKILKINEDYLPFLSETEILKKFPSVEVDMGAVKFMCKGANLMRPGIKKFTEFEKEKLVCIVEETHHKFLAIGKSMVSSSELENMEKGEIIQNLHYISDRFWETGKTIYN\n>tr|A0A6I3FRK9|A0A6I3FRK9_9ACTN Uncharacterized protein OS=Actinobacteria bacterium OX=1883427 GN=F2575_05150 PE=4 SV=1\nMRLVHPLIWWLWALLLATFVIRADNILIAAAVACAVTLVVVKLKNDNYWSKSFALSIRLALLIIVVRMLIAITIGVPMPGQILFRIPSITLPSWMVGIRIGGDVTSQRLTSTFHEVIIIATVILLCGAANSLASPHRMIRSLPKAMYNLGVALSVATSVLPQIVKSIGRIQSAKRLRGQKTRGIRAWRGIALPLLEESLERALDLATAMEARGYGYHGKTTKYRAEPFTFIDLVMIASGVYLVLLSATLLSHFSVVVLALFSLVIVASPIAIVKR\n>tr|D5EYN5|D5EYN5_PRER2 Uncharacterized protein OS=Prevotella ruminicola (strain ATCC 19189 / JCM 8958 / 23) OX=264731 GN=PRU_0725 PE=4 SV=1\nMGIVAVLAVVRAEFPQLAEPRIAESHVEVNADSVAAAMPHTDFSATATAKKHKIYSVPSFKACFPDTQSVQLAAAMKWGVKRVKNREDAEKRKSELVYVGANPYVHIDKLYSSIPYLVPRAAVLLQDVGQAFFDSLYVKGIALHRPIVTSVLRTEADVTKLRRHNGNATENSCHLYGTTFDICYNRYETVQDPDGPARRAVRNDSLKYVLCEVLRDMREQGRCYIKYEVKQGCFHMTVR\n>tr|A0A0F8VXL6|A0A0F8VXL6_9ZZZZ Uncharacterized protein (Fragment) OS=marine sediment metagenome OX=412755 GN=LCGC14_3138660 PE=4 SV=1\nMYRGFRVLVDSALGTLAGAFATNSNRDRAGLLYDKNIAQHNGGVETGSNAYKNWDVLRGRVSANDDQVAVIGEGIVYEYTLGSTTWADASATARANDCFHIYFSCTAAQGASEIAKGGGDYGDTSGVKYIYEYSPWTALAATADIIVPNYYSLGAWANFRVPFPHNTYNTVSTIGDKFGNSTSPFEPATLDSNNFHLDHTGGTGFNQDNAEDFAPFTALELQGLIDYIVVSSGDGVALQADFKMRCTCYDTSDNVVVVDFTIPHRNNYFHVSLPLTQFKNYRARASRRWGDVISNLEPAELEIQEQFEWKNLCMISIQTQDSYDDQGRYFPEDGLFLK\n>tr|A0A1C4Z724|A0A1C4Z724_9ACTN Potassium-transporting ATPase ATP-binding subunit OS=Micromonospora matsumotoense OX=121616 GN=kdpB PE=3 
SV=1\nMREKAMTTSTPAPHGTADAATAGTPATQGNRGGGLLDPRQLLRALPDALRKLDPRTLWRNPVMLIVEIGAAFTTVLTVADPSVFALAITVWLWLTVIFANLAEAVAEGRGKAQAAALRRAKTDAVATRALDWSRGAAPGTYRTESVPAPQLRQGDVVVVEAGETIPGDGDVVEGIASVDESAITGESAPVIRESGGDRSAVTGGTKVLSDRIVVMITQKPGESFIDRMINLVEGANRQKTPNEIALNILLSALTIIFLLAVVTLQPLAIFSKNFQAAAPDSNAVTDGGVTGIVLVSLLVCLIPTTIGALLSAIGIAGMDRLVQRNVLAMSGRAVEAAGDVNTLLLDKTGTITLGNRQAAEFLPVDGLDAAGVADAAQLSSLADETPEGRSVVVLAKNEFGLREREPGLMPHATFVPFTAQTRMSGVDQGAQGGAGGARRIRKGAAAAVMKWVRDNGGHPTEQVGQIVDEISGLGGTPLVVAEHVDGQPARALGVIHLKDVVKAGMRERFDEMRAMGIRTVMITGDNPRTAKAIADEAGVDDFLAEATPEDKLALIRKEQEGGRLVAMTGDGTNDAPALAQADVGVAMNTGTSAAKEAGNMVDLDSDPTKLIEIVEIGKQLLITRGALTTFSISNDIAKYFAIIPAMFAGIYPGLDTLNVMRLSSPESAILAAVIFNALVIVALIPLALRGVRYRPGAASKLLSRNLLVYGLGGIVVPFVGIKLIDLLIQFIPGVS\n>tr|A0A2V1NJD8|A0A2V1NJD8_9ACTN ABC transporter OS=Streptomyces sp. V2 OX=1424099 GN=DF268_33570 PE=4 SV=1\nMTSTTPHPDGALPRPAVQLTSVTRRYGPGVTALDDLSLTLPAGSFTAVMGPSGSGKSTLLQCAAGLDRPTSGSVRLDGTELTGLSERRLTLLRRAHIGFVFQSFNLLPSLTAAQNVALPLRLAGRRPSSARVREVLARVGLADRAGHRPGELSGGQQQRVALARALITRPRVLFGDEPTGALDSTTGREVLRLLRGMVDAESQTVVMVTHDPLAASYADRVLFLVDGRVHGELAGAGAETIAARMTGLTAAETPPGPRRTGPDPHGTADLHDTADPHGLRDPHDTGDPDSARPNPQGTPTARQETLPC\n>tr|R8RZS5|R8RZS5_BACCE Methyltransferase OS=Bacillus cereus HuB4-4 OX=1053211 GN=IGM_02991 PE=4 SV=1\nMNELEYKSFYDKVGRLNGWDFSKIKCETVGDTWDFYSEVKERCKPSHILLDVGTGGGENVLNIASSAKLLIGIDNSNGMIATAHSNLKKSGVQNVEFLQMGSEALTFPHAHFDIASSCHAPFLASELAKVMKKGAFFLTQQVSENDKLNLKEAFGRGQCLGERDGTLKEKYMNELISAGFDLVQVREYDVTDYYSRSEDLIFLLKHTPIIPRFGEQEEDFTILQKFIDTYSFEKGIRTNSKRFMIIAVKP\n>tr|Q8EYI3|Q8EYI3_LEPIN ABC transporter ATP-binding protein OS=Leptospira interrogans serogroup Icterohaemorrhagiae serovar Lai (strain 56601) OX=189518 GN=dppD PE=4 
SV=1\nMIRIENLTISYYTKSGFGLKKSRIVAVDGVNLEIGKNEIIGLVGESGCGKSTLGRGLVKLLKPEFGSIYFEDKEITSLSSSEFFPFRKNIQIIFQDPYSSLNPRMTIAEILMEGLEIHEKTSREEAETKIKKILEKVNLSSDILSRFPHEFSGGQRQRIAIARALVLKPKFVICDESVSALDVSTGTQVLKLLVELKNEFGLSYLFISHDLGVVKSISDRIAVMYLGKIVELGNTKNIISSPAHPYTKALFQSTFDVYDRKKNRIPLKGEIPSIVNKPTGCHFHTRCPIARDLCKSEVPVWKEIRNGQKVLCHFPID\n>tr|A0A5X0ZI55|A0A5X0ZI55_SALET Bifunctional glutamine synthetase adenylyltransferase/adenylyl-removing enzyme OS=Salmonella enterica subsp. enterica serovar Stanley OX=192953 GN=glnE PE=3 SV=1\nMTPLSSPLSQYWQTVVERLPEGFTETSLSVQAKSVLTFSDFALDSVIAHPEWLAELESASPQADEWRHYAGWLQEALAGVCDDASLMRELRFFRRRIMVRIAWAQTLSLVDDETILQQLSHLAETLIVGARDWLYAACCREWGTPCNPQGVPQPLLILGMGKLGGGELNFSSDIDLIFAWPEHGETRGGRRELDNAQFFTRLGQRLIKALDQPTMDGFVYRVDMRLRPFGDSGPLVLSFAALEDYYQEQGRDWERYAMVKARLMGDNDDAWSRELRAMLRPFVFRRYIDFSVIQSLRNMKGMIAREVRRRGLKDNIKLGAGGIREIEFIVQVFQLIRGGREPSLQSRSLLPTLDAIAALHLLPENDVAQLRVAYLFLRRLENLLQSINDEQTQTLPADDLNRARLAWGMKAENWPQLVGELTDHMANVRRVFNELIGDDEADTPQEEERSEPWREVWQDALQEDDSTPVLAHLADEDRRQVLTLIADFRKELDKRPIGPRGRQVLDQLMPHLLADVCSREDAAVTLSRITPLLAGIVTRTTYLELLSEFPGALKHLIMLCAASPMIASQLARYPLLLDELLDPGTLYQPTATDAYRDELRQYLLRVPEEDEEQQLEALRQFKQAQLLRVAAADIAGTLPVMKVSDHLTWLAEAMIDAVVQQAWTQMVARYGQPAHLDERQGRGFAVVGYGKLGGWELGYSSDLDLIFLHDCPMDVMTNGEREIDGRQFYLRLAQRIMHLFSTRTSSGILYEVDARLRPSGAAGMLVTSADAFADYQQHEAWTWEHQALVRARVVYGDPQLTSQFDAVRRTIMTTARDGKTLQTEVREMREKMRAHLGNKHRDRFDIKADEGGITDIEFIAQYLVLRYAHEKPKLTRWSDNVRILELLAQNGIMDEHEAQALTVAYTTLRDELHHLALQELPGHVAQTCFSKERALVQASWRKWLVAV\n>tr|A0A846PBJ8|A0A846PBJ8_9BACT ATP-binding cassette domain-containing protein OS=Candidatus Latescibacteria bacterium OX=2053570 GN=GTO29_14730 PE=4 SV=1\nMNEPWIQLKNVHLSRGGRPVLKGVTADLAGRAIGLVGANGAGKSTLIGALLGVLKAESGMIHVLDLDLPRNAMQVRSRAGVMAEQAGVFPGGSGVDAVVFAAMLNGLSRRESLRKAHRALDALDVGEERYRPVRGYSTGMQQRCKLAMSLVHDPEILILDEPTVGLDPPGRTQLLNLIRDLRDEGRRILVSTHIMHDADFLCDELLLLEAGTVAFSGPIRDLIDTGVGVVVAAGEGLDAAFAETLGQRGYDIREQADEHITFEPNQDVELREFWQLAAERGAEVRALGRDLPSLESAVIRAMEHTDEQ\n>tr|A0A7U8ZSQ3|A0A7U8ZSQ3_VIBCL Uncharacterized protein 
OS=Vibrio cholerae MAK 757 OX=412967 GN=A53_02263 PE=4 SV=1\nMRYLAVLMMGLLTFPAFALTRVNLYQAEVAVDPQQSNADAAARVRGMEEVIVRATGSQDALKNDAVQKALRQSNQYITQISTQQEGAQSVMRLQFSAQHIRSLLSQAQLPFWPESRSNLLVWLVEEANYDRSVSWEHADTPLLNQMKVRARIRGLPLTVPVGDFDDVTGVQVSDLWGGFINPISIASQRYPTDAVLVVRAQGSELRWTLFDQLANTMVSQPKAPISGQASGEQAVTEMIDEISDYYARKSAVVVSSESSQSVLAQFSPLDSAQDFFVVENKLKRLSSVASLDILKVQGTQVTFNVHLLASVEEFTNEVVRMGQAVLMEMPPEEPVSADNNLLENSSLENSASEMPVDPSNPNNAAAQPQPVQPKTLYFSWQG\n>tr|A0A7W0QRE7|A0A7W0QRE7_9CHLR D-aminoacyl-tRNA deacylase OS=Chloroflexia bacterium OX=2448782 GN=dtd PE=3 SV=1\nMRVLVQRVREARVTVDDVEAGAIGPGLLLFVGIAATDGDGELRAMADKIANLRVFEDDAGRMNRSVLDLVAGGDPVGALVISQFTLYGDVRKGRRPGFTRAAAPEEAAPMIEAFAVCLANPGLVVERGVFGAHMMVSLTNDGPVTIWIDSDDLRQPRRGETSSAI\n>tr|A0A7L4YJJ8|A0A7L4YJJ8_9ACTN Uncharacterized protein OS=Epidermidibacterium keratini OX=1891644 GN=EK0264_02370 PE=4 SV=1\nMEQTLINDGLPFLGSALPADLAGVELRRAITEHRVLRMMRNTFRDARVPDSREVRVAAIALHAPKDAIVADDTVAWLQGVDTNDPRDRFSFSPSLIVPNHACRPQHPGVRVREGTIDDCDVVEEGGLRLQTNLRATADMLRLKWRPNALATADAMCRHNLIDKGELAEFIRPLRRLPGIPQARALVRLVDPRSMSWGESVLKLRLVDAGFPMPALQHEVNDPRIGVRYLDCAYVAPRVGVEYDGKEFHTAESDREHDAERRELLSDILGWRWEIARRDDLIGTNDALEWRVGEKLGLTPRPRSW\n>tr|A0A0P1FSG2|A0A0P1FSG2_9RHOB Uncharacterized protein OS=Thalassobacter stenotrophicus OX=266809 GN=THS5294_03520 PE=4 SV=1\nMRLLGAFSLVLGLLVAPEVAPAQGTSVVTGTGTGAVLRTLDKVTGAVFDVEVASGQTMGYGTLEITLSECRYPASNPAGDAFAHLTVMDGSKRQDIFQGWMIASSPALMALDHARYDVWVLRCITS\n>tr|A0A1C4RDB8|A0A1C4RDB8_9ACTN Uncharacterized protein OS=Streptomyces sp. 
DvalAA-14 OX=1839759 GN=GA0115240_152365 PE=4 SV=1\nMPTAPRTIDELQQALMANQQLPYGRTRTVGAEELVDAAEQFAEPIALVRTLLELQSAYVYGSEPRKSPVVFARLLALFDEQPDLFDERLRHELFWRFKWVANALRQLPEMPLASIQQWLTEMRTRYEKAGLGLQPYYGQAFQLAAHVGQDIAPAYELWAARTRTPLSDCEACEICDRALYHLRGGDDERALESWEPVLTGTASCQEEPARSISYALLPLLRTGRTDRARELHLAGYRACRHRPSMSGEVGRHLEFCALTGNEARGLELLAENRGLFDEVESPHANFDFLTGVEVLLQRVGLLGHGELPAAGYAGRVWSVAELRAEVRARADDLAARFDARNGTTAHTDRRRARLDRAPLLDALELTLRSRTLDVVAQAAPADAAAGAPVSAPAGAPVPRTPAAVSDSLPELILQARDLDERAHPDANACWARLRALVAAPDYTHPDDPAVGSFVRLRADLLADEASRVHEKEEYAVAAALFTQAGDLYDEAGEPGHAAFARGYALLAEAEQVTEPVKPPEPAEPADAAEAADAAEAAGPAEAGQPAAPAEPAERAAGADGANGAEKAEKAEKAEKAEKADRTGPAAAVEARVAALTGVHAAAVRLQEDTPGLAPYQEARLLRLRATALGLRLQASGNEEHAAPVLAEADLLREFATRHGVVTQISGARFLRATTWAIRGDLPAAHTEVDGLLDELKERGPAWHLPRALGLRARLRLGLGEAQGAHDDLTEALRLAADWPAEAVHTSRLQGDLAEVCMHLGRPDEALRHLTRSAELELRADQRAEAFTTYGNAAALSLDLGRVEDSIALLDSLLAEPDAVAGELNDRLLAQLRLTRARALHAGEDLKAATAEFVALAAESAGWDDDPGSHAMIAAETAVLLGEAGEFGPARQAAEQALAAHARAPRYEQLSNALRELARLQAEQQGPDGLTDALAFLADAGRIADEARAAGFEARGRSLDTALAYEHGRVNAYAGAYEDALAALDKALDLIGEPAPEDDRVEEWAESVRLAGVVEGLYLKRTAPALARLDAAIARLTSLGHPKEATPLTSLAARLRDDK\n>tr|F7Y857|F7Y857_MESOW SnoaL-like domain-containing protein OS=Mesorhizobium opportunistum (strain LMG 24607 / HAMBI 3007 / WSM2075) OX=536019 GN=Mesop_3059 PE=4 SV=1\nMNKNYEAIKAHYAGSDAMDLAAMMAPITGRTAWTEMAGFPYAGTYVGPDAIIAGVFKRIGEEWDGYNLKLEKLVDGGTTIVGIGTYSGTYKKTGKPMSARVVHVWEMEDGKVLSFEQFTDTRLVAAATA\n>tr|A0A2V6GK08|A0A2V6GK08_9BACT Aminopeptidase OS=Verrucomicrobia bacterium OX=2026799 GN=DMF43_07280 PE=3 SV=1\nMHDIRFDNLAKLLVEYSIRLGRNEAVLIEAFDIPDEMTIALIQAARKAGGVPFAQIYHTRVNRALAFEASDRQLNLLASHELARMKKMDAYIAVRGSNNITELSDVPAEKMKLLNKKMRPVQDQRVKKTKWVVLRWPTPSMAQLAGMSTEAFEDFYFEVCTLDYRKLQPGMKALKGLMEKTDRVEIKGPGIDLRFSIKAIPAVICGGDRNIPDGEVFSCPVKDSVEGHVTFNAPSIYQGIGFDGIRLEFKNGKIIDATSNETKKLNKILDSDPGARYIGEFSLGFNPRVLQPMRDILFDEKIAGSFHLTPGQAYEEADNGNRSQVHWDMVSIQRPEYGGGEIYFDGKLIRRDGEFLPKQLHSLNRSRTR\n>tr|A0A0F9KX35|A0A0F9KX35_9ZZZZ Uncharacterized protein OS=marine sediment metagenome OX=412755 
GN=LCGC14_1274400 PE=4 SV=1\nMKPKNYKYLDGSGNQYNIQDDMRKTLEYVPVKPESSSSGIYDGGKYVKTEITIDQFNKIVSLLNSAIRKSEIHIKDRVKMSGMIIVEEEGNRNAYILDPYSEEKFSIETKLREIFEI\n>tr|A0A1L9MTS9|A0A1L9MTS9_ASPTC FSH1 domain-containing protein OS=Aspergillus tubingensis (strain CBS 134.48) OX=767770 GN=ASPTUDRAFT_130501 PE=4 SV=1\nMRFLCLHGAGTNAEIFEIQSGGISYDLAKYGHTFKYYDGCMEAEVEPRTSPRPPHLKIRKLKGLFTGPFYNHYPRDRAPGEYLAPAMKHVYDIIEREGPFDAVMGFSQGAALACAMIVHHAKTHQEPLFKVAVFICGAAPFDSTGNEVIPDTSAEGEYPVKIPTANIVGKQDELYPSSMHLSRLCEPSKMSFHDHGSKHMVPFDVENTNAMVAAIEATVQKALRGE\n>tr|A0A2V3TT51|A0A2V3TT51_9HYPH Flavin reductase (DIM6/NTAB) family NADH-FMN oxidoreductase RutF OS=Chelatococcus asaccharovorans OX=28210 GN=C7450_11941 PE=4 SV=1\nMADKTRLIVEGGDPAADPKAFRRALGSFPTGVSIITTPGLDAPAGVTANSFASVSLDPPLVLWSIAHTSRSHAAFRQSAHFAINILADDQVGVSQAFASASYDKFSLVDWHRGGTGSPLIDNALAYFDCVCEARHEGGDHTIMIGRVIEFGRSEGSPLAFSQGRYGITLDHPEVAAKARDRKFEEPGLDELPFLSLIAKAHYKEDADLEERRSAARYTQVGSKVLAGLYQSAPLTADELARRMYLDRREVDDSLNEFLADGHVAIFDGHRFALTESGKQRRRQMIEYLSRYQDEQLADINPADLIVATRVLKAFLTGPHQGKPDLHI\n>tr|A0A532EZD0|A0A532EZD0_9BACT LPS export ABC transporter ATP-binding protein OS=Nitrospira sp. OX=70125 GN=lptB PE=4 SV=1\nMTQSIHAESEALVGPIAVQQGHCLRATGLVKSFRGRKVVKGVAVEVYAGEVVGLLGPNGAGKTTIFDMMVGLCQPDEGEITFIGESVTNLPMYKRARRGIGYLPQESSVFRRLSVEHNVLAILEMLGYARKERSQRVDALLKELDLIHIRKSMAYALSGGERRRLEITRALAATPSFMLLDEPFAGIDPIAVADIQQIITRLKEKGIGILITDHNVQETLSIVDRAYIINEGLILEAGSPEAIVQSPTARAVYLGEQFKL\n>tr|Q08U50|Q08U50_STIAD Putative surface protein OS=Stigmatella aurantiaca (strain DW4/3-1) OX=378806 GN=STIAU_1615 PE=4 SV=1\nMNPAVPAQYTLTYNVTDSAANVAAPVNRTVTVQDTQGPTLVLNGPATAGLECGTPFNDPGATANDLCEGDLSGAVVRTGTLNQGAVGNYTLTYNVADQGGHTAAPVSRTVAVSDTLAPVVTINGPASLAVECGDNGFQDPGAMAEDACAGTLPATPSTEVDPAVPGVVAITYSATDPSGNTGVGNTGRTVTVEDTLPPTLALLGPANQPLECGTPYNDPGATADDQCAGDLTGSIQRTGSINNKQLGAQMVSYTVQDPGGRTAGPVSRTVTVDDSLAPAIAVNGPLDQVFECGSTYVDPGATANDLCATI\n>tr|A0A1X0UNC0|A0A1X0UNC0_9NOCA Putative fluoride ion transporter CrcB OS=Rhodococcus sp. 
1163 OX=1905289 GN=crcB PE=3 SV=1\nMIAPARPLHLRPRALALVFAGGVIGTAMRYGIEIAIPQVIQGWPVATFSINLLGAFVLGVLLENMARRGADAGVRQQIRLLAGTGFCGAFTTYSTFALEAVLLTRDGHLPIALAYGVSTVFLGALAAWAGIVVGASMHVDRSAR\n>tr|A0A3N2GU17|A0A3N2GU17_9PSEU Uncharacterized protein OS=Amycolatopsis thermoflava OX=84480 GN=EDD35_2465 PE=4 SV=1\nMDPRDRADALLARAQSRGAFVVTPDAATSPMDASTTQQIPRNVVKEIDNDDPDTTAVVPSSVIESVQGSLAASKPDTHVNMTPVQPEEEVDGLVPTTKTQTGNSDFARRLEGL\n>tr|A0A3P9I8G7|A0A3P9I8G7_ORYLA One cut domain family member OS=Oryzias latipes OX=8090 PE=3 SV=1\nMELTMENLHSVSAHSQAGDLMSSPHARPSQSPSSTPRNLVSHAPSARSAMVSGMASLLEGSGGDYRTDPSGLSGHLHPSISMCETGMSLSNTYTTLTPLQHLPPISTVADKFHHPHSHHHAAAHQRLSAGNVSGSFTLMRDDHRGLTSMSNLYSHYPKEMSGMGHGSLSPLSSGLGSLHNSQQSLSAYGHSAHLSDAKMISPVPGFESHASMLSRSDQEHLARSLGGHGHGMISNLNGMHHHPHSHLHSQANGAVMLGDRERHGHGASQGVSGSNIQAEEINTKEVAQRITAELKRYSIPQAIFAQRILSRSQGTLSDLLRNPKPWSKLKSGRETFRRMWKWLQEPEFQRMSALRLAACKRKEEDRGRERSQVPKKQRLVFTDLQRRTLVAIFRENRRPSKEMQLTISQQLGLELSTVSNFFMNSRRRCPDRWDTEEHGVHGHGPSGNSSASPIQPGISSANTFSKA\n>tr|A0A3Q0S8Y1|A0A3Q0S8Y1_AMPCI Translocase of outer mitochondrial membrane 40 homolog (yeast) OS=Amphilophus citrinellus OX=61819 PE=3 SV=1\nMGSVLAAASPSPAPAAAGSGQGVPGLVSVPPGFTMPSVSSVPPASGSDQQTADAQSSLSNPGTYEECHRKCKEVFPLQMEGVRLLVNKGLSNHFQVSHTVTLSTLGDSGYRFGATYVGSKQTGPAESFPVLVGDMDNTGSLNAQVIHQLTTAVRSKIAIQTQQHKFVNWQCDVEYRGEDFTSAVTFGNPDILVGSGILVAHYLQSITPALTLGGELVYHRRPGEEGTVTSLLGRYTGENYVATLTLGGAGAHATYYHKANDQLQVGVEFEASTRMQDTTTSFGYQLDLPKANLLFKGTVDSNWVVGATLEKKLVPLPLTLALGAFLNHRKNKFQCGFGVTIG\n>tr|A0A7K3UVX5|A0A7K3UVX5_RHILE DUF21 domain-containing protein OS=Rhizobium leguminosarum OX=384 GN=GR236_14365 PE=3 
SV=1\nMAIEGALAFLETYWPEILSITALVLMSAFFSGSETALTAVSRSRIHTLEANGDERAGLVRQLIERRDRLIGALLIGNNLANILSSSIATSLFLGLFGNSGVALATLAMTVILVIFAEVLPKSWAISTPDRFALAIAVPAKLFVTVVGPVSTFVNAIVRQILSLFGINLSRETSMLTAHEELRGAVDLLHREGSVVKADRDRLGGVLDLSELELSDIMVHRTAMRAINADDPPEAVVRAILESPYTRMPLWRGTIDNIIGVVHAKDLLRALAEPNMEPQNLDIVKIAQKPWFVPDSTNLEDQLNAFLRRKQHFAVVVDEYGEVQGIVTLEDILEEIVGDISDEHDIEIQGVRQEADGSVVVDGGVPIRDLNRALDWNLPDEEATTIAGLVIHESMTIPEERQAFTFYGKRFVVMKREKNRITKLRIRPAGEDGAKPA\n>tr|A0A6J5FC43|A0A6J5FC43_9BURK GAF domain-containing protein OS=Paraburkholderia humisilvae OX=627669 GN=LMG29542_08208 PE=4 SV=1\nMIGDPILAMTTSAENQLYALDEIALTLAQPCQRTAVYHTVEDVMQRLIGHRLFTLLAVLPGGHRVQRFWSSNETVYPPSGRKCLDSTPWGEVVLKNKKAWLGRNAADIRWAFADHALIASLGLGSVINVPIVVRGQLLGTMNLLHRENHFTVDDVTIAARVAPYLIPAFIEEVKTIEVS\n>tr|A0A7C4RW34|A0A7C4RW34_9BACT Adenosylcobinamide kinase OS=Fervidobacterium thailandense OX=1008305 GN=cobU PE=3 SV=1\nMILITGGVKSGKSTFALLMALRYKKRAFLATGVPFDDEMMERIRKHKEERKNLFDTYEEPVDIATILQKIDRHYDVIVLECLTTYLGNLLHYNEDVESRFNILVDVVKTMVSQLIIVTNEVGWGIIPENNLARRYVEILGRWNNELAKIAQEVYLVISGIGVRIK\n>tr|A0A221MBY2|A0A221MBY2_9BACI Cysteine desulfurase OS=Virgibacillus necropolis OX=163877 GN=CFK40_08985 PE=3 SV=1\nMNQIYLDHAATTPMATEVIDAMVPVYSEVFGNPSSVHAFGRKARHVLDQARRVFAKSIHADEKEIVLTSGGTEADNLALIGTALANKQKGNHIITTVQEHHAVLHAAEHLEGNGFEVTYLPVYEDGKIAVQDLRNALTDKTIVVSIMTVNNETGIIQPIHEVGELLNDHQAYFHTDAVQAYSLLTIDVKKDYIDLLTVSSHKVNGPKGIGFLYINKSVQVNPLQFGGEQERKQRPGTENVVSVVGFQHAVQLLIEQKEKRRETYTSYKKLFLETLEQAGVNFEINGEQSDAVPSIINISFPGTNVESLLTNFDLSGIAASSGSACTAGSVEPSHVLSKMYGANNDRTTNSIRFSFGLHNKKEDSIEAAERIASIVKRLISLQ\n>tr|A0A841Y9U4|A0A841Y9U4_9LIST Alpha/beta hydrolase OS=Listeria booriae OX=1552123 GN=HB847_15185 PE=4 SV=1\nMKKCVTFIALLIFLLAGCSTDKTTEQDMKNLPNLSAQTALILVHGTGGSTDTFDGFSDVFIDDYHTSNERIKLHIGTDGALTYHGIFSKKALHPIVQIGFADSIDASITQQAVWLRLAMEDLQKKYKFAAFDGVGHSNGGLVLSTYAQKYAKTAPTLERLVAIGSPYNDLDQDDNKGDLAFTDVPKATPLLQKYEKNRSKINPDLLVLSIASNIDDGSFSDDIVPVLSAFSSRLIFKNEAKTYLESYYKGEEYDHRTLFANPDIQKKIAWFLYEYPGDKKEISLAKN\n>tr|T0PB79|T0PB79_AERSA ABC-type transport system 
periplasmic substrate-binding protein OS=Aeromonas salmonicida subsp. pectinolytica 34mel OX=1324960 GN=Asalp_31750 PE=3 SV=1\nMIKKLILSTLLLCGLANAAAPASTLDAVLDRGVLRVGFDAGYQPFEMTNKQGQYIGFDVDLAKMVAKEMGVKVEFVNTAWDGIIPALLTDKFDVIMGGMTVTPQRNLRVNFADPYIVVGQTIVLRKDKAGEIKSFSDLNDPKYKIAVKLGTTGEQAVKRLIPKATLLQFETQDDAKLEVINGKVDAFVYDLPYNAIFASQNTGAVVHLDKPFTFEPLAWAIRKGDQDTLNWFNNYLRQIKGDGSYDRLYKKWFESNAWLNQLK\n>tr|A0A6C2U970|A0A6C2U970_9BACT Uncharacterized protein OS=Pontiella desulfatans OX=2750659 GN=PDESU_04858 PE=4 SV=1\nMDIKRWISLVAVMAVAGTVQAADPLVYEGFEYDTTTGGIESASLGGGVGLSGAWGSSDAAGSFFNVTSGSFSLGSLTVSSNKLKRTNTGGVEAIERTISASLPSEFWFSVLHETSATTQFGIGGGAFGDGSSGNGNMATGPGFGFTHKGGNLGAAVWPAGSAVSVSVGGTVAKSDNNVLLLVGHVKRNVGGNDTVDLYEVDATLVLPGAPLSTVSQPTAAGSLNTLTISSNRGPGIDEIRVGATYNDVVPASAAFTFNLTPDDTQDLLADYPAVVVSNSILTEYANSSSGVEITALNVMSVSNAITAITATPFTLSTPSPAITALDFAFDASAIKAITSATEAFTTTGTVDIVYKNLDDNVLQTNTVALKGTFSNPPFQFSSDSSLGLTLVAPATLVSNDIAVSYVEGRPGYTNVVISEVNILDEQHPGAFSANNPGAIQTTDVITVTFDDSFVGLGNKQSSTCTVEVVYGEAGSSIDYTNTVSVAAFNYDLSTGSVIQQVFGNAVNLNGPLGGGTLPMNNFEAFTNNWNHNGNFTQETSAGSITLSSSGNTRSAYNLVEANTAGSDNFGAQDTHILTNGLYRYEFDYEVLNTDGANVIWSFNAYGLIDQQLFSTSSNPDKVVLDIATGASGGVDVDIQNDGNGYYSEHGDGILAGTGDVARTTGYVYLNVKDNQDALFVMHRSGKCDVRLYDLVLTRVGDYELPVNSTNAVLAAQFEDSAVTNSIVVVGATETNTNGVNNTWRGTGLSHVDRKLKSNAADTAVRATGTIIHRNTAGYDDVGLQDTIALTEGTYELSLDVQVDGTFPSNDSIARVEFWALDQDTSGTNNYVKWDHAPGTGEYLKTNGNAKVTLLGSKTYTNTVTETLVLSDLNVQADQDVAIVFYHRYGPDFFIDNVELLRTGDLPLEGYSLWAEDNGLTAGVNDGLEDDAENGGLGDGLNNLMEYALGGDPLVDDAATVSPQTSEAGGFFYHVYNERTDDPSLTFIVDLNGNLTIPGGWGSAGLEAEERGLDDGEFQSVTNSTDMLEAAEFIRLQVEKD\n>tr|A0A2P9ADD5|A0A2P9ADD5_9HYPH Uncharacterized protein OS=Mesorhizobium delmotii OX=1631247 GN=BQ8482_111084 PE=4 SV=1\nMHRFCRAGKAAGVDDRDEGLQLIEIEWRFHRSHPSLVLMLKIRNIRWINQSNDGKFTTVHMTACESGPERPLFPAPIARLRPFEYEGD\n>tr|A0A3G3A397|A0A3G3A397_9HYME Cytochrome c oxidase subunit 1 (Fragment) OS=Ceraphronidae sp. 
BIOUG12096-H04 OX=2463984 GN=COI PE=3 SV=1\nFLMIFFLVMPIMLGGFGNWLTPIMIGAPDLAFPRMNNMSMWLLPPSLMMLLMSMMTNTGVGAGWTLYPPLTLTPYHDGMSMDLTIYSLHIAGISSIMGSINFLVTIYKMKPSHQTLTSLPLFCWSIMITSLLLLLSLPVLAGAVTMLLTDRNLNTSFF\n>tr|A0A7C1QH02|A0A7C1QH02_PSEAS AraC family transcriptional regulator OS=Pseudoalteromonas sp. OX=53249 GN=ENH79_16645 PE=4 SV=1\nMDVLSSVLSHFSLNANVFFSGNMCGTSDFSDDQGVGHLHLLRSGTLKVRSNSGFEVVLSTPSVIFFPHSTGHCLFSDKSDGADLVCAQISYQSGGHSPLLQALPFCLNYELTGNGLLEQSAFWIFEEAFKDASGKDLIIDRLCDVFLISVLRKVLKEGTIKSGMMAGLAHPQLAKVLIKIHQTPEQSWSLSAMAEECCMSRSKFADTFKRVIEQTPADYLADWRLSVAKKLILKNQNMDLVANQVGYENGSALARVFRKKTGQAPKEWLLSQQ\n>tr|A0A511X4K5|A0A511X4K5_9BACI Uncharacterized protein OS=Halolactibacillus alkaliphilus OX=442899 GN=HAL01_23460 PE=4 SV=1\nMELMLEQFMSLNLLNQFWITLFLIIPMVLIARTVVAGTRYSPILIIVIFGLSMGYILVETGVAEPGIGAFPMVNMVASATIIALVVSFFVGGQELRKIFSNKPLTNEEMVIPSQEEAVLGTTRTQIVMIIRSFFLLIGIESSSRVLIGGSTSALSNVYPLIAYIGIVGAIIFIDNRATITNKSLYIRKGIIEIIAIIGILYLSSLIAGGIESLIALPQIFFAMIISAALGALLYRWSFGPTIKALLFAGIPVVLAGNFMVGGSRIGEAFTIDGVNSLILYGFFGQLFFMFGGISLIMYFAKNNHVRNLAPGMAGALSHSGLTGACTAGDLGKEAAQRAPIMINIPFFGHIFVFSVLAISAERGELWTLPSIAIVAIGVLFTIISLKQLKKANNESNKEVKALMQFSFGWQLVAVFGGLLLLSFSQIPFLFTGMAQASAISHFGLFAAVQGGMFGAESASLIPFIFSMPFLVHPVVFFMFGKAMKDDGLMPVKTVHAISFIGLIGVVVSLFIV\n>tr|A0A7Z9M5B3|A0A7Z9M5B3_9CHLR Alpha/beta hydrolase OS=Dehalococcoidia bacterium OX=2026734 GN=EYN92_08525 PE=4 SV=1\nMPFYERGPVSIFYEEVGSGFPLMIIPGGGLNSSIASLDTSVPFNPMNTYKNDFRCIAADLRNADSGQSSGPLEIDRPWDAYSDDQLGLMDHLGIQEFLVMGFCIGGPMIHNLLRLAPGRIPAAALMQPSGFTSEHPDIFYQTNTERWGPPLCEMAPDITMDKVHDFLTNMYTNRADFVFTVSRDFVRSLQTPLLIAPDNIPAHPYETAMEVAELAPNAETTIFPWKDTPKNIDEAVKHARRFLKKHEPDISP\n>tr|A0A7X7DHL1|A0A7X7DHL1_9BACT Uncharacterized protein OS=Lentisphaerae bacterium OX=1932692 GN=GX634_11015 PE=4 SV=1\nMNPFPARTRPVRLAMVPLMVLFLGSAIRVGAWESLTFDLPSGGRESLWRDELARHWHGQTEKRIEGGRIDVLTGEYAIEVEFPHKWHEGLGQALHYANATDRQGVLAIIAYARGEAYLHGKSRRRLELIEEQCSANNIKMLVLFPNRPEEFIRHVAPIWIE\n>tr|A0A807R958|A0A807R958_PSEME 23S rRNA pseudouridylate synthase OS=Pseudomonas mendocina 
OX=300 GN=PSMEN_15330 PE=4 SV=1\nMTTPASPTSGVQLIEVAPDFAGQRIDNFLRTQLKGVPKTLIYRILRKGEVRVNKGRIKPEYKLQAGDIVRVPPLRLAERDEPEPVAQGLLERLEAAIVYEDKALIVLNKPAGIAVHGGSGLNYGVIEAFRQLRPDAKDLELVHRLDRDTSGLLMIAKKRSMLRHLHEALRGDGVDKRYMALVRGHWATAKKQVNAPLQKSNLRSGERMVEVDGEGKEALTLFRVLRRFGDFATLVEAKPVTGRTHQIRVHAKHAGHCIAGDSKYGDDDFTREIRELGGKRLFLHAYELHVPLPEGGVLKLEAPVDEMWAKTLERLSA\n>tr|A0A2T6KQJ4|A0A2T6KQJ4_9RHOB DNA repair protein RecN OS=Yoonia sediminilitoris OX=1286148 GN=C8N45_101426 PE=3 SV=1\nMLRGLDIRDMLIIDRLELTFQPGLNVLTGETGAGKSILLDCLGFVLGWRGRAELVRQGAEQGEVTAWFDLPAGHAAFAVLADAGISAEDELILRRVNTKDGRKTAWINDRRVSGEVLRALSETLVELHGQHDDRGLLNARGHRQMLDTYAQLDDDIAEVRSAWRSLSRARKRLSEAEALVAEAKAEEDFLRHAVAELDKIAPEPGEEATLDTQRRLMQAAERIIQDIAKAGEALGLNGAEGMVSDASRWLVGVADKAEGQLDPTLAALEQVMASLDEAQQGVSACLDALSFNPHELEEVEERLFAIRGLARKHGVLADDLSDFADGLRARLAVLDDSAADLAALQASVDESAADFGTKSDALHRKRVSAAAALDAAMSAELAPLKMERAIFATRITEGTPGPEGADDVAFTVATNPGAPAGPLNKIASGGELSRFLLALKVCLTQADAGLTMIFDEIDRGVGGATADAVGRRLAQLAQEGQILVVTHSPQVAALGGHHWRVEKRQDAQSTTSTVVPLDASARVDEIARMLSGDKITDAARHAARALIEA\n>tr|A0A2L0BX41|A0A2L0BX41_9CUCU Protein wntless (Fragment) OS=Cyclotoma sp. CSR020 OX=2055377 GN=wls PE=3 SV=1\nMALKTFFFPLVVGVIAWFWRRVHLVSRVPALLEYMLLSLGCTLAFLNCPIEYLTLWFDMPYMLLVSDIRQGVFYAMLLSFWLVFAGEHMLIQDNGEKNGIKLYWKHLSTIIIGCASLLVFDLCERGVQLVNPFYSIWITPIGSNLALTFIILAGISASIYFIFLCYMIWRVFKNISIKRSVLPSMSQARRLHYEGIIYRFNFLMMATVICAAITVIGFILSQVAEGQNKWDENMELELSSILH\n>tr|A0A1J6PS54|A0A1J6PS54_CAMJU Uncharacterized protein (Fragment) OS=Campylobacter jejuni OX=197 GN=A8118_08150 PE=4 SV=1\nMFGAKKNNTEIIEQLEKKCNGLEDILRSIGNTMAVIEFTTDGVILEANQNFLTTMKYSLSEI\n>tr|A0A4P8GRK2|A0A4P8GRK2_9MICC L-2-hydroxyglutarate oxidase OS=Arthrobacter sp. 
24S4-2 OX=2575374 GN=lhgO PE=4 SV=1\nMVEDIGIIGGGIVGIAIARALSSRNLANVTVLEKEQRVAMHQTGHNSGVVHAGLYYAPGSLKAMLCQRGRELTRDYCREKDLPYRELGKLVVALTDDELPALADIERRSVANRVPGLRRLGAGALREIEPHVAGVAALHSPQTAVVDFVAITEALADDVRSSGGQILFGHEAIAISTGQGKVRVTTGRADLVFDRLIVCAGLQSDVVAGLVGASPAPRILPFRGEYWGLAAAKQHFVKGMIYPVPDPRFPFLGVHFTRGVYDTIHVGPNAVPALAREGYGWNRVSFKDTAASVMWPGARALAKQHWRMGAKEIAASLIKPLYYRQAHRFIPELQIGDLTAKTASGVRAQAWSLDGSLLDDFAIDQVGPVTLLRNAPSPAATSAMAIADHLLEHFIHLPK\n>tr|I0SJ56|I0SJ56_STRMT Bacterial sugar transferase OS=Streptococcus mitis SK616 OX=1095735 GN=HMPREF1045_0997 PE=3 SV=1\nMYSILKRLGDISISLIAITLFCPVFILIAIAIKLDSEGPVIFKQKRFGIHKKTFYVFKFRTMKVESPKYVATRDLQNPEQWITRVGAFLRKTSLDELPQLCNILVGDMSIVGPRPVVVSERDVIETREKYGANDVLPGLTGWAQINGRDNLSTDIKAKLDGYYVKNRSLITDIKCIVRTIPYVLKRKGIVEGSKRES\n>tr|A0A1F3KL50|A0A1F3KL50_9BACT Peptidase_S24 domain-containing protein OS=Bacteroidetes bacterium GWF2_43_11 OX=1797352 GN=A2X09_17370 PE=3 SV=1\nMAKRLDLKNALQTIKDFYYRNQRIPSLSETAGIFNYSSRNTALYLLNKLVETGYMTRGTKGRLLTTPKFHDKTKLLGSISAGFPAPEEEELRQSLSLDEFLIRKPSATYMLEVSGDSMIGAGILPKDFVLVEKGRTPAPGDIVIAQVDGEWTMKYYRMENGKAYLQAANAKYPDIYAKEELVIAGVVISCVRNYA\n>tr|A0A1A0T4H8|A0A1A0T4H8_MYCFO ABC transporter permease OS=Mycolicibacterium fortuitum OX=1766 GN=A5751_24895 PE=3 SV=1\nMTVGLAVRTHAASRPSNTRPSRRRSVVARLGVLGWTLAGMGITAALWSVIVATGRFPRQLFPSVPEILAAGQTLWTEGLLAADVSASLSRAAVGFAIGAVAGIAVAVLTATTRAGRSLLQPVLRVFSPIPTIGLVPLAILWFGLGENSKILVIALGVFVPVWINSHSGLASTPVDYLKAARCLGAGRWQTLSRVVLPEAAPDIASGLRVGAAMAFVLIVVAEMTGTTMGIGYRISQAQLFSQADRLIFCLIVLGIIGALCDQLVASVTSPFTRWAHEER\n>tr|A0A417V5I4|A0A417V5I4_9FIRM Deacetylase OS=Lachnospiraceae bacterium OM02-26 OX=2292908 GN=DXB19_04045 PE=4 SV=1\nMLRKITILILLILTVAQFTSSDSIQSAREFIQNNIYVWSETQEEKLPIYCVDTQKKQIALTFDTAWGNEDIQQILRILKQENVKATFFFCGDWISKYPTDIKTIYEEGHDIASHGDHHKYMTKLTDKQQQEEIQGVTQKIQGLLGIKIDLFRAPYGDYNESVVRNARKMNYYIIQWNVDSLDWQEPTKEQLIEKVCGHKNLSPGSIILMHTGTKCTKQALKQIIRNIKAKGYEFVSVSRLIYRSNYRIDPTGKQMKL\n>tr|A0A1H1FUZ1|A0A1H1FUZ1_9HYPH Uncharacterized protein OS=Rhizobiales bacterium GAS113 OX=1884352 
GN=SAMN05519103_00535 PE=4 SV=1\nMAGGQTPGSFSKNFAWGHTGLRKLHESIRLGFADVLEPVSRKLWRSQSQIDNPGLDLIPVNFFLHNAAGQLTVDELVYQAVSQPYSLRFDRLALFAFNLSQVGRPPLKGPGRPAAWANEFVKEALWQNGVWRRSALAKPAMGAFLKTHIKGQSYWKCQTNYRRLFGLCGYLTGTSPTVNSGAADCQSAWKKDPVSAPKRDPSRRRARRIDPARGAGRGCAARRDRCPVGRSVWVQARFLKRQLSLPVSTISQ\n>tr|A0A0N0MN32|A0A0N0MN32_9ACTN Major facilitator superfamily MFS_1 OS=Actinobacteria bacterium OK006 OX=1592326 GN=OK006_1213 PE=4 SV=1\nMRTNACPTGSTTRYAAARRPSDTVTTVADQERPGTAAAPTAEHGRLGLALILVAAFMVVLDFSIVNVALSSIQRELGVSAATVQWVVTGYAIAFGGLLILGGRAGDLYGRRRLFLAGIAVFTAASLAGGLARDPVLLIASRVVQGSGAAMVAPAALSLITTGFPEGPRRTRALGLYGATASVGFVAGQVLGGVLVEFLTWRSVFLVNVPVGLAALLLAPRTLRESRSPRTGRHLDASGALLITLAVGALVFAVSRGGGTGIGSADVLVPLALSALAAAAFIANEHHHADPLMQPALLRLHGLRSAGVLMLLLGLWNGGEMLVLSVYLQQVLHMSPLAAGLTIAPQGVFGLATGLLGARLARHLGIQKVLVATGAAATIGFAALTRLPGSDGSHLPLAAVTLVGCGTAGMAFGSMVTASAGVADRDQGLVGGVINTSRQLGAAIGAALLPAVADAVDRTRHASTAVGDRAAMLAGLAAAALAPLVAMNAWRRSRHDGVARCAPRA\n>tr|A0A2A7X0U8|A0A2A7X0U8_9BACI Helix-turn-helix domain-containing protein OS=Bacillus sp. AFS002410 OX=2033481 GN=CN692_02510 PE=4 SV=1\nMTELGKFLKEAREAKGLSIDDVQELTKIQKRYLEAIEEGNYEILPGQFYVRAFIRQYAETIGVDVSGFLSDKPVVEDTVEANTITEEVKHEEIPSRASKLKEPLNNVKSSRVMDYLPRILIAILIMGICIAIYMMLPSKNDEKSADTNQSQTNSNSEIEKPKNNALDQVKNDNKKQTEKAKNDETKQEPTQKITVDAAQGKRTSISLSGTDVFKLEVVANGESYVDLKNASGKMFYSGILKQGQTQNYDLTEENEVTVNIGASNNVELRINDEVFKYPVSPTNAVHQKITIKNLKMNQ\n>tr|G3HRZ4|G3HRZ4_CRIGR Differentially expressed in FDCP 6 OS=Cricetulus griseus OX=10029 GN=I79_013619 PE=4 SV=1\nMELKKEEAARQRQRIAELEEMQERLQEALQLEVKARRDEEAVRLAQTRLLEEEEDKLRQLMHLKEEQERYIERAQQEKQELQQEMALQSRSLQHAQLQLEEVRQHRQRAGEDVEAAQRKLRQASTNVKHWNVQMNRLMHPIEPGDKRPTTSSSFTGFQPSPLARRDSSLKRLTHWGSQGSRTLAANSSERKSLNGGDETPILASASQEDKLDPAPEN\n>tr|A0A4D9CK05|A0A4D9CK05_MASLA Uncharacterized protein OS=Mastigocladus laminosus UU774 OX=1594576 GN=BLD44_003515 PE=4 SV=1\nMAKVNYKLTGKYLPPQIFILGICFVPGVTEVSSEQLTEIRRFIKSDRLLQHYLEQKILIIQD\n>tr|A0A1H9PEC9|A0A1H9PEC9_9HYPH Pseudouridine-5'-phosphate glycosidase OS=Rhizobium sp. 
NFR03 OX=1566263 GN=psuG PE=3 SV=1\nMTRPISHDLPIAYSAEVAAAKARGSAIVALESTIITHGMPYPGNLDMARSVEAIIRDQGAVPATVAVIDGTLHIGLDAELLEALAQTRGAMKVSRADLAFAIAERRTGATTVAATMIAAARAGIRVFATGGIGGVHRKAEETFDISADLEELACTGVIVVCAGAKAILDVPKTLEVLETRGVPVVTYDSEIFPAFWSRDSGLKSPLMLNSPAAIANFQRMRDRLGIDGGMLIANPVPEESEIPRDEMEIYIARALDNADRDKIIGKAVTPYLLQSIFELTDGRSLETNIALVENNARLAAEIAVALM\n>tr|A0A151WTB8|A0A151WTB8_9HYME RNase H type-1 domain-containing protein OS=Trachymyrmex zeteki OX=64791 GN=ALC60_09730 PE=4 SV=1\nMLITPALPAYQNSYYSTCTNVSYLSLPPNILKNLDTIPQQNIQPIFEDTFQRVLARAIVFYTDGSKVDDGTYVGSAVYSPQLDLHFMFKLSSYASVFSSEAWAIYNALLFALHNDFSCIVIVSDSKSVLDSLAGFRNRTNNYIISYIRALIEEAKFCNTQVSFIWVPSHCGIQGNEIADQLAKKAIREGAESNFMTPYSDLFSIPRMRLSKAFDSYIERTSRITGEYYFKNCYSHNNKPWFHDLRFSRIMITTMNRLRSNHFNLNHSLFRKNLIDNPSCPCGAPSQDLAHVIFFCPLTESHAAPIRLALNDLDQDSSQDPITVIIRALCNPSAKICRLFVSFGLACDRLF\n>tr|A0A2D1IHR8|A0A2D1IHR8_9ACTN Uncharacterized protein OS=Micromonospora sp. WMMA2032 OX=2039870 GN=CO540_27970 PE=4 SV=1\nMSGGGPRRGRRDNGLDAAEYAVAGDVDPRVGEHLLDVLAAGGIAAYLQPSADLNPVTRTTTVPARPVDRLYVDRSHLTTARDYLTQLADEGSDDPPRPDEPDIEAEWAKIVAGFHTTPTAGSHPWPAAEDVDDPVPPAGATAGRAEEPAGPTATDVRRLPYAADVSGVSLGRDRSDEPSLLDGLDTFGADLPGDAEEEHYTPPPPPPLPRFSKYAVLGVLCVVLGFLLFLSPTVVSLVDPAVVTLLGFTGILAGFVMLVWRLRPGDRDEDDPDNGAVV\n>tr|A0A3S0HSP6|A0A3S0HSP6_9GAMM Phosphoribosylamine--glycine ligase OS=Halomonas nitroreducens OX=447425 GN=purD PE=3 SV=1\nMKVLIIGGGGREHALAWKVAQSPRVETVFVAPGNAGTAREPGLENVAIGVDDLDGLVAFARDEDVALTIVGPEAPLVAGVVDRFREAGLAIFGPTAGAAQLEGSKAFTKDFLARHAIPSAEYRTFVAVEPALAYLAEKGAPIVIKADGLAAGKGVIVAETVEEAEAAVRDMLEANAFGDAGARVVIEEFLEGEEASFIVMVDGETVLSLATSQDHKRAFDGDSGPNTGGMGAYSPAPVVSETVFERIMARVIRPTVQGMAEEGHPYTGFLYAGLMIDTEGNPKVIEYNCRFGDPETQPILLRLTSDLAELCLAGARGELAGHGCDWDERAALGVVMAAGGYPGSYRKGDAIQGLEAAEATGCKVFHAGTAEGESGEVVTAGGRVLCVTALGEGVSAARDLAYRGVAEIHWPEALYRRDIAHRAIARERGER\n>tr|A7B7B1|A7B7B1_RUMGV DNA binding domain, excisionase family OS=Ruminococcus gnavus (strain ATCC 29149 / VPI C7-9) OX=411470 GN=RUMGNA_03477 PE=4 
SV=1\nMNKQYVAICEKVALTIEEAAEYSNIGQNRISSLLKEPRCPFVLYVGTKKLVKRKEFEKFISESVEI\n>tr|A0A059AXC2|A0A059AXC2_EUCGR Uncharacterized protein OS=Eucalyptus grandis OX=71139 GN=EUGRSUZ_H01175 PE=3 SV=1\nMVMKVHGSVFSAPTMRVLIALHEKDLEFEFVFVDLRAGEHKKEHFLALNLSLHHRPPPPFGQVPAFEDGDLKLLVEAHQFDPAASKLHWELVYKSKIGMATDAAVVKDADKEANLAKVLDIYEARLSQSKYLSCDCFTLADLHHLSALTSLMGTLVKKLLDARPKVSAWVADIVTPPALAKVLTMRNQQ\n>tr|A0A2E3M894|A0A2E3M894_9RICK Diguanylate phosphodiesterase OS=Rickettsiales bacterium OX=2026788 GN=CMP19_12800 PE=4 SV=1\nMSQHHNSLATLPNRFAFIDTVSKCGVLHPSLSLMLVDVVRFSDVTTSLGINIGDRFLLEIANRIQSLFGGDIRLGRISGDVFGIAFLGTRSSGQMRDMFERLVEHFKTPMHHDGHAFIADFNVGVVTSEGQTFEITAFVSRGEAALKQAKENKYENFCLYNMQDKTDTGRSLALKADLKRALSQNELELYYQPKVNLQTLEVIGAECLLRWNHPLDGVLFPGPLIEAAESYNMMNELGYWTLEQAFRSLVDFDFHRLSLTLSVNISPTQLYDNHLIPSLKMLSKSYAMPLTRIELELTEDVALSNSLMVKRQLDELRALGVAISVDDFGKGYSNLAYIRDLDLSALKIDKTFVIELANHPVNRAIIEAAKIIGKAKNCDVIAEGVETIAQLHILREVGVTIGQGYLFSKAIPLNDFISLAQQEIIVGNSPLRA\n>tr|A0A4Z1G3Z5|A0A4Z1G3Z5_9HELO Methyltransf_25 domain-containing protein OS=Botrytis hyacinthi OX=278943 GN=BHYA_0421g00010 PE=4 SV=1\nMATVAAGSQAGHDTFDALNIEYEKAYRDNPFKIAAIKKAITLLDPGSKVLDVGCGTGVPVSELLAEAGLEVVGFDIAPKMVEFAQKRVKGTFSVSDMVQFQVEDTFSGVFMIFAHLQLSYAAVHAAVYKYVSALKPGGVFVLGQMPSDSYVKGEGNAAYDETRTYVEDYDAPFMGEPLPTFMMSEQGQRNFLTSMGLEIVSETIDQFQPDNEKCEPEMQQYIIARRPVDGTIVEPQPLPKNK\n>tr|A0A526YNJ2|A0A526YNJ2_9HYPH 3-isopropylmalate dehydratase small subunit (Fragment) OS=Mesorhizobium sp. 
OX=1871066 GN=E5Y60_26890 PE=4 SV=1\nMEKFTKLTGVAAPMPIVNVDTDMIIPKDYLNTIKRTGLGSG\n>tr|A0A0A1TZ67|A0A0A1TZ67_ENTIV Uncharacterized protein OS=Entamoeba invadens IP1 OX=370355 GN=EIN_043770 PE=4 SV=1\nMVSRLEMVFLANVVLKLTNYIDIHNFILVSHNCYESVKSLKTTPKLSSAIDLSWFLSHFYLDTVDFDEVQIPVEKYISSVQCIRNPNFLEDAIAGKLTQSYADTIFPKVVSLSLLYPVYEKDDPCNNLIISNSKKFMSLRRLSGDLEQISLFLKNLTDNGEAIGTKYPNLIVIDSYLESTIVLNETTLNLLRSVELYLKKSYNEKVCYVVAEVPEDRSLIDFVKKGKFYCKNAGSVMCNKDDIFGVCGDFELSGEVERKGEDLKILNERIGANLDAASAFSLTHKYMSNTEYSLELPDSVREYNICVSSLPELVDANYFKYPINFNKIEVLKLVSVSNVSLEVTNALNCLELKSCDFCVFTNDEDSLIAIEEIFVEDSKHIRFLTHSEAIVENVHLFSDTEIDFNWSIKNTENVEIVESRNVGFVGGIFSASCIFHVERSTDTVIKNGEQIASYIKEVNVANFVIGNTGETKSCVLANKHFVCHSVDYLINNHFSCYNEVTENVRSFRPERIVLFTINNFNETSAKVPYFEVKEKGCMLSLGLYDTKGSALTNSTYPIHVGWENGSLGIHTDDWCLYGLDIGGEGENVNVAFDKFESCECVIGCGYNNTRKEVFFTLNGKIVKKIEIPWKNIGAAFAVQRLGTLFVNTGDQKFTFDIENYK\n>tr|A0A7C0YEA6|A0A7C0YEA6_9FIRM Uncharacterized protein OS=Firmicutes bacterium OX=1879010 GN=ENF61_00215 PE=4 SV=1\nMKHKKEEEMVRRIKMFLMLLLGLGIFLAPLTFHVQDHRKGNGHLVKLDCFCGGDECGICIIPN\n>tr|A0A2Z6P333|A0A2Z6P333_TRISU TFIIIC_delta domain-containing protein OS=Trifolium subterraneum OX=3900 GN=TSUD_213440 PE=4 
SV=1\nMNSPSPLQSAMLMGSPCFPNAISWSQDNLIAVASGNIVTILRPDLPNGPRGLIKVLPREPLIVGFVHRKDVVSGCLMPTSLYRDDKPVVQSISWSPLGMAANSGCLLAVCTSEGHVKVYRPPFCDFCADWIEVVDITERLYEYLQYTEFKDAGVPSSDFSEVPRIRPCLQKNALGQADSITPNDELLENVPDNQLSPLISADEYASRSAMLYSLVVSWSPLLRVASEFSPDPNTSASVSLLAVGGKSGKVSFWIFYQPDCYTIEESKTPTAVKFVGFLQAHNSWITTMSWLLFSFDSSNPLIILATGSSDGSVKVWLGDNDKLLKSSAVDQTSFSLLKEVITVNAVPVSVLSVTVHVQYPSKMLLAIGKGSGSIEIWLCDIPSREFDKLGSYDAHYYVVTGLAWAFGGRFLCSSSQDNGLRGWILHERRLEEMTTFSEMPRSNDSTCPSRDAYDSCFGVAVSPGNLVVATVHCFDVVKLNRMYEGRILRAAIEYLWIGGLQVDVWLKSPSPCYIEELPSFPEKELTYWAANIIWSLNQYQCLDKPLVFWDIIAALLAFKDNNSKYVEYLVIKWLSLSYLGSRTNLPPEEVLSRVISRLSDVPSRLLHLLNIMCRRVMLAQLDADQITTINSKGQNLEGVCPVIEEKMTKWIEILLGSERELRERHVGFSFSAVKTTTSHLEETPSQPGRWYPVGLAQMEQWVALNQEQIRDQLKLIATKVTHGKRFKTKRCSAVEPCSYCSAPVPFESPEFGFCQSKNRSNGNVKPHKLSRCAVCMEVCPSSPLWFCVCCHRNVFRLAPEPLFRMPSCCLDSDSSNRTSSEAVSSKPLCPFCGILLQRKQPDFLLSPAPV\n>tr|A5E9B7|A5E9B7_BRASB Hydrogenase maturation factor HypA OS=Bradyrhizobium sp. (strain BTAi1 / ATCC BAA-1182) OX=288000 GN=hypA PE=3 SV=1\nMHELGITRNIVKIVEEAAKGRRVKRVTLDVGQFSGVMPDAILFCFDIVAKGTLLDGALLDIQKIAGLARCRSCGEAFKTTSLYQACACGSRAIDRLAGEELKIREMEIEEAA\n>tr|A0A0J0YQQ3|A0A0J0YQQ3_9NEIS Probable allantoicase OS=Neisseria arctica OX=1470200 GN=alc PE=3 SV=1\nMELPDFATRFVNLASADFGAEVLSCSDEWFAAANRMLQTAPPVFVVGKFDDHGKWMDGWETRRKRYEGYDHAIVKLGLPGVIKGVDIDTSHFTGNFPPAASLDACRCTGVPDESTEWVTLVEAVSLQGDSHRFVEVDDEREWTHVRLNTYPDGGIARLRVYGLPKVDWDALPKDEVYETSAVENGGRIVAVSNAHYGVPFRLNMPGRGINMGDGWETARRRVPGNEWCIIELGTKTLIEKIEVDTAHFKGNYPDTVSIQAADVTFGTDESLVTQSMFWQTLLPQTKTEMDKQHFYTQADFNDLGAVTHIKLNIHPDGGVSRLRVWGKPVR\n>tr|A0A4S2D9L7|A0A4S2D9L7_9MICO Glyoxalase OS=Microbacterium laevaniformans OX=36807 GN=E5344_04275 PE=4 SV=1\nMTSIFVNIPTNDLERSVAFYRALGCAINPNFTDENAACVVWSDDIFFMVLRREFFATFTEKPVGEPREWAQASLSFSRGSRADVDAIVEAGLAAGGTEPHPAQDYGFMYSRDLDDPDGNSLGFLYMDPVAAEQGPPAEAS\n>tr|A0A2R2WQG2|A0A2R2WQG2_XANCI Uncharacterized protein OS=Xanthomonas citri pv. 
aurantifolii OX=76802 GN=TP45_21175 PE=4 SV=1\nMSLLVNAYSTLRTPLWPDFLPQAAVQHRDYADPALVDHLHGFVGYVNQAGDGQMTQSRYHLMRHVQRVRQHFSFQVDDADFGALAQWAEQANAVCFLADGSVRDPHGRVLISQGEPAIDDDAQVPYPPDALQRRAQQSSLLTAQGIRVPPSLPPVPGEAEARVRDAAVVSRRMLALFAVALRAEILATGDTPPSLDEVETRLPGVAAALSPQERAFFAQAAPDAQALANFGWRYEALAAQRALDNAQAAERTTLARRPLPELLDTLDRHLRLHWAVRQAGRSGQPLPAGIVPGVVYERHYALNWLLHFEDAEWDEVETPT\n>tr|A0A1M3MBX0|A0A1M3MBX0_9BACT Tryptophan synthase alpha chain OS=Paludibacter sp. 47-17 OX=1895899 GN=trpA PE=3 SV=1\nMNRINQLFKNKPSGIMSVYFTAGYPQLDDTLPILDALQANGVDLVEIGIPFSDPMADGVVIQESGHQALQNGMNLRMLFQQLTGMRSSVTIPLVMMGYLNPILQFGFHDFCRECRRVGVDGMIIPDLPMDDYLSEYKAIAEAFGLKFIFLITPETSDERIRIIDQQTDGFIYMVSSAAVTGTQQSFDSREEYFRRIESMKLKNPRLIGFGVSNKATFEMVNRYSSGAIVGSAFIKSLQSSCSVSEAVQALIQQLRS\n>tr|A0A418ESL0|A0A418ESL0_9STRA Uncharacterized protein (Fragment) OS=Aphanomyces astaci OX=112090 GN=DYB26_008272 PE=4 SV=1\nMTTTRASSIAAAASASPTLATTPTTHDVNDDMEEGAPTPIADAVPTHDANDTLTPGTAPTATLGDDDMTAAAAHRLEEDFPELDGSKATTPPPVPATNPWNWAATTGADMSKPRADDIGFHPATDAQLATLLQLQEQGTWSYDAVLALESSPRREAVGHLIMRPGVSTAKVSENRLFQA\n>tr|A0A7X8UWW0|A0A7X8UWW0_9BACT Methyl-accepting chemotaxis protein OS=Phycisphaerales bacterium OX=2052180 GN=GXY44_13280 PE=4 SV=1\nMSLKAKLFSSNMILAIVPVVLVSIIVHRTVRDGFRVSAAEAEAGLTTTIQTGREALIASGMTDLRHTAEHVYAMCAAQQEVLQQKVGYDLNVARDLLTQGGGITLMDEEIRWEAVNQFNRQTVSVSLPKMCVGTEWLGQNQEAGTTSPIVDRAQQLVGGTCTIFQRMNPEGDMLRVCTNVMGADGKRAIGTFIPARHPDGQVNAVVEAVRNGKPYLGRAFVVNAQYVTAYEPITDATGQVIGMLYVGVKEESAESLRRAIMSIKVGETGYVYVLNAKGATRGHYVISSQGQRDGEDLWMSKDADGHLFIQDICAKAITLKDNETVMVRYPWQNPGEPRPREKVVTLAYFAPWDWVIGVGSYEDEFFETVKAMEAEGAETLASLQEAGALAIGTVQKWSIGVGLAALVLSFFVAWFVSQGMSRALRRIIADLNEGANQVNAAADQVAGSSQHLAAGASEQASSLEETSSALEEMAAMTRTNASNAQQANGLADQARTAANQGDQTMEQLNQAMTGINDSSQKISKIIKVIEEIAFQTNLLALNAAVEAARAGEHGKGFAVVADEVRNLAQRSAQAAQETTQLIEDAVDKSHNGTQVATQAGQALAAIVKNVDAVTRLINDIAQASSEQAQGVEQVNMAISQMDKVTQQNAAGAEQSAAAAEELSSQSKVLKETVGNLVTLVEGRGAQIE\n>tr|A0A258R204|A0A258R204_9PROT Thymidylate kinase OS=Hydrogenophilales bacterium 28-61-11 OX=1970529 GN=tmk PE=3 
SV=1\nMNMTGKFITLDGVDGAGKSTHIAFVADWLRRQGREVIVTREPGGTPLGETLRELLLHRDMDADTELLLMFAARQEHLAQLILPALARGAWVLSDRFTDASYAYQCGGRGIAAERVAALEAWVQRGFSPDLTLLFDVPPEVAEARRSAARAADRFEREAELFYNRVRQAYLDRAQADPQRIRVLDARHTIAELQAEITRLLQELA\n>tr|A0A6D1WBS5|A0A6D1WBS5_9PSED Arabinose 5-phosphate isomerase OS=Pseudomonas sp. JMN1 OX=2518650 GN=EXW70_13605 PE=3 SV=1\nMSQSSDLIQSAQRTIRLELEAVEGLLAHIDADFVRACEMILASKGRVVVVGMGKSGHVGNKIAATLASTGTTAFFVHPAEASHGDMGMITKDDIILALSNSGTTNEIVTLLPLIKRLGIQMISITGNPESTLAKAAEVNLNVHVAHEACPLNLAPTSSTTAALVMGDALAVALLEARGFTAEDFAFSHPGGALGRRLLLKVENVMHAGDELPHVQRGTLLKDALMEMTRKGLGMTVILETDGRLAGVFTDGDLRRTLDRTIDIHTATIDAVMTPHGKTARPEMLAAEALKIMEDHKIGALVVVDSDDHPIGALNMHDLLRAGVM\n>tr|A0A2L2WP68|A0A2L2WP68_9BACT Ribosomal RNA small subunit methyltransferase E OS=Prevotella sp. MGM1 OX=2033405 GN=PvtlMGM1_1921 PE=3 SV=1\nMKETRFFYVPNASISEELPEEEALHALRVLRLNVGDEIVLMDGCGKYYNAEVTFASNKRCVYKILEEHPQKCQWARHYHIAIAPTKMMERMEWMVEKATEIGIDEFSFLNCKFSERRIIKLPRIDKIVISAIKQSHKAWKPQVNDMIAFKQFISTPRAGLKFIAHCYTEIPRKYFFDELKTQGQMDDVTVLIGPEGDFSIEEVRLAIDKGYVPVHLGESRFRTETAAIAALMMMQLSDKLNGK\n>tr|A0A663BED7|A0A663BED7_9ENTR Crossover junction endodeoxyribonuclease RuvC OS=Klebsiella quasipneumoniae subsp. 
similipneumoniae OX=1463164 GN=ruvC PE=3 SV=1\nMVRTLLKLPANPQADAADALAIAITHCHVSQNAAQISETRLNLARGRLR\n>tr|A0A803PXS8|A0A803PXS8_CANSA Uncharacterized protein OS=Cannabis sativa OX=3483 PE=4 SV=1\nMSGSNTNHQETKCKIRKRNCSSSSSSSLVRKYRFKRTILMGKRGGSTTPAVTMWETTSSPAPVSMAETGKGKEAAPGKSVSARKLAATLWELNQKKDGTAKLDKLPKLPSQSASLPPDPSYTPISDRRRDDHAERVGHHRTMSAVTQKFQLTDYYLGGLDSLSTASLMEVEDHARAKTHHHQHHKKCVTNNGGSNKTRLKEVSSGLATSKELVKLLNHVCGLEEQRSLSTSLFSALRFELDRALIHVDRFMREQRSKGGEIEFLVKQFAEEKAAWRSKERERIREAMSCVAEELKAEKKLRKQTERLNKKIGCELADAKAALSKAVKELEREKRAKEILEQVCDELARGIGEDRAQVEELKRESEKVREEVEKERQMLQLADVLREERVQMKLTDAKYQFEEKNAAVEQLRNELETYLLNMDNNSRSYRWSYACGEELNEDEDEESRRVSVDRDFKGRKSISEKIQWGSICLNKSDSGLELDFGNKSQGNSDGVVSQAKKQEFEDEFKRYRSSIKGLADQILSGSEMVPIHGLTSPSRQWGKT\n>tr|A0A6N7L718|A0A6N7L718_SINTE DUF1109 family protein OS=Sinorhizobium terangae OX=110322 GN=GHK62_00935 PE=4 SV=1\nMETHELIKGLAADSRRTGMPMNTAWWAAVLIAIAIAAAVFFALLGPRPDIAGAAQTVRFLFKFVVTIALAASAFVPLRMLSRPETDPRGGLLYLAIAPALILAGVAIELVVAPAETWLTRLVGTNSLVCLTFIPLIGVGPLALLLLALRHGAPSHPALAGAIAGLTAGGIAATFYASHCTDDSPLFVATWYTIATAILALLGTLGGRYVARW\n>tr|A0A1Y4K2B0|A0A1Y4K2B0_9BACE Conjugative transposon protein TraK OS=Bacteroides sp. 
An19 OX=1965580 GN=B5F25_04455 PE=4 SV=1\nMVIKNLENKIKLVGIICVSVIIGCVIISLSSIWMARGMVADAQKKIYVLDGNVPVLVQRTSMEETLEVEAKAHVEAFHHYFFTLAPDDKYIQYTMEKAMYLVDETGLAQYNTLKEKGFYNNIMGTSAVFSIFCDSIKFDKEKMEFTYYGRQRIERRTSILMRELVTAGQLKRVPRTENNPHGLLIVNWRTLLNKDIEQKTKNNY\n>tr|A0A7X5XVZ8|A0A7X5XVZ8_9SPHN Murein tripeptide amidase MpaA OS=Sphingomonas trueperi OX=53317 GN=GGR89_000656 PE=4 SV=1\nMSIQISAAFDSGNIRVVAIEGDRVDCEIVLDHQSDFFQWFHFRVAGAKGRTLTFRILNAGSSAYPFGWPGYKARWSADRESWRMTETDYADGILSFTHHFQTDLTWFAYFAPYSMERHHDLVSRIALQEGVTHRQLGETLDGQPIDCLTMGEGPKQVWLYARQHPGESMAEWWMEGALEFLTDEDNAVAQALRTKATFHCVPNMNPDGSRRGHLRTNAAGVNLNREWHTPTPERSPEVLAVRNAMDATGVDFAMDVHGDEAIPANFLAGFEGIPSWTDALGEKFYEFGRRLAAHTPDFQTELGYDKSPPGKANLAMSTNQLAERFGAVSMTLEMPFKDHDANADPEFGWSPTRSKLLAHACLETLAGMIDTL\n>tr|C7LTP9|C7LTP9_DESBD Diguanylate cyclase OS=Desulfomicrobium baculatum (strain DSM 4028 / VKM B-1378 / X) OX=525897 GN=Dbac_0207 PE=4 SV=1\nMLNFFCGGQPVKERSSSRVSAPETAAQASFDPGRASWPSRIGIVRRVALLLFVLVLVPMGTTLAMLESGTVIDPVNMLVASLAVALGLLAPISRIGAHFLVLRDLRLLNEFCSQIQQGRYGARFPVGLEGDDEHEMLRLKRNMNWMAHHIETQTKKLHERLDESDLRKRFYEEMSYRDPLTGLYNRRYFDCFVPNALRDPARRQGVFLALLDCDGFKRVNDTHGHQVGDEVLATLGRVIGESVREGVDVGFRFGGDEFGVIFRTVDFSACLGACERIRVRFANSNADGCTVSIGLCAWSPALGHDMPDLVRSCDTCLYQAKGLGGNQVVTNETVSIPPRLSSPAPS\n>tr|A0A3D3VBE3|A0A3D3VBE3_9PROT Cysteine synthase A (Fragment) OS=Rhodospirillaceae bacterium OX=1898112 GN=DIT35_08550 PE=4 SV=1\nAARKLARLEGIPVGISSGAALAAAAEVGSREEMTGKLMVVLLPSFAERYLSTALFEGV\n>tr|A0A7X7I035|A0A7X7I035_9BACT DUF87 domain-containing protein OS=Fibrobacter sp. 
OX=35828 GN=GX639_08725 PE=4 SV=1\nMTFSPIEHNASLRIGSVEFVSPDELKVCLDLEAPDGISANAGIPRAFPRINSYVLIATEAGYIVAQVEWIAIEKTPFPKRKGFQDYGLVDLPYPTRKLRANPLGILKQNSNNQFEFQRGVQSFPSIGEPVLIPTDQQLQAIVESGKNRRIKIGSSPIAGNAEVMIDPDRLFGRHLAVLGNTGSGKSCSVAGLIQWSLAAARPKDSEPNARFIVLDPNGEYTKVFKDKGRVFHVGSDANSLQVPLWFWNSAEWCSFTQASAKAQVPMLKRALREIRSGGGRIASDVDLELRRKISSILISLRTQIRNGDNYEGWKFGPKLEAYKKDIEAFARHFSGHTTTLGEISNAITKALSFPHQTYIKKDGCIGYNDFPVVNIEPIENVIEKFLTTIGGLVFQNDFNEDIPLSFNSVQFADHIDNLAREDSNPHFFEFLVMRIRTMLADTHMQSILGDTVDMTLEKWLKTYIGDNNPTNGCVTIIDLSLVPAEIVHIVTSVISHMVFEALQRYHKHKKTSLPTVLVMEEAHTFVKKYKEEAENQSVSAMCCQIFEKIAREGRKFGLGIVLSSQRPSELSPTVLSQCNSFLLHRISNDKDQELVSRLVPDNLRGLLRELPSLPSQNAILLGWASELPIMVRMNDLNKSERPHSDDPDFWNVWTGKDECGNTVVRDVDWEKIAADWQGRIK\n>tr|A0A1Q6MVU0|A0A1Q6MVU0_9FIRM Phosphoesterase OS=Coprobacillus sp. CAG:235_29_27 OX=1896995 GN=BHW13_05765 PE=3 SV=1\nMKILLVSDSHGYDDELKKVLENVKCNLKIHCGDSCFDKNSPFIKEFAAIVDGNHDQGFFPLTATLPTALGNILITHGHKFNVYAGYDYLVEYMNKADIHICFHGHTHVPHYEIYKNKIFINPGSIMFNRGQSQCGSYAIVSVDDKLHVDFFDSRTQKKIPQSLIDKDQDILNEFKRFACQK\n>tr|A0A495SQH4|A0A495SQH4_9FLAO Helix-turn-helix protein OS=Chryseobacterium defluvii OX=160396 GN=BCF58_0976 PE=4 SV=1\nMKTSPKPYSILLFILLFHAVSSELRGQYSEFYQIRKRYEDRKENDTSALPLVQISIEKAKREKNYHELYNGYKFSGYFSESKNSKLIYADSAIEAAFLSKDEALISRAYMGKGIVYYYSFKKYKQALDQYLKAYEYSKKTKDQYQQNKLQYHIGVVKSYIGFYDDALDNLYPSKNYFYNESLKKDIHPNILFGIKRGYFNSLHQILVCYRNLRDYKRIDSLLALAVNDQNLKDNYTLEYGYFLKEKGINEFHKADFRSSITSLNQSLIPIKKAKDFAWESVCYAYLGKSYLRLNNEKKAIEYFTKVDSIFQKEEFMIPEVRDSYECLIQYYKTRGEAKSQLYYTGQLVKADNILNRKFPYLSSKIFREYDTSKLNETHHQEKKTLQREKVIFIGGTIFLLVIFLHRYWKEQNLQKNYRLLEERILNKNVKSNKTQDRQDNPYSLEIEKEILDDLLKKLEDFEKKNKFLESGITLYKLASKFQTNSTYLSQVINEYKGSNFKKYIGELRIEYITQKLYNDKKYLSYTIEGLAEECGIASRPNFSNLFQEYNGIRPRDFIKKRMEDLKNKENLEEGAISCE\n>tr|A0A182RGG3|A0A182RGG3_ANOFN Uncharacterized protein OS=Anopheles funestus OX=62324 PE=4 
SV=1\nMEEFLEAIQCGQYEVVRAALKNSDLDLDHQDPAREGNSALHLATIAKHNKTRLIELLIEAGADCDLRNHANLTPAELALDNGSQYVAEFTLCKELDAVPDDQALRRLIRRGSVELLKIFLEKRAFDIHTKMKLIANLLDELTVKGVPIDRSMRVFLEYELIAHSYEDGTEGNATRQRRLGASGGASSKRKADGKVQSSTGETEADRRIELVLSYTKYLTDRYDDDNLNDLDDEFVVRLRAICECLYYLDGLDCCARSDWKLLKLIPLGELAYLCSVLLSILEKSVGFEMYKLVLNKHQIVSFLRAVSAELGTLVKASTRTVRTDRSFQWTPQLLLDLIVCIREQKLSQYVGRRRRACEDLQRIATTTCPLGAAEHDRVLVELGRRELIALQDGVLERGTKWGVADYVAYLRDDHPLTVGQLWHRYHPKLRLSKRQVAYAASRRELLSKIRARRLDELSRNKTKLLERELGARELQGSPSARTVRRRHRTVFGHIRRTYEQIWQMHTVKKIAYYVENALVIDLDDRSNATLCLMAIQRVMQFIGEVSKESQQHQATFARMLANLLDHVLSPLCTTATLTDADDLRESFSARCSVGKYFLHETLTGEQVRTIQERLKAVYRFCLYVINIQLIEAYKTFLGTAYRLRNTNQLQSYARYIGEHNLHTLSHIKFEHVFYDEKETARIVQELKKMYLGMSNELKLLSFIEKNIHFRFYHMQYHQTRLRVTLSNFAIVYRALKANPDYGCVRRLLHSYLHQSYQKYDISRSISISDANLALKELLRPYSSISENEDTLKVVRHLEELQHLMDPDRLFGINPVHRTGGHSSLEAARYQKFTRKLLKDMNASTLNDEEFQQLHDKLSRMYYGNIFLVQQRYHTLEEFFRTKGVALDETDLLTRRESDEEMLQELFDSKVNDVVEILEKFECTDVQNLCEVIEQLPPVVQFALEYGLLELLEILTSVNAIGSNRWHSLQCSTAVLCGHNLKTFLTGGRESQVLESLTLKSNATIFLNAIIFKQRSYELYGGRVDGRHCSKSKLMVSCFADKFANRLQWLEQQRILYETIRTGEVKLSTLRRQVRDGVEIGGQRFGSLMPNEMCHYGLIDCAIAGDFRAMIDLLTETDSTAESGVSSSERHHLLRYLLRRTTKSHFIAEPLERMKQEDRHTLVLYLCLFLGDVALFRQQLVRYNAYDELHLFVNSEDHRFVQQLLSELPDYDWSRTDANGMTILQKLVNAGNQPAIEDLIRRMSPEQLNSLCSMKYTALNLAARLNLVEIVRVLASAGIDLNVMSEDEKLPVFWLIQYGNSRTVVQQTIDAATELTAFSSELCLLHRAIEYDNEDVLRYLIEDCKVDPTRIYSNCNNVLHVAAGFDRCRIMRYLLTIPGLRKIVNNCNLVKNSPLNVACKEGYIRSARVLLAQGGASTETCGEYGLNALAFAMYTNNVKLARCLFRYDASIGNPLSSDFQPINMAIRNRNIRMLELLLRRGVDVNSAPLCFINAVYAQSRDIVQLLIGRGVKHVNHRDEFCQTALHLCVERDEYEMARDLIRYGAHINAKNRSGMTPLHLAVQRGNVRLVQLLLDHKCSVDELNYHGETPLIRAVASNNTKLVKILLNNGASIERLRNSDPPVLLYLVQENHEEILDYLLEHYQFNANEQDAYGNTLLYVATQHNHINIVKLLVDKYHAKTNPTNHKKLTPLMIARVKEYKEIFHFLEARLVEE\n>tr|A0A1S9BZC6|A0A1S9BZC6_9FIRM Oligoendopeptidase F OS=Oribacterium sp. 
C9 OX=1943579 GN=BXO88_02085 PE=4 SV=1\nMKFSEMPYERIDFTKLSKDFKELEERFEKAASGEEQYAVHEDFYKIYNHVMTESQIAMIRSDIDMSDEALLEEQQYFDENMPVFQNLVVSYRKKLFNSKFRPYLEERIGKVAFRNIELAMKSVDEKLIPLMQEENKLQTEYNKLLASARIPWNGEELNLSLMNPYLHNQDRTIRKEAWEKYSAFFVAHQEELDDFYDKLVKNRTKQGELMGHENYLPLGYARMNRNSFGRSDVEEFRKQVKKDFVPFAEKLHDIRRQQLGLSRLSYIDEGVYFTNGNPAPTGTPEEILAAGRKMYNELSPETGRFINFMCDSELFDVLGRKNKKTGGYMTMIPDYQAPFVFANFNGTSGDADVITHECGHAFQGYITAGDPVIEHNDITMEVAETHSMSMEFFTEPWMPLIFGNRAEDYVKMHFMDSVIFIPYGTMVDEYQDIVYSNPGLTPKARNEVWRDLERQYKPHLDYTGNEYFEKGGYWQRQHHIYDSPLYYIDYCIAGANALQYKVWMDQDYKAAWKSYLELCRLSASDFFDGLVKKSGLNNVFEDGCLRYVVKQLEEKM\n>tr|A0A355Z3B3|A0A355Z3B3_9PORP Uncharacterized protein OS=Porphyromonadaceae bacterium OX=2049046 GN=DD424_00560 PE=4 SV=1\nMQLKSSLKQLLVESRANPGFTSLYVGGVAFAVAFTMIFAIIYYVHLAPLYPEYNRSSTYYINNLTVRNDKTGAMNQSSVGIPFVREFVEKSKNIEYSTIVFQMQGFIQPPDQSGDFSVNIIDTNPDFFKLYSYEFVAGRPFNEAETESAINNIVVDSSVADRLFGVSEQAIGKEISISYRPYRIVGIVRSGNPVAYMSYANVFRPYTIRTKSANTSLKGDKCDYLGDYSVPIKFKDSRQAERFREELTEKVRRINAADSTGQRLDIQSAPISHTLRILSQRSNGENLSMTEYLKPLLITLLVLLIIPAINISGMIGGQMDRRLAEIGVRRSFGATRGHLTRQVMFENLILTLFGGIIGFAIAWIIIAFGRNMLLKLIIPAWECIDAPAEISTEMMFAPLVFIAALLLCLVLNLLSAYIPVRLSLRRPIISSLNSKR\n>tr|A0A195BT40|A0A195BT40_9HYME Uncharacterized protein OS=Atta colombica OX=520822 GN=ALC53_01728 PE=4 SV=1\nMAKNIGSILLLTFALSFVRADEYERQWNTPPELIPESIVKILDNEESQMRLLSLIPVTATVSLTGENNNAHSVSLDASLDGISFSESKIHDRPTGYETDGSSVSVSKSTTVSAGLSGISTAAAEAYNNGNNAKTESHSLSFGQSTATSFGTIENGQAITGAASSTGLSQSFTIGDNRRQFSQVGAVNMQYPTWSNIGPNNGYIDQRFKRPTLTISNIDPNNGYNDQRFNRPTLIISKPWDETNRPTLNIDVSDTSRQEQKPTIHIHKWQPNRRISRPDFSIKHQLHDIRNDRNHGSISLRIENKNFKQEYSGSDLISDLAQTVDKLFDIV\n>tr|A0A5B7XNA0|A0A5B7XNA0_9ENTR Mechanosensitive channel protein OS=Leclercia adecarboxylata OX=83655 GN=ybiO PE=3 
SV=1\nMPWILLLLISLFCLPAQAVSLPGMPAATAQTPPPAEPDVEQKKAAYSALADVLENDTSRQELINQLRSVAATPPQEPVPKITPPEIADEKTVLENVTDISRHYGDALATRFAQLYRNLIGSPHKAFNPQTFTAAAQQFLILAGLVFAFYWLVRLCAWPLYRRMGSWGRKKNRETSSWIHLPLTIAGAFIIDLLLLALTLFIGQILSESLNTGNPTIAFQQALFLNAFALIEFFKAILRLIFCPRVPDLRPFAINDSAAHYWSLRLSLLSGIIGYGLLVAVPIISNQVNVQIGALANVLIMLCITVWALYLIFHNKRAITEGLLHLADRSLAFFSLFIRAFALVWHWLASAYFIVLCFFSLFDPGNSLKFMMGATFRSLAIVGVAAFVSGLLSRWLAKTITLSPHVQRSYPELQKRLNGWIGVSLKVARILTVCVAIMLLLSAWGLFDFWNWLHNGAGEKTVDILIRIALILFFSAIGWTILASLIENRLSSDIHGRPLPSARARTLLTLFRNALAVIISTITIMIVLSEIGVNIAPLLAGAGALGLAISFGSQTLVKDIITGIFIQFENGMNTGDLVTIGPLTGTVERMSIRSVGVRQDTGAYHIIPWSSITTFANFVRGIGSVVANYDVDRHEDAEKAQGALKAAVDELLEREDIRGLIIGEPSFAGIVGLTSTAFTLRVSFTTQPLKQWTVRFALDSMVKKHFDLANVRMPVQMYQLLPSPTGENTQIQNRT\n>tr|A0A1F1XSS9|A0A1F1XSS9_9MICO Esterase OS=Brachybacterium sp. HMSC06H03 OX=1581127 GN=HMPREF3159_00885 PE=4 SV=1\nMIRLRTDFFAESLGMGTSMVVLMPQAASGIGMEGSDAPGAGPSADGTADGGADAGGAGAADGPAVPVLYLLHGLSDDCTIWERRTSIERYATEKGIAVVMPEVRRSFYTDEAVGEAYWTFVAEELPRIVARTFRVSTAREDTFVAGLSMGGFGALKLALNHPERFAAAASLSGAVDLTSMDLDWTGTLAQRVWGGREIAGTADDLLGLLGKRDPAELPALFLDCGTEDQLIDQNRRFLAAAEQAEVEVASRLRPGAHTWEFWDEGIQDVLDWLPIRG\n>tr|A0A2D8DKP5|A0A2D8DKP5_9GAMM Oxidoreductase OS=Gammaproteobacteria bacterium OX=1913989 GN=CMQ67_01330 PE=4 SV=1\nMSDTYNAFVVDEIEDQFKSSIKSLPLPELQDGFVLIEVLYSSLNXKXALSASGNKGVTKSYPFTPGIDAVGKIRQSKDNNLKEGDEVIVTGYDLGMNTNGGFGEIIHVPSGWVVPXPNNLSMEEAISFGTAGITAAASVDAVLSKIDAPEXPVAVSGATGGVGSIAVGLLSKLGXDVTAITGKENSSQFLKDLGAKNIXLRDDFCSEKIRPLDKTKFSAGVDTVGGEILSRIISQVDRHGVITCCGNVNSIKLETTVFPFILRGIALQGIDSAESPITYKKYLWDKIASEWQIGYSKSSIKIIKLNELAPEIDKILNGNQQGXVVVKHGE\n>tr|A0A562L573|A0A562L573_9GAMM Aspartate--tRNA ligase OS=Luteimonas cucumeris OX=985012 GN=aspS PE=3 
SV=1\nMRTHFCGLVDEALIGQTVTLCGWADVARNLGGLCFIDLRDHEGIVQIVAEPDADMAGNADVIAAASQVGYEDCLRVTGVVRRRQSVNDKIRTGQVEVVATKIELLNKAEPLPFHAHENAGEDIRLKYRYLDLRTPEMQRKMRTRIKLVQALRRWLDARDFQDIETPILTKATPEGARDFLVPARMHPGEFYALPQSPQLFKQILMVAGFDRYYQIARCFRDEALRADRQLEFTQLDMEFAWVGERDVQDTTEEMIRSVFREVMGVELASEFPRMTYAEAMRRYGSDKPDLRIALELTDVAELVRNCEFKVFSDWANHADGRVVALRAPGAAALSRKQIDDYAAHAAKHGAKGLAWMKIEDAAKGRDGINSPIAKFLDDATLAAIVSATGAQSGDAIFFGAATYKSASDFMGALRLKLGKDLGLVADGWAPLWVTDFPMFEWDDEEQRYVALHHPFTAPAVDDAADLRANAKTAVSRGYDMVLNGNEIGGGSIRIHNSQMQSTVFELLGIGAEEAEGKFGFLLDALRFGAPPHGGIAFGIDRIAALMAGTESIRDVIAFPKTTTAQCLMTGAPSPVPDKQLAEVHVSIRPKAQP\n>tr|A0A830CSJ2|A0A830CSJ2_9LAMI Uncharacterized protein OS=Phtheirospermum japonicum OX=374723 GN=PHJA_002054300 PE=4 SV=1\nMAMRTFYNEIKGMKVKELPAHLKPMFTIDYAKNSVKRGLDNYHAKYIETSSVDPLFHICFGGMIFSYLVALPEERRHLEHAKEHGGGH\n>tr|A0A5R2N5V0|A0A5R2N5V0_9HYPH 23S rRNA (Pseudouridine(1915)-N(3))-methyltransferase RlmH (Fragment) OS=Mesorhizobium sp. M2D.F.Ca.ET.145.01.1.1 OX=2563933 GN=rlmH PE=3 SV=1\nMKISVHAVGRMKAGPERELADRYFERFAKSGPAVGLEFAGITEIAEGRAQSASERQRDEGSRLQAQLQPGTALILLDERGKNLSSQDFASHIGQLRNGGRKALVLAIGGADGHDPPLRDQAELVMSFGALTWPHQLVRVMLGEQLYRVATRSEEH\n>tr|A0A7G8J7C1|A0A7G8J7C1_9SYNE Uncharacterized protein OS=Synechococcus sp. 
SYN20 OX=1050714 GN=SynSYN20_02147 PE=4 SV=1\nMVVDCLDHLFLILWSFTTFIDLGFRDLMFFDRLLHAFCFC\n>tr|A0A1L8E3I3|A0A1L8E3I3_9DIPT UDP-glucose 4-epimerase OS=Nyssomyia neivai OX=330878 PE=3 SV=1\nMSNGKTVLVTGGAGYIGSHCVVSLQEAGYQVIALDNFTNAVNNFKNESMALQRVAQITGKDVAFYKCDLLDKEALEQIFQQYKIDSVIHFAAMKAVGESMQQPLLYYKNNLIGMIHLLEVMKKHKVFNLVFSSSCTVYGEPKELPITEEKETGKVTNVYGRTKFFIEEMLRDISVAEEEWNIIALRYFNPVGAHKSGLIGEDPTKQFTNLMPYISQVASGKKDCLTIFGDDYDTPDGTGIRDYIHVMDLSTGHVKALEKLEKQHLRLKMYNLGTGKGVSVLELLQTFERVNNVKVPYVIEARREGDISSMYADPTLAETELGWKAECTLEEMCTDFWRWQTMNPNGYKTGIVNGH\n>tr|A0A1M3I4N8|A0A1M3I4N8_9SPHN 3-oxoacyl-ACP reductase OS=Sphingomonadales bacterium 63-6 OX=1895846 GN=BGO57_05825 PE=3 SV=1\nMSISFEGRVAIVTGAGGGLGRAYALELAKRGAKVVVNDLGGARDGTGHSDAALKVVEEIEAAGGEAMSNGASVTEYAQMVEMVAKAKEKWGGVHVLINNAGVLRDKSFSKMEPEDFEFVVKVHLFGSAYATKACWELMREQNYGRVMMTASSSGLFGNFGQANYGAAKLGLAGLAKTLHLEGAKYNIRVNTLAPLAATRMTEDIIPEQIFPMFAPENVVPAALFLVSEDAPNNVIVGAGAGGYHSAWVTMNTPVILPEGERSVEGFAAHWDQISSREGDFVPVSGMEQTQRVLAAIQKAAAGG\n>tr|A0A7C6JME1|A0A7C6JME1_9BACT ABC-F family ATP-binding cassette domain-containing protein OS=Petrimonas sp. 
OX=2023866 GN=GXX67_10465 PE=4 SV=1\nMATPILQIDKLTKSFGDLLLFRESSFGIAEGEKVGLIARNGAGKTTLLNILAGKEPYDDGRVVFRNDTRVAYLEQSPTFDPDLTVMEACFSSDNEVVRLIARYEEVIASGDTSNLEEVLTQMDFHNAWERELQVKQVLTWLNITDFQQKMGELSGGQVKRVALANVLISEPDLLIMDEPTNHLDLEMVEWLEERLTRSSVTLLMVTHDRYFLDRVCTRLLEIDDQQIYAYKGNYSYYLEKREERVMAQQAEVERARNLLRKELEWMRRQPQARGTKAKYRIDAFHDLAEKARGESAEQSVRFAAKGSYIGKKIFEAKNVSKRFGDIRITESFNYTFTRYEKMGIVGKNGTGKSTFVKMLLGEVKPDSGYFEIGETVRFGYYSQEGMEFDEQLKVLEAVQKIAEVIDLGEGYRLTASQFLQHFLFPPEKQYDYVYKLSGGEKRRLYLCTVLLKNPNFLVLDEPTNDLDILTLNVLEEYLAGFKGCLIVVSHDRYFMDKVVDHLLVFHGDAKIQDFPGNYSQYREWKAEEDRREAAEAKAEAVKIEAAKAEAINPGKGRVALPNGKTDELGVGSSGETDPETTDLTTHGSKKGEKKRLTYKERQEYESLEGEIERLEKEKESISELLSSGNLPAEELISQSERLSLLLEQIDEKMMRWLELSERA\n>tr|A0A839T1V7|A0A839T1V7_AZOMA Ribosome biogenesis GTPase OS=Azomonas macrocytogenes OX=69962 GN=FHR87_000879 PE=4 SV=1\nMAKRQLNRRQSWRIEKIQEERANRAARRESRLVDELEGGDLGREQEGLVIAHFGVQVEVEARQDELAGQIFRCHLRANLPALVTGDQVVWRPGNQGNGVIVAQLPRRTELCRPDSRGQLKPVAANVDRIVIVFAPLPEPHANLIDRYLVAAEHAGIQPLLLLNKADLVTAENQVRLETLLAVYRALDYPLLEVSARQGSGMDELKARLDGHVSVFVGQSGVGKSSLVNSLLPGLDTRVGALSELTGKGTHTTTTARLFHFPGGGELIDSPGIREFSLGHVTRAEIEAGFREFDDLLGRCRFRDCHHEHEPGCALLKALEQGRIHPQRMESYRHILSSLPQTEY\n>tr|A0A523ZWY7|A0A523ZWY7_9ARCH Transcriptional regulator (Fragment) OS=Candidatus Bathyarchaeota archaeon OX=2026714 GN=E3J20_08840 PE=4 SV=1\nHLYVVESADFLFLMRQTGMTFGNLSSHMSRLETAGYIDVEKEFVGKKPNTKLHLTEDGRAAFQEYRRNMRHVFGDLSS\n>tr|A0A0B5IZ06|A0A0B5IZ06_9VIRU Uncharacterized protein OS=Pandoravirus inopinatum OX=1605721 PE=4 SV=1\nMSQARRVGWRSRRPDAPIHYFFLLHRQTIAGEKRWSSFFGIVSVVLAPLFFSDKRPRPAPPAALSNRTRHGQAARLHTRKAHKACLLRHNQKSIIPSEKEEAEQEKGKQ\n>tr|A0A7W5U4L6|A0A7W5U4L6_9HYPH Surface antigen OS=Rhizobium sp. 
BK612 OX=2586988 GN=FHX13_001390 PE=4 SV=1\nMKLRTFFLVVPSLFAALALSGCSTTSSLGGGKSLFSSAKPPASATFINALDGGIVERTGIKLSDSDKQRALEAEYRALETSPLGQPVAWKGRNASGEVVPAAPYQVGSQNCRQYTHTVTVDGKPTTARGAACRNDDGTWTPLE\n>tr|A0A382FFA2|A0A382FFA2_9ZZZZ Uncharacterized protein (Fragment) OS=marine metagenome OX=408172 GN=METZ01_LOCUS214166 PE=4 SV=1\nVDKNIIAAGDKTTVEAAKEILWLGGNAYDAAVAAVFTSMTAEPALTGPGGGGHFMAYPADGRAVLFDFFVDMPSGVIEPN\n>tr|A0A835W1B8|A0A835W1B8_CHLIN Uncharacterized protein OS=Chlamydomonas incerta OX=51695 GN=HXX76_008806 PE=4 SV=1\nMEEARVAAVSVSGGVRQQPQVQAQAQTRAASPAASAADAGVGATAATAATPGFAAATATDSAAAATAVAASGPAAAGGGRRPSRSAAVRARSAITHQLHEEQLPLAKREKRDAEFSEQVSDVEGDGVAGTGAAPAAATTAAAEPCGSPPVGDAAAAKQRPRKLRLLPRAPNVICAACAKSCAARGGFFAQGTGAYTCSSCCSRNRIECGFYGPPGTHSLEEAGGRKHNAQQSRPRGISPSASASEGATAVRVVTAATAGTAATAAPGAKAPSGTAAVAGLAAAGGGQKAAAAKAAVARATARVHGAAGASTARKRLPPPPPRPPPPPPPLEDAVPAEDATPAGDATPAPAQPAPPKCTTCGAVRAPHKLTSPGFFARGTGAYTCHGCCVRNLKSAHGFYGPPGTRSLEEAGGRECAECGTQGANSTSWRLHPDRLGHYLCSSCSGRYESRKRKLDRSGGGGGGPAPKAQKRSLGGVVDKASGGGDAPAAAENATAPAAAGKGGSGTKRQRQLAEAAGAGSRSGADAAASSAAAAAPATPAATRQAQSQQPKRQGPTKAASGTVRQAAPAAAAPDGPPAGGGGGAAPAAAAGRPPPAPEPKCSGCSSSFKRTDNGLFGFFSHGTGAYTCHGCCSRNQHAQGFYGPLGTRSLEEAGGRACAGCGRQDATQWRPYPPRLGAYACAACISKHTRRMQQEAQDPEGLTAPADAPRRQTPQPPQQQQQQPKQQPKQQPKQQPKQQQSQQQSPGQGQRQSQPQASGSGPAHSCATPAAPQAQGRGARLGAAPSRAATSAAPAARAQASSQAGASTGLCGASDAAATAATASMSRSTNATAATAFTSSEWTSPAVDGIRCDFCGGRFVRAATGQFGFFARGSSVYTCHGCCCRNLSRYAFYGPPGTRSLQEAGGRECASCRTTQAERWLPHRFRLGLYLCRPCRCRQDKGTLPKVGGGARGNQQAAAAATKAAAPKAVAAKPVAAAGGSARAPPQRRTAAARSEHVVGSDDEELEEQAADGEEEVEKAEDEAEDEEAARSARQRLEQEAAARVRSSRALLAASVDASAVAVAGLIAAEQAAGRRGSSSSGNNSSSCRLPAPPKLEQVAGRISAWLQAHVCQQPLALLLGPSAKALGLDREDGLLGLEAEEQETWNVCRARVCGVWLRVAHQAMEPAAATSPAADAAATAAAAAAAAAAVEARAGAQPAAPSSPAAVQQFRMVAFRASTALASELARWLRSAPRLEVPRASPPPAAPLTPAHAPAARPVRPAGPAEAAQHTSAPGPSQCAAASAAGDGAAVSAGAEVGGGSGGGGSALPPRSPAGSASGSGPAAELPGEDIRVLEAALQPLLLRSVCEAMWLGLTEGSAGDGGVGGGRRRI\n>tr|A0A7X4ZEP7|A0A7X4ZEP7_9CLOT Sugar isomerase OS=Clostridiaceae bacterium OX=1898204 GN=D3Z55_07300 PE=4 
SV=1\nMRNRMGKLKRNSIVALAAQIVNIISAFILPRLILSTFGSDVNGLVNSISQFLQIIGLLELGVGAVVESSLYKPLSERNNLKLSQIMTSATKFYKKIAIVLLIYSVGLVMLYPATVGQAYPFFDVAILIIALSVNSFAQYYFGMVNALLLNADQRSYIVQMLSIIATIANTVISVLLIYSGCSIQAVKVVSSFVFLSKPIFLNNYIKRHYQINYHEVYEVEPIPQKWYGIAQHMAHIVLDSTDVVILTIFSSLSSVSVYSVYNLVTNGMRSLVLSVGTGMQSLLGELIAKKEKGKLDTVFARLDWLIHTVAVVCFGCTMALVVPFVQIYTSGVTDINYVQSLFAFFISLAQCFRCIRLPYNVVILAAGHYKQTQSNYIVAALLNISISIFTVIRFGLVGVAIGTLVAFVYQNIWMAHYISKHIVCWPFKNFIRQTLIDLITLACGYAVTRSLYLGELNYVHWMLNGMLTSVIWIALSMIINFIFYRERLREIYYRYIRRLIG\n>tr|A0A7J5A9S6|A0A7J5A9S6_9FLAO RecQ family ATP-dependent DNA helicase OS=Flavobacterium luteum OX=2026654 GN=F6464_13185 PE=4 SV=1\nMQTALQILQKYWKHDAFRSLQNEIIDAVLNGKDTFALMPTGGGKSICFQIPGMMKEGICLVISPLVALMKDQVANLQKKDIKAIALTGGIKSEEMIDLLDNCEFGNYKFLYLSPERLQSDWILERLKNLPINLIAIDEAHCVSQWGHDFRPAYLKIAELKPHFPKVPFLALTATATPKVKEDIIAELNLLNPQIFQKSFARENIAYMVFEVEDKLFRIEQILRKNPQPSIIYVRNRKSCLEVSSQLQSLGIKSTYYHGGLSPKEKDKNMQLWMREEVQVIVATNAFGMGIDKANVKTVIHIQLPENLENYYQEAGRCGRDGEKAFSVILTSPSDIVQAESQFIAVLPDKSFLNTMYVKLCNYFQIAYGEGINEQFSFNLNHFCLKYGFPILKTYNAMQFLDRQGIISLSQEFTEKITLQFLISSKEVIRYVSLNPNDESIILNILRTYPGVYDMQTSFNLQLIAKKSNHSENEVLAVLHKLKEKEIIDYHSRNNDATLIFNEVREDERTINRVSKYLERQNNLKKEQLDAVLHYIQEKSVCRSKLILNYFGEKTDSVCGVCSYCISKNSKKRNTTTTTEAIIILLNKGDLNSREIEIKLKYNAEDIIFALQQLLDNDTIMVKPNNKYSIKL\n>tr|A0A7K6EWN1|A0A7K6EWN1_9PASS F162A protein (Fragment) OS=Grantiella picta OX=266360 GN=Fam162a_1 PE=3 SV=1\nLASLHPLLSLPDRAVKLLGKNIPSILRMSEGVDPKISRRLSIKPQEDLQPKSRSASGVPGYKPTNWEKRFLLWAGHYKKPEDIPETVSIETVRAAMTKLRVKFSYVMIALTIVGCITMVIRGKQAMKRHESLTSINLEKKAQWKAESASAKP\n>tr|B0YHV5|B0YHV5_ULVIN Ribulose bisphosphate carboxylase large chain (Fragment) OS=Ulva intestinalis OX=3116 GN=rbcL PE=3 
SV=1\nILAAFRMTPQPGVPAEEAGAAVAAESSTGTWTTVWTDGLTSLDRYKGRCYDIEPLGEDDQYIAYIAYPLDLFEEGSVTNLFTSIVGNVFGFKALRALRLEDLRIPPAYVKTFQGPPHGIQVERDKLNKYGRGLLGCTIKPKLGLSAKNYGRAVYECLRGGLDFTKDDENVNSQPFMRWRDRFLFVAEAIYKSQSETGEVKGHYLNATAGTCEEMMERGQFAKDLGVPIVMHDYITGGFTANTTLSRFCRASGLLLHIHRAMHAVIDRQRNHGIHFRVLAKILRMSGGDHLHSGTVVGKLEGEREITLGFVDLMRDDYIE\n>tr|A0A2S8NPN6|A0A2S8NPN6_9MOLU Uncharacterized protein OS=Spiroplasma sp. ChiS OX=2099885 GN=C6B38_09260 PE=4 SV=1\nMKTLHEMIKDLTGIDVEQDKISDYLEEEVLYLHGAYLRYANLSCANLKGIKITKKQLDQLTVIEENE\n>tr|N8Y4E3|N8Y4E3_9GAMM Uncharacterized protein OS=Acinetobacter gerneri DSM 14967 = CIP 107464 OX=1120926 GN=F960_03962 PE=3 SV=1\nMKLDPQTALVHAERKAPQYIETVQAPIYRASTIIFKNTSALFDRHWTDDYDYSYGTHGTPTTYTLADNIAQIEGGHYCLLAPSGLSAINLVNSCFLSQGDEVWVADNIYGPNMEHLQDLAKRYGVIVKVYNALDVDSFQPSDKCKLLWLEAAGSVSLEFPDLVQLVKKAQALNILTALDNTWGAGLAFSPFDFSSEHLKVDISVHALTKYPSGGGDILMGSVVSQDKALHHKLFQTHAIQGISVSGDDVAQVQRSLASMQIRYEQQAKSALTLLAWLKQQKQFAQVLHPADPDAAGHQFWQEVCQTQKSAGLVSVIFNDHYDLTDIRKFCDNLNLFKLGFSWGGPVSLAMLYDLKKMRALDYPHLKQGFLVRFCIGLEEPNDLIQDIENALNKMK\n>tr|A0A7S0UZ86|A0A7S0UZ86_9CRYP Hypothetical protein OS=Hemiselmis tepida OX=464990 GN=HTEP1355_LOCUS251 PE=4 SV=1\nFWFGGEKEKVTDHCRSWRARSLAGGGRLGARLGGRPTGDLTRSRQLGMLFARLAGKAPFDSPGAWDSPSADADIGGADYGKPINLSIYKSIKDDQCSRRRTGCDWTVVGPVTARSRRWEFK\n>tr|A0A015LJQ4|A0A015LJQ4_RHIIW DNA helicase OS=Rhizophagus irregularis (strain DAOM 197198w) OX=1432141 GN=RirG_229180 PE=3 
SV=1\nMSESPSRNRNENNTPEREQPSSPQTMSDAMLESPNRNRNENNTPEREQPSSPQTMSDAMLESPNRNRNENNTPEREQPSSPQTMSDAMLESPNRNRNENNTPEREQPSSPQTMSDAMLESPNRNRNENNTPEREQPSSPQTMSDAMLESPNRNRNENNTPEREQPSSPQTMSDAMLESPNRNRNENNTPEREQPSSPQTMSDAMLESPNRNRNENNTPEREQHFSPQTMSDAMLESPNRNENENNTSEREQRRSLTQTISDAADSTRNFISNALGLRQEQDNMSTPTHLRTENYSNVHTPRNLLSPATVASSLATPRSISSPRTPRRSQISHDNTPRKSQTSTPRRRINTNPENLAENPDNDLLKEYYEGIKSGSATPRTPRRQQRRGDIHSARSAKRLIDLDIQKGDEDVTMLEAEEKITTDQIWGTTIKVEEVRKSFKKFLKEFKLSDLSRRNGRSDDDPFYIEYLKIIERTEEFKFNLDTQNLLAFEDTHKLYYQIVRYPQEIIPILDYVVAQMYTELHEKEPKEDIRVFRVRPYNLGISKNMRELNPSDIDQLVCIKGLLIRSSPILPEMAVAFFRCSICDKSVEVEVDRSKIDEPSRCPRKQCNSSGTMVLIHNRSIFKDKQVCRLQETPDCIPDGQTPHTISLCLYDNLVDIARPGDKIELTAIYRSSPIRVNNRQRTIKSLFKTYLDVVHIRRSENIHENGDNDFTQIYHGLEDENKEVENVQEGFSHDHFSRDQKRKQLTFTEADIQYFKELSKNPLLYETLAHSLAPSIFGMDDVKKGILLQLFGGTNKLFRKSGSPRFRGDINVLLVGDPGTSKSQMLQYVHKIVPRGIYTSGKGSSAVGLTAYVTRDPDTKQMVLESGALVLSDGGVCCIDEFDKMSDGTRAVLHEVMEQQTVSVAKAGIITTLNARTSILASANPIDSKYDPKKSIVRNIDLPPTLMSRFDLIYLVLDKIDKQADWELATHLVSLYAEDSPFSASVNILPVETLAKYIHYARIHYNPIIGNDEAHKALVDAYVSLRRLGQDPRSSENIVTATTRQLESMIRLAEAHARMRLSNTVEMADVEEAERLLREAIKLSALDPETGRIDLDLITTGHGSYERRLLTVMREAFQKMLNRRNITSINWKKALEDFNEQSDVKINEKQFETMVNSLEQEGILRLAGNGNDREIITLNEDDE\n>tr|Q0V3S1|Q0V3S1_PHANO Eukaryotic translation initiation factor 6 OS=Phaeosphaeria nodorum (strain SN15 / ATCC MYA-4574 / FGSC 10173) OX=321614 GN=TIF6 PE=3 SV=1\nMAVRAQFENSNEVGVFSTLTNAYAIVAVGASENFYSVFEAELQDVIPICHATIAGTRIVGRLTAGNKKGLLVPTTTTDQELQHLRNSIPDSVKIQRIEERLSALGNVICCNDHVALVHPDIERETEEIIADALGVEVFRQTIADNVLTGSYMALSNQGGIVHPKTSIQDQDELSSLLQVPLVAGSVNRGSAVVGAGMVVNDWMAVTGLDTTATELSVVESVFRLGEGNGPSNINTTHKDAMVESFY\n>tr|A0A816CJR2|A0A816CJR2_ADIRI Hypothetical protein OS=Adineta ricciae OX=249248 GN=XAT740_LOCUS50392 PE=4 SV=1\nMSIIDVDDAKNRLQEYCQQRNLPLPIYSLIEKTGPDHSPMFQVEVIVDGMTFIGDRSTKKRVAEKLAASEALDYINKPQSPPKKIVNQQTKDPFTLFQSLNLEDESTEIESMEYD\n>tr|K1XWP4|K1XWP4_9BACT Site-specific DNA-methyltransferase (adenine-specific) OS=uncultured bacterium (gcode 4) OX=1234023 GN=ACD_80C00146G0003 PE=3 
SV=1\nMAQLFWTGTIKSHTEILQWFDESKISLIKKLHQDWKNWLLAGETEYEQTFNQLFFWELLGYENRINRIPKGAVIGTGIADLTLWYFDEGKYSPDDIQIVCELKGAKTNLVKKQFWHGGLSAVGQWFSYKTGLKNCKRLIVSNFYEIRLYRDNQTDFEVWTLDELIDPKDNYSNLRKLYLLLHRENLLAHTGKSKTEDLLSHFREEQKEITVKFYKEYKQLRIELINDIKQHNPWISIEILIEKAQKIIDRLIFIFFCEDKGLLPDKKLKENIVRSREAGFSAWEVTKKFFGLIDKGSEQLGIPSGYNGWLFQKDDVLDNLEIGDSICKKFTDMTNYDFDDKLSVNVLGHIFEQSISDLENLKIDLLGQEVETWQLADTGKGRRKKDGIFYTPEYIVDYIVQNSVMKYLNEKEDELIKKYRGEKNDPKLVAKAEIEAYQAYQNILQNIKVLDPACGSGAFLVRVFDVLFEENKRVWSILNSLFDESETYKNILTNNIYGVDLNEESVEITKLSLWLKSAQKGKKLNNLDGNIKCGNSLIDDVFIAREKAFDWNVQFKEIMKNGGFNVIVGNPPYVRTQNLDKNSKSFFDEKYKVSYKNYDIYILFVEKAFSLLESDWVCSYIMPKKFINTDYWEKFKMFLYENNFIDSFVDFWTNQIFGDATTYTWIFVFTKGIKKTLNYKNIDDLNQFPPIWFDSINYSNLSWKDWILTNPKEKELFWKLQKESFLWEFTDRVFQGLVTGVDGIYIMEQKWNNLFSKENGKSYTFDCDIVFPLLKWTEIKRYSTPSANYKIIFPYKIVDWKAILIDEETMKNKYAEIYNYLKEFEIKLRTREWWKFDNQNWYSYSRNQNIALMPSKKILTQVLSNHSSLTLDEAWKYFFVWWWTAGWYWISIDSNWKLDYKYLLTLLNSSLLEWFLHKYASPFNGWYYAYSRATMEKLPIKEIPLSDQQPFVERADKMLALNKDLYELTGKFLHRIQDNLKIEKLTKKLEKFYELDFKYFLIELKKQKVLLTLAQQDEREPYFKECKEKILALKGEIERTDKEIDDMVFDLYGLSEEERKVVFNG\n>tr|A0A6I4N661|A0A6I4N661_9ACTN Transcriptional regulator WhiB OS=Streptomyces sp. BA2 OX=436595 GN=whiB PE=3 SV=1\nMDWRHNAVCREEDPELFFPIGNTGPALLQIEEAKAVCRRCPVMEQCLQWALESGQDSGVWGGLSEDERRAMKRRAARNRARQASA\n>tr|A0A2V5BXM8|A0A2V5BXM8_9GAMM 50S ribosomal protein L23 OS=Pantoea sp. 
AG1095 OX=2184004 GN=rplW PE=3 SV=1\nMIREERLLKVVRAPHVSEKASTAMEKTNTIVLKVAKDATKAEIVAAVEKLFEVEVKDVNTLVVKGKVKRHGQRIGRRSDWKKAYVTLKEGQNLDFVGGAE\n>tr|A0A4Q4HXK7|A0A4Q4HXK7_ECOLX IS3 family transposase (Fragment) OS=Escherichia coli OX=562 GN=EWK56_27125 PE=4 SV=1\nELPTYGYRRVWALLRRQAELDGMPAINAKRVYRIMRQNALLLERKPAVPPSKRAHTGRVAVKESNQRWCSDGFEFRCDNGEKLRVTFALDCCDREALHWAVTTGGFNSETVQDVMLGAVERRFGNELPASPVEWLTDNGSCYRANETRQFARMLGLEPKSTAVRSPESNGIAESFVKTIKRDYISVMPKPDGLTAAKNLAEAFEHYNEWHPHSALGYRSPREYLRQ\n>tr|A0A455L1B7|A0A455L1B7_9REOV Non-structural protein 2 (Fragment) OS=Rotavirus C OX=36427 GN=NSP2 PE=3 SV=1\nMAELACFVSFSLTEDKVKWFPINKKAVKTMLCAKVEKDQRSNYYDTILYGVAPPPEFRNRFKTTERHGLDYESDQYSEVVNLLADVLNMVSMPTEKFQFDIVKTVVQVRHLENLLLRIKDMDDILNENVKLRVKAVMIACNLVNETETTPLTESNDIVYQDSYFTITRLDYSSHKLLPLMTEEYKITINTKTDIPERDQTAFAAYIRYNFNKFAAISHGKRHWRLIPHSQLMAHAERLDRKIKSDKKHGRQFAYDDGDMAFVHPGWKACIGQLCGGTTFDVAKTSLYSVKTSKTVRTATNKIESDLISMVGN\n>tr|A0A2N9NG79|A0A2N9NG79_9BACT Glutaredoxin OS=Verrucomicrobia bacterium OX=2026799 GN=SBV1_130006 PE=4 SV=1\nMNKPKIVAYLKPTCGWSQGVRAIFRKYDLPYEDRDIINDPAQRQEMIERSGQMLSPCVEIDGSMLADISGEEVEAYLLAHNLVTPSNREADAPIDQPCAHEAPPSAPLHFRR\n>tr|A0A1X0RRK1|A0A1X0RRK1_RHIZD Chromatin modification-related protein EAF3 OS=Rhizopus microsporus OX=58291 GN=BCV71DRAFT_229219 PE=3 SV=1\nMYFVHYKGWKQTWDEWITEDRVLKYTESNRQKQKQLQEMNARLKTSRTPTRESTEPRGRKRYRDSDIERQRAEEETRRTEFKLIMPETLKGILVDDWENITKNRLVLNIPGEYTVDRILDEYKNQYPVKDDVLDEFIKGIRLYFNKTLGSLLLYRNEYDQYTELCADKEPSSIYGAEHLLRLFVEMPNLLAQASIDAETQNELKSRFEDFLNYMQEHEKDYFLNDYQTKA\n>tr|A0A1C3EUB3|A0A1C3EUB3_9PLAN Translational regulator CsrA OS=Planctopirus hydrillae OX=1841610 GN=csrA PE=3 SV=1\nMLVLSRKAGESLLIGQGLLGEGIQVTVVAVQGNRVRLGITAPAEVSIRRQEIVLDLPEVAGSEEPCAMSSESHSRTPEFV\n>tr|A0A810P5E5|A0A810P5E5_9MYCO Uncharacterized protein OS=Mycolicibacterium sp. 
TY81 OX=2759662 GN=MTY81_06740 PE=4 SV=1\nMPSTNWFERLTGFTEVDYESTCSRLSVDGNQLVSLVNGARYGTGTLRTPTLAELRATVTISDRGRTTVTCTVGDVGAMHGEPEFEGALFQVASQFNLLEMTHYTVTPEDGVTRYAHDHTQGPACAIAAGAGTIYRNYFAPVNGVPGQTADRQLNMLERLGLSLSTHLGRPISSLWRMENGYALCTADGLAAISDYLAAASPQTRDSLAGELAIGLHLGVEVTGVEPLPRQAVSQAYCSALPVAYSDVPQRYWEGFARLVLDSAYEATLLAAAESAANGWSNIVLLTRLGGGVFGNDDEWIDTAILRALKIVECAGLDVRLVSYGSVHPNMRGIADRWAR\n>tr|A0A2T0Q272|A0A2T0Q272_9ACTN Acetylornithine deacetylase/succinyl-diaminopimelate desuccinylase-like protein OS=Allonocardiopsis opalescens OX=1144618 GN=CLV72_105245 PE=4 SV=1\nMAEVSGEGVEGGRAEVEVVDLCRELIRIDTSNPGDHSGPGERVAAEYVAAKLDEVGLATQIFESHPRRTSVVARMEGEDPSRPPLLLHGHLDVVPADAADWSRDPFGGEIADGCVWGRGAVDMKDMDAMILAMVRERMRTGRRPPRDIVLAFLADEEAGGYFGAKWLVDHHPELFADCTEAVGEVGGFSFTVRDDLRLYLIETAEKGIAWMRLTATGTAGHGSMVNDDNAVTELAEAVARLGRHRFPLRLTKTVRAFLEEVCDAFGIEFDPDDEEAVAETVARLGPIATMIGATLRNSVNPTMLRAGYKTNVIPQTATAEVDGRFLPGLEDEYFATIDELLGPKVTRDSERQLPAVETDFSGALVAAMADALKAEDPAARAVPYCLSGGTDAKAFAELGIKGYGFAPLKLPPELNFAGMFHGIDERVPVDGLQFGVRVLNRFVDNC\n>tr|W1INK5|W1INK5_9GAMM Uncharacterized protein OS=Xenorhabdus cabanillasii JM26 OX=1427517 GN=XCR1_1340019 PE=4 SV=1\nMTEAQRTAFTVASGHFDITFLYLVCVGFFLAILFLWAAWAAVDVWNGWANEKVRNQTISQFAMRTAILLVVAVWMFAS\n>tr|A0A520JI48|A0A520JI48_SPHSX PIN domain-containing protein OS=Sphingomonas sp. 
OX=28214 GN=EOP67_16805 PE=4 SV=1\nMAGRMTTVVDASVAVKFSVEELGSAAASDLIRSEPRLVAPDLILTEAANAYWAMVRGSRLLMIHAERNLDDLPRYFDRLYPTGTLIQQALRIAFHLRHPVYDCVYLALATKLECRLITADRKFHLKAADHYPIDLLPFETD\n>tr|A0A2R7W9K3|A0A2R7W9K3_ONCFA Abhydrolase_2 domain-containing protein OS=Oncopeltus fasciatus OX=7536 GN=OFAS_OFAS008407 PE=3 SV=1\nMSGLESIRVGRAIEVEYLRLRPEAGRERTAGRFSSNMDRRYKVSGTHKFSNIILCVMVLKAWFSVSKDLIVNQQHVNKAIDLLDSIIQVEKENGIPLNRMIIGGISQGGMLAIDAVYRSYPKVAGCIAVSSVILDSNIFEAAKTRSKNPPLLMCVGSEDNAIGVELARESFQKIFKAGVPAEWKEFLGAHHELTVEELELIYERVKQLIPEKNL\n>tr|M4H1V8|M4H1V8_PLEBA Putative secretory peptide-20 OS=Pleurobrachia bachei OX=34499 PE=2 SV=1\nMRCFLILISLLALSSATAAWNPVVRDTFIPFDLESTPLQIKTDSTAGSEEQIWVRTYTADGSLVGGVGLKFTSSIQYAIGFCNNNLWVSLPVQPPEEVDKVWTIRKNTTAVSIECNGVEVLNYQLSESSDTRCVSTWGGDVVEKIMFHSSLDTASDSYRTAAVWCPVVRDTLIPFDLESTPLQIKTDLTAGSEEQITVDTYNIGSSFIGGVGVKFTSPIQYGISFCTTSWTVLPVQPGDEVDKIWTIRKTTTAVRIECNGLEVLNYQFSDSSASSCVSRWGGDVVEKILFYAYDTASDSYRVKPVKSVCPEFTVDGSVQESWNDTDIGQTVTINCQRKHVLDGSSERTCNAEGVWDSDAPLCRKLSEFRWEIEKLGVMGLRVFPYYS\n>tr|A1JIE2|A1JIE2_YERE8 Putative membrane protein OS=Yersinia enterocolitica serotype O:8 / biotype 1B (strain NCTC 13174 / 8081) OX=393305 GN=YE0246 PE=3 SV=1\nMPAFVISLWRQIVLSSPLFVLLALGYGLVRFGQWPSTITDGLTRFVFSLALPAMLFRMMCDFSERPAVDARLLIAFFGSCLVVFVIGRIIASRVFHLDGVSGSVFALGGIFSNNVMLGLPIATIMLGEKSIPAVALVLVFNGLILWTLVTISVEWARNGSPTLAGFAKTARSVLTNPLIIGIISGTLFSLTGLQLPQFIDQPVTMLGQVAPPLSLIVLGMGLAEYRVSEGWQISSAICFLKLIVQPMVIWALAWAMNLPALETQVVVLLGSMATGVNVYLMSRQFNVLTGPAAASLVMSTVLAAVTTPLILTIIGVGMS\n>tr|D5EZ65|D5EZ65_PRER2 Uncharacterized protein OS=Prevotella ruminicola (strain ATCC 19189 / JCM 8958 / 23) OX=264731 GN=PRU_0802 PE=4 SV=1\nMKATELAQQQIERAIRKIADKFPPTQEANVMTDIHFRVTQDTGELMAFDDNDEEINRCIIEDWIGDTSDNFFEEIPAVFRKCLDKMKDTIENMSILKPFSFVLENEDKESVAELYLVDDETVIFDPELMKGLDEDLDAFLKQLLAD\n>tr|S9WGT7|S9WGT7_CAMFR Uncharacterized protein OS=Camelus ferus OX=419612 GN=CB1_001879002 PE=3 
SV=1\nMASNDTFYITTENSEMSTNIVELRQIHMETIPVETIPVETIPVETMALESIEGCEDISGSWVHGGHHQLPLMALQPLVISSPNPGDHDQEMIMVQTQEEVVGYFESDNLQAGNVENQILIPVDDDAFQQTLASLAASASSSAHSHSRTRSSQGKKPSGKKSCAGSKAEAASSSKVVTKKWEQKQVSIKTLEGEFSVTMWSANNNTDLKTGQTEEHPAPNFSENMTEKKLPPEGIPGVDFSDPKQLAEFTRMKPQNTKDETPRTIACPHKGCMKMFRDNSAMRKHLHTHGPRVHVCAECGKAFVESSKLKRHQLVHTGEKPFQCTFEGCGKRFSLDFNLRTHVRIHTGEKPFVCPFDCCNRKFAQSTNLKSHILTHVKNKKSQ\n>tr|A0A183M848|A0A183M848_9TREM Uncharacterized protein OS=Schistosoma margrebowiei OX=48269 GN=SMRZ_LOCUS12223 PE=4 SV=1\nMMVGGSQQETLDPGFLLLGTRHQGVPVILKKLVLPGGFDLVSLSFTVID\n>tr|K9U3M1|K9U3M1_CHRTP Sulfate ABC transporter, inner membrane subunit CysW OS=Chroococcidiopsis thermalis (strain PCC 7203) OX=251229 GN=Chro_3349 PE=4 SV=1\nMNSRMNNSKAKSREQKSWVPTILIVVAIAYVSLVLYIPALNVFIQAFSRGVGPFFANLTRPEFLHAVQLTVMLAAIALPLNTVFGLCAAWALTRHRFPGRAFVLSLIDLPFSISPVVAGLMIVLLYGRQGWFGGWLQDRGLNIIFAFPGMVLATAFVSMPFVAREVIPVLEELGSDQEEAAKTLGANDWQIFWRVTLPNIRWGLLYGLILTNARAMGEFGAVSVVSGNISGKTQSLPLFVEDAYKQYETEAAYSAAVLLALLAVVTLVLKEILERKTRIKDVE\n>tr|A0A090PRU2|A0A090PRU2_NONUL Uncharacterized protein OS=Nonlabens ulvanivorans OX=906888 GN=JCM19298_2278 PE=4 SV=1\nMVIMKRIIYILCAVVGFTAAAQQTPAPATNKSYTIMNATAHIGNGELIENSVIVIENGKITTVADATTVKMQPKGEVINASGLHVYPGIIACNTTLGLVEIDAVKASDDDREIGTFNPHIRSLIAYNAESRVVETMRLMVFLLLK\n>tr|A0A4S0ZDT7|A0A4S0ZDT7_9BACT NAD-dependent succinate-semialdehyde dehydrogenase (Fragment) OS=bacterium M00.F.Ca.ET.156.01.1.1 OX=2563902 GN=EN799_58250 PE=3 SV=1\nMPLCLPMIRRLKSPHLFGAIDRLPALGRPVGNKTFEVVNPSTGEVLAELPDMGVEETRAAVDKAYVAQSGWAALTARERSDVLWRWHQLIIDHAGDLAAILTAEMGKPLAEAISEVSHAAAYLQWYAEEANRVYGETISAPSTDRRMLVIKQPIGVVGTITPWNFPASMVARKISPALAAGCTIVLKPAEQTPLVAGAMFALAHQAGFPDGVVNLIYASEGDRVGRELCTNSKIRKISFTGSTEVGRLLMRQCSDQIKKVSLELGGNAPFIIFDDADIDGAVDGAVQAKFRNAGQTCVSANRIYVQSSVHDEFVKKFVERIRHLSVGDGFDAGVDIGPLIDKHALAKIESHIADAIAKGGTIRCGGQRIGKNGTFFEPTVLTEISSVMAVAQEETFGPLAPIIRFNDAD\n>tr|A0A5P2QPP3|A0A5P2QPP3_9RHOB Uncharacterized protein OS=Paracoccus yeei OX=147645 GN=FOB51_08200 PE=4 
SV=1\nMQIVGICRFSLLGRGDWAAFRTIPQDKADENAEAVEARKASIFAPERLERRFTTFEHLTLASIRAQTDPDFTFVVLASELMPQPYRDRLAALCAAVPQVVLRFFPVIHAGTAQGQVFKELGIDYRQTLQFRLDDDDALCNVYIRRMRQAAGGIVPNAFPFAASFRDVLFCSVGGDHAGVYQWRSPFFSAGVALFHPSASIFGFGHYGMAERFTSISIPGHMSLVTHNGMNDTTLDEGRIRRQKMNLIDDEAATKAVERHFPYLTPEARAVAGLPV\n>tr|A0A252DKQ5|A0A252DKQ5_9NOSO DNA polymerase III subunit gamma/tau OS=Nostoc sp. RF31YmG OX=1932668 GN=dnaX PE=3 SV=1\nMSYEPLHHKYRPKSFAELVGQEAIATTLTNAICSSKIAPAYLFTGPRGTGKTSSARILAKSLNCLGSGKPTAEPCGVCDVCQGITKGYSLDVIEIDAASNTGVDNIREIIEKAQFAPVQCRYKVYVIDECLTGDSLVLTDEGLLRIDDPNIKNKRVLSYNDSSEKWEFKQVVRWLDQGERQTLVIKTTKGEIRCTGNHLVRTDRGWVAAKDVKEGVKILSPVNVDAAASFTNLATVESVYLAGVEQVYDIEVEDNHNFVANGLLVHNCHMLSTQAFNALLKTLEEPPKHVVFVLATTDPQRVLPTIISRCQRFDFRRINLEAMVKHLSAIAHKENIQISLDAVTLVAQIAQGGLRDAESLLDQLALLSGEIIPDRVWDLVGSVSERDLLGLLDAIAQDHAEAVLDCTRNILNRGREPLTILQNLAACYRDLLIAKTAPNRHDLVACTQQTWQAFIGLAQKLDITTILAGQKHLREAEVQIKNTTQPRLWLEVTLLGLLPSANIPVQAASVAPRVSAPVVSPSQPPITSSPPAVASPPVSPLSPPANNISALKAVPSQPPETITVSQPPEEPQPLHPPVQPVTPAASPPVPELIEDTEADFTQVWQQVLSNIQQIPRRELLRQMCHLMEFDGAYARVGVKSAWYKKVQTDLQMITAAFQQTFQREVKVSLEIGNPSTSTSAKKESSANGSSKLKQPSPPSYDKQIPPPAPVQPTPTPAPTKTEPTPKGNSGVQTLPPPTPTTSGDWETDEVAIAAQRLAEFFQGQIIRLSDDAAAFSETMVGSDLLDESDLDDE\n>tr|A0A0B2USS7|A0A0B2USS7_TOXCA Cullin-4B OS=Toxocara canis OX=6265 GN=Cul4b PE=3 
SV=1\nMFRSTEEPGLILMEACDYSRKYLVEPPSNANFSSPVVSGRDLDGWDVGLEIFRDVIMNNDRVRMRTTSGIIKLIETEREGAQIDRQLVKSLLRMMSSLGIYQAVFERRFLETTTALYETEGRNLSRDLEVPAYLLHVKRRLDEESNRVDYYLDASTRKELMAVAEKSLIVDHMEAFIDKGVESMLSGNHCSDLKLMYSLLARTKNGLVLLKSAFAAYIKVCTDHIFASLMFTLLPGVESMLSGNHCSDLKLMYSLLARTKNGLVLLKSAFAAYIKVCTDHIGCGVESMLSGNHCSDLKLMYSLLARTKNGLVLLKSAFAAYIKKVGQAMVMDSARDKTLVADLLVMKSKLDNMLKSCFRNNEKFVQAEKDAFDYFINTRANKPAELVAKYLDSKLRSGNKESTDEELENLMDEVIVIFRFIQGKDVFEAFYKKDLAKRLLLGRSASVDAEKSMLSKLKQECGAGFTTKLEGMFKDMELSKDLAVAFKQYLDHGGPDRALQHSDGHIEFSVNVLTMGHWPSYEPMDVVIPPYLAEYQELFKRFYLSKHSGRKLQWQHSLAQVLLRAHFKPTVVKELQVSMFQALVLLLFNEKTEWAVEEISNATKIETNELERTLQSLACGKLRVLLKTPRGKDIKPKDRLTFNEECNDRLYRIRICQVQMKETAEEHSQTEEQIFQDRQYQIDAAIVRIMKTRKSLAHQLLISELFKQLRFSVKPIDLKKRIESLIEREYMCRDKDDCNTYNYVA\n>tr|A0A3R9XIK9|A0A3R9XIK9_9ACTN Uncharacterized protein OS=Streptomyces sp. WAC05374 OX=2487420 GN=E2B92_01640 PE=4 SV=1\nMDRSVWDGVERLRQWLDAKAAPATAGDVRLLRVLKIGEEYGEVAEALHGALGANPRKGASHTWQDVEQELCDVIVTSMVALATINGDGARLLDERVRHLVRRALPDEPA\n>tr|A0A0E1UTW8|A0A0E1UTW8_BURPE ATP-dependent endonuclease, OLD family OS=Burkholderia pseudomallei Pakistan 9 OX=595498 GN=BUH_4320 PE=4 SV=1\nMRLCRFEVRNFKCVEYASLEWEDLLVLIGENNAGKSTILSAIAAFLSGSAIKDPSLFRRHLTDVANAIELIGHFDGLSDEETTQVAVRGRMNGDRWVLKKRYWFEAGEDGESGGWKEALYSFSGAERFEGWPEADATWNAFPEEYQPLIAALPNRGVRPTNAARETLREAVRRQRPDLVAFGAPNWVPNPGGGGNWKSNANSILPRPILVRAVQEASDETNAKDASTYGKLVNLIVERSLAQRPEMVRLQEALDEVLALFRPDEANPQRQAQEVRDLQDRINRSLNEVVGGQALIRTEAPEIRSMVLPSTSLVIRDVEAGIDTDVGHQGHGLQRTLVITLLQSLADAQAQVVPGAALAPVRANILLIEEPELYLHPQMERLMRDVLYRLAEQASTQVACCTHSPVFLDIATKYRAIIRMFKTPQGDAAAHQVTQDLFPGQPLQADRQRLNTVARFDPTVNELFFAKRVVLMEEFSAIAAFERGAELMGLFERHLRLRREVSLVDCNGKSNIPAFQRVLNAFNIPYRVLHDEDPGNPAEQANNQNILALLVAGANQRHLVAPDLEGLLGYQAPRKNKPFLAVSTVEDLHAQGQLPAAFREAVCMAYFGQAVEPLPPP\n>tr|A0A5A7S8C7|A0A5A7S8C7_9NOCA TetR/AcrR family transcriptional regulator OS=Rhodococcus cavernicola OX=2495913 GN=FOY51_19370 PE=4 
SV=1\nMPRSGAETRSHLLKVAGELFYAKGIRATGVDLVAVEAGVAPTTLYRQFASKDDLVGSYVEGVDLAFRDRFASAIAAAGAEPRDQIFAIFDDAIAQAAQDHFRGCPAQMALAEYPDPASSAHANAVTAKSWLLNSIAAVTERLDVDDSVALARQLFVVWEGMLASTMSMGSTGPAQQSRRIVEALLPGE\n>tr|A0A3A5ZLU0|A0A3A5ZLU0_9BACE Inorganic phosphate transporter OS=Bacteroides sp. AF25-38AC OX=2292924 GN=DWY55_04125 PE=4 SV=1\nMELLVIIIVLALIFDYINGFHDAANSIATIVSTKVLTPFQAVIWAAFFNFVAFFIAKCVIGGFGIANTVSKTVMEPYITLPIILAGVIAAIAWNLFTWWKGIPSSSSHTLIGGFAGAAIMAHGFEAIQLSIILKIAAFIFLAPLIGMVVAFGFTLLVLYICRRAHPHTAEVWFKKLQLVSSALFSIGHGLNDSQKVMGIIAAAMIAGHSEGLGMGINSIDDLPDWVAFSCFTAISLGTMSGGWKIVKTMGTKITKVTPLEGVIAETAGAFTLYLTEYLKIPVSTTHTITGAIIGVGATKRLSAVRWGVTKSLMTAWVLTIPVSALLAAGIYCIVSLF\n>tr|D6CL53|D6CL53_THIA3 UDP-N-acetylglucosamine 1-carboxyvinyltransferase OS=Thiomonas arsenitoxydans (strain DSM 22701 / CIP 110005 / 3As) OX=426114 GN=murA PE=3 SV=1\nMDKLRITGQRTLQGVVQASGAKNAALPLIAAALLTAETVQLNNAPQLMDVRTLAKLLRSLGAQVEQDGGQIRLSAAAVNHYEASYELVKTMRASVLVLGPLLARFGQARVSLPGGCAIGARPVDQHIKGLQALGADIAVEHGYIVARVATPSGRLRGARITTDMVTVTGTENLMMAATLAEGETLIDNAAREPEIVDLANLLRAMGAQIRGDGTSQIRIQGVDALHGASHRIIPDRIEVGTFLCAALAARGDVTVQGAEPAHQDALLDKLREAGAQIDTGADWVRLRADALPGGRPRAVSVRTTEYPGFATDMQAQFMAVNCLADGAARMTETIFENRFMHVQELMRLGAQIDIDGHTCVVHGVPQLSGATVMATDLRASAGLVVAALAAEGETVIDRIYHLDRGYDAMEVKLRGLGAQIERISDRISGK\n>tr|A0A150TBH6|A0A150TBH6_SORCE Uncharacterized protein OS=Sorangium cellulosum OX=56 GN=BE18_01125 PE=4 SV=1\nMKTHDGYVALLASGGKRKLRANSLLAYGDEESRFKAAVLFHEAAEIERRALSLLEDAAPETRLRAAVERCACLVMGLDVVEAARAFREVEEASAAVPQETANAHRDRLDPLYFAARQDLTELLKRAPVLVSSRFRWEEIAETDRSRARAELDALLQRFPGESTFHLVDARAALDERRFDDLGRAVRRAHRLCPDNPLLRAYMLLVTAQSIAYPGSATTREEAEAELDTAYQELNREPADGVVYLGFMTASLAAFLAAFYAGEDAAEAHGRRARWAAEIAAQRRSIISEDIGKYIEAAGPLIELLTTQPQMLTAIIENTLREALLNSDVGRASGESLQQPKAASLIRGVISQASRWLTPSAELAELSELALAA\n>tr|H3BNA2|H3BNA2_HUMAN Coronin (Fragment) OS=Homo sapiens OX=9606 GN=CORO1A PE=1 
SV=1\nMSRQVVRSSKFRHVFGQPAKADQCYEDVRVSQTTWDSGFCAVNPKFVALICEASGGGAFLVLPLGKTGRVDKNAPTVCGHTAPVLDIAWCPHNDNVIASGSEDCTVMVWEIPDGGLMLPLREPVVTLEGHTKRVGIVAWHTTAQNVLL\n>tr|A0A7L4N192|A0A7L4N192_9AVES FA11 factor (Fragment) OS=Ceyx cyanopectus OX=390723 GN=F11 PE=4 SV=1\nSARTVRIVGGTDSSPGEWPWQVSLHVKLSRQRHLCGGSIISKQWILTAAHCITSLENLNIWRVYAGILKQSEINEDTPFFKVEEIIVHPQYKYAQTGYDIALMKLDKPMNFTDLQLPICLPSKEDANILYTNCWVTGWGYRKEKGRVQDILQKAAVPLMSKEECQARYRKRTIGDKVICAGYEEGGRDACK\n>tr|A0A373A0Y4|A0A373A0Y4_9ACTN DUF3117 domain-containing protein OS=Kitasatospora xanthocidica OX=83382 GN=DR950_28830 PE=4 SV=1\nMAAMKPRTGDGPLEVTKEGRGIIMRVPLEGGGRLVVELTPDEAQALGEALKKACG\n>tr|K9IQ04|K9IQ04_DESRO DNA polymerase subunit gamma-1 OS=Desmodus rotundus OX=9430 PE=2 SV=1\nMNRLLWKKVAGSTVVGPGPVPAPRRWASSSVSVPVSSNGQPQVRSSEGGQLRYNPLHIQMLSRGLHEQIFGLGAETPGEAAVRRSVEHLQKHGLWGQPDAPLPDVELRLPSLYGGDLDQHFRLLAQKQSLPYLEAANSLLQAQLPPRPPSWAWAEGWTRYGPAGEAEPVAIPEERALVFDVEVCLAEGMCPTLAVAISPLAWYSWCSRRLVEERYSWTSQLSPADLIPLEVPARTGSPAQRGQQEQLVVGHNVSFDRAHIREQYLVQGSLTRFLDTMSMHMAISGLSSFQRSLWMAAKQGKRKAQHDTQRAQKPRSKANGPVVSSWDWLDISSVNNLADVHSLYVGGPPLRKEPRELFVKGSMRDIRENFQDLMQYCAQDVWATYEVFQQQLPLFLERCPHPVTLAGMLEMGVSYLPVNQNWERYLAEAQSTYEELQWEMKKSLMDLANDACQLLSGERYKEDPWLWDLEWDLQEFKQKKAKKVKRKEPEATSPLPVEAAEAPGAPEDQEDPGPPSEEEESQRAVATRTCLEQLKGTTALLPKRPQHLPGHPGWYRKLCPRLDDPAWAPGPSLLSLQMRVTPKLMALTWDGFPLHFSERHGWGYLVPGRRDNLAHVPASTSPAPTGVTCPYRAIESLYSKHCLEQGKRQPEPQEAGLAEDFLLAEEWQMVEELGCLEVQAEAEVEPAEGAVAAQPPAPTGTGRPRGSQPAYHHGNGPYHDVDIPGCWFFKLPHKDGNSCNVGSPFAKDFLPKMEDGTLQAGPGGASGPRALEINKMISFWRNAHKRISSQMVVWLPRSALPRVVTRHPDYDEEGRYGAILPQVVTAGTITRRAVEPTWLTASNARPDRVGSELKAMVQAPPGYVLVGADVDSQELWIAAVLGDAHFAGMHGCTAFGWMTLQGRKSRGTDLHSKTATTVGISREHAKIFNYGRIYGAGQPFAERLLMQFNHRLTLQEAAEKAQQMYAFTKGLRRYRLSDEGEWLVRQLHIPVERTEDGFVSLRDLRKIQREASRKSRRKNWKVVAERAWTGGTESEMFNKLESIAMSDEPRTPVLGCRISRALEPSVAQGEFMTSRVNWVVQSSAVDYLHLMLVAMKWLFEEFAIDGRFCISIHDEVRYLVQEGDRYRAALALQIANLLTRCMFAYKLGLNDLPQSVAFFSAVDIDRCLRKEVTMDCETPSNPTGMERRYGIPQGEALDIYQIIELTKGSLEKRSQPGP\n>tr|A0A2N8M530|A0A2N8M530_9GAMM Short chain 
dehydrogenase OS=Alcanivorax sp. MD8A OX=1177157 GN=A15D_00345 PE=3 SV=1\nMKTVLITGAASGLGWALAQQAFALGYRVILADMNEVLLEARVEALAARDAERVTSRVLDVTNSDAVTLLVPWLEKHGGLDLLVNNAGITHRSLAEKTAMSVFQKVMAVDWQAPVELSVACLPLLKKSRGGIINIGSMAGWMPVLGRAGYCSAKSALGQFFEVMRGEVSRYGIHILMAYPSFLDTPIEKNALGHDGKPAAHARSMVGNMRTPEWMAEQVFEAYGKGRKRLFPDRFTWFASVLWRVAPDLYQRLMLRKFASELEQ\n>tr|A0A8A9J5M6|A0A8A9J5M6_SARS2 ORF1ab polyprotein OS=Severe acute respiratory syndrome coronavirus 2 OX=2697049 GN=ORF1ab PE=4 SV=1\nMESLVPGFNEKTHVQLSLPVLQVRDVLVRGFGDSVEEVLSEARQHLKDGTCGLVEVEKGVLPQLEQPYVFIKRSDARTAPHGHVMVELVAELEGIQYGRSGETLGVLVPHVGEIPVAYRKVLLRKNGNKGAGGHSYGADLKSFDLGDELGTDPYEDFQENWNTKHSSGVTRELMRELNGGAYTRYVDNNFCGPDGYPLECIKDLLARAGKASCTLSEQLDFIDTKRGVYCCREHEHEIAWYTERSEKSYELQTPFEIKLAKKFDTFNGECPNFVFPLNSIIKTIQPRVEKKKLDGFMGRIRSVYPVASPNECNQMCLSTLMKCDHCGETSWQTGDFVKATCEFCGTENLTKEGATTCGYLPQNAVVKIYCPACHNSEVGPEHSLAEYHNESGLKTILRKGGRTIAFGGCVFSYVGCHNKCAYWVPRASANIGCNHTGVVGEGSEGLNDNLLEILQKEKVNINIVGDFKLNEEIAIILASFSASTSAFVETVKGLDYKAFKQIVESCGNFKVTKGKAKKGAWNIGEQKSILSPLYAFASEAARVVRSIFSRTLETAQNSVRVLQKAAITILDGISQYSLRLIDAMMFTSDLATNNLVVMAYITGGVVQLTSQWLTNIFGTVYEKLKPVLDWLEEKFKEGVEFLRDGWEIVKFISTCACEIVGGQIVTCAKEIKESVQTFFKLVNKFLALCADSIIIGGAKLKALNLGETFVTHSKGLYRKCVKSREETGLLMPLKAPKEIIFLEGETLPTEVLTEEVVLKTGDLQPLEQPTSEAVEAPLVGTPVCINGLMLLEIKDTEKYCALAPNMMVTNNTFTLKGGAPTKVTFGDDTVIEVQGYKSVNITFELDERIDKVLNEKCSAYTVELGTEVNEFACVVADAVIKTLQPVSELLTPLGIDLDEWSMATYYLFDESGEFKLASHMYCSFYPPDEDEEEGDCEEEEFEPSTQYEYGTEDDYQGKPLEFGATSAALQPEEEQEEDWLDDDSQQTVGQQDGSEDNQTTTIQTIVEVQPQLEMELTPVVQTIEVNSFSGYLKLTDNVYIKNADIVEEAKKVKPTVVVNAANVYLKHGGGVAGALNKATNNAMQVESDDYIATNGPLKVGGSCVLSGHNLAKHCLHVVGPNVNKGEDIQLLKSAYENFNQHEVLLAPLLSAGIFGADPIHSLRVCVDTVRTNVYLAVFDKNLYDKLVSSFLEMKSEKQVEQKIAEIPKEEVKPFITESKPSVEQRKQDDKKIKACVEEVTTTLEETKFLTENLLLYIDINGNLHPDSATLVSDIDITFLKKDAPYIVGDVVQEGVLTAVVIPTKKAGGTTEMLAKALRKVPTDNYITTYPGQGLNGYTVEEAKTVLKKCKSAFYILPSIISNEKQEILGTVSWNLREMLAHAEETRKLMPVCVETKAIVSTIQRKYKGIKIQEGVVDYGARFYFYTSKTTVASLINTLNDLNETLVTMPLGYVTHGLNLEEAARYMRSLKVPATVSVSSPDAVTAYNGYLTSSSKTPEEHFIETISLAGSYKDWSYSGQSTQLGIEF
LKRGDKSVYYTSNPTTFHLDGEVITFDNLKTLLSLREVRIIKVFTTVDNINLHTQVVDMSMTYGQQFGPTYLDGADVTKIKPHNSHEGKTFYVLPNDDTLRVEAFEYYHTTDPSFLGRYMSALNHTKKWKYPQVNGLTSIKWADNNCYLATALLTLQQIELKFNPPALQDAYYRARAGEAANFCALILAYCNKTVGELGDVRETMSYLFQHANLDSCKRVLNVVCKTCGQQQTTLKGVEAVMYMGTLSYEQFKKGVQIPCTCGKQATKYLVQQESPFVMMSAPPAQYELKHGTFTCASEYTGNYQCGHYKHITSKETLYCIDGALLTKSSEYKGPITDVFYKENSYTTTIKPVTYKLDGVVCTEIDPKLDNYYKKDNSYFTEQPIDLVPNQPYPNASFDNFKFVCDNIKFADDLNQLTGYKKPASRELKVTFFPDLNGDVVAIDYKHYTPSFKKGAKLLHKPIVWHVNNATNKATYKPNTWCIRCLWSTKPVETSNSFDVLKSEDAQGMDNLACEDLKPVSEEVVENPTIQKDVLECNVKTTEVVGDIILKPANNSLKITEEVGHTDLMAAYVDNSSLTIKKPNELSRVLGLKTLATHGLAAVNSVPWDTIANYAKPFLNKVVSTTTNIVTRCLNRVCTNYMPYFFTLLLQLCTFTRSTNSRIKASMPTTIAKNTVKSVGKFCLEASFNYLKSPNFSKLINIIIWFLLLSVCLGSLIYSTAALGVLMSNLGMPSYCTGYREGYLNSTNVTIATYCTGSIPCSVCLSGLDSLDTYPSLETIQITISSFKWDLTAFGLVAEWFLAYILFTRFFYVLGLAAIMQLFFSYFAVHFISNSWLMWLIINLVQMAPISAMVRMYIFFASFYYVWKSYVHVVDGCNSSTCMMCYKRNRATRVECTTIVNGVRRSFYVYANGGKGFCKLHNWNCVNCDTFCAGSTFISDEVARDLSLQFKRPINPTDQSSYIVDSVTVKNGSIHLYFDKAGQKTYERHSLSHFVNLDNLRANNTKGSLPINVIVFDGKSKCEESSAKSASVYYSQLMCQPILLLDQALVSDVGDSAEVAVKMFDAYVNTFSSTFNVPMEKLKTLVATAEAELAKNVSLDNVLSTFISAARQGFVDSDVETKDVVECLKLSHQSDIEVTGDSCNNYMLTYNKVENMTPRDLGACIDCSARHINAQVAKSHNIALIWNVKDFMSLSEQLRKQIRSAAKKNNLPFKLTCATTRQVVNVVTTKIALKGGKIVNNWLKQLIKVTLVFLFVAAIFYLITPVHVMSKHTDFSSEIIGYKAIDGGVTRDIASTDTCFANKHADFDTWFSQRGGSYTNDKACPLIAAVITREVGFVVPGLPGTILRTTNGDFLHFLPRVFSAVGNICYTPSKLIEYTDFATSACVLAAECTIFKDASGKPVPYCYDTNVLEGSVAYESLRPDTRYVLMDGSIIQFPNTYLEGSVRVVTTFDSEYCRHGTCERSEAGVCVSTSGRWVLNNDYYRSLPGVFCGVDAVNLLTNMFTPLIQPIGALDISASIVAGGIVAIVVTCLAYYFMRFRRAFGEYSHVVAFNTLLFLMSFTVLCLTPVYSFLPGVYSVIYLYLTFYLTNDVSFLAHIQWMVMFTPLVPFWITIAYIICISTKHFYWFFSNYLKRRVVFNGVSFSTFEEAALCTFLLNKEMYLKLRSDVLLPLTQYNRYLALYNKYKYFSGAMDTTSYREAACCHLAKALNDFSNSGSDVLYQPPQTSITSAVLQSGFRKMAFPSGKVEGCMVQVTCGTTTLNGLWLDDVVYCPRHVICTSEDMLNPNYEDLLIRKSNHNFLVQAGNVQLRVIGHSMQNCVLKLKVDTANPKTPKYKFVRIQPGQTFSVLACYNGSPSGVYQCAMRPNFTIKGSFLNGSCGSVGFNIDYDCVSFCYMHHMELPTGVHAGTDLEGNFYGPFVDRQTAQAAGTDTTITVNVLAWLYAAVINGDRWFLNRFTTTLNDFNLVAMKYNYEPLTQDHVDILGPLSAQTGIAVLDM
CASLKELLQNGMNGRTILGSALLEDEFTPFDVVRQCSGVTFQSAVKRTIKGTHHWLLLTILTSLLVLVQSTQWSLFFFLYENAFLPFAMGIIAMSAFAMMFVKHKHAFLCLFLLPSLAAVAYFNMVYMPASWVMRIMTWLDMVDTSLSGFKLKDCVMYASAVVLLILMTARTVYDDGARRVWTLMNVLTLVYKVYYGNALDQAISMWALIISVTSNYSGVVTTVMFLARGIVFMCVEYCPIFFITGNTLQCIMLVYCFLGYFCTCYFGLFCLLNRYFRLTLGVYDYLVSTQEFRYMNSQGLLPPKNSIDAFKLNIKLLGVGGKPCIKVATVQSKMSDVKCTSVVLLSVLQQLRVESSSKLWAQCVQLHNDILLAKDTTEAFEKMVSLLSVLLSMQGAVDINKLCEEMLDNRATLQAIASEFSSLPSYAAFATAQEAYEQAVANGDSEVVLKKLKKSLNVAKSEFDRDAAMQRKLEKMADQAMTQMYKQARSEDKRAKVTSAMQTMLFTMLRKLDNDALNNIINNARDGCVPLNIIPLTTAAKLMVVIPDYNTYKNTCDGTTFTYASALWEIQQVVDADSKIVQLSEISMDNSPNLAWPLIVTALRANSAVKLQNNELSPVALRQMSCAAGTTQTACTDDNALAYYNTTKGGRFVLALLSDLQDLKWARFPKSDGTGTIYTELEPPCRFVTDTPKGPKVKYLYFIKGLNNLNRGMVLGSLAATVRLQAGNATEVPANSTVLSFCAFAVDAAKAYKDYLASGGQPITNCVKMLCTHTGTGQAITVTPEANMDQESFGGASCCLYCRCHIDHPNPKGFCDLKGKYVQIPTTCANDPVGFTLKNTVCTVCGMWKGYGCSCDQLREPMLQSADAQSFLNRVCGVSAARLTPCGTGTSTDVVYRAFDIYNDKVAGFAKFLKTNCCRFQEKDEDDNLIDSYFVVKRHTFSNYQHEETIYNLLKDCPAVAKHDFFKFRIDGDMVPHISRQRLTKYTMADLVYALRHFDEGNCDTLKEILVTYNCCDDDYFNKKDWYDFVENPDILRVYANLGERVRQALLKTVQFCDAMRNAGIVGVLTLDNQDLNGNWYDFGDFIQTTPGSGVPVVDSYYSLLMPILTLTRALTAESHVDTDLTKPYIKWDLLKYDFTEERLKLFDRYFKYWDQTYHPNCVNCLDDRCILHCANFNVLFSTVFPLTSFGPLVRKIFVDGVPFVVSTGYHFRELGVVHNQDVNLHSSRLSFKELLVYAADPAMHAASGNLLLDKRTTCFSVAALTNNVAFQTVKPGNFNKDFYDFAVSKGFFKEGSSVELKHFFFAQDGNAAISDYDYYRYNLPTMCDIRQLLFVVEVVDKYFDCYDGGCINANQVIVNNLDKSAGFPFNKWGKARLYYDSMSYEDQDALFAYTKRNVIPTITQMNLKYAISAKNRARTVAGVSICSTMTNRQFHQKLLKSIAATRGATVVIGTSKFYGGWHNMLKTVYSDVENPHLMGWDYPKCDRAMPNMLRIMASLVLARKHTTCCSLSHRFYRLANECAQVLSEMVMCGGSLYVKPGGTSSGDATTAYANSVFNICQAVTANVNALLSTDGNKIADKYVRNLQHRLYECLYRNRDVDTDFVNEFYAYLRKHFSMMILSDDAVVCFNSTYASQGLVASIKNFKSVLYYQNNVFMSEAKCWTETDLTKGPHEFCSQHTMLVKQGDDYVYLPYPDPSRILGAGCFVDDIVKTDGTLMIERFVSLAIDAYPLTKHPNQEYADVFHLYLQYIRKLHDELTGHMLDMYSVMLTNDNTSRYWEPEFYEAMYTPHTVLQAVGACVLCNSQTSLRCGACIRRPFLCCKCCYDHVISTSHKLVLSVNPYVCNAPGCDVTDVTQLYLGGMSYYCKSHKPPISFPLCANGQVFGLYKNTCVGSDNVTDFNAIATCDWTNAGDYILANTCTERLKLFAAETLKATEETFKLSYGIATVREVLSDRELHLSWEVGKPRPPLNRNYVFTGYRVTKNSKVQIGEYTFEKG
DYGDAVVYRGTTTYKLNVGDYFVLTSHTVMPLSAPTLVPQEHYVRITGLYPTLNISDEFSSNVANYQKVGMQKYSTLQGPPGTGKSHFAIGLALYYPSARIVYTACSHAAVDALCEKALKYLPIDKCSRIIPARARVECFDKFKVNSTLEQYVFCTVNALPETTADIVVFDEISMATNYDLSVVNARLRAKHYVYIGDPAQLPAPRTLLTKGTLEPEYFNSVCRLIKTIGPDMFLGTCRRCPAEIVDTVSALVYDNKLKAHKDKSAQCFKMFYKGVITHDVSSAINRPQIGVVREFLTRNPAWRKAVFISPYNSQNAVASKILGLPTQTVDSSQGSEYDYVIFTQTTETAHSCNVNRFNVAITRAKVGILCIMSDRDLYDKLQFTSLEIPRRNVATLQAENVTGLFKDCSKVITGLHPTQAPTHLSVDTKFKTEGLCVDIPGIPKDMTYRRLISMMGFKMNYQVNGYPNMFITREEAIRHVRAWIGFDVEGCHATREAVGTNLPLQLGFSTGVNLVAVPTGYVDTPNNTDFSRVSAKPPPGDQFKHLIPLMYKGLPWNVVRIKIVQMLSDTLKNLSDRVVFVLWAHGFELTSMKYFVKIGPERTCCLCDRRATCFSTASDTYACWHHSIGFDYVYNPFMIDVQQWGFTGNLQSNHDLYCQVHGNAHVASCDAIMTRCLAVHECFVKRVDWTIEYPIIGDELKINAACRKVQHMVVKAALLADKFPVLHDIGNPKAIKCVPQADVEWKFYDAQPCSDKAYKIEELFYSYATHSDKFTDGVCLFWNCNVDRYPANSIVCRFDTRVLSNLNLPGCDGGSLYVNKHAFHTPAFDKSAFVNLKQLPFFYYSDSPCESHGKQVVSDIDYVPLKSATCITRCNLGGAVCRHHANEYRLYLDAYNMMISAGFSLWVYKQFDTYNLWNTFTRLQSLENVAFNVVNKGHFDGQQGEVPVSIINNTVYTKVDGVDVELFENKTTLPVNVAFELWAKRNIKPVPEVKILNNLGVDIAANTVIWDYKRDAPAHISTIGVCSMTDIAKKPTETICAPLTVFFDGRVDGQVDLFRNARNGVLITEGSVKGLQPSVGPKQASLNGVTLIGEAVKTQFNYYKKVDGVVQQLPETYFTQSRNLQEFKPRSQMEIDFLELAMDEFIERYKLEGYAFEHIVYGDFSHSQLGGLHLLIGLAKRFRESPFELEDFIPMDSTVKNYFITDAQTGSSKCVCSVIDLLLDDFVEIIKSQDLSVVSKVVKVTIDYTEISFMLWCKDGHVETFYPKLQSSQAWQPGVAMPNLYKMQRMLLEKCDLQNYGDSATLPKGIMMNVAKYTQLCQYLNTLTLAVPYNMRVIHFGAGSDKGVAPGTAVLRQWLPTGMLLVDSDLNDFVSDADSTLIGDCATVHTANKWDLIISDMYDPKTKNVTKENDSKEGFFTYICGFIQQKLALGGSVAIKITEHSWNADLYKLMGHFAWWTAFVTNVNASSSEAFLIGCNYLGKPREQIDGYVMHANYIFWRNTNPIQLSSYSLFDMSKFPLKLRGTAVMSLKEGQINDMILSLLSKGRLIIRENNRVVISSDVLVNN\n>tr|A0A2S2NUK6|A0A2S2NUK6_SCHGA Uncharacterized protein OS=Schizaphis graminum OX=13262 GN=g.56950 PE=4 SV=1\nMPYSIGSGFTRYTVGPSVRDVFGENEKIVFIIKLFAEYPAPKRSRDAFRLLSNGDIFFSTVVKNHFSGYRFLSMKNMKLCEKKYQRLSECVLEKRGSCEATSKTVKKNK\n>tr|A0A438P4J0|A0A438P4J0_HELPX DEAD/DEAH box helicase OS=Helicobacter pylori OX=210 GN=ECB92_03930 PE=4 
SV=1\nMELNQPPLPTEIDDDAYHKPSFNDLGLKESVLKSVYEAGFTSPSPIQEKAIPAVLQGRDVIAQAQTGTGKTAAFALPIINNLKNNHTIEALVITPTRELAMQISDEIFKLGKHTRTKTVCVYGGQSVKKQCEFIKKNPQVMIATPGRLLDHLKNERIHKFVPKVVVLDESDEMLDMGFLDDIEEIFDYLPSEAQILLFSATMPEPIKRLADKILENPIKIHIAPSNITNTDITQRFYVINEHERAEAIMRLLDTQAPKKSIVFTRTKKEADELHQFLASKNYKSTALHGDMDQRDRRASIMAFKKNDADVLVATDVASRGLDISGVSHVFNYHLPLNTESYIHRIGRTGRAGKKGMAITLVTPLEYKELLRMQKEIDSEIELFEIPTINENQIIKTLHDAKVSEGTISLYEQLTEIFEPSQLVLKLLSLQFETSKIGLNQQEIDAIQNPKEKTPKPSNKKTQHEPARSFKKGHYREKGSKTNHHSKKPKRR\n>tr|A0A5D4XPJ5|A0A5D4XPJ5_9GAMM Uncharacterized protein OS=Luteimonas sp. XBU10 OX=1132694 GN=FZO89_00285 PE=4 SV=1\nMKAVAVSTVLLSSSLTAFAAMPEQVQFVGSIQHDDLTPVTFDLHLPSKQSATLKLADGSTLELVTPGGQASPDGARIRLLSPAGEIMHAATVPDPSLASTSFAYRICDGQVTYMSPAPAVVPDCGA\n>tr|A0A0W0TLV5|A0A0W0TLV5_9GAMM MFS domain-containing protein OS=Legionella geestiana OX=45065 GN=Lgee_2174 PE=4 SV=1\nMHTEKNKHYMWYAWFVCALGAVFYSYEYFLRISPSVMEEALRAHFELNSAGFGKLSAFYYYAYVPMQLPVGILMDRYGPRRLLTIACMICVLGTWMFAGTSVFWVAASGRFLVGLGSAFAFVGVLKLATLWLPEDRLALVSGLATALGTIGAMLGDNILGALVDSAGWQQTVNLTAISGILLVLVLWLGLRDHPDSDEESGSIENFRQSIRDLCIIARNRQIWINGLYGCLVYLPTTVLAELWGIPYLQHAHGMTRSNADFANSLLFLGFTVGAPMMGFLADKLHRRKLPMMTGALGAVIVMSIILYMPGLTAMQINVLMVLLGLLYGAQAIVFAVGRELSPDEAAGTAMAMTNMIVMLGAMFLQPLVGYLLDWSGDYRIALSVIPLGMLIAAVLVFFLKETHAHAPQ\n>tr|A0A556AMN3|A0A556AMN3_9BURK Putative glutamate--cysteine ligase 2 OS=Verticiella sediminum OX=1247510 GN=FOZ76_12590 PE=3 SV=1\nMHAIEFTPSRYNTLGIELELQLLDPRTLDLSGQAASLLEHIAGHPSADHVKPELTRAMIELNSSVHEHPAGLLAEMRELRDLVCEAGDAIGVRVAGGGAHPFTSWRDCDIHDSPRYRRLADLYGYLARQFTVFGQHIHLGVASGDAACGLIHRLSPYVPHFIALAASSPFREGEDTLFACSRLHALHSFPLAGHMPEHIRDWYQFEAHYTQMRSLGLTESLKDLYWDIRPKPELGTVELRVCDTPLTVEKACQLAAFAQALAIAVQRASAPTAAFWMAYETNRFQACRFGLHANYVTRAGERVRLIEHLRGTFEQLMPVADELGTTDLLGALREDALRLGNDARWLRARHHELRELPAVAAAAADVWRGEPAGAAQAGPGRRRVRASSEPIVHGLPLLPEGTPANLPPRLH\n>tr|L7JZ93|L7JZ93_TRAHO Uncharacterized protein (Fragment) OS=Trachipleistophora hominis OX=72359 GN=THOM_0239 PE=4 
SV=1\nVHPVSPSDVVGLTMLICKTMMGFMGLRERVTSSHMVGPEGHELDLGITGPKFRRDTFITDIEVFAGLFSLTMPFPEPERVKCFNKHIDRSLFVKKFDSSRCEVDMQALVLYIDDFYTACRVTSSLCKYALGFISLCMRPEYGDFGSILSDSPTSLFVELEKFKATGMGSAPACALREPSDFLLWYDRLCSLRALFVNYLTTRNGRFRGLVEMCRIAKEVEKDIEKLESEYNAYLDSQEGFVQDYFRTWGLVGGRGPLFIHSVPMIDVYQACTDKFKNKVNSLVARDDSPVVALMQNLRENGGVLPPDLVERRERFWEWQKKIKKEQKPMRVPINDLLLEFQSEDSGAFVFERQMTFMNLHQAIIERVARCWLNSSLYNDDQSMCNMQ\n>tr|A0A6A1VVY6|A0A6A1VVY6_9ROSI Peptidyl-tRNA hydrolase ICT1, mitochondrial OS=Morella rubra OX=262757 GN=CJ030_MR4G021223 PE=4 SV=1\nMAIMRTTTSVILRGVVHLPSFSVSRFSALPGVGGTIGYTHRGISFGRIQCAASDSGDGRKVSARLSQVQQLLQEAEERALSADDEPTPKITIALLLRPEDVALVPYSISPVWSWKKRGKGPRGGQNSSTNSCIAWSFERVVTAKSYIGTVIGQQRFQPTFGWITDNYEAQLHFLYFWLFDWLDDSTIGSLQIIWLDHVTVNFARSGGPGGQNVNKVNTKVDMRFNVKSADWLSDRIKEKIIQMEKNRINKDGELVISSTKTRTQKGNIQDALEKLQVLKTPHCIRPYLYSVLEAIIDAASYVPPPPTEEQKKKIAKLAAIGEQKRLKSKKVLSEKKAFRRSRDSWD\n>tr|A0A2D5SZF1|A0A2D5SZF1_PSEAS Methyltransferase OS=Pseudoalteromonas sp. OX=53249 GN=CMK64_03795 PE=4 SV=1\nMSVCGLCGSDELQPYHQDKRRRYLQCTQCALVIVDERDRLSPEDEKAIYDTHENSLHDEGYRRFLSRAFEPTVERVPSHSKGLDFGCGPGPLLAEMFKEVGFEMACFDLFYANEPEVLTKTYDFVTCTEVIEHLSQPGEVLAKLLSLLDAGGPLVLMTKLIIDQNRFAQWHYKNDLTHIVFFSRETFNYVAAHFDCQVEFIGNDVIVLTKSKK\n>tr|A0A091NFS5|A0A091NFS5_9PASS Leucine-rich repeat-containing protein 45 (Fragment) OS=Acanthisitta chloris OX=57068 GN=N310_05272 PE=4 SV=1\nGVKLLLHGLCSNTTVKSLDLKGNNLRTVGAEALGKLLRQNKSIRSLTLEWNSLGMWEEGFSFFCQGLGANNFLQRLDLRNNQINHQGAAELAMALTQNDSLQELDLRWNNIGLLGGRALLNCLQSNRTLKKLELAGNNVPGDILKAVEQALDHNRDRETILSEAQNQVSILSKEVMSLKDEKNKQFLDLMDTVDKQKEEKARSERMSAAQISQLQEALDEHYSIVNSLKAKLQMTEAALALSEQKVHNLGELLNAMKQEQTSVAESHFKELQQQRQESADREDKLLHDLSAASEKNLLLRNQVGNQVLGREDQLFQVKQDLTNTTAELKLRAVQAEERLEMEKRRFKQSLEDMESLRVKEVDHMTQHIEASERSMQDRIQRLEAIRISLEEELSQVKAAALAERGQAEEELMKVRSQARLEEQQRLEHLEEKLRLMTESRDEAQNCCLKQKEMVAEAQARAKQCSMQADGLRRRLEELQQDLNRKEEEKVTEVNKVKVELQEQIGHLQAERTAQDGLREKIAALERQLKALSNNHREALLDKEGEMSLLLEKLRMKEAEISRMREEEAQRASFLQNAIMAYVQGSPLGTHSSRK\n>tr|A0A817VJW3|A0A817VJW3_9BILA Hypothetical protein 
OS=Rotaria sp. Silwood1 OX=2762511 GN=CBO169_LOCUS792 PE=4 SV=1\nMAYVCSPQHCYQKNLSREKNSSDPSLVVHVNKFDIVPKVLNDYTYRTEVYLQQREKQNIDKTSSSSTSATITTWKILKYQKEMLKNDQAEIDRALSTINSIHEIFNRSASIPYNQVYSSLYGDNNKSDHLMKTFCRCQNHFRKEDDDNHIQTISSSFVNFEDTDSDLDYNEDEEEKKKTYDSGYETFKLIPIDVDLHTQKNMEEHSTNHYDIPGLVLRRGQSFSFTVTFNKDYDIEQNQLYIRLAIGPRSMISKRTQIRLLVDGTPSGNGWSAKSIPIEDDDVKTKKKNCISLQINSPSDAIIGKYTLLLEVCPSKNDDKKFLNKQDPTLFLIEADLYFLFNPWNKDDACALSSSEQINEYVMNEHGQIYLGTSNKPQPIPWYFGQFERSTLLTALTLLDKAKLPAQNRIDPSIIIRILSSKICSNPGTNNGIFPSSYDTKVYSSENHGYTSSTGIFKQYLLSNCRSVQGGCGNNWQHAAILCSLSRSLGIPCRIVTIYNAACQTDGTEDNDTHWDTKQRPLHKLNFDLICSSHVWNECWMRRHDLPNDEQDWQIVDSTPVQMCDGIRRTGPCSVSSLKNDKLSFRWDSPFIHSTINGKKSHWIVYPDGHMELLDVQENIVGTKIITRSLDNEFEPSDITKNYKNLMKTYNKYDNITERINNDVDIELKIPDNIEFGDDITFELNANNKSNEIRTIATALTISILSNNDQKLIVSHDQPVQTLNLEAEKNDHIQLKVTSKQYASYGKQENIILKYYIHSLIKETDQTFTRDDNIVFNKYDIIKPILDDDVIEIGKPVLLKILIANTLSHPINSGQIYIDGLGINQIVHVNRSFAPKESTTLHIKLYPTRIGVSRLYVTFISNNVSSSTQTIPLEIIREPIKQQHERINAQEEPLLTTNTETSAETDEKIEIPSKEDKLVTQSNISDRQDETLIHEEEQHPLVQSPSSLSSSINIADEYQDDRTSNISQPKFELSTTEDDDDDIAELNLKKNQDESSPNPNTSSSLPHDSTLSLEKDKISVDSLDIAHDRRYGTNNNQ\n>tr|A0A819KK27|A0A819KK27_9BILA Hypothetical protein OS=Adineta steineri OX=433720 GN=JYZ213_LOCUS36401 PE=4 SV=1\nMELNKDNGSWIIHVTFKMGLVYMKWGRYDSAIRHFQGVLDYSSSIQSFPLEVIATFHEHLAMAYEKQRKYKEALNHWEKLLEIQTKIFEPFSIEIADTYLSMAENYLMLLEFGRVIEMWHKVKSVHLNPLSPNYNAASFLFNQMENPDTSSPEYIKTLLLQLRSHSASVKLKAQPSYISEKTEL\n>tr|A0A2P1NJ72|A0A2P1NJ72_9BURK GP-PDE domain-containing protein OS=Pulveribacter suum OX=2116657 GN=C7H73_05065 PE=4 SV=1\nMKRRAVFALLAGATLAACGGGGDDLEPDQSRPIVIAHRGASGYLPEHTLGGYELAMRLGADYIEPDLQLTRDGALVAMHDETLERTTNVAALFPPRSGGYKVADFTLAEIKTLAVKPTGTGKASYPGFAPGSATPWSVPTFDEVIRLAQSSRSLVGREVGIYPEAKQADPAMEDAILKALVQGGYSARSRVFIQSFSDQTLRSMHVKAQAQGNPLPQILLGAAVMGADGVARLGVIGQAAQPVLLTFKDVASFAQGVGVVINASAYPITKAYIDQAHAVGLKVHGWTFAQPEAGAAAAEYRRYLELGMDGMFSNYPDLAVKARDQYVRERQADWGARGPAHPH\n>tr|A0A7J2PPS0|A0A7J2PPS0_9ARCH Uncharacterized protein OS=archaeon OX=1906665 GN=ENH77_08385 PE=4 
SV=1\nMTLRSRNESKINRFRALNNFLQNKYIILVFIGHKNQIDQTSTVIDVVDEFKIGSRYAYKLLEELESGRFIIKKAKVLKHGIYYSNYIITETAKSELREILKIITSIL\n>tr|A0A6T8JG47|A0A6T8JG47_9STRA Hypothetical protein OS=Proboscia inermis OX=420281 GN=PINE0816_LOCUS10274 PE=4 SV=1\nETGLLVDMDPSDQEKAGENLASALQGLLEEPERAIRLGKRGHAHVTERFGLEPFRREWNEIVTGAIPKGATRVSLRAAKNSANSVKQRMRTLARLLAFVAVVYQYGGEGLAVIQRKAAEHFKVIGTILRMVVALIAVMAIRYRS\n>tr|A0A6P7FQQ6|A0A6P7FQQ6_DIAVI farnesol dehydrogenase-like OS=Diabrotica virgifera virgifera OX=50390 GN=LOC114332982 PE=3 SV=1\nMVLSMKRWIGKVAVVTGASSGIGAAVAKQLVEEGLLVVGLGRRKEKIESLGNRLSGKQGKLFAVKADLTKEDDIKQAFKWATENVGPISILINNAGTHIRTGLLDGDTEAWKTTINVNLLALCIATREAIQSMRKNSIDGHIIHINSFLGHNVAPLPDLDVYPATKYGVTALTETLRVELNSFNLKTKITSISPGFVDTEIIADMKNNEEFKRNVPNLLNPEDIADGIIYALSTPPHVQVHELTIKPLGEKY\n>tr|A0A2G2QTX8|A0A2G2QTX8_9GAMM Heptose kinase OS=Porticoccus sp. OX=2024853 GN=COB19_03790 PE=4 SV=1\nMSCWFVDRAILSEAAAERFSSLDSVFATTGRRVTRCPISELILTEIGEKSYYVKRYSRRGKVIRRWLGRSRVRAEWENLLFFRGLGLRVPPIAAYGESGARGVLITEEVPGAIDLHSLVRQRPELLRDRNWLDQVVVQVADVAKQLHANSFAHNDLKWRNILVAGEVTPEVYLIDCPMGQTWWGPLLAYKKIKDIACLDKVAKYCLNRTVRLRFYLHYVGRDRLTAADKTFIRKVLAFFAGRE\n>tr|C7GZL0|C7GZL0_9FIRM Uncharacterized protein OS=Eubacterium saphenum ATCC 49989 OX=592031 GN=GCWU000322_00425 PE=4 SV=1\nMGYDDFFMDIGALFVVLIVAFLGNGLGEFSFKYVAREVFILALLSTAGAFVWTLILAYLKYKRSNNKSK\n>tr|A0A4S1VTE3|A0A4S1VTE3_ECOLX 4-aminobutyrate aminotransferase OS=Escherichia coli OX=562 GN=gabT PE=3 SV=1\nMSSNKELMQRRSQAVPRGVGQIHPIFADRAENCRVWDVEGREYLDFAGGIAVLNTGHLHPKVVAAVEAQLKKLSHTCFQVLAYEPYLELCEIMNQKVPGDFAKKTLLVTTGSEAVENAVKIARAATKRSGTIAFSGAYHGRTHYTLALTGKVNPYSAGMGLMPGHVYRALYPCPLHGISEDDAIASIHRIFKNDAAPEDIAAIVIEPVQGEGGFYAATPAFMQRLRVLCDEHGIMLIADEVQSGAGRTGTLFAMEQMGVAPDLTTFAKSIAGGFPLAGVTGRAEVMDAVAPGGLGGTYAGNPIACVAALEVLKVFEQENLLQKANDLGQKLKDGLLAIAEKHPEIGDVRGLGAMIAIELFEDGDHSKPDAKLTADIVARARDKGLILLSCGPYYNVLRILVPLTIEDAQIRQGLEIISQCFAEAKQ\n>tr|A0A4U1G485|A0A4U1G485_9SPHI Methyltransferase domain-containing protein OS=Pedobacter sp. 
RP-1-16 OX=2572196 GN=FBD94_20505 PE=4 SV=1\nMNQELEIIRDQQQEVWNKFSAGWKKWDTLTMDFLKPVGDEMIRLLNPKGNDMVLDIASGTGEPGLTIASMLTNGKVTLTDLSADMLEIARENGADRGIKNIETIVCDVCELPFEDHTFDVISCRFGFMFFPDMLLAIKEMARVLKPGGRIATAVWNIPEKNFWVTASMGVIRKNMDIPVPPPEAPGMFRCAEAGMMSDLFKQAGLINISEKEVAGKMNCGTTDTYWNLMTDVAAPVVAALSKADQATKDKIKAEVYETINQKYADGDVVIDSSAIVIYAEK\n>tr|A0A6G2IRX0|A0A6G2IRX0_STREE PTS fructose transporter subunit IIA OS=Streptococcus pneumoniae OX=1313 GN=GRB29_07185 PE=4 SV=1\nMKYLILVSHGGFAQGLKTSLAMFAEDKMDQVIALGLKNGSSVDDFAKECHQAVDHLTEEDTVIVLADIVGGSPLTTALTVLEEKGKLDTTVVLGGMNLPMALTSVVMKDDLEGDDFVAAVLPEASAALQEFKVATTTDNDEDDDI\n>tr|A0A847WTI5|A0A847WTI5_9BACI Geranylgeranylglyceryl phosphate synthase family protein OS=Amphibacillus sp. OX=1872500 GN=GX972_07265 PE=4 SV=1\nKQFGSMIDWSELTTEGYVILNPEAKAYQLTNCYLPDREDVIAYAQMAEQMFNLPILYLEYSGTYGDPELVRQVKQHLNKTQLVYGGGITTLEQAKEMAQYADTIVVGNSLYDNFAEAIETVHVKE\n>tr|A0A7W5HC73|A0A7W5HC73_9BURK Uncharacterized protein OS=Massilia umbonata OX=864828 GN=FHS02_002507 PE=4 SV=1\nMVHEEARPPQAARLPLPAPVVAQEIASPPQAAELPLPLPVVVHEMALPPHAAALPVPLPVVVQDIASPPHAASLPAPLPVVVQERARPPHAALLPTPLPVVVQEIARPPQSAWLPAPLPVDAQLIAIPPHAARFPGPEPVVMHDIARPPHAAQLPGPLPVVVQVAARPPQAA\n>tr|A0A085DW41|A0A085DW41_9GAMM Uncharacterized protein OS=Halomonas sp. 
SUBG004 OX=1485007 GN=DK37_25465 PE=3 SV=1\nMSLHQDLIERDRKVTFHASTHLRDFAHGDAPGRVITGGKGIHIVDKDGREFIDGFAGLYCVNIGYGRTEVAEAIYKQALELSYYHTYVGHSNEPQIELSERVLKIAGLNMSKVYYGMSGSDANETQLKIVRYYNNVLGRPQKKKVISRMRGYHGSGIASGSLTGLKAFHDHFDLPIDTIRHTEAPHYYLRAAEQHGLTELEFSAYCADKLEAMILEEGPDTVAAFIGEPVLGTGGIVPPPEGYWEAIQPVLDKYDVLLIADEVVCGFGRTGSDFGSHHYNMKPDLITIAKGLTSAYQPLSGVIVGDKVWKVLEQGTGEYGPIGHGWTYSGHALGCAAGLANLDIIERENLVGNAAETGAYFQQQLKATFEGHPLLGDVRGVGLMAALEFSPDAKQRLHFDPTLKVGPRVAAAAMEENLIARAMPQGDILGFAPPLTINRGEVDEMIGRAKRAIDRVTDELVRAGDLKTGQQEAAFTI\n>tr|A0A6A3RIU8|A0A6A3RIU8_9STRA Uncharacterized protein OS=Phytophthora fragariae OX=53985 GN=PF001_g20766 PE=4 SV=1\nMANLIKPITSGHDLIALAAKCDLTTDAVLDSTEVTKPLPHDKTYLILQRPADMDIGHWTCVHNGKYFDSMGEGPPTK\n>tr|A0A2A2IY53|A0A2A2IY53_9PSED Cell division protein ZipA OS=Pseudomonas sp. HAR-UPW-AIA-41 OX=1985301 GN=zipA PE=3 SV=1\nMDIGLREWLIVIGIIVIAGILFDGWRRMSGNKGKLKFRLDNSFGNLPDEDVDPNLLGPVRVKEKHAEPQLDEHDLPSMTATDGGKKRSEPFQGDLSLDEPVPTLLNPVDDEVKSESPREQVPVDEVLVINVIARDPEGFKGPALLQNILESGLRFGEMDIFHRHESMAGNGEVLFSMANGVKPGTFDLDDIDLFSTRAVSFFLGLPGPRHPKQAFDLMVAAARKLSSELNGELKDEQRSVMTAQTIEHYRQRIADHERRKLTQKR\n>tr|A0A2M9EG28|A0A2M9EG28_9GAMM Efflux transporter periplasmic adaptor subunit OS=Xanthomonadaceae bacterium NML95-0200 OX=2032577 GN=CO610_06720 PE=3 SV=1\nMSSQLRPNPPKRRGFWMPAIVIAVLAAGALWWWQGKRSGSDEGAFRTVQIEQGDIRVAISATGTLSAISTVTVGSQISGQVTEVLVDFNSPVKKGDVLARIDPSTYRAQIAQGDAAIASAQAVLRQAEANLRNVRADFSRKNELGAQQLVSRSDVDSARASLEQAEAQVNVARAQIRQQTANTQTTRLNLERTVIRSPVDGVVLMRKIEPGQTVAASLQAPELFTIAEDLSKMKIELGVDESDIGQVKAGQGVSFTVDAFPNRQFRGVVEQVRLAATTSNNVVTYPVVVTVDNSDGTLLPGLTVNAEIEVSKREGVLKVANAALRYKPSEATQALLGEAAASGGSGNARRGMSEKLPKIAAGLRLQPAQQQVFDEALAAMRAAQAERQGATRSGNGSAGGPPMMMRSGSAPDPAMMAQIRARMRERMQRQFAQFRSTLDDEQRAQWDSAMDALLNSNRAPLYLLVDGRPRRVMARIGASDGSSTEISGDFRAGDAVISGERAASSAR\n>tr|A0A2D7G1K4|A0A2D7G1K4_9GAMM Uncharacterized protein OS=Gammaproteobacteria bacterium OX=1913989 GN=CMP96_10680 PE=4 SV=1\nMDLLKELFSFLRARKKLWLAPIILIMVALGGLLVIAEGSVLAPFIYTLF\n>tr|A0A5E4IWU6|A0A5E4IWU6_9ARCH 
Protein-synthesizing GTPase OS=uncultured archaeon OX=115547 GN=eif2g PE=3 SV=1\nMPQAEFNVGVVGHVDHGKTTLTSALTGKWTDTHSEELKRGITIKLGYADVVFKQCTRCGFSSTKERCPKCGAPTQATRKIAFLDAPGHETLMATVIAASSIMDGALFVIAANEKCPQPQTIEHLMILEAAGIKNVVIAQNKVDLVTRQQALEHYKQIREFLKGTTYENAPIIPTAANSGGNLDSLVSALLETIKPVPRESGKTRMLVARSFDVNKPGTNVEKLYGGIVGGSIVSGVLKNGEEVRILPGALRTHKGKEHYQELSTKIVGIRVGDETLEEAKPGGLVALATTLDPSLTGADVLVGCLLFPAKDEPPVVYQTFSLEITPLSRLLEKFPSSFTPNEPLVLGVGTATTVGFVTKQKKKICELMLKKPVCASKTDVIAVMRRANNRWRLYGTAKLVS\n>tr|A0A209CHN7|A0A209CHN7_9ACTN Flavin reductase OS=Streptomyces sp. CS057 OX=1982764 GN=B9W61_33485 PE=4 SV=1\nMTATPDLAPAPTAATPELFRSVFRRHAAGVAVITAAGERPVGFTATSLTSVAAEPPLISFGVGTSSSSWPVLSEAAYVGVHILGEHQHELAATFARSGADRFGPSTEWSSGPEGVPLLAGVSAWLVCRVVTRVPAGDHRIVIAEAVSGAPSGAARPLVYHQGRFTALRD\n>tr|A0A1A7C0Q9|A0A1A7C0Q9_9BURK Porin OS=Janthinobacterium psychrotolerans OX=1747903 GN=ASR47_1005274 PE=4 SV=1\nMPIMKKSPLSLRAHQGASLLFLAISGTAAQAASLPEWTLGGFGTAGLVHSSERQADYSANVINRGGAGRTDRWSGSVDSRLGAQLGVEFTPRWSAVLQVIAEHNLQNSWLPVVEWANLKYQATPELSLRLGRIALPIYLAGDYRKPGYALEWVRPPVEVYGSLPVSNSDGVDASYRWQAGATNNLTQVFYGHTSIETDDGGKRARGRQLAGLSNTTTYGALTIRASALTAELTVDLVRPLFDAFRQYGLRGGQIADRYDADHKRVAIANLGVSYDTGDWFLQAEGSRLNTRSFLGDKSSMYLGGGYRLGAWTPYATYAKVKANVPNRDAGIDSAQPGAAYLNGQLNALLQRISSQHTISTGVRWDFLPDRAVKLQYDRLRPTGASSGTLVNVQPGFRTAHPIHVVSIALDFVF\n>tr|A0A124SC33|A0A124SC33_CYNCS Homeobox domain-containing protein OS=Cynara cardunculus var. 
scolymus OX=59895 GN=Ccrd_005381 PE=3 SV=1\nMEVARFEDEQQHKNKFFGFNSMSQDYIFNFSHGFERPSQDQQQQNHISHQIRRDKLRVQDFEPPAPASLVGLEQVDEGTGGAGGINPAVYETGAGMLSEMFNFPTGGPATELLENQINYQHHRNQRPNSATGDWYGNSTAQAMQLFLMNPSHESPSSQSSSHHHHHHNSSTSSSTLHMLLPNTVPSSTSTLHHQQSFGSTSGSGQGQFGPSTQFAWIPPGGTTHEGGGGGGDSHGLSLSLSSTLQHLEAAKVEELRIGDDPAATAMLYFNQSGSDPYRHLQLQGGGGGVMGSTHHPIHVGYGSSTVGVVKALRTSRYVKAAQELLEEFCSVGRGQFKINKSGSKPANNPNQNPSNSCGGASSASSKDHPPLSSAERIEHQRRKSKLLSMLDEANRLTKITIETKKSRWIGDTITTMVVNSFDLILGFGAAVPYTALAQKAMSRHFRCLKDAITAQLKHSCELLGEKDVGTSGVTKGETPRLKMLEQSLRQQRAFHQMGMMEPEAWRPQRGLPERSVNILRAWLFEHFLHPYPSDADKHLLARQTGLSRNQVSNWFINARVRLWKPMVEEMYQQESKEEADQHHNHSPHHRHQDDDDDDEDDDQEQEEDKENTKYHNHNHDQNQTDNDGHHHHHPPPQPSSAATQTSMHAPPPPLTSAPTYTTTTTTATDSAAKRSEINDSENDPSLLAINTQHCFSENQAMTYSYSNPIGGITTMAPPPPPPFDGDTCRRGSMLGAEYRTTTGNDAADIGSTLIRFGTTSGDVSLTLGLRHAGNLPEKTSFFS\n>tr|A0A1B1T822|A0A1B1T822_9NEOB KIAA2013 (Fragment) OS=Afrixalus dorsalis OX=367642 GN=KIAA2013 PE=4 SV=1\nPSKLSSISQLLQLWDLWKLTLQKRGCKSLVMAGAHGLMQGMMLSFGGLQFTENHLQFQSDPHVLHNSYALRGIHYNKDLINLAVLLDQDEKPFLHVSVKFQDKLVKLYACEAGCLNEPVELTSEIRGHTFPVLVTQPLTPLLYISTELTHLQDLRHTLHLKEILAHEEHMAKQYPGLPFL\n>tr|A0A251VB46|A0A251VB46_HELAN Putative pentatricopeptide repeat-containing protein OS=Helianthus annuus OX=4232 GN=PPR38 PE=4 SV=1\nMMNRIAFIKLRGNFTTSSFLLHSETPFSSFHIGLHSDTRNVSVNRSMFDKITNLNDALNLFDEMSHRHPLPSVVKFTRLLNVVTKMKHFTYALDLFKQMCSLGVPLDKYTLSIAIKCCCQLNRTKDGFAVLGSCFRRAIPPDVYIFSVLLDGLVLEDRILEAEMFFKKLIKQKLCEPDVVMYNTMIKGLCKFGNNVTAVALLRLMEQTNCKPSIVTYSTIIDSLCKDKMIDDAFKLFKEMVFDIGILPNVITYTSLICGLCKLGRWDEASKMLKEMEDENISPDVQTFNVLVDAFCKEGKVEEAEAVINIMIERGKVPNIVTYNALIDGYCLRGEMIKANTIFDSMTLRGLVPDVVTYSSLLNGYCKNLNIEKAEQMFHEMTVKGLKPDVVTYSTMIQGFFQVGRCVAARRLFDEMHARGQIPDQCTYGIVLDGLCNNHLVEDALSLFYLVGKSKLNSDIAVYNILIDGAGKNGKVEVARILFQGLIDKGLQPDVRTYNVMISGFCREGQLGEAKLLFLKMEESGCPPNNITYCVLLQGCLKNKHYDDVEMLLKEMDARGYSLDASTLSLFIDHIAAGLLDRSMLKLFNKLVPKELLDDPRLCDWESN\n>tr|A0A258FT73|A0A258FT73_9PROT Uncharacterized protein OS=Caulobacterales bacterium 32-69-10 OX=1970503 GN=B7Y99_04785 PE=4 
SV=1\nMRCVAASLCEDTTTTVAALLRSTAQEMASLSDMSNRLHDLVARQMGAAVIHEQSVEEAQSIDLLVQHLETIGRFLHLLADEVPSSLAVDFSPIRDRLPLAALADRLGGEAGRRRLDDGDPGDLDLF\n>tr|A0A329S1R4|A0A329S1R4_9STRA Uncharacterized protein OS=Phytophthora cactorum OX=29920 GN=PC110_g12992 PE=4 SV=1\nMRATAAKQRHKRRRPTAGQDDEGTVAATAGDKNGADRGEDGDESHGVVIAAV\n>tr|A0A6A3VWU9|A0A6A3VWU9_9STRA Uncharacterized protein OS=Phytophthora fragariae OX=53985 GN=PF001_g28857 PE=4 SV=1\nMALLNRRFDSEDSATAIENLTAKLKKGIQAASTHFFEQEFPHDTREAILCTLDPTKTPLTPVQSGQAIRDHLEAIGRSTSKT\n>tr|A0A0D0XGW5|A0A0D0XGW5_9TREE Unplaced genomic scaffold supercont2.14, whole genome shotgun sequence OS=Cryptococcus gattii VGIV IND107 OX=1296105 GN=I308_04987 PE=4 SV=1\nMPFRKTPCLSKPIIQFKLPFSSFSYPPCTPPERGTPAQTPGLAMSQTSWPRAMAVSFMIVTPPGQYSTQFPSLYPTEYPAEAAIDESSESDDQSVEDLMSLVTENEDGQERRWDGKGQEPLEKDAICPGAPKLSPIDLPN\n>tr|A0A4Q1BKZ0|A0A4Q1BKZ0_TREME Uncharacterized protein OS=Tremella mesenterica OX=5217 GN=M231_04342 PE=4 SV=1\nMTGLTLPPLTLFLFSLLLFLLVGPTLVIASPDPTSPNVKRERLVAQAPSNTEITPIETKNIERGITTLPVLPRNDHPTSPPRLPRQPNRLVPQPTKRAEALIENDSVERFIDDVKVERRDEIGIGKRDDACSIAININLSDKTAPAIDLPSCLDGLDLQLGINLDLTDDDGGDDDCELGGGNFLAHSETSSNTKPPASTSKSANPGKSTPGNGGNDSDNIVALSWHVFGGNGYDGPSCGKTLTIVTSKGKQATAVVADECASCPDMYHVDMSTGLFSALGLDKSTGEYVVKWQCPDCVFEEDPTIGGCKNNPGGQYC\n>tr|A0A1S1XQS9|A0A1S1XQS9_9XANT Transcription-repair coupling factor (Fragment) OS=Xanthomonas alfalfae OX=366650 GN=BHL63_10710 PE=3 
SV=1\nISQRLAALHRLPGLTRGVVIVPVQTLLQQLAPLSYIVGGSFDLTVGQRLDLDAEKRRLESAGYRNVPQVMDPGDFAVRGGLLDVFPMGADTPLRVELLDEDIDSIRVFDPESQRSLDKVDAVKMLPGREVPMDDASVERVLACLRERFDVDTRRSALYQDLKSGLAPSGIEYYLPMFFAKTATLFDYLDKRVLPVIATGVSNAADAFWTQAQNRYEQRRHDVERPLLPPDELYQSPDALRERLNKLARIEVWASDHARIDEAAPLGDQPLPPLPVAAKDAPAGQALATFLSHYPGRVLIAADSAGRREALMEVLAAAQLKPELVADVPAFLAGTLRFAITVAPLEDGFALDQPQIALLTERQLFPERANQPRRTRRVGREPEAIIRDLGELSEGAPIVHEDHGVGRYRGLIVLDAGGMPGEFLEIEYAKGDRLYVPVAQLHLISRYSGASAETAPLHSLGGEQWTRAKRKAAEKVRDVAAELLEIQARRRARAGLALQVDRAMYEPFAAGFPFEETGDQLAAIDATLRDLGSSQPMDRVVCGDVGFGKTEVAVRAAFAAASAGKQVAVLVPTTLLAEQHYRNFRDRFADYPMKVEVLSRFKSTKEIKAELEKVASGEIDVIIGTHRLLQPDVKFKDLGLVVVDEEQRFGVRQKEALKAMRANVHLLTLTATPIPRTLNMAMAGLRDLSIIATPPPNRLAVQTFITAWDNTLLREAFQRELSRGGQLYFLHNDVESIVRMQRDLSELVPEARIGIAHGQMPERELERVMLDFQKQRFNVLLSTTIIESGIDIPNANTIIINRADRFGLAQLHQLRGRVGRSHHRAYAYLVVPDRRSMTSDAEKRLEAIASMDELGAGFTLATHDLEIRGAGELLGEDQSGQMAEVGFSLYTELLERAVRSIRQGKLPDLDAGEEVRGADVELHVASLIPEDYLPDVHTRLTLYKRISSARDPDALRELQVEMIDRFGLLPDPVKHLFAIAELKLQANALGVRKLDLGENGGRLVFEAKPAIDPMTIIQMIQKQPKIYTMDGPDKLRIKLPMPEGADRFNAARGLLAALSPG\n>tr|A0A241PHY0|A0A241PHY0_VIBAN Coenzyme A biosynthesis bifunctional protein CoaBC OS=Vibrio anguillarum OX=55601 GN=coaBC PE=3 SV=1\nMRRIFEEKTMQTLAGKKILLGISGGIAAYKCAELTRRLIERGAQVQVVMTHAAKEFITPLTMQAVSGRPVSDSLLDPAAEASMGHIELAKWADLVLLAPATADLIARVAAGMGNDLLTTLILATNAPVAVSPAMNQQMYRNIATQENIATLKRRGMMIWGPAAGEQACGDVGPGRMLEPMQLVERCEFFFQTEVANNTLLAGKSLLISAGPTREALDPVRYISNHSSGKMGYAIAQAAAQLGAKVTLISGPVNLLTPPQVQRIDVESACDMHQQVMAQAQSHDVFISCAAVADYRPEIVADQKIKKTDASDHMLITMVKNPDIVASVAALNENRPFTVGFAAETQQVEKYARAKLLNKKLDMICANDVSVAGQGFNSNDNALTVYWQGGEQALPLSSKSALAHALMQLIASQL\n>tr|A0A4V1XBV3|A0A4V1XBV3_9PEZI Oxidored_FMN domain-containing protein OS=Monosporascus ibericus OX=155417 GN=DL764_002426 PE=4 
SV=1\nMASPMSQSRLFEPLQIANGKITLKHRVVLAPLTRNRGTPLNPNSTCENPNRIWIPNDLMAEYYSQRTTDGGLLISEGIPPSLEGNAMPGVPGIFIQEQVEAWKRVTAAVHAKGGIIYAQLWHSGRANIPHLTGTPIVGPSSLPWDDPEECYMYPIPHTDTRVKLADHPPVEMTMSKIKQTIDDFRRAARAAMDAGFDGVEIHGGNGYLPEQFLSSNVNRRTDEYGGSPEKRCRFVLELMAEVAGAIGQENLAIRLTPFGLFNQARGEQRLETWGHLCRELKRDLPHLSYVSFVEPRYEQVFSEAEKQRFLDSWGLPDVDLLPFRRIFGETPFFSAGGWNDANSWGVLETGDYDALLYGRYFISNPDLVERLRHGRPLAPYDRSRFYGPFEDNSIGYIDYPPYKEDNDPPCEEDNGDEDRARRLSVL\n>tr|A0A1C5LQ41|A0A1C5LQ41_9CLOT 4-hydroxy-tetrahydrodipicolinate reductase OS=uncultured Clostridium sp. OX=59620 GN=dapB PE=3 SV=1\nMTKIILSGANGKMGKVIARCTEERNDCEIVAGVDLNTQAYSDFDIYPSFSECGESGDVIVDFSNPAVLDGMLDYALKTNTPVVIATTGYSPEQIEKIQKAAEQIPVFFSFNMSLGVNLLVSLAKKAAEVLGGQFDIEIIEKHHNQKIDAPSGTALMIADAINDTLDQTQKYMYDRHAQRKKRDKNEIGIHSVRGGTIVGEHEVIFAGHDELLSLKHQAMSKEIFAVGAVNAAVFLKGKPAGIYDMGKMV\n>tr|R7KGB8|R7KGB8_9BURK ATP synthase subunit delta OS=Sutterella sp. CAG:521 OX=1262977 GN=atpH PE=3 SV=1\nMAELSTIARPYAHAMLLALQDANKGPEEAADLAAVLDGIAQVVTTPELVSVIGDPKLSSEQIYDLIIAGLGQTKLPEEAANLLKVVVENGRLEAVPEIARQFRELKNQSEGVADAYIESAMPMTQAEVDDLVAGLGKRFPGLKLTPVVTINEALIGGVRVRVGDRVLDGSIQTRLAQMQEALTA\n>tr|A0A496GGQ1|A0A496GGQ1_HELPX Uncharacterized protein OS=Helicobacter pylori OX=210 GN=DD744_03805 PE=4 SV=1\nMRIKAYFLRFIALVLIVLLGFSACKNSQKSQDSQNNTTQQDSPKTYTAMDLNNQEYTITGDLDSLNISPDSNTPTLLVLSALDDFLKDYAPTFNILKKTFKDRLRVLILLNQPYSSDAIKDFIAPFQADLMILNPKDTALFDHLNHNALNHSFNMLLYHKHQLIKMYQGIVPAEMLQFDISNLKD\n>tr|A0A847F664|A0A847F664_9DELT Uncharacterized protein OS=Sandaracinaceae bacterium OX=2510337 GN=GX614_10825 PE=4 SV=1\nMSSPCLRIALIALLFALPSLSSADDGDLRLLRESIGYIEVADAADDEDPFDFNLSLGFRHDRVSGNITREMLSPVDGSVMQKVGDYSATRSYLDVAAEIGLYRDLAVRLMVPVLLSYDQSITDIESAATPLLGSQDAVSPTRSGIPEIIVGLAWQPMNQMRRADRPNWTWLFNVALPTGKVMSPCLDVPGSSCASNAGVSTGVVRLLPEWRLSYRFRYVETYGGLKGEIPFPTASRDSLFTPGGQLLGYRKTRPSIRGGFIVGAALIPWERRATHQRLAIDMRFHAHYVSGGRDFSPLFDVLGDPNLSPTPRFPEICEDGSVAGTGGVCNPGDPYATRFTGLTTTQSHGNIGGRLTLEIKAARYITFYVSSGLQWITSHLLTTESECNASVDPHPQDAINCNVGRPNPHYQREIDMVGNRFGVGNLTNLDLVLRAQGTF\n>tr|B4RA04|B4RA04_PHEZH 
Transcriptional regulator, Cro/CI family OS=Phenylobacterium zucineum (strain HLK1) OX=450851 GN=PHZ_c3099 PE=4 SV=1\nMPRPATDPAKAAQIKALRQQAGRWLKAAREAAGMTQAELAEKVGLRYYTFVSQVESGLGRLPIETQAAWATALGLDPGEFARTLLRYYEPELFRLLFETDSAQGRATA\n>tr|A0A1V2CHU8|A0A1V2CHU8_9FLAO Vgr family protein OS=[Flexibacter] sp. ATCC 35103 OX=1937528 GN=BXU01_03190 PE=4 SV=1\nMTPPTIIFGIDSKKISHFTSIELVQVINDHHRFEILVPHAAVESPLAYTLENAQAWLGKVVHIVLEEKNNFLGVVTNIDFDQEMGHSGNQIIVSGYSKTILLESGEKLHSWEELTLKDIVKEVVKNGAGEQLQNEINPEYTSKMDYQNQYLETDFQFIQRLAKQFNEWLYYDGEKLIFGKPKSFDSPISLTYNSEISKLKISVQAVPNKFSAFTYNESADKRYTAKSKDTVGGLPKLGNEAFASSKEVFATPAYTHGIVSTGDDLVLESFLKKKQESAAADTNFVSATTKNSKLRIGSIVTIQSSVLENKSLITQEVGSFIITEISHYATHLGEYENNFRAIPSKVLSLPEPDVAYPIAQTQQALVESNTDPQNKGRIRVQMLWQQGTQMKTAWLRVMTPDAGSSDKVGTNRGMVFIPDVGDHVMVHFRYGDPNRPFILGSVFHGKSGGGGGKDNNKRSFATRGGTSLVLDEEKNTFTATDPSGNMIMLNGDGTMTIYAPNKVDIQSKEINLIADEKVSISGVNEVSVDSKKVLVSGTDEVTVKSDTQITDEAPSINIKGKNTILAEGTVVDIDGKTMTNVKGGVVNLN\n>tr|A0A7X9ZH40|A0A7X9ZH40_STACP Pur operon repressor OS=Staphylococcus capitis OX=29388 GN=purR PE=3 SV=1\nMRYKRSERIVFMTQYLMNHPNKLIPLTFFVKKFKQAKSSISEDVQIIKNTFQKEQLGTVITTAGASGGVTYKPMMSKAEATEVVNEVITHLQEKERLLPGGYLFLSDLVGNPTLLNKVGKLIASIYMEEQLDAVVTIATKGISLANAVANVLNLPVVVIRKDNKVTEGSTVSINYVSGSSRKIETMVLSKRTLAENSNVLVVDDFMRAGGSINGVMNLMNEFKAHVKGVSVLVESKEVKQRLIEDYTSLVRLSDVDEYNQEFKVEPGNSLSKFS\n>tr|D2PK46|D2PK46_SULID UPF0148 protein LD85_1482 OS=Sulfolobus islandicus (strain L.D.8.5 / Lassen #2) OX=425944 GN=LD85_1482 PE=3 SV=1\nMTNESEVGVKKAAELLRQGATMLEEACPICKMPLFKLKNGDVVCPVHGKVYIVKSDDEEKIVKRNLQLDEIESILIDGLYLSAKKMKEDPLDSERIIQIIRYLDALERLRKIKINSSE\n>tr|A0A353T2J5|A0A353T2J5_9FIRM FAD/NAD(P)-binding oxidoreductase (Fragment) OS=Clostridiales bacterium OX=1898207 GN=DDW86_03375 PE=4 
SV=1\nTTEQGEIRASYLVNAAGVYGEVVSEMVQERSFTIHPRKGEYLLLDKSQGNLVHSVIFQTPTKMGKGVLVAPTVDGNLLTGPTALDVSEKDDVGTTAEGLEKIRKEAGKSVPDIPFRDVITSFAGLRATPDTGDFIIEASGTVKGFLNVVGIESPGLTAAPAIGEYAVDLLGKEGLPLVPRGDFQPVRKPAVRFREQTDEEKQRLIRENPLYGNVICRCEIITEGEIVDSIRRPAGARSLDGVKRRTRAGMGRCQGGFCTPRVTAILARELRIPEERVTKKGKGSELLAEKRGPSC\n>tr|A0A3D6A882|A0A3D6A882_9FIRM Guanylate kinase (Fragment) OS=Lachnoclostridium sp. OX=2028282 GN=DHU73_00550 PE=4 SV=1\nKSATGKDTLYKEILKRRPKLRTVTMYTTRPIREGETDGVEYFFTDREELERQLASGKVIESRTYQTIAGPWTYYTVDDGQFDVADDESCLMIGTLESYEKMCAYFEAGKMVPVYIEVPDGIRLLRAVKREENQKKPNYREVCRRYLADEKDFSEENLERLGITKRYQNTDMEMCVEEILRDLDK\n>tr|A0A5P9EVH6|A0A5P9EVH6_9GAMM Uncharacterized protein OS=Microbulbifer sp. THAF38 OX=2587856 GN=FIU95_07605 PE=4 SV=1\nMKKITSKYPQYRAVLKNSIASFTLICASTLVQADTISTKIDLGEPFPFKMEDGVEYEVDLDIGYQFDSIDNACISTEVKGGNASKAFLELESEPAAGSFILGYSESHEIGMIYSFDFPTQENPNPVSELISFGFCAGRFNGSLLKRNFLDGEGKFTVSVSGGYVEFWDFKLVVEGDLSDIQLAIELDEPADFSVPSYGGRVNYDASIRNLDSSQSLITLDQWSVLTLPNGDNYPIHKSRDVVLNYSEAKDYTRNYLTIPEWFEAGDYELTWYVADPSTGVRVKDSLHFTKSAD\n>tr|A0A161IP46|A0A161IP46_9BACI Uncharacterized protein OS=Fictibacillus phosphorivorans OX=1221500 GN=ABE65_012790 PE=4 SV=1\nMKRQCLHMLTGFLFILLLTACIGEDYDAGPPELRLSVEEDLYALKQANVDWKTEEKEFKNKVEHFLTLGSEQKEIKLSPNQSAELILLENKEDDGEYTNETLEISLWKENEKIELTTKSSTDYSFSFPSDPGQYVLEVNFRTSNGRSQYVGNITLK\n>tr|A0A2W4W2P1|A0A2W4W2P1_9CYAN Uma2 domain-containing protein OS=Leptolyngbya foveolarum OX=47253 GN=DCF25_12600 PE=4 SV=1\nMIAAKDHPPKLTSEEYFAWEEKQLEKHEYIDGQVYAMSGGSVNHGRLAIRLTAMFDNHLEESSYITGNSDIKVNIVKTVDYTYPDASVTCDDRDQNTPNYFTYPCLIVEVLSDSTEAYDRGGKFRMYQNNPVLQDYLLVSSTRIEMDLYHKNENGDWLILTYQKGDMVTLKSIGLSFPIEQVYRGLSLQQPDQFY\n>tr|A0A1B2E8Q8|A0A1B2E8Q8_9BACL Serine/threonine protein phosphatase OS=Paenibacillus ihbetae OX=1870820 GN=BBD41_01205 PE=4 
SV=1\nMLWILVIPVLNIFYAVLNQAHMPVYSLMTDLDAQIPFVPMFIIPYLIWYPFIIIVLFMLCIRERSVYYRTLLTQCLGLVACYIIFYLFQTTVERPTTMGTGIFEGLVNLVYSTDNPYNCFPSIHVLTSYLMIKGATACASYPNWERTAVKVCAWMIIASTLFVKQHVLLDIAGAIAVVELLWYGVGKLPLGQQSKFKGEVVRQNLTAD\n>tr|A0A044SS46|A0A044SS46_ONCVO Methionine--tRNA ligase OS=Onchocerca volvulus OX=6282 PE=3 SV=1\nLHLMIRSIKTICAIEGVSISSMRLKHFITTPIFYANGPPHIGHLYTALLADALNRWKLLKDGNIDSDNLLFTSGTDEHGLKIQRSATAAGYDPQSYCDNISGKFKDLFHVFGIHPNDFIRTTEVRHKEVVNHVWVTKELNKRGQIQLGKYEGWYSTIDECFYASDEVETLSGQTSTISKITGSVVEWVQEENYIFPLSKYLGTVRNWLNNCDVIRPKIYFPEALQHASIEGNLSLSRDRKRVTWGIAVPNDESQTIYVWFDALMNYLTVSGIFSNKKRINWPPTCQIVGKDILKFHAVIWPAILLALDLPLPKRIFVHSHWLVNGTKMSKSVGNVVDPFSVSKSLSEEGLRYFLLRQGTPQNDANFIMSKAVDVINTDLVNNVGNLLQRSLIEKLNPSQTYPTFYPDSFHNSLLELGEPLVKSVSCLAELYEEQFDELMIYKALEMLMEVMRQANGFFQFYEPWKELDNRKMSSLLYVCYEVLRICGILLQPVVPHYADHLLNRLGIKKNERGLDNVKFTIDSKYSGKPLGEYNGPIMDRIMCKTGTV\n>tr|A0A4D6LT85|A0A4D6LT85_VIGUN Uncharacterized protein OS=Vigna unguiculata OX=3917 GN=DEO72_LG5g291 PE=4 SV=1\nMPNDQEALGQLEDPHGSDGHNNSTGSGRHDDPNGSSELDNQDGLARSTTKTGRVGWVNDLNGPNGPNDPNGRHRSNDPNGPDRPDDSNMPICLTILIGLTGPMI\n>tr|A0A0S6UQD0|A0A0S6UQD0_9BRAD Sulfopyruvate decarboxylase subunit beta OS=Bradyrhizobium sp. DOA9 OX=1126627 GN=BDOA9_0130710 PE=4 SV=1\nMSKANLLDRRQVVSTLLANRKDVVAIGGLGASTNDMCAAGDHARNFYLWGGMGGAAMIGLGLALAQPKLPVLVITGDGEMLMGMGSLATIGLQKPANLSIAVLDNEAYGETGGQTSHTSAAADLVGIAKACGINDSRAVTTMADVEAFAKAVHDVSAGPRFANVKIDSANLERILPTRDGTYIVNRIRADLGFQPI\n>tr|A0A3R0JE73|A0A3R0JE73_SHIDY Anaerobic sulfatase maturase OS=Shigella dysenteriae OX=622 GN=DL723_09995 PE=3 SV=1\nMHVTAKPYSFQCNLKCDYCFYLEKESQFTHEKWMDDSTLKEFIKQYIAASGNQVYFTWQGGEPTLAGLDFFRKVIHYQQRYAGQKRIFNALQTNGILLNNEWCAFLKEHEFLVGISIDGPQELHDRYRRSNSGNGTFAKVIAAIERLKSYQVEFNTLTVINNVNVHYPLEVYHFLKSIGSKHMQFIELLETGTPNIDFSGHSENTFRIIDFSVPPTAYGKFMSTIFMQWVKNDVGEIFIRQFESFVSRFLGNGHTSCIFQESCKDNLVVESNGDIYECDHFVYPQYKIGNINKSELKTTNSVQLTAQKKRISAKCLKCVYKPICNGGCPKHRITKVNNETVSYFCEGYKILFSTMVPYMNAMVELAKNRVPLYHIMDVAKQMENN\n>tr|A0A1V2IM99|A0A1V2IM99_9ACTN Uncharacterized protein OS=Frankia sp. 
BMG5.30 OX=1834514 GN=BL254_17150 PE=4 SV=1\nMSAEPIILLDPATDAGLIVAATEHTFACQMQTFAWAAANTNLPASERAIARAMTGRARAVSPLTQAQMNAQLHQTGGSR\n>tr|A0A7V4T793|A0A7V4T793_9DELT Sigma-54-dependent Fis family transcriptional regulator OS=Desulfobacterales bacterium OX=2044940 GN=ENK36_05755 PE=4 SV=1\nMENILVVDDEKNYTMIIGEILQEEGYTSITASSGMEALDILNNEIIDLILTDVKMPGMSGIQLLEKIKELNPDIPVIIMTAFGSVEKAVDAMHRGAYTFILKPFENQALIAHIAKALSVYKIVQENSRLRDAISSRYSFDNIIGKSRPMQEIYEIIKKVAPSNASVLIEGESGTGKELVAKSLHYNSPRRNKPLIVVNCSAFAETLLESELFGHEKGAFTGASALKKGRFEISDQGTLFLDEIGELPISLQTKLLRVLQEKIIERVGGTLPIPVDFRLIAATNKNLEDEVKNGNFREDLYYRLNVVKTVMPPLRERSEDIPLLIKHFMDKYTNEQQLESRVSGITSEAVKILCDYQWKGNVRELENILESCILLGSGDMITPSDLPLQVRQNTSSFLDLDGIPQDVGLAETLTAVERRMIRRAMKLSGNVQTKAAQLLGIGKSGLNQKLKKFNLG\n>tr|A0A6G1U079|A0A6G1U079_9BACT Virulence protein E OS=Prevotella copri OX=165179 GN=F7D73_08405 PE=4 SV=1\nMNINIFNGYQSTEPAIIKFQQMVDIIRGDKQLAELTKRYRITHQREYKSQCYCFSVTCVFQGGKAKKDIIEVTGIGFSDFDHVPKEKLAELCAKLREDRHTLFFHITASGEGLRVLYRYEMKPGMTLEEQMKFYPTAFLHGNQYFSDLLGVEYDEHCCNLGRLMGAAYDPDAFFRPNAEPFSYDWLVARQQEKTLQDNATARLRREVKKIDRLYEDKLAKELEQEMKTYVAGSKNEYVSCLAYKLNAFGFSADAALEFICQEFPDYERPKAVVDSCYRQTEEHGKRKHELQNRRHEAGKSASVNDIIRFLGEHVDLRYNQITMRVEYRMKEESDGEDSSTPGLWQIINDRAVNTLWSEMSKTNRAAVQDFFRVIESNYVQPFNPFTDYLGSLPEWHEGDTDYIQQLADSVTIKGGEEQQKLWACYLRKWLVGMLAGWTLDDVVNNVIIVLIGAQGSGKSTWIAMLLPPELRQYFYTKTNASRLTKDDLLVLATYGLMLCEELDTMKPSELNQLKAAVTMLTIDERAAYAHFAEHRPHIASFAATGNNVQFLSDPTGNRRWLPFEVESIQSPREHPFDYPHIYAQALHLLRSGFRYWFTQQEIIELNLHNHKFEAPRLERELVALYFAHPTEEQHGIFMTASRALQIIGAGISQKLSAVYVGRAFCELGFRKVRVNHCWGYLVIERDGDMIKAQQVRLAMEAEDDYSQQETDPDLPF\n>tr|A0A806DEP4|A0A806DEP4_HAEI6 Catalase OS=Haemophilus influenzae (strain R2866) OX=262728 GN=hktE PE=4 
SV=1\nMSSQCPFSHLAATNLTMGNGAPVADNQNSLTAGPRGPLLAQDLWLNEKLADFVREVIPERRMHAKGSGAFGTFTVTHDITKYTRAKIFSEVGKKTEMFARFTTVAGERGAADAERDIRGFALKFYTEEGNWDLVGNNTPVFFLRDPRKFPDLNKAVKRDPRTNMRSATNNWDFWTLLPEALHQVTVVMSDRGIPASYRHMHGFGSHTYSFWNEAGERFWVKFHFRTQQGIKNLTDAEAAEIIANDRESHQRDLYEAIERGDFPKWTLFVQIMPEADAEKVPYHPFDLTKVWPKKDYPLIEVGEFELNRNPENFFADVEQSAFAPSNLVPGIGASPDRMLQARLFNYADAQRYRLGVNYRQIPVNRPRCPVHSNQRDGQGRVDGNYGSLPHYEPNSFSQWQQQPDFAEPPLRINGDAAHWDYRNDDKDYFSQPRALFNLMNAEQKQSLFNNTAAAMGDAPDFIKYRHIRNCHWCDAAYGEGVAKALGLTVEDALKARDTDPALGQGGLL\n>tr|W7JTJ0|W7JTJ0_PLAFA Uncharacterized protein OS=Plasmodium falciparum UGT5.1 OX=1237627 GN=C923_00937 PE=4 SV=1\nMSLINKKNKENHNLIGKEEKIENDNTQDIKDNVYSSYSNDNNKYDNNNNTYDNNNNKYDNNNNNFNINTNYLMNICPLFYSFMIFFNQLNSRKKLMKIINIIDEEKCLDKDENEINKKILSSICHGGVWDELVTLYDPIYSSNYESFINRKKNDYNKIYDKPIEMNKNGQDMQSKGNYTTTKNSTTNYNNIQKNDLNKKFVDATTGNTYSDRITAQSYIHDNNDENNNIHNYIDEIDDMDNVHNVVNSCGVHLNDVHSFQKDREDNSSYSYRRNEHMSNNIDTICGSKNLLLNHKGTNQDNNIFERNKENVSNSSYNYINENNTFSEKNFSTCSILKRRNVYHNKDYRYCFSTSQQNDGKYLEQNKSNVLHNDDYNDYYNDEYNDDYYDADNVDVFHYINKNKSNSIISNNYPCDNTYNQNTNLNNDNCKTKNNINMPLNINYPYGISKDEMIHFKNYPYNYNDKYDFDEDISSLMKNLKTDDYTNDDIINIKKKKKKGSLINNKNITDITTYTNSSSSLYNKNNNNKNNNNNYYYTNTKDNFYYNYNQNYDIPKKTYDNISTSCEPNHYMKNSSNNSSHHHSVYEGRYTFNKLNKTNKYMYNSFLPNKQQSFFNNNYNNNYNNNNYHCDYSKFDSEDLIWKYYNNPSNNRNHIKNIHNLEKKYEHNINLASKVSSATWLIYLYELKRASFFINYYFYHLHLFIYFKNYFINYQKNYKLFQNNKWIILKRNYEKQKKKEKYWDMINMKEPEINVHTTCISKKLNDIKAKNVLNNNDHMNKEDKQKNVIDQENNNKQKSNKTHYDIFKRDMHEIIKCTVQNLNYCIDALFEKTKGDIYSLPFKIDKKNKNKNKKINNNNNNNNNNNNNNNNNNNNSNSSSCSSSCCCFNNTTNISPQLNNIHSFLNNKNCKQNNINKDSMTNSYGLILIEGKLIFVKFLYICIDKEKFWDESFLCRRDIRTVIHVKALDVLFISKNKLKKKIKKNIKKKAKNEKDNNLNNIINQNICNNDKKDIYFDIEQNLCTNNKSSQEFSSSNTSNIDNQFLSDDIIFCEQKNNLLKDSKLTHQQTYDINTNLQNNKNHFEEKISMYNNTHKKNDHYVNDDIINLWKCKQEKELSNNFIYNNKNNYIGILMEQNSNQDIFFKNNSKFIIKKNYIDQNNEHMDNMKTYQNDQTDMEKKKYNDENIFSINPCNFVTRINVKTIYVSGKHIHDDLKGTLLQKIDIKKEFKNDDEMNTFLQNQKDIYDEEIYCLRIISRNEIMRYKELIKIMKKGPYYYKNAKNILNNLNNLNNFNTPLQQTVPLCNFCGIKGMCNINTKHYKMSSIQEHVKNKFYTFMYHIFYKYKPKNQGGNIHNNNNNNNEDHLICN
HSSKFKHINKEKRNKELPTNYENNIFNHTIVTSKDDQHNCLSDTNYRDNNLSDQCKNYSFHNIYNCDDHENKSELKNNREDKNDHDMYNIVEDIKHTQRNNQYNYKDIKVDNHYDNIIHMDKEKNIEKINIKSNYTKNNSEQYVNKIENFNDKKCESQNNIINNNNNINNINNNIKTELLHQNEINKNCINNNSTFPIKDKQIINNSKGIKNNILSEYYKIKKRQKSIDKISKLYKDEIKKKNNNDFIPHNKKIMRINNTINCLVGQRAQTNFLFLKKNHLNTTTENITTKIVTGAQNNNLNNVSLKKNNSGQMEENNTNDISYVPTFRKFQESKK\n>tr|H6AA47|H6AA47_PINCO Tubulin_C domain-containing protein (Fragment) OS=Pinus contorta var. murrayana OX=1115831 PE=3 SV=1\nQVYRSLTVPELTQQMWDAKNMMCAADPRHGRYLTASAMFRGRMSTKEVDEQMLNVQNKNSSYFVEWIPNNVKSSVCDIPPKGLKMASTFIGNSTSIQEMFRRVSEQFTAMFRRKA\n>tr|A0A7V8T8F4|A0A7V8T8F4_9GAMM Nuclease SbcCD subunit D OS=Pectobacterium versatile OX=2488639 GN=sbcD PE=3 SV=1\nMRIIHTADWHLGQYFYTKSRAAEHQAFLHWLIAQVEQHQVDAIIVAGDIFDNGSPPSYAREMYYSFVVALQRTGCQLIVLGGNHDSVAMLNESRELLACLNTQVIACASDDPAQQVILLETRQRQPGALLCAIPFLRPRDVLTSKAGQSGDEKQLALQEAITAHYLQCYQLACQKRDELGLPLPIIATGHLTTIGATASESVRDIYIGTLDAFPAQAFPPADYIALGHIHRPQRVTQSEHIRYSGSPIPLSFDELNSEKSVCLVSFAPDTPAQVEILPTPVTQPMQLIKGSLSDIEQQLTTFQNYQGEKPVWLDIEINTQDYLSDMQKRIQAMTEHLPVEVLLLRRTREQRLQAITQQDKETLNELSVHDVFERRLATETDMEDGRQQRVRTLFNQVIDELENSEPAQ\n>tr|E2ZKL4|E2ZKL4_9FIRM Alkaline phosphatase family protein OS=Faecalibacterium cf. 
prausnitzii KLE1255 OX=748224 GN=HMPREF9436_02217 PE=3 SV=1\nMKREDHVMKENKISRRSFLKFGAAASAAGMMAAAPVAANAAQPDADAAADEENCLLGLFQKPKYIFLFIGDGMGTAQIQSARFYKGTVDNNGAVTEADLSFTSFPTVGSVTTYDSTSFCPDSASTATSIATGHKTESGVINMCPWTRDVPYETIAEKLHAQKGYKVGIISSVNIDHATPAAFYAHQKTRKNYYQIGVELANSGFEYFAGGEFQKVNGDGAGPNNHEVAAQAGYNVVTTQAGAAALTAGAGKTLIIAENLADGKAMNYAMDAAAGEWQLTDYVKKGIELLDNPKGFFLMTESGKIDWACHANDAAASIHDVLEMSNAVQAAVEFQQKHPNDTLILVTADHETGGMAIGYKTTNYDTFLTNLAHQKMSYAKFDSTYVQNYIANKTPFEAAMQDVKANFGLTLPSDPDAANAGKLLLTDYEVQNLRTAYERTLKVGSASQKDMSQQDYEMYGTYIPFSMAICHTINHKSGMDHTTYAHTGAMVNVYANGVGAEKFGGVFDNTEIYHKLADLTKVK\n>tr|A0A8A6LC47|A0A8A6LC47_SARS2 Surface glycoprotein OS=Severe acute respiratory syndrome coronavirus 2 OX=2697049 GN=S PE=4 SV=1\nMFVFLVLLPLVSSQCVNLTTRTQLPPAYTNSFTRGVYYPDKVFRSSVLHSTQDLFLPFFSNVTWFHAIHVSGTNGTKRFDNPVLPFNDGVYFASTEKSNIIRGWIFGTTLDSKTQSLLIVNNATNVVIKVCEFQFCNDPFLGVYHKNNKSWMESEFRVYSSANNCTFEYVSQPFLMDLEGKQGNFKNLREFVFKNIDGYFKIYSKHTPINLVRDLPQGFSALEPLVDLPIGINITRFQTLLALHRSYLTPGDSSSGWTAGAAAYYVGYLQPRTFLLKYNENGTITDAVDCALDPLSETKCTLKSFTVEKGIYQTSNFRVQPTESIVRFPNITNLCPFGEVFNATRFASVYAWNRKRISNCVADYSVLYNSASFSTFKCYGVSPTKLNDLCFTNVYADSFVIRGDEVRQIAPGQTGKIADYNYKLPDDFTGCVIAWNSNNLDSKVGGNYNYLYRLFRKSNLKPFERDISTEIYQAGSTPCNGVEGFNCYFPLQSYGFQPTYGVGYQPYRVVVLSFELLHAPATVCGPKKSTNLVKNKCVNFNFNGLTGTGVLTESNKKFLPFQQFGRDIDDTTDAVRDPQTLEILDITPCSFGGVSVITPGTNTSNQVAVLYQGVNCTEVPVAIHADQLTPTWRVYSTGSNVFQTRAGCLIGAEHVNNSYECDIPIGAGICASYQTQTNSHRRARSVASQSIIAYTMSLGAENSVAYSNNSIAIPINFTISVTTEILPVSMTKTSVDCTMYICGDSTECSNLLLQYGSFCTQLNRALTGIAVEQDKNTQEVFAQVKQIYKTPPIKDFGGFNFSQILPDPSKPSKRSFIEDLLFNKVTLADAGFIKQYGDCLGDIAARDLICAQKFNGLTVLPPLLTDEMIAQYTSALLAGTITSGWTFGAGAALQIPFAMQMAYRFNGIGVTQNVLYENQKLIANQFNSAIGKIQDSLSSTASALGKLQDVVNQNAQALNTLVKQLSSNFGAISSVLNDILARLDKVEAEVQIDRLITGRLQSLQTYVTQQLIRAAEIRASANLAATKMSECVLGQSKRVDFCGKGYHLMSFPQSAPHGVVFLHVTYVPAQEKNFTTAPAICHDGKAHFPREGVFVSNGTHWFVTQRNFYEPQIITTHNTFVSGNCDVVIGIVNNTVYDPLQPELDSFKEELDKYFKNHTSPDVDLGDISGINASVVNIQKEIDRLNEVANNLNESLIDLQELGKYEQYIKWPWYIWLGFIAGLIAIVMVTIMLCCMTSCCSCLKGCCSCGSCCKFDEDDSEPVLKGVKLHYT\n>tr|A0A6B9
XTV0|A0A6B9XTV0_PICSI Uncharacterized protein OS=Picea sitchensis OX=3332 GN=orf05555 PE=4 SV=1\nMRCYGHWNVMVPHPAQQIFESHLLQVYTVFHNFYKLAAIEWGMPAIMNSPCLAIDFFLPVGEKTLHSADHTPLCGCNSLCHSYLFESRVSFFSYYSPQRAV\n>tr|A0A2A4QF02|A0A2A4QF02_9GAMM Uncharacterized protein OS=Gammaproteobacteria bacterium OX=1913989 GN=COB83_09745 PE=4 SV=1\nMLKIIVGFIIVIILTGGVVTPSIEWINKVFHVKNGGIYLSIAFFICYFFLLAFRLIKKK\n>tr|A0A418RSL3|A0A418RSL3_9GAMM Antitoxin OS=Methylococcales bacterium OX=2304002 GN=D0528_03225 PE=3 SV=1\nMINEVNTAVFQQNLGEMLNQVQYRHDSILIKEDGKPVAALVDAQLFDRIRRFKNRFDTLSNQIANAYESVPQEDGLNEIDAIVSEIRHSQF\n>tr|A0A510B6M8|A0A510B6M8_9POAL Photosystem II reaction center protein L OS=Avena longiglumis OX=4500 GN=psbL PE=3 SV=1\nMTQSNPNEQNVELNRTSLYWGLLLIFVLAVLFSNYFFN\n>tr|A0A2D5H536|A0A2D5H536_9PLAN Antibiotic biosynthesis monooxygenase OS=Gimesia sp. OX=2024833 GN=CME31_26170 PE=4 SV=1\nMFCLNVILTLKDAADAEEIQGLLTEACRLSRTEPGCLRFDVYQSEGEPATFVLVEHWESEDAWQTHREAEAYTQIYQPQILPRVERVPYRMKMLLE\n>tr|A0A7L7BQ76|A0A7L7BQ76_9ENTR Alpha/beta hydrolase OS=Enterobacter sp. 
RHB15-C17 OX=2742619 GN=HVX06_10740 PE=4 SV=1\nMFSKLAYSTLALTVSLGTVISCQAEATGTDFATAFDHPQQINAGDLNVGYVDIGPKNGQPIILLHGWPYDIHSYAQVAPALAAKGYRVIVPSLRGYGTTRFLSDKTPRNGQPSAMAKDVVNLMDALNIKQAVFAGYDWGARTADIVAALWPERVKSLVSVSGYLISSQQIGKQPLPPKAEVQWWYQFYFATERGAEGYAKNTHDFARLIWSQASPDWKFSDATFDASAKSLDNPDHVAVTLSNYRWRLGLEKGERKYDSYEQKLATLPNITVPTITIEGGNNGAPHPAPQAYAGKFTGKYEHRTFGKTVGHNPPQEDPQDFVNAVVDADKL\n>tr|A0A7N0VAI1|A0A7N0VAI1_KALFE Uncharacterized protein OS=Kalanchoe fedtschenkoi OX=63787 PE=4 SV=1\nMENAEAFEASTAPLSLHDFFERMRQPAAAEFVKAIKSFVVSFSNKAPNHERDSAAVQDFLSNMERAFREHPLWAGCSVEELDCAGEGLEKYVMTKLFTHVFASLPDDLEVDRQLSDKMALLQQFIRPENLDIKPNFRNEASWLANPPQLHSNLLYIQRYRHHPRLVAEYAYYFTNMLSVESFITNINAKALSMDETEFEMNMESARALNLGLSADTSDMSDQNEQNLENTSNKEAVEIKQGFSNFKTDHVTRPPPSVSKSGKIELRHTKAESSIRKIPSMSDLENKGAFMLLNENRLSRVFQEYPYLFSQVGDLTLDDVESLLNNYKQLVFKYVSLAKGKGSEPLPPPFISMSNSQSQRATPADAERESIEEPVAEKTNNRNEANSWTDEGSIEVSQVPELNSPDYKMPEVSSAQVEADHDHDNS\n>tr|A0A3N0D1M1|A0A3N0D1M1_9FLAO NAD-dependent epimerase/dehydratase family protein OS=Sinomicrobium pectinilyticum OX=1084421 GN=ED312_22910 PE=4 SV=1\nMKVALIGATGFVGTNILKELVDRGHKVTAIARNPERSEIKGYHVTPVKADVLDTDRLAEILAGHDAVVSAFNPGWANPNIYDDFLRGAKAIQEAVKKSGVSRFVVIGGGGSLYLKPGLQVVDTPEFPAEIKSGADAARLYLEEIRKEKVLDWVFFSPALEMHQGITTGRTGKYRLGLENPVFDKDGRSVLSGEDVGVVIADELETPKHHRERFTAAY\n>tr|A0A6P0AN79|A0A6P0AN79_RHILE Siderophore-interacting protein OS=Rhizobium leguminosarum OX=384 GN=GR232_16200 PE=4 SV=1\nMDNNQFKDQASSTPGIERIRHDTRRRLLTVESVVDITPSMRRVVLAGDDLADFISLGADDHIKIFVPVADGSEERRDYTPRRYDNIERRLTIDFALHEAGPVTKWAIDADPGDRLEIGGPRGSAVVSKTVKRWLLIGDETALPAIGRRIEESGAGTVVTTIAAVTGPLEEQTFETSAELHLHWAHRPLSQATSATALLKLLSTVDIQPETFIWVAAEASVTRDIRAYLLERGCPLGWIKASGYWVFGKADTTEKFG\n>tr|A0A7K4JQ10|A0A7K4JQ10_GEOCA GT252 galactosyltransferase (Fragment) OS=Geococcyx californianus OX=8947 GN=Colgalt2_1 PE=4 SV=1\nVATDHNVDNTTAILKEWLKNVQNLYHDVEWRPMEDPQSYPEEIGPKHWPSSRFTHVMKLRQAALRAAREKWSDYILFIDADNLLTNPETLNLMIAENKTLVAPMLESRSLYSNFWCGITPQA\n>tr|A0A673XYG3|A0A673XYG3_SALTR Gamma-tubulin complex component OS=Salmo trutta 
OX=8032 GN=LOC115201020 PE=3 SV=1\nMSEFRIHHDVNELLSLLHVRGGDGAEVFIDLLQKNRTPYITTTVSAHSAKVKIAEYSKTPEDFLRKYDELKSKNVRNLDPLVYLLSKLSEDKEVITYISHLITVLCYVPITFVCNRMPKKGLKRLLMRQQVQPLLSLQPSAEVTRKMLRDRHNKKNPTQPNPVFPNWVYDRPALIGDFITGATAAGDPEVAIGTMPLPAQEQALVDDLLFVLVGVDGRDITAQPVLGRQNRSFIVDPTLDMSIKELVNRILPVASYYSTITRFTEEKSSFEYGQVNHALTAAMRTLMKEYLILVTQLEHLHRQGMLSLQKLWFYIQPTMRTMEILASIASSVDKGDCMGGSTLSLLHDRTFNYTGDSQAQELCLYLTKAASVPYFEILEKWIYRGIIKDPYSEFMVEEHELQKEKIQEDYNDKYWDQRYTIVQHRIPSFLQKMADKILSTGKYLNVVRECGRDVTCPDAKEVLYTLKERAYVEQIEKSYYYASKVLLDFLMEEKELVARLRSIKHYFLMDKGDFFVHFMDLTEEELKKPVDDIVPPRLEALLELALRMSTANTDPFKDDLKIDLMPHDVITQLLRVLAIETKQEKAIINADPTEVALSGLEAFSFDYIVKWPLSLIINRKALTRYQMLFRHIFYCKHVERLLCNVWISNKTAKQYALHRAKWFATAFALRQRMLNFVQNIQYYMMFEVMEPTWHIMEKNLKSASNIDDVLCHHTSFLDNCLKDCMLTNPELLKIFSKLMSVCVMFTNCMQRFTQSMKLDREMNRLSLEHGTMEGPPTQSERTEEQEKKRLTSKFLAEHVDALQSDACFEATVSKFDSNFSTLLLDLLDKLSVYSTNDCEHSMINIIYRLDFNGFYTERLERMAIERSQKAAA\n>tr|A0A5S5C3J5|A0A5S5C3J5_9BACL Uncharacterized protein OS=Paenibacillus methanolicus OX=582686 GN=BCM02_107172 PE=4 SV=1\nMTESNYKNWPTDEHARWIRMGHFFGKTLMEEVKGHAKERIDPASSVEERLAAEKAIRDTLYGFMMLLDGVIDSPIDQDHGVEFALVARVFNQDTREYLEEIELAPDGDGLCMGIHMWEDGEFE\n>tr|M5BKI9|M5BKI9_THACB Septin homolog spn3 OS=Thanatephorus cucumeris (strain AG1-IB / isolate 7/3/14) OX=1108050 GN=BN14_01267 PE=3 SV=1\nMAYRHRGRKNAKKGIQFTLMVVGASGTGRTTFVNTLCESEVLAPKIADNAETAHVEEGIRIKPVNVELEEDGTRIALTIVDTPGFGDNIDNEFAFQEIVGYLERQYDDILAEQSRIKRNPRFRDNRVHALLYFIPPTGHALREMDIELMRRLSPRVNVIPVIGKADSLTPSELKGFKKRVMEDIEHYGIPVYNFPYDVEEDDEETIQDNSELRAMLPFAIVGSGDEVEIDGQPVRARIYPWGVVEVDNPKHSDFSRLRSALLNSHLMDLKSLTDDVLYETYRTEKLSRMVHADNTDDSILPEDLATQSVRLKEEQLRREEEKLREIELKVQREINEKRQELLAKEESLRNLETRLAAQGSQAEF\n>tr|A0A6P8KJN9|A0A6P8KJN9_DROMA synapse-associated protein of 47 kDa isoform X6 OS=Drosophila mauritiana OX=7226 GN=LOC117143185 PE=4 
SV=1\nMFSGLTNQFTSLVGAVKGGAGDEDVPAPTGDAPAAAPAASTSVEATASSAVDPEAAAAAGGEGLEGEEAGKSGWLGSAKGWLGNASIPSMPAMPSMPSMPAMPAMPSIPSIPGLRKGAGADGAEGAEGAVAGEGGAAASGAVSGGEDDDKSRYISATEGADSHPASGGGTPTGDEGQIGQGKGDEVKITTKVTQQAKHFGSFLSSAISKAGSKIKETVKDNTILDSFNKEQEAFIKGQGGVGNGAAPWIGHANEAKIKEEILGLSQDRRNFVRAPPAGVDFEFSYDTAYPTAIAIMAEDKALETMRFELVPKIITEENFWRNYFYRVSLIIQAAELGTLGADGVGQASSGEDANEVATKEKKSKTAQPAKGDSSVKAIAEQPKAVIEPEAQESDVQAAKSKAKAQAGKELGQKISESEFVSDDFQASSESDLAEIQDGMRKLGIDSMTQQALAPTDEEQWEKDLEAELKDYEVVDEGGTGGGGRRKGRKAGEDDTEADEDEPTISNLRTRSTNNDWEEYADLIEDTDDLKTLKCLKRTMLGYP\n>tr|A0A3S6F4D4|A0A3S6F4D4_YERET Fimbrial protein OS=Yersinia entomophaga OX=935293 GN=PL78_17300 PE=4 SV=1\nMNKTLLMALLFTLPGVALAATSNNTIKFQGEVAEQTCQVDINGSANTPIVLLPTVASASLSGPNSVAGKTNFTINLTGCNVASKETKISSVFQGMNVTPAGNLGNTGTAQFVAIQLLDSTDRPVILTSGPVEVPGITLATGATSASQDLSVQYISESGNAVAGSVMASAQYAITYP\n>tr|A0A2S1PWN1|A0A2S1PWN1_ORITS 56 kDa type specific antigen (Fragment) OS=Orientia tsutsugamushi OX=784 PE=4 SV=1\nGDRDFGIDIGNIPQAQAQAANPALNDDQRAASRIAWLYNCAGIDYRVTDPHNPIGPMVLIPTLLTIPKGNPNPAGNPPQRAHQPANFAILNHDLWRHLVVGLAALSNANKPSASPVKVLSDKITQIYSDIKPFADIAGIDVPDTSLPNSASV\n>tr|A0A126E925|A0A126E925_9RICK Uncharacterized protein OS=Rickettsia raoultii OX=369822 GN=UQ52_02815 PE=4 SV=1\nMNSTNQLQNNSLTNSWLKLGILSLGFAGLYSIILVVLRTPQLSSFFPNPHIFKSALIIHVNLSVLIWLLSVTASVWGGETSLRGEAKPRRGNLMKQYKIPEIAKFSTFARNDVFRLYPKLAFLATLLIAISPIAGHNPVMNNYIPMLENIVFILGLSLFGVTLLLYAINILYFFDWTNLNSLVNFTVLSTIIMFILSFVCFGWSYNGLQNIMQIIPIEIEFYYELLFWSGGHLLQFIYTQILIFIWVSLFRELIARELKFQKFYLFLLYLNFIFGILTLFGHIFYDIIDGAFKVFYTNHMKYLGGIAPVLCLIGMGVELVWVFVIPQLDREIQTKYQNNVIDLAIKLRDDTVTINDRVIKTILLCSITLFLLGGLIAMNITGINVAIPAHYHGSIVGISIACMGCSYLGIGRYQRHCERLKRAWQSHEVIQKLPRLPRRYFVPPRNDNIINFTFYLLTFGQILHILGLAFAGGYGVMRKDPNSVMPMSAKLLMGMMGGGGFIAIVGGLMFVYICVKVMFFKSIKLAHE\n>tr|A0A159KM53|A0A159KM53_9HEMI Cytochrome c oxidase subunit 1 (Fragment) OS=Corythucha sp. 
BOLD:AAG8847 OX=1793449 GN=COI PE=3 SV=1\nSWIIRXELSQPGPFIGNDQIYNVIVTAHAFIMIFFMVMPIMIGGFGNWLVPLMIGAPDMAFPRMNNMSFWLLPPSLTLLIMSSMVENGAGTGWTVYPPLSSNISHMGPSVDLAIFSLHLAGVSSILGAINFITTVINMRPSGMSLEKTPLFVWSVVITAVLLLLSLPVLAGAITMLLT\n>tr|A0A4U5P1N6|A0A4U5P1N6_STECR Uncharacterized protein OS=Steinernema carpocapsae OX=34508 GN=L596_013647 PE=4 SV=1\nMKQRKNALWEMQKLIDCLQSTKWLNVCCYLETDVTSFSINHVMVGPNLTLILDVCLLQVRYRYFDIRYRTAVYWKRNSCFSAFPTYFDKQK\n>tr|A0A3E4WUS6|A0A3E4WUS6_PHOVU Uncharacterized protein OS=Phocaeicola vulgatus OX=821 GN=DXC16_05095 PE=4 SV=1\nMDDKTGALEKLKAIMAKAEQVEMSSVKIGDIIYVPLDEEDGLILKDGYKDRNKYIVIIGFTPEGVAIGALLINSEIDSSKRSEELLDCQYPLMVRNYRDILDYDSWLDCSDIFELSKLKITEKNGKLKGCLISEDRERVMQFLRETEVFDNATKRRYGIIK\n>tr|A0A1R4HFW4|A0A1R4HFW4_9GAMM Secretion ATPase, PEP-CTERM locus subfamily OS=Crenothrix polyspora OX=360316 GN=CRENPOLYSF2_460006 PE=4 SV=1\nMYDGFYNLSKKPFQLNADSDFFFNSAVHKRALAYMRYGLTQGEGFVVVTGKPGTGKTMLVKELVNSLNSNDITIGIMVSSQVGADDLLKIISATFGLPYDGEDKATLLTRIERFFIQQAVDGKRVLMIVDEAQNLPKDSLEELRMLSNFEMSGKALFQTFLIGQLQLGETLFLPEMEQLRQRIVATYQLKPLEEEETKNYILFRLEKAGWQQTPQFEEEVFNAICAYTQGIPRRINTLCDRVLLFGYLDELSVIGLNAVNKVIADIEEEASIVTDEFHDVVALSASSNVSYSDGFSPQMEERIVALEKTVENLRNVLGRERALLRKAILIQLDMNEVYDDLGE\n>tr|A0A5D4XIW7|A0A5D4XIW7_9GAMM Integration host factor subunit beta OS=Luteimonas sp. XBU10 OX=1132694 GN=ihfB PE=3 SV=1\nMTKSELIEILTQRQAHLKADDVDLAVKSLLEMMAGSLAHGERIEIRGFGSFSLHFRPPRTGRNPKTGDAVALPGKHVPHFKPGKELRERVTAVIPLPAEE\n>tr|W7W772|W7W772_9BURK Transposase OS=Methylibium sp. 
T29-B OX=1437443 GN=Y694_04599 PE=3 SV=1\nMAMLAKIRRMHLRDGLSIREVARRTGLSRNTVRQWLREEGVTEPKYPERSTASVLDAWAEHLEAALRADAHRPVRERRTAKALFEQIRALGYAGSYPRVVVWVRRWRERQASAPRRAAFVPMSFELGDAFQFDWSCEYVFVGGLRRRLEVAHTKLAASRAFWLTAYPAQSHEMLFDAHARAFEALGGVPRRGIYDNMKTAVDKVGVGKARSVNARFQAMCSHYLFEPEFCNPASGWEKGVVEKNVQDRRRQVWREAGERRWSDLASLNAWLAERCRQGWEETAHPEWSELSVADVLQDERTRLMPCPKPFDGYVEQPVRVSATALVHFQRNRYSVPTRWVNEVLSLRAYPEAVVLVAEGVEVARHTRSFERELTFYDWQHYIALVQTKPGALRNGAPFKAMPEVLQTLQRHLLRHAGGDRVMAQVLAAVPVHGLEAVLVAAEIALEAGRPSAEHVLNVLARLKDGAPALRELTQPAPTLKEEPRADVQRYDSLREAQQP\n>tr|A0A6J6Q2H3|A0A6J6Q2H3_9ZZZZ Unannotated protein OS=freshwater metagenome OX=449393 GN=UFOPK2366_01453 PE=3 SV=1\nMFEWNEEQQMIRDAVRRFVDDEVRPHVEELEHGDLAPYDILRKLFATFGMDSMARDRFAKQIAREKSVAEMVARGETPPAPAAERSGGDGGGAAMSLIPIIELCRVCPGMVTAMGVSMGLTSAAIMSKGTIAQKERWALDLLTMDKVGAWAITEPGSGSDAFGSMRATARRDGDDYILNGSKTFITNGPYADTTVFICKLDDGGPIEQRKVVSFVLDRGIPGFVQSKRLRKMGMHSSPTGQLFLDDVRVGRDRLIGETEDQPAGGREGAKATFQQERSGVAAMALGIIEECLQLSVAYAKDRVQFGKPIGEFQLIQDKLARMEVARINVQNLVFRTIEMSAAGKTMSLAEASAMKLYSARAATEVALEAVQVFGGNGYMSEFRVEQLARDAKVLQIYAGTDEIQITHIAKELLRA\n>tr|A0A1X0ZA11|A0A1X0ZA11_PSEPU Hcp1 family type VI secretion system effector OS=Pseudomonas putida OX=303 GN=hcp PE=4 SV=1\nMPTPAYIAIEGKTQGNITKGAFTSDSVGNIFVEGHEDQILVQEVNHRITVPTDPQSGQPAGQRVHGPLIFTCALNKAVPLLYSALSSGEMLPNVELSWYRTSVEGTQERFFTTKLIDAVIIDIDLEMPHVQDKDNSNFTQFFKVSMAYRGIEWEHITASTAGADDWRKPKETAV\n>tr|A0A6I3MVR7|A0A6I3MVR7_9ACTN Uncharacterized protein (Fragment) OS=Actinobacteria bacterium OX=1883427 GN=F2940_05525 PE=4 SV=1\nMNTSPFRSVLIVCGVATFGLVACGAQESQPQPISFSLAASTRSASDVVGAPESSNSNSKIMAPNYSVEYVVDGKLADLGQEASSWRAQTNVVASDADLKKIATALGVKNTEVQTSSGDPYLSWYYSGAVSSEASSPPSVGMSDSDAETTAPDRTVVSPPVPENVPTKEEAQSIIQKMMAKMGVDVDDANIEINGDEYGIWATAWKTFDGMRSPMSWNIGLGANGAVTYAQGNFLKFDRGANYPVVNTTEAVKRLGNPRYSGWFGYGAVSSKEVLAKDSATIPSQEVVVQTIRLTKVSASLTPVIASDKTLWLLPSYEYLTSDGYTVSTLALDDKYIDQTPTSTVPDNDVNVTTPDAGSGSSGSSTGGTPAVDGGVVEPAPAPQTILPTEKDAKALVGLNEDEAVKIIEGNGWTYRIGSRDGEQFMLTEDYSASRLTLGIE\n>tr|A0A067Z5I4|A0A067Z5I4_GLUOY Uncharacterized 
protein OS=Gluconobacter oxydans DSM 3504 OX=1288313 GN=GLS_c18640 PE=4 SV=1\nMMTMNNEERDLIARFVARVGGGPQVTGPGQPPAAPLPPIDPEADRFIAENFQKYPEARYRITQMAVVQEAALAQAQNRIRQLEFQLQQAQQQLAQVQQSGGSKPGLFGGLFSGGNRPQQSAPPPGWGSQAAPPPNFMPQQQYAYPPGYQPGMFQRGGSGFLGSALTTAAGVAGGMMAANALEGLFSDHHGAGGDAAGGWGAGGDTIINNYGSDASASDPFGGAGTDAGSFSDSDFGGGGDAGGGGDFGGGDGGGGGFDDMF\n>tr|A0A4P7HFW9|A0A4P7HFW9_9NOCA 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase OS=Nocardia sp. CS682 OX=1047172 GN=ispF PE=3 SV=1\nMRVGIGSDVHPIEAGRPCWMAGLLFDGDDGCAGHSDGDVAAHALCDALLSAAGLGDVGAVFGTGRPEWAGVSGAAMLKEVRRLLDEAGFEIVNAAVQVIGNRPKIGPRRGEAQQVLGELLDAPVSVSGTTTDGLGLTGRGEGVAAIATALLQACR\n>tr|A0A5S4G1W4|A0A5S4G1W4_9ACTN HAMP domain-containing protein (Fragment) OS=Nonomuraea zeae OX=1642303 GN=ETD85_40700 PE=4 SV=1\nMSDPAVGTTRSAARTKRSRGPGEVGEPELRQLLAGLTAVRDGDFRTRLPDDADGLLGEIASVFNGMVDQLSLFTSEVTRVAREVGTDGRLGGQADVPAVSGTWKDLTESVNAMAGNLTDQVRSIAQVTTAVARGDLSQKITVHARGEILELKNTVNTMVDQLSSFADEVTRVAREVGTEGQLGGQADVKGVAGTWRALTDSVNFMAGNLTDQVRNISQVATAVARGDLSQSITVSARGEILELKNTLNTMVDQLSSFADEVTRVAREVGTEGNLGGQATVRGVSGTWKDLTENVNVMASNLTNQVRSIAQVATAVARGDLSQKITVEAKGEVAALAQTINTMVDTLGAFADEVTRVAREVGTEGQLGGQARVPNVAGTWKNLTDNVNSMADNLTNQVRSIAQVTTAVAKG\n>tr|X0VWK7|X0VWK7_9ZZZZ Uncharacterized protein (Fragment) OS=marine sediment metagenome OX=412755 GN=S01H1_51379 PE=4 SV=1\nMAYSLTFGDVAENHIGNQQIGSICHDGFTKAELLYAKTQFEVKGCTCELVELHKDV\n>tr|A0A439RUF8|A0A439RUF8_9HYPH PhzF family phenazine biosynthesis protein OS=Mesorhizobium sp. 
OX=1871066 GN=EOQ56_14750 PE=3 SV=1\nMLTRNYLLYDVFTTERLGGNPLAVVLDSKGLDTAAMQAIAGEFNLSETVFVLPPDNPKHRARIRIFTPDHEMPFAGHPTVGAAIALAEMAGDGDTAGIFVLEENIGPVRCAVSKHAGASFAEFDLAKLPEPLELSADPEAIGAALGLGPHEIGFENHRVSFWSAGVPYVTIPVADLEAAARIKLDNQAWSELAPRKSDWALASPYVYCRETVNHDSAFHVRMIVPGNPSYEDPATGSAAAAFAGAIMHFDGPREGVSQRWIEQGLEMGRPSRIRLELNVEGGKLAAARIGGHAVKVAEGKLFV\n>tr|A0A669NV56|A0A669NV56_PHACC Membrane associated guanylate kinase, WW and PDZ domain containing 2 OS=Phasianus colchicus OX=9054 PE=4 SV=1\nSKFRPHKEGEVPGVDYIFITVEDFMELEKSGALLESGTYEDNYYGTPKPPAEPAPLLVNVTDQILPGATPGAEGKRKRNKSVSNMEKTGIEPPEEEEEERPVVNGNDVTVTPESSEHEDKSTGVSGEVSSTQPCPAPGYTQPEEAKEDMDVTKQTKPEENDDLGPLPDNWEMAYTEKGEVYFIDHNTKTTSWLDPRLAKKAKPPEECKENELPYGWEKIDDPIYGTYYVDHINRRTQFENPVLEAKRKLQQHNMPNAELGTKPMQAQGFREKPLFTRDASQLKGTFLSTTLKKSNMGFGFTIIGGDEPDEFLQVKSVIPDGPAAQDGKMETGDVIVYINEVCVLGHTHADVVKLFQSVPIGQSVNLVLCRGYPLPFDPEDPANSMVPPLAVMERPPVVVNGRHNYETYLEYISRTSQSVPDVTDRPPHSLHSIPADSQLDSTFPPPAHDDNVSMASSGATQAELMTLTIVKGAQGFGFTIADSPTGQRVKQILDIQGCPGLCEGDLIVEINQQNVQNLSHAEVVDILKECPVGSETSLIIHRGGFFSPWKTPKPVMERWENQGSPQTSLSAPAMPQNIPYPPTLHRSSFPDSTEAFDPRKPDPYELYEKSRAIYESRRPDYKELDVHLRRMESGFGFRILGGDEPGQPILIGAVIAMGSADRDGRLHPGDELVYVDGIPVAGKTHRYVIDLMHNAARNGQVNLTVRRKVLPTGEPCPENGRSPGSVSTHHSSPRSDYATYANSNHAVSSSNATPPEGFTSHSLQTSDVVIHRKENEGFGFVIISSLNRPESGSTITVPHKIGRIIDGSPADRCAKLKVGDRILAVNGQSIINMPHADIVKLIKDAGLSVTLRIIPQEELNSPASAPSSEKQSPLAQQHSPLAQQHPLAQQQSPVTQHSPVAQPTLPQPLQLQGHENSYRSEVKARQDVKPDIRQPPFTDYRQSSTDYRQPPLDYRHPPVMDYQQPPPLDYRQPPLLDYRQHSPDTRQYPLSDYRQPQDFDYFTVDLEKGAKGFGFSIRGGREYKMDLFVLRLAEDGPAIRNGRMRVGDQIIEINGESTRDMTHARAIELIKSGGRRVRLLLKRGTGQVPEYDEPSSWSAPAATSPGLQEVALSLDDIISPLSSSHIAPPSDPSHQISPEPTWDIKREHDGRKPKELSVNGHKKKRLGEQRERSASPKKADRSKHDEPSWKGYSEGKTKVTDGGRLTSESRAVGHSVMMEAGAREHVCAGSSDEQFGRKGHLHPISTRSTNTTVRKATVSPGPWKIPGSDKLPGVLKSGTSAMSR\n>tr|A0A516QZI1|A0A516QZI1_9BACI Octanoyl-[GcvH]:protein N-octanoyltransferase OS=Bacillus sp. 
BD59S OX=2499213 GN=lipL PE=3 SV=1\nMSNSRSILSQPEWRIVDQSSLGPTFHALQSFAMDDTLCTSIGNGQSAATMRSWVHHNTIVLGIQDSRLPHLEEGISFLKENNFNVIVRNSGGLAVVLDEGVLNVSLLFQETEKGIDIDLGYDTMWHLIQEMLKDYDVTIEAKEIIGSYCPGSYDLSIRDQKFAGISQRRIRGGVAVQIYLCATGSGSERAALVRDFYNLAIQGEETRFTYPEIVPSTMASLSELLGETITVQDLMMRLLKTLQQFAPKLTPSQLTIDEIPLYETNLQRIIDRNNKALGLEK\n>tr|A0A7C4ETP5|A0A7C4ETP5_9DELT Uncharacterized protein OS=Desulfomonile tiedjei OX=2358 GN=ENV54_02205 PE=4 SV=1\nMLIHDKKTFGLGLLLFITFLIVLGIMFSPFFSGENALKASDKLFNSIAKGSTYYIPDLLKKAQAMGGAKFEATIKLKSDELAQKAQKVLTASGSQVSAAGAQLNVKGALGDVLSAALKDSDSMFHNRDSEVAQRYGFSGREALFVWWSLLKEVEKELTRQSKFKDAAFVSTVVKKGVEVGYNFFGIAPESALSKAGILTFALVFYVVYTLWWGIAILFLFEGLGLEMKAGAKKEV\n>tr|A0A0Q7FUL9|A0A0Q7FUL9_9GAMM 3'-5' exonuclease OS=Acinetobacter sp. Root1280 OX=1736444 GN=ASC84_16360 PE=4 SV=1\nMRLPVLVFDIETLTDLKSGAHLYGLDLPQDDLEQALAKLRRQESGMDFQRLALHEIVCISGLWIDENGVMKLFSFSREHYTETEILQKFLSIFDKRHPTLVSWNGSQFDLPVILFRAMYHGLSAPSLFDQGEIDTQKRYNNYQNRYHNRHVDLMDVMAMFNGRHFQKLDDVAHLLGYPGKRGISGYFVPEYVNTQQWLKLTSYCEGDVLNTWLIFLRWALLKGQISLQDHRLWIQASIHYLQGQTQQHEFLNVWRETSQRTEFTQADFSSTPD\n>tr|A0A5K1MIC2|A0A5K1MIC2_ACIBA Uncharacterized protein OS=Acinetobacter baumannii NIPH 615 OX=1217641 GN=F978_03533 PE=4 SV=1\nMKIKEMPKIKVRNQVALSPLLHKGGMHETEKPRAQHRRNRQDTKQQLKKGVW\n>tr|A0A7L3CZ56|A0A7L3CZ56_PLUSO MX protein (Fragment) OS=Pluvianellus socialis OX=227228 GN=Mx PE=3 
SV=1\nQGEEHTLYNQYEEKIRPCIDLIDSLRALGIEKDLALPSIAVIGDQSSGKSSVLEALSGIALPRGNGVVTRCPLELKLKRIPATQAWKGKMCYRNSSVELQDASEVEKAIREAQNVVAGTRGAISGELISLEIWSPEVPDLTLIDLPGIARVAVGDQPKDIGEQIKMLLKKIIGCKETLNLVVVPCNVDIATTEALKMAQEVDPSGERTLGILTKPDLVDRGTEESIVNIIRNLVVPLKKGYMIVKCRGQQDIHDKLALTAAIQQERRFFENHKYFSLLLDEGKATIPCLAEKLTNELVRHIIKTLPTLENQVREVLQKTLQDLQKYRRGTPRTESERLIFLTDLIKLFNQDISQMMRGEEQLYGNEVRLFTKIRREFRTWEVTLLESAAKVKNNVPSKVWKYEDQYRGREFPGFNNYRTFEDIIKEQIIELEEPAVEIMSNVIGLVEEKFMEVTKRHFANFHNLNRAAKTRIEHIREKQAEEAERHIRTQFKMERIVYCQDDAYINDLQSVKQEGATKAGNEKGLLVGSVSNQETSFVQEMGASKRLCNQIPLIILSSALHDFGDQLQTTMLHLLQEKDKLSHLLQEDSEAAKQRTYLSQRVNRLTKACQYLRDFTLV\n>tr|A0A1H2WI61|A0A1H2WI61_9ALTE Ribonucleoside-diphosphate reductase OS=Marinobacter mobilis OX=488533 GN=SAMN04487960_104173 PE=3 SV=1\nMSTAALAEPQSPASSLQVIKRNGTLVSFDPAKITVAVTKAFLAVEGDQVSGSARIHDSVARVTEQVVQAISRRLKAGGKVHIEDIQDQVELALMRAEEQKVARAYVLYREAHAQERASRAAPVEAHPSLTVKQRNGQVAPLDLGLMKFQVEQACGGVDGVDAAAVVNEALKGLYDGIPEADVLSALVMTARGRIEQEPGYSQVTARLLLEQLRMEAAGALALPLQASLPSVYPQALTAFVHAGIRYELLDEALAAFDLERLGAALKPERDGQFGFLGLQTLYDRYFLHWQGARLELPQVFFMRVAMGLALREDDPNARAIEFYNLLSSFDYMASTPTLFNSGTRHSQLSSCYLTTVGDDLEEIYGAIRDNALLSKWAGGLGNDWTPVRALGSHIKGTNGNSQGVVPFLKVVNDTAVAVNQGGKRKGAVCAYLESWHLDIEEFLELRKNTGDERRRTHDMNTANWVPDLLIERMRRDQDWTLFSPSDVPDLHDLYGNDFRTRYEEYEARAARGELPLHKTVPAKQLWRKMLTVLFETGHPWITFKDPCNLRSPQQHVGVVHSSNLCTEITLNTSAEEIAVCNLGSVNLAAHINGGELDVQRLERTVNTAVRMLDNVIDINFYAVPQARESNLRHRPVGMGLMGFQDALYQLKLAYSSPEAVEFADLAMEQISYFAIRASAELAAERGAYPTYEGSLWDQGILPIDSIQLLADARQDGDLSVNTEARLDWTPVRELVAKHGMRNSNVMAIAPTATISNIVGVSQSIEPAYQNLFVKSNLSGEFTVVNPSLVAELKAEGLWDNVMVNDLKYFDGSVQQIERIPAEIKARYATAFEMDARWLVEAGARRQKWLDQAQSLNLYMAEPSGKKLDALYQLAWERGLKTTYYLRSLGATGAEKSAPVQAAPAPQVCSIDNPDCEACQ\n>tr|W6TAY6|W6TAY6_9LACO Terminase OS=Lactobacillus fabifermentans T30PCM01 OX=1400520 GN=LFAB_00210 PE=4 
SV=1\nMIEYVDQVLSGQVLAGQKIKWACERFKRDLSRSKDDSFPFYYDEDKAAQAVKFIELMPKTDGSQLTMQPFQKWIISELYGWREKTTGNRRYDRAFISMARKNGKTYLASGMAANGLLRERQPARNRQVLFVSNALKQAKLGYDMLSSGLRQVRKQSKYMRQRIKVQKQAITDLETDSQALALASDTSTLDGYAGTTVILDEWHEAKDRKVYNVLKSGQAQEDNSLLAVISTSGLNLNVPMHAEYDMLTDVLKGKTEADRYFVAIWELDDREEVYDQANWIKANPLFSEPHVKQRMTEKIKADVDLAIKQNNLIPILVKNFNMWLQASEDSYISADDWAAGKLAKVPDLHNRDAYIGIDLSKSNDLTAVSWLVPIGNGQFYCDSHSFVGTKYGLDSKIKRDGIDYRSMERAGECSITRLDSGVIDYDELFDYVQNLVGKYNWKVKAIAYDPYNAQTLITKFEKLSYPLFEVRQGTKTLNIPTRNFRDQLYDDKIKHNGNKILAYAVNNAILKVLNNGWQLDKARNSNRIDPIAALINAFVAGMDYYQESEAQQHAEDYYKTATAADLF\n>tr|C5LGB5|C5LGB5_PERM5 Subtilisin OS=Perkinsus marinus (strain ATCC 50983 / TXsc) OX=423536 GN=Pmar_PMAR016847 PE=4 SV=1\nMPSRVDYDLRNRRIDEKESKIEEILLTGSNGDNDDDAMEHKDNDIVIIKLEACIIDSFVDGEGDGAVIVAVIDSGIDYTHPDLVDNIWINKDEIPGSDNIDNDANGFIDDIYGWNFVHNTNNIMDDNGHGTHIGGIIGAKGSNNIGATGIAWDVAIMPLKFLNADGIGRVSDAMRALDYAIQMGATISQNSWTCHKCDDTTTTNYNAIKMAIQKAGNAHGSINFYATPVDIKNAIMNSVDTDPNLEMKCLSSGILNAYRALNTVIHNNNKNKKKKNDHLHKSKTSSSVINIIISTTTTMNDDYICGDAFCNKYVGSVMTVSDE\n>tr|A0A2E9Q7Q3|A0A2E9Q7Q3_9SPIO Aspartate transcarbamylase OS=Spirochaetaceae bacterium OX=1898206 GN=CMN76_04620 PE=3 SV=1\nMFDQSKIHPLLKQPVVSRDGIRGIERPRHLLESIPEDAEPLRSLAGMHIVSARQFDRNKILQLGRLAASYETQPDLIHPPLRGKILVSAFYEPSTRTRLSFESAWHRLGGDIMSITDPNTTGIAKGESLADVGEMFNNYGDVVVLRDSSEDSVYAMLDSLRIPIINAGNGIDEHPTQALADIYAMLKWRPDFGSGNLSEEEKITIGVIGTPNRMRTVRSLLLLLSLFSDSIKKVYIVNPASDVLDKEQDEELRAAGLKLEVVHKLRDILPEIDVVYINSIAWVGDSYETLTGDIKLTSESQLKQGAIILHPLARGEELDESLDGTSHNWYFSQARGAVFIRMALLTCLVHRINLVVDSPVEQPDSN\n>tr|A0A520KE24|A0A520KE24_9ARCH Uncharacterized protein OS=Candidatus Verstraetearchaeota archaeon OX=2250257 GN=DSO09_03215 PE=4 SV=1\nMKKSRIIPIMSIIFTLLLILIIIINQVQWQNHEYYYELRRTIGLPSIAIGTNYEGTRNPLLDIFVRALYDVPGGHDYVVSSSFIDTPLKLKDFFERIPGFNMTVMREGK\n>tr|C4NUU6|C4NUU6_ECOLX Aminoglycoside O-phosphotransferase APH(6)-Id OS=Escherichia coli OX=562 GN=strB PE=4 
SV=1\nMPPVFPAHWHVSQPVLIADTFSSLVWKVSLPDGTPAIVKGLKPIEDIADELRGADYLVWRNGRGAVRLLGRENNLMLLEYAGERMLSHIVAEHGDYQATEIAAELMAKLYAASEEPLPSALLPIRDRFAALFQRARDDQNAGCQTDYVHAAIIADQMMSNASELRGLHGDLHHENIMFSSRGWLVIDPVGLVGEVGFGAANMFYDPADRDDLCLDPRRIAQMADAFSRALDVDPRRLLDQAYAYGCLSAAWNADGEEEQRDLAIAAAIKQVRQTSY\n>tr|A0A1Q7EW51|A0A1Q7EW51_9CHLR DUF218 domain-containing protein OS=Chloroflexi bacterium 13_1_40CM_68_21 OX=1805084 GN=AUH33_06650 PE=4 SV=1\nMTNDDGDLAEFPEVAVVLGGGMSASGVPSPSTAARAHAASQLAHHRPSLAVIASGSHGDDPAPAKSEAAVMADLISKAGVPRERIFLEERSRDTIGNGVEVAARYLAKIEPRPLYLVTSPFHLERALVVFRNVLGFAWQVQAVAAEQTDDDLARANSETTFLQETFAFFEGIRPGDFPAVEKRYRARQVR\n>tr|A0A519RZM3|A0A519RZM3_9SPHI Ankyrin repeat domain-containing protein (Fragment) OS=Pedobacter sp. OX=1411316 GN=EOO86_13990 PE=4 SV=1\nMNIYQIEQAYIQGKSLDEIKELYQSEIVGITDEQQVEVWEQVCGFANVEMIDYLIAQGWRTAGVENRNGDTLLHFLATPLHSYDYFISEKRVFECTKKLLEAKVSPLRKNSEGNTALMLGAKVAYTEMLEAYAEIGAKIDFTDRKGNTTLHILAEYSYSAVSDFETALERLMIHQRESNFDENNQRQVQVRHELEWRHNVTKARFNQFITFAIVAREFGIDPFQKNNEGQTAVDIAIYRKSKSIGAILKGVDFDDQERASLYFNAGGMDVHQACVHKDVEALTALITLGENLNEAYDKENDKHNGMTPLAIAMMEHSYEITDLLLKNGADATLRDSKSWHPFRYLFTPNSSVNVNFERFKEKTFQRILKAYID\n>tr|A0A429HFY5|A0A429HFY5_9ACTN YceI domain-containing protein OS=Streptomyces sp. 
WAC 05379 OX=2203207 GN=DMH26_27780 PE=4 SV=1\nMGLTARIRTRDGWAVSHAVVTVTDMTGTQVLRLEADTEGAVRDADPLAPGAYTVIVTAVGYAPAAASAIVTASGRAEVGTVTLARQGGTELPPPGPWTVDPAHSSVAAVAQHLGISSVHGRFTRFSGAIEIAPDDIAKSRVDAVIRADSIDTGNGMRDGHLKSPDFLDVERYPEITYRSTGLTAAAGTDRWTVHGELTMHGVLRPVDLDLAYLGTGADPWGGTRAAFRATTELHRDDFAMNYNQVVQAGIAAIGTTLKVELDIQAVQGETLPQA\n>tr|A0A7K9HDP6|A0A7K9HDP6_9AVES NCF2 factor (Fragment) OS=Bucco capensis OX=135168 GN=Ncf2 PE=3 SV=1\nMSLVETIQLWQEGVCAADRKEWRAALDAFTAVQNPPAKICFNIGCIHLVLGKLAEAEQAFTRSISCDKHLAVAYFQRGIVFYQRQNHEKAIEDFKEALTQLRGNHLIDYKILGLRYRLFACEILYNIALVYATMEDWKKAEEHLALAVNMKSEPQHNKIDRAMEAILKQKVCELVTISAGKLFRPNEKQVAQLEKKDYLGKAMVVASVVDKDDFSGFAPLQPRASGPPPRPKTPEILRALQGQPHRVLYEFIPETAEELQVLPGNIVFVLKKEKDNWATVMFNGKKGIIPCNFLEPVELQNKLHIQEETPLEDEIPESPHSTAPEKPRRPAPVYHLQVVEAAVTSPYILKVHYNYTVTLQVKPGLSYMELLDLVCKKLELQPEHTQLRYKPVESQALVTLSMENLDVAWSQSKGNCLTVWCEITEGEGFLLPQEATLEMGPTQVVAQYSYEATQPEDLEFQAGDVILVLSKVNEDWLEGQCNGKIGIFPSAFVQ\n>tr|A0A368E3B5|A0A368E3B5_9PROT SDR family NAD(P)-dependent oxidoreductase OS=SAR116 cluster bacterium OX=2024888 GN=DBW67_07180 PE=4 SV=1\nMFRYDNKIVVVTGCGSIAAGIGNGRAMAMAFARQGAKVIGTDRNLEAANQTLEMVHQEGGLMEVVGLDSLDDMSVLAFFEDVLAREERIDVLVNNVGQSEPGGPYDMALETWRGQFALNIDTAFMAIKHVLPSMRARKNGAIINVSSVAGMRYIGKPQVGYAAAKAALVQMTKTTAIIEAPHNIRLNCVVPGLMHTPLVQVLAQKYAGGDTEAFVAKRNNQVPMGRMGDAWDVAHAAIYLGSDEASYVTGTELVVDGGITATTP\n>tr|A0A7L4KQA5|A0A7L4KQA5_9CORV Kinesin-like protein (Fragment) OS=Callaeas wilsoni OX=1347786 GN=Kif2c PE=3 
SV=1\nAMDSRLCRNVHPGVIIKIQRSNGSIHKATVKVVNVEHSCVTVEWSEDGATKGKEVDINDVIAINPELLELPPADVKENVPLQDNVTLQKQKRRTTLSKIPAPREAVRGRSRMSAITESQCSFQEDEMAVDPCTSLQTRKYLLLPAGRTRASGLGCVPEASLSSVNGNTENHLPAARTSSSESPVRRRSNIVKEMEKMRSKREEKRAQISEIRIKRAQEYDSTCPNWEFARMIKEFRETLNCQPISISDPIEEHRICVCVRKRPLNRQELLKKECDVVTVPSKCVLMVHEPKQKVDLTKYLETQTFRFDFSFDETSSNEMVYRFTARPLVETIFEGGKATCFAYGQTGSGKTHTMGGDFSGRTQNASKGIYAFASQDVFLLLNQPRYRSQNLEVYVTFFEIYNGKVFDLLNKKAKLRVLEDGKQQVQVVGLQERPVGCAEDVIKMITIGSACRTSGQTFANASSSRSHACFQIILRRRGQMIGKFSLVDLAGNERGADTSSADRQTRMEGAEINKSLLALKECIRALGQNKSHTPFRESKLTQVLRDSFIGANSRTCMIAMISPGMSSCEYTLNTLRYADRVKELSPHDGGIDAQSQMETEEIETSTEGSGLQFSFSKDEEEELSPHIFSYREVMTQISEREEKVVEQLKELRQRMITELDYLLGMAEKPDYDLETFVSRAKYFVEDSSRNFLSVRETLDALGTAMQLEEQASKQIS\n>tr|A0A2D9JC90|A0A2D9JC90_9BACT Protein translocase subunit SecA OS=Rhodopirellula sp. OX=2024855 GN=secA PE=3 SV=1\nMSESSARETTNPNELDSSGVPLSSSSTEETGPDPXWTPPDPVLSEATALDPLAPNEPLEDAGNXVETTQEAVVRRSSDPSANKKKWTKASNWRPRMVRWQRXLARVNALESTLQAEDDQTIRKRSLALRYRAMAGEKLSEXLPEAYAXCREAGRRSLSMRHYDVQILGGIALFEGHXTEMQTGEGKTXTATLPLYLHSXVGKGAHLATVNDYLAKRDAEWMMPLFEMLGVSVGIIQTEDDQGGRRKSYGAAITYGTAKEFGFDFLRDRLXLRAQNRMQTEMLGSGDGGFSNSGDQVVMRGMHFXLVDEADSILIDXARTPLIIGSIEDTVRDQIIETYKWAAENAPXFELDEHFEIDDETKRYELTARGRSXVRALPKSDLVRTMGLVDMYEYIERSXKTHREFLLNRQYVIRPSEKDPNVDEIVIVDEFTGRLAEGRKWRDGIHQSIEAKEGVEXSVPTGQAARITVQDLFLRYPHLAGMTGTAATSAGELRKIYRTPVVRVPTNRPPQRIQLPSRVFGTLNSKFEAIAKEVEEXHATGRPVLVGTRSIXKSVLLSKLLDDLGXEHEVLNANXVERXAEIVAEAGGRGKVTVATNMAGRGTDIKLSNDVEQIGGMHVICTXLXXAARXDRQLIGRCGRQGDRGSYRQYLSLDDDILKGGYGAIKYEKLKKRGEATSGSVDRLAAMFHKAQRKVERRHFRDRMVLMHHEKERKXMQREXGQXPYXDTPD\n>tr|A0A256Z8B1|A0A256Z8B1_9ARCH Uncharacterized protein (Fragment) OS=Candidatus Bathyarchaeota archaeon ex4484_231 OX=2012512 GN=B6U79_02805 PE=4 SV=1\nMNKKLRLLSVFLLLLASFSPVVQAEASCTGSVRRWYSFRELAWGDMNSWADVDGNWVKDEQEIISPCILVSVTFGRGRVICIGDEGFLSNVLVNEADNLRLGLNIIAWLAEAEGNRHRVLFDSAHNEMQDIGSGDPWRGYSIFAGKLRKAGYTVEKNTA\n>tr|A0A4Q8BRW3|A0A4Q8BRW3_9ACTN Xaa-Pro aminopeptidase OS=Streptomyces sp. 
CNZ288 OX=2512147 GN=EV377_6800 PE=4 SV=1\nMDKPLARPHTGSHDLDVSAALHTFMGSAWAPSPLPSGVRVPGYDALAGRRARLSARFPGERLVLPAGELKVRSNDCDHRFRPHSAYAWLTGLTGEDQAGHVLVLEPAGAEGHEAALYVRPRSDRSTDEFYRDRRYGEFWVGRRPDLGEAAELTGLACRDLDDLAKLTAGPRPPARVLAGVDARTDGLFDRGPHSAAEPDRDAELGTYLAELRLLKDEWEVGQLQLAVDHTAAGFEDVVRALPAALRHPRGERWIEGVFQTRARAEGNGTGYETIAASGAHACVLHWIRNDGPLDPGHLLLLDAGVETDTLYTADVTRTLPLSGRFSRIQRQVYELVLAAQNAGIAALRPGARFRDFHRAAMAVIAEGLYDWGVLRITPEEALAPDSGLYRRYTLCSSGHMLGLDVHDCAKARASQYLDGVLEAGQVLTVEPGLYLQPDDETLPPELRGIGVRIEDDLVVTEDGARLMSDALPRDPDAVEEWMGTLLDGFRPGA\n>tr|A0A068CJ75|A0A068CJ75_9PLVG Protease (Fragment) OS=Human immunodeficiency virus OX=12721 GN=pol PE=3 SV=1\nPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEINLPGRWKPKMIGGIGGFIKVRQYDQVPIEICGYKVIGTVLIGDTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKQKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLGWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYSGIKVRQLCKLLRGTKALTE\n>tr|A0A2Y9SHQ2|A0A2Y9SHQ2_PHYMC Fibroblast growth factor receptor OS=Physeter macrocephalus OX=9755 GN=FGFR3 PE=3 SV=1\nMGAPACALAFFVAVAVVMTGAVSGSPGMEQRVVRRAAEVPGPEPGPRELVFGSGDTVELSCPLPAGAPPGPAVWVKDGVALAPSDRILVGPRRLRVFNASHEDAGAYSCRQRPSQGVLCRFAVRVTDAPSSGDDEEGEDEAEDTAGAPYWTRPERMDKKLLAVPAANTVRFRCPAAGNPTPSISWLKNGKEFRGEHRIGGIKLRHQQWSLVMESVVPSDRGNYTCVVENKFGSIRQTYTLDVLERSPHRPILQAGLPANQTAVLGSDVEFHCKVYSDAQPHIQWLKHVEVNGSKVGPDGTPYVTVLKSWISESVEADARLRLANVSERDGGEYLCRASNFIGVAEKAFWLRVHGPQAAEEELVEAGEAGSVYAGVLSYGVGFLLFILVVAAVTLCRLRSPPKKGLGSPTVHKVSRFPLKRQVSLESSSSMSSNTPLVRIARLSSGEGPALANVSELELPADPKWELSRARLTLGKPLGEGCFGQVVMAEAIGIDKDRAAKPVTVAVKMLKDDATDKDLSDLVSEMEMMKMIGKHKNIINLLGACTQGGPLYVLVEYAAKGNLREYLRARRPPGTDYSFDACRLPEEQLTFKDLVSCAYQVARGMEYLASQKCIHRDLAARNVLVTEDNVMKIADFGLARDVHNLDYYKKTTNGRLPVKWMAPEALFDRVYTHQSDVWSFGVLLWEIFTLGGSPYPGIPVEELFKLLKEGHRMDKPANCTHDLYMIMRECWHAVPSQRPTFKQLVEDLDRVLTVTSTDEYLDLSVPFEQYSPGGQDTPSSGSSGDDSVFAHDLLPPAPPGSGGSRT\n>tr|A0A0R1W6U3|A0A0R1W6U3_9LACO 
CDF family cation diffusion facilitator OS=Lactobacillus suebicus DSM 5007 = KCTC 3549 OX=1423807 GN=FD16_GL000874 PE=4 SV=1\nMGGVFSGSLALLSDAFHNLGDSAAILLGYFAQLIGRHPETERRTYGYRRAEIIFALLNSIFLIVISVFLIFEAAKRFSHPQPINGELMLIVAVVGLLANLASAFLLQGGSKDSLNIKATYLHILSDALSSVGVIIGALFIWFTDISWIDPVITILVAIYICYETWPIIHQTLSILMQSSPELDYACIKKDIKQIDGITGVHHVHAWMIDEHRIIFSVHINLKDMKLSEVEPIYQRIETLLKNKYHICHITIQAEVERGIEETMFNTPADKATTSDEVE\n>tr|A0A0B1R8M8|A0A0B1R8M8_9GAMM DUF262 domain-containing protein OS=Pantoea rodasii OX=1076549 GN=QU24_03595 PE=4 SV=1\nMANDDKTLNLFPIDYPFETLCSRMESNPVKLKLNPDFQRKYKWDQDGWQRSSKFIESCLMRIPLPSCYFAEENDGNHIVIDGVQRLTTIQKFFNDEFSLEGMTTFKELEGKKFSELGSLRSELESTTIRCIVLRKENPKALIREIFSRLNQGAVKLSDQEIRHALYPGGFDDLLNELGGIEAIKNFGLAETTTVKRDSREPDEQVLRFFAFYDDGFAEHFNNTLKDFLDDQMETFSTLEEDRLNEMREIFKSSLQKCEKIFGDDTFTNPTVRRKRKGLVHYDILMPTIGKLSDEVVNDKAENIRQAWEDLCSSNEFKRTLSGGLQNKSSVIRRRDSWTKLLKEVTDGKD\n>tr|A0A3E4PQR0|A0A3E4PQR0_9FIRM DUF3794 domain-containing protein OS=Dorea formicigenerans OX=39486 GN=DXC93_09950 PE=4 SV=1\nMLNIYRQGKTFTDQFYVDEDYNVPDTKADIREVIESDAVMEEIDLKLVENYIRITGRLAFQVLYVADNSDNTLSSLEGKIPFEEMYYVDETLEETLFLKAAQTELTVNLIHSRKINVKAMAEVTMSSDSQVSEEVTTGIESGEQIYTKYQEKQILTLHTVKKDTYRIKEQLTISGTKESIGNILWKEVLSRRLDTRLEADTLKLQGELLVFCLYESVDGKTDWICENVPYEGQVECFGAEEGMYHQIYPILTDALLEPAMDEDGEMRLLGIEATLSMRFFLCTEEKIQILDDLYSLKTCCVPAYTQCKVENVLMQNHSKCKIAERLSLPEIKDDILQICYSDARIQVEQMTVQDTGIQIEGVLHIRFMYVRPDDQIPFALWQGMIPFSWLLESNEVQEDMTLDMMPSLEQLGISLLGNGEIEVKAVLAFRSFLRGKVTFRNIDSVEEKEIDYKVLEQRPGIIGYIVKEGDELWNLAKYYGTTKEGIMDINHMESEQLKCGDKLLIFKENASIL\n>tr|A0A285F1R0|A0A285F1R0_9PSED 3-oxoacyl-[acyl-carrier protein] reductase OS=Pseudomonas sp. 
LAMO17WK12:I10 OX=1286371 GN=SAMN05660489_00338 PE=4 SV=1\nMTESILVTGSSRGIGRAIALRLAQAGYDLILHCRSGRSEAEAVQAEVEALGRQARILQFDVTDRASCKAVLEADVEAHGAYYGVVLNAGLTRDGAFPALSEDDWDTVLRTNLDGFYNVLHPLIMPMIRRRAAGRIVCIASVSGQVGNRGQVNYSASKAGLIGAAKALAIELGKRKITVNCVAPGLIDTAMLDENVPVDELLKMIPAQRMGTPEEVAGAVNFLMSAEAAYITRQVLAVNGGLV\n>tr|A0A1B9FWL6|A0A1B9FWL6_9TREE Nuclear RNA export factor 1/2 OS=Kwoniella bestiolae CBS 10118 OX=1296100 GN=I302_07512 PE=3 SV=1\nMAPGTSNSNNNNSRGGRPTRGSNNARNPTGTPPIVKQLQTISGKAEREHSKSELTKKLHGEEMKEWIRKRVIADGVLDMSNLPNDPWLKENGILPPGHPNAPPNAGTVFWRIIEGVVQKGAGITVLTLSLANNNLEHLAQLSKLPLTLPDIRALDLSGNPIKNIGELDNLRAAGEKKGKATSGAGSLKSLVEIKLNDCFFRERMLQQPDGPNIYKHDILRRFPGLRILDGVELERIILPIDRKPKVRLTDEQKAAFVAKPFAFPCDVQGGFSEEGVKEAAMQFCAKYFTLFDNDRNALIPGYAPNALISISANTLPSRSAYQVEAQKTRANRPQPVSFEAWTNLPSRNFFRGITTIRARMDSLHNPADAERLLRWWNKVVPRTKHPLSDPERWCFDTWVLDGEGENTKLCLMIQGEFEEMPSGTYRSFSRTFILSPAPPGSLAANAGWPAIALSDTMTVHSYLGTFAFDERNRSLATHGVTIQPPSLPATAPVNGAATGNDALIAQMSQQTRMNAQFSTMCLEQNGWNFEAALKNFEEIKGSIPPEAFV\n>tr|A0A1Q6Z6P7|A0A1Q6Z6P7_9ARCH Uncharacterized protein OS=archaeon 13_2_20CM_2_53_6 OX=1805020 GN=AUI07_07525 PE=4 SV=1\nMKKSSDPADMVLREIEEMGKKSFIPSIGPLKGRILADIVREHKPRLILEVGALYGYSAILIAKNSPAHAQITTVEKDPKNARITQENVARAGLDDMIEVIQGDAIIILPELPGPFDLVFLDAEKIQYLAYLKAIEAKLHQGSVIVADNVGVFRDQMMDYLNYVRTTGRYRSRTVETLLEFSETTKDAMEISEKRY\n>tr|A0A7Z6L1Z8|A0A7Z6L1Z8_9NOCA Low molecular weight phosphatase family protein OS=Rhodococcus sp. 
AQ5-07 OX=2054902 GN=CVN56_03915 PE=3 SV=1\nMHVLFVCTGNICRSPTGERLARAYAAEAGVSGFTASSAGTRAMVGHPIEPTAARVLAGLGGDPTEFQARRMTTALASDADLILTMTESQRDKVLAMAPARLKRTFTLREAARLGSLADARTVEDLAAARPRFRAAEPEDVMDPMGKEENVFHEIGLEIADLLGPLLSRLRFGER\n>tr|A0A5T8G289|A0A5T8G289_SALER Phage terminase large subunit family protein (Fragment) OS=Salmonella enterica OX=28901 GN=DQ454_26965 PE=4 SV=1\nPPTTGILSLYNRGDRRRWYWPCPHCGEYFQPSMENMTGYRDSADPMVASEAARLQCPHCHKLTEPQQKRELNNRGVWLREGQHIDRDGNITGEARRSRIASFWMEGPAAAYQTWAQLVYKLLTAEEEYERTGSEETLKAVINTDWGLPYQSRRSLEARSSDALMARAEDVSKRTVPDGVRFIVATVDVQGGKKRRFVVQMVGYGAYGERWIIDRYNIRYSLRVNENGESQPVNPAAMPEDWDLLRTDVLDKEYPLAGDPEQFMPVLAMAVDSGGEDGVTDNAYAFWRRCKRRGVAGRVYLFKGDSTRREKLITKTYPDNTERSDRKAKARGQVPLYLLQTNALKDRIAAALEREEPGANYIHFPDWLGPWFYEELTYEERGADGKWKKPGRGNNEALDLMCYAHALVIIRKYEQINWEKPPGWARLPEKGAAKTTQPVGARRQEQHEGGEKAVKARKKKILPAWGGGSGGGWL\n>tr|W9B5Y0|W9B5Y0_9BACI 3'-5' exonuclease DinG OS=Oceanobacillus picturae OX=171693 GN=dinG_1 PE=3 SV=1\nMERFVVIDLETTGHSAVKRDKIIEVGIVVIEENEVVDSYGTFLNPGKSIPEFISSLTGIRDEDVKDAPTFEERAEEIAALFEDSYLIAHNVPFDMGFINAEFAAVGRELLQNPVLDTVELARVLYPKAPSYKLGQLAEYLGIHHEDPHRALSDAYVTAKLFLKLRERLDNLPYETITHLIRLEKMLKSDLFALLADRENELAFSTQEDPELETFQGLAFKKIKETKNTPQTRIGSYGDFLDAIYEEGGTLSQQMARYEKRTGQREMSETIYDAFQSRRHALIEAETGTGKSLAYILPAIYDAVISGQRLVISTFTTQLQTQLLEEEIPLIRNLLPFPFKVALLKGKSHYISLEKFERELLSTEKDNYDITLTKAMILVWLTETQTGDIDEVQLPSSGYLFFRRVSTDTEAHVDPQSPWFLRSYYQKARKAAQQADIVITNHALLATDIFNDYQLLPSYDKVIIDEAHHFEETASKHYGLKLDYMNMQYTLNQIGETNDPKFIGQLITKYRDFIEEEMIDRWDDLIIDAKYETDDLFRGIFQYVAEQNKHQKSLSDIGRTQYRFENSKEDTAKWDTILEMTNRLMFFLRDLIYILARLDQNLAKQYEDKYDKNEVEQYIEQLQQYMDHLESLFLAADSPKFVKWVEVETYGAKNAVYLYSEPTDISGFLSTDFFAKKESVILTSATLTMKNSFTFIKERLGLTDEEIETKKIPSPFSYKDQVQLMIPTDFPDIKHGNQDDFIYATCEAIFSLAEITSGRMLVLFTSYDMLKKSYYLLKEIMDTSTYALIAQGISSGSRSRLKKNFQTFDQSILLGTSSFWEGVDIPGEDLSSLVIVRLPFQPPDHPIFEAKSANLKENGKNAFMELSLPNAVIRFKQGFGRLIRSNTDRGIVFVCDSRIIQARYGKYFLDSIPEIPLTKDTTQQLMRKAEEWF\n>tr|A0A0D3HJS1|A0A0D3HJS1_9ORYZ Uncharacterized protein OS=Oryza barthii OX=65489 PE=4 
SV=1\nMATKATTALLLLAAAAAALLCHVHVAVAAADSEPCDPSDITIATVKTGRVVGGLPEFQVTIGNECSCPEGDVVLSCLDGVPAGVDRSKIHTAGNDGLCLVNDGLQIVKGSPVVFTYAASAPISLAFDNASPRCQR\n>tr|A0A481QYF4|A0A481QYF4_9PSED Pilus assembly protein PilO OS=Pseudomonas sp. DTU12.3 OX=2073078 GN=C2E19_18930 PE=4 SV=1\nMRIPRLIVHEYLQGLGIPGLAGLALLLIAVAWALGGLLPGWQSLQHLSQQTQEATEYLAKVEDGSIAPPVVPQRQLDDFRNKLPAQPQATVAIDRIYALAAQEHITLARGEYALGVDPKTHLARYQILLPVRGSYPQLRRFVHALLGQLPAVVVEDLELQRKKIGDTDLNGRIRLTLFLSRS\n>tr|A0A412E108|A0A412E108_BACSE Transposase OS=Bacteroides stercoris OX=46506 GN=DWY58_15645 PE=4 SV=1\nMEPSIKDKYIILGFIFVAICMISFFITIIIAASFNQDNFVRLIVFVCSNLLGWLLYLSFQTVIFDTYEIYRIKFGKKEMKEITTETVALQEEEPQNTIEPVTQIAEGASSDAHPIELNIDPKRHEEIRSSYKDEQDKENERRIRMVVEYIHFYMPRIADEETVNHVCNEVSNWMNKNNYKPKPIKRRLTQDISNIPLRHFIWNIAERCMYKRYYNGDNRARFVKELFPREFSETDIATIKNFKVDPLKSPIPIDEPEDGKPDFHYPNGYLRKE\n>tr|A0A448JZC9|A0A448JZC9_PASAE Membrane-fusion protein OS=Pasteurella aerogenes OX=749 GN=acrA PE=3 SV=1\nMTKKRFFLLFIVIVALAAGYFYYGNKNDKTITYLTETVQRGNLQKTVIATGTIRAYNRVEVGAQVSGKIEKIYVTLGQKVKTGDLIAQIDSSTQQNTLDTATAKLASYQAQLKAKKVAYSVAKSSYDRLAKLYAKKSVSLDEFESAKDTLATAEAAIEEIDASIKQAEIEVNDAKTNLGYTKIVAPIDATIISIPVSEGQTVNANQTTPTIVQVADLSKVLIKPEISEGDITKVTAGMEVKFSTLSDPDKIYRATIDSVDPAMTTLTDNEYTESVSDTNAVYYYANVVVENPDNNLRIGMTTQNTITIADVKNTLLIPTMTLKKQNNKVFVNVLTTANQVEQREVQIGLNDDMNTQILSGLNEGEKVVSSQVAAGETVGTVRGPKMF\n>tr|A0A1T0CT31|A0A1T0CT31_9GAMM Pilus assembly protein OS=Moraxella pluranimalium OX=470453 GN=B0680_01190 PE=4 SV=1\nMTVQKGFTLIEMLVVLAIIAVMAMVAIPAYHAMMQRFESQSSKRHIAEAIRRAKIEANLHQKDIILCPYGVNEQCDRLGQVGLLVFVDKNSNNRLDDADIVSMKQPLDLRYGLLSMRVSLGRHYIKFMSDNAKPRGHIGNIRYCNTEQNNSLSHLTTINMHGVVTAKSGDVVSIDCG\n>tr|F8J9Q9|F8J9Q9_HYPSM DNA (cytosine-5-)-methyltransferase OS=Hyphomicrobium sp. 
(strain MC1) OX=717785 GN=HYPMC_1709 PE=4 SV=1\nMEKLKLLDLFSGIGGFSLGLEASGYFEPVAFCEIDTFPQSVLARRFVGVPIYGDIRALTAERLRADGIMVDAICGGFPCQDISVVVLDPFGGSGTTALAAETTERKWILIERDEEYAEKAMARIRDHVLGESHPAPAKKKRTPAALPKPTHEIAQVSLF\n>tr|A0A1U8LF61|A0A1U8LF61_GOSHI tubby-like F-box protein 5 isoform X1 OS=Gossypium hirsutum OX=3635 GN=LOC107926834 PE=3 SV=1\nMIQMSLKSIMRELKELKDGIGNMSKRGDQSKLWRSRTRSHVAPDEAPLESQLSEQSPWANLPPELLLDIIQRVEESETAWPARAVVVFCAAVCRSWREITKEIVKTPEQCGRLTFPISLKQPGPRESPIQCYIRRDRTSSTFLLFYGLVPSEGESDKLLLAARKVRRATCTDFVISLVADDFSRASNTYVGKLRSNFLGTKFTVYDSQSPCDSRIQSTARPRRRFHSKQVSPRLPACNYIIGTVTYELNVLRTRGPRRMHCILHSIPVSAIQEGGTAPTPSALPQSLDEQLSPLHSSKGKEPIVDIISPSIQATPVFSPGSREPLALKNKAPRWHEQLQCWCLNFKGRVTVASVKNFQLVAAVEPSHNVSPEEQEKVVLQFGKIGKDIFTMDYRYPLSAFQAFAISLSCFDTKPACE\n>tr|A0A212IWF4|A0A212IWF4_9BACT Chaperone protein htpG OS=uncultured Dysgonomonas sp. OX=206096 GN=htpG PE=3 SV=1\nMQQNGKIGVTTENIFPIIKKFLYSDHEIFLRELVSNAVDASQKLKTYASLGEFKGELGNLSVKVKIDKDNGTLTISDNGIGMTNEEIDKYINQIAFSSANEFLDKYKKDANSIIGHFGLGFYSSFMVSKKVEIITRSFKEGAEAVKWSCDGSPKYTIEAVEKAERGTDIILYIDDENKNFLEQGEIDKLLKKYCRFLPVPIVFGKKTEWKDGKSVETEEDNVINDTNPLWTRKPADLKDEDYKKFYQELYPFSDEPMFWIHLNVDYPFKLTGVLYFPQIKSNVDMNRNKIQLYSNQVFVTDSVEGIVPEFLTLMHGVLDSPDIPLNVSRSYLQSDQNVKKISNHITKKVADRLEEIFKNDRSRFEEKWDSLKIFIEYGMLTDDKFYERAQKICLLKNTDAKAFTFEEYKTLISSDQTDKDGNLIYLYASNKDEQYFYINTAKDKGYDVILFDGQLDVHMAGMLEQKFEKSKFVRVDADTIDNLIPKEDSKEVNLTDKQKEELNEAFTSQLPKIEKTEFIIDYKALDEKAQPIQITQNEFMRRMKEMSAMQTGMGFYGEMPNSFNLVLNIEHPLIKKIMGDIDNKDKEAVNLYATENRDIRQLIDLALLSNGMLKGEALNNFVKRNMENI\n>tr|A0A1F0KNA7|A0A1F0KNA7_9MICC Long-chain fatty acid--CoA ligase OS=Rothia sp. 
HMSC066H02 OX=1739503 GN=HMPREF2999_09040 PE=4 SV=1\nMKVFSTPAEVLVDPSLNLTSIVERHRADSSNPVLYRRQMSPGNWQPVRAQQFHQMVTDLAKGMIASGIRPGDRVGIMSRTRFEWTVIDFAIWYAGAISVPVYETNAPAQAAWALAHSEATAIFVEDEKLLARIAEAEEFASTTQEPMQLKHRWVIENGDLDTLSTRASEVSDEQLEQVRSAAGCDDLATIVYTSGTTGRPKGCALTHGHFLNLSANTRLVEPEIANSRNSSILFLPLAHVLARLIQVLALDAGLVIGHSPNIKNLASDLDSFKPTMLLVVPRVFEKVYEGAMAKAAKGGKFNKSLFERSTDIAVRWSQAKVEGRVPLKLAAQYALYDKLVYSKLRAALGGELRYAVSGGGPLGERLAHFFHAVGVQVVEGYGLTETCAPIAVGRINPYQIGMLGPLIPGAEGYIAEDGELLVRGVGVISSYYKNPEEDAHAFTEDGWFRTGDLARFDERGYLKIVGRKKEIIVTAGGKNVIPGIAEGHLRTSPLVSQAMLVGDEKPFISALVTLDPDTLPEQLEHLGLPRSLSIPEAAVHPAVRAAIQKLVDEANQLVSRAEGIREFRIMNRDLTEEDGYLTPSQKLRRAKILQDFSSYVDEMYGKVSDSTSDSLARLQEYAAEQSEKFAELREQAAERLHEYADQQTERLAELREQAAEKFEELREQAVERMQKPQEDKTETKEDAERSEKTNDDSEHETATPAKGVEAKKADTQRSEGEDS\n>tr|A0A370IAZ5|A0A370IAZ5_9NOCA Uncharacterized protein OS=Nocardia pseudobrasiliensis OX=45979 GN=DFR76_102294 PE=4 SV=1\nMKIALVGILAGLGLLTAAPAHAAALTPDYAQPPNGAGVDPGHNLTPVWSPIQVPALDDVDTASTTTITAHPYLAPWAHERVPIPAGTAVELRGAARVRIPEANGKTLVVNPNGHCYFDGPNAVSGDLTPTALTPVRIDTSAFQLTIEPTLYRH\n>tr|A0A5K3FDK5|A0A5K3FDK5_9CEST Uncharacterized protein OS=Mesocestoides corti OX=53468 PE=4 SV=1\nMDSVWLLLCTIAKLVFTIIWLMLVVIFRTGKCAVRTAAWVIVKCARFVGIRRKRIHFALMGETQGLVEETTGPIAPWRLVREGLDPEKYRGNYPVLRTHVPPVTTPQPRLVCRSFRATGTGRQVRGRPGAGEIVLRGSTKYRSFAALH\n>tr|A0A4U1DEZ0|A0A4U1DEZ0_9BACI Uncharacterized protein OS=Bacillus kyonggiensis OX=1037680 GN=FA727_10130 PE=4 SV=1\nMQTLERKGAGGVVVNPNRDKFLKEQRDLKQQYLGGARDNRTEMKSDPEYNNKNDTDISVGATGREVEEE\n>tr|A0D4D9|A0D4D9_PARTE PUM-HD domain-containing protein OS=Paramecium tetraurelia OX=5888 GN=GSPATT00013372001 PE=4 SV=1\nMKSQIVNNQRYYSCQDEDGNSTRMLRNSNNSVRILTDIQLPQQMSKSTQDAYEKGESEMKNNIFDNVIKENIIGFSIDIYNHYIIQCILEKGLSEHKSYVLRQVVENMDLFCYRKYAYKIVQACLTQFQNNQIIQYIIDNIKRLQFDQYGNLIISTLLDTIQNDEQFAQIINKLQIDKIKYHQYGCVILINMVTCPKANHVGPIINKLIQESIQLSKSQFSNYIIQKMLKERTIEQNKVLINEFLIPNFVELSCNKFGSNVCEIMVTKSLAYQLQNLWNLVIKQYDFYLFQESEITFEQ\n>tr|A0A1S1CB24|A0A1S1CB24_9MICC Uncharacterized protein OS=Rothia sp. 
HMSC061D12 OX=1715161 GN=HMPREF2682_07995 PE=4 SV=1\nMQYKARKHYETYYQKIAEAEKDPAVVKGENADGKTYILEKDKLAMVVGKNNEYIIFHQHDGNWSRLRPNGELELTYSDRAWVRVMPDGERIAVKASGNTNIAYHQGDVSEDIITSLKTPEVPAQVEGFASVPQKPVKPKKLGTVVGTK\n>tr|A0A1Q4EHA6|A0A1Q4EHA6_9PROT Carrier domain-containing protein OS=Thiobacillus sp. 0-1251 OX=1895858 GN=BGP19_06145 PE=4 SV=1\nMDTRQTLADIAIKEFQCDPEKIKEDASIKDLGIDSLGLLEFIFRIEEVFAIRVDNEDAEKVQTLTDIANLVDRLRTMAAA\n>tr|Q48M18|Q48M18_PSE14 Type III effector HrpK1 OS=Pseudomonas savastanoi pv. phaseolicola (strain 1448A / Race 6) OX=264730 GN=hrpK1 PE=4 SV=1\nMRISSSPSPALGSIVNQPTSGELAAETPLAKVSLTQSSAGGDQAFVQFGQANDNTSFFSDAEQSGSSLMSLLTRSSNSESTSSVDQDSDQVSPITSVLSTASASPAASASGPANAPSATDAAFLDNSEYSSPEALKRWDPMVAHLPPEEREQAAKELNRPIAAAWMAREHGPNADKAMAFINANPALKTAVDVGKDGGNADGKITNKDLKAFAKNMEKAADNADKDLAKYMEDNPGADPQSLEMVRSAAVMRANMPLATAADPHHAVGAPDKTDVDGNVSAEGLKALIKSNPGLSGTLKQSSNMWSQAGFLSQVDEAGLTGRKKAAHSPDQVFDASNMSEWIRKSAPKNGGQFASMLSDAATLNSVAGIDISKLNAQVFEKPKAYTGAQKAAVMIKLQQTQQSVIAGRDLRNTEKTEAGLNERIAQLQADPDVQEYLNKSIPEQERSLVSSDSALQKAVTEQVQNVNSGKALQTDLATADKAVGKHNPDPDYSGAITGLSAQLQLQKDLFPDAQVPTAQQVFNNQPDEVQTKIADSYVRNFSEGGALKQLLGQKKSDAGESLQTADNQKAAYESVLPADFVNGERESYTASTLSELQNSKKGRKLLEGKTDEEGGPSLAAQLAEQGIGGKAFNSVMGFASVSDRLASGDKLGAAQSIIDSSRLGAEAIKGGIDTGAKMMGREASAGLGRLGGQMIGRAVGLVAGEATGLAAGAALGAAIPVIGWAIDGAMALGFGISAIIDAVKKHKAQKAFDHNVDPVLDQFGIAKAH\n>tr|A0A7C6ZKE3|A0A7C6ZKE3_9FIRM Ribulose-phosphate 3-epimerase OS=Syntrophaceticus sp. 
OX=2699755 GN=rpe PE=3 SV=1\nMQIKIAPSILTADFSKLGDVVKELEKCGADQLHLDIMDGHFVPNLTFGPPVVASLSQITSLPFDVHLMVEHPEGLFSAFATAGAKSLTVHAEACTHLHRTVQMIKDLGIRAGVALNPATPLSFVEYILPDLDIVLIMTVNPGWGGQAFITTMCEKIRKLRMMLKDSGSPAELQVDGGINQQTVKSVVEAGANSLVIGSALLMERDWGQAIEQYRSLAVEAARDSWWCSS\n>tr|A0A089X985|A0A089X985_STRGA Uncharacterized protein OS=Streptomyces glaucescens OX=1907 GN=SGLAU_22790 PE=4 SV=1\nMSATPKSQLPVRGGDRKPARVRPYSLTGGRTRFGHVLLVETFVASTAALEAPEERRELTNGSLTTRVMPEMLAIVELCRRMRTVAEIAALLKMPLGVVRVLLSDLADQGKIRVYGTGTGHGTGRPNRALLERVLSGLRRL\n>tr|A0A849PEY0|A0A849PEY0_9MICO Acetyl-CoA C-acetyltransferase OS=Calidifontibacter sp. DB2511S OX=2732509 GN=HK411_11245 PE=4 SV=1\nMPEAVIVSTARTPIGRAFKGSLKDIRPDDLAAQIVQAALAKVPGLDPTLVEDLYLGCAEPWAEQGSNMARVVAVLSGLDHVPAATVNRFCASSVQTIRMAAHAIKAGEGDVFISGGVECVSRYADFAGAGGSKADWQNPKFADAIKRTEQIAQDNTTWTDPREQGLLPDIYIAMGQTAENVATSRGISRQRQDEWGVSSQNRAEKAIADGFFEREITPVTLPDGSTVSKDDGPRAGVTLEKVSQLQPVFRENGTVTAGNCCPLNDGAAAVVVMSDTKAKELGLTPLARVVSTGVSALSPEIMGLGPVEASKQALARAGMTINDMDLYEINEAFAAQVLPSADDLGMDFDKLNVHGGAIALGHPFGSTGARITTTLLNGLQSTDGTFGLETMCVGGGQGMAIIYERLS\n>tr|A0A415DY63|A0A415DY63_9FIRM Amino acid permease OS=Emergencia timonensis OX=1776384 GN=DW099_13175 PE=4 SV=1\nMDTKKHEGSFKKAIGPFSGISIVAGMVIGSGVYYLGSYVLERTGLSMGWSLVAWIVGGFITIVGGLCFAELGASMPVAGGQTVYLSKAYSPAFGFINGFSCFLLTGSGGVAALAMAAVTAYRTVFEISDIMVKVLAIAIILVLMVINLLGVREMTFYQNFSMVIRMVPILMIIIAGFVMGKESPDLSLSLAGTSAEGGGVTAVISMIGFATFASLWAYDGWYNLNTVAEEMKNPKKDLPFAIITSLIGVTLIYVLFYLAVYKVLPSEDIAEMINSGNLYLGNEVVSRTLGGTGIWILLICMTIGIVGSANVNTLCDPRTYYAMAKEGYFPKLFGHLSEKHGVPSYGIIVSAGMAVLLVIFNSLQELTDMLIFTTSILNLMTIYGVLIMRKKYPDIERPYKVWGGKFTIYLTSLMYVVLMVNEFIDAPKAAITGVGITVAGLIVYLYFKKKNGGEEYKGEGIE\n>tr|A5I032|A5I032_CLOBH Putative non-heme chloroperoxidase OS=Clostridium botulinum (strain Hall / ATCC 3502 / NCTC 13319 / Type A) OX=441771 GN=CBO0840 PE=4 
SV=1\nMGYYIRVEPNVKIYVEDLNPEGNKTIVFLHGWPGSHNLFEYQFNQLPKMGYRCVGIDTRGFGNSDKPWSGYGYDRLSDDVRCVVEALKLHDFTLLGHSTGGAMAIRYMARHKGHGVSKLALIDAAAPSLIKRPNFPYGLEKEDVIKIIQGTYNDRPKMLRDFGDTFFFQHITEPFSDWFFQLGLQAASWATAAIANTWINEVLFSDLETINVPTLIIHGIHDKVVPFELGEIQNKMIKHSKLIPFKYSGHGSFYDQRDKFNKELVKFIEE\n>tr|A0A3D2U5H6|A0A3D2U5H6_9PLAN Tagaturonate/fructuronate epimerase OS=Planctomycetaceae bacterium OX=2026779 GN=uxaE PE=3 SV=1\nMTDIPGPCQTLGTIPSFGFGDRIGLATPGHVLAMQRSGQGILPIFPQQSIREMARTDRSPDDVMNDALTGMREAGWDGITGADADHLKTNTDAEITAEAGYTFFTIDPSDHVDEKADTYDEATLRERFAEIQHDLTWLGDYRGRKLTLETGARIECTEQACLRAGVKYGRAINHAIELAGHIAAVQGQAGRDYEIELSVDETDHPTTLAEHYIIADRCLVDGIRLISLAPRFVGDFEKGVDFKGDLEQLVRSLADHAALARHLGPYKLSLHSGSDKLAMYAMLAQATRGCYHVKTAGTSYLEALRVAARHDVSLFREVIEFSRGRFEIDRATYHLSATIDSAPPAEEISDPIELERLYLGLWSEVPVGEGFTGLGRQILHCTFGSVLTDSRLGPRLRSLLETHQDTYTEVLADHFGRHLDALQAGLSQSG\n>tr|R7KQJ7|R7KQJ7_9BURK 50S ribosomal protein L11 OS=Sutterella sp. CAG:521 OX=1262977 GN=rplK PE=3 SV=1\nMAKKIVGYIKLQVPAGKANPSPPIGPALGQRGLNIMEFCKAFNARTQGVEPGLPIPVVITAYADKSFTFIMKTPPATILIKKAAKIQKGSSRPHTDKVGKITRAQAEEIAKTKMPDLTAADMDAAVRTIAGSARSMGITVEGL\n>tr|A0A2G9V0G2|A0A2G9V0G2_TELCI Uncharacterized protein OS=Teladorsagia circumcincta OX=45464 GN=TELCIR_02714 PE=4 SV=1\nMHDIFDVVARIHVKWVRVVARTCSLILMVLDVMKPLKHKQLLEYELEGFGIRLNKQPPNIGFKKKDKGGINLTQLISLAELGSLEEEHFCFDVPTKALMNQMGETVLRITSKGHAADGVASTKSQRNTSANAAGLRKKV\n>tr|A0A4Y1VGS1|A0A4Y1VGS1_BACUN Protein kinase domain-containing protein OS=Bacteroides uniformis OX=820 GN=Bun01g_11110 PE=3 
SV=1\nMFTLAKRQQLGNYIITFQVKEGDYAETYRVKDADGKNRFLKLINCAKLHRTQFDANGNILEVQIAKTLNHPNVVKYHDNGEVVLDGRKFAYIVFDYISGETASQYIAREGSLSVYDAKTIVLGILNGIKFLHTQQEPIMHNDLTIQNVMLDMSKGTNVPRIIDFGYARYLSQGSSSFNKNGLSPFYLAPEALNGVFSVKSDIFSSGAILYNLIFGIPPYFVDLSDCKNDATAQREKIDAQRELPLHIPDNDKFELDEQIMNIMRKALASDIEERFKSADEFIRALNGDIKIARIDNQKKAKSGKTPTKKVSYSVPKGKGFSAIAGMEELKEQMRVEVIDALNSPEEYAKYGLTIPNGMLLYGPPGCGKTFFAKHFAEEVGFNFMLIKPSSLKSRFVNATQENIAQMFKDAEENAPTIIFIDEMNELVPNRDSDVHEMARSAVNEMLAQMDRTGERGVFIIGATNYPDMIDPAILRAGRLDKKYYIGTPDFKARSLMFELYLKSRPYDFGLDYEKLAQLTENYVSADLEMIVNDASRIALRQKSRITMVILEDVISKTKPSLTKSELDKYLRIKAAMAGEQIQQSRRRIGF\n>tr|A0A3L6ZV02|A0A3L6ZV02_9MICO Multicopper oxidase family protein OS=Mycetocola manganoxydans OX=699879 GN=D9V29_08490 PE=4 SV=1\nMPNSISLRQQLSRRTFLSAGLSGAALLALAGCTPTPAFLSPTSARVAKTEAARKATGATTKVALRASTGAIDLAGTSAQTWSFGSIPAPIIRLAQGDELDATIQNTLPDATTVHWHGLALRNDMDGVPNLTQDAIAAGSSFRYRFTAPHPGTYWFHPHVGTQIDRGLYGALIIEDPREPLAYDDEWVVILDDWLDGVTATPEEVLAELSKGMKEMAGMEGMMMRMGNTLMGAESDALGGDAGDVYYPHYLINGRPPADPETYTSAPGKRVRIRMINAGGDTAFRVALAGHTLTVTHTDGFPVEPLDVDSVLVGMGERYDVIVTLGDGAFAFVAEAEGKNARAFAVVRTGSGATPASNVTVSEITGRLATADGLRAASEVVLPNKKPDRELTIRLRGSMKKYDWSLDGRPFTMDDPMIKPYSIAEGERVRVNFVNTTSMWHPMHLHGHTFQHAGGGPRKDTSIVLPDRTLTVDFDADNPGRWLAHCHNIYHGEVGMMGVFAYTG\n>tr|A0A817XL60|A0A817XL60_9BILA Hypothetical protein OS=Rotaria sp. Silwood1 OX=2762511 GN=BAC187_LOCUS7404 PE=4 SV=1\nMAYLNLASAANSTTSSTSSPYSHVNSNGGVSTIPPSLVSNSPSIFGSVGGGKQWTTIGQPTSSSSSSTLTQQLLMKQQQNILNNQQTNPLSSSSSSSHFDSILGLTMASALASSSQTQIEKNFELQQEDFPPLPHRSNSHEPTSSSTNVQPLYQSQYSSSSSSSNLHQPITNGYSSSQQQQQQQQHSQSQSPISFKTSIDALSTLINRRQTSVNNKTTSLTNNSTSSTTNPQQISSTSTTNINGLPSSTITDQYGLVGLLQMIQQAEKNPETSTLLNYDLTTLGLSMESQNDLYPSFLSPFSDSQARPYEIDYQVPFEYQMGLQIRDKLPPLNFNTLNEDTLFFLFYLFGNDHVQLLAAAELYRRDWRYHKEERIWLTRIKNIMPDQKYDTYETGVYCVFDVQLWRKTHKSMRIDYEKLDVNPVLKQDLFASKLLQQQSPVQPQFAPVSSYNTNSSR\n>tr|H6QSH4|H6QSH4_PUCGT Uncharacterized protein OS=Puccinia graminis f. sp. 
tritici (strain CRL 75-36-700-3 / race SCCL) OX=418459 GN=PGTG_11407 PE=4 SV=1\nMAGSLSLILLCLQVVSTVLGNSDPSAQIHRRSPQKPSKPPVSNTKANAKPVPFGFGSKVTGGGNAAPQTPKDPAELEAWLNDPAPRVILISKTYDFTSPNITKTSGW\n>tr|A0A2U8VWI3|A0A2U8VWI3_9HYPH Uncharacterized protein OS=Methylobacterium sp. 17Sr1-43 OX=2202828 GN=DK427_22560 PE=4 SV=1\nMEHVSEGDPQAGPAFGRTASLLAEIAVILRVDPVIFFDGEIRKRVDQDLAVDELADLLALLRSVDGPDLRAAARDLIRALKRNEADED\n>tr|A0A0B7NY01|A0A0B7NY01_PROFF Uncharacterized protein OS=Propionibacterium freudenreichii subsp. freudenreichii OX=66712 GN=PFCIRM138_07065 PE=4 SV=1\nMTEAKNPWLSHPAEPEPDTPVAIEEHVRPATGPVAPQRGVPAPDRADQLPLFDRRQNADVWWLGVHGGAGESSLSVVLPGSAAADHGWPQTPGEQPARVVLVARSNMRGLRAAQAAATQWASGLVPGVDVLGLVIVADAPGRLPRPLRDFAHLVGGGVPRTWTVPWIESWRLGEPPALSDAPREVRRLVDELHALIRPGADGTTN\n>tr|D7SV11|D7SV11_VITVI Uncharacterized protein OS=Vitis vinifera OX=29760 GN=VIT_04s0008g06260 PE=4 SV=1\nMVGLSVGEKHFIQGGIAQDLRTDGRRRLTYRPFNVETGVIPQANGSARVRLGGTDVIASVKAELGKPSPSQPDKGKVNIYVDCSPTAAPMFEGRGGEELSTELSGALQHCLLGGKSGAGAGIDLSSLVVVEGKVCWDLYIDGLVVSSDGNLLDALGAAIKAALTNTGIPKVEVAVGASGDGLPEVDISDDEYLQFDTSGVPVIVTLTKVGRHYIVDATLEEESQMSSAVSVSVSGQGRICGLIKRGGAGLDPSVILDMISVAKHVSEQLMNKLDSEISAAEAFEEES\n>tr|A0A352XE32|A0A352XE32_9CYAN Phosphoenolpyruvate carboxykinase (ATP) OS=Cyanobacteria bacterium UBA11367 OX=2055774 GN=pckA PE=3 SV=1\nMNQQNYAVESQRRNLHQAHQTSSPVHEQIERHSYTLGSLGMKNLGMVYHNLSVPQLIEKAVARGEGVFADNGALCVKTGKYTGRSPSDKFIVDEPSIHDEVDWNRVNVPLTQEKFDQLYRRMLAYVQGRDLFIFDGYVGADPQYRLSVRVINQLACQNLFAHQIFIRPTEEELQTHEPELTIIAVPGLQGDPDLDGINSEAFIVISFEKRIVLIGGSHYAGEIKKSAFSFMNYLMTKQGVLPMHCAANMDDDGNTALFFGLSGTGKTSLSADTTRHLIGDDEHGWSDRGVFNFEGGCYAKTLHLSHENEPQIWEAIHFGAVLENVILDEETREPDYDDESLTQNTRVAYPVEYIPNCAIPGIGSHPKTVIFLTADAFGVLPPIAKLTNSQAIYHFISGYTSKLAGTERGITEPQATFSCCFGKPFLPLCADVYGEMLYERLVKHNVDVYLVNTGWTGGSYGVGKRIAIQDSRAMVAAALNGELNRVRFYPDPIFKILVPEAVPGVDSDILDPRKTWSDSEAYEQQAQALAKKFVANFQQFNNVSQEIKQAGPSLD\n>tr|G5ZW58|G5ZW58_9PROT Putative phytoene/ squalene synthase OS=SAR116 cluster alpha proteobacterium HIMB100 OX=909943 GN=HIMB100_00002480 PE=4 
SV=1\nMRPMKLSAYSDLRRHAPRLALTLLFQTEEQKQILAFLLLFGLELDRISALASEPMLALIRLKWWEDQLEVKTDEAGPLAGYLHQQLSSAHLKKADVIKLIDLWTMSVQAGQADQSENWAELIDLMAAKVNVQSSELARQIGRAVALSRSGQPSGVIPSARDIHKACGQGAEFLICLAYLAAESQKRDLNSSPFLVLGLLKQVLFKPASR\n>tr|A0A183VZ29|A0A183VZ29_TRIRE Uncharacterized protein OS=Trichobilharzia regenti OX=157069 PE=4 SV=1\nLCVHIFSCQTCGKEFIQPSNYSRHLRIHTKERPYSCKLCSAEFLYSTSLKRHQQRNHGVELLRCQLCQKTFLNESCLIRHRTGCELRACVKTADEGLCTQLL\n>tr|A7LFU4|A7LFU4_CAPHI Galectin OS=Capra hircus OX=9925 PE=2 SV=1\nMDSLPNPYQQSVSLTVCYMVKIKANLLSPFGKNPELQVDFGTGTGEGGDIPFRFLYCDGMVVMNTLKDGSWGKEQKLHTDAFVPGQPFELQFLVLENEYQVFVNNKPICQFAHRLPLQSVKMLVVRGDIVLTSVDTL\n>tr|A0A4R7X8B1|A0A4R7X8B1_9NOCA Uncharacterized protein OS=Rhodococcus sp. LP_11_YM OX=2485207 GN=EC908_103210 PE=4 SV=1\nMTLTTDITVGEVLPQLSIYGDPTFVVSAALATRDFQDVHHDRDLAQKRGSKDIFVNILTDTGLVQRFVTDWAGPRAVLTSIKLRLGVPWYAYDTLTLSGTVTSYDEDLVSLAVVGKNSLGDHITAQVTLAFPASGSNGDIENGDIE\n>tr|A0A838UPM3|A0A838UPM3_9CHLR AAA family ATPase OS=Ktedonobacterales bacterium OX=2306968 GN=H0X24_05985 PE=4 SV=1\nMPGRTPTAKPMPGQTSDPLPGVQHRGGMCSLGKSSRFAMIPGGLCAIRCRDHEGKRRIEKISHAFSVPPLSMAKREGASAQGRSLCARAFPIWVHCQNFTSEPSQTTLLITQSATLAKELLHSNLDEAAARLAATWLKDGARFPTMVREYREEFEQGAFDFLAFFFHEIILSEKYRPLFQAANGLELLKTQQHMAHDVTAIRGMLELLINHQVPSREEERLGHLMTYLARGNNATSEEQTTAPHHLWKLRTPRQFVGRDADVHWLTQRLSTPPPGDRISGVRGIGGIGKTALVGHVVTRLQQGGAFPAGIVVVNCSELHDVRDIWAEVAQSFGCQVDSPLGGEQLAHLMHETLRERDALVVLDDVQGEVRFTELVQPFAGTTPQIVVTSRLAFGAFPPEALWEVRELSSDHAVDLFRQCYGQPVDADEAALLPQLVAALYHHTLAVRLAGCYAAECQRDLGELLAELRADPLALPAEDQNRMVALILEKSLQNIERIHPLCRQIFTGLAAFGTPEFSREAAVALATYLDHQAPGFAIDRLIRYGLLEAASPHAGSVKVHQSRLHLHPLLYTLALQHFTQADGAQQQPLYSTICRY\n>tr|A0A1H9KCN1|A0A1H9KCN1_9BACT Uncharacterized protein OS=Lewinella agarilytica OX=478744 GN=SAMN05444359_12049 PE=4 SV=1\nMVAQTQQGRYELTPYAPHAYVFTTERGNTYIVRFIRYWQEEVVELYIKKELEVFEIYFEVMEIKDKGYDRRIQFTIIGAIVDFLAENDRVGFFDIKREDGRGLELLRVYRIWLKMYERNRKEKSIMLNRIVSIPDQFDSHIACLVHPNNKSFKGQNVDQLMDSVLKEIFPRATLTPF\n>tr|A0A7J9HNJ9|A0A7J9HNJ9_9ROSI RIX1 domain-containing protein OS=Gossypium 
harknessii OX=34285 GN=Gohar_003306 PE=3 SV=1\nMARFDQLENMYDLGLKPVMLRSLIRQYLPAENHPLNLNNSCFELPSLVSIVQTHCLLSELDSQSIDPKLINTWKSAVDDWLSCLLSLLSSDMSDKCWVGICLLGVTCQECSNQRFLSSYSIWLNKLLSHIQPPADSQLVKIASCTSLADLLTRLARFPEVKKDGNLLAGKLVQPVLKLLNEDNVEAVWEGAANLLYALIAFFPASIHHYYDKVQLMVAGTGRSFFGGWGVKVLEKEDIGVMAYFLGCLNVEAAIASKILSGKYSTKTLKKLGYFLALLPKAKGDKDSWSLMMQKFLISINDHLNEAFQGVEEEAKSDEARRLLVPPGKDLPLPLGGASFKGTSSERLPTATISTLMFCCCKMLTSSYPVQVTVPVRSILALVERLLRVDGSLPHTMLPFMTSVQQELICSELPVLHAYSLELLIAIIKGMRRQLLPHSAYIVRVVTRYFKRCSLPELRIKLYSIIRMLLVSMGVGIAIYLAPDVIENASNDLNSLGGEDIETSPANTDPATGALPQLSNRKRKHGAKTGSLEEKQDAASPKVGESNTHQMTPITVKMAALDTLEVLLTVGAASKSESWRSSIDSLLMKTAINSCKRGWGNLESNIFLPHESASVWADFQFSSLRALLTSFLAPARTRPPYLSQGLELFRRGKQEAGMKLAQFCAYALFALEVLIHPRALPLDDFYSACHNSTDGASNRFLENIYSGSQKQNTSFLSAMRRTEQGGVESHDDDLYDRWLQNENENQNENENIPVEDMKDQTSRPNDPSFTNVLEVREQEPAAANADVHMRTENEIVMQPWHLEESVPKSQGVASAKAVMSPPVGTNPEGSEIESKTPLSASDRLNDTNHDMFSCVDKVDGFDHVAGKTSSTLPNAEKGSSSMVHLDSDSSMDSFPGIVDADPDTDADSD\n>tr|A0A239QJE5|A0A239QJE5_9FIRM Redox-sensing transcriptional repressor Rex OS=Clostridiales bacterium OX=1898207 GN=rex PE=3 SV=1\nMRSSTLSKATMGRLPLYLQFIRTVQTENVSSATVARALGLGEVQVRKDLASICPAGMPKIGYPTERLREDLEAVLGMKQTIPAVVVGAGKLGRALMAYDGFREYGLEIAAAFDTRVTDSSHERKPILPMEEMTGWCREHEVHIGILTVPAGAAQEAADQMVNSGITAILSFVSVPIRVPDTVTVKHENIALSLACLKIVAGMSNETTEEDSHGSEDL\n>tr|A0A1R4IEU8|A0A1R4IEU8_9ACTN Potassium channel protein OS=Luteococcus japonicus LSP_Lj1 OX=1255658 GN=FM114_01400 PE=4 SV=1\nMVPGNGTNDDTLLTAGITRAAGFVTAIDDDADNVHATISARALNPELFIVSRASTKAVMHKLEPAGADRAISPYVMAGRRAVQLATRPGAVTCPSAWRRSESMRSWMASPWPTCVVAGWQPWPSATTTATTRPTRPSTVCCAWGRR\n>tr|A0A1D7XM32|A0A1D7XM32_9CLOT MBL fold metallo-hydrolase OS=Clostridium taeniosporum OX=394958 GN=BGI42_10650 PE=4 
SV=1\nMDLRITTLIENNPDKDNLLLSEHGLSLYLEIDKIKVLFDTGKSGDFIKNAEKLKINLNDLDYVILSHGHYDHSGGFKSLVENTNKSFDLIVGNGFFNKKYKLLEEDKYKFNGNSFDEKFIDKNNISIRYVNNDLFKITKDIIFFSNFEKNTDFEMINKKFYIKKDNQYVKDDFLDEIVLAVKHEKGLIVVLGCSHIGVVNILKTIIKRTNMPIYAVIGGSHLIEADELRLNNTIEFFKENNIKLLALSHCTGENAIKKFQYEFGNNFIYNNTGNVIEII\n>tr|A0A0P1BF93|A0A0P1BF93_9BASI Zn(2)-C6 fungal-type domain-containing protein OS=Ceraceosorus bombacis OX=401625 PE=4 SV=1\nMSHVTSSPIWHEGAFSAEQYRQSAPAVPLQMVPPNAQLRGRMPPSLGHARHFTTPIAAPAQGPTIAHDEARPSDSNGLTPSCSRCRQKKLRCDFQTPCSNCIGKGLQSECHKDVRIPRGRKRPKAESQLTDEEEIVKLRKRLAELEERAGGGRLTPSTSSANSLGGRVSTRSDKPLRHRHHATGPADDRSGGNSSPGSRSHLSSSFVTATRDIIGSQEGLSIHLPLSGSASSDSFRSVPHGSTVPSPHSASVNESVLMKPQTRTRSSKPLILSPLLPAERALRSLETVANPSAARTICGTSERDGLLKRLTGLSDDVPNAYWSDPANAEERIALFVEARAAIPDPIVVEELARTFLYRANHCGGHVVYTPWHKAATELLSIASPEQAVSAPMFQDVSNLGLWFLILSVGYHFHPNNGPTSHTRGFAAVHALRKSGIDPSVRWYGIAKRALAIEKDYVLKSLPALQCASLFLLLGRDDPAWLRMLRAMTIAGARDMGLPRLGSASYAREMTTNDFVRLETAVRVWNFLCVRDWCWSQRDGSYSLHPSQMTTRLPLNLNDADLEAGTTESKSSSNWTEMSFVIAQVGLAHCVREAADLRNANLDDTSRAVVECIDESFRRFLSAGLPHFYSVNSREATPPIMAPQRWMLHQQVFHQLLLVHRNHIASPVGRSTCLSLALGTLELFKQLRMMCPVIEGMYVNSHHLFAAGTLLLLDLFNDNVDDEHRANVRDKVSAAVQYMSPAPRAKQLLSTLLDEEAQYYEATRDRKAYVQRDRTLDLATLCDRVAEVIEQTPGLPRDDVNAIDDVRMPDHHLMPALIGLQSPTSDFNQTKPNLEHHLSQDKVGPNSAFEDPRFFGFDHRQGNTSASPSSRPNTGLMPRRGTVLSPALPSPAELARRAPRILAEGAITLPSIGVDHNLSSNQHNSFNIHPSFRSAVALYHQSRKAHLKNV\n>tr|A0A5D8QFW2|A0A5D8QFW2_9THEO Stage 0 sporulation protein A homolog OS=Calorimonas adulescens OX=2606906 GN=spo0A PE=4 SV=1\nMDKKYRIAIVDDNKEFCTILKSYLEKEEDLEIVGTANDGNQGLKIIQEMQPDLVILDIIMPYLDGIGVLEKISSLDLIKFPRLIILSAIGQDTITQKAISMGIDYYIVKPFNMDTLLQRVREVLNIKESRTLKLYETSSSKYKWREEPNLEILVTNVIHEVGIPAHIKGYIYLRDAIIMVIENMDLLGAVTKELYPAIAKKYNTTPSRVERAIRHAIEVAWGRGKIETIDNIFGYTIQKNKGKPTNSEFIAMIADKLRLELKVS\n>tr|A0A2W5ZP71|A0A2W5ZP71_9BACT ATP-grasp domain-containing protein OS=Candidatus Dormibacteraeota bacterium OX=2052315 GN=DLM67_22145 PE=4 
SV=1\nMTEPAILFVNLRGVPSEDRSALIAARRLGYQVDLIGPSLPAHAAGLVREFRLADTDDPEQGLRAARALAERASPAGVVTWGDRGVELVALIGQELGLRALSPAAGRRARHKVAMKQAVAHLPGIVGSHVGVVERSDLAPALRQVGFPAVLKPAAAAGSAGIFEVRDRDQAEAAFDRLAGWLQGAPRPFRGDGQGELILEELIEGPEFSLEGWVHEGGVTIAGVTDKWTTDGFHLEYQHVHPSGRLDSEQSVLRKGAELVVRTLGLDHCAFHLECKLTPRGFRLIEVAGRTGGDYIGSHLVPLSTGLDFHGNCIRVACGFPPRMEPVDSLCAGVRFLLARNEGIFLGLDGLAEVLQMGDVEQVFIEVPVGSALRLPPDDYDLQRVAAVVARGPEHSAVIETLDRAARCCAPRVERWDGHR\n>tr|Q1Q6C1|Q1Q6C1_KUEST Uncharacterized protein OS=Kuenenia stuttgartiensis OX=174633 GN=kuste2370 PE=4 SV=1\nMDLNEKIKEDLKSSMKAQDKMRTSVLRMMLADIKIAETSGKPRDQIDYAAVVQGYQKKLKKTREEYERLSLPEKTREIDNELAIVEEYLPKQLSDEDVQKIVDEVVDENKFTGKEFGVAMKLIMNKCGGTADGKKVLTILKQKLGC\n>tr|A0A3A9BJV2|A0A3A9BJV2_9BACT DNA primase OS=bacterium D16-54 OX=2320104 GN=D7X87_23470 PE=4 SV=1\nMNVFEAVRENGITARQAAEHCGIKINRNGMAVCPFHKDKNPSMKIDRRYYCFGCGEKGDAIDFVAKFYGLGKKDAAVQIAAAFGISFDDNGGRKPPPIRKRKLSPEQRFERVEKKCFRVLSNYLCRLREWQEQYAPHKAEEEWHPLFCEALEKKDYIEYLLDVLLYAPLSERVELVTDYGEEVLKIERRLEQCTEGTAGGTGKNYEQDGAGGTAGNMV\n>tr|M3NA57|M3NA57_HELPX Uncharacterized protein OS=Helicobacter pylori GAM244Ai OX=1159035 GN=HMPREF1407_01122 PE=4 SV=1\nMKIIKNGIMIGTLGALLLSGCSSFDAQRFACLPKDHSSKDASTKKEAQYIPKGFFDPYSSNLNHWDSTF\n>tr|A0A0B8PB49|A0A0B8PB49_9VIBR Putative ammonia monooxygenase OS=Vibrio ishigakensis OX=1481914 GN=JCM19232_3271 PE=4 SV=1\nMKPALNSVSTLAIAFATSALFVLLSVPLGEMFGSIIAIILLSKWGIKTKVPTHTLIFVQLALGLSVGGLIPPSFFATGFPLTMLIGLVVCMSLQVLCGYWLLQRFSWSKSDSLLASIPGAMAAVMVLNESQKTPSARSSSYIPFD\n>tr|A0A1A8U716|A0A1A8U716_NOTFU ATPase, Ca++ transporting, plasma membrane 1b (Fragment) OS=Nothobranchius furzeri OX=105023 GN=ATP2B1B PE=4 SV=1\nVYFAGQLYKKVPEPDLIPAKILDLLTLGIGVNCAYTTKIMPPERDGGLSRQVGNKTECALLGFSLDLHRDYQAIRNEIPEEKLFKVYTFNSVRKSMSTVLKNSDGSYRMFSKGASEILLKKC\n>tr|C3DIS9|C3DIS9_BACTS Oxidoreductase, aldo/keto reductase OS=Bacillus thuringiensis serovar sotto str. 
T04001 OX=527026 GN=bthur0004_18590 PE=4 SV=1\nMKYTKLQKAGLNISKLGLGTNAVGGHNLYADVNEEEGKQLVEEAIQQGITFFDTADSYGVGRSEEMVGEVLKGKRHKLILATKGGIQPLLNGETYINNEPSYLRNAVENSLRRLQTDYIDLYYLHFTNSETSYIDSIGELTRLKEEGKIRSIGISNVNIEQLKEANQHGHIDVVQSPYNMLERTAEEELLPYCIEAGISFIPYGPLAFGILGGKYTEDFKLNEVDWRQNVNLFEENTYKSNFKKVEKLKGLAKENDIEVSHLALAWLLNKEGIDTVIPGGKRAEQIRESVKAVDVALNKRVMKEIQSILED\n>tr|A0A659QZ73|A0A659QZ73_SALET MFS transporter (Fragment) OS=Salmonella enterica subsp. enterica serovar Wilhelmsburg OX=1960126 GN=C9F09_13540 PE=4 SV=1\nSDWPLNRGNSLSVARILPVICGMLLSCVIVIANYTSSEFVVIAAMSLAFFAKGFGNLGWCVLSDTSPKEVLGIAGGVFNMCGNMASIVTPLVIGVILANTQSFDFAILYVGSMGLIGLISYLFIVGPLDRITLTSSAA\n>tr|G8G1N4|G8G1N4_9HELO NADH-ubiquinone oxidoreductase chain 4 (Fragment) OS=Phialocephala helvetica OX=242229 GN=nad4 PE=4 SV=1\nMLLTLLLLTPILGIFAISTGISYELS\n>tr|A0A4Q2K9X0|A0A4Q2K9X0_9FIRM Uncharacterized protein OS=Candidatus Borkfalkia ceftriaxoniphila OX=2508949 GN=ESZ91_10490 PE=4 SV=1\nMIDFEALKRFIEAKRTPPRKVLRAAFKIDAECEPRALCGAAETDENALRERIGKRGKTFSEMLFYWIDARGEKDSDVYKRAGVDRKLFSKIRSDANYTPKKRTAILFAFALSLNEDQARDLLARAGYSLSDADTTDIIVQYFLQTDNHDLSELDEALVRFGEQPVYSE\n>tr|A0A841U1R9|A0A841U1R9_9BACL Aldehyde dehydrogenase family protein OS=Cohnella xylanilytica OX=557555 GN=H7B90_11630 PE=4 SV=1\nMNGTATIDNYIGGWRPPASGRRVPSLNPARRSETVGLVPDSDRTDLDAAVAAAEAARRSWRKLAGSQRGALLFKAADLLESRMDEIGRAMTREMGKTIGEAKGETARGAAILRYYAGEGMRPIGDVIPSTDAEALMYTTRVPLGVVGVISPWNFPVAIPLWKIAPALIYGNTVVWKPAIETAVTAALVMECFHDAGFPAGTVNMVVGDGAAIGQGIAEHPGIHGVTFTGSNAVGKRVGQIALARGAKYQLEMGGKNPIVVAADADLDLAVDATISGGLRSTGQKCTATSRVIVVREVYETFKEKLLAKIKTLTVGDGLDAETWLGPCASEKQYETVIGYIRKGREEGAELLVGGERPSHPSLADGFFVTPAVFDRVTTGMTIAREEIFGPVLALMEAGDLKEAIELANDTEFGLSASLYTRDLANALAFAQEMEAGLIRINAETAGVELQAPFGGMKGSSSHSREQGQAAIEFYTAVKTVFVKP\n>tr|S3MU72|S3MU72_9GAMM Pyridoxal phosphate homeostasis protein OS=Acinetobacter rudis CIP 110305 OX=421052 GN=F945_02860 PE=3 
SV=1\nMNELHRARREVLEHIQKACEQANRSADEVQLLAVSKTHPSQAIEQLYQSGQRAFGENYLQEALDKIEALKALEIEWHFIGHVQRNKTKHLAEKFAWVHGVDRLIIAQRLSQQRPAGLAALNICLQVNIDQQDSKDGCAVADVVDLVREISALPNLRLRGIMVIPAPHNHQAFNAAAELFQQVKTEHVHAQDWDTLSMGMSADLQAAITAGSTMVRIGTALFGQRSYDLS\n>tr|A0A7I7TGD8|A0A7I7TGD8_9MYCO Uncharacterized protein OS=Mycolicibacterium helvum OX=1534349 GN=MHEL_56620 PE=4 SV=1\nMAHSIELLIDQRADTAVRQMWHALADGGLPSRHRVPSGTRRPHITLVAAERIAPGIDRVLGGLAEELPLPVVLGAPLVFGTDRLTLARLVVGSAALLALHDEVYGLCRPFAFNVFAHSAPGRWTPHITLGRRFTPAQVGEALAAVDGIAADIRASIVGLRRWDGDAKREYLMVN\n>tr|A0A4V2FIN5|A0A4V2FIN5_9HYPH Ribulose-bisphosphate carboxylase large chain OS=Rhizobium sp. BK696 OX=2512157 GN=EV569_4023 PE=4 SV=1\nMAQRFTVTYFIRGADAAEAKARALDIALEQTVEIPRAAVPKGYVEDVILGRLEGLEQVRDGRSGFLATISYSEDDVGGDFLQFLNIVFGNSSIKPGLKVEDIGLSSGILDLCRGPRHGIAGLRARAGIGQTPLLMSAIKPVGLSTKELASLAHDFAIGGVHFVKDDHGLVDQRTSPFSERLRACVAAVGEANAKTGGRTSFVPNITGPATAIVERAKEAQEAGAGGVMIAPALAGYDIIRTLAADQDFTLPVVSHPAFSGANVVSPDCGFTHRTFFGTLHRLMGADAVIYPNFGGRFGFSREECLSISAACAAEMGGLNTIAPAPGGGMTLDRVAEMRAAYGNDIMYLVGGALLVDPGGVIAACQRLVSKIYD\n>tr|B4DA31|B4DA31_9BACT Uncharacterized protein OS=Chthoniobacter flavus Ellin428 OX=497964 GN=CfE428DRAFT_5771 PE=4 SV=1\nMADDSSRYERKDFSPKAVGLSGLGLIVVCVISAVLIRHFEKDLNQFFAYQGRATWTSSPTMQPPEPRLQTNSAREFAEMRAQEEAELHSYGWVDRQYGVIHIPIDAAIKIALERGLPVRKSTPTAAATPVPAPATPTPAPKSAQ\n>tr|B1ZML6|B1ZML6_OPITP Stress responsive alpha-beta barrel domain protein OS=Opitutus terrae (strain DSM 11246 / JCM 15787 / PB90-1) OX=452637 GN=Oter_1073 PE=4 SV=1\nMSLTSRRQFLATSALATAAAVSPSHAAGTSAMPKLVHHVFFWLKNPSSKEDLATLLAGIRSLGAIETIRSIHVGVPASTEKRDVVEASYSASELLLFDDVEGQNAYQAHPVHQKFVQDCSGLWSKVVVYDSVSVDVPAGSKP\n>tr|A0A4Q1QFK1|A0A4Q1QFK1_9GAMM ATP-dependent zinc protease OS=Idiomarina sp. 
29L OX=2508877 GN=EST55_04790 PE=4 SV=1\nMTTIGWREWGHLPELGISNIHMKVDTGAKTSCLHAFQLEPFMKKGEEWLRIFVHPKQDSQEEHVCEAKVHDKRDVTDSGGHTETRYVIKTRLVLGSFDQKVELTLTNRDTMKFRMLLGRQAMRGHFLVNPDASHLLGDVK\n>tr|T2C928|T2C928_9BETA U7 OS=Human betaherpesvirus 7 OX=10372 GN=U7 PE=4 SV=1\nMKNFETMAEQYKTLPCVGQLNDGLLRELKNLCRFTDFPGIRLLTERHRNECLSLIWPKNLWLRLAQPVDVAGYSEQQLAELNDHYQGFKENLCLIGAIQIGRKDVPIFVGKSSRIFCHDLEDDVLYYIAEDFDKFVRFGILGTNVITCSEPVYTRFYYDGPKFEKLETLKDLGLLQEPLNLNSSLRFNRKTALALKALRRNYISMLSELDELARCKTLAEIEHFVSINTGLKLRLETPIFTALILQDRKNIHCSTSDQKRFEEQEALFEKVVVLGFLNISAEDYGLRPILCIGETGAIYYYDWIDKVLTRIADCLLTFARIGFARYCGDFGYDKIGKVTARFGRLSTLGSAPVQQYSWYLKIVPVCNDVCIEPTPDLPSFDFAVELLLSSYGEGMEIVRNGIKCCLAWPPNYVLIFGEFYHFKCRRSVITYDWSNLVGADEFLCAVGYAHPNYREPDPDFDPFVMYCSSNKMLALDTVTDELYIIAESPAHFCSIGLRNFPPFARIELDIELDRLWYGETKCSGEEFVLLQKNIPALKNFVNRQCGQKIRIDAFQNFDLSFCSSNDIHYITGSGILEKILRRKYVVIGTCARCQVEPNCRAVILLGPNFHIYVYCDNKINKVARSIREFIRRGFEELLYKERYALNWHDDSLIYVSESEAENLNRMLNGESPILRKKPRHMYPRCDRLLKNMPSILFAVHSSEISNPLVQSVTKFLHPIIIPNGDTELKYIVPVTESRLINGLQASAAGRFGIKGLRLCSDGVIWNRLIDYEYEMFKYPSTFTRADKFLLQLRDLKFMEDFDPKWQCITKLAAVGFYSGASLFNLGAKPGIGYWCRYLCEYLSMLFFKLDGKLKELSKESKQKLGGFSCAFWSESFKTEMQNKTESFFRRDFFDRFQLYLLEHFLLFCGCEECRYNFFRFKNVGTMKKNPGSVKLHFFPALGKIDLPIFPHLSEKYSNLSMFVAKDLCLSFIEGQIEHSRFPISVTVDMGQDKRNLLNILSNIVFLLFIIQTLNSVLFTELKMYYDVYLDELKNLESSMECEMKLGSKGCMNNIVYFNMLKQVKDIVRNPGTSSNFIFNCLEVIKMSFEIPYYKNYDETNFMESFYLHHLYIQRQPAKHTDLVAANNLAPGFFIVNAKEKSFIDVLERSIVNIEAEYLSNTKNINGAMALFFSGLKYFGNFGNGNFQTSPEKDVRAVGYKLGGLDKIQNDLCYFANVETLACVGVDASDGNE\n>tr|A0A5C4V3X6|A0A5C4V3X6_9ACTN Pyruvate dehydrogenase (Acetyl-transferring) E1 component subunit alpha OS=Streptomyces sedi OX=555059 GN=pdhA PE=4 
SV=1\nMGRTQARTAAGKSTAGKTTAGKSTSGKAKPTARKSAAGNATANGAANGKPPAKKATTRKPAASGTAAKPAARKPAAKKPAAGKSPARGTAARTKPADGPEMVQLLTPEGERVEHPDYPLTVSHEELRGLYRDMVLSRRFDAEATALQRQGELGLWPSMLGQEAAQIGSGRALRADDYVFPTYREHGVAWCRGVDPTQLLGMFRGVNHGGWDPNSNNFHLYTIVIGSQTLHAAGYAMGVAKDGGDAAVMAYFGDGASSQGDVAEAFTFAAVYQAPVVFFCQNNQWAISEPTERQTRVPLYQRAQGYGFPGLRVDGNDVLAVLATTRAAAEQTRSGQGPVLIEAFTYRMGAHTTSDDPTRYRRQEELESWEARDPILRLRRHLDREGAADEAFHSELEAESETLARRVREAIRTMPDPDPIAMFDHIYADGHTLVDEERAEFAGYLASFADHEGN\n>tr|A0A5B2V3L5|A0A5B2V3L5_9PSED Chaperone SurA OS=Pseudomonas brenneri OX=129817 GN=surA PE=3 SV=1\nMNVKIKLSDCLRPLMLGALFLGTAAAHAAVQPLDKVVAIVDNDVIMQSQLDQRVKEVQQTIAKRGGGVPPTSVLDQQVLERLIVENLQLQIGDRSGIRITDEELNQAVGTIAQRNNMSIDQFRAALARDGLSYEDARDQIRREMIISRVRQRRVAERVQVSEQEVKNFLASDLGKMQLSEELRLANILIPTPDSANAEQLNAAAAKTQAIYDRLKAGADFAQMAIAQSGSDNALEGGDMGWRKAAQLPPPFDRELSAMEVGGITQPARTPGGFIILKLLERRGGEASLKDEVHVRHILVKPSEIRTEAQTKELAQKIYERIEGGEDFATLAKSFSEDPGSALNGGDLNWIDPRALVPEFQQVMNDTPQGVLSKPFKTQYGWHVLEVLGRRATDNTTQAREQQALTVLRNRKYDEELQTWLRQIRDEAYVENKLPGAEPTGTDQAAQ\n>tr|A0A1D1ZL49|A0A1D1ZL49_9ARAE 60S ribosomal protein L35a-4 (Fragment) OS=Anthurium amnicola OX=1678845 GN=RPL35AD PE=3 SV=1\nFLFSYTHPHISYKMGKAVRLYAKGRVLGYKRSKVNQSPNTTLVKIEGVTAKEETQFYLGKHIAYVYRAKREKAGSKIRIIWGRIARPHGNGGVVKARFRKNLPPKTFGASVRIMMYPSRI\n>tr|X0K267|X0K267_FUSC4 Uncharacterized protein OS=Fusarium odoratissimum NRRL 54006 OX=1089451 GN=FOIG_02629 PE=4 
SV=1\nMTALAQVALLRLGASRAMISLFDCQHQHIIAEATPALRISAHANPPSSGSDSLWLCGTAIPRSYGICDRVLVYPEFGGPQQASLASELPVTVISNLAENEEYRNTWYYKARPEHRFYAGVPIRTRRGINIGVFCILDNEPRETLDEASLQVMRDVSASILGQMELTRSGDGRRPGERMVRGLGSYVEGKTTISGWQNSSTHAFNTDASTEEGSLNQTQQKIQNQRDNAAAAADTESISTPDTFVLESPSQNRPTSPFHPTDKTPHSVPTGEESRSQQLNQIFSKAANILRESIEVEGVLFLDAGIGSFAGRIRSGSLRRNSRTHDRSSSSSSSSSSPGKGNISVSSPRNSADSRSSGAMCPILGFSTSVSSSINGEAPAGRSRTIPERQLQMLLRRYPKGKIFNFDGYGVMASSDPASEDSAMAVFQAQKARSIQEGQRGDNQKSRKVNDPYSRKNEGMAIRDVFPGARSVAFVPLWDSHRERWFSGCFVYTMTPTRIFTVQGELSYLAAFSAVIMADVAMMESSIVSLATTSLLSSLSHELRSPLHGIVLCAELLRDTALDVFQGDVLRSLEVCGRTLLDTINHLLDWTRINNFVKAPSGQSPNSGIAFVRGAQSNQRSGPTDGMMHITSNLDLDMLVEEVVECIYAGHTYQQQSLSLVHDDKPNEELNRDPFTRLDGMDVADSIKAGEKISNGAGPDAVLVMLDIDPAVNWAFHVESGALRRIIMNLCGNALKYTTRGYVKVSAYQDTPGQSRLRDRVVHIDITDTGAGIGQDYLNHRLFAPFAQENIHSSGAGLGLSLVRKFVRALGGSIHVQSKVGTGTRIAVKLPLEAVSVDSTETISDREEFQSQAIELSGLRVCINGFTPFGGGGSESQRWNSREFDERALLQKVCHDWLRMHVVDSLHNAEYLPDLILCDESHLETIANQPRDELSSPVVVVCRSAAVARSLDRSHRSQRKLNWGLFSFISRPVGPRKLAKAFVLCFRRWTKLQATAADRASVSTRLDEPPTVSTAETDLVQHGSDDKNRGYFDIAPTLSPKKRRAHWNDDGTRTPLPSMPALQLPTIPRDQRFLLVEDNAINMKILQTYMKKMGVEYDSASDGLQALECYKAQEGCYKCILMDISMPVMDGFEATRQIRGFEKASDLPRRHIVAISGLASKDAQEDAFANGLDLFLSKPVQLKELSRILKSRGLI\n>tr|A0A813QIU7|A0A813QIU7_9BILA Hypothetical protein OS=Adineta steineri OX=433720 GN=IZO911_LOCUS5098 PE=4 SV=1\nMCGIKRCCRNCCPNGCCGFCKPPKQVQQQVDTLIHLKEAVTASETRYGFIKFYPGVRTVDNNYTCPMFAIHLYRQGKLNANMAQDNRTVTYAGRNHQQTHQGEKQFISTQNASAEEEVIMVPLEDVIHISYKADVKIGMQADIKSHVTPVHERSENCCDRCCAPIVNCCRKTRDCCCCHSRQEENKVAPFVQNTTTIINANSNRNEDYVEQDLPLPKVKESCWSKCCNPCRCWCCRKKRLVRLIKRTNTKAARQAERVITMTIQYSKYSNLDTASHTRLLSNQHQLEYFKAKFQPDAELEFYLINDTEFEPMNFDVKKNEAEVLCRTVMQLKGMKNRYPSADELDKILDQPQQRIFGTIFHEPILQLPSNAEIQRVT\n>tr|I2FGU6|I2FGU6_9ANNE Cytochrome c oxidase subunit 1 (Fragment) OS=Megascolecidae sp. 
Esik120 OX=942496 GN=COI PE=3 SV=1\nTLYFILGIWAGMIGAGMSLLIRIELSQPGSFLGSDQLYNTIVTAHAFLMIFFLVMPVFIGGFGNWLLPLMLGTPDMAFPRLNNMSFWLLPPSLILLVSSAAVEKGAGTGWTVYPPLASNIAHAGPSVDLAIFSLHLAGASSILGAINFITTVINMRWSGLRLERIPLFVWAVVITVVLLLLSLPVLAGAITMLLTDRNLNTSFFDPAGGGDPILYQHLF\n>tr|A0A2I7QPQ3|A0A2I7QPQ3_9CAUD Coil containing protein OS=Vibrio phage 1.034.O._10N.261.46.B7 OX=1881189 GN=NVP1034O_23 PE=4 SV=1\nMATVAAIAGVIGAVTGVVGAVQQRKAAKKATAEQKRQNALNNRVQEVNQRRDIRRSIAASRAQQAQLEQGGIDFGVQGSSIVAGAQGAAQTDLATSIGSGFANQGASAGFAASRNRQADAMLDVQNNIYTDVSNFAGNFTHAGVNEVYKSELTGLFS\n>tr|A0A537DGT1|A0A537DGT1_9PROT Thiamine pyrophosphate-binding protein OS=Betaproteobacteria bacterium OX=1891241 GN=E6H40_11730 PE=3 SV=1\nMENERPLASPKQNEIWGSDAIAALLRELDIPYIALNPGASFRGLHDSLVNYLGNERPQLLLCLHEESAVAIAHGYAKASGRMMGVALHSNVGLMHATMAIFNAWCDRVPMLILGATGPWDAARRRPWIDWIHTSADQGALVRDYTKWDNQPASVPAAWEALLRAAQIANTAPRGPTYVNLDAALQETKIGPLPPLPDVSRYRAPEAVLPKAELIDAAAQLLSAAERPVILAGRFARTGAGWKSRVALAEKLQASVLTDLKAGASFPTDHPLHVAPPATFLHENAREALREADVVLSLDWIDTAGALKQAWGDAPIGAKVILVSPDAHAHRGWSMDYQGLPPADVYLMCEPDAVVPLLLEAVEPRAAAAAEQRAEETTTDKTLSLRALADGFNTATAGLNVCLARLPLGWNGAYRHFKHPFDYLGGDGGGGVGAGPGMIVGAALALNDSGRMVAGILGDGDFLMGVTALWTAAHYRIPCLLIVANNRSFYNDELHQERVAHERGRPVENKWIGQRIDEPDIDLASMAGAQGAFGIGPVTDLAELQPSLARAIELVREGNVCVVDVRVVPGYDSSVSGSPARR\n>tr|A0A7L4GLY1|A0A7L4GLY1_PODST SESN3 protein (Fragment) OS=Podargus strigoides OX=8905 GN=Sesn3_1 PE=3 SV=1\nGRLEAVTQQMGYHPQYLDSFLKTQHYLMHMDGPLPFDCRHYIAIMAAARHQCRYLVNLHVLQFLRAGGDPQWLRGLDFIPPKLRNLNEINKILAHRPWLITKEHIEKLLKISEWSWSLAELVHAVVLLAHCHALASFVFGCGCEQDEGLGGRGLLKPLSPGNQCFCEATAGNGCSQELLRISRKRSLDSCMELDSLRERMQRIHVETEGREEMRLLQQDREEGEGQGAEVGHHSDPPAGLSPLADTDGEVTGATNLACYMQDPDFGYQDFARRDEDQTQVFRVQDYSWEDHGFSLVNRLYSDIGHLLDEKFRMVDGLQSSAMAKRQGCEPSVFKRGIWNYIHCMFGIRYDDYDYAEVNQLLERMLKVYIKTVTCYPEKTNPEMFDRFWKQFKHSEKVHVNLLILEARMQAELLYALQAITQYMI\n>tr|A0A6A3AK87|A0A6A3AK87_HIBSY C3H1-type domain-containing protein OS=Hibiscus syriacus OX=106335 GN=F3Y22_tig00110462pilonHSYRG00339 PE=4 
SV=1\nMYTSRHVVFDELQFPFAKLHEKVSNEYNTHASSSSLQIVAVVHKFQHVLAEGYDNNSMTNNSPATVSSNYFSSNVAATSNSQNEAQEDVVDSSSATQNDATQDDDAHEETVVPQSVNECTPSEGVNSDMPTNTHHMMTRSKCGVFKPKVRKETVQAEFDALLTNNTWTLVKLPEDRTAVGCYDFKDTYNPIIKFSILNIVLSIAVTRKWCIRHVDVNNAFLNGKLAEDVFMQQSPGFEKYAVDESVLVCKLNKALYGLRQAPRNWHDKLKTSLIRLGFTESKADVSLFVRIDADCRIYILVYVDDIIITGDSSPSIDSIVHALSRDFSLKDLRSLAYFLGIKVKRTEEAMLLSQRKYIIELLEKICLLNATPTVTPMIGASKMTQEVGALLSDAREYRSIVGALLYVCHTRPDIAFSVNKATQFMHAPRELHLAAVKRILKYLASTLNYSLTFSSNDVSQDVVAFTDADWGGSLDDRRSVSGHAVFLGHCLVIWCSKKQKIISRSTMEAEYRIIADAAVEVMWMSSLLCELGVKHRNMPVEWCDNTSTVALSTNPVYHSRSKLVDMDVHFVREKVAANQLQVNYVHASHQVADVNPTESGSSGQLLLDASNFPERPDQPECRYYMNTVTCKYGSDCKYHHPKEMIANSTINGIGPLWLPSRPPSSVFDSSALTYQRMSPTAHLSETPLPSKLTDWTGNTESVSKKHQNTEMKNSDDPAEQAALTHSLQISSKNSQDD\n>tr|B6WSE8|B6WSE8_9DELT Tyrosine recombinase XerC OS=Desulfovibrio piger ATCC 29098 OX=411464 GN=xerC PE=3 SV=1\nMGRHIEKDTMEEELDPRTTLEIESFLAWLDVQRGLSPTTQIAYGTDLRQLALFLAQRGASLARPAEVSKKHIQAWLARLYALGEAKSTMARKLAAARTFFRYQQRMGRTENNVAAQVRNPKQEQRHPRVLNVDQAFAVLDTPDALAGTGSPRIPPATGDALAARDHALAELLYGSGLRISEALGLDVTDLRLDESVVRVFGKGARERMSPLSDTSVTALRAWLEQRGTLAPEGEKALFVGARGGRLDRREAMRRIERLCRNAGVEPVSPHALRHSFATHLLDAGADLRSVQELLGHQRLTTTQRYTRVSLERLMHLYDEAHPRAQKK\n>tr|A0A6A7M004|A0A6A7M004_9PROT Uncharacterized protein OS=Rhodospirillales bacterium OX=2026786 GN=GEV13_06010 PE=4 SV=1\nMWVNAREVPRFYPNAVTLAHDDASIAEQLSNIEVLQKSNLPGRWAVKDSFQALDLSRRGFDVLQEASWIRSVMPTGSSATDIEWQRETQGKAPWPYDDPNFAMFTGRRGFSVVAGGMLYRAAGVAGLSNVVAEAADAVTVWRSLILLASRTFPRLPVVGYESGGELAAALDAGFEIGDPLKIWVRARD\n>tr|A0A2T0N3A0|A0A2T0N3A0_9ACTN Uncharacterized protein OS=Nonomuraea fuscirosea OX=1291556 GN=B0I32_10527 PE=4 SV=1\nMTEKIPVDLWFDPSCPFAWVTSRWLLEVEKVRPIQPRWRQMSLYFLNEEKDVPADYLERAAKAMGSVRVIAAAAAKHGEHVIGQLYTGLGTRLHNQGLSKEPERLREVIEGALDDAGLERSLAEAMHSEEYDATIRASHDEGIGLVGQEVGTPVIRVGDNAFFGPVITRILRGDDAGKLWDGVLAVTQFDDFFELKRTRTRRPQFD\n>tr|A0A3A6JJ78|A0A3A6JJ78_9FIRM Uncharacterized protein OS=Coprococcus sp. 
AF38-1 OX=2302943 GN=DW025_00330 PE=4 SV=1\nMAIRKDGPQKAVMREMMRDYLKNNDISIKDGTDVNSIMCDMMFVILEGALDEKLGYSKMTVELFTSFRV\n>tr|A0A4R1JNC6|A0A4R1JNC6_9GAMM Ribosomal protein S18 acetylase RimI-like enzyme OS=Celerinatantimonas diazotrophica OX=412034 GN=EV690_2119 PE=4 SV=1\nMIQYRPMQINDYDSVMALWLQTEEMLLREADSQTNIAHYLARNHNLSFVAENENHEIIGAILVGTDGRRGYIQHLSVALECRSQGIGRDLIAKAVKALKEIGIAKTHLFVNIANENAKKFYQRLGWQVREEVRMYSFNSSEDTQI\n>tr|A0A7S6MMK8|A0A7S6MMK8_9GAMM Flagellar assembly protein FliH OS=Gammaproteobacteria bacterium OX=1913989 GN=HRU78_01625 PE=4 SV=1\nMIASNFVPKEKLTAYQRWEMDSFEAPELSQEAQEAGKESNDQSDSQPQVSLPTEEEIAAVLRSAKEQGYAAGLQEGHTAGHAAGYAEGRALAESEVKAEVARMQTLLTKLDQDLQQMDQQVAASLLELAIALTKKMVTEALKLQPELIVPIVQEAIRNLPNATQHPRLFLHPEDAKLVLAHLHEQLEQDHWSIREDEQLIRGGCRIEAGGSEINGSLEVRWQRVLSTLGQTDEWLNKAD\n>tr|A0A852D8G1|A0A852D8G1_PASAF PDIP3 protein (Fragment) OS=Passerina amoena OX=142471 GN=Poldip3 PE=4 SV=1\nQLAFSPLEGTKMTVNNLHPRVTEEDIVELFCVCGALKRARLVHPGVAEVVFVKKEDAITAYKKYNNRCLDGQPMKCNLHMNGNVITSDQPILLRLSDTPSVKKEGEPRRSSASASSNPPAEVDPETILKALFKSSGVSASVQPTEFKIKL\n>tr|A0A2T7IVZ0|A0A2T7IVZ0_THEOR Uncharacterized protein OS=Theileria orientalis OX=68886 GN=MACK_00001413 PE=3 SV=1\nMDGKNPYEFESLVSLMRMNFASIVEKVKGMKVLILDSETSKIISLVYTHSYLLENEVLLTLNIDDGTIFNPDPNVTVDSNLKYLKGIYIVSPNXESLNXISSELKNPHFKEYYVYFTNKVKEDLLELMAKSDTLEIVKGVYEYFVDFYVLDECLFTLNIANLQSLYKDDVNMMLDFSVSKMVNSLFSVCCMLNQIPTVVYRRNNPILQTIANKLQADFNNNNLNLQSIIQSYNNYNSKNPTADHSGCVLLILDRREDCITPLMNQWTYRAMIHEMLKINNNKVMXEDTEYILGNNDDFYGKHLFDEFADVESDLNVLINENKPANSDIYKILESLPEQSKTLNDTTRHVKVLHELSKHIQKNKLLDSGILEQDIATNRRNVINELAEFLNDKTAPTYEKLRVALIFCLKNPGDTNKVNRVKDYLKMNRLDQHVGLVDLCLKLAKFRPVSKTNQDFTLSSLKDKFNKVSLESQSPYLQYKSQLHSTCYNLIKGKLDVELYATMPSAYDLGYTLKHKPASVSIKFFYSSRRTVGDVTYDRPHQITDEMPKVSELDVYKEVLSGEKRKSIRRSDFLKFTGGKRPLISSHLHANLIASGLVVWAVVAFFLTFKVMKPESYEWVENERRRIEAAKQKIALIKKDQENKALAQ\n>tr|Q3JRW6|Q3JRW6_BURP1 Putative membrane protein OS=Burkholderia pseudomallei (strain 1710b) OX=320372 GN=BURPS1710b_2292 PE=3 
SV=1\nMSTLTSPPLSVAAPSMRGRLNGVLFVGLFALAVTSVAQLPAVAHLGLSPLIVGIVAGALYGNLLREGMPASWAAGVDFSARKLLRIAVAFFGLRVSLQEIAQVGVPGLAVSALVVASTLAVGTWAGIKLMKLDRDTALLTAAGSAICGAAAVLAFESALRSKPHQSAMAVGSVVLFGTLSMFAYPLAYRAGWLHLDATGLGLFFGGTIHEVAQVVGAASDVGPEVARVATIVKMTRVMLLVPVLLVLGAWLARSARRSTAAGRGAPRKLAVPWFALGFLGFVIVNSLQMLPAAAIGTLNALDTFALTMAMTALGIETRMSQIRAAGPRALMTGLILYAWLVFGGYAIVWATQRWLG\n>tr|A0A661D2Y2|A0A661D2Y2_9GAMM Uncharacterized protein (Fragment) OS=Gammaproteobacteria bacterium OX=1913989 GN=DRQ40_10815 PE=4 SV=1\nQDTDPEPEPEPEPEPEPEPEPEPEPEPEPEPENTDDSDELEPVPSNKLSDYLTKSLGGSISDKDNNSVDEVEVDPQTKIESDAGVESELGSEQDQLLSMVADIEAEEADPPIVEDAAESSDEQNQPEDTKSVYGSEIEALSAKVKARTSELKAEAEKAQIRLDSNLEVKTSFDVELQLDKGSELEPNLENDSNLSATDIDLVNDEDFNLEQPEEQPEEQPEEQPEEQPEEQPEEPLPSEEQLDSMLSEVRALEQDKTLKNEKAEEPVVAKSTQDELQAILSSIPSFSDMNKK\n>tr|A0A6N6VZN6|A0A6N6VZN6_9BURK Magnesium transporter OS=Paraburkholderia madseniana OX=2599607 GN=FSO04_44420 PE=3 SV=1\nMATELLSAQNTDHFPLDRGYLFSGNGVGREIDANTAIEWLKHRDDDSTEFIWLYFHDIPTVPEGWPLQHVQVPEAFGDTLKEGSRSTRITHVYQTLIAVLNDVEYDLERKTSLKVATLWVNVGVHYLISVRNSPLRSVNQLRLAVEAVETFRSPMALLIHLLQEQADVLIGIVRTAAQAANDVDETLLAGRLPTRSGLGGIRRDLVRLRRLLAPEPAALFRLVSRPPHWVLEEDAQSLRQSAEAFSLTLRDMAGLQERIKLLEEEIADRVAEHTNRSVLILTAVAVIALPVNLISGLLGMNIGGLPFKYQPFQGLDQDVPPLARLSRRAVL\n>tr|A0A063XZJ1|A0A063XZJ1_9GAMM Biotin synthesis protein BioH OS=Nitrincola lacisaponensis OX=267850 GN=ADINL_1947 PE=4 SV=1\nMLSIESLAGQGADLVLVSGWGSDSGIFDPLLPLLSPYFRVHRVLWQTSGWPADDGQLRYQLLNCLRRQAPSRAIWVGWSLGANLALTLADSFPEKVSRLVTLAFNPCFVQRDDWSCAMPQTEFLHFQQNFLTAPAATLKRFQALQVMGSVDRRQVIAALQSSPAHLPPARLSQLLQLLADDLRPQLKRLSQPQLHCLGAQDTLVPCASLLAAYPHLNPQVELRCYAQSAHLPFLSEASRWCEDLRQWCQA\n>tr|A0A7V9MZW3|A0A7V9MZW3_9PROT Pentapeptide repeat-containing protein OS=Alphaproteobacteria bacterium OX=1913988 GN=H0U98_14635 PE=4 SV=1\nMMLPLPAMAADPAAVAKIHGGIVDCVGCNLAGADLSNTCVKDHDLHGADFTGADATLMCMSFANFTGVSFRGAELSGANLAGAKMDGADLTGAGTSITSFLGTDLTKVKGLTQKQLDIACGDATTRLPPGLNIHTCE\n>tr|A0A3A5H6E9|A0A3A5H6E9_9ACTN Recombination protein RecR OS=Nocardioides sp. 
K1W22B-1 OX=2321396 GN=recR PE=3 SV=1\nMYEGIVQDLIDELGRLPGVGPKSAQRIAFHLLQADPADVRRLADVLIQVKAKVKFCSICFNVSEEEQCRICRDPRRDPSVICVVEEYKDVAAIERTREFRGRYHVLGGAISPIDGIGPDQLRIRELLIRLADGAVTEVILATDPNLEGEATATFLTRNLKPLGLRVTRLASGLPVGGDLEYADEVTLGRAFAGRRSADD\n>tr|E9F284|E9F284_METRA Cytochrome b-c1 complex subunit Rieske, mitochondrial OS=Metarhizium robertsii (strain ARSEF 23 / ATCC MYA-3075) OX=655844 GN=MAA_06282 PE=3 SV=1\nMASLTSASRLCLRSAAKPAMPAVRALSTTAMRSDSAASSYQSPFKMGSDKGSSIPDFGKYMSKKGEGNNKLFSYFMVGTMGALSAAGAKSTVQEFLVNMSASADVLAMAKVEVDLNAIPEGKNVIIKWRGKPVFIRHRTQDEIDQANKVNVASLRDPQTDDERVKQPEWLVMLGVCTHLGCVPIGEAGDFGGWFCPCHGSHYDISGRIRKGPAPLNLEIPEYDFPEEGKLVVG\n>tr|A0A2M7QIU8|A0A2M7QIU8_9BACT Restriction endonuclease (Fragment) OS=Candidatus Roizmanbacteria bacterium CG_4_10_14_0_8_um_filter_33_9 OX=1974826 GN=COY87_02155 PE=4 SV=1\nMLFKNDWEKTVYESENKIIDFENKLKNITQFPKGKERDCIVKSRINQN\n>tr|B1KM11|B1KM11_SHEWM AAA ATPase central domain protein OS=Shewanella woodyi (strain ATCC 51908 / MS32) OX=392500 GN=Swoo_4641 PE=3 SV=1\nMDNNYINSMEQALSLSPDNFILRITLIQALYEHQQLSTALSLLKEVESCQVEQELHQILAAKIFIESGDGENALLFLSSNLPEVKILKAKAYQILNEFSLAREFYVEAVKENSSLEDIDFARELRVAKDALDNSKRIKLTVVANDDTDAVEVTRLIKPREEVISFSEVGGLADVKKQIRKKIITPFQKPSLFQRFKKKVGGGILLFGPPGCGKTLLARATAGECNATFINVVISDILDMYIGESEKKLHAIFEQARQNTPSVIFFDEIESLAAKRQHTREATSAKLVSQFLSELDGFAQNNHGVLILGATNVPWALDPAFRRPGRFDRVVFIAPPDVDARTDILKGLLKDRPGGESVDAQKIARLTSGFSGADLMNLVETAVDEAIDHSIESGEEVPLNQTFVKEALKEVNPTTLEWLTMARNYAKYANDSGQYNEVLAFLRKHGK\n>tr|A0A2T7C6Y6|A0A2T7C6Y6_9POAL Glyco_trans_2-like domain-containing protein OS=Panicum hallii var. 
hallii OX=1504633 GN=GQ55_9G257400 PE=4 SV=1\nMAPTTVVGSSSQLSPHPNVLLLVPLPLVASRPPTPPPSAGRSYHHGITPTPTHPALSKPNRKKGARSQSCCTRAHPPPHSSLRSVRSKQGTQPARVPMPALAAAAAAWALRAAVWACLAASAMLVAEAAYMGLASLVAAVALWRRPGRRYRWEPMPGGVGGDVEAGPAAAAEFPMVLVQIPMYNEREVYKLSISAACALTWPPDRIIIQVLDDSTDPIIKELVELECLDWASKKINIKYEVRNNRKGYKAGALKKGMEHIYAQQCDFVAIFDADFQPESDFLLKTIPFLVHNPKIALIQTRWEFVNYDVCLMTRIQKMSLDYHFKVEQESGSFVHSFFGFNGTAGVWRVSAINQSGGWKDRTTVEDMDLAVRASLNGWEFLYVGDIRVKSELPSTFQAYRHQQHRWTCGAANLFRKMAWEIITNKEVSIWKKHHLLYSFFFVRRVIAPLVTFLFYCVVIPLSAMVPGVSIPVWGLFYIPTAITCMNAIRNPGSLHLMPFWILFENVMSMHRMRAALSGLLETARANDWVVTEKVGDPAKDDLDVPLLEPVKPTECVERIYIPEILLALCLLICASYDLVLGSHKYYLYIYLQAFAFIVMGFGFVGTRTPCS\n>tr|A0A3N5TBJ3|A0A3N5TBJ3_9DELT NlpC/P60 family protein OS=Deltaproteobacteria bacterium OX=2026735 GN=EHM37_16680 PE=3 SV=1\nMGRLVRGTMILPFFVLMAAGCTPKYDYTIHKPRVVYQQPSRQALRTSLGEILGKKYVWAEEGPEAFDCSGLTYYAFGRMNLEIPRVSSDQAQGGVEVPRDALQYGDLVFFDTGKNFTGTVTHVGVYIGDEKFQQASTNYGKVVISSLNDSNYANRFLTARRYLTDAASPRQTPTGWARNHGY\n>tr|A0A418MJS3|A0A418MJS3_9BACT Uncharacterized protein OS=Fibrisoma montanum OX=2305895 GN=DYU11_05040 PE=4 SV=1\nMKSALSKGLLVVAVLSLASCDYQKYNTIRQSDYRGNDPYVYGPNKDSAAIQSKYKYTPNPALEERTQKIREKLFGAGTIGEGA\n>tr|A0A2Z5TXE8|A0A2Z5TXE8_9MYCO Putative lipoprotein LppW OS=Mycobacterium pseudoshottsii JCM 15466 OX=1136880 GN=lppW PE=4 SV=1\nMRARPLTMLTAAAAVALVVSLVLTGCEAKVQAKAYGTDDRESSRQQSQPQQQQLIELLLRAITPPEDPAALLPSAGLVGVQERIQRATEEAAAKGATITVAILDRATHQLVSNGKTSIIATASVSKLFIADELLLRASQGKNTLSAQDRQALENMLRSSDDGAAEQFWGELGGDAIVTEIATRYGLAATAPPSDGRWWNTFSSAPDLIRYYEMLLDGEGGLPLQSAAIIVNDLAQSTPNGIDGYPQRFGIPDGLYAEPVAVKQGWMCCIGADWMHLSTGIIGSDRRYIMVIESLQASDDATARETITQAVKTIFPAGRI\n>tr|A0A839NTR2|A0A839NTR2_9SPHI Large subunit ribosomal protein L5 OS=Sphingobacterium sp. 
JUb56 OX=2587145 GN=FHR29_003793 PE=4 SV=1\nMTYVPRLKVKYAEEIRTALKEKFQYKSVMQVPKLEKIVVSQGVGAATSDKKLIDNALSELTLITGQQAVATKSKKDISNFKLRKGMPVGARVTLRDNNMYEFLDRLIAVSLPRIRDFRGINDKGFDGRGNYNLGITEQIIFPEINIDKINKIQGMDITFVTSAGNDVEALELLKQFGLPFKNQNTNNNG\n>tr|A0A432QAS4|A0A432QAS4_9DELT Bifunctional 4'-phosphopantothenoylcysteine decarboxylase/phosphopantothenoylcysteine synthetase (Fragment) OS=Desulfobulbus sp. OX=895 GN=DSY50_03665 PE=4 SV=1\nPARYLSNRSSGKMGYALARVARRRGGRVTLVSGPVNLAPPPDVECVNVLTAAEMHQAVMERAADSSIIIKAAAVADFKPQESSPRKIKKSGADLTLELTANPDILAGLGKARTDHQLLVGFAAESDNHEDEGQRKLYDKNVDLMVVNDILGEKTGFDVDTNQVTLITRKNVLPLPFLSKEETAGRILDKILELSRK\n>tr|A0A840G848|A0A840G848_9BRAD 3-carboxy-cis,cis-muconate cycloisomerase OS=Bradyrhizobium sp. CIR18 OX=2663839 GN=GGD65_001449 PE=4 SV=1\nMSTSLSPLLAPMLSSAAMRAVCDDRSTLQNMLDFEAALARAEAATDVIPASAVVSIEAACKADSFDMTALAEAATRSGNLAIPLVKMLTANVGKADTEAARYVHWGATSQDVIDTATMLTLRAGLDALDADLSRAIRGFAALARSHRNTAMVARTWLQHALPMPFGLKAAEYAASLARARCRLRRLSREGLALQFGGAAGTLAALGDKGLAVAERLAQELNLPLPEAPWHTHRDRIAEAASAFAILAGTCGKIARDVSLMMQTDVGEAFEPAGEGRGGSSTMPHKRNPVSAASALGAATMAPQLAATIFAAQVQDHERSAGPWHAEWPTLPQLMLVTSGALAAIVDIAEGLDVDAARMRSNLDATHGLIMAEAVTFALADKIGKSDAHHLIEAASKRAVAEKKHLREVLTADSQVTAHLSPEKIAALFEPMAYQGASQALIDRLLDSLDRK\n>tr|A0A7N8WV28|A0A7N8WV28_9TELE Transducin-like enhancer protein 4 OS=Mastacembelus armatus OX=205130 PE=3 
SV=1\nMYPPARHPVPHQPGQPFKFTVTESCDRIKEEFQFLQAQYHSLKLECEKLASEKTEMQRHYVMYYEMSYGLNIEMHKQVGNFFFFFLLECQQEVKPHYSRCQMNAQQQLQAQHLSHGHAIPVPLTPHPAGLQPPLPPGAGTASLLALSSALSHQLPLKDERKHHDNNSEHPRGKDCPVCVYLKIKCPSVCVCQESDGEKSDDNLVVDVSNEDPASPHGSPAHSPRENGLDKNRLLKKDAPLSPSSVASSSSTPSSKSKEINLKSTTPVSKSSTPTSRSDALTPSSTATPGLRSAPGKPSGVDTLAPGLRTPLAVPCSYPGPFGMVPHPGMNGELSGVGAAYTGLHNISPQMSAVAAAAVYSFVVGFDPHHHIRVPGLPPNLSGIPGGKPAYSFHVSADGQMQPVPFPPDALIGPGIPRHARQINTLSHGEVVCAVTISNPTRHVYTGGKGCVKVWDISHPGNKTPVSQLDCLNRDNYIRSCRLLPDGRTLIVGGEASTLSIWDLATPTPRIKAELTSSAPACYALAISPDSKVCFSCCSDGNIAVWDLHNQTLVRQFQGHTDGASCIDISNDGTKLWTGGLDNTVRSWDLREGRQLQQHDFTSQIFSLGYCPTGEWLAVGMENSNVEVLHVTKPDKYQLHLHESCVLSLRFAHCGKWFVSTGKDNLLNAWRTPYGASIFQSKESSSVLSCDISIDDKYIVTGSGDKKATVYEVIY\n>tr|A0A3D9SW97|A0A3D9SW97_9ACTN Uncharacterized protein OS=Thermomonospora umbrina OX=111806 GN=DFJ69_4288 PE=4 SV=1\nMLTSKTKVAMGGVALGVIALWLIPGWILTLLVLGAIAVPVAAYLMLDPSQRRKVRARGRKRLGA\n>tr|A0A2U3LCS8|A0A2U3LCS8_9DELT PC4 domain-containing protein OS=Syntrophobacter sp. SbD1 OX=2043167 GN=SBDP1_820009 PE=4 SV=1\nMAKEPQIVHSFPKNPLEEVRSSVTYYKGKQYVDIRIYYKGDDGEFHPSKKGVTLSVELFPELETGFQKLKEALEEEQ\n>tr|A0A173RRC4|A0A173RRC4_9FIRM Auxin efflux carrier OS=Faecalibacterium prausnitzii OX=853 GN=ERS852582_00615 PE=3 SV=1\nMELALITAQQVAVLFLLIGTGMVAVKTGVLKLENKQALSNLLVYIIVPAMVVNSYRMEFSAQILHNLLAAFGMSVLSVLLGTVITLLLTARKTGSRMPIFRFACIFSNAAYMGFPLISALFGSEGLLYASAYVTVFNILLWTLGYGLVSGGSSVKEIARSLVRTPVLYAIVVGLGIYLLQIPLPALITQPLELLAGVNTPLSMLITGMLIAAGDVRSIVTDKHIWKLASVRMLLIPAATLALFGVLGFHGTATQVVTLLECCPAAAITSVFAVQFGHDEHFAAGSVVLTTLLSIITLPLCALIITMVM\n>tr|A0A3M1TWK5|A0A3M1TWK5_9BACT Uncharacterized protein OS=Bacteroidetes bacterium OX=1898104 GN=D6730_19965 PE=4 SV=1\nMLIGQNPCVCIHKGFFFERKNRLPSAAHNNAAVGALSYRNVKNTGPMAPKGDKCLIFNFRK\n>tr|A0A7C3Z4Q6|A0A7C3Z4Q6_9BACT Uncharacterized protein OS=bacterium OX=1869227 GN=ENW92_06685 PE=4 
SV=1\nMSKFNETIRGIEDRLDLLQDNIQAIKDDLKILDSISTKIDVLTEQVKSHDIILNGNGSEGLKSKISRFEEIISVLKEKIDNIVTLLFGDLNNEGIKSKINLIDFKIGLISAIGGVAGAVAVTIMSDTIVNLIKKIF\n>tr|A0A2T6RAW0|A0A2T6RAW0_HELPX Methionine--tRNA ligase OS=Helicobacter pylori OX=210 GN=metG PE=3 SV=1\nMQKSLITTPIYYVNDVPHIGHAYTTLIADTLKKYYTLQGEEVFFLTGTDEHGQKIEQSARLRNQSPKAYADSISAIFKDQWDFFNLDYDGFIRTTDSEHQKCVQNAFEIMFEKGDIYKGTYSGYYCVSCESYCAISKTDNTNDKVLCPDCLRETTLLEEESYFFRLSAYEKPLLDFYAKNPEAILPIYRKNEVTSFIEQGLLDLSITRTSFEWGIPLPKKMNDPKHVVYVWLDALLNYASALGYLNGLDNKMAHFERARHIVGKDILRFHAIYWPAFLMSLNLPLFKQLCVHGWWTIEGVKMSKSLGNVLDAQKIAMEYGIEELRYFLLREVPFGQDGDFSKKALIERINANLNNDLGNLLNRLLGMAKKYFNHSLKSAKITAYYSKELEKAHQILDNANSFVPKMQLHKALEELFNVYDFLNKLIAKEEPWVLHKNNESEKLEALLSLIANALLQSSFLLYAFMPKSAVKLASAFNTEITPDNYERFFKAKKLQDMILQDTEPLFSKMEKIERTEKAGEASPEKNEKEKKDRKEKAPLKQENYIGIEDFKKVEIKVGLIKEAQRIEKSNKLLRLKVDLGEGRLRQVISGIALDYEPESLVGQMVCVVANLKPAKLMGEMSEGMILAVRDSDNLALISPTREKIAGSLIS\n>tr|A0A6P8YKE1|A0A6P8YKE1_THRPL Non-specific serine/threonine protein kinase OS=Thrips palmi OX=161013 GN=LOC117644815 PE=4 SV=1\nMEIVGDYEYNSKDLIGHGAFAVVFKGRKRKDPNYVVAIKSISKKSLAKSQNLLGKEIKILKELTELHHENVVALLDCKESPLQVFLVMEYCNGGDLADYLSVKGTLSEDTIRLFLRQLAGAMKALYAKGIVHRDLKPQNILLSHSGGKPCPQPQEIRLKIADFGFARFLQDGVMAATLCGSPMYMAPEVIMSLQYDAKADLWSLGTIVFQCLTGKAPFQAQTPQALKNFYEKNANLSPKIPAGTSPELRDLLLGLLRRNARERMTFDSFFTHPFLQREAEPTPAPPMPGELPPSPRALFQPPATQSPTHKARLDTCGSQPVPANIPSDHSSDSNPERPSRTRTSSASAASPPRPSFLPISEPIPVPTHRDAFQQRQSIHSQDNEPSKGSVPRSQPINMRRASDQRAANATPDLSSLSPPAVQFMIGTPPNGGCGQRRRSASGSSCETPPPVSTWQVTPTSSPLRRSGASSPLLSGPLAVLPSILGSPNRMSENNNMRQSPLMPFGSRAMTLPEISEAGNFQRLFQDANQPSNIDAPLTFLAPELPEETLLEREHNETLAKLHFVLALSDCVLELAGSRGTPLAALTESVNLGGGGSPNGSSNITGNGVISEGARRAEQLVLLVRALQLLSSGLSLATQQIRAGHLQPSSSVKSVVGIMNQKFRQCLADCKQLNTPGLLQKAGVDPATTNIAADKILYNHAIQMCQSAALDELFGNPEDCFQRYQTAQILLHSLSQQVHHQQDRALLTKYKDAVEKRLFVLQQQGFIYSTQCFTHLA\n>tr|A0A151YSI4|A0A151YSI4_9GAMM Mandelate dehydrogenase OS=Acinetobacter lactucae OX=1785128 GN=AWW73_12870 PE=3 
SV=1\nMSRKLINVEDYRLQAKRTLPRIIFDYLEGGAEDEKGLNHNRTIFDQFRLKPKRLVDISQRDISCKIFNKKWDAPFAIAPTGLNSSLWPHADSILAKSAAKANIPFMLSTASNMSIEAVAKSCDGEKWFQLYVVHQELAVKMVQRALSAGYTTLIITLDVGVNGYRERDIRNGFAIPLKFSPSLILDGMMHPGWSLRFLSQGMPKLANFESSEAHSLEVQNALLKRQMDTTFNLESLKKIRDLWPHTLLVKGLVRQEDALKAIEAGADGVILSNHGGRQLDCSISPMETLYEVSQTIEQPVLIDSGFRRGSDIVKALCLGANMVCLGRATLYGLAANGEAGVDDVIQLLKQDVDRTLAQIGCPSVSQLNKEYIT\n>tr|A0A502DVG8|A0A502DVG8_9MYCO Uncharacterized protein OS=Mycolicibacterium hodleri OX=49897 GN=EAH80_27785 PE=4 SV=1\nMERTDRRKAQAAIIGGTALLAMGIIGGAAGGPGDGKTALVSGGSMQTGETTTLTYTGTIAPVKAVPSVKATPH\n>tr|A0A6P7I339|A0A6P7I339_9TELE caM kinase-like vesicle-associated protein OS=Parambassis ranga OX=210632 GN=camkv PE=4 SV=1\nMPFGCLTIGEKKDYNSPSDVTDKYDLGQIVKSEEFCEIFRAKDKTTVKMYTCKKFMKKDGRKVRKAAKNEIFILKMVKHPNILQLVDVFETKKEYFLFLELATGREVFDWILDQGYYSERDTSNVVRQVLEAVAYLHSLHIVHRNLKLENLVYYNRLKHSKIVISDFHLAKLENGLIKDPCGTPEYLAPEVVARQRYGRPVDCWATGVIMYILLSGNPPFYDETDDDDYENHDKNLFRKILAGDYEFDSPYWDDISDSAKSLVARLMEVDQDQRLTAQEAINHEWISGGAASDKNIKENVCAQIEKNFARAKWKKAVRVTTIMKRLRAPEQSDSRSTSPAAGTPADTAAPPADPAAPSSAAVPEVSPAAVTELPAGAPPEAGAGAAAEEPQPPNPALQVAEPASRCNGEASAILHTAAEAGDEQG\n>tr|A0A521F3G2|A0A521F3G2_9RHOB Do/DeqQ family serine protease OS=Ruegeria faecimaris OX=686389 GN=SAMN06265380_11652 PE=4 SV=1\nMRKVLCSLLLTVAAVSAKAETKVPQTQVEISLGFAPVVKQAAPAVVNIYAKIVREGRSNSLFSDPFFQDFFGGGFGEPRPRVQNSLGSGVILTDDGYVVSNYHVVGSATEIRVVTTDRREFSAEVVLGDQESDIAILRLKDAEALPSIDMRDSDLVEVGELALAIGNPFGVGQTVSSGIISGLARTGTATGNARGYFIQTDAAINPGNSGGALIDVNGDLIGINTSILTRSGGSNGIGFAIPANLVAEFLRQAQAGNDSFVSPWAGMAGQHMSADIAESLGLVIPQGVVISDLHALSPLAEAGLQVGDVVTHVDGDEVNSPAEMKFRMSVAGVGGTSVVTRLRGEDRAELEVALVKAPEVPAAEVTTLNDETVMPGLTVSRINPAVIARLGLLLSQTGVVVVDAGRYGGRSGLRPGDVVDGINGARVERPADVVKALTDPGRRINLDILRGGRPVSLRFRL\n>tr|A0A1H9D944|A0A1H9D944_9BACT Monosaccharide ABC transporter substrate-binding protein, CUT2 family OS=bacterium A52C2 OX=1855383 GN=SAMN05216548_102373 PE=4 
SV=1\nMKSIRSLAVALALGVAAVVSAQAEAADITVGFVPGTVSDPFFQAMKKGAQQAADRLGMKLNWQGSSGEYSPQQQLPFVDAMLANNVSVLIFCPTDPDSMQASVTKAQIQGIPVITVDTTVTDQSSVTSFITGDNVAGGRQAAQTLAEQIGNKGKVFIMATSPSATTNTLRRQGFEEEMKNHPDIKIVGIQYSQSQPDRATSAVNTVLLDQPDLAGVFALDGTNTQGAVAAIRNSGKTGKVKLVGYDAYQAEVDALKDGVVTALVAQRPSEEANMAMEFALAKVSGKDTDKIQKNAVIPNVVITKDNLSENEKYVYSE\n>tr|I7C407|I7C407_PSEPT Sulfate adenylyltransferase subunit 1 OS=Pseudomonas putida (strain DOT-T1E) OX=1196325 GN=cysN PE=3 SV=1\nMSHQSDLISEDILAYLAQHERKELLRFLTCGNVDDGKSTLIGRLLHDSKMIYEDHLEAITRDSKKVGTTGEEVDLALLVDGLQAEREQGITIDVAYRYFSTAKRKFIIADTPGHEQYTRNMATGASTCDLAIILVDARYGVQTQTRRHSYIASLLGIKHIVVAVNKMDLKGFDEGVFESIKADYLKFAEAINLTPSSLHFVPMSALKGDNVVNHSEQSPWYAGPTLMEILETVEVSADRNFTDLRFPVQYVNRPNLNFRGFAGTIASGVVHKGDEIVVLPSGKSSRVKSIVTYEGELENAGPGQAVTLTMEDEIDISRGDLLVHADNVPPVTDQFDAMLVWMAEEPMLPGKKYDIKRATSYVPGSIASITHKVDVNTLEQGAASALQLNEIGRVKVALDTSIALDGYDSNRTTGAFIVIDRLTNGTVGAGMIIAPPVLPHGSTGHHGKQAHVSTEERALRFGQQPATVLFSGLSGAGKSTLAYAVERKLFDMGRAVYVLDGQNLRHDLNKGLPQDRAGRTENWRRAAHVARQFNEAGMLTLAAFVAPDAEGREQAKALIGKERLVTVYVQASPLVCRERDPQGLYAAGGDNIPGESFPFDVPLDADLVIDTQATSVDEGVKQVLDVLRQRGAI\n>tr|A0A2P5F9R2|A0A2P5F9R2_TREOI Son of sevenless protein OS=Trema orientale OX=63057 GN=TorRG33x02_095620 PE=4 SV=1\nMARRTAQVLDSIHLMNTTQIFKESIRVILLHPTQFHSISIFLFSPLPISLFISHLLIHHFPNIPSSTISLTHNLFGFPLPKLFSKTMIHIIICFPSSITFSLLGRAAIVQAVSDIYNGINLDGRRLFMRSGLTWIKLLYTTFWEYLIVFGLLGVFALNLVIMPKMFHAFGICSEILGFWGVLGVLGIPFCVAFAHVMVVGNLARVLSVLEGNCYGFESLLKAKSLMEGRRQIALVMALLSNIGFRLVESLFEFRMCKGINLWEGPLLVSMYSSVLVFDTVMNVVFCYACKSFNDQ\n>tr|S1PYQ0|S1PYQ0_ECOLX Starvation-sensing protein RspB OS=Escherichia coli KTE182 OX=1181728 GN=A13A_01543 PE=3 SV=1\nMKSILIEKPNQLSIIEREIPTPSAGEVRVKVKLAGICGSDSHIYRGHNPFAKYPRVIGHEFFGVIDAVGDGVESARVGERVAVDPVVSCRHCYPCSIGKPNVCTTLAVLGVHADGGFSEYAVVPAKNAWKIPEAVADQYAVMIEPFTIAANVTGHGQPTENDTVLVYGAGPIGLTIVQVLKGVYNVKNVIVADRIDERLEKAKESGADWAINNSQTPLGESFAEKGIKPTLIIDAACHPSILKEAVTLASPAARIVLMGFSSEPSEVIQQGITGKELSIFSSRLNANKFPVVIDWLSKGLIKPEKLITHTFDFQHVADAISLFEQDQKHCCKVLLTFSE\n>tr|A0A0D8JWE6|A0A0D8JWE6_COCIM 
Uncharacterized protein OS=Coccidioides immitis (strain RS) OX=246410 GN=CIMG_11771 PE=4 SV=1\nMVHPEPDRIQTGIANDAPVNRLLLPSTSLLDTQFTRTPLGFRGGPDEFPADVDKEFTKSE\n>tr|Q4S6C8|Q4S6C8_TETNG Chromosome 9 SCAF14729, whole genome shotgun sequence (Fragment) OS=Tetraodon nigroviridis OX=99883 GN=GSTENG00023347001 PE=4 SV=1\nLLLGLFVVCGLALLGLLAFVSWKFAGAARQPAKACCSGSSLSPERHPLQPPLPLPPSPQHPLVTMATEKVKDPAGSLGFLEAAVKISHTSPDIPTDVQLSMREHFLRRTQRMQRQTTEPASSTRHNSFKRHLPRQMQVGSLDLGNDYVLEKEEKSTSLGRIQPELYQQKDLESEDSSKNSSGKNCGSINFSLKYDYENQALLVDILKAVDLPAKDLCGTSDPYVKVYLLPDRKKFQTRVHRKTLNPTFSETFRFPVPYEELAGRKLHMSVFDFDRFSRHDMIGEVELDNLFDLSDLSRETNVWRDIQYATSESVDLGEIMFSLCYLPTAGRLTLTVIKCRNLKAMDITGYSDPYVKVSLICDGRRLKKKKTSIKKNTLNPSYNEAIIFDIPPDSMDHVSLHISVMDYDLVGHNEIIGVMRVGCNAEGLGRDHWNEMLAYPRKPVAHWHPLLEPKKSEKEWKARTASFDSQGSCPSPRPPASP\n>tr|A0A4Y6N1A7|A0A4Y6N1A7_SALET AI-2E family transporter OS=Salmonella enterica subsp. enterica serovar Indiana OX=286783 GN=D4X88_10560 PE=3 SV=1\nMLEMLMQWYRRRFSDPEAIALLVILVAGFSILFFFSGLLAPLLVAIVLAYLLEWPTARLQAIGCSRRWAASIVLILFVGILLLMAFVVMPIAWQQGIYLIRDMPGMLNKLSDFAATLPRRYPALMDAGIIDAMAENMRTRMLNMGDSVVKYSLASLVGLLTLAVYLVLVPLMVFFLVKDKEQMLNAVRRVLPRNRGLAGQVWNEMNQQITNYIRGKVLEMVVVGVATWLGFLLFGLNYSLLLAVLVGFSVLIPYIGAFVVTIPVVGVALFQFGLGTEFWSCFAVYLIIQALDGNLLVPVLFSEAVNLHPLVIILSVVIFGGLWGFWGVFFAIPLATLIKAVVHAWPDGQVTDTSS\n>tr|A0A265NA24|A0A265NA24_9BACI Serine/threonine dehydratase OS=Virgibacillus indicus OX=2024554 GN=CIL03_13610 PE=3 SV=1\nMVTVKNIYKAREQISDVINKTPILSSSQLSSICGNRMFFKAEHLQKTGAFKIRGATNKVKQAVKDGATFVTAASSGNHGQAVAYIANELGVPATIVVPEDVNPSKEAAIKAYNGEIERCGLTSAERLPRAEALAAENNGGVIPPYDDPLIIAGQGTVGLEILDQLDGVDVVVVPIGGGGLISGILTAIKEIKPSIKVIGVEPEKANDTYQSIQQGKITSIKEAATIADGLRTSQPGSLTFPIVQKYVDEIVLISEAEIRKALFFILQRMKQLIEPSSAVTVAAAMFDKLNVRDKNVVCVLSGGNVDLKQLGEMNPEK\n>tr|A0A2A5WAU1|A0A2A5WAU1_9GAMM Sulfite dehydrogenase OS=OM182 bacterium MED-G28 OX=1986256 GN=CNF02_07660 PE=4 
SV=1\nMGPKKQNRREFLKQGAAIAGGAAVGAASQSASAQLPGPEGFLHGRDDIVAYGQRSRFIESKRIPHGGRHSPDTFGLDFHIATPLQDQHGVITPSSLFYMGTTRGSYIPDIDPEKHRLMIHGLVDNPLVFTMEELKRLPSVTRMHFVECAGNRSNRRHTTVQETHGMTSNAEWTGVLLSTLLKEAGVKEGADWIVAEGVEEVKGASSIPMTKAMDDTLLAYSMNGEPVRPQQGFPLRMLAPGFEGIFNVKWLRRIKVVDQYYMTYNDYGHLTQDPATAALGYQIGPKSVIVHPSGGQTLPGAGYYQVSGLAWSGGGKVARVEVTTDGGETWFDAEIRGEPQAMAHTLFAFEWEWDGSPCELQSRCIDEIGQVQPSRAEVAEFWNQPADQPPRVRGQDNSIQPWRIESDGSIHNAIA\n>tr|A0A1J5QM58|A0A1J5QM58_9ZZZZ L-cystine import ATP-binding protein TcyC OS=mine drainage metagenome OX=410659 GN=tcyC PE=4 SV=1\nMSPTEEPPPMGEVLLSVHGLSKSFGANPVLRSIDLTIERGRVLALIGPSGSGKTTLLRCLNGLELADGGTINTPGELTLDFTTPPTRSQLNALRDRSGMVFQHYNLFPHKTVLQNVLEGPLVVQRRPRAEATASALELLARVGLSEKTHTYPFQLSGGQQQRVGIVRALALQPQLLLFDEPTSALDPELVGDVLRLIKELAADGWTMVIATHELEFAREVAHEIAFLDAGTILERGHPSQLLRDPQHERTRQFLHRVLHPF\n>tr|A0A0M0J7I6|A0A0M0J7I6_9EUKA Cyclin-y-like protein 1-like protein OS=Chrysochromulina tobinii OX=1460289 GN=Ctob_004972 PE=4 SV=1\nMGDEGLTLCARTWRPALLMAIVIASKVVYDEKVYLADYRDMLPEFCLDAASAQELELLKLVNYNTTVRRGQYARYYYALEDVARNQSSNQIFAARS\n>tr|A0A7X6ZE57|A0A7X6ZE57_9FIRM Sporulation sigma-E factor-processing peptidase OS=Syntrophomonadaceae bacterium OX=2093811 GN=spoIIGA PE=3 SV=1\nMTGHKVYADLTLIINLLMDAVILWAAAKLAGFKFSYTRIFFTAMLGAIYAVGYLFYPMNIFYSFPLKIIFSCFLILLAFYPQSWKDLKRAFQYFYLINFIAAGAITGFASLTAGMKHINNISILWLLMGVIIVIGLGKWGQKYLVNRIIPQLLNYMVEIKFNGHQCSGSGFLDTGNMLRDPLTNRPVLIAEYAWLKNFLPLDLIEFFETGSSETEILSFAANSTWADRVRVIPFSSIGRHNGLLLGFRADEINVSLGDRNICHKNLIVAVYRSKLCQDGHYQMLVPAEILQSG\n>tr|R6ZSV7|R6ZSV7_9BACE Putative CTP pyrophosphohydrolase OS=Bacteroides fragilis CAG:47 OX=1263046 GN=BN669_00524 PE=4 SV=1\nMKSIEVVAAVIRLGEKYLCVQRGQTKFSYTSFRYEFPGGKVEEGESLQEALQREIMEEMDYVIEVGEKLLTVHHTYPDFEITMHAFLCHPVGQRYVLKEHIAAQWLSTREMAILDWAEADKPIIRKISEQ\n>tr|A0A535V1X9|A0A535V1X9_9CHLR APC family permease OS=Chloroflexi bacterium OX=2026724 GN=E6I76_01260 PE=4 
SV=1\nMRGGRARRKEFDKVAEGYLQAKEESVKPTTQLGRLRRALLGRPLASKQQIHERLTKVKALAVLSSDALSSVAYATEQILLVLGAAGAAAYSYSMPIMVAILVLLIAVGLSYRQTIKAYPKGGGSYIVASDNLGPLAGVVAGSALMTDYVLTVAVSVASGVDSIVSAASAMQAYRVELCVAFVAILIVGNLRGIRESGSIFAAPTYLFIGGILLMLVVTGLRWGTGNVHEATPMLGKATQQVSIFLILRAFASGCTALTGVEAISDGVPAFKPPEWRNARTTLTVMVVLLATMFMGITISARATGARAYDSSDPNYQTVISQLAHTAFGSTFLYYYVIGATTAILVLAANTSFSDFPRLFFFMARDDYAPHLFKRLGDRLAFSNGIIVLGGLAILLLVVFRGRTDALIPLYTIGVFVAFTMSQAGMVSRWLRLREPGWQHGLAMNAVGMTLTAIVFVVTAGDKFTEGAWIVLVLIPLLVMTFFSIHRHYSEVTVDLATETPTSPDELKPVVIVPLADLNGPALQSLALARTLSDQVIAVHISDDPDEIARLKAKWEAWGDHVPLEVIESPYRSLVRPLLAYIDAIDRQRRDDTIVVVLPEMVATRWWHQVLHNQTALRLKAALLFRPGTVVVNVPYHLRRYQHQRRRLRARHGGDDAL\n>tr|A0A7T7DGS6|A0A7T7DGS6_9BETA Cy128 OS=Cynomolgus cytomegalovirus OX=1919083 PE=4 SV=1\nMETHLFSDLAFEQVFEEDPQLPLHVVLDPVDLSFAEAETVRYVYYRSDPDPVGRWRRAAFRVFLRPFELLTYLRDAGLMVAPTVRVVCHHALFTTLGIRCAEQRLSGAQMLYLRLVWNEERFRDWEFLVRDLLREEMSVCQSTEPADRPDPSLLMTDAMLELAKSSSTTAPFFEMPSSGTGNNNASSASAADESSQVERRVIQFLRGDSELTYHAGPLEPPSKIRGHEIVQPRIEVNPDVIYASGPHEDDRTSKTDEWQKGGVMRLGSVWDVRQRLRLHVLWYAQSFWRSRGLKYEDREEDLRLTLDSYFDRLSVEYQVLREVYREIKAVLRSDRMVAQKFSCHLSIETSWLLIWELFDRALELWRDQADVNSCIIKALAHKLRSKAQSSHGNSVSAGKTNPTETWYADVVRCVRAEVNLGLEVQVETCSQSGLWLVRGRDGQLRKWITQPQTYVLYATPGLVFHWVLPGGFAISSRVCLDGVGRDHFERFQMSAPVLTKRMLLETGWTRTEASGVPSCGL\n>tr|A0A852XDT0|A0A852XDT0_9MICO GTP-binding protein Era OS=Microbacterium esteraromaticum OX=57043 GN=GGD75_001854 PE=4 SV=1\nMTEQTRSGFVTFVGRPNVGKSTLTNALVGEKIAITSEKPQTTRRAIRGIVNRPDGQLVIVDTPGIHKPRTLLGERLNDLVEQVLGDVDVIGFCVPATEKVGPGDRRIAASLDGYPRAKKVAIVTKTDAADKDDIVERLMEVDSLREDWAAVIPLSALTREQLDVLADEMLQLMPVGPRLYDEGVVTDESTDDRIAEMIREAALEGVRDELPHSIAVVIDDVEPRGDSDLTDVYASIIVERDSQKAIIIGHKGSRLRSVGATARAGIEELLGTRVFLKLHVKVAKEWQRDPKQLGRLGF\n>tr|A0A7G9B3G3|A0A7G9B3G3_9FIRM MarR family transcriptional regulator OS=Oscillibacter sp. 
NSJ-62 OX=2763056 GN=H8790_11715 PE=4 SV=1\nMDKTERQTTKITREAAKLTLQTMRAEGGTAEFDFIHLVRHYPGITQAELREALKIDKGAAARRAAHLEAKGYLVRRENPADGWSQLLYATEKAEKLKNSKAGIESAFKRLIS\n>tr|A0A2K6TWZ0|A0A2K6TWZ0_SAIBB DNA repair protein OS=Saimiri boliviensis boliviensis OX=39432 GN=XRCC3 PE=3 SV=1\nMRPLFCLSCEVNHPGDQPTDRMDLDLLDLNPRIIAAIKKAKLKSVKEVLHFSGPDLKRLTNLSSPEVWHLLRTASLHLRGSSILTALHLCQQKERFPAQHQRLSLGCPVLDALLRGGLPLDGITELAGHSSAGKTQLALQLCLAVQFPRQHGGLEAGAVYICTEDAFPHKRLQQLMAHQPRLRTDVPGELLQKLRFGSQIFIEHAADVDTLLECVNKKVPVLLSRGMARLVVIDSVAAPFRCEFDSQASIPRARCLQSLGATLRELSSAFQSPVLCINQVTEAVEEQSTVHGPPGFWDERISPALGITWANQLLVRLLADRLREEEAALGQPVRTLRVLFAPHLPPSSCSYTVSTEGVRGTPGTQSH\n>tr|A0A2M7XMW0|A0A2M7XMW0_9BACT Uncharacterized protein OS=Candidatus Shapirobacteria bacterium CG_4_9_14_3_um_filter_36_12 OX=1974877 GN=CO168_02590 PE=3 SV=1\nMVETELLKNLKTYFGYDGFRALQEEVVGATLAGKDSLVLMPTGGGKSICFQLSALMLPGITLVISPLIALMKDQVDSLKNNGIKAEFINSSLTTGEILRIETEIIGGKIKLLYVAPERLVLPQFLEFLKTIKISLIAVDEAHCISEWGHDFRPDYRNLTILRQNFPSVPIMALTASATEKVRQDIGLKLNLNNHQLFISSFNRPNLYYTVLPKRNTFEQLLSLVEKYKNNSIIIYAFSRKETDELAVNLSTQGYQALAYHAGLESNIRREVQDKFIKDEVKIIVATIAFGMGIDKSDVRLVVHYSLPKSVESYYQETGRAGRDGEKSECVLFYSYGDTAKQNYFIRMMTDGVVRLNAQKKLREMVNYCELKSCRRQYLLKYFGEELGNNCQSCDCCVKSPPTPSLTKEGNLNLFEKLRILRKQIANQNKVPPYIIFSDATLREMVSFLPKNETEFLKINGVGAEKLKRYGRQFLETINSQNAPKVFLSGTYLETQKMWVAGLSIEQIAKNRGYTNETIINHLEKIIESGVQLNLDKIIFDPTRLKIIKDAFAQTNDTKLAPIKAILDDDYSYEEIRLGRLMVAK\n>tr|B4ELZ0|B4ELZ0_BURCJ LysR family regulatory protein OS=Burkholderia cenocepacia (strain ATCC BAA-245 / DSM 16553 / LMG 16656 / NCTC 13227 / J2315 / CF5610) OX=216591 GN=BCAM2812 PE=3 SV=1\nMTEQSKNLQSGYAAHAYPLADLTRPLPPLAAIQSFVAAAQLGSVSKAADHLCRTQGAVSRQIQQLETHYRCALFVRHVSGLTLTAEGNALLTVAVNVLTQLVRHADVHARATSVLTLKLPSTFAVRWLLPRLPDIQRAMSGTELRISTSADDTPDFTTSDVDAVVVRGTGQWTGMEAIPLFAEMLTPMCAPALAASLRSVADLAQVELLHPGPSHAEWRCWLDHVGARQVDAGRGLVFDTLELTLAASMEGHGVAIGDPRMARDRLRAGSLVTPFEDVARDGLSYFLVYPPQRAAQPKIRALADVLLRLAREDR\n>tr|E9HNJ7|E9HNJ7_DAPPU Uncharacterized protein OS=Daphnia pulex OX=6669 GN=DAPPUDRAFT_116105 PE=4 
SV=1\nMPCSVVLNENVLHISWELALYGASRISFSDHSAHCFRRKLQCCPCHTPPGVSCGQQLGKCVYVREIFVLRFRSVYPSLAREWLPRIRRWCSWSDLKSVVDKFASLACCKLGYIIPHPKIMASRIGAYRSGSVLAGGRQAGVTVRPGIQYRLMGLGKLAILFAHECPPHLVHFVRFVWDGTGRSAVLRRHQGADGNVAAAGPASSGSLAEEHQRRRAAARPARRQGSRPGLHGEPATDVGDGPQQRRDDGQPDRQSNVGPVVDGSTSAFGRTQEPHRHSVSRLEDSATQTQMEESFFSENKDGTEIQLSSAGVRLSETESGLRRQRIRRRAQQRRFLTDPRPPPNDEEFRWKSRQRYSDDSGSESDDEQHLPGLRYHQQQQQQRPNLSQYVSDSGAPGTGGSGGDGSSQGLSNINTVHLEPLVKSSQVATDLAVRSQSILSNVGTESSGQNNSGFSDLVARSEEDINSSALSRRTDSAILLLDHIGSPSEQQMMNGPDGENLNRSSSSLNKKTTTHSPLMDDVESSRKRTKSERRSEHEGSSAHPPTATHPHSERIKYKAEIPISVIRAAQAKTRRYNLERKIFQQLLDWKQMQIRIGQANEHQLRLVQGGRTLLPLVDSATDREDAATTNGLKYGDVIETESANGTSRTTTTTMPVEKGTHTTQRCPHAMYACTTLPPALAARPCPALPLVISRFSMDVVVEPIDFDSFEGLLVSFLNDSAVPYHKHHRPVTQQHQQPQQPTNHPGTAKLTTENGRIILPKLNLNNNINGHQKSNAPANKGNH\n>tr|A0A6P1MDY7|A0A6P1MDY7_9FIRM Type II secretion protein F OS=Aminipila sp. CBA3637 OX=2697030 GN=Ami3637_02060 PE=4 SV=1\nMLTYFIAFFAAILTYFIILLIKKNSGREFIENRLNKYLNKDAISRIQDQFYKEKIEKYKKKKDRNFKIASKEFSDYLAMSGIKLRASEFIYIWIIMTYLPILIISLSGLSIVTAAGFAIVGFIIPPLFIHKSRRKRQTEFNKQLGESLVVMSNCIKSGFTFQQSMESIANDMQPPISVEFTKTLREMRFGVNKNDALHHMVNRVQNNDLGLLVSAVITSEQVGGNLSEILDTISDTIKDRIRIKQEVRVLTAQGRMSGIVIGLLPIFIIILLMILNPQYFLSFFETSIGKIMIGVSILMELIGFVIINKIVDIEY\n>tr|A1JPW7|A1JPW7_YERE8 Peptidoglycan D,D-transpeptidase MrdA OS=Yersinia enterocolitica serotype O:8 / biotype 1B (strain NCTC 13174 / 8081) OX=393305 GN=pbpA PE=3 
SV=1\nMKKEPNPFRDYSAESALFVRRALVAFLGILLLSGILVANMYNLQIVRFEDYRTRSNENRIKLVPIAPSRGMIFDRNGTPLAMNRTIYQLELMPEKIEDLPATLNALRPIVDLTDEDIANFEKERKRSRRFTSIAVKTPLTEVQVARFAVNQFRFPGIEVKGYQRRFYPYGSALTHVIGYVSKINDKDVERLDKEGILANYAATHDIGKLGIERYYESVLHGKTGYEEVEVNNRGRVIRQLHEQPPQAGKDIYLTLDLHLQTYIEQLLSGSRAAVVVTDPRTGGILALVSNPSYDPNLFVDGISNKDYQGLLNDPNRPLINRATQGVYPPASTVKPYIAVSALSAGVITKNTSLFDPGWWQLPGSEKRFRDWKKWGHGRLNVTKALEESADTFFYQVAYDMGIDRLSSWMSKFGYGEYTGIDLSEERAGLMPTREWKQKRHKKPWYQGDTIPVGIGQGYWTATPIQMAKALMTLINDGAVKTPHLLQSTRIDGVLVPYKQEDSTQIGDIHSGYWEIAKDGMYGVANRPNGTGRKFFEGTPYKAAAKSGTAQVYSYETYNAHKVAEHLRDHKLMVAFAPYENPTVSVAMILENGGAGPAVGTITRQILDHILLGDNNTELPDAAPLPPGVEAD\n>tr|A0A7K2NHN8|A0A7K2NHN8_9ACTN Indole-3-glycerol phosphate synthase OS=Streptomyces sp. SID5468 OX=2690295 GN=GTW54_22445 PE=4 SV=1\nMITTVLMIEKPLAPVDVQLVTTLHSDEAVSFVVLMQPRGDQERLLRALDDVALGELREAAREEEEPEGDQALAPAVHALEHSLKALRATGAEAVGQIVEEHPLDLLRSVVEQTGADEVIVLTAPHLVEEFFHRDWASRARHKVGVPVLKLYAHND\n>tr|A0A132DP21|A0A132DP21_BURVI NAD(P)H quinone oxidoreductase OS=Burkholderia vietnamiensis OX=60552 GN=BvRS1_03110 PE=4 SV=1\nMKAITFKEFGDAEVLQLAEVAAPEVRPDDLLVRVHAAGVNRADLTHRRGGYGRPNFGDSTIMGLEIAGEVIETGSSVQGYKVGDRVMGVVGGGAYAERARIDWRMAMPIPATLDYVHAAAIPEVFVTAHEALLHLGRLQRGDAVLIHAAAGGVGSAAVQLAYATGATIFATAEASKLERIVQLGVDHAIDYKTQDFSEVVASRTGKRGVDVVIDFVGAPYFSRNVASLANGGRLVQVGILGGGGDVSVSLEQILYRHLQIIGTVMKSRDQSEKHAMVRRFREHWLDRFAGGAGLEPVVDSVFPLADAAAAHRRMESAVNVGKIILTMSEDS\n>tr|A0A1G8CMD4|A0A1G8CMD4_9PSED Peroxiredoxin, Ohr subfamily OS=Pseudomonas panipatensis OX=428992 GN=SAMN05216272_101672 PE=3 SV=1\nMHSIKALYTATATATGGRDGRAVSSDGILDVKLSTPRELGGQGGAATNPEQLFAAGYSACFIGALKFVASQSKRQIPADSSITGKVGIGQIPGGFGLEVELNISLPGLDRTVAEELVAAAHQVCPYSNATRGNIEVRLNVAV\n>tr|A0A1Q8LW97|A0A1Q8LW97_9PSEU Methyltransf_21 domain-containing protein OS=Pseudonocardia sp. 
Ae717_Ps2 OX=1885573 GN=Ae717Ps2_3992 PE=4 SV=1\nMTGPRLSFVGRSRVRARRLLARLLRAVPGRTVDWAHRHWITDDGRTDPRWAPVARLLFHRPLHQTVVTVPGSGGIRLHVVGARLERTLYWFGEQGYEPGEAAWWRLLCSRATAVLEIGSNIGWYTTVGAAAAPVGGYLAVEANPEAARATRRNLELNGLGHGAVLTAAAVGQGAPSSLYLALPDQESFSAAPTGSYLRGHTEGTADRAARRSLTVPTLSARHLITGRDLVKLDVEGAEAGILESALDIILRDRPILLVERMPDTPRLDRVLEQLVGGGYLVLRLGTQLQPAGPRPPVDEHYDVLLVPAERGAVPVHLGDLR\n>tr|A0A165XXG3|A0A165XXG3_9BILA Cytochrome c oxidase subunit 1 (Fragment) OS=Keratella cochlearis OX=204738 GN=CO1 PE=3 SV=1\nTLYFIFGIWAGFIGLSMSLLIRLELGVVGPFLSDEHLYNVIVTAHAFIMIFFMVMPISMGGFGNWLIPLMLGVADMAFPRMNNLSFWLLIPSFTFLLLSSILDSGVGTGWTVYPPLSDSKYHSGISVDLAIFSLHLAGISSILGSINFLTTIICSRTTKVISLDRMPLMLWAISVTAILLITSLPVLXGAXSMLLTDRNLNTSFFDP\n>tr|A3XB71|A3XB71_9RHOB Uncharacterized protein OS=Roseobacter sp. MED193 OX=314262 GN=MED193_21946 PE=4 SV=1\nMLWTTIQNAILVSMIDLYSAEPDFEAEITILRVEEGGRTVPPHNYIRWDFGYAEDNPLEPRRNLSANIYMIYPNFLNEDGVPIPKGVPLNGTYNAYMHILVRDMVDYHQSRLSVGTNFNCHEGSRIVARGTVTKLRAISP\n>tr|A0A7V5NXA8|A0A7V5NXA8_9PROT RNA polymerase sigma-54 factor OS=Hellea balneolensis OX=287478 GN=rpoN PE=3 SV=1\nMALAPKLQQKQAQGLTMTPQLQQAIKLLAMTNLELQLFVEEQLQSNPLLERGTGTENRRGENVPEGKPDEAGPEELQLGEASPVALEALDVSAETLEPDSAPSDLPSSGGEIDWSRAGNGGSFNPSSGLDRLENTAAQKTLKQVLSEQLVIAFPSGQERLIGAHLIDQVDENGYLHASLSEMAERLGVEQTQLETILAKLQTFEPCGVMARSLSECLRLQLREKGELDGPMQRLLDNLELLARHDMQGLAKCCGLDREALGAYVKRLKALAPKPGLAYGSDVAQAVAPDVFVRARPDGGWAVELNTETLPQILVNARYYAEVCSSAKDEKVKSYMSECAQNASWLVKSLDQRARTILKVASEIVRHQDAFFAYGVNHLRPLTLKTIAEAIDMHESTVSRVTANKYMATSRGLFEMKYFFSNSISASDGGEGHSAESVKHKIKILISEETTANSVLSDEKIVRLLRDQGIDLARRTVAKYREMLGIPSSVARRRILKNK\n>tr|A0A255T6L9|A0A255T6L9_9BACT Zinc ABC transporter permease OS=Prevotella sp. 
P2-180 OX=2024224 GN=CIK98_17110 PE=4 SV=1\nMDNDNIIIRLARPDEAEHVAKLIMTAMTEECCLWFCGKDHDIGDFHKVMTELVKQEDSQYSFLNTLCAVDSHDNIVGILTSYDGGRLHEFRQRFIEAAKMAWGIDHSNIPDETGPGELYLDSLAVEPSSRGKGIASKLIEASVDKARKMGLPFTGLLVDTSNPRAEALYTRLGFRVEGTNQWGGHPMRHMVKLTSNR\n>tr|K7P3Q2|K7P3Q2_PINMU Uncharacterized protein (Fragment) OS=Pinus mugo OX=28528 GN=UMN_1037_01 PE=4 SV=1\nSSISPAAASSSENSTVTGTPSSSSSNSRVNTPAGDGTAGLYGFSLEVRDALTEQAHCSVTAEECSTVPVPAPYTGLVALDCGSLGTMDQQIHINPELLNSGDLLNSSSFSFGDLIGSSNLAGVTLADLQWKLQQ\n>tr|A0A1C7MXD4|A0A1C7MXD4_GRIFR Uncharacterized protein OS=Grifola frondosa OX=5627 GN=A0H81_00337 PE=4 SV=1\nMERCAAPYLAESSRSEGCRSVEENWAPRAIVHTDVYRFLGYTNIHLLHCNAPERNTFSTGLLTNHLTQWLRHVTFVRVLTYLFSAQTDVKETVLYGVN\n>tr|A0A439ZYD0|A0A439ZYD0_9HYPH Uncharacterized protein OS=Mesorhizobium sp. OX=1871066 GN=EOS34_27205 PE=4 SV=1\nMAPNARAHDALLTTAQPHGWTYPFACCSGYDCREVAENAIRERPEGYVIEDTGEVIAYTDSRIKNSPDGVFHWCSVAGANDGHTVCLFAPQRGF\n>tr|A0A2E6K1T8|A0A2E6K1T8_PSESP Uncharacterized protein OS=Pseudomonas sp. OX=306 GN=CML01_16865 PE=4 SV=1\nMKISNHDHSSSNPGDEAPPGTPGTGENICPVCNGSGRTEAGECKNCGGTGKVIEGIGGA\n>tr|A0A4V6KLH6|A0A4V6KLH6_SERFO Immunogenic protein MPT70 OS=Serratia fonticola OX=47917 GN=NCTC12965_00545 PE=4 SV=1\nMKKLLCTALCSSLLFSSVSMAAMMSDTVMVGGAAMYPSKNIVENALNSKDHTTLVAAVKAAGLVDTLQGAGPFTVFAPTNEAFAKLPAGTVDTLLKPENKAALTGVLTYHVVAGRYDMKQLEKKIKEGHGTAELKTVNGQPLWIMNNGPPQYSAQRWPRSYCQHQHL\n>tr|W9XCM7|W9XCM7_9EURO MFS domain-containing protein OS=Cladophialophora psammophila CBS 110553 OX=1182543 GN=A1O5_01390 PE=4 
SV=1\nMSEKITAPFLKLYRHLFPKGRNVQNDTAEKAIPPESLIVVLQDIGRVDEVIRRELQDISEEEILSIAKRIKRLLDVCLVSMAWIMFALNSFDRSSLGNARVMGLQKDLDMNSNQYGLAMMLLFIAYVLAQVPSNYYLARGRPSIYLPVVMVLWGCVCTATAFVTTPSQLYVVRFFLGLLEAPFCVGCLFLISSWYTRTELGLRSAILLTAPMMANAFSGLIAFGIYDTIDGARGLEAWRWLFIVGGVCTVFVACVGFYVLPDFPSNTRYLSEKEIAVAQLRMIANGVQDDESDYGRWRGLVMAVRCWQVWVFAGMFLLLAIGASVHNFFPSVVNTLGFSRNTTLWMTAPPYLIGVVVTIANSLCADRHRNACPHVVAPAALAMLGFLLFLLDQSSTRSGVWVRYAAAFLMIVGAHSGYPVVLSWAQKTIRGPKEMRACAIAIINTSGSISQLSMALIYVFTDRHIRTVSKPMGTEVYTVDVLEYHLRAGSDFTCDLHAPSNPCLKLRCDAKSVGCFDEISNWRANPLLISFPVF\n>tr|A0A193ATP2|A0A193ATP2_9INFA Nucleoprotein OS=Influenza A virus (A/South Dakota/20/2016(H3N2)) OX=1866071 GN=NP PE=3 SV=1\nMASQGTKRSYEQMETDGDRQNATEIRASVGKMIDGIGRFYIQMCTELKLSDHEGRLIQNSLTIEKMVLSAFDERRNKYLEEHPSAGKDPKKTGGPIYRRIDGKWMRELVLYDKEEIRRIWRQANNGEDATSGLTHIMIWHSNLNDATYQRTRALVRTGMDPRMCSLMQGSTLPRRSGAAGAAVKGIGTMVMELIRMVKRGINDRNFWRGENGRKTRSAYERMCNILKGKFQTAAQRAMVDQVRESRNPGNAEIEDLIFLARSALILRGSVAHKSCLPACAYGPAVSSGYDFEKEGYSLVGIDPFKLLQNSQIYSLIRPNENPAHKSQLVWMACHSAAFEDLRLLSFIRGTKVSPRGKLSTRGVQIASNENMDNMGSSTLELRSGYWAIRTRSGGNTNQQRASAGQTSVQPTFSVQRNLPFEKSTIMAAFTGNTEGRTSDMRAEIIRMMEGAKPEEVSFRGRGVFELSDEKATNPIVPSFDMSNEGSYFFGDNAEEYDN\n>tr|A0A270NRH6|A0A270NRH6_STEMA Uncharacterized protein OS=Stenotrophomonas maltophilia OX=40324 GN=CEK00_00720 PE=4 SV=1\nMLLVLLAPLVSRWLAQGHVAAAAPVAAMDHAMHAEHAQHAMEGHHDHHAMAMPHGETAKKPPADPHADHEMGVDCDYCLIAARLITLLVAAVLLLAPMVPVCRALRGAVQALPQRIGGTLGARGPPALMAA\n>tr|A0A0S2CGT9|A0A0S2CGT9_9AGAR DNA replication licensing factor MCM7 (Fragment) OS=Hebeloma hiemale OX=91672 GN=MCM PE=3 SV=1\nLLQVNAYTCDVCGSETFQDISNKTFSPILDCQNENECKKNGIHGSLHMQTRACRFSPFQEVKIQEMPDQVPVGHIPRSMTVHVNGNLTRLMNPGDIVHIGGIFLPIPYTGFQAIRAGLLTDTYLEAHHIDQLKKQYSEMELTPEIEXKIAALQKDPNLYEMLASSIAPEIYGHEDVKKALLLLLVGGVTKVTGDGMKIR\n>tr|A0A1S3XHK0|A0A1S3XHK0_TOBAC Chlorophyll a-b binding protein, chloroplastic OS=Nicotiana tabacum OX=4097 GN=LOC107765079 PE=3 
SV=1\nMASMASMAATGSSATVVRATPFLGQTKYANPLRDVVPMGSAKFTMSNELWYGPDCVKYLGPFSAQTPSYLTGEFPGDYGWDTASLLADPEAFAKNRALEVIHGRWAMLGALGCITPEVLEKWVKVDFKEPVWFKAGAQIFSEGGLDYLGNPNLVHAQSILAVLGFQVVLMGLVEGFRINGLPGVGDGNNLYPGGQYFDPLDLADDPTTFAELKVKEIKNGRLAMFSMFGFFVQAIVTGKGPLENLLDHLDNPVANNAWLYATKFVPGS\n>tr|T1TFT7|T1TFT7_HHV2 Helicase-primase primase subunit (Fragment) OS=Human herpesvirus 2 OX=10310 PE=4 SV=1\nADPRRFHFHAPPMFSAAPREIRVLHSLGGDYVSFFEKKASRNALEHFGRRETLTEVLGRYDVRPDA\n>tr|A0A7M4AVR9|A0A7M4AVR9_9ARCH RRM domain-containing protein OS=Candidatus Poseidoniales archaeon OX=2163009 GN=D7I13_00030 PE=4 SV=1\nFTATQDQLNALVASHATVNEVILAMGPGGKPKGFGFVFIAEKDKGEAVVAALNNSDFEGRNIKVDIAKAKGGKGGGRGGNAGGNNSGKSARELQALREEGEGGKKRKRRQRQKKD\n>tr|A0A2G4HE61|A0A2G4HE61_9FLAO Phosphoserine aminotransferase OS=Flavobacteriales bacterium OX=2021391 GN=serC PE=3 SV=1\nMKKHNFTAGPCILAPEVLEGAAAAVQDFEGMGLSLLEISHRDKKVVAVMEEAQQRVLQTLGLGDDYAVLFLQGGASSQFAMVPFNLLRSEGKAAYLNTGTWASKALEEANKLAPGQAVELASSAEQNFSYIPKGFAIPSGLDYVHYTSNNTIFGTQMKAFPKADSLMVCDMSSDIFSRQLPFGQFDLIYAGAQKNLGPAGATLVVVRKEILGKSGRAIPTMFDYPVHIKGESMYNTPPVFSLFVSLLTLRWMDSQGGLLEMERRANARSAALYGEIDRNPLFKGSAAAEDRSPMNACFLLHDEAKYQAVFDALAKEAGLVGLPGHRSVGGYRASMYNALPQTSVDALVEVMREVERRA\n>tr|A0A737VAW6|A0A737VAW6_SALET Putative transport protein YbjL OS=Salmonella enterica subsp. 
enterica serovar Sendai OX=363568 GN=ybjL PE=3 SV=1\nMNINVADLLNGNYILLLFVVLALGLCLGKLRLGSVQLGNSIGVLVVSLLLGQQHFSINTDALNLGFMLFIFCVGVEAGPNFFSIFFRDGKNYLMLALVMVGSALLIALGLGKLFGWDIGLTAGMLAGSMTSTPVLVGAGDTLRHSGIASTQLSSALDNLSLGYALTYLIGLVSLIVGARYLPKLQHQDLQTSAQQIARERGLDTDANRKVYLPVIRAYRVGPELVAWTDGKNLRELGIYRQTGCYIERIRRNGILANPDGDAVLQMGDEIALVGYPDAHARLDPSFRNGKEVFDRDLLDMRIVTEEIVVKNHNAVGRRLAQLKLTDHGCFLNRVIRSQIEMPIDDNVVLNKGDVLQVSGDARRVKTIADRIGFISIHSQVTDLLAFCAFFIIGLMIGMITFQFSNFSFGIGNAAGLLFAGIMLGFLRANHPTFGYIPQGALNMVKEFGLMVFMAGVGLSAGSGISNGLGAVGGQMLIAGLVVSLVPVVICFLFGAYVLRMNRALLFGAMMGARTCAPAMEIISDTARSNIPALGYAGTYAIANVLLTLAGTLIVIIWPGLG\n>tr|A0A195DVT9|A0A195DVT9_9HYME Uncharacterized protein (Fragment) OS=Trachymyrmex cornetzi OX=471704 GN=ALC57_10841 PE=4 SV=1\nEGSRYDSHSAQSTQDRRKLLKRTRSLAVISEDDSRQDREAANFRLGQSTFDLPRRHQLIPRAKLIDRNSLKDRFILLTFYKRFKVIQMQILFKSNRSRGSLCSRLSKSQQHLSDSYERFNEAKSYHSRSTCGLYSISSGLESLPDPLSYTRKNRIDPDRLNILDWPDPPRRYRSVQNLDTVSGLVDIVEDNWPIEGNRSIDCIYTQFARYNDVSCLRSAVLGLLNILAGLRSLLPTLVKRKRKEHRSLDSILFEDDGELEYFDVLNLLPLSNIRLEYNETDLSSDSNFARKKIHGLRDLRVLEYNEPNEVSPTRSSNATDEEKCKEHEVNDESEKELRENLNSEGTSKRTDSNRRQHRETDESFGADSKINSVNQFTDQYSPSSSKIDHRRTDVENFVISCEEEDQKFEEIEDYKSIWISDENQNKMSRRPQVLKVVDNDVTRRRHRRSVVEIDAIVEDVPKDKRSQEITEEVNERLNASIITSINNVNEKDEGHGRKAKEATTPENAENGATVDDARNFLERKSTEKEAVRNKQNEGRFERIVKETSNILGKACSVVKGSLGFEARSESSDLGLGSESGSDSRRRSMDDGIEDDRPSKKVENSNNSATLRTDDSKKSHTNLTRSRSCVDSIECQDDGQEFDHVRYKIVKSHMFSKNMFNTARGDVTYEGLMQYLREYSFQELLMDNNVVIIEPVRAETIERKSSPLTRTEPKCKIAGAIQKKTENHERNGERSQSGGTAKSSRQSSIKKHFFYQPIRVNRELIDEELPDPDTVRNVRRMFENTLEKKKISDAEFSRDDKTRRSVSMKDLTTIDDNRYDEISDKTREESRSRCSSRAKDLTRLFETKSASSTISIAKEEIGSPRCESKTRILAQSFEARSGNTSPSGSNCSKNKIGRYHHHHHHHHHHHHQNWDSGSVSSGVSSDYPDTDPGSGAHCTSSDDEDVNCNDDDADTRGPGHYVSQDVLRKIRECGTSVTYYGGKVVNMHNGPLVSPLIGNGFKRIDESNDYVKFKLVKSNSCDSRLELTGRFVEGQSLRRTRDRCADLRQCTIAETPSIEITSIDSRQKDEVQRDEDVEQIEQMKREPPVVIGLEPKKEDSKESRKIFKADFKLGDLDDSRSNYPSKFMPSALTRWEVNSSWKVGNDFGKMEFEEFEVLEDSLNGISEQNKYTQAS\n>tr|A0A7K9E8D5|A0A7K9E8D5_BARMA Beta-MPP (Fragment) OS=Baryphthengus martii 
OX=176943 GN=Pmpcb PE=3 SV=1\nQCVHAGTGRLRASRAATEVVLNVPETRVSPLENGLQVASEDSGLSTCTVGLWIDAGSRYENEKNNGTAHFLEHMAFKGTKKRSQLDLELEIENMGAHLNAYTSREQTVYYAKAFSKDLPRAVEILADIIQNSTLGEAEIERERGVILREMQEVETNLQEVVFDYLHATAYQKTALGRTILGPTENIKSINRNDLVEYITTHYKGPRMVLAAAGGVPHDELLDLAKCHFGNLPSAPEGGLPPLPPCSFTGSEIRIRDDKMPLAHIAIAVEAAGWSHPDTIPLMVANTLIGNWDRSFGGGVNLSSKLAQIACHGNLCHSFQSFNTCYTDTGLWGLYMVCEPSTVQDMVHFVQREWIRLCTSVTENEVARAKNLLKTNMLLQLDGSTPICEDIGRQMLCYKRRIPIPELEARIEAIDAQTIREVCTKYIYDKHPAVAAVGPIEQLPEYNKICSGMYWLRE\n>tr|A0A498AHI4|A0A498AHI4_9ACTN Phosphoglucose isomerase-like protein OS=Micromonospora sp. M71_S20 OX=592872 GN=DER29_1292 PE=3 SV=1\nMIDGAAGVSGRREPDEALLDDPAALAEHDPGGMLRHTASAGAQVRETAALAAEANLQVLADEGRPRAVVIAGIGTAGRTGDVLATVAGPRCPVPVIPHRSAGVPGWVGAADVVIAVSASGRSPEALGAAEAAHRRGARLVAVGAPDSQLQSVAERARAPFIPVPRRAPARASLWALTVPVLLAARTLGLVKVNEADLAETAARLDAEADRCRPTAESFVNPAKSLALGLAGSVPIVWGSSPLATVAARRFGDTLSANARYPVVSGALGEAGRGRVGLLDGVFGGLAEGERDIFADPDAEAPSGTRLRLVLLRDGGLNPEDDADEPLDVEERRADAVQTLAERRGVRCDVVTAEGGSALERLASLVAVPDFASIYLALAHGLDPMAVPAITEMKELANQ\n>tr|A0A3D8YU66|A0A3D8YU66_9BACL HTH domain-containing protein OS=Sporosarcina sp. BI001-red OX=2282866 GN=DVB69_12070 PE=4 SV=1\nMRTKVAIFGSEEFCQRALQFTEQRSDIILDLYPYTIPSEAPDLLKKLLPCDAILFSGSLPYVASTDVLQSIPVPAIYLKQDETEITTTLLAISIHHSLELEKMSIDVRDCSVLENVLADIKADEQRPLTYQLEKNYVLEEVVQFHASAYANSPSNVAVTSVHAVYDRLTEQGIPVFKMISVKSSFLKTIDRVCQEALLQKSETSKIAAGILDNSILTTEVKDIYKRLAQVLHAHCIHSEEGFLFYTTQGAIQSALHTPLFQQLAVQVSGQLAFGSGRTLTAAKENAVSALRYMQTEHNAGPYLLDEKKELHNLIQTNGSAIELRVIEPILTEIAEKTALSPAVLSKLVTFGQSQQSTQFTANDLASHLGVSRRTAERTIKKLLTSEYVNTVGEEMTYRQGRPRAVYELNFPVY\n>tr|G9Q7I1|G9Q7I1_9BACI Uncharacterized protein OS=Bacillus sp. 
7_6_55CFAA_CT2 OX=665957 GN=HMPREF1014_02623 PE=4 SV=1\nMIDKIKNAVEDMYEDEAKDLLQSILIQLNLLEENYSEDTIKNLMDIPKQLTSNPTYKRNVKESAHVHIAFDDSTAGCLKYMLSQEELFEESVVAFSEFFSIGPIYRLHTNEGQLARQKWLINNLTAYDSYFEEEYLSRFIATIEELHTIPVETPITIWKADNAHEHVGLSFVMAQLKDKKNIRVINTSEASREILKQEYDIRGTGELPPESLALFQKSFIKLPYLTEEKRMKFENEWDRLSESIECLRVWKENEVHSVQEDYFDQFIIECAKSVGADREFLKAPRVIGEALGLVEQLVGDTFLEYRLKQLIKQEVFEFEGSLDEMRFYSVKLRK\n>tr|A0A5N7CTG2|A0A5N7CTG2_9EURO Uncharacterized protein OS=Aspergillus pseudonomiae OX=1506151 GN=BDV37DRAFT_266922 PE=4 SV=1\nMYLSVLSFVDSDSLTSKQQQHYALALYFDWKCAITGKIYQSHSDQTFHAVSKGKFYRAVMARFLDTKMLQFATLCQDLESFDWLTTTTSKMWSDNPNRTLEESFQILEAFDFISNFMLLHILEGPGTFADWVISSDEHQAFTQDPNDSFLNNWISLLRRLQPYLSPFDILVAFRMDEIDLQTLQYFNSLLSLEEYDLKSPIYEIEKEVCCKLSEEYDVADHVWKMYRNHGWRNGARGTSFNEHLSVGAIASEIIGFECHRRNWWELMKQSSKASPYGVRFSLPSCYLSTFNERMDEDEDIHFIITKDDLLTLNH\n>tr|A0A210QLV9|A0A210QLV9_MIZYE Uncharacterized protein OS=Mizuhopecten yessoensis OX=6573 GN=KP79_PYT04528 PE=4 SV=1\nMVGQRGNRGGGRGGGAWGDDSQDMGAMGGSMLGGYGTQSDTSMYAQGGKKRSYNDSQDGYSMPNYYDSTSTDPYFRGMDPPASRFVKTESTQQPDQYASYYENWDSGYYNQGNDSQSSYSDYGSSPQQSGGGYNQSSDFSQDVDFPSNNTSGFNKGYNKNQQSWNKRGGGGGGGGGRGGRGQQQQQQQPWGRGGQGMRGGGRGNNRGNQGGGMMGKRGQQKPGFPPQKAFPGPMRGNKRGRGGRGGNAMVPPIHSLAKVSVPDVTKMSIAEKIRRFCLYLQAETNKVNSIQTIENALTGSKLGLKTEYEVEELMRVAGRWMYTGYLKLDSIFLTRSVGANKKEVKHDVYTKGLDIVKTKTVAEIFALKDPGVEAIRSELTNSLEVKKEGLGKTESLQVAKQAMEEMTNTYSTKHDGFDKLMTYLRESTNLPESQISCIEQGISASHCGLTHTFDGQMVRLPTGKLFFRGSLTIAEVVVAVGTGYKKKDAKVQTYERALEALRTKTMAQILKSVPEAEAVTGVVQEKVPTVPEKDRSSQTLLEKMTEITQLIKEAQFRENNINYLDVTAIHLGFTPTCIYRKLESEGNKTMIACELYLDSILMATGEAERRKDAQVETYNSAWDVLCTTAPDYILKEHKRLKPGDQDDPSVMDVWVKGSGKPNANTNMPGLKRNKMDPNEAWKTVDVIVLMEHEDWSFDRQRQAFCILNYSSTFNGMLLQWQTEHDGNMFKSTINLQHKMIGEASALGKNTSRNLAAACALFKLYETQHVIRISRRDDTKLWVEYPEIKTKAEALRVASGAPMEEVVATPTPADGEEKPSIPANKWVVQVAEQMITQHIAKQTLDELTFGPGMPFSESKEVRQIARNLDLKHDIRQQEGQSYLIIHKRMTPQEMIKILQANNSQSGKYSLVDKDTLPTYQNILPEIEKHEAMRNTGNTEGASKKKIKKEDISMTDLS\n>tr|A0A7Y7LU15|A0A7Y7LU15_9BURK DNA-binding transcriptional LysR family regulator 
OS=Variovorax sp. SG517 OX=2587117 GN=FHT32_002399 PE=3 SV=1\nMDSEALATFLTVHRQGGVSAAATALSRTQSAISRRLALLEEELDAPLFERVGRGLRLSQAGEALLPHAEKVAAAMGDAVAAVQAAKSDAAGTVHIAAVGTLASSGLATVLAKLRQSLPGLDVRLQTATSAEVSEKVRASDVAVGLRYYEDPSPDLLCKVIHHEQLVVACAPSHPLAGTRLKSLVRLSKERWLAFPQPPRRTEPHAEAIFSQFLVRGVERIDWSAVDSLTAQKRLVEAGFGLAFLQESGIAEEVARGSLALIRIDDLDVRVPVACVVRRSAFLSRATRALLAELERAEL\n>tr|A0A2A7QG65|A0A2A7QG65_9LACO ClC family H(+)/Cl(-) exchange transporter OS=Lactobacillus sp. UMNPBX18 OX=2042029 GN=CP369_02605 PE=4 SV=1\nMESRKEVFHRYNQFNQLIRAIIIGILTGLVVSVFRLIIQHFLQLVTASFAYFHSHPLWLIPWTIGSIILALLLGWLAQSYHDIKGSGIPQVEGQLTNQFDEKWWPVLWRKFLGGIFAIGSGLYLGREGPSIQLGATIGQGVEEKAKVGHLNRQIGIASGAAAGLSAAFNAPIAATIFILEEVYHNFSPVIWLATFVSSLCSNIISMQFFGLRPVLNVPYNHMLPNNLYWHLIALGILLGILGRLYQIVILHLNGWTARIPKLSPIAYPIIPFLLVIPIAWYFPITLGGGNELIIILRSLPFSLALFVGLFVLRFVFSMISYGSQLPGGIFLPILTLGAILGAVYCALMVRLGLMPVRYLPNFIIYGMAGYFACISKAPFTAILLITEMVGSLAHLMPLALVAVVAYLVVDALHGEPVYTAMFNAFIGNNPQPARHKEDVTMSITIYAGAQLDGCKIKDFPWPTDCIVMVVYRGEEKIIPNGQTKLQAGDTLILRANSATTRQAYHEISRAAHYAQG\n>tr|A0A0R2BHK3|A0A0R2BHK3_9LACO Uncharacterized protein OS=Lapidilactobacillus dextrinicus DSM 20335 OX=1423738 GN=FC84_GL001267 PE=4 SV=1\nMRIIFIGDVMGPIGQETLTTYLPKLKAKYRPQLTIVNGENIAMGKGITKSLYKTILTAGADVVTMGNHTFDKDDIYEFIDDANKLIRPANFPAQHTPGKGYVLTKVNQTTVGVINLQGRVFLDSIDDPFAKVDEILAEIQAQCDYIFLDFHAETTSEKEAMGYYVDGRVTAVVGTHTHVQTNDAKILPKGTAYLTDVGMTGPYDEILGMRKERVIERFLNHRPVRFETPLSGRGQLNGCVIDFSSTKNAARKIELIQITPDQPFLE\n>tr|T1BH73|T1BH73_9ZZZZ Translocation protein TolB (Fragment) OS=mine drainage metagenome OX=410659 GN=B1A_07070 PE=4 SV=1\nNSDSSINYDGSQIAMMQGNGNVYRIAIMDRKLDNQTRFISPGPMDGSPSYAPNGSMLLYAATDNNGKGVLYEVADNGSVRQRLSLVNGTVQSPSWGPYRVPPSTQP\n>tr|A0A7W7F9L6|A0A7W7F9L6_9SPHN Spermidine synthase OS=Sphingosinicella soli OX=333708 GN=GGQ98_002410 PE=4 
SV=1\nMLPRVLIDTAKIPGGGELRLIQRGTEFSIMLGANELMNSRLKGSEESLASLSCGKIQSRPQPRMLIGGLGMGFTLRAALAKLPADASVTVAEFVPSVVAWARGPMAHIFDGCLDDPRATVAVEDVADLIGDVRSHYDAILLDVDNGPDGLTHPDNDRLYSRKGLIAAREALRPGGILAVWSAAPDHAFKNRLIKVNFEVEETVVRTNGERRGARHIIWIATRPS\n>tr|A0A1H5CGP3|A0A1H5CGP3_9MICO Peptidoglycan/LPS O-acetylase OafA/YrhL, contains acyltransferase and SGNH-hydrolase domains OS=Ruania alba OX=648782 GN=SAMN04488554_0368 PE=4 SV=1\nMVSTATQDRGRIEGLDGVRALAIVAVLIFHLRPLSLPGGYLGVDVFFVVSGFLITTLLVRELRANRELDLTAFWTRRARRLLPALATVVAASVALAFFAGDDLLVNIGRQVVGALTFSNNWLEISAGSSYFNATSPQLFVNFWSLAVEEQFYLLWPLLFVLIMATTRTGRQRVGVVLGLAAASALLMALLYTPGEDATRVYYGTDTHAFGLMIGAALALSAAGESWNLLAQTWYRRARVLLALGALGGLVALMLVLDPTQPMAYRGGILAASLLTALVLGALPGPTNLLHLIFRLRPVAWIGERSYGIYLWHWPVILLIAAFAPPTAPDSVASWVQRGAALVLTLAVSAASYRWIEMPVRRDGFRATGRRVLAALTAPGGLTPPRVAFLSTTAVLALFAVAVATAPDRSQVQIAMDEASGVVEASGGESGSVAGSTESPQTGSGETDGESSETDGGQTVDGAAEGPGAQISGFGDSMMYVAAPGLSATFPGMSIDAESNRQWPAVAETVAAALDEGTVRDVVVIAAGTNAGVREPEIVRETLDLLGPDREVVLVNIYGSSFWVEESNENLAEIAADYPNVVIADWHQAALDHPEDLQPDRIHPDMEGMYLYADIVQAALEELGVG\n>tr|A0A5I0WZT4|A0A5I0WZT4_SALET Type II toxin-antitoxin system RelE/ParE family toxin OS=Salmonella enterica subsp. 
enterica serovar Oslo OX=1005394 GN=G4H23_002326 PE=4 SV=1\nMRIFKTRWFNREAKSHTIKDDELSEAINAVLQGKADNLGGGVYKKRLNQNRDRAIVLAKGGEHWFYTFLYAKQDMANISYRELAGFRELAKHYACLTEDQITALINNKELVEVRHVSKN\n>tr|A0A2S8FEH7|A0A2S8FEH7_9BACT Uncharacterized protein OS=Blastopirellula marina OX=124 GN=C5Y96_14010 PE=4 SV=1\nMPLLVSGICLLVPSLLAAAPQADFEKILSPILEDAVRRSLPTSFKDESDWGSTHEFTKRLKVRGKWDSLKLERVREAKNHGDWVRYLGHIEDPNQHVRIWIENLSVGPTRSTCQIHARVEFQGEAEYQQWVRGVRLLGVSVVTEATVKIHLDVQLDSKWDMSSLVTSAELTPTVTGGQIELERFYVHRIGKAHGEVAEQIGEQLEGTLAKKLAKKEEKLVREANKAIAKELENGTVKLDLVDYLKKQLLK\n>tr|A0A069RH84|A0A069RH84_PEPLI Putative transposase InsK for insertion sequence element IS150 OS=Peptoclostridium litorale DSM 5388 OX=1121324 GN=insK PE=4 SV=1\nMICETLSITRSAYYKYKKRVKPEKEKQDELLCSLILEYHAMYDGILGYRRITMFINRLNQTTYSENYVHRLMSYLGITARIRKKKVNRKRVKPDYVKDNILARDFTAKTPNEKWLTDVTEFSIPKDSRKLYLSPIMDLYDNSIIEYEFSFRNSNQLVFKMFDRAVANNPGARPIFHSDRGFSYTNNAFKSKIKNAGMIQSMSRVGKCIDNGPMEGFFGILKSEMFYGKIFKSLDDLVDKIKEYIVFYNERRFQKRLKCLAPIEYRNKALIA\n>tr|Q1ZM26|Q1ZM26_PHOAS Uncharacterized protein OS=Photobacterium angustum (strain S14 / CCUG 15956) OX=314292 GN=VAS14_08110 PE=4 SV=1\nMTLIERLKDEQKAAMKAKDKPRLGAIRLVLAAIKQREVDEKITLNDDDVLVVLTKMVKQRRDSVAQYEAAGRQDLADVEHAEISVLAEFMPQPLTEEEISALMDEAIAATGAATMQDMGKVMGVLKPQIQGRADMGIVSKLVKTKLG\n>tr|A0A1C1VV15|A0A1C1VV15_9PSED Phosphatidylethanolamine-binding protein OS=Pseudomonas sp. 
S3E12 OX=1873126 GN=BB029_27630 PE=4 SV=1\nMNIRSILPALSMAVTLSGYAADFSLTSRDIADNRPLTRREVFQGFGCDGGNTSPELSWKNAPAGTKSYAITVYDPDAPTGSGWWHWTVVNLPASTHSLPSGVGANLPAGAVQGRTDYGQPGFGGACPPVGDKPHRYQFTVWALKVDKLPLDNQASGALVGYMLNANVLAKATITSTYGR\n>tr|A0A161XBG4|A0A161XBG4_9CELL Histidine kinase OS=Oerskovia enterophila OX=43678 GN=arlS PE=4 SV=1\nMRRRVLQATVAAVAVAVLLLGFPLAFLGAQFVLANEMDQLQGRVDTLARNIDNRLAQNEPIPQSVLDNASVGRPGELPAYVFVNLPDGEQMTAGEVVTGRANEAADRTDQNATVALSTSFAESYWKAAQIVLLVVAASVVAFAAGIAMAVWQANRLSAPLVYLAASAEQLGSGQVRPRLEPSGVEEIDLVAAELARSSDRLAGRLAAERQFASDASHQLRTPLTALSMRLEEISMASDDPAVQEEARISLEQVERLVTVVDDLLTQSRRAQGGTTEAVRLIEVVRQQEEEWVPTFAQAGRELVIDVPEGYQVLATPGALAQVLATLIENSLKHGAGTTTVRARPSGTSGAVAVEVGDEGEGVSDEMAPRVFERGATSGAGTGLGLALARDLAAADGGRLELAQRRPPIFALFLAGVPRTLDPRVVLPTGTLISARGGRRRRRGRGPEVEPR\n>tr|A0A0D0Y6D7|A0A0D0Y6D7_9TREE Small nuclear ribonucleoprotein Sm D1 OS=Cryptococcus gattii EJB2 OX=1296103 GN=I306_06210 PE=3 SV=1\nMKLNNETVTIELKNGTVIHGTITSVDPQMNTHLKSVKLTLRSQPSSQPPLSLDSIAIRGNNIRYFILPDSLPLDTLLVDDAPKPKKKKEGAAARGARGAARGARGARGGGRGAPRPRGRGF\n>tr|D0TP63|D0TP63_9BACE 4Fe-4S binding domain protein OS=Bacteroides sp. 
2_1_22 OX=469588 GN=HMPREF0102_01363 PE=4 SV=1\nMNVAELDIDKCSGCGLCASVCSKHSISIVPDDSGFLRPIVDKNTCVDCGLCVKRCVIVNPRKQTIPQKTYAAIRQDKDRIALSSSGGVFAAVAEYVLLKKTNWVVVGSTLDETVSANHIIVDNVVDLKNLYGSKYVQSETTGIYKKIQILLDDSKSVLFSGTPCQVAAIQRYTNNHPNLWTIEVICHGVSNNKMFNSYLDMYKRNEIRMFYFRDKEQGWSFNNKIVYQNGKEKKINHRMSSYMTYFLKGETYRDCCYCCPYAKPERCADITIGDFWGILQTRPDLNNKIDIEKGVSCVLVNTDKGISMVGNAELELYDVEYDAIRKENGPVNEPSHHTVKRDLVLAEWGKKKDWTDVHTFWKKNDRKITFVLWSMIPVSLQHKIRVMLGKR\n>tr|A0A2A2CDI5|A0A2A2CDI5_ECOLX Spermidine/putrescine import ATP-binding protein PotA OS=Escherichia coli OX=562 GN=potG PE=3 SV=1\nMNDAIPRPQAKTRKALTPLLEIRNLTKSYDGQHAVDDVSLTIYKGEIFALLGASGCGKSTLLRMLAGFEQPSAGQIMLDGVDLSQVPPYLRPINMMFQSYALFPHMTVEQNIAFGLKQDKLPKAEIVSRVNEMLGLVHMQEFAKRKPHQLSGGQRQRVALARSLAKRPKLLLLDEPMGALDKKLRDRMQLEVVDILERVGVTCVMVTHDQEEAMTMAGRIAIMNRGKFVQIGEPEEIYEHPTTRYSAEFIGSVNVFEGVLKERQEDGLVLDSPGLVHPLKVDADASVVDNVPVHVALRPEKIMLCEEPPANGCNFAVGEVIHIAYLGDLSVYHVRLKSGQMISAQLQNAHRHRKGLPTWGDEVRLCWEVDSCVVLTV\n>tr|A0A168G2W8|A0A168G2W8_CORDF Sulf_transp domain-containing protein OS=Akanthomyces lecanii RCEF 1005 OX=1081108 GN=LEL_05631 PE=4 SV=1\nMATVLSGAAFGAAMIAAGFYNPAVVISQLKFENWHMVQAFLAATASSIAYYAISDRAGYASLQPRASSPIGLFGSTYDGNVLGGALLGAGMALSGSCPGTLFAQMAAGVHTGFYALAGAVVGGVLWTGILSKAVARARARAGSKPETVTVNQHLGVSKPAAMLLYEAGFAAVIIVTSLYTPRFPGTKMSGALGGFLISLSQLASIATRGSMIGISGSYGELGGLLWAGLAGDAASKPKSYPNVLFAVSAGAGALLLARLAPVLVEAPALEVAPAVAVLGGALMVVGARMAGGCTSGHGISGISLLSTSSLITIATTFAVGFVVATLVY\n>tr|A0A3N2RNP2|A0A3N2RNP2_9ENTR Uncharacterized protein OS=Kluyvera ascorbata OX=51288 GN=EB837_25720 PE=4 
SV=1\nMSEPRLGNLITVLLPARSYKINCALTTEKLMPGIEQFACRLLLIFDQLYPSELQNYFGLTDREREVLLDGLLANRLININPDGHIEASSFLRKHAASNGGKPSLVKYQERTEEVAFDLLTLSICKPQPNRRFTSGLPELLPRHQIGGDAAAVTEAFSSQFRHHLLLSRNSEYERQRTRLYKIMGCSSHEMVQLPIEIEVSYDASAGSIEPQKFTRSYEYLGNTRLPLSNELEAHIADFLGEHKLDEFGIDCEDFCKLANDKVLLQFANGYKFDYSGWIEAREQRKTGYGTSLTTGMLGAVYLPHNSKLFISMLHNALRDYVGKTAPKALWYSSKVPLWGANGSQLSRFNRDLGDILGNYADDKIARISLLHPSADEGEKRQERKRHLGRFPTGIGLTSEAKFDRLEILLIPDVIALVQYHGQPNSDSALTLPIGYITVEPERLELLKNLMIKRIEGVVATINWSESKLENLTSLLPVEFLIKLNKKSGEDVDAAIQKMQIANRAETARAILSLRK\n>tr|A0A1A7ZNK3|A0A1A7ZNK3_NOTFU HFM1, ATP-dependent DNA helicase homolog (Fragment) OS=Nothobranchius furzeri OX=105023 GN=HFM1 PE=4 SV=1\nDTAVKTTCPVYKHARAGQHGTCVLTWYLPGHFNHWTTKANTTADLPKTLHVVLEQILNRHPPFGNQIRDSVRHLPKYSVTLEQLPRFGSDTAEVVARVNLKNQADLLSRRTAPGHHFVSLIIGDADNNVAFLQKITDSMLLKSGSWSKKIQVAKPVKGNEISVHLISSDYVGLDIQQRFTMQFSASRTFGSEIPYNTIEQRPQLTAQTPLSAAQRDKASPAEEQGSTYPGHKRQCNHLCKNKTLCAHDCCKVGVAVGRKRSTNHESSFSSYLTDLRNRSDALVQTPVKRLKMGNGPLAVSMQRFAFKPKENLSPVSCYSENEYKAGQMDLAADDSSQLKDISCLNDPDPGTFSDADGAENRTRTTQNPAATQQMFLKDSSARIMSRTGGEPLKSGVNQTKTSTSVHSNWSAATSEQEALQIPAVTFDLGNEWDDWEDFDEENLLHTAAALVPQCRTKPEPQIQQRVDYTSGCPTGSSPVFLSCSQTKCQGTTITTPLRSISAAASCEIRKFDPSPITNILNDEITGKTPEMFFKPPPETQVNRRCDFFHTVDVPLRSDLSLDRSKEEETFFGIFDGIF\n>tr|A0A7C6JKA3|A0A7C6JKA3_9BACT 3-isopropylmalate dehydratase small subunit OS=Petrimonas sp. OX=2023866 GN=leuD PE=3 SV=1\nMEKFTTITSTCVPLPIENVDTDQIIPARFLKATTREGFGDNLFADWRYDKAGNPKGDFVLNNPTYKGEVLVAGKNFGSGSSREHAAWAIGGYGFKVVVSSFFADIFRHNALNNGILPVAVSEEFLGELFVSVKGNSKATVTVNLQEQTITNNETGKSESFNINAYKKECLLNGLDDIDFLLSNRDKIEAFEKQRVYSY\n>tr|A0A7X6IU76|A0A7X6IU76_9PSED EscU/YscU/HrcU family type III secretion system export apparatus switch protein (Fragment) OS=Pseudomonas sp. BG5 OX=2722817 GN=HER21_45805 PE=4 SV=1\nGLMRVFGKQALWEGAKALLKTVAIGVALWIVVSGLVPVLMASGSHNITWLLEQAAGGAAALLQVAVVVGIILAALDVAVVMRRNRKHT\n>tr|A0A7Z1UA43|A0A7Z1UA43_9GAMM Methyl-accepting chemotaxis protein-2 (Aspartate sensor receptor) OS=Erwinia sp. 
AG740 OX=2183904 GN=DFO54_1118 PE=4 SV=1\nMSVFGRYVRNLKVSHKLYGGFGIVLLLVVLASTFSSARFFAIRDLYIKSSIMNEMGNFIDLTRIARIKFTYTLNDDNLTNLNKYLQQARQLNDKAKALKWDETYQGDFKNVEQDFADYTQNIDRIKSSVEGMNEVTKGISALDQQAAPGDALYTLSNDINLLRQYHQTSVLYGQLVDKVHLLQKENSDAAFKAVKSAYDQAKKSFDSLNSTLPGEVKNSISELGDRIERYNQSGVKYNDKVNQLKASDSALRATGDKLISDIDGVLKKIGARNNDIINNSVFQTVICGITAVILGLLIAWSVTRQITRPVIANLKLAEKIASGDLSASVTVERHDELGQLTLAMMSMTEKLRQLIADIRHSVYSVAKASSEIAAGNHDLSSRTEQQSSAIVETAASMEQLTATVKNNADNARHASQISEQATDNANRGGDIIHRVVQTMGEISGSSKKISDITSVINSIAFQTNILALNAAVEAARAGEQGRGFAVVAGEVRNLAQRSSQAAKEIEGLISESVSRVNTGTVLVSDAGSAMDDIVASVKRVHDIMGEIASASDEQSRGIAQIGGAVSEMDSTIQQNAAMVHESSAAANSLEDEAARLSQLVSVFRLSAQDEPQTSGHTAMLASRLRRPEIANRQAALPGSNTTPGTIANTSADNWTTF\n>tr|A0A810LQW6|A0A810LQW6_9ACTN Uncharacterized protein OS=Actinoplanes ianthinogenes OX=122358 GN=Aiant_38990 PE=4 SV=1\nMAGASDNGGWPPPDGGSSDDLPDLPEEWGVIVIPDDLSELSDEVEAVRAELHLAPPPNRWQRFARRPAVRRLRRAGALLLRAPVLIVSMAILVTVASLFASAWPGTPRQPATQRTSDTTTTPAKTLPALDLIGADGQAVPLLAHRPMVVIITDGCDCERLIAETVAAVRQDVSVLAVSTTAPSATASQGGLAPAQTPRADGKTVLYLQDPTGHLRERAGLTSARDGSAATFVVNKAGDVLRVCQHVVSVAAFEADLARI\n>tr|A0A6B8MQP2|A0A6B8MQP2_KLEOX Helix-turn-helix domain-containing protein OS=Klebsiella oxytoca OX=571 GN=GJ746_00670 PE=4 SV=1\nMDNSINQVIDSFIKGQAVIGRVRFSTESRPASEKAVSVDFPRLEIMLEGQLRDPAIKSEYAQLTPHDVLYIPAGGWNDPQWLMPSTLLTILFDKQQLEFVLCHWDGNALNVLDKQQVPRRGPRVGSFLLQALNEMQMQPQEQHTARCIVTSLLSHCADLLGSQAQTSSRSQALFEAIRKHIDAHFAEPLTRESVAQAFYLSPNYLSHLFQKCGPMGFNEYLNHIRLEQARMMLKGHDMKVKDIAYACGFADSNYFCRLFRKNTERSPSEYRRQYHSQLTEKTSSAKN\n>tr|A0A1Q3WCK3|A0A1Q3WCK3_9BACT Ribokinase OS=Spirosoma sp. 48-14 OX=1895854 GN=rbsK PE=3 SV=1\nMPGQILVVGSSNTDMVVQTTKLPAPGETVLGGTFFMNPGGKGANQAVAAARLTGNVTFVAKVGTDIFGEQAVAGFRQEGINTTYIQSDPDHPSGVALINVDAAGENCITVAPGANAQLRPAETNPALMSAEADALVLVQLEIPLDTVVHVISEAATRGLRVILNPAPAQPLPDELFPNLFLITPNETEAELLTGIRVDDLSSAGQAAQKLHAMGVSNVIITLGSKGAYLSTGTQSQLIATPPVKAVDTTAAGDCFNGALAVALAEGQPLPDAITFACKAASISVTRMGAQASMPRRNEVNE\n>tr|A0A2D8DNN8|A0A2D8DNN8_9ALTE Uncharacterized protein OS=Marinobacter sp. 
OX=50741 GN=CMG78_10605 PE=3 SV=1\nMKLAKFIGSALVALTISAPAIAQQSPGGQPDQVAQLAQMVGLSEEQQTEIRGIIDDMQGEIGELRQDARSLQEDLQEQIKPDYDESAIRDNAAKLGDVTGEIAALSALMQAKVDAVFTQEQRDELDRRMKQMQQQMQQQRQMMQPQGQQ\n>tr|A0A842MKE0|A0A842MKE0_9ARCH Uncharacterized protein OS=Thermoplasmatales archaeon OX=2268204 GN=H5T45_04690 PE=4 SV=1\nMKKIICLFIFLALMGCLKSEKEVEKETAEGFEVLSVFFSETEDYNTVLLNMKVKWVGKEKGAPRCDIYFPPQERLEMGIGPIENGPSIVEPLYQEGSEVKTAILKEFIARSFYPDYIAPEFGKSYYAQIKFYWPSLNETYEWQGNVGWSE\n>tr|A0A7X3C2Y9|A0A7X3C2Y9_9LACO Xylose isomerase OS=Secundilactobacillus folii OX=2678357 GN=xylA PE=3 SV=1\nMAEDLWNMKNIEYAGNKDLGSGAQFHYYNPDEVIGGKKMRDWLRFSVAYWHTFDQRLVDPFGDGTAMRPYDKYTDPMDNALAKVDYAFEFYRKLGVDFLAFHDRDLAPEGDTLRETNKNLDKVVDKIVEYQKTSGMKVLWNTSNLFTNPRFVAGAGTSPYADIFAYSAAQLKHSLEIGKRVGSENYVFWGGREGYESLWNTNMKLEQEHAAKLFHMAKDYANEIGFDAQMLLEPKPKEPTTHQYDFDAATTIAFMKTYGLDKDFKLNLEGNHANLAGHTYQHEIRVAREAGLLGSLDANQGDKLIGWDIDEYPSNLYETTAAMYEVVQEGGIGPRGGLNFDAKPRRSSFEANDLFYGHIVGMDSFAAGLRVALKMKEDGVLDKIVADRYSSYKSGIGADIESGKATFKTLEDYTLDKTQADLRAATSSDHLEQIKDIINHYIVNVLGK\n>tr|A0A5N6QTR5|A0A5N6QTR5_9ROSI Uncharacterized protein OS=Carpinus fangiana OX=176857 GN=FH972_006142 PE=3 SV=1\nMGTLVHDAQNVDSDIYLSLGLTELRKGVPAIPRVLSLLSSLLERSVQKNEILLEATQIKDVVTIFHGLRAPTLSIRQYIDRIFKYSGCSPSCFVVAHIYVDRFLQSTEVHLTSLNVHRLLITSLMLAAKFIDDAFFNNAYYAKVGGVSTAELNRLEMKFLFSIDFRLQVTIETFGRYCLQLEKETAEGLQIERPFKACGIKESWSNKDDSSCAPTVAQ\n>tr|A0A0D6QGJ2|A0A0D6QGJ2_9DELT Putative ECF RNA polymerase sigma factor SigI OS=Anaeromyxobacter sp. 
PSR-1 OX=1300915 GN=sigI PE=4 SV=1\nMTDTGETFEAQRPALLALAYRMLGELARAEDVVQEAWIRWQRRPGEVDSPKAFLLTTVARLCLDELGSARARREESRSDRLPEPVELDRAGLGRVELLDRISMAFLVLLQRLTAAERAVLLLHDVFDMTHAEIAARLEKSEPACRQLLRRARENVATERRTLRTSRDEHQRLLAAFMEASARGDQGALLDLLAEDAVLVADAGPGVVRYGRIRNVGRPVVGGLKVAALLASVARQRVGPPLELRERTLNGEPAAVAFEGGRPVSAILLGVAEGKVRHVYLQADPERLRHVGSLD\n>tr|A0A178W037|A0A178W037_ARATH (thale cress) hypothetical protein OS=Arabidopsis thaliana OX=3702 GN=AXX17_At2g00490 PE=4 SV=1\nMEACSRKRRRRRAYTTSTTGYAAVFFCGIFVFAQFGISSSALFAPDHYPSLPRKAGHFHEMASFQAPKATVSFTGQRREEENRDEVYKDDKRLVHTGPNPLHN\n>tr|A0A1F8I579|A0A1F8I579_9PROT Rhomboid family intramembrane serine protease OS=Caulobacterales bacterium RIFCSPHIGHO2_01_FULL_67_30 OX=1797584 GN=A2795_02220 PE=4 SV=1\nMSDPDGRFAAPPNSEGPKSERLFNAPVAVVLIALSMPVLFFFQRQLPDMGASMAFAPIDLQNGRWGGLFTAMLLHGSWTHALMNAIGALAFGAPVARLFGDRIGPTVFLLFYIGCGVVAALGYGLVHWGSTEAMVGASGAVFGLIGAATRLMGGRGRVLSLFDRRVIGASIAWMAVNAVTGLIGYAPGADGARIAWEAHAFGFIAGLLVIGPLGRAFGKGPLPMGTSARPESDV\n>tr|A0A3Q8V945|A0A3Q8V945_9ACTN DUF4132 domain-containing protein OS=Streptomyces sp. WAC 01438 OX=2203204 GN=DLM49_03910 PE=4 SV=1\nMGWLAAGEAYEVALVDGRVVARQATPDAPAGQEHTPRKTLPAEIRDRPEVVELQRFAQWLDRHAAECAAQVTTWMVSSLPVPAGLLARVWPDEAWRTALRDIVVVGDGPDETGFLRDARDTGELSVVNLDGETVRLNLPTVTMPHPVLLPDLEELRVFAAESGMVQGVEQLHRATWRKPEGIAPGTTRVTEFAEAEYRSWFHLTARATSLGYKIAGSAVVDRIRDAGRIVTASVGMSDPYSEEKAWTGHLTWGDADGQGTLPLTEVGPVAWSEGMRMAAALHAGRSEGTEGSR\n>tr|A0A7Z7G4Q5|A0A7Z7G4Q5_9BACL Drug resistance transporter, EmrB/QacA subfamily OS=Paenibacillus sp. 
OK076 OX=1884379 GN=SAMN05518670_2026 PE=3 SV=1\nMSQARLKERDDVKKGPILFVMILGAFLATLNQTVMSVATPELMGDFNISAATAQWFTTGYMLVNGVLIPITAYFMQRFSTRQLFQASMFIFLIGTIISALASNFGTLLTGRMVQAAGAGIIMPLLMHVILTLFSPEKRGAAMGMVGFAIIFAPAIGPTLAGYILEHYTWQTMFYGMIPLTVIVIGFAFVYLKNVSERVKLKFDTLSVLLSTIGFGALLYGFSRAGSLGWSSAEVIICLAAGVVALGLFTWRQLASANPLLDLRAFKYNMFSLTTIINIAITMIMYADMMLLPLYLQNARGYTALESGLLLLPGALVMGFLMPITGRLFDRFGAKWLAIIGMVITIVTTIGFIDLTDSTSYTYLVLMSTGRRIGMALLMMPIQTAGLNQLPPRLGPHGTAISNTVRQVAGAVGTSLLVSVMTSRTTAHVQDMVATGAAKGLTQQQLGMESMIQGINDAYVVIIGIAVVGLLLSFFIKRTKQATEEDSKQPVRQKVSMNTN\n>tr|A0A4Y7SBP5|A0A4Y7SBP5_9AGAR Uncharacterized protein OS=Coprinellus micaceus OX=71717 GN=FA13DRAFT_1647367 PE=4 SV=1\nMLGSAKLSRLGGHIAFLGDRFSLVQAARASIEKKAKALYYPVEPPNNEKYNPTRPPKYNLKDLPRRSQAHYWKVIELLNLAKTKTARATISRDSGIVALPACAASPAFLHPSYFPLDPFHLFYENITPFLWDLWTVDSTPGESVHVPSPKIARFGVLVAEAMRTLPPAFCGPVRNPHLKRQSQYKAYEWMALFHWYILPIGLELEFPPALLRNFSYLVEAVEIAMTVQSHSISDLQSLEDLIVDFLLQYEHLYVGDDPEKVQRCRLCIFQLIHVPIHIMWYGSIRLSSQATVERSIGEVGRKITSRKEPFAHLSNIIVEQEIIRVLSLYYPELTHKGATTTNTTRSDTRQKIRISKSENLSEELAHHLSAIFRDPFITWLTHLGQGRNSEGKTSGTLQPTNQHKQMFGEVISFYAITNADNETVEVAVYRPLVDVCQPLKTVIQGRWPSASAKVKIAAVEVESICTVVGIWAAPQSENIYILRKHPGLLMLTPLERGIQEDTERDEMDD\n>tr|A0A1B4C1D0|A0A1B4C1D0_9BURK Esterase OS=Burkholderia diffusa OX=488732 GN=WI26_24630 PE=4 SV=1\nMRGSMNLVRAFWLLLLLAAAGPALAFQTRIVAIPSAAMNQTLKATVVLPDDYARPRHGPERSVERFPVVYLLHGSGGDHTDWTANTHIAALADRYRVILVMPDGGHESWYIDSPFDSGSRYETFVGDEVVSYVDMHFRTIATKGARAITGLSMGGFGALRIALDRSDTFGAVGSISGAVDPRCCEDEPGIDHVFGDPGRHPSFWNRNAIVENARAFVRAHLDLTIDCGRDDSFVGSNRTLHQRLVALGVPHDYAERPGGHTWDYWAHAIRYQMQFFAASFQHGGYA\n>tr|A0A2E7H1W3|A0A2E7H1W3_9EURY Uncharacterized protein OS=Euryarchaeota archaeon OX=2026739 GN=CMB34_05090 PE=4 SV=1\nMLLSACEGISVADAYVKADRMTYEAIAPSYRAYVEADENLDEPSKQSRYRLLQTWELRINSNTKNK\n>tr|A0A0E0KM68|A0A0E0KM68_ORYPU E2F_TDP domain-containing protein OS=Oryza punctata OX=4537 PE=3 
SV=1\nMDGSTTIPLPQPPRPPPPAPAPAPPQVFLRRSVLPPPQTGPHRVAPAPPPPGAHVHYFRAASPIPIFRAAASSRPPRPPPTTAPAPPPPPAAPAVTPARPVAVAPPPPPATTTATATEEVAAPATGNPMANTADNEEKNEREAVQSEVPKGETVQGPDKECTTGTVKGIKRPRKPKGFKKGSLRSNEGDAGASLFSPNNCRYDSSLGLLTKKFINLLEGAEDGTLDLNKAAETLEVQKRRIYDITNVLEGVDLIEKTLKNMIRWKGFDMSKPKERERQISALKEEIESLYDEESRLDDEIMEAQEKLNALRVDEDRRKLLYVSKEDINAIPRFQGSTLIAVNAPRGTYIEVPDPNLDMDIYKDLDNQEKHYQIVFRSAMGPVDCFLISNHQETFNADQQMADDLDAAVTSGSSQALQQMDYVQAPEIGESNGVREHTSEPSKRDDPVPGIVKIVPSDDDIAADYWLSSDADS\n>tr|A0A3N1VCH1|A0A3N1VCH1_9ACTN Hemerythrin HHE cation binding domain-containing protein OS=Streptomyces sp. 2132.2 OX=2485161 GN=EDE04_6244 PE=4 SV=1\nMDSEHVAPARPYGPAAADLTGVRVAHRAILADIERLAGLLAALAAAAEPAGPARAGAIAGYVHRFNDAVRGHHREDRTLWPVVLDAVPDAAEAAAGLAGFVADHEALDAVQADCDAAAARFAAEPGRHAGLLAGLLAVQRDLLAAHIEAEERHVLPVITRRVPGAAYAAARARVRRADRSPDPAWSRAWLLSHATEDETRRLLAVAGARPAAVEPELREYAAQASAVFAG\n>tr|A0A2S6FD50|A0A2S6FD50_9PSED DNA topoisomerase 4 subunit B OS=Pseudomonas laurylsulfatiphila OX=2011015 GN=parE PE=3 SV=1\nMATPSASSYNADAIEVLSGLDPVRKRPGMYTDTSRPNHLAQEVIDNSVDEALAGHASSVQVILHADHSLEVSDDGRGMPVDIHPEEGVSGVELILTKLHAGGKFSNKNYQFSGGLHGVGISVVNALSTEVRVRVKRDGNEYQMTFKDGYKATELEIVGTVGKRNTGTSVFFAPDPKYFDSPKFSISRLKHVLKAKAVLCPGLLVSFEDKATGEKVEWHYEDGLRSYLVDAVSEFERLPDEPFCGSLAGNKEAVDWALLWLPEGGDAVQESYVNLIPTAQGGTHVNGLRQGLLDAMREFCEFRSLLPRGVKLAPEDVWERIAFVLSMKMQEPQFSGQTKERLSSREAAAFVSGVVKDAFSLWLNAHPETGMLLAELAINNAGRRLKASKKVERKRITQGPALPGKLADCAGQDPMRSELFLVEGDSAGGSAKQARDKEFQAILPLRGKILNTWEVDGSEVLASQEVHNIAVAIGVDPGAADMSQLRYGKICILADADSDGLHIATLLCALFVQHFRPLVDAGHVYVAMPPLYRIDLGKEIYYALDEAERDGILDRLVAEKKRGKPQVTRFKGLGEMNPPQLRETTMDPNTRRLVQLTLEDFEATSEMMDMLLAKKRAGDRKTWLESKGNLAEVLG\n>tr|A0A3R7JJI1|A0A3R7JJI1_9EURY Helix-turn-helix domain-containing protein OS=Haloarcula sp. 
Atlit-47R OX=2282132 GN=DVK00_02090 PE=4 SV=1\nMRFIEEIVVDDFLPTFRSLLADALRERGLTQSEVADLLGISQSAVSKYVHGDVARQEDLLAHRGLEELVERLADGLADGDMSPVQALVETEVFIRELEQGGVLAQIHEDAVPELGDYDDEFAVHDPDSQLRAAERTLASVRRGLSVLENTSGFATLIPAVGSNLVQCLPDAESIEDVAAVPGRILDVKGRATIPADPEFGVSEHVATLLLAARTAGSDARAVLNVRYDDGVVAALREAGRTVVEFDAEERVEPAVAAALADDPGVDVLYHTGAMGIEPVVYLLGDDAVSVAETAREIL\n>tr|A0A1D3UJH6|A0A1D3UJH6_TANFO Uncharacterized protein OS=Tannerella forsythia OX=28112 GN=TFUB20_01002 PE=4 SV=1\nMDIGQIRKDVHAYYHSIFNDKYGRYVRILELFPPIKESDCILDYGCGTGCVSQYFYNKYKCKVDAVEQSEIELTKAKISFQRGG\n>tr|A0A4Q7MI29|A0A4Q7MI29_9BURK Enoyl-[acyl-carrier-protein] reductase [NADH] OS=Kerstersia gyiorum OX=206506 GN=EV679_2606 PE=3 SV=1\nMRSANLAGKKGLVVGIANDQSIAWGAARAMRASGAELAVTWYSDKSLPYVTPLFDEIGATLRLPLDVSDTAQQQALFDTLRERWGRLDFLVHSVAFAPRDDLHGRVLDSSAAGFAQAMDLSCHSFIRLARDAEPLMAQGGSMMTISYLGAQAVMPGYGIMGPVKAALEASVRYLASELGPRGIRVNAVSPGPLETRAASGIAGFDSLIKDSMERAPLRHTLDIEDAGALCAFLASDAARAISGSTLFVDNAFHILN\n>tr|G5HTX5|G5HTX5_9FIRM Uncharacterized protein OS=[Clostridium] citroniae WAL-17108 OX=742733 GN=HMPREF9469_06037 PE=4 SV=1\nMGLFGNIIKPLQGKLTTKQEENMKKVAEVFKEKTGKDYQTAVVWKMTTKKKLTKTVYTYYNWIIGYGVNADHIPEIVFIPVDPKWEWIGDPIYCPKTNSEMVQDKKTTLFALKNSQLEDGKMDLQLISSMAMMSNYLMDVNYMFEYDKLNEYCLEHWVGK\n>tr|A0A0Q8RTN2|A0A0Q8RTN2_9SPHN Uncharacterized protein OS=Sphingopyxis sp. 
Root214 OX=1736491 GN=ASE06_19140 PE=4 SV=1\nMPLDGSLGTTNAARATVTIEYSATDRSYTVTTDGRSQTFRPADIDAARSSAAATVYIRTNGGTADVLTLTKPGTSGRLTYQYVAGGFWERTVSGATSTSGSVDGFAYGVETPDAALPRSGTANYGIDLIGVMGYPNSAPSPLAGRGTLYVDFAKGSIVITGEADGGTTFNGTATIASASNNFSGRFEYYSLGSMTGQIDGRFFGPGAQEVGAAWHVKNNGGNAAAGIILGRKNPDTPVNSDFVNIANSQFFENSGVILKATYANGSNNSSNKLTQASDFLVHYDAGYKSYTIVAGDKAEFFGPDRVPDNAAPGSHWTKGIGTTRSTLQFLNGGTHVTGARYVFTDGDATSSFVTSNFFIYGFPTANADIVRSGTSFFKSSIAGSMTDQGYDSLLDIAGPGVIQVNFATGAIDIRGAFDIVYRPITGPRAVGNGSYTGTAQLASSANSFTGSIELAASDTYRGDLSGRFYGPAGKELGAIFKASDSGGDVAAGTITASLDPSANASTKALADLTETTVFISSKAQAGITVDQPSGRQFSLGPPSVSRTGLQPRITYDPQTGSYIVREFGGDHQDQLLETLRFGTADRDTAASDAKFDVFNVASGNTTHRISLLRPGAGNPAIQLTYASFIGLVSKTVEGAPINRDTTRYSYFALGTPTAETLMPRSGTGTYNGLATGYGTVRGIGFAEYDISGTSKLSVNFTSLATQLDLTLAGRNLADGTNFNFGDFIFNGALGYSLVDGQRLNQISMGLKRDTLPPGSSGDAFGHLYGPAGQEHVTPFGMQVRGADGSETVIGGVAYGKRD\n>tr|A0A6N7CL63|A0A6N7CL63_9NOCA HTH-type transcriptional regulator IscR OS=Rhodococcus sp. T7 OX=627444 GN=iscR PE=4 SV=1\nMKISGGVEWSLHCCVVLSQAEGPVPTARLADLHGVSKSYLAKHLQSLARAGLVHPTEGRDGGYVLTRAPGDITVLDVVQAVDGDAPAFRCTEIRQQGLLAAPPEQCKTPCGIARVMADAERAWRSTLSGVTIADLAATLDVTVLKATLEASG\n>tr|A0A678Y985|A0A678Y985_9INFA Polymerase acidic protein OS=Influenza A virus OX=11320 GN=PA PE=3 SV=1\nMENFVRQCFNPMIVELAEKAMKEYGEDPKIETNKFAAICTHLEVCFMYSDFHFIDERGESIIVESGDPNALLKHRFEIIEGRDRIMAWTVVNSICNTTGVEKPKFLPDLYDYKENRFIEIGVTRREVHIYYLEKANKIKSEKTHIHIFSFTGEEMATKADYTLDEESRARIKTRLFTIRQEMASRSLWDSFRQSERGEETIEEKFEITGTMRKLADQSLPPNFSSLENFRAYVDGFKPNGCIEGKLSQMSKEVNAKIEPFLRTTPRPLRLPDGPLCHQRSKFLLMDALKLSIEDPSHEGEGIPLYDAIKCMKTFFGWKEPNIVKPHEKGINPNYLMAWKQVLAELQDIENEEKTPRTKNMKKTSQLKWALGENMAPEKVDFDDCKEVGDLKQYDNDEPEPRSLASWVQNEFNKACELTDSSWIELDEIGEDVAPIEHIASMRRNYFTAEVSHCRATEYIMKGVYINTALLNASCAAMDDFQLIPMISKCRTKEGRRKTNLYGFIIKGRSHLRNDTDVVNFVSMEFSLTDPRLEQHKWEKYCVLEIGDMLLRTAIGQVSRPMFLYVRTNGTSKIKMKWGMEMRRCLLQSLQQIESMIEAESSVKEKDMTKEFFENKPETWPIGESPRGVEEGSIGKVCRTLLAKSVFNSLYASPQLEGFSAESRKLLLIVQALRDNLEPGTFDLGGLYEAIEECLINDPWVLLNASWFNSFLTHALK\n>tr|A0A2N6J824|A0A2N6J824_9BURK Lrp/AsnC family 
transcriptional regulator OS=Herbaspirillum sp. BH-1 OX=2058884 GN=HBH1_03049 PE=4 SV=1\nMELDTTDLRILNILQENSSISNLELASRINLSPSPTLARVKRLETEGIISRYVALADPHLLGLKVNVFVKVILERQGAEALAQFETAVSAFDEVMEVYLMTGDEDYLLRIVVPDLLTLEHFIVDHLTKIPGIKNIRSSFALKQIKYKTALPTPKIKTRR\n>tr|K2Q3C7|K2Q3C7_9HYPH Uncharacterized protein OS=Agrobacterium albertimagni AOL15 OX=1156935 GN=QWE_16493 PE=4 SV=1\nMATILLQAAGAALGSVFGPVGAAIGQAAGALAGSMIDRSLLSGTREVNGARLSSARISGASEGTVIPRLYGTARLGGTLIWATRFEEETVTERTGGKSSGGTRTTTYRYFANLALGLCEGPIAGVRRVWADGRELDTTEIEMRVYRGTESQPADPLIAAKQGADNAPAYRGLAYVVFERLPLDDFGNRIPLIQFEVIRPVGALEEKIRAVTMIPGATEHGYATVRISDAPSEGAKRWLNRNTLVAATDWQASLDELQALCPDLESVALVVAWFGTDLRAGDCRVLPGVEVGYRNEESRPWSVAGLARGDAYVVSRHSGGPAYGGSPSDESVIEAIRDIKARGLKVTLYPFVLMDIPAGNGLPDPYGGAEQAAYPWRGRITAYPPGSDKTASARAQVSSFVYRSDGYRRLVLHYAALAAAAGGVGAFLLGSELRGLTVLRDEANAFPFVEALVALAGEVRGLLGGGTAISYGADWTEYFGHQPPDGSGDVFFHLDPLWASPHIMAVGIDNYMPLADWRDEDLEAESPDGFTGADDAEGFARTLTSGEGFDWFYASEADRRARVRTPITDGAYGKPWVFRFKDLKSWWENPHFNRIGGVEQASPTAWVPRMKPFWMTEVGCGAVDKGANQPNIFVDAKSAESGRPYFSAGARSDSQQRRFLEAHLDHWTGSLLPPDMVDPSHVYAWTWDARPYPAFPQNMALWADGSNWRTGHWLNGRLGTATLADTIAAILRDHGFADFDVSEVAGDLGGYVKGDLTSARDLIEPLLELFQIDVIEDAGRLKFRTRPTASLAAREITVLADIADRPLWSETRGHDSDFASEALVTFYDPASDYVEASVRSRKVEAATDRQLARDLPAAMPEETALAAAEGWLRDNRLARRTVQLALGPQEIVVEPGDVLRFPEGPEGRFLVQGIDEGFERRLTLRAFAGKVSAPVPVVEPGRVVDGGGAAGFAPVVQFLDLPRLEGASHAGDASVAAYGRPWRRLAVSSSPEAEGYRLRLTLDRPATLGRLVEPLLPGPVGRFDGANALVVEVLAGAFASANRMAVLSGANRIAVRTGTGGWEVIGFVEAEEIAVGHFRLTGLLRGLGGTEDAMAAGAAAGAEIVALDEAVRSLGLANAERGAAQNWILEPMGLVSELSGPHVFAGGLRAETPLSPVHAKVRRQATGDLAITWIRRSRIEAEAWTEGEVPLDEAEERYRLEILDGGTVLRVVEVTEPAWTYAGADELTDFGVPQTALGLRIRQLGRLAAGMPLQAVVPID\n>tr|A0A373NFP0|A0A373NFP0_9FIRM Histidine kinase OS=Ruminococcus sp. 
AF31-14BH OX=2293173 GN=DWZ26_10045 PE=4 SV=1\nMIETIMLIVVIFVLSGVFWYSFFYQKEKKLFNRLQQMLDCAIDGELERTEISEEKYSALENSMKQYIDSSFLAKKNQQEQKEVIQKLISDIAHQTLTPISNLKVYGEIISEMSNENQEEIATILEQTEKLDFLIQSLVKLSRMESGIIAVHPEDTAIAQMFASVQQQFNVKAMEKDISLSLFDTDLHAMCDAKWTVEALGNIVDNAIKYTACGGNVQIKTEQYSFFVKIDIIDDGIGIEKEEIPKIFGRFYRSLSVADQPGVGIGLFLAREIIQAQKGYIKVTSKRGKGSTFSVFLPIAKKE\n>tr|A0A538LIU9|A0A538LIU9_9ACTN Alpha/beta hydrolase (Fragment) OS=Actinobacteria bacterium OX=1883427 GN=E6G01_13160 PE=4 SV=1\nEAAPIPGPNGKSLGPSELVDAGLIPTYEPAADSQFYDALSSALNDRPGQMLALAAAYQESVDYPLYASVECIDSPHPEGSAAFRAFAQELASLSPRFGAAIANELLPCAYWSAPVRSVVGPVTAPDAPPMLVIGTTGDPATPYDQAVRVAQTLAHGRLLTFVGDRHAAYGASQCAADAEAAYFVDLTLPPEGTTCTR\n>tr|A0A7K0C3Y3|A0A7K0C3Y3_9ACTN Uncharacterized protein OS=Actinomadura macrotermitis OX=2585200 GN=ACRB68_61920 PE=4 SV=1\nMAVFGVDYAWGRPGAAALKRSGVRFACRYLSHDTGGKNLTRAEAAELSAAGIWLVVVWESTASRALSGRAGGAADAREAARQAAACGMPADRPIYFAVDFDATAGQQAAINAYLDGAASVLGRRRVGLYAGLGPVRRAFDAGKITYGWQTYAWSGGRWDGRAQLQQYSNDHTVNGVDVDYDRAVAADYGQWRVGVSPQEDDMPDYVSVGTTTAQPLPPGAWTTVVWDAEYSDAGRQHADKGGPGVLNGPARYSLTAAVRIVGVPAGTRIQARAIEADAGGFEAGAVQDFTSAGEETNLLYGISADSVAKDRSVRFQVLQHGAQAAAIGGGSAKLLYWRG\n>tr|A0A173CWC4|A0A173CWC4_9NEOP Cytochrome c oxidase subunit 1 (Fragment) OS=Bucculatrix sexnotata OX=687279 GN=COI PE=3 SV=1\nIFGMWAGMVGTSLSLLIRAELGNPGSLIGNDQIYNTIVTAHAFIMIFFMVMPIMIGGFGNWLVPLMLGAPDMAFPRMNNMSFWLLPPSLLLLISSNIVEMGAGTGWTVYPPLSSNIAHGGSSVDLAIFSLHLAGISSILGAINFITTIINMRTNKMSFDQMPLFIWAVGITALLLLLSLPVLAGAITMLLTDRNLN\n>tr|Q0JI52|Q0JI52_ORYSJ Os01g0823700 protein OS=Oryza sativa subsp. 
japonica OX=39947 GN=Os01g0823700 PE=2 SV=1\nMESATEKVRRTPSSCLLLRISDICKVRSVGVAPTVREKPKADGSATGESSEDGGAHLKVHPHHVSDHESVSECSSARCEEAFVERLLDAISGLKLSYVNLQQALVPYDPEEITIADERFTSELQETAGLKDLYVNMNKWRNPMYQCYVGSRIQEQQKLAVELQAGMCKRDSEIVCLRAELDELERKNMELEEKIGQSALQKEGSFAIGMGVSTDMFMELFELSTKSIHDFAKLVVRWMKLSRWNLGNLTSPIDNSVVYDKRSHKNYAVEAYFACMMLMGHKEEYLSLDVFDYVMSFSDPFDALMKAPDSCFGRFCREKYLAILPPSMEDSFFGNLDHRSFVENGGHPRTPFYQAFVTMSRYVWASLTVARSLNPRAEMFYVKGGTEFRSKHMECVPSKITKEGDKVSVGFTVMPGFKIGCTVIRCRVYLSMVNERNF\n>tr|A0A7S0VQU1|A0A7S0VQU1_9CHLO Hypothetical protein (Fragment) OS=Polytomella parva OX=51329 GN=PPAR00522_LOCUS21823 PE=4 SV=1\nKGNQYTNRNYNPHHNDRGDGDEGNSSHCSSDDDGNVDRVATTLKKGNKDSELIDSSFHYREMEVKEERSDTWSGLSNLFHPIASPSAEQILEQLQMIGRTRQLERDRLKQGLQGEESSAESHVAS\n>tr|A0A7N0VGN9|A0A7N0VGN9_KALFE Smr domain-containing protein OS=Kalanchoe fedtschenkoi OX=63787 PE=4 SV=1\nMASSTPPPHCSITTTNPRSHSRTKSNRVVSLTNPTPSAAAAGAPPCCASSKPLCPAKTHPLASASPSSPRNPNFPSLSDFSGRRSTRFVSKMHFGRHKPSPTSSRHTSVAEDALHQVIRVNATDHRALDAVLHAFAPNLSGSDDYTFLLRELGNRGDCSKALRCFDFAVQRERRKNEQGKLATAMISVLGRMGKVDLARKVFDDAAAQGYGNSVYAFSALISAYGRSGYCDDAIQVFEAMKKSGLRPNLVTYNAVIDACGKGGVEFSRAANILNEMLSDGVLPDRITFNSLLAVCSRGGLWEAAQNLFSEMIYRGVDQDIFTYNTMLDAFCKGGQMDLAFQTMSEMNSKNICPNVVTYSTMIDGYAKAGRLSEALNLLEEMKYAGIGLDRVSYNNLLTIFAKLGRFDEVVNVCKDMESSGIRKDTVTYNALLSGYGKQGKYDDVKKVFQAMRHEHISPNLLTYSTLIDIYSKGGLYQEAMEVFTDFKKTGLKADVVLYSALIDALCKSGMVETAISFLDEMTKGGIKPNVVTYNSIIDAFGRSAIKDFQTDSPAEASELQNESSSSTLPPARSQNGNRIGSGFIKILGHLAAEKPCYLKKYDGKPLEILCILAIFHKMHELEIKPNVVTFSAILNACSRCSSFEEVCMLLEELRLFDNKVYGVAHCLLMGCRGSVWVQAQSLFDDVKQMDSSTASAFYNALTDMLWHFGQKQGAQLVVLEGKRRHVWENLWSDSCLDLHLMSSGAARAMVHAWLLNIRSIVFEGHELPKLLSILTGWGKHSKVVGDGTLRRHIEALLNSLGAPFRLAKCNLGRFISTGINTYMIMMLPSL\n>tr|A0A2V6QIG5|A0A2V6QIG5_9BACT 5,10-methylene tetrahydromethanopterin reductase OS=Candidatus Rokubacteria bacterium OX=2053607 GN=DMD80_16590 PE=4 
SV=1\nMRLGLALPNASPEGRPLTGPALIAGTRAVERAGFDSLWCFDSIGRGSMIPDPLIAVSVAATVTERLTLGTGILQVPLRRPVELAHRILTAHLICGGRLLLGVGAGSTKADFDAVGVDFDTRMQQMEEALALMRRLWQGEKVGPAQLNPWPAALGGPKLLIGSWAGSRWIPRAAKDFDGWIGSGARSSVAALRDGIKRFREAGGQRAIATNIPVDLEAPTAPMPEEGQFHLRCDPTTAAQRLRMLADLGFDDAVLVTRRYGDADLAALRALWP\n>tr|A0A7Z7G3P1|A0A7Z7G3P1_9BACL UPF0310 protein SAMN05518670_2319 OS=Paenibacillus sp. OK076 OX=1884379 GN=SAMN05518670_2319 PE=3 SV=1\nMNEQAKHDLMANNTEIQQTHTREFLSHQLDIEAESDEGNRYWIGVVSASHVEKGVEGGFAQLCHGKVASLRRMNAGDWLIYYSPRTSMQGGKVLQAFTAIGRIIDDQVYTYHVSDSFVPHRRNVHYYPCQQVKIADLLDQLILTRGQARWGYPFRYGHLQIQREDFLKIAVAMLGTEAENLLTGNKKN\n>tr|A0A1I0CXW7|A0A1I0CXW7_9FIRM D-alanyl-D-alanine carboxypeptidase OS=[Clostridium] aminophilum OX=1526 GN=SAMN04487771_100922 PE=3 SV=1\nMKSNLFHWKRYLWILSAAGILTVSATPAVVFAAPETGAASTAAQSGSEASAIAETTETATKALYGTSPQQAQSARVASIAAQAAATAGTGEEASAAVASIAAAAAETAAQEVTEDAQAWPSDTGIFSEAGVVIDVDSGCVLFGQNMHQQKAPASITKILTALVVLEHVDNLDQMIPYSHDAVYNTESGSGNKYGLDEGDSLSVRDALYLMLLASSNQSANALAEYVGGTREGFVQMMNDKVAELGCRDSHFANPSGLNDDTQLTSCYDMALIGMAAYRNERLLEIGSTRSHKITTPTKNNPNGINVKMEHKLLITEDPNSENYYPFAVAGKTGYTSIAGQTLVTYAVKEGRRLIAVTMKSRQKTHYTDTINLLEFGFNRFENVPVAEQETAISQASGNVTLGDSTFDAADLSVEETVMTVPKNLSVTDLERTVLTGEDMPAPAPDGAAAYIQYSYRDRVTGGAYVTAESLRAKETGATGTEGNRRTKAESGDNIFSKAAKGIGSFFAGIGDAVRNLSVPGIIAIAAVAGLAILTVIAFFTYSVQKRRENERLERRRTRLREMGVSEEEFAEMVGRRRRSRGEKNSSRDFSAETYRVTEAGNSPADHHGRAEDVKSPAVPQTEALKTETPENPDDSFLDEDFGMDGELITEEDPEKRQPHV\n>tr|A0A445NDM6|A0A445NDM6_STRNE Putative glycosyltransferase EpsJ OS=Streptomyces netropsis OX=55404 GN=epsJ_2 PE=4 SV=1\nMVKLSVIVPFFNVQTYAPDTLRSLRANARADFEFILVDDCSTDETPDILRRAERELPGAVLVRHEKNGGLATARNTGLERARGEYITFLDGDDWLAPGYYEQLLDVIEGLGVEFVRTDHVQCTARARTVHRVPHGRRGVVLSPRDAILPADRSTSVDYAYAWAGIYHRRLLDEGLLHFRHGLRTAEDRPWIWRLHREARTFAVAGLLGVFYRRGVASSLTQIGDVRQLDFLRAFDQVIDETSRDADAEILLPKAVRTYCAIISHHLGSIERFEPAVARTLRSKSAAALRRMPQDLLKDALNSMDDDRAARLRRLRRRPAPAGVTG\n>tr|A0A1G5TNQ2|A0A1G5TNQ2_9HYPH Uncharacterized iron-regulated membrane protein OS=Methylobacterium sp. 
UNC378MF OX=1502748 GN=SAMN02799622_03000 PE=4 SV=1\nMSRARSFRQSMAWLHTWSGLVVGWVLFAIFVTGTASYYRTDISHWMRPELSDSSSDPAAAATRAGAFLQKAMPNAAGWSVRLPNAENPAVEVYWWPHPGGPYHHALLDPATGEPARVRDTRGGDFLYRFHFELSLPPIWGRWIVSVCAMILLIALISGIVTHRRIFADFFTFRRDRSAQRGWLDAHNVMGVLALPFHLMIVYTGLVTLSAMLMPWGMKAVYGNDPLRYYAEAGLATPGVAPAGRPGTPLPLGELVARAAAAGGAVPEVMLVTRPGDAGATVTAYFEEPMGLAHLHPQIAYGADTGSEIARVGEPGAATRTGAVMAGLHEAHFAAAPLRLLFFLCGLMGAATVASGLVLWTVARAPRGADPEGFGLRLVRLLNIGTIAGLPVGLAAYFLANRLLPLGLEARADWEIRVFFAAWITAAIAASLYPRRRAWSVALAVPACAFLVIPVIDAVLVGQPRFLAFDAAMAVVGLALVAGSRLAARPRPAESRLVEANLSRTVEA\n>tr|Q71P98|Q71P98_9BRYO Protein PsbN OS=Homalothecium laevisetum OX=184649 GN=psbN PE=3 SV=1\nMLTLCTIILIKLIKNKPFFWNYLKMETATLVAIFISCSLVSFTGYALYTAFGQPSKELRDPFEEHED\n>tr|A0A3B0J0J5|A0A3B0J0J5_9RICK Uncharacterized protein OS=Wolbachia endosymbiont of Aleurodicus floccissimus OX=2152762 GN=WBAF_0556 PE=4 SV=1\nMRLKLAYTNTIHLKHDFNIGDIETKKLCHSKIMLRFQEKAVSSQISCVTEINFGRIAIATANDKQASVYYIFKQNVKHMGNHVLFKVRVGRVATHIFVSDPNLAKIIKCLTIRVMIYIIMAII\n>tr|A0A4T0N0J3|A0A4T0N0J3_9BASI Tudor domain-containing protein (Fragment) OS=Wallemia mellicola OX=1708541 GN=E3Q01_03257 PE=4 SV=1\nSAEEISQYELQLEQVKETLTADPTNAELIGLKDELSNLIDLLKASTAPAQTAPSTSEQPPQSKGKDSKDVKIFKAGEDIMAKYNDGKFYPAIVKAVSGIHPKIVYTINFRGYEGTQQVQPNQIKAMDPHTKISLTNKRQRDSQKSLTSIEDEKERERKRKKSEKKAEAREQKNSEMNNKQNNWQKFAKKANKKGIHIAGSEGRSIFKTPDNPYGRVGVTGSGKPMTEQKSVRDKHVFVPTLEDQ\n>tr|A0A2I2A5J4|A0A2I2A5J4_9GAMM YigZ family protein OS=Hydrogenovibrio sp. SC-1 OX=2065820 GN=CYQ88_04895 PE=3 SV=1\nMAYLEPVNAVVEETEIKKSRFIAYAKKVVSRQQAMEYVSELRVAYPDARHVCWGYVIGDPNNSTNSGCNDDGEPSGTAGKPILSQIHYSNIGNVVVVIVRYFGGIRLGAGGLVRAYRESAQKGLKALQTEDYIPKLELSLDCPYEEEALIRRVMASLQGEITDAIYTTQVNLLVSIPTHSLTLLQDQLASLSATIIEN\n>tr|A0A7W8SVI5|A0A7W8SVI5_9BURK Membrane fusion protein (MFP) family protein OS=Paraburkholderia sp. 
WSM4180 OX=2723099 GN=HDG39_006657 PE=3 SV=1\nMNFNIFKRGKKKAKLTKGDAAFMSDIRESLLTQSTPGSMIMLYVILTVLAGGLTWAYFARVEEITHGEGTIISKSREQVIQSLEGGILEQLDVREGDIVKKGQVLAKIDPTRAETSYREAWSKSVGLKATIARLRAEAYEQPLTFPDDVKAVPTVVKQETLAYNARRRALNDSVTALEKSYSLSNKEIGLAEPLAAKGLVSEVELLRMRRQANELRSQIVERRNRFQADANSELTKLELELAQTSETVVGRADVLQRTTVIAPVYGTVKNIRFNTIGGVIQPGEHIMEIVPLEDQLLVEARIKPSDVAFLHPDQPSTVKITAYDYGIYGGLKGTVQHISPDTLKDDQKAAAGRPDATYYRVLVLTDSSELHAGGKSLPILPGMVATVDIRTGEKTILDYILKPIFKAREAFRER\n>tr|A0A421K520|A0A421K520_9GAMM Alpha-amylase OS=gamma proteobacterium symbiont of Stewartia floridana OX=1968599 GN=B6D75_05870 PE=4 SV=1\nMSVDELDTRLLGHLSLLYGEQQAATLLPKLHELIGRHIEVRQGKRLEIPRWDEKDSVLIGYGDSIQYPGMTPLASLKQFLDRRLNGVFSMVHVLPFFPYSSDDGFSVSDFRSVNPELGDWQDIRELGENFSLLFDLVLNHMSREHLWFVNFVHDEEPGRDYVVQVSPDENLSMVVRPRSTPLLSRVRTPRGMLDVWATFSNDQIDLNYANPEVLLEFIDILLDYIRRGARAVRLDAVAFLWKEIGTSCIHLPQTHEVIKLFRTLLDVLEPGAILLTETNVPHQENISYFDQGDEANMVYQFSLPPLILHAIMCQTTEFLVPWARSLEQETLPEGCTYLNFTASHDGVGLRPLEGLVPDEDLDELLDMMRRRGGYVSMRATTEGRDRPYELNISYFDAFAAEDDDVDPWHIARYMLSQTLPLSFRGIPAVYINALGATPNDPLGVERTGMTRSINRRKWDGAELERLIDLPLTDAGQVFPEYIRRLRIRSGIKAFHPDAPQRVLDMPDGILALERTSLDGGQRVYAIHNMTGDLRSVDISALGGASRRWFDALHQVVPDMDGDGVRFRPYQTVWLMAKG\n>tr|A0A182WP14|A0A182WP14_9DIPT Uncharacterized protein OS=Anopheles minimus OX=112268 PE=4 SV=1\nMSPCVNFRLANLLSHKS\n>tr|A0A6P5JSA5|A0A6P5JSA5_PHACI probable aminopeptidase NPEPL1 OS=Phascolarctos cinereus OX=38626 GN=NPEPL1 PE=3 SV=1\nMANVGLQFVASAGDGDPQSRPVLLLGQLQNLHRVPWSHLRGKLQPRVTEEIWQTALGTLNPNPTDSCPLYLNYATVAALPSRVSRHNSPSAAQFITRLVRNCLPGGTNRCILMVCERSEVFASACALARAFPLFTHRSSASRRTEKTVTVEFFLVGQNNGPVEVTTLKCLTSATEGVRLAARIVDTPCNEMNTDNFLEEIKKVGKDLGIVPTIIRDEELKQRGFGGIYGVGKAAVHPPALAVLSHMPEGATQTIAWVGKGIVYDTGGLSIKGKTTMPGMKRDCGGAAAVLGAFRAAVRQGFKDNLHAVFCLAENSVGPNATRPDDIHLLYSGKTVEINNTDAEGRLVLADGVSYACKDLGADIILDMATLTGAQGIATGKYHAAVLTNSEEWEAACVKAGRNCGDLVHPLVYCPELHFSEFTSAVADMKNSVADRDNSPSSCAGLFIASHIGFDWPGVWVHLDIASPVHAGERATGYGVALLLSLFGGASEDPLLNMVSPLGEDADPQGDMERDCKRRRLV\n>tr|A0A5J6X1V6|A0A5J6X1V6_9GAMM Histidine kinase 
OS=Aeromonas simiae OX=218936 GN=FE240_18420 PE=4 SV=1\nMPRSLLSRMLLLLLLAILLSQTILTGIWMQQIQKRELDGMLSTTRNLAMSAASTVSFFKSLPLQYRHIALDQLRNMGGSRFFVSLNEEEIRINPIPDSERKTMVLSEVKAILGNKLSDTMAIKVNFSHPEDLHVFNNDTLLADLPSSWARYTLSLEPINPPVLVIQIEIKRGEWLYLAALLPAPYMTLDDTVMPANQVRFIALMTVFLCFFTFLLVRWQTRPLRRLAKAAVNLGKDIDQPSLKEEGASEIVAATRAFNIMQHRIRRYIGDRELLFSSISHDLKTPITRLRLRVELLDDETQITKFNKDLDELELMVKGALQTVKDTDIHENMAQIDVDGMLHQLAESLNLREERLTIEGHCKHPYRGKPLALKRCIANLVDNGIKYGKKVRIIILDDDEMLILFIMDEGPGLPEEQIERIFEPYYRFDTEKPGNGLGLGIARNIAHAHGGDLVLENRPTGGLQATLSLPRQ\n>tr|A0A1Q6SWC2|A0A1Q6SWC2_9FIRM Aspartate--ammonia ligase OS=Subdoligranulum sp. 60_17 OX=1897022 GN=asnA PE=3 SV=1\nMSHITIPEGYQSLLGLYDTQKAIGLIKTIFQEKLCMALHLKRVTAPLFVMQGSGLNDDLNGVERPVSFDVPSLNEQAEVVHSLAKWKRYALYKYGFRPGQGIVTDMNAVRRDEELDNLHSIYVDQWDWERVITADQRTLEFLQETVRDIVDAVCATSDELRWKFPELKNNIHLGREVAFITTQELEDRYPDFTPKQRENAFAKEHGTVCIMQIGGRLKSGQPHDGRAPDYDDWTLNCDILFWHKPLDCALELSSMGIRVDADALRRQLDAAGCPQRAELPFHKLLLDGTLPLTMGGGIGQSRLCMLLLGKAHVGEVQVSLWDDATVQACRNSGVELL\n>tr|A0A7W1W6Z4|A0A7W1W6Z4_9BACT S46 family peptidase OS=Acidobacteria bacterium OX=1978231 GN=H0X49_12420 PE=3 SV=1\nAAENLFNKFEGKERRSAEETFAESIAERENFDTPEKVIKLYDLSLSDLQKRYPNIVEFMTALGQEKSAVTARTAKFNGEIDRLRLLYQQGMAEMKGIQPYPDANSTLRFTYGNVRGYSPREAVTYSPFTTLRGMIEKDSGEIPFDVPQKLIDLQRTKDFGRFGVGDTVPVNFLATTDIIGGNSGSPIMNAFGEQVGIVFDGNYEGLGNDLFYNEAVGRTIAVDIRYVLFVTEKFGGAGWILGEMNIKGRTPVKARSAAAE\n>tr|A0A1Z2QUG4|A0A1Z2QUG4_9ASTR Ribosomal protein L14 OS=Legenere valdiviana OX=2010882 GN=rpl14 PE=3 SV=1\nMIQPQTYLNVADNSGARKLMCIRIIGASNRRYAHIGDVIVAVIKEAVPQMSLERSEVVRAVIVRTCKELKRDDGMIIRYDDNAAVVIDKDGNPKGTRVFGAIAEELRQFNFTKIVSLAPEVL\n>tr|A0A239R358|A0A239R358_9FIRM Exodeoxyribonuclease III OS=Lachnospiraceae bacterium OX=1898203 GN=SAMN06297422_103139 PE=3 
SV=1\nMKLISWNVNGIRACVNKGFMDTFNTLDADILAIQESKMQKDQLILETPGYHQYWNYAKKKGYSGTAVFTKKEPLGVTYGMGIEEHDQEGRLITLDMGDYYFVCVYVPNSQNELKRLDYRMKWEDDFRKYLNDLKAEKPVIICGDLNVAHEDIDLKNPSANHRNAGFTDEERGKLTELLESGFTDSFRKLYPDMTDIYSWWSYRFNARERNAGWRIDYFLVSDDIKDKISEAGIHTDIYGSDHCPVELDIDL\n>tr|A0A498QHK7|A0A498QHK7_9MYCO Uncharacterized protein OS=Mycobacterium attenuatum OX=2341086 GN=LAUMK136_05508 PE=4 SV=1\nMPHAESTVGPALMVAHSGASSHASAPGRDRLEPRAVSRELRASDPEVWQTGLHAASEDAPLRVVGNTPSGMFVDGRRKGSVTVSDKTIVRFGDPTGGKALTFEVVRPSNSPEEQRREQRPSDQSDGHTGEADPGVVRAGAAAAARRRELDISQRSLAADGIINAGALIAFEKGRSWPRERTRAKLEEVLQWPPGTIARIRQGESVGYQAPSPTAQADDEAQPTEGPASLIAQAVAAAVDTCSLAIAALPPPEDPEFTERAAPILADLRQLEGIAVQATRISRITPELIKALGAVRRYHDKLMTLGATAPGATLAQRLYAARRRANLSTSETAQAAGVAEEMIVRAEAEEALPAEAAEAIEALIHQIN\n>tr|X0B5K4|X0B5K4_FUSOX Uncharacterized protein OS=Fusarium oxysporum f. sp. raphani 54005 OX=1089458 GN=FOQG_17891 PE=4 SV=1\nMVGRPKETSACSGKSGPGSRPDNPVGRGSVWGPEEGSSPARNRASARGTAGRLSMSSRSLYTGRRGRTRMSVGQEDGI\n>tr|A0A345E3A3|A0A345E3A3_9EURY Sodium:calcium antiporter OS=Haloplanus rubicundus OX=1547898 GN=DU500_09665 PE=4 SV=1\nMRRQALTALGGAAALTLPWVVTYLSGMAHSLATGTVVLVSGLSVLGASFLLAWGAETAEKDVPRAFAIAVLAVLAVAPEYAVDALYAWNAGVHAGTARGVEAGNLAVANMTGANRILIGIGWAGIALFTVYRAGSGDDPAVESRSGFLADAVTLDHDIGLEIVFLFLATLWAFLVPLGGGIDILDMAFLVGLYIAYIAVILKGDVDPDEAHVGVPAYLQRFPKPYRAATVIGLFVYSGLMIFTAVEPFAHGLEQLGQNIGIPSFFMIQWIAPLASESPELIVVVYLVNKARSTAGFNALISSKLNQWTLLIGTLVVVYSIALGQYGALPFDQKQSGEIWLTAAQSFFAISLLVNFEISVREAIVLLVLFLTQVLSEFLLIRGILELPISDYQLLLVFTGIYIVLGTTLFVARRHALGSIVRDSAGTVSDAFSSSGEPRGAD\n>tr|A0A1E5AGD2|A0A1E5AGD2_9RHOB Peptidoglycan-binding protein OS=Rhodobacteraceae bacterium (ex Bugula neritina AB1) OX=1868286 GN=AB838_08000 PE=4 SV=1\nMTPPRSLLRGRQAPPLLLALLATLAACVQPQPGGPGSETGRYAPPGAAPGTCWSKHTAPAVIETVTRQVLAEPEQQDANGRVIRPATFRTETRQEIVRPRQEQWIEIPCPAMMTPDFIRTIQRALTARGLYRGPVHGRMDAATRRAVQRYQAPLGPDSGTLTLTSARRLGLVAVPG\n>tr|A0A0K0DCJ6|A0A0K0DCJ6_ANGCA Ge1_WD40 domain-containing protein OS=Angiostrongylus cantonensis OX=6313 PE=4 
SV=1\nMGMGDPCVPADHLSPSLARIGAYTAQNDITITLLIIGRSCIVNLGAILFTSVSVIYSSTLDGSDGVIKFANGNNVRALKGRFLTVQGDLIAFRFFNEHTGDVIRIINRVSRNRRLIKGFSKAPVDLCFATHLPLLAVVDGESNLHVYSVASDCQDVETYINIMNWPGSTSNSTPRVVWCPYVAENPSDPSDVVNMLALSKKNSVYVVNLSILKERGSRMTFEEALAVEEAVLSVEMEEDVTAVCISPDSTAVAIARADGVVSFYVMNSNESGLKFAHTWNPQMNRPIVELFFLDGARHIKNQEQFWRHCLVVAEGGRRLALFECENWRCLGRVRFESSVEMATFAVHVDPQARYVHILDIDGSNVFCIELEYSDHPRFAGVTQVTFSHPIIAIVPYEHVYIFIEYSLDDEFDGDRTRNEVLAHYIAIGHRSLLQLDVHLELAELPKPNVDVVPLIKTDAGRDEAERNNEGPSNLLTMVHPPAMNSTSTITYEKLLELVKDMSDKIEQLSVRVERADIERRSAATNEHILSQLQCFKEEFSLREDRLLANVSDLIETNHRETINVVRNALNENSVAVENSIQANHKVFFSAVLCELFTYDMNITYLLLCFLKIVDNLKLPYCSSA\n>tr|A0A1P8LAL0|A0A1P8LAL0_9INFA Polymerase basic protein 2 OS=Influenza A virus (A/Washington/101/2016(H3N2)) OX=1936961 GN=PB2 PE=3 SV=1\nMERIKELRNLMSQSRTREILTKTTVDHMAIIKKYTSGRQEKNPSLRMKWMMAMKYPITADKRITEMVPERNEQGQTLWSKMSDAGSDRVMVSPLAVTWWNRNGPVTSTVHYPKVYKTYFDKVERLKHGTFGPVHFRNQVKIRRRVDINPGHADLSAKEAQDVIMEVVFPNEVGARILTSESQLTITKEKKEELRDCKISPLMVAYMLERELVRKTRFLPVAGGTSSIYIEVLHLTQGTCWEQMYTPGGGVRNDDVDQSLIIAARNIVRRAAVSADPLASLLEMCHSTQIGGTRMVDILKQNPTEEQAVDICKAAMGLRISSSFSFGGFTFKRTSGSSVKKEEEVLTGNLQTLRIRVHEGYEEFTMVGKRATAILRKATRRLVQLIVSGRDEQSIAEAIIVAMVFSQEDCMIKAVRGDLNFVNRANQRLNPMHQLLRHFQKDAKVLFQNWGVEHIDSVMGMVGVLPDMTPSTEMSMRGIRVSKMGVDEYSSTERVVVSIDRFLRVRDQRGNVLLSPEEVSETQGTERLTITYSSSMMWEINGPESVLVNTYQWIIRNWEAVKIQWSQNPAMLYNKMEFEPFQSLVPKATRSQYSGFVRTLFQQMRDVLGTFDTAQIIKLLPFAAAPPKQSRMQFSSLTVNVRGSGMRILVRGNSPVFNYNKTTKRLTILGKDAGTLIEDPDESTSGVESAVLRGFLIIGKEDRRYGPALSINELSNLAKGEKANVLIGQGDVVLVMKRKRDSSILTDSQTATKRIRMAIN\n>tr|A0A0A9C7I2|A0A0A9C7I2_ARUDO Uncharacterized protein OS=Arundo donax OX=35708 PE=4 SV=1\nMRSKSARMRRLVPPTTFSRYRETSSGGRRKQSVLTTTKDCSSMGLWAIRGEHSLVLCSTSFLWVPAVRRVSAAGPPLAFPL\n>tr|A0A834SHI8|A0A834SHI8_9FABA Uncharacterized protein OS=Senna tora OX=362788 GN=G2W53_041746 PE=4 
SV=1\nMVGSLKPSRITRRKTCCASEPNTSVRVVFAIRSGFDAPIGVVLAWEERGSCLDIFRTRNRGRISKTLMDYEAKDLLLGVVLAWEERGSCLNIFRMKNHGRISESFMNYEAKDLLRKSADHVLTYSGRQIMVGSQKPSRITREKTCCASESNTSVHVVLANRTGFDAPIAVVLAWEERGSCLNIFWMTNRCRISETFTNYVAKDLLRKSEDHVLTYSGRQIKVGSLKPSRITMQKTCCASEPNTSVRVLFAIRSGFDAPIGLVLAWEERGSCLNIFWTTNRGRISETFMNYEAKDLLRNESNTSVRVVFATRSGFDAPIGVVLAWDESGSCHNIFRTTNLGWISETLTNYEAKDLLRNRLGMGGTWIMSELIPDDKSRSDIRNLHELQGKRLVAQSDLRNLHELRGKILSAQVSQTRWFPLYLRTGVVLMLQLESSWHGRSVDHVLTYFRMTNRDRISETFRNYEAKDCCANESNTSVRVVFVNRSGFAAPIAVFMAWEERGSSLNLFRTTIRSRISETRPFVLYLRTIVVLLLQLESSWHGWSVDLDLTYFGRKSRFKISESFTNYVAKDLLRNRLGMGGVWIMPYHITDDKSRPDLRNLHELRGKRLVALVSQTRRFALYLRTGVVLMLQLESSWLGRSLYHVLTYSERQIMVGSQKPSRITRQKTCCANDSNTSVRVVFANHSGFDALIGVVLAWEERGSCLNIFRMTNSCWILETFTNYEAKDLLRN\n>tr|A0A7T9DJD5|A0A7T9DJD5_9ARCH Uncharacterized protein OS=Candidatus Diapherotrites archaeon OX=2026736 GN=IPJ89_04390 PE=4 SV=1\nMSASFKVVIILTAEAHHAEVLSGIHKQFKDFFDYSEQAVYIYLDDHHVVWNKKFGELVGYATPAAAFKSKKHFLELFVDASSQKKLVKAFSNAMESGAGSSNTIVWKHKSGKKKKTTTILVPIPYDGHLLALHFIQ\n>tr|A0A8B6DBA9|A0A8B6DBA9_MYTGA Uncharacterized protein OS=Mytilus galloprovincialis OX=29158 GN=MGAL_10B009134 PE=4 SV=1\nMTTVPTTSELTTEPTTSEMTTEPTTSQMTTEPTTTEMTTEPTTSESTTEPTTSEVTTELTTSEMTTEPTTSELTTVPTTSDMTTERTTSENQNRTTTSELTTEPTTSELTTEPTTSEMTTEPTTSDVTTVPTTSEMTTEPTTSELTIEPTTSDMTTEPTTSEVTTVPTTSEMTTEPTTSEMTTVPTTSEVTTEPTTSEVTTEPTTSDMTTEPTTSESTTEPTTSDMTTEPTTFEVTTEPRTSDMTTEPTTSELTTEPTTSEITTEPTTSEMTTEPTTSDMTTEPTTMR\n>tr|B7M9W0|B7M9W0_ECO45 Uncharacterized protein OS=Escherichia coli O45:K1 (strain S88 / ExPEC) OX=585035 GN=ydgC PE=4 SV=1\nMGLVIKAALGALVVLLIGVLAKTKNYYIAGLIPLFPTFALIAHYIVASERGIEALRATIIFSMWPIIPYFVYLAALWYFTGMMRLPAAFVGSVACWGISAWVLIICWIKLH\n>tr|A0A7X8AQI6|A0A7X8AQI6_9ACTN DUF2142 domain-containing protein OS=Propionibacterium sp. 
OX=1977903 GN=GX412_13535 PE=4 SV=1\nMSRLARALVAIAVAAAALVVGVAWSFASPPVSSPDEDYHLGSIWCPPPAEESGCRMGTVDGKPVVWVPEVMAQRPCYVGRLGDSAACQDELSATELVPSIRFDQGDYPGQYYRIMHAFVGPDLDRSVLTMRVVNVVVAVLLVGAALVLAQPHAGRAATYALFAGLVPTGVFIVASVNPSSWAFVGLTTLWIALNSLAQASGTALRVANGALAVSGAVLASVARGDTGPFVAVIVLALGLLHVRRRPDRGWLAVAAITLAVGAWSYLGSGQAGVAPTVTDVEGRNFGEVLAHNLVEILQVPAGILGVGPWGALGWLEIPMPTSVHVPTISLAGMLLFQGLRRLDRRKALALAVVAGALLALPFYMLMRNLEIAGIQPRYVMSLLPLLFALCLLHPGAVAAYRFTRAQAVLAWVMVTTAHSVALLTTLRRYVTGLDGSYLLGRGGEWWWSSGPSPLAWWLAGSAAYGLAALTLVATAGIERPAASVGRHE\n>sp|P36783|VE2_HPV14 Regulatory protein E2 OS=Human papillomavirus 14 OX=10605 GN=E2 PE=3 SV=1\nMENLSDRFNALQDQLMNIYETAANTLESQIEHWQTLRKEAVLLYFARQNGVTRLGYQVVPTLAISEAKAKQAIGMVLQLQSLQKSQFGSEPWSLVDTSGETFRSAPENHFKKGPVSVEVIYDNDKDNANAYTMWKHIYYQDDDEQWHKSASGVNHTGIYYMQGTFRNYYVLFADDATRYSKTGHWEVKVNKETVFTPVTSSTPPESPGGQADSNTSSKTPTTATDSTSRLSPADSRKQSQQANTKGRRYGRRPSSRTRRTTETRQRRRSRSKSRSRSRSRSRLRSRSRSQSSERRSRYRSRSRSRQKEVSRITTTTRGRGRGSSSTSSKRSQRARGRGRGGSRGRRSSSTSPTSSKRSRRESESSRQRGISPSDVGKSLQSVSSRNTGRLGRLLDEALDPPVILVRGDPNTLRCFRNRAKQKFTGLYRAFSTAWSWVAGDGTERLGRSRMLISFFSFNQRRDFDQTVKYPKGVDRSFGSFDSL\n>tr|A0A7Y4GUD3|A0A7Y4GUD3_9BRAD NAD(P)/FAD-dependent oxidoreductase OS=Bradyrhizobium australiense OX=2721161 GN=HCN58_21515 PE=4 
SV=1\nMLNKVNKPKLVVIGNGMAGVRTVELLLDRAPDLYDITVFGSEPYGNYNRILLSPVLAGEKTVDDIMLNTEQWYDDNGITLRKGEMIEMIDRRTCEVVTREGARVPYDRLLIATGSNPIMLPLPGKDLPGVIGFRDIQDVEHMVQASTSYKNAVVIGGGLLGLEAANGLMKRGMNVTVVHLLDTLMERQLDQVAGGLLRKSLEERGMVFKMPAQTEAILGEDRVTGVRFADGEVIPADLVVMAVGIRPNVELARKAGLYCERGIVVSDTMQTYDGRIYAVGECVQHRRQTYGLVAPLFDQAKVCANHLAMKGFATYDGSVVSTKLKVTGIDLFSAGDFAPGADKEEIVMQDASRGVYKRIILRDKKIVGAVLYGDTIDGPWYFQHLRDGTDVSQMRERLVFGAANLGDGGHSGKNSVAAMSDDAEICGCNGVCKGTIVKAISEKKLFTIDDVRAHTKASSSCGSCTGLVEQVLAFTLGGDYSAAPKVKPMCACTDHSHDDARRVIVENGLKTIPDVMKFMDWKTPNGCHSCRPALNYYLLATWPGEYRDDQQSRFINERVHANIQKDGTYSVVPRMWGGVTTPDELRAIADVADKFNIPTVKVTGGQRIDLLGVKKEDLPAVWADLNDAGMVSGHAYAKGLRTVKTCVGSEWCRFGTQDSTGLGIKLEKFMWGSWTPAKVKLAVSGCPRNCAEATCKDVGVVCVDSGYEIHFAGAAGLHIKGTEFLAKAATEEETLEIIAALTQLYREQGWYLERMYKWCDRVGLDAIRNQVVDDVANRKTLFSRFTYSQQFSQSDPWAARAQRGVDRNEFTPLAELELA\n>tr|A0A4P7ND20|A0A4P7ND20_MAGOR Uncharacterized protein OS=Magnaporthe oryzae OX=318829 GN=PoMZ_04838 PE=3 SV=1\nMAFAHQLGAARLLLRQHRFGLAQSSCRRNMATLSQKLSNEPAVIKPSAAEIKNKTLSSRNLEIAVRHLHADGLVVVEDAVPHADLDALNAKMVPDARYLQSLGENGPFNYNQGNLQQDPPPVAEYFFPSIFTNKIATQITSSILGPRPKWTFCSANSAMPPSSPDSPPQRQPVHSDADFDHPHHPFALVVNVPLVTMTLHNGSTELWLGTHHLSDLSAQEGAHGERASGRIKQRLLDARRSTRGPCQPVVKKGSVVVRDLRLWHAGMPNLSRDEVRVMLAFIHFAPWYRNPMRLRLGEDVKARIEDVAAELDVPVDWVGREEVLGEYLRRGFGNSYDFGQEA\n>tr|A0A3D1Q1J9|A0A3D1Q1J9_9FIRM MFS domain-containing protein OS=Lachnospiraceae bacterium OX=1898203 GN=DER20_01345 PE=4 SV=1\nMAKNVERLQAREAKELIRREKQLGARSNKFYLIYLFMILSLIYITDEIASTISIQFQANIVTEFFVKNMGMEYGAGLSLFSAIGFISYPVTLLIIFYRPLADKFGRKPFLVINTLCMGLGLFLVYLSKDIYVYMIGGTLMGFMVSHDMQCVYILECSDAKSRARNYAIVKAVAILGTLLVPLLRATLMQNVSERWHVVYLVPAIVGFVMSLFALLFAKETNAFLIKRIEYLKTPIEEREQRSKEGREQNAQGGILTAVKFAFKHRQLRFLIIACCCFYLASLGTATYSTVMAKSALMTEEEITLALFLYPVGNALFTLISGFVSDKFGRKVTIVAMSCSALTCYLLFIFSGMFKWTPYLTGFAIGGFMGSYWGAGDTIGGIMFSESSPTNLRSSVTVINTLLNGVMGGLATVITMILLPIIPERMFGYMYLGLTVPGLVGAIVIMWLFVGETRGLDLKTVTGTEWDKPKKVKEEQQEGE\n>tr|A0A484R0A0|A0A484R0A0_9ZZZZ Uncharacterized protein OS=plant metagenome OX=1297885 GN=ANDA3_0622 PE=4 
SV=1\nMTPCLLLRGMCGDLMWAGRGRIAEKRGEMAPLRHRGKSLVSFAGAALRGTPAWCAMPRRRACRHRLRHQFGAGMSTR\n>tr|Q5DYX4|Q5DYX4_ALIF1 DUF4123 domain-containing protein OS=Aliivibrio fischeri (strain ATCC 700601 / ES114) OX=312309 GN=VF_A0952 PE=4 SV=1\nMHEQSYLVVNPLEDKEVIERFYHYGGGNAFPLYLDTEFDAQKEIGPWLLPYPPKEFLAYFANKPSGFRIYFSDDIETHIQHWKSLTFAGLDGELVLFRYYDRVVLEAMLVSFNQKELSLFLGSSECIEIISSVGSLCSYENSASQVSYKSEPWWKIEKHHSSYSVERHAWITERLAWQRLPSLMKEIYEKNSDIQSQLINHLIEGRAHRLENEELEAYSMNMLIKDSKQQSHDIYEAWYLDSAQIKTVKQVENLVTRSELQQGTQI\n>tr|A0A132B1M6|A0A132B1M6_9HELO S-adenosyl-L-methionine-dependent methyltransferase OS=Mollisia scopiformis OX=149040 GN=LY89DRAFT_633225 PE=4 SV=1\nMHDDEEDTNAIEAESSDGFDGDSAYAGSSAGSLTETLASTIARGIEEHGRTYAAYGNEEYGLPIDEEELDRIDMSHAKYSMLLEKRLFVAPINPQPQRVLDIGTGTGIWAIEMADKYPSAEVLGLDIAPTQPSWVPPNCIFQIDDVEMPWTLGVETFDYIHARDLLLSIRDWPRLVEQSFDHLKPGGYLELQCVYPRIRCDDGSTPPQTGLEQFSAHAQEASVRIGCPLDACTRYAEYMSSAGFEDVVEKRFKMPSAPWAKEKRMKLIGAFEMHNLLKGISGMSLRMFSKGYGWSREEIEVFLVQVRKDIQNLKYHTYYEFIVVYGRKPGGSGATANHSSV\n>tr|A0A6H5HNS4|A0A6H5HNS4_9HEMI Uncharacterized protein OS=Nesidiocoris tenuis OX=355587 GN=NTEN_LOCUS22830 PE=4 SV=1\nMIDDLRFLRLSAIPPWETFTLSIVRLLNPFRPMGPSCVIAFKDVFSFHQSLVITCHFGSTWKLCTTAPFSPTNDPHNWIIIGLHWSHNEPYCGMEMIPASLHCRRVTALRKFTRWQQLKEPATISWRILVKTVVIAGLLSVFIDQCERETILNCKGSGAHGRSIWRVEFGHNGDRFLRPSLVVFEDDTDMSFDLDVEYLTPHGSTAPWNPLLVSHRCFLEALFHSSGTQSEVQNRFISEYAEGLKSWAVISVGIVSTVLLNLIMVKQNKKSEARLLDEQTNYEGEFPFPVPDSVFADVERRTSTKRATKNSSGDIINIEPPVKTDRRMSGDHAFTTDPLEEQARSSPRVVAWGPIDRKTPSQMSNINKDPTIQQNLEGITEMKGSPEIYPSKEFSRRISQEGPSGAQRPSNAMSPMVAANPKGVHTFTDSSKSSLGSQVTSDMSMSMTSLSWVDATVEREPFEYKDEQLPRERGNPTNRSV\n>tr|A0A5W0I3M7|A0A5W0I3M7_SALTM Transcriptional regulator (Fragment) OS=Salmonella enterica subsp. enterica serovar Typhimurium var. 
5- OX=1620419 GN=AT998_25380 PE=4 SV=1\nMRNVIIYGINWTNCYALQSIFKQKYPEKCVKTCNSLTALLHSLSDMPDAGLILALNPHEHVYLFHALLTRLQNRKVLVVADRLYYIDRCVLQYFGVMDYVLKDELSCAIRSEREKLRLPEAWLRFCHRPQKKTVAATYAFNAGETPEEVLFNINQYAWWNLPPGVTQAKYALLILLSSGHPAIELAKKFGLGTKTVSIYRKKVMYRLGMDSSPLSLFRGLKLDAHLQRTAFAHNPAVPDDNCALP\n>tr|A0A177BXN8|A0A177BXN8_9PLEO Peptidase C45, acyl-coenzyme A:6-aminopenicillanic acid acyl-transferase OS=Paraphaeosphaeria sporulosa OX=1460663 GN=CC84DRAFT_1169559 PE=4 SV=1\nMDAQKQNLIITKITQAGKPTIVQVTEAGIIGKIGFNSSGVGTLLNAIKVHGVDASRMPVHFGLRAALESNTAREAVQKLESYGMAASAHILISDSSEALGLEFTKSTFAHCKADGKGRIAHANHLLLEHPGEVDTVWLKDSPVRVKTMTNNTEKLSTEPSWEDISRLFEDEHGFPHSICRQGQDGGSTTLFNIVIDLKAKKGVVRLGRPTQAEETVSLEL\n>tr|A0A7R9KXX5|A0A7R9KXX5_9ACAR Hypothetical protein OS=Medioppia subpectinata OX=1979941 GN=OSB1V03_LOCUS10746 PE=3 SV=1\nMSKKPEDIVVSGMSGRFPLSVNTDEFAKNLFSGVDMVTEDDSRWPIGLYDMSGRMGKLDCYKDFDSPFFGLNDQIIAESDPQARLLLEVAYEAMMDAGVNPQELRGTKTGVYVGVSIYSMTDGYPEDGQPDLHESMQTLMVQTLANMKTLYSSRISFANDFKGPCLVVDTACSASLSALTLACNDLLLGNTDYAIVCGTHMDFEPFIFQFQQELGICSPDGMSRVLDAAANGFVKAEAVCCVFLQRRQCARRLYGHILTARMNVDGHKKMGMQRRLYGHILTARMNVDGHKKMGMFFPSSEAQEELMRMTYTDAGIDPKKMTFFEAHATGTKVNYMHSCYN\n>tr|R5P6Y1|R5P6Y1_9BACT Uncharacterized protein OS=Prevotella sp. CAG:1092 OX=1262919 GN=BN465_01592 PE=4 SV=1\nMKQLLFLLIMITGACTFTSCDKSDDTVDPIKENLFNSKYIVNDAGCCVLDGLQPIRAEIINDEVKGYGWKVIGIYKIMDNGKLSQKDYRDMVYGSGYTDYWFKADNNLIGFLHGDVSGKNYINTEWSYDDSKGYIMRYSADLSISERYMQVLYVATLQGKEFYLYTIQKLGYTTIKNDTTKPFYGLVIYQRMTDKELAEIKKEYKLQL\n>tr|A0A1Q2H2K3|A0A1Q2H2K3_9GAMM Acyl_transf_3 domain-containing protein OS=Pseudoalteromonas aliena OX=247523 GN=B0W48_18560 PE=4 SV=1\nMIRINYIDNMKAAGIILVVLGHAAWLNESIYILIYSFHMPLFFFMSGYLASRQHPIKKALIKLNHRLIIPFGFFFFVSFCVWLPLHFFGGGQASNMPWFDPLFRLITAQADSFHINGVLWFFPCLIVISVLQIVIFSKMKLITAFITSAVILSFLLVNVGLIKTRFYWCISIYKFVDTL\n>tr|A0A416WAN5|A0A416WAN5_9FIRM Uncharacterized protein OS=Eubacterium sp. 
AF15-50 OX=2293103 GN=DWW50_03425 PE=4 SV=1\nMTNNEIWENIRHNNMKRDGVNNPIKVDNFVYEIYSLMKERDFSIIESDEIVKSLSGLIENDKKLILREPLKTVEKYNKEG\n>tr|A0A7X1RI95|A0A7X1RI95_STRMT GNAT family N-acetyltransferase OS=Streptococcus mitis OX=28037 GN=GEZ71_00850 PE=4 SV=1\nMELRRPSLADKETVLEMMEEFEKYQSPHDGGFWDTENFSYEEWLESNQNQEMGINLTEGWVPAIQLVAFSVKGKAIGFLNLRLRLSNFLLEEGGHIGYSIRPSERGKGYAKETLRQGLQVAKEKNIKKALVTCSVNNPASRAVILANGGLLEDVRDGVERYWIEVANE\n>tr|Q2VZI8|Q2VZI8_MAGSA Predicted membrane GTPase involved in stress response Membrane GTPase LepA GTPase-translation elongation factor Translation elongation factor EF-1alpha (GTPase) OS=Magnetospirillum magneticum (strain AMB-1 / ATCC 700264) OX=342108 GN=amb4183 PE=4 SV=1\nMELRNIAIIAHVDHGKTTLVDAMLRQSGTFRENQQVAERVMDSNDLEKERGITILAKCTSVEWKGTRINIVDTPGHADFGGEVERILSMVDGVVVLVDAAEGPMPQTKFVTGKALGLGLRPIVVINKVDRGDARPHEVHDECFDLFAALDADDNQLDFPTMFAVGRDGWADDSLDGPRKDLSALFDLIVAHVPPPRRDLEAPFSMLATTLEADPYLGRVLTGRIYSGTAKLNMQVKGLSHDGQLLDSSVSPSCWPSAASSAFRWKAPRRATSSPSPA\n>tr|A0A5M4AG34|A0A5M4AG34_9BACT Uncharacterized protein OS=Prolixibacter sp. 
NT017 OX=2652390 GN=NT017_31240 PE=4 SV=1\nMKTINIFKAVAILFFTFAAFSCNDLFNWGTRDYSTQLEIGVTKGGAALKSATNDPIYYLDNCELITADAIRISIATPDPGGGDPIPIDDMQDKILPLHAVGNGVASDLIMLLPGTYVVTKFEVLQLVDAGNGGTKYETIMATPMQNSAFSGYVNTPLNYEFEVELYQKKRLLMEVLCFEPTDVASFGFVWTGVDVILGDEICLYVSQCTSNGTETWGPADYSATFYTMIDEQNVGEVYASSGTSSEGWICFPLWSGATDYGVGVHIVYDGSVEEDFIITAAEVNQILLDLQQEPVEAGTGYYLYEIPCPVVP\n>tr|A0A1G2MCL2|A0A1G2MCL2_9BACT Uncharacterized protein OS=Candidatus Taylorbacteria bacterium RIFCSPHIGHO2_02_49_25 OX=1802305 GN=A2W52_04225 PE=4 SV=1\nMLEEQTPTQTYPPELKRIKTFQSDVEELIQKQQISKAAIALAESERRVKKEEVSAQPSAPAPAYSAKILTLSGGLPPAAPKWNTSTLLAVVVLVLAVLGMGTGVYFFLKQNAPLQISPPRVNVKSGTAITLNTKESREKIVEKIRSHVQALSVPQNEVRVIPIVLDGKTITTTELLEEIEASVPAALLRALGTEPVLGVHGFRGGQPFLLFSVHSYDHAFDGILSWEPNLLREVGPLFGISVRNILGRVASTTSDILENTLTIKDVIIRNKDARVVLGPGEEKIFLYSFLDKETLVLTTNTDTLQFLIGKAWGGRLR\n>tr|A0A3Q0R773|A0A3Q0R773_AMPCI Interferon regulatory factor 8 OS=Amphilophus citrinellus OX=61819 PE=4 SV=1\nMSNSGGRRLKQWLMEQIQSAQYSGLQWEDESRTMFRIPWKHAGKQDYNQEVDASIFKAWAVFKGKYKEGEKAEPATWKTRLRCALNKSPDFEEVTERSQLDISEPYKVYRIVPEEEQKHGKSPMMAVTATTSSGEITDMDCSPELEELIKEEEGCSIQASPEYWSQGSINAFPLHQDPLPSSSLSSALCQMMISFYYGGKLMHSTLVTHPEGCRISPQQHLGRGALYSSDSMQSVYFPPAELIEFERQRYVTRKLLGHLERGVLVRANQEGIYIKRLCQSRVFWSGLGEVGSQYGSMPGKLDRDAVVKIFDTGRFLQALQLYQEGQIPAPDPTVTLCFGEELNDHNSAKSKLIIVQITAVNCQHLLETMNVRRSQPYCNNPNLEMPDEVVTDQMARIYQDLCSYSGTQRPACYRDNMPITA\n>tr|A0A7L0PVY4|A0A7L0PVY4_9AVES EHD3 protein (Fragment) OS=Mesembrinibis cayennensis OX=1118748 GN=Ehd3 PE=4 
SV=1\nMFSWLGTDDRRRKDPEVFQTVSEGLKKLYKTKLLPLEEHYKFHEFHSPALEDADFDNKPMVLLVGQYSTGKTTFIRYLLEQDFPGMRIGPEPTTDSFIAVMQGDVEGIVPGNALVVDPKKPFRKLNAFGNAFLNRFVCAQLPNPVLESISVIDTPGILSGEKQRISRGYDFAAVLEWFAERVDRIILLFDAHKLDISDEFSEVIKALKNHEDKMRVVLNKADQIETQQLMRVYGALMWSLGKIVNTPEVIRVYIGSFWSHPLLIPDNRKLFEAEEQDLFRDIQSLPRNAALRKLNDLIKRARLAKVHAYIISSLKKEMPSMFGKDNKKKELVNNLGEIYARIEREHQISPGDFPNLRKMQDQLQAQDFSKFQPLKSKLLETVEDMLANDIAQLMVLVRQEESQRPTQMVKGGAFEGTLHGPFGHGYGEGAGEGIDDAEWVVARDKPMYDEIFYTLSPVDGKITGANAKKEMVRSKLPNTVLGKIWKLADIDKDGMLDDEEFALANHLIKVKLEGHELPNELPSHLLPPSKRKITE\n>tr|A0A815YX94|A0A815YX94_9BILA Hypothetical protein OS=Rotaria magnacalcarata OX=392030 GN=KQP761_LOCUS19763 PE=4 SV=1\nNNGTLVAGGNGQGSVLNQLNSPACLFVDRDHSVYVSDYSNNRVMKWVEGAKEGIVVAGGQGGGSALTQLNYPVGIFVDALGTLYVADSRNHRVMRWAQGAKQGTVIVGGNDQGAGANQFNTPIGLSFDRHGNLYVGDWNNHRVQRFSIE\n>tr|A0A2V4LES8|A0A2V4LES8_PSEAC Peptidase OS=Pseudomonas alcaligenes OX=43263 GN=DMO17_00310 PE=4 SV=1\nMRSTTLRRWSFVHTWTSLICTLFLLLLALTGLPLIFHHEIEHLLGEAPQLRELPADSPRLSLQQLVEAAERHRPGEVVQYLGWEEDEPNGVVTIMAATAGTEPNSSHTFMLDARTGEAVEMPAANGGFMMLMLRLHVDLFAGLPGKLLLAFMGILFVVAMVSGVVLYAPFMRKLKFAEVRRDKSTRLRWLDLHNLIGIVTLTWALTVGVTGVISACADLLIEAWRNDTLATMVEPYRDAPPLTERAPADELLRIAGEAVPGMRPDFIAFPGTRFSSAHHYAVFMVGSTHLTSHLWTPVLIDARSLAVTAVGDRPWYMDALAMSQPLHFGDYGGRPMQILWALLDGLTIIVLGSGLYLWWVRRRAPRQALRDEVAA\n>tr|J3LRP0|J3LRP0_ORYBR Uncharacterized protein OS=Oryza brachyantha OX=4533 PE=3 
SV=1\nMRGGGRDDEEAAHKLKSMDVDKLENGANGADTPPRPALKYHGWRAMPFIIGNETFEKLGTLGTSANLLVYLTQVFHMRSVDAATLLNGLNGTTSLAPIIGAFLSDAYLGRYLALAIASVASLIGMFLLTMTAGAEGLHPAECGVGEACEKATSGQFAVLFISFAFLVLGSAGIRPCSMPFGADQFDPHTESGKRGINSFFNWYYFTFTSAMLVSATVIIYVQSNVSWPIGLGIPTALMFLACVLFFLGTRLYVRVTPEGSPFTSIVQVFAAAARKRSLKQPKDPKQDLFDPPHTSAIVTKLAHTDQFRCLDKAAIVAGPDEVRSAGGGGPAPANPWRLCSVQQVEEVKCLIRIVPVWSTGIIYYVAVVQQSTYVVLSALQSDRHLGKSFQIPAASFTVFAMLAQTLWIPIYDRLLAAAPPQGHRQGRGAHAPAAARHRHRALHGGHGDVGHRRGPEAAHRADAADAGDDHHRRRHLRHVQPVDGAAAHGAGPLRGVQPHQPDRVLLQGDPGAHAERRRRAGLLQPRARQLPQRLPRHHRAPDHRLRQQLAGAGPQQGEARPLLLDDRRHWHLQHRLLHDLRQVVQVQGSSQLRSESLFIWVVN\n>tr|A0A177BWM7|A0A177BWM7_9PLEO SEC14 cytosolic factor OS=Paraphaeosphaeria sporulosa OX=1460663 GN=CC84DRAFT_1169075 PE=4 SV=1\nMAATGAKELTLDPKYDDYDYPTTAPTPQNGHPGHTTPEQDAQVHQLRAMLEQAGYTKNLDTLTLLRFLRARKFNVELSKQMFIDCEKWRASYADVGVEELVRTFDYKERPEIFKYYPQYYHKTDKDGRPVYIEQLGNVDLTAMAKITSQERMIQNLVCEYEKMADPRLPACSRKSGYLLETSCSIMDLKGVGIAKATSVYGYLQAVSAISQNYYPERLGKMYVINAPWGFSGVWSVVKRFLDPVTVNKIHILGSGYQKELLAQVPAENLPKLFGGSCDCPGGCELSDAGPWQDDQWVKPPKWAKKAEDKNVIDNTGVPAPTADAPQQPLTGAGPEGVEPAAAPAQNPNTANSA\n>tr|A0A371GLZ4|A0A371GLZ4_MUCPR H(+)-exporting diphosphatase (Fragment) OS=Mucuna pruriens OX=157652 GN=CR513_26426 PE=4 SV=1\nMFPGATLFLFTEYRYLTMFMGVFGALIFLFLGSVKGFSTQSEPCIYNKGNMCKPALASAICSSVAFLLGALTSVLSAFLLVLYIAINLFKLYYGDDWEGLYHCITGYGLGCLSMTLFERVGGGIYTKAADIGADLVGEVEHSIPEDDPCNPANFICTSVFFLQYEILLTPGSPLLIPIPNKCWKQNLGGFYHPPIDQSFLFSLPRHTLDPCYRKLQEPVNSAPTKPGSTALIPVDRIGYCRQHRR\n>tr|A0A5E8VDI2|A0A5E8VDI2_9BRAD ArgE/DapE family deacylase OS=Bradyrhizobium sp. 
LVM 105 OX=2341115 GN=D6B98_18630 PE=4 SV=1\nMNAETQQRILDAVDAGFEAQLATTRDFVAIPSTRGAEGPCQDMIGDLLRERGYEVDDWHIDVDDLKDLRGFGPIEHDFSKARSVVGTYRPQTNDGKSLILQGHCDVVPAGPLELWDTPPFSPVIKDGKMFGRGACDMKSGTIGALYALDAIKAAGFKPTARIHFQSVIEEESTGVGALSTLQRGYRADACFIPEPTGGKMVRSQVGVIWFRLRVKGHPTHVAFAGSGANAIMAAYHLIQALQKLEIEWNERAKADRHFKTLNHPINFNPGIIKGGDWASSVPAWCDVDCRIAVLPGWSIADHQKEIMACVAAAARNHRFLANNPPEIEWSGFLSEGYELTDAAAPEAAFAKAFGKVYGGVPEDLVFTALTDTRFYGLNHGIPSLCFGASGGEMHGFNEFVDLESLKKTTKAMALFIAEWCGLEKA\n>tr|A0A498CZE4|A0A498CZE4_9GAMM Uncharacterized protein OS=Acinetobacter cumulans OX=2136182 GN=D9K80_11310 PE=4 SV=1\nMGVAIDLTNTERRVSTAEFAMRMNVSEKELYDRIRDGRIKAPAKDGRKNYWLNSYVLECITGVEDGASLLV\n>tr|A0A853LVH8|A0A853LVH8_9MYCO Acyl-CoA dehydrogenase OS=Mycobacterium colombiense OX=339268 GN=A5628_13360 PE=4 SV=1\nMLLELDDDQRLWRETVRGALTKQCPPSLVRAIAEGGADGGDLWQWYIEQGWTELTSAESLVELTLLLEELGRASDPTPFLATTTQFAPLVGDRVPQDGAGAAVYSGVTACRDRGGWVLEGAARYVLDADRADQLAVVTPAGVFVVEAKAASSRRVAAIDPVLHLADLRFNEVHVSDAHRIASDTERAWHIALTGMAITIVGACQRIVDMVLEHLKQRYQFGVPIGSFQALQHKAADMHVAIERARALAYLSALTIVADDPRRRLFAAMAKAAAGEAQSLVVQHGLQCFGAMGFTWENDLQFAIKRAKAGELMLGDAAEHRALIAREYRAADF\n>tr|A0A3B3U8V4|A0A3B3U8V4_9TELE DENN domain containing 3 OS=Poecilia latipinna OX=48699 PE=4 
SV=1\nMAELPSGLLEACVVVGAPSDKLRELPQHTKSSELPLLDPEVLQVHAPPFVSIEANSNHVIGPAFSRVQRRRSFIKKKRRDRAAEGVSNGDSSSRHEASPVPATEDISVPKDLDLIALPQLCFPDGLQLASEQKDDAYHFLVFTDLFGNRTHGVVVHYYRAVQSFQDSVFQNGHRWNAPKSRLFAPFAVCIISKFPYYNALKDCLSCLLVQLRTVRQADLEETIREFSAKLSLVPLPPPGQLHVSFSLRPLQVVLPSRDDQDSPVVDLNLHLPLLCFTHTALLQVLSCLLQEQRIVFFSSDWARLTLVAESLLLYLQPLSWQQPYVPVLARGMLDFLMAPTAFLMGCHINHFEEIAAETEDLILVNVDDGFIQTSWSEAVDLPALPLAAAECFISRAESLQLQYDLELCHLGTGTDVNTLRSQRRGWQQKLNSQIQNIALELVVNIFRGVQDFLNHEHRVFNSEEFLRTREPDDQLFYRKVLETHIFHSFLRDRLNRKRDSFSRMEQMTQSHAHRNRAMTESPRRPPMSELSRAGPDRKLSKRLGASLPNLDQPINESVPLNANRLLSIRKISPDSGLKFLQKPLKVFRLPEFPPPLAYHYVQNYYSDMVASLGKAINATPPDESALLARYHYLRGLVNTVSNRRLDALEDFHSLYKTDAGIFPSQMVNSLIDSLPDVERVQADRRPEIKRLISRLKREQERERATQGTGQEDAAVKRFQLPKKYMHLEEFVKCVQESGIVKDQGTIHRLFDALTVGHQKQVGPDLFRVFYTIWKETEAEAQEVCLPASVLEHIDAAECVFKLSSSVKTSRGVGKIAMTQRRLFLLTDGRPGYVEVAQYRDLEEVRVSSAPFLVLRIPSLKIRVHGRKETFEANLKTETELWNLMIKEMWAGRSIADRHKDPQYMQQALTNALLMDAVVGSLQSSKAIYAASKLAYFDRMSLEAQMMVPSTTSETLKHKINPSVEFAVPQAVDVLLYTPGQLWVSVGGGKVMVYDASSWSLIQTCQVGNARLNCMLGVDRDQVWMGSEDCVIYIISLVSMVCNRQLTEHRAEVTGLALDNEKYCHKVAYSCSAEGTVMAWEVSTLQVKRHFRLSCDRLQSVYSCGGVLWCCARDGIMEVWRNGTLKQHINLPEQQRVTFSSALLITESEELWSVCVDSAEVYIWHIKNTSRPINRVMLQDCIGCYCMIQVKNQVWVGGMGRSSTKGKIYILDTERYEVLKELHGHIDKVTALCSAEDRYVLSGAAKHDGKVAIWKVEDRGLDSSKC\n>tr|A0A6P9APX4|A0A6P9APX4_PANGU pentraxin fusion protein-like OS=Pantherophis guttatus OX=94885 GN=LOC117655567 PE=4 SV=1\nMVEASIIPVGDPNVAVGKLSSQSSTFEEKGESRKAIDGSLANIYTNGDCTLTKKDFEPWWMVDLISAFQVSAVVITNRGDCCESRIQGAEILIGDLPQKGGTMNPRCATINSMERGETMSFNCAGMQGQYVTITIPGRYEYLTVCEVQVLAYPWLRIVHGGRSPVLDSDTDSGLQGRVLSFPNESKDSFVIISPMQPFNLMEFTLCMRIAVEYLDEHEIILFSYHSQRDELRVLREAMGHFGLHMGGRSVRFALPDLSPLGSHICVTWESVFGLTAFWMNGKSSIRKVHNMGHILQAGGTAMLGQDQGAQNMSDQQKPHFVGEITDLYMWDYVLKSHDIQKVFQAHEFPRGNIFDWKILSYKIRGNVMVLPKG\n>tr|A0A087WPU9|A0A087WPU9_MOUSE La-related protein 4B (Fragment) OS=Mus musculus OX=10090 GN=Larp4b PE=4 SV=6\nMTSDQDAKVVAEPQAQRVQEGKDSSHLMNGPISQTT\n>tr|A0A4Q7AXS9|A0A4Q7AXS9_9GAMM Efflux pump membrane transporter 
OS=Acinetobacter bouvetii OX=202951 GN=EXE25_14110 PE=3 SV=1\nMSQFFIRRPIFAWVIALFIILLGVLSIPKLPIARFPSVAPPQISITAIYPGATPKTLNDSVVTLIEREMSGVKNLLYYSSSSDSSGTATITATFKPGTDVELAQVDVQNKIKAIESRLPQTVRQQGLMVDAASSGFLMMVGLSSPNGKYSEIDVSDYMTRYVIEELKRVEGVGKVQNFGAEKAMRIWVDPDRLISYGLSIKDVNTAIQNQNLPISPGRIGDVPALTGQQITIPLTAQGQLETVEQFKNISLRAQQNGANVRLSDVARVEIGAQMYNFAILENGKASTAVAIQMSPGANAVKTAEGVKAKIEQLSPALPDGMKFSIPYDTAPFVKVSIQKVIATLLEAMVLVFIVMFIFLHNVRYTLIPAIVAPIALLGTFSVMLLAGFSINVLTMFGMVLAIGIIVDDAIVVIENVERIMATEGLSPVEATSKAMKEITNPIIGITLVLAAVFLPMALAAGSVGIIYRQFTITMSVSILFSAFLALTLTPALCATMLKPIDLNHKKKGIFAWFDRSFEKLNNRYERSLFKVIQHKTIAMLCFLSIVIVLIFSFKQVPTAFMPEEDQGWFMTSIQLPADATQERTRKVVAEFQNHLDQETGIKDNMAVLGFGFSGSGQNTAMYFTNLLPFEERTITAQEVVNNANMAMAESSEGQTMSVLPPAIDELGNSSGFSLRLLDRGNIGMPALREAQDQLLALAAQSKLVADVYPEGLPDGSSVQLKIDRDKLQALGVNFSDVTDIISTSMGSMYINDFPNQDRMQQVIVQLDAKSRMSIEDILQIKVNSQSGKLVSMSEIITPIWQHSPQQYNRYNGRPSLSITGSPAAGMSSGQAMSEMENLIKQLPKGVGYEWTGISLEEKQSESQTLFLLLLSMLVVFLVLAALYESWSIPLSVMLVVPLGLIGAFLAVMLRGMPNDIFFKVGMITIIGLSAKNAILIVEFAKALRVEGMGLVEATVAAAKLRLRPILMTSLAFTCGVIPLVIASGASSETQKAIGTGVFGGMISATVLAVIFVPIFFIVVMSTVEKFSKRKAAH\n>tr|M6TB98|M6TB98_LEPIR Transposase DDE domain protein OS=Leptospira interrogans serovar Bataviae str. 
HAI135 OX=1085538 GN=LEP1GSC170_1474 PE=4 SV=1\nMKNKLMPLVDKILLRKRAIIESVNDELKNICQIQHTRHRSFCNWAVNLLSGLVAYSFFPKKPSLNLRSKDNLQLLISP\n>tr|A0A2D0KA88|A0A2D0KA88_9GAMM Adenosine deaminase OS=Xenorhabdus ishibashii OX=1034471 GN=add PE=3 SV=1\nMIDIQLPLTDLHRHLDGNIRPETILDLARQHNIPLPAYELEALRPHVQIIENEPNLVSFLQKLDWGVTVLADLEACRRVAVENVEDAVNAGLDYAELRFSPYYMAMKHQLPVEGVVEAVIDGIHSASQQHDIQIRLIGILSRTFGEQACTEELAGLLAHKQHITALDLAGDELGFPGHLFEQHFIRARDAGWNISVHAGEAAGAESIWHAIRELGATRIGHGVKAITDPTLMDYLAKNGIGIESCLTSNLQTSTVSSLPAHPLKQFLEHGILASINTDDPAVEGVEIRHEYTVAAPAAGLSPAQIRQAQINGLATAFLSEAEKQALKTKVANR\n>tr|A0A2K6SAF3|A0A2K6SAF3_SAIBB 35 kDa nucleoporin OS=Saimiri boliviensis boliviensis OX=39432 GN=NUP35 PE=3 SV=1\nIQPPLSGFNMFSPASIGQPRKTTLSPAQLDPFYTQGDSLTSEDHLDDSWVTVFGFPQASASYILLQFAQYGNILKHVMSNTGNWMHIRYQSKLQARKALSKDGRIFGESIMIGVKPCIDKSVMESNDRCALSSPSLTFTPPIKTLGTPTQPGSTPRISTMRPLATAYKASTSDYQVISDRQTPKKDESLVSKAMEYMFGW\n>tr|A0A0D6JIV9|A0A0D6JIV9_9HYPH Probable membrane transporter protein OS=Candidatus Filomicrobium marinum OX=1608628 GN=YBN1229_v1_3342 PE=3 SV=1\nMGRESVGDVGFMDIGMTWAGFSMLAFSLLAAGVIVGFLSGLLGIGGGGILVPVLYETFAALGVDPAIRMHMAIGTSLAVIIPTSLRALMAHSAKGVVDWVAVRRIGPWIVIGVVLGIMFADQVTGTTLKWVWVVFGTLFAAKMAFGRDTWRLGHDLPALPKLEIFSVLVGIISVLMSIGGAAFIVTFLTLYGRPILTAVATSSAIGPLIAIPGAIGMMWAGWGHPGLPPLSLGFVSLLGAALIVPSSVLVAPVGVRLAHGVSRRKLELAFAVFLVVIVLRFLSSLILE\n>tr|A0A353GX24|A0A353GX24_9FIRM Aspartokinase OS=Firmicutes bacterium OX=1879010 GN=DDW50_18565 PE=3 SV=1\nMKVIVQKFGGTSVATREGRENVASKVKEALGKGLGVVVVVSAMGRNGDPYATDTLIGLARGVLKYIKPRELDLLMSCGENISTVVMVQTLKAHGIEASAFTGGQAGIITDHHFNNARIIEIKPDNLWKCLEEGKVAVVAGFQGVTKDGEITTLGRGGSDTSGSALGVALHAELVEIYTDVDGIMTADPRLVPQAKPLPVMTYNEVCEMAHLGAKVVHPRAVEIAMEGRIPLRIRSTFSNNLGTLISDGTSIGDIEIRNGKVVTGLAQIAEMALVKIISKVDLNQNGAVLKIFQVLAGAGISVDMIQVAPLNIAFIIKEDLVDKAKEALSPLGLELLVEKGYAKVAIVGSGMRGIPGVMARMVKGLQKEHIAIYHSTDSHTNIACLVKQEDMCGALQALHDEFELAE\n>tr|A0A1N6LEK7|A0A1N6LEK7_9BURK Amino acid/amide ABC transporter substrate-binding protein, HAAT family OS=Paraburkholderia phenazinium OX=60549 
GN=SAMN05444165_6866 PE=4 SV=1\nMAAKWGRVVAAALAAMVMTAAYAAGETGVPSSSAAPGGKPIQLALIEGMSGPFANAGAAVERNLRFGVEAVNAHGGVKLADGAHPLELVVLDSKGSPEEALLQLRAAADRHIGYVLQGNSSAVAAALIGAIDKQNSREPDNRELFLNYSADDPALTNAACSFWHFRFDAHAGMRMDALADVIQHDPSVRKVYLLNQDYSFGHDVSALARSALAAKRPDIAIVGDEFHPIGRVKDFAPYIAKIRASGADAVVTGNWGNDLTLLVKAAREQGLDTKFYTFYGNSLGAPAALGDAGVKRVIAVADWHPNAGGAASDAWYKAFRARYPAAQDDYPVLRMELMVEMLAAAMNKAGSAEPEAVAKALEGMKFDNGFHPSWMRAEDHQMIQPLYVMEMDKAGTPGVRFDNEGSGYGFRTVLALPPGRTVAPATCRMTRP\n>tr|A0A850WM95|A0A850WM95_FREMA SIM1 protein (Fragment) OS=Fregata magnificens OX=37042 GN=Sim1_1 PE=4 SV=1\nKEKSKNAARTRREKENSEFYELAKLLPLPSAITSQLDKASIIRLTTSYLKMR\n>tr|A0A482IAK4|A0A482IAK4_9DIPT Cytochrome c oxidase subunit 1 (Fragment) OS=Tipulidae sp. BIOUG26266-C02 OX=2544765 GN=COI PE=3 SV=1\nFIMIFFMVMPIMIGGFGNWLVPLMLGAPDMAFPRMNNMSFWMLPPSLTLLLASSMVENGAGTGWTVYPPLSAGIAHTGASVDLAIFSLHLAGISSILGAVNFITTVINMRSSGITLDRMPLFVWSVVITAILLLLSLPVLAGAITMLLTDRNLNTSFFDP\n>tr|A0A2A8TFK0|A0A2A8TFK0_9BACI Transition state regulator Abh OS=Bacillus sp. AFS017274 OX=2033488 GN=CN380_26055 PE=4 SV=1\nMKSTGIVRKVDELGRVVIPIELRRTLGINEKDALEIYVEQERIILQKYKPNMTCQVTGEVSDDNMKLADGKLILSPEGAELLIKEIQASMEPAK\n>tr|A0A531KVX5|A0A531KVX5_9HYPH M20 family metallopeptidase (Fragment) OS=Mesorhizobium sp. 
OX=1871066 GN=E5X43_21305 PE=4 SV=1\nMDTVPIDRWESDPFSGEQRDGRIYGRGSCDTKGSLAAMLIALSSLGERQPRATVVLAASIDEEYRKLGARAIADSGVTYEGAVVGEPTELELVVAHMGSVRWQIEVQGVPAHTSKPHLGVNAITGMAKVVLALDEHHRSLVSRAQHPLVGSAQLTVSLIEGGLELTTVPPVCRIWVDRRLIPGEQPQDALAEVESILEGLRQGEDKINVRSLLPALEDPPPISSESSRIAAVAAAACAHVAGTGEQKGATGGSDANQLSLAGIPCVIIGPGRTAQAHTNNEFVEIAQLIKAAELYQKIM\n>tr|A0A2D5TAC4|A0A2D5TAC4_9GAMM Uncharacterized protein OS=Gammaproteobacteria bacterium OX=1913989 GN=CMP85_02235 PE=4 SV=1\nMTFDLVTDRNTCPLLDTRSFVMLRTTCRTHYRDDEAWALRTRDVLLRVSTLTPRQTLGLNYLYKYALQFDAPVGSTEWFQNIVNWLDFKSSIRIVHSFMFETRPKLLYSLDFGTLSPGPRMLWQRLWCRYERVYKKHLKKRKSDLFDVVPCKKRRVLCH\n>tr|A0A833PV08|A0A833PV08_BURL3 HTH-type transcriptional regulator NimR OS=Burkholderia lata (strain ATCC 17760 / DSM 23089 / LMG 22485 / NCIMB 9086 / R18194 / 383) OX=482957 GN=nimR_1 PE=4 SV=1\nMTANDYAAGTTFPEHAHGRGQFAFASRGTISVSTPHGRWLVPPQRACWVPAGVRHEMTMTGPVTMLNTFVSGDAAQEAGLPEQCGVYGVSALLRQLIDDAIDLPALYDVDGRAGKLMALLVAEIATMPRLSLHAPLPADARLAKVCRHLLASPSIAADLDQVAADAGVSRRTFTRQFRAQTGVSFAAWRQQVCMLSAIARLSDGQPVTRVALDLGYASASAFTSAFRRILGDTPSRYLEIRR\n>tr|V7PXT1|V7PXT1_9BACT Cupin_2 domain-containing protein OS=Parcubacteria bacterium RAAC4_OD1_1 OX=1394712 GN=O210_OD1C00001G0424 PE=4 SV=1\nMKKGFKENIEKLTEENNNFRKVLYTGASSQLVLMSLLPNEEIGMEIHNENDQFFRFEKGSGKVIIDTTEYEVKDGDAVVVPMGARHNVIAGEEGLKLYTIYSPAHHKDGIVRETKEEAEQNEADFDGQTTE\n>tr|A0A1L8MN76|A0A1L8MN76_9STRE D-alanyl-lipoteichoic acid biosynthesis protein OS=Streptococcus bovimastitidis OX=1856638 GN=A9Q68_01415 PE=4 SV=1\nMNEKRKILMLFIGKTVLFYLIFILLIYIFDYLGHGQSAFIYNEF\n>tr|A0A846M925|A0A846M925_9BACI 2,3-bisphosphoglycerate-independent phosphoglycerate mutase OS=Saccharococcus thermophilus OX=29396 GN=BDD39_000516 PE=4 
SV=1\nMSKKPVALIILDGFALREETYGNAVAQAKKPNFDRYWNEYPHATLTACGEAVGLPEGQMGNSEVGHLNIGAGRIVYQSLTRVNIAIREGEFDRNETFLAAMNHVKEKGTNLHIFGLLSDGGVHSHINHLYALLRLAAKEGVKNVYIHGFLDGRDVGPQTAPKYIKELQQKIKEYGVGEIATLSGRYYSMDRDKRWERVEKAYRAMVYGEGPTYRDPLECIEDSYQHGIYDEFVLPSVIVREDGSPVATIKDEDAIIFYNFRPDRAIQISNTFTNEDFREFDRGPKHPKNLFFVCLTHFSETVKGYVAFKPTNLDNTLGEVLSQHGLRQLRIAETEKYPHVTFFMSGGREEKFPGEDRILINSPKVATYDLKPEMSAYEVTDALLKEIEADKYDAIILNYANPDMVGHSGKLEPTIKAVEAVDECLGKVVDAILAKGGIAIITADHGNADEVLTPDGKPQTAHTTNPVPVIVTKKGIELRKDGILGDLAPTMLDLLGLPQPKEMTGKTLIIKK\n>tr|A0A5C3E0M0|A0A5C3E0M0_9BASI Related to MRPL44 - mitochondrial ribosomal protein, large subunit OS=Ustilago trichophora OX=86804 GN=UTRI_01617 PE=4 SV=1\nMSIAAASLKHITAMSFEFAPLSASQASRSMRLLLARLPTKAPMPGMDLPDISTKTVATDALQKIEITYKNKQKLVLDHVASETRLSDLVKKIEEPARALRLKEEGL\n>tr|A0A812PJQ8|A0A812PJQ8_9DINO GrpE protein OS=Symbiodinium sp. CCMP2592 OX=631055 GN=grpE PE=4 SV=1\nMLDRVSAGPTDCLLGKCLCKDGYCADGDMCKPQVCFAGAEPPRFRPNRWLAFYSGMSDLEQFPEYEELEEEYVQFVLRISPVPLLFLLLGVVVSITTCACLCCGGSGYHFSMDFSDMTHDETKGFVSGTTGNAVIGDEEFARRAWKKRPSCFPMFCAALLIILLCFFGGLTRIVNAAWTEYIIVSSLDRAMDNAADIANASLTINETVTHLHDKLLELPLTCKTDSKAAKQVLYTFVHSALGAIDDYVEQVYFIVETVQPIPDQIGKFKQLTHRAKPFFASLPLAPLWLVAFICIGIVVEATCTTCCRSSSLARCVDVGLKLSALLFGLIVFVVAVLVCVETIVLIALSKFCEDVDHNVLSYVNSTTYNISYIIPEIANYYIRGGDRNPIDEYDTLAMKYINQIQDYYNQAAIGVAGLGMACPAFFDLDVNAIATKARGILGKARELLKGENIYPYYRKVIRAGICNVVISGVGHPS\n>tr|A0A5C6ACY5|A0A5C6ACY5_9BACT Isoleucine--tRNA ligase OS=Rhodopirellula pilleata OX=2714738 GN=ileS PE=3 
SV=1\nMTVPPPKPSSKPSLPSSVDLSSTSSAGGFRAADGSPSFPKLEEEVLAFWDANQIYEQSLARRADAPTFVFYEGPPTANGMPHPGHCLTRAIKDVFPRYKTMRGYRCERKAGWDTHGLPVEVEVGKELGIHSKEEIEAYGVEPFIQKCQQSVWRYMQQWQTLTRRLGFWVDLEKAYVTYHQSYVESVWWSLKNLFDRDLLYQGHKIVWWWAQGGTALSAGEVGQGYREVADPSVYVLFPLIDDNNKKTKRSLVVWTTTPWTLPSNMYAAVKADLDYAVVEDSETGEQLILAEALVETLAGKIKRELRTIETVSGRSLVGMRYVPPFENYRDTLADPVGELKDGGSDSLYWRVVAADFVTTDSGSGLVHLAPAFGEVDHEVLVEERMRFVDGQRPDLLCAVGPDGKFTDDFPSLKGEWVKAADKTLTRDLRERGLLLHLEQYLHDYPFCWRAEEDPLIQYPRESWFIRTTKFRDLMLKNNSKIGWQPEHIQDGRFGNFLESNVDWALSRERYWGTPLPIWVCQSTGRMEAIGSYDELLAKPGVEGTEVWAQAKAENPELVDDLRVHKPYIDAVTYASPFEDGARMKRVTEVIDCWYDSGAMPFAQWGWPHQNHDRFAEQFPADFISEAIDQTRGWFYSQLAISTMLFGEGASIGTDLNTDVPTVSTDAAQDYPHPFRNCIVLGLMLSQWYEAANESGPKTIVLTEEETAEHADLKFTKKTGKMSKSLRNYRSPSEIFDRYGADAMRWYFFANQAPWNSIIYADQAIRDSIPEFLLRLYNTFSFFTIYAEIDGFDPTLAADADDQLSPASLASATTYRDVSQRSEIDRWILSELNRTLEVVVERMDKLDNYNACQAITSLLDGLSNWYVRRSRDRFWGSDKASQDKLDAYWTLYESLVQLTKVIAPFVPFLADKLWQELTRPFGDRVLRSVHLTDYPTADSSRIDASLSESMKVLREIASLGRSARADAKLKVRLPLSKVEVILANDSQIGWLESHDQLVLEELNVKAVEYTTEGGDYVQYNVVPNFKRLGPKVGKNIPLVKKMLGEADGNELLGQLQTSGKVTLAMPDGPLELDNEDIEVRLKAREGWAAAQGTSCVVVLNTEVTDALRREGIAKDLIRAIQSQRKEMKCEYTDRIEVAIVSDDADTEAAIAAHREMICEETLAIRLADQPLQAIDATSIENGQLFVAKVPGE\n>tr|A0A165E1C3|A0A165E1C3_EXIGL Uncharacterized protein OS=Exidia glandulosa HHB12029 OX=1314781 GN=EXIGLDRAFT_725429 PE=4 SV=1\nMSAPAAQDDADAMDVDATPTPKPARAPRRRRGRPQPPHVQTPRSATAPTTDAHVPFPTSAGPPSPTKSPTKQRSMPDHAFRRPSSPTKTRSSWFDASDTDLTSLGRSTSPTKSGSWASSRSSRSSSPSKSSRSSARPPSPTSLPWAEGRIPPSPSKTSLSSGPDSPQKVRNRPPSLRLHDNPDGIDPSTIVGKVLKRVHRGAAHPNLTLVFADDSVVQVKIEGYHPNARGLSKELEMDSSLDDFLASSAASTVDLLILDCALVRLTDKAFERSDSDASNDSRWSQDHLGLAFKFEGMPHRWYSVWATMQDFDDDGICRFRSYDDVFLSPVAQTPRRPRHARKNSKQIV\n>tr|A0A7C1SJJ1|A0A7C1SJJ1_9SPIR ZIP family metal transporter (Fragment) OS=Spirochaetales bacterium OX=2026792 GN=ENI06_01135 PE=4 
SV=1\nMIFTWFTNQHPILQALLATIFTWLVTALGSAMVFFFKEVKRKVLDSMLGFAAGVMIAASFWSLLAPAIAMAEESGAIPWIPALVGFLMGGLSLRLIDIFLPHLHLGLPMEQAEGVKTSWHRSVLLVLAITLHNIPEGLAVGVAFGALYHNLPGASLAGAIALALGIGIQNFPEGAAVSIPLRREGLSVSKSFWFGQLSGLVEPVAGVLGALAVVVMKPILPYALSFAAGAMIFVVVEELIPEAQMEKNTDIATMGAMLGFAVMMTLDVALG\n>tr|A0A2M6W0D3|A0A2M6W0D3_9BACT Uncharacterized protein OS=Candidatus Magasanikbacteria bacterium CG10_big_fil_rev_8_21_14_0_10_43_6 OX=1974650 GN=COU33_04145 PE=4 SV=1\nMNVFRVWRKIQNTSNSEKTVLIIGDIKNKIKGLGGDYLSPIVFFLQKSGKLLFLANFVIMRV\n>tr|A0A0K2J648|A0A0K2J648_PORGN RND family efflux transporter, MFP subunit OS=Porphyromonas gingivalis AJW4 OX=1403336 GN=PGJ_00014360 PE=3 SV=1\nMQLSGYRVVWLPFIFLMALSVVGCNGGKKKTADTSSGEDMELFTSGGDTIDVQIAELKLGPFDRQIVSHGKLRARETAVLQFEDSRQPLHRLYVRNGQHVVQGQKIAAVDDRTALLEVQKSEDEFKQRELDLQDVLVGMGYSPHDKSDIPADKLALACIKSGYNIAESNYKQAQLRLKHVCLTAPISGVVADLHAQEHTIPESGKPLCRIIGDNGFEVVFEVLESELSAIRTGERVEIRPVALRDVTAEGVLQEINPSVDDRGMVQVSAGLRNPSKNLFDGMNVEVRINQRMEERMVIPKSAVVLRSDKPVVFSVRNGTAAWNYVDIEAENAESYCIVSKTLKPGEMIVVDGNANLAHKTPVALRR\n>tr|A0A2G5ISA1|A0A2G5ISA1_9ACTN Uncharacterized protein OS=Streptomyces sp. 
HG99 OX=1958787 GN=B1C81_17685 PE=4 SV=1\nMTTPPPQGQNPFAQGQQPYGQPPQGQNPYGQQPGQPGFPQQGAPYDPVPPQRPKRGIKQYLRIAVIVFAVIAAGVGWIASRDDANTAKVGDCMSISNPESTTDPGLEVVDCSSSKAKYKVEEKKSDNSGCDRTKYSEYTETGKNDFTLCLSEYSAK\n>tr|B9YBS2|B9YBS2_9FIRM Resolvase, N-terminal domain protein OS=Holdemania filiformis DSM 12042 OX=545696 GN=HOLDEFILI_03279 PE=4 SV=1\nMDAQEVMHMTDYSKITALYSRLSVGDEDRDGGESNSIQNQKIFLENYARGQHLTNIRHYIDDDESGRFFDRSAYSRMMDDVENGKIGVCIMKDLTRWGRDYLQVGNAMEIFRRNNVRFIAVNNGIDSEKPDTLEFAPFINIMSEWYAKDISKKVKTGIKTKGMSGKPIVTEAPYGYVKDPDNKDFWIIDEEAAEVVRLIFRLFIGGKNRNQIAVHLKNEQIPTPTFYMKDRGRGTCKNKTLNEDNRCKWNKATLTNILTRQEYCGDVVNFKTTKHFRDKHNHYVDRSQWHITENVHEPIISRSDFETVQRILENAPVKRPNGDGEIHPLSGLLFCKDCGAKMHIRIDYRNGGKRHVAFCSEYHKGKAKNPKCHSPHIMDADLLMQTIAEVLKKIEDYSISNRAEFEALVKKNLAMQQTDQTKKQQKRIPQITTRLEQIDKVLNKLYEDNALGTIPQDRYEQMSQKYSEEYYALKAELATLQEQLSAYENAGGRAQKFLKLTERHAAFTDLTPAILNEFISRIEVHERDQKRARYAIQHISIYFNYIGKFENEVTQLAEPTEQEIRQMREEIEEAKKEKSRAYHRQYSREYRARNLEKQREYDRMKAREYRARRKAQAAAQPAQ\n>tr|A0A317E7E7|A0A317E7E7_9PROT XdhC /CoxI family-like protein OS=Zavarzinia compransoris OX=1264899 GN=DKG75_13590 PE=4 SV=1\nMIEPDLFAKVYDLQEAETPFVLATVVRTVSVTAAKAGAKAVILADGTVAAGWIGGGCARGATLKAAQDSLADGQPRLISVQPDDQMEEQGLLNGETRDGVRYAHNHCPSRGTMDIFVDPVLPRPELLVMGTSPVARVLVALAGEFGFRVMAAAPAAAHGQLSLADRLIDGFVPPPANGLRYVVVATQGADDFAALSAAVALDVPYIAFVGSRRKAESLRGDLLDAGVPAARLAALKAPAGFDLGAVTPEEIALSILAEAVAVRRRGIASPAP\n>tr|J9VWE8|J9VWE8_CRYNH Pre-rRNA-processing protein TSR4 OS=Cryptococcus neoformans var. 
grubii serotype A (strain H99 / ATCC 208821 / CBS 10515 / FGSC 9487) OX=235443 GN=CNAG_06340 PE=4 SV=1\nMSPSSPAGSSSSSLCYTNTLLALPDGPIPSSHRDLISHTTSFIGGYPTFPALPSSSCSTKKVGNTPSEINCGICHKPIPLLAQVYCPPEDGENDRTIYVFACPRVGCQKREGSIRAWRASVRNEEYVRDVEEKRKAAEKAAQEERERARKNPFTVDEAARLNGSALFGTASPLFGGAAHNPFAPPNPVPAMATLSVSDDRPAPTPITSGPSRTFTPPIPAYHPVQYLSTIEEYIPPVDDDVSVASSDDDESPEQKAEWREEGWEKVLPRNVDEVFENFVRRLDQADGGKKQVLRYELGGMPLPYSSASPLTRKLFPGCEKPLAKDEELDLSALYTPKFIPTCPRCGGKRVFELQLVPSLINILRPHTISTTGEAPKASFPKAATEEERKKELAKLAAGVKEEASKDEEGEMEWGNVLVYGCERDCVGVGEEWVGVEWEATLEL\n>tr|A0A2T0PRW1|A0A2T0PRW1_9PSED Flavin reductase (DIM6/NTAB) family NADH-FMN oxidoreductase RutF OS=Pseudomonas sp. NFACC11-2 OX=1566246 GN=OE22_101713 PE=4 SV=1\nMSSLCDTAFDTRAFRRALGNFATGVTVVTAATEDGRKVGVTANSFNSVSLDPPLILWSIDKRSSSHEVFEAASHFAVNVLAADQIDLSNNFARPKEDRFAAIQFETGEGGAPVFVDCSARFHCEKFQQVDGGDHWIMIGKVVAFDDFGRSPLLYHQGAYSMVLPHTRMTKREEGQSPSSHFQGRLSHNLYYLMTQALRAYQASYQPRQLCTGLRTSEARMLMVLENDAGLNLCDLQREVAMPVREIEEAVANLKRKGLVSDEGERVRLTAKGIDETEGLWAIAKEQQDKVFGQFSEEQVEHFKQVLKGVIRGA\n>tr|A0A7H5EXY5|A0A7H5EXY5_9BACT Rhomboid family intramembrane serine protease OS=Lewinella sp. W8 OX=2528208 GN=E1J53_0011935 PE=4 SV=1\nMFFPIGDDQVHRGFTPFFSYGFIALNVMIFFYQSSLGEAGAEFIYNYGSIPLEFERGEDYHTLITSIFLHGSWMHLIGNMLYMWIFADNIEASIGNVPFLIFYFLGGLAASLCHIYFNAGSQIPAVGASGALSAVMGAYIVMFPKSNIRGYLLFFRINVAAWVFLGFWFFQQSQAGYASLGDTSGGIAWWAHIGGFVFGVLCGFFFRQRYGVPELDRGRDRYA\n>tr|A0A1A3D3H4|A0A1A3D3H4_9MYCO Uncharacterized protein OS=Mycobacterium sp. 
1245805.9 OX=1856862 GN=A9X00_01450 PE=3 SV=1\nMVQCASEISWDPADTDGLSEDWLDRLLDAVDGNTVVRTPVGMLFAGVSQIERLLAHPALKVPVVEQYELMGVSEAILERARRVILGLDGAPHTRLRRLVSRAFTQRAVERLAETMRSYLVPRLDDVDGEVDFIDEIVGDYPAAIIGGLLGLPAADLPHLTSIAQVITSSQFSLDVDRAHQYLAAAAECDAYLADLVTSKRKAPGDDILTHLTQVGVEGDSLSDAEIVSLCASLMNAGIDTTRNQISLGMTLFARLPEQWNRLRDESVLVGNAVEEILRFLPVTPLLTRLNTEALTFDGVDVPERTYISLGVAAANRDSTLNTGDALTFDVSRPNPRHFTFGHGAHFCVGAALARLEMRELLTQMVSRFVSVEVVGQAPRRSAMGVYGVKNLTLRLDRQRQNAS\n>tr|A0A2P8DYT4|A0A2P8DYT4_9BACT Uncharacterized protein OS=Cecembia rubra OX=1485585 GN=CLV48_110110 PE=4 SV=1\nMRTLLSIFAISIFISSCVQQGVDKEAQRIVDQSIKAHGGALYQEALISFDFRERHYSIFKSPSKYEYIREFTDSTGFVRDVLNNDGFQRTVNDTPVDLPEDRIRAFSNSVNSVAYFAFLPYGLNDAAVIKTYLGETELEGNSYHIVKVTFRQEGGGEDYDDEFLYWFHKEKYTMDYMAYSYHTDGGGVRFRKAIKQHQVNGLLLLDFENYKPEEKNTSVDKMEGLYKEGKLELLSEIRMENIKVSF\n>tr|A0A1U9N7G6|A0A1U9N7G6_9GAMM Muramidase FlgJ OS=Cellvibrio sp. PSBB023 OX=1945512 GN=B0D95_04590 PE=3 SV=1\nMQSIDTGIKVPQVQDNYFDPNSLNSIKAMGRDRDPQAIKEVAKKFEGLLVQQMLKSMREANDVFGEGSFLDSQTTRFHRDMLDQQMVLDLTSGPGIGLADHFYRQMMQNYGSTMRPEGGVKNTDSSALGEITPRTANKTSVAEQASVDALDDWIQDFMRMSDNVQMQALGDGDEQQVPAVPAINYALIPQLLSKQAIGTVRGGQKSSISPTQENFVMMLKPHAERAAAELQISPDVLIAQVALETGWGKHVIHDRSGNNSFNLFNIKAGGQWQGEKVNVNTLEYRNGIAAQEKSDFRKYNDYSESFSDYVRLMKNNPRYEKVLATGTNSSAYADALQSAGYATDPHYAKKIKSLLNSDVIKSLDLASVTENMQADLLQTGAQAILSLAASASRHIVE\n>tr|A0A411GH85|A0A411GH85_ENTCL ABC transporter ATP-binding protein OS=Enterobacter cloacae OX=550 GN=sapD PE=4 SV=1\nMPLLDIRNLTIEFKTGEGWVKAVDRISITLAEGEIRGLVGESGSGKSLIAKAICGVAKDNWRVTADRMRFDDIDLLRLSPRERRKLVGHNVSMIFQEPQSCLDPSERVGKQLMQNIPGWTYKGRWWQRVGWRKRRAIELLHRVGIKDHKDAMRSFPYELTDGECQKVMIAIALANQPRLLIADEPTNAMEPTTQAQIFRLLSRLNQNNNTTILLISHDLQMLSKWADKIDVMYCGQTVETAPSEDLIGAPHHPYTQALIRAIPDFGSAMPHKSRLNTLPGAIPLLESLPIGCRLGPRCPYAQRKCIETPRLTGAKNHLYACHFPLNMERE\n>tr|A0A7X8MBI3|A0A7X8MBI3_9BACT Type II toxin-antitoxin system HicB family antitoxin OS=bacterium OX=1869227 GN=GX408_15355 PE=4 
SV=1\nMRTLKYTYWQDGNFYLGYLIDYPDYQTQAKSKEELIENLKDLLHDIESGDIPFIRKIEELVLA\n>tr|A0A1V3S1A0|A0A1V3S1A0_9PSED Alkyl hydroperoxide reductase C OS=Pseudomonas sp. A25(2017) OX=1945865 GN=B0E42_23545 PE=3 SV=1\nMPIINSQVKPFNATAFKNGEFVPVSDADLKGKWSVVFFYPADFTFVCPTELEDLADNYAEFKKLGVEIYSVSTDTHFAHAAWHNTSPAIGKIQYTMIGDPTHVISRNFDVLIEEVGLADRGTFVINPEGQIKIVEINDGGVGRDASELLRKIKAAQYVAAHPGEVCPAKWKEGEATLAPSLDLVGKI\n>tr|A0A2V9NH91|A0A2V9NH91_9BACT Uncharacterized protein OS=Acidobacteria bacterium OX=1978231 GN=DMG98_20865 PE=4 SV=1\nMNDEETIMKHKLTTALLLALCVPIASATTWYVNGVSGSNSNNCKSPTTACKTIGHAISLAVSGDSIIVAHAIYAENLAIGKNLTILGSGAATTIIDGGGTATVVTISNGTHVTLSKMTIRNGNASGVVVIGFMRAISGGGINNSGTLTLTNSTVSGNLAPIPCIHFFVFCEIRGGTAWGAGIYNSGALIISNSIISGNQAGGYCNATCSSFGGGIYNRGTLLMIKNSTLTGNIADTACSTSISCAVGVGGAFYTVGGTVTLNNSTVTANIADRCSGMCGGTGGAIVNGSGNLAVNNSTVSGNYPAGGIFNSGTATLQNSILANNSGRNCRGIITSHGYNLSSDGSCPFSNTGDLNNTNPLLGTLGNYGGSTQTIPLLSGSPAIDSGNPNGCTDGQGHLLKTDQRGKPRPDIEDTAGCDRGAFERQSD\n>tr|A0A7D3VXP3|A0A7D3VXP3_9ACTN TPR repeat protein, SEL1 subfamily OS=Actinomadura verrucosospora OX=46165 GN=ACTIVE_7586 PE=4 SV=1\nMPVRPWSPEDLGRPTDGTWADVAFGLGEIYECEGDLGQAADWFRRAAESGHAAAALRLGAVLGRMADDGADGSAEDLLAEATRWLSGAQDIATPDAIELITDMLNRHQRQAARRGLEPAVATG\n>tr|A0A370P2G6|A0A370P2G6_9BURK ABC transporter permease OS=Cupriavidus lacunae OX=2666307 GN=DN412_03430 PE=4 SV=1\nMKSIRLGHAVATVCVVQLLAASPYAVAQGKGSYSQDTVKIGVLTDMSGIFADLGGKGSVTAAQMAIDDFREQNTPPFKIELLQANHQNKADIGASRAREWFDVENVDMITDVINSGVALAVAKVAQNKNKMVMVTGSGTARLHDEDCNPNTIHYGWDARTFANAHVRAQTEQRRKSWFFLSVDYALGRSLEQDATAAIMANGGTVAGSVRHPLSAPDFSSYMLQAQSSKAQVVGIANAGADLVNAVKAANEYGVTRTKSLAGLAATITDVHAMGIDATQGMVVVEDFYWDLNDRTRAWSRRFFDKQKRMPNFVQAATYSAVLTYLKSVLAARSDDSNVVLKQMKQLTINDVFANNGKIRDDNKMVHDVYVMEVKKPQESKAPWDYYRVRRTVAGSDASQPLSASKCPMVKKGI\n>tr|A0A1A8TK33|A0A1A8TK33_9GAMM Peptidyl-tRNA hydrolase OS=Marinomonas spartinae OX=1792290 GN=pth PE=3 
SV=1\nMTGFKLLVGLGNPGSEYENTRHNAGAQWIEALARQSQCSLRTEKKFFGQFGKVSIAGEECYLLIPTTYMNLSGKAVQAVCQFYKIPPEQILVIHDELDIPPGTAKLKKGGGHGGHNGLKDIIARLSNNREFGRLRIGIGHPGHASQVANYVLKKASQDEYRKIEQTIDESLRYIDDIVGGNLNTVMNQLHSFKA\n>tr|A0A373QD60|A0A373QD60_9FIRM Uncharacterized protein OS=Firmicutes bacterium AM55-24TS OX=2292896 GN=DXA10_01295 PE=4 SV=1\nMEEFFNRTDKKYKIIMLCVIVCIIIVAYIGSQLHDDNHLIVGRWEEVGDCWMDELEFFSDGTYSSDKDNYFGSYTIEDGRIRLGGVLMSDLVYSYKLDGDTLILYKKDIDDGDEYRRVK\n>tr|A0A7K2JSV5|A0A7K2JSV5_9ACTN DUF2470 domain-containing protein OS=Streptomyces sp. SID5910 OX=2690312 GN=GTW67_25625 PE=4 SV=1\nQELEAAELDPLATSEAGMLTHFVDDHPELVPLLLRLVRPGPDRGVRRALPVGIDRYGLTLRLELARGHRDVRLPFNRPVRDIDHVGAQIHALLSAARRLSHPGHLLT\n>tr|A0A6N9SLE2|A0A6N9SLE2_9PROT Cell division protein FtsL OS=Ferrovum sp. OX=2609467 GN=ftsL PE=3 SV=1\nMSRSDILLFVCVVVLALGVIHGQQHARRLFIDLQQARDQQVQLQTEGDQLQIEEGTLSASRRVEDRAIRGLKMQLPKSEQKRLVVLGQPGSTP\n"
  },
  {
    "path": "src/alphafold3/test_data/miniature_databases/uniref90__subsampled_1000.fasta",
    "content": ">UniRef90_A0A8C0C0Z5 NADP-retinol dehydrogenase n=1 Tax=Buteo japonicus TaxID=224669 RepID=A0A8C0C0Z5_9AVES\nMATLVPRIVLITGCSSGIGLAVAVRLAQDPQQRFHVIATMRDLRKKEKLEEAAGPALGKTLSIQRLDVCSDSSVAECMENIPGGRVDVLVNNAGVGHVGPVESISVEEMKRIFETNFFGVVRMIKAVLPDMKRRQSGHIVVISSVMGLQGIVFNDVYAASKFAVEGFCESLAVQLLQFNVXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXPAFRTQTNSLYTPLVALKYADPSGDLSVRTYYRLLFNYGTLFHLSMAALRCLTCGCFRRRVTPL\n>UniRef90_UPI001863CDCB tumor necrosis factor receptor superfamily member 19L isoform X1 n=2 Tax=Megalops cyprinoides TaxID=118141 RepID=UPI001863CDCB\nMMRNHLRCSALVLLSLLGLRGALATQCGWGKVLTSEGCVCLQCPVGQEPSKACGQAEGPEEVVRCQACSAGTFSDTYDSDLCRPHTSCAALNRLLMSPGSTERDATCGDCMPGFYSAAKEKSSSPDSCVRLIPRPLVRVLRNVGKGVARGTGRGPANATNVRSAEEKNTEYAVFALVPIFCVMGLLGILICNILKKKGYHCTAEKEGGDEEAPTPQKEGNSGPYIVDDPNEDTISVLVRLITEKKENAAALEELLLEYESKQMSISKASSIKFPVLPHLPHQFRSLPRLCPHQHHLHTINGLAPRAGNGSCCSRCSQKKWPELLLPPIDTHKTTTVGGKNPLPGEVTILSVGRFQVAQIPEQKALPAELTPPESSDTDSVDTSHTEAADEKSLLGVSSLSSSSTWTKSKQEDRKFVIRLGETNLVI\n>UniRef90_UPI00049204AA adenosylmethionine decarboxylase n=1 Tax=Paenibacillus pinihumi TaxID=669462 RepID=UPI00049204AA\nMEYSTFGRHVAVDTWGVDFELLNSAEFLQAQMVEAAESCGATVLSVQAKQFEPQGATVLVLLSESHLSIHTYPEKGFAAMDCYTCGETVDPQMAIDYMLSVLKPKTVHAKKLVRGMGELKVEEPVMQQAELV\n>UniRef90_B8CVZ9 Putative CoA-substrate-specific enzyme activase n=1 Tax=Halothermothrix orenii (strain H 168 / OCM 544 / DSM 9562) TaxID=373903 RepID=B8CVZ9_HALOH\nMGKYYLGVDVGSVSTDMALIDPFGNLIEKIYLRTKGQPIEVIKRGLKKLKENYGSIKVAGVGTTGSGRKLAGVMLGADVIKNEITAHAVAATHLVPDARTVLEIGGQDSKIIILKDGIAVDFAMNTVCAAGTGSFLDQQAARLGISIGEFSRLALKARSPVRIAGRCSVFAESDMIHKQQLGHDLPEIVAGLCEAMVRNYLNNVAKGKDIKPPVVFQGGVAANIGIKKAFEKELHTEIYVPEHNGVMGAIGAALLAMEEVRSRKKETSFKGFEVTEFKFKTTSFECKGCPNRCEIVNINQDGKTIARWGSKCLKWDMTEDKKKEEVNLNPS\n>UniRef90_A0A7R9F0M8 BESS domain-containing protein n=1 Tax=Timema bartmani TaxID=61472 
RepID=A0A7R9F0M8_9NEOP\nMSSRSLVAGGGGSVRQPTPSSGVKLAGEDFNKDKMYEPKHTKRLVRVLTVVAYVFSVSLAAIMLSVYYVFLWNPRDARHPRLPPPTPPTCQPAQVISMYDNYSTEVGMRKEALQRLHLHGRRVVNHLVKTTFNRADWNLNPNLQQPARTTSASSVEDAEEQSAEDEVESQTDLGPNQLTERSKPTQNNQKSPVRNNTCELEFQLSQFMTLHKERQKDDPDKDDRAFFESLLPSLKSLDTDEKLNFRIHQLTLSLVNNRRAVFFTPSSHPAVLI\n>UniRef90_A0A2A9MK67 Ras family protein n=1 Tax=Besnoitia besnoiti TaxID=94643 RepID=A0A2A9MK67_9APIC\nMRDPSCWQFPSHSSSQESEAVAWAPPRGPGQSGAGRFEGEGGEATACSALSPAGCPLPPFSVPSASVSSSASLTPLCYAVRSVPSSPHSLPVPAPPPVPPPVAIAPSSFLSPPRSPSLLPSCPSSSSPPVQSSSPLVSPLHAFSPSWAPDLLSRSPSPAVCRKRTEEFSSVPPSPEWRAESRFPTSHRSLLDSPVCRPAVVAGGGVAAGGFLSEGEGAAPPGGEIGSEEEDDGASVASSSSDASTAFLRILVVGDQGTGKSFLLHSLCHSPDPQSEFQRPCPAHRGRRGLREQVDTRASDAGAADEKSAPRQDGTGSRLEHSGSRAQLRRGTPDRRDAVHGVGVRMDASEQLERDADAPFSSFASVELTEWPRRADAETGGTQAGRIRGLPEDGRPRAEPRASEPCLAESCVSAPSEQSGDSTSVPRSPSLSPSASPVPSPSSSFSFSLPTSFCPASSSRPPAPVAPPRAASSSSPASSSAAPVARAASAEAAAAAQPAACEDASRQRECTCEADEQQCPACRLPGSYEWTCGVRIFHMFWELPPRERGSKDRQRQSSPGSSSSESSADSLSERGRPAASYPLLPESDASCASGAAAARSAGAATRCLVEFWEVGGTEMLESVRSLAYGQEFDGVWVCFDSRSAASFHHAALWTRELCVHLHLPSSLLFPSSGPQAPLSLAPRSYEAAAPSSSLRSFLPAPAVFQSFACSRRVRRWRRHQEHNAAGEARQRSAEGAAHEVQSLTSFFQMLPTSTVGKVTRAAASAVVRLGSTVASPVVSLVAGERERETDDSATDREEDEMARLKPEREGRGRRKFSAKPSRPFRKGSRRTARFASSLLTSASSVRPPPGMPERDGEEEPREDGEGGGTSVEEKDVELGVLEGGRETLESPADAECRADTASAAKEGTAPTLEAAAFPKGQQGAGPGPEDPDGASSRAFANLEKELTHQQFAVRLLQGVCPVLLVGTKEDLLLSSTAARQTSNESAGGGCEVDEKGLSPFLKHLRSRASVLSGFLSSSSPEAAAGCAVGEDDEDGRGGEAACRASDPSCAAPALCLEEDIGGGTPSRLQTPFSRAYFTQNSFVKARDNIFARLCGTLGPRRVPSGDARLALDGDAGVKLNRRICHLLNSSPLVLTSAVGRTVDPAALSAFFSDALLCQTLFRERSREKKVRRRSKAKSRGARPPVDVMQHVEDAPALLSPLPSPSLRASPGVALSDSANVRRVGVGAGDAAKQTAPVGEAEDGGATPPHARGRAQQPCQDPRLGEERELSADPEPRESPVAEDRPAEERDGKLDGKSRPQTPFSDVAAAAVAAGAAAAAIQWLH\n>UniRef90_M3EC79 DDE_Tnp_1 domain-containing protein n=1 Tax=Streptomyces bottropensis ATCC 25435 TaxID=1054862 
RepID=M3EC79_9ACTN\nMPDAPSARSSLFRAGDRLGPEPLRVLFATTVKPMATEATTGAFWRGLRLPAVDGTCWDPCGQRSRRGRLREAGQRPRDGPERVSPGADGRSGGGGHACGAGRGTRRLAAPGESPLVGRLPGSYGPGQLVLADREFLGTGLWWAFTTTGADPLGALSGGQAPEDC\n>UniRef90_A0A4Y2GBA1 Uncharacterized protein n=1 Tax=Araneus ventricosus TaxID=182803 RepID=A0A4Y2GBA1_ARAVE\nMSRPLFVIGAKKARNPRPQNKDERVSPHSLQPTTCPDGPEVANDRRARASTVHLRAPLMPKKEERAAACHLQMEIKREAVQFRFAGQSGAEYRLSRASHFGQVARGRHAPSVEKRGERGLTIFLRFLVSKMPWSPEAVRETHMPLCLRRPAMFGSCCFNLDGFGQMARYEGCRWGLRSRRAARGILANCAVMRAPGKGSSHRRFLKSCAEYPDDMQMSSGLFIAVCPVHELPLRFLLAVLLDLEEDVDRCIEHEDHQAKPFISVHELPLRFLLEVLLDLEEDVDRCTEHDGDEEHDGHQGEQIGQEDQVGLKHFSL\n>UniRef90_UPI001E28E105 low molecular weight phosphotyrosine protein phosphatase n=1 Tax=Paracoccus sp. MA TaxID=2895796 RepID=UPI001E28E105\nMPPPSVLFVCLGNICRSPLAEAALRAAAKRAGAGLLIDSAGTGDWHLGHAPDRRAQAVAARAGIDISTLRARQVAAEDFRRFDHIVAMDRQNLADLRRIAPLDGRARLSLLLDHVPGRAGQSVADPYFGEAAGFETTWHDVTAGTQALLRLLLGPD\n>UniRef90_A0A522C2W7 MBL fold metallo-hydrolase n=1 Tax=Frankiales bacterium TaxID=1909291 RepID=A0A522C2W7_9ACTN\nMSTFRVEHLSTSGTFSLDGQTFDVDNNVWLLGNDHEVLVLDAPHDAAAIERAVAGRAVVAIACTHAHDDHVRYAPELAERLSTQVLLHPADRVLWDLTHPDRAPDGELRDGAVLEVAGTRVEVLHTPGHAPGAVCFSVPSEELLFSGDTLFAGGPGATGRSYSDFDTILGSIRSRLAPLPPATTVHTGHGPSTTIGAELPSYDEWVRRGH\n>UniRef90_Q1PS67 Telomerase reverse transcriptase n=8 Tax=Oryzias latipes TaxID=8090 
RepID=TERT_ORYLA\nMTSGDLSSVLNILRSLYKRTRTLEEFADGVVFREGRRAALLQPSDTHSFKSFVRGVFVCSDEELQDVPSCNQTCTFPELLAFILNSLKRKRRRNVLAHGYNFLGVAQEDRDADHFRFQGDLSQSAAYIHSSDLWKKVTARLGTDVTRYLLGSCSVFVLAPPSCVFQICGVPAYDRVSMTTASSGFLLRPPSRKHKSFQVGKKTRSANLTKTGSVGDVEESRKRRRVESEVSTRKRKRESEEEESRERRRGVHHEERRQHEAVLDESTLSGKSGENDAAAVKPPPETSAAPPPLEGGPSWRSGAFPPLPSSQCFIRTLGFLYGGRGMHGFCLNRKRRTAAGPRRLQGQDLVRLVFFEGLPYLNGQERKPKKLPLRYFNMVPVFGRLLQRHRKCRYSSVLHRMCPVVELSRAAQGELSSLIPQHCAPHRVYLFVRECLTAVVPEELWGSDHNRLQFFSRVRGFLKSGKFERISVAELMWKIKVMDCDWLKLRRTAGRFPPSELAYRTRILSQFLTWLLDGFVVGLVRACFYATESVGQKNAIRFYRQEVWSKLQDLAFRRHIAKGEMEELSPAQVASLPKGTVISQLRFIPKTDGMRPITRVIGADSNTRLHHKRIRDLMSMLQARVRSAPALLGSTVWGMTDIHKVLRSLAPAQKDKPQPLYFVKVDVSGAYDSLPHDKLKEVITEALSPVQEEVFTVRHYAKIWADSHEGLKKAFARQVDFSDGSMGSTSMKGFVMSLQKSSKVHHAVLVEQAFGSNLRGKDALQFFTQMLTGSVVQHGKKTYRQCRGIPQGSVVSSLLCCLCYGHMENVLFRDIKNKGWLMRLVDDFLLITPDRNQAQSFLSILLAGVPQYGVVANPQKVVVNFQGSEGGGAFPDIRVLPPHCLFPWCGLLLDTRSLDVCKDYSSYAGLSLRYSLTLGSAHSAGQQMRRKLMSILRIKCHPLFLDLKTNSLESAYKNIHKLVLLQACRFHVCVQSLPFAQTVAKNPTYFQQMIWDMAHYANALIRRSNTGLVLGDGAQKGSVQYEAVELLFCLAFLRVLSKHRPVYKDLLPRLHKWKRRLERLLGDLRLARVRQAANPRALLDFLAMQM\n>UniRef90_A0A6B3G495 Alpha/beta hydrolase (Fragment) n=1 Tax=Streptomyces sp. 
SID7982 TaxID=2706094 RepID=A0A6B3G495_9ACTN\nMPRSLQAALILLHVLFVATLVGAIRALSTASSVDAVDGYLLGLLLYASLPGVAVFVLSLYVRHGGVRAWYGLLAVLAWIVLGALAELSGGGAEGQGVARLAVPVAVIVLLCRPESRRWFRSGLEQRAEQRLFSFARMMRLRRDGGQTALEYLGLVLVVVALVGGLMATGTGQQLTAEIRSAICELTGSSCPAPGRDVAAGGGSGDGGADGGGDRDTSSSGADGMSGEGESSLTGGTGSTGTTGENATSGTSGTTATAGSPGDTATTGSPGDTATTGAPNTPQGSTPFPQGDFIAPVDAGRPAGPHGGGFIGGFLGDGVGGDVRGVVGAVLRPGETGQRIADQWARDTRGAEQKWARGDYIGAAWDWNKAVGGAGAGLAIPGSGARVDAEVRDAERAHLGERIPQNATPAQRKAWWDGLSPEERERYIELLPERIGNLDGIPVLAR\n>UniRef90_A0A833ECX2 Enoyl-CoA hydratase/isomerase family protein n=1 Tax=Caldiarchaeum subterraneum TaxID=311458 RepID=A0A833ECX2_CALS0\nMSRQYQDIIYDKSYHSHTALIQINRPHELNSYVLNTLREMIDAFDDAMWDDNIQFIVLTGAGDKAFCTGGNVREYAEIYNRKPSDWWKWGEIYGRFLDVIMHCGKPVLARVNGIVAGGGFEFVAASDLAVAAEHAKFISPGPRVGMTSIGGLSQWLPLHIGLKRTAQVVMTSDEIPARQALEWGIVNDVVPYEGLDDKVKEYIDRMLELSPTSLHYFKVHLNWWRDLVWRLTWEHAKEFFSLNIGGIEPAEGLHAFKEKRRRRYREIRGDIGRGVDPRYPHGPYMLSCNGCGAKYLPLASSYCLNCGKPIKG\n>UniRef90_UPI00046BDA5A protein O-mannose kinase n=1 Tax=Eptesicus fuscus TaxID=29078 RepID=UPI00046BDA5A\nMEMKPQDGRRSPPHREVPPVVGLLLALAVMNALLYLCLDRFFIAPRRSAPDPRHCPSGHFRVGRMNNCSAWLSCEELRTEVRQLKRVGEGAVKRVFLSEWKERKVALSRLTSLEMKDDFLHGLQMLKSLQSQHVVTLLGFCEEDNTILTEYHPLGSLSSLEATLNLSKYQTVNTWQQRLQLAMDYVGIIHYLHHSPLGTRVMCDSSDLPKTLSQYLLTSNFSIVVNDLDALPLVNRSAGALVKCGHRELHGDFVAPEQLWPYGEDVPFRDDLMPSYDEKIDIWKIPDVSSFLLGHVEGSDMVRFHLFDIHKACKSQTPAERPTAQAVLDTYQKVLSLLRDTVTSQTREML\n>UniRef90_A0A0F9NQL3 HTH_7 domain-containing protein n=1 Tax=marine sediment metagenome TaxID=412755 RepID=A0A0F9NQL3_9ZZZZ\nMKINVSIEKEYIKCPVCNGAGKIEEIHSDIKIKHAIVIKLFNEGYTYRKIMKLTGYKSTNSISDILIKNKMKLEKPIKNR\n>UniRef90_UPI001866D008 ABC transporter permease n=1 Tax=Fluviibacterium sp. 
MJW13 TaxID=2720031 RepID=UPI001866D008\nMGARILNALFVTAVLLGLWQALVTLADLPPFILPGPVRVAQALWNNAGLIGWHALVTFSEVLAGLVLGSLLGIVTALQLATSGLARRLIRPALVLTQALPVFALAPILTLWLGYGLWSKVLMAVLIIYFPVTSAFFDGLMQTPRGYLDLAQTMQATPRQRLWRIRVPAALPGLASGLRLAAVYAPIGAVIGEWVGASNGLGYLMLLANGRAKIDLMFAALVVLACLTLTLHVLVSRACDRLTARMV\n>UniRef90_A0A5C5WGI8 Periplasmic protein n=1 Tax=Botrimarina hoheduenensis TaxID=2528000 RepID=A0A5C5WGI8_9BACT\nMPALSTPALAVPALADLAPLESRVQEALTGSPYLVASNRLRVEAGEGRVSLHGHVGSFFEKQMAQEVARRIDGVQQVENLLTVAWA\n>UniRef90_A0A2K9F958 Lysine biosynthesis protein LysW n=1 Tax=Paracoccus tegillarcae TaxID=1529068 RepID=A0A2K9F958_9RHOB\nMPAREAHQPITINCPHCGGESILADACARWNVETQEWELSTVYDDKTCADCGIEVSAEERSVQEGA\n>UniRef90_UPI0014593CCD alpha/beta hydrolase n=2 Tax=Aromatoleum aromaticum TaxID=551760 RepID=UPI0014593CCD\nMKTWVFLRGLTRESGHWGGFLETFACIVPDSRIVALDLPGTGARHRETSPGDVPRIAEDCRSTLFRLGVDPPYRLLALSLGAMVALAWADRHPAEIAECVLINTSLRTYSPFYRRLRPRSYARLLYLALRDDARACETMILRLTSGQRDERLVDEWVTLRVRHPVTLANAVRQLFAAARYRPPRDRPAPPVLVLASRNDRLVHVACSKAIAAAWNCSLRIHPYAGHDLPLDDGAWVAEQVRHWTDGGGA\n>UniRef90_A0A0F8UN67 Cupin domain protein n=3 Tax=Aspergillus TaxID=5052 RepID=A0A0F8UN67_9EURO\nMFIRPPLEIQVTSRQIPQWNCIPNTSIQSKPLMIYHQAFAASPEELKQHFRMVGEVTPGWVYTMYSQTHFHSTTHEVLGVVSGSAYLCFGGEGNPGRFETRVEKGDMIIIPAGVGHRLLHEPDLDKGSFKMVGAYPQNKTWDMCYGQSGDEEKCRNIESLGWFQADPLYGTDGPALRV\n>UniRef90_A0A2C9GSP0 Glutamate-gated chloride channel n=2 Tax=Anopheles TaxID=7164 RepID=A0A2C9GSP0_9DIPT\nMLDHASKAPKSAGWIKLNVFRMASGHFFCAIFYFACLCSASLANNPKVNFREKEKKILDQILGAGKYDARIRPSGINGTDDKATQVFVNMFLRSISKIDDYKMEYSVQLTFREQWLDERLKFDDIGGRLKYLTLTEANRVWMPDLFFSNEKEGHFHNIIMPNVYIRIFPYGSVLYSIRISLTLACPMNLKLYPLDRQVCSLRMASYGWTTADLVFLWKEGDPVQVVKNLHLPRFTLEKFLTDYCNSKTNTGEYSCLKVDLLFKREFSYYLIQIYIPCCMLVIVSWVSFWLDQGAVPARVSLGVTTLLTMATQTSGINASLPPVSYTKAIDVWTGVCLTFVFGALLEFALVNYASRSGFIVFLCETNTINVNNIFAHGQTSVATHRSVYHFRFYCIRSFILSPPTHPQLNRHTHFRFRITPVNQPPTAISPVTPSVKHSHNYERYLVLFVPHLGSFDAFSLFLEKQNLFSFEPPVPGILLFYNNQKFNYFHPFLFALNIRLLLGIVGLTFPLTFSPIWHVNI\n>UniRef90_S5G9S1 1-phosphatidylinositol 
4,5-bisphosphate phosphodiesterase gamma n=17 Tax=Percomorphaceae TaxID=1489872 RepID=S5G9S1_PAROL\nMCAARFSGCLNGCAEEAAAGAAGPVMASRMMDWTEAGPRILHSLEMGTVMTVFYQKKSQRPERRTFQIRQDTRQIVWSRNPDKVEGEIDIREIRELRLGKGSRDFERYPEEARKLDSAHCFIVLYGLEFRLRTLSVAAFSEEEVNIWVTGLNWLMIDTQRAPAPQQIDRWLRKQFEVMDRNHEGSVTVKEVKALLPQVNYRVPNMRFLKDKLQEVEARSDLSYPNFAQLYRTLMFDAQRSIIEQLELAFPLRNVDRPELCQISLYDFQKFLQMDQKESWASELSRVREFLMGYMMGGPHPEPMLQLDEFLTFLFSKENSVCDPRLSPVVLDDMKRPLSQYWISSSHNTYLTGDQFSSESSLEAYARCLRMGCRCIELDCWDGPDDLPIIYHGHTLTSKIKFLDVLHTIKEHAFVTSEFPVILSIEDHCSVVQQRNMATHFKKVFGDLLLVKPVDNNAEELPSPHQLRRKILIKHKKLVEGTLYEEVTSASYSENDISNSLKNGILYLEDPIDHTWTPHYFVLTSNKIYYSEETSHYQTADEEEDDEGKEEHNNNNNNNEQHCAERWFHGKLGGGRDGRQVAEKLLREYCEGGAKDGTFLVRESETFVGDFTLSFWRSGRVQHCRIHSRQESGSTRFYLTDNLVFDSLYCLICHYRVTPLRCNEFEMRLGNPVPQPNAHESREWYHSSLSRVQAEHMLMRVPRDGAFLVRKRSEHNSFAISFRAEGKIKHCRIQQEGRLFMLGSSAEFESLVDLVSYYEKHPLYRKMRLRYPINEDTLGRMGTTELDYGALYEVRTPHFYVEANKMPTARCTVKALYDYRAQREDELCFPKQALILNVDKQEGGWWLGDYGGKKQLLFPANYVEEVPSSPTREQEDVSTENSPLGTFLKGFIDVPSGHVVVHKDGKNSRPYVSTIHSQHLSSHPVQTLDVAADSLEDLTSWVAKIREAAQNADARMQEEKQMERRKKIAVELSELVVYCRPVPFNEDKIGTERTCYRDMSSFPETKAGKFATRSRGKRFLQYNRRQLSRVYPRGQRLDSSNYDPLPMWLCGSQLVALNFQTPDKPMQLNQALFMLGGGSGFVPQPDIMRDDAFDPFDKDSLHVEPITIQLQVLGARHLPKNGRSIVCPFVEVEICGADYDGCKCKTDVVADNGLNPVWVQKQFVFDIHNPTFSFLRFTVYEEDMFSDPNFLAQATYPVRLLRTGYRSVSLKNSYSEELELASLLVHIEIVNAKEEDDENLYTSIQLLRDRTSELSSQVSVLERSGSADLSYQQSLEELRAAQDQLSELVEARNRRLTEKKRREKLRQQVAAKRS\n>UniRef90_A0A3L6FD03 NAD(P)-bd_dom domain-containing protein n=4 Tax=Zea mays TaxID=4577 RepID=A0A3L6FD03_MAIZE\nMEDTIMAPSTLIIKSMSSMVDQVAAAVRSPAQEFYIKSRLLLRDPEKALTLFGKQDESVLQGVTHVICCTGTTAFPSKRWDGENTPERVDWNGIRNLVSALPQTIKRLVLVSSIGVTKYNEIPWSIMNLFGVLKYKKMGEDFVRNSEYHSRLSCIQVFTEKFFGGSEIYSDMIQAVCRPGRLTDGPYTSYDLNTLLKATTGERRAVVIGKGDKLVGEVSRLVVAEACIQALDIESTEGQMRLIQ\n>UniRef90_UPI000CE4C9A8 pyroglutamyl-peptidase I n=1 Tax=Arthrobacter sp. 
GMC3 TaxID=2058894 RepID=UPI000CE4C9A8\nMILLTGFEPFGGESFNPSWAAAQQAAASLTASGLPARALQLPVEFGTSADVLRRALATDPFDLVIAVGQAGGYGTLMLERVAINVDDALFPDNAGHSPVDEPVVAGAPAAYFSTLPIKACLQALQDAEIPARVSQSAGTYVCNHIFYALMNALADMPGVRGGFLHVPYSPEQVTDGKHPSMDVAQVARGLELMVRTSLATEKDLKLGAGTTH\n>UniRef90_A0A1G2CBS7 POTRA domain-containing protein n=1 Tax=Candidatus Liptonbacteria bacterium RIFCSPLOWO2_01_FULL_45_15 TaxID=1798649 RepID=A0A1G2CBS7_9BACT\nMPKENPVLWSDVRSREERRRARIFSSLVFLIISAFLIFGAWAVIYSPLFKIKSVEITGNKSVSDGDIMELATAEIPRGSFWKSVFGTGNILTWPDGFSGESLKFLPELKSFSVQKSYGQRKIKITVEEKKPFGVWCLLGARISADETQISADTKNNISENQPQNLRESAADCWWFDSSGVIFRKAIGVEGNLIASLDDYSQKNIGLNSKILPDEFIPNIFSIFRAVSASGLSVKEMRLNDLALQEIEVDTYNGLPADLSAIALATAEALAKAGPKIYFSLRFSADNVPEVIKSLKEKTTFGSLQYVDFRVENRVYYK\n>UniRef90_A0A410GDA7 Glutamate--tRNA ligase n=2 Tax=Alcaligenaceae TaxID=506 RepID=A0A410GDA7_9BURK\nMTTSTPTQVRTRFAPSPTGYLHLGGARTALFSWAFARHHQGVFVLRIEDTDLERSTPEAVQAILDSMDWLGMQPDEGPFYQMQRMDRYREVIARMLKEGTAYYCYSSPAEIEAMRDKARAAGLKPRYDGTWRPEAGKTLPSPPAGRKPVVRFRNPVDGVTAWNDLIKGPISFDNTELDDLIIARPDGTPTYNFCVVVDDWDMNITHVLRGDDHVNNTPRQINILRALGATLPEYGHLPMILGPDGEKLSKRHGAVNVMEYEGQGYLPEAMINYLARLGWSHGNDELFTREELVAWFDTRHLTKSAAQWDPKKLNWVNAHYIKTTTDADLAAHVAPRIRTRGGDPDAVDLLAVMALLKDRAETLEQLADGAMLFCAPFSPADPELQAQYLDDGAKSLLAAFAAKASDLAEWNTESLDGLIKELLTEHGVKMPKLGLPLRLAVTGQKQTPAIGAVLAIIGRERVLQRLAAA\n>UniRef90_A0A481SX22 Putative ras-related protein Rab-2A n=1 Tax=Franklinothrips vespiformis TaxID=297892 RepID=A0A481SX22_9NEOP\nMSYAYLFKYIIIGDTAVGKSCLLLQFTDKRFQPVHDLTIGVEFGARMITIDGKQIKLQIWDTAGQEAFRSITRSYYRGAAGALLVYDITRRETFNHLTTWLEDARQHSNSNMVIMLIGNKSDLETRREVKTEEGEAFAHEHGLIFMETSAKTADNVEEAFINTAREIYEKIQEGVFDINNEANGIKIGPQKSSTDPSLPSSGQGAGQGSGCC\n>UniRef90_A0A2A5J168 GGDEF_2 domain-containing protein n=3 Tax=Rhodococcus TaxID=1827 
RepID=A0A2A5J168_9NOCA\nMSQPLNASPALLSIFWHSREDYSMAQWWIHFDLAGIQRYVFASRTLLDAIGRAAQVEDATDRAVLTAAAVLPEGVEVEFGAAGALILTTEATEFDNPEQPPQRVKDAVSAYTRWLYEVSDAFTPVVAIQYVRGGEEQQAQMAAADLLRQARHKRIPGVGSAVPPGVLRCALTGAPATDFLPPASEIPVAAEALTARRRGRTWHEAQQSKILASAPLPDGLSVDLPVQIDHLGRTEGASSHVAVLVIDVNDLGAALRTLPPDTLHARSAVADHLRALADELAEHLVHRVCSAIEITAGVPSIAGAPTALSFPLHQAPSPSRAAEPDALSCLTADRSTLDSPGEDLGQTAAPARWSLPLRPWVIAGDDLVLVCESRLAWDLATAAMNWIGEPATSGARTDLAGLGPAFGTGGRLSLTVGIGIAVVPVGYSLAAAHDLAAGLCKNAKKQRRDNKWTGHVLDWHRGPSAIADVLAHRARSDLRSGLRPYRYAPKQAPDESHTSTPTWSDVMTLLDADSPGSMRGPTVDEKSHGWASRRNWVKTDLLAAARSTGNNAVENALAAKNTREKVLTDAPMAELNIDGNSWQECDRANLIVDVIDLLDDHLDLTAAVSPS\n>UniRef90_UPI0002377054 shikimate kinase n=1 Tax=Verminephrobacter aporrectodeae TaxID=1110389 RepID=UPI0002377054\nMQIRCALVGMPGSGKSTLGRQLAQHSGVPFIDLDQRLEQTLGCSIRSYFEVAGEACFRDLEAQALADVAQQPGGMLLSTGGGAVLRADNRDVLRRFGSVFYLHALPEEICRRVQHDRTRPLLQGGNPLKRLRALYAQRDGLYRETARHVIETGRSSVRTLVGMAALQLEQDLAADAAQRAAE\n>UniRef90_A0A251XIF6 RibD_C domain-containing protein n=1 Tax=Clavibacter michiganensis subsp. 
michiganensis TaxID=33013 RepID=A0A251XIF6_CLAMM\nMLDDAGTRTWLEDLYRPGSADHVRLNFVASVDGSVVGADGTSDSLSSVVDRRILGVIRELADVVLVGAGTVRAERYVLPAGRPWQSPPRRAIWRVTASTRTPRRAASSCSARRRRATAPSRRSTACRRRS\n>UniRef90_A0A5F0LGG4 N-acetyltransferase family protein n=6 Tax=Herbaspirillum TaxID=963 RepID=A0A5F0LGG4_9BURK\nMTTSIRPATTADAAAICEIYNHYVLTTTISFELEAVSTEEMAQRIVEVSAIFPWLVYEEDGRILGYAYATKWKARKAYQQSVESSVYMAKDSGGKGVGTKLYSALFAELKACGVHAVMGGIAQPNPGSIALHEKMGFVKVAHFAQVGRKFDQWIDVAYWQLIL\n>UniRef90_A0A849U3X0 Glycolate oxidase iron-sulfur subunit n=1 Tax=Methylococcaceae bacterium TaxID=1933926 RepID=A0A849U3X0_9GAMM\nMFEFMDMEYDQAVDASEQTGPYIPEAGECMRCGQCVSSCPTFRLFQIDEETPRRRIRTISKVLVENLPISDDERHHLDNCTQCRACETVCPSRMAYGQLFDLARAQFQAEPGSLAKLAFKLIENKSWRRRLMPLLAIYLKSGLQKPLRRIGLLKKLGLAEAEALVGNPALQALATSYSARAAMRGRVALFTGCIAEHFDRDTLLAAIKLLNAIGYEVLVPPQQGCCGAIHQHNGQSAVGLINNNIAVFNALDVDAVLHTASGCGAMLSEYQADDDAAAELFKQRLQDIYDFLLKHWPDDLQLMDSTLNVAVHEPCSQRNILKNQQSVYALLQKISTISITPLADNQVCCGAGGSYMLTHPDNSGQLRELKRQAIGAAQADLVVSSNFGCAVFLSSDSVRVAHPLILLAGQLQ\n>UniRef90_A0A3R7NVI0 Saposin B-type domain-containing protein n=2 Tax=Trypanosoma rangeli TaxID=5698 RepID=A0A3R7NVI0_TRYRA\nMRKDHQMRTFIITVCILVVLLFSSAVAAKKEKPLHIPFPKDAVDGISCGVCTFVVKQVYRDVLVLFNASIRRRVRMSEDDVLTALEDVCNPFAETGQWIRRITITHKRETAPFLGVEELQVYTKCKRTCSTVVEACEGVLDHESMDMLSPRLLHLTEYADADKFAEALCDRSPICTKRWGLTASRYDELTTMIDEDTMEEIDPKEMEVERMMDHMERKENRRHSIFYRDEIVKMQEAILRGDKEAVAKVDPSIADLSEEEFAAVQAMVRGKNNEKLRSGTHRADDEGKARDTQRRKHRESDGGEGDLENFELEQEDL\n>UniRef90_W6KER4 Cytochrome b5 heme-binding domain-containing protein n=1 Tax=Phytomonas sp. 
EM1 TaxID=479712 RepID=W6KER4_9TRYP\nMLSSLLGFNLWQKKWPLLSDEEICKHNNRMSLWIVSGNSVYDVTSFLNSHPGGDAILLRCGGGSKNCAEDFALHSQFGQRQWERLKIGEISEASTTKKSIFYGKEYSATDPEEEEEAALC\n>UniRef90_A0A7W4J316 Amino acid ABC transporter permease n=1 Tax=Gluconacetobacter asukensis TaxID=1017181 RepID=A0A7W4J316_9PROT\nMIDWHFIAIIMPRLLRACGQTMGISLCSLSLATILGLSVALLRLSPIRVLGTAAWTYVWLVRGTPLLLQLFALYYAVPLTGLRLDPWLAGVLALGFNSAAYFSEIFRAAIQSIPPGQSEAAIAIGMGPATTLWKIVLPQALRPALPPYIGQAITLIKNSSLVSVIAVPDLMQTAQSIYSVTFKVVEVMLATGVLYLFMTTLLQIAQTWLERRLNYYTVK\n>UniRef90_UPI00174618E5 clostripain-related cysteine peptidase n=1 Tax=Phormidium tenue TaxID=126344 RepID=UPI00174618E5\nMYAQRLLRSSRLFDSDRQASFDQASRSASLFSSDSPRDTTRAGQRNRAAAAKSAKRQPRRQKTRSVGSAADWTVMVYMAGNTLERFGIQDFLEMANVGSDSRINLVVQFDRTAGGNTSYGNWTDTRRGLVRAGDMPNAFWGNGLGELNMGSTATLKNFVDWGTNTYKANRYALVMWGHGDGFNVSYDDNTGDGISGSELSSVLSSTGNKIELVGTDACLMATTEFAYQIADNASIFVGSQELEPGTGWNYTTTLQDLKANPTMSAAQLGSSIVTRYGQAYPTGNETFSAINLLALRSSNASSLTNTLNSFASTALTSATSSDLSILDSLRDYFANDFGDATYRGSEDLCDVGNLFSNLVNRLDISAAVRTAAQSVLTAYDSTVLQNYSATPGRSTGLSLYFSDRNSIPKSSYTSRLYGFLATTQWDEFLQGWLWN\n>UniRef90_A0A1A2YYB8 MarR family transcriptional regulator n=1 Tax=Mycobacterium kyorinense TaxID=487514 RepID=A0A1A2YYB8_9MYCO\nMGRIEDAPLGYLLYRVGAALRPEVAAVLRPLELTLPEFVCMRILSMYPGMSSADLARQTNVTPQAMNTVLRKLEDVDVVARPATVPSGRALPATLTTAGRALLKRAEAAVREADARILSKLSASEQREFKRMLEALGSD\n>UniRef90_UPI0003641618 heavy-metal-associated domain-containing protein n=2 Tax=Streptomyces TaxID=1883 RepID=UPI0003641618\nMTAQTDTQGSVTTVYKVSGMSCGHCEGSVSGEISGLPGVSSVKAVASTGEVTVVSAAPLDDEAVRAAVDEAGFELVGQA\n>UniRef90_R9J9S0 DNA repair photolyase n=1 Tax=Lachnospiraceae bacterium A4 TaxID=397291 
RepID=R9J9S0_9FIRM\nMKNLKEDYFNPFFSHIYVEKSVRNHARTQNILAKFPSAQIIEIGHYKDVFCRSRQNIRLQHCAQKLILAARQGTLLYEGAPVCQRFGNEHFYYVSCAMNCIFDCAYCYLKGMYPSANIVVFVNLEDIFAEVERVLENHPLYLCVSYDTDLLALEPLIGFVQEWCAFAAKHAQLTIEIRTKCANKAFVQSIVPMPNVIYAYTISPQAVIDAFEHHTASLSDRLFCAAALMRAGCPVRLCFDPMIYLPGWKTHYSEMMNQVYRSIAVDQLLDVSIGTFRISQDYLKNMRKQAKDSAVIWFPFQKEDGYCHYPAPLMEEMESFLTAQIAEKIDREKIFRWNV\n>UniRef90_A0A6I6SRI0 Gamma-glutamylcyclotransferase n=2 Tax=Halomonas TaxID=2745 RepID=A0A6I6SRI0_9GAMM\nMRLSHVVLAASAALLAIVGWLWLTMLSPLTYDRPDHLPEIDEGEHAVFVYGTLRFAPVRWVVMGRAGETEAAVLEGFRREGLDLAEAPDERVQGEIVVVDADELERLDRYERLGIRYQRVPMRLADGRVAWVYRRLNEITQASESPATD\n>UniRef90_A0A373XTP8 Dihydropteridine reductase n=1 Tax=Ruminococcus sp. AF17-11 TaxID=2293150 RepID=A0A373XTP8_9FIRM\nMNTDKIYAEQLANEYTPKDTSKVVALRKLDAKAKLPATIFTYTFGIISALIAGVGMCLSMKVIGSGSDAMFILGIIVGIIGFVGVAVNYPIYKKLLNKGKKKYAFEIVQLAKEISEKDM\n>UniRef90_A0A366JGF4 FAD:protein FMN transferase n=1 Tax=Marinomonas rhizomae TaxID=491948 RepID=A0A366JGF4_9GAMM\nMRKKILFSVFLLIAIAVVYRLSVFTPELASFSGPTMGTTYTVKFFTTKEVGDAWVVKEDVDAALVRVNSLMSTYDPNSELSLFNTLPAGQSAVISDDMAYVVDKALLISEMSGGEYDVTVGPLVNLWGFGPGKHEDKVPSQELIDEAKSRVGYQYLKLDGRRLMKEKDIYVDLSSIAKGYGVDAVARVLQDRGIESYLIEVGGEIVSKGLKPDGAPWRIAIESPAGGHDIAERIISVTDVAVATSGDYRNYFEKNGVRYSHTISPISGRPITHRLVSVTVVDKTTTMADGLATAVTVLGPDKGFEFVQKNGIAAYLLVKTDFGFEEHSSDAFKAYLK\n>UniRef90_UPI0019100A88 hypothetical protein n=1 Tax=Aliterella atlantica TaxID=1827278 RepID=UPI0019100A88\nMVLIDNPNTRVTVRNIVQTLVFEDEEENTISETNGCLVGKLIEVRFGLLRSCGKEK\n>UniRef90_UPI0013E3DCB5 hypothetical protein n=1 Tax=Streptomyces sp. 
B29(2018) TaxID=2485016 RepID=UPI0013E3DCB5\nMSNVDELRDLPALLQRVDFREEVVPHTAGAIEVFFGECREMPLRAVDPTKPRERHV\n>UniRef90_A0A8C8YVF0 Actin binding LIM protein family member 2 n=1 Tax=Prolemur simus TaxID=1328070 RepID=A0A8C8YVF0_PROSS\nMSAVSQPQAAHSPLEKPPSTAILCNTCGNVCKGEVLRVQSKYFHIKCFVCKACGCDLAEGGFFVRQGEYICTLDYQRLYGTRCFSCDQFIEGEVVSALGKTYHPDCFVCAVCRLPFPPGDRVTFNGKECMCQKCSLPTSVGSSAHLSQGLRSCGGCGTEIKNGQALVALDKHWHLGCFKCKTCGKLLNAEYISKDGLPYCEADYHTKFGIRCDGCEKYITGRVLEAGEKHYHPSCALCVRCGQMFAEGEEMYLQGSSIWHPACRQAARTEDKNKETRTSSESIISVPASSTSGSPSRVIYAKLGGEILDYRDLAALPKNKAIYDIDRPDMISYSPYISHSTGDRQSCGEGDQDDRSYKQCRTSSPSSTGSVSLGRYTPTSRSPQHYSRPAGTVSVGTSSCLSLSQHPSPTSVFRHHYIPYFRGSESGRSTPSLSVLSDSKPPSSTYQQAPRHFHVPDTGVKDNIYRKPPIYKQHATRRSDGEDGSFDQDNRKQKTSWLILKGDTDTRTNSPDLDSQSLSHSSGTDRDTLQRVQGDNFHSRPPYSKSDSLPGHGNNGLDHRNANLAPCGADPDASWGMREYKIYPYDSLIVTNRIRVKLPKDVDRTRLERHLSPEEFQEVFGMSIEEFDRLALWKRNDLKKKALLF\n>UniRef90_UPI002036F24A dirigent protein 23 n=1 Tax=Beta vulgaris subsp. vulgaris TaxID=3555 RepID=UPI002036F24A\nMNKFRLPTSFICVVLTFYIVNVSSAKTPSWAKTERYGHEHKTVIQFYFHDVRSGDAPTVALIAQPVEARSFASGFGNLFMADDPLTVSPDPNSKLVGRAQGFYGSASQESVSYIMGLTYGFVDGIYNGSSVVIFGRNSIVNRVREFPVVGGTGIFRMARGFAVAQTYFHNSTTHNAIVVGYNITVFHLELAMGRAGPDHGPGPRAEVEYGPGQARGP\n>UniRef90_UPI000C85D657 HNH endonuclease n=4 Tax=Vibrio TaxID=662 RepID=UPI000C85D657\nMNWVIYVANATTKNFDIGLNQGIWGHKEIFSTVNTDKIKVGDTLYFVHHLTFMRDDNGNVIKGAPRVAAEHYKGSISTLVETRVTKGFYIDKKTVWPDDIYPNRYNFEVIEKHQNLPFSDEFFSSEFVQAVRTSTLTKGLAIELEGEHGEVYASNENIDLEYFEGNTVFRRHLVRERSTKLVNDKKRSVRDANLKLACEVCGFDFEDTYGERGYDYIECHHKNPLSESNGQKTKLKDLALLCSNCHRIIHRSRPWISVDELKEILNERASEATV\n>UniRef90_A0A507FHA7 PRP1_N domain-containing protein n=1 Tax=Chytriomyces confervae TaxID=246404 
RepID=A0A507FHA7_9FUNG\nMFHKPAFAPDFLSKKPPPNYIAGLGRGATGFTTRSDIGPAREQAPEEVAPPAIGPMMGGPAIGPGMPGMPPGANGDAPKKPLDDDDEQFQDPDNETGLFNTAPYEADDEEADRIYEEVDKAMDERRRARREAREREELERYRKERPKIQQQFADLKRGLAAVSQEEWAALPDVGDLVRKKGTKKKLPDRYTPSADLITIGGGFGSTVSGGGDAASGFATSIDPRMMGGLSTPAGTASVAGDQSGILTDFVQFGQGRNKVLGLKLDQMSDSVSGQSTIDPKGYLTDLNSMVTKTDAEISDIKKARQLLRSVITTNPKHAPGWIAAARLEEVAQKIVAARELAAKGCEECPKSEDIWLESARLNSTENAKIILATAVRHIPTSVKIWLRAQSLEQDVKAQKRVLRRALEFIPNSVKLWKAAVSLEEDSDDARILLSRAVECVPLATELWLALARLETYENAKKVLNKARTAIPTSHEIWITAAKLEEQQGNIGSLDKIIPNAVTRLAQKGSTLDRDSWIKEAEECEKEGFVGTAQAIIKATIGIDVDDDDREGTWLEDAESSVSHGAIATARAIYAYALQVFPQEEGIWRKAAFLEKSHGTRESLEEVLQRAVKYCPQAEILWLMGAKEKWLAGDLPGAKGILASAFEANQNSEQIWLAAIKLEVETGEYGRAQALLLQARTKADTDRVWMKSAMLERQLGNLPVAMSLLEEAITKFPQFGKLWMIKAQIEEHQLSNVVAARDTLSKALKAVPKSSPSAVTLWLMASRLEERAGQLTKSRALLEKARLLNPKQPELWCEAIRVESRASNQAIADALISKALQECPTSGLLWSEAILSESRPQRKARSKDAWMKSENDPLVLVTVARLFWSERKVEKARNWFARAVKVNPDLGDSWAWWLKFESVQEGDTTKMVADIVAKCKAAEPHHGERWQACAKDLSNTGRSVEEILKMVASSLPVTV\n>UniRef90_B2YJ48 Cpn60 (Fragment) n=2 Tax=uncultured soil bacterium TaxID=164851 RepID=B2YJ48_9BACT\nATILAQSIYREGVKAVAAGANPMALKRGIEKAVEAVVEDVKKLSKEVKDNETIAQVGTISANGDAEIGKTIADAMKKVGKDGVITVEESKTMTTELQTVDGMQFDRGYLSPYFITDPDRMECVLEDPYILIHEKKISNMKDLLPLLEQIARSGKPLLVIAEEVEGEALATLVVNKLRGTLNACAV\n>UniRef90_A0A6I7QH38 Translocation/assembly module TamB n=1 Tax=Bacteroidia bacterium TaxID=2044936 
RepID=A0A6I7QH38_9BACT\nMVIIIMMPFIAYAFLQSSRVQTYLVGHLTDYFSRELQTEISVGSVDIRLFRSVILKDVIINDRQGDLILEMRKMRFELGKLSFQNRSLVIKELEFRDAFLNLFKDKQEENYNFQFLVDYFSSPTVANGHNRWEFTCEAFKLTNASFWHLDLNRKSGVNGFDPANFYVSGFYLAMNQIEIVDNTLSLALDYLYYNESSGFIIDYLSGNFLLKHGQLDIDNFIFRTDGSDLNFSLSAKYGSFTSLEELVADLRFQMDIGKSVLHLADLGHFIPGLYGVNDTMKIEGAFEVLGDTLTGDNVLVEYGLKSRFDGDFQLKNFLGGSDMRLEFTARTLQSNFNEIAALNLPVSLEKSKPEFPPFLYNLGDFEFSGRIYGGLHSFQSEGSLASSIGTTYANLLMQRDNESMPYQYQAKVNTRNLDIGRLFGIGASAGKATLELNIKGEGFHPDNLDLLVDGHIASVELASYTYNDISFQTEFLNQNLNGQLGVKDQNLLLDITANAQFDKEIPFFDVLVNIEHANMTKLALFQKDSLVESLLKTHIHFNGKVSSLDSFEGDLVFREIRYEEIPLEQDHHSSRYLVFTDSIFINSKKWSPDNQHIRLRSGFADADVHGKLHLTALPRNLKESVQNILPFGEPDLSGYTGTEYYQDQDIQFSFHFKDTRILSELFLPALSLSGNSWLNGHYRSADHHLIFIAHADTLALENRRFLDLNIGGTHGENNYSITFDSKRLMVSDSLHFDLVSLQSGWKEQSLDVKLEWQGTNGDESGIGVISGHANVYDKNHIEFSFLPSYALIHGDLWRINIDNKIIVDSSRIEVSGLMVYHGDQFIRADGVLSDHPRDRMMVSFSNFEVAYSDLFLGESNFKFGGILDGYVTFTALYQSPSIGAGLTIQNFAFNHQELGDLQLSSIWQFDKQAFLVDGKITSKADDQEHNLLTLSGSVYTGQNIGRYDLGISLHNMKMEVWRPYVQSFSENFKGLATGELHLGGPLNSPELTGQVRLMETSMHIPYLNVTYFLEDDVRFTKNAFVFEDVAIRDTLGNIAKASGAILHNSLRGFGLDLHIRPSNTIVFNTTAVDNSIYHGTGFVTGLAHLHGPVNDITMDITARTNRGTRVILPLNSAGEVRENHFITFVARNPENNLPLMPPPDLSGNITLNFDLEVTPEAEVLLMFSPPFGDIIRGRGNGNLKLEIPPDGAFNIYGDYVITEGEYLFNLQNIINKRFRIEQGSTIRWTGDLNDADVEMQAAYRLRTSLYDLFVGEGIDSETVEMFRRRVPVETLLILQDRLFNPTISFDIQVPGGDENTREMIERVITTEQEMNRQVFSLLVLNRFLPSREDQYNTALGFGVGSTSSELLSNQLSNWLSQISTDFDIGINYRPGDEITSQEVELALSTQLFDNRVTIDGNFGVAGNQTASGQPTQATNQIIGDVNVEVMITPEGKLRVKAFNRSNTFDIIHTNAPYTQGIGVFYRKEFDRLEELFRRNRIPEIPVDSD\n>UniRef90_A0A6G6Z3X8 (2Fe-2S)-binding protein n=2 Tax=unclassified Bradyrhizobium TaxID=2631580 RepID=A0A6G6Z3X8_9BRAD\nMFKRSDQDKRPSVQIFVDGAAIEARAGDTVSAALLASGRDVRRATAVNGAPRLPYCMMGVCFDCLVTIDGVGNRQGCLVPVTEGMQIEIQKGKREIGR\n>UniRef90_A0A7K0PYB7 M50 family peptidase (Fragment) n=1 Tax=Actinomycetia bacterium TaxID=1883427 RepID=A0A7K0PYB7_9ACTN\nMLGRSVSVMPGRYPSSPGLSPRRPGVVGWTAMTEIWDRVGATSPPLPPLWLGVTAVLALVLVVQRDLWRVTRNAVTIAHEGAHGVAALVTGRR\n>UniRef90_A0A177HN16 Cell wall protein-like 
n=1 Tax=Streptomyces jeddahensis TaxID=1716141 RepID=A0A177HN16_9ACTN\nMPSLKLAPLYLRAEEKGSDSVQRHSSLSGYASMIACRLAFGRGSDSPRAPRTLRMYVSSAPSSARTSVTSMPPSVSVPVLSRQTVSTRASPSIAGSSCTRHCFRPRRMTPIAKATEVSSTSPSGTIGTMPPTVRAIASLKPESSVSSASWLMIRPRAVGIIIHVTYLRIVEMPVRSSEWTSVKREASSASCAAYASRPTLVAVNAPPPATTKLPDITGSPGFLTTGSASPVSSDSSISSPSASATAPSTTILSPGPISIRSPRTISEVLISADTPSRRTVGLASPINARESSVFLARSSWMMPMPVLARIT\n>UniRef90_UPI00083E5566 3-deoxy-7-phosphoheptulonate synthase n=1 Tax=Streptococcus himalayensis TaxID=1888195 RepID=UPI00083E5566\nMTFKALSQPINVKEVRSNYKLEGASLQRKEERDAALNAIIRGEDDRILLVIGPCSSDNEEAVLEYAKRLAALQETVKDRIFMVMRVYTAKPRTNGDGYKGLIHQPNATAAPSLINGIKAVRKLHYRVITETGMTTADEMLYPENLPLVDDLISYMAVGARSVEDQQHRFVASGADLVTGLKNPTSGNLTVMFNGIYAAQNKQSFLFGNTEVETSGNPYAHAILRGAINEYGKNVPNYYYDNLLDTIAQYEKMGLENPFIIIDTNHDNSGKQYLEQVRIVRQTLINRAWNEKIHRYVRGFMIESYLEDGRQDEPDVFGKSITDPCLGWDHTEQLVREIYETLGK\n>UniRef90_UPI0003685307 undecaprenyl-phosphate glucose phosphotransferase n=1 Tax=Gayadomonas joobiniege TaxID=1234606 RepID=UPI0003685307\nMGKRGYLREHQHAFSSLYRVIDVVLICLTLFVSWDCFAGLDTKQHYFVAIVASLIFLYLAETFGLYRSWRLARFYQLARTITFVWSVTFLSTVFVAVLLEIPEGVSQLVFVSWGLVGTFLLSAWRYAYYVAIKKLRKKGFNTRSVAIIGHTRVGKELYKQIRLHSEAGLKFVGFYEDRMPQRYMGDKYSSDFIRGSAEDAIKAAQRGEIDQIYIALSLKQEDRISQLLVELGDTTADVHFIPDFFVFNLVQSRMGYVGNLTTLSVFESPYAGTNSWLKRAEDIIFSSIILFIISPVLLAIAIGVKVTSPGPVIFKQYRYGLDGKRIKVWKFRSMTTMDNGDKVVQAKKGDARITPFGGFLRRTSLDELPQFINVLQGRMSIVGPRPHAVAHNEEYRKKINYYMMRHKVKPGITGWAQINGWRGETDTLEKMEKRIEYDLHYIGNWSVWFDIKIIFYTVFKGFLDKNAY\n>UniRef90_A0A7V0QHY8 3HCDH domain-containing protein n=1 Tax=Deltaproteobacteria bacterium TaxID=2026735 RepID=A0A7V0QHY8_9DELT\nMMGGSMKEKILVLGRGEIARSLFDICKQTELSVTFLESADELGPQLRDTDIIVQFVADGLELPHLKESDFIGKYKVWLIEVIDQSVTRAAGRMGCSERIVGFSISKSFQERRFIEVIGGERTGSDAVTTARNLFERLQFTVVISKDHPGYILNRVVASMINEAIYVSMYGLAQMEDIDQMMRLGANFPMGPFEYADYLGLDRVLKTLEWLAEELGPQYRPCPLLRRKVEAGLLGKKTGKGFYEYGI\n>UniRef90_UPI001106F8B2 antibiotic biosynthesis monooxygenase n=1 Tax=Eubacteriales TaxID=186802 
RepID=UPI001106F8B2\nMICTLVRFHIKHGCGDRFLELARTSVEQTRLEKGNISYDMGPELGKTDTFIFFERWKNQESVDIHESQTYFQSFDRAAGELMDGPVEVFKMEPPF\n>UniRef90_A0A2E6YUS8 SLT domain-containing protein n=1 Tax=Halieaceae bacterium TaxID=2026743 RepID=A0A2E6YUS8_9GAMM\nMKNVLGIVTLVLSMGSLPGISLAASDDDRAALTTDLSKALTEDNEFQDRFDAEVWLVDMQQRLAPLVPDAQERLDLLTQVHQQASRVVLHPELVLAVIEIESHFDRYAVSRAGAQGLMQVMPFWKNELGRPEDNLTDTATNLQYGCHILRFYLDREDQHLSRALAAYNGSSGSERYPNKVRDAWQTRWRTQPIDW\n>UniRef90_UPI001D0CC098 thioredoxin n=1 Tax=Roseitranquillus sediminis TaxID=2809051 RepID=UPI001D0CC098\nMLELGGRKEDAATDLIKDSTEATFMQDVVDASRDVPVIVDFWATWCGPCKQLTPALEKAVTEARGKVRLVKVDVDRNQQIAAQLRIQSIPTVYAFWQGQPVDGFQGAVPPSQIKEFIERLVKLGGGDDGDPLAEAVEAAETMLAEGAAVDAAQTFAAILGEAPTNAAAYGGLVRAHLAMGEADRAAQLIDAAPAEISGSPELEAARAQLELARQAEKAGPVAELQQAVEADPTNHQARFDLALALHAKGDVAGAVDQLLELFRRDREWNEAAAKTQLFTIFDALKPQDPIVLNGRRRLSSMIFA\n>UniRef90_A0EUM8 Protein Nef (Fragment) n=1 Tax=Human immunodeficiency virus 1 TaxID=11676 RepID=A0EUM8_9HIV1\nMGGKWSKNSLGGWPKVRERMRRAEPAADRVEAEPAAVGVGAVSQDLAXXGAITSSNTAATNABCAWLEAQEDEEVGFPVRPQVPLRPMTYKAAXDLSHFLREKGGLEGLXHSQKRQDILDLWVYHTQGYFPDWQNYTKGPGIRYPLTFGWCFKLVPVEPEKVEEANEGENNSLLHPISLHGMDDPEREVLVWKFDSSLAFHHRARELHPEYYKD\n>UniRef90_UPI0021B1B406 hemerythrin domain-containing protein n=1 Tax=Mycobacterium sp. 
SMC-2 TaxID=2857058 RepID=UPI0021B1B406\nMTSAWRSSDLAEAFREDHAVLGRGLHEVSEHLRAGNDQAAKARAERVDREAGAHIAFEEQFFYPALRRTLGDAEVDGLYEEHGEGLSVIKALAQLPEGAELTEADRRTLLQASELTESHVAECGELFGVMGRIPPDEQQALYRELLSLREESPRWTEFAARTKEG\n>UniRef90_A0A7D4A833 Superfamily I DNA and RNA helicase-like protein n=6 Tax=Actinomadura TaxID=1988 RepID=A0A7D4A833_9ACTN\nMTERHLVALTKPEPSPVLDPGEAATRAVDGVLADLGGGHRGVVVDSPPGAGKSTLVVRAAAHLAEAGERLMIVAQTNEQVDDLIERIATKHSQLTVGRLSASGYLPSERVLAHPSVRVAQKADDLAEHTIVIATAAKWATLSDGSWPWAIVDEAYQMRSDMLLRIAGRFERALFVGDPGQLDPFSTVEVERWAGLSWDPMRSAVSVLLAHNPGLPVHRLPVSWRLPASAAPVVSDAFYPFTGFRAGTSDGDRRLEYGARGMGTTYDHALEEAAATGWALYELPARHTLRTDSEAVRATAALAVRLLQRGPVAHSELGSKPVDATRVAIGAAHRDQVTAIRAALGEHGEGITVDTANRLQGREYDVTVMLHPLSGRRDATAFHLESGRLCVLTSRHRHACIVVARAGIPELLDAHPSTEPVHLSVPVKFPDGWEANQSILAHLARHRVAAD\n>UniRef90_UPI00132F9BB1 sulfatase-like hydrolase/transferase n=1 Tax=Klebsiella pneumoniae TaxID=573 RepID=UPI00132F9BB1\nLRNSGSTFSLVYFSDHGLAFKERGKDVQYLAHDDKYQQNFQVPFMVISSDDKAHRVIKARRSANDFLGFFSQWTGIKAKEINIKYPFISEKKAGSIYITNFQLQKVD\n>UniRef90_A0A554VFG8 AtpZ/AtpI family protein n=2 Tax=Flavobacteriaceae TaxID=49546 RepID=A0A554VFG8_9FLAO\nMGGTIFLCAYGGKKLDAYYELEKQWFTMGLVLFGVTASIYLVIKQLNRINKSDR\n>UniRef90_A0A7C1UAD0 CBM-cenC domain-containing protein (Fragment) n=1 Tax=Phycisphaerales bacterium TaxID=2052180 RepID=A0A7C1UAD0_9BACT\nMNVRWRSQGDFCESTCSDGGRGHNNRGALSKRRTTMYKQLMFPICLTVVLGLTARASEPFGHWPFDGHVNDVAGSANGTFFGGSPDYVNGRIEQAIRFDGVDDYVEVMVENLDAYTITAWVMPDRVEPASIVVRTSPSGTTTHWSHQMRIAASGQFEHYVWDGAAQTALGTTQVEAGNWYF\n>UniRef90_A0A6P0WQH9 Type II secretion system protein n=1 Tax=Caldora sp. 
SIO3E6 TaxID=2607806 RepID=A0A6P0WQH9_9CYAN\nMNICELPQKLLPQKKTTQPNQSGFTIIESLVAIIVISILMLGLSPVIFLSVAARVQSRRVERGTEVARTYIDGVRSGAIPATNVVVGAATDRTLEAGPVPTALNPVDWSDPGGLYCVDLDASGGCEAGSMNDMVVQGFRTPGDADRGYLLGVRVYRAHAFSGGEPLQKGQTQSSFSGTLGNSKVPVVEMTTEIPPSGAFQDNFSEWCARLPNTNPISTCN\n>UniRef90_UPI0006E338CE trehalose-phosphatase n=1 Tax=Streptacidiphilus griseoplanus TaxID=66896 RepID=UPI0006E338CE\nMGIPEPTTPAGAEGLAALVADPAHSVIALDFDGTLAPIVPDPDQARAHPGVVPALARLAPQVGAVAVVTGRPAGVAVRHGGFAGVPGLEHLVVLGHYGAERWDAVTGEVRAPHIHPGVASVRAELPGFLDRIGAWEGTWVEDKGRAVAVHTRRTEDPDTALEQLRTPLLELAARHGLMGEPGRMVLELRPPGVDKGVALTGFLHERKARSVLYAGDDLGDLAAYDAVTRLRTEGVAGLLVCSAAEGEEPVGRLEERADLVVGGPSGVVGLLDALADEMGAPRP\n>UniRef90_UPI001CB69EC9 polyubiquitin-A isoform X6 n=1 Tax=Frieseomelitta varia TaxID=561572 RepID=UPI001CB69EC9\nMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGGMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGGMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGGMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGGMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGGMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGGMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGGMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGGMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGGMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDDRTLSDYNIQKESTLHLVLRLRGGMQIFVKTLTGKTITLEVEASDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGGQ\n>UniRef90_A0A6M3XMR9 UDPG_MGDP_dh_C domain-containing protein (Fragment) n=2 Tax=viral metagenome TaxID=1070528 RepID=A0A6M3XMR9_9ZZZZ\nANPFGFVSEAREKQSKWLAKLIKREQERRKLPVVIMGLTFKHNTNLTTDSPAILLMEQLEDMGVKTSAYDPVVMPSRPKDVPSIYFIATRWVKFSTFPYAKGSLIIDPWGFFGVAPEGCELFSIGRNR\n>UniRef90_A0A7W1P943 DUF4625 domain-containing protein n=1 Tax=Acidobacteria bacterium TaxID=1978231 
RepID=A0A7W1P943_9BACT\nMKKPPLQRRTISVPVPELPPGKYKLVIIAESRGAVARSEVLAYEVR\n>UniRef90_UPI001F566F06 DUF6516 family protein n=2 Tax=Shinella zoogloeoides TaxID=352475 RepID=UPI001F566F06\nMQARLILKTRRHIGEAMFADLVIWRVPEPLRGSRHPFKYRLAFVADGICVMRYDNEAGKGDHKHIGAEEQPYAFQSIEKLLLDFDADMKGWIDGNADRED\n>UniRef90_A0A1I7GQJ1 Glycine--tRNA ligase beta subunit n=4 Tax=Burkholderiales TaxID=80840 RepID=A0A1I7GQJ1_9BURK\nMTAPSNLLVELFVEELPPKALQKLGDAFAQVLLEQLTAQGLATGASQCTAYASPRRLAAHITAVLPQAADKAVSQKLMPVSVGLGADGQPTPALLKKLTALGADASAAAALKRVHDGKAEVLYFESTAKGALLAEGLQKALDEAVAKLPIPKVMRYQLQDGWSSVNFVRPAHGLVALHGASVVPVAVLGLQSGRATQGHRFEAAASPVALRDADSYAAQLRDEGAVIASFAERRAEIVRQLQAAADKVGGGVRPIEDAALLDEVTALVERPNVLVCQFEQEFLAVPQECLILTMKANQKYFPLLDAEGKLTHQFLVVSNISPQDPSAVIQGNERVVRPRLADAKFFFDQDRKKTLVSRVEQLAKVVYHNQLGTQGERVERVRAIAKAIGAQLFEALAAQHRIDGTQDAEVVQDYLMTCVDNAALLAKTDLVTDMVGEFPELQGIMGGYYAVNDGLPDDVAHAIEDHYKPRFAGDALPRNNVGLVVALADKLETLVGMFGIGNLPTGDRDPFALRRHALGVIRMLAERDLPLDLSALLAAATPAFGGKIEDATAQLADFIYDRLAGSLREQGYSAQEVDAVLALRPQRLALVPKQLAAVRAFAALPEAPALAAANKRVTNILKKAGEVDAHVNPELLQEQAEKDLYVALQRFVPEANAQFLAGDYTGSLQTLAVLRAPVDAFFDDVMVNAEQLDLRLNRQGLLKTLHDAMNRVADLSRLAA\n>UniRef90_A0A835R703 Transmembrane protein adipocyte-associated 1-like n=1 Tax=Vanilla planifolia TaxID=51239 RepID=A0A835R703_VANPL\nMMAYYGLIWIVSVLNLTWCILQAWQCTPTKEFSWNLLSLCTKSGMLFLEVSLISFLLQGNQAGDLEALTRTFVVSGVIVAVDVLLKAVYVFGFGVPMFLDGVGPSNHVKWGLWIVHKLLLAAVYVLILFMYHSKWREMLPAQPAFRNYICVMFSINALSLFSCLLMENGAGFGYWLLSLVTLCYHSLYLPFLYITFLADFFREEDMRLENVYYSEMKDAGFFDADWD\n>UniRef90_A0A806X1Y9 DUF4091 domain-containing protein n=1 Tax=[Enterobacter] lignolyticus TaxID=1334193 RepID=A0A806X1Y9_9ENTR\nMLNPCIDDPDEHLVFLDDGRVEPALINGQESRKGKASIQYLGLARAELLQMRARHRRTVIAAIRHTIAALEEGRDPGTDLDDLLTLLSSKEAYVAYTRTLVRTHMSAYIEALGL\n>UniRef90_A0A1V9ZKS3 Secreted protein n=1 Tax=Achlya hypogyna TaxID=1202772 
RepID=A0A1V9ZKS3_9STRA\nMAGRERRAWCSWLLVLLYALTVRGNQLLVISQPATMTAGDMLSPPVLQIVDDTGLVLSDINTGTVTVSIETNPLMYAVLSGTSGLAFPIVAGVVTCSGLSINLVASGYTLSFVALSYGLQTSSNPFDIILGPPYQLSMYTYIGVAQGGTPFSPQPTVAIVDKGGNLVASVSSGSVSVAILNNPVGGILTPAIAHTVYFYEGFGKFYDLQIDKAGGPYTLKFTCDASLNLPGGNSYTTFPFTVAIGPPRTMFIAAYPLAAFGGEAFVTQPMIQLLDAGGNTLQTQPSMQIAATIYANPSGGRLYPATETSASVINGFASFKNLRIDLAGNNYMLRFAITMLNVLGVYAETGLAVVGPSLNVYLGALFSLQVLRPPESAIADGQPFYTQPVLVLRDRGNNTISTENLALVSVSMVPSLALYNNLIVSTANSPIATITDVTLLFSPFSAPFGAGTDLFINVTFSQQIMATGSIVLQMNSAPGALATCNTLLTWSNRLTFGYGITAGDAAAALNYASTSALTLQGGATLVDRLGVPASLILPAAGLRPAVVVDTTAPSIVSVGCVPPFVAGTYGPGQVVSLLVTFSAPVSIYSTLMPYLLLNTLPAQSAIYSSGNQTASLVFQYIVGPTDAVATLDVVAALNTNGGLLRRAGTALKQDALLQMPATASSRLPAQCPLVISSVVPAIDATVGVTSATPNGVYATGDRIFITVPFTALVAVSGIPLLALNTGRNAAYSSGSGSSVLTFQYIVQAGDSVAALDYASPAALMLNAGTIQRFVTAGSPLLDVNIDLTATTASNRNLGQTAALVLNGLAPTVVSVAFPVAPTTYTRGGTVAITVTFSYAVVVQGQPSILLNTGVAATYASGSGSTALVFNYRVQLGDATTDLAYAPTSTIVLNGGSILQQSSTPSLAAQLMLPWPPAIVNAPVTIDPALTAVTTVVSITADQVAGEYGQNQVIQITVTFSDAVQIVGGVRLALTTQTVAYASGSGTKALVFLYIVQPNDATSSLNIASASPFTCTAGGGCSIANANYLAANLDCTGLTLQPTAIVINTVAPSVVSVAALTPAPTINRGTFVVGDLIQILIVVSKAVDVQPSPSVFPTKVPTLLLNTGQVAYFTGYDNGDRTRLLFQYTVAVGDATPNLQYASTGALTLNYNQASIRRLATNPTTPMNLLLPVVANLGTNLVVDTSRTPIVINVASITADGTYFVGDVIAIRVTFSEYVVVSGIPVLLLNLGVYDRSAVYVSGSGSTSLVFQYTIGQDDFSKDLSYIDLRSLYNPPGASILFQSTNPTVAANCQLPLPGSAGSLSANSNLQVLGGTPYIVDIAFLSPNATYTVDNTIDVQVTFSAKVVVSGTPFLRMASGPSLRQAFYVPTVGASTTVVFRYRVQTGDVSMDLDYADTAAIQLNGGSILTAPTLLTSIPVQPANLQLNPPGGALTGTRTVQTVAGVVNYVNLGIDTMGLGYIFYFATATVVTSVQFDVTYSAVWEVRNAPLNEQNRGDRTGSSVDITTGVAVVGSAGAKARQYNVQVVTASGSATKYVNEIQYVQTTCVQRDAIQVLTSSAAPGSTLGGYFTLMLGAEGPTRRLAYNFDATQLKVALELDFGFDAAAVEVTRTPNTFCGCFDAYAWTITFHTDGEIPTLLARSYLTGVSATVGDGTGGASALVLSLPPVVNGQFALRYGALVTASMPSNVDATTMANRLTTDLNLPILSVQRSLPTVQAGYTWSITFYASATIFNPNELEPAPLLLTGNQVLLSVTTVQEGQAPLYGNFRLSIAGHTTPNIAVTASAGDVQTALQTLPEVTSVAVTRSAVNPSGGYSWTITFLQINLMSTYGLVLNSLGTLPPLTPMTLVNGAPILMGTSATIMVNYAGVNPSANSPAGFGNAPGESAGSVTIFVPRNLQWIQSANLLGSDTQSGDNFGAAVAINTAGTQVDRGRKEIQTLTCTADGGSFTLTFLGITSPPISFAATAATLQAAIAR
LLNVPLSQIAVSTYTNLCAGIGVAVTFATPDLSTETGNVPNLVPDGSSLTSSGGPGSIVVQEIAPGTYRLDGTEAKGATCGGAYFYQASAGMWSQMAKMLPMDGSEGTSSEFGASVALENTYAVVGAPAAADSVGEAYVYIFNGLTWSFFQKLTCAPYAGTKGDRFGEVVKVSGSTIAISAPGYASNLGAVFVYKLVSGVFLSHEKIQAGDLSAGDRFGSAIALDMAVSTLVVGTERQATATGAVYVYYSRDVYFALQQKLQGSDTRVNDGFGHSVAVVRNVLLVGANANFGATTPLTTRKAVQSIVTSATSPIRAGSTFLVGFRQFSIGFENDYVMSTPIPFDASAVLLQVILQRTLNTGALVVTRLGPDANNGYTWYVTFAGSTAAVTRFAVDGTGLKGSNADVAASVLVAVPPIVRSNTYVFTRTGTFWREQATLRPTNKQYFSLFGHSVALSRNGYHAAVGAPNADTLFTGVNSGAGYVFDLGFLDFQLSASAYSVLEGGTISIPVQRCGPLGLTCTMKSTSVEGFIDLDTGDAVTDRAGTNNVPSKMLKYIGPYQQLAMLDMAAVTSGAKYYPGIWGPEPYPQVPMGRYLLPSWVGTAESRAQFYGSAETRSLWIDSQFDYQGHSDYTPTDVAMAFAVNSITSTALIQTTDDMVFEYPDETINVRLSVPGMWPSYPSQFWSQITILDNGDGGFGTKSYTAILLSSATAPVAHGTAVALLDAFNLAAVGEPGEVHPTTRVACGAVLIYLATSGIWALEATLRPPTCIAGSGFGTSVAIDGSYGTVRLVVGAPSALTPTVFVYVRNSATATWNLETAFTEPAAASTSANYGGSYAVDIFGYNIVVGASGLECTFVYTYTTTGWLPAVVLRANDYATDVVYLQNVVHEFEFGAAVSIGQRSIVVGAPRANYGTSRQLDTTFLGTGAAYVYYLPAQVQTITLNIDVLVTAGQFVLSLGGASTSRLNYAISDVDMTTAIQALIPSVQVTRAGTTETGFTWRVTILSEVTTVPLLVATWRGYGCSTCIAFNTGYTADPGRQVDVTSTAALGTWTFHQRLTAADGNRADRFGAAVDLDGDSIIIGAYGSFSLTTTTWDFETGDLTGWVQTGTAFGSQPTFGENVRARASGYLSSYLKSASGILNFEGRYWVGTYEARPGAGRTQQYTPFSCAFMNDDCKATGYTTPDSSIAGSAQGDGPMGTLTSQPFSILGSAIRFRIGGGCNLATVYVELLVDGLSVRKATGRCRESLHRVAWNVTAFTNRTGQIRIVDDTDSVNWGHINVDDFQFDWPVQQPSTEKAGAAYVFYRSTSTTSYGVCQGVPKLQCAWMLQARLVASDKRDHDMFGFSVGINDALGMAVIGAYGQSIVNLNNSIAGGDDAGSLYLFIKTPALLDGVGSIITPQRWPAFETAKLQAVNKAPNAQFGYALSQSNGRVAVGSPGMQRGIGTAYVLDTQFIQVSFASDEVAVNENDVNGQAIVVLYRAGDTSAPLTIEYGGFVKAMNKVTMLARYATSDLTGAGVDATRFAQCMAMPIQNRIRCGRYQQTSGVATFPVGGTSLAIAVPIMNDWCYAEGQTHVAFHLNPPGGDVILGEQFTLRIRIDDDDFGRTAC\n>UniRef90_A0A1W1Y6B4 EAL domain, c-di-GMP-specific phosphodiesterase class I (Or its enzymatically inactive variant) n=1 Tax=Oscillospiraceae bacterium TaxID=2485925 
RepID=A0A1W1Y6B4_9FIRM\nMTPVGTTYLENYTPAADVLVVAVCVVFVILIRSAYINRTRSFRYLRHMIYMAVVASVSNLIFHGILPRAATLPNILIYLPHLLFHASLYSILWLQVQYLKETVRLTFRENRLYTVLSSSGLVALIVLEIVQPLFGFGFYMGADNTLHREIPAFIFGYVFFVLLMLSMLLKYREMIFRAILVGILSSVSISFLLMLIQEWVGETSYTVFTFLFPIYALLYLAHSNPYDLEIGAVDERAFTDLVAISYEHKDELYLMSLYMHDYDGKGQHYPEELQKMIKHFVYKFFKHPTLFLISGGHMILVVRTSSDPGYLEGAEKMIEEFMKLYSEYKIDYKIVYTKNDVRLAEDNDVVNFIKYLHFDMDENSISKPGDKEIEAYLRYKYIVSELVDINNKHDLNDPRVLVYCQPVLNIKTGKYDTAESLMRLDLPKTGLIYPDEFIYIAERLKYIYTLTQIILNKTCLKIKEMLENGYYIQRISVNFSVYDIREPDFCETVEKIIRDSGVPYDKVAIEITETQNERDFENIKKRIDELKESGVRFYLDDFGTGYSNFERIMELPFDIVKFDRSLVIASGSGNKYKSMVSNLAMMFDNGDYSVLYEGVENDEDEKRCIDMNAKYLQGFKYSKPIPIERLTEYLDKGHED\n>UniRef90_A0A7W3YDD2 Molybdopterin-synthase adenylyltransferase MoeB n=1 Tax=Lysobacter penaei TaxID=2759900 RepID=A0A7W3YDD2_9GAMM\nMEIERIPPAEALRRQRAGTVLVDVRASHERAAGAAEGALGIVRETLEADPTAALPDREAPVMLICQMGGRSLKAAEALRAAGYARVASVEGGTERWRDEGLPLVRDEANADFYERYSRHLRLPEVAEAGQRRLQAARIAMVGAGGLGSPAAFYLAAAGVGTLVLADDDMVDRSNLQRQILHTEARIGTAKVESARIALNALNPSTRVEAFPERITAANVERLLEGADLVIDGADNFPVRYLLNDACVKLGTPLVYGAVHRFEGQASVFDAGRHRGEAPCYRCLFPEPPPAEAAPNCAEAGVLGVLPGLVGLVQATEALKLLLGIGEPLRGRLLQVDALSMRFRETRLGADPDCPVCAPGRPFPGYIDYAAFCAGG\n>UniRef90_A0A8H6JB52 AB hydrolase-1 domain-containing protein n=1 Tax=Colletotrichum sojae TaxID=2175907 RepID=A0A8H6JB52_9PEZI\nMAATKAPRSLGIVLIHGGFHQSTCFALAKSRLEAAGFSPVLGVDLTSVGTNPSVTLDDDARSIQAAIEPHIDAGREFLALAHSYGAGKKGGIRAAIYLTANMPPKKGASALSVLPPGLDIVDVGDDGLVRANAKAKAAFYGPDMSDETADACMAALLPQSSAALFGGASVGLDELTVPAYYILCEKDQTIAPATQQEIIATIPTLRRVLRNPGGHSAFITEVDRFVEQVVEIAEEVEREGEVEA\n>UniRef90_A0A4Q9GHY3 histidine kinase n=1 Tax=Hansschlegelia quercus TaxID=2528245 
RepID=A0A4Q9GHY3_9HYPH\nMTSEPRLRDGSTLRRHDGAVRPLSASERKIEEAAHEIRTPLGGLLALADLLLAEDLTDAARGHAEAMKDAARHLFGVATTLLGGAETGAASLGMSRFLDRTVPPIAARAAVQSLSFQLLRGPGVPERVTADESWLRQIIDNLADNALRATRSGGIELAVDCIGEDANSALVRFAIRDTGPGLGDDPKALFARYAQGDEPGAAGIGLSLVARLAHRMSGRLEAANRPEGGAEVAAVVRLATQSEPVRHAGAQLKILIAEDNIVNQRVVATILNQFGHDYDIVGDGEAAVAAASTGAYDLVLMDAAMPHLDGLRATRRIRSMDTPAADVRIVGVTARAFAHEIADFIAAGADAVVTKPISIAELWRVIGADVRKAG\n>UniRef90_A0A429S8T5 PLP-dependent aminotransferase family protein n=2 Tax=unclassified Streptomyces TaxID=2593676 RepID=A0A429S8T5_9ACTN\nMANGRVVHTADRTIGSRQLAALLPPPVLARPGYRALAEAIRTLILDGRVALHIRLPAERELAECLGAGRATVTGAYDLLRESGYARSRRGSGTFTELPDGHRPVGAHALLGAGGSGGFLPDGDPGIDLAIAAMGAPDGALAEALAQAAPRLPAAARTPGYLPFGLPDLRAAVAERFTRRGLPTRPEQILVTAGAQQALTLVVSLLCRAGDRVVTENPTYANALDALRHARLRTAPVAVTDAGWDLEIAESTLRQTVPRLAYVIPDFQNPTGALMPEDQRLALLAATRRTGTWLVVDETLADIALDVPAPAPLAALAARGGADHVVTIGSLSKTHWGGLRVGWVRATAKLVAELTAVRAATDMTGSVLDQLVALPLLDGLERTLPARLEQLRVQRAALIEALQRHTPEWSWTVPPGGLSLWVDLGEPVSSALAERAAAAGVHIGRGARFGVDPGTFEHRLRIPYTLPPERLDEGVRRLAAAFHDGVPLAPAVDRPHWVA\n>UniRef90_UPI001F223AC7 type VII secretion system-associated protein n=1 Tax=Streptomyces sp. 
GQFP TaxID=2907545 RepID=UPI001F223AC7\nMADFSHTDKQSIQTFIDGDLASFIGDLKKILAGDPSMKDFENGVYTDRTAGAIEKGKPIMMGRIDRNDLMTGTSFTDALSTSISTVVDVLTAQQDTFDEIDEGLRTTLHELFKTQGDNLGNISAEEFSTSMSDSGFDDSSSSGDSTGDNGSDSTDGESA\n>UniRef90_A0A4S4FJ12 4-aminobutyrate--2-oxoglutarate transaminase n=1 Tax=Glaciibacter flavus TaxID=2565934 RepID=A0A4S4FJ12_9MICO\nMTTIDAPARTVGGPDIVQERRLVTSIPGPLSRALMTRKTDAVAAGVGATLPVFAAAAGGGVVVDVDGNSLIDLGSGIAVTGVGNSHPRVVEAVKAQLDAFTHTCFTITPYESYVAVAEALNRLTPGDHLKRSALFNSGAEAVENAVKIARHHTGRQAVVAFDHAYHGRTNLTMGLTAKNQPYKNGFGPFAPEIYRAPLSYPFRDGGIDGVTAARTAILQIEKQIGAENLAALIIEPIQGEGGFIVPAAGFLPTLLEWSRANGVVFIADEVQSGFGRTGAWFASEHEGIVPDLVVTAKGIAGGLPLSAVTGRADIMDAAQVGGLGGTYGGNPLACVAALAAIESYASEGLIERAGDIGRLLIDRLTALQASDPRIGDVRGRGAMIAIELVDPETDAPDAALTARVASAAHAQGVIVLTCGTYGNVIRFLPPLTIGDDLLTEGLDVIAEALATA\n>UniRef90_A0A7W5AC37 glutamate dehydrogenase n=5 Tax=Actinoplanes TaxID=1865 RepID=A0A7W5AC37_9ACTN\nMAVADEAATDSDQTVLDDVPNAERLVAQAVEQAGDDHTTASLVGRFWRFAPDEELVGYTPQEMFAAAAEHRELARNRLPGELKLAITEPSGSQSHSVLRIVTDDMPFLVDSVIALLNAHNLQVYLTVHPLIVVRREPLGALAQLEAEVEPDDAIEGDLVESWIRIEIDPVRRPEAREQLLNEVRRVLTDVRDAVEDWPRMRQRALVISDELAAARGSKNPSPVPDKDLTDSIELLKWLANDHFTFLGYREYRLDDGVLSAVPGTGLGILRGASKPRRLAEEMAPEIYERAMEKRLLVITKANSRASVHRSAYLDYIGVKLFNEAGEVVGERRFLGLFSSSAYRTSVRELPVVRRKVQEVMDRSGLSPRGHSGKDLLQILETYPRDELFQIKTDDLYEAVIGVLRMAGRRQLRLFLRRDGYGRFISCLIYLPRDRFTTGNRLRMQEILLRELNGVGVDYTTRVTERMLARVHFIVRTDPAAPPGQLDPNELAERLADATRMWDDDFSLVLERKLGDEQARRLFQRYSAAYPESYKNTHTPYEGMQDLAKLELLEEPGQLAMHLFRRRRLGADGTPQPDERDVRFKVYRYGEPMMLSAVLPVLHSLGVRVTDERPYEIRRPDGTIYLYDFGLLPPAGHRELAEVRPQVENAFAAAWRGETEVDGFNELVLRAGLTWRQVVVLRAYAKYLRQAGNVFTQQYVESTFTAYPEIAGLLVRLFEVRFSPALPIGEAERTRRAGELRGRITELLDQVESLDQDRILRSYLTLIEATLRTSFYQRGAEGRPKSYVAFKLDPQAIPELPQPRPKFEIFVYSPRFEGVHLRFGAVARGGLRWSDRREDFRTEVLGLVKAQMVKNSVIVPVGAKGGFVLKQKPGDRDEAVECYKRFITALLDVTDNILSGKIVPPEDVVRHDGDDPYLVVAADKGTATFSDIANEISVRKDFWMGDAFASGGSAGYDHKKMGITARGAWESVKKHFRDLGTDTQSEDFTVVGVGDMSGDVFGNGMLLSQHIRLVAAFDHRHIFLDPDPDSSISYAERRRLFDLPRSSWADYDASLISEGGGVYPRSAKSIPVSPQVRAALGLGEASTISPAELMRAILKAPVDLLFNGGIGTY
VKGAAESHAEVGDKGNDAIRINGSELRVKVVGEGGNLGLTQRGRIEFARAGGRVFTDFIDNSAGVDCSDHEVNIKILLGGAVVDGELSLPERDDLLAAMTGEVGELVLRDNYEQAMALGNARSQAHSLLPVHRRQLKSLEERGELNRELEALPSDLELAARYENGQGLTPPEFAVLLAYVKISLEREVLTDELVDEAWTTDVLSGYFPTPLRERFAGRMAGHRLRREIISTALVNEVVNRGGTSFVYRAMEESGASAADVIRAYVVVRDVFGLEEIWAAGEALDNRVPTSAQTLVFLETRRLLDRAVRWLVSTRRSPLDVPGEIAKLRPGISALLPLLPEVIVGAERRALFDRIAELVAKDVPEDLAAAVSRVFYGFGLLDVLETAAAIDRDAEEVAQVYFVLSERFGVDALLSHISRLPRGDRWQTLARMALRYDLYAALAALTAEVLHSTPSSAPPEDRVSEWEQVNAASIARASNAMGDVDDSPADLAALSVLLRQIRTLVKTSSAG\n>UniRef90_A0A2E6Q8T7 Oxidoreductase n=1 Tax=Rhodospirillaceae bacterium TaxID=1898112 RepID=A0A2E6Q8T7_9PROT\nMSVPLFTPIELGNVTLANRIVVSPMCQYSAVEGSATDWHLMHLGNYALSGAGLLIHEATAVVAEGRISHSCLGLYSDKNESALARVLEFCRGISDIPLGIQLAHAGRKGSCERPWEGRGPLSGENAWQTDAPSALAMADNWPTPNAVSIEEMKAIKAAFVTATERAIALDYDLIELHCAHGYLLHEFLSPLANAREDDYGGNLANRMRYPLEVFEAVRAAWPEGKPLGVRISATDFAEGGWEIADSVVLSDALKGLGCDYVTCSGGGVTFDQTIELEPGYQMPGAEAVKRETGMPVMAVGMIRDPKFANTAIADGKTDMVALARGFLYEPRWPWRAAYELGVDAAYPPQFERAAPSAWPEAFPDQSD\n>UniRef90_A0A5F7ZVD1 Secreted protein n=1 Tax=Macaca mulatta TaxID=9544 RepID=A0A5F7ZVD1_MACMU\nLPEAASLQSSHFYSVPCHNPTVHALCPNIHFLFFLFLLRLSFALVAQAGVQWHDLGSPQPPPPGFKRFSCLSRLSSWNYRHAPLHTPNFVFLVETGGFSMLVRLSRNSHVRRVGRSLFTDEEGNCSSESMTVWLR\n>UniRef90_A0A5B9Q9U5 Glyco_hyd_65N_2 domain-containing protein n=1 Tax=Bythopirellula goksoeyrii TaxID=1400387 
RepID=A0A5B9Q9U5_9BACT\nMKIHLWEIVLFLLAISVANSVARESESELVWFDRPATHFTESSPLGNGRLGAMIYGGTIDETVVLNESGMWSGSTQEADRLGAAEFLPEIRRLLFLGKNVAAEKLMNEEFTCTGQGSGHGSAAELPYGSYQTLCKLQIKFLQNETAPSVQNYRRELDLHDAVVRIEYSRNGVDYLREAFVSFPDQVFLYRFTANKKNSLSFDVSLSRSERSNTKNVGKDELQIEGQLDDGKEGETGVGFCSRVRVLHDGGMVTTQDGTLKVRSANSVVLLVSAATDLEALVSQVDEDIYKATEVVLDRAAAKPFADLLKDHISDYQNYYNRVGLRLAPTRIDSRSKLPTEERLHANWRDTQDNSLAALYFNFGRYLLISSSRPGGRPANLQGIWASEIQTPWNGDWHANINVQMNYWPAEVCNLAELHEPLFRLIESLVEPGSQTAQIYYNARGWVSHVLANPWGFTSPAERVSWGSTNTCSAWLCQHLWEHYLFTQDREFLLSVYPIMKEAAQFYLDTLVEHPTQEWFVTAPSTSPENRFLLPNGEEASICIGATMDMQILRSFLYACREAANELDCDEVFRTQLSDVIGRLAPTRIASDGRIMEWDQEYPEKDPEHRHVSHLWGLYPGDEISNSQTPELAAAARKSLNVRGDSGTGWGLANKIAMWARLHDGDRAHRLLQQHLHPVTHGQRKQQWSGGTYPNLFDAHPPFQIDGNFGATAAIAEMLVQSSISDIDNIKHVNIELLPALPTAWPEGEVRGLCTRGGFEIALNWKDGKLGDVEIHSRHGLPLQLRYKSQEVTLTPARGEKVHFDGDLKLLSTPKSAVVPPSGSNK\n>UniRef90_A0A417XX54 SCP_3 domain-containing protein n=1 Tax=Nocardioides immobilis TaxID=2049295 RepID=A0A417XX54_9ACTN\nMPSRLRPADPVDVSRALAGVSGGTADRAELRLLTKHFLALLEERAPGRSVEVRVPPFAAVQVIEGVRHTRGTPPAVIETDAETWVALATGELAWADALASGRAQASGERTDLSPYLPLG\n>UniRef90_A0A512JR32 Fusaric acid transporter n=1 Tax=Methylobacterium gnaphalii TaxID=1010610 RepID=A0A512JR32_9HYPH\nMTLPGWRDWVFAIKTFGAAILAMYLAMWIDLPRPYWALGTVFITSQVLAGATRSKAIYRVCGTLLGAVVSVILVPNLANAPELLTIAIALWVAVCLYFSLLDRTPRSYLMMLGGYTAALIGFPAVGDPGTMFDTAVARAEEITLGILCASLANTVVLPQSVAPLIAGRLDHWLTDARGWIVSVLSHTSNAGDTQSKRLKLASDAIAFDALATPLRYDMSGAERSAEAMATLRQHMLMFLPIVSALSDRIEVMRRAGTMPSRLETLLDDVAAWLAAGRIDEIEAQGLRSRADALCPPMSQQASWTDLVLASLLARLNNFIDLRQDARLLQRHILDGTLTTERLAFSYTAAARTIRHRDHGMALLSAIGVFLSVLLSCTIWIATGWPDGAGAPMMAAVGCCFFAAQDDPAPSIVGFANSAIIGGIASAIYLFAVLPLATNFEMLTLALAPALLTCGVFMTQPKTAPIAMGAAVNGSAMIALQGSYTGDFAAFANSSIAVIAGMWVAALVTRLVRSVGAGWAAHRLRSVNRRSLAQAAERQGAQNGLELAAIMLDRVGLIAPRLTSLPPGDAEWTADLLAEVRVGINVVELRRNRRALSNEARKAVEALLAALARHFHAKALIPPTGLLADIDAALDAVIADRLHAARGVALMGLVGVRRALFPEAPDYKARRTATSEPGWAA\n>UniRef90_A0A3D3L9U4 Heat-shock protein Hsp20 n=2 Tax=Verrucomicrobiales bacterium TaxID=2026801 
RepID=A0A3D3L9U4_9BACT\nMKITRFNPSLNLGRVADFDQWLRNPFAAFPLMGQLLGDFAPAFTSGRPATDVHEDKDNYYACFELPGVKKEDLKVEIHDRLLNVSAERKEKNGEQESSLTLCRSISVPEGVNAEGISARLEDGILVVTLPKQEHRKPKLIEIA\n>UniRef90_M4NI99 Dipeptidyl aminopeptidase/acylaminoacyl peptidase n=11 Tax=Rhodanobacteraceae TaxID=1775411 RepID=M4NI99_9GAMM\nMSSKTGSSRVLGALVMGALSAGVAAQARTLSADDYARAERFMSYNTVPLVDHAVPKVEWLDDGHFWYVDHDAAGDHFVRMDAASGKTAPLFDQAKLAVALGKAGGKPVDAKKLPVTGYEARPDGRVDIAVRGKHYVCDLAAVEASCVDRTALVKTGKEPGALSPDKQSEAFIRDWNLWLRDVASGKETQLTTDGVENFGYATDNAGWKHTDNAIVEWSPDSKRIATFQQDQRKTGEMYLVSTNLGHPKLEQWKYPLVGDKDVTMIERVIVDVAAKKVLRLQMPPDQHRSTLCDDVSCGPDGGWDDVKWAADGKTLAFVSTSRDHRHEWFRIADANTGKVRTVFEEVVPTYYESGNGAVNWRYLPETNEAIWFSERNNWGNLYLYDLTSGKLKRAITKGEGNVTELLKVDPKTRTVWFRGVGRTAGVNPYYQQFFKVSLDGGKPVLLTPEAADHTVTLSPDGRAFVDAYSTPTTPPVIVLRASDDGRKVASVATADIARLKAAGWVPPIPFTVKGRDGKTDLYGMMFKPTHFDPSKKYPIIDYIYPGPQTGSVRGRSFSAARADHQAMAELGFIVVAIDGMGTPWRSKAFHDAYFEHVEDNTLPDQVAGLKELGKQYPWIDLDRVGIWGHSGGGNATAAAMFHYPDFFKVGWAESGNHDNRNYEDDWAEKWQGLLVTNKDGKTNYDAQANQSFAKNLKGRLMLVHGTMDDNVPPYQTLLVADALIKANKDFDLLLIPNVHHGYAEATPYATRRRWDYFVQYLAGNTPPHEYQLKAWPWR\n>UniRef90_A0A1B7P3P8 UDP-N-acetylglucosamine transferase subunit ALG13 (Fragment) n=1 Tax=Emergomyces africanus TaxID=1955775 RepID=A0A1B7P3P8_9EURO\nMDSSKRARKLCFVTVGATAPFNALVLEVLGEPFLEALRINNYTDLRIQHGQMGESTFQEFKLQNGTMAKEKYGLDITGFDFNLAGLKNEMLDVKADVDANKAEGFIVSHAGSGTILEVLRLGIPLMVVPNPQLLHNHQDELAKQLAVSGYVIHGKL\n>UniRef90_A0A2T5J629 Type I site-specific deoxyribonuclease n=1 Tax=Mucilaginibacter yixingensis TaxID=1295612 
RepID=A0A2T5J629_9SPHI\nMNEHEFQTYVAQIIGQLFPTLQEGQIEQEHAFSLKFGHHAVVIDGKEPGKYAKSAIYDILLKFQGKPFALLELKKPGNGIEPEDIRQGVSYARLTQPICPLTILTDGTTTQLINTFDGEPFKEEAMDIQFIENLFRQGLLLSANSLKNAISTLLEADHRVIFDVINTISHNAFEQLRGDPEDISKPIMRDFKVARSAERKIWDQLEKTPGVFLTGEPFVGKTNLLYQLFETAKNAGQALLYINAADQNYNIFRRLSNFITMRMRYPVTEERVKEWLLLSSNRSPQDRLVVVYDHFRHDTDEHLKADIAELFDVFEADNNRVILATDNANYDLLTTTAGRTTTNFYRERFARIRLKTFSSKEFELANQLLYDRYGGMVLPGGIFAGEYRNPRVWRLIAKAIRAERTQATALGIIEAVPSFQFLQLISNHWHFDAQTRQDFKALSVAFMESMPLRNEQGDLKLMALNLPVIAEQELKKHLENEVIERLKLAGLLERRLLPDDRWVFLPKLPELIAKNAGEHLKARFQPLLLADFHQHYPEFLEAYQYLPFGEIIAAQTIVHWGYQQELDLFSAFIRKLQSDKPEIETATGGGLVRLYLPEKGHITLPIEPGEEQKYIGNLFPYLILSHLVTLQFVDDSQHPDMERARCIAAVGQTNFQVRSLNVNTFYEPMPTNHEVGNIGNITHSGIGIVEPIVQAMQANIIQSPQVIDILFRHALEKKYYRLLHRIYIAARYSDGLGSPESDALCESIQARYMDHFNKMMAFAIADKGATRSERRKIEKGLRKRDRKQKK\n>UniRef90_A0A841IL00 Beta-N-acetylhexosaminidase n=1 Tax=Nocardiopsis algeriensis TaxID=1478215 RepID=A0A841IL00_9ACTN\nMRLPAPYALACVGLALSTAACTLLGEVNPSEEDGGSPTEESFEPVLAPRLLEEMDLGDKIGQLMVLTAQGTTAAENAALIETYRPGGLIYFDANLTGAEQIASLSAGVQEIAAEQGAGVPLFLGIDQEQGLVARLPVGTSFPDAMAVGATGDTGQAVLRATTTAAELNALGINLNYAPVADVNTDPDNPVIGIRSFGSDPALVSEMAVAEAGAYAEAGIVPVVKHFPGHGDTDVDSHTGLPVIDMPRDEWEAEHLPPFRAAVDAGVDAVMTAHVIMPQLDAGTDPATLSPAIIDGILRGELGYDGVVTTDALNMEGVRQDHTDGEIAVRALEAGVDQLLMLPDPAAAVAAITEAVEQDRLTEERIDESVLRVLVLKERRGVLEADPVDPAAAEAALSDPAHAEAAQTVADASATLVRNESGLLPLAAGARVRVEGTGADRLAGALAEAGLEVVTEGADAVVVGTNGARGSAEQSAPVEAARAQGLPVVVVAQGGPYDLEAFPGVEGFIAVYSSVDVSLAAAAGVVAGEVEPTGTLPVDIPGADVAAGTGLGF\n>UniRef90_A0A5C6Q7Q0 OmpA family protein n=1 Tax=Colwellia sp. 
C1TZA3 TaxID=2508879 RepID=A0A5C6Q7Q0_9GAMM\nMNYIMTILLTLAISGCSIQIQEMTPEPTVQKADLADIEADGIINARDQCQDSFVGASVANNGCGSDRIEELKHKLQVNFIPNSYTVEWRFLSEIKKLAEFMKDNPRAKLTIEGHTSKRGTKVLNQILSQNRAQAIQNILVNKFMVEQARITAIGYGFDRLLLAGDDEYIHARNRRIVAKLSREKLLTDMKWTIYSVDQAEE\n>UniRef90_M3I5W0 Oxidoreductase, short chain dehydrogenase/reductase family protein n=2 Tax=Leptospira interrogans TaxID=173 RepID=M3I5W0_LEPIR\nMASFNSSGKMNAFVIKHDVTNFDQVETVFQKAIKSMKGLDEIYYASGVMHNIKPDEFDVEKDISMLNTNLLGCVAWLNPAANLFQKQKSGKIIGISSIAGDRGRRGNPVYNTSKAGMNTYLEALRNRLSVLGVQVLTVKPGFIDTAMTKGMKGLFWLISAKEAAEIILKAADSGKENIYVPARWGLVGLIIRCIPSFIFRRLSI\n>UniRef90_A0A3E0HEB5 Serine/threonine protein phosphatase PrpC n=1 Tax=Kutzneria buriramensis TaxID=1045776 RepID=A0A3E0HEB5_9PSEU\nMSTAHDLTYGRRAAVATRRGVRDHNMDAPALFQASTGVVVAAVVDGIGNDPDGAATMHLIAETAVRIGATKGALAGVLAGAALVEDPGVENHMPDGVIVLALAVPGRPTHLAWVGDSHAYSWDGDTLSRRTDPHTMGAYLRGNGAVDLAPLHDSWVRVTLTSATVTNVAVSSIPANELVVLVSDGLDTLPHDELEALVREHQDNPDTLADAIVAAARETEDGYRDDATAIVLTTAG\n>UniRef90_A0A6A5YPJ8 TauD domain-containing protein n=1 Tax=Lophiotrema nucula TaxID=690887 RepID=A0A6A5YPJ8_9PLEO\nMAPIALPIVESIKETDTVQPKKDSLALPEPARKRLEDAGIDLSSGYPYRPAKPLYLDDVYNIRNEEREFVDAGSRADPEKKALLSAAKEVIHLTGHIGTEIVGLQLKDLTDQQKDELALLIAERSVVFFRDQDITPQQQKALGEYYGEIEIHVRIQPQVPSVPGVPGTTVIWPALQATEFAASFRQTGGASRWHTDLVHERQPAGITHLHNDTIPSLGGDTLWASGYSAYEKLSPDFRKIIDGKEAVYRSAHPYLDRKNPTAGPKFIERTHPLVRVHPATGWKALWVNRAMTVRIVGLDKAESDLILGYLYDVYERNVDIQVRFKWTQGTSALWDNRITIHNASWDYEGKEPRHGTRVTSLAEKPYFKADAPTRRQALGLAGPGDI\n>UniRef90_A0A285NT28 Acetoin utilization deacetylase AcuC n=1 Tax=Natronoarchaeum philippinense TaxID=558529 RepID=A0A285NT28_NATPI\nMRFGYSETCLDHDTGDRHPETPDRLRAIKEGLKRKHGVEYVEADSADVETVAAIHDREYVEEVREFCADGGGNWDPDTVAVEGTWDAVLQSAGLSAWAAERAMDGDSGRETPFALGRPPGHHAVVDDAMGFCFVNNVAVAAQHALDDTAAESVAIVDWDVHHGNGTQDIFYERDDVLFCSTHEEGIYPGTGGSGETGTGDGEGTTLNLPMPAGAGDADFAAAFERVVEPAVESFDPDLLLVSAGFDAHRHDPISRLRVSTDGYGVLTGRLRDLADETDTALGFVLEGGYGLDVLAEGVAMVHEVFDGLDPVQPDDDVDDDVEELLTGLRSRHPLLVGN\n>UniRef90_A0A1A8J6Y5 Ectonucleoside triphosphate 
diphosphohydrolase 5b (Fragment) n=1 Tax=Nothobranchius kuhntae TaxID=321403 RepID=A0A1A8J6Y5_NOTKU\nMKPTVLLLLLVLLAVSGPSRAQVRSSHLDLPRILPSLSRPANHSRIFYAVMFDAGSTGTRIHVYTFIQNGSEKLPVLDNEMFHSTKPGLSAYADSPETAGETVRRLLKVAKKAVPRLDWKRTPLVLMATAGLRLLPVEKAQALLDQVKGFTRHCRDPRWGCFYK\n>UniRef90_UPI000DD31245 peptidylprolyl isomerase n=1 Tax=Paraliobacillus TaxID=200903 RepID=UPI000DD31245\nMKKLAIAATIAAGMITLSACSSDDSETVVETASGNITQEAFYEELKELSGSTVLEQMVTQTILEDNYEVDEDQLDEQLQVYKDQYGDQWETILTSSGYADEEAFREDLKLQLLQQEALIEDIEVTDEEIEQRYERMQTEIEASHILVADEETAIDIKAQLDDGADFATLAEENSTDTASAAEGGSLGYFTAGDMVAEFEEAAYSMEVDAISDPVETTNGWHIIQVTDKRDAEEAPEPLEDIRDDIRDEIALTKVDDTAAQEKLDQLMEDADIDVKIEEFEDLFTAEEETATE\n>UniRef90_A0A6P0X9G7 AI-2E family transporter n=1 Tax=Okeania sp. SIO2D1 TaxID=2607792 RepID=A0A6P0X9G7_9CYAN\nMQQILNQLKKWGEKYLHFDLISLFLIGYATAIILSIDNYIIRILTFFPLLLLLLVDLVILLFAPEKLREIYSKTTLFICTLTAALLLVWII\n>UniRef90_UPI001B3ACF38 ribonuclease P protein subunit p14 isoform X1 n=1 Tax=Toxotes jaculatrix TaxID=941984 RepID=UPI001B3ACF38\nMSFIWRSVFNKPRLCLSSIAAALPPCRLLHVGQRASLTKAFSSHDVELFAKLTGDNNPLHLDPVYASSTSFEAPIVHGVLINGLISAVLGTKMPGPGCVFLHQEIRFPGPLYVGEEVLAEAEVLKIKMSFALITVKCSVKDKVVMEGEVMVMMPEDQQKRG\n>UniRef90_A0A1M7FK69 Uncharacterized protein n=2 Tax=Flavobacterium TaxID=237 RepID=A0A1M7FK69_9FLAO\nMNTYADNNKENKKQQTPSAIHKKDNRDTALPVTDSHLSSVAAQLQLQEIANNSPQVKQAFQLQAIANAHAALPIQKKDLITTQSVFQLQKLERGKLNVVGEHHSESNQRRGQEIDIAEREVGGEYWTENNFRIRETKSPGENAVRDTTGDPRILGDALYLRIVESIQYVYEAKNNFEKEWKHWTTQNLNKEELPILKGELQPLLVICKNHTLEANKLAKAYMYNEEFKTLPEFVSDQIVQMYKLLPETEKLFLILVETWKSYTLEQLILKKFLSSFNVFGSNIDILNIYAAQIGGASRTDTSKLRSYEMDNAADFAHDRIGVWKIGFDHVKDIKEDMQHNDTKNYILINREEFNHEYKELPILVEDQMVKQK\n>UniRef90_UPI001FB4782B PTS system mannose/fructose/sorbose family transporter subunit IID n=1 Tax=Coprobacillus cateniformis TaxID=100884 RepID=UPI001FB4782B\nMGALIPSVVNAKFAYTFTQGEVSIAVQELADKIMPSLAPCLVVLLTYWLLGRKKMNSTRVTLLLVVLGILAFNLMIFA\n>UniRef90_A0A2T6FJL9 tRNA (guanine-N(7)-)-methyltransferase n=4 Tax=Cellvibrio TaxID=10 
RepID=A0A2T6FJL9_9GAMM\nMKPEFKPKSIRSFVIRAGRITVGQKNAFDKYWPGMGLSLFNGAINPDVVFGRQAPLVIEIGFGMGDSLLEMAANEPDKNFIGIEVHPPGVGRLISTASQQGLSNLRVYMADAMDVLEDCIPDGSIDRLQLYFPDPWHKKKHHKRRIVQPAFIQKLRPKLKMDGVLHMATDWQPYAEHMLEVMNSATGFATDFTETGFAPRPDYRPVTKFEKRGERLGHGVWDLLFKKTA\n>UniRef90_UPI0012F6EEC0 DUF927 domain-containing protein n=1 Tax=Methylobacterium sp. WSM2598 TaxID=398261 RepID=UPI0012F6EEC0\nMSEALFATEMQRLDEAGVEEPSEVRANQERHGGIRWPKGFRMRADGLWYEPEGDEEAMRVSGPFRVPGLARDPAGSGWAVTIEWKDRDDRPHRGFVSYADLVGDGVDWLRPLAAAGLPVTIGTKALRLLKRALYELECTARVRLIRRSGWYRGAFVLPERTIGSAPGEEAVFEGRLDAARYASAGTLEQWVDAVAAPAAGNSRLLLALAVAFAGPVADLLEDEGGGVNLKGASSVGKSTLLVAAGSVWGGGARAGFTQTWRATGNGLEGVAKAHSGTVLILDELGELEAREAGSTAYLLVNGLGKARATRDAELRARHEWRVMLLSAGEVGLADKITEGGKRARAGQLVRLVDVTADAGRGLGIFDDTKGMEPAPFSNMIKSAALKVYGTAGVGFVSGLANDPDRYAAAARRRIAEVSRNLLVGLPEADGQATRAAHRFALIAVAGEMARAVLNLPWAEGEVDGAIKTCFDAWRATRGGDGPGELVAALEAIRSAIERHGEARFRNLDQHDGGAAPIRELLGYRQSRDGDVIYAFTATGWAETLAGTADPKSIVKMLFERGVLFAGRDRTHRHFVKFHGQPIGTYAVRASAVLDTEAA\n>UniRef90_A0A7Y9LCB2 DUF2264 domain-containing protein n=2 Tax=Microlunatus parietis TaxID=682979 RepID=A0A7Y9LCB2_9ACTN\nMSKPGESWTRDDLVQFTDRSLLALRRWATPGRARFDLPGPRVGSGPERDGLEAFARSFLAVGFRLSAAEIDSHDHAGWYAAGLAAGTDPESPEFWPSLRELPQARVEAAAIAIALHESRRWIWDALTPAVKQRVIDWLSGSVGIAYPDNNWRWFQNVTQAFLRSVGGPYDQAELDENLTFLDDCYLGDGWYSDGRPDRRTGNVDWYVGWVMHLFSLWYCRMSEGEPGIAELQARYAERLRPYLTDAADLFGADGAPLHQGRSLVYRHAVVGALWTGAVFDANPLPLGRLRRTALGAIRFFAERGAFDEDGLLSLGWLGRFEPMRQPYSGPGSPYWASLGLAGLVLPESHPVWAEPEQPTPIETGDVVRPIRPIGWLVSGTADDGIVRVINHGVDHSTATPAPENPYYNRYGYSSVTGPVPAPAGTADGAVDQQVALIDPDGRWSQRPMIERVAVDDHRASSRQRARFARTEPEQGFDDGPELTCVSLVRGSVEVRAVRFDDHDQASAALVISGYAVPRKPAEGARTGLHSAVTALTEGGSSGSSVHPVANAFGADLEVPWCRFEHPEPGRWYVIALCLGEREPAWPTLADTPSGPVITWPDGTTDPL\n>UniRef90_A0A0S6VXT7 FGE-sulfatase domain-containing protein n=1 Tax=Candidatus Moduliflexus flocculans TaxID=1499966 
RepID=A0A0S6VXT7_9BACT\nMSNTTQTRIREKIIMIGISLFILISLGITWFVLYAIIAIKRQNAHRSAILEGLGFSPVANPPAAFVEYITTLHHHVKTSKPRLKLDHVFQQRIGNADVYLFELIDNGSEHSKHYEVVAYVSPSLRLPRFLLNPVLPTKEAKPDENSAIFKVLNSMFRYNHKVEFPDVPEFEERYTLSITDEQDDSEIQNTFTPPVTAGLLNSPSQYSMLGWGDTITERSRLKITTKTTIEEAKAMLEDILSLFLLFENQGASSTVNVRALDSSLSRNLAGKNEIPAALKTFEKSVKIIAALFAISFLLTGASFIFKAVSFQKEQAASQEEAVHEMPAPPIATPTPAPELPPKLPELTGFACAETNGHLECVEPLTGMILVNIPVAQSDMCGAKTEYWLGKYEVTQEEWEKLMGTNPSFFNRSKLGDGYKRHPVEQVSWDDAQAFLQVLNSRYKDKGVKFDVPSTAQYQRGCQAGMNAEWPYGTRDATQLDAYAYHNGNALGSSHIVGEKAGNAFGLYDIIGNIYEWSRDTNFTLKMTDGNAEFIPDKDGRKDLLGGSWKTDPDSQRCTMIPAELPAARRNDVGFRVAVEPVAP\n>UniRef90_A0A7Y4V1B9 Transposase n=4 Tax=Mycobacteriaceae TaxID=1762 RepID=A0A7Y4V1B9_MYCFO\nMQRPIEPAQYLSLAYTDRLIELGIAPSVGSRGDSYDNALAEAVNAAYKTELINRGKPWRGVDDVELATAEWMAWYNQERLHEALGYVPPAEYEAALKGASHPASQPTPALVPN\n>UniRef90_UPI001490A0B5 MlaD family protein n=1 Tax=Muricauda amphidinii TaxID=2735167 RepID=UPI001490A0B5\nMKLTREVKTGIIVLAGIVALIFGLNYLKSSPFFENNKTFYAVYSHVGGLQPGTQVSINGLNVGNVQSIRFLDSSGKLVVTFTVGKDFDFSKNSVAELYDTGIIGGKGIQINPVFDKAPNAQSGDTLTSNIKPGITELVQQKLTPLQMKVEGAVSHADTLLMNVNEILDEPTKRDLKLAIGTLNEVVTSFKGSADKLNLLLENNKEQLDSSLKNVDNITSNFSKLSDSLANAGLAQTVSDFQTTVESLNTILSKIEKGEGTLGKLTHDEELYNNLSEVSRELDLLLQDFRLNPKRYVNVSVFGKKQKDYELPENDPAQKQD\n>UniRef90_UPI001BCFD6CE universal stress protein n=2 Tax=Roseibium polysiphoniae TaxID=2571221 RepID=UPI001BCFD6CE\nMSFKTILAVAEFTEDVKSRLKSAVDLARTQDAHLAVLLVGEVPSLPFYGYGGAGYTKVWMEEGEERAAALKAVQEDVEAALAKEGISFDVRAHQAIVAREDNLVARHAIYSDLALILRSGDGELNTVERQAIDGALFDSGRPLLFLPKPDVPQTVGQNILVAWNSRAEAAEALSDAMPFLVGAGKVTLLLVDPVSGPDDHGESPGADMALVLARHDVEVEVRQVSSNGSSIAEVLNREAKTLGADLIVMGAYGHSRMRQTILGGTTREMLEETACPLFLAH\n>UniRef90_A0A6B0S860 PAN2-PAN3 deadenylation complex catalytic subunit PAN2 n=2 Tax=Bovinae TaxID=27592 
RepID=A0A6B0S860_9CETA\nMNFEGLDPGLAEYAPAMHSALDPVLDAHLNPSLLQNVELDPEGVALEALPVQESVHIMEGVYSELHSVVAEVGVPVSVSHFDLHEEMLWVGSHGGHATSFFGPTLERYSSFQVNGSDDIRQIQSLENGILFLTKNNLKYMARGGLIIFDYLLDESEDMHSLLLTDSSTLLIGGLQNHILEIDLNTVQETQKYTVETPGVTIMRQTNRFFFCGHTSGKVSLRDLRTFKVEHEFDAFSGSLSDFDVHGNLLATCGFSSRLTGLACDRFLKVYDLRMMRAITPLQVHVDPAFLRFIPTYTSRLAIISQSGQCQFCEPTGLANPADIFHVNPVGPLLMTFDVSASKQALAFGDSEGCVHLWTDSPEPSFNPYSRETEFALPCLVDSLPPLDWSQDLLPLSLIPVPLTTDTLLSDWPAANSAPAPRLRAPPVDAEILRTMKKVGFIGYAPNPRTRLRNQIPYRLKESDSEFDSFSQVTESPIGREEEPHLHMVSKKYRKVTIKYSKLGLEDFDFKHYNKTLFAGLEPHIPNAYCNCMIQVLYFLEPVRCLIQNHLCQKEFCLACELGFLFHMLDLSRGDPCQGSNFLRAFRTIPEASALGLILADSDEASGKGNLARLIQRWNRFILTQLHQDLQELEVPQAYRGAGGSSFCSSGDSVIGQLFSCEMENCSLCRCGSETVRASSTLLFTLSYPEGSNSDKTGKNCDFAQVLKRSICLEQNTQAWCDNCEKYQPTIQTRNIRHLPDILVINCEVNSLKEADFWRMQAEVAFKMAIKKHSGEISKNKEFALADWKELGSPEGILMCPSIEELKNVWLPFSIQMKMTKNKGLDVCNWTDGDEMQWGPARAEEEHGVYVYDLMATVVHILDSRTGGSLVAHIKVGETYHQRKEGVTHQQWYLFNDFLIEPIDKHEAVQFDMNWKVPAILYYIKRNLNSKYNLNIKNPIEASVLLAEASLARKQRKTHTTFIPLMLNEMPQVGDLVGLDAEFVTLNEEEAELRSDGTKSTIKPSQMSVARITCVRGQGPNEGIPFIDDYISTQEQVVDYLTQYSGIKPGDLDAKISSKHLTTLKSTYLKLRFLIDIGVKFVGHGLQKDFRVINLMVPKDQVLDTVYLFHMPRKRMISLRFLAWYFLDLKIQGETHDSIEDARTALQLYRKYLELSKNGTEPESFHKVLKSLYEKGRKMDWKVPEPEGQTSPKTCRALVDELEWEIAQVDPKKTIQMGSFRINPDGSQSVVEVPYARSEAHLTELLEEVCDRMKEYGEQIDPSTHRKNYVRVVGRNGKSSELDLQGIRIDSDISGTLKFACESIVEEYEDELIEFFSREADNVKDKLCSKRTDPRVRPPWLYSLRPPGYSELRRTPARLKGALRLAGRLLRLELPGLCAFRPTAGENLKDILADLIPKEQTRVKAFRQQHGKTVVGQITVDMMYGGMRGMKGLVYETSVLDPDEGIRFRGYSIPECQKLLPKAKGGEEPLPEGLFWLLVTGQIPTEEQVSWLSQEWAKRAALPSHVVTMLDNFPTNLHPMSQLSAAVTALNSESTFARAYSEGINRTKYWELIYEDSMDLIAKLPCVAAKIYRNLYREGSSIGAIDPKLDWSHNFTNMLGYTDAQFTELMRLYLTIHSDHEGGNVSAHTSHLVGSALSDPYLSFAAAMNGLAGPLHGLANQEVLVWLTQLQKEVGKDVSDEKLRDYIWNTLNSGRVVPGYGHAVLRKTDPRYTCQREFALKHLPQDPMFKLVAQLYKIVPNILLEQGKAKNPWPNVDAHSGVLLQYYGMTEMNYYTVLFGVSRALGVLAQLIWSRALGFPLERPKSMSTDGLMKFVDSKSG\n>UniRef90_A0A8C0HHE9 G protein-coupled receptor 158 n=1 Tax=Buteo japonicus TaxID=224669 
RepID=A0A8C0HHE9_9AVES\nMPHKRKLPIPTQTSRPPPNASLLPPGTARPLRRANCSGRYELASLAGKSRFTSHPTLHGALDTLTHATNFLNMILQSNKSREQNLQEDLEWYRALIRSLLEGDPNISRAAITFSTEPFSSTPQVFLQASRHESQVLLQDLSSSAHRLANASVETEWFHSLKRKWRPHLHRKVLNTGPKTLENSWKRRESFTADKNHIRWSSPYLECENGNYKPGWLVTLSAAFYGLRANLLPEFRGVVKVDINLQKVDIDQCSSEGWFSGTHRCHLNNSECMPIKGLGFVLGAYKCICKAGFYHPNIFSVDSFQRKDAENRFSGGELSEEVYTCLPCREGCSYCTDDTPCYAQEDKYLRLAIISFQTLCMLLDFISMLVVYHFRKAKSIRASGLVLLETILFGSLLLYFPVVILYFEPSVFRCVLLRWVRLLGFATVYGTVTLKLHRVLKVFLSRTAQRIPYMTGGRVMRMLAVILLIVFWFLVGWTSAITQNLERNIPLIGQGQTSDHLIFNMCLIDRWDYMMAVAEFLFLLWGVYLCYAVRTVPSAFHEPRYMAVAVHNELIISAIFHTIRQVIYSKVSLMPFLEQWVMHSSGCLLDQTCSVHTSFAIHFALQDELKKLYAQLEIYKRKKMIANNPHLQKKRCSKKGLGRSIMRRITEIPETVTRQCSRDEKDLMEHSAVKNMATLRKNPQDSTSSAKPKEETLKNRVFSLKKSHSTYDHVRDQTEEPNSLTTESTEVIATENSLLDSLNGNKLTKNAPEKVEAVSTESVPLVCKSVSAHNLSADKKPLHPRTSVLQKSLSVIASAKEKTLGLTGKTQSLEESTKSHKSQQKGKEASKKHSASDKGEHKDSHRKNSTHSEETKKTHKSGIMKQQRVSQTPANPDTGPGKSLHKDNFNIGEVCPWEIYNQTPGPVPSDSKVQKHVSIASSEPEKNHPSQPKVKTHHKLKTPEGYQQSNQKSPEKVEAPTRETQEQQVFENEKKQSNSKSQVSPGLKCENVNRYTPNTCAGEREELPQKAPEKENLNKLAEQKKNASCEGNVLSSDSHKPSSYLQQPLASRAEVCPWEYDTPDLPNAERSVALSNTSAISANKTATPRK\n>UniRef90_A0A2T6DUT4 Endoribonuclease L-PSP n=1 Tax=Opitutaceae bacterium EW11 TaxID=2161865 RepID=A0A2T6DUT4_9BACT\nMDLTTPSPQPFLRSAQSLAEDLESEIYATPESEARSSWTHRGCRVEVRASERDSFAEFHVTGLVECAGSAAELAEIVLEEVASVLASRRIQPIQEKLYGLTAIRGEVMKRRETAYRRRRLDPSVPTTWIQGLPLLGCDFVGIQIWGVAPYGGETCVTTVENPSTGAGRLWKGRGFRMLHLPCVRGIQHDGKLAAGPASQADWMFTNAEQGLAAHGFSYSQVVRTWIYVDRLLDWYGDLNCVRTAHYRRLGFGTTGGPAFPASTGIQGRFEEEECLVDVLALETDGRHATAAPVTRSPRQDQSFNYGSAFSRGMTLDVEGRRTIHISGTASINTAGDSTHLGDAEMQSLETLMSIAAILQEQGGTLENITSATLFCKTREAWEAWRRVSQLLRLPAFPKVCVLADVCRDNLLVEMEAVAVI\n>UniRef90_A0A8S9K9L2 Transcription termination factor MTEF18, mitochondrial n=1 Tax=Brassica cretica TaxID=69181 
RepID=A0A8S9K9L2_BRACR\nLEAACALSGFGFPWNKLGRLYREERSVFLQSGDEIGSLLGRLSGVGFSTVAVAGVCLAFPSVLRGGVEIGCLFVKVKRLFEEFGSEDVVEENVESWYAFGRKIRVFYDLGFESEEMWELMGRNRSLFIECSEEALMRKTDYFCRFGVGKEEAALLILRNPDVMSFDLEKPVISVKGVLKHFGLSEDEVDALSLKHPHVFGRNRMKNLPHVVRALGLHERIFDKLKNGTYHLLSSYSLMKPDEDIDREYQRGLEEIQNLRCKTHSFQKLDFLHQIGFAENGLTMKTLQHVHGTAVEIQERFQVLLDSGIDFSKACMLIRSSPKSLNQKPHSIQEKIRFLCEEMGDSLEYLEVYPAYLCFDLENRISPRFRFHKWLVEKGLSEKNYSIASIVATSEKAFIARLYGIHPAIPKHYFERFSYRKDRTTVS\n>UniRef90_UPI000836FEF3 nuclear transport factor 2 family protein n=1 Tax=Rhodococcus phenolicus TaxID=263849 RepID=UPI000836FEF3\nMTTTPAESTGEAGIAERITRLEDLEAIRLLDARYCRHLDDGNWDALMDLFTEDGEFDGLSHPRGRTEMRAFFAGLAEDGLTAFWHFITNLEIDLDGDRATVRSFLWQPCVTDGVAGIAAGRYTDQVVKIDGRWLYKVKQVRFHFFGPLESGWDENLFALDSARRAAVRA\n>UniRef90_A0A523XA31 Phosphomannomutase/phosphoglucomutase n=1 Tax=Candidatus Cloacimonetes bacterium TaxID=2030808 RepID=A0A523XA31_9BACT\nMNKEIFRTYDIRGKADIDLTNEVVEILGKSYSIFLPSNAKRIGIGRDIRLSSERIKNNFVKGLLSTGIDVVDFGVIPTPLLYFTVHTHALDGGVEITGSHNPKEYNGLKMLVGKNTIYGDEIQEIRRIADKGVFRKGIGSYEEKETVNEYINDILDRISLGKRKLKIIFDTGNGTTGPVVKRLYSKLPFEFEILFEEPDGSFPNHLPDPTIPEYLNDLIQRVKESKADLGIAFDGDGDRIGAIDEKGRIIWGDKLLAIYSKEVLRKRQGAKIIFEVKCSNGLIEYIKEKGGVPLMWKTGHSLIKAKMKEEDAPLAGEMSGHMFFGDNYYGFDDAIFASLRLIELLSRTQNPLSLLADEVPSYFVTPEIRVDCPDSEKFKVVEDVKKTFEKEYNIIDIDGVRVVFPDGWGLLRASNTQPILVLRFEAKTEEALSRIKKSFTQILEKFPFIKI\n>UniRef90_UPI00048A2204 TolC family protein n=1 Tax=Anaerovibrio lipolyticus TaxID=82374 RepID=UPI00048A2204\nMRNNRFKTLTALVISGVMTMSMAGTAMAETMDVDIEDCVNMAMANNHTVKSAIDDYDSAVWARHEARRMHGPTLNWTSAAQHIGGKFYDAHNVNSMYTNTVAVSMPIYTGGQLEGSIKAADLALDANELALEATKQGIKAKTQAAYYSALNCRNQIKVAQNSVKTLEEHLRNVNAQFGAGTVAKSDLLASQVQLSNAQLNLVSSQNNYDVAIATLNNVVGLPTGTELNLKDELGYVPYEISLDQCSEYAQLNRPDILAAEYKVKIAEAQLDVASSGNLPKVNATVSKTFAGEKPFSADERPVDNFYQQNTWYAGIGISWDIFDNNVTQAKVKQAKAAIEKAKEAAQEARDTGDLEVRTAYLNLTAAEKSISTAKVAMEKAQEDYTIAQVRYGAGVGTNLDVMDAEEKLTTAQSNYYNALYKYNSSKAALDKAMGLMVDLDVTQLQEKLAKN\n>UniRef90_A0A0N8K910 Oligoendopeptidase PepF n=1 Tax=Bacteroidetes bacterium HLUCCA01 
TaxID=1666909 RepID=A0A0N8K910_9BACT\nMSEKKTSNGAETIYWDLSDLYTSGEDPNIRKDQHRLRDLASTFAARYRGTLATAHAGDLAEALRTYEEINDLLGKMGSFAYLQWSTNTENISYGQLMQQINEFSSELSQQLVFFDVEWLALEEERAAELIADERLKSWKHYLTASRRYKKHILSEKEEQILTAKSVTGSQAWVRYFDETLGAARFELDGEQLTEQEVLSKMHEPDRELRQRAADSLTRGFREHRRTLTFIFNTLLVDKFTNDTLRKYPSWISGRNLSNQIADDTVETLVESVQKFYPTVQRYYKLKKQLLGYDSFFEYDRYAPLLQTESRVSWSDAQTMVLDAFNGFNPEMGRIARRFFDENWIDAAIRPGKRGGAYSASTVPSVHPYVFMNYDGRLRDVQTLAHELGHGVHQYLSREQGILQADTPLTTAETASVFAEMLVFQKLLAELTDPREKLALLMGKIDDTIATVFRQVSMNRFEDAIHTARRQEGELSAERFSELWRKTQTDLYGDSVQLTENYDLWWCYIPHFLHTPGYVYAYAFGELLVLALYNRYENGAENFPQRYEQLLRAGGSDWPENLVSKLDVDIKDSTFWESGLAIIDQLVDQAEQLSAQAGMGQ\n>UniRef90_A0A3M6WIU0 C3H1-type domain-containing protein n=2 Tax=Hortaea werneckii TaxID=91943 RepID=A0A3M6WIU0_HORWE\nMAGKKPCHLFQLGRCKYGNGCKYAHVKDPSFKRKACINFAKGTCHRGKTCTYSHDQADIDLWGASNDQDTAANASGPSHVDNSQAMFKNWRYNIPQEVGTPTPLGINLGRFFKQAAELIDGDAGRMQEVIVLLASEGGVQRIIELLEQPLDKCHPDILPRLFNTQIICFLEIITHKHVTVSAILKPRLTTIYNIVWGEGGQQAMKLFSAVAQHLQTLRLMGQGEGSSTNTTAIHAIECALTALDKLTEVNTSAQVHDGLKRVAEAFAILFKEPMTDQVRFAVKPSQRHLRRVEQRLGLGQAIPTQSEGKQHKGERAFFTLERPGPGELNIDGVAPRYDNDHVDIRGISILPTTLEIQFAGAEYLPLTDPTQWHIGGLEGLLDRHFRLLRADTVGQLRDTAKTELARLQAPEARGPTQQNKQRTSRAFVYGNATIVDATFTSQNGIEFAISFDQPGKVQRKKKNERKDWWQNSKTLSDDALVCLLSSLGSAIFLTVVPEPKNPKKDAAKGEQQTSIHKQYDLWSNGQRAHVIVKPAQQDGIELILRELSSSGNARLSLVEFPSVLLPAFQPTLRAMQRLTETLEVPFAEVLAPVSTRDNPTREIEIQPPNYATRPGFQFDLSVVTTNGKALRFTPGRDIDGAAAELAQYSIVSSLSRSLALIQGPPGTGKSYTGVQLVKILLAHKKACNLGPILCSLERLLDEGVSNIVRIGGRSKSDRLANVNLREVAHRLDLTKTEKSERFRLTKEVEDEVTELKLILRSMSELGSQSSIEEYLREWQPQHHHQLFSNIDEEGFITVNRHQDSELQQWLNSVPWDQKKRRPVAELENADLRQMTARERRRLYRDWTAKAAHKVQEKFDRALTEYNNAKEQQDDIRTETDQRALRQANIIGITTSGLARNLDLLRRVNAKVLVCEEAGEVLESYLLTALLPSVEHAILIGDHQQLRPHVQNYDLSTESRGGAQYALDVSLFERLVQPQDILAHPLPFCRLQVQRRMHPSISQLVQETLYPNLQNAESVNPIPDVVGMRRRLFWMHHEQIEDHAGDGLKTSHTNSYEVEMTAALVKHLVHQGVYKSEEIAVITPYLGQLRLLRRKLASSFEIVLNERDDEELLKDAGNGIEGDPPSTDVPLRRPSVARGTLLNALRIATVDNFQGEEAKVVVISLVRSNRERKPGFLKTPNRINVLLSRAQHGMYIIGNSDTITGDAGSKAGSVEMWENVLDIFRTNDNFGTALELCCPRHQ
DTPMSVQQPSDFVRLSPEAGCNLLCDQKLSCGHACTSKCHSDMLHDAVFCSKPCYRLDQDAPIRAKRNACMVLIKDVNVQLECRHIHKSLRCFEYQDPSKVQCQVPVTWTVPGCEHQVKEPCSTDVYSDDYKCRAMCSAILPCGHLPATAKKSARRVQPSAKPVVFTVRVARHAVSLLQLSSRPSMPFALCRSLRLASLLEEVSSDIEVYFLDSKLLTSYCRCEKTLSCGCRCPSVCGEACPTSDFCQVHGSEHIESLNADLVMLCAYRDVDLDEDPCIFPPCGHVFTATSMDGTMEMAAHYEIDPLTGAFTALKSTSEPFSSQELKTCPECRGSLRSINRYGRIVRRALLDEGAKKLTAWANRTHHDLSERLANDQCRLLDSLEMARKPSQNVKLTNSIDDQLREVKRLKYSKRYRQTFAIRTAVKNFSDRLIVDEQPYQRVRDLVETRRRQQLASSSATDIAEFSFASEELQLHEHLQAMLLLVRTEIVILSDVIAMHDKADGPVKGILKLQFDANRLQCTELAEEAARTVNVRQEVEAHIFWAKFAAMECGTSMATEEEGDADVSDYLERLRDKAITHLDTAEAICKRFTANEPDPTSDLSDELAEVRRMLDEGISSSEMRMVVAAMAKEFRGTGHWYRCVNGHPFTVGECGMPMQLARCPTCGEGIGGQHHRPTAGVQHANDIEERFGRMAI\n>UniRef90_UPI001FBC0094 HlyD family type I secretion periplasmic adaptor subunit n=1 Tax=Methylobacterium sp. E-016 TaxID=2836556 RepID=UPI001FBC0094\nMTHALVVPPPPIQMDWRKPVLTAYLVILLAFGGGAGWASVAKLESAAIAPGVVIAQSNKKTVQHFEGGIVREILVRDGDQVQEGQVLLRFDETQARASLDTIRSQQAVARIQEARLIAERDQTGKIILPENVASRAHEPAVARAIEDQQSNLRERATYLRSQVDVLNSKILQTEQEVRALTNDADSTKQQLVTIDQELGGLRQLLAKQLVPVSRVAALERERIRLQGMLDRAISDAKKGAQSIGETRLTIIQTQKQFLQQVSTDIIEVRKNLSDLIEKERVAQDVLSRLDVRAPRTGIVQSLKVFTIGAVIRPGDTILEIAPTGDQLTVSVQISPNDVDSVSEGLRAEVRFPTYHSRRVPIMLGKVRSVSYDRVTDAQNPQNIYFQGEVVVQASTVPSEIKDKLKPGMPAEAIITTGEQTPLDYFLGPLFDRVSHGLREK\n>UniRef90_A0A7R8VGG4 JmjC domain-containing protein n=1 Tax=Timema douglasi TaxID=61478 
RepID=A0A7R8VGG4_TIMDO\nMHYLLNSGFDYPIVVDDPNGLEMAVPTNFNALQLLDYIDGMQQVKAIDVMSQNIITIYLIDFVDYFLSPYRWHPINLLSVEMSQTSLRDAIQPPLISRILDWSEIAWPADCSEPKSDVQRYCLVSTKRSFTDFHVDFGGSSVWYHVVKGEKILYLIKPTAANIQLFIQWTNTSKHNNSFFGDHVDDCFMLILTEGQTLFLPTGWIHAVYTPEDSVVFGGNFLHDLNIPLQMEIYKMEKATHTRQMYLYPQFEELNWYAGQHILQVICNTNIVGAVPRKYLMQGIRALIPMLNLWLTKNEDGQPFTSIMCQNLIRDLKRELKIGELNTKMLTTPRPGRESKRQRKKTFNADFYYFPAANKVASKASVAKVPLGGSTSPNQSNVSSQKIPLSLCSLPIMSHDLQEKGSSDSSSNKTSHSSSPTLSKDMIHAPETIQQNELKMLCSQIPNQLEEAHALFSTERVDSATILTQMSHQVSESLNSQTITRQKMESTSSQSKQPHTAREESSSFWQASVLGNVPTLKVVLNRLANVPEPVTYPYSTNSVTTKKHHTAACTITSRESQDNNCQPWFVQAHTLCSKKELKMKVKAVSDSSKQTTPRDVYDFHASEDENSLLIDDQSSIESWHTNMQSKVNRKSPNSSVSSPTLSLGSSTQSDSIGLPYVKVNRIDELLKASALTGSGGTSPSTRDAIQGMLSISCSGSSSTSKMPIKTRSKKQHYEMVDDAQELVDEVHRDDDFVYPSLDVSDGEEPLNKRSKKRNIDEAWNPSARIGRLVPRTDRPTRYIKKNQAIEKGLEAAAAKRANLPPPKRPYNKKKTSDTPIPSTPGTLPKKEMPKEIKGIKCKHRQMGEKVTRGERKRKREGRKRQKSQGTPQGQQRSMLETLLPSRSRPFQLLGDEARMRVIFTMLVSLPNSS\n>UniRef90_A0A1K0ILZ2 SPOR domain-containing protein n=1 Tax=Cupriavidus necator TaxID=106590 RepID=A0A1K0ILZ2_CUPNE\nMRVQSPASAPAPDAAPRSALPSATLAAACIEIGGFSAQAARRATEDLAAAALRVEAFARQEQVRWWVHLPAQPTREHAERKLAELRRRNVTEYSLVTAGTPEATTYTVSLGLFRERERAQQYLDSLRGHGVRTAMLTEAARPLTRQWLRVRDADHAARARLEAMRQRYGAEDVLACS\n>UniRef90_A0A6H5GIQ7 Zonadhesin (Fragment) n=1 Tax=Nesidiocoris tenuis TaxID=355587 RepID=A0A6H5GIQ7_9HEMI\nGGINHPGPSGTSCYRNQFSEVTLSANFDQIRSNSTSRSIQLRDQTRLRDQTQLQVQRQHRDRIQLRVQTQHRDRIQLIDQSQLRVQTELRDQIQLRIQTQLRDQIQLRDQSQLRVQTELRDQIQLRDQSQLRVQTQLRDQIQLRDQSQLRVQTQLRDQIQIRDQSQLRVQSQHRDRIQIRDQINFEFKLNFEIKFNFEFKLNFEIKVNFEIKFNFEFKLNFEFKVNIEIEFNFEIKVNFKIKVNFDFKLNFEIKFNFEFKLNFEIKINFEIKVNFEFKPNFEIEFNFKIKVNFKFKVNFETKFNFEFKINFEIKVNFEFKLDFEIKFNFKIKVNFKFKVNFEIKFNFEVNGSIVIVLKSRIGTELQKKLFLIHIYSESLPEQVSVCPFDNIFGCSPTNMYPEKIEKIIFYYLIRTPQFLCGRSSNFINTYLILLTGLTRQQFGGVRPCRDKHFSSRNLKKGRKPMPPQ\n>UniRef90_A0A067KLY9 PPR_long domain-containing protein n=1 Tax=Jatropha curcas TaxID=180498 
RepID=A0A067KLY9_JATCU\nMAVKLSHSYFFNSYKPDDASFKQMGAPKRDLLVNPRIRKSNPTKKQMSETPKRGMIKPNSLSLTRSLCEFVDSGAMDNALYLFEKMNQPDTYIWNVIIRGFSNKGLFQEVIDFYHRMEYEGIGIDNFTFPFVIKACGRLLSFIEGKKVHGKLIKIGLDRDIYVCNSLIDMYFKFGFVEVAEKVFEAMPLRDLVSWNCMVNGYRVIGDGLKSLMCFKEMLGLGEKPDRLSMISSLGGCSIGCCVRGGKEIHCQVIRNGLELDIMVQTSLIDMYAKCGKVDYAERVFNEMTCKNIVAWNAMIGGYAINGHFLESFTCLKRMQEDNLIPDAITMINLLPSCSKFGTLLEGKCIHGYAIRKMFLPHLVLETALVDMYGKCGQLKFAECVFGRINEKNMVSWNAIIAAYVQNGRNEEALELFHCLRNQTLKPDAVTIASILPAYAELATVTSLVWSMKGGNCSIL\n>UniRef90_A0A521B5K5 Uncharacterized conserved protein n=1 Tax=Saccharicrinis carchari TaxID=1168039 RepID=A0A521B5K5_9BACT\nMSEKNLTVTSNKTGQLFDAKGQLLSPPSQWSFLPAGDAGVTRKVTANGKYWRVVFKKGRRIMSKGVWAPTQVIEMAKKEMEATRSTDDYLKKKEYNAKRRKKQQQAYEIEFCAEVEKFLNFHSDYAPVARAMAILVTRHAVPVGSGTVARTAMIPVHERAARAVIAWMRHQTTAYDHMKIARIKGERREVRRMLAQESTRLMNNYRRGLPIPFTCPLKKALDKIISP\n>UniRef90_A0A517WN20 Putative adenylyltransferase/sulfurtransferase MoeZ n=1 Tax=Gimesia aquarii TaxID=2527964 RepID=A0A517WN20_9PLAN\nMKWTCAVVFTLLITSMGFAVEHTKDSLATIKKNVESKKAVLVDVREKGEWDAGHVKGAIFLPLSSLQDGITAAEQKKLPQDKVVYLHCAVGFRAKIAASLLKKYNDKVRPLPQGYEELIESGFQKSK\n>UniRef90_A0A0F5FR09 Serine hydroxymethyltransferase n=2 Tax=Devosia TaxID=46913 RepID=A0A0F5FR09_9HYPH\nMSAATSLPLFPHFFSDSVAETDPELAKAISDELARQQGEIELIASENIVSQAVLEAQGSVLTNKYAEGYPGRRYYGGCQFVDVAETLAIERAKQLFGVGFANVQPNSGSQANQGVYQALLQPGDTILGMSLDAGGHLTHGAKPNQSGKWFNAIQYGVRKQDGRVDMDQVRQLAREHKPKMLVAGFSAYSRIMDWAEFRAIADEVGAILFVDMAHVAGLVAGGVYPSPFPHAHVATTTTHKTLRGPRGGLILTDDEDIAKKINSAIFPGIQGGPLMHVIAAKAVAFKEALSPEFKLYARQVVANARVLADTLVKGGLEIVTGGTENHLMLVDLRPKGLTGKATETALGRAHITCNKNAVPFDPEKPAVTSGVRIGTPAGTTRGFGEAEFRHVGELILEVLDGLAANGDENNAAVEEAVREKVKVLTDRFPIYGQ\n>UniRef90_A0A6F8V0N0 Prevent-host-death protein n=1 Tax=Bosea sp. ANAM02 TaxID=2020412 RepID=A0A6F8V0N0_9HYPH\nMARRDLNARLDQATHALCTRVERAHAVPAGATLRFRQGKPLAPVIFTILESADWDRSALPARDGYPFR\n>UniRef90_UPI0014890022 alpha/beta fold hydrolase n=1 Tax=Ruegeria sp. 
HKCCD8929 TaxID=2683006 RepID=UPI0014890022\nMRFLPVLVAVVWLAACTDRSSFVLVPDAVDVGTPRTVFAASARAREADGSYGYRRADRLQFLELTVSIPPTHTPGSLNLSYGRPDPETQFVLAGQEVFASPEPLRQRLLNDQREHGSALREVTLFVHGYNATQNETAFRAAQLANDIEIPGSLMIYSWPSRARAFGYAYDLDSMLFARDGLEQTIRQLKASGAERIVLVAHSMGAALSMEMMRQAEIREPGWSDRMLEGVVLISPDLDVDVFRTQMDRIGTVPQPFVVMVSRKDPALNISARLRGTAESRRLGNIDSIDRIADYPVDVIDTTAFSGDAASRHFVAATSPALVTLLSSAPAMGEAFGPEETSFDFLIPGGVEVSGRAKEIILARPGENR\n>UniRef90_UPI00049064DE HAMP domain-containing histidine kinase n=1 Tax=Paenibacillus sp. UNC451MF TaxID=1449063 RepID=UPI00049064DE\nMRGLYRRFAFTFICITCGILLIASIVFILETHYHFALYQHQSMDMGADNAQLNAHFEQALVQSVIWTAVGGIALASVVSLYVAKRMTSPLLEMKAAAMKMAEGNLQARTKLVGNDEITDLGLSFNHLAEQLEKQEQLRKTMTADVAHELRTPLATLKSHMEAMIEGIWEPSAKRLKSCHEEIERLIHLVGDLEQLTHLDSPHFQLHMKSENMVSIASQCVQAMQAAFQLKGVQLTLHKPNEDIFAIVDRQRVCQIIINVLSNALKYTPVGETVAVTMAGDHRSSTATISVRDTGIGIESRELPFIFERFYRTDKSRDRKSGGSGIGLTIAKKLTEAHCGKIEIQSEVGRGTTVQIHFPIKSKKSSLSTQDLQKSRI\n>UniRef90_A0A2J8RU61 MAP4K4 isoform 8 (Fragment) n=1 Tax=Pongo abelii TaxID=9601 
RepID=A0A2J8RU61_PONAB\nGRHVKTGQLAAIKVMDVTEDEEEEIKLEINMLKKYSHHRNIATYYGAFIKKSPPGHDDQLWLVMEFCGAGSITDLVKNTKGNTLKEDWIAYISREILRGLAHLHIHHVIHRDIKGQNVLLTENAEVKLVDFGVSAQLDRTVGRRNTFIGTPYWMAPEVIACDENPDATYDYRSDLWSCGITAIEMAEGAPPLCDMHPMRALFLIPRNPPPRLKSKKWSKKFFSFIEGCLVKNYMQRPSTEQLLKHPFIRDQPNERQVRIQLKDHIDRTRKKRGEKDETEYEYSGSEEEEEEVPEQEGEPSSIVNVPGESTLRRDFLRLQQENKERSEALRRQQLLQEQQLREQEEYKRQLLAERQKRIEQQKEQRRRLEEQQRREREARRQQEREQRRREQEEKRRLEELERRRKEEEERRRAEEEKRRVEREQEYIRRQLEEEQRHLEVLQQQLLQEQAMLLHDHRRPHPQHSQQLPPPQQERSKPSFHAPEPKAHYEPADRAREVEDRFRKTNHSSPEAQSKQTGRVLEPPVPSRSESFSNGNSESVHPALQRPAEPQVPVRTTSRSPVLSRRDSPLQGSGQQNSQAGQRNSTSIEPRLLWERVEKLVPRPGSGSSSGSSNSGSQPGSHPGSQSGSGERFRVRSSSKSEGSPSQRLENAVKKPEDKKEVFRPLKPADLTALAKELRAVEDVRPPHKVTDYSSSSEESGTTDEEDDDVEQEGADESTSGPEDTRAASSLNLSNGETESVKTMIVHDDVESEPAMTPSKEGTLIVRQTQSASSTLQKHKSSSSFTPFIDPRLLQISPSSGTTVTSVVGFSCDGMRPEAIRQDPTRKGSVVNVNPTNTRPQSDTPEIRKYKKRFNSEILCAALWGVNLLVGTESGLMLLDRSGQGKVYPLINRRRFQQMDVLEGLNVLVTISGKKDKLRVYYLSWLRNKILHNDPEVEKKQGWTTVGDLEGCVHYKVVKYERIKFLVIALKSSVEVYAWAPKPYHKFMAFKSFGELVHKPLLVDLTVEEGQRLKVIYGSCAGFHAVDVDSGSVYDIYLPTHIQCSIKPHAIIILPNTDGMELLVCYEDEGVYVNTYGRITKDVVLQWGEMPTSVAYIRSNQTMGWGEKAIEIRSVETGHLDGVFMHKRAQRLKFLCERNDKVFFASVRSGGSSQVYFMTLGRTSLLSW\n>UniRef90_A0A1V5E6B1 LPG_synthase_C domain-containing protein n=1 Tax=Syntrophaceae bacterium PtaU1.Bin231 TaxID=1811718 RepID=A0A1V5E6B1_9DELT\nMNFKKLEVADYAALKPYFDPIPYRLSIYSLPSLIAWGDCVFETRYAVEGDLLVIANESQLRPDDRHLILPVSPGGDPSPERLRAIALESGHRRYWCACGNYVERHRQGLEPLFHIEEQPEFEDYVYLAEDLAELRGNRFVRKRNLIHQFEREFMRNGSRASVEPITRESVPECLAFLEAWCVQRDCDVDGDIDLACERRAVITSLEQLEALDLRGILVRLDERVCAFGIASRLNGDTGILSYEKAFSDVKGLYQFLDRECAKRLFAGCRYINKESDMSLPNLAAMKRSYHPVLRVKSYRLTLR\n>UniRef90_UPI000D0912D6 B3 domain-containing protein Os12g0592300 isoform X2 n=1 Tax=Rosa chinensis TaxID=74649 RepID=UPI000D0912D6\nMELEERPSFFKVLVDGFSQQLRIPRAFVKNFNGRVPRMCGLRGPCGNLWAVNLKEIKDRVVFHNGWQSFAKHHFLEVGDFLTFTKDDGSIFDVIIYDKSYCEKNVEAAKSRIGNVVDRTINNHIILGKRPALDLVEETSIGSISFNSENPFFTTIFTREFQAK\n>UniRef90_A0A0N0N6B7 Amidohydrolase 2 n=1 
Tax=Actinobacteria bacterium OK074 TaxID=1592327 RepID=A0A0N0N6B7_9ACTN\nMFKEFVVSGDSHIIEPVDLFKTRLPKNLRERALWEEEFTLEEPIVPGGHTEFKKLHTIGFDGWTISKYRQTGGITPDGEPEHIIRDMNLDGVDASVMFPNLSLFVLFTDDHELSMAHAKVWNDWIAERYLQYKDRLRPTAAIPLTYIPDAVAEIERCSRLGIGAILLPDVPPELPYWSSEYDPVWAAADAHGMPVFFHVATGGVKVKESSSATATTVRGMVSSMNMGKGQLTDAMVASRTMSAGGSGAAGPQGIIADLVAGGVCERFPNLHFNLIEYSAGWLVSYMGFMDKLWKTGTGQDPDWWLGFWDDSRSPKDQPTMGRMFAVNQRWPWPLKPSEYVRRQIHVQFADDPTAVKCRNITGLSTIMWGNDYPHAEGTFRSSADCIAENFEGVGDEDRAAILGGTLADIVHFDKSKKLAPVAENA\n>UniRef90_A0A4Q9KAX3 VWA domain-containing protein n=1 Tax=Propioniciclava sinopodophylli TaxID=1837344 RepID=A0A4Q9KAX3_9ACTN\nMVPLISFFHPERLWLLALVPVLLLLYGALLQRSRTRSRTQGIDNLAKVMPKQAAWKRHIAVLAAVVSLAALVVAFAQPKDAVDVPRERATVVLAIDVSRSMEATDVDPNRLDAAKEAASGFVDLLPRGFNTSLVAFAGSSSIITPPTQDRGLVKRAIDNLQLAPSTAIGEGIYSALDAMLLVPQDPNDPEESTPGAIVLLSDGYTNIGRSSTVAARDAKEAGYPIYTIAYGTPNGYVVSNGRREPVPVNPAELNAVARESGGEAFQAGSREELQRVYASIARSVGYEKVDQEVTEFYAGIALGFAVLASLAVLSLAARWP\n>UniRef90_UPI0004DC9B9D PE family protein n=1 Tax=Mycobacterium tuberculosis TaxID=1773 RepID=UPI0004DC9B9D\nMSLVIVTPETVAAAASDVARIGSSIGVANSAAAGSTTSVLAAGADEVVSAAIATLFGSHAREYQAISTQVAAFHDRFAQTLSAAVGSYVSAEAT\n>UniRef90_A0A2E4XJ01 Enoyl-CoA hydratase n=1 Tax=Acidimicrobiaceae bacterium TaxID=2024894 RepID=A0A2E4XJ01_9ACTN\nMEEIQLTQEENIATVTINRPQVKNAVTSDMWDELQRVFTELGYRDDVRAVIVTGAGDDFCSGADVGGMGSRSEGPRLHQLDAMRKVGDCCLSLFNMPKVTIAKVSGVAVGAGMNLALSCDLVVASENARFSEIFAQRGLSVDFGGSFLLPRIVGMQKAKELVLLAEVISASKAHEMGLTNYVVPREQLDEKVLDLATRAASGPPRALAMSKAMLNKSFANSIQDALDQEGTSQTVNFTTKDVSEAMKAFQEKRSPRFKGW\n>UniRef90_A0A7S1QCM4 Guanylate cyclase domain-containing protein n=1 Tax=Alexandrium catenella TaxID=2925 
RepID=A0A7S1QCM4_ALECA\nTSLAGGGDATVAREELVSECRHKLGRSPTNVHLAWSDPHWLIQPRGAWVIGHELQGHFRFNMSADPFAANAIDCRRFDLNTVVLIITGILTCLVFAVTYVHLRTYAVVAVSTTFISLACATGIFGVWMRWVDCRTSGLHDHNMVFRHLATSCFQVANFNGTMYANAMQKHGKLVIAFESNFRHVRQVSRSEVWFGSLSEAFLLVLVIAAHVTFRHKRMQTREARYELMCRRPRLVRCLLENISFLDQLPPRDRTMMAFTLKRVYDEDDGKKFSDLEERYREMLSMKPSPSDLDGVGSSFWPAAVYSLVRALIPSTYRQFIPTATTPGSGMQAYANAVPEENTLWMLSALLRVVMTFCVYLFVLFSIKEASRRYTRTMQVWLVFDSKWHFPSQTSLAGDPMTETVQVSMDDEGECLHMLDRNHQPPIGNFSSEHCCSPRDSEDDGNIVNTQEVKDKLTTWWAWREYLIIDYTDKRVRLEFHLVVAVAMLVVSAVLICVDDFKEGFRPPQLLDIDESMSWFRGHVNSLSFQTAWDLLFLTWPVLNAINTAATMNRLIESHLQKIKHLADLLNEAGIGLPVGADSSPAGQSDVSPQDDVGPSIRNIFRVAKAELASGGSNATRFLNIVPINRQTFAIAGTVLSLFTGGQFMEIFNNLLGAVNGS\n>UniRef90_A0A193G2U0 General secretion pathway protein GspM n=2 Tax=Bordetella bronchialis TaxID=463025 RepID=A0A193G2U0_9BORD\nMKVSARRAPRLLLPAPLLARCRDTAERASRYWTRLTPRERRLLRALGAILTAAAVFALGLRPAWRDIERWRDELPRLRAQAAAVDALVQEARALKREQGNRIPARDMEEALRASLARAALGGTQQVGKTPDDKAWRIAFDDASPAALFDWLAHAPAFLHLRVVQVHIVRPRDSLGRPIPARATGTLVLRDAGDAAIGARP\n>UniRef90_A0A0B8NUT2 OMP_b-brl domain-containing protein n=13 Tax=Vibrio TaxID=662 RepID=A0A0B8NUT2_9VIBR\nMIEAETMDHEIRATWTRQGVQPYFEFRSQANGAENAQGDSLVNNAFVFGASYGF\n>UniRef90_A0A7S3J898 STI1 domain-containing protein n=1 Tax=Euplotes harpa TaxID=151035 RepID=A0A7S3J898_9SPIT\nMLKSLDNLRAAHPGCRQQISLLPPQQMIRKIGDMKNDDPQMTMRGMDKEELSHMQRIMGSMESMAADRSMQFPQVPEDILRRDMEEDQDNSNHNEPEEE\n>UniRef90_A0A653T2G2 Glycosyltransferase EpsD n=2 Tax=Microbacterium sp. 
8M TaxID=2653153 RepID=A0A653T2G2_9MICO\nMSQRSELRTHHRRDLLSDPELPPASAPRVAHLAHTTVAGGAELGLARMLRADAPWRASVLLPPVPAEDGAFAGLPASIPIHRIGVAQPHGASGASAMSAFSLGVRLVAQAVATRRHPSFRQADLIVANSTRAAAYGALAAFGSRKRFLVHLHDITDRETLGGFGLRMMTRIVLPRADGVIANSQATLASAEPYLRPDAVREVIAGASGLTGAARGAREPGPLRVGMLARIDPWKGQLLLLEAFAQAFPGGDEILEFAGGAPFGHADFAVELRDRARALGIADRVHLLGHVEDVDRLLRRWDVGVQASLRAEPLGFNVLEYLDAGLATVVAAEGGPVEWVRDGVNGLVVAPRDVGALAAALRRLGADAGLRSRLGDAARSTPGLATDHVVAQQHAAAYLRVIAQRR\n>UniRef90_UPI001B319B05 hypothetical protein n=1 Tax=Bacillus suaedae TaxID=2822140 RepID=UPI001B319B05\nMAINYKQCINCESKNTLNLLYGMPTDDASKQAKEGKFKLGGCCVIVGGPEYCCNVCESEWNKEQAIDAAYEKIIGLNAYVGGFFGASYNVDLDLISGSAAWSHWENGEEVASECKALKETTVKKLIEELKIINFLNWKREYIEPGVLDGTSWSVELIREGRNLKRSGANKFPEEWDDFCKLVRRMTGKRFS\n>UniRef90_A0A516GYM1 YdcF family protein n=1 Tax=Ferrovibrio terrae TaxID=2594003 RepID=A0A516GYM1_9PROT\nMARKDRDDEESTPFFTRISRWLMLLATIGLLWLGGGIAYVERVESIPAPAETKTDAIVVLTGGAARLATALRLLNENKADRLLVSGVAQTATKATLLQAVLPTMPDAAQASSNWQGIDLQLLFDCCVDLGFEADDTAGNAAETASWAAARGYRTIRLVTANYHMPRAQVEFGRYLSGMTIVPHPVRSDAMRVEDWWQRRAATVFLLGEYSKYLAALLRARLGTQLTATLEQKPQTVPVQPAAAPTQEKPTEEKPQ\n>UniRef90_A0A7C9L683 Alpha/beta fold hydrolase n=1 Tax=Sediminimonas qiaohouensis TaxID=552061 RepID=A0A7C9L683_9RHOB\nMTVVQDPAANADLPVVVMIHGSGWHAQQFDRLAWALRDVAELRAVTLRGHGADPVRRGDVDYIGQLEDDLASAIGDVAPGRKVVMLGHSSGGGLVVRFAGGPHDGMIDAAILLAPFLKHNAPTTRTDAGGWARPLTRRIIGLSMLNMVGIHEFDHLTAIHFAMPKKVLDGPLGHTATTAYSWRLNLSYAPRRDYKADIAALPPFVLIAGADDESFRADEYEPLMSGVTDKGRYHVLPGVGHLGVVDAPQTETLIREALRAL\n>UniRef90_UPI001BA7DB86 DUF2130 domain-containing protein n=1 Tax=Bradyrhizobium sp. 
AUGA SZCCT0177 TaxID=2807665 RepID=UPI001BA7DB86\nMTFKATASDAHEPVVRCPNCSHDIRLTESLAAPLLEENRRRFQEQIAQKDAEVARKSEVLLKERDDLARARDQVEEQIKQRLAVERNQLIAAEGKKAQEAAAVELQAKSTEAAELRRTLEANNVKLAEAQKAQADVLRKKRELDDEKRELDLTVEKRVQSSVEDVRVKARQEADDAARLRISEKDHTIESMTRTIEELKRKAEQGSQQTQGEVFELELEEILRGRFPTDMIEPVAKGELGADVVQQVNEASGQPAGIILWETKRTKNWSDSWLAKLREDQRRCGADVALIVSHALPKHVEYFDLIDGVWVAHPRCALPVAVSLRQALIAVSNTRLVQQGQQTKMEQVYQYLTGTKFKQRVDAVIEKFNDMRDDLDKERKFMICQWAKRETQILSVVESTVGMVGDLQAIAGKAMPEIPSLDLPLLEISDAAE\n>UniRef90_UPI001447B9A0 helix-turn-helix domain-containing protein n=1 Tax=unclassified Cryobacterium TaxID=2649013 RepID=UPI001447B9A0\nMPEAATKKQTLAWLKTVSGELATATLKRLDDTLPWYREMPPGRRSAVGLVAQAGITSFMQWYDDPSSTPWIAADVFGAAPRELLRSVSLTQTLQLIKVTVEVVEERVKGRDESLREAILLYSREIAFGAADVYARAAEARGLWDARLEALVVDSILSGEYDDELPSRIAALGWHGHGEVSVLVGTAPKMLDVDMLRRTARHQDADVLIGVQGSRLVLVIGRAQPASVNEDEGTAPPKPFLDIAMELEPGFGDGFLVLGHEVPSLVDASKSAKAALAGFAVARSWRNAPRPTLADDLLPERALAGDPLARATLITRIYRPLQAHSTELLSTLWSYLDNGRSLEATARELFVHPNTVRYRLKRVSEVIGYDATGARESLILQAALIVGSIAEHDTPRRR\n>UniRef90_UPI00131B79F4 3-hydroxybutyryl-CoA dehydrogenase n=2 Tax=Chachezhania TaxID=2603319 RepID=UPI00131B79F4\nMTIKSVGVIGAGQMGNGIAHVMALAGYDVLLNDISQAALDKARATIEKNMVRQVSRGAISEDEMKTAMGRMTTSMTLSDVGQTDLVIESATERESIKQAIFEDLLPSLKPNTILTSNTSSISITRLASRTDRPERFMGFHFMNPVPVMKLVELIRGIATDEATFNACKEVVARLGKTSATAEDFPAFIVNRILVPMINEAVYTLYEGVGSIESIDTSMKLGAAHPMGPLELADFIGLDTCLAIMNVLHDGLADTKYRPCPLLTKYVEAGWLGRKTQRGFYDYRGEVPVPTR\n>UniRef90_A0A0B5L654 Gag polyprotein n=1 Tax=Human immunodeficiency virus 1 TaxID=11676 
RepID=A0A0B5L654_9HIV1\nMGARASILSGGKLDMWEAIRLRPGGKKKYRLKHLVWASRELDRFALNPSLLETAEGCQQIMNQLQPALKTGTEELRSLFNTVATLYCVHHRIKVSDTKEALDKIEEIQKKQKTQQAVADAGNNSTVSQNYPIVQNAQGQMVHQSLSPRTLNAWVKVIEDKGFSPEVIPMFTALSEGATPQDLNMMLNIVGGHQAAMQMLKDTINEEAAEWDRLHPIQAGPLPPGQLREPRGSDIAGTTSTIQEQIAWMTNNPPIPVGDLYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFFKTLRAEQASQDVKNWMTQTLLVQNANPDCKSILRALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQAQQPNIMMQRGNFKGQKRMIKCFNCGKEGHLARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGRIWPSSKGRPGNFPQSRPEPTAPPAESFGFGEEITPSQKQEQKDKELYPSASLKSLFGNDPLSQ\n>UniRef90_E1GWA8 Anaerobic ribonucleoside-triphosphate reductase n=8 Tax=Prevotella TaxID=838 RepID=E1GWA8_9BACT\nMQNFTITKRDGSKEMFSLDKIMGAILKAFESVNAPTDLAAVSKILSDLTIHNDITVEDIQNQVEQALMKEGYYDVAKSFIVYRHQHSQDRETQDKIKFLTEYCGASNAATGSKYDANANVENKNIATLIGELPKQGFIRINRRLLTDRIKQMYGKELANEYLDLLTHHFIYKNDETNLANYCASITMYPWLIGGTTAIGGNSSAPTNLKSFCGGFINMVFIVSSMLAGACATPEFLMYMNYFIQKEYGKDYWKNADKVVDLSLRQRTIDKVITDYFEQIVYSLNQPTGARNFQAVFWNISYYDKYYFESLFGNFYFPDGSQPDWEGLSWLQKRFMTWFNKERTRAVLTFPVETMALLTENGECRDKEWGEFTAEMYSKGHSFFTYMSDNADSLSSCCRLRNEIQDNGFSYTLGAGGVSTGSKSVLTINLNRCIQYAVNKGEDYKLFLDHIIKLCHKVQLAYNENLKNFLKNKMLPLFDAGYININRQYLTIGINGLVEAAEFMGLDITPNEDYKHFVQGVLGLIEQNNKAFRTKEAMFNCEMIPAENVGVKHAKWDREDGYFVPRDCYNSYFYRVEDTGLTILDKFKLHGAPYIEHLTGGSALHMNLDEHLSKAQYKQLLTVAAKEGCNYFTFNIPNTVCNDCGHIDKRYLKECPCCHSKNVDYLTRVIGYMKRVSNFSQPRQQEAAKRFYAGSDKME\n>UniRef90_A0A3S4JM46 imidazolonepropionase n=1 Tax=Klebsiella aerogenes TaxID=548 RepID=A0A3S4JM46_KLEAE\nMVFSHKKITFPCAIVDFTGVMKINVYTTHDKLSAMTEATSELVIWRNGRLATLNPDHAQPYGLLERHALLVRDGRIAAIVAEDDVPSGRSIDLEGRLVTPGLIDCHTHLVFGGSRAQEWEQRLNGVSYQTISASGGGINSTVRATRDSSEAELLALAQPRLERLLREGVTTLEIKSGYGLDLPNERKMLRVARQLADHNGVELSATLLSAHATPPEYQGDANGYITLVCETILPTLWQEGLFESVDVFCENVGFSPQQTERVFQAAQALGIPVKGHVEQLSSLGGAQLVSRYHGLSADHNRVSDGRGRGGDARKRHRGSPAPRRVLLP\n>UniRef90_UPI001653AF6D hypothetical protein n=1 Tax=Lewinella lacunae TaxID=1517758 
RepID=UPI001653AF6D\nMPRLKKILLTLLLLTVLAAVFRGPLYRTLVDYESVGASTNYTVKDEKLADLIASKVNRRTDLGITEAIKLSLSITSSQLHFTADNNDVDPNKLVTSKATHCVGYAAFFAATCKYVLSQQKLASSWTAEPQEGQLYFLGTNLHQYFHSAFLKDHDFVAIENHVTGEVLAVDPTIKDYFHIDFIRLRP\n>UniRef90_A0A0T0M9T5 Peptidase C51 domain-containing protein n=1 Tax=Chryseobacterium sp. Leaf394 TaxID=1736361 RepID=A0A0T0M9T5_9FLAO\nMFKENLILFAVFVMTLVSCKETEYRQKTNQKEPEKELSKKIPEKNILIVEAIKKFGPEISSTYEKAVCTELVIQIIEKFHHLEERDKFRIRIITDGNIQDLIKENSPIPKGVFYALTEKGIGIPIKKEDVLEGDFVQFWTPTWGHCGIVKSISLEKQEMELYSSFPSTKGYGIQKFKIPEYTFFVRVK\n>UniRef90_A0A1Y4S3Z9 Hydrolase n=1 Tax=Lachnoclostridium sp. An131 TaxID=1965555 RepID=A0A1Y4S3Z9_9FIRM\nMERLKYLFFDLDMTLLRDDKSISDEALAYLRDLKKRKDVRYGIATGRAWTAIEPLIERFGLDTLFDVIVMDNGSEIYDLAEGRRERLGIIQTEQMKQLLDAFGGYDFLAVAFHNPKGFFTTKISYRTERVLINNRLSGYHDPYKEEFEATARVMLLFLIEDQERVLEAVRLHPVPGIHGMLSEPEVYDFLCEGVSKAEGIRHYVTANGDRIEQTVVFGDSENDLEMIQKCGVSVSMKNGTEAVRAAADYVTGYTNNEDGVFRFLKEHEDWFQEG\n>UniRef90_C7ZDV9 Succinate-semialdehyde dehydrogenase n=9 Tax=Fusarium solani species complex TaxID=232080 RepID=C7ZDV9_FUSV7\nMPYSAPKLKDPSLFVGKNYVDGQWIESVSGKRFDVHDPASGALIGSCPESVAQDAEQAIKIAAAALPEWRSRTGRNRSRILRRWYELVIENKEDLATLITWENGKAGPDAAGEVLFAASFLEWFAEEAPRVYGDVIPHSAPGFRVSVIKEPVGVVGLITPWNFPAAMITRKLGPALAAGCTAVVKTAGETPFTANALLVLGERAGVPKGVINSIAALENTPEIGQTLCASDVVRKISFTGSTRVGKILMNQSSDTLKKLSLELGGNAPFIVFDDADLDLAIAGAIASKFKCSGQTCVCSNRIFVQKGIYSQFVEKLKAVVSKFQVGHGFDSKTTHGPLVTAAAAERVDDLVKEAVKAGAKVEVGGKRRTDLGKSRPNFFEPTILTNVTTDMRLVRDEIFGPLAPIFSFDNEDEVVDIANKCDVGLASYIFTQDVNRVARVTELLHFGMVAVNTGIMSDAAAPFGGVKHSGMGREGSKYGIEDYLHVKTIVTGNVNVVHRALL\n>UniRef90_UPI001F05B46E response regulator n=1 Tax=Desulfobulbus alkaliphilus TaxID=869814 
RepID=UPI001F05B46E\nMHLSTASAMHDEGESYPMKEIRLLTDRLHQEIAEKTRALEKFRHLFEGAENGILVARGDTIEFANPALKHILGHDAEKITSEPFITFIHPDDRATVLDRHIRRMRGEDLEKSYDFRVVASDGSVRWINLSAQIINWDGDLANLSFVNDITERKTAEKEHEKLQEQLFQAQKMETVGRLAGGVAHDFNNMLGVILGYSEMALSQMAADHPLHGALHGINQAAQRSADLTRQLLAFARKQTITPRIIDLNETVEGMLKMLRRLIGEDIDLIWLPGRNLCPVKMDPAQIDLILANLCVNARDAIKGHGKVTIETGLTSFDDAWGAVHTGVVPGEYVLLAVSDNGCGMDQETINHMFEPFFTTKEQGQGTGLGLASVYGAVTQNNGFIDVESEPGQGATFKIYLPQYVIRTEPLPVQDQVGATMRGHETILLVEDEPVILKMLRTMLEHQGYTVLTAGSPEEAIRLAEEHSSRIDLLMTDVVMPGMNGLDLARNLLSRYPGIKTLFMSGYTDDVIAHHGVLDEGVHFIQKPFSMRVLGEKLREALEG\n>UniRef90_A0A8B8IMG2 serine/arginine repetitive matrix protein 1 n=4 Tax=Nymphalini TaxID=171576 RepID=A0A8B8IMG2_VANTA\nMSSRRNGSVSRAAEAASKNRLHMDRNPQHSRITDPSNPAGRRKEIDNVMKRARQASPGSWDRKLLEVEEKDPNRWRHTGYKQMYLDGSGSASPRRSRSPRRSRSPSRRSRSPRKSRSRSPRRRSPLRRSPARRRRSASPRARRTRPPPRPPSPPDPRKSSPSGSSASSCSDESCSVCSAKNKKVPPKPIKPGVRTSPSPPRTKRPAPPVAARAVQPTRELLKARESSKRSREEKVLEWQRSQLAVRPAPPIPPAHIKREGERRPRPPRPERPDRPDRTDRVSPAAIAAALADSDSDSESDASSEPPPQRLTLSERFGKMAQWSAARCARLENMRITRRDSALHVHIERDDAAPAAPDAPRADYPGLDPAPVGSYPEELLAVAPGGLPSWDDVRVRYDYYKKRGYLRGLTLGDYVKWEEWWYKYQEWLKRERAYERWAEGEGGTSRRERRRRGGRHRRS\n>UniRef90_R6N0F5 Polysulfide reductase n=2 Tax=Firmicutes TaxID=1239 RepID=R6N0F5_9CLOT\nMESTLFKISEPSRVSGVLYGPITLVYGLGGIALTLADKYILSKIKCNKVLKIILSFIILALILTTVEFLSGYLCKLIFNTEMWNYHNKPYHIGKYICLEYIPLWGLLGTLIIYVLKPFFDKIIKLIPKEATYLLYLIMILDIIITLFTK\n>UniRef90_A0A506TYF2 Sigma70_r2 domain-containing protein n=1 Tax=Pararhizobium mangrovi TaxID=2590452 RepID=A0A506TYF2_9HYPH\nMTRKNMHINKRINFVIERRFPSFYEEIENVLDQAVDKYQTQNIRDPRIISYIISKCDTDTAVLVSRENDVDLLNDKDKISKDEKINKYLEIFEEYESRIHSFSSEELNAAYKEEKKLEENENLREMMAWDERQEFSDPMASADFDTWLSMATWTVDEAVSLSLAKEPGTVDRSSGFYKFSLKTGSPFISEYEKRTDQLSRAIKAQDLDKPLRPEAVMAWFQGQGMQGAFGGRVHHIARYDEEVEVLRRENERLKRLVTSPEKLETNSVLGLYRLCLGMAICRYEYRTDMRNGAAKSIAGEFAEVGLSITDDTVRKHLQRASKELGFEWKTRSPFEVRSKLRAKPKSD\n>UniRef90_UPI000A646756 hypothetical protein n=1 Tax=Colibacter massiliensis TaxID=1852379 
RepID=UPI000A646756\nMADIKKVINEKKEALRQICKGFTSNNTGGCCGVSLPPEEQAELKRLKEGKT\n>UniRef90_A0A7L5ZNR0 Tetratricopeptide repeat protein n=1 Tax=Exiguobacterium profundum TaxID=307643 RepID=A0A7L5ZNR0_9BACL\nMLARLAIALFWAAIFFGLGAWSGGHLRPIGDALVTGXANTGEKAVRLWTWARHGAPDAAPDASPATTAAALVDKGRAAFARGDLQGAVEAYREALELRPGDADILGELGNVYYTSGQTAEAALAFHAAAEALIDSGRIEAARALLPAVRAAAPTLAADLDTRLAAAAPVTQ\n>UniRef90_A0A4T2C462 DUF445 domain-containing protein n=2 Tax=Subtercola vilae TaxID=2056433 RepID=A0A4T2C462_9MICO\nMKLLATGLLVLMAVIFAVSFALQARYPWLQYVRAASEGGMVGALADWFAVTALFRRPLGLKIPHTAIIPTRKNEIGESLGEFVEENFLSDAVVQEKLASVGVSRVVSGWLSQPANAHRLTNEIAGGLTGALSFLSDDEIRSVIEGLARTHLVGRDWSPQIGELASSVLATGHQHIAVDLLVDKAEQWLAANPESFTALVSKRLPSWLPSFVDRLVDDRVYREALKFVQSVQANPGHPLRKALDEYLLRLADDLQHDPAMMKRVEALKEQVLDDPRLRELAALAWQAIKDALTASLENPESALRLTIESTLVDVGTRLASDARLASTVDTWVANAASHLLASYRHDIAAVISETVSRWDGKEASQKIELQVGRDLQFIRINGTVVGSLAGLAIFAVAQGLLSAF\n>UniRef90_A0A2M9FV78 Enoyl-CoA hydratase n=1 Tax=Minwuia thermotolerans TaxID=2056226 RepID=A0A2M9FV78_9PROT\nMNTTSEVAVGRVDGVVEGGIGWIVFDNQRRHNAMSMAMWEQLSEVLDKHVADPEVRVIVLKGAGDKAFVSGADISEFEKRRSTPEQSDAYSDAGTRAYTALADCPKPTVAMIHGYCLGGGLAIAVNCDIRIAAEGSTYSIPAAKLGIGYMVAGVERLLNLVGPAWTKEIFFSARRFEAAEALNMGLVNRVVPLENLADDVLTTAKQIASNAPLTIAAAKMAVDELLKDSANRNLGACERAIAACMQSSDFVEGRRAFMEKRPPRFTGA\n>UniRef90_A0A2D7S292 Cysteine synthase n=1 Tax=Flavobacteriales bacterium TaxID=2021391 RepID=A0A2D7S292_9FLAO\nMSNNIKEDLLLFNELVDVFLEEERLKPVTEYIEPNNVQQLLDIKLENNGLSKDKFKEALKQLILNTPKSSSKLFFNQLFGGRHSKAVLGDLLAAILNNSMATYKIAGPQVSVEKEILCQVYKLIGYNKNPGGTFPTGGSMSNFMSLVMARDKVNLEIQQKGITRKLVAYTSENAHYSVSKNASFIGLGKSNVRYIKSDLYGRISVMEFEKQVEKDLKNGFTPFYLNATAGTTVLCAFDNVNELSKCCKKNNMWLHLDGAFGGSVIFSDKYKRLVKGVNLTDSFCFNAHKTLGAPLSTSILVVKDKQDLYNSFNSKANYLYQTHGNEFNLGQTSFECGRRNNALKFWTMWKAIGLKGIASIVEEQFQLANAARKYIISNQDYSLYSFDDSLSICFNYKNFDPEDLCTKLFEMNSLMVGYGTFKKNRFIRLVIVNGENSLDDVTRFFGILERFTEEHQEHIKKI\n>UniRef90_UPI001867027B BppU family phage baseplate upper protein n=1 Tax=Staphylococcus cohnii TaxID=29382 
RepID=UPI001867027B\nMAIYKNKDITTNIESEKLSINNSNTSFYTEDKGSAALRIFIKYRDGAFNLNDTNLTPTLDLFHNDGSIWRDEPLEVIMSDKGLLQYNIPDNVIAHAGLIKAKLFLRNAEQSVHVANFTFDIKDSGIEEAVAKEINVNIVDDTVKRIMNEQPELFKGEKGDDANPEDVKVLLEPYVDEKTNQEFEKLSSAKQVDGEVINARGSDKSLKSRLENPNYVPTKDEMNTKVIATHYDKKPMVTFIDDDGRTEVLQKWEPILQEKGNKLTIALVSSWIDNKESTVIKWEDVYRLKEQYGVEFVNHTYEHKHAQQLTDAEVDAEFRKNKEVLKREGLTHDIIVQPYGENTDSVRRISRKYAKANVSVKEGVNTLPLDTYRLFRISLGEDLYTTFEQYKAILDEAISKNAWVIFKSHSQYTSFDENQLQLIRQIIDYCRENGFIEATMEEGLRDRGNLIDVGDYTLKAKDSDYFILDKEGNIHSRKFAKNYYTLKYNTVDFNTPITNFEDMTTSTLAIVSTNSQGFPNNASGQLLTTKSESLVLSYQLYLPNNSNEIYKRRWNTKTNNWTEFELITPAMKELKTRHYAGNVDLNGQNTVDVVITNSVLDTMNFNTGDVISATVETPLPNGIMYNVFITEKNKITIRYSNVTTEKITIPATYFNFRITYK\n>UniRef90_A0A7J2S7S4 DUF5050 domain-containing protein n=1 Tax=Thermoplasmatales archaeon TaxID=2268204 RepID=A0A7J2S7S4_9ARCH\nMRRSYVKTIKSNSKMMKNTSLICISLLLINVLGSTGVLQNCGKKEEQVYFNFISRSMPHGRIIFQSLRDAPLGNPNSIKKYWELYSMDVDGSNVTRITRNLYWEHQPDISPDGNKIVFAIHYNPSIDTKETDSGWEIAVMDIDGTNLTRLTSNDKLDACPHWNHDGTKIVYVSDTYGNFSCFDIYIMDPNGENVTKLTNAGIGEFYADPSFSFSDGKSKILYIHSKGYTSNWDIYMMNEDGSDQHLILSTNNKYLAYHDPMFSPDDSAIVFSAKLNENGNHGIPIYKIFTARVDGSNIRQITDNDDESDVVPQYSPDGGKIVYFTWKWNGVVFERKIRIINIEGTNERIISSFSPEEMPSWYPRYIRIEKPVEKHLYIADREIIRLLKNTVIIGKITIKADAYDENGVEKVEFYIDDELKNTDYIMPYSWLWDEFAFGMHEIKVIAYDNEGNADTDEMEVAIFNF\n>UniRef90_UPI001D13EC9B DUF485 domain-containing protein n=1 Tax=Saccharopolyspora sp. HNM0983 TaxID=2781240 RepID=UPI001D13EC9B\nMRPPVAAGPPDYRAVVDSAEFQQLRTRFRAFVFPMSALFLAWYLTYVVIAAYAPAFMGTPVLGLINVGLLMGLGQFVSTVLIALGYRRYAERRVDPLIDDLRADPPREGDR\n>UniRef90_UPI0021BCFAD5 translation initiation factor IF-2-like n=1 Tax=Macaca thibetana thibetana TaxID=257877 RepID=UPI0021BCFAD5\nMALNSGRRKEATLQKGVRTALEHSQERSLGGRPEWLRGPGGPGGPRSPAGQPLQPAGSDSRSSANTALGATPTSTRGHLPSLPPPDLQDRIYPGRPPARVSAPSRLGLSPPCTEMAAAGSLLPQPVAASSGPGWPRPPCVSRGTHCAVPVPPVLS\n>UniRef90_A0A4U3CDX7 ATP synthase subunit b n=1 Tax=Blastococcus sp. 
CCUG 61487 TaxID=1840703 RepID=A0A4U3CDX7_9ACTN\nMNILAAEQSVLVPPVGEIIIGLIAFAIVLFVVVKFVAPRFEQVFQARREAIEGGIERAEVMQAEAKAALEQYRAQLAEAREEAAQIRDAARAEGQQILEELRAQAQEESARIVARGEEQLATQRQQIVQELRGQIGTLAVDLAGRVVGESLADDARRSGTVDRFLAELDGMSAAGNGQGGAVPAGESNR\n>UniRef90_A0A450TCR7 Uncharacterized protein n=1 Tax=Candidatus Kentron sp. FM TaxID=2126340 RepID=A0A450TCR7_9GAMM\nMDKKSPFLAQFLARMSAFERENTMFLLVFHPVSADVIFWECTPFSVLLPGHFLFFSHVFGPPSLPQGAKYHSLGLWR\n>UniRef90_A0LFP1 Ketoisovalerate ferredoxin oxidoreductase, delta subunit n=1 Tax=Syntrophobacter fumaroxidans (strain DSM 10017 / MPOB) TaxID=335543 RepID=A0LFP1_SYNFM\nMNKAREDKFTQARSALCKGEAGRTGDWRSVRPRIDHAKCIPSKNRRPSCFICWLYCPEGVVKRSIPVEIDLDYCKGCGICAEECPGKAIEMVEEHEEA\n>UniRef90_A0A351GGH7 TonB-dependent receptor n=1 Tax=Bacteroidetes bacterium TaxID=1898104 RepID=A0A351GGH7_9BACT\nMVKKILNLILFLGLSFLSVAQTTTVTGTVKDTTGQTVIGAAVVVKGTNNGKITNENGAFSLNIQDPKTAILQVSYSGYKTNEVAVNGGKNIEIVLRENSLGLSEVMVVGYGTSTKKEFTGANSKVDGEDLQKLNIPRFDQALQGQVSGVNISTNSGSPGGGASIRIRGLSTFGDNDPLILVDGVVFDAAGLNSLNPDDIASVNVLKDATAGIYGVRAANGVILIETKKGKRNSKPSISISSYFGVQSTSRKLDLLNATEYATLKNEMFANGGDDVPFSNVNLLGEGTDWQAEVFQNAPIQSHNITISGGSEKTTYSIGGSYFTQDGIVGLDKSNFTRMNARVNLSTQMSDKLRLTSVFLYTKEQRSTLRENQIGSVLYNTVNAFPTDSVRTSDGRYSYLEEVSDIINPIAQMENTFNEANVNKFVGKEELAYDITDNLTFTNRLSYNYAIVDDKVFSPLVWYGPGKAPNTALNEDLDPTSVEIAPGTSVDRGASVYEQRASYSDLNFESFLNHEVRIKSLHRIKTTAGLSVFTRNGQAVNGTAYNIPNNDLEFADISANLAPGGYLNNTGSFQFQERLLSTFIRGEYGYGSRFNGSFILRRDGSSKFGPNNRYGIFPTVSGSWVISEEKNYAIDRMKFLKLRVSYGISGNDQIDNFAYRGLLNGEGHYVFDDIITQGVAIGRASNPDLKWETTRQFNIGTDFTFLHSFDVTMNYFIKNTRDLLFQPEVSAVLGTYGAGSFPPFINAGDVSNKGFELEVGYKTKSSKIWNLSTGLNATFIRNKVIKTPKGVDFLPGASFGVGGGTATRFQEGYAIGYFIGYETDGIFQSQEEIDNSPVVQEGAKPGDLRYKDINNDGKISFSDDSDKTQIGTPIPKVTLGFNVKVDYKGIDLSGNLFASLGQQIVRNYERQQPYANQLAYNINRWTADNPSQEYHRLTTDLTRNTVFSDFYVENGSFLRLRNLQLGYTFNPLLLKKAKIQSARVYISANNLLTITQYQGFDPDIGSSGGTLAAGIDYGFYPQARTLMTGLSIKF\n>UniRef90_A0A565C3H5 BHLH domain-containing protein n=1 Tax=Arabis nemorensis TaxID=586526 
RepID=A0A565C3H5_9BRAS\nMNLLNSDDNLSMIEALLTSSDLCPLTPPNLSLETTLQKRLHAVLNGTHEAWTYAVFWKPSYYDYSGDSVLKWGDGIYKGDDGNSPRRRMKTTAEKDHRSNVLRELTSMIAGEGFPVMSDGDNDVEVTDTEWFYLVSMTWSFGSGSGLAGKAFATYDPVWVTGSDQIYGSGCDRARQGGDLGLQTIVCIPSDNGVLELGSTEQIRQNSDLFNKIRFLFNFERSKDFSGAPSLMPNELENGNLSXXXXXXXXXXXXXXXLVYKQIQNSLIQDLNFSTATFTSARDIPGEILSFGDDGIRISENPNHNSYSDQIPNEAGKISTGGQKFDSSYQFNIDDSDQYKIDDSILVLENKRPKKRGRKPAHDREVPINHVQAERLRREKLNKRFYALRAVVPNISKMDKASLLGDAIRYIHELKSKAKNTESEKNAIQIELNKLKEAITGRRENAISSVGEKDAITEIDVKIIGFDAMIRVESSKRNHPGARFMTALMDLELEVNHASISVINDLMIQQATVKMGSRSYTEEQLRVMLISKI\n>UniRef90_U4LXJ3 Similar to Putative alpha,alpha-trehalose-phosphate synthase [UDP-forming] 106 kDa subunit acc. no. O14081 n=1 Tax=Pyronema omphalodes (strain CBS 100304) TaxID=1076935 RepID=U4LXJ3_PYROM\nMSTGTTFVAALHLPYTVQFRSKESRPSSSKSLSSRSLPPPIPETRANVPQLTLSTLRNDLAKTPYGEPIATPMPNLLESLGHGNIATSPTPPLTPTTTTAEELFFRVPSTNSIALGSPSDPSMRRIPTIPAARPKATPFLPGGENVVGRGYFDIPVTEKLAPATRPSRRRSSVASGASIYSQQEQDDWTIEKTDFGNGGLKNAVEASQDASENVYVGTLGFGTDTLDEATKVAIEGRLREDHNCLVAYTSNADFDGHYNHYCKEVLWPVFHYLIPDHPKSKAFLDHSWQYFEALNRSIADVIIKDYKKGDTVWVNDYHLLLVPKMVRDALGPDARIGFFLHVGFPSSEIFRCLAHREKLLAGILGATMVGFQTEEYVRHFLQTCSRLLNVEVQENGVLLDSRLVNVVTLPIGIDPIQLAEKRNEQEVTNWTEQLQQRYAGKKLLVARDKLDGVRGVKQKLLAYELFLKKNPQWVGKVVLIQVALTTTSIVESQSTVSDIVTRINCTYSTLDYQPVVYLHQDITYHQYIALLQIADALVVTSLRDGMNLTSHEFVYLQDKHHAPLILSEFTGSAAIFGGAEISVNPWDHSMCARALERALTMPSQEKEERWKKLYARVTGHTAAHWFSEFLSKLEDAWEEQQRCGSAHIPRLSAKILAEQYSAARKKVFFLQYEGTLVSWGSSSSTVVTSPQRIMDTVNDLMEDPTNVVYIMSSRTVQDLEQIFLRVPSVGLFAEGGCFLRPFGKEKWIRLADPELPWKSSVRDILDYYVERTPGTWIEERSCSFIWHLEKAEDKASAQRQAGDCGNHVNGSCESFDVHAIPVTGGLLVECRRWNKVNACRLVLEHMEERKWVVDWILVAGSGRDDEGVFEWANGLRVEEGEEKEGKSKREVVTVRVGTGHTQAKATTNGVAGVVTALQRLANISVNEST\n>UniRef90_A0A8S0R5G1 Eukaryotic translation initiation factor 4B2 n=2 Tax=Olea europaea subsp. 
europaea TaxID=158383 RepID=A0A8S0R5G1_OLEEU\nMSKSPWKNIGDWAAESERAEAEEREQAEQAAAAAQAGGGNFPSLKEAVNTKQKKKTKMSLQEFTMQPSYGSGSAPPSRGLTQEEMFRLPTRPKERPPDEMQHGRHGGGFPSYGNRPGSGYGDGYSDRPTREFENRRSYGGFEDENRRGPTRVSGFDQQTSRADGVDNWASGKKALPDYTSGPAGRPARYSSLGGSSDGISRADEVDSWVATKKPFVQSQPPQQARSSGFGRLEPDRWTRNEGERQRLVLDPTKSDRGGDADVLVKVNKSNPFGAARPREEVLAEKGLDWKKMDMEIEVKKQQHSVSSSRPTSSQSSRPGSTHSSRSESLTTLQSGMAEGAAKQTPKMNPFGDAKPREVLLEQKGLDWRKIDLELEHRLVERPETEEENSLKEEIEHLKKEFLEKSGEEQSCLQDLILKREKDLELLRRELDDKVRYSQKVFERPGSGAGRDAISIERPSRLAPYEEPRAGFPERPPSRPGAHEDPRAGHSERPRSRPGLSEKYRPGFPERPSRPGLYEESRSVFTERPSRSGSYEETRAGFSEKSPSLSQAYQDPRAVDYMERPRSRGTVNSRTRPIDDRKASQGGGVRGFVGSRDVDRSRPRW\n>UniRef90_A0A1V5GBZ2 DUF11 domain-containing protein n=1 Tax=Firmicutes bacterium ADurb.BinA205 TaxID=1852897 RepID=A0A1V5GBZ2_9FIRM\nMATFYNQATLSYNGTVTNSNITAGEILEVLSADKYAVTSTYSADSDIVYIISIVNSGSSPVSNITVTDDLGAYPFGEEEDYAVPLTYNEGSVGYYINGIQQTPPTVADLSPLTITGITVPAGGNALIVYSARTNAFAPLGAGASITNTASISGTGFGTITASEQITADNAIDLAITKALSPSTVEANGEVTYTFVIQNFGGNAVTPADDVIFSDSFSPAIGSLTAEYNGTAWYEGTNYRYSETSGVFSSLSGQITVPAAQFIQDPATGEWSVQPGISTLTIKGNIL\n>UniRef90_UPI001F36B3C5 hypothetical protein n=1 Tax=Alicyclobacillus tolerans TaxID=90970 RepID=UPI001F36B3C5\nMTTVFFKNLQINSVSQTSGVFHGDNYLGGFVSKTKSNEGFGEVSGQKNVVVECLDLVLDLDTLDTVVKKPPSPSSE\n>UniRef90_W8SRT6 Transcriptional regulator, LysR family n=4 Tax=Alphaproteobacteria TaxID=28211 RepID=W8SRT6_9RHOB\nMDWDKLRIFHAVADAGSLTHAGDTLHLSQSAVSRQIRALEEGLNTTLFHRHARGLILTEQGELLFDATKHMTKRLDAAAARIRDSEEEVFGELRVTTTIGFGSLWLAPRLPALYAKYPDLRIDLMLEERVLDLPMREADVAIRMKEPSQADLIRRKLMAINMRLYASPSYLEKNGTPQSLEELSEHRLISQNANSAQVSAGAVLVRELTSYDVGSHLTVNNYFGVLQGVIHDLGIGVLPDYLTQDFPEMVRVLPNVESNEVPVFLAYPEELRQSKRIEAFREFVTEEVIAHRKRLKESLGAQAG\n>UniRef90_A0A0S8K1U0 Acyl-CoA_dh_1 domain-containing protein n=1 Tax=Anaerolineae bacterium SM23_84 TaxID=1703388 
RepID=A0A0S8K1U0_9CHLR\nMRVIHEYTRGCGRREEGGVYLVSELSPLGTLPPWVAIEPPILYGGEHFRGYIYVNGDQLLAGDEEGTWLIGPSLDRLIGEEWKLTLGMPLKIRQKFGICAGLKTVEDVTEKLADLGLYSDKMYPEIATDIHRALEYLKQLDTPAEGAASQLKMAQRLGLSGAQILARCWLIARQLLWDLPLRDPHNDIRVELRKDLARVMVLVGALEDARDLLTGRSREARATGRRSGALTEANTAAAPAPPNGGPARVERWPSVWLHAGRILRAAYSSSIVARSPCFVINSSHFCQTASWNCSRVPRSARLSASCRKSAHAGNGNLIAS\n>UniRef90_A0A5P8D839 Lipoprotein n=1 Tax=Mycobacterium phage Marshawn TaxID=2652423 RepID=A0A5P8D839_9CAUD\nMNRTLKGLAAAVAAATAVTVVGCSSDADVASDNLSKASEQFEVSRRIVAINGVTDKYLFVVEGRCSLEYPENRTEIVCKLDDGNLIKHVVRQSDNVTLIMEQTNGTAVSTDHYRVIFKPEVIIPNVDRP\n>UniRef90_A0A1X7C2T9 histidine kinase n=4 Tax=Cellulosimicrobium TaxID=157920 RepID=A0A1X7C2T9_CELCE\nMLRRLSVRGKILAALAVPVLVLFAAAAIISAQAISTARDASQTSALVAALAAQDAAGTEIAAERTYAFLDARGASEDAEAQMMAQREKTDKALDVRDRAYERLDTSALDPRVREALADTIADRSDLQSVRQAIDRSGLGQLQRNSLYGNLIDDALEVPRTLADTTPDRGLAQYLDTYVLLDELLAQQALEQPVAGAVLQAAQVGQESIATNQQAAVLVTTGDELAKRTQTAVRQLPGELRLETATATYNQIRQNLMGSRPGATPASQAAEWPALSQADRDQTAPVRDAVRVETEKKASDLAAAATTRAVVTILVTLAAVILSVLVAGLIARAIVNPLRRLTDAAEDVRDQLPKLVEQVAVPGQGPGIDLAPIAVESTDEVGQLATAFNDVNETTIRVAREQAALRGSIAEMFVNVARRDQVLLNRQLAFLDDLERSEEDAGTLSNLFRLDHLATRMRRNAESLLVLAGIDSGRRVRQPMPASDVIRTASSEIELYDRVRLNLVVDPLMLGHNALNAAHLLAELLENATMFSEPHTPVEVTTGRDENFVYVTVRDHGLGMTPEEIADANRKVATHAASDVVGAQRLGLFVVGRLADRLGAKVRFSAGGDEQGTEVVVSFPAVLFVPDSSVPLPQPTDPLETSTQAAAQQLAGPAAAPALPAPEAPAPFAAPAATASFPAVEPEAPAAVPVDIDALTDGTTQTGMPRRRSRTVDPAAAAPSASFASGPQTGAIVLPPLATPALPDQLPAADEAWTPPAEVADAGSALPSRARPAATPVEPVSAEIPVLDVSTRSALFSSFRPMGDRPAENPVELPAAPDVTATDIPLVTEVPTGSAPVPQDAWSPQPAPAEEPVAQAWPAPEAQAWAPEQAWAPEQPAVAAEQPPAAPEQPAEQSWAPAQAADTWAPSSVGDESLDATRVVPPVPAEPAEEATVARVPLAERAPAVSAPAAPEARPAEDVPVVESANAAAPAEDIPAELTFEALPRFEELMADLPTRRSLRESQARKRGLFGRRPRTTATPQARPAGTSASAAPAATAPAPAGPSAPAPSAPAPAAPAAAATPTAAPVAPSIPVAPQEPAAPARTSAFAPRADQPAPAASFAPPTTPAEEQVPASPEAAYTPLETAYSATEAPAAPQPSYEPSYAAPEQAYAPDVAPSEAGREPAPARDSWAPEPADAAEPAGYGPPSPLVRRPVSETTLEPLEPGYISDSVEARSDWMASAVLYEEMSTLLQGSTDFQEATLADSNDGIYQPLKVDATTASGLARRSRGEEREGYVDRFTARIDRDPEQLRARLSAFQSATARGRVEGQDETSS
TWDPQAVDYVPDSAPQAR\n>UniRef90_A0A6G5YKI4 Haemolysin XhlA n=1 Tax=Bacteriophage sp. TaxID=38018 RepID=A0A6G5YKI4_9VIRU\nMDYMDDYRQQVTDARFQDLKEVINTRFDDMNSRLVTISKQLDNYETKDHAASEINHLAFRCDDLEQKLQDAEDELAKFREGIYRKAALLTTVLSSIVSLVFGILQFVIH\n>UniRef90_UPI00190A6268 non-ribosomal peptide synthetase n=2 Tax=unclassified Streptomyces TaxID=2593676 RepID=UPI00190A6268\nMEKYRSLPAVGDTVVQLPDAGIPELFERQAAMTPDAVAVVSGDASMTYGELDAGASGVARELLRRGVGPESVVAVAFPRSPELLVALLGVLKAGAAYLPTDPDYPAERVGFMWGDARPVLLLTTAGTAVDLPDSCPRLTLEDLSPADAAPGGRTPYGGPAVHADQLAYVIYTSGSTGTPKGIGVTHRDVVALAADRRWYGGAHERVLLHSPLAFDASVYEIWVPLLNGGRVVVDPDGDLTPGGLSRLVADHGITAVFLTTALFNLLVDEDVRCLAGLREVWTGGERVSPAAFRQAVDACPRTTFVHVYGPTETTVFAVCRPMDPARPVGGDVPIGRPMDHTRTYVLDGSLRRVPPGAAGELYVAGAGVARGYLNRSALTAERFVACPYGTAGERMYRTGDVVLTTPDGELVFQGRADAQVKVRGFRIEPGEIESVLLAHPDVAQAVVTAREDRGAGTGKQLVGYVVPAGAGDGGAALDSASLVGELRTFVAERLPEFMMPAALVVLEQLPLTPNGKLDRTALPAPEFTAMTYRAPRSAGEETLAGIFAEVLGLGRVGIDDDFFTIGGDSIRSIQVVTRARAHGVSVSAGEIFRHRTVTGLAEAAAANARDGGSPVLAELDGGGVGPMPLMPVAKWIEELGPGFDRLSQAMVLELPAGIDRGGLAATVTAVLDRHDLLRARLIPDGLLVDPPGSVDADRLIRDVTCDGQWSGEPWRHLLVGELDEAAGRLDPAAGVVAQFVRFEPPSGPGRLLVVLHHLVIDGVSWRILMPDFAAAWKRIRAGEAPEPAGTLTSARRWAHALVDDAAGAARMAELPLWRSTVDGPDPLLGSRRLDPAVDVRSTVEKVRVLLPVPVTEALLTAVPTVFHGGVNDGLLTGLALAVGQWRRTRGVDEPSTLLTLEGHGREEDAVPGADLSRTVGWFTSVFPVRLDLAGIDLDEAFAGGPAAGAALKAVKEQLLAVPGRGIGYGLLRYLNPETAEVLRAYPMGQIGFNYLGRFSAADMPEELRGLGWTGTAELAEFTELAELDAGHDAAMPALSEVDINATVTDTAAGPRLGAVFGAPTGVLSPAEVRELADLWCAALRGLARYAAEPGAGGLTPSDVPLVSVGQREIEAWEKVYPALVDVWPLTALQSGLLHHSMLAGADADTYQVQLVFGFEGAVDASRMRAAAQALLDRYASLRTAYVPDSAGDFVQLVVEGVTLPWREVRVAAEAYEEFLAEERSVPFDTAAPPLLRTTLVRIGAERTELVLTAHHVLFDGWSEPILLHDLLCLYASDGSAPADPPSFKDFLAWLARRDQEQSVRAYARALEGVTGPTLLAPADPATGAAGFGELDVDLTAAEAQMLARRAADLGTTLNSVVQAAWAVLLAELTGGSDVVFGATVSGRPPTLAGVDSNVGLFINTLPVHVSCAPWKTLARVAADVQSAQAALLDHHDCGLADLHEATGLGVLFDTLVAFQSYPFDNTSIAEASSAAGLGVPSFRSIGGSHYPLVVMAEQDPHLRLRLQYRHSAFERDAAGRMADRFLRVLRAFLADPAGRVGAVGIRTPDERNTSRPEPGTPEVSVPELFVRRAAAMPDAPALVVDEVPVTFRELNARADRLAGACLGLGLGPDSVVAVRCSDPVDQVVALLGVLKAGACFLPID
PEDPPQWSDAVVRDAGPRAVVVDQEAAGPSWGVPRIRVEAPAGDSGPADGGPTGPALPGHMAYVDYVPDESAQPCGTAVTRGGMAARVPRFETFFPGETLAVGPGTRATDLLLALCAGRTVEVRKEAPSAHGDAPDSDRVQVLSPSLAPAAAEAVGELYVTGDVGRGHPGRPGLTAQRFVADPYGTAGSRMYRTGVLGPQGAPGTPAVGSPEVRTGRRAVESVLLAHPGVARAAVVTDGPGLVGYVVADGQAAVVADELRAFVARHLPDRLVPSALVEVDRLPMTANGRLDRRRLPAVAGEQHRTARGEREVLLSRLFSDVLGREEIGIDDDFFALGGNSLLATRLIGRIRNELGVEVSIRSVFQYTTIAELDAQWDDIATASGPRLRKTSRK\n>UniRef90_A0A4R1FKP2 Lipoprotein n=1 Tax=Nocardia alba TaxID=225051 RepID=A0A4R1FKP2_9NOCA\nMGVVSEIEGSRRRIMMSRSVSYTLPAVVAVALVSAGCGSATPKPAPRAASATLTTTSKPPLTTSRSATPTTTAAKSAAVGVCVDKTTNVRVADDRCDTGSSTHSRFWYQHTDTFVYPAIGVAVALAAGSFLRPTTGEVFDRGAPTDGGTVARGGLGKARPDSSGGGGSAGS\n>UniRef90_A0A5E4BYY0 Calmodulin protein 4-like n=1 Tax=Marmota monax TaxID=9995 RepID=A0A5E4BYY0_MARMO\nMTTVTIVNQVELAVTRVQGGRLTSPRAFPSLLTLLFGGFLDRNGELDFSTFLTIMHTQIKQEDPKKEILLAMLMADKEKKGYIMASELRAKLTRLGEKLTQKEVEDLFKEANIEPNGKVKYDEFIQKITLPVQDY\n>UniRef90_UPI00101D8BA6 hypothetical protein n=1 Tax=Sphingosinicella sp. CPCC 101087 TaxID=2497754 RepID=UPI00101D8BA6\nMTDGARLFLDAWTHARPQPPARRAATLLARLGGEAEPERLPIGVRDRRLLELFAGMAGAHLAGVAECDSCGGAIEVAASVDMLMSGPPTAPILVEIDGERVPVRFPTTHDVLAAVAAPDPSRRLAELCAGKGELGAGEAEQVGAALLAADPLLDPQIAVTCPDCGAETVFGFDVGAFLWAKVEDRARHLLSQIHRLACAYGWTESEILKLPEARRAAYLELSAA\n>UniRef90_A0A8D2QA42 NME/NM23 nucleoside diphosphate kinase 3 n=1 Tax=Zonotrichia albicollis TaxID=44394 RepID=A0A8D2QA42_ZONAL\nSSGSKPSIRTNSFPSPCLEASPPELNLSSCLPGLVPSAQLQHPGSQRSVCSVQASEELLKEHYSALRDRPFYGRLVKYMSSGPIVAMVWQGLDVVKTVRSMIGETNPAESRPGTIRGDFCVEVGKHSCAKPARNESAFPEQKFSLLCSDQS\n>UniRef90_A0A8D2AEW9 Espin n=1 Tax=Sciurus vulgaris TaxID=55149 RepID=A0A8D2AEW9_SCIVU\nMAHSEEAALLPGNHVQNGCAADPKASRELPPPPPPPPPPLPEAQSSLPPAPPLPLEGAGSGQRRSSSSTGSTKSFNMMSPTGDNSELLAEIKAGKSLKPTPQSKGLTTVFSGSRQPATQPDTQVPPVSPAPSRARSPTPPAVGPQPLLNGSIVPAPPAIPAPGVQLNVETLVPTHDEQGRPIPEWKRQVMVRKLLVKMQEEEEQKRKEEEEEARLASLPAWRRDLLRKKMEEEREQKRKEEERQKQEEIQREKEQSEKLRTLGYDESKLAPWQRQVILKKGDIPKY\n>UniRef90_UPI001E3E9EE4 hypothetical protein n=1 Tax=Mucilaginibacter roseus TaxID=1528868 
RepID=UPI001E3E9EE4\nMMISIAACKNDNDNNPEPSVESVTIDGTSYPTVKIGKQQWISINYSGKGGVFYNGDRDVKYGKLYTRKEAQAIKLQDGWRLPTRSDFVKLASNFPNISADGYVNLKPEGVLKLASSSGWRDKSGDNSSGFNALPAGICKVEADGDNDYSYRGIATQFISSTTETFNDNGATRARTTTFFLQIANSSSQPPTTETAGGVVDVIRADDYRFSVRFLRDID\n>UniRef90_A0A7W0CLV6 S1 motif domain-containing protein n=1 Tax=Nonomuraea soli TaxID=1032476 RepID=A0A7W0CLV6_9ACTN\nMLSIQQRIADELGVREGQVSAAVDLLDGGSTVPFIARYRKEVTGALDDAQLRTLEERLRYLRDMEERRAAILESIESQGKLTDELREQILAAETKARLEDIYLPYKPKRRTKAQIARELGLEPLADALLADPSLDPVATAGPYVVEGLADAAAALEGARAILIERFAEDADLIGSLRERMWSYGQVSSRVKEGKEEAGAKFSDYFEFAEPFTKLPSHRILAIFRGEKEDVLSVALEPEEGDEYELRIASRFGVSDQGRPADKWLNETVRWAWRTRILVHLGIDLRTRLWQAAEDEAVRVFAANLKDLLLAAPAGARTTMGLDPGLRTGVKVAVVDKTGKVVETATIYPHEPKRQWDQSLAVLGALCQRHGVELIAIGNGTASRETDRLAAELVKHMPGITKIVVSEAGASVYSASEYASKELPELDVSLRGAVSIARRLQDPLAELVKIDPKSIGVGQYQHDVSETKLSRSLDAVVEDAVNAVGVDVNTASAPLLTRVSGIGSTLAASIVAHRDGNGPFRSRTALKDVPRLGPKAFEQCAGFLRIPGGDDPLDSSAVHPEAYPVVRRILTSAATDLKTLIGNTAALRSLKPADYVDDTFGLPTVTDILGELEKPGRDPRPAFKTATFKEGVEKISDLAPGMILEGVVTNVAAFGAFVDVGVHQDGLVHVSAMSRTFVKDPRDVAKPGDIVRVKVLDVDIPRKRISLTMRLEDETEQPTSGGAAGGGSGRGPRQSGGRPGGPRPASQDGRSTDTRPARDGAGGDASGRGGSRDGSARQGAGSGGAGSGSGRDGARGNRDNRGQRGDRSGDRAGDRSGDRAGDRSGDRAGDRSGDRGNDRGNDRRGGQRSGGDRRQDRSAPSGAMAEALRKAGLGGGSDTR\n>UniRef90_UPI00068DFD47 tetratricopeptide repeat protein n=1 Tax=Herbidospora cretacea TaxID=28444 
RepID=UPI00068DFD47\nMNPPEASGEAAVHNEITNGVFFSAVIQGRDITVQLPPQITPALSGMPAGSPAFTGRDLDLRDVLDVLAPVGTTDGSVPSTAVSSAAVVVTAVGGMGGVGKTELAIQAARTALDCGWFPGGVLFVDLFGYDKARRVEPGEALGGLLHALAIPGDHIPSDTEDRARLYASVLAAYAAAGRRVLVVIDNVCSAEQARPLLPTDGSSKAIVTSRHTLGMLGARLLDLKVLAEAEAVALLTRAVDIARPGDTRVSDHPEEAAELAHLCGYLPLALQIIAALLAENPVRPLSTMIEELADESSRLDEMEYGEVAVRAAFELSYRHLAAQEARVFRLLPVNPGPDVSTQAAAVLTGLEAVPARRLLERLARAHLIEHGLGYGRWRMHDLVRLFAEEHGRADAAADGRADALTVLLVHYHSTATAACHHLAATDRDAAKGGFGGRGDALTWLDAERANLVAATHTAAGHDPHRAIARDLPIRLGPFLQLRRHFDDWVALTTAALDAARELGDRRGEARASGDLGLAFRYSRRFDESISAHREAARIWRELGDRGGEARALSNLGLALQEVRRFDDAVAANQESLNIQRELGDRSGEARSLGTYGNALVLKRQFDEAVNVYRKARDIFHAMGDQSMEAAILANLGVALHELRRLDEVAVTYQDALRIYRELEDRHGQARTLTNLGHLLLEEQQLNLNDAVTNLQDALVLFRELEDRHGEARALNNLGLALQGLGQPNVAVTVHQQAVNAFRELEDRHGEAQALCNIGRSLLELMRFDEAIPHLRSALDLFAKIEDRHGAAQVLINQGVALTGLRRFDEAVAAIEEARDVFRELGDQHREAIALTNLEEIRRHR\n>UniRef90_A0A7C6BF04 Glutamate synthase n=1 Tax=Rhodobacterales bacterium TaxID=1948890 RepID=A0A7C6BF04_9RHOB\nIMMRSGAKSVTLITASGLPGPDTAPDDLINVVPCELEEAVEEGLQIIDHATVGRLIMKGSRVTGVEIVSLKKEVGKDGRKRRVASFGTERVVSVDMVVPCVGEQVDPEAFEGYIDGAYFWPDNPYGRIAEGVYAIGDARGNRGTVAAAIGDGRIAAEAVAAELSGEIDPPADERPVMELDGLNTAYYASTARVKVGKLAVSERTFEAEIEGAISRSEALAEAQRCLSCGNCLACDNCWTMCPDNAVIKTTELARDGSHYVFDYDYCKGCGICAQECPTGYIQSVPETS\n>UniRef90_UPI0008A66679 hypothetical protein n=1 Tax=Streptococcus sp. 
HMSC072D07 TaxID=1739495 RepID=UPI0008A66679\nMVKSLCISDSREGIIEHIPKGAIAYYLPNPRGRKKVFFTKETLLLMYHLIRLKYFSREMILDQYFILTGKELYNDALYSLIGNSRMPICQFSSNYNIGRTKFMYVPKVFASWLLSVIPQIPELAELTEVTEYDGSHYSLITNRMNGGTYGIKKINLHDANTRSLALKIGRALIENKVGVSPSELNITYFFPTNRELISVVPDAVIFVQGERYYIEYDRNTEQHFKLLGKIIGYFEESYYKGDTIFFVFDNISEPKDNYLNARVMNFISNVHNVKFKDSGLTYYEQAQQNKVSLYALPYVNAISQIAEVIHLELDHDSTKEDIELVDRFKNEHLVPYEVLSADLVDEPDSPFDLTLTYIDDFFDKKEMPLLKLNYGDISNPDYFENLYKEYKDVYPQCGIIFSASISKQYYPIPHDDFFLAIYIR\n>UniRef90_UPI0019112769 ABC transporter substrate-binding protein n=1 Tax=unclassified Pseudomonas TaxID=196821 RepID=UPI0019112769\nMTKPLETLWYTHSPVPTGLGIAVQSGRLAEAFTPFGTNIQSLRESSEREVREAHYDHHLQNSVRHGGNIPAIWAYASGVETRVLGLSWSDEVQLILTTEESGVRSIRDLKNRRFGIPKWANVQIDFTRAQALRGLENALKLEGLAVGDVELVDYPYGGTYSDDAKRHLYGAEVSLGTSRVSRRNNELIGLLRGDIDAIFLKGAHAVHLAHEFGLRVVVDTGSHPDPLIRSNNGTPRTLTVDRHLLENHFDASRTLVDTVLRTEQWAWANPVETRRFLARELNTSEYWVAAAYGDDAHRRLRTALDSRSIEALQDFTEFLFRWGFIPRRFDVKAWIDFRVLESVIGSTSRLAV\n>UniRef90_A0A7C7DC20 2-isopropylmalate synthase n=1 Tax=Firmicutes bacterium TaxID=1879010 RepID=A0A7C7DC20_9FIRM\nMRQVFIFDTTLRDGEQSPGVNLNVEEKVEIATQLAKLRVDVIEAGFPVASPGDFAAVEAVASQIKGPTIAALARTMEKDIDKAWEALRYAERPRIHTFIATSPVHMRYKLRKSPDEVLRMAVEAVRHAKSLTNDVEFSAEDAARSDRGFLREIFEAVIEAGATVINIPDTVGYSTPWEFADLVSYVKANTAGIDRVTISVHCHNDLGLAVANSLAAVTAGATQVECTINGLGERAGNAALEEVVMALRTRKDYFDVSVGIDTTHIYRTSRLVSSLTAVFVQPNKAVVGDNAFAHESGIHQDGILKERTTYEIMTPESVGLPESRLVLGKHSGRHAFSEKLKALGYSLTRDEMEKAFNRFIELADKKKQVSDRDIEAIVEDELVATPGFFELEYIHVISGNHAVPTATVRLKTVDGSVEEAACGDGPVEAVFKAVDAAAKLETHLVSYSLNAVTGGKDALGEATVRIKDNGDTYVGRGTSTDVIEASAKAYVQAINKLLHNRRTFSKAAAPAGAAGVSRPVQDALGTSGS\n>UniRef90_A0A8H6QPS6 Uncharacterized protein n=3 Tax=Aspergillus TaxID=5052 RepID=A0A8H6QPS6_9EURO\nMAPTKEAASSTSTSTSTSSSSPSSCPTNSASDANTNISDHGSGDSKTLAVGVGVGVSLGVVSLISLIWGVYERRKRQQLLNSMPSMMPMNSDPYAPPAVAKNQYTEPQELAP\n>UniRef90_A0A6P6W929 uncharacterized aarF domain-containing protein kinase At5g05200, chloroplastic-like n=4 Tax=Coffea TaxID=13442 
RepID=A0A6P6W929_COFAR\nMAGVSLMRGMVNDGCLSIFHHQSRQLAPVTVRVSSRSRSTAARKLQFLSKRSSFYARYSQSRDIFTSRVQDRMEKLPKLVEDIVQTSLSTGPRGALRLAQGIQAVLGVGSEWLADLSKTANSSTTLPTEMQLGLLSPLYLRRLFERMGATYIKLGQFIASAPTLFPPQYVQEFQYCFDRVPAVPFADIQAILREELGQPIDAIFEYVDPTPLASASIAQVHGARIRGTQEDVVIKVLKPGIEDTLVADLNFVYIVARILEFLSPELNRASLVAIVKDIRESMLDEVDFKKEAANIESFRRYLEAMGLTRQATAPKVYLQYSTRRVLTMERLYGVPLTDLDSISALVPSPEASLITALNVWFGSLLACETFHADVHAGNLWLLRDGRIGFLDFGIVGRISPKTWAAMEIFLQSLATEDYNSMASALIDMDATNKDVDSMAFARDLEKIFSSIQDLDTEIVVATARGPNTSTTAVAANVIVDERQMNALFLDLVRVSESYGLRFPREFALLMKQLLYFDRYTRLLAPNLDMLRDQRITIVPNQRSRRIY\n>UniRef90_UPI001C62E845 hypothetical protein n=1 Tax=Qipengyuania flava TaxID=192812 RepID=UPI001C62E845\nMAIASVWVLSGGLGGGSLLTWVVGLPGFLFFGGAMVGFVAALFDRRVKVSVSPQGLVVYPHSPRPIALRSIKRIGTQQSQVRILLHKPSKYPVEGRWRKALIAISSGIQRANGDVWMFCQLYDCSAREMVDAIRAARPRTKFEQEIDAVVASWDENGGPYGDAAHG\n>UniRef90_A0A1E7NDJ8 3-dehydroquinate synthase n=37 Tax=Actinomycetia TaxID=1760 RepID=A0A1E7NDJ8_KITAU\nMTDTTVRIHVGGSAGHDPYDVLIGHQLLGELAPLIGTRAKRVAIIHPEALAATADAIREDLAGEGYEAIALQVPNAEEAKSAEVAAYCWSVLGQTGFTRSDVVVGLGGGATTDLAGFVAATWLRGVRWISMPTTLLGMVDAAVGGKTGINIAEGKNMVGAFHPPVGVLADLGTLETVPRHDYVSGLAEVIKCGFIADPAILDLIEADPEGAKSPAGPHTVELIRRAIQVKADVVSGDLKESGRREILNYGHTLGHAIERNERYKWRHGAAISIGMVFAAELGRLAGRLDDETADRHRTVLASVGLPLSYRADAWPKLLDAMKIDKKSRGDLIRFIVLDGLGKTSVLEGPDPSLLVAAYAEVSA\n>UniRef90_A0A1E3H4Y8 2-keto-3-deoxy-L-fuconate dehydrogenase n=1 Tax=Methylobrevis pamukkalensis TaxID=1439726 RepID=A0A1E3H4Y8_9HYPH\nMTDRLKGKTAIVTAAAQGMGRTAVLAFAAEGARVLATDVNAERLAALADVPGVTTRLLDVTDGAAVAALAAEAEAPDILFNCAGFVHHGTVLDCDEAAWDFSFDLNVKSMYRMIRALLPGMLDNGGGSVINMASVASSVIGAPNRFVYGASKAAVIGMTKALATDFVARGVRFNAVCPGTVESPSLEGRMRALGDYETTRAAFVNRQPMGRLGTAEEIAHLVVYLASDESAFMTGQAIVIDGGWSNT\n>UniRef90_A0A374BYN1 ParB/RepB/Spo0J family partition protein n=2 Tax=unclassified Firmicutes sensu stricto TaxID=84086 RepID=A0A374BYN1_9FIRM\nMSEGKMNIGSAEGDQVLELDINRLRAFKNHPFKVTADMSMVELKDSIEKYGILNPFIVRPVPEGYYEIISGHRRKFAAKQLGYTKVPVIIKVMKNDEAIVAMVESNLQAGLIFV\n>UniRef90_A0A254RGW8 Endoglucanase n=1 
Tax=Fibrobacter sp. UWR2 TaxID=1964352 RepID=A0A254RGW8_9BACT\nMSFKKLITTSTASVIALFIAACGDSDSGLRPVNENPDTPSSEAAVDPSSSSVADTSAQIPPVTGTGLLIDDLEDGDGSTLIGSGWYTYDDHDNGGASVITTPNVTEKGDPLPTATDNGSLYAFTVNYTLDKGDYAYDPYVGWGLLVPDAIDCSNFGGISYWYKGGKHEIHVETTDVTDYDVHLATVPASREWKQVSIRFKDLAQGGWGEEVAFDPFHIRAVSFQAKGDKVTDSLSIDNLYFQDTSEVEKDKPDMTIMDPIIPTVVIPEDLTISSPLQEKAMKYLNKGINITNWLEENKAYFKGKFKFDESDVKLMADNGIKSLRFPIDLDSYATNRDEFVADTTDTVELKFDDENLFAVLDSFVEWTGKHNMSFVIDYHEYDNSYNITSSKNARYIKMMANVWKHVAAHYASNEREDIFYELLNEPDMTNGAVKSPAWHAAAQEDVDSIRTVDTKHTIIFGDAEWYSISVLSKSEPLNDDNVIYAIHTYEPFIFTHQSASWAETKTIKNLMFPYDKEKWSEYSADFGVTKSTPSHIKNSLKNYNRTGSMEAILKSVVPAKKWAIEHNVPVIINEFGAYNLKTDKQSVLNYMSAMRTISDTLQIPLTHWGYTGGFALFDSEDGVKGTKLIDGMKEAYGL\n>UniRef90_A0A0A9IMK9 Protein Iojap-related, mitochondrial n=1 Tax=Arundo donax TaxID=35708 RepID=A0A0A9IMK9_ARUDO\nMPSVEGQQAGKWVVIDSGSIIIHALEERAREYYDLESIWSKEVSSNISVQELETSLVKTRRRNHSQKPMKSI\n>UniRef90_A0A4D4MEH6 Mrr_cat domain-containing protein n=1 Tax=Streptomyces avermitilis TaxID=33903 RepID=A0A4D4MEH6_STRAX\nMHQRGLPRKSSHPRAESAPGGPGRAARDSKGAAAYRERKLHKLRNKLTLAEVDRLLTIQETRWMQDMQDGHADGFGATNVWFPSTPTQAIDWRACEHIAAEHLRALGIADAEVTPARGDAGIDVRSEIAIAQVKHQRTPVGRPALQNLVGAAGPAHRGEIKPLKFFYSTSGYAKPAVEYARVNDVILYVINPATGCVSFVSTLYATSVSMPGLIR\n>UniRef90_A0A3B3QJW8 Cingulin like 1 n=5 Tax=Mormyridae TaxID=31092 
RepID=A0A3B3QJW8_9TELE\nMEMESYRVGGISGGSLPPAYLAHECPSRPVSSGPGRYGLSIRVQGIGGHPYVVLNNREREPSPCKELESNGHSADGDPAEQYGQDRYTPPWEQHPDDSLVEYRSHKQMLFAGSHNGVTEFQESQKKPSTLLNFQRHPELLRPYDPENNSLNLEDLPVLTPRPASLSETGSLPCSQLTRGMSPSLDKPGTSATPVYQDRFPQQSEAQVQSLPRRHAPSPDRPAFQVQPETQEMLLPEPTPQSRQPVRPEAQVQQKPQLETQVQSPPHQQAKPQKPVQPTPQDQQKPQTEAAALAPSAPDAGQQARVAPPASTSTGSSLERSRRKPDVLLLRRHDSSGPVLQSQHSSHSSSSPSSTSRPLLGDPLESLGSDPINRHQNRRYIPFMPGTGRDIDTGSIKAVEELIDKFDGKEGLQRRGRAGRRNRINPEERKRSRSVDSAFPFGIRGDTDYLEEFSKNQGRSTEHVLRPSQLRQLKGALAQDFSGPTSPPRGKDGASAVARGRSAPGSPQGTALHSASSALGCRTAVSRSSTLPLESKGGDEPKSIRSFKVLTGMAAASPAVSMISSSKKNEADNPVTPDLLKDQQTLSQQTNEETAKQILFNYLKDGNPDNDDTTKRKVNLVFEKIQTLKSRAAGNVQGDNNPPEAASEVKALQDQKNQLEKEVTVLKKQLEEETKKTAGPTEVQENAGMRDLRMELVRSMEECARLQELLSKAEEELRTTMEELFQVKMEKEKHQTEIRDLQDQLSEMHDELDGAKRSESEGGEQEDVLEEMMQLKLDFQELLQVKEEQEELLRRRERELTALKGALKEEVATHDKEVDTLREQYEEEIRKLLSCVEDAKQNNVSVCREKQEVEAAKGVAESRVERLSLETERLRRRVQELENEVAKLNRIIDESKLQEGRLTDHMRHLEKENSLLGDSLAEVREQEEAMSRANRALTTRLEDVQRNLTKLTQDHKDLNEKLKEERIQKEQFKRTKDEIEDERRLLDRTVEKLQKEMCDMVEASQTSTQDLQVQIDEYKEKNRRELAELQRQLQERGVELENSRMATRKLQEEVSHLEEDLKQCKKERDEAVLREKKLELKVFDLEVELENVSHSKQDRPRYSKITEDRITQLEMDLEEERNNGDLLMDRIEQGRKQVEEMRNELLQERAMRQDLECDKVALERQNKDLKSRVTHLEGSQKSNKESLVSQLEGRIQELEERLEGEERDRANLQLVNRKLERKVKELMIQVDDEHTALQDQKDQLHLRLKALKRQIHEAEEEIERQEHGKKKLQRELEEQLEANEQLQGQILGLRNEMRRKNTTAPSLKDLDDNDDDMSTDGEIYYRSASGYKRSNHNPIS\n>UniRef90_A0A3P9PT27 Chromosome 11 open reading frame 87 n=1 Tax=Poecilia reticulata TaxID=8081 RepID=A0A3P9PT27_POERE\nMLAAPAASHCVKCVTTIRFTHFSPALPDCFIVAEASGLPAPPQRCLGGLQPNNGTCAEQLSVSLFPPLSSTLALLVLVAVLVGIILVSLATFLFHKRKLRNRKIQRAQEEYERDSRSPARAGPGAGEPARPCVIVRPVRRDEKPSRVTGCVRVAAEPWPRSTGSPHGRQKKPSGIQYF\n>UniRef90_A0A183N228 Secreted protein n=1 Tax=Schistosoma margrebowiei TaxID=48269 RepID=A0A183N228_9TREM\nMGQGLELHDFISLFIEVFDFLLLLLCTVRHGWGVGQVLIANFFSTFLVNDSLFLLEVCKIFEGISTADDLFTLPILNGDE\n>UniRef90_A0A2U8W4D6 DUF2092 domain-containing protein n=2 Tax=Methylobacterium durans TaxID=2202825 
RepID=A0A2U8W4D6_9HYPH\nMSTAEPTVVRPAPKFCRNVSTRALPRACACTSIPRGARPRSGSGRQSGGSNAAALRRPAAEARASQPRCPRDREETMARPRDAIGLLAALVLCMTAPERAAAQQPAAAQPAQGVEPAAVALLKAAGDTLAAAKSLRFTAIAVHDVPNAEGQSIFYTVRSRVEFRRPDRLRVVTDGDGPSREFIVDGRTLTLFRPEADTVATAPAPASLDAALKAEVAATGESQAFADMLLTNPAQALTNGLTRAFVVGRSRLVGGVETDVVAFADRDAQAQVWIGVQDRLPRQLYVTETGAPGRPRNAVTFSDWMIDPPIEDRIFSTAHTEGARSVPFPNPDF\n>UniRef90_A0A419WT42 Uncharacterized protein n=1 Tax=Marinifilum flexuosum TaxID=1117708 RepID=A0A419WT42_9BACT\nMNKNTKVIEKYYEQIKANIELGLSPADFANKCVSDYVLIQDNEIKRKREEREKKKKNKIIKKQKEQAKTNIQEREKDLARTILYTKKMVKPITNTSEIDSKNANINPEQRRANKIAKLNINSLSSKMHVTDEVKDLGRLSTKEFDKNTVEGAINSLKMASRMLDLMRGGDDDSDEDYDDDIDE\n>UniRef90_A0A6S4NGA2 GRAM_POS_ANCHORING domain-containing protein n=2 Tax=Lactobacillus johnsonii TaxID=33959 RepID=A0A6S4NGA2_LACJH\nMPTDAEIIQAIGGLKSGDVYINGFTNGQMPVNVGSYQVKITDQLLQRLQAAFPDYDWDAVSGNNGTARSGSSDSDPIDARHEPATYVITPADTTVTINGAEHIKYGENSTIQYGSDNGYSITITAPVKNETTDNEHEPIYTDLKLETGDLEFVTTPGNVGTYEVKLSAQGLKKLQALTGSTNYSWTQASEARANFFVDQMPVTITVGGNEQNVTYSSNDWLKAIKENPQGYTLTVMTENGTTLNYQAKDGDLIFSQTPGDVGSYQVVLSAQGLDNIKQALGTNYAYPQAASDVTTYGTFNVNQGEVTISLDGSDSKIYDGKTTVPADLNIGKYNLTYSAPVYAPDGSPQTIKLTSDDLQFANGDPINAGTYTVELSPAGQAKLKNLTGNNGDNYKWIFNTQATYTINSATDASASLSGSNQMIFNGSPVTTAEINNGGNIVVNLNFPGSTENSIYHLQDGDYIWNDGAAPTNVGTYTIKLTQAGLAHLQAAIDQYAGSGNAKISADSLTGSATFEIVPKSITDVTISGKDQEKTYDGQAASLDVNDLTISATNLVTDSPLSMKDISASDFDWYDAQGKKLDAIPADAGTYEARLKPSALQALQKDNPNYSFNTASGTIKYTINQKAATDTLDGNGNKVYNGQETTVSDVLNSITWTPSGIVDGQSLDLSKLSDADYAWYTKNADGTYTEMAGLPTNAGTYYLKLKDSSIAKIQVANPNYSFATGAISGEYTYVITQANAVITLPNTSDQTVTWTGNPATIDPANFIPEITTDNPNEKTIVLPSTLQLTASDYEFSQNGKVISAPSEVGTYQVRLTEAGWQKVQNAIAENTNYTWNYQGEGNYHIEKATANVTLDGSASTIYTGNSVVIPATAGVVNGINVKLSNGQTYVLKPEDLEFVNDQGNQIPAPTDAGTYKVRLTKIALDQIRNIESNHYNYTYNNDAVDFTIEKANADVITSGSYDVVYNGQTPEINVDKITNTIATNNDVKLTAPTLTADDYEWVDETGKVITDPVNVGTYYLKLKDSSQSKIANNSNYIWNFKGLASVTISKANATIGFNGNQETSYTGSVIAVDPDKFEVKLSNGQTYQLTDKDIQVIGNPINVGTYKVELSQAGIDSIKAADSNYNYSYDDSQGVLVIVPAKASATISGSQTTQDLELDPHNYSVVLTLNGQQQTITGLTASDFVFSKDGHPAQLTEAGTYDVELSGDAI
NKIRQENPNYNIDFSSTATFTLENSSQTINYVDADNNVIGSTNISGHIKGTKLPFTPEIPVGWVASDPSDVPTEITINNGTTIIKIKHGTTNVDHNNPVPDGAKTVTGEVIDGAHASDLNQTITRTINVTNPDGTKSTEVQTAKIYRDASYDNVTGEVTYGEWSTGSWKEFSPAEIEGYSASEKVVPAVEVKDGQKNVTVDITYTANEQSGIISYQDEAGKEISTTPLSGKTGETVTVNPEIPAGWELVPGQEIPKTVTATGEGIPTVVIKIEHGITNVDHNNPVPDGAKTVTGEVINGAHASDLNQTITRTINVTNPDGTKNTEVQTAKLYRNASYDNVTGAVTYGEWSTGSWKEFSPAEIKGYTASEKVVPAVEVKDGQPDETINITYTANEQSGIISYQDEAGKEISTTPLSGKTGETVTVNSEIPAGWELVPGQEIPKTVTATGEGIPTVVIKVENSTIIVTPETPEKDIPNGKVPGNPSKNYPEMEKLEVAPTRAIILIKPDGSRENIIQKVIFTRSATFNEVTGEITYSAWKLSNSDDHEALWEAYEPMSISGYTVMNVNQEKVTPDTPNTQLEVTYIPINRPAVTATQTIHFVDEKGKLVESKIYTGKFGEVISVSLSVPKGYSLRNGQSLPTQITIENGMITINLKSESKHPIPNSENKQKPSVTPNTPDAHTDKNNLSSKDNKVVKSHGEKLINTNHVDHVVINQKATRKGTKASSQTYGEKHFESRHMLPQTGAHSENPIFTALGMLAVGLGLFGLSDRRKKKDK\n>UniRef90_A0A438IK19 Retrovirus-related Pol polyprotein from transposon RE2 n=1 Tax=Vitis vinifera TaxID=29760 RepID=A0A438IK19_VITVI\nMLVTVFHSGPLILFPNHSGQPHRRRISTTPATFSGEIFQRPIFRETTTYSETPEADLHASGNPTGNRHLTRPLARPDISFPNRGHTQVVGYTDTDWAGLPTDRRSTSGYCVFIGGNLISWKSKKQDVVVRSSAEAEYRAMTLATCELIWLRHLLRELRFGKDEQMKLICDNQAALHIASNPVFHEMTKHIEVDCHFIREKIASGCVATSFVNSNDQLADIFTKSLRGPRIKYICNKLGAYDVYAPA\n>UniRef90_A0A847NUJ3 DUF1653 domain-containing protein n=1 Tax=Mollicutes bacterium TaxID=37628 RepID=A0A847NUJ3_9MOLU\nMDIKIKGIYRHFKGHLYIVECIATHTETLEELVIYRNLETNEIWARPSHMFLAEVNKNNQKYRFELQK\n>UniRef90_A0A8B9BS21 vesicle-fusing ATPase n=1 Tax=Anser brachyrhynchus TaxID=132585 
RepID=A0A8B9BS21_9AVES\nMASSTLYVVFTHRKPPHSPQTSQTAPWPSPEPRPPGGSALPGSPPLAPQPAPEGGPLPAAGSGQLGQLHAHPPVLVGPPPQPCPAAPVMCLLRGISGDDKVPKMLRAGLAQLSLSSMKSAGACIGRPVLLSAAEGRQEVCTAWPTTGFPGGKVGLSETTQKSLKVNLGDAVTVQPVTGAVIQAEEVDVKLRDKDACIKAEEMSVCLLRNLDGKVVLPGNLLAFSFYGKLCNIVVMRVKGTDGTELTAPATSSETQEPDLEKSDLEASALDLSLQLSGLDLDDNPEAVSVSTPSRRMDPASPVPPSSAVASGGHGPAEGALTGSPGVGADLPHGSQPAGTGGREGLLPPGKAGAASSTDSFYYISSRTRIQFVETRTGVADDGDCESRVTYDMIGGLNSQLKTIRETVELPVKQAELFKSYGIPPPRGVLLYGPPGTGKTMIAKAIANEVGAHVTVINGPEIISNPKSVLASTRCRPSIIFIDELDALCPKREGAQNEVEKRVVASLLTLMDGIGSEGSEGQLVVLGATNRPHALDAALRRPGRFDKEIEIGIPNAQDRLDILQKLLKKVPHSLTAAELVQLADSAHGYVGADLAALCKEAGLYALRRALGKRANPSDNEVAGSVMIAFNDFLQGMNDVRPSAMREVAVDVPKVSWSDIGGLEDIKLKLKQAVEWPLKHPEAFIRMGIQPPKGVLLYGPPGCSKTMIAKALAHESGLNFLAVKGPELMNKYVGESERAVREIFRKARAVSPSVLFFDEIDALAVERGSSSGAGNVADRVLAQLLTEMDGIEQLKDVTILAATNRPDMIDKALLRPGRIDRIIYVPLPDAATREEIFRLQFRSMPVSEEVCLVELVQQTHKYSGAEITAVCREAALLALQEDINAKFIMGRHFRYALTVVTPRNPDSLIQFYADYQQQSGLHAL\n>UniRef90_L8JDR2 APH domain-containing protein n=1 Tax=Photobacterium marinum TaxID=1056511 RepID=L8JDR2_9GAMM\nMIQPQLKRIAGNAYRMMFGLRPEVCNLQETFYGWVVFVASPGSRKAVVKFSREIGRLAKEVQGLERLSQVLTCPVPEVLFFGREEGHDYIMLEWLDGESAHNLPDDPVALEQFRESYTDVLLALHEHQSQKGFEIGDDEFVPDFIQAYESWMSPVLRYVQSSCSPFSSKLKDAYAGLWENREEILSPLNQIASLVHDDCHVGNVLFDPRTYKVAAIVDPCDVGFKHYELDLFHLYDVRPDLRLVERYQEKKKLAEGFEWRRWFFSLWDDAKHSRNMGWYDERWLVSKVALFEASYAGR\n>UniRef90_A0A3M7QPY3 Uncharacterized protein n=1 Tax=Brachionus plicatilis TaxID=10195 RepID=A0A3M7QPY3_BRAPC\nMNLFIITRFSQIDLIKLNSRQNYVKTTFLRNINNFIFKQYNKEFNFKIFIMIILLYIMDTIDRIIRPLVQTAIGAIMQVLPVTIVLVSFWICGHMASIRYM\n>UniRef90_UPI0010AADB8D class I SAM-dependent methyltransferase n=1 Tax=Halorhabdus amylolytica TaxID=2559573 RepID=UPI0010AADB8D\nMKRSLDDHAARFDQAADSYDEDGSPEYRAAAALVIEHAAPEPDDVVLDLGTGTGAIALALADDAGAVIGRDISEGMLEQAREKAAERGLESVTFDEGRFREPNVSGDRSVDVVVSNFAMHHLDDDAKREAIETIADLEPRRFVLGDVMLFGEADPEEPFYSPAVDDPATVGVLADALTDVGFALTAVEPVHEQVGVLVAERSEPTEDERA\n>UniRef90_A0A8S1JP47 Histidine kinase domain-containing protein n=2 Tax=Paramecium 
TaxID=5884 RepID=A0A8S1JP47_PARPR\nMENKAIKYLGMGLNVLISVFLALTECFIYELSDSIIMDIVLILCGTFFSWIFITQQLGWKKGDISPFFYWALAIKRITLVGTYRSEFIYFLFGFLNGIYSSKLVVKDQKRYFQKARTSFQVILILVLILFNFLTNTFQYQIILIIFNIILLLLLGIYDNIEIQPINSKQQDFNTDQRNTQAELKKCQTIIQQYQSSKSIWEQFNYLTDDWICKIDINKYKFNRSWESKEQSFVLKNFLQENKTNLNQFLNSLIIVGQSSNASVQLQYELQENNTLLQWLEKNYLQENRQNQQNFEKQKQLKDTKTNKQQVQDDQQSILSPQNDGKYIIQKDQSQDFSRLQATPLNMDQQVFANKKFLQCQLCLNQIIYNLNLSIFLIDDDKSNEIKQQSIIIQMKNIDRLIKSEIIDQQRSLFYRFISRLSFHSSQMLKSVCLIKKSIQLQLKEFDSIKSSNFNSSFNDIVLRKSERHIGGLFNAQQTFANQTSEQNTNQKITSTHSNPHESQILNMQQLQIAYFQQSQEIFKQIEKLNFDLIIMKQNNFNFFELFSHTKLDIEQFNILSSFNIVKDIFQQNPLLNQHNIIITQEINHETQVIIQSDRQKFKQILINIINNSIENFEHNFNIKKYQNYENPQIQQRYLKSKQDLKQQNMIVIKAQSDQDRIIIEIQDNGGGIDEEQLKNRLNECKFGLAASQKLLRYLAYDTRKPLEIINYEKCTTGVKGTIIKFVLPITFDNFQQNEDSNQSESLIISNIRDKV\n>UniRef90_A0A7S4ARR9 CCHC-type domain-containing protein n=3 Tax=Pseudo-nitzschia australis TaxID=44445 RepID=A0A7S4ARR9_9STRA\nEEHSETIEEHVAGLDRILEYPRVNEEIEIEEELAEEDSISSEESDSEFSCGETSSDSGIGSEDSWSTYSYNDLYTESDTDLYSELDSDSEESDGSSMKKSRRLYFGGEKGEFENFMIKWKTRGAKKGYSPYIMDKRHEDLPETGLMMDWTGVAKDVKKRQKKALRLHNYCIADLQEACEPWMVTAWIEESIGTTDEKRRAYPFGRVWIVLKAMITHYRGFSMLDINRFDIDKATIKMLPNENPDAIFNRIYAVRQKYAHQKDLQISDSSWVGLAVNGCTEAYRPVFMSAYSQNKHLPPKEIMAKLKDIAQDNFASMVQSKEIVSKFVTSDEVGLFAGIGPKTAKDKWRKGQECYLCGSKKHKAYNCPKKNQTNTGGGNGGGNGGGKTQNRGKSHANVECYYCHKKY\n>UniRef90_A0A7K4MZ21 C2H2-type domain-containing protein n=1 Tax=Marine Group I thaumarchaeote TaxID=2511932 RepID=A0A7K4MZ21_9ARCH\nMNFFRRNKEIVITGTTCKFCGMEFSAPDRMVKHMLKAHGKPKKNKGSSCPNC\n>UniRef90_UPI00110FA3E4 hypothetical protein n=2 Tax=Streptomyces TaxID=1883 RepID=UPI00110FA3E4\nMSTARYLALIDLLRTREFPAQRRRTESGFSGPGYHTVELSAAGEPAGEPAGEDAADQVEARERCLAEHDALVAVLDGRWGEAQVFGLWSLLERSVGGEAVPAPWDELSAGFDSLHLWRADGRWIAVGLALDAEGPSYALAAVVTGIDPP\n>UniRef90_A0A847PHQ1 GTPase n=1 Tax=Candidatus Atribacteria bacterium TaxID=2053509 
RepID=A0A847PHQ1_9BACT\nMFLKKQNVLIMGAAGRDFHNFNVFFRNNENFNVAAFTATQIPDIAGRKYPPELSGPLYPDGIPIFPEEDLPELIKKHNINQVVLAYSDLPHQYVMERASLVLAHGADFRLMGPDNTMLKAKVPLISICATRTGSGKSQTTRKVSAILKEMGKKVVVIRHPMPYGDLSDQIWQRFKTYDDLDRYECTIEEREEYEPHIDVGNIVYAGVDYGEILKRAEQEADIILWDGGNNDIPFYHTDLHIVVADPHRVGHELTYYPGLVNMMMADVVVINKIDTADQENIVQLRDHIAKIVPEAITIDAASPIKVDHAELIRGKKVIVVEDGPTLTHGEMQFGAGIVAAQKYGAAEIIDPRPFAVGSIKDTYQKYPGIGMVLPAMGYGSKQMQELESTINSIDVELVIIATPIDLSRVMKIEKNNVRVKYDLQEIGSPNLKEILLQKLS\n>UniRef90_UPI0005F56F2E NADH-ubiquinone oxidoreductase subunit 8 n=2 Tax=Myrmicinae TaxID=34695 RepID=UPI0005F56F2E\nMMGPLQIFTLSGKLAPRFLRIAPKGVSVYLSRNKYYYVREDKEQNWTDIMEAASTHMFFHELFRGFGIILSQVFREPATINYPFEKGPLSPRFRGEHALRRYPSGEERCIACKLCEAICPAQAITIEAEERADGSRRTTRYDIDMSKCIYCGFCQEACPVDAIVEGPNFEFSTETHEEMLYNKEKLLNNGDKWESEIASNIHADHLYR\n>UniRef90_A0A1G0YLB9 Methyltransf_11 domain-containing protein n=2 Tax=PVC group TaxID=1783257 RepID=A0A1G0YLB9_9BACT\nMSAAEYPETADIETSSDDYAGRFSGPIGEWMLGVQEQIALKVLSDRPGATVLDVGGGHGQLALPLCHRGFKVTVLGSADSCRRRIQGVVDEGLCKFLVGNVVELPFPAKSFDVAMSFRLLPHCERWPTLIAELCRVSRHAVIVDYPTTQSVNAFAPMLFGAKKKVEKNTRAWRMFGQGEIRQAFRQNGFSQLSLRKQFFLPMALHRMLNKPAFSKTAENLCRFLGLTAGLGSPVILKAVWDEDR\n>UniRef90_UPI001572454A MerR family transcriptional regulator n=2 Tax=Nocardia TaxID=1817 RepID=UPI001572454A\nMKSSRTLTIGELAQRFGLGTHVLRYWESMGLLEPARRAGGQRLYEHADLERVALILMGKEAGLTLGELATVLSTADPRDHRDLLCHHVEELERRITQARAAKELIEHVLACPHSLAECEHAREHIAARIPPLPRNSASV\n>UniRef90_A0A8C2IYT9 Slow myosin heavy chain 3 n=1 Tax=Cyprinus carpio TaxID=7962 
RepID=A0A8C2IYT9_CYPCA\nMGDAQMAEFGAAAPFLRKSDIERLEAQTRPFDMKKACFVPDTEEEFVKATIISRDGDKVTCENSKGTTVTVKEIDVHPQNPPKFDKIEDMAMFTFLHEPAVLFNLKERYAAWMIYTYSGLFCVTVNPYKWLPVYNQEVVLAYRGKKRSEAPPHIFSISDNAYQYMLSDRENQSILITGESGAGKTVNTKRVIQYFASIAASPTKKETSDKKGTLEDQIIQCNPALEAFGNAKTIRNDNSSRFGKFIRIHFAASGKLASADIETYLLEKSRVTFQLKAERDYHIFYQILSQKKPELLEMLLITANPYDYAFISQGETQVASIDDADELMATDEAFDVLGFTQEEKNSIYKLVGAIMHYGNMRFKQKQREEQAEADGTEDADKSAYLMGLNSADLIKALCHPRVKVGNEWVTKGQNVQQVSYAVGALSKSVYEKMFLWMVVRINQSLDTKQPRQYFIGVLDIAGFEIFDFNTFEQLCINFTNEKLQQFFNHHMFVLEQEEYKKEGIEWVFIDFGMDLQACIDLIEKPMGIMSILEEECMFPKASDATFKAKLYDNHLGKSANFQKPRIVKGKPEAHFSLVHYAGTVDYNINNWLVKNKDPLNETVVGLYQKSTMKLLSILFANYASADSGELSKEKKKKGSSFQTVSALHRENLNKLMTNLRSTHPHFVRCIIPNETKTPGAMENPLLMHQLRCNGVLEGIRICRKGFPNRILYGDFKQRYRILNPAAIPEGQFIDSRKGAEKLLGSLDIDHNQYKFGHTKVFFKAGLLGTLEEMRDDRLALIITNIQARARGLLSRVEFQKIVERRDALLVIQWNIRAFMGVKNWPWMKLYFKIKPLLRSAEAEKEMANMKEEFLKLKEAYAKSEARRKELEEKMVSLLQEKNDLQLQVQTEQDNLCDAEERCEGLIKNKIQLEAKAKELTERLEDEEEMNAELTTKKRKLEDECSELKKDIDDLELTLAKVEKEKHATENKVKNLTEEMAALDEIIAKLTKEKKALQEAHQQTLDDLQSEEDKVNTLTKAKAKLEQQVDDLEGSLEQEKKLRMDLERAKRKLEGDLKLTQESLMDLENDKQQLEERLKKKDFEISQLNSKIEDEQVMAAQLQKKLKELQARIEELEEELEAERAARAKVEKQRADLSRELEEISERLEEAGGATAAQVEMNKKREAELQKLRRDLEEATLQHEATAATLRKKHSDSVADLGEQIDNLQRVKQKLEKEKSELRLELDDVVSNMEQLAKAKVLVSTLAFLLFSRQLEEKDSLVSQLTRGKQSYTQQIEDLKRQLEEEIKAKNALAHAVQSARHDSDLLREQYEEEQEAKAELQRSLSKANSEVAQWRTKYETDAIQRTEELEDAKKKLAQRLQDAEEAVEAVNAKCSSLEKTKHRLQNEIEDLMVDVERSNAAAAALDKKQRNFDKVLAEWKQKYEESQSELESSQKEARSLSTELFKLKNSYEESLDHLETMKRENKNLQEEISDLTEQIGESGKNIHELEKIRKQLEQEKAEIQAALEEAEGSLEHEEGKILRAQLEFSQIKADIERKLAEKDEEMEQSKRNQQRMIDTLQTSLESETRSRNEALRLKKKMEGDLNEMEIQLSQANRQASEAQKQLKGLHGHLKDIQLQLDDALRSNDDLKENIAIVERRNNLLQAELDELRSLVEQTERGRKLAEQELLDVSERVQLLHSQNTSLLNQKKKLEGDNSQLQTEVEEAVQECRNAEEKAKKAITDAAMMYFLYTLNNGLNNAFSFHTSCMFVRELENEVEIEQRKASESVKGVRKYERRIKELTYQTEEDRKNLARLQDLVDKLQLKVKSYKRAAEEAEEQANTNLGKFRKIQHELDEAEERADIAESQVNKLRAKSRDTRAAKKTSMMNLVQTDHKYHIN\n>UniRef90_A0A6G7V9X9 Purine-binding chemotaxis protein CheW n=1 Tax=Caldichromatium japonicum 
TaxID=2699430 RepID=A0A6G7V9X9_9GAMM\nMSAEHLQEAAVDEEGTESADVHQFVTFVVGGEVFAVDMAPVQEIIRLPAVVRVPLAPSSLLGLANLRGKVLPIILLRRIFGFPEQAHDDATRALVIDVGQPLGFVVDRVASVISVRSEQIEPVAGIQGTFNSELLTGILKDVGGFAMVMVLNFARLVAQEFAEIAQIARGTAMTGGVLDSSADNEDKEASDELQLVSFAVAGQEYAIDITSVQEIVQIPETIVHVPNSPTHVLGLMTLRERLLPLVSLRSLFALPARALDEKSRIVVVALGQAAVGIITDSVSEVLRVPLAQVDRMPGLLAREDALSDITEICRLDGGRRLVAILSVDNMFKHTVVQEALKTVDGMNANTHDEQPGEDRSDEEEQLVVFRLAESEFGVPIESVQEIVRLPDELTPVPKAPAYVEGVINLRGAVLPVIDQRKRLGLPPIERNDRQRIMVFVLNGVRTGFIVDTVTEVLKIPKAAIETAPRLSGEQARLLGRVANLEQQGRMIQLIEPAHLIDTTELADLNT\n>UniRef90_UPI001A9564E1 hypothetical protein n=1 Tax=Segetibacter sp. SYSU D00508 TaxID=2810307 RepID=UPI001A9564E1\nMVLITLHEILLVVTAISFLLLPKLFFKYLPSPYEFYCKIASGILLLLVIWIPEPGDQQSQLLLQVLLTLLTTYYMCKNVMEYRKRKTGITHHK\n>UniRef90_UPI0020C6B0B3 SPOR domain-containing protein n=1 Tax=Deinococcus sp. JMULE3 TaxID=2518341 RepID=UPI0020C6B0B3\nMIGALVLLLLGGFGTLLLRPQAGTPVSAAADSGTDAPATDTTTLDSVPGAPGSTESTDAATAPVSTTEITAPTGQDSVTSPGSDAPQADGSANPGSVPSTDGADTPVIAAAPIGTPDPTLTDTQTAPQTEDADPASADPASDTPATDPAAPAARTGGAVPTSEQRTPLRSDYRITLGTFGSDAAAQSATQGVGALGYTVYPITVAAGVVAQVGPFADEATAREALADVQRAYPGAVLYPPRDRSLSTPSTPATTGATAETAQTTPAEPATPAPTATTPTYLQVGAFDRLESAQNLVQQLRDLGYNPTVNAPAGKKVTVLVGPYTGDPLTRTETRLQENGLDSFRVR\n>UniRef90_A0A2Z6TDT3 Spore coat protein n=1 Tax=Burkholderia vietnamiensis TaxID=60552 RepID=A0A2Z6TDT3_BURVI\nMRALRRSFQPYFQPHFQPHFQPHFQPHFQPHFQPHFQPHFQPHFQPHFQPHFQPHFQPHFQPHFQPHFQPHFDPNSPPYSQPPP\n>UniRef90_A0A5Y2QT59 PLD phosphodiesterase domain-containing protein n=3 Tax=Enterobacteriaceae TaxID=543 RepID=A0A5Y2QT59_SALER\nMNQLIHNAEHYIYIENQFFVSAFGEPSVPDNAPYSPEAKEIARLDRIKAVTTKLVYGDSDKQPVNQIAQWLGDRIKNVIYARYTHDFHVCIVLPVHPEGKLDDGAVMAQVHLTRQTLVSGSKSLLNRVRQALWVRQQLDEDPRANWSKLIPALEKRCETEKKYEEISFEACAKYVTLLNLRGYAELAAYPDKKIAVTEQIYVHSKLMIVDDRYVLVGSANINERSLQGNRGYLATVLAGAGSNLALEGTPV\n>UniRef90_A0A1J9RUE5 Cation chloride cotransporter n=1 Tax=Diplodia corticola TaxID=236234 
RepID=A0A1J9RUE5_9PEZI\nMASRGGSSRMPSRLHSRSNFTTRSAQDDSHQLQRRWSLSQMSAQDEAEPLLAAGPRRRRPVSVPRENRTFGSFLSALFTRRASTRSRSGHRRTRSSGTDRCKPASAPAKLGTFAGVFVPTTLNVLSILMFLRFGFILGQGGLLGMMGLLVACYAINLLTTLSVSAIATNGTVRGGGAYYLISRSLGPEFGGSIGIVFYLGCVLNTGMNAVGLVACFVQNFGSTHGSWANWLPDDFWWQYLWATVVLAVCTVICLAGSSLFARCSNALLIILLVATFSIPVSTLVQTPFSNVKLGIEYTGLSLETLKGNLLPNLTQGAAGSGLKGRETWQDLFGILFPATGGIFAGASMSGDLEAPSKSIPKGTLYGLALTFVTYTIVIISMAASITRLSFYNNDNVIQVVNVSGALVLLGEFASTLFSTLMGVIGSAKLLQALARDKLIPGLLVFAQGSKAADEPMLAIGLTYVLSQLTMLADINQIASLVTMAYLMTFLVTNLACFLLKVASAPNFRPSFHFFNWWTAAIGAIASALTMFFVDGLSASACFATIVLIFLIIHYTTPPKAWGDVSQSLIYHQVRKYLLRLRQEHVKFWRPQILLFINDPRRQYKLIQFCNSLKKGALFVLGHVIVTNDFAGAVPEVKKQQSAWTKYIDFSRIKAFISIVISPNIEWGTRNVVLSAGLGGMKPNIVVMGIYNLNDLRTNPLVDVPSPQPEHTQGTANGTAPHRLKSKGKWKIAEENKLRGQLPTDAIRKESAVTPQSYVTILEDLLLRLQMNVAIAKGFQDLELPAPRPSRLERVLDALHAKSADEEEGTKKYIDLWPIQMSAEVAAPSDGTQSILTTNFDTYTLILQLGCILNTVPSWKRAYRLRVAVFVEYESDVEEERARVKALLYNLRIEAEVMVLWLASGDLQSYEIIVNGQADESYREARQDIEEALREEAWWQDIQKLRQRQTGAITPMEELAQIEGFLETASNWPGTAFRQGDRETKSKRFADIKDMLIERRRTSVGSLKQMGVSMGMRTHRLPPGLDGQESSSDGSSSGGESEAECSDSDRSASSENDPQTESDEGTLSPMRRARSERESTSSFPSTPRQQSQPRRGELLPPAPTAAANSDSTLVTSQPPTNAGSHQSPPTFTSKPVPRTEVAADDGPGPSIMFAEPLSPEEQRERRFGTSIYTRSGSPQVAAPLPGPANPDESGSDSPSTPGSPGAASSSMSQASGFPLQQSVPLSFNDLPCRAQHLILNELIRRESGKDQRTAVVFTTLPSPVEGTCEDEHASVRYLADLEVLCQGLPPVMLVHSNSMTVTTNL\n>UniRef90_UPI001F1A8850 DUF6338 family protein n=1 Tax=Pelomonas sp. 
P8 TaxID=2906762 RepID=UPI001F1A8850\nMNLALPTVVVFILLLPGFIFRSRLKRVERTSLDFSPFGAVVAEAVFFAAVLHAAALLLLFWVTGALPDLALLLTLLAPSPAPLNAIPAIGQHAGLVTGYFGLLLVASWLVPTLTRWLITVGRLDRLGHPLSPIARFHQAPWYYLLTGADFAADELPDYIRVTAVVDVGKGAVLYRGTLEEWFTNPDDGQLDRIVLSAASRRPFELDKPLDGSDGGAERFYPIDGDYFVLRYEHMLSLNVQYMRIIEQPDDDLPDDEEADTPAAQ\n>UniRef90_V4QRW5 Methyltransferase n=1 Tax=Lutibaculum baratangense AMV1 TaxID=631454 RepID=V4QRW5_9HYPH\nMQSEILEGYATAGPELIALYEAVPSAEIYALVRDLLPPGPARAADIGAGTGRASPRCWRRPGS\n>UniRef90_A0A0D3GCY4 Uncharacterized protein n=1 Tax=Oryza barthii TaxID=65489 RepID=A0A0D3GCY4_9ORYZ\nMNLSATYDSRTSDVESSVVARGDLWRAEASHSSAAAAAPPLFMVQLGPVLFVRDTTLLFPVHLSKRHLIWYGFERKNGVHSVCPAYWSAHRRWFFMSMICLNPFTCSFMDMQFPNGQLRYVAGDGFTTRAFLPLYRGIFQAHVKFPGEKKFSYSFKVSCQMNSKPYLNLLHLNSEVSLLHHIARLVLLTIFFQNRSGGSITPMVQWPDKSLSLGTVQTLSWKRCGLIICPTFGGSRPGLSMELIHSVNENAGVVCGYSHTASPSAYASVSIGRSKLNGSAASSGLVLRVDAPLQSFGRPWFSIQMNSGLEF\n>UniRef90_K3XLW2 Ras-related protein RABE1c-like n=2 Tax=Setaria TaxID=4554 RepID=K3XLW2_SETIT\nMAAPPARARADYDYLIKLLLIGDSGVGKSCLLLRFSDGSFTTSFITTIGIDFKIRTIELDGKRVKLQIWDTAGQERFRTITTAYYRGAMGILLVYDVTDESSFNNIRNWIRNIEQHASDNVNKILVGNKADMDESKRAVPTAKGQALADEYGIKFFETSAKTNLNVEQVFFSIARDIKQRLSETDSKPEDKVVNIRQDQGAEASSSQKSACCGS\n>UniRef90_A0A8C0C567 Uncharacterized protein n=2 Tax=Accipitrinae TaxID=8955 RepID=A0A8C0C567_9AVES\nMSKQVVNSSETVTPGPNEGTGVVGISPENEPQNAPSQAPAAMARLPRSLSNDNKTLSSEEAKPNDFERTKVGICKLSSTPVQANSTLQRESVETFPCKHTPGAGVAGQAAIPHCKIPALQSTDGDANLNLGKSTLEQNNAKGAWVTLSQSTVVLGTDGNTSVLPGRVEGVSWLLVGFLSPAFNSWE\n>UniRef90_A0A2B7X7V6 Replication factor A protein 3 n=1 Tax=Polytolypa hystricis UAMH7299 TaxID=1447883 RepID=A0A2B7X7V6_9EURO\nMSLSTPRLLPEHLHAFAPAPHKSARTVRILGTVSSLRGEHASITCGSHGEVTLVLNRDSHIQMGRVVDVIGKVVEVEGGLGVRVLGAADCGDPKDVDYKIYEELVDVTHRFKEIFYDE\n>UniRef90_UPI001663C50F hypothetical protein n=1 Tax=Belliella aquatica TaxID=1323734 
RepID=UPI001663C50F\nMKKVLHTLAAILISVVSYAQVGIGTDNPDNSAMLQVASSEKGFLLPQMTSTQRNAVSSPANGLQVYDTTTNSIWFFNGSYWVNTQAMATVGDVKSGLQTNDHSGWVLLDGRSIGTLSDNQKAAASALGLSGTLPNAADAYLVQNGGSMGAISGSNTVTLTQANLPNVSFSGTAASAGGHTHTVDPAPVDTDSKGNHTHTVDPAPVNTDTKGEHTHTGSVGGSNWLGGGTLTGGFNAGTFPFQIPNLTINPAGDHFHTVDIPSTTSSENGAHKHSIDIPSTTSSSNGAHTHDVTVSSGGSATPVNVAPKSLSVNMFIYLGL\n>UniRef90_A0A3Q3E9K7 Hydroxycarboxylic acid receptor 1-like n=3 Tax=Hippocampus comes TaxID=109280 RepID=A0A3Q3E9K7_HIPCM\nMDLDLRSTPAPGGGGGGCPPVGIQLEGVILPPVLTVDVVLGLLGNAVALWVFCFRVKSWSANTVFLVNMVAADFLALVSLPLRIDALLRGHWVFGDVVCRLNLFLMFSNRTASIALMTVIAFYRYVKVVHPHHRFNRMSKRQAGILSLVVWLLVSSPRVPMLAYNHIKELFLKKKTSFTITNYFKRYLKRLLAGIVILVETHRVLTVLEFVIALALLVFYSVQISRSLKRRQMGNVAKVRKAMRVCAAVVAIFLVCFLPTTITTLGLWVSRSLRPWDCAAFYALTQLNIVSLSLNFLNSALDPILYVFSSSVFRKELLAAVPPRLRCKRAVEGTSSVSTSQSTGQVELESVKMTAGSEAS\n>UniRef90_A0A3N0Y0W4 Complement factor I n=1 Tax=Anabarilius grahami TaxID=495550 RepID=A0A3N0Y0W4_ANAGA\nMPYKCPRQDYHVCTLDGSEYYSMCQTKAISCRSNKPVFSHISTTCRAEEKVKVTVEDSGSHKVVMINTRLGKMFVCGNDWNMAAANVVCRNPLNVARGAAEVTKIKNRILDRDTKWPTECMSVRCTGSELSLAECTIYNPQPITENTVAIAKCYNEPKGAFSSF\n>UniRef90_A0A124ILI9 30S ribosomal protein S15 n=1 Tax=Gracilibacter sp. 
BRH_c7a TaxID=1734398 RepID=A0A124ILI9_9FIRM\nMLTPEKKKDIITKFQQHEGDTGSPEVQIAILTTRINELTEHFKTHKKDHHSRRGLLKLVGQRRALLNYLKKNDVNRYRKIVSDLGMRR\n>UniRef90_A0A4C1ZDE1 Tubulin_C domain-containing protein n=1 Tax=Eumeta variegata TaxID=151549 RepID=A0A4C1ZDE1_EUMVA\nMTVSFLCSGGDAPPQGLCFQNLNMRIHSYAHSNIFAEYYTSYVTDALYKQISKPKFSFWARRGKTVVALCVPFGVSPYRAALSSSPYTDREFLDSSVNIMRRAHDQSIGGGSAVWDLTIKRRPLRDRGVRYETCTALCE\n>UniRef90_A0A2J6IBB8 Endonuclease/exonuclease/phosphatase n=1 Tax=Marinilabiliales bacterium TaxID=2053303 RepID=A0A2J6IBB8_9BACT\nMKILKLIFFIALSVNLSSQSIMSFNIRYNNPNDGNNSWENRKFELTDLITKYRPDIFGIQEGLYEQNEYIKEQLANYTYVGVGREDGNKKGEFSPIFYDSLKYELIETKTYWLSDTPSEVSVGWDASMERISTFGAFRNINTKDTLYIFNCHYDHIGKKARRKSSKLIIKLIEDKGLLIKNLVVMGDLNSMPEDAAIKILKNKLTDSFEVSNYLKEESIQTYNNFDNQYISNKRIDYIFTRNIYVSSHKIIREKRSNGLFISDHFPVLIQFRNN\n>UniRef90_A0A0F2Q2J6 Cupin_2 domain-containing protein n=1 Tax=Clostridiaceae bacterium BRH_c20a TaxID=1629719 RepID=A0A0F2Q2J6_9CLOT\nMNKKIRDEIERSLNLKIIDEQSFSWGESYSLQLESKMDFDKYSKKNSRNVAVVTVKPNIKHESHTHYGYDEILYGLEGETIHWANSKKTYLQKGQLVLIPAEGQHIMVNNSPVPAKFLSIVYPTIPERWRR\n>UniRef90_UPI00037CD391 VWA domain-containing protein n=1 Tax=Gilvimarinus chinensis TaxID=396005 RepID=UPI00037CD391\nMANSLIRVSVLLWAAFFCFHSHAQSPSPSAALVDADVRLLVDISGSMKNTDPDNLRQPALELMVKLLSESAYGGVWTFGEQVNMLVPFSRSDEDWQRRALEQTSRINSVGLFTNIGEVLHRATEVPAKTSSADVILLTDGKIDVDKNAGVNSRERNRVLSELLPEIAEKNFRLHTIALSADADSELLQQLSRTTDGHHLVAKNADELMQAYLQIFDQAVPAKRLPLENNRFLVDDQVNEFTALVFRAPTAEPTQLLMPDGKALSASSHGDNTQWYSADGYDLITITNPAAGRWQLKAQESAQNRVTVVSDLQLYVESLPNNLLAGNALTLAYALQEKGNNLTDADFLDLITAEIVVMNVTRDVSWNLALTDQPDKATGVFTHELPTFNERGQYRLRLRVDGKTFAREFQHQLQVGSMFAVQLDKAVQSSQVKYTLNVKTDSEFVNTDKTSVVAHVKHSSGESELRALKKVSDTQWQLTLTPAKPMRTLIELNASGELTDGREFNEVLPSQYVQFPQEGDPLVVQEDSELAMLKQQIETERAALANEERLADTVAKTPAAKSQTSSPVSESQDDKQEAGFESGPDSAEETDEGGINWPMIAAITLGNLLLIGGLYWAYRRFSAKDVQSELDEIEQQLQAAPNEPSGQATEQQKKEAVALDDDNSVSVLDSLDESSLPMDDFSFDDESDKK\n>UniRef90_A0A853FEG6 5-formyltetrahydrofolate cyclo-ligase n=1 Tax=Pusillimonas soli TaxID=659016 
RepID=A0A853FEG6_9BURK\nMNDSTRNNATPLRTRLKQRRAAMDPVERSRGALLIRGRLYTWLATTRTRLREAGRPVPENIAAFWPLDEEPSLLPLLQQWVEEEGYRVSLPVVTVAGAPLQFRIWTPDAPMQPGAYGIHEPAGEIAPPPDIILVPALGYTRQGDRVGYGKGYYDRTLAALREQGHAFTSIGIAWATGDLSGDSHAPEPHDYRLDSILTDKGWAVPAPVIA\n>UniRef90_UPI0021E303A4 FERM domain-containing protein 5 isoform X1 n=2 Tax=Acomys russatus TaxID=60746 RepID=UPI0021E303A4\nMLSRLMSGSSRSLEREYSCTVRLLDDSEYTCTIQRDAKGQYLFDLLCHHLNLLEKDYFGIRFVDPDKQRHWLEFTKSVVKQLRSQPPFTMCFRVKFYPADPAALKEEITRYLVFLQIKRDLYHGRLLCKTSDAALLAAYILQAEIGDYDPGKHPEGYSSKFQFFPKHSEKLEKKIAEIHKTELSGQTPATSELNFLRKAQTLETYGVDPHPCKDVSGNAAFLAFTPFGFVVLQGNKRVHFIKWNEVTKLKFEGKTFYLYVSQKEEKKIILTYFAPTPEACKHLWKCGIENQAFYKLEKSSQVRTVSSSNLFFKGSRFRYSGRVAKEVMESSAKIKREPPEIHRAGMVPSRSCPSITHGPRLSSVPRTRRRAVHISIMEGLESLRDSAHSTPVRSSSHGDTFLPHVRSSRADSNDRVAVIADEAYSPADSVLPTPVAEHSLELMLLSRQINGATCSIEEEKESEASTPTATEVEALGGELRALCQGHGGGPEQQQVNKFVLSVLRLLLVTLGLLFVLLLLLIILTESDLDIAFFRDIRQTPEFEQFHYQYFCPLRRWFACKIRSVVSLLIDT\n>UniRef90_A0A485M2C4 Transcriptional regulatory protein ZraR n=1 Tax=anaerobic digester metagenome TaxID=1263854 RepID=A0A485M2C4_9ZZZZ\nMPSKERKLAKKNIRILIIDDEESIRDGCQQILTRQGYEPTATADGMTGLELARTGAFDVILLDLRMPRIEGLEILRILKSEHPVASKIIVITGYGTIPVAVEAMRLGAHNFITKPFSAAELKLAVQDCLSEKSEERPTGDSLSMIIGTSDYVEELKETIRRVAKTDSTVLITGESGTGKELVARTIHSLSARSNKPFVPVDCSSLVHNLMESELFGHIKGAFSGATENRDGRFQTADKGTLFLDEISNISLDVQAKLLRVIQEQEVPRVGSSIPEKIDVRLITATNKDLRVEVQNGTFREDLFYRISVVPIHIKPLREHRSDIAPIAFHYFDIFRSRHGSKAQSLSPEVVKSLTSYTWPGNIRELKNTIERLCVLCDHEEVTLSDILYYGQDTCSKAPVVDPFSGKMTLVEVEKEHIEKALHHFNNQINKTARFLGIDRKTLRTKIRNYGIEIKDDE\n>UniRef90_UPI00103184EA hypothetical protein n=2 Tax=Streptomyces TaxID=1883 RepID=UPI00103184EA\nMSAGNNGMSTPEGGDDPFGYLYRPEDGQAPAQQPQQPSYHQVRPVGERRPYGGQRSGYGYPQPQSAPPQHDPHYAAPEAQPGGGGYHSGGPPGPYQNGGEPPRRNTLLIGAIAVVTAVVLGVGAALLFSNNDAGGDDDRADDSSEVNPTPDVPDDEDEGDTDEDGADEDETGEDEEDPEDSGDLPVADFNGADITLSNGAIVGGGQLEGARSSDGSYITGLNNNNSTVSWQFDFDGTPGDYRVYVGYTVEDGDQLMSWAINDSLRGDELEFKDHRKSGAYKDNWTYTWKQVYLNEGSNLLQIGCGGDDTCDVVIDGLVVTPHADGMEPW\n>UniRef90_A9YMW7 Ac78 n=2 
Tax=Betabaculovirus TaxID=558017 RepID=A9YMW7_9BBAC\nMQQHLDIPFDRLTVPDVVDAIPLKLAYSKESDDNNKPPVVPSAQAVYGSREEKSAQSDMSNVWFIALACITVLVVIMLISYYIVSVLRTNNAPLRDYDDDDFE\n>UniRef90_UPI00188515FC mitogen-activated protein kinase kinase kinase kinase 4 isoform X15 n=1 Tax=Peromyscus leucopus TaxID=10041 RepID=UPI00188515FC\nMANDSPAKSLVDIDLSSLRDPAGIFELVEVVGNGTYGQVYKGRHVKTGQLAAIKVMDVTEDEEEEIKLEINMLKKYSHHRNIATYYGAFIKKSPPGHDDQLWLVMEFCGAGSITDLVKNTKGNTLKEDWIAYISREILRGLAHLHIHHVIHRDIKGQNVLLTENAEVKLVDFGVSAQLDRTVGRRNTFIGTPYWMAPEVIACDENPDATYDYRSDLWSCGITAIEMAEGAPPLCDMHPMRALFLIPRNPPPRLKSKKWSKKFFSFIEGCLVKNYMQRPSTEQLLKHPFIRDQPNERQVRIQLKDHIDRTRKKRGEKDETEYEYSGSEEEEEEVPEQEGEPSSIVNVPGESTLRRDFLRLQQENKERSEALRRQQLLQEQQLREQEEYKRQLLAERQKRIEQQKEQRRRLEEQQRREREARRQQEREQRRREQEEKRRLEELERRRKEEEERRRAEEEKRRVEREQEYIRRQLEEEQRHLEILQQQLLQEQAMLLECRWREMEEHRQAERLQRQLQQEQAYLLSLQHDHRRPHPQPPPPQQQPQQDRSKPSYHAPESKPHYDPADRAREWSHLASLKNNVSPVSRSHSFSDPSPPKFAHHHLRSQDPCPPSRSEALSQSSDSKSEVPDPTPKAWSRSDSDEVPPRVPVRTTSRSPVLSRRDSPLQGSGQQNSQAGQRNSTSIEPRLLWERVEKLVPRPGSGSSSGSSNSGSQPGSHPGSQSGSGERFRVRSSSKSEGSPSQRLENVAKKPEDKKEVFRPLKPAGEVDLTALAKELRAVEDVRPPHKVTDYSSSSEESGTTDEEEEDVEQEGADDSTSGPEDTRAASSLNLSNGETESVKTMIVHDDVESEPAMTPSKEGTLIVRQSAVDQKRASHHESNGFAGRVHLLPDLLQQSHSSSTSSTSSSPSSSQPTPTMSPQTPQDKLTAHETQSASSTLQKHKSSSSFTPFIDPRLLQISPSSGTTVTSVVGFSCDGMRPEAIRQDPTRKGSVVNVNPTNTRPQSDTPEIRKYKKRFNSEILCAALWGVNLLVGTESGLMLLDRSGQGKVYPLINRRRFQQMDVLEGLNVLVTISGKKDKLRVYYLSWLRNKILHNDPEVEKKQGWTTVGDLEGCVHYKVVKYERIKFLVIALKSSVEVYAWAPKPYHKFMAFKSFGELVHKPLLVDLTVEEGQRLKVIYGSCAGFHAVDVDSGSVYDIYLPTHIQCSIKPHAIIILPNTDGMELLVCYEDEGVYVNTYGRITKDVVLQWGEMPTSVAYIRSNQTMGWGEKAIEIRSVETGHLDGVFMHKRAQRLKFLCERNDKVFFASVRSGGSSQVYFMTLGRTSLLSW\n>UniRef90_A0A0S9PKG7 4-hydroxybenzoate polyprenyltransferase n=3 Tax=unclassified Agreia TaxID=2641148 
RepID=A0A0S9PKG7_9MICO\nMSAAFAAASVGLFTPTTDTPGAHTWSSAILLFVIYLALLLRYRVTDEWKDFAHDSAVYPDRPVQRGVVSPRTLFVIGAGAFAVELLGVLLIGGALGFVLYLPVLAYSALTVFEFFSAPRLERHFTLSFVLHEAIYLPLFLWVAVVLGAAPDWRTAAGVLACTALFVSVELARKFSPRFDTEGRVVLDTYSAVWGRGRTLGAMVVLVVLSGVLATTAGAGLASPVIAVVAAAVALARPASDRWVTTVVAIHLPLQAAAMLS\n>UniRef90_A0A835JN83 Dentin sialophosphoprotein-like n=1 Tax=Salix dunnii TaxID=1413687 RepID=A0A835JN83_9ROSI\nMDLEHGSGTHSESHQEVIDGTGGSDNEDTYPRLRVRIGSSGRLQIDPEKIEGSESGKYSESHSEVINGSDSDKHIEPKPEFTVIEGDIYMPTIKFGSSYSSSSSSSSPSSSGSSLYDLFDVIPKESADPGAGSADFESSNKPHEVTQPASKDHENGVSIDNSHRSEENEDGSSDHALTPPVSGATCESLAHNMSPKQSPPLQVMERPGGYDPLRIPSSIFENNKGTQPMDWSVASNESLFSIHVGNNSFSRDHVLLFGDPGKSGDITKSGESIMFSPLPPREMVTNDNQSSVPDMETNKQKGGSSGMADNTVKDPAEYQNEEDNTNQAVSWKSPSSSNRSYGSGDSVKSFSFPIKASTLAHIMPKFTFSLLYMDVFIFADLLCEFSPDRNACVLGMLVFYA\n>UniRef90_A0A0Q5NNY0 Response regulatory domain-containing protein n=2 Tax=Pedobacter sp. Leaf176 TaxID=1736286 RepID=A0A0Q5NNY0_9SPHI\nMRYKILIVDDDEIALFLHEMVVGDCGPIDDAETFSSAETALSYLGDINDGSCEYLILLDINMPQMNGWEFAEVVKNHPLREKIKIVMVSSSVEKKDIERADSSVVIDDYLIKPLREEQILTLKEQPKFRAFFNDHQ\n>UniRef90_UPI001D111BD5 2-oxo acid dehydrogenase subunit E2 n=1 Tax=Haladaptatus pallidirubidus TaxID=1008152 RepID=UPI001D111BD5\nMVEIIRIPKLGLSDYGDLVSWEAEDGEHVTAGDVVAIIESEKASAEVEAPTDGTLLGRYVEEGEEIEIEVGKPLAVIGDEGEEIPDISAIEDGSEVSTEGNSGKDNSSKNRATSSDDGSDVITDVKATPRAKRLATEKDVNLKQIEGTGPQDAVSEEDVQAFLESSDTDTKGDEQEVETEQSSSAGLTVTDSRKLTGTRKTIAKRLSQSAREKPHVMGTREVSVERIQALQSRLSERYGVEVSLNDIILFFVGRVLQDLPEFNAHFEDSQHKLIDEVNIGYAVDGPKGLVVPVIDDVTGRSLAELAERRRNLVGKVLDNEFTTVDLQDGTFTVTNVGVFNMDVSYSIINPPEVGILAIGRRKQAPVERDGEVEFETVVTMSLTIDHRVLDGADSGAFLECLAEYLEYPGNALESVQNEQESV\n>UniRef90_A0A7Y3X359 DUF637 domain-containing protein n=1 Tax=Flavobacterium sp. 
CLA17 TaxID=2724135 RepID=A0A7Y3X359_9FLAO\nMPTLSNLVAPKLGFSNGLVGNVMTGLLSNVISKAVQPNYTAQMNRQADEVGTRLLTTVGYSQSSLMNVSSSTRHAQIRAKVQQLIGSNSSSSWWSSGR\n>UniRef90_A0A2H0L707 IPTL-CTERM sorting domain-containing protein (Fragment) n=1 Tax=Candidatus Peregrinibacteria bacterium CG11_big_fil_rev_8_21_14_0_20_41_10 TaxID=1974792 RepID=A0A2H0L707_9BACT\nDADNNGIGDACDDPIATCEGVVLAPNCTTGNLCDNGDTMPGTEVCNIPNGVVEITCEDRPELCTDNCTDPTIVLNISRHTGDLCDTGEFCADGSERSGHWEVGDNCNYYPDECKVECDAFCVPNPNEECVPVTNNGEVTNNGGITNNGQIANNGDTHNNDTTNNGGDKIPAAPDTGCNVSTIDTPLQARDQIWALLMLAMAAGAMGYSKQRK\n>UniRef90_UPI0020C3A1E9 DUF2243 domain-containing protein n=1 Tax=Halomarina sp. BCD28 TaxID=2961595 RepID=UPI0020C3A1E9\nMARTTTRRALVAAGVFGFGFSGLIDVLVLHHVLQLHHLVSGLYPMDTLSGLRTNIRADGLFSLAMVGIAGVGAGLLWQSERRTEAPLALRPVAGAALVGLGAFDLFDVLVDHVLLGLHQPTMQGGVYNPHWAAVSLLFVAAGWLLYRSGRDAEDVTRDTAETANDRTE\n>UniRef90_A0A6P4XS04 protein timeless homolog n=1 Tax=Branchiostoma belcheri TaxID=7741 RepID=A0A6P4XS04_BRABE\nMDLYMMNCELLATCSALGYLEGDTYHKEPDCHETVKDLIRYLRREDETRDIRQQLGASQIVQTDLIPIIKQYHDDKALFETIIRLLVNLTQPAIVCFGKVPKDKMFRHYFLDVVSYLQGYKVAFADGEVWTVLSRKLYELLQLDWENRQEEDSLLIERMLLLVRNILHVPADPEEEKRTDDDASVHDQVLW\n>UniRef90_A0A7C3W5F8 4-hydroxythreonine-4-phosphate dehydrogenase PdxA n=1 Tax=candidate division NC10 bacterium TaxID=2072417 RepID=A0A7C3W5F8_9BACT\nMKRPLIAVTMGDPAGIGPEIVVKALQDEEVMAASRPLVIGDRGVLEQAARFCEFQGKIRVVGGPEEGAYTLGTIELLDLENVELASLKIGAVQGMCGRAAFEYIQKAAELASSGRVDAIATAPINKESLRAAQVDFIGHTEILSALTGATDPLTMFQVRTLRVFFLSRHVPLQRACELVTRERVLSYIQRCSEALRQIGVAEGTLAVAGLNPHSGEHGLFGEEEVKEIEPALREAQRLGCRVVGPVPADLVFHQALQGQYSAVLSLYHDQGHIPTKMVDFERTVSVTLGLPFLRTSVDHGTAFDLAGTGKASAASMKEAILVAARYLRDFRRP\n>UniRef90_A0A1G3PK91 DUF4294 domain-containing protein n=1 Tax=Spirochaetes bacterium GWF1_49_6 TaxID=1802189 
RepID=A0A1G3PK91_9SPIR\nMKHTLFLLLLLSCFSHLFAAPVNYPEIFGQDFMKALNISIEIKAQVVKLSKEMKADPELVLPAAFPELIRYSLFRDSMELFTLEVFYVNFGSGVNDFSVGIFQMKPSFVEQMENYLNTHDELKMYRPVFVYKFPNDPSAVRKERIERMTKIDWQIRYLVLFSKIAEQVFPKQPGQTKSELVKFYAGVYNTGFWKTKEQILKTMALNIFPNGMSYPGEQNNYSDIALYFFENYWQKFLKDDSIKSFPLR\n>UniRef90_A0A6A5RRK3 4F5 domain-containing protein n=1 Tax=Didymella exigua CBS 183.55 TaxID=1150837 RepID=A0A6A5RRK3_9PLEO\nMKETAHAEKLEKANVKELKAANKLYNNKIKEQKREAAAAAKEVRDRKCAEERVAIDARKAQRLKDKQARDAQKASQLPNKGKRKASKAPQAPAAKKRRSAQPRSGAVAAAAAPPRGTHTTRSGRTATLYK\n>UniRef90_A0A7W8D7Z3 6-carboxy-5,6,7,8-tetrahydropterin synthase n=1 Tax=Chiayiivirga flava TaxID=659595 RepID=A0A7W8D7Z3_9GAMM\nMPLTIFKVFQLEAAHRLPHVPPGHKCARVHGHSFKVEVHVGGPLDPTLGWVMDFADVKAAFAPLHEQLDHHYLNDVPGLDNPTSERIAQWIWERLQPTLPGLARVVVHETCTSGCDYRGPTA\n>UniRef90_UPI001069C9AA uncharacterized protein LOC114541692 isoform X1 n=2 Tax=Dendronephthya gigantea TaxID=151771 RepID=UPI001069C9AA\nMEKDKERSDKNVNEVQPVQTVPVERRVKTKALKGIYHSILMQNSKKTKSIEEPPPVKKQCVSAEEDDAPDDDDVYTTTMIEKQTYCALIPQKFKSLNDLCFSGVLQNCLAVISNVFTPKLAKNGNHFLKISITDPTHYGSYELMWFSKPTEFPNIYRTGEIVLLKGIKCQKYNEIHQILKNFTTNICVIPLDDDPPLMKKARQPLERYESKFGDAIKFLKKWRNSNITATTFSQLDVITTAVEGSSFNFCVKIMKLTELTCDSYCLTVWDGSRPSLQARAREENSNAKANACDVDEEELVDIIVLDQNRSIKKYNLRPLNVLALYDVTLNTDRRLELNMENEESGFTVVKPYCHVARYVPAREQRQEHTWNFKGW\n>UniRef90_A0A356NIC5 Probable dual-specificity RNA methyltransferase RlmN n=3 Tax=Verrucomicrobiales TaxID=48461 RepID=A0A356NIC5_9BACT\nMLPSLQSITPEILKSQLVDWKQPAYRGDQILDWVYHKRAVTVDSMSNLPKDLREQLDKNFKCYLPDCMQKQGSDDTTQKFLWKLNDGAFVESVLIPANPALYGEASDRHTLCISTQVGCAYGCKFCASGLDGWKRNLEPEEILGQLLAIEHHFQPKLKQGQGRKVNNLVIMGMGEPMANYENLMKALKIANAPWGCNIGARKITISTSGLAPQIVALSREPFQFRLAISLHGATDEVRSRIMPINRKYPIKDLMDACRQYLNKKGKMITFEYILIEGVNDGQNQIQPLADWARELHAKVNLIPYNTVEGLPWSRPEEDIQESFLEGLLSRGINATLRREKGHDIDAACGQLRLKVEKGLTE\n>UniRef90_A0A1V5K701 Cell division protein FtsL n=1 Tax=Candidatus Aerophobetes bacterium ADurb.Bin490 TaxID=1852830 
RepID=A0A1V5K701_9BACT\nMAEFSNRFLRGLNAGSVRPARGGANKAVGLILLLSLPFLLVVWFYTQSAKLSYDITELTRERDSLKSQNKMLEMKVQVAMSGSGIEHIARERYGFRPAKPGDVQVIKKEYGALGLF\n>UniRef90_A0A8H3UYL2 Carboxypeptidase n=2 Tax=Venturia inaequalis TaxID=5025 RepID=A0A8H3UYL2_VENIN\nMSRFVALIACVFALLNGLSIARETMDERARSSRQRRSEMMTPVRRSPLESRDNSTWRFLNSKSQAYAVDSLPDLDFDLGEMYAGQIPIGNDTSRNMFFVYEPTISEPVDEVVIWFNGGPGCSSLEAFLQENGRFIWGWGQYSATENLYTWVNLTNVLWVEYPVGLGFSTGNVTATSEEETAADFVAFFKNFLDIFAIKNFKIYVTGESYAGRYVPYVSAAMLDENNKESFDLAGALMYDPVIGQYEYVGQTIPAVPYIQEYSKFFNFNQTFMDQLASAHESCGYADFIDKYMVFPPAGVQPWLEGGFNNKSAECDVWDLAWAAAFQPNPCFNVYEISSMCPILSDPLAYPSDLQYQYDGMGGIYFNRSDVKAAIHVSQDLSWSECSGPVFVRSAGGLYGNGDTSLDPIQYVLPKVIEATNRVLVANGDYDFELITNGTLLSIQNMTWNGALGFQSAPTTEIDITLPDLQWQATFEASGLGGYDGPGQGIMGVQHYERGLMWAETFQSGHMQPQFQPRSSYRHLQWLLGHIDTLYVAKAMTNPENEYVSLNKQRCMNEVLVAQADEVKNLLIGAFNTPPGYRPAHAKGTVLTGTWTPTTLPSPLTKAWHIQTPTTVLARFSNNTGIPTIPDTDPNATPKGLALRFNYPPAAADGKRKHTDIVAHSTPHFPARTGAEFARFLKALGEGAAAVDGFLGTHPHTLEFVQAAKPLPVSFGTEAFFGLNAFKFVAGDGVETYVRYEFVPVAGVAHLSDEQARGKGADYLAEEIRERIGRGPVGIKLIVQVAEEGDVVDDITVHWPAERAKVELGTVWLDAVDEEGLETQKKTIFDPIPRVEGIEPSADPILDFRAALYLISGRERRAA\n>UniRef90_UPI0003871D39 macrophage-capping protein n=4 Tax=Falco TaxID=8952 RepID=UPI0003871D39\nMAPSDPRSPPERANPPGGTRGGAVRPPGVRLAVRRLHIWRVEKLRPGEVPKATWGTFFSGDAYLVLHNGPDERAHLHLWMGRDSSRDEQGACALLSTQLNALLGERPVTHREVQGNESDVFMEYFPRGITYQEGGVDSAFKPTRPSAGAGPVCKLYQVKGKKNIRASEQDLSWASFNTGDCFILDLGETLFVWCGARCNILERSKAQELAMAIRDGERGGKARLEIVVDGEEPPEMLQVLGPKPTLQEGSPEEDVVADQRNAGAAVLYKVSDMTGRMDLSQVATSSPFSQSLLCSDDCFVLDDSAGGKVYVWKGRKASEQERQAALKVAEEVITRMGHSPRTQVEILPQGHETPLFKQFFTSWK\n>UniRef90_UPI002022F6CD restriction endonuclease subunit S n=1 Tax=Pediococcus acidilactici TaxID=1254 RepID=UPI002022F6CD\nMSNKVPQIRFNGYSDAWEERKLGDVGDTFTGLTGKTKEDFGHGSAKFVTYVNVFQNPIATLDQLDAVEIDEKQNQVQKDDVFFTTSSEIPEEVGMSSVWTYDTKNVYLNSFTFGYRPRVSFDLNYMASMLRSPSIRKKITFLAQGISRYNISKTKMLEIEIPAPNLSEQKKSVRSSNS\n>UniRef90_UPI001CBE7AE7 immune inhibitor A n=1 Tax=Kangiella taiwanensis TaxID=1079179 
RepID=UPI001CBE7AE7\nMKIKLLAGLLAAAIIPSVNAAALESGAQVSPKDPALVNHERIIYWLEKRGELDANATDSQREAALATYLKGVRSNNVALPKIEQARLQRQQTSYLKGESKSHKRTDEKTVKVLAVLIDFPDLKHNAHGLTSGDTDMYYSSYPVSHYQDLMFSTTGFTGPSGQNFTSGYQYYQNESGGTFNFTGQTFGWVTADNNAKHYGQNDPDSNDNDKNVPALIKEAVTKAVAANSINLADYDIEDPYDLDGDGNVDEADGMIDHVMVYHSSIGEEAGGGNLGEDAIWSHRFFVDTNTNGYTIPGTGKKLFGYTIQSIDAATGVVVHEFGHDLGVPDEYDIAGSAVGSPVGYWSVMAGGSWAGEVAGTQPTGFSPYARAYFQSVYGGDWIDEQTVDFKAMATGSQNFDLVEAVNHNGLNQIRIDMPKPLVDFAPPYSGSYQYYSDEGHYLNNALSFDVNIPASGNSVLSMKARWDIEVDYDYAQVLVNGNPIAGNHTKVNNQYHSGVTHFITGESKTISGAEGALGWLDLTFDLSAYAGQSVTVEIKYVTDPAVGGYGLVIDDLVLNNGSDIFTDGAETEGSLTLNGFLRVSDKTDGKAQHYWVQLRSENGQDEGLKRTVYTPGVLVWFADEAYSDNKVEEHPGHGFLGVVDADQNPIKRNGSIASSSLQVIDAAFGLYNQKSYSGDSHLSSTATFDDSLDYSLPQQPESGLVLPTHGLSIEVTAQATNSSTATVKISKATPALTADFGFDIDYKQVAFSNNTKGGDANYTYAWDFGDGSAVSVDANPTHTYAQSGVYTVTLTVTDGEATVDSKSKSVSIADELQAEIVSSVNGAKVSVSGNAVGGSPDYTYSWDFGDGATSSNRSGEHTYALTGEYTITLSVTSSDKQAVEVSKVVQVVAALNASMNTSANGLKVNFTSNVGGGDGNYSYSWNFGDGSSATGANPSHTYASAGSYDVAFTVADSTGVEVTVNKTISVAEKSSGGGGGGSGNILLLMLLAAGLVLRRKS\n>UniRef90_A0A0D2KAI6 Pentatricopeptide repeat-containing protein n=2 Tax=Fonsecaea multimorphosa TaxID=979981 RepID=A0A0D2KAI6_9EURO\nMSMSLVHCLSDSVSSSGSFSRTFSRPFSISTSNFSASITSTKRPQRRSTSKSWLEDLSPRFFTDTPIYPDVLRIKPLTSNGAPPQDLSSLRPPPLPFIPPPQSNRNGRITLLQRLRYWWRRAAVMRKFYKQRIAQTRQNRKECALLSKRLPRMFVEHPDRAAIYGGSTFTVNDKSFPIPRISRREFQLLVQYGYDNWGFALAVRALPTSEKPEEDRNRQLKALCNRYDWFARNRNDKLDNVTDNSNLSHTAQAEEVFTLLQRRLLRWHYVVVDDALCKLIPWVPFAWTVYAARFFDRWCADYYRIITADTVLIMRQGGFNTLSADDIYDYCVKCASPTFISYAKQALQDGVNPANEAMRKAMIPVLDARAKRMLSIDWTRLKPHALGRIEPFSRVKDLKQPDSVWGRK\n>UniRef90_UPI001CCE8B09 LacI family DNA-binding transcriptional regulator n=1 Tax=Celeribacter litoreus TaxID=2876714 
RepID=UPI001CCE8B09\nMSEPDRISSKNLTMQDIAKAAGVSPMTVSNCFRYPDRVRPKTRETVMNVAAQLGYVPNMSAGLLAAGSSQVIGAVLPSIRNSAFYRYVAGLRQAATERGHELITMIAETPEEELSAVQTLLGLRVAGIALVAGPHVADLRQLLALSGTPVVESWGGEDAIGCGVAYDVGAASRELTQHLIKQGRRRIGFVQVLGGGEQRYTMRFPGFQKVMFDAGLADNLVLTVRAADGFGSGARILNEFLSLEPRLDAILCPTDVVAAGALFECQRRGLDIPGDIAIAGWGDYDIGRQLSPTLTTITPFSFDIGAGAVKMLLEGGAERPNSLLTPYALEVREST\n>UniRef90_A0A7D6Z791 AAA family ATPase n=1 Tax=Nocardia huaxiensis TaxID=2755382 RepID=A0A7D6Z791_9NOCA\nMAPNHQPFAQVRETHTGVVFLCGERAYKVKKPVVTDFLDFGTAAARERACARELELNRRFAPDVYLGLAQLSDPTGGPDEPVIVMRRMPDSARLADRLDADEEAPELSALAELLARLHDAARRGPEISAAGTPAAVRARWQALLHSLREQPLGALDPDDVEYAELLAGRFLDGRGDLLAQRIAQGRIVDGHGDLLAEDIFVLPDGFRILDCLDFDDALRYVDRLDDAAFLAMDLEFRGHSRLAEDFLREYLRRSGDAPPASLRHHYLAYRALVRAKTDRLRAAQGDPEAGGQARRHLRLTLRHLAAGAVRLVLVGGLPGTGKSTVAAQLGRLTGAEVISSDTVRAELRARGAITGRAGVFGAGAYRPQAKHAVYTQMLERARERLAHGVPVILDAAWTDVAERRRAVRLATDTCSDLVQLCCTCPGTMAAARMRTRAHGDSEATPAIAEAMAVAGEYWCGATLLDTTDTLEHTVAAALREWDAAPLRAPRRPESSSLPSR\n>UniRef90_Q31A46 General secretion pathway protein C n=1 Tax=Prochlorococcus marinus (strain MIT 9312) TaxID=74546 RepID=Q31A46_PROM9\nMKKFIKFLFFVFICGLVSNSHLVLTKDDNRSKKEIKLHELPIKIKNSKNNQIQLKTLPLPLIEVAANSVNSERNPFLELNKSIEEIGINPKKFFTLTGIIQTGEQLSAMLKSSDGVNLFKEGENINKNLKIKKISLENETVIFTDGENEFKLEFSEK\n>UniRef90_A0A848CYM8 YqaJ domain-containing protein n=2 Tax=Aneurinibacillus aneurinilyticus TaxID=1391 RepID=A0A848CYM8_ANEAE\nMSNLINRSAAEALRRQISEAAEAQRGHEMVSDFLTMMDRWHGSAEVWDDTLEAEILEQQAYAIRRLKVFPPRGTTYFSPSSANSCKREMYVKLTGAARDNSDSQPHQGRWQRAGTAFGDTIQRDLLFIEKHYEKKFGEKPPFVPERTAHGFPMWERFARKFHSVEHRGYTVNFLGQPDGILRYKDGTRVGLEIKSKQTTSAQTTEYSMRGPKEDHVKQCVVYSIMYGVDDYLIVYGNLSKKAWVMTPEEYAKNPDLRAFYIHVSESDRQALLDDFVDVLQAVKDGNPPRLDVEKWTFNNYKTACALSLTDAELEDIRKQVRQVGRSRLPDWKKQAYYDALDFIERVRKEAM\n>UniRef90_A0A1G5F3R4 Aldehyde dehydrogenase n=2 Tax=Desulfoluna spongiiphila TaxID=419481 
RepID=A0A1G5F3R4_9DELT\nMDTQQEMNKMETSLATMKRAFASSPMPSLNTRIGMLKNLKTALIEYTGKISSAMSDDYGKRSEIDTLIADIAPCIANINHTVGHLHEWMEPSKRDSGPLLSTASVEVIYQPLGVVGIVVPWNFPVMLSIGPLISAIAAGNRAMLKMSEFTPHTNKVLGEMLQSVFDEAYVNVFEGEAEVSAAFTALPFDHILFTGSTTVGRHVMRAAAANLTPVTLELGGKSPVIVADDVSMEMAVERIIYGKSLNNGQVCVAPDYVFLPEGRVESFIAEYKKQYGDLFPDGVDSENLTSMANTRQFNRIEGLLNGETEKQTRIEPCHGNSRDNAKNRLVTHMIVDPAKDSEVMTEEIFGPLLPLIPYGDVQEAMAYIQGNPRPLALYLMTFDEDLQQQVKTTVHSGGMCINDSVFHLAVDDAPFGGVGESGMGNYHGFEGFLTLSHSKTVMTSGTKHNIKHLFAKDDNAFKKAVLEAMLR\n>UniRef90_A0A1X1T8H9 Chromosome partitioning protein ParA n=11 Tax=Mycobacteriaceae TaxID=1762 RepID=A0A1X1T8H9_9MYCO\nMSADYDRLFHSPDAAQTPDEATLHVDRDALMRSNAAAPAPAGGSNHADGAVPPPLPITQPRTQTAPAPPPRHAEITTQMPPTTQMPPTTHMPPTTHMPPTTHMPPTTQMPPTTQAPPAQSPAPQRPPNGMMRTPQTNLPGGARFEAPRQATTPAPRPAPAPPPSAHFADAPPTEAAWPHGQPPAQPAPTSAAAMGNHRAIDALSHVGVKSAVKMPSQRGWRHILYLLTRINLGLSPDELYEMDLHARIRRNARDSYQIGVLGLKGGVGKTAVTVALGSTLAKVRGDRILAIDADPDAGNLADRAGRQSAATIADLLSDKELARYNDIRAYTSMNGANLEVLSSEEYSQARREFNDDDWKGATEVVSRYYNLVLADCGAGLFQPSSRAVLATVSGLVIVASASIDGARQAAVTMDWMRQNGYQDLLSRSCVVINHIVPSKPNIDVDDLVQQFERHVAPGRVIVLPWDKHIAAGTEIHLDLLDKVFQRRIIELAAALSDDFDRLERR\n>UniRef90_A0A0R3QEL7 SH3 domain-containing protein n=1 Tax=Brugia timori TaxID=42155 RepID=A0A0R3QEL7_9BILA\nMEKIKVINGLRTTISSLPVRESRKALRYLGRIKRTKRVKAVALECGLLRKLLPGFIVYFNVMLRKELVASGVRYGVMEAVAEHDFNATAEDELSFRKNQILK\n>UniRef90_UPI001944A0FC hypothetical protein n=1 Tax=Levilactobacillus andaensis TaxID=2799570 RepID=UPI001944A0FC\nMEREQQRLDTGLAAELNAALKTKRTQLELLQLLYGQTPRSQRQCSSVATEQVVRTDAE\n>UniRef90_A0A672LGG0 C-type lectin domain-containing protein n=3 Tax=Sinocyclocheilus grahami TaxID=75366 RepID=A0A672LGG0_SINGR\nDQNDLDLKIQDQVIHLTFLLVFQRGSRCLVLITVGLGLICVLLLVFIILQHITITAERDRIKSYKNTAEEFNQTINSLQDNHTDLTIKKSQLQDNFNSLSQKNLELESQVRSLSDQLKKESKRGQICCFWSSSLLMHVYSFLKCLCKNLCGLDGFFLSNEFKSWSDSRQYCRDHGADLVIINSGEKQVSFLWIGLSDRQQEGNMKWVDNSPLKQGFWLKGEPNDQGGDEDCIELMPSNPVLNNWNDLSCSEKRKGICQK\n>UniRef90_A0A538MFC4 Thiamine-phosphate synthase n=1 Tax=Actinomycetia bacterium TaxID=1883427 
RepID=A0A538MFC4_9ACTN\nMRLHAIVEDLASARAAVEGGATVVQLRCKGASTDELVEAGRGFGVLEAAFVVNDDVEAALRLGADGVHLGRDDPGAERAVAAGLLLGTSAARVEEARAGEALGAAYVGAGPVWATPSKPDADPPIGLDGLAEICAAVSVPVVAIGGVDASSAGDCIRAGAAGVAVIRAALDAAAVRAAVDAAL\n>UniRef90_A0A7V9WRH6 Nucleotidyltransferase family protein n=6 Tax=Streptococcus porcinus TaxID=1340 RepID=A0A7V9WRH6_STRPO\nMEVIDKLISQNAELMNLLKLIKGLDLPDSWLCAGTLRNFIWNKLSNHNEILTTDIDLVFFDPNMTYQESLALEQSIMRKFPQYNWDVKNEVYMHYHTPAASAYSSACDAISKFPEKCTAIAARLDDKNQLELFLPYGEADILQFQVNPTPYYTENRERHKKYNQRQYQKNWSSTWPQLKVSFFPE\n>UniRef90_UPI001CD804F7 response regulator n=1 Tax=Desulfuromonas sp. CSMB_57 TaxID=2807629 RepID=UPI001CD804F7\nMGHKVPKILVVDDEENARLALRVILQQEGYQVDSVANGLEALEFLRRHRVNVVISDIKMPQMNGLAFLRELNRRYPSTRVIMVTAHGGIESYLEAIHLGAFEYIHKPVRVEELKWVMSKMFNEGRTAKAN\n>UniRef90_A0A167SRD8 Uncharacterized protein n=1 Tax=Fibularhizoctonia sp. CBS 109695 TaxID=436010 RepID=A0A167SRD8_9AGAM\nMCHCGAECHHNINLFEVSQKSDHTSSEVQLIGLLFPYVARLWQRVNITLIAAAVCSRNGDLFGDVEMAAS\n>UniRef90_A0A5B7IY87 Secreted protein n=1 Tax=Portunus trituberculatus TaxID=210409 RepID=A0A5B7IY87_PORTR\nMLRLMLLSGWILHYHYATTLPRAPPCQCLTPSRPCRHLPLVKTRQQNMEYRLGPAECRRVLCNATPHSQSGLPPPCSFRPSDQHPTTPLVFPPLPQHTL\n>UniRef90_A0A6M0BSB5 Uncharacterized protein (Fragment) n=1 Tax=Okeania sp. 
SIO2H7 TaxID=2607802 RepID=A0A6M0BSB5_9CYAN\nMLNLAVIYIDNIFTNVEKKETGDRRQEMEKGVRRQESGDRRWKKESGDRSQETGVRRQELELCFLERSLKKELIDRMKREPAKN\n>UniRef90_A0A7S1N3F1 RRM domain-containing protein n=1 Tax=Eutreptiella gymnastica TaxID=73025 RepID=A0A7S1N3F1_9EUGL\nVEATAAGAAPTESKAKGTKRKRLPPASEDAAERPPPSKKERKGQLVSATTPKEVAALPPPPADVREVWMTNLPVIVSEKDLYAAYEELGWEAITKVKWMQRTHAAGTSFRRCAYVTFATPDLARRACTLDVEIKGKKPKLELTNPHHVHKSLELFTQGWPTQITDKQVHEAFLLLGLTGITAIRWLPKKGNRLSCFLDFDSKEARDKVLQGGTLQYKGRTVLVQKPLNTLPSDQRTAADRSAKSCELFLDPCFKAMTNDIIQTHYESTLGPDTVVTVRRWQNRGWVVFKTHELALQASKMKPPRNPGKEQVLVRWRLNAK\n>UniRef90_A0A4Q3K0R9 MBL fold metallo-hydrolase n=1 Tax=Myxococcales bacterium TaxID=2026763 RepID=A0A4Q3K0R9_9DELT\nMASLGEGNGKHPADFGVGVRPLTEVSPASGKPVLAFASHAHVDHIGSLHLYERRAGHPLEAHTFAAMDDLGTLAPEFIGIEGAVTASPSPGWTMADYALVPAPLTELLGEGDHVDLGDRRFTVLHLPGHSPGSIALLDERNGDFFSADAIYDEGLVDDIPGADIETYLRTMRRLADLDVGTVYAGHGEIMDRKQMRDVALGYIASKGG\n>UniRef90_UPI000719B42D xenotropic and polytropic retrovirus receptor 1 homolog n=1 Tax=Priapulus caudatus TaxID=37621 RepID=UPI000719B42D\nMSTARTCMLPTMLKDLLYAAQDEAPNADAVDDDHVQRFLANFEERFFRKSDQELVKINTFFSEKLAEAHRKWANLKSELGELEERDRNHVSGHQRRKLSSVVQRAKNKKEPAVRNLPQLKLAFSEFYLSLILLQNYQQLNFTGFRKILKKHDKLMQTETGSQWKSVNVASAHFYINKDIDRLIQETEVGRGYYEAIIPRNSGVRPWHSSEDHAGW\n>UniRef90_UPI00123D7996 HNH endonuclease n=1 Tax=Roseibium aquae TaxID=1323746 RepID=UPI00123D7996\nMIEAPQSFVVREECGKAAFQNGFRRKREEREGWAGFSSTTVPGTIHLAAASAQGPWFLALDHTGVVEELDIPVVDIAGPGLARYAFETLGQVYAVLPRIYQLAASLPDAPLQEFETKVKDLPKTTEAERLVVQRIGQDIFRSGLLEYWQGRCPLTGISDEPLLRASHIIPWKDCESDAERLDVHNGLLLSALWDAAFDRGLVSFDDVGQPIFSPALGEHARSELRWQQPIALTEKHRARLAWHRSHLFKAEQ\n>UniRef90_A0A3B6R914 Homeobox domain-containing protein n=2 Tax=Triticum TaxID=4564 RepID=A0A3B6R914_WHEAT\nMSPSTSPESGISAGTKRGLEHTSSGVFPAASSDEDDGGGDGAGGRKNLRMSKDQSAVLEECFKTHSALNPKQNKALANRLGLRPQQVEVWFHNRRARTKLKQTALKAAPQAHNGASEGPLTTLTMSLSRKRVASTSSASACTVPRFSANAGTGMPMPSLKEWQFFCAFRDTGAMYGGSSRLAKVVKPAR\n>UniRef90_A0A401M0J4 Potassium channel protein n=3 Tax=Bacteroides TaxID=816 
RepID=A0A401M0J4_9BACE\nMKSALSDFVWEKKGIYGILHVVILLMSLFLVISISIDTFKGIPFYTQTSYMKVQLWICIWFLFDFVLEFFLARHKWHYLRSHFVFLLVAIPYQNIIAYYGWTFSPEVTYMLRFIPLLRGGYALAIVVGWLTHNRASSLFISYLTMLLATVYFSSLAFFVLEHKVNPLVVGYGDALWWAFMDVTTVGSNIIAVTVTGRVLSVVLAALGMMMFPIFTVYVTNLIQRFNDQKNKYYQQQTTQQESVVSQGQTSPQGQTSQQSPTEKSAS\n>UniRef90_UPI001FE9B9A5 beta-lactamase family protein n=1 Tax=Sphingomonas colocasiae TaxID=1848973 RepID=UPI001FE9B9A5\nMLALALLSLPAALAAQAPVPSDTPGKTASGISYTQPRDWTMTVKGSATIFAAPEANLNIAVVDAGEAESAQAAAAKAWAAYRPDAARTVRLVSPAARGDGWDERVGIAYETSPNERATVSALALRKDKGWTVVITDGAESTANKRSAATSVIQGSLRPAGYAPETFAGKAAHRLTPDRIQAIRDFVAESAKQLEVPGVGIALIDQGKVVWEGGVGVREIGGNEPVTAHTKFMVASNTKGMATLLLSVLADEGKLRWDQKVTDLYPAFRLGSDAVTQSTLVRHLVCACTGLPRKDYAFILADAGAPASDTFRQLAETQPTSKFGELFQYNNLMASAAGYLGGSLAYPKMELGAAFDKAMQTRIFGPLGMRDTGFDNAAAEKGDWARPHGLDVDGRMVEIPNTFNHLIVPHRPAGGAWSSAADMARYAQLELSKGLTPEGKRLVSEANLLERRKHGVPIGENGWYGMGLMERVVSGVTVVTHGGTLQGYHSSFFVLPDAGIGAVILTNADPGASMIAPYLRRLLEVVYDGKPEAAQDVAAVAARIKAQAQARRAKLTVPGDPAVLAGLATTYRSQIDGKISFSDRGGAKWMKAGFIEGPVATRKNADGTVSIVSAGGGAIGVEAVVGSKDGARTLTVRDSQHDYVYTEVR\n>UniRef90_A0A536UTK9 SCO family protein (Fragment) n=1 Tax=Betaproteobacteria bacterium TaxID=1891241 RepID=A0A536UTK9_9PROT\nREFKFYYSAQQADAQGNYTVDHGAGVYVFDPRGRLRLMMRPGSAVDAMAADVAQLLKE\n>UniRef90_A0A290RU70 Cytochrome b561 n=15 Tax=Pseudoalteromonadaceae TaxID=267888 RepID=A0A290RU70_9GAMM\nMFKNTPTSYGLIAITLHWLMAFTVFGLFGLGLYMVELTYYDSWYKGSLDLHKSIGITLAAVLIFRILWRVFSPKPRPLSQNKTVNHIAHTAHIVMYLILAVIVVAGYLISTADGRAIAVFSIFNIPALDYNFDGQADIAGKIHYYGACTLIGLAVLHALGALKHHFIDKDKTLTRMIKPKEY\n>UniRef90_A0A7W1BD12 DUF1570 domain-containing protein n=1 Tax=Actinomycetia bacterium TaxID=1883427 RepID=A0A7W1BD12_9ACTN\nMTASLDECWLKITRAESHFDIVKSAIHGFLQPNPERIAGQLDAESGEEVYYTRRYPGTRREWSIIIGDALQNWRNALDYIVCGLVRMNGEEPSSSNAFPIVDRESDYPAQSKQRIARVYPGSEAVVEGLQAFNRGNAPEDDPLCRLRDMNNWDKHKALHTTTHVVQLESAWPVRMSEDPSAGKFVSGAFERERPLARIPADRELGQAYAEMVFDATFDIAFEGGPPLTEGLEVIETLQQIGDFVRFETLPRFAQFFA\n>UniRef90_A0A7C3X0Q5 Aldehyde dehydrogenase family protein n=1 
Tax=Candidatus Hydrogenedentes bacterium TaxID=2030809 RepID=A0A7C3X0Q5_9BACT\nMSKKELKVINPYTEKEVYSFPMDTIEDAYQKIENAYKAFQEWRFTSMNTRKELCLKFMKEFEKNRDNIAHEITEQMGKPLQQSQNEINTMLDRAQYMISIAEQTLADEYLPEKPGFVRYIRHEPIGVVLDIAAWNYPLLIAVNVIVPAIMAGNAVIVKHARLTPLCGKAFVEAFEKAGAPKGLIQDIIADHQVIDAVIKHPKIGFVSFTGSVRGGHEVVQSASTRFINQGLELGGKDPAYVCADADFDYAVANCVDGAFYNAGQSCCAVERIYVEKPIYNQFVEAFVELTRQYKLGDPMQKETTLGPLAVSSARQFLKKQVEEAVAQGGKLVVSPDEFEVPDQGWFFAPAVVADAPQKSSLMQEESFGTVIGILPVHNDEEAIEYMNDSPYGLTASIWTSDFERAKRIGERVETGTFYMNRCDYLDPALPWTGVKDTGRGASLSHYGYYQLTQLKSMHLRIKW\n>UniRef90_A0A7Y5VDB2 Rhodanese-like domain-containing protein n=1 Tax=Saprospiraceae bacterium TaxID=2202734 RepID=A0A7Y5VDB2_9BACT\nMFGLFQRTSSDYKNLNADDFRKAIEHDKNAVVLDVRTPAEAHGGKIKGAKVINFMDPGFATAISKLDPGKSYYVYCRSGVRSANACQVMAKNGFKELYNLRGGVLDWPFQLL\n>UniRef90_A0A1F2RY10 Lactamase_B domain-containing protein n=1 Tax=Acidobacteria bacterium RIFCSPLOWO2_02_FULL_68_18 TaxID=1797185 RepID=A0A1F2RY10_9BACT\nMTGRYVGIVAALALGGASATLQDATSVLNDAARALGASELRTVQYSGTGFVYAFAQSYRPGGPYPKFHATYSRAIDFERGLSRDETVRTQFEDPPRGGGGQPLYRDARAAGVVTENSPWGAGALALTPHGFLQAAMRATPTISTRRVGGGTVTVISFTARERYRVDAFVNGQHLIDRIETRAANPILGDMLIETTFAEYRAFGGVQFPTRIAQRQGGFPTLEIAVTDVRPNAAVALEAPEGGAPQPARSEGQRIAEGVWYLAGRPDPNSQLVEFRDYTVLIESSVTEARALLNLAEARRLVPGKPVRYHVNSHHHGDHAAGLRAMVAEGVTLITHETNRPFYEQTVLRNPHTLAPDLLARNPRPPAWVWVNDKYVLSDPTRTLELYHVENGHAANLLMGYIRQEKLLIITDIFNDFGEPRPNDPPSGLVSPYYAALGDRIRRLGLDVERIAPSHGTGTVPAERLWKALEGKVQAPPVAGR\n>UniRef90_A0A7J5FRL1 Transposase n=3 Tax=Bacteroidales TaxID=171549 RepID=A0A7J5FRL1_PHOVU\nMGIDDQNKLVNAGFQIIRKDDYPSPRIKFCTGRNGSWKTYKKFETKAERDRAFALLLKDEKIISD\n>UniRef90_A0A0E3X9I7 Group-specific protein n=1 Tax=Staphylococcus phage IME-SA2 TaxID=1610831 RepID=A0A0E3X9I7_9CAUD\nMDYREKMVSQGQPPLSNFEYYHVIVPYLVGVIVIILSIIFRDSLYSAQSGFGVIITSFIYMLVYVIIGLVGSFVLTIFQARKARQYQTQEDNNEVQ\n>UniRef90_A0A2K2F967 Protein jag n=1 Tax=Pseudoclostridium thermosuccinogenes TaxID=84032 
RepID=A0A2K2F967_9FIRM\nMSYTIEKSAKTVQEAISAALEELNADENEVEVEVIDEGNKGIFGIIGTKLARVRVTLLDTPAKKAQDFLEDIFSKMGIAPEMELTEEDDTLSIKIKGKDIGIIIGRRGETLDSLQYLTSLVANKNGGKYKRVIIDVENYRQKREETLIKLANRLADRVVKYKKSVTLEPMNPYERRIIHSTLQNHKSVETYSVGEEPNRKVVIAPK\n>UniRef90_A0YFF1 Hcy-binding domain-containing protein n=1 Tax=marine gamma proteobacterium HTCC2143 TaxID=247633 RepID=A0YFF1_9GAMM\nMVMSKVVLLDGGMGQELLRRSSQKPHSMWSARVLLEEPEIVEAVHRDYIEAGARVITLNNYSATPERMAREGHPELFDILQKKAIDIAKRARDNSPRARDHDIKIAGCLPPLFASYKPELAPNFEECLERYRVIADIQKADVDLFICETMSSIKEGTASAVAAASTGLPVWLGLTLEDNLEGRLRSGETLADAMAPIVDLGVEALLLNCSMPESINAAIGTLINGYDTVGAYANGFTSIAALKPGGTVEELQARQDLSPNGYAKFALSWVDSGAKIIGGCCEVGPAHIAELEQQLLAKGHEICSAL\n>UniRef90_A0A2T9WSI7 Nucleotidyl transferase n=1 Tax=Nanobsidianus stetteri TaxID=1294122 RepID=A0A2T9WSI7_NANST\nMSLYTLILAGGFAKRFRPLSDYVPKPLFPVGGVPLIYYIIEKALETGSDGIIISTNKKYEYHFRHILASLYSFYEPSQIGKIRLVIEPSNSEENKLGSIGGLHYAIKEMGINNNLLILLGDNLFSFNLNKIIKLGNENNSIALAIYDVKNPDNAKNYGVVKIENNIIKEFYEKPQNPLYTTISTGIYYIPREKLYLLDEYMNSNYSKDSMGNFFEYLIKRGEKLYGYIYIMTIMNIGLILVQ\n>UniRef90_G2I2J0 Competence-damage protein n=10 Tax=Komagataeibacter TaxID=1434011 RepID=G2I2J0_KOMMN\nMNPTACLLVIGNEILSGRTQDVNVQYIARRLSETGITLSEVRIIPDIRTVIVRNVTETRAAYDNVFTTGGIGPTHDDITSACVAESFGVPWVHHPETFRLLEAHFAPDAFNAARQRMATMPQGATPIRNSVSVAPGFTMGNVHVMAGVPRIMRAMFEEVLPTLPHGTPVTSQAWHANGLYEGALAASLEAIQHCYPTVDIGSYPYRLDESQRGVCLLCKGTDTQAVQDAATAVRNLIVEMGFRPQAGEPAKA\n>UniRef90_UPI0008255106 DegT/DnrJ/EryC1/StrS family aminotransferase n=1 Tax=Bacillus acidicola TaxID=209389 RepID=UPI0008255106\nMISTQLRNIPFSPPDLTEKEIEEVIKTLKSGWITTGPKTKEFEKKIAEYVGVNKAVCLNSATAAMELTLRILGVGPGDEVITSAYTYTASASIIEHVGAKIVLVDTAPNSFEMDYKKLAEAITEKTKVIIPVDIAGKMCDYDTIFEIVESKKELFNSNNELQGLFNRVIVMTDAAHAFGAERRGMKCGQVADFTTFSFHAVKNLTTAEGGAVVWRDIFGLDNEWLYKQFMIYSLHGQSKDALAKTQKGAWEYDIVYPAYKCNMTDIMASIGLIQLDRYEKLLQRRREIIEMYDKALSPIGVQSIQHFGEDFSSSGHLYLARIPEINEQHRNEIIVKMAEAGIACNVHYKPLPMFTAYKNLGFDIKDYPNAYNQYVNEITLPLHTLLSDEDVEYVVGNLKWNLNEI\n>UniRef90_A0A455ZFP0 Paeninodin family lasso peptide n=1 
Tax=Elizabethkingia anophelis TaxID=1117645 RepID=A0A455ZFP0_9FLAO\nMVKKKDYIPPKLEVEIVEMECGIAANSAAVSPQTVNGNTDEAQTDWNGNDDTTIDTPF\n>UniRef90_A0A7S3Z719 RNase H type-1 domain-containing protein (Fragment) n=1 Tax=Lotharella globosa TaxID=91324 RepID=A0A7S3Z719_9EUKA\nWSLLLAPKAFLKRATSMQRRTLKRFLSLPTCAGGDVAEVYAAIAPLDVLLHRLCAGTLVRMVSAEDHEGRLAYRRYLDSDQPIKDIRRKVSTWKSPFGVMLKAAQALGLPLFPRAKRVRHAMAKSNVNVNVPVFKNFNKKFSERCKKKAREFAESVIANIPSDEYTLYTDGGQCDDHKFAAVCGVKDNMESFTLCFRLTGAAVSSHVAEVYAIKAAILWSIKHDVKVHIVSDSQAAIRATLSPASQCIHARKVHTLLANSKVASLVWVPSHVGLPGNERADAIASGGDHSTIVRVPTSVSDYTNRIKLRALEIWNDRWKRSKNSKELHRLMPNVPHDRSHILGCITARIMARLRTGYCSVASFLHRHKLKDSNLCGRCLDVGKHRVETVAHFFVCKANRPHSTAVLVDFTAILGHRPTSLSEVLDVNLYLSKQI\n>UniRef90_K3VTF1 Adenylyl-sulfate kinase n=2 Tax=Fusarium pseudograminearum TaxID=101028 RepID=K3VTF1_FUSPC\nMTLKKLTLPYYAPNAEASDKYPSFCPRLKPSDCNKKVERPAPIVHINGFPGVGKSTIAKKLHEHINKWKIKVVQHHELDLLANTIKTPETFDHEQLRRATRALALNTIAESEDRLDTCYVFEDFALNNQGGFRIMEEYRLLALRRGCSLIRIELTCDDVAYKTRLKDQGRIDFRTENDYPRRSCLTCTDQRLVTSPILCRGFSDGGLKSLDVSSKPELWTAMSAAHHVMVTWNAGL\n>UniRef90_A1DJ33 Cyclic nucleotide-binding domain-containing protein n=11 Tax=Aspergillus TaxID=5052 
RepID=A1DJ33_NEOFI\nMERVRKTFFNPLATSKAQVEKILEGLPVGSAHPFSLEQILLCRTENGIEEIDISSYPENFFFNAMDLGEMGEILLRRMAGFQSHLKVFEDFQITQAPSSTFKIPIVSDQITILAVSERTPTYYDFCFADESCNACCWLARNTFPGITHSGDILNGQDLLDYVKINKDSLIEKEICVFISGYQSTLITRFLGTHPALLVADHVDKVLYIIPVPLDAATIGDATICCPLVIKRDGDSLIYSILPTATTDRGMMCDSNKLVSPAFPEAIKRADFTMCTPDLTTRKTAPANDSVVEDTASNSENLRKIITKENAIFTTDSAALPSFIDLEKTQIIRFGTGLEFKLPDEEVPMREEPSAIVLPCIFGTELQGPVLLATGTVPSNVPFPNENALRDYYKQLKNAVVIVDERMTDNARNLASAYRINALFIVQLTPETEPKDTNGVISLMDLANINAVTALAGPQSLILVQISEKYYFYRGIANRAHLNTSGLAFGADVTSVLESVGIGSILDPRIERVINLGDANSIVLPTTGQLVQPQDLQKLFEEISVDQIQNLEEDISAVVPQLQVLLNQKDLQELSRALVTALSTKISNAATPLRDSYTKFLTQDYRMEDPKSVQKKNKMLGELRKITKDMQKALEPVISCLANMISSQTTSKRTHDLKRLVRQTTIQNNVEAVKSMTFETLSGYLEEYAGDMGVMLLNIETTPYRELLGNLKNSAIDASQCCALDSRILHLEGFDAGIIMEQSQTKHNGPLKSTIGPSQPILALPYLSQSSGTGSMLAWVLRWMEKCNEPHIAALRIIMRSTLGQAVASREHDIQPSSPETGHLMSALLMAAMSKLAAMRTSKPVELEKAEDTVTRLMRGLFGNLLTIAGSGIRPLSMVWQLFGLNPQYDLPTSSAEWIWYENVVALYPYTGWPLRQFHGNLEKLLDKAVIRVVTKNENLARIKASRTAEMVKFCKLRNIQLEHSRTIITVFMRMLTAEDIDLQPVAARLLAQLPHKLERQSQSYTRMIMYLNHLARGGERRVNDDLTAANVYTSRSATFAELKKQVCEACKRSDWARMKEACQEIMTKHVEIAALWRVKPESLKIQNMKLYKALLAADFDDIDQNTQIKNIELTRQVLGDAENKRVPWQVGKKGQFGSSIEPLDEVFLHEIMTGEKSEPAPPATIDDFKGEEERAMIETEDEFAEFESSLRAEFIKTMQKNLSAEEVCDIINVPVSAMRVFIKALNPEFIWEDLAVNFKSVILELVKDRSNRVESRPVRRLLRIEVRKNLQIEG\n>UniRef90_UPI001C2561C3 uncharacterized protein LOC121770608 n=1 Tax=Salvia splendens TaxID=180675 
RepID=UPI001C2561C3\nMSAIEKKIEMEDEEKEMIDHWSHKHPLTLVDTTGSDRCYGCERSFSSGEQAYGCSIPGCEYSELLHEECSAMAREIRHPLHTQHILSQRHSQELFRCLICEGIIYSIGYKCTSSGCGYQVHLMCAHDKGVVDANHPEHELKLWRRRCSFKCDACGITSRGSSYTCIKGDCQYWIHVRCASLPQTLKREDHHHSLSLSSYIPPEYIKYNYKCDVCSKALLLKYWIYHCQICRFIVHIKCAFNKPPPPLTDASIGKDIVRLPMNEVAVELVTPFVMRQRGGEVGTLIPPFLIPATAVFDEEDELVNMKYKFLHHQHHLTLVSSTSQHPQILGEEEDEENYGVRWELICDGCITPISSSSSSSYYYMSCSECKYNLHLACFHLPPQLYSLPLHQHDDHQLVLQSCDKHQPWNYETCSVCEYPMNGLFYSCTACDFEVDIKCACMPDTIHHAAHPRHLLKHVTQSDLGRDINRWSLSCAATCGQHVVNYDCYRCCNSSCDFIVHVRCAVLLASVSSRRWDEQHPLLLTYDATVNRPGDFYCDQCETQMNPRSWMYHCRPCDVSFHPRCFITTSGEYRNIKMGQEYDVNEETHPHPLTFQLLTTKRRCNICHINNYELQGFYCALCNFFICYNFCGKGMIAKGDLKAVDLGKLSVLDH\n>UniRef90_A0A0G1JNZ0 Integral membrane protein-like protein n=1 Tax=Microgenomates group bacterium GW2011_GWA2_44_7 TaxID=1618500 RepID=A0A0G1JNZ0_9BACT\nMGNPSTRQFLLVAALALFLRLILIPHPGFLADIAYWKWWTKDSAQNGLVHTITQTGINYPPLYLTIMKATGHIYGLFANLNNDIQYWDKGNLLFLFLIKLPFILADLSVGYLIFWLLRRFYQRNLSHLGHLSNLPLLGAAFWLLNPGVIYNSALWGQTDSLGVVPILLAYLFAVSGRPIFAGALTGIAFFLKAQSIPLILFLYLYLYLKNGLLTTVKSGAAAVTAGLIVTSPFFLTHTMDRIISTIFTSVGYFPYASLYAFNLWWLVIRGASFQFPDQTLVGNLLSYRTIGFTLFWSAFGFLAFVLWQTALKKNAQELTERFLLSTPLVILSMFLLPTEIHERYLLPFFAFALLPLAFDAISARVKNIKLYLFSYAVLSLIWLLNLHFVMIKNYPENEQPILSLISPSMPVLGVVFSAVSVTLYLVFFGVFLKRCLPTNLKSRILAIGLLILLPLGLLSLQAAPVIKAKSQSKVLLSEIKPTFVRQGWGELSKDKSVAGGNLSTWYFFSWKGLGTHANSQIDFNLDGHYRRLETNVGVDTGGGEAASVEFLILGDDKVIAKSGILKKWQYQKSLVADLTGVKKLSLVVTDAGDGINGDHADWLYPTLYK\n>UniRef90_K2AFW7 Extracellular solute-binding protein family 3 n=2 Tax=Bacteria TaxID=2 RepID=K2AFW7_9BACT\nMKKLLLASALLAFGAGLASAEVVRLATEGAYPPFNFIDDKGEIAGFEREFGDEICKRAALECTWTTNEWDSIIPNLQSGNYDVIIAGMSITEERGKIITFSENYYPPAASAYLAASADADVKGGVVSAQVSTIQAAYVAESGATLLEFPTPDETVAAVRNGEAVAVFADKDYLRPFADESNGALMFVGDDISIGGGVGLGMRQSDTELKAKMDAAIQAMKADGSLNTLIEKYFGAEGLKF\n>UniRef90_UPI001E5627F1 hypothetical protein n=1 Tax=Streptomyces sp. 
VRA16 Mangrove soil TaxID=2817434 RepID=UPI001E5627F1\nMRTLHGEWTKFRTVPGQLWTLPALPLAMIVCTALIAAGAHPEQEGTLDVTALSLSGVYFAQAVAVLVAVAVVSAEYPRMMRTTLAANPRRGTVFTAKTLLAAGAVGVLALPGVTGALLTGRAVLTGGAARLPLSSWPLWRATLGTAVYLLLVALLTTGIALIVRHAAAAVGTALTLLYGPYLATLIIEMPDHALHLVQKISPMTAGLAVQTVGGAGGTSPWSPGAGLAVTAVYAAGALVAGWGMLRWRDA\n>UniRef90_A0A3B1DZ09 Chromosome partition protein Smc n=1 Tax=hydrothermal vent metagenome TaxID=652676 RepID=A0A3B1DZ09_9ZZZZ\nMKLNSSGKTATIFLVIFSVLLISMTAISVFIFQKEKEMRIESEGDLEKKRSEVIELKTEMREVKRKNFLLQEKNKEADERVNSLMDEVELEKGLKEEVKQENVALEEKVEMFIIARKKLDEKIKKKKEDSQKKVAEFKTLLQAEAERLKEIESLKKVNKELEQKNKDLQGQVTKILEEGKLLKEDNKGSEVIKEMGEVKKKVKNKVELEPIIVTPASGKIAKDNKEKKSVQEEVAQTVANSMKGRIISVDRETEFVIVDLGKKSGIKMGQVMSVYRGKEYLGDIKITRIQPKMSAADLIPPFSSRIVHKNDQVVVK\n>UniRef90_UPI0012E1D502 hypothetical protein n=1 Tax=Pseudorhodobacter antarcticus TaxID=1077947 RepID=UPI0012E1D502\nMRSLISSSAQAVACRAPAVTAVTAVTAVTAVTAVTAVTAVTAVTASLIRVSVLIKPL\n>UniRef90_A0A2D9X1Q0 Protein TPX2 n=1 Tax=Actinomycetia bacterium TaxID=1883427 RepID=A0A2D9X1Q0_9ACTN\nMKELDSPRNFSRDLQTPARILKVTRGKKKVTRATKLLPIGQSKKLENKFVESKRSAFKTVKPKGKLSPIQEVTQKTDKDSNTSLRSVETPLSRSLELPPPPPAPKKERAGRLEPLAQGIETNFYKNYYSL\n>UniRef90_A0A7V6UPT2 Thiazole synthase n=3 Tax=Bacillales TaxID=1385 RepID=A0A7V6UPT2_9BACL\nMTDKLVIGGYEFQSRFILGSGKFSLDLMEAVVEYGEAEIVTLALRRANTGGEENIVHYIPENITLLPNTSGARNAEEAVRIARLARELGCGNFVKLEVIHDSKYLLPDNYETIKATEILAKEGFIVMPYMYPDLYVARSLVDAGAAAVMPLGAPIGSNKGLATKNFIQILVDEINVPIIVDAGIGRPSQACEAMEMGVDAIMCNTAVATAGDVALMAKAFKLAIEAGRSAYLAGLGRVLDFKAEASSPLTGFLED\n>UniRef90_UPI0005738328 YqcI/YcgG family protein n=1 Tax=Pseudomonas putida TaxID=303 RepID=UPI0005738328\nLRGVHARDPHPWPQAIPADPHDSGWSFCYAGMALFINMNFPGHHQMKSRNLGNHITFVINPRENFDEVANADTESGKRIRARIRERVQHYNDGVMPDSLGFFGQADNFEWKQYQLQEAGSLNPSRCPFHANVHAAPDTQIEN\n>UniRef90_A0A158Q2K6 Cytochrome P450 n=1 Tax=Dracunculus medinensis TaxID=318479 
RepID=A0A158Q2K6_DRAME\nMSVLGIVIVISMAAWMTWMLLRKVSSIFNKINIIQGPSPLPVIGNIHQIHFKPDDFFEQAQGIAYMLQKNGERMTRIWFSGWPWVLLYGAEECEAILSSNRTLKKPFQYGFLSDWIGEGLLISDPKKWRPRRKLLTPAFHYDILKDFVGIYYKHGRTLLSKFENMIGEHYNEIFHIVSYCTLDVICEAALGINPDAQNKPSPYLDSVWRMKYIIHQRTIKAQYYPKIFFNLFGNGSECKKHIKILHDFTGKAIKERKRLADEAGGIENLLKSESKRENEKISINFFTSLFIYFRNQNISGKKRMAFLDLMLDMHSKGDLSLDGIQEEVDTFTFEGHDTTSASMNWFLHLMGTNPDIQRKVQKEVDDVLGKVNLTRLMTDLEERPITYEDLGELKYLEACIKETLRLYPSVPILARLLQEETKIKNNTLPKGTGVIIVPSMVHRDPRYWPDPEVFNPDRFINNEVKHPYSYIPFSAGARNCIGQRFAIMEEKCILALLMRHLKVKSELRTDQMRVSGELVIRPFFGNNIRFAKRTYGDYTQIA\n>UniRef90_A0A3S1DSJ7 Alpha/beta hydrolase n=2 Tax=Halomonas TaxID=2745 RepID=A0A3S1DSJ7_9GAMM\nMLTKEQVVARNNVTIVGSGEKTLMLAHGFGCDQQMWRHLIPHLKERYTLVLFDYVGSGQSQISAFSESRYRALEGYAKDVTEICQALNLTQVHLIGHSVSGTIGLLASIAHPELFASQVMICPSPCFLNMPPDYYGGFECADIEELLGLMDRNYIGWANYLAPLVMGLENSELLTSELSDSFCSTDPVVAKAFAKATFFSDYRHLLPQAKHEALLLQSQQDSLASPDVGHYMHAHMPGSTLRLLASEGHCLHMTHPELVAQEINTWLRD\n>UniRef90_UPI001F334FC1 bifunctional ornithine acetyltransferase/N-acetylglutamate synthase n=1 Tax=Ktedonobacter robiniae TaxID=2778365 RepID=UPI001F334FC1\nMYTNFCSFSIKRLIHLCSKVACRLLVHILRDLLCERLRRCTVKVTVADAESFAQAKRVAKVVVNFPLVKTAIFCADPNWGRIAMVIGKCEAQTAIVLEKVSI\n>UniRef90_UPI001EE7BB04 hypothetical protein n=2 Tax=unclassified Micromonospora TaxID=2617518 RepID=UPI001EE7BB04\nMAVPVTALLAGCAPATAVAGGATGPVSARRSPEGSYAVGVRTNPNAAFPPRPLADTARRRRPLAERAA\n>UniRef90_A0A5E3WRX4 Oxidored_FMN domain-containing protein n=1 Tax=Peniophora sp. 
CBMAI 1063 TaxID=718367 RepID=A0A5E3WRX4_9AGAM\nMSTTDKVIPTLFKPTKLGNLLLNHRVVLAPLTRFRADDDSVHTELAVEYYRQRSSTPGTFLITEATVIAPQAGGYPNAPGIWNNEQVAAWKKIADVVHGNGCPIFMQLWSIGRVAVPEVLEKYGHDVVGPSAIALDANHATPRALTVDEIKEYVQLYAQAARNAIRAGFDGVEVHSANGYLLDEFIQSNSNHRTDEYGGSIENRIRFTAEVVEAIAAAVGPERTSVRLSPWSRFQAMRMPDPIPTFNALVQRLADTQPALAYLHIVEPRVNGEADATDVGEDNNDVLKKIWSPRPLVVAGGFSLETALQVSERQENVLVAMGRYFISNPDLPRRWQEGFALAPYERQYFYSRGSRGYTDYAPYVEATKIAV\n>UniRef90_A0A350NT93 COX3 domain-containing protein n=1 Tax=Flavobacteriales bacterium TaxID=2021391 RepID=A0A350NT93_9FLAO\nMFWTSSEFMIKNTTPAPSNRRDVFDGVEPAVRERTKKMLMYFIIFAVVMLFAGFTSAYIVSNMGQYWVNIEPTSAFWVSNVLLVLSSIGLWSAVRSMRENHKQRAVLALAFTLISGIGFTISQAEGWKTLAEMGLGWTTTDHESGLEAYRWNSIESLLESDAIYGQDYTISRGGEPLLFDASKNEFYASNDALMVRPITRDVARTSNSGASYLWILIAVHILHLTFGFIYLVINGIRVVQGTIHAKDVVQLESLSIYWHFMGALWLYLFVFLFFLH\n>UniRef90_A0A1J5ICS2 Polar amino acid ABC transporter permease n=2 Tax=unclassified Syntrophobacteraceae TaxID=869804 RepID=A0A1J5ICS2_9DELT\nMDLTKFFLVVAAVAGLLAVGTERLGYHWQWYRMPRYLVRIGDGGWRPGPLLDGVLITFKISGLSLILCFSFGLVAALFRLSHSYLARLLARLYVELIRNTPLLVQIFFIYFVLGPVLGITRFTSAVLALSLFEGAYAAEIFRAGILSIPRGQWEAARSLGLSTYKCYRAVILPQAVRHVLPPLTSQAISLVKDSALVSTIAIYDLTMQGQAIIAETFLTFEVWFTVAAIYLIITVILSILVNVMENRLRVTG\n>UniRef90_A0A5B8ASF5 DUF4760 domain-containing protein n=1 Tax=Georgenia wutianyii TaxID=2585135 RepID=A0A5B8ASF5_9MICO\nMSVEVWVTLGGVILAGLLAWHQLRASLYVRRREFEDIYVQRYWEISNRLNLDLRIGSYSGGDFAELADAEDKDAQYLAMWDYLALCEDQIDLRKSGNVTDEAWAVWSSSIAGTVSRYPYEAFYDLIEQGLDEAHVDESDRPWEHLRTLRHDPGAGLPDPYPLSGTGWRQRWRRYATGRRERVALTGLEVERLKMRRR\n>UniRef90_K1JNL9 ATP synthase subunit b n=2 Tax=Sutterella TaxID=40544 RepID=K1JNL9_9BURK\nMNINASLFLQMVVFFLGAWITMKYIWPPLIHAIEERQKKIADGLSAANKGEKALAIATEQGKAIEADARARATTIVSDGEKRAQSIVDEAKAQAQVEADRIIENARAEAAQEMQRAREALRNEVAALAVAGAEQILAREVDKTVHAAMLEQLKAKL\n>UniRef90_A0A1J4Z6F5 Chemotaxis protein n=2 Tax=Hydrogenophilales TaxID=119069 
RepID=A0A1J4Z6F5_9PROT\nMTTQRSFSIFDTAWGSGILGALAVAGPLAGTLAGGPWWPLVFALMAVALAVVCARHRLRQNAWMEKIRRMAADIADGHLSSRLTHVSDARSLAPVVTAFNDAMDRIEAAFREMSGALTAQEAGYTARHAQVIGQVGDYSHVLNTFNTVLASISKHKQAEAYNHMVVRVQSLNAAHLIPDLALTQADFARIVKEEEQVIDLASGSSQKANESAVAVEAMHQGFQRLQALIGEVSAAILDLSAKSSEINQAIDTIHALANQTNLLALNAAIEAARAGEAGRGFAVVADEVRKLAGHSKDAAMQIGNTMQALVSETQSMVVSAEEMRAITEESGRAAADISSEFSQIVSRSSETLRRAKTALTVAFASLTKCDHVVYKQRAYQTIVAGDESLRQQVDVDHHNCRLGKWYAGEGREQFGQLEAFREIDRPHAAVHDAVRQMLALTHQRTWQNDTAQMERVFAELQRMEDASEQVMSVLIALPEQASASSVPG\n>UniRef90_UPI0018C1FAF3 GIY-YIG nuclease family protein n=1 Tax=Actinoplanes sp. NEAU-A11 TaxID=2792083 RepID=UPI0018C1FAF3\nMTSSGTRPDDVPTDRARTEEALRLLSGVPTGLDVAVKMLSRGGGVYAWWAAPSIFPDLPGPSNLSVPSLRLLYLGRATSLRGRILRNHLRRSGSSTLRRTLAGLLTCEGYRTTWTDRVVLIPEDESRLTAWMYTHLRLTWAEDPEPATIEAELVRRLHPPLNVHGVDPEHIQPAVVAAKNSYNASSRPTERPPTL\n>UniRef90_A0A7C3K6X1 Ribosome maturation factor RimP n=1 Tax=Firmicutes bacterium TaxID=1879010 RepID=A0A7C3K6X1_9FIRM\nMTREAIVAQVEALVEPIAQRYALEVADVELLGQGARTLLRVTVEQPAGAERVGVDELARFSEALSRQLDLRDLIPHAYTLEVTSPGLDRPLKKDRDFQRFAGREVQVTTFVPVEGRRHFTGRLVGLEAGEVRLEVAGHPVRLPRAQVASARLSIDENELKRDLSGGGRAAR\n>UniRef90_A0A1E1W481 Chloride channel protein (Fragment) n=4 Tax=Pectinophora gossypiella TaxID=13191 RepID=A0A1E1W481_PECGO\nGGYATVGAAAFTGAVTHTVSTIVIVIEMTGQVTHLLPIMAAVLAANAVAALLQPSCFDSIILIKKLPYLPDLLSSASRMYDICVEDFMVRDVKYIWNRMTFQQLKDLLKENKTIKSFPLVDSPTSMVLLGSIHRWELVRVIEKQVGRSRRLQVAAQWLRDAERRRQENEAKKRRPSRFEVTPAPDMLQVPGTGMTRGSSLTTKDQGGLIPSPGQLFRPKSILKKTNSFTLTRGLVSPGVPQTPLSP\n>UniRef90_A4ERI7 Ubiquinone biosynthesis accessory factor UbiK n=1 Tax=Roseobacter sp. 
SK209-2-6 TaxID=388739 RepID=A4ERI7_9RHOB\nMGTIERLAEKLAEDTLKVQDALGEDRFYMEVAQVLGAASQSLEEAFLTEIRVSLADRKAREFISKKLAQVQRELEEKAKG\n>UniRef90_A0A7Y0XJK6 DZANK-type domain-containing protein n=3 Tax=Limosilactobacillus reuteri TaxID=1598 RepID=A0A7Y0XJK6_LIMRT\nMKKCPYCNTLNPDDAEVCENCGKPLKGRMLALVCPNCGKVNALGSRECSVCHTKLSQSNHQLVSREITPRKNNKRWGYIALIAFGILIALFTYLGGRYARSTSIPGKIEALEFE\n>UniRef90_A0A1Z8PZI4 HemY_N domain-containing protein n=1 Tax=Micavibrio sp. TMED27 TaxID=1986607 RepID=A0A1Z8PZI4_9PROT\nMIKAFWFAIKVGLVVAIAIWIAERPGFVRIEWLDYVATIQMGFFLLLCVIAILISIFVYRVIAAIVNFPKTYQRYLEVRGYEKGVRALTLGMAAVAAGDEKIAVYQAHRATKLMPEDTGLTNLLTAQAARLDGREDDAVRAFARLLENKEASFLGVRGLLQAAIDKGDYETAKNLVDRALGLYPKQGWILKTAFDVYVRAEDYTEARVLLKRAAKAGTVKSETLHSDLAALYLAEALQDFEAARNERGIKLIKQALKKSKDFIPASVALIQYYIDNNDISSASKLLKKYWRREAHDLYVPQWLSIYKGASSEDKLKHMQSLLKINEKNAVACMETGKAALESSLWGEARKYFEKAESIEPTASLYRSYAQLEELSIHDEAAARTWLEKAINAPVERQWVCQETGRLYTQWKPIAQPHGAFNSMIWGRSTDLQSDNALLIHSGQSTMQGLVHAV\n>UniRef90_UPI001FFBE095 hypothetical protein n=3 Tax=unclassified Bradyrhizobium TaxID=2631580 RepID=UPI001FFBE095\nMEKTTMRLAQKFWLVFLALGAAIAVQGAPASAQQRLEGQVLLAGEPVVSATVTLWTAGADQPRQVTQTQTGADGRFALSTPPGAGNAPTYLVAKGGTAGGAANTGVNNAIALMVLLGDPLPRAVTVNELTTVASAFAAAQFIKGEAISGNPLGMRIAAGNVPNLVDPATGQWGKVLLDPLNSTRTTTLANLNTLGSLITAFATTTNEDWRARFLKAATVPGGATPKNVIEAMTGIARKPWAQPKELYALFDEAYPQPKDGARRKAPFVPYLAYVPDDFVLSLCFAGGGVYSAGRLMFDAESNLWSGQNWMAGSQSGVNQSIGGGVVKLSPNGTALSPPITGFTGMGIDGVGWGTAVTKDKVWLTSFNGKILVLDFDGHPIGTESDFPFKEKFLGLMGIGVAANGDVWIADGSDNQLLHFPGGRVTDGRIVKVGGLKSPFDIVIDAQNRVWVSNSQSDKVVRFPADDPSKAESFRAGIGVRALALDSKSNVWVASNMSLDFPPPVIPDGASIMEQFKIAAGHMLKVLETNPHMVTGVVNMIRPDGSQPAPTGFTGDKAVSVPWGLNIDGNDDVWIGNFWGRGVVLMAGDNTKGHPAGTKMGDAIHVFKGGSIQMLTDVSIDPAGNVWAANNWNDLNGAASPDPTRPTSTWGGGSGITVIYGVAAPVQPPRMGMVRKP\n>UniRef90_UPI0019539C4C hypothetical protein n=1 Tax=Serratia marcescens TaxID=615 RepID=UPI0019539C4C\nDVGGRKFEMSDMAYVIRGLGYIKSKEDVENISLGQYNGIPVRVKDLGNVQMGGDLRLGIFDQNGNGEVVGGIV\n>UniRef90_I3SW78 F-box/LRR protein n=7 Tax=Trifolieae TaxID=163742 
RepID=I3SW78_MEDTR\nMSSNSTSEDVISALCINEALTDDELRSILAKVDSEKDKETFGLVCKRWLRLQSTERKKLSARAGPHMLRKMADRFTRLVELDLAQSISRSFYPGVTDSDLAVIANGFRCLRILNLHNCKGITDVGMKAIGDGLSLLHSLDVSYCRKLTDKGLSAVAKGCCDLRILHLTGCRFVTDSILEALSKNCRNLEELVLQGCTSITDNGLMSLASGCQRIKFLDINKCSTVSDVGVSSICNACSSSLKTLKLLDCYRIGDKSILSLAKFCDNLETLIIGGCRDVSNDAIKLLATACRNKLKNLRMDWCLNVSDSSLSCILSQCRNLEALDIGCCEEVTDTAFHHISNEEPGLSLKILKVSNCPKITVVGIGILLGKCSYLEYLDVRSCPHITKAGLDEAGLHLPDFCKVNFNGSINEPAVLL\n>UniRef90_UPI001F28D147 RimK-like ATPgrasp N-terminal domain-containing protein n=1 Tax=Thiomicrorhabdus immobilis TaxID=2791037 RepID=UPI001F28D147\nMSHFYVVVDSLTDWKPYYSSQDVITFDDYLERVNDRSKKRIRVINLCRDYRYLKTGYYCSLLAEARGHHVLPSLMTINDLGRKSLSSIQLTDTSQLVNRLPLGNEGEQLTFRCWFGKTLNPALAKLAAKLFEKFPTPLLEITLQFKQHWQVKQVKGVSLKALVDPAEQEAFAETFEKFSLQMWRKSKTRKAYRYDLAILVNPDDPLPPSDDAALKQFKKAANQLGIATEFITRKDYMRLAEFDGLFIRETTSVEDHTYQFAKKAEAEGLMVIDDALSILRCTNKIYLADLLNTHKIPTPKTVIINQPSEQALLKLENEIGFPMVLKIPDGSFSRGVVKVENAEELTEQAKILLKQSVMLLAQEYMYTQYDWRIGILNNKPLFACRYYMVDDHWQIYKHESQDTQSGGFETLPTFEAPKAVIDIALKAAKLIGNGFYGVDIKQSGDRVVIIEVNDNPSIDSGVEDKYLGEELYHEIMKDFLLRMESLGR\n>UniRef90_A5W1W3 Antibiotic biosynthesis monooxygenase n=32 Tax=Proteobacteria TaxID=1224 RepID=A5W1W3_PSEP1\nMVKVALFVRLKAKPGKEKDVESFLLGGLPLVEEEPATTAWFGIRLGPSTFGIFDAFPDEAGRQAHLSGKVAAALMANAAELFAEPPSIEKVDVLAAKLPS\n>UniRef90_A0A167MC44 Ribosomal RNA-processing protein 43 n=4 Tax=Cordycipitaceae TaxID=474943 RepID=A0A167MC44_CORFA\nMPEVGLSRATFAKLSPHPYLLANLEPSNQDIPPARSNGRAPDEARTPEVNLSSLSHAHGSSLVRIGDTTAICGVRGETILTANIPNYRASNAASELRDYDLLVPNIELATGSSPQNLPGGPPSTLAQTLSTRVYSLLHSSQLLDAADFRIWHTQTADLTAADDEEMQDADADADGEDQAQFNNERQVIAYWVLYIDIFFISLDGNQFDAAWAATLAALRDTKLPRARYDPDSELIVCSRKDPKPLSLNGFPIACTAAVFTGKETDRPTEGKYWVLVDPDTLEESLCDESLTVVADCSGGTTSLLSVSKHGGTVLTPKHLRSKQLLGFVEKRWKGFADAMSV\n>UniRef90_A0A1V6I1U0 TonB-dependent Receptor Plug Domain protein n=1 Tax=Bacteroidetes bacterium ADurb.Bin035 TaxID=1852799 
RepID=A0A1V6I1U0_9BACT\nMKKQKILLIIMLIFNISLSSQITINGKVIDRDSQKPLSFANIKIAGTFLGTVSGNDGSFSLQVKSLPVTLIISFIGYQTDTIVVNENQFLTIYLAPKSILTDEITVTAIRLDDNSPKNFTNLSIEKIQSLKTGQDLPLILNFTPSVVATSDAGNGVGYSDIRIRGTDITRINVTINGVPYNDPESQGVFWVDIPDIASSADNIQIQRGVGTSSFGTASFGASINILTGVMKNDPFVELQTNGGSFNTWGASAKFATGLIKDNWYLEGRLSHQYSDGYIDRAWSNLNSTYLSGGYYGKNTIVKGLFMAGIEKTYQAWGGVPKEYLDDPILRRYNPYTYENETDNYWQYHYHLNVTQKINDKNTLNATLFYIDGLGYYEQYKDNKKLSNYNIPPVILIDTTSNDTIMINSMDIIQRKYLENDFYGAIMSHIFDNNKNLKIRTGLNLYQYDGWHYGKIIWMQYAHNTPINYEWYRNKSIKKEFSLFTKIDYAINEYFNLFTDLQYRYIDFAIKGTDDAFISDTLTKYYNFFNPKLGLVYKISKKDELYLLLGMSHREPNRDNLMLINEDSLKPVPETLYDLELGYSRYFSKGIVNINTFYMYYDNQLVLTGKINDVGDPIMQNVPTSYRAGVELIWNFNFTKWLSWDANCTFSENKIKKMKIYIDDYDLWPQQRIYQVENRPISFSPSIVASSILTFKPISNLSVSIQSKYVSKQYIDNTGDEECVIDPFFVNNIRLDYCIKGKKFDKINLFVNFNNIFNEYYETNAWVYRYYEAGNEYKDFGYFPQATFNVLAGLNFYW\n>UniRef90_UPI0019146668 MarR family transcriptional regulator n=1 Tax=unclassified Pseudomonas TaxID=196821 RepID=UPI0019146668\nMNPELQLAAPYLPALASYIETVLGDSPTFSGWDQTSRLPYYLNSSYFILQMTLLGQTCIVLLENQQRSVSLPDVKKHMDALRQLTESPLVFVTETLASYERKRLIERGVQFIVPGNQLFIPELGLDLREYFRARQEKTEFMSPATQAMVIHLLMNDWKHSLQLSQATLGQPFKYSKMTISRAVKELKGLGLITVEADKQQHIEIHVPARQLWQNARKHMRSPVKRTLWLNRVPLLDGQPLLLAGESALARQTLLVEPWLAIYACSSETLNALQNAAEPITEVAPEEAACALQIWSYDPTVYAWAVPYVDPFSLILSLQDSKDERIQIGLSQLEGDMKW\n>UniRef90_A0A7C6YG77 Uncharacterized protein n=1 Tax=Actinomycetales bacterium TaxID=1911520 RepID=A0A7C6YG77_9ACTO\nMNEYVEYPASAEAACRSTYKPASRLPGPGHEERLALSSPAVSSGA\n>UniRef90_A0A8J7E1C9 Glutamine-dependent NAD(+) synthetase n=1 Tax=Nodosilinea sp. 
LEGE 07088 TaxID=2777968 RepID=A0A8J7E1C9_9CYAN\nMKFAIAQLNPTIGDLAHNAQQVLNAARQADQLGAQILVTTELVLCGYPPRDLLLRPSFIQAMAQTLEDLALALPPHLAVLVGYAAANPKARYSGEKPLFNSTALLQGGQVQQVFHKQLLPTYDVFDEDRYFAPGQGPSSFTLPCGDWGIRVGVTICEDLWNDEEFWGGRSYARNPIADLAGDGVDLVINLSASPYSLHKAQLRSAMLAHSAARFRCPILYANQVGANDDLIFDGASLAFDRQGELVARLPAFQAGLAVVDYDPVKGDLTPGEVAPLPTDDNEALWSALVLGVRDYTHKCGFAQAVIGLSGGIDSALVAAIAAAALGPDNVLGVLMPSPYSSAHSVSDALALAQALGIAHQTLAIGPLMADYDQVLDPLFADTSPGIAEENIQSRIRGNLLMAISNKFGHLLLSTGNKSEMAVGYCTLYGDMNGGLAVIADVPKTRVYALCQWLNQQVGQGSNGAIAPVTLGTLATRVSAQGLIPQNILDKPPSAELKPGQVDQDSLPPYDVLDDILDRLVQRHESIADMVAAGHDAAVVEKVLRLVSRAEFKRRQAPPVLKVTDRAFGMGWRMPIANRWRSEAAVHPLTAEQLLEA\n>UniRef90_L2GXC0 SWIM-type domain-containing protein n=1 Tax=Vavraia culicis (isolate floridensis) TaxID=948595 RepID=L2GXC0_VAVCU\nMHFHTLEMLVMVVIFVHADLLKLKSVCKCAEEGSYQCQNVNNPNVKGNGGTTRKACITDDLYAGIFADVVGKDGLTDSHPRTDNAAHSQIMGCSSAPCPCDELLSDEMVEDASNLMRKSYQQNVEHSSCRIAARGDSPNNEEKLNVSDQPVCTRIGVEKECDQDNEENNDENAYWFGSYISSAIQNGCRTVSSIVEEVFSMFQGCGLWIDPSDERNEEFIDEAIDNMSESGNGTDNELKKAGKLLARTCKCFIREFFWCTIGLCDKISGVIGKRKVKYRDANIGSDKNKDKYSNLERTCTCEAYIKRAACRHGSGLKGKKGKAVEHVSDSIYCEFMRAFEQEKHGLTMQELIERVASRGEHRGTQIVDSKKCFNGCDEVQDVTKRSNFYETVELAIKMVSLMGVLLFMVALVATVLHHWTK\n>UniRef90_A0A3D1CV37 Single-stranded DNA-binding protein n=1 Tax=Candidatus Pacebacteria bacterium TaxID=2053589 RepID=A0A3D1CV37_9BACT\nMSVRSLNKVMLIGNLTRDPNLRFTPTGTAVCSFGIATNRAWTPSDGGEKQERVDFHNIVSWAKLAEICGQLLHKGDKVYLEGRIQTRDWKTEEGVEKRITEIIIDNMMLLSNGRGGAMGGNDQDGAGEDLGQTAPTPVSATTTRAKTKPAAKTDNEVEVVEDVSDDIPF\n>UniRef90_W0ZCU4 Geranylgeranyl pyrophosphate synthase n=2 Tax=Microbacterium TaxID=33882 RepID=W0ZCU4_9MICO\nMQGSPDAIQAVSQRLERFVSARVDEAADAGPLARPILELSAATLQGGKRLRAAFCYWGWRSVTDATGTDEIVAAAAALEVFHAAALVHDDIIDNSDTRRGHPATHRAFEGAHLAGGWTGDAAAYGRSSAILAGDLLVAWSDDLFEEGIADAPADRARAARRRYAEMRRDVTVGQYLDIAAETVPAPDAEQLGRALHVASFKSARYSVQQPLLIGAAIGGGSTEQQEALRDFGHPIGMAFQLRDDVLGVFGDSAATGKPSGDDLREGKRTALIAFARQELPASVRRTLDELLGDPDLEDTQVRMLQDTIRDSGALDRVEDLIASYTREADRALSGAPLDNASVGALRDLARAAVHRVA\n>UniRef90_A0A1I9RWB5 
Major capsid protein (Fragment) n=1 Tax=Feline calicivirus TaxID=11978 RepID=A0A1I9RWB5_9CALI\nWSTPRFRPITINISVSNGAKLGXGVATDYIVPGIPDGWPDTTIAEKLTPAGDYSITTXSGNDITTAAEYDKADVVKNTTNFRGMYICGSLQRAWGDKKISNTAFITTGTVDNNNIKPSNTIDQXKIAVFQDTHAXXSVQT\n>UniRef90_A0A7S1QBK8 Pentapeptide repeat-containing protein n=1 Tax=Neobodo designis TaxID=312471 RepID=A0A7S1QBK8_NEODS\nAPEHAVALDTVRTALSAPSHTALIEDALEGRPLRGVDLSALPKDVQCSVRRVDLRDASVVGCSFFAGANFDLADCRRTDFTGSQFRDISFAGATLRGAKLQRCTFKHCVFRRCDIRDADLCGATFVGCDFTLCDMSGCTTSGDTTFFEPQSWWRSRREEWRGTKPFVNLDAEEATQQMAARDDSRSRPRGGRPRNTPRRGKTWTKKISTKR\n>UniRef90_UPI001F4247D0 hypothetical protein n=1 Tax=Xanthomonas citri TaxID=346 RepID=UPI001F4247D0\nMFGEGAEIRFAYQSFKWANLAAKNAGVSVAIIGLTRRNGGTKQIFIANEDGVVTVRTVSNISPYLVPGDNVLVSPRSKVPDERAPMQFGNHPYYANELMLSLDEASGMVGEDARVAEFIRPLYGSRESISGTPRTCLWITDENLALAQEIPAVWARVEKVRKDRKTKTKDVQAKKLVETPWRFRDQYEAESSLLVVPIVSSENRPYLPVVLLSKEAIVHNKAFALYDAPLWNFALIVSKMHLVWVAAVCVRLEMRYSYSNTLGWNTFPVPTLTEQNKADLTRCAEDILLARESHYPATIADLYGPDNMPDDLLRAHERNDEVLERIYIGRRFRNDTERLEKLFDLYTKMTAGQGKPKKKAKK\n>UniRef90_A0A3C0QT04 Magnesium chelatase n=1 Tax=Ruminococcus sp. 
TaxID=41978 RepID=A0A3C0QT04_9FIRM\nMIQTFAEKLHNSMAKAIVGKDDVIDRVIAALLCRGHILLDDIPGTGKTTLAKALASSIGCHHSRIQFTPDLLPSDVTGIHWFNQKTQEFTFRKGAVFTNILLADEINRTTPRTQSALLECMQERQVTLDGETMSLAEPFFVIATQNPIETQGTYPLPEAQLDRFFICLHLGYPEKEAERLILTGASQTISEPVCTVEELIQAQNAVENVLVSEPILEYLLAIAEKTRKDRTTIIGLSTRGLQALQLCSKAWAGMQGRNYVIPEDVQAVAPEIIAHRLIMKGGERLQRMEFRHESALRMVEEVSVPVE\n>UniRef90_UPI000A359F7A tubulin polyglutamylase TTLL5 isoform X13 n=1 Tax=Heterocephalus glaber TaxID=10181 RepID=UPI000A359F7A\nMPVVMARDLEETESSSEDEEVVSQEDHPCIMWTGGCRRIPVLVFHAEAILTKDNNIRVIGERYHLSYKIVRTDSRLVRNILTAHGFHEVHPSSTDYNLMWTGSHLKPFLLRTLSEAQKVNHFPRSYELTRKDRLYKNIVRMQHTHGFKAFHILPQTFLLPAEYAEFCNSYSKDRGPWIVKPVASSRGRGVYLINSPNQISLEENILVSRYINNPLLIDDFKFDVRLYVLVTSYDPLVIYLYEEGLARFATVRYDQGAKNIRNQFMHLTNYSVNKKSGDYVSCDDPEVEDYGNKWSMSAMLRYLKQEGRDTTALMAHVEDLIIKTIISAELAIATACKTFVPYRSSCFELYGFDVLIDSTLKPWLLEVNLSPSLACDAPLDLKIKASMISDMFTVVGFVCQDPAQRAATRPIYPTFESSRRKPIQKPQRSRPLSASDAEMKNLVGPPREKMSEKLGGSVLGLSMEEIKVLRRVKEENDRRGGFIRIFPTSETWEIYGSYLEHRTSMNYMLATRLFQDRGNTRRSLLTGRTRETRGLVKFQDYCHIRLKMTTDGMPELKVESVNSKAKLHAALYERKLLSLEVRKHRRRSGRLRALKPKYPVITQPAEMNGKTEAESEEEEEEVALDNEDEEQEASQEESAESLAENQGKFAPPLTIGIENLPKENSMEVPVWNNKGEQGCKIETQEPEPNFNLMQILQDNGNLSKVQARIAFSAYLQHVQTRLMKASGGQTFSASWAAKEDEQMELVVRFLKRASSNLQHSLRMVLPSRRLALLERRRILAHQLGDFIVVYNKETEQMAEKKSKKKFEEEEEDGVNAENFQKFIRQASEAELEEVLTFYTQKNKSAGVFLGTHSKSSKHSQTLSDNGAKGDHPEMIEEVKIKQPKHQQATEILSDKLSPSLCHPNKHHSGVAKAQKEGEDGSLYSKRYNQSMVTAELQRLAEKQAARQYSPASHITLLTQQAANLNMASGAINRSSASTPPSLRPVISPSGPAWSIQCDPHAPESHSSPPGSRRLQAGGFAWEGEIENNAYSKATGVVPQHKYLPTAGSYQLHFALQHLEQQKLQSRQLLDQGRARHQAIFGSQILPNSNLWTMNNATGCRISGATASGQKPTTLPQKVVPPPSSSTSLVPKPPTNHKQVLKKATSQRASKGSCEEGQLSELQSSLNTTAFVPLPSSTDHLSSFQKGMRQETRTPNPWLDHLPKGTRELKTTRVL\n>UniRef90_UPI0016748451 MarR family transcriptional regulator n=1 Tax=Streptomyces xantholiticus TaxID=68285 RepID=UPI0016748451\nMPDLSHGATDADVAAVNSLRSAVMRLGRRLKHQRVDETLSPTEMSVLGTLATCGSATPGELARKEHVQPPSMTRIVALLEAKGLVRLEPHPADRRQKVVTQTEQAETMLEESRRKRNAWLATLAEGLDDEEWAKLRAAAPVLEKLAHLQ\n>UniRef90_UPI0003C1277F 
tubulin polyglutamylase complex subunit 2 n=1 Tax=Latimeria chalumnae TaxID=7897 RepID=UPI0003C1277F\nMDDNENSSISGFLDRLTLGVTKILETRPGVTEVKFFEKEPVERHVIISWEQRNCCTLPEDLKNFYLMTDGFHITWNVKFDDVPMQLGSMVINSILKLCRLKGSSVYALPHAPTLAILESDSDEEANESQPEKPHFDSRSRLFELDSCGGHGKVCLVYRNAKP\n>UniRef90_A0A6J1YNG1 Voltage-dependent P/Q-type calcium channel subunit alpha n=1 Tax=Acinonyx jubatus TaxID=32536 RepID=A0A6J1YNG1_ACIJB\nMWKASRVPDPMFSPRSYDALHDGGRGPPAADGTAGAPQDARGPRMSGPCPGPPLKRRGGVVDHRDVILAHQAHKIHSTPQARRKEWEMARFGDEMPARYGGGGSGAAAGVVVGAGGGRGAGGSRQGGQPGAQRMYKQSMAQRARTMALYNPIPVRQNCLTVNRSLFLFSEDNVVRKYAKKITEWPPFEYMILATIIANCIVLALEQHLPDDDKTPMSERLDDTEPYFIGIFCFEAGIKIIALGFAFHKGSYLRNGWNVMDFVVVLTGILATVGTEFDLRTLRAVRVLRPLKLVSGIPSLQVVLKSIMKAMIPLLQIGLLLFFAILIFAIIGLEFYMGKFHTTCFEEGTDDIQGESPAPCGTEEPARTCPNGTKCQPYWEGPNNGITQFDNILFAVLTVFQCITMEGWTDLLYNSNDASGNTWNWLYFIPLIIIGSFFMLNLVLGVLSGEFAKERERVENRRAFLKLRRQQQIERELNGYMEWISKAEEVILAEDETDGEQRHPFDVGALRRATIKKSKTDLLNPEEAEDQLADIASVGSPFARASIKSAKLENSTFFHKKERRMRFYIRRMVKTQAFYWTVLSLVALNTLCVAIVHYNQPEWLSDFLYYAEFIFLGLFMSEMFIKMYGLGTRPYFHSSFNCFDCGVIIGSIFEVIWAVIKPGTSFGISVLRALRLLRIFKVTKYWASLRNLVVSLLNSMKSIISLLFLLFLFIVVFALLGMQLFGGQFNFDEGTPPTNFDTFPAAIMTVFQILTGEDWNEVMYDGIKSQGGVQGGMVFSIYFIVLTLFGNYTLLNVFLAIAVDNLANAQELTKDEQEEEEAANQKLALQKAKEVAEVSPLSAANMSIAVKEQQKNQKPTKSVWEQRTSEMRKQNLLASREALYNEMDPDERWKASYARHLRPDMKTHLDRPLVVDPQENRNNNTNKSRAAEPTVDQRLGQQRAEDFLRKQARYHDRARDPSGSMGLDPRRPWAGSQEAELSREGPYGRESDHHAREGGLEQPGFWEGEAERGKAGDPHRRHAHRQGGSRESRSGSPRTGADGEPRRHRAHRRPGEEGAEDKAERRSRHREGSRPARGGEGGEGDGPEGGERRRRHRHGPPASYEADAARREDRERRHRRRKENQGSGVPVSGPNLSTTRPIQQDLGRQDPPLAEDIDNMRNNKLATAGSAGAHDSLGRPGLPQSPSRTGNSTDPGPAPAPPAVAANPQNAAGRRAPNNPGDPSDPGPPKTPENSLIVTNPSSTQTNSAKTARKPDHTTVDIPPACPPPLNHTVVQVNKNANPDPLPKKEEEKKEEEEDDPGEDGPKPMPPYSSMFILSTTNPLRRLCHYILNLRYFEMCILMVIAMSSIALAAEDPVQPNAPRNNVLRYFDYVFTGVFTFEMVIKMIDLGLVLHQGAYFRDLWNILDFIVVSGALVAFAFTGNSKGKDINTIKSLRVLRVLRPLKTIKRLPKLKAVFDCVVNSLKNVFNILIVYMLFMFIFAVVAVQLFKGKFFHCTDESKEFEKDCRGKYLLYEKNEVKARDRQWKKYEFHYDNVLWALLTLFTVSTGEGWPQVLKHSVDATFENQGPSPGYRMEMSIFYVVYFVVFPFFFVNI
FVALIIITFQEQGDKMMEEYSLEKNERACIDFAISAKPLTRHMPQNKQSFQYRMWQFVVSPPFEYTIMAMIALNTIVLMMKFYGASVAYENALRVFNIVFTSLFSLECLLKVMAFGILNYFRDAWNIFDFVTVLGSITDILVTEFGNPNNFINLSFLRLFRAARLIKLLRQGYTIRILLWTFVQSFKALPYVCLLIAMLFFIYAIIGMQVFGNIGIDVEDEDSDEDEFQITEHNNFRTFFQALMLLFRSATGEAWHNIMLSCLSGKPCDKNSGILTPECGNEFAYFYFVSFIFLCSFLMLNLFVAVIMDNFEYLTRDSSILGPHHLDEYVRVWAEYDPAACGRIHYKDMYSLLRVISPPLGLGKKCPHRVACKRLLRMDLPVADDNTVHFNSTLMALIRTALDIKIAKGGADKQQMDAELRKEMMAIWPNLSQKTLDLLVTPHKSTDLTVGKIYAAMMIMEYYRQSKAKKLQALREEQNRTPLMFQRMEPPSPTQEGGPGQNALPSSQLDPGGGLLAHESSMKESPSWVTQRAQEMFQKTGTWSPERGPPTDMPNSQPNSQSVEMREMGRDGYSDSEHYVPMEGQARAASMPRLPAENQRRRGRPRGNNLSTISDTSPMKRSASVLGPKARRLDDYSLERVPPEDTQHHHQRRRDRGHRASERSLGRYTDVDTGLGTDLSMTTQSGDLPSKERDQERGRPKDRKHRQHHHHHHHHHPPPSDKERYAQERPDHGRARARDQRWSRSPSEGREHMAHRQGSSSVSGSPAPSTSGTSTPRRGRRQLPQTPSTPRPHVSYSPVIRKAGGSGPPQQQQQQQPAARPGRAAPSGPRRYPGPAAEPLAGERPPAGGHGSSRSPAMERRGPGPARSESPRACRHGGARWPASEGPPGPRHHGYYRGSDYDEADGPGGGGGEEPRAAAYDAPPPARRACSPRTPRAPGPAACASPSRHGRRLPNGYYLAHGPARPRGPGPRRGLHEAYSETDDDDWC\n>UniRef90_A0A7W4JVT6 Chromosome segregation protein SMC n=1 Tax=Gluconacetobacter azotocaptans TaxID=142834 RepID=A0A7W4JVT6_9PROT\nAAEAAERARAAARRALDRVEAHIALGRLERERHDEATRLDRLEHAEAEVARAGLRLAACTMDDARMAAIRQAERAVQTARAASRAQATVLNVVLEDGAEGRLVLDGRVLQTGSVDLTDSATLRIDGVGTIRIEPASGDRARLRAELTAAEDALRRMLNQAGCADPDAAETALAQRRQADLALNAARSVLSHLLPGTQDVAAAMAEARRRVAALDERIARQAASLAHGPNPADAAGGEPGVDVAATHDAALRAMQAADARAADARQALFAPDETLRQAAADLAGVRAEEQSAREAAARLVRDMAAARTAEADDVLSARQETARAALAQAGQAVQRAEAARPEGTEALADAAIRRQERLIQDGQARLGTLRQDMAALEARIRAAEGDGLDERIAGQERLRESCAAECAVCTREVKILHCLRDTLTAAERAATERYLAPLCRAIQPALAALFPRAGVTMEADFSVSRLTRRMDEPFDTLSDGTREQIAVLVRLGLADLLRARGRPAMLVLDDALTYSDAGRLERLFDILTDAADRMQILVLTCRAELFTGLGARPLTVEAVDKVQ\n>UniRef90_A0A327SST6 Ferredoxin-NADP reductase n=2 Tax=unclassified Kitasatospora TaxID=2633591 
RepID=A0A327SST6_9ACTN\nMDLETPPPDLYGRPRADRFFARLTAFGDRYSPALGRPGLRRSPRRPEARPVPPLHLVVVSHRVVAEDVAELRLADPSGGMLPPWQPGARIVLTLPSGRARHYSLCGDPADRHAYRIAVRRIADGGGGSVEVHDDLHVGVRLRVRRPRNGFAFCGEEKVLFLAGGIGVTPLLPMARAARQAGLDWRLVHTGRTAAALPFTDELRALDPARVTVRTDDEHGLPDAAELLAHAPRGAAVYVCGPAPMLLAVQRALPGSPAAALHFERFGAAPIRDGHPFGIRIDGRTLTVPADRSALDVAREVRPDLPYSCRQGFCGTCVLKATGGTPEHRDRRLTAEQRAAGLILPCVTRAAAGETLVLEV\n>UniRef90_UPI0002D87B73 type II secretion system minor pseudopilin GspI n=3 Tax=unclassified Sphingomonas TaxID=196159 RepID=UPI0002D87B73\nMPDRMRPDERGFTLIEMMVALAVFSLAALALIRLEGATIRGATTLDTTLMAQIVARNVAYTAMTDGRAPTIGAASGIEQNGGRSWAWTRVVQPTGDARILRIDVTVLDPGGRRAGHLTVVRDGATRP\n>UniRef90_UPI000FEB7CF9 aspartate-semialdehyde dehydrogenase n=1 Tax=Streptomyces cavernae TaxID=2259034 RepID=UPI000FEB7CF9\nMAQARSGRPTLAVVGATGAVGTVMLQILSQHADIWGEIRLIASPRSVGRKLTVRGEEVEVVALAEAAFDGIDVAMFDVPDEVALKWAPVAAGRGAVVIDNSGAFRMDPDVPLVVPEVNPHRARVRPRGIVASPNCTTLSMIVALGALHAEFGLRELVVTAFQAVSGAGHAGVIALRRQLSLVAGTELGTSPGDLRRAVGDDTGPFPEPVALNVVPWAGSLHENGWSSEEMKVRDESRKILGLPHLPVAATCVRVPVVTTHSLTVHARFEGDVSVDGAREILATAPGVVLFDDPAAGEFPTPADAVGTDPTWVGRVRRALDDPTALELFVCGDNLRKGAALNTAQIAELVAEELTGR\n>UniRef90_A0A7X3VZR8 Xanthine dehydrogenase family protein molybdopterin-binding subunit n=3 Tax=Dehalococcoidia bacterium TaxID=2026734 
RepID=A0A7X3VZR8_9CHLR\nMTTTEREETKFKVVGTRPVRHDGIEKVTGQALFGADIDLNGLLHGKVLRSPHAHARVVSIDTNRAESLPGVHAVITGDDLTPAGPMERGGGNRTDAILAQGKVLYKGHPVAAVAANSPHVAEEAITLIDVTYEPLPSVTNVEDAVAPSAPVLHEGWDDPSNGVPSSELDSPNAASLERHVRGDLEAGFAEADLVVEREFRTKTVHQGYIEPQNGTASWSPEGRLTIWCSSQGHFGIRDAVAELLDIPVSQLKVVPMEIGGGFGGKLTAYLEPLAAVLSKKSLRPVKMTMTRAEVLEASGPTAGSHVKVKIGVTNEGRITAASGKFLFEGGAFGGGPVAPACAAIFAPYNLENVRIDGYDIVTNKPSTRAYRAPGAPIVAYAVESVMDEIAEMLDIDPMEFRLLNVAREGIRRADGVMNGRIGAAEVMEAVRSHPHYVAPRDGANHGRGVAMGFCRNNTGPACVIANVQDDGRISLIEGSVDIGGSRTVIAQQLAEVLGIPVEDVNPSIGDTDSIGFTSNTGGSGAAFKSGWAAHEAARDIIAQLTERAALIWDVSPEQVRYEDGGVEHVSDTELRMSFREIAGMLPDSGGPVVGRANLNPVGQSGSYSANIVDVEVDPDTGKVDILRYTAFQDVGFAIHPSYVEGQIQGGTAQGIGWALNEEYFMSDDGAMLNTSLLDYRMPTTLDLPMIETVLVEVNNPGHPFGVRGVGEANISPPMAALANAIHDATGLRLRELPMNPQAVSKAIQEKAG\n>UniRef90_A0A6G4ZTC8 Sodium:solute symporter family protein (Fragment) n=1 Tax=Chlamydiae bacterium TaxID=2081524 RepID=A0A6G4ZTC8_9BACT\nMFLDLFFAGLFLAGLYFFGIRKSEKVQTESAYLIADRKIGLFPLTATLVMTEFNTATLISFSSLGYLAGKRALSLPLVFLIGLLFYAVSVAKKWKGFDGISVASYFSKRYGRDIGIIASIALFMAMSGFSAVYVKSLLLLFSPFFPSIEPWVLSGVLVALVLVMILRGGLLSIIRTDVFSFIVILGFFPLVALFAFKTPLGTPHEMIDVSSHLPVRFVISLVVLTMFTYILAPWYGQKIFAAKSQKTAFLSVFFAAIIVFVLYGLAVMSTWFLRKNGAEVSNPEQAFPMAMMLTLPSGLKGLGYAILFAASATTLSGVWSAMCSLAVGDFLKAKNSYKRSMGLTLMFALLSFVLANVLVDKVLDKLILANIPIAALSFALLAGFYWKRTSRFGVYLSMFVGWVCGIGSYLYFGEAGGYTWYWAMWGIPAT\n>UniRef90_A0A7G9G4R0 Ribosome assembly RNA-binding protein YhbY n=2 Tax=Lachnospiraceae TaxID=186803 RepID=A0A7G9G4R0_9FIRM\nMNSRQRAYLKSLAMTIDPVMQIGKSSLTPEITEAVSEALEARELVKVNVLKNCLDDPRMIAEALAERTRSQVVQVIGKKIVLYRESKTKKKLELPK\n>UniRef90_P59908 Photosystem II protein Y n=4 Tax=Bacteria TaxID=2 RepID=PSBY_PARMW\nMLGIDARLFLVVAPILAAVSWAAFNIGRAAVGQLQLLIKRSRA\n>UniRef90_A0A645HJN1 CN hydrolase domain-containing protein n=1 Tax=bioreactor metagenome TaxID=1076179 RepID=A0A645HJN1_9ZZZZ\nMGDGIQFWGQSFIAGTSGEILAKASADKEENLLVNLDLAEVDATRTHWPFLRDRRIDAYGDLTRRLID\n>UniRef90_A0A3A4YZV3 Sulfurtransferase TusA family protein n=5 Tax=Deltaproteobacteria TaxID=28221 
RepID=A0A3A4YZV3_9DELT\nMTDITPNETLDCRGLSCPMPILKTKKTIGNMKSGQILEILGTDPGTRNDLPAFAKRSGHEYLGEKQDEGFSRFYIKVK\n>UniRef90_A0A4U5NX06 Peptidase S1 domain-containing protein n=1 Tax=Steinernema carpocapsae TaxID=34508 RepID=A0A4U5NX06_STECR\nMGAVHLFAVFGLLALVEAKELKLVSCFFTFQNVNRAVFSSTTASKVPFCARLELTKEPFKGQFRHIACSTLTSQFIFTSAHCVTFTANGAVFVGITDMATAFNDPNKQFVDFTPTDVIIHPEFSHKKGNGIALVKVRSL\n>UniRef90_UPI0020216C25 phage major capsid protein, P2 family n=1 Tax=Halomonas sp. ATCHA TaxID=2945104 RepID=UPI0020216C25\nMRKDTRIAYNRLLDRIAQLSGVPSAKEQFAIEPSVQQTLESKIQESSEFLSSVNIIGVDELKGQKLGLGVTGPIASRTDTTQKDRTTSDVSSLESHDYECVATEFDTHITWAKLDAWAKFPDFQTRVRNAIVRQQALDRIMVGLNGTTAAAETDRVANPLLQDVNIGWLQQYRTHAPARVLSEGANAGEVRVGPSGDYENLDALVYDVVNEMLDPWFRESTDIRAICGRKILADKYFPLINQEQAPTEQRALDMILSQKRMGGQQAARVPFMPDGTLLITPPENLSLYWQNGSRRRYLEDNPKRNRIENYESSNDAYVIEDYGFGCLVENIVFGDWSV\n>UniRef90_A0A3M1UPZ1 Chain-length determining protein n=1 Tax=Gammaproteobacteria bacterium TaxID=1913989 RepID=A0A3M1UPZ1_9GAMM\nMHELYEQLLTQLRGIWRFRWVIPTVAWVLFVAAAVVILRLPDEYRATATVYVDTHSILRPLLRGLAVTGNAEQRVRIMTKTLLTRPNLEKLMRMTDLDVKAATPAEREDLLDSLAARIRVESSRRGENLYKLSFEDPDRKLARKVVQALVSIFVEGLLGQSREDTDTAQKFLDRQLAAYAQRLNEAEKALADFKRKHVGMMPGEGKDYYASLKEEEEKLETARLQLRELENRRRVQRRQLAHLDEEESLFDLDPAEGGSLATPYDARIEALHQRLDELLLRFTDRHPDVIETRRLLAELEAKRKAFLAQARQEHKATGGSDPVRAQLQVLLSETESQIAALRTRVKAYEARVEKLRKMVDTIPKVEAQLKQLTRDYEVYKQQYEALLARRQQADISEKAEVSADDVKFRVVDPPHVPLTPSGPPRLLYLGLAVLGSLAAGVGLALLLHLLRPTFQDVRQLRDTLHLPVFGSVSIAVTDEIRRKRRMEMLSFGTIVLLLFGFYGMALFAELFQLGIIRQLHLHP\n>UniRef90_A0A1T4V4Z1 Arabinogalactan endo-beta-1,4-galactanase n=2 Tax=Eubacterium TaxID=1730 
RepID=A0A1T4V4Z1_9FIRM\nMKKRSLQKVISTILCTAMVASLTSCSIGKGGKSEKPKETGIFADIVNPELSDKHKGDAVESSVLVNKVEGLSEGFIKGMDISSLIAEEQSGVKYHDKDGNEADLLKILKDSGYNYVRVRVWNDPYDANGNGYGGGNNDIDKCVEIGKRATENGIKTLVDFHYSDFWADPNKQSAPKAWANMGIEEKEKAIYEYTKESLNKLKTAGVDVGMVQLGNETNAWLCGEINWINITTLMNSAAKAIREVDKNIIIAVHFADPSSQERYKNYLQILQNFEVDYDVFGTSYYPYWHGSLENLTEILKFAAETYNKKVMVMETSWAYTPDDLDGHGNTIGAGANVVKNYSYTLQGQVEVINDVVQAVVNVGDAGIGVCYWEGGWIPVPEGDAPRSEKWEKYGSGWASSYSAEYDPDDAGKWYGGCAWDNQAMFDENGNILESLYTFDYCYTGTKCDVAIDEVANTECTIRIGDEIKLPETVTAIYNDRHTEEISVKWEEISESAKYSMQESGAQKYVIKGVASVSGTDYDVTCDVNMIEPNYVENQSFEDDSEEGMKVWTIEDRAKDDAEHELFNMDKITDAYTGTHALHWYSKTKCDFTVTQKITGLKPGKYKASCQVQGGDTTNGAFKLTVESNGKTYEEPTEVTEWAVFRQPTIENIVVGKDGTATISFTVYAEANGTKGPWGTVDDFLFNPVEKNK\n>UniRef90_A0A1H3EFD9 Cyclic nucleotide-binding domain-containing protein n=1 Tax=Ruminococcaceae bacterium YAD3003 TaxID=1520816 RepID=A0A1H3EFD9_9FIRM\nMYVICYGKSPKALEAGGKLIKDIGGRYITGTELLTGSFVIAEGETKCAIVMILPLEAAIRAMGETVTDKTRDLPVIAVSPEGHYAAIIKRGNSVYEQGTDEVYAAVLKSMGPFCFSEFESKSEITSDLTKLISKYNMAVNSEAVLDKVNAAINSGEKINVYTDLPIVFADPVIDPMTYSLHSYPYDLRDEFIKQYKATKNDKNVPSVFITCTYLGDEEDDTNLILVPKLLSLGIEIKVKTDPGYCRPAIRQSLINHLLNPMSVAKVAATYSARESEMVTGIAEELGAEVISYDAEQIANANAPMSMTFNPEKKNDTATALAFLASSEGSIVIRRATSAKGLVFSAAMNRDNIILPE\n>UniRef90_A0A3B0X686 Sel1 repeat family protein n=1 Tax=hydrothermal vent metagenome TaxID=652676 RepID=A0A3B0X686_9ZZZZ\nMNHFSPLALILLLACALSSTSLAASKNKKPGPPDDFEKGLIAYQKKDYATSLMLWFPLADAGNPQAQYRLGKMYLDQKDQRKDPAEAANWIKKAAIQKHAAAQSLLGQMYLKGVGVKRSFSKSAKWLLKAARKKDREAQYILAKLYYYGDGVDKSAPKAAYWYKKAAKQNHTAAQNKLALMYLTGEGIKKKHKKAKQWFEKAALAGSTHAQINLAKLYLNNEVVKKDSHKAFKWYQKAAITGNAEAQNQLGEMLENGVGTQKNIKQAINWYKKSAAHNYPQAHYNLGRAYVNGYGITKNFKKGIAHFHQAAEKGNGKAQKDLGVAYYTGKGITPDSAIAYAWFYVAAANNVADARKTTNALYKKLTAEDKKKAIALATEYKRKYFIRPE\n>UniRef90_A0A4Y2D9G6 Uncharacterized protein n=1 Tax=Araneus ventricosus TaxID=182803 RepID=A0A4Y2D9G6_ARAVE\nMVSFDDVWRAIACPWLSPHHCPSGIDLDVKSRLIRKEYVSPLLWCPTATFTGHSRALTCAGDKGTQTTGRRANIPPSCSLHDIVWRDMVLPASTESCDVSCRAVSVLRRLAH\n>UniRef90_A0A2K9NRQ2 Peptide ABC 
transporter ATP-binding protein n=1 Tax=Bacteriovorax stolpii TaxID=960 RepID=A0A2K9NRQ2_BACTC\nMLLEVSKLNIHFKSDRSPEPIHAVRDLSFTLKQGEMLGVVGESGSGKSITNMALMGLLPDTAIVRAEKANFNGHNLLNLKEKEWQKVRGQEIAMIFQDPMTALNPFLSVQFQMVETIQGHLKLSKKDAIDKSIELLNLVGIPSPKDRLKSYPFELSGGMAQRVMIAMAISTNPKLLIADEPTTALDVTIQKQILNLIKMLQEKNNMSVILVTHDLGVVSEYSERLQVMYAGEIVETGATADLVRHPRHPYTHALLASRPGAVVDDKKRIPKTPLPSISGIVPAFHQRPLGCQFNPRCQYMTHECQQGHIAIVGEGPQNDNFREYRCIHPIEEAIR\n>UniRef90_A0A521V9W9 T9SS type A sorting domain-containing protein n=1 Tax=Saprospiraceae bacterium TaxID=2202734 RepID=A0A521V9W9_9BACT\nMQPITHCMKKHLTLALLSLASILAAQPDSLTQEYIHGNNIGALLNSNGSLFWDGGNGHFIAGEDGRSLVRAAGLWIAGVGKAGNLKGAIQMYNEDGRSDFVPGLLGDTVNAENWNHIWKVTGEDILLHIRDWETDGVLDDTIASIFGWPGRGNPFFEQYNGFPLPDINSHQLAPFYDVNLNGVYEPHFGDFPMNDTRSCGSAPVPAELSWFSFHDNTPHSESNMAPLQIEVSTEVTAYRCTDNQFANNSLLLFYKITNLAQEDIDSCYFGVFFDFQIGCPNDDYMATYPEKNIFYAYNSDGYDEDCSPYNGFHDQPPVVAVTLLRGPRNEFLEELPLSVIMPIHEGSTIPGQAPPEQPAEYYNYLTGRGKDGIPLTNGGTGYNPGSTDYTNIIFPGRPGMDTTGWTELNAGTLPGRRRVLASYGPFTLQPNAVNAIQLIITQIPGTNGPLLENLDALYDSLFEAFGFLYNGCIDPTPLYPKCTEDIEIPPLPPPPPLPEEFIISPNPVSKILTIQIKDPGNVERLSIYDATGRLVFEKKMLTDVLEIDVAGWPKGTYFVRLGKGDEQFVKGFVVMRR\n>UniRef90_A0A6L2N053 Extensin-like n=1 Tax=Tanacetum cinerariifolium TaxID=118510 RepID=A0A6L2N053_TANCI\nMSDVSSAVTYTLVYTDSEPWRYYGEDSAETGPPRIIVLQPVAPPSLDYVPGPEHPPSLDYVPGPKHPPSPIEIPYVPKPEYPEYLAPSNDEVPLEDQPLRADASPIAASPDYLADSDPEEDPEEDPEDDQADYPVDGGDGDNEPFDDDDTDDEDPEEEPFEEDDEEEEEHLASADSPAAALLSPPLLVPSLPLPLPSPLITSSVDTGASLSYREAGIRMRALLPSTSRRTDILGADMPPQKKACLTTPAPGFEIGE\n>UniRef90_A0A3P8RZN5 Otopetrin 2 n=1 Tax=Amphiprion percula TaxID=161767 
RepID=A0A3P8RZN5_AMPPE\nQGRGEPCGEQCSPWPRCSPCKCVTSDNPCEPCRMTVKDRETEEVHLSNNINAVGQTESASEPDLNDSSTEVVRERSRNWGWLLSGIICVNILILGCALVSGSAYNNVKISTPDLQVFLIIILLLTSIWMVYYVIYTARTENAVVYKDDHAGPVWLRGGLVLFGLLICNICFGFMVLKYESNCEIVLQTYFLWVHAKDCVQLQRNISRCGLMLTLSTNLVLWMTNPSARKHIITLLSFGTISCLTAGYGDDKCKCSHTSCSMFKEAYYYLYPFNIEYSLFASAMAYVMWKNVGRVAAEHGHHDIKFSLRDIFLGPVFGVLLVFTGLATFIVYEMEMKKDDHDADKKDQAVMMHFVMNIVIVTLMSVSSVIGCAIYRVDHREHVSEKNPTRSLDVGLLVGASLGQFIISYFSIVAMVATGAKGYLNGLNLAWSILMVIQLGLQNFFIIEGLHREPFHEVEPVAVVPNPYVLEPSKDLSIPEGPVMDTKPNPELTAHSHTPEHRHKLVWKRRVLKEVCVFLLLGNIILWIMPAFGARPQFDHDTETEFYKFNMWAAVVNIGLPFGIFYRMHSVASLFEVFLCS\n>UniRef90_A0A267H7W8 ATP synthase subunit e, mitochondrial (Fragment) n=2 Tax=Macrostomum lignano TaxID=282301 RepID=A0A267H7W8_9PLAT\nYLLLLFLLFKMLNYLMSASRASKLTFLASLAFTGFSVSFVLWTQKSERDAVKQGVLADIERQKLYEETLQKRAA\n>UniRef90_UPI00201FA0E7 ABC transporter ATPase n=1 Tax=Flagellimonas sp. 2012CJ39-3 TaxID=2942214 RepID=UPI00201FA0E7\nMLVDFETLPDTARIWIYQSNRSFSPEELEEINQALSQFLNEWTAHGSTLQAGFEVKYKRFIVIGLDQSQASASGCSIDASVHFIQGLEQKYGVELMDRMNVSFKQGEYIAYKSLKDFKKMAKAKSISKNTTVFNNLVANKLEYSEHWEVPASESWHSRFL\n>UniRef90_A0A674GZ47 Rap1 GTPase-GDP dissociation stimulator 1-like n=2 Tax=Estrildinae TaxID=40155 RepID=A0A674GZ47_TAEGU\nMRTSESASESKGEAQGIHLTVTINCTVAPRANNRGGRPGPSDLTETLNKHLEHLGLCGDGTEAEDQILESLNGILLAITEDKQRSFHLLRGSKIFPTLAKILKGNPRCAVKAAHVLSEIAKNEEMKKPCIEADLVLTLIPLLESTDQEMLLHAGRAIGRICYDNRSLQEELVKVGVIPSLVRILTDYADSEPLVHVALLALYNLADLDSAKEALSMTKVAEQLVKQLRRAESHEKLEIVFEVLQALAENDALKVQLVDAGVPEVLSEILLRLQGSSQAEDTCIMKAASDLIVSLLLGDGNCLRMFQLGVVHQLLDLLEKQVQSGDTSVQQAALSALQSLAVPVVSKVQMLEEGVAERIEALLRAESPPVQFKLLGTLRTLADGQADAAEILGQDPQLLSRLVQWCSVSDPSGICGEANRLLASILHHNRSQEVVKAIQAAQGVKHLVSMTTNEHAAMQNEALNALAIASAIDLETLEESFKESQLVQSLHKLLRDDNTSPEVKYNSMGLLCRLLNSGDLRQEIEEDKIKDTLEKLCSHSNADVVKGATTTLQVLRGETPH\n>UniRef90_A0A6L8ETX0 Helicase C-terminal domain-containing protein n=1 Tax=Candidatus Poribacteria bacterium TaxID=2026781 
RepID=A0A6L8ETX0_9BACT\nMSRANYSNREALNDALKVYLQAMYSFVSECLDEQSIRDFLKLQSSDDLMEDIEVKDIANLIKSYSYWSKCFKEKFKIIDRDNTRYYDARSVTSLIVEGRNQLSHQWLRELDPEFTRTQLFFITDILGKIKRSDAQREVEVIRDELFNDTTEQLVTIGVEDEKAKYEKSIAEMEKRLASAEKNKKKLSKQIVDNAVKLDEKTEELEKRSEQLVSAKLSKQECEKQRDSISKQLKKVQTAHSACKEHITTISNQLTTAETERDDYKERFETASRKREEAETEWQACEESLIAMRKLFTIAAIGNQTVQVVYPPIQTDSTIRILDRRNVEKKNYLLELLEQKQPTVIYVQSEERIDQLLALVGPEKADVIGEHNERISEAEEREILEKLQSGELIAVVSNTAFSTLASPHRIEHFVFCHLVPGLDEFFRQCTPAFASEKHAYLHLIYNSEQDIKGLDQKYPDRKTLEKFYPELRKLAETNGDLIRPESLYNELDIAKQGIETGLAIFEELQLLERNDEGIRLLPPAGNKLEASEIYRRGEQIKNGAADFQAFQFEQSIEQIWEALLKELNVDNEHILEASRVYEVRAFQDAIEDSRAQSESSTDAVEDDNAVDSEDAVAKPTLKSARANAKVTEEDVTEIRSRSAAGESDSELAEADSEKKPEVKQSEFWQPIRAGEFGELFTGKPVPVSNEGWIAKTVRNIGVCLYLTNQRCYVQVYFHGANGSERREKIMTLFPKSEYTYAYRDSSRETKVQFPVLDKGRKDQDDWDEIREKLVAMGTDIYNKIDASDL\n>UniRef90_A0A4D9D465 MFS domain-containing protein n=2 Tax=Monodopsidaceae TaxID=425072 RepID=A0A4D9D465_9STRA\nMEAPFLAPESSGSSQDGNVASQETVIQRHPWRVHGSRYFQLILLCILILNNAVVWVAFSAITPATAAVYGVSPGLVNIVALSFQMLFLPGTIAGYMLKERWGLRLTLLAGAFMTALSAAIRFVSLYVPPVSLRNASTDGHDVNNGGGAYALLLLGTSLAALAQPLLLNTPPDLAVHWFAVKERDLVTSLAFMCSPLGSALGVTLAPVFVSEAGADTEEDVSGSHRNDARGGLRLFLLAQLGMSVATTLLAHAGATDRPPTPPSRAAALGSQREEERVHSSDASGSRVLCMPLAWELVAPDLRRCLLCNPSFLLLLFCFGIGLGFFNALLTLLGQLLAPCGYSEAEAGALGGIFLGTGLVGAVMAGVLLDASHRYGLLLKSGFLGAWAASLFVVFTLRPDNFLVLALCFGLLGFTMLPLLPVAIENGVEITYPDVPEFFSSGLLLSAGNLTGIPLAFIFAWTIDSYEGSCRKLWKPAAVLVVVVTTACALPVLGYRPRAFGRWEAEKEQRREGLEGCGHDVATRDA\n>UniRef90_A0A833JG99 Uncharacterized protein n=3 Tax=Komagataeibacter medellinensis TaxID=1177712 RepID=A0A833JG99_9PROT\nMVVTMLFATVLFVVFVTVFVATLFTVLTTLAVVLTMVVTMLSMVFAVIVFSVGDNRQGQTKGSSKQKCFFHVNHFLLIN\n>UniRef90_A0A8S3R600 ANK_REP_REGION domain-containing protein n=1 Tax=Mytilus edulis TaxID=6550 
RepID=A0A8S3R600_MYTED\nMNSWKMLLDNFGSLRDCEWFDVHLAIKSALESAFLYMDKSFIDYISFTYGKKTVDLNYFLNFACQNGKEIVVRWIFEQFETNHIDIIAPLLSVCRKGNKELVVYLLRKCCIEDLNLNATMQAACESGTLDVVTMLWEKFNFDIFDVESCFKSSCRKGNLNIVKWLYESFDKALFHDISVLNLACISSNIELVEYLIINFLKTSDNEMTKIEECLSYCNSSMLRFFVGKYGCDLFDLDHILSVGLSENNAEFVIWSLTNFDFKSVDLNNAVKLACQNGNFRLHTSGETRLVEWFLNSNCYESLELQQASNVSCARGKIDVVIMLHKRYNEKACNVKAAVNNACFSGSIETVYWLLNTFQEKDADLDVALAMACGNGKNNLVMWLLEKYDMKFNMKLAILETFKASLKKERSNGKLSENSSFELLNWMLKECGNHILDIKISVLLACKQGKIGHVKWLFDKFSETCRDINPSEALEAACHGFDTFAIYLFLVKRFRNRKFDLQKVMQYACEFGNDQIVEDLLKRFDKNKLNVREGIFAACLKGHLNVLRVLWLYAKPKYFREKRLVNLVSNSENSEMVNWLIAAVDR\n>UniRef90_A0A6M3SAA8 L2 (Fragment) n=1 Tax=Human papillomavirus 35 TaxID=10587 RepID=A0A6M3SAA8_HPV35\nKRASATQLYRTCKAAGTCPPDVIPKVEGNTVADQILKYGSMAVFFGGLGIGSGSGTGGRSGYVPLGTTPPTAATNIPIRPPVTVESIPLDTIGPLDSSIVSLVEETSFIESGAPVVTPRVPPTTGFTITTSTDTTPAILDVTSISTHDNPTFTDPSVLHPPTPAEXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXPIPGSRPTTRLGLYSKGTQQVKVVDPAFMTSPAKLITYDNPAYEGLNPDTTLQFEHEDISLAPDPDFMDIIALHRPALTSRKGTIRYSRVGNKRTMHTRSGKAIGARVHYYQDLSSITEDIELXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXSNTTIPLSSGYDIPITAGPDXXXXXXXXXXXXXXXXXXPIXXXXXXXXXXXXXXXXXXXXXXRKRIPXFFADVSVAV\n>UniRef90_A0A7C6DX07 Oligosaccharide repeat unit polymerase n=1 Tax=Candidatus Bathyarchaeota archaeon TaxID=2026714 RepID=A0A7C6DX07_9ARCH\nMGTVDLLVFVILGALCYFALRFSRFVYGDYFAPVGIFFGVNLASLAFYHLRLIPMVPLSSQAYALIAVAFFSFFTGALTATPTVALRGQPLRKRASSRHVWNSKGLGLFYYFSACVALAGWVFFVTQIVPPGWVRNLWMLQGDYEFPYHLGYTLVAGIAVPPSFVLLGAVRGKTTLPMIFFLITTVFALAIVGIKSYLTIAIATSLIVWATIHPGRLKWKHLAFLALCLVGFMALYDHFIDIFVPRHFPGSRFPTILAFLERPYLYLVGPWAAMSVVMAAPPPQAQWGQVTLFPLWKILGPGGLSVMERVPQYLPFVDIGPSMFNVYSLIGEVYWDWGWVGVILICFLLGFISTRLYVKAQNSRNWIDYLSTGFFSYGLFISFFAYYYRETLIFLLIYPVVIGPLVSKLVSSLRVPRVRPVGIKI\n>UniRef90_A0A1M5D686 DNA-binding transcriptional regulator, Lrp family n=2 Tax=Caldanaerobius TaxID=862261 
RepID=A0A1M5D686_9THEO\nMDKCMDVIELLYENSRLTDEQIATMTGLDTEEVKNIIKKLEDEKVLLKYRALVNWEKTQKEVVHALIEVRVTPQQGHGFNAIAERICQFDEVTSVSLVSGGYDLAVEVEGKTMKEIALFVAERLAPIDGVLSTTTHFILKKYKQEGVFFTDGPEDQRLVVTP\n>UniRef90_A0A353M699 ATP synthase protein I n=8 Tax=root TaxID=1 RepID=A0A353M699_9GAMM\nMAVKSKLPKIQLIIILVTVAYFSTLGAGLSAAYGGLISLMNTGLVNRHTNKQREDLTISAQAGVGMMAISVIMRMAMVVSLTLAGHFLLKLSTDALIVSLVLGLIGFLIDKMLSNGGQ\n>UniRef90_A0A8T0H0I4 Cytochrome c oxidase subunit 1 n=1 Tax=Ceratodon purpureus TaxID=3225 RepID=A0A8T0H0I4_CERPU\nMINHSEGSTVKIMFYWGYFVSSSRKTGQWMSSSSFHTDIFTNGFYVGLHEASLIVLIAWFFPSPSICSSQSASVLFVIIASVSSCCKKNDCSPSLAMLHICSTIIKRVAIQFKCTH\n>UniRef90_A0A536S874 SGNH_hydro domain-containing protein n=1 Tax=Chloroflexi bacterium TaxID=2026724 RepID=A0A536S874_9CHLR\nMMHRVVAVDLLILVLLAGCNAASTATARVTPSPSGTSSPIATATPSSSASLNSVRYVAIGASDTVGVGAVDPARGSWPARIAALLPSGAAYVNLGVSGSLALQAQREQLPGAVAQRPTVVTVWLAVNDLNATIDPASYQDALGAIVDGLVQGTSAMIFVGNVPDLRGVPVYASVDKARLLAGITAYNDAIARVAARSATRVFVVDLFTGSAALVSTATVATDGFHPSDAGYQLIADRFAGAMRAKGIPLRS\n>UniRef90_A0A1Q9YEZ7 Translation initiation factor IF-3 n=2 Tax=Erysipelotrichaceae TaxID=128827 RepID=A0A1Q9YEZ7_9FIRM\nMSKGRYSIINNRKVAPNNVNDDLFNEKIPFREVRLIDSNGDQLGVKSKREALEIAYRQNLDLLCVAPKARPAVCKILDYGKYHFEQQKKAKEAKRKQHTVELKALRLSPVVDTHDFETKLRQARKWIEQGMKVKIDMRFRGRMMTRQEVGKQIMNDFLEQLSDIASVEKKPSLEGNTMSLILAPQKKK\n>UniRef90_A0A1R4ENY9 LigA domain-containing protein n=1 Tax=Corynebacterium glutamicum TaxID=1718 RepID=A0A1R4ENY9_CORGT\nMTLTPEDMQLFKDLRMTEFGRVIQEIIDDPDRDHDSFEDKIQQALYAQRDARDNRRIEKLLKAAGLSYTAAALERFDVTGDRGITADRLLRLGPATG\n>UniRef90_A0A7J9XK46 Phenylacetate--CoA ligase family protein n=1 Tax=Pseudonocardiaceae bacterium TaxID=1873463 
RepID=A0A7J9XK46_9PSEU\nMSNANSTAPASRRGAAQRLSEYRRYWDEDRETMDPRLREKKIVERIQNQLRYVYAKVPFYRRHYDAHGFTPDMVTSLEDFTTKVPVITKKMLVADQAEHPPFGSYLGVERSELTRIHGSSGTMGTPTMYGVSRRDWAGAGKFSCMALWCAGLRPDDVVHISFPFTLFFGGWGLLQAAEQLGACTFPVGTMVSTERQIELLQRLDCDVLVATPSYVNHLGTTARAHGIDVRASAISVAVMGGEPGASIPAVRESLHQLWGEVSLIDLAAGSTSEMYPFTTSMGCLESDGGVHLFQDENYTEVVSIEDPNEPVPPGTSGAVVATHLWRDSQPMIRFWTGDEGVIDTEPCPCGRTYPRMPKGVYGRLDDMLLVRGANVYPSAIESVVRGVEGSGGEFRIIVDRPADLDEITVEVERDAALATDRAPALQATLQEQFKNALGVRVAIRVVEPATFEQQTFKARRVIDRRSSS\n>UniRef90_A0A7S3PQM2 SSD domain-containing protein n=1 Tax=Aplanochytrium stocchinoi TaxID=215587 RepID=A0A7S3PQM2_9STRA\nMLKDGAIDQSEEEGCVGSLKRRYLESMHKRTKTHCGGCFAIVLLLSFTVSAAYEFLQGDADFADPNQPATLAFDAVELSRELFDIAAEESEEESNHFEGVSFGYEWKDGRSENIFTPKNLQTICTIEQIMFAQSAYGFDLCDPRNINTTQTCVTSFTEEGVDTSIAGNFYRFENASFNFEDCHLLADEVVGNYSDLIYTSLSLSDSSPARFFVNSKTKSTITRSTLLLSHPVEKTAEEKLLDMEQDYFDFFGMEATLFRSVYRNPATLGDIKMSFFNIVLLENEFERMLPSDFIMAFGSMTFVAVWMGIYTKSLFLTVCCTGYILFSIPVSLFMYKVVFRILYFDFIHVLVIFIILGIGADGTFVVIDAYKQSRLLLDDDLERLVYSWSRSTATVFNTSFTTVVAFVVTGFTPLIPLSTFGIFAALCITVNFVFVCTIVPSTVILWERWFVKDKEKGVEKSEVVPELKKENSNSSFEGHFKSKDEAKHTLDALVEGNNRVFEHYYVPAILKCKQVFVLLGLVIGILGVYGVTKVSQLTKPEQWFPEDHTQSIFIEKLILEFLSGEEGEYAEVTVFWGIDKVERDYPARYSGDTETYDDKVIFDDSFDITDFQTQLAIIKMCELLENRTCDEDTCGGFTTLLFPETNTYQGMCTMREFHNWWNVEKNFSVPLNSANETLFYERLGLFVVENPEMARHVGIIGGVVKFFSIEYIMTLKILAPGSEVQNYVDIMDNIIEKYKSFAPASAQSVDYSSPDFVEYALELSLQETVIKGLAITFPIVFVVLLLATGNWILAAFSVIAIAFIVVTVMGFVFAALGWELGIAESIVSIMIVGLSVDYAIHLGHMYTVAGKSEGFESREDKFHYAVLTMGPTVLAGGMTTLGAGAFLFGAQITFFGKMGVLLVLTVTCSLFYSLVFLMSVAAWFGPQGTYANLNRTCSKQ\n>UniRef90_H6QP23 RNase H domain-containing protein n=1 Tax=Puccinia graminis f. sp. 
tritici (strain CRL 75-36-700-3 / race SCCL) TaxID=418459 RepID=H6QP23_PUCGT\nMAGARRWIGLEALEAGYSAACGEILGSRISGYSMYTDSMCVHNSTNRTFGWARS\n>UniRef90_UPI00197E61F8 hypothetical protein n=1 Tax=Salmonella enterica TaxID=28901 RepID=UPI00197E61F8\nGRGGGGGRGGDRGRGEGEEEKGEGEGGERGGKKGRRGKEKDRKEERGGRGEGGKREREKEKKGREKGGGKENIGKKKGKRRRRRKGKKEEERGEKKKRKRRKGRRKRGGGKEERKRGKKKKGRKEEEGKRKRGKRKEGRKREEGEGEKRRGEGEKERGRKGERKRETRKKKRERRGEG\n>UniRef90_UPI00082B7ECA thermonuclease family protein n=1 Tax=Sphingomonas soli TaxID=266127 RepID=UPI00082B7ECA\nMLAALSLLIAAAPAGAACVAVDGDTLRCGDERVRLLGIDAPELPWHCQQGRHCAPGDPYASTRSLRAALSRGPVSLRRFGTDHYGPTLALVSAGGVDLSCWQLSHGQAIYKSWWDNGGQLARICPAAR\n>UniRef90_A0A1V6AN80 Heptaprenyl diphosphate synthase component I n=1 Tax=Firmicutes bacterium ADurb.Bin146 TaxID=1852882 RepID=A0A1V6AN80_9FIRM\nMNNTKKLTISAIFTALAIAISIAESYIPYSAIAPGVKLGLANVIPMTLLYVLGPLYAISVQAVRIIVTGLLRGNLVTFFFSFFGGMASTVLCALIKKQKIIEFSVIGLSVIGAVIHNTAQFFTALVILKNINILWYIAILAIFAVIAGVLTGIIAKYTIKAIERYSRSI\n>UniRef90_V7ICF6 Signal peptide protein n=17 Tax=Eikenella TaxID=538 RepID=V7ICF6_EIKCO\nMQKYILTTLLLACATTAGADNFRPQKLALIHSLYVPYQNGNTVHAHPERHFSADLRAVYQEDKQHTAPNEVGCIDYDPIIAGQDWDSASLNRTLNIRPLANGRIEAVFQQFPGDFSATQVQFVLQCSPNGRCLVDDIYSATPGHRLVSFKRSVRRCISEMTNQH\n>UniRef90_UPI001C0085A9 TIGR02680 family protein n=1 Tax=Nocardioides sp. 
LMS-CY TaxID=2840457 RepID=UPI001C0085A9\nMTLTQIPTEGIETADQTPPKHHPYRWRMNRAGLVDVWYYYDTEFDLSGGRLVLRGTNGSGKSRALELLLPFVLDADRRKMDATGSGKVSLVELMKAGAADRTTRAGYVWLELARSVDPTDPADAELHESGTTEQHTTIGAHIRFSRSTGEAKVHYFTTDLRVGYDLELLSPTRETLPRDKLADLIGADRITTSPGTHRDRVRATVFTLTGDAGAERYAGLLQLLHTLRSPDVGNRIEEGRLPQILSDALPPLDERALNAAGEQLDGLSETRLAQGRLEAALGHVNTFFDTYRRYAATAVSDSAENTTKAASAAEAAVKDAKNRATVHAELDKARGENQARMGELDESIADLSGTIAGIKQSSAYADARDLDEREKRVEALGAAAVAALVTAERARGAEGREVRTANEAAAKGVSASERAAAAVEKARTKVDAAGVSGGLPASIAATTAPASVLTEPVRLTRDGDPTPLDRPVPVQLSVTPDDLGSAVEQARLVQVSATERGRQAAGRLDKAQALDVQRGKVEAAERRAEEADQRANEAEEVDLERQVELTTAADTYASQWRDWVSAAATVAAFGAEPDLTGTGIDAVLADAPIVIGDLSEDDLTELDHVAGMLAETVREQHTHTIAELDAADQVDDAVRNNLKVERTQLESAVDPSPTTPTWIRPRGVDAIPLWRAIDFGDDLDATDRAGLEGALLASGLLLADLHRDGTLHAENGQLLLTPTGPVDETPVTGKLIADPGSPMPVEVVEAVLARIGFGDRRSGGATTPAGVWVAPDGSWGSGPLTGRYLQPVARHIGTTARAEARRVRLAAIEVELAQLADAAEVRAAARAEARAARDRLGAVTRNAPRTQAVSSARVRAADATNRAAKERSRAHEAAMQASELRTAWSRDVSEHRAICSEFNLPHTADDLQVVRHATGEAESACRDLSNLLDQLITVVADHADAVGRAGDRTDERVEDELRAATEWTTWHREASELESVRSSIGQEAEAAKAELRECETTRKTLEGELDKARTLDSRLGVEVGTAEAEARAAAERVTTTHEDLAATFDQFRRRLEMPGITAAAFAEPPETIELSEVTPAAVRKAVTRTAAGLRRHSQGADENTLFGPQRTLERDLSGSYDVITEVRDGVRLIELSDATGRRSIADAAAELTRTVEEGRNALSERERSVFTEFVLGGVAEELRRRLDQADELIAAMNASLATIRTSHGIGVKLRWKISESSDPAVVRIKELVSTAGAVRSADQTAELTELLKDRVNEAFELDESAGYATHLHDALDYRSWHTVEVIILGPKSGQERRISRKARLSQGETRFVSYVALFAAIDAYLSGLPDTGRALRLLLLDDAFAKVDNRTIGELMGLLVRLDVDFAMTGHALWGDYPQVPALDCYEVRRVEGSAAVTTHVRWDGHTRHLRAAPR\n>UniRef90_A0A3A5MMX1 DUF2236 domain-containing protein n=2 Tax=Cryobacterium TaxID=69578 RepID=A0A3A5MMX1_9MICO\nMHELAGESVLIAAGGRSILLQLADPQIGHGVADHSNFAQRPLDRLNGTLSYVYAIACGTPAEAAHATARVNRAHKPVQSDGAGGGPAYSAYTPQLQLWVAATLYDSAITMYELIYGRLDDDRADDIYREYAALGTALQVPPGLWPATRADFAAYWQRRLGELATDAATRSVARQLLHSPTGPLWLKLGMPFARFLTIGLLPAHVRDLFDLEWTPGAERRFRRTLRVIRAVYPALPERIRHWPKNHYLRSLRASMAAVG\n>UniRef90_A0A4Y9ZFN4 homoserine kinase n=1 Tax=Dentipellis fragilis TaxID=205917 
RepID=A0A4Y9ZFN4_9AGAM\nMQLSFITLALAFSALSVSAAPHSLAERAGKGGNKGGNANKGNANNDKGNNDAGAKAGGGGGDLQTSLTLDPSVLAKGFESDGQAQQEAGQVPSLTSSNNFINFCATTKKPITNGQQIKGGSCNPAPMGVIAATDKMPSSKFVFPKNTQTIKANQQFDVQMAIQNIVTGNFVNPNTNYYAAPQHTDDSGTIIGHTHFVIEKLDAIDQTKPTNPGTFAFFKGVNTAAKDGVLSVSVDKGLPAGIYRLASINAAANHQPVLVAIAQHGSLDDMVYFFVTEDGQPDAAAAGAQGNGTAAADVKGGAAADGQGGAAAAKGGDGAGAKGGQAQAAKGGNAQGGKGVYWLSGSGYYTVRTAMSTAPRSFTIRVPATSANIGPGFDVATPMSRPPSPTPARGADEVPLDPYKNLTTRVALYVLRCHDIPLLPSHLSIHVNNEIPFGRGLGSSGAAVIAGVLLGSALGNLNLPRERMLDYALMVERHPDNVTAALVGGFVGSYLRELDAAATQAASVPLSEVLPEYPPDAGPEWGTNPPKPPMGIGHYVRFGWAPAIRAVAIIPQFELSTAKAREVLPESYSRKDLVFNLQRLAVLTTALAQSPPDPELIYEAMKDRVHQPYRRGLIPGLPEVTSSITPKSHPGLLGICLSGAGPTILALAVSGFDAIAEDARKIFKEKGVEVIWKLLDVVSEGSLIKEED\n>UniRef90_A0A1J3I6D3 Retrovirus-related Pol polyprotein from transposon TNT 1-94 n=1 Tax=Noccaea caerulescens TaxID=107243 RepID=A0A1J3I6D3_NOCCA\nMTTTRIDVDRFDGTGDFSLWKVRMLAHFGVLGLKDILTDETLLRDSPTTGAASKEELDAAKKDPQKGIAAEASSSMDPGQELRVCCELQNLI\n>UniRef90_UPI0020262455 photosystem reaction center subunit H n=1 Tax=Flavobacterium anhuiense TaxID=459526 RepID=UPI0020262455\nMDADNRTIGTIDNLWVNKDMQRVVYLDVKADKTLIEDSQREVHENIADGNEKEFMYRDGDSHLIIPIGSVNINKDTKTVMASGIGYDTFRRTGRFNTQQRFDRNYERAVLRSYYPDNDPSVGYDADDDTFYSRKEFGNR\n>UniRef90_A0A4Z1PND5 DDE-1 domain-containing protein n=1 Tax=Venturia nashicola TaxID=86259 RepID=A0A4Z1PND5_9PEZI\nMLRSKMICEKPVLWLRQQHTSAQDLVDAEIDTHGRIHFAGTSAAAWKIGDAYCKVKSYIPGMEYEADSINFVCSKVPTIPLPEVIHTWVDEELCRAFLILSQVKGKTLAECWHSLSSEQRTIIARTIASFCTLLAQNSESSLQSVAGRRISM\n>UniRef90_A0A7V3M636 TNase-like domain-containing protein n=1 Tax=Proteobacteria bacterium TaxID=1977087 RepID=A0A7V3M636_9PROT\nMRAVAIAVLLTLGACGPQLGSLEKGETGRVVRAYNGDTLELDSGLRVFLAEIDAPQGENAYAAQAQGELEALALHRDVQLAYGGARRWVGRAREGQAAAPEAAIAHVFVKSEGGRWFWLQHELVSRGAAYVRPRRDNHARTPELLALEAQARAAERGLWDRREYRSLSVRAAARLATESGGNCMRGDAPYRVIEGEVGEARVSESRALLRMEGAPAETTFALVVFGDNFRAWDGAPLASLNGARIRARGPLGVYAGEPQLCLEHASQLEVLTD\n>UniRef90_A0A1C6CXG8 Membrane protein of uncharacterized function n=1 Tax=uncultured Clostridium 
sp. TaxID=59620 RepID=A0A1C6CXG8_9CLOT\nMKRVSLFIIVNAISLYLVSLLMNSMYIGSFGALIILTIIFGALNLTVKPILEFLSLPITFLTLGLFLLIINAIVLKLAFGLVPGVYLYGFVNAIGASILLSIVNTIIYKILD\n>UniRef90_UPI00097C6FDA NAD(P)H-quinone oxidoreductase n=1 Tax=Pseudomonas sp. KK4 TaxID=1855729 RepID=UPI00097C6FDA\nMTLPHTMTHIEITQPGAPEVLQPRQVPVPTPGDGDVLIRVHAAGVNRPDALQRAGKYPMKPGMNPIPGLEVAGEVVAVGSGVRTFNIGDRVCALTNGGGYAQYCAVPASQTLPIPEGVDWLHAAAIPETYFTVWANLFEMGGARTGHRALIHGGTSGIGTTALMLCREFGIEAFATAGSADKCAVIGELGAQAINYRDQDFAKVIAEKTAGKGVDVVLDIMGGSYLNGNVAALGMEGRLVMLGFLGGAVAKEVDLLSIMAKRAIVTGSLLRSRTREEKAAIAQQLREHVWPVLAAGRCLPMIDKVYPLADASLAHARMEGGDHIGKIVLSVVQ\n>UniRef90_A0A3D2TG15 Serine protease n=1 Tax=Planctomycetaceae bacterium TaxID=2026779 RepID=A0A3D2TG15_9PLAN\nMTPIVRAVRDARPAVVNIQGQKSVSESAEGTPTSPRQVNGMGTGVVIDSRGYILTNHHVVAGVRRINITLAGGQTYVASVVAYDKTTDLAVIRIRTPSPLQTIRLGTSEDLMEGEAVIAVGNAFGYEHTVTTGIISALHRNVQVNEKQQYLDLIQTDASINPGNSGGPLLNIDGEMIGVNVAVRAGAQGIGFAIPLDKALEIAARLLSIEKLDNHWHGMTALSLDGPTGPVTIARLDRKSPAERSGLQRGDQLQRIGKTSIHRPLDVERALLGRGSGERVPLIVRRGDETLKLDLRLANRSHKRSRGTTRQLSSAIALQQASWDTLGLKLEVEPLDSFQELEVPYRGGMRVVSVRPGSSAAKQGVQTGDVLVKMHRWTTASEKDIRFIVEHADTLARAGKVKFYVVRGEETFFGHLSVAKRSESAVR\n>UniRef90_A0A7I7W7J5 6-phosphofructokinase n=1 Tax=Mycobacterium branderi TaxID=43348 RepID=A0A7I7W7J5_9MYCO\nMIKRIALNGHRATIVTLTMNPALDITTSADRVLPTDKIRCRGTRYDPGGGGINVARVARVLGASVSAVFPAGGPAGDMLANLLVGEQVPFHRVRIASSTRESLTVNEESSGQQYRFVLPGPQLTFSERAQCLDELRMAASSARFVVASGSLPPGVPAEFYQSVADVCRELGARLVLDTSGTGLQHITSGVYLLKPSVRELRECIGRDLGTEAEQVDAVQELIARGVAEVVVVSLGAQGALLVTKQGAQRFPAIHMRSGSGVGAGDAMTAAVTVGLCRGWPLAKSVQCGIAAGAAMLMTPGTAVCRRDDVERLFELAAEPVDLSSVSR\n>UniRef90_A0A499UVA6 Secreted protein n=1 Tax=Streptomyces antimycoticus TaxID=68175 RepID=A0A499UVA6_9ACTN\nMLGAEVVTLGLQLDVLRKGGGEHLQALGHDFLADTVTGDHCEANAARHTGTLPLVPWIDIAVPAFGQPPSGNHPFTPCMVRC\n>UniRef90_A0A5P1EE21 Pyr_redox_2 domain-containing protein n=1 Tax=Asparagus officinalis TaxID=4686 
RepID=A0A5P1EE21_ASPOF\nMGNARDRLASKFAAKNAGLWSMDPNQIEEHKGNYANEFIERVRLCDVSAVIQEVMESYEVEINGKVFKKAKKVVVIGGGYIGMEVATATIGWNLDTTEDDDVNSANEGSLPHLRPMGTVVNRHPRHGNRHTRAYGDVLHPSRLQPAGGLMASLCSLVQRFVNRAQQYHKGTVVC\n>UniRef90_A0A8K0D6L2 Peptidase S1 domain-containing protein n=1 Tax=Ignelater luminosus TaxID=2038154 RepID=A0A8K0D6L2_9COLE\nMAKPTFLVLVCFLLMETYESRRQLKDYPFMKFSGIDDYPFHEEEASSLRNKMVPLVVNPPEQLQPPGFSIVVFRRSSIIGSGAIIAKYFALTICTLLKNLGEETFDLTPITKIQYVLHNSSVDDVDVITPIIHKLIPHPHCGNMKKWNPKANIGLIQTKEPMDKTASLRYPLLLTSGQPIPKGEYILSNFRIKNPNAINIKQAIWYVISKPASHQLCRNLFRADRQAYDTQTNLCMSYVHVGDADSCKGDLGIPLSVRHKNRDYLIGFSVHKHYCGSPKEVASFILVGPNKKWIESTIKKLQS\n>UniRef90_A0A6B2C3S4 DEAD/DEAH box helicase n=2 Tax=Thermoprotei TaxID=183924 RepID=A0A6B2C3S4_9CREN\nMQPDFTIEVPTFSIPYSNMYLSDSLRLNTFQAEAYNKINNRRDLVLVAPTGSGKTLILLLNNISAQDKIRGFAALYPNNTLLINQMRTVEEILIEHLEAKEVERVTSGCDNEGNKTEICKEEIFPLKIYKINRGKAEGPWSDTEYAAIMALSGKYIKPTSEETKSDVVYRLVEKLYEYSRKNNLYVIVFATPDTYLLVSTGAYRNFELVGKTLHNILVALVNEKSIDELDNILRRTKVLTRDQVSKSLSVYHQLLNQLPLFIDEFHLYSPFELSALYVIIKIYKSMSDLPIVFSSATPAKEIINELRDAGINPEMLNAEIIHGGDGFHVKGDSVIEVIGVDTGKKGLPAYYEAAEKVPGIVTEDLFDEVKEIDRYKDGRALIILERLWMVTRLAEELSKKGIRPDCIASIVPSKICAKGSNVIVGSEATTQGVNLGKIVWGITAGVSSEDVIQRIGRFGRKGVSSKIYLVLPKHVLEKNLPKSTMNYYELTEWLSKVYLDYPKRKKDVSNIIPSEFYNVRKKLIHAYALSSMVRVSGMKGLGEIDLKKEEALKLLNSFIGDSRALVNLLVFRRTGFSVEFIDIKYGEQGEASIGLIARNFKVLAYKGGKLEIDLSQSERQELVLSLNKEPRSFVNKFIDIRTLLKLLKGSLKIGDSLMLDEKSVGEGLVYVVDAGEDLAEYLSYTGEGARTVYTGGSEIRYAIMFI\n>UniRef90_A0A6P0Q7Z9 VanZ family protein n=1 Tax=Microcoleus sp. 
SIO2G3 TaxID=2607795 RepID=A0A6P0Q7Z9_9CYAN\nMPSHRSWFFALWFYLGILAAISLAVYLKIIPSKITKIQPIDTILHFIFIGFLAYIGHLSIKKYKIKIFQIFLPIAPIIVLFFSFIDEFIEIFIWRAGFDKLDSAADFCGVIFFTWLAERRHT\n>UniRef90_A0A0N4VJ66 LisH domain-containing protein n=1 Tax=Enterobius vermicularis TaxID=51028 RepID=A0A0N4VJ66_ENTVE\nMVEQCDKLLNFLSNEDSVKSNTEDLAIVAMFAPQPKAQATTRPAQMLTSQSEASAKENHKLYKVLGGIVLKVRLAGYVYEYLILNGATKTAECFKSEYLSTITKAMPTLQSSDPPGFLQNWFFLFWDLYSAAPEKRDSCEASQEAKAFHEFGFMNPSHGVPTGPVSGPMMNGMHTSHMFSSAAPSPLSLGPGPGGDGMMPGGGYYPPRSAQPGPSGSTSQASPISGVPSAGNFAAVPPRYGMPAARNGPPGPGGMPPAGFPGGAPPHMFTGSEQMRPLPAQRLPPNAGPMRMPTGYPGMRPNGPMRYTSPMYMESPTGAPFSNTMMPNGAMCSSSAASMMSSPGPGGPMQSGPESQDPRSYMMMSSASSMQYMHPEGSMTPGAGGRGSAGPPCSTSDPQMTSLLNGDEMKHSPASTHGGISCGTPSATGGPGSQAAVGGPGSVAGAGVGGPGSVHSQSGGSTGGQGGPPISQGGNAVSGQEEASEISKIKQSLFDDMKYGGKEESTTDNYHQYP\n>UniRef90_Q0I9X6 Membrane or secreted protein n=1 Tax=Synechococcus sp. (strain CC9311) TaxID=64471 RepID=Q0I9X6_SYNS3\nMNLTKFILRASLLVLAVLVAVAFVLVRRDSIVGGDSFVGDQTKSQRFLVRNGRDRTQSPSTSNSY\n>UniRef90_A0A1B6BJ90 Fe-S oxidoreductase n=1 Tax=Fusibacter sp. 
3D3 TaxID=1048380 RepID=A0A1B6BJ90_9FIRM\nMKTLFMTLNSKYIHSNLAIHSISKYIKRYCTHYDALHDDVLVKEYTINQSQDDILRELIEIDADVIVCSSYIWNIEALIILFSNYRKLNHNSYIIFGGPEVSYDAKDKLEKQAFLDMIAMGEGERTITQVLDLIYEQFKNSNPRNALTANFSHVSGVAYRAGDLISVNSKRIPIEPLDEIPFVYDDFTPFENRILYYESSRGCPYSCSYCLSAAEKGVRFYSLERVFNDLNVFLEKKVSQVKFVDRTFNVDKEHALSILRYLIEHDNGITNFHFEMTATLFDEDYFKLLLNAREGLFQFEIGVQSTYKETMIAINRPIAFDKLKINCMRLLKMGNIHIHLDLIAGLPHEGYERFLRSFDDVFEMNPHALQLGFLKILKGTPIMATQEKHGYEFRKQTPYEVLYNRYIRFEDLTKLKNLETVLEYYYNSGKFKHSIQYLLKTEKGTPSDFFLKLCDYFKAHDLMYIAHSTANLYDILYEFYQENYENHALFNDLLKFDYYYAHMKGLRPFFVMSEIPQFNTRRLHYLKALEHQELINPFYVGMQSKQILKTVEFITLNYDIIALIQSQYEFIEAKLNVVLFDYQRANHAIEPSKYFKVELPVI\n>UniRef90_A0A2E4DAR7 ABC transporter domain-containing protein n=1 Tax=Halobacteriovoraceae bacterium TaxID=2026745 RepID=A0A2E4DAR7_9PROT\nMKYRLNRKFIPWLVLHSIEYWYYYLGALFCLVMLHHFSSEIPMLAKELGDLAIAGKLDEIEIKTFFLLAIYILFFRTLSRLLFFYPARIQQRNLRMELVNRLEVAPPRNYKNYNEGMLFQTLYNDLNRIRGFVGFALLQFGNIIIATYIFVPKIRDFNPDFLVAFTPLIGTVFCFALIVGGFFPFVKRQMDQYADVQNFLLESYEAKKTIQNYHAEKDFYKYFDEVSGKELKTFFISSIGRVISFPLVKLGFGASLIWAALIVKNDNLPASDLIYFSSFLFLILEPLMFVSWIGIVTTQGYAAWVRIKSLVRDLSAPLTADWLVNQSGLESVRMPLWDHEIEVEFPKNQWSVIVGETGSGKSWLIENYAQYLQVKGKRYSLIHQEPYIYNDTILDNIFLGQEVTLEKLKLAKEYLHKFGLDILAKNMDDLLSLELGENGKRVSGGQAKRIALIRSLVADVDFVLWDDPFSSVDLILEAKILDDLQKEASLKNRTFVLTSHRLSTVRACDHITYISKSQGIIEKGKIEIILNQKSRVDEFFNKQMA\n>UniRef90_A0A0C5PBV5 TrfA n=11 Tax=Enterobacterales TaxID=91347 RepID=A0A0C5PBV5_ECOLX\nMTDNKTHSELDKLKEAALAQRKKTIDEKNTQKQLTLFDIAPWPDSMRALPNDYARSALFTVKNKRQPREALQKKEIYHINKDVRITYTGLELRADDDELVWQQVLEYAKRKPMGEPITFTFYELCQDLGWSYNGRYISKAEECLTRLQATAMQFISDRVGQLESVSLIGRFRVIERGTRSSRCEVMIDKEMVLLFAGDHYSKFVWEKYRKLSPTARRLFDYFGSHREPYPMKLDTFKLMCGSDSDRIKKWREQVNKACVELKESGLIHSAWVDKDRIYCKRSTDEPKSDGDT\n>UniRef90_UPI00036E30A4 DUF4170 domain-containing protein n=1 Tax=Methyloferula stellata TaxID=876270 RepID=UPI00036E30A4\nMSQEAPAQLLHLVFGGELENLEGATFKDLSKVDLVGMFPDYASAYAAWKSRAQATVDNAQIRYFIVHLHRLMDPAKGE\n>UniRef90_A0A151E9N9 DUF3467 domain-containing protein n=1 Tax=Euryarchaeota 
archaeon SM23-78 TaxID=1803821 RepID=A0A151E9N9_9EURY\nMEKKEMPLIQNLDNNPLLSNQHAIVHNPDKFIIDFKGLYPQFTPDNKPQMVLTHKVVVLEPYVAKEFVKSLSDNIKKYEDKFGKIKEPKAVEKARKESKKADKKNKSTTPRPSYMG\n>UniRef90_A0A8S5REQ6 ABC transporter permease n=1 Tax=virus sp. ctkyY8 TaxID=2827995 RepID=A0A8S5REQ6_9VIRU\nMHTSVLSRIVRVFQMILTELSTKRRILTLFLWVGVVI\n>UniRef90_A0A6P6A4G9 zinc finger protein 6-like n=1 Tax=Durio zibethinus TaxID=66656 RepID=A0A6P6A4G9_DURZI\nMAENSISNKSSSADMAPDKQSDQKPSSSLKLFGFSLTEQDEILEKAEDFGESRKFECPFCHRVFANSQALGGHQNAHKRERQRARRAHFHSHQRFIAAAPVLSSHAVRSMPPSFPRGFSSNSAGKLVSQPGYYPSQPLLLPPTPSQYTPRIYIARPLHFGTAGPGFAEFSGKLPEADIGIDLHLKLSPSGS\n>UniRef90_UPI000767A53D serine/threonine-protein kinase 17B isoform X2 n=3 Tax=Vespertilionidae TaxID=9431 RepID=UPI000767A53D\nMFTIFLLLQKCLETVLSRGKFAVVRQCISKSTGQEYAAKFLKKRRRGQDCRAEILHEIAVLELARSCPHVINLHEVYENTSEIILVLEYAAGGEIFNLCLPELAEMVSESDIIRLIKQILEGVYYLHQNNIVHLDLKPQNILLSSIYPLGDIKIVDFGMSRKLGNACELREIMGTPEYLAPEILNYDPITTATDMWNIGIIAYMLVTHTSPFVGEDNQETYLNISQVNVDYSEETFSSVSQLATDFIQSLLVKNPEKRPTAEICLTHSWLQQWDFGNLFLPEEMSSPPQDQDHTTRSSEDKTLKSSCNGTCEDREDKENIPEDSSVVSKRFRFDDSLPSPHELVSDVLC\n>UniRef90_A0A0F5JDP3 N-acetyltransferase n=21 Tax=Tannerellaceae TaxID=2005525 RepID=A0A0F5JDP3_9BACT\nMGVVIKEVTSKKELKKFVKFNIDLYKDNPYHIPGLIEEEMVTLDKKKNPAFEVCDAIYFLAYKDGKIVGRIAGMINRRSNEVWNQQRARFGFLDFIDDAEVVDALFNAVEKWAKEQGMKEIHGPLGFTDMDHEGMLIEGFDQLGTMAAIYNFPYYPQHLERMGYEKDQDWHEFKIYIPEGVPDKHLRIGEIVKKKYGLKTMKFKKTKEIWPYAQKIFETLNEAYAPLYGFAPLTQKQIDYYVKMYIPMIRLDLVTLIIREEDDTVVGFGISLPSLSHAMQKAKGHLFPFGWIHLLKALKTKPKVIDLYLTGVLPEYQNKGVNALLFNDLIPVYIGLGVEYAESNPELASNNAVQAQWDYFKREHHKTRRAFIKKLK\n>UniRef90_UPI001C659291 IS30 family transposase n=2 Tax=Arthrobacter sp. 
AQ5-06 TaxID=1914304 RepID=UPI001C659291\nRAAIPSEPSKRQGDLGHTHHPRVIETLRQLRSHPQQNRKEGDLIIGKGNQSAIGTLVERSTNYTMLVHLPDGYKAEQMRDALAAKIKTLPAALRHSLTWDQGIEMQDWKTVKIDTGIEIYFCDPHSPWQRGINENTNGLLHQYFPKGTDLSIHSAADLDWVAQELNDRPRKRLEFRKPIELIENLLLQRPPESADPSTGRRVGARANLLIRS\n>UniRef90_A0A6G1SZ52 Flagellar basal body rod protein FlgB n=1 Tax=Dehalococcoidia bacterium TaxID=2026734 RepID=A0A6G1SZ52_9CHLR\nMNTLFDTTAMRAAKAALTGLSRRQEAISANVANIDTPGYTRRAVSFEGALEAEVMRSQGAAAPGELVRTDAAHLAHRGGSQLGGAGASGDVTRDVVSARNDGNTVSVDEEMLLLVETQLRYQALTQSVGRRLSTLRSVIRG\n>UniRef90_UPI001939DEA2 hypothetical protein n=2 Tax=Microvirga TaxID=186650 RepID=UPI001939DEA2\nMHLFGALELEIRPGTPDNPASVKIALLRYTRGEDGRLFITPECTSFEEIEGQINSLQDELDEIRERAQRAFQVT\n>UniRef90_A0A7W0G2E6 HNH endonuclease n=1 Tax=Acidobacteria bacterium TaxID=1978231 RepID=A0A7W0G2E6_9BACT\nMRGEFSNPTRRQAFERAGGRCEICAIPFTPGKFAYDHRDPEWMCGDSTLGNCQVICNQCHADKTAVDAGNRSHVKRLIDRQLGIPKRKGPPMAGTRASGWKKLMNGQVVERR\n>UniRef90_A0A4Y3PSW6 BPL/LPL catalytic domain-containing protein n=4 Tax=Paenibacillaceae TaxID=186822 RepID=A0A4Y3PSW6_BREPA\nMPFYWWEQTPVQLLATVSRPYRGEVLIPFSVDEAYARLCSQEPTTAPVIHLWRHEKAIVLGARDAKLPHAAEAVRQLEAAGYQTAVRPSGGAAVPLAPGVINLSLVMPVAASDLNPEPFFLRMVELIRATLGDDGAKMSSGEVEGAYCPGTYDLAIAGYKFCGIAQRRLTRAVAVQAFINVEGCGRTYEEIIQSFYEKAAMGAPGEQFPQVQPGRMASLSELGVSGGVEGFVLRLQELLHAHAESSVAVLDACPDSLAHEAKQALDLLKGRHRQLVGS\n>UniRef90_UPI001657DD0C hypothetical protein n=1 Tax=Sphingomonas sp. JC676 TaxID=2768065 RepID=UPI001657DD0C\nMTIRSRPSLWLALVVPPLAWYGFQQGLATTLRGACGAAGVPLGPLWGAGSIALCIGAGWFARPRPGQQSSDRLLSQLGVLAAGLFSLAIFYQSVATMIIPPCAR\n>UniRef90_B7K1R7 Transcriptional modulator of MazE/toxin, MazF n=1 Tax=Rippkaea orientalis (strain PCC 8801) TaxID=41431 RepID=B7K1R7_RIPO1\nMVTYNQFDVVVVPFPLTDKTTSKKRPALVISDMAFNLSLKKIVMAMITTSGHSSWMFDVSIVNLAASGLKSPSLIRMKLFTLDDALIVRKIGTLTQSDQERVKNSLKQLFKLL\n>UniRef90_A0A846C4J9 Cobyrinate a,c-diamide synthase n=1 Tax=Okeania sp. 
SIO2F4 TaxID=2607790 RepID=A0A846C4J9_9CYAN\nMSLIVAGERSGVGKTTITLALLAYLKQQHLKVQSFKVGPDYIDPMFHQYVTGKPCRNLDPVLTSEVYVQQCFGRNIQDVDCALVEGVMGLFDGVRFFDPPLPPLERGEKDDGDGCFPSFASTAHISRLLNLPVLLVLDCSRLSASVAAIAHGFVSFDPSINFAGLILNRVGSDRHLQLLQNSLKCINSPILGVFRRHQNISIPDRHLGLVPTDEMPDLDILINDLANLAKTCFDWEKLLPILKVENEIYQYLLSSQVCSDQTIYLPSLVANNFEKKRSEILIGVARDRAFNFYYQDNLDILEELGAKILFWSPLKDENLPVGIQGLYFGGGFPEVFAQQLSENFMVRKAVKEAIISGMPTYAECGGLMYLSEAIIDFNSNSWEMVGILPTKAVMGKSLKLGYRQAISNIDTPLLVANTQVYGHEFHRSELTEAPPMPLYKMWRVDEKKNQSQATFEGWNFEIVHASYLHLHWGNRIDIPRRFIEQGSRGVREWGRSQNKNN\n>UniRef90_A0A1T0CQ58 Prevent-host-death protein n=2 Tax=Moraxella TaxID=475 RepID=A0A1T0CQ58_9GAMM\nMMIDFATLPITVQERIVNLQEPVSILKDGQVVAVLSPKSYDAKFDFARIQASVSSGQVAVPKTATADIDAFDRWLADVAP\n>UniRef90_C5M2E7 Topoisomerase I damage affected protein 11 n=1 Tax=Candida tropicalis (strain ATCC MYA-3404 / T1) TaxID=294747 RepID=C5M2E7_CANTT\nMDIDEQLRYLALKEMCVVEIKDHITNLNNKLNEHQKELHHLREIIQRSLYKELSTGNSLAKATETRPRQNSNPRDEAIARTRRRRSSLFNDHHNKDFVTPPINDTTTNNTTPATVTTTANPESTSRIWSGLSKPLNLIQQFDTLIQNEFEKSLLSEKDQQVHNDQSRKLEKQISHQSKSSEGSISSIGSINSPLQSKSVNPRPIPMPKPYHNKPSKSDDMMQSVSSSLWSFVNDVKANVLSSLQEDERERKISGQNPPARMYNLDTGSTVDISQTSIAVEDDESETELLEPLASDEEDNVIETLDLSMYKR\n>UniRef90_A0A6B8KL02 Type VI secretion system contractile sheath small subunit n=1 Tax=Methylocystis heyeri TaxID=391905 RepID=A0A6B8KL02_9HYPH\nMARPSDSGQKFISRNRPPRVQIVYENPNNAEEKIELPFVMGVMADLSGNASGVEKQEVAQRKFLDIDMDNFERRMEAISPGVSLRVANKLADEPGEKLSINLKFQRMEDFGPAAIAEQTPALKKLLDARTQLANLLRYMDGKVAAEEQLRKLLKDPQLMAALRQHFPDQQNNEQ\n>UniRef90_A0A1Q3DY06 Dipeptidyl-peptidase V n=2 Tax=Lentinula edodes TaxID=5353 
RepID=A0A1Q3DY06_LENED\nMVHSSFQFKEGADVFTPKDLMELGRPGVGVANHAGDFVIIPYSKYSFEEKKNHKSIYVAPLESTVKPFKLPLVEGGEAFWLNGKTLAYVVESEQKNLEIFALDVLYQPSTNDSAAVLSTNAPILLGSFPTTSASNFRYSTDGYLVFSDSVYSDGNLTTVKEQDEAWENRGNTALVYDRTYERHWDHWVGPKTQSLFSVRLVQDPNHMWTFGSEFVNLLAGTGHSSPVEPFGGTDDFYVSKQSVIYTTLDPAFEEERAWHTKQNVYIVSITAAGKPRELTSGSQGATRSPVLNDAGDKAAWLELDEDGYESDRAKIVIYDLKKDVRFTLTQKWDRSPGSLAFSKEGDFIYFTADDHALVKVFVLPIPSTPAKSTTDPSLSPKYLNPVTIVEDGASSGLQTLPYGRILISKSSFTSPNDVFLVKGLDALQAQITQSNGTARFTGEIDQVTNFTAPDLEGKNLSKGENFWFKGANDIDVQGWILKPKGWKHGEKKAFPILLLIHGGPQGAWEDQWSTRWNPNVFAQQGYFVVAMNPTGSTSFGQAFTDAIAGDWGGKPFVDLQKGWKYVLENYPEVDADRAVAAGASWGGYAINWIQGHPEFDFGFKALVCHDGVFDSNYNGFSTDELFFFNHDWRGRPWDKNSEEVLRKFNPANFVHKWSTPQLLIHGSKDYRLPETEGIGAFHALQQLHIPSRLVIFPDENHWVLNHGNSLKWHYEVLRWFDQFVGKKD\n>UniRef90_A0A2N1ZL77 DNA repair protein RadC n=1 Tax=Gammaproteobacteria bacterium HGW-Gammaproteobacteria-12 TaxID=2013794 RepID=A0A2N1ZL77_9GAMM\nMTAFSPSRAACASRIGGWAGYRPATAEQILDAARKVIDQKVQRGAAFTSSELVKDYLIAKLGGFEHEVFAALFLDAKHRLIQYVEMFRGTIDSASVYPREIVKEALRLNAAAVIFAHNHPSGIPEPSQADKVLTQRLKEALALVDVRSLDHIIVAGQRTVSFAELGLL\n>UniRef90_UPI0021149202 TonB-dependent receptor n=1 Tax=Pseudomonas sp. 
LD120 TaxID=485751 RepID=UPI0021149202\nMDNLSLTLGNRFDHSEKYGNHNSPRAYVVYHPHPDWAVRGGVSKGFRAPSLKEGSAGAATESRGRGCGSLRPLGYVTGSCWMAGNPNLMPETSTNKEIGVAFEHDGWEAGLTYFHTDFTDKIEYGPLGQYQGRWWTMLENVDKARTRGWEGTTRVPLGDSVTWRTNATYMLESRNLSTGEDLISSPKLSAFSALDWQINDRLSTELSAQHVGKQRGMGNDFVQSYTTYDLTANLAVTKWLTLNGGVQNLMDKDLRDGSTNFYVPGRAFFAGATTYF\n>UniRef90_UPI0020420B8D Na+/H+ antiporter NhaC n=1 Tax=unclassified Staphylococcus TaxID=91994 RepID=UPI0020420B8D\nMGKKSENSDKNHKTKKPLGLTSALVTLTIMISTMLFTVAVLEKEPHIPLMIGTAVAILITMLHGYEFSEVEEMMYKGIRHALPAIVIIILVGLIIGSWIGSGVVATMIYYGLQLIDPRFFLAVVLILCGIVALAIGSSWSTMATVGVASMGIGISMGISPGMVAGAVICGSYFGDKMSPLSDTTNLASGLTDVDLFEHIKHMFYTTIPALIIAVVAFFFMGLQFGGKHFDTKKVEGILTTMQDNFTISPWLLLIPLIVILLVVVKVPAIPAICVGIILGFFAQIFVQGDSLTDALTALQTGYKIDSGNKMVDELFTRGGLESMFYTISLTLVAMTFGGVLEYSGMLSALINVILKFAKSTGSLIASVIVSCIGTNFTCSEQYISIIVPSRMYASTFKEKNLHPKNLSRALEDGGTLTSVFVPWNTCGVFIASTLGVSVMEYAPFAIVNYLVPIISIIYAYIGFKIVKLNDDRDTSLKEKPLSQSKPV\n>UniRef90_U6R8E6 Transposase n=4 Tax=Phocaeicola massiliensis TaxID=204516 RepID=U6R8E6_9BACT\nMRYALDIIKKWQFNFPILKYVTGKSGYNVKIRKLLDQIDREVKIFDKDSFDNIYNALYTMGSSKLCRKTHLDMLTKVQVNMYVSGHHKEGSSAVKHNSSLILKDRFIFMCAAYKQLNVIEK\n>UniRef90_A0A534PU07 MarR family transcriptional regulator n=1 Tax=Deltaproteobacteria bacterium TaxID=2026735 RepID=A0A534PU07_9DELT\nMRLLWAVDHSLQSASKRMESTYGITGPQRLVVRIVGRFPGIAAGRVAEILHVHPSTLTGILKRLEARSVLQRRSDPRDARRALFGLTAKGRKLDSVKTGMVEQAVRRVLTRDGEKVAAAQEILAALAEELEIEE\n>UniRef90_C4GAH0 TonB-dependent receptor n=2 Tax=Shuttleworthia TaxID=177971 RepID=C4GAH0_9FIRM\nMSRADFRAENLGYLAQSQEIAGAVSGLNFGEQSGIVIIENVPQRSEDNGYKI\n>UniRef90_UPI001F50FB05 type I restriction endonuclease n=1 Tax=Enterococcus faecium TaxID=1352 RepID=UPI001F50FB05\nMIRVLGEGHNQWTYRPDLKSEEDLWVNLRQKIISNNQAELNDSPLTDKEFETIKTELLLRTKTPFEAAKWLKGENGMARITIEREDPQLGSASLILYSNQDIGGGISTYEVVHQIAKRGSNIEARDRRFDVTLLINGLPIVQIELKQVTA\n>UniRef90_A0A061J7E0 Secreted protein n=2 Tax=Trypanosoma rangeli TaxID=5698 
RepID=A0A061J7E0_TRYRA\nMSPRRVCLSLQLHLCGAKLPFSLTSGGGCRYAHTGRPSTSFLWFSHKREKAARNVTFPPEATCSPSRAASKMSVVGGTLASSSSPPLLLDPPFTPVPGESQALRQRTNCGAPSFLLLYVCGTCKSPLFCSSEYAASSSLGQHSSGWPSFTAPVCNSVLQLRSLLQRSAVQEGGQTPLTATLAARGLRVEGEMRRQTRGGGCERLRPRTWREECLRDENKRSDPTVLEGCCTKCGRAVCRVVMERRRGVKYVVNPTAVNAELTECSDPGVASTPHPSQLPH\n>UniRef90_A0A4Q8QWM3 Lipoprotein n=4 Tax=Bradyrhizobium TaxID=374 RepID=A0A4Q8QWM3_9BRAD\nMLLRTCLAVIAALIVSASSAQAQAPTTHQTQPVQFRTLFKVLPDPRGEFVRQCAPHMLGRWAHPEAVCGCLHDYAAATVEDPDLREALLRGISETGVPTIETDWVPPSKQSEIGPTFTKIAKPTLQCMFDPATE\n>UniRef90_A0A7W2L3H7 NADH:quinone oxidoreductase n=3 Tax=Pseudomonas TaxID=286 RepID=A0A7W2L3H7_PSEPU\nMNRFCLLVAGLAPLLGATSSVAQGTAIGMSMLVLILAHQVLLSPLRSQLQGARYWLASLLIVAALASCLQLVLRAWALPLALSLGDFPLLIGVQCLATDSLLPNQGRWRQLLRYLSGLLFISVLLGASRQWLAEGLGLHLASLPSGALLLLGLLLALYNCLRPGPARQGKR\n>UniRef90_A0A2V8UVF1 PNPLA domain-containing protein n=1 Tax=Acidobacteria bacterium TaxID=1978231 RepID=A0A2V8UVF1_9BACT\nMAGVWPKRYHFVDGGYYDNYGVATLVEWLEDVSHAQSVQPEILLLQIRDSPENGPPRPAEGQAGFLSQMLAPFFTIFRFRDAGQIAHGNLEYCSRQSLETASGVLLSPGLTTPRR\n>UniRef90_A0A839QHS3 Uncharacterized protein n=1 Tax=Paeniglutamicibacter cryotolerans TaxID=670079 RepID=A0A839QHS3_9MICC\nMSKPRNKKNTARPALRAAPAPVVNQSTQRTPEQARGNGNVIVLAAVGATILLFWYFHLLVLNQMSDLSGGLAMPDQMMGGYSVADIEALRAAMNSDAIGQLNYVHKTAGMLFPLFLALTTMLVVNLHTVRGPVRWVLWAVPMLFAIVDLWENAAIDALFNGPLDPGAVSLASTLTTISWVLLFATAAVLVGVLIASFITTFKAKWSEAGLS\n>UniRef90_A0A100YU56 IstB_IS21 domain-containing protein n=2 Tax=Atopobiaceae TaxID=1643824 RepID=A0A100YU56_9ACTN\nMGIVGSMGDFHADTGRDGRETRPQVLITPEEAIARGFAREAPPPVRCAHCGRQLRPLGIPVFGSIAWVSHEPCECDGSVRERMEEEQRILEERAMERERRLDRSGIPLRFRRAAPTEAQCIAYADAISGSTSDGLFIHGPVGTGKTHNAAAVAIAASDRGLRTVFTSAIAIFSNIRETFDGGGSSKRALERYASCEMLVLDDLGKESSSRWSLMTLFTIVNARYEGMRPTVITSQYTLGQLRARLASTGEAETAAAIVSRIAAMCADVTLSGPDLRGDAWKPLGMQTMQRTCDVAKRSKLDNFR\n>UniRef90_A0A7H8S915 ATP-binding protein n=1 Tax=Lentibacillus sp. 
CBA3610 TaxID=2518176 RepID=A0A7H8S915_9BACI\nMVEALKQTNFTAEPGELIVVVGPSGSGRVHPDDCRRSSNAESWEVINKHNITQMKEKKRSNIRLHEIDISGIPIWSISDSG\n>UniRef90_A0A834H4E1 Transmembrane protein n=2 Tax=Rhododendron simsii TaxID=118357 RepID=A0A834H4E1_RHOSS\nMIEDRRGGGGAPHAAIFAVVVVAVVVISVVLGDQGQVLTDFIAELLSPVGLLLLPIGLLLVIVFLSSDAGSAFSGLFSTGEPDTIHRVSGSPVGVALFLALLLFLLYSRVSIFGGDDGSDE\n>UniRef90_A0A830HN61 MYND-type domain-containing protein n=2 Tax=Pycnococcus provasolii TaxID=41880 RepID=A0A830HN61_9CHLO\nMSTGKDVSLVMELCHSSPLGHVVLHEVLRTTVANPDAWPALFPAEERSDGDDDDARHCQQPWNRAISLLRTMSHVSQLARSVATADALWKPAVHRLFEEKAFVCTEALKLKEEGKWRKAYFAACRRVREPRLTQGELCSINFHKRMKKCAGDAWLLRDPYWVTHGARCATMRFLDDGHAETSGEQVSEAAVPTNDEGANERADTAVDNGAPTTLAQLHPPPGAVSTRRKWRFSETGGGRGGPLGAFVRLSDGVREFPTFVVSFHRDTWSPYLESCWAVAASWQLKPEGEDSCMDDANLAISVDAQKAEALAYNCGLPMPEVRSPLEMKNAIAEILEKRDEDQRRLLHAMGIQDEEDDEDNRETTAVEEHDVATTSAGASATPTNSTTTNFDAIIQANRDFLSSFDSRWNAVKRRFDRAINRSIATIALGMTGDVDHAEALLTGSQARRSGGGADERRFEEDEEEQ\n>UniRef90_UPI00207B9FB4 hypothetical protein n=1 Tax=Streptomyces hygroscopicus TaxID=1912 RepID=UPI00207B9FB4\nMCGICPSLRLPGGAFDVHLRPSAACPFDASTGHRFTEAGVPVCVHPERVGLPAAEYATAGLPLPWETPPPASPDEVAVWVRAALDAAPPDACAEVIERATEILRAADPELDVVAVLRTALS\n>UniRef90_A0A386HU81 ATP-binding protein n=3 Tax=Arachidicoccus TaxID=1769012 RepID=A0A386HU81_9BACT\nMPELIVGRDAEKKILKEVLDSKEAELLAVLGRRRVGKTFLIRNYYSKQLVFECTGMHEVSLMEQLSNFSNALQQAMKLQVPLAIPDSWLQAFTFLSDFLQAKPEKQPMVILFDEFPWLHTPKSGFLAAFGHWWNNWASRRPQLKVVICGSAASWMTENVLHNRGGLHNRVSRNIRLLPFSLKETEAYLVSRGISLDHYQILQLYMAMGGIPQYLKQVGRGESATQVIDKLFFEKGGMLKTEFDVLYRSLFNNASHHESIVRQLAKRAKGMSRAEVIKACGLTTGGTTTRLFEELEQSGFISQSIPFEKTSRDAIYKLLDEYSLFYLKFIDRARATGTGTWHKLAQGQSYNSWSGYAFEAICQKHIQQIKEVLGIGGVYTEASGWRYTSKTGETGTEIDLLLDRQDRCINLCEMKFSGQEFVINKKYASELDNKVNVFKEQTGTKKTIFLTMITTYGTKQNIYYTGRITSEVKMEDLFR\n>UniRef90_A0A6I6M0J7 PEP-CTERM sorting domain-containing protein n=2 Tax=Pseudoduganella flava TaxID=871742 
RepID=A0A6I6M0J7_9BURK\nMPMKRLATIAVLGAALTAAFASPAAHAATSVATLSGLHVAIIDLTPDDGVAPSLTFMSTGGLVSAGVGTAGGMDTVTDFLRSGNVTAHNAIGGTASVAALYEGQVQAMGSVGNYGDFISQSWLYSNFTLGANTQLVLTGHASLGTDFAAGNPNNVGSASVYIEIVDDQDGGGISLMETYSNEVTSYTAGPVGANDDFTLTFTNASANALLARMTLSAHAEGLVSAVPEPSTWLMLGAGLALTGTLARRRRAQQAN\n>UniRef90_E0RVU6 Flavodoxin/beta-lactamase domain-containing protein n=3 Tax=Butyrivibrio TaxID=830 RepID=E0RVU6_BUTPB\nMNGVKKVTDGIFWIGGSDRRLERFENIFPIPEGVSYNSYFIDDDKTAVFDTADITISDQYLENLKDCLDGRKLDYLVVLHMEPDHCSLISTVTGLFPEVTVVGNAKTFQIMEQFFPEAAGFNKLEVKEGDSLSTGNHNFKFVTAPMVHWPEVLFAYDDTSKALLCADAFGTFGALDGGLFADEYDFEKVFLNSARRYYANIVGKYGMQVQAVLKKAQGLDIQMLLPLHGPVWRKDIAWFIDKYQKWSTYEPETEDIVVIYGSLYGHTASAAEAVAASIRNKTKAGVKVYDVSGTDVSYLIGEVWRCKNIVIMCPTYNNGIYPPMESFIADMAALGVQNRSFALAQNGTWAPVTVKLMTEKLQTLKNVTILEESLTIKSALHKKDTDSLEAFTDAIVKA\n>UniRef90_UPI00034ADB16 hypothetical protein n=1 Tax=Wolbachia endosymbiont of Wuchereria bancrofti TaxID=96496 RepID=UPI00034ADB16\nMLTEISIDDLVRAKPMAGKKTVVSFTERENIREMPNKPQKHKFIANIIYSNTSTQTGDCILKFHPAA\n>UniRef90_A0A3P8ZCD7 calcium/calmodulin-dependent protein kinase n=1 Tax=Esox lucius TaxID=8010 RepID=A0A3P8ZCD7_ESOLU\nMATIVTSTRFTDEYQLYEELGKGAFSVVRRCVKKSSGQEFAAKIINTKKLSARDHQKLEREARICRLLKHPNIVRLHDSISEEGFHYLVFDLVTGGELFEDIVAREYYSEADASQCINQILESVQHIHQHDIVHRDLKPENLLLASKMKGAAVKLADFGLAIEVQGDQQAWFGFAGTPGYLSPEVLRKDPYGKPVDIWACGVILYILLVGYPPFWDEDQHKLYQQIKAGAYDFPSPEWDTVTPEAKNLINQMLTINPSKRITADQALKHPWICQRSTVASMIHRQETVECLRKFNARRKLKVRYFLYLYMSPPSFLTPPFCLNPVIYIFSLFTPLSLLGSDPHHNAGVKELLRWVCLPPSLQLQSGGRSELYSILGSPSIVNTILREGSTESCNTTEDEDMKEMETRGGLRDGDSQYRHSRGENGFYIAVSLNFCLNSSPPDLLSGFLFLARKQEIIKITEQLIEAVNNGDFEAYTRICDPGLTSFEPEALGNLVEGMDFHKFYFENLLSKNSKPVHTTLLNPHVHLIGEEAACIAYIRLTQFVDAQGRPRSSQSEETRVWHRRDSKWLNVHFHCSGAPAAPLQ\n>UniRef90_UPI001A9C264E hypothetical protein n=1 Tax=Intestinimonas butyriciproducens TaxID=1297617 RepID=UPI001A9C264E\nMRIIENADKEFAAEMHKAVKDNNGYCPCFIEKTPDTKCMCKEFREMEEGACHCGLYIKVK\n>UniRef90_UPI0003B3D06B CCA tRNA nucleotidyltransferase n=1 Tax=Flavobacterium antarcticum TaxID=271155 
RepID=UPI0003B3D06B\nMNYSKDLQNPIFDVIAKASEQLNVESYVIGGFVRDLLLNRTAKKDIDIVAVGSGIELALKVSELLPKNPKVQVFKNYGTAMLRFEDTDIEFVGARKESYNFDSRKPLVENGTLEDDQNRRDFTINALALSLNKTNFGALLDPFNGLVDLEQKTIKTPLNPDVTYSDDPLRMMRGIRFASQLDFEIAAESFASITNNKDRISIISGERIVEELNKILMTDKPSTGFLLLYKSGLLDYILPELTDLNQVEEIEGHTHKNNFYHTLEVVDNIAPNTNDVWLRWAALLHDIGKAPTKRFTKKQGWTFHGHEFLGGKMVKKIFERLHMPLNQKMKFVQKMVIMSSRPIVLAQDEVTDSAVRRLVFDAGEEVDDLMTLCEADITTKNPSKFKKYHNNFNLVRQKIIEVEERDHVRQFQPPISGEQIMELFNLKPGREIGTLKESVKEAILEGHIPNEYEAALEFVTKKALKMGLNKD\n>UniRef90_UPI001912B9C1 DUF86 domain-containing protein n=1 Tax=Cyanobacterium sp. IPPAS B-1200 TaxID=1562720 RepID=UPI001912B9C1\nMVFALVKAIEIVGEAAGKVSKEYQINHPEISWTAMISMRNRLVHAYFDINKKILWQTLKKDIPELVNILTELLDE\n>UniRef90_A0A8J2SN30 3-isopropylmalate dehydrogenase n=1 Tax=Pelagomonas calceolata TaxID=35677 RepID=A0A8J2SN30_9STRA\nMKLSLALLAACSDALIAPPAPKPTKTQLRAVAAPQDSYKITLLPGDGIGPEITTATVKALVAAGKTKGVTFDFDEQLLGGCAIDKEGTPWPDKTLKSCQAADSILMAAIGGPKWDGNPRELRPETGLLAMRQQLGLFANLRPAKAIPQLLDASSLKREVVEGVDIMVVRELCGDVYFGKPAGIYTDDAGVRWGQNNMIYSEPEIERIARVAMDVAQKRQGRCCSIDKANVLDVSQLWKDVVIRVHGECGQGVELSHMYVDNAAMQLVRWPKQFDTIVCGNIFGDILSDEASMLVGSLGMLPSASLPSEGPGVFEPIHGSAPDIAGTDAANPLAMILSAAMMCQYDLLQPDLAKLLEDAVEAVLDAGYRTRDIVNEGNADETLVGCKEMGDLVAAKVAELAA\n>UniRef90_U4L0U5 Uncharacterized protein n=1 Tax=Pyronema omphalodes (strain CBS 100304) TaxID=1076935 RepID=U4L0U5_PYROM\nMMVNSAAFADRQSIPLLS\n>UniRef90_A0A8I0SUD4 Octanoyltransferase n=1 Tax=Magnetococcales bacterium TaxID=2026759 RepID=A0A8I0SUD4_9PROT\nMVHPPENTHPYDLMRLGQMDYAQALAIQQQRVETLIAHGGPNLLMLLEHPPVYTIGRSGKSGEILDAIPTREHINIIATDRGGRVTYHGPGQLVAYVIRDLRPDTGRILDHVRRLEETIIGTLACFGILGTRERANPGVWVGNEKIAALGVRIRRGITYHGIAINRDPDLDHFSGIIPCGIRDRGVTSMARLGFKTTAEELEECLLAAFAKVFAARWTQ\n>UniRef90_A0A3D9YY19 Heat shock protein HspQ n=2 Tax=Methylovirgula ligni TaxID=569860 RepID=A0A3D9YY19_9HYPH\nMNVKPRKAKFGIGQIVKHRKYPFRGIIYDVDPVFANTDEWWLAIPEEVRPRKDQPFYHLYAENADTEYVAYVSEQNLLPDTSGDPVRHPQVEEMFTRADDGGYRVKTVRLN\n>UniRef90_UPI001E452D4C zinc metallopeptidase n=1 Tax=Aegicerativicinus 
sediminis TaxID=2893202 RepID=UPI001E452D4C\nMGIGLGYYILIGAIALVSWAVSAQLKSKFKKYSQVHLQNGMSGKEIAEKMLADNGIRDVQVISTAGQLTDHYNPKNKTVNLSEPVYHQRNAAAAAVAAHECGHAVQHATAYSMLQLRSKLVPVVSITSQMSQWLIIGGLVLGAAAGVGLGYWVAVAGLAMMGMATLFSFITLPVEYDASNRALAWLENKHMLNREEHAAASDALKWAARTYLVAAIGALASLIYWALQIFGGRD\n>UniRef90_A0A5C5TAF6 Sorbosone dehydrogenase family protein n=1 Tax=Reyranella sp. CPCC 100927 TaxID=2599616 RepID=A0A5C5TAF6_9HYPH\nMRPIIKKVLLGTVAIIAIVAAAAAFLIRGDTAKLPDEASVGPNPTLPQPTRSLVPTVSIATARGWPQGAKPVPAAGLSVQAFAAGLDHPRWLYVLPNGDVLVAETNAPARPQEGRGVKGWIADLLQNRAGAGVPSANRISLLRDADGDGVAEVKTPFITGLNSPFGMALVGQDLYVANTDAVVRFPYTVGATRIDAPATKIADLPAGPLNHHWTKALIASPDGAHLYVTVGSNSNVGENGLDNEARRAAILRIDRATGQIGVFASGLRNPNGMAWQPETGVLWTVVNERDELGSDLVPDYLTSVKEGAFYGWPFSYWGQHVDARVVPPRPDMVAKAIAPDYALGNHTASLGLVFGAGTSLPAMYRSGAFIGQHGSWNRKPRSGYKVIFVPFASGRPSGAPVDVLTGFLSDDDAAFGRPVGVVTDRTGALLVADDVGNVIWRVTSIGR\n>UniRef90_A0A1S1R6I4 Secreted protein n=1 Tax=Frankia sp. BMG5.36 TaxID=1834512 RepID=A0A1S1R6I4_9ACTN\nMVEAATASGAGIAKAADRAGPVLDRLDDALVPRTGRALEAVVGAAAATSRTVTAGLLRLALRTRLLPGPPEPPAPAPRPRTADGGSGPDAGSSPSPAAARDASASAVAEGPSVGRALLERGARIAVLGLVAMIVLSAAAALLPGMDGQPRTEPASPPPGGAPAGQADAAVVPSVTIGPTAGESTADYVGGADQSLVALAEAAPEADLLAVVSLNDYRTPDGLQALLATYRVTQVFFTVPGSGTVHQAEVRTPVDDVLAALAAQAAESSRRAATATDPAARERASAQAQTMRGGRSCSCLFAAVVRASAARLLALRQDSSVRVIDAAPPATLENAVRFIPVTPESR\n>UniRef90_A0A8B6C0H3 RING-type domain-containing protein n=2 Tax=Mytilus galloprovincialis TaxID=29158 RepID=A0A8B6C0H3_MYTGA\nMTDIPPNVSLPLLGIGLISLLLSFIFCIYMWRLRCRAREERGYNRIQFKEKNKKFSSMCAVCLEEFRNYEYIAICRCKHCFHMNCLLQWLKHRNFCPMCKATVQRVPSGERSSLIIMPQQAVPSTSNEPPVEGAQNV\n>UniRef90_Q0RVU7 Biotin carboxyl carrier protein of acetyl-CoA carboxylase n=1 Tax=Rhodococcus jostii (strain RHA1) TaxID=101510 RepID=Q0RVU7_RHOJR\nMSDTHTLKTSIPGIFYRRPSPSEPVYVEVGQEVATGDIVGLVEIMKSFHSVPSDLAGTVVRFLVEDGAEVSPGQDIVELARS\n>UniRef90_A0A8H6B9I7 HAD family hydrolase n=4 Tax=Dekkera bruxellensis TaxID=5007 
RepID=A0A8H6B9I7_DEKBR\nMRPRMPKLITADAYGTLYAPRFSIPKQYNDVTARFGVVIPENQLEKKWLNSYHTVKKTYPNYGKAAGLTVDEFWRKVLVRIYGKCQEHPEMIGMIIDKLGKKESYKVFRDFVSLAEWAVWEKEIPFCVASNADSGVTHLVIKEFGMETFLDSQDIYLSYDLELWKPNPEFFNRIIDDQLARLRGIRSTDPNYLEERRKLLQSSWHVGDEYENDVKCAMAAGMGAILVDRSITNPELAIQKRGERFYVVSSLDRVRQIFEK\n>UniRef90_A0A5J9WI98 Phospholipase A2 homolog 3 (Fragment) n=1 Tax=Eragrostis curvula TaxID=38414 RepID=A0A5J9WI98_9POAL\nMASVLAFSRCSLLLLLLLLATTASHALNVGNLLGTPPAGSQGCSRKCESEFCTIPPLLRYGKYCGILYSGCPGEKPCDALDACCMVHDHCVAAHNNDYLNTRCNENLLRCLDSVSPAGPTFPGNDCDVGRTKFVIRGVIETAVVAGKILHKRDDGH\n>UniRef90_UPI00200ED720 hypothetical protein n=1 Tax=Serratia sp. arafor3 TaxID=2824122 RepID=UPI00200ED720\nMMRYKDIPAEEQQNGPPNTDPASIMHTRLVIGDNVIMASDSCPADPTGATHRAYSLSIRSENVEQGGSITMPFQPAFWAKGFGMLTDKFGVNCRTV\n>UniRef90_A0A2W6USA3 Glycosyl transferase n=1 Tax=Microbacterium sp. TaxID=51671 RepID=A0A2W6USA3_9MICO\nMSKEPRVVLVAVPLMARSGVYRSTHDLVRAASAAGHQWQALIGMRPQASGDALATPGVREVPFDARGVGGISQIRALIDSVPEVRDADVIVSMITQTDIAVSRARAREDRGWIAWVRGKPWPAAGEQNLARRLLLRAWETRALRSADAVWATTPVLADEFASACQAAIVPAGIPSSRRIAHGEDATSPLVWAGRVDIDKRPELFSRIVELTGHPGRLYGDGPLKDRLASRRVTGLDWAGWRPSGELWSDASVFVGTSSREAFGRSAVEAAAAGIPIVIAREYGAAPLLFTDETLRRACVIDSADPEAWANAVRALLTDRQLRMAVSDHVHSNAQTLTIEASVDAAARRAAALLEGGCK\n>UniRef90_A0A327NX72 ISXO2 transposase-like protein n=1 Tax=Algoriphagus yeomjeoni TaxID=291403 RepID=A0A327NX72_9BACT\nMNIINFVQYFPDEESCEVYLKSYREKAGIRYKTCKSITKHYWFSTGKFFECSCCRRRSSLKSGTVMERSKLSLHVWMTAFMLMAATKKGFSCLEFQRQLGLCRYDTAFRLMHKIRVVMGKRDALYTLTDMVEMDEAYIGIATDKKVKENLKRGKGSQRKASVAVSAESIPLEDLETGKTSRFCGYYKMEVLGKVDGEHAEKFIKKNTSGEIVLFTDKNTAYEHIEDIVETHFTVISGKESTNDTLQWVHKAISNLKRKLLGINHMITYKYLQNYLNEFVYKLNRRYFGDRLFDRLIIAGIYPYVQ\n>UniRef90_A0A3N1WFC1 D-alanyl-D-alanine dipeptidase n=1 Tax=Erwinia sp. 
JUb26 TaxID=2485126 RepID=A0A3N1WFC1_9GAMM\nMDDIQLTDIATSLPQVKIDLKYATADNITGQPIYCEHRCLLHPDAAAALVRSAHIAAIAGFTLLIYDAYRPQKAQMNLWQACPDPDYVIPVSQGSNHSRGTAVDVTLIDEQGSIVDMGSGFDEMHERSHPWHPSVSARALRHRLMLSAIMLEGGFKGIATEWWHFELPGAADYPLLTDIFDCYPPPSAA\n>UniRef90_A0A7J3I7R8 Na+/H+ antiporter subunit C n=1 Tax=Ignisphaera aggregans TaxID=334771 RepID=A0A7J3I7R8_9CREN\nMSDLLISLAFRTAMIAFVFNTAIALYGVLSRPSLIKKFLCLIMFTDSINIFAIFIGFRYIPGSYPSPPILEDIPTSVRDIERLISMAVDPLPQAMILTAIVIGIACNMFLLSLILMYYKHYGTTDIHVTEEAEAYEETLE\n>UniRef90_UPI000C1F926A ATP-binding protein n=1 Tax=Limosilactobacillus fermentum TaxID=1613 RepID=UPI000C1F926A\nMDFLKFEDLSFSSAFSEPKEDIHLEYKTATWKLPKNFWETVSSFANTDGGLIVLGVKEDKDNHKYEITGVDDPIVVRQEIFNGNSNSECLSSPVIHDSDVKLVDCFDRTIIEVLVHPEQYNKRPLEAHGIAYVRTDDGDRKATEEQLKYFLVEHQQEIDTRLLRNFDLEDINSLDLDEYVTVLRKNTNTRYKDLESLAFDLGVFRRDRTSNGKDRLLTEGGLLFFGKYKVKSKMLV\n>UniRef90_UPI001C270FE8 TRAP transporter substrate-binding protein DctP n=1 Tax=Desertibacillus haloalkaliphilus TaxID=1328930 RepID=UPI001C270FE8\nMKSFFVIFCLFIISIVTTACVQDGSNNNGSQSSENSEDTITLRVSSSLSPQNGWWAGFFIPWMESVEEKSEGKVQFDYFTAEELLSVGEELQGMREGTIDIAAPLWTVYDPQRFPLSEVTMLPLTDSDPMMASLAYSELVQSELELVDGKTYADYEFVEKGIKALPIPTTEQYVISTKDYEFNTIEDFEKVSLRSPSRVHEVFANEVGINTVTLPSTELFDSVNRGAMEGSFFSISDWTGYGMQDVFNYTLEGINLGHYSGVWAMSEDKWNSLPKEIQDIMIEAAIEQIPGGAQLWMDRSIENKENSIEDGGVFATTADLEPEAEEMVLQGMENTWYEWIEMTESNGHPGTQIAKLWRDLIVEQGGTVPESIMNLE\n>UniRef90_A0A140IHG3 Sodefrin-like factor n=1 Tax=Cynops pyrrhogaster TaxID=8330 RepID=A0A140IHG3_CYNPY\nMRAIIATVVLLQALITGDCLLCEQCFALQTSSCSGIFKQCSPDVTHCVAGLENNTLGTHVILTAFKDCLDPSQKAACGREVSFTAPAASLWTSRTCCDSDFCNGGDVQVPPPDDTPNGYICEGCGSDQSAKPCTATEYVQCSGKQNACGTFYGTASRPGKTGEEYTFKGCTTQDFCIAGIFHMAGMQAYDYYVLKCSPALKV\n>UniRef90_UPI0021C67275 ABC transporter transmembrane domain-containing protein n=1 Tax=Mycoplasma gallisepticum TaxID=2096 RepID=UPI0021C67275\nMLGVAAVGFTFGYLGGRSIIIASVEFAKQLRVNIFERYQSFSVKNTDKFEKASVLTRMTTDINFIHQSIQSGRTAIRGMSVFLFSLVLMFVTS\n>UniRef90_A0A5P2U3Z0 MFS domain-containing protein n=2 Tax=Kluyveromyces lactis 
TaxID=28985 RepID=A0A5P2U3Z0_KLULC\nMAVKEEVLGKQAVSTHAVAANEHDLDEKQQEEFLNEYGLPDKLRFTRSLVLRKTEILAQQYDSWYWKAVLLFSVFLCSYGYGLDGSVRSVYTTYATNSYNTHSLLSTISIINLVIGASAQVFFARLSDVFGRLTLLIVATVFYSVGTIIQSQAYDVQRYAAGAVFYNVGLVGVVLQVILILSDFSSLRWRLFYTFVPSWPFIINMWVSGNVVDAANPLENWSWSIGMWAFIFPLTCLPLVCCILHMRYRASKTEAWRHLKVEKTYYQSHGLLQTLIQLFWKLDVVGVLLLTVTLGCILVPLTLAGGVSQKWNNPHVIAPFVLGFVLLPMFVVWESKWALDPIAPFKLLKDRGVWSALTIQFLIYFVYQMAVGYLYTILVIAVDESTTSATRITSVYSFTAAVASPFFALVVTRSKRLKPYIITGCSLWMVAMGILYHFRSGKDSDKGIIGGLVLWGLTSTLFTYPVTVSLQSITSHENMASVTALNYTVYRIGGAVASAASGAIWTQLLYKKLLKEMNGDAALATAAYGSPFDFILDYPWGTPTRDAMVESYRYVQKYEVLVALVFTVPMFILSMFLRDPPLTDDQAQENLKEGEYINTEHDDPIAAWMDDKWTRLTGGRKKE\n>UniRef90_A0A2N6BMK7 Serine hydroxymethyltransferase n=2 Tax=Deltaproteobacteria bacterium TaxID=2026735 RepID=A0A2N6BMK7_9DELT\nMILIASDHGGFEVKEAIGEHLKARGLEVEDLGTTNTDSVDYPDFAKKLARRVADEPQSKGILICGTGIGMSIAANKVPGIRAALVADTFSAKMAKEHNNANVIAVGGRTNTPEEAKSLVDAWLDAEFEGDRHARRLNKISQMEVSCGVARSISAEDPEVFSAMMGELRREEDTIVLIASENYASTAVLEAQGSVFTNKYAEGYPGARYYGGCEFTDKVETLAIERAKKLFGAEHANVQPIAGSAANMAAYYALINPGDKVVSMSLAHGGHLTHGAKVSFSGRLYDIVHYFVEEDTGKIDYDKLAELVKREKPRLVVAGASSYSRTLDFQRFREIADSVGAYLMVDMAHIAGLVAGGSHPSPVPYADIVTTTTHKTLRGPRGGLILCKAKYAAAVDKAVFPGLQGGPLVHTVASKAVAFREAMTDGFKQYADMVVKNAARMAEGFKKAGYDVVSGGTDNHLFLLDLSSRGLTGDAAEKSLDRAGITCNKNAVPYDKLPPTVTSGIRIGTPILTTRGMGEEEMDKVVELIIRVLENVGDAKVEASVREDVAALCRQFPFYADFLAD\n>UniRef90_A0A2V8W5K0 DUF393 domain-containing protein n=5 Tax=unclassified Acidobacteria TaxID=305072 RepID=A0A2V8W5K0_9BACT\nMISLVSEYTDGKGRHARGWLFFDAECKFCTRIARWLAPILEKRGMALAPLQDPRVGALLGLAREDLMREMQFLLSDGSRFGGADAAVALAREIWWGRPLVWISKIPGMMEILRKGYHWVAASRSCAAVSCPANEPSPRV\n>UniRef90_A0A0A9RIL1 DUF5753 domain-containing protein n=1 Tax=Arundo donax TaxID=35708 RepID=A0A0A9RIL1_ARUDO\nMQRVPLQVPLHHPPGQGHLLAHREHERLAIARRTAGRPANPADVLARVTGVVEEHHVVHVSKVDAS\n>UniRef90_A0A1Z4M0Q0 Outer membrane efflux protein n=1 Tax=Calothrix parasitica NIES-267 TaxID=1973488 
RepID=A0A1Z4M0Q0_9CYAN\nMIAVAALNTQSAKADSNSLRQMQTIPNYSIPTSEETTGNFQLSVPSEVIPPDDVEKQLTSDESKSVLDALSPNPNPLQYPTRPEEVQIQKIQAITLEQALELARRNNRELQVGLLELQRAQAAVKESQASLLPNAGLSAEVARQQSAQNQLAVESTNIGTDEATTAFNGSLQLSYDLYTGGRRNAQIGQAKERLRVQELAVEVLEEEVRLNVSTEYFDLQQADEEVRIANAAVVNARASLRDAQALEQAGVGTQFDVLRTRVNLANAQQQLTNAVASQQVARRRLVTRLSLPQSVDIAAADPVKLASLWNLTLENSIVLAYQNRSELQQQLAQRNINLLDRRLALSALKPQVSLVASYSLLDQFDDSVSLTDGYSVGVQANLNLFDGGRAKAQAAQAKANAKIAETQFADTRNQIRFQVEQAYSGLQSNLENVQTSNAALEQARESLRLARLRFQAGVGTQLEVIDAENALTTAEGNNIRAILDYNRALASLQRSVTSRAIP\n>UniRef90_A0A0W0Z402 Type I site-specific deoxyribonuclease n=1 Tax=Legionella spiritensis TaxID=452 RepID=A0A0W0Z402_LEGSP\nMKKTFDKLDKLKLEQLDNPNYLPKIQNFLPQLKSDFEQHVAPGEFDPIKQADNWLEVVRNLANNKHPAINKDSLKKIEKIYDLLGGQDEDAFRLLDMYQSIDTVNSEQVASKTKKIVADYRAHLANKIEEKGFIISSEDNSIVSLNEGEITPKQQKLLNRYEAISALDERIHNKRILDESDKSEAKQALDICLKNKPEWSEKPFLQKLTDVLSVGIKPLYKAFFSKETRLKEELDQVISGPKR\n>UniRef90_A0A2Z6DW79 GTPase HflX n=5 Tax=Proteobacteria TaxID=1224 RepID=A0A2Z6DW79_HYDTE\nMFERPRFGERAWLVQIDFGEGRVAERLEELRQLVVSAGAEIVGALTVRRAKPDPATFLGSGKVTELAALVREHGADLVVFNHALSPAQQRNLEQALACRVVDRNTLILDIFALRAKSAEGKLQVELAQLEYLSTRLVRGWTHLERQRGGIGLRGPGETELETDRRLIGARVNRLKARLQRLEKQRATRRRGRQRYGVPQVSLVGYTNAGKSTLFNALTKAQTYAADQLFATLDTTSRRIWLPQTGNVVLSDTVGFIRDLPHDLVAAFHATLEEVKEADLLLVVSDLASPDNDAQREAVTETLRQIGAESVPVLEVGNKIDLLDQSPEVVRDGCGTIRRVTVSAATGAGLELLRAAIDERLHTATNASSGEKNTETNSASTQDHTEPFWEPLEREVSPCP\n>UniRef90_A0A2M7SV67 PolyA_pol domain-containing protein (Fragment) n=1 Tax=Chloroflexi bacterium CG_4_10_14_0_8_um_filter_46_9 TaxID=1973937 RepID=A0A2M7SV67_9CHLR\nMDLASKINSYFPKELLELLQDTSAEANKLGQRVYLVGGIVRDLLIGYPNFDLDLVTEGDAIELANRIARMSEAKLVIHPRFNTAKIKSGDFAIDIATARSETYASHGALPTVTPCPIEKDLFRRDFSINAMAISLTPEHYGELLDPYHGKDDLDAHLIRILHPGSFTDDATRILRAIRYEQRLGFNLEHETAQLLKRDISMLNTISGDR\n>UniRef90_A0A0G1DQW2 peptide-methionine (R)-S-oxide reductase n=2 Tax=Candidatus Magasanikbacteria TaxID=1752731 
RepID=A0A0G1DQW2_9BACT\nMNDQEFREKLTQEQYHILRERGTEAPFSGKFLDHKEDGSYTCAACGNVLFASGAKFDSHCGWPSFDRDMGEGTVTFLDDTTLGMTRTEVRCAQCGSHLGHIFDDGPTETGKRYCINSLSLGFQSVDKR\n>UniRef90_UPI000FD1EFED acyltransferase n=1 Tax=Mesorhizobium sp. M7A.F.Ca.ET.027.02.1.1 TaxID=2496655 RepID=UPI000FD1EFED\nMTHQFGMKPRLVGLDVARIFAALAVMVFHLGFWSWAVKGSTPQSVVQGAAAFPELAPFTFWGRFGVEIFFVISGFVIAFSAASATPWQFIRARFLRLVPAALICATMTFVVAITIGLLPTSTLVDRYIRTLTFNPYAPWIDGVYWSLGVEISFYVLIAALLMIRRFSWIEPVAAIIGTASSFFWVWILAATLGYVHPPVSMIDGRSMDLLMITYGAYFATGVFLWSSLMIKPNAARSVALLLFVAGGLAGIYMNAPAYFAKIIDPSLRCVPAVVWLFAISFIVLATRFDYLIVSRMKPGMLAAIRLCGMATYPLYLLHDIIGAAVLRMLVLQDIDRFVALTYTFALMIALSLAVTLAVEPPFRKAISRVIDFRVLRPTTAEASQKA\n>UniRef90_A0A2E6BIU5 Dephospho-CoA kinase n=4 Tax=Gammaproteobacteria TaxID=1236 RepID=A0A2E6BIU5_9GAMM\nMTQTLKSERLIIGLTGGIGSGKSAATRFFSELGITVVDADELSREVVKPGEPALQAIVAHFGDGVLLDDGQLDRRQLRQRIFDDHNERKWLEQLLHPLIRQEIITRLTASTSPYTLLSSPLLLETDQQRLCSRVLLIDAPESLQIERTIIRDNSSEATVKAIMESQMARHARIERADDIIVNDGDLNQLKDAVAAQHQRYLEMTQ\n>UniRef90_V7F2Q5 Stm1_N domain-containing protein n=1 Tax=Mesorhizobium sp. 
LSJC264A00 TaxID=1287321 RepID=V7F2Q5_9HYPH\nMPETPKDKDLEKGDEVLRRLLKTPPKPHGDKAAKEKPEARPAKRSQNAKAK\n>UniRef90_UPI0018E26317 uncharacterized protein zgc:113436 isoform X1 n=2 Tax=Cyprinodon tularosa TaxID=77115 RepID=UPI0018E26317\nMLSVDSLQVAEEEMVESSSNKLSDIYTFVAKGSLPLTMNPLQKKNFKRYAKKFIFEEGKLFYVGPKKEEKREVVIEAKRKMQIFLDSHLSDVGRHLGQKKTVHRIQSRFYWLGIIKDVVEWIKVCETCRQTERNKNLARTVRPARVEAPWDIVGIDFIGPFTETRRGNRSVVLFIDYFSKWPEAFPVQTVDPLSVARCVSNCIYRFGATKTVVCAQKPEFCEEVSKVLHEKWKLVQRVSALDQPQLNPLHDCSGPLLKEAVEQMVAEKQADWDDFLDPVLFLFRTSSNPTTKFAPYSLMFSRKANPPGETRLTPPQYDEPETDGCREQDGCREQDGCREQDGCREQDGCREQDGCREQDGCREQASTCMNIMREQQNAVKQMVIANMNAAYKQEKKRKKAKRRMQSASPATLKVTEPLFAAGDSPSAKKVKDSLYLSFPVETVLATEPNGAEGVKTELAYRLAQPDVH\n>UniRef90_A0A672QD87 Serine/threonine-protein kinase VRK1 n=3 Tax=Sinocyclocheilus TaxID=75365 RepID=A0A672QD87_SINGR\nMPPKSKAGGAKKARAPTKRKLAEEFPPGEVLTDNAKKKWKLGSPVGQGGFGLLYLANEDSSGSVGAAAPYVIKVEPSENGPLFSELKFYMRAAKPDLIGAWMKSRKIDYLGVPKYWGSGFHEKGGKRYRFMVMDRFGTDLQKKFEGNEKKFPRKLVLQLGLRLLDILEYIHDHEYVHADIKASNLLLSYTNPNQVYLVDYGLAYRYSPEGVPKEYKEDPKRCHDGTIEFTSIDLDFDVSTNDAGPPSIKTPKRKKAEEKGQSADETEGTPAKKRRAPQKKDVNGAKKTASPAKRPAKKEAQASSEPAVKKSRGRPKKNS\n>UniRef90_UPI0013C2E1C0 hypothetical protein n=1 Tax=Trinickia diaoshuihuensis TaxID=2292265 RepID=UPI0013C2E1C0\nMVAVGNGKGAAGRGNGKSTVVDEAAVVAGLIFLKTIPCSCAPAATVHAAGGAALFEEDDEDDEDAADDEDAADDEDAADEEDAADEEDAADEEDAADEEDVADAAERGLNPGEPG\n>UniRef90_A0A2X1W8T8 Ovule protein n=1 Tax=Photobacterium damselae TaxID=38293 RepID=A0A2X1W8T8_9GAMM\nMCQKLYKLLIYYYSVCYFRILVRFTVLKNHGYLFAVKFKKSCTSGWLNLLSGSDYNRDMITLVLISLRIY\n>UniRef90_UPI001FFDE7FD SusC/RagA family TonB-linked outer membrane protein n=1 Tax=Sinomicrobium weinanense TaxID=2842200 
RepID=UPI001FFDE7FD\nMKAMMCKRKTIYVLSAFFFYCQFMLAQQKTVTGVVTDADDGMPLPGVNIVIKGTTKGVSSDFDGNYSIEAPEDAVLVFSNLGYASREVPVAGQSTITITLSADAQELEGVVVTALGIKRETKRLGYAMTEVKGDELAKTNTVNPVQALQGKAPGVSIGSSDGGLFGNSKIQIRGVSALNSNNNQPIFVVDGVILDNNVSDSSADWEGNPNDYGNMLKNLNPDDYESISILKGAAATALYGSRGLNGVVLIKTKDGSGTRGLGVSVKQSVGIDHVYRQPDIQYEYGVGTRAGAVSYGERDANGNYYRFSNNQFYTNDDGIPTLIEHPSSLGYGPKYDGRPIIGYDGEMTTYSPAKDNLLDAYDTGWNTNTSVSLSGGHDKGNFFLSLSHNDRSGTLPNNSFKRDALLFSGAYQLADWLRADASISYTTSKSKNARNDLSQFFINGTYANGYNPSKYRQRQFWQASHGGIPNSDYSDKYAYVPGKSIWFEYSMNNAGSEEQVTRPIVRLTADVAEWLSITAEGNMNYYTTKYERKDWGSGFLNDGGEYQMRHNTDKSYTGKLTANFQKDLTPDITAQLLVGGELWKQEKSETDVRTDGGLIVPGQFFLENSKRNLISSGKVYGTKQISSLYFLSSFGYKDQVFLDITGRNDWSSSLVYTNGEGNYSYFYPSVSSSWLFTQTFNTPDWFTFGKLRASWAQVGSDTDPYAINKGYGIGRYQMDGDKFIYTNDITTTLVDKNIKPERKNSYEIGMDIRFFNNRLGVDFAYYNEIIKNQIGEIPFPQESGYNNYFTNIGTLSNYGVELSVTGTPVKTKNFTWNTTFNYWKNTTKIKDLHEDYGEYKALGGDVAYGNFRIGSVAFKGGEYGVLMSDSSPKKWQSDNPDDPRNGMNVLKWVDSDRGAFYERSYEPERVGKVQPDFEGSLNNSFTYKGISLSVLLDARFGGHIASYSNRYGTSYGWLETSLRGRSPEHGGMTWTSQYSDSQGQQFNDGVIPNGVFAEGQTVTAPNGSTVDVGGLTYQEAMDNGYVEPTHASYFNYYTNSWSDGVVNDDWFSEVKYIALRNISLGYNFPKSVSDKLGAKNFYVSFNARNLGYLYNSLPNNLNPESFRGTSSSDSFRERGFIPYTASYTMTIAIDF\n>UniRef90_X1TZX9 KTSC domain-containing protein (Fragment) n=1 Tax=marine sediment metagenome TaxID=412755 RepID=X1TZX9_9ZZZZ\nGFEYDPKVKDVFRLLMTPERYNTLYHRSKAAKTRIDRS\n>UniRef90_A0A2E0MWS0 Asparaginase n=5 Tax=unclassified Euryarchaeota TaxID=115531 RepID=A0A2E0MWS0_9EURY\nMTEQDRPSSVSHGRPGSGIYPSNPLGEKHEGIPTGRDVEWEPLVDFRRLDVSENTIHGAISWVHGDEVIHSFGGNVLVYGRSMMKPLLMKIFTDVLDDVLTDEQKAIACSSHNGDTEHVATAQSILTESEWGLMQCPLDVPLVQFGRQVRRPRRWFHTCSGEHAALLRALRLKGINRAGYTLPTSSWFQDFIDLLNSMLHPDWKPLRIAKDGCGLPTVSNTVDELATLFSALVRTKDDDWIWDAMCKHPDLIGGFNRLDSTIIKAGEGRVLAKEGADGLLGIAIEHDDWPKGLGIVIKIAHGWNSQATWYVARAVLGVLGIQLRNPYPLHRQKAFIVPGIVPEMYLKQLESVVTWDEWDPDQDRFQILENQDNLARNPHGNEGRM\n>UniRef90_A0A348B110 Shikimate kinase n=1 Tax=Sulfodiicoccus acidiphilus TaxID=1670455 
RepID=A0A348B110_9CREN\nMQARAFGGISVVNAVPAWLGSTMAINLVVSVEIEEGDGREEGLIGYVLSYLRNAYSLPPLRVKVYSSLPQGGGLKSSSAVTVALIEAVSRLFNLRLDPPFLSAKLSLEGGFSLTGAYDDAFAAYRGGVSLTDNKSISLLKHLQPPEGLVFLVVPKEGRTADPRLLRRYSKTFEAIFQLALQGKLLEAMKINGVLVAEILGYDLSPIEVALSRGAIAAGVSGNGPSIFAACNEGDEGPVEDSLSRYGRVVRVEAVRIEGEDLQGQG\n>UniRef90_A0A5S4GRQ6 ABC transporter substrate-binding protein n=2 Tax=Streptosporangiales TaxID=85012 RepID=A0A5S4GRQ6_9ACTN\nMRRTAKIISVAMLAVAAAACAPSTAGNAPSTAATAKALPGPSLDANFDLEALVAAAKKEGSLLVYDSSGDIEEVAKAFTAKYGIAMEGVKSDTPQTAEKMIREHAADNVTIDAAMYEDGGVLVGQLAPQGVTQTWIPQDLKEQIPAENQNPLLALSKATVFAYNTKLSPGGCPVKNIWDLTEPEWAGKLVMQDPLGKPTVLSFFTQLDAHGNQALEQAFQAKYGKALKTEEKSAAYEWVKRLAGNRPVLTGSDEDISGAVGAPSATDKKIGFMSISKFRNNEDKGYTQSTCEGMAPFTGFSYPKYVAIASKSKHPNAAKLYVHFIMTEEGVKHEIGEGGISGNSTVKPLVTPAGLSDWQGQLFHTDPKGLLGDMQNRQTISDFWRVNKS\n>UniRef90_A0A453IYK0 ADH_zinc_N domain-containing protein n=2 Tax=BOP clade TaxID=359160 RepID=A0A453IYK0_AEGTS\nMALPTQGWGKTIILGVEMHGAPLTISSLEILHGKCVMGSLFGGVKPKQDIPILADKYLNKELELDKFITHEVGLKDINTAFDLLLQGKSLRCTIWMDK\n>UniRef90_UPI0021183352 helix-turn-helix domain-containing protein n=1 Tax=Bifidobacterium longum TaxID=216816 RepID=UPI0021183352\nMGEVYSHLSEEERQVIQIEVGNGASIRGIGAMLGRSPSSISREIKRNTWFPSNENESYRPVLLQCLFDRFGSVFPQCGLMVFPGVVIVSR\n>UniRef90_A0A4R6PNK8 Sucrase ferredoxin n=4 Tax=Nocardia TaxID=1817 RepID=A0A4R6PNK8_NOCIG\nMNPFEGMVCSAAAADLPLLGTAVHATGWLCIEHPGAWGRDVLGDEVLGPEITAELAARTSAAKVRPTLIRRPGRYEFTGTRTVLLASARPEGSWCVRFEITDLRELFDIDLHLVDGPAPEIDVPVDDPIVLVCAHGKRDQCCARLGRPIAAALAAEQPGRVWEASHTGGHRFAPAVVLLPSGLTYGRVDIPAARDLLAAADTGEVSLTGLRGRSCYPPIAQLAEVAVREQVQAPADALTVALDPTPTHDPTLAGAAVVTHRDGRRWRVTTRTASAPPRQASCNAKPKPAGYLEPVSIEQLPTL\n>UniRef90_A0A7W0RJ01 DNA ligase (ATP) n=1 Tax=Nocardioidaceae bacterium TaxID=1871072 
RepID=A0A7W0RJ01_9ACTN\nMDLPVMPPLSPMLAKVAKTVPSPEAFEGGLLYEPKWDGFRCIVFRDGDEVELGSRNERPLTRYFPEVVEAAKASLPDRCVIDGEIVVPIDGRLQFERLLERIHPADSRVRKLAVETPASLVAFDLLAIDDEALLGTPLGERRPRLEQALAGATDPIHVTPASDQLSTAEEWFAVFEGAGLDGIVAKPCASTYQPGARAMIKVKHVRTADVVLAGFRLHKKSTEQHPLLGSLLLGLYDDNGRLQHVGVSAAFPADRRAELVRELQPLVVEPADHPWAEWAIAEAGGDRMPGAQSRWNAGKNLSWVPLDPALVAEVGYDHMEGTRFRHTTQFKRWRPDRTPESCTYAQLEEPVNYDLDDILV\n>UniRef90_UPI001C08EAC3 hypothetical protein n=1 Tax=Tamlana agarivorans TaxID=481183 RepID=UPI001C08EAC3\nMKNVLTLTKKGILMVAMLATVLGFANADDKVIVKRDAKKTSITLEDVKQGDLVSIKDNQGIIIFKESVEATGTYKKGFDLTGLENGDYVFEISKDLEVNTIPFTVNTTNIEFDEAEESTYYKPHTKHEAGLLYVTKLCSENEAAIINIFTEVAAGEYEMIHSELIEDALVIEKVYKLNTGNYKITIHSNNKEYTKFINN\n>UniRef90_G0R3Q1 Transmembrane protein (Fragment) n=1 Tax=Ichthyophthirius multifiliis (strain G5) TaxID=857967 RepID=G0R3Q1_ICHMG\nMEQERQYIQNQFKNDKNNLINQINFNNENIKLDDKQIKLLKEKKNITRDMLKQHYLQELKKNKGLQNTSMVWITKALLNINEDVNQSEIFPSIIDQQSVSYLIEYAQSEINYDELTFMLQKQQLQNISSSKLEENNFDKNYLNTQYQYNINTIKNKVSKLAQQTVKIKNPLLIQSSKTSIPNLVWEDTESAQKSSN\n>UniRef90_T0DQ77 Globin n=3 Tax=Alicyclobacillus TaxID=29330 RepID=T0DQ77_ALIAG\nMLSQETRDIIKSTVPVLETHGTAITTRFYQLLF\n>UniRef90_A0A2C9KHU1 SHNi-TPR domain-containing protein n=1 Tax=Biomphalaria glabrata TaxID=6526 RepID=A0A2C9KHU1_BIOGL\nMATESSTSAVDSVEKLEVMKKAADLLAQGKRNMLCGEVPKAVNLFEEAVQLLVKECGELSRDCADAYFSCGSALLELGRMETNVLGTALEGVEVEEEKEEEESEQFEKPPAEDDSVRQQLREEVYEAMAEGEREKDMQKTDKEIKDGEDGGASQMETVTDENKDNVADKSDLKESITAAGDADKELKKEEIPETNSTVEDKSLTESKINEVKPADSNTVADKDETKDQLEKPKQEEEMEVVEKNSEKSEISHKAHEDAAQSAEAEKETASENAVDTAMDIDEKKDVELEDESEADKDDEETEETVDEEEAVEGDESADGEKDEDVPNFQLAWEYLDLAKVIYLKNESKEDQLKAAECHLKLGEVSMETEQHTIAVEDLLSALKIQQKYLAPDDRLIAETHYQLGLAYGLGKEFKLSIEQYQLAISVIEAKIASLKKVLEDEQIDAENKENLETNPELKKFADEIKELQDLIPEMKNKTEDARIEENDLQKMKAIVKENLFPSGTTKEFGSPSKKSGGSVTSGDVDENGERKASDIAHLVRKKRKPEEDTSAPSEQEVKKIRQEVVSDDVNVETKVDDEAKMNVDEQVNTEESQVNSDNSNINVEPKVNGDEPKVNGDEPNVNGDEPKVNGDEPGVNGDDIKVSGDIIESKVISKVEVSPTEDAKMNGDTETPSIETSASTEVAPMAT\n>UniRef90_Q883V3 histidine kinase n=513 
Tax=Pseudomonadaceae TaxID=135621 RepID=Q883V3_PSESM\nMSDSGRADALLAQLPREGRGRLKVFLGAAPGVGKTYAMLQAAHAQLRQGVRVMAGVVETHGRAETEALLNGLPQQPLLRTEYRGMTLEEMDLDALLKAAPSLVLVDELAHTNAPGSRHTKRWQDIQELLAAGIDVYTTVNVQHLESLNDQVRGITGVQVRETLPDWVLQEAFDLVLIDLPPRELLERLRDGKVYVPEQARAAIDAFFTQTNLTALREMAMQTAAAQVDNDLAQGYRQLGQSAPAVRGRMLVGIDGDMHAERLVRHASRVAQRRHLPWSAVHVDDGQTLDEQSRARLQNAQQLAERLGGEAVSLRAGEVARTLVQHAIERRASVVLVGQSRRHWRRRVFGGGVAARLLREGHGLEISVLDDSEELPDQPPRARPAREVVWFDYGLAFVATLIASLVAWGVAGVLALPNISLIFLAAVLLVAVRSSMGPALACAGLSFLAYDFLFIPPSFSLNIQREEDVLTLLFFLLMSALTGKLAARQRRQLQALRDTQEQTSELLDLSRKMTAATDRKAVLNAAEQHFSGWKELYLCLVDRDTQGGLVVETGGPLTFSEAERAAADWAWQHDQPAGSGTGTLPSGRWWWWPITAEEGPLALLGVCAREGQSFTDQHRRLLAALTQPLAQALARAQLAQELEAARLHGETEQLRSALLASVSHDLRTPLTSMRGSIDSLLALGEAIALEDRRELLEGTRDEAERLDRYIQNLLDMTRLGHGALKLARDWVSPADIVGSALNRLRAVLTPLQVSTQVTGDLPLLYVHAALIEQALVNVLENAARFSPLGGRLQVTAGVVDSELFFSVSDEGPGIPEDERAKIFDMFYTAARGDRGGQGTGLGLAICQGMIGAHGGRLTVEEGIDGLGTRITLFLPLQAQPDAEMEEPA\n>UniRef90_Q2KHZ9 Glutaryl-CoA dehydrogenase, mitochondrial n=28 Tax=Pecora TaxID=35500 RepID=GCDH_BOVIN\nMALRGVYAQLLNRGPGLRVFRSWSSATAQTEKGEKTQSRSAKPSRPEFDWRDPLLLEEQLTADEILIRDTFRTYCQERLMPRILLANRNEVFHREIISEMGELGMLGPTIQGYSCAGVSSVAYGLLARELERVDSGYRSAMSVQSSLVMYPIYAYGSEEQKQKYLPRLAKGELLGCFGLTEPNHGSDPSGMETRARHNPSSRSYILSGSKTWITNSPVADLLIVWARCEDSCIRGFLLEKGMRGLSTPRIEGKFSLRASSTGMIIMDDVEVPEENVLPGVSGLAGPFGCLNNARYGITWGVLGAAEFCLHTARQYTLDRIQFGVPLAKNQLIQKKLADMLTEITLGLHACLQLGRLKDQDKAAPEMVSLLKRNNCGKALDIARQARDMLGGNGISDEYHVIRHVMNLESVNTYEGTHDIHALILGRAITGIQAFVAGK\n>UniRef90_UPI0021D8BFC3 hypothetical protein n=1 Tax=unclassified Shewanella TaxID=196818 RepID=UPI0021D8BFC3\nMALRLADIPYYLNPTYQSDGRVKIDSPQQLCIYLIGPDTVEKVRKTLNFFATISKICLVRREKLHIDFSNLQNFTAAASVLLFSEITRAQLVTEIADVVTFTLPKTPDVLKLFRGFGLYKAIMPGGNRKLINLFDDDHPYQSGTDPNKFLISTILNLKNQGLELSNPETRIIHRGIQEAMLNVIHHAYEHETDVSSGIGSRWWQLSFCKHDSKSVAFIIYDKGISIPESIAGKLPVNITTDAEAIEFAFQKGVTRYTDKPTRGKGSEDIKDVTTVKDNSKLLVYSGNGMYYINRERGDTRKLSLPASINGTMIEWLIPYE\n>UniRef90_D9WD85 Integral membrane protein n=2 Tax=Streptomyces violaceusniger 
group TaxID=2839105 RepID=D9WD85_9ACTN\nMGADVNEEEIARAVEEGMRRNDVRRAAAWRKARDQEARNLLKGLGCMALVFIVFIVLMVKNPGG\n>UniRef90_UPI001FB071F5 discoidin domain-containing protein n=1 Tax=Clostridium perfringens TaxID=1502 RepID=UPI001FB071F5\nMLKNRERMKRLIACGIAASIVSVNGLSVLASELNKSDKVNLALNKKTVASSREVNDKWGAELITDGIKDKPSDPNAKPGNSRWASSRSVPQWIYIDFEEATTFDQVDILWDGAYSRNYKLEVSNDGETWEEVYATSEGKGNQESINLGEDITANYLRVSCEDTAHEWGNVSIYEVEVYDNENEENVTPPETETGVNIALNKTATASASETNTLTPDKVVDGDTSSRNSRWSSGGFSNGAKQWITIDLEKESTFDKVRLFWEAANAKVYEIQTSNDNENWKTVHRNEAGKGGTEVIELSEKENARYVRVYCEENNPAVWSSVSLYEVEIYNGEIPSSGDLDEVLNSLEVPTINKGDSKLQMPEVPKGFEIKFIGADYNQIRLLNKQNL\n>UniRef90_UPI00166CCB99 hypothetical protein n=1 Tax=Kroppenstedtia guangzhouensis TaxID=1274356 RepID=UPI00166CCB99\nMEKFGLAVKVDGEELLLLEIEVENDGKKVISDLPGSIRKLAESMAILIEENGNPLEEVAK\n>UniRef90_A0A1G6XTJ4 RNA_ligase domain-containing protein n=1 Tax=Niabella drilacis (strain DSM 25811 / CCM 8410 / LMG 26954 / E90) TaxID=1285928 RepID=A0A1G6XTJ4_NIADE\nMPVIKLETLVSADPETCFDLSRSIDLHRFSTVQTGERAIAGKTSGLIEAGETVTWQARHFGVRQKLTSKITAYQRPVHFRDEQQRGAFRFMKHDHYFSAVEAGTLIKDVFEFQSPLGVLGRLTDAIIMRRYLTRFLTKRNRVIKDIAESGMGACLVAAERNPYILERAGAFSYTHDGFIQEEALLRACYAWADVETIFAYKQDLLTTDEVCLDLFTRNGMRVFISESCSGWDRFLQKLSEQFPSLSEGWEWEVAQPPFKTNLALLFDRRGRTLTQAETDCYGGAHKP\n>UniRef90_A0A0G1M8D9 Single-stranded DNA-binding protein n=1 Tax=Parcubacteria group bacterium GW2011_GWA2_45_30 TaxID=1618834 RepID=A0A0G1M8D9_9BACT\nMLVEGRLQTRSWQDQQGQKHWRTEIIAERIQLGPKPGGGGYEGAGIENENFEPAQNQARGPAAPKAVPPEETTPIIDIAEDEEINVKDIPF\n>UniRef90_A0A388PNR4 PPM-type phosphatase domain-containing protein n=1 Tax=Opitutae bacterium TaxID=2026771 
RepID=A0A388PNR4_9BACT\nMFSSTKKNQTLRWVNCLSGARGLVDQFPFRLPAGSPSPQVTVSPATQGLTLTPTPGRRPLVNGLAIDGPVTIAETSTLQLEDGLLALSLEEADTFRDLRTDAWMLFDAASGELLGEFAPADLLDRANDLGRPPEHLACTPTGLEVGFSLSLAAPLLSPREEIATRGPGPALLAAEQNRGAHLCPVCWTRFDAGDALSIAVHEDLRGDPILGSDARLRFQPTRFNDQGLALDPMGLACTDLACPHCRRQLPPGYLDMPHRILSLIGAPSSGKSYYLAVLTRELQERLPKDFGLAFKDGDPSGNMLLNQMRNTLFSAATPEEALLGKTALEGATYEKLPRLGRLVSLPRPFIYALSRPGARKQETSLILYDNAGEHFEPGVDIHDSPGAMHVATSAGLIFLFDPTANARFKARLIGVEDPQLSLKGRVDQQDSILAEMETRIKRVMGLAHDQRIATPLAFVVGKCDTWSRLLSSPLEPVTTPTGLDLAAIERNSQRVRAVLLDLCPGLVASAESLAEEIRYFAATSFGHNPVVIQQGPNKGRIAPDPQRLAPAHVEEPVYWLLHRASPELLPSAPRVNLEKSPAASRP\n>UniRef90_UPI0005BA3CE0 TSUP family transporter n=4 Tax=Streptomyces TaxID=1883 RepID=UPI0005BA3CE0\nMPDIALSTLVLLCLAALVAGWIDAVVGGGGLLLLPALLIGLPNATYPYVTGTNKAVAIVGTTGAAVTYVRKTKVPVWTAVRVGLAALAGSTAGALFTTAVDEEILRPLIIVVLVAVAAFVILKPSFGARPEGEDRAPLTRARVVTAIVLVGGGIGFYDGLFGPGTGTFLVLALTAVLHLDLVTASATAKIVNVCTNAGALAMFAYQGTVYWQLAALMAAFNLAGGMAGARMALSKGSGFVRGVLLVVVLSMVAKLGWDQWS\n>UniRef90_A0A5Q2W0C9 Substrate-binding domain-containing protein n=2 Tax=unclassified Pseudactinotalea TaxID=2649176 RepID=A0A5Q2W0C9_9CELL\nMAVSVRDVAALAGVSVGTVSNVLNRPEKVAPATVERVQGAIGELGFVRNDAARQLRAGRSSTLAMVVLDVANPFFTDVARGAEERAAEDGLTVLLGNSDDQAEREALYLEQFEQQRVRGVLITPVAEDMPLLRQLRERGTPVVLVDREVGDRTFSSVAVDDVAGGRLAVEHLLDGGRRRIAYVGGPVGTRQVIDRLSGARRAVAAVDGASLETVETRALTVHQGREAGEAIAGRDRADRPDAIFAANDLLAIGVLQGLQRSKVEVPTEVALIGYDDIDFVQSTVVPLSSIKQPAHLIGRTAVELLLQDAAGAGSPPEQVVFDPELVVRESTQTT\n>UniRef90_UPI000D3822E6 PAS domain-containing protein n=1 Tax=Mangrovicoccus ximenensis TaxID=1911570 RepID=UPI000D3822E6\nMEREAGMPDKAGDLGEHVWADVLSAVDRTYAELIEYQEKLEARNNELQVLQDFLASVLASISDVLVVVSRDGLIEDASRSFCDAIGQKIGALRGQTLEGFFAEPARSQVGGAIAAAIRERRESVLEVDLAGAEEPVPLEFSVTAVIS\n>UniRef90_A0A5B1CRN5 DNA-invertase hin n=1 Tax=Rubripirellula obstinata TaxID=406547 
RepID=A0A5B1CRN5_9BACT\nMKNRNIIAAYLRCSSDDQSTEAQRADLERYLEREGFDLSRVQWFIDEGTTGDNLDRPAFEELDRLIANGAVATVVVWKLDRLSRSMIDGLTTVSRWLESGVRFVSTTQAFDFRGTIGKMVAALCFGFAEIEQQSRRERQAVGIQHAKANGTYKGRAKGATKAGVDPSRAKELRSKGLTFREIAAALGVSAPTARSYCMA\n>UniRef90_UPI001CB8FAB8 hypothetical protein n=1 Tax=Nostoc sp. 'Peltigera membranacea cyanobiont' 210A TaxID=2014529 RepID=UPI001CB8FAB8\nMPELFAGIERQDDSFPVPYPDANIPQAWAAGSIFLLIRTILGLKADASKQQLKVQPNLPDCLPDLELTNLSVGDATVGLRFWRNGEQTQWEVTHLDGELEVSTT\n>UniRef90_UPI00200782AC uncharacterized protein n=1 Tax=Purpureocillium takamizusanense TaxID=2060973 RepID=UPI00200782AC\nMDCDICHRGHDPQRLPFLCAVDARNQVYDARLKNLHLLIENDKLQAQIAKASGDDTPATTAQLALARQRLAEDRTDQILAAADKLRAEIQAARDDIKARRAALARRRSDLSSVSTGLVDRRARQQHEVEKSLQMLRFRWSQSAEDMAQTRAFLCTEALRLYGLKRTRKSNTSRYDYQIGKVPIVDLTSMDSLTPEIISTSLAHVAHIVMLVSHYLAIRLPAEITLPHRDYPRPTIFNLPGSYQHGPFAFPSASSSMTPMPSSAQIRDPESHHVPRPRPLFVDKPLPQLSKEDPTTYSFFLEGVTLLAYNIAWLCSCQGVSIGDKGSFEDMCHMGRNLYNFVLASQLQGYVQPAEPTNKGSNADNNNGVESRSNWIGRYSHGTSYYYLGGMEGTDFVRTFKLPSPMKLADKLKKKLLGDTPGADWEVLDDDAWKPEDGRTDQSGAKALSGALADKGGLDGTGATRSGTNGWTKVKHRT\n>UniRef90_A0A2H5YHE1 Methylmalonyl-CoA carboxyltransferase 5S subunit n=4 Tax=Bacteria TaxID=2 RepID=A0A2H5YHE1_9BACT\nMGVRVTDTTLRDAHQSLLATRMRIEDMLPIAPLMDEVGFHSVEVWGGATFDTCLRFLREDPWERLRRLKQCFRRTPLQMLLRGQNVVGYRHYADDVVEKFVELAVKNGMDIFRIFDALNDLRNLETAIRAVKRYGGHAQGTICYTISPVHTIDLYARLAQELVEMGSDSICIKDMAGILRPYEAYELVKRLKDTVPVPVQLHTHSTGGLAPLAVLKAIEAGVDVVDCAISSLSLGTSQPPCESLVATLHGTPYDTGLDLELLSQIADYFAQVRRKYAAFEGEVTVDVGVLIHQVPGGMISNLLSQLREMGAADRLPEVLAEIPRVRAELGYPPLVTPTSQIVGTQAVLNVLAGERYKQVTRETRAYVQGYYGRPPAPIDPDVQRKVLGDADVISGRPADHIPPELEKARADLGELASSEEDVVSYVLFPQVAREFLEWRARGGGLEPEEVAAIAVALAQDHARPQPAAAPRREVSLWKVAGRRRLLNRAGVP\n>UniRef90_UPI0014216B0F DUF5668 domain-containing protein n=1 Tax=Alkalibacillus almallahensis TaxID=1379154 RepID=UPI0014216B0F\nMKQSQSFLAITLIGFGLYFLIQQYDIPILSQFGNWPSILVILGVAFLFSAYGNNQHDNILPGIILFGLGVHFHLLQHQVNWIDHWGMYTLIIGIAFILRAQKKRQGTIIGIIFIVISFLALSAFAMPTWLGWLDVVFNMIEQFWPILLIIIGFVMLFKK\n>UniRef90_UPI001E50B040 
type II secretion system protein GspM n=1 Tax=Bordetella sp. LUAb4 TaxID=2843195 RepID=UPI001E50B040\nMKRPDDKDVSVPANAGRQSARGPDTPPAPVRGLAPTFATWRLKLRDALRPVAAWHAALTPRERRLVDVGGIVLALFLVFTFAIDPALTTIARSRNELPALRAQAAAVASLTNEAQRLRQHGGRTSNAPLAQTDIDESLRRAGFAPDSWRITQEVGNGNGGGNGNAGKPAVWRVELKQAPSTALMRWSDNVPAELRLRVANVELIRASTEYGRPIPGKVNGTVRLAASVGN\n>UniRef90_A0A2T2YAG9 MFS transporter n=2 Tax=Adhaeribacter TaxID=299566 RepID=A0A2T2YAG9_9BACT\nMKRTLAASRWYRLIPVAFITYSLAYLDRANFGFGAASSMATDLNITPATSSLLGSLFFLGYFFFQVPGAHYAAHNSAKKLIFWSLILWGGLATATGLVSNVNLLIVIRFMLGVVESAVMPAMLILLSNWFTKTERSRANTFLILGNPATILWMSILSGYLINAVGWRWMFILEGLPAVVWAFFWWRLVDDKPTKASWLTEPEKRALAEQLQAEQQGIKPVKNYAEAFKSRTVILLSFQYAFWSIGVYGFVMWLPSIIKAAPNMDIVKTGWLSSVPYVLAIIGMFSASYFSDKTLNRKAFVWPFLLIGALAFYGSYAIGSDNFWLSFVLLILAGGAMYAPYGPFFAIIPELLPRNVAGGAMALINSMGALGSFAGAYIVGYLNSSTKSFGASYLFMAGSLLLSALITLYAVRGTRTKTPEPIKQAV\n>UniRef90_A0A7N1A149 DELLA protein n=1 Tax=Kalanchoe fedtschenkoi TaxID=63787 RepID=A0A7N1A149_KALFE\nMKRENQYLYPNPDSSGAGSSSGGKGKVCWEDDPLPESGMDELLAVLGYKVKSSDMAEVAQKLEQLEEVMGSVREDGLSHLASETVHYNPSDISNWIENMLSEFVPAGFDSSLQPLPPASVHSFIPQLDSSASVNFPGFGGGDTSLPDYDLKAIPGNQIIYSPKQQQQQIDELGGNANKRLKTTVTATEAPLTTSTRPVVLVDSQEAGVRLVHTLMACAQAIQQSKLEVAGTLVNQIGLLAASQAGSMRKVATYFAEALERRIFNCHPQESVNPSFTDLLLMNFYEACPYLKFAHFTANQAILEAFSGKKEVHVIDFSMNQGMQWPALMQALALRPGGPPAFRLTGIGPPSPDNTDRLREVGLRLAQLAETIHVDFEFRGFVANSLADLDASKLELNPSDTESIAVNSVFELHRLLARPGAIEKVLSVIREIKPEIVTVVEQEANHNGPVFLDRFTESLHYYSTLFDSLEGSASSQDKVISEVYLGRQICNVVACEGPDRVERHETLDQWRLRFGSAGFEPVHIGSNAFKQASMLLDLFSGGEGYRVEENNGCLMLGWHTRPLIATSAWRVGSTGPS\n>UniRef90_UPI0021515D3C SDR family oxidoreductase n=1 Tax=Streptomyces sp. 
KMM 9044 TaxID=2744474 RepID=UPI0021515D3C\nMRIVIAGGHGQIALRLERLLAARGYEVAGIIRKPEQADELRKLGAEPVVLDLESASVEEVAERLRGADAAVFAAGSGPGSGVARKEAVDKASAVLFADAAVRAGVRRFVVVSSMGADPAHEGDEVFDVYQRAKGEADAYVRGLDALAWTILRPGSLTDGAGTGLVRLEARTGPGPISRDDVAAVLAELLKDSSTAGLTLELISGPSPIPAAVKSVAGE\n>UniRef90_A0A850P7D6 ArsC family reductase n=1 Tax=Ameyamaea chiangmaiensis TaxID=442969 RepID=A0A850P7D6_9PROT\nMTLTLYGIKACDTMKKARVWLETHAIDVVFHDYKTAGIDRRTLERWVAAKGWETILNRAGTTFRKLPEADRLALTPERAVTLMLAQPSMIKRPVLEGDGTLIVGFRPEFYETLLSA\n>UniRef90_A0A559KBH2 ThrE_2 domain-containing protein n=2 Tax=Paenibacillus sp. JC52 TaxID=2163881 RepID=A0A559KBH2_9BACL\nMMLAAYFGGPVSALAELAVVYIGRFLKEGAIGYVQMAIGITAALGTGLFYRYCRG\n>UniRef90_S6GGD3 Lipoprotein n=1 Tax=Osedax symbiont Rs2 TaxID=1330035 RepID=S6GGD3_9GAMM\nMQTHQINSWLLFSCLSALTGCANNYPLLQQQIETDNTLYRSGSHSISVSALLQNASTGTVAKVPQKKVQTPFQLRFNDTEVELNYVQQQRLQDYAQSLSAAVLSVHCGAGNSSSTLQAVSIALRRCQKIQRFLSGIQQQSQALVQADTPSQLITVAAANRQSGI\n>UniRef90_A0A7V9G8G6 AraC family transcriptional regulator n=1 Tax=Planctomycetes bacterium TaxID=2026780 RepID=A0A7V9G8G6_9BACT\nMAQSLRKTAFTIGPACRERFLPLDRPAGLVLRDLGVHLAGISDLARPYEIGRPGVDFHCVLYTVSGAGWCELEGLPPSVGPGDMLVLPAGTSYGYGIAADSWRILWFHFDDGRGLGQALHGRKPAIHAAASIPRLQAAMEGFLAEARETDPESLRAAGLHAELIACYLGRELAADIDPRVAAVRHRLQKLWDDVDRDLRHPWSVAALAGRVHESQINLYRLCARHFRVKPMAMVTRLRMERAKQLLRETDEPLKRIADWVGYHNEFAFSTAFKRFTGSNPRDFRKRKRS\n>UniRef90_A0A804R300 LigA n=2 Tax=Zea mays TaxID=4577 RepID=A0A804R300_MAIZE\nMRPRPPRVHDRSRQAAARQKPLPHVPHRAHHADDHVRQPDVRRRRHHATGSRLRPGHPLRPPPRRGAPHRPPRPRGLHDALHTAPRDARQGGRLRHVVPGRRGRGGLLLHHPVRRRARARAAGVRLHAVRRVDGRAHAAVTGAGRGGVRGLRGDGRNGRSARDAAGAGSSHAVSADEEGPELRVAGVPRQALHGGRRGHREHGGRAGAVHPRGHRRRPLRAKTPRSGRLPDRPGPASQAAVRARRRRAGSSTAARVREVARRAAPSVRRAALLWEHGRQLPVAPGPRDRRRPRAQRAPLPVGAPWPATAGRFQVPDGRQRPRAAPGRVPGEDEGPRPRVAHVGAAEGHPRQPRRRRLRHPLRLELHPREPVARRTDGALAAVRGAAPERVRARGRHGRRRRHAGGQEARQLRRGGGAGARGPVPDGRVGGEGEEGAGEGHGGEGPEPERRGQRRVVGRVGAETGARDFAQARRQGVCHRKRGEHGQRRRSRISGQNNMIPRTRRNRRRPRINRRPPCDPSGTAHVVWHCSQSPCAL\n>UniRef90_A0A1Q9JNL8 Sugar ABC 
transporter permease n=2 Tax=Roseburia sp. 499 TaxID=1261634 RepID=A0A1Q9JNL8_9FIRM\nMQPFRQSKQKWIPTVRNKKVPKWVLGLLFLAPSLLGVAVFVLVPFADVVRRSFLDAMGKEFAGISNYESVFQNEAFQLAAGNTIKFILICIPLLLLVSLVCALLINGLKGYQEFFKTTFLFPMAIPVASVVLLWRLFLDRNGFFNEGVRLFGLSPVDWMNSEKAFGVLVFTYLWKNVGYDMILWLAGLAAIPKERYEAASVDGAGRWQTFRYVTLPGLRSSVFVIGILSLVNCFKVFREAYLIAGDYPHESIYMMQHLFNNWFVSLDIQKMTAASVVMAIVMLVIMSLVWYRNERSQE\n>UniRef90_A0A7C7UU56 Septum site-determining protein MinC n=1 Tax=Aquificaceae bacterium TaxID=2053503 RepID=A0A7C7UU56_9AQUI\nMIEIKGKTTPVIYITIKEKGNIEALIQEISKKLNNKIFEGSLVIIENPEVLSEWERKKVEEILKKLTKGVFEKQKEEKEENRLLIINKSLRAGQRVEHKGDILILGDVNKDAEVLAGGNIIVFGKLRGIAKAGLIGDDIAP\n>UniRef90_A0A535UZE8 M24 family metallopeptidase (Fragment) n=1 Tax=Chloroflexi bacterium TaxID=2026724 RepID=A0A535UZE8_9CHLR\nFAWFGDRTAFVGFRLPHQFFPSGRRLEEGMPYILDVAPIVGGYTADIGYAACLGENPVHARLLADLAEYRELLLAGVRARRSLRTVYEDVDRLIDRHGYVNRHRAYPFGVIAHRVGTVGGRGPRPTVAGFGLRALRSLAHDGVMGRRGGWSPLWGPGRASDHPPTPGMWAVEPHIGFRGVGVKFEELLVVTESDAFWLDDDLPHVRRWRGAAAAVPA\n>UniRef90_UPI00166AE77F antibiotic biosynthesis monooxygenase n=1 Tax=Ornithinibacillus halotolerans TaxID=1274357 RepID=UPI00166AE77F\nMYAHMTNGTIDFLMKLTEKHPTIPFHFMSGTSKDVAYYEGVKKKYFQAGRSFEILVQLGEIQEQGYVVMNHIPVLDEGRPVFEDNFRKRKDEIHHQKGFQAFRLLKPLKGNTYVVFTQWDSANSYEQWKNSKEFQKAHTNIKPPAYFADRPFVNVYQMIEEE\n>UniRef90_A0A1M3B6X1 K(+)-insensitive pyrophosphate-energized proton pump n=1 Tax=Chlamydia sp. 
32-24 TaxID=1895742 RepID=A0A1M3B6X1_9CHLA\nMLSYDYGFVIACGFLAILYGIIMIRYILSLSSGNEKMQSIASAIQEGASAYLNRQYQMITLVGIVIFALLTWILGWHVGIGFLIGAILSGLAGYIGMNISVRANVRTTEAAKKGLSEALGVAFKSGAITGMLVVGLGLLGITGYYLYLKWHNVPMRELLEALVGLGFGASLISIFARLGGGIFTKGADVGADLVGKIEANIPEDDPRNAAVIADNVGDNVGDCAGMAADLFETYCVTLVGTMLLAGVFFQGAILEKMMFYPLAICAVCIIASLFGTYFVKLGTSNNIMNALYKGFVSTAIFSAAGIWAVTKYVLGTDVIYENNGISFNGMNLFYCALTGLAVTGLIILITEYYTLGKYRPVKSIAESSKTGHGTNIIQGLAVSMEATALPVITICAGILIANANAGLFGIAVAATSMLALAGMVVALDAYGPVTDNAGGIAEMSNLPAEIRKTTDALDAVGNTTKAVTKGYAIGSAGFAALVLFAAFLQDLTRYFPASADQCSFNLTNTYVLVGLLIGGLLPYLFGALSMMAVGRAAGSVVVEVRRQFKEIPGIMDGSGKPDYGKAVDLLTKSAIKEMILPSLLPVGAPILLYVIINAFVGQNEAFVALGSMLLGVVITGLFVGLSMTSGGGAWDNAKKFIEEGNFGGKGSDAHHASVTGDTVGDPYKDTAGPAINPMIKIANIVALLLLAILAAMSNQ\n>UniRef90_A0A3B4T4F2 Coiled-coil domain containing 142 n=4 Tax=Seriola TaxID=8160 RepID=A0A3B4T4F2_SERDU\nMDQNNPETLKDPGGEPGLTADWNNSESVCPEKEQRRCLVTEDVTTNGSWSQSSISRSLQRAETLLRTTFNPSLKWLFHSRSQDEDAEEGHFVVAHNLVSRSSARLLRLQQALLTVAPQWQLVGGAQVGSPQVCVKGIPEREAEGGVVLVPSSSSLQGPYRTLWRLLEQRSLLLFIHEYTRRARLAAAYISRVSHLLEEQLRRPHLTPHQTLSSLSSFRVSLGSLSQELRVHLNHWSCLFSKVQSDHYLRPALVQQTRLLVEIKQTLDSLGLQALVLMEHYVCVILSAVAQAELDSVPREVLQDILAGTDVYNQAVEEQRAQRSATQLRTAVLLRAHHSTLDPGLPHSKQHHPAAFSVRELTVILAVHHAETAAEQLRSWASAQSCQVCQVHHTQEAGTSSVRSSISCGTCTLRPEWTWEQLQHTFLIPPPLLSSHQPTLQLHQDSAENHLPVLAKPTSVQQRPDCSDKDPTSQCQTHIPRNSPIQASVETVDLAQPHVENCEPPQTISPPSESSHRLSAPPVSAVCQQERSSVELLFQLLVSCSDLLVPLVSHTEAPAEPLLPHTPTDVTVTAPIISTDDSVELNRLSTDLNTEGSQADWAELDMTTRLETTCSSGFQRDRDPEGEGTVGLEGTAVAPDCVRPHSVQWLDLGQSLVFADLLGQYRALLWTLCSRALWLQMFVPPAGNAAGSINLQDNHRGFQILDRLSRASKTEDLVPKECRAMLEDFRLNLLVCTAHAQWDYVLCRGLGSALKDKCLIDGSHSVMSSSKMMSVTMEHFLLLTPPLLSSLCCQLSDSRSSGSSSLLTLHRQSVSLVLATVQLSTFWILSKAYQFLSSWSLNRFLLITQGDLKELRESLEVMVRQTRSLMMTPDSDYYSSLLLRQQLEALDRAVSELQTFSSLVLKTFSSDCKRMSGEIFEQTMPSSVHWKHSHRTGFPSSPSEYASLAAQTVIGQVLEGVAPLSDDARVQALSVTMTAFLEAWMEHILKQKIKFSVQGALQLKQDFDSIRELIQSDRYGLSADLHQHLLSLRVFQQVDSAVVCLLQQPQAKPYLQSRTWEPFTRCCPAGSRDSSDAAVGSSITNLGYVEGEDLTQADPSVMTSDLPPVDPSNPGEPYLAPSLALGPVQQEWLDLRIHGSARRWRLPGLQ
CLSKSEP\n>UniRef90_A0A4Z1JUV9 MFS domain-containing protein n=3 Tax=Helotiales TaxID=5178 RepID=A0A4Z1JUV9_9HELO\nMSQGEQIKDSDHVAVPTSEKQASSDSQESSDVEKKASFTTPDGIVEDTSFVYMTGWRLHLMRLCCAISMFLVNMEVSIIGTSLISITNDLRGFSQMGWVVTGYLITYTGLLIIWAKISDIYGRKPAMIISMLIFTVFSGGCGAAHTMMQLIVCRVFQGVGAAGAVSLALVAAYEMVPKDKYPLQAALIGSAIALGSLVGPLIGGGVSEHSTWRWVFLINVPVGVVCAALLYISVPSNFPYHGRPVLPHPITNSLSRLDISGASLLLGATVLLVTVLLEAGIEFAWKSGTAIALIILSGILFVAFMLNEKVVSKEKRTQEAVFPFRFLSNRPWMGTLLMSFLSGVPYNIIVIDIPQRFQAIDSISPFTSGLRLIPFNFSISLSSILVNIIAKQRVPPIILLFIGSIIQLVGMSLFSTLPENGTLPNTIYGWEVLTGFGMGWVMGICLLLPPAVVEGRDLAISGGSLLQFRVLGGVLGLAISTAIMNNHLTSHLTPLLGAEQLSLLLQSTREIENLSEELRIETVKAFAYGYNMQMKVNVAFSVVQVLIVGVMWTRNGKGWRGQIEVVEKQILKE\n>UniRef90_A0A3C1JH31 Ovule protein n=1 Tax=Acidimicrobiaceae bacterium TaxID=2024894 RepID=A0A3C1JH31_9ACTN\nMHLSTRAWDNHLEFIMLKGKNPKLTCRLYGATQMVSMANQSQNFFKKYTKLSLNRKTLWQTWTAGILIA\n>UniRef90_A0A7V7MZ47 catalase n=1 Tax=Proteobacteria bacterium TaxID=1977087 RepID=A0A7V7MZ47_9PROT\nKTDMFARFSTVAGERGAADAERDIRGFALKFYTDEGIWDLVGNNTPVFFFRDPLKFPDLNHAVKRDPKTNMRDANNNWDFWTLLPEALHQLTILMSDRGLPVGYRNMHGFGSHTYSLLNKDNVRHWVKFHFVTQQGIENLSDEEAAKVIGMDRESSQRDLFEAIKNKDFPKWKMFIQVMTEEQAKTYRFHPFDLTKVWSKKDFPLIPVGEFELNKNPENYFQDVEQAAFNPTNIVPGIGFSPDKMLQGRLFSYGDAQRYRLGVNHYQIPVNKPTCPYHAYHRDGAMRVDGNYGGSKHYEPNSYGEWQEQPEAQEPPLELSGDAYAHNFRDDDEDYFTQPGDLYRIIKADGKADLLFNNTAANIGGAEKFIQIRHIRHCYQADPEYGEGVAKALGLSMDEVNNFDMKPHDQWAPRPSQE\n>UniRef90_A0A258AK22 Histidine--tRNA ligase n=1 Tax=Verrucomicrobia bacterium 12-59-8 TaxID=1970608 RepID=A0A258AK22_9BACT\nMASFRTVKGFRDFFPEECALRNYITETWRSVARRYGFVEYEAPLVESTDLYRKKSGDEITNQLYCFLDKAEREISLRPEVTPSLARMATARQRDFKKPIKWFQIGPCFRYEEPQEGRGREFIQFNADILGDSSPATSAELIALAIDVMREFGVSADDFIIRLSNREIWSIFLADKNIAEEHTTTFLSIIDKIERARPEETEKKLALIGLTTAEVRAFMSSTDENHPAFAALRENLTARGLWQFIRIDATIVRGLAYYTGVVFEVFDLKHGLRALAGGGTYDKLCALMSDGGVDMPAAGFAMGDVVLGILLKRTPGAQMKLTSAYLAASSIDAFVVVADEAQRPHALAAVQSLRAAGIRIDYSFGSQKVGKQFQAAEDRKARFAIVFGAEYPEVVIKNLIARSQCAVPASGLVGEVQKMLAEPAVGPLIA\n>UniRef90_A0A078FTM1 BnaC01g23140D protein n=1 
Tax=Brassica napus TaxID=3708 RepID=A0A078FTM1_BRANA\nMLLIDWKVTTVNASRVPTFRPHLTAERYILSPDLMWLCCNPNFRLDVFVTLSMFDSNTVSFHKRLEAMRGDPRKWLEVVSILMPLQEHTFISIRRLMLERATFTSWSPLMKHGNGNSLPSHVPDALPGRGRGGDGLGTFPKCFRDSGDGKCFWGRVARCTHAVPVSINFKFSRFPSPYLSPYPFRCNIVLHRTGLPSAAPLLRGYAKVETLTISERNEFIITALTQDIDFICTGKVTSSKIEKMMMFCCLL\n>UniRef90_A0A369H8Y5 Uncharacterized protein n=1 Tax=Ophiocordyceps camponoti-saundersi (nom. inval.) TaxID=2039874 RepID=A0A369H8Y5_9HYPO\nMAAANPFWWPMTIHKDVRFFQGQPNAPPHPPEARRRKEKLYREAMRKDDYDWASAYALEPVVKDISCDESTCARLCLDAFDDEPGLGRGRRGVWGFWFDFEHGACPMKRCWLDNDWSRKEDVLHWKIGGDRAVFDGLGYPTRDVVLLPGAFIVESLIYSCGDGW\n>UniRef90_A0A7K6ALI1 Cytochrome P450 1A (Fragment) n=2 Tax=Upupiformes TaxID=57389 RepID=A0A7K6ALI1_UPUEP\nMLAAMKAAMSLVETQGIVSATEVLLAAAVFCLVFLLIQSLRQHVPQGLKRPPGPRGYPILGNVLELRKDTHLALTRLSQKYGDVMEVKIGMRPVLVLSGLDTIRQALVKQGEDFMGRPDLYSFQYISNGQSLAFSTDSGEVWKARRKLAQNALKTFSIAPSPTSSSTCLLEEHVSKEADYLVTKLLQVMEKQKSFDLNQYLVVSVANVICAICFGKRYDHNDEELLKVVNLNNEFGDVAASGNPADFIPVLQYLPSHTMKLFKDVNKRFNFFVGKIVQEHYTSFDRGHIRDITDSLIEHCQEKTVGEDAHISLSNKKIINIVNDLFGAGFDTVATALSWSFMYAALYPDIQKKIQEELDQTIGWERRPRLSDRSMLPYTEAFILEVFRHSSFLPFTIPHSTTKATVLNGYYVPKDTCVFINQWQVNHDEKLWKDPSTFNPKRFLNATGTEIKRMEGDKVLAFGLGKRRCIGETIGRWEVFLFLATMLQQLEFSLLSGEKVDITPQYGLTMKYKRCEYFQVKKRSPVKNS\n>UniRef90_A0A2E0V7U8 DNA-binding protein n=2 Tax=Verrucomicrobiaceae TaxID=203557 RepID=A0A2E0V7U8_9BACT\nMNKAELIETVQGSLGRDATKRSAEDAVAAVLGAIANGVRTEGKVQLIGFGTFAAKTRKARMGRNPKTGEPMHIAASKSVGFKPSASLKASLAEPTEPTPPSA\n>UniRef90_A8UFE2 Peptidase_M24 domain-containing protein n=1 Tax=Flavobacteriales bacterium ALC-1 TaxID=391603 RepID=A8UFE2_9FLAO\nMTRTIPVSGKYNDRQKAVYNAVNRVKKEATKMLVPGTLWEQYHVEVGKLMTSELLGLGLIDKADVQNENPDWPAYKKYFMHGTSHHMGLDTHDYGLLNEPMQANMVFTVEPGIYIPDEGFGIRLEDDVVIQDSGEPFNLMRNIPIEIEEIEEIMNS\n>UniRef90_A0A2V9IHY2 DUF4488 domain-containing protein n=2 Tax=Acidobacteria bacterium TaxID=1978231 
RepID=A0A2V9IHY2_9BACT\nMNRSLRAAVIGSVMLWLAALGLAAEKKPKSGPLTGTWECVSHGGPQGDMKFTLYLEQNKETVNGTVSSPLGSTELTSASFKKNTLEIHIDTDQRNYLLIGRYKDGQLAGAWSTNEDQKGTWEGKKSAQTTSQP\n>UniRef90_A0A2R6HCQ5 DUF4265 domain-containing protein n=1 Tax=Halobacteriales archaeon QS_4_69_34 TaxID=1919177 RepID=A0A2R6HCQ5_9EURY\nMIDGGRGAGEGAPPDVPHWDDEYVDRVSDRLLSNYDLEKDYRVRGEVFPLYGQLSMTSHKQFLHPALSYARHDSAEHLFVRRVGSVTVAELERLVALAHDLADEWIVADEEHFGTEFTFALVVPAIPDEVRAFVADFSDRTLLKYGYYGHYEVNLVVVAPGREAHVASEGADVWRAFAPWADTDGEQPGLIDRLLGVLGR\n>UniRef90_A0A3B9ERX6 Glutamine amidotransferase type-2 domain-containing protein n=1 Tax=Rhodospirillaceae bacterium TaxID=1898112 RepID=A0A3B9ERX6_9PROT\nMCGIFGIILKDRSAAPKDAFEHDLSLLYKASMARGRDATGLALHDSRNVHLIRRDCSPKQMLASDAYRRVVREGYAAQAAAPLAAFGQCRLVTNGSLAIEANNQPVVAGNVVGAHNGIVVNDGDLLPSEAPKTSAGGGTTALAETVHAANDTTRLMEAIDGALNRLGNLRRAVGEVFLRLEGEASIVVMSRLDGAMTLATNTGSLYFLSRADGSAFAFASERPFLRRLIAEGYVFTDVGDDAVVHLKPGEFLHLVPGRTTFDHGSLTDAAVAPDSGKQADPDNEPPVAAPVIRASNSAGGLLRCTACVLPHTYPGISFDDKGVCNFCRNHQHQKVHGRAALEQLLDKHRRNDGCYDCIVGLSGGRDSSYGLHLLKTEYGMNPVAYTYDWGLTTDQSRRNQAIMCSKLGVEHVLRAPDIAKKRRHVRKNINAWLERPRMGMVPLFMAGDKDFYQLGRDLKRDYEVDLTVFCSGSLLEQRQFFVGFCGVHDHVTYTARLYGYTPKVKAQLALYYLSQYLLNPRYINESFFDSVRSFFTSFLFKDDFLYLYEYIDWDEREIDRTLRDLYDWQSDSGYGRNQWRMGDGQTAFTNYIFHAVAGFSEFDNFRSNQIREGLIERDEALKLVEEDNQPKWGALEYFAYVIGINLDEVLARINNIPKLY\n>UniRef90_A0A7X7D244 Cytochrome c domain-containing protein (Fragment) n=1 Tax=Acidimicrobiales bacterium TaxID=2201156 RepID=A0A7X7D244_9ACTN\nMSDHESGGEPSVPEVPEPPATAATAAGSAERSQTRRRLRIASLTGVAVALAAVGAFAYKQIKPVVDAQRYATVTYEVPVAPQLTAASGETLLRIDPTRSSLTYEIEETFAGAKRSTATGSTAGIAGDLALNTARLEDSRVGQIVVNIEQFESDNNLRDARIRQDFLQSHRYPLATFDFEEIEGLSGQLEEGETYEFQMLGHVTVKERPAASTWDVTASYDDGVLTATATATAKLSRFDAGPISIAGLVQTEDEVLLTLELTAVEPSANDIATTVERAGRLEAGSQEAPSYEQVIEPILEQHCASCHNSGQFGAHTLTLDDAGDVQAVSDGLKTVTQTGYMPPWFASDEGVELAHKPTISDEEIAALAAWSDAGGPLDVDPETPLDPTKEAAELLPRQDQELRIEPYTGSL\n>UniRef90_A0A1F5NZ36 50S ribosomal protein L28 n=2 Tax=Bacteria candidate phyla TaxID=1783234 
RepID=A0A1F5NZ36_9BACT\nMITPMKSCDVCGKGSKMVGHRIKLRGHYNPTNWTRKYPNLQKTVTPAGEKAVACVQCIKTFAKPARPVKARVLAKTTASAK\n>UniRef90_A0A091DCM9 Spindlin-4 n=2 Tax=Fukomys damarensis TaxID=885580 RepID=A0A091DCM9_FUKDA\nMSPPAVPPTGIDGVSAYLMKKRHTHRKQRRKPTFLTCRNIVGCRIQHGWKEGNEPVEQWKGTVLEQVSVKPTLYIIKYDGKDSVYGLELHRDKRVLALEILPERVPTPRIDSGLADSLIGKAVGHVFEGEHGTKDEWKGMVLARAPVMDTWFYITYEKDPVLYMYTLLDDYKDGDLRIIPDSSYYFPTAEREPGEVVDSLVGKQVEHAKDDGSKRTGIFIHQVVAKPSVYFIKFDDDIHIYVYGLVKTPKKAVVTAAAWAVPSTIHHWRSGPPTKIIRKLRKITKLLCLQRMTTAFQIRTRSIAFSPQTPKLLEEIVGETDQAVAKNWDQGTYEDNLEGLRVFDKEGKGKVMGTEPRSVLITLGEKMTEEEVETVLAGHKDSNG\n>UniRef90_A0A4U3LSB8 aldehyde dehydrogenase (NAD(+)) n=8 Tax=Herbidospora TaxID=28443 RepID=A0A4U3LSB8_9ACTN\nMTRQIVSVIGGKDEPSGTPYVSRNPARLKEVVAEVALADAATFAAACRNAAAAQHDWARVPAPVRGRVIASIGRLVETNAEALARLVSEEIGKPYAEALGEVREIVDTCDFFIGEGRRLYGQTVPSEMPDKNLFTFRTPVGVAAVITAGNFPVAVPSWYLVPALLCGNSVVWKPAEYAAASASALHRIFSAAGLPEGVFNVVFADGEQTFAGLETALGEGTVHKVGFTGSSEVGRKIGELCGRHLQSPCLELGGKNPMVVMPDADLTLATEGALFAGFGTAGQRCTSLGTVIVHESIHSDFVARFTAAAQSAHVGDPARKVLMGPLLDQKFADRYEEFLTWIGDHHTVTGPVGRITEANPCGHFLGDDPNEGLFYHPVIVDGVRPTDRLFLEETFGPIVGVTTFSTLDEAIELANLPGYGLSSSIYTRDPQSAFRFRAGVSAGMVSVNNSTSGAEAHLPFGGNGKSGNGSRQSGMWVLDQFTRWQAMNWDYSGRLQKAQMDVAEITPDLEFTL\n>UniRef90_A0A250G1B9 site-specific DNA-methyltransferase (adenine-specific) n=4 Tax=Capnocytophaga TaxID=1016 RepID=A0A250G1B9_9FLAO\nMNDLKMNIPAKQSTKNKFGQYFTPEVIANFMISLANISNESKILEPSCGEGVFLNLLKEKGYHNLSAFEIDKELSKDFDFVRYESFISAKIDEKFDLIIGNPPYIRWKNLEEELKQELLKNETWNKYFNSLCDYLYIFILKSIELLSEKGQLIFICPEYWMNTTHSVSLRNYMVQNGYFEEIYHFNETPIFDKVTVSTVIFKYVKNCVRKEKIQISKYHSNKKLNNEILENLKNKKTFKDTYHFDIDQFKLNERWILQPEKLKRKLEVLENNCFKKNQSTLLSLFDENKREFHTIGDFCDIGNGLVSGLDKAFQINGCLLTKEENQATINVIKAKNINPYIANNITKYIYIEEGLEESEFIKKYPNFYLHFQKYKSQLEKRYQYNRKINYWEWVFLRNISLFKKQEKRIFVPCKERISNKNYFRFALVDKDVFPTQDVTAIFRKPNTSESIEYILAYLNTPIVFDWLKANGIVKGNIVEFSEKPISSIPFRTIDWSNGKEVEIHNFISESIRNYLKRPNELLLNLINESFSNLLCVK\n>UniRef90_A0A7J5EE96 Hemerythrin domain-containing protein n=1 Tax=Flavobacteriales bacterium TaxID=2021391 
RepID=A0A7J5EE96_9FLAO\nMTKKTPQKRATELVSLSHEHHHALVFCVRLKKASQTTPEITQNYVRYFWENHISSHFDNEEKYLLHLMPTAPLKEQFLSEHNEIRVLVNQLLTSAEEVMNNALLLSEKLNQHIRFEERILFPEIEKFASKKELQAVALQLNKSADCPVFFPEFWK\n>UniRef90_UPI001175E0D4 diacylglycerol kinase zeta isoform X2 n=3 Tax=Euacanthomorphacea TaxID=123369 RepID=UPI001175E0D4\nMEQPEEDQPPQHDTSLQDGEEPFTSTSVASSSSSSSSNTELPSVPPAPRCLHTSRTFTGLRIFCRRKALSKSGLQHVAAQPGASTPSRTDPLVEPSGTIDWTDNAQFGDHIWFETSGSGDFCYVGEQYCIAKTLQKSVARRKCAGCKISVHTMCMEQLEKINFRCKPSFREPGSRAVRESNVVRHHWVHRRRQTGKCRQCGKGFQQKFSFHSKEIVAISCSWCKQAYHNKVTCFMLQQIEECCSLGAHAAVIVPPTWIIRVRRLQSSLKSSKKKKRTSLKCSKSSKKGTEIQDGRWKPFLVKPLPSQLMKPLLVFVNPKSGGNQGAKIIQSFMWYLNPRQVFDLTKGGPREGLELYAKVPNLRILACGGDGTVGWVLSVLDQLKLRPQPPVAILPLGTGNDLARTLNWGGGYTDEPVTKILSHVEDGNIVQLDRWNLQVEPNPEARPEERDEHQTDKLPIDVFNNYFSLGFDAHVTLGFHESREANPEKFNSRFRNKMFYAGTAFSDFLSGSSKDLAKHIKVVCDGTDLTAKVQEMKLQCLLFLNIPRYCAGTMPWGHPSEHHDFEPQRHDDGCIEVIGFTMTSLATLQVGGHGERLHQCKEVTLTTYKSIPMQVDGEPCKLAPSIIHISLRNQANMVQKAKRRISMPHLNDQQPVPEKLQIRVNRISMAAYEALHYDKDQLKEASTPLGVIIVPGDSDLETCRSHIERLQDNLDQVDTATGQDQDAMKAECLSSQKLSPKWCFLDCTTADRFYRIDRAQEHLNYVTEISQEELYILDPELVLKETVGTSPGMPDLVDSYGEECQDHQRQFAFPCSPSSPSSSTTPRVRDCQRKRISSDSSVAEALAQSSSKTTLCRRGAKILNVHRSNTTLADFRPMLSSTSATSSDTEKELELINCVKTEDLDRLMELHQQGADILLQDSRGCTLLHHAVEAGSKDIVKYLIGNVPTSHLDITEKETGETALHKAATSCQRTICHILVEAGASLMKTDLQGETPKQRAEKAEDQELAEYLENRQHYQMIQREDQETAV\n>UniRef90_A0A396NWZ4 PBSX family phage terminase large subunit n=3 Tax=root TaxID=1 RepID=A0A396NWZ4_9FIRM\nMSDLTKLIAPSFYGVHHDIKAGRHTHYWLKGGRGSTKSSFISVEIILGMMQDAAANALVLRKVAVNLKDSVYEQLLWAIEALGVENLWQAKLSPLQLSYLPTGQRILFRGADEPKKIKSTKFRKGYCKYIWYEEADEFAGMQEIRTINQSLMRGGSSFFVFYSYNPPKSQSNWVNRECLQPKANRLVHTSDYRRVPPAWLGDAFLQEAEYLKELNEKAYRHEYLGEVVGSGGAVFDNVTVEEITDAEIAAFDRIYNGVDWGFYPDPWAFNRMHYDAARRTLYIFGELTRHRTGNAETARLLRQYGVQDTDLITADSAEPKSVADYRCYGLFCRGAVKGPGSVDYSMKWLQALVRIVIDPVRCPDTAKEFTAYEYDRNKEGEVISGYPDRDNHHIDAVRYGTEPIWKRRGQ\n>UniRef90_W6SGZ7 Putative MATE family multidrug efflux pumps n=2 Tax=Clostridium bornimense TaxID=1216932 
RepID=W6SGZ7_9CLOT\nMENTISESSFSKSIIRIALPITLQSMIRSSFSIIDQVMIGQLGSESIAGIGLGGKFASIYSVVLGAITATAAIMISQYMGQKNVKNVRRSFHVNLLVALFITVLFTFASLLFTEQIFSFYTKDSVTKELGKSYLQIYAWSFLPIALSGMAEAMLCCMEMAVFPLVASVSSLFVNTALNYILIFGKFGLPELGVKGAAIGSVVAQIISCLLTLVFLLWQLRKKKMNLSFDIRFNGNEYISYIKILTPLLICEFMWSLGENVYSAIYGNISTNDCAAMTMTSPIQGLMIGALCGLSQAAGIMVGKSLGNQNYEKAYNDSKKLMKYGLIVSIALSILLILLGKVYTGIYNVAAAVKQTAYALLVVFAIVSPVKVQNMILGGGIIKSGGKTNYIMWIDIIGTWGFGVPLGLLSAFVLKLPIIYVYFILSLEECVRLAISLILFKRKSWMQKI\n>UniRef90_A0A8B8PLS0 segment polarity protein dishevelled homolog DVL-3-like n=1 Tax=Rhodamnia argentea TaxID=178133 RepID=A0A8B8PLS0_9MYRT\nMTTDIDSNSYFTETEDDSMSCSNYSETTCDTFISQRRNRYYNERSNGRSPNHHHGNQDTYRHTNSRARNIDNISQSSSSTTTSASQSDATAVHCITVYLVLTNENFLGLHIYANTLEGRDEGIYVDGVTENSAVALDGRIEPGDKIMQVNDVSLEELDNEEAVKVLKDAVIKRGPLKLVVAKFVDNNKDPVNGIVDPKEAIHPIDTAAWVAHAQAITMPRISSEMANSATSSPSFGSNAQDTDCIRPASAGMSRLNTGLRLNKATTDIQEIIEHMRMPNIGLEIKDREWLKIHIPKAFLGSDLIKWLERNVYGFSSNRDAKKFASRLLKEGYIRDPISKKSFNSKSYYTLEA\n>UniRef90_A0A6L9YVB8 Efflux transporter periplasmic adaptor subunit n=1 Tax=Moorena sp. SIO4A3 TaxID=2607836 RepID=A0A6L9YVB8_9CYAN\nMPIASCLARSAITVAAAAEVEATKGVITAMASLQQSQASVRAEQANQARALASLAQAKADMKKAIAARNLAETEMKRYQRLWQQGVVSASDRDRAVTQFQDAQAAVEAAEAGIVSAQSQIRAAQASLEAARGELIAAQAQIDTAESAVSSAKAQLNKRNVILKDTVLRAPFDGIVAYLNIREGL\n>UniRef90_UPI0020C880D2 PfkB family carbohydrate kinase n=1 Tax=Alsobacter sp. 
SYSU M60028 TaxID=2962936 RepID=UPI0020C880D2\nMDALFIGQTYIDVTFLADRMPTGDEKSVARDYAVSFGGNAVTAAFCCAKLGVVPDLLTSLADDWLGRMFLDMAAKYRISVHGRKVRESSLSFVLPNNGKRAIIRCRDDHYLHPFPILNIGNIRALHLDGHQGDAAMHYARVCRERGVLTSLDGGGLRENTHDLLGFIDVAICAERLAEQMNLSPEGLLAYLKERGVKIGGVTMGEKGMLWYDEQGVIRRQPPLAVPASAVIDTSGAGDVFHGAYVYSAMQRPDAPWREHFAFARAASTYKIQHLGNEEGLPSLADIERIVSEYREAA\n>UniRef90_A0A4R7D5Q2 peptide-methionine (S)-S-oxide reductase n=1 Tax=Maribacter caenipelagi TaxID=1447781 RepID=A0A4R7D5Q2_9FLAO\nMKNVNKVGFGGGCHWCTEAVFMSLNGVIKVEQGFIAPKEHLTSFSEAVIVDYDSNVIELKDLVAIHLDTHRSTENHSMRNKYRSGIYFFKQEDELVLKEIMTDVQQDFETPLITAIFPFGAFKSSEDRYHNYYFKDTEKPFCKTHISPKIKMLKEKYAKHVSAKVQ\n>UniRef90_A0A2J6HZN0 tRNA dihydrouridine synthase DusB (Fragment) n=1 Tax=Marinilabiliales bacterium TaxID=2053303 RepID=A0A2J6HZN0_9BACT\nMSGTDNLYLAPFQGITGAVFREVYTRYFVGVDKLFTPFFTGIYKKKNLTTRSDELDKIHHNKIPLVPQILSKDADEIMRFGEFCSEKGFTEINWNLGCPYPRVANKKRGSGMLPHPKMVAEILSRVQGHLPVQLSVKCRLGYHTPDEIFKLIPVFNQFDI\n>UniRef90_A0A3G9IWN6 Uncharacterized protein n=1 Tax=Paenibacillus baekrokdamisoli TaxID=1712516 RepID=A0A3G9IWN6_9BACL\nMAAEPMIFIFTGTSGSGRKTIAKQIGSELGLYHVLSCTTRVPRATEGQDRDYHYISHDEFVELERSGQLLQSTTIGKERYGIRHQELDRALANGKHAYLILNSEGASLFKNLFKDRVIRIFIYVDKQTVRERLERKGTPYDVVDRYLDQYTEEVVYRKQCEHTIENVELIRTLEQIRTAINSHL\n>UniRef90_A0A661X5S4 Ion_trans_2 domain-containing protein n=1 Tax=Caldiserica bacterium TaxID=2052147 RepID=A0A661X5S4_9BACT\nMRIYLFLFFMVGVSILWLWFLFFITRKLTGAKVIAVIIIALVGLVVFFGIKYYSFYLYDPKSFYIIPAHKLTYGGVRLFDFIYFSFVTITTLGYGDIIPLHTLTKILTILEVLMGVSFVGLILGRIVIKRES\n>UniRef90_A0A2M7LC39 Copper chaperone PCu(A)C n=1 Tax=Sphingomonadales bacterium CG_4_10_14_3_um_filter_58_15 TaxID=1974093 RepID=A0A2M7LC39_9SPHN\nMNKISIMLAASASLLLASCGQGDVLYADKAVVNLSPVEGNPSAGYMNLHGGRTDVALVGVTSDDVLRMEMHETVEKDGMASMNQLKEIPVPAGKTVKLEPGGKHLMIWGVGAGSQQRGLLKMTLIYSNDDRIEIDAVVKKVGEAAPAVE\n>UniRef90_A0A6H2DTH0 YbhB/YbcL family Raf kinase inhibitor-like protein n=1 Tax=Mycoplasma sp. 
1654_15 TaxID=2725994 RepID=A0A6H2DTH0_9MOLU\nMIKIEIKDVKDGVLDTQFGNANLGGKYKNTVSFPIKWSKVKDAKSYAITLVDLEASGAMGIVFIHWIAANIKTNKLSWDFSFEHKDKIYQFENSITDKAENYLLKAFYTEHPNGVYYGPFPPDQDHNYEFRVYALNVDDIFGSHPQLKNNNLFYDDFINLIHNKVIDQGFTTFLYRAKTKINADYTLEKLDKSPKELNAPLKKEKQNFYAIEHPVDFQIFSNSLEKINDNTFLLDINNLMSLANLGYFHGKELELQWNKVDSVQEYVILLYSIAETKTLGVGLVEWVKVGIRSKDFPNNVISSLNSKESVKISNTFSSISLFNIAKLADLDETAFDYIKNGYGLCYIPYLTNNQGNYILNVYGLNQEIDWEQYQKELNRELNLADVYRKIKSKVIAKSEKIIKISPTLI\n>UniRef90_X1LS14 Ribosome-binding factor A (Fragment) n=1 Tax=marine sediment metagenome TaxID=412755 RepID=X1LS14_9ZZZZ\nASIKKLKEEKTVISFFLIKSFLNKKTFAFLNPNLKRSIRIKIADRLPVKIKISFLSK\n>UniRef90_UPI0011132975 hypothetical protein n=1 Tax=Enterobacter kobei TaxID=208224 RepID=UPI0011132975\nMISYKVEFPTQKTVGFKVNGYSSAEGLDCKMVEAIGGDVKVQLDQKTMLTVPYREDITADFTLEGYKQRAETYAKTMIDQIVNAAQHRAADDLIQEVTNAVVSSELFSQLS\n>UniRef90_UPI0004D08E5E LOW QUALITY PROTEIN: U7 snRNA-associated Sm-like protein LSm11 n=1 Tax=Galeopterus variegatus TaxID=482537 RepID=UPI0004D08E5E\nNVLTRMPLHEGSPLGELHRCIREGVKVNVHIRTFKGLRGVCTGFLVAFDKFWNMVIKPFSRAWGTSXRLNLLYLFDRLKLQDSSKKEADSRSAVEDSTLSRYSQTSTWKVASVWGRGDTDRGSRRRSRSVPSSLQASAREESRSEMSGRTTRTEGSSAGGTFSRATTLSRGQSCKKKRKPKVDYQQVFTRHINQIFIRGENVLLVHLAQ\n>UniRef90_A0A8J2R764 THAP-type domain-containing protein n=1 Tax=Daphnia galeata TaxID=27404 
RepID=A0A8J2R764_9CRUS\nMVRPCCICGIKKNSEAATKGIRFFKFPSTKSESHSNWIKTIRHHSTKISRPFTPRRNSIVCSSHFEDSCFNRSYRKLQLKQGSIPTIFNFDDSSKKVFSTACDVTSKADEEKEGNTEGNVSSSSLRDYASDGSSSLSPPVLLPLQDVNSDFEETIEDPPDLELYHINHDYDESTGLTSFADLDMIKMDHIGSVADILGPDPYMQDESIVMDERPDSSVGEERDEVDGQTILSFTSAEEMHEFAHREASSRLTKTNDFRQIKGWRNKFQQLTPSLSPSPCSSPVSLPARSAISASENSKSPLPTHFSRLCQNPSTSFEMKNLKENGASCEKNSPNLDTQQRPTSPVEEGCIVPSEETAETTEEMANSSLESTLPLPDLIAHSEETKETFQEERKEPLEEGMKKSLEDERKKPLEEETKEPLEEETSELLEETDELMEETAEPSDESTEAFPELGIDGLISYDYAKFAASAACFPFDEKRGKTFKKADNSLTASKKVSPRPKNSATRTRINKQSAVQHVQILPIVDIDEIPSGDMTGFDDSMEEVVVQEEEYVEVYDVPGNLVLPTADCGQLFCRLGCICDILIKTKNRTKVSVEHCGLPECMLQCVCGYQKGKPSSRKCFASLLKGNESFYSKINWSGERRRRERRVPERFSEFHLGNESSSSVSNRSSEEFKQVESKSKNNSHHRAGNSHSSRSSSPFKNASPPQSHSVSPQSVQDSLPCPPKNRKWEPFRVKVCADEIKLLRWDSFVSLSKVYIAPDHDIFCMEHTMYGCPCIETDRRIIRIPSEYVPLPVIDTTKNTENKSPTSSAKKVKAKNVTSSPSAKNVAKKHTNPNMRLAPKSKVMEENAAPAAPQEPVAKTSSLSKMRKILSDERFQLQKLMTEEKTRAFDEEVDLTVRQGQTVQLVAWIRFHRIYHAGRIHIRFLSRRAGPVILVMRPTEIVAADITCDIQDMKGNTNSPEIVKELLDPCISPEETSRYAFLLCDGVKWELVGCLSLKASNDAPPPTSTVPPASLDTPTLFPSPPSPQHSISTTEVPSVVLDEQNAQQKRVAAQMKFLARCPPRTRDEVSPDPSAIQRSSALELKRMQLEERLSVINSKLTLQPPKQSVSFKQFKNKSRASMAPILQPIIPTVSVVETPVIVEELPPSSLSAADPSIQAPRPKTVRRAGKRKPDMTYLIPDQCILPDDPEEMPVVSLTEELPEAQPKKNSQNLPDSVVSQEGKDPNQTLYPAAEKLAMFSRLIINSRNDSMSGGNFSNFEDSSMTASKLSRPAKRPPPKLERIPTPPLPVAVPLPLIAPESTVPNIPPSEMTFIKLQPIGSSLPNGISGQNTVRRIRILTPNSTVNGGSGNSLLPVLTSRNGWEPNLIQQQRLHWSSKGVKPPVNAKITPTPVISDSLITVLPVPTSLGTGQNVSTLTSSCATNASDIVQFIGPVPNQDGKTPAITSDLQVPDWSTQLLMKANAVASTSISLAGVKLLQQKQRGKSTSPPVVNAEPSKETESTSCVFPKIFTAEVITVKSPPGNASQRLKIIYEAMVGQHRDFCPSRASMILPLHNVDDQWCIVAINQVPDSGFQVPGVTVFIPRDMLGRAASAAMERKARVSFPLHFKLKNDGSALKSGFEVYGTPQLPHHVFVGPFPFNYIESCTPLSMMNNNVCMFVIKLTKPIPVSVSDCAKEVQQLKPTEQTEEVIQSTETKSTVNTPEPISETSPSTIEEVSVTSTPVSSNKSSSEADHTASSEATEVSESTLLNTKDSESAEIQIVDEKINSNPKSLSQLPGSSLLRQPIQSESVKRTKKPIRMFVARTPGLPPVNIKLFSENSVVVDHPFLSGEKKMFTSLEKAKTWLQTLAIRNCNVEVKKSKTSNSAEDSWANSDFTEDEEIDVCGQTQGESQEQEETVDSASTTSRSPKRIRRLTEKARILAASKSKSSRNSGSTTSSFKRSQDKLPLPRKVGSSRKNSIQRMLHIQKEQERRGLL
GKLIRDLDALCASSSGTRAKIVVLKNATILVGQLEQQAKEMEALYQNLKEQRTTLLTLREQIFNKLPPNASQIFSCFMESVPLPSRHLAMIENNRIKRYRPQVPDRQSQNRVAVIVPNNALLSESVDVAQGGYVLTGVES\n>UniRef90_R8UAD6 HTH cro/C1-type domain-containing protein n=1 Tax=Bacillus cereus VD184 TaxID=1053242 RepID=R8UAD6_BACCE\nMEIKKFIALTLFDLRNDEGYNRENFAELAGISLNAYASIENGKSLIKIDTLHTLLSELSLPLSVFFRRVEAKIESSK\n>UniRef90_UPI0021CAFDB3 AAA family ATPase n=1 Tax=Acidiferrimicrobium sp. IK TaxID=2871700 RepID=UPI0021CAFDB3\nMAIANQKGGVGKTTTAVNLGAGLAELGYRVLVVDLDPQGNASTGLGVNARNLEASVYDVILHDVPMEDVIEPTTLRNLFVVPATIDLAGAEIELVPAFSRELRLRRAVESVADDYDFVIIDCPPSLGLLTVNGLAAASEVVVPIQCEYYALEGLGQLLRNVNLVQTNLNPRLEVSTIVLTMYDARTRLAEQVVGEVRQHFGDRVCRNVVPRTVRLSEAPSFGQPIIVFDPSSRGAIAYRELAKEVSGGAAQRVG\n>UniRef90_A0A176TEJ0 Cytochrome-c peroxidase n=1 Tax=Polaribacter atrinae TaxID=1333662 RepID=A0A176TEJ0_9FLAO\nMKKLILSFLIIQLISSCTKEDVYEPFIFYNPEIEVAIPVNFPELNNSFYTNKPTKYGVKLGEKLFFDKKLSANNTISCSSCHIQANAFSDGISEAIGIYGRVGFRNTPPVQNMAFMQFYNWDGNKQALESQPLVPIITHEEMDSSILEVISKLETEEEYLHLFYNAFGDSKITGDRIYNSIAQYEYTLISANSKYDKVKRNEGETFTENEILGYKTFQDKCATCHSTELFTDQSFRNIGFPKNPNTDEAGRARVTGKTEDISRFRVPSLRNIEYTAPYGSFGQFATLKEVLDYLDNGVLEADNLDSVLKENNNQIPITEEEKDNLILFLKTLSDTDFIGQ\n>UniRef90_A0A5C6S3D4 SDR family oxidoreductase n=1 Tax=Phaeodactylibacter luteus TaxID=1564516 RepID=A0A5C6S3D4_9BACT\nMDFTGKRVLITGGSRGIGRAAAVAFARAGARVAINFHSNKEAAEEAIKAMPGNGHFAVRADISKPDAVFRMVGAVAEELGGIDILVNNAGVFFPHPVAQSDYAAWQESWSQTIGINLMGAAHTSYCVARQMMGQGMPGKILFVSSRGAFRGEPEHTAYGASKAGMNALAQSLAQELAPYHIFVGAVAPGFVETDMAAHVLDGEGGAAVKAQSPTGRVARPEEIAHCILFLATEGAAYATGCILDVNGASYLR\n>UniRef90_A0A1V6YXR8 Abhydrolase_3 domain-containing protein n=4 Tax=Penicillium TaxID=5073 RepID=A0A1V6YXR8_PENNA\nMSSIYAPAWDEFVQEIGPLLMTGSTVEDLYKDSEVNIQKIISKYEIPPPDNSVKTEDIKLNYAWIRVFTPPSATGNEPVGLFMHGGGWIMGSVDHEDAACRHITKSTGMKVVSIGYRLAPKFKFPRGLNDCVEATLWTLKHFSLSSVVLMGGSAGANLAFGVALRLIDAGVGDKVRGIVALVPCTVHPDAVPEDKKEHFTAYQENAVHTVNTLAAMKCFLDSYAPPPDDKYFSVLLHPRLQDLKKVYIVECGTDTLRDDARLMKGALEEAGVPIMYDDYPGYPHYFWSYPSPALAKASEEFHTNMFRAIKWINME\n>UniRef90_A0A0M2PUS6 
Imidazoleglycerol-phosphate dehydratase n=2 Tax=Prochlorothrix hollandica TaxID=1223 RepID=A0A0M2PUS6_PROHO\nMTAQGIAVFDIDGVVRDVGQSYRRAIADTVEQFTGGAFRPTLDQIDGLKAEGIWNNDWLGSQELIYRYYEGQGQSRESISLTYDEVVDYFQRQYRGANLEDPSQWDGYINQEPLLMGAPYLQQLAAAGIAWGFFSGATRGSADYVLQRRIGLQFPPLVAMGEAPDKPDPLGLLKVVEQLTHSLGLSPTLPVLYAGDTVADLYTIREAQSQAPDRPWWAVGVLPPHVQEPGPRRQAYEQRLWDAGAHRVVSRVTDLTPGAIGQLFREGA\n>UniRef90_A0A1Y4NII1 Topoisomerase n=2 Tax=Lachnoclostridium sp. An169 TaxID=1965569 RepID=A0A1Y4NII1_9FIRM\nMPGVTKEQIQQARETDLFAYLQFHEPTVLKRDGPNYRHREHDSLVYVTGKKYWYWNSRGRSINALDYLIEIRGYDLVDAVNQLLGTDTRSVSIPKSSRAVTDQERNVAGEQRKQGNPSAESFSLPWARRCATFAVSYLRRRGISSEVILKCFRLGIFYEARYKGEAVCVFVGKDDEKKARFACMRSIMGKLKKDVYGSDKRYSFCYPPEHPGSRQVAVFEAPIDALSHATLQEVEGWKWDGYRLSLGGTSGVALFSFLERHPEILRVTLYMDNDLAGLVNARKIRSALHKDPMFKHIRVGINPPRTGKDYNEKLLCRLQQIKEDPDVSRQKEAAISI\n>UniRef90_UPI001AE5D1C9 PTS transporter subunit EIIC n=1 Tax=Vagococcus allomyrinae TaxID=2794353 RepID=UPI001AE5D1C9\nMNAFITLVNKRVTPFATKLSRNIWIASLQDAIMSTLPLTLVGSVISVLSILNSYFPKFPDLSPISSFSFGIIGLAISFVLPVYILQRKKMDNKKNLAGIANVGLYLMLVLAQINENGELVFAGDSFGSGGMFLGILSGYFTAIIFILLAKFTFFKDSEAIPDYIVSSFDSFMPILIILTIAYLVVFTFNINFFEILTKILLPLTNFGQSYLGLLAFVFVTTILYSFGISPWLLYGLFYPIQLAGIAENTQLISQGLAATNINTGEVVQGLITLGGMGTTLPLAFMLIKSKSARLKAIGKAGIVPSIFNINEPIVFGAPIMLNPLLMIPFWLNSFINPTIVYFALKSGLVAIPTKVFNLWFIPAPIQGYLVSGDWKGILLSLVVLAVATAIWYPFWKAYDLEQLELEGEAK\n>UniRef90_A0A1X9YSF4 Conjugal transfer protein TraG n=1 Tax=Pontibacter actiniarum TaxID=323450 
RepID=A0A1X9YSF4_9BACT\nMQTGENAQALRKIIDMTRLISLTLLILHAYVHLYRAFAAWQLTWPLLDRLLDRVLASGLLDGFHRSKFLALGFLAISLLGTRGRPSEALRPRTGWACLAAGLLLYTASSLFLYLPWPVTKAALGYLALLTTGYLLMLSGGTLLARVVRLRLQRPDIFNRANEAFPQEERLLENAYSVNLPARYTLRGKLRRSWINIINPFRGLLVLGTPGAGKSYFVIRHVITQHIRKGFTMFVYDFKFDDLSRIAYNTWLRQRPHDPVPPAFYTINFDDLSRSHRCNPLEPATMRDITDAAEAARTILLGLNREWIRRQGDFFVESPINFLTAVIWYLRCYRDGEFCTLPHVIELMQLDYDSLFTCLRTEKEIEVLINPFVNAYLHDVMEQLEGQIAAAKVAMARLSSPQLYYVLSGNDFTLDINNPDAPKIVCMGNNPQKIQVYGAVLSLYVTRLVKQVNQKDKRPSSLIFDEFPTLYLSSMDSLIATARSNRVATCLGLQDLSQLRKDYGREQAEVIAGIVGNVVSGQVTGDTAKQLSERIGRILQDRASVSINSSDTSVSRSTQLEAALPPSRIAGLSSGEFVGLVADDPDCRIERKAFHSEILNDHAALQREQESYLPLPQVRQLDQAVVQKNYRQIKQDMEELVSSEMERLLQDPSLRHLVIRK\n>UniRef90_A0A4U1HMG8 Asparagine synthase (Glutamine-hydrolyzing) n=1 Tax=Polyangium aurulentum TaxID=2567896 RepID=A0A4U1HMG8_9DELT\nMCGIFGYVTKKRAVGGPRALGAALRALRHRGPDDEASIELTSGDSRCGLAHTRLAIIDLSPAGRQPMSTADGRFTLVYNGEVYNHPELRKQLEALGVSFRGTSDTEVLLEAFARWGEAAIPRFRGMFALGIWDADRRSLLLARDHMGIKPLYFTAGPDGLAFASEVRALVAAGFAEPRPSRRAIASYLATGSVAEPDTIFEGVSPLPPGTILEYTDAGPRLSPYWELPLETAPPADRASAIEDVRATLADAIRLRLVADVPLGVFLSGGMDSTVIASFAARASSRPLNTFTVTFDEEAYSEERHAAEVARRIGSEHHQVRLSGGETMKSLPAAIDALDQPSVDGFNTYFVSKAARAAGLKVALSGLGGDEVFAGYASFSRFGPLLAAGRAGRRMMPLFDRAARALGKPFGALPQRGRKLLDALRAGGSPEKTYGVMRSMFDLGQISALLSPELAHEAASLPLNVPERLEPLVERGAMDPENAYSALEISNYLRNTLLRDTDVMSMSHALEVRVPLVDHVLVERVIRLPGDMKVGGGLNKPLLAAAAGDLPESVLRRPKMGFCLPFAEWMKGPLRGWAEEALLGEATRRLGFLNADAVARLWRAFLEGDRRVSASRVFCLITLAAYFGSHEALF\n>UniRef90_A0A6C0E3C4 Methyltransferase n=1 Tax=viral metagenome TaxID=1070528 RepID=A0A6C0E3C4_9ZZZZ\nMQFWKNCLQFFNLVKSTEQQGVSETEASHAKAKAEEPSKEPEVEDEKVKDVVAQESPIEPEVDHVEAEAEAEAEEALVEPEVAHVESEAEAEEALVEPEVDHVESEAEAEEALVEPEVAHVESEAEAEEALVELEVAHVESEAEAEEALVELEVAHVESEAEAEEALVEPEVAHVESEAEAEEALVEPEVAHVESEAEAEEALVEPEIAHELELNTYFNNDPFEYFRSEHTQEKDLLDSDSE\n>UniRef90_A0A4R3GCS8 Conjugative transfer protein TraD n=2 Tax=unclassified Rhizobium TaxID=2613769 
RepID=A0A4R3GCS8_9HYPH\nMARTSTSDARKKDTREKIELGGLIVKAGLRYEKRTLLLGALVELKQRLGDDAGERLRLTLIGAKAFGDDA\n>UniRef90_A0A150G0L4 Myb-like DNA-binding domain containing protein n=1 Tax=Gonium pectorale TaxID=33097 RepID=A0A150G0L4_GONPE\nMARKKKCHDAKAQKKHSVKGTNTAWSDGEKLILAQAVSEVMPGAANADNIDWPVVARAVPGRTAKQCREKWLSDLRPGIKKGAFTLKEECVLIMAHSKFGNMWAKIAKYLPARSANAIKNCWSSRGRAKELQKVHTLLYLYILLVDVASKEPQEAGRRGKRRREGEDGAAAADNADAVKKAKEEYRELAAAHKLVPLKAFLVDIDHYLSDADGTSPAMRDPRPEIWIMGRGKSRVPVAGEVDRNRCLPLGHDDDDDDDDDDDEQTTTNGNGSGNDDGQRHEMPCDERAGGRPRAMPPVPSVGPGGGGGGGGNGDGGGNGDSCGAAMAAWNASEGERKAEAVDEGSAARGKVGRKGSAGSTARDGSHSFRTAATSNASAGAEQAVPLLEPPSGAYHPCVGGAIGTGDSGALGQQRTESPQHPAPFVFASYGMPGPLREALDAAERTARPQGPQGPQGPQGPGDASFEACLRTLGQRLAERDEQLGRRGGEGGDGGGGGGGQEGDWLCPLDAALRGNAREGGRGRESTPGRDLRRGRRASWSGGAFPSPSPPSFWDTREIDAHFAAELGHPLPGSGFGEADHHRDTPQQQCRSDCACGFHATGCPAAQAAAATQAWAPAPAPVPGWGRVSAGAFHPQQLAPALQNQLIQTPPATAAPSYGSVLPFHSLPGLTAPWEPHHQPPPPLRPATSAPAPFALAALSEPGLVPQQHYGLHGGMTAAPGVAHQAGGGVAGAGAGGAYAAAAFALAPPQPPQYMMLPPRPVWQHGPRLEVDAIRRARFHAEALM\n>UniRef90_A0A7X9ZMZ4 Endolytic murein transglycosylase n=2 Tax=Sphingomonas sp. G-3-2-10 TaxID=2728838 RepID=A0A7X9ZMZ4_9SPHN\nMIVLILVALAAGFGVLQIWAGPGPSRANVSVIIPEGASLTRAANELEKAGAIRSARVFVVLSQVFGGSEPIKAGEYRIPAGLRQSDVLAMLQGGKTLQRMVTVTPGTPSILVYEALMKAPHLTGEIEIPAEGSVLPDSYAYNRGDTRQMVLDRMQKAMVNYLAKAWEKRAPGIAVNNPRDALILASIVEKETGKAEERGLVAGVYSNRLKRNMKLQADPTIIYPITRGKALGRRILRSEIDAVNDYNTYSMTGLPKGPIANPSRASIDAVLNPAQTNAVFFVADGTGGHVFNETYEQHDAAVQKWREIRRQRGEIQ\n>UniRef90_X5MP23 NADH dehydrogenase n=1 Tax=Candidatus Phaeomarinobacter ectocarpi TaxID=1458461 RepID=X5MP23_9HYPH\nMGIRVSDVAFVRFQAPDLDQMEAFLSDFGLVRAARTEDALYMRGAGSDPFVHVTHKGEPGFAGIAFLADSVADLEVLAAMEGASPVEDITEPGGGKRVRFVDPNGHKVEVVADRELVPTLPVRRNTPGNEATHSQRVDAALRSGEGPAQVMRLGHCVLNVIDFRQSEAWYKERFGLVTSDEIEIEKDMSIGAFMRCDQGDKPVDHHTLFLLGTGAAGFNHAAFEVANVDDLMAGNSHLQAKGYTHEWGVGRHFLGSQIFDYWRDPWGHTVEHWTDGDLFTSDTPPNMQGIDTLLGVQWGPPPPPTLGT\n>UniRef90_A0A259M653 DUF3298 domain-containing protein (Fragment) n=1 Tax=Hyphomonas sp. 
34-62-18 TaxID=1970392 RepID=A0A259M653_9PROT\nMNHPLNRRVAPLAAVFLLGLIGACGEPPKPDASDTDHGEATVEDYVRGPHNGRLLEDGAFALEMTIFETGVPPQYRIYPYKDGAPLDPSSVDLTVKLHRLG\n>UniRef90_A0A060AF13 Flagellar FliJ protein n=1 Tax=Staphylococcus phage 6ec TaxID=1500386 RepID=A0A060AF13_9CAUD\nMNYIERIYSELVDLKGTVNILQIEMKEINSKFEDILIKIRETEFNVSQSVEMYKRLQEFLQERRLLRAQIEEMEVQYEILGGDEQLKKYEKALDFKEVKKDREFKKDKKYYRDKKYYNNFREDLKEKAIDLYHIV\n>UniRef90_UPI001F0D41BD helicase-associated domain-containing protein n=1 Tax=Arthrobacter silviterrae TaxID=2026658 RepID=UPI001F0D41BD\nMAHFGWHHPRPARRVAKALAGFLSEAELLGLSGAGALTDHGRAIVHRDWDGALALVAAALPEPVEHLLLQGDLTAVAPGFLAPELAAELALLADPEGRGAAGVYRFSAASIQRAFSAGRTAEGILSFLAQHSATPVPQPLEYLLRDAQSRHGRFTVGQAGTYLTAEDAAALAELLAGGAAAALELTAISPTAAVSPRSAAEVVSALRAAGHSPGIAPGTPLAAGSDDGGTRRGTTSGAPRSRDRAAQSGPEMLAPHEVARLLAEEADETFEGGAGPDADSGAATAAVVLASAAEAAAAAQLGLLRSRPAWTPGTGESAPALALEQLHAAVRGKQAVWLTAVGSDGHPERRQLFPVSVAGGRVRVFDPGSGRERAIGIHRVMGVEIIAKGKGAP\n>UniRef90_A0A6G0IZR0 Cilia- and flagella-associated protein 300 n=1 Tax=Larimichthys crocea TaxID=215358 RepID=A0A6G0IZR0_LARCR\nMAGDESDVERAFRLRYGRHRDNTAQMSHVLRYITDGGVKEHFSQFGDVSGDKLVKFGSFWRTEPAPISAAKIRECQHFFSHLSGLAAFFTKSAKRTKLLDEICHAKTACLVCTVYERREELVELFEFVVDSHNDFDDDAVHSMALLTGFEFCFLLATFNSVFSFSDMLFGILQNKEYDMQFCLSSIDDFCSTTEREKVKFDSINEDTVREVGGPCGHRAQRVGDVRAVYQQVYCAFEIVL\n>UniRef90_A0A2R6KP62 Cation transporter n=2 Tax=unclassified Halobacteriales TaxID=38063 RepID=A0A2R6KP62_9EURY\nMSRASSLRRVGALVLVANIGLFAAKAVVWQTTGSLAVGSEAANSLADSAYSAVVLAGLYLTTQPADADHPHGHERIEPFVSLVVAGGIFLAGGAVAYNAITTVLSGSVTVSRGPTAAVVLAVGGVVKFGLYRYVLGVATDEQSPALRATALDNRNDILAAGAALAGVLGAQVGVPVLDPIAALAVSVAIGYTGVEVVRDNLSYLVGGAPPEELRAEILSRALDHPDVAGAHDVVAHYVGPEVDVSLHIEIEGATTVREAHEIETAVVRAVGETPEVDDVFVHVDPKELDEWKTDSEVDRLAVFEES\n>UniRef90_A0A6L5DZ66 CHAT domain-containing protein n=2 Tax=Marinifilum sp. 
N1E240 TaxID=2608082 RepID=A0A6L5DZ66_9BACT\nMKNILKKILLFSLLLVFLSGENLNLAHNSILFSVSEVKTNPDSLLVQQFDRAFQFLRKGDFQYAEQSFRNATNTIENGIVNNKILVYRTYVNFGVLLGRIGKSQEALKYYNLSEQFTIDNFGVNSQKLVPLYVNMGNIFAEAEDLFKAQTYYEKALNLIGNAKSRFLPKIHNNLGTVYYKKRQYNLALQSYKESLRLKELAKTGDKFSSLNGIANCYKRSGNFNEAELFYSKSIYEIKRIGGDNSYQLGDVYLNYAVFQNESKNYNKVLPYLTLAYKVYSSNYGLKHPDTAHCLFNFGDWYHDTNKKYDIALEYYQKAIVSELDNFQDSSIYINPNLNEIEPQLSILQILKGKARALKSLYSTSNKISDLDFGLQTYDLCLNIIDKIRIGYQDEESKFYLSKNEKDTYTVAIEIAVELFQLTGDVSYKEKAFKYAERSKAASLMSSLNDVNAKNFGGIPQELQDEEIQLRKDIASYREKIYEERKKASPDRKKISDWQGVLFDLNEKYNQMVLRFEEDYPEYYALKYDNHTIDIEELQSRLEDNDVLIEYSISDSALFTFTITSSSFEVTRQNLDKDSFESHLEEVRNCLKTNDFAEKSADYYKRYTKSAFHLYKELFQNQPNNLDNKNLMIVPDGKMAYIPFGVLLKNEADSTRMNYRGLDYLIKSNTITYHNSATLGFSIESAGFSFSSNKSVLAFAPSYEDVNDSILYAERAYRDKLYPLPGVKEEVNNISKVIPGDLYVDDFATERNFKDHASDYDVLHLAMHTIIDDENPMYSKLVFTQVEDTTQDGLLNTHEIYNMNFNARMVVLSACNTGDGKLMKGEGVMSLARGFFYAGCPSIIMTLWTVEDQTGSNLMTNFYNFLSQGLKKDEALRQAKLEYLKTADPLKSHPYFWSGYVTMGDVEPLYDFNLKSNIAYMAFGSLGLIFLLIAFRRFRAKKMTA\n>UniRef90_A0A1H7CBQ7 Negative transcriptional regulator, PaiB family n=3 Tax=Paraburkholderia TaxID=1822464 RepID=A0A1H7CBQ7_9BURK\nMYIPAHFEENRLEALHRLIADYPLGSLVTVGPNGLDANHVPFEFDAGKGPHGTLRAHVARANPVWQEVAERPDALVIFQGPSAYISPTWYPSKHETHRQVPTYNYMVVHAHGPIVVRDDEAFVRGLVARLTRKMEAGEPVPWKMGDAPADYISQMLGAIVGIEIELTKLTGKWKLSQNKASADRRGAADALNERDSDEQRAVADAMLAAPPNLD\n>UniRef90_A0A1R3VCA4 MOSC domain containing protein n=10 Tax=Mesorhizobium TaxID=68287 RepID=A0A1R3VCA4_9HYPH\nMQALTEIGTVSELWRYPASSLAGERRDVISVGSETIDGDRLFGLVDASDGEIARPDREAKWHKVPLIRARLSQARQLEIATPQGDWLPAPGAECDGAVSAFLGFAASIRPFRQKDAPDYAGLLTAERYRKAPIHLLTTASLARLKALHPEGVADPRRFRPNIVVDVAAIEGSFPETEWIGRKLAIGDLLLTISEPCRRCGFTIIAQDGFDHDAAILRNLVRHNAHNFGVYCTVDRPASVGVGEMMRLV\n>UniRef90_A0A4C1WBZ0 Uncharacterized protein n=1 Tax=Eumeta variegata TaxID=151549 RepID=A0A4C1WBZ0_EUMVA\nMPATFRTANPGWVHAATPTRKEDADMTNARVPRDLMLFSRSTSLAAGLRRFSQRLKLSPTNTARAPPAGMSTGDNPWRPPTDFDAKAAFDLIEFDHLSYVRLTHCPPLLSSDL\n>UniRef90_A0A4Y9ZGX7 Fip1 domain-containing protein (Fragment) n=1 
Tax=Hericium alpestre TaxID=135208 RepID=A0A4Y9ZGX7_9AGAM\nMRGWFVHSFLAVAELRVEPGRGSNGTASEIETHVGEIVRRAKRASDSRLSFRCRFDQHTLEGEGSPGQLPTTMDDDDFLYGGSAEPEPVPTTPAPEPKPVVAAIEAETIVPDIPFGKREPSSGPITPLTPLDVKDESRNGSVIPPDIGVVVQEAAVMEEVVQVDAKMETEEQEQEEEEEEVEIEEESEDDIEFIMEPPTRSLDLRPSRPVQPRVPSATATFTPTKAPLAAGPSLTTEYTPRERGAPPKPAVTXPSAPPSVSVPPSLPPGPSAEPMQPEQPKIEEGPEPSTLPLVTAPPSHPQINPDIPGTLDGRSILDIDLANMSEKLWRRPGADISDWFNYGFDELSWEAYCYRRRELSDVSSMLKTNVL\n>UniRef90_A0A515EVL7 DUF502 domain-containing protein n=2 Tax=Rhodoferax TaxID=28065 RepID=A0A515EVL7_9BURK\nMVWLPLAITLWVLLWLVGLLDAVFASFLNGLSAVTPESLGPRLERLHAIPGLGVVLVFSAMLVTGALVSNVAGRWWVKQWDRLFTNIPIVKSIYNSVKKVSDTLFSSNGNAFRTALLVQYPRQGSWTVAFQTGSPSGEVASHLGADFVSVYVPTTPNPTSGFFLMLPKADVIELDMSVDEALTYVISMGSVAPGAQASKIPVSQ\n>UniRef90_I9LJW7 Phage_Mu_F domain-containing protein n=1 Tax=Pelosinus fermentans B4 TaxID=1149862 RepID=I9LJW7_9FIRM\nMDADSKAIIVQFLATVDKILLDGDFTTSKMLDLNKAILTLKNDYTKLIREGTVKATESAKKLKGVEFKAYKAEVQRLLSAQEVAAAEQVFILGKITAEFGGGLDAKVIDSVWNKVWPDALNVDDRIKRLSAKVKEFTERTIKQGISEGNSAANISRILREHFVIEGLEGKAAFRLAAHTTNMVYQATQAEISIQATFVMGIRIVRGMFGKISPKCPICYEHGGDSYKEYFKSYFGGRDIDLWVLANMPPYHSNCSCGIEQITEDAITFIQRARTEYALKNA\n>UniRef90_A0A7R9TH37 IPPc domain-containing protein (Fragment) n=1 Tax=Micromonas pusilla TaxID=38833 RepID=A0A7R9TH37_MICPS\nMAMGAGARASSIEDAEGPHPLTKAWAGRIKNAKVRAAFMDEPIAGYTSARDLKVLCGTWNTNGKSPPADLDVSRWLDASSRPDVVVVGFQEIVPLTAGKVLAVEDDKATREWEAIIERALNDAATTATTTAAAAAAPKNAAAFASDTSWQRAGQPPRTQTPQSAAGWTSFDSPGVSGGGGGWTSFDAPAFPGAAAAAAGRDRYIRLASKQLVGVYITVYVNASTAEHTRDVRVHTVSTGFNIGLNLGGFKTPDITLGNKGGAAVWMRVYSTPIVFICSHLSAGSKEGDAEKRSADFGEIVTKLSFPAPPSASSDGVAEKPAGVADAHAAVWLGDLNYRLNLPDDRVRAAIASGNCASLLGSDQLLLERAARKAFVGWIEAPVTFPPTYKYRPGTNTYSGAGDAGAEDENGGGGENGDAGGARVKVSAKEEKKKRTPAWCDRILWRGRDIRQNSYARAELTQSDHKPVLAEFTIVARELQPERLQETLDSLRRRLDAEEAASQPRCTLENPQADFGDLKHGETKAISFRLVNSGDVPARWGFVPGGA\n>UniRef90_A0A2W4M120 Oxidoreductase n=1 Tax=Proteobacteria bacterium TaxID=1977087 
RepID=A0A2W4M120_9PROT\nMRLAPRVGFLGVGWIGSARLASLAASRTAHIAAVCDPSPEARARAHEVVPEASLFEHYEELLEVPLDGVVIATPSGLHARQCVAAFERGLAVFCQKPLATSAAEVQRVIGAARASDRLLRVDFCYRHTRALSVARELVASGELGPIHSVELVFHNAYGPEKAWALDPDLAGGGCLMDLGVHLVDAALWVLGSPRVERAVGRRFREGQRLAPHSSTLEDFAVGLLDLDGGVSASLACSWWSSFGDHARIRAEFLGARGGVVVENVAGSFYDFACDRLRNATRERLVSPPDDWGGRALVSWVAELRASPKYRPEPELLEVARSVDLLLGRDPTAASASEPERVDAAGVV\n>UniRef90_UPI00140DB29E hypothetical protein n=1 Tax=Psychroflexus maritimus TaxID=2714865 RepID=UPI00140DB29E\nMKNLSYLLFLFPVLCFSQIDLSPILTSGLEDANKFTSSYLEPGLDAVAFNLSNGWYSSAKAKGLGSFEIAIIGNASFVSEDQQSFELNTNEYDFLEFSDGSSAKNVANVLGENDPSITALSVYTDEFGNEQTVSFELPDGLSGSGLNFVPTAALQANVGLVFGFEAVVRALPEVKSENNKFRFYGFGLKNEFTKWIPGTKALPISIAGMINYSKFDARFALEETVLINGNDQRIDLGLETWAIDLIVSTRLPVINFYAGGGYVMANSTYGLNGTYQINDGPNSGETIVDPISNSSSLNGYRATLGTRLSLGIFKLFADYSFQEFSSVSVGMGFGI\n>UniRef90_A0A0S4HPD3 SLT_4 domain-containing protein n=5 Tax=Pseudomonadaceae TaxID=135621 RepID=A0A0S4HPD3_9PSED\nMKQWRTWLPVLMLLTLTGCATPPPKDQNNLCNIYREYPDWYEDSLKMQEKWGTPQHVAMAIMKQESSFISDALPPRDYLLWVIPWGRVSSAYGYAQAQDPVWGEYKNGTGNGGSRDNFDDAIMFIGWYTTGTQRQLGISKWDAYNQYLAYHEGRGGYRNGTHLSKPWLIQVARKVEQQSQSYNSQLKLCRQALEDNRSWFF\n>UniRef90_A0A392UKT4 Ig-like domain-containing protein n=1 Tax=Trifolium medium TaxID=97028 RepID=A0A392UKT4_9FABA\nMVTIPNFKAPGANLTVRCKSRNISNNSCWLAITAEHADTLFLLKASATTFAFPG\n>UniRef90_A0A231P0P2 Aspartate 1-decarboxylase n=4 Tax=Desulfovibrio TaxID=872 RepID=A0A231P0P2_9DELT\nMLKILRAKLHGIRVTQCALDYHGSITLDPEVCRLAGILPLEFVYIWNKNSGQRISTYVIFGEAGSRCCILNGAAARTCQIGDEVIIGAFEYVSGPQDICHREPVVLTFDAQNRIEERLRYVVAQDGEDMAFSIVPDPL\n>UniRef90_A0A8H4AAK2 Nucleus protein n=3 Tax=Gigaspora TaxID=4873 
RepID=A0A8H4AAK2_GIGMA\nMPDESGHKRQRVSKACDSCRRKKVKCDGVQPVCGNCSTFNLDCTYNDATKKRGPPKGYIEAIETRLHRMESLLGGLVHSNDPFAEAVLAELMQDDPRPSRRSGNMEFTWKNGSLSTHGDTGRSGGSEVQSPENVLTSEAKDNSIDDLNEIMGILSIDENRQVRYHGRSSGFYLLKNSERYKNGILSLSDNSPKENLISTQNLESLKRPELTTLPPQEISDHLLETYFTHIHPLLPIIYKPIFFNRLKDRNNPPFLLLNAIYALAARYSDRPELRKVIQDSQTAGDEFFDRAKALLDNDYDKSHITTIQALIIMAIRDIRIDNTTRSWIYIGMAARMAQDLGIHRNNEKWQPISLSHEEKEEQKRAFWSCFVIDRIASTHMGRPLGIDEKDVDAAYPSEDEDDEYELLPFKMIHATSSTLLSSPASTNSSVLGSPMSPASTIINKDSPNAAHSVSRFNCLIKLCEIMGRIIQNIYAIRCNVSSANSTVTSILDSSLTSWYVNLPPHLQYNSSSDQHYDTTTLNLHGLYYSTLILLHRPYANTIGKNPSHNICTTAANAITDIADLMRQRKQLRHSPTTVIYCTFSAAVIHTYNAIQPDITISQPARVNLEKCLKILGDLITIWPLTYKYAVILTELANLRDAQLDVNMEQKNDGSEDGFNSRKHINPPIILDQHERQARYHPLNNKIITSHNNKGSSTQSQMFNPVSLNHSQTYERHPVMGFGNPITISSQSSSSYNQTQKSQLQLHHDLPESAQMFNNPFGYRYITSSTADQQTQHTMGGTDPYAAPGVVSTNNRIGNDTINSINSDLWFSQNAELNERSSYFGSQQMQQSVSPFSSPPSLHSQPQALMQIPLLHDDGNDVNMFADNHAFAAIGVGNCGNRRGNTSPVYY\n>UniRef90_UPI0013A69B69 DUF2079 domain-containing protein n=2 Tax=unclassified Actinomyces TaxID=2609248 RepID=UPI0013A69B69\nMTAARLRPDRPLTRLLDGLPAALAVVVGAAAMIVYSVGQWRAMQVPSWDLAIFSELAKAYSRLEAPVVPIKGEGYNLLGDHFHPLLVLLGPVWRLFPTPLALLVVQDLLLAISAWPLTRLATRLLGRLAATVLGLFYVLSWGFQGAVASQFHEIAFAVPLLAWAAVAFVEGRWRSCALWLAPLVLIKEDLGLTVLMAGLAIALRGWQGAAQQPTHRGPAWWRRLSTARLGVLVALFGAAAFLLTVLVLLPALSPSGTWEYGLTGGGGADTSLIARLLSSEVKLQTLGALVGTAGLIGLTSPWMALVLPTLSWRFLSSNEFYWGWQNWHYNAILIPIALGALLDAVARLQAAPDAPATEVPGTPTPGTQQPDPEAPHATPGWSAVPMWARWAAALGVVLPLATGLLTLRDLPLWSITRSGYGAPSPRTQAAAQVMDLIPAGASVETDLGLLAYLVPDHTVYWVGTSEVDTDYVVVDSLSSAWGGNPPTDAAAWATGQSQNGAVYELVLDEGGYQLARRVS\n>UniRef90_W7AVG7 RMI1_N domain-containing protein n=4 Tax=Plasmodium vinckei TaxID=5860 
RepID=W7AVG7_PLAVN\nMKRLIEKNVIKINYNTFVNQYKKAFKCEKDIIDEELYEHFIINPFTYSRPFGCLLPNYNNTETYYLNGINIFEVVDYVNINERLYKVENSGDNEDDSDQNEDSFNFPDNSGNEDTIDYSNSEGEYGNGNKKGKKNKKSNKNSESIKTKGHTKGTNRNINSSNITQAKKSNNKYRRIFRFLLFDGKYFIYAYEYEYNEIFNYLETNKYKYPKIILYNNPVIRRKVILLKKNQVIILFKGNTTIEQNSSSIKDEEECYDITDINKKSYFNYTNKQEELIPISTKNESNSYNWSGNYNMPNQNRHRNDDPNYLSRENNVRNFYYEDNKIKNTYTNSGTTKDEKNYNYFHNNNNSKGYNRFTLQENNNNSDKYEHFKSYTPLKQAPNFNENVHNKNFTQTNSPNNNPNRIWINNQSNINKDSFHTNNSNNNNQLIDLTEGFFSSKFFQKSPDISNTCDDVIILDD\n>UniRef90_A0A6I7QQX8 ABC transporter permease n=1 Tax=Spirochaetaceae bacterium TaxID=1898206 RepID=A0A6I7QQX8_9SPIO\nMFLRMALLNLLKHRRRTILIVFAIMVSVLVMEVMAGMFEGMRVNFFRNLTRESGHIQIHAPGYRDRLNPFTLDYVISGYEEITAALREIDGVLEAEEVLHFGALLEHEGRDLTMAGVGVRKGTRFYRDVREGIRGGTFPGDDAQADHTASGVLLSVAVARLLNLEQGDRVNVIVEDSTGSPYYLQLPLTGLFETSSPDLDEYTFFIDHESAQDLVYLEGGTIEIRLRLLHADEADAVAARIPGHLRRAGIDADLDVRTWRELHGGLTSLLEMMDFFILAMNVFVIIVVASVITNAILMNVFERMRVIGTMRAIGLKRRSAGAMILAEGAIQGVIGSALGLAAGIPIVLYFSVNGLDWGGISEAFGMGSSYYYFGYSLHNSVISALGGVLVALSGSLYAAWVGMRLTIMEALHHV\n>UniRef90_J4S719 Universal stress family protein n=5 Tax=Burkholderia cepacia complex TaxID=87882 RepID=J4S719_9BURK\nMHRHPFKGHAMYSNILVALDGSDTSSRALDAALDLAAQTGARLTPVYVVDFLVPAYDTFGYDPSILIDAFREEGLRVTEDAAHRMTARGVTGTPQISNVAPAGEDIAHRIVTVADDIGADLIVMGTHGRRGFRRLVLGSVAERVLRQATCPVLMIPASCASKASADTAAASIEKEPS\n>UniRef90_A0A849MVB4 Uncharacterized protein n=1 Tax=Roseicella sp. 
DB1501 TaxID=2730925 RepID=A0A849MVB4_9PROT\nMTLVFIALLALSWTGLSLAVLAMLMKRLGPPRQAAWRAFGLSLAVNTMGAAYATPGEPLSAVILILLCHALLLPPLLLAARREGQREGQRP\n>UniRef90_A0A1G9RLY4 NlpC/P60 domain-containing protein n=2 Tax=Actinomyces ruminicola TaxID=332524 RepID=A0A1G9RLY4_9ACTO\nMSPFKSLHRCTSTAVSVSAAAAAALSIAVALPAAPAQAVVQFDTTSDLMSASGLSGTVYTAGDEAADDGAGMSFSVTNTLPDGIEGNIAVPLADDTWAVPQGLPTSPTREADSAAVEDLISRAQTFYDAGGQLIWDSSRPTPLTGTVVRDSTTAPYGVTCSTFVSMVLLGWDYQHTTYTADTNTQVGYAVDFGVDPTTSKIWRANNLASWFYANGDLWLETDGNYQRGDILFFSEQDPEGRIDQVRSGAESTYFGNVYHAAIYLGDGMLIHSTGTGNGVNITTLNPLLEADLSFVARPTFTAEAANTGQAAESGDDATAQGETTESAGDDAAPTETTGSEGQDSSQDGTTGTTGTTGAGGVRAVTPVSPNRQYSRPIEDHRGWMSR\n>UniRef90_UPI001F24B592 CHAD domain-containing protein n=1 Tax=Streptomyces sp. GQFP TaxID=2907545 RepID=UPI001F24B592\nMAQQHLEPTDPTTAGPVTADALADYLRAQATEFLRALRLHRETGTASSAPSAEEPVDAARALRHAARRITGTLHTFRPLLDPTWSETMHPELAWLSGTLAREHAYAARLERLLLALQRLSGAVPLPAQAGVAVGSRSARAERVGTAEPGTAGPPTHPATPDRSNLTVGAAKAGALLERQLTLARTRAHSAALQALGSSRFHAVADNVAVLASEVPLTPAATTTPTDLRPLAAAADERLCDAVNALPLLTAGHPYNAEALVHGLSPDPAPHPQDAPWHHVRLLLRLRRYAHEVLDGDEARVDVRMLTAGTALNRHRDASEAAAAAAAAARTPRIAPATAYALGVLHADQRHEVEAARFAFQQSWEKKAMSTR\n>UniRef90_A0A0R1J1V1 N-acetylmuramidase n=3 Tax=Companilactobacillus TaxID=2767879 RepID=A0A0R1J1V1_9LACO\nMPQKRNYNRRRRRKNKYNQPLIIFLTIIILLGAGVFGFRRYSEYKQEAQTEQVETEHNAFVKKVAPYAIYLGKEYGVLPSITIAQAILESDWGRSTLAKDYNNYFGVKGSDPSNTKVLQTKEYTDGQWVTINGRFRVYSDYRESMKDHAELLVNGTTWNSQQYQQVIHSKDYIEAAVALQTDGYATDPGYTSKIIRVIQKYNLKKYDEGIK\n>UniRef90_A0A1Q6SW29 Glycerol-3-phosphate cytidylyltransferase n=2 Tax=Firmicutes TaxID=1239 RepID=A0A1Q6SW29_9FIRM\nMNEKQPVIGYTTGVYDLFHIGHLNLFKNAKGMCDRLIVGVTVDELVEYKGKKAMIPFEDRIEIVRSCRYVDAAVPQYDMDKLTAARKLGATVLFVGDDWYGTEKWKKYEREFAEYGIRIIYFPYTKGISSTKITEALNSVRRDDLSDLK\n>UniRef90_A0A4V6IDT8 DUF4309 domain-containing protein n=2 Tax=Chryseobacterium taihuense TaxID=1141221 
RepID=A0A4V6IDT8_9FLAO\nMKRRIIAFAVLFLFSAGIYFLLYHKDKNLNFIPENADAMILIDKKKLTRQYLSAFIAHPSQWFIESSESEKKRSVFKAGLKIPDFLQIFHLKNSKLTEWYAVFDIENPQKLLVFLKEHKFKNLGQNLYIKDMLYIKIADQKCYAGISGHDFEKIGRPLNGIFGDKKLNADHFMEEGTGSLSFISGTRTRNFSIELKDREIEIKNASNIENYASFISQLSKEDLFINAELNKENIKVFNKVLPDFFKDLSEVNHLKMNAKLKQVKDTIISYGYDDDFNEIEEISYQEIVQPDYMIQLETQDPAKIWKHFRSENLINDKNEFTGIPFQPNRVYQSDNGIVIKSVTEQSLHSQKKGKNFILIKNDPLLFSFSKGLNDFKYLKDIEYFFYGNKGQDFFLTLKLKDQKLPLILQ\n>UniRef90_A0A4R2KRA3 Purine hydroxylase delta subunit apoprotein n=1 Tax=Marinisporobacter balticus TaxID=2018667 RepID=A0A4R2KRA3_9CLOT\nMFRINFTINNKGYTVDVDEALRLVDLLRDKFQLTGTKEGCAEGECGACTVIMDGRTVQSCLVMAFQADGSNITTIEGLEREDGLHPIQRAFLDAGAVQCGFCTPGMVLSSKALLDKNSNPSREEIREGLSGNLCRCTGYNKIVDAVALASKYLKEEESDGASENSRK\n>UniRef90_A0A0G1RJJ4 S23 ribosomal protein n=2 Tax=Parcubacteria group TaxID=1794811 RepID=A0A0G1RJJ4_9BACT\nMDKLSNNGKYDLEERTAKFAECIIDFVRTIKQDAVNRRIIDQLVGSAGSTGANYCEAVEAESKKDFIHKVGIVKKEIKETKHWLRLFARANPERAEEMRKFWKEAHELLLIFSKISRSSRGQ\n>UniRef90_A0A0Q9NGW8 Helicase n=2 Tax=unclassified Arthrobacter TaxID=235627 RepID=A0A0Q9NGW8_9MICC\nMIDNDEIFEEAPASLQDLIDNDLDGLLNVPEKAKKVTSSDRLERAFLEIVEFRRTHERLPSSATREIAERKLGARLEGILANDEKIAALKHLDTEFELLAVEAAPESLDELLDSDDLDDLLGDDSGILDVSDLPVIKRPESPDSVAQRVKAEDFDLFEPLFKAKHAELAEGTYSLVPFTGMDLIREGAFFVLSGVMCFVAEVGEDVDLIVGGKPRQKQRLRLVFENGTESAMYKQSLMTRMYEAQGQVLARTGHDATEALDADVESGHIYVLQSLSKDPVVAGMKDLHKIGFSTTKVETRIKNAAKSPTYLMAPVKVLADYRLYNVRASWLEHLLHRVFAEVRLDLTQVDRKGRDYDPSEWFVVPLETINKAVAMIMSGEITDYVYDAQLKKLVERQQAGWE\n>UniRef90_T0Z4L1 Delta-aminolevulinic acid dehydratase n=1 Tax=Leptospirillum sp. 
Group IV 'UBA BS' TaxID=1260983 RepID=T0Z4L1_9BACT\nMSYAVKYASALYGPFRDAMMSGPQFGDRSSYQMDYRGIRDALREARLDAEEGADILMVKPALAYLDIITRVSEGPDLPVAAYQVSGEYAMICAAGQNGWIDQDRVMIETLTAIRRAGAQMIVTYFAVAAAKLLSLRP\n>UniRef90_A0A8H7V2K7 ADF-H domain-containing protein n=1 Tax=Mucor plumbeus TaxID=97098 RepID=A0A8H7V2K7_9FUNG\nMSLNVSDSALIDKYEDVRDDKSETNWVFFDFADGKPDRLQVAGSGNGGLAEFVAQLKPEVAGWGYLRMNMSNDEYSQRIKFVLVPWCGEKVGIMRKAKLSIQISDVKNVLRNFHIEVPASQTSELTESEILTRLRRAGGANYDRQSSNY\n>UniRef90_A0A538BAD3 Trypsin-like peptidase domain-containing protein n=1 Tax=Actinomycetia bacterium TaxID=1883427 RepID=A0A538BAD3_9ACTN\nMQMFTAGSQCTANFVYYDGTNVYVGQAAHCSGTGGNTETNGCTSGTLPVGTQVDVDGASKPGVMVYNSWITMQRLGEKDANTCQYNDLALVKLDPSDVASVNPSVPHWGGPVGLDTTGTTPGEKVYSYGNSELRGGVSQTSPKEGTSQGDTGAGWSHTVMTYNPGIPGDSGSGFLDATGNALGVLSTIDVGFPTGVTNGVGDLAKELSYLHAHESSFASVQLVDGTDPFQAGTLPGLGGLLGGLGLA\n>UniRef90_A0A2E1DI39 Two-component sensor histidine kinase n=3 Tax=Flavobacteriaceae bacterium TaxID=1871037 RepID=A0A2E1DI39_9FLAO\nMRENNISLSSRIFYYMMVFIVVESIMIAGVTLYQFNNQNSEYHEGRLERKEKNLLTDLKYEIDKSGINSIDALSNSMILEVADVHNLEFELYSLEGFLLKSSTALTGVRGTTIIDQQIVDYFKNENPSRYVEDDTNTNYFKSSYNLVTNFKNEPLGIIYIPYFADDTSSKQELTGFLIRLGFVHGNMILIAFVIAYFISNFVTKSLDSIGETIKKTNLQNQNVKINIDNTPREVVALIDSYNTMIDELKSSAVKLAKSERETAWREMAKQVAHEIKNPLTPMRLSIQTFERGFSKGQEFTKERIKEFSDSLIQQIDTMSSIATAFSDFAEMPEPKKELLNVVEVVGLAIDIFNKDHINFNSSNKVIQANFDRTQLIRVITNLLKNAFQAIPEDRTPEIKVSILEKDDNVNISIADNGYGISKTDTEKIFEPSFTTKSSGMGLGLSMIKSIISAYNGNITFSSKSNVGTTFNITFPKN\n>UniRef90_UPI000DC13EC3 piggyBac transposable element-derived protein 4-like n=1 Tax=Melanaphis sacchari TaxID=742174 RepID=UPI000DC13EC3\nMTRNRFFELRSCFHVVDNKAIPKENSDKFVKIRPMYNSFIKRCAQLPVEQNLSVDEQTVPFKENLSIKQYIRGKPSLWGIKNCLLCGQSGLVYNLLLYQGSSTQIDENMQKNFGLGGAIVLKLVENVKPNKHFLFFDNYFSSYNLFCCLLKYKILAAGTI\n>UniRef90_J4GUB1 Zn-dependent exopeptidase n=1 Tax=Fibroporia radiculosa TaxID=599839 
RepID=J4GUB1_9APHY\nMAGNKPSAKLEKQPGTIPAPVVSSPAPARGRCLLRRTVLVGIAAIATFYYVGSLVCQINREINAQQGLWLAKAFGGHSQKGFKHKAAPFGKVAEEIFLAVPNPASALATSRQYATAPHLAGSEGDYKTATDFLALLQSELGISASSPLPVFPAGSSESRGATLSITSSSPSKPSAWIDVYYPVMNTPLDRSLEILDEDGNAVWAANLEEQADETDSDAGKYADAVPTFHGLSRGGEAAGKLVYANYGRKQDYDALVASGVELNGTIVITRYGGIFRGLKVKGAQDLGAVACLIYSDPRDDGTVTQENGYEAYPNGPARNPTSVQRGSTQFLSIYPGDPTTPGYPSYENSTRTEGTNIPTIPSLPISWANAKVLLDEIEEGGGNRTISLVNHVDDRVIPIWNTMGVIPGYIKDEVVVIGNHRDVAHCIRAAWVLGATDPSSGTASIHEVIRGLGVLLKQGWKPLRTILIASWDAEEYGLIGSTEWGEDFADWIDEHVVAYVNLDSSVSGSSFYSAASPSLSHFMRSAAETIAHPTKPGLTLWDATKDKGPLYGNHIDAEALSVYEEEQAQMAADDLGVNVLGSGSDYTVFLQRIGVASTNNGFKSTLSDPVYHYHSVFDSERWQELYADPGFLRHVAIARFLGLQTLRLADSIVLPLNTTHYSVQLDAYLDKVEQLRSSMALDVDFSSLRESISSLRAASVALDNEKSEAESELRHLIRRIARRKFVRDHIRKAWCKLRKIFRKPCKHRKHEAGEEYGHRGNEEHARPRAGHAHPASPARTIEGRTVKPRVGRWAGMLKEQREREHGRDSADKHVRGQKCHIEAHDGKDKELREAFVRAVKRVRAANKKLVAFERGFIHPDGIRDREWYRHLGVAPGKWLGYGATTLPALTESITFDANATMAKYEAGRLKVLFDKLAEEIQV\n>UniRef90_L7KPS4 DUF697 domain-containing protein n=2 Tax=Gordonia aichiensis TaxID=36820 RepID=L7KPS4_9ACTN\nMDDVRAQPSTLDAVGAQSGQTSVSAGGRVVVAAAGGVDVEALVEACREVGASRGAPTIDFVGFDSDHGHAATSAAVFVIDPASAVVDDEEIAVLHELTAAVGNVALVCGRIESFWDWPRIVRGYRAELDPDELLPVFAVSATAALAGAVDESGIGDLIEWFSTPASAVGDGVAAGTPTPAGEVMSVGDARMRADALATRRARLLAQRDRGRSDRLASLRAGIVRVRAQSSADIATRVRELAAGAEHRSNAVTNADVEATATWLDREIAGLVADIDAVTHARLDAVASSTLVGLDVDDPPVQRADEPMGTRRDVPSGRRTGEDAMVLVIGASTGIGIGRLAVAPLASVHTLQWISMPAALLLGLAVAVWVIRMRRAATTRAQVRTWVGEVLADARTRVERRVAMVLSEAESRIGGQLLRAYERQGRRIADEVAEIDERLRELRTAVTGRSEK\n>UniRef90_UPI001C5DEC67 DUF917 family protein n=1 Tax=Saccharothrix obliqua TaxID=2861747 
RepID=UPI001C5DEC67\nMREISAADLPALMTGSRLLSASTGFIVDACLDWVAELVDRHGPVPLVGVADLPPESPCAAIAMVGSVTALAELPPTGEEPELAVRALEARLGHPLRAVMPLAAATVNALFPIAAAAVSGLPLVDCDGMGRVLPLIQQSTYALAGLPLTPLAAVGAAGDVVVVDAAATRADPLLRAAVTTAGGWMLCAMNPTTAGHLRNAAIPGAVSRLIDVGRVLRTAADHTALLDDLTRVLGAKLLGSGRVVELSHDTRPTGPGLPANPTSVAVVEYTGAGRLIRLEAQNEFLLATVDGAVAAAVPDLLCLLDRRERRVVDPESVVVGDHVDVLVIPAAPVWHTPEGLRLAGPRAFGFPVGHPREGISP\n>UniRef90_A0A653DFF8 CCHC-type domain-containing protein (Fragment) n=1 Tax=Callosobruchus maculatus TaxID=64391 RepID=A0A653DFF8_CALMS\nMESFVAPPRKTNFMEPDLAYVQVDEDRSIVDQGSSKANSTSKQFRCYRCNQPGHRAAGCTAGMSKKKKPKATDESLTNSLGFTQICSLENNSKSIAELLKENEELKEIIQQNQAIISEKEKLINQLLKENDHLQSHYNLINSNIIEKDTIVGTIDKITKRLENLEKQPSPISYASVANKQLGTPQKSLKKLVIKPKGKQNCSDTKKDLNKNINLSKLQIKIEAVNDTRDGGVELKLQDKYVNILKNEMDQVLLRKYEVMEEKKILPKIKIVGYKTREKPTMEEIKEKLIRENYFLHEEDIRVTYLNYIVQHNYYTIHAEVSG\n>UniRef90_A0A0F8X3M4 Glyco_hydro_2_N domain-containing protein (Fragment) n=1 Tax=marine sediment metagenome TaxID=412755 RepID=A0A0F8X3M4_9ZZZZ\nMLLYNSPDLQFSTMNLQRSTEKIVFCLLLICLQTSLLKAEKTDTGNPRTSYTINEDWSFTPQGLAFGYRPLAKDPGAEIISLPHTWNTQDPFDGKYTYRRGISWYRKELVVSEKLKGKRLFLYFEGANQVSDVYINSVFVGQHKGGYTAFAVDITDYATFGREEPNLIAVQVDNSHDNHIPPLSVGYALYGGIYRDVRLIATSPVHFKVSDHASSGIYIATPEVSDKMARVDVRGTLVNNTNE\n>UniRef90_A0A3Q9BJ05 Cytochrome P450 CYP721A63 n=1 Tax=Panax ginseng TaxID=4054 RepID=A0A3Q9BJ05_PANGI\nMNPFLLILLLLVISLLKFIHKFIWIPLSIQNHFRQQGIRGPNYRPFFGNTAEIRRWMMAEAKSSRTDFNHDIVVQRVMPHYYNWSMEYGKNFLYWFGAKPRLAIAEPDLIKVILMNTNGAFRKLKLNPSASLLFGDGLIELVGEKWAVHRRITSQAFNMERVKDWVPEMVASTMKMLDKWEEERGGRDDYEVDVHKELNKLSADIISRTAFGSNFEEGKRIFELQDQQTDLVLQAVRSIYIPGFKFLPTKKNRMRWRLDKETRHSIRTLIERSYTTQDKTKCLLTLLTSPYKNQENEEERLSSEEVIDECKTFYLAGKETTANHLTWTLLLLALHQEWQRKAREEVFQVCRNGEIPTADNLMDFKIINMILNETLRLYPPPVMLMRETCKNVKLGGFDIPAGTQLLLPMAAIHHDTEIWGADAKEFNPMRFAGSRKQLASFFPFSLGPRICVGQNLSVVEAKIIIAMIVRQYYFEVSPSYVHAPRQLLTMQPQFGAQILLRRISE\n>UniRef90_A0A6L5FCG8 Thiamine pyrophosphate-binding protein (Fragment) n=1 Tax=Acidimicrobiia bacterium TaxID=2080302 
RepID=A0A6L5FCG8_9ACTN\nMTTVGHQVGLAVASFGARYAFGVVGSGNFHMTNGLIDGGSVFVPARHECGAATMADAYARTSGELGVVTLHQGCGLTNALTGITEAAKSHTPMLILAADTSSGAERSNFNIDQDAIAASVGAVPERVFSGSTHLDDLIRARNIAMGTGATVVVNVPIDIQTEEVPRQPDPTPFAPGPPLSPDDDSVEGFGRLLENAERPVFVAGRGARSEPARDSLLALSEQAGALLATSAAAKGLLVGSPWNLDISGGFATPLAAELIMGADLIVGWGCSLNMWTMRHGRLISQGTKVVQVDTDADALGAHRPIDLGVLGDVSETARAVSGTVSHGETRYRTDEVAQRIAEEGRWRDVPYHDRGDGERIDPRTLTIGLDDILPADRVMGLDSGNFMGYPSMFLDVPDERGFCFTQGFQSIGLGLATTIGAALAQPHRLPVAAVGDGGILMGASELDTVVRLGLPMVV\n>UniRef90_A0A2J6L521 XH domain-containing protein n=2 Tax=Lactuca sativa TaxID=4236 RepID=A0A2J6L521_LACSA\nMEEMENTTDDEKTTSLKASILSKYDEVFHAHTSDIKKVNEKITVDCEKFLQYYEDSCSQMEASSKSLQQQEYEITKKELKIQKAKSKQELKKRVRERLLSCKQLLNESCTSKRLLEGVKDELVILRKRRAELESQLKAENYESLESEITQLETALQAIQDDDCIDLQEQMKILQTKLIQKNEQIEEKKHQETIFRLAIETKNKELQEARWELIDGLKTYPIGGVIGTKRMGLVDSNPFFVGCTSSEKKKESATKFASLCKHLIEDPNWHPFTRKSDGSEIINEEDGKMVILKSECSVEQYGAVVTALVERNRYHKNGRNLMEEVWNYRENREVTLIEGIEHILKEWKIQKQRKR\n>UniRef90_A0A2A4LJ60 Corrinoid adenosyltransferase n=2 Tax=Alphaproteobacteria TaxID=28211 RepID=A0A2A4LJ60_9PROT\nMVKLNKIYTKTGDKGTTMLTSGDIVPKFDLRIEAYGCVDELNAQLGMACILAKKGSKLADLLQYIQHDLFDLGADLSTPKVEGEAPDAALRIIASQVSALEQNIDEFNANLTALKSFVLPNGTQLAVQLHICRTVTRRAERIVAQLMSEQAEQTNAESLKYLNRLSDLFFVLSRYDNDLSGQGDILWKPAKNR\n>UniRef90_U7P8K1 Tryptophan-rich sensory protein n=2 Tax=Halomonas TaxID=2745 RepID=U7P8K1_9GAMM\nMTPTRSALILLGWLALVMLAALTGIATPPGAWYAGLSKPPFTPPNLAFPIAWTLLYLLMALAAWRATLEAPAAMRWHTLWPFVAQLAANALWSPLFFGLHWMGAALAVLLLLWGLILLTLCRFAAVSRPAAWLLVPYLAWVSYAAYLNAATWWLTG\n>UniRef90_A0A4S5EQE4 Transposase n=1 Tax=Candidatus Frankia alpina TaxID=2699483 RepID=A0A4S5EQE4_9ACTN\nMPPSRPDARARAEALKPLLRTAHQREQVDQAVAAADGRWNVALDALKRKLPTVADRLAAADALVGWAGDHPSVARARCAEPAADPA\n>UniRef90_UPI0004150940 Nif3-like dinuclear metal center hexameric protein n=1 Tax=Peribacillus kribbensis TaxID=356658 
RepID=UPI0004150940\nMELLHQMVQKLDQELRIDDYGKDSGFSRFIPAVYEPAGFEWDMFFEKKFTELFNGLMLKGGPEVSKVFLAVFPADEVLEKFIAEAKEGDLLFMHHPLVMECGDPQGKWGQGFIPVKERYLRQIKEKKLSLYTCHTPLDYHQELGTNGAMAKALNGNVIDRCLPNEFGEYLVWICEIPSKSTQMLLSELKEIFEIPYVDFEGPAAGRIEKAAIIAGCGDKVSWMEEALRKGAQAYITGEIHCHINNEYGRRRYSEMMEFATRSPIPLIGVSHAASEFLVMKTLMKDWFEANFKVETVMLRQDQWWV\n>UniRef90_UPI000C18D182 helix-turn-helix domain-containing protein n=3 Tax=Lysinibacillus TaxID=400634 RepID=UPI000C18D182\nMAFEYLAQYTTFESIADMDTAVENHMAAHYYDLTESERAIVFKLASHSLENPGACHLKAATIAAALEISTKTVYRSVKRLEELGIIEKVPSTKLNGIKGASIYRILPHVPSSVSQRETAQAISNDAVSETFTENQSSKSFNHLSFKTSTLQEIYNNTHAEKEAHKEYMNEYQVMLFDFMSSLPLADNLKDELHKVVLAAQVQNASDFIKAKNVLFKIAMDIKEGILTVTSTLRAVFTGAYNKAVQRSNMKLSKSSSIEETADRERLVPFYNWLNERDSRSEICSRPNLENWLEW\n>UniRef90_UPI0021CC4CFF uncharacterized protein LOC127046616 n=1 Tax=Gopherus flavomarginatus TaxID=286002 RepID=UPI0021CC4CFF\nMLERGHDRDTMQCRIKVKELRNAYCKAREGNRHSGAAPMTCRFYKELDAILGGDPTTNPRTTMDTSERGGEVEAEEKRGEEETESESTGVGGDTLESQEVCSQELFSSQEEGSQSQQPVLGEGQAEERVPATLSSQLPVLTAAQRLQNLWKKPRKSKDDLLQTVMDHSARENKKLQDWRERESRIHQRNAAARKKSTKQLISILARQVDSIHAGRALPRHPPIPKLFPLCPNVSSKPPSPASRFLPPPAASNTCTFTNQP\n>UniRef90_UPI00167E4099 hypothetical protein n=1 Tax=Streptomyces echinoruber TaxID=68898 RepID=UPI00167E4099\nMTVHDDLASVQRCLDDLTRSVGRLEKQLGSTSLDLRRVRTDADHLRESVALLRAAAAAGPTAARPELVTIPDTPYDGSLWTDSDDEGLGARDRHAP\n>UniRef90_A0A3B0UW67 FAD-binding PCMH-type domain-containing protein n=1 Tax=hydrothermal vent metagenome TaxID=652676 RepID=A0A3B0UW67_9ZZZZ\nMAQFSPVSEAVLAALTAVVTSDNISTAEAERQLHAQDMSQHAPSLSEVVVWPTTAQQVANVLRIANENHIPLTPWGAGSSLEGNPIPLFGGILLSLQRMDQIITLHEDDFQVTVQPGIGYKDLNEFLGRHASFLPQTREPMPPLAACWQTMQQAAAR\n>UniRef90_A0A085F9L8 Transcriptional regulator MarR family protein n=4 Tax=Massilia TaxID=149698 RepID=A0A085F9L8_9BURK\nMGERYLKSVRLLAECMQGFERFSGESVRQHGLTHAQFDIIATLGNTPGMSYKELGERTLITKGTLTGVIERLEQKGLVLRERSSDDKRSFFVRLTPAGDGIFRDVFPRVIAHGKQLFSSYGEADFDALENVLRKLRDQIAAGSLPPQPPQAKELP\n>UniRef90_UPI001662A726 hypothetical protein n=1 Tax=Pedobacter 
quisquiliarum TaxID=1834438 RepID=UPI001662A726\nMKLKNLSILAVLGLLAYSNHAEAQLLKKFQKTLEDKASQKVDDVLNGKKKATSPAAESTAAKDAPPPVEEVYSFTPGSTILFESDFKRDSKGSMPKRWKTSSTGSVVSIPDMPGNWLALAPRTTYKIDSLLKAPENFTIEFDLVTRSDEAKDIGSMAFGFARDNSIKNYISDAYNDNGITNTQFHFHNRDINNSSSDTKVYNTLSYPFANYANGLLHVAIAVEGETMRVYVNRSKVLDTRMLRKDLPKYFYLSAPFSYDNQAKVYFGNFVMSKS\n>UniRef90_UPI00168950BE sulfotransferase family 2 domain-containing protein n=1 Tax=Leptolyngbya sp. FACHB-16 TaxID=2692800 RepID=UPI00168950BE\nMKIYNPDQPLFSLHIPKTGGSSLEYVLATWFNKRKFPILRNRPKLERILSIGSLDFQIQRTLGCGFYFHYKNHRRNEVPRRVPLGKTYGFLRPTKQPECVHGHFSDYNTGENVFDFYPEASQFIMVLRDPLEMHISLYHYTKRMIEDNSLYWNGQKRDEFQFNSLDQWILERDFFLLKSLPWNLKAENFKGIIDKYFVHVCVLENFQESLNKLADKLGFEPVKIPQVNTTLRCEMSSSEAAIAFREKYSLEYAIYDYAKTLS\n>UniRef90_A0A7V7X2U6 Outer membrane protein assembly factor BamA n=1 Tax=bacterium TaxID=1869227 RepID=A0A7V7X2U6_9BACT\nMQKKRSTAKNKIVYISVLKFIHSTTERKFSLMKKLFLHRLPIVLVMALISCLFTVHIAAQTQGLAGRPKIASIKVEGNLKSDAELIIIASGLSVSQEFNADDITKAIENLWEMNVFKDIQVYGEQVEDGIEVVIVVKEYPRLESMDLEGQDNIDEEDIRGKMGLYTSQTVSPQHIKKAIERIKRKYAEEGYLNADVEITTYASQNDSNKVLLKIKITEGAKVKIRGINFFGNYSFADAKLEGTFDDTKSKSGVFRWFKGGDFDEKKYREDVKKLIAYYKKKGYRDFQVVNDSTYYAKNKKDFFIDIHVEEGVKYRIGDVRWTGNTLFSNEELSHAFGFSRGEIFNQEKYDKNMQEQVNAMYYDRGYIFAQIVPIEKPVSKDTLDLEFIVTEGNQVYIEKVEIRNNTKTKEKVIRRDVVAFPGEKFSREALIRSQRNLMVLNYFENVIPDVQPISQDKVNVIMTVTEKPTDTANLSMGYSAQDGLIGSAGVAFNNFLGNGQIVSLNLQLGGAGYRVFSVGFSEPYLFDTRTSFGASFYFSLDGNRRAQYVGYKQRSFGGSISFGRRLKWPDDYFLANWSVGYANSTLKPLSLSNLFPQFTYGQQQSLTLTQVIQRNSKDAAEFPKSGSVYTLTTDFGFVSIDTSGYANAVRVLPQNYTRHTFRAENYYPTLWSFVLYTDFTMGYSRTFKRNPLVEEIPQLDRFYMGGSALDIGSIQLRGYGGRGVGPQESGFAAGGASMVKYSAEIRLPVIPSPTMYILGFAEAGNVFRSLSETDPFKVKRSFGYGFRLFMPLVGVIGLDVAYGLDKTNKNRNFPRFHFQLGQQF\n>UniRef90_UPI00217ED0B7 hypothetical protein n=1 Tax=Herbiconiux sp. 
CPCC 205716 TaxID=2970912 RepID=UPI00217ED0B7\nMADWHPVQTLHANSWIFPRPGTTEPFAEIRHLPVKVGERTVWAFRAVSWRRPRHLIGAGYFGTLEDAARECHRVALASAVPSVLNEQRR\n>UniRef90_UPI001E5ED8EC ribonuclease HII n=1 Tax=Bordetella petrii TaxID=94624 RepID=UPI001E5ED8EC\nMGQNSLFAETPDFTGVLMAGVDEAGRGPLAGGVYAAAVILDPDRPVAGLADSKVLIAERREELALLIQERALAWCVASATVPEIDTLNILRATLLAMQRAVDGLAHVPQVAMVDGNQAPKLRCTVQTVIKGDALVPAISAASILAKTARDADLLRLHALYPQYGFDQHKGYGTVLHMDRLREHGPCPEHRRSFAPVRDRLAGLP\n>UniRef90_A0A2T2ULY6 SET domain-containing protein-lysine N-methyltransferase (Fragment) n=1 Tax=Proteobacteria bacterium SW_6_67_9 TaxID=1919227 RepID=A0A2T2ULY6_9PROT\nQRVYVGRSPIHGWGLFAREHLERDAHIGTYLGPWAQRNGSHVLWVDTGEGWIGRRGFNRLRYVNHSKRPNAEFDGFDLYARRTIRPDEEITIDYGWDDD\n>UniRef90_UPI001B816F5E CvpA family protein n=2 Tax=Neokomagataea TaxID=1223423 RepID=UPI001B816F5E\nMQSFSDLAHGSLDALTRFDDVVLALIILSGLGGFVRGFATEISGLFSWVMAIAVTNRLHMMFEPYLAPYVHDVWLLQIFSGILVFLVTLLFLAMVGRKIAGIARVGLLSGVDRVLGLGYGLFRGYLVIVTLCLIGGAFFETTASYLMQRSLTAPYIVAGETRLVGYLPLSWRSHLASLATSGHDAR\n>UniRef90_UPI0013CE7A73 prepilin-type N-terminal cleavage/methylation domain-containing protein n=1 Tax=Metabacillus litoralis TaxID=152268 RepID=UPI0013CE7A73\nMKFKLAKLFTYNKGFTLIEVLLSIVIFSILTLGMLALFSQAMTYTQKSENDTLGVYAARNMLNFMEQQSFEEIKKIYIDHLKSRGEGSITILNKGICEDWYKDMESDGYELCDLAFNPTINNREINVSVELKKHDDQSLQDLLIPIKVFVQWDKDNESTLEGFITNEKLR\n>UniRef90_A0A4D6HJA5 DNA-3-methyladenine glycosylase 2 family protein n=1 Tax=Halapricum salinum TaxID=1457250 RepID=A0A4D6HJA5_9EURY\nMTTVTDSPHAALRSDEYLGPLVERHGPVEVEPAEDFFQRFVVSILRQQVSMESAAATRERLFESVEVTPNGILAADKQVLRDAGLSRQKTRYVRNVAEAFIEEGYSRAYFEGMDDDAVRAELTEIPGVGPWTADMQLLFSLGRPDVFPVGDLGIRTRMARLFDDLAVEDRAVMRERSERWKPYRSYASLYLWRATES\n>UniRef90_A0A3P1S3R7 FMN-binding protein n=1 Tax=Erysipelotrichaceae bacterium OH741_COT-311 TaxID=2491058 
RepID=A0A3P1S3R7_9FIRM\nMKKTVQLMLFLAIVSAIAGGILGYVNSITAPVIEKMAIAAEQKNLELLFPNGEFKALEFKDETGLVKGVYQVEGQGYVFKVETVGYNSSTPIVYMVAFSNEGNIIGFKELQQQETNGIGSRVFTDEYSQGLLKKTNKDNYDTLTGATVTSTAVVKGLNASRDLFNTINGLEKVETVEQEPKEVQAVKVLINQDWSVYDAQVTVEGSTYQVNVKGYGLLEGDSSHFDYVRNEFMIEIEDQKIKSITLVTFGDTPNIGDKAVDQTYLDQFIDKTMDDEVDLVTGATYTSNSVIASVLAALQAAGQ\n>UniRef90_A0A5C7IGY6 Galactinol--sucrose galactosyltransferase n=1 Tax=Acer yangbiense TaxID=1000413 RepID=A0A5C7IGY6_9ROSI\nMPSLSESRRRLLQVSSALLKKAWSILQRLGIWRFQEIYARSFANRLTNIKENHKFQKNGKEGHRVEDAALGLRHIVSDIKENRDLKYVFVWHAIPGYWGGVRPGVTEMEHYESEMAYPVSSPGVQNNEDCECLNSLAKNGLGLVNPEKVFTFYNELHSYLASAGIDGVKVDVQNILQTLGAGHGGRVKLTRKYRQALEASIVRNFRNNGIISCMSHNTDGLYSAKQTAFIRASDDFWPRDAASHTIHIASVAYNTSLHPMAEYHGAARAVGGCAIYVSDKPGQHDFYLLKKLVLPDGSILRAKLPGRPTRDCLFSDPARDGKSLLKIWNLNDFTGVMGVFNCQGAGWCKIGKTNLIHDEQPGTISGYVRAKGVDYLSRLATDQWTGDTIVYSHLGGEVVYLPKNATIPITLKSREYEVFTVVPVKEFSNNEAKLAPIGLIKMFNSGGAIKELRYDEAEGTAAADMKVRGCGLFGAYSSARPKMIQVDSEEVQFGYNEESVLQENKVIPGIKVDKGTVELAGTNQYNKTGARFAKWRAVLKIGPKRAI\n>UniRef90_A0A2V5VET0 Divalent metal cation transporter (Fragment) n=1 Tax=Verrucomicrobia bacterium TaxID=2026799 RepID=A0A2V5VET0_9BACT\nVLYLQQKGFRYIEALVITLIATIACCFGAELIFSKPNLMSVMLGFVPGPHIVTNQEMLYVSIGIIGATVMPHNLYLHSSIVQTRKFEQSPQGKREAIKYASIDSTGALMFALFINAAILILAASVFHWSGHQEVAAIQDAYQLLSPLLGVGFASALFAIALLASGQNSTLTGRAIAIVPAVLVIGIFGESKTTQLLIASQVVLSMQLGFAVWPLMRFTNEKAKMDEFANLLWLKILSWTTAAIIIVLNVKLLFDTFMPDSVLKAFYNFLRLPAPQ\n>UniRef90_A0A6P0P8U6 Tandem-95 repeat protein n=5 Tax=unclassified Okeania TaxID=2634635 
RepID=A0A6P0P8U6_9CYAN\nMGTEGDDLAFGSVFSDTYSALGGNDIVFGQEEGDSLLGQEGNDQINGNRGNDTVSGGLGDDSLRGGRDADSVLGDAGNDTVFGDRGSDTVRGGEGRDVIYGGKENDDVAGGEENDFVSGDIGDDTVAGDGGNDTLLGQDGNDIISGGAGLDVIRGGEGTDSISGNEDNDSLSGNQGNDTLDGGTGDDVLSGGKDDDLLLGDAGADTLNGERGNDTLDGGEANDILSGGKGNDSIDGGQGDDLLIGGRGDDTLTGGEGEDSFVIVDFEESDNLYTVTDFNTTDDLLSLEGGLTFEDLEISDEGGNTVIRNADGNTLAILIGVDSGTLNSGNFFPTPETPFPTATPTPTPTPTDSPDPSPTPTDSPDPSPTPTDSPDSTPSPTPTDSPDSTPSPTPTDSPDSTPSPTPTDSPDSTPSPTPTDSPDSTPSPTPTDSPDSTPSPTPTDSPDSTPSPTPTDSPDSTPSPTPTDSPDSTPSPTPPDPGEVTPPSLNDPPTDILLDNDSVEENSEAGTVIGTFTTEDPDESDVHEYRLVDDADGRFALNEDQLVVAEGTNLDFEQQETYDIQVRTFDNAGENLTKSFTIALLNVNDPPEITIPDDQQLVNEGEQLDIVGIEVTDPDAGDGELEVTLETTNDGNLTLNSTSGLTFTTGDGQADAEIVFTGSLENINQSLNTLTYTGNNSGSDSISISVNDQGNTGLGEPQTDTALINLSINDLPLVGTNTELVVNTQETGIIDNTLLETTDDSKTSLIYTVTELPTRGNLLVDGGSFTSFTQEDIDQGLLTYEHDNNDTKNDSFSFSVSDQVGGETTDTFEIRVNVPPNITSKNLSLDEDTQEEITNKNLLAEDPDTDAVAETLIYEVTELPTSGKLQLGKAILEVTDTFTQEDIDQGSLSYQHTGDEPGTDTFSYVVTDQDGGTTSGLLNININPGDTSPIAGDDVFETNEDTAITINKSELLANDSEADGEQITITEFAADNIKNGTLAETTESFIYTPNENFSGQESFTYTITDTQGFTDTATVNINVTPVADTPNLEISTPNVSGTDIEELPLGIAASLVDTSGSENLSITISGVPAGATLSAGTDQGDGSWVLTPEELTNLTISPPGDRETGTTFSFDLTVTATATETANDATATQTGTISVQVEALNDAPVLTDLGNLALTTINENEVNNTGTPVASIIAGAVTDADGGASSGIAITQIDNSNGLWQYSVDDGTNWVDVSNSNTTLLKATTSDRLRFVPNTDFFGDATIQFRGWDTTDGSSNTSELTDISTIGGTNAFSEGVGTANILVNDIPEITKNSELVVNFGGTGSISQNLLQTTDGDNGTNAFTYTVTTEAAAGILQLEDNPTNTFTQENINSGLVIYEHTATNTNDDSFSFRVIDVDGGKVTDTFNIRVNEPPVGTTTDLSAFIGQSKVIPTENLQFIDPDVETATPASLQYTLTEVPTLGELQQGGETLAVGSKFTQENLDNGEISYATTTASIGTDSFNFLVTDQDGGTTSGLLNINIVEANRPPEVEADKTVTLEEDNNATLDIPAPTDPDGDALTITVDSIPNAEIGQVLLSNNTSVTALQQLTTEQLTSLTFVPVANANGAAGTFSYTVDDGNDENSSSTQVINIDVTPVNDLPIAIDDGPVFTNLGNVITIDVLGNDSDIDGPDPLSITTLSNDEPLGILNNLGTQVQYTAVFGTGTDLFQYTITDGLDEATATATVNILDVSNDPDFLVGGEFNDNFDGSGGDDTLEGLAGNDTLAGDDENDSLVGGDGNDSIDGGDDDDIFIGGLGADTLSDDNGNNTFVYTSADDGGAKFNAADAASIGTAISAGLYDRITGFEDLGVVGGDTIAFSSTVIPAVDNIATDVQTTNISGNVLIAGNPGLFAYEVEGKTYLIYDANGDNTVGDDSQILAELEDVSGVVALDINDDFTII\n>UniRef90_A0A7K7WYR9 TENX protein (Fragment) n=1 
Tax=Mohoua ochrocephala TaxID=874463 RepID=A0A7K7WYR9_9PASS\nHFHTHHHPLSTTAAAQPEELPLTSEEPQHEKHRTESPASEAPLVRAVLGELRVSSVTPNSAQLQWSVPEGSFDSFMLQYRDAQGQPQALPIDGGSHSVTVPRLSPSHRYRFHLYGLRGRKKIDHVSTEAVTGTQEQEELPLPSEEQKHEKLQTEAPPSDAPLMRAVLGELKVSSVTPSSVGLQWSVPEGSFDSFMLQYRDAQGQPQALPIDAGSHSVTVPGLSPSRRYRFHLYGLQGRKKTDRVSIDIITAQPEELPLPTEEPQQEKPETKPRPSEGSPVRAVLEELRVSSVTPNSVQLQWSVPEDSFDSFMLQYRDAQGQPQALPIDGRSHSVTVP\n>UniRef90_UPI001131192E phosphatidylinositol 5-phosphate 4-kinase type-2 alpha-like isoform X3 n=1 Tax=Oncorhynchus nerka TaxID=8023 RepID=UPI001131192E\nMAKELPTYKDNDFINDGQKICIDDDNKKMFLEKLRKDVEFLAQLKLMDYSLLVGIHDVERAEQEEVESEDNEGDDEGESDGGIGTPPDSPSNTLDSTKPLSPGEFDPTIDVYAIKSNDGAPRKEVYFMAVI\n>UniRef90_A0A101DIC7 DNA repair protein RadC n=1 Tax=Desulfonauticus sp. 38_4375 TaxID=1635258 RepID=A0A101DIC7_9DELT\nMPNKNKPHYLGHRQRLKKKLRENPEALADYEVLELLLGYALPRKDTKPLAKTLLAKFKNFKQLLFAKEKELENIEGVGPGISTFWLALREFLSRASVQEFQKTKQKITSPQDVYNLLAPKLIPLSKEEVWLVMLDNKHQLIKMSRLSQGTLDSSPIYVREILEQVLLNQAKAFILAHNHPSGEPTPSLADLEITRKIEEACKNLEVSFLDHLIISKQGYQSLKEQGF\n>UniRef90_UPI001D97EE8E Choline kinase n=1 Tax=Passalora fulva TaxID=5499 
RepID=UPI001D97EE8E\nMQSHRSSQVFSVFSVTFNPTARPNSRFGVQPHLYSCSSSTRSREEPLTDIRASCPWNHRRSLSALYHIWLRLPPLGPRSRHQSARNSDGREARDDTSCVSITMPHSEQPSPMSSGLVKPKLEECASPSSYLGLNRAASPRSTPKSVSISHHAETISPLILGQRKEDEESDLSPRRPAVISARSRRLSGRPASYGSPGLKPLTPALDGAVHSDERDAADSQHDGHHHIDALVDQVSMWIKDRRAKRSKRKEKRSARREARGAKASDGDVDEPEKSQRRDSDASDSSVDLENLERIIASNLSLRRSSVRRSSISLKSKASVRRLLRKQSTVSDSEEVDVSVPGCDAFLDNSKTLAYTGGASDLSDNDGDELRQVPSYRDFDAWAKFKFDIVRIIHTLRLKGWRKVALEMSSAIAVKRLSGALTNAVYVVSPPADLSLEKYDESGKVVGVSKAPPKLLLRVYGPQVEHLIDREAELAILQRLARKQIGPRLLGTFVNGRFEEYLHAQPLTPKELRDPATSRQIAKRMRELHEGIELLDQERSDGAFVWRNWDKWFQRVEHIVTRMDNQIKALPEDAKPTGQQAWMRRGYICGVPWAQFREIVEKYRMWLKAQYGGSKEVRDQLVFAHNDTQYGNILRMTPSGESPLLLPANTHKQLVVIDFEYANANTRGLEFANHFTEWCYNYHDERKPYAFNSSWYPTPEEQDRFLRAYVRHRPQDGLSTPQTGPSTPSSEVSTPPVKRATSSISDFMLDARHPQSARPNAAKEEEAAKAAEDLEIGRLANETRIWRLANTAQWVAWGLVQAKVPGMPDFDPDSPTSELTSDTEPEELLGERAEEYRQLAKEQAGEDEEEDEEFDYLGYAQHRALFFWGDAVQMGFVKAEDLPEETRSKLKTVPY\n>UniRef90_A0A0E3NZ95 Probable dihydroorotate dehydrogenase B (NAD(+)), electron transfer subunit n=2 Tax=Methanosarcinaceae TaxID=2206 RepID=A0A0E3NZ95_9EURY\nMIPLNATIEKIMEESPFIRTFVFDHRFEEMEPGQFVMVWVRGVDEVPMGLSRKNSITVQNVGEATAKLFELKEGDSFGLRGPLGKGFSSPAAGEKILVIAGGVGAAPLAPYAEAASTAGAKVHTILGARSGGDLLFEERFAAAGVLDITTDDGSKGTKGFVTDVLKKIDVSSYDNIAVCGPEVMMGFIFKILQEKEVLDKSEFSLHRYFKCGIGVCGACCIDRSGLRVCKDGPVFSGVQLVDSELGKYARDASGRRVKI\n>UniRef90_A0A8T4KUD5 Pacifastin domain-containing protein n=1 Tax=Candidatus Aenigmarchaeota archaeon TaxID=2093792 RepID=A0A8T4KUD5_9ARCH\nMKGVSLPVNAVIIIALAAVVLLVLSTFFLMGTGPSMSNIEAQRVFEEQCPKIKCEKFVTPGTPAFGGLYKNFFDACQRLYGISGTDSEKSKCFFYCNCGALTSECNTDCTICKNFPVDKERCFAELEKKHGLGCKNSCF\n>UniRef90_C0HI41 Uncharacterized protein n=1 Tax=Zea mays TaxID=4577 RepID=C0HI41_MAIZE\nMEGCRGRHQSHPPHAIDGARGKTAHLLPTPNLLPFQLKQHRRLVAVWLLVKAPADKGKMEHTTAAVSSVRWVCRSRCKATARSSWEAMVTANFGLWLANTCCRAPDYGSQGEVMLTFAENGSSKVGVRFDKQIPGAIDLGGSCELDHGLLCSVDSLCLDGPGWEDRAKHSFDVVFEVMEFLFFLEHAGELHIIIFRGKIESKLDQNKHYKLTKLPSGGHKHQCTKGSINLEEKQTNHLNSTKDLQ\n>UniRef90_UPI001CDD57D1 hypothetical protein 
n=1 Tax=Vibrio vulnificus TaxID=672 RepID=UPI001CDD57D1\nMVENLVSGLVSGLIVVLITLVISRVWTLIVVPWFEERVYKDVKIEGKWFSYYTGGMLGRQEVITLKRHGHQITGTMVCTNIGQPDHGEQYNIHGTFKNLILPLVYENDNQSKTDRGTITLKSTFSAKKLVGQISYYSCREDIINTSIVTWYRTQEDMEAAKNSHETRLKEGFNPQGLIPTEDVVHDGVDKAQVG\n>UniRef90_A0A267E9L2 NDT80 domain-containing protein n=3 Tax=Macrostomum lignano TaxID=282301 RepID=A0A267E9L2_9PLAT\nMINGGFEDRDNFFLEEEHLTTSLEPHQFDPRLSNAEFIRASVLDGQKIKEELFGICESPFDQQDPSQFDSSVTYAPPATPAFVQPEALYVDQPSRIKRGYDESSSTLEVQTYRRPTSCGGGIDSCLAPPVAKRRLGHNRLQLVQTSVPSSSPSNSSSDAQSPAELGSSGAAAGQPTVAAATQPTSIVISSGPNSMATVGEYDKWSTAAQSFVRRSTIRETDALQCSAANRVGLSTSESRQIYAVDSKTAVDRITTELPPTRPPPAPPPPLSLVPSQQQNGDADVVHPPPPLRFQPWDAAPALTLLEVKPVSQNLQPASISFKIEVDKGFQFSGKEGIWICQKKNHFQITCQVSVTGCQWAVGASSGPQPVTGFRVNLYGVKAESPLDSLVSLEQSEVNRTKRLFAPIPVAMPGGGRFVRVVAQRLHFASTTLNNQRKRGDLHPDQRFFQLVLALEALTETSVAPVQRYISRFIIVRASNPGQFDSASASAVPDNPPAPTPLPQRQPPPQQRSPLPQSSMPPTVEEAATPEDAVGAWISDRPGVVYYSGNVGINTPNPAEALTVEGNLQLRGNLLQPSDARIKSIERELSPAEQLANISRIKIYSYSLSPNDVSDTGVIAQEVAGILPDAVHASSTERVPTGEPLLLVNKDRIYMENVGAVKQLGELTASLDCRIGELERMRSKLCRLRDSLRSSSSSSSTVTAAAAAAAAAAAATASSGCLVGSPRFRSVGTQSSLELEAGLPWPPNLPPPQPPPPPPPPPPPPPPPTLPKSTTPSLTVPASAAAAAAAAGQDQRNRRPRLCSHQHPVAQTLHQQQQQHQQQQRRSSFRFNVVLVALLVTLIVCFLGLASLLLIEKLLPHLSGPGFVGSRNGSSTVSSSGGGSSGGSSGSGPATPPGGGWPRPLHGASSHTTPPEPTPTQKPTPFRPASCGAGGGPCPPVRCCRGQQKLANGNSSGSGGAGSGSGDVIALFESAGDRSGSRGGSSDASSGSGNAAFWELLGAQLISPALGNWSLADAASMHCGSSSGSSSGSGSDVGGHRRRLLRYGGCTGSNLTFHLLLSNSFPLDARLSLRLTMSETLLAVRHCPPVESLSRCDGSGGPGAAADSQSSGCTPVLGDQRGFDCDVSAAASHLLHLAKFRLAAEAKNLCQLESSGLGKEFVELTVLLERQEFGC\n>UniRef90_A0A2E8JXE6 Creatininase n=1 Tax=Planctomycetaceae bacterium TaxID=2026779 RepID=A0A2E8JXE6_9PLAN\nMNSEAPWRLDETTLGDLEDRCTEPDDPGFDVAVIPFGCTEPHNLHLPYGTDTIESLAIGDRICGHAWRQGARVALLPAIPYGTTTNQAGVRLTLNLMPTTILAITRDLVASLVRHGVRRIVLLNSHGGNDXKWXLRELHDGPSPSAHLFLVDWXRAXRDVSDRIIEQPDDHAGEMETSILMAVRPDLVRHRSDGSLDADDGEVRSTSFEAVEKGWVSITRPWHLLTTNTGAGNPHAATAEKGETLLEILEERFGSFLVELAKGEPGPSFPFPDE\n>UniRef90_A0A8J4EGG7 RGI_lyase domain-containing protein n=1 
Tax=Virgisporangium ochraceum TaxID=65505 RepID=A0A8J4EGG7_9ACTN\nMRAWNRRRFAALAVAAVCLVGVPLPASAAPGAPAGGGHGRVQLEKLDRGLVVATTTGGAFLSWRLLGHEVTGRTSSGMKGPGFEVYRDGRRIATVTDSTNYLDPAGTAGSTYQVAPVRGRKSAPARAWSTTHLDLPLRKPADGVTPAGEAYTYSANDLSVGDVDGDGAYEYIVKWDPSNSKDVSQVGYTGNVYIDAYELDGTPLYRIDLGVNVRAGAHYTQFLVYDFDGDGRSELMFKTAPGTKIIRYDRSGAVRSERFVSLPREDVAKGVTHADDYRMSAADYFEHLVTMFQGWHDHPEVEAGRWPATLEQAFGIAPAYTYPLSREDATALANHFVDVYAPARSARNQLRNFAGFIVDGPEYLTVFEGATGRELQTVRYEPGRHDDGLMWGDYAMARIEPGNRVDRFLATVAYLDGRRPSAVFARGYYTRSTLVAYDWDGRRLHKRWYVDSGWTPMTNPFNDSPHGRDGTDPEFRTLTTQGFHSLSSSDVDGDGKQEIVYGAATIDHDGSLLYSSFAPLPEGSASPGTQARLGHGDAMHVTDIDPTRPGLEIYTVHEGAAGAPYGHAMRDAKTGQVLFGTYSGRDTGRGMVGDILPEHAGLEAWATTGMGLWTAQGQKLGDTIPGTNQSIRWAADLSTQIVDGALEVTPTIQDHRRGTLLTAANTLTNNGTKGNPGLVADIFGDWREELLLRTADSSAIRIHLSTEVTTHKLYTLMHDPQYRAEVARQQTTYNQPSYTSFHLGTGTDWARVPVPTASYR\n>UniRef90_A0A372F876 ZU5 domain-containing protein n=1 Tax=Emticicia sp. C21 TaxID=2302915 RepID=A0A372F876_9BACT\nMKTLQTVAITLLSLLGLISCETDQQNPKPEQPSKGTPTEVGKPLGAVTAKMIGAQGGNISTPDGKVTLTFPAGALSKETNITIRPVENKAWGNVGIGYEFGPDGSEFAKPVTFTYRYTDKEISGVSLDNMALAFQDQNKIWQATAPLTVNKTQKTITGSIKHFSWWSMITKYRLTPEYDTVLIKQTKELQIEYLESEWPWSNKPDSDILLLVPLVAPKLADRTAISKIYLNGVDCTTTLPKDQSSGLLGFANKDNKAVVMYTAPNKKPNAAYNPVAISIELQHAGKAKLMLVSNLYIDTENTFSIDGSDPTSIAINAAYGAGALYISFEDNMSNVLRVYTEHFAPGTYTFNIKDTNIAAMHHSKKKAGGSVYEHCRDEKSESGRIVIDRIYQSNGKTVIQGSVTGKVCTLHDTDEKCNIIKHETMTVSAKFTTVVMM\n>UniRef90_A0A7K4IPH3 DUF420 domain-containing protein n=1 Tax=Candidatus Bathyarchaeota archaeon TaxID=2026714 RepID=A0A7K4IPH3_9ARCH\nMALWIADVNFVLQFVILGVLSVGLFYKQRGKFVFHGSTMLIAVVLNAVSFFLVMWPSFVAFDFTVLDSPLKVVSLTHGILGGIAEILGLFLVVAWGVQKKMQSCIRRKIVMRITILLWLIALVLGILLYAGLYGIITI\n>UniRef90_A0A662SB18 TMP_3 domain-containing protein n=1 Tax=Candidatus Korarchaeota archaeon TaxID=2056630 
RepID=A0A662SB18_9ARCH\nMLRNAGIDPTTGSLKAIGDAVAALGGGQEKFNRVLIAFAQIAAKGRVQAEELLQLMEAGIPVQKILQEELGLTNEQIAEIGKLGIDAQVVLDALFSGMQRRYGGAMAELMQRFTGIISNLRDQWDLWLRDIMNAGPWQTLTALLKMALDHINRLKEEGKLDEWAEKIGKRVEDTFWNMAIGTATAIDALKEPILAVWGIIEDMWEGFKKLPSWIREIGIVAAIVGGKKGAAVIASLSWLVETLGRSVKGFEYAWKGWISWKDYITANKEELEKLIQEADRAHKTTGELGDISLDTSSKMGNLEQKVRQIRKEVEKYIETLKDEQKQERKPTETPTAKIPVEFVFDEEKLQKLYQDTIDQINKTILQGQELQAYRAEKWYEQMMENIDTLLEAGQITGEEWSRLFDRIEEGYQKLLEKSGESFDYMQEFAIQAARNMQTAMSDFFFDVMTGKFESFKEYIQGLANTISRIISEILAKLALAKIFGAFGWQAGIAALGLAKGGIVPGPVVPIKQFQYGGIVDRPTLFLAGEGRYPEAIVPLPNGRAIPVQIINKTEEKPIVVHIHIQTPDVESFRASRAQIATEITMALARARR\n>UniRef90_A0A0F8B2Q3 Putative Ras-related protein Rab7 n=4 Tax=Sordariomycetes TaxID=147550 RepID=A0A0F8B2Q3_CERFI\nMSAGKKGLLKVIILGDSGVGKTSLMNQYVNKKFSASYKATIGADFLTREVLVDDRQVTMQLWDTAGQERFQSLGVAFYRGADCCVLVYDVSNAKSFDALDSWRDEFLIQASPRDPDNFPFVVLGNKIDVEESKRVISNRRAMAFCQAKGGIPYFETSAKEAINIEQAFEVIARNALAQEESEEFSGEFQDPINIHIDNDRDGCAC\n>UniRef90_A0A846WZ52 Signal peptide protein n=1 Tax=Tsukamurella spumae TaxID=44753 RepID=A0A846WZ52_9ACTN\nMIARRLSVIGTVALATLAVVPGVAQAAPVNTARTILAAHEFPLGSTGYKVETETLKPFDEPDNANTPCSRFIRTMFERLGGAQVTNAQVTRGTTEVEVAVVNRPMAALMAEGFPTCEAQVDPRARSTVLAAPGDLTRLRPFVFRDADEMQAWVDLRGISVNVTATTKNRGPADAETFWQTLRAQVAKVERQP\n>UniRef90_A0A6P6DIM4 protocadherin beta-14 n=1 Tax=Octodon degus TaxID=10160 
RepID=A0A6P6DIM4_OCTDE\nMIVFLNTASFGPRETLEMLLSKAPAKRQVTAILFLLLLREVGSETIKYSVLEESDRGSFVANLEKDLGLGLGELAVRGAQVRSKGSKQHLQLEQSGNLLLREKLDREELCGDTDPCLLPFQVLLKNPLQFIQGELQLQDINDNDPEFLENEILLKISESSRPGTPFPLKIAQDLDVGNNTVQNYTISTNSHFHLVTRDHNDGRKYPELVLDKALDHEEQPEMMLTLTALDGGSPPRTGIAQVHIMILDINDNAPEFGQGLYKVQVPENSPIGFHIITVSARDLDAGTHGELSYTFFQSSSQVMQTFEINTNTGEIRLKKLLDYEETKFYHVEVEASDGGGLSGKCTVKLEVMDVNDNAPELITSLLISDIPENSPETVVAIFEISDPDSGDNGKMVCSIQNHLPFNLKSTVENFYTLLTEGALDREKKSEYNITITVTDLGTPRLKTQHTITLQVSDINDNAPTFTQSSYTLFVPENNSPALLIGTISATDRDSGSNAQVTYSLLPPQHPHPHPQPHPQQQPQPDLASLVSINADTGQLFALRALDYEALRAFEFRVGAADRGSPALSSEALVRVRVLDANDNAPFVLYPPHNASAPYAPRHRLLVQVRDNGEPPLSASVTLHVLLVDGFSQPYLPAAEAAPERAQPASLTAHLVVALATVSSLFLLSLLLFVALRLCRRSGPAALGVCSAAPEGPFPAHLVDVSGTGTLSHSYQYEVCLTGGSGTDEFKFLKPFFPNLPPPNAAQQTEGSAMVRNSFGFH\n>UniRef90_A0A0H3GRA2 Bifunctional protein PutA n=3 Tax=Enterobacteriaceae TaxID=543 RepID=A0A0H3GRA2_KLEPH\nMGTTTMGVKLDDATRERIKSAASRIDRTPHWLIKQAIFNYLEKLENDETLPELPALLSGAANESDDASEPTEEPYQPFLEFAEQILPQSVSRAAITAAWRRPETDAVPMLLEQARLPQPLGEQAHKLAYQLAEKLRNQKTASGRAGMVQSLLQEFSLSSQEGVALMCLAEALLRIPDKATRDALIRDKISNGNWQSHIGRSPSLFVNAATWGLLFTGKLVSTHNETSLSRSLNRIIGKSGEPLIRKGVDMAMRLMGEQFVTGETIAEALANARKLEEKGFRYSYDMLGEAALTAADAQAYMVSYQQAIHAIGKASNGRGIYEGPGISIKLSALHPRYSRAQYDRVMEELYPRLKSLTLLARQYDIGINIDAEEADRLEISLDLLEKLCFEPELAGWNGIGFVIQAYQKRCPFVIDYLIDLATRSRRRLMIRLVKGAYWDSEIKRAQMEGLEGYPVYTRKVYTDVSYLACAKKLLAVPNLIYPQFATHNAHTLAAIYQLAGQNYYPGQYEFQCLHGMGEPLYEQVVGKVADGKLNRPCRIYAPVGTHETLLAYLVRRLLENGANTSFVNRIADNTLPLDELVADPVSAVEKLAQQEGQAGLPHPKIPLPRDLYGSGRSNSAGLDLANEHRLASLSSSLLNSALHKWQALPMLEQPVAEGEMQPVVNPAEPKDIVGYVREASDAEVQQALTSAINNAPIWFATPPQERAAILERAAVLMESQMPTLMGILVREAGKTFSNAIAEVREAVDFLHYYAGQVRDDFDNETHRPLGPVVCISPWNFPLAIFTGQIAAALAAGNSVLAKPAEQTPLIAAQGVAILLEAGVPPGVIQLLPGRGETVGAALTSDERVRGVMFTGSTEVATLLQRNIASRLDPQGRPTPLIAETGGMNAMIVDSSALTEQVVIDVLAPRRQRRPALLRPARALPAGRGRRSHLNHAARRHERVPDGQSGAPDHRYRSGYRCGSEREYRTPYSGDARQRPHRLPGGA\n>UniRef90_A0A0X8F9Q8 Lipoprotein n=4 Tax=Aerococcus TaxID=1375 
RepID=A0A0X8F9Q8_9LACT\nMRKKVFLLVAVFALFLTACGSSSKETTHVKLGVVGDKNDQWEYIQKELKDKENIDLELVKFTDYRGPIVALEDGSIDLHAALTEIFMEEVNKEGGYSNTTIAYTTLNPMGVFSEKIDSLDDLRDGAVVALPNDVSNESRALLLLQTAGLIKLDPDKGLLPSISDITENPKNLNFKSMAANQTARSLGDADIALINNDMASDAGFVPTQDSIYLEPVAESSKPYYNVIAARQNEKDKDVYQTIVKYYQTDEVAKIIDEMTNGSSIPVWDKDQ\n>UniRef90_UPI001E506DDD EcsC family protein n=1 Tax=Mycobacterium florentinum TaxID=292462 RepID=UPI001E506DDD\nMGTVATAMGVDAAVLTACSAVVAHDALYYGYDPLDPAEEIFMMHVIALGLAETEPAKVAAYQQLTLLTESLARNAAWQQLDRQVAVKVIQKFAVKFAQDLTLKKLVQLVPGLGVGLGAALNWTTVGEIADAAYWAYRERFLYERAPNSSPSQPISRAPRTTIDYRSISKTSSSRKASSSTANANHGDPTAPTHYRDGQANKGRAPVDHIATADAIAAAAHAGQVDKAGMPYIGHVRRVASYVDPANTDAVVAALLHDVIEDTGLTAADLAERGIPQAAIDAIELLTRRDDQPSADYYRRISAHPTAGKSSSRTWPTTPIPNGWQT\n>UniRef90_A0A117EBF1 DUF5753 domain-containing protein n=6 Tax=Streptomyces TaxID=1883 RepID=A0A117EBF1_9ACTN\nMTSKLSRIETAKSPTKPNDLEDLLDLYAGLGRDVDDELRAALLALTNEGVRRGWWHSYRGTLTPVYEDLISLEAEAESVSYWQLGAIPGLLQTSEYAREIIRATAMSADVEARVDALVEVRLARQVVLTRETPLTLRAIISEAALRSTSGVDGLMDEQLGRLLTMGKRPNVHIQVLPSDAPLHAGQVGSFVILGFGPHADLDVVHIEGLSSASYIIEEREKVATHRDAWQRLTTTALPPEASTELITEIRKSV\n>UniRef90_A0A6J2SVJ9 carboxypeptidase B n=1 Tax=Drosophila hydei TaxID=7224 RepID=A0A6J2SVJ9_DROHY\nSLNSFKIYEVATKSRSAGDGLDFSKLANNDSYYELYYSNDAATHVLVHPDAQPEFIELLNGNTLSYKIVNHDAGLSLHREFETNRKLRNAHPYRGRLGTERYYSHGEINQYIEDLAKQHPTRVLVKTVGRSYEGRWLKTIRITNGDGRANKNVILMDGGFHAREWISPAAVVYAIGELVDNYEAYAQLLLDYDWVILPVVNADGYEYTQVSPDTRMWRKTRQPSSAACIGIDPNRNFDFHWNETGASSDPCSETYAGPKSFSEPEAIVVRDLIRGLADRGKMYLTVHSYGNYILYPWGYIDELPDTWEDLDEVGRAGGDAIKAATGTIYKVGCSTQLLYPAAGASDDYAFNAGFPISFTMELPAGGDNYFNPPPEDIDRLVKETWVGIVAMAQKVVEKYPLN\n>UniRef90_A0A4Q6E3N3 Glycosyltransferase n=1 Tax=Sphingobacteriaceae bacterium TaxID=2021370 
RepID=A0A4Q6E3N3_9SPHI\nMDVSIIIPYYNAGNYLPDAISSVRQLLRRTDISCEIVICDDGSTDPYSIEILSGLEKEGLFTIARQPNKGPAAARNTAVKNSTGKYLVFLDSDNKLRERLVEKGIEILGSNKADVVYGNAAFFGESTKPLFTQGELNIPLLMARNYIDMCAIVRREVWETTGGFDEGEELRKGQEDWDLWLRAIKAGFRFLYVDEVLFDYRVRAASLTNDDSLERYNKAREYIYSKHPDFFKQSFFWLSDQLYAYQQDKRTPFRSFFKYLYLKYFKGGK\n>UniRef90_A0A1W9W8B2 Prenyltransferase n=1 Tax=Anaerolineaceae bacterium 4572_78 TaxID=1972460 RepID=A0A1W9W8B2_9CHLR\nMKNHSRSTKDLSFASNKLSSKIVSKPKSKVRLRTIALPAEHGSWGFVLEPICLGLGVAPSWAGLCLAIGVFALFLLRRPLKIILTDWQNHTTPPPPLKRRGAMRTVIAKRFVMGYGLIAVLGLISGVWLAGWESLYPLLIAVPFSMIFIAYDVKNKSRTWQAEFAGPTAFSLAAASIALAGGWAYNVSFALTGALFARAIPSVLYIRARIRLDKNKPHNKLLAIGMHVVGLIFVAVLTVGAYNHKPLLPTLAEVGLGIFLVLMMIISTRL\n>UniRef90_A0A3N5LLQ8 OmpR/PhoB-type domain-containing protein n=1 Tax=Acidobacteria bacterium TaxID=1978231 RepID=A0A3N5LLQ8_9BACT\nMKELPEEKTALTQELDRIVKSEAFRSSESLRRLLLYLGNKSLAGEAGDLKEYVVGVEAFGKSSAYDPQLDASVRIQAGKLRQKLQEFYRTEGMEDTVVVSLPKGHFQLDFELRSKPQERQQLQSVPRKWKIAVWSLAAATLLCCSCIAYLLLSVPSGNQPDGNGRLTADLRAIWDPVLKDDRPLVVAVGTPLFTKIGQGFYRDPAINEWNHSAVPSHLERLRDTLGATTLIPAPIYTGIGEATAAFLLCRLLSSEKDLEVRRSSALSWDDVKENNMIFVGCQKYNLQLRDLLSQQDFFMDGNHITNRRPRKGEPHSFTGTCPPDSAYVTQDFAVVTKLPNVQGRELFALAASSTEGTWAASEFLTNEIHARELVSLLRTPSGEMPDSYQVVIRARFRGQVPFEMAIVAERGASPAKSEATDTQTRR\n>UniRef90_R8W248 Undecaprenyl-phosphate glucose phosphotransferase n=3 Tax=Butyricicoccus pullicaecorum TaxID=501571 RepID=R8W248_9CLOT\nMKGFLQLCRSQLLSGISLGLALMVSALFAVYSFGDSAISARWMNLLPCMTVLYMLAGVLLMAWHRRPPRRRPATPYLSGLNARYIWVLPAFLWWLLFRLTGFDVLERCLLFNLILLAVLWTVEYSMARRMAKALNGALGTRTPTVMPASLIVDLDDCPKGIEAFCIEIERYCIKNHIDYQFIERDKPAIVLMNGVKHRVELGVYYGYVPGWFLKFTEL\n>UniRef90_UPI0006692FD6 MazG-like family protein n=2 Tax=Pasteurella TaxID=745 RepID=UPI0006692FD6\nMKLTNEQLIDNIKQWARDRGLDTGSTLGKQFVKLMEEFGELCSGLAKQKTDVIADSIGDMIVVMVVMNTIYDNLPLQLKSDSDDKLLIKETMQRLESKYKQDQINTLSEHYFNHYDRRVSFAVGALNALGDETSRIDVFGKDTNIDFMSEAMFSLFRELYNLATAFGLNVNDCLNQAWNEIKDRKGKMIGGAFVKEGDLKDGQ\n>UniRef90_A0A387BQQ7 Alkaline phosphatase family protein n=1 Tax=Gryllotalpicola protaetiae 
TaxID=2419771 RepID=A0A387BQQ7_9MICO\nMATLPNAYSQSVSLAAVLASCFAAVERGAPQLPLAPVDAAVVVLADGLGALPLKARAGHARTIAPRLNRATTIESGFPTTTAAALATLCTGVFPGQHGITAYEAVDPEADRVFNHLSGWKTGPDPATWQRVPTLFETHAATGIRSYLVGQARYADTRLTQAVHRGAEYVPAKSIAERMSAAISLARAGRAVVFVYVPELDMAAHQYGWQSPEWTAALEELDAGMAQLERGLGKAQGALLTADHGMVDIADSGKLFFDREAELIEGVRHVAGDYRCVQLHLEPGATAGDLERLAQVWHEAEDDRAWVATRDEAIAAGWFGPSGVADEVLPRIGELLIAARSQVVYYDTRSTNAGNWSMVGQHGSFSPDEVRVPLIGFGAFA\n>UniRef90_A0A4Y2A7J8 RNase H type-1 domain-containing protein n=1 Tax=Araneus ventricosus TaxID=182803 RepID=A0A4Y2A7J8_ARAVE\nMSKKIRILHPPKSEFVSVYRTPSRKSVPIFIMMKFKFLDINSIPRFPPVGSKSFFAASCDFHVFSYHIETEVHQFRIRDECSVFQAELLCIAQAVNWIRTNENLSSNFLICSDSLSSLYALNCITSPNRLIVKTQTNLNFLHGRGVKVFFSFVRGHIGIYGNERADWLAKEATKLIDFIPVTVRKSFYKSVFKKHVISQWNNLHQISHNAKSTKEFFPSIHGRLKAVHFVPNFRVTQFLTGHGNFKAYLKRFNLSRTDLCSCSSGEIQDVNHLILSCPKFTPARCLLVSTLKKNNFAWPPSFSTLFQNKTCFASFCEFIDGIFPHTI\n>UniRef90_UPI0018ED6A80 IS30 family transposase n=2 Tax=Dyella sp. ASV21 TaxID=2795114 RepID=UPI0018ED6A80\nSLTWDRGKEMADHRRFTLATDIQVYFCDPQHPWQRGSNENTNGLLRQYFPKGTDVSVYSQAKLDAVARRLNERPRQTLNFETPAERFQQCVAMTG\n>UniRef90_UPI0020CC1823 hypothetical protein n=1 Tax=Phocaeicola vulgatus TaxID=821 RepID=UPI0020CC1823\nMTTLSSIADYVTDKISSNDISLNEYVTTDCILQNKKGREIATNLPPQPCSLAHYKRGDVLIANIRPYLKKVWFADIDGGASSDVLVFRAKEGHSPSFLYAVLLQDAFFDYVMQGAKGSKMPRGDKDQILRYKMPTLSCSEESIGTLFMNIDSKIRLNEQINQNLPKLDHSSEGAEARHVA\n>UniRef90_UPI0021123217 secretion-regulating guanine nucleotide exchange factor isoform X3 n=3 Tax=Delphinidae TaxID=9726 RepID=UPI0021123217\nMEREPSATAAAPAAAALFAWGANSYGQLGLGHKEDVLLPQQLSDFCNPGCVKRITGGGGHSAVVTDEGSLFVCGLNKDGQLGLGHTEDVLYFTPCKSLLGCPIQQVACGWDFTIILTENGQVLSCGSNSFGQLGIPHGPRRCVVPQAIEPLREKVVSIAAGLRHALAATASGMVFQWGTGLASSGRRLCPGQTLPLFLTAKEPSRVTGLENSQAVCVLAGSDHSASLTDAGELFVWGSNKHGQLTSHAAFLPVPQKIEAHWFQNEKIAAVWNGWTHLVAQTETGKVFTWGRADYGQLGRTLESHEGWKPKKQDPSVRCSRPSKSTPSSLHCLTGATEQRLLPDAGICQWLVSGSPWSSRLVSSAALSPRVSCGSEHNLAVIEDLVLFQSLAFQVVSPQQCYPSTSQHSGFVVLRMGHWSCHHRLSVSGFRFPARPCEGDVHVTCLPSHDSRFRTKALR\n>UniRef90_U3A3Q0 Fimbrial 
protein n=3 Tax=Vibrio TaxID=662 RepID=U3A3Q0_VIBPR\nMETMKTFVNNFINDEEGLTLLEYILGAALIVAALLSIGFWDTLASKFTDVASEISGINPTP\n>UniRef90_A0A2E3DER3 Phenylalanine--tRNA ligase alpha subunit n=2 Tax=Euryarchaeota archaeon TaxID=2026739 RepID=A0A2E3DER3_9EURY\nMDXVDLSPNELKLLKCLRVGTLTPHEASLKSELGEKETMSAASWLRSKGLVNILEESTTFLFPNEEGKKYAEQGLPERRAVEWLNQMGESLVDELPLDDDEKKVVIGWLKRKKFAELEKTEEGLKLIPTGNIDETPDENLLVILSRKPLAESEIDKEGLALLKGRQVLSSKEEISRTFTLTEEGQNFDVDSIDEGMIGELTPEIIKSGSWKDKTFQKYSTETSIESSDFATLHPLTRFTEEIRSIFLQMGFSEIEGDYVESAFWNMDVLFIPQDHPARDLQDTFYLSEPASFVINDQDLVEQVKAIHEDGGETESAGWGSKWSKEKAQQALLRTHTTVGTIRHLSNNPDPPVRVFSVGRVFRREALDATHLPEFTQVEGIIVEPEANFGMLIGVLKEFYRRMGFHDVRVRPAYFPYTEPSLEVEVRFGDKWLELGGAGIFRPEVTAPFGIEHPVLAWGLGLERLAMLHLGIKDIRMLYQSDLQWLKETV\n>UniRef90_A0A842MRA5 LLM class flavin-dependent oxidoreductase n=1 Tax=Candidatus Bathyarchaeota archaeon TaxID=2026714 RepID=A0A842MRA5_9ARCH\nMSLKSFKQLNFVGTPEDLMQSMQPYLDLDVTFFMLYFGDLPYGDSIKIFAETILKELS\n>UniRef90_A0A3Q7RJQ3 complex I assembly factor TIMMDC1, mitochondrial n=41 Tax=Carnivora TaxID=33554 RepID=A0A3Q7RJQ3_VULVU\nMAVRPRAPQCFLCGRLGPLPRVFAAGAVAAEAGALAGDQELPEYAESGWDRLRDLFVKDEQQRTSKELENIYKAAVSAGIIGWAYGGIPAFIHAKQRYVEQSQAEVYHNRFDAVQSAHRAATRGFIRYGWRWSWRTTVFVTIFNTVNTGLNVYRNKNALSHFVIAGAVTGGLFRINLGLHGLVAGGIIGALLGAPVGSLLMAFQKFYGETVQERTQKDRKALHELKLEESKARLQFTQLLPEEIESSLQKNQSKDDVKKIEALLNLPRNPSSTNKQDKD\n>UniRef90_A0A0F9E616 Deacetylase sirtuin-type domain-containing protein (Fragment) n=1 Tax=marine sediment metagenome TaxID=412755 RepID=A0A0F9E616_9ZZZZ\nMKTIDLFPPCTIENCEDKTPLHKHILDLQQEFLDASERFVAL\n>UniRef90_UPI0021BE6A85 DinB family protein n=1 Tax=Deinococcus sp. 
Marseille-Q6407 TaxID=2969223 RepID=UPI0021BE6A85\nMTQADPRAQASTLAFARLLPKLFRGGQAFLSVEEIISDISPEQAAQQPERLPHSVASLLDHVNWWNRWMLDILESGEAKPYPEHAADTWREVPAGEWNAVKTEFYDLLARIDAHAARPDLSNPVNFEETVGELLADFALHTAHHFGQIISVRQSIGAWPPSGGGDTW\n>UniRef90_A0A1S3XUT0 cytochrome b5-like n=2 Tax=Nicotiana TaxID=4085 RepID=A0A1S3XUT0_TOBAC\nMPTLTKLFTMEEASQHNTKGDCWVVIDGKVYDVSSYLDEHPGGDDVVLAATGKDATDEFEDAGHSKDARELMEKFFIGELDSTSPPIPELEIVKKAAKNIPQKVKEITKQYWFIPVAVVGISVVVGFLYTRKK\n>UniRef90_A0A8T1TPU1 Secreted protein n=2 Tax=Phytophthora cactorum TaxID=29920 RepID=A0A8T1TPU1_9STRA\nMKVALSFFVVVLLSPMTGSSWLAAGNWCLGYTRVLVAGLELMVKDCSAFMFTIVGALEYGSGIIQNGRQVCIC\n>UniRef90_A0A443J140 Ribonuclease n=1 Tax=Siminovitchia fortis TaxID=254758 RepID=A0A443J140_9BACI\nMIIHSIVPHEHIFPANKDDFSNQTECIWNNIPLLVEQDGHKCKVIRIMSSNPSDYLKSEIQPGSHLYINEVHFS\n>UniRef90_A0A2T0LCA4 Bh protein n=1 Tax=Planifilum fimeticola TaxID=201975 RepID=A0A2T0LCA4_9BACL\nMEFQELQTELYCIKCEENEMHVLTYLNQRLYKARCEGCGHELFISPDPRKVLYDEFLQRIVTKPERISRELKENPRRIVTLPYRVISKPYRMYKEMQGLRQFIAQGKSRNGSKIS\n>UniRef90_UPI00203278C4 MarR family transcriptional regulator n=7 Tax=Curtobacterium TaxID=2034 RepID=UPI00203278C4\nMQFVSRAEEAGRTVRVKDLSKHLGLTGPAITGMVDRLEHSGHISRVPNPDDGRSRYIELTDAARRDYARAMDGTNKHLHDLMASFSERERARFVRIIDRIVAAVDLGAPSP\n>UniRef90_A0A6A5UJA8 SET domain-containing protein n=1 Tax=Bimuria novae-zelandiae CBS 107.79 TaxID=1447943 RepID=A0A6A5UJA8_9PLEO\nMGFVSHPESCVNSLPCLFGSGYTVEGQKTSVEAHGGLQIEVIPKYQDHLRRWFQDTDGHVKTLDLNDVDIDWSQNLNEHDTPASIGLRVGQSVRSYAEPALQRKPLNVEGVAGQRDAVTPQAKYWTSNINASFSLSDPLLVPEFSMWNTKAHAATPATATVTTEAWETTLFSGKKKKAKAKNQWSLGSNEGVYLLNLEIHSSCDTLPEQEPAAEEVLEVQTRDPKAMGLAIDGKIVQDIY\n>UniRef90_A0A849VSC1 High-affinity branched-chain amino acid ABC transporter permease LivM n=2 Tax=Phyllobacterium TaxID=28100 
RepID=A0A849VSC1_9HYPH\nMADVQNTERDSVFAKALKEGIISGAIALGLFCLIVGFRTEQNIRNELILTQRWGLLAIFVLVAAVGRFLVTYTAPMRAERKKLHKVAEAREPSAFRKSFPKIGLGLLFLYPALVVLILSAYQGSMMGGLQASLKYVDNFGIQILIYVMLAWGLNIVVGLAGLLDLGYVAFYAVGAYSYALLSAHFGLSFWLLLPMAGIFAATWGIILGFPVLRLRGDYLAIVTLAFGEIIRLVLINWTAVTKGTFGISGIAKATLFGIPFTPGPTGFAAMFGLPNSGVYYKIFLYYLILCLALLTAWVTIRLRRMPVGRAWEALREDEIACRSLGINTTTTKLTAFATGAMFGGFAGSFFAARQGFVSPESFVFLESAIILAMVVLGGMGSLVGIAIAAAVMIGGTELLRELEFLKLIFGPDFTPELYRMLLFGLAMIVVMVWKPRGFAGSREPSAFLHERKMISGEFTKEGHG\n>UniRef90_A0A370FR42 NTE family protein n=4 Tax=Pseudacidovorax TaxID=433923 RepID=A0A370FR42_9BURK\nMSASALPLPGRRPKVNLALQGGGSHGAFTWGVLDALLENGRLALDGISGASAGAVNAVALAHGFAKADDAGDPARTAARQAARETLERVWRRVAGVGAPGALASQFMRMLFGQAPAFPSLTTDPWASPYQFNPLGINPLRTLLDQEIDFDALATLDSPRVYVSATQVRTGRAQIFHGAQLTLSAVMASACLPTMFQAVEIDGEPYWDGGYSANPALLPLIENCDSADIVLVQLNPLHRADTPRTPHEIAQRVDELAFNASLISQMRSIDFMQQLLADGRLQEGRQFRQLRLHRIDIDSALDDPLPSSSKLSTDIAMIEQLFERGRHAAQDWLARHIDDVGRRTTIDIQADYVAGAPLPTEPVAKRAPQLRSA\n>UniRef90_A0A024U664 TAZ-type domain-containing protein (Fragment) n=1 Tax=Aphanomyces invadans TaxID=157072 RepID=A0A024U664_9STRA\nMTSTPFSSSTSTAPMTDGGATLSIQLPLPEQVAVLATHHSEIQLSQTEIHADSTTFLSRVQRYADTGKVDVDGLTATDAAALVHILRRLHATFVKQIDCDEIKCDASRKCPKCGASRVPSSPETSPQRNGTGTTPMSPTAASFRLNGSNSPPADVDMT\n>UniRef90_UPI0016706687 nitrate reductase subunit beta n=2 Tax=Streptomyces TaxID=1883 RepID=UPI0016706687\nMRVMAQIAMVMNLDKCIGCHTCSVTCKQTWTNRAGVEYVWFNNVETRPGQGYPRRYEDQDRWRGGWELTRRGRLRPRSGGRLRRLASIFANPLLPGIRDYYEPWTYDYRTLTEAPAGDDFPVAAPRSLISGERMDTIPWSANWDDNLGGMPGHGPDDPVLARMSQKVRLEFEQSFMFYLPRICEHCLNPSCVAACPSGALYKREEDGIVLVDQDRCRGWRMCVTGCPYKKVYFNHRTGKAEKCTFCYPRVEAGLPTVCSETCVGRLRNLGVLLYDADRVREAAATPREQDLYEAQLSLFLDPHDPAVAGAAERAGIPLAWLDAARRSPVYDLIATHRVALPLHPEYRTMPMVWYVPPLSPVVESLTATGHDGEDEHNLFGAIASLRIPVAYLAELFSAGNTGPVDTALRRLAAMRAHRRRLNLGERPDASIAGSVGMSTEQLDDMYRLLALAKYEDRYVIPTAAVGDARALEESALGGCSLDFEGGPGMGGGHGSGPFGEASGRPAPATVETFHALRARATDDRPADTAGPGARVNLLNWDGNGRPDGLFPPRTGRDGDDADGDGDGDGDGRRR\n>UniRef90_UPI0002DB281B autotransporter domain-containing 
protein n=1 Tax=Chlamydia abortus TaxID=83555 RepID=UPI0002DB281B\nMLCPPPTPEPEPEPPLEGATSLTKLKEANLGSIPSPMGIMHSSVESSETTDNSVFTFEGNSGLTFSENSSDKCGGAIYAKNLKIVSGGPTVFTNNTAKKTGGAIADGGTLSLTAESGDIIFKGNTSNGGTPNAINIGSKAQITDLRASQGRSIIFYDPISFQPEAGTGGTLTEADGTLKINAPDPLPEKSSLPSMGRLMIRAEGDGQPTSKSYTGTVVFSGKSTTKAKEVTNIFLFPSPVELTAGRLVLSDGALFSATSFTQKDADSCVMLEQNTQLQASNSMDLKNLWVNIKDLNSSTFARVSAMGSSGNVNVSGPIIFTVSDPDFYNNPKLAQQLSREFLKISATRGQVTVSDNSNITNDKEETHLGYQGIWKLTWEDSPTGGSGNEKVANLNWQPLGYIPTMDDTQSYTSLVPNSLWGMVADVTAIQRLIEGEANSATGKDIWGAGLSNFFQGKKTHRNRKFRNFSSGYAVGVSSQSLHNFKFSFGFCQLFGQAKDYGETRIHEKILSGSLYTEYSTELLPILKFLAGTSVFKPKILKQVPEDFLVKFQSQSGYFYGDNSMKVRYSDGTQTHSSWENHCYSGDIGTSITLPIKSKDGLLQKATPFVKVQSVYIYQKGFHEKGLRRRAFSHTYLTNISLPLGIKIHGDSLSKDLHYELSAAYVGDAYRHNPKNITMPIVTHVVTTPWLTTATNLQRHAAQFACSGDYALTSYIHLFAQGSIELRKSARGYHANAGSSIHF\n>UniRef90_A0A7C1IRV4 Glycosyltransferase family 2 protein n=1 Tax=Chloroflexi bacterium TaxID=2026724 RepID=A0A7C1IRV4_9CHLR\nMFLSLIFPAHNEEHRLPPSLMAANAFLAKQPFESEIIVVENGSQDLTAVVAEAFAAEHPRVRVIRERGRGKGLAVRRGMLEARGQFRFFADVDLSMPIEEVSKFLPPQLGGFDVAIGSREAPGARRFNEPAYRHVQGRVFSNLVKWFALPGFEDTQCGFKCFTAHAAEDLFRTQTFDGMSFDVEVLFIARQRGYKILEVPIDWYYRSESRVDPLREPLRMLRDIFTIRRNWAAGKYVKREA\n>UniRef90_UPI001E5CF05F helix-turn-helix domain-containing protein n=1 Tax=Streptomyces sp. 
UNOC14_S4 TaxID=2872340 RepID=UPI001E5CF05F\nMADHDETVFFRGGDISALHALVGAEFSPYRLRVTGSCPRAEGSFRRLGRGALSVYELGYGVDADVLPGELPDFYHVHIPLAEHGVLTVDGKEPDSPLSVVGPGQRLVMSWRGDSLNQIVHVPRRTVDRAVAVRLGEPPASVVRFDPSLREENAPVRAWLSVVRAYVEGAEGGLLSASPLAQGHFEQLLVHGLLDTQPHTLGGALRESAAVPPAAVRRAVVFCDEHAHEPISVADIAQAARVSLRALRSGFRAHLGTTPLGHLRRVRLTRAHDDLRAAALGDTAESVTDIALRWGFTHLGRFAQAYRDAYGRTPSQTLRGEG\n>UniRef90_UPI001E4F729E glutamate--cysteine ligase n=1 Tax=Blastococcus atacamensis TaxID=2070508 RepID=UPI001E4F729E\nMGVEEELLVVDANGRPVPKGPQALDVASRAGEGEDVNLHDRAEHGEVETPETAHLMPELKAQQLELGTPVCSTLDDVRRELRHWRGRADAAASAVGARVAALATSPVAVEPVPTEGERYARLNEAFGLTAWDVLTCGCHVHVSVADDEEGVAVLNRIRVWLPVLTAMTANSPYWRGRDTAYASFRSQVWHRWPSAGPNGPFADAADYHRLVDEVLATETVLDTGMIYFDARLSAKWPTVEVRTADVALRVEDAVTLSGIVRGLVETAAREARAGGAVPHMRPEVLRLAAWRAGRSGLSGNLVHPPTGRPAPATDVLAELVDSIRPALSDAGDEQAVEQGVRAILERGTGADLQRRVHRETGDPAAVVRAAVEATHEDADRATAEATG\n>UniRef90_A0A8J3L304 Aminotransferase n=1 Tax=Catellatospora coxensis TaxID=310354 RepID=A0A8J3L304_9ACTN\nMTVSHGPESGRPARFPVASMSDLVDRPVRYDLAESTSPPLRLDELLDGDVADRLGALEIGYGTSQGDAELRALIAAGAGVSPADVLVTAGGSSGMFLLAFTLCRPEDHAVVVTPCFPPARAALDALGCRVTPVALSFDDGYRLDVDAVAAALTPQTRLVSLASPQNPSGVRFTEQELRALLGRMAVAAPHAVLLVDETYRQSCYGAAPVPRSTAGLSPRVVTCSSVSKAHGAPGIRVGWLTVTDPALYESLRVAKFNTLITGSGVDELLAAEVLRREEQILGVRRTALATALDTLDRWTAGHRDAVEFVRPDGGALCCLRLRADRYDDQAVRRFHEELAKRETRVGLGGWFGEPDRVFRLGFGHLPAPDFRTALERLAEALAVA\n>UniRef90_UPI001BED38F5 hypothetical protein n=1 Tax=Arthrobacter sp. 
ISL-28 TaxID=2819108 RepID=UPI001BED38F5\nMKSKLLFGAGIAAGYVLGSRSGRAAYDKLKARATSIWDSKPVQDKVTAATEVVKEKAPEVGDQLSEAARRAGTVLSSAIHRDASKSADATSGGTSASVGTSVSSGTSASATSTSGTGASGTGASTGAGAGGDTLGSGHVPAHSTHPETVNLGTTSDVESDPARNDAMGQDWSDEGGATDAGAATNVDSKRH\n>UniRef90_A0A3B9ZLU8 ABC transporter permease n=1 Tax=Prolixibacteraceae bacterium TaxID=2053594 RepID=A0A3B9ZLU8_9BACT\nMNKSFLILKREYLTRVKKKSFIIMTLLIPLFMAAFTILPAYLASMDDKEERTIAVYDPTSLILGKLEDQGYTKFHYIPEQQYNELRKDFKSGQFYALLYIPENILTTNQAELISDKQITFDIKNMVSGRIGTIIETEKMQQVINETGMPDLEKKLAATKTHIELTTIKLGEEGKAVKSSTEIAMAIGYACGFLIYMFVLLYGTMVMRGVMEEKSSRIVEVIISSVKPFQLLFGKIVGIGLVGLTQIALWIILGIGISTGATFFMGGGSAATAVHAQDIMSGGKAMEQMASSNAAHGNVALDIIQMIGNLNLPLIFFALFFYFIGGFLLYASLFGAVGSAVDSDEDAQQMMFPIMMPLIFSIIMLFPVVKNPEGALAFWVSMIPFTSPVTMMVRIPFGVPVWQIILSMSILVATILGTIWVAGKIYRTGILMYGKKVNLKEIVKWLFYKN\n>UniRef90_A0A136MJX9 Homoserine dehydrogenase n=2 Tax=unclassified Candidatus Omnitrophica TaxID=1047005 RepID=A0A136MJX9_9BACT\nMAKEVKTGLVGFGVVGTGLVQCLQNNQHQIDDRAGIPIRLKTIADLDILTPRDADTSGIHLTTDVNDILNDPEIDVVVELIGGTGFAYDLITQALNAGKDVITANKALLALRGQDLFNLAHKKNRLLLFEAAVGGGIPIIQALRTGICSTEVERIYGILNGTANYILTRMEEAHLDFDVALIEAKAKGYAEADPTYDIEGHDTTHKILLLSQLAFGCQIRFDDIYREGITRLTFFDLQMARELGYRVKLLAIAKREGDRLDIRCHPALIPLSSQLAAVNGVYNAMVVAGHPVGTVMFYGPGAGGPATGAAVASDLMEVARQIQRGNQRRNDYSFDYRNLAIKPVGESACPYYIKLNVLDRPGVVAQVTAVLAEQSISIASFIQKERREPHEAVPIVLTTHEASESAMELAVEKIATLDSVVERPFLIRIENLQ\n>UniRef90_UPI0017897FD0 DUF1906 domain-containing protein n=2 Tax=unclassified Paenibacillus TaxID=185978 RepID=UPI0017897FD0\nMAKGFDCATPLTDSTAAAFKRDGYVFVARYLVPSSWKALSVKEVQSICNAGLQIVSVFETTADRALGGRSAGLKDGAIALDLAAQMGQPPGSTIYFAVDFDATPAQMSSVIAYIKGASEATPGYNTGVYGSYAVVEAVYAAGACSRFWQTYAWSGGKKSSVANIYQYLNDIVVNGIGIDLNESYGQEGWWSTIPADYMLNPEDANKLIGFMKAGYEAANDAAGKEDFHRLANELRKASGQPEQ\n>UniRef90_A0A377GHF6 Sulfate transporter ychM n=2 Tax=Legionellaceae TaxID=444 
RepID=A0A377GHF6_9GAMM\nMLAIVESYRAGLLTSKYWIQNLIAGLIVGVVALPLAMAFAIASGVKPEQGLYTAIIAALIVGIFGGSRVQIAGPTGAFVIILANITAQYGIDGLQIATLFAGFILVFMGFLKLGAVIKFIPDPVIVGFTGGIGVIIFVGEWNDFFGLSVHIPLNAPFYLKLLALIRAFPNLDWSTVGLAGLSLFLILITPKFLKRVPGPLIAMVVATVLQTLFHFKSVATIGSTFGGITQTLPQFHLPQIQLEYAFNLIGPAFTIALLGAIESLLSATAADGMSATRHHSNQELIGQGLANILSPLFGGFAATGAIARTATNIRNGGNSPIAAIVHSIFLILVIVLLAPFASNIPLCTLAAILFVVAYNMSDVPHFIYMIKHAPSYDLLVLITTFLLTIFTDLVVAVNVGVILAMLLFVRRMGQFVAIEQQDHETLKNELSDIILPKNTVVYTIQGPFFFGAAEKLERAFMITHSDPKNIIFRLKDVPFMDITGLQTFIEIIEQFHKRHINVYLCEAKSNVKNKLMNIGVMHLIKGERIFPTLKDTIKKLQN\n>UniRef90_A0A0N0UYH6 Lipocalin-like domain-containing protein n=1 Tax=bacterium 336/3 TaxID=1664068 RepID=A0A0N0UYH6_9BACT\nMKINLILKFLVLVAIFTFSCKKKSEPTPKDLLTAHIWIGVNLNYNVNTFGFSDAQIVNTDSTAVEFTKDNIVIFYTRDVNTGLLTERNRQTYTLSSDSKKIEISSTDGLLSPEIQASLSVFGITVPTSINIEKITTTELILKGSLQQNINIPQLPIPVPLTANYTWTYRN\n>UniRef90_UPI001CF7C5F2 V-set and immunoglobulin domain-containing protein 2 n=1 Tax=Varanus komodoensis TaxID=61221 RepID=UPI001CF7C5F2\nMTGKMKAPAPPHLTLTSATQLPRHPLTGLGACVDVTVPHGQVMQKKGLNVTLPCNYQTSVDKAFMLEWKFSPGSTSPDGGKQILYFTSNTLYKPGAQAKRLHLLQDPPTLGIATIQLTDLRSSDAGIYTCEVNNPPDFYGTSFGQIELIVLMAPSSPVCRGTTSVSVGSNTTLTCNSTEGVPAPIYSWKRLDSKSPLPVSNTVQNEKTGTLELLNVSLALAGIYQCTSSNEFGQKTCQITLQVTAMAQAGVIAGAVIGVLLALLLLVGIAFYVLHRRKQKRNKKAQSIYSANEIREDATAPGISETSLQKKDSKSELHLLESESSRPGSASTTKSQLKHLFI\n>UniRef90_A0A6M3IHK1 Putative peptidase n=2 Tax=viral metagenome TaxID=1070528 RepID=A0A6M3IHK1_9ZZZZ\nMKIERRCLPITELRTIRDEGQRPKISGYAAVFNMLSEDLGGFREKIDPGAFKKSLGASDTRMLWNHDSNYVLGRKSAGTLKLKEDEHGLKIENIPPDTQWARDLLVSIERGDVTQMSFGFRIEEDKWEEKEGKETIRTLVSISDLMDVSPVTYPAYPDTEVALRSLDEWRAQNDPEHANAAGDHSEDANAPESVPFQALHRRRGLELKLKNERAE\n>UniRef90_A0A7L9FI35 Magnesium-translocating P-type ATPase n=1 Tax=Infirmifilum lucidum TaxID=2776706 RepID=A0A7L9FI35_9CREN\nMSSEGEWVERDARELVPGDIVFLRLGSIVPADAKVIDGNVLVDQ\n>UniRef90_A0A538JN64 DUF5666 domain-containing protein n=1 Tax=Actinomycetia bacterium TaxID=1883427 
RepID=A0A538JN64_9ACTN\nMGTRTIKAVSAVTALAGVAAITGMVAYERGESHASSATVRYAVHLDGLAVVDGLDHVSRGHELRVAGSYDGRRGTLTITRN\n>UniRef90_A0A6L5NWZ8 Methyl-accepting transducer domain-containing protein n=1 Tax=Shewanella sp. XMDDZSB0408 TaxID=2664453 RepID=A0A6L5NWZ8_9GAMM\nMFFKKSKAAKVNQSTTAEVLKGSSNRVADKLALTQYSLILCYLPPSLAAQDVSQLTKQLTQRCGDVITIMSSGTISGTENIYNSPDESNVVIHAFPKSMISDVSVAKISIPAHTTDKEIHRHKNSLKSSLKGVNFNFDVDLKDTFILSYFSGLNAFENQTVESILNSGNENFSTHIIGGSAGGKLDFKSAAVAHNGNFSESQLLLVAVKLHPDFGYAINKTHNFAKNRISFVVAKSDNTTRTVTHVLDDNGNLTSIVSYLCSALSCSKQELSAQLANKQFCVDIEGDVMIRSVAAVDLEKESIAFFCDMAFGETIYMVTQEDFATKSNREFDKFTNDLTAKYCQEIDTIIGIDCVLRRLQNDPKVLKQVRLNNVKSHAAFSSFGEIHGQHQNNTSVLVAIYRKQTQSPHASVKRYFVALTEVARYYLAVELNRERFIGELKTSLIDELNHYEGIVVSSTEDLLRLSELSGLIDGEQQTVSQLINELLAKGESQAQIRQDLEARVTELKNSSKQILNVMSSIDAIAEQTNLLALNAAIEAARAGEAGRGFAVVADEVRSLASKSQQDIGRSREAIDSVELSIANISKSVDILTTTSVQMEQSIESAMEQTKKIAELTSKSSQIATHGLSSAQANQNEHVRIQAQKDKLTSLL\n>UniRef90_A0A265NDR7 Hemerythrin domain-containing protein n=1 Tax=Virgibacillus indicus TaxID=2024554 RepID=A0A265NDR7_9BACI\nMAITGPALRHLDSHRSIHQGAYAEARDITDVMNRLFYDNRMEDCLKAANALVEYWETRVIAHADTEDEGFYKELLEKKPELTKEIHMFSRDHDLFRKIVADIKEEISEEEKVTKNMVNQFNALLIIKKHHNKGEEENLFTE\n>UniRef90_A0A838GFU4 Carbohydrate ABC transporter substrate-binding protein n=1 Tax=Chloroflexia bacterium TaxID=2448782 RepID=A0A838GFU4_9CHLR\nMATSWARLYNQDLFTQAGIEAAPTSWSELIDAATRLNEAGITPCAGSWNPSWFGRHFLSDFYSTEYEALTGCDGSPGQSPQDEAAAIKAGILSTDDPRFMAWWPFFKGLTDLWSPEYLAQELSVADEGAQEDFQAGQSAMFYSGSWIPRTLQTVGIEFELGSFSFPQLTTEDIEFATNVDVAGVVGGPNAAFQYAMSTPESNTTLEEEGKEAAVIDFLHYIGTPEVIEKVVNELGSFAPTWPGTTPVTGLETFAEQANTGLRVVNIGNSSATILPSWERLFGLYLSGNLELEEAANQFQRELDRGVQGYEEDNPDLDIDSCFAS\n>UniRef90_A0A1C0A8Z2 LYZ2 domain-containing protein n=1 Tax=Orenia metallireducens TaxID=1413210 
RepID=A0A1C0A8Z2_9FIRM\nMNKPKFKVIFLLVIMIFLAMMGYFWTSLFNSKEVNLKQDDSTGEALVSEEEAEPITEEAQEVQEVEQNSFTNIAYDSYKDWERLLEEYNYNINQELVEIPRVKVEKFPEDIGEISDVAKKKKIFLSIILIGAYHVNQDLIEDRRRLQSIAKQYSISDKIGLEDEEWLNQLKKEYSVKSDDLQESLDLLLVKVDIIPLSLVLAQAACESGWGTSRFTRVANNIFGEWTFSKMVAGVVPKDRPVNATYKIRKFDTIEESIKSYINNLNSHYAYEELWKIRANLREREERLDSLKLAEGLLNYSQRRELYIDELRDIIKYNNLQKLDSLLEE\n>UniRef90_A0A382ZW10 Tripartite tricarboxylate transporter TctB family protein (Fragment) n=2 Tax=root TaxID=1 RepID=A0A382ZW10_9ZZZZ\nMPLDRAIAGIFILICLIYGYTAFVPMEEGLLPFELNMTFLPNTLPKYLSVLGIVIGLVIVLQPRYEGASDSDPNEIDQKKLLQYKFSQALFLLGLMLAYALLLRPIGFVTTTTLFLAFGGIILGERRLVIL\n>UniRef90_UPI0009B405AA mixed lineage kinase domain-like protein n=1 Tax=Monopterus albus TaxID=43700 RepID=UPI0009B405AA\nMDFIDPILSIASQIYTLVENVQANKKRCRRVSDRVRALEELVKSIEKRKTVETSGNVTKALKELYHTLEAAQKLVKKYTLATWVKRILKSSSHEDEFNIVNERLNNAFQVLSGALQLEQGNVLCKVFALASREEEDKMDGKEDDAELGKLLLEHIKDQEEKTKAMQRTFDELKTSVEMVIEKLNKPSITSEGIRMIKLEELKNRRPFMKTPTSEVFKGQYHGFTVAIKRYTGLVNTSPREVRNIFTKEVETMKRFESPNILRMFGICIQDEDGPSPEFLIIMEYCEKGSLRQVLDSDCKLSWLKKACMCLDAAQGLYRSVIWLLDKFICVRNDRNMGRREEKPRYTGVIKKVKCHFECDIL\n>UniRef90_UPI001CA7B725 uncharacterized protein LOC122510909 n=1 Tax=Leptopilina heterotoma TaxID=63436 RepID=UPI001CA7B725\nMPSSCIVDKCISASLIRKGRKLSLFKPRESTLELWRQIVPTKDNKELLKSHVVCELHFNENDMDKTFKTIINGVQHEMQKEKISLKVGAVPSLLLSNVKDKLDYSQIIKEKQIIALPSKNWSVVRTSEFIVWINWINNNPHTDRRIILYPDMKIKVFVYGNEVKEKDMDVKSVGDLIALFEKLEKFFPCGSSGTCRSENCIGFIIQKEKHERGRKFVLCAACSKFTKKINRQKRESDKLMKVKCKIEKLYKNSKNTHQKCKRLLDKV\n>UniRef90_A0A257RIT0 Peptide deformylase n=3 Tax=Acetobacteraceae TaxID=433 RepID=A0A257RIT0_9PROT\nMASAADERADLDSAHAQRYTKNPSFANLNASKFSRFRAGPVCETRQLRHLCIMAILKLARMGHPVLLTRADPVADPTAPEIRRLLADMIETLDDAGGVGLAAPQVHVPLRLFIYKVPERRVSTIEGDEPRGLSAVINPQLTLLDGDPIEDWEGCLSIPGMTALIPRAARLILTGTDASGAKFTRQAAGFHARVIQHEADHLDGILYPTRMTDLRMIGFTDEITKFREDILAVHHNPTL\n>UniRef90_A0A6A4KJ17 Peptidyl-prolyl cis-trans isomerase (Fragment) n=1 Tax=Rhododendron williamsianum TaxID=262921 
RepID=A0A6A4KJ17_9ERIC\nMSSSSDKVRASHILIKHKGSRRKASWKDPDGHVITSTTRESAVAQLKALRDDIVSGKAKFNDSPLVSPIVAPPNAAAISVSLLASAVFSRIRLFRSKIQSPSVRIFYYEAMLSLVLFCKSVPI\n>UniRef90_A0A329J1P4 Phage infection protein n=1 Tax=Pseudomonas sp. RIT 412 TaxID=2202161 RepID=A0A329J1P4_9PSED\nMNTQKLILGLAFSVLATGAFALPTVHGTSAVAENGSSHTHIERVAADGADRVGANRVAENGSDRTALGRIAADGADRVGANRVAENGSDRTALGRIAADGADRVGANRLS\n>UniRef90_A0A6A3LY11 Reverse transcriptase domain-containing protein n=2 Tax=Phytophthora rubi TaxID=129364 RepID=A0A6A3LY11_9STRA\nMSPSSTRSRARRRRRMRRRASAASSTPDEVSSVLSGEAPHDCGEQLYTLVNGVTGDVDSDIGLDPLPSLNALLELEEMPVADFGEALKAGDLAEVVMIRPEDELNSSSLLDEAVLEDTKQALNARSGSAILKDPSDPLYSLVVEFGDVVSKVPPMGLPPDRGVRHEIDLVPGTKYCVMRQWPLPKEQCDVIDAFFRAKHAAGLVRESKSPHSTPTFCVRKSNGKWRIVHAFNKLNAATIPAQTPIPRKDVLQNNMVGCMLYSALDLVDGYYQLLMRASDIPLTAVSTPSGMLWEWLAMPQGLSNAPATFNRLVTQLFRPHRAYAQTYFDDIFVHSRAEHGKSDMENHIDHLRAVLECMRANKLYANADKCIFGAEEIPFLECFIGKRGLRADPAKVKAIVDWPVPANQKDLRKWLGLANYLHKYSENYAELARPLPTLLKKDAEWCWDTGQQEAFEAIKESLLQAPILALPDPDRPFSVVCDASDFAIGCALLQADGEGHERVIAFESRQLKAAEKNYPVHDKELLAMKYVLVKFRVHLLGSKPFVIYTDHASLRTATQSPHLSQRMARWLSFFAEYNFEVKYKPGRQNVLADALSRRPDYELAHVTSVTSSISEMIREAYARDDVCVALLRALGSEEFQNSDIKLSARLRARLHRYSLEGQMLYYSTGSDDTPRAVVPHDEDLKNRILYEAHDVPASGHLGREKTYSSVSRHYWWPKLYQWVKTYVSTCETCQRVKP\n>UniRef90_A0A850EYH4 Ribosomal RNA small subunit methyltransferase D n=2 Tax=Enterobacteriaceae TaxID=543 RepID=A0A850EYH4_9ENTR\nMKRPHSAGGGQIRIIGGQWRSRKLPVPDSPGLRPTTDRVRETLFNWLAPWVTRARCLDCFAGSGALGLEALSRYAASATLLEKDRIVAQQLRKNLETLKAPQGEVVNTDTLSFLAHPGTPFDLVFVDPPFRKGLLNETLHLLEHNGWLADEALIYVESEVENGPPNVPHTWSLHREKVAGQVAWRLYHREVTTGE\n>UniRef90_A0A2M7RS75 Methicillin resistance protein n=2 Tax=Candidatus Gottesmanbacteria TaxID=1752720 
RepID=A0A2M7RS75_9BACT\nMIVKEITDKKIWEAYITQYSPNSLFQSWNWGEVAKKLDDRTNNTKLWRLGFYLNNKLFGIAQVVKVKAKRGIYIQVRHGPILSEWSKKNILMVTDYLKKIGCKENAYFIRMNPLISSSEDNKQIFKEIGFIDAPIHAMDGELVWVLDLNKKKEEIFSGMRKTTRYLIRKGEKLGVKIFKSQNKEDIDNFLILYKKTATRHHFIPHKGIKEEFVTFLKDKQIILFRGYYNNRLLSAALILFYNKQAIYHHSASIEQKVPVSYVLQWEVIKEVMNRGISIYNFWGIAPEDNLHHPWVGLSMFKKGFGGRKVEYLHTKDFILSPKYYFTYLFEYGRKIIKRY\n>UniRef90_A0A3D0LW13 DUF4870 domain-containing protein n=1 Tax=Betaproteobacteria bacterium TaxID=1891241 RepID=A0A3D0LW13_9PROT\nMSPSADDPPFPECPDPPGQTLAVIAEVLYLMNLLLLPGFAFLILLGLYFKEGGAPQLARCHLRQTVAASLWAVALLGAANGLILLLGGYAMPATWVVVILYFTVCHSTLVLLGVLGLAKAMAGRTFIYPVVGRRCDG\n>UniRef90_A0A5C9DQB6 CopG family transcriptional regulator n=1 Tax=Spirochaetes bacterium TaxID=2202144 RepID=A0A5C9DQB6_9SPIR\nMKNITLSMDEKVLRAGREYARRHNISFNVLVRRLVEQAVLSTKDSWLDDTFSLMDTLHASTENVMWTREELYRV\n>UniRef90_A0A438CFM9 Beta-xylosidase/alpha-L-arabinofuranosidase 2 n=1 Tax=Vitis vinifera TaxID=29760 RepID=A0A438CFM9_VITVI\nMSGGGFDISFAKNDDKIASILWVGYPGEAGGAAIADVIFGFYNPSGRLPMTWYPQSYIDKVPMTNMNMRPDPASGYPGRTYRFTLGKPFTHLEMD\n>UniRef90_G1PVF8 Synaptotagmin like 5 n=10 Tax=Vespertilionidae TaxID=9431 RepID=G1PVF8_MYOLU\nMSKNSEFINLSFLLDHEKEMILGVLKRDEYLKKVEEKRIRKLKNELLEAKHRSGKIQQETSRVCVYCQRNLGLIFDRGNPCQACSLRVCSECRVSDLDGSWKCTVCAKVAQLRIITGEWFFEEKAKRFKQVNVLGTDVVRQSILRRNPGGAKEIQSQEKNHQDAEKSNTSPSTGQKASHDESKEKGFLLSKFRSAARGEIIITPNTESGWSYSMDLDSRNFRHLKSAPSSDRRNTGSSDLNDKEVGPGTLKSSQSSGMTPVTHRSPAPSPCNITPVISREHGFENSLDLAAIEGTSEDFTKNHCTNTSGTPSIAVSRASLSSDQSQSELDLSGSFKEDLKDTVNLRSKYVPGALDKDLDSSEETEESIDDVVSSRFSANTHSLASGLSRNSQAGSDKKWTYLNVPDIDSDTASLNSMLSVYSETGDYGNVKVSGEILLHISYCYKTGGLHIFVKNCKNLAIGDEKKQRTDAYVKSYLLPDKSRNNKRKTKIRTGINPEFNETLKYTISHTQLETRTLQLSVWHYDRFGHNSFLGEVEIPFDSWNFENPSDEWFVLQPKMELSTDIGLQYKGELTVVLRYIPPDEYLMFPPGQLQAHTGKKTFKRGTKKPPVLSGGILEVLIKEAKNLTVVKSGGTSDSFVKGYLLPDDKKVTKHKTLVIKRSVNPQWNHTFMFCGLHPQDIKNVCLELTIWDKEAFSSNIFLGGVRLNSGSGVSHGKTVDWMDSQGEEQHLWQKMADNPGTPVEGILMLRSSMGKRQL\n>UniRef90_A0A1G4YLJ9 Acetyltransferase n=2 Tax=unclassified Nitrosospira 
TaxID=2609267 RepID=A0A1G4YLJ9_9PROT\nMNYDVFNGDADGLCALHQLRLAYPVKAELVTGVKRDIKLLDRVQAGAGDWVTVFDISLDSNRSRLMQLLEAAVHVEYFDHHYAGEIPRHINLVSHIDVSADVCTSILVDRSLEGRFRLWAVVAAFGDNLGQSTRSLVGSMGLAESQIEQLAGLGKYLNYNGYGDSVDDLHFHPAKLYEEMKPYPDPFDFIARSTAFNLLAAGFRDDMAMAGSLLPLSEEPCHAAYLLPDAPWARRVVGVFANRLATDHPSRAHAVITPTRHGDYAVSVRAPIAKPEGADMLCMKFETGGGRKAAAGINRLPMDELDRFLAIFAEQFD\n>UniRef90_A0A104MTA2 DUF2384 domain-containing protein n=17 Tax=Burkholderia TaxID=32008 RepID=A0A104MTA2_BURPY\nMTRHAHAIKGTVAILDVETEAALRSAVGAATMLGPDRARALLRLSDEQLGHLFKIGIAQAIDLAATVTFGIAAAATRDKKKSADPARHVKPAARTDGVPADFERGALSERQTLVAEGRLLPAIEVRVGLGITRQALSKAVAAGRIFTLDVGAGQYYPAFYLAGDIDRKTLGKVAQRLGSLPGWSKWQFFTAPKASLGNITPLEALSRGKVEQVERAAAAFAER\n>UniRef90_UPI0021C2958F uncharacterized protein LOC126978868 n=1 Tax=Leptidea sinapis TaxID=189913 RepID=UPI0021C2958F\nMSFLLIYPAVAALTLFIIVVIMVMLRFGATCCKLRHTAFANQEDWLEEEAYEQKVSYA\n>UniRef90_M0NT14 DUF3194 domain-containing protein n=1 Tax=Halorubrum kocurii JCM 14978 TaxID=1230456 RepID=M0NT14_9EURY\nMPSESTDEPTDEEVVRTAAEAAEGVVFAHYDQSAVTDLDVTVTFEEGVLDVDVYLNAPDDPDPDVVAREAAETAGEAVDELFAA\n>UniRef90_A0A8C6TNC3 THAP-type domain-containing protein n=1 Tax=Neogobius melanostomus TaxID=47308 RepID=A0A8C6TNC3_9GOBI\nMPSACYAMGCTNALSQKKGLAFYKFPKDPVRRQKWITRDEPTHANVRKRQSFVYYLPFL\n>UniRef90_UPI000522A661 ubiquitin carboxyl-terminal hydrolase 15-like n=3 Tax=Amniota TaxID=32524 RepID=UPI000522A661\nYLVDSRWFKQWKKYVGFDSWDKYQMGDQNVYPGPIDNSGLLKDGDSQSLKEHLIDELDYILLPTEGWNRLVSWYTLMEGQEPIARKVVEQGMFVKHCKVEVYLTELKLCENGNMNNVVTRRFSKADTIDTIEKEIRKIFNIPGEKETRLWNKYMSNTFEPLNKPDSTIQDAGLYQGQVLVIEQKNEDGTWPRGPSTPKSPGASNFSTLPKISPSLSNNYNNMNNRNVKNSNYCLPSYTAYKNYDYSETGRHNEQPGLCGLSNLGNTCFMNSAIQ\n>UniRef90_UPI000401F0EE valine--tRNA ligase n=1 Tax=Desulfuromonas sp. 
TF TaxID=1232410 RepID=UPI000401F0EE\nMEPKLPKGYEPREVEEKWYAVWEQAGFFRADENSPKPHYSIVIPPPNVTGVLHMGHALNNTLQDILCRWKRMTGHEVLWMPGTDHAGIATQNVVEKQLAGEGKDRHELGREKFIERVWQWREESGGQIINQLKRLGASCDWERERFTMDEGLSRAVREVFVRLFEEGLIYRDNRLINWCPRCHTALSDLEVEHEEKKGHLWHLRYPVQGTDRFLVVATTRPETMLGDTAVAVNPGDERYADLIGRKVLLPLVDREIPIIADEYVDREFGSGAVKITPAHDFNDFEIGKRHDLEFINILDESGNINENGGPYDGLERYEARRKVVADLEAQGLIEKIDDYANAVGECYRCRTVIEPYMSKQWYVDVKPLAKEAIAAVEEGRTKIVPQQWEKTYYEWMYNIQDWCISRQIWWGHRIPAWFCDACGEITVSRQDPTECAQCGSADIRQETDVLDTWFSSALWPFSTMGWPDQTETLAKFYPTSCLVTGFDILFFWVARMMMMGIKFMGEVPFTEVYIHALVRDAQGQKMSKSKGNVIDPLTVIEEYGTDAFRFTLAAFAAMGRDIKLSTERIAGYRNFANKLWNASRFALMNLEDFNPEKVDLDKLELTLADRWILSRLSETAKEVDTALTGYKFNDAANALYSFTWHSFCDWYIELIKDELYGDDPQAKACAQAVLFTVLEQLLRLLHPFMPFITEEIWQALPGRRPEKSIMHAACPNGEDLPVDAEGAEKMERIMDVVKAIRNIRGEMDVAPSRQIAAVLDCKSESSAAVMREGEGYVKALARVNDLICGVEVERPAQAATQVAGEVEILLPLAGLIDVGEEEKRLEKEIAKVEKDVAMFSKKLSNEKFVSNAPPEVLEKDRGKLAAAEEKLGILQESLKKIQALK\n>UniRef90_A0A4S4L702 BAG domain-containing protein n=1 Tax=Phellinidium pouzarii TaxID=167371 RepID=A0A4S4L702_9AGAM\nMAYFCTPSSYASTFYDSPFSRRRPSPPPTTYYSRSNAYDPYVRAIAEEQVARSALQDAIQREQEARRRRTQEEARARARAQETARARSRAARQHAGMFYGLPARYQYADYPECGYGYGYEYGDEGDEDDEIKDTYSPFIHFYSTPEFVSKQGSAPPMSRSSSLRPSQQELRAKETEGQSSSKESTPKVSIPINTPSSQTSQHSDQVRNEAVLKIQTIYRKHVARKAALTEIESIRQRFETQCNAFSFPSVLDFQDDPASPEASAAPEERPRLAYTAHNTPVHVHEDALVKMLQALDSVESHGDATVRDVRRTLVRAVEEELGRVDAAVRRVWEELVVQAKAESHKTTEEPMEVLLDLASESDTTVEAVVDQPALAADQALPTMDVESASIAESIVQPVAEKTESGMEEPEARTFPPAEKTNIESTTSTAAESPFDEIAIDDVPIPSTIDNALGQMAHPISTLAPPPPAADVVFEPIPISEPPLNADSETDSEVETPSQPAVAFPAAQVVSAEDRQDDREEEDDTVLVEETLKTPDGYEKNSETAVVDTEFVLV\n>UniRef90_A0A401PBY0 Tripartite motif containing 62 n=7 Tax=Chondrichthyes TaxID=7777 
RepID=A0A401PBY0_SCYTO\nMACSLKDELLCSICLSIYQDPVSFGCEHYFCRKCIAEHWSRQDQSSRDCPECRRSFRDPLLSPSLKLSNIVERYSAFPLDAILQAQRNSFPCKDHDKVKLFCLNDKCLVCFFCDEPALHEQHHVTNIEESFEEIQRELKDQYEVLQDSEHGHVKALQLLKRQLSETKSSAKSLRATIAEAFERLHRFLKEKQKSMLEELETDTARTLNDIEQKIQRYSHQLREVQEGMQILQEKLVEADKLLFLEGINITLERLKGKIHETNLTYEDFPTSKYMGPLQYTIWKSLFQDIQPVPAALTLDPITAHQRLILSDDCTIVAYGNLHPQPLQDSPKRFDVEVSVLGSDSFDGGVHYWEVMVSEKTQWMIGVALESVNRKGSIQIQPSRGFYCIVMHDGNQYSACTEPWTRLNVKSKLEKVGVYFDYNKSLLTFYNADDMSWLYTFREKFTGKFFPYFSPGQSHANGKNVQPLRINTVRI\n>UniRef90_D5ASH9 Membrane protein, putative n=3 Tax=Rhodobacter TaxID=1060 RepID=D5ASH9_RHOCB\nMETLPILVPPVLNLVSAIAVGALIGTERERRKGEGPARSPAGLRTFAIASTAGAVGFSLGGAVLLAVVAASVAGLLAVSYGKRPHQDPGLTTEIVLLLTVLLGGLCIPAPQMAAAIAVTVTVLLHLKAWLHTLVTTLISKDELDDALIFAAATLVILPLVPDRPMGSWLALNPHSLGIVIVLVMAIGAAGYLAVRLFGARFGLPLSGALSGFVSSTATIGAMGARALQSPEMRAACVAGAVLSTVATVLQMALVLAAVSLPTLRQMILPLVFAGVTAVVYGVVLTLAAMRHPAPEAPGPGSAFSLKTALIFGTVLALVLVLAAGLQAHFGGSGVLLAATAAGLVDTHASAISVATLVAAGKVAPEAAAVPILAGLSANTATKILVAAISGGRGFALRVVPGLVLVILAAWAGSLFW\n>UniRef90_A0A7S3BTX3 Protein kinase domain-containing protein (Fragment) n=1 Tax=Prasinoderma singulare TaxID=676789 RepID=A0A7S3BTX3_9VIRI\nGAAPSASPPRALPAAGGLGPRRSQQSTVPMARTALRAPTARSTARAAARSSRGSRGNHRRAVAAALVGPEAAGALDALALAQQAAEHGVHHAALPSLAEGIGPQCALYDCGDMTYRSTLDLELRKELGGLTLQGKAIIGGVGLYLLATPGVLWGFIDTYIVRLLQRALSPAYRLRDFELGQRLGKGAFGEVFRATCLREGASEDQVVLKRADDYGAEEVWMNGRVSRLPVSTNFARYLGAFRETGRDGSEQTWLAWRYEGDFTLSTYMRRKDFPECLEVSLLGESLEGESKARRRSAVVRELMRQLFEALDAALG\n>UniRef90_A0A812J0M9 Mfhas1 protein n=5 Tax=Symbiodinium TaxID=2949 
RepID=A0A812J0M9_9DINO\nMQKLAKHQNALGQYSSLGTEVFFTEFGADWTSYRSARNRRRVDFSGPQWSLETLEGEQENGLMHKQFIREHIEVLNLAKNKLTDIGCLNAMKDTRAFEFRRLQILNASRNMLTFVKLVNPSLTEINLSHNELIKLPDFSSLTQLSKLLLSHNYIDDMLDQFGQLQKLRVLDLSSNRFFWRPTLFKKQLGHLERIHLEELRFWPNPFAEGFKEYQFITASTLTSLTSLDGFQIDSDLRFQLRVQADQLQLNIADFSIFDVRVEDRGKVGEAEEKCSCRGTSRHHARALLGPHSKHFIPAFLGGREQEVAGVVGILETLKLGDRNVPPQQSGGKVPLLTELIEAMRKSLDQPNDLLKHVYDLEQKVVASDFASGTCHMRHCMQLSVLCLALKLQVLQHPSCNRTSSQVSCMWNAHFWDRRRLMLAEDGERKQRSYMKPAEADRAAAEFADKMQQVLGRFESVQDVLVMCLVRMLGCGNRQLSERCGTLLAEWVDANAEELHDRMDSMSEALFNDLRHALVVGIKSVNEKPMACYEASHGAREPEDDSELEQTEASWHILAALRRFGPSRLYDKVVSPWRARVLRPFLPALCRETKEVLGPDQPPDRWSKYQGFDSFSEDVAEVLEVQEKNLVSCEEKCVRQGFGGFVVEATDELGMVKVCFKQQSPQTLASLRRSSAKRTLHVRPLGRPPKRPNKAAEEGGGRNHAWEAWVDGLAVLVTATSDSQNAAYCVSYFDAHLAVTKHESDKQGFTEAALLGSSEANNAFVRLLQLARNLMQAYGDAGLKAARHFLEAKLHTNCWARARRRLQEGGSPLPVSRLSEMNPDDVALISELVGILHTMVKCGDLEISNQAMNDILAENGMDVFEMLLEVAASSADPDPLFLAISYESVYVFVQSDIMRPRVLSKVISRLRETAILLPYIRGPYIKDVPNEKYMQLWCKCELKYGMKNDARERLEKRYTSLDPDEHSQWRELVPEIRELQNTMMHRTLLGIVKIIQLFSDLARRDDSPPSLKMVTDNVCGGFVKSKKALGEIPGDLLNANDRERLLIGPTTGLVTCPDFDVRVESLICIRHVLEATPDQFDLEEMGWLLNYLTSVGMGIGKQGQFLTEVIDLIKMFVRNNSRTGQSFRNKFAKYAIRECFEMLTVNSRRETHGNKEEAKAKADLTAKIIELLKDCSRPLSGGLRKFLRRVDLLQSIREVLQQEERTSSNPATQILDIWTGRDIRQVLLPIVTSPAFDVHGPVVHAALMRLADVLQAYSWTDVPPTDEAGPWPGLTMLYRLLDYRDAIENEDSGYQQEYFMNSRGLDPLLDFAHRFFAANEDLNILLNRVQDKLAQELGEKERSLRAKWEGRQQDVHQSEASVKTKQEEQTMSEVVQDCLTARLRSLNEGAAAHFRCNLNQYDQKKQEFSLSKLAKVYQNYWKDNENRANQEVQERGDAVYELLRIPDKIAIDGQLRDVQDLGRVPRKQRRIRQPHRDFEKLMYQALSAHKIMKQMLCDSSKRDHNEVARWCQYEPDANGPPSVLAIGLLDFLQDNQALAIDAGLRPREELLVQDKYKYFRRHDRRTNLSCIVLEFPDARCLLAALQEFLKRAQRLFLYQVRNRFRLASDLGEYCIALKFQLQLKDSSIHYSELRMCLSGKSKKNNTVQQYRDTMRKVEEILQSSCDVPTSETTLVAQYLSTMLRSRSIHHSDIIFLRCKDVNLEVDGEEVFAQSAELTSCQLFVIEREAGDGVVKTGDRIRLKSKFTQKYLDVHASGHLRCRLADFSEDYDMTFTVEAIGCRDDYALSRCGMKGSLTEFRSLHTETSLRLKVSASNFVTVRQGANFLTSFGEKLSVKSEPNDAAHEAGQVFTIFRDGALLLDFHSTHSGSRAAIRTLALETSDEILQKTMMEAHMRTEISNGDVDVQGSSFRTVPPEFKTMMWSIAGHFRHVGHSKHAASHEASSLHKLWTRASKNLAAILRCLFVMMEFPQCVGGR
RYVLDTFATRMTQHSSLPRIIALVSAVQLVRKEKMPDGELDLTCALLPKKFMRFCSALLSNLWVCQKPDEIEAIFTVPREQERHERELATIDRERMHLLSMVGSYTCDMVVKPMLDKLRVAGQRPLSRDEVLVFQDFASLCMALVQSIFDNEMRCLSLSNQASHHHHHHGTTAISDKERAGPQSGQSPSHKDAVAIPQNVDDGEQGDALNTNVLLASNADKRRANTLSQASWTYVTHFRAGISSATLAVMTRQDARAAVVAEIIPPITIKALVHLFLYALHQEAIAFRSATRDTEIPVRVISGIINQCVTALAALMTLTGKSNAEVGPTEDAPDASGSCDYDVCEAISQAMTEGAQLVPRARVAQLQAERGADCLRAHVQKMMEEGSFEFSSHRGPKLNLSTERVSTVGFVWTRLAGDIQACASPCFYDKQLFLNDRPRIVMHQDTRCLLVTTTRFRMILLRVPARASVMPQPADLHVLSEPRNMQDLKRVIFDLRTLNSVLESVKDRQVSKCPQSFVRMRQILCLVWDGEEGLKFQRLVFESSGRRRSFQEVLRKVPRKQQDTGEEDGKKETASIRMRARGILESAVKSTSLESLRETCQVRRGGIPLVSVTFVQSTGGLGLNAQLDMLVLTRCSVTVVSFNSFWSKFWRSDDESHYEREVTQASLDTDSEDDRLPDFSESVVATSNDHADKCEALHGPWDLEDLQGVWFLSEASPKVRLQFGSTLEVTFLSDGERQRFRRHLATILAEGAVPRAGKASQAWAVVPTDKTDIKTIQKETGAVQNGRLALTRGEGDDVARDVLPSVCFRSRCALWSGSPHKASSGKFAEHATFGGEADALNKRVACTGDDSEEDEWVVLLEVVEGLRSARAAFSDAEYQVLYSQVHSAWDPGRRFCNPLQRGAVRFCLEEHHVHAEELLASSRILSVAASTLTTLLLQAPSESLFWSSDEANASRDAERLVEGAVRSTFRNISSSMQHHLHLAQELDSFSLTEGQLKAFVSILEHLVDPRVQDLGLAVAKALDQYFQGGVTGEQDVKLLLLQATQPRIVEIRELWHEVKLGALHGPGLGWGVAVNPANLFVLQSFGQPVTYQPRQQEHSQAFWVAAATFEQARVLLLHLEALLRTFGMTINAHGLLQSLSGSSEPFLSQLLACHSDDAEAAEMGTEHDLSRYRRMACSIKYGSAGIDVIASIGGSHPGLAPAQS\n>UniRef90_A0A6A6N897 Receptor-like protein EIX2 n=1 Tax=Hevea brasiliensis TaxID=3981 RepID=A0A6A6N897_HEVBR\nMAWNQLRQWSGIACHNTTGAVLAVDLPNSSGRQPLGGEIRASLAKLKSLKHLDLSGNNFTGKIPHFLSSLENLQYLNLSYAGFSGAIPPNLGNLSSLQFLDVSYWGLTVDNLEWVSGLLSLKYLAMNSVDLSKLGGEWIEPLNKLPLLSELHLEYCGLSGFSYSLPSLNFTSLKVLNLQGSLFKAKLPTWLANISSLVSVDIGNSWLTGRIPLGFGELPNLQSLKLNYNLKLSASCFQLFARSWKKIQILDLSINGLHGVISEAHFHRLGKLEKISLSENSFVLNVSSIWVPPFQVIALEMGSCHLDPLTVKCSNDSNNGGDNYPDGGGKADQTDNGNGFIDKWFYMSIGVGFAAGLLLPYLVFAMKRSWGGVYFAFVDGTAYRLSSEKMKAAARRRNRGAR\n>UniRef90_S7SN88 Polysaccharide biosynthesis protein n=4 Tax=Geobacillus TaxID=129337 
RepID=S7SN88_9BACI\nMRTVASMVAPVSNALYPVSAKLFKKSNDVAIKYLKKFLFIGSLVFMLAGVGMVVFSNVIVLVMTGEENIEIQYLLLIMAFIPLSIYINNIYGTQIMLNLYLEKVFKYLIITNDISLPVLSYILTLNFNLWGASFSLLITEILLTVSMVVYVEFIKKQGFLGVLKK\n>UniRef90_E6QXG0 Secreted protein n=1 Tax=mine drainage metagenome TaxID=410659 RepID=E6QXG0_9ZZZZ\nMWRQVYKWLLIYLLRWMGYWFDEMGSCGSFGTVFRVANDCNGVVCWFGIARGAIVHLVALSFDYGLESFRYLAGALAVWYSLSSVGSGKFTCCTEYCDGQAPIGLGNHCVACVVAADGDGD\n>UniRef90_A0A3N7FFK6 NADH-ubiquinone reductase complex 1 MLRQ subunit n=2 Tax=Populus TaxID=3689 RepID=A0A3N7FFK6_POPTR\nMASSRWIRPEVFPLFASVGVAVGICAMQLVRNICTNPEVRVTKENRAAGVLDNFKEGEKYAEHGLRKFVRNKTPQIMPSINGFFSDPDLPTN\n>UniRef90_B8A485 PHD finger protein 3 (Fragment) n=1 Tax=Danio rerio TaxID=7955 RepID=B8A485_DANRE\nMASRHHADHEMTGAGVRQSPSDGEHNQSGFLQDRRQAGQMQRRQTASRGRVRGRRLGPARKAAESYNRESTCSEEHDRDNSPDEKREALLSRRF\n>UniRef90_UPI001F4BB424 secondary thiamine-phosphate synthase enzyme YjbQ n=2 Tax=Belliella TaxID=232244 RepID=UPI001F4BB424\nMKLFQKEIKLRSYPRGYHLITDVIQSQFPEIKLVHQGVLQIFIKHTSAGLTINENADPTVRKDFETFVNELVPESYPRFIHTYEGSDDMPAHLKSSFLGNSLQIPITGGKLNLGTWQGIYLCEFRDFGGARSLVLTAFGV\n>UniRef90_UPI000F8ECADA GntR family transcriptional regulator n=1 Tax=Pararhodobacter zhoushanensis TaxID=2479545 RepID=UPI000F8ECADA\nMNADAPSGPEALVRDVLQGLAEGRFVPGQRLAEPDLMARYGLGRSTVREGLGRLAASGIVVQAPHRGAQIRLLGRRAAQDVLRVTDLLLGLAARQAAEAVAAGADPAPLIAAARDYDAAVPGERARIRARYYRALTTLAGNAELDRLLPLLQVHLIRAQLRLNRPPGRPARTALVAAVAAGRPDAAEDAARSHIRALIAALPNLPDNAFAPD\n>UniRef90_A0A7X9B2E4 Leucine-rich repeat protein n=1 Tax=Lentisphaerae bacterium TaxID=1932692 RepID=A0A7X9B2E4_9BACT\nMKKLLQRKRRSASTLLAALMTFFLFVGASARGQGAPDPEKDYAYEPYSYGSASGVIITAYLGNEEVVTTPAHLGGQPVIAIGPGVPRVLIDQDMEPDWGTKGFCNTPVTDLTVSEGVLFIDDAGLGNDALTRISLPASLQELGGNPFFAQYNAPNAELVITVAAGNPNFAIEPNSGALIQNGTHLIFWPTLAARAAAVDGLLTIPDGVTHIGTRILAWNRYYDPDARANVYAFTRIAFPAGVTHIADCAFYACHLESLTLPTSLTSLGLWVSFTALDLPASLAHLGGHPSPHQGHLR\n>UniRef90_A0A1H4NAP5 MFS transporter, AAHS family, 4-hydroxybenzoate transporter n=1 Tax=Beijerinckia sp. 
28-YEA-48 TaxID=1882748 RepID=A0A1H4NAP5_9HYPH\nMETEALNVTSLIDDRPIGGLQIAVIILCALVNMLDGIDTQSIGVAAPFIAEGLGIPVAQFGPIFSAALLGAALGAIGFGAVADRLGRKPLLLVALLLIGVFTLLTAHASSVKWLVVYRFLAGAGLGGATPCFIALTSEYAPARNRAACVTLMWAGFPLGAMLGAFANSFLLPAFGWRAIFYIGGLLPLIVAMILIIWLPESLKFLVNRGAFDAARRILQRMGIKTEPGTKLTTNEHKQEGLPLRQVFSEGRGLLTLLLWVPFFISFGILTVAVLWTPTLLRLNGISPAMTAFVVAFNGLGALFGQGLAGRLVERFGALRTLVPAFILGALATAGLGYGASSVAAASFFIGLNGLFLGLASGGAIALAALLYPTAVRSSGVGLGMAMGRFGQVVSPLIAGGMLGAGFNAGQIMVVIGSGALVGALFVIWFRILAARRHIATVGTEASTG\n>UniRef90_A0A848GUV0 Signal peptide protein n=1 Tax=Ramlibacter agri TaxID=2728837 RepID=A0A848GUV0_9BURK\nMKLAVLALSLLACGSAFAQAAATAPEPDYTASVNIGAVTDYRYRGISQSRLQPALQGGADFAHKSGFYIGTWASSIKWVKDAGGNADAEVDLYGGYKFNGGPVAFDVGALRYLYPSSQLAVSPNTTELYVSGTYGPATLKYSHAITNLFGFADSKNSYYVDLNATFDTGYWGLTVTPHIGYQGIKNNSGFSYTDWSVALGKDFGNGFSASLAYVDTNNSNYRSPDGKDLGRATAVLGVKYTYSF\n>UniRef90_UPI00214A619A hypothetical protein n=2 Tax=Lachnospiraceae TaxID=186803 RepID=UPI00214A619A\nMIRNIYTKTLDSGPITPVSARKEKEKALSWRNTLMEHQKHLDKTLSQCISEDEYRLTAMELDCLEHVIQLDDFYDFCTDYMCEHGIDTVVDIGCAYGHQSEAFLEENLGYIGIESSGDSPKWNIDKCMYLTEKYPCKIPDGCRFAVSNMCFEYFINDYEALAHDFDTVILSGLGKNTKVFELFDVEEIHYRPLIDSNAIWNLFILTNKHIGD\n>UniRef90_A0A0D6A1E3 Transcriptional regulator n=1 Tax=Lactobacillus acetotolerans TaxID=1600 RepID=A0A0D6A1E3_9LACO\nMTDVVRKDVKQRLENGDYSCAKELTLSMFSGKWKIVILFHLGTDGPYRFNQLMRLLPKTSHKVLTNQLREMEEDQLISRTVKSDS\n>UniRef90_A0A2H6N9Y6 Cytosolic carboxypeptidase 1 n=1 Tax=Micrurus lemniscatus carvalhoi TaxID=129465 
RepID=A0A2H6N9Y6_MICLE\nMWHCTVKVLKYGILLPFLNRTKIAQDIERLIHPNDIIDRVVYDLDNLSCLVPDEGDVLKFNSKFESGNLRKVIQIRKNEYDLILNSDINSNHYHQWFYFEVSGMRTGNAYRFNIINCEKTNSQFNYGMQPLMYSVQEALGGRPSWIRTGTDICYYKNHFSRSSIAAGGQKGKSYYTITFTVTFHHKDDVCYFAYHYPYTYSALMMHLQKLESTNNPQQIYFRQHLLCETLSGNNCPVVTITAMPESNYYEHICQFRNRPYIFLSARVHPGETNSSWVMKGTLEYLMSNTPGAQNLRESYIFKIVPMLNPDGVINGNHRCSLSGEDLNRQWQNPNPDLHPTIYHAKGLLQYLAAIKRLPLVFCDYHGHSRKKNVFMYGCSIKETIWHTNVSAASCDLIEDLGYRTLPKILSQAAPAFCMSSCSFVVEKSKESTARVVVWREIGVQRSYTMESTLCGCDQGKYKGLQIGTHELEEMGAKFCTGLLRLKKLTSPLEYNLPSTLLDIENELIESSCKVTSPTTYVLEEDEPHFLEEVDYSAESNDEPDIDLANNAGDYEPCLHEDGLSDSEITRTHLP\n>UniRef90_UPI00197F5B0B hypothetical protein n=1 Tax=Pseudomonas viridiflava TaxID=33069 RepID=UPI00197F5B0B\nISHKIQFLQWVAGCLIRGGLPAMNDDAVLLTYRVDCIAGKPPPKVKCLPRDSATAKTWWCLPQSEFAAR\n>UniRef90_A0A1E5KYP1 Zn-finger containing protein n=1 Tax=Enterococcus rivorum TaxID=762845 RepID=A0A1E5KYP1_9ENTE\nMGQVWMERLMRWNAKLQHFLKGRYARMDQLNKTMLIGSIVLIIANSFLPTSVLRWIGLALIVFIYYRFLSKRIYVRANENTKYLKIHNRIFGKIKKIKLRFQQRKIYKYFTCPSCKQSLRAPKGKGQIKVTCSKCHQQFSKKV\n>UniRef90_E3MKT5 Eukaryotic translation initiation factor 3 subunit A n=1 Tax=Caenorhabditis remanei TaxID=31234 RepID=E3MKT5_CAERE\nMAPNYFQKPEAALKRAEELIQVGKESDALDTLHDTIKARRHKQWTQTHEAIMIKHMELCVDLKKQHLAKDALFQYKALTQQINVKSLETVVEHFLKLAESKTEEAQKQSIEKVEEIGDLDQGDVPERLLLAVVSGAAAQDRMDRTVLAPWLRFLWDSYRNCLELLRNNAQVEHLYHQISRHSFSFCLRYQRRTEFRKLCDLLRMHLNQIQKHQYAPNVNSFRVKLTSPESLALMQDTRLVQLDTAIQMELWQEAYKSAEDVHGMMQLSKDKDKRTVKPSSYVNYYDKLALVFWKAGNSLFHAAALLQKFIIYKDMKKSFTQEEAQEQATRVLLATLSIPEGSDSPSDLSRNLDIEEQHVANMRLLSNLLRLPIAPTKNGILKEAARIGVPEASGQIAKDLYKLLESNFSPLKVAKDVQAVLDTITRPDHQQYVESLQAVAAVKALKQVSVIYEAISWERIRKIIPFYSDLALERVVVEASKHRIVKAQIDHRADCVRFGSSDATLAGGVDECDNNEGFTGDDTQLGVEGVRNHLEAMYTRLRVLVEGLDAEKRRKEMVRKIENHVTSYEKNRPTEIDRIHRRKKMLENYKENWERVKAEKTLQAATEQAKREEAARAEEMKRLEEQNKESERKRKQAEAEEIQKKIKQDQLYKMQQNAIYQAIIKEKGLDQFRDMDPEQVLREQRERLDKERAETQRRLQQQEKNFDHHVRALHLEEMNERRAVMHMRMNEAPKLHDQYEEQRITKEM\n>UniRef90_UPI001D11B2C3 phosphoribosyltransferase family protein n=1 
Tax=Aquihabitans sp. Kera 3 TaxID=2884263 RepID=UPI001D11B2C3\nMTTAEPIEEREALTYELFGTAIRDLAHQVDDSGWEPDWILSIARGGLLIGGALAYALGMKNVATMNVEFYTDVEQRRDVPVVLPPVLELVHLADTKVLVADDVADTGETLQLVRDMVADTVAEVRTLVVYEKSRSVIRPDYVWRRTDRWIDFAWSAQPPVTRRPGVF\n>UniRef90_UPI001CFFCFA9 GNAT family N-acetyltransferase n=1 Tax=Arthrobacter sp. ES1 TaxID=1897056 RepID=UPI001CFFCFA9\nMSVSFLQVRPLTDADAAVLGAWAEDELFCRHAGWTSSSPAKVCDFWIRQIKDPPTGLLRLAAESVDRELLGYMDLHGTDPESRELGFLVGPSRRWGHGLGRRIAEAGLTYGFTELSLERIWAEAVAANVASVQILRSLGMRETGRGEAETFLETNSYYLQFEILRDAWELGADR\n>UniRef90_A0A1C6SX88 Beta_helix domain-containing protein n=2 Tax=Micromonospora rhizosphaerae TaxID=568872 RepID=A0A1C6SX88_9ACTN\nMTALPSASARTAPSASTPPPRRSTSPSPRSAANPRHSLKAGKNSRAGCALPKYPSPDCTGVPAGTRLATLRLNLDNDSYAVYEAGAVIDRKHIPGNLLIRAPNVTVKDSQIDGTVFNDYNGRLHPFTIVDSTIGPATGCITAPGLAYANYTAKRVRIRGHDDGFRVATPGNVRIEDSYAKLCWNPPELAPPDGSHSGGIQADCRAGECVGIWFNHNTIDNRGPNGNSGITMMSFDGNPVRNVISNDNLVMGGGYSIIYWWTTGPNFELHNNRVVEGTYVYAPADANGTCAHQNWSGNTLVTIDARYNVTSTVGPLPCIQ\n>UniRef90_A0A0H4BB36 Uma2 domain-containing protein n=1 Tax=Synechococcus sp. 
(strain WH8020) TaxID=32052 RepID=A0A0H4BB36_SYNPY\nMWQQQPDYARYKEKLNGEGWLVNRQEGMLLQIKPDTPTQHAQFVLVSYYHLSARIGKPVRQQRMLRHLGIEMWINLQKIGWERCLAPQN\n>UniRef90_A0A496XIQ2 Alkaline serine protease n=1 Tax=Gammaproteobacteria bacterium TaxID=1913989 RepID=A0A496XIQ2_9GAMM\nMRHHTRAVGLLVCLLSSAVQSAPAPETETLQVMLQGGSSQELTQLVETQGGTITHDLHIINAVGALLTQAQLDKVLKSPLVTRHIDDLSVSEAPDEPDESTCEVGGALELDYDTRGLRWTLYNKLPAPAILETLELTWPATLGTVEKISLGDTTIDPELYRDTQIGTLKLQFSGPAAPVLTGKADLRVDLKSPSLLHTSDLPLRQRDFTITASFLGDCSTKLIPGYENNHENFYYASVAGADALHLQGITGKGVTVAVLDSGLWEHEALVNDTSGKPRVLARYDAIKNISGNEVFDESGHGTHMTSVIAHSGAVTVDGKPTGSFKGTAPNVNLVAVKAFDVEGQGDLLDIVRAVQWVVDNRETYDIRVLNLSFSARPRWHYWEDPINQTIMRAWASGIIVIAAAGNTGPDPMTIGSPGNLPYVITVGAMTDSWTPDNRDDDYIPDFSSRGPTPTAHIKPDIVAPGGHITGLTRPNSTLMLEHPDYMLSTGEFVMTGSSQASALVSGIAALLLELEPNLSPDDIKCKLLSSAEPAIHRDGFLAYSPFQQGHGQVNATRAVTLGQIGCGNSDMNIRLDISGVKHFQGPAIVESDGNASLPGLSKIVSPEPSERGLSKTRKWGVKAHIERLDPAVTDLESSEISPIDWQKIYRQEKTAMESLIHEPPE\n>UniRef90_A0A520FEH4 3-isopropylmalate dehydratase large subunit (Fragment) n=1 Tax=Sphingomonas sp. 
TaxID=28214 RepID=A0A520FEH4_SPHSX\nMRSRPQTLYEKIWAAHVVERRDDGTCLVYIDRHLVHEVTSPQAFDGLRLAGRKVRRPDLTLAVPDHNLPTTQRVDAAGRELPIADPESAAQLDALRRNTTEFGIDYIDANAVQQGIVHVIGPELGFTLPGTTLVCGDSHTSAHGALGALAFGIGTSEVEHVLATQTLLLSPSKTMEVRVDGTLGFGVSAKDVILSIIGKIGAAGGTGHVIEYTGEVIRALSIEGRLTIANMSIEGGARAGLVAPDDTTFAYLKGRPLAPTGAAW\n>UniRef90_A0A842QUU5 Flap endonuclease 1 n=1 Tax=Candidatus Bathyarchaeota archaeon TaxID=2026714 RepID=A0A842QUU5_9ARCH\nMGVDLKSILVKDTIKLDELKGKVITIDASNILHQFLSTIRKPDGTPLTDSQGNVTSHLIGLFYRTLKMMREFSVKPVYVFDGEMPDLKTDVVEKRAERRREAKKKWSKAKQVGKDEKAFKEAVKTGFLDDQMIKDAKLLLNNMGLPIVQAPAEAEAQCAYMTHDEEIYAMNSRDYDSMLFGASKLLRYMTISNKDNIEIIDLDKFLNHHEISWAQLVDMGILIGTDYNEGVFRVGPKTALKLIKRHGSIEKIPEKYQKKLDENYADVRKLFLDPPLIEDYSLEFKEINRNGVMQFLCEERGFPHERVLNNLEK\n>UniRef90_A0A4Q3S4G9 Acyltransferase domain-containing protein (Fragment) n=1 Tax=Chitinophagaceae bacterium TaxID=1869212 RepID=A0A4Q3S4G9_9BACT\nMKAYIFPGQGAQFSGMGKELYENEQAKAMFEKANEIIG\n>UniRef90_A0A1Z4EIA0 Peptidase M24 n=1 Tax=Mycobacterium shigaense TaxID=722731 RepID=A0A1Z4EIA0_9MYCO\nMVLALTGYVWQQDVGAVFRRDTVLITDGGVDVLTDSPSWG\n>UniRef90_A0A672Z142 Cytoplasmic linker associated protein 1a n=1 Tax=Sphaeramia orbicularis TaxID=375764 
RepID=A0A672Z142_9TELE\nMDLNMEDLLEQLMHKDLGRRIQVGQEILELIPDQDKFPELEQDQTLLDRMVDTVAGSWVNSSNFKVGVASTCLIKGLCLCLIATLNVSFSHLSMNCLVEIYRHVGERVRMDLGKKGLPQSRLNVIFSRFDEVQRSGNMVLSPLSGETYLLTPQTDGGGAGAVDEQDFIQSFDDVPTLQIYSNREVEETMTKIRDVLSDDKRDWELRVAALKKVRSLLLAGAVEFDGFLQQLRLMEAPFKLSVKDLRSQVVREACITLGHLSSVLGGRFDHAAEAIMPALLNLVPNSAKVMATSGVAAIRLILRHTHYPRLIPIITSNCTSKSVAVRRRCFEFMDLLLQEWQTNALERHGTVLMETIKKGIHDADAEARSVARKCYWGFHGHFSREAEQLFQTLESSYQKALQAHLRSGDSLMSLPASDRSSSSSQEIVFLTPASTSSSGSLHRSRSDVDVNAAATATARTRMPAVPAAMQAPPFSSASALPPGSYASLGETHLTTLSFGGSLWTAGRVLKHFHCFPAGSRSGSPGRLLSSTYGRIPRPTMGTAAATGCISGGTMEKGRPRGHRSQGCSRETSPSRSARSRIPRPSMSQGCSRETSRESSRDTSPARGFSPLDRLSHQARISASVNAMRILNTGTEVEAAVADALLLGDSRSKRRPARRRYESPGMYSDDDANSDASSACSERSFSSRNGGVAPHFLRQTEDVAEVLNHCASANWSERKEGLLGLQNLLKGQRTLSRVELKRLCEIFTRMFADPHSKVFSMFLETLVDFIVLHRDDLQDWLFVLLTQLLKKMGADLLGSVQAKVQKALDVTRESFPFEQQFNILMRFIVDQTQTPNLKVKVAILRYIHALARQMDPADFVNSSETRLAVSRIITWTTEPKSSDVRKAAQVVLIALFELNTPEFTMLLGALPKTFQDGTTKLLHNHLRNLCFLRPQASSGTALGRTPPRPPSSRGSPLTSPTNCSHGGLSPSMLDYGSENLNSEEIYSSLRGVSEAIQNFSFRSQEDLMESPRSDGMSGVAASSESAVEVGGRTALDNKTSLLNTPSPRSFAGPRFRDYNPYNYSDAIGSTDKVATKEALYEDAVDPAEQLELVGDLLKALSQAQGGEPGLDERRRTLLELLKVAREDSLVVWEEHFKTTLLLLLETLGDKDHTIRALAMRVLKEILRNQPARFKNYAELTIMKTLEAHKDSHKEVVRAAEEAASTLAGSIHPDQCIKVLCPIVQTADYPINLAAIKMQTRAIERIAKEPLHQLLPDIIPGLLQGYDNTESSVRKASVFCLVAIYSVIGEELKPYLAQLTGSKVPWESLRLVCTCADVGIQSHVKGMGKESVWLEMFF\n>UniRef90_A0A7W5NUZ0 Glycosyltransferase involved in cell wall biosynthesis n=5 Tax=Pseudoxanthomonas TaxID=83618 RepID=A0A7W5NUZ0_9GAMM\nMNTMAARLPAQDADTLVSVIMPVYNAEQTLRRSADSVLAQSFGQLELILIDDGSRDGSAAIVEELARRDERVVAVRQPNGGVAAARNTGLRAARGTHIAFLDSDDWWEPRKLELQLAWMRETGAMVCYASYQRVAEDGRLLSKVSPPLEVDYRRMLGSNHIGNLTGIYDRRLGEASFQKMGHEDYVFWLDRVRRAGSAVRVPGDAPLAYYLVRNGSVSANKLRAAGWQWRIYRQVEGLSAPRAAWYMLQYIRHALWKRKPVTT\n>UniRef90_A0A534HYX9 DNA alkylation repair protein n=1 Tax=Euryarchaeota archaeon TaxID=2026739 
RepID=A0A534HYX9_9EURY\nMAGPVERMREDLVRQLDAAKRPGKLGAQAYLGSPVPVLGVPVPDLRKIVSGFKKTHKDVDAKTLNPLAASLWDGATFEEKAVAINLLDACLKILDEDSWTLLNRWAGEATGWGLCDWLGMGLIAKIVYRQPRRFQEILGWTKSTNPWRRRIAVYALRNFVFAGELDKPFRLLERLLYDPEVWVQRAVGTWLRECWKKDPRRTEAFLRKHVRGLPKVVITVATERAPAVFRAELRRGREPEAR\n>UniRef90_A0A2N2AM00 Precorrin-6Y C5,15-methyltransferase (Decarboxylating) subunit CbiT n=1 Tax=Firmicutes bacterium HGW-Firmicutes-8 TaxID=2013789 RepID=A0A2N2AM00_9FIRM\nMSDKQWIYRTGGIPDELFARDEVPMTKAEVRAVTLAKARLQESHVIWDIGAGTGSISIEAALMAVTGKVFAIEKKPEGVQLIKKNIEIFAVANITVCSGIAPEALQGLPEPDRVFIGGSGGNMAEIIRYVHEKMPIGGRVVVNAIVLESLVTSVETMKKYGFGDIDVTQVSIAKTVDVGRLHMFKSHNPVFIISGEKTTNQLTVKKETTEGLAQRSCNQF\n>UniRef90_A0A2G2LVQ5 DNA-binding response regulator n=1 Tax=Robiginitomaculum sp. TaxID=2030823 RepID=A0A2G2LVQ5_9PROT\nMQSTEQEKAHLLVVDDDDRIRDLLRTYLSRHGYRISVASDAKRVRRLLKTLEFDLVVLDVMMPGEDGISLTRFLRQSSAIPIFLLTARGAPEERIEGLRAGADDYLSKPFEPEELLLRIGAILRRKGTTIGSGATLQFGPWRFTPSTGELVGTKGRVSLTDNEARLLAALCKRPGEAFSREALSRDTAAIERSVDVQIARLRRKIEDNSRFPQYLQTVRGAGYRLLAHHVSETSSA\n>UniRef90_A0A699XL38 Secreted protein (Fragment) n=1 Tax=Tanacetum cinerariifolium TaxID=118510 RepID=A0A699XL38_TANCI\nMPSAPMMASCLACTPLANVMSPDDVSTSTHCSLVSSWTATLCGDTPDLVVDDKLDRLASTFFLQSAVHEHLVHVLTVEHV\n>UniRef90_UPI001FF62731 hypothetical protein n=1 Tax=Amycolatopsis sp. WQ 127309 TaxID=2932773 RepID=UPI001FF62731\nMPPTQTFMVVAVLRDDTDLAEFAALRNDEEKQLELLRSAGRIGAHYISPARRATFVEVIADDEKQVAETLATLPFARFFDADVYPTAPPDAAEIAYRARAATA\n>UniRef90_A0A8S5L7T1 Large Terminase n=1 Tax=Myoviridae sp. 
ctKHS5 TaxID=2823541 RepID=A0A8S5L7T1_9CAUD\nMKSKEFLAELRAYADSLRQKVEAEFDGWDDSLQAIAERRKKVFDPVTGYDYFVSHYFPHYVRSPHRSELHDYLFATLPEVLADPKSVNMATAAPRGEAKSTLVSQLLTVYCLITQQKRYALIVMDSINQAYPMLESIKVELEFNQRLKIDFPEVAGQGRVWQATTILTKANQKVEIAGSGKRLRGLRHGAYRPDLVILDDIENDELVRSAEQRDKLHDWLKKTVLPLGVPGEKMDVVYIGTILHYDSVLNRTLSSKAWKTAKFKALKKMPDDMALWDKWESFYLNEGEAVADAFYYANRAAMDKGAEISWAARPLLALMKIRARDGHATFDSEYQNDPVSSEDAIFANAIRYWTELPSDLIYFGALDPSLGKAGASRDPSAILVGGYQRSTGKLYVVEAQIKKRLPDLIIEDVIRLHKQYHCQRWFVETVQFQEFLKDELVKRSAQRGCPVPATAIKPNTDKMLRIESLQPHMVNGLIMLHGSQATLIAQLRHFPKADHDDGPDALEMLFKNAASCAAPIEWMGLDALDDDEYDDNDLGYSKWKH\n>UniRef90_A0A651EH65 DNA-binding response regulator (Fragment) n=1 Tax=Rhodobacteraceae bacterium TaxID=1904441 RepID=A0A651EH65_9RHOB\nMATIALVDDDRNILTSVSLALEAEGFDVRSFTDGVAALAEFGRNAPDLAVLDIKMPRLDGMELLRRLRLKSDLPVIFLTSKDEEIDEVLGLRMGADDYIRKPFSQRLLIERIRAVLRRREAAVEGEREEDDRPLTRGRLTMDPLKHDAFWGGQEVTLTVTEFLILRALAQRPGVVKSRDQLMDVAYDDQVYVDDRTIDSHIKRIRKKFR\n>UniRef90_A0A1C9CI92 Acyl carrier protein n=2 Tax=Rhodochaete parvula TaxID=110510 RepID=A0A1C9CI92_9RHOD\nMEKHSISDRVKNIVSEQLGVNLDEVTDQASFVDDLGADTLDTVELVMAFEEEFSFEIPDEDAEKIKTVAQAMEFIQQKVEATAT\n>UniRef90_A0A2E7B655 Type IV pilus biogenesis protein PilP n=1 Tax=Hyphomonas sp. 
TaxID=87 RepID=A0A2E7B655_9PROT\nMLTLPLLAKMSSAAVAAAITASLTYGQYNIASGPNGSGLMPPASVLHPNARPGAMLDPLAEMASAMTSLKQERAKADRNRAMIDWLAGLQTRFTVQRFETGLVYKVRYAAAGXAGTVLQDXVAVPYGPELPXAVSLQAGXGGXVRVEGLSCSGQETLSEMDAGAGEQAVETAAMSRAEAYLXQPXAADPALPADCLMARLKRG\n>UniRef90_A0A3N2C5J3 Vegetative cell wall protein gp1-like n=1 Tax=Plantibacter flavus TaxID=150123 RepID=A0A3N2C5J3_9MICO\nMQTPPASRGSSTPPEPEAVPGPPRPPSSPGHRADPCRSPSRPSRSLSRPSRSPSRPLPVTEQPAPVTEPVEVPHTEAPRPTTLPGGPSTSSGNEYPHPGHASQPRSPSNPPRSPSNPHRSLSLSKCHTPKPPAPQRSPGALRHFDKLSAAKLRERTSLPRSPIRPSRSLSLSKCHTPKPPDPRRHPGGPSTLRQAQCGAAQGTDIPPPVTEQTAPGH\n>UniRef90_A0A5J4QFG3 Virulence protein (Fragment) n=1 Tax=termite gut metagenome TaxID=433724 RepID=A0A5J4QFG3_9ZZZZ\nMEDIPMKENEDIGGRKSKNEQIESYLQERYDFRFNTVKSKPEFRPKNGNHPFSPVTKFDLNSLKREMDRTMGIATSSDNVRTILESDFSPKIHPVREYFNRLPRLDPDINNYTWQLSQTVRVANSDKWLEYLVKWLVGVVANALHDVGCQNHTCLVLTGEQGRFKTTWLDHLCPPSLQSYLFTGKIDPQNKDVLTLIAEYLFINIDDQLKALNKRDENELKNLITTPAVKYRRPYGVYIEEYSHLASFMASVNGNDFLTDPTGSRRFLPFEVISIDME\n>UniRef90_UPI0014789B01 phosphoribosylformylglycinamidine cyclo-ligase n=1 Tax=Leucothrix arctica TaxID=1481894 RepID=UPI0014789B01\nMEENKTSLTYQDAGVSIETGNALIDRIKPHAKRTKRPEVLGGLGGFGALMSIPSRYENPVLVSGTDGVGTKLKLAIDMNRFDTIGVDLVAMCVNDIIVTGAEPLFFLDYYATGKLNNDDAENVIKGIADGCEQAGAALIGGETAEMPGIYREGDFDLAGFSVGVVERDAIIDQSSVANGNVLIGLASSGPHSNGYSLVRKVIEVSGAKLDEKFSDKEETLLGDALLEPTIIYVKPLLKALKQFDIKALAHITGGGLTENLPRVLPSNCKAVIDLTSWDRPEIFNWLQKEGNIEDMEMLKTFNCGIGMVLVVAEDQADEVINSFKLQDIKSFKLGQISAAETEEAYVEYV\n>UniRef90_A0A1I7TZE8 G_PROTEIN_RECEP_F1_2 domain-containing protein n=2 Tax=Caenorhabditis tropicalis TaxID=1561998 RepID=A0A1I7TZE8_9PELO\nMDKKYMNCTRCELCATADVIYGTPFMEYSILLRLLTAPLATMGMGLLSATIVKTKGIHINTKVILFVLCISAITCNTGITIDCLYKFFISNVMPDYMQCDFQVFNPQYGLVIRHIEMLGSMCLSTSSIALAVERTVATIFYRNYPSKPTLGSILVVVQIHDYKFYHFITTWQALLNVLAISVFIILWIINYYRMKIIENSHLQVVLARYNLHENMSTTCLMAPIIVVLCLMVFSAELIILLFTPQYDEDTVVTHKVLDEVIEYSFYPELQLTLIPIFFIALILVLITQSKKLRENFLLVSNLSICFPVKVHTTDSRSSSESSSSEGSSSIHWNSKMDGLSITPQVPKF\n>UniRef90_A0A3M2HUF5 Spermidine synthase n=2 
Tax=Stutzerimonas TaxID=2901164 RepID=A0A3M2HUF5_9GAMM\nMKRFVLIDTAQIPDDGGALCLFEYGEDFVIKIQGGNGNQLMNTRTHGSEDALAEIPCRKIAQRPHPRVLIGGLGMGFTLASALRHLGEDAEVHVAELVPGVIEWNRGPLGEKAGMPINDPRARVLRSDVADILKNEPQGFDAIMLDVDNGPEGLTRKSNSWLYSSAGLEACAKALRPKGLLAVWSASADQAFSQKLARSGFNAEEVQVFAHGNRGTRHTIWIAEKRE\n>UniRef90_A0A2T1LZU9 histidine kinase n=1 Tax=Aphanothece hegewaldii CCALA 016 TaxID=2107694 RepID=A0A2T1LZU9_9CHRO\nMKEQDIKRQFLDEAGDYLNVIESALLGCSTKEITSAQFDAVLRAAHSIKGGAAMMGYQTLSDFAHRLEDFFKVLKSHSKPEIDETVESLFLSSVDQLRQISSFYRQGAETIAPEWLSEQVEPIFQGLLDRIGELTPEKSLSLLSEDVGEEMTVLIFETEVESCLQGLESIIAQPQPTNLREEILSISQELGGLGEMLQLPQFSRLCTSIYEHLKSATEGIDAIALSAIQAWRRAQAMVIVGQKEAITSEFLLNHSTVIPTLETETTSPEELKIETVSTEEKTLRVSSSLLTELADLFGEMSIGRNSMDLQLQRLRRLFNLLNQRIQRLESSSQALRSLYDQRIQGYTSSVIPIKTNSVKPHLALFDNLEMDNYSDLHPLSQEVMETIFQIEEVANDLDIYLAETEKTAKDSQQTFELIQSQLTKARMRPLTDLIAHFPRALRDMSLKYGKPVELKIQGETTRIDRTILESLNDPLLHLLRNAFDHGIEDPEKRKEVGKPPQGTITISASTVRNHTIIQIQDDGAGINLDKIRSQAHKMGLDEDIIAKATIDDLLNLIFEPGFSTAENKSELSGRGVGMDIVKTQVQQMQGDIKVSTLAGQGTTFTITVPMTLSLIRVLLIEVEQMLMAVPCNAIEAMILPEPSQIIQFKGQTFLKEESELFPLIYLKDWLNIPTVYTQRDHESLPSIDKPTILKIALGNNYIGLWVERYWGEQEVTIRPVEGNLKLPNGFTGCTILGDGCVVPLIDPALLLQPSFPPSFLSSSFISNSQPTAQKATLLVIDDSINVRRLLALTLEKAGYQVEQAKDGQDALEKLQRGLGVQGIICDIEMPRLDGYGFLANYKTDSIGQNIPVVMLTSRSGEKHRSIAMNLGASAYFSKPFQEKLLLQTLQSLIKN\n>UniRef90_A0A0R0EP28 Glutamyl-tRNA(Gln) amidotransferase subunit C, chloroplastic/mitochondrial n=4 Tax=Glycine subgen. 
Soja TaxID=1462606 RepID=A0A0R0EP28_SOYBN\nMTSKGLLRGASLTANAVWHRSSFFPKVTVSVHPKLVKFQSFSSTTACSSLPPPDLPRLAKTAQISLTPNEVEEIAPKIQQVIEWFGQLQGIDLESVEPSIRAGSL\n>UniRef90_UPI0015687092 helix-turn-helix domain-containing protein n=1 Tax=Ensifer adhaerens TaxID=106592 RepID=UPI0015687092\nMVDGIPSFFVYGEPEQPLEPGFFHVETVMARRGLHHGQVKAHKHDQLAQVTYWLRGRGSYFIEDKVLDFSAPAVSFVPSGIVHGFSVEPRESDAIVISIADGLMLSVRAQTALAIDVPVMIAGVSGDSQWQRLSQLMDIIADEYATAAFGTQSMMASLASAILTQIARLASFAPSPSQSPDMMLAMQLRRMIDAHFRENWTVGRYTDALGSTPHLLAKATGAAFGMQVKELINERRLLEAKRLLLFTIRPLEDIAYEIGFRDAAYFSRFFRLRTGVAPSDWRQLKLGQTASSP\n>UniRef90_A0A261KVG4 Transposase (Fragment) n=1 Tax=Hydrocoleum sp. CS-953 TaxID=1671698 RepID=A0A261KVG4_9CYAN\nMILYHFEKRILRPDCIILLSALAQVGHNSPDLIAYAFRSGLFRLPGGTSQTLPKEPVNYTLDQVGDSLKRLELATPKLKQSVVDACAYRTPKWIYKI\n>UniRef90_A0A2T5BQX3 Heme-degrading monooxygenase HmoA n=1 Tax=Rhodovulum imhoffii TaxID=365340 RepID=A0A2T5BQX3_9RHOB\nMPTISRSNEFQTVITTFEVTPGTCQDLLDALSEAYASFISRQPGFIGAGLHVNDAQTRIANYSQWVRREDFQAMLRSEEMRDRNRRFTELSKSFEPVMYDVFESYD\n>UniRef90_A0A1G9W8E7 Neutral/alkaline non-lysosomal ceramidase, N-terminal n=1 Tax=Daejeonella rubra TaxID=990371 RepID=A0A1G9W8E7_9SPHI\nMKKLFSCIIISVQIILLSERPAAQENSHSGWKAGVASVVITPEESLWMAGFAHRTKPSDGKLHELWAKALVIEDASGKQALLITTDLSGIPKSISDSIRNQLEKRFKFSRSQIIFNTSHTHSGPVLVDALWDLYPLDDTQKERITKYTKKFELQIESIVRKALGSMKPVNISSENGITRFAVNRRNNIENKIDAQTDLKGPSDYAVPVIRVSDQKGKILALAFGYACHNTVLHGYEWSGDYAGYAQITLEKAHPGATALFFQGCGGNQNALPRKTVPLATQYGKELALAVDAVLEGEMKILEPKLSTAYSEVKLELEKAPSKDELLTIVSKETGYIKNWALNMIKKADKGETFISSYPYPVQFWQLGNQSIVALGGEPVVDYAINLKKVFGPDLFVMGYSNDVMAYIPTAEILREGGYEGHTSQMAFGMPAKWKESIEPTIMREVMILAEQLGVKAKPKP\n>UniRef90_A0A5C5YMF9 Putative electron transport protein YccM n=1 Tax=Posidoniimonas polymericola TaxID=2528002 
RepID=A0A5C5YMF9_9BACT\nMTPLSSLAAILRRAASLEIVVLAFAFLFALATGVEGQEAYDRPVSSAPQPDDIGAGYQTPEVQRTSPRSAALQMLDVVLLIGGMAAIAWVSRRGRRRWVVTAVTLASLAYFGFYRQGCVCPIGATQNVAASLSDASLATPMVVLAFFLLPLAASLLAGRVFCGGVCPLGAIQDLVLLRPVQTPQGVDRWLGMFRYVYLGLAVWFAVLPAGQRDFVICRFDPFVGFFRLNGPAWMLGVGVALLLLGTVVGRPYCRYLCPYGGLISVVSRFAIWPVRITPDEELDCGLCVDSCPFGAIKDLRAKPSECLACARCFAHCPRQQLAWGEIELVELDELVSSAKCVAQRSGGNE\n>UniRef90_A0A1I0ZIW2 Enediyne biosynthesis thioesterase n=1 Tax=Amycolatopsis marina TaxID=490629 RepID=A0A1I0ZIW2_9PSEU\nMAYYEIRHIVGFEETNLVGNVYYVNYLRWQGRCREMFLKEKAPAVLEEVRADLKLFTLKVDCEFFAEITAFDELSIRMRLEELTQTQIQFTFEYVQLAEGRENLVARGRQRIACMRGPNTATVPARVPEELRTALAPYAEDVKGARTESAAVPATGV\n>UniRef90_UPI0013C30B07 phosphatase PAP2 family protein n=1 Tax=Euzebya tangerina TaxID=591198 RepID=UPI0013C30B07\nMVRQAFSRLPGAVALSRATTDLGSMFMVAGAAAMLLAGGRVRRAGEVAAAGALGWTVAHQAKKVFDRPRPYEAEATPRLIAEPTGSSMPSGHAAVAMATATVLAGRAGPGRRWVWLLMPAWVPLTRIHLGVHYPTDTMAGLILGHGLGRLVVAVSDHRSRRQPQDDGRVV\n>UniRef90_UPI001C0550E4 protein PRRC2C isoform X12 n=1 Tax=Corvus kubaryi TaxID=68294 
RepID=UPI001C0550E4\nMSEKSGQSTKAKDGKTKYATLSLFNTYKGKSLETQKTTVAARHGLQSLGKVAISRRMPPPANLPSLKAENKGNDPNVNIVPKDGTGWASKQEQHEEEKQPDVPQTQPKPAVPAPPEAAPVAKSWANTKPGGQEGPPIPINSYFQQEFPSLPAAGDQEKSGKDKDAPEDGSGPNLRPQNQDPKALGQEDASATPAEQNDGQKAGDKRDVRLPQVPQPKLNGQQQPPISSQYRAMMPPYMFNQYPRMAYPPSMQGPTRFPNSEPGRGPRGRGPPSWCSEPIERPSILSASELKELDKFDNLDAEADEGWAGAQSEVDYTEQLNFSDDDEQGSSQKEKESGDEQTPSKDSQSPDGQKETEEQTNAKSATQVSAAAAKGSYSKSSQLDQDRGPPQPSIHERGGPALPPKSILPPHPPPPDRQMGRQGPFPPKPVPDDDEIWKQRRRQQSEISAAVERARKRREEEERRMEEQRKAACAEKLKRLNEKFGCVTKPSREDPLKEREREREREREREREREREREKEREREREREKEREKEKEKEREREKEKEKEEKEKLEKAKEQEVEKEKEKEVEKEEKENEKEKEEEKPAHDVPEPVEPVATPVVEKQESETKNNKKEKEDQAVFTRQDSGRNEKEVSQVTHENEPDSGSQPRPAVSSGYSKQFQKSLPPRFQRQQEQMKQQQWQQQQQGVLPQSAPSQPSSGPVPPPQHRPLYQPMQPHPQHLASMGFDPRWLMMQSYMDPRMMSGRPAMDMPPIHPGIMPPKPLMRREQLEGSAAGSDSFEHMARSAREHTVPLSEPRMMWGSDPYPHAESQQSSSPPKVLEEPDDLRSEAHLEQERVAVPASAYPVEHNQLDSHPKTEFFRESGEVEVQKFPSRPLEDVQPLQTDTPNTAVNFEAVNEKVTRSSPELVPVGESHSSLKRSISHGSSHSLKSEDQRSETAANIPKLSNRPIEAKETIERLEIKPKKEILITNRTSEGPKPEKTFKPKSETRWGPRPGYGRRDEGGDRPVRRSGPIKKPVLRDMKEEREQREEREQRKEKEGEKTASEKPGKPEKSDKKEAPQVPLPQAEPERSTSSSAPLAKKITQDAAPVPASQESSQPEAAAKAVVQPPAPAVQQQLPAAQPAAAQLPPAIPQAPATQPAVQPPPHAQPPAPASKEEKQAEKVVSKEVVEKPRLETRPVKREPGLPPRTYWKEARDRDWFPDQGYRGRGRGEYYSRGRSYRGSYGGRGRGSRGHNREYPHYRDPKPRSEHVPSGPVRQREESETRSESSDFEVIPKRRRQHGSETDSDSEVHESASDTLLSDKDSIIKGKHPKREERADGKKPPKPLSFKPENNIRVDNRSLEKTYVRDDENKPKPGFLPKGEPSRRGRGGMYRRGGRDPGGRPPRPSTIRRPAYRDNQWNPRQTEIIKPEDGEPPRRNEHYGPIPIDKRPPKFERKFDPNRERPRRQRPARPPRQDKPPRFRRLKEREAASKMSEVVTSSTTSATVSNAVNEPSNPALDVSGSKTPDLSNQNSSDQANEEWETASESSDFNERRERDEKKTADAAAQVAAKAGENAGVPKREIAKRSFSSQRPGIDRQNRRGNNGPAKPGRNFSGPRSERRSGPPPRSGKRGPFEEQAAPVPGVDPANSNALHQEDGGVAAAGQKTTKDASGKKREEPKAGPKKPKEKVDALSQFDLNNYASVVIIDDHPEVTVVEDSQSNLNDDGFTEVVSKKQQKRLQDEERRKKEEQTVQVWTKKGSSEKGRGQNSKLPPRFAKKQQQAAAAAAQQAQAQPPCPAQSPAQPQAPVPTQSQAAGGTASTDYTVSGKVLQNTQAHNGLGAELWDNKVPPTAVLNDISKKLGPISPPQPPSVSAWNKPLTSFGSATSPEGTKPGQEGGVDLGIETIQFGAPASSGSDNEVGPVLSEKSTDKLPEPKEQRQKQPRAGPIKAQKLPDLSPVENKEYKPGPIGKERSLKNRKVKDAQQGEPEGQEKPSPTS
VRSPEPVTTKETKAASELSTEIGTMISVSAPEFGTNTKESVTDYTTPSSHPNTVATSSTKMEETLVTNVPLPHTLPLPRRETLQQSSSLTPVSPATVDLTLKMESARKAWENSPNMGEKSSPVTSAASPIAGGSSSSSTGPSSGTYSSFSSASMPPIPVASVTPTTSLSGAGTYTTSSLSTKTASTSDPPNICKVKPQQLQTSSLASASHFSQLSCMPSLIAQQQQSPQVYVSQSAAGTTAQIPAFYMDTSHLFNTQHARLAPPSLAQQQGFQPGLSQPASVQQIPIPIYAPLQGQHQAQLSLGAAPAVSQAQELFNSSLQPYRSQQAFMQSGLSQPSPVVLSGTALHNFPAVQHQELAKAQSSLAFQQTSNTQPIPILYEHQLGQASGLGGSQLIDTHILQARATLTQASNLYSGQVQQPGQSNFYNTAQSPSALQQVTVPLPGSQISLPNFGSTAQPLIALPQSLQPPLQHTPPQAQAQNLSRPAQVTQPFRGLIPAGTQHSMIAATGKISEMDLKAFGGGIDVKPGTPPVTGRSTTPTSSPFRASSTSPNNQSNKMNSIVYQKQFQSAAAAVRMTQPFPAQFAPQILSQPNLLPPLVRAPFTNTFPAPVQRLPVVLHSQMPSQMTTGLMSHPQLPRVARGPCGSVPGARGTQAQAALKAERDMKVSM\n>UniRef90_A0A1A2FR64 MPAB_Lcp_cat domain-containing protein n=1 Tax=Mycobacterium sp. 852002-51057_SCH5723018 TaxID=1834094 RepID=A0A1A2FR64_9MYCO\nMKGPATRIADLLNPAAVLLPAANVIMQLSLPGVGYGVLESPVDSGNVYKHPFKRARTTGTYLAVAAIGTESDRALIRGAVDVAHRQVRSTPSSPVSYNAFDPKLQLWVAGCLYRYFVDQHEFLHGPLDDYSAEAVYRDAKRLGTTLQVPERMWPPDRAAFDAYWKRSLDQLRIDPPVREHLHGVASMAFLPWPLRMLAGPFNLFATTGFLAPEFRAMMRLDWSRSQQRRFDWLLVALRLADRLIPHRAWLFSYRLYLWDMRSRARRGRRIA\n>UniRef90_A0A7C8PLT4 Uncharacterized protein n=1 Tax=Orbilia oligospora TaxID=2813651 RepID=A0A7C8PLT4_ORBOL\nMPTGRFREQFRRFIASEILAASIASGPPKDLSRLEMPKYPIQTRPPKMPSESTRAASTESATLVRIAEYVFDEKYSNQNKFN\n>UniRef90_R5PHK2 Glycosyltransferase group 1 family n=1 Tax=Prevotella sp. 
CAG:487 TaxID=1262928 RepID=R5PHK2_9BACT\nMAGRLALKTCALGYVSDDKRIAVIYNAADIYVLPSVEDNLPNTIMEAMACGVPCVGFRTGGIPEMIDHGKNGYVADFRKADDLAAGMHRLLCGDDYEAMSRAAVSKVHIHYSQQSVAMRYIEVYNETAAMKKYII\n>UniRef90_A0A067SRJ6 HET domain-containing protein n=2 Tax=Galerina marginata (strain CBS 339.88) TaxID=685588 RepID=A0A067SRJ6_GALM3\nMPAIKAAGIDNSRTLYDIVHGCCVTLFACTWLSIHPNICAPSDSDWTSRRRRLKTMLCALIVPELVLVWALRQRTGAKKIAEKQKEKKWTRYHGFFISMGGFNLFCDGKRIPLSPKRLEQLEECGWIAWPGISEREIKDKSKGDFLSKGIAVSQTLWFVVQCIARFEQGLAVTELELVTMAFVVLNVALYWAWWDKPLDVRCPVDVKIKEGITLPQVEDLFYRDDTRSDPPNRLQLPSFRILKLSTEEGIQPTYPDQTFFLRKFMTFIHPKGPHGCLHRMIISLARPFSDMLSSTEIPRGADCVPTFYAPSGDSRSDYSDEYSIALGLGFAILFGLSHCVGIWVNLSFPTEIEQDIWRVTAIAITAAPLAFQLLGGLVLALGSPEPERPWSGVFMYGCLVIWYLILIAYIFSRFVLLVLPLIAMRALPGSAFDDISWAKFLPHI\n>UniRef90_A0A8J4Y4H5 Neurofibromin n=1 Tax=Chionoecetes opilio TaxID=41210 RepID=A0A8J4Y4H5_CHIOP\nMCVCVTPSPVPSPVTRHRFCSHPDDKKRAKVAMILDKLITLTIEEVEMYPSIQAKIWGNIGQVSELIDMVLDSFIKRSVTGGLGSGQAEIMADTAVALASANVASVAKKVIGRLCRVIDKTCTSPTQTLEQHLMWDDIAILARYLLMLSFNNCLDVARHLPYLFHIITFLVTTGPVSMRASTHGLVINIIHSLCTCTKPTFLGKFVCFVAVFVCRFFRP\n>UniRef90_UPI0021698233 SPOR domain-containing protein n=1 Tax=Mucilaginibacter sp. X4EP1 TaxID=2723092 RepID=UPI0021698233\nMKNTASYLKTKIGWIGYCIFFVLFILPALSHAQTRGKVEVVKDPLIDTLIARRASLGKNVAVGDDATSGYRVQIFFGSNRQDAYSAQARFLGEYPDTRTYILYTEPNFKVQVGDFRTKLEAQKLQNDLRDKFTSLFIIQGKINPPKTDASND\n>UniRef90_A0A8T9PFL0 O-antigen ligase family protein n=1 Tax=Leucobacter sp. 
H25R-14 TaxID=2932245 RepID=A0A8T9PFL0_9MICO\nMAESKTRLGVSAYAICVFIFTLGSNGVRNLVGWPAFLALAVVLTGLGIVLFVRLKPERFRWYRLPAPIYWFLILAALSILWSQYRLESVLGVAAQLATTVLAVVVAFVLSWHEVLRTLGTALRYLIGLSFLFELWVALFVRAPLLPWWMEEPEGETPKLLYWSRDLLFSGGPIQGLVASSVLLGFLGLLGVIIFAIQLRAGLVRPFSGWCWLALSLLTILLTRGATVWVALAAVVVGLVVALWARRLGPERRVPLYVTSGALLAAVIALTLFARDTVFGLLGKSGDMTGRLETWQKVIELAEQRPWFGWGWISYWAPWAEPFASLDRKAGLQVMSAHNAWLDVWLQLGIVGLLAFAPIVVLTMWRTWFRAVDQPRRGHGPALPYATSSLWPFLVIIALLVQSLTESRLLIEGNWVLLILLAVKSRFDFQLPSLDAEPTRLPWRRVPIPQERLVPYKRDPRD\n>UniRef90_A0A1Q9V6M8 TetR family transcriptional regulator n=1 Tax=Saccharomonospora sp. CUA-673 TaxID=1904969 RepID=A0A1Q9V6M8_9PSEU\nMPKYVDHEGRRTEIVEATWRLIAERGIEEATMRAISESLDMANGALKYYFPDKNSIIRAAFEHVVAATNARVRERVGEATGLAALRAFCVEMAPLTELTKLEARVVLPFWQRALSDPDLERLHTDSVTLLRAHIVEFLQQARAEGTVRASTPDDVLADQLLAMLIGLQALALLDQDGTGEAAQLRMIDAFLDSLA\n>UniRef90_UPI0015550403 DUF3990 domain-containing protein n=1 Tax=Palleniella intestinalis TaxID=2736291 RepID=UPI0015550403\nMLVYHTSDVQLNIPDTVHSRGNLDFGRGFYTTRLKEQAIKYGERFVALGHDAYLHTFDYTPCSNLRIKTFDSYDEEWLRFVCSCRKGGTEYEQFDIIEGGVANDKVYRTVDFFMTGIYTLEQALQQLVYHKPNHQICFITRKAIDLCLRLSDCRKLNI\n>UniRef90_A0A2G2GAA8 CSD domain-containing protein n=1 Tax=Arcobacter sp. TaxID=1872629 RepID=A0A2G2GAA8_9PROT\nMKESKGFIMKGKLFNCSNGATSSEHCFVIADGGKHGYFVSSKKADGPLMNGACISFELEDQKKGSIVTDVHILD\n>UniRef90_UPI000314C431 metal ABC transporter permease n=1 Tax=Bartonella rattaustraliani TaxID=481139 RepID=UPI000314C431\nMYAFFLAPFIDFHFMQNALIGSILLSISACPVGVFLMLRGMSLTGDAISHAILPGVAAAFLFRGFSLISMTLGGLIAGFIVVLATALISRNSFQKEDASLTVFYLIALAAGVMIVSLKNSATDLLHFLFGSVLALDTQAIFLITTIMVITVCSLYILWRALLVESFDPFFFKSLSPLSKYVHLSLLGLVVLNLVGGFQSLGTLLSVGIMMIPAITARFWLSRLGPICILSILLGIIASICGLLLSFHLSLPSGPAIIIAAGSLYLFSCFISPRGFIVAWFPHLFYNYFLNLKK\n>UniRef90_UPI00210245CE peptidoglycan endopeptidase n=1 Tax=Sandaracinobacter sp. 
RS1-74 TaxID=2913411 RepID=UPI00210245CE\nMGGAFRPQGRGEEGLDCLGLALRALAAGGCRVDMPRLPMRGHSVEQVHGWLCAAGFARLEVEEASPGDLLLSFPATRQAHLAVRTAEGFVEANAQLRRVVERPWGGGGVWDSAWCIGAGAVKGRG\n>UniRef90_A0A2E9K2A4 AraC_E_bind domain-containing protein n=1 Tax=Alteromonadaceae bacterium TaxID=1916082 RepID=A0A2E9K2A4_9ALTE\nMVLVSKTTDSTAMNEPEPALVQFEGVKLAQLVHRGSPQTLMASVGAFIQWRKLNGSPPSQSRTFNIFYSDPLNTEPAAFTFGIAAEHSKDIAPNSQGVSEAHIPALHCLSWIETGSDGKLQQRIEQVIGEGGYDWHFEQFPPFIERLHFYPDVPMAEAISRVYLPVQAQ\n>UniRef90_A0A8T1N0L7 Fibronectin type-III domain-containing protein (Fragment) n=1 Tax=Clonorchis sinensis TaxID=79923 RepID=A0A8T1N0L7_CLOSI\nMSITLDRLDECSETWMGIFAINFAGDSPVSPLVKLISPSAPTAPNDVRFNVDRRTRKIHITWKDTSVCPTTNYTLSDVQKGWLVTTVNREAYLDFGVPCYHYQIHIKGANTGGQGPASDVIRFFTPHNFDAPTNVRVTTEPSVPDVEVSWLATGVCHSIQYMVTLYVAGVIVKTEVTESLNVILRDLEKCKPSSITVKKYTQWWSGDESGRTEFQIPGVPSAPKLIGATTEQNVPSATVSWTYDGACTSTDFLVTVYATAESVPEPVRASGLSTSIGGLPMCVDLVFGVVGRNQFGSGQETKSSPIRIDAVPSAPKLIEATTEQNVSSATVSWTYDGACTSTDFLVTVYTTAGSVPEPVRASGLSTSIGGLPMCVDLVFGVVGRNQFGSGQETKSSPIRIDAVPSAPKLIGATTEQNVPSATVSWTYDGACTSTDFLVTVYTTAGSVPEPVRASGLSTSIGGLP\n>UniRef90_A0A843CS01 PAS domain-containing protein (Fragment) n=1 Tax=Methanomicrobium sp. TaxID=2052684 RepID=A0A843CS01_9EURY\nMTVKEITKVLEEALMGNYSVRVNVDEAEDELKELAETVNTAIEFIIDSKRTCDNVSMMIQQNPYPMMLLDRNFMPIDVNAAYEKLMGYSKDQILTMLASDYKSRRISGDNTETLFTAGHNTETLVEIDFKDGRKLFVEQRGVPLRDSDGNVEMGLFVFKNVTNEVIEKEEITKQLEQIKVLQGRSEVIVQENPMPILLCDKNF\n>UniRef90_UPI0004174C5D hypothetical protein n=1 Tax=Mesorhizobium sp. 
WSM3224 TaxID=1040986 RepID=UPI0004174C5D\nMPFTVIWYGRSGIVDKMSFDAEKAARDYAMSMFQTRKGDDGIVAVEVRKDNGAVVFSHSEN\n>UniRef90_A0A1N6TYF1 Putative signal transducing protein n=2 Tax=Marinobacterium stanieri TaxID=49186 RepID=A0A1N6TYF1_9GAMM\nMLVTIARYTYPYEAQIARALLDSEGIDAFIADEQTINMQWLYSDALGGVRLQVAQEDVMRAQRILQDDRETPLVELEGEDRPACPVCGSRDTEYYQIGRRWAFLMFLAIDFPLFRVQDGIRCHSCGAISKQHSDAARH\n>UniRef90_A0A7Y4ZJH0 3-keto-5-aminohexanoate cleavage protein n=1 Tax=Polyangiaceae bacterium TaxID=2268199 RepID=A0A7Y4ZJH0_9DELT\nMSSHDAHYAGELVDGARMLALFGDLATELLIRIDGDEGLFRAYESVEFLAPVLAGDYIEASAELLTLGNTSRKMAFVAKKVVSNLRAHGVSPSAAEVLDEPLVVCRAIGTCVTPKSLQRRPKGLYMPGLPPGPEPEASPIVTPVSNDVILTAAIVGAEVTRAQTKYLPITPQEIADEAARCREAGAAVIHLHVRNDDGTSTQSKERYAEVLEAIAKKTDCIVQTTTGGAVGMPIEERAGPLACKPEMATLNCGTINFGDDVFVNSRPDIRKLAKLIREAGSIPELECYEVGHVEEALALFREEHIQAPLHFQFVLGVAGGIGAREENVHYLRSLVPPEATWGVAAVGRHQVPMTELAMRLGGHARVGLEDNIYLSKGVLSEGSAPLVARAAAFAREIGRTPADPTRARQLLGLTK\n>UniRef90_A0A0N5BVH2 Calponin-homology (CH) domain-containing protein n=1 Tax=Strongyloides papillosus TaxID=174720 RepID=A0A0N5BVH2_STREA\nMTDNRLTEIPQIIIEKMKLLETLILAKNVIKTLPTCMKGFNSLNYLDLSSNNLTTIPSAIYSLPLQILLLSNNKLDTVSGDIVQMAPTIQELDFSKNRITSITSNISLLKQLRKLNLRSNRLGALPSEMASLDLYSLDISANRLTHIPVEFCSMQSLIHLSILDNPLLSPPIEIVLKGREHIFKYLQSAISSDVDYRGNYTDWSTNRNSFINATIRRPKNAEKVAAKAKRFAALNSSDSGYTSTGDDQRHSYDMEFSRNSLASIDENHKKETIIINKEYNGCLNNDDEGVDLSHTPKDVRKLNLIEECNDVNNSNNNNNNDINMDSSIYTTLASVTVTDSTYIKPNNIVVKDKEPKNEENPDSVLESTSPTTSESHSPLSESMASLSSPDGENNSTLVIESPNVKDNSNILVPISSNESPPKASNNRTLKPPTKKSPPSKVQSKLSVPSQGKSTLLIKKEPTISKLMKPSITTAIPTPRISKLTPPKKSMSISSSRSTTPSTPISPSNDDDVELMKKLLGSKLLAVTKEDEISKQLSSGVLLCNFVNKLKPRTIPVVMASLSPSQPVPLPKAKKNAENYVNAAKKLGLSEVCFTIFIISSF\n>UniRef90_A0A1H1DUL9 Lipoprotein n=2 Tax=Pseudovibrio sp. 
Tun.PSC04-5.I4 TaxID=1798213 RepID=A0A1H1DUL9_9HYPH\nMVGTQVANTLLKNTGRALLLIGIGASLAGCGSIMSSDSDLEASSSEAPATERTFDLSVLQAPAMCPSLQELSGTTILAKYPRGKEKTPENLTFQAVITDWARTCKRVGKDSAMKLGIAGNITPGPAWKGGEIFLPIRVAVTNEVDDVEKTTYSKLFSVPVTLGAGSPSATWAFVEEGIILPNETGQNVVFGFDEN\n>UniRef90_UPI00097132DB hypothetical protein n=1 Tax=Herminiimonas arsenitoxidans TaxID=1809410 RepID=UPI00097132DB\nMKQVLNIFIVGSILLSSQPVFAQSTTTVEADSQSYSVSALTERYPANSIQSSTAASSALADVTKARSFIESRFAAGQRACYKEFFTNSCLAKVKEQKRADLAVIKPIEIEANAYTRHAKVAESDRRLAEKAAQSEGRATASTQNKTDAASGKSTEANDLTKDAQRKVRAENYAKKNADYAERQKLLRENEQADAKKRAENVERYEAKVRESEARQKEVAAKKAEKAREQANKQ\n>UniRef90_UPI000FD9191E proton-conducting transporter membrane subunit n=1 Tax=Rhodobacterales TaxID=204455 RepID=UPI000FD9191E\nMTTAFSLSFLAPVLLIAAALAAFRTPGRRPGAVPQISEVAALGALGLVALGLIQVIVAGPAVSSLFDGAGVLALRADPVSATLALLVAFIGWIVLRYSRTYLDGEAREGAFHGLMLVTLAAVLIFVMSGSLWLLVAATIATGLGLKRLLLFYADRPEARRAAAKFGLVWHGGDAALIAAALVLTSAHGTGDLSAIAASNGGAGIAGHMAAGLLVLAAILKTACFPLHGWLTEVMEAPTPVSALLHAGIINSGGVILIKTAPLVQTSPGAMAALVMIGGFTALFGAAVMLTQSAVKTSLAWSTVSQMGFMLLQCGLGLWALALLHIVAHSLYKAHAFLSSGGAVAAVAAIRKPGPVAVPDLGAVLKSFGLALLLYAAIAGLFSVAIGPKTAQALALGAILVFGVAYLVAQGLADTAPAELTRRTVAASLAATLAYFSFQAVAQWVWGADLPAAPAPGPLEWALIVLAVLSFGMVALAQSLFPLWAHHPATAGLRVHLANGLYLNALLDRAIGGFRTTKSS\n>UniRef90_A0A8J4S172 DNA ligase n=2 Tax=Phytophthora kernoviae TaxID=325452 
RepID=A0A8J4S172_9STRA\nMPAEDERAALRLSFGALCRVLEKLERTPKSDAKLRLLFSDALRAQLGGGDLYPLIRLVLPQLDRDRTYNLKEKMIAKIYIDVLGMASASKDAQKLEHFNDPNVIASKYVGDFAAVLYEVLLYRSLARDRQNERTLQDIIGLIDALEQADSSAMRKKVVMRLATEFSASEQKWIVRIVLKDLKVGLRHERVLNFLHPDAMKMYNHTNDLHKVCTDLRNSAVRYVPQLEPFRVFSPMVAKQVTFGECITAINADTFVMEPKLDGERITCHVQGKQVQFISRNGVNYTELYGTSMTPHVLSQLMPGVDCILDGEMMVWDNTEYQFREFGLLKNVANAMRNGDATNRWLCYTVWDVVYLGGSPKAESLIHEVFKGPREVSAVMGLPLHARRKLLLRILSPLDHRITIIEQTAVNAKSPKERHDIVMAEVDRQISNGGEGVIMKDLNAHYMCGESSRRAKKWLKLKPDYAGMTTDLDVLIIGGFYGTGRRRSGNVSAFLLGVLAQSVDENAAAETLKPGASCPMVYTFARVGTGYNLEELEQMRQELDPYWQPWDDNNIPPHLNGWKPQKYYLKPDLWIDPRHSKVLEVYGFELTYTTLYQTGLTIRFPRCKSIRNDKEWYQCINLQDLNAARGSLSIKRAGEIALGQKSTAKRAPKRQVLRARRAGGVLANYSQAALDGLEQECDVFEGKEFCVLPGKYDAPPPNSVSAIPSGILEEHAKHMSKQMVEKLLHSFGGSIVQNPIAESTNYVVAAGDAGFKVVNLKKQGHFNIVHISGSPPITAATGNDYGTSDRVQVEQLQPIVRKLRHQGLQEPPTVTKEWVEQSVEQRTQLPVEKFFVAM\n>UniRef90_A0A239J7H2 Amino acid ABC transporter substrate-binding protein, PAAT family n=2 Tax=Streptomyces TaxID=1883 RepID=A0A239J7H2_9ACTN\nMSERSSLSRRGFLSRTAAVGGLAAVPGLLAACSRTQAGTGAPTGDGDLLATLRKQGYVRVGFAGEAPYGYRDGNELAGEAPTLHGEIFTALGVPELRPTLTDFGALIPGLTADRFDVVSAGMAITPDRCRKVIFSEPEFVSPTALMVREGNPKGLSDLLSCAREKATVGVLSAAVEADYADAAGVPLTSVKSLAKQQDGVDALLADRIDAFALTGISLRWLARTNDGAAVEVLDPFLPVVGGRRQYSPGGAVFRPGATGLRDAFNKELGKITADPGRYTSLIGKYGFTKAEVPPATLRTAQLCKA\n>UniRef90_UPI001877F83B 2-oxo acid dehydrogenase subunit E2 n=1 Tax=Microbacterium sp. 
YJN-G TaxID=2763257 RepID=UPI001877F83B\nMIAEFRLPDLGEGLTEAEVVQWLVKPGDTVALNQTLAEVETAKAVVELPSPYEGTVSSLHADAGETVAVGAPLIAFDIGGDTPDSEPDGDEAATGEAADGGSAEKDAAPDAEKAQPNLVGYGAQPASSGRPARRVRRGGAGATATADAAVIEAAPHDALPPSAAEPAVGERPRSTPPVRAHAKRLGIDLVLVAAQVGDRVITRADVDAYAERVGAAAPVGTEQDAEMVPAAPPAPRGERAQTRIPIKGVRKHTAQAMVRSAFTAPHVTTFHTVDVTATMELIEQLRADRSLAEHRIGPLVVVARAVCLALGRNPSLNATWDEDAGEIIQNHFVDLGIAAATERGLIVPIIRDAERMSLPELADALQQLTQTVRAGKTGPADLAGGNFSITNIGVFGIDAGTPILPPGQSGILAVGAVRRQPWEHRGEIALRQVMTLSVSFDHRLVDGAEGARFLKDIADLLEQPGRAMLF\n>UniRef90_UPI0004BB0B65 T9SS type A sorting domain-containing protein n=1 Tax=Alkaliflexus imshenetskii TaxID=286730 RepID=UPI0004BB0B65\nMKLRLSLLAFLLVLAVDGMLGQQVWFFSEGTGATFYDQGIVDVANLGGSSFEYTHPPGLPQFNDKVPCSATAWSGSTSLKFNYTSAASGNWKATIYRSDWSVADITGMEFLGFYLYAGSGLPASALPKIGLVANRLGGGGDATSLLYDLSAHNDDVPADQWVEVKIPLSVFIEDGGNALLDFTRVKGVVFSQSEVNGVPRLLFIDDIKAFVSMDVVPPVSQLKAEGFDSHVELRWQQPLDFLSYRIYARYAGSEDYVQIAETDKDYYLHFVPQSARNTEISYKVEAFSQDKESDAVTIQATVRDFTDEELLDMFQRYTFRYFWEGAHQPSGMALERTNGDGRTVASGATGMGLMAMVVAYERAYEERAEIKTRILKILEFLENCERHKGAWAHWYNGDTYQTQPFSSLDDGGDLVETSFVAQALITLRNYFRDEDAQSVQIRQKATLLWEAIDWNWYRNGNQNVLYWHWSPNHGFAMNMKIQGWNESLITYVMAAASPTFGINKETYTQGWARNGSMVNPRTYYEHPISLSPNWGGPLFWIHYSHLGLNPKGLSDQYADYWQEHVNTAKIHHAYAVNNPLGHQNYSENNWGLTASDDPFGYTAHEPMNNDNGTISPTAALASMPFTPMESMKALKYFYRERGADLFGLYGPYDAFNDNMGWVQKSYIGIDQGPIVVMIENHRTGLLWKHFMADAEVQAGLDKLGFSYQATSAAPGLEHSELINLFPNPAVDNVSIELPHHLVGRQIAVAIYATDGSQVYSSVFESSETIYTINCSAVQNGFYLLKMVSGSRVYRAKLIIRK\n>UniRef90_A0A6I9VL36 secernin-1 n=6 Tax=Bactrocera TaxID=27456 RepID=A0A6I9VL36_BACDO\nMSATGDCFIVQSPNTAENTIIFGRNALDADALTEAQEVQYYNANVALEGKPDGGADVVKANGEILRMILQKTQTGIWGGDVGANDHNVCIAVSWSAEEPANDSDTLRSTDIVRLTLAIAKTAVDAVERIGNLVANHGSDNAKFSFVVCDTKEVWLVSSGAKLWAAHQVADGFLRLTNKGLSVKTAIDKSTDDLGDALKTLGLWDGEGDLNFASCFDAAETAEAEWSGEAPNGDGSYTLTSMFDTLRSAADSATSRSASVSVLTNGISCHWFTATPNASESVFKPFVFAPNPKISPLTKVPPDNTHTLLHKLHAQRKPNAVEDLKALEAACVEELNAYLAEHPNADEELDELMKDCVEAEVKFYR\n>UniRef90_A0A2Z5ZAZ3 Uncharacterized protein n=1 Tax=Nitzschia sp. 
PL1-4 TaxID=2083272 RepID=A0A2Z5ZAZ3_9STRA\nMIYINFNILLNFFLILYIFFIYTLQVIRPEIVTDTDVMLMSLLVLYNWVLVIQGWKFDPIMLFSQYILILLILTLEWENIRLRGFILILKKIINNK\n>UniRef90_UPI001BB17932 GATOR complex protein DEPDC5 isoform X7 n=1 Tax=Microtus oregoni TaxID=111838 RepID=UPI001BB17932\nMRTTKVYKLVIHKKGFGGSDDELVVNPKVFPHIKLGDIVEIAHPNDEYSPLLLQVKSLKEDLQKETISVDQTVTQVFRLRPYQDVYVNVVDPKDVTLDLVELTFKDQYIGRGDMWRLKKSLVSTCAYITQKVEFAGIRAQAGELWVKNEKVMCGYISEETRVVFRSTSAMVYIFIQMSCEMWDFDIYGDLYFEKAVNGFLADLFTKWKEKNCSHEVTVVLFSRTFYDAKSIDEFPEINRASIQQDHKGRFYEDFYKVVAQNERREEWTSLLVTIKKLFIQYPVLVRLEQAGGFPQGDNSTSAQGNYLEAINLSFNVFDKHYINRNFDRTGQMSVVITPGVGVFEVDRLLMILTKQRMIDNGIGVDLVCMGEQPLHAVPLFKLHNRSVPRDSRLGDDYNIPHWINHSFYTSKSQLFCNSFTPRIKLAGKKPTSEKTKNGRDTSLGTPKESENTLPIQVDYDAYDAQVFRLPGPSRAQRLATCRSVREQENHNRKSASSCDVSSSPSLPSRALPTEEVRSQASDDSSLGKSTNILMIPNPHLHQYEVSSSLGYTSTRDVLENMIEPPQRDSSAPGRFHVGSAESMLHVRPGGYTPQRALINPFAPSRMPMKLTSNRRRWMHTFPVGPSGEAIQIHHQTRQNMAELQGSRQRDPTHSSAELLELAYHEAAGRHSTSRHPGDSMSLNFGATEELSASLLSNSGAGLNPRTQNKDSPEDGVSTSPDPMPGFCCTVGVDWKSLTTPACLPLTTDYFPDRQGLQNDYTEGCYDLLPEADMDRRDEEGVQMTAQQVFEEFICQRLMQGYQIIVQPKAQKPSTTVPPPLSSSPLYSRGLVSRNRPEEEGQYWLSMGRTFHKVTLKDKMITVTRYLPKYPYESAQIHYTYSLCPSHSDSEFVSCWVEFCHERLEEYKWNYLDQYICSAGSEDFSLIESLKFWRTRFLLLPACVTATKRITEGEVHCDIYGDRPRADEDEWQLLDGFIRFVEGLNRIRRRHRSDRMIRKGTAMKGLQMTGPISAHSLESTGPPVGKKGTSALSALLEMEASQKCLGEQQATVHGKSSTQAAESSSVAMTPTYVDSPRKDGAFFMEFVRSPRTASSAFYPQASVDQTAALVSDSASLGVSTCQSLDRGSNQTLGNSQNIGEQAFPSANSDCSAQQHAASSLTSSSTLVEILEAMKHPSTGVQLLSEQKGLAPCCFISAEVVHWLMNNVEGVQTQAMAIDIMQKMLEEQLITHASGEAWRTFIYGFYFYKIVMDKEPDRVAMQQPTAPWHTTGVDDFASFQRKWFEVAFVAEELVHSEIPAFLLPWLPSRPASYASRHSSFSRSFGGRSQAAALLAATVPEQRTVTLDVDVNNRTDRLEWCSCYYHGNFSLNAAFEIKLHWMAVTATVLFEMVQGWHRKATSCGFLLVPVLEGPFALPSYLYGDPLRAQLFIPLNLSCLLKDGSEHLFDSFEPETYWDRMHLFQEAIAHRFGFVQDKYSASAFNFPAENKPQYIHVTGTVFLQLPYSKRKFSGQQRRRRNSTSSTNQNMFCEERVGYNWAYNTMLTKTWRSSATGDEKFADRLLKDFTDFCINRDNRLVMFWTNCLEKMHASAP\n>UniRef90_A0A317JBS3 DUF2959 domain-containing protein n=1 Tax=Chlamydiae bacterium TaxID=2081524 
RepID=A0A317JBS3_9BACT\nMSLKEECKQLSDLFHRAAEGQSIDLQQVFAQSLQFFERLKVELKEEDPQRRQEAMAMLMEIYQHMIKDTKLICETSGMTEEQLVSFAENPTNFSPEQWASIQESREKISHAGQDLAKALEQLSSSQGEKKPHDPTKKSKKSDWMRS\n>UniRef90_A0A8J7MXB5 Tripartite tricarboxylate transporter substrate binding protein n=1 Tax=Candidatus Odyssella sp. TaxID=2589116 RepID=A0A8J7MXB5_9PROT\nMAAVAVAASALAVSTVAQAAWPERPVTIIVPAGAGGGTDATARLLAKQLQDELRQPFNVVNQGQASGLVGHTNISQARPDGYTLGIIYPYYQFNLSGQSQLDHSSFTPIALYNMDPSALSVAANSQFRTAQEALAFIRANPGRVRMSCGGSCGGSWDLPLAGLLVRLGIDPRTVVMVPSGGAAPGLQELVSGGVEMIACSLPEAAALISANRVRPLMVLASERAGNFPDVPTAREATGQDHTGGAWRAVAGPPGLPPEVVATMERTLERIWRSDEFQNAMRQRGFGLRWANSRDTAAFLLQHEREWTDGMTALGMVRRAPR\n>UniRef90_A0A661CEU1 Ferredoxin (Fragment) n=1 Tax=Gammaproteobacteria bacterium TaxID=1913989 RepID=A0A661CEU1_9GAMM\nTQVTLYNTEQLLASDRQTQGLISQQTQQFAQIAEQRSQSDSGGGFGGFLKGLVSVAANVFLPGSGVIAGALVGVVSDVVQGKDLDEALIGGAKDIVGEHCPPCAPAMDVAEGLVQGKEPGDILLNVAKNQLGNYCPECTPFVDVADGLLTGEDPLTTLEHFAKSQLGDACPECVQVWDTAKGIAQGVPPEQLITDLVGHQIGQQCPDCMPAVQAIQGVVAGQPIETVLQNSIGTQLKTYCPECAPVVDIAQQVVAGESLDHILGQAATQALSQSCPECLPAVAVVRSLANGQSPITVLKQALAEPLQTACPSCGTLFEVAEDLAAGKDITDTLTTAAQNQVATVCPECVPAWQTAEKMLQGDDPKTVISALVTDKITEHCPDCAPTLDMVQQIAQGKNPLELVVETTQRQLAKDCPECGEVLQTIIPIAQQAAFDTKQKVLAHLQSQRYNAGFSKEISETLNVSKELMETLQNFL\n>UniRef90_A0A2N0DCP7 TPR_REGION domain-containing protein n=2 Tax=Rhizobium sullae TaxID=50338 RepID=A0A2N0DCP7_RHISU\nMRTRPDQLDENILTLFNRACRQSRWEVAEHLLRALEASSDEGDGCEPPCVRSPLTDAYLSIASLHSKQ\n>UniRef90_A0A819ZRA3 G_PROTEIN_RECEP_F1_2 domain-containing protein (Fragment) n=1 Tax=Adineta steineri TaxID=433720 RepID=A0A819ZRA3_9BILA\nMPLNIVQLDLIGRYLNIYLGSFMLIAGLLGSCINLWLFTRHRFRKSSCSRFVIASSLFDILHLIVALFLRVLADGFGKDPASSSVIGCR\n>UniRef90_A0A533XQ95 DUF3108 domain-containing protein n=1 Tax=Nitrospirae bacterium TaxID=2026887 
RepID=A0A533XQ95_9BACT\nMKRVFSQTPSMIRLVGFILTMLLMVGGFMEASGTAEESDQKADAIPAGDYVLYDQVVTRKFLTSATQLVVIDRMTRLRLSPDQEGPTTIDTFQEQGYFDGELPADLVREFSAVNRQPSRLEGRFHFGVGYRFATGDTIEEPEVSLARPVTVARARPVQAPSVLDRLAFSRVARSLLNDDALLYVEALRPDGTGAGFLVWFRRQGGSLTLFDTEVAWAIQAQVEPEEGPLLAP\n>UniRef90_A0A7C1TM52 OmpA family protein n=1 Tax=Gammaproteobacteria bacterium TaxID=1913989 RepID=A0A7C1TM52_9GAMM\nMHARTRFVVLFLGAMLAVSGCATDEYGRPREMTDTEKGAIIGAATGALLGLATRREAKYGVLYGIVGGVAGGAVGAYMDKQKKDFEKQLAPELDRGVIYMEKLPQNRLLVGMTAATAFEVDSTRIKPGFNPVLDKIARILNKYGKTHLTIIGHTDSTGSRAYNQKLSERRAEAVKQALLARNVIPERITTAGAGEDHPRASNATPEGRRKNRRVEIIIEPIVEPEG\n>UniRef90_UPI0005283947 DNA polymerase III subunit gamma/tau n=1 Tax=Bordetella bronchiseptica TaxID=518 RepID=UPI0005283947\nMTYLVLARKWRPRSFDTLIGQDHVVRALTHALDTQRLHHAWLFTGTRGVGKTTLSRILAKSLNCENGITSKPCGQCRACTEIDAGRFVDYLELDAASNRGVEEMTQLLEQAVYAPGAGRFKVYMIDEVHMLTGHAFNAMLKTLEEPPPHVKFILATTDPQKIPVTVLSRCLQFNLKQMPPDAIVGHLQAVLGEEQIGFEVPALRLIGQAAGGSMRDALSLTDQAIAYSAGNLSEEAVRGMLGTIDQRHLVRLLDALASGDAAGVLAVADELAVRGLSYAGALADLAVLLSRVAIEQRVRGALPQDDPLTEDITRLAAALHPDAVQLFYSVAVHSRGELTLSPDEYAGFVMACLRMLALNGEAGPATAVQAPRADTTPRAAAPAAAAPAETRPEPTPAPALAPQAAAAPRAVARSESKPQPAPEPEPAPRPAATPVAATPPAVAEPEPVAAPAVQARAAEPEPAPAPVPPWEDLPEAVAAPAPAQPAAAPAPVAADDDGPPAWVDEAIPDEAGGGFVPEHSFTADPDDEFETLAPAAAAMPAPRAPTPRRESGGRGRAARSRLADMSPTGWPELAARLPVTGLAAELARQSEWAGVQGDAVLLRVAVRTLAESESRVRLQTVLCEHFGQGLRLEIEVGVTGDGTAHAVAQIERAARQQAAEDAVAVDPFVQALVADFGGRVVPGSIRHVDNPPAA\n>UniRef90_A0A0B1P2W7 Putative rna binding protein n=1 Tax=Uncinula necator TaxID=52586 
RepID=A0A0B1P2W7_UNCNE\nMGEKTSSRNHQSRKERKAKKRAVENSIPDIPTPELELEPEPVSLATKSAEEVKQLQLDNSLNANEPQGNKRKRNKDGNGESGDNDEEEIDKKKKSKKRNKNLSNKEAKFCEVLKNSVSEATRENINYKNNGEEQRYSPLVKDEGKKKEKKKDSKTKKSNSIIATNNTEEGSSPLLDQEKSSSQKSSKKERKTAKLNVVALKHDHLQNGKNSDDHSGNENMDISKEGLKDSTSTIVTTTTITPPTTTTTSVDEKISKKKKHKKKNSQDPDQSIPKSTSTIIQNTNLPSKRSIKKTSENLVEKVSSSPPRGKSRFIVFVGNLPYTATKDSIMSHFSKLKPLSVRHLTKKEDSSKSRGIAFVEFENFDTHKTALKIMHHSIFDDGKSEPRMINVELTAGGGGNTEDRKTKIKVKNEKLNEERIRRVEEDKAKLKKEEEKKSGLGKESSLKDDQNSSESHIHPSRRRMITA\n>UniRef90_UPI001E8E8CDE uncharacterized protein n=1 Tax=Fusarium flagelliforme TaxID=2675880 RepID=UPI001E8E8CDE\nMDGPSHSTLPLNPVSVFFSKSSQPALFWSEFPSWASLSLPSLLFSPLFCFALHCASILESWSCVASITFVTSSAPTSTLIPQLHQPPSKRLINFCFTSQRKEDQDFTTSASYYTPSRPRHTASRVPLVVQPHLAVATRLIVLHNDETDFSTTPSETLSLPQYRKTVIVRVRTAEHSEAC\n>UniRef90_A0A369W8G8 Formate dehydrogenase subunit gamma n=1 Tax=Pelagibacterium lacus TaxID=2282655 RepID=A0A369W8G8_9HYPH\nMALQDPGPDAAAQTRNIIADMTHLEGPLLPMLHAVQAAFGHVPQEALPVIADTLNISNAEIHGVVSFYHDFRRAPAGRHVLKLCRAEACQSMGSEAVAAKLTALLGVRSGETSPDQAVTIEPVYCLGLCSCAPAALLDGEPIGRLDDERIVAIVERVRP\n>UniRef90_A0A7I8XJZ7 (pine wood nematode) hypothetical protein n=1 Tax=Bursaphelenchus xylophilus TaxID=6326 RepID=A0A7I8XJZ7_BURXY\nMEDGVEEKAWSVVWYGNMHKGFDLTHFGMGFIHLNLKFAVTVDAPEYDAIPTAHLAFHTSQMSMAGAVAS\n>UniRef90_A0A6M4IS34 M42 family metallopeptidase n=1 Tax=Gemmatimonas groenlandica TaxID=2732249 RepID=A0A6M4IS34_9BACT\nMLSESSVAFLKRLLDTPGPSGFEGAPARVWRAEAATFSTVKADVVGNSLATVEGSGGPTILLAGHIDEIGVIVTYIDENGYIYFEPIGGWDPQVLVGQRMRFLGRNGDVFGVIGKKPIHLMKPEEREKASKITDLWVDIGVKNKAEAMEHLEIGDAGVIDARVMEMPNNRIVSRAIDDRIGAFVVLEALRRYAAKPGAARVIAAATAQEEIGYAGGGARVAAQQLDAKMAIAVDVTFATDHPGVEKKELGEHNVGGGPVLTRGSIVHPVVFRLLADTAKKLEIPYSVHAAGRFTSTDADGIHLTRDGVATALLSIPNRYMHSPNELVSLDDLDRAADLIAEACRAVTSETDFTAR\n>UniRef90_A0A836I9D3 60S ribosomal protein L22 n=18 Tax=Leishmaniinae TaxID=1286322 
RepID=A0A836I9D3_9TRYP\nMVAVRAKVGSRSHIRQKQLAKGKKVFKIDCSIPAADGIFSEDVLGNFEQFFQDNTKLNGRKGKLTEKVRLTMKDNVLIITTTMVYRKKYFKYLTKKFLKKKDLRDWIRILSTGKGTYQLKYFNIQDQEE\n>UniRef90_A0A8S9ZRV0 Leo1-like protein n=1 Tax=Meloidogyne graminicola TaxID=189291 RepID=A0A8S9ZRV0_9BILA\nMDMENFENGKIIPSQIRNFTVKDFGNSNEAKIELSKPHEELSIHGGRNLFIGNSSGSSSNKNRSRKRNDDNESNEPENCDELPPRQQRRNDGSSESDN\n>UniRef90_Q8GPG3 Dimethylsulfide dehydrogenase subunit beta n=5 Tax=Rhodovulum sulfidophilum TaxID=35806 RepID=DDHB_RHOSU\nMVKRQISMVLDLNKCIGCQTCTSACKLQWTNRNGREYMYWNNVETHPGPGYPRNYEHSGGGFDEEGALKIGITPSAEDYGIPWEYNYEEALMTGTDPWLRPNVKPTWGANWNEDEGRGEYPNSYYFYLPRICNHCANPGCLAACARNAIYKRQEDGIVLVDQERCRGYRYCITACPYKKVYFNEQISKAEKCIFCYPRIEKGLPTACAKQCVGRIRFIGYLDDEAGPVHLLVERYKVAIPLHPEWGTKPSVFYVPPLAPPRIGDDGEPTEETRVPLAYLKELFGEAVVPALETLKTERAKKQSGAESELMDTLIGYRHPEMFKLS\n>UniRef90_A0A3N6CGQ7 ABC transmembrane type-1 domain-containing protein n=46 Tax=Paenibacillus TaxID=44249 RepID=A0A3N6CGQ7_9BACL\nMGKSFDLSLVLDFIPELLRYLHITLIVLGGSIVLGLVGGVLLAIPRLYRIPVLSQLATLYVSFMRGTPILIKLFLVYYGLPELLKPIGIDLSRTDPLLFVIVTYALSDAASFAEIFRGAVRSVDKGQTEAAYAAGMTTFQSFRRIVVPQALIVAFPNMANTLIGSLKDTSLAFSIGVMDMVGRGQTLISATSHALEVYISLSVVYYVIVIVLEKGFAFAERRLQRHERKRVVHKPAIRAKRLKEVVQKVRF\n>UniRef90_A0A1F8MA83 Ovule protein n=1 Tax=Chloroflexi bacterium RBG_13_51_36 TaxID=1797625 RepID=A0A1F8MA83_9CHLR\nMGNEVGNKAEKNGESSTNQADNKVNQSLGLKYLETDQKRNLGLAGTNLEATQKLPPKHVETNLETDLETNRKLTRKPDPKLTQVDSNPDICGN\n>UniRef90_A0A285JE01 Two component transcriptional regulator, LuxR family n=2 Tax=Arsukibacterium TaxID=336830 RepID=A0A285JE01_9GAMM\nMHKVLLVDDQKLIRDGIKSLLGLSGKVVVVGECVDGSGVLTACSQLQPDVILLDLSMPVMNGVQTLASLKQAGVSTPVLILTTFDEHELVLKSISYGARGFLLKDVSLETLVQAIATLADGGSWFAPNITERLLGSIRQTSDAGFSMPAQLEPLSDKELEILQLMAAGYSNKEIAAALYKSEGTVKNQCSAILAKLGVRDRTRAVLLALELGLIN\n>UniRef90_UPI0008F89955 permease n=1 Tax=Haloprofundus marisrubri TaxID=1514971 
RepID=UPI0008F89955\nMSVVDQLVSAAELVIGMTWETWWALVLGFTLSGAVEAFVSEERMTDLLGDDGWREATLGTAFGAASSSCSYSAVGTARTLFKKGASGVAALAAFMFASTDLVFELGLVMWVLLGWQFVLGEYVGGLVAVVVMVAIFRYVVPQSWFDHARERVRENDDEECAACGMDADGDEAVYADAFPDAVFCCEGCLTAYENRTDAAGETSLRERVFSVAGWKSAASATTKDWEMLWDDIAIGFLIAGVVGAFVPTTWWTALFGADGSLEAVAVNVVIGVVIGILTFMCSVGNVPFALVLWTNGLPFGGILAFIYGDLLIPPLVNLYRKYYGWRLAAALSLSLFVSAVVAGVVVHTLFDGLGLIPTQGTVGGTLSGEYTTVLNLALTPVFLAQVYVTFGRDGVERRLAAGAAKLLRLAEWVVGTVAVLGTATGVVAGVVDAFGDVLHDAGDRARESVRHARVRALRRVRGREMPSPGTADATAEQTESDE\n>UniRef90_A0A251SHM8 Ovule protein n=1 Tax=Helianthus annuus TaxID=4232 RepID=A0A251SHM8_HELAN\nMNLRTCNKVDTVLRMHLLMNHITRRSNRIWVMGYTGMKVDTEVTVDTVVMVDTGVKVVTVYTIDLGMKLDTVDTKNMVDMVMSPVTHHFMNHLPRAIHFK\n>UniRef90_A0A081IBZ0 THO complex subunit 2 n=10 Tax=Plasmodium (Vinckeia) TaxID=418101 RepID=A0A081IBZ0_PLAVN\nMSLNFSDDDIYENKGDEIPYENNLNEDIENNEVNFNGDPYGDEYADEFERNANIEEEEQKEKKKKKTITFQLKNLFNETALKQINSDINKKRKNEKRNSYNDDYSNMMDQDEFEEQYSDNDELKKYVQDEKNKIKQLVDEKDELWDMYIYLNLKKKKRKIDYTEERYTSAIKKVLDSFCSEYKNMVIENLFKNKIFEKYLIVSDIDIFFKNNNIENVYKNTTTPVINKKNSLLEIKKRLVDIYNKGNCFNYLKEVSVDNRTRLNGVAEDEYGFENDESINEDKNEYMFNDNSKRGELDTNFIIEREKINLKINKLEHKYIKLIQTVKQYKRKHLRTNFNLFMNLINEVTSKLYFSIHNVLLMNDGENNLADIYKTIRRKYNIHDVLNKVQNLTQKKEVYEHYRSYLIYKYKSTYPICNNTFKNHQMEENINIFNFKKTYNTKFTNNFSLLQDENDLGDEHFNKVENSTSANKTDINANNNMNTNNKKVEENIFAQDIYEEDFFNIDTQNKESDIKTDSWEDREKNNETHPNTNSFASTKQDTQNKLNTPNEPTTIEETPLERAKRIAREKKKKLMESQAKIL\n>UniRef90_UPI001C2DB369 hypothetical protein n=1 Tax=Catellatospora tritici TaxID=2851566 RepID=UPI001C2DB369\nMSEQNIADAQIVVKSDMGRNHELEFDYDIVVVAGERGRQLAAAQAESILEILEPFGPPAEPSDRPGPEPDETSSRAELM\n>UniRef90_A0A1V6QLK6 FAA_hydrolase domain-containing protein n=2 Tax=Penicillium TaxID=5073 
RepID=A0A1V6QLK6_9EURO\nMSSINIPWTRLVRYSSSADGPVKYGEPVASPNADLGQLANEGKLQVKQLSGSDPFSLQTTDVTEGVFCLYGPLAPKDVPIIRCIGLNYKTHILETGRPLPTCPTIFTKPGPAVADHDSPVPIPTIAQEQCDYEGELVIVIGRDGKNISEADALDYVAAYTAGNDVSARDWQREAGKAGPVPQWGFSKSFDKYAPLGPCLVRQDQLNEANNLSLRTLVNGEVRQDSHTSDLCFGVRKLVAFCSQGQTLQKGSLIMTGTPGGVGLFMKPPNFLKDGDEVSVEIENIGTLRNIMKFEE\n>UniRef90_A0A0C2I283 TPR_REGION domain-containing protein n=1 Tax=Pseudomonas batumici TaxID=226910 RepID=A0A0C2I283_9PSED\nMSTRNWPRHLLCLSLSLPLGSALACGPDFPLRLLEDRAQSLADLPETNFQFEVNRLGEAVAGLKPATEATLTPYWDSDDNTKPYREQRDKVEASELPENLRAEVARLRNLADPQQVETEGASLPAELRLYIAGAVAFQSGDAQRAVDYFRQVLALPADQRKLRSTWAAYSLGRALVALSAQAEAGVDTPADSAAPVVTSPELQAQARLAFQQTRALSAGDFSDPLELGIASLGEEARLARFDNDWNRAIALYASQSRLGSNSGYTSLKQVAGELARLPDDELGALLKEKNVQALLTAYVLSRVGGFFDEQPEADQRLSRMVLASVAGSLDNADRLAALSYQKGDYAGAKAFVGHAGDGGLAWWVRAKLALRDGDKVQAAAAYAKAAKAFPKDEVWGPRRAPDWSFESIQPGCRVQGESAILALDRGDYLQAFDQLYRSQDIYWLDAATVAERVLTLDELKTYVDAHVPAPPAAKPEDKDNYVRRPVAAQLRELLGRRLLREGRYDEAPKYFDSPELQATARDYGRDRQQAVSRWTATGRAESLFAAATLARKSGMEILGYEMAPDYRALDGYYSLGAAELKPGPFLETAEVQRQQASVAKPDRRYHYRWVAADLANQAADQLPHSSQAFAAVLCKAANWVAGSDEEIQYYQRYVEQGPYVSWAANFGRQCQAPDFDQANRRYLTQPLNSVRSALRPYKVALVVGGLALFGGLAALWVRRRKAKL\n>UniRef90_UPI001EF2088A response regulator n=1 Tax=Actinoplanes cyaneus TaxID=52696 RepID=UPI001EF2088A\nMAEDDPDIREISLLLMRRAGHRVISAEDGAQGWRAVLFHDPDLVISDVDMPEMDGLELCAKIRGNPATELTPIIFISGVLMPDDDRVITAGATALLHKPFTAAEMLSCVNASLAAGAKAGRDTK\n>UniRef90_A0A7Y2JY00 TetR/AcrR family transcriptional regulator n=1 Tax=Massilia aromaticivorans TaxID=2725995 RepID=A0A7Y2JY00_9BURK\nMRQKTEAKRQAILAAAGAVFREHGFETSSVSDIAARVGGSKATIYSYFPSKEALLMEVILSAAETRSVTVFSEVLALGDVVTGLRRIGEAHLSFISTAEAVALARLAITAGERSTLGREFYTRGPLVMIENLAAFLAASIARDELRPGDPRQMAESLKALYEAGIVERHLLGDLKGLEGVDLAVHAAQAVDIFLAYYGKA\n>UniRef90_A0A1R3UIW8 Inner membrane protein n=2 Tax=Nocardiopsis TaxID=2013 RepID=A0A1R3UIW8_9ACTN\nMNFNSLSALAFRVVAVFEAFTWVGLLVGMYFKYLGNGSELGVQIFGPLHGGAFVAYGLVALLAAYRFRWGAWPTLVALAASVPPLGTLLADWWLHRTGRLDPERAETVRTPEPVA\n>UniRef90_A0A222G883 Uncharacterized 
protein n=1 Tax=Cognaticolwellia beringensis TaxID=1967665 RepID=A0A222G883_9GAMM\nMEANKLARLSCLFEKAVANNAKLLEKHELDELYNEFINDGRDHIKNTVVAFPKGLRRTAS\n>UniRef90_UPI00190B6181 septal ring lytic transglycosylase RlpA family protein n=1 Tax=Paraburkholderia TaxID=1822464 RepID=UPI00190B6181\nMSNGQELVTSAPVTPRLIEGSPPMLVAGAENRLDAETPPLPYNHGHVAHFWQSGLASWYGKVFHGRRTASGEQYDMYALTAAHRTLPLGSYVRVTALRDARSVVVRINDRGPYARGRVIDLSYVAAAALGLSRTGTMRVRIESVGKQDSQRVALDCKCTEVETGG\n>UniRef90_A0A148KMI4 Alginate lyase n=2 Tax=Paraglaciecola hydrolytica TaxID=1799789 RepID=A0A148KMI4_9ALTE\nMLLTPCSYSATDTHQNTLPASHSALAEGELLGDFTKLDPSKKPSENFDLEDWSLTLPTDLNKDKKADMIYEKPLSSGFELKPLFYTADDGGMVFACPNVGAKTSNNTKYARTELREMLRRGDTHIKSQGITGNNWVFSSAHGSDRRNAGAVEGSLEATLAVNRVSTTGDEKMLGRVIIGQIHATDDEPIRLYYRKLPNNNKGSVYFAHEINGGDDVWLDLIGSRSHTLADPEDGIELDEKFSYKITVENDILFVTLVRQGKTNITQSLDMSQSGYNKSNQYMYFKAGVYNQNNSGDPKDYVQATFYHLDNQH\n>UniRef90_Q90X71 carbonyl reductase (NADPH) n=2 Tax=Anguilla TaxID=7935 RepID=Q90X71_ANGJA\nMSTNKVALVTGSNKGIGFAVVRALCKEFPGDVYLSARDVDRGTAAVENLKTEGLNPFFHQLDITDPASVRHARDFFKEKYGGLDVLVNNAGIAFKVADSTPFGIQAEVTLRTNFLATRDLCNEFLPIIKPGGRVVNVSSGMSSIALKSCSSELQARFRSNDITEEELVMLMEKFVQEAQKGEHTHKGWPNTAYGVSKIGVTVLSRIQARRLREERAGDQILLNACCPGWVRTDMAGPNATKSPDEGAVTPVYLALLPVGATEPQGQFVSEKQVQVW\n>UniRef90_A0A5M9QSU3 DUF4134 domain-containing protein n=5 Tax=Lactococcus TaxID=1357 RepID=A0A5M9QSU3_9LACT\nMKKNKIILGISLVGFIASMFLPSFQGIDIKVFDYTKMNYFELVKEKWWIYVLLLIILVLIRTLSIEKSKILSSIFVSGFIFFKLSLLSLENGHLFINGYPVLWGYAVATLFGLLVSFSLLIDTYKDRG\n>UniRef90_UPI00146DA424 glycosyltransferase n=1 Tax=Flavobacterium silvaticum TaxID=1852020 RepID=UPI00146DA424\nMKTITVFTPTYNRAHCLTILYDSLLRQTSDDFEWLVIDDGSVDETKQLVQGWIDEGRIPITYKYKENGGMHTGHNTAYAMISTELNVCIDSDDYLPDDGIEKMITLWRRDGSNKYAGMIGLDVTIKGAVIGTQFPEGLKECTYSELAPRYKVVADKKLVYRTEVVKKYEPYPVFPDERFVPLYFPIVIDRDYKVLCYNEVFCIVDYQPDGSTIGIFKSYFRNPKGFAHSRKIEMIYDPFWKRKVKSAMHYVANAIMTKNANFLSESPKKLLTFLSIPGGVALYLYLNRKKNQDRDISKGYKR\n>UniRef90_Q9AAQ7 TonB-dependent receptor n=4 Tax=Caulobacter vibrioides TaxID=155892 
RepID=Q9AAQ7_CAUVC\nMKKISGLRLCGDNVAALIVRPRVLKKVLEWSASCLQCATSPQSVFAPLSQGGIQKMTNTKTTATAGRRKAFVIALLSGACFAEAALAQSTPAPAADQAAVDEVVVTAFRKSLATALEVKRKDVRVSDGISSEDIGKFPSENIAEAIQRIPGVQISAINGRGSTISIRGLGPQYALTTVNGQAFKSSNFTDGFRYDVIQTELASGIQVYKSPTADMDAGGLAGTVNIDTVHPFDVKGRQIIVAGKLQQQELIGGNPTGKYGLTYVDHFLDGKLGVFLGGGYQELKDRGDYLWMDRWTVSNNVYTPARLRYRRIDRETKRSMINGAVQWKPTEHLQMDLIGTYAEDKTTQNIHQQVFLFTTPSASNVVPITVANGTSTKVQVNNFRLENNQQYENRPQSTSALTTKLHYTGLENWDFNAVAHYSRGNAKHNEEAAVLGINIPSATVDIADPKNVIFTTSTALTNTAQYAPTTLIRNTYPTGAFRTVGSHESAAQFDAKRYLDWGILESVQVGAKTRSEVLKRYVIRKDNQVVPASFSPTMANSGIAVTNFLDGQMTLPNAWVSPNLDAYREALKAQGISVYEGFDPLGSYRVERDLTSVYAMANLRGEVLSKSYRANIGVRNESTDQTIKGYIGSTANPQNTEVRLAAGNYTAKKSYDNLLPSANLSVDLTDNLLLRVAAAKVLVRPIIDSSNQLARTMTSATDTTGRRIFTISSGQGNLNPMTANQLDLTLEWYYGQGNGLSAGYFSKKVKNGVFSQLTCPTSYESVALSRDSSGVCVAANGDNYMITESFNDSRVVDIHGYEVNWQQSLDAWLPIEGFGLIANYTHVTPAKSTTGFRLANLSEHTANGTVYWENQKFSARLSANYRSAYDQTSVESFFAGPLGHTIKARTQLDLNLGYNFNERLSFAFAAMNINNAQEEAYLINASRWQETAVTGPSYFLSFQYKM\n>UniRef90_A0A1J5H2U3 DUF3598 domain-containing protein n=1 Tax=Oscillatoriales cyanobacterium CG2_30_44_21 TaxID=1805292 RepID=A0A1J5H2U3_9CYAN\nMRSQWECLLKNLGNWKGSFARLNPQGAILEDIPSETILELKEDRQTMRQTVRRFIDGQPQDLVLEYQNLNKSTTFFENGAFSQGSPQFAPYAEFGTEMGLIDGDRRLRLVLLYDKAAQLDRITLIREHLAHSENSQPPILTLHDLLGKWEGEAITIAADWSEPEVIATKTEWNQNGDRVTMSLQMGTQSLTATAFINPFQPQILTFPQDQVQTLFLPDGASLTCPVAIAPRQSFRLSVSWLLEPNLHQRMIRAYDAKGAWSSLSLVTERKTM\n>UniRef90_A0A157SJD7 Acyl-CoA transferase n=8 Tax=Bordetella TaxID=517 RepID=A0A157SJD7_9BORD\nMSQRSAPLTGIRVLDLTRVLAGPWCTQNLADLGAEVTKIERPGAGDDTREWGPPYLKDEHGNDTTEAAYYLSANRNKLSVALDIATPRGAELVRELAAQSDVLVENFKVGGLRKYGLDYDSLSQINPRLIYCSITGFGQTGPYASRPGYDFMIQGMGGLMSITGERDDLPGGGPQKAGVAVADLMTGMYSTVGILAALHERARSGLGQHLDMALLDCQVAMMANQNLNFMTSGKAPRRAGNAHQNLVPYQVFAARDGHLIVAVGNDSQFRNYSRVIGLPELSADPRYATNPQRVQNRDTLVPLLAERMATGERDRWLAELEAAGVPAGPINTLDQVYQDPQVLARNMRLELPHPTAGKVPMAASPLKFSGSPVQYRHAPPMLGQHTRQVLQERLGLSEDDIQALAQPRA\n>UniRef90_A0A223S709 Alpha/beta hydrolase n=1 Tax=Nocardiopsis gilva YIM 90087 TaxID=1235441 
RepID=A0A223S709_9ACTN\nMGLPVVLVHGLRLSGTMWRPQQELLEAQGRRVVAVDLPGHGTRRGQEFTLPAAIDAVAEAIDAVGGRALLVGLSLGGFVSIAVAAAHPGRVAGLVAAGCTARPAQTLAQVYRIPAVLLDRLPDHGQAVNERFHRLTLPTDGAAAALDGGLAMEAARAVIDEISDMEVLEALGAYEGPVWLINGARDPFRIHERQFLEACVDGRLLNVPRAGHMVSLDQPENFAKLVGDIADVASVRAAEAPPGAARSHGPGV\n>UniRef90_A0A8K0DS69 DDE Tnp4 domain-containing protein n=1 Tax=Ignelater luminosus TaxID=2038154 RepID=A0A8K0DS69_9COLE\nMDAILKLKKVEKLSKLVKLKRLHEHKNKRLWSREWLLRRDSKELGACSFVEHELQEEDYNLYKNYLRMDKCVFEKLLRLIEEDIAKQDMQFRKSISPRFRLMITLRFLATGETFTSLSYSTRVGVSTLSTFIPEVLSAIYKNLCKLYLKVPSTTQEWKTISNEFLTQWNVPNTVGAMDGKHVVFRPPKSAGSHYYNYKGTHSIVLLAIVDASCRFLYIDVGTNGQISDGGVFEDCDFAVELNRHSLNIPEDTPLPGMTIPVPHVLLADAAFPAQQHILKPFPMKDMTKHQRIYNYQISRGRRIVENAFGILVNRFRVLLNPISLARDKVVLITQACCVLHNYIKTESHEQIIKAQDSENIKKITIQLYIMLHTPEDVQVSDILSHENNLKNTLIIMVQYLGRITKHNVFIIV\n>UniRef90_UPI00177E212B Fe-S biogenesis protein NfuA n=1 Tax=Blochmannia endosymbiont of Colobopsis nipponica TaxID=2681987 RepID=UPI00177E212B\nMIDITNIAQEHLTKLLSQQKPGTQIRIFVIEPGTYNAECGISYCFAENINPSDIKIRFKSFSVYINKTNLPYLKDTEIDLIFNQTESQLTIKAPNARMCQPNDDAPLDKKIEYILQSKINPVLAQHGGSVKLIEITKDMSAIIQFSGGCNGCSMVNLTLKESIEKELLQKFPELKKICDLTEHQHGKHSFY\n>UniRef90_UPI001054CDFC AAA family ATPase n=1 Tax=Occultella glacieicola TaxID=2518684 RepID=UPI001054CDFC\nMGRTNYLIEGLSGTGKTTVCDELQRRGHHAIHGDRELAYRGDPETGRPTAGFGHEHHIWDVDKVRALVADREHAATFFCGGSRNFSKFIDLFDGVFVLRVDLATLNRRLDERPDQEWGGGQPTERDRIVHWHRTNTDVPANGIAIDATAPVERVVDEILRRCETDR\n>UniRef90_A0A146FHF8 Short-chain dehydrogenase n=1 Tax=Aspergillus kawachii TaxID=1069201 RepID=A0A146FHF8_ASPKA\nMTRTWVVVGASRGIGLEFVRQLASSGERVIAAVRSLSSAEQLFGLLSQYTRNGAPLITVEECDVTKPDSIDDFSHNVEKAVRDGGLRLTNVILNAGINQYPNRATEMYAYRP\n>UniRef90_A0A0A0MRI8 Obscurin (Fragment) n=3 Tax=Hominidae TaxID=9604 
RepID=A0A0A0MRI8_HUMAN\nAGKTMAIAAQGACRSLTIYRCEFADQGVYVCDAHDAQSSASVKVQGRNIQIVRPLEDVEVMEKDGATFSCEVSHDEVPGQWFWEGSKLRPTDNVRIRQEGRTYTLIYRRVLAEDAGEIQFVAENAESRAQLRVKELPVTLVRPLRDKIAMEKHRGVLECQVSRASAQVRWFKGSQELQPGPKYELVSDGLYRKLIISDVHAEDEDTYTCDAGDVKTSAQFFVEEQSITIVRGLQDVTVMEPAPAWFECETSIPSVRPPKWLLGKTVLQAGGNVGLEQEGTVHRLMLRRTCSTMTGPVHFTVGKSRSSARLVVSDIPVVLTRPLEPKTGRELQSVVLSCDFRPAPKAVQWYKDDTPLSPSEKFKMSLEGQMAELRILRLMPADAGVYRCQAGSAHSSTEVTVEAREVTVTGPLQDAEATEEGWASFSCELSHEDEEVEWSLNGMPLYNDSFHEISHKGRRHTLVLKSIQRADAGIVRASSLKVSTSARLEVRVKPVVFLKALDDLSAEERGTLALQCEVSDPEAHVVWRKDGVQLGPSDKYDFLHTAGTRGLVVHDVSPEDAGLYTCHVGSEETRARVRVHDLHVGITKRLKTMEVLEGESCSFECVLSHESASDPAMWTVGGKTVGSSSRFQATRQGRKYILVVREAAPSDAGEVVFSVRGLTSKASLIVRERPAAIIKPLEDQWVAPGEDVELRCELSRAGTPVHWLKDRKAIRKSQKYDVVCEGTMAMLVIRGASLKDAGEYTCEVEASKSTASLHVEEKANCFTEELTNLQVEEKGTAVFTCKTEHPAATVTWRKGLLELRASGKHQPSQEGLTLRLTISALEKADSDTYTCDIGQAQSRAQLLVQGEAAKCARA\n>UniRef90_A0A5A9P3B1 Leucine-rich repeat and calponin-like proteiny domain-containing protein 3 n=1 Tax=Triplophysa tibetana TaxID=1572043 RepID=A0A5A9P3B1_9TELE\nMAASVLHSAESAVPSFTVGHPARATGIHGLSNAPGPGSWNRSLDRALDEAAATGVLNLSGRKLKEFPVIVNFLSKTTHYYLSRNRLPELPVEVCMFVSLENLNLYQNCLRSLPESLINLQSLTYLNISRNQLSTLPAHLCRLPLKVLIACNNKLVSLPEDLGKLRHLTELDVSCNEIQTLPPQIGQLETLRDLNIRRNHLVRLPPEVAELPLVRLDFSCNKVTSIPVCYRNLRQLQSIILDNNPLQSPPAQICIKGKIHIFKYLNMEALVKRKRKNRLLNTPELSCNCLSSVERERKKERDKKKDRGVAEDLGDKRWSGNEASGFQPVEGRSQLASAPILNYACLLITQLMSLCVLTLSSGESRCTHTHSVRESRVQCFYSCRCGCVCKRVAGVTSGSEKQISAERRCYELRQADYLLTSQTFTMGRWHRTHDVCMVFQLCVCEHNKSSPSPTKLSPTDTCYLKSHVSCSISESVPLQTVHSHRRLRPLYGKSQSNRNFIVKRTQSLRLKHTYTGEEADLIEQLRRNIECRLKVSLPSDLGAALTDGVVLCHLANHVRPRSIPSIHVPSPAVPKLTMAKCRRNVENFLEACRRIGVPQKQLCLPLHVLEERGLSQVAGTVQALLDMAPPKQTSSFTL\n>UniRef90_A0A1C6D475 Translation initiation factor IF-2 n=4 Tax=Eubacteriales TaxID=186802 
RepID=A0A1C6D475_9CLOT\nMAKLRVYELAKELGKESKDVLTVLASKNIEVKSHASSLSDEQVDMVRKSLSPKAQVQSQARPQSQVQRPSAPAGEAAAHAPEARPQQEVPKKKPNIIQVYNPQNSQQASLNRQSGRPQAGRPGQNPRPQGQRPMGSQQGARPAQGQGQPGTRPVQGQGQPGTRPVQGQGQQGTRPVQGQGQPGTRPVQGQGQPGTRPVQGQGQQGTRPVQGQGQPGTRPAQGQGQPGTRPVQGQGQQGTRPMQSQGQQGARPVQSQSQQGTRPAGQAGNQGVRPNGSYQGNQGQRPQGQQGSQNRPAGASQYNRPNGQQGNSSQRPAGNQQSYGSNRPYGQQNNNGNRNTAAGQGQRSGQGQYNRPAQGDRPNGRPNQGSGQYQNQGSGQYQRNSQGQGGQRSGQGQYGNRPYQGQNGRPQGQNNRSQGTRPGGAPSMRDGLTIPKPPQTKATEKQNVTSRAERGDRNDRSRDKDRNGRNDRRGYQDNRPNQRNMGGKGRNNAPAPKPVQQEPKEVTIRTIILPETMTIKELAEKMKVQAAAVVKKLFLQGSVVTVNQEIDFEKAEEIALEFNCIAEAEVKVDVIEELLKEEEEDPATLIPRPPVVCVMGHVDHGKTSLLDAIRNTHVIDKEAGGITQHIGAYTVSIDGQKITFLDTPGHEAFTAMRMRGANSTDIAILVVAADDGVMPQTIEAINHAKAAGIEIIVAINKIDKPSANIERVKQELTEYELIPEDWGGSTIFAPVSAHTHEGIDNLLEMILLTAEVCELKANPKRRARGLVIEAELDKGKGPVATVLVQKGTLHVGDSIAAGSSYGKVRAMMDDKGRRVKEAGPSTPVEILGLSDVPNAGDIFVSPENDKEARNFAQTFISEGRERLLEDTKAKMSLDDLFTQIKAGNVKELGIVVKADVQGSVEAVKQSLLKLSNEEVVVKIIHGGVGAINESDVILASASNAIIIGFNVRPDATAKNTAEREGVDMRLYRVIYDAIADVEAAMKGMLDPVFEEKVLGHAQVRQTFKASGVGTIAGAYILDGIFQRNCTVRLTRDGVVIYEGPLASLKRFKDDVKEVKSGFECGLVLEGFNDIKEEDLVEAYTMVEVPR\n>UniRef90_A0A315BXB9 MFS domain-containing protein n=3 Tax=unclassified Limnohabitans TaxID=2626134 RepID=A0A315BXB9_9BURK\nMMFGNVVIGTGVMMAAGTLNDIVDSLSISVATAGQLISSSALLVCFGAPVLAAVVAGWDRRKLLVGSLLWYALWHFLAALSPGFYSLLGFRAMAMLAAAIFTPQAASCIGLLVKEHQRGQAMTFVFLGWSVASVLGMPLGSWIGGHFGWRWSMGLIALLSVIGAYWLWRQMPSKVLPPALSGAAWRQTLTSRTIWVTLSVTMMLAAGQFVLFSYLAPYVKERFGVSPAQFSLMLLAYGSMGFVGNALLSRFIDRIGPSRCILISLSSMCLSVLIAGEVTHATGMALALGFWGLGGFSSNSAQQARLASQAPWLASASISLNTSAMYAGQAIGATVGGWTIVHQGMSALPQRGLIGLLLAIGLSLLATRYARLHPLRSPEKA\n>UniRef90_A0A2N7D5J4 Flagellar basal-body rod protein FlgC n=2 Tax=unclassified Vibrio TaxID=2614977 RepID=A0A2N7D5J4_9VIBR\nMSFTDIYSIAGSAMTAQTVRLNTVASNLANADAVSANPDDAYKALKPVFATVYNKSQLSAEQALYPNAEVRIVDVVQSQSQAEQRFEPSNPLANQEGYVYYPGIDVVTEMADMMSATRSFETNVEVLANVKSMQQGLLRLGEGR\n>UniRef90_UPI001CF99253 hypothetical protein n=1 Tax=Pseudomonas sp. 
L5B5 TaxID=2883205 RepID=UPI001CF99253\nMLQTLWVLLNWEAWGESLVIAFIPFLLFVWVGALVTMLVLRFRGRISIFWASQLAGGVAGVAATLAFMMAANFVVDYKAYRESVRQLEAQERLQPKPESPNVETQPVELAGGMAGLESMKIFMALLSYRADSKRLRESDRQLGEKELLQTQKTSQTVEVQSVSSPENVLGEVSDSSGHR\n>UniRef90_A0A8K0MZ08 Auxin-responsive protein n=1 Tax=Cocos nucifera TaxID=13894 RepID=A0A8K0MZ08_COCNU\nMATSASIGVAGKELGVISEASSPLKRYNGLRPLLGSKQMASFAAMRKPNGPFPSLPSLKSPRIRAVASPTVAAPKREKDPKKRIVVTGIGLVSVFGSDIDTFYNKLLEGQSGISLIDRFDASSYSVRFGGQIRDFSSKGYIDGKNDRRLDDCWRYCLVAGKRALDDANLGPEVLQSMDRSRIGVLVGTGMGGLTAFSNGVEALIQKGYKKITPFFIPYSITNMGSALLAIETGLMGPNYSISTACATANYCFYAAANHIRRGEADIMVAGGTEAAILPTGVGGFIACRALSQRNDEPQKASRPWDKDRDGFVMGEGSGVLIMESLEHARKRGATIIAEYLGGAITCDAHHMTDPRSDGLGVSSCIVKSLEDAGVSPEEVNYVNAHATSTLAGDLAEVNAIKKSMIGHCLGAAGGLEAIATIKAITTGWLHPTINQNNLEPDVTVDTIPNVKKKHEVNVGLGEQDLTEELWRLCAGPLVEVPRVNERVFYFPQGHMEQLEASTNQELNQKIPRFNLPSKILCRVFNVQLRAEPETDEVYAQITLHPEPDQSEPTSLDPCPPETRRPMVYSFCQPRRHLLTTGWSTFVTSKRLVAGDAFVFLRFTGTVVGVEDVSSQWTDSKWRSLKVQWDEATNILRPDRISPWEIEPFNTTAPTLNAMHPVLVKNKRPRLPMDMVGYTVLEPTSPFWYSGTTHSHELDGLSSVDANSSATQVIWPCMQKENKGNGVKNGPGSCDPMVLDDWLKGLHSPIKSPPASLTDVSLKLFQDMNDETKVASWPVNPGSMMEQQPVLKLGNGVEEWKKPEVRSSSCRLFGIDLMNHSKSTTVSEKAIAAPAFTKSIAPIEGPSKATASVDESDQQQSGLSKASREHKQGLDSSPKEIQSKHHGSTRSRTKVHMQGMAVGRAVDLTNLVGYNELITELEQMFEIKGELRQRNKWEVVFTDDEGDMMLVGDDPWP\n>UniRef90_A0A2E7GD31 50S ribosomal protein L18 n=1 Tax=Bdellovibrionaceae bacterium TaxID=2026715 RepID=A0A2E7GD31_9PROT\nMSVKVRKRTDKKKVVRFKRKRKIRSTVEGSSERPRLCIFRSNTNVYAQLIDDQKGHTLASASTKDAELKDQKSTVEGAKQVGALLAKRAQAKKIESVVFDRNGYLYHGRVKALADAAREAGLKF\n>UniRef90_UPI0011841962 trans-aconitate 2-methyltransferase n=1 Tax=Catellatospora sichuanensis TaxID=1969805 RepID=UPI0011841962\nMWNPETYLRFADERGRPFHDLLARVDAEQPRQVVDLGCGPGNLTATLTARWPGAQVRGIDSSPEMIEKAVADQGGPGPVSYQVGDVREYLPGPEVDVIVTNAVLQWVPGQEELVGRWARALRPGAWLALQVPGNHDGPAHRALRELCASSRWSALLGEIAEQPRSVPGSQEYARLLRAAGCAADTWETEYVHQLPVTGGPHPVLTWLTGTALRPVRAALAEQPGAWEAFCVALEPALISAYPADGAIVDFPFRRVFAVGRRTAAPS\n>UniRef90_A0A0M8PST9 Uncharacterized protein n=1 Tax=Lysinibacillus 
sp. FJAT-14222 TaxID=1932366 RepID=A0A0M8PST9_9BACI\nMSRLGQHDVGHEGVITRRDAFSLRSSMCSLQGLIFDANPQGVAQSQLQSTNSYSMYPLPIAII\n>UniRef90_A0A7Y9F3N0 YtxH domain-containing protein n=1 Tax=Nocardioides marinisabuli TaxID=419476 RepID=A0A7Y9F3N0_9ACTN\nMSRGLWFVAGAGAGVYAMVRGRRAAEALSADGLRDRAGALALGARMFRDEVAQGRAEAEDQLRQRLAAARPREIDSPHPTERTTEQEGTS\n>UniRef90_UPI001967ED96 hypothetical protein n=1 Tax=Janthinobacterium lividum TaxID=29581 RepID=UPI001967ED96\nMQQDSGTAKAVPLNYFYRGVTVSKKQKTIVNHRSAVSGRFVTERYVKSHPATTVTEHNRISAPAKPLKRR\n>UniRef90_A0A5A8ADR5 GNAT family N-acetyltransferase n=1 Tax=Chryseobacterium sp. SN22 TaxID=2606431 RepID=A0A5A8ADR5_9FLAO\nMEHLTNFTYSDIKSELFRLKSKEMKANFFMTELQFNRLWSENKIQVFKTEKACFLLTDDDGFKRLYFIASDIEEIKYFLNNEIKNSDTDISVETVGNSKYLQDIRDAFLQNGFYEYSSMVRMSKIRNQVEEVDFENIHLLAADNKEEFQELYRKYFDKFVERIPAIEEIEGFIENKNAYYFSDNNEIQGFIVFEYYGITSHLRYWFVHPDYREKRIGSKLIQLFFNLGENIRRELFWVIESNENAIKRYKHFGFVEEDMHNLILINKNKKYEEPNY\n>UniRef90_A0A2D7PFG9 NADPH:quinone reductase n=1 Tax=Candidatus Pelagibacter sp. TaxID=2024849 RepID=A0A2D7PFG9_9PROT\nMKKIFIAFGHHNTKNSFNASIRDTFIEEAKKCGHNIDLVNLFDEQEKLPFYNQNINPPPQLVLDYRKRLEKCDVMMLIGSCNNLRLNAILENWIDWVLHPKWFFTYRSLLPGNKYFKNYGYPVAGAMKGKLGVVSITYGGPMISYQSFSFFDNIPYRRLKKSVFQLGGLKTKYLRFYSILPEMEKKEFENHMLKVRKFAKSL\n>UniRef90_A0A415FL20 DUF2953 domain-containing protein n=2 Tax=Ruminococcus sp. 
AF46-10NS TaxID=2292072 RepID=A0A415FL20_9FIRM\nMTAVQSFLGIPSKIFKKIRNLTLTIKKFCGKINWYKEFINHAQTRAALSLVWKDGKKLVRHVLPTRITGKITFGCEDPSITGTVLAVLGMTIPFHKNAIAVTPLFDSENVLEGEVMLKGRIYGIMLLKTAAELYFNKHIKYVIHRWRHKEVNHGERE\n>UniRef90_A0A7G8QAU1 SmpA_OmlA domain-containing protein n=1 Tax=Dyella telluris TaxID=2763498 RepID=A0A7G8QAU1_9GAMM\nMSKLSISLSIALLASAGLGTPAVASAESLLVNRVQQEKTMDLPSRGMSMAEVEKKYGAPQRKLSPRGGGSSKQPVINRWDYSNFIVYFEQSHVIHAVLNTPAGNNTNPASAN\n>UniRef90_A0A6J4UR21 3-oxoacyl-[acyl-carrier protein] reductase n=1 Tax=uncultured Thermomicrobiales bacterium TaxID=1645740 RepID=A0A6J4UR21_9CHLR\nMSDRARFAGKVALITGGGSGIGAATARLIAAEGGSVAVLGRTAATVKATATAIGGAGGRALAIAADVSREEAIDAAFTRAIEAFGRIDVVVANAAVQLHRRDLPIHEQDFAAWRETQEVNLGGAFLTCRAGVRQMLAQGEGGAIVIVSSVTALAGTAAQNPSYTASKGGLVSLSRALAVKYAPDHIRCNVVCPGALAAPPDVEEIDNAARERRLVGQIPLGRLGDFAEIAPMIAFLASDEASYATGGTFVVDGGLTAT\n>UniRef90_A0A8T9LM70 LytTR family DNA-binding domain-containing protein n=2 Tax=unclassified Dyadobacter TaxID=2625061 RepID=A0A8T9LM70_9BACT\nMMNTKQLTAKIVIVDDEFFVRQTLVSMIANIPNAMVVGEAEDVGSGIELILEKEPDLILLDIKMPVRSGFDLLEELTHCQQQYGLIFVSGYPDEALTAVQKAAPYFHSDFVVKPIDPVILQTKFSIFYNKWQAAKEQESELAGLLETGIPQIAYKSDQLVFQNSQLFHCIDIDDILYCESANRQINVYCSQYEHINIPNTTLDAIERMLPADAFIRIGKSHILNKSAIRFIQKGNRPKCILARNGKSYEVQLYASNVEKVEQSYSITRK\n>UniRef90_A0A811MPR2 Rep_fac-A_C domain-containing protein n=1 Tax=Miscanthus lutarioriparius TaxID=422564 RepID=A0A811MPR2_9POAL\nMGSSEDDFTPLSELTVGMNKCRVRVRVSRLWESFNPKNDISFGLDCLLIDDQGETMQARVLPDYIDQFEGQLIEGKTVVNEIEGDIDSIPLHSFEFIDFKNLHSMCDDISILRDVLGHIVYVGDLQEVEKKSRTIEICNATIQNLSGRKLGVTLYGDIACGFAEDMLEKGQKASGVAVFAGMRVESSHSVCSTTCSKYYLDLEIPEVQEFCENLSIQQENPVSEKSQAQKLAESWRTIEQLKRLNPKDYDEDTKFLCRVSLIDIDCTSGWCYLGCNTCYKSMYRAPRKYKCSRCGPIKRPINWYKLKTMVQDATGTMNLMIFCEVAEELVGVSAEELVDEIEDDEEWFTLPDEIEDLLGSTHTFQVFDKHLSGSFSVYAIMDDDTVPVPAATTSQCKEESVPEGSVNAAVPSPATTQCKAEPGMAAPAPAMIPCKEEPVLEENFSMVVPAPTTKHECKEEPFLEHSVNMAVLKPTITQCKVEEPVPKGSAGTGEARLKSTRLQKPNKRLLGDDWIN\n>UniRef90_A0A5C7TQB5 Conjugative relaxase n=1 Tax=Rheinheimera sp. 
TaxID=1869214 RepID=A0A5C7TQB5_9GAMM\nMLSIQTLGTMTKDKVAYYTELAATGYYTEAEEPAGQYFGKLASVLNLDQKAVTQEDLLELAKGFDTKGKALVANAGDEHRMGIDLTFSAPKSVSVCFGLAGTELRTAIQKAHESAVKAALTYAEQNFIQVRHGFEDNQQRRMINTGNALFALFEHGSSRSNDPLLHTHAVLLNFSQVKNGEFRCLEAPDLFNYKKALGALYRAELANQLEALGLKTEADEEFFKVTKVPDELCKLFSKRSNEIHDLLQEGGFTRANAKLKQNAALFTRQAKTHQSRETLYKNWAVEAEQISTWKPEQAFTKDRNQNKVDTEKLLESLTEKKSLFTYPDFLEQVFIHFQHAGLSSREAEEFAKATLESKAIRRIQHPQAGICYTTEQQYQLEMSFYKEMTEYLDRWRTAHARCPAFLPAWL\n>UniRef90_UPI001A901165 agmatine deiminase n=4 Tax=Halomonadaceae TaxID=28256 RepID=UPI001A901165\nMHPTHCPSSVAPSAATPAAQGYVMPAEFAPHDACWMLWPQRPDTWRLGAKPAQQAFVAVASAIAESETVYVGVNDDQYENARHQLPAHVRVVELSSNDAWMRDVGPTFLVHPDKGLALVDWEFNAWGGLKDGLYFPWDKDRRIRPKIAEMLGIPCFDVEVVLEGGAIHVDGEGTLITTEECLLNPNRNPGMDRATMERRLQDSLGIQKVIWLPRGCYLDETDGHVDNLCCFVGPAEVALTWCDDDTDPEYAICREARAVLEASTDAKGRAITVHPLPQPGPLTIAEDEASGIDRLASSHPRRPGDRMAASYVNFYIGNRVVVMPQLDPRHDATVMDILARLFPDRRVVGVPAREILLGGGNIHCITQQQPRP\n>UniRef90_A0A6L8CSU2 VWA domain-containing protein n=1 Tax=Gammaproteobacteria bacterium TaxID=1913989 RepID=A0A6L8CSU2_9GAMM\nMSGPLSPTPPASRMLEFAGYLRRHGYRIGVGELPDLFRLVDRGARDPVLTRRGLRALCCRTHDEWREFDRHFNRFWFPVESEQVAPASVPGGLPDSPGQTLVGLAGTSDREPDSTHGQSDIEGSGAGRQRTLGKADFRFLRDRTAMHEVESLVERLGQQLRRRLGKRREISPRGGHLDMRRSLRRSLATGGLPLKLVWSRPRPVPLHLVVLHDVSHSMTWNNPLLFRFVRGLMQNFRGSVAFAFHTRLFEVTPFFRERSLERMLARLDAGENLWLGGTCIARSLAEFNRHHAGTLLRSDSHVLIISDGFDTDDPEMLRTELSRIRLRCRQILWLNPMLGREGVTLTEASLSARLPEVHRFLPANSLDGLRAAVENLSRTGPRTRPGGTPPVHGQDSRQGDGH\n>UniRef90_A0A1G8EYP0 Catechol 2,3-dioxygenase n=3 Tax=Agrococcus TaxID=46352 RepID=A0A1G8EYP0_9MICO\nMPVTGPDFVSLQVRDLAGSQAFYERYLGLERSPAGPPHAVVFTTTPIAFALRDLVEGTDLDASQPGLGVALWLHATDVQQIHDALVADGHAIAVAPFDGPFGRTCTLVDPDGYLVTLHDRA\n>UniRef90_A0A1F9IIM5 GlnD_UR_UTase domain-containing protein n=1 Tax=Deltaproteobacteria bacterium RIFCSPLOWO2_02_FULL_50_16 TaxID=1797881 RepID=A0A1F9IIM5_9DELT\nMISWVFNIFGMTVEATRQGMTYLEKKAKPKLIDVAEGTFLAEKAREMHIAMRQLLQNHSVERQCSDVKRRARKRVKENIIKAYDRDDVVDEITVRLTDAAMADSFYKKWFAH\n>UniRef90_A0A1F5VQL0 CZB domain-containing 
protein n=1 Tax=Candidatus Fischerbacteria bacterium RBG_13_37_8 TaxID=1817863 RepID=A0A1F5VQL0_9BACT\nMGIAITGSDMLCKRITEGFVQQQESVQGKVFYSERIETDFDELLQKERINREVPGSWENTQAVRANKVESSVIRGKEECSRLENVMKEFEEMHNRLSEIITYTMNGRQFNAQELLAFQAEMHRITNYIEMVSKIIEQGINGVKHTLQTQV\n>UniRef90_A0A2P8AWN7 HTH_17 domain-containing protein n=3 Tax=unclassified Micromonospora TaxID=2617518 RepID=A0A2P8AWN7_9ACTN\nMTTPKRPERGTPRPARHLTIADVCDDLGISRSTFYDWRAKRKGPPARKLPNGEIRIERRDYETWLETLYEEAA\n>UniRef90_A0A1M6QX74 Putative addiction module component n=1 Tax=Rubritalea squalenifaciens DSM 18772 TaxID=1123071 RepID=A0A1M6QX74_9BACT\nMATLSELENEVLRLPKDQRVSLIHRILEKSELPENSDVKNLWNAEILERIERLDANSTECHSASDVFQAIDEQFAQ\n>UniRef90_A0A1M7QN82 Germination protein, Ger(X)C family n=1 Tax=Gracilibacillus kekensis TaxID=1027249 RepID=A0A1M7QN82_9BACI\nMIRVIVLLIFSILLSGCYDRIELEQQSYVIAIGIDKTEQEGVYSFTYQIANPEIGSAAVQSGPDEPPTEIVTVNGSDILSSTYTANSFVSKKITLDHTKIIVISEELARSEDFIRVIQSASRTPQIRRSVQMLVSKEKAIDFINNNEPIMEKRPHKYYQFMLNRAVQTGIIPKSTLHRFFQITEGDADLFLAIYATTEQSDQKKNTEGFEDKYIAGEIPQIGGSPTQFMGSAVFKEGQMIDILDGEETRVAQMLDKTLEMEDYLATIPDPKMPEYRISYNYYQKKEPIININYYKNKPTEIDVNISFQVEVIAIPSLIMYSQSKKDQQTLQEALTQRLEEKTNALIEKTQNSYKSDAFYWSLYIRKHFKDIKEYEDADWHKNIYPNAKINVTYELEKMEFGKMINDSNLEDVRD\n>UniRef90_UPI001E451F19 hypothetical protein n=1 Tax=Methylococcus sp. 
BF19-07 TaxID=2743472 RepID=UPI001E451F19\nMLWPAWILPEDVFRSIWERVRPVFLASMGQQRIPFTLAEPLARVYLPLAAWVVAHKKDGPFVLGVNGAQGSGKSTLCEFLALILREGYGCKVAGFSLDDIYKTRSERERLAREVHPLLVTRGVPGTHDVGLGLQTLDRLTTAGPEIAVALPAFDKSIDDRCPMSAWPQTSAPVDIVIFEGWCVGCLPQSGEHLVRPINALEAGEDADGSWRTYVNEQLGGPYAELFGRLDRLIMLKVPDMECVYQWRSLQERKLAAAIGNGSSGHRLMDETALRRFIMHYERLTRHMLAEMPARADVTLFLDENHGFARVHINE\n>UniRef90_A0A8X7XX04 Uncharacterized protein n=2 Tax=Populus TaxID=3689 RepID=A0A8X7XX04_POPTO\nMNQSSSKTHNQKCPSAALPEQPTKIRRRKKQQHHQPSFRRNALQDLNNGGIDTTSIDNSSNASSLSSIEAPRGCLRFFLSHSSSSSSSAKTPFSSSSSNQRLKKVKPSRTPKSAPSMRPTKEKPISKKVEKGKRNHPPCLYQWQSGKKRASSRNEVGDSKVSSFLDSSGSLVKNKLKSGPGELKKVMIDGVCEGSGANLTPLCKVGSGSGLNLGVGGKVMNDDCYEKSSNGKAESNSTSSNTKTPPVQPSVSPEIQCGSSMKLMTVETITPATCYGAGHVVSGVTDKRKCRPRGILAGGEAKALGSFDSDDDIEQANDVGLIENSDVSMLPLPIDASMHWLLSPCDEKDEGQKDNSRNRSRRFRRLEERAIHNSPASPSSGYGGFSPELCNTSANRSISTVSAGRRSASLLSPSALPVPQFQGFLGTPLCDNFPVSSLEEETENRHCTDGENSPFSIGSLGSGNIIQTPQSDTSCDRRVGASGTQVDGKRKKCNFDSDLNSVAEQLQMTSLSPMSHASVWDPTNSSFRFDSLTMPSNSVDLSKFHKILEERNSWFSNSTIENVSQSQMRISWREGLMSRMFEMDEFDCCRYLSDEEDDGNVCNIDCLKSHKSPQLNVEAATDHISINGIGSTEFVKKEQDTGGKTKDGLPSQPPCSCAESISTDGGGLVRSDDSDWTLWSKDSEVNMGNLIEYIDLAGCGPGGKSQLHYKVDGARGLFADIGFTIFGSLVFEEWLAEVERQSMDKLQEMSQAYLELVANLPCHVRIKGKLSQESVPDLVSSSFVFPLIIREKEEPDRAERGSCVLMEGLIPLVCKAFRKNKTRRQYECLSVGTALSYNISDFYTHEAPKSELHFQPSMENTNSQKKVHRRFWSVHEDFSGGFSSPAVRSTTAASPQTKQLARFRSQRV\n>UniRef90_A0A853BRY5 Anti-sigma regulatory factor (Ser/Thr protein kinase) n=1 Tax=Streptomonospora nanhaiensis TaxID=1323731 RepID=A0A853BRY5_9ACTN\nMAQCDGVDDDVGIYTLRACRTFAGAARECREARLWARRHMRPFPDVADAVELVVSEFFGNAVRHTASGQPGGTVFVSLVGLVSGALHLEVHDEGPRRGAPRTTARVLAPDLERPDGRGLFLAAALTKEWGRLPLHGGPGYAERGYTSIFDPDLDHETSDYVGPMITWAEFSTSFRAAPASAAAHHAG\n>UniRef90_X0WKB2 GH26 domain-containing protein (Fragment) n=1 Tax=marine sediment metagenome TaxID=412755 
RepID=X0WKB2_9ZZZZ\nTGSRPLGEYEPAGTWGSYGINHWLYVAAEDPLYGQAAKDYWGTVNVKGSGNIPLFLDCWFWCGGPENDDTPPAWDGHRILGHTESMNRFCINRHQQGINGVFLDYSARKVWLKELWHVKWARNFNVNYPGPYWETEAPWMAQFKAH\n>UniRef90_UPI0012FA07AB hypothetical protein n=1 Tax=Nocardioides alkalitolerans TaxID=281714 RepID=UPI0012FA07AB\nMTTLMLDQARTDDATTAPTDVRDVAGGLEDELFEQAVGEQVAGLTTMPSISTIHCLTSRHDTTLLPRL\n>UniRef90_A0A2E0G851 Peptidase n=1 Tax=Candidatus Marinimicrobia bacterium TaxID=2026760 RepID=A0A2E0G851_9BACT\nMIKKNKHIIFIIIFYSLFVESLFSSDTIVYRVPIQGVIDLGLPTYIERIINEAESNQAEAIIFDIDTFGGRVDAATQIKDAILDSDVPTIAFINRRAISAGALISLSCEKIYMTGGATIGAATAVDMSGNKASEKVISYMREEMASTAENRNRNTDIAKCMVDEDLSFTYVIIDNDSIEVTDLEGRKEGKLITLTTEQALKYKMADGLAEDLDELLSLLELSGAEVKTFYENWSENLVRFLTNPVVASLLTTFGFLGILFELQSPGWGIPGTFGAVCLTLSLSASVIVKLATKSDLLIVFFGLSLLMVEAFLIPGFGIAGLAGIGVILWGLYMLLLPDVPVSQEIYDSAMTGLTIGLIGAIIAVILLFRMMTKTKFWIKLTSPGIESSEEGYNTSLGLENLIGETGVATSDLRPSGWVLVNNEKIFVVTEGEFVDKDQEIKILSVDGNRVVVRINN\n>UniRef90_UPI0012BBE16F YeaH/YhbH family protein n=1 Tax=Sansalvadorimonas verongulae TaxID=2172824 RepID=UPI0012BBE16F\nMSSIIIDRRRNSKGKSTVNRERFMRRYRRQIQKAVNDAVNSRSITDTDSGEEITISRKSLSEPFFHHGEGGDRDQTHPGNKEFVTGDRFPKPKGGKGKGKGGGGGDASDSGEGLDDFAFQINRDEFLEYLFDDLELPNMVRKELKESSEFAFRRGGFTSAGAPDRLNVIRSLRGAHARRIALSGKDRKEIRALKRELREMEVSPDDTNEARAEEIKLRIKELNEKIKRLPFIDDFDLKFNNLIKVPLPSSSAVMFCVMDVSGSMTRDIKDMAKRFFFLLYMFLQRNYEKVEVVFIRHHAEAKECDEHDFFYARETGGTVVSSALTLARDIIDERYDPKKYNIYVAQASDGDNWEADSPKCSKVISEDMMKNLAYYAYVEITDRHHQNLWHEYKKLEQAHPDHFAMSHIKGPTDIYPVFRELFEKKEAMA\n>UniRef90_A0A6A6R4P4 MFS domain-containing protein n=1 Tax=Lophium mytilinum TaxID=390894 RepID=A0A6A6R4P4_9PEZI\nMRLLGESGLISKRRYPCIYTKMVLILLPHFQRLQELCRHRSWNGLLIFHAFWCCSVYHYTVRALFTFLFAMGFSVGSCMSFAIPFNVLDSRCAWLSTSERRAQFVLYNMPGCGVR\n>UniRef90_A0A8J4XW43 Uncharacterized protein n=1 Tax=Chionoecetes opilio TaxID=41210 
RepID=A0A8J4XW43_CHIOP\nMAIYLFTRQDPSRPHPPAGKKDAVNWDQHAILLEGRKKTPPGVGWSFDSGLTDTSHVRKVAKNAAWKLELHPTRLRTSWTGSGSRHIYKSQVRSLMEYSPLAWSSYPPSYRCLLDRVQARAQRLARLKAPEDAAQIIQPLQQRRDVAGMWGHVQKGHRMQLLQLAELRLNPGPGPPIYPCGPQHRHQGLAIREDGKITSAPSYPAMVDYGTPFGAPDDLTFTPSMHAFKSGVNAWLQEADEALDGDEGWLLPITSHKASRPLHSEPFVPVAWMVD\n>UniRef90_UPI001FD5AA06 methyltransferase domain-containing protein n=1 Tax=Nocardioides sp. W7 TaxID=2931390 RepID=UPI001FD5AA06\nMVAQAIPSRIRWAVEFMDVQPSDHVLEIGCGPGAGAEAICSKLETGKLFAIDRSESGVDRTKRRCAKYVASGRLTVRQIDLATLRVPVKRLTKVYAFNVNLFWVRECPDEIALLHERVLPGGAVFLFYEVKFPDQMPTIVEKASAALAGGGFRVSVVEQKTPAVVGVIGRR\n>UniRef90_A0A7X8TA91 L-idonate 5-dehydrogenase n=1 Tax=Rhizobium sp. P32RR-XVIII TaxID=2726738 RepID=A0A7X8TA91_9HYPH\nMKAVVIHAAKDLRVEERQEEALEPGQVAIAIEAGGICGSDLHYYNHGGFGAIRIREPMILGHEVAGTIKAVGEGVSRLAAGDRVAISPSRPCGSCEYCLKGQQNHCLNMRFYGSAMPMPHIQGAFRQRLVAEEWQCHKVAEGISINEAALAEPFAVTLHAVARAGSLLGKRVLVSGCGPIGALAIIAARAHGAREIIASDVMDAVLKKALSIGADRAINVADDPQALDAYSTNKGYFDVQFEASGNESAVRSGLGVLKPRSTLVQLGLGGDIAIPQNILVAKEIEMKGTFRFHEEFGLSVDLINARRVDLKPLLTGVFPLDDAVAAFEAAGDRSRNMKVQLAF\n>UniRef90_A0A1F6CIC4 SsrA-binding protein n=1 Tax=Candidatus Kaiserbacteria bacterium RIFCSPHIGHO2_01_FULL_53_31 TaxID=1798481 RepID=A0A1F6CIC4_9BACT\nMELIKNKKAHLKYVPLENFSAGIELIGQEVKALKNKLGSLEGARVVVRGGEAFIVGMTIPAYQAANAPKNYDPERPRRLLLAKAEIAELAAAESKKGLTSIPFGVYTAHNFVKAHVAIVRGKGKADRREDLKKRDAEREAGRILKNR\n>UniRef90_A0A3M1TVI0 AarF/ABC1/UbiB kinase family protein n=1 Tax=Deltaproteobacteria bacterium TaxID=2026735 
RepID=A0A3M1TVI0_9DELT\nMLDAFGRVEVNRKTVEFAGLSATGYVRGGRAAPREEHAPGTPSVSKSSALRTVYANLMATRTAIRDVRRFRQIAGVLARHGFGFLFSRFSRKDPEVAKAVDEALQEAPSAPQVPQALPYAQLARRARAALEDLGPTFIKFGQILSTRPDLLPQAFCDELQNLQDDVPPMSIEEVNAVIRRELGSEPTEIFAEFDETPLAAASIAQVHRARLKSGEEVAVKVQRPGIAAIIEADLDILYFLARQLTVAVPETRLFDPPGIVREFERAIRKELDFSAEARHMKKFARNFREVDYIHIPEVYDRYSTAKVLTMEFIEGVKITDAVEQGLADGEVLAKRLLWALFKQFFQDGFFHGDLHPGNIYVLPGNRVCYLDFGLVGRLTPEMKDRVIDLLFAVGRQDFDALARVLFEMGIREGPVDYDAFVADVYEVAERYFDGTPLAEIDVGGLFRELVEGAMRHHMRMPTTYTMVFKALMTVEGLGKRIAPEMDLVEEAQPFIAELLRERYSPERLWKKASEALYTTSRLLRQVPPAMTRVFEDIDAGRLTFQIDAPRLDDYLEDRRRSDVMWGTGLAYATLMICATLALSWDEYRILGFPALSFIGYLLALPTGLWFFNHWWRR\n>UniRef90_UPI00210E2C07 response regulator n=1 Tax=Stutzerimonas stutzeri TaxID=316 RepID=UPI00210E2C07\nMDIPLSQRLSFKQASLTVLLALTLGGAFGLTRAVLDYASERDGINRKAQALLTVTTAAADHALREQDARLADQLVHGLLQAPAVLRAELRAADGTPLAIASRHPTESGWRRRLSDRLFGAELHLTLPLADGRGSQHLLLDTWPHGQRFLRRAGLGLAGGLTSSLLLSLALLGLSHLLLTRPLGSLVAALGSRDAQRSARTPLPCPAGHRHDEIGALVGACNEQLARLDSEIAQRRAAEEHLTRALGELEGRVAERTAELERANRELLASNRELQLAQRTTQEMAQARAHFLASMSHEIRTPLNGLLGMLALALDSPLPPQVRQQLGIAHDSGRGLVELLNGVLDLSKFEAGQLELERIPFDLASLVEDTASLLAQNAAPGVELTCLIAPDLPGEVIGDPLRVRQIVSNLLANALKFTRHGRVDLRLIANPDGILLEVRDTGIGIAREALARIFQPFAQAEAGISRQFGGSGLGLSLTRRLCEAMQGTLEVDSQPGLGSRFSVRLPLATHAAATSLPSLHGRVVALCSRRSGLSELLDAWLPAWGIEYLRLDTDASLAGLEVDLLISDCPECLHGRRPQANAAILLVCSYGDFLPEGEAQALQPLEQLPRPLSRAALYQALQRGLGQPLGAGPAQTDEPRRPRILLVEDNPVNQLVVKGLLGRLGLTVEMARQGEQALKLLAQQNFDLVLMDCNMPILDGYETTRRLRREPRHAHLPVVALTANALPEERERCLQAGMNDYLSKPLRREELEAVLARWLPNCLQPA\n>UniRef90_A0A6G6VZM2 Multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit n=1 Tax=Microbacterium sp. 
4R-513 TaxID=2567934 RepID=A0A6G6VZM2_9MICO\nMSSQVTGVGVSNEGEFGANEWLVEELYEQFKIDRNSVDKAWWPILENYHPVDEAAPAVPAAPSAPASEAAAPTQAQPGASEPRPVTAPIPVIGAQPVARTTAKPAANQPIPAQAPAAVPSTGEASTEEDQVTVLRGMTKTLAANMDESLTVPTATSVRTVPAKLMIDNRIVINNHMARTRGGKVSFTHLIGWAIIRALKEFPSQNVFYAEIDGKPSVVAPAHVNLGIAIDLPKPDGTRSLLVPSIKRADTLTFGEYLASYEDLISRARGNKLTAGDFQGTTISLTNPGGIGTVHSVPRLMKGQGCIVGAGALEYPAEFQGSSEKTLVELGIGKTITLTSTYDHRVIQGAGSGEFLKKVHELLIGQRNFYEDIFAALRIPYAPIHWASDINVDIAERVDKTARVQELINSFRVRGHLMADIDPLEYVQRTHPDLEIENHGLTFWDLDREFVTGGFGGKRIMKLRDILGVLRDSYCRTIGIEYMHIQDPGQRAWFQEHVEIKYQKPGHDEQLRILSKLNEAEAFETFLQTKYVGQKRFSLEGGESLIPLLDEILQGAAQSGLDGAAIGMAHRGRLNVLTNIAGKTYGQVFREFEGSVAVGSKSGSGDVKYHLGTEGTFVADGGDELPVLLAANPSHLETVDGVLEGITRAKQDRKPIGTFSWLPILVHGDAAFAGQGVVVETLQMSQLRGYRTGGTIHVVVNNQVGFTTVPGDARSSIYATDVAKTIQAPIFHVNGDDPEAVVRVAQLAFAYREQFHRDVVIDLVCYRRRGHNEGDDPSMTQPLMTNLIEAKRSVRRLYTEALVGRGDITEEEYEKAKLDFQNGLEVAFAETHAAQTGTHPVVPDAEASAPVSGAPETTGVPTEIVQLIGDAFVNKPDGFTVHPKLQQLLDKRLDMSRNGGIDWAFGELLAFGSLLIEGTNVRLAGQDARRGTFVQRHAVLHDRANGQEWIPLANLGDSQGRFWVYDSLLSEYAAMGFEYGYSVERADSLVLWEAQFGDFANGAQSVIDEYISAAEQKWGQQSSVVLLLPHGYEGQGPDHSSARIERYLSLCAQDNMTVARPSTPASYFHLLRRQAYARPRRPLIVFTPKAMLRLRGATSKVEDFVNGTFQPVLDDDRGVDKGAVTRVLLHAGKIHWDLRAELEKNPNPEVALVRLEQFYPAPIQELNAVIDSYPNAQLYWVQDEPENQGAWPFIALEVVKHLHGRTIRRISRSAAASPATGSPKVHAVEHAELMKKALTTTSR\n>UniRef90_UPI0014206272 serine hydrolase n=1 Tax=Chryseobacterium sp. 
Tr-659 TaxID=2608340 RepID=UPI0014206272\nMKKLTLAFLISLSFNMFAQSVNDKIKLFESNLNYWDQLKTKKWSLKERMALYNANAVSIAVIKNYKVEWVKAYGFADISENRPATTQTLFQAASISKSINSLGILKLVQEGKLGLNDDINNYLKTWKFPYDDAVSKGKKISIANLLSHTGGLSVGGFGGYEKGEKLPTIIEILNGTAPANSNAVRSIFEPGSKFEYSGGGTVISQLILENTTGEKYEDYMLKNVLVPLGMNSSSFNQPPSKDKEALFAAAYVNGKEVTGKYHIYPEKAPAGLWTNPTDLAQYIIETQLSLLGKSNKVLSKEMSAKRIENNLGVFLNDFKGTKYFGHSGRNEGFTCHYVGSLEDGNGIIVMTNGSNMKLVEEIVSSIASLNQWKNYPLEPMKESIALTIRKECEKNIDKGIALYKKLKNTLPNNYNFSDENELNNLGYEFLRSGNIDSAIKIFNLNVYEFPKSANVYDSRGEAYLNKKEYQLSKEDYSKVLELDPTQQNAREMLLKIKKETGK\n>UniRef90_A0A7S1LBN8 Cation_ATPase_C domain-containing protein (Fragment) n=1 Tax=Alexandrium catenella TaxID=2925 RepID=A0A7S1LBN8_ALECA\nPNYVLDVCKTWVGRDGSVEAFSDAAREDAMRTIDILSSQALRVLAIAVRPMAQLPFDPEEDQDSSADEKMGILCQDLTLMGLVASIDPPRAGVRDAVQAAQNGHIRVMMITGDYLKTAAAIAQDVGILEPDVGERGALDCTSLRPSGDYLPDLKIDELTKDARVFARAKPEDKLEIVKSLQRQGLVSAMTGDGVNDAPALNAADIGVAMGIQGTEVAKGASAMILTDDNFVSIVGAVEKGRVIYAGIQKFVAFIMSVHIAEVLQIFICIVSELPVMRTPLQILYLILVTDLAPSIALGLEPGQAGIMNDRPRPKKQPILLWWMWVSTVANAAILTAIIISVYIWGLDTFVNERNVKMISRMVVDEEANGLPGHTKRGLEQAQTVAFISLVWSENIRAYTSRSFDSPVCKELCTNRYMQGAIGVAQAALYTAIFLPGLSDILGLKGADIGLKGWIAALVGAGACLVACEAYKALQWLAG\n>UniRef90_A0A7J6FTG0 Calcium-binding protein CML44 n=2 Tax=Cannabis sativa TaxID=3483 RepID=A0A7J6FTG0_CANSA\nMSPLSTYDLKRIFQKLDKNGDDLVSLEELSWLLERINNGSVHHQFSKTELESLVGKSSLNFDEFLFFYESISSKHNDEIDDEVEEIIISDLVKAFKVFDQNDDGFISCEELQSVLIRLGLMEENSTDKDCKTMINAFDANSDGQLDFEEFKTMMLLTITS\n>UniRef90_A0A0P7TU97 Main olfactory receptor family H subfamily 129 member 1-like (Fragment) n=2 Tax=Scleropages formosus TaxID=113540 RepID=A0A0P7TU97_SCLFO\nTDLKTDFAVAYRDIVGSGKVGVHEAAHGPGVDQSLSLHFPSALRQTNEYSETNETVLGNTTSNRSLMVIMKICFVSPFFGVFLYCIVVMLHTFILHRQFWDSSRYILFVYMLINDTLQLLSSVLLFLFVMADLHISFACCAPLLFLSTATFQNTPLILATMSLERYVAIFYPLQQPAAWHADHIWVIILSLWLISCIIPTVDFSLGGLRISIDVLLTPVLCKTQALNSSPVQMLFKVILNGLFFTLVAIIILFTYIRILLETRKMRQDRASVSKALHTVLLHGLQLLLCMMSLTHPITEGLIIQHMGWLQDNISFFNYFCFVLLPRFLSPLIYGLRDDMLRKKIRGAIFCCSTKGAQQVTDKHILK\n>UniRef90_A0A0Q7EWN4 Carnitine 
dehydratase n=3 Tax=Massilia group TaxID=2895353 RepID=A0A0Q7EWN4_9BURK\nMTPAEPSLPLSGIRVLDLTRLLPGPAATMQLADLGAEIIKIEDPGPGDYARAMGPVRKEVSQFFVAVNRGKRFLRMDLKDAAQREQLLAMVEQADVLVESFRPGVMDKLGLGWDVLRARNPKLVMCAISGYGQDGPYAMLAGHDINYVGYAGMLDQNAAPDGRPALPNLQVGDLLGGAQAALQGILAALVAVKMGGMGRFVDVSMTDAVFANNIMPLVAVNNGGDAAPGRDLLTGGVPCYNVYRTSDGRYMAVGALELKFWQACCDVLQRPDLKARHWQLGQQVGGPDALAVQAELEAVFAQRTLAQWTEAFAGSDCCVSPILRTSEALVHPLFQARGMAVRAVHESEGEYWAAAGPLKFKA\n>UniRef90_A0A7W8G837 VWFA domain-containing protein n=1 Tax=Treponema ruminis TaxID=744515 RepID=A0A7W8G837_9SPIR\nMPKRHLALILIISLFHSSILFSENAENEAGEVLSLKQIDLLIDTTAYNDALRELSRYIAAHPNDFDRAQKRISRVMKLREEYNKGADSLVELIRNGDESKSEKLAKIAELESSELESNENVIEFTNLARRTVTLGEILILYDRIMREGVALVRSEKFSDAAVKFEEGFAIKNEVSDLVFDVENHSFAAEGTPVVYESDITEPVRKSVSNIRSLVAGNLVSASMESRINDCEKAFNEYMRAVSARDVNSISAALKNVNAAFEKYAALRNKIIADAKVLEAADILANERNPLLYGTSYITFHQKFILGDESNPDTGIIGAFDAYFNSRVERMKDKTNEAVLETLNLLITNLPEGKIYSLANKIDAEQKNVAVAKMYSQFARYVHDLYNLEKNLDGSTVGEKFSGYASSMSFVSEYLSDLSLAYKSAQELAWEKANPEKIDKNDFSDPVLAYNLKKLLRYEQIKADSKSYISLVNEEEKKQKEFFDKKSEREKEIEELRRISGGRLRISGAQKRTTAGVQISDNPLDFRKQIGYFLSLNEQNLKEARNHAKGLWGYMASAYSALAKKDYDHYEKLCSDTEKLLTGGLASSSDSDFSSEFIKKYPIEAKDSALKINQEISIKKTELLEKREVLNGGEEYRMSESDYNKGTLALDKIILDFDSLYAKNQTLAEEAIPKIRDYENLIRNADEQYEIALRAFKKEDFENANIAVDSASEKYAEALDIEYSEKIRAMREETLNELAVKIQRAEYEKVLREVFALKDKAAIAYYSSSFDTAETLLVTAQSRWSKVSTEEDSEIEDMLNIVKTIKSIEYGRVLLQSDPHYPELSYSLDMAKQSFEKGVKLKNDGNTVKANEAFNLALTNIRNVQNVYPLNKEARLITLKIQQELDPEGFPRQFENQYNAARLNANKNERLADLEDLYAINPKYPGLAQEIYDIKDSLGMFPKKEVKKEVKRSADSKIAEAKKAFKDAGSDEAKLNKALLLANEAIAIDGTSKAAKELKLQIQLKIGASATAILSQNDEKMYAEAARLFNQRRFADAKGIMDNLLKGAAAKKSRKVIDLNNRLLKRL\n>UniRef90_A0A847Q3W9 DUF814 domain-containing protein n=1 Tax=Candidatus Fermentibacteria bacterium TaxID=2044591 
RepID=A0A847Q3W9_9BACT\nMDGVYISAVACRLSEELTGRTCSRVTRPFAGGLGLSIGGRMLLLDARPPSPAAWLGDDGADDGDPAPQPWSDGLAGTRLEEVRQEGLDRILVFEFSRVRRYCNPLMRLIFEMTGRNCNLILADSGSRILACTRIVSRSMSRVRTVRPGETYEGPPSSGAGLGSWREDRVLEALGKATSPEEIHPLLEGVGPATAGAILEESRASGRKVPEVVAVLGSALESREFAPWASVHGPMPIRLGEGAPIADVLSPPSGGGPAGACRKAAVEILEARRAFLERKLEKLRSVLDGVPSEDLLRLRGAILLANIPRVPRGAEEVVLPDWDGMEHRIPLRPGRSAVENAQRYFRKARNAAVERSRLESSIRETRAAIGELDAALAGGSGQCRIDRLAGAVGATRGAEARSPAGRAMGGGWTCLVGRSARENDEITFRIAGRDDIWLHARGAAGAHVVLRHESRGQTPPRAVLEAAAALAAASVRNRPDVVPVDYTKVRYVRKFRGAGPGEVVYTGEKTLFVRLCSARRGGARPGEAK\n>UniRef90_UPI001FF9ECF4 transglycosylase SLT domain-containing protein n=1 Tax=Bradyrhizobium sp. 1 TaxID=241591 RepID=UPI001FF9ECF4\nMPRDRAHFRFGATWRNVAAAALLLASSCAHAGDGEQYTAGAPDLGAAETATSRAEIRRIVDSETGKANLPADLADAVIFVESGYNSSVVGSVGEVGLMQVRPETAAMLGFRGTAEELAKPDANIHYGVLYLARAWRLSGGDLCRTLMKYRAGHGEETMTPRSQVYCNRARNHLLAMNSPVATGATAAPAPAPVPSTVVATTTTSIARSPKALSRPKEVYARFRQGTAAASRAYWAAHEARISLIKARIETRWKRVASR\n>UniRef90_A0A0K2UCG6 Uncharacterized protein n=1 Tax=Lepeophtheirus salmonis TaxID=72036 RepID=A0A0K2UCG6_LEPSM\nMWPTVHSLIQTLVLLLPDLQP\n>UniRef90_UPI001E440651 type IV secretion protein Rhs n=1 Tax=Chryseobacterium gleum TaxID=250 
RepID=UPI001E440651\nMAEFSVKTLPNDKIMKLYDKKIQLFSSFILSLCSVLGFSQTILYQAESTSRTVQDPQTVVLAPGFRASSTSSNPFVAKIGPATENPGGGPTDSNAGSNNPSGTTAPDGKSFHDTKGNIEVNGAGQLQFTLPIALPPGVKSVAPQVNLVYTSGSSNGIAGYSWNLSGVTTISRVGKNIEKDGEVKGIQLDYSDYYSFNGQRLILKSGEYGKDGAEYITENYSNIKIKSFGSIPGQVWKGPEYWEVTFEDGSQSWYGTIASGNSTARTPLEYNIVKWKDAQGNYITYNYTQNNSNNVAVISSITWGGNETLNKPHFNTIEFTYLPRKIVEISYLKGILFKQDKILDQIKVKANGSPFKSYSIQYSETQNIVNNDSNNKINYDFVEKIVEINSEGKEANPITLSTNPLLTGSNEFDFGDYDNIITTGDYNGDGLIDFIVRQPAQNSRPEGYYLYFNALNNSNPSFVYLGATSVFWPSSSLTTVNIKSADNFIKPRQGLVITKSNVGYNPPSTGNIELAYYSIKSDASVINTYNNPLVFEYSKTIQSNNYLFDSSLYPPETDPEYLGGLNQSGLSVLKEVDIDSDGISELVLPIEDKKCKYVVIVPDPPKGRWQCKTLGYRYIAVDNDNIQNNTISIIPGTTSKNILSKGGIMDFDNDGKQDIMFLEPTDSKVNVTFYTQVINSGSNNSSPVSLTTEAPLNNLKQYELKKVGNNYTINLKNTISVKGLADGLQFGDLNGDRNIEVLLPVGHPYINRLQGWSIYLNTGNGLQEDIQGLMPYFPYTSSNTDNYSYTIPKLMDLDNDGKSEIINSNVSFGPDVIPSNGSYHSSWYIDSYGEASYDPNNSQFKWSFAKKRIFSSVRNEVVVSPIFGDFRVNNSSSKILFLIKGINGNNERKIISYKHYSLNPDKNISLISQGSQNYYIDYKELDPSFNSNIYAPVKKEQYPFVEMDRLSQTFGVSQLRQTDGQTVRKQDFRYRGYIVNLHGNGVTGFRQAARSSWYADGFENTKIWSGTEMDPLNEGVPVKEWSIRTNNENQIFPADISENNTQLLSFKSTNYQIDKLLNGQVVSTVADSDKPKVVTVVAPKISRVKDFLTGTITESTITYGNYYLPSQSVSNVNNGYAITTSTSEYIHNPSGIGSDYYIGRPKSKINVVQAYGDTKSSKEEYIYENSFVKTLKTWNRDNTGYLQETYNYDGFGNVTGKVISNSIDSQTQTTTSSYDPKGRFVVKKTDNLGLETNITYNDWGQILTQTDPLGNVLTNTYDGWGKILTSKTNLAGTITYQYEKDNNSNIIVTQNDPDGNISKKFTNKLGQEYKTSTKAFGQGQYITKTILYDALGRKTSESEFTFSPDGLGGPWNLVAYDDTVFPTKVTATSFNGKQMETSMSGLTTTVKELNGYQRTTSKTTDVLGNIIYSTDKGGTIQFTYNAAGEQIKAQYGENIITTKYDSWGRKSEFNDPSNGIYKYEYDGFGQAKKITSPKGTKEYTYNNLGQLISQKEISTADGGQATNKLISYSYDNKGRLISKSGTSKGQAYSSNISYDLQGRLLSSSESSNGKYFIQKGITYDDKARVISCEKQLYSSGTLTKVQIENVYSIWNGELYQVKDKATGKILWELKETNAKGQVLKSKLGAADINNVYDANGLLANVNHSSQAKPGILQLSYSFDTIKNELKSRITGGDFNITESFDYDDNNRLVNWTNPVTGIKPTTSRNVYDVKGRIILNDQVGTVKFENSTKIYQPTGMTLNAAGEHNYNNDLIQSIIYNENNDPVFIDGMKGDAAFQYGLTSMRQRVTYGGNFSTDGEGKFTKFYSEDGSFEVVKDNTTGKEKHILYIGGTPYESNIVYLKNFSESSGSYKFLHKDYIGSILAISDEAGNKLEQRHFDAWGNFTHLQIGNGSIITDQNTILTLSKDLAIDRGYTSHEHFVEVGIIHMNGRLYDPLLRRFLNADENIQDIFNTQNYNKYGYVLNNPLMFNDPSGEFIW
FLGAAWAAAHVFLAGVITAAVIGTAVGLAAYSLGVAISGSKWQLGGALKSMFWGGVSGAVTFGIGSAFTPVAGTVLTLTDKVASAMAQGLVHGFAQGVLSMMQGANFAHGFASGASGSWGASLFGAFAGSFANSAAGTVVSGALLGGVASELTGGNFWEGAVIGGVVAGLNHYLHKIETTNKIRKRIDKYYNDKSVADASVKKGFLQDLTKIFPEIYELTAKNFAIANEENLKQFNESTGADYVLIDKTIVSDGGNGENINGITSMKDGSVLISPHRTRTALGFAATWYHEGIHSLHLVTGMFKAWEIKYGAKEALRITEFYAHSMTDAMSGLSMTSSLAFSRYYPSLYIQSLSSFLRP\n>UniRef90_A0A1A9ZG83 RNA_pol_A_bac domain-containing protein n=1 Tax=Glossina pallidipes TaxID=7398 RepID=A0A1A9ZG83_GLOPL\nMTCIPEPRIARIFTQEKDTKSSPHESQRKRHENSNTFDNVCAIDMYGHQISSNNIRIKIYSGQIKWWPKGKQAQIYIESDVGPIDDDILITQMRPGHELDIRLAAVKGIGKDHAKFSPVATAFYRLLPEMKLKKDVVDVELRWKFQTK\n>UniRef90_A0A0B6Z514 Protein CASP (Fragment) n=1 Tax=Arion vulgaris TaxID=1028688 RepID=A0A0B6Z514_9EUPU\nPFKMAANVQLMCQYWKNFDLQELQRELDTTATELANRQDESEGSRKRLVEQSREFKKNTPEDIRKVVAPLLKSFQLEVDSLSKRSKATEAAFLSVYKKLIDLPDPVPTLEHAQNLQKKAHKVQDLEIENKQLRETLEEYNHEFAEVKNQEVTIKQLKEKLKEHEERVEATAQNRAKEKERELQRTFAEKERQLQETQLIVARKLGEAEHQIATLHRALETAQSELFEVKAKYDEATSAKSDEMEIVMADLERANERATSAERQVERLKQQLTLAAESLNHQDEEDITQQNLASDQAMDILKRSTLEVELAAKEKEIAQLVEDVQRLQASLNKLRETTSAQVTKLEEELTAKNHAFRILEDRLRTQEDYEEVKRELRVLKSIEFANVSSEESHNEESKSLEMRLLEKNKSLQTENTHLKVVNSGLTDQVRKLQEEYKEAAATVQEQKSLITQLEEDLRNINAFSSMFRGDAEGEPGPPDANSEAMASIVKEVTQLTSGKFSKSAADSLLPIIQSQRERYRLRAQELEAQTLSQQQQVTLLQNEMDKLRSDNVKLYEKIRFLQSYPNKDGTREGAATDDVTSSYSSQYEDRLDPFTYFSRAERQRRYHELKPYDKITLSMGRLIMGNRTARVFAFFYTVILHVLVFLVLYKLAHTESCKRDMAADWHQRYSEHMMKVHGEEGQHVD\n>UniRef90_A0A1V5QNZ9 Transcriptional repressor NrdR n=1 Tax=Betaproteobacteria bacterium ADurb.Bin341 TaxID=1852821 RepID=A0A1V5QNZ9_9PROT\nMKCPFCGAEDTAVVDTRINDEGDIVRRRRSCKVCDKRFTTYERAEIRLPQVVKKNGSRTEFNRDKLRASLDLALRKRPVTTEAVDAAITDIEEKLLAMGEREVTSQQVGELVMRELKRLDKVAYIRFASVYRNFEDVSAFSRAIKEVK\n>UniRef90_A0A1S8RD89 Acetate CoA-transferase YdiF n=24 Tax=Clostridiaceae TaxID=31979 
RepID=A0A1S8RD89_CLOBE\nMVKIINSKEAADLVKDNNVLATSGFALLGVPESLIKRLEERFLEENSPKNLTLMFAAASGDRGSKGLNHLAHEGLTGRVIGGHFGLAPKIGALIRDNKTYAYNLPQGVMCHMFRDKASNRTGTITKVGLNTFVDPRVEGGKANSITKDDIVQVIDILGEENLIYKCPKIDIAFIRGTYADEKGNITMDHEATYSEAACIAQAVKNCGGTVVVQVEKIVKFGTLDPRAVKIPRIYVDYIVEAEDKEDQAQILGYNYDPSLTGEANMVVDGLAPLKLDERKIIGRRAAMELVKGQVVNIGIGMPEAISNVANEEGICDYFTLTVEPGAIGGIPQGGNKFGASINPECMYDQPTQFDFYDGGGLDIAFLGLAEVDKQGNINVSKFGPKVPGCGGFINITQSSKKVVFCGTFTAKGLDIKIEDGKLKIINDGSNKKFVDSVQQITFSGNRATKLKQPVMYITERAVFELKEDGLHLTEIAPGVNLEKDILAAMDFAPIVDKDLKLMDARIFEDKVMGLN\n>UniRef90_A0A7S4VIJ8 Gp_dh_C domain-containing protein n=1 Tax=Alexandrium monilatum TaxID=311494 RepID=A0A7S4VIJ8_9DINO\nTACGAFQEDTELVQISTKVLPLLAEEDPTDVQSLQDCAGALPAGDVPPGVTTALLGASVVPWKEPSAGPPAVGHMVDCSAIDAPRSPLSGSPIAVSSLLALIRAVSACDRTMKLTLEGMAS\n>UniRef90_A0A7R8ANC3 Zn(2)-C6 fungal-type domain-containing protein n=1 Tax=Aspergillus puulaauensis TaxID=1220207 RepID=A0A7R8ANC3_9EURO\nMSTRKSQSSRKRPLRLPTIAPKDDMTPLRSHDGTPAAIRATVIQPRLRFPPRSRTGCWTCRSRKIKCDEVHPQCNQCARLGHICDYQPRLCFRDDTRRVMERMPDVKTEGNSVWDPTKMSLWRERLGTSDSIPCDLLPDFSKLISDEDREKKAQGSVPGTYHVVAVPESFARLPEYTEDAFETVPGDPYWSPPSESSSHDLMDEVTTSEDPNVVILSQFRDSRKQPYSNRPSHTQSPESELRPTSVSVETIYTSLQNIPEDEISESIDLEAYDMTLLDHFENIVWMQLIPGDYGYLEANIFEQEASNFPPLLHVMMALSALSLVQQGNNHYMDVLQYYDQALPSLQSSLQNCDDVLSDGLFLTHFLLLIYQIAYTTPNNGLNLWSHHLSRLLQLSLLRQSVTEQERYPLIIWLTCHVDLYALLSGASEGAYVRAAIESHLLPETEFLLYPVGLQNSSVMHPDEYDPRSLIMRLYRECFILSARFGLFTAEVKGSKMAYTEPIFRELENMRAAFKHLWNSDEVQFFIESQSNMPKPSQHSFYQLSILFHTSLLFTCTSFGRIESELEKEIQHHTNAILHLAEKMIAQGRHNGPLFLTFPLFLSGAVTSSHTAKMTALKLLAQLGETELGYKAATTSSMLRIVCETQLQHWRSGGSVREIDWSEVAANHGFRLVNYG\n>UniRef90_A0A2E4T8P5 AarF/ABC1/UbiB kinase family protein n=4 Tax=unclassified Alcanivorax TaxID=2638842 
RepID=A0A2E4T8P5_9GAMM\nMSKDTIVNEMRANLAREREGLALVRNTARGAFRVFETVGVVGRQGLGWLLGDREALPRHLRRTFESLGATYIKLGQFIASSPSLFPEEYVSEFQKCLDRTPPLPFHYIRETVEAELGAPLDTLYEWVDPKPLASASIAQVHAARLKNGADVVIKVQRPGVRQVLLTDFNFLYASARLVESLAPGLSRSALSGVIEELQAGMLEECDFLQEARNLDAFNRFLAETGNVAAVAPRPVASHTTKRVLTMERFHGVPLTDLQVLRRYTDDPAGTLITALNTWFSSLMVCDFFHADVHAGNLMLLEDGRVGFIDFGMVGRIRPEAWQGMMAFFEAIGSGDVPAMARAMAMVGMTSEEVDVDALARDISALQDRLTDVDASALVQADRNDREVNQLLTDLVRIGEGHGIRFPREFALLLKQFLYFDRYVQALAPELDMFSDQRVDLFGTLDQLPGDEPLH\n>UniRef90_UPI00156E65B2 VOC family protein n=1 Tax=Flavobacterium sp. 7E TaxID=2735898 RepID=UPI00156E65B2\nMSKNITGIHHVTAIAGGAQKNLEFYAGILGLRLVKKTINFDAPEVYHLYYGDEQGNPGSVLTFFPYQGLKMGRHGKGMLNTTTFSVPLDSIAFWTERLSRFGIAFKPPQERFQNEIVIYFEDYDGMGLELVFNDTDSRVGYYNGAINESNAIRGFHNVEIWQEGYELTAGVLTQQLNHTLIAEKGNRFRFAAQESSGNYVDILCAPDSLKGLAGSGMVHHLAFKTPNKTSQEAIRTIIVDRGLNPTPILDRKYFTSIYFKEPGGVLFEIATEAPGFAIDEDAEHLGEELQLPEWFESRRAELNSKLPNISIDHNKFL\n>UniRef90_A0A6B3SK05 ABC transporter ATP-binding protein/permease n=1 Tax=Noviherbaspirillum galbum TaxID=2709383 RepID=A0A6B3SK05_9BURK\nMRRYSASSPEPAANQGTRNDWVTLKTLFPYLWAYKWRMLLALIFLIGAKLANVGVPLVLKKLVDNMSIEPNHPQALLVLPVGLLVAYGALRVSTTMFTELREFVFAKVTQRAVRTIALQVFRHLHALSLRFHLNRQTGGMTRDIERGTRGISSLVSYTLYSILPTLVEIALVTGYLVLHYDIWFAVITFIALGVYIGFTVAVTEWRTNFRRTMNELDSKANTRAIDSLINYETVKYFSNEDFEARRYDQSLENWETAAVKSQTSLSLLNTGQSLIIAIAVTLILWRATQGVIAGTMTLGDLVLVNAFMIQLYVPLNFLGVIYREIKQSMADMERLFQLLEQHREVADAPDAKPLAVRGAEVRFSHVNFSYESKRQILFDVDFSIPAGTTTAVVGHSGSGKSTLSRLLYRFYDIQSGSITIDGQDLRDVTQASLRAAIGIVPQDTVLFNDTIEYNIGYGKPEASKDDIVAAARAAHIHDFIVSLPDGYATMVGERGLKLSGGEKQRVAIARTLLKNPSILIFDEATSALDSKSEQAIQAQLKEVAQDRTTLVIAHRLSTIADAGQILVLDHGRIIERGTHGQLLAADGAYAQMWARQQAHRDEQTASPAAPDLDASAA\n>UniRef90_A0A2N3HH73 Sialate O-acetylesterase n=2 Tax=Confluentibacter flavum TaxID=1909700 
RepID=A0A2N3HH73_9FLAO\nMTVKCFLFISCISMNTAVYAEIKLPAIFGSNMVLQRNSEVSVWGTAKTKSKVTVSTSWNNRSYETTSDKEGNWKIKVSTPEAGGPYIIKMSDGQELVLDNVLIGEVWLCSGQSNMERTLRGAGNDPILGANEAILKSNNPSIRFFTVERAKSEEPEDNFKGDWKVCNRSTAPDFSATGYFFGNLLQEILDVPVGLISSNWGGTQIQRWLDEGTIKTFAPEHWESSPSTLFNAMINPMLNFNIKGVIWYQGESNRENPEIYDEMMVKLVQNWREKWGIGNFPFYYCQIAPYEYDNKVNSAFLREAQLKASKEIPNSGMVSLLDVGEERNIHPANKRAAGERLAYFALKETYGIEGISARSPEYLDMKIEGSTVELNFSENLTSFGKELKLFEVAGKNQIFYPAKARIKGKGIILVSEEVAEPVAARYGFKNFVDGDLYNIHGIPASSFRTDKW\n>UniRef90_A0A672QUX7 Galactose-3-O-sulfotransferase 2 n=3 Tax=Sinocyclocheilus grahami TaxID=75366 RepID=A0A672QUX7_SINGR\nMLPPQRIAGRERRAFRWRTAIPWTTCVRVACCSRLRFMWFALVVLTVLCGALQMLGVVRQARSSKVLKLVSEQLVRMPAEMYRPVKHKDWENLWSVSAAIVEEPLDLQPFIQRKDESENPHSEEGRDQVLEDTRKKLSSSTKAAPPIEAIKLWLDQYFPNQPQRPAFPKRTPEIHKPPPSDDKTDKQTVKSLVDDTAMCHPKNHIVFLKTHKTASSTILNILYRYGESHNLTFALPLNMQSQLFYPAFFAAHFVEGVRTRSVEEFHILCNHMRFSSQEVRKVMPKDTFYFSILRNPVSMMESLFVYYKAIPAFRTVKSLEEFLIQAPENDTELDKRSAEVIAAVERDFPLILISEYFDESLVLLKHALCWSLDDVSSFRLNSRSERSRRPLSAEIAEWVKEWNSLDWRLYQHFNATFWKRIDSTLGRAKLQQEVELLSAKRRKLEKMCLQEGGAVDPAQVQDSSLKPFQYGAAVIQGYNLRLGLSNATRQLCHRLITPELQYTSALYTKQFPHLADVRAVAANKFAASRSTAMHRAVKHYFDLTYQYK\n>UniRef90_A0A8E0G9R0 MaoC_dehydrat_N domain-containing protein n=6 Tax=Burkholderia TaxID=32008 RepID=A0A8E0G9R0_BURTH\nMRATPAERRDDALRIVTDLVSPAPAAALAATLDRDAHPRAGDPLPPLWHWLYFWTAARQSSLGGDGHPRTGGFLPDPGLPRRMAAGGRVRFIAPLAIGSSATRTSRVASLERKAGRSGRLAFVTVEHRIESSGALAIHEEQDIVYREPAEPGAPSPPRQAAPDGAHWQREIAPAETLLFRYSALTFNGHRIHYDRAYAQHAEGYPDLVVHGPLIATLLLDLVSRSMPDAVVTDYAYKAVRPAFVGRALTLCGRLAPDGRSAELWAKDHEGSLTMSARASLVR\n>UniRef90_A0A3P6UJT8 Mediator of RNA polymerase II transcription subunit 13 (Fragment) n=2 Tax=Gongylonema pulchrum TaxID=637853 RepID=A0A3P6UJT8_9BILA\nMCLSLIRDTGEQENIGWEDVLTARQYMEYIDLSGYATQFKYQKVISSLHSIASALASCCGLGAFQSNTVMIEYPSQAALSGLPDSLLYHYHMHRVCVQHSNLVVVKGTFPLKMQ\n>UniRef90_A0A8J6DP79 Uncharacterized protein n=1 Tax=Galemys pyrenaicus TaxID=202257 
RepID=A0A8J6DP79_GALPY\nMDGVMRMPGPTDRTERTNRTDSTDEHQRAAAVESSREVEMHMPASQPLAPMPAMYLTTSTNKSMKSHGGLQDSSSLTRLPRTILTLAPVPPFLPLQMIMENRM\n>UniRef90_V5RHL7 Single-stranded DNA-binding protein n=1 Tax=Spiroplasma apis B31 TaxID=1276258 RepID=V5RHL7_SPIAP\nMNNVNIIGQIEGTPQLVFNSKNGEKKLFKFILRVPRNYKNKDGIITDDFINVKVWSNVLGDEYEYYDQSFVGIEGRIISFGSTDSVTYGNEIVANKIIHIA\n>UniRef90_A0A074WYW5 Ubiquitin carboxyl-terminal hydrolase n=29 Tax=Aureobasidium TaxID=5579 RepID=A0A074WYW5_9PEZI\nMSGGWNTIESDAGVFTYLLENLGVKNVQFEELISLDAQSLGQLSPLGVIFLFKYNNDGRKSDGPLDGQFDFEATYNLDDAGSGGDGKGKVWFAAQTIQNACGTQALLSVLMNKDNADGVELGPHLTDFKDFTAAFPPDIRGEALSNSDLIRDTHNSFARSSPFVSDETRMATQDDDLFHFIAYTSINGKLYELDGLQEAPINHGPCAPTDFAEKVIPVLQRRIERYPSNEIRFNLLAMCQDLRVKAREFGDEDMVYREEEKRRAWQWENALRRHNFVGFVGELMKGVTAAKIADGSYDAWIEDSKQKTKKKLEEGKKKGYNPDEMEM\n>UniRef90_A0A413WZM4 Secreted protein n=1 Tax=Bacteroides uniformis TaxID=820 RepID=A0A413WZM4_BACUN\nMFYGINFLWPASGCFLYLVSKARSAGCARNDNSVSFHHAMFAHQCWNSEKYGIKFLEEMLLSNKREYKLLSFI\n>UniRef90_A0A8S3J9F7 Glycylpeptide N-tetradecanoyltransferase n=1 Tax=Rotaria magnacalcarata TaxID=392030 RepID=A0A8S3J9F7_9BILA\nMNTYIFNDDIFLATADQILEELADESVVDLRSHWPILPLLQINLYHVPPQPKKVQEWTIVEVDNDDILTPYPYPSDPMIAERFYEEYSSGNKQKSMENEPGKSKTEEKVFKKNNNATEEAMDPSMTLDATMIENNPEIRKMFLDAAVKQESSLVLKYKYGSFFFKNNNNNTVNLLECLM\n>UniRef90_UPI00197D08DB FMN-dependent L-lactate dehydrogenase LldD n=1 Tax=Novosphingobium sp. GeG2 TaxID=2726189 RepID=UPI00197D08DB\nMIPLSVFDYRSAAKRRLPKFLFEYIDGGSYAETTLRRNMADLQEISLNQRVLRDVSSIDLTTDLFGQTIDLPLVLAPVGLAGMNARRGEVQAVRAAQEKNIPFTLSTVSACSLPEVARATTRPFWFQLYMLRDRGFMREMLETAQEARCKTLVFTVDMPVPGTRYRDYRSGLAGAPGIVGRARRLFQAAMKPQWAWDVGLRGRPHTLGNVAPLLGRNTGLEDFFAWMRTNFDPSASWSDLEWVRERWPGTLVVKGILDVDDAKEAIHAGADGVIVSNHGGRQLDGVVSSAQALPAIAEALSGQATIMVDGGIRSGLDVVRMIALGADAVMIGRAWAYALAARGELGVSNLIDTIRSEMLVAMALTGETNVHNLCTNNIIR\n>UniRef90_A0A358QV57 Na/Pi cotransporter family protein n=1 Tax=Desulfotomaculum sp. 
TaxID=41211 RepID=A0A358QV57_9FIRM\nMWHVVILGLIGGMGLLLYGMQILSEGLQKIAGAKLRTLMSTLTQNRLSALAVGATITVLFQSSTATTVILVGLTSAGIMSLKQTLGVILGADIGTTVTAQLIALKVTEIALPIVGLGATIIFFTKRERYRRYGQVLMGFGLLFLGLKIMSDVMYPLRENPMFPEMMAKMSDNPLLAMLIAAVFTFLIHSSAASIGIIMVLSMQHLVSLHAAIYLLFGANIGTSFTAILSSLGSSRESQRVATAHLLFKVAGVIVFLPFVGPFIALMEKITDSPGYQVANAHTFFNIALAIAFTPFVSQFANLLMKIVPEKRKIGEVFGPRYLDIKLINTPAIALGLATKEINRTFDYVYEMTRDTLLMLEKNDASIISTVAKKEDRVDILFKEISQYLTNVLRQPHSRGEFVKCMGLINIVNDLEHIGDIIEKNVTYLAQCKIDGHCTFSEEGWDDISIMHKKVCDLMQMTSTAFVTSNHDLADRAYKLQPEITKMERHLRVLHIHRLRISGSTEEEGALYLDLINALLRISEHVRNIAWEVANEGLEFTASGERVATDER\n>UniRef90_A7HUX0 Short-chain dehydrogenase/reductase SDR n=1 Tax=Parvibaculum lavamentivorans (strain DS-1 / DSM 13023 / NCIMB 13966) TaxID=402881 RepID=A7HUX0_PARL1\nMASGNTLSGKVAIVTGGASGIGRAIAHAFANEGAKVVIADVEEETGEKTAAEIVEGGGEAIFRYCDVGERLDVRNLVCAAGDAFEKVDILVNNAGVVSKGSDFLTLEEEEFDRVIRINLKGHFLVGQAVAQRMVAQIEEGHAPGTIINMSSINAVVAIPAQAAYSASKGGIKQLTEAMALSLAPYGIRVNAIGPGTIQTAMAGNVNENPGANKMLLSRTPLGRVGQPEEIASIAVFLASDGASYMTGQTVYADGGRLSLNYTALPMAKKKGEEKKE\n>UniRef90_A0A3L7A326 GNAT family N-acetyltransferase n=1 Tax=Mycetocola tolaasinivorans TaxID=76635 RepID=A0A3L7A326_9MICO\nMTTESMLPLNQRVTAPTQLPVPTGTEGVTWRPATAADLPAILTLDRAVEAVDDPRHVTTIEALTVDFAASGFDPAADSLLAETTDGTVIAYGTAHAEPEARSVVKVHVPGAVHPEYRGRGLGTALLDWQEARAAQHLAASDLAVPGWISTGAAEHAESPRGFLTTRGYVERRWWMELTRDLSDAIPELPLHADVRLEPLTEELSEATRQAFNDSFRDHWGSQPTNEEDWKKYGSVSTLRGDLSALAVTSDNEVAALVIVSVDPAQWEAAGYRFGYIDLVATRRDWRGKGLAKSLLAQVLRNLKAEGLERAALDVDSESPTGALRLYESVGFAPEARSVSLVREF\n>UniRef90_A0A0A8VBS4 Transposase n=1 Tax=Yersinia ruckeri TaxID=29486 
RepID=A0A0A8VBS4_YERRU\nMTALIRRHLRPLYLSLDLTSVVQDSPWAEALSWLRMVFSKKQTLLQRPLAECPPETLPERLRPYLLEFGEDGEPTGLNAGRYEFWLYRQIRKRFKSGEFHLNNSLRHRHLSDELVPEGEQAAVLAAMNIPFLQKPVKTQLKALESELHRQWKAFNRELKQGKLKHLEYDQQTQKLTWHKSVVSRHKAQEKSFYEQLPFCDVTDVFRFVNEHCRFLPAMKPLQPRYAKNEVDADSLMAVIVAQAMNHGNHVMARTSDIPFHVLETTYEQYLRLASLLTANDCITDAIEALPIFPLYSFDPGTLYGAVDGQKFGVERPTVKARHSRKYFGRGKGMVAYTLLCNHIPINGYLIGTNDYEGHHVFDICYRNTSEVKPTAITGDMHSINKANFAILHWFGLRFEPHFTDLNRQLQELYCTRDPSAYKKCLIQPAGQIDLNLIIREKSNLDRIVATLGLKEMTQGTLIRKLCTYTTTNPTRQAVFAYDLLVRSIYTLKYLRDPQLERNIRRSQNRVESYHQLRAAVAKVGGKKELTGKNDIETEISNQCGRLICNAIVYYNSAILSRLLERLETEDNTKGIEALPRISPVAWQHILLNGHYIFQSNNEIIDLDALVAGLKLR\n>UniRef90_K7W9Y4 Glycosyl transferase group 1 n=17 Tax=Nostocales TaxID=1161 RepID=K7W9Y4_9NOST\nMAGKDIKLSSASASILTLGTGWFPNNPGGLERYIYELIHKLAASQDQVELCGVGLPLDAKNTQIKLTNLACPDSKISSRLWSIRDNFQKTRLGKPDAINLHFALYSFPILDILPKGVPVTFNFHGPWASESQEEVVNKKLSVWLKEKIIEQSTYNRCDRFIVLSKAFGQILHQKYQVPWQKIHIIPGGVDINHFQNNLSRQEARIKLGWPTNRPILFTSRRLVHRMGIDKLLQAIAMIKVGIPDIWLAIAGRGHIQALLQQQARELGLENNVQFLGFVPENDLPVAYQAADLTVMPSQSFEGFGLAILESLACGTPVLCTPVGGMPEILQKFSPDLITEAITVESIADKLAQVMLGKLPLPSREECRNYTIKNYDWTNIAQQVRQVLLA\n>UniRef90_S4SV14 Cytochrome c oxidase subunit 3 n=3 Tax=Scarabaeoidea TaxID=75546 RepID=S4SV14_9SCAR\nMSAKNHPYHLVDASPWPILGALSAMISMVGIIKWFHMFNSTLLLLGLSITSLIMYQWWRDISREGTFQGLHTYPVTMGLRWGMILFITSEVFFFISFFWAFFHSSLAPSIELGMNWPPKGVIPFNPIEIPLLNTLILLTSGLTVTWAHHSLMENNFTQATQSLILTVTLGVYFSVLQAYEYMEAPFTIADAAYGSTFFMATGFHGIHVIIGTTFLFTCLMRHLNNHFSSIHHFGFEAAAWYWHFVDVVWLFLYISVYWWGS\n>UniRef90_A0A6G1DB44 Epidermal patterning factor-like protein n=1 Tax=Oryza meyeriana var. 
granulata TaxID=110450 RepID=A0A6G1DB44_9ORYZ\nMGHLLLLLLALLLLASSVHAKSAAFTEEKGVAGITVVIGSRPPSCEGRCRSCGHCEAVQVPISPQELQKKSGQVDSKKKKKLGHGDRAAAAAGGRTMPDSYDDHSNYKPLSWRCKCGGLILNP\n>UniRef90_B5HBE5 CsbD family protein n=4 Tax=Streptomyces TaxID=1883 RepID=B5HBE5_STRE2\nMGISDQFKDKAQELADQAKQKAGKGDQSERARRAREEVSERTQQGREQQGARSRESMQERGENAMRERRDRVEDYDA\n>UniRef90_UPI001D7ADF37 heterokaryon incompatibility protein-domain-containing protein n=1 Tax=Truncatella angustata TaxID=152316 RepID=UPI001D7ADF37\nMDDDLERQHQEFINRPLRDELPCDRCANLKLSTELFNESFDIGEIELTNILVDHFIFREVNSEYCSSCVDLMRRIDRQEITIRPRRILGFNSESEGDDLLVRSTFQINPDLRPLLCRVDNDSKTFDWGSESKSFGTYTTSDIVGPDHIRHVGDTPNYDAIKVWLGHCLRSHKQCNYSGDLKSALEMIFLIDIEKRQVVTYPKNGEHAPEYFALSYVWGGYKGVSYKPHSTLPYPLPQTIEDAIFVTKRLKLGYLWVDAVCIDQDDDVQKKEQISLMASIYRGAVATIIPLSSNTSDDGFPRVHSGSRRSNQLSLDFGHGKCLQQKLPRLADAIHEAKWNTRCWTFQEKLLSHRRIYFTDHQVHLSCAELVCCEAWHDETHYHNNPEEEDYLIMNPPNREDDLFTQNDHDCDIVSDFENIVNQYLERELEKPEDILHAFSGILEELKQHKFPDGFHQGLPKEDFQHSLLWRAGKVYGVMVDKISGKKYGGLSQATKREFLPQLPSWSWISWRPISGIKFYRLPDQTREPEIYSLKPWVHISDTKQVQLYEGSVAFRRKWEKLVLAHHGWSQNFTSPYITINQDLKQDRAIPAHRSNLHEHARLCVEGIVLQLPFQFMRRNTRVRTTSSYTTRYTRDLELTICDHIISKRLDVEWHFDRRFDRTKKYEEALKSSPLLLLDAYLQTDGGILIPGDFVLNLELLVLSWNGLLARREGTVTVRLKLDRKLKNLKSLVLGHHSITSRDGIDWPSDRVGQVDDTKSDGFASLRIDTERMN\n>UniRef90_A0A6A7C4R0 Thioredoxin-like protein (Fragment) n=1 Tax=Piedraia hortae CBS 480.64 TaxID=1314780 RepID=A0A6A7C4R0_9PEZI\nLTLTTTEARCVVHFAKEEFARCRTMDTALEQLAKRHVETRFVRLEATEAPWVVERLKVRVLPCVMGFVGGKSVARITGFEGLGGGREEQSGFSLGKLERKLVEYGVLER\n>UniRef90_UPI001FE2688D hypothetical protein n=1 Tax=Winogradskyella ursingii TaxID=2686079 RepID=UPI001FE2688D\nMRQKLRHSSAVFFTILFVALLSAPTIITSFDDSIDISFFYSLSEEEENEKNFKLVFETDSDSEIFFDAKKRKGKGIYKFKKYPKPHLNLVSPPPEFIS\n>UniRef90_M5C988 Delta14-sterol reductase n=1 Tax=Thanatephorus cucumeris (strain AG1-IB / isolate 7/3/14) TaxID=1108050 
RepID=M5C988_THACB\nMPLGTELRTGGRIKYKINAFSTMLLALGLTLGWIINFGPESFTFIYDHWVGLCTASLINSFIQATWCYYISTKNEETRTLAVGGNSGNVLYDWFIGRELNPTIGSFDIKSFNELRPGLILWLLCNISSACEQLTRRGTLIPTDSMGLVLLFQGLYVADALYNEPAIFTTMDITTDGFGFMLAVGDLAWVPFTYSLQARYLAFNHVELGPFWTCIIFVIHAVGYWIFRGANNEKNDFRNGKNPKNLTSLQTERGTRLLTSGWWGMCQHPNYLGDWIMSVSYSLPTGFNTPITYFYCIYFLILLLHRQTRDDDHCRKKYGKDWDTYTSIVPWRMFPYIY\n>UniRef90_UPI001CF80729 YggS family pyridoxal phosphate-dependent enzyme n=2 Tax=Dechloromonas denitrificans TaxID=281362 RepID=UPI001CF80729\nMRKGSDDGETRPVSSSGTPPRQDELGRYPRPSSLEDFRRNLAAVRARIDAACRRVGRDPASVRLLPVSKTVDEGQIRLSYAAGCRLLGENKVQEAHRKWQAMADLIDLRWSVIGHLQTNKAKWVARFAAEFQALDSLRVAEALERRLQIEGRSLDVFVQVNTSGEASKYGLPPADVQAFLQALPGFPALRVRGLMTLALLSGEAERVRQCFIRLRTLRDQLRQSAPVGTCLDELSMGMSGDFEIAIEEGATVVRVGQAIYGARALPNSHFWPSETNTRESP\n>UniRef90_UPI001010A2DF DUF58 domain-containing protein n=1 Tax=Cellulomonas endophytica TaxID=2494735 RepID=UPI001010A2DF\nMVLTGRAVLLAAAGVVALALVPSAGTVLVWAVLVALVCVVDALLAASPRRVAVHREVPASVRLSQSATCTLTVTNVGPRRLRGLVRDAWQPSAGAVVDRHRVDLPPGEGRRLRTVLVPTRRGDRRADLVTVRTVGPLGVAGRQASVPVPARLRVLPEFASRRHLPSRLARLRELDGRSAVQVRGAGTEFDSLREYVVGDDVRSIDWRATARRNDVVVRTWRPERDRRVLLVLDTSRTSAARVGDAPRLDAALEAALLLAALASRAGDRVELLAYDRRVRARVVGASGPRLMPALADALAGVEPTLVEADWPGAAAQVRERLSRRALVVLLTALEPAAVEAGLLAVVGPLAQRHQVVLASVADPEAEDLRRGRGDAAAVFDAAAAERAGLERAAVALRLRQRGVEVVDALPDDLAPALADRYLALKAAGRL\n>UniRef90_A0A7J2IPL5 (Fe-S)-binding protein n=1 Tax=Candidatus Bathyarchaeota archaeon TaxID=2026714 RepID=A0A7J2IPL5_9ARCH\nMSSKMYELFKKTLEKYLPGKGVTKRITPDQLELKRFEDLEHYKDVLYFCGKCGQCRYVFQEAYWSRVCPSGELKKFEAYYLGGKNLLLWGVLSGKLKWTENLAKILYHCTLCGNCTQQCQIPEIHHYALEWLFAARIESVKRGIAPMPEHRKFGEWTKKEHNPYMELHTDRQKWISSDIRRELPEKADIVYFVGCTSSYREIQVAKAMLDILTSLKLNFTILKDEWCCGSPLFWTGQIDIAKECAKHNIEEIEKSGATIVVTSCAGCYRMIKEIYRNKFGLEYSFEVLHAPEFLLSLVKDGTLPLENEISEKVTYHDPCHIGRHMGLYEPPRELLKNIPGIELIEMTRNRRNAWCCGAGAGVKSAFKDLALFAAHERLKEAQSTEAEILATSCPFCERNLRDAAKAYNVNIKVVDIIELIKYSM\n>UniRef90_A0A2E3V0Q5 Response regulatory domain-containing protein n=7 Tax=Chloroflexi TaxID=200795 
RepID=A0A2E3V0Q5_9CHLR\nMNNLSEKNRNQKILIVDDEHMSDLMRSVLRRLEVDGFNTIVVKPKGNMGTGDEYEIQTLFALEEHHPDAILLDVRFGEYDTDRFKGLSILKKIVERNNKIPVLMFTQYAQGPYRDTAVTATLSVDANVDFIDKLASPEEVVLRLRRLIGSSPEKVMIGDIFEIDSDNSAVYAIVDGKKEIVKDVQGMKLEILKELAAALYRSEGELVPFSKLERFSFGEDSRASLRVRIRELKISLGKSIGREFSANELIINVRNRGYRLIHPE\n>UniRef90_UPI00189E7165 hypothetical protein n=1 Tax=Halomonas sp. KAO TaxID=2783858 RepID=UPI00189E7165\nMASRTSASLSPQAPLSRHLRSSLRLSRWSGQSSPRLPRLIEPAFHLEVEFDAESGELVGMERVRIDAMRRREEAP\n>UniRef90_UPI0006E14DC3 hypothetical protein n=1 Tax=Streptomyces neyagawaensis TaxID=42238 RepID=UPI0006E14DC3\nMTHPTAVPLAVASLEPALLFAAAAVLTVLAVPSGVWLIRRRPTRIGRERPTAPAVWVAALAAIGCTAYSADTSWRFAADYLDMAGTTERAAMFAAAELALFATALMARQNLASQGAPGLPGVLVWIITGVQVIPAYAESGPIGGTVRAFVGPVMAAMLWHQAMGIELRLRKPGASSRGVTATLGREARERLLSRLGIAERDRDAAQITRDRATARAVTLATRLAGRTPKQRGNWRGRRITRRLQGALARADVGTDPEQLGVLLDQLAARRHATALATVDLPSPWTRPLLSPPHGRRDQPSLAPHQVAVGDQVTPQCHAVPKAGPETKMDSPRIRDRPEEGHMGPALGTEPAGDGDRPRPVPETGDRGAAGDLAADAAAGHGAKGDQASAVPGTEDAQDGDETSEGDGDKTAAQGSDIPSRTPFPYNGDHLVPRTETGAGTESTGDRPQTVPARRRPKASRTRTRGGQGKPSRRQPQLSVDQLVTQLRPHVPRLLERDGNAEVTRTQLREIMRAHNIGIRNDRLTPVLERLRREAATSTTKKRSAR\n>UniRef90_UPI0005A97BD1 hypothetical protein n=1 Tax=Streptacidiphilus anmyonensis TaxID=405782 RepID=UPI0005A97BD1\nMSSAVLATRETSAAPRSGLRPRGVTWLTWRQTRAALLVVTLGYAAALAYLLYQHHQFDVTTVRLRGLHCSTDTRDPVSVITANCNLAALAVMQAASGVHRLATVALAAPGLLGAVLAAQPLAVDLERGRHRLLWSQSVSPRRWFTQRMLLPAAILLVLSAVLSVALRWAVLWTHPALPIEDWSFDNASDALAPVYPLLTLAAFALGAVVGLLLHRVIAALGITLALYGVLLYGMAQVRPYLVPLHRKVVGPGDPWPSGDWVYDSGPVVHGKDFSYSACPVATGCDKEPSWILYHPLSQFGPMLWVETGMLAALTAGLVALAYRRLLALTR\n>UniRef90_A0A5B9QW56 Alkaline ceramidase n=1 Tax=Roseimaritima ulvae TaxID=980254 
RepID=A0A5B9QW56_9BACT\nMTHPPKSLKPHPGFKGRIGIAREDITPPVGIYSRNWGAAQHDTADSIHRPLTLTALTISASSTDEPLILIDADLGWWRPLDLFQQFQQRLLEELSLESSRLIFALTHTHAAAPLMKPDPALPSSEPLGPWLERVYQATVSAIRRALADADEAILDWHHGRCALAAVRDFPDPDPAANRILCGFNPAAVADDTLLVGRITDASGTVRATLVNYACHPTTLAWANTTISPDYIGAMRETLEAATGATAFFLQGMSGDVAPKHQYVGDVEVADRHGRQLGFAALATLQDMQPAGRQLYFDEVVESGAPLAAWRHRPHALSSELRAVEIAADLQIKDWPTAEELEQQRLACEDRALEERLRRKRDIRRSLGDGSSSPLAVHAWRIGDAVLVGCGGEAYSQLQQELRSRFPELAVICMNLINGSVGYLPPADLYDVDIYPVWQTPFARGCLEHIRETMTSAIEELVR\n>UniRef90_UPI000D340775 DUF1566 domain-containing protein n=1 Tax=Muricauda amoyensis TaxID=2169401 RepID=UPI000D340775\nMNKTSKLTHLFILTILLIGFGCSNDDDAGSPISLEDLAVSMDENPSNGQTVGMVETVGGTAMNFSIVSQSPAGAMDIDSSSGELTVANASLFDYETNATITATIDAENAENTATITVTLNNVNEVSAQALEVTMDENPTNGDVVGSLQATGTASGFTITSQTPAGALTIDSATGELTVADATLFDYETNPTLTATVTLEDAQNPVTVTVNLDNVFEVTVQDITLSVDENPTDGQVIGIVQTSGATATNFNIVSQTPNGALNIDAATGELSVVDPNLFDFETNPTITATVIVDDAENPATVTINLNDVDEITVQPGNFTIDENPSNGDSIGTLQATAGSSLTYTITFQNPVGAFSIDQNTGELFVADETLFDFEANPNMFATISVDNGTYSVSANVFVALNNLNEIGEFKYGGVIFWIDPADNGHGLVSAITDQSTSATWGCQGTLISGTGTGIGSGDTNTAAIIAGCATPGIAADIASNTTIDGYSDWFLPSRSELNQMYAQKAIIDATAIANGGTAFPPSVFYWSSTEANSNTAWAVFFDNGNNGGFNKGVSTFYQVRVVREFDLGN\n>UniRef90_UPI0013DE5835 hypothetical protein n=2 Tax=Pseudoalteromonas TaxID=53246 RepID=UPI0013DE5835\nMKVTLNKKSIKSLSANPATIIRAQETPQIGGGRVIDESFWVCINTRSNCEGTKRCPFD\n>UniRef90_W9ZDG4 DUF4097 domain-containing protein n=1 Tax=Fusarium oxysporum f. sp. melonis 26406 TaxID=1089452 RepID=W9ZDG4_FUSOX\nMDFSSFDLPFTIAEDHTAQPVSTGSAYDFRETIDGTLARRSLANTPDCLISKLAGLKLDSSSAVFRSRIVAVANEDKGVMVKGDGKPIDLLSGSLSIEQVPDKPSFSISSDKVAIQGYYLPGEDDVIIHGHGHDNNELEIAKYSSATGKMASPRVVGTQFRLDDGVWQVSEPSGMQFHLYVFPKTYFLHLTSKPSKRPRLEDGESTPRP\n>UniRef90_UPI0010938F88 DUF3108 domain-containing protein n=1 Tax=Mesorhizobium sp. 
M4B.F.Ca.ET.172.01.1.1 TaxID=2563950 RepID=UPI0010938F88\nSSRYENGVYSIDGSVSAAGLAKRFDDTRGTISSKGTISSQKMVPQAFRADYTSGKKASLVDIRFGNGNVTSTKVVPAPEKRDPKSWVPLGAGDLKSVLDPMAA\n>UniRef90_A0A095C0S5 Integral membrane protein n=5 Tax=Cryptococcus gattii species complex TaxID=1884637 RepID=A0A095C0S5_CRYGR\nMKENYAVENALGTIGAVLWMVQILPQIIKSHREKTTKGLSASLMFIWALASFFLGAYIVAQKLSIPLQVQPQAFGVLAAVSWCQCLHYERGYSLKSVWAIFIAFCCVFAGFEAGSVYALWAGQRNGVEWPVLMYGYISAVLLAVALLPQYWEIYKYREVIGISLLFMVVDILGGVFSFLSLFFRNDLDIAAFVSYSLVVVLDGIVVILYFILNPIAERRRARQAGRHSDSEAKIEGSSSVGMSTVPTLVGHGLMIDKEVQDGDRRQDNVRVDSEMEQSRVDDRDKMKAGGAEVEVHGPDAQGHETTGSSGEHSEESVKTIK\n>UniRef90_D7WDM9 Glycogen synthase, Corynebacterium family n=7 Tax=Corynebacterium TaxID=1716 RepID=D7WDM9_9CORY\nMMTREYPPEVYGGAGVHVTELTRFMRDIVDVDVHCMGEPREGENIYVHGVDPELTEANGAIKTLSTGLRMAHAADNVDVVHSHTWYTGLGGHLAGLLHGVPHVVTAHSLEPDRPWKREQLGGGYDISSWSEKNAMENADAVIGVSTGMKKAILEAYPNIDEDKVHVVLNGIDTEDWHRVAPSDAESNGVIERLGVDTSKPVVAFVGRITRQKGVPHLVKAAQDFDEDIQIILCAGAPDTPEIADETQALVDKLREGRGGVYWVTDMLPKEEIREIYSAADIFVCPSVYEPLGIVNLEAMACETAVVASDVGGIPEVVVDGETGTLVHYDKDDTETFEKDLAEAVNTLAADADLTKRYAQAGLARVKKEFTWDKIAQETVDIYKSLI\n>UniRef90_A0A0K6GGW7 DPBB_1 domain-containing protein n=1 Tax=Rhizoctonia solani TaxID=456999 RepID=A0A0K6GGW7_9AGAM\nMRSTQILAVLAVLATSVSSMSIGHVPNQLTHRRHAAEVHESVIQARGARRAVFAQNTPEMAKRDDAPRRRKRGINQRRCAPKTTTGLPQTASVPSTSSAAPTSSAAPTSSVVPTSSAHTTSAASATTPEPEPTSSQAETTTSAKAKYTKPSAQTPTKTSTSVKPTATDDDSGSSSGSTYTGQATYYGTGLGACGITSSDTDYIAAASQLLFDGFDGYKGSDPNSNPICGKKVKANYQGKSVTITIVDRCVACAKYDLDFSPSAFSQLADQALGRLSGMTWSFIS\n>UniRef90_A0A1Y1CLL0 PAS domain S-box protein n=1 Tax=Labilibaculum antarcticum TaxID=1717717 
RepID=A0A1Y1CLL0_9BACT\nMVEQKVLRSRILELLFKGESESAILNELVHQAQLIASDSICSILCVDEKGKRLLLGAAPDLPDFYNKVIHGTPIRHGVGSCGTAAFTGERVIVEDISTHPFWKNVKNLAKEADLGSCWSEPIKDPSGKVLGTFAIYHRTPNSPNPKDLELISELSDLTAIVLDRYKIIKRLEESENKYKVLANAGNEAIFILEGDKIVEVNKRAEIITGYSEMELSGMSIYNFLAKEYWITPYSDESRKFRHKIKAVGVNKNGLNVSVIVRIKNSTFKGKVVCLLSVRDVTNYINAKIELSKLSQSIIQSPVSVVITNVDGDIEYVNPKFNKLTGYSLEEVIGENPRLLSSGNNKAELYKSMWQEIKSGNVWRGEFQNKKKSGELFWEFATISPLKDDREQIINFIAVKEDITDRKRQEQIQRIILNISNAVFTQMTLVEFIQFIREELSSIMDTTNFFVALYDDETELFSLPFHDDEHDSFEKFPKGKTISGWVVDHETALLATAEKLDELEAKGEIDLVGEPSKIWLGMPLKGKEKVIGVLVIQSYIDENVVTEEDKNMLELVSQQISISIEQKRTEQELHKALRDATESDRLKSVFLATMSHELRTPLNAVIGFSELINNEIDLETAVEYSKMVNQSGQNLLNIVEDLFDISLIQSGAVKIKQENYSLLNLFYEISAVINVEQKVLNKEHIELKINFPSDYNDFFIKTDPHRFKQVYLNLLKNALKFTDRGSIEYGFTKSDLKSGIVLQFYVKDTGIGIPEEVQESIFGLFRQANEKLSRKYNGVGIGLSISKSLTELLGGKIWFDSIPEEGSTFYFTHPIK\n>UniRef90_A0A2N8BAE4 Mandelate racemase n=1 Tax=Pseudomonas sp. FW305-25 TaxID=2070636 RepID=A0A2N8BAE4_9PSED\nMKIISIKVFQFDVPLKEKYSLSGGRLQYASLDTTIVLVTTDSGLVGVGESCPWGATYLPAYAKGVRAGIDELAPHLLGENPLHLDQLNERMDVMLPGHPYVKAAIDLACWDILGKHCQLPVYTLLGGRFQDSVALQSSIPTDDAAQMMAHLERARNQGYRTHSCKVGTGIDDDVAQIKYLLDQRVPGEVITFDVNRAWTVAEAVAVMNSVADPTVCFEQPCESMDQCRAVRELTRNPIILDESIVTFADLVQAQRQNIAQLIGLKIGRVGGLTKARQMRDFCIHHGIRMNIEDVGGTQVSDSAVMHLAASTPRRFHRASWNCCRHHEVQLAEGSFDIRQGRAYLHDSPGLGLTLDPRQFECPIAQYS\n>UniRef90_A0A8G2BJ52 Transmembrane transcriptional regulator (Anti-sigma factor RsiW) n=2 Tax=Thalassobaculum TaxID=526215 RepID=A0A8G2BJ52_9PROT\nMSTRNGNGTNGSGSIEDWEVGAYVDDELSPQRRREIAAAAGASPELAARIEVYTRHKSLLAGLASRPVDDEIPEQMRAAATRLSRATTVHGWMRRGRQVMVAQARIAAVLVIGAVVGWTAQEILAPRPGNATDGPLAFIDEATEAHRTLALAPMFATDVGSVDFAKLSEMFSEGIDPAGLRANGLILSKVDMASTDQGPAVQFLFFDREARPVSLLLSVNSASLHSVGVPDGEMVVTSYNDFAVAFGRRDSIAFVVTAALPERRVGEIARQLVASAGF\n>UniRef90_UPI001B3A3E04 LPS assembly protein LptD n=1 Tax=Pseudoalteromonas sp. 
MMG010 TaxID=2822685 RepID=UPI001B3A3E04\nMNKSWGILMLSVVSTSSLADTELTHKLCGVSMLTRTWQPMQGLELGTVDIKADEVEFLGTQSAEFNGNVDINTLDMSLSAQSALLDKERSLLNATGPITYQNSVSTVHSTGLNADLNNSEISLLGANYNLTEQLGKGGAEKLTVNNSGLLLMNASFTACPGEIPVWAIEADEINLSREEGWGETYNAVLRILDTPVLYLPYFTFPLDERRKSGLLTPSFSSSDSYGLETITPYYWNIAPNYDATITPRYMSRIGLQLQTEFRYLTDTSKGLVGIEYLNEDDSEPELDSRYMFHWQQKSYFGENWRASVDITNVSDDNYLTDLTSNYANTTDTQLYRTGALTHLGDTWRTDIKIQSFEVLGDHDESYTALPQINFTQTAPWRINHFDFSISGELSHFINGSTEVEVDEATRLHIEPKVRFGYEQYAWSFLSEVSLLQTNYKQHGDLDGTQYSSSVSRTLPKVRLYSQLNFERDTSFFFEDGIQTLEPQMQYLYTPNKDQTDIALFDTVNLQEDFFGLFRDTRFSGVDRIAGANQLTIGATTRLFSSKSEEVFNFSAGQIFYLSDSAKPTEQGITEETNYNALFAAQTMVHWHRRWYLSGGIQYDTDGKQMIQSNVTLDYKGDNNQLVQLNHRYANDVSGNTIEQVGMFTSVPISDEWQFIASYHKDIENKRSIEVLTGLQYESCCWAVQITGQRQIKTDLNQAIDQDQATFDSSIRLNFVLKGLGSKSSYDAQKLLQQSIFGYRRPYFLNN\n>UniRef90_UPI0016098D3D hypothetical protein n=3 Tax=Rhizobium TaxID=379 RepID=UPI0016098D3D\nMQNALLDYADLISLLTAVGTFVAIVAGVVELIKARREHVRAKEQEFNSSYLTISDAYHQLLELSVEYPHLGIFPWQEEPADLSPDDLVRRDIFYEMMISIFERAYLERHKTPEIAEHFWPGWETFLRRQIEKPSFRKYWGIFDGEGAFGAYDKRFEAFAKRLDGGLPGQDGV\n>UniRef90_A0A3N5IFY8 Peroxiredoxin (Fragment) n=1 Tax=Planctomycetaceae bacterium TaxID=2026779 RepID=A0A3N5IFY8_9PLAN\nMSDWLEPGTPMPSFTLADHTGAKVKSSQWKGKPLAIYFYPKDDTPGCTKEACAFRDASQPLEK\n>UniRef90_A0A2Y9K040 AP-3 complex subunit sigma-2 isoform X3 n=13 Tax=Boreoeutheria TaxID=1437010 RepID=A0A2Y9K040_ENHLU\nMIQAILVFNNHGKPRLVRFYQRFPEEIQQQIVRETFHLVLKRDDNICNFLEGGSLIGGSDYKLIYRHYATLYFVFCVDSSESELGILDLIQVFVETLDKCFENVCELDLIFHMDKGGLSAAPARAVSAVKNINLPEIPRNINIGDLNIKVPNLSQFV\n>UniRef90_A0A379GMX6 Inner membrane ABC transporter permease protein ydcV n=7 Tax=Morganellaceae TaxID=1903414 RepID=A0A379GMX6_PROST\nMNTIKTNNGQKVVKISLIFFIFINVVWLGLPFTMAILWSLVDPQHPWSYPDLFPQKLSLARWKIVWEQTSLATALFNSYTIAPAVAILSLLLATPTAYAFGRMTFKGKAVAEMLTLIPLVMPGMIIGIFFSSMLISLNISNTFMSIVIGHTVLTLPYSIRIMSAGFKSIPQDIIDASRDMGASFWGTFCNAFLPMLKPSLLASLIFCLVRSLEEFSISFVLGSPDFITVPTILYSFLGYSFVRPDAAVVSMILVIPNVILMIIIERLLKGNYLSQSTGKA\n>UniRef90_A0A382A9E5 Swi3 domain-containing protein 
(Fragment) n=1 Tax=marine metagenome TaxID=408172 RepID=A0A382A9E5_9ZZZZ\nLRPTPGRKDKEHDDGGLNENNDDEEDLEESLKISIKMPKASLFESAGFNVKQQKKVASIFESAIKSTTRQVGKQIHEHYSKVHKKRLAEHQQLIENRLNTYLDVVVEEWVETNRPAVRSSLRTELSENFLNGLQKLFTEHYIDVPESKTDVVKSLTQHVETLKRQVNEQYTEKLKLHRLAETANKKRIVATFARDMSESQAGKLEKLAEDTQYVNANDFREKLSMLKESYFEKQPSRATRLPEENVQEVTETGVAKGEADMVADAITRQAKSSDW\n>UniRef90_F8A565 histidine kinase n=2 Tax=Cellulomonas gilvus TaxID=11 RepID=F8A565_CELGA\nMSPAPGTRWGLAARLLAALVVVLAVAAFTAWLVASAVGPGLFHEHMVRAGLQDHDSAVLHAERAFRDASAVSLALALGAAAITSAAVSVVLAGRIGRSLATVSKAAARLGAGEYESRVPAAGLGAEFDDLADSFNTMAARLRDADRLRARLLADVAHEVRTPVATIAGYLEAVQDGAQPMDEATMTVLADQAARLTRLAQDLAAVTRAEAGDLVLNVEPVPTRDLLEQTAAAWRDRAAAAGVHLALDPDAGSGAGPVAVDRHRIAQVMDNLVANALRHTAAGGTITLRARAVDDPSRVALAVRDTGKGIAPEHLPHVFERFYRADTARDRASGGSGIGLAICKALTEAHGGTITAASAGVGAGATFVVTLPAINSGP\n>UniRef90_A0A651I330 T9SS C-terminal target domain-containing protein n=1 Tax=Saprospirales bacterium TaxID=2026790 RepID=A0A651I330_9BACT\nMKSSFFLLPLLFFGTLNMCFSQVPFIEVLNPNEVSLDSTEAVRYDSIVGFGENYQKYLIRINPIQNYVSLDTITISIPLAEIGEIQFVTTAIEYRNDSSFSLTGYNLSGGFLNFTLLESEIGANMFIPESQSLYQFNSISESYAVMLRYPNWTGFESIGCITTGEDGDQEDYYPDEFSGPDSLNYAQERSICDHNRIRVLVLFTTQGRNESFLRGSNMNRDAQRLIDELNLSIANTGISRSRISFALADTRLLGSFVEDDEDEDIQGDVELLSNNQEAQEMRDEVLADIVVLITGNVYGNIFGVARDIRASESRAYAISTYEFTFNGNLTGTHEIGHLIGTRHQRCRRCPSACDPKWSKYKGYKVGSDMRTIMHVQGCGRTRVNVWSSSGAKFMGQSTGNTNNRNSGILKNRASKVACFREGVPPIPPPPPLSIYYIEGPLFLCPDNAFPQYEVHYNQNVFQNPIFNWDISENGLFNWTTIIGKIKNGNPVTLTQPNNLPDVFWLRATVSDPSGTTASTTIQVRKRDEPYSCNTFLRILREANEQDGTNSEYILYPNPTNNDIFVSGIVGKVWYKIFSSAGELIKIGTDNLSKDQELNISLTYFPAGLYFMELIMENNESHVMKLVKK\n>UniRef90_A0A4S8PU73 DUF4240 domain-containing protein n=1 Tax=Glycomyces buryatensis TaxID=2570927 RepID=A0A4S8PU73_9ACTN\nMDTTKALKKGRNLIPDEVFAKLVTRIEAEHHFDADMAARCVDQAAAYLAACASSTAPLSPSMAADIGWHMFILHTRDYADFCEQVAGRFIHHVPHDEPAEQSTEDVQAILDRSSAAIRKAGYQVDTELWRADGGAGKCNGCHSGCHDDPAPVPPFHEG\n>UniRef90_UPI0018E12798 fasciclin domain-containing protein n=1 Tax=Aquamicrobium zhengzhouense TaxID=2781738 
RepID=UPI0018E12798\nMRMTFALAAGLIAIAIPAHAQDKDIVDTAVAAGEFTTLAAALDAAGLVQTLKGEGPFTVFAPTDAAFAKLPAGTVEELLRPENKEKLAAILTYHLVPGKVMAADVVSLDEAKTVNGETIEIQVDGNSVRVNDASVTATDVAASNGVIHVIDQVILPPEG\n>UniRef90_UPI0010459B45 aminoglycoside 6-adenylyltransferase n=1 Tax=Streptococcus downii TaxID=1968889 RepID=UPI0010459B45\nMRTEPEMFDVILQIAKSLKVEAVAMSGSRTDTKAPKDEFQDYDVVYVVDDLDNLTSDLSWLDQFGTRIIEQHNVLGNRRLYLMLFEDGNRIDLTLCPTEYIQEWVDSEAGFTVLEDPKGLFAPYSPSPQRYWISLASQTDFEKACNEFWWVSAYVVKGICRKQVIYATDHLYGICQQELLKVVAWQVAADNGTVDVGKNYKYLFQYLPAEKEKEFSALLDFSSVEKLIQSLFATMQLFHQEAQFLANKMGFDYDKEVAEKMIQYAKERLN\n>UniRef90_UPI000E3E49EC hypothetical protein n=1 Tax=Paraliobacillus sp. X-1268 TaxID=2213193 RepID=UPI000E3E49EC\nMRNVRGAKELSKYLESIGAPISESTIFSLLREGKIPHQRPSPRILIFNLNAIDEWLNLK\n>UniRef90_A0A286TUH0 Signal transduction histidine kinase (Fragment) n=1 Tax=Candidatus Scalindua japonica TaxID=1284222 RepID=A0A286TUH0_9BACT\nCELGKEGAFIWVNQTAAEMFGYKSPEEMIGTKVNEIYVNIDDGRTQLEMLEKHGVLSNTVYLCKNKSGDCFYAECTSHLVKDKKGKQCRIEGIIRVITERKKSEYRLIAQHAVTKILSESETIKIAFQGILKVICEALDWDFGSLWLEHDNVLRCVYLWHVPGLQFSEFKKKTKEISFLPGIGLPGRVLSKGKAAWIKDVVVESNFPRATAASKVGLHGAFAFPIIANTEILGVIEFFSQKPEEPDKELLNMMEAIGSQVGQFIKRKQADEQVSKLSRAVEQSPVSVVITDTKNNIEYVNRKYTEVTGYSLEEVKGKNPIVLKTVEENVEEHKELWKTITSGKEWQGEFCNFNKNGEIYWESESISPIKNCDGIITGFIQLKEDITERKLVQSHLKTQLEVAKVLAESNTIREASTRIIEVVCIALGWDLGEVWIYDKQQYILRNTEIWHLPSLNFSEFKDITCRTTFSPQKGLPGLVWQTAKPLWIEDVARDSNFLRASVADKEGLHGAFGFPIAIDNVVLGTICFFSREIRRPDDKLLNMMSSIGNHIALFIERKQADEQISKLSRAVEQSPASVVITDTKGNIEYVNRKFTEVTGYSFEEVKGKNPRVLKSDERNSVDYKELWDTISSGKEWRGEFKNKNSDGKAYWEFASISPIKNNQGVTTGYIAIKEDITVHKNLEQQLMHAQKMESIGHLAAGIAHEINTPTQYIMDNTRFLQDSFNDINKLLEKYSHLLETCKSGSVESELIEEIEVAVRELDEDFLVDEIPNAITQSLEGLDRVKNIVYAMKNFSHPDNENKKPIDINKAINNTITVARNEWKYVAEVKTDFDSSLTSVPCFPGEFNQVILNLIVNAAHAIGEEPGNGNEGKGIIVISTLCDGEWAEIRVSDTGTGISGDIRKKIFDPFFTTKEVGKGTGQGLSLVHSTVVGRHNGTITLDTELGKGTTFIIRLPLCTSSSEIVKV\n>UniRef90_A0A2N9EE18 Myb_DNA-bind_3 domain-containing protein n=1 Tax=Fagus sylvatica TaxID=28930 
RepID=A0A2N9EE18_FAGSY\nMGTGIYAREDAKLWPARLEKLFIDIMVEEMHKGNMPMGIFKLKTWCKILEELNLRSKQSFKLKQVKAKYNRLKQKYRVFSQLLQQNGFVWHGETNSVTASDEVWESYLYANPDAERFREKGCEHYKLLGILFNKLIAMGFMAFASTQDAPDTDEERELDEAYRNGAFIDVDSDSQDDHEKKVSQKRTKRSGKCPMRSEAKGRKRSRKADEFSELNDAIRAFAEQTKLMLEAKVARMKEKEKRKQQRDEFSIPNCVNALESLGDLDMNTYTLAIKKFSTAEWREAFMSLSSNARKKAWLDCLK\n>UniRef90_L7LLZ8 Phosphoribosylformylglycinamidine synthase subunit PurS n=9 Tax=Gordoniaceae TaxID=85026 RepID=L7LLZ8_9ACTN\nMARVVVDVMPKAEILDPQGQAIVGALGRLGFAGVADVRQGKRFELEVDGTVDDAALERIAEELLTNTVIENFNVTRVAE\n>UniRef90_Q1IWN5 Nitrogen regulatory protein P-II n=7 Tax=Deinococcus TaxID=1298 RepID=Q1IWN5_DEIGD\nMKLITAVVRPERVQQVKAALFEAGISGLTLSRVSGHGGEQEIVEHYRGTRVMVEFRDKVEFRMAVSEPFVEVAIRAICESARTGEVGDGKIFVQPLERVVRIRTGEEDNAALTPVTETRLTPGLPVRHAR\n>UniRef90_A0A534D3W2 Lipoprotein (Fragment) n=1 Tax=Gammaproteobacteria bacterium TaxID=1913989 RepID=A0A534D3W2_9GAMM\nMFREKRFVSLVLGVSLLAPGCGESTESVSPLQTLPASRGQLLNNPPTKLGSFSVSDLLSRLSGSQMGRELIKLAFSPTCSVDT\n>UniRef90_A0A2G2QLC1 C4-dicarboxylate ABC transporter n=1 Tax=Cycloclasticus sp. 
TaxID=2024830 RepID=A0A2G2QLC1_9GAMM\nMVSENKLPLAVVFLFLMLGVIWWPSFSNLGDLFGYAAKAEYKGVSLLNFFRAELVVLVTVWAVLISYKEQNDMVDGNAYVTRFLILVMFVIGQVFMGFFAGGFLVHQDASWYQVIHEANEVMPSQAVILLVCYPLYLFFGGSAFIYAKTRLPKFLKGKEFSFMVLTFAPLAFLPYYDSSFMQAKKDLFEIAYLSVYWLLSVGWVVIGVLYIILKASQGIFKGLSDPYGEM\n>UniRef90_A0A562TCA1 Toprim domain-containing protein n=1 Tax=Chitinophaga japonensis TaxID=104662 RepID=A0A562TCA1_CHIJA\nMKKLMCAEAKQIDLVDYLASLGHRPQKVRNQDYWYLSPLREEKTPSFKVNRQLNVWYDHGTGKGGDLIDFGTLYFGCSVSDLLDRLSHHQPAPSLSLHPPTHASRQHSGPASFAGERKDASGSRIVILDARPLAEPSLLEYLQKRCIPLEIATRFCKEVDFLLYGEKRTVIGFRNNAGGYELRSGNFKGSSSPKDVTFIDNHAGEITVFEGFFSFLSFQTINNNQQDTVSNCLILNSLSFFEKSRPLMEQHGKVHLVLDRDAAGIHHTQKTLQWDRDKYQDRSDFYHGHKDLNEWLVHHHHSQKEPQRLRRRP\n>UniRef90_UPI0017892BBC TlpA family protein disulfide reductase n=1 Tax=Plantactinospora soyae TaxID=1544732 RepID=UPI0017892BBC\nMRRPRRARLGALLAVAAALALALVGCSGEDDWKDDCTTKGGVIECAPEHRPQAPKVTGELLSGGNYDLAQDRGQVAVINFWGSWCAPCRAEADDLEATYQATRERGVRFIGINIQDGRDKARAFEEAFKVTYPSLFDPPSRLALAFDIPPNSIPATVVLDREGRIAVVIRTAVTRETLEPILTRVAAEQAAPGGGPN\n>UniRef90_A0A3M8TKU5 Tail assembly chaperone n=2 Tax=Pseudomonas putida group TaxID=136845 RepID=A0A3M8TKU5_PSEPU\nMKQPERITLVLRASEAAPLSSILPFTKLGDLVSAGRGLAVIAGFSEGDLQARLAECEAQLQEADVLLREAIAYVNDELVNVEYRDILIARIDRLLDRDQAQQAEKPREQEP\n>UniRef90_A0A357MHW4 SseB domain-containing protein (Fragment) n=1 Tax=Rhodobacteraceae bacterium TaxID=1904441 RepID=A0A357MHW4_9RHOB\nMTEAPKTPETPETALDAAHAAMQAAPADDAARLRFFERVADSELFLLLKREASGDQVDPESFELADGTFVLAFDREERLAAFTGRASPYLALSGRVLARMLAGQGIGLGLNLEVA\n>UniRef90_UPI0004CC520E alpha-L-rhamnosidase N-terminal domain-containing protein n=1 Tax=Streptomyces cellulosae TaxID=1968 RepID=UPI0004CC520E\nMTYTDGSATSLVTDKDWLTADGPTTFDQVYSGEKDDARRADELEEWRSAGHRAARAGQLLRTVPRVPRHACRGDYPRRPSAAHSGLVQDRVDDLSHLVPALMTADRAVLSLPGRDDRPDQLPRLQVALAPAPRTARTVAAADHAG\n"
  },
  {
    "path": "src/alphafold3/test_data/model_config.json",
    "content": "{\n  \"evoformer\": {\n    \"max_relative_chain\": 2,\n    \"max_relative_idx\": 32,\n    \"msa_channel\": 64,\n    \"msa_stack\": {\n      \"msa_attention\": {\n        \"num_head\": 8\n      },\n      \"msa_transition\": {\n        \"num_intermediate_factor\": 4,\n        \"use_glu_kernel\": true\n      },\n      \"num_layer\": 4,\n      \"outer_product_mean\": {\n        \"chunk_size\": 128,\n        \"num_outer_channel\": 32\n      },\n      \"pair_attention\": {\n        \"num_head\": 4\n      },\n      \"pair_transition\": {\n        \"num_intermediate_factor\": 4,\n        \"use_glu_kernel\": true\n      },\n      \"shard_transition_blocks\": true,\n      \"triangle_multiplication_incoming\": {\n        \"equation\": \"kjc,kic->ijc\",\n        \"use_glu_kernel\": true\n      },\n      \"triangle_multiplication_outgoing\": {\n        \"equation\": \"ikc,jkc->ijc\",\n        \"use_glu_kernel\": true\n      }\n    },\n    \"num_msa\": 1024,\n    \"pair_channel\": 128,\n    \"pairformer\": {\n      \"block_remat\": false,\n      \"num_layer\": 48,\n      \"pair_attention\": {\n        \"num_head\": 4\n      },\n      \"pair_transition\": {\n        \"num_intermediate_factor\": 4,\n        \"use_glu_kernel\": true\n      },\n      \"remat_block_size\": 8,\n      \"shard_transition_blocks\": true,\n      \"single_attention\": {\n        \"key_dim\": null,\n        \"num_head\": 16,\n        \"value_dim\": null\n      },\n      \"single_transition\": {\n        \"num_intermediate_factor\": 4,\n        \"use_glu_kernel\": true\n      },\n      \"triangle_multiplication_incoming\": {\n        \"equation\": \"kjc,kic->ijc\",\n        \"use_glu_kernel\": true\n      },\n      \"triangle_multiplication_outgoing\": {\n        \"equation\": \"ikc,jkc->ijc\",\n        \"use_glu_kernel\": true\n      }\n    },\n    \"per_atom_conditioning\": {\n      \"atom_transformer\": {\n        \"attention\": {\n          \"key_dim\": 128,\n          \"num_head\": 4,\n  
        \"value_dim\": 128\n        },\n        \"num_blocks\": 3,\n        \"num_intermediate_factor\": 2\n      },\n      \"per_atom_channels\": 128,\n      \"per_atom_pair_channels\": 16,\n      \"per_token_channels\": 384\n    },\n    \"seq_channel\": 384,\n    \"template\": {\n      \"dgram_features\": {\n        \"max_bin\": 50.75,\n        \"min_bin\": 3.25,\n        \"num_bins\": 39\n      },\n      \"num_channels\": 64,\n      \"template_stack\": {\n        \"num_layer\": 2,\n        \"pair_attention\": {\n          \"num_head\": 4\n        },\n        \"pair_transition\": {\n          \"num_intermediate_factor\": 2,\n          \"use_glu_kernel\": true\n        },\n        \"shard_transition_blocks\": true,\n        \"single_attention\": null,\n        \"single_transition\": null,\n        \"triangle_multiplication_incoming\": {\n          \"equation\": \"kjc,kic->ijc\",\n          \"use_glu_kernel\": true\n        },\n        \"triangle_multiplication_outgoing\": {\n          \"equation\": \"ikc,jkc->ijc\",\n          \"use_glu_kernel\": true\n        }\n      }\n    }\n  },\n  \"global_config\": {\n    \"bfloat16\": \"all\",\n    \"final_init\": \"zeros\",\n    \"flash_attention_implementation\": \"triton\",\n    \"pair_attention_chunk_size\": [\n      [\n        1536,\n        128\n      ],\n      [\n        null,\n        32\n      ]\n    ],\n    \"pair_transition_shard_spec\": [\n      [\n        2048,\n        null\n      ],\n      [\n        null,\n        1024\n      ]\n    ]\n  },\n  \"heads\": {\n    \"confidence\": {\n      \"dgram_features\": {\n        \"max_bin\": 50.75,\n        \"min_bin\": 3.25,\n        \"num_bins\": 39\n      },\n      \"max_error_bin\": 31.0,\n      \"no_embedding_prob\": 0.2,\n      \"num_bins\": 64,\n      \"num_plddt_bins\": 50,\n      \"pae\": {\n        \"max_error_bin\": 31.0,\n        \"num_bins\": 64\n      },\n      \"pairformer\": {\n        \"num_layer\": 4,\n        \"pair_attention\": {\n          
\"num_head\": 4\n        },\n        \"pair_transition\": {\n          \"num_intermediate_factor\": 4,\n          \"use_glu_kernel\": true\n        },\n        \"shard_transition_blocks\": true,\n        \"single_attention\": {\n          \"key_dim\": null,\n          \"num_head\": 16,\n          \"value_dim\": null\n        },\n        \"single_transition\": {\n          \"num_intermediate_factor\": 4,\n          \"use_glu_kernel\": true\n        },\n        \"triangle_multiplication_incoming\": {\n          \"equation\": \"kjc,kic->ijc\",\n          \"use_glu_kernel\": true\n        },\n        \"triangle_multiplication_outgoing\": {\n          \"equation\": \"ikc,jkc->ijc\",\n          \"use_glu_kernel\": true\n        }\n      }\n    },\n    \"diffusion\": {\n      \"atom_transformer\": {\n        \"attention\": {\n          \"key_dim\": 128,\n          \"num_head\": 4,\n          \"value_dim\": 128\n        },\n        \"num_blocks\": 3,\n        \"num_intermediate_factor\": 2\n      },\n      \"conditioning\": {\n        \"pair_channel\": 128,\n        \"prob\": 0.8,\n        \"seq_channel\": 384\n      },\n      \"eval\": {\n        \"gamma_0\": 0.8,\n        \"gamma_min\": 1.0,\n        \"noise_scale\": 1.003,\n        \"num_samples\": 5,\n        \"step_scale\": 1.5,\n        \"steps\": 200\n      },\n      \"eval_batch_dim_shard_size\": 5,\n      \"eval_batch_size\": 5,\n      \"per_atom_channels\": 128,\n      \"per_atom_pair_channels\": 16,\n      \"per_token_channels\": 768,\n      \"transformer\": {\n        \"attention\": {\n          \"key_dim\": null,\n          \"num_head\": 16,\n          \"value_dim\": null\n        },\n        \"block_remat\": false,\n        \"num_blocks\": 24,\n        \"num_intermediate_factor\": 2,\n        \"super_block_size\": 4\n      }\n    },\n    \"distogram\": {\n      \"first_break\": 2.3125,\n      \"last_break\": 21.6875,\n      \"num_bins\": 64\n    }\n  },\n  \"num_recycles\": 10,\n  \"return_distogram\": 
false,\n  \"return_embeddings\": false\n}"
  },
  {
    "path": "src/alphafold3/version.py",
    "content": "# Copyright 2024 DeepMind Technologies Limited\n#\n# AlphaFold 3 source code is licensed under CC BY-NC-SA 4.0. To view a copy of\n# this license, visit https://creativecommons.org/licenses/by-nc-sa/4.0/\n#\n# To request access to the AlphaFold 3 model parameters, follow the process set\n# out at https://github.com/google-deepmind/alphafold3. You may only use these\n# if received directly from Google. Use is subject to terms of use available at\n# https://github.com/google-deepmind/alphafold3/blob/main/WEIGHTS_TERMS_OF_USE.md\n\n\"\"\"Single source of truth for the AlphaFold version.\"\"\"\n\n__version__ = '3.0.1'\n"
  }
]